{"train_loss": 1.4553358554840088, "global_step": 0, "epoch": 0} {"train_loss": 1.4284049272537231, "global_step": 1, "epoch": 0} {"train_loss": 1.450287103652954, "global_step": 2, "epoch": 0} {"train_loss": 1.4287457466125488, "global_step": 3, "epoch": 0} {"train_loss": 1.4652185440063477, "global_step": 4, "epoch": 0} {"train_loss": 1.4266324043273926, "global_step": 5, "epoch": 0} {"train_loss": 1.4101310968399048, "global_step": 6, "epoch": 0} {"train_loss": 1.4400880336761475, "global_step": 7, "epoch": 0} {"train_loss": 1.450518250465393, "global_step": 8, "epoch": 0} {"train_loss": 1.4252634048461914, "global_step": 9, "epoch": 0} {"train_loss": 1.439825177192688, "global_step": 10, "epoch": 0} {"train_loss": 1.4373276233673096, "global_step": 11, "epoch": 0} {"train_loss": 1.4353092908859253, "global_step": 12, "epoch": 0} {"train_loss": 1.455334186553955, "global_step": 13, "epoch": 0} {"train_loss": 1.4134043455123901, "global_step": 14, "epoch": 0} {"train_loss": 1.3859390020370483, "global_step": 15, "epoch": 0} {"train_loss": 1.4314393997192383, "global_step": 16, "epoch": 0} {"train_loss": 1.3701198101043701, "global_step": 17, "epoch": 0} {"train_loss": 1.3708679676055908, "global_step": 18, "epoch": 0} {"train_loss": 1.383209466934204, "global_step": 19, "epoch": 0} {"train_loss": 1.3864147663116455, "global_step": 20, "epoch": 0} {"train_loss": 1.396727442741394, "global_step": 21, "epoch": 0} {"train_loss": 1.3258874416351318, "global_step": 22, "epoch": 0} {"train_loss": 1.331321120262146, "global_step": 23, "epoch": 0} {"train_loss": 1.347754955291748, "global_step": 24, "epoch": 0} {"train_loss": 1.3577944040298462, "global_step": 25, "epoch": 0} {"train_loss": 1.3127765655517578, "global_step": 26, "epoch": 0} {"train_loss": 1.3302305936813354, "global_step": 27, "epoch": 0} {"train_loss": 1.2999956607818604, "global_step": 28, "epoch": 0} {"train_loss": 1.3009612560272217, "global_step": 29, "epoch": 0} {"train_loss": 1.2681808471679688, "global_step": 30, "epoch": 0} {"train_loss": 1.2855250835418701, "global_step": 31, "epoch": 0} {"train_loss": 1.2514896392822266, "global_step": 32, "epoch": 0} {"train_loss": 1.2698523998260498, "global_step": 33, "epoch": 0} {"train_loss": 1.2405507564544678, "global_step": 34, "epoch": 0} {"train_loss": 1.205207347869873, "global_step": 35, "epoch": 0} {"train_loss": 1.1877565383911133, "global_step": 36, "epoch": 0} {"train_loss": 1.1430823802947998, "global_step": 37, "epoch": 0} {"train_loss": 1.1398346424102783, "global_step": 38, "epoch": 0} {"train_loss": 1.1094850301742554, "global_step": 39, "epoch": 0} {"train_loss": 1.095122218132019, "global_step": 40, "epoch": 0} {"train_loss": 1.337122965426672, "global_step": 41, "epoch": 0, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.00034764066590660674, "train/sim_max_reward_3": 0.11757319368999389, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.6257370909204435, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.014021135271422376, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.5967638406997704, "test/sim_max_reward_4400009": 0.020704568089157497, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.05569209882391426, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3857105753198741, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.19002713605017188, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0010513858461071415, "test/sim_max_reward_4400028": 0.29482665684494397, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.00011585420771179685, "test/sim_max_reward_4400031": 1.2890978942579066e-05, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.000580526080550122, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.38815072915163495, "test/sim_max_reward_4400037": 0.0, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.022485346008863004, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.0, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.0, "test/sim_max_reward_4400047": 0.0005351012849106201, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.15735570177915412, "test/mean_score": 0.07721404441118089, "val_loss": 11441586.0} {"train_loss": 1.090126872062683, "global_step": 42, "epoch": 1} {"train_loss": 1.024315357208252, "global_step": 43, "epoch": 1} {"train_loss": 1.026357650756836, "global_step": 44, "epoch": 1} {"train_loss": 1.0076258182525635, "global_step": 45, "epoch": 1} {"train_loss": 1.0029003620147705, "global_step": 46, "epoch": 1} {"train_loss": 1.0109071731567383, "global_step": 47, "epoch": 1} {"train_loss": 0.9280210733413696, "global_step": 48, "epoch": 1} {"train_loss": 0.8922097682952881, "global_step": 49, "epoch": 1} {"train_loss": 0.8946560025215149, "global_step": 50, "epoch": 1} {"train_loss": 0.9061793088912964, "global_step": 51, "epoch": 1} {"train_loss": 0.8959782719612122, "global_step": 52, "epoch": 1} {"train_loss": 0.8681607842445374, "global_step": 53, "epoch": 1} {"train_loss": 0.8102174997329712, "global_step": 54, "epoch": 1} {"train_loss": 0.7962092161178589, "global_step": 55, "epoch": 1} {"train_loss": 0.7935338020324707, "global_step": 56, "epoch": 1} {"train_loss": 0.7893689870834351, "global_step": 57, "epoch": 1} {"train_loss": 0.7514796853065491, "global_step": 58, "epoch": 1} {"train_loss": 0.6730944514274597, "global_step": 59, "epoch": 1} {"train_loss": 0.7242342233657837, "global_step": 60, "epoch": 1} {"train_loss": 0.6489130258560181, "global_step": 61, "epoch": 1} {"train_loss": 0.6485254764556885, "global_step": 62, "epoch": 1} {"train_loss": 0.6135025024414062, "global_step": 63, "epoch": 1} {"train_loss": 0.6078102588653564, "global_step": 64, "epoch": 1} {"train_loss": 0.5739595890045166, "global_step": 65, "epoch": 1} {"train_loss": 0.5471118688583374, "global_step": 66, "epoch": 1} {"train_loss": 0.5159038305282593, "global_step": 67, "epoch": 1} {"train_loss": 0.46464383602142334, "global_step": 68, "epoch": 1} {"train_loss": 0.4965456426143646, "global_step": 69, "epoch": 1} {"train_loss": 0.45079565048217773, "global_step": 70, "epoch": 1} {"train_loss": 0.37334710359573364, "global_step": 71, "epoch": 1} {"train_loss": 0.38355255126953125, "global_step": 72, "epoch": 1} {"train_loss": 0.37763404846191406, "global_step": 73, "epoch": 1} {"train_loss": 0.32305455207824707, "global_step": 74, "epoch": 1} {"train_loss": 0.2959320545196533, "global_step": 75, "epoch": 1} {"train_loss": 0.3187207579612732, "global_step": 76, "epoch": 1} {"train_loss": 0.3859589695930481, "global_step": 77, "epoch": 1} {"train_loss": 0.24861101806163788, "global_step": 78, "epoch": 1} {"train_loss": 0.3486785292625427, "global_step": 79, "epoch": 1} {"train_loss": 0.3420024514198303, "global_step": 80, "epoch": 1} {"train_loss": 0.32357674837112427, "global_step": 81, "epoch": 1} {"train_loss": 0.2633894085884094, "global_step": 82, "epoch": 1} {"train_loss": 0.6348453866583961, "global_step": 83, "epoch": 1, "val_loss": 6081241.0} {"train_loss": 0.2711314558982849, "global_step": 84, "epoch": 2} {"train_loss": 0.27207958698272705, "global_step": 85, "epoch": 2} {"train_loss": 0.20876666903495789, "global_step": 86, "epoch": 2} {"train_loss": 0.29237908124923706, "global_step": 87, "epoch": 2} {"train_loss": 0.18829426169395447, "global_step": 88, "epoch": 2} {"train_loss": 0.18749096989631653, "global_step": 89, "epoch": 2} {"train_loss": 0.18803565204143524, "global_step": 90, "epoch": 2} {"train_loss": 0.15808218717575073, "global_step": 91, "epoch": 2} {"train_loss": 0.17494526505470276, "global_step": 92, "epoch": 2} {"train_loss": 0.21131116151809692, "global_step": 93, "epoch": 2} {"train_loss": 0.17841067910194397, "global_step": 94, "epoch": 2} {"train_loss": 0.15789107978343964, "global_step": 95, "epoch": 2} {"train_loss": 0.07623434066772461, "global_step": 96, "epoch": 2} {"train_loss": 0.1654820442199707, "global_step": 97, "epoch": 2} {"train_loss": 0.13181573152542114, "global_step": 98, "epoch": 2} {"train_loss": 0.12672874331474304, "global_step": 99, "epoch": 2} {"train_loss": 0.0988544151186943, "global_step": 100, "epoch": 2} {"train_loss": 0.08458246290683746, "global_step": 101, "epoch": 2} {"train_loss": 0.07156303524971008, "global_step": 102, "epoch": 2} {"train_loss": 0.0621456503868103, "global_step": 103, "epoch": 2} {"train_loss": 0.09955679625272751, "global_step": 104, "epoch": 2} {"train_loss": 0.06457291543483734, "global_step": 105, "epoch": 2} {"train_loss": 0.12609128654003143, "global_step": 106, "epoch": 2} {"train_loss": 0.031147507950663567, "global_step": 107, "epoch": 2} {"train_loss": 0.09962660074234009, "global_step": 108, "epoch": 2} {"train_loss": 0.06553985923528671, "global_step": 109, "epoch": 2} {"train_loss": 0.04464017599821091, "global_step": 110, "epoch": 2} {"train_loss": -0.028241800144314766, "global_step": 111, "epoch": 2} {"train_loss": -0.024760521948337555, "global_step": 112, "epoch": 2} {"train_loss": -0.013629637658596039, "global_step": 113, "epoch": 2} {"train_loss": -0.04169416055083275, "global_step": 114, "epoch": 2} {"train_loss": 0.011142335832118988, "global_step": 115, "epoch": 2} {"train_loss": 0.01843070238828659, "global_step": 116, "epoch": 2} {"train_loss": -0.07788535207509995, "global_step": 117, "epoch": 2} {"train_loss": -0.05293232202529907, "global_step": 118, "epoch": 2} {"train_loss": -0.08217989653348923, "global_step": 119, "epoch": 2} {"train_loss": -0.10560576617717743, "global_step": 120, "epoch": 2} {"train_loss": -0.017764586955308914, "global_step": 121, "epoch": 2} {"train_loss": -0.20153269171714783, "global_step": 122, "epoch": 2} {"train_loss": -0.07091106474399567, "global_step": 123, "epoch": 2} {"train_loss": -0.17417174577713013, "global_step": 124, "epoch": 2} {"train_loss": 0.06990014194023042, "global_step": 125, "epoch": 2, "val_loss": 4919778.5} {"train_loss": -0.1438038945198059, "global_step": 126, "epoch": 3} {"train_loss": -0.07592632621526718, "global_step": 127, "epoch": 3} {"train_loss": -0.09682749211788177, "global_step": 128, "epoch": 3} {"train_loss": -0.15490156412124634, "global_step": 129, "epoch": 3} {"train_loss": -0.1605113297700882, "global_step": 130, "epoch": 3} {"train_loss": -0.07468193024396896, "global_step": 131, "epoch": 3} {"train_loss": -0.16005170345306396, "global_step": 132, "epoch": 3} {"train_loss": -0.10878217965364456, "global_step": 133, "epoch": 3} {"train_loss": -0.1972365528345108, "global_step": 134, "epoch": 3} {"train_loss": -0.16230972111225128, "global_step": 135, "epoch": 3} {"train_loss": -0.17351195216178894, "global_step": 136, "epoch": 3} {"train_loss": -0.2704504728317261, "global_step": 137, "epoch": 3} {"train_loss": -0.19390614330768585, "global_step": 138, "epoch": 3} {"train_loss": -0.2900758385658264, "global_step": 139, "epoch": 3} {"train_loss": -0.2334844321012497, "global_step": 140, "epoch": 3} {"train_loss": -0.18255198001861572, "global_step": 141, "epoch": 3} {"train_loss": -0.22187471389770508, "global_step": 142, "epoch": 3} {"train_loss": -0.36156153678894043, "global_step": 143, "epoch": 3} {"train_loss": -0.24893727898597717, "global_step": 144, "epoch": 3} {"train_loss": -0.27530577778816223, "global_step": 145, "epoch": 3} {"train_loss": -0.28751498460769653, "global_step": 146, "epoch": 3} {"train_loss": -0.27370157837867737, "global_step": 147, "epoch": 3} {"train_loss": -0.3694072961807251, "global_step": 148, "epoch": 3} {"train_loss": -0.3188818693161011, "global_step": 149, "epoch": 3} {"train_loss": -0.21347539126873016, "global_step": 150, "epoch": 3} {"train_loss": -0.3772282600402832, "global_step": 151, "epoch": 3} {"train_loss": -0.36780059337615967, "global_step": 152, "epoch": 3} {"train_loss": -0.2723783254623413, "global_step": 153, "epoch": 3} {"train_loss": -0.2208855301141739, "global_step": 154, "epoch": 3} {"train_loss": -0.2727092504501343, "global_step": 155, "epoch": 3} {"train_loss": -0.44257670640945435, "global_step": 156, "epoch": 3} {"train_loss": -0.35938194394111633, "global_step": 157, "epoch": 3} {"train_loss": -0.32719284296035767, "global_step": 158, "epoch": 3} {"train_loss": -0.300002783536911, "global_step": 159, "epoch": 3} {"train_loss": -0.39153093099594116, "global_step": 160, "epoch": 3} {"train_loss": -0.3784732520580292, "global_step": 161, "epoch": 3} {"train_loss": -0.43235063552856445, "global_step": 162, "epoch": 3} {"train_loss": -0.4807592034339905, "global_step": 163, "epoch": 3} {"train_loss": -0.3150671720504761, "global_step": 164, "epoch": 3} {"train_loss": -0.35234084725379944, "global_step": 165, "epoch": 3} {"train_loss": -0.3541284501552582, "global_step": 166, "epoch": 3} {"train_loss": -0.26881673417630647, "global_step": 167, "epoch": 3, "val_loss": 4016529.5} {"train_loss": -0.35174840688705444, "global_step": 168, "epoch": 4} {"train_loss": -0.4256170988082886, "global_step": 169, "epoch": 4} {"train_loss": -0.3899725079536438, "global_step": 170, "epoch": 4} {"train_loss": -0.4200555086135864, "global_step": 171, "epoch": 4} {"train_loss": -0.608771562576294, "global_step": 172, "epoch": 4} {"train_loss": -0.46803778409957886, "global_step": 173, "epoch": 4} {"train_loss": -0.38313430547714233, "global_step": 174, "epoch": 4} {"train_loss": -0.39055731892585754, "global_step": 175, "epoch": 4} {"train_loss": -0.4117504060268402, "global_step": 176, "epoch": 4} {"train_loss": -0.3936222791671753, "global_step": 177, "epoch": 4} {"train_loss": -0.38727614283561707, "global_step": 178, "epoch": 4} {"train_loss": -0.3888799548149109, "global_step": 179, "epoch": 4} {"train_loss": -0.49620312452316284, "global_step": 180, "epoch": 4} {"train_loss": -0.48916804790496826, "global_step": 181, "epoch": 4} {"train_loss": -0.46027278900146484, "global_step": 182, "epoch": 4} {"train_loss": -0.43069860339164734, "global_step": 183, "epoch": 4} {"train_loss": -0.45517387986183167, "global_step": 184, "epoch": 4} {"train_loss": -0.5846148729324341, "global_step": 185, "epoch": 4} {"train_loss": -0.5287935733795166, "global_step": 186, "epoch": 4} {"train_loss": -0.48399341106414795, "global_step": 187, "epoch": 4} {"train_loss": -0.5319443941116333, "global_step": 188, "epoch": 4} {"train_loss": -0.6430544257164001, "global_step": 189, "epoch": 4} {"train_loss": -0.5118618607521057, "global_step": 190, "epoch": 4} {"train_loss": -0.5569066405296326, "global_step": 191, "epoch": 4} {"train_loss": -0.5129459500312805, "global_step": 192, "epoch": 4} {"train_loss": -0.5176061391830444, "global_step": 193, "epoch": 4} {"train_loss": -0.5022526979446411, "global_step": 194, "epoch": 4} {"train_loss": -0.5743697881698608, "global_step": 195, "epoch": 4} {"train_loss": -0.48646366596221924, "global_step": 196, "epoch": 4} {"train_loss": -0.6415316462516785, "global_step": 197, "epoch": 4} {"train_loss": -0.5953288078308105, "global_step": 198, "epoch": 4} {"train_loss": -0.5943329334259033, "global_step": 199, "epoch": 4} {"train_loss": -0.5981863737106323, "global_step": 200, "epoch": 4} {"train_loss": -0.6410253047943115, "global_step": 201, "epoch": 4} {"train_loss": -0.5986403226852417, "global_step": 202, "epoch": 4} {"train_loss": -0.6129131317138672, "global_step": 203, "epoch": 4} {"train_loss": -0.4250521957874298, "global_step": 204, "epoch": 4} {"train_loss": -0.6283206939697266, "global_step": 205, "epoch": 4} {"train_loss": -0.6817045211791992, "global_step": 206, "epoch": 4} {"train_loss": -0.5890135169029236, "global_step": 207, "epoch": 4} {"train_loss": -0.6785891056060791, "global_step": 208, "epoch": 4} {"train_loss": -0.5151146196183705, "global_step": 209, "epoch": 4, "val_loss": 3466598.0} {"train_loss": -0.6580734252929688, "global_step": 210, "epoch": 5} {"train_loss": -0.6284456849098206, "global_step": 211, "epoch": 5} {"train_loss": -0.5682816505432129, "global_step": 212, "epoch": 5} {"train_loss": -0.6122725605964661, "global_step": 213, "epoch": 5} {"train_loss": -0.631715714931488, "global_step": 214, "epoch": 5} {"train_loss": -0.6123191118240356, "global_step": 215, "epoch": 5} {"train_loss": -0.6860443949699402, "global_step": 216, "epoch": 5} {"train_loss": -0.6282761096954346, "global_step": 217, "epoch": 5} {"train_loss": -0.6189041137695312, "global_step": 218, "epoch": 5} {"train_loss": -0.6610952615737915, "global_step": 219, "epoch": 5} {"train_loss": -0.559447169303894, "global_step": 220, "epoch": 5} {"train_loss": -0.6656152009963989, "global_step": 221, "epoch": 5} {"train_loss": -0.7443739175796509, "global_step": 222, "epoch": 5} {"train_loss": -0.6528406143188477, "global_step": 223, "epoch": 5} {"train_loss": -0.6600395441055298, "global_step": 224, "epoch": 5} {"train_loss": -0.6657983660697937, "global_step": 225, "epoch": 5} {"train_loss": -0.7358099222183228, "global_step": 226, "epoch": 5} {"train_loss": -0.6766595840454102, "global_step": 227, "epoch": 5} {"train_loss": -0.6933856010437012, "global_step": 228, "epoch": 5} {"train_loss": -0.7435463666915894, "global_step": 229, "epoch": 5} {"train_loss": -0.7420130968093872, "global_step": 230, "epoch": 5} {"train_loss": -0.7304596900939941, "global_step": 231, "epoch": 5} {"train_loss": -0.6380326747894287, "global_step": 232, "epoch": 5} {"train_loss": -0.648201584815979, "global_step": 233, "epoch": 5} {"train_loss": -0.7192098498344421, "global_step": 234, "epoch": 5} {"train_loss": -0.5802749395370483, "global_step": 235, "epoch": 5} {"train_loss": -0.7080080509185791, "global_step": 236, "epoch": 5} {"train_loss": -0.7436631321907043, "global_step": 237, "epoch": 5} {"train_loss": -0.7367742657661438, "global_step": 238, "epoch": 5} {"train_loss": -0.7112104892730713, "global_step": 239, "epoch": 5} {"train_loss": -0.7758231163024902, "global_step": 240, "epoch": 5} {"train_loss": -0.7728086709976196, "global_step": 241, "epoch": 5} {"train_loss": -0.7970385551452637, "global_step": 242, "epoch": 5} {"train_loss": -0.7686655521392822, "global_step": 243, "epoch": 5} {"train_loss": -0.8247129917144775, "global_step": 244, "epoch": 5} {"train_loss": -0.8231751918792725, "global_step": 245, "epoch": 5} {"train_loss": -0.779710054397583, "global_step": 246, "epoch": 5} {"train_loss": -0.7909900546073914, "global_step": 247, "epoch": 5} {"train_loss": -0.8286511898040771, "global_step": 248, "epoch": 5} {"train_loss": -0.8088642358779907, "global_step": 249, "epoch": 5} {"train_loss": -0.7676597237586975, "global_step": 250, "epoch": 5} {"train_loss": -0.7049812944162459, "global_step": 251, "epoch": 5, "val_loss": 3072183.75} {"train_loss": -0.7677528858184814, "global_step": 252, "epoch": 6} {"train_loss": -0.8330885767936707, "global_step": 253, "epoch": 6} {"train_loss": -0.7743661403656006, "global_step": 254, "epoch": 6} {"train_loss": -0.8442385196685791, "global_step": 255, "epoch": 6} {"train_loss": -0.7232406139373779, "global_step": 256, "epoch": 6} {"train_loss": -0.8101706504821777, "global_step": 257, "epoch": 6} {"train_loss": -0.7729748487472534, "global_step": 258, "epoch": 6} {"train_loss": -0.916092038154602, "global_step": 259, "epoch": 6} {"train_loss": -0.8380815982818604, "global_step": 260, "epoch": 6} {"train_loss": -0.7872966527938843, "global_step": 261, "epoch": 6} {"train_loss": -0.8740889430046082, "global_step": 262, "epoch": 6} {"train_loss": -0.8203660249710083, "global_step": 263, "epoch": 6} {"train_loss": -0.8131096959114075, "global_step": 264, "epoch": 6} {"train_loss": -0.8422027826309204, "global_step": 265, "epoch": 6} {"train_loss": -0.7853728532791138, "global_step": 266, "epoch": 6} {"train_loss": -0.8148059844970703, "global_step": 267, "epoch": 6} {"train_loss": -0.9059722423553467, "global_step": 268, "epoch": 6} {"train_loss": -0.8670823574066162, "global_step": 269, "epoch": 6} {"train_loss": -0.7838895916938782, "global_step": 270, "epoch": 6} {"train_loss": -1.0304300785064697, "global_step": 271, "epoch": 6} {"train_loss": -0.8645247220993042, "global_step": 272, "epoch": 6} {"train_loss": -0.8903625011444092, "global_step": 273, "epoch": 6} {"train_loss": -0.8467745780944824, "global_step": 274, "epoch": 6} {"train_loss": -0.9435306787490845, "global_step": 275, "epoch": 6} {"train_loss": -0.981721818447113, "global_step": 276, "epoch": 6} {"train_loss": -0.9157743453979492, "global_step": 277, "epoch": 6} {"train_loss": -0.903809666633606, "global_step": 278, "epoch": 6} {"train_loss": -0.8158130049705505, "global_step": 279, "epoch": 6} {"train_loss": -0.8601258993148804, "global_step": 280, "epoch": 6} {"train_loss": -0.8689553737640381, "global_step": 281, "epoch": 6} {"train_loss": -0.8722617626190186, "global_step": 282, "epoch": 6} {"train_loss": -0.9570367336273193, "global_step": 283, "epoch": 6} {"train_loss": -0.8006277680397034, "global_step": 284, "epoch": 6} {"train_loss": -0.8687241077423096, "global_step": 285, "epoch": 6} {"train_loss": -0.9162251949310303, "global_step": 286, "epoch": 6} {"train_loss": -0.9401922225952148, "global_step": 287, "epoch": 6} {"train_loss": -0.8801304697990417, "global_step": 288, "epoch": 6} {"train_loss": -0.8436715602874756, "global_step": 289, "epoch": 6} {"train_loss": -0.7703123688697815, "global_step": 290, "epoch": 6} {"train_loss": -0.7741301655769348, "global_step": 291, "epoch": 6} {"train_loss": -0.898124635219574, "global_step": 292, "epoch": 6} {"train_loss": -0.8559023709524245, "global_step": 293, "epoch": 6, "val_loss": 2740844.5} {"train_loss": -0.8801636695861816, "global_step": 294, "epoch": 7} {"train_loss": -0.833611011505127, "global_step": 295, "epoch": 7} {"train_loss": -0.8571834564208984, "global_step": 296, "epoch": 7} {"train_loss": -0.9283109903335571, "global_step": 297, "epoch": 7} {"train_loss": -0.8870270848274231, "global_step": 298, "epoch": 7} {"train_loss": -1.0007643699645996, "global_step": 299, "epoch": 7} {"train_loss": -0.9218206405639648, "global_step": 300, "epoch": 7} {"train_loss": -1.0015335083007812, "global_step": 301, "epoch": 7} {"train_loss": -0.9272891283035278, "global_step": 302, "epoch": 7} {"train_loss": -0.9101675748825073, "global_step": 303, "epoch": 7} {"train_loss": -0.9671788811683655, "global_step": 304, "epoch": 7} {"train_loss": -0.9475462436676025, "global_step": 305, "epoch": 7} {"train_loss": -0.9775627255439758, "global_step": 306, "epoch": 7} {"train_loss": -0.9642548561096191, "global_step": 307, "epoch": 7} {"train_loss": -1.0770106315612793, "global_step": 308, "epoch": 7} {"train_loss": -0.9750613570213318, "global_step": 309, "epoch": 7} {"train_loss": -0.9650771021842957, "global_step": 310, "epoch": 7} {"train_loss": -0.9767295122146606, "global_step": 311, "epoch": 7} {"train_loss": -1.1097497940063477, "global_step": 312, "epoch": 7} {"train_loss": -0.9692240357398987, "global_step": 313, "epoch": 7} {"train_loss": -1.0487749576568604, "global_step": 314, "epoch": 7} {"train_loss": -1.0713725090026855, "global_step": 315, "epoch": 7} {"train_loss": -1.0801372528076172, "global_step": 316, "epoch": 7} {"train_loss": -0.9191031455993652, "global_step": 317, "epoch": 7} {"train_loss": -1.0260567665100098, "global_step": 318, "epoch": 7} {"train_loss": -1.1428749561309814, "global_step": 319, "epoch": 7} {"train_loss": -0.9649633169174194, "global_step": 320, "epoch": 7} {"train_loss": -0.9808555245399475, "global_step": 321, "epoch": 7} {"train_loss": -1.030362606048584, "global_step": 322, "epoch": 7} {"train_loss": -0.999401330947876, "global_step": 323, "epoch": 7} {"train_loss": -0.9857748746871948, "global_step": 324, "epoch": 7} {"train_loss": -1.008439302444458, "global_step": 325, "epoch": 7} {"train_loss": -1.1028683185577393, "global_step": 326, "epoch": 7} {"train_loss": -1.0322726964950562, "global_step": 327, "epoch": 7} {"train_loss": -1.0479092597961426, "global_step": 328, "epoch": 7} {"train_loss": -1.0631043910980225, "global_step": 329, "epoch": 7} {"train_loss": -0.968732476234436, "global_step": 330, "epoch": 7} {"train_loss": -1.0569031238555908, "global_step": 331, "epoch": 7} {"train_loss": -1.0040792226791382, "global_step": 332, "epoch": 7} {"train_loss": -0.9931032061576843, "global_step": 333, "epoch": 7} {"train_loss": -1.0570714473724365, "global_step": 334, "epoch": 7} {"train_loss": -0.9953457741510301, "global_step": 335, "epoch": 7, "val_loss": 2440352.5} {"train_loss": -1.0269417762756348, "global_step": 336, "epoch": 8} {"train_loss": -1.107823133468628, "global_step": 337, "epoch": 8} {"train_loss": -0.9308358430862427, "global_step": 338, "epoch": 8} {"train_loss": -0.9716522693634033, "global_step": 339, "epoch": 8} {"train_loss": -1.012400507926941, "global_step": 340, "epoch": 8} {"train_loss": -1.1943142414093018, "global_step": 341, "epoch": 8} {"train_loss": -1.0173662900924683, "global_step": 342, "epoch": 8} {"train_loss": -0.9760974645614624, "global_step": 343, "epoch": 8} {"train_loss": -1.024300456047058, "global_step": 344, "epoch": 8} {"train_loss": -1.0906920433044434, "global_step": 345, "epoch": 8} {"train_loss": -1.046409010887146, "global_step": 346, "epoch": 8} {"train_loss": -1.2421398162841797, "global_step": 347, "epoch": 8} {"train_loss": -1.0714359283447266, "global_step": 348, "epoch": 8} {"train_loss": -1.0980501174926758, "global_step": 349, "epoch": 8} {"train_loss": -1.0782040357589722, "global_step": 350, "epoch": 8} {"train_loss": -1.0738847255706787, "global_step": 351, "epoch": 8} {"train_loss": -1.0885412693023682, "global_step": 352, "epoch": 8} {"train_loss": -1.0727753639221191, "global_step": 353, "epoch": 8} {"train_loss": -1.1193382740020752, "global_step": 354, "epoch": 8} {"train_loss": -1.0774023532867432, "global_step": 355, "epoch": 8} {"train_loss": -1.1412780284881592, "global_step": 356, "epoch": 8} {"train_loss": -1.0813512802124023, "global_step": 357, "epoch": 8} {"train_loss": -1.1344443559646606, "global_step": 358, "epoch": 8} {"train_loss": -1.2107584476470947, "global_step": 359, "epoch": 8} {"train_loss": -1.1687369346618652, "global_step": 360, "epoch": 8} {"train_loss": -1.1508245468139648, "global_step": 361, "epoch": 8} {"train_loss": -1.0508489608764648, "global_step": 362, "epoch": 8} {"train_loss": -1.0869683027267456, "global_step": 363, "epoch": 8} {"train_loss": -1.0073407888412476, "global_step": 364, "epoch": 8} {"train_loss": -1.0632717609405518, "global_step": 365, "epoch": 8} {"train_loss": -1.1473267078399658, "global_step": 366, "epoch": 8} {"train_loss": -1.2473036050796509, "global_step": 367, "epoch": 8} {"train_loss": -1.0961823463439941, "global_step": 368, "epoch": 8} {"train_loss": -1.0680121183395386, "global_step": 369, "epoch": 8} {"train_loss": -1.2371790409088135, "global_step": 370, "epoch": 8} {"train_loss": -1.02931547164917, "global_step": 371, "epoch": 8} {"train_loss": -1.1067306995391846, "global_step": 372, "epoch": 8} {"train_loss": -1.1947262287139893, "global_step": 373, "epoch": 8} {"train_loss": -1.0619901418685913, "global_step": 374, "epoch": 8} {"train_loss": -1.2582939863204956, "global_step": 375, "epoch": 8} {"train_loss": -1.14365816116333, "global_step": 376, "epoch": 8} {"train_loss": -1.1040310150101071, "global_step": 377, "epoch": 8, "val_loss": 2222747.0} {"train_loss": -1.1444389820098877, "global_step": 378, "epoch": 9} {"train_loss": -1.197512149810791, "global_step": 379, "epoch": 9} {"train_loss": -1.2341461181640625, "global_step": 380, "epoch": 9} {"train_loss": -1.1751587390899658, "global_step": 381, "epoch": 9} {"train_loss": -1.1838610172271729, "global_step": 382, "epoch": 9} {"train_loss": -1.2317030429840088, "global_step": 383, "epoch": 9} {"train_loss": -1.2556369304656982, "global_step": 384, "epoch": 9} {"train_loss": -1.2298552989959717, "global_step": 385, "epoch": 9} {"train_loss": -1.234473466873169, "global_step": 386, "epoch": 9} {"train_loss": -1.0383734703063965, "global_step": 387, "epoch": 9} {"train_loss": -1.2337359189987183, "global_step": 388, "epoch": 9} {"train_loss": -1.3096781969070435, "global_step": 389, "epoch": 9} {"train_loss": -1.2012639045715332, "global_step": 390, "epoch": 9} {"train_loss": -1.0288702249526978, "global_step": 391, "epoch": 9} {"train_loss": -1.2471811771392822, "global_step": 392, "epoch": 9} {"train_loss": -1.1129939556121826, "global_step": 393, "epoch": 9} {"train_loss": -1.334872841835022, "global_step": 394, "epoch": 9} {"train_loss": -1.1961560249328613, "global_step": 395, "epoch": 9} {"train_loss": -1.2598689794540405, "global_step": 396, "epoch": 9} {"train_loss": -1.3014721870422363, "global_step": 397, "epoch": 9} {"train_loss": -1.1293256282806396, "global_step": 398, "epoch": 9} {"train_loss": -1.2426881790161133, "global_step": 399, "epoch": 9} {"train_loss": -1.238468885421753, "global_step": 400, "epoch": 9} {"train_loss": -1.392366647720337, "global_step": 401, "epoch": 9} {"train_loss": -1.2501864433288574, "global_step": 402, "epoch": 9} {"train_loss": -1.318760633468628, "global_step": 403, "epoch": 9} {"train_loss": -1.2639076709747314, "global_step": 404, "epoch": 9} {"train_loss": -1.2471678256988525, "global_step": 405, "epoch": 9} {"train_loss": -1.2585229873657227, "global_step": 406, "epoch": 9} {"train_loss": -1.239696979522705, "global_step": 407, "epoch": 9} {"train_loss": -1.3652317523956299, "global_step": 408, "epoch": 9} {"train_loss": -1.2548327445983887, "global_step": 409, "epoch": 9} {"train_loss": -1.4465303421020508, "global_step": 410, "epoch": 9} {"train_loss": -1.391021728515625, "global_step": 411, "epoch": 9} {"train_loss": -1.288896083831787, "global_step": 412, "epoch": 9} {"train_loss": -1.2407525777816772, "global_step": 413, "epoch": 9} {"train_loss": -1.1592848300933838, "global_step": 414, "epoch": 9} {"train_loss": -1.3462532758712769, "global_step": 415, "epoch": 9} {"train_loss": -1.2912002801895142, "global_step": 416, "epoch": 9} {"train_loss": -1.2497810125350952, "global_step": 417, "epoch": 9} {"train_loss": -1.3591816425323486, "global_step": 418, "epoch": 9} {"train_loss": -1.2483103984878177, "global_step": 419, "epoch": 9, "val_loss": 2044191.5} {"train_loss": -1.250596046447754, "global_step": 420, "epoch": 10} {"train_loss": -1.2310998439788818, "global_step": 421, "epoch": 10} {"train_loss": -1.1537959575653076, "global_step": 422, "epoch": 10} {"train_loss": -1.3494572639465332, "global_step": 423, "epoch": 10} {"train_loss": -1.2565239667892456, "global_step": 424, "epoch": 10} {"train_loss": -1.342287302017212, "global_step": 425, "epoch": 10} {"train_loss": -1.2102762460708618, "global_step": 426, "epoch": 10} {"train_loss": -1.3302000761032104, "global_step": 427, "epoch": 10} {"train_loss": -1.341352939605713, "global_step": 428, "epoch": 10} {"train_loss": -1.2966498136520386, "global_step": 429, "epoch": 10} {"train_loss": -1.3154375553131104, "global_step": 430, "epoch": 10} {"train_loss": -1.3660411834716797, "global_step": 431, "epoch": 10} {"train_loss": -1.405604600906372, "global_step": 432, "epoch": 10} {"train_loss": -1.458922028541565, "global_step": 433, "epoch": 10} {"train_loss": -1.217618465423584, "global_step": 434, "epoch": 10} {"train_loss": -1.3546596765518188, "global_step": 435, "epoch": 10} {"train_loss": -1.364830732345581, "global_step": 436, "epoch": 10} {"train_loss": -1.3876609802246094, "global_step": 437, "epoch": 10} {"train_loss": -1.339396595954895, "global_step": 438, "epoch": 10} {"train_loss": -1.2196861505508423, "global_step": 439, "epoch": 10} {"train_loss": -1.368074893951416, "global_step": 440, "epoch": 10} {"train_loss": -1.3937968015670776, "global_step": 441, "epoch": 10} {"train_loss": -1.3843400478363037, "global_step": 442, "epoch": 10} {"train_loss": -1.4984203577041626, "global_step": 443, "epoch": 10} {"train_loss": -1.3639111518859863, "global_step": 444, "epoch": 10} {"train_loss": -1.4456483125686646, "global_step": 445, "epoch": 10} {"train_loss": -1.3075627088546753, "global_step": 446, "epoch": 10} {"train_loss": -1.282704472541809, "global_step": 447, "epoch": 10} {"train_loss": -1.3941161632537842, "global_step": 448, "epoch": 10} {"train_loss": -1.384602665901184, "global_step": 449, "epoch": 10} {"train_loss": -1.2594677209854126, "global_step": 450, "epoch": 10} {"train_loss": -1.479688048362732, "global_step": 451, "epoch": 10} {"train_loss": -1.2443797588348389, "global_step": 452, "epoch": 10} {"train_loss": -1.411789059638977, "global_step": 453, "epoch": 10} {"train_loss": -1.350239634513855, "global_step": 454, "epoch": 10} {"train_loss": -1.5595097541809082, "global_step": 455, "epoch": 10} {"train_loss": -1.4426820278167725, "global_step": 456, "epoch": 10} {"train_loss": -1.3580923080444336, "global_step": 457, "epoch": 10} {"train_loss": -1.481581211090088, "global_step": 458, "epoch": 10} {"train_loss": -1.3386905193328857, "global_step": 459, "epoch": 10} {"train_loss": -1.351120948791504, "global_step": 460, "epoch": 10} {"train_loss": -1.3508549644833518, "global_step": 461, "epoch": 10, "val_loss": 1863458.125} {"train_loss": -1.306554913520813, "global_step": 462, "epoch": 11} {"train_loss": -1.4484879970550537, "global_step": 463, "epoch": 11} {"train_loss": -1.3465518951416016, "global_step": 464, "epoch": 11} {"train_loss": -1.4785051345825195, "global_step": 465, "epoch": 11} {"train_loss": -1.487121820449829, "global_step": 466, "epoch": 11} {"train_loss": -1.482191801071167, "global_step": 467, "epoch": 11} {"train_loss": -1.3024892807006836, "global_step": 468, "epoch": 11} {"train_loss": -1.4418343305587769, "global_step": 469, "epoch": 11} {"train_loss": -1.6234180927276611, "global_step": 470, "epoch": 11} {"train_loss": -1.3347359895706177, "global_step": 471, "epoch": 11} {"train_loss": -1.3925774097442627, "global_step": 472, "epoch": 11} {"train_loss": -1.4596632719039917, "global_step": 473, "epoch": 11} {"train_loss": -1.4679216146469116, "global_step": 474, "epoch": 11} {"train_loss": -1.2802152633666992, "global_step": 475, "epoch": 11} {"train_loss": -1.45879065990448, "global_step": 476, "epoch": 11} {"train_loss": -1.4979428052902222, "global_step": 477, "epoch": 11} {"train_loss": -1.304030179977417, "global_step": 478, "epoch": 11} {"train_loss": -1.371572494506836, "global_step": 479, "epoch": 11} {"train_loss": -1.3436243534088135, "global_step": 480, "epoch": 11} {"train_loss": -1.5801849365234375, "global_step": 481, "epoch": 11} {"train_loss": -1.4256279468536377, "global_step": 482, "epoch": 11} {"train_loss": -1.481343150138855, "global_step": 483, "epoch": 11} {"train_loss": -1.3790156841278076, "global_step": 484, "epoch": 11} {"train_loss": -1.4525978565216064, "global_step": 485, "epoch": 11} {"train_loss": -1.5166528224945068, "global_step": 486, "epoch": 11} {"train_loss": -1.4576647281646729, "global_step": 487, "epoch": 11} {"train_loss": -1.4970574378967285, "global_step": 488, "epoch": 11} {"train_loss": -1.615657925605774, "global_step": 489, "epoch": 11} {"train_loss": -1.453589677810669, "global_step": 490, "epoch": 11} {"train_loss": -1.5954670906066895, "global_step": 491, "epoch": 11} {"train_loss": -1.46622896194458, "global_step": 492, "epoch": 11} {"train_loss": -1.5020673274993896, "global_step": 493, "epoch": 11} {"train_loss": -1.5533788204193115, "global_step": 494, "epoch": 11} {"train_loss": -1.363495111465454, "global_step": 495, "epoch": 11} {"train_loss": -1.4313418865203857, "global_step": 496, "epoch": 11} {"train_loss": -1.4857481718063354, "global_step": 497, "epoch": 11} {"train_loss": -1.3729904890060425, "global_step": 498, "epoch": 11} {"train_loss": -1.5095691680908203, "global_step": 499, "epoch": 11} {"train_loss": -1.5809913873672485, "global_step": 500, "epoch": 11} {"train_loss": -1.5198793411254883, "global_step": 501, "epoch": 11} {"train_loss": -1.554933786392212, "global_step": 502, "epoch": 11} {"train_loss": -1.457343822433835, "global_step": 503, "epoch": 11, "val_loss": 1742416.125} {"train_loss": -1.489402413368225, "global_step": 504, "epoch": 12} {"train_loss": -1.4105128049850464, "global_step": 505, "epoch": 12} {"train_loss": -1.4235687255859375, "global_step": 506, "epoch": 12} {"train_loss": -1.4600543975830078, "global_step": 507, "epoch": 12} {"train_loss": -1.4342808723449707, "global_step": 508, "epoch": 12} {"train_loss": -1.4393939971923828, "global_step": 509, "epoch": 12} {"train_loss": -1.6019535064697266, "global_step": 510, "epoch": 12} {"train_loss": -1.5130178928375244, "global_step": 511, "epoch": 12} {"train_loss": -1.4558236598968506, "global_step": 512, "epoch": 12} {"train_loss": -1.4848861694335938, "global_step": 513, "epoch": 12} {"train_loss": -1.5190035104751587, "global_step": 514, "epoch": 12} {"train_loss": -1.3237333297729492, "global_step": 515, "epoch": 12} {"train_loss": -1.526397466659546, "global_step": 516, "epoch": 12} {"train_loss": -1.4740307331085205, "global_step": 517, "epoch": 12} {"train_loss": -1.6026420593261719, "global_step": 518, "epoch": 12} {"train_loss": -1.4149763584136963, "global_step": 519, "epoch": 12} {"train_loss": -1.466942310333252, "global_step": 520, "epoch": 12} {"train_loss": -1.5494441986083984, "global_step": 521, "epoch": 12} {"train_loss": -1.436628818511963, "global_step": 522, "epoch": 12} {"train_loss": -1.5910414457321167, "global_step": 523, "epoch": 12} {"train_loss": -1.6341606378555298, "global_step": 524, "epoch": 12} {"train_loss": -1.53253173828125, "global_step": 525, "epoch": 12} {"train_loss": -1.6197154521942139, "global_step": 526, "epoch": 12} {"train_loss": -1.535595178604126, "global_step": 527, "epoch": 12} {"train_loss": -1.5538685321807861, "global_step": 528, "epoch": 12} {"train_loss": -1.525789737701416, "global_step": 529, "epoch": 12} {"train_loss": -1.6404380798339844, "global_step": 530, "epoch": 12} {"train_loss": -1.5274118185043335, "global_step": 531, "epoch": 12} {"train_loss": -1.630211591720581, "global_step": 532, "epoch": 12} {"train_loss": -1.4418660402297974, "global_step": 533, "epoch": 12} {"train_loss": -1.6709972620010376, "global_step": 534, "epoch": 12} {"train_loss": -1.5688111782073975, "global_step": 535, "epoch": 12} {"train_loss": -1.5853962898254395, "global_step": 536, "epoch": 12} {"train_loss": -1.5860165357589722, "global_step": 537, "epoch": 12} {"train_loss": -1.6191320419311523, "global_step": 538, "epoch": 12} {"train_loss": -1.4721238613128662, "global_step": 539, "epoch": 12} {"train_loss": -1.5152714252471924, "global_step": 540, "epoch": 12} {"train_loss": -1.510457158088684, "global_step": 541, "epoch": 12} {"train_loss": -1.615508794784546, "global_step": 542, "epoch": 12} {"train_loss": -1.449128270149231, "global_step": 543, "epoch": 12} {"train_loss": -1.561061143875122, "global_step": 544, "epoch": 12} {"train_loss": -1.5241436305500211, "global_step": 545, "epoch": 12, "val_loss": 1626538.375} {"train_loss": -1.551013708114624, "global_step": 546, "epoch": 13} {"train_loss": -1.5854101181030273, "global_step": 547, "epoch": 13} {"train_loss": -1.6996575593948364, "global_step": 548, "epoch": 13} {"train_loss": -1.689382553100586, "global_step": 549, "epoch": 13} {"train_loss": -1.5634208917617798, "global_step": 550, "epoch": 13} {"train_loss": -1.6266810894012451, "global_step": 551, "epoch": 13} {"train_loss": -1.5814762115478516, "global_step": 552, "epoch": 13} {"train_loss": -1.5268458127975464, "global_step": 553, "epoch": 13} {"train_loss": -1.6183159351348877, "global_step": 554, "epoch": 13} {"train_loss": -1.530668020248413, "global_step": 555, "epoch": 13} {"train_loss": -1.5341522693634033, "global_step": 556, "epoch": 13} {"train_loss": -1.4311418533325195, "global_step": 557, "epoch": 13} {"train_loss": -1.5822631120681763, "global_step": 558, "epoch": 13} {"train_loss": -1.5800528526306152, "global_step": 559, "epoch": 13} {"train_loss": -1.547757625579834, "global_step": 560, "epoch": 13} {"train_loss": -1.732791781425476, "global_step": 561, "epoch": 13} {"train_loss": -1.6338942050933838, "global_step": 562, "epoch": 13} {"train_loss": -1.5922044515609741, "global_step": 563, "epoch": 13} {"train_loss": -1.6136457920074463, "global_step": 564, "epoch": 13} {"train_loss": -1.6545552015304565, "global_step": 565, "epoch": 13} {"train_loss": -1.741363763809204, "global_step": 566, "epoch": 13} {"train_loss": -1.7801272869110107, "global_step": 567, "epoch": 13} {"train_loss": -1.608919620513916, "global_step": 568, "epoch": 13} {"train_loss": -1.6024527549743652, "global_step": 569, "epoch": 13} {"train_loss": -1.5014728307724, "global_step": 570, "epoch": 13} {"train_loss": -1.6660466194152832, "global_step": 571, "epoch": 13} {"train_loss": -1.5212068557739258, "global_step": 572, "epoch": 13} {"train_loss": -1.5756981372833252, "global_step": 573, "epoch": 13} {"train_loss": -1.6716411113739014, "global_step": 574, "epoch": 13} {"train_loss": -1.6261489391326904, "global_step": 575, "epoch": 13} {"train_loss": -1.8484046459197998, "global_step": 576, "epoch": 13} {"train_loss": -1.620816946029663, "global_step": 577, "epoch": 13} {"train_loss": -1.6858248710632324, "global_step": 578, "epoch": 13} {"train_loss": -1.6100986003875732, "global_step": 579, "epoch": 13} {"train_loss": -1.7420759201049805, "global_step": 580, "epoch": 13} {"train_loss": -1.6247080564498901, "global_step": 581, "epoch": 13} {"train_loss": -1.7213096618652344, "global_step": 582, "epoch": 13} {"train_loss": -1.6840846538543701, "global_step": 583, "epoch": 13} {"train_loss": -1.6459851264953613, "global_step": 584, "epoch": 13} {"train_loss": -1.8058526515960693, "global_step": 585, "epoch": 13} {"train_loss": -1.6149027347564697, "global_step": 586, "epoch": 13} {"train_loss": -1.6276639387721108, "global_step": 587, "epoch": 13, "val_loss": 1524590.75} {"train_loss": -1.7450790405273438, "global_step": 588, "epoch": 14} {"train_loss": -1.7169805765151978, "global_step": 589, "epoch": 14} {"train_loss": -1.7191470861434937, "global_step": 590, "epoch": 14} {"train_loss": -1.6721274852752686, "global_step": 591, "epoch": 14} {"train_loss": -1.625706672668457, "global_step": 592, "epoch": 14} {"train_loss": -1.6271835565567017, "global_step": 593, "epoch": 14} {"train_loss": -1.7571542263031006, "global_step": 594, "epoch": 14} {"train_loss": -1.5698299407958984, "global_step": 595, "epoch": 14} {"train_loss": -1.5704853534698486, "global_step": 596, "epoch": 14} {"train_loss": -1.729964017868042, "global_step": 597, "epoch": 14} {"train_loss": -1.7181298732757568, "global_step": 598, "epoch": 14} {"train_loss": -1.5193774700164795, "global_step": 599, "epoch": 14} {"train_loss": -1.7600033283233643, "global_step": 600, "epoch": 14} {"train_loss": -1.6100261211395264, "global_step": 601, "epoch": 14} {"train_loss": -1.7210357189178467, "global_step": 602, "epoch": 14} {"train_loss": -1.6267049312591553, "global_step": 603, "epoch": 14} {"train_loss": -1.607832431793213, "global_step": 604, "epoch": 14} {"train_loss": -1.6294105052947998, "global_step": 605, "epoch": 14} {"train_loss": -1.6886022090911865, "global_step": 606, "epoch": 14} {"train_loss": -1.6462825536727905, "global_step": 607, "epoch": 14} {"train_loss": -1.7294942140579224, "global_step": 608, "epoch": 14} {"train_loss": -1.7899948358535767, "global_step": 609, "epoch": 14} {"train_loss": -1.6973803043365479, "global_step": 610, "epoch": 14} {"train_loss": -1.677577257156372, "global_step": 611, "epoch": 14} {"train_loss": -1.7448339462280273, "global_step": 612, "epoch": 14} {"train_loss": -1.6889920234680176, "global_step": 613, "epoch": 14} {"train_loss": -1.8292968273162842, "global_step": 614, "epoch": 14} {"train_loss": -1.768269419670105, "global_step": 615, "epoch": 14} {"train_loss": -1.7534617185592651, "global_step": 616, "epoch": 14} {"train_loss": -1.8045766353607178, "global_step": 617, "epoch": 14} {"train_loss": -1.7219526767730713, "global_step": 618, "epoch": 14} {"train_loss": -1.6599946022033691, "global_step": 619, "epoch": 14} {"train_loss": -1.703810214996338, "global_step": 620, "epoch": 14} {"train_loss": -1.7338823080062866, "global_step": 621, "epoch": 14} {"train_loss": -1.733104944229126, "global_step": 622, "epoch": 14} {"train_loss": -1.6353861093521118, "global_step": 623, "epoch": 14} {"train_loss": -1.7320201396942139, "global_step": 624, "epoch": 14} {"train_loss": -1.737518310546875, "global_step": 625, "epoch": 14} {"train_loss": -1.7797890901565552, "global_step": 626, "epoch": 14} {"train_loss": -1.8446755409240723, "global_step": 627, "epoch": 14} {"train_loss": -1.7171032428741455, "global_step": 628, "epoch": 14} {"train_loss": -1.7041377794174921, "global_step": 629, "epoch": 14, "val_loss": 1422848.5} {"train_loss": -1.6718730926513672, "global_step": 630, "epoch": 15} {"train_loss": -1.7976211309432983, "global_step": 631, "epoch": 15} {"train_loss": -1.8683642148971558, "global_step": 632, "epoch": 15} {"train_loss": -1.6929614543914795, "global_step": 633, "epoch": 15} {"train_loss": -1.7451828718185425, "global_step": 634, "epoch": 15} {"train_loss": -1.7082555294036865, "global_step": 635, "epoch": 15} {"train_loss": -1.71922767162323, "global_step": 636, "epoch": 15} {"train_loss": -1.767045497894287, "global_step": 637, "epoch": 15} {"train_loss": -1.871891975402832, "global_step": 638, "epoch": 15} {"train_loss": -1.881174921989441, "global_step": 639, "epoch": 15} {"train_loss": -1.744147777557373, "global_step": 640, "epoch": 15} {"train_loss": -1.8344182968139648, "global_step": 641, "epoch": 15} {"train_loss": -1.866344690322876, "global_step": 642, "epoch": 15} {"train_loss": -1.7164108753204346, "global_step": 643, "epoch": 15} {"train_loss": -1.7331891059875488, "global_step": 644, "epoch": 15} {"train_loss": -1.8752906322479248, "global_step": 645, "epoch": 15} {"train_loss": -1.8141082525253296, "global_step": 646, "epoch": 15} {"train_loss": -1.8346748352050781, "global_step": 647, "epoch": 15} {"train_loss": -1.7272658348083496, "global_step": 648, "epoch": 15} {"train_loss": -1.788329005241394, "global_step": 649, "epoch": 15} {"train_loss": -1.8588056564331055, "global_step": 650, "epoch": 15} {"train_loss": -1.8279595375061035, "global_step": 651, "epoch": 15} {"train_loss": -1.715327501296997, "global_step": 652, "epoch": 15} {"train_loss": -1.9164704084396362, "global_step": 653, "epoch": 15} {"train_loss": -1.9389240741729736, "global_step": 654, "epoch": 15} {"train_loss": -1.805382490158081, "global_step": 655, "epoch": 15} {"train_loss": -1.8279825448989868, "global_step": 656, "epoch": 15} {"train_loss": -1.7396221160888672, "global_step": 657, "epoch": 15} {"train_loss": -1.801376223564148, "global_step": 658, "epoch": 15} {"train_loss": -1.9191824197769165, "global_step": 659, "epoch": 15} {"train_loss": -1.791572093963623, "global_step": 660, "epoch": 15} {"train_loss": -1.7250102758407593, "global_step": 661, "epoch": 15} {"train_loss": -1.9182085990905762, "global_step": 662, "epoch": 15} {"train_loss": -1.7368717193603516, "global_step": 663, "epoch": 15} {"train_loss": -1.7573636770248413, "global_step": 664, "epoch": 15} {"train_loss": -1.7302253246307373, "global_step": 665, "epoch": 15} {"train_loss": -1.8749980926513672, "global_step": 666, "epoch": 15} {"train_loss": -1.7647632360458374, "global_step": 667, "epoch": 15} {"train_loss": -1.8660775423049927, "global_step": 668, "epoch": 15} {"train_loss": -1.9102885723114014, "global_step": 669, "epoch": 15} {"train_loss": -1.8474968671798706, "global_step": 670, "epoch": 15} {"train_loss": -1.8043163106555031, "global_step": 671, "epoch": 15, "val_loss": 1341478.375} {"train_loss": -1.7569758892059326, "global_step": 672, "epoch": 16} {"train_loss": -1.8629846572875977, "global_step": 673, "epoch": 16} {"train_loss": -1.9465398788452148, "global_step": 674, "epoch": 16} {"train_loss": -1.8053005933761597, "global_step": 675, "epoch": 16} {"train_loss": -1.8220787048339844, "global_step": 676, "epoch": 16} {"train_loss": -1.9385883808135986, "global_step": 677, "epoch": 16} {"train_loss": -1.7011796236038208, "global_step": 678, "epoch": 16} {"train_loss": -1.8398826122283936, "global_step": 679, "epoch": 16} {"train_loss": -1.7925384044647217, "global_step": 680, "epoch": 16} {"train_loss": -1.9834988117218018, "global_step": 681, "epoch": 16} {"train_loss": -1.7474093437194824, "global_step": 682, "epoch": 16} {"train_loss": -1.950938105583191, "global_step": 683, "epoch": 16} {"train_loss": -1.8513017892837524, "global_step": 684, "epoch": 16} {"train_loss": -1.9415403604507446, "global_step": 685, "epoch": 16} {"train_loss": -1.912156343460083, "global_step": 686, "epoch": 16} {"train_loss": -1.7724671363830566, "global_step": 687, "epoch": 16} {"train_loss": -1.8177253007888794, "global_step": 688, "epoch": 16} {"train_loss": -1.8728625774383545, "global_step": 689, "epoch": 16} {"train_loss": -1.7564899921417236, "global_step": 690, "epoch": 16} {"train_loss": -2.016852378845215, "global_step": 691, "epoch": 16} {"train_loss": -1.7543197870254517, "global_step": 692, "epoch": 16} {"train_loss": -1.928523063659668, "global_step": 693, "epoch": 16} {"train_loss": -1.9847850799560547, "global_step": 694, "epoch": 16} {"train_loss": -1.7845908403396606, "global_step": 695, "epoch": 16} {"train_loss": -1.9260025024414062, "global_step": 696, "epoch": 16} {"train_loss": -1.8943705558776855, "global_step": 697, "epoch": 16} {"train_loss": -1.912219762802124, "global_step": 698, "epoch": 16} {"train_loss": -1.975909948348999, "global_step": 699, "epoch": 16} {"train_loss": -1.9693875312805176, "global_step": 700, "epoch": 16} {"train_loss": -1.9546525478363037, "global_step": 701, "epoch": 16} {"train_loss": -1.9649478197097778, "global_step": 702, "epoch": 16} {"train_loss": -1.851022481918335, "global_step": 703, "epoch": 16} {"train_loss": -1.985398292541504, "global_step": 704, "epoch": 16} {"train_loss": -1.8472576141357422, "global_step": 705, "epoch": 16} {"train_loss": -2.015814781188965, "global_step": 706, "epoch": 16} {"train_loss": -1.898655652999878, "global_step": 707, "epoch": 16} {"train_loss": -1.9274115562438965, "global_step": 708, "epoch": 16} {"train_loss": -1.8850929737091064, "global_step": 709, "epoch": 16} {"train_loss": -1.9989569187164307, "global_step": 710, "epoch": 16} {"train_loss": -1.8654574155807495, "global_step": 711, "epoch": 16} {"train_loss": -1.926833152770996, "global_step": 712, "epoch": 16} {"train_loss": -1.8876495900608243, "global_step": 713, "epoch": 16, "val_loss": 1256056.75} {"train_loss": -1.8783912658691406, "global_step": 714, "epoch": 17} {"train_loss": -1.941756248474121, "global_step": 715, "epoch": 17} {"train_loss": -2.020313262939453, "global_step": 716, "epoch": 17} {"train_loss": -1.840309500694275, "global_step": 717, "epoch": 17} {"train_loss": -1.9525624513626099, "global_step": 718, "epoch": 17} {"train_loss": -2.0157060623168945, "global_step": 719, "epoch": 17} {"train_loss": -1.9663317203521729, "global_step": 720, "epoch": 17} {"train_loss": -1.995664119720459, "global_step": 721, "epoch": 17} {"train_loss": -1.8640162944793701, "global_step": 722, "epoch": 17} {"train_loss": -1.961695909500122, "global_step": 723, "epoch": 17} {"train_loss": -1.9240676164627075, "global_step": 724, "epoch": 17} {"train_loss": -1.9855804443359375, "global_step": 725, "epoch": 17} {"train_loss": -2.032189130783081, "global_step": 726, "epoch": 17} {"train_loss": -1.8875170946121216, "global_step": 727, "epoch": 17} {"train_loss": -1.9001405239105225, "global_step": 728, "epoch": 17} {"train_loss": -2.0208206176757812, "global_step": 729, "epoch": 17} {"train_loss": -1.8774018287658691, "global_step": 730, "epoch": 17} {"train_loss": -1.97014319896698, "global_step": 731, "epoch": 17} {"train_loss": -1.8957452774047852, "global_step": 732, "epoch": 17} {"train_loss": -1.8928635120391846, "global_step": 733, "epoch": 17} {"train_loss": -1.960076093673706, "global_step": 734, "epoch": 17} {"train_loss": -1.9476635456085205, "global_step": 735, "epoch": 17} {"train_loss": -1.943306803703308, "global_step": 736, "epoch": 17} {"train_loss": -1.9611315727233887, "global_step": 737, "epoch": 17} {"train_loss": -1.9153012037277222, "global_step": 738, "epoch": 17} {"train_loss": -1.8706475496292114, "global_step": 739, "epoch": 17} {"train_loss": -2.071948528289795, "global_step": 740, "epoch": 17} {"train_loss": -2.013455390930176, "global_step": 741, "epoch": 17} {"train_loss": -2.0714621543884277, "global_step": 742, "epoch": 17} {"train_loss": -2.0214385986328125, "global_step": 743, "epoch": 17} {"train_loss": -1.9724396467208862, "global_step": 744, "epoch": 17} {"train_loss": -1.9284456968307495, "global_step": 745, "epoch": 17} {"train_loss": -1.821840524673462, "global_step": 746, "epoch": 17} {"train_loss": -1.911346673965454, "global_step": 747, "epoch": 17} {"train_loss": -1.9617953300476074, "global_step": 748, "epoch": 17} {"train_loss": -1.9079785346984863, "global_step": 749, "epoch": 17} {"train_loss": -2.059720277786255, "global_step": 750, "epoch": 17} {"train_loss": -1.9457522630691528, "global_step": 751, "epoch": 17} {"train_loss": -1.8840868473052979, "global_step": 752, "epoch": 17} {"train_loss": -1.900216817855835, "global_step": 753, "epoch": 17} {"train_loss": -1.8534760475158691, "global_step": 754, "epoch": 17} {"train_loss": -1.9446396004585993, "global_step": 755, "epoch": 17, "val_loss": 1189641.75} {"train_loss": -2.01389217376709, "global_step": 756, "epoch": 18} {"train_loss": -1.9173791408538818, "global_step": 757, "epoch": 18} {"train_loss": -1.9071261882781982, "global_step": 758, "epoch": 18} {"train_loss": -1.838620901107788, "global_step": 759, "epoch": 18} {"train_loss": -1.9042682647705078, "global_step": 760, "epoch": 18} {"train_loss": -1.8530348539352417, "global_step": 761, "epoch": 18} {"train_loss": -1.927748680114746, "global_step": 762, "epoch": 18} {"train_loss": -2.071681022644043, "global_step": 763, "epoch": 18} {"train_loss": -2.051158905029297, "global_step": 764, "epoch": 18} {"train_loss": -1.8370190858840942, "global_step": 765, "epoch": 18} {"train_loss": -2.0255889892578125, "global_step": 766, "epoch": 18} {"train_loss": -1.9645854234695435, "global_step": 767, "epoch": 18} {"train_loss": -2.038078784942627, "global_step": 768, "epoch": 18} {"train_loss": -1.9993215799331665, "global_step": 769, "epoch": 18} {"train_loss": -2.0582518577575684, "global_step": 770, "epoch": 18} {"train_loss": -2.1030960083007812, "global_step": 771, "epoch": 18} {"train_loss": -2.0198421478271484, "global_step": 772, "epoch": 18} {"train_loss": -2.0361433029174805, "global_step": 773, "epoch": 18} {"train_loss": -1.922170639038086, "global_step": 774, "epoch": 18} {"train_loss": -1.9811267852783203, "global_step": 775, "epoch": 18} {"train_loss": -2.037835121154785, "global_step": 776, "epoch": 18} {"train_loss": -2.039907932281494, "global_step": 777, "epoch": 18} {"train_loss": -2.229506731033325, "global_step": 778, "epoch": 18} {"train_loss": -1.9905805587768555, "global_step": 779, "epoch": 18} {"train_loss": -1.988289475440979, "global_step": 780, "epoch": 18} {"train_loss": -2.090178966522217, "global_step": 781, "epoch": 18} {"train_loss": -2.0378782749176025, "global_step": 782, "epoch": 18} {"train_loss": -2.0440053939819336, "global_step": 783, "epoch": 18} {"train_loss": -2.0138626098632812, "global_step": 784, "epoch": 18} {"train_loss": -2.0944411754608154, "global_step": 785, "epoch": 18} {"train_loss": -1.9742178916931152, "global_step": 786, "epoch": 18} {"train_loss": -1.946266770362854, "global_step": 787, "epoch": 18} {"train_loss": -1.955256700515747, "global_step": 788, "epoch": 18} {"train_loss": -1.9978617429733276, "global_step": 789, "epoch": 18} {"train_loss": -1.9304286241531372, "global_step": 790, "epoch": 18} {"train_loss": -1.9038337469100952, "global_step": 791, "epoch": 18} {"train_loss": -1.979099988937378, "global_step": 792, "epoch": 18} {"train_loss": -1.9397571086883545, "global_step": 793, "epoch": 18} {"train_loss": -1.8782787322998047, "global_step": 794, "epoch": 18} {"train_loss": -1.8856439590454102, "global_step": 795, "epoch": 18} {"train_loss": -2.085221529006958, "global_step": 796, "epoch": 18} {"train_loss": -1.9859402832530795, "global_step": 797, "epoch": 18, "val_loss": 1134714.625} {"train_loss": -2.004728078842163, "global_step": 798, "epoch": 19} {"train_loss": -1.991495132446289, "global_step": 799, "epoch": 19} {"train_loss": -1.9089505672454834, "global_step": 800, "epoch": 19} {"train_loss": -1.9972729682922363, "global_step": 801, "epoch": 19} {"train_loss": -2.0938615798950195, "global_step": 802, "epoch": 19} {"train_loss": -2.041065216064453, "global_step": 803, "epoch": 19} {"train_loss": -1.9740233421325684, "global_step": 804, "epoch": 19} {"train_loss": -2.0763585567474365, "global_step": 805, "epoch": 19} {"train_loss": -2.111443281173706, "global_step": 806, "epoch": 19} {"train_loss": -1.9365509748458862, "global_step": 807, "epoch": 19} {"train_loss": -2.0999927520751953, "global_step": 808, "epoch": 19} {"train_loss": -2.0496366024017334, "global_step": 809, "epoch": 19} {"train_loss": -2.0941781997680664, "global_step": 810, "epoch": 19} {"train_loss": -1.9864704608917236, "global_step": 811, "epoch": 19} {"train_loss": -2.0498039722442627, "global_step": 812, "epoch": 19} {"train_loss": -2.1012675762176514, "global_step": 813, "epoch": 19} {"train_loss": -2.127495765686035, "global_step": 814, "epoch": 19} {"train_loss": -2.0756731033325195, "global_step": 815, "epoch": 19} {"train_loss": -2.184291362762451, "global_step": 816, "epoch": 19} {"train_loss": -2.0361833572387695, "global_step": 817, "epoch": 19} {"train_loss": -2.044090747833252, "global_step": 818, "epoch": 19} {"train_loss": -2.14229679107666, "global_step": 819, "epoch": 19} {"train_loss": -1.9165226221084595, "global_step": 820, "epoch": 19} {"train_loss": -1.9999643564224243, "global_step": 821, "epoch": 19} {"train_loss": -2.1005492210388184, "global_step": 822, "epoch": 19} {"train_loss": -2.059192657470703, "global_step": 823, "epoch": 19} {"train_loss": -2.1256093978881836, "global_step": 824, "epoch": 19} {"train_loss": -2.0848984718322754, "global_step": 825, "epoch": 19} {"train_loss": -2.0735039710998535, "global_step": 826, "epoch": 19} {"train_loss": -2.060237407684326, "global_step": 827, "epoch": 19} {"train_loss": -2.1358842849731445, "global_step": 828, "epoch": 19} {"train_loss": -2.1997227668762207, "global_step": 829, "epoch": 19} {"train_loss": -2.062913179397583, "global_step": 830, "epoch": 19} {"train_loss": -1.9680559635162354, "global_step": 831, "epoch": 19} {"train_loss": -2.1738781929016113, "global_step": 832, "epoch": 19} {"train_loss": -2.0940709114074707, "global_step": 833, "epoch": 19} {"train_loss": -2.1588101387023926, "global_step": 834, "epoch": 19} {"train_loss": -2.1306850910186768, "global_step": 835, "epoch": 19} {"train_loss": -2.02909517288208, "global_step": 836, "epoch": 19} {"train_loss": -2.030275344848633, "global_step": 837, "epoch": 19} {"train_loss": -2.090607166290283, "global_step": 838, "epoch": 19} {"train_loss": -2.0672185789971125, "global_step": 839, "epoch": 19, "val_loss": 1060632.75} {"train_loss": -2.007167339324951, "global_step": 840, "epoch": 20} {"train_loss": -2.2325291633605957, "global_step": 841, "epoch": 20} {"train_loss": -2.1386868953704834, "global_step": 842, "epoch": 20} {"train_loss": -2.0305747985839844, "global_step": 843, "epoch": 20} {"train_loss": -1.9706676006317139, "global_step": 844, "epoch": 20} {"train_loss": -2.1386594772338867, "global_step": 845, "epoch": 20} {"train_loss": -2.1644694805145264, "global_step": 846, "epoch": 20} {"train_loss": -2.0849123001098633, "global_step": 847, "epoch": 20} {"train_loss": -2.197410821914673, "global_step": 848, "epoch": 20} {"train_loss": -2.146517753601074, "global_step": 849, "epoch": 20} {"train_loss": -2.1797075271606445, "global_step": 850, "epoch": 20} {"train_loss": -2.0941522121429443, "global_step": 851, "epoch": 20} {"train_loss": -2.0670392513275146, "global_step": 852, "epoch": 20} {"train_loss": -2.1112914085388184, "global_step": 853, "epoch": 20} {"train_loss": -2.0749340057373047, "global_step": 854, "epoch": 20} {"train_loss": -2.310908079147339, "global_step": 855, "epoch": 20} {"train_loss": -2.0668492317199707, "global_step": 856, "epoch": 20} {"train_loss": -2.089359998703003, "global_step": 857, "epoch": 20} {"train_loss": -2.1659669876098633, "global_step": 858, "epoch": 20} {"train_loss": -2.1746623516082764, "global_step": 859, "epoch": 20} {"train_loss": -2.0880465507507324, "global_step": 860, "epoch": 20} {"train_loss": -2.1223933696746826, "global_step": 861, "epoch": 20} {"train_loss": -2.2700319290161133, "global_step": 862, "epoch": 20} {"train_loss": -1.925661563873291, "global_step": 863, "epoch": 20} {"train_loss": -2.101841926574707, "global_step": 864, "epoch": 20} {"train_loss": -2.207040309906006, "global_step": 865, "epoch": 20} {"train_loss": -2.238529920578003, "global_step": 866, "epoch": 20} {"train_loss": -2.128448963165283, "global_step": 867, "epoch": 20} {"train_loss": -2.0795321464538574, "global_step": 868, "epoch": 20} {"train_loss": -2.113241672515869, "global_step": 869, "epoch": 20} {"train_loss": -2.1054887771606445, "global_step": 870, "epoch": 20} {"train_loss": -2.2790706157684326, "global_step": 871, "epoch": 20} {"train_loss": -2.124699592590332, "global_step": 872, "epoch": 20} {"train_loss": -2.1910462379455566, "global_step": 873, "epoch": 20} {"train_loss": -2.223690986633301, "global_step": 874, "epoch": 20} {"train_loss": -2.2176506519317627, "global_step": 875, "epoch": 20} {"train_loss": -2.176269054412842, "global_step": 876, "epoch": 20} {"train_loss": -2.10986328125, "global_step": 877, "epoch": 20} {"train_loss": -2.2977209091186523, "global_step": 878, "epoch": 20} {"train_loss": -2.2301390171051025, "global_step": 879, "epoch": 20} {"train_loss": -2.102776288986206, "global_step": 880, "epoch": 20} {"train_loss": -2.142149266742525, "global_step": 881, "epoch": 20, "val_loss": 1013154.5625} {"train_loss": -2.189359188079834, "global_step": 882, "epoch": 21} {"train_loss": -2.221632957458496, "global_step": 883, "epoch": 21} {"train_loss": -1.9868898391723633, "global_step": 884, "epoch": 21} {"train_loss": -2.199094295501709, "global_step": 885, "epoch": 21} {"train_loss": -2.0971033573150635, "global_step": 886, "epoch": 21} {"train_loss": -2.229780673980713, "global_step": 887, "epoch": 21} {"train_loss": -2.2757551670074463, "global_step": 888, "epoch": 21} {"train_loss": -1.9761139154434204, "global_step": 889, "epoch": 21} {"train_loss": -2.272066116333008, "global_step": 890, "epoch": 21} {"train_loss": -2.0344834327697754, "global_step": 891, "epoch": 21} {"train_loss": -2.0936989784240723, "global_step": 892, "epoch": 21} {"train_loss": -2.184359550476074, "global_step": 893, "epoch": 21} {"train_loss": -2.2323131561279297, "global_step": 894, "epoch": 21} {"train_loss": -2.215702533721924, "global_step": 895, "epoch": 21} {"train_loss": -2.083186149597168, "global_step": 896, "epoch": 21} {"train_loss": -2.2170250415802, "global_step": 897, "epoch": 21} {"train_loss": -2.1421124935150146, "global_step": 898, "epoch": 21} {"train_loss": -2.2194578647613525, "global_step": 899, "epoch": 21} {"train_loss": -2.2391207218170166, "global_step": 900, "epoch": 21} {"train_loss": -2.138376235961914, "global_step": 901, "epoch": 21} {"train_loss": -2.1712863445281982, "global_step": 902, "epoch": 21} {"train_loss": -2.242171287536621, "global_step": 903, "epoch": 21} {"train_loss": -2.4372549057006836, "global_step": 904, "epoch": 21} {"train_loss": -2.254395008087158, "global_step": 905, "epoch": 21} {"train_loss": -2.335646152496338, "global_step": 906, "epoch": 21} {"train_loss": -2.1604840755462646, "global_step": 907, "epoch": 21} {"train_loss": -2.256788969039917, "global_step": 908, "epoch": 21} {"train_loss": -2.0775341987609863, "global_step": 909, "epoch": 21} {"train_loss": -2.2734673023223877, "global_step": 910, "epoch": 21} {"train_loss": -2.202641487121582, "global_step": 911, "epoch": 21} {"train_loss": -2.2350475788116455, "global_step": 912, "epoch": 21} {"train_loss": -2.2162365913391113, "global_step": 913, "epoch": 21} {"train_loss": -2.0751068592071533, "global_step": 914, "epoch": 21} {"train_loss": -2.2536253929138184, "global_step": 915, "epoch": 21} {"train_loss": -2.3621065616607666, "global_step": 916, "epoch": 21} {"train_loss": -2.2749381065368652, "global_step": 917, "epoch": 21} {"train_loss": -2.1659340858459473, "global_step": 918, "epoch": 21} {"train_loss": -2.163515090942383, "global_step": 919, "epoch": 21} {"train_loss": -2.2800841331481934, "global_step": 920, "epoch": 21} {"train_loss": -2.2233357429504395, "global_step": 921, "epoch": 21} {"train_loss": -2.2453935146331787, "global_step": 922, "epoch": 21} {"train_loss": -2.200685929684412, "global_step": 923, "epoch": 21, "val_loss": 965318.4375} {"train_loss": -2.315037250518799, "global_step": 924, "epoch": 22} {"train_loss": -2.1678109169006348, "global_step": 925, "epoch": 22} {"train_loss": -2.2489395141601562, "global_step": 926, "epoch": 22} {"train_loss": -2.2525315284729004, "global_step": 927, "epoch": 22} {"train_loss": -2.218719482421875, "global_step": 928, "epoch": 22} {"train_loss": -2.0981175899505615, "global_step": 929, "epoch": 22} {"train_loss": -2.295363426208496, "global_step": 930, "epoch": 22} {"train_loss": -2.1107068061828613, "global_step": 931, "epoch": 22} {"train_loss": -2.199146270751953, "global_step": 932, "epoch": 22} {"train_loss": -2.110867500305176, "global_step": 933, "epoch": 22} {"train_loss": -2.1955299377441406, "global_step": 934, "epoch": 22} {"train_loss": -2.1768407821655273, "global_step": 935, "epoch": 22} {"train_loss": -2.2230875492095947, "global_step": 936, "epoch": 22} {"train_loss": -2.3082573413848877, "global_step": 937, "epoch": 22} {"train_loss": -2.160015106201172, "global_step": 938, "epoch": 22} {"train_loss": -2.166313886642456, "global_step": 939, "epoch": 22} {"train_loss": -2.333956241607666, "global_step": 940, "epoch": 22} {"train_loss": -2.112786293029785, "global_step": 941, "epoch": 22} {"train_loss": -2.188721179962158, "global_step": 942, "epoch": 22} {"train_loss": -2.2210702896118164, "global_step": 943, "epoch": 22} {"train_loss": -2.248504400253296, "global_step": 944, "epoch": 22} {"train_loss": -2.3509254455566406, "global_step": 945, "epoch": 22} {"train_loss": -2.4266910552978516, "global_step": 946, "epoch": 22} {"train_loss": -2.2482070922851562, "global_step": 947, "epoch": 22} {"train_loss": -2.1976685523986816, "global_step": 948, "epoch": 22} {"train_loss": -2.209686279296875, "global_step": 949, "epoch": 22} {"train_loss": -2.373265266418457, "global_step": 950, "epoch": 22} {"train_loss": -2.2631359100341797, "global_step": 951, "epoch": 22} {"train_loss": -2.246429443359375, "global_step": 952, "epoch": 22} {"train_loss": -2.305962324142456, "global_step": 953, "epoch": 22} {"train_loss": -2.147094488143921, "global_step": 954, "epoch": 22} {"train_loss": -2.2607057094573975, "global_step": 955, "epoch": 22} {"train_loss": -2.3286681175231934, "global_step": 956, "epoch": 22} {"train_loss": -2.2873477935791016, "global_step": 957, "epoch": 22} {"train_loss": -2.375049114227295, "global_step": 958, "epoch": 22} {"train_loss": -2.4169583320617676, "global_step": 959, "epoch": 22} {"train_loss": -2.2369585037231445, "global_step": 960, "epoch": 22} {"train_loss": -2.3277177810668945, "global_step": 961, "epoch": 22} {"train_loss": -2.230764627456665, "global_step": 962, "epoch": 22} {"train_loss": -2.3080663681030273, "global_step": 963, "epoch": 22} {"train_loss": -2.2551379203796387, "global_step": 964, "epoch": 22} {"train_loss": -2.251561232975551, "global_step": 965, "epoch": 22, "val_loss": 918496.875} {"train_loss": -2.1550328731536865, "global_step": 966, "epoch": 23} {"train_loss": -2.197455883026123, "global_step": 967, "epoch": 23} {"train_loss": -2.233752727508545, "global_step": 968, "epoch": 23} {"train_loss": -2.3272273540496826, "global_step": 969, "epoch": 23} {"train_loss": -2.0822339057922363, "global_step": 970, "epoch": 23} {"train_loss": -2.3281617164611816, "global_step": 971, "epoch": 23} {"train_loss": -2.2209577560424805, "global_step": 972, "epoch": 23} {"train_loss": -2.343095302581787, "global_step": 973, "epoch": 23} {"train_loss": -2.1649856567382812, "global_step": 974, "epoch": 23} {"train_loss": -2.2344536781311035, "global_step": 975, "epoch": 23} {"train_loss": -2.2624568939208984, "global_step": 976, "epoch": 23} {"train_loss": -2.3447742462158203, "global_step": 977, "epoch": 23} {"train_loss": -2.385009288787842, "global_step": 978, "epoch": 23} {"train_loss": -2.3716375827789307, "global_step": 979, "epoch": 23} {"train_loss": -2.3383054733276367, "global_step": 980, "epoch": 23} {"train_loss": -2.2585489749908447, "global_step": 981, "epoch": 23} {"train_loss": -2.242161989212036, "global_step": 982, "epoch": 23} {"train_loss": -2.2743349075317383, "global_step": 983, "epoch": 23} {"train_loss": -2.371776580810547, "global_step": 984, "epoch": 23} {"train_loss": -2.2541637420654297, "global_step": 985, "epoch": 23} {"train_loss": -2.351409912109375, "global_step": 986, "epoch": 23} {"train_loss": -2.498462677001953, "global_step": 987, "epoch": 23} {"train_loss": -2.3462796211242676, "global_step": 988, "epoch": 23} {"train_loss": -2.374392509460449, "global_step": 989, "epoch": 23} {"train_loss": -2.3928511142730713, "global_step": 990, "epoch": 23} {"train_loss": -2.3547821044921875, "global_step": 991, "epoch": 23} {"train_loss": -2.1469945907592773, "global_step": 992, "epoch": 23} {"train_loss": -2.3452205657958984, "global_step": 993, "epoch": 23} {"train_loss": -2.3039896488189697, "global_step": 994, "epoch": 23} {"train_loss": -2.1581735610961914, "global_step": 995, "epoch": 23} {"train_loss": -2.3639092445373535, "global_step": 996, "epoch": 23} {"train_loss": -2.213118553161621, "global_step": 997, "epoch": 23} {"train_loss": -2.2963669300079346, "global_step": 998, "epoch": 23} {"train_loss": -2.4291839599609375, "global_step": 999, "epoch": 23} {"train_loss": -2.310567617416382, "global_step": 1000, "epoch": 23} {"train_loss": -2.3856866359710693, "global_step": 1001, "epoch": 23} {"train_loss": -2.301494598388672, "global_step": 1002, "epoch": 23} {"train_loss": -2.4360365867614746, "global_step": 1003, "epoch": 23} {"train_loss": -2.2757976055145264, "global_step": 1004, "epoch": 23} {"train_loss": -2.2192718982696533, "global_step": 1005, "epoch": 23} {"train_loss": -2.4331767559051514, "global_step": 1006, "epoch": 23} {"train_loss": -2.3021334523246404, "global_step": 1007, "epoch": 23, "val_loss": 870455.375} {"train_loss": -2.300614833831787, "global_step": 1008, "epoch": 24} {"train_loss": -2.4203243255615234, "global_step": 1009, "epoch": 24} {"train_loss": -2.2839956283569336, "global_step": 1010, "epoch": 24} {"train_loss": -2.3873181343078613, "global_step": 1011, "epoch": 24} {"train_loss": -2.428373336791992, "global_step": 1012, "epoch": 24} {"train_loss": -2.3892784118652344, "global_step": 1013, "epoch": 24} {"train_loss": -2.263096332550049, "global_step": 1014, "epoch": 24} {"train_loss": -2.4077534675598145, "global_step": 1015, "epoch": 24} {"train_loss": -2.410719394683838, "global_step": 1016, "epoch": 24} {"train_loss": -2.3633193969726562, "global_step": 1017, "epoch": 24} {"train_loss": -2.507582187652588, "global_step": 1018, "epoch": 24} {"train_loss": -2.239772319793701, "global_step": 1019, "epoch": 24} {"train_loss": -2.3004817962646484, "global_step": 1020, "epoch": 24} {"train_loss": -2.3851184844970703, "global_step": 1021, "epoch": 24} {"train_loss": -2.383635997772217, "global_step": 1022, "epoch": 24} {"train_loss": -2.322119951248169, "global_step": 1023, "epoch": 24} {"train_loss": -2.417008876800537, "global_step": 1024, "epoch": 24} {"train_loss": -2.4813032150268555, "global_step": 1025, "epoch": 24} {"train_loss": -2.3270723819732666, "global_step": 1026, "epoch": 24} {"train_loss": -2.339036464691162, "global_step": 1027, "epoch": 24} {"train_loss": -2.4090733528137207, "global_step": 1028, "epoch": 24} {"train_loss": -2.314638137817383, "global_step": 1029, "epoch": 24} {"train_loss": -2.4525835514068604, "global_step": 1030, "epoch": 24} {"train_loss": -2.36311674118042, "global_step": 1031, "epoch": 24} {"train_loss": -2.440843105316162, "global_step": 1032, "epoch": 24} {"train_loss": -2.4029173851013184, "global_step": 1033, "epoch": 24} {"train_loss": -2.3271324634552, "global_step": 1034, "epoch": 24} {"train_loss": -2.316169500350952, "global_step": 1035, "epoch": 24} {"train_loss": -2.349167823791504, "global_step": 1036, "epoch": 24} {"train_loss": -2.4207215309143066, "global_step": 1037, "epoch": 24} {"train_loss": -2.237133264541626, "global_step": 1038, "epoch": 24} {"train_loss": -2.398728370666504, "global_step": 1039, "epoch": 24} {"train_loss": -2.4496147632598877, "global_step": 1040, "epoch": 24} {"train_loss": -2.30879545211792, "global_step": 1041, "epoch": 24} {"train_loss": -2.3975696563720703, "global_step": 1042, "epoch": 24} {"train_loss": -2.275284767150879, "global_step": 1043, "epoch": 24} {"train_loss": -2.530668020248413, "global_step": 1044, "epoch": 24} {"train_loss": -2.2771596908569336, "global_step": 1045, "epoch": 24} {"train_loss": -2.3280739784240723, "global_step": 1046, "epoch": 24} {"train_loss": -2.2659752368927, "global_step": 1047, "epoch": 24} {"train_loss": -2.364119052886963, "global_step": 1048, "epoch": 24} {"train_loss": -2.3658657244273593, "global_step": 1049, "epoch": 24, "val_loss": 829110.625} {"train_loss": -2.4019198417663574, "global_step": 1050, "epoch": 25} {"train_loss": -2.5766496658325195, "global_step": 1051, "epoch": 25} {"train_loss": -2.228381872177124, "global_step": 1052, "epoch": 25} {"train_loss": -2.434692859649658, "global_step": 1053, "epoch": 25} {"train_loss": -2.283414363861084, "global_step": 1054, "epoch": 25} {"train_loss": -2.4125466346740723, "global_step": 1055, "epoch": 25} {"train_loss": -2.3614187240600586, "global_step": 1056, "epoch": 25} {"train_loss": -2.4761013984680176, "global_step": 1057, "epoch": 25} {"train_loss": -2.3455934524536133, "global_step": 1058, "epoch": 25} {"train_loss": -2.3767623901367188, "global_step": 1059, "epoch": 25} {"train_loss": -2.2654004096984863, "global_step": 1060, "epoch": 25} {"train_loss": -2.390493392944336, "global_step": 1061, "epoch": 25} {"train_loss": -2.316707134246826, "global_step": 1062, "epoch": 25} {"train_loss": -2.484842300415039, "global_step": 1063, "epoch": 25} {"train_loss": -2.268575668334961, "global_step": 1064, "epoch": 25} {"train_loss": -2.223228931427002, "global_step": 1065, "epoch": 25} {"train_loss": -2.362393379211426, "global_step": 1066, "epoch": 25} {"train_loss": -2.147947072982788, "global_step": 1067, "epoch": 25} {"train_loss": -2.3358840942382812, "global_step": 1068, "epoch": 25} {"train_loss": -2.37500262260437, "global_step": 1069, "epoch": 25} {"train_loss": -2.1962733268737793, "global_step": 1070, "epoch": 25} {"train_loss": -2.4372177124023438, "global_step": 1071, "epoch": 25} {"train_loss": -2.283266544342041, "global_step": 1072, "epoch": 25} {"train_loss": -2.471903085708618, "global_step": 1073, "epoch": 25} {"train_loss": -2.331831216812134, "global_step": 1074, "epoch": 25} {"train_loss": -2.4735000133514404, "global_step": 1075, "epoch": 25} {"train_loss": -2.263878583908081, "global_step": 1076, "epoch": 25} {"train_loss": -2.334657669067383, "global_step": 1077, "epoch": 25} {"train_loss": -2.338186264038086, "global_step": 1078, "epoch": 25} {"train_loss": -2.483635902404785, "global_step": 1079, "epoch": 25} {"train_loss": -2.305081605911255, "global_step": 1080, "epoch": 25} {"train_loss": -2.475738525390625, "global_step": 1081, "epoch": 25} {"train_loss": -2.3404340744018555, "global_step": 1082, "epoch": 25} {"train_loss": -2.4537575244903564, "global_step": 1083, "epoch": 25} {"train_loss": -2.383303642272949, "global_step": 1084, "epoch": 25} {"train_loss": -2.3759777545928955, "global_step": 1085, "epoch": 25} {"train_loss": -2.6251425743103027, "global_step": 1086, "epoch": 25} {"train_loss": -2.471679925918579, "global_step": 1087, "epoch": 25} {"train_loss": -2.3802294731140137, "global_step": 1088, "epoch": 25} {"train_loss": -2.4957504272460938, "global_step": 1089, "epoch": 25} {"train_loss": -2.4491147994995117, "global_step": 1090, "epoch": 25} {"train_loss": -2.3754319009326754, "global_step": 1091, "epoch": 25, "val_loss": 791706.5625} {"train_loss": -2.446946144104004, "global_step": 1092, "epoch": 26} {"train_loss": -2.5607900619506836, "global_step": 1093, "epoch": 26} {"train_loss": -2.259610652923584, "global_step": 1094, "epoch": 26} {"train_loss": -2.3044893741607666, "global_step": 1095, "epoch": 26} {"train_loss": -2.477449893951416, "global_step": 1096, "epoch": 26} {"train_loss": -2.400461435317993, "global_step": 1097, "epoch": 26} {"train_loss": -2.4385151863098145, "global_step": 1098, "epoch": 26} {"train_loss": -2.3909246921539307, "global_step": 1099, "epoch": 26} {"train_loss": -2.3746204376220703, "global_step": 1100, "epoch": 26} {"train_loss": -2.360093593597412, "global_step": 1101, "epoch": 26} {"train_loss": -2.5191993713378906, "global_step": 1102, "epoch": 26} {"train_loss": -2.461857795715332, "global_step": 1103, "epoch": 26} {"train_loss": -2.5643815994262695, "global_step": 1104, "epoch": 26} {"train_loss": -2.458432197570801, "global_step": 1105, "epoch": 26} {"train_loss": -2.4859399795532227, "global_step": 1106, "epoch": 26} {"train_loss": -2.434330463409424, "global_step": 1107, "epoch": 26} {"train_loss": -2.5272841453552246, "global_step": 1108, "epoch": 26} {"train_loss": -2.6349990367889404, "global_step": 1109, "epoch": 26} {"train_loss": -2.5025787353515625, "global_step": 1110, "epoch": 26} {"train_loss": -2.5102005004882812, "global_step": 1111, "epoch": 26} {"train_loss": -2.6649341583251953, "global_step": 1112, "epoch": 26} {"train_loss": -2.42099666595459, "global_step": 1113, "epoch": 26} {"train_loss": -2.5679619312286377, "global_step": 1114, "epoch": 26} {"train_loss": -2.46638822555542, "global_step": 1115, "epoch": 26} {"train_loss": -2.5775747299194336, "global_step": 1116, "epoch": 26} {"train_loss": -2.4307572841644287, "global_step": 1117, "epoch": 26} {"train_loss": -2.4066085815429688, "global_step": 1118, "epoch": 26} {"train_loss": -2.69391131401062, "global_step": 1119, "epoch": 26} {"train_loss": -2.449734926223755, "global_step": 1120, "epoch": 26} {"train_loss": -2.402538537979126, "global_step": 1121, "epoch": 26} {"train_loss": -2.4175615310668945, "global_step": 1122, "epoch": 26} {"train_loss": -2.423053741455078, "global_step": 1123, "epoch": 26} {"train_loss": -2.600450038909912, "global_step": 1124, "epoch": 26} {"train_loss": -2.2380499839782715, "global_step": 1125, "epoch": 26} {"train_loss": -2.431725025177002, "global_step": 1126, "epoch": 26} {"train_loss": -2.495177984237671, "global_step": 1127, "epoch": 26} {"train_loss": -2.181157112121582, "global_step": 1128, "epoch": 26} {"train_loss": -2.2715365886688232, "global_step": 1129, "epoch": 26} {"train_loss": -2.4875168800354004, "global_step": 1130, "epoch": 26} {"train_loss": -2.163647174835205, "global_step": 1131, "epoch": 26} {"train_loss": -2.3439316749572754, "global_step": 1132, "epoch": 26} {"train_loss": -2.438146085966201, "global_step": 1133, "epoch": 26, "val_loss": 767588.25} {"train_loss": -2.504077196121216, "global_step": 1134, "epoch": 27} {"train_loss": -2.3923468589782715, "global_step": 1135, "epoch": 27} {"train_loss": -2.4760541915893555, "global_step": 1136, "epoch": 27} {"train_loss": -2.2547693252563477, "global_step": 1137, "epoch": 27} {"train_loss": -2.482070207595825, "global_step": 1138, "epoch": 27} {"train_loss": -2.297219753265381, "global_step": 1139, "epoch": 27} {"train_loss": -2.540095329284668, "global_step": 1140, "epoch": 27} {"train_loss": -2.4902822971343994, "global_step": 1141, "epoch": 27} {"train_loss": -2.4177539348602295, "global_step": 1142, "epoch": 27} {"train_loss": -2.477296829223633, "global_step": 1143, "epoch": 27} {"train_loss": -2.4405882358551025, "global_step": 1144, "epoch": 27} {"train_loss": -2.467104434967041, "global_step": 1145, "epoch": 27} {"train_loss": -2.5380325317382812, "global_step": 1146, "epoch": 27} {"train_loss": -2.436394214630127, "global_step": 1147, "epoch": 27} {"train_loss": -2.5482144355773926, "global_step": 1148, "epoch": 27} {"train_loss": -2.517146587371826, "global_step": 1149, "epoch": 27} {"train_loss": -2.5465879440307617, "global_step": 1150, "epoch": 27} {"train_loss": -2.5647811889648438, "global_step": 1151, "epoch": 27} {"train_loss": -2.521516799926758, "global_step": 1152, "epoch": 27} {"train_loss": -2.5456342697143555, "global_step": 1153, "epoch": 27} {"train_loss": -2.539734363555908, "global_step": 1154, "epoch": 27} {"train_loss": -2.513720989227295, "global_step": 1155, "epoch": 27} {"train_loss": -2.5477170944213867, "global_step": 1156, "epoch": 27} {"train_loss": -2.4773640632629395, "global_step": 1157, "epoch": 27} {"train_loss": -2.6505420207977295, "global_step": 1158, "epoch": 27} {"train_loss": -2.51540207862854, "global_step": 1159, "epoch": 27} {"train_loss": -2.4847400188446045, "global_step": 1160, "epoch": 27} {"train_loss": -2.5057311058044434, "global_step": 1161, "epoch": 27} {"train_loss": -2.523922920227051, "global_step": 1162, "epoch": 27} {"train_loss": -2.527385711669922, "global_step": 1163, "epoch": 27} {"train_loss": -2.5689241886138916, "global_step": 1164, "epoch": 27} {"train_loss": -2.447686195373535, "global_step": 1165, "epoch": 27} {"train_loss": -2.604588031768799, "global_step": 1166, "epoch": 27} {"train_loss": -2.5180134773254395, "global_step": 1167, "epoch": 27} {"train_loss": -2.5728166103363037, "global_step": 1168, "epoch": 27} {"train_loss": -2.5101318359375, "global_step": 1169, "epoch": 27} {"train_loss": -2.5682387351989746, "global_step": 1170, "epoch": 27} {"train_loss": -2.6409318447113037, "global_step": 1171, "epoch": 27} {"train_loss": -2.4456281661987305, "global_step": 1172, "epoch": 27} {"train_loss": -2.5561025142669678, "global_step": 1173, "epoch": 27} {"train_loss": -2.506281852722168, "global_step": 1174, "epoch": 27} {"train_loss": -2.5064090320042203, "global_step": 1175, "epoch": 27, "val_loss": 722049.5625} {"train_loss": -2.442288398742676, "global_step": 1176, "epoch": 28} {"train_loss": -2.6485939025878906, "global_step": 1177, "epoch": 28} {"train_loss": -2.6531763076782227, "global_step": 1178, "epoch": 28} {"train_loss": -2.6454949378967285, "global_step": 1179, "epoch": 28} {"train_loss": -2.410278558731079, "global_step": 1180, "epoch": 28} {"train_loss": -2.4157989025115967, "global_step": 1181, "epoch": 28} {"train_loss": -2.8276278972625732, "global_step": 1182, "epoch": 28} {"train_loss": -2.427246570587158, "global_step": 1183, "epoch": 28} {"train_loss": -2.5437397956848145, "global_step": 1184, "epoch": 28} {"train_loss": -2.6681580543518066, "global_step": 1185, "epoch": 28} {"train_loss": -2.551112651824951, "global_step": 1186, "epoch": 28} {"train_loss": -2.5318167209625244, "global_step": 1187, "epoch": 28} {"train_loss": -2.6207730770111084, "global_step": 1188, "epoch": 28} {"train_loss": -2.52508544921875, "global_step": 1189, "epoch": 28} {"train_loss": -2.4546728134155273, "global_step": 1190, "epoch": 28} {"train_loss": -2.7248592376708984, "global_step": 1191, "epoch": 28} {"train_loss": -2.435645818710327, "global_step": 1192, "epoch": 28} {"train_loss": -2.582742691040039, "global_step": 1193, "epoch": 28} {"train_loss": -2.5969624519348145, "global_step": 1194, "epoch": 28} {"train_loss": -2.5934255123138428, "global_step": 1195, "epoch": 28} {"train_loss": -2.7034616470336914, "global_step": 1196, "epoch": 28} {"train_loss": -2.6715173721313477, "global_step": 1197, "epoch": 28} {"train_loss": -2.6194777488708496, "global_step": 1198, "epoch": 28} {"train_loss": -2.558680534362793, "global_step": 1199, "epoch": 28} {"train_loss": -2.431553840637207, "global_step": 1200, "epoch": 28} {"train_loss": -2.6404428482055664, "global_step": 1201, "epoch": 28} {"train_loss": -2.4986777305603027, "global_step": 1202, "epoch": 28} {"train_loss": -2.640887975692749, "global_step": 1203, "epoch": 28} {"train_loss": -2.474090099334717, "global_step": 1204, "epoch": 28} {"train_loss": -2.521052837371826, "global_step": 1205, "epoch": 28} {"train_loss": -2.639435291290283, "global_step": 1206, "epoch": 28} {"train_loss": -2.6045660972595215, "global_step": 1207, "epoch": 28} {"train_loss": -2.6239748001098633, "global_step": 1208, "epoch": 28} {"train_loss": -2.522634506225586, "global_step": 1209, "epoch": 28} {"train_loss": -2.5750277042388916, "global_step": 1210, "epoch": 28} {"train_loss": -2.551790237426758, "global_step": 1211, "epoch": 28} {"train_loss": -2.6620116233825684, "global_step": 1212, "epoch": 28} {"train_loss": -2.6046557426452637, "global_step": 1213, "epoch": 28} {"train_loss": -2.3979878425598145, "global_step": 1214, "epoch": 28} {"train_loss": -2.58967924118042, "global_step": 1215, "epoch": 28} {"train_loss": -2.3556320667266846, "global_step": 1216, "epoch": 28} {"train_loss": -2.5676103205907914, "global_step": 1217, "epoch": 28, "val_loss": 696298.0625} {"train_loss": -2.7609939575195312, "global_step": 1218, "epoch": 29} {"train_loss": -2.592690944671631, "global_step": 1219, "epoch": 29} {"train_loss": -2.639727830886841, "global_step": 1220, "epoch": 29} {"train_loss": -2.5673258304595947, "global_step": 1221, "epoch": 29} {"train_loss": -2.547698974609375, "global_step": 1222, "epoch": 29} {"train_loss": -2.510664224624634, "global_step": 1223, "epoch": 29} {"train_loss": -2.6556811332702637, "global_step": 1224, "epoch": 29} {"train_loss": -2.5142574310302734, "global_step": 1225, "epoch": 29} {"train_loss": -2.5964818000793457, "global_step": 1226, "epoch": 29} {"train_loss": -2.5844013690948486, "global_step": 1227, "epoch": 29} {"train_loss": -2.494523525238037, "global_step": 1228, "epoch": 29} {"train_loss": -2.696934938430786, "global_step": 1229, "epoch": 29} {"train_loss": -2.4575374126434326, "global_step": 1230, "epoch": 29} {"train_loss": -2.5989131927490234, "global_step": 1231, "epoch": 29} {"train_loss": -2.527769088745117, "global_step": 1232, "epoch": 29} {"train_loss": -2.5609490871429443, "global_step": 1233, "epoch": 29} {"train_loss": -2.582900047302246, "global_step": 1234, "epoch": 29} {"train_loss": -2.597412109375, "global_step": 1235, "epoch": 29} {"train_loss": -2.732861042022705, "global_step": 1236, "epoch": 29} {"train_loss": -2.5920016765594482, "global_step": 1237, "epoch": 29} {"train_loss": -2.5880472660064697, "global_step": 1238, "epoch": 29} {"train_loss": -2.625851631164551, "global_step": 1239, "epoch": 29} {"train_loss": -2.6899356842041016, "global_step": 1240, "epoch": 29} {"train_loss": -2.758240222930908, "global_step": 1241, "epoch": 29} {"train_loss": -2.613448143005371, "global_step": 1242, "epoch": 29} {"train_loss": -2.5639665126800537, "global_step": 1243, "epoch": 29} {"train_loss": -2.6696462631225586, "global_step": 1244, "epoch": 29} {"train_loss": -2.592806577682495, "global_step": 1245, "epoch": 29} {"train_loss": -2.6864845752716064, "global_step": 1246, "epoch": 29} {"train_loss": -2.468831777572632, "global_step": 1247, "epoch": 29} {"train_loss": -2.5378518104553223, "global_step": 1248, "epoch": 29} {"train_loss": -2.647552013397217, "global_step": 1249, "epoch": 29} {"train_loss": -2.4359188079833984, "global_step": 1250, "epoch": 29} {"train_loss": -2.520925283432007, "global_step": 1251, "epoch": 29} {"train_loss": -2.3848190307617188, "global_step": 1252, "epoch": 29} {"train_loss": -2.6684577465057373, "global_step": 1253, "epoch": 29} {"train_loss": -2.422214984893799, "global_step": 1254, "epoch": 29} {"train_loss": -2.760171413421631, "global_step": 1255, "epoch": 29} {"train_loss": -2.4417366981506348, "global_step": 1256, "epoch": 29} {"train_loss": -2.7476553916931152, "global_step": 1257, "epoch": 29} {"train_loss": -2.6883459091186523, "global_step": 1258, "epoch": 29} {"train_loss": -2.5943956942785356, "global_step": 1259, "epoch": 29, "val_loss": 655208.5} {"train_loss": -2.6405391693115234, "global_step": 1260, "epoch": 30} {"train_loss": -2.541276454925537, "global_step": 1261, "epoch": 30} {"train_loss": -2.5889992713928223, "global_step": 1262, "epoch": 30} {"train_loss": -2.5407934188842773, "global_step": 1263, "epoch": 30} {"train_loss": -2.6650171279907227, "global_step": 1264, "epoch": 30} {"train_loss": -2.6423678398132324, "global_step": 1265, "epoch": 30} {"train_loss": -2.5940134525299072, "global_step": 1266, "epoch": 30} {"train_loss": -2.550400733947754, "global_step": 1267, "epoch": 30} {"train_loss": -2.66567325592041, "global_step": 1268, "epoch": 30} {"train_loss": -2.647364616394043, "global_step": 1269, "epoch": 30} {"train_loss": -2.690995693206787, "global_step": 1270, "epoch": 30} {"train_loss": -2.6312806606292725, "global_step": 1271, "epoch": 30} {"train_loss": -2.6400341987609863, "global_step": 1272, "epoch": 30} {"train_loss": -2.824014186859131, "global_step": 1273, "epoch": 30} {"train_loss": -2.798640727996826, "global_step": 1274, "epoch": 30} {"train_loss": -2.6919803619384766, "global_step": 1275, "epoch": 30} {"train_loss": -2.6193785667419434, "global_step": 1276, "epoch": 30} {"train_loss": -2.4294161796569824, "global_step": 1277, "epoch": 30} {"train_loss": -2.674447536468506, "global_step": 1278, "epoch": 30} {"train_loss": -2.5494608879089355, "global_step": 1279, "epoch": 30} {"train_loss": -2.548092842102051, "global_step": 1280, "epoch": 30} {"train_loss": -2.742487668991089, "global_step": 1281, "epoch": 30} {"train_loss": -2.7279317378997803, "global_step": 1282, "epoch": 30} {"train_loss": -2.7890267372131348, "global_step": 1283, "epoch": 30} {"train_loss": -2.617920398712158, "global_step": 1284, "epoch": 30} {"train_loss": -2.732671022415161, "global_step": 1285, "epoch": 30} {"train_loss": -2.4803037643432617, "global_step": 1286, "epoch": 30} {"train_loss": -2.7354736328125, "global_step": 1287, "epoch": 30} {"train_loss": -2.6973989009857178, "global_step": 1288, "epoch": 30} {"train_loss": -2.5421223640441895, "global_step": 1289, "epoch": 30} {"train_loss": -2.5910496711730957, "global_step": 1290, "epoch": 30} {"train_loss": -2.722076416015625, "global_step": 1291, "epoch": 30} {"train_loss": -2.790433883666992, "global_step": 1292, "epoch": 30} {"train_loss": -2.7736737728118896, "global_step": 1293, "epoch": 30} {"train_loss": -2.7082483768463135, "global_step": 1294, "epoch": 30} {"train_loss": -2.7422022819519043, "global_step": 1295, "epoch": 30} {"train_loss": -2.639512538909912, "global_step": 1296, "epoch": 30} {"train_loss": -2.6195006370544434, "global_step": 1297, "epoch": 30} {"train_loss": -2.4766788482666016, "global_step": 1298, "epoch": 30} {"train_loss": -2.788544178009033, "global_step": 1299, "epoch": 30} {"train_loss": -2.454400062561035, "global_step": 1300, "epoch": 30} {"train_loss": -2.652097463607788, "global_step": 1301, "epoch": 30, "val_loss": 629323.0} {"train_loss": -2.4875688552856445, "global_step": 1302, "epoch": 31} {"train_loss": -2.6275475025177, "global_step": 1303, "epoch": 31} {"train_loss": -2.7188878059387207, "global_step": 1304, "epoch": 31} {"train_loss": -2.6878252029418945, "global_step": 1305, "epoch": 31} {"train_loss": -2.718099594116211, "global_step": 1306, "epoch": 31} {"train_loss": -2.6042871475219727, "global_step": 1307, "epoch": 31} {"train_loss": -2.716190814971924, "global_step": 1308, "epoch": 31} {"train_loss": -2.7844743728637695, "global_step": 1309, "epoch": 31} {"train_loss": -2.5241923332214355, "global_step": 1310, "epoch": 31} {"train_loss": -2.699263334274292, "global_step": 1311, "epoch": 31} {"train_loss": -2.8450927734375, "global_step": 1312, "epoch": 31} {"train_loss": -2.743976593017578, "global_step": 1313, "epoch": 31} {"train_loss": -2.63424015045166, "global_step": 1314, "epoch": 31} {"train_loss": -2.6162898540496826, "global_step": 1315, "epoch": 31} {"train_loss": -2.667484760284424, "global_step": 1316, "epoch": 31} {"train_loss": -2.7886266708374023, "global_step": 1317, "epoch": 31} {"train_loss": -2.8377766609191895, "global_step": 1318, "epoch": 31} {"train_loss": -2.5797924995422363, "global_step": 1319, "epoch": 31} {"train_loss": -2.6892549991607666, "global_step": 1320, "epoch": 31} {"train_loss": -2.7442688941955566, "global_step": 1321, "epoch": 31} {"train_loss": -2.665925979614258, "global_step": 1322, "epoch": 31} {"train_loss": -2.7311973571777344, "global_step": 1323, "epoch": 31} {"train_loss": -2.5387392044067383, "global_step": 1324, "epoch": 31} {"train_loss": -2.7418971061706543, "global_step": 1325, "epoch": 31} {"train_loss": -2.7802908420562744, "global_step": 1326, "epoch": 31} {"train_loss": -2.5487470626831055, "global_step": 1327, "epoch": 31} {"train_loss": -2.563297748565674, "global_step": 1328, "epoch": 31} {"train_loss": -2.5044212341308594, "global_step": 1329, "epoch": 31} {"train_loss": -2.635225772857666, "global_step": 1330, "epoch": 31} {"train_loss": -2.451040029525757, "global_step": 1331, "epoch": 31} {"train_loss": -2.549783706665039, "global_step": 1332, "epoch": 31} {"train_loss": -2.6308116912841797, "global_step": 1333, "epoch": 31} {"train_loss": -2.6199755668640137, "global_step": 1334, "epoch": 31} {"train_loss": -2.749899387359619, "global_step": 1335, "epoch": 31} {"train_loss": -2.5546693801879883, "global_step": 1336, "epoch": 31} {"train_loss": -2.6541004180908203, "global_step": 1337, "epoch": 31} {"train_loss": -2.5618398189544678, "global_step": 1338, "epoch": 31} {"train_loss": -2.5507209300994873, "global_step": 1339, "epoch": 31} {"train_loss": -2.4591126441955566, "global_step": 1340, "epoch": 31} {"train_loss": -2.8358447551727295, "global_step": 1341, "epoch": 31} {"train_loss": -2.53366756439209, "global_step": 1342, "epoch": 31} {"train_loss": -2.647708257039388, "global_step": 1343, "epoch": 31, "val_loss": 591497.4375} {"train_loss": -2.5931856632232666, "global_step": 1344, "epoch": 32} {"train_loss": -2.6609132289886475, "global_step": 1345, "epoch": 32} {"train_loss": -2.8764028549194336, "global_step": 1346, "epoch": 32} {"train_loss": -2.6091325283050537, "global_step": 1347, "epoch": 32} {"train_loss": -2.724215507507324, "global_step": 1348, "epoch": 32} {"train_loss": -2.6883530616760254, "global_step": 1349, "epoch": 32} {"train_loss": -2.6755363941192627, "global_step": 1350, "epoch": 32} {"train_loss": -2.684760093688965, "global_step": 1351, "epoch": 32} {"train_loss": -2.6988582611083984, "global_step": 1352, "epoch": 32} {"train_loss": -2.708369255065918, "global_step": 1353, "epoch": 32} {"train_loss": -2.8685903549194336, "global_step": 1354, "epoch": 32} {"train_loss": -2.815439462661743, "global_step": 1355, "epoch": 32} {"train_loss": -2.7993998527526855, "global_step": 1356, "epoch": 32} {"train_loss": -2.818021297454834, "global_step": 1357, "epoch": 32} {"train_loss": -2.6108734607696533, "global_step": 1358, "epoch": 32} {"train_loss": -2.7925703525543213, "global_step": 1359, "epoch": 32} {"train_loss": -2.633837938308716, "global_step": 1360, "epoch": 32} {"train_loss": -2.613067626953125, "global_step": 1361, "epoch": 32} {"train_loss": -2.6719212532043457, "global_step": 1362, "epoch": 32} {"train_loss": -2.5822436809539795, "global_step": 1363, "epoch": 32} {"train_loss": -2.771714687347412, "global_step": 1364, "epoch": 32} {"train_loss": -2.579883575439453, "global_step": 1365, "epoch": 32} {"train_loss": -2.7215609550476074, "global_step": 1366, "epoch": 32} {"train_loss": -2.8731861114501953, "global_step": 1367, "epoch": 32} {"train_loss": -2.551483631134033, "global_step": 1368, "epoch": 32} {"train_loss": -2.805023670196533, "global_step": 1369, "epoch": 32} {"train_loss": -2.618220329284668, "global_step": 1370, "epoch": 32} {"train_loss": -2.723663330078125, "global_step": 1371, "epoch": 32} {"train_loss": -2.7498605251312256, "global_step": 1372, "epoch": 32} {"train_loss": -2.4762492179870605, "global_step": 1373, "epoch": 32} {"train_loss": -2.7034311294555664, "global_step": 1374, "epoch": 32} {"train_loss": -2.724043846130371, "global_step": 1375, "epoch": 32} {"train_loss": -2.741997241973877, "global_step": 1376, "epoch": 32} {"train_loss": -2.894153118133545, "global_step": 1377, "epoch": 32} {"train_loss": -2.614535093307495, "global_step": 1378, "epoch": 32} {"train_loss": -2.87454891204834, "global_step": 1379, "epoch": 32} {"train_loss": -2.683565855026245, "global_step": 1380, "epoch": 32} {"train_loss": -2.7161426544189453, "global_step": 1381, "epoch": 32} {"train_loss": -2.735330104827881, "global_step": 1382, "epoch": 32} {"train_loss": -2.6796579360961914, "global_step": 1383, "epoch": 32} {"train_loss": -2.7550721168518066, "global_step": 1384, "epoch": 32} {"train_loss": -2.7084149519602456, "global_step": 1385, "epoch": 32, "val_loss": 572175.3125} {"train_loss": -2.599979877471924, "global_step": 1386, "epoch": 33} {"train_loss": -2.765467882156372, "global_step": 1387, "epoch": 33} {"train_loss": -2.750835418701172, "global_step": 1388, "epoch": 33} {"train_loss": -2.6888017654418945, "global_step": 1389, "epoch": 33} {"train_loss": -2.802948474884033, "global_step": 1390, "epoch": 33} {"train_loss": -2.8072986602783203, "global_step": 1391, "epoch": 33} {"train_loss": -2.683905601501465, "global_step": 1392, "epoch": 33} {"train_loss": -2.8192596435546875, "global_step": 1393, "epoch": 33} {"train_loss": -2.7532737255096436, "global_step": 1394, "epoch": 33} {"train_loss": -2.8163294792175293, "global_step": 1395, "epoch": 33} {"train_loss": -2.6935620307922363, "global_step": 1396, "epoch": 33} {"train_loss": -2.715402841567993, "global_step": 1397, "epoch": 33} {"train_loss": -2.823570489883423, "global_step": 1398, "epoch": 33} {"train_loss": -2.833082675933838, "global_step": 1399, "epoch": 33} {"train_loss": -2.7392356395721436, "global_step": 1400, "epoch": 33} {"train_loss": -2.810908794403076, "global_step": 1401, "epoch": 33} {"train_loss": -2.87330961227417, "global_step": 1402, "epoch": 33} {"train_loss": -2.769753932952881, "global_step": 1403, "epoch": 33} {"train_loss": -2.9310836791992188, "global_step": 1404, "epoch": 33} {"train_loss": -2.783949851989746, "global_step": 1405, "epoch": 33} {"train_loss": -2.818507671356201, "global_step": 1406, "epoch": 33} {"train_loss": -2.8873941898345947, "global_step": 1407, "epoch": 33} {"train_loss": -2.868535280227661, "global_step": 1408, "epoch": 33} {"train_loss": -2.848569869995117, "global_step": 1409, "epoch": 33} {"train_loss": -2.8016364574432373, "global_step": 1410, "epoch": 33} {"train_loss": -3.0196433067321777, "global_step": 1411, "epoch": 33} {"train_loss": -2.846452474594116, "global_step": 1412, "epoch": 33} {"train_loss": -2.7967309951782227, "global_step": 1413, "epoch": 33} {"train_loss": -2.855553150177002, "global_step": 1414, "epoch": 33} {"train_loss": -2.777904510498047, "global_step": 1415, "epoch": 33} {"train_loss": -2.70263934135437, "global_step": 1416, "epoch": 33} {"train_loss": -2.849714756011963, "global_step": 1417, "epoch": 33} {"train_loss": -2.879655599594116, "global_step": 1418, "epoch": 33} {"train_loss": -2.6934542655944824, "global_step": 1419, "epoch": 33} {"train_loss": -2.8503684997558594, "global_step": 1420, "epoch": 33} {"train_loss": -2.7197773456573486, "global_step": 1421, "epoch": 33} {"train_loss": -2.7261974811553955, "global_step": 1422, "epoch": 33} {"train_loss": -3.0351972579956055, "global_step": 1423, "epoch": 33} {"train_loss": -2.6834402084350586, "global_step": 1424, "epoch": 33} {"train_loss": -2.8729851245880127, "global_step": 1425, "epoch": 33} {"train_loss": -2.7715840339660645, "global_step": 1426, "epoch": 33} {"train_loss": -2.796441089539301, "global_step": 1427, "epoch": 33, "val_loss": 542926.1875} {"train_loss": -2.780076503753662, "global_step": 1428, "epoch": 34} {"train_loss": -2.8510117530822754, "global_step": 1429, "epoch": 34} {"train_loss": -2.7193851470947266, "global_step": 1430, "epoch": 34} {"train_loss": -2.8040146827697754, "global_step": 1431, "epoch": 34} {"train_loss": -2.8644165992736816, "global_step": 1432, "epoch": 34} {"train_loss": -2.8760972023010254, "global_step": 1433, "epoch": 34} {"train_loss": -2.852356433868408, "global_step": 1434, "epoch": 34} {"train_loss": -2.777937889099121, "global_step": 1435, "epoch": 34} {"train_loss": -2.889126777648926, "global_step": 1436, "epoch": 34} {"train_loss": -2.98008394241333, "global_step": 1437, "epoch": 34} {"train_loss": -2.8529679775238037, "global_step": 1438, "epoch": 34} {"train_loss": -2.7433252334594727, "global_step": 1439, "epoch": 34} {"train_loss": -2.9106497764587402, "global_step": 1440, "epoch": 34} {"train_loss": -2.8100926876068115, "global_step": 1441, "epoch": 34} {"train_loss": -2.8141672611236572, "global_step": 1442, "epoch": 34} {"train_loss": -2.788196325302124, "global_step": 1443, "epoch": 34} {"train_loss": -2.781550407409668, "global_step": 1444, "epoch": 34} {"train_loss": -2.813295841217041, "global_step": 1445, "epoch": 34} {"train_loss": -2.8365676403045654, "global_step": 1446, "epoch": 34} {"train_loss": -2.742978572845459, "global_step": 1447, "epoch": 34} {"train_loss": -2.850081443786621, "global_step": 1448, "epoch": 34} {"train_loss": -2.8772120475769043, "global_step": 1449, "epoch": 34} {"train_loss": -2.7868802547454834, "global_step": 1450, "epoch": 34} {"train_loss": -2.6003799438476562, "global_step": 1451, "epoch": 34} {"train_loss": -2.9965226650238037, "global_step": 1452, "epoch": 34} {"train_loss": -2.7982444763183594, "global_step": 1453, "epoch": 34} {"train_loss": -2.8725571632385254, "global_step": 1454, "epoch": 34} {"train_loss": -2.8969614505767822, "global_step": 1455, "epoch": 34} {"train_loss": -2.910238265991211, "global_step": 1456, "epoch": 34} {"train_loss": -2.8132448196411133, "global_step": 1457, "epoch": 34} {"train_loss": -2.756959915161133, "global_step": 1458, "epoch": 34} {"train_loss": -2.8324127197265625, "global_step": 1459, "epoch": 34} {"train_loss": -2.8220958709716797, "global_step": 1460, "epoch": 34} {"train_loss": -2.8356504440307617, "global_step": 1461, "epoch": 34} {"train_loss": -2.7893877029418945, "global_step": 1462, "epoch": 34} {"train_loss": -2.942833662033081, "global_step": 1463, "epoch": 34} {"train_loss": -2.884031295776367, "global_step": 1464, "epoch": 34} {"train_loss": -2.824465274810791, "global_step": 1465, "epoch": 34} {"train_loss": -2.8407797813415527, "global_step": 1466, "epoch": 34} {"train_loss": -2.9813432693481445, "global_step": 1467, "epoch": 34} {"train_loss": -2.939281463623047, "global_step": 1468, "epoch": 34} {"train_loss": -2.8387429543903897, "global_step": 1469, "epoch": 34, "val_loss": 517261.9375} {"train_loss": -2.8109331130981445, "global_step": 1470, "epoch": 35} {"train_loss": -2.7554399967193604, "global_step": 1471, "epoch": 35} {"train_loss": -2.6304590702056885, "global_step": 1472, "epoch": 35} {"train_loss": -2.9522671699523926, "global_step": 1473, "epoch": 35} {"train_loss": -2.872270107269287, "global_step": 1474, "epoch": 35} {"train_loss": -2.7705330848693848, "global_step": 1475, "epoch": 35} {"train_loss": -2.888218641281128, "global_step": 1476, "epoch": 35} {"train_loss": -2.803806781768799, "global_step": 1477, "epoch": 35} {"train_loss": -2.8824682235717773, "global_step": 1478, "epoch": 35} {"train_loss": -2.897890329360962, "global_step": 1479, "epoch": 35} {"train_loss": -2.952976703643799, "global_step": 1480, "epoch": 35} {"train_loss": -2.7401387691497803, "global_step": 1481, "epoch": 35} {"train_loss": -2.758167028427124, "global_step": 1482, "epoch": 35} {"train_loss": -2.969487190246582, "global_step": 1483, "epoch": 35} {"train_loss": -2.854898691177368, "global_step": 1484, "epoch": 35} {"train_loss": -2.9047932624816895, "global_step": 1485, "epoch": 35} {"train_loss": -2.9029836654663086, "global_step": 1486, "epoch": 35} {"train_loss": -2.8077585697174072, "global_step": 1487, "epoch": 35} {"train_loss": -2.930577278137207, "global_step": 1488, "epoch": 35} {"train_loss": -2.7451798915863037, "global_step": 1489, "epoch": 35} {"train_loss": -2.8115556240081787, "global_step": 1490, "epoch": 35} {"train_loss": -2.9592432975769043, "global_step": 1491, "epoch": 35} {"train_loss": -2.6226391792297363, "global_step": 1492, "epoch": 35} {"train_loss": -2.8098983764648438, "global_step": 1493, "epoch": 35} {"train_loss": -2.87168550491333, "global_step": 1494, "epoch": 35} {"train_loss": -2.7491395473480225, "global_step": 1495, "epoch": 35} {"train_loss": -2.792135715484619, "global_step": 1496, "epoch": 35} {"train_loss": -2.922973155975342, "global_step": 1497, "epoch": 35} {"train_loss": -2.859004020690918, "global_step": 1498, "epoch": 35} {"train_loss": -2.8209192752838135, "global_step": 1499, "epoch": 35} {"train_loss": -2.882363796234131, "global_step": 1500, "epoch": 35} {"train_loss": -2.841780185699463, "global_step": 1501, "epoch": 35} {"train_loss": -2.6364946365356445, "global_step": 1502, "epoch": 35} {"train_loss": -2.9999852180480957, "global_step": 1503, "epoch": 35} {"train_loss": -2.8246524333953857, "global_step": 1504, "epoch": 35} {"train_loss": -2.7361128330230713, "global_step": 1505, "epoch": 35} {"train_loss": -2.8443217277526855, "global_step": 1506, "epoch": 35} {"train_loss": -2.7441325187683105, "global_step": 1507, "epoch": 35} {"train_loss": -2.8701438903808594, "global_step": 1508, "epoch": 35} {"train_loss": -2.796173572540283, "global_step": 1509, "epoch": 35} {"train_loss": -2.8427481651306152, "global_step": 1510, "epoch": 35} {"train_loss": -2.830886801083883, "global_step": 1511, "epoch": 35, "val_loss": 489511.40625} {"train_loss": -2.9986181259155273, "global_step": 1512, "epoch": 36} {"train_loss": -2.6998131275177, "global_step": 1513, "epoch": 36} {"train_loss": -2.930049180984497, "global_step": 1514, "epoch": 36} {"train_loss": -2.750807762145996, "global_step": 1515, "epoch": 36} {"train_loss": -2.9937949180603027, "global_step": 1516, "epoch": 36} {"train_loss": -2.826730966567993, "global_step": 1517, "epoch": 36} {"train_loss": -2.936190605163574, "global_step": 1518, "epoch": 36} {"train_loss": -2.7737088203430176, "global_step": 1519, "epoch": 36} {"train_loss": -2.8566441535949707, "global_step": 1520, "epoch": 36} {"train_loss": -2.862736701965332, "global_step": 1521, "epoch": 36} {"train_loss": -2.949314594268799, "global_step": 1522, "epoch": 36} {"train_loss": -2.9063844680786133, "global_step": 1523, "epoch": 36} {"train_loss": -2.834434747695923, "global_step": 1524, "epoch": 36} {"train_loss": -2.9132232666015625, "global_step": 1525, "epoch": 36} {"train_loss": -2.778402328491211, "global_step": 1526, "epoch": 36} {"train_loss": -2.8548989295959473, "global_step": 1527, "epoch": 36} {"train_loss": -3.014238119125366, "global_step": 1528, "epoch": 36} {"train_loss": -3.024970054626465, "global_step": 1529, "epoch": 36} {"train_loss": -2.695309638977051, "global_step": 1530, "epoch": 36} {"train_loss": -2.8828606605529785, "global_step": 1531, "epoch": 36} {"train_loss": -2.9221887588500977, "global_step": 1532, "epoch": 36} {"train_loss": -3.0058109760284424, "global_step": 1533, "epoch": 36} {"train_loss": -2.861395835876465, "global_step": 1534, "epoch": 36} {"train_loss": -2.7760324478149414, "global_step": 1535, "epoch": 36} {"train_loss": -2.878500461578369, "global_step": 1536, "epoch": 36} {"train_loss": -3.007744789123535, "global_step": 1537, "epoch": 36} {"train_loss": -2.917667865753174, "global_step": 1538, "epoch": 36} {"train_loss": -2.8034911155700684, "global_step": 1539, "epoch": 36} {"train_loss": -2.959136724472046, "global_step": 1540, "epoch": 36} {"train_loss": -2.9323487281799316, "global_step": 1541, "epoch": 36} {"train_loss": -2.9420971870422363, "global_step": 1542, "epoch": 36} {"train_loss": -2.866434097290039, "global_step": 1543, "epoch": 36} {"train_loss": -2.9969611167907715, "global_step": 1544, "epoch": 36} {"train_loss": -2.887706756591797, "global_step": 1545, "epoch": 36} {"train_loss": -2.915966272354126, "global_step": 1546, "epoch": 36} {"train_loss": -2.873061180114746, "global_step": 1547, "epoch": 36} {"train_loss": -3.039881944656372, "global_step": 1548, "epoch": 36} {"train_loss": -2.9469523429870605, "global_step": 1549, "epoch": 36} {"train_loss": -2.924302816390991, "global_step": 1550, "epoch": 36} {"train_loss": -3.034193992614746, "global_step": 1551, "epoch": 36} {"train_loss": -3.06384539604187, "global_step": 1552, "epoch": 36} {"train_loss": -2.9071316719055176, "global_step": 1553, "epoch": 36, "val_loss": 468614.75} {"train_loss": -2.8469316959381104, "global_step": 1554, "epoch": 37} {"train_loss": -2.8363614082336426, "global_step": 1555, "epoch": 37} {"train_loss": -2.864015579223633, "global_step": 1556, "epoch": 37} {"train_loss": -2.817336320877075, "global_step": 1557, "epoch": 37} {"train_loss": -3.014511823654175, "global_step": 1558, "epoch": 37} {"train_loss": -2.6621413230895996, "global_step": 1559, "epoch": 37} {"train_loss": -2.8970284461975098, "global_step": 1560, "epoch": 37} {"train_loss": -2.8653905391693115, "global_step": 1561, "epoch": 37} {"train_loss": -2.8566904067993164, "global_step": 1562, "epoch": 37} {"train_loss": -2.9445955753326416, "global_step": 1563, "epoch": 37} {"train_loss": -2.97021484375, "global_step": 1564, "epoch": 37} {"train_loss": -2.9857723712921143, "global_step": 1565, "epoch": 37} {"train_loss": -2.8818514347076416, "global_step": 1566, "epoch": 37} {"train_loss": -2.878748893737793, "global_step": 1567, "epoch": 37} {"train_loss": -2.940182685852051, "global_step": 1568, "epoch": 37} {"train_loss": -2.836113929748535, "global_step": 1569, "epoch": 37} {"train_loss": -3.018693447113037, "global_step": 1570, "epoch": 37} {"train_loss": -2.984524726867676, "global_step": 1571, "epoch": 37} {"train_loss": -2.9584224224090576, "global_step": 1572, "epoch": 37} {"train_loss": -2.941225051879883, "global_step": 1573, "epoch": 37} {"train_loss": -3.0070409774780273, "global_step": 1574, "epoch": 37} {"train_loss": -2.9832515716552734, "global_step": 1575, "epoch": 37} {"train_loss": -2.9257616996765137, "global_step": 1576, "epoch": 37} {"train_loss": -2.9733071327209473, "global_step": 1577, "epoch": 37} {"train_loss": -2.8415403366088867, "global_step": 1578, "epoch": 37} {"train_loss": -2.9343981742858887, "global_step": 1579, "epoch": 37} {"train_loss": -2.9351868629455566, "global_step": 1580, "epoch": 37} {"train_loss": -2.952759027481079, "global_step": 1581, "epoch": 37} {"train_loss": -3.0697808265686035, "global_step": 1582, "epoch": 37} {"train_loss": -2.9320926666259766, "global_step": 1583, "epoch": 37} {"train_loss": -2.9274892807006836, "global_step": 1584, "epoch": 37} {"train_loss": -2.8000869750976562, "global_step": 1585, "epoch": 37} {"train_loss": -3.0604376792907715, "global_step": 1586, "epoch": 37} {"train_loss": -2.9429383277893066, "global_step": 1587, "epoch": 37} {"train_loss": -2.8587546348571777, "global_step": 1588, "epoch": 37} {"train_loss": -2.9631171226501465, "global_step": 1589, "epoch": 37} {"train_loss": -2.8439245223999023, "global_step": 1590, "epoch": 37} {"train_loss": -2.9094398021698, "global_step": 1591, "epoch": 37} {"train_loss": -3.0225179195404053, "global_step": 1592, "epoch": 37} {"train_loss": -2.987067699432373, "global_step": 1593, "epoch": 37} {"train_loss": -2.963653087615967, "global_step": 1594, "epoch": 37} {"train_loss": -2.9252802360625494, "global_step": 1595, "epoch": 37, "val_loss": 443645.9375} {"train_loss": -2.7509732246398926, "global_step": 1596, "epoch": 38} {"train_loss": -3.039137363433838, "global_step": 1597, "epoch": 38} {"train_loss": -2.9903407096862793, "global_step": 1598, "epoch": 38} {"train_loss": -2.8505687713623047, "global_step": 1599, "epoch": 38} {"train_loss": -2.8398072719573975, "global_step": 1600, "epoch": 38} {"train_loss": -2.8300256729125977, "global_step": 1601, "epoch": 38} {"train_loss": -2.8152565956115723, "global_step": 1602, "epoch": 38} {"train_loss": -2.948819160461426, "global_step": 1603, "epoch": 38} {"train_loss": -3.0616707801818848, "global_step": 1604, "epoch": 38} {"train_loss": -3.006049633026123, "global_step": 1605, "epoch": 38} {"train_loss": -2.866577386856079, "global_step": 1606, "epoch": 38} {"train_loss": -3.0856385231018066, "global_step": 1607, "epoch": 38} {"train_loss": -2.8325493335723877, "global_step": 1608, "epoch": 38} {"train_loss": -3.0775840282440186, "global_step": 1609, "epoch": 38} {"train_loss": -2.9802632331848145, "global_step": 1610, "epoch": 38} {"train_loss": -2.9779844284057617, "global_step": 1611, "epoch": 38} {"train_loss": -2.939819097518921, "global_step": 1612, "epoch": 38} {"train_loss": -3.1356325149536133, "global_step": 1613, "epoch": 38} {"train_loss": -2.9556870460510254, "global_step": 1614, "epoch": 38} {"train_loss": -3.03702974319458, "global_step": 1615, "epoch": 38} {"train_loss": -3.0156078338623047, "global_step": 1616, "epoch": 38} {"train_loss": -2.9764811992645264, "global_step": 1617, "epoch": 38} {"train_loss": -2.9434666633605957, "global_step": 1618, "epoch": 38} {"train_loss": -2.7282121181488037, "global_step": 1619, "epoch": 38} {"train_loss": -2.9382565021514893, "global_step": 1620, "epoch": 38} {"train_loss": -2.850032329559326, "global_step": 1621, "epoch": 38} {"train_loss": -2.7353262901306152, "global_step": 1622, "epoch": 38} {"train_loss": -2.9654839038848877, "global_step": 1623, "epoch": 38} {"train_loss": -2.790565252304077, "global_step": 1624, "epoch": 38} {"train_loss": -2.782421112060547, "global_step": 1625, "epoch": 38} {"train_loss": -3.0670254230499268, "global_step": 1626, "epoch": 38} {"train_loss": -2.6309316158294678, "global_step": 1627, "epoch": 38} {"train_loss": -2.7131335735321045, "global_step": 1628, "epoch": 38} {"train_loss": -2.9363274574279785, "global_step": 1629, "epoch": 38} {"train_loss": -2.7620913982391357, "global_step": 1630, "epoch": 38} {"train_loss": -2.917203664779663, "global_step": 1631, "epoch": 38} {"train_loss": -2.7943825721740723, "global_step": 1632, "epoch": 38} {"train_loss": -2.9198989868164062, "global_step": 1633, "epoch": 38} {"train_loss": -2.924947500228882, "global_step": 1634, "epoch": 38} {"train_loss": -3.034681558609009, "global_step": 1635, "epoch": 38} {"train_loss": -2.8586199283599854, "global_step": 1636, "epoch": 38} {"train_loss": -2.9139473097664967, "global_step": 1637, "epoch": 38, "val_loss": 417626.90625} {"train_loss": -2.9162731170654297, "global_step": 1638, "epoch": 39} {"train_loss": -2.9730961322784424, "global_step": 1639, "epoch": 39} {"train_loss": -2.9281601905822754, "global_step": 1640, "epoch": 39} {"train_loss": -2.9638209342956543, "global_step": 1641, "epoch": 39} {"train_loss": -3.01320743560791, "global_step": 1642, "epoch": 39} {"train_loss": -3.0108535289764404, "global_step": 1643, "epoch": 39} {"train_loss": -2.988635540008545, "global_step": 1644, "epoch": 39} {"train_loss": -3.0773510932922363, "global_step": 1645, "epoch": 39} {"train_loss": -3.012629270553589, "global_step": 1646, "epoch": 39} {"train_loss": -3.0215682983398438, "global_step": 1647, "epoch": 39} {"train_loss": -3.026395559310913, "global_step": 1648, "epoch": 39} {"train_loss": -3.0665488243103027, "global_step": 1649, "epoch": 39} {"train_loss": -2.9794201850891113, "global_step": 1650, "epoch": 39} {"train_loss": -3.053218126296997, "global_step": 1651, "epoch": 39} {"train_loss": -2.931467294692993, "global_step": 1652, "epoch": 39} {"train_loss": -3.118649959564209, "global_step": 1653, "epoch": 39} {"train_loss": -2.9807333946228027, "global_step": 1654, "epoch": 39} {"train_loss": -2.8766188621520996, "global_step": 1655, "epoch": 39} {"train_loss": -3.022754430770874, "global_step": 1656, "epoch": 39} {"train_loss": -3.0407631397247314, "global_step": 1657, "epoch": 39} {"train_loss": -2.9396982192993164, "global_step": 1658, "epoch": 39} {"train_loss": -3.066652774810791, "global_step": 1659, "epoch": 39} {"train_loss": -3.0807411670684814, "global_step": 1660, "epoch": 39} {"train_loss": -3.090423822402954, "global_step": 1661, "epoch": 39} {"train_loss": -2.9959685802459717, "global_step": 1662, "epoch": 39} {"train_loss": -3.016782760620117, "global_step": 1663, "epoch": 39} {"train_loss": -2.997406005859375, "global_step": 1664, "epoch": 39} {"train_loss": -3.110586404800415, "global_step": 1665, "epoch": 39} {"train_loss": -3.041245460510254, "global_step": 1666, "epoch": 39} {"train_loss": -3.2068252563476562, "global_step": 1667, "epoch": 39} {"train_loss": -2.955512046813965, "global_step": 1668, "epoch": 39} {"train_loss": -2.9520440101623535, "global_step": 1669, "epoch": 39} {"train_loss": -3.216052770614624, "global_step": 1670, "epoch": 39} {"train_loss": -3.13580322265625, "global_step": 1671, "epoch": 39} {"train_loss": -3.0260841846466064, "global_step": 1672, "epoch": 39} {"train_loss": -3.1202900409698486, "global_step": 1673, "epoch": 39} {"train_loss": -3.058995246887207, "global_step": 1674, "epoch": 39} {"train_loss": -2.9833462238311768, "global_step": 1675, "epoch": 39} {"train_loss": -3.0758352279663086, "global_step": 1676, "epoch": 39} {"train_loss": -2.943049192428589, "global_step": 1677, "epoch": 39} {"train_loss": -2.9626858234405518, "global_step": 1678, "epoch": 39} {"train_loss": -3.027320526895069, "global_step": 1679, "epoch": 39, "val_loss": 399262.90625} {"train_loss": -2.9658541679382324, "global_step": 1680, "epoch": 40} {"train_loss": -3.0059945583343506, "global_step": 1681, "epoch": 40} {"train_loss": -3.040574550628662, "global_step": 1682, "epoch": 40} {"train_loss": -3.11708402633667, "global_step": 1683, "epoch": 40} {"train_loss": -3.0199053287506104, "global_step": 1684, "epoch": 40} {"train_loss": -2.9564008712768555, "global_step": 1685, "epoch": 40} {"train_loss": -2.9818406105041504, "global_step": 1686, "epoch": 40} {"train_loss": -2.991981029510498, "global_step": 1687, "epoch": 40} {"train_loss": -3.0826735496520996, "global_step": 1688, "epoch": 40} {"train_loss": -3.029930591583252, "global_step": 1689, "epoch": 40} {"train_loss": -2.9598171710968018, "global_step": 1690, "epoch": 40} {"train_loss": -3.0890235900878906, "global_step": 1691, "epoch": 40} {"train_loss": -2.7377090454101562, "global_step": 1692, "epoch": 40} {"train_loss": -3.0375232696533203, "global_step": 1693, "epoch": 40} {"train_loss": -2.8104543685913086, "global_step": 1694, "epoch": 40} {"train_loss": -3.132852077484131, "global_step": 1695, "epoch": 40} {"train_loss": -3.0215044021606445, "global_step": 1696, "epoch": 40} {"train_loss": -2.9164769649505615, "global_step": 1697, "epoch": 40} {"train_loss": -2.918010950088501, "global_step": 1698, "epoch": 40} {"train_loss": -2.9225175380706787, "global_step": 1699, "epoch": 40} {"train_loss": -3.115291118621826, "global_step": 1700, "epoch": 40} {"train_loss": -2.897179126739502, "global_step": 1701, "epoch": 40} {"train_loss": -2.9566597938537598, "global_step": 1702, "epoch": 40} {"train_loss": -3.0082714557647705, "global_step": 1703, "epoch": 40} {"train_loss": -3.178957223892212, "global_step": 1704, "epoch": 40} {"train_loss": -2.8829097747802734, "global_step": 1705, "epoch": 40} {"train_loss": -3.0097246170043945, "global_step": 1706, "epoch": 40} {"train_loss": -2.9668593406677246, "global_step": 1707, "epoch": 40} {"train_loss": -3.0377883911132812, "global_step": 1708, "epoch": 40} {"train_loss": -3.1090989112854004, "global_step": 1709, "epoch": 40} {"train_loss": -2.9887337684631348, "global_step": 1710, "epoch": 40} {"train_loss": -3.080648422241211, "global_step": 1711, "epoch": 40} {"train_loss": -3.0313801765441895, "global_step": 1712, "epoch": 40} {"train_loss": -3.122478485107422, "global_step": 1713, "epoch": 40} {"train_loss": -3.1103148460388184, "global_step": 1714, "epoch": 40} {"train_loss": -3.079040050506592, "global_step": 1715, "epoch": 40} {"train_loss": -3.070673942565918, "global_step": 1716, "epoch": 40} {"train_loss": -3.197610378265381, "global_step": 1717, "epoch": 40} {"train_loss": -2.9062023162841797, "global_step": 1718, "epoch": 40} {"train_loss": -3.0841758251190186, "global_step": 1719, "epoch": 40} {"train_loss": -3.087769031524658, "global_step": 1720, "epoch": 40} {"train_loss": -3.0188148532594954, "global_step": 1721, "epoch": 40, "val_loss": 377757.125} {"train_loss": -3.163186550140381, "global_step": 1722, "epoch": 41} {"train_loss": -3.20664119720459, "global_step": 1723, "epoch": 41} {"train_loss": -2.9183483123779297, "global_step": 1724, "epoch": 41} {"train_loss": -3.130723476409912, "global_step": 1725, "epoch": 41} {"train_loss": -3.119762897491455, "global_step": 1726, "epoch": 41} {"train_loss": -3.0781545639038086, "global_step": 1727, "epoch": 41} {"train_loss": -3.103060483932495, "global_step": 1728, "epoch": 41} {"train_loss": -3.287156105041504, "global_step": 1729, "epoch": 41} {"train_loss": -3.0635643005371094, "global_step": 1730, "epoch": 41} {"train_loss": -3.143606185913086, "global_step": 1731, "epoch": 41} {"train_loss": -3.1166398525238037, "global_step": 1732, "epoch": 41} {"train_loss": -3.066969871520996, "global_step": 1733, "epoch": 41} {"train_loss": -2.8670268058776855, "global_step": 1734, "epoch": 41} {"train_loss": -3.171806812286377, "global_step": 1735, "epoch": 41} {"train_loss": -3.2122113704681396, "global_step": 1736, "epoch": 41} {"train_loss": -2.9057388305664062, "global_step": 1737, "epoch": 41} {"train_loss": -3.114015579223633, "global_step": 1738, "epoch": 41} {"train_loss": -3.1297168731689453, "global_step": 1739, "epoch": 41} {"train_loss": -3.072751522064209, "global_step": 1740, "epoch": 41} {"train_loss": -3.1674890518188477, "global_step": 1741, "epoch": 41} {"train_loss": -3.072445869445801, "global_step": 1742, "epoch": 41} {"train_loss": -3.2257606983184814, "global_step": 1743, "epoch": 41} {"train_loss": -3.128514051437378, "global_step": 1744, "epoch": 41} {"train_loss": -3.111509323120117, "global_step": 1745, "epoch": 41} {"train_loss": -3.127548933029175, "global_step": 1746, "epoch": 41} {"train_loss": -3.0472800731658936, "global_step": 1747, "epoch": 41} {"train_loss": -3.1777546405792236, "global_step": 1748, "epoch": 41} {"train_loss": -2.9652462005615234, "global_step": 1749, "epoch": 41} {"train_loss": -3.0432446002960205, "global_step": 1750, "epoch": 41} {"train_loss": -3.1692004203796387, "global_step": 1751, "epoch": 41} {"train_loss": -3.00819993019104, "global_step": 1752, "epoch": 41} {"train_loss": -3.0833961963653564, "global_step": 1753, "epoch": 41} {"train_loss": -3.1904311180114746, "global_step": 1754, "epoch": 41} {"train_loss": -3.031121253967285, "global_step": 1755, "epoch": 41} {"train_loss": -3.131488800048828, "global_step": 1756, "epoch": 41} {"train_loss": -3.1974334716796875, "global_step": 1757, "epoch": 41} {"train_loss": -3.120621681213379, "global_step": 1758, "epoch": 41} {"train_loss": -3.217556953430176, "global_step": 1759, "epoch": 41} {"train_loss": -2.9333062171936035, "global_step": 1760, "epoch": 41} {"train_loss": -3.1163265705108643, "global_step": 1761, "epoch": 41} {"train_loss": -3.1632089614868164, "global_step": 1762, "epoch": 41} {"train_loss": -3.1042096558071317, "global_step": 1763, "epoch": 41, "val_loss": 356756.4375} {"train_loss": -3.149766445159912, "global_step": 1764, "epoch": 42} {"train_loss": -3.3165054321289062, "global_step": 1765, "epoch": 42} {"train_loss": -3.2682297229766846, "global_step": 1766, "epoch": 42} {"train_loss": -3.127654552459717, "global_step": 1767, "epoch": 42} {"train_loss": -3.0972137451171875, "global_step": 1768, "epoch": 42} {"train_loss": -3.0044384002685547, "global_step": 1769, "epoch": 42} {"train_loss": -3.148592948913574, "global_step": 1770, "epoch": 42} {"train_loss": -3.1647868156433105, "global_step": 1771, "epoch": 42} {"train_loss": -2.8229103088378906, "global_step": 1772, "epoch": 42} {"train_loss": -3.0730888843536377, "global_step": 1773, "epoch": 42} {"train_loss": -2.9065990447998047, "global_step": 1774, "epoch": 42} {"train_loss": -3.183699369430542, "global_step": 1775, "epoch": 42} {"train_loss": -2.985366106033325, "global_step": 1776, "epoch": 42} {"train_loss": -3.076028347015381, "global_step": 1777, "epoch": 42} {"train_loss": -3.0344150066375732, "global_step": 1778, "epoch": 42} {"train_loss": -2.9576966762542725, "global_step": 1779, "epoch": 42} {"train_loss": -3.1734824180603027, "global_step": 1780, "epoch": 42} {"train_loss": -2.9371604919433594, "global_step": 1781, "epoch": 42} {"train_loss": -3.1159021854400635, "global_step": 1782, "epoch": 42} {"train_loss": -2.9967269897460938, "global_step": 1783, "epoch": 42} {"train_loss": -3.161318302154541, "global_step": 1784, "epoch": 42} {"train_loss": -3.165780544281006, "global_step": 1785, "epoch": 42} {"train_loss": -3.0760300159454346, "global_step": 1786, "epoch": 42} {"train_loss": -3.09420108795166, "global_step": 1787, "epoch": 42} {"train_loss": -3.0927658081054688, "global_step": 1788, "epoch": 42} {"train_loss": -3.063697576522827, "global_step": 1789, "epoch": 42} {"train_loss": -3.0953221321105957, "global_step": 1790, "epoch": 42} {"train_loss": -3.1778950691223145, "global_step": 1791, "epoch": 42} {"train_loss": -3.215135097503662, "global_step": 1792, "epoch": 42} {"train_loss": -3.1976070404052734, "global_step": 1793, "epoch": 42} {"train_loss": -2.963414192199707, "global_step": 1794, "epoch": 42} {"train_loss": -3.218787670135498, "global_step": 1795, "epoch": 42} {"train_loss": -3.122497081756592, "global_step": 1796, "epoch": 42} {"train_loss": -3.163233518600464, "global_step": 1797, "epoch": 42} {"train_loss": -3.1392788887023926, "global_step": 1798, "epoch": 42} {"train_loss": -3.149240493774414, "global_step": 1799, "epoch": 42} {"train_loss": -3.1013472080230713, "global_step": 1800, "epoch": 42} {"train_loss": -3.2360005378723145, "global_step": 1801, "epoch": 42} {"train_loss": -3.047910213470459, "global_step": 1802, "epoch": 42} {"train_loss": -3.001631021499634, "global_step": 1803, "epoch": 42} {"train_loss": -3.1595582962036133, "global_step": 1804, "epoch": 42} {"train_loss": -3.103185318765186, "global_step": 1805, "epoch": 42, "val_loss": 343067.6875} {"train_loss": -2.945175886154175, "global_step": 1806, "epoch": 43} {"train_loss": -3.291184663772583, "global_step": 1807, "epoch": 43} {"train_loss": -3.1233553886413574, "global_step": 1808, "epoch": 43} {"train_loss": -3.042865753173828, "global_step": 1809, "epoch": 43} {"train_loss": -3.1870477199554443, "global_step": 1810, "epoch": 43} {"train_loss": -3.062617301940918, "global_step": 1811, "epoch": 43} {"train_loss": -3.1398110389709473, "global_step": 1812, "epoch": 43} {"train_loss": -2.9623758792877197, "global_step": 1813, "epoch": 43} {"train_loss": -3.0674853324890137, "global_step": 1814, "epoch": 43} {"train_loss": -3.2289645671844482, "global_step": 1815, "epoch": 43} {"train_loss": -3.0046274662017822, "global_step": 1816, "epoch": 43} {"train_loss": -3.280595302581787, "global_step": 1817, "epoch": 43} {"train_loss": -2.953104257583618, "global_step": 1818, "epoch": 43} {"train_loss": -2.9763240814208984, "global_step": 1819, "epoch": 43} {"train_loss": -3.016829013824463, "global_step": 1820, "epoch": 43} {"train_loss": -2.840693950653076, "global_step": 1821, "epoch": 43} {"train_loss": -3.172978401184082, "global_step": 1822, "epoch": 43} {"train_loss": -2.7442445755004883, "global_step": 1823, "epoch": 43} {"train_loss": -3.1775481700897217, "global_step": 1824, "epoch": 43} {"train_loss": -2.9673280715942383, "global_step": 1825, "epoch": 43} {"train_loss": -3.1349642276763916, "global_step": 1826, "epoch": 43} {"train_loss": -2.9671359062194824, "global_step": 1827, "epoch": 43} {"train_loss": -3.032829999923706, "global_step": 1828, "epoch": 43} {"train_loss": -3.0519862174987793, "global_step": 1829, "epoch": 43} {"train_loss": -3.0472664833068848, "global_step": 1830, "epoch": 43} {"train_loss": -3.0836126804351807, "global_step": 1831, "epoch": 43} {"train_loss": -2.9530444145202637, "global_step": 1832, "epoch": 43} {"train_loss": -3.1744959354400635, "global_step": 1833, "epoch": 43} {"train_loss": -3.0200743675231934, "global_step": 1834, "epoch": 43} {"train_loss": -3.028444528579712, "global_step": 1835, "epoch": 43} {"train_loss": -3.1367311477661133, "global_step": 1836, "epoch": 43} {"train_loss": -3.268935203552246, "global_step": 1837, "epoch": 43} {"train_loss": -3.291069269180298, "global_step": 1838, "epoch": 43} {"train_loss": -3.1858129501342773, "global_step": 1839, "epoch": 43} {"train_loss": -3.270322322845459, "global_step": 1840, "epoch": 43} {"train_loss": -3.106576442718506, "global_step": 1841, "epoch": 43} {"train_loss": -3.2355239391326904, "global_step": 1842, "epoch": 43} {"train_loss": -3.188297748565674, "global_step": 1843, "epoch": 43} {"train_loss": -3.0770950317382812, "global_step": 1844, "epoch": 43} {"train_loss": -3.2638087272644043, "global_step": 1845, "epoch": 43} {"train_loss": -3.1130783557891846, "global_step": 1846, "epoch": 43} {"train_loss": -3.095132526897249, "global_step": 1847, "epoch": 43, "val_loss": 318555.125} {"train_loss": -3.2572176456451416, "global_step": 1848, "epoch": 44} {"train_loss": -3.3198766708374023, "global_step": 1849, "epoch": 44} {"train_loss": -3.0999836921691895, "global_step": 1850, "epoch": 44} {"train_loss": -3.1717679500579834, "global_step": 1851, "epoch": 44} {"train_loss": -3.2540454864501953, "global_step": 1852, "epoch": 44} {"train_loss": -3.2704110145568848, "global_step": 1853, "epoch": 44} {"train_loss": -3.1179895401000977, "global_step": 1854, "epoch": 44} {"train_loss": -3.0156521797180176, "global_step": 1855, "epoch": 44} {"train_loss": -3.1668615341186523, "global_step": 1856, "epoch": 44} {"train_loss": -3.142596483230591, "global_step": 1857, "epoch": 44} {"train_loss": -3.068816661834717, "global_step": 1858, "epoch": 44} {"train_loss": -3.2991602420806885, "global_step": 1859, "epoch": 44} {"train_loss": -3.116854429244995, "global_step": 1860, "epoch": 44} {"train_loss": -3.0084588527679443, "global_step": 1861, "epoch": 44} {"train_loss": -3.2918777465820312, "global_step": 1862, "epoch": 44} {"train_loss": -3.0856552124023438, "global_step": 1863, "epoch": 44} {"train_loss": -3.040001392364502, "global_step": 1864, "epoch": 44} {"train_loss": -3.097827196121216, "global_step": 1865, "epoch": 44} {"train_loss": -3.1461434364318848, "global_step": 1866, "epoch": 44} {"train_loss": -3.1038217544555664, "global_step": 1867, "epoch": 44} {"train_loss": -3.10208797454834, "global_step": 1868, "epoch": 44} {"train_loss": -3.0803165435791016, "global_step": 1869, "epoch": 44} {"train_loss": -3.183257579803467, "global_step": 1870, "epoch": 44} {"train_loss": -3.110764980316162, "global_step": 1871, "epoch": 44} {"train_loss": -3.252849817276001, "global_step": 1872, "epoch": 44} {"train_loss": -3.169200897216797, "global_step": 1873, "epoch": 44} {"train_loss": -3.0896005630493164, "global_step": 1874, "epoch": 44} {"train_loss": -3.3587136268615723, "global_step": 1875, "epoch": 44} {"train_loss": -3.072556495666504, "global_step": 1876, "epoch": 44} {"train_loss": -3.218268394470215, "global_step": 1877, "epoch": 44} {"train_loss": -3.1241202354431152, "global_step": 1878, "epoch": 44} {"train_loss": -3.268552780151367, "global_step": 1879, "epoch": 44} {"train_loss": -3.318206310272217, "global_step": 1880, "epoch": 44} {"train_loss": -3.0033109188079834, "global_step": 1881, "epoch": 44} {"train_loss": -3.1163225173950195, "global_step": 1882, "epoch": 44} {"train_loss": -3.297638416290283, "global_step": 1883, "epoch": 44} {"train_loss": -3.277562141418457, "global_step": 1884, "epoch": 44} {"train_loss": -3.2212905883789062, "global_step": 1885, "epoch": 44} {"train_loss": -3.2110953330993652, "global_step": 1886, "epoch": 44} {"train_loss": -3.305452585220337, "global_step": 1887, "epoch": 44} {"train_loss": -3.1984241008758545, "global_step": 1888, "epoch": 44} {"train_loss": -3.1768255631128945, "global_step": 1889, "epoch": 44, "val_loss": 306920.4375} {"train_loss": -3.2445051670074463, "global_step": 1890, "epoch": 45} {"train_loss": -3.375075340270996, "global_step": 1891, "epoch": 45} {"train_loss": -3.2552103996276855, "global_step": 1892, "epoch": 45} {"train_loss": -3.3679909706115723, "global_step": 1893, "epoch": 45} {"train_loss": -3.229471445083618, "global_step": 1894, "epoch": 45} {"train_loss": -3.328657627105713, "global_step": 1895, "epoch": 45} {"train_loss": -2.986231565475464, "global_step": 1896, "epoch": 45} {"train_loss": -3.2441344261169434, "global_step": 1897, "epoch": 45} {"train_loss": -3.320239543914795, "global_step": 1898, "epoch": 45} {"train_loss": -3.198319911956787, "global_step": 1899, "epoch": 45} {"train_loss": -3.3343024253845215, "global_step": 1900, "epoch": 45} {"train_loss": -3.230175018310547, "global_step": 1901, "epoch": 45} {"train_loss": -3.2145771980285645, "global_step": 1902, "epoch": 45} {"train_loss": -3.319458484649658, "global_step": 1903, "epoch": 45} {"train_loss": -3.15645694732666, "global_step": 1904, "epoch": 45} {"train_loss": -3.0362727642059326, "global_step": 1905, "epoch": 45} {"train_loss": -3.1907436847686768, "global_step": 1906, "epoch": 45} {"train_loss": -2.908111572265625, "global_step": 1907, "epoch": 45} {"train_loss": -3.2878313064575195, "global_step": 1908, "epoch": 45} {"train_loss": -3.0035252571105957, "global_step": 1909, "epoch": 45} {"train_loss": -3.1516571044921875, "global_step": 1910, "epoch": 45} {"train_loss": -3.3003690242767334, "global_step": 1911, "epoch": 45} {"train_loss": -3.1626157760620117, "global_step": 1912, "epoch": 45} {"train_loss": -3.352203607559204, "global_step": 1913, "epoch": 45} {"train_loss": -3.175361156463623, "global_step": 1914, "epoch": 45} {"train_loss": -3.1385507583618164, "global_step": 1915, "epoch": 45} {"train_loss": -3.3232269287109375, "global_step": 1916, "epoch": 45} {"train_loss": -3.326216459274292, "global_step": 1917, "epoch": 45} {"train_loss": -3.4052202701568604, "global_step": 1918, "epoch": 45} {"train_loss": -3.162815809249878, "global_step": 1919, "epoch": 45} {"train_loss": -3.289788007736206, "global_step": 1920, "epoch": 45} {"train_loss": -3.129851818084717, "global_step": 1921, "epoch": 45} {"train_loss": -3.221414804458618, "global_step": 1922, "epoch": 45} {"train_loss": -3.234645128250122, "global_step": 1923, "epoch": 45} {"train_loss": -3.1210622787475586, "global_step": 1924, "epoch": 45} {"train_loss": -3.2376351356506348, "global_step": 1925, "epoch": 45} {"train_loss": -3.245983600616455, "global_step": 1926, "epoch": 45} {"train_loss": -3.057968854904175, "global_step": 1927, "epoch": 45} {"train_loss": -3.0670485496520996, "global_step": 1928, "epoch": 45} {"train_loss": -3.468289852142334, "global_step": 1929, "epoch": 45} {"train_loss": -3.293867826461792, "global_step": 1930, "epoch": 45} {"train_loss": -3.223025776091076, "global_step": 1931, "epoch": 45, "val_loss": 288692.21875} {"train_loss": -3.166771173477173, "global_step": 1932, "epoch": 46} {"train_loss": -3.381442070007324, "global_step": 1933, "epoch": 46} {"train_loss": -3.2052903175354004, "global_step": 1934, "epoch": 46} {"train_loss": -3.299403667449951, "global_step": 1935, "epoch": 46} {"train_loss": -3.2121572494506836, "global_step": 1936, "epoch": 46} {"train_loss": -3.2667319774627686, "global_step": 1937, "epoch": 46} {"train_loss": -3.2537097930908203, "global_step": 1938, "epoch": 46} {"train_loss": -3.328381299972534, "global_step": 1939, "epoch": 46} {"train_loss": -3.315091133117676, "global_step": 1940, "epoch": 46} {"train_loss": -3.3174126148223877, "global_step": 1941, "epoch": 46} {"train_loss": -3.182112216949463, "global_step": 1942, "epoch": 46} {"train_loss": -3.179872989654541, "global_step": 1943, "epoch": 46} {"train_loss": -3.3625855445861816, "global_step": 1944, "epoch": 46} {"train_loss": -3.447427272796631, "global_step": 1945, "epoch": 46} {"train_loss": -3.195235013961792, "global_step": 1946, "epoch": 46} {"train_loss": -3.1685709953308105, "global_step": 1947, "epoch": 46} {"train_loss": -3.2200233936309814, "global_step": 1948, "epoch": 46} {"train_loss": -3.38983154296875, "global_step": 1949, "epoch": 46} {"train_loss": -3.346787929534912, "global_step": 1950, "epoch": 46} {"train_loss": -3.2472012042999268, "global_step": 1951, "epoch": 46} {"train_loss": -3.0690879821777344, "global_step": 1952, "epoch": 46} {"train_loss": -3.3067708015441895, "global_step": 1953, "epoch": 46} {"train_loss": -3.1728506088256836, "global_step": 1954, "epoch": 46} {"train_loss": -3.4147708415985107, "global_step": 1955, "epoch": 46} {"train_loss": -3.191232204437256, "global_step": 1956, "epoch": 46} {"train_loss": -3.189798355102539, "global_step": 1957, "epoch": 46} {"train_loss": -3.276374340057373, "global_step": 1958, "epoch": 46} {"train_loss": -3.1519572734832764, "global_step": 1959, "epoch": 46} {"train_loss": -3.183807373046875, "global_step": 1960, "epoch": 46} {"train_loss": -3.427959442138672, "global_step": 1961, "epoch": 46} {"train_loss": -3.3831586837768555, "global_step": 1962, "epoch": 46} {"train_loss": -3.2119970321655273, "global_step": 1963, "epoch": 46} {"train_loss": -3.1575393676757812, "global_step": 1964, "epoch": 46} {"train_loss": -3.3841288089752197, "global_step": 1965, "epoch": 46} {"train_loss": -3.331974744796753, "global_step": 1966, "epoch": 46} {"train_loss": -3.0614564418792725, "global_step": 1967, "epoch": 46} {"train_loss": -3.280097484588623, "global_step": 1968, "epoch": 46} {"train_loss": -2.9775807857513428, "global_step": 1969, "epoch": 46} {"train_loss": -3.0813279151916504, "global_step": 1970, "epoch": 46} {"train_loss": -3.206254482269287, "global_step": 1971, "epoch": 46} {"train_loss": -3.253774642944336, "global_step": 1972, "epoch": 46} {"train_loss": -3.249877861567906, "global_step": 1973, "epoch": 46, "val_loss": 274491.71875} {"train_loss": -3.177341938018799, "global_step": 1974, "epoch": 47} {"train_loss": -3.0892744064331055, "global_step": 1975, "epoch": 47} {"train_loss": -3.253143787384033, "global_step": 1976, "epoch": 47} {"train_loss": -3.3537402153015137, "global_step": 1977, "epoch": 47} {"train_loss": -3.217123031616211, "global_step": 1978, "epoch": 47} {"train_loss": -3.358067035675049, "global_step": 1979, "epoch": 47} {"train_loss": -3.309900999069214, "global_step": 1980, "epoch": 47} {"train_loss": -3.335045099258423, "global_step": 1981, "epoch": 47} {"train_loss": -3.394667148590088, "global_step": 1982, "epoch": 47} {"train_loss": -3.2613182067871094, "global_step": 1983, "epoch": 47} {"train_loss": -3.298172950744629, "global_step": 1984, "epoch": 47} {"train_loss": -3.2820053100585938, "global_step": 1985, "epoch": 47} {"train_loss": -3.3432388305664062, "global_step": 1986, "epoch": 47} {"train_loss": -3.304776191711426, "global_step": 1987, "epoch": 47} {"train_loss": -3.3613226413726807, "global_step": 1988, "epoch": 47} {"train_loss": -3.3498764038085938, "global_step": 1989, "epoch": 47} {"train_loss": -3.336824893951416, "global_step": 1990, "epoch": 47} {"train_loss": -3.4227452278137207, "global_step": 1991, "epoch": 47} {"train_loss": -3.3286685943603516, "global_step": 1992, "epoch": 47} {"train_loss": -3.260591983795166, "global_step": 1993, "epoch": 47} {"train_loss": -3.3609695434570312, "global_step": 1994, "epoch": 47} {"train_loss": -3.483733654022217, "global_step": 1995, "epoch": 47} {"train_loss": -3.375164270401001, "global_step": 1996, "epoch": 47} {"train_loss": -3.278451442718506, "global_step": 1997, "epoch": 47} {"train_loss": -3.2639403343200684, "global_step": 1998, "epoch": 47} {"train_loss": -3.1549108028411865, "global_step": 1999, "epoch": 47} {"train_loss": -3.345506191253662, "global_step": 2000, "epoch": 47} {"train_loss": -3.315699338912964, "global_step": 2001, "epoch": 47} {"train_loss": -3.3953676223754883, "global_step": 2002, "epoch": 47} {"train_loss": -3.2651305198669434, "global_step": 2003, "epoch": 47} {"train_loss": -3.4245314598083496, "global_step": 2004, "epoch": 47} {"train_loss": -3.2317168712615967, "global_step": 2005, "epoch": 47} {"train_loss": -3.2247321605682373, "global_step": 2006, "epoch": 47} {"train_loss": -3.469081401824951, "global_step": 2007, "epoch": 47} {"train_loss": -3.245884418487549, "global_step": 2008, "epoch": 47} {"train_loss": -3.277146339416504, "global_step": 2009, "epoch": 47} {"train_loss": -3.150186061859131, "global_step": 2010, "epoch": 47} {"train_loss": -3.3016061782836914, "global_step": 2011, "epoch": 47} {"train_loss": -3.4382615089416504, "global_step": 2012, "epoch": 47} {"train_loss": -3.573633909225464, "global_step": 2013, "epoch": 47} {"train_loss": -3.176723003387451, "global_step": 2014, "epoch": 47} {"train_loss": -3.317276602699643, "global_step": 2015, "epoch": 47, "val_loss": 253431.46875} {"train_loss": -3.3576180934906006, "global_step": 2016, "epoch": 48} {"train_loss": -3.247119426727295, "global_step": 2017, "epoch": 48} {"train_loss": -3.2304277420043945, "global_step": 2018, "epoch": 48} {"train_loss": -3.3972201347351074, "global_step": 2019, "epoch": 48} {"train_loss": -3.391653060913086, "global_step": 2020, "epoch": 48} {"train_loss": -3.3090295791625977, "global_step": 2021, "epoch": 48} {"train_loss": -3.3544044494628906, "global_step": 2022, "epoch": 48} {"train_loss": -3.3709259033203125, "global_step": 2023, "epoch": 48} {"train_loss": -3.2946510314941406, "global_step": 2024, "epoch": 48} {"train_loss": -3.411679744720459, "global_step": 2025, "epoch": 48} {"train_loss": -3.3202643394470215, "global_step": 2026, "epoch": 48} {"train_loss": -3.3829710483551025, "global_step": 2027, "epoch": 48} {"train_loss": -3.3906612396240234, "global_step": 2028, "epoch": 48} {"train_loss": -3.41911244392395, "global_step": 2029, "epoch": 48} {"train_loss": -3.4221301078796387, "global_step": 2030, "epoch": 48} {"train_loss": -3.3918423652648926, "global_step": 2031, "epoch": 48} {"train_loss": -3.4391684532165527, "global_step": 2032, "epoch": 48} {"train_loss": -3.3470306396484375, "global_step": 2033, "epoch": 48} {"train_loss": -3.472864866256714, "global_step": 2034, "epoch": 48} {"train_loss": -3.3895297050476074, "global_step": 2035, "epoch": 48} {"train_loss": -3.401911973953247, "global_step": 2036, "epoch": 48} {"train_loss": -3.4110071659088135, "global_step": 2037, "epoch": 48} {"train_loss": -3.175276279449463, "global_step": 2038, "epoch": 48} {"train_loss": -3.368457555770874, "global_step": 2039, "epoch": 48} {"train_loss": -3.3517556190490723, "global_step": 2040, "epoch": 48} {"train_loss": -3.275157928466797, "global_step": 2041, "epoch": 48} {"train_loss": -3.334254741668701, "global_step": 2042, "epoch": 48} {"train_loss": -3.25641131401062, "global_step": 2043, "epoch": 48} {"train_loss": -3.0552446842193604, "global_step": 2044, "epoch": 48} {"train_loss": -3.5535969734191895, "global_step": 2045, "epoch": 48} {"train_loss": -3.0496668815612793, "global_step": 2046, "epoch": 48} {"train_loss": -3.2307820320129395, "global_step": 2047, "epoch": 48} {"train_loss": -3.512005090713501, "global_step": 2048, "epoch": 48} {"train_loss": -3.0635292530059814, "global_step": 2049, "epoch": 48} {"train_loss": -3.08205509185791, "global_step": 2050, "epoch": 48} {"train_loss": -3.277672290802002, "global_step": 2051, "epoch": 48} {"train_loss": -3.0452451705932617, "global_step": 2052, "epoch": 48} {"train_loss": -3.2859184741973877, "global_step": 2053, "epoch": 48} {"train_loss": -2.940392017364502, "global_step": 2054, "epoch": 48} {"train_loss": -3.174560308456421, "global_step": 2055, "epoch": 48} {"train_loss": -2.907594680786133, "global_step": 2056, "epoch": 48} {"train_loss": -3.293588394210452, "global_step": 2057, "epoch": 48, "val_loss": 248522.84375} {"train_loss": -3.122727632522583, "global_step": 2058, "epoch": 49} {"train_loss": -3.1997199058532715, "global_step": 2059, "epoch": 49} {"train_loss": -3.2110707759857178, "global_step": 2060, "epoch": 49} {"train_loss": -3.1390628814697266, "global_step": 2061, "epoch": 49} {"train_loss": -3.336428642272949, "global_step": 2062, "epoch": 49} {"train_loss": -3.2448394298553467, "global_step": 2063, "epoch": 49} {"train_loss": -3.411834955215454, "global_step": 2064, "epoch": 49} {"train_loss": -3.2140965461730957, "global_step": 2065, "epoch": 49} {"train_loss": -3.2688841819763184, "global_step": 2066, "epoch": 49} {"train_loss": -3.1750612258911133, "global_step": 2067, "epoch": 49} {"train_loss": -3.3977928161621094, "global_step": 2068, "epoch": 49} {"train_loss": -3.294924020767212, "global_step": 2069, "epoch": 49} {"train_loss": -3.412426471710205, "global_step": 2070, "epoch": 49} {"train_loss": -3.30770206451416, "global_step": 2071, "epoch": 49} {"train_loss": -3.3046278953552246, "global_step": 2072, "epoch": 49} {"train_loss": -3.311673641204834, "global_step": 2073, "epoch": 49} {"train_loss": -3.373868227005005, "global_step": 2074, "epoch": 49} {"train_loss": -3.2998995780944824, "global_step": 2075, "epoch": 49} {"train_loss": -3.4668257236480713, "global_step": 2076, "epoch": 49} {"train_loss": -3.4593725204467773, "global_step": 2077, "epoch": 49} {"train_loss": -3.3647942543029785, "global_step": 2078, "epoch": 49} {"train_loss": -3.2994136810302734, "global_step": 2079, "epoch": 49} {"train_loss": -3.327993154525757, "global_step": 2080, "epoch": 49} {"train_loss": -3.393049716949463, "global_step": 2081, "epoch": 49} {"train_loss": -3.3738608360290527, "global_step": 2082, "epoch": 49} {"train_loss": -3.398923397064209, "global_step": 2083, "epoch": 49} {"train_loss": -3.566277503967285, "global_step": 2084, "epoch": 49} {"train_loss": -3.468327522277832, "global_step": 2085, "epoch": 49} {"train_loss": -3.5951340198516846, "global_step": 2086, "epoch": 49} {"train_loss": -3.406036138534546, "global_step": 2087, "epoch": 49} {"train_loss": -3.4227685928344727, "global_step": 2088, "epoch": 49} {"train_loss": -3.4280288219451904, "global_step": 2089, "epoch": 49} {"train_loss": -3.49937105178833, "global_step": 2090, "epoch": 49} {"train_loss": -3.3517751693725586, "global_step": 2091, "epoch": 49} {"train_loss": -3.316362142562866, "global_step": 2092, "epoch": 49} {"train_loss": -3.3474984169006348, "global_step": 2093, "epoch": 49} {"train_loss": -3.341425657272339, "global_step": 2094, "epoch": 49} {"train_loss": -3.494459390640259, "global_step": 2095, "epoch": 49} {"train_loss": -3.455660343170166, "global_step": 2096, "epoch": 49} {"train_loss": -3.3921422958374023, "global_step": 2097, "epoch": 49} {"train_loss": -3.2217226028442383, "global_step": 2098, "epoch": 49} {"train_loss": -3.355369414602007, "global_step": 2099, "epoch": 49, "val_loss": 229256.578125} {"train_loss": -3.532465696334839, "global_step": 2100, "epoch": 50} {"train_loss": -3.0953145027160645, "global_step": 2101, "epoch": 50} {"train_loss": -3.512037754058838, "global_step": 2102, "epoch": 50} {"train_loss": -3.1045737266540527, "global_step": 2103, "epoch": 50} {"train_loss": -3.4343185424804688, "global_step": 2104, "epoch": 50} {"train_loss": -3.246495008468628, "global_step": 2105, "epoch": 50} {"train_loss": -3.0943121910095215, "global_step": 2106, "epoch": 50} {"train_loss": -3.2294154167175293, "global_step": 2107, "epoch": 50} {"train_loss": -3.101811647415161, "global_step": 2108, "epoch": 50} {"train_loss": -3.1789751052856445, "global_step": 2109, "epoch": 50} {"train_loss": -3.321648597717285, "global_step": 2110, "epoch": 50} {"train_loss": -3.46260929107666, "global_step": 2111, "epoch": 50} {"train_loss": -3.177295684814453, "global_step": 2112, "epoch": 50} {"train_loss": -3.3912079334259033, "global_step": 2113, "epoch": 50} {"train_loss": -3.2208824157714844, "global_step": 2114, "epoch": 50} {"train_loss": -3.3128225803375244, "global_step": 2115, "epoch": 50} {"train_loss": -3.125154972076416, "global_step": 2116, "epoch": 50} {"train_loss": -3.3898415565490723, "global_step": 2117, "epoch": 50} {"train_loss": -3.3513777256011963, "global_step": 2118, "epoch": 50} {"train_loss": -3.489220142364502, "global_step": 2119, "epoch": 50} {"train_loss": -3.3417704105377197, "global_step": 2120, "epoch": 50} {"train_loss": -3.3473737239837646, "global_step": 2121, "epoch": 50} {"train_loss": -3.45935320854187, "global_step": 2122, "epoch": 50} {"train_loss": -3.426755428314209, "global_step": 2123, "epoch": 50} {"train_loss": -3.37789249420166, "global_step": 2124, "epoch": 50} {"train_loss": -3.4163973331451416, "global_step": 2125, "epoch": 50} {"train_loss": -3.4056949615478516, "global_step": 2126, "epoch": 50} {"train_loss": -3.3537888526916504, "global_step": 2127, "epoch": 50} {"train_loss": -3.4733057022094727, "global_step": 2128, "epoch": 50} {"train_loss": -3.430051803588867, "global_step": 2129, "epoch": 50} {"train_loss": -3.341224193572998, "global_step": 2130, "epoch": 50} {"train_loss": -3.5708260536193848, "global_step": 2131, "epoch": 50} {"train_loss": -3.3727405071258545, "global_step": 2132, "epoch": 50} {"train_loss": -3.449307680130005, "global_step": 2133, "epoch": 50} {"train_loss": -3.4567677974700928, "global_step": 2134, "epoch": 50} {"train_loss": -3.4393157958984375, "global_step": 2135, "epoch": 50} {"train_loss": -3.324908971786499, "global_step": 2136, "epoch": 50} {"train_loss": -3.5485124588012695, "global_step": 2137, "epoch": 50} {"train_loss": -3.4730448722839355, "global_step": 2138, "epoch": 50} {"train_loss": -3.48736310005188, "global_step": 2139, "epoch": 50} {"train_loss": -3.4671902656555176, "global_step": 2140, "epoch": 50} {"train_loss": -3.3627935761497136, "global_step": 2141, "epoch": 50, "train/sim_max_reward_0": 0.20072886147220637, "train/sim_max_reward_1": 0.02421399006775237, "train/sim_max_reward_2": 0.19035337023852975, "train/sim_max_reward_3": 0.1297551205067955, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.32799242057724987, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.014021135271422376, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.05980559919624764, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.01955546926210679, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3790527451622899, "test/sim_max_reward_4400009": 0.2670901441762299, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.07303396680694195, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.15614163815340495, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.018847833367539663, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.12080925927260766, "test/sim_max_reward_4400018": 0.27700202539923524, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0005902508818570494, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.5756704434788589, "test/sim_max_reward_4400028": 0.11018143155997313, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.3853590968555274, "test/sim_max_reward_4400031": 0.2548014139301188, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.13459891488778805, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.6255796181516892, "test/sim_max_reward_4400036": 0.41104225657163546, "test/sim_max_reward_4400037": 0.3606999372386999, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.5184526368736442, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.01889308926184006, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.010414354270247225, "test/sim_max_reward_4400044": 0.4328457373847731, "test/sim_max_reward_4400045": 0.04006516143120823, "test/sim_max_reward_4400046": 0.19081247656830896, "test/sim_max_reward_4400047": 0.0005351012849106201, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.14709117840554387, "test/mean_score": 0.1346328401740711, "val_loss": 216947.546875} {"train_loss": -3.3549928665161133, "global_step": 2142, "epoch": 51} {"train_loss": -3.5551562309265137, "global_step": 2143, "epoch": 51} {"train_loss": -3.5113754272460938, "global_step": 2144, "epoch": 51} {"train_loss": -3.4628489017486572, "global_step": 2145, "epoch": 51} {"train_loss": -3.4334545135498047, "global_step": 2146, "epoch": 51} {"train_loss": -3.4278626441955566, "global_step": 2147, "epoch": 51} {"train_loss": -3.4803080558776855, "global_step": 2148, "epoch": 51} {"train_loss": -3.434587001800537, "global_step": 2149, "epoch": 51} {"train_loss": -3.5939972400665283, "global_step": 2150, "epoch": 51} {"train_loss": -3.2745048999786377, "global_step": 2151, "epoch": 51} {"train_loss": -3.236720561981201, "global_step": 2152, "epoch": 51} {"train_loss": -3.3860182762145996, "global_step": 2153, "epoch": 51} {"train_loss": -3.6147823333740234, "global_step": 2154, "epoch": 51} {"train_loss": -3.506112575531006, "global_step": 2155, "epoch": 51} {"train_loss": -3.3316702842712402, "global_step": 2156, "epoch": 51} {"train_loss": -3.2966504096984863, "global_step": 2157, "epoch": 51} {"train_loss": -3.5444183349609375, "global_step": 2158, "epoch": 51} {"train_loss": -3.3384175300598145, "global_step": 2159, "epoch": 51} {"train_loss": -3.2687032222747803, "global_step": 2160, "epoch": 51} {"train_loss": -3.349763870239258, "global_step": 2161, "epoch": 51} {"train_loss": -3.5952329635620117, "global_step": 2162, "epoch": 51} {"train_loss": -3.3379669189453125, "global_step": 2163, "epoch": 51} {"train_loss": -3.410709857940674, "global_step": 2164, "epoch": 51} {"train_loss": -3.496098279953003, "global_step": 2165, "epoch": 51} {"train_loss": -3.3049745559692383, "global_step": 2166, "epoch": 51} {"train_loss": -3.435100555419922, "global_step": 2167, "epoch": 51} {"train_loss": -3.5822434425354004, "global_step": 2168, "epoch": 51} {"train_loss": -3.447824478149414, "global_step": 2169, "epoch": 51} {"train_loss": -3.2833192348480225, "global_step": 2170, "epoch": 51} {"train_loss": -3.4145615100860596, "global_step": 2171, "epoch": 51} {"train_loss": -3.466846466064453, "global_step": 2172, "epoch": 51} {"train_loss": -3.3708972930908203, "global_step": 2173, "epoch": 51} {"train_loss": -3.5961785316467285, "global_step": 2174, "epoch": 51} {"train_loss": -3.3445191383361816, "global_step": 2175, "epoch": 51} {"train_loss": -3.46769642829895, "global_step": 2176, "epoch": 51} {"train_loss": -3.3314406871795654, "global_step": 2177, "epoch": 51} {"train_loss": -3.5286214351654053, "global_step": 2178, "epoch": 51} {"train_loss": -3.381742000579834, "global_step": 2179, "epoch": 51} {"train_loss": -3.255512237548828, "global_step": 2180, "epoch": 51} {"train_loss": -3.505092144012451, "global_step": 2181, "epoch": 51} {"train_loss": -3.4505467414855957, "global_step": 2182, "epoch": 51} {"train_loss": -3.4233162630172003, "global_step": 2183, "epoch": 51, "val_loss": 210971.0625} {"train_loss": -3.4439139366149902, "global_step": 2184, "epoch": 52} {"train_loss": -3.3303141593933105, "global_step": 2185, "epoch": 52} {"train_loss": -3.388463258743286, "global_step": 2186, "epoch": 52} {"train_loss": -3.2486634254455566, "global_step": 2187, "epoch": 52} {"train_loss": -3.3738224506378174, "global_step": 2188, "epoch": 52} {"train_loss": -3.230010986328125, "global_step": 2189, "epoch": 52} {"train_loss": -3.388448476791382, "global_step": 2190, "epoch": 52} {"train_loss": -3.3459787368774414, "global_step": 2191, "epoch": 52} {"train_loss": -3.4658782482147217, "global_step": 2192, "epoch": 52} {"train_loss": -3.4606966972351074, "global_step": 2193, "epoch": 52} {"train_loss": -3.3143177032470703, "global_step": 2194, "epoch": 52} {"train_loss": -3.46187162399292, "global_step": 2195, "epoch": 52} {"train_loss": -3.3527660369873047, "global_step": 2196, "epoch": 52} {"train_loss": -3.4534707069396973, "global_step": 2197, "epoch": 52} {"train_loss": -3.6007940769195557, "global_step": 2198, "epoch": 52} {"train_loss": -3.418168067932129, "global_step": 2199, "epoch": 52} {"train_loss": -3.440591335296631, "global_step": 2200, "epoch": 52} {"train_loss": -3.4802231788635254, "global_step": 2201, "epoch": 52} {"train_loss": -3.534860610961914, "global_step": 2202, "epoch": 52} {"train_loss": -3.452921152114868, "global_step": 2203, "epoch": 52} {"train_loss": -3.4977054595947266, "global_step": 2204, "epoch": 52} {"train_loss": -3.3594512939453125, "global_step": 2205, "epoch": 52} {"train_loss": -3.3731353282928467, "global_step": 2206, "epoch": 52} {"train_loss": -3.527998685836792, "global_step": 2207, "epoch": 52} {"train_loss": -3.382153034210205, "global_step": 2208, "epoch": 52} {"train_loss": -3.4541614055633545, "global_step": 2209, "epoch": 52} {"train_loss": -3.516559600830078, "global_step": 2210, "epoch": 52} {"train_loss": -3.650254249572754, "global_step": 2211, "epoch": 52} {"train_loss": -3.3914084434509277, "global_step": 2212, "epoch": 52} {"train_loss": -3.568227529525757, "global_step": 2213, "epoch": 52} {"train_loss": -3.452702760696411, "global_step": 2214, "epoch": 52} {"train_loss": -3.4976463317871094, "global_step": 2215, "epoch": 52} {"train_loss": -3.54424786567688, "global_step": 2216, "epoch": 52} {"train_loss": -3.498849868774414, "global_step": 2217, "epoch": 52} {"train_loss": -3.39656400680542, "global_step": 2218, "epoch": 52} {"train_loss": -3.5440549850463867, "global_step": 2219, "epoch": 52} {"train_loss": -3.3812944889068604, "global_step": 2220, "epoch": 52} {"train_loss": -3.566279411315918, "global_step": 2221, "epoch": 52} {"train_loss": -3.378047466278076, "global_step": 2222, "epoch": 52} {"train_loss": -3.5013551712036133, "global_step": 2223, "epoch": 52} {"train_loss": -3.538116216659546, "global_step": 2224, "epoch": 52} {"train_loss": -3.4425382897967385, "global_step": 2225, "epoch": 52, "val_loss": 205753.15625} {"train_loss": -3.550654411315918, "global_step": 2226, "epoch": 53} {"train_loss": -3.3039135932922363, "global_step": 2227, "epoch": 53} {"train_loss": -3.355299711227417, "global_step": 2228, "epoch": 53} {"train_loss": -3.4383177757263184, "global_step": 2229, "epoch": 53} {"train_loss": -3.3053293228149414, "global_step": 2230, "epoch": 53} {"train_loss": -3.5521793365478516, "global_step": 2231, "epoch": 53} {"train_loss": -3.3457908630371094, "global_step": 2232, "epoch": 53} {"train_loss": -3.504784107208252, "global_step": 2233, "epoch": 53} {"train_loss": -3.3845677375793457, "global_step": 2234, "epoch": 53} {"train_loss": -3.4265830516815186, "global_step": 2235, "epoch": 53} {"train_loss": -3.6066813468933105, "global_step": 2236, "epoch": 53} {"train_loss": -3.391106605529785, "global_step": 2237, "epoch": 53} {"train_loss": -3.474606513977051, "global_step": 2238, "epoch": 53} {"train_loss": -3.4245314598083496, "global_step": 2239, "epoch": 53} {"train_loss": -3.6490964889526367, "global_step": 2240, "epoch": 53} {"train_loss": -3.4193835258483887, "global_step": 2241, "epoch": 53} {"train_loss": -3.467407703399658, "global_step": 2242, "epoch": 53} {"train_loss": -3.5815629959106445, "global_step": 2243, "epoch": 53} {"train_loss": -3.4610042572021484, "global_step": 2244, "epoch": 53} {"train_loss": -3.370692491531372, "global_step": 2245, "epoch": 53} {"train_loss": -3.4296271800994873, "global_step": 2246, "epoch": 53} {"train_loss": -3.737887382507324, "global_step": 2247, "epoch": 53} {"train_loss": -3.4642174243927, "global_step": 2248, "epoch": 53} {"train_loss": -3.4522154331207275, "global_step": 2249, "epoch": 53} {"train_loss": -3.575178623199463, "global_step": 2250, "epoch": 53} {"train_loss": -3.6480488777160645, "global_step": 2251, "epoch": 53} {"train_loss": -3.5009701251983643, "global_step": 2252, "epoch": 53} {"train_loss": -3.3413844108581543, "global_step": 2253, "epoch": 53} {"train_loss": -3.356476306915283, "global_step": 2254, "epoch": 53} {"train_loss": -3.479990005493164, "global_step": 2255, "epoch": 53} {"train_loss": -3.4740915298461914, "global_step": 2256, "epoch": 53} {"train_loss": -3.6257004737854004, "global_step": 2257, "epoch": 53} {"train_loss": -3.540189743041992, "global_step": 2258, "epoch": 53} {"train_loss": -3.4797439575195312, "global_step": 2259, "epoch": 53} {"train_loss": -3.5371146202087402, "global_step": 2260, "epoch": 53} {"train_loss": -3.5446999073028564, "global_step": 2261, "epoch": 53} {"train_loss": -3.527487277984619, "global_step": 2262, "epoch": 53} {"train_loss": -3.604097366333008, "global_step": 2263, "epoch": 53} {"train_loss": -3.510502576828003, "global_step": 2264, "epoch": 53} {"train_loss": -3.564138650894165, "global_step": 2265, "epoch": 53} {"train_loss": -3.4030954837799072, "global_step": 2266, "epoch": 53} {"train_loss": -3.4847045909790766, "global_step": 2267, "epoch": 53, "val_loss": 195808.546875} {"train_loss": -3.6161048412323, "global_step": 2268, "epoch": 54} {"train_loss": -3.5321922302246094, "global_step": 2269, "epoch": 54} {"train_loss": -3.5409903526306152, "global_step": 2270, "epoch": 54} {"train_loss": -3.742602825164795, "global_step": 2271, "epoch": 54} {"train_loss": -3.695438861846924, "global_step": 2272, "epoch": 54} {"train_loss": -3.3858232498168945, "global_step": 2273, "epoch": 54} {"train_loss": -3.573566198348999, "global_step": 2274, "epoch": 54} {"train_loss": -3.5869946479797363, "global_step": 2275, "epoch": 54} {"train_loss": -3.5253584384918213, "global_step": 2276, "epoch": 54} {"train_loss": -3.488555431365967, "global_step": 2277, "epoch": 54} {"train_loss": -3.5366854667663574, "global_step": 2278, "epoch": 54} {"train_loss": -3.5079398155212402, "global_step": 2279, "epoch": 54} {"train_loss": -3.439495086669922, "global_step": 2280, "epoch": 54} {"train_loss": -3.639530658721924, "global_step": 2281, "epoch": 54} {"train_loss": -3.4400718212127686, "global_step": 2282, "epoch": 54} {"train_loss": -3.417847156524658, "global_step": 2283, "epoch": 54} {"train_loss": -3.634855031967163, "global_step": 2284, "epoch": 54} {"train_loss": -3.6192264556884766, "global_step": 2285, "epoch": 54} {"train_loss": -3.5251407623291016, "global_step": 2286, "epoch": 54} {"train_loss": -3.6055541038513184, "global_step": 2287, "epoch": 54} {"train_loss": -3.601086139678955, "global_step": 2288, "epoch": 54} {"train_loss": -3.3078508377075195, "global_step": 2289, "epoch": 54} {"train_loss": -3.5635461807250977, "global_step": 2290, "epoch": 54} {"train_loss": -3.603567600250244, "global_step": 2291, "epoch": 54} {"train_loss": -3.5459673404693604, "global_step": 2292, "epoch": 54} {"train_loss": -3.4190335273742676, "global_step": 2293, "epoch": 54} {"train_loss": -3.5496463775634766, "global_step": 2294, "epoch": 54} {"train_loss": -3.563601016998291, "global_step": 2295, "epoch": 54} {"train_loss": -3.581552505493164, "global_step": 2296, "epoch": 54} {"train_loss": -3.4624476432800293, "global_step": 2297, "epoch": 54} {"train_loss": -3.667618751525879, "global_step": 2298, "epoch": 54} {"train_loss": -3.594944715499878, "global_step": 2299, "epoch": 54} {"train_loss": -3.6698617935180664, "global_step": 2300, "epoch": 54} {"train_loss": -3.5819993019104004, "global_step": 2301, "epoch": 54} {"train_loss": -3.3986902236938477, "global_step": 2302, "epoch": 54} {"train_loss": -3.5601627826690674, "global_step": 2303, "epoch": 54} {"train_loss": -3.466909646987915, "global_step": 2304, "epoch": 54} {"train_loss": -3.5362391471862793, "global_step": 2305, "epoch": 54} {"train_loss": -3.534268856048584, "global_step": 2306, "epoch": 54} {"train_loss": -3.372898817062378, "global_step": 2307, "epoch": 54} {"train_loss": -3.7098515033721924, "global_step": 2308, "epoch": 54} {"train_loss": -3.539842974571955, "global_step": 2309, "epoch": 54, "val_loss": 193760.5625} {"train_loss": -3.624279260635376, "global_step": 2310, "epoch": 55} {"train_loss": -3.5864622592926025, "global_step": 2311, "epoch": 55} {"train_loss": -3.3948771953582764, "global_step": 2312, "epoch": 55} {"train_loss": -3.696223497390747, "global_step": 2313, "epoch": 55} {"train_loss": -3.3152027130126953, "global_step": 2314, "epoch": 55} {"train_loss": -3.599116086959839, "global_step": 2315, "epoch": 55} {"train_loss": -3.620706558227539, "global_step": 2316, "epoch": 55} {"train_loss": -3.279536724090576, "global_step": 2317, "epoch": 55} {"train_loss": -3.6299095153808594, "global_step": 2318, "epoch": 55} {"train_loss": -3.434805393218994, "global_step": 2319, "epoch": 55} {"train_loss": -3.5806546211242676, "global_step": 2320, "epoch": 55} {"train_loss": -3.1911916732788086, "global_step": 2321, "epoch": 55} {"train_loss": -3.501838207244873, "global_step": 2322, "epoch": 55} {"train_loss": -3.364907741546631, "global_step": 2323, "epoch": 55} {"train_loss": -3.5448684692382812, "global_step": 2324, "epoch": 55} {"train_loss": -3.3811347484588623, "global_step": 2325, "epoch": 55} {"train_loss": -3.5066418647766113, "global_step": 2326, "epoch": 55} {"train_loss": -3.5457539558410645, "global_step": 2327, "epoch": 55} {"train_loss": -3.63002872467041, "global_step": 2328, "epoch": 55} {"train_loss": -3.4529974460601807, "global_step": 2329, "epoch": 55} {"train_loss": -3.5374813079833984, "global_step": 2330, "epoch": 55} {"train_loss": -3.499070644378662, "global_step": 2331, "epoch": 55} {"train_loss": -3.65010929107666, "global_step": 2332, "epoch": 55} {"train_loss": -3.381049871444702, "global_step": 2333, "epoch": 55} {"train_loss": -3.492795467376709, "global_step": 2334, "epoch": 55} {"train_loss": -3.455005168914795, "global_step": 2335, "epoch": 55} {"train_loss": -3.663985252380371, "global_step": 2336, "epoch": 55} {"train_loss": -3.5381155014038086, "global_step": 2337, "epoch": 55} {"train_loss": -3.6049108505249023, "global_step": 2338, "epoch": 55} {"train_loss": -3.6717944145202637, "global_step": 2339, "epoch": 55} {"train_loss": -3.4855427742004395, "global_step": 2340, "epoch": 55} {"train_loss": -3.608588695526123, "global_step": 2341, "epoch": 55} {"train_loss": -3.6219120025634766, "global_step": 2342, "epoch": 55} {"train_loss": -3.7123045921325684, "global_step": 2343, "epoch": 55} {"train_loss": -3.3910510540008545, "global_step": 2344, "epoch": 55} {"train_loss": -3.622170925140381, "global_step": 2345, "epoch": 55} {"train_loss": -3.593698501586914, "global_step": 2346, "epoch": 55} {"train_loss": -3.4552648067474365, "global_step": 2347, "epoch": 55} {"train_loss": -3.6320106983184814, "global_step": 2348, "epoch": 55} {"train_loss": -3.7143263816833496, "global_step": 2349, "epoch": 55} {"train_loss": -3.2563023567199707, "global_step": 2350, "epoch": 55} {"train_loss": -3.525448208763486, "global_step": 2351, "epoch": 55, "val_loss": 194378.65625} {"train_loss": -3.2882699966430664, "global_step": 2352, "epoch": 56} {"train_loss": -3.506547689437866, "global_step": 2353, "epoch": 56} {"train_loss": -3.4763758182525635, "global_step": 2354, "epoch": 56} {"train_loss": -3.5174307823181152, "global_step": 2355, "epoch": 56} {"train_loss": -3.7075281143188477, "global_step": 2356, "epoch": 56} {"train_loss": -3.5053069591522217, "global_step": 2357, "epoch": 56} {"train_loss": -3.5538699626922607, "global_step": 2358, "epoch": 56} {"train_loss": -3.543189287185669, "global_step": 2359, "epoch": 56} {"train_loss": -3.3097002506256104, "global_step": 2360, "epoch": 56} {"train_loss": -3.512176513671875, "global_step": 2361, "epoch": 56} {"train_loss": -3.6578691005706787, "global_step": 2362, "epoch": 56} {"train_loss": -3.319689989089966, "global_step": 2363, "epoch": 56} {"train_loss": -3.7119479179382324, "global_step": 2364, "epoch": 56} {"train_loss": -3.5749073028564453, "global_step": 2365, "epoch": 56} {"train_loss": -3.342607259750366, "global_step": 2366, "epoch": 56} {"train_loss": -3.5344958305358887, "global_step": 2367, "epoch": 56} {"train_loss": -3.5751590728759766, "global_step": 2368, "epoch": 56} {"train_loss": -3.485938787460327, "global_step": 2369, "epoch": 56} {"train_loss": -3.8222432136535645, "global_step": 2370, "epoch": 56} {"train_loss": -3.4704654216766357, "global_step": 2371, "epoch": 56} {"train_loss": -3.588414192199707, "global_step": 2372, "epoch": 56} {"train_loss": -3.5656161308288574, "global_step": 2373, "epoch": 56} {"train_loss": -3.5444562435150146, "global_step": 2374, "epoch": 56} {"train_loss": -3.6206696033477783, "global_step": 2375, "epoch": 56} {"train_loss": -3.430148124694824, "global_step": 2376, "epoch": 56} {"train_loss": -3.6526923179626465, "global_step": 2377, "epoch": 56} {"train_loss": -3.6194326877593994, "global_step": 2378, "epoch": 56} {"train_loss": -3.4310948848724365, "global_step": 2379, "epoch": 56} {"train_loss": -3.5775208473205566, "global_step": 2380, "epoch": 56} {"train_loss": -3.2303285598754883, "global_step": 2381, "epoch": 56} {"train_loss": -3.280414581298828, "global_step": 2382, "epoch": 56} {"train_loss": -3.37800931930542, "global_step": 2383, "epoch": 56} {"train_loss": -3.5573201179504395, "global_step": 2384, "epoch": 56} {"train_loss": -3.5251879692077637, "global_step": 2385, "epoch": 56} {"train_loss": -3.491654872894287, "global_step": 2386, "epoch": 56} {"train_loss": -3.394935131072998, "global_step": 2387, "epoch": 56} {"train_loss": -3.7180159091949463, "global_step": 2388, "epoch": 56} {"train_loss": -3.3811092376708984, "global_step": 2389, "epoch": 56} {"train_loss": -3.6776227951049805, "global_step": 2390, "epoch": 56} {"train_loss": -3.118870973587036, "global_step": 2391, "epoch": 56} {"train_loss": -3.6948819160461426, "global_step": 2392, "epoch": 56} {"train_loss": -3.5067656607854936, "global_step": 2393, "epoch": 56, "val_loss": 187457.265625} {"train_loss": -3.6155433654785156, "global_step": 2394, "epoch": 57} {"train_loss": -3.6256401538848877, "global_step": 2395, "epoch": 57} {"train_loss": -3.596341371536255, "global_step": 2396, "epoch": 57} {"train_loss": -3.5313713550567627, "global_step": 2397, "epoch": 57} {"train_loss": -3.631175994873047, "global_step": 2398, "epoch": 57} {"train_loss": -3.6364216804504395, "global_step": 2399, "epoch": 57} {"train_loss": -3.544429302215576, "global_step": 2400, "epoch": 57} {"train_loss": -3.4597063064575195, "global_step": 2401, "epoch": 57} {"train_loss": -3.6927831172943115, "global_step": 2402, "epoch": 57} {"train_loss": -3.5318329334259033, "global_step": 2403, "epoch": 57} {"train_loss": -3.6913352012634277, "global_step": 2404, "epoch": 57} {"train_loss": -3.547088623046875, "global_step": 2405, "epoch": 57} {"train_loss": -3.4966554641723633, "global_step": 2406, "epoch": 57} {"train_loss": -3.695802688598633, "global_step": 2407, "epoch": 57} {"train_loss": -3.7542965412139893, "global_step": 2408, "epoch": 57} {"train_loss": -3.676360607147217, "global_step": 2409, "epoch": 57} {"train_loss": -3.6991963386535645, "global_step": 2410, "epoch": 57} {"train_loss": -3.701894998550415, "global_step": 2411, "epoch": 57} {"train_loss": -3.626467704772949, "global_step": 2412, "epoch": 57} {"train_loss": -3.68489933013916, "global_step": 2413, "epoch": 57} {"train_loss": -3.5396015644073486, "global_step": 2414, "epoch": 57} {"train_loss": -3.723393678665161, "global_step": 2415, "epoch": 57} {"train_loss": -3.8853886127471924, "global_step": 2416, "epoch": 57} {"train_loss": -3.64992356300354, "global_step": 2417, "epoch": 57} {"train_loss": -3.6557517051696777, "global_step": 2418, "epoch": 57} {"train_loss": -3.7721829414367676, "global_step": 2419, "epoch": 57} {"train_loss": -3.7646877765655518, "global_step": 2420, "epoch": 57} {"train_loss": -3.4580235481262207, "global_step": 2421, "epoch": 57} {"train_loss": -3.4702308177948, "global_step": 2422, "epoch": 57} {"train_loss": -3.453958511352539, "global_step": 2423, "epoch": 57} {"train_loss": -3.562932014465332, "global_step": 2424, "epoch": 57} {"train_loss": -3.6067724227905273, "global_step": 2425, "epoch": 57} {"train_loss": -3.631865978240967, "global_step": 2426, "epoch": 57} {"train_loss": -3.4520297050476074, "global_step": 2427, "epoch": 57} {"train_loss": -3.805046558380127, "global_step": 2428, "epoch": 57} {"train_loss": -3.479473114013672, "global_step": 2429, "epoch": 57} {"train_loss": -3.6059353351593018, "global_step": 2430, "epoch": 57} {"train_loss": -3.4807205200195312, "global_step": 2431, "epoch": 57} {"train_loss": -3.6866183280944824, "global_step": 2432, "epoch": 57} {"train_loss": -3.5382649898529053, "global_step": 2433, "epoch": 57} {"train_loss": -3.64882230758667, "global_step": 2434, "epoch": 57} {"train_loss": -3.6167659759521484, "global_step": 2435, "epoch": 57, "val_loss": 181522.578125} {"train_loss": -3.6830761432647705, "global_step": 2436, "epoch": 58} {"train_loss": -3.6518337726593018, "global_step": 2437, "epoch": 58} {"train_loss": -3.6232213973999023, "global_step": 2438, "epoch": 58} {"train_loss": -3.7415194511413574, "global_step": 2439, "epoch": 58} {"train_loss": -3.6806869506835938, "global_step": 2440, "epoch": 58} {"train_loss": -3.704735517501831, "global_step": 2441, "epoch": 58} {"train_loss": -3.7979683876037598, "global_step": 2442, "epoch": 58} {"train_loss": -3.598118305206299, "global_step": 2443, "epoch": 58} {"train_loss": -3.6407456398010254, "global_step": 2444, "epoch": 58} {"train_loss": -3.5836424827575684, "global_step": 2445, "epoch": 58} {"train_loss": -3.663034677505493, "global_step": 2446, "epoch": 58} {"train_loss": -3.489041805267334, "global_step": 2447, "epoch": 58} {"train_loss": -3.481945037841797, "global_step": 2448, "epoch": 58} {"train_loss": -3.7682271003723145, "global_step": 2449, "epoch": 58} {"train_loss": -3.5062742233276367, "global_step": 2450, "epoch": 58} {"train_loss": -3.58317494392395, "global_step": 2451, "epoch": 58} {"train_loss": -3.5903823375701904, "global_step": 2452, "epoch": 58} {"train_loss": -3.574777603149414, "global_step": 2453, "epoch": 58} {"train_loss": -3.66161847114563, "global_step": 2454, "epoch": 58} {"train_loss": -3.6896347999572754, "global_step": 2455, "epoch": 58} {"train_loss": -3.626999855041504, "global_step": 2456, "epoch": 58} {"train_loss": -3.6149539947509766, "global_step": 2457, "epoch": 58} {"train_loss": -3.641728162765503, "global_step": 2458, "epoch": 58} {"train_loss": -3.6060843467712402, "global_step": 2459, "epoch": 58} {"train_loss": -3.628659248352051, "global_step": 2460, "epoch": 58} {"train_loss": -3.7191238403320312, "global_step": 2461, "epoch": 58} {"train_loss": -3.6521925926208496, "global_step": 2462, "epoch": 58} {"train_loss": -3.615049362182617, "global_step": 2463, "epoch": 58} {"train_loss": -3.711775302886963, "global_step": 2464, "epoch": 58} {"train_loss": -3.7503104209899902, "global_step": 2465, "epoch": 58} {"train_loss": -3.695760726928711, "global_step": 2466, "epoch": 58} {"train_loss": -3.7410073280334473, "global_step": 2467, "epoch": 58} {"train_loss": -3.688023090362549, "global_step": 2468, "epoch": 58} {"train_loss": -3.4906649589538574, "global_step": 2469, "epoch": 58} {"train_loss": -3.9144792556762695, "global_step": 2470, "epoch": 58} {"train_loss": -3.634593963623047, "global_step": 2471, "epoch": 58} {"train_loss": -3.6746463775634766, "global_step": 2472, "epoch": 58} {"train_loss": -3.685512065887451, "global_step": 2473, "epoch": 58} {"train_loss": -3.649277925491333, "global_step": 2474, "epoch": 58} {"train_loss": -3.7113966941833496, "global_step": 2475, "epoch": 58} {"train_loss": -3.70597767829895, "global_step": 2476, "epoch": 58} {"train_loss": -3.65443522021884, "global_step": 2477, "epoch": 58, "val_loss": 180552.703125} {"train_loss": -3.538980484008789, "global_step": 2478, "epoch": 59} {"train_loss": -3.6823277473449707, "global_step": 2479, "epoch": 59} {"train_loss": -3.376910924911499, "global_step": 2480, "epoch": 59} {"train_loss": -3.521367311477661, "global_step": 2481, "epoch": 59} {"train_loss": -3.800898313522339, "global_step": 2482, "epoch": 59} {"train_loss": -3.2656209468841553, "global_step": 2483, "epoch": 59} {"train_loss": -3.5345211029052734, "global_step": 2484, "epoch": 59} {"train_loss": -3.204319477081299, "global_step": 2485, "epoch": 59} {"train_loss": -3.5819506645202637, "global_step": 2486, "epoch": 59} {"train_loss": -3.2177510261535645, "global_step": 2487, "epoch": 59} {"train_loss": -3.4544425010681152, "global_step": 2488, "epoch": 59} {"train_loss": -3.344614267349243, "global_step": 2489, "epoch": 59} {"train_loss": -3.6225240230560303, "global_step": 2490, "epoch": 59} {"train_loss": -3.4700074195861816, "global_step": 2491, "epoch": 59} {"train_loss": -3.6318793296813965, "global_step": 2492, "epoch": 59} {"train_loss": -3.6135151386260986, "global_step": 2493, "epoch": 59} {"train_loss": -3.704822540283203, "global_step": 2494, "epoch": 59} {"train_loss": -3.3951261043548584, "global_step": 2495, "epoch": 59} {"train_loss": -3.7329304218292236, "global_step": 2496, "epoch": 59} {"train_loss": -3.551081895828247, "global_step": 2497, "epoch": 59} {"train_loss": -3.6155102252960205, "global_step": 2498, "epoch": 59} {"train_loss": -3.5656566619873047, "global_step": 2499, "epoch": 59} {"train_loss": -3.7007157802581787, "global_step": 2500, "epoch": 59} {"train_loss": -3.581976890563965, "global_step": 2501, "epoch": 59} {"train_loss": -3.7109627723693848, "global_step": 2502, "epoch": 59} {"train_loss": -3.550632953643799, "global_step": 2503, "epoch": 59} {"train_loss": -3.735342025756836, "global_step": 2504, "epoch": 59} {"train_loss": -3.6428933143615723, "global_step": 2505, "epoch": 59} {"train_loss": -3.77486515045166, "global_step": 2506, "epoch": 59} {"train_loss": -3.5795392990112305, "global_step": 2507, "epoch": 59} {"train_loss": -3.6768481731414795, "global_step": 2508, "epoch": 59} {"train_loss": -3.7011618614196777, "global_step": 2509, "epoch": 59} {"train_loss": -3.743950366973877, "global_step": 2510, "epoch": 59} {"train_loss": -3.8160078525543213, "global_step": 2511, "epoch": 59} {"train_loss": -3.676056146621704, "global_step": 2512, "epoch": 59} {"train_loss": -3.5155889987945557, "global_step": 2513, "epoch": 59} {"train_loss": -3.69167160987854, "global_step": 2514, "epoch": 59} {"train_loss": -3.537764549255371, "global_step": 2515, "epoch": 59} {"train_loss": -3.6209096908569336, "global_step": 2516, "epoch": 59} {"train_loss": -3.71769380569458, "global_step": 2517, "epoch": 59} {"train_loss": -3.5566020011901855, "global_step": 2518, "epoch": 59} {"train_loss": -3.5812554472968694, "global_step": 2519, "epoch": 59, "val_loss": 176710.125} {"train_loss": -3.4992806911468506, "global_step": 2520, "epoch": 60} {"train_loss": -3.671194076538086, "global_step": 2521, "epoch": 60} {"train_loss": -3.673846960067749, "global_step": 2522, "epoch": 60} {"train_loss": -3.645129680633545, "global_step": 2523, "epoch": 60} {"train_loss": -3.7470245361328125, "global_step": 2524, "epoch": 60} {"train_loss": -3.709575653076172, "global_step": 2525, "epoch": 60} {"train_loss": -3.69309139251709, "global_step": 2526, "epoch": 60} {"train_loss": -3.7408697605133057, "global_step": 2527, "epoch": 60} {"train_loss": -3.6238481998443604, "global_step": 2528, "epoch": 60} {"train_loss": -3.7691402435302734, "global_step": 2529, "epoch": 60} {"train_loss": -3.593404769897461, "global_step": 2530, "epoch": 60} {"train_loss": -3.8020219802856445, "global_step": 2531, "epoch": 60} {"train_loss": -3.6521382331848145, "global_step": 2532, "epoch": 60} {"train_loss": -3.7414069175720215, "global_step": 2533, "epoch": 60} {"train_loss": -3.6648902893066406, "global_step": 2534, "epoch": 60} {"train_loss": -3.5697906017303467, "global_step": 2535, "epoch": 60} {"train_loss": -3.6352694034576416, "global_step": 2536, "epoch": 60} {"train_loss": -3.6804542541503906, "global_step": 2537, "epoch": 60} {"train_loss": -3.5340988636016846, "global_step": 2538, "epoch": 60} {"train_loss": -3.7618982791900635, "global_step": 2539, "epoch": 60} {"train_loss": -3.6726675033569336, "global_step": 2540, "epoch": 60} {"train_loss": -3.6303153038024902, "global_step": 2541, "epoch": 60} {"train_loss": -3.6854066848754883, "global_step": 2542, "epoch": 60} {"train_loss": -3.6487317085266113, "global_step": 2543, "epoch": 60} {"train_loss": -3.668449878692627, "global_step": 2544, "epoch": 60} {"train_loss": -3.7892627716064453, "global_step": 2545, "epoch": 60} {"train_loss": -3.7681808471679688, "global_step": 2546, "epoch": 60} {"train_loss": -3.7226905822753906, "global_step": 2547, "epoch": 60} {"train_loss": -3.6024394035339355, "global_step": 2548, "epoch": 60} {"train_loss": -3.7056925296783447, "global_step": 2549, "epoch": 60} {"train_loss": -3.730403423309326, "global_step": 2550, "epoch": 60} {"train_loss": -3.7903409004211426, "global_step": 2551, "epoch": 60} {"train_loss": -3.926387310028076, "global_step": 2552, "epoch": 60} {"train_loss": -3.774984359741211, "global_step": 2553, "epoch": 60} {"train_loss": -3.8061909675598145, "global_step": 2554, "epoch": 60} {"train_loss": -3.8230605125427246, "global_step": 2555, "epoch": 60} {"train_loss": -3.7107491493225098, "global_step": 2556, "epoch": 60} {"train_loss": -3.886385440826416, "global_step": 2557, "epoch": 60} {"train_loss": -3.8721601963043213, "global_step": 2558, "epoch": 60} {"train_loss": -3.7387986183166504, "global_step": 2559, "epoch": 60} {"train_loss": -3.8380520343780518, "global_step": 2560, "epoch": 60} {"train_loss": -3.7090285505567278, "global_step": 2561, "epoch": 60, "val_loss": 171105.515625} {"train_loss": -3.687472105026245, "global_step": 2562, "epoch": 61} {"train_loss": -3.574960231781006, "global_step": 2563, "epoch": 61} {"train_loss": -3.689790725708008, "global_step": 2564, "epoch": 61} {"train_loss": -3.7159600257873535, "global_step": 2565, "epoch": 61} {"train_loss": -3.614638090133667, "global_step": 2566, "epoch": 61} {"train_loss": -3.60770320892334, "global_step": 2567, "epoch": 61} {"train_loss": -3.7726891040802, "global_step": 2568, "epoch": 61} {"train_loss": -3.703023910522461, "global_step": 2569, "epoch": 61} {"train_loss": -3.7014851570129395, "global_step": 2570, "epoch": 61} {"train_loss": -3.675380229949951, "global_step": 2571, "epoch": 61} {"train_loss": -3.771088123321533, "global_step": 2572, "epoch": 61} {"train_loss": -3.7364249229431152, "global_step": 2573, "epoch": 61} {"train_loss": -3.7145802974700928, "global_step": 2574, "epoch": 61} {"train_loss": -3.632984161376953, "global_step": 2575, "epoch": 61} {"train_loss": -3.764246702194214, "global_step": 2576, "epoch": 61} {"train_loss": -3.7753262519836426, "global_step": 2577, "epoch": 61} {"train_loss": -3.7139296531677246, "global_step": 2578, "epoch": 61} {"train_loss": -3.7739758491516113, "global_step": 2579, "epoch": 61} {"train_loss": -3.836411476135254, "global_step": 2580, "epoch": 61} {"train_loss": -3.8833818435668945, "global_step": 2581, "epoch": 61} {"train_loss": -3.578068494796753, "global_step": 2582, "epoch": 61} {"train_loss": -3.9361281394958496, "global_step": 2583, "epoch": 61} {"train_loss": -3.6146178245544434, "global_step": 2584, "epoch": 61} {"train_loss": -3.5719614028930664, "global_step": 2585, "epoch": 61} {"train_loss": -3.6215553283691406, "global_step": 2586, "epoch": 61} {"train_loss": -3.6191213130950928, "global_step": 2587, "epoch": 61} {"train_loss": -3.6785495281219482, "global_step": 2588, "epoch": 61} {"train_loss": -3.6290674209594727, "global_step": 2589, "epoch": 61} {"train_loss": -3.7368836402893066, "global_step": 2590, "epoch": 61} {"train_loss": -3.825284719467163, "global_step": 2591, "epoch": 61} {"train_loss": -3.7635316848754883, "global_step": 2592, "epoch": 61} {"train_loss": -3.7597501277923584, "global_step": 2593, "epoch": 61} {"train_loss": -3.780351161956787, "global_step": 2594, "epoch": 61} {"train_loss": -3.8129711151123047, "global_step": 2595, "epoch": 61} {"train_loss": -3.681952476501465, "global_step": 2596, "epoch": 61} {"train_loss": -3.741611957550049, "global_step": 2597, "epoch": 61} {"train_loss": -3.8376986980438232, "global_step": 2598, "epoch": 61} {"train_loss": -3.7319908142089844, "global_step": 2599, "epoch": 61} {"train_loss": -3.9617254734039307, "global_step": 2600, "epoch": 61} {"train_loss": -3.7784926891326904, "global_step": 2601, "epoch": 61} {"train_loss": -3.7414755821228027, "global_step": 2602, "epoch": 61} {"train_loss": -3.7245099317459833, "global_step": 2603, "epoch": 61, "val_loss": 168069.171875} {"train_loss": -3.817377805709839, "global_step": 2604, "epoch": 62} {"train_loss": -3.6868534088134766, "global_step": 2605, "epoch": 62} {"train_loss": -3.6970314979553223, "global_step": 2606, "epoch": 62} {"train_loss": -3.679253101348877, "global_step": 2607, "epoch": 62} {"train_loss": -3.8731422424316406, "global_step": 2608, "epoch": 62} {"train_loss": -3.7020387649536133, "global_step": 2609, "epoch": 62} {"train_loss": -3.482797622680664, "global_step": 2610, "epoch": 62} {"train_loss": -3.7966227531433105, "global_step": 2611, "epoch": 62} {"train_loss": -3.9138288497924805, "global_step": 2612, "epoch": 62} {"train_loss": -3.742912769317627, "global_step": 2613, "epoch": 62} {"train_loss": -3.6970648765563965, "global_step": 2614, "epoch": 62} {"train_loss": -3.820087432861328, "global_step": 2615, "epoch": 62} {"train_loss": -3.8943989276885986, "global_step": 2616, "epoch": 62} {"train_loss": -3.749569892883301, "global_step": 2617, "epoch": 62} {"train_loss": -3.6739258766174316, "global_step": 2618, "epoch": 62} {"train_loss": -3.958691120147705, "global_step": 2619, "epoch": 62} {"train_loss": -3.7508625984191895, "global_step": 2620, "epoch": 62} {"train_loss": -3.7715418338775635, "global_step": 2621, "epoch": 62} {"train_loss": -3.7493085861206055, "global_step": 2622, "epoch": 62} {"train_loss": -3.5163683891296387, "global_step": 2623, "epoch": 62} {"train_loss": -3.6797094345092773, "global_step": 2624, "epoch": 62} {"train_loss": -3.723064661026001, "global_step": 2625, "epoch": 62} {"train_loss": -3.510155439376831, "global_step": 2626, "epoch": 62} {"train_loss": -3.8974132537841797, "global_step": 2627, "epoch": 62} {"train_loss": -3.6970839500427246, "global_step": 2628, "epoch": 62} {"train_loss": -3.651066780090332, "global_step": 2629, "epoch": 62} {"train_loss": -3.778801918029785, "global_step": 2630, "epoch": 62} {"train_loss": -3.344514846801758, "global_step": 2631, "epoch": 62} {"train_loss": -3.7193822860717773, "global_step": 2632, "epoch": 62} {"train_loss": -3.7831149101257324, "global_step": 2633, "epoch": 62} {"train_loss": -3.4868388175964355, "global_step": 2634, "epoch": 62} {"train_loss": -3.7652788162231445, "global_step": 2635, "epoch": 62} {"train_loss": -3.370248794555664, "global_step": 2636, "epoch": 62} {"train_loss": -3.6470837593078613, "global_step": 2637, "epoch": 62} {"train_loss": -3.7861664295196533, "global_step": 2638, "epoch": 62} {"train_loss": -3.5902562141418457, "global_step": 2639, "epoch": 62} {"train_loss": -3.61572265625, "global_step": 2640, "epoch": 62} {"train_loss": -3.485501766204834, "global_step": 2641, "epoch": 62} {"train_loss": -3.765153169631958, "global_step": 2642, "epoch": 62} {"train_loss": -3.3932127952575684, "global_step": 2643, "epoch": 62} {"train_loss": -3.7184152603149414, "global_step": 2644, "epoch": 62} {"train_loss": -3.688562796229408, "global_step": 2645, "epoch": 62, "val_loss": 165606.25} {"train_loss": -3.6228647232055664, "global_step": 2646, "epoch": 63} {"train_loss": -3.5599045753479004, "global_step": 2647, "epoch": 63} {"train_loss": -3.6607699394226074, "global_step": 2648, "epoch": 63} {"train_loss": -3.615431308746338, "global_step": 2649, "epoch": 63} {"train_loss": -3.7307069301605225, "global_step": 2650, "epoch": 63} {"train_loss": -3.556851863861084, "global_step": 2651, "epoch": 63} {"train_loss": -3.817960262298584, "global_step": 2652, "epoch": 63} {"train_loss": -3.759263038635254, "global_step": 2653, "epoch": 63} {"train_loss": -3.716111183166504, "global_step": 2654, "epoch": 63} {"train_loss": -3.6973211765289307, "global_step": 2655, "epoch": 63} {"train_loss": -3.867062568664551, "global_step": 2656, "epoch": 63} {"train_loss": -3.63954496383667, "global_step": 2657, "epoch": 63} {"train_loss": -3.739386558532715, "global_step": 2658, "epoch": 63} {"train_loss": -3.8699731826782227, "global_step": 2659, "epoch": 63} {"train_loss": -3.793442726135254, "global_step": 2660, "epoch": 63} {"train_loss": -3.905343532562256, "global_step": 2661, "epoch": 63} {"train_loss": -3.7990965843200684, "global_step": 2662, "epoch": 63} {"train_loss": -3.7791366577148438, "global_step": 2663, "epoch": 63} {"train_loss": -3.7544679641723633, "global_step": 2664, "epoch": 63} {"train_loss": -3.714240074157715, "global_step": 2665, "epoch": 63} {"train_loss": -3.7533059120178223, "global_step": 2666, "epoch": 63} {"train_loss": -3.7006211280822754, "global_step": 2667, "epoch": 63} {"train_loss": -3.7223105430603027, "global_step": 2668, "epoch": 63} {"train_loss": -3.8175899982452393, "global_step": 2669, "epoch": 63} {"train_loss": -3.4697117805480957, "global_step": 2670, "epoch": 63} {"train_loss": -3.589848518371582, "global_step": 2671, "epoch": 63} {"train_loss": -3.571113348007202, "global_step": 2672, "epoch": 63} {"train_loss": -3.760385274887085, "global_step": 2673, "epoch": 63} {"train_loss": -3.6634583473205566, "global_step": 2674, "epoch": 63} {"train_loss": -3.8356847763061523, "global_step": 2675, "epoch": 63} {"train_loss": -3.901007890701294, "global_step": 2676, "epoch": 63} {"train_loss": -3.8679444789886475, "global_step": 2677, "epoch": 63} {"train_loss": -3.916624069213867, "global_step": 2678, "epoch": 63} {"train_loss": -3.7591423988342285, "global_step": 2679, "epoch": 63} {"train_loss": -3.7312674522399902, "global_step": 2680, "epoch": 63} {"train_loss": -3.58674955368042, "global_step": 2681, "epoch": 63} {"train_loss": -3.664771556854248, "global_step": 2682, "epoch": 63} {"train_loss": -3.944927215576172, "global_step": 2683, "epoch": 63} {"train_loss": -3.8130295276641846, "global_step": 2684, "epoch": 63} {"train_loss": -3.674164295196533, "global_step": 2685, "epoch": 63} {"train_loss": -3.826368808746338, "global_step": 2686, "epoch": 63} {"train_loss": -3.7376475788298107, "global_step": 2687, "epoch": 63, "val_loss": 162772.0} {"train_loss": -3.749573230743408, "global_step": 2688, "epoch": 64} {"train_loss": -3.846663236618042, "global_step": 2689, "epoch": 64} {"train_loss": -3.7937746047973633, "global_step": 2690, "epoch": 64} {"train_loss": -3.6171512603759766, "global_step": 2691, "epoch": 64} {"train_loss": -3.8187294006347656, "global_step": 2692, "epoch": 64} {"train_loss": -3.670197010040283, "global_step": 2693, "epoch": 64} {"train_loss": -3.856160879135132, "global_step": 2694, "epoch": 64} {"train_loss": -3.6293225288391113, "global_step": 2695, "epoch": 64} {"train_loss": -3.9241390228271484, "global_step": 2696, "epoch": 64} {"train_loss": -3.9632155895233154, "global_step": 2697, "epoch": 64} {"train_loss": -3.8491978645324707, "global_step": 2698, "epoch": 64} {"train_loss": -3.7407774925231934, "global_step": 2699, "epoch": 64} {"train_loss": -3.9057974815368652, "global_step": 2700, "epoch": 64} {"train_loss": -3.931809902191162, "global_step": 2701, "epoch": 64} {"train_loss": -3.9719605445861816, "global_step": 2702, "epoch": 64} {"train_loss": -3.4549312591552734, "global_step": 2703, "epoch": 64} {"train_loss": -3.689269542694092, "global_step": 2704, "epoch": 64} {"train_loss": -3.70935320854187, "global_step": 2705, "epoch": 64} {"train_loss": -3.6511998176574707, "global_step": 2706, "epoch": 64} {"train_loss": -3.749002456665039, "global_step": 2707, "epoch": 64} {"train_loss": -3.725771427154541, "global_step": 2708, "epoch": 64} {"train_loss": -3.759613513946533, "global_step": 2709, "epoch": 64} {"train_loss": -3.9152047634124756, "global_step": 2710, "epoch": 64} {"train_loss": -3.7841596603393555, "global_step": 2711, "epoch": 64} {"train_loss": -3.9062042236328125, "global_step": 2712, "epoch": 64} {"train_loss": -3.816547393798828, "global_step": 2713, "epoch": 64} {"train_loss": -3.7511396408081055, "global_step": 2714, "epoch": 64} {"train_loss": -3.7312426567077637, "global_step": 2715, "epoch": 64} {"train_loss": -3.876241683959961, "global_step": 2716, "epoch": 64} {"train_loss": -3.7502574920654297, "global_step": 2717, "epoch": 64} {"train_loss": -3.6053261756896973, "global_step": 2718, "epoch": 64} {"train_loss": -3.8954174518585205, "global_step": 2719, "epoch": 64} {"train_loss": -3.7616496086120605, "global_step": 2720, "epoch": 64} {"train_loss": -3.7835230827331543, "global_step": 2721, "epoch": 64} {"train_loss": -3.6794614791870117, "global_step": 2722, "epoch": 64} {"train_loss": -3.567568063735962, "global_step": 2723, "epoch": 64} {"train_loss": -3.7766287326812744, "global_step": 2724, "epoch": 64} {"train_loss": -3.7624306678771973, "global_step": 2725, "epoch": 64} {"train_loss": -3.455110549926758, "global_step": 2726, "epoch": 64} {"train_loss": -3.7988946437835693, "global_step": 2727, "epoch": 64} {"train_loss": -3.445711135864258, "global_step": 2728, "epoch": 64} {"train_loss": -3.7543474038441977, "global_step": 2729, "epoch": 64, "val_loss": 162817.90625} {"train_loss": -3.62384033203125, "global_step": 2730, "epoch": 65} {"train_loss": -3.590534210205078, "global_step": 2731, "epoch": 65} {"train_loss": -3.8409981727600098, "global_step": 2732, "epoch": 65} {"train_loss": -3.6145496368408203, "global_step": 2733, "epoch": 65} {"train_loss": -3.86242413520813, "global_step": 2734, "epoch": 65} {"train_loss": -3.508553981781006, "global_step": 2735, "epoch": 65} {"train_loss": -3.9219164848327637, "global_step": 2736, "epoch": 65} {"train_loss": -3.5793418884277344, "global_step": 2737, "epoch": 65} {"train_loss": -3.952425241470337, "global_step": 2738, "epoch": 65} {"train_loss": -3.7084250450134277, "global_step": 2739, "epoch": 65} {"train_loss": -3.794931173324585, "global_step": 2740, "epoch": 65} {"train_loss": -3.663407564163208, "global_step": 2741, "epoch": 65} {"train_loss": -3.859384059906006, "global_step": 2742, "epoch": 65} {"train_loss": -3.7569799423217773, "global_step": 2743, "epoch": 65} {"train_loss": -3.9043970108032227, "global_step": 2744, "epoch": 65} {"train_loss": -3.710339307785034, "global_step": 2745, "epoch": 65} {"train_loss": -3.944453239440918, "global_step": 2746, "epoch": 65} {"train_loss": -3.702760696411133, "global_step": 2747, "epoch": 65} {"train_loss": -3.81138277053833, "global_step": 2748, "epoch": 65} {"train_loss": -3.921513557434082, "global_step": 2749, "epoch": 65} {"train_loss": -3.8595829010009766, "global_step": 2750, "epoch": 65} {"train_loss": -3.7676262855529785, "global_step": 2751, "epoch": 65} {"train_loss": -3.744321346282959, "global_step": 2752, "epoch": 65} {"train_loss": -3.9627349376678467, "global_step": 2753, "epoch": 65} {"train_loss": -3.8317408561706543, "global_step": 2754, "epoch": 65} {"train_loss": -3.7999343872070312, "global_step": 2755, "epoch": 65} {"train_loss": -3.814042329788208, "global_step": 2756, "epoch": 65} {"train_loss": -3.7863006591796875, "global_step": 2757, "epoch": 65} {"train_loss": -3.8932833671569824, "global_step": 2758, "epoch": 65} {"train_loss": -3.9459900856018066, "global_step": 2759, "epoch": 65} {"train_loss": -3.821491241455078, "global_step": 2760, "epoch": 65} {"train_loss": -3.76606822013855, "global_step": 2761, "epoch": 65} {"train_loss": -3.803262710571289, "global_step": 2762, "epoch": 65} {"train_loss": -3.806485652923584, "global_step": 2763, "epoch": 65} {"train_loss": -4.00190544128418, "global_step": 2764, "epoch": 65} {"train_loss": -3.890887498855591, "global_step": 2765, "epoch": 65} {"train_loss": -3.6845245361328125, "global_step": 2766, "epoch": 65} {"train_loss": -3.8225951194763184, "global_step": 2767, "epoch": 65} {"train_loss": -3.747107982635498, "global_step": 2768, "epoch": 65} {"train_loss": -3.846742868423462, "global_step": 2769, "epoch": 65} {"train_loss": -3.910679817199707, "global_step": 2770, "epoch": 65} {"train_loss": -3.7948712962014333, "global_step": 2771, "epoch": 65, "val_loss": 157090.4375} {"train_loss": -3.896898031234741, "global_step": 2772, "epoch": 66} {"train_loss": -3.938640594482422, "global_step": 2773, "epoch": 66} {"train_loss": -3.8750548362731934, "global_step": 2774, "epoch": 66} {"train_loss": -3.78939151763916, "global_step": 2775, "epoch": 66} {"train_loss": -3.6971547603607178, "global_step": 2776, "epoch": 66} {"train_loss": -3.7937865257263184, "global_step": 2777, "epoch": 66} {"train_loss": -3.857637882232666, "global_step": 2778, "epoch": 66} {"train_loss": -3.729825019836426, "global_step": 2779, "epoch": 66} {"train_loss": -3.7777976989746094, "global_step": 2780, "epoch": 66} {"train_loss": -3.8961260318756104, "global_step": 2781, "epoch": 66} {"train_loss": -3.9004054069519043, "global_step": 2782, "epoch": 66} {"train_loss": -3.7959976196289062, "global_step": 2783, "epoch": 66} {"train_loss": -3.815805435180664, "global_step": 2784, "epoch": 66} {"train_loss": -3.677715301513672, "global_step": 2785, "epoch": 66} {"train_loss": -3.9223272800445557, "global_step": 2786, "epoch": 66} {"train_loss": -3.794279098510742, "global_step": 2787, "epoch": 66} {"train_loss": -3.671828269958496, "global_step": 2788, "epoch": 66} {"train_loss": -3.950680732727051, "global_step": 2789, "epoch": 66} {"train_loss": -3.7293176651000977, "global_step": 2790, "epoch": 66} {"train_loss": -3.7432353496551514, "global_step": 2791, "epoch": 66} {"train_loss": -3.7466020584106445, "global_step": 2792, "epoch": 66} {"train_loss": -3.7164559364318848, "global_step": 2793, "epoch": 66} {"train_loss": -3.58052921295166, "global_step": 2794, "epoch": 66} {"train_loss": -3.895782470703125, "global_step": 2795, "epoch": 66} {"train_loss": -3.511327028274536, "global_step": 2796, "epoch": 66} {"train_loss": -3.6248650550842285, "global_step": 2797, "epoch": 66} {"train_loss": -3.9425148963928223, "global_step": 2798, "epoch": 66} {"train_loss": -3.4182820320129395, "global_step": 2799, "epoch": 66} {"train_loss": -3.780653238296509, "global_step": 2800, "epoch": 66} {"train_loss": -3.661198616027832, "global_step": 2801, "epoch": 66} {"train_loss": -3.6120376586914062, "global_step": 2802, "epoch": 66} {"train_loss": -3.415151596069336, "global_step": 2803, "epoch": 66} {"train_loss": -3.6274821758270264, "global_step": 2804, "epoch": 66} {"train_loss": -3.500943183898926, "global_step": 2805, "epoch": 66} {"train_loss": -3.8004112243652344, "global_step": 2806, "epoch": 66} {"train_loss": -3.5521936416625977, "global_step": 2807, "epoch": 66} {"train_loss": -3.7179741859436035, "global_step": 2808, "epoch": 66} {"train_loss": -3.627030849456787, "global_step": 2809, "epoch": 66} {"train_loss": -4.005293369293213, "global_step": 2810, "epoch": 66} {"train_loss": -3.6972036361694336, "global_step": 2811, "epoch": 66} {"train_loss": -3.8647289276123047, "global_step": 2812, "epoch": 66} {"train_loss": -3.7436050517218455, "global_step": 2813, "epoch": 66, "val_loss": 157030.15625} {"train_loss": -3.922050952911377, "global_step": 2814, "epoch": 67} {"train_loss": -3.726314067840576, "global_step": 2815, "epoch": 67} {"train_loss": -3.825934648513794, "global_step": 2816, "epoch": 67} {"train_loss": -3.7759151458740234, "global_step": 2817, "epoch": 67} {"train_loss": -3.857612133026123, "global_step": 2818, "epoch": 67} {"train_loss": -3.769960641860962, "global_step": 2819, "epoch": 67} {"train_loss": -3.8605828285217285, "global_step": 2820, "epoch": 67} {"train_loss": -3.759681224822998, "global_step": 2821, "epoch": 67} {"train_loss": -3.7686703205108643, "global_step": 2822, "epoch": 67} {"train_loss": -3.9966063499450684, "global_step": 2823, "epoch": 67} {"train_loss": -3.7599477767944336, "global_step": 2824, "epoch": 67} {"train_loss": -3.930588722229004, "global_step": 2825, "epoch": 67} {"train_loss": -3.7388882637023926, "global_step": 2826, "epoch": 67} {"train_loss": -3.829771041870117, "global_step": 2827, "epoch": 67} {"train_loss": -3.8231115341186523, "global_step": 2828, "epoch": 67} {"train_loss": -3.7177343368530273, "global_step": 2829, "epoch": 67} {"train_loss": -4.000088691711426, "global_step": 2830, "epoch": 67} {"train_loss": -3.8626976013183594, "global_step": 2831, "epoch": 67} {"train_loss": -3.7331793308258057, "global_step": 2832, "epoch": 67} {"train_loss": -3.760913848876953, "global_step": 2833, "epoch": 67} {"train_loss": -3.8289408683776855, "global_step": 2834, "epoch": 67} {"train_loss": -3.8713507652282715, "global_step": 2835, "epoch": 67} {"train_loss": -3.763491630554199, "global_step": 2836, "epoch": 67} {"train_loss": -3.744589328765869, "global_step": 2837, "epoch": 67} {"train_loss": -3.8953466415405273, "global_step": 2838, "epoch": 67} {"train_loss": -3.733915328979492, "global_step": 2839, "epoch": 67} {"train_loss": -3.8887481689453125, "global_step": 2840, "epoch": 67} {"train_loss": -3.765937328338623, "global_step": 2841, "epoch": 67} {"train_loss": -3.7189877033233643, "global_step": 2842, "epoch": 67} {"train_loss": -3.9400861263275146, "global_step": 2843, "epoch": 67} {"train_loss": -3.7521770000457764, "global_step": 2844, "epoch": 67} {"train_loss": -3.6735339164733887, "global_step": 2845, "epoch": 67} {"train_loss": -3.988482713699341, "global_step": 2846, "epoch": 67} {"train_loss": -3.6601405143737793, "global_step": 2847, "epoch": 67} {"train_loss": -3.8279786109924316, "global_step": 2848, "epoch": 67} {"train_loss": -3.9401326179504395, "global_step": 2849, "epoch": 67} {"train_loss": -3.793652057647705, "global_step": 2850, "epoch": 67} {"train_loss": -3.8120298385620117, "global_step": 2851, "epoch": 67} {"train_loss": -3.6190147399902344, "global_step": 2852, "epoch": 67} {"train_loss": -3.9009647369384766, "global_step": 2853, "epoch": 67} {"train_loss": -3.964512348175049, "global_step": 2854, "epoch": 67} {"train_loss": -3.8196582283292497, "global_step": 2855, "epoch": 67, "val_loss": 158330.53125} {"train_loss": -3.8875279426574707, "global_step": 2856, "epoch": 68} {"train_loss": -3.820387363433838, "global_step": 2857, "epoch": 68} {"train_loss": -3.7609081268310547, "global_step": 2858, "epoch": 68} {"train_loss": -3.872272491455078, "global_step": 2859, "epoch": 68} {"train_loss": -3.889148712158203, "global_step": 2860, "epoch": 68} {"train_loss": -3.867711067199707, "global_step": 2861, "epoch": 68} {"train_loss": -3.65885066986084, "global_step": 2862, "epoch": 68} {"train_loss": -3.8584156036376953, "global_step": 2863, "epoch": 68} {"train_loss": -3.6112465858459473, "global_step": 2864, "epoch": 68} {"train_loss": -3.8727264404296875, "global_step": 2865, "epoch": 68} {"train_loss": -3.6081924438476562, "global_step": 2866, "epoch": 68} {"train_loss": -3.628075122833252, "global_step": 2867, "epoch": 68} {"train_loss": -3.7975142002105713, "global_step": 2868, "epoch": 68} {"train_loss": -3.7438430786132812, "global_step": 2869, "epoch": 68} {"train_loss": -3.8018321990966797, "global_step": 2870, "epoch": 68} {"train_loss": -3.853435754776001, "global_step": 2871, "epoch": 68} {"train_loss": -3.8331408500671387, "global_step": 2872, "epoch": 68} {"train_loss": -3.8781604766845703, "global_step": 2873, "epoch": 68} {"train_loss": -3.754851818084717, "global_step": 2874, "epoch": 68} {"train_loss": -4.013672351837158, "global_step": 2875, "epoch": 68} {"train_loss": -3.520707130432129, "global_step": 2876, "epoch": 68} {"train_loss": -3.9168591499328613, "global_step": 2877, "epoch": 68} {"train_loss": -3.7761831283569336, "global_step": 2878, "epoch": 68} {"train_loss": -3.738032579421997, "global_step": 2879, "epoch": 68} {"train_loss": -3.6763858795166016, "global_step": 2880, "epoch": 68} {"train_loss": -3.935136318206787, "global_step": 2881, "epoch": 68} {"train_loss": -3.7360920906066895, "global_step": 2882, "epoch": 68} {"train_loss": -3.8962759971618652, "global_step": 2883, "epoch": 68} {"train_loss": -3.637070655822754, "global_step": 2884, "epoch": 68} {"train_loss": -3.8551268577575684, "global_step": 2885, "epoch": 68} {"train_loss": -3.641160488128662, "global_step": 2886, "epoch": 68} {"train_loss": -3.932588815689087, "global_step": 2887, "epoch": 68} {"train_loss": -3.705765724182129, "global_step": 2888, "epoch": 68} {"train_loss": -3.7403247356414795, "global_step": 2889, "epoch": 68} {"train_loss": -3.6903915405273438, "global_step": 2890, "epoch": 68} {"train_loss": -3.763867139816284, "global_step": 2891, "epoch": 68} {"train_loss": -3.768232822418213, "global_step": 2892, "epoch": 68} {"train_loss": -3.9725124835968018, "global_step": 2893, "epoch": 68} {"train_loss": -3.662252902984619, "global_step": 2894, "epoch": 68} {"train_loss": -4.038493633270264, "global_step": 2895, "epoch": 68} {"train_loss": -3.6358702182769775, "global_step": 2896, "epoch": 68} {"train_loss": -3.790554716473534, "global_step": 2897, "epoch": 68, "val_loss": 152393.640625} {"train_loss": -3.816044330596924, "global_step": 2898, "epoch": 69} {"train_loss": -4.034999370574951, "global_step": 2899, "epoch": 69} {"train_loss": -3.7082581520080566, "global_step": 2900, "epoch": 69} {"train_loss": -4.0803070068359375, "global_step": 2901, "epoch": 69} {"train_loss": -3.736441135406494, "global_step": 2902, "epoch": 69} {"train_loss": -3.789271354675293, "global_step": 2903, "epoch": 69} {"train_loss": -3.8564043045043945, "global_step": 2904, "epoch": 69} {"train_loss": -3.955103874206543, "global_step": 2905, "epoch": 69} {"train_loss": -3.7445454597473145, "global_step": 2906, "epoch": 69} {"train_loss": -3.9342715740203857, "global_step": 2907, "epoch": 69} {"train_loss": -3.8940799236297607, "global_step": 2908, "epoch": 69} {"train_loss": -3.768141031265259, "global_step": 2909, "epoch": 69} {"train_loss": -3.8990094661712646, "global_step": 2910, "epoch": 69} {"train_loss": -4.010952472686768, "global_step": 2911, "epoch": 69} {"train_loss": -3.9934606552124023, "global_step": 2912, "epoch": 69} {"train_loss": -3.8512275218963623, "global_step": 2913, "epoch": 69} {"train_loss": -3.8937325477600098, "global_step": 2914, "epoch": 69} {"train_loss": -3.964850425720215, "global_step": 2915, "epoch": 69} {"train_loss": -3.917358875274658, "global_step": 2916, "epoch": 69} {"train_loss": -3.906384229660034, "global_step": 2917, "epoch": 69} {"train_loss": -3.898650646209717, "global_step": 2918, "epoch": 69} {"train_loss": -3.8639254570007324, "global_step": 2919, "epoch": 69} {"train_loss": -3.875913381576538, "global_step": 2920, "epoch": 69} {"train_loss": -3.8811838626861572, "global_step": 2921, "epoch": 69} {"train_loss": -3.810237407684326, "global_step": 2922, "epoch": 69} {"train_loss": -3.9009251594543457, "global_step": 2923, "epoch": 69} {"train_loss": -3.7847414016723633, "global_step": 2924, "epoch": 69} {"train_loss": -3.7576792240142822, "global_step": 2925, "epoch": 69} {"train_loss": -3.9558959007263184, "global_step": 2926, "epoch": 69} {"train_loss": -3.8034048080444336, "global_step": 2927, "epoch": 69} {"train_loss": -3.882115364074707, "global_step": 2928, "epoch": 69} {"train_loss": -4.002628326416016, "global_step": 2929, "epoch": 69} {"train_loss": -3.828544855117798, "global_step": 2930, "epoch": 69} {"train_loss": -3.868947982788086, "global_step": 2931, "epoch": 69} {"train_loss": -3.698272705078125, "global_step": 2932, "epoch": 69} {"train_loss": -3.9423866271972656, "global_step": 2933, "epoch": 69} {"train_loss": -3.7622549533843994, "global_step": 2934, "epoch": 69} {"train_loss": -3.85850191116333, "global_step": 2935, "epoch": 69} {"train_loss": -3.994696617126465, "global_step": 2936, "epoch": 69} {"train_loss": -3.8904953002929688, "global_step": 2937, "epoch": 69} {"train_loss": -3.771251678466797, "global_step": 2938, "epoch": 69} {"train_loss": -3.871100221361433, "global_step": 2939, "epoch": 69, "val_loss": 148015.34375} {"train_loss": -4.0514726638793945, "global_step": 2940, "epoch": 70} {"train_loss": -3.9607527256011963, "global_step": 2941, "epoch": 70} {"train_loss": -3.957789182662964, "global_step": 2942, "epoch": 70} {"train_loss": -4.067472457885742, "global_step": 2943, "epoch": 70} {"train_loss": -3.9701428413391113, "global_step": 2944, "epoch": 70} {"train_loss": -4.110301971435547, "global_step": 2945, "epoch": 70} {"train_loss": -3.8436660766601562, "global_step": 2946, "epoch": 70} {"train_loss": -3.9363579750061035, "global_step": 2947, "epoch": 70} {"train_loss": -3.9538681507110596, "global_step": 2948, "epoch": 70} {"train_loss": -3.9117484092712402, "global_step": 2949, "epoch": 70} {"train_loss": -3.9998884201049805, "global_step": 2950, "epoch": 70} {"train_loss": -3.865851879119873, "global_step": 2951, "epoch": 70} {"train_loss": -3.6363813877105713, "global_step": 2952, "epoch": 70} {"train_loss": -3.890143871307373, "global_step": 2953, "epoch": 70} {"train_loss": -3.84234881401062, "global_step": 2954, "epoch": 70} {"train_loss": -3.792320728302002, "global_step": 2955, "epoch": 70} {"train_loss": -3.935086250305176, "global_step": 2956, "epoch": 70} {"train_loss": -3.884737014770508, "global_step": 2957, "epoch": 70} {"train_loss": -3.9546971321105957, "global_step": 2958, "epoch": 70} {"train_loss": -3.659118890762329, "global_step": 2959, "epoch": 70} {"train_loss": -3.8007171154022217, "global_step": 2960, "epoch": 70} {"train_loss": -3.9774041175842285, "global_step": 2961, "epoch": 70} {"train_loss": -3.5785531997680664, "global_step": 2962, "epoch": 70} {"train_loss": -3.7112936973571777, "global_step": 2963, "epoch": 70} {"train_loss": -3.6711878776550293, "global_step": 2964, "epoch": 70} {"train_loss": -3.778202772140503, "global_step": 2965, "epoch": 70} {"train_loss": -3.633435010910034, "global_step": 2966, "epoch": 70} {"train_loss": -3.9264473915100098, "global_step": 2967, "epoch": 70} {"train_loss": -3.3813562393188477, "global_step": 2968, "epoch": 70} {"train_loss": -3.8913378715515137, "global_step": 2969, "epoch": 70} {"train_loss": -3.5013134479522705, "global_step": 2970, "epoch": 70} {"train_loss": -3.994889974594116, "global_step": 2971, "epoch": 70} {"train_loss": -3.624978542327881, "global_step": 2972, "epoch": 70} {"train_loss": -3.7336268424987793, "global_step": 2973, "epoch": 70} {"train_loss": -3.5465097427368164, "global_step": 2974, "epoch": 70} {"train_loss": -3.9277868270874023, "global_step": 2975, "epoch": 70} {"train_loss": -3.6713712215423584, "global_step": 2976, "epoch": 70} {"train_loss": -3.8806586265563965, "global_step": 2977, "epoch": 70} {"train_loss": -3.8226447105407715, "global_step": 2978, "epoch": 70} {"train_loss": -3.9448890686035156, "global_step": 2979, "epoch": 70} {"train_loss": -3.999617576599121, "global_step": 2980, "epoch": 70} {"train_loss": -3.836590494428362, "global_step": 2981, "epoch": 70, "val_loss": 150914.4375} {"train_loss": -3.8832449913024902, "global_step": 2982, "epoch": 71} {"train_loss": -3.9093127250671387, "global_step": 2983, "epoch": 71} {"train_loss": -3.7508511543273926, "global_step": 2984, "epoch": 71} {"train_loss": -3.868224620819092, "global_step": 2985, "epoch": 71} {"train_loss": -3.803886890411377, "global_step": 2986, "epoch": 71} {"train_loss": -3.8400590419769287, "global_step": 2987, "epoch": 71} {"train_loss": -3.7341296672821045, "global_step": 2988, "epoch": 71} {"train_loss": -3.918428659439087, "global_step": 2989, "epoch": 71} {"train_loss": -3.86112117767334, "global_step": 2990, "epoch": 71} {"train_loss": -4.0183796882629395, "global_step": 2991, "epoch": 71} {"train_loss": -3.976100444793701, "global_step": 2992, "epoch": 71} {"train_loss": -3.8261780738830566, "global_step": 2993, "epoch": 71} {"train_loss": -4.018721103668213, "global_step": 2994, "epoch": 71} {"train_loss": -3.908047914505005, "global_step": 2995, "epoch": 71} {"train_loss": -3.999427080154419, "global_step": 2996, "epoch": 71} {"train_loss": -3.8327488899230957, "global_step": 2997, "epoch": 71} {"train_loss": -3.9037718772888184, "global_step": 2998, "epoch": 71} {"train_loss": -3.7829020023345947, "global_step": 2999, "epoch": 71} {"train_loss": -3.9433255195617676, "global_step": 3000, "epoch": 71} {"train_loss": -3.786249876022339, "global_step": 3001, "epoch": 71} {"train_loss": -3.8524420261383057, "global_step": 3002, "epoch": 71} {"train_loss": -4.088901042938232, "global_step": 3003, "epoch": 71} {"train_loss": -3.967702865600586, "global_step": 3004, "epoch": 71} {"train_loss": -3.860489845275879, "global_step": 3005, "epoch": 71} {"train_loss": -4.087303161621094, "global_step": 3006, "epoch": 71} {"train_loss": -3.948216438293457, "global_step": 3007, "epoch": 71} {"train_loss": -3.7540106773376465, "global_step": 3008, "epoch": 71} {"train_loss": -3.9970028400421143, "global_step": 3009, "epoch": 71} {"train_loss": -3.959469795227051, "global_step": 3010, "epoch": 71} {"train_loss": -3.8400769233703613, "global_step": 3011, "epoch": 71} {"train_loss": -3.9384546279907227, "global_step": 3012, "epoch": 71} {"train_loss": -3.792987823486328, "global_step": 3013, "epoch": 71} {"train_loss": -4.058180332183838, "global_step": 3014, "epoch": 71} {"train_loss": -3.975236177444458, "global_step": 3015, "epoch": 71} {"train_loss": -3.8964221477508545, "global_step": 3016, "epoch": 71} {"train_loss": -3.978093147277832, "global_step": 3017, "epoch": 71} {"train_loss": -3.8073692321777344, "global_step": 3018, "epoch": 71} {"train_loss": -3.855966091156006, "global_step": 3019, "epoch": 71} {"train_loss": -4.07204532623291, "global_step": 3020, "epoch": 71} {"train_loss": -3.894331455230713, "global_step": 3021, "epoch": 71} {"train_loss": -3.911607503890991, "global_step": 3022, "epoch": 71} {"train_loss": -3.9077762762705484, "global_step": 3023, "epoch": 71, "val_loss": 147538.71875} {"train_loss": -4.018457412719727, "global_step": 3024, "epoch": 72} {"train_loss": -3.8408045768737793, "global_step": 3025, "epoch": 72} {"train_loss": -4.114536285400391, "global_step": 3026, "epoch": 72} {"train_loss": -4.094515800476074, "global_step": 3027, "epoch": 72} {"train_loss": -3.974355697631836, "global_step": 3028, "epoch": 72} {"train_loss": -4.004495620727539, "global_step": 3029, "epoch": 72} {"train_loss": -4.073356628417969, "global_step": 3030, "epoch": 72} {"train_loss": -3.9766626358032227, "global_step": 3031, "epoch": 72} {"train_loss": -3.691192626953125, "global_step": 3032, "epoch": 72} {"train_loss": -3.8890414237976074, "global_step": 3033, "epoch": 72} {"train_loss": -3.813905715942383, "global_step": 3034, "epoch": 72} {"train_loss": -3.947026252746582, "global_step": 3035, "epoch": 72} {"train_loss": -4.086488723754883, "global_step": 3036, "epoch": 72} {"train_loss": -3.886003017425537, "global_step": 3037, "epoch": 72} {"train_loss": -3.7772655487060547, "global_step": 3038, "epoch": 72} {"train_loss": -4.055280685424805, "global_step": 3039, "epoch": 72} {"train_loss": -3.4076485633850098, "global_step": 3040, "epoch": 72} {"train_loss": -3.867215633392334, "global_step": 3041, "epoch": 72} {"train_loss": -3.8496830463409424, "global_step": 3042, "epoch": 72} {"train_loss": -3.7598161697387695, "global_step": 3043, "epoch": 72} {"train_loss": -4.006803512573242, "global_step": 3044, "epoch": 72} {"train_loss": -3.962667465209961, "global_step": 3045, "epoch": 72} {"train_loss": -3.8231945037841797, "global_step": 3046, "epoch": 72} {"train_loss": -4.012351036071777, "global_step": 3047, "epoch": 72} {"train_loss": -3.9214119911193848, "global_step": 3048, "epoch": 72} {"train_loss": -3.8564252853393555, "global_step": 3049, "epoch": 72} {"train_loss": -3.819631338119507, "global_step": 3050, "epoch": 72} {"train_loss": -3.948747396469116, "global_step": 3051, "epoch": 72} {"train_loss": -3.949075222015381, "global_step": 3052, "epoch": 72} {"train_loss": -3.9618642330169678, "global_step": 3053, "epoch": 72} {"train_loss": -3.8723156452178955, "global_step": 3054, "epoch": 72} {"train_loss": -3.944166421890259, "global_step": 3055, "epoch": 72} {"train_loss": -4.009963512420654, "global_step": 3056, "epoch": 72} {"train_loss": -3.9192380905151367, "global_step": 3057, "epoch": 72} {"train_loss": -3.9392638206481934, "global_step": 3058, "epoch": 72} {"train_loss": -3.8736157417297363, "global_step": 3059, "epoch": 72} {"train_loss": -3.9119386672973633, "global_step": 3060, "epoch": 72} {"train_loss": -3.9785923957824707, "global_step": 3061, "epoch": 72} {"train_loss": -3.941946506500244, "global_step": 3062, "epoch": 72} {"train_loss": -3.9130897521972656, "global_step": 3063, "epoch": 72} {"train_loss": -3.9057531356811523, "global_step": 3064, "epoch": 72} {"train_loss": -3.920187246231806, "global_step": 3065, "epoch": 72, "val_loss": 143896.234375} {"train_loss": -4.072678565979004, "global_step": 3066, "epoch": 73} {"train_loss": -4.033472537994385, "global_step": 3067, "epoch": 73} {"train_loss": -4.00465202331543, "global_step": 3068, "epoch": 73} {"train_loss": -4.006612777709961, "global_step": 3069, "epoch": 73} {"train_loss": -3.9142093658447266, "global_step": 3070, "epoch": 73} {"train_loss": -3.931662082672119, "global_step": 3071, "epoch": 73} {"train_loss": -4.124621868133545, "global_step": 3072, "epoch": 73} {"train_loss": -3.9891738891601562, "global_step": 3073, "epoch": 73} {"train_loss": -3.9864025115966797, "global_step": 3074, "epoch": 73} {"train_loss": -4.037808418273926, "global_step": 3075, "epoch": 73} {"train_loss": -3.7498250007629395, "global_step": 3076, "epoch": 73} {"train_loss": -4.127666473388672, "global_step": 3077, "epoch": 73} {"train_loss": -4.056085109710693, "global_step": 3078, "epoch": 73} {"train_loss": -4.077924728393555, "global_step": 3079, "epoch": 73} {"train_loss": -3.7443342208862305, "global_step": 3080, "epoch": 73} {"train_loss": -3.84653377532959, "global_step": 3081, "epoch": 73} {"train_loss": -3.913080930709839, "global_step": 3082, "epoch": 73} {"train_loss": -3.892941474914551, "global_step": 3083, "epoch": 73} {"train_loss": -3.991090774536133, "global_step": 3084, "epoch": 73} {"train_loss": -4.131419658660889, "global_step": 3085, "epoch": 73} {"train_loss": -3.921389102935791, "global_step": 3086, "epoch": 73} {"train_loss": -4.072737216949463, "global_step": 3087, "epoch": 73} {"train_loss": -4.001982688903809, "global_step": 3088, "epoch": 73} {"train_loss": -3.9721121788024902, "global_step": 3089, "epoch": 73} {"train_loss": -4.095646858215332, "global_step": 3090, "epoch": 73} {"train_loss": -4.0316362380981445, "global_step": 3091, "epoch": 73} {"train_loss": -4.006750583648682, "global_step": 3092, "epoch": 73} {"train_loss": -3.9139866828918457, "global_step": 3093, "epoch": 73} {"train_loss": -3.95737361907959, "global_step": 3094, "epoch": 73} {"train_loss": -4.051516532897949, "global_step": 3095, "epoch": 73} {"train_loss": -3.96551513671875, "global_step": 3096, "epoch": 73} {"train_loss": -3.965315580368042, "global_step": 3097, "epoch": 73} {"train_loss": -4.112420082092285, "global_step": 3098, "epoch": 73} {"train_loss": -4.127155780792236, "global_step": 3099, "epoch": 73} {"train_loss": -4.0160017013549805, "global_step": 3100, "epoch": 73} {"train_loss": -3.8309454917907715, "global_step": 3101, "epoch": 73} {"train_loss": -3.8849997520446777, "global_step": 3102, "epoch": 73} {"train_loss": -3.95853590965271, "global_step": 3103, "epoch": 73} {"train_loss": -3.8668384552001953, "global_step": 3104, "epoch": 73} {"train_loss": -3.872939109802246, "global_step": 3105, "epoch": 73} {"train_loss": -3.9204535484313965, "global_step": 3106, "epoch": 73} {"train_loss": -3.9796523934318904, "global_step": 3107, "epoch": 73, "val_loss": 143450.46875} {"train_loss": -3.9424259662628174, "global_step": 3108, "epoch": 74} {"train_loss": -3.9031119346618652, "global_step": 3109, "epoch": 74} {"train_loss": -3.696521282196045, "global_step": 3110, "epoch": 74} {"train_loss": -3.9742989540100098, "global_step": 3111, "epoch": 74} {"train_loss": -4.050959587097168, "global_step": 3112, "epoch": 74} {"train_loss": -3.688009738922119, "global_step": 3113, "epoch": 74} {"train_loss": -4.031693458557129, "global_step": 3114, "epoch": 74} {"train_loss": -3.6950154304504395, "global_step": 3115, "epoch": 74} {"train_loss": -3.9420042037963867, "global_step": 3116, "epoch": 74} {"train_loss": -3.969550132751465, "global_step": 3117, "epoch": 74} {"train_loss": -3.9036121368408203, "global_step": 3118, "epoch": 74} {"train_loss": -3.8200764656066895, "global_step": 3119, "epoch": 74} {"train_loss": -3.9429843425750732, "global_step": 3120, "epoch": 74} {"train_loss": -3.9235167503356934, "global_step": 3121, "epoch": 74} {"train_loss": -3.9898436069488525, "global_step": 3122, "epoch": 74} {"train_loss": -3.949747085571289, "global_step": 3123, "epoch": 74} {"train_loss": -3.915729284286499, "global_step": 3124, "epoch": 74} {"train_loss": -4.030404090881348, "global_step": 3125, "epoch": 74} {"train_loss": -3.957198143005371, "global_step": 3126, "epoch": 74} {"train_loss": -4.053694248199463, "global_step": 3127, "epoch": 74} {"train_loss": -4.010080337524414, "global_step": 3128, "epoch": 74} {"train_loss": -4.011473655700684, "global_step": 3129, "epoch": 74} {"train_loss": -4.0370354652404785, "global_step": 3130, "epoch": 74} {"train_loss": -4.019108772277832, "global_step": 3131, "epoch": 74} {"train_loss": -3.934800386428833, "global_step": 3132, "epoch": 74} {"train_loss": -3.7959394454956055, "global_step": 3133, "epoch": 74} {"train_loss": -3.922278881072998, "global_step": 3134, "epoch": 74} {"train_loss": -3.9719157218933105, "global_step": 3135, "epoch": 74} {"train_loss": -4.002167701721191, "global_step": 3136, "epoch": 74} {"train_loss": -3.9380569458007812, "global_step": 3137, "epoch": 74} {"train_loss": -4.1343159675598145, "global_step": 3138, "epoch": 74} {"train_loss": -3.935514450073242, "global_step": 3139, "epoch": 74} {"train_loss": -4.00334358215332, "global_step": 3140, "epoch": 74} {"train_loss": -4.1557512283325195, "global_step": 3141, "epoch": 74} {"train_loss": -4.058048248291016, "global_step": 3142, "epoch": 74} {"train_loss": -4.182363986968994, "global_step": 3143, "epoch": 74} {"train_loss": -3.8960072994232178, "global_step": 3144, "epoch": 74} {"train_loss": -4.0301513671875, "global_step": 3145, "epoch": 74} {"train_loss": -3.928514003753662, "global_step": 3146, "epoch": 74} {"train_loss": -4.208822250366211, "global_step": 3147, "epoch": 74} {"train_loss": -4.0392255783081055, "global_step": 3148, "epoch": 74} {"train_loss": -3.9638610567365373, "global_step": 3149, "epoch": 74, "val_loss": 138110.375} {"train_loss": -4.235405921936035, "global_step": 3150, "epoch": 75} {"train_loss": -3.717012882232666, "global_step": 3151, "epoch": 75} {"train_loss": -3.8718678951263428, "global_step": 3152, "epoch": 75} {"train_loss": -3.786813259124756, "global_step": 3153, "epoch": 75} {"train_loss": -3.7986505031585693, "global_step": 3154, "epoch": 75} {"train_loss": -3.856177806854248, "global_step": 3155, "epoch": 75} {"train_loss": -4.057924270629883, "global_step": 3156, "epoch": 75} {"train_loss": -3.8385305404663086, "global_step": 3157, "epoch": 75} {"train_loss": -3.8780369758605957, "global_step": 3158, "epoch": 75} {"train_loss": -4.07036018371582, "global_step": 3159, "epoch": 75} {"train_loss": -3.9485294818878174, "global_step": 3160, "epoch": 75} {"train_loss": -4.072241306304932, "global_step": 3161, "epoch": 75} {"train_loss": -3.956831693649292, "global_step": 3162, "epoch": 75} {"train_loss": -3.9762966632843018, "global_step": 3163, "epoch": 75} {"train_loss": -3.9867684841156006, "global_step": 3164, "epoch": 75} {"train_loss": -3.9654881954193115, "global_step": 3165, "epoch": 75} {"train_loss": -4.0194549560546875, "global_step": 3166, "epoch": 75} {"train_loss": -4.204047203063965, "global_step": 3167, "epoch": 75} {"train_loss": -3.927041530609131, "global_step": 3168, "epoch": 75} {"train_loss": -3.9627466201782227, "global_step": 3169, "epoch": 75} {"train_loss": -3.8029866218566895, "global_step": 3170, "epoch": 75} {"train_loss": -3.983825445175171, "global_step": 3171, "epoch": 75} {"train_loss": -3.8212995529174805, "global_step": 3172, "epoch": 75} {"train_loss": -3.8667163848876953, "global_step": 3173, "epoch": 75} {"train_loss": -4.089054584503174, "global_step": 3174, "epoch": 75} {"train_loss": -3.899686098098755, "global_step": 3175, "epoch": 75} {"train_loss": -4.13142204284668, "global_step": 3176, "epoch": 75} {"train_loss": -4.065586090087891, "global_step": 3177, "epoch": 75} {"train_loss": -4.145101547241211, "global_step": 3178, "epoch": 75} {"train_loss": -4.0850677490234375, "global_step": 3179, "epoch": 75} {"train_loss": -4.018991947174072, "global_step": 3180, "epoch": 75} {"train_loss": -4.055331707000732, "global_step": 3181, "epoch": 75} {"train_loss": -4.139759063720703, "global_step": 3182, "epoch": 75} {"train_loss": -4.054296493530273, "global_step": 3183, "epoch": 75} {"train_loss": -3.9233243465423584, "global_step": 3184, "epoch": 75} {"train_loss": -3.811617851257324, "global_step": 3185, "epoch": 75} {"train_loss": -4.1837053298950195, "global_step": 3186, "epoch": 75} {"train_loss": -3.974911689758301, "global_step": 3187, "epoch": 75} {"train_loss": -4.09002685546875, "global_step": 3188, "epoch": 75} {"train_loss": -4.029452323913574, "global_step": 3189, "epoch": 75} {"train_loss": -3.9376142024993896, "global_step": 3190, "epoch": 75} {"train_loss": -3.9816153673898604, "global_step": 3191, "epoch": 75, "val_loss": 136504.671875} {"train_loss": -4.0576276779174805, "global_step": 3192, "epoch": 76} {"train_loss": -3.9444985389709473, "global_step": 3193, "epoch": 76} {"train_loss": -3.8757376670837402, "global_step": 3194, "epoch": 76} {"train_loss": -4.145525932312012, "global_step": 3195, "epoch": 76} {"train_loss": -3.9945201873779297, "global_step": 3196, "epoch": 76} {"train_loss": -3.9810445308685303, "global_step": 3197, "epoch": 76} {"train_loss": -3.9306516647338867, "global_step": 3198, "epoch": 76} {"train_loss": -3.9017748832702637, "global_step": 3199, "epoch": 76} {"train_loss": -4.0781569480896, "global_step": 3200, "epoch": 76} {"train_loss": -3.926525592803955, "global_step": 3201, "epoch": 76} {"train_loss": -3.863595724105835, "global_step": 3202, "epoch": 76} {"train_loss": -4.130296230316162, "global_step": 3203, "epoch": 76} {"train_loss": -4.146419525146484, "global_step": 3204, "epoch": 76} {"train_loss": -4.111588478088379, "global_step": 3205, "epoch": 76} {"train_loss": -3.954289197921753, "global_step": 3206, "epoch": 76} {"train_loss": -4.0893168449401855, "global_step": 3207, "epoch": 76} {"train_loss": -3.988171100616455, "global_step": 3208, "epoch": 76} {"train_loss": -3.9530601501464844, "global_step": 3209, "epoch": 76} {"train_loss": -4.018661022186279, "global_step": 3210, "epoch": 76} {"train_loss": -4.031301498413086, "global_step": 3211, "epoch": 76} {"train_loss": -3.9320056438446045, "global_step": 3212, "epoch": 76} {"train_loss": -4.00517463684082, "global_step": 3213, "epoch": 76} {"train_loss": -4.030046463012695, "global_step": 3214, "epoch": 76} {"train_loss": -3.8953471183776855, "global_step": 3215, "epoch": 76} {"train_loss": -4.005702018737793, "global_step": 3216, "epoch": 76} {"train_loss": -4.083081245422363, "global_step": 3217, "epoch": 76} {"train_loss": -3.9396886825561523, "global_step": 3218, "epoch": 76} {"train_loss": -4.036762237548828, "global_step": 3219, "epoch": 76} {"train_loss": -4.009468078613281, "global_step": 3220, "epoch": 76} {"train_loss": -4.028349876403809, "global_step": 3221, "epoch": 76} {"train_loss": -4.152829170227051, "global_step": 3222, "epoch": 76} {"train_loss": -4.071203231811523, "global_step": 3223, "epoch": 76} {"train_loss": -3.935274362564087, "global_step": 3224, "epoch": 76} {"train_loss": -4.2027692794799805, "global_step": 3225, "epoch": 76} {"train_loss": -3.9230613708496094, "global_step": 3226, "epoch": 76} {"train_loss": -3.939426898956299, "global_step": 3227, "epoch": 76} {"train_loss": -3.9656739234924316, "global_step": 3228, "epoch": 76} {"train_loss": -3.9859066009521484, "global_step": 3229, "epoch": 76} {"train_loss": -4.182347774505615, "global_step": 3230, "epoch": 76} {"train_loss": -4.009194850921631, "global_step": 3231, "epoch": 76} {"train_loss": -4.043980121612549, "global_step": 3232, "epoch": 76} {"train_loss": -4.014570434888204, "global_step": 3233, "epoch": 76, "val_loss": 136460.625} {"train_loss": -4.053564071655273, "global_step": 3234, "epoch": 77} {"train_loss": -3.9804320335388184, "global_step": 3235, "epoch": 77} {"train_loss": -3.882842540740967, "global_step": 3236, "epoch": 77} {"train_loss": -4.038544654846191, "global_step": 3237, "epoch": 77} {"train_loss": -4.131961345672607, "global_step": 3238, "epoch": 77} {"train_loss": -4.256204605102539, "global_step": 3239, "epoch": 77} {"train_loss": -3.863663673400879, "global_step": 3240, "epoch": 77} {"train_loss": -3.9866673946380615, "global_step": 3241, "epoch": 77} {"train_loss": -3.987652540206909, "global_step": 3242, "epoch": 77} {"train_loss": -3.9062564373016357, "global_step": 3243, "epoch": 77} {"train_loss": -3.7557473182678223, "global_step": 3244, "epoch": 77} {"train_loss": -3.8720250129699707, "global_step": 3245, "epoch": 77} {"train_loss": -3.732919692993164, "global_step": 3246, "epoch": 77} {"train_loss": -3.4502334594726562, "global_step": 3247, "epoch": 77} {"train_loss": -3.909724235534668, "global_step": 3248, "epoch": 77} {"train_loss": -3.786956310272217, "global_step": 3249, "epoch": 77} {"train_loss": -3.777329921722412, "global_step": 3250, "epoch": 77} {"train_loss": -3.8640873432159424, "global_step": 3251, "epoch": 77} {"train_loss": -3.7994537353515625, "global_step": 3252, "epoch": 77} {"train_loss": -3.539267063140869, "global_step": 3253, "epoch": 77} {"train_loss": -4.145750999450684, "global_step": 3254, "epoch": 77} {"train_loss": -3.524082660675049, "global_step": 3255, "epoch": 77} {"train_loss": -3.9675498008728027, "global_step": 3256, "epoch": 77} {"train_loss": -3.5250847339630127, "global_step": 3257, "epoch": 77} {"train_loss": -3.6991748809814453, "global_step": 3258, "epoch": 77} {"train_loss": -3.948639392852783, "global_step": 3259, "epoch": 77} {"train_loss": -3.768540382385254, "global_step": 3260, "epoch": 77} {"train_loss": -3.9313712120056152, "global_step": 3261, "epoch": 77} {"train_loss": -3.904430389404297, "global_step": 3262, "epoch": 77} {"train_loss": -3.886826992034912, "global_step": 3263, "epoch": 77} {"train_loss": -3.9802286624908447, "global_step": 3264, "epoch": 77} {"train_loss": -3.898024320602417, "global_step": 3265, "epoch": 77} {"train_loss": -3.87776255607605, "global_step": 3266, "epoch": 77} {"train_loss": -3.9306640625, "global_step": 3267, "epoch": 77} {"train_loss": -4.059232711791992, "global_step": 3268, "epoch": 77} {"train_loss": -4.019806861877441, "global_step": 3269, "epoch": 77} {"train_loss": -3.939701557159424, "global_step": 3270, "epoch": 77} {"train_loss": -3.9641571044921875, "global_step": 3271, "epoch": 77} {"train_loss": -3.8319783210754395, "global_step": 3272, "epoch": 77} {"train_loss": -4.038125991821289, "global_step": 3273, "epoch": 77} {"train_loss": -4.120865821838379, "global_step": 3274, "epoch": 77} {"train_loss": -3.8925060147330877, "global_step": 3275, "epoch": 77, "val_loss": 132384.703125} {"train_loss": -3.9974093437194824, "global_step": 3276, "epoch": 78} {"train_loss": -4.027092933654785, "global_step": 3277, "epoch": 78} {"train_loss": -4.000566482543945, "global_step": 3278, "epoch": 78} {"train_loss": -4.069573402404785, "global_step": 3279, "epoch": 78} {"train_loss": -4.122488498687744, "global_step": 3280, "epoch": 78} {"train_loss": -3.9466745853424072, "global_step": 3281, "epoch": 78} {"train_loss": -4.091650009155273, "global_step": 3282, "epoch": 78} {"train_loss": -4.0441389083862305, "global_step": 3283, "epoch": 78} {"train_loss": -4.097637176513672, "global_step": 3284, "epoch": 78} {"train_loss": -3.909538745880127, "global_step": 3285, "epoch": 78} {"train_loss": -4.140468597412109, "global_step": 3286, "epoch": 78} {"train_loss": -4.2281341552734375, "global_step": 3287, "epoch": 78} {"train_loss": -4.219818592071533, "global_step": 3288, "epoch": 78} {"train_loss": -3.9980602264404297, "global_step": 3289, "epoch": 78} {"train_loss": -4.157154560089111, "global_step": 3290, "epoch": 78} {"train_loss": -4.010515213012695, "global_step": 3291, "epoch": 78} {"train_loss": -3.916041612625122, "global_step": 3292, "epoch": 78} {"train_loss": -3.9310038089752197, "global_step": 3293, "epoch": 78} {"train_loss": -3.906013250350952, "global_step": 3294, "epoch": 78} {"train_loss": -4.03603458404541, "global_step": 3295, "epoch": 78} {"train_loss": -3.942852020263672, "global_step": 3296, "epoch": 78} {"train_loss": -3.952465057373047, "global_step": 3297, "epoch": 78} {"train_loss": -4.128223419189453, "global_step": 3298, "epoch": 78} {"train_loss": -4.0766191482543945, "global_step": 3299, "epoch": 78} {"train_loss": -4.0009660720825195, "global_step": 3300, "epoch": 78} {"train_loss": -3.9051718711853027, "global_step": 3301, "epoch": 78} {"train_loss": -4.1000165939331055, "global_step": 3302, "epoch": 78} {"train_loss": -3.9693777561187744, "global_step": 3303, "epoch": 78} {"train_loss": -4.099340438842773, "global_step": 3304, "epoch": 78} {"train_loss": -4.069021701812744, "global_step": 3305, "epoch": 78} {"train_loss": -4.070381164550781, "global_step": 3306, "epoch": 78} {"train_loss": -4.106528282165527, "global_step": 3307, "epoch": 78} {"train_loss": -4.139465808868408, "global_step": 3308, "epoch": 78} {"train_loss": -4.05224609375, "global_step": 3309, "epoch": 78} {"train_loss": -4.052896022796631, "global_step": 3310, "epoch": 78} {"train_loss": -4.092889785766602, "global_step": 3311, "epoch": 78} {"train_loss": -4.162178993225098, "global_step": 3312, "epoch": 78} {"train_loss": -4.147311210632324, "global_step": 3313, "epoch": 78} {"train_loss": -4.233519077301025, "global_step": 3314, "epoch": 78} {"train_loss": -4.124405860900879, "global_step": 3315, "epoch": 78} {"train_loss": -4.130571365356445, "global_step": 3316, "epoch": 78} {"train_loss": -4.059816888400486, "global_step": 3317, "epoch": 78, "val_loss": 130741.7734375} {"train_loss": -4.080255508422852, "global_step": 3318, "epoch": 79} {"train_loss": -4.224392890930176, "global_step": 3319, "epoch": 79} {"train_loss": -4.052755832672119, "global_step": 3320, "epoch": 79} {"train_loss": -3.9703426361083984, "global_step": 3321, "epoch": 79} {"train_loss": -4.139665603637695, "global_step": 3322, "epoch": 79} {"train_loss": -4.0832953453063965, "global_step": 3323, "epoch": 79} {"train_loss": -4.018418312072754, "global_step": 3324, "epoch": 79} {"train_loss": -4.087228775024414, "global_step": 3325, "epoch": 79} {"train_loss": -4.1192522048950195, "global_step": 3326, "epoch": 79} {"train_loss": -3.9718310832977295, "global_step": 3327, "epoch": 79} {"train_loss": -4.14089298248291, "global_step": 3328, "epoch": 79} {"train_loss": -4.1234636306762695, "global_step": 3329, "epoch": 79} {"train_loss": -4.014383792877197, "global_step": 3330, "epoch": 79} {"train_loss": -4.048036098480225, "global_step": 3331, "epoch": 79} {"train_loss": -3.9342408180236816, "global_step": 3332, "epoch": 79} {"train_loss": -4.198904991149902, "global_step": 3333, "epoch": 79} {"train_loss": -3.9202733039855957, "global_step": 3334, "epoch": 79} {"train_loss": -4.0459699630737305, "global_step": 3335, "epoch": 79} {"train_loss": -4.032796859741211, "global_step": 3336, "epoch": 79} {"train_loss": -4.224669933319092, "global_step": 3337, "epoch": 79} {"train_loss": -4.139596462249756, "global_step": 3338, "epoch": 79} {"train_loss": -4.148353099822998, "global_step": 3339, "epoch": 79} {"train_loss": -4.146031856536865, "global_step": 3340, "epoch": 79} {"train_loss": -4.020151138305664, "global_step": 3341, "epoch": 79} {"train_loss": -4.144401550292969, "global_step": 3342, "epoch": 79} {"train_loss": -4.2261433601379395, "global_step": 3343, "epoch": 79} {"train_loss": -4.18695068359375, "global_step": 3344, "epoch": 79} {"train_loss": -4.133131980895996, "global_step": 3345, "epoch": 79} {"train_loss": -4.052208423614502, "global_step": 3346, "epoch": 79} {"train_loss": -4.054656982421875, "global_step": 3347, "epoch": 79} {"train_loss": -4.162781715393066, "global_step": 3348, "epoch": 79} {"train_loss": -4.021337985992432, "global_step": 3349, "epoch": 79} {"train_loss": -4.1468024253845215, "global_step": 3350, "epoch": 79} {"train_loss": -4.287589073181152, "global_step": 3351, "epoch": 79} {"train_loss": -4.098854064941406, "global_step": 3352, "epoch": 79} {"train_loss": -4.055542945861816, "global_step": 3353, "epoch": 79} {"train_loss": -4.1065568923950195, "global_step": 3354, "epoch": 79} {"train_loss": -4.090892791748047, "global_step": 3355, "epoch": 79} {"train_loss": -3.9688425064086914, "global_step": 3356, "epoch": 79} {"train_loss": -4.065481185913086, "global_step": 3357, "epoch": 79} {"train_loss": -4.027564525604248, "global_step": 3358, "epoch": 79} {"train_loss": -4.091632178851536, "global_step": 3359, "epoch": 79, "val_loss": 127201.765625} {"train_loss": -4.179274559020996, "global_step": 3360, "epoch": 80} {"train_loss": -4.20918607711792, "global_step": 3361, "epoch": 80} {"train_loss": -4.055580139160156, "global_step": 3362, "epoch": 80} {"train_loss": -4.200716972351074, "global_step": 3363, "epoch": 80} {"train_loss": -4.1050591468811035, "global_step": 3364, "epoch": 80} {"train_loss": -4.175908088684082, "global_step": 3365, "epoch": 80} {"train_loss": -4.008571147918701, "global_step": 3366, "epoch": 80} {"train_loss": -4.104331970214844, "global_step": 3367, "epoch": 80} {"train_loss": -3.994255781173706, "global_step": 3368, "epoch": 80} {"train_loss": -4.176158905029297, "global_step": 3369, "epoch": 80} {"train_loss": -4.159446716308594, "global_step": 3370, "epoch": 80} {"train_loss": -4.141437530517578, "global_step": 3371, "epoch": 80} {"train_loss": -4.044048309326172, "global_step": 3372, "epoch": 80} {"train_loss": -4.038163661956787, "global_step": 3373, "epoch": 80} {"train_loss": -4.120341777801514, "global_step": 3374, "epoch": 80} {"train_loss": -3.9616146087646484, "global_step": 3375, "epoch": 80} {"train_loss": -3.943169116973877, "global_step": 3376, "epoch": 80} {"train_loss": -4.100250244140625, "global_step": 3377, "epoch": 80} {"train_loss": -4.082059860229492, "global_step": 3378, "epoch": 80} {"train_loss": -3.8530631065368652, "global_step": 3379, "epoch": 80} {"train_loss": -3.8703951835632324, "global_step": 3380, "epoch": 80} {"train_loss": -4.153163909912109, "global_step": 3381, "epoch": 80} {"train_loss": -4.034947395324707, "global_step": 3382, "epoch": 80} {"train_loss": -4.072084426879883, "global_step": 3383, "epoch": 80} {"train_loss": -3.937849521636963, "global_step": 3384, "epoch": 80} {"train_loss": -4.2418212890625, "global_step": 3385, "epoch": 80} {"train_loss": -4.1048078536987305, "global_step": 3386, "epoch": 80} {"train_loss": -4.066983222961426, "global_step": 3387, "epoch": 80} {"train_loss": -4.096656799316406, "global_step": 3388, "epoch": 80} {"train_loss": -4.184548377990723, "global_step": 3389, "epoch": 80} {"train_loss": -3.9868812561035156, "global_step": 3390, "epoch": 80} {"train_loss": -4.133365154266357, "global_step": 3391, "epoch": 80} {"train_loss": -4.097668647766113, "global_step": 3392, "epoch": 80} {"train_loss": -4.116724014282227, "global_step": 3393, "epoch": 80} {"train_loss": -4.0849456787109375, "global_step": 3394, "epoch": 80} {"train_loss": -4.195058345794678, "global_step": 3395, "epoch": 80} {"train_loss": -4.122733116149902, "global_step": 3396, "epoch": 80} {"train_loss": -4.111590385437012, "global_step": 3397, "epoch": 80} {"train_loss": -4.136444091796875, "global_step": 3398, "epoch": 80} {"train_loss": -4.07000207901001, "global_step": 3399, "epoch": 80} {"train_loss": -4.002974510192871, "global_step": 3400, "epoch": 80} {"train_loss": -4.088248860268366, "global_step": 3401, "epoch": 80, "val_loss": 129344.5390625} {"train_loss": -4.143482208251953, "global_step": 3402, "epoch": 81} {"train_loss": -4.12392520904541, "global_step": 3403, "epoch": 81} {"train_loss": -4.063509941101074, "global_step": 3404, "epoch": 81} {"train_loss": -4.166741371154785, "global_step": 3405, "epoch": 81} {"train_loss": -4.187540054321289, "global_step": 3406, "epoch": 81} {"train_loss": -4.197518348693848, "global_step": 3407, "epoch": 81} {"train_loss": -4.136467456817627, "global_step": 3408, "epoch": 81} {"train_loss": -4.273144721984863, "global_step": 3409, "epoch": 81} {"train_loss": -4.125077247619629, "global_step": 3410, "epoch": 81} {"train_loss": -4.077016830444336, "global_step": 3411, "epoch": 81} {"train_loss": -4.1752166748046875, "global_step": 3412, "epoch": 81} {"train_loss": -4.153231620788574, "global_step": 3413, "epoch": 81} {"train_loss": -4.073731899261475, "global_step": 3414, "epoch": 81} {"train_loss": -4.171872138977051, "global_step": 3415, "epoch": 81} {"train_loss": -4.055346488952637, "global_step": 3416, "epoch": 81} {"train_loss": -3.965001106262207, "global_step": 3417, "epoch": 81} {"train_loss": -4.059793949127197, "global_step": 3418, "epoch": 81} {"train_loss": -4.066903591156006, "global_step": 3419, "epoch": 81} {"train_loss": -4.145617485046387, "global_step": 3420, "epoch": 81} {"train_loss": -4.183876037597656, "global_step": 3421, "epoch": 81} {"train_loss": -3.938476800918579, "global_step": 3422, "epoch": 81} {"train_loss": -3.9429216384887695, "global_step": 3423, "epoch": 81} {"train_loss": -4.165320873260498, "global_step": 3424, "epoch": 81} {"train_loss": -3.9988603591918945, "global_step": 3425, "epoch": 81} {"train_loss": -4.091331958770752, "global_step": 3426, "epoch": 81} {"train_loss": -4.173226356506348, "global_step": 3427, "epoch": 81} {"train_loss": -3.9203665256500244, "global_step": 3428, "epoch": 81} {"train_loss": -3.8821609020233154, "global_step": 3429, "epoch": 81} {"train_loss": -4.222695350646973, "global_step": 3430, "epoch": 81} {"train_loss": -3.9055304527282715, "global_step": 3431, "epoch": 81} {"train_loss": -4.126345634460449, "global_step": 3432, "epoch": 81} {"train_loss": -4.103392601013184, "global_step": 3433, "epoch": 81} {"train_loss": -4.158740520477295, "global_step": 3434, "epoch": 81} {"train_loss": -4.048764228820801, "global_step": 3435, "epoch": 81} {"train_loss": -4.131481170654297, "global_step": 3436, "epoch": 81} {"train_loss": -4.042787551879883, "global_step": 3437, "epoch": 81} {"train_loss": -4.1054487228393555, "global_step": 3438, "epoch": 81} {"train_loss": -4.10538387298584, "global_step": 3439, "epoch": 81} {"train_loss": -4.020340919494629, "global_step": 3440, "epoch": 81} {"train_loss": -4.229797840118408, "global_step": 3441, "epoch": 81} {"train_loss": -4.172800540924072, "global_step": 3442, "epoch": 81} {"train_loss": -4.09933770838238, "global_step": 3443, "epoch": 81, "val_loss": 127380.71875} {"train_loss": -4.286476135253906, "global_step": 3444, "epoch": 82} {"train_loss": -3.922687530517578, "global_step": 3445, "epoch": 82} {"train_loss": -4.318568229675293, "global_step": 3446, "epoch": 82} {"train_loss": -4.19064998626709, "global_step": 3447, "epoch": 82} {"train_loss": -4.050492286682129, "global_step": 3448, "epoch": 82} {"train_loss": -4.215938568115234, "global_step": 3449, "epoch": 82} {"train_loss": -4.111566543579102, "global_step": 3450, "epoch": 82} {"train_loss": -4.10078239440918, "global_step": 3451, "epoch": 82} {"train_loss": -4.077839374542236, "global_step": 3452, "epoch": 82} {"train_loss": -4.132842540740967, "global_step": 3453, "epoch": 82} {"train_loss": -4.231488227844238, "global_step": 3454, "epoch": 82} {"train_loss": -4.0758161544799805, "global_step": 3455, "epoch": 82} {"train_loss": -4.217495441436768, "global_step": 3456, "epoch": 82} {"train_loss": -4.178858757019043, "global_step": 3457, "epoch": 82} {"train_loss": -4.123973846435547, "global_step": 3458, "epoch": 82} {"train_loss": -4.198212623596191, "global_step": 3459, "epoch": 82} {"train_loss": -4.169049263000488, "global_step": 3460, "epoch": 82} {"train_loss": -4.128457546234131, "global_step": 3461, "epoch": 82} {"train_loss": -4.146455764770508, "global_step": 3462, "epoch": 82} {"train_loss": -4.1854400634765625, "global_step": 3463, "epoch": 82} {"train_loss": -4.303591728210449, "global_step": 3464, "epoch": 82} {"train_loss": -4.152487277984619, "global_step": 3465, "epoch": 82} {"train_loss": -4.224032402038574, "global_step": 3466, "epoch": 82} {"train_loss": -3.8748598098754883, "global_step": 3467, "epoch": 82} {"train_loss": -4.156552314758301, "global_step": 3468, "epoch": 82} {"train_loss": -4.195126533508301, "global_step": 3469, "epoch": 82} {"train_loss": -3.792398691177368, "global_step": 3470, "epoch": 82} {"train_loss": -4.120684623718262, "global_step": 3471, "epoch": 82} {"train_loss": -4.328364849090576, "global_step": 3472, "epoch": 82} {"train_loss": -4.174818515777588, "global_step": 3473, "epoch": 82} {"train_loss": -4.1183319091796875, "global_step": 3474, "epoch": 82} {"train_loss": -4.115649223327637, "global_step": 3475, "epoch": 82} {"train_loss": -4.083958625793457, "global_step": 3476, "epoch": 82} {"train_loss": -4.137118339538574, "global_step": 3477, "epoch": 82} {"train_loss": -4.0896453857421875, "global_step": 3478, "epoch": 82} {"train_loss": -4.126319885253906, "global_step": 3479, "epoch": 82} {"train_loss": -4.195456027984619, "global_step": 3480, "epoch": 82} {"train_loss": -4.243010520935059, "global_step": 3481, "epoch": 82} {"train_loss": -4.020307540893555, "global_step": 3482, "epoch": 82} {"train_loss": -4.048617839813232, "global_step": 3483, "epoch": 82} {"train_loss": -3.94036865234375, "global_step": 3484, "epoch": 82} {"train_loss": -4.134655833244324, "global_step": 3485, "epoch": 82, "val_loss": 126505.921875} {"train_loss": -4.111005783081055, "global_step": 3486, "epoch": 83} {"train_loss": -3.9434428215026855, "global_step": 3487, "epoch": 83} {"train_loss": -3.8471522331237793, "global_step": 3488, "epoch": 83} {"train_loss": -4.084651947021484, "global_step": 3489, "epoch": 83} {"train_loss": -4.106925964355469, "global_step": 3490, "epoch": 83} {"train_loss": -3.924198865890503, "global_step": 3491, "epoch": 83} {"train_loss": -4.17211389541626, "global_step": 3492, "epoch": 83} {"train_loss": -4.209136486053467, "global_step": 3493, "epoch": 83} {"train_loss": -4.099682807922363, "global_step": 3494, "epoch": 83} {"train_loss": -4.242680549621582, "global_step": 3495, "epoch": 83} {"train_loss": -4.002729415893555, "global_step": 3496, "epoch": 83} {"train_loss": -4.147237300872803, "global_step": 3497, "epoch": 83} {"train_loss": -4.203768730163574, "global_step": 3498, "epoch": 83} {"train_loss": -4.011801719665527, "global_step": 3499, "epoch": 83} {"train_loss": -4.322310447692871, "global_step": 3500, "epoch": 83} {"train_loss": -4.185182094573975, "global_step": 3501, "epoch": 83} {"train_loss": -4.159607887268066, "global_step": 3502, "epoch": 83} {"train_loss": -4.132932662963867, "global_step": 3503, "epoch": 83} {"train_loss": -4.284116268157959, "global_step": 3504, "epoch": 83} {"train_loss": -4.12709903717041, "global_step": 3505, "epoch": 83} {"train_loss": -4.2474260330200195, "global_step": 3506, "epoch": 83} {"train_loss": -4.196203231811523, "global_step": 3507, "epoch": 83} {"train_loss": -4.138751983642578, "global_step": 3508, "epoch": 83} {"train_loss": -4.170459747314453, "global_step": 3509, "epoch": 83} {"train_loss": -4.214365005493164, "global_step": 3510, "epoch": 83} {"train_loss": -4.183728218078613, "global_step": 3511, "epoch": 83} {"train_loss": -4.257660865783691, "global_step": 3512, "epoch": 83} {"train_loss": -4.362582683563232, "global_step": 3513, "epoch": 83} {"train_loss": -4.160082817077637, "global_step": 3514, "epoch": 83} {"train_loss": -4.077887535095215, "global_step": 3515, "epoch": 83} {"train_loss": -4.192564964294434, "global_step": 3516, "epoch": 83} {"train_loss": -4.169005393981934, "global_step": 3517, "epoch": 83} {"train_loss": -4.137284278869629, "global_step": 3518, "epoch": 83} {"train_loss": -4.145960330963135, "global_step": 3519, "epoch": 83} {"train_loss": -4.18584680557251, "global_step": 3520, "epoch": 83} {"train_loss": -4.178661823272705, "global_step": 3521, "epoch": 83} {"train_loss": -4.230936050415039, "global_step": 3522, "epoch": 83} {"train_loss": -4.114635944366455, "global_step": 3523, "epoch": 83} {"train_loss": -4.0053911209106445, "global_step": 3524, "epoch": 83} {"train_loss": -4.105810165405273, "global_step": 3525, "epoch": 83} {"train_loss": -4.169137477874756, "global_step": 3526, "epoch": 83} {"train_loss": -4.141625285148621, "global_step": 3527, "epoch": 83, "val_loss": 127106.2265625} {"train_loss": -4.046172618865967, "global_step": 3528, "epoch": 84} {"train_loss": -4.010512351989746, "global_step": 3529, "epoch": 84} {"train_loss": -4.270302772521973, "global_step": 3530, "epoch": 84} {"train_loss": -4.186149597167969, "global_step": 3531, "epoch": 84} {"train_loss": -3.952472686767578, "global_step": 3532, "epoch": 84} {"train_loss": -4.112612724304199, "global_step": 3533, "epoch": 84} {"train_loss": -4.092690467834473, "global_step": 3534, "epoch": 84} {"train_loss": -4.003631114959717, "global_step": 3535, "epoch": 84} {"train_loss": -4.308278560638428, "global_step": 3536, "epoch": 84} {"train_loss": -4.288801193237305, "global_step": 3537, "epoch": 84} {"train_loss": -4.042362213134766, "global_step": 3538, "epoch": 84} {"train_loss": -4.1302900314331055, "global_step": 3539, "epoch": 84} {"train_loss": -4.021557807922363, "global_step": 3540, "epoch": 84} {"train_loss": -4.146126747131348, "global_step": 3541, "epoch": 84} {"train_loss": -4.318572521209717, "global_step": 3542, "epoch": 84} {"train_loss": -3.9334311485290527, "global_step": 3543, "epoch": 84} {"train_loss": -4.165992736816406, "global_step": 3544, "epoch": 84} {"train_loss": -4.102133750915527, "global_step": 3545, "epoch": 84} {"train_loss": -4.206822872161865, "global_step": 3546, "epoch": 84} {"train_loss": -4.095991134643555, "global_step": 3547, "epoch": 84} {"train_loss": -3.931772470474243, "global_step": 3548, "epoch": 84} {"train_loss": -4.083618640899658, "global_step": 3549, "epoch": 84} {"train_loss": -3.831768035888672, "global_step": 3550, "epoch": 84} {"train_loss": -4.217716693878174, "global_step": 3551, "epoch": 84} {"train_loss": -3.927427291870117, "global_step": 3552, "epoch": 84} {"train_loss": -4.171504974365234, "global_step": 3553, "epoch": 84} {"train_loss": -3.943905830383301, "global_step": 3554, "epoch": 84} {"train_loss": -4.118699073791504, "global_step": 3555, "epoch": 84} {"train_loss": -4.075194358825684, "global_step": 3556, "epoch": 84} {"train_loss": -4.141468524932861, "global_step": 3557, "epoch": 84} {"train_loss": -4.145410537719727, "global_step": 3558, "epoch": 84} {"train_loss": -4.058917045593262, "global_step": 3559, "epoch": 84} {"train_loss": -4.217842102050781, "global_step": 3560, "epoch": 84} {"train_loss": -4.041419982910156, "global_step": 3561, "epoch": 84} {"train_loss": -4.100325584411621, "global_step": 3562, "epoch": 84} {"train_loss": -4.158030033111572, "global_step": 3563, "epoch": 84} {"train_loss": -4.165993690490723, "global_step": 3564, "epoch": 84} {"train_loss": -4.026192665100098, "global_step": 3565, "epoch": 84} {"train_loss": -4.204429626464844, "global_step": 3566, "epoch": 84} {"train_loss": -4.110138893127441, "global_step": 3567, "epoch": 84} {"train_loss": -4.0796613693237305, "global_step": 3568, "epoch": 84} {"train_loss": -4.106881635529654, "global_step": 3569, "epoch": 84, "val_loss": 124694.3046875} {"train_loss": -4.216222286224365, "global_step": 3570, "epoch": 85} {"train_loss": -4.203587532043457, "global_step": 3571, "epoch": 85} {"train_loss": -3.9718449115753174, "global_step": 3572, "epoch": 85} {"train_loss": -4.240396499633789, "global_step": 3573, "epoch": 85} {"train_loss": -4.123908996582031, "global_step": 3574, "epoch": 85} {"train_loss": -4.023409843444824, "global_step": 3575, "epoch": 85} {"train_loss": -4.1641950607299805, "global_step": 3576, "epoch": 85} {"train_loss": -4.054445266723633, "global_step": 3577, "epoch": 85} {"train_loss": -4.270145416259766, "global_step": 3578, "epoch": 85} {"train_loss": -4.208942413330078, "global_step": 3579, "epoch": 85} {"train_loss": -4.194564342498779, "global_step": 3580, "epoch": 85} {"train_loss": -4.169739723205566, "global_step": 3581, "epoch": 85} {"train_loss": -4.125913619995117, "global_step": 3582, "epoch": 85} {"train_loss": -4.024467468261719, "global_step": 3583, "epoch": 85} {"train_loss": -4.314597129821777, "global_step": 3584, "epoch": 85} {"train_loss": -3.995875358581543, "global_step": 3585, "epoch": 85} {"train_loss": -4.357006072998047, "global_step": 3586, "epoch": 85} {"train_loss": -4.074735164642334, "global_step": 3587, "epoch": 85} {"train_loss": -4.128896713256836, "global_step": 3588, "epoch": 85} {"train_loss": -3.903282642364502, "global_step": 3589, "epoch": 85} {"train_loss": -4.1882476806640625, "global_step": 3590, "epoch": 85} {"train_loss": -3.7665181159973145, "global_step": 3591, "epoch": 85} {"train_loss": -3.6559226512908936, "global_step": 3592, "epoch": 85} {"train_loss": -4.107271194458008, "global_step": 3593, "epoch": 85} {"train_loss": -3.227430820465088, "global_step": 3594, "epoch": 85} {"train_loss": -4.14656400680542, "global_step": 3595, "epoch": 85} {"train_loss": -2.998814105987549, "global_step": 3596, "epoch": 85} {"train_loss": -3.660782814025879, "global_step": 3597, "epoch": 85} {"train_loss": -3.5451087951660156, "global_step": 3598, "epoch": 85} {"train_loss": -3.3954458236694336, "global_step": 3599, "epoch": 85} {"train_loss": -3.4138102531433105, "global_step": 3600, "epoch": 85} {"train_loss": -3.5507900714874268, "global_step": 3601, "epoch": 85} {"train_loss": -3.6473937034606934, "global_step": 3602, "epoch": 85} {"train_loss": -3.5697245597839355, "global_step": 3603, "epoch": 85} {"train_loss": -3.643221378326416, "global_step": 3604, "epoch": 85} {"train_loss": -3.7600510120391846, "global_step": 3605, "epoch": 85} {"train_loss": -3.840951919555664, "global_step": 3606, "epoch": 85} {"train_loss": -3.7560391426086426, "global_step": 3607, "epoch": 85} {"train_loss": -3.8778040409088135, "global_step": 3608, "epoch": 85} {"train_loss": -3.7932088375091553, "global_step": 3609, "epoch": 85} {"train_loss": -3.8576154708862305, "global_step": 3610, "epoch": 85} {"train_loss": -3.9048507724489485, "global_step": 3611, "epoch": 85, "val_loss": 122791.421875} {"train_loss": -3.9502973556518555, "global_step": 3612, "epoch": 86} {"train_loss": -3.93418550491333, "global_step": 3613, "epoch": 86} {"train_loss": -3.977736711502075, "global_step": 3614, "epoch": 86} {"train_loss": -3.890843629837036, "global_step": 3615, "epoch": 86} {"train_loss": -4.041595935821533, "global_step": 3616, "epoch": 86} {"train_loss": -3.9861598014831543, "global_step": 3617, "epoch": 86} {"train_loss": -4.110014915466309, "global_step": 3618, "epoch": 86} {"train_loss": -4.148700714111328, "global_step": 3619, "epoch": 86} {"train_loss": -4.020676136016846, "global_step": 3620, "epoch": 86} {"train_loss": -3.979790210723877, "global_step": 3621, "epoch": 86} {"train_loss": -3.91827130317688, "global_step": 3622, "epoch": 86} {"train_loss": -3.9534196853637695, "global_step": 3623, "epoch": 86} {"train_loss": -4.161822319030762, "global_step": 3624, "epoch": 86} {"train_loss": -4.032084941864014, "global_step": 3625, "epoch": 86} {"train_loss": -3.9453701972961426, "global_step": 3626, "epoch": 86} {"train_loss": -4.041668891906738, "global_step": 3627, "epoch": 86} {"train_loss": -4.076637268066406, "global_step": 3628, "epoch": 86} {"train_loss": -4.051236629486084, "global_step": 3629, "epoch": 86} {"train_loss": -3.848270893096924, "global_step": 3630, "epoch": 86} {"train_loss": -4.106717109680176, "global_step": 3631, "epoch": 86} {"train_loss": -3.900670051574707, "global_step": 3632, "epoch": 86} {"train_loss": -3.9064598083496094, "global_step": 3633, "epoch": 86} {"train_loss": -4.202415466308594, "global_step": 3634, "epoch": 86} {"train_loss": -3.8069353103637695, "global_step": 3635, "epoch": 86} {"train_loss": -4.039887428283691, "global_step": 3636, "epoch": 86} {"train_loss": -4.018062114715576, "global_step": 3637, "epoch": 86} {"train_loss": -4.113016128540039, "global_step": 3638, "epoch": 86} {"train_loss": -3.8988184928894043, "global_step": 3639, "epoch": 86} {"train_loss": -4.140573024749756, "global_step": 3640, "epoch": 86} {"train_loss": -3.6981360912323, "global_step": 3641, "epoch": 86} {"train_loss": -3.867846965789795, "global_step": 3642, "epoch": 86} {"train_loss": -3.8821260929107666, "global_step": 3643, "epoch": 86} {"train_loss": -4.107370376586914, "global_step": 3644, "epoch": 86} {"train_loss": -3.8427085876464844, "global_step": 3645, "epoch": 86} {"train_loss": -4.210822105407715, "global_step": 3646, "epoch": 86} {"train_loss": -3.866863489151001, "global_step": 3647, "epoch": 86} {"train_loss": -4.025676727294922, "global_step": 3648, "epoch": 86} {"train_loss": -3.79207706451416, "global_step": 3649, "epoch": 86} {"train_loss": -3.8896751403808594, "global_step": 3650, "epoch": 86} {"train_loss": -4.158465385437012, "global_step": 3651, "epoch": 86} {"train_loss": -3.8380444049835205, "global_step": 3652, "epoch": 86} {"train_loss": -3.9873647633053007, "global_step": 3653, "epoch": 86, "val_loss": 124860.640625} {"train_loss": -3.8893957138061523, "global_step": 3654, "epoch": 87} {"train_loss": -4.006496906280518, "global_step": 3655, "epoch": 87} {"train_loss": -4.08338737487793, "global_step": 3656, "epoch": 87} {"train_loss": -3.980571985244751, "global_step": 3657, "epoch": 87} {"train_loss": -4.223166465759277, "global_step": 3658, "epoch": 87} {"train_loss": -4.120198726654053, "global_step": 3659, "epoch": 87} {"train_loss": -4.236291408538818, "global_step": 3660, "epoch": 87} {"train_loss": -4.143469333648682, "global_step": 3661, "epoch": 87} {"train_loss": -3.9952449798583984, "global_step": 3662, "epoch": 87} {"train_loss": -4.207608699798584, "global_step": 3663, "epoch": 87} {"train_loss": -4.0026140213012695, "global_step": 3664, "epoch": 87} {"train_loss": -4.237344264984131, "global_step": 3665, "epoch": 87} {"train_loss": -4.177300453186035, "global_step": 3666, "epoch": 87} {"train_loss": -4.174465179443359, "global_step": 3667, "epoch": 87} {"train_loss": -4.178182601928711, "global_step": 3668, "epoch": 87} {"train_loss": -4.138633728027344, "global_step": 3669, "epoch": 87} {"train_loss": -4.283400535583496, "global_step": 3670, "epoch": 87} {"train_loss": -4.017989158630371, "global_step": 3671, "epoch": 87} {"train_loss": -4.053891181945801, "global_step": 3672, "epoch": 87} {"train_loss": -4.098893642425537, "global_step": 3673, "epoch": 87} {"train_loss": -4.169883728027344, "global_step": 3674, "epoch": 87} {"train_loss": -4.336566925048828, "global_step": 3675, "epoch": 87} {"train_loss": -4.127490997314453, "global_step": 3676, "epoch": 87} {"train_loss": -3.9362001419067383, "global_step": 3677, "epoch": 87} {"train_loss": -4.190108776092529, "global_step": 3678, "epoch": 87} {"train_loss": -4.166286468505859, "global_step": 3679, "epoch": 87} {"train_loss": -4.151215553283691, "global_step": 3680, "epoch": 87} {"train_loss": -4.06036901473999, "global_step": 3681, "epoch": 87} {"train_loss": -4.122350215911865, "global_step": 3682, "epoch": 87} {"train_loss": -4.196247100830078, "global_step": 3683, "epoch": 87} {"train_loss": -4.222021579742432, "global_step": 3684, "epoch": 87} {"train_loss": -4.0810465812683105, "global_step": 3685, "epoch": 87} {"train_loss": -4.2386393547058105, "global_step": 3686, "epoch": 87} {"train_loss": -4.212316989898682, "global_step": 3687, "epoch": 87} {"train_loss": -4.066817283630371, "global_step": 3688, "epoch": 87} {"train_loss": -4.0959320068359375, "global_step": 3689, "epoch": 87} {"train_loss": -4.32109260559082, "global_step": 3690, "epoch": 87} {"train_loss": -4.20327615737915, "global_step": 3691, "epoch": 87} {"train_loss": -4.266127586364746, "global_step": 3692, "epoch": 87} {"train_loss": -4.188470840454102, "global_step": 3693, "epoch": 87} {"train_loss": -4.236876964569092, "global_step": 3694, "epoch": 87} {"train_loss": -4.144841744786217, "global_step": 3695, "epoch": 87, "val_loss": 119869.171875} {"train_loss": -4.227672576904297, "global_step": 3696, "epoch": 88} {"train_loss": -4.335197448730469, "global_step": 3697, "epoch": 88} {"train_loss": -4.177874565124512, "global_step": 3698, "epoch": 88} {"train_loss": -4.296967029571533, "global_step": 3699, "epoch": 88} {"train_loss": -4.386896133422852, "global_step": 3700, "epoch": 88} {"train_loss": -4.165117263793945, "global_step": 3701, "epoch": 88} {"train_loss": -4.217166423797607, "global_step": 3702, "epoch": 88} {"train_loss": -4.409743309020996, "global_step": 3703, "epoch": 88} {"train_loss": -4.239246368408203, "global_step": 3704, "epoch": 88} {"train_loss": -4.281671047210693, "global_step": 3705, "epoch": 88} {"train_loss": -4.104235649108887, "global_step": 3706, "epoch": 88} {"train_loss": -4.169407844543457, "global_step": 3707, "epoch": 88} {"train_loss": -4.299100875854492, "global_step": 3708, "epoch": 88} {"train_loss": -4.242523670196533, "global_step": 3709, "epoch": 88} {"train_loss": -4.295993328094482, "global_step": 3710, "epoch": 88} {"train_loss": -4.216549396514893, "global_step": 3711, "epoch": 88} {"train_loss": -4.1584367752075195, "global_step": 3712, "epoch": 88} {"train_loss": -4.245545387268066, "global_step": 3713, "epoch": 88} {"train_loss": -4.182839393615723, "global_step": 3714, "epoch": 88} {"train_loss": -4.195346832275391, "global_step": 3715, "epoch": 88} {"train_loss": -4.297418594360352, "global_step": 3716, "epoch": 88} {"train_loss": -4.140498638153076, "global_step": 3717, "epoch": 88} {"train_loss": -4.140074729919434, "global_step": 3718, "epoch": 88} {"train_loss": -4.144598484039307, "global_step": 3719, "epoch": 88} {"train_loss": -4.155579566955566, "global_step": 3720, "epoch": 88} {"train_loss": -4.094788551330566, "global_step": 3721, "epoch": 88} {"train_loss": -4.254649639129639, "global_step": 3722, "epoch": 88} {"train_loss": -4.253129005432129, "global_step": 3723, "epoch": 88} {"train_loss": -4.15858268737793, "global_step": 3724, "epoch": 88} {"train_loss": -4.0007853507995605, "global_step": 3725, "epoch": 88} {"train_loss": -4.178036689758301, "global_step": 3726, "epoch": 88} {"train_loss": -4.052280902862549, "global_step": 3727, "epoch": 88} {"train_loss": -4.365489959716797, "global_step": 3728, "epoch": 88} {"train_loss": -4.04555606842041, "global_step": 3729, "epoch": 88} {"train_loss": -4.19972562789917, "global_step": 3730, "epoch": 88} {"train_loss": -4.34185791015625, "global_step": 3731, "epoch": 88} {"train_loss": -4.2513017654418945, "global_step": 3732, "epoch": 88} {"train_loss": -4.364923000335693, "global_step": 3733, "epoch": 88} {"train_loss": -4.206009387969971, "global_step": 3734, "epoch": 88} {"train_loss": -4.233330726623535, "global_step": 3735, "epoch": 88} {"train_loss": -4.279262542724609, "global_step": 3736, "epoch": 88} {"train_loss": -4.22208275113787, "global_step": 3737, "epoch": 88, "val_loss": 119248.6640625} {"train_loss": -4.252673149108887, "global_step": 3738, "epoch": 89} {"train_loss": -4.2983880043029785, "global_step": 3739, "epoch": 89} {"train_loss": -4.252992630004883, "global_step": 3740, "epoch": 89} {"train_loss": -4.267139911651611, "global_step": 3741, "epoch": 89} {"train_loss": -4.3073601722717285, "global_step": 3742, "epoch": 89} {"train_loss": -4.2156171798706055, "global_step": 3743, "epoch": 89} {"train_loss": -4.265674591064453, "global_step": 3744, "epoch": 89} {"train_loss": -4.254713535308838, "global_step": 3745, "epoch": 89} {"train_loss": -4.2507781982421875, "global_step": 3746, "epoch": 89} {"train_loss": -4.138044357299805, "global_step": 3747, "epoch": 89} {"train_loss": -4.1949334144592285, "global_step": 3748, "epoch": 89} {"train_loss": -4.284499168395996, "global_step": 3749, "epoch": 89} {"train_loss": -4.253602027893066, "global_step": 3750, "epoch": 89} {"train_loss": -4.18747615814209, "global_step": 3751, "epoch": 89} {"train_loss": -4.141467094421387, "global_step": 3752, "epoch": 89} {"train_loss": -4.163042068481445, "global_step": 3753, "epoch": 89} {"train_loss": -4.16475248336792, "global_step": 3754, "epoch": 89} {"train_loss": -4.223633766174316, "global_step": 3755, "epoch": 89} {"train_loss": -4.141209602355957, "global_step": 3756, "epoch": 89} {"train_loss": -4.249424457550049, "global_step": 3757, "epoch": 89} {"train_loss": -4.2136921882629395, "global_step": 3758, "epoch": 89} {"train_loss": -4.14046573638916, "global_step": 3759, "epoch": 89} {"train_loss": -4.126090049743652, "global_step": 3760, "epoch": 89} {"train_loss": -4.0616559982299805, "global_step": 3761, "epoch": 89} {"train_loss": -4.234898567199707, "global_step": 3762, "epoch": 89} {"train_loss": -4.357178688049316, "global_step": 3763, "epoch": 89} {"train_loss": -4.190570831298828, "global_step": 3764, "epoch": 89} {"train_loss": -4.109628677368164, "global_step": 3765, "epoch": 89} {"train_loss": -4.277304649353027, "global_step": 3766, "epoch": 89} {"train_loss": -4.1861724853515625, "global_step": 3767, "epoch": 89} {"train_loss": -4.193326473236084, "global_step": 3768, "epoch": 89} {"train_loss": -4.352150917053223, "global_step": 3769, "epoch": 89} {"train_loss": -4.237903118133545, "global_step": 3770, "epoch": 89} {"train_loss": -4.2735748291015625, "global_step": 3771, "epoch": 89} {"train_loss": -4.361664295196533, "global_step": 3772, "epoch": 89} {"train_loss": -4.21993350982666, "global_step": 3773, "epoch": 89} {"train_loss": -4.4118218421936035, "global_step": 3774, "epoch": 89} {"train_loss": -4.182866096496582, "global_step": 3775, "epoch": 89} {"train_loss": -4.085203170776367, "global_step": 3776, "epoch": 89} {"train_loss": -4.292798042297363, "global_step": 3777, "epoch": 89} {"train_loss": -4.150564193725586, "global_step": 3778, "epoch": 89} {"train_loss": -4.224117279052734, "global_step": 3779, "epoch": 89, "val_loss": 117240.3046875} {"train_loss": -4.3725786209106445, "global_step": 3780, "epoch": 90} {"train_loss": -4.221310615539551, "global_step": 3781, "epoch": 90} {"train_loss": -4.359006881713867, "global_step": 3782, "epoch": 90} {"train_loss": -4.242178916931152, "global_step": 3783, "epoch": 90} {"train_loss": -4.317724704742432, "global_step": 3784, "epoch": 90} {"train_loss": -4.357150077819824, "global_step": 3785, "epoch": 90} {"train_loss": -4.35699462890625, "global_step": 3786, "epoch": 90} {"train_loss": -4.342085838317871, "global_step": 3787, "epoch": 90} {"train_loss": -4.370586395263672, "global_step": 3788, "epoch": 90} {"train_loss": -4.318646430969238, "global_step": 3789, "epoch": 90} {"train_loss": -4.235749244689941, "global_step": 3790, "epoch": 90} {"train_loss": -4.2844390869140625, "global_step": 3791, "epoch": 90} {"train_loss": -4.246734619140625, "global_step": 3792, "epoch": 90} {"train_loss": -4.222332954406738, "global_step": 3793, "epoch": 90} {"train_loss": -4.3024420738220215, "global_step": 3794, "epoch": 90} {"train_loss": -4.252727031707764, "global_step": 3795, "epoch": 90} {"train_loss": -4.168401718139648, "global_step": 3796, "epoch": 90} {"train_loss": -4.284509658813477, "global_step": 3797, "epoch": 90} {"train_loss": -4.175748825073242, "global_step": 3798, "epoch": 90} {"train_loss": -4.191097259521484, "global_step": 3799, "epoch": 90} {"train_loss": -4.087221622467041, "global_step": 3800, "epoch": 90} {"train_loss": -4.256762504577637, "global_step": 3801, "epoch": 90} {"train_loss": -4.300635814666748, "global_step": 3802, "epoch": 90} {"train_loss": -4.152449131011963, "global_step": 3803, "epoch": 90} {"train_loss": -4.138086318969727, "global_step": 3804, "epoch": 90} {"train_loss": -4.332137107849121, "global_step": 3805, "epoch": 90} {"train_loss": -4.242730140686035, "global_step": 3806, "epoch": 90} {"train_loss": -4.215550422668457, "global_step": 3807, "epoch": 90} {"train_loss": -4.191082954406738, "global_step": 3808, "epoch": 90} {"train_loss": -4.208698272705078, "global_step": 3809, "epoch": 90} {"train_loss": -4.202770233154297, "global_step": 3810, "epoch": 90} {"train_loss": -4.225551605224609, "global_step": 3811, "epoch": 90} {"train_loss": -4.156885147094727, "global_step": 3812, "epoch": 90} {"train_loss": -4.364941596984863, "global_step": 3813, "epoch": 90} {"train_loss": -4.1649627685546875, "global_step": 3814, "epoch": 90} {"train_loss": -4.396347999572754, "global_step": 3815, "epoch": 90} {"train_loss": -4.2103681564331055, "global_step": 3816, "epoch": 90} {"train_loss": -4.320645332336426, "global_step": 3817, "epoch": 90} {"train_loss": -4.258199214935303, "global_step": 3818, "epoch": 90} {"train_loss": -4.238738536834717, "global_step": 3819, "epoch": 90} {"train_loss": -4.332147121429443, "global_step": 3820, "epoch": 90} {"train_loss": -4.2572496845608665, "global_step": 3821, "epoch": 90, "val_loss": 115140.8125} {"train_loss": -4.400010108947754, "global_step": 3822, "epoch": 91} {"train_loss": -4.212297439575195, "global_step": 3823, "epoch": 91} {"train_loss": -3.948002815246582, "global_step": 3824, "epoch": 91} {"train_loss": -4.300002574920654, "global_step": 3825, "epoch": 91} {"train_loss": -4.225616931915283, "global_step": 3826, "epoch": 91} {"train_loss": -3.989107847213745, "global_step": 3827, "epoch": 91} {"train_loss": -4.372165679931641, "global_step": 3828, "epoch": 91} {"train_loss": -4.175930976867676, "global_step": 3829, "epoch": 91} {"train_loss": -4.045431613922119, "global_step": 3830, "epoch": 91} {"train_loss": -4.145569324493408, "global_step": 3831, "epoch": 91} {"train_loss": -3.8457887172698975, "global_step": 3832, "epoch": 91} {"train_loss": -4.229696273803711, "global_step": 3833, "epoch": 91} {"train_loss": -4.006170749664307, "global_step": 3834, "epoch": 91} {"train_loss": -4.184053421020508, "global_step": 3835, "epoch": 91} {"train_loss": -4.056295394897461, "global_step": 3836, "epoch": 91} {"train_loss": -4.162777900695801, "global_step": 3837, "epoch": 91} {"train_loss": -4.280240058898926, "global_step": 3838, "epoch": 91} {"train_loss": -4.076879024505615, "global_step": 3839, "epoch": 91} {"train_loss": -4.381106853485107, "global_step": 3840, "epoch": 91} {"train_loss": -4.130900859832764, "global_step": 3841, "epoch": 91} {"train_loss": -4.246988296508789, "global_step": 3842, "epoch": 91} {"train_loss": -4.080392837524414, "global_step": 3843, "epoch": 91} {"train_loss": -4.263819694519043, "global_step": 3844, "epoch": 91} {"train_loss": -4.0880937576293945, "global_step": 3845, "epoch": 91} {"train_loss": -4.380160808563232, "global_step": 3846, "epoch": 91} {"train_loss": -4.30967903137207, "global_step": 3847, "epoch": 91} {"train_loss": -4.208216667175293, "global_step": 3848, "epoch": 91} {"train_loss": -4.229203701019287, "global_step": 3849, "epoch": 91} {"train_loss": -4.315471649169922, "global_step": 3850, "epoch": 91} {"train_loss": -4.276885032653809, "global_step": 3851, "epoch": 91} {"train_loss": -4.460047721862793, "global_step": 3852, "epoch": 91} {"train_loss": -4.193483829498291, "global_step": 3853, "epoch": 91} {"train_loss": -4.315159320831299, "global_step": 3854, "epoch": 91} {"train_loss": -4.314057350158691, "global_step": 3855, "epoch": 91} {"train_loss": -4.227532386779785, "global_step": 3856, "epoch": 91} {"train_loss": -4.291745185852051, "global_step": 3857, "epoch": 91} {"train_loss": -4.39146089553833, "global_step": 3858, "epoch": 91} {"train_loss": -4.314291000366211, "global_step": 3859, "epoch": 91} {"train_loss": -4.246907711029053, "global_step": 3860, "epoch": 91} {"train_loss": -4.321450233459473, "global_step": 3861, "epoch": 91} {"train_loss": -4.322018623352051, "global_step": 3862, "epoch": 91} {"train_loss": -4.219325167792184, "global_step": 3863, "epoch": 91, "val_loss": 115253.890625} {"train_loss": -4.267025947570801, "global_step": 3864, "epoch": 92} {"train_loss": -4.314332008361816, "global_step": 3865, "epoch": 92} {"train_loss": -4.056789398193359, "global_step": 3866, "epoch": 92} {"train_loss": -4.099583148956299, "global_step": 3867, "epoch": 92} {"train_loss": -4.130514144897461, "global_step": 3868, "epoch": 92} {"train_loss": -4.270071029663086, "global_step": 3869, "epoch": 92} {"train_loss": -4.244737148284912, "global_step": 3870, "epoch": 92} {"train_loss": -4.004175662994385, "global_step": 3871, "epoch": 92} {"train_loss": -4.184545993804932, "global_step": 3872, "epoch": 92} {"train_loss": -4.1809821128845215, "global_step": 3873, "epoch": 92} {"train_loss": -4.065002918243408, "global_step": 3874, "epoch": 92} {"train_loss": -4.154919147491455, "global_step": 3875, "epoch": 92} {"train_loss": -4.105581760406494, "global_step": 3876, "epoch": 92} {"train_loss": -4.042207717895508, "global_step": 3877, "epoch": 92} {"train_loss": -4.143855094909668, "global_step": 3878, "epoch": 92} {"train_loss": -4.073999404907227, "global_step": 3879, "epoch": 92} {"train_loss": -4.274501800537109, "global_step": 3880, "epoch": 92} {"train_loss": -3.9495410919189453, "global_step": 3881, "epoch": 92} {"train_loss": -4.27695894241333, "global_step": 3882, "epoch": 92} {"train_loss": -4.230558395385742, "global_step": 3883, "epoch": 92} {"train_loss": -4.10867977142334, "global_step": 3884, "epoch": 92} {"train_loss": -4.414899826049805, "global_step": 3885, "epoch": 92} {"train_loss": -4.262286186218262, "global_step": 3886, "epoch": 92} {"train_loss": -4.269394397735596, "global_step": 3887, "epoch": 92} {"train_loss": -4.274421691894531, "global_step": 3888, "epoch": 92} {"train_loss": -4.101373195648193, "global_step": 3889, "epoch": 92} {"train_loss": -4.302822113037109, "global_step": 3890, "epoch": 92} {"train_loss": -4.228766441345215, "global_step": 3891, "epoch": 92} {"train_loss": -4.201521396636963, "global_step": 3892, "epoch": 92} {"train_loss": -4.1879801750183105, "global_step": 3893, "epoch": 92} {"train_loss": -4.26511287689209, "global_step": 3894, "epoch": 92} {"train_loss": -4.349772930145264, "global_step": 3895, "epoch": 92} {"train_loss": -4.304852485656738, "global_step": 3896, "epoch": 92} {"train_loss": -4.493586540222168, "global_step": 3897, "epoch": 92} {"train_loss": -4.284428119659424, "global_step": 3898, "epoch": 92} {"train_loss": -4.358258247375488, "global_step": 3899, "epoch": 92} {"train_loss": -4.23111629486084, "global_step": 3900, "epoch": 92} {"train_loss": -4.323849678039551, "global_step": 3901, "epoch": 92} {"train_loss": -4.398305892944336, "global_step": 3902, "epoch": 92} {"train_loss": -4.3131232261657715, "global_step": 3903, "epoch": 92} {"train_loss": -4.425363540649414, "global_step": 3904, "epoch": 92} {"train_loss": -4.226758525485084, "global_step": 3905, "epoch": 92, "val_loss": 112827.5546875} {"train_loss": -4.268361568450928, "global_step": 3906, "epoch": 93} {"train_loss": -4.230185508728027, "global_step": 3907, "epoch": 93} {"train_loss": -4.331355094909668, "global_step": 3908, "epoch": 93} {"train_loss": -4.334447860717773, "global_step": 3909, "epoch": 93} {"train_loss": -4.389376163482666, "global_step": 3910, "epoch": 93} {"train_loss": -4.362705230712891, "global_step": 3911, "epoch": 93} {"train_loss": -4.429676532745361, "global_step": 3912, "epoch": 93} {"train_loss": -4.333527565002441, "global_step": 3913, "epoch": 93} {"train_loss": -4.2433624267578125, "global_step": 3914, "epoch": 93} {"train_loss": -4.34971809387207, "global_step": 3915, "epoch": 93} {"train_loss": -4.3741044998168945, "global_step": 3916, "epoch": 93} {"train_loss": -4.189237594604492, "global_step": 3917, "epoch": 93} {"train_loss": -4.423882484436035, "global_step": 3918, "epoch": 93} {"train_loss": -4.326793193817139, "global_step": 3919, "epoch": 93} {"train_loss": -4.17525577545166, "global_step": 3920, "epoch": 93} {"train_loss": -4.344583511352539, "global_step": 3921, "epoch": 93} {"train_loss": -4.242644309997559, "global_step": 3922, "epoch": 93} {"train_loss": -4.34758186340332, "global_step": 3923, "epoch": 93} {"train_loss": -4.402317047119141, "global_step": 3924, "epoch": 93} {"train_loss": -4.129195213317871, "global_step": 3925, "epoch": 93} {"train_loss": -4.309411525726318, "global_step": 3926, "epoch": 93} {"train_loss": -4.316470623016357, "global_step": 3927, "epoch": 93} {"train_loss": -4.456125259399414, "global_step": 3928, "epoch": 93} {"train_loss": -4.296385288238525, "global_step": 3929, "epoch": 93} {"train_loss": -3.930302381515503, "global_step": 3930, "epoch": 93} {"train_loss": -4.268786430358887, "global_step": 3931, "epoch": 93} {"train_loss": -4.072071075439453, "global_step": 3932, "epoch": 93} {"train_loss": -4.132716178894043, "global_step": 3933, "epoch": 93} {"train_loss": -4.347630500793457, "global_step": 3934, "epoch": 93} {"train_loss": -4.225286483764648, "global_step": 3935, "epoch": 93} {"train_loss": -4.301342010498047, "global_step": 3936, "epoch": 93} {"train_loss": -4.416537284851074, "global_step": 3937, "epoch": 93} {"train_loss": -4.478791236877441, "global_step": 3938, "epoch": 93} {"train_loss": -4.220612525939941, "global_step": 3939, "epoch": 93} {"train_loss": -4.358392715454102, "global_step": 3940, "epoch": 93} {"train_loss": -4.259736061096191, "global_step": 3941, "epoch": 93} {"train_loss": -4.099995136260986, "global_step": 3942, "epoch": 93} {"train_loss": -4.204558372497559, "global_step": 3943, "epoch": 93} {"train_loss": -4.2870097160339355, "global_step": 3944, "epoch": 93} {"train_loss": -4.434074401855469, "global_step": 3945, "epoch": 93} {"train_loss": -4.207036018371582, "global_step": 3946, "epoch": 93} {"train_loss": -4.286515877360389, "global_step": 3947, "epoch": 93, "val_loss": 115121.6796875} {"train_loss": -4.271557331085205, "global_step": 3948, "epoch": 94} {"train_loss": -4.340221881866455, "global_step": 3949, "epoch": 94} {"train_loss": -4.347688674926758, "global_step": 3950, "epoch": 94} {"train_loss": -4.362227439880371, "global_step": 3951, "epoch": 94} {"train_loss": -4.3864850997924805, "global_step": 3952, "epoch": 94} {"train_loss": -4.234454154968262, "global_step": 3953, "epoch": 94} {"train_loss": -4.374438762664795, "global_step": 3954, "epoch": 94} {"train_loss": -4.447848320007324, "global_step": 3955, "epoch": 94} {"train_loss": -4.360707759857178, "global_step": 3956, "epoch": 94} {"train_loss": -4.242967128753662, "global_step": 3957, "epoch": 94} {"train_loss": -4.377823829650879, "global_step": 3958, "epoch": 94} {"train_loss": -4.2791361808776855, "global_step": 3959, "epoch": 94} {"train_loss": -4.366704940795898, "global_step": 3960, "epoch": 94} {"train_loss": -4.05531120300293, "global_step": 3961, "epoch": 94} {"train_loss": -3.8526101112365723, "global_step": 3962, "epoch": 94} {"train_loss": -3.975940465927124, "global_step": 3963, "epoch": 94} {"train_loss": -4.042361259460449, "global_step": 3964, "epoch": 94} {"train_loss": -4.194855690002441, "global_step": 3965, "epoch": 94} {"train_loss": -4.121886253356934, "global_step": 3966, "epoch": 94} {"train_loss": -4.213062286376953, "global_step": 3967, "epoch": 94} {"train_loss": -4.170755386352539, "global_step": 3968, "epoch": 94} {"train_loss": -4.293420791625977, "global_step": 3969, "epoch": 94} {"train_loss": -4.1127777099609375, "global_step": 3970, "epoch": 94} {"train_loss": -4.277219772338867, "global_step": 3971, "epoch": 94} {"train_loss": -4.174886703491211, "global_step": 3972, "epoch": 94} {"train_loss": -4.191440582275391, "global_step": 3973, "epoch": 94} {"train_loss": -4.232710838317871, "global_step": 3974, "epoch": 94} {"train_loss": -4.07627534866333, "global_step": 3975, "epoch": 94} {"train_loss": -4.27363395690918, "global_step": 3976, "epoch": 94} {"train_loss": -4.207754611968994, "global_step": 3977, "epoch": 94} {"train_loss": -4.11384916305542, "global_step": 3978, "epoch": 94} {"train_loss": -4.432992935180664, "global_step": 3979, "epoch": 94} {"train_loss": -4.232400417327881, "global_step": 3980, "epoch": 94} {"train_loss": -4.224989891052246, "global_step": 3981, "epoch": 94} {"train_loss": -4.301427841186523, "global_step": 3982, "epoch": 94} {"train_loss": -4.3135986328125, "global_step": 3983, "epoch": 94} {"train_loss": -4.152388572692871, "global_step": 3984, "epoch": 94} {"train_loss": -4.362766265869141, "global_step": 3985, "epoch": 94} {"train_loss": -4.240201950073242, "global_step": 3986, "epoch": 94} {"train_loss": -4.251413345336914, "global_step": 3987, "epoch": 94} {"train_loss": -4.28446102142334, "global_step": 3988, "epoch": 94} {"train_loss": -4.240331212679545, "global_step": 3989, "epoch": 94, "val_loss": 113750.5546875} {"train_loss": -4.180891036987305, "global_step": 3990, "epoch": 95} {"train_loss": -4.330760955810547, "global_step": 3991, "epoch": 95} {"train_loss": -4.324128150939941, "global_step": 3992, "epoch": 95} {"train_loss": -4.365527629852295, "global_step": 3993, "epoch": 95} {"train_loss": -4.402538299560547, "global_step": 3994, "epoch": 95} {"train_loss": -4.294712066650391, "global_step": 3995, "epoch": 95} {"train_loss": -4.410466194152832, "global_step": 3996, "epoch": 95} {"train_loss": -4.296460151672363, "global_step": 3997, "epoch": 95} {"train_loss": -4.193568229675293, "global_step": 3998, "epoch": 95} {"train_loss": -4.313386917114258, "global_step": 3999, "epoch": 95} {"train_loss": -4.373125076293945, "global_step": 4000, "epoch": 95} {"train_loss": -4.2734904289245605, "global_step": 4001, "epoch": 95} {"train_loss": -4.362793922424316, "global_step": 4002, "epoch": 95} {"train_loss": -4.201645374298096, "global_step": 4003, "epoch": 95} {"train_loss": -4.405372619628906, "global_step": 4004, "epoch": 95} {"train_loss": -4.425357818603516, "global_step": 4005, "epoch": 95} {"train_loss": -4.289922714233398, "global_step": 4006, "epoch": 95} {"train_loss": -4.338903427124023, "global_step": 4007, "epoch": 95} {"train_loss": -4.36032772064209, "global_step": 4008, "epoch": 95} {"train_loss": -4.333561897277832, "global_step": 4009, "epoch": 95} {"train_loss": -4.326468467712402, "global_step": 4010, "epoch": 95} {"train_loss": -4.330925941467285, "global_step": 4011, "epoch": 95} {"train_loss": -4.25389289855957, "global_step": 4012, "epoch": 95} {"train_loss": -4.473659515380859, "global_step": 4013, "epoch": 95} {"train_loss": -4.0326924324035645, "global_step": 4014, "epoch": 95} {"train_loss": -4.316900253295898, "global_step": 4015, "epoch": 95} {"train_loss": -4.34683084487915, "global_step": 4016, "epoch": 95} {"train_loss": -4.219393730163574, "global_step": 4017, "epoch": 95} {"train_loss": -4.321233749389648, "global_step": 4018, "epoch": 95} {"train_loss": -4.343724727630615, "global_step": 4019, "epoch": 95} {"train_loss": -4.476134300231934, "global_step": 4020, "epoch": 95} {"train_loss": -4.347486972808838, "global_step": 4021, "epoch": 95} {"train_loss": -4.420684337615967, "global_step": 4022, "epoch": 95} {"train_loss": -4.290618896484375, "global_step": 4023, "epoch": 95} {"train_loss": -4.328207015991211, "global_step": 4024, "epoch": 95} {"train_loss": -4.24399995803833, "global_step": 4025, "epoch": 95} {"train_loss": -4.402187824249268, "global_step": 4026, "epoch": 95} {"train_loss": -4.34773063659668, "global_step": 4027, "epoch": 95} {"train_loss": -4.336579322814941, "global_step": 4028, "epoch": 95} {"train_loss": -4.439442157745361, "global_step": 4029, "epoch": 95} {"train_loss": -4.331242561340332, "global_step": 4030, "epoch": 95} {"train_loss": -4.322678270794096, "global_step": 4031, "epoch": 95, "val_loss": 110960.5625} {"train_loss": -4.450580596923828, "global_step": 4032, "epoch": 96} {"train_loss": -4.441403865814209, "global_step": 4033, "epoch": 96} {"train_loss": -4.20396089553833, "global_step": 4034, "epoch": 96} {"train_loss": -4.400497913360596, "global_step": 4035, "epoch": 96} {"train_loss": -4.312283039093018, "global_step": 4036, "epoch": 96} {"train_loss": -4.188629150390625, "global_step": 4037, "epoch": 96} {"train_loss": -4.320804595947266, "global_step": 4038, "epoch": 96} {"train_loss": -4.357479095458984, "global_step": 4039, "epoch": 96} {"train_loss": -4.385346412658691, "global_step": 4040, "epoch": 96} {"train_loss": -4.577948570251465, "global_step": 4041, "epoch": 96} {"train_loss": -4.338160514831543, "global_step": 4042, "epoch": 96} {"train_loss": -4.375125885009766, "global_step": 4043, "epoch": 96} {"train_loss": -4.511052131652832, "global_step": 4044, "epoch": 96} {"train_loss": -4.279508590698242, "global_step": 4045, "epoch": 96} {"train_loss": -4.353834629058838, "global_step": 4046, "epoch": 96} {"train_loss": -4.290923118591309, "global_step": 4047, "epoch": 96} {"train_loss": -4.32661247253418, "global_step": 4048, "epoch": 96} {"train_loss": -4.363524436950684, "global_step": 4049, "epoch": 96} {"train_loss": -4.375384330749512, "global_step": 4050, "epoch": 96} {"train_loss": -4.407856464385986, "global_step": 4051, "epoch": 96} {"train_loss": -4.396941184997559, "global_step": 4052, "epoch": 96} {"train_loss": -4.276049613952637, "global_step": 4053, "epoch": 96} {"train_loss": -4.3630051612854, "global_step": 4054, "epoch": 96} {"train_loss": -4.315634250640869, "global_step": 4055, "epoch": 96} {"train_loss": -4.327211856842041, "global_step": 4056, "epoch": 96} {"train_loss": -4.274328231811523, "global_step": 4057, "epoch": 96} {"train_loss": -4.429901123046875, "global_step": 4058, "epoch": 96} {"train_loss": -4.422427177429199, "global_step": 4059, "epoch": 96} {"train_loss": -4.271537780761719, "global_step": 4060, "epoch": 96} {"train_loss": -4.283968448638916, "global_step": 4061, "epoch": 96} {"train_loss": -4.375776290893555, "global_step": 4062, "epoch": 96} {"train_loss": -4.357212066650391, "global_step": 4063, "epoch": 96} {"train_loss": -4.321474075317383, "global_step": 4064, "epoch": 96} {"train_loss": -4.237994194030762, "global_step": 4065, "epoch": 96} {"train_loss": -4.251182556152344, "global_step": 4066, "epoch": 96} {"train_loss": -4.272946357727051, "global_step": 4067, "epoch": 96} {"train_loss": -4.305293083190918, "global_step": 4068, "epoch": 96} {"train_loss": -4.332808494567871, "global_step": 4069, "epoch": 96} {"train_loss": -4.398089408874512, "global_step": 4070, "epoch": 96} {"train_loss": -4.380491256713867, "global_step": 4071, "epoch": 96} {"train_loss": -4.331425189971924, "global_step": 4072, "epoch": 96} {"train_loss": -4.34510452406747, "global_step": 4073, "epoch": 96, "val_loss": 110548.90625} {"train_loss": -4.561397552490234, "global_step": 4074, "epoch": 97} {"train_loss": -4.259554862976074, "global_step": 4075, "epoch": 97} {"train_loss": -4.342352867126465, "global_step": 4076, "epoch": 97} {"train_loss": -4.374260902404785, "global_step": 4077, "epoch": 97} {"train_loss": -4.31182861328125, "global_step": 4078, "epoch": 97} {"train_loss": -4.227221965789795, "global_step": 4079, "epoch": 97} {"train_loss": -4.174386024475098, "global_step": 4080, "epoch": 97} {"train_loss": -4.381406307220459, "global_step": 4081, "epoch": 97} {"train_loss": -4.348172664642334, "global_step": 4082, "epoch": 97} {"train_loss": -4.192976951599121, "global_step": 4083, "epoch": 97} {"train_loss": -4.474699020385742, "global_step": 4084, "epoch": 97} {"train_loss": -4.290622711181641, "global_step": 4085, "epoch": 97} {"train_loss": -4.443023681640625, "global_step": 4086, "epoch": 97} {"train_loss": -4.345669746398926, "global_step": 4087, "epoch": 97} {"train_loss": -4.343103408813477, "global_step": 4088, "epoch": 97} {"train_loss": -4.309974670410156, "global_step": 4089, "epoch": 97} {"train_loss": -4.322689056396484, "global_step": 4090, "epoch": 97} {"train_loss": -4.419577598571777, "global_step": 4091, "epoch": 97} {"train_loss": -4.363986015319824, "global_step": 4092, "epoch": 97} {"train_loss": -4.404491424560547, "global_step": 4093, "epoch": 97} {"train_loss": -4.401390075683594, "global_step": 4094, "epoch": 97} {"train_loss": -4.176932334899902, "global_step": 4095, "epoch": 97} {"train_loss": -4.318568706512451, "global_step": 4096, "epoch": 97} {"train_loss": -4.259722709655762, "global_step": 4097, "epoch": 97} {"train_loss": -4.301766872406006, "global_step": 4098, "epoch": 97} {"train_loss": -4.218430519104004, "global_step": 4099, "epoch": 97} {"train_loss": -4.34123420715332, "global_step": 4100, "epoch": 97} {"train_loss": -4.297752380371094, "global_step": 4101, "epoch": 97} {"train_loss": -4.1475725173950195, "global_step": 4102, "epoch": 97} {"train_loss": -4.3611860275268555, "global_step": 4103, "epoch": 97} {"train_loss": -4.253938674926758, "global_step": 4104, "epoch": 97} {"train_loss": -4.1036224365234375, "global_step": 4105, "epoch": 97} {"train_loss": -4.328768730163574, "global_step": 4106, "epoch": 97} {"train_loss": -4.215356826782227, "global_step": 4107, "epoch": 97} {"train_loss": -4.178779125213623, "global_step": 4108, "epoch": 97} {"train_loss": -4.355501174926758, "global_step": 4109, "epoch": 97} {"train_loss": -4.077262878417969, "global_step": 4110, "epoch": 97} {"train_loss": -4.411156177520752, "global_step": 4111, "epoch": 97} {"train_loss": -4.289491176605225, "global_step": 4112, "epoch": 97} {"train_loss": -4.171902656555176, "global_step": 4113, "epoch": 97} {"train_loss": -4.410173416137695, "global_step": 4114, "epoch": 97} {"train_loss": -4.30131931531997, "global_step": 4115, "epoch": 97, "val_loss": 109843.96875} {"train_loss": -4.391794681549072, "global_step": 4116, "epoch": 98} {"train_loss": -4.0218329429626465, "global_step": 4117, "epoch": 98} {"train_loss": -4.353250503540039, "global_step": 4118, "epoch": 98} {"train_loss": -4.231903553009033, "global_step": 4119, "epoch": 98} {"train_loss": -4.268354415893555, "global_step": 4120, "epoch": 98} {"train_loss": -4.195835113525391, "global_step": 4121, "epoch": 98} {"train_loss": -4.263924598693848, "global_step": 4122, "epoch": 98} {"train_loss": -4.366663455963135, "global_step": 4123, "epoch": 98} {"train_loss": -4.433837890625, "global_step": 4124, "epoch": 98} {"train_loss": -4.414542198181152, "global_step": 4125, "epoch": 98} {"train_loss": -4.299315929412842, "global_step": 4126, "epoch": 98} {"train_loss": -4.350973129272461, "global_step": 4127, "epoch": 98} {"train_loss": -4.3402628898620605, "global_step": 4128, "epoch": 98} {"train_loss": -4.3946309089660645, "global_step": 4129, "epoch": 98} {"train_loss": -4.307459831237793, "global_step": 4130, "epoch": 98} {"train_loss": -4.350050926208496, "global_step": 4131, "epoch": 98} {"train_loss": -4.343059062957764, "global_step": 4132, "epoch": 98} {"train_loss": -4.467071056365967, "global_step": 4133, "epoch": 98} {"train_loss": -4.594250202178955, "global_step": 4134, "epoch": 98} {"train_loss": -4.391898155212402, "global_step": 4135, "epoch": 98} {"train_loss": -4.416007995605469, "global_step": 4136, "epoch": 98} {"train_loss": -4.231545925140381, "global_step": 4137, "epoch": 98} {"train_loss": -4.461867809295654, "global_step": 4138, "epoch": 98} {"train_loss": -4.327381610870361, "global_step": 4139, "epoch": 98} {"train_loss": -4.327265739440918, "global_step": 4140, "epoch": 98} {"train_loss": -4.491983413696289, "global_step": 4141, "epoch": 98} {"train_loss": -4.4224138259887695, "global_step": 4142, "epoch": 98} {"train_loss": -4.342836380004883, "global_step": 4143, "epoch": 98} {"train_loss": -4.2663397789001465, "global_step": 4144, "epoch": 98} {"train_loss": -4.123392105102539, "global_step": 4145, "epoch": 98} {"train_loss": -4.289137363433838, "global_step": 4146, "epoch": 98} {"train_loss": -4.282462120056152, "global_step": 4147, "epoch": 98} {"train_loss": -4.432272911071777, "global_step": 4148, "epoch": 98} {"train_loss": -4.223909378051758, "global_step": 4149, "epoch": 98} {"train_loss": -4.37111234664917, "global_step": 4150, "epoch": 98} {"train_loss": -4.324918270111084, "global_step": 4151, "epoch": 98} {"train_loss": -4.385997772216797, "global_step": 4152, "epoch": 98} {"train_loss": -4.300105094909668, "global_step": 4153, "epoch": 98} {"train_loss": -4.307074069976807, "global_step": 4154, "epoch": 98} {"train_loss": -4.304001331329346, "global_step": 4155, "epoch": 98} {"train_loss": -4.423522472381592, "global_step": 4156, "epoch": 98} {"train_loss": -4.336177417210171, "global_step": 4157, "epoch": 98, "val_loss": 108645.4140625} {"train_loss": -4.505725860595703, "global_step": 4158, "epoch": 99} {"train_loss": -4.4166364669799805, "global_step": 4159, "epoch": 99} {"train_loss": -4.346905708312988, "global_step": 4160, "epoch": 99} {"train_loss": -4.431149005889893, "global_step": 4161, "epoch": 99} {"train_loss": -4.431766510009766, "global_step": 4162, "epoch": 99} {"train_loss": -4.425138473510742, "global_step": 4163, "epoch": 99} {"train_loss": -4.4827165603637695, "global_step": 4164, "epoch": 99} {"train_loss": -4.319561004638672, "global_step": 4165, "epoch": 99} {"train_loss": -4.331299304962158, "global_step": 4166, "epoch": 99} {"train_loss": -4.408802509307861, "global_step": 4167, "epoch": 99} {"train_loss": -4.508120536804199, "global_step": 4168, "epoch": 99} {"train_loss": -4.50287389755249, "global_step": 4169, "epoch": 99} {"train_loss": -4.210678577423096, "global_step": 4170, "epoch": 99} {"train_loss": -4.428940773010254, "global_step": 4171, "epoch": 99} {"train_loss": -4.523602485656738, "global_step": 4172, "epoch": 99} {"train_loss": -4.329164981842041, "global_step": 4173, "epoch": 99} {"train_loss": -4.433884143829346, "global_step": 4174, "epoch": 99} {"train_loss": -4.420268535614014, "global_step": 4175, "epoch": 99} {"train_loss": -4.343052387237549, "global_step": 4176, "epoch": 99} {"train_loss": -4.44179105758667, "global_step": 4177, "epoch": 99} {"train_loss": -4.341034412384033, "global_step": 4178, "epoch": 99} {"train_loss": -4.39252233505249, "global_step": 4179, "epoch": 99} {"train_loss": -4.310555458068848, "global_step": 4180, "epoch": 99} {"train_loss": -4.376494884490967, "global_step": 4181, "epoch": 99} {"train_loss": -4.424023628234863, "global_step": 4182, "epoch": 99} {"train_loss": -4.374706268310547, "global_step": 4183, "epoch": 99} {"train_loss": -4.233746528625488, "global_step": 4184, "epoch": 99} {"train_loss": -4.416249752044678, "global_step": 4185, "epoch": 99} {"train_loss": -4.364673614501953, "global_step": 4186, "epoch": 99} {"train_loss": -4.274418354034424, "global_step": 4187, "epoch": 99} {"train_loss": -4.247522354125977, "global_step": 4188, "epoch": 99} {"train_loss": -4.43240213394165, "global_step": 4189, "epoch": 99} {"train_loss": -4.242094993591309, "global_step": 4190, "epoch": 99} {"train_loss": -4.315454959869385, "global_step": 4191, "epoch": 99} {"train_loss": -4.375833511352539, "global_step": 4192, "epoch": 99} {"train_loss": -4.490274906158447, "global_step": 4193, "epoch": 99} {"train_loss": -4.394156455993652, "global_step": 4194, "epoch": 99} {"train_loss": -4.211989402770996, "global_step": 4195, "epoch": 99} {"train_loss": -4.372896194458008, "global_step": 4196, "epoch": 99} {"train_loss": -4.231462478637695, "global_step": 4197, "epoch": 99} {"train_loss": -4.21544885635376, "global_step": 4198, "epoch": 99} {"train_loss": -4.372097094853719, "global_step": 4199, "epoch": 99, "val_loss": 108476.7578125} {"train_loss": -4.345939636230469, "global_step": 4200, "epoch": 100} {"train_loss": -4.256591796875, "global_step": 4201, "epoch": 100} {"train_loss": -4.290626525878906, "global_step": 4202, "epoch": 100} {"train_loss": -4.448722839355469, "global_step": 4203, "epoch": 100} {"train_loss": -4.401599407196045, "global_step": 4204, "epoch": 100} {"train_loss": -4.454918384552002, "global_step": 4205, "epoch": 100} {"train_loss": -4.329994201660156, "global_step": 4206, "epoch": 100} {"train_loss": -4.376577377319336, "global_step": 4207, "epoch": 100} {"train_loss": -4.472700595855713, "global_step": 4208, "epoch": 100} {"train_loss": -4.445634365081787, "global_step": 4209, "epoch": 100} {"train_loss": -4.374691486358643, "global_step": 4210, "epoch": 100} {"train_loss": -4.348046779632568, "global_step": 4211, "epoch": 100} {"train_loss": -4.336219787597656, "global_step": 4212, "epoch": 100} {"train_loss": -4.448582649230957, "global_step": 4213, "epoch": 100} {"train_loss": -4.4474077224731445, "global_step": 4214, "epoch": 100} {"train_loss": -4.4474334716796875, "global_step": 4215, "epoch": 100} {"train_loss": -4.314613342285156, "global_step": 4216, "epoch": 100} {"train_loss": -4.406153678894043, "global_step": 4217, "epoch": 100} {"train_loss": -4.362950325012207, "global_step": 4218, "epoch": 100} {"train_loss": -4.353525161743164, "global_step": 4219, "epoch": 100} {"train_loss": -4.378288745880127, "global_step": 4220, "epoch": 100} {"train_loss": -4.3938212394714355, "global_step": 4221, "epoch": 100} {"train_loss": -4.386905670166016, "global_step": 4222, "epoch": 100} {"train_loss": -4.489980697631836, "global_step": 4223, "epoch": 100} {"train_loss": -4.4496235847473145, "global_step": 4224, "epoch": 100} {"train_loss": -4.401437759399414, "global_step": 4225, "epoch": 100} {"train_loss": -4.428400993347168, "global_step": 4226, "epoch": 100} {"train_loss": -4.409091949462891, "global_step": 4227, "epoch": 100} {"train_loss": -4.368145942687988, "global_step": 4228, "epoch": 100} {"train_loss": -4.41349983215332, "global_step": 4229, "epoch": 100} {"train_loss": -4.525582313537598, "global_step": 4230, "epoch": 100} {"train_loss": -4.514606475830078, "global_step": 4231, "epoch": 100} {"train_loss": -4.388792037963867, "global_step": 4232, "epoch": 100} {"train_loss": -4.4377336502075195, "global_step": 4233, "epoch": 100} {"train_loss": -4.467596530914307, "global_step": 4234, "epoch": 100} {"train_loss": -4.411628723144531, "global_step": 4235, "epoch": 100} {"train_loss": -4.409010410308838, "global_step": 4236, "epoch": 100} {"train_loss": -4.301182746887207, "global_step": 4237, "epoch": 100} {"train_loss": -4.41997766494751, "global_step": 4238, "epoch": 100} {"train_loss": -4.474874973297119, "global_step": 4239, "epoch": 100} {"train_loss": -4.383757591247559, "global_step": 4240, "epoch": 100} {"train_loss": -4.399993896484375, "global_step": 4241, "epoch": 100, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.014442519011309843, "train/sim_max_reward_2": 0.29745610200857636, "train/sim_max_reward_3": 0.13731518690905306, "train/sim_max_reward_4": 0.1889848815126889, "train/sim_max_reward_5": 0.6811656392348563, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.1803459165878376, "test/sim_max_reward_4400002": 0.1970916460312713, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.42697182538105705, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.4933788590286422, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.38451300751292744, "test/sim_max_reward_4400009": 0.14558047789702463, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.3000500958194678, "test/sim_max_reward_4400012": 0.15800576648515058, "test/sim_max_reward_4400013": 0.1526350609681335, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2819869714668124, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.5992455483430951, "test/sim_max_reward_4400028": 0.37991251805978854, "test/sim_max_reward_4400029": 0.0017743440180097525, "test/sim_max_reward_4400030": 0.0620701476556299, "test/sim_max_reward_4400031": 1.2890978942579066e-05, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.12207621325612739, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.48153852215811704, "test/sim_max_reward_4400036": 0.36697528876923374, "test/sim_max_reward_4400037": 0.09417543245759505, "test/sim_max_reward_4400038": 0.17737218272572744, "test/sim_max_reward_4400039": 0.5018595443939142, "test/sim_max_reward_4400040": 0.00012906409800388652, "test/sim_max_reward_4400041": 0.05754084889364093, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.2743298595238854, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.2029139165357663, "test/sim_max_reward_4400047": 0.16644817544984147, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.2516103042137561, "test/mean_score": 0.14253594603373748, "val_loss": 106990.171875} {"train_loss": -4.513172626495361, "global_step": 4242, "epoch": 101} {"train_loss": -4.304441452026367, "global_step": 4243, "epoch": 101} {"train_loss": -4.417471885681152, "global_step": 4244, "epoch": 101} {"train_loss": -4.346195220947266, "global_step": 4245, "epoch": 101} {"train_loss": -4.357621669769287, "global_step": 4246, "epoch": 101} {"train_loss": -4.583413124084473, "global_step": 4247, "epoch": 101} {"train_loss": -4.467462062835693, "global_step": 4248, "epoch": 101} {"train_loss": -4.286530494689941, "global_step": 4249, "epoch": 101} {"train_loss": -4.44586181640625, "global_step": 4250, "epoch": 101} {"train_loss": -4.442750453948975, "global_step": 4251, "epoch": 101} {"train_loss": -4.30250358581543, "global_step": 4252, "epoch": 101} {"train_loss": -4.427087783813477, "global_step": 4253, "epoch": 101} {"train_loss": -4.46269416809082, "global_step": 4254, "epoch": 101} {"train_loss": -4.440427780151367, "global_step": 4255, "epoch": 101} {"train_loss": -4.378878593444824, "global_step": 4256, "epoch": 101} {"train_loss": -4.4114885330200195, "global_step": 4257, "epoch": 101} {"train_loss": -4.234889507293701, "global_step": 4258, "epoch": 101} {"train_loss": -4.468761920928955, "global_step": 4259, "epoch": 101} {"train_loss": -4.470330238342285, "global_step": 4260, "epoch": 101} {"train_loss": -4.299881935119629, "global_step": 4261, "epoch": 101} {"train_loss": -4.4626784324646, "global_step": 4262, "epoch": 101} {"train_loss": -4.575572490692139, "global_step": 4263, "epoch": 101} {"train_loss": -4.38676643371582, "global_step": 4264, "epoch": 101} {"train_loss": -4.244836807250977, "global_step": 4265, "epoch": 101} {"train_loss": -4.264298439025879, "global_step": 4266, "epoch": 101} {"train_loss": -4.472883701324463, "global_step": 4267, "epoch": 101} {"train_loss": -4.3631486892700195, "global_step": 4268, "epoch": 101} {"train_loss": -4.367833137512207, "global_step": 4269, "epoch": 101} {"train_loss": -4.178592205047607, "global_step": 4270, "epoch": 101} {"train_loss": -4.4220147132873535, "global_step": 4271, "epoch": 101} {"train_loss": -4.374024391174316, "global_step": 4272, "epoch": 101} {"train_loss": -4.466833591461182, "global_step": 4273, "epoch": 101} {"train_loss": -4.519258499145508, "global_step": 4274, "epoch": 101} {"train_loss": -4.36121940612793, "global_step": 4275, "epoch": 101} {"train_loss": -4.495079040527344, "global_step": 4276, "epoch": 101} {"train_loss": -4.396973609924316, "global_step": 4277, "epoch": 101} {"train_loss": -4.428493022918701, "global_step": 4278, "epoch": 101} {"train_loss": -4.276928901672363, "global_step": 4279, "epoch": 101} {"train_loss": -4.37355899810791, "global_step": 4280, "epoch": 101} {"train_loss": -4.13209867477417, "global_step": 4281, "epoch": 101} {"train_loss": -4.037446022033691, "global_step": 4282, "epoch": 101} {"train_loss": -4.381699721018474, "global_step": 4283, "epoch": 101, "val_loss": 113584.078125} {"train_loss": -4.124354362487793, "global_step": 4284, "epoch": 102} {"train_loss": -4.1618194580078125, "global_step": 4285, "epoch": 102} {"train_loss": -4.53021240234375, "global_step": 4286, "epoch": 102} {"train_loss": -4.274286270141602, "global_step": 4287, "epoch": 102} {"train_loss": -4.462808609008789, "global_step": 4288, "epoch": 102} {"train_loss": -4.239374160766602, "global_step": 4289, "epoch": 102} {"train_loss": -4.2699666023254395, "global_step": 4290, "epoch": 102} {"train_loss": -4.093904972076416, "global_step": 4291, "epoch": 102} {"train_loss": -4.401012420654297, "global_step": 4292, "epoch": 102} {"train_loss": -4.330458641052246, "global_step": 4293, "epoch": 102} {"train_loss": -4.324934959411621, "global_step": 4294, "epoch": 102} {"train_loss": -4.182265281677246, "global_step": 4295, "epoch": 102} {"train_loss": -4.263944625854492, "global_step": 4296, "epoch": 102} {"train_loss": -4.2286481857299805, "global_step": 4297, "epoch": 102} {"train_loss": -4.429106712341309, "global_step": 4298, "epoch": 102} {"train_loss": -4.40043830871582, "global_step": 4299, "epoch": 102} {"train_loss": -4.282614707946777, "global_step": 4300, "epoch": 102} {"train_loss": -4.1086745262146, "global_step": 4301, "epoch": 102} {"train_loss": -4.336945533752441, "global_step": 4302, "epoch": 102} {"train_loss": -4.414105415344238, "global_step": 4303, "epoch": 102} {"train_loss": -4.238277912139893, "global_step": 4304, "epoch": 102} {"train_loss": -4.280988693237305, "global_step": 4305, "epoch": 102} {"train_loss": -4.484971046447754, "global_step": 4306, "epoch": 102} {"train_loss": -4.415824890136719, "global_step": 4307, "epoch": 102} {"train_loss": -4.348453521728516, "global_step": 4308, "epoch": 102} {"train_loss": -4.166286945343018, "global_step": 4309, "epoch": 102} {"train_loss": -4.524663925170898, "global_step": 4310, "epoch": 102} {"train_loss": -4.319189071655273, "global_step": 4311, "epoch": 102} {"train_loss": -4.369086265563965, "global_step": 4312, "epoch": 102} {"train_loss": -4.324115753173828, "global_step": 4313, "epoch": 102} {"train_loss": -4.531251907348633, "global_step": 4314, "epoch": 102} {"train_loss": -4.298330307006836, "global_step": 4315, "epoch": 102} {"train_loss": -4.411844253540039, "global_step": 4316, "epoch": 102} {"train_loss": -4.629420757293701, "global_step": 4317, "epoch": 102} {"train_loss": -4.353404998779297, "global_step": 4318, "epoch": 102} {"train_loss": -4.308302879333496, "global_step": 4319, "epoch": 102} {"train_loss": -4.522556304931641, "global_step": 4320, "epoch": 102} {"train_loss": -4.263535022735596, "global_step": 4321, "epoch": 102} {"train_loss": -4.213330268859863, "global_step": 4322, "epoch": 102} {"train_loss": -4.305069923400879, "global_step": 4323, "epoch": 102} {"train_loss": -4.372226715087891, "global_step": 4324, "epoch": 102} {"train_loss": -4.330377317610241, "global_step": 4325, "epoch": 102, "val_loss": 108816.046875} {"train_loss": -4.37232780456543, "global_step": 4326, "epoch": 103} {"train_loss": -4.437880992889404, "global_step": 4327, "epoch": 103} {"train_loss": -4.437793254852295, "global_step": 4328, "epoch": 103} {"train_loss": -4.594149589538574, "global_step": 4329, "epoch": 103} {"train_loss": -4.381219863891602, "global_step": 4330, "epoch": 103} {"train_loss": -4.449243068695068, "global_step": 4331, "epoch": 103} {"train_loss": -4.296988487243652, "global_step": 4332, "epoch": 103} {"train_loss": -4.465944766998291, "global_step": 4333, "epoch": 103} {"train_loss": -4.298346042633057, "global_step": 4334, "epoch": 103} {"train_loss": -4.319021224975586, "global_step": 4335, "epoch": 103} {"train_loss": -4.300038814544678, "global_step": 4336, "epoch": 103} {"train_loss": -4.54155969619751, "global_step": 4337, "epoch": 103} {"train_loss": -4.407809257507324, "global_step": 4338, "epoch": 103} {"train_loss": -4.14951229095459, "global_step": 4339, "epoch": 103} {"train_loss": -4.311866760253906, "global_step": 4340, "epoch": 103} {"train_loss": -4.394949913024902, "global_step": 4341, "epoch": 103} {"train_loss": -4.2451372146606445, "global_step": 4342, "epoch": 103} {"train_loss": -4.3448991775512695, "global_step": 4343, "epoch": 103} {"train_loss": -4.437288284301758, "global_step": 4344, "epoch": 103} {"train_loss": -4.331198215484619, "global_step": 4345, "epoch": 103} {"train_loss": -4.396883010864258, "global_step": 4346, "epoch": 103} {"train_loss": -4.3651652336120605, "global_step": 4347, "epoch": 103} {"train_loss": -4.415642738342285, "global_step": 4348, "epoch": 103} {"train_loss": -4.392861366271973, "global_step": 4349, "epoch": 103} {"train_loss": -4.469089984893799, "global_step": 4350, "epoch": 103} {"train_loss": -4.361835479736328, "global_step": 4351, "epoch": 103} {"train_loss": -4.341765403747559, "global_step": 4352, "epoch": 103} {"train_loss": -4.4238176345825195, "global_step": 4353, "epoch": 103} {"train_loss": -4.413596153259277, "global_step": 4354, "epoch": 103} {"train_loss": -4.37812614440918, "global_step": 4355, "epoch": 103} {"train_loss": -4.430879592895508, "global_step": 4356, "epoch": 103} {"train_loss": -4.565752029418945, "global_step": 4357, "epoch": 103} {"train_loss": -4.351386547088623, "global_step": 4358, "epoch": 103} {"train_loss": -4.447009563446045, "global_step": 4359, "epoch": 103} {"train_loss": -4.554149627685547, "global_step": 4360, "epoch": 103} {"train_loss": -4.45156192779541, "global_step": 4361, "epoch": 103} {"train_loss": -4.455113410949707, "global_step": 4362, "epoch": 103} {"train_loss": -4.514044284820557, "global_step": 4363, "epoch": 103} {"train_loss": -4.523468494415283, "global_step": 4364, "epoch": 103} {"train_loss": -4.4572649002075195, "global_step": 4365, "epoch": 103} {"train_loss": -4.432940483093262, "global_step": 4366, "epoch": 103} {"train_loss": -4.404857703617641, "global_step": 4367, "epoch": 103, "val_loss": 105963.7265625} {"train_loss": -4.3888349533081055, "global_step": 4368, "epoch": 104} {"train_loss": -4.566839218139648, "global_step": 4369, "epoch": 104} {"train_loss": -4.504755020141602, "global_step": 4370, "epoch": 104} {"train_loss": -4.572340488433838, "global_step": 4371, "epoch": 104} {"train_loss": -4.4991655349731445, "global_step": 4372, "epoch": 104} {"train_loss": -4.5262675285339355, "global_step": 4373, "epoch": 104} {"train_loss": -4.56695556640625, "global_step": 4374, "epoch": 104} {"train_loss": -4.617833614349365, "global_step": 4375, "epoch": 104} {"train_loss": -4.594952583312988, "global_step": 4376, "epoch": 104} {"train_loss": -4.47292423248291, "global_step": 4377, "epoch": 104} {"train_loss": -4.363296985626221, "global_step": 4378, "epoch": 104} {"train_loss": -4.1472272872924805, "global_step": 4379, "epoch": 104} {"train_loss": -4.270747184753418, "global_step": 4380, "epoch": 104} {"train_loss": -4.234687805175781, "global_step": 4381, "epoch": 104} {"train_loss": -4.310824394226074, "global_step": 4382, "epoch": 104} {"train_loss": -4.510140419006348, "global_step": 4383, "epoch": 104} {"train_loss": -4.3526387214660645, "global_step": 4384, "epoch": 104} {"train_loss": -4.295442581176758, "global_step": 4385, "epoch": 104} {"train_loss": -4.384795188903809, "global_step": 4386, "epoch": 104} {"train_loss": -4.328238487243652, "global_step": 4387, "epoch": 104} {"train_loss": -4.304466247558594, "global_step": 4388, "epoch": 104} {"train_loss": -4.306572914123535, "global_step": 4389, "epoch": 104} {"train_loss": -4.326944828033447, "global_step": 4390, "epoch": 104} {"train_loss": -4.376779556274414, "global_step": 4391, "epoch": 104} {"train_loss": -4.380632400512695, "global_step": 4392, "epoch": 104} {"train_loss": -4.402006149291992, "global_step": 4393, "epoch": 104} {"train_loss": -4.433514595031738, "global_step": 4394, "epoch": 104} {"train_loss": -4.209436893463135, "global_step": 4395, "epoch": 104} {"train_loss": -4.4606122970581055, "global_step": 4396, "epoch": 104} {"train_loss": -4.42133903503418, "global_step": 4397, "epoch": 104} {"train_loss": -4.246954441070557, "global_step": 4398, "epoch": 104} {"train_loss": -4.441712856292725, "global_step": 4399, "epoch": 104} {"train_loss": -4.381125450134277, "global_step": 4400, "epoch": 104} {"train_loss": -4.44382381439209, "global_step": 4401, "epoch": 104} {"train_loss": -4.478696823120117, "global_step": 4402, "epoch": 104} {"train_loss": -4.662814140319824, "global_step": 4403, "epoch": 104} {"train_loss": -4.445178985595703, "global_step": 4404, "epoch": 104} {"train_loss": -4.479717254638672, "global_step": 4405, "epoch": 104} {"train_loss": -4.490828514099121, "global_step": 4406, "epoch": 104} {"train_loss": -4.364460468292236, "global_step": 4407, "epoch": 104} {"train_loss": -4.343448162078857, "global_step": 4408, "epoch": 104} {"train_loss": -4.415307919184367, "global_step": 4409, "epoch": 104, "val_loss": 105109.625} {"train_loss": -4.469487190246582, "global_step": 4410, "epoch": 105} {"train_loss": -4.42888069152832, "global_step": 4411, "epoch": 105} {"train_loss": -4.421231269836426, "global_step": 4412, "epoch": 105} {"train_loss": -4.49069881439209, "global_step": 4413, "epoch": 105} {"train_loss": -4.533238410949707, "global_step": 4414, "epoch": 105} {"train_loss": -4.276069641113281, "global_step": 4415, "epoch": 105} {"train_loss": -4.545836448669434, "global_step": 4416, "epoch": 105} {"train_loss": -4.693449020385742, "global_step": 4417, "epoch": 105} {"train_loss": -4.438218593597412, "global_step": 4418, "epoch": 105} {"train_loss": -4.614710330963135, "global_step": 4419, "epoch": 105} {"train_loss": -4.397439002990723, "global_step": 4420, "epoch": 105} {"train_loss": -4.338054656982422, "global_step": 4421, "epoch": 105} {"train_loss": -4.462594509124756, "global_step": 4422, "epoch": 105} {"train_loss": -4.533842086791992, "global_step": 4423, "epoch": 105} {"train_loss": -4.308454513549805, "global_step": 4424, "epoch": 105} {"train_loss": -4.465001106262207, "global_step": 4425, "epoch": 105} {"train_loss": -4.4251227378845215, "global_step": 4426, "epoch": 105} {"train_loss": -4.376461982727051, "global_step": 4427, "epoch": 105} {"train_loss": -4.37158727645874, "global_step": 4428, "epoch": 105} {"train_loss": -4.381011009216309, "global_step": 4429, "epoch": 105} {"train_loss": -4.584100723266602, "global_step": 4430, "epoch": 105} {"train_loss": -4.398038387298584, "global_step": 4431, "epoch": 105} {"train_loss": -4.3551025390625, "global_step": 4432, "epoch": 105} {"train_loss": -4.318548202514648, "global_step": 4433, "epoch": 105} {"train_loss": -4.454334259033203, "global_step": 4434, "epoch": 105} {"train_loss": -4.234859466552734, "global_step": 4435, "epoch": 105} {"train_loss": -4.128599166870117, "global_step": 4436, "epoch": 105} {"train_loss": -4.409934997558594, "global_step": 4437, "epoch": 105} {"train_loss": -4.227133274078369, "global_step": 4438, "epoch": 105} {"train_loss": -4.268344879150391, "global_step": 4439, "epoch": 105} {"train_loss": -4.1562819480896, "global_step": 4440, "epoch": 105} {"train_loss": -4.4752726554870605, "global_step": 4441, "epoch": 105} {"train_loss": -4.342100143432617, "global_step": 4442, "epoch": 105} {"train_loss": -4.328603267669678, "global_step": 4443, "epoch": 105} {"train_loss": -4.458013534545898, "global_step": 4444, "epoch": 105} {"train_loss": -4.478829383850098, "global_step": 4445, "epoch": 105} {"train_loss": -4.614503860473633, "global_step": 4446, "epoch": 105} {"train_loss": -4.391330718994141, "global_step": 4447, "epoch": 105} {"train_loss": -4.6348443031311035, "global_step": 4448, "epoch": 105} {"train_loss": -4.41786003112793, "global_step": 4449, "epoch": 105} {"train_loss": -4.445940017700195, "global_step": 4450, "epoch": 105} {"train_loss": -4.417951436269851, "global_step": 4451, "epoch": 105, "val_loss": 104774.5} {"train_loss": -4.48183536529541, "global_step": 4452, "epoch": 106} {"train_loss": -4.337483882904053, "global_step": 4453, "epoch": 106} {"train_loss": -4.516604423522949, "global_step": 4454, "epoch": 106} {"train_loss": -4.540250778198242, "global_step": 4455, "epoch": 106} {"train_loss": -4.365970611572266, "global_step": 4456, "epoch": 106} {"train_loss": -4.439173221588135, "global_step": 4457, "epoch": 106} {"train_loss": -4.5296220779418945, "global_step": 4458, "epoch": 106} {"train_loss": -4.519108772277832, "global_step": 4459, "epoch": 106} {"train_loss": -4.389040946960449, "global_step": 4460, "epoch": 106} {"train_loss": -4.52655029296875, "global_step": 4461, "epoch": 106} {"train_loss": -4.565361976623535, "global_step": 4462, "epoch": 106} {"train_loss": -4.506513595581055, "global_step": 4463, "epoch": 106} {"train_loss": -4.453965187072754, "global_step": 4464, "epoch": 106} {"train_loss": -4.383657932281494, "global_step": 4465, "epoch": 106} {"train_loss": -4.279285430908203, "global_step": 4466, "epoch": 106} {"train_loss": -4.396111488342285, "global_step": 4467, "epoch": 106} {"train_loss": -4.5221662521362305, "global_step": 4468, "epoch": 106} {"train_loss": -4.401364803314209, "global_step": 4469, "epoch": 106} {"train_loss": -4.373796463012695, "global_step": 4470, "epoch": 106} {"train_loss": -4.364986896514893, "global_step": 4471, "epoch": 106} {"train_loss": -4.470795631408691, "global_step": 4472, "epoch": 106} {"train_loss": -4.296483993530273, "global_step": 4473, "epoch": 106} {"train_loss": -4.441130638122559, "global_step": 4474, "epoch": 106} {"train_loss": -4.368646621704102, "global_step": 4475, "epoch": 106} {"train_loss": -4.328851699829102, "global_step": 4476, "epoch": 106} {"train_loss": -4.349480152130127, "global_step": 4477, "epoch": 106} {"train_loss": -4.231086254119873, "global_step": 4478, "epoch": 106} {"train_loss": -4.299744606018066, "global_step": 4479, "epoch": 106} {"train_loss": -4.512876987457275, "global_step": 4480, "epoch": 106} {"train_loss": -4.305323600769043, "global_step": 4481, "epoch": 106} {"train_loss": -4.4964704513549805, "global_step": 4482, "epoch": 106} {"train_loss": -4.5885114669799805, "global_step": 4483, "epoch": 106} {"train_loss": -4.284862518310547, "global_step": 4484, "epoch": 106} {"train_loss": -4.474177360534668, "global_step": 4485, "epoch": 106} {"train_loss": -4.4754638671875, "global_step": 4486, "epoch": 106} {"train_loss": -4.3998870849609375, "global_step": 4487, "epoch": 106} {"train_loss": -4.395455837249756, "global_step": 4488, "epoch": 106} {"train_loss": -4.324681282043457, "global_step": 4489, "epoch": 106} {"train_loss": -4.480224609375, "global_step": 4490, "epoch": 106} {"train_loss": -4.432126998901367, "global_step": 4491, "epoch": 106} {"train_loss": -4.427462577819824, "global_step": 4492, "epoch": 106} {"train_loss": -4.423298756281535, "global_step": 4493, "epoch": 106, "val_loss": 104610.6796875} {"train_loss": -4.5976481437683105, "global_step": 4494, "epoch": 107} {"train_loss": -4.603635787963867, "global_step": 4495, "epoch": 107} {"train_loss": -4.413025856018066, "global_step": 4496, "epoch": 107} {"train_loss": -4.426601409912109, "global_step": 4497, "epoch": 107} {"train_loss": -4.571406364440918, "global_step": 4498, "epoch": 107} {"train_loss": -4.347378253936768, "global_step": 4499, "epoch": 107} {"train_loss": -4.576597213745117, "global_step": 4500, "epoch": 107} {"train_loss": -4.541761875152588, "global_step": 4501, "epoch": 107} {"train_loss": -4.580617904663086, "global_step": 4502, "epoch": 107} {"train_loss": -4.477949619293213, "global_step": 4503, "epoch": 107} {"train_loss": -4.623518943786621, "global_step": 4504, "epoch": 107} {"train_loss": -4.49538516998291, "global_step": 4505, "epoch": 107} {"train_loss": -4.432336330413818, "global_step": 4506, "epoch": 107} {"train_loss": -4.515894889831543, "global_step": 4507, "epoch": 107} {"train_loss": -4.509499549865723, "global_step": 4508, "epoch": 107} {"train_loss": -4.460041046142578, "global_step": 4509, "epoch": 107} {"train_loss": -4.651730060577393, "global_step": 4510, "epoch": 107} {"train_loss": -4.42380428314209, "global_step": 4511, "epoch": 107} {"train_loss": -4.486080169677734, "global_step": 4512, "epoch": 107} {"train_loss": -4.516400337219238, "global_step": 4513, "epoch": 107} {"train_loss": -4.4601850509643555, "global_step": 4514, "epoch": 107} {"train_loss": -4.479228496551514, "global_step": 4515, "epoch": 107} {"train_loss": -4.538672924041748, "global_step": 4516, "epoch": 107} {"train_loss": -4.397157669067383, "global_step": 4517, "epoch": 107} {"train_loss": -4.527838706970215, "global_step": 4518, "epoch": 107} {"train_loss": -4.52907657623291, "global_step": 4519, "epoch": 107} {"train_loss": -4.642282009124756, "global_step": 4520, "epoch": 107} {"train_loss": -4.512471675872803, "global_step": 4521, "epoch": 107} {"train_loss": -4.444990158081055, "global_step": 4522, "epoch": 107} {"train_loss": -4.542119026184082, "global_step": 4523, "epoch": 107} {"train_loss": -4.514570236206055, "global_step": 4524, "epoch": 107} {"train_loss": -4.479808807373047, "global_step": 4525, "epoch": 107} {"train_loss": -4.466385364532471, "global_step": 4526, "epoch": 107} {"train_loss": -4.321458339691162, "global_step": 4527, "epoch": 107} {"train_loss": -4.452159404754639, "global_step": 4528, "epoch": 107} {"train_loss": -4.6202898025512695, "global_step": 4529, "epoch": 107} {"train_loss": -4.392393112182617, "global_step": 4530, "epoch": 107} {"train_loss": -4.449481010437012, "global_step": 4531, "epoch": 107} {"train_loss": -4.37437629699707, "global_step": 4532, "epoch": 107} {"train_loss": -4.433594703674316, "global_step": 4533, "epoch": 107} {"train_loss": -4.410825729370117, "global_step": 4534, "epoch": 107} {"train_loss": -4.495827674865723, "global_step": 4535, "epoch": 107, "val_loss": 105037.515625} {"train_loss": -4.388005256652832, "global_step": 4536, "epoch": 108} {"train_loss": -4.4163289070129395, "global_step": 4537, "epoch": 108} {"train_loss": -4.55167293548584, "global_step": 4538, "epoch": 108} {"train_loss": -4.584444999694824, "global_step": 4539, "epoch": 108} {"train_loss": -4.430193901062012, "global_step": 4540, "epoch": 108} {"train_loss": -4.341100692749023, "global_step": 4541, "epoch": 108} {"train_loss": -4.3588032722473145, "global_step": 4542, "epoch": 108} {"train_loss": -4.556680679321289, "global_step": 4543, "epoch": 108} {"train_loss": -4.3567304611206055, "global_step": 4544, "epoch": 108} {"train_loss": -4.362983703613281, "global_step": 4545, "epoch": 108} {"train_loss": -4.513940334320068, "global_step": 4546, "epoch": 108} {"train_loss": -4.551051139831543, "global_step": 4547, "epoch": 108} {"train_loss": -4.0272722244262695, "global_step": 4548, "epoch": 108} {"train_loss": -4.564712047576904, "global_step": 4549, "epoch": 108} {"train_loss": -4.499811172485352, "global_step": 4550, "epoch": 108} {"train_loss": -4.389129638671875, "global_step": 4551, "epoch": 108} {"train_loss": -4.628198623657227, "global_step": 4552, "epoch": 108} {"train_loss": -4.334900856018066, "global_step": 4553, "epoch": 108} {"train_loss": -4.552829265594482, "global_step": 4554, "epoch": 108} {"train_loss": -4.496339797973633, "global_step": 4555, "epoch": 108} {"train_loss": -4.377080917358398, "global_step": 4556, "epoch": 108} {"train_loss": -4.336432456970215, "global_step": 4557, "epoch": 108} {"train_loss": -4.46469783782959, "global_step": 4558, "epoch": 108} {"train_loss": -4.297119617462158, "global_step": 4559, "epoch": 108} {"train_loss": -4.722124099731445, "global_step": 4560, "epoch": 108} {"train_loss": -4.271446228027344, "global_step": 4561, "epoch": 108} {"train_loss": -4.370166778564453, "global_step": 4562, "epoch": 108} {"train_loss": -4.340348720550537, "global_step": 4563, "epoch": 108} {"train_loss": -4.238874435424805, "global_step": 4564, "epoch": 108} {"train_loss": -4.468051910400391, "global_step": 4565, "epoch": 108} {"train_loss": -4.295633316040039, "global_step": 4566, "epoch": 108} {"train_loss": -4.454518795013428, "global_step": 4567, "epoch": 108} {"train_loss": -4.388523101806641, "global_step": 4568, "epoch": 108} {"train_loss": -4.3751678466796875, "global_step": 4569, "epoch": 108} {"train_loss": -4.3715643882751465, "global_step": 4570, "epoch": 108} {"train_loss": -4.3098344802856445, "global_step": 4571, "epoch": 108} {"train_loss": -4.502477645874023, "global_step": 4572, "epoch": 108} {"train_loss": -4.474735260009766, "global_step": 4573, "epoch": 108} {"train_loss": -4.544312477111816, "global_step": 4574, "epoch": 108} {"train_loss": -4.521444320678711, "global_step": 4575, "epoch": 108} {"train_loss": -4.470395565032959, "global_step": 4576, "epoch": 108} {"train_loss": -4.426546130861555, "global_step": 4577, "epoch": 108, "val_loss": 103791.734375} {"train_loss": -4.401886940002441, "global_step": 4578, "epoch": 109} {"train_loss": -4.616562843322754, "global_step": 4579, "epoch": 109} {"train_loss": -4.619411468505859, "global_step": 4580, "epoch": 109} {"train_loss": -4.487004280090332, "global_step": 4581, "epoch": 109} {"train_loss": -4.4836835861206055, "global_step": 4582, "epoch": 109} {"train_loss": -4.4808502197265625, "global_step": 4583, "epoch": 109} {"train_loss": -4.338011741638184, "global_step": 4584, "epoch": 109} {"train_loss": -4.498042583465576, "global_step": 4585, "epoch": 109} {"train_loss": -4.459506034851074, "global_step": 4586, "epoch": 109} {"train_loss": -4.440935134887695, "global_step": 4587, "epoch": 109} {"train_loss": -4.532373428344727, "global_step": 4588, "epoch": 109} {"train_loss": -4.58963680267334, "global_step": 4589, "epoch": 109} {"train_loss": -4.535727500915527, "global_step": 4590, "epoch": 109} {"train_loss": -4.711556911468506, "global_step": 4591, "epoch": 109} {"train_loss": -4.610438823699951, "global_step": 4592, "epoch": 109} {"train_loss": -4.680500507354736, "global_step": 4593, "epoch": 109} {"train_loss": -4.473696708679199, "global_step": 4594, "epoch": 109} {"train_loss": -4.457426071166992, "global_step": 4595, "epoch": 109} {"train_loss": -4.685664176940918, "global_step": 4596, "epoch": 109} {"train_loss": -4.560576915740967, "global_step": 4597, "epoch": 109} {"train_loss": -4.374001502990723, "global_step": 4598, "epoch": 109} {"train_loss": -4.5179290771484375, "global_step": 4599, "epoch": 109} {"train_loss": -4.470330238342285, "global_step": 4600, "epoch": 109} {"train_loss": -4.393730163574219, "global_step": 4601, "epoch": 109} {"train_loss": -4.385758876800537, "global_step": 4602, "epoch": 109} {"train_loss": -4.506283760070801, "global_step": 4603, "epoch": 109} {"train_loss": -4.503772735595703, "global_step": 4604, "epoch": 109} {"train_loss": -4.258674621582031, "global_step": 4605, "epoch": 109} {"train_loss": -4.2245402336120605, "global_step": 4606, "epoch": 109} {"train_loss": -4.447518348693848, "global_step": 4607, "epoch": 109} {"train_loss": -4.534931659698486, "global_step": 4608, "epoch": 109} {"train_loss": -4.2498626708984375, "global_step": 4609, "epoch": 109} {"train_loss": -4.403576374053955, "global_step": 4610, "epoch": 109} {"train_loss": -4.567366123199463, "global_step": 4611, "epoch": 109} {"train_loss": -4.34407901763916, "global_step": 4612, "epoch": 109} {"train_loss": -4.324268341064453, "global_step": 4613, "epoch": 109} {"train_loss": -4.447892189025879, "global_step": 4614, "epoch": 109} {"train_loss": -4.584607124328613, "global_step": 4615, "epoch": 109} {"train_loss": -4.428878307342529, "global_step": 4616, "epoch": 109} {"train_loss": -4.483462810516357, "global_step": 4617, "epoch": 109} {"train_loss": -4.581960678100586, "global_step": 4618, "epoch": 109} {"train_loss": -4.479893797919864, "global_step": 4619, "epoch": 109, "val_loss": 104512.8046875} {"train_loss": -4.434744834899902, "global_step": 4620, "epoch": 110} {"train_loss": -4.649226188659668, "global_step": 4621, "epoch": 110} {"train_loss": -4.582094669342041, "global_step": 4622, "epoch": 110} {"train_loss": -4.411520004272461, "global_step": 4623, "epoch": 110} {"train_loss": -4.504563331604004, "global_step": 4624, "epoch": 110} {"train_loss": -4.588900566101074, "global_step": 4625, "epoch": 110} {"train_loss": -4.3744683265686035, "global_step": 4626, "epoch": 110} {"train_loss": -4.483710289001465, "global_step": 4627, "epoch": 110} {"train_loss": -4.533089637756348, "global_step": 4628, "epoch": 110} {"train_loss": -4.440849304199219, "global_step": 4629, "epoch": 110} {"train_loss": -4.553511619567871, "global_step": 4630, "epoch": 110} {"train_loss": -4.495108604431152, "global_step": 4631, "epoch": 110} {"train_loss": -4.425658702850342, "global_step": 4632, "epoch": 110} {"train_loss": -4.438436508178711, "global_step": 4633, "epoch": 110} {"train_loss": -4.627490520477295, "global_step": 4634, "epoch": 110} {"train_loss": -4.5003557205200195, "global_step": 4635, "epoch": 110} {"train_loss": -4.472073554992676, "global_step": 4636, "epoch": 110} {"train_loss": -4.538479804992676, "global_step": 4637, "epoch": 110} {"train_loss": -4.401325225830078, "global_step": 4638, "epoch": 110} {"train_loss": -4.454712390899658, "global_step": 4639, "epoch": 110} {"train_loss": -4.473047256469727, "global_step": 4640, "epoch": 110} {"train_loss": -4.625133514404297, "global_step": 4641, "epoch": 110} {"train_loss": -4.560076713562012, "global_step": 4642, "epoch": 110} {"train_loss": -4.4027886390686035, "global_step": 4643, "epoch": 110} {"train_loss": -4.445516586303711, "global_step": 4644, "epoch": 110} {"train_loss": -4.584662914276123, "global_step": 4645, "epoch": 110} {"train_loss": -4.554558753967285, "global_step": 4646, "epoch": 110} {"train_loss": -4.488316535949707, "global_step": 4647, "epoch": 110} {"train_loss": -4.346792221069336, "global_step": 4648, "epoch": 110} {"train_loss": -4.508933067321777, "global_step": 4649, "epoch": 110} {"train_loss": -4.450625419616699, "global_step": 4650, "epoch": 110} {"train_loss": -4.451432228088379, "global_step": 4651, "epoch": 110} {"train_loss": -4.457706451416016, "global_step": 4652, "epoch": 110} {"train_loss": -4.644034385681152, "global_step": 4653, "epoch": 110} {"train_loss": -4.634751319885254, "global_step": 4654, "epoch": 110} {"train_loss": -4.445943832397461, "global_step": 4655, "epoch": 110} {"train_loss": -4.541572570800781, "global_step": 4656, "epoch": 110} {"train_loss": -4.566679000854492, "global_step": 4657, "epoch": 110} {"train_loss": -4.4581193923950195, "global_step": 4658, "epoch": 110} {"train_loss": -4.518910884857178, "global_step": 4659, "epoch": 110} {"train_loss": -4.571118354797363, "global_step": 4660, "epoch": 110} {"train_loss": -4.502876803988502, "global_step": 4661, "epoch": 110, "val_loss": 103387.7109375} {"train_loss": -4.477281093597412, "global_step": 4662, "epoch": 111} {"train_loss": -4.461507320404053, "global_step": 4663, "epoch": 111} {"train_loss": -4.454065799713135, "global_step": 4664, "epoch": 111} {"train_loss": -4.376614093780518, "global_step": 4665, "epoch": 111} {"train_loss": -4.423490524291992, "global_step": 4666, "epoch": 111} {"train_loss": -4.125338554382324, "global_step": 4667, "epoch": 111} {"train_loss": -4.466000556945801, "global_step": 4668, "epoch": 111} {"train_loss": -4.419883728027344, "global_step": 4669, "epoch": 111} {"train_loss": -4.312217712402344, "global_step": 4670, "epoch": 111} {"train_loss": -4.228609085083008, "global_step": 4671, "epoch": 111} {"train_loss": -4.104182243347168, "global_step": 4672, "epoch": 111} {"train_loss": -4.364598274230957, "global_step": 4673, "epoch": 111} {"train_loss": -4.238910675048828, "global_step": 4674, "epoch": 111} {"train_loss": -4.464146614074707, "global_step": 4675, "epoch": 111} {"train_loss": -4.506823539733887, "global_step": 4676, "epoch": 111} {"train_loss": -4.264804363250732, "global_step": 4677, "epoch": 111} {"train_loss": -4.476150035858154, "global_step": 4678, "epoch": 111} {"train_loss": -4.409186363220215, "global_step": 4679, "epoch": 111} {"train_loss": -4.417442798614502, "global_step": 4680, "epoch": 111} {"train_loss": -4.440048694610596, "global_step": 4681, "epoch": 111} {"train_loss": -4.435059547424316, "global_step": 4682, "epoch": 111} {"train_loss": -4.479162693023682, "global_step": 4683, "epoch": 111} {"train_loss": -4.424930572509766, "global_step": 4684, "epoch": 111} {"train_loss": -4.503757476806641, "global_step": 4685, "epoch": 111} {"train_loss": -4.423396587371826, "global_step": 4686, "epoch": 111} {"train_loss": -4.522120952606201, "global_step": 4687, "epoch": 111} {"train_loss": -4.50991153717041, "global_step": 4688, "epoch": 111} {"train_loss": -4.605352401733398, "global_step": 4689, "epoch": 111} {"train_loss": -4.459282875061035, "global_step": 4690, "epoch": 111} {"train_loss": -4.656068801879883, "global_step": 4691, "epoch": 111} {"train_loss": -4.543694496154785, "global_step": 4692, "epoch": 111} {"train_loss": -4.527342796325684, "global_step": 4693, "epoch": 111} {"train_loss": -4.637333869934082, "global_step": 4694, "epoch": 111} {"train_loss": -4.424076080322266, "global_step": 4695, "epoch": 111} {"train_loss": -4.672226905822754, "global_step": 4696, "epoch": 111} {"train_loss": -4.600932598114014, "global_step": 4697, "epoch": 111} {"train_loss": -4.5657477378845215, "global_step": 4698, "epoch": 111} {"train_loss": -4.5859293937683105, "global_step": 4699, "epoch": 111} {"train_loss": -4.519718170166016, "global_step": 4700, "epoch": 111} {"train_loss": -4.4890055656433105, "global_step": 4701, "epoch": 111} {"train_loss": -4.469661712646484, "global_step": 4702, "epoch": 111} {"train_loss": -4.4570437499455045, "global_step": 4703, "epoch": 111, "val_loss": 102687.625} {"train_loss": -4.4837799072265625, "global_step": 4704, "epoch": 112} {"train_loss": -4.54899787902832, "global_step": 4705, "epoch": 112} {"train_loss": -4.642119407653809, "global_step": 4706, "epoch": 112} {"train_loss": -4.5970354080200195, "global_step": 4707, "epoch": 112} {"train_loss": -4.507342338562012, "global_step": 4708, "epoch": 112} {"train_loss": -4.458122253417969, "global_step": 4709, "epoch": 112} {"train_loss": -4.569120407104492, "global_step": 4710, "epoch": 112} {"train_loss": -4.638176918029785, "global_step": 4711, "epoch": 112} {"train_loss": -4.564228057861328, "global_step": 4712, "epoch": 112} {"train_loss": -4.815736770629883, "global_step": 4713, "epoch": 112} {"train_loss": -4.748640060424805, "global_step": 4714, "epoch": 112} {"train_loss": -4.543310165405273, "global_step": 4715, "epoch": 112} {"train_loss": -4.395975112915039, "global_step": 4716, "epoch": 112} {"train_loss": -4.61782169342041, "global_step": 4717, "epoch": 112} {"train_loss": -4.510429382324219, "global_step": 4718, "epoch": 112} {"train_loss": -4.469505310058594, "global_step": 4719, "epoch": 112} {"train_loss": -4.333592414855957, "global_step": 4720, "epoch": 112} {"train_loss": -4.350395202636719, "global_step": 4721, "epoch": 112} {"train_loss": -4.326026916503906, "global_step": 4722, "epoch": 112} {"train_loss": -4.415583610534668, "global_step": 4723, "epoch": 112} {"train_loss": -4.441627502441406, "global_step": 4724, "epoch": 112} {"train_loss": -4.5351457595825195, "global_step": 4725, "epoch": 112} {"train_loss": -4.396813869476318, "global_step": 4726, "epoch": 112} {"train_loss": -4.414612770080566, "global_step": 4727, "epoch": 112} {"train_loss": -4.390761375427246, "global_step": 4728, "epoch": 112} {"train_loss": -4.5780510902404785, "global_step": 4729, "epoch": 112} {"train_loss": -4.444245338439941, "global_step": 4730, "epoch": 112} {"train_loss": -4.436344623565674, "global_step": 4731, "epoch": 112} {"train_loss": -4.603290557861328, "global_step": 4732, "epoch": 112} {"train_loss": -4.352092742919922, "global_step": 4733, "epoch": 112} {"train_loss": -4.459298133850098, "global_step": 4734, "epoch": 112} {"train_loss": -4.529425144195557, "global_step": 4735, "epoch": 112} {"train_loss": -4.221673011779785, "global_step": 4736, "epoch": 112} {"train_loss": -4.428694248199463, "global_step": 4737, "epoch": 112} {"train_loss": -4.480766296386719, "global_step": 4738, "epoch": 112} {"train_loss": -4.332276821136475, "global_step": 4739, "epoch": 112} {"train_loss": -4.544403553009033, "global_step": 4740, "epoch": 112} {"train_loss": -4.155400276184082, "global_step": 4741, "epoch": 112} {"train_loss": -4.453876495361328, "global_step": 4742, "epoch": 112} {"train_loss": -4.446596622467041, "global_step": 4743, "epoch": 112} {"train_loss": -4.329496383666992, "global_step": 4744, "epoch": 112} {"train_loss": -4.479913643428257, "global_step": 4745, "epoch": 112, "val_loss": 106037.6328125} {"train_loss": -4.404749393463135, "global_step": 4746, "epoch": 113} {"train_loss": -4.602212429046631, "global_step": 4747, "epoch": 113} {"train_loss": -4.36332893371582, "global_step": 4748, "epoch": 113} {"train_loss": -4.57003116607666, "global_step": 4749, "epoch": 113} {"train_loss": -4.60549259185791, "global_step": 4750, "epoch": 113} {"train_loss": -4.546406269073486, "global_step": 4751, "epoch": 113} {"train_loss": -4.690834045410156, "global_step": 4752, "epoch": 113} {"train_loss": -4.613687992095947, "global_step": 4753, "epoch": 113} {"train_loss": -4.686313629150391, "global_step": 4754, "epoch": 113} {"train_loss": -4.418638229370117, "global_step": 4755, "epoch": 113} {"train_loss": -4.619512557983398, "global_step": 4756, "epoch": 113} {"train_loss": -4.468648433685303, "global_step": 4757, "epoch": 113} {"train_loss": -4.596313953399658, "global_step": 4758, "epoch": 113} {"train_loss": -4.502863883972168, "global_step": 4759, "epoch": 113} {"train_loss": -4.586961269378662, "global_step": 4760, "epoch": 113} {"train_loss": -4.551314353942871, "global_step": 4761, "epoch": 113} {"train_loss": -4.486947059631348, "global_step": 4762, "epoch": 113} {"train_loss": -4.5378570556640625, "global_step": 4763, "epoch": 113} {"train_loss": -4.621661186218262, "global_step": 4764, "epoch": 113} {"train_loss": -4.689371585845947, "global_step": 4765, "epoch": 113} {"train_loss": -4.69043493270874, "global_step": 4766, "epoch": 113} {"train_loss": -4.49157190322876, "global_step": 4767, "epoch": 113} {"train_loss": -4.541930675506592, "global_step": 4768, "epoch": 113} {"train_loss": -4.652799129486084, "global_step": 4769, "epoch": 113} {"train_loss": -4.462203502655029, "global_step": 4770, "epoch": 113} {"train_loss": -4.612855434417725, "global_step": 4771, "epoch": 113} {"train_loss": -4.643774509429932, "global_step": 4772, "epoch": 113} {"train_loss": -4.499603271484375, "global_step": 4773, "epoch": 113} {"train_loss": -4.566811561584473, "global_step": 4774, "epoch": 113} {"train_loss": -4.649073123931885, "global_step": 4775, "epoch": 113} {"train_loss": -4.686551094055176, "global_step": 4776, "epoch": 113} {"train_loss": -4.501397132873535, "global_step": 4777, "epoch": 113} {"train_loss": -4.639036655426025, "global_step": 4778, "epoch": 113} {"train_loss": -4.576711654663086, "global_step": 4779, "epoch": 113} {"train_loss": -4.589731693267822, "global_step": 4780, "epoch": 113} {"train_loss": -4.61630392074585, "global_step": 4781, "epoch": 113} {"train_loss": -4.6406683921813965, "global_step": 4782, "epoch": 113} {"train_loss": -4.423639297485352, "global_step": 4783, "epoch": 113} {"train_loss": -4.2553606033325195, "global_step": 4784, "epoch": 113} {"train_loss": -4.409299373626709, "global_step": 4785, "epoch": 113} {"train_loss": -4.016453742980957, "global_step": 4786, "epoch": 113} {"train_loss": -4.524145540736971, "global_step": 4787, "epoch": 113, "val_loss": 111285.5078125} {"train_loss": -3.5909385681152344, "global_step": 4788, "epoch": 114} {"train_loss": -3.957845687866211, "global_step": 4789, "epoch": 114} {"train_loss": -3.2917606830596924, "global_step": 4790, "epoch": 114} {"train_loss": -3.4402270317077637, "global_step": 4791, "epoch": 114} {"train_loss": -3.9024786949157715, "global_step": 4792, "epoch": 114} {"train_loss": -3.3404507637023926, "global_step": 4793, "epoch": 114} {"train_loss": -3.931943893432617, "global_step": 4794, "epoch": 114} {"train_loss": -3.7127068042755127, "global_step": 4795, "epoch": 114} {"train_loss": -3.7185447216033936, "global_step": 4796, "epoch": 114} {"train_loss": -3.8694937229156494, "global_step": 4797, "epoch": 114} {"train_loss": -3.7442471981048584, "global_step": 4798, "epoch": 114} {"train_loss": -3.9580698013305664, "global_step": 4799, "epoch": 114} {"train_loss": -3.909432888031006, "global_step": 4800, "epoch": 114} {"train_loss": -4.163989543914795, "global_step": 4801, "epoch": 114} {"train_loss": -4.273208141326904, "global_step": 4802, "epoch": 114} {"train_loss": -4.1058502197265625, "global_step": 4803, "epoch": 114} {"train_loss": -4.042635917663574, "global_step": 4804, "epoch": 114} {"train_loss": -4.173379421234131, "global_step": 4805, "epoch": 114} {"train_loss": -4.301424980163574, "global_step": 4806, "epoch": 114} {"train_loss": -4.191068649291992, "global_step": 4807, "epoch": 114} {"train_loss": -4.164572238922119, "global_step": 4808, "epoch": 114} {"train_loss": -4.249063491821289, "global_step": 4809, "epoch": 114} {"train_loss": -4.232199192047119, "global_step": 4810, "epoch": 114} {"train_loss": -4.298148155212402, "global_step": 4811, "epoch": 114} {"train_loss": -4.3600921630859375, "global_step": 4812, "epoch": 114} {"train_loss": -4.301621913909912, "global_step": 4813, "epoch": 114} {"train_loss": -4.354227542877197, "global_step": 4814, "epoch": 114} {"train_loss": -4.35608434677124, "global_step": 4815, "epoch": 114} {"train_loss": -4.292658805847168, "global_step": 4816, "epoch": 114} {"train_loss": -4.438988208770752, "global_step": 4817, "epoch": 114} {"train_loss": -4.398453235626221, "global_step": 4818, "epoch": 114} {"train_loss": -4.336716651916504, "global_step": 4819, "epoch": 114} {"train_loss": -4.388031482696533, "global_step": 4820, "epoch": 114} {"train_loss": -4.521830081939697, "global_step": 4821, "epoch": 114} {"train_loss": -4.434685707092285, "global_step": 4822, "epoch": 114} {"train_loss": -4.449319839477539, "global_step": 4823, "epoch": 114} {"train_loss": -4.464395999908447, "global_step": 4824, "epoch": 114} {"train_loss": -4.356627464294434, "global_step": 4825, "epoch": 114} {"train_loss": -4.498040199279785, "global_step": 4826, "epoch": 114} {"train_loss": -4.475677013397217, "global_step": 4827, "epoch": 114} {"train_loss": -4.5680694580078125, "global_step": 4828, "epoch": 114} {"train_loss": -4.145389959925697, "global_step": 4829, "epoch": 114, "val_loss": 102255.3984375} {"train_loss": -4.525641441345215, "global_step": 4830, "epoch": 115} {"train_loss": -4.504852294921875, "global_step": 4831, "epoch": 115} {"train_loss": -4.570103168487549, "global_step": 4832, "epoch": 115} {"train_loss": -4.760255813598633, "global_step": 4833, "epoch": 115} {"train_loss": -4.622889041900635, "global_step": 4834, "epoch": 115} {"train_loss": -4.466141223907471, "global_step": 4835, "epoch": 115} {"train_loss": -4.608330726623535, "global_step": 4836, "epoch": 115} {"train_loss": -4.749072074890137, "global_step": 4837, "epoch": 115} {"train_loss": -4.638360977172852, "global_step": 4838, "epoch": 115} {"train_loss": -4.577690124511719, "global_step": 4839, "epoch": 115} {"train_loss": -4.690128326416016, "global_step": 4840, "epoch": 115} {"train_loss": -4.522040367126465, "global_step": 4841, "epoch": 115} {"train_loss": -4.565298557281494, "global_step": 4842, "epoch": 115} {"train_loss": -4.5144548416137695, "global_step": 4843, "epoch": 115} {"train_loss": -4.7185564041137695, "global_step": 4844, "epoch": 115} {"train_loss": -4.5096516609191895, "global_step": 4845, "epoch": 115} {"train_loss": -4.567424297332764, "global_step": 4846, "epoch": 115} {"train_loss": -4.571303367614746, "global_step": 4847, "epoch": 115} {"train_loss": -4.628629207611084, "global_step": 4848, "epoch": 115} {"train_loss": -4.491164207458496, "global_step": 4849, "epoch": 115} {"train_loss": -4.452556610107422, "global_step": 4850, "epoch": 115} {"train_loss": -4.637291431427002, "global_step": 4851, "epoch": 115} {"train_loss": -4.616604328155518, "global_step": 4852, "epoch": 115} {"train_loss": -4.536691188812256, "global_step": 4853, "epoch": 115} {"train_loss": -4.4180827140808105, "global_step": 4854, "epoch": 115} {"train_loss": -4.731682777404785, "global_step": 4855, "epoch": 115} {"train_loss": -4.298221111297607, "global_step": 4856, "epoch": 115} {"train_loss": -4.375156879425049, "global_step": 4857, "epoch": 115} {"train_loss": -4.601980209350586, "global_step": 4858, "epoch": 115} {"train_loss": -4.51115608215332, "global_step": 4859, "epoch": 115} {"train_loss": -4.357491493225098, "global_step": 4860, "epoch": 115} {"train_loss": -4.60883092880249, "global_step": 4861, "epoch": 115} {"train_loss": -4.612610816955566, "global_step": 4862, "epoch": 115} {"train_loss": -4.491337776184082, "global_step": 4863, "epoch": 115} {"train_loss": -4.404892921447754, "global_step": 4864, "epoch": 115} {"train_loss": -4.644844055175781, "global_step": 4865, "epoch": 115} {"train_loss": -4.48671293258667, "global_step": 4866, "epoch": 115} {"train_loss": -4.53436803817749, "global_step": 4867, "epoch": 115} {"train_loss": -4.502817153930664, "global_step": 4868, "epoch": 115} {"train_loss": -4.529345512390137, "global_step": 4869, "epoch": 115} {"train_loss": -4.552469253540039, "global_step": 4870, "epoch": 115} {"train_loss": -4.548939193998065, "global_step": 4871, "epoch": 115, "val_loss": 100536.4921875} {"train_loss": -4.562884330749512, "global_step": 4872, "epoch": 116} {"train_loss": -4.569371223449707, "global_step": 4873, "epoch": 116} {"train_loss": -4.605555534362793, "global_step": 4874, "epoch": 116} {"train_loss": -4.5831217765808105, "global_step": 4875, "epoch": 116} {"train_loss": -4.632192611694336, "global_step": 4876, "epoch": 116} {"train_loss": -4.518213748931885, "global_step": 4877, "epoch": 116} {"train_loss": -4.665231704711914, "global_step": 4878, "epoch": 116} {"train_loss": -4.423579216003418, "global_step": 4879, "epoch": 116} {"train_loss": -4.637939453125, "global_step": 4880, "epoch": 116} {"train_loss": -4.7565789222717285, "global_step": 4881, "epoch": 116} {"train_loss": -4.559469223022461, "global_step": 4882, "epoch": 116} {"train_loss": -4.649657249450684, "global_step": 4883, "epoch": 116} {"train_loss": -4.5665740966796875, "global_step": 4884, "epoch": 116} {"train_loss": -4.574008941650391, "global_step": 4885, "epoch": 116} {"train_loss": -4.560958385467529, "global_step": 4886, "epoch": 116} {"train_loss": -4.540275573730469, "global_step": 4887, "epoch": 116} {"train_loss": -4.505642890930176, "global_step": 4888, "epoch": 116} {"train_loss": -4.715723037719727, "global_step": 4889, "epoch": 116} {"train_loss": -4.5107741355896, "global_step": 4890, "epoch": 116} {"train_loss": -4.530681610107422, "global_step": 4891, "epoch": 116} {"train_loss": -4.757884979248047, "global_step": 4892, "epoch": 116} {"train_loss": -4.4909257888793945, "global_step": 4893, "epoch": 116} {"train_loss": -4.619739532470703, "global_step": 4894, "epoch": 116} {"train_loss": -4.500636100769043, "global_step": 4895, "epoch": 116} {"train_loss": -4.512801170349121, "global_step": 4896, "epoch": 116} {"train_loss": -4.728171348571777, "global_step": 4897, "epoch": 116} {"train_loss": -4.443100929260254, "global_step": 4898, "epoch": 116} {"train_loss": -4.352450370788574, "global_step": 4899, "epoch": 116} {"train_loss": -4.3015313148498535, "global_step": 4900, "epoch": 116} {"train_loss": -4.319426536560059, "global_step": 4901, "epoch": 116} {"train_loss": -4.208493232727051, "global_step": 4902, "epoch": 116} {"train_loss": -4.168457508087158, "global_step": 4903, "epoch": 116} {"train_loss": -4.4001617431640625, "global_step": 4904, "epoch": 116} {"train_loss": -4.34268856048584, "global_step": 4905, "epoch": 116} {"train_loss": -4.334968566894531, "global_step": 4906, "epoch": 116} {"train_loss": -4.438802719116211, "global_step": 4907, "epoch": 116} {"train_loss": -4.31062126159668, "global_step": 4908, "epoch": 116} {"train_loss": -4.346366882324219, "global_step": 4909, "epoch": 116} {"train_loss": -4.5448503494262695, "global_step": 4910, "epoch": 116} {"train_loss": -4.398222923278809, "global_step": 4911, "epoch": 116} {"train_loss": -4.551560878753662, "global_step": 4912, "epoch": 116} {"train_loss": -4.505955843698411, "global_step": 4913, "epoch": 116, "val_loss": 103439.7890625} {"train_loss": -4.701957702636719, "global_step": 4914, "epoch": 117} {"train_loss": -4.510071754455566, "global_step": 4915, "epoch": 117} {"train_loss": -4.446100234985352, "global_step": 4916, "epoch": 117} {"train_loss": -4.536831855773926, "global_step": 4917, "epoch": 117} {"train_loss": -4.592344760894775, "global_step": 4918, "epoch": 117} {"train_loss": -4.404838562011719, "global_step": 4919, "epoch": 117} {"train_loss": -4.622779846191406, "global_step": 4920, "epoch": 117} {"train_loss": -4.562193870544434, "global_step": 4921, "epoch": 117} {"train_loss": -4.437646389007568, "global_step": 4922, "epoch": 117} {"train_loss": -4.584988594055176, "global_step": 4923, "epoch": 117} {"train_loss": -4.597476959228516, "global_step": 4924, "epoch": 117} {"train_loss": -4.493481636047363, "global_step": 4925, "epoch": 117} {"train_loss": -4.645223617553711, "global_step": 4926, "epoch": 117} {"train_loss": -4.658511161804199, "global_step": 4927, "epoch": 117} {"train_loss": -4.3955979347229, "global_step": 4928, "epoch": 117} {"train_loss": -4.690201759338379, "global_step": 4929, "epoch": 117} {"train_loss": -4.732704162597656, "global_step": 4930, "epoch": 117} {"train_loss": -4.5812153816223145, "global_step": 4931, "epoch": 117} {"train_loss": -4.555374622344971, "global_step": 4932, "epoch": 117} {"train_loss": -4.642834663391113, "global_step": 4933, "epoch": 117} {"train_loss": -4.643794536590576, "global_step": 4934, "epoch": 117} {"train_loss": -4.572837829589844, "global_step": 4935, "epoch": 117} {"train_loss": -4.579107761383057, "global_step": 4936, "epoch": 117} {"train_loss": -4.821195125579834, "global_step": 4937, "epoch": 117} {"train_loss": -4.690598964691162, "global_step": 4938, "epoch": 117} {"train_loss": -4.539951801300049, "global_step": 4939, "epoch": 117} {"train_loss": -4.466719627380371, "global_step": 4940, "epoch": 117} {"train_loss": -4.691211700439453, "global_step": 4941, "epoch": 117} {"train_loss": -4.557164192199707, "global_step": 4942, "epoch": 117} {"train_loss": -4.505372047424316, "global_step": 4943, "epoch": 117} {"train_loss": -4.340453147888184, "global_step": 4944, "epoch": 117} {"train_loss": -4.662885665893555, "global_step": 4945, "epoch": 117} {"train_loss": -4.356005668640137, "global_step": 4946, "epoch": 117} {"train_loss": -4.447060585021973, "global_step": 4947, "epoch": 117} {"train_loss": -4.650781631469727, "global_step": 4948, "epoch": 117} {"train_loss": -4.498653411865234, "global_step": 4949, "epoch": 117} {"train_loss": -4.193794250488281, "global_step": 4950, "epoch": 117} {"train_loss": -4.758790016174316, "global_step": 4951, "epoch": 117} {"train_loss": -4.576057434082031, "global_step": 4952, "epoch": 117} {"train_loss": -4.400424003601074, "global_step": 4953, "epoch": 117} {"train_loss": -4.473618984222412, "global_step": 4954, "epoch": 117} {"train_loss": -4.555842479070027, "global_step": 4955, "epoch": 117, "val_loss": 99916.2890625} {"train_loss": -4.329474449157715, "global_step": 4956, "epoch": 118} {"train_loss": -4.648042678833008, "global_step": 4957, "epoch": 118} {"train_loss": -4.540897369384766, "global_step": 4958, "epoch": 118} {"train_loss": -4.6073317527771, "global_step": 4959, "epoch": 118} {"train_loss": -4.612828731536865, "global_step": 4960, "epoch": 118} {"train_loss": -4.535285949707031, "global_step": 4961, "epoch": 118} {"train_loss": -4.717146396636963, "global_step": 4962, "epoch": 118} {"train_loss": -4.515387058258057, "global_step": 4963, "epoch": 118} {"train_loss": -4.735965251922607, "global_step": 4964, "epoch": 118} {"train_loss": -4.663012981414795, "global_step": 4965, "epoch": 118} {"train_loss": -4.716436386108398, "global_step": 4966, "epoch": 118} {"train_loss": -4.634130477905273, "global_step": 4967, "epoch": 118} {"train_loss": -4.521854877471924, "global_step": 4968, "epoch": 118} {"train_loss": -4.430962562561035, "global_step": 4969, "epoch": 118} {"train_loss": -4.642208099365234, "global_step": 4970, "epoch": 118} {"train_loss": -4.558955669403076, "global_step": 4971, "epoch": 118} {"train_loss": -4.412807464599609, "global_step": 4972, "epoch": 118} {"train_loss": -4.59575891494751, "global_step": 4973, "epoch": 118} {"train_loss": -4.700268745422363, "global_step": 4974, "epoch": 118} {"train_loss": -4.413754940032959, "global_step": 4975, "epoch": 118} {"train_loss": -4.7107343673706055, "global_step": 4976, "epoch": 118} {"train_loss": -4.845865249633789, "global_step": 4977, "epoch": 118} {"train_loss": -4.655360698699951, "global_step": 4978, "epoch": 118} {"train_loss": -4.524357318878174, "global_step": 4979, "epoch": 118} {"train_loss": -4.527876853942871, "global_step": 4980, "epoch": 118} {"train_loss": -4.680450439453125, "global_step": 4981, "epoch": 118} {"train_loss": -4.61517858505249, "global_step": 4982, "epoch": 118} {"train_loss": -4.55435848236084, "global_step": 4983, "epoch": 118} {"train_loss": -4.466305255889893, "global_step": 4984, "epoch": 118} {"train_loss": -4.651463508605957, "global_step": 4985, "epoch": 118} {"train_loss": -4.621203422546387, "global_step": 4986, "epoch": 118} {"train_loss": -4.578168869018555, "global_step": 4987, "epoch": 118} {"train_loss": -4.581940650939941, "global_step": 4988, "epoch": 118} {"train_loss": -4.710443496704102, "global_step": 4989, "epoch": 118} {"train_loss": -4.599817276000977, "global_step": 4990, "epoch": 118} {"train_loss": -4.69316291809082, "global_step": 4991, "epoch": 118} {"train_loss": -4.710984230041504, "global_step": 4992, "epoch": 118} {"train_loss": -4.543670654296875, "global_step": 4993, "epoch": 118} {"train_loss": -4.518714904785156, "global_step": 4994, "epoch": 118} {"train_loss": -4.634513854980469, "global_step": 4995, "epoch": 118} {"train_loss": -4.793933868408203, "global_step": 4996, "epoch": 118} {"train_loss": -4.606060436793736, "global_step": 4997, "epoch": 118, "val_loss": 101324.5} {"train_loss": -4.420523643493652, "global_step": 4998, "epoch": 119} {"train_loss": -4.705470085144043, "global_step": 4999, "epoch": 119} {"train_loss": -4.696931838989258, "global_step": 5000, "epoch": 119} {"train_loss": -4.640840530395508, "global_step": 5001, "epoch": 119} {"train_loss": -4.647007942199707, "global_step": 5002, "epoch": 119} {"train_loss": -4.711193084716797, "global_step": 5003, "epoch": 119} {"train_loss": -4.671894073486328, "global_step": 5004, "epoch": 119} {"train_loss": -4.592288970947266, "global_step": 5005, "epoch": 119} {"train_loss": -4.720776081085205, "global_step": 5006, "epoch": 119} {"train_loss": -4.789884567260742, "global_step": 5007, "epoch": 119} {"train_loss": -4.844509601593018, "global_step": 5008, "epoch": 119} {"train_loss": -4.625699996948242, "global_step": 5009, "epoch": 119} {"train_loss": -4.695733070373535, "global_step": 5010, "epoch": 119} {"train_loss": -4.330479621887207, "global_step": 5011, "epoch": 119} {"train_loss": -4.49545431137085, "global_step": 5012, "epoch": 119} {"train_loss": -4.5217695236206055, "global_step": 5013, "epoch": 119} {"train_loss": -4.58108377456665, "global_step": 5014, "epoch": 119} {"train_loss": -4.310094356536865, "global_step": 5015, "epoch": 119} {"train_loss": -4.411613464355469, "global_step": 5016, "epoch": 119} {"train_loss": -4.565890312194824, "global_step": 5017, "epoch": 119} {"train_loss": -4.394565582275391, "global_step": 5018, "epoch": 119} {"train_loss": -4.637381076812744, "global_step": 5019, "epoch": 119} {"train_loss": -4.564714431762695, "global_step": 5020, "epoch": 119} {"train_loss": -4.507811546325684, "global_step": 5021, "epoch": 119} {"train_loss": -4.47113037109375, "global_step": 5022, "epoch": 119} {"train_loss": -4.507713317871094, "global_step": 5023, "epoch": 119} {"train_loss": -4.52952241897583, "global_step": 5024, "epoch": 119} {"train_loss": -4.489667892456055, "global_step": 5025, "epoch": 119} {"train_loss": -4.619427680969238, "global_step": 5026, "epoch": 119} {"train_loss": -4.582901954650879, "global_step": 5027, "epoch": 119} {"train_loss": -4.763664245605469, "global_step": 5028, "epoch": 119} {"train_loss": -4.693482398986816, "global_step": 5029, "epoch": 119} {"train_loss": -4.676383972167969, "global_step": 5030, "epoch": 119} {"train_loss": -4.517733573913574, "global_step": 5031, "epoch": 119} {"train_loss": -4.511129379272461, "global_step": 5032, "epoch": 119} {"train_loss": -4.628909111022949, "global_step": 5033, "epoch": 119} {"train_loss": -4.544643402099609, "global_step": 5034, "epoch": 119} {"train_loss": -4.499691009521484, "global_step": 5035, "epoch": 119} {"train_loss": -4.542511463165283, "global_step": 5036, "epoch": 119} {"train_loss": -4.498543739318848, "global_step": 5037, "epoch": 119} {"train_loss": -4.575687408447266, "global_step": 5038, "epoch": 119} {"train_loss": -4.581991513570149, "global_step": 5039, "epoch": 119, "val_loss": 99820.40625} {"train_loss": -4.564613342285156, "global_step": 5040, "epoch": 120} {"train_loss": -4.467923164367676, "global_step": 5041, "epoch": 120} {"train_loss": -4.582453727722168, "global_step": 5042, "epoch": 120} {"train_loss": -4.580938339233398, "global_step": 5043, "epoch": 120} {"train_loss": -4.702687740325928, "global_step": 5044, "epoch": 120} {"train_loss": -4.576208591461182, "global_step": 5045, "epoch": 120} {"train_loss": -4.478570938110352, "global_step": 5046, "epoch": 120} {"train_loss": -4.420289039611816, "global_step": 5047, "epoch": 120} {"train_loss": -4.591043472290039, "global_step": 5048, "epoch": 120} {"train_loss": -4.613728046417236, "global_step": 5049, "epoch": 120} {"train_loss": -4.484312534332275, "global_step": 5050, "epoch": 120} {"train_loss": -4.590848922729492, "global_step": 5051, "epoch": 120} {"train_loss": -4.692500114440918, "global_step": 5052, "epoch": 120} {"train_loss": -4.603288650512695, "global_step": 5053, "epoch": 120} {"train_loss": -4.4321513175964355, "global_step": 5054, "epoch": 120} {"train_loss": -4.68409538269043, "global_step": 5055, "epoch": 120} {"train_loss": -4.389771461486816, "global_step": 5056, "epoch": 120} {"train_loss": -4.515883445739746, "global_step": 5057, "epoch": 120} {"train_loss": -4.582078456878662, "global_step": 5058, "epoch": 120} {"train_loss": -4.611172676086426, "global_step": 5059, "epoch": 120} {"train_loss": -4.6272077560424805, "global_step": 5060, "epoch": 120} {"train_loss": -4.6168951988220215, "global_step": 5061, "epoch": 120} {"train_loss": -4.563102722167969, "global_step": 5062, "epoch": 120} {"train_loss": -4.661512851715088, "global_step": 5063, "epoch": 120} {"train_loss": -4.751157760620117, "global_step": 5064, "epoch": 120} {"train_loss": -4.628154277801514, "global_step": 5065, "epoch": 120} {"train_loss": -4.60939884185791, "global_step": 5066, "epoch": 120} {"train_loss": -4.626922130584717, "global_step": 5067, "epoch": 120} {"train_loss": -4.665759086608887, "global_step": 5068, "epoch": 120} {"train_loss": -4.59751033782959, "global_step": 5069, "epoch": 120} {"train_loss": -4.594597339630127, "global_step": 5070, "epoch": 120} {"train_loss": -4.775641441345215, "global_step": 5071, "epoch": 120} {"train_loss": -4.576518535614014, "global_step": 5072, "epoch": 120} {"train_loss": -4.6618332862854, "global_step": 5073, "epoch": 120} {"train_loss": -4.665322303771973, "global_step": 5074, "epoch": 120} {"train_loss": -4.551339626312256, "global_step": 5075, "epoch": 120} {"train_loss": -4.642180919647217, "global_step": 5076, "epoch": 120} {"train_loss": -4.512801170349121, "global_step": 5077, "epoch": 120} {"train_loss": -4.766242980957031, "global_step": 5078, "epoch": 120} {"train_loss": -4.552435874938965, "global_step": 5079, "epoch": 120} {"train_loss": -4.707137107849121, "global_step": 5080, "epoch": 120} {"train_loss": -4.603982959474836, "global_step": 5081, "epoch": 120, "val_loss": 98994.1484375} {"train_loss": -4.574916839599609, "global_step": 5082, "epoch": 121} {"train_loss": -4.612074375152588, "global_step": 5083, "epoch": 121} {"train_loss": -4.583658218383789, "global_step": 5084, "epoch": 121} {"train_loss": -4.7125563621521, "global_step": 5085, "epoch": 121} {"train_loss": -4.647176742553711, "global_step": 5086, "epoch": 121} {"train_loss": -4.716643810272217, "global_step": 5087, "epoch": 121} {"train_loss": -4.617547035217285, "global_step": 5088, "epoch": 121} {"train_loss": -4.648085117340088, "global_step": 5089, "epoch": 121} {"train_loss": -4.538764476776123, "global_step": 5090, "epoch": 121} {"train_loss": -4.631103515625, "global_step": 5091, "epoch": 121} {"train_loss": -4.655994892120361, "global_step": 5092, "epoch": 121} {"train_loss": -4.660161018371582, "global_step": 5093, "epoch": 121} {"train_loss": -4.831986427307129, "global_step": 5094, "epoch": 121} {"train_loss": -4.6963090896606445, "global_step": 5095, "epoch": 121} {"train_loss": -4.553089141845703, "global_step": 5096, "epoch": 121} {"train_loss": -4.708889961242676, "global_step": 5097, "epoch": 121} {"train_loss": -4.567720413208008, "global_step": 5098, "epoch": 121} {"train_loss": -4.812121868133545, "global_step": 5099, "epoch": 121} {"train_loss": -4.565132141113281, "global_step": 5100, "epoch": 121} {"train_loss": -4.460905075073242, "global_step": 5101, "epoch": 121} {"train_loss": -4.658652305603027, "global_step": 5102, "epoch": 121} {"train_loss": -4.346654891967773, "global_step": 5103, "epoch": 121} {"train_loss": -4.537003517150879, "global_step": 5104, "epoch": 121} {"train_loss": -4.442919731140137, "global_step": 5105, "epoch": 121} {"train_loss": -4.174818515777588, "global_step": 5106, "epoch": 121} {"train_loss": -4.515779972076416, "global_step": 5107, "epoch": 121} {"train_loss": -4.020856857299805, "global_step": 5108, "epoch": 121} {"train_loss": -4.4435319900512695, "global_step": 5109, "epoch": 121} {"train_loss": -4.6458740234375, "global_step": 5110, "epoch": 121} {"train_loss": -4.401156902313232, "global_step": 5111, "epoch": 121} {"train_loss": -4.563998699188232, "global_step": 5112, "epoch": 121} {"train_loss": -4.574272155761719, "global_step": 5113, "epoch": 121} {"train_loss": -4.107512474060059, "global_step": 5114, "epoch": 121} {"train_loss": -4.547176361083984, "global_step": 5115, "epoch": 121} {"train_loss": -4.232582092285156, "global_step": 5116, "epoch": 121} {"train_loss": -4.706750869750977, "global_step": 5117, "epoch": 121} {"train_loss": -4.50873327255249, "global_step": 5118, "epoch": 121} {"train_loss": -4.570931911468506, "global_step": 5119, "epoch": 121} {"train_loss": -4.577768325805664, "global_step": 5120, "epoch": 121} {"train_loss": -4.438576698303223, "global_step": 5121, "epoch": 121} {"train_loss": -4.669430732727051, "global_step": 5122, "epoch": 121} {"train_loss": -4.547444672811599, "global_step": 5123, "epoch": 121, "val_loss": 97768.6640625} {"train_loss": -4.644262790679932, "global_step": 5124, "epoch": 122} {"train_loss": -4.562188148498535, "global_step": 5125, "epoch": 122} {"train_loss": -4.679294586181641, "global_step": 5126, "epoch": 122} {"train_loss": -4.589405536651611, "global_step": 5127, "epoch": 122} {"train_loss": -4.642647743225098, "global_step": 5128, "epoch": 122} {"train_loss": -4.737656593322754, "global_step": 5129, "epoch": 122} {"train_loss": -4.511820316314697, "global_step": 5130, "epoch": 122} {"train_loss": -4.74134635925293, "global_step": 5131, "epoch": 122} {"train_loss": -4.779264450073242, "global_step": 5132, "epoch": 122} {"train_loss": -4.716491222381592, "global_step": 5133, "epoch": 122} {"train_loss": -4.723992347717285, "global_step": 5134, "epoch": 122} {"train_loss": -4.714468002319336, "global_step": 5135, "epoch": 122} {"train_loss": -4.6982502937316895, "global_step": 5136, "epoch": 122} {"train_loss": -4.666754722595215, "global_step": 5137, "epoch": 122} {"train_loss": -4.671177864074707, "global_step": 5138, "epoch": 122} {"train_loss": -4.580541610717773, "global_step": 5139, "epoch": 122} {"train_loss": -4.690854072570801, "global_step": 5140, "epoch": 122} {"train_loss": -4.766751289367676, "global_step": 5141, "epoch": 122} {"train_loss": -4.719444274902344, "global_step": 5142, "epoch": 122} {"train_loss": -4.606632709503174, "global_step": 5143, "epoch": 122} {"train_loss": -4.597851276397705, "global_step": 5144, "epoch": 122} {"train_loss": -4.714594841003418, "global_step": 5145, "epoch": 122} {"train_loss": -4.592560291290283, "global_step": 5146, "epoch": 122} {"train_loss": -4.482351303100586, "global_step": 5147, "epoch": 122} {"train_loss": -4.723857879638672, "global_step": 5148, "epoch": 122} {"train_loss": -4.695928573608398, "global_step": 5149, "epoch": 122} {"train_loss": -4.557592391967773, "global_step": 5150, "epoch": 122} {"train_loss": -4.672085285186768, "global_step": 5151, "epoch": 122} {"train_loss": -4.604701042175293, "global_step": 5152, "epoch": 122} {"train_loss": -4.767025470733643, "global_step": 5153, "epoch": 122} {"train_loss": -4.5984673500061035, "global_step": 5154, "epoch": 122} {"train_loss": -4.560390472412109, "global_step": 5155, "epoch": 122} {"train_loss": -4.7028350830078125, "global_step": 5156, "epoch": 122} {"train_loss": -4.681645393371582, "global_step": 5157, "epoch": 122} {"train_loss": -4.590907573699951, "global_step": 5158, "epoch": 122} {"train_loss": -4.633711338043213, "global_step": 5159, "epoch": 122} {"train_loss": -4.671482563018799, "global_step": 5160, "epoch": 122} {"train_loss": -4.666220664978027, "global_step": 5161, "epoch": 122} {"train_loss": -4.41915225982666, "global_step": 5162, "epoch": 122} {"train_loss": -4.649517059326172, "global_step": 5163, "epoch": 122} {"train_loss": -4.705074787139893, "global_step": 5164, "epoch": 122} {"train_loss": -4.6505346184685115, "global_step": 5165, "epoch": 122, "val_loss": 101887.2109375} {"train_loss": -4.418684959411621, "global_step": 5166, "epoch": 123} {"train_loss": -4.487078666687012, "global_step": 5167, "epoch": 123} {"train_loss": -4.516132354736328, "global_step": 5168, "epoch": 123} {"train_loss": -4.629632949829102, "global_step": 5169, "epoch": 123} {"train_loss": -4.694236755371094, "global_step": 5170, "epoch": 123} {"train_loss": -4.762331962585449, "global_step": 5171, "epoch": 123} {"train_loss": -4.546261787414551, "global_step": 5172, "epoch": 123} {"train_loss": -4.686722755432129, "global_step": 5173, "epoch": 123} {"train_loss": -4.260363578796387, "global_step": 5174, "epoch": 123} {"train_loss": -4.597137928009033, "global_step": 5175, "epoch": 123} {"train_loss": -4.586916446685791, "global_step": 5176, "epoch": 123} {"train_loss": -4.371999740600586, "global_step": 5177, "epoch": 123} {"train_loss": -4.402008056640625, "global_step": 5178, "epoch": 123} {"train_loss": -4.603275775909424, "global_step": 5179, "epoch": 123} {"train_loss": -4.7479400634765625, "global_step": 5180, "epoch": 123} {"train_loss": -4.451725959777832, "global_step": 5181, "epoch": 123} {"train_loss": -4.697922706604004, "global_step": 5182, "epoch": 123} {"train_loss": -4.674373626708984, "global_step": 5183, "epoch": 123} {"train_loss": -4.6489667892456055, "global_step": 5184, "epoch": 123} {"train_loss": -4.532253742218018, "global_step": 5185, "epoch": 123} {"train_loss": -4.632134437561035, "global_step": 5186, "epoch": 123} {"train_loss": -4.598170280456543, "global_step": 5187, "epoch": 123} {"train_loss": -4.623128890991211, "global_step": 5188, "epoch": 123} {"train_loss": -4.677837371826172, "global_step": 5189, "epoch": 123} {"train_loss": -4.6462178230285645, "global_step": 5190, "epoch": 123} {"train_loss": -4.632503032684326, "global_step": 5191, "epoch": 123} {"train_loss": -4.477870941162109, "global_step": 5192, "epoch": 123} {"train_loss": -4.624324321746826, "global_step": 5193, "epoch": 123} {"train_loss": -4.652261734008789, "global_step": 5194, "epoch": 123} {"train_loss": -4.758078575134277, "global_step": 5195, "epoch": 123} {"train_loss": -4.744284629821777, "global_step": 5196, "epoch": 123} {"train_loss": -4.623141765594482, "global_step": 5197, "epoch": 123} {"train_loss": -4.814694404602051, "global_step": 5198, "epoch": 123} {"train_loss": -4.828359603881836, "global_step": 5199, "epoch": 123} {"train_loss": -4.803993225097656, "global_step": 5200, "epoch": 123} {"train_loss": -4.80114221572876, "global_step": 5201, "epoch": 123} {"train_loss": -4.722797870635986, "global_step": 5202, "epoch": 123} {"train_loss": -4.75496244430542, "global_step": 5203, "epoch": 123} {"train_loss": -4.658444404602051, "global_step": 5204, "epoch": 123} {"train_loss": -4.746239185333252, "global_step": 5205, "epoch": 123} {"train_loss": -4.591006278991699, "global_step": 5206, "epoch": 123} {"train_loss": -4.6295412835620695, "global_step": 5207, "epoch": 123, "val_loss": 97928.046875} {"train_loss": -4.706547737121582, "global_step": 5208, "epoch": 124} {"train_loss": -4.708901882171631, "global_step": 5209, "epoch": 124} {"train_loss": -4.602521896362305, "global_step": 5210, "epoch": 124} {"train_loss": -4.524481773376465, "global_step": 5211, "epoch": 124} {"train_loss": -4.719897270202637, "global_step": 5212, "epoch": 124} {"train_loss": -4.471410274505615, "global_step": 5213, "epoch": 124} {"train_loss": -4.507017612457275, "global_step": 5214, "epoch": 124} {"train_loss": -4.770570278167725, "global_step": 5215, "epoch": 124} {"train_loss": -4.888817310333252, "global_step": 5216, "epoch": 124} {"train_loss": -4.599486351013184, "global_step": 5217, "epoch": 124} {"train_loss": -4.59861946105957, "global_step": 5218, "epoch": 124} {"train_loss": -4.685945510864258, "global_step": 5219, "epoch": 124} {"train_loss": -4.498552322387695, "global_step": 5220, "epoch": 124} {"train_loss": -4.643272399902344, "global_step": 5221, "epoch": 124} {"train_loss": -4.442059516906738, "global_step": 5222, "epoch": 124} {"train_loss": -4.392793655395508, "global_step": 5223, "epoch": 124} {"train_loss": -4.621733665466309, "global_step": 5224, "epoch": 124} {"train_loss": -4.719684600830078, "global_step": 5225, "epoch": 124} {"train_loss": -4.454847812652588, "global_step": 5226, "epoch": 124} {"train_loss": -4.582788944244385, "global_step": 5227, "epoch": 124} {"train_loss": -4.696304798126221, "global_step": 5228, "epoch": 124} {"train_loss": -4.378199577331543, "global_step": 5229, "epoch": 124} {"train_loss": -4.7501912117004395, "global_step": 5230, "epoch": 124} {"train_loss": -4.775121688842773, "global_step": 5231, "epoch": 124} {"train_loss": -4.563551902770996, "global_step": 5232, "epoch": 124} {"train_loss": -4.687809944152832, "global_step": 5233, "epoch": 124} {"train_loss": -4.78704833984375, "global_step": 5234, "epoch": 124} {"train_loss": -4.649435043334961, "global_step": 5235, "epoch": 124} {"train_loss": -4.675922870635986, "global_step": 5236, "epoch": 124} {"train_loss": -4.622791290283203, "global_step": 5237, "epoch": 124} {"train_loss": -4.6505913734436035, "global_step": 5238, "epoch": 124} {"train_loss": -4.844616889953613, "global_step": 5239, "epoch": 124} {"train_loss": -4.607116222381592, "global_step": 5240, "epoch": 124} {"train_loss": -4.57704496383667, "global_step": 5241, "epoch": 124} {"train_loss": -4.658524513244629, "global_step": 5242, "epoch": 124} {"train_loss": -4.762681007385254, "global_step": 5243, "epoch": 124} {"train_loss": -4.760217189788818, "global_step": 5244, "epoch": 124} {"train_loss": -4.720488548278809, "global_step": 5245, "epoch": 124} {"train_loss": -4.629363059997559, "global_step": 5246, "epoch": 124} {"train_loss": -4.751415252685547, "global_step": 5247, "epoch": 124} {"train_loss": -4.711831569671631, "global_step": 5248, "epoch": 124} {"train_loss": -4.644415492103214, "global_step": 5249, "epoch": 124, "val_loss": 96679.0390625} {"train_loss": -4.789083957672119, "global_step": 5250, "epoch": 125} {"train_loss": -4.4726409912109375, "global_step": 5251, "epoch": 125} {"train_loss": -4.534791946411133, "global_step": 5252, "epoch": 125} {"train_loss": -4.652350425720215, "global_step": 5253, "epoch": 125} {"train_loss": -4.834290504455566, "global_step": 5254, "epoch": 125} {"train_loss": -4.598566055297852, "global_step": 5255, "epoch": 125} {"train_loss": -4.640425682067871, "global_step": 5256, "epoch": 125} {"train_loss": -4.455264091491699, "global_step": 5257, "epoch": 125} {"train_loss": -4.687000751495361, "global_step": 5258, "epoch": 125} {"train_loss": -4.790328025817871, "global_step": 5259, "epoch": 125} {"train_loss": -4.577048301696777, "global_step": 5260, "epoch": 125} {"train_loss": -4.650425910949707, "global_step": 5261, "epoch": 125} {"train_loss": -4.7557291984558105, "global_step": 5262, "epoch": 125} {"train_loss": -4.669619560241699, "global_step": 5263, "epoch": 125} {"train_loss": -4.572544574737549, "global_step": 5264, "epoch": 125} {"train_loss": -4.812082767486572, "global_step": 5265, "epoch": 125} {"train_loss": -4.7080464363098145, "global_step": 5266, "epoch": 125} {"train_loss": -4.729098320007324, "global_step": 5267, "epoch": 125} {"train_loss": -4.698907375335693, "global_step": 5268, "epoch": 125} {"train_loss": -4.428404331207275, "global_step": 5269, "epoch": 125} {"train_loss": -4.580442428588867, "global_step": 5270, "epoch": 125} {"train_loss": -4.742454528808594, "global_step": 5271, "epoch": 125} {"train_loss": -4.762821674346924, "global_step": 5272, "epoch": 125} {"train_loss": -4.686684608459473, "global_step": 5273, "epoch": 125} {"train_loss": -4.537332534790039, "global_step": 5274, "epoch": 125} {"train_loss": -4.5843610763549805, "global_step": 5275, "epoch": 125} {"train_loss": -4.614972114562988, "global_step": 5276, "epoch": 125} {"train_loss": -4.576927185058594, "global_step": 5277, "epoch": 125} {"train_loss": -4.749260425567627, "global_step": 5278, "epoch": 125} {"train_loss": -4.665582656860352, "global_step": 5279, "epoch": 125} {"train_loss": -4.7220001220703125, "global_step": 5280, "epoch": 125} {"train_loss": -4.69914436340332, "global_step": 5281, "epoch": 125} {"train_loss": -4.658581733703613, "global_step": 5282, "epoch": 125} {"train_loss": -4.83243465423584, "global_step": 5283, "epoch": 125} {"train_loss": -4.762059211730957, "global_step": 5284, "epoch": 125} {"train_loss": -4.643704414367676, "global_step": 5285, "epoch": 125} {"train_loss": -4.742506980895996, "global_step": 5286, "epoch": 125} {"train_loss": -4.683598518371582, "global_step": 5287, "epoch": 125} {"train_loss": -4.501254558563232, "global_step": 5288, "epoch": 125} {"train_loss": -4.7351250648498535, "global_step": 5289, "epoch": 125} {"train_loss": -4.6672587394714355, "global_step": 5290, "epoch": 125} {"train_loss": -4.663477977116902, "global_step": 5291, "epoch": 125, "val_loss": 97532.640625} {"train_loss": -4.738579273223877, "global_step": 5292, "epoch": 126} {"train_loss": -4.72467041015625, "global_step": 5293, "epoch": 126} {"train_loss": -4.639073371887207, "global_step": 5294, "epoch": 126} {"train_loss": -4.772079944610596, "global_step": 5295, "epoch": 126} {"train_loss": -4.837474822998047, "global_step": 5296, "epoch": 126} {"train_loss": -4.567466735839844, "global_step": 5297, "epoch": 126} {"train_loss": -4.7762770652771, "global_step": 5298, "epoch": 126} {"train_loss": -4.55881404876709, "global_step": 5299, "epoch": 126} {"train_loss": -4.625395774841309, "global_step": 5300, "epoch": 126} {"train_loss": -4.528830528259277, "global_step": 5301, "epoch": 126} {"train_loss": -4.567577362060547, "global_step": 5302, "epoch": 126} {"train_loss": -4.589581489562988, "global_step": 5303, "epoch": 126} {"train_loss": -4.675240516662598, "global_step": 5304, "epoch": 126} {"train_loss": -4.79007625579834, "global_step": 5305, "epoch": 126} {"train_loss": -4.59015417098999, "global_step": 5306, "epoch": 126} {"train_loss": -4.747465133666992, "global_step": 5307, "epoch": 126} {"train_loss": -4.709228515625, "global_step": 5308, "epoch": 126} {"train_loss": -4.438349723815918, "global_step": 5309, "epoch": 126} {"train_loss": -4.7303361892700195, "global_step": 5310, "epoch": 126} {"train_loss": -4.7565598487854, "global_step": 5311, "epoch": 126} {"train_loss": -4.324470520019531, "global_step": 5312, "epoch": 126} {"train_loss": -4.645445346832275, "global_step": 5313, "epoch": 126} {"train_loss": -4.414421081542969, "global_step": 5314, "epoch": 126} {"train_loss": -4.6711626052856445, "global_step": 5315, "epoch": 126} {"train_loss": -4.528651237487793, "global_step": 5316, "epoch": 126} {"train_loss": -4.405838966369629, "global_step": 5317, "epoch": 126} {"train_loss": -4.599908351898193, "global_step": 5318, "epoch": 126} {"train_loss": -4.470446586608887, "global_step": 5319, "epoch": 126} {"train_loss": -4.688107490539551, "global_step": 5320, "epoch": 126} {"train_loss": -4.522762298583984, "global_step": 5321, "epoch": 126} {"train_loss": -4.521152496337891, "global_step": 5322, "epoch": 126} {"train_loss": -4.765076637268066, "global_step": 5323, "epoch": 126} {"train_loss": -4.518704414367676, "global_step": 5324, "epoch": 126} {"train_loss": -4.648181915283203, "global_step": 5325, "epoch": 126} {"train_loss": -4.49166202545166, "global_step": 5326, "epoch": 126} {"train_loss": -4.673769474029541, "global_step": 5327, "epoch": 126} {"train_loss": -4.420288562774658, "global_step": 5328, "epoch": 126} {"train_loss": -4.709112167358398, "global_step": 5329, "epoch": 126} {"train_loss": -4.531271934509277, "global_step": 5330, "epoch": 126} {"train_loss": -4.397400856018066, "global_step": 5331, "epoch": 126} {"train_loss": -4.7088942527771, "global_step": 5332, "epoch": 126} {"train_loss": -4.6072413467225575, "global_step": 5333, "epoch": 126, "val_loss": 98030.90625} {"train_loss": -4.589112281799316, "global_step": 5334, "epoch": 127} {"train_loss": -4.652139186859131, "global_step": 5335, "epoch": 127} {"train_loss": -4.787852764129639, "global_step": 5336, "epoch": 127} {"train_loss": -4.533885955810547, "global_step": 5337, "epoch": 127} {"train_loss": -4.523657321929932, "global_step": 5338, "epoch": 127} {"train_loss": -4.621551036834717, "global_step": 5339, "epoch": 127} {"train_loss": -4.4538774490356445, "global_step": 5340, "epoch": 127} {"train_loss": -4.621665954589844, "global_step": 5341, "epoch": 127} {"train_loss": -4.748880386352539, "global_step": 5342, "epoch": 127} {"train_loss": -4.509759902954102, "global_step": 5343, "epoch": 127} {"train_loss": -4.700298309326172, "global_step": 5344, "epoch": 127} {"train_loss": -4.579068183898926, "global_step": 5345, "epoch": 127} {"train_loss": -4.783231258392334, "global_step": 5346, "epoch": 127} {"train_loss": -4.982654094696045, "global_step": 5347, "epoch": 127} {"train_loss": -4.606393337249756, "global_step": 5348, "epoch": 127} {"train_loss": -4.753398895263672, "global_step": 5349, "epoch": 127} {"train_loss": -4.791538238525391, "global_step": 5350, "epoch": 127} {"train_loss": -4.626791954040527, "global_step": 5351, "epoch": 127} {"train_loss": -4.74537992477417, "global_step": 5352, "epoch": 127} {"train_loss": -4.746410369873047, "global_step": 5353, "epoch": 127} {"train_loss": -4.852948188781738, "global_step": 5354, "epoch": 127} {"train_loss": -4.619620323181152, "global_step": 5355, "epoch": 127} {"train_loss": -4.864386558532715, "global_step": 5356, "epoch": 127} {"train_loss": -4.6533708572387695, "global_step": 5357, "epoch": 127} {"train_loss": -4.791461944580078, "global_step": 5358, "epoch": 127} {"train_loss": -4.753512382507324, "global_step": 5359, "epoch": 127} {"train_loss": -4.7745208740234375, "global_step": 5360, "epoch": 127} {"train_loss": -4.605461120605469, "global_step": 5361, "epoch": 127} {"train_loss": -4.740060329437256, "global_step": 5362, "epoch": 127} {"train_loss": -4.748020172119141, "global_step": 5363, "epoch": 127} {"train_loss": -4.69760799407959, "global_step": 5364, "epoch": 127} {"train_loss": -4.61555290222168, "global_step": 5365, "epoch": 127} {"train_loss": -4.73293399810791, "global_step": 5366, "epoch": 127} {"train_loss": -4.635788917541504, "global_step": 5367, "epoch": 127} {"train_loss": -4.650056838989258, "global_step": 5368, "epoch": 127} {"train_loss": -4.6685333251953125, "global_step": 5369, "epoch": 127} {"train_loss": -4.719067573547363, "global_step": 5370, "epoch": 127} {"train_loss": -4.572871208190918, "global_step": 5371, "epoch": 127} {"train_loss": -4.723862648010254, "global_step": 5372, "epoch": 127} {"train_loss": -4.602188587188721, "global_step": 5373, "epoch": 127} {"train_loss": -4.340981483459473, "global_step": 5374, "epoch": 127} {"train_loss": -4.676641657238915, "global_step": 5375, "epoch": 127, "val_loss": 100836.7265625} {"train_loss": -4.575660705566406, "global_step": 5376, "epoch": 128} {"train_loss": -4.371204376220703, "global_step": 5377, "epoch": 128} {"train_loss": -4.505602836608887, "global_step": 5378, "epoch": 128} {"train_loss": -4.441814422607422, "global_step": 5379, "epoch": 128} {"train_loss": -4.704339027404785, "global_step": 5380, "epoch": 128} {"train_loss": -4.775036811828613, "global_step": 5381, "epoch": 128} {"train_loss": -4.523439407348633, "global_step": 5382, "epoch": 128} {"train_loss": -4.53844690322876, "global_step": 5383, "epoch": 128} {"train_loss": -4.654594421386719, "global_step": 5384, "epoch": 128} {"train_loss": -4.524755954742432, "global_step": 5385, "epoch": 128} {"train_loss": -4.588626384735107, "global_step": 5386, "epoch": 128} {"train_loss": -4.308282852172852, "global_step": 5387, "epoch": 128} {"train_loss": -4.566936492919922, "global_step": 5388, "epoch": 128} {"train_loss": -4.354334831237793, "global_step": 5389, "epoch": 128} {"train_loss": -4.39717960357666, "global_step": 5390, "epoch": 128} {"train_loss": -4.551971435546875, "global_step": 5391, "epoch": 128} {"train_loss": -4.546886444091797, "global_step": 5392, "epoch": 128} {"train_loss": -4.677004814147949, "global_step": 5393, "epoch": 128} {"train_loss": -4.579562664031982, "global_step": 5394, "epoch": 128} {"train_loss": -4.350671768188477, "global_step": 5395, "epoch": 128} {"train_loss": -4.679935455322266, "global_step": 5396, "epoch": 128} {"train_loss": -4.691779136657715, "global_step": 5397, "epoch": 128} {"train_loss": -4.645988464355469, "global_step": 5398, "epoch": 128} {"train_loss": -4.67559814453125, "global_step": 5399, "epoch": 128} {"train_loss": -4.7686448097229, "global_step": 5400, "epoch": 128} {"train_loss": -4.729095458984375, "global_step": 5401, "epoch": 128} {"train_loss": -4.700998306274414, "global_step": 5402, "epoch": 128} {"train_loss": -4.726109504699707, "global_step": 5403, "epoch": 128} {"train_loss": -4.714042663574219, "global_step": 5404, "epoch": 128} {"train_loss": -4.857358932495117, "global_step": 5405, "epoch": 128} {"train_loss": -4.777163982391357, "global_step": 5406, "epoch": 128} {"train_loss": -4.570261001586914, "global_step": 5407, "epoch": 128} {"train_loss": -4.723917007446289, "global_step": 5408, "epoch": 128} {"train_loss": -4.747873306274414, "global_step": 5409, "epoch": 128} {"train_loss": -4.579967975616455, "global_step": 5410, "epoch": 128} {"train_loss": -4.8120574951171875, "global_step": 5411, "epoch": 128} {"train_loss": -4.688708305358887, "global_step": 5412, "epoch": 128} {"train_loss": -4.702576637268066, "global_step": 5413, "epoch": 128} {"train_loss": -4.736823558807373, "global_step": 5414, "epoch": 128} {"train_loss": -4.600223064422607, "global_step": 5415, "epoch": 128} {"train_loss": -4.77337646484375, "global_step": 5416, "epoch": 128} {"train_loss": -4.622869275865101, "global_step": 5417, "epoch": 128, "val_loss": 94952.3125} {"train_loss": -4.699081897735596, "global_step": 5418, "epoch": 129} {"train_loss": -4.625105381011963, "global_step": 5419, "epoch": 129} {"train_loss": -4.802452087402344, "global_step": 5420, "epoch": 129} {"train_loss": -4.709038734436035, "global_step": 5421, "epoch": 129} {"train_loss": -4.8143486976623535, "global_step": 5422, "epoch": 129} {"train_loss": -4.777396202087402, "global_step": 5423, "epoch": 129} {"train_loss": -4.788321495056152, "global_step": 5424, "epoch": 129} {"train_loss": -4.790706634521484, "global_step": 5425, "epoch": 129} {"train_loss": -4.656647682189941, "global_step": 5426, "epoch": 129} {"train_loss": -4.682304382324219, "global_step": 5427, "epoch": 129} {"train_loss": -4.509425163269043, "global_step": 5428, "epoch": 129} {"train_loss": -4.585965156555176, "global_step": 5429, "epoch": 129} {"train_loss": -4.68248176574707, "global_step": 5430, "epoch": 129} {"train_loss": -4.712279319763184, "global_step": 5431, "epoch": 129} {"train_loss": -4.585816383361816, "global_step": 5432, "epoch": 129} {"train_loss": -4.787915229797363, "global_step": 5433, "epoch": 129} {"train_loss": -4.634036064147949, "global_step": 5434, "epoch": 129} {"train_loss": -4.660750389099121, "global_step": 5435, "epoch": 129} {"train_loss": -4.670503616333008, "global_step": 5436, "epoch": 129} {"train_loss": -4.784265995025635, "global_step": 5437, "epoch": 129} {"train_loss": -4.549558639526367, "global_step": 5438, "epoch": 129} {"train_loss": -4.781317234039307, "global_step": 5439, "epoch": 129} {"train_loss": -4.754280090332031, "global_step": 5440, "epoch": 129} {"train_loss": -4.755776405334473, "global_step": 5441, "epoch": 129} {"train_loss": -4.641228675842285, "global_step": 5442, "epoch": 129} {"train_loss": -4.665727138519287, "global_step": 5443, "epoch": 129} {"train_loss": -4.7686920166015625, "global_step": 5444, "epoch": 129} {"train_loss": -4.760601043701172, "global_step": 5445, "epoch": 129} {"train_loss": -4.760962009429932, "global_step": 5446, "epoch": 129} {"train_loss": -4.865629196166992, "global_step": 5447, "epoch": 129} {"train_loss": -4.729534149169922, "global_step": 5448, "epoch": 129} {"train_loss": -4.752021789550781, "global_step": 5449, "epoch": 129} {"train_loss": -4.775534152984619, "global_step": 5450, "epoch": 129} {"train_loss": -4.780035495758057, "global_step": 5451, "epoch": 129} {"train_loss": -4.660338401794434, "global_step": 5452, "epoch": 129} {"train_loss": -4.852359771728516, "global_step": 5453, "epoch": 129} {"train_loss": -4.642117500305176, "global_step": 5454, "epoch": 129} {"train_loss": -4.611237049102783, "global_step": 5455, "epoch": 129} {"train_loss": -4.674012184143066, "global_step": 5456, "epoch": 129} {"train_loss": -4.591004848480225, "global_step": 5457, "epoch": 129} {"train_loss": -4.678508758544922, "global_step": 5458, "epoch": 129} {"train_loss": -4.7070787861233665, "global_step": 5459, "epoch": 129, "val_loss": 95724.578125} {"train_loss": -4.888062953948975, "global_step": 5460, "epoch": 130} {"train_loss": -4.7302775382995605, "global_step": 5461, "epoch": 130} {"train_loss": -4.853442192077637, "global_step": 5462, "epoch": 130} {"train_loss": -4.656669616699219, "global_step": 5463, "epoch": 130} {"train_loss": -4.624806880950928, "global_step": 5464, "epoch": 130} {"train_loss": -4.805254936218262, "global_step": 5465, "epoch": 130} {"train_loss": -4.717495918273926, "global_step": 5466, "epoch": 130} {"train_loss": -4.696533679962158, "global_step": 5467, "epoch": 130} {"train_loss": -4.714143753051758, "global_step": 5468, "epoch": 130} {"train_loss": -4.78422737121582, "global_step": 5469, "epoch": 130} {"train_loss": -4.723520755767822, "global_step": 5470, "epoch": 130} {"train_loss": -4.804533004760742, "global_step": 5471, "epoch": 130} {"train_loss": -4.835733890533447, "global_step": 5472, "epoch": 130} {"train_loss": -4.761406898498535, "global_step": 5473, "epoch": 130} {"train_loss": -4.71729040145874, "global_step": 5474, "epoch": 130} {"train_loss": -4.749593734741211, "global_step": 5475, "epoch": 130} {"train_loss": -4.761144638061523, "global_step": 5476, "epoch": 130} {"train_loss": -4.55345344543457, "global_step": 5477, "epoch": 130} {"train_loss": -4.679121494293213, "global_step": 5478, "epoch": 130} {"train_loss": -4.697934150695801, "global_step": 5479, "epoch": 130} {"train_loss": -4.666579246520996, "global_step": 5480, "epoch": 130} {"train_loss": -4.762616157531738, "global_step": 5481, "epoch": 130} {"train_loss": -4.760164260864258, "global_step": 5482, "epoch": 130} {"train_loss": -4.6863508224487305, "global_step": 5483, "epoch": 130} {"train_loss": -4.738238334655762, "global_step": 5484, "epoch": 130} {"train_loss": -4.6699748039245605, "global_step": 5485, "epoch": 130} {"train_loss": -4.595330238342285, "global_step": 5486, "epoch": 130} {"train_loss": -4.8132524490356445, "global_step": 5487, "epoch": 130} {"train_loss": -4.697063446044922, "global_step": 5488, "epoch": 130} {"train_loss": -4.579742431640625, "global_step": 5489, "epoch": 130} {"train_loss": -4.886169910430908, "global_step": 5490, "epoch": 130} {"train_loss": -4.714722156524658, "global_step": 5491, "epoch": 130} {"train_loss": -4.46976375579834, "global_step": 5492, "epoch": 130} {"train_loss": -4.654478073120117, "global_step": 5493, "epoch": 130} {"train_loss": -4.441020965576172, "global_step": 5494, "epoch": 130} {"train_loss": -4.514452934265137, "global_step": 5495, "epoch": 130} {"train_loss": -4.795276165008545, "global_step": 5496, "epoch": 130} {"train_loss": -4.442743301391602, "global_step": 5497, "epoch": 130} {"train_loss": -4.458475112915039, "global_step": 5498, "epoch": 130} {"train_loss": -4.655880928039551, "global_step": 5499, "epoch": 130} {"train_loss": -4.712427139282227, "global_step": 5500, "epoch": 130} {"train_loss": -4.694545882088797, "global_step": 5501, "epoch": 130, "val_loss": 94221.546875} {"train_loss": -4.760300636291504, "global_step": 5502, "epoch": 131} {"train_loss": -4.740495681762695, "global_step": 5503, "epoch": 131} {"train_loss": -4.835299491882324, "global_step": 5504, "epoch": 131} {"train_loss": -4.655686855316162, "global_step": 5505, "epoch": 131} {"train_loss": -4.77042293548584, "global_step": 5506, "epoch": 131} {"train_loss": -4.636395454406738, "global_step": 5507, "epoch": 131} {"train_loss": -4.443422317504883, "global_step": 5508, "epoch": 131} {"train_loss": -4.591869354248047, "global_step": 5509, "epoch": 131} {"train_loss": -4.793193340301514, "global_step": 5510, "epoch": 131} {"train_loss": -4.737395286560059, "global_step": 5511, "epoch": 131} {"train_loss": -4.854454040527344, "global_step": 5512, "epoch": 131} {"train_loss": -4.718311309814453, "global_step": 5513, "epoch": 131} {"train_loss": -4.667665481567383, "global_step": 5514, "epoch": 131} {"train_loss": -4.712030410766602, "global_step": 5515, "epoch": 131} {"train_loss": -4.79449462890625, "global_step": 5516, "epoch": 131} {"train_loss": -4.690699100494385, "global_step": 5517, "epoch": 131} {"train_loss": -4.60158109664917, "global_step": 5518, "epoch": 131} {"train_loss": -4.697251319885254, "global_step": 5519, "epoch": 131} {"train_loss": -4.615261554718018, "global_step": 5520, "epoch": 131} {"train_loss": -4.816000461578369, "global_step": 5521, "epoch": 131} {"train_loss": -4.680912017822266, "global_step": 5522, "epoch": 131} {"train_loss": -4.840391159057617, "global_step": 5523, "epoch": 131} {"train_loss": -4.900475025177002, "global_step": 5524, "epoch": 131} {"train_loss": -4.78240966796875, "global_step": 5525, "epoch": 131} {"train_loss": -4.889372825622559, "global_step": 5526, "epoch": 131} {"train_loss": -4.742776870727539, "global_step": 5527, "epoch": 131} {"train_loss": -4.6575927734375, "global_step": 5528, "epoch": 131} {"train_loss": -4.6451735496521, "global_step": 5529, "epoch": 131} {"train_loss": -4.795886516571045, "global_step": 5530, "epoch": 131} {"train_loss": -4.828535079956055, "global_step": 5531, "epoch": 131} {"train_loss": -4.585247993469238, "global_step": 5532, "epoch": 131} {"train_loss": -4.708143711090088, "global_step": 5533, "epoch": 131} {"train_loss": -4.694911003112793, "global_step": 5534, "epoch": 131} {"train_loss": -4.7969207763671875, "global_step": 5535, "epoch": 131} {"train_loss": -4.820752143859863, "global_step": 5536, "epoch": 131} {"train_loss": -4.659933090209961, "global_step": 5537, "epoch": 131} {"train_loss": -4.665078163146973, "global_step": 5538, "epoch": 131} {"train_loss": -4.660032749176025, "global_step": 5539, "epoch": 131} {"train_loss": -4.760870933532715, "global_step": 5540, "epoch": 131} {"train_loss": -4.732366561889648, "global_step": 5541, "epoch": 131} {"train_loss": -4.663565635681152, "global_step": 5542, "epoch": 131} {"train_loss": -4.719688540413266, "global_step": 5543, "epoch": 131, "val_loss": 95909.6953125} {"train_loss": -4.5353593826293945, "global_step": 5544, "epoch": 132} {"train_loss": -4.644140243530273, "global_step": 5545, "epoch": 132} {"train_loss": -4.658205032348633, "global_step": 5546, "epoch": 132} {"train_loss": -4.597792148590088, "global_step": 5547, "epoch": 132} {"train_loss": -4.677228927612305, "global_step": 5548, "epoch": 132} {"train_loss": -4.564225196838379, "global_step": 5549, "epoch": 132} {"train_loss": -4.659864902496338, "global_step": 5550, "epoch": 132} {"train_loss": -4.7974443435668945, "global_step": 5551, "epoch": 132} {"train_loss": -4.623468399047852, "global_step": 5552, "epoch": 132} {"train_loss": -4.6526288986206055, "global_step": 5553, "epoch": 132} {"train_loss": -4.740720748901367, "global_step": 5554, "epoch": 132} {"train_loss": -4.6077141761779785, "global_step": 5555, "epoch": 132} {"train_loss": -4.638202667236328, "global_step": 5556, "epoch": 132} {"train_loss": -4.708766937255859, "global_step": 5557, "epoch": 132} {"train_loss": -4.729621410369873, "global_step": 5558, "epoch": 132} {"train_loss": -4.489657402038574, "global_step": 5559, "epoch": 132} {"train_loss": -4.683374881744385, "global_step": 5560, "epoch": 132} {"train_loss": -4.766260147094727, "global_step": 5561, "epoch": 132} {"train_loss": -4.783871650695801, "global_step": 5562, "epoch": 132} {"train_loss": -4.824305534362793, "global_step": 5563, "epoch": 132} {"train_loss": -4.655252933502197, "global_step": 5564, "epoch": 132} {"train_loss": -4.7532958984375, "global_step": 5565, "epoch": 132} {"train_loss": -4.778252601623535, "global_step": 5566, "epoch": 132} {"train_loss": -4.739603042602539, "global_step": 5567, "epoch": 132} {"train_loss": -4.940068244934082, "global_step": 5568, "epoch": 132} {"train_loss": -4.786951541900635, "global_step": 5569, "epoch": 132} {"train_loss": -4.758378028869629, "global_step": 5570, "epoch": 132} {"train_loss": -4.867038726806641, "global_step": 5571, "epoch": 132} {"train_loss": -4.811812400817871, "global_step": 5572, "epoch": 132} {"train_loss": -4.607732772827148, "global_step": 5573, "epoch": 132} {"train_loss": -4.668226718902588, "global_step": 5574, "epoch": 132} {"train_loss": -4.743104934692383, "global_step": 5575, "epoch": 132} {"train_loss": -4.929286003112793, "global_step": 5576, "epoch": 132} {"train_loss": -4.672508716583252, "global_step": 5577, "epoch": 132} {"train_loss": -4.704930305480957, "global_step": 5578, "epoch": 132} {"train_loss": -4.974881172180176, "global_step": 5579, "epoch": 132} {"train_loss": -4.640849590301514, "global_step": 5580, "epoch": 132} {"train_loss": -4.493183135986328, "global_step": 5581, "epoch": 132} {"train_loss": -4.811881065368652, "global_step": 5582, "epoch": 132} {"train_loss": -4.423609256744385, "global_step": 5583, "epoch": 132} {"train_loss": -4.661251068115234, "global_step": 5584, "epoch": 132} {"train_loss": -4.705527941385905, "global_step": 5585, "epoch": 132, "val_loss": 97708.3046875} {"train_loss": -4.567286968231201, "global_step": 5586, "epoch": 133} {"train_loss": -4.792647361755371, "global_step": 5587, "epoch": 133} {"train_loss": -4.85058069229126, "global_step": 5588, "epoch": 133} {"train_loss": -4.823557376861572, "global_step": 5589, "epoch": 133} {"train_loss": -4.674267292022705, "global_step": 5590, "epoch": 133} {"train_loss": -4.815512657165527, "global_step": 5591, "epoch": 133} {"train_loss": -4.80648136138916, "global_step": 5592, "epoch": 133} {"train_loss": -4.7706193923950195, "global_step": 5593, "epoch": 133} {"train_loss": -4.606576919555664, "global_step": 5594, "epoch": 133} {"train_loss": -4.680905342102051, "global_step": 5595, "epoch": 133} {"train_loss": -4.853020668029785, "global_step": 5596, "epoch": 133} {"train_loss": -4.817105293273926, "global_step": 5597, "epoch": 133} {"train_loss": -4.6670613288879395, "global_step": 5598, "epoch": 133} {"train_loss": -4.756265640258789, "global_step": 5599, "epoch": 133} {"train_loss": -4.9013566970825195, "global_step": 5600, "epoch": 133} {"train_loss": -4.8662919998168945, "global_step": 5601, "epoch": 133} {"train_loss": -4.619523525238037, "global_step": 5602, "epoch": 133} {"train_loss": -4.680927276611328, "global_step": 5603, "epoch": 133} {"train_loss": -4.7158966064453125, "global_step": 5604, "epoch": 133} {"train_loss": -4.722844123840332, "global_step": 5605, "epoch": 133} {"train_loss": -4.794806957244873, "global_step": 5606, "epoch": 133} {"train_loss": -4.684398651123047, "global_step": 5607, "epoch": 133} {"train_loss": -4.76093864440918, "global_step": 5608, "epoch": 133} {"train_loss": -4.513188362121582, "global_step": 5609, "epoch": 133} {"train_loss": -4.762567520141602, "global_step": 5610, "epoch": 133} {"train_loss": -4.7323784828186035, "global_step": 5611, "epoch": 133} {"train_loss": -4.499741077423096, "global_step": 5612, "epoch": 133} {"train_loss": -4.596164703369141, "global_step": 5613, "epoch": 133} {"train_loss": -4.714463233947754, "global_step": 5614, "epoch": 133} {"train_loss": -4.717124938964844, "global_step": 5615, "epoch": 133} {"train_loss": -4.744311332702637, "global_step": 5616, "epoch": 133} {"train_loss": -4.797743797302246, "global_step": 5617, "epoch": 133} {"train_loss": -4.72288703918457, "global_step": 5618, "epoch": 133} {"train_loss": -4.828990936279297, "global_step": 5619, "epoch": 133} {"train_loss": -4.729956150054932, "global_step": 5620, "epoch": 133} {"train_loss": -4.4713263511657715, "global_step": 5621, "epoch": 133} {"train_loss": -4.764817714691162, "global_step": 5622, "epoch": 133} {"train_loss": -4.764920234680176, "global_step": 5623, "epoch": 133} {"train_loss": -4.649355411529541, "global_step": 5624, "epoch": 133} {"train_loss": -4.489457130432129, "global_step": 5625, "epoch": 133} {"train_loss": -4.665223121643066, "global_step": 5626, "epoch": 133} {"train_loss": -4.710177455629621, "global_step": 5627, "epoch": 133, "val_loss": 96296.1875} {"train_loss": -4.528564929962158, "global_step": 5628, "epoch": 134} {"train_loss": -4.7369704246521, "global_step": 5629, "epoch": 134} {"train_loss": -4.488356113433838, "global_step": 5630, "epoch": 134} {"train_loss": -4.6575608253479, "global_step": 5631, "epoch": 134} {"train_loss": -4.562393665313721, "global_step": 5632, "epoch": 134} {"train_loss": -4.645120620727539, "global_step": 5633, "epoch": 134} {"train_loss": -4.6864423751831055, "global_step": 5634, "epoch": 134} {"train_loss": -4.722532272338867, "global_step": 5635, "epoch": 134} {"train_loss": -4.716794490814209, "global_step": 5636, "epoch": 134} {"train_loss": -4.794798851013184, "global_step": 5637, "epoch": 134} {"train_loss": -4.615078449249268, "global_step": 5638, "epoch": 134} {"train_loss": -4.795267105102539, "global_step": 5639, "epoch": 134} {"train_loss": -4.539137840270996, "global_step": 5640, "epoch": 134} {"train_loss": -4.8824334144592285, "global_step": 5641, "epoch": 134} {"train_loss": -4.684144020080566, "global_step": 5642, "epoch": 134} {"train_loss": -4.765567779541016, "global_step": 5643, "epoch": 134} {"train_loss": -4.700364112854004, "global_step": 5644, "epoch": 134} {"train_loss": -4.672016143798828, "global_step": 5645, "epoch": 134} {"train_loss": -4.79411506652832, "global_step": 5646, "epoch": 134} {"train_loss": -4.782698154449463, "global_step": 5647, "epoch": 134} {"train_loss": -4.847588539123535, "global_step": 5648, "epoch": 134} {"train_loss": -4.670475959777832, "global_step": 5649, "epoch": 134} {"train_loss": -4.856858253479004, "global_step": 5650, "epoch": 134} {"train_loss": -4.868346691131592, "global_step": 5651, "epoch": 134} {"train_loss": -4.701324939727783, "global_step": 5652, "epoch": 134} {"train_loss": -4.765260696411133, "global_step": 5653, "epoch": 134} {"train_loss": -4.815478324890137, "global_step": 5654, "epoch": 134} {"train_loss": -4.813932418823242, "global_step": 5655, "epoch": 134} {"train_loss": -4.768600940704346, "global_step": 5656, "epoch": 134} {"train_loss": -4.71530294418335, "global_step": 5657, "epoch": 134} {"train_loss": -4.743446350097656, "global_step": 5658, "epoch": 134} {"train_loss": -4.760895729064941, "global_step": 5659, "epoch": 134} {"train_loss": -4.82249641418457, "global_step": 5660, "epoch": 134} {"train_loss": -4.693758010864258, "global_step": 5661, "epoch": 134} {"train_loss": -4.86832857131958, "global_step": 5662, "epoch": 134} {"train_loss": -4.682425498962402, "global_step": 5663, "epoch": 134} {"train_loss": -4.597738742828369, "global_step": 5664, "epoch": 134} {"train_loss": -4.848423004150391, "global_step": 5665, "epoch": 134} {"train_loss": -4.859697341918945, "global_step": 5666, "epoch": 134} {"train_loss": -4.788569450378418, "global_step": 5667, "epoch": 134} {"train_loss": -4.759732246398926, "global_step": 5668, "epoch": 134} {"train_loss": -4.731238092694964, "global_step": 5669, "epoch": 134, "val_loss": 93677.0859375} {"train_loss": -4.900750160217285, "global_step": 5670, "epoch": 135} {"train_loss": -4.628196716308594, "global_step": 5671, "epoch": 135} {"train_loss": -4.567013263702393, "global_step": 5672, "epoch": 135} {"train_loss": -4.832792282104492, "global_step": 5673, "epoch": 135} {"train_loss": -4.96701717376709, "global_step": 5674, "epoch": 135} {"train_loss": -4.578076362609863, "global_step": 5675, "epoch": 135} {"train_loss": -4.546278953552246, "global_step": 5676, "epoch": 135} {"train_loss": -4.77280855178833, "global_step": 5677, "epoch": 135} {"train_loss": -4.6958160400390625, "global_step": 5678, "epoch": 135} {"train_loss": -4.566354751586914, "global_step": 5679, "epoch": 135} {"train_loss": -4.789796829223633, "global_step": 5680, "epoch": 135} {"train_loss": -4.890557765960693, "global_step": 5681, "epoch": 135} {"train_loss": -4.599585056304932, "global_step": 5682, "epoch": 135} {"train_loss": -4.593099117279053, "global_step": 5683, "epoch": 135} {"train_loss": -4.840154647827148, "global_step": 5684, "epoch": 135} {"train_loss": -4.69146728515625, "global_step": 5685, "epoch": 135} {"train_loss": -4.685498237609863, "global_step": 5686, "epoch": 135} {"train_loss": -4.729319095611572, "global_step": 5687, "epoch": 135} {"train_loss": -4.787588119506836, "global_step": 5688, "epoch": 135} {"train_loss": -4.891721725463867, "global_step": 5689, "epoch": 135} {"train_loss": -4.77204704284668, "global_step": 5690, "epoch": 135} {"train_loss": -4.562060356140137, "global_step": 5691, "epoch": 135} {"train_loss": -4.804636001586914, "global_step": 5692, "epoch": 135} {"train_loss": -4.723552227020264, "global_step": 5693, "epoch": 135} {"train_loss": -4.704600811004639, "global_step": 5694, "epoch": 135} {"train_loss": -4.54893684387207, "global_step": 5695, "epoch": 135} {"train_loss": -4.413573265075684, "global_step": 5696, "epoch": 135} {"train_loss": -4.716922760009766, "global_step": 5697, "epoch": 135} {"train_loss": -4.706228256225586, "global_step": 5698, "epoch": 135} {"train_loss": -4.410453796386719, "global_step": 5699, "epoch": 135} {"train_loss": -4.671769142150879, "global_step": 5700, "epoch": 135} {"train_loss": -4.578927993774414, "global_step": 5701, "epoch": 135} {"train_loss": -4.768329620361328, "global_step": 5702, "epoch": 135} {"train_loss": -4.8190155029296875, "global_step": 5703, "epoch": 135} {"train_loss": -4.6049041748046875, "global_step": 5704, "epoch": 135} {"train_loss": -4.721990585327148, "global_step": 5705, "epoch": 135} {"train_loss": -4.744901657104492, "global_step": 5706, "epoch": 135} {"train_loss": -4.775808334350586, "global_step": 5707, "epoch": 135} {"train_loss": -4.685120105743408, "global_step": 5708, "epoch": 135} {"train_loss": -4.677883625030518, "global_step": 5709, "epoch": 135} {"train_loss": -4.831804275512695, "global_step": 5710, "epoch": 135} {"train_loss": -4.701740151359921, "global_step": 5711, "epoch": 135, "val_loss": 93819.921875} {"train_loss": -4.79155158996582, "global_step": 5712, "epoch": 136} {"train_loss": -4.6987152099609375, "global_step": 5713, "epoch": 136} {"train_loss": -4.771228790283203, "global_step": 5714, "epoch": 136} {"train_loss": -4.790355682373047, "global_step": 5715, "epoch": 136} {"train_loss": -4.7080230712890625, "global_step": 5716, "epoch": 136} {"train_loss": -4.664172172546387, "global_step": 5717, "epoch": 136} {"train_loss": -4.807824611663818, "global_step": 5718, "epoch": 136} {"train_loss": -4.624279499053955, "global_step": 5719, "epoch": 136} {"train_loss": -4.854901313781738, "global_step": 5720, "epoch": 136} {"train_loss": -4.680878162384033, "global_step": 5721, "epoch": 136} {"train_loss": -4.692544460296631, "global_step": 5722, "epoch": 136} {"train_loss": -4.70229959487915, "global_step": 5723, "epoch": 136} {"train_loss": -4.642438888549805, "global_step": 5724, "epoch": 136} {"train_loss": -4.702364921569824, "global_step": 5725, "epoch": 136} {"train_loss": -4.730432987213135, "global_step": 5726, "epoch": 136} {"train_loss": -4.683358192443848, "global_step": 5727, "epoch": 136} {"train_loss": -4.8845062255859375, "global_step": 5728, "epoch": 136} {"train_loss": -4.785170555114746, "global_step": 5729, "epoch": 136} {"train_loss": -4.682677745819092, "global_step": 5730, "epoch": 136} {"train_loss": -4.832426071166992, "global_step": 5731, "epoch": 136} {"train_loss": -4.758241176605225, "global_step": 5732, "epoch": 136} {"train_loss": -4.6957831382751465, "global_step": 5733, "epoch": 136} {"train_loss": -4.631901741027832, "global_step": 5734, "epoch": 136} {"train_loss": -4.821521759033203, "global_step": 5735, "epoch": 136} {"train_loss": -4.806326866149902, "global_step": 5736, "epoch": 136} {"train_loss": -4.632652282714844, "global_step": 5737, "epoch": 136} {"train_loss": -4.68945837020874, "global_step": 5738, "epoch": 136} {"train_loss": -4.861440658569336, "global_step": 5739, "epoch": 136} {"train_loss": -4.621768474578857, "global_step": 5740, "epoch": 136} {"train_loss": -4.791882514953613, "global_step": 5741, "epoch": 136} {"train_loss": -4.78098726272583, "global_step": 5742, "epoch": 136} {"train_loss": -4.868203163146973, "global_step": 5743, "epoch": 136} {"train_loss": -4.713918685913086, "global_step": 5744, "epoch": 136} {"train_loss": -4.658758163452148, "global_step": 5745, "epoch": 136} {"train_loss": -4.918249130249023, "global_step": 5746, "epoch": 136} {"train_loss": -4.622249603271484, "global_step": 5747, "epoch": 136} {"train_loss": -4.830531597137451, "global_step": 5748, "epoch": 136} {"train_loss": -4.657130241394043, "global_step": 5749, "epoch": 136} {"train_loss": -4.791729927062988, "global_step": 5750, "epoch": 136} {"train_loss": -4.82199764251709, "global_step": 5751, "epoch": 136} {"train_loss": -4.710611343383789, "global_step": 5752, "epoch": 136} {"train_loss": -4.74158805892581, "global_step": 5753, "epoch": 136, "val_loss": 94668.625} {"train_loss": -4.781499862670898, "global_step": 5754, "epoch": 137} {"train_loss": -4.7678656578063965, "global_step": 5755, "epoch": 137} {"train_loss": -4.843512058258057, "global_step": 5756, "epoch": 137} {"train_loss": -4.64137077331543, "global_step": 5757, "epoch": 137} {"train_loss": -4.676794052124023, "global_step": 5758, "epoch": 137} {"train_loss": -4.81691837310791, "global_step": 5759, "epoch": 137} {"train_loss": -4.724869728088379, "global_step": 5760, "epoch": 137} {"train_loss": -4.743448257446289, "global_step": 5761, "epoch": 137} {"train_loss": -4.77559757232666, "global_step": 5762, "epoch": 137} {"train_loss": -4.785772800445557, "global_step": 5763, "epoch": 137} {"train_loss": -4.328153133392334, "global_step": 5764, "epoch": 137} {"train_loss": -4.568216323852539, "global_step": 5765, "epoch": 137} {"train_loss": -4.714223861694336, "global_step": 5766, "epoch": 137} {"train_loss": -4.631115913391113, "global_step": 5767, "epoch": 137} {"train_loss": -4.5528459548950195, "global_step": 5768, "epoch": 137} {"train_loss": -4.859485149383545, "global_step": 5769, "epoch": 137} {"train_loss": -4.793665885925293, "global_step": 5770, "epoch": 137} {"train_loss": -4.548070907592773, "global_step": 5771, "epoch": 137} {"train_loss": -4.698577880859375, "global_step": 5772, "epoch": 137} {"train_loss": -4.873202800750732, "global_step": 5773, "epoch": 137} {"train_loss": -4.701207637786865, "global_step": 5774, "epoch": 137} {"train_loss": -4.671629905700684, "global_step": 5775, "epoch": 137} {"train_loss": -4.918617248535156, "global_step": 5776, "epoch": 137} {"train_loss": -4.696407318115234, "global_step": 5777, "epoch": 137} {"train_loss": -4.715458393096924, "global_step": 5778, "epoch": 137} {"train_loss": -4.810521602630615, "global_step": 5779, "epoch": 137} {"train_loss": -4.792222499847412, "global_step": 5780, "epoch": 137} {"train_loss": -4.8247456550598145, "global_step": 5781, "epoch": 137} {"train_loss": -4.733306884765625, "global_step": 5782, "epoch": 137} {"train_loss": -4.766458511352539, "global_step": 5783, "epoch": 137} {"train_loss": -4.934780120849609, "global_step": 5784, "epoch": 137} {"train_loss": -4.862959861755371, "global_step": 5785, "epoch": 137} {"train_loss": -4.9033074378967285, "global_step": 5786, "epoch": 137} {"train_loss": -4.850722312927246, "global_step": 5787, "epoch": 137} {"train_loss": -4.794206619262695, "global_step": 5788, "epoch": 137} {"train_loss": -4.669580936431885, "global_step": 5789, "epoch": 137} {"train_loss": -4.734127044677734, "global_step": 5790, "epoch": 137} {"train_loss": -4.866242408752441, "global_step": 5791, "epoch": 137} {"train_loss": -4.556057453155518, "global_step": 5792, "epoch": 137} {"train_loss": -4.919276237487793, "global_step": 5793, "epoch": 137} {"train_loss": -4.790299415588379, "global_step": 5794, "epoch": 137} {"train_loss": -4.7516686689286, "global_step": 5795, "epoch": 137, "val_loss": 94663.984375} {"train_loss": -4.715246200561523, "global_step": 5796, "epoch": 138} {"train_loss": -4.845810890197754, "global_step": 5797, "epoch": 138} {"train_loss": -4.949923992156982, "global_step": 5798, "epoch": 138} {"train_loss": -4.664196968078613, "global_step": 5799, "epoch": 138} {"train_loss": -4.870390892028809, "global_step": 5800, "epoch": 138} {"train_loss": -4.752778053283691, "global_step": 5801, "epoch": 138} {"train_loss": -4.630809783935547, "global_step": 5802, "epoch": 138} {"train_loss": -4.732049942016602, "global_step": 5803, "epoch": 138} {"train_loss": -4.878380298614502, "global_step": 5804, "epoch": 138} {"train_loss": -4.636582374572754, "global_step": 5805, "epoch": 138} {"train_loss": -4.659211158752441, "global_step": 5806, "epoch": 138} {"train_loss": -4.828670501708984, "global_step": 5807, "epoch": 138} {"train_loss": -4.636191368103027, "global_step": 5808, "epoch": 138} {"train_loss": -4.804558277130127, "global_step": 5809, "epoch": 138} {"train_loss": -4.596858024597168, "global_step": 5810, "epoch": 138} {"train_loss": -4.847890853881836, "global_step": 5811, "epoch": 138} {"train_loss": -4.731565952301025, "global_step": 5812, "epoch": 138} {"train_loss": -4.723584175109863, "global_step": 5813, "epoch": 138} {"train_loss": -4.752296447753906, "global_step": 5814, "epoch": 138} {"train_loss": -4.707403182983398, "global_step": 5815, "epoch": 138} {"train_loss": -4.765287399291992, "global_step": 5816, "epoch": 138} {"train_loss": -4.8301191329956055, "global_step": 5817, "epoch": 138} {"train_loss": -4.636197090148926, "global_step": 5818, "epoch": 138} {"train_loss": -4.753158092498779, "global_step": 5819, "epoch": 138} {"train_loss": -4.66850471496582, "global_step": 5820, "epoch": 138} {"train_loss": -4.570759296417236, "global_step": 5821, "epoch": 138} {"train_loss": -4.780910491943359, "global_step": 5822, "epoch": 138} {"train_loss": -4.648639678955078, "global_step": 5823, "epoch": 138} {"train_loss": -4.595366477966309, "global_step": 5824, "epoch": 138} {"train_loss": -4.745843410491943, "global_step": 5825, "epoch": 138} {"train_loss": -4.810080051422119, "global_step": 5826, "epoch": 138} {"train_loss": -4.686100959777832, "global_step": 5827, "epoch": 138} {"train_loss": -4.779301643371582, "global_step": 5828, "epoch": 138} {"train_loss": -4.71893310546875, "global_step": 5829, "epoch": 138} {"train_loss": -4.652345180511475, "global_step": 5830, "epoch": 138} {"train_loss": -4.881710052490234, "global_step": 5831, "epoch": 138} {"train_loss": -4.802393436431885, "global_step": 5832, "epoch": 138} {"train_loss": -4.786473274230957, "global_step": 5833, "epoch": 138} {"train_loss": -4.870308876037598, "global_step": 5834, "epoch": 138} {"train_loss": -4.905097007751465, "global_step": 5835, "epoch": 138} {"train_loss": -4.730754852294922, "global_step": 5836, "epoch": 138} {"train_loss": -4.746606406711397, "global_step": 5837, "epoch": 138, "val_loss": 91963.96875} {"train_loss": -4.790384769439697, "global_step": 5838, "epoch": 139} {"train_loss": -4.703363418579102, "global_step": 5839, "epoch": 139} {"train_loss": -4.879828929901123, "global_step": 5840, "epoch": 139} {"train_loss": -4.78851842880249, "global_step": 5841, "epoch": 139} {"train_loss": -4.814657211303711, "global_step": 5842, "epoch": 139} {"train_loss": -4.635192394256592, "global_step": 5843, "epoch": 139} {"train_loss": -4.811130523681641, "global_step": 5844, "epoch": 139} {"train_loss": -4.866558074951172, "global_step": 5845, "epoch": 139} {"train_loss": -4.672062873840332, "global_step": 5846, "epoch": 139} {"train_loss": -4.882992744445801, "global_step": 5847, "epoch": 139} {"train_loss": -4.907436370849609, "global_step": 5848, "epoch": 139} {"train_loss": -4.887772560119629, "global_step": 5849, "epoch": 139} {"train_loss": -4.745847702026367, "global_step": 5850, "epoch": 139} {"train_loss": -4.719138145446777, "global_step": 5851, "epoch": 139} {"train_loss": -4.882168769836426, "global_step": 5852, "epoch": 139} {"train_loss": -4.7111124992370605, "global_step": 5853, "epoch": 139} {"train_loss": -4.815560340881348, "global_step": 5854, "epoch": 139} {"train_loss": -4.831205368041992, "global_step": 5855, "epoch": 139} {"train_loss": -4.974343299865723, "global_step": 5856, "epoch": 139} {"train_loss": -4.810348987579346, "global_step": 5857, "epoch": 139} {"train_loss": -4.834754943847656, "global_step": 5858, "epoch": 139} {"train_loss": -4.910795211791992, "global_step": 5859, "epoch": 139} {"train_loss": -4.681789398193359, "global_step": 5860, "epoch": 139} {"train_loss": -4.574172019958496, "global_step": 5861, "epoch": 139} {"train_loss": -5.0378828048706055, "global_step": 5862, "epoch": 139} {"train_loss": -4.728514671325684, "global_step": 5863, "epoch": 139} {"train_loss": -4.570590972900391, "global_step": 5864, "epoch": 139} {"train_loss": -4.7109174728393555, "global_step": 5865, "epoch": 139} {"train_loss": -4.494399070739746, "global_step": 5866, "epoch": 139} {"train_loss": -4.6150665283203125, "global_step": 5867, "epoch": 139} {"train_loss": -4.662711143493652, "global_step": 5868, "epoch": 139} {"train_loss": -4.587191581726074, "global_step": 5869, "epoch": 139} {"train_loss": -4.718494892120361, "global_step": 5870, "epoch": 139} {"train_loss": -4.670780181884766, "global_step": 5871, "epoch": 139} {"train_loss": -4.810677528381348, "global_step": 5872, "epoch": 139} {"train_loss": -4.805103302001953, "global_step": 5873, "epoch": 139} {"train_loss": -4.735608100891113, "global_step": 5874, "epoch": 139} {"train_loss": -4.758513927459717, "global_step": 5875, "epoch": 139} {"train_loss": -4.844097137451172, "global_step": 5876, "epoch": 139} {"train_loss": -4.614749908447266, "global_step": 5877, "epoch": 139} {"train_loss": -4.914261341094971, "global_step": 5878, "epoch": 139} {"train_loss": -4.767349072865078, "global_step": 5879, "epoch": 139, "val_loss": 91558.9375} {"train_loss": -4.953746318817139, "global_step": 5880, "epoch": 140} {"train_loss": -4.8541951179504395, "global_step": 5881, "epoch": 140} {"train_loss": -4.735978603363037, "global_step": 5882, "epoch": 140} {"train_loss": -4.788980484008789, "global_step": 5883, "epoch": 140} {"train_loss": -4.799554824829102, "global_step": 5884, "epoch": 140} {"train_loss": -4.873191833496094, "global_step": 5885, "epoch": 140} {"train_loss": -4.82756233215332, "global_step": 5886, "epoch": 140} {"train_loss": -4.755303382873535, "global_step": 5887, "epoch": 140} {"train_loss": -4.761052131652832, "global_step": 5888, "epoch": 140} {"train_loss": -4.835412502288818, "global_step": 5889, "epoch": 140} {"train_loss": -4.84724235534668, "global_step": 5890, "epoch": 140} {"train_loss": -4.73450231552124, "global_step": 5891, "epoch": 140} {"train_loss": -4.799699306488037, "global_step": 5892, "epoch": 140} {"train_loss": -4.717386722564697, "global_step": 5893, "epoch": 140} {"train_loss": -4.875261306762695, "global_step": 5894, "epoch": 140} {"train_loss": -4.943977355957031, "global_step": 5895, "epoch": 140} {"train_loss": -4.803589820861816, "global_step": 5896, "epoch": 140} {"train_loss": -4.74739408493042, "global_step": 5897, "epoch": 140} {"train_loss": -4.773675918579102, "global_step": 5898, "epoch": 140} {"train_loss": -4.754759788513184, "global_step": 5899, "epoch": 140} {"train_loss": -4.761211395263672, "global_step": 5900, "epoch": 140} {"train_loss": -4.876324653625488, "global_step": 5901, "epoch": 140} {"train_loss": -4.825010776519775, "global_step": 5902, "epoch": 140} {"train_loss": -4.786948204040527, "global_step": 5903, "epoch": 140} {"train_loss": -4.7950310707092285, "global_step": 5904, "epoch": 140} {"train_loss": -4.823245048522949, "global_step": 5905, "epoch": 140} {"train_loss": -4.834245681762695, "global_step": 5906, "epoch": 140} {"train_loss": -4.820754051208496, "global_step": 5907, "epoch": 140} {"train_loss": -4.833518028259277, "global_step": 5908, "epoch": 140} {"train_loss": -4.880867958068848, "global_step": 5909, "epoch": 140} {"train_loss": -4.8409905433654785, "global_step": 5910, "epoch": 140} {"train_loss": -4.826807022094727, "global_step": 5911, "epoch": 140} {"train_loss": -4.777706146240234, "global_step": 5912, "epoch": 140} {"train_loss": -4.719947338104248, "global_step": 5913, "epoch": 140} {"train_loss": -4.890826225280762, "global_step": 5914, "epoch": 140} {"train_loss": -4.85395622253418, "global_step": 5915, "epoch": 140} {"train_loss": -4.66642951965332, "global_step": 5916, "epoch": 140} {"train_loss": -4.531839370727539, "global_step": 5917, "epoch": 140} {"train_loss": -4.84381103515625, "global_step": 5918, "epoch": 140} {"train_loss": -4.840307712554932, "global_step": 5919, "epoch": 140} {"train_loss": -4.556241035461426, "global_step": 5920, "epoch": 140} {"train_loss": -4.798569906325567, "global_step": 5921, "epoch": 140, "val_loss": 91419.09375} {"train_loss": -4.758333206176758, "global_step": 5922, "epoch": 141} {"train_loss": -4.5787787437438965, "global_step": 5923, "epoch": 141} {"train_loss": -4.672147750854492, "global_step": 5924, "epoch": 141} {"train_loss": -4.582876205444336, "global_step": 5925, "epoch": 141} {"train_loss": -4.719783782958984, "global_step": 5926, "epoch": 141} {"train_loss": -4.732847213745117, "global_step": 5927, "epoch": 141} {"train_loss": -4.774489402770996, "global_step": 5928, "epoch": 141} {"train_loss": -4.574994087219238, "global_step": 5929, "epoch": 141} {"train_loss": -4.7530341148376465, "global_step": 5930, "epoch": 141} {"train_loss": -4.86032247543335, "global_step": 5931, "epoch": 141} {"train_loss": -4.720682144165039, "global_step": 5932, "epoch": 141} {"train_loss": -4.821898460388184, "global_step": 5933, "epoch": 141} {"train_loss": -4.864078044891357, "global_step": 5934, "epoch": 141} {"train_loss": -4.851716995239258, "global_step": 5935, "epoch": 141} {"train_loss": -4.8494110107421875, "global_step": 5936, "epoch": 141} {"train_loss": -4.755020618438721, "global_step": 5937, "epoch": 141} {"train_loss": -4.700626373291016, "global_step": 5938, "epoch": 141} {"train_loss": -4.659224510192871, "global_step": 5939, "epoch": 141} {"train_loss": -4.892766952514648, "global_step": 5940, "epoch": 141} {"train_loss": -4.796677112579346, "global_step": 5941, "epoch": 141} {"train_loss": -4.808898448944092, "global_step": 5942, "epoch": 141} {"train_loss": -4.913424491882324, "global_step": 5943, "epoch": 141} {"train_loss": -4.855417251586914, "global_step": 5944, "epoch": 141} {"train_loss": -4.956001281738281, "global_step": 5945, "epoch": 141} {"train_loss": -4.920228958129883, "global_step": 5946, "epoch": 141} {"train_loss": -4.80800724029541, "global_step": 5947, "epoch": 141} {"train_loss": -4.855153560638428, "global_step": 5948, "epoch": 141} {"train_loss": -4.893736839294434, "global_step": 5949, "epoch": 141} {"train_loss": -4.863983154296875, "global_step": 5950, "epoch": 141} {"train_loss": -4.847053050994873, "global_step": 5951, "epoch": 141} {"train_loss": -4.7560625076293945, "global_step": 5952, "epoch": 141} {"train_loss": -4.914886474609375, "global_step": 5953, "epoch": 141} {"train_loss": -4.786982536315918, "global_step": 5954, "epoch": 141} {"train_loss": -4.878262519836426, "global_step": 5955, "epoch": 141} {"train_loss": -4.785299301147461, "global_step": 5956, "epoch": 141} {"train_loss": -4.658384323120117, "global_step": 5957, "epoch": 141} {"train_loss": -4.782238006591797, "global_step": 5958, "epoch": 141} {"train_loss": -4.854761600494385, "global_step": 5959, "epoch": 141} {"train_loss": -4.519848823547363, "global_step": 5960, "epoch": 141} {"train_loss": -4.499408721923828, "global_step": 5961, "epoch": 141} {"train_loss": -4.818393707275391, "global_step": 5962, "epoch": 141} {"train_loss": -4.778136730194092, "global_step": 5963, "epoch": 141, "val_loss": 92483.71875} {"train_loss": -4.589501857757568, "global_step": 5964, "epoch": 142} {"train_loss": -4.948921203613281, "global_step": 5965, "epoch": 142} {"train_loss": -4.8121724128723145, "global_step": 5966, "epoch": 142} {"train_loss": -4.794846534729004, "global_step": 5967, "epoch": 142} {"train_loss": -4.7503437995910645, "global_step": 5968, "epoch": 142} {"train_loss": -4.731043338775635, "global_step": 5969, "epoch": 142} {"train_loss": -4.698296070098877, "global_step": 5970, "epoch": 142} {"train_loss": -4.850603103637695, "global_step": 5971, "epoch": 142} {"train_loss": -4.950583457946777, "global_step": 5972, "epoch": 142} {"train_loss": -4.701407432556152, "global_step": 5973, "epoch": 142} {"train_loss": -4.72909688949585, "global_step": 5974, "epoch": 142} {"train_loss": -4.642199993133545, "global_step": 5975, "epoch": 142} {"train_loss": -4.958430767059326, "global_step": 5976, "epoch": 142} {"train_loss": -4.811010360717773, "global_step": 5977, "epoch": 142} {"train_loss": -4.712740421295166, "global_step": 5978, "epoch": 142} {"train_loss": -4.82832670211792, "global_step": 5979, "epoch": 142} {"train_loss": -4.763004302978516, "global_step": 5980, "epoch": 142} {"train_loss": -4.823040962219238, "global_step": 5981, "epoch": 142} {"train_loss": -4.702338218688965, "global_step": 5982, "epoch": 142} {"train_loss": -4.784563064575195, "global_step": 5983, "epoch": 142} {"train_loss": -4.846952438354492, "global_step": 5984, "epoch": 142} {"train_loss": -4.57902717590332, "global_step": 5985, "epoch": 142} {"train_loss": -4.753403186798096, "global_step": 5986, "epoch": 142} {"train_loss": -4.790640830993652, "global_step": 5987, "epoch": 142} {"train_loss": -4.872640609741211, "global_step": 5988, "epoch": 142} {"train_loss": -4.7984938621521, "global_step": 5989, "epoch": 142} {"train_loss": -4.864075183868408, "global_step": 5990, "epoch": 142} {"train_loss": -4.901895523071289, "global_step": 5991, "epoch": 142} {"train_loss": -4.847517967224121, "global_step": 5992, "epoch": 142} {"train_loss": -4.609947204589844, "global_step": 5993, "epoch": 142} {"train_loss": -4.70109224319458, "global_step": 5994, "epoch": 142} {"train_loss": -4.876097679138184, "global_step": 5995, "epoch": 142} {"train_loss": -4.829806327819824, "global_step": 5996, "epoch": 142} {"train_loss": -4.781249523162842, "global_step": 5997, "epoch": 142} {"train_loss": -4.85868501663208, "global_step": 5998, "epoch": 142} {"train_loss": -4.819331169128418, "global_step": 5999, "epoch": 142} {"train_loss": -4.967606067657471, "global_step": 6000, "epoch": 142} {"train_loss": -4.836367607116699, "global_step": 6001, "epoch": 142} {"train_loss": -4.823489189147949, "global_step": 6002, "epoch": 142} {"train_loss": -4.815489768981934, "global_step": 6003, "epoch": 142} {"train_loss": -4.649073600769043, "global_step": 6004, "epoch": 142} {"train_loss": -4.790664525259109, "global_step": 6005, "epoch": 142, "val_loss": 90918.6484375} {"train_loss": -4.855172157287598, "global_step": 6006, "epoch": 143} {"train_loss": -4.931004524230957, "global_step": 6007, "epoch": 143} {"train_loss": -4.703936576843262, "global_step": 6008, "epoch": 143} {"train_loss": -4.768009185791016, "global_step": 6009, "epoch": 143} {"train_loss": -4.854564189910889, "global_step": 6010, "epoch": 143} {"train_loss": -4.886270523071289, "global_step": 6011, "epoch": 143} {"train_loss": -4.8319807052612305, "global_step": 6012, "epoch": 143} {"train_loss": -4.803003311157227, "global_step": 6013, "epoch": 143} {"train_loss": -4.804488658905029, "global_step": 6014, "epoch": 143} {"train_loss": -4.805919170379639, "global_step": 6015, "epoch": 143} {"train_loss": -4.609750270843506, "global_step": 6016, "epoch": 143} {"train_loss": -4.838626861572266, "global_step": 6017, "epoch": 143} {"train_loss": -4.820915699005127, "global_step": 6018, "epoch": 143} {"train_loss": -4.536561965942383, "global_step": 6019, "epoch": 143} {"train_loss": -4.971969127655029, "global_step": 6020, "epoch": 143} {"train_loss": -4.973968505859375, "global_step": 6021, "epoch": 143} {"train_loss": -4.676197052001953, "global_step": 6022, "epoch": 143} {"train_loss": -4.852975845336914, "global_step": 6023, "epoch": 143} {"train_loss": -4.688238143920898, "global_step": 6024, "epoch": 143} {"train_loss": -4.5215911865234375, "global_step": 6025, "epoch": 143} {"train_loss": -4.772233009338379, "global_step": 6026, "epoch": 143} {"train_loss": -4.584985733032227, "global_step": 6027, "epoch": 143} {"train_loss": -4.867392539978027, "global_step": 6028, "epoch": 143} {"train_loss": -4.662289619445801, "global_step": 6029, "epoch": 143} {"train_loss": -4.6662211418151855, "global_step": 6030, "epoch": 143} {"train_loss": -4.664278030395508, "global_step": 6031, "epoch": 143} {"train_loss": -4.389798641204834, "global_step": 6032, "epoch": 143} {"train_loss": -4.694418907165527, "global_step": 6033, "epoch": 143} {"train_loss": -4.511346817016602, "global_step": 6034, "epoch": 143} {"train_loss": -4.522209644317627, "global_step": 6035, "epoch": 143} {"train_loss": -4.5713791847229, "global_step": 6036, "epoch": 143} {"train_loss": -4.659365653991699, "global_step": 6037, "epoch": 143} {"train_loss": -4.662036895751953, "global_step": 6038, "epoch": 143} {"train_loss": -4.555538177490234, "global_step": 6039, "epoch": 143} {"train_loss": -4.755001544952393, "global_step": 6040, "epoch": 143} {"train_loss": -4.783289909362793, "global_step": 6041, "epoch": 143} {"train_loss": -4.829693794250488, "global_step": 6042, "epoch": 143} {"train_loss": -4.72379732131958, "global_step": 6043, "epoch": 143} {"train_loss": -4.732793807983398, "global_step": 6044, "epoch": 143} {"train_loss": -4.73972225189209, "global_step": 6045, "epoch": 143} {"train_loss": -4.60836124420166, "global_step": 6046, "epoch": 143} {"train_loss": -4.726109913417271, "global_step": 6047, "epoch": 143, "val_loss": 90301.046875} {"train_loss": -4.829371452331543, "global_step": 6048, "epoch": 144} {"train_loss": -4.908652305603027, "global_step": 6049, "epoch": 144} {"train_loss": -4.864013195037842, "global_step": 6050, "epoch": 144} {"train_loss": -4.782181739807129, "global_step": 6051, "epoch": 144} {"train_loss": -4.727359771728516, "global_step": 6052, "epoch": 144} {"train_loss": -4.81405782699585, "global_step": 6053, "epoch": 144} {"train_loss": -4.895200252532959, "global_step": 6054, "epoch": 144} {"train_loss": -4.885134220123291, "global_step": 6055, "epoch": 144} {"train_loss": -4.774177551269531, "global_step": 6056, "epoch": 144} {"train_loss": -4.78729248046875, "global_step": 6057, "epoch": 144} {"train_loss": -4.788857936859131, "global_step": 6058, "epoch": 144} {"train_loss": -4.953648567199707, "global_step": 6059, "epoch": 144} {"train_loss": -4.549914360046387, "global_step": 6060, "epoch": 144} {"train_loss": -4.730846405029297, "global_step": 6061, "epoch": 144} {"train_loss": -4.809385299682617, "global_step": 6062, "epoch": 144} {"train_loss": -4.731507778167725, "global_step": 6063, "epoch": 144} {"train_loss": -4.948511123657227, "global_step": 6064, "epoch": 144} {"train_loss": -4.803205490112305, "global_step": 6065, "epoch": 144} {"train_loss": -4.855164527893066, "global_step": 6066, "epoch": 144} {"train_loss": -4.679596900939941, "global_step": 6067, "epoch": 144} {"train_loss": -4.7601423263549805, "global_step": 6068, "epoch": 144} {"train_loss": -4.629735946655273, "global_step": 6069, "epoch": 144} {"train_loss": -4.752017974853516, "global_step": 6070, "epoch": 144} {"train_loss": -4.987314224243164, "global_step": 6071, "epoch": 144} {"train_loss": -4.697396755218506, "global_step": 6072, "epoch": 144} {"train_loss": -4.650460243225098, "global_step": 6073, "epoch": 144} {"train_loss": -4.713981628417969, "global_step": 6074, "epoch": 144} {"train_loss": -4.694882392883301, "global_step": 6075, "epoch": 144} {"train_loss": -4.887860298156738, "global_step": 6076, "epoch": 144} {"train_loss": -4.806414604187012, "global_step": 6077, "epoch": 144} {"train_loss": -4.739367485046387, "global_step": 6078, "epoch": 144} {"train_loss": -4.968984127044678, "global_step": 6079, "epoch": 144} {"train_loss": -4.835651397705078, "global_step": 6080, "epoch": 144} {"train_loss": -4.538875579833984, "global_step": 6081, "epoch": 144} {"train_loss": -4.653095245361328, "global_step": 6082, "epoch": 144} {"train_loss": -4.831727027893066, "global_step": 6083, "epoch": 144} {"train_loss": -4.700246810913086, "global_step": 6084, "epoch": 144} {"train_loss": -4.698050022125244, "global_step": 6085, "epoch": 144} {"train_loss": -4.735723495483398, "global_step": 6086, "epoch": 144} {"train_loss": -4.612613201141357, "global_step": 6087, "epoch": 144} {"train_loss": -4.8304338455200195, "global_step": 6088, "epoch": 144} {"train_loss": -4.777156852540516, "global_step": 6089, "epoch": 144, "val_loss": 90649.0859375} {"train_loss": -4.735118865966797, "global_step": 6090, "epoch": 145} {"train_loss": -4.816800117492676, "global_step": 6091, "epoch": 145} {"train_loss": -4.628741264343262, "global_step": 6092, "epoch": 145} {"train_loss": -4.741681098937988, "global_step": 6093, "epoch": 145} {"train_loss": -4.855593681335449, "global_step": 6094, "epoch": 145} {"train_loss": -4.720053672790527, "global_step": 6095, "epoch": 145} {"train_loss": -4.837650775909424, "global_step": 6096, "epoch": 145} {"train_loss": -4.828830718994141, "global_step": 6097, "epoch": 145} {"train_loss": -4.864772796630859, "global_step": 6098, "epoch": 145} {"train_loss": -4.774567604064941, "global_step": 6099, "epoch": 145} {"train_loss": -4.817911148071289, "global_step": 6100, "epoch": 145} {"train_loss": -4.925865173339844, "global_step": 6101, "epoch": 145} {"train_loss": -4.891122341156006, "global_step": 6102, "epoch": 145} {"train_loss": -4.859194755554199, "global_step": 6103, "epoch": 145} {"train_loss": -4.882735252380371, "global_step": 6104, "epoch": 145} {"train_loss": -4.887142658233643, "global_step": 6105, "epoch": 145} {"train_loss": -4.82414436340332, "global_step": 6106, "epoch": 145} {"train_loss": -4.807697772979736, "global_step": 6107, "epoch": 145} {"train_loss": -4.785541534423828, "global_step": 6108, "epoch": 145} {"train_loss": -4.788458347320557, "global_step": 6109, "epoch": 145} {"train_loss": -4.772693634033203, "global_step": 6110, "epoch": 145} {"train_loss": -4.999189376831055, "global_step": 6111, "epoch": 145} {"train_loss": -4.642824172973633, "global_step": 6112, "epoch": 145} {"train_loss": -4.6735615730285645, "global_step": 6113, "epoch": 145} {"train_loss": -4.843083381652832, "global_step": 6114, "epoch": 145} {"train_loss": -4.512026309967041, "global_step": 6115, "epoch": 145} {"train_loss": -4.786454200744629, "global_step": 6116, "epoch": 145} {"train_loss": -4.78005313873291, "global_step": 6117, "epoch": 145} {"train_loss": -4.707683563232422, "global_step": 6118, "epoch": 145} {"train_loss": -4.584766387939453, "global_step": 6119, "epoch": 145} {"train_loss": -4.517033576965332, "global_step": 6120, "epoch": 145} {"train_loss": -4.482338905334473, "global_step": 6121, "epoch": 145} {"train_loss": -4.494499206542969, "global_step": 6122, "epoch": 145} {"train_loss": -4.552372455596924, "global_step": 6123, "epoch": 145} {"train_loss": -4.395700454711914, "global_step": 6124, "epoch": 145} {"train_loss": -4.850693702697754, "global_step": 6125, "epoch": 145} {"train_loss": -4.655113220214844, "global_step": 6126, "epoch": 145} {"train_loss": -4.65479040145874, "global_step": 6127, "epoch": 145} {"train_loss": -4.650257110595703, "global_step": 6128, "epoch": 145} {"train_loss": -4.685702323913574, "global_step": 6129, "epoch": 145} {"train_loss": -4.6219482421875, "global_step": 6130, "epoch": 145} {"train_loss": -4.732404493150257, "global_step": 6131, "epoch": 145, "val_loss": 93816.8203125} {"train_loss": -4.741537570953369, "global_step": 6132, "epoch": 146} {"train_loss": -4.753243923187256, "global_step": 6133, "epoch": 146} {"train_loss": -4.782072067260742, "global_step": 6134, "epoch": 146} {"train_loss": -4.834804534912109, "global_step": 6135, "epoch": 146} {"train_loss": -4.697242259979248, "global_step": 6136, "epoch": 146} {"train_loss": -4.650453567504883, "global_step": 6137, "epoch": 146} {"train_loss": -4.795067310333252, "global_step": 6138, "epoch": 146} {"train_loss": -4.635180473327637, "global_step": 6139, "epoch": 146} {"train_loss": -4.941695690155029, "global_step": 6140, "epoch": 146} {"train_loss": -4.787688255310059, "global_step": 6141, "epoch": 146} {"train_loss": -4.674740791320801, "global_step": 6142, "epoch": 146} {"train_loss": -4.751559257507324, "global_step": 6143, "epoch": 146} {"train_loss": -4.892941474914551, "global_step": 6144, "epoch": 146} {"train_loss": -4.708510398864746, "global_step": 6145, "epoch": 146} {"train_loss": -4.925010681152344, "global_step": 6146, "epoch": 146} {"train_loss": -4.816128730773926, "global_step": 6147, "epoch": 146} {"train_loss": -4.854937553405762, "global_step": 6148, "epoch": 146} {"train_loss": -4.74461030960083, "global_step": 6149, "epoch": 146} {"train_loss": -4.769230365753174, "global_step": 6150, "epoch": 146} {"train_loss": -4.888742446899414, "global_step": 6151, "epoch": 146} {"train_loss": -4.78152322769165, "global_step": 6152, "epoch": 146} {"train_loss": -4.9638166427612305, "global_step": 6153, "epoch": 146} {"train_loss": -4.628585338592529, "global_step": 6154, "epoch": 146} {"train_loss": -4.800150394439697, "global_step": 6155, "epoch": 146} {"train_loss": -4.875007629394531, "global_step": 6156, "epoch": 146} {"train_loss": -4.7809858322143555, "global_step": 6157, "epoch": 146} {"train_loss": -4.86215877532959, "global_step": 6158, "epoch": 146} {"train_loss": -4.592471122741699, "global_step": 6159, "epoch": 146} {"train_loss": -4.725826740264893, "global_step": 6160, "epoch": 146} {"train_loss": -4.826889991760254, "global_step": 6161, "epoch": 146} {"train_loss": -4.653800010681152, "global_step": 6162, "epoch": 146} {"train_loss": -4.720454216003418, "global_step": 6163, "epoch": 146} {"train_loss": -4.730569839477539, "global_step": 6164, "epoch": 146} {"train_loss": -4.721548080444336, "global_step": 6165, "epoch": 146} {"train_loss": -4.686758041381836, "global_step": 6166, "epoch": 146} {"train_loss": -4.868635177612305, "global_step": 6167, "epoch": 146} {"train_loss": -4.902708053588867, "global_step": 6168, "epoch": 146} {"train_loss": -4.81610631942749, "global_step": 6169, "epoch": 146} {"train_loss": -4.873923301696777, "global_step": 6170, "epoch": 146} {"train_loss": -4.836252212524414, "global_step": 6171, "epoch": 146} {"train_loss": -5.023463249206543, "global_step": 6172, "epoch": 146} {"train_loss": -4.788805882136027, "global_step": 6173, "epoch": 146, "val_loss": 89538.9921875} {"train_loss": -4.825174331665039, "global_step": 6174, "epoch": 147} {"train_loss": -4.725308895111084, "global_step": 6175, "epoch": 147} {"train_loss": -4.622610569000244, "global_step": 6176, "epoch": 147} {"train_loss": -4.9704742431640625, "global_step": 6177, "epoch": 147} {"train_loss": -4.831125736236572, "global_step": 6178, "epoch": 147} {"train_loss": -4.732022285461426, "global_step": 6179, "epoch": 147} {"train_loss": -4.813776969909668, "global_step": 6180, "epoch": 147} {"train_loss": -4.73622465133667, "global_step": 6181, "epoch": 147} {"train_loss": -4.68346643447876, "global_step": 6182, "epoch": 147} {"train_loss": -4.824056625366211, "global_step": 6183, "epoch": 147} {"train_loss": -4.744184494018555, "global_step": 6184, "epoch": 147} {"train_loss": -4.719776153564453, "global_step": 6185, "epoch": 147} {"train_loss": -4.876160144805908, "global_step": 6186, "epoch": 147} {"train_loss": -4.682005405426025, "global_step": 6187, "epoch": 147} {"train_loss": -4.814404487609863, "global_step": 6188, "epoch": 147} {"train_loss": -4.785614490509033, "global_step": 6189, "epoch": 147} {"train_loss": -4.675014495849609, "global_step": 6190, "epoch": 147} {"train_loss": -4.7782721519470215, "global_step": 6191, "epoch": 147} {"train_loss": -4.832643508911133, "global_step": 6192, "epoch": 147} {"train_loss": -4.809329032897949, "global_step": 6193, "epoch": 147} {"train_loss": -4.798460006713867, "global_step": 6194, "epoch": 147} {"train_loss": -4.854337692260742, "global_step": 6195, "epoch": 147} {"train_loss": -4.848153591156006, "global_step": 6196, "epoch": 147} {"train_loss": -4.935178756713867, "global_step": 6197, "epoch": 147} {"train_loss": -4.868683815002441, "global_step": 6198, "epoch": 147} {"train_loss": -4.8736114501953125, "global_step": 6199, "epoch": 147} {"train_loss": -4.8902997970581055, "global_step": 6200, "epoch": 147} {"train_loss": -4.838608741760254, "global_step": 6201, "epoch": 147} {"train_loss": -4.924942970275879, "global_step": 6202, "epoch": 147} {"train_loss": -4.897961616516113, "global_step": 6203, "epoch": 147} {"train_loss": -4.860052108764648, "global_step": 6204, "epoch": 147} {"train_loss": -4.774789810180664, "global_step": 6205, "epoch": 147} {"train_loss": -4.842816352844238, "global_step": 6206, "epoch": 147} {"train_loss": -5.0210418701171875, "global_step": 6207, "epoch": 147} {"train_loss": -4.818374156951904, "global_step": 6208, "epoch": 147} {"train_loss": -4.680498123168945, "global_step": 6209, "epoch": 147} {"train_loss": -4.9409403800964355, "global_step": 6210, "epoch": 147} {"train_loss": -4.77632999420166, "global_step": 6211, "epoch": 147} {"train_loss": -4.5843424797058105, "global_step": 6212, "epoch": 147} {"train_loss": -5.010506629943848, "global_step": 6213, "epoch": 147} {"train_loss": -4.961438179016113, "global_step": 6214, "epoch": 147} {"train_loss": -4.8169792493184405, "global_step": 6215, "epoch": 147, "val_loss": 89691.171875} {"train_loss": -4.993927478790283, "global_step": 6216, "epoch": 148} {"train_loss": -4.850749969482422, "global_step": 6217, "epoch": 148} {"train_loss": -4.880067825317383, "global_step": 6218, "epoch": 148} {"train_loss": -4.813899040222168, "global_step": 6219, "epoch": 148} {"train_loss": -5.033499717712402, "global_step": 6220, "epoch": 148} {"train_loss": -4.974902153015137, "global_step": 6221, "epoch": 148} {"train_loss": -4.994487762451172, "global_step": 6222, "epoch": 148} {"train_loss": -4.8011884689331055, "global_step": 6223, "epoch": 148} {"train_loss": -4.776398658752441, "global_step": 6224, "epoch": 148} {"train_loss": -4.849651336669922, "global_step": 6225, "epoch": 148} {"train_loss": -4.8680524826049805, "global_step": 6226, "epoch": 148} {"train_loss": -4.807912349700928, "global_step": 6227, "epoch": 148} {"train_loss": -4.867242813110352, "global_step": 6228, "epoch": 148} {"train_loss": -4.813287734985352, "global_step": 6229, "epoch": 148} {"train_loss": -4.898617744445801, "global_step": 6230, "epoch": 148} {"train_loss": -4.815950393676758, "global_step": 6231, "epoch": 148} {"train_loss": -4.95413064956665, "global_step": 6232, "epoch": 148} {"train_loss": -4.9298529624938965, "global_step": 6233, "epoch": 148} {"train_loss": -4.71768856048584, "global_step": 6234, "epoch": 148} {"train_loss": -4.904794216156006, "global_step": 6235, "epoch": 148} {"train_loss": -5.017258644104004, "global_step": 6236, "epoch": 148} {"train_loss": -4.817538261413574, "global_step": 6237, "epoch": 148} {"train_loss": -4.83331298828125, "global_step": 6238, "epoch": 148} {"train_loss": -4.871954917907715, "global_step": 6239, "epoch": 148} {"train_loss": -4.872764587402344, "global_step": 6240, "epoch": 148} {"train_loss": -4.888906478881836, "global_step": 6241, "epoch": 148} {"train_loss": -4.746965408325195, "global_step": 6242, "epoch": 148} {"train_loss": -4.797637939453125, "global_step": 6243, "epoch": 148} {"train_loss": -4.981050491333008, "global_step": 6244, "epoch": 148} {"train_loss": -4.861764907836914, "global_step": 6245, "epoch": 148} {"train_loss": -4.670273780822754, "global_step": 6246, "epoch": 148} {"train_loss": -4.817169666290283, "global_step": 6247, "epoch": 148} {"train_loss": -4.773500919342041, "global_step": 6248, "epoch": 148} {"train_loss": -4.506616592407227, "global_step": 6249, "epoch": 148} {"train_loss": -4.634549617767334, "global_step": 6250, "epoch": 148} {"train_loss": -4.67549467086792, "global_step": 6251, "epoch": 148} {"train_loss": -4.527357578277588, "global_step": 6252, "epoch": 148} {"train_loss": -4.812209129333496, "global_step": 6253, "epoch": 148} {"train_loss": -4.871644020080566, "global_step": 6254, "epoch": 148} {"train_loss": -4.552692890167236, "global_step": 6255, "epoch": 148} {"train_loss": -4.887599945068359, "global_step": 6256, "epoch": 148} {"train_loss": -4.8224442799886065, "global_step": 6257, "epoch": 148, "val_loss": 92130.265625} {"train_loss": -4.647615432739258, "global_step": 6258, "epoch": 149} {"train_loss": -4.833884239196777, "global_step": 6259, "epoch": 149} {"train_loss": -4.587707996368408, "global_step": 6260, "epoch": 149} {"train_loss": -4.894229412078857, "global_step": 6261, "epoch": 149} {"train_loss": -4.708539009094238, "global_step": 6262, "epoch": 149} {"train_loss": -4.645491123199463, "global_step": 6263, "epoch": 149} {"train_loss": -5.0647430419921875, "global_step": 6264, "epoch": 149} {"train_loss": -4.607690811157227, "global_step": 6265, "epoch": 149} {"train_loss": -4.737362861633301, "global_step": 6266, "epoch": 149} {"train_loss": -4.794330596923828, "global_step": 6267, "epoch": 149} {"train_loss": -4.722606658935547, "global_step": 6268, "epoch": 149} {"train_loss": -4.871685981750488, "global_step": 6269, "epoch": 149} {"train_loss": -4.615025520324707, "global_step": 6270, "epoch": 149} {"train_loss": -4.896798133850098, "global_step": 6271, "epoch": 149} {"train_loss": -4.735498428344727, "global_step": 6272, "epoch": 149} {"train_loss": -4.732253074645996, "global_step": 6273, "epoch": 149} {"train_loss": -4.892126560211182, "global_step": 6274, "epoch": 149} {"train_loss": -4.852015495300293, "global_step": 6275, "epoch": 149} {"train_loss": -4.778796195983887, "global_step": 6276, "epoch": 149} {"train_loss": -4.816806793212891, "global_step": 6277, "epoch": 149} {"train_loss": -4.7754597663879395, "global_step": 6278, "epoch": 149} {"train_loss": -4.719374656677246, "global_step": 6279, "epoch": 149} {"train_loss": -4.931934356689453, "global_step": 6280, "epoch": 149} {"train_loss": -4.822349548339844, "global_step": 6281, "epoch": 149} {"train_loss": -4.742189407348633, "global_step": 6282, "epoch": 149} {"train_loss": -4.8810200691223145, "global_step": 6283, "epoch": 149} {"train_loss": -4.7850022315979, "global_step": 6284, "epoch": 149} {"train_loss": -4.914327621459961, "global_step": 6285, "epoch": 149} {"train_loss": -4.953849792480469, "global_step": 6286, "epoch": 149} {"train_loss": -4.839339256286621, "global_step": 6287, "epoch": 149} {"train_loss": -4.848903179168701, "global_step": 6288, "epoch": 149} {"train_loss": -4.686996936798096, "global_step": 6289, "epoch": 149} {"train_loss": -4.833487510681152, "global_step": 6290, "epoch": 149} {"train_loss": -4.808347225189209, "global_step": 6291, "epoch": 149} {"train_loss": -4.818901538848877, "global_step": 6292, "epoch": 149} {"train_loss": -4.873335838317871, "global_step": 6293, "epoch": 149} {"train_loss": -4.802334308624268, "global_step": 6294, "epoch": 149} {"train_loss": -4.758479595184326, "global_step": 6295, "epoch": 149} {"train_loss": -4.817378044128418, "global_step": 6296, "epoch": 149} {"train_loss": -4.920867919921875, "global_step": 6297, "epoch": 149} {"train_loss": -4.867026329040527, "global_step": 6298, "epoch": 149} {"train_loss": -4.803786379950387, "global_step": 6299, "epoch": 149, "val_loss": 88230.3046875} {"train_loss": -4.781386375427246, "global_step": 6300, "epoch": 150} {"train_loss": -4.929932594299316, "global_step": 6301, "epoch": 150} {"train_loss": -4.857386589050293, "global_step": 6302, "epoch": 150} {"train_loss": -4.708952903747559, "global_step": 6303, "epoch": 150} {"train_loss": -4.859646320343018, "global_step": 6304, "epoch": 150} {"train_loss": -4.78653621673584, "global_step": 6305, "epoch": 150} {"train_loss": -4.85893440246582, "global_step": 6306, "epoch": 150} {"train_loss": -4.851309776306152, "global_step": 6307, "epoch": 150} {"train_loss": -4.73230504989624, "global_step": 6308, "epoch": 150} {"train_loss": -4.908166408538818, "global_step": 6309, "epoch": 150} {"train_loss": -4.9430108070373535, "global_step": 6310, "epoch": 150} {"train_loss": -4.706927299499512, "global_step": 6311, "epoch": 150} {"train_loss": -4.93540096282959, "global_step": 6312, "epoch": 150} {"train_loss": -4.736959457397461, "global_step": 6313, "epoch": 150} {"train_loss": -4.69162654876709, "global_step": 6314, "epoch": 150} {"train_loss": -4.735939025878906, "global_step": 6315, "epoch": 150} {"train_loss": -4.913637638092041, "global_step": 6316, "epoch": 150} {"train_loss": -4.82138729095459, "global_step": 6317, "epoch": 150} {"train_loss": -4.762599945068359, "global_step": 6318, "epoch": 150} {"train_loss": -4.757164478302002, "global_step": 6319, "epoch": 150} {"train_loss": -4.789752006530762, "global_step": 6320, "epoch": 150} {"train_loss": -4.956287384033203, "global_step": 6321, "epoch": 150} {"train_loss": -4.955375671386719, "global_step": 6322, "epoch": 150} {"train_loss": -4.926424980163574, "global_step": 6323, "epoch": 150} {"train_loss": -4.955347061157227, "global_step": 6324, "epoch": 150} {"train_loss": -4.930300235748291, "global_step": 6325, "epoch": 150} {"train_loss": -4.972503662109375, "global_step": 6326, "epoch": 150} {"train_loss": -4.955326080322266, "global_step": 6327, "epoch": 150} {"train_loss": -4.848938941955566, "global_step": 6328, "epoch": 150} {"train_loss": -4.98146915435791, "global_step": 6329, "epoch": 150} {"train_loss": -4.918313980102539, "global_step": 6330, "epoch": 150} {"train_loss": -4.838235855102539, "global_step": 6331, "epoch": 150} {"train_loss": -4.9132208824157715, "global_step": 6332, "epoch": 150} {"train_loss": -4.82423734664917, "global_step": 6333, "epoch": 150} {"train_loss": -4.905198097229004, "global_step": 6334, "epoch": 150} {"train_loss": -4.993594169616699, "global_step": 6335, "epoch": 150} {"train_loss": -4.897190570831299, "global_step": 6336, "epoch": 150} {"train_loss": -4.834882736206055, "global_step": 6337, "epoch": 150} {"train_loss": -4.794278144836426, "global_step": 6338, "epoch": 150} {"train_loss": -4.967710971832275, "global_step": 6339, "epoch": 150} {"train_loss": -4.800660133361816, "global_step": 6340, "epoch": 150} {"train_loss": -4.860818908328102, "global_step": 6341, "epoch": 150, "train/sim_max_reward_0": 0.3671908069697362, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.3485024048141259, "train/sim_max_reward_3": 0.006525932240260836, "train/sim_max_reward_4": 0.267993870329265, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.13305310964220818, "test/sim_max_reward_4400001": 0.18331940348669437, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.05274729456438236, "test/sim_max_reward_4400006": 0.04864349725334085, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.4083163869877454, "test/sim_max_reward_4400009": 0.17415672193822604, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.3367386639496294, "test/sim_max_reward_4400012": 0.1486090414827902, "test/sim_max_reward_4400013": 0.38079652908652895, "test/sim_max_reward_4400014": 0.0041750489188490895, "test/sim_max_reward_4400015": 0.5612205152843593, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19436787880140133, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6147545784935139, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1960265980208025, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.537449853447807, "test/sim_max_reward_4400028": 0.37847119373291527, "test/sim_max_reward_4400029": 0.453853332771961, "test/sim_max_reward_4400030": 0.20600631588438253, "test/sim_max_reward_4400031": 1.2890978942579066e-05, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.19860602453174422, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.4682795305783269, "test/sim_max_reward_4400036": 0.365478645732947, "test/sim_max_reward_4400037": 0.12650765847746417, "test/sim_max_reward_4400038": 0.0003490032421345069, "test/sim_max_reward_4400039": 0.5072264915416881, "test/sim_max_reward_4400040": 0.13589361746416365, "test/sim_max_reward_4400041": 0.5279194482859523, "test/sim_max_reward_4400042": 0.05432206838871515, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.3308414022995964, "test/sim_max_reward_4400045": 0.3587438067050823, "test/sim_max_reward_4400046": 0.19618918291910015, "test/sim_max_reward_4400047": 0.17309801922344675, "test/sim_max_reward_4400048": 0.10507304801330923, "test/sim_max_reward_4400049": 0.004948320745260615, "train/mean_score": 0.19731220915622913, "test/mean_score": 0.18272776625539028, "val_loss": 88043.7890625} {"train_loss": -4.869231700897217, "global_step": 6342, "epoch": 151} {"train_loss": -4.942869186401367, "global_step": 6343, "epoch": 151} {"train_loss": -4.947685241699219, "global_step": 6344, "epoch": 151} {"train_loss": -4.81361722946167, "global_step": 6345, "epoch": 151} {"train_loss": -4.762166976928711, "global_step": 6346, "epoch": 151} {"train_loss": -4.881749629974365, "global_step": 6347, "epoch": 151} {"train_loss": -4.810788154602051, "global_step": 6348, "epoch": 151} {"train_loss": -4.868044376373291, "global_step": 6349, "epoch": 151} {"train_loss": -4.948436737060547, "global_step": 6350, "epoch": 151} {"train_loss": -4.952827453613281, "global_step": 6351, "epoch": 151} {"train_loss": -4.88055419921875, "global_step": 6352, "epoch": 151} {"train_loss": -4.9469990730285645, "global_step": 6353, "epoch": 151} {"train_loss": -4.836865425109863, "global_step": 6354, "epoch": 151} {"train_loss": -4.934356689453125, "global_step": 6355, "epoch": 151} {"train_loss": -4.939971923828125, "global_step": 6356, "epoch": 151} {"train_loss": -4.825588226318359, "global_step": 6357, "epoch": 151} {"train_loss": -5.00465202331543, "global_step": 6358, "epoch": 151} {"train_loss": -5.009818077087402, "global_step": 6359, "epoch": 151} {"train_loss": -4.714338779449463, "global_step": 6360, "epoch": 151} {"train_loss": -5.004876136779785, "global_step": 6361, "epoch": 151} {"train_loss": -4.974633693695068, "global_step": 6362, "epoch": 151} {"train_loss": -4.915362358093262, "global_step": 6363, "epoch": 151} {"train_loss": -4.954129219055176, "global_step": 6364, "epoch": 151} {"train_loss": -4.846362590789795, "global_step": 6365, "epoch": 151} {"train_loss": -4.871816158294678, "global_step": 6366, "epoch": 151} {"train_loss": -4.870193004608154, "global_step": 6367, "epoch": 151} {"train_loss": -4.842318534851074, "global_step": 6368, "epoch": 151} {"train_loss": -4.920248985290527, "global_step": 6369, "epoch": 151} {"train_loss": -4.9052228927612305, "global_step": 6370, "epoch": 151} {"train_loss": -4.949843883514404, "global_step": 6371, "epoch": 151} {"train_loss": -4.750046253204346, "global_step": 6372, "epoch": 151} {"train_loss": -4.636842727661133, "global_step": 6373, "epoch": 151} {"train_loss": -4.69321346282959, "global_step": 6374, "epoch": 151} {"train_loss": -4.817109107971191, "global_step": 6375, "epoch": 151} {"train_loss": -4.742237091064453, "global_step": 6376, "epoch": 151} {"train_loss": -4.568055152893066, "global_step": 6377, "epoch": 151} {"train_loss": -4.814098834991455, "global_step": 6378, "epoch": 151} {"train_loss": -4.839860916137695, "global_step": 6379, "epoch": 151} {"train_loss": -4.722444534301758, "global_step": 6380, "epoch": 151} {"train_loss": -4.871713638305664, "global_step": 6381, "epoch": 151} {"train_loss": -4.828889846801758, "global_step": 6382, "epoch": 151} {"train_loss": -4.8590416340600875, "global_step": 6383, "epoch": 151, "val_loss": 87832.8671875} {"train_loss": -4.942868232727051, "global_step": 6384, "epoch": 152} {"train_loss": -4.848898887634277, "global_step": 6385, "epoch": 152} {"train_loss": -4.8244099617004395, "global_step": 6386, "epoch": 152} {"train_loss": -4.735273361206055, "global_step": 6387, "epoch": 152} {"train_loss": -4.809629440307617, "global_step": 6388, "epoch": 152} {"train_loss": -4.936824321746826, "global_step": 6389, "epoch": 152} {"train_loss": -4.872372627258301, "global_step": 6390, "epoch": 152} {"train_loss": -4.816915512084961, "global_step": 6391, "epoch": 152} {"train_loss": -5.098084926605225, "global_step": 6392, "epoch": 152} {"train_loss": -4.828217506408691, "global_step": 6393, "epoch": 152} {"train_loss": -4.990386962890625, "global_step": 6394, "epoch": 152} {"train_loss": -4.788454532623291, "global_step": 6395, "epoch": 152} {"train_loss": -4.810329437255859, "global_step": 6396, "epoch": 152} {"train_loss": -4.913729190826416, "global_step": 6397, "epoch": 152} {"train_loss": -5.038194179534912, "global_step": 6398, "epoch": 152} {"train_loss": -4.721668243408203, "global_step": 6399, "epoch": 152} {"train_loss": -4.820371627807617, "global_step": 6400, "epoch": 152} {"train_loss": -4.79132080078125, "global_step": 6401, "epoch": 152} {"train_loss": -4.960453033447266, "global_step": 6402, "epoch": 152} {"train_loss": -4.826695919036865, "global_step": 6403, "epoch": 152} {"train_loss": -4.885774612426758, "global_step": 6404, "epoch": 152} {"train_loss": -4.868461608886719, "global_step": 6405, "epoch": 152} {"train_loss": -4.888755798339844, "global_step": 6406, "epoch": 152} {"train_loss": -4.865243911743164, "global_step": 6407, "epoch": 152} {"train_loss": -4.690846920013428, "global_step": 6408, "epoch": 152} {"train_loss": -4.5835466384887695, "global_step": 6409, "epoch": 152} {"train_loss": -4.794100761413574, "global_step": 6410, "epoch": 152} {"train_loss": -4.671095848083496, "global_step": 6411, "epoch": 152} {"train_loss": -4.732275009155273, "global_step": 6412, "epoch": 152} {"train_loss": -4.781815052032471, "global_step": 6413, "epoch": 152} {"train_loss": -4.5474982261657715, "global_step": 6414, "epoch": 152} {"train_loss": -4.866040229797363, "global_step": 6415, "epoch": 152} {"train_loss": -4.58134651184082, "global_step": 6416, "epoch": 152} {"train_loss": -4.708856582641602, "global_step": 6417, "epoch": 152} {"train_loss": -4.659436225891113, "global_step": 6418, "epoch": 152} {"train_loss": -4.767906665802002, "global_step": 6419, "epoch": 152} {"train_loss": -4.89259147644043, "global_step": 6420, "epoch": 152} {"train_loss": -4.783571243286133, "global_step": 6421, "epoch": 152} {"train_loss": -4.770823001861572, "global_step": 6422, "epoch": 152} {"train_loss": -4.844517707824707, "global_step": 6423, "epoch": 152} {"train_loss": -4.6940741539001465, "global_step": 6424, "epoch": 152} {"train_loss": -4.812881957916987, "global_step": 6425, "epoch": 152, "val_loss": 89168.28125} {"train_loss": -4.791214942932129, "global_step": 6426, "epoch": 153} {"train_loss": -4.844372749328613, "global_step": 6427, "epoch": 153} {"train_loss": -4.789130210876465, "global_step": 6428, "epoch": 153} {"train_loss": -4.886425971984863, "global_step": 6429, "epoch": 153} {"train_loss": -4.778095722198486, "global_step": 6430, "epoch": 153} {"train_loss": -4.7469072341918945, "global_step": 6431, "epoch": 153} {"train_loss": -4.838857650756836, "global_step": 6432, "epoch": 153} {"train_loss": -4.757969379425049, "global_step": 6433, "epoch": 153} {"train_loss": -4.6457977294921875, "global_step": 6434, "epoch": 153} {"train_loss": -4.740283966064453, "global_step": 6435, "epoch": 153} {"train_loss": -4.930514335632324, "global_step": 6436, "epoch": 153} {"train_loss": -4.961298942565918, "global_step": 6437, "epoch": 153} {"train_loss": -4.826988220214844, "global_step": 6438, "epoch": 153} {"train_loss": -4.997673511505127, "global_step": 6439, "epoch": 153} {"train_loss": -4.945757865905762, "global_step": 6440, "epoch": 153} {"train_loss": -5.063509464263916, "global_step": 6441, "epoch": 153} {"train_loss": -4.906425476074219, "global_step": 6442, "epoch": 153} {"train_loss": -4.943163871765137, "global_step": 6443, "epoch": 153} {"train_loss": -4.876117706298828, "global_step": 6444, "epoch": 153} {"train_loss": -4.704216957092285, "global_step": 6445, "epoch": 153} {"train_loss": -4.679507255554199, "global_step": 6446, "epoch": 153} {"train_loss": -4.765110015869141, "global_step": 6447, "epoch": 153} {"train_loss": -4.910484790802002, "global_step": 6448, "epoch": 153} {"train_loss": -4.856345176696777, "global_step": 6449, "epoch": 153} {"train_loss": -4.82822322845459, "global_step": 6450, "epoch": 153} {"train_loss": -4.829564094543457, "global_step": 6451, "epoch": 153} {"train_loss": -4.821693420410156, "global_step": 6452, "epoch": 153} {"train_loss": -4.877593994140625, "global_step": 6453, "epoch": 153} {"train_loss": -5.020786285400391, "global_step": 6454, "epoch": 153} {"train_loss": -4.969810962677002, "global_step": 6455, "epoch": 153} {"train_loss": -4.748715400695801, "global_step": 6456, "epoch": 153} {"train_loss": -4.9534454345703125, "global_step": 6457, "epoch": 153} {"train_loss": -4.874366760253906, "global_step": 6458, "epoch": 153} {"train_loss": -4.702714920043945, "global_step": 6459, "epoch": 153} {"train_loss": -4.849184989929199, "global_step": 6460, "epoch": 153} {"train_loss": -4.826862335205078, "global_step": 6461, "epoch": 153} {"train_loss": -4.79758882522583, "global_step": 6462, "epoch": 153} {"train_loss": -4.724882125854492, "global_step": 6463, "epoch": 153} {"train_loss": -4.714064598083496, "global_step": 6464, "epoch": 153} {"train_loss": -4.818437576293945, "global_step": 6465, "epoch": 153} {"train_loss": -4.800021171569824, "global_step": 6466, "epoch": 153} {"train_loss": -4.825849703380039, "global_step": 6467, "epoch": 153, "val_loss": 88008.3515625} {"train_loss": -4.815458297729492, "global_step": 6468, "epoch": 154} {"train_loss": -4.6114821434021, "global_step": 6469, "epoch": 154} {"train_loss": -4.461158752441406, "global_step": 6470, "epoch": 154} {"train_loss": -4.921387672424316, "global_step": 6471, "epoch": 154} {"train_loss": -4.600956916809082, "global_step": 6472, "epoch": 154} {"train_loss": -4.919342041015625, "global_step": 6473, "epoch": 154} {"train_loss": -4.680856227874756, "global_step": 6474, "epoch": 154} {"train_loss": -4.605968475341797, "global_step": 6475, "epoch": 154} {"train_loss": -4.884450435638428, "global_step": 6476, "epoch": 154} {"train_loss": -4.8800201416015625, "global_step": 6477, "epoch": 154} {"train_loss": -4.73591947555542, "global_step": 6478, "epoch": 154} {"train_loss": -4.854757308959961, "global_step": 6479, "epoch": 154} {"train_loss": -4.931987762451172, "global_step": 6480, "epoch": 154} {"train_loss": -4.728264331817627, "global_step": 6481, "epoch": 154} {"train_loss": -5.013045310974121, "global_step": 6482, "epoch": 154} {"train_loss": -4.887411594390869, "global_step": 6483, "epoch": 154} {"train_loss": -4.718620300292969, "global_step": 6484, "epoch": 154} {"train_loss": -4.7769269943237305, "global_step": 6485, "epoch": 154} {"train_loss": -4.948109149932861, "global_step": 6486, "epoch": 154} {"train_loss": -4.951519966125488, "global_step": 6487, "epoch": 154} {"train_loss": -4.809717178344727, "global_step": 6488, "epoch": 154} {"train_loss": -4.917006015777588, "global_step": 6489, "epoch": 154} {"train_loss": -4.920248985290527, "global_step": 6490, "epoch": 154} {"train_loss": -4.858210563659668, "global_step": 6491, "epoch": 154} {"train_loss": -4.786484718322754, "global_step": 6492, "epoch": 154} {"train_loss": -4.936798095703125, "global_step": 6493, "epoch": 154} {"train_loss": -4.718684196472168, "global_step": 6494, "epoch": 154} {"train_loss": -4.798588752746582, "global_step": 6495, "epoch": 154} {"train_loss": -4.879748344421387, "global_step": 6496, "epoch": 154} {"train_loss": -4.853575706481934, "global_step": 6497, "epoch": 154} {"train_loss": -4.706850528717041, "global_step": 6498, "epoch": 154} {"train_loss": -4.711081504821777, "global_step": 6499, "epoch": 154} {"train_loss": -4.886162757873535, "global_step": 6500, "epoch": 154} {"train_loss": -4.678261756896973, "global_step": 6501, "epoch": 154} {"train_loss": -4.943428993225098, "global_step": 6502, "epoch": 154} {"train_loss": -4.970922470092773, "global_step": 6503, "epoch": 154} {"train_loss": -4.980432033538818, "global_step": 6504, "epoch": 154} {"train_loss": -4.727890968322754, "global_step": 6505, "epoch": 154} {"train_loss": -4.658587455749512, "global_step": 6506, "epoch": 154} {"train_loss": -4.893515586853027, "global_step": 6507, "epoch": 154} {"train_loss": -4.93305778503418, "global_step": 6508, "epoch": 154} {"train_loss": -4.8177552336738225, "global_step": 6509, "epoch": 154, "val_loss": 86733.875} {"train_loss": -4.8181586265563965, "global_step": 6510, "epoch": 155} {"train_loss": -4.880870819091797, "global_step": 6511, "epoch": 155} {"train_loss": -4.973344802856445, "global_step": 6512, "epoch": 155} {"train_loss": -4.925141334533691, "global_step": 6513, "epoch": 155} {"train_loss": -5.042421340942383, "global_step": 6514, "epoch": 155} {"train_loss": -4.763882637023926, "global_step": 6515, "epoch": 155} {"train_loss": -4.896771430969238, "global_step": 6516, "epoch": 155} {"train_loss": -4.842123031616211, "global_step": 6517, "epoch": 155} {"train_loss": -4.837769508361816, "global_step": 6518, "epoch": 155} {"train_loss": -4.785530090332031, "global_step": 6519, "epoch": 155} {"train_loss": -4.876730918884277, "global_step": 6520, "epoch": 155} {"train_loss": -4.947953701019287, "global_step": 6521, "epoch": 155} {"train_loss": -4.824726581573486, "global_step": 6522, "epoch": 155} {"train_loss": -4.73038911819458, "global_step": 6523, "epoch": 155} {"train_loss": -4.891351699829102, "global_step": 6524, "epoch": 155} {"train_loss": -4.682623863220215, "global_step": 6525, "epoch": 155} {"train_loss": -5.051999568939209, "global_step": 6526, "epoch": 155} {"train_loss": -4.501693248748779, "global_step": 6527, "epoch": 155} {"train_loss": -4.849353790283203, "global_step": 6528, "epoch": 155} {"train_loss": -4.855381965637207, "global_step": 6529, "epoch": 155} {"train_loss": -4.663080215454102, "global_step": 6530, "epoch": 155} {"train_loss": -4.852954864501953, "global_step": 6531, "epoch": 155} {"train_loss": -4.732099533081055, "global_step": 6532, "epoch": 155} {"train_loss": -4.849306583404541, "global_step": 6533, "epoch": 155} {"train_loss": -4.8434038162231445, "global_step": 6534, "epoch": 155} {"train_loss": -4.8326520919799805, "global_step": 6535, "epoch": 155} {"train_loss": -4.862637042999268, "global_step": 6536, "epoch": 155} {"train_loss": -4.910770416259766, "global_step": 6537, "epoch": 155} {"train_loss": -4.767338275909424, "global_step": 6538, "epoch": 155} {"train_loss": -4.819114685058594, "global_step": 6539, "epoch": 155} {"train_loss": -4.759918212890625, "global_step": 6540, "epoch": 155} {"train_loss": -4.82271146774292, "global_step": 6541, "epoch": 155} {"train_loss": -4.867954254150391, "global_step": 6542, "epoch": 155} {"train_loss": -4.829174995422363, "global_step": 6543, "epoch": 155} {"train_loss": -5.017533302307129, "global_step": 6544, "epoch": 155} {"train_loss": -4.807839393615723, "global_step": 6545, "epoch": 155} {"train_loss": -4.924752235412598, "global_step": 6546, "epoch": 155} {"train_loss": -4.947652816772461, "global_step": 6547, "epoch": 155} {"train_loss": -4.7215657234191895, "global_step": 6548, "epoch": 155} {"train_loss": -4.954411029815674, "global_step": 6549, "epoch": 155} {"train_loss": -4.899143218994141, "global_step": 6550, "epoch": 155} {"train_loss": -4.844811110269456, "global_step": 6551, "epoch": 155, "val_loss": 86768.375} {"train_loss": -4.764449596405029, "global_step": 6552, "epoch": 156} {"train_loss": -4.844613552093506, "global_step": 6553, "epoch": 156} {"train_loss": -4.950911998748779, "global_step": 6554, "epoch": 156} {"train_loss": -4.887115478515625, "global_step": 6555, "epoch": 156} {"train_loss": -4.919236660003662, "global_step": 6556, "epoch": 156} {"train_loss": -4.80530309677124, "global_step": 6557, "epoch": 156} {"train_loss": -4.985735893249512, "global_step": 6558, "epoch": 156} {"train_loss": -4.87825870513916, "global_step": 6559, "epoch": 156} {"train_loss": -4.908545017242432, "global_step": 6560, "epoch": 156} {"train_loss": -4.876091003417969, "global_step": 6561, "epoch": 156} {"train_loss": -4.941269874572754, "global_step": 6562, "epoch": 156} {"train_loss": -4.912972927093506, "global_step": 6563, "epoch": 156} {"train_loss": -4.779433250427246, "global_step": 6564, "epoch": 156} {"train_loss": -4.8639631271362305, "global_step": 6565, "epoch": 156} {"train_loss": -4.846255302429199, "global_step": 6566, "epoch": 156} {"train_loss": -4.854977607727051, "global_step": 6567, "epoch": 156} {"train_loss": -4.911827564239502, "global_step": 6568, "epoch": 156} {"train_loss": -4.932400703430176, "global_step": 6569, "epoch": 156} {"train_loss": -4.989858627319336, "global_step": 6570, "epoch": 156} {"train_loss": -4.800593852996826, "global_step": 6571, "epoch": 156} {"train_loss": -4.794343948364258, "global_step": 6572, "epoch": 156} {"train_loss": -4.913713455200195, "global_step": 6573, "epoch": 156} {"train_loss": -4.987462043762207, "global_step": 6574, "epoch": 156} {"train_loss": -4.859365463256836, "global_step": 6575, "epoch": 156} {"train_loss": -4.968657970428467, "global_step": 6576, "epoch": 156} {"train_loss": -5.011363506317139, "global_step": 6577, "epoch": 156} {"train_loss": -4.8275275230407715, "global_step": 6578, "epoch": 156} {"train_loss": -4.794507026672363, "global_step": 6579, "epoch": 156} {"train_loss": -4.971624374389648, "global_step": 6580, "epoch": 156} {"train_loss": -4.864951133728027, "global_step": 6581, "epoch": 156} {"train_loss": -4.845827579498291, "global_step": 6582, "epoch": 156} {"train_loss": -4.74395751953125, "global_step": 6583, "epoch": 156} {"train_loss": -4.871389389038086, "global_step": 6584, "epoch": 156} {"train_loss": -4.835146903991699, "global_step": 6585, "epoch": 156} {"train_loss": -4.88138484954834, "global_step": 6586, "epoch": 156} {"train_loss": -4.8242692947387695, "global_step": 6587, "epoch": 156} {"train_loss": -4.770901203155518, "global_step": 6588, "epoch": 156} {"train_loss": -4.832314491271973, "global_step": 6589, "epoch": 156} {"train_loss": -4.741950511932373, "global_step": 6590, "epoch": 156} {"train_loss": -4.664532661437988, "global_step": 6591, "epoch": 156} {"train_loss": -4.985317230224609, "global_step": 6592, "epoch": 156} {"train_loss": -4.867367835271926, "global_step": 6593, "epoch": 156, "val_loss": 87315.546875} {"train_loss": -4.8034563064575195, "global_step": 6594, "epoch": 157} {"train_loss": -4.836733818054199, "global_step": 6595, "epoch": 157} {"train_loss": -4.868985176086426, "global_step": 6596, "epoch": 157} {"train_loss": -4.796796798706055, "global_step": 6597, "epoch": 157} {"train_loss": -4.909026622772217, "global_step": 6598, "epoch": 157} {"train_loss": -4.881120204925537, "global_step": 6599, "epoch": 157} {"train_loss": -4.845184803009033, "global_step": 6600, "epoch": 157} {"train_loss": -4.611492156982422, "global_step": 6601, "epoch": 157} {"train_loss": -4.948544502258301, "global_step": 6602, "epoch": 157} {"train_loss": -4.890002250671387, "global_step": 6603, "epoch": 157} {"train_loss": -4.905084609985352, "global_step": 6604, "epoch": 157} {"train_loss": -4.793972969055176, "global_step": 6605, "epoch": 157} {"train_loss": -4.755496025085449, "global_step": 6606, "epoch": 157} {"train_loss": -5.023691177368164, "global_step": 6607, "epoch": 157} {"train_loss": -4.95745325088501, "global_step": 6608, "epoch": 157} {"train_loss": -4.751659393310547, "global_step": 6609, "epoch": 157} {"train_loss": -4.735695838928223, "global_step": 6610, "epoch": 157} {"train_loss": -4.917982578277588, "global_step": 6611, "epoch": 157} {"train_loss": -4.980160713195801, "global_step": 6612, "epoch": 157} {"train_loss": -4.741127967834473, "global_step": 6613, "epoch": 157} {"train_loss": -4.950221061706543, "global_step": 6614, "epoch": 157} {"train_loss": -4.818294048309326, "global_step": 6615, "epoch": 157} {"train_loss": -4.9607954025268555, "global_step": 6616, "epoch": 157} {"train_loss": -4.9210028648376465, "global_step": 6617, "epoch": 157} {"train_loss": -4.865621089935303, "global_step": 6618, "epoch": 157} {"train_loss": -4.788125991821289, "global_step": 6619, "epoch": 157} {"train_loss": -4.977231979370117, "global_step": 6620, "epoch": 157} {"train_loss": -4.960721969604492, "global_step": 6621, "epoch": 157} {"train_loss": -4.955327987670898, "global_step": 6622, "epoch": 157} {"train_loss": -4.9388933181762695, "global_step": 6623, "epoch": 157} {"train_loss": -4.7778778076171875, "global_step": 6624, "epoch": 157} {"train_loss": -4.947603702545166, "global_step": 6625, "epoch": 157} {"train_loss": -5.085236549377441, "global_step": 6626, "epoch": 157} {"train_loss": -4.823620796203613, "global_step": 6627, "epoch": 157} {"train_loss": -4.813955783843994, "global_step": 6628, "epoch": 157} {"train_loss": -4.965703010559082, "global_step": 6629, "epoch": 157} {"train_loss": -5.037023544311523, "global_step": 6630, "epoch": 157} {"train_loss": -4.839612007141113, "global_step": 6631, "epoch": 157} {"train_loss": -4.931149482727051, "global_step": 6632, "epoch": 157} {"train_loss": -4.974616050720215, "global_step": 6633, "epoch": 157} {"train_loss": -4.953611373901367, "global_step": 6634, "epoch": 157} {"train_loss": -4.88354366166251, "global_step": 6635, "epoch": 157, "val_loss": 86747.453125} {"train_loss": -4.753682613372803, "global_step": 6636, "epoch": 158} {"train_loss": -4.735713005065918, "global_step": 6637, "epoch": 158} {"train_loss": -4.848851203918457, "global_step": 6638, "epoch": 158} {"train_loss": -4.7432427406311035, "global_step": 6639, "epoch": 158} {"train_loss": -4.919996738433838, "global_step": 6640, "epoch": 158} {"train_loss": -4.667063236236572, "global_step": 6641, "epoch": 158} {"train_loss": -4.627735137939453, "global_step": 6642, "epoch": 158} {"train_loss": -4.821410655975342, "global_step": 6643, "epoch": 158} {"train_loss": -4.722739219665527, "global_step": 6644, "epoch": 158} {"train_loss": -4.609947204589844, "global_step": 6645, "epoch": 158} {"train_loss": -4.7450385093688965, "global_step": 6646, "epoch": 158} {"train_loss": -4.701687812805176, "global_step": 6647, "epoch": 158} {"train_loss": -4.731902122497559, "global_step": 6648, "epoch": 158} {"train_loss": -4.5986175537109375, "global_step": 6649, "epoch": 158} {"train_loss": -4.789294719696045, "global_step": 6650, "epoch": 158} {"train_loss": -4.8179402351379395, "global_step": 6651, "epoch": 158} {"train_loss": -4.828829288482666, "global_step": 6652, "epoch": 158} {"train_loss": -4.893742561340332, "global_step": 6653, "epoch": 158} {"train_loss": -4.806456089019775, "global_step": 6654, "epoch": 158} {"train_loss": -4.86215877532959, "global_step": 6655, "epoch": 158} {"train_loss": -5.016002178192139, "global_step": 6656, "epoch": 158} {"train_loss": -4.760272026062012, "global_step": 6657, "epoch": 158} {"train_loss": -4.90468168258667, "global_step": 6658, "epoch": 158} {"train_loss": -5.0194091796875, "global_step": 6659, "epoch": 158} {"train_loss": -4.886249542236328, "global_step": 6660, "epoch": 158} {"train_loss": -4.8492021560668945, "global_step": 6661, "epoch": 158} {"train_loss": -4.995357513427734, "global_step": 6662, "epoch": 158} {"train_loss": -4.7651896476745605, "global_step": 6663, "epoch": 158} {"train_loss": -4.895092964172363, "global_step": 6664, "epoch": 158} {"train_loss": -4.901418685913086, "global_step": 6665, "epoch": 158} {"train_loss": -4.797120094299316, "global_step": 6666, "epoch": 158} {"train_loss": -4.832907676696777, "global_step": 6667, "epoch": 158} {"train_loss": -4.837214469909668, "global_step": 6668, "epoch": 158} {"train_loss": -4.892191410064697, "global_step": 6669, "epoch": 158} {"train_loss": -4.949090003967285, "global_step": 6670, "epoch": 158} {"train_loss": -4.853569030761719, "global_step": 6671, "epoch": 158} {"train_loss": -4.933722019195557, "global_step": 6672, "epoch": 158} {"train_loss": -4.855374813079834, "global_step": 6673, "epoch": 158} {"train_loss": -4.738030910491943, "global_step": 6674, "epoch": 158} {"train_loss": -4.880880355834961, "global_step": 6675, "epoch": 158} {"train_loss": -4.790240287780762, "global_step": 6676, "epoch": 158} {"train_loss": -4.820088727133615, "global_step": 6677, "epoch": 158, "val_loss": 86111.0546875} {"train_loss": -4.912775039672852, "global_step": 6678, "epoch": 159} {"train_loss": -4.799666881561279, "global_step": 6679, "epoch": 159} {"train_loss": -4.911671161651611, "global_step": 6680, "epoch": 159} {"train_loss": -5.000396251678467, "global_step": 6681, "epoch": 159} {"train_loss": -4.905902862548828, "global_step": 6682, "epoch": 159} {"train_loss": -5.066866874694824, "global_step": 6683, "epoch": 159} {"train_loss": -5.02455997467041, "global_step": 6684, "epoch": 159} {"train_loss": -4.954775810241699, "global_step": 6685, "epoch": 159} {"train_loss": -4.922764778137207, "global_step": 6686, "epoch": 159} {"train_loss": -4.878821849822998, "global_step": 6687, "epoch": 159} {"train_loss": -4.718305587768555, "global_step": 6688, "epoch": 159} {"train_loss": -4.868508338928223, "global_step": 6689, "epoch": 159} {"train_loss": -4.934268951416016, "global_step": 6690, "epoch": 159} {"train_loss": -4.91978645324707, "global_step": 6691, "epoch": 159} {"train_loss": -4.57083797454834, "global_step": 6692, "epoch": 159} {"train_loss": -4.697924613952637, "global_step": 6693, "epoch": 159} {"train_loss": -4.799069404602051, "global_step": 6694, "epoch": 159} {"train_loss": -4.844796657562256, "global_step": 6695, "epoch": 159} {"train_loss": -4.7939229011535645, "global_step": 6696, "epoch": 159} {"train_loss": -4.836019992828369, "global_step": 6697, "epoch": 159} {"train_loss": -4.871375560760498, "global_step": 6698, "epoch": 159} {"train_loss": -4.694436073303223, "global_step": 6699, "epoch": 159} {"train_loss": -4.855778694152832, "global_step": 6700, "epoch": 159} {"train_loss": -4.814352035522461, "global_step": 6701, "epoch": 159} {"train_loss": -4.899238109588623, "global_step": 6702, "epoch": 159} {"train_loss": -4.925258636474609, "global_step": 6703, "epoch": 159} {"train_loss": -4.868243217468262, "global_step": 6704, "epoch": 159} {"train_loss": -4.989377498626709, "global_step": 6705, "epoch": 159} {"train_loss": -5.015174388885498, "global_step": 6706, "epoch": 159} {"train_loss": -4.988616943359375, "global_step": 6707, "epoch": 159} {"train_loss": -4.9233903884887695, "global_step": 6708, "epoch": 159} {"train_loss": -4.8988847732543945, "global_step": 6709, "epoch": 159} {"train_loss": -4.8949761390686035, "global_step": 6710, "epoch": 159} {"train_loss": -4.877119064331055, "global_step": 6711, "epoch": 159} {"train_loss": -4.945642471313477, "global_step": 6712, "epoch": 159} {"train_loss": -4.9218926429748535, "global_step": 6713, "epoch": 159} {"train_loss": -4.885775566101074, "global_step": 6714, "epoch": 159} {"train_loss": -4.96439266204834, "global_step": 6715, "epoch": 159} {"train_loss": -4.815361022949219, "global_step": 6716, "epoch": 159} {"train_loss": -4.920601844787598, "global_step": 6717, "epoch": 159} {"train_loss": -4.887887954711914, "global_step": 6718, "epoch": 159} {"train_loss": -4.883040768759591, "global_step": 6719, "epoch": 159, "val_loss": 86467.46875} {"train_loss": -4.956911087036133, "global_step": 6720, "epoch": 160} {"train_loss": -5.038906097412109, "global_step": 6721, "epoch": 160} {"train_loss": -4.844210624694824, "global_step": 6722, "epoch": 160} {"train_loss": -4.8018341064453125, "global_step": 6723, "epoch": 160} {"train_loss": -4.943192481994629, "global_step": 6724, "epoch": 160} {"train_loss": -4.864152908325195, "global_step": 6725, "epoch": 160} {"train_loss": -4.7666802406311035, "global_step": 6726, "epoch": 160} {"train_loss": -4.852389335632324, "global_step": 6727, "epoch": 160} {"train_loss": -4.98907995223999, "global_step": 6728, "epoch": 160} {"train_loss": -4.876227855682373, "global_step": 6729, "epoch": 160} {"train_loss": -4.8893022537231445, "global_step": 6730, "epoch": 160} {"train_loss": -4.922930717468262, "global_step": 6731, "epoch": 160} {"train_loss": -4.931584358215332, "global_step": 6732, "epoch": 160} {"train_loss": -4.909841537475586, "global_step": 6733, "epoch": 160} {"train_loss": -4.954502582550049, "global_step": 6734, "epoch": 160} {"train_loss": -4.739555835723877, "global_step": 6735, "epoch": 160} {"train_loss": -4.881621837615967, "global_step": 6736, "epoch": 160} {"train_loss": -4.861152648925781, "global_step": 6737, "epoch": 160} {"train_loss": -4.6712646484375, "global_step": 6738, "epoch": 160} {"train_loss": -5.056558609008789, "global_step": 6739, "epoch": 160} {"train_loss": -4.759529113769531, "global_step": 6740, "epoch": 160} {"train_loss": -4.588107109069824, "global_step": 6741, "epoch": 160} {"train_loss": -4.722919464111328, "global_step": 6742, "epoch": 160} {"train_loss": -4.682365417480469, "global_step": 6743, "epoch": 160} {"train_loss": -4.7457990646362305, "global_step": 6744, "epoch": 160} {"train_loss": -4.748473167419434, "global_step": 6745, "epoch": 160} {"train_loss": -4.750143051147461, "global_step": 6746, "epoch": 160} {"train_loss": -4.802691459655762, "global_step": 6747, "epoch": 160} {"train_loss": -4.784512519836426, "global_step": 6748, "epoch": 160} {"train_loss": -4.872409820556641, "global_step": 6749, "epoch": 160} {"train_loss": -4.934314727783203, "global_step": 6750, "epoch": 160} {"train_loss": -4.93126106262207, "global_step": 6751, "epoch": 160} {"train_loss": -4.9609375, "global_step": 6752, "epoch": 160} {"train_loss": -4.855798721313477, "global_step": 6753, "epoch": 160} {"train_loss": -5.0041704177856445, "global_step": 6754, "epoch": 160} {"train_loss": -4.887264728546143, "global_step": 6755, "epoch": 160} {"train_loss": -4.950628280639648, "global_step": 6756, "epoch": 160} {"train_loss": -4.883245468139648, "global_step": 6757, "epoch": 160} {"train_loss": -4.881471633911133, "global_step": 6758, "epoch": 160} {"train_loss": -5.0788445472717285, "global_step": 6759, "epoch": 160} {"train_loss": -4.996450424194336, "global_step": 6760, "epoch": 160} {"train_loss": -4.866532234918504, "global_step": 6761, "epoch": 160, "val_loss": 86337.1953125} {"train_loss": -4.964971542358398, "global_step": 6762, "epoch": 161} {"train_loss": -5.007885932922363, "global_step": 6763, "epoch": 161} {"train_loss": -4.915327072143555, "global_step": 6764, "epoch": 161} {"train_loss": -4.916118144989014, "global_step": 6765, "epoch": 161} {"train_loss": -4.894840240478516, "global_step": 6766, "epoch": 161} {"train_loss": -4.892849922180176, "global_step": 6767, "epoch": 161} {"train_loss": -4.986584663391113, "global_step": 6768, "epoch": 161} {"train_loss": -4.8273186683654785, "global_step": 6769, "epoch": 161} {"train_loss": -4.980146408081055, "global_step": 6770, "epoch": 161} {"train_loss": -5.074952125549316, "global_step": 6771, "epoch": 161} {"train_loss": -4.877254486083984, "global_step": 6772, "epoch": 161} {"train_loss": -4.907697677612305, "global_step": 6773, "epoch": 161} {"train_loss": -4.991693496704102, "global_step": 6774, "epoch": 161} {"train_loss": -4.9436421394348145, "global_step": 6775, "epoch": 161} {"train_loss": -4.951964378356934, "global_step": 6776, "epoch": 161} {"train_loss": -4.938992500305176, "global_step": 6777, "epoch": 161} {"train_loss": -4.908194065093994, "global_step": 6778, "epoch": 161} {"train_loss": -4.8805646896362305, "global_step": 6779, "epoch": 161} {"train_loss": -4.925349235534668, "global_step": 6780, "epoch": 161} {"train_loss": -4.875611782073975, "global_step": 6781, "epoch": 161} {"train_loss": -5.119165420532227, "global_step": 6782, "epoch": 161} {"train_loss": -4.787318229675293, "global_step": 6783, "epoch": 161} {"train_loss": -4.830924034118652, "global_step": 6784, "epoch": 161} {"train_loss": -4.907837867736816, "global_step": 6785, "epoch": 161} {"train_loss": -4.798389434814453, "global_step": 6786, "epoch": 161} {"train_loss": -4.796712398529053, "global_step": 6787, "epoch": 161} {"train_loss": -4.891157150268555, "global_step": 6788, "epoch": 161} {"train_loss": -4.922375679016113, "global_step": 6789, "epoch": 161} {"train_loss": -4.777242660522461, "global_step": 6790, "epoch": 161} {"train_loss": -4.745636940002441, "global_step": 6791, "epoch": 161} {"train_loss": -4.923590660095215, "global_step": 6792, "epoch": 161} {"train_loss": -4.975188255310059, "global_step": 6793, "epoch": 161} {"train_loss": -4.937574863433838, "global_step": 6794, "epoch": 161} {"train_loss": -4.978157997131348, "global_step": 6795, "epoch": 161} {"train_loss": -4.865823745727539, "global_step": 6796, "epoch": 161} {"train_loss": -4.97706413269043, "global_step": 6797, "epoch": 161} {"train_loss": -4.867027759552002, "global_step": 6798, "epoch": 161} {"train_loss": -4.991343021392822, "global_step": 6799, "epoch": 161} {"train_loss": -5.015566825866699, "global_step": 6800, "epoch": 161} {"train_loss": -4.896836280822754, "global_step": 6801, "epoch": 161} {"train_loss": -4.82492733001709, "global_step": 6802, "epoch": 161} {"train_loss": -4.910118806929815, "global_step": 6803, "epoch": 161, "val_loss": 87109.921875} {"train_loss": -4.860757827758789, "global_step": 6804, "epoch": 162} {"train_loss": -4.848644733428955, "global_step": 6805, "epoch": 162} {"train_loss": -4.911978244781494, "global_step": 6806, "epoch": 162} {"train_loss": -4.779923439025879, "global_step": 6807, "epoch": 162} {"train_loss": -4.810918807983398, "global_step": 6808, "epoch": 162} {"train_loss": -4.802944660186768, "global_step": 6809, "epoch": 162} {"train_loss": -4.767616271972656, "global_step": 6810, "epoch": 162} {"train_loss": -4.803274154663086, "global_step": 6811, "epoch": 162} {"train_loss": -4.82122802734375, "global_step": 6812, "epoch": 162} {"train_loss": -4.794368743896484, "global_step": 6813, "epoch": 162} {"train_loss": -4.530936241149902, "global_step": 6814, "epoch": 162} {"train_loss": -4.8943681716918945, "global_step": 6815, "epoch": 162} {"train_loss": -4.696275234222412, "global_step": 6816, "epoch": 162} {"train_loss": -4.967691898345947, "global_step": 6817, "epoch": 162} {"train_loss": -4.637607574462891, "global_step": 6818, "epoch": 162} {"train_loss": -4.569976806640625, "global_step": 6819, "epoch": 162} {"train_loss": -4.859194755554199, "global_step": 6820, "epoch": 162} {"train_loss": -4.63564920425415, "global_step": 6821, "epoch": 162} {"train_loss": -4.892695903778076, "global_step": 6822, "epoch": 162} {"train_loss": -4.529298305511475, "global_step": 6823, "epoch": 162} {"train_loss": -4.790128707885742, "global_step": 6824, "epoch": 162} {"train_loss": -4.653808116912842, "global_step": 6825, "epoch": 162} {"train_loss": -4.864377975463867, "global_step": 6826, "epoch": 162} {"train_loss": -4.754195213317871, "global_step": 6827, "epoch": 162} {"train_loss": -4.831212997436523, "global_step": 6828, "epoch": 162} {"train_loss": -4.792697906494141, "global_step": 6829, "epoch": 162} {"train_loss": -4.752621173858643, "global_step": 6830, "epoch": 162} {"train_loss": -4.871524810791016, "global_step": 6831, "epoch": 162} {"train_loss": -4.954509258270264, "global_step": 6832, "epoch": 162} {"train_loss": -4.96602201461792, "global_step": 6833, "epoch": 162} {"train_loss": -4.990886688232422, "global_step": 6834, "epoch": 162} {"train_loss": -4.905947208404541, "global_step": 6835, "epoch": 162} {"train_loss": -4.826998710632324, "global_step": 6836, "epoch": 162} {"train_loss": -4.836453437805176, "global_step": 6837, "epoch": 162} {"train_loss": -4.874685764312744, "global_step": 6838, "epoch": 162} {"train_loss": -4.84257698059082, "global_step": 6839, "epoch": 162} {"train_loss": -4.719318389892578, "global_step": 6840, "epoch": 162} {"train_loss": -4.87771463394165, "global_step": 6841, "epoch": 162} {"train_loss": -4.924686431884766, "global_step": 6842, "epoch": 162} {"train_loss": -4.652647972106934, "global_step": 6843, "epoch": 162} {"train_loss": -4.747666835784912, "global_step": 6844, "epoch": 162} {"train_loss": -4.803377162842524, "global_step": 6845, "epoch": 162, "val_loss": 87227.2421875} {"train_loss": -4.721832752227783, "global_step": 6846, "epoch": 163} {"train_loss": -4.804222106933594, "global_step": 6847, "epoch": 163} {"train_loss": -5.056920051574707, "global_step": 6848, "epoch": 163} {"train_loss": -4.664421081542969, "global_step": 6849, "epoch": 163} {"train_loss": -5.002142906188965, "global_step": 6850, "epoch": 163} {"train_loss": -4.9388298988342285, "global_step": 6851, "epoch": 163} {"train_loss": -4.929971694946289, "global_step": 6852, "epoch": 163} {"train_loss": -4.914394378662109, "global_step": 6853, "epoch": 163} {"train_loss": -4.829733848571777, "global_step": 6854, "epoch": 163} {"train_loss": -4.991689205169678, "global_step": 6855, "epoch": 163} {"train_loss": -4.970667362213135, "global_step": 6856, "epoch": 163} {"train_loss": -4.967462539672852, "global_step": 6857, "epoch": 163} {"train_loss": -4.935805797576904, "global_step": 6858, "epoch": 163} {"train_loss": -4.9160051345825195, "global_step": 6859, "epoch": 163} {"train_loss": -4.911472320556641, "global_step": 6860, "epoch": 163} {"train_loss": -5.154182434082031, "global_step": 6861, "epoch": 163} {"train_loss": -4.980847358703613, "global_step": 6862, "epoch": 163} {"train_loss": -4.91656494140625, "global_step": 6863, "epoch": 163} {"train_loss": -4.956202030181885, "global_step": 6864, "epoch": 163} {"train_loss": -4.961021423339844, "global_step": 6865, "epoch": 163} {"train_loss": -4.9809041023254395, "global_step": 6866, "epoch": 163} {"train_loss": -4.824915409088135, "global_step": 6867, "epoch": 163} {"train_loss": -5.081627368927002, "global_step": 6868, "epoch": 163} {"train_loss": -5.006325721740723, "global_step": 6869, "epoch": 163} {"train_loss": -5.058891773223877, "global_step": 6870, "epoch": 163} {"train_loss": -4.892975807189941, "global_step": 6871, "epoch": 163} {"train_loss": -4.914048194885254, "global_step": 6872, "epoch": 163} {"train_loss": -4.90828275680542, "global_step": 6873, "epoch": 163} {"train_loss": -5.060760498046875, "global_step": 6874, "epoch": 163} {"train_loss": -4.881429672241211, "global_step": 6875, "epoch": 163} {"train_loss": -4.825067520141602, "global_step": 6876, "epoch": 163} {"train_loss": -4.969511985778809, "global_step": 6877, "epoch": 163} {"train_loss": -4.954395294189453, "global_step": 6878, "epoch": 163} {"train_loss": -4.953695297241211, "global_step": 6879, "epoch": 163} {"train_loss": -5.040738105773926, "global_step": 6880, "epoch": 163} {"train_loss": -4.866150379180908, "global_step": 6881, "epoch": 163} {"train_loss": -4.905529975891113, "global_step": 6882, "epoch": 163} {"train_loss": -5.014573097229004, "global_step": 6883, "epoch": 163} {"train_loss": -4.978085994720459, "global_step": 6884, "epoch": 163} {"train_loss": -4.798458099365234, "global_step": 6885, "epoch": 163} {"train_loss": -4.832932949066162, "global_step": 6886, "epoch": 163} {"train_loss": -4.926211050578526, "global_step": 6887, "epoch": 163, "val_loss": 85810.4921875} {"train_loss": -4.773382663726807, "global_step": 6888, "epoch": 164} {"train_loss": -5.000326633453369, "global_step": 6889, "epoch": 164} {"train_loss": -4.760339736938477, "global_step": 6890, "epoch": 164} {"train_loss": -4.930574417114258, "global_step": 6891, "epoch": 164} {"train_loss": -4.910238265991211, "global_step": 6892, "epoch": 164} {"train_loss": -4.916831970214844, "global_step": 6893, "epoch": 164} {"train_loss": -4.962891578674316, "global_step": 6894, "epoch": 164} {"train_loss": -4.857514381408691, "global_step": 6895, "epoch": 164} {"train_loss": -5.047067642211914, "global_step": 6896, "epoch": 164} {"train_loss": -4.872417449951172, "global_step": 6897, "epoch": 164} {"train_loss": -4.907427787780762, "global_step": 6898, "epoch": 164} {"train_loss": -5.047801494598389, "global_step": 6899, "epoch": 164} {"train_loss": -4.863840103149414, "global_step": 6900, "epoch": 164} {"train_loss": -5.0390167236328125, "global_step": 6901, "epoch": 164} {"train_loss": -4.893532752990723, "global_step": 6902, "epoch": 164} {"train_loss": -4.867792129516602, "global_step": 6903, "epoch": 164} {"train_loss": -4.9266438484191895, "global_step": 6904, "epoch": 164} {"train_loss": -5.039427280426025, "global_step": 6905, "epoch": 164} {"train_loss": -4.91282320022583, "global_step": 6906, "epoch": 164} {"train_loss": -4.755087375640869, "global_step": 6907, "epoch": 164} {"train_loss": -4.875858306884766, "global_step": 6908, "epoch": 164} {"train_loss": -4.919260501861572, "global_step": 6909, "epoch": 164} {"train_loss": -4.722769737243652, "global_step": 6910, "epoch": 164} {"train_loss": -4.93531608581543, "global_step": 6911, "epoch": 164} {"train_loss": -5.0570969581604, "global_step": 6912, "epoch": 164} {"train_loss": -4.854846954345703, "global_step": 6913, "epoch": 164} {"train_loss": -4.813419342041016, "global_step": 6914, "epoch": 164} {"train_loss": -4.842840671539307, "global_step": 6915, "epoch": 164} {"train_loss": -4.7748613357543945, "global_step": 6916, "epoch": 164} {"train_loss": -4.781833648681641, "global_step": 6917, "epoch": 164} {"train_loss": -4.957242488861084, "global_step": 6918, "epoch": 164} {"train_loss": -4.959836959838867, "global_step": 6919, "epoch": 164} {"train_loss": -4.7462263107299805, "global_step": 6920, "epoch": 164} {"train_loss": -4.823101997375488, "global_step": 6921, "epoch": 164} {"train_loss": -4.785886764526367, "global_step": 6922, "epoch": 164} {"train_loss": -4.6810832023620605, "global_step": 6923, "epoch": 164} {"train_loss": -4.992603302001953, "global_step": 6924, "epoch": 164} {"train_loss": -4.831549644470215, "global_step": 6925, "epoch": 164} {"train_loss": -4.77101993560791, "global_step": 6926, "epoch": 164} {"train_loss": -4.9967041015625, "global_step": 6927, "epoch": 164} {"train_loss": -4.957143306732178, "global_step": 6928, "epoch": 164} {"train_loss": -4.886639958336239, "global_step": 6929, "epoch": 164, "val_loss": 85659.53125} {"train_loss": -4.863905429840088, "global_step": 6930, "epoch": 165} {"train_loss": -4.865128517150879, "global_step": 6931, "epoch": 165} {"train_loss": -4.969261169433594, "global_step": 6932, "epoch": 165} {"train_loss": -4.9460577964782715, "global_step": 6933, "epoch": 165} {"train_loss": -4.910412788391113, "global_step": 6934, "epoch": 165} {"train_loss": -5.046624183654785, "global_step": 6935, "epoch": 165} {"train_loss": -4.75704288482666, "global_step": 6936, "epoch": 165} {"train_loss": -5.012477397918701, "global_step": 6937, "epoch": 165} {"train_loss": -5.05253791809082, "global_step": 6938, "epoch": 165} {"train_loss": -4.965993404388428, "global_step": 6939, "epoch": 165} {"train_loss": -4.961690902709961, "global_step": 6940, "epoch": 165} {"train_loss": -4.9343743324279785, "global_step": 6941, "epoch": 165} {"train_loss": -5.114523887634277, "global_step": 6942, "epoch": 165} {"train_loss": -4.850780487060547, "global_step": 6943, "epoch": 165} {"train_loss": -4.784486770629883, "global_step": 6944, "epoch": 165} {"train_loss": -4.753112316131592, "global_step": 6945, "epoch": 165} {"train_loss": -4.786423206329346, "global_step": 6946, "epoch": 165} {"train_loss": -4.899457931518555, "global_step": 6947, "epoch": 165} {"train_loss": -4.932544708251953, "global_step": 6948, "epoch": 165} {"train_loss": -4.948975086212158, "global_step": 6949, "epoch": 165} {"train_loss": -4.840267181396484, "global_step": 6950, "epoch": 165} {"train_loss": -4.6634650230407715, "global_step": 6951, "epoch": 165} {"train_loss": -5.027743339538574, "global_step": 6952, "epoch": 165} {"train_loss": -4.867484092712402, "global_step": 6953, "epoch": 165} {"train_loss": -4.861601829528809, "global_step": 6954, "epoch": 165} {"train_loss": -4.859745025634766, "global_step": 6955, "epoch": 165} {"train_loss": -4.869194030761719, "global_step": 6956, "epoch": 165} {"train_loss": -4.788743019104004, "global_step": 6957, "epoch": 165} {"train_loss": -4.987842559814453, "global_step": 6958, "epoch": 165} {"train_loss": -4.958670139312744, "global_step": 6959, "epoch": 165} {"train_loss": -4.958354949951172, "global_step": 6960, "epoch": 165} {"train_loss": -5.060344219207764, "global_step": 6961, "epoch": 165} {"train_loss": -4.85956335067749, "global_step": 6962, "epoch": 165} {"train_loss": -5.050702095031738, "global_step": 6963, "epoch": 165} {"train_loss": -4.9333086013793945, "global_step": 6964, "epoch": 165} {"train_loss": -4.846469879150391, "global_step": 6965, "epoch": 165} {"train_loss": -4.920566558837891, "global_step": 6966, "epoch": 165} {"train_loss": -4.993520736694336, "global_step": 6967, "epoch": 165} {"train_loss": -4.956254005432129, "global_step": 6968, "epoch": 165} {"train_loss": -4.983539581298828, "global_step": 6969, "epoch": 165} {"train_loss": -4.990996837615967, "global_step": 6970, "epoch": 165} {"train_loss": -4.918095815749395, "global_step": 6971, "epoch": 165, "val_loss": 85317.1484375} {"train_loss": -4.9147539138793945, "global_step": 6972, "epoch": 166} {"train_loss": -4.974045276641846, "global_step": 6973, "epoch": 166} {"train_loss": -4.926476001739502, "global_step": 6974, "epoch": 166} {"train_loss": -5.010219097137451, "global_step": 6975, "epoch": 166} {"train_loss": -4.975384712219238, "global_step": 6976, "epoch": 166} {"train_loss": -4.946680068969727, "global_step": 6977, "epoch": 166} {"train_loss": -5.007897853851318, "global_step": 6978, "epoch": 166} {"train_loss": -4.759287357330322, "global_step": 6979, "epoch": 166} {"train_loss": -4.965222358703613, "global_step": 6980, "epoch": 166} {"train_loss": -4.871837139129639, "global_step": 6981, "epoch": 166} {"train_loss": -4.753912925720215, "global_step": 6982, "epoch": 166} {"train_loss": -4.791962623596191, "global_step": 6983, "epoch": 166} {"train_loss": -4.754284381866455, "global_step": 6984, "epoch": 166} {"train_loss": -4.551904201507568, "global_step": 6985, "epoch": 166} {"train_loss": -4.821873664855957, "global_step": 6986, "epoch": 166} {"train_loss": -4.742733955383301, "global_step": 6987, "epoch": 166} {"train_loss": -4.867390155792236, "global_step": 6988, "epoch": 166} {"train_loss": -4.535789489746094, "global_step": 6989, "epoch": 166} {"train_loss": -4.8210625648498535, "global_step": 6990, "epoch": 166} {"train_loss": -4.819676399230957, "global_step": 6991, "epoch": 166} {"train_loss": -4.798038005828857, "global_step": 6992, "epoch": 166} {"train_loss": -4.9266743659973145, "global_step": 6993, "epoch": 166} {"train_loss": -4.7769551277160645, "global_step": 6994, "epoch": 166} {"train_loss": -4.767862319946289, "global_step": 6995, "epoch": 166} {"train_loss": -4.60931396484375, "global_step": 6996, "epoch": 166} {"train_loss": -4.881369590759277, "global_step": 6997, "epoch": 166} {"train_loss": -4.779858589172363, "global_step": 6998, "epoch": 166} {"train_loss": -4.799522876739502, "global_step": 6999, "epoch": 166} {"train_loss": -4.887378692626953, "global_step": 7000, "epoch": 166} {"train_loss": -4.983490467071533, "global_step": 7001, "epoch": 166} {"train_loss": -4.782090663909912, "global_step": 7002, "epoch": 166} {"train_loss": -4.793911933898926, "global_step": 7003, "epoch": 166} {"train_loss": -4.911843299865723, "global_step": 7004, "epoch": 166} {"train_loss": -4.848346710205078, "global_step": 7005, "epoch": 166} {"train_loss": -4.8549699783325195, "global_step": 7006, "epoch": 166} {"train_loss": -4.971148490905762, "global_step": 7007, "epoch": 166} {"train_loss": -4.88596248626709, "global_step": 7008, "epoch": 166} {"train_loss": -4.955071449279785, "global_step": 7009, "epoch": 166} {"train_loss": -5.067292213439941, "global_step": 7010, "epoch": 166} {"train_loss": -5.023865222930908, "global_step": 7011, "epoch": 166} {"train_loss": -4.90557336807251, "global_step": 7012, "epoch": 166} {"train_loss": -4.855999753588722, "global_step": 7013, "epoch": 166, "val_loss": 85317.2734375} {"train_loss": -4.964252471923828, "global_step": 7014, "epoch": 167} {"train_loss": -4.919933319091797, "global_step": 7015, "epoch": 167} {"train_loss": -4.9200053215026855, "global_step": 7016, "epoch": 167} {"train_loss": -4.955143928527832, "global_step": 7017, "epoch": 167} {"train_loss": -5.03809118270874, "global_step": 7018, "epoch": 167} {"train_loss": -4.797510147094727, "global_step": 7019, "epoch": 167} {"train_loss": -4.943686485290527, "global_step": 7020, "epoch": 167} {"train_loss": -5.0305047035217285, "global_step": 7021, "epoch": 167} {"train_loss": -4.844770431518555, "global_step": 7022, "epoch": 167} {"train_loss": -4.844223499298096, "global_step": 7023, "epoch": 167} {"train_loss": -5.067574977874756, "global_step": 7024, "epoch": 167} {"train_loss": -4.966980934143066, "global_step": 7025, "epoch": 167} {"train_loss": -5.053716659545898, "global_step": 7026, "epoch": 167} {"train_loss": -5.190497398376465, "global_step": 7027, "epoch": 167} {"train_loss": -4.931249141693115, "global_step": 7028, "epoch": 167} {"train_loss": -4.847488880157471, "global_step": 7029, "epoch": 167} {"train_loss": -4.8344645500183105, "global_step": 7030, "epoch": 167} {"train_loss": -4.989229679107666, "global_step": 7031, "epoch": 167} {"train_loss": -4.873922348022461, "global_step": 7032, "epoch": 167} {"train_loss": -4.978994369506836, "global_step": 7033, "epoch": 167} {"train_loss": -4.885015487670898, "global_step": 7034, "epoch": 167} {"train_loss": -4.889545440673828, "global_step": 7035, "epoch": 167} {"train_loss": -4.930144786834717, "global_step": 7036, "epoch": 167} {"train_loss": -5.027004718780518, "global_step": 7037, "epoch": 167} {"train_loss": -4.890982151031494, "global_step": 7038, "epoch": 167} {"train_loss": -4.761411666870117, "global_step": 7039, "epoch": 167} {"train_loss": -4.947155952453613, "global_step": 7040, "epoch": 167} {"train_loss": -5.045172691345215, "global_step": 7041, "epoch": 167} {"train_loss": -4.899946212768555, "global_step": 7042, "epoch": 167} {"train_loss": -4.783390998840332, "global_step": 7043, "epoch": 167} {"train_loss": -4.911957740783691, "global_step": 7044, "epoch": 167} {"train_loss": -4.93536376953125, "global_step": 7045, "epoch": 167} {"train_loss": -4.798615455627441, "global_step": 7046, "epoch": 167} {"train_loss": -4.802786350250244, "global_step": 7047, "epoch": 167} {"train_loss": -5.096714973449707, "global_step": 7048, "epoch": 167} {"train_loss": -4.72027587890625, "global_step": 7049, "epoch": 167} {"train_loss": -5.022947788238525, "global_step": 7050, "epoch": 167} {"train_loss": -4.914072036743164, "global_step": 7051, "epoch": 167} {"train_loss": -4.830900192260742, "global_step": 7052, "epoch": 167} {"train_loss": -4.868810653686523, "global_step": 7053, "epoch": 167} {"train_loss": -4.982718467712402, "global_step": 7054, "epoch": 167} {"train_loss": -4.927298625310262, "global_step": 7055, "epoch": 167, "val_loss": 86401.8515625} {"train_loss": -4.793558120727539, "global_step": 7056, "epoch": 168} {"train_loss": -4.9207329750061035, "global_step": 7057, "epoch": 168} {"train_loss": -4.948830604553223, "global_step": 7058, "epoch": 168} {"train_loss": -4.810647964477539, "global_step": 7059, "epoch": 168} {"train_loss": -4.881587982177734, "global_step": 7060, "epoch": 168} {"train_loss": -4.975226402282715, "global_step": 7061, "epoch": 168} {"train_loss": -5.024019241333008, "global_step": 7062, "epoch": 168} {"train_loss": -4.886667728424072, "global_step": 7063, "epoch": 168} {"train_loss": -5.094606399536133, "global_step": 7064, "epoch": 168} {"train_loss": -4.853931427001953, "global_step": 7065, "epoch": 168} {"train_loss": -4.9445695877075195, "global_step": 7066, "epoch": 168} {"train_loss": -5.010461807250977, "global_step": 7067, "epoch": 168} {"train_loss": -5.062253475189209, "global_step": 7068, "epoch": 168} {"train_loss": -4.78001594543457, "global_step": 7069, "epoch": 168} {"train_loss": -4.834318161010742, "global_step": 7070, "epoch": 168} {"train_loss": -4.908376693725586, "global_step": 7071, "epoch": 168} {"train_loss": -4.878817558288574, "global_step": 7072, "epoch": 168} {"train_loss": -4.944858074188232, "global_step": 7073, "epoch": 168} {"train_loss": -4.995616912841797, "global_step": 7074, "epoch": 168} {"train_loss": -4.939402103424072, "global_step": 7075, "epoch": 168} {"train_loss": -4.777955055236816, "global_step": 7076, "epoch": 168} {"train_loss": -4.897700786590576, "global_step": 7077, "epoch": 168} {"train_loss": -4.911599159240723, "global_step": 7078, "epoch": 168} {"train_loss": -4.981223106384277, "global_step": 7079, "epoch": 168} {"train_loss": -5.058248996734619, "global_step": 7080, "epoch": 168} {"train_loss": -5.011919021606445, "global_step": 7081, "epoch": 168} {"train_loss": -5.0706257820129395, "global_step": 7082, "epoch": 168} {"train_loss": -4.87010383605957, "global_step": 7083, "epoch": 168} {"train_loss": -4.92059326171875, "global_step": 7084, "epoch": 168} {"train_loss": -4.757144927978516, "global_step": 7085, "epoch": 168} {"train_loss": -4.879569053649902, "global_step": 7086, "epoch": 168} {"train_loss": -4.985126495361328, "global_step": 7087, "epoch": 168} {"train_loss": -4.928689002990723, "global_step": 7088, "epoch": 168} {"train_loss": -4.89963436126709, "global_step": 7089, "epoch": 168} {"train_loss": -4.970423221588135, "global_step": 7090, "epoch": 168} {"train_loss": -4.70720100402832, "global_step": 7091, "epoch": 168} {"train_loss": -4.909809589385986, "global_step": 7092, "epoch": 168} {"train_loss": -4.782437801361084, "global_step": 7093, "epoch": 168} {"train_loss": -4.841442108154297, "global_step": 7094, "epoch": 168} {"train_loss": -4.93693208694458, "global_step": 7095, "epoch": 168} {"train_loss": -4.903514385223389, "global_step": 7096, "epoch": 168} {"train_loss": -4.91008784657433, "global_step": 7097, "epoch": 168, "val_loss": 84149.9453125} {"train_loss": -5.008796691894531, "global_step": 7098, "epoch": 169} {"train_loss": -5.030457496643066, "global_step": 7099, "epoch": 169} {"train_loss": -4.812588691711426, "global_step": 7100, "epoch": 169} {"train_loss": -4.832027435302734, "global_step": 7101, "epoch": 169} {"train_loss": -4.9446635246276855, "global_step": 7102, "epoch": 169} {"train_loss": -4.869548797607422, "global_step": 7103, "epoch": 169} {"train_loss": -4.858420372009277, "global_step": 7104, "epoch": 169} {"train_loss": -4.905229568481445, "global_step": 7105, "epoch": 169} {"train_loss": -4.960670471191406, "global_step": 7106, "epoch": 169} {"train_loss": -4.980347633361816, "global_step": 7107, "epoch": 169} {"train_loss": -4.825991630554199, "global_step": 7108, "epoch": 169} {"train_loss": -4.859764099121094, "global_step": 7109, "epoch": 169} {"train_loss": -4.897568702697754, "global_step": 7110, "epoch": 169} {"train_loss": -4.845827102661133, "global_step": 7111, "epoch": 169} {"train_loss": -4.841419696807861, "global_step": 7112, "epoch": 169} {"train_loss": -4.854348659515381, "global_step": 7113, "epoch": 169} {"train_loss": -4.9806108474731445, "global_step": 7114, "epoch": 169} {"train_loss": -4.993358135223389, "global_step": 7115, "epoch": 169} {"train_loss": -4.69518518447876, "global_step": 7116, "epoch": 169} {"train_loss": -4.912942886352539, "global_step": 7117, "epoch": 169} {"train_loss": -4.8586297035217285, "global_step": 7118, "epoch": 169} {"train_loss": -4.877528190612793, "global_step": 7119, "epoch": 169} {"train_loss": -5.0121073722839355, "global_step": 7120, "epoch": 169} {"train_loss": -4.7726263999938965, "global_step": 7121, "epoch": 169} {"train_loss": -4.905585765838623, "global_step": 7122, "epoch": 169} {"train_loss": -4.780112266540527, "global_step": 7123, "epoch": 169} {"train_loss": -4.774978160858154, "global_step": 7124, "epoch": 169} {"train_loss": -4.866469383239746, "global_step": 7125, "epoch": 169} {"train_loss": -4.839391708374023, "global_step": 7126, "epoch": 169} {"train_loss": -4.858896732330322, "global_step": 7127, "epoch": 169} {"train_loss": -4.948206901550293, "global_step": 7128, "epoch": 169} {"train_loss": -4.894914627075195, "global_step": 7129, "epoch": 169} {"train_loss": -5.022922992706299, "global_step": 7130, "epoch": 169} {"train_loss": -4.77288293838501, "global_step": 7131, "epoch": 169} {"train_loss": -4.873178482055664, "global_step": 7132, "epoch": 169} {"train_loss": -4.959263324737549, "global_step": 7133, "epoch": 169} {"train_loss": -4.996519565582275, "global_step": 7134, "epoch": 169} {"train_loss": -4.785828113555908, "global_step": 7135, "epoch": 169} {"train_loss": -4.89268684387207, "global_step": 7136, "epoch": 169} {"train_loss": -4.926009178161621, "global_step": 7137, "epoch": 169} {"train_loss": -4.953808784484863, "global_step": 7138, "epoch": 169} {"train_loss": -4.889709835960751, "global_step": 7139, "epoch": 169, "val_loss": 86584.5546875} {"train_loss": -4.920839309692383, "global_step": 7140, "epoch": 170} {"train_loss": -5.0078511238098145, "global_step": 7141, "epoch": 170} {"train_loss": -5.040237903594971, "global_step": 7142, "epoch": 170} {"train_loss": -4.9211835861206055, "global_step": 7143, "epoch": 170} {"train_loss": -4.937451362609863, "global_step": 7144, "epoch": 170} {"train_loss": -4.913522720336914, "global_step": 7145, "epoch": 170} {"train_loss": -4.866103172302246, "global_step": 7146, "epoch": 170} {"train_loss": -5.071465015411377, "global_step": 7147, "epoch": 170} {"train_loss": -4.927579879760742, "global_step": 7148, "epoch": 170} {"train_loss": -4.958636283874512, "global_step": 7149, "epoch": 170} {"train_loss": -4.863323211669922, "global_step": 7150, "epoch": 170} {"train_loss": -4.921542167663574, "global_step": 7151, "epoch": 170} {"train_loss": -4.956853866577148, "global_step": 7152, "epoch": 170} {"train_loss": -5.032562255859375, "global_step": 7153, "epoch": 170} {"train_loss": -4.928378105163574, "global_step": 7154, "epoch": 170} {"train_loss": -4.878180503845215, "global_step": 7155, "epoch": 170} {"train_loss": -4.956987380981445, "global_step": 7156, "epoch": 170} {"train_loss": -4.893982410430908, "global_step": 7157, "epoch": 170} {"train_loss": -4.980463027954102, "global_step": 7158, "epoch": 170} {"train_loss": -4.916230201721191, "global_step": 7159, "epoch": 170} {"train_loss": -4.995180130004883, "global_step": 7160, "epoch": 170} {"train_loss": -4.965113639831543, "global_step": 7161, "epoch": 170} {"train_loss": -5.023279190063477, "global_step": 7162, "epoch": 170} {"train_loss": -4.925640106201172, "global_step": 7163, "epoch": 170} {"train_loss": -5.083099365234375, "global_step": 7164, "epoch": 170} {"train_loss": -5.049740791320801, "global_step": 7165, "epoch": 170} {"train_loss": -4.874566078186035, "global_step": 7166, "epoch": 170} {"train_loss": -5.024036407470703, "global_step": 7167, "epoch": 170} {"train_loss": -4.8217315673828125, "global_step": 7168, "epoch": 170} {"train_loss": -5.062771320343018, "global_step": 7169, "epoch": 170} {"train_loss": -5.050896644592285, "global_step": 7170, "epoch": 170} {"train_loss": -4.700692653656006, "global_step": 7171, "epoch": 170} {"train_loss": -4.988024711608887, "global_step": 7172, "epoch": 170} {"train_loss": -4.930846691131592, "global_step": 7173, "epoch": 170} {"train_loss": -4.943193435668945, "global_step": 7174, "epoch": 170} {"train_loss": -4.797235488891602, "global_step": 7175, "epoch": 170} {"train_loss": -4.982245445251465, "global_step": 7176, "epoch": 170} {"train_loss": -4.825900077819824, "global_step": 7177, "epoch": 170} {"train_loss": -4.786160945892334, "global_step": 7178, "epoch": 170} {"train_loss": -4.7697038650512695, "global_step": 7179, "epoch": 170} {"train_loss": -4.709912300109863, "global_step": 7180, "epoch": 170} {"train_loss": -4.927389712560744, "global_step": 7181, "epoch": 170, "val_loss": 84447.4921875} {"train_loss": -4.89711856842041, "global_step": 7182, "epoch": 171} {"train_loss": -4.86279821395874, "global_step": 7183, "epoch": 171} {"train_loss": -4.686628341674805, "global_step": 7184, "epoch": 171} {"train_loss": -4.913624286651611, "global_step": 7185, "epoch": 171} {"train_loss": -4.919754981994629, "global_step": 7186, "epoch": 171} {"train_loss": -4.878485679626465, "global_step": 7187, "epoch": 171} {"train_loss": -4.968435764312744, "global_step": 7188, "epoch": 171} {"train_loss": -5.025874614715576, "global_step": 7189, "epoch": 171} {"train_loss": -4.94329833984375, "global_step": 7190, "epoch": 171} {"train_loss": -5.013618469238281, "global_step": 7191, "epoch": 171} {"train_loss": -4.8899335861206055, "global_step": 7192, "epoch": 171} {"train_loss": -4.901668548583984, "global_step": 7193, "epoch": 171} {"train_loss": -4.979673385620117, "global_step": 7194, "epoch": 171} {"train_loss": -4.988798141479492, "global_step": 7195, "epoch": 171} {"train_loss": -4.859602451324463, "global_step": 7196, "epoch": 171} {"train_loss": -4.892546653747559, "global_step": 7197, "epoch": 171} {"train_loss": -4.893849849700928, "global_step": 7198, "epoch": 171} {"train_loss": -4.893500328063965, "global_step": 7199, "epoch": 171} {"train_loss": -4.955024242401123, "global_step": 7200, "epoch": 171} {"train_loss": -4.8722710609436035, "global_step": 7201, "epoch": 171} {"train_loss": -4.8376312255859375, "global_step": 7202, "epoch": 171} {"train_loss": -4.686408996582031, "global_step": 7203, "epoch": 171} {"train_loss": -4.902597904205322, "global_step": 7204, "epoch": 171} {"train_loss": -4.932981967926025, "global_step": 7205, "epoch": 171} {"train_loss": -4.928035736083984, "global_step": 7206, "epoch": 171} {"train_loss": -4.960216522216797, "global_step": 7207, "epoch": 171} {"train_loss": -4.917628288269043, "global_step": 7208, "epoch": 171} {"train_loss": -5.006443023681641, "global_step": 7209, "epoch": 171} {"train_loss": -4.790045738220215, "global_step": 7210, "epoch": 171} {"train_loss": -4.806425094604492, "global_step": 7211, "epoch": 171} {"train_loss": -5.063241004943848, "global_step": 7212, "epoch": 171} {"train_loss": -4.971363067626953, "global_step": 7213, "epoch": 171} {"train_loss": -4.935661792755127, "global_step": 7214, "epoch": 171} {"train_loss": -4.81752872467041, "global_step": 7215, "epoch": 171} {"train_loss": -4.972028732299805, "global_step": 7216, "epoch": 171} {"train_loss": -4.93198299407959, "global_step": 7217, "epoch": 171} {"train_loss": -4.925423622131348, "global_step": 7218, "epoch": 171} {"train_loss": -4.994699954986572, "global_step": 7219, "epoch": 171} {"train_loss": -5.019783973693848, "global_step": 7220, "epoch": 171} {"train_loss": -4.920243263244629, "global_step": 7221, "epoch": 171} {"train_loss": -4.861527442932129, "global_step": 7222, "epoch": 171} {"train_loss": -4.915642420450847, "global_step": 7223, "epoch": 171, "val_loss": 84155.921875} {"train_loss": -5.026426792144775, "global_step": 7224, "epoch": 172} {"train_loss": -4.8504109382629395, "global_step": 7225, "epoch": 172} {"train_loss": -5.002371311187744, "global_step": 7226, "epoch": 172} {"train_loss": -4.981971740722656, "global_step": 7227, "epoch": 172} {"train_loss": -4.9123687744140625, "global_step": 7228, "epoch": 172} {"train_loss": -5.033267021179199, "global_step": 7229, "epoch": 172} {"train_loss": -5.105511665344238, "global_step": 7230, "epoch": 172} {"train_loss": -4.962882041931152, "global_step": 7231, "epoch": 172} {"train_loss": -5.061085224151611, "global_step": 7232, "epoch": 172} {"train_loss": -4.83213472366333, "global_step": 7233, "epoch": 172} {"train_loss": -4.943802833557129, "global_step": 7234, "epoch": 172} {"train_loss": -4.963062286376953, "global_step": 7235, "epoch": 172} {"train_loss": -4.986025810241699, "global_step": 7236, "epoch": 172} {"train_loss": -4.91258430480957, "global_step": 7237, "epoch": 172} {"train_loss": -4.815381050109863, "global_step": 7238, "epoch": 172} {"train_loss": -4.739962100982666, "global_step": 7239, "epoch": 172} {"train_loss": -4.979465484619141, "global_step": 7240, "epoch": 172} {"train_loss": -4.965095520019531, "global_step": 7241, "epoch": 172} {"train_loss": -4.791973114013672, "global_step": 7242, "epoch": 172} {"train_loss": -4.873028755187988, "global_step": 7243, "epoch": 172} {"train_loss": -5.001110076904297, "global_step": 7244, "epoch": 172} {"train_loss": -4.990683555603027, "global_step": 7245, "epoch": 172} {"train_loss": -5.018850326538086, "global_step": 7246, "epoch": 172} {"train_loss": -4.967988967895508, "global_step": 7247, "epoch": 172} {"train_loss": -5.008315563201904, "global_step": 7248, "epoch": 172} {"train_loss": -4.963605880737305, "global_step": 7249, "epoch": 172} {"train_loss": -4.917577743530273, "global_step": 7250, "epoch": 172} {"train_loss": -4.811624526977539, "global_step": 7251, "epoch": 172} {"train_loss": -4.9538798332214355, "global_step": 7252, "epoch": 172} {"train_loss": -4.6766557693481445, "global_step": 7253, "epoch": 172} {"train_loss": -4.992464065551758, "global_step": 7254, "epoch": 172} {"train_loss": -4.8410139083862305, "global_step": 7255, "epoch": 172} {"train_loss": -4.6894636154174805, "global_step": 7256, "epoch": 172} {"train_loss": -4.923125267028809, "global_step": 7257, "epoch": 172} {"train_loss": -4.817121505737305, "global_step": 7258, "epoch": 172} {"train_loss": -5.006882667541504, "global_step": 7259, "epoch": 172} {"train_loss": -4.998969078063965, "global_step": 7260, "epoch": 172} {"train_loss": -4.8431172370910645, "global_step": 7261, "epoch": 172} {"train_loss": -4.885005950927734, "global_step": 7262, "epoch": 172} {"train_loss": -4.966546058654785, "global_step": 7263, "epoch": 172} {"train_loss": -4.958189964294434, "global_step": 7264, "epoch": 172} {"train_loss": -4.926999387286958, "global_step": 7265, "epoch": 172, "val_loss": 84915.453125} {"train_loss": -4.8066511154174805, "global_step": 7266, "epoch": 173} {"train_loss": -4.90789794921875, "global_step": 7267, "epoch": 173} {"train_loss": -4.91851806640625, "global_step": 7268, "epoch": 173} {"train_loss": -4.927892208099365, "global_step": 7269, "epoch": 173} {"train_loss": -4.97786808013916, "global_step": 7270, "epoch": 173} {"train_loss": -4.940622329711914, "global_step": 7271, "epoch": 173} {"train_loss": -4.9777302742004395, "global_step": 7272, "epoch": 173} {"train_loss": -5.013594627380371, "global_step": 7273, "epoch": 173} {"train_loss": -4.880661964416504, "global_step": 7274, "epoch": 173} {"train_loss": -5.048123359680176, "global_step": 7275, "epoch": 173} {"train_loss": -4.892435073852539, "global_step": 7276, "epoch": 173} {"train_loss": -4.8506975173950195, "global_step": 7277, "epoch": 173} {"train_loss": -5.090627193450928, "global_step": 7278, "epoch": 173} {"train_loss": -5.032904624938965, "global_step": 7279, "epoch": 173} {"train_loss": -4.891942024230957, "global_step": 7280, "epoch": 173} {"train_loss": -4.947264671325684, "global_step": 7281, "epoch": 173} {"train_loss": -4.986725807189941, "global_step": 7282, "epoch": 173} {"train_loss": -4.881528854370117, "global_step": 7283, "epoch": 173} {"train_loss": -5.033690452575684, "global_step": 7284, "epoch": 173} {"train_loss": -5.028914451599121, "global_step": 7285, "epoch": 173} {"train_loss": -5.052745819091797, "global_step": 7286, "epoch": 173} {"train_loss": -4.977568626403809, "global_step": 7287, "epoch": 173} {"train_loss": -4.995424270629883, "global_step": 7288, "epoch": 173} {"train_loss": -4.775673866271973, "global_step": 7289, "epoch": 173} {"train_loss": -4.961148262023926, "global_step": 7290, "epoch": 173} {"train_loss": -4.969569206237793, "global_step": 7291, "epoch": 173} {"train_loss": -4.788852691650391, "global_step": 7292, "epoch": 173} {"train_loss": -4.881231307983398, "global_step": 7293, "epoch": 173} {"train_loss": -4.885289192199707, "global_step": 7294, "epoch": 173} {"train_loss": -4.765000820159912, "global_step": 7295, "epoch": 173} {"train_loss": -4.916116237640381, "global_step": 7296, "epoch": 173} {"train_loss": -4.695960998535156, "global_step": 7297, "epoch": 173} {"train_loss": -4.549618721008301, "global_step": 7298, "epoch": 173} {"train_loss": -4.655542850494385, "global_step": 7299, "epoch": 173} {"train_loss": -4.92237663269043, "global_step": 7300, "epoch": 173} {"train_loss": -4.784131050109863, "global_step": 7301, "epoch": 173} {"train_loss": -4.6882853507995605, "global_step": 7302, "epoch": 173} {"train_loss": -5.003106117248535, "global_step": 7303, "epoch": 173} {"train_loss": -4.784180641174316, "global_step": 7304, "epoch": 173} {"train_loss": -4.777851104736328, "global_step": 7305, "epoch": 173} {"train_loss": -4.810198783874512, "global_step": 7306, "epoch": 173} {"train_loss": -4.893115781602406, "global_step": 7307, "epoch": 173, "val_loss": 85292.640625} {"train_loss": -4.839008808135986, "global_step": 7308, "epoch": 174} {"train_loss": -4.910526275634766, "global_step": 7309, "epoch": 174} {"train_loss": -4.8843584060668945, "global_step": 7310, "epoch": 174} {"train_loss": -4.947707176208496, "global_step": 7311, "epoch": 174} {"train_loss": -4.92817497253418, "global_step": 7312, "epoch": 174} {"train_loss": -4.952537536621094, "global_step": 7313, "epoch": 174} {"train_loss": -5.100396156311035, "global_step": 7314, "epoch": 174} {"train_loss": -5.099371910095215, "global_step": 7315, "epoch": 174} {"train_loss": -4.6640849113464355, "global_step": 7316, "epoch": 174} {"train_loss": -4.9035725593566895, "global_step": 7317, "epoch": 174} {"train_loss": -5.012105941772461, "global_step": 7318, "epoch": 174} {"train_loss": -4.809744834899902, "global_step": 7319, "epoch": 174} {"train_loss": -4.863261699676514, "global_step": 7320, "epoch": 174} {"train_loss": -4.966545104980469, "global_step": 7321, "epoch": 174} {"train_loss": -4.827310085296631, "global_step": 7322, "epoch": 174} {"train_loss": -4.883445739746094, "global_step": 7323, "epoch": 174} {"train_loss": -4.9572343826293945, "global_step": 7324, "epoch": 174} {"train_loss": -4.788386344909668, "global_step": 7325, "epoch": 174} {"train_loss": -4.853808403015137, "global_step": 7326, "epoch": 174} {"train_loss": -4.838668346405029, "global_step": 7327, "epoch": 174} {"train_loss": -4.986611843109131, "global_step": 7328, "epoch": 174} {"train_loss": -4.955023765563965, "global_step": 7329, "epoch": 174} {"train_loss": -4.786679267883301, "global_step": 7330, "epoch": 174} {"train_loss": -4.960265636444092, "global_step": 7331, "epoch": 174} {"train_loss": -4.97786808013916, "global_step": 7332, "epoch": 174} {"train_loss": -4.997982025146484, "global_step": 7333, "epoch": 174} {"train_loss": -4.9948811531066895, "global_step": 7334, "epoch": 174} {"train_loss": -4.98001766204834, "global_step": 7335, "epoch": 174} {"train_loss": -4.880615234375, "global_step": 7336, "epoch": 174} {"train_loss": -4.9481096267700195, "global_step": 7337, "epoch": 174} {"train_loss": -4.971949100494385, "global_step": 7338, "epoch": 174} {"train_loss": -5.112130165100098, "global_step": 7339, "epoch": 174} {"train_loss": -4.9610700607299805, "global_step": 7340, "epoch": 174} {"train_loss": -4.9807024002075195, "global_step": 7341, "epoch": 174} {"train_loss": -5.034283638000488, "global_step": 7342, "epoch": 174} {"train_loss": -4.930976390838623, "global_step": 7343, "epoch": 174} {"train_loss": -4.945764541625977, "global_step": 7344, "epoch": 174} {"train_loss": -4.949638843536377, "global_step": 7345, "epoch": 174} {"train_loss": -4.987496376037598, "global_step": 7346, "epoch": 174} {"train_loss": -4.958884239196777, "global_step": 7347, "epoch": 174} {"train_loss": -4.84876823425293, "global_step": 7348, "epoch": 174} {"train_loss": -4.93519800049918, "global_step": 7349, "epoch": 174, "val_loss": 83735.5546875} {"train_loss": -4.927229881286621, "global_step": 7350, "epoch": 175} {"train_loss": -4.848414421081543, "global_step": 7351, "epoch": 175} {"train_loss": -4.88230037689209, "global_step": 7352, "epoch": 175} {"train_loss": -5.044260501861572, "global_step": 7353, "epoch": 175} {"train_loss": -4.793127059936523, "global_step": 7354, "epoch": 175} {"train_loss": -4.780612945556641, "global_step": 7355, "epoch": 175} {"train_loss": -4.970245361328125, "global_step": 7356, "epoch": 175} {"train_loss": -4.8584489822387695, "global_step": 7357, "epoch": 175} {"train_loss": -4.557559490203857, "global_step": 7358, "epoch": 175} {"train_loss": -4.926434516906738, "global_step": 7359, "epoch": 175} {"train_loss": -4.7976531982421875, "global_step": 7360, "epoch": 175} {"train_loss": -4.996915817260742, "global_step": 7361, "epoch": 175} {"train_loss": -4.829236030578613, "global_step": 7362, "epoch": 175} {"train_loss": -4.988225936889648, "global_step": 7363, "epoch": 175} {"train_loss": -4.945181846618652, "global_step": 7364, "epoch": 175} {"train_loss": -4.868295669555664, "global_step": 7365, "epoch": 175} {"train_loss": -5.0368452072143555, "global_step": 7366, "epoch": 175} {"train_loss": -4.743044376373291, "global_step": 7367, "epoch": 175} {"train_loss": -4.833178520202637, "global_step": 7368, "epoch": 175} {"train_loss": -5.022253513336182, "global_step": 7369, "epoch": 175} {"train_loss": -4.784492492675781, "global_step": 7370, "epoch": 175} {"train_loss": -4.975432872772217, "global_step": 7371, "epoch": 175} {"train_loss": -4.956486701965332, "global_step": 7372, "epoch": 175} {"train_loss": -4.850484848022461, "global_step": 7373, "epoch": 175} {"train_loss": -4.925708770751953, "global_step": 7374, "epoch": 175} {"train_loss": -4.929850101470947, "global_step": 7375, "epoch": 175} {"train_loss": -4.8447675704956055, "global_step": 7376, "epoch": 175} {"train_loss": -4.93623161315918, "global_step": 7377, "epoch": 175} {"train_loss": -4.8168559074401855, "global_step": 7378, "epoch": 175} {"train_loss": -4.912014484405518, "global_step": 7379, "epoch": 175} {"train_loss": -5.079281806945801, "global_step": 7380, "epoch": 175} {"train_loss": -4.804311752319336, "global_step": 7381, "epoch": 175} {"train_loss": -4.863517761230469, "global_step": 7382, "epoch": 175} {"train_loss": -5.037237167358398, "global_step": 7383, "epoch": 175} {"train_loss": -4.894397735595703, "global_step": 7384, "epoch": 175} {"train_loss": -5.020342826843262, "global_step": 7385, "epoch": 175} {"train_loss": -5.034482002258301, "global_step": 7386, "epoch": 175} {"train_loss": -4.840597152709961, "global_step": 7387, "epoch": 175} {"train_loss": -5.022055149078369, "global_step": 7388, "epoch": 175} {"train_loss": -4.882696151733398, "global_step": 7389, "epoch": 175} {"train_loss": -4.985691070556641, "global_step": 7390, "epoch": 175} {"train_loss": -4.9038857846033, "global_step": 7391, "epoch": 175, "val_loss": 84579.4609375} {"train_loss": -4.947909832000732, "global_step": 7392, "epoch": 176} {"train_loss": -4.72847843170166, "global_step": 7393, "epoch": 176} {"train_loss": -4.88560152053833, "global_step": 7394, "epoch": 176} {"train_loss": -4.8926286697387695, "global_step": 7395, "epoch": 176} {"train_loss": -5.000552177429199, "global_step": 7396, "epoch": 176} {"train_loss": -4.994442939758301, "global_step": 7397, "epoch": 176} {"train_loss": -4.979589939117432, "global_step": 7398, "epoch": 176} {"train_loss": -4.904852390289307, "global_step": 7399, "epoch": 176} {"train_loss": -4.845926284790039, "global_step": 7400, "epoch": 176} {"train_loss": -4.9570207595825195, "global_step": 7401, "epoch": 176} {"train_loss": -4.862857818603516, "global_step": 7402, "epoch": 176} {"train_loss": -5.134035110473633, "global_step": 7403, "epoch": 176} {"train_loss": -5.0029096603393555, "global_step": 7404, "epoch": 176} {"train_loss": -4.832614898681641, "global_step": 7405, "epoch": 176} {"train_loss": -4.975821495056152, "global_step": 7406, "epoch": 176} {"train_loss": -4.91303825378418, "global_step": 7407, "epoch": 176} {"train_loss": -4.88209867477417, "global_step": 7408, "epoch": 176} {"train_loss": -4.8614091873168945, "global_step": 7409, "epoch": 176} {"train_loss": -5.083438873291016, "global_step": 7410, "epoch": 176} {"train_loss": -4.916421890258789, "global_step": 7411, "epoch": 176} {"train_loss": -4.785236358642578, "global_step": 7412, "epoch": 176} {"train_loss": -5.012211799621582, "global_step": 7413, "epoch": 176} {"train_loss": -4.865052223205566, "global_step": 7414, "epoch": 176} {"train_loss": -4.908064842224121, "global_step": 7415, "epoch": 176} {"train_loss": -4.879403114318848, "global_step": 7416, "epoch": 176} {"train_loss": -4.9306111335754395, "global_step": 7417, "epoch": 176} {"train_loss": -5.03435754776001, "global_step": 7418, "epoch": 176} {"train_loss": -4.976612567901611, "global_step": 7419, "epoch": 176} {"train_loss": -4.7930192947387695, "global_step": 7420, "epoch": 176} {"train_loss": -4.838327407836914, "global_step": 7421, "epoch": 176} {"train_loss": -5.002374649047852, "global_step": 7422, "epoch": 176} {"train_loss": -4.855386734008789, "global_step": 7423, "epoch": 176} {"train_loss": -4.961194038391113, "global_step": 7424, "epoch": 176} {"train_loss": -4.9339494705200195, "global_step": 7425, "epoch": 176} {"train_loss": -5.089964389801025, "global_step": 7426, "epoch": 176} {"train_loss": -4.9662580490112305, "global_step": 7427, "epoch": 176} {"train_loss": -4.98809289932251, "global_step": 7428, "epoch": 176} {"train_loss": -4.923558235168457, "global_step": 7429, "epoch": 176} {"train_loss": -5.0334272384643555, "global_step": 7430, "epoch": 176} {"train_loss": -4.741390705108643, "global_step": 7431, "epoch": 176} {"train_loss": -4.930840492248535, "global_step": 7432, "epoch": 176} {"train_loss": -4.923210734412784, "global_step": 7433, "epoch": 176, "val_loss": 86084.1875} {"train_loss": -4.74898624420166, "global_step": 7434, "epoch": 177} {"train_loss": -4.955802917480469, "global_step": 7435, "epoch": 177} {"train_loss": -4.525781631469727, "global_step": 7436, "epoch": 177} {"train_loss": -4.954916000366211, "global_step": 7437, "epoch": 177} {"train_loss": -4.897434234619141, "global_step": 7438, "epoch": 177} {"train_loss": -4.68369722366333, "global_step": 7439, "epoch": 177} {"train_loss": -4.909877777099609, "global_step": 7440, "epoch": 177} {"train_loss": -4.833742141723633, "global_step": 7441, "epoch": 177} {"train_loss": -4.879788398742676, "global_step": 7442, "epoch": 177} {"train_loss": -4.877345085144043, "global_step": 7443, "epoch": 177} {"train_loss": -5.00766658782959, "global_step": 7444, "epoch": 177} {"train_loss": -4.950492858886719, "global_step": 7445, "epoch": 177} {"train_loss": -4.923360824584961, "global_step": 7446, "epoch": 177} {"train_loss": -5.046536445617676, "global_step": 7447, "epoch": 177} {"train_loss": -5.017125129699707, "global_step": 7448, "epoch": 177} {"train_loss": -4.920932292938232, "global_step": 7449, "epoch": 177} {"train_loss": -4.896022796630859, "global_step": 7450, "epoch": 177} {"train_loss": -4.932784080505371, "global_step": 7451, "epoch": 177} {"train_loss": -4.902163505554199, "global_step": 7452, "epoch": 177} {"train_loss": -4.855337619781494, "global_step": 7453, "epoch": 177} {"train_loss": -4.733290195465088, "global_step": 7454, "epoch": 177} {"train_loss": -4.880078315734863, "global_step": 7455, "epoch": 177} {"train_loss": -5.082364082336426, "global_step": 7456, "epoch": 177} {"train_loss": -4.908052444458008, "global_step": 7457, "epoch": 177} {"train_loss": -4.872244834899902, "global_step": 7458, "epoch": 177} {"train_loss": -5.001447677612305, "global_step": 7459, "epoch": 177} {"train_loss": -4.841472625732422, "global_step": 7460, "epoch": 177} {"train_loss": -4.934487342834473, "global_step": 7461, "epoch": 177} {"train_loss": -4.745987892150879, "global_step": 7462, "epoch": 177} {"train_loss": -4.957164764404297, "global_step": 7463, "epoch": 177} {"train_loss": -4.958719730377197, "global_step": 7464, "epoch": 177} {"train_loss": -4.928010940551758, "global_step": 7465, "epoch": 177} {"train_loss": -5.005001068115234, "global_step": 7466, "epoch": 177} {"train_loss": -4.822905540466309, "global_step": 7467, "epoch": 177} {"train_loss": -4.829826354980469, "global_step": 7468, "epoch": 177} {"train_loss": -4.890419960021973, "global_step": 7469, "epoch": 177} {"train_loss": -4.970179557800293, "global_step": 7470, "epoch": 177} {"train_loss": -4.993060111999512, "global_step": 7471, "epoch": 177} {"train_loss": -5.045787811279297, "global_step": 7472, "epoch": 177} {"train_loss": -4.882420063018799, "global_step": 7473, "epoch": 177} {"train_loss": -4.956299781799316, "global_step": 7474, "epoch": 177} {"train_loss": -4.904261577697027, "global_step": 7475, "epoch": 177, "val_loss": 83815.4609375} {"train_loss": -4.911221027374268, "global_step": 7476, "epoch": 178} {"train_loss": -4.932991981506348, "global_step": 7477, "epoch": 178} {"train_loss": -5.041751861572266, "global_step": 7478, "epoch": 178} {"train_loss": -4.784272193908691, "global_step": 7479, "epoch": 178} {"train_loss": -5.022234916687012, "global_step": 7480, "epoch": 178} {"train_loss": -5.1150031089782715, "global_step": 7481, "epoch": 178} {"train_loss": -4.965638637542725, "global_step": 7482, "epoch": 178} {"train_loss": -4.963425636291504, "global_step": 7483, "epoch": 178} {"train_loss": -4.96967887878418, "global_step": 7484, "epoch": 178} {"train_loss": -5.122591972351074, "global_step": 7485, "epoch": 178} {"train_loss": -4.858349800109863, "global_step": 7486, "epoch": 178} {"train_loss": -4.968208312988281, "global_step": 7487, "epoch": 178} {"train_loss": -5.032533645629883, "global_step": 7488, "epoch": 178} {"train_loss": -4.9847798347473145, "global_step": 7489, "epoch": 178} {"train_loss": -4.955844879150391, "global_step": 7490, "epoch": 178} {"train_loss": -5.00847053527832, "global_step": 7491, "epoch": 178} {"train_loss": -5.064985275268555, "global_step": 7492, "epoch": 178} {"train_loss": -5.153604984283447, "global_step": 7493, "epoch": 178} {"train_loss": -4.941770553588867, "global_step": 7494, "epoch": 178} {"train_loss": -5.125094413757324, "global_step": 7495, "epoch": 178} {"train_loss": -5.001943588256836, "global_step": 7496, "epoch": 178} {"train_loss": -4.978226661682129, "global_step": 7497, "epoch": 178} {"train_loss": -4.809800148010254, "global_step": 7498, "epoch": 178} {"train_loss": -4.995804309844971, "global_step": 7499, "epoch": 178} {"train_loss": -4.796606063842773, "global_step": 7500, "epoch": 178} {"train_loss": -4.943564414978027, "global_step": 7501, "epoch": 178} {"train_loss": -4.963565826416016, "global_step": 7502, "epoch": 178} {"train_loss": -4.918878555297852, "global_step": 7503, "epoch": 178} {"train_loss": -5.0354790687561035, "global_step": 7504, "epoch": 178} {"train_loss": -4.871790409088135, "global_step": 7505, "epoch": 178} {"train_loss": -4.978045463562012, "global_step": 7506, "epoch": 178} {"train_loss": -5.05754280090332, "global_step": 7507, "epoch": 178} {"train_loss": -4.7247209548950195, "global_step": 7508, "epoch": 178} {"train_loss": -4.900423526763916, "global_step": 7509, "epoch": 178} {"train_loss": -4.823429107666016, "global_step": 7510, "epoch": 178} {"train_loss": -4.910335063934326, "global_step": 7511, "epoch": 178} {"train_loss": -4.739660263061523, "global_step": 7512, "epoch": 178} {"train_loss": -4.598305702209473, "global_step": 7513, "epoch": 178} {"train_loss": -4.618250846862793, "global_step": 7514, "epoch": 178} {"train_loss": -4.709347724914551, "global_step": 7515, "epoch": 178} {"train_loss": -4.697545528411865, "global_step": 7516, "epoch": 178} {"train_loss": -4.926169429506574, "global_step": 7517, "epoch": 178, "val_loss": 83940.3125} {"train_loss": -4.833166122436523, "global_step": 7518, "epoch": 179} {"train_loss": -4.753591060638428, "global_step": 7519, "epoch": 179} {"train_loss": -4.936710357666016, "global_step": 7520, "epoch": 179} {"train_loss": -4.708953380584717, "global_step": 7521, "epoch": 179} {"train_loss": -4.839248180389404, "global_step": 7522, "epoch": 179} {"train_loss": -4.913041114807129, "global_step": 7523, "epoch": 179} {"train_loss": -4.891573429107666, "global_step": 7524, "epoch": 179} {"train_loss": -4.883503437042236, "global_step": 7525, "epoch": 179} {"train_loss": -5.089202880859375, "global_step": 7526, "epoch": 179} {"train_loss": -5.011990547180176, "global_step": 7527, "epoch": 179} {"train_loss": -4.97395658493042, "global_step": 7528, "epoch": 179} {"train_loss": -4.940762519836426, "global_step": 7529, "epoch": 179} {"train_loss": -4.898530960083008, "global_step": 7530, "epoch": 179} {"train_loss": -5.037566661834717, "global_step": 7531, "epoch": 179} {"train_loss": -5.001471996307373, "global_step": 7532, "epoch": 179} {"train_loss": -4.906670093536377, "global_step": 7533, "epoch": 179} {"train_loss": -5.018124580383301, "global_step": 7534, "epoch": 179} {"train_loss": -4.952466011047363, "global_step": 7535, "epoch": 179} {"train_loss": -5.012136459350586, "global_step": 7536, "epoch": 179} {"train_loss": -4.884279251098633, "global_step": 7537, "epoch": 179} {"train_loss": -4.934543132781982, "global_step": 7538, "epoch": 179} {"train_loss": -5.051532745361328, "global_step": 7539, "epoch": 179} {"train_loss": -4.869561195373535, "global_step": 7540, "epoch": 179} {"train_loss": -4.892065048217773, "global_step": 7541, "epoch": 179} {"train_loss": -4.957529067993164, "global_step": 7542, "epoch": 179} {"train_loss": -5.027924537658691, "global_step": 7543, "epoch": 179} {"train_loss": -4.930377006530762, "global_step": 7544, "epoch": 179} {"train_loss": -4.854263782501221, "global_step": 7545, "epoch": 179} {"train_loss": -4.858919143676758, "global_step": 7546, "epoch": 179} {"train_loss": -4.852836608886719, "global_step": 7547, "epoch": 179} {"train_loss": -4.84019136428833, "global_step": 7548, "epoch": 179} {"train_loss": -4.908657550811768, "global_step": 7549, "epoch": 179} {"train_loss": -4.749497413635254, "global_step": 7550, "epoch": 179} {"train_loss": -4.779924392700195, "global_step": 7551, "epoch": 179} {"train_loss": -4.79927396774292, "global_step": 7552, "epoch": 179} {"train_loss": -4.717408180236816, "global_step": 7553, "epoch": 179} {"train_loss": -5.005615234375, "global_step": 7554, "epoch": 179} {"train_loss": -4.926016330718994, "global_step": 7555, "epoch": 179} {"train_loss": -4.829402923583984, "global_step": 7556, "epoch": 179} {"train_loss": -5.00331974029541, "global_step": 7557, "epoch": 179} {"train_loss": -5.002483367919922, "global_step": 7558, "epoch": 179} {"train_loss": -4.905648208799816, "global_step": 7559, "epoch": 179, "val_loss": 83244.1015625} {"train_loss": -5.020576477050781, "global_step": 7560, "epoch": 180} {"train_loss": -4.883012771606445, "global_step": 7561, "epoch": 180} {"train_loss": -5.009464263916016, "global_step": 7562, "epoch": 180} {"train_loss": -4.978783130645752, "global_step": 7563, "epoch": 180} {"train_loss": -4.8032989501953125, "global_step": 7564, "epoch": 180} {"train_loss": -4.864065170288086, "global_step": 7565, "epoch": 180} {"train_loss": -4.934720993041992, "global_step": 7566, "epoch": 180} {"train_loss": -4.956770896911621, "global_step": 7567, "epoch": 180} {"train_loss": -5.096757888793945, "global_step": 7568, "epoch": 180} {"train_loss": -4.981731414794922, "global_step": 7569, "epoch": 180} {"train_loss": -4.8421244621276855, "global_step": 7570, "epoch": 180} {"train_loss": -4.877020359039307, "global_step": 7571, "epoch": 180} {"train_loss": -4.8765363693237305, "global_step": 7572, "epoch": 180} {"train_loss": -4.977975845336914, "global_step": 7573, "epoch": 180} {"train_loss": -4.779780387878418, "global_step": 7574, "epoch": 180} {"train_loss": -4.992680549621582, "global_step": 7575, "epoch": 180} {"train_loss": -4.892828941345215, "global_step": 7576, "epoch": 180} {"train_loss": -4.945350170135498, "global_step": 7577, "epoch": 180} {"train_loss": -5.155664443969727, "global_step": 7578, "epoch": 180} {"train_loss": -4.897095680236816, "global_step": 7579, "epoch": 180} {"train_loss": -5.00393009185791, "global_step": 7580, "epoch": 180} {"train_loss": -4.9015960693359375, "global_step": 7581, "epoch": 180} {"train_loss": -5.062739372253418, "global_step": 7582, "epoch": 180} {"train_loss": -4.967735290527344, "global_step": 7583, "epoch": 180} {"train_loss": -4.765841960906982, "global_step": 7584, "epoch": 180} {"train_loss": -5.005387306213379, "global_step": 7585, "epoch": 180} {"train_loss": -5.118091106414795, "global_step": 7586, "epoch": 180} {"train_loss": -4.914566993713379, "global_step": 7587, "epoch": 180} {"train_loss": -4.940131664276123, "global_step": 7588, "epoch": 180} {"train_loss": -4.936962604522705, "global_step": 7589, "epoch": 180} {"train_loss": -4.9075493812561035, "global_step": 7590, "epoch": 180} {"train_loss": -5.034453392028809, "global_step": 7591, "epoch": 180} {"train_loss": -5.044968605041504, "global_step": 7592, "epoch": 180} {"train_loss": -4.968184471130371, "global_step": 7593, "epoch": 180} {"train_loss": -4.959622383117676, "global_step": 7594, "epoch": 180} {"train_loss": -5.113024711608887, "global_step": 7595, "epoch": 180} {"train_loss": -5.129881381988525, "global_step": 7596, "epoch": 180} {"train_loss": -4.90655517578125, "global_step": 7597, "epoch": 180} {"train_loss": -5.013984203338623, "global_step": 7598, "epoch": 180} {"train_loss": -4.987295150756836, "global_step": 7599, "epoch": 180} {"train_loss": -5.034601211547852, "global_step": 7600, "epoch": 180} {"train_loss": -4.961347795668102, "global_step": 7601, "epoch": 180, "val_loss": 83185.2421875} {"train_loss": -4.917834758758545, "global_step": 7602, "epoch": 181} {"train_loss": -5.097064018249512, "global_step": 7603, "epoch": 181} {"train_loss": -4.8116559982299805, "global_step": 7604, "epoch": 181} {"train_loss": -4.9723100662231445, "global_step": 7605, "epoch": 181} {"train_loss": -4.722245216369629, "global_step": 7606, "epoch": 181} {"train_loss": -4.944101333618164, "global_step": 7607, "epoch": 181} {"train_loss": -4.893638610839844, "global_step": 7608, "epoch": 181} {"train_loss": -4.880337238311768, "global_step": 7609, "epoch": 181} {"train_loss": -4.933432102203369, "global_step": 7610, "epoch": 181} {"train_loss": -4.911808013916016, "global_step": 7611, "epoch": 181} {"train_loss": -5.071133613586426, "global_step": 7612, "epoch": 181} {"train_loss": -4.960380554199219, "global_step": 7613, "epoch": 181} {"train_loss": -5.0685882568359375, "global_step": 7614, "epoch": 181} {"train_loss": -4.916822910308838, "global_step": 7615, "epoch": 181} {"train_loss": -4.636526107788086, "global_step": 7616, "epoch": 181} {"train_loss": -4.9767255783081055, "global_step": 7617, "epoch": 181} {"train_loss": -4.934379577636719, "global_step": 7618, "epoch": 181} {"train_loss": -4.981057167053223, "global_step": 7619, "epoch": 181} {"train_loss": -4.8506340980529785, "global_step": 7620, "epoch": 181} {"train_loss": -4.96090030670166, "global_step": 7621, "epoch": 181} {"train_loss": -4.7844696044921875, "global_step": 7622, "epoch": 181} {"train_loss": -4.920381546020508, "global_step": 7623, "epoch": 181} {"train_loss": -4.780645370483398, "global_step": 7624, "epoch": 181} {"train_loss": -4.939032077789307, "global_step": 7625, "epoch": 181} {"train_loss": -4.999741554260254, "global_step": 7626, "epoch": 181} {"train_loss": -4.835713863372803, "global_step": 7627, "epoch": 181} {"train_loss": -4.849350929260254, "global_step": 7628, "epoch": 181} {"train_loss": -4.943728923797607, "global_step": 7629, "epoch": 181} {"train_loss": -4.924246788024902, "global_step": 7630, "epoch": 181} {"train_loss": -4.88369083404541, "global_step": 7631, "epoch": 181} {"train_loss": -4.917585372924805, "global_step": 7632, "epoch": 181} {"train_loss": -4.877911567687988, "global_step": 7633, "epoch": 181} {"train_loss": -5.058593273162842, "global_step": 7634, "epoch": 181} {"train_loss": -5.069963455200195, "global_step": 7635, "epoch": 181} {"train_loss": -4.8402533531188965, "global_step": 7636, "epoch": 181} {"train_loss": -4.989499568939209, "global_step": 7637, "epoch": 181} {"train_loss": -4.927630424499512, "global_step": 7638, "epoch": 181} {"train_loss": -5.066788673400879, "global_step": 7639, "epoch": 181} {"train_loss": -4.879300117492676, "global_step": 7640, "epoch": 181} {"train_loss": -4.657744407653809, "global_step": 7641, "epoch": 181} {"train_loss": -4.966741561889648, "global_step": 7642, "epoch": 181} {"train_loss": -4.918730508713495, "global_step": 7643, "epoch": 181, "val_loss": 85832.015625} {"train_loss": -4.672868251800537, "global_step": 7644, "epoch": 182} {"train_loss": -4.914560317993164, "global_step": 7645, "epoch": 182} {"train_loss": -4.909140586853027, "global_step": 7646, "epoch": 182} {"train_loss": -4.76732063293457, "global_step": 7647, "epoch": 182} {"train_loss": -4.992334365844727, "global_step": 7648, "epoch": 182} {"train_loss": -4.85822868347168, "global_step": 7649, "epoch": 182} {"train_loss": -4.946584701538086, "global_step": 7650, "epoch": 182} {"train_loss": -4.709822654724121, "global_step": 7651, "epoch": 182} {"train_loss": -5.0506978034973145, "global_step": 7652, "epoch": 182} {"train_loss": -4.886615753173828, "global_step": 7653, "epoch": 182} {"train_loss": -4.921597003936768, "global_step": 7654, "epoch": 182} {"train_loss": -5.003057479858398, "global_step": 7655, "epoch": 182} {"train_loss": -4.86799430847168, "global_step": 7656, "epoch": 182} {"train_loss": -5.014323711395264, "global_step": 7657, "epoch": 182} {"train_loss": -5.009515762329102, "global_step": 7658, "epoch": 182} {"train_loss": -4.945064544677734, "global_step": 7659, "epoch": 182} {"train_loss": -4.998737335205078, "global_step": 7660, "epoch": 182} {"train_loss": -4.871133327484131, "global_step": 7661, "epoch": 182} {"train_loss": -5.0891313552856445, "global_step": 7662, "epoch": 182} {"train_loss": -5.055589199066162, "global_step": 7663, "epoch": 182} {"train_loss": -5.014369010925293, "global_step": 7664, "epoch": 182} {"train_loss": -5.030747413635254, "global_step": 7665, "epoch": 182} {"train_loss": -5.069265842437744, "global_step": 7666, "epoch": 182} {"train_loss": -4.872595310211182, "global_step": 7667, "epoch": 182} {"train_loss": -4.960927486419678, "global_step": 7668, "epoch": 182} {"train_loss": -4.883208274841309, "global_step": 7669, "epoch": 182} {"train_loss": -5.000894069671631, "global_step": 7670, "epoch": 182} {"train_loss": -4.985670566558838, "global_step": 7671, "epoch": 182} {"train_loss": -5.027383327484131, "global_step": 7672, "epoch": 182} {"train_loss": -4.886345863342285, "global_step": 7673, "epoch": 182} {"train_loss": -5.004537582397461, "global_step": 7674, "epoch": 182} {"train_loss": -5.0395307540893555, "global_step": 7675, "epoch": 182} {"train_loss": -5.006524085998535, "global_step": 7676, "epoch": 182} {"train_loss": -5.0895280838012695, "global_step": 7677, "epoch": 182} {"train_loss": -4.972476959228516, "global_step": 7678, "epoch": 182} {"train_loss": -4.856553554534912, "global_step": 7679, "epoch": 182} {"train_loss": -4.9625701904296875, "global_step": 7680, "epoch": 182} {"train_loss": -4.733031272888184, "global_step": 7681, "epoch": 182} {"train_loss": -4.996622085571289, "global_step": 7682, "epoch": 182} {"train_loss": -5.036884307861328, "global_step": 7683, "epoch": 182} {"train_loss": -4.7319488525390625, "global_step": 7684, "epoch": 182} {"train_loss": -4.9388846556345625, "global_step": 7685, "epoch": 182, "val_loss": 84033.1875} {"train_loss": -5.181765079498291, "global_step": 7686, "epoch": 183} {"train_loss": -4.705352306365967, "global_step": 7687, "epoch": 183} {"train_loss": -4.889679908752441, "global_step": 7688, "epoch": 183} {"train_loss": -5.037297248840332, "global_step": 7689, "epoch": 183} {"train_loss": -5.087535381317139, "global_step": 7690, "epoch": 183} {"train_loss": -4.959440231323242, "global_step": 7691, "epoch": 183} {"train_loss": -4.940089225769043, "global_step": 7692, "epoch": 183} {"train_loss": -4.98029899597168, "global_step": 7693, "epoch": 183} {"train_loss": -4.967530250549316, "global_step": 7694, "epoch": 183} {"train_loss": -4.924013614654541, "global_step": 7695, "epoch": 183} {"train_loss": -5.015940189361572, "global_step": 7696, "epoch": 183} {"train_loss": -4.992859363555908, "global_step": 7697, "epoch": 183} {"train_loss": -5.008955955505371, "global_step": 7698, "epoch": 183} {"train_loss": -4.887588024139404, "global_step": 7699, "epoch": 183} {"train_loss": -4.926234245300293, "global_step": 7700, "epoch": 183} {"train_loss": -4.917231559753418, "global_step": 7701, "epoch": 183} {"train_loss": -5.019920825958252, "global_step": 7702, "epoch": 183} {"train_loss": -4.9589385986328125, "global_step": 7703, "epoch": 183} {"train_loss": -4.8462066650390625, "global_step": 7704, "epoch": 183} {"train_loss": -5.011797904968262, "global_step": 7705, "epoch": 183} {"train_loss": -4.806295394897461, "global_step": 7706, "epoch": 183} {"train_loss": -4.896204948425293, "global_step": 7707, "epoch": 183} {"train_loss": -4.956969261169434, "global_step": 7708, "epoch": 183} {"train_loss": -4.79769229888916, "global_step": 7709, "epoch": 183} {"train_loss": -4.683879375457764, "global_step": 7710, "epoch": 183} {"train_loss": -4.696500301361084, "global_step": 7711, "epoch": 183} {"train_loss": -4.399585723876953, "global_step": 7712, "epoch": 183} {"train_loss": -4.743778228759766, "global_step": 7713, "epoch": 183} {"train_loss": -4.655467987060547, "global_step": 7714, "epoch": 183} {"train_loss": -4.827766418457031, "global_step": 7715, "epoch": 183} {"train_loss": -4.707513332366943, "global_step": 7716, "epoch": 183} {"train_loss": -4.537931442260742, "global_step": 7717, "epoch": 183} {"train_loss": -4.802859306335449, "global_step": 7718, "epoch": 183} {"train_loss": -4.913352012634277, "global_step": 7719, "epoch": 183} {"train_loss": -4.849428176879883, "global_step": 7720, "epoch": 183} {"train_loss": -4.846816539764404, "global_step": 7721, "epoch": 183} {"train_loss": -4.866495132446289, "global_step": 7722, "epoch": 183} {"train_loss": -4.906406402587891, "global_step": 7723, "epoch": 183} {"train_loss": -4.753003120422363, "global_step": 7724, "epoch": 183} {"train_loss": -4.757831573486328, "global_step": 7725, "epoch": 183} {"train_loss": -4.838550567626953, "global_step": 7726, "epoch": 183} {"train_loss": -4.86590515999567, "global_step": 7727, "epoch": 183, "val_loss": 83168.1953125} {"train_loss": -4.9597063064575195, "global_step": 7728, "epoch": 184} {"train_loss": -4.848297119140625, "global_step": 7729, "epoch": 184} {"train_loss": -5.023869514465332, "global_step": 7730, "epoch": 184} {"train_loss": -4.8454155921936035, "global_step": 7731, "epoch": 184} {"train_loss": -5.053129196166992, "global_step": 7732, "epoch": 184} {"train_loss": -4.877557754516602, "global_step": 7733, "epoch": 184} {"train_loss": -4.91372537612915, "global_step": 7734, "epoch": 184} {"train_loss": -5.036680221557617, "global_step": 7735, "epoch": 184} {"train_loss": -4.876949787139893, "global_step": 7736, "epoch": 184} {"train_loss": -4.928614616394043, "global_step": 7737, "epoch": 184} {"train_loss": -5.088720798492432, "global_step": 7738, "epoch": 184} {"train_loss": -4.936036109924316, "global_step": 7739, "epoch": 184} {"train_loss": -4.950367450714111, "global_step": 7740, "epoch": 184} {"train_loss": -5.037558555603027, "global_step": 7741, "epoch": 184} {"train_loss": -4.972833633422852, "global_step": 7742, "epoch": 184} {"train_loss": -5.068717002868652, "global_step": 7743, "epoch": 184} {"train_loss": -5.041614532470703, "global_step": 7744, "epoch": 184} {"train_loss": -4.9581074714660645, "global_step": 7745, "epoch": 184} {"train_loss": -5.125790119171143, "global_step": 7746, "epoch": 184} {"train_loss": -5.061694622039795, "global_step": 7747, "epoch": 184} {"train_loss": -5.034328460693359, "global_step": 7748, "epoch": 184} {"train_loss": -4.9742231369018555, "global_step": 7749, "epoch": 184} {"train_loss": -5.042798042297363, "global_step": 7750, "epoch": 184} {"train_loss": -4.919886112213135, "global_step": 7751, "epoch": 184} {"train_loss": -4.926936149597168, "global_step": 7752, "epoch": 184} {"train_loss": -5.035061359405518, "global_step": 7753, "epoch": 184} {"train_loss": -4.984039306640625, "global_step": 7754, "epoch": 184} {"train_loss": -4.923117637634277, "global_step": 7755, "epoch": 184} {"train_loss": -5.079379558563232, "global_step": 7756, "epoch": 184} {"train_loss": -4.955360412597656, "global_step": 7757, "epoch": 184} {"train_loss": -4.938499450683594, "global_step": 7758, "epoch": 184} {"train_loss": -5.021707534790039, "global_step": 7759, "epoch": 184} {"train_loss": -5.059892177581787, "global_step": 7760, "epoch": 184} {"train_loss": -5.02611780166626, "global_step": 7761, "epoch": 184} {"train_loss": -4.849082946777344, "global_step": 7762, "epoch": 184} {"train_loss": -5.056133270263672, "global_step": 7763, "epoch": 184} {"train_loss": -5.035264015197754, "global_step": 7764, "epoch": 184} {"train_loss": -4.910789966583252, "global_step": 7765, "epoch": 184} {"train_loss": -5.150893211364746, "global_step": 7766, "epoch": 184} {"train_loss": -4.99996280670166, "global_step": 7767, "epoch": 184} {"train_loss": -4.995840072631836, "global_step": 7768, "epoch": 184} {"train_loss": -4.984872840699696, "global_step": 7769, "epoch": 184, "val_loss": 82084.421875} {"train_loss": -5.1532206535339355, "global_step": 7770, "epoch": 185} {"train_loss": -5.015942573547363, "global_step": 7771, "epoch": 185} {"train_loss": -4.923628807067871, "global_step": 7772, "epoch": 185} {"train_loss": -5.161552906036377, "global_step": 7773, "epoch": 185} {"train_loss": -5.086063385009766, "global_step": 7774, "epoch": 185} {"train_loss": -4.872235298156738, "global_step": 7775, "epoch": 185} {"train_loss": -4.846208572387695, "global_step": 7776, "epoch": 185} {"train_loss": -4.965890884399414, "global_step": 7777, "epoch": 185} {"train_loss": -4.844264030456543, "global_step": 7778, "epoch": 185} {"train_loss": -4.625105857849121, "global_step": 7779, "epoch": 185} {"train_loss": -4.869107246398926, "global_step": 7780, "epoch": 185} {"train_loss": -4.695419788360596, "global_step": 7781, "epoch": 185} {"train_loss": -4.570462703704834, "global_step": 7782, "epoch": 185} {"train_loss": -4.773834705352783, "global_step": 7783, "epoch": 185} {"train_loss": -4.750565052032471, "global_step": 7784, "epoch": 185} {"train_loss": -4.764047622680664, "global_step": 7785, "epoch": 185} {"train_loss": -4.847051620483398, "global_step": 7786, "epoch": 185} {"train_loss": -4.899178504943848, "global_step": 7787, "epoch": 185} {"train_loss": -4.721755027770996, "global_step": 7788, "epoch": 185} {"train_loss": -4.861747741699219, "global_step": 7789, "epoch": 185} {"train_loss": -4.973263740539551, "global_step": 7790, "epoch": 185} {"train_loss": -4.799861431121826, "global_step": 7791, "epoch": 185} {"train_loss": -4.902670860290527, "global_step": 7792, "epoch": 185} {"train_loss": -4.736660957336426, "global_step": 7793, "epoch": 185} {"train_loss": -4.998512268066406, "global_step": 7794, "epoch": 185} {"train_loss": -4.952516555786133, "global_step": 7795, "epoch": 185} {"train_loss": -4.99521541595459, "global_step": 7796, "epoch": 185} {"train_loss": -4.822338104248047, "global_step": 7797, "epoch": 185} {"train_loss": -4.842458248138428, "global_step": 7798, "epoch": 185} {"train_loss": -4.943437576293945, "global_step": 7799, "epoch": 185} {"train_loss": -5.079866409301758, "global_step": 7800, "epoch": 185} {"train_loss": -4.880127906799316, "global_step": 7801, "epoch": 185} {"train_loss": -4.952582359313965, "global_step": 7802, "epoch": 185} {"train_loss": -4.996794700622559, "global_step": 7803, "epoch": 185} {"train_loss": -5.034951210021973, "global_step": 7804, "epoch": 185} {"train_loss": -5.015867233276367, "global_step": 7805, "epoch": 185} {"train_loss": -4.959228992462158, "global_step": 7806, "epoch": 185} {"train_loss": -4.900579929351807, "global_step": 7807, "epoch": 185} {"train_loss": -5.005570888519287, "global_step": 7808, "epoch": 185} {"train_loss": -4.962324142456055, "global_step": 7809, "epoch": 185} {"train_loss": -4.837344169616699, "global_step": 7810, "epoch": 185} {"train_loss": -4.901956717173259, "global_step": 7811, "epoch": 185, "val_loss": 82841.28125} {"train_loss": -4.867976665496826, "global_step": 7812, "epoch": 186} {"train_loss": -4.921448707580566, "global_step": 7813, "epoch": 186} {"train_loss": -4.9550557136535645, "global_step": 7814, "epoch": 186} {"train_loss": -4.909537315368652, "global_step": 7815, "epoch": 186} {"train_loss": -5.005166053771973, "global_step": 7816, "epoch": 186} {"train_loss": -5.10162353515625, "global_step": 7817, "epoch": 186} {"train_loss": -4.858310699462891, "global_step": 7818, "epoch": 186} {"train_loss": -5.012145042419434, "global_step": 7819, "epoch": 186} {"train_loss": -4.989697456359863, "global_step": 7820, "epoch": 186} {"train_loss": -4.964240550994873, "global_step": 7821, "epoch": 186} {"train_loss": -5.043702125549316, "global_step": 7822, "epoch": 186} {"train_loss": -4.953582763671875, "global_step": 7823, "epoch": 186} {"train_loss": -4.95992374420166, "global_step": 7824, "epoch": 186} {"train_loss": -5.021796226501465, "global_step": 7825, "epoch": 186} {"train_loss": -5.069642066955566, "global_step": 7826, "epoch": 186} {"train_loss": -5.042645454406738, "global_step": 7827, "epoch": 186} {"train_loss": -5.048773288726807, "global_step": 7828, "epoch": 186} {"train_loss": -4.915741920471191, "global_step": 7829, "epoch": 186} {"train_loss": -4.970504283905029, "global_step": 7830, "epoch": 186} {"train_loss": -5.001032829284668, "global_step": 7831, "epoch": 186} {"train_loss": -4.968889236450195, "global_step": 7832, "epoch": 186} {"train_loss": -4.9938201904296875, "global_step": 7833, "epoch": 186} {"train_loss": -5.003841400146484, "global_step": 7834, "epoch": 186} {"train_loss": -5.107553958892822, "global_step": 7835, "epoch": 186} {"train_loss": -4.916586875915527, "global_step": 7836, "epoch": 186} {"train_loss": -5.083096504211426, "global_step": 7837, "epoch": 186} {"train_loss": -4.987165451049805, "global_step": 7838, "epoch": 186} {"train_loss": -5.034144401550293, "global_step": 7839, "epoch": 186} {"train_loss": -4.983868598937988, "global_step": 7840, "epoch": 186} {"train_loss": -5.008947849273682, "global_step": 7841, "epoch": 186} {"train_loss": -4.982751846313477, "global_step": 7842, "epoch": 186} {"train_loss": -5.041367530822754, "global_step": 7843, "epoch": 186} {"train_loss": -4.950877666473389, "global_step": 7844, "epoch": 186} {"train_loss": -4.888962745666504, "global_step": 7845, "epoch": 186} {"train_loss": -4.821816444396973, "global_step": 7846, "epoch": 186} {"train_loss": -4.932448387145996, "global_step": 7847, "epoch": 186} {"train_loss": -4.94265079498291, "global_step": 7848, "epoch": 186} {"train_loss": -4.812097072601318, "global_step": 7849, "epoch": 186} {"train_loss": -4.820103645324707, "global_step": 7850, "epoch": 186} {"train_loss": -5.118772029876709, "global_step": 7851, "epoch": 186} {"train_loss": -4.977928638458252, "global_step": 7852, "epoch": 186} {"train_loss": -4.9745622135344005, "global_step": 7853, "epoch": 186, "val_loss": 81950.265625} {"train_loss": -5.0268449783325195, "global_step": 7854, "epoch": 187} {"train_loss": -5.111703872680664, "global_step": 7855, "epoch": 187} {"train_loss": -5.1350250244140625, "global_step": 7856, "epoch": 187} {"train_loss": -5.00151252746582, "global_step": 7857, "epoch": 187} {"train_loss": -5.02664852142334, "global_step": 7858, "epoch": 187} {"train_loss": -5.036750793457031, "global_step": 7859, "epoch": 187} {"train_loss": -4.867158889770508, "global_step": 7860, "epoch": 187} {"train_loss": -5.009348392486572, "global_step": 7861, "epoch": 187} {"train_loss": -4.801229476928711, "global_step": 7862, "epoch": 187} {"train_loss": -4.918691635131836, "global_step": 7863, "epoch": 187} {"train_loss": -5.005578994750977, "global_step": 7864, "epoch": 187} {"train_loss": -4.79020357131958, "global_step": 7865, "epoch": 187} {"train_loss": -4.889679431915283, "global_step": 7866, "epoch": 187} {"train_loss": -5.103234767913818, "global_step": 7867, "epoch": 187} {"train_loss": -4.8071699142456055, "global_step": 7868, "epoch": 187} {"train_loss": -4.731834411621094, "global_step": 7869, "epoch": 187} {"train_loss": -4.8839616775512695, "global_step": 7870, "epoch": 187} {"train_loss": -4.749429702758789, "global_step": 7871, "epoch": 187} {"train_loss": -4.944340705871582, "global_step": 7872, "epoch": 187} {"train_loss": -5.02114200592041, "global_step": 7873, "epoch": 187} {"train_loss": -4.6105780601501465, "global_step": 7874, "epoch": 187} {"train_loss": -4.754884719848633, "global_step": 7875, "epoch": 187} {"train_loss": -4.920759201049805, "global_step": 7876, "epoch": 187} {"train_loss": -4.788660049438477, "global_step": 7877, "epoch": 187} {"train_loss": -5.003940582275391, "global_step": 7878, "epoch": 187} {"train_loss": -4.84638786315918, "global_step": 7879, "epoch": 187} {"train_loss": -4.888330459594727, "global_step": 7880, "epoch": 187} {"train_loss": -4.907567501068115, "global_step": 7881, "epoch": 187} {"train_loss": -4.939580917358398, "global_step": 7882, "epoch": 187} {"train_loss": -5.060041904449463, "global_step": 7883, "epoch": 187} {"train_loss": -4.922933578491211, "global_step": 7884, "epoch": 187} {"train_loss": -5.072234153747559, "global_step": 7885, "epoch": 187} {"train_loss": -5.0404205322265625, "global_step": 7886, "epoch": 187} {"train_loss": -4.869104385375977, "global_step": 7887, "epoch": 187} {"train_loss": -4.977428913116455, "global_step": 7888, "epoch": 187} {"train_loss": -4.828951835632324, "global_step": 7889, "epoch": 187} {"train_loss": -4.916817665100098, "global_step": 7890, "epoch": 187} {"train_loss": -4.919620513916016, "global_step": 7891, "epoch": 187} {"train_loss": -4.958325386047363, "global_step": 7892, "epoch": 187} {"train_loss": -4.984307765960693, "global_step": 7893, "epoch": 187} {"train_loss": -5.097383975982666, "global_step": 7894, "epoch": 187} {"train_loss": -4.934630757286435, "global_step": 7895, "epoch": 187, "val_loss": 83028.2890625} {"train_loss": -4.975305080413818, "global_step": 7896, "epoch": 188} {"train_loss": -5.01194953918457, "global_step": 7897, "epoch": 188} {"train_loss": -4.981189250946045, "global_step": 7898, "epoch": 188} {"train_loss": -4.920900821685791, "global_step": 7899, "epoch": 188} {"train_loss": -5.166752338409424, "global_step": 7900, "epoch": 188} {"train_loss": -4.934102535247803, "global_step": 7901, "epoch": 188} {"train_loss": -4.957634925842285, "global_step": 7902, "epoch": 188} {"train_loss": -4.898813247680664, "global_step": 7903, "epoch": 188} {"train_loss": -4.918581962585449, "global_step": 7904, "epoch": 188} {"train_loss": -4.984796524047852, "global_step": 7905, "epoch": 188} {"train_loss": -5.0665507316589355, "global_step": 7906, "epoch": 188} {"train_loss": -4.920379638671875, "global_step": 7907, "epoch": 188} {"train_loss": -4.7741923332214355, "global_step": 7908, "epoch": 188} {"train_loss": -5.006124496459961, "global_step": 7909, "epoch": 188} {"train_loss": -5.006566524505615, "global_step": 7910, "epoch": 188} {"train_loss": -4.898497581481934, "global_step": 7911, "epoch": 188} {"train_loss": -5.0400238037109375, "global_step": 7912, "epoch": 188} {"train_loss": -4.915865898132324, "global_step": 7913, "epoch": 188} {"train_loss": -4.901272296905518, "global_step": 7914, "epoch": 188} {"train_loss": -4.955268859863281, "global_step": 7915, "epoch": 188} {"train_loss": -4.949557304382324, "global_step": 7916, "epoch": 188} {"train_loss": -4.92022180557251, "global_step": 7917, "epoch": 188} {"train_loss": -4.916471481323242, "global_step": 7918, "epoch": 188} {"train_loss": -4.958937644958496, "global_step": 7919, "epoch": 188} {"train_loss": -5.019158840179443, "global_step": 7920, "epoch": 188} {"train_loss": -4.852367877960205, "global_step": 7921, "epoch": 188} {"train_loss": -4.689370632171631, "global_step": 7922, "epoch": 188} {"train_loss": -4.980876922607422, "global_step": 7923, "epoch": 188} {"train_loss": -4.877039909362793, "global_step": 7924, "epoch": 188} {"train_loss": -4.962671756744385, "global_step": 7925, "epoch": 188} {"train_loss": -5.016719341278076, "global_step": 7926, "epoch": 188} {"train_loss": -4.830564498901367, "global_step": 7927, "epoch": 188} {"train_loss": -4.7998857498168945, "global_step": 7928, "epoch": 188} {"train_loss": -4.916611671447754, "global_step": 7929, "epoch": 188} {"train_loss": -4.968194007873535, "global_step": 7930, "epoch": 188} {"train_loss": -4.915231704711914, "global_step": 7931, "epoch": 188} {"train_loss": -5.033736228942871, "global_step": 7932, "epoch": 188} {"train_loss": -4.799996852874756, "global_step": 7933, "epoch": 188} {"train_loss": -5.0006561279296875, "global_step": 7934, "epoch": 188} {"train_loss": -4.922205448150635, "global_step": 7935, "epoch": 188} {"train_loss": -4.878548622131348, "global_step": 7936, "epoch": 188} {"train_loss": -4.936542703991845, "global_step": 7937, "epoch": 188, "val_loss": 83902.765625} {"train_loss": -4.865758895874023, "global_step": 7938, "epoch": 189} {"train_loss": -4.931341171264648, "global_step": 7939, "epoch": 189} {"train_loss": -4.894650459289551, "global_step": 7940, "epoch": 189} {"train_loss": -4.869637489318848, "global_step": 7941, "epoch": 189} {"train_loss": -5.000311851501465, "global_step": 7942, "epoch": 189} {"train_loss": -4.823230743408203, "global_step": 7943, "epoch": 189} {"train_loss": -4.933957576751709, "global_step": 7944, "epoch": 189} {"train_loss": -5.032373428344727, "global_step": 7945, "epoch": 189} {"train_loss": -5.017018795013428, "global_step": 7946, "epoch": 189} {"train_loss": -4.910347938537598, "global_step": 7947, "epoch": 189} {"train_loss": -5.010170936584473, "global_step": 7948, "epoch": 189} {"train_loss": -4.968008041381836, "global_step": 7949, "epoch": 189} {"train_loss": -4.927881240844727, "global_step": 7950, "epoch": 189} {"train_loss": -4.86799430847168, "global_step": 7951, "epoch": 189} {"train_loss": -4.970354080200195, "global_step": 7952, "epoch": 189} {"train_loss": -4.8285722732543945, "global_step": 7953, "epoch": 189} {"train_loss": -5.016321182250977, "global_step": 7954, "epoch": 189} {"train_loss": -5.028022289276123, "global_step": 7955, "epoch": 189} {"train_loss": -4.913205146789551, "global_step": 7956, "epoch": 189} {"train_loss": -5.037598609924316, "global_step": 7957, "epoch": 189} {"train_loss": -4.96212100982666, "global_step": 7958, "epoch": 189} {"train_loss": -4.936456680297852, "global_step": 7959, "epoch": 189} {"train_loss": -5.1834797859191895, "global_step": 7960, "epoch": 189} {"train_loss": -4.98344612121582, "global_step": 7961, "epoch": 189} {"train_loss": -4.923403739929199, "global_step": 7962, "epoch": 189} {"train_loss": -4.93547248840332, "global_step": 7963, "epoch": 189} {"train_loss": -4.918154716491699, "global_step": 7964, "epoch": 189} {"train_loss": -4.8680195808410645, "global_step": 7965, "epoch": 189} {"train_loss": -4.9537858963012695, "global_step": 7966, "epoch": 189} {"train_loss": -5.032385349273682, "global_step": 7967, "epoch": 189} {"train_loss": -4.946892738342285, "global_step": 7968, "epoch": 189} {"train_loss": -4.946815013885498, "global_step": 7969, "epoch": 189} {"train_loss": -4.998821258544922, "global_step": 7970, "epoch": 189} {"train_loss": -5.04071044921875, "global_step": 7971, "epoch": 189} {"train_loss": -5.121596336364746, "global_step": 7972, "epoch": 189} {"train_loss": -5.0062479972839355, "global_step": 7973, "epoch": 189} {"train_loss": -4.954058647155762, "global_step": 7974, "epoch": 189} {"train_loss": -4.911628723144531, "global_step": 7975, "epoch": 189} {"train_loss": -5.013917446136475, "global_step": 7976, "epoch": 189} {"train_loss": -4.962894439697266, "global_step": 7977, "epoch": 189} {"train_loss": -4.781830310821533, "global_step": 7978, "epoch": 189} {"train_loss": -4.957124971208119, "global_step": 7979, "epoch": 189, "val_loss": 81784.9453125} {"train_loss": -4.923698425292969, "global_step": 7980, "epoch": 190} {"train_loss": -5.0050554275512695, "global_step": 7981, "epoch": 190} {"train_loss": -4.782517433166504, "global_step": 7982, "epoch": 190} {"train_loss": -4.814432621002197, "global_step": 7983, "epoch": 190} {"train_loss": -5.123368740081787, "global_step": 7984, "epoch": 190} {"train_loss": -4.96772575378418, "global_step": 7985, "epoch": 190} {"train_loss": -4.870434761047363, "global_step": 7986, "epoch": 190} {"train_loss": -4.912725448608398, "global_step": 7987, "epoch": 190} {"train_loss": -4.8398518562316895, "global_step": 7988, "epoch": 190} {"train_loss": -4.623960971832275, "global_step": 7989, "epoch": 190} {"train_loss": -4.879916191101074, "global_step": 7990, "epoch": 190} {"train_loss": -5.131414890289307, "global_step": 7991, "epoch": 190} {"train_loss": -4.877581596374512, "global_step": 7992, "epoch": 190} {"train_loss": -4.991737365722656, "global_step": 7993, "epoch": 190} {"train_loss": -4.985419750213623, "global_step": 7994, "epoch": 190} {"train_loss": -4.912657737731934, "global_step": 7995, "epoch": 190} {"train_loss": -5.010990142822266, "global_step": 7996, "epoch": 190} {"train_loss": -4.897684574127197, "global_step": 7997, "epoch": 190} {"train_loss": -4.970236301422119, "global_step": 7998, "epoch": 190} {"train_loss": -4.843728065490723, "global_step": 7999, "epoch": 190} {"train_loss": -4.925780296325684, "global_step": 8000, "epoch": 190} {"train_loss": -5.040663719177246, "global_step": 8001, "epoch": 190} {"train_loss": -4.996097564697266, "global_step": 8002, "epoch": 190} {"train_loss": -4.989952087402344, "global_step": 8003, "epoch": 190} {"train_loss": -4.892232418060303, "global_step": 8004, "epoch": 190} {"train_loss": -4.937327861785889, "global_step": 8005, "epoch": 190} {"train_loss": -5.038751125335693, "global_step": 8006, "epoch": 190} {"train_loss": -4.856461524963379, "global_step": 8007, "epoch": 190} {"train_loss": -4.971926212310791, "global_step": 8008, "epoch": 190} {"train_loss": -5.042856216430664, "global_step": 8009, "epoch": 190} {"train_loss": -4.989664077758789, "global_step": 8010, "epoch": 190} {"train_loss": -4.9464874267578125, "global_step": 8011, "epoch": 190} {"train_loss": -5.038162708282471, "global_step": 8012, "epoch": 190} {"train_loss": -4.873680114746094, "global_step": 8013, "epoch": 190} {"train_loss": -5.076529502868652, "global_step": 8014, "epoch": 190} {"train_loss": -5.0432538986206055, "global_step": 8015, "epoch": 190} {"train_loss": -4.869516849517822, "global_step": 8016, "epoch": 190} {"train_loss": -5.031131744384766, "global_step": 8017, "epoch": 190} {"train_loss": -4.987429618835449, "global_step": 8018, "epoch": 190} {"train_loss": -4.646585464477539, "global_step": 8019, "epoch": 190} {"train_loss": -4.865241527557373, "global_step": 8020, "epoch": 190} {"train_loss": -4.93634185336885, "global_step": 8021, "epoch": 190, "val_loss": 82448.2109375} {"train_loss": -4.987953186035156, "global_step": 8022, "epoch": 191} {"train_loss": -4.913069725036621, "global_step": 8023, "epoch": 191} {"train_loss": -4.952442169189453, "global_step": 8024, "epoch": 191} {"train_loss": -4.8448028564453125, "global_step": 8025, "epoch": 191} {"train_loss": -5.028338432312012, "global_step": 8026, "epoch": 191} {"train_loss": -4.884548187255859, "global_step": 8027, "epoch": 191} {"train_loss": -5.007516860961914, "global_step": 8028, "epoch": 191} {"train_loss": -5.063288688659668, "global_step": 8029, "epoch": 191} {"train_loss": -5.098817825317383, "global_step": 8030, "epoch": 191} {"train_loss": -4.96034574508667, "global_step": 8031, "epoch": 191} {"train_loss": -4.814235687255859, "global_step": 8032, "epoch": 191} {"train_loss": -4.994198322296143, "global_step": 8033, "epoch": 191} {"train_loss": -4.976080417633057, "global_step": 8034, "epoch": 191} {"train_loss": -4.9659647941589355, "global_step": 8035, "epoch": 191} {"train_loss": -5.014350891113281, "global_step": 8036, "epoch": 191} {"train_loss": -4.921497344970703, "global_step": 8037, "epoch": 191} {"train_loss": -4.981507301330566, "global_step": 8038, "epoch": 191} {"train_loss": -5.014183521270752, "global_step": 8039, "epoch": 191} {"train_loss": -5.003602981567383, "global_step": 8040, "epoch": 191} {"train_loss": -4.961230278015137, "global_step": 8041, "epoch": 191} {"train_loss": -5.036721229553223, "global_step": 8042, "epoch": 191} {"train_loss": -5.046080112457275, "global_step": 8043, "epoch": 191} {"train_loss": -4.9681501388549805, "global_step": 8044, "epoch": 191} {"train_loss": -5.071290969848633, "global_step": 8045, "epoch": 191} {"train_loss": -4.9631500244140625, "global_step": 8046, "epoch": 191} {"train_loss": -4.856447219848633, "global_step": 8047, "epoch": 191} {"train_loss": -5.007635116577148, "global_step": 8048, "epoch": 191} {"train_loss": -4.857679843902588, "global_step": 8049, "epoch": 191} {"train_loss": -5.1361613273620605, "global_step": 8050, "epoch": 191} {"train_loss": -5.0831298828125, "global_step": 8051, "epoch": 191} {"train_loss": -5.128549575805664, "global_step": 8052, "epoch": 191} {"train_loss": -5.108156204223633, "global_step": 8053, "epoch": 191} {"train_loss": -5.124677658081055, "global_step": 8054, "epoch": 191} {"train_loss": -4.9546732902526855, "global_step": 8055, "epoch": 191} {"train_loss": -4.972504615783691, "global_step": 8056, "epoch": 191} {"train_loss": -5.20042610168457, "global_step": 8057, "epoch": 191} {"train_loss": -4.882460594177246, "global_step": 8058, "epoch": 191} {"train_loss": -4.850415229797363, "global_step": 8059, "epoch": 191} {"train_loss": -4.828880310058594, "global_step": 8060, "epoch": 191} {"train_loss": -4.814061164855957, "global_step": 8061, "epoch": 191} {"train_loss": -4.935758590698242, "global_step": 8062, "epoch": 191} {"train_loss": -4.978985831851051, "global_step": 8063, "epoch": 191, "val_loss": 81996.640625} {"train_loss": -4.920383453369141, "global_step": 8064, "epoch": 192} {"train_loss": -4.921816349029541, "global_step": 8065, "epoch": 192} {"train_loss": -4.673715114593506, "global_step": 8066, "epoch": 192} {"train_loss": -4.802129745483398, "global_step": 8067, "epoch": 192} {"train_loss": -4.805141448974609, "global_step": 8068, "epoch": 192} {"train_loss": -4.913362503051758, "global_step": 8069, "epoch": 192} {"train_loss": -4.8518524169921875, "global_step": 8070, "epoch": 192} {"train_loss": -4.987431526184082, "global_step": 8071, "epoch": 192} {"train_loss": -4.959516525268555, "global_step": 8072, "epoch": 192} {"train_loss": -4.737560749053955, "global_step": 8073, "epoch": 192} {"train_loss": -4.810756683349609, "global_step": 8074, "epoch": 192} {"train_loss": -4.749311447143555, "global_step": 8075, "epoch": 192} {"train_loss": -5.0755228996276855, "global_step": 8076, "epoch": 192} {"train_loss": -4.9885759353637695, "global_step": 8077, "epoch": 192} {"train_loss": -4.883260250091553, "global_step": 8078, "epoch": 192} {"train_loss": -5.090939521789551, "global_step": 8079, "epoch": 192} {"train_loss": -4.818246841430664, "global_step": 8080, "epoch": 192} {"train_loss": -4.9319233894348145, "global_step": 8081, "epoch": 192} {"train_loss": -5.093047618865967, "global_step": 8082, "epoch": 192} {"train_loss": -4.849862098693848, "global_step": 8083, "epoch": 192} {"train_loss": -5.021980285644531, "global_step": 8084, "epoch": 192} {"train_loss": -4.933679580688477, "global_step": 8085, "epoch": 192} {"train_loss": -5.097224235534668, "global_step": 8086, "epoch": 192} {"train_loss": -5.014713287353516, "global_step": 8087, "epoch": 192} {"train_loss": -5.046987533569336, "global_step": 8088, "epoch": 192} {"train_loss": -4.805110454559326, "global_step": 8089, "epoch": 192} {"train_loss": -4.928766250610352, "global_step": 8090, "epoch": 192} {"train_loss": -5.011277675628662, "global_step": 8091, "epoch": 192} {"train_loss": -4.9997406005859375, "global_step": 8092, "epoch": 192} {"train_loss": -4.918176651000977, "global_step": 8093, "epoch": 192} {"train_loss": -5.00333309173584, "global_step": 8094, "epoch": 192} {"train_loss": -4.934243202209473, "global_step": 8095, "epoch": 192} {"train_loss": -4.947302341461182, "global_step": 8096, "epoch": 192} {"train_loss": -4.919051647186279, "global_step": 8097, "epoch": 192} {"train_loss": -5.052701473236084, "global_step": 8098, "epoch": 192} {"train_loss": -5.009893894195557, "global_step": 8099, "epoch": 192} {"train_loss": -4.9819183349609375, "global_step": 8100, "epoch": 192} {"train_loss": -5.025320053100586, "global_step": 8101, "epoch": 192} {"train_loss": -4.7991790771484375, "global_step": 8102, "epoch": 192} {"train_loss": -4.851777076721191, "global_step": 8103, "epoch": 192} {"train_loss": -5.018195629119873, "global_step": 8104, "epoch": 192} {"train_loss": -4.928081750869751, "global_step": 8105, "epoch": 192, "val_loss": 82276.6953125} {"train_loss": -4.89156436920166, "global_step": 8106, "epoch": 193} {"train_loss": -5.116727828979492, "global_step": 8107, "epoch": 193} {"train_loss": -4.8441972732543945, "global_step": 8108, "epoch": 193} {"train_loss": -5.047858238220215, "global_step": 8109, "epoch": 193} {"train_loss": -4.91923189163208, "global_step": 8110, "epoch": 193} {"train_loss": -4.972393035888672, "global_step": 8111, "epoch": 193} {"train_loss": -5.057211875915527, "global_step": 8112, "epoch": 193} {"train_loss": -4.945291519165039, "global_step": 8113, "epoch": 193} {"train_loss": -4.96506404876709, "global_step": 8114, "epoch": 193} {"train_loss": -4.876657962799072, "global_step": 8115, "epoch": 193} {"train_loss": -5.166355609893799, "global_step": 8116, "epoch": 193} {"train_loss": -4.994404315948486, "global_step": 8117, "epoch": 193} {"train_loss": -4.902098655700684, "global_step": 8118, "epoch": 193} {"train_loss": -5.044908046722412, "global_step": 8119, "epoch": 193} {"train_loss": -5.014736175537109, "global_step": 8120, "epoch": 193} {"train_loss": -4.878446102142334, "global_step": 8121, "epoch": 193} {"train_loss": -4.943629264831543, "global_step": 8122, "epoch": 193} {"train_loss": -4.894722938537598, "global_step": 8123, "epoch": 193} {"train_loss": -5.026753902435303, "global_step": 8124, "epoch": 193} {"train_loss": -5.016201972961426, "global_step": 8125, "epoch": 193} {"train_loss": -4.935914039611816, "global_step": 8126, "epoch": 193} {"train_loss": -4.7106523513793945, "global_step": 8127, "epoch": 193} {"train_loss": -4.927762985229492, "global_step": 8128, "epoch": 193} {"train_loss": -4.8423662185668945, "global_step": 8129, "epoch": 193} {"train_loss": -4.894374847412109, "global_step": 8130, "epoch": 193} {"train_loss": -4.862673759460449, "global_step": 8131, "epoch": 193} {"train_loss": -4.930862903594971, "global_step": 8132, "epoch": 193} {"train_loss": -4.979313850402832, "global_step": 8133, "epoch": 193} {"train_loss": -4.941690444946289, "global_step": 8134, "epoch": 193} {"train_loss": -4.858882904052734, "global_step": 8135, "epoch": 193} {"train_loss": -4.860114097595215, "global_step": 8136, "epoch": 193} {"train_loss": -5.013943672180176, "global_step": 8137, "epoch": 193} {"train_loss": -4.8831706047058105, "global_step": 8138, "epoch": 193} {"train_loss": -5.039676666259766, "global_step": 8139, "epoch": 193} {"train_loss": -4.887669086456299, "global_step": 8140, "epoch": 193} {"train_loss": -5.015169143676758, "global_step": 8141, "epoch": 193} {"train_loss": -5.175191879272461, "global_step": 8142, "epoch": 193} {"train_loss": -4.749281883239746, "global_step": 8143, "epoch": 193} {"train_loss": -4.971019744873047, "global_step": 8144, "epoch": 193} {"train_loss": -4.991242408752441, "global_step": 8145, "epoch": 193} {"train_loss": -4.900881290435791, "global_step": 8146, "epoch": 193} {"train_loss": -4.949752796263922, "global_step": 8147, "epoch": 193, "val_loss": 83286.2890625} {"train_loss": -4.9550371170043945, "global_step": 8148, "epoch": 194} {"train_loss": -4.925711631774902, "global_step": 8149, "epoch": 194} {"train_loss": -4.923055648803711, "global_step": 8150, "epoch": 194} {"train_loss": -4.961669921875, "global_step": 8151, "epoch": 194} {"train_loss": -4.95916748046875, "global_step": 8152, "epoch": 194} {"train_loss": -4.965123653411865, "global_step": 8153, "epoch": 194} {"train_loss": -5.069829940795898, "global_step": 8154, "epoch": 194} {"train_loss": -5.036506652832031, "global_step": 8155, "epoch": 194} {"train_loss": -4.89633846282959, "global_step": 8156, "epoch": 194} {"train_loss": -4.964890956878662, "global_step": 8157, "epoch": 194} {"train_loss": -4.902218818664551, "global_step": 8158, "epoch": 194} {"train_loss": -4.928099632263184, "global_step": 8159, "epoch": 194} {"train_loss": -4.8224992752075195, "global_step": 8160, "epoch": 194} {"train_loss": -4.918246269226074, "global_step": 8161, "epoch": 194} {"train_loss": -5.024959564208984, "global_step": 8162, "epoch": 194} {"train_loss": -4.91143274307251, "global_step": 8163, "epoch": 194} {"train_loss": -4.6899261474609375, "global_step": 8164, "epoch": 194} {"train_loss": -4.877185821533203, "global_step": 8165, "epoch": 194} {"train_loss": -4.84092378616333, "global_step": 8166, "epoch": 194} {"train_loss": -4.942604064941406, "global_step": 8167, "epoch": 194} {"train_loss": -5.139707088470459, "global_step": 8168, "epoch": 194} {"train_loss": -5.057905197143555, "global_step": 8169, "epoch": 194} {"train_loss": -4.9836626052856445, "global_step": 8170, "epoch": 194} {"train_loss": -4.923343658447266, "global_step": 8171, "epoch": 194} {"train_loss": -5.077378273010254, "global_step": 8172, "epoch": 194} {"train_loss": -5.05148458480835, "global_step": 8173, "epoch": 194} {"train_loss": -4.973216533660889, "global_step": 8174, "epoch": 194} {"train_loss": -4.986763954162598, "global_step": 8175, "epoch": 194} {"train_loss": -5.113029479980469, "global_step": 8176, "epoch": 194} {"train_loss": -5.081253528594971, "global_step": 8177, "epoch": 194} {"train_loss": -4.972334861755371, "global_step": 8178, "epoch": 194} {"train_loss": -5.019874572753906, "global_step": 8179, "epoch": 194} {"train_loss": -4.958115577697754, "global_step": 8180, "epoch": 194} {"train_loss": -4.963448524475098, "global_step": 8181, "epoch": 194} {"train_loss": -5.018219470977783, "global_step": 8182, "epoch": 194} {"train_loss": -4.838708877563477, "global_step": 8183, "epoch": 194} {"train_loss": -4.995152950286865, "global_step": 8184, "epoch": 194} {"train_loss": -5.001832008361816, "global_step": 8185, "epoch": 194} {"train_loss": -5.0052313804626465, "global_step": 8186, "epoch": 194} {"train_loss": -5.075732231140137, "global_step": 8187, "epoch": 194} {"train_loss": -5.05104923248291, "global_step": 8188, "epoch": 194} {"train_loss": -4.97171535946074, "global_step": 8189, "epoch": 194, "val_loss": 81321.6640625} {"train_loss": -5.002406597137451, "global_step": 8190, "epoch": 195} {"train_loss": -5.075469017028809, "global_step": 8191, "epoch": 195} {"train_loss": -5.0020751953125, "global_step": 8192, "epoch": 195} {"train_loss": -5.040525436401367, "global_step": 8193, "epoch": 195} {"train_loss": -4.979108810424805, "global_step": 8194, "epoch": 195} {"train_loss": -5.138330936431885, "global_step": 8195, "epoch": 195} {"train_loss": -5.01460075378418, "global_step": 8196, "epoch": 195} {"train_loss": -4.859348297119141, "global_step": 8197, "epoch": 195} {"train_loss": -4.980619430541992, "global_step": 8198, "epoch": 195} {"train_loss": -5.023479461669922, "global_step": 8199, "epoch": 195} {"train_loss": -5.016228199005127, "global_step": 8200, "epoch": 195} {"train_loss": -4.870210647583008, "global_step": 8201, "epoch": 195} {"train_loss": -4.956998348236084, "global_step": 8202, "epoch": 195} {"train_loss": -5.012209892272949, "global_step": 8203, "epoch": 195} {"train_loss": -4.959261894226074, "global_step": 8204, "epoch": 195} {"train_loss": -4.893759250640869, "global_step": 8205, "epoch": 195} {"train_loss": -4.912928581237793, "global_step": 8206, "epoch": 195} {"train_loss": -5.008212566375732, "global_step": 8207, "epoch": 195} {"train_loss": -4.908157825469971, "global_step": 8208, "epoch": 195} {"train_loss": -5.03901481628418, "global_step": 8209, "epoch": 195} {"train_loss": -4.885010242462158, "global_step": 8210, "epoch": 195} {"train_loss": -4.950572490692139, "global_step": 8211, "epoch": 195} {"train_loss": -4.789545059204102, "global_step": 8212, "epoch": 195} {"train_loss": -4.982500076293945, "global_step": 8213, "epoch": 195} {"train_loss": -4.818885803222656, "global_step": 8214, "epoch": 195} {"train_loss": -5.0696024894714355, "global_step": 8215, "epoch": 195} {"train_loss": -5.103066444396973, "global_step": 8216, "epoch": 195} {"train_loss": -5.1224589347839355, "global_step": 8217, "epoch": 195} {"train_loss": -5.047983169555664, "global_step": 8218, "epoch": 195} {"train_loss": -4.826996326446533, "global_step": 8219, "epoch": 195} {"train_loss": -4.899658203125, "global_step": 8220, "epoch": 195} {"train_loss": -5.110867500305176, "global_step": 8221, "epoch": 195} {"train_loss": -5.111090660095215, "global_step": 8222, "epoch": 195} {"train_loss": -4.840246200561523, "global_step": 8223, "epoch": 195} {"train_loss": -5.016694068908691, "global_step": 8224, "epoch": 195} {"train_loss": -5.065888404846191, "global_step": 8225, "epoch": 195} {"train_loss": -5.046942710876465, "global_step": 8226, "epoch": 195} {"train_loss": -5.005930423736572, "global_step": 8227, "epoch": 195} {"train_loss": -5.060511589050293, "global_step": 8228, "epoch": 195} {"train_loss": -4.864816665649414, "global_step": 8229, "epoch": 195} {"train_loss": -5.077779293060303, "global_step": 8230, "epoch": 195} {"train_loss": -4.981525670914423, "global_step": 8231, "epoch": 195, "val_loss": 81307.921875} {"train_loss": -5.101861476898193, "global_step": 8232, "epoch": 196} {"train_loss": -5.043843746185303, "global_step": 8233, "epoch": 196} {"train_loss": -5.166059970855713, "global_step": 8234, "epoch": 196} {"train_loss": -4.927498817443848, "global_step": 8235, "epoch": 196} {"train_loss": -4.949747085571289, "global_step": 8236, "epoch": 196} {"train_loss": -5.051536560058594, "global_step": 8237, "epoch": 196} {"train_loss": -5.010740280151367, "global_step": 8238, "epoch": 196} {"train_loss": -4.678610801696777, "global_step": 8239, "epoch": 196} {"train_loss": -4.850190162658691, "global_step": 8240, "epoch": 196} {"train_loss": -4.966923236846924, "global_step": 8241, "epoch": 196} {"train_loss": -4.606917858123779, "global_step": 8242, "epoch": 196} {"train_loss": -5.047536373138428, "global_step": 8243, "epoch": 196} {"train_loss": -4.731601715087891, "global_step": 8244, "epoch": 196} {"train_loss": -4.815716743469238, "global_step": 8245, "epoch": 196} {"train_loss": -4.786593437194824, "global_step": 8246, "epoch": 196} {"train_loss": -4.855680465698242, "global_step": 8247, "epoch": 196} {"train_loss": -5.104739665985107, "global_step": 8248, "epoch": 196} {"train_loss": -4.9898271560668945, "global_step": 8249, "epoch": 196} {"train_loss": -5.073034286499023, "global_step": 8250, "epoch": 196} {"train_loss": -5.008246898651123, "global_step": 8251, "epoch": 196} {"train_loss": -4.97743034362793, "global_step": 8252, "epoch": 196} {"train_loss": -4.959991455078125, "global_step": 8253, "epoch": 196} {"train_loss": -4.850168228149414, "global_step": 8254, "epoch": 196} {"train_loss": -4.857468605041504, "global_step": 8255, "epoch": 196} {"train_loss": -4.965824604034424, "global_step": 8256, "epoch": 196} {"train_loss": -4.987508296966553, "global_step": 8257, "epoch": 196} {"train_loss": -5.037233352661133, "global_step": 8258, "epoch": 196} {"train_loss": -4.885385513305664, "global_step": 8259, "epoch": 196} {"train_loss": -5.0885772705078125, "global_step": 8260, "epoch": 196} {"train_loss": -4.959174156188965, "global_step": 8261, "epoch": 196} {"train_loss": -4.999352931976318, "global_step": 8262, "epoch": 196} {"train_loss": -5.014838218688965, "global_step": 8263, "epoch": 196} {"train_loss": -5.089171409606934, "global_step": 8264, "epoch": 196} {"train_loss": -5.181554794311523, "global_step": 8265, "epoch": 196} {"train_loss": -5.078678131103516, "global_step": 8266, "epoch": 196} {"train_loss": -5.083890914916992, "global_step": 8267, "epoch": 196} {"train_loss": -4.999415397644043, "global_step": 8268, "epoch": 196} {"train_loss": -5.130833625793457, "global_step": 8269, "epoch": 196} {"train_loss": -4.9674072265625, "global_step": 8270, "epoch": 196} {"train_loss": -5.015960693359375, "global_step": 8271, "epoch": 196} {"train_loss": -5.032049179077148, "global_step": 8272, "epoch": 196} {"train_loss": -4.9745538121178035, "global_step": 8273, "epoch": 196, "val_loss": 81085.578125} {"train_loss": -4.909976959228516, "global_step": 8274, "epoch": 197} {"train_loss": -5.055870056152344, "global_step": 8275, "epoch": 197} {"train_loss": -5.165846824645996, "global_step": 8276, "epoch": 197} {"train_loss": -4.98960542678833, "global_step": 8277, "epoch": 197} {"train_loss": -5.035034656524658, "global_step": 8278, "epoch": 197} {"train_loss": -5.0243682861328125, "global_step": 8279, "epoch": 197} {"train_loss": -5.047411918640137, "global_step": 8280, "epoch": 197} {"train_loss": -4.975414276123047, "global_step": 8281, "epoch": 197} {"train_loss": -5.069117546081543, "global_step": 8282, "epoch": 197} {"train_loss": -4.878429412841797, "global_step": 8283, "epoch": 197} {"train_loss": -4.939007759094238, "global_step": 8284, "epoch": 197} {"train_loss": -5.000197887420654, "global_step": 8285, "epoch": 197} {"train_loss": -4.801750183105469, "global_step": 8286, "epoch": 197} {"train_loss": -4.911555767059326, "global_step": 8287, "epoch": 197} {"train_loss": -5.137410640716553, "global_step": 8288, "epoch": 197} {"train_loss": -4.823971748352051, "global_step": 8289, "epoch": 197} {"train_loss": -4.848294258117676, "global_step": 8290, "epoch": 197} {"train_loss": -4.95943546295166, "global_step": 8291, "epoch": 197} {"train_loss": -4.900669097900391, "global_step": 8292, "epoch": 197} {"train_loss": -4.923413276672363, "global_step": 8293, "epoch": 197} {"train_loss": -4.691027641296387, "global_step": 8294, "epoch": 197} {"train_loss": -4.863860130310059, "global_step": 8295, "epoch": 197} {"train_loss": -4.905628204345703, "global_step": 8296, "epoch": 197} {"train_loss": -5.0294904708862305, "global_step": 8297, "epoch": 197} {"train_loss": -4.958520889282227, "global_step": 8298, "epoch": 197} {"train_loss": -4.982465744018555, "global_step": 8299, "epoch": 197} {"train_loss": -5.005632400512695, "global_step": 8300, "epoch": 197} {"train_loss": -5.090937614440918, "global_step": 8301, "epoch": 197} {"train_loss": -5.0264177322387695, "global_step": 8302, "epoch": 197} {"train_loss": -4.911581993103027, "global_step": 8303, "epoch": 197} {"train_loss": -4.928243637084961, "global_step": 8304, "epoch": 197} {"train_loss": -4.931026458740234, "global_step": 8305, "epoch": 197} {"train_loss": -5.046811103820801, "global_step": 8306, "epoch": 197} {"train_loss": -5.0581817626953125, "global_step": 8307, "epoch": 197} {"train_loss": -5.017045974731445, "global_step": 8308, "epoch": 197} {"train_loss": -4.9217658042907715, "global_step": 8309, "epoch": 197} {"train_loss": -5.065070152282715, "global_step": 8310, "epoch": 197} {"train_loss": -5.074429988861084, "global_step": 8311, "epoch": 197} {"train_loss": -4.995979309082031, "global_step": 8312, "epoch": 197} {"train_loss": -5.034686088562012, "global_step": 8313, "epoch": 197} {"train_loss": -5.0271148681640625, "global_step": 8314, "epoch": 197} {"train_loss": -4.979095572517032, "global_step": 8315, "epoch": 197, "val_loss": 81562.8125} {"train_loss": -5.125005722045898, "global_step": 8316, "epoch": 198} {"train_loss": -5.129715919494629, "global_step": 8317, "epoch": 198} {"train_loss": -5.071972370147705, "global_step": 8318, "epoch": 198} {"train_loss": -4.821627616882324, "global_step": 8319, "epoch": 198} {"train_loss": -5.061489105224609, "global_step": 8320, "epoch": 198} {"train_loss": -5.046576023101807, "global_step": 8321, "epoch": 198} {"train_loss": -4.968548774719238, "global_step": 8322, "epoch": 198} {"train_loss": -5.0794782638549805, "global_step": 8323, "epoch": 198} {"train_loss": -5.094573974609375, "global_step": 8324, "epoch": 198} {"train_loss": -5.075896263122559, "global_step": 8325, "epoch": 198} {"train_loss": -5.161808967590332, "global_step": 8326, "epoch": 198} {"train_loss": -4.93231201171875, "global_step": 8327, "epoch": 198} {"train_loss": -5.036514759063721, "global_step": 8328, "epoch": 198} {"train_loss": -4.994255542755127, "global_step": 8329, "epoch": 198} {"train_loss": -4.979098320007324, "global_step": 8330, "epoch": 198} {"train_loss": -4.8011674880981445, "global_step": 8331, "epoch": 198} {"train_loss": -5.026129722595215, "global_step": 8332, "epoch": 198} {"train_loss": -4.999063014984131, "global_step": 8333, "epoch": 198} {"train_loss": -4.9133734703063965, "global_step": 8334, "epoch": 198} {"train_loss": -5.101555347442627, "global_step": 8335, "epoch": 198} {"train_loss": -5.108037948608398, "global_step": 8336, "epoch": 198} {"train_loss": -4.978649139404297, "global_step": 8337, "epoch": 198} {"train_loss": -5.077624320983887, "global_step": 8338, "epoch": 198} {"train_loss": -4.9331231117248535, "global_step": 8339, "epoch": 198} {"train_loss": -5.038896560668945, "global_step": 8340, "epoch": 198} {"train_loss": -5.138589859008789, "global_step": 8341, "epoch": 198} {"train_loss": -4.974735260009766, "global_step": 8342, "epoch": 198} {"train_loss": -5.117392539978027, "global_step": 8343, "epoch": 198} {"train_loss": -5.1115827560424805, "global_step": 8344, "epoch": 198} {"train_loss": -4.923392295837402, "global_step": 8345, "epoch": 198} {"train_loss": -5.177086353302002, "global_step": 8346, "epoch": 198} {"train_loss": -4.9498748779296875, "global_step": 8347, "epoch": 198} {"train_loss": -5.05234432220459, "global_step": 8348, "epoch": 198} {"train_loss": -4.913849830627441, "global_step": 8349, "epoch": 198} {"train_loss": -4.952980995178223, "global_step": 8350, "epoch": 198} {"train_loss": -4.955345630645752, "global_step": 8351, "epoch": 198} {"train_loss": -4.93035888671875, "global_step": 8352, "epoch": 198} {"train_loss": -5.032747268676758, "global_step": 8353, "epoch": 198} {"train_loss": -4.876532554626465, "global_step": 8354, "epoch": 198} {"train_loss": -4.939140319824219, "global_step": 8355, "epoch": 198} {"train_loss": -5.079876899719238, "global_step": 8356, "epoch": 198} {"train_loss": -5.016344354266212, "global_step": 8357, "epoch": 198, "val_loss": 81191.875} {"train_loss": -4.995920181274414, "global_step": 8358, "epoch": 199} {"train_loss": -5.067566871643066, "global_step": 8359, "epoch": 199} {"train_loss": -4.907127380371094, "global_step": 8360, "epoch": 199} {"train_loss": -5.065845489501953, "global_step": 8361, "epoch": 199} {"train_loss": -4.993475914001465, "global_step": 8362, "epoch": 199} {"train_loss": -5.03751277923584, "global_step": 8363, "epoch": 199} {"train_loss": -4.7602033615112305, "global_step": 8364, "epoch": 199} {"train_loss": -4.815218925476074, "global_step": 8365, "epoch": 199} {"train_loss": -4.9401350021362305, "global_step": 8366, "epoch": 199} {"train_loss": -4.764796257019043, "global_step": 8367, "epoch": 199} {"train_loss": -4.899866104125977, "global_step": 8368, "epoch": 199} {"train_loss": -4.785462856292725, "global_step": 8369, "epoch": 199} {"train_loss": -4.791830062866211, "global_step": 8370, "epoch": 199} {"train_loss": -4.943337440490723, "global_step": 8371, "epoch": 199} {"train_loss": -4.688092231750488, "global_step": 8372, "epoch": 199} {"train_loss": -4.721634864807129, "global_step": 8373, "epoch": 199} {"train_loss": -4.847446441650391, "global_step": 8374, "epoch": 199} {"train_loss": -4.770102500915527, "global_step": 8375, "epoch": 199} {"train_loss": -4.74713134765625, "global_step": 8376, "epoch": 199} {"train_loss": -5.0284857749938965, "global_step": 8377, "epoch": 199} {"train_loss": -4.798770904541016, "global_step": 8378, "epoch": 199} {"train_loss": -4.947945594787598, "global_step": 8379, "epoch": 199} {"train_loss": -4.9660844802856445, "global_step": 8380, "epoch": 199} {"train_loss": -4.890806674957275, "global_step": 8381, "epoch": 199} {"train_loss": -5.029332160949707, "global_step": 8382, "epoch": 199} {"train_loss": -4.828967094421387, "global_step": 8383, "epoch": 199} {"train_loss": -4.8088812828063965, "global_step": 8384, "epoch": 199} {"train_loss": -5.029438495635986, "global_step": 8385, "epoch": 199} {"train_loss": -4.818633079528809, "global_step": 8386, "epoch": 199} {"train_loss": -5.037352085113525, "global_step": 8387, "epoch": 199} {"train_loss": -4.8855085372924805, "global_step": 8388, "epoch": 199} {"train_loss": -5.020538330078125, "global_step": 8389, "epoch": 199} {"train_loss": -5.034424781799316, "global_step": 8390, "epoch": 199} {"train_loss": -4.899378776550293, "global_step": 8391, "epoch": 199} {"train_loss": -4.9633564949035645, "global_step": 8392, "epoch": 199} {"train_loss": -4.975556373596191, "global_step": 8393, "epoch": 199} {"train_loss": -4.9721879959106445, "global_step": 8394, "epoch": 199} {"train_loss": -4.840689659118652, "global_step": 8395, "epoch": 199} {"train_loss": -4.931595802307129, "global_step": 8396, "epoch": 199} {"train_loss": -5.0572919845581055, "global_step": 8397, "epoch": 199} {"train_loss": -5.022923946380615, "global_step": 8398, "epoch": 199} {"train_loss": -4.914220037914458, "global_step": 8399, "epoch": 199, "val_loss": 80678.7421875} {"train_loss": -5.149604797363281, "global_step": 8400, "epoch": 200} {"train_loss": -4.958797454833984, "global_step": 8401, "epoch": 200} {"train_loss": -4.958295822143555, "global_step": 8402, "epoch": 200} {"train_loss": -5.04805850982666, "global_step": 8403, "epoch": 200} {"train_loss": -4.914848327636719, "global_step": 8404, "epoch": 200} {"train_loss": -4.989019870758057, "global_step": 8405, "epoch": 200} {"train_loss": -5.122714042663574, "global_step": 8406, "epoch": 200} {"train_loss": -4.974569320678711, "global_step": 8407, "epoch": 200} {"train_loss": -4.971845626831055, "global_step": 8408, "epoch": 200} {"train_loss": -4.976927757263184, "global_step": 8409, "epoch": 200} {"train_loss": -4.874106407165527, "global_step": 8410, "epoch": 200} {"train_loss": -4.884487152099609, "global_step": 8411, "epoch": 200} {"train_loss": -4.9733757972717285, "global_step": 8412, "epoch": 200} {"train_loss": -5.094377517700195, "global_step": 8413, "epoch": 200} {"train_loss": -4.965874195098877, "global_step": 8414, "epoch": 200} {"train_loss": -4.97032356262207, "global_step": 8415, "epoch": 200} {"train_loss": -5.027259826660156, "global_step": 8416, "epoch": 200} {"train_loss": -5.094937324523926, "global_step": 8417, "epoch": 200} {"train_loss": -4.889165878295898, "global_step": 8418, "epoch": 200} {"train_loss": -5.098007678985596, "global_step": 8419, "epoch": 200} {"train_loss": -5.15308952331543, "global_step": 8420, "epoch": 200} {"train_loss": -4.811082363128662, "global_step": 8421, "epoch": 200} {"train_loss": -4.975503921508789, "global_step": 8422, "epoch": 200} {"train_loss": -4.9063239097595215, "global_step": 8423, "epoch": 200} {"train_loss": -4.849086761474609, "global_step": 8424, "epoch": 200} {"train_loss": -5.015294075012207, "global_step": 8425, "epoch": 200} {"train_loss": -5.041389465332031, "global_step": 8426, "epoch": 200} {"train_loss": -4.78046989440918, "global_step": 8427, "epoch": 200} {"train_loss": -4.957159042358398, "global_step": 8428, "epoch": 200} {"train_loss": -4.957268714904785, "global_step": 8429, "epoch": 200} {"train_loss": -4.8179521560668945, "global_step": 8430, "epoch": 200} {"train_loss": -5.0188093185424805, "global_step": 8431, "epoch": 200} {"train_loss": -5.0509538650512695, "global_step": 8432, "epoch": 200} {"train_loss": -4.875167369842529, "global_step": 8433, "epoch": 200} {"train_loss": -5.105665683746338, "global_step": 8434, "epoch": 200} {"train_loss": -4.87092399597168, "global_step": 8435, "epoch": 200} {"train_loss": -4.953616142272949, "global_step": 8436, "epoch": 200} {"train_loss": -4.895267963409424, "global_step": 8437, "epoch": 200} {"train_loss": -5.031210899353027, "global_step": 8438, "epoch": 200} {"train_loss": -5.077463626861572, "global_step": 8439, "epoch": 200} {"train_loss": -4.95587682723999, "global_step": 8440, "epoch": 200} {"train_loss": -4.978648367382231, "global_step": 8441, "epoch": 200, "train/sim_max_reward_0": 0.40994307399583685, "train/sim_max_reward_1": 0.556492560436495, "train/sim_max_reward_2": 0.2756239552787644, "train/sim_max_reward_3": 0.059410731579894294, "train/sim_max_reward_4": 0.314233903267764, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.21573406863747555, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.0, "test/sim_max_reward_4400010": 0.1608555189175478, "test/sim_max_reward_4400011": 0.07444930221154836, "test/sim_max_reward_4400012": 0.15971809331970138, "test/sim_max_reward_4400013": 0.08505138257046205, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.060045094578013894, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3084919338531987, "test/sim_max_reward_4400022": 0.013958017817960343, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.27598147085354124, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.001845948190695572, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.40775750273020894, "test/sim_max_reward_4400031": 0.23687823249651238, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3008147651189276, "test/sim_max_reward_4400034": 0.4447504387557852, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.4169750492676326, "test/sim_max_reward_4400037": 0.38855059182036594, "test/sim_max_reward_4400038": 0.0036424907160993274, "test/sim_max_reward_4400039": 0.4885169564789804, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5279480075820168, "test/sim_max_reward_4400042": 0.012787967447422196, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.5102796351125902, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.26111398924365287, "test/sim_max_reward_4400047": 0.029039071455165027, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.3014481639868236, "test/mean_score": 0.13161964269102192, "val_loss": 80959.421875} {"train_loss": -5.138429641723633, "global_step": 8442, "epoch": 201} {"train_loss": -4.848982810974121, "global_step": 8443, "epoch": 201} {"train_loss": -5.150496482849121, "global_step": 8444, "epoch": 201} {"train_loss": -4.975780487060547, "global_step": 8445, "epoch": 201} {"train_loss": -5.086569309234619, "global_step": 8446, "epoch": 201} {"train_loss": -4.975323677062988, "global_step": 8447, "epoch": 201} {"train_loss": -4.983633518218994, "global_step": 8448, "epoch": 201} {"train_loss": -4.961431980133057, "global_step": 8449, "epoch": 201} {"train_loss": -4.88624906539917, "global_step": 8450, "epoch": 201} {"train_loss": -5.080631732940674, "global_step": 8451, "epoch": 201} {"train_loss": -5.020913124084473, "global_step": 8452, "epoch": 201} {"train_loss": -4.968181610107422, "global_step": 8453, "epoch": 201} {"train_loss": -5.023930549621582, "global_step": 8454, "epoch": 201} {"train_loss": -4.996514320373535, "global_step": 8455, "epoch": 201} {"train_loss": -4.845610618591309, "global_step": 8456, "epoch": 201} {"train_loss": -4.897149562835693, "global_step": 8457, "epoch": 201} {"train_loss": -5.096530914306641, "global_step": 8458, "epoch": 201} {"train_loss": -5.011350631713867, "global_step": 8459, "epoch": 201} {"train_loss": -4.907352924346924, "global_step": 8460, "epoch": 201} {"train_loss": -5.004051208496094, "global_step": 8461, "epoch": 201} {"train_loss": -5.048938274383545, "global_step": 8462, "epoch": 201} {"train_loss": -5.004783630371094, "global_step": 8463, "epoch": 201} {"train_loss": -4.689341068267822, "global_step": 8464, "epoch": 201} {"train_loss": -4.958044052124023, "global_step": 8465, "epoch": 201} {"train_loss": -4.993229866027832, "global_step": 8466, "epoch": 201} {"train_loss": -4.874904632568359, "global_step": 8467, "epoch": 201} {"train_loss": -5.147937297821045, "global_step": 8468, "epoch": 201} {"train_loss": -5.044838905334473, "global_step": 8469, "epoch": 201} {"train_loss": -5.138201713562012, "global_step": 8470, "epoch": 201} {"train_loss": -4.962560653686523, "global_step": 8471, "epoch": 201} {"train_loss": -5.00040340423584, "global_step": 8472, "epoch": 201} {"train_loss": -5.043084621429443, "global_step": 8473, "epoch": 201} {"train_loss": -5.132501125335693, "global_step": 8474, "epoch": 201} {"train_loss": -5.087578773498535, "global_step": 8475, "epoch": 201} {"train_loss": -4.916280746459961, "global_step": 8476, "epoch": 201} {"train_loss": -4.946137428283691, "global_step": 8477, "epoch": 201} {"train_loss": -5.01692008972168, "global_step": 8478, "epoch": 201} {"train_loss": -4.961450576782227, "global_step": 8479, "epoch": 201} {"train_loss": -5.098490238189697, "global_step": 8480, "epoch": 201} {"train_loss": -4.983523368835449, "global_step": 8481, "epoch": 201} {"train_loss": -5.113687515258789, "global_step": 8482, "epoch": 201} {"train_loss": -4.999559413819086, "global_step": 8483, "epoch": 201, "val_loss": 80625.375} {"train_loss": -5.067676544189453, "global_step": 8484, "epoch": 202} {"train_loss": -5.18285608291626, "global_step": 8485, "epoch": 202} {"train_loss": -5.065715789794922, "global_step": 8486, "epoch": 202} {"train_loss": -4.7913994789123535, "global_step": 8487, "epoch": 202} {"train_loss": -4.766867160797119, "global_step": 8488, "epoch": 202} {"train_loss": -5.084412574768066, "global_step": 8489, "epoch": 202} {"train_loss": -4.998053550720215, "global_step": 8490, "epoch": 202} {"train_loss": -4.908936500549316, "global_step": 8491, "epoch": 202} {"train_loss": -4.935896396636963, "global_step": 8492, "epoch": 202} {"train_loss": -5.028406143188477, "global_step": 8493, "epoch": 202} {"train_loss": -4.890686511993408, "global_step": 8494, "epoch": 202} {"train_loss": -5.041839599609375, "global_step": 8495, "epoch": 202} {"train_loss": -5.013800621032715, "global_step": 8496, "epoch": 202} {"train_loss": -5.015560626983643, "global_step": 8497, "epoch": 202} {"train_loss": -4.862981796264648, "global_step": 8498, "epoch": 202} {"train_loss": -5.124383926391602, "global_step": 8499, "epoch": 202} {"train_loss": -5.067143440246582, "global_step": 8500, "epoch": 202} {"train_loss": -5.038444519042969, "global_step": 8501, "epoch": 202} {"train_loss": -4.819695472717285, "global_step": 8502, "epoch": 202} {"train_loss": -4.979713439941406, "global_step": 8503, "epoch": 202} {"train_loss": -4.841852188110352, "global_step": 8504, "epoch": 202} {"train_loss": -5.089004993438721, "global_step": 8505, "epoch": 202} {"train_loss": -5.005029678344727, "global_step": 8506, "epoch": 202} {"train_loss": -5.010290145874023, "global_step": 8507, "epoch": 202} {"train_loss": -4.987704753875732, "global_step": 8508, "epoch": 202} {"train_loss": -5.1572585105896, "global_step": 8509, "epoch": 202} {"train_loss": -4.990291118621826, "global_step": 8510, "epoch": 202} {"train_loss": -4.956980228424072, "global_step": 8511, "epoch": 202} {"train_loss": -5.017738342285156, "global_step": 8512, "epoch": 202} {"train_loss": -4.976619720458984, "global_step": 8513, "epoch": 202} {"train_loss": -5.024456024169922, "global_step": 8514, "epoch": 202} {"train_loss": -5.008334159851074, "global_step": 8515, "epoch": 202} {"train_loss": -4.898343086242676, "global_step": 8516, "epoch": 202} {"train_loss": -4.964655876159668, "global_step": 8517, "epoch": 202} {"train_loss": -5.06686544418335, "global_step": 8518, "epoch": 202} {"train_loss": -4.996343612670898, "global_step": 8519, "epoch": 202} {"train_loss": -4.943059921264648, "global_step": 8520, "epoch": 202} {"train_loss": -4.913367748260498, "global_step": 8521, "epoch": 202} {"train_loss": -5.033714294433594, "global_step": 8522, "epoch": 202} {"train_loss": -4.965528964996338, "global_step": 8523, "epoch": 202} {"train_loss": -4.868931770324707, "global_step": 8524, "epoch": 202} {"train_loss": -4.985132989429292, "global_step": 8525, "epoch": 202, "val_loss": 80507.6796875} {"train_loss": -5.109807014465332, "global_step": 8526, "epoch": 203} {"train_loss": -5.047126770019531, "global_step": 8527, "epoch": 203} {"train_loss": -4.973452091217041, "global_step": 8528, "epoch": 203} {"train_loss": -5.13514518737793, "global_step": 8529, "epoch": 203} {"train_loss": -5.092552185058594, "global_step": 8530, "epoch": 203} {"train_loss": -5.056987762451172, "global_step": 8531, "epoch": 203} {"train_loss": -4.964178085327148, "global_step": 8532, "epoch": 203} {"train_loss": -5.102056503295898, "global_step": 8533, "epoch": 203} {"train_loss": -4.967925548553467, "global_step": 8534, "epoch": 203} {"train_loss": -4.97261381149292, "global_step": 8535, "epoch": 203} {"train_loss": -4.994364261627197, "global_step": 8536, "epoch": 203} {"train_loss": -5.061492919921875, "global_step": 8537, "epoch": 203} {"train_loss": -5.110816955566406, "global_step": 8538, "epoch": 203} {"train_loss": -5.073702812194824, "global_step": 8539, "epoch": 203} {"train_loss": -5.1028547286987305, "global_step": 8540, "epoch": 203} {"train_loss": -5.019532203674316, "global_step": 8541, "epoch": 203} {"train_loss": -4.990140438079834, "global_step": 8542, "epoch": 203} {"train_loss": -5.0078444480896, "global_step": 8543, "epoch": 203} {"train_loss": -4.950076103210449, "global_step": 8544, "epoch": 203} {"train_loss": -4.850341796875, "global_step": 8545, "epoch": 203} {"train_loss": -4.731794357299805, "global_step": 8546, "epoch": 203} {"train_loss": -4.796926021575928, "global_step": 8547, "epoch": 203} {"train_loss": -4.81011962890625, "global_step": 8548, "epoch": 203} {"train_loss": -4.986294746398926, "global_step": 8549, "epoch": 203} {"train_loss": -4.679605484008789, "global_step": 8550, "epoch": 203} {"train_loss": -4.802637577056885, "global_step": 8551, "epoch": 203} {"train_loss": -4.905743598937988, "global_step": 8552, "epoch": 203} {"train_loss": -4.850368499755859, "global_step": 8553, "epoch": 203} {"train_loss": -4.836980819702148, "global_step": 8554, "epoch": 203} {"train_loss": -4.848349571228027, "global_step": 8555, "epoch": 203} {"train_loss": -4.901144027709961, "global_step": 8556, "epoch": 203} {"train_loss": -4.9331583976745605, "global_step": 8557, "epoch": 203} {"train_loss": -4.795512676239014, "global_step": 8558, "epoch": 203} {"train_loss": -4.792792797088623, "global_step": 8559, "epoch": 203} {"train_loss": -4.8205413818359375, "global_step": 8560, "epoch": 203} {"train_loss": -5.081543922424316, "global_step": 8561, "epoch": 203} {"train_loss": -4.918008804321289, "global_step": 8562, "epoch": 203} {"train_loss": -4.680438041687012, "global_step": 8563, "epoch": 203} {"train_loss": -4.909991264343262, "global_step": 8564, "epoch": 203} {"train_loss": -4.874320983886719, "global_step": 8565, "epoch": 203} {"train_loss": -5.095499038696289, "global_step": 8566, "epoch": 203} {"train_loss": -4.941623131434123, "global_step": 8567, "epoch": 203, "val_loss": 81396.8515625} {"train_loss": -5.049987316131592, "global_step": 8568, "epoch": 204} {"train_loss": -4.974763870239258, "global_step": 8569, "epoch": 204} {"train_loss": -4.9243011474609375, "global_step": 8570, "epoch": 204} {"train_loss": -5.028609275817871, "global_step": 8571, "epoch": 204} {"train_loss": -4.98740816116333, "global_step": 8572, "epoch": 204} {"train_loss": -4.99263334274292, "global_step": 8573, "epoch": 204} {"train_loss": -4.979282379150391, "global_step": 8574, "epoch": 204} {"train_loss": -5.0320563316345215, "global_step": 8575, "epoch": 204} {"train_loss": -4.95988130569458, "global_step": 8576, "epoch": 204} {"train_loss": -5.088592529296875, "global_step": 8577, "epoch": 204} {"train_loss": -4.889692306518555, "global_step": 8578, "epoch": 204} {"train_loss": -4.964383602142334, "global_step": 8579, "epoch": 204} {"train_loss": -5.0469560623168945, "global_step": 8580, "epoch": 204} {"train_loss": -5.150524139404297, "global_step": 8581, "epoch": 204} {"train_loss": -5.126603126525879, "global_step": 8582, "epoch": 204} {"train_loss": -5.056248664855957, "global_step": 8583, "epoch": 204} {"train_loss": -5.167635917663574, "global_step": 8584, "epoch": 204} {"train_loss": -4.915088176727295, "global_step": 8585, "epoch": 204} {"train_loss": -5.009694576263428, "global_step": 8586, "epoch": 204} {"train_loss": -4.994235038757324, "global_step": 8587, "epoch": 204} {"train_loss": -4.859031677246094, "global_step": 8588, "epoch": 204} {"train_loss": -5.037820339202881, "global_step": 8589, "epoch": 204} {"train_loss": -5.089851379394531, "global_step": 8590, "epoch": 204} {"train_loss": -5.081689357757568, "global_step": 8591, "epoch": 204} {"train_loss": -5.0010223388671875, "global_step": 8592, "epoch": 204} {"train_loss": -5.123213768005371, "global_step": 8593, "epoch": 204} {"train_loss": -4.9488606452941895, "global_step": 8594, "epoch": 204} {"train_loss": -5.106386184692383, "global_step": 8595, "epoch": 204} {"train_loss": -5.052294731140137, "global_step": 8596, "epoch": 204} {"train_loss": -4.823390960693359, "global_step": 8597, "epoch": 204} {"train_loss": -4.910699844360352, "global_step": 8598, "epoch": 204} {"train_loss": -4.931741714477539, "global_step": 8599, "epoch": 204} {"train_loss": -4.892788887023926, "global_step": 8600, "epoch": 204} {"train_loss": -4.823432445526123, "global_step": 8601, "epoch": 204} {"train_loss": -4.968935966491699, "global_step": 8602, "epoch": 204} {"train_loss": -4.9572978019714355, "global_step": 8603, "epoch": 204} {"train_loss": -4.980427265167236, "global_step": 8604, "epoch": 204} {"train_loss": -4.904187202453613, "global_step": 8605, "epoch": 204} {"train_loss": -4.926987648010254, "global_step": 8606, "epoch": 204} {"train_loss": -4.9868083000183105, "global_step": 8607, "epoch": 204} {"train_loss": -4.960882186889648, "global_step": 8608, "epoch": 204} {"train_loss": -4.992349590573992, "global_step": 8609, "epoch": 204, "val_loss": 80360.8515625} {"train_loss": -4.9219255447387695, "global_step": 8610, "epoch": 205} {"train_loss": -4.944327354431152, "global_step": 8611, "epoch": 205} {"train_loss": -4.8580708503723145, "global_step": 8612, "epoch": 205} {"train_loss": -4.896205902099609, "global_step": 8613, "epoch": 205} {"train_loss": -5.016602993011475, "global_step": 8614, "epoch": 205} {"train_loss": -5.002445220947266, "global_step": 8615, "epoch": 205} {"train_loss": -5.034001350402832, "global_step": 8616, "epoch": 205} {"train_loss": -5.075473785400391, "global_step": 8617, "epoch": 205} {"train_loss": -5.09318208694458, "global_step": 8618, "epoch": 205} {"train_loss": -4.952199459075928, "global_step": 8619, "epoch": 205} {"train_loss": -4.9333391189575195, "global_step": 8620, "epoch": 205} {"train_loss": -4.9453535079956055, "global_step": 8621, "epoch": 205} {"train_loss": -4.934927940368652, "global_step": 8622, "epoch": 205} {"train_loss": -4.9411821365356445, "global_step": 8623, "epoch": 205} {"train_loss": -4.982858180999756, "global_step": 8624, "epoch": 205} {"train_loss": -4.88059139251709, "global_step": 8625, "epoch": 205} {"train_loss": -4.969028472900391, "global_step": 8626, "epoch": 205} {"train_loss": -5.007272243499756, "global_step": 8627, "epoch": 205} {"train_loss": -4.82701301574707, "global_step": 8628, "epoch": 205} {"train_loss": -5.074626445770264, "global_step": 8629, "epoch": 205} {"train_loss": -5.032662868499756, "global_step": 8630, "epoch": 205} {"train_loss": -5.053814888000488, "global_step": 8631, "epoch": 205} {"train_loss": -5.097301006317139, "global_step": 8632, "epoch": 205} {"train_loss": -4.961465835571289, "global_step": 8633, "epoch": 205} {"train_loss": -5.182538032531738, "global_step": 8634, "epoch": 205} {"train_loss": -5.145968914031982, "global_step": 8635, "epoch": 205} {"train_loss": -5.086386203765869, "global_step": 8636, "epoch": 205} {"train_loss": -5.035237789154053, "global_step": 8637, "epoch": 205} {"train_loss": -5.046792030334473, "global_step": 8638, "epoch": 205} {"train_loss": -5.029531478881836, "global_step": 8639, "epoch": 205} {"train_loss": -5.149016380310059, "global_step": 8640, "epoch": 205} {"train_loss": -5.033024787902832, "global_step": 8641, "epoch": 205} {"train_loss": -5.010831356048584, "global_step": 8642, "epoch": 205} {"train_loss": -5.235933780670166, "global_step": 8643, "epoch": 205} {"train_loss": -5.15472412109375, "global_step": 8644, "epoch": 205} {"train_loss": -5.106925010681152, "global_step": 8645, "epoch": 205} {"train_loss": -5.048060417175293, "global_step": 8646, "epoch": 205} {"train_loss": -4.756028175354004, "global_step": 8647, "epoch": 205} {"train_loss": -4.869268417358398, "global_step": 8648, "epoch": 205} {"train_loss": -4.840363502502441, "global_step": 8649, "epoch": 205} {"train_loss": -4.929750919342041, "global_step": 8650, "epoch": 205} {"train_loss": -5.001348404657273, "global_step": 8651, "epoch": 205, "val_loss": 81419.546875} {"train_loss": -5.004865646362305, "global_step": 8652, "epoch": 206} {"train_loss": -5.0509467124938965, "global_step": 8653, "epoch": 206} {"train_loss": -5.0928168296813965, "global_step": 8654, "epoch": 206} {"train_loss": -4.8011322021484375, "global_step": 8655, "epoch": 206} {"train_loss": -5.026439189910889, "global_step": 8656, "epoch": 206} {"train_loss": -4.824517726898193, "global_step": 8657, "epoch": 206} {"train_loss": -4.721526622772217, "global_step": 8658, "epoch": 206} {"train_loss": -5.0587263107299805, "global_step": 8659, "epoch": 206} {"train_loss": -4.738900661468506, "global_step": 8660, "epoch": 206} {"train_loss": -4.959922790527344, "global_step": 8661, "epoch": 206} {"train_loss": -5.006396293640137, "global_step": 8662, "epoch": 206} {"train_loss": -4.637485027313232, "global_step": 8663, "epoch": 206} {"train_loss": -4.974188804626465, "global_step": 8664, "epoch": 206} {"train_loss": -4.758805751800537, "global_step": 8665, "epoch": 206} {"train_loss": -4.888747215270996, "global_step": 8666, "epoch": 206} {"train_loss": -4.729360103607178, "global_step": 8667, "epoch": 206} {"train_loss": -4.95200252532959, "global_step": 8668, "epoch": 206} {"train_loss": -4.908235549926758, "global_step": 8669, "epoch": 206} {"train_loss": -4.894608497619629, "global_step": 8670, "epoch": 206} {"train_loss": -5.0390729904174805, "global_step": 8671, "epoch": 206} {"train_loss": -4.905184745788574, "global_step": 8672, "epoch": 206} {"train_loss": -4.976520538330078, "global_step": 8673, "epoch": 206} {"train_loss": -4.972226142883301, "global_step": 8674, "epoch": 206} {"train_loss": -4.916567802429199, "global_step": 8675, "epoch": 206} {"train_loss": -4.91642951965332, "global_step": 8676, "epoch": 206} {"train_loss": -4.873873710632324, "global_step": 8677, "epoch": 206} {"train_loss": -4.969710350036621, "global_step": 8678, "epoch": 206} {"train_loss": -5.037327766418457, "global_step": 8679, "epoch": 206} {"train_loss": -5.008081436157227, "global_step": 8680, "epoch": 206} {"train_loss": -4.932991027832031, "global_step": 8681, "epoch": 206} {"train_loss": -4.866507530212402, "global_step": 8682, "epoch": 206} {"train_loss": -5.120465278625488, "global_step": 8683, "epoch": 206} {"train_loss": -4.983582973480225, "global_step": 8684, "epoch": 206} {"train_loss": -4.977822303771973, "global_step": 8685, "epoch": 206} {"train_loss": -5.080604553222656, "global_step": 8686, "epoch": 206} {"train_loss": -5.1172566413879395, "global_step": 8687, "epoch": 206} {"train_loss": -5.005293846130371, "global_step": 8688, "epoch": 206} {"train_loss": -5.0887770652771, "global_step": 8689, "epoch": 206} {"train_loss": -4.973936080932617, "global_step": 8690, "epoch": 206} {"train_loss": -5.2164154052734375, "global_step": 8691, "epoch": 206} {"train_loss": -5.001858711242676, "global_step": 8692, "epoch": 206} {"train_loss": -4.953145265579224, "global_step": 8693, "epoch": 206, "val_loss": 80049.7890625} {"train_loss": -4.948236465454102, "global_step": 8694, "epoch": 207} {"train_loss": -5.050411224365234, "global_step": 8695, "epoch": 207} {"train_loss": -5.024140357971191, "global_step": 8696, "epoch": 207} {"train_loss": -4.928164005279541, "global_step": 8697, "epoch": 207} {"train_loss": -5.0709333419799805, "global_step": 8698, "epoch": 207} {"train_loss": -4.971141338348389, "global_step": 8699, "epoch": 207} {"train_loss": -4.972021102905273, "global_step": 8700, "epoch": 207} {"train_loss": -4.8873138427734375, "global_step": 8701, "epoch": 207} {"train_loss": -4.9581451416015625, "global_step": 8702, "epoch": 207} {"train_loss": -5.074863433837891, "global_step": 8703, "epoch": 207} {"train_loss": -4.873566627502441, "global_step": 8704, "epoch": 207} {"train_loss": -4.870571136474609, "global_step": 8705, "epoch": 207} {"train_loss": -4.869619846343994, "global_step": 8706, "epoch": 207} {"train_loss": -5.044377326965332, "global_step": 8707, "epoch": 207} {"train_loss": -4.8905134201049805, "global_step": 8708, "epoch": 207} {"train_loss": -4.991451263427734, "global_step": 8709, "epoch": 207} {"train_loss": -4.786630153656006, "global_step": 8710, "epoch": 207} {"train_loss": -5.008490562438965, "global_step": 8711, "epoch": 207} {"train_loss": -4.880874156951904, "global_step": 8712, "epoch": 207} {"train_loss": -4.759057998657227, "global_step": 8713, "epoch": 207} {"train_loss": -4.759709358215332, "global_step": 8714, "epoch": 207} {"train_loss": -5.029057025909424, "global_step": 8715, "epoch": 207} {"train_loss": -4.935718536376953, "global_step": 8716, "epoch": 207} {"train_loss": -4.996849060058594, "global_step": 8717, "epoch": 207} {"train_loss": -4.826614856719971, "global_step": 8718, "epoch": 207} {"train_loss": -4.887383937835693, "global_step": 8719, "epoch": 207} {"train_loss": -4.860736846923828, "global_step": 8720, "epoch": 207} {"train_loss": -5.01685905456543, "global_step": 8721, "epoch": 207} {"train_loss": -5.012392520904541, "global_step": 8722, "epoch": 207} {"train_loss": -4.9517669677734375, "global_step": 8723, "epoch": 207} {"train_loss": -5.1357598304748535, "global_step": 8724, "epoch": 207} {"train_loss": -4.901830673217773, "global_step": 8725, "epoch": 207} {"train_loss": -4.9770894050598145, "global_step": 8726, "epoch": 207} {"train_loss": -5.110898017883301, "global_step": 8727, "epoch": 207} {"train_loss": -4.96511173248291, "global_step": 8728, "epoch": 207} {"train_loss": -5.016355991363525, "global_step": 8729, "epoch": 207} {"train_loss": -4.865448951721191, "global_step": 8730, "epoch": 207} {"train_loss": -4.959756851196289, "global_step": 8731, "epoch": 207} {"train_loss": -4.991255760192871, "global_step": 8732, "epoch": 207} {"train_loss": -4.996944427490234, "global_step": 8733, "epoch": 207} {"train_loss": -5.066636085510254, "global_step": 8734, "epoch": 207} {"train_loss": -4.956749053228469, "global_step": 8735, "epoch": 207, "val_loss": 80305.8984375} {"train_loss": -5.040608882904053, "global_step": 8736, "epoch": 208} {"train_loss": -4.994394302368164, "global_step": 8737, "epoch": 208} {"train_loss": -5.137032985687256, "global_step": 8738, "epoch": 208} {"train_loss": -5.0282158851623535, "global_step": 8739, "epoch": 208} {"train_loss": -5.153084754943848, "global_step": 8740, "epoch": 208} {"train_loss": -5.080432891845703, "global_step": 8741, "epoch": 208} {"train_loss": -4.949782371520996, "global_step": 8742, "epoch": 208} {"train_loss": -4.8300981521606445, "global_step": 8743, "epoch": 208} {"train_loss": -5.0056233406066895, "global_step": 8744, "epoch": 208} {"train_loss": -5.125919342041016, "global_step": 8745, "epoch": 208} {"train_loss": -5.0262861251831055, "global_step": 8746, "epoch": 208} {"train_loss": -5.16895055770874, "global_step": 8747, "epoch": 208} {"train_loss": -4.950918197631836, "global_step": 8748, "epoch": 208} {"train_loss": -5.0003156661987305, "global_step": 8749, "epoch": 208} {"train_loss": -4.974645614624023, "global_step": 8750, "epoch": 208} {"train_loss": -5.077661037445068, "global_step": 8751, "epoch": 208} {"train_loss": -5.040037631988525, "global_step": 8752, "epoch": 208} {"train_loss": -4.996372222900391, "global_step": 8753, "epoch": 208} {"train_loss": -5.021580219268799, "global_step": 8754, "epoch": 208} {"train_loss": -4.854058265686035, "global_step": 8755, "epoch": 208} {"train_loss": -5.0631303787231445, "global_step": 8756, "epoch": 208} {"train_loss": -5.081296443939209, "global_step": 8757, "epoch": 208} {"train_loss": -5.031679630279541, "global_step": 8758, "epoch": 208} {"train_loss": -5.082029819488525, "global_step": 8759, "epoch": 208} {"train_loss": -5.000262260437012, "global_step": 8760, "epoch": 208} {"train_loss": -4.957249164581299, "global_step": 8761, "epoch": 208} {"train_loss": -4.998164176940918, "global_step": 8762, "epoch": 208} {"train_loss": -4.96480131149292, "global_step": 8763, "epoch": 208} {"train_loss": -4.935088157653809, "global_step": 8764, "epoch": 208} {"train_loss": -4.963858604431152, "global_step": 8765, "epoch": 208} {"train_loss": -4.954903602600098, "global_step": 8766, "epoch": 208} {"train_loss": -4.865816593170166, "global_step": 8767, "epoch": 208} {"train_loss": -4.963202953338623, "global_step": 8768, "epoch": 208} {"train_loss": -5.026379108428955, "global_step": 8769, "epoch": 208} {"train_loss": -4.868448257446289, "global_step": 8770, "epoch": 208} {"train_loss": -4.982501983642578, "global_step": 8771, "epoch": 208} {"train_loss": -5.055364608764648, "global_step": 8772, "epoch": 208} {"train_loss": -4.826259613037109, "global_step": 8773, "epoch": 208} {"train_loss": -5.121100425720215, "global_step": 8774, "epoch": 208} {"train_loss": -4.975401878356934, "global_step": 8775, "epoch": 208} {"train_loss": -4.84005880355835, "global_step": 8776, "epoch": 208} {"train_loss": -4.997162614549909, "global_step": 8777, "epoch": 208, "val_loss": 80016.828125} {"train_loss": -5.020415306091309, "global_step": 8778, "epoch": 209} {"train_loss": -5.006908893585205, "global_step": 8779, "epoch": 209} {"train_loss": -5.020357608795166, "global_step": 8780, "epoch": 209} {"train_loss": -4.854668617248535, "global_step": 8781, "epoch": 209} {"train_loss": -5.045769691467285, "global_step": 8782, "epoch": 209} {"train_loss": -5.130216598510742, "global_step": 8783, "epoch": 209} {"train_loss": -4.993074417114258, "global_step": 8784, "epoch": 209} {"train_loss": -5.140972137451172, "global_step": 8785, "epoch": 209} {"train_loss": -5.002608299255371, "global_step": 8786, "epoch": 209} {"train_loss": -4.84304141998291, "global_step": 8787, "epoch": 209} {"train_loss": -5.009315490722656, "global_step": 8788, "epoch": 209} {"train_loss": -4.974246025085449, "global_step": 8789, "epoch": 209} {"train_loss": -4.76057243347168, "global_step": 8790, "epoch": 209} {"train_loss": -5.050446510314941, "global_step": 8791, "epoch": 209} {"train_loss": -5.114178657531738, "global_step": 8792, "epoch": 209} {"train_loss": -4.936431884765625, "global_step": 8793, "epoch": 209} {"train_loss": -4.97552490234375, "global_step": 8794, "epoch": 209} {"train_loss": -4.978139400482178, "global_step": 8795, "epoch": 209} {"train_loss": -4.985832214355469, "global_step": 8796, "epoch": 209} {"train_loss": -4.95175838470459, "global_step": 8797, "epoch": 209} {"train_loss": -4.988552570343018, "global_step": 8798, "epoch": 209} {"train_loss": -5.049967288970947, "global_step": 8799, "epoch": 209} {"train_loss": -5.000176906585693, "global_step": 8800, "epoch": 209} {"train_loss": -5.017393112182617, "global_step": 8801, "epoch": 209} {"train_loss": -4.9789323806762695, "global_step": 8802, "epoch": 209} {"train_loss": -4.994516849517822, "global_step": 8803, "epoch": 209} {"train_loss": -4.918295860290527, "global_step": 8804, "epoch": 209} {"train_loss": -5.080681800842285, "global_step": 8805, "epoch": 209} {"train_loss": -4.998777389526367, "global_step": 8806, "epoch": 209} {"train_loss": -4.976302623748779, "global_step": 8807, "epoch": 209} {"train_loss": -5.172884464263916, "global_step": 8808, "epoch": 209} {"train_loss": -5.056075572967529, "global_step": 8809, "epoch": 209} {"train_loss": -4.911405563354492, "global_step": 8810, "epoch": 209} {"train_loss": -5.067739486694336, "global_step": 8811, "epoch": 209} {"train_loss": -4.924386024475098, "global_step": 8812, "epoch": 209} {"train_loss": -5.021823883056641, "global_step": 8813, "epoch": 209} {"train_loss": -5.1757636070251465, "global_step": 8814, "epoch": 209} {"train_loss": -4.881888389587402, "global_step": 8815, "epoch": 209} {"train_loss": -4.9519243240356445, "global_step": 8816, "epoch": 209} {"train_loss": -5.020541667938232, "global_step": 8817, "epoch": 209} {"train_loss": -4.943234920501709, "global_step": 8818, "epoch": 209} {"train_loss": -4.9981952621823265, "global_step": 8819, "epoch": 209, "val_loss": 80457.46875} {"train_loss": -5.052919864654541, "global_step": 8820, "epoch": 210} {"train_loss": -4.955742359161377, "global_step": 8821, "epoch": 210} {"train_loss": -4.877532958984375, "global_step": 8822, "epoch": 210} {"train_loss": -5.0455708503723145, "global_step": 8823, "epoch": 210} {"train_loss": -4.97782564163208, "global_step": 8824, "epoch": 210} {"train_loss": -4.880153179168701, "global_step": 8825, "epoch": 210} {"train_loss": -5.054047584533691, "global_step": 8826, "epoch": 210} {"train_loss": -4.837602138519287, "global_step": 8827, "epoch": 210} {"train_loss": -5.0828399658203125, "global_step": 8828, "epoch": 210} {"train_loss": -4.917503356933594, "global_step": 8829, "epoch": 210} {"train_loss": -4.862065315246582, "global_step": 8830, "epoch": 210} {"train_loss": -5.202020168304443, "global_step": 8831, "epoch": 210} {"train_loss": -4.981267929077148, "global_step": 8832, "epoch": 210} {"train_loss": -4.959893226623535, "global_step": 8833, "epoch": 210} {"train_loss": -5.042635440826416, "global_step": 8834, "epoch": 210} {"train_loss": -4.980744361877441, "global_step": 8835, "epoch": 210} {"train_loss": -4.982958793640137, "global_step": 8836, "epoch": 210} {"train_loss": -5.124998092651367, "global_step": 8837, "epoch": 210} {"train_loss": -5.089168071746826, "global_step": 8838, "epoch": 210} {"train_loss": -4.8967742919921875, "global_step": 8839, "epoch": 210} {"train_loss": -5.142807960510254, "global_step": 8840, "epoch": 210} {"train_loss": -5.004316329956055, "global_step": 8841, "epoch": 210} {"train_loss": -5.0364298820495605, "global_step": 8842, "epoch": 210} {"train_loss": -5.1379523277282715, "global_step": 8843, "epoch": 210} {"train_loss": -5.015356063842773, "global_step": 8844, "epoch": 210} {"train_loss": -4.985092639923096, "global_step": 8845, "epoch": 210} {"train_loss": -5.183469772338867, "global_step": 8846, "epoch": 210} {"train_loss": -5.014163494110107, "global_step": 8847, "epoch": 210} {"train_loss": -5.138110160827637, "global_step": 8848, "epoch": 210} {"train_loss": -5.023982048034668, "global_step": 8849, "epoch": 210} {"train_loss": -5.005742073059082, "global_step": 8850, "epoch": 210} {"train_loss": -5.092687129974365, "global_step": 8851, "epoch": 210} {"train_loss": -5.03518009185791, "global_step": 8852, "epoch": 210} {"train_loss": -5.157431125640869, "global_step": 8853, "epoch": 210} {"train_loss": -5.065803527832031, "global_step": 8854, "epoch": 210} {"train_loss": -4.985361576080322, "global_step": 8855, "epoch": 210} {"train_loss": -4.935474395751953, "global_step": 8856, "epoch": 210} {"train_loss": -4.981400489807129, "global_step": 8857, "epoch": 210} {"train_loss": -5.044550895690918, "global_step": 8858, "epoch": 210} {"train_loss": -5.053855895996094, "global_step": 8859, "epoch": 210} {"train_loss": -4.956742763519287, "global_step": 8860, "epoch": 210} {"train_loss": -5.0212595122201105, "global_step": 8861, "epoch": 210, "val_loss": 80347.90625} {"train_loss": -4.920197010040283, "global_step": 8862, "epoch": 211} {"train_loss": -5.077596664428711, "global_step": 8863, "epoch": 211} {"train_loss": -5.063960075378418, "global_step": 8864, "epoch": 211} {"train_loss": -4.98422908782959, "global_step": 8865, "epoch": 211} {"train_loss": -4.8625288009643555, "global_step": 8866, "epoch": 211} {"train_loss": -5.013930797576904, "global_step": 8867, "epoch": 211} {"train_loss": -4.836856365203857, "global_step": 8868, "epoch": 211} {"train_loss": -4.9577531814575195, "global_step": 8869, "epoch": 211} {"train_loss": -5.04078483581543, "global_step": 8870, "epoch": 211} {"train_loss": -5.122751235961914, "global_step": 8871, "epoch": 211} {"train_loss": -5.050120830535889, "global_step": 8872, "epoch": 211} {"train_loss": -5.114497661590576, "global_step": 8873, "epoch": 211} {"train_loss": -5.205395698547363, "global_step": 8874, "epoch": 211} {"train_loss": -4.769950866699219, "global_step": 8875, "epoch": 211} {"train_loss": -4.8764543533325195, "global_step": 8876, "epoch": 211} {"train_loss": -4.890768051147461, "global_step": 8877, "epoch": 211} {"train_loss": -4.893661975860596, "global_step": 8878, "epoch": 211} {"train_loss": -4.959453105926514, "global_step": 8879, "epoch": 211} {"train_loss": -5.100492477416992, "global_step": 8880, "epoch": 211} {"train_loss": -4.907927989959717, "global_step": 8881, "epoch": 211} {"train_loss": -4.9872355461120605, "global_step": 8882, "epoch": 211} {"train_loss": -4.932949542999268, "global_step": 8883, "epoch": 211} {"train_loss": -4.951307773590088, "global_step": 8884, "epoch": 211} {"train_loss": -5.08687686920166, "global_step": 8885, "epoch": 211} {"train_loss": -4.947441101074219, "global_step": 8886, "epoch": 211} {"train_loss": -4.963397026062012, "global_step": 8887, "epoch": 211} {"train_loss": -5.078400611877441, "global_step": 8888, "epoch": 211} {"train_loss": -4.991540908813477, "global_step": 8889, "epoch": 211} {"train_loss": -5.002191543579102, "global_step": 8890, "epoch": 211} {"train_loss": -5.177504539489746, "global_step": 8891, "epoch": 211} {"train_loss": -4.981907844543457, "global_step": 8892, "epoch": 211} {"train_loss": -5.020922660827637, "global_step": 8893, "epoch": 211} {"train_loss": -5.002188682556152, "global_step": 8894, "epoch": 211} {"train_loss": -5.113868236541748, "global_step": 8895, "epoch": 211} {"train_loss": -5.004251480102539, "global_step": 8896, "epoch": 211} {"train_loss": -5.102177619934082, "global_step": 8897, "epoch": 211} {"train_loss": -4.9564971923828125, "global_step": 8898, "epoch": 211} {"train_loss": -5.07620906829834, "global_step": 8899, "epoch": 211} {"train_loss": -4.979247093200684, "global_step": 8900, "epoch": 211} {"train_loss": -4.86219596862793, "global_step": 8901, "epoch": 211} {"train_loss": -5.098076820373535, "global_step": 8902, "epoch": 211} {"train_loss": -4.999654645011539, "global_step": 8903, "epoch": 211, "val_loss": 80406.2421875} {"train_loss": -4.945916652679443, "global_step": 8904, "epoch": 212} {"train_loss": -5.124809741973877, "global_step": 8905, "epoch": 212} {"train_loss": -4.85579252243042, "global_step": 8906, "epoch": 212} {"train_loss": -5.089568138122559, "global_step": 8907, "epoch": 212} {"train_loss": -5.016449928283691, "global_step": 8908, "epoch": 212} {"train_loss": -4.861934661865234, "global_step": 8909, "epoch": 212} {"train_loss": -5.1278862953186035, "global_step": 8910, "epoch": 212} {"train_loss": -4.957163333892822, "global_step": 8911, "epoch": 212} {"train_loss": -4.836565017700195, "global_step": 8912, "epoch": 212} {"train_loss": -5.077998161315918, "global_step": 8913, "epoch": 212} {"train_loss": -4.919682502746582, "global_step": 8914, "epoch": 212} {"train_loss": -4.964915752410889, "global_step": 8915, "epoch": 212} {"train_loss": -5.1033935546875, "global_step": 8916, "epoch": 212} {"train_loss": -5.014339923858643, "global_step": 8917, "epoch": 212} {"train_loss": -5.058899402618408, "global_step": 8918, "epoch": 212} {"train_loss": -5.040430068969727, "global_step": 8919, "epoch": 212} {"train_loss": -4.974181175231934, "global_step": 8920, "epoch": 212} {"train_loss": -5.069548606872559, "global_step": 8921, "epoch": 212} {"train_loss": -5.115872383117676, "global_step": 8922, "epoch": 212} {"train_loss": -4.964123249053955, "global_step": 8923, "epoch": 212} {"train_loss": -4.931888103485107, "global_step": 8924, "epoch": 212} {"train_loss": -4.902644157409668, "global_step": 8925, "epoch": 212} {"train_loss": -4.904863357543945, "global_step": 8926, "epoch": 212} {"train_loss": -4.976847171783447, "global_step": 8927, "epoch": 212} {"train_loss": -4.84665060043335, "global_step": 8928, "epoch": 212} {"train_loss": -4.960278034210205, "global_step": 8929, "epoch": 212} {"train_loss": -5.039407253265381, "global_step": 8930, "epoch": 212} {"train_loss": -5.015014171600342, "global_step": 8931, "epoch": 212} {"train_loss": -5.090198993682861, "global_step": 8932, "epoch": 212} {"train_loss": -5.04656982421875, "global_step": 8933, "epoch": 212} {"train_loss": -5.022722244262695, "global_step": 8934, "epoch": 212} {"train_loss": -5.064279556274414, "global_step": 8935, "epoch": 212} {"train_loss": -5.118332386016846, "global_step": 8936, "epoch": 212} {"train_loss": -4.934361457824707, "global_step": 8937, "epoch": 212} {"train_loss": -4.995523929595947, "global_step": 8938, "epoch": 212} {"train_loss": -4.909540176391602, "global_step": 8939, "epoch": 212} {"train_loss": -4.8927812576293945, "global_step": 8940, "epoch": 212} {"train_loss": -4.951511859893799, "global_step": 8941, "epoch": 212} {"train_loss": -5.121730804443359, "global_step": 8942, "epoch": 212} {"train_loss": -5.120421409606934, "global_step": 8943, "epoch": 212} {"train_loss": -5.078176975250244, "global_step": 8944, "epoch": 212} {"train_loss": -5.00285656111581, "global_step": 8945, "epoch": 212, "val_loss": 79706.984375} {"train_loss": -4.9887471199035645, "global_step": 8946, "epoch": 213} {"train_loss": -4.932952880859375, "global_step": 8947, "epoch": 213} {"train_loss": -4.995521068572998, "global_step": 8948, "epoch": 213} {"train_loss": -5.153102397918701, "global_step": 8949, "epoch": 213} {"train_loss": -5.108119964599609, "global_step": 8950, "epoch": 213} {"train_loss": -5.050389289855957, "global_step": 8951, "epoch": 213} {"train_loss": -4.979307651519775, "global_step": 8952, "epoch": 213} {"train_loss": -5.094045639038086, "global_step": 8953, "epoch": 213} {"train_loss": -5.0544962882995605, "global_step": 8954, "epoch": 213} {"train_loss": -4.9317731857299805, "global_step": 8955, "epoch": 213} {"train_loss": -4.989704132080078, "global_step": 8956, "epoch": 213} {"train_loss": -4.965277194976807, "global_step": 8957, "epoch": 213} {"train_loss": -5.153966426849365, "global_step": 8958, "epoch": 213} {"train_loss": -5.202070236206055, "global_step": 8959, "epoch": 213} {"train_loss": -5.144828796386719, "global_step": 8960, "epoch": 213} {"train_loss": -4.965668678283691, "global_step": 8961, "epoch": 213} {"train_loss": -4.938080787658691, "global_step": 8962, "epoch": 213} {"train_loss": -5.1040358543396, "global_step": 8963, "epoch": 213} {"train_loss": -4.828961372375488, "global_step": 8964, "epoch": 213} {"train_loss": -5.04560661315918, "global_step": 8965, "epoch": 213} {"train_loss": -4.894706726074219, "global_step": 8966, "epoch": 213} {"train_loss": -5.145035743713379, "global_step": 8967, "epoch": 213} {"train_loss": -4.805884838104248, "global_step": 8968, "epoch": 213} {"train_loss": -4.94003963470459, "global_step": 8969, "epoch": 213} {"train_loss": -4.867293357849121, "global_step": 8970, "epoch": 213} {"train_loss": -4.733558654785156, "global_step": 8971, "epoch": 213} {"train_loss": -5.012519836425781, "global_step": 8972, "epoch": 213} {"train_loss": -4.7597808837890625, "global_step": 8973, "epoch": 213} {"train_loss": -4.947547912597656, "global_step": 8974, "epoch": 213} {"train_loss": -4.763692855834961, "global_step": 8975, "epoch": 213} {"train_loss": -4.8755645751953125, "global_step": 8976, "epoch": 213} {"train_loss": -5.16855525970459, "global_step": 8977, "epoch": 213} {"train_loss": -4.906717777252197, "global_step": 8978, "epoch": 213} {"train_loss": -4.844371795654297, "global_step": 8979, "epoch": 213} {"train_loss": -4.849145889282227, "global_step": 8980, "epoch": 213} {"train_loss": -4.834926605224609, "global_step": 8981, "epoch": 213} {"train_loss": -5.01082706451416, "global_step": 8982, "epoch": 213} {"train_loss": -5.051845550537109, "global_step": 8983, "epoch": 213} {"train_loss": -4.944794654846191, "global_step": 8984, "epoch": 213} {"train_loss": -4.873817443847656, "global_step": 8985, "epoch": 213} {"train_loss": -4.994199752807617, "global_step": 8986, "epoch": 213} {"train_loss": -4.970915272122338, "global_step": 8987, "epoch": 213, "val_loss": 79773.1640625} {"train_loss": -5.168445110321045, "global_step": 8988, "epoch": 214} {"train_loss": -4.865993022918701, "global_step": 8989, "epoch": 214} {"train_loss": -5.001804351806641, "global_step": 8990, "epoch": 214} {"train_loss": -4.933749675750732, "global_step": 8991, "epoch": 214} {"train_loss": -5.21754264831543, "global_step": 8992, "epoch": 214} {"train_loss": -4.888577461242676, "global_step": 8993, "epoch": 214} {"train_loss": -5.028048515319824, "global_step": 8994, "epoch": 214} {"train_loss": -4.960566997528076, "global_step": 8995, "epoch": 214} {"train_loss": -4.945890426635742, "global_step": 8996, "epoch": 214} {"train_loss": -4.916138172149658, "global_step": 8997, "epoch": 214} {"train_loss": -4.97430419921875, "global_step": 8998, "epoch": 214} {"train_loss": -4.967381477355957, "global_step": 8999, "epoch": 214} {"train_loss": -4.662946701049805, "global_step": 9000, "epoch": 214} {"train_loss": -5.019768714904785, "global_step": 9001, "epoch": 214} {"train_loss": -4.837919235229492, "global_step": 9002, "epoch": 214} {"train_loss": -4.847807884216309, "global_step": 9003, "epoch": 214} {"train_loss": -5.093141555786133, "global_step": 9004, "epoch": 214} {"train_loss": -4.815128326416016, "global_step": 9005, "epoch": 214} {"train_loss": -4.923110485076904, "global_step": 9006, "epoch": 214} {"train_loss": -4.897934913635254, "global_step": 9007, "epoch": 214} {"train_loss": -4.873678207397461, "global_step": 9008, "epoch": 214} {"train_loss": -5.0337677001953125, "global_step": 9009, "epoch": 214} {"train_loss": -4.8842573165893555, "global_step": 9010, "epoch": 214} {"train_loss": -4.987619400024414, "global_step": 9011, "epoch": 214} {"train_loss": -4.930569171905518, "global_step": 9012, "epoch": 214} {"train_loss": -4.992751121520996, "global_step": 9013, "epoch": 214} {"train_loss": -5.091165542602539, "global_step": 9014, "epoch": 214} {"train_loss": -4.9655232429504395, "global_step": 9015, "epoch": 214} {"train_loss": -5.084224224090576, "global_step": 9016, "epoch": 214} {"train_loss": -5.047538757324219, "global_step": 9017, "epoch": 214} {"train_loss": -5.023144721984863, "global_step": 9018, "epoch": 214} {"train_loss": -5.017655372619629, "global_step": 9019, "epoch": 214} {"train_loss": -5.005031108856201, "global_step": 9020, "epoch": 214} {"train_loss": -5.051060676574707, "global_step": 9021, "epoch": 214} {"train_loss": -4.965066909790039, "global_step": 9022, "epoch": 214} {"train_loss": -4.997076988220215, "global_step": 9023, "epoch": 214} {"train_loss": -5.063854217529297, "global_step": 9024, "epoch": 214} {"train_loss": -4.932445526123047, "global_step": 9025, "epoch": 214} {"train_loss": -5.0625176429748535, "global_step": 9026, "epoch": 214} {"train_loss": -4.99812650680542, "global_step": 9027, "epoch": 214} {"train_loss": -5.043951988220215, "global_step": 9028, "epoch": 214} {"train_loss": -4.978797674179077, "global_step": 9029, "epoch": 214, "val_loss": 79719.609375} {"train_loss": -5.045703411102295, "global_step": 9030, "epoch": 215} {"train_loss": -5.040688991546631, "global_step": 9031, "epoch": 215} {"train_loss": -5.0287065505981445, "global_step": 9032, "epoch": 215} {"train_loss": -4.995033264160156, "global_step": 9033, "epoch": 215} {"train_loss": -4.999714374542236, "global_step": 9034, "epoch": 215} {"train_loss": -5.080909252166748, "global_step": 9035, "epoch": 215} {"train_loss": -5.023687839508057, "global_step": 9036, "epoch": 215} {"train_loss": -4.940807342529297, "global_step": 9037, "epoch": 215} {"train_loss": -4.908669948577881, "global_step": 9038, "epoch": 215} {"train_loss": -4.998258590698242, "global_step": 9039, "epoch": 215} {"train_loss": -4.84975528717041, "global_step": 9040, "epoch": 215} {"train_loss": -4.971041679382324, "global_step": 9041, "epoch": 215} {"train_loss": -5.020279884338379, "global_step": 9042, "epoch": 215} {"train_loss": -4.989284992218018, "global_step": 9043, "epoch": 215} {"train_loss": -4.986332893371582, "global_step": 9044, "epoch": 215} {"train_loss": -5.046457767486572, "global_step": 9045, "epoch": 215} {"train_loss": -4.885865211486816, "global_step": 9046, "epoch": 215} {"train_loss": -5.050199508666992, "global_step": 9047, "epoch": 215} {"train_loss": -5.128473281860352, "global_step": 9048, "epoch": 215} {"train_loss": -4.969138145446777, "global_step": 9049, "epoch": 215} {"train_loss": -4.989191055297852, "global_step": 9050, "epoch": 215} {"train_loss": -5.02668571472168, "global_step": 9051, "epoch": 215} {"train_loss": -4.846976280212402, "global_step": 9052, "epoch": 215} {"train_loss": -5.113185882568359, "global_step": 9053, "epoch": 215} {"train_loss": -4.861958980560303, "global_step": 9054, "epoch": 215} {"train_loss": -5.101057052612305, "global_step": 9055, "epoch": 215} {"train_loss": -5.101507186889648, "global_step": 9056, "epoch": 215} {"train_loss": -5.023313999176025, "global_step": 9057, "epoch": 215} {"train_loss": -5.037952423095703, "global_step": 9058, "epoch": 215} {"train_loss": -5.044754981994629, "global_step": 9059, "epoch": 215} {"train_loss": -5.019457817077637, "global_step": 9060, "epoch": 215} {"train_loss": -5.022477149963379, "global_step": 9061, "epoch": 215} {"train_loss": -4.961997985839844, "global_step": 9062, "epoch": 215} {"train_loss": -5.165713787078857, "global_step": 9063, "epoch": 215} {"train_loss": -4.981799602508545, "global_step": 9064, "epoch": 215} {"train_loss": -5.1372880935668945, "global_step": 9065, "epoch": 215} {"train_loss": -4.986701011657715, "global_step": 9066, "epoch": 215} {"train_loss": -5.026839733123779, "global_step": 9067, "epoch": 215} {"train_loss": -5.082944869995117, "global_step": 9068, "epoch": 215} {"train_loss": -4.995616436004639, "global_step": 9069, "epoch": 215} {"train_loss": -5.0712127685546875, "global_step": 9070, "epoch": 215} {"train_loss": -5.016599087488084, "global_step": 9071, "epoch": 215, "val_loss": 79121.8984375} {"train_loss": -5.015824317932129, "global_step": 9072, "epoch": 216} {"train_loss": -5.122021198272705, "global_step": 9073, "epoch": 216} {"train_loss": -5.123169898986816, "global_step": 9074, "epoch": 216} {"train_loss": -4.934609413146973, "global_step": 9075, "epoch": 216} {"train_loss": -5.00413703918457, "global_step": 9076, "epoch": 216} {"train_loss": -5.025329113006592, "global_step": 9077, "epoch": 216} {"train_loss": -5.165555953979492, "global_step": 9078, "epoch": 216} {"train_loss": -5.09470796585083, "global_step": 9079, "epoch": 216} {"train_loss": -5.000648498535156, "global_step": 9080, "epoch": 216} {"train_loss": -4.9261016845703125, "global_step": 9081, "epoch": 216} {"train_loss": -5.1206159591674805, "global_step": 9082, "epoch": 216} {"train_loss": -5.2840576171875, "global_step": 9083, "epoch": 216} {"train_loss": -5.034205436706543, "global_step": 9084, "epoch": 216} {"train_loss": -5.18083381652832, "global_step": 9085, "epoch": 216} {"train_loss": -5.122254371643066, "global_step": 9086, "epoch": 216} {"train_loss": -4.962580680847168, "global_step": 9087, "epoch": 216} {"train_loss": -5.0724992752075195, "global_step": 9088, "epoch": 216} {"train_loss": -5.060379505157471, "global_step": 9089, "epoch": 216} {"train_loss": -5.111662864685059, "global_step": 9090, "epoch": 216} {"train_loss": -5.101810455322266, "global_step": 9091, "epoch": 216} {"train_loss": -5.198461055755615, "global_step": 9092, "epoch": 216} {"train_loss": -5.121912479400635, "global_step": 9093, "epoch": 216} {"train_loss": -5.059941291809082, "global_step": 9094, "epoch": 216} {"train_loss": -4.916149139404297, "global_step": 9095, "epoch": 216} {"train_loss": -5.185531139373779, "global_step": 9096, "epoch": 216} {"train_loss": -5.1392717361450195, "global_step": 9097, "epoch": 216} {"train_loss": -4.9101691246032715, "global_step": 9098, "epoch": 216} {"train_loss": -5.108578681945801, "global_step": 9099, "epoch": 216} {"train_loss": -5.089238166809082, "global_step": 9100, "epoch": 216} {"train_loss": -4.991894245147705, "global_step": 9101, "epoch": 216} {"train_loss": -5.185079097747803, "global_step": 9102, "epoch": 216} {"train_loss": -5.039501190185547, "global_step": 9103, "epoch": 216} {"train_loss": -5.050508499145508, "global_step": 9104, "epoch": 216} {"train_loss": -5.001166343688965, "global_step": 9105, "epoch": 216} {"train_loss": -4.8816728591918945, "global_step": 9106, "epoch": 216} {"train_loss": -5.009625434875488, "global_step": 9107, "epoch": 216} {"train_loss": -5.139638900756836, "global_step": 9108, "epoch": 216} {"train_loss": -4.9774980545043945, "global_step": 9109, "epoch": 216} {"train_loss": -5.014196395874023, "global_step": 9110, "epoch": 216} {"train_loss": -5.076584339141846, "global_step": 9111, "epoch": 216} {"train_loss": -5.241232872009277, "global_step": 9112, "epoch": 216} {"train_loss": -5.066294522512527, "global_step": 9113, "epoch": 216, "val_loss": 80412.9140625} {"train_loss": -5.062363624572754, "global_step": 9114, "epoch": 217} {"train_loss": -4.891377925872803, "global_step": 9115, "epoch": 217} {"train_loss": -4.898179054260254, "global_step": 9116, "epoch": 217} {"train_loss": -5.008145809173584, "global_step": 9117, "epoch": 217} {"train_loss": -4.994671821594238, "global_step": 9118, "epoch": 217} {"train_loss": -4.912405967712402, "global_step": 9119, "epoch": 217} {"train_loss": -4.825819969177246, "global_step": 9120, "epoch": 217} {"train_loss": -4.81813907623291, "global_step": 9121, "epoch": 217} {"train_loss": -5.088531017303467, "global_step": 9122, "epoch": 217} {"train_loss": -4.819486618041992, "global_step": 9123, "epoch": 217} {"train_loss": -4.952178955078125, "global_step": 9124, "epoch": 217} {"train_loss": -5.031799793243408, "global_step": 9125, "epoch": 217} {"train_loss": -4.844692230224609, "global_step": 9126, "epoch": 217} {"train_loss": -4.868644714355469, "global_step": 9127, "epoch": 217} {"train_loss": -4.730581283569336, "global_step": 9128, "epoch": 217} {"train_loss": -4.9551801681518555, "global_step": 9129, "epoch": 217} {"train_loss": -5.046228408813477, "global_step": 9130, "epoch": 217} {"train_loss": -4.704756736755371, "global_step": 9131, "epoch": 217} {"train_loss": -5.102165699005127, "global_step": 9132, "epoch": 217} {"train_loss": -4.681377410888672, "global_step": 9133, "epoch": 217} {"train_loss": -4.941434860229492, "global_step": 9134, "epoch": 217} {"train_loss": -4.885273456573486, "global_step": 9135, "epoch": 217} {"train_loss": -4.978397369384766, "global_step": 9136, "epoch": 217} {"train_loss": -4.966259002685547, "global_step": 9137, "epoch": 217} {"train_loss": -4.977126121520996, "global_step": 9138, "epoch": 217} {"train_loss": -4.874347686767578, "global_step": 9139, "epoch": 217} {"train_loss": -5.025284767150879, "global_step": 9140, "epoch": 217} {"train_loss": -4.9845380783081055, "global_step": 9141, "epoch": 217} {"train_loss": -5.001344680786133, "global_step": 9142, "epoch": 217} {"train_loss": -4.9704365730285645, "global_step": 9143, "epoch": 217} {"train_loss": -5.021402835845947, "global_step": 9144, "epoch": 217} {"train_loss": -5.077651023864746, "global_step": 9145, "epoch": 217} {"train_loss": -5.042801856994629, "global_step": 9146, "epoch": 217} {"train_loss": -4.965686798095703, "global_step": 9147, "epoch": 217} {"train_loss": -5.09110164642334, "global_step": 9148, "epoch": 217} {"train_loss": -4.969442367553711, "global_step": 9149, "epoch": 217} {"train_loss": -4.929793357849121, "global_step": 9150, "epoch": 217} {"train_loss": -5.0412397384643555, "global_step": 9151, "epoch": 217} {"train_loss": -5.126086711883545, "global_step": 9152, "epoch": 217} {"train_loss": -4.9791765213012695, "global_step": 9153, "epoch": 217} {"train_loss": -4.9561767578125, "global_step": 9154, "epoch": 217} {"train_loss": -4.955152318591163, "global_step": 9155, "epoch": 217, "val_loss": 78908.3125} {"train_loss": -5.057709217071533, "global_step": 9156, "epoch": 218} {"train_loss": -4.9701104164123535, "global_step": 9157, "epoch": 218} {"train_loss": -5.0458598136901855, "global_step": 9158, "epoch": 218} {"train_loss": -5.158978462219238, "global_step": 9159, "epoch": 218} {"train_loss": -5.015081405639648, "global_step": 9160, "epoch": 218} {"train_loss": -4.976283550262451, "global_step": 9161, "epoch": 218} {"train_loss": -4.955405235290527, "global_step": 9162, "epoch": 218} {"train_loss": -5.127364635467529, "global_step": 9163, "epoch": 218} {"train_loss": -5.019935607910156, "global_step": 9164, "epoch": 218} {"train_loss": -5.033258438110352, "global_step": 9165, "epoch": 218} {"train_loss": -5.165453910827637, "global_step": 9166, "epoch": 218} {"train_loss": -4.8854217529296875, "global_step": 9167, "epoch": 218} {"train_loss": -4.963127136230469, "global_step": 9168, "epoch": 218} {"train_loss": -5.129229545593262, "global_step": 9169, "epoch": 218} {"train_loss": -5.079936981201172, "global_step": 9170, "epoch": 218} {"train_loss": -5.025109767913818, "global_step": 9171, "epoch": 218} {"train_loss": -5.015557765960693, "global_step": 9172, "epoch": 218} {"train_loss": -5.114130973815918, "global_step": 9173, "epoch": 218} {"train_loss": -5.075485706329346, "global_step": 9174, "epoch": 218} {"train_loss": -5.112489700317383, "global_step": 9175, "epoch": 218} {"train_loss": -4.998496055603027, "global_step": 9176, "epoch": 218} {"train_loss": -5.078606605529785, "global_step": 9177, "epoch": 218} {"train_loss": -4.979214668273926, "global_step": 9178, "epoch": 218} {"train_loss": -5.101025104522705, "global_step": 9179, "epoch": 218} {"train_loss": -5.027924060821533, "global_step": 9180, "epoch": 218} {"train_loss": -5.058311462402344, "global_step": 9181, "epoch": 218} {"train_loss": -4.935291290283203, "global_step": 9182, "epoch": 218} {"train_loss": -5.118241310119629, "global_step": 9183, "epoch": 218} {"train_loss": -5.074408054351807, "global_step": 9184, "epoch": 218} {"train_loss": -5.170689582824707, "global_step": 9185, "epoch": 218} {"train_loss": -5.065571308135986, "global_step": 9186, "epoch": 218} {"train_loss": -4.848557472229004, "global_step": 9187, "epoch": 218} {"train_loss": -5.021816253662109, "global_step": 9188, "epoch": 218} {"train_loss": -5.063233375549316, "global_step": 9189, "epoch": 218} {"train_loss": -4.907161712646484, "global_step": 9190, "epoch": 218} {"train_loss": -5.043155670166016, "global_step": 9191, "epoch": 218} {"train_loss": -5.085198402404785, "global_step": 9192, "epoch": 218} {"train_loss": -5.19959831237793, "global_step": 9193, "epoch": 218} {"train_loss": -5.013175964355469, "global_step": 9194, "epoch": 218} {"train_loss": -5.032204627990723, "global_step": 9195, "epoch": 218} {"train_loss": -5.221412658691406, "global_step": 9196, "epoch": 218} {"train_loss": -5.048950490497408, "global_step": 9197, "epoch": 218, "val_loss": 78973.765625} {"train_loss": -5.12730598449707, "global_step": 9198, "epoch": 219} {"train_loss": -4.950655937194824, "global_step": 9199, "epoch": 219} {"train_loss": -4.975183963775635, "global_step": 9200, "epoch": 219} {"train_loss": -5.0345869064331055, "global_step": 9201, "epoch": 219} {"train_loss": -5.085747718811035, "global_step": 9202, "epoch": 219} {"train_loss": -4.949626922607422, "global_step": 9203, "epoch": 219} {"train_loss": -5.079226016998291, "global_step": 9204, "epoch": 219} {"train_loss": -5.073023796081543, "global_step": 9205, "epoch": 219} {"train_loss": -4.912492752075195, "global_step": 9206, "epoch": 219} {"train_loss": -5.072243690490723, "global_step": 9207, "epoch": 219} {"train_loss": -4.988836765289307, "global_step": 9208, "epoch": 219} {"train_loss": -4.948738098144531, "global_step": 9209, "epoch": 219} {"train_loss": -4.973234176635742, "global_step": 9210, "epoch": 219} {"train_loss": -5.050650596618652, "global_step": 9211, "epoch": 219} {"train_loss": -5.031093597412109, "global_step": 9212, "epoch": 219} {"train_loss": -4.916543483734131, "global_step": 9213, "epoch": 219} {"train_loss": -4.8795671463012695, "global_step": 9214, "epoch": 219} {"train_loss": -5.076830863952637, "global_step": 9215, "epoch": 219} {"train_loss": -4.925417900085449, "global_step": 9216, "epoch": 219} {"train_loss": -5.103989601135254, "global_step": 9217, "epoch": 219} {"train_loss": -4.796422004699707, "global_step": 9218, "epoch": 219} {"train_loss": -5.178462028503418, "global_step": 9219, "epoch": 219} {"train_loss": -4.963262557983398, "global_step": 9220, "epoch": 219} {"train_loss": -4.924191474914551, "global_step": 9221, "epoch": 219} {"train_loss": -5.036371231079102, "global_step": 9222, "epoch": 219} {"train_loss": -4.9633097648620605, "global_step": 9223, "epoch": 219} {"train_loss": -5.076934814453125, "global_step": 9224, "epoch": 219} {"train_loss": -5.088346481323242, "global_step": 9225, "epoch": 219} {"train_loss": -5.105551719665527, "global_step": 9226, "epoch": 219} {"train_loss": -4.9742913246154785, "global_step": 9227, "epoch": 219} {"train_loss": -5.042549133300781, "global_step": 9228, "epoch": 219} {"train_loss": -5.123073577880859, "global_step": 9229, "epoch": 219} {"train_loss": -5.067216396331787, "global_step": 9230, "epoch": 219} {"train_loss": -5.032683372497559, "global_step": 9231, "epoch": 219} {"train_loss": -5.062514781951904, "global_step": 9232, "epoch": 219} {"train_loss": -5.122257232666016, "global_step": 9233, "epoch": 219} {"train_loss": -4.927740573883057, "global_step": 9234, "epoch": 219} {"train_loss": -5.1279296875, "global_step": 9235, "epoch": 219} {"train_loss": -5.125593662261963, "global_step": 9236, "epoch": 219} {"train_loss": -5.0817413330078125, "global_step": 9237, "epoch": 219} {"train_loss": -5.09949254989624, "global_step": 9238, "epoch": 219} {"train_loss": -5.0259346053713845, "global_step": 9239, "epoch": 219, "val_loss": 78791.0546875} {"train_loss": -4.961648941040039, "global_step": 9240, "epoch": 220} {"train_loss": -4.9467902183532715, "global_step": 9241, "epoch": 220} {"train_loss": -5.15635347366333, "global_step": 9242, "epoch": 220} {"train_loss": -5.134987831115723, "global_step": 9243, "epoch": 220} {"train_loss": -4.9636735916137695, "global_step": 9244, "epoch": 220} {"train_loss": -5.138766288757324, "global_step": 9245, "epoch": 220} {"train_loss": -5.026679992675781, "global_step": 9246, "epoch": 220} {"train_loss": -4.9083099365234375, "global_step": 9247, "epoch": 220} {"train_loss": -5.01371955871582, "global_step": 9248, "epoch": 220} {"train_loss": -5.146754264831543, "global_step": 9249, "epoch": 220} {"train_loss": -5.131604194641113, "global_step": 9250, "epoch": 220} {"train_loss": -4.91677188873291, "global_step": 9251, "epoch": 220} {"train_loss": -5.079468727111816, "global_step": 9252, "epoch": 220} {"train_loss": -5.016607284545898, "global_step": 9253, "epoch": 220} {"train_loss": -4.874889373779297, "global_step": 9254, "epoch": 220} {"train_loss": -5.081055641174316, "global_step": 9255, "epoch": 220} {"train_loss": -4.817503929138184, "global_step": 9256, "epoch": 220} {"train_loss": -4.928223609924316, "global_step": 9257, "epoch": 220} {"train_loss": -5.008970260620117, "global_step": 9258, "epoch": 220} {"train_loss": -4.8654279708862305, "global_step": 9259, "epoch": 220} {"train_loss": -4.975499629974365, "global_step": 9260, "epoch": 220} {"train_loss": -4.972932815551758, "global_step": 9261, "epoch": 220} {"train_loss": -5.0153045654296875, "global_step": 9262, "epoch": 220} {"train_loss": -4.893819332122803, "global_step": 9263, "epoch": 220} {"train_loss": -4.911479949951172, "global_step": 9264, "epoch": 220} {"train_loss": -5.146970748901367, "global_step": 9265, "epoch": 220} {"train_loss": -5.021276473999023, "global_step": 9266, "epoch": 220} {"train_loss": -4.981441974639893, "global_step": 9267, "epoch": 220} {"train_loss": -5.055959701538086, "global_step": 9268, "epoch": 220} {"train_loss": -5.135973930358887, "global_step": 9269, "epoch": 220} {"train_loss": -5.144410133361816, "global_step": 9270, "epoch": 220} {"train_loss": -4.890838623046875, "global_step": 9271, "epoch": 220} {"train_loss": -5.0635528564453125, "global_step": 9272, "epoch": 220} {"train_loss": -4.974011421203613, "global_step": 9273, "epoch": 220} {"train_loss": -4.919017791748047, "global_step": 9274, "epoch": 220} {"train_loss": -5.025376319885254, "global_step": 9275, "epoch": 220} {"train_loss": -5.069260120391846, "global_step": 9276, "epoch": 220} {"train_loss": -5.004230499267578, "global_step": 9277, "epoch": 220} {"train_loss": -5.112025737762451, "global_step": 9278, "epoch": 220} {"train_loss": -5.107102394104004, "global_step": 9279, "epoch": 220} {"train_loss": -4.959381103515625, "global_step": 9280, "epoch": 220} {"train_loss": -5.012184074946812, "global_step": 9281, "epoch": 220, "val_loss": 78964.2421875} {"train_loss": -5.0788068771362305, "global_step": 9282, "epoch": 221} {"train_loss": -5.022677898406982, "global_step": 9283, "epoch": 221} {"train_loss": -5.1196088790893555, "global_step": 9284, "epoch": 221} {"train_loss": -5.091294288635254, "global_step": 9285, "epoch": 221} {"train_loss": -5.074345588684082, "global_step": 9286, "epoch": 221} {"train_loss": -5.033332824707031, "global_step": 9287, "epoch": 221} {"train_loss": -5.062215805053711, "global_step": 9288, "epoch": 221} {"train_loss": -5.102293968200684, "global_step": 9289, "epoch": 221} {"train_loss": -4.969770431518555, "global_step": 9290, "epoch": 221} {"train_loss": -5.128499984741211, "global_step": 9291, "epoch": 221} {"train_loss": -5.077188491821289, "global_step": 9292, "epoch": 221} {"train_loss": -5.2031049728393555, "global_step": 9293, "epoch": 221} {"train_loss": -4.975557327270508, "global_step": 9294, "epoch": 221} {"train_loss": -4.989618301391602, "global_step": 9295, "epoch": 221} {"train_loss": -5.080887794494629, "global_step": 9296, "epoch": 221} {"train_loss": -5.014039039611816, "global_step": 9297, "epoch": 221} {"train_loss": -5.098431587219238, "global_step": 9298, "epoch": 221} {"train_loss": -5.05232572555542, "global_step": 9299, "epoch": 221} {"train_loss": -4.970810890197754, "global_step": 9300, "epoch": 221} {"train_loss": -5.037930965423584, "global_step": 9301, "epoch": 221} {"train_loss": -5.128393173217773, "global_step": 9302, "epoch": 221} {"train_loss": -5.125968933105469, "global_step": 9303, "epoch": 221} {"train_loss": -5.190983772277832, "global_step": 9304, "epoch": 221} {"train_loss": -4.864020347595215, "global_step": 9305, "epoch": 221} {"train_loss": -5.001102924346924, "global_step": 9306, "epoch": 221} {"train_loss": -5.080683708190918, "global_step": 9307, "epoch": 221} {"train_loss": -5.0450310707092285, "global_step": 9308, "epoch": 221} {"train_loss": -4.901803016662598, "global_step": 9309, "epoch": 221} {"train_loss": -5.058067798614502, "global_step": 9310, "epoch": 221} {"train_loss": -5.106860637664795, "global_step": 9311, "epoch": 221} {"train_loss": -4.903548240661621, "global_step": 9312, "epoch": 221} {"train_loss": -4.9865922927856445, "global_step": 9313, "epoch": 221} {"train_loss": -4.831995010375977, "global_step": 9314, "epoch": 221} {"train_loss": -4.8442535400390625, "global_step": 9315, "epoch": 221} {"train_loss": -5.199747085571289, "global_step": 9316, "epoch": 221} {"train_loss": -4.944961071014404, "global_step": 9317, "epoch": 221} {"train_loss": -4.975889205932617, "global_step": 9318, "epoch": 221} {"train_loss": -4.969445705413818, "global_step": 9319, "epoch": 221} {"train_loss": -4.838805198669434, "global_step": 9320, "epoch": 221} {"train_loss": -5.0826802253723145, "global_step": 9321, "epoch": 221} {"train_loss": -4.997812747955322, "global_step": 9322, "epoch": 221} {"train_loss": -5.031319288980393, "global_step": 9323, "epoch": 221, "val_loss": 78885.625} {"train_loss": -4.986715793609619, "global_step": 9324, "epoch": 222} {"train_loss": -5.054316520690918, "global_step": 9325, "epoch": 222} {"train_loss": -4.921651363372803, "global_step": 9326, "epoch": 222} {"train_loss": -4.981505393981934, "global_step": 9327, "epoch": 222} {"train_loss": -5.003089904785156, "global_step": 9328, "epoch": 222} {"train_loss": -4.911979675292969, "global_step": 9329, "epoch": 222} {"train_loss": -5.085471153259277, "global_step": 9330, "epoch": 222} {"train_loss": -5.002258777618408, "global_step": 9331, "epoch": 222} {"train_loss": -5.076716423034668, "global_step": 9332, "epoch": 222} {"train_loss": -5.106807231903076, "global_step": 9333, "epoch": 222} {"train_loss": -5.173699378967285, "global_step": 9334, "epoch": 222} {"train_loss": -5.00280237197876, "global_step": 9335, "epoch": 222} {"train_loss": -4.986006736755371, "global_step": 9336, "epoch": 222} {"train_loss": -5.037804126739502, "global_step": 9337, "epoch": 222} {"train_loss": -5.041409015655518, "global_step": 9338, "epoch": 222} {"train_loss": -5.0511345863342285, "global_step": 9339, "epoch": 222} {"train_loss": -5.003115653991699, "global_step": 9340, "epoch": 222} {"train_loss": -5.113391876220703, "global_step": 9341, "epoch": 222} {"train_loss": -5.092756271362305, "global_step": 9342, "epoch": 222} {"train_loss": -5.095769882202148, "global_step": 9343, "epoch": 222} {"train_loss": -5.027324199676514, "global_step": 9344, "epoch": 222} {"train_loss": -5.108103275299072, "global_step": 9345, "epoch": 222} {"train_loss": -5.060891628265381, "global_step": 9346, "epoch": 222} {"train_loss": -5.100404262542725, "global_step": 9347, "epoch": 222} {"train_loss": -5.0424909591674805, "global_step": 9348, "epoch": 222} {"train_loss": -5.1044769287109375, "global_step": 9349, "epoch": 222} {"train_loss": -5.1802659034729, "global_step": 9350, "epoch": 222} {"train_loss": -4.982932090759277, "global_step": 9351, "epoch": 222} {"train_loss": -5.086031913757324, "global_step": 9352, "epoch": 222} {"train_loss": -4.962456703186035, "global_step": 9353, "epoch": 222} {"train_loss": -5.1169023513793945, "global_step": 9354, "epoch": 222} {"train_loss": -5.249320030212402, "global_step": 9355, "epoch": 222} {"train_loss": -5.180064678192139, "global_step": 9356, "epoch": 222} {"train_loss": -5.156123161315918, "global_step": 9357, "epoch": 222} {"train_loss": -4.900290489196777, "global_step": 9358, "epoch": 222} {"train_loss": -5.019092559814453, "global_step": 9359, "epoch": 222} {"train_loss": -5.043731689453125, "global_step": 9360, "epoch": 222} {"train_loss": -4.989396572113037, "global_step": 9361, "epoch": 222} {"train_loss": -4.773454666137695, "global_step": 9362, "epoch": 222} {"train_loss": -4.926977157592773, "global_step": 9363, "epoch": 222} {"train_loss": -4.951267242431641, "global_step": 9364, "epoch": 222} {"train_loss": -5.03443736121768, "global_step": 9365, "epoch": 222, "val_loss": 79068.875} {"train_loss": -5.13306999206543, "global_step": 9366, "epoch": 223} {"train_loss": -4.977985382080078, "global_step": 9367, "epoch": 223} {"train_loss": -4.973731994628906, "global_step": 9368, "epoch": 223} {"train_loss": -4.991944313049316, "global_step": 9369, "epoch": 223} {"train_loss": -4.95632266998291, "global_step": 9370, "epoch": 223} {"train_loss": -5.0369462966918945, "global_step": 9371, "epoch": 223} {"train_loss": -4.90892219543457, "global_step": 9372, "epoch": 223} {"train_loss": -5.080853462219238, "global_step": 9373, "epoch": 223} {"train_loss": -5.0071001052856445, "global_step": 9374, "epoch": 223} {"train_loss": -4.907788276672363, "global_step": 9375, "epoch": 223} {"train_loss": -5.203373908996582, "global_step": 9376, "epoch": 223} {"train_loss": -5.152867794036865, "global_step": 9377, "epoch": 223} {"train_loss": -5.014019012451172, "global_step": 9378, "epoch": 223} {"train_loss": -5.090353012084961, "global_step": 9379, "epoch": 223} {"train_loss": -5.0560808181762695, "global_step": 9380, "epoch": 223} {"train_loss": -5.097592353820801, "global_step": 9381, "epoch": 223} {"train_loss": -5.119022369384766, "global_step": 9382, "epoch": 223} {"train_loss": -4.924816608428955, "global_step": 9383, "epoch": 223} {"train_loss": -5.171091556549072, "global_step": 9384, "epoch": 223} {"train_loss": -5.109642505645752, "global_step": 9385, "epoch": 223} {"train_loss": -4.949697017669678, "global_step": 9386, "epoch": 223} {"train_loss": -5.081794261932373, "global_step": 9387, "epoch": 223} {"train_loss": -5.036899089813232, "global_step": 9388, "epoch": 223} {"train_loss": -5.066733360290527, "global_step": 9389, "epoch": 223} {"train_loss": -5.115555286407471, "global_step": 9390, "epoch": 223} {"train_loss": -5.088611602783203, "global_step": 9391, "epoch": 223} {"train_loss": -5.063081741333008, "global_step": 9392, "epoch": 223} {"train_loss": -5.020396709442139, "global_step": 9393, "epoch": 223} {"train_loss": -5.141408443450928, "global_step": 9394, "epoch": 223} {"train_loss": -5.092613697052002, "global_step": 9395, "epoch": 223} {"train_loss": -5.110787391662598, "global_step": 9396, "epoch": 223} {"train_loss": -5.076328277587891, "global_step": 9397, "epoch": 223} {"train_loss": -5.0807085037231445, "global_step": 9398, "epoch": 223} {"train_loss": -4.986876487731934, "global_step": 9399, "epoch": 223} {"train_loss": -4.9378461837768555, "global_step": 9400, "epoch": 223} {"train_loss": -5.068107604980469, "global_step": 9401, "epoch": 223} {"train_loss": -5.100284576416016, "global_step": 9402, "epoch": 223} {"train_loss": -5.140815734863281, "global_step": 9403, "epoch": 223} {"train_loss": -4.895506381988525, "global_step": 9404, "epoch": 223} {"train_loss": -4.880114555358887, "global_step": 9405, "epoch": 223} {"train_loss": -5.145025730133057, "global_step": 9406, "epoch": 223} {"train_loss": -5.04922832761492, "global_step": 9407, "epoch": 223, "val_loss": 79182.8046875} {"train_loss": -5.159122943878174, "global_step": 9408, "epoch": 224} {"train_loss": -4.785253524780273, "global_step": 9409, "epoch": 224} {"train_loss": -5.00478982925415, "global_step": 9410, "epoch": 224} {"train_loss": -4.987623691558838, "global_step": 9411, "epoch": 224} {"train_loss": -4.733243465423584, "global_step": 9412, "epoch": 224} {"train_loss": -4.85922908782959, "global_step": 9413, "epoch": 224} {"train_loss": -4.67417573928833, "global_step": 9414, "epoch": 224} {"train_loss": -4.997906684875488, "global_step": 9415, "epoch": 224} {"train_loss": -4.847968101501465, "global_step": 9416, "epoch": 224} {"train_loss": -4.797712802886963, "global_step": 9417, "epoch": 224} {"train_loss": -4.904804229736328, "global_step": 9418, "epoch": 224} {"train_loss": -4.962350845336914, "global_step": 9419, "epoch": 224} {"train_loss": -4.844511985778809, "global_step": 9420, "epoch": 224} {"train_loss": -4.909902572631836, "global_step": 9421, "epoch": 224} {"train_loss": -5.0267558097839355, "global_step": 9422, "epoch": 224} {"train_loss": -4.926426410675049, "global_step": 9423, "epoch": 224} {"train_loss": -4.940630912780762, "global_step": 9424, "epoch": 224} {"train_loss": -4.892378807067871, "global_step": 9425, "epoch": 224} {"train_loss": -4.989006042480469, "global_step": 9426, "epoch": 224} {"train_loss": -5.027831077575684, "global_step": 9427, "epoch": 224} {"train_loss": -5.0144853591918945, "global_step": 9428, "epoch": 224} {"train_loss": -4.9844536781311035, "global_step": 9429, "epoch": 224} {"train_loss": -5.01045560836792, "global_step": 9430, "epoch": 224} {"train_loss": -5.068879127502441, "global_step": 9431, "epoch": 224} {"train_loss": -5.211791038513184, "global_step": 9432, "epoch": 224} {"train_loss": -5.118456840515137, "global_step": 9433, "epoch": 224} {"train_loss": -5.119751930236816, "global_step": 9434, "epoch": 224} {"train_loss": -5.079533576965332, "global_step": 9435, "epoch": 224} {"train_loss": -5.1099467277526855, "global_step": 9436, "epoch": 224} {"train_loss": -5.063478469848633, "global_step": 9437, "epoch": 224} {"train_loss": -4.962536811828613, "global_step": 9438, "epoch": 224} {"train_loss": -4.988589763641357, "global_step": 9439, "epoch": 224} {"train_loss": -5.056890487670898, "global_step": 9440, "epoch": 224} {"train_loss": -5.035642147064209, "global_step": 9441, "epoch": 224} {"train_loss": -5.1020355224609375, "global_step": 9442, "epoch": 224} {"train_loss": -4.908560752868652, "global_step": 9443, "epoch": 224} {"train_loss": -5.020659923553467, "global_step": 9444, "epoch": 224} {"train_loss": -5.109479904174805, "global_step": 9445, "epoch": 224} {"train_loss": -5.089167594909668, "global_step": 9446, "epoch": 224} {"train_loss": -4.987339973449707, "global_step": 9447, "epoch": 224} {"train_loss": -5.0982561111450195, "global_step": 9448, "epoch": 224} {"train_loss": -4.98623530069987, "global_step": 9449, "epoch": 224, "val_loss": 78903.0859375} {"train_loss": -4.968448162078857, "global_step": 9450, "epoch": 225} {"train_loss": -5.182345390319824, "global_step": 9451, "epoch": 225} {"train_loss": -4.9669718742370605, "global_step": 9452, "epoch": 225} {"train_loss": -4.88075590133667, "global_step": 9453, "epoch": 225} {"train_loss": -4.916534423828125, "global_step": 9454, "epoch": 225} {"train_loss": -4.927944183349609, "global_step": 9455, "epoch": 225} {"train_loss": -4.969231605529785, "global_step": 9456, "epoch": 225} {"train_loss": -4.940413475036621, "global_step": 9457, "epoch": 225} {"train_loss": -4.966254234313965, "global_step": 9458, "epoch": 225} {"train_loss": -4.890892028808594, "global_step": 9459, "epoch": 225} {"train_loss": -5.105070114135742, "global_step": 9460, "epoch": 225} {"train_loss": -5.010791778564453, "global_step": 9461, "epoch": 225} {"train_loss": -4.926084518432617, "global_step": 9462, "epoch": 225} {"train_loss": -5.039968490600586, "global_step": 9463, "epoch": 225} {"train_loss": -5.144158363342285, "global_step": 9464, "epoch": 225} {"train_loss": -5.108599662780762, "global_step": 9465, "epoch": 225} {"train_loss": -5.209248065948486, "global_step": 9466, "epoch": 225} {"train_loss": -5.0822367668151855, "global_step": 9467, "epoch": 225} {"train_loss": -5.1070756912231445, "global_step": 9468, "epoch": 225} {"train_loss": -4.9931793212890625, "global_step": 9469, "epoch": 225} {"train_loss": -5.0458574295043945, "global_step": 9470, "epoch": 225} {"train_loss": -5.021144866943359, "global_step": 9471, "epoch": 225} {"train_loss": -4.980506896972656, "global_step": 9472, "epoch": 225} {"train_loss": -5.053215980529785, "global_step": 9473, "epoch": 225} {"train_loss": -5.126851558685303, "global_step": 9474, "epoch": 225} {"train_loss": -4.926070690155029, "global_step": 9475, "epoch": 225} {"train_loss": -5.043598175048828, "global_step": 9476, "epoch": 225} {"train_loss": -5.07573127746582, "global_step": 9477, "epoch": 225} {"train_loss": -5.075394630432129, "global_step": 9478, "epoch": 225} {"train_loss": -5.116323471069336, "global_step": 9479, "epoch": 225} {"train_loss": -5.158924102783203, "global_step": 9480, "epoch": 225} {"train_loss": -5.233003616333008, "global_step": 9481, "epoch": 225} {"train_loss": -4.91960334777832, "global_step": 9482, "epoch": 225} {"train_loss": -4.9140400886535645, "global_step": 9483, "epoch": 225} {"train_loss": -4.717972755432129, "global_step": 9484, "epoch": 225} {"train_loss": -4.875230312347412, "global_step": 9485, "epoch": 225} {"train_loss": -4.876633167266846, "global_step": 9486, "epoch": 225} {"train_loss": -5.1424760818481445, "global_step": 9487, "epoch": 225} {"train_loss": -5.108992099761963, "global_step": 9488, "epoch": 225} {"train_loss": -4.8671746253967285, "global_step": 9489, "epoch": 225} {"train_loss": -4.96356201171875, "global_step": 9490, "epoch": 225} {"train_loss": -5.014560472397577, "global_step": 9491, "epoch": 225, "val_loss": 81191.7890625} {"train_loss": -4.828509330749512, "global_step": 9492, "epoch": 226} {"train_loss": -5.185398101806641, "global_step": 9493, "epoch": 226} {"train_loss": -4.902759552001953, "global_step": 9494, "epoch": 226} {"train_loss": -4.903414726257324, "global_step": 9495, "epoch": 226} {"train_loss": -4.999342918395996, "global_step": 9496, "epoch": 226} {"train_loss": -5.043694496154785, "global_step": 9497, "epoch": 226} {"train_loss": -4.9853105545043945, "global_step": 9498, "epoch": 226} {"train_loss": -4.881631374359131, "global_step": 9499, "epoch": 226} {"train_loss": -4.992835998535156, "global_step": 9500, "epoch": 226} {"train_loss": -5.010150909423828, "global_step": 9501, "epoch": 226} {"train_loss": -4.77373743057251, "global_step": 9502, "epoch": 226} {"train_loss": -5.088587760925293, "global_step": 9503, "epoch": 226} {"train_loss": -5.015353202819824, "global_step": 9504, "epoch": 226} {"train_loss": -5.01511287689209, "global_step": 9505, "epoch": 226} {"train_loss": -4.908865451812744, "global_step": 9506, "epoch": 226} {"train_loss": -5.0005388259887695, "global_step": 9507, "epoch": 226} {"train_loss": -4.9994893074035645, "global_step": 9508, "epoch": 226} {"train_loss": -5.147789001464844, "global_step": 9509, "epoch": 226} {"train_loss": -4.949477195739746, "global_step": 9510, "epoch": 226} {"train_loss": -4.944565296173096, "global_step": 9511, "epoch": 226} {"train_loss": -5.137587547302246, "global_step": 9512, "epoch": 226} {"train_loss": -4.883377552032471, "global_step": 9513, "epoch": 226} {"train_loss": -4.846117973327637, "global_step": 9514, "epoch": 226} {"train_loss": -4.919930934906006, "global_step": 9515, "epoch": 226} {"train_loss": -5.109798908233643, "global_step": 9516, "epoch": 226} {"train_loss": -4.935847282409668, "global_step": 9517, "epoch": 226} {"train_loss": -4.961659908294678, "global_step": 9518, "epoch": 226} {"train_loss": -5.064487457275391, "global_step": 9519, "epoch": 226} {"train_loss": -4.922726631164551, "global_step": 9520, "epoch": 226} {"train_loss": -5.071815013885498, "global_step": 9521, "epoch": 226} {"train_loss": -4.994009971618652, "global_step": 9522, "epoch": 226} {"train_loss": -5.004673957824707, "global_step": 9523, "epoch": 226} {"train_loss": -5.0973005294799805, "global_step": 9524, "epoch": 226} {"train_loss": -5.085553169250488, "global_step": 9525, "epoch": 226} {"train_loss": -5.005308151245117, "global_step": 9526, "epoch": 226} {"train_loss": -5.091154098510742, "global_step": 9527, "epoch": 226} {"train_loss": -4.980937957763672, "global_step": 9528, "epoch": 226} {"train_loss": -5.080528259277344, "global_step": 9529, "epoch": 226} {"train_loss": -5.112030506134033, "global_step": 9530, "epoch": 226} {"train_loss": -4.99474573135376, "global_step": 9531, "epoch": 226} {"train_loss": -5.05103874206543, "global_step": 9532, "epoch": 226} {"train_loss": -4.994430564698719, "global_step": 9533, "epoch": 226, "val_loss": 78051.6953125} {"train_loss": -4.992457389831543, "global_step": 9534, "epoch": 227} {"train_loss": -5.064633369445801, "global_step": 9535, "epoch": 227} {"train_loss": -5.037578582763672, "global_step": 9536, "epoch": 227} {"train_loss": -5.092559814453125, "global_step": 9537, "epoch": 227} {"train_loss": -5.0523786544799805, "global_step": 9538, "epoch": 227} {"train_loss": -5.002555847167969, "global_step": 9539, "epoch": 227} {"train_loss": -5.066928386688232, "global_step": 9540, "epoch": 227} {"train_loss": -4.707954406738281, "global_step": 9541, "epoch": 227} {"train_loss": -5.049237251281738, "global_step": 9542, "epoch": 227} {"train_loss": -5.143886566162109, "global_step": 9543, "epoch": 227} {"train_loss": -4.957576274871826, "global_step": 9544, "epoch": 227} {"train_loss": -5.074897766113281, "global_step": 9545, "epoch": 227} {"train_loss": -4.986641883850098, "global_step": 9546, "epoch": 227} {"train_loss": -5.056497573852539, "global_step": 9547, "epoch": 227} {"train_loss": -5.081535816192627, "global_step": 9548, "epoch": 227} {"train_loss": -5.053731441497803, "global_step": 9549, "epoch": 227} {"train_loss": -5.108404159545898, "global_step": 9550, "epoch": 227} {"train_loss": -5.0497660636901855, "global_step": 9551, "epoch": 227} {"train_loss": -5.015200614929199, "global_step": 9552, "epoch": 227} {"train_loss": -5.0054731369018555, "global_step": 9553, "epoch": 227} {"train_loss": -5.053196430206299, "global_step": 9554, "epoch": 227} {"train_loss": -5.135711193084717, "global_step": 9555, "epoch": 227} {"train_loss": -5.054182052612305, "global_step": 9556, "epoch": 227} {"train_loss": -5.077340602874756, "global_step": 9557, "epoch": 227} {"train_loss": -5.078909397125244, "global_step": 9558, "epoch": 227} {"train_loss": -4.982394218444824, "global_step": 9559, "epoch": 227} {"train_loss": -4.999081134796143, "global_step": 9560, "epoch": 227} {"train_loss": -5.1214423179626465, "global_step": 9561, "epoch": 227} {"train_loss": -5.077869415283203, "global_step": 9562, "epoch": 227} {"train_loss": -4.966355323791504, "global_step": 9563, "epoch": 227} {"train_loss": -5.117525577545166, "global_step": 9564, "epoch": 227} {"train_loss": -5.010327339172363, "global_step": 9565, "epoch": 227} {"train_loss": -4.9953694343566895, "global_step": 9566, "epoch": 227} {"train_loss": -5.035008430480957, "global_step": 9567, "epoch": 227} {"train_loss": -5.058826923370361, "global_step": 9568, "epoch": 227} {"train_loss": -4.812955856323242, "global_step": 9569, "epoch": 227} {"train_loss": -4.831504821777344, "global_step": 9570, "epoch": 227} {"train_loss": -4.9971604347229, "global_step": 9571, "epoch": 227} {"train_loss": -5.051304340362549, "global_step": 9572, "epoch": 227} {"train_loss": -5.017000198364258, "global_step": 9573, "epoch": 227} {"train_loss": -4.966940879821777, "global_step": 9574, "epoch": 227} {"train_loss": -5.0249276501791815, "global_step": 9575, "epoch": 227, "val_loss": 79080.015625} {"train_loss": -5.042970180511475, "global_step": 9576, "epoch": 228} {"train_loss": -4.93281364440918, "global_step": 9577, "epoch": 228} {"train_loss": -4.859844207763672, "global_step": 9578, "epoch": 228} {"train_loss": -4.943270683288574, "global_step": 9579, "epoch": 228} {"train_loss": -4.997018814086914, "global_step": 9580, "epoch": 228} {"train_loss": -4.98930025100708, "global_step": 9581, "epoch": 228} {"train_loss": -5.013962745666504, "global_step": 9582, "epoch": 228} {"train_loss": -5.035199165344238, "global_step": 9583, "epoch": 228} {"train_loss": -5.072689056396484, "global_step": 9584, "epoch": 228} {"train_loss": -4.938117980957031, "global_step": 9585, "epoch": 228} {"train_loss": -5.0203423500061035, "global_step": 9586, "epoch": 228} {"train_loss": -4.88862943649292, "global_step": 9587, "epoch": 228} {"train_loss": -5.069336891174316, "global_step": 9588, "epoch": 228} {"train_loss": -5.125335693359375, "global_step": 9589, "epoch": 228} {"train_loss": -5.0540289878845215, "global_step": 9590, "epoch": 228} {"train_loss": -4.941798686981201, "global_step": 9591, "epoch": 228} {"train_loss": -4.887641906738281, "global_step": 9592, "epoch": 228} {"train_loss": -4.958118438720703, "global_step": 9593, "epoch": 228} {"train_loss": -5.159808158874512, "global_step": 9594, "epoch": 228} {"train_loss": -5.073287010192871, "global_step": 9595, "epoch": 228} {"train_loss": -5.018195152282715, "global_step": 9596, "epoch": 228} {"train_loss": -5.015481472015381, "global_step": 9597, "epoch": 228} {"train_loss": -5.052605628967285, "global_step": 9598, "epoch": 228} {"train_loss": -5.121730804443359, "global_step": 9599, "epoch": 228} {"train_loss": -5.0948920249938965, "global_step": 9600, "epoch": 228} {"train_loss": -5.167601585388184, "global_step": 9601, "epoch": 228} {"train_loss": -5.0553483963012695, "global_step": 9602, "epoch": 228} {"train_loss": -5.1109771728515625, "global_step": 9603, "epoch": 228} {"train_loss": -5.063678741455078, "global_step": 9604, "epoch": 228} {"train_loss": -5.1483635902404785, "global_step": 9605, "epoch": 228} {"train_loss": -5.142174243927002, "global_step": 9606, "epoch": 228} {"train_loss": -5.036621570587158, "global_step": 9607, "epoch": 228} {"train_loss": -4.994254112243652, "global_step": 9608, "epoch": 228} {"train_loss": -4.959543228149414, "global_step": 9609, "epoch": 228} {"train_loss": -5.139316558837891, "global_step": 9610, "epoch": 228} {"train_loss": -5.17983341217041, "global_step": 9611, "epoch": 228} {"train_loss": -5.13472843170166, "global_step": 9612, "epoch": 228} {"train_loss": -5.094858646392822, "global_step": 9613, "epoch": 228} {"train_loss": -4.898236274719238, "global_step": 9614, "epoch": 228} {"train_loss": -5.153386116027832, "global_step": 9615, "epoch": 228} {"train_loss": -5.056159019470215, "global_step": 9616, "epoch": 228} {"train_loss": -5.036749113173712, "global_step": 9617, "epoch": 228, "val_loss": 77934.671875} {"train_loss": -5.076345443725586, "global_step": 9618, "epoch": 229} {"train_loss": -4.893828392028809, "global_step": 9619, "epoch": 229} {"train_loss": -5.243922710418701, "global_step": 9620, "epoch": 229} {"train_loss": -5.087984085083008, "global_step": 9621, "epoch": 229} {"train_loss": -4.684688091278076, "global_step": 9622, "epoch": 229} {"train_loss": -5.081615924835205, "global_step": 9623, "epoch": 229} {"train_loss": -5.065808296203613, "global_step": 9624, "epoch": 229} {"train_loss": -5.01284646987915, "global_step": 9625, "epoch": 229} {"train_loss": -5.014677047729492, "global_step": 9626, "epoch": 229} {"train_loss": -5.122849464416504, "global_step": 9627, "epoch": 229} {"train_loss": -4.959545135498047, "global_step": 9628, "epoch": 229} {"train_loss": -5.035431861877441, "global_step": 9629, "epoch": 229} {"train_loss": -4.813020706176758, "global_step": 9630, "epoch": 229} {"train_loss": -5.222481727600098, "global_step": 9631, "epoch": 229} {"train_loss": -5.052614212036133, "global_step": 9632, "epoch": 229} {"train_loss": -5.023913860321045, "global_step": 9633, "epoch": 229} {"train_loss": -5.1393022537231445, "global_step": 9634, "epoch": 229} {"train_loss": -5.031006813049316, "global_step": 9635, "epoch": 229} {"train_loss": -5.0079474449157715, "global_step": 9636, "epoch": 229} {"train_loss": -5.142160415649414, "global_step": 9637, "epoch": 229} {"train_loss": -5.077140808105469, "global_step": 9638, "epoch": 229} {"train_loss": -5.105936050415039, "global_step": 9639, "epoch": 229} {"train_loss": -5.009230613708496, "global_step": 9640, "epoch": 229} {"train_loss": -5.064394474029541, "global_step": 9641, "epoch": 229} {"train_loss": -5.131890296936035, "global_step": 9642, "epoch": 229} {"train_loss": -5.064623832702637, "global_step": 9643, "epoch": 229} {"train_loss": -5.118978500366211, "global_step": 9644, "epoch": 229} {"train_loss": -5.162866115570068, "global_step": 9645, "epoch": 229} {"train_loss": -4.930141448974609, "global_step": 9646, "epoch": 229} {"train_loss": -5.133427619934082, "global_step": 9647, "epoch": 229} {"train_loss": -5.0043416023254395, "global_step": 9648, "epoch": 229} {"train_loss": -4.959339141845703, "global_step": 9649, "epoch": 229} {"train_loss": -5.149178504943848, "global_step": 9650, "epoch": 229} {"train_loss": -5.072934150695801, "global_step": 9651, "epoch": 229} {"train_loss": -5.060422897338867, "global_step": 9652, "epoch": 229} {"train_loss": -5.146761894226074, "global_step": 9653, "epoch": 229} {"train_loss": -4.986299514770508, "global_step": 9654, "epoch": 229} {"train_loss": -5.224088668823242, "global_step": 9655, "epoch": 229} {"train_loss": -5.162567615509033, "global_step": 9656, "epoch": 229} {"train_loss": -4.910432815551758, "global_step": 9657, "epoch": 229} {"train_loss": -4.9938764572143555, "global_step": 9658, "epoch": 229} {"train_loss": -5.053295532862346, "global_step": 9659, "epoch": 229, "val_loss": 78074.28125} {"train_loss": -5.101084232330322, "global_step": 9660, "epoch": 230} {"train_loss": -5.033824443817139, "global_step": 9661, "epoch": 230} {"train_loss": -4.9924492835998535, "global_step": 9662, "epoch": 230} {"train_loss": -5.108979225158691, "global_step": 9663, "epoch": 230} {"train_loss": -4.963586330413818, "global_step": 9664, "epoch": 230} {"train_loss": -5.012547492980957, "global_step": 9665, "epoch": 230} {"train_loss": -5.085513114929199, "global_step": 9666, "epoch": 230} {"train_loss": -4.983625411987305, "global_step": 9667, "epoch": 230} {"train_loss": -5.109877586364746, "global_step": 9668, "epoch": 230} {"train_loss": -5.223970413208008, "global_step": 9669, "epoch": 230} {"train_loss": -5.0730133056640625, "global_step": 9670, "epoch": 230} {"train_loss": -5.056148529052734, "global_step": 9671, "epoch": 230} {"train_loss": -5.112222194671631, "global_step": 9672, "epoch": 230} {"train_loss": -4.917755126953125, "global_step": 9673, "epoch": 230} {"train_loss": -4.934323787689209, "global_step": 9674, "epoch": 230} {"train_loss": -4.922839641571045, "global_step": 9675, "epoch": 230} {"train_loss": -5.105241298675537, "global_step": 9676, "epoch": 230} {"train_loss": -5.014897346496582, "global_step": 9677, "epoch": 230} {"train_loss": -5.104580879211426, "global_step": 9678, "epoch": 230} {"train_loss": -4.922121047973633, "global_step": 9679, "epoch": 230} {"train_loss": -5.242452621459961, "global_step": 9680, "epoch": 230} {"train_loss": -5.013868808746338, "global_step": 9681, "epoch": 230} {"train_loss": -4.978641510009766, "global_step": 9682, "epoch": 230} {"train_loss": -5.017264366149902, "global_step": 9683, "epoch": 230} {"train_loss": -5.140937328338623, "global_step": 9684, "epoch": 230} {"train_loss": -5.050712585449219, "global_step": 9685, "epoch": 230} {"train_loss": -5.018108367919922, "global_step": 9686, "epoch": 230} {"train_loss": -5.039091110229492, "global_step": 9687, "epoch": 230} {"train_loss": -5.121490478515625, "global_step": 9688, "epoch": 230} {"train_loss": -5.083415985107422, "global_step": 9689, "epoch": 230} {"train_loss": -4.96742057800293, "global_step": 9690, "epoch": 230} {"train_loss": -5.131649017333984, "global_step": 9691, "epoch": 230} {"train_loss": -4.966108322143555, "global_step": 9692, "epoch": 230} {"train_loss": -5.088089942932129, "global_step": 9693, "epoch": 230} {"train_loss": -5.113373279571533, "global_step": 9694, "epoch": 230} {"train_loss": -4.933460712432861, "global_step": 9695, "epoch": 230} {"train_loss": -5.127780437469482, "global_step": 9696, "epoch": 230} {"train_loss": -5.142777442932129, "global_step": 9697, "epoch": 230} {"train_loss": -5.045832633972168, "global_step": 9698, "epoch": 230} {"train_loss": -5.145601272583008, "global_step": 9699, "epoch": 230} {"train_loss": -5.0040130615234375, "global_step": 9700, "epoch": 230} {"train_loss": -5.049061128071377, "global_step": 9701, "epoch": 230, "val_loss": 77841.3125} {"train_loss": -5.04426383972168, "global_step": 9702, "epoch": 231} {"train_loss": -5.033228874206543, "global_step": 9703, "epoch": 231} {"train_loss": -5.027369499206543, "global_step": 9704, "epoch": 231} {"train_loss": -5.023611068725586, "global_step": 9705, "epoch": 231} {"train_loss": -5.166853904724121, "global_step": 9706, "epoch": 231} {"train_loss": -5.031394004821777, "global_step": 9707, "epoch": 231} {"train_loss": -5.1416802406311035, "global_step": 9708, "epoch": 231} {"train_loss": -5.056019306182861, "global_step": 9709, "epoch": 231} {"train_loss": -5.088202476501465, "global_step": 9710, "epoch": 231} {"train_loss": -5.027196407318115, "global_step": 9711, "epoch": 231} {"train_loss": -4.985929012298584, "global_step": 9712, "epoch": 231} {"train_loss": -5.05218505859375, "global_step": 9713, "epoch": 231} {"train_loss": -4.947172164916992, "global_step": 9714, "epoch": 231} {"train_loss": -4.979863166809082, "global_step": 9715, "epoch": 231} {"train_loss": -4.836113929748535, "global_step": 9716, "epoch": 231} {"train_loss": -4.994041919708252, "global_step": 9717, "epoch": 231} {"train_loss": -5.001678943634033, "global_step": 9718, "epoch": 231} {"train_loss": -4.892779350280762, "global_step": 9719, "epoch": 231} {"train_loss": -5.155908584594727, "global_step": 9720, "epoch": 231} {"train_loss": -5.175776958465576, "global_step": 9721, "epoch": 231} {"train_loss": -4.949217319488525, "global_step": 9722, "epoch": 231} {"train_loss": -5.120628356933594, "global_step": 9723, "epoch": 231} {"train_loss": -5.138354301452637, "global_step": 9724, "epoch": 231} {"train_loss": -4.966290473937988, "global_step": 9725, "epoch": 231} {"train_loss": -4.926388740539551, "global_step": 9726, "epoch": 231} {"train_loss": -4.887157440185547, "global_step": 9727, "epoch": 231} {"train_loss": -4.894414901733398, "global_step": 9728, "epoch": 231} {"train_loss": -5.112816333770752, "global_step": 9729, "epoch": 231} {"train_loss": -5.025774002075195, "global_step": 9730, "epoch": 231} {"train_loss": -4.958600044250488, "global_step": 9731, "epoch": 231} {"train_loss": -4.864458084106445, "global_step": 9732, "epoch": 231} {"train_loss": -5.04139518737793, "global_step": 9733, "epoch": 231} {"train_loss": -4.931997776031494, "global_step": 9734, "epoch": 231} {"train_loss": -5.016157150268555, "global_step": 9735, "epoch": 231} {"train_loss": -5.0889787673950195, "global_step": 9736, "epoch": 231} {"train_loss": -4.969293594360352, "global_step": 9737, "epoch": 231} {"train_loss": -4.902240753173828, "global_step": 9738, "epoch": 231} {"train_loss": -5.169239044189453, "global_step": 9739, "epoch": 231} {"train_loss": -5.0779924392700195, "global_step": 9740, "epoch": 231} {"train_loss": -5.207862854003906, "global_step": 9741, "epoch": 231} {"train_loss": -5.170153617858887, "global_step": 9742, "epoch": 231} {"train_loss": -5.0265902905237105, "global_step": 9743, "epoch": 231, "val_loss": 77603.59375} {"train_loss": -5.034404754638672, "global_step": 9744, "epoch": 232} {"train_loss": -5.178717613220215, "global_step": 9745, "epoch": 232} {"train_loss": -5.081352233886719, "global_step": 9746, "epoch": 232} {"train_loss": -5.016896724700928, "global_step": 9747, "epoch": 232} {"train_loss": -5.190459251403809, "global_step": 9748, "epoch": 232} {"train_loss": -5.084122657775879, "global_step": 9749, "epoch": 232} {"train_loss": -5.0776801109313965, "global_step": 9750, "epoch": 232} {"train_loss": -5.161381721496582, "global_step": 9751, "epoch": 232} {"train_loss": -5.048405647277832, "global_step": 9752, "epoch": 232} {"train_loss": -5.189495086669922, "global_step": 9753, "epoch": 232} {"train_loss": -5.090635299682617, "global_step": 9754, "epoch": 232} {"train_loss": -5.151595115661621, "global_step": 9755, "epoch": 232} {"train_loss": -5.02764892578125, "global_step": 9756, "epoch": 232} {"train_loss": -5.17958927154541, "global_step": 9757, "epoch": 232} {"train_loss": -5.057781219482422, "global_step": 9758, "epoch": 232} {"train_loss": -5.058791160583496, "global_step": 9759, "epoch": 232} {"train_loss": -5.08693790435791, "global_step": 9760, "epoch": 232} {"train_loss": -5.076216697692871, "global_step": 9761, "epoch": 232} {"train_loss": -5.007018566131592, "global_step": 9762, "epoch": 232} {"train_loss": -5.049583435058594, "global_step": 9763, "epoch": 232} {"train_loss": -4.976348876953125, "global_step": 9764, "epoch": 232} {"train_loss": -5.02937126159668, "global_step": 9765, "epoch": 232} {"train_loss": -5.013484954833984, "global_step": 9766, "epoch": 232} {"train_loss": -5.078341484069824, "global_step": 9767, "epoch": 232} {"train_loss": -4.92119026184082, "global_step": 9768, "epoch": 232} {"train_loss": -5.059880256652832, "global_step": 9769, "epoch": 232} {"train_loss": -5.181455612182617, "global_step": 9770, "epoch": 232} {"train_loss": -5.062077522277832, "global_step": 9771, "epoch": 232} {"train_loss": -5.034161567687988, "global_step": 9772, "epoch": 232} {"train_loss": -5.203726768493652, "global_step": 9773, "epoch": 232} {"train_loss": -5.0140252113342285, "global_step": 9774, "epoch": 232} {"train_loss": -4.961233139038086, "global_step": 9775, "epoch": 232} {"train_loss": -5.089021682739258, "global_step": 9776, "epoch": 232} {"train_loss": -5.111248016357422, "global_step": 9777, "epoch": 232} {"train_loss": -5.118746280670166, "global_step": 9778, "epoch": 232} {"train_loss": -5.000892162322998, "global_step": 9779, "epoch": 232} {"train_loss": -5.036770820617676, "global_step": 9780, "epoch": 232} {"train_loss": -5.066545486450195, "global_step": 9781, "epoch": 232} {"train_loss": -5.07027530670166, "global_step": 9782, "epoch": 232} {"train_loss": -5.031682968139648, "global_step": 9783, "epoch": 232} {"train_loss": -5.067244529724121, "global_step": 9784, "epoch": 232} {"train_loss": -5.07043659119379, "global_step": 9785, "epoch": 232, "val_loss": 77948.4375} {"train_loss": -5.061029434204102, "global_step": 9786, "epoch": 233} {"train_loss": -4.9845194816589355, "global_step": 9787, "epoch": 233} {"train_loss": -5.2978386878967285, "global_step": 9788, "epoch": 233} {"train_loss": -4.928584098815918, "global_step": 9789, "epoch": 233} {"train_loss": -5.159188270568848, "global_step": 9790, "epoch": 233} {"train_loss": -5.147201061248779, "global_step": 9791, "epoch": 233} {"train_loss": -5.007885456085205, "global_step": 9792, "epoch": 233} {"train_loss": -5.111726760864258, "global_step": 9793, "epoch": 233} {"train_loss": -5.074656009674072, "global_step": 9794, "epoch": 233} {"train_loss": -5.08944034576416, "global_step": 9795, "epoch": 233} {"train_loss": -5.053295135498047, "global_step": 9796, "epoch": 233} {"train_loss": -5.055364608764648, "global_step": 9797, "epoch": 233} {"train_loss": -5.179940223693848, "global_step": 9798, "epoch": 233} {"train_loss": -5.139665603637695, "global_step": 9799, "epoch": 233} {"train_loss": -5.008399963378906, "global_step": 9800, "epoch": 233} {"train_loss": -5.082655906677246, "global_step": 9801, "epoch": 233} {"train_loss": -5.1047043800354, "global_step": 9802, "epoch": 233} {"train_loss": -5.150376319885254, "global_step": 9803, "epoch": 233} {"train_loss": -4.930964469909668, "global_step": 9804, "epoch": 233} {"train_loss": -5.176172256469727, "global_step": 9805, "epoch": 233} {"train_loss": -5.112156391143799, "global_step": 9806, "epoch": 233} {"train_loss": -5.135601997375488, "global_step": 9807, "epoch": 233} {"train_loss": -5.092616081237793, "global_step": 9808, "epoch": 233} {"train_loss": -4.975665092468262, "global_step": 9809, "epoch": 233} {"train_loss": -5.1504902839660645, "global_step": 9810, "epoch": 233} {"train_loss": -5.158013343811035, "global_step": 9811, "epoch": 233} {"train_loss": -5.130378723144531, "global_step": 9812, "epoch": 233} {"train_loss": -5.089845657348633, "global_step": 9813, "epoch": 233} {"train_loss": -5.050291061401367, "global_step": 9814, "epoch": 233} {"train_loss": -5.052489280700684, "global_step": 9815, "epoch": 233} {"train_loss": -5.088655948638916, "global_step": 9816, "epoch": 233} {"train_loss": -4.962828159332275, "global_step": 9817, "epoch": 233} {"train_loss": -5.077402114868164, "global_step": 9818, "epoch": 233} {"train_loss": -4.927610397338867, "global_step": 9819, "epoch": 233} {"train_loss": -4.931791305541992, "global_step": 9820, "epoch": 233} {"train_loss": -5.016523361206055, "global_step": 9821, "epoch": 233} {"train_loss": -5.035151481628418, "global_step": 9822, "epoch": 233} {"train_loss": -4.866607666015625, "global_step": 9823, "epoch": 233} {"train_loss": -5.094672203063965, "global_step": 9824, "epoch": 233} {"train_loss": -5.008772850036621, "global_step": 9825, "epoch": 233} {"train_loss": -5.014894008636475, "global_step": 9826, "epoch": 233} {"train_loss": -5.065227145240421, "global_step": 9827, "epoch": 233, "val_loss": 77485.15625} {"train_loss": -4.946842670440674, "global_step": 9828, "epoch": 234} {"train_loss": -5.22244119644165, "global_step": 9829, "epoch": 234} {"train_loss": -4.997349739074707, "global_step": 9830, "epoch": 234} {"train_loss": -4.883414268493652, "global_step": 9831, "epoch": 234} {"train_loss": -4.947362422943115, "global_step": 9832, "epoch": 234} {"train_loss": -4.888289451599121, "global_step": 9833, "epoch": 234} {"train_loss": -5.092306137084961, "global_step": 9834, "epoch": 234} {"train_loss": -4.803103446960449, "global_step": 9835, "epoch": 234} {"train_loss": -4.953572750091553, "global_step": 9836, "epoch": 234} {"train_loss": -5.164178371429443, "global_step": 9837, "epoch": 234} {"train_loss": -4.912406921386719, "global_step": 9838, "epoch": 234} {"train_loss": -4.858218669891357, "global_step": 9839, "epoch": 234} {"train_loss": -5.067523002624512, "global_step": 9840, "epoch": 234} {"train_loss": -4.842964172363281, "global_step": 9841, "epoch": 234} {"train_loss": -4.905326843261719, "global_step": 9842, "epoch": 234} {"train_loss": -5.090609550476074, "global_step": 9843, "epoch": 234} {"train_loss": -5.1158294677734375, "global_step": 9844, "epoch": 234} {"train_loss": -5.038205146789551, "global_step": 9845, "epoch": 234} {"train_loss": -5.012624740600586, "global_step": 9846, "epoch": 234} {"train_loss": -5.020744323730469, "global_step": 9847, "epoch": 234} {"train_loss": -5.036269187927246, "global_step": 9848, "epoch": 234} {"train_loss": -5.035605430603027, "global_step": 9849, "epoch": 234} {"train_loss": -5.093578338623047, "global_step": 9850, "epoch": 234} {"train_loss": -5.082855224609375, "global_step": 9851, "epoch": 234} {"train_loss": -4.989528656005859, "global_step": 9852, "epoch": 234} {"train_loss": -5.078636169433594, "global_step": 9853, "epoch": 234} {"train_loss": -4.973712921142578, "global_step": 9854, "epoch": 234} {"train_loss": -4.971826553344727, "global_step": 9855, "epoch": 234} {"train_loss": -5.174177169799805, "global_step": 9856, "epoch": 234} {"train_loss": -5.1173882484436035, "global_step": 9857, "epoch": 234} {"train_loss": -5.091368675231934, "global_step": 9858, "epoch": 234} {"train_loss": -5.087381839752197, "global_step": 9859, "epoch": 234} {"train_loss": -5.08858585357666, "global_step": 9860, "epoch": 234} {"train_loss": -4.880262851715088, "global_step": 9861, "epoch": 234} {"train_loss": -5.077437400817871, "global_step": 9862, "epoch": 234} {"train_loss": -5.073616027832031, "global_step": 9863, "epoch": 234} {"train_loss": -5.236643314361572, "global_step": 9864, "epoch": 234} {"train_loss": -4.932381629943848, "global_step": 9865, "epoch": 234} {"train_loss": -5.100731372833252, "global_step": 9866, "epoch": 234} {"train_loss": -4.983410358428955, "global_step": 9867, "epoch": 234} {"train_loss": -4.931729316711426, "global_step": 9868, "epoch": 234} {"train_loss": -5.0187148707253595, "global_step": 9869, "epoch": 234, "val_loss": 78037.46875} {"train_loss": -4.849416255950928, "global_step": 9870, "epoch": 235} {"train_loss": -5.026484966278076, "global_step": 9871, "epoch": 235} {"train_loss": -5.068356990814209, "global_step": 9872, "epoch": 235} {"train_loss": -5.032687187194824, "global_step": 9873, "epoch": 235} {"train_loss": -5.017683506011963, "global_step": 9874, "epoch": 235} {"train_loss": -4.9512176513671875, "global_step": 9875, "epoch": 235} {"train_loss": -5.042296886444092, "global_step": 9876, "epoch": 235} {"train_loss": -5.038972854614258, "global_step": 9877, "epoch": 235} {"train_loss": -4.878118515014648, "global_step": 9878, "epoch": 235} {"train_loss": -5.078638076782227, "global_step": 9879, "epoch": 235} {"train_loss": -4.880393981933594, "global_step": 9880, "epoch": 235} {"train_loss": -5.101840019226074, "global_step": 9881, "epoch": 235} {"train_loss": -4.988615989685059, "global_step": 9882, "epoch": 235} {"train_loss": -5.011629104614258, "global_step": 9883, "epoch": 235} {"train_loss": -5.10498046875, "global_step": 9884, "epoch": 235} {"train_loss": -4.8958210945129395, "global_step": 9885, "epoch": 235} {"train_loss": -5.029946327209473, "global_step": 9886, "epoch": 235} {"train_loss": -4.820865631103516, "global_step": 9887, "epoch": 235} {"train_loss": -5.015355587005615, "global_step": 9888, "epoch": 235} {"train_loss": -5.034063816070557, "global_step": 9889, "epoch": 235} {"train_loss": -5.17286491394043, "global_step": 9890, "epoch": 235} {"train_loss": -5.176198959350586, "global_step": 9891, "epoch": 235} {"train_loss": -5.0134077072143555, "global_step": 9892, "epoch": 235} {"train_loss": -5.123585224151611, "global_step": 9893, "epoch": 235} {"train_loss": -5.040399551391602, "global_step": 9894, "epoch": 235} {"train_loss": -4.929836273193359, "global_step": 9895, "epoch": 235} {"train_loss": -4.96506404876709, "global_step": 9896, "epoch": 235} {"train_loss": -5.037161350250244, "global_step": 9897, "epoch": 235} {"train_loss": -5.094672679901123, "global_step": 9898, "epoch": 235} {"train_loss": -5.12065315246582, "global_step": 9899, "epoch": 235} {"train_loss": -5.246994972229004, "global_step": 9900, "epoch": 235} {"train_loss": -5.224979400634766, "global_step": 9901, "epoch": 235} {"train_loss": -5.159893035888672, "global_step": 9902, "epoch": 235} {"train_loss": -4.96499490737915, "global_step": 9903, "epoch": 235} {"train_loss": -5.028472900390625, "global_step": 9904, "epoch": 235} {"train_loss": -5.173066139221191, "global_step": 9905, "epoch": 235} {"train_loss": -5.059831142425537, "global_step": 9906, "epoch": 235} {"train_loss": -5.097468376159668, "global_step": 9907, "epoch": 235} {"train_loss": -4.970890998840332, "global_step": 9908, "epoch": 235} {"train_loss": -5.181033611297607, "global_step": 9909, "epoch": 235} {"train_loss": -5.095534324645996, "global_step": 9910, "epoch": 235} {"train_loss": -5.045181013288952, "global_step": 9911, "epoch": 235, "val_loss": 77519.171875} {"train_loss": -5.142014503479004, "global_step": 9912, "epoch": 236} {"train_loss": -5.185323238372803, "global_step": 9913, "epoch": 236} {"train_loss": -5.000370979309082, "global_step": 9914, "epoch": 236} {"train_loss": -4.954641819000244, "global_step": 9915, "epoch": 236} {"train_loss": -5.097001075744629, "global_step": 9916, "epoch": 236} {"train_loss": -4.9936089515686035, "global_step": 9917, "epoch": 236} {"train_loss": -4.9605393409729, "global_step": 9918, "epoch": 236} {"train_loss": -5.054962158203125, "global_step": 9919, "epoch": 236} {"train_loss": -5.1849541664123535, "global_step": 9920, "epoch": 236} {"train_loss": -4.9880828857421875, "global_step": 9921, "epoch": 236} {"train_loss": -4.950207233428955, "global_step": 9922, "epoch": 236} {"train_loss": -4.891765117645264, "global_step": 9923, "epoch": 236} {"train_loss": -5.188549995422363, "global_step": 9924, "epoch": 236} {"train_loss": -4.96677827835083, "global_step": 9925, "epoch": 236} {"train_loss": -5.0857744216918945, "global_step": 9926, "epoch": 236} {"train_loss": -4.980348587036133, "global_step": 9927, "epoch": 236} {"train_loss": -5.061097145080566, "global_step": 9928, "epoch": 236} {"train_loss": -5.150016784667969, "global_step": 9929, "epoch": 236} {"train_loss": -5.145600318908691, "global_step": 9930, "epoch": 236} {"train_loss": -5.181419372558594, "global_step": 9931, "epoch": 236} {"train_loss": -5.183382987976074, "global_step": 9932, "epoch": 236} {"train_loss": -5.191812515258789, "global_step": 9933, "epoch": 236} {"train_loss": -5.13558292388916, "global_step": 9934, "epoch": 236} {"train_loss": -5.024670124053955, "global_step": 9935, "epoch": 236} {"train_loss": -5.084358215332031, "global_step": 9936, "epoch": 236} {"train_loss": -5.096399784088135, "global_step": 9937, "epoch": 236} {"train_loss": -5.0457963943481445, "global_step": 9938, "epoch": 236} {"train_loss": -5.149241924285889, "global_step": 9939, "epoch": 236} {"train_loss": -5.132043838500977, "global_step": 9940, "epoch": 236} {"train_loss": -4.922163009643555, "global_step": 9941, "epoch": 236} {"train_loss": -5.072218894958496, "global_step": 9942, "epoch": 236} {"train_loss": -5.000410079956055, "global_step": 9943, "epoch": 236} {"train_loss": -4.932003974914551, "global_step": 9944, "epoch": 236} {"train_loss": -5.078803062438965, "global_step": 9945, "epoch": 236} {"train_loss": -5.060116291046143, "global_step": 9946, "epoch": 236} {"train_loss": -4.813688278198242, "global_step": 9947, "epoch": 236} {"train_loss": -4.9974212646484375, "global_step": 9948, "epoch": 236} {"train_loss": -5.064028739929199, "global_step": 9949, "epoch": 236} {"train_loss": -5.093994140625, "global_step": 9950, "epoch": 236} {"train_loss": -4.96937370300293, "global_step": 9951, "epoch": 236} {"train_loss": -4.9950127601623535, "global_step": 9952, "epoch": 236} {"train_loss": -5.052451894396827, "global_step": 9953, "epoch": 236, "val_loss": 77918.40625} {"train_loss": -5.092802047729492, "global_step": 9954, "epoch": 237} {"train_loss": -5.090576171875, "global_step": 9955, "epoch": 237} {"train_loss": -4.946308135986328, "global_step": 9956, "epoch": 237} {"train_loss": -4.892065048217773, "global_step": 9957, "epoch": 237} {"train_loss": -5.145793914794922, "global_step": 9958, "epoch": 237} {"train_loss": -5.000156402587891, "global_step": 9959, "epoch": 237} {"train_loss": -5.072093963623047, "global_step": 9960, "epoch": 237} {"train_loss": -5.079355716705322, "global_step": 9961, "epoch": 237} {"train_loss": -4.945836544036865, "global_step": 9962, "epoch": 237} {"train_loss": -5.116124153137207, "global_step": 9963, "epoch": 237} {"train_loss": -5.138036727905273, "global_step": 9964, "epoch": 237} {"train_loss": -5.0071563720703125, "global_step": 9965, "epoch": 237} {"train_loss": -5.121107578277588, "global_step": 9966, "epoch": 237} {"train_loss": -4.972214698791504, "global_step": 9967, "epoch": 237} {"train_loss": -5.120205879211426, "global_step": 9968, "epoch": 237} {"train_loss": -5.033205032348633, "global_step": 9969, "epoch": 237} {"train_loss": -4.958971977233887, "global_step": 9970, "epoch": 237} {"train_loss": -5.061180114746094, "global_step": 9971, "epoch": 237} {"train_loss": -5.046474456787109, "global_step": 9972, "epoch": 237} {"train_loss": -4.932095527648926, "global_step": 9973, "epoch": 237} {"train_loss": -4.933337211608887, "global_step": 9974, "epoch": 237} {"train_loss": -5.049906253814697, "global_step": 9975, "epoch": 237} {"train_loss": -4.932643890380859, "global_step": 9976, "epoch": 237} {"train_loss": -4.982922077178955, "global_step": 9977, "epoch": 237} {"train_loss": -5.00816535949707, "global_step": 9978, "epoch": 237} {"train_loss": -4.948343276977539, "global_step": 9979, "epoch": 237} {"train_loss": -4.99581241607666, "global_step": 9980, "epoch": 237} {"train_loss": -5.136186599731445, "global_step": 9981, "epoch": 237} {"train_loss": -4.921030521392822, "global_step": 9982, "epoch": 237} {"train_loss": -4.8685760498046875, "global_step": 9983, "epoch": 237} {"train_loss": -4.989152431488037, "global_step": 9984, "epoch": 237} {"train_loss": -5.006394386291504, "global_step": 9985, "epoch": 237} {"train_loss": -4.810721397399902, "global_step": 9986, "epoch": 237} {"train_loss": -4.993366241455078, "global_step": 9987, "epoch": 237} {"train_loss": -4.912313938140869, "global_step": 9988, "epoch": 237} {"train_loss": -4.911025047302246, "global_step": 9989, "epoch": 237} {"train_loss": -5.009206295013428, "global_step": 9990, "epoch": 237} {"train_loss": -5.017506122589111, "global_step": 9991, "epoch": 237} {"train_loss": -5.094003677368164, "global_step": 9992, "epoch": 237} {"train_loss": -5.110703468322754, "global_step": 9993, "epoch": 237} {"train_loss": -4.914630889892578, "global_step": 9994, "epoch": 237} {"train_loss": -5.011429650442941, "global_step": 9995, "epoch": 237, "val_loss": 78724.3828125} {"train_loss": -4.963972568511963, "global_step": 9996, "epoch": 238} {"train_loss": -5.087084770202637, "global_step": 9997, "epoch": 238} {"train_loss": -5.070801258087158, "global_step": 9998, "epoch": 238} {"train_loss": -4.9887285232543945, "global_step": 9999, "epoch": 238} {"train_loss": -5.006964683532715, "global_step": 10000, "epoch": 238} {"train_loss": -5.091241836547852, "global_step": 10001, "epoch": 238} {"train_loss": -5.03398323059082, "global_step": 10002, "epoch": 238} {"train_loss": -5.018735885620117, "global_step": 10003, "epoch": 238} {"train_loss": -5.145606517791748, "global_step": 10004, "epoch": 238} {"train_loss": -4.950268745422363, "global_step": 10005, "epoch": 238} {"train_loss": -5.115823745727539, "global_step": 10006, "epoch": 238} {"train_loss": -5.023820877075195, "global_step": 10007, "epoch": 238} {"train_loss": -5.056319713592529, "global_step": 10008, "epoch": 238} {"train_loss": -5.112658500671387, "global_step": 10009, "epoch": 238} {"train_loss": -5.096579551696777, "global_step": 10010, "epoch": 238} {"train_loss": -5.082987308502197, "global_step": 10011, "epoch": 238} {"train_loss": -4.999543190002441, "global_step": 10012, "epoch": 238} {"train_loss": -5.251273155212402, "global_step": 10013, "epoch": 238} {"train_loss": -5.109087944030762, "global_step": 10014, "epoch": 238} {"train_loss": -5.099843978881836, "global_step": 10015, "epoch": 238} {"train_loss": -5.089742660522461, "global_step": 10016, "epoch": 238} {"train_loss": -5.086210250854492, "global_step": 10017, "epoch": 238} {"train_loss": -5.03302001953125, "global_step": 10018, "epoch": 238} {"train_loss": -5.221948623657227, "global_step": 10019, "epoch": 238} {"train_loss": -5.045430660247803, "global_step": 10020, "epoch": 238} {"train_loss": -4.987754821777344, "global_step": 10021, "epoch": 238} {"train_loss": -5.026853561401367, "global_step": 10022, "epoch": 238} {"train_loss": -5.152820587158203, "global_step": 10023, "epoch": 238} {"train_loss": -5.145334243774414, "global_step": 10024, "epoch": 238} {"train_loss": -5.06434440612793, "global_step": 10025, "epoch": 238} {"train_loss": -5.164880752563477, "global_step": 10026, "epoch": 238} {"train_loss": -5.1726179122924805, "global_step": 10027, "epoch": 238} {"train_loss": -4.959362030029297, "global_step": 10028, "epoch": 238} {"train_loss": -4.921237945556641, "global_step": 10029, "epoch": 238} {"train_loss": -5.042341709136963, "global_step": 10030, "epoch": 238} {"train_loss": -4.870052814483643, "global_step": 10031, "epoch": 238} {"train_loss": -4.648672103881836, "global_step": 10032, "epoch": 238} {"train_loss": -5.068951606750488, "global_step": 10033, "epoch": 238} {"train_loss": -4.7965569496154785, "global_step": 10034, "epoch": 238} {"train_loss": -4.840673923492432, "global_step": 10035, "epoch": 238} {"train_loss": -5.039708137512207, "global_step": 10036, "epoch": 238} {"train_loss": -5.036691166105724, "global_step": 10037, "epoch": 238, "val_loss": 78565.640625} {"train_loss": -4.972594261169434, "global_step": 10038, "epoch": 239} {"train_loss": -4.988199234008789, "global_step": 10039, "epoch": 239} {"train_loss": -5.024261474609375, "global_step": 10040, "epoch": 239} {"train_loss": -4.991297245025635, "global_step": 10041, "epoch": 239} {"train_loss": -5.0697855949401855, "global_step": 10042, "epoch": 239} {"train_loss": -5.075721263885498, "global_step": 10043, "epoch": 239} {"train_loss": -5.087372779846191, "global_step": 10044, "epoch": 239} {"train_loss": -5.012337684631348, "global_step": 10045, "epoch": 239} {"train_loss": -5.072019577026367, "global_step": 10046, "epoch": 239} {"train_loss": -5.051024436950684, "global_step": 10047, "epoch": 239} {"train_loss": -5.156225204467773, "global_step": 10048, "epoch": 239} {"train_loss": -5.096314430236816, "global_step": 10049, "epoch": 239} {"train_loss": -5.1277570724487305, "global_step": 10050, "epoch": 239} {"train_loss": -5.102972984313965, "global_step": 10051, "epoch": 239} {"train_loss": -5.062677383422852, "global_step": 10052, "epoch": 239} {"train_loss": -5.11092472076416, "global_step": 10053, "epoch": 239} {"train_loss": -5.083984851837158, "global_step": 10054, "epoch": 239} {"train_loss": -4.985590934753418, "global_step": 10055, "epoch": 239} {"train_loss": -5.138664245605469, "global_step": 10056, "epoch": 239} {"train_loss": -5.175242900848389, "global_step": 10057, "epoch": 239} {"train_loss": -5.091602802276611, "global_step": 10058, "epoch": 239} {"train_loss": -5.091958999633789, "global_step": 10059, "epoch": 239} {"train_loss": -4.955535888671875, "global_step": 10060, "epoch": 239} {"train_loss": -5.1050944328308105, "global_step": 10061, "epoch": 239} {"train_loss": -4.966102123260498, "global_step": 10062, "epoch": 239} {"train_loss": -4.991386890411377, "global_step": 10063, "epoch": 239} {"train_loss": -5.08375883102417, "global_step": 10064, "epoch": 239} {"train_loss": -5.2887420654296875, "global_step": 10065, "epoch": 239} {"train_loss": -4.901058197021484, "global_step": 10066, "epoch": 239} {"train_loss": -5.05517053604126, "global_step": 10067, "epoch": 239} {"train_loss": -5.247200965881348, "global_step": 10068, "epoch": 239} {"train_loss": -5.167397499084473, "global_step": 10069, "epoch": 239} {"train_loss": -5.010486602783203, "global_step": 10070, "epoch": 239} {"train_loss": -5.08072566986084, "global_step": 10071, "epoch": 239} {"train_loss": -5.094017028808594, "global_step": 10072, "epoch": 239} {"train_loss": -5.031150817871094, "global_step": 10073, "epoch": 239} {"train_loss": -5.172275543212891, "global_step": 10074, "epoch": 239} {"train_loss": -4.952933311462402, "global_step": 10075, "epoch": 239} {"train_loss": -4.902331352233887, "global_step": 10076, "epoch": 239} {"train_loss": -5.113287925720215, "global_step": 10077, "epoch": 239} {"train_loss": -4.98643684387207, "global_step": 10078, "epoch": 239} {"train_loss": -5.065274181820097, "global_step": 10079, "epoch": 239, "val_loss": 77422.4453125} {"train_loss": -5.140017509460449, "global_step": 10080, "epoch": 240} {"train_loss": -4.969224452972412, "global_step": 10081, "epoch": 240} {"train_loss": -5.153650283813477, "global_step": 10082, "epoch": 240} {"train_loss": -5.055900573730469, "global_step": 10083, "epoch": 240} {"train_loss": -5.032644271850586, "global_step": 10084, "epoch": 240} {"train_loss": -5.119558334350586, "global_step": 10085, "epoch": 240} {"train_loss": -5.160510063171387, "global_step": 10086, "epoch": 240} {"train_loss": -5.03476619720459, "global_step": 10087, "epoch": 240} {"train_loss": -5.094912528991699, "global_step": 10088, "epoch": 240} {"train_loss": -5.09652042388916, "global_step": 10089, "epoch": 240} {"train_loss": -5.028599739074707, "global_step": 10090, "epoch": 240} {"train_loss": -5.095706939697266, "global_step": 10091, "epoch": 240} {"train_loss": -5.015898704528809, "global_step": 10092, "epoch": 240} {"train_loss": -5.009546756744385, "global_step": 10093, "epoch": 240} {"train_loss": -5.166115760803223, "global_step": 10094, "epoch": 240} {"train_loss": -5.094037055969238, "global_step": 10095, "epoch": 240} {"train_loss": -5.150153160095215, "global_step": 10096, "epoch": 240} {"train_loss": -5.044241905212402, "global_step": 10097, "epoch": 240} {"train_loss": -4.981821060180664, "global_step": 10098, "epoch": 240} {"train_loss": -5.267396450042725, "global_step": 10099, "epoch": 240} {"train_loss": -5.058322906494141, "global_step": 10100, "epoch": 240} {"train_loss": -5.167850494384766, "global_step": 10101, "epoch": 240} {"train_loss": -5.252596855163574, "global_step": 10102, "epoch": 240} {"train_loss": -5.077277660369873, "global_step": 10103, "epoch": 240} {"train_loss": -5.170397758483887, "global_step": 10104, "epoch": 240} {"train_loss": -5.130980491638184, "global_step": 10105, "epoch": 240} {"train_loss": -5.068242073059082, "global_step": 10106, "epoch": 240} {"train_loss": -5.227026462554932, "global_step": 10107, "epoch": 240} {"train_loss": -5.122678279876709, "global_step": 10108, "epoch": 240} {"train_loss": -5.221066474914551, "global_step": 10109, "epoch": 240} {"train_loss": -5.033664703369141, "global_step": 10110, "epoch": 240} {"train_loss": -5.005411148071289, "global_step": 10111, "epoch": 240} {"train_loss": -5.115898132324219, "global_step": 10112, "epoch": 240} {"train_loss": -5.201728820800781, "global_step": 10113, "epoch": 240} {"train_loss": -5.084552764892578, "global_step": 10114, "epoch": 240} {"train_loss": -5.044104099273682, "global_step": 10115, "epoch": 240} {"train_loss": -4.97039794921875, "global_step": 10116, "epoch": 240} {"train_loss": -5.012306213378906, "global_step": 10117, "epoch": 240} {"train_loss": -5.071160316467285, "global_step": 10118, "epoch": 240} {"train_loss": -5.045392990112305, "global_step": 10119, "epoch": 240} {"train_loss": -4.968786239624023, "global_step": 10120, "epoch": 240} {"train_loss": -5.0924840314047675, "global_step": 10121, "epoch": 240, "val_loss": 78256.8125} {"train_loss": -5.085824012756348, "global_step": 10122, "epoch": 241} {"train_loss": -4.955588340759277, "global_step": 10123, "epoch": 241} {"train_loss": -4.89298677444458, "global_step": 10124, "epoch": 241} {"train_loss": -5.075218200683594, "global_step": 10125, "epoch": 241} {"train_loss": -5.051640033721924, "global_step": 10126, "epoch": 241} {"train_loss": -4.921072483062744, "global_step": 10127, "epoch": 241} {"train_loss": -5.2849812507629395, "global_step": 10128, "epoch": 241} {"train_loss": -5.062379360198975, "global_step": 10129, "epoch": 241} {"train_loss": -5.082417011260986, "global_step": 10130, "epoch": 241} {"train_loss": -5.084781646728516, "global_step": 10131, "epoch": 241} {"train_loss": -5.008244514465332, "global_step": 10132, "epoch": 241} {"train_loss": -5.133173942565918, "global_step": 10133, "epoch": 241} {"train_loss": -5.042989730834961, "global_step": 10134, "epoch": 241} {"train_loss": -5.066522598266602, "global_step": 10135, "epoch": 241} {"train_loss": -4.984789848327637, "global_step": 10136, "epoch": 241} {"train_loss": -5.037557601928711, "global_step": 10137, "epoch": 241} {"train_loss": -4.964027404785156, "global_step": 10138, "epoch": 241} {"train_loss": -5.1318206787109375, "global_step": 10139, "epoch": 241} {"train_loss": -5.023338794708252, "global_step": 10140, "epoch": 241} {"train_loss": -5.132578372955322, "global_step": 10141, "epoch": 241} {"train_loss": -4.997346878051758, "global_step": 10142, "epoch": 241} {"train_loss": -5.028689384460449, "global_step": 10143, "epoch": 241} {"train_loss": -4.949941635131836, "global_step": 10144, "epoch": 241} {"train_loss": -5.127227306365967, "global_step": 10145, "epoch": 241} {"train_loss": -5.159626007080078, "global_step": 10146, "epoch": 241} {"train_loss": -5.048897743225098, "global_step": 10147, "epoch": 241} {"train_loss": -5.058879375457764, "global_step": 10148, "epoch": 241} {"train_loss": -5.064504623413086, "global_step": 10149, "epoch": 241} {"train_loss": -5.002612113952637, "global_step": 10150, "epoch": 241} {"train_loss": -5.254622459411621, "global_step": 10151, "epoch": 241} {"train_loss": -5.183886528015137, "global_step": 10152, "epoch": 241} {"train_loss": -5.14725399017334, "global_step": 10153, "epoch": 241} {"train_loss": -5.1806745529174805, "global_step": 10154, "epoch": 241} {"train_loss": -5.12870979309082, "global_step": 10155, "epoch": 241} {"train_loss": -5.173396110534668, "global_step": 10156, "epoch": 241} {"train_loss": -4.986154556274414, "global_step": 10157, "epoch": 241} {"train_loss": -4.911723613739014, "global_step": 10158, "epoch": 241} {"train_loss": -5.148343086242676, "global_step": 10159, "epoch": 241} {"train_loss": -5.092167854309082, "global_step": 10160, "epoch": 241} {"train_loss": -5.037740707397461, "global_step": 10161, "epoch": 241} {"train_loss": -4.986663341522217, "global_step": 10162, "epoch": 241} {"train_loss": -5.069538593292236, "global_step": 10163, "epoch": 241, "val_loss": 77484.7890625} {"train_loss": -5.093900680541992, "global_step": 10164, "epoch": 242} {"train_loss": -4.8733015060424805, "global_step": 10165, "epoch": 242} {"train_loss": -5.14254093170166, "global_step": 10166, "epoch": 242} {"train_loss": -5.1718058586120605, "global_step": 10167, "epoch": 242} {"train_loss": -5.087460517883301, "global_step": 10168, "epoch": 242} {"train_loss": -5.0424957275390625, "global_step": 10169, "epoch": 242} {"train_loss": -5.016876220703125, "global_step": 10170, "epoch": 242} {"train_loss": -4.9368181228637695, "global_step": 10171, "epoch": 242} {"train_loss": -5.004504203796387, "global_step": 10172, "epoch": 242} {"train_loss": -5.013381004333496, "global_step": 10173, "epoch": 242} {"train_loss": -4.886791229248047, "global_step": 10174, "epoch": 242} {"train_loss": -5.050411224365234, "global_step": 10175, "epoch": 242} {"train_loss": -4.785194396972656, "global_step": 10176, "epoch": 242} {"train_loss": -4.94326114654541, "global_step": 10177, "epoch": 242} {"train_loss": -4.974503517150879, "global_step": 10178, "epoch": 242} {"train_loss": -4.973912239074707, "global_step": 10179, "epoch": 242} {"train_loss": -5.140573978424072, "global_step": 10180, "epoch": 242} {"train_loss": -5.017279624938965, "global_step": 10181, "epoch": 242} {"train_loss": -4.985705375671387, "global_step": 10182, "epoch": 242} {"train_loss": -5.148683547973633, "global_step": 10183, "epoch": 242} {"train_loss": -5.0187273025512695, "global_step": 10184, "epoch": 242} {"train_loss": -5.010870456695557, "global_step": 10185, "epoch": 242} {"train_loss": -5.107082366943359, "global_step": 10186, "epoch": 242} {"train_loss": -4.997309684753418, "global_step": 10187, "epoch": 242} {"train_loss": -5.101104736328125, "global_step": 10188, "epoch": 242} {"train_loss": -5.0338311195373535, "global_step": 10189, "epoch": 242} {"train_loss": -4.834991455078125, "global_step": 10190, "epoch": 242} {"train_loss": -4.906392574310303, "global_step": 10191, "epoch": 242} {"train_loss": -5.141283988952637, "global_step": 10192, "epoch": 242} {"train_loss": -5.005266189575195, "global_step": 10193, "epoch": 242} {"train_loss": -4.981141090393066, "global_step": 10194, "epoch": 242} {"train_loss": -5.044571399688721, "global_step": 10195, "epoch": 242} {"train_loss": -4.9385528564453125, "global_step": 10196, "epoch": 242} {"train_loss": -5.063887596130371, "global_step": 10197, "epoch": 242} {"train_loss": -4.959172248840332, "global_step": 10198, "epoch": 242} {"train_loss": -5.140810966491699, "global_step": 10199, "epoch": 242} {"train_loss": -5.16689920425415, "global_step": 10200, "epoch": 242} {"train_loss": -5.118744850158691, "global_step": 10201, "epoch": 242} {"train_loss": -5.218713760375977, "global_step": 10202, "epoch": 242} {"train_loss": -5.118293762207031, "global_step": 10203, "epoch": 242} {"train_loss": -5.094143867492676, "global_step": 10204, "epoch": 242} {"train_loss": -5.033810808545067, "global_step": 10205, "epoch": 242, "val_loss": 77474.28125} {"train_loss": -5.181955814361572, "global_step": 10206, "epoch": 243} {"train_loss": -5.2866973876953125, "global_step": 10207, "epoch": 243} {"train_loss": -5.02916145324707, "global_step": 10208, "epoch": 243} {"train_loss": -5.158034324645996, "global_step": 10209, "epoch": 243} {"train_loss": -5.024112224578857, "global_step": 10210, "epoch": 243} {"train_loss": -5.150330066680908, "global_step": 10211, "epoch": 243} {"train_loss": -5.031994819641113, "global_step": 10212, "epoch": 243} {"train_loss": -5.013746738433838, "global_step": 10213, "epoch": 243} {"train_loss": -5.0995073318481445, "global_step": 10214, "epoch": 243} {"train_loss": -5.047253131866455, "global_step": 10215, "epoch": 243} {"train_loss": -5.1280903816223145, "global_step": 10216, "epoch": 243} {"train_loss": -5.058290481567383, "global_step": 10217, "epoch": 243} {"train_loss": -5.173158645629883, "global_step": 10218, "epoch": 243} {"train_loss": -5.029172897338867, "global_step": 10219, "epoch": 243} {"train_loss": -5.006572723388672, "global_step": 10220, "epoch": 243} {"train_loss": -4.959600925445557, "global_step": 10221, "epoch": 243} {"train_loss": -4.782836437225342, "global_step": 10222, "epoch": 243} {"train_loss": -4.797903060913086, "global_step": 10223, "epoch": 243} {"train_loss": -4.9938201904296875, "global_step": 10224, "epoch": 243} {"train_loss": -5.086509704589844, "global_step": 10225, "epoch": 243} {"train_loss": -4.997835159301758, "global_step": 10226, "epoch": 243} {"train_loss": -5.028277397155762, "global_step": 10227, "epoch": 243} {"train_loss": -4.950624942779541, "global_step": 10228, "epoch": 243} {"train_loss": -5.024013996124268, "global_step": 10229, "epoch": 243} {"train_loss": -5.0361175537109375, "global_step": 10230, "epoch": 243} {"train_loss": -4.99298620223999, "global_step": 10231, "epoch": 243} {"train_loss": -5.043248176574707, "global_step": 10232, "epoch": 243} {"train_loss": -4.969359397888184, "global_step": 10233, "epoch": 243} {"train_loss": -5.086730003356934, "global_step": 10234, "epoch": 243} {"train_loss": -4.9524383544921875, "global_step": 10235, "epoch": 243} {"train_loss": -5.083517551422119, "global_step": 10236, "epoch": 243} {"train_loss": -5.019137859344482, "global_step": 10237, "epoch": 243} {"train_loss": -5.0743088722229, "global_step": 10238, "epoch": 243} {"train_loss": -5.112582683563232, "global_step": 10239, "epoch": 243} {"train_loss": -5.083972454071045, "global_step": 10240, "epoch": 243} {"train_loss": -5.107504844665527, "global_step": 10241, "epoch": 243} {"train_loss": -5.024155616760254, "global_step": 10242, "epoch": 243} {"train_loss": -4.975874423980713, "global_step": 10243, "epoch": 243} {"train_loss": -5.066068172454834, "global_step": 10244, "epoch": 243} {"train_loss": -5.018180847167969, "global_step": 10245, "epoch": 243} {"train_loss": -4.902470111846924, "global_step": 10246, "epoch": 243} {"train_loss": -5.040374574207124, "global_step": 10247, "epoch": 243, "val_loss": 77231.953125} {"train_loss": -5.134500026702881, "global_step": 10248, "epoch": 244} {"train_loss": -5.03156852722168, "global_step": 10249, "epoch": 244} {"train_loss": -4.9871826171875, "global_step": 10250, "epoch": 244} {"train_loss": -4.9921441078186035, "global_step": 10251, "epoch": 244} {"train_loss": -5.257489204406738, "global_step": 10252, "epoch": 244} {"train_loss": -5.077892780303955, "global_step": 10253, "epoch": 244} {"train_loss": -5.0048041343688965, "global_step": 10254, "epoch": 244} {"train_loss": -5.030486106872559, "global_step": 10255, "epoch": 244} {"train_loss": -4.974444389343262, "global_step": 10256, "epoch": 244} {"train_loss": -5.125551700592041, "global_step": 10257, "epoch": 244} {"train_loss": -5.11082649230957, "global_step": 10258, "epoch": 244} {"train_loss": -4.97197151184082, "global_step": 10259, "epoch": 244} {"train_loss": -5.134177207946777, "global_step": 10260, "epoch": 244} {"train_loss": -5.108226776123047, "global_step": 10261, "epoch": 244} {"train_loss": -5.155329704284668, "global_step": 10262, "epoch": 244} {"train_loss": -5.182258129119873, "global_step": 10263, "epoch": 244} {"train_loss": -4.859748840332031, "global_step": 10264, "epoch": 244} {"train_loss": -5.12214994430542, "global_step": 10265, "epoch": 244} {"train_loss": -5.138504981994629, "global_step": 10266, "epoch": 244} {"train_loss": -4.857872009277344, "global_step": 10267, "epoch": 244} {"train_loss": -4.916700839996338, "global_step": 10268, "epoch": 244} {"train_loss": -5.028470039367676, "global_step": 10269, "epoch": 244} {"train_loss": -5.141593933105469, "global_step": 10270, "epoch": 244} {"train_loss": -5.107961654663086, "global_step": 10271, "epoch": 244} {"train_loss": -5.196873664855957, "global_step": 10272, "epoch": 244} {"train_loss": -5.189036846160889, "global_step": 10273, "epoch": 244} {"train_loss": -5.20583438873291, "global_step": 10274, "epoch": 244} {"train_loss": -5.057530403137207, "global_step": 10275, "epoch": 244} {"train_loss": -5.147315979003906, "global_step": 10276, "epoch": 244} {"train_loss": -5.105595588684082, "global_step": 10277, "epoch": 244} {"train_loss": -5.011986255645752, "global_step": 10278, "epoch": 244} {"train_loss": -5.135058879852295, "global_step": 10279, "epoch": 244} {"train_loss": -4.9250288009643555, "global_step": 10280, "epoch": 244} {"train_loss": -5.042070388793945, "global_step": 10281, "epoch": 244} {"train_loss": -5.000253200531006, "global_step": 10282, "epoch": 244} {"train_loss": -5.0384416580200195, "global_step": 10283, "epoch": 244} {"train_loss": -5.0310564041137695, "global_step": 10284, "epoch": 244} {"train_loss": -5.09407901763916, "global_step": 10285, "epoch": 244} {"train_loss": -4.999846935272217, "global_step": 10286, "epoch": 244} {"train_loss": -5.010194778442383, "global_step": 10287, "epoch": 244} {"train_loss": -5.178738594055176, "global_step": 10288, "epoch": 244} {"train_loss": -5.068342095329648, "global_step": 10289, "epoch": 244, "val_loss": 76961.921875} {"train_loss": -5.166592597961426, "global_step": 10290, "epoch": 245} {"train_loss": -4.932849884033203, "global_step": 10291, "epoch": 245} {"train_loss": -5.039963722229004, "global_step": 10292, "epoch": 245} {"train_loss": -5.118413925170898, "global_step": 10293, "epoch": 245} {"train_loss": -5.096559047698975, "global_step": 10294, "epoch": 245} {"train_loss": -4.79920768737793, "global_step": 10295, "epoch": 245} {"train_loss": -4.914462089538574, "global_step": 10296, "epoch": 245} {"train_loss": -4.907697677612305, "global_step": 10297, "epoch": 245} {"train_loss": -4.756865501403809, "global_step": 10298, "epoch": 245} {"train_loss": -5.012259483337402, "global_step": 10299, "epoch": 245} {"train_loss": -4.559879779815674, "global_step": 10300, "epoch": 245} {"train_loss": -4.922735214233398, "global_step": 10301, "epoch": 245} {"train_loss": -4.90960693359375, "global_step": 10302, "epoch": 245} {"train_loss": -4.85976505279541, "global_step": 10303, "epoch": 245} {"train_loss": -5.023162364959717, "global_step": 10304, "epoch": 245} {"train_loss": -4.901470184326172, "global_step": 10305, "epoch": 245} {"train_loss": -4.992653846740723, "global_step": 10306, "epoch": 245} {"train_loss": -4.94490909576416, "global_step": 10307, "epoch": 245} {"train_loss": -4.9561543464660645, "global_step": 10308, "epoch": 245} {"train_loss": -4.92472505569458, "global_step": 10309, "epoch": 245} {"train_loss": -5.007090091705322, "global_step": 10310, "epoch": 245} {"train_loss": -4.95893669128418, "global_step": 10311, "epoch": 245} {"train_loss": -5.100319862365723, "global_step": 10312, "epoch": 245} {"train_loss": -4.913737773895264, "global_step": 10313, "epoch": 245} {"train_loss": -5.032891273498535, "global_step": 10314, "epoch": 245} {"train_loss": -4.937014102935791, "global_step": 10315, "epoch": 245} {"train_loss": -4.879814624786377, "global_step": 10316, "epoch": 245} {"train_loss": -5.030361175537109, "global_step": 10317, "epoch": 245} {"train_loss": -5.087381362915039, "global_step": 10318, "epoch": 245} {"train_loss": -4.890195846557617, "global_step": 10319, "epoch": 245} {"train_loss": -5.109831809997559, "global_step": 10320, "epoch": 245} {"train_loss": -4.766443252563477, "global_step": 10321, "epoch": 245} {"train_loss": -4.910339832305908, "global_step": 10322, "epoch": 245} {"train_loss": -5.095736503601074, "global_step": 10323, "epoch": 245} {"train_loss": -4.837306976318359, "global_step": 10324, "epoch": 245} {"train_loss": -5.023006916046143, "global_step": 10325, "epoch": 245} {"train_loss": -5.061534881591797, "global_step": 10326, "epoch": 245} {"train_loss": -5.149765968322754, "global_step": 10327, "epoch": 245} {"train_loss": -5.068720817565918, "global_step": 10328, "epoch": 245} {"train_loss": -5.149883270263672, "global_step": 10329, "epoch": 245} {"train_loss": -4.995558738708496, "global_step": 10330, "epoch": 245} {"train_loss": -4.972595203490484, "global_step": 10331, "epoch": 245, "val_loss": 77197.234375} {"train_loss": -5.022470474243164, "global_step": 10332, "epoch": 246} {"train_loss": -5.119607925415039, "global_step": 10333, "epoch": 246} {"train_loss": -5.015171051025391, "global_step": 10334, "epoch": 246} {"train_loss": -5.029757499694824, "global_step": 10335, "epoch": 246} {"train_loss": -5.093789100646973, "global_step": 10336, "epoch": 246} {"train_loss": -4.990017890930176, "global_step": 10337, "epoch": 246} {"train_loss": -4.963020324707031, "global_step": 10338, "epoch": 246} {"train_loss": -5.192234992980957, "global_step": 10339, "epoch": 246} {"train_loss": -4.9260053634643555, "global_step": 10340, "epoch": 246} {"train_loss": -5.030875205993652, "global_step": 10341, "epoch": 246} {"train_loss": -5.065193176269531, "global_step": 10342, "epoch": 246} {"train_loss": -5.073231220245361, "global_step": 10343, "epoch": 246} {"train_loss": -5.204750061035156, "global_step": 10344, "epoch": 246} {"train_loss": -4.983198165893555, "global_step": 10345, "epoch": 246} {"train_loss": -4.948274612426758, "global_step": 10346, "epoch": 246} {"train_loss": -5.13731575012207, "global_step": 10347, "epoch": 246} {"train_loss": -5.1049275398254395, "global_step": 10348, "epoch": 246} {"train_loss": -5.010781764984131, "global_step": 10349, "epoch": 246} {"train_loss": -5.164827346801758, "global_step": 10350, "epoch": 246} {"train_loss": -5.0787200927734375, "global_step": 10351, "epoch": 246} {"train_loss": -5.14939546585083, "global_step": 10352, "epoch": 246} {"train_loss": -5.057640075683594, "global_step": 10353, "epoch": 246} {"train_loss": -5.112758159637451, "global_step": 10354, "epoch": 246} {"train_loss": -5.158028602600098, "global_step": 10355, "epoch": 246} {"train_loss": -5.2252092361450195, "global_step": 10356, "epoch": 246} {"train_loss": -5.228675842285156, "global_step": 10357, "epoch": 246} {"train_loss": -4.992012977600098, "global_step": 10358, "epoch": 246} {"train_loss": -5.155429840087891, "global_step": 10359, "epoch": 246} {"train_loss": -5.251072406768799, "global_step": 10360, "epoch": 246} {"train_loss": -5.07986307144165, "global_step": 10361, "epoch": 246} {"train_loss": -5.087140083312988, "global_step": 10362, "epoch": 246} {"train_loss": -4.982089996337891, "global_step": 10363, "epoch": 246} {"train_loss": -5.0478057861328125, "global_step": 10364, "epoch": 246} {"train_loss": -5.155223846435547, "global_step": 10365, "epoch": 246} {"train_loss": -5.023580074310303, "global_step": 10366, "epoch": 246} {"train_loss": -5.040349006652832, "global_step": 10367, "epoch": 246} {"train_loss": -5.0502238273620605, "global_step": 10368, "epoch": 246} {"train_loss": -4.714815139770508, "global_step": 10369, "epoch": 246} {"train_loss": -5.077330112457275, "global_step": 10370, "epoch": 246} {"train_loss": -4.913183212280273, "global_step": 10371, "epoch": 246} {"train_loss": -4.7749786376953125, "global_step": 10372, "epoch": 246} {"train_loss": -5.0624931653340655, "global_step": 10373, "epoch": 246, "val_loss": 79564.953125} {"train_loss": -4.8197760581970215, "global_step": 10374, "epoch": 247} {"train_loss": -5.125741958618164, "global_step": 10375, "epoch": 247} {"train_loss": -5.0165205001831055, "global_step": 10376, "epoch": 247} {"train_loss": -4.955004692077637, "global_step": 10377, "epoch": 247} {"train_loss": -5.140642166137695, "global_step": 10378, "epoch": 247} {"train_loss": -4.736787796020508, "global_step": 10379, "epoch": 247} {"train_loss": -5.087954521179199, "global_step": 10380, "epoch": 247} {"train_loss": -4.812751770019531, "global_step": 10381, "epoch": 247} {"train_loss": -4.959107398986816, "global_step": 10382, "epoch": 247} {"train_loss": -4.891437530517578, "global_step": 10383, "epoch": 247} {"train_loss": -5.123599529266357, "global_step": 10384, "epoch": 247} {"train_loss": -4.941145896911621, "global_step": 10385, "epoch": 247} {"train_loss": -5.107737064361572, "global_step": 10386, "epoch": 247} {"train_loss": -4.917525291442871, "global_step": 10387, "epoch": 247} {"train_loss": -5.074711799621582, "global_step": 10388, "epoch": 247} {"train_loss": -4.935544490814209, "global_step": 10389, "epoch": 247} {"train_loss": -4.964279651641846, "global_step": 10390, "epoch": 247} {"train_loss": -5.048102378845215, "global_step": 10391, "epoch": 247} {"train_loss": -4.9396257400512695, "global_step": 10392, "epoch": 247} {"train_loss": -4.90300178527832, "global_step": 10393, "epoch": 247} {"train_loss": -5.164878845214844, "global_step": 10394, "epoch": 247} {"train_loss": -5.0450239181518555, "global_step": 10395, "epoch": 247} {"train_loss": -5.082942008972168, "global_step": 10396, "epoch": 247} {"train_loss": -5.152801513671875, "global_step": 10397, "epoch": 247} {"train_loss": -5.236072540283203, "global_step": 10398, "epoch": 247} {"train_loss": -5.035438060760498, "global_step": 10399, "epoch": 247} {"train_loss": -5.172914505004883, "global_step": 10400, "epoch": 247} {"train_loss": -5.040544033050537, "global_step": 10401, "epoch": 247} {"train_loss": -5.204830646514893, "global_step": 10402, "epoch": 247} {"train_loss": -5.133833408355713, "global_step": 10403, "epoch": 247} {"train_loss": -5.101185321807861, "global_step": 10404, "epoch": 247} {"train_loss": -5.127740859985352, "global_step": 10405, "epoch": 247} {"train_loss": -5.045501232147217, "global_step": 10406, "epoch": 247} {"train_loss": -5.119297981262207, "global_step": 10407, "epoch": 247} {"train_loss": -5.0367431640625, "global_step": 10408, "epoch": 247} {"train_loss": -5.107063293457031, "global_step": 10409, "epoch": 247} {"train_loss": -5.084909439086914, "global_step": 10410, "epoch": 247} {"train_loss": -5.206143379211426, "global_step": 10411, "epoch": 247} {"train_loss": -5.023821830749512, "global_step": 10412, "epoch": 247} {"train_loss": -5.055870056152344, "global_step": 10413, "epoch": 247} {"train_loss": -5.108509063720703, "global_step": 10414, "epoch": 247} {"train_loss": -5.046840610958281, "global_step": 10415, "epoch": 247, "val_loss": 77091.1484375} {"train_loss": -5.021772384643555, "global_step": 10416, "epoch": 248} {"train_loss": -5.062243461608887, "global_step": 10417, "epoch": 248} {"train_loss": -4.795896530151367, "global_step": 10418, "epoch": 248} {"train_loss": -5.048855781555176, "global_step": 10419, "epoch": 248} {"train_loss": -5.198398113250732, "global_step": 10420, "epoch": 248} {"train_loss": -5.108166217803955, "global_step": 10421, "epoch": 248} {"train_loss": -5.073136329650879, "global_step": 10422, "epoch": 248} {"train_loss": -5.146346092224121, "global_step": 10423, "epoch": 248} {"train_loss": -5.164474010467529, "global_step": 10424, "epoch": 248} {"train_loss": -5.06452751159668, "global_step": 10425, "epoch": 248} {"train_loss": -5.036309242248535, "global_step": 10426, "epoch": 248} {"train_loss": -5.109308242797852, "global_step": 10427, "epoch": 248} {"train_loss": -5.0997490882873535, "global_step": 10428, "epoch": 248} {"train_loss": -4.981281757354736, "global_step": 10429, "epoch": 248} {"train_loss": -5.18853759765625, "global_step": 10430, "epoch": 248} {"train_loss": -5.047323226928711, "global_step": 10431, "epoch": 248} {"train_loss": -5.170162200927734, "global_step": 10432, "epoch": 248} {"train_loss": -5.067811965942383, "global_step": 10433, "epoch": 248} {"train_loss": -5.149770259857178, "global_step": 10434, "epoch": 248} {"train_loss": -5.1196722984313965, "global_step": 10435, "epoch": 248} {"train_loss": -5.173098564147949, "global_step": 10436, "epoch": 248} {"train_loss": -5.170928955078125, "global_step": 10437, "epoch": 248} {"train_loss": -5.018791675567627, "global_step": 10438, "epoch": 248} {"train_loss": -5.189141750335693, "global_step": 10439, "epoch": 248} {"train_loss": -4.947367191314697, "global_step": 10440, "epoch": 248} {"train_loss": -5.215632438659668, "global_step": 10441, "epoch": 248} {"train_loss": -5.115711212158203, "global_step": 10442, "epoch": 248} {"train_loss": -4.906050682067871, "global_step": 10443, "epoch": 248} {"train_loss": -4.982379913330078, "global_step": 10444, "epoch": 248} {"train_loss": -5.130825042724609, "global_step": 10445, "epoch": 248} {"train_loss": -5.166972637176514, "global_step": 10446, "epoch": 248} {"train_loss": -5.111363410949707, "global_step": 10447, "epoch": 248} {"train_loss": -5.151556491851807, "global_step": 10448, "epoch": 248} {"train_loss": -5.1979756355285645, "global_step": 10449, "epoch": 248} {"train_loss": -5.104424476623535, "global_step": 10450, "epoch": 248} {"train_loss": -5.154317378997803, "global_step": 10451, "epoch": 248} {"train_loss": -5.0423583984375, "global_step": 10452, "epoch": 248} {"train_loss": -5.167534828186035, "global_step": 10453, "epoch": 248} {"train_loss": -5.128312110900879, "global_step": 10454, "epoch": 248} {"train_loss": -5.147896766662598, "global_step": 10455, "epoch": 248} {"train_loss": -5.078171253204346, "global_step": 10456, "epoch": 248} {"train_loss": -5.0981209845769975, "global_step": 10457, "epoch": 248, "val_loss": 76665.0234375} {"train_loss": -5.074784278869629, "global_step": 10458, "epoch": 249} {"train_loss": -5.089251518249512, "global_step": 10459, "epoch": 249} {"train_loss": -5.12087869644165, "global_step": 10460, "epoch": 249} {"train_loss": -5.177460670471191, "global_step": 10461, "epoch": 249} {"train_loss": -5.14164924621582, "global_step": 10462, "epoch": 249} {"train_loss": -5.0775251388549805, "global_step": 10463, "epoch": 249} {"train_loss": -5.116161346435547, "global_step": 10464, "epoch": 249} {"train_loss": -5.114243507385254, "global_step": 10465, "epoch": 249} {"train_loss": -5.095739364624023, "global_step": 10466, "epoch": 249} {"train_loss": -5.098878383636475, "global_step": 10467, "epoch": 249} {"train_loss": -5.191012382507324, "global_step": 10468, "epoch": 249} {"train_loss": -5.1721110343933105, "global_step": 10469, "epoch": 249} {"train_loss": -5.116031646728516, "global_step": 10470, "epoch": 249} {"train_loss": -5.1783552169799805, "global_step": 10471, "epoch": 249} {"train_loss": -5.005043983459473, "global_step": 10472, "epoch": 249} {"train_loss": -4.998046875, "global_step": 10473, "epoch": 249} {"train_loss": -5.070894241333008, "global_step": 10474, "epoch": 249} {"train_loss": -4.944845199584961, "global_step": 10475, "epoch": 249} {"train_loss": -4.914252758026123, "global_step": 10476, "epoch": 249} {"train_loss": -5.1732940673828125, "global_step": 10477, "epoch": 249} {"train_loss": -5.112083435058594, "global_step": 10478, "epoch": 249} {"train_loss": -5.09136962890625, "global_step": 10479, "epoch": 249} {"train_loss": -5.133587837219238, "global_step": 10480, "epoch": 249} {"train_loss": -5.035388469696045, "global_step": 10481, "epoch": 249} {"train_loss": -4.961589813232422, "global_step": 10482, "epoch": 249} {"train_loss": -5.052451133728027, "global_step": 10483, "epoch": 249} {"train_loss": -5.0674543380737305, "global_step": 10484, "epoch": 249} {"train_loss": -5.09897518157959, "global_step": 10485, "epoch": 249} {"train_loss": -5.055269241333008, "global_step": 10486, "epoch": 249} {"train_loss": -5.2192864418029785, "global_step": 10487, "epoch": 249} {"train_loss": -5.039789199829102, "global_step": 10488, "epoch": 249} {"train_loss": -5.102593421936035, "global_step": 10489, "epoch": 249} {"train_loss": -5.070096015930176, "global_step": 10490, "epoch": 249} {"train_loss": -5.118487358093262, "global_step": 10491, "epoch": 249} {"train_loss": -5.144992828369141, "global_step": 10492, "epoch": 249} {"train_loss": -5.077005386352539, "global_step": 10493, "epoch": 249} {"train_loss": -5.172296524047852, "global_step": 10494, "epoch": 249} {"train_loss": -5.026266098022461, "global_step": 10495, "epoch": 249} {"train_loss": -5.179783821105957, "global_step": 10496, "epoch": 249} {"train_loss": -5.24149227142334, "global_step": 10497, "epoch": 249} {"train_loss": -5.131867408752441, "global_step": 10498, "epoch": 249} {"train_loss": -5.095010712033226, "global_step": 10499, "epoch": 249, "val_loss": 76241.6875} {"train_loss": -5.008162021636963, "global_step": 10500, "epoch": 250} {"train_loss": -4.980845928192139, "global_step": 10501, "epoch": 250} {"train_loss": -5.289737701416016, "global_step": 10502, "epoch": 250} {"train_loss": -5.119436264038086, "global_step": 10503, "epoch": 250} {"train_loss": -5.10258674621582, "global_step": 10504, "epoch": 250} {"train_loss": -4.978428840637207, "global_step": 10505, "epoch": 250} {"train_loss": -5.031113624572754, "global_step": 10506, "epoch": 250} {"train_loss": -5.141169548034668, "global_step": 10507, "epoch": 250} {"train_loss": -5.044803619384766, "global_step": 10508, "epoch": 250} {"train_loss": -5.119240760803223, "global_step": 10509, "epoch": 250} {"train_loss": -5.337610244750977, "global_step": 10510, "epoch": 250} {"train_loss": -5.0111002922058105, "global_step": 10511, "epoch": 250} {"train_loss": -4.882113933563232, "global_step": 10512, "epoch": 250} {"train_loss": -5.122882843017578, "global_step": 10513, "epoch": 250} {"train_loss": -5.2027363777160645, "global_step": 10514, "epoch": 250} {"train_loss": -4.900315284729004, "global_step": 10515, "epoch": 250} {"train_loss": -5.054366111755371, "global_step": 10516, "epoch": 250} {"train_loss": -5.018019676208496, "global_step": 10517, "epoch": 250} {"train_loss": -5.014923095703125, "global_step": 10518, "epoch": 250} {"train_loss": -4.851363182067871, "global_step": 10519, "epoch": 250} {"train_loss": -5.17555046081543, "global_step": 10520, "epoch": 250} {"train_loss": -5.020316123962402, "global_step": 10521, "epoch": 250} {"train_loss": -5.079623222351074, "global_step": 10522, "epoch": 250} {"train_loss": -5.093629837036133, "global_step": 10523, "epoch": 250} {"train_loss": -5.135654449462891, "global_step": 10524, "epoch": 250} {"train_loss": -5.1894378662109375, "global_step": 10525, "epoch": 250} {"train_loss": -5.176677703857422, "global_step": 10526, "epoch": 250} {"train_loss": -5.285695552825928, "global_step": 10527, "epoch": 250} {"train_loss": -5.193794250488281, "global_step": 10528, "epoch": 250} {"train_loss": -5.099655628204346, "global_step": 10529, "epoch": 250} {"train_loss": -5.154715538024902, "global_step": 10530, "epoch": 250} {"train_loss": -5.107392311096191, "global_step": 10531, "epoch": 250} {"train_loss": -4.993751525878906, "global_step": 10532, "epoch": 250} {"train_loss": -5.0810041427612305, "global_step": 10533, "epoch": 250} {"train_loss": -5.082040309906006, "global_step": 10534, "epoch": 250} {"train_loss": -5.136547088623047, "global_step": 10535, "epoch": 250} {"train_loss": -5.1978654861450195, "global_step": 10536, "epoch": 250} {"train_loss": -5.03115177154541, "global_step": 10537, "epoch": 250} {"train_loss": -5.042437553405762, "global_step": 10538, "epoch": 250} {"train_loss": -5.177903175354004, "global_step": 10539, "epoch": 250} {"train_loss": -4.98068380355835, "global_step": 10540, "epoch": 250} {"train_loss": -5.088086764017741, "global_step": 10541, "epoch": 250, "train/sim_max_reward_0": 0.19247049682713255, "train/sim_max_reward_1": 0.01346442557446529, "train/sim_max_reward_2": 0.312053239320524, "train/sim_max_reward_3": 0.04312239360317464, "train/sim_max_reward_4": 0.41988909018679293, "train/sim_max_reward_5": 0.33739017663943227, "test/sim_max_reward_4400000": 0.15944933657685492, "test/sim_max_reward_4400001": 0.421581597913477, "test/sim_max_reward_4400002": 0.2824541873978204, "test/sim_max_reward_4400003": 0.19619555655584445, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.5568836080551315, "test/sim_max_reward_4400009": 0.37650589390106365, "test/sim_max_reward_4400010": 0.1568874864133067, "test/sim_max_reward_4400011": 0.3392672325356835, "test/sim_max_reward_4400012": 0.1886192563549992, "test/sim_max_reward_4400013": 0.17560446662566517, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.41300552283315584, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.21338253176667454, "test/sim_max_reward_4400019": 0.26937393253058933, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5957498965194974, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.04510755698207826, "test/sim_max_reward_4400027": 0.07173778736061898, "test/sim_max_reward_4400028": 0.374997033418842, "test/sim_max_reward_4400029": 0.4386213922956073, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 0.15093364398196935, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.11689705360137477, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.42927326734910426, "test/sim_max_reward_4400036": 0.3993891556950772, "test/sim_max_reward_4400037": 0.4904190140040054, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.4635165549604898, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.0283511494829989, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.21034663485497523, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.18110211008014843, "test/sim_max_reward_4400047": 0.2357920021345364, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.21973163702525358, "test/mean_score": 0.17242680643748606, "val_loss": 77095.6015625} {"train_loss": -4.977874755859375, "global_step": 10542, "epoch": 251} {"train_loss": -5.276731491088867, "global_step": 10543, "epoch": 251} {"train_loss": -5.112015724182129, "global_step": 10544, "epoch": 251} {"train_loss": -5.00059700012207, "global_step": 10545, "epoch": 251} {"train_loss": -5.088770866394043, "global_step": 10546, "epoch": 251} {"train_loss": -4.995411396026611, "global_step": 10547, "epoch": 251} {"train_loss": -4.9468302726745605, "global_step": 10548, "epoch": 251} {"train_loss": -5.060054779052734, "global_step": 10549, "epoch": 251} {"train_loss": -5.041329383850098, "global_step": 10550, "epoch": 251} {"train_loss": -4.940408706665039, "global_step": 10551, "epoch": 251} {"train_loss": -5.1217193603515625, "global_step": 10552, "epoch": 251} {"train_loss": -5.210195541381836, "global_step": 10553, "epoch": 251} {"train_loss": -5.292550563812256, "global_step": 10554, "epoch": 251} {"train_loss": -5.226492881774902, "global_step": 10555, "epoch": 251} {"train_loss": -5.046389102935791, "global_step": 10556, "epoch": 251} {"train_loss": -5.126794815063477, "global_step": 10557, "epoch": 251} {"train_loss": -5.116464614868164, "global_step": 10558, "epoch": 251} {"train_loss": -5.131333351135254, "global_step": 10559, "epoch": 251} {"train_loss": -5.0823869705200195, "global_step": 10560, "epoch": 251} {"train_loss": -5.181265830993652, "global_step": 10561, "epoch": 251} {"train_loss": -4.9693098068237305, "global_step": 10562, "epoch": 251} {"train_loss": -5.17970085144043, "global_step": 10563, "epoch": 251} {"train_loss": -5.1652421951293945, "global_step": 10564, "epoch": 251} {"train_loss": -4.989274501800537, "global_step": 10565, "epoch": 251} {"train_loss": -5.002992630004883, "global_step": 10566, "epoch": 251} {"train_loss": -5.004578113555908, "global_step": 10567, "epoch": 251} {"train_loss": -4.943976402282715, "global_step": 10568, "epoch": 251} {"train_loss": -4.872501850128174, "global_step": 10569, "epoch": 251} {"train_loss": -4.977416038513184, "global_step": 10570, "epoch": 251} {"train_loss": -5.01801872253418, "global_step": 10571, "epoch": 251} {"train_loss": -4.8672990798950195, "global_step": 10572, "epoch": 251} {"train_loss": -5.066375732421875, "global_step": 10573, "epoch": 251} {"train_loss": -5.06381893157959, "global_step": 10574, "epoch": 251} {"train_loss": -5.036012649536133, "global_step": 10575, "epoch": 251} {"train_loss": -4.950570106506348, "global_step": 10576, "epoch": 251} {"train_loss": -5.081982612609863, "global_step": 10577, "epoch": 251} {"train_loss": -4.979959487915039, "global_step": 10578, "epoch": 251} {"train_loss": -5.0873332023620605, "global_step": 10579, "epoch": 251} {"train_loss": -5.21181583404541, "global_step": 10580, "epoch": 251} {"train_loss": -5.118240833282471, "global_step": 10581, "epoch": 251} {"train_loss": -5.169053554534912, "global_step": 10582, "epoch": 251} {"train_loss": -5.0688588959830145, "global_step": 10583, "epoch": 251, "val_loss": 76755.1015625} {"train_loss": -5.14642858505249, "global_step": 10584, "epoch": 252} {"train_loss": -5.160182952880859, "global_step": 10585, "epoch": 252} {"train_loss": -5.052040100097656, "global_step": 10586, "epoch": 252} {"train_loss": -5.054939270019531, "global_step": 10587, "epoch": 252} {"train_loss": -5.004243850708008, "global_step": 10588, "epoch": 252} {"train_loss": -5.142946243286133, "global_step": 10589, "epoch": 252} {"train_loss": -5.109856605529785, "global_step": 10590, "epoch": 252} {"train_loss": -5.0895280838012695, "global_step": 10591, "epoch": 252} {"train_loss": -5.095271587371826, "global_step": 10592, "epoch": 252} {"train_loss": -5.147421836853027, "global_step": 10593, "epoch": 252} {"train_loss": -5.055349349975586, "global_step": 10594, "epoch": 252} {"train_loss": -4.956582069396973, "global_step": 10595, "epoch": 252} {"train_loss": -5.093585014343262, "global_step": 10596, "epoch": 252} {"train_loss": -4.81287145614624, "global_step": 10597, "epoch": 252} {"train_loss": -4.826342582702637, "global_step": 10598, "epoch": 252} {"train_loss": -5.191381931304932, "global_step": 10599, "epoch": 252} {"train_loss": -4.9379730224609375, "global_step": 10600, "epoch": 252} {"train_loss": -4.934655666351318, "global_step": 10601, "epoch": 252} {"train_loss": -5.06833553314209, "global_step": 10602, "epoch": 252} {"train_loss": -5.07735013961792, "global_step": 10603, "epoch": 252} {"train_loss": -5.123231410980225, "global_step": 10604, "epoch": 252} {"train_loss": -5.199898719787598, "global_step": 10605, "epoch": 252} {"train_loss": -5.056865692138672, "global_step": 10606, "epoch": 252} {"train_loss": -5.090747833251953, "global_step": 10607, "epoch": 252} {"train_loss": -5.064508438110352, "global_step": 10608, "epoch": 252} {"train_loss": -5.0086259841918945, "global_step": 10609, "epoch": 252} {"train_loss": -5.095686912536621, "global_step": 10610, "epoch": 252} {"train_loss": -5.021675109863281, "global_step": 10611, "epoch": 252} {"train_loss": -4.921220779418945, "global_step": 10612, "epoch": 252} {"train_loss": -5.0089111328125, "global_step": 10613, "epoch": 252} {"train_loss": -5.053449630737305, "global_step": 10614, "epoch": 252} {"train_loss": -5.052650451660156, "global_step": 10615, "epoch": 252} {"train_loss": -5.030035018920898, "global_step": 10616, "epoch": 252} {"train_loss": -5.106806755065918, "global_step": 10617, "epoch": 252} {"train_loss": -5.105838775634766, "global_step": 10618, "epoch": 252} {"train_loss": -5.098423480987549, "global_step": 10619, "epoch": 252} {"train_loss": -4.973588943481445, "global_step": 10620, "epoch": 252} {"train_loss": -5.175806045532227, "global_step": 10621, "epoch": 252} {"train_loss": -5.010371208190918, "global_step": 10622, "epoch": 252} {"train_loss": -4.946234226226807, "global_step": 10623, "epoch": 252} {"train_loss": -5.089033603668213, "global_step": 10624, "epoch": 252} {"train_loss": -5.057870388031006, "global_step": 10625, "epoch": 252, "val_loss": 76602.90625} {"train_loss": -5.034770965576172, "global_step": 10626, "epoch": 253} {"train_loss": -5.105940818786621, "global_step": 10627, "epoch": 253} {"train_loss": -5.03957462310791, "global_step": 10628, "epoch": 253} {"train_loss": -5.140867233276367, "global_step": 10629, "epoch": 253} {"train_loss": -5.070722579956055, "global_step": 10630, "epoch": 253} {"train_loss": -5.05974817276001, "global_step": 10631, "epoch": 253} {"train_loss": -5.201806545257568, "global_step": 10632, "epoch": 253} {"train_loss": -5.03193473815918, "global_step": 10633, "epoch": 253} {"train_loss": -5.053152084350586, "global_step": 10634, "epoch": 253} {"train_loss": -5.114954948425293, "global_step": 10635, "epoch": 253} {"train_loss": -5.037285804748535, "global_step": 10636, "epoch": 253} {"train_loss": -4.8411126136779785, "global_step": 10637, "epoch": 253} {"train_loss": -5.2306389808654785, "global_step": 10638, "epoch": 253} {"train_loss": -4.958574295043945, "global_step": 10639, "epoch": 253} {"train_loss": -5.055668830871582, "global_step": 10640, "epoch": 253} {"train_loss": -4.991001129150391, "global_step": 10641, "epoch": 253} {"train_loss": -5.047981262207031, "global_step": 10642, "epoch": 253} {"train_loss": -5.05895471572876, "global_step": 10643, "epoch": 253} {"train_loss": -5.1871747970581055, "global_step": 10644, "epoch": 253} {"train_loss": -5.019205570220947, "global_step": 10645, "epoch": 253} {"train_loss": -5.0984296798706055, "global_step": 10646, "epoch": 253} {"train_loss": -5.073077201843262, "global_step": 10647, "epoch": 253} {"train_loss": -4.9254374504089355, "global_step": 10648, "epoch": 253} {"train_loss": -5.069282054901123, "global_step": 10649, "epoch": 253} {"train_loss": -4.976011276245117, "global_step": 10650, "epoch": 253} {"train_loss": -4.84472131729126, "global_step": 10651, "epoch": 253} {"train_loss": -5.059185028076172, "global_step": 10652, "epoch": 253} {"train_loss": -4.860682964324951, "global_step": 10653, "epoch": 253} {"train_loss": -4.968783855438232, "global_step": 10654, "epoch": 253} {"train_loss": -4.882922172546387, "global_step": 10655, "epoch": 253} {"train_loss": -4.906044006347656, "global_step": 10656, "epoch": 253} {"train_loss": -4.947076797485352, "global_step": 10657, "epoch": 253} {"train_loss": -4.9770660400390625, "global_step": 10658, "epoch": 253} {"train_loss": -5.128058433532715, "global_step": 10659, "epoch": 253} {"train_loss": -5.1436767578125, "global_step": 10660, "epoch": 253} {"train_loss": -5.113766670227051, "global_step": 10661, "epoch": 253} {"train_loss": -5.020536422729492, "global_step": 10662, "epoch": 253} {"train_loss": -5.044618606567383, "global_step": 10663, "epoch": 253} {"train_loss": -5.034780502319336, "global_step": 10664, "epoch": 253} {"train_loss": -5.057040691375732, "global_step": 10665, "epoch": 253} {"train_loss": -5.057291030883789, "global_step": 10666, "epoch": 253} {"train_loss": -5.035723879223778, "global_step": 10667, "epoch": 253, "val_loss": 76376.2890625} {"train_loss": -5.091031551361084, "global_step": 10668, "epoch": 254} {"train_loss": -5.0431928634643555, "global_step": 10669, "epoch": 254} {"train_loss": -5.097809791564941, "global_step": 10670, "epoch": 254} {"train_loss": -4.916332244873047, "global_step": 10671, "epoch": 254} {"train_loss": -5.017226219177246, "global_step": 10672, "epoch": 254} {"train_loss": -5.045980453491211, "global_step": 10673, "epoch": 254} {"train_loss": -5.144797325134277, "global_step": 10674, "epoch": 254} {"train_loss": -4.957090854644775, "global_step": 10675, "epoch": 254} {"train_loss": -5.188611030578613, "global_step": 10676, "epoch": 254} {"train_loss": -5.001165390014648, "global_step": 10677, "epoch": 254} {"train_loss": -4.977672576904297, "global_step": 10678, "epoch": 254} {"train_loss": -5.050408363342285, "global_step": 10679, "epoch": 254} {"train_loss": -5.133058547973633, "global_step": 10680, "epoch": 254} {"train_loss": -4.9467926025390625, "global_step": 10681, "epoch": 254} {"train_loss": -4.990339279174805, "global_step": 10682, "epoch": 254} {"train_loss": -5.077171325683594, "global_step": 10683, "epoch": 254} {"train_loss": -5.075922012329102, "global_step": 10684, "epoch": 254} {"train_loss": -5.168733596801758, "global_step": 10685, "epoch": 254} {"train_loss": -5.1896653175354, "global_step": 10686, "epoch": 254} {"train_loss": -5.131799697875977, "global_step": 10687, "epoch": 254} {"train_loss": -5.129361152648926, "global_step": 10688, "epoch": 254} {"train_loss": -4.889918327331543, "global_step": 10689, "epoch": 254} {"train_loss": -4.96811580657959, "global_step": 10690, "epoch": 254} {"train_loss": -5.163012504577637, "global_step": 10691, "epoch": 254} {"train_loss": -5.1125922203063965, "global_step": 10692, "epoch": 254} {"train_loss": -5.030965805053711, "global_step": 10693, "epoch": 254} {"train_loss": -5.197298526763916, "global_step": 10694, "epoch": 254} {"train_loss": -5.146019458770752, "global_step": 10695, "epoch": 254} {"train_loss": -5.172754287719727, "global_step": 10696, "epoch": 254} {"train_loss": -5.1124467849731445, "global_step": 10697, "epoch": 254} {"train_loss": -5.260548114776611, "global_step": 10698, "epoch": 254} {"train_loss": -5.110783576965332, "global_step": 10699, "epoch": 254} {"train_loss": -5.145240783691406, "global_step": 10700, "epoch": 254} {"train_loss": -5.134145736694336, "global_step": 10701, "epoch": 254} {"train_loss": -5.047320365905762, "global_step": 10702, "epoch": 254} {"train_loss": -5.081805229187012, "global_step": 10703, "epoch": 254} {"train_loss": -5.051063537597656, "global_step": 10704, "epoch": 254} {"train_loss": -4.875608444213867, "global_step": 10705, "epoch": 254} {"train_loss": -5.135890007019043, "global_step": 10706, "epoch": 254} {"train_loss": -4.948539733886719, "global_step": 10707, "epoch": 254} {"train_loss": -5.022088050842285, "global_step": 10708, "epoch": 254} {"train_loss": -5.074894144421532, "global_step": 10709, "epoch": 254, "val_loss": 76659.9921875} {"train_loss": -5.132275581359863, "global_step": 10710, "epoch": 255} {"train_loss": -5.098711967468262, "global_step": 10711, "epoch": 255} {"train_loss": -5.154097557067871, "global_step": 10712, "epoch": 255} {"train_loss": -5.097033977508545, "global_step": 10713, "epoch": 255} {"train_loss": -5.075341701507568, "global_step": 10714, "epoch": 255} {"train_loss": -5.0659894943237305, "global_step": 10715, "epoch": 255} {"train_loss": -5.021110534667969, "global_step": 10716, "epoch": 255} {"train_loss": -5.107786178588867, "global_step": 10717, "epoch": 255} {"train_loss": -5.13673210144043, "global_step": 10718, "epoch": 255} {"train_loss": -5.005160808563232, "global_step": 10719, "epoch": 255} {"train_loss": -5.160839080810547, "global_step": 10720, "epoch": 255} {"train_loss": -5.319756507873535, "global_step": 10721, "epoch": 255} {"train_loss": -5.133293628692627, "global_step": 10722, "epoch": 255} {"train_loss": -5.042726516723633, "global_step": 10723, "epoch": 255} {"train_loss": -5.114557266235352, "global_step": 10724, "epoch": 255} {"train_loss": -5.070065498352051, "global_step": 10725, "epoch": 255} {"train_loss": -5.053001880645752, "global_step": 10726, "epoch": 255} {"train_loss": -5.198399066925049, "global_step": 10727, "epoch": 255} {"train_loss": -5.149928092956543, "global_step": 10728, "epoch": 255} {"train_loss": -5.061408042907715, "global_step": 10729, "epoch": 255} {"train_loss": -5.018638610839844, "global_step": 10730, "epoch": 255} {"train_loss": -5.128251075744629, "global_step": 10731, "epoch": 255} {"train_loss": -5.226865768432617, "global_step": 10732, "epoch": 255} {"train_loss": -5.178343772888184, "global_step": 10733, "epoch": 255} {"train_loss": -5.178752899169922, "global_step": 10734, "epoch": 255} {"train_loss": -5.132875919342041, "global_step": 10735, "epoch": 255} {"train_loss": -5.058476448059082, "global_step": 10736, "epoch": 255} {"train_loss": -5.2132039070129395, "global_step": 10737, "epoch": 255} {"train_loss": -5.115520000457764, "global_step": 10738, "epoch": 255} {"train_loss": -5.122652053833008, "global_step": 10739, "epoch": 255} {"train_loss": -5.0973591804504395, "global_step": 10740, "epoch": 255} {"train_loss": -4.957378387451172, "global_step": 10741, "epoch": 255} {"train_loss": -5.077941417694092, "global_step": 10742, "epoch": 255} {"train_loss": -5.018149375915527, "global_step": 10743, "epoch": 255} {"train_loss": -5.026811599731445, "global_step": 10744, "epoch": 255} {"train_loss": -4.924137592315674, "global_step": 10745, "epoch": 255} {"train_loss": -5.118878364562988, "global_step": 10746, "epoch": 255} {"train_loss": -5.004673004150391, "global_step": 10747, "epoch": 255} {"train_loss": -4.666666030883789, "global_step": 10748, "epoch": 255} {"train_loss": -4.943694114685059, "global_step": 10749, "epoch": 255} {"train_loss": -4.747798919677734, "global_step": 10750, "epoch": 255} {"train_loss": -5.073777516682942, "global_step": 10751, "epoch": 255, "val_loss": 76830.171875} {"train_loss": -5.008431911468506, "global_step": 10752, "epoch": 256} {"train_loss": -4.706284523010254, "global_step": 10753, "epoch": 256} {"train_loss": -5.016233444213867, "global_step": 10754, "epoch": 256} {"train_loss": -4.885611057281494, "global_step": 10755, "epoch": 256} {"train_loss": -5.035473823547363, "global_step": 10756, "epoch": 256} {"train_loss": -4.9788360595703125, "global_step": 10757, "epoch": 256} {"train_loss": -4.9590301513671875, "global_step": 10758, "epoch": 256} {"train_loss": -5.097127914428711, "global_step": 10759, "epoch": 256} {"train_loss": -5.003710746765137, "global_step": 10760, "epoch": 256} {"train_loss": -5.084969520568848, "global_step": 10761, "epoch": 256} {"train_loss": -5.011866569519043, "global_step": 10762, "epoch": 256} {"train_loss": -4.98604679107666, "global_step": 10763, "epoch": 256} {"train_loss": -5.000659942626953, "global_step": 10764, "epoch": 256} {"train_loss": -5.053676605224609, "global_step": 10765, "epoch": 256} {"train_loss": -4.952354431152344, "global_step": 10766, "epoch": 256} {"train_loss": -5.164233207702637, "global_step": 10767, "epoch": 256} {"train_loss": -5.220396995544434, "global_step": 10768, "epoch": 256} {"train_loss": -5.137944221496582, "global_step": 10769, "epoch": 256} {"train_loss": -5.125223159790039, "global_step": 10770, "epoch": 256} {"train_loss": -5.079701900482178, "global_step": 10771, "epoch": 256} {"train_loss": -5.004088401794434, "global_step": 10772, "epoch": 256} {"train_loss": -5.07054328918457, "global_step": 10773, "epoch": 256} {"train_loss": -5.244870185852051, "global_step": 10774, "epoch": 256} {"train_loss": -5.006280422210693, "global_step": 10775, "epoch": 256} {"train_loss": -5.204390048980713, "global_step": 10776, "epoch": 256} {"train_loss": -5.047725677490234, "global_step": 10777, "epoch": 256} {"train_loss": -5.14100980758667, "global_step": 10778, "epoch": 256} {"train_loss": -5.020864486694336, "global_step": 10779, "epoch": 256} {"train_loss": -5.054547309875488, "global_step": 10780, "epoch": 256} {"train_loss": -5.06461763381958, "global_step": 10781, "epoch": 256} {"train_loss": -5.211594581604004, "global_step": 10782, "epoch": 256} {"train_loss": -5.1873555183410645, "global_step": 10783, "epoch": 256} {"train_loss": -4.999606132507324, "global_step": 10784, "epoch": 256} {"train_loss": -5.012426376342773, "global_step": 10785, "epoch": 256} {"train_loss": -5.157808780670166, "global_step": 10786, "epoch": 256} {"train_loss": -4.991552352905273, "global_step": 10787, "epoch": 256} {"train_loss": -4.9639387130737305, "global_step": 10788, "epoch": 256} {"train_loss": -5.065016746520996, "global_step": 10789, "epoch": 256} {"train_loss": -5.082326889038086, "global_step": 10790, "epoch": 256} {"train_loss": -4.960812091827393, "global_step": 10791, "epoch": 256} {"train_loss": -5.080705642700195, "global_step": 10792, "epoch": 256} {"train_loss": -5.052105676560175, "global_step": 10793, "epoch": 256, "val_loss": 76551.515625} {"train_loss": -4.984827995300293, "global_step": 10794, "epoch": 257} {"train_loss": -5.0849714279174805, "global_step": 10795, "epoch": 257} {"train_loss": -5.075538635253906, "global_step": 10796, "epoch": 257} {"train_loss": -5.114565372467041, "global_step": 10797, "epoch": 257} {"train_loss": -5.129784107208252, "global_step": 10798, "epoch": 257} {"train_loss": -5.2231597900390625, "global_step": 10799, "epoch": 257} {"train_loss": -5.022409439086914, "global_step": 10800, "epoch": 257} {"train_loss": -4.9946441650390625, "global_step": 10801, "epoch": 257} {"train_loss": -5.190601348876953, "global_step": 10802, "epoch": 257} {"train_loss": -5.037432670593262, "global_step": 10803, "epoch": 257} {"train_loss": -5.093427658081055, "global_step": 10804, "epoch": 257} {"train_loss": -4.9620208740234375, "global_step": 10805, "epoch": 257} {"train_loss": -5.116669654846191, "global_step": 10806, "epoch": 257} {"train_loss": -5.051977634429932, "global_step": 10807, "epoch": 257} {"train_loss": -5.014910697937012, "global_step": 10808, "epoch": 257} {"train_loss": -4.9836320877075195, "global_step": 10809, "epoch": 257} {"train_loss": -5.31452751159668, "global_step": 10810, "epoch": 257} {"train_loss": -5.0188069343566895, "global_step": 10811, "epoch": 257} {"train_loss": -5.088762283325195, "global_step": 10812, "epoch": 257} {"train_loss": -5.209051609039307, "global_step": 10813, "epoch": 257} {"train_loss": -5.069189071655273, "global_step": 10814, "epoch": 257} {"train_loss": -4.986237049102783, "global_step": 10815, "epoch": 257} {"train_loss": -5.2182793617248535, "global_step": 10816, "epoch": 257} {"train_loss": -5.039411544799805, "global_step": 10817, "epoch": 257} {"train_loss": -5.099714756011963, "global_step": 10818, "epoch": 257} {"train_loss": -5.115130424499512, "global_step": 10819, "epoch": 257} {"train_loss": -5.129382133483887, "global_step": 10820, "epoch": 257} {"train_loss": -5.192355155944824, "global_step": 10821, "epoch": 257} {"train_loss": -5.226439476013184, "global_step": 10822, "epoch": 257} {"train_loss": -5.073102951049805, "global_step": 10823, "epoch": 257} {"train_loss": -5.178964138031006, "global_step": 10824, "epoch": 257} {"train_loss": -5.160125255584717, "global_step": 10825, "epoch": 257} {"train_loss": -5.162185192108154, "global_step": 10826, "epoch": 257} {"train_loss": -5.105504035949707, "global_step": 10827, "epoch": 257} {"train_loss": -5.085633277893066, "global_step": 10828, "epoch": 257} {"train_loss": -5.171792030334473, "global_step": 10829, "epoch": 257} {"train_loss": -5.055986404418945, "global_step": 10830, "epoch": 257} {"train_loss": -5.156425952911377, "global_step": 10831, "epoch": 257} {"train_loss": -5.168303489685059, "global_step": 10832, "epoch": 257} {"train_loss": -5.037051677703857, "global_step": 10833, "epoch": 257} {"train_loss": -5.265902996063232, "global_step": 10834, "epoch": 257} {"train_loss": -5.106946661358788, "global_step": 10835, "epoch": 257, "val_loss": 76471.53125} {"train_loss": -5.135724067687988, "global_step": 10836, "epoch": 258} {"train_loss": -4.979606628417969, "global_step": 10837, "epoch": 258} {"train_loss": -5.112616539001465, "global_step": 10838, "epoch": 258} {"train_loss": -4.969829559326172, "global_step": 10839, "epoch": 258} {"train_loss": -5.027172088623047, "global_step": 10840, "epoch": 258} {"train_loss": -5.152784824371338, "global_step": 10841, "epoch": 258} {"train_loss": -5.023800849914551, "global_step": 10842, "epoch": 258} {"train_loss": -5.269858360290527, "global_step": 10843, "epoch": 258} {"train_loss": -5.081882476806641, "global_step": 10844, "epoch": 258} {"train_loss": -5.182162284851074, "global_step": 10845, "epoch": 258} {"train_loss": -5.171389579772949, "global_step": 10846, "epoch": 258} {"train_loss": -5.188837051391602, "global_step": 10847, "epoch": 258} {"train_loss": -4.965297698974609, "global_step": 10848, "epoch": 258} {"train_loss": -4.942181587219238, "global_step": 10849, "epoch": 258} {"train_loss": -5.213171005249023, "global_step": 10850, "epoch": 258} {"train_loss": -4.9235076904296875, "global_step": 10851, "epoch": 258} {"train_loss": -5.112883567810059, "global_step": 10852, "epoch": 258} {"train_loss": -5.112261772155762, "global_step": 10853, "epoch": 258} {"train_loss": -5.224621772766113, "global_step": 10854, "epoch": 258} {"train_loss": -5.074901580810547, "global_step": 10855, "epoch": 258} {"train_loss": -5.231174468994141, "global_step": 10856, "epoch": 258} {"train_loss": -5.045387268066406, "global_step": 10857, "epoch": 258} {"train_loss": -4.978999137878418, "global_step": 10858, "epoch": 258} {"train_loss": -5.11447286605835, "global_step": 10859, "epoch": 258} {"train_loss": -5.155020236968994, "global_step": 10860, "epoch": 258} {"train_loss": -4.944761276245117, "global_step": 10861, "epoch": 258} {"train_loss": -5.2396016120910645, "global_step": 10862, "epoch": 258} {"train_loss": -5.140291213989258, "global_step": 10863, "epoch": 258} {"train_loss": -5.182394027709961, "global_step": 10864, "epoch": 258} {"train_loss": -4.959631443023682, "global_step": 10865, "epoch": 258} {"train_loss": -5.163654804229736, "global_step": 10866, "epoch": 258} {"train_loss": -5.174774169921875, "global_step": 10867, "epoch": 258} {"train_loss": -5.025773048400879, "global_step": 10868, "epoch": 258} {"train_loss": -5.16146183013916, "global_step": 10869, "epoch": 258} {"train_loss": -5.167070388793945, "global_step": 10870, "epoch": 258} {"train_loss": -5.007305145263672, "global_step": 10871, "epoch": 258} {"train_loss": -4.8645734786987305, "global_step": 10872, "epoch": 258} {"train_loss": -4.997419357299805, "global_step": 10873, "epoch": 258} {"train_loss": -4.909500598907471, "global_step": 10874, "epoch": 258} {"train_loss": -5.0946221351623535, "global_step": 10875, "epoch": 258} {"train_loss": -5.141327857971191, "global_step": 10876, "epoch": 258} {"train_loss": -5.083237625303722, "global_step": 10877, "epoch": 258, "val_loss": 76267.2421875} {"train_loss": -5.1721696853637695, "global_step": 10878, "epoch": 259} {"train_loss": -4.976951599121094, "global_step": 10879, "epoch": 259} {"train_loss": -5.116243362426758, "global_step": 10880, "epoch": 259} {"train_loss": -5.126150608062744, "global_step": 10881, "epoch": 259} {"train_loss": -5.148623466491699, "global_step": 10882, "epoch": 259} {"train_loss": -5.093667030334473, "global_step": 10883, "epoch": 259} {"train_loss": -5.025216102600098, "global_step": 10884, "epoch": 259} {"train_loss": -5.303662300109863, "global_step": 10885, "epoch": 259} {"train_loss": -5.09035587310791, "global_step": 10886, "epoch": 259} {"train_loss": -5.142053604125977, "global_step": 10887, "epoch": 259} {"train_loss": -5.02984094619751, "global_step": 10888, "epoch": 259} {"train_loss": -5.256527900695801, "global_step": 10889, "epoch": 259} {"train_loss": -5.141594886779785, "global_step": 10890, "epoch": 259} {"train_loss": -4.992475509643555, "global_step": 10891, "epoch": 259} {"train_loss": -5.090328693389893, "global_step": 10892, "epoch": 259} {"train_loss": -5.085813045501709, "global_step": 10893, "epoch": 259} {"train_loss": -5.113615036010742, "global_step": 10894, "epoch": 259} {"train_loss": -5.176474094390869, "global_step": 10895, "epoch": 259} {"train_loss": -4.93928337097168, "global_step": 10896, "epoch": 259} {"train_loss": -5.1907219886779785, "global_step": 10897, "epoch": 259} {"train_loss": -5.166438102722168, "global_step": 10898, "epoch": 259} {"train_loss": -5.138762474060059, "global_step": 10899, "epoch": 259} {"train_loss": -5.1334381103515625, "global_step": 10900, "epoch": 259} {"train_loss": -5.106083393096924, "global_step": 10901, "epoch": 259} {"train_loss": -5.17057991027832, "global_step": 10902, "epoch": 259} {"train_loss": -5.235034465789795, "global_step": 10903, "epoch": 259} {"train_loss": -5.153870582580566, "global_step": 10904, "epoch": 259} {"train_loss": -5.082493782043457, "global_step": 10905, "epoch": 259} {"train_loss": -5.126397609710693, "global_step": 10906, "epoch": 259} {"train_loss": -5.096231937408447, "global_step": 10907, "epoch": 259} {"train_loss": -5.214412689208984, "global_step": 10908, "epoch": 259} {"train_loss": -5.167231559753418, "global_step": 10909, "epoch": 259} {"train_loss": -5.146904945373535, "global_step": 10910, "epoch": 259} {"train_loss": -4.998530387878418, "global_step": 10911, "epoch": 259} {"train_loss": -5.002110004425049, "global_step": 10912, "epoch": 259} {"train_loss": -4.9725542068481445, "global_step": 10913, "epoch": 259} {"train_loss": -5.061739921569824, "global_step": 10914, "epoch": 259} {"train_loss": -5.102063179016113, "global_step": 10915, "epoch": 259} {"train_loss": -5.106539726257324, "global_step": 10916, "epoch": 259} {"train_loss": -5.070640563964844, "global_step": 10917, "epoch": 259} {"train_loss": -5.143697261810303, "global_step": 10918, "epoch": 259} {"train_loss": -5.1105319658915205, "global_step": 10919, "epoch": 259, "val_loss": 76216.3125} {"train_loss": -5.1527791023254395, "global_step": 10920, "epoch": 260} {"train_loss": -5.162710189819336, "global_step": 10921, "epoch": 260} {"train_loss": -5.032863616943359, "global_step": 10922, "epoch": 260} {"train_loss": -5.086501598358154, "global_step": 10923, "epoch": 260} {"train_loss": -5.018210411071777, "global_step": 10924, "epoch": 260} {"train_loss": -5.153755187988281, "global_step": 10925, "epoch": 260} {"train_loss": -5.141226768493652, "global_step": 10926, "epoch": 260} {"train_loss": -5.080846786499023, "global_step": 10927, "epoch": 260} {"train_loss": -4.998634338378906, "global_step": 10928, "epoch": 260} {"train_loss": -5.193676948547363, "global_step": 10929, "epoch": 260} {"train_loss": -5.017044544219971, "global_step": 10930, "epoch": 260} {"train_loss": -4.916928291320801, "global_step": 10931, "epoch": 260} {"train_loss": -5.151915550231934, "global_step": 10932, "epoch": 260} {"train_loss": -4.87867546081543, "global_step": 10933, "epoch": 260} {"train_loss": -4.834867477416992, "global_step": 10934, "epoch": 260} {"train_loss": -4.892946243286133, "global_step": 10935, "epoch": 260} {"train_loss": -4.945143699645996, "global_step": 10936, "epoch": 260} {"train_loss": -5.027755260467529, "global_step": 10937, "epoch": 260} {"train_loss": -4.8292083740234375, "global_step": 10938, "epoch": 260} {"train_loss": -5.123814582824707, "global_step": 10939, "epoch": 260} {"train_loss": -4.792437553405762, "global_step": 10940, "epoch": 260} {"train_loss": -5.181381702423096, "global_step": 10941, "epoch": 260} {"train_loss": -5.018343925476074, "global_step": 10942, "epoch": 260} {"train_loss": -4.900119304656982, "global_step": 10943, "epoch": 260} {"train_loss": -5.085827827453613, "global_step": 10944, "epoch": 260} {"train_loss": -4.932211875915527, "global_step": 10945, "epoch": 260} {"train_loss": -5.203585624694824, "global_step": 10946, "epoch": 260} {"train_loss": -5.0015716552734375, "global_step": 10947, "epoch": 260} {"train_loss": -4.986714839935303, "global_step": 10948, "epoch": 260} {"train_loss": -5.065098762512207, "global_step": 10949, "epoch": 260} {"train_loss": -4.847229480743408, "global_step": 10950, "epoch": 260} {"train_loss": -5.062009811401367, "global_step": 10951, "epoch": 260} {"train_loss": -5.163247585296631, "global_step": 10952, "epoch": 260} {"train_loss": -5.030230522155762, "global_step": 10953, "epoch": 260} {"train_loss": -5.083300590515137, "global_step": 10954, "epoch": 260} {"train_loss": -5.015598297119141, "global_step": 10955, "epoch": 260} {"train_loss": -5.130169868469238, "global_step": 10956, "epoch": 260} {"train_loss": -4.963862419128418, "global_step": 10957, "epoch": 260} {"train_loss": -5.06367301940918, "global_step": 10958, "epoch": 260} {"train_loss": -5.226250648498535, "global_step": 10959, "epoch": 260} {"train_loss": -5.2677717208862305, "global_step": 10960, "epoch": 260} {"train_loss": -5.041992232913063, "global_step": 10961, "epoch": 260, "val_loss": 76221.2578125} {"train_loss": -5.117270469665527, "global_step": 10962, "epoch": 261} {"train_loss": -5.199254989624023, "global_step": 10963, "epoch": 261} {"train_loss": -4.962253570556641, "global_step": 10964, "epoch": 261} {"train_loss": -4.9702043533325195, "global_step": 10965, "epoch": 261} {"train_loss": -5.15083122253418, "global_step": 10966, "epoch": 261} {"train_loss": -5.09464168548584, "global_step": 10967, "epoch": 261} {"train_loss": -5.044987201690674, "global_step": 10968, "epoch": 261} {"train_loss": -5.071362495422363, "global_step": 10969, "epoch": 261} {"train_loss": -5.176201820373535, "global_step": 10970, "epoch": 261} {"train_loss": -5.01568078994751, "global_step": 10971, "epoch": 261} {"train_loss": -5.060790538787842, "global_step": 10972, "epoch": 261} {"train_loss": -5.102409839630127, "global_step": 10973, "epoch": 261} {"train_loss": -5.155311584472656, "global_step": 10974, "epoch": 261} {"train_loss": -5.117224216461182, "global_step": 10975, "epoch": 261} {"train_loss": -5.095815658569336, "global_step": 10976, "epoch": 261} {"train_loss": -5.094554901123047, "global_step": 10977, "epoch": 261} {"train_loss": -5.110978126525879, "global_step": 10978, "epoch": 261} {"train_loss": -5.250245571136475, "global_step": 10979, "epoch": 261} {"train_loss": -5.049612045288086, "global_step": 10980, "epoch": 261} {"train_loss": -5.118315696716309, "global_step": 10981, "epoch": 261} {"train_loss": -5.142622470855713, "global_step": 10982, "epoch": 261} {"train_loss": -4.939356327056885, "global_step": 10983, "epoch": 261} {"train_loss": -5.22606086730957, "global_step": 10984, "epoch": 261} {"train_loss": -5.181999206542969, "global_step": 10985, "epoch": 261} {"train_loss": -4.985771656036377, "global_step": 10986, "epoch": 261} {"train_loss": -5.000879764556885, "global_step": 10987, "epoch": 261} {"train_loss": -5.039411544799805, "global_step": 10988, "epoch": 261} {"train_loss": -5.105804920196533, "global_step": 10989, "epoch": 261} {"train_loss": -4.910585403442383, "global_step": 10990, "epoch": 261} {"train_loss": -5.231998443603516, "global_step": 10991, "epoch": 261} {"train_loss": -5.082644939422607, "global_step": 10992, "epoch": 261} {"train_loss": -5.092903137207031, "global_step": 10993, "epoch": 261} {"train_loss": -4.8954596519470215, "global_step": 10994, "epoch": 261} {"train_loss": -5.060821533203125, "global_step": 10995, "epoch": 261} {"train_loss": -5.052276134490967, "global_step": 10996, "epoch": 261} {"train_loss": -5.086504936218262, "global_step": 10997, "epoch": 261} {"train_loss": -5.047406196594238, "global_step": 10998, "epoch": 261} {"train_loss": -5.125171184539795, "global_step": 10999, "epoch": 261} {"train_loss": -5.0401434898376465, "global_step": 11000, "epoch": 261} {"train_loss": -5.09990119934082, "global_step": 11001, "epoch": 261} {"train_loss": -5.054522514343262, "global_step": 11002, "epoch": 261} {"train_loss": -5.081243106297085, "global_step": 11003, "epoch": 261, "val_loss": 75359.1953125} {"train_loss": -5.058496952056885, "global_step": 11004, "epoch": 262} {"train_loss": -5.26653528213501, "global_step": 11005, "epoch": 262} {"train_loss": -5.200216293334961, "global_step": 11006, "epoch": 262} {"train_loss": -5.230648994445801, "global_step": 11007, "epoch": 262} {"train_loss": -5.083307266235352, "global_step": 11008, "epoch": 262} {"train_loss": -5.184192657470703, "global_step": 11009, "epoch": 262} {"train_loss": -5.169943809509277, "global_step": 11010, "epoch": 262} {"train_loss": -5.055750846862793, "global_step": 11011, "epoch": 262} {"train_loss": -5.066339492797852, "global_step": 11012, "epoch": 262} {"train_loss": -5.145688056945801, "global_step": 11013, "epoch": 262} {"train_loss": -5.186434745788574, "global_step": 11014, "epoch": 262} {"train_loss": -5.179173469543457, "global_step": 11015, "epoch": 262} {"train_loss": -4.9815897941589355, "global_step": 11016, "epoch": 262} {"train_loss": -5.093033790588379, "global_step": 11017, "epoch": 262} {"train_loss": -5.254814147949219, "global_step": 11018, "epoch": 262} {"train_loss": -5.1784563064575195, "global_step": 11019, "epoch": 262} {"train_loss": -4.84548282623291, "global_step": 11020, "epoch": 262} {"train_loss": -5.194761276245117, "global_step": 11021, "epoch": 262} {"train_loss": -4.888882637023926, "global_step": 11022, "epoch": 262} {"train_loss": -5.038081169128418, "global_step": 11023, "epoch": 262} {"train_loss": -4.937168598175049, "global_step": 11024, "epoch": 262} {"train_loss": -4.944954872131348, "global_step": 11025, "epoch": 262} {"train_loss": -4.973075866699219, "global_step": 11026, "epoch": 262} {"train_loss": -4.875627517700195, "global_step": 11027, "epoch": 262} {"train_loss": -4.8974103927612305, "global_step": 11028, "epoch": 262} {"train_loss": -5.119357585906982, "global_step": 11029, "epoch": 262} {"train_loss": -5.042449951171875, "global_step": 11030, "epoch": 262} {"train_loss": -4.960897445678711, "global_step": 11031, "epoch": 262} {"train_loss": -5.1563496589660645, "global_step": 11032, "epoch": 262} {"train_loss": -5.002668380737305, "global_step": 11033, "epoch": 262} {"train_loss": -5.054388046264648, "global_step": 11034, "epoch": 262} {"train_loss": -4.903438091278076, "global_step": 11035, "epoch": 262} {"train_loss": -5.007320404052734, "global_step": 11036, "epoch": 262} {"train_loss": -5.199751853942871, "global_step": 11037, "epoch": 262} {"train_loss": -4.933053016662598, "global_step": 11038, "epoch": 262} {"train_loss": -5.154906272888184, "global_step": 11039, "epoch": 262} {"train_loss": -5.027890205383301, "global_step": 11040, "epoch": 262} {"train_loss": -5.060082912445068, "global_step": 11041, "epoch": 262} {"train_loss": -5.012497901916504, "global_step": 11042, "epoch": 262} {"train_loss": -4.972253799438477, "global_step": 11043, "epoch": 262} {"train_loss": -5.205399990081787, "global_step": 11044, "epoch": 262} {"train_loss": -5.067454769497826, "global_step": 11045, "epoch": 262, "val_loss": 75789.9140625} {"train_loss": -5.087337017059326, "global_step": 11046, "epoch": 263} {"train_loss": -5.139272212982178, "global_step": 11047, "epoch": 263} {"train_loss": -4.939394474029541, "global_step": 11048, "epoch": 263} {"train_loss": -5.16292667388916, "global_step": 11049, "epoch": 263} {"train_loss": -4.986167907714844, "global_step": 11050, "epoch": 263} {"train_loss": -5.157085418701172, "global_step": 11051, "epoch": 263} {"train_loss": -5.114405632019043, "global_step": 11052, "epoch": 263} {"train_loss": -5.157269477844238, "global_step": 11053, "epoch": 263} {"train_loss": -5.091410160064697, "global_step": 11054, "epoch": 263} {"train_loss": -5.075360298156738, "global_step": 11055, "epoch": 263} {"train_loss": -5.205390930175781, "global_step": 11056, "epoch": 263} {"train_loss": -5.226553916931152, "global_step": 11057, "epoch": 263} {"train_loss": -5.208205223083496, "global_step": 11058, "epoch": 263} {"train_loss": -5.121248245239258, "global_step": 11059, "epoch": 263} {"train_loss": -5.059624195098877, "global_step": 11060, "epoch": 263} {"train_loss": -5.155725479125977, "global_step": 11061, "epoch": 263} {"train_loss": -5.189984321594238, "global_step": 11062, "epoch": 263} {"train_loss": -5.130188941955566, "global_step": 11063, "epoch": 263} {"train_loss": -5.013269424438477, "global_step": 11064, "epoch": 263} {"train_loss": -5.101262092590332, "global_step": 11065, "epoch": 263} {"train_loss": -5.211105823516846, "global_step": 11066, "epoch": 263} {"train_loss": -5.121297836303711, "global_step": 11067, "epoch": 263} {"train_loss": -5.040635585784912, "global_step": 11068, "epoch": 263} {"train_loss": -5.039445877075195, "global_step": 11069, "epoch": 263} {"train_loss": -5.088772296905518, "global_step": 11070, "epoch": 263} {"train_loss": -5.051346778869629, "global_step": 11071, "epoch": 263} {"train_loss": -5.0501837730407715, "global_step": 11072, "epoch": 263} {"train_loss": -4.978728294372559, "global_step": 11073, "epoch": 263} {"train_loss": -5.083171844482422, "global_step": 11074, "epoch": 263} {"train_loss": -5.0359625816345215, "global_step": 11075, "epoch": 263} {"train_loss": -4.993186950683594, "global_step": 11076, "epoch": 263} {"train_loss": -5.1407575607299805, "global_step": 11077, "epoch": 263} {"train_loss": -5.051485061645508, "global_step": 11078, "epoch": 263} {"train_loss": -5.166258811950684, "global_step": 11079, "epoch": 263} {"train_loss": -5.014115810394287, "global_step": 11080, "epoch": 263} {"train_loss": -5.02017068862915, "global_step": 11081, "epoch": 263} {"train_loss": -4.984294891357422, "global_step": 11082, "epoch": 263} {"train_loss": -5.078192710876465, "global_step": 11083, "epoch": 263} {"train_loss": -5.126072883605957, "global_step": 11084, "epoch": 263} {"train_loss": -4.984559059143066, "global_step": 11085, "epoch": 263} {"train_loss": -4.997794151306152, "global_step": 11086, "epoch": 263} {"train_loss": -5.082955871309553, "global_step": 11087, "epoch": 263, "val_loss": 75953.9375} {"train_loss": -4.962338447570801, "global_step": 11088, "epoch": 264} {"train_loss": -5.127367973327637, "global_step": 11089, "epoch": 264} {"train_loss": -4.909402370452881, "global_step": 11090, "epoch": 264} {"train_loss": -5.022760391235352, "global_step": 11091, "epoch": 264} {"train_loss": -5.17354154586792, "global_step": 11092, "epoch": 264} {"train_loss": -5.041563987731934, "global_step": 11093, "epoch": 264} {"train_loss": -5.235678672790527, "global_step": 11094, "epoch": 264} {"train_loss": -4.99455451965332, "global_step": 11095, "epoch": 264} {"train_loss": -5.073334693908691, "global_step": 11096, "epoch": 264} {"train_loss": -5.031368732452393, "global_step": 11097, "epoch": 264} {"train_loss": -5.025343894958496, "global_step": 11098, "epoch": 264} {"train_loss": -5.06149959564209, "global_step": 11099, "epoch": 264} {"train_loss": -4.887749195098877, "global_step": 11100, "epoch": 264} {"train_loss": -5.087948799133301, "global_step": 11101, "epoch": 264} {"train_loss": -5.122656345367432, "global_step": 11102, "epoch": 264} {"train_loss": -5.22007942199707, "global_step": 11103, "epoch": 264} {"train_loss": -5.245298385620117, "global_step": 11104, "epoch": 264} {"train_loss": -5.228614807128906, "global_step": 11105, "epoch": 264} {"train_loss": -4.999240875244141, "global_step": 11106, "epoch": 264} {"train_loss": -5.083410263061523, "global_step": 11107, "epoch": 264} {"train_loss": -5.182251453399658, "global_step": 11108, "epoch": 264} {"train_loss": -5.143004894256592, "global_step": 11109, "epoch": 264} {"train_loss": -5.176565170288086, "global_step": 11110, "epoch": 264} {"train_loss": -5.090648174285889, "global_step": 11111, "epoch": 264} {"train_loss": -5.259641647338867, "global_step": 11112, "epoch": 264} {"train_loss": -5.233613014221191, "global_step": 11113, "epoch": 264} {"train_loss": -5.236819267272949, "global_step": 11114, "epoch": 264} {"train_loss": -5.056168079376221, "global_step": 11115, "epoch": 264} {"train_loss": -5.295335292816162, "global_step": 11116, "epoch": 264} {"train_loss": -5.111114501953125, "global_step": 11117, "epoch": 264} {"train_loss": -5.034019947052002, "global_step": 11118, "epoch": 264} {"train_loss": -5.088665008544922, "global_step": 11119, "epoch": 264} {"train_loss": -4.975094795227051, "global_step": 11120, "epoch": 264} {"train_loss": -5.109118938446045, "global_step": 11121, "epoch": 264} {"train_loss": -5.157240867614746, "global_step": 11122, "epoch": 264} {"train_loss": -5.133050918579102, "global_step": 11123, "epoch": 264} {"train_loss": -4.906374931335449, "global_step": 11124, "epoch": 264} {"train_loss": -5.0925679206848145, "global_step": 11125, "epoch": 264} {"train_loss": -4.956323623657227, "global_step": 11126, "epoch": 264} {"train_loss": -4.810792922973633, "global_step": 11127, "epoch": 264} {"train_loss": -4.9836015701293945, "global_step": 11128, "epoch": 264} {"train_loss": -5.088293291273571, "global_step": 11129, "epoch": 264, "val_loss": 78330.7265625} {"train_loss": -4.934788227081299, "global_step": 11130, "epoch": 265} {"train_loss": -4.98809814453125, "global_step": 11131, "epoch": 265} {"train_loss": -5.039957523345947, "global_step": 11132, "epoch": 265} {"train_loss": -4.976508140563965, "global_step": 11133, "epoch": 265} {"train_loss": -5.096079349517822, "global_step": 11134, "epoch": 265} {"train_loss": -4.963448524475098, "global_step": 11135, "epoch": 265} {"train_loss": -5.093069076538086, "global_step": 11136, "epoch": 265} {"train_loss": -5.171817779541016, "global_step": 11137, "epoch": 265} {"train_loss": -5.187979698181152, "global_step": 11138, "epoch": 265} {"train_loss": -5.157742023468018, "global_step": 11139, "epoch": 265} {"train_loss": -5.084003925323486, "global_step": 11140, "epoch": 265} {"train_loss": -5.124745845794678, "global_step": 11141, "epoch": 265} {"train_loss": -5.1181793212890625, "global_step": 11142, "epoch": 265} {"train_loss": -5.080772399902344, "global_step": 11143, "epoch": 265} {"train_loss": -5.139636516571045, "global_step": 11144, "epoch": 265} {"train_loss": -5.035261154174805, "global_step": 11145, "epoch": 265} {"train_loss": -5.214893341064453, "global_step": 11146, "epoch": 265} {"train_loss": -5.215033531188965, "global_step": 11147, "epoch": 265} {"train_loss": -5.0286664962768555, "global_step": 11148, "epoch": 265} {"train_loss": -5.077297687530518, "global_step": 11149, "epoch": 265} {"train_loss": -5.07393217086792, "global_step": 11150, "epoch": 265} {"train_loss": -5.165026664733887, "global_step": 11151, "epoch": 265} {"train_loss": -5.076131820678711, "global_step": 11152, "epoch": 265} {"train_loss": -5.086521148681641, "global_step": 11153, "epoch": 265} {"train_loss": -5.03550910949707, "global_step": 11154, "epoch": 265} {"train_loss": -5.084906578063965, "global_step": 11155, "epoch": 265} {"train_loss": -5.136704444885254, "global_step": 11156, "epoch": 265} {"train_loss": -5.146331787109375, "global_step": 11157, "epoch": 265} {"train_loss": -5.0230712890625, "global_step": 11158, "epoch": 265} {"train_loss": -5.237196922302246, "global_step": 11159, "epoch": 265} {"train_loss": -5.049821853637695, "global_step": 11160, "epoch": 265} {"train_loss": -5.108777046203613, "global_step": 11161, "epoch": 265} {"train_loss": -5.209855556488037, "global_step": 11162, "epoch": 265} {"train_loss": -5.0508575439453125, "global_step": 11163, "epoch": 265} {"train_loss": -5.101223945617676, "global_step": 11164, "epoch": 265} {"train_loss": -5.056832313537598, "global_step": 11165, "epoch": 265} {"train_loss": -5.148099422454834, "global_step": 11166, "epoch": 265} {"train_loss": -5.042570114135742, "global_step": 11167, "epoch": 265} {"train_loss": -5.186668872833252, "global_step": 11168, "epoch": 265} {"train_loss": -5.133742332458496, "global_step": 11169, "epoch": 265} {"train_loss": -5.184915542602539, "global_step": 11170, "epoch": 265} {"train_loss": -5.102791820253644, "global_step": 11171, "epoch": 265, "val_loss": 75188.3671875} {"train_loss": -5.075867652893066, "global_step": 11172, "epoch": 266} {"train_loss": -5.060805320739746, "global_step": 11173, "epoch": 266} {"train_loss": -4.975006103515625, "global_step": 11174, "epoch": 266} {"train_loss": -5.174653053283691, "global_step": 11175, "epoch": 266} {"train_loss": -5.219577312469482, "global_step": 11176, "epoch": 266} {"train_loss": -5.219771862030029, "global_step": 11177, "epoch": 266} {"train_loss": -5.155185222625732, "global_step": 11178, "epoch": 266} {"train_loss": -5.063074111938477, "global_step": 11179, "epoch": 266} {"train_loss": -5.169403553009033, "global_step": 11180, "epoch": 266} {"train_loss": -5.067232608795166, "global_step": 11181, "epoch": 266} {"train_loss": -5.225495338439941, "global_step": 11182, "epoch": 266} {"train_loss": -5.1134257316589355, "global_step": 11183, "epoch": 266} {"train_loss": -4.949120998382568, "global_step": 11184, "epoch": 266} {"train_loss": -5.126007556915283, "global_step": 11185, "epoch": 266} {"train_loss": -5.1730499267578125, "global_step": 11186, "epoch": 266} {"train_loss": -5.153992652893066, "global_step": 11187, "epoch": 266} {"train_loss": -5.119134902954102, "global_step": 11188, "epoch": 266} {"train_loss": -5.220270156860352, "global_step": 11189, "epoch": 266} {"train_loss": -5.119263648986816, "global_step": 11190, "epoch": 266} {"train_loss": -5.10441780090332, "global_step": 11191, "epoch": 266} {"train_loss": -5.025184631347656, "global_step": 11192, "epoch": 266} {"train_loss": -5.154213905334473, "global_step": 11193, "epoch": 266} {"train_loss": -5.037487030029297, "global_step": 11194, "epoch": 266} {"train_loss": -5.129215240478516, "global_step": 11195, "epoch": 266} {"train_loss": -5.07357931137085, "global_step": 11196, "epoch": 266} {"train_loss": -5.190209865570068, "global_step": 11197, "epoch": 266} {"train_loss": -5.0727081298828125, "global_step": 11198, "epoch": 266} {"train_loss": -5.088099002838135, "global_step": 11199, "epoch": 266} {"train_loss": -5.11801815032959, "global_step": 11200, "epoch": 266} {"train_loss": -5.115195274353027, "global_step": 11201, "epoch": 266} {"train_loss": -5.053722858428955, "global_step": 11202, "epoch": 266} {"train_loss": -5.122753143310547, "global_step": 11203, "epoch": 266} {"train_loss": -5.078895568847656, "global_step": 11204, "epoch": 266} {"train_loss": -5.022245407104492, "global_step": 11205, "epoch": 266} {"train_loss": -5.167746067047119, "global_step": 11206, "epoch": 266} {"train_loss": -5.150842666625977, "global_step": 11207, "epoch": 266} {"train_loss": -5.08114767074585, "global_step": 11208, "epoch": 266} {"train_loss": -5.120396614074707, "global_step": 11209, "epoch": 266} {"train_loss": -5.204044342041016, "global_step": 11210, "epoch": 266} {"train_loss": -4.996082305908203, "global_step": 11211, "epoch": 266} {"train_loss": -4.9777116775512695, "global_step": 11212, "epoch": 266} {"train_loss": -5.110346453530448, "global_step": 11213, "epoch": 266, "val_loss": 75888.84375} {"train_loss": -5.077319145202637, "global_step": 11214, "epoch": 267} {"train_loss": -5.360173225402832, "global_step": 11215, "epoch": 267} {"train_loss": -5.143459320068359, "global_step": 11216, "epoch": 267} {"train_loss": -5.0900373458862305, "global_step": 11217, "epoch": 267} {"train_loss": -5.15175724029541, "global_step": 11218, "epoch": 267} {"train_loss": -5.186773777008057, "global_step": 11219, "epoch": 267} {"train_loss": -5.038816452026367, "global_step": 11220, "epoch": 267} {"train_loss": -5.075064659118652, "global_step": 11221, "epoch": 267} {"train_loss": -5.083793640136719, "global_step": 11222, "epoch": 267} {"train_loss": -4.903084754943848, "global_step": 11223, "epoch": 267} {"train_loss": -5.019219398498535, "global_step": 11224, "epoch": 267} {"train_loss": -4.8936004638671875, "global_step": 11225, "epoch": 267} {"train_loss": -5.052698612213135, "global_step": 11226, "epoch": 267} {"train_loss": -5.020357608795166, "global_step": 11227, "epoch": 267} {"train_loss": -4.969797134399414, "global_step": 11228, "epoch": 267} {"train_loss": -5.023090839385986, "global_step": 11229, "epoch": 267} {"train_loss": -5.134510040283203, "global_step": 11230, "epoch": 267} {"train_loss": -5.01401948928833, "global_step": 11231, "epoch": 267} {"train_loss": -5.122757911682129, "global_step": 11232, "epoch": 267} {"train_loss": -5.107375144958496, "global_step": 11233, "epoch": 267} {"train_loss": -5.154597282409668, "global_step": 11234, "epoch": 267} {"train_loss": -5.0204362869262695, "global_step": 11235, "epoch": 267} {"train_loss": -5.083880424499512, "global_step": 11236, "epoch": 267} {"train_loss": -5.143011093139648, "global_step": 11237, "epoch": 267} {"train_loss": -5.045095443725586, "global_step": 11238, "epoch": 267} {"train_loss": -5.149627208709717, "global_step": 11239, "epoch": 267} {"train_loss": -5.0568952560424805, "global_step": 11240, "epoch": 267} {"train_loss": -5.003777503967285, "global_step": 11241, "epoch": 267} {"train_loss": -5.025612831115723, "global_step": 11242, "epoch": 267} {"train_loss": -5.015653610229492, "global_step": 11243, "epoch": 267} {"train_loss": -4.893075942993164, "global_step": 11244, "epoch": 267} {"train_loss": -4.925180435180664, "global_step": 11245, "epoch": 267} {"train_loss": -5.106254577636719, "global_step": 11246, "epoch": 267} {"train_loss": -5.012333869934082, "global_step": 11247, "epoch": 267} {"train_loss": -5.114745140075684, "global_step": 11248, "epoch": 267} {"train_loss": -5.240138053894043, "global_step": 11249, "epoch": 267} {"train_loss": -5.030284404754639, "global_step": 11250, "epoch": 267} {"train_loss": -5.05001163482666, "global_step": 11251, "epoch": 267} {"train_loss": -4.979052543640137, "global_step": 11252, "epoch": 267} {"train_loss": -5.144023895263672, "global_step": 11253, "epoch": 267} {"train_loss": -5.062952041625977, "global_step": 11254, "epoch": 267} {"train_loss": -5.068698349453154, "global_step": 11255, "epoch": 267, "val_loss": 75840.1796875} {"train_loss": -5.169360160827637, "global_step": 11256, "epoch": 268} {"train_loss": -5.103108882904053, "global_step": 11257, "epoch": 268} {"train_loss": -5.069311618804932, "global_step": 11258, "epoch": 268} {"train_loss": -5.16196346282959, "global_step": 11259, "epoch": 268} {"train_loss": -4.91721773147583, "global_step": 11260, "epoch": 268} {"train_loss": -5.177003860473633, "global_step": 11261, "epoch": 268} {"train_loss": -5.205142974853516, "global_step": 11262, "epoch": 268} {"train_loss": -4.996230602264404, "global_step": 11263, "epoch": 268} {"train_loss": -5.171825408935547, "global_step": 11264, "epoch": 268} {"train_loss": -4.981212615966797, "global_step": 11265, "epoch": 268} {"train_loss": -5.063579559326172, "global_step": 11266, "epoch": 268} {"train_loss": -5.165043830871582, "global_step": 11267, "epoch": 268} {"train_loss": -5.00450325012207, "global_step": 11268, "epoch": 268} {"train_loss": -5.103490829467773, "global_step": 11269, "epoch": 268} {"train_loss": -4.9845194816589355, "global_step": 11270, "epoch": 268} {"train_loss": -5.186537742614746, "global_step": 11271, "epoch": 268} {"train_loss": -5.1047821044921875, "global_step": 11272, "epoch": 268} {"train_loss": -5.2272443771362305, "global_step": 11273, "epoch": 268} {"train_loss": -5.097096920013428, "global_step": 11274, "epoch": 268} {"train_loss": -5.081214904785156, "global_step": 11275, "epoch": 268} {"train_loss": -5.1703104972839355, "global_step": 11276, "epoch": 268} {"train_loss": -5.049983978271484, "global_step": 11277, "epoch": 268} {"train_loss": -5.02148962020874, "global_step": 11278, "epoch": 268} {"train_loss": -5.164430618286133, "global_step": 11279, "epoch": 268} {"train_loss": -4.983245849609375, "global_step": 11280, "epoch": 268} {"train_loss": -5.001438617706299, "global_step": 11281, "epoch": 268} {"train_loss": -5.053031921386719, "global_step": 11282, "epoch": 268} {"train_loss": -5.12785530090332, "global_step": 11283, "epoch": 268} {"train_loss": -5.193741798400879, "global_step": 11284, "epoch": 268} {"train_loss": -5.249547958374023, "global_step": 11285, "epoch": 268} {"train_loss": -5.146514892578125, "global_step": 11286, "epoch": 268} {"train_loss": -5.009622573852539, "global_step": 11287, "epoch": 268} {"train_loss": -5.160102844238281, "global_step": 11288, "epoch": 268} {"train_loss": -5.188963890075684, "global_step": 11289, "epoch": 268} {"train_loss": -5.213260650634766, "global_step": 11290, "epoch": 268} {"train_loss": -5.152224540710449, "global_step": 11291, "epoch": 268} {"train_loss": -5.2282023429870605, "global_step": 11292, "epoch": 268} {"train_loss": -5.086112976074219, "global_step": 11293, "epoch": 268} {"train_loss": -5.024321556091309, "global_step": 11294, "epoch": 268} {"train_loss": -5.166154861450195, "global_step": 11295, "epoch": 268} {"train_loss": -4.951181411743164, "global_step": 11296, "epoch": 268} {"train_loss": -5.106439919698806, "global_step": 11297, "epoch": 268, "val_loss": 75170.6875} {"train_loss": -5.196423530578613, "global_step": 11298, "epoch": 269} {"train_loss": -4.877708911895752, "global_step": 11299, "epoch": 269} {"train_loss": -5.12335205078125, "global_step": 11300, "epoch": 269} {"train_loss": -5.040081024169922, "global_step": 11301, "epoch": 269} {"train_loss": -5.0537943840026855, "global_step": 11302, "epoch": 269} {"train_loss": -5.174242973327637, "global_step": 11303, "epoch": 269} {"train_loss": -5.0443010330200195, "global_step": 11304, "epoch": 269} {"train_loss": -4.992110252380371, "global_step": 11305, "epoch": 269} {"train_loss": -5.079581260681152, "global_step": 11306, "epoch": 269} {"train_loss": -5.224617004394531, "global_step": 11307, "epoch": 269} {"train_loss": -4.986637115478516, "global_step": 11308, "epoch": 269} {"train_loss": -5.175291061401367, "global_step": 11309, "epoch": 269} {"train_loss": -5.141999244689941, "global_step": 11310, "epoch": 269} {"train_loss": -5.198352813720703, "global_step": 11311, "epoch": 269} {"train_loss": -5.227115154266357, "global_step": 11312, "epoch": 269} {"train_loss": -5.159305572509766, "global_step": 11313, "epoch": 269} {"train_loss": -5.174615859985352, "global_step": 11314, "epoch": 269} {"train_loss": -5.149852752685547, "global_step": 11315, "epoch": 269} {"train_loss": -4.961512565612793, "global_step": 11316, "epoch": 269} {"train_loss": -5.16180419921875, "global_step": 11317, "epoch": 269} {"train_loss": -5.010442733764648, "global_step": 11318, "epoch": 269} {"train_loss": -5.190493583679199, "global_step": 11319, "epoch": 269} {"train_loss": -5.010704040527344, "global_step": 11320, "epoch": 269} {"train_loss": -5.000009536743164, "global_step": 11321, "epoch": 269} {"train_loss": -5.048165321350098, "global_step": 11322, "epoch": 269} {"train_loss": -5.085498332977295, "global_step": 11323, "epoch": 269} {"train_loss": -5.1060380935668945, "global_step": 11324, "epoch": 269} {"train_loss": -5.167452812194824, "global_step": 11325, "epoch": 269} {"train_loss": -5.035780906677246, "global_step": 11326, "epoch": 269} {"train_loss": -5.081298351287842, "global_step": 11327, "epoch": 269} {"train_loss": -5.191125392913818, "global_step": 11328, "epoch": 269} {"train_loss": -5.077883243560791, "global_step": 11329, "epoch": 269} {"train_loss": -5.049356460571289, "global_step": 11330, "epoch": 269} {"train_loss": -5.090670585632324, "global_step": 11331, "epoch": 269} {"train_loss": -5.20542049407959, "global_step": 11332, "epoch": 269} {"train_loss": -5.180113315582275, "global_step": 11333, "epoch": 269} {"train_loss": -5.247968673706055, "global_step": 11334, "epoch": 269} {"train_loss": -5.387730598449707, "global_step": 11335, "epoch": 269} {"train_loss": -5.237517356872559, "global_step": 11336, "epoch": 269} {"train_loss": -5.317775726318359, "global_step": 11337, "epoch": 269} {"train_loss": -5.110828399658203, "global_step": 11338, "epoch": 269} {"train_loss": -5.11798822312128, "global_step": 11339, "epoch": 269, "val_loss": 75260.171875} {"train_loss": -5.127317428588867, "global_step": 11340, "epoch": 270} {"train_loss": -5.222580432891846, "global_step": 11341, "epoch": 270} {"train_loss": -4.98687744140625, "global_step": 11342, "epoch": 270} {"train_loss": -5.0604071617126465, "global_step": 11343, "epoch": 270} {"train_loss": -5.138887405395508, "global_step": 11344, "epoch": 270} {"train_loss": -5.166688919067383, "global_step": 11345, "epoch": 270} {"train_loss": -5.078980445861816, "global_step": 11346, "epoch": 270} {"train_loss": -5.006152629852295, "global_step": 11347, "epoch": 270} {"train_loss": -5.07508659362793, "global_step": 11348, "epoch": 270} {"train_loss": -5.085808277130127, "global_step": 11349, "epoch": 270} {"train_loss": -5.109755516052246, "global_step": 11350, "epoch": 270} {"train_loss": -5.220414638519287, "global_step": 11351, "epoch": 270} {"train_loss": -5.240945816040039, "global_step": 11352, "epoch": 270} {"train_loss": -5.0091938972473145, "global_step": 11353, "epoch": 270} {"train_loss": -5.2257490158081055, "global_step": 11354, "epoch": 270} {"train_loss": -5.2792649269104, "global_step": 11355, "epoch": 270} {"train_loss": -5.085124969482422, "global_step": 11356, "epoch": 270} {"train_loss": -5.21971321105957, "global_step": 11357, "epoch": 270} {"train_loss": -5.194237232208252, "global_step": 11358, "epoch": 270} {"train_loss": -5.033656120300293, "global_step": 11359, "epoch": 270} {"train_loss": -5.121096611022949, "global_step": 11360, "epoch": 270} {"train_loss": -4.921270370483398, "global_step": 11361, "epoch": 270} {"train_loss": -5.11103630065918, "global_step": 11362, "epoch": 270} {"train_loss": -5.102749824523926, "global_step": 11363, "epoch": 270} {"train_loss": -5.168811798095703, "global_step": 11364, "epoch": 270} {"train_loss": -4.984947681427002, "global_step": 11365, "epoch": 270} {"train_loss": -5.175411224365234, "global_step": 11366, "epoch": 270} {"train_loss": -5.125645637512207, "global_step": 11367, "epoch": 270} {"train_loss": -5.1828694343566895, "global_step": 11368, "epoch": 270} {"train_loss": -4.999493598937988, "global_step": 11369, "epoch": 270} {"train_loss": -5.189888000488281, "global_step": 11370, "epoch": 270} {"train_loss": -5.042929172515869, "global_step": 11371, "epoch": 270} {"train_loss": -5.0259785652160645, "global_step": 11372, "epoch": 270} {"train_loss": -5.040936470031738, "global_step": 11373, "epoch": 270} {"train_loss": -5.180219650268555, "global_step": 11374, "epoch": 270} {"train_loss": -5.041935920715332, "global_step": 11375, "epoch": 270} {"train_loss": -5.096381187438965, "global_step": 11376, "epoch": 270} {"train_loss": -4.9862284660339355, "global_step": 11377, "epoch": 270} {"train_loss": -5.053348541259766, "global_step": 11378, "epoch": 270} {"train_loss": -4.951728820800781, "global_step": 11379, "epoch": 270} {"train_loss": -5.279942035675049, "global_step": 11380, "epoch": 270} {"train_loss": -5.106594732829502, "global_step": 11381, "epoch": 270, "val_loss": 75592.828125} {"train_loss": -5.102997779846191, "global_step": 11382, "epoch": 271} {"train_loss": -5.123207092285156, "global_step": 11383, "epoch": 271} {"train_loss": -5.1416826248168945, "global_step": 11384, "epoch": 271} {"train_loss": -5.199234485626221, "global_step": 11385, "epoch": 271} {"train_loss": -5.0608720779418945, "global_step": 11386, "epoch": 271} {"train_loss": -4.969419956207275, "global_step": 11387, "epoch": 271} {"train_loss": -5.107878684997559, "global_step": 11388, "epoch": 271} {"train_loss": -5.075383186340332, "global_step": 11389, "epoch": 271} {"train_loss": -5.03124475479126, "global_step": 11390, "epoch": 271} {"train_loss": -5.170553207397461, "global_step": 11391, "epoch": 271} {"train_loss": -5.055727958679199, "global_step": 11392, "epoch": 271} {"train_loss": -4.983522415161133, "global_step": 11393, "epoch": 271} {"train_loss": -5.221787452697754, "global_step": 11394, "epoch": 271} {"train_loss": -5.062689304351807, "global_step": 11395, "epoch": 271} {"train_loss": -5.009983062744141, "global_step": 11396, "epoch": 271} {"train_loss": -5.168405532836914, "global_step": 11397, "epoch": 271} {"train_loss": -5.088108062744141, "global_step": 11398, "epoch": 271} {"train_loss": -5.161671161651611, "global_step": 11399, "epoch": 271} {"train_loss": -5.201744079589844, "global_step": 11400, "epoch": 271} {"train_loss": -5.097912311553955, "global_step": 11401, "epoch": 271} {"train_loss": -5.208412170410156, "global_step": 11402, "epoch": 271} {"train_loss": -5.242379665374756, "global_step": 11403, "epoch": 271} {"train_loss": -5.201848983764648, "global_step": 11404, "epoch": 271} {"train_loss": -5.071126937866211, "global_step": 11405, "epoch": 271} {"train_loss": -5.067434787750244, "global_step": 11406, "epoch": 271} {"train_loss": -5.132975101470947, "global_step": 11407, "epoch": 271} {"train_loss": -5.18755578994751, "global_step": 11408, "epoch": 271} {"train_loss": -5.004058361053467, "global_step": 11409, "epoch": 271} {"train_loss": -5.130925178527832, "global_step": 11410, "epoch": 271} {"train_loss": -4.907954216003418, "global_step": 11411, "epoch": 271} {"train_loss": -4.884411334991455, "global_step": 11412, "epoch": 271} {"train_loss": -5.0938591957092285, "global_step": 11413, "epoch": 271} {"train_loss": -4.935345649719238, "global_step": 11414, "epoch": 271} {"train_loss": -5.135712146759033, "global_step": 11415, "epoch": 271} {"train_loss": -5.175680160522461, "global_step": 11416, "epoch": 271} {"train_loss": -5.072687149047852, "global_step": 11417, "epoch": 271} {"train_loss": -5.018060684204102, "global_step": 11418, "epoch": 271} {"train_loss": -5.137707233428955, "global_step": 11419, "epoch": 271} {"train_loss": -5.182217121124268, "global_step": 11420, "epoch": 271} {"train_loss": -5.195951461791992, "global_step": 11421, "epoch": 271} {"train_loss": -5.071559906005859, "global_step": 11422, "epoch": 271} {"train_loss": -5.102706807000296, "global_step": 11423, "epoch": 271, "val_loss": 76450.6328125} {"train_loss": -5.109297275543213, "global_step": 11424, "epoch": 272} {"train_loss": -5.129485130310059, "global_step": 11425, "epoch": 272} {"train_loss": -5.138077259063721, "global_step": 11426, "epoch": 272} {"train_loss": -5.1403703689575195, "global_step": 11427, "epoch": 272} {"train_loss": -5.23059606552124, "global_step": 11428, "epoch": 272} {"train_loss": -5.151638984680176, "global_step": 11429, "epoch": 272} {"train_loss": -5.129265308380127, "global_step": 11430, "epoch": 272} {"train_loss": -5.11262321472168, "global_step": 11431, "epoch": 272} {"train_loss": -5.074366569519043, "global_step": 11432, "epoch": 272} {"train_loss": -5.080367088317871, "global_step": 11433, "epoch": 272} {"train_loss": -5.133491516113281, "global_step": 11434, "epoch": 272} {"train_loss": -5.015100479125977, "global_step": 11435, "epoch": 272} {"train_loss": -5.130467414855957, "global_step": 11436, "epoch": 272} {"train_loss": -5.172206401824951, "global_step": 11437, "epoch": 272} {"train_loss": -5.218066692352295, "global_step": 11438, "epoch": 272} {"train_loss": -5.173616409301758, "global_step": 11439, "epoch": 272} {"train_loss": -5.080127239227295, "global_step": 11440, "epoch": 272} {"train_loss": -5.258286476135254, "global_step": 11441, "epoch": 272} {"train_loss": -5.052398681640625, "global_step": 11442, "epoch": 272} {"train_loss": -5.256404876708984, "global_step": 11443, "epoch": 272} {"train_loss": -5.246330261230469, "global_step": 11444, "epoch": 272} {"train_loss": -5.071615219116211, "global_step": 11445, "epoch": 272} {"train_loss": -5.1261305809021, "global_step": 11446, "epoch": 272} {"train_loss": -5.161510467529297, "global_step": 11447, "epoch": 272} {"train_loss": -5.10434103012085, "global_step": 11448, "epoch": 272} {"train_loss": -5.302886962890625, "global_step": 11449, "epoch": 272} {"train_loss": -5.266757011413574, "global_step": 11450, "epoch": 272} {"train_loss": -5.078012466430664, "global_step": 11451, "epoch": 272} {"train_loss": -5.088301181793213, "global_step": 11452, "epoch": 272} {"train_loss": -5.083670616149902, "global_step": 11453, "epoch": 272} {"train_loss": -5.262612342834473, "global_step": 11454, "epoch": 272} {"train_loss": -5.049324035644531, "global_step": 11455, "epoch": 272} {"train_loss": -5.143425941467285, "global_step": 11456, "epoch": 272} {"train_loss": -5.137270927429199, "global_step": 11457, "epoch": 272} {"train_loss": -5.121830940246582, "global_step": 11458, "epoch": 272} {"train_loss": -5.113252639770508, "global_step": 11459, "epoch": 272} {"train_loss": -5.128678321838379, "global_step": 11460, "epoch": 272} {"train_loss": -5.12568998336792, "global_step": 11461, "epoch": 272} {"train_loss": -5.105022430419922, "global_step": 11462, "epoch": 272} {"train_loss": -5.109241485595703, "global_step": 11463, "epoch": 272} {"train_loss": -5.239991188049316, "global_step": 11464, "epoch": 272} {"train_loss": -5.143732002803257, "global_step": 11465, "epoch": 272, "val_loss": 76180.546875} {"train_loss": -4.981683731079102, "global_step": 11466, "epoch": 273} {"train_loss": -5.174375534057617, "global_step": 11467, "epoch": 273} {"train_loss": -5.21701717376709, "global_step": 11468, "epoch": 273} {"train_loss": -4.93140172958374, "global_step": 11469, "epoch": 273} {"train_loss": -5.026865005493164, "global_step": 11470, "epoch": 273} {"train_loss": -5.234805107116699, "global_step": 11471, "epoch": 273} {"train_loss": -5.179479598999023, "global_step": 11472, "epoch": 273} {"train_loss": -5.139434337615967, "global_step": 11473, "epoch": 273} {"train_loss": -5.054036617279053, "global_step": 11474, "epoch": 273} {"train_loss": -5.232146263122559, "global_step": 11475, "epoch": 273} {"train_loss": -5.34181022644043, "global_step": 11476, "epoch": 273} {"train_loss": -5.184544086456299, "global_step": 11477, "epoch": 273} {"train_loss": -5.195550918579102, "global_step": 11478, "epoch": 273} {"train_loss": -5.169809341430664, "global_step": 11479, "epoch": 273} {"train_loss": -5.056872844696045, "global_step": 11480, "epoch": 273} {"train_loss": -5.378430366516113, "global_step": 11481, "epoch": 273} {"train_loss": -5.123281002044678, "global_step": 11482, "epoch": 273} {"train_loss": -5.254439353942871, "global_step": 11483, "epoch": 273} {"train_loss": -5.240659713745117, "global_step": 11484, "epoch": 273} {"train_loss": -5.120797634124756, "global_step": 11485, "epoch": 273} {"train_loss": -5.1261677742004395, "global_step": 11486, "epoch": 273} {"train_loss": -5.088176727294922, "global_step": 11487, "epoch": 273} {"train_loss": -5.205962657928467, "global_step": 11488, "epoch": 273} {"train_loss": -5.266135215759277, "global_step": 11489, "epoch": 273} {"train_loss": -5.041097164154053, "global_step": 11490, "epoch": 273} {"train_loss": -5.178646087646484, "global_step": 11491, "epoch": 273} {"train_loss": -4.999225616455078, "global_step": 11492, "epoch": 273} {"train_loss": -5.0417890548706055, "global_step": 11493, "epoch": 273} {"train_loss": -5.127993583679199, "global_step": 11494, "epoch": 273} {"train_loss": -5.201986312866211, "global_step": 11495, "epoch": 273} {"train_loss": -5.155773639678955, "global_step": 11496, "epoch": 273} {"train_loss": -5.128505706787109, "global_step": 11497, "epoch": 273} {"train_loss": -5.249337196350098, "global_step": 11498, "epoch": 273} {"train_loss": -5.316415786743164, "global_step": 11499, "epoch": 273} {"train_loss": -5.0663957595825195, "global_step": 11500, "epoch": 273} {"train_loss": -5.12654972076416, "global_step": 11501, "epoch": 273} {"train_loss": -5.20706844329834, "global_step": 11502, "epoch": 273} {"train_loss": -5.181881427764893, "global_step": 11503, "epoch": 273} {"train_loss": -4.97278356552124, "global_step": 11504, "epoch": 273} {"train_loss": -5.0537214279174805, "global_step": 11505, "epoch": 273} {"train_loss": -5.239739418029785, "global_step": 11506, "epoch": 273} {"train_loss": -5.151067745117914, "global_step": 11507, "epoch": 273, "val_loss": 75772.6015625} {"train_loss": -4.979550838470459, "global_step": 11508, "epoch": 274} {"train_loss": -5.193449974060059, "global_step": 11509, "epoch": 274} {"train_loss": -5.138016223907471, "global_step": 11510, "epoch": 274} {"train_loss": -5.035262584686279, "global_step": 11511, "epoch": 274} {"train_loss": -5.134000301361084, "global_step": 11512, "epoch": 274} {"train_loss": -5.059332847595215, "global_step": 11513, "epoch": 274} {"train_loss": -5.159261703491211, "global_step": 11514, "epoch": 274} {"train_loss": -5.234245777130127, "global_step": 11515, "epoch": 274} {"train_loss": -5.159399032592773, "global_step": 11516, "epoch": 274} {"train_loss": -5.164556980133057, "global_step": 11517, "epoch": 274} {"train_loss": -5.179298400878906, "global_step": 11518, "epoch": 274} {"train_loss": -5.088237285614014, "global_step": 11519, "epoch": 274} {"train_loss": -5.066371917724609, "global_step": 11520, "epoch": 274} {"train_loss": -5.182117462158203, "global_step": 11521, "epoch": 274} {"train_loss": -5.258580684661865, "global_step": 11522, "epoch": 274} {"train_loss": -5.0312371253967285, "global_step": 11523, "epoch": 274} {"train_loss": -5.154732704162598, "global_step": 11524, "epoch": 274} {"train_loss": -5.109968185424805, "global_step": 11525, "epoch": 274} {"train_loss": -5.124506950378418, "global_step": 11526, "epoch": 274} {"train_loss": -4.99709415435791, "global_step": 11527, "epoch": 274} {"train_loss": -5.032558441162109, "global_step": 11528, "epoch": 274} {"train_loss": -4.995348930358887, "global_step": 11529, "epoch": 274} {"train_loss": -5.05682897567749, "global_step": 11530, "epoch": 274} {"train_loss": -4.887884140014648, "global_step": 11531, "epoch": 274} {"train_loss": -4.99038028717041, "global_step": 11532, "epoch": 274} {"train_loss": -5.069881439208984, "global_step": 11533, "epoch": 274} {"train_loss": -5.037792682647705, "global_step": 11534, "epoch": 274} {"train_loss": -5.071096420288086, "global_step": 11535, "epoch": 274} {"train_loss": -4.946549415588379, "global_step": 11536, "epoch": 274} {"train_loss": -5.225636959075928, "global_step": 11537, "epoch": 274} {"train_loss": -4.967432022094727, "global_step": 11538, "epoch": 274} {"train_loss": -5.141819000244141, "global_step": 11539, "epoch": 274} {"train_loss": -5.219935894012451, "global_step": 11540, "epoch": 274} {"train_loss": -5.023433685302734, "global_step": 11541, "epoch": 274} {"train_loss": -5.13992166519165, "global_step": 11542, "epoch": 274} {"train_loss": -5.007449150085449, "global_step": 11543, "epoch": 274} {"train_loss": -5.113680362701416, "global_step": 11544, "epoch": 274} {"train_loss": -5.160167694091797, "global_step": 11545, "epoch": 274} {"train_loss": -5.180696487426758, "global_step": 11546, "epoch": 274} {"train_loss": -5.044974327087402, "global_step": 11547, "epoch": 274} {"train_loss": -5.1022162437438965, "global_step": 11548, "epoch": 274} {"train_loss": -5.0957761492047995, "global_step": 11549, "epoch": 274, "val_loss": 74852.4921875} {"train_loss": -5.1421356201171875, "global_step": 11550, "epoch": 275} {"train_loss": -5.225864410400391, "global_step": 11551, "epoch": 275} {"train_loss": -5.271369934082031, "global_step": 11552, "epoch": 275} {"train_loss": -5.174490928649902, "global_step": 11553, "epoch": 275} {"train_loss": -5.1049957275390625, "global_step": 11554, "epoch": 275} {"train_loss": -5.120705604553223, "global_step": 11555, "epoch": 275} {"train_loss": -5.2137227058410645, "global_step": 11556, "epoch": 275} {"train_loss": -5.058866500854492, "global_step": 11557, "epoch": 275} {"train_loss": -5.036256790161133, "global_step": 11558, "epoch": 275} {"train_loss": -5.126636981964111, "global_step": 11559, "epoch": 275} {"train_loss": -5.143183708190918, "global_step": 11560, "epoch": 275} {"train_loss": -5.136839866638184, "global_step": 11561, "epoch": 275} {"train_loss": -5.114398956298828, "global_step": 11562, "epoch": 275} {"train_loss": -5.089545726776123, "global_step": 11563, "epoch": 275} {"train_loss": -5.249269962310791, "global_step": 11564, "epoch": 275} {"train_loss": -5.120800018310547, "global_step": 11565, "epoch": 275} {"train_loss": -5.122203826904297, "global_step": 11566, "epoch": 275} {"train_loss": -5.181967258453369, "global_step": 11567, "epoch": 275} {"train_loss": -5.13055419921875, "global_step": 11568, "epoch": 275} {"train_loss": -5.079342842102051, "global_step": 11569, "epoch": 275} {"train_loss": -4.98858118057251, "global_step": 11570, "epoch": 275} {"train_loss": -4.75216007232666, "global_step": 11571, "epoch": 275} {"train_loss": -5.108264446258545, "global_step": 11572, "epoch": 275} {"train_loss": -4.998880863189697, "global_step": 11573, "epoch": 275} {"train_loss": -4.776932716369629, "global_step": 11574, "epoch": 275} {"train_loss": -5.109569072723389, "global_step": 11575, "epoch": 275} {"train_loss": -4.735507965087891, "global_step": 11576, "epoch": 275} {"train_loss": -4.941556930541992, "global_step": 11577, "epoch": 275} {"train_loss": -5.11091423034668, "global_step": 11578, "epoch": 275} {"train_loss": -5.0506486892700195, "global_step": 11579, "epoch": 275} {"train_loss": -5.18979549407959, "global_step": 11580, "epoch": 275} {"train_loss": -4.996364593505859, "global_step": 11581, "epoch": 275} {"train_loss": -5.178976058959961, "global_step": 11582, "epoch": 275} {"train_loss": -5.088699817657471, "global_step": 11583, "epoch": 275} {"train_loss": -5.1454877853393555, "global_step": 11584, "epoch": 275} {"train_loss": -5.118071556091309, "global_step": 11585, "epoch": 275} {"train_loss": -5.018186092376709, "global_step": 11586, "epoch": 275} {"train_loss": -5.171004295349121, "global_step": 11587, "epoch": 275} {"train_loss": -5.053621768951416, "global_step": 11588, "epoch": 275} {"train_loss": -5.025869369506836, "global_step": 11589, "epoch": 275} {"train_loss": -5.1824235916137695, "global_step": 11590, "epoch": 275} {"train_loss": -5.089253618603661, "global_step": 11591, "epoch": 275, "val_loss": 75094.03125} {"train_loss": -5.230734825134277, "global_step": 11592, "epoch": 276} {"train_loss": -5.1852216720581055, "global_step": 11593, "epoch": 276} {"train_loss": -5.108212471008301, "global_step": 11594, "epoch": 276} {"train_loss": -5.20603084564209, "global_step": 11595, "epoch": 276} {"train_loss": -5.200706481933594, "global_step": 11596, "epoch": 276} {"train_loss": -5.275735378265381, "global_step": 11597, "epoch": 276} {"train_loss": -5.126278877258301, "global_step": 11598, "epoch": 276} {"train_loss": -5.245368957519531, "global_step": 11599, "epoch": 276} {"train_loss": -5.2384467124938965, "global_step": 11600, "epoch": 276} {"train_loss": -5.123920440673828, "global_step": 11601, "epoch": 276} {"train_loss": -5.207881927490234, "global_step": 11602, "epoch": 276} {"train_loss": -5.2100443840026855, "global_step": 11603, "epoch": 276} {"train_loss": -5.144223213195801, "global_step": 11604, "epoch": 276} {"train_loss": -5.106540679931641, "global_step": 11605, "epoch": 276} {"train_loss": -5.181521415710449, "global_step": 11606, "epoch": 276} {"train_loss": -5.105621814727783, "global_step": 11607, "epoch": 276} {"train_loss": -5.142046928405762, "global_step": 11608, "epoch": 276} {"train_loss": -5.089547634124756, "global_step": 11609, "epoch": 276} {"train_loss": -5.108310699462891, "global_step": 11610, "epoch": 276} {"train_loss": -5.127392768859863, "global_step": 11611, "epoch": 276} {"train_loss": -5.337386131286621, "global_step": 11612, "epoch": 276} {"train_loss": -5.158196926116943, "global_step": 11613, "epoch": 276} {"train_loss": -5.251596927642822, "global_step": 11614, "epoch": 276} {"train_loss": -5.33226203918457, "global_step": 11615, "epoch": 276} {"train_loss": -5.0873823165893555, "global_step": 11616, "epoch": 276} {"train_loss": -5.065820217132568, "global_step": 11617, "epoch": 276} {"train_loss": -5.115108489990234, "global_step": 11618, "epoch": 276} {"train_loss": -5.17866325378418, "global_step": 11619, "epoch": 276} {"train_loss": -5.168905258178711, "global_step": 11620, "epoch": 276} {"train_loss": -5.174683570861816, "global_step": 11621, "epoch": 276} {"train_loss": -4.964200019836426, "global_step": 11622, "epoch": 276} {"train_loss": -5.061138153076172, "global_step": 11623, "epoch": 276} {"train_loss": -5.163405418395996, "global_step": 11624, "epoch": 276} {"train_loss": -5.050362586975098, "global_step": 11625, "epoch": 276} {"train_loss": -4.968763828277588, "global_step": 11626, "epoch": 276} {"train_loss": -5.037544250488281, "global_step": 11627, "epoch": 276} {"train_loss": -5.059121131896973, "global_step": 11628, "epoch": 276} {"train_loss": -5.032924652099609, "global_step": 11629, "epoch": 276} {"train_loss": -5.038281440734863, "global_step": 11630, "epoch": 276} {"train_loss": -4.941776275634766, "global_step": 11631, "epoch": 276} {"train_loss": -5.196499347686768, "global_step": 11632, "epoch": 276} {"train_loss": -5.1401416801270985, "global_step": 11633, "epoch": 276, "val_loss": 75890.1953125} {"train_loss": -5.064869403839111, "global_step": 11634, "epoch": 277} {"train_loss": -5.066493988037109, "global_step": 11635, "epoch": 277} {"train_loss": -5.130627632141113, "global_step": 11636, "epoch": 277} {"train_loss": -5.217096328735352, "global_step": 11637, "epoch": 277} {"train_loss": -5.026963233947754, "global_step": 11638, "epoch": 277} {"train_loss": -5.1190972328186035, "global_step": 11639, "epoch": 277} {"train_loss": -5.112200736999512, "global_step": 11640, "epoch": 277} {"train_loss": -4.926126003265381, "global_step": 11641, "epoch": 277} {"train_loss": -5.150674819946289, "global_step": 11642, "epoch": 277} {"train_loss": -5.007086753845215, "global_step": 11643, "epoch": 277} {"train_loss": -4.979942321777344, "global_step": 11644, "epoch": 277} {"train_loss": -5.154735565185547, "global_step": 11645, "epoch": 277} {"train_loss": -4.942108154296875, "global_step": 11646, "epoch": 277} {"train_loss": -5.1654372215271, "global_step": 11647, "epoch": 277} {"train_loss": -5.135342597961426, "global_step": 11648, "epoch": 277} {"train_loss": -5.072037220001221, "global_step": 11649, "epoch": 277} {"train_loss": -5.172079563140869, "global_step": 11650, "epoch": 277} {"train_loss": -5.103913307189941, "global_step": 11651, "epoch": 277} {"train_loss": -5.067848205566406, "global_step": 11652, "epoch": 277} {"train_loss": -5.262555122375488, "global_step": 11653, "epoch": 277} {"train_loss": -5.163345813751221, "global_step": 11654, "epoch": 277} {"train_loss": -4.999822616577148, "global_step": 11655, "epoch": 277} {"train_loss": -5.123600482940674, "global_step": 11656, "epoch": 277} {"train_loss": -5.0159993171691895, "global_step": 11657, "epoch": 277} {"train_loss": -4.95231819152832, "global_step": 11658, "epoch": 277} {"train_loss": -5.0345611572265625, "global_step": 11659, "epoch": 277} {"train_loss": -4.973888397216797, "global_step": 11660, "epoch": 277} {"train_loss": -4.9684038162231445, "global_step": 11661, "epoch": 277} {"train_loss": -5.131883144378662, "global_step": 11662, "epoch": 277} {"train_loss": -4.944303512573242, "global_step": 11663, "epoch": 277} {"train_loss": -4.9615397453308105, "global_step": 11664, "epoch": 277} {"train_loss": -5.0703582763671875, "global_step": 11665, "epoch": 277} {"train_loss": -4.799893379211426, "global_step": 11666, "epoch": 277} {"train_loss": -5.125229835510254, "global_step": 11667, "epoch": 277} {"train_loss": -4.931183815002441, "global_step": 11668, "epoch": 277} {"train_loss": -5.1490654945373535, "global_step": 11669, "epoch": 277} {"train_loss": -5.014898777008057, "global_step": 11670, "epoch": 277} {"train_loss": -5.176494598388672, "global_step": 11671, "epoch": 277} {"train_loss": -5.113429546356201, "global_step": 11672, "epoch": 277} {"train_loss": -5.029914855957031, "global_step": 11673, "epoch": 277} {"train_loss": -5.238090991973877, "global_step": 11674, "epoch": 277} {"train_loss": -5.0693239484514505, "global_step": 11675, "epoch": 277, "val_loss": 74816.3203125} {"train_loss": -5.136231422424316, "global_step": 11676, "epoch": 278} {"train_loss": -5.140676498413086, "global_step": 11677, "epoch": 278} {"train_loss": -5.176258087158203, "global_step": 11678, "epoch": 278} {"train_loss": -5.211037635803223, "global_step": 11679, "epoch": 278} {"train_loss": -5.048603057861328, "global_step": 11680, "epoch": 278} {"train_loss": -5.211756706237793, "global_step": 11681, "epoch": 278} {"train_loss": -5.105789661407471, "global_step": 11682, "epoch": 278} {"train_loss": -5.077093124389648, "global_step": 11683, "epoch": 278} {"train_loss": -5.101448059082031, "global_step": 11684, "epoch": 278} {"train_loss": -5.0910444259643555, "global_step": 11685, "epoch": 278} {"train_loss": -5.180360317230225, "global_step": 11686, "epoch": 278} {"train_loss": -5.22032356262207, "global_step": 11687, "epoch": 278} {"train_loss": -5.119387626647949, "global_step": 11688, "epoch": 278} {"train_loss": -5.001601219177246, "global_step": 11689, "epoch": 278} {"train_loss": -5.131035327911377, "global_step": 11690, "epoch": 278} {"train_loss": -5.175660133361816, "global_step": 11691, "epoch": 278} {"train_loss": -5.149460792541504, "global_step": 11692, "epoch": 278} {"train_loss": -5.252320289611816, "global_step": 11693, "epoch": 278} {"train_loss": -5.11236572265625, "global_step": 11694, "epoch": 278} {"train_loss": -5.244811058044434, "global_step": 11695, "epoch": 278} {"train_loss": -5.256112575531006, "global_step": 11696, "epoch": 278} {"train_loss": -5.115194797515869, "global_step": 11697, "epoch": 278} {"train_loss": -5.2811126708984375, "global_step": 11698, "epoch": 278} {"train_loss": -5.0432233810424805, "global_step": 11699, "epoch": 278} {"train_loss": -5.023723125457764, "global_step": 11700, "epoch": 278} {"train_loss": -5.216254234313965, "global_step": 11701, "epoch": 278} {"train_loss": -5.062957763671875, "global_step": 11702, "epoch": 278} {"train_loss": -5.124083518981934, "global_step": 11703, "epoch": 278} {"train_loss": -5.194227695465088, "global_step": 11704, "epoch": 278} {"train_loss": -5.220279216766357, "global_step": 11705, "epoch": 278} {"train_loss": -5.17006254196167, "global_step": 11706, "epoch": 278} {"train_loss": -5.256980895996094, "global_step": 11707, "epoch": 278} {"train_loss": -5.061532020568848, "global_step": 11708, "epoch": 278} {"train_loss": -5.002532958984375, "global_step": 11709, "epoch": 278} {"train_loss": -5.208621025085449, "global_step": 11710, "epoch": 278} {"train_loss": -5.230905055999756, "global_step": 11711, "epoch": 278} {"train_loss": -5.0654616355896, "global_step": 11712, "epoch": 278} {"train_loss": -4.934836387634277, "global_step": 11713, "epoch": 278} {"train_loss": -5.215484619140625, "global_step": 11714, "epoch": 278} {"train_loss": -5.181092739105225, "global_step": 11715, "epoch": 278} {"train_loss": -4.992127418518066, "global_step": 11716, "epoch": 278} {"train_loss": -5.142052366620018, "global_step": 11717, "epoch": 278, "val_loss": 75432.734375} {"train_loss": -5.071244239807129, "global_step": 11718, "epoch": 279} {"train_loss": -5.080166339874268, "global_step": 11719, "epoch": 279} {"train_loss": -5.1172356605529785, "global_step": 11720, "epoch": 279} {"train_loss": -4.934792518615723, "global_step": 11721, "epoch": 279} {"train_loss": -5.087507247924805, "global_step": 11722, "epoch": 279} {"train_loss": -5.157650947570801, "global_step": 11723, "epoch": 279} {"train_loss": -5.197535991668701, "global_step": 11724, "epoch": 279} {"train_loss": -5.18803596496582, "global_step": 11725, "epoch": 279} {"train_loss": -5.047512054443359, "global_step": 11726, "epoch": 279} {"train_loss": -5.104485511779785, "global_step": 11727, "epoch": 279} {"train_loss": -5.135485649108887, "global_step": 11728, "epoch": 279} {"train_loss": -5.2267656326293945, "global_step": 11729, "epoch": 279} {"train_loss": -5.025190830230713, "global_step": 11730, "epoch": 279} {"train_loss": -5.283578872680664, "global_step": 11731, "epoch": 279} {"train_loss": -5.179083824157715, "global_step": 11732, "epoch": 279} {"train_loss": -5.206297874450684, "global_step": 11733, "epoch": 279} {"train_loss": -5.120638370513916, "global_step": 11734, "epoch": 279} {"train_loss": -5.092123985290527, "global_step": 11735, "epoch": 279} {"train_loss": -5.119126319885254, "global_step": 11736, "epoch": 279} {"train_loss": -4.955094337463379, "global_step": 11737, "epoch": 279} {"train_loss": -5.14163875579834, "global_step": 11738, "epoch": 279} {"train_loss": -5.12711763381958, "global_step": 11739, "epoch": 279} {"train_loss": -4.897891044616699, "global_step": 11740, "epoch": 279} {"train_loss": -5.174783229827881, "global_step": 11741, "epoch": 279} {"train_loss": -5.2052435874938965, "global_step": 11742, "epoch": 279} {"train_loss": -5.142867088317871, "global_step": 11743, "epoch": 279} {"train_loss": -5.185107231140137, "global_step": 11744, "epoch": 279} {"train_loss": -5.1693572998046875, "global_step": 11745, "epoch": 279} {"train_loss": -4.997495651245117, "global_step": 11746, "epoch": 279} {"train_loss": -5.021605491638184, "global_step": 11747, "epoch": 279} {"train_loss": -5.203700065612793, "global_step": 11748, "epoch": 279} {"train_loss": -4.906664848327637, "global_step": 11749, "epoch": 279} {"train_loss": -5.04530143737793, "global_step": 11750, "epoch": 279} {"train_loss": -5.031195640563965, "global_step": 11751, "epoch": 279} {"train_loss": -4.893219470977783, "global_step": 11752, "epoch": 279} {"train_loss": -5.20658016204834, "global_step": 11753, "epoch": 279} {"train_loss": -5.146975517272949, "global_step": 11754, "epoch": 279} {"train_loss": -4.992894172668457, "global_step": 11755, "epoch": 279} {"train_loss": -5.084928035736084, "global_step": 11756, "epoch": 279} {"train_loss": -5.034600257873535, "global_step": 11757, "epoch": 279} {"train_loss": -5.202549934387207, "global_step": 11758, "epoch": 279} {"train_loss": -5.101162376857939, "global_step": 11759, "epoch": 279, "val_loss": 75770.234375} {"train_loss": -5.089206695556641, "global_step": 11760, "epoch": 280} {"train_loss": -5.10753059387207, "global_step": 11761, "epoch": 280} {"train_loss": -4.981060028076172, "global_step": 11762, "epoch": 280} {"train_loss": -5.221060752868652, "global_step": 11763, "epoch": 280} {"train_loss": -5.087750434875488, "global_step": 11764, "epoch": 280} {"train_loss": -4.995000839233398, "global_step": 11765, "epoch": 280} {"train_loss": -5.025454521179199, "global_step": 11766, "epoch": 280} {"train_loss": -5.165732383728027, "global_step": 11767, "epoch": 280} {"train_loss": -5.133935928344727, "global_step": 11768, "epoch": 280} {"train_loss": -5.201555252075195, "global_step": 11769, "epoch": 280} {"train_loss": -5.227972984313965, "global_step": 11770, "epoch": 280} {"train_loss": -4.991793155670166, "global_step": 11771, "epoch": 280} {"train_loss": -5.106670379638672, "global_step": 11772, "epoch": 280} {"train_loss": -5.097627639770508, "global_step": 11773, "epoch": 280} {"train_loss": -5.218416213989258, "global_step": 11774, "epoch": 280} {"train_loss": -5.113441467285156, "global_step": 11775, "epoch": 280} {"train_loss": -5.254637718200684, "global_step": 11776, "epoch": 280} {"train_loss": -5.019599914550781, "global_step": 11777, "epoch": 280} {"train_loss": -4.9154582023620605, "global_step": 11778, "epoch": 280} {"train_loss": -5.130215644836426, "global_step": 11779, "epoch": 280} {"train_loss": -5.093324661254883, "global_step": 11780, "epoch": 280} {"train_loss": -4.906858444213867, "global_step": 11781, "epoch": 280} {"train_loss": -5.066643714904785, "global_step": 11782, "epoch": 280} {"train_loss": -4.709199905395508, "global_step": 11783, "epoch": 280} {"train_loss": -5.146982669830322, "global_step": 11784, "epoch": 280} {"train_loss": -5.044275283813477, "global_step": 11785, "epoch": 280} {"train_loss": -4.936306953430176, "global_step": 11786, "epoch": 280} {"train_loss": -5.036160469055176, "global_step": 11787, "epoch": 280} {"train_loss": -4.835709571838379, "global_step": 11788, "epoch": 280} {"train_loss": -5.103071689605713, "global_step": 11789, "epoch": 280} {"train_loss": -4.937660217285156, "global_step": 11790, "epoch": 280} {"train_loss": -5.134803771972656, "global_step": 11791, "epoch": 280} {"train_loss": -4.9933881759643555, "global_step": 11792, "epoch": 280} {"train_loss": -5.134599685668945, "global_step": 11793, "epoch": 280} {"train_loss": -5.120990753173828, "global_step": 11794, "epoch": 280} {"train_loss": -5.147401809692383, "global_step": 11795, "epoch": 280} {"train_loss": -5.088348865509033, "global_step": 11796, "epoch": 280} {"train_loss": -5.103031158447266, "global_step": 11797, "epoch": 280} {"train_loss": -5.138358116149902, "global_step": 11798, "epoch": 280} {"train_loss": -5.0522918701171875, "global_step": 11799, "epoch": 280} {"train_loss": -5.225156784057617, "global_step": 11800, "epoch": 280} {"train_loss": -5.073956739334833, "global_step": 11801, "epoch": 280, "val_loss": 75107.3828125} {"train_loss": -5.097681999206543, "global_step": 11802, "epoch": 281} {"train_loss": -5.050787925720215, "global_step": 11803, "epoch": 281} {"train_loss": -5.075678825378418, "global_step": 11804, "epoch": 281} {"train_loss": -4.979998588562012, "global_step": 11805, "epoch": 281} {"train_loss": -5.089766979217529, "global_step": 11806, "epoch": 281} {"train_loss": -5.110755443572998, "global_step": 11807, "epoch": 281} {"train_loss": -5.164761066436768, "global_step": 11808, "epoch": 281} {"train_loss": -5.0689167976379395, "global_step": 11809, "epoch": 281} {"train_loss": -5.147668361663818, "global_step": 11810, "epoch": 281} {"train_loss": -5.1324968338012695, "global_step": 11811, "epoch": 281} {"train_loss": -5.040713787078857, "global_step": 11812, "epoch": 281} {"train_loss": -5.150104522705078, "global_step": 11813, "epoch": 281} {"train_loss": -5.154982566833496, "global_step": 11814, "epoch": 281} {"train_loss": -5.015054702758789, "global_step": 11815, "epoch": 281} {"train_loss": -5.211321830749512, "global_step": 11816, "epoch": 281} {"train_loss": -5.139985084533691, "global_step": 11817, "epoch": 281} {"train_loss": -5.11796760559082, "global_step": 11818, "epoch": 281} {"train_loss": -5.1369476318359375, "global_step": 11819, "epoch": 281} {"train_loss": -5.1832733154296875, "global_step": 11820, "epoch": 281} {"train_loss": -5.116783618927002, "global_step": 11821, "epoch": 281} {"train_loss": -5.09304141998291, "global_step": 11822, "epoch": 281} {"train_loss": -5.161100387573242, "global_step": 11823, "epoch": 281} {"train_loss": -5.222332954406738, "global_step": 11824, "epoch": 281} {"train_loss": -5.121369361877441, "global_step": 11825, "epoch": 281} {"train_loss": -5.19333553314209, "global_step": 11826, "epoch": 281} {"train_loss": -5.028507232666016, "global_step": 11827, "epoch": 281} {"train_loss": -5.092883586883545, "global_step": 11828, "epoch": 281} {"train_loss": -5.240999698638916, "global_step": 11829, "epoch": 281} {"train_loss": -5.139447212219238, "global_step": 11830, "epoch": 281} {"train_loss": -5.11680793762207, "global_step": 11831, "epoch": 281} {"train_loss": -5.075900554656982, "global_step": 11832, "epoch": 281} {"train_loss": -5.197873115539551, "global_step": 11833, "epoch": 281} {"train_loss": -5.2314372062683105, "global_step": 11834, "epoch": 281} {"train_loss": -5.06889009475708, "global_step": 11835, "epoch": 281} {"train_loss": -5.143170356750488, "global_step": 11836, "epoch": 281} {"train_loss": -5.241018295288086, "global_step": 11837, "epoch": 281} {"train_loss": -5.235236167907715, "global_step": 11838, "epoch": 281} {"train_loss": -5.048089027404785, "global_step": 11839, "epoch": 281} {"train_loss": -5.296596527099609, "global_step": 11840, "epoch": 281} {"train_loss": -5.169184684753418, "global_step": 11841, "epoch": 281} {"train_loss": -5.105286598205566, "global_step": 11842, "epoch": 281} {"train_loss": -5.1330695719946, "global_step": 11843, "epoch": 281, "val_loss": 74379.8671875} {"train_loss": -5.153194904327393, "global_step": 11844, "epoch": 282} {"train_loss": -5.130004405975342, "global_step": 11845, "epoch": 282} {"train_loss": -5.012753486633301, "global_step": 11846, "epoch": 282} {"train_loss": -5.187089920043945, "global_step": 11847, "epoch": 282} {"train_loss": -5.17790412902832, "global_step": 11848, "epoch": 282} {"train_loss": -5.1894121170043945, "global_step": 11849, "epoch": 282} {"train_loss": -5.244307041168213, "global_step": 11850, "epoch": 282} {"train_loss": -5.247396469116211, "global_step": 11851, "epoch": 282} {"train_loss": -5.279448509216309, "global_step": 11852, "epoch": 282} {"train_loss": -5.2471923828125, "global_step": 11853, "epoch": 282} {"train_loss": -5.19386100769043, "global_step": 11854, "epoch": 282} {"train_loss": -5.0777387619018555, "global_step": 11855, "epoch": 282} {"train_loss": -5.184247016906738, "global_step": 11856, "epoch": 282} {"train_loss": -5.110702991485596, "global_step": 11857, "epoch": 282} {"train_loss": -5.029744625091553, "global_step": 11858, "epoch": 282} {"train_loss": -5.229330539703369, "global_step": 11859, "epoch": 282} {"train_loss": -5.175616264343262, "global_step": 11860, "epoch": 282} {"train_loss": -5.068310737609863, "global_step": 11861, "epoch": 282} {"train_loss": -4.935762405395508, "global_step": 11862, "epoch": 282} {"train_loss": -5.003969192504883, "global_step": 11863, "epoch": 282} {"train_loss": -4.902107238769531, "global_step": 11864, "epoch": 282} {"train_loss": -4.81565523147583, "global_step": 11865, "epoch": 282} {"train_loss": -4.896644592285156, "global_step": 11866, "epoch": 282} {"train_loss": -4.890080451965332, "global_step": 11867, "epoch": 282} {"train_loss": -5.100213527679443, "global_step": 11868, "epoch": 282} {"train_loss": -5.0611114501953125, "global_step": 11869, "epoch": 282} {"train_loss": -5.069751739501953, "global_step": 11870, "epoch": 282} {"train_loss": -5.08745002746582, "global_step": 11871, "epoch": 282} {"train_loss": -4.977156639099121, "global_step": 11872, "epoch": 282} {"train_loss": -4.868195533752441, "global_step": 11873, "epoch": 282} {"train_loss": -5.225451469421387, "global_step": 11874, "epoch": 282} {"train_loss": -5.125426292419434, "global_step": 11875, "epoch": 282} {"train_loss": -4.934990882873535, "global_step": 11876, "epoch": 282} {"train_loss": -5.132686138153076, "global_step": 11877, "epoch": 282} {"train_loss": -5.060591697692871, "global_step": 11878, "epoch": 282} {"train_loss": -5.211074352264404, "global_step": 11879, "epoch": 282} {"train_loss": -5.006438732147217, "global_step": 11880, "epoch": 282} {"train_loss": -5.202012538909912, "global_step": 11881, "epoch": 282} {"train_loss": -5.148208141326904, "global_step": 11882, "epoch": 282} {"train_loss": -5.117596626281738, "global_step": 11883, "epoch": 282} {"train_loss": -5.184235095977783, "global_step": 11884, "epoch": 282} {"train_loss": -5.094350440161569, "global_step": 11885, "epoch": 282, "val_loss": 74412.0} {"train_loss": -5.152006149291992, "global_step": 11886, "epoch": 283} {"train_loss": -5.161887168884277, "global_step": 11887, "epoch": 283} {"train_loss": -5.067129135131836, "global_step": 11888, "epoch": 283} {"train_loss": -5.169621467590332, "global_step": 11889, "epoch": 283} {"train_loss": -5.117162704467773, "global_step": 11890, "epoch": 283} {"train_loss": -5.23341178894043, "global_step": 11891, "epoch": 283} {"train_loss": -5.283684730529785, "global_step": 11892, "epoch": 283} {"train_loss": -5.214258193969727, "global_step": 11893, "epoch": 283} {"train_loss": -5.0942769050598145, "global_step": 11894, "epoch": 283} {"train_loss": -5.113655090332031, "global_step": 11895, "epoch": 283} {"train_loss": -5.143083095550537, "global_step": 11896, "epoch": 283} {"train_loss": -5.285891056060791, "global_step": 11897, "epoch": 283} {"train_loss": -5.14453649520874, "global_step": 11898, "epoch": 283} {"train_loss": -5.272486686706543, "global_step": 11899, "epoch": 283} {"train_loss": -5.153104782104492, "global_step": 11900, "epoch": 283} {"train_loss": -5.238097667694092, "global_step": 11901, "epoch": 283} {"train_loss": -4.990334510803223, "global_step": 11902, "epoch": 283} {"train_loss": -5.122875213623047, "global_step": 11903, "epoch": 283} {"train_loss": -4.949833869934082, "global_step": 11904, "epoch": 283} {"train_loss": -5.267457008361816, "global_step": 11905, "epoch": 283} {"train_loss": -5.148104667663574, "global_step": 11906, "epoch": 283} {"train_loss": -5.076816558837891, "global_step": 11907, "epoch": 283} {"train_loss": -5.215623378753662, "global_step": 11908, "epoch": 283} {"train_loss": -5.092740058898926, "global_step": 11909, "epoch": 283} {"train_loss": -5.058795928955078, "global_step": 11910, "epoch": 283} {"train_loss": -5.151483535766602, "global_step": 11911, "epoch": 283} {"train_loss": -5.098871231079102, "global_step": 11912, "epoch": 283} {"train_loss": -5.3188371658325195, "global_step": 11913, "epoch": 283} {"train_loss": -5.078784942626953, "global_step": 11914, "epoch": 283} {"train_loss": -5.157466888427734, "global_step": 11915, "epoch": 283} {"train_loss": -4.988103866577148, "global_step": 11916, "epoch": 283} {"train_loss": -5.002648830413818, "global_step": 11917, "epoch": 283} {"train_loss": -5.230424880981445, "global_step": 11918, "epoch": 283} {"train_loss": -4.990647315979004, "global_step": 11919, "epoch": 283} {"train_loss": -4.936827182769775, "global_step": 11920, "epoch": 283} {"train_loss": -5.21992301940918, "global_step": 11921, "epoch": 283} {"train_loss": -4.895159721374512, "global_step": 11922, "epoch": 283} {"train_loss": -5.034387111663818, "global_step": 11923, "epoch": 283} {"train_loss": -5.051538467407227, "global_step": 11924, "epoch": 283} {"train_loss": -5.111949920654297, "global_step": 11925, "epoch": 283} {"train_loss": -4.934283256530762, "global_step": 11926, "epoch": 283} {"train_loss": -5.119821275983538, "global_step": 11927, "epoch": 283, "val_loss": 76568.5625} {"train_loss": -5.11430025100708, "global_step": 11928, "epoch": 284} {"train_loss": -5.053791046142578, "global_step": 11929, "epoch": 284} {"train_loss": -5.131411075592041, "global_step": 11930, "epoch": 284} {"train_loss": -5.071285247802734, "global_step": 11931, "epoch": 284} {"train_loss": -5.2381510734558105, "global_step": 11932, "epoch": 284} {"train_loss": -4.965860843658447, "global_step": 11933, "epoch": 284} {"train_loss": -5.060110092163086, "global_step": 11934, "epoch": 284} {"train_loss": -5.135432243347168, "global_step": 11935, "epoch": 284} {"train_loss": -5.028191566467285, "global_step": 11936, "epoch": 284} {"train_loss": -5.136462211608887, "global_step": 11937, "epoch": 284} {"train_loss": -5.0457048416137695, "global_step": 11938, "epoch": 284} {"train_loss": -5.122397422790527, "global_step": 11939, "epoch": 284} {"train_loss": -5.027840614318848, "global_step": 11940, "epoch": 284} {"train_loss": -5.200697898864746, "global_step": 11941, "epoch": 284} {"train_loss": -5.186039924621582, "global_step": 11942, "epoch": 284} {"train_loss": -5.075584411621094, "global_step": 11943, "epoch": 284} {"train_loss": -5.04248046875, "global_step": 11944, "epoch": 284} {"train_loss": -5.097583293914795, "global_step": 11945, "epoch": 284} {"train_loss": -5.227626800537109, "global_step": 11946, "epoch": 284} {"train_loss": -5.07496452331543, "global_step": 11947, "epoch": 284} {"train_loss": -5.051114082336426, "global_step": 11948, "epoch": 284} {"train_loss": -5.143382549285889, "global_step": 11949, "epoch": 284} {"train_loss": -5.29778528213501, "global_step": 11950, "epoch": 284} {"train_loss": -5.212033271789551, "global_step": 11951, "epoch": 284} {"train_loss": -5.122319221496582, "global_step": 11952, "epoch": 284} {"train_loss": -5.31126594543457, "global_step": 11953, "epoch": 284} {"train_loss": -5.100829601287842, "global_step": 11954, "epoch": 284} {"train_loss": -5.087471961975098, "global_step": 11955, "epoch": 284} {"train_loss": -5.025936603546143, "global_step": 11956, "epoch": 284} {"train_loss": -5.187604904174805, "global_step": 11957, "epoch": 284} {"train_loss": -5.012773036956787, "global_step": 11958, "epoch": 284} {"train_loss": -5.154593467712402, "global_step": 11959, "epoch": 284} {"train_loss": -5.064126491546631, "global_step": 11960, "epoch": 284} {"train_loss": -5.1265950202941895, "global_step": 11961, "epoch": 284} {"train_loss": -5.170683860778809, "global_step": 11962, "epoch": 284} {"train_loss": -5.083550453186035, "global_step": 11963, "epoch": 284} {"train_loss": -5.15447998046875, "global_step": 11964, "epoch": 284} {"train_loss": -5.260663986206055, "global_step": 11965, "epoch": 284} {"train_loss": -5.071688652038574, "global_step": 11966, "epoch": 284} {"train_loss": -5.042771339416504, "global_step": 11967, "epoch": 284} {"train_loss": -5.0935797691345215, "global_step": 11968, "epoch": 284} {"train_loss": -5.118543954122634, "global_step": 11969, "epoch": 284, "val_loss": 75713.078125} {"train_loss": -5.054961204528809, "global_step": 11970, "epoch": 285} {"train_loss": -5.148722171783447, "global_step": 11971, "epoch": 285} {"train_loss": -5.137609481811523, "global_step": 11972, "epoch": 285} {"train_loss": -4.945408821105957, "global_step": 11973, "epoch": 285} {"train_loss": -5.102982521057129, "global_step": 11974, "epoch": 285} {"train_loss": -5.124963760375977, "global_step": 11975, "epoch": 285} {"train_loss": -5.043395042419434, "global_step": 11976, "epoch": 285} {"train_loss": -5.2516937255859375, "global_step": 11977, "epoch": 285} {"train_loss": -5.081840515136719, "global_step": 11978, "epoch": 285} {"train_loss": -5.0825114250183105, "global_step": 11979, "epoch": 285} {"train_loss": -5.124201774597168, "global_step": 11980, "epoch": 285} {"train_loss": -5.114993095397949, "global_step": 11981, "epoch": 285} {"train_loss": -5.090794086456299, "global_step": 11982, "epoch": 285} {"train_loss": -5.1857523918151855, "global_step": 11983, "epoch": 285} {"train_loss": -5.122003078460693, "global_step": 11984, "epoch": 285} {"train_loss": -4.917957305908203, "global_step": 11985, "epoch": 285} {"train_loss": -5.23738956451416, "global_step": 11986, "epoch": 285} {"train_loss": -5.170734405517578, "global_step": 11987, "epoch": 285} {"train_loss": -5.148439407348633, "global_step": 11988, "epoch": 285} {"train_loss": -5.135054588317871, "global_step": 11989, "epoch": 285} {"train_loss": -4.995510101318359, "global_step": 11990, "epoch": 285} {"train_loss": -5.112306118011475, "global_step": 11991, "epoch": 285} {"train_loss": -5.099495887756348, "global_step": 11992, "epoch": 285} {"train_loss": -5.1409759521484375, "global_step": 11993, "epoch": 285} {"train_loss": -5.053132057189941, "global_step": 11994, "epoch": 285} {"train_loss": -5.190903663635254, "global_step": 11995, "epoch": 285} {"train_loss": -5.210660457611084, "global_step": 11996, "epoch": 285} {"train_loss": -5.104053020477295, "global_step": 11997, "epoch": 285} {"train_loss": -5.007620334625244, "global_step": 11998, "epoch": 285} {"train_loss": -5.2706098556518555, "global_step": 11999, "epoch": 285} {"train_loss": -5.12758731842041, "global_step": 12000, "epoch": 285} {"train_loss": -5.207919120788574, "global_step": 12001, "epoch": 285} {"train_loss": -5.304389953613281, "global_step": 12002, "epoch": 285} {"train_loss": -5.059263229370117, "global_step": 12003, "epoch": 285} {"train_loss": -5.221541404724121, "global_step": 12004, "epoch": 285} {"train_loss": -5.230555534362793, "global_step": 12005, "epoch": 285} {"train_loss": -5.195586204528809, "global_step": 12006, "epoch": 285} {"train_loss": -5.21968412399292, "global_step": 12007, "epoch": 285} {"train_loss": -5.137779235839844, "global_step": 12008, "epoch": 285} {"train_loss": -5.333568572998047, "global_step": 12009, "epoch": 285} {"train_loss": -5.109968185424805, "global_step": 12010, "epoch": 285} {"train_loss": -5.133171274548485, "global_step": 12011, "epoch": 285, "val_loss": 74611.171875} {"train_loss": -5.091461181640625, "global_step": 12012, "epoch": 286} {"train_loss": -5.113916397094727, "global_step": 12013, "epoch": 286} {"train_loss": -5.307544708251953, "global_step": 12014, "epoch": 286} {"train_loss": -5.157476425170898, "global_step": 12015, "epoch": 286} {"train_loss": -5.171119213104248, "global_step": 12016, "epoch": 286} {"train_loss": -5.1640543937683105, "global_step": 12017, "epoch": 286} {"train_loss": -5.303689956665039, "global_step": 12018, "epoch": 286} {"train_loss": -5.218217849731445, "global_step": 12019, "epoch": 286} {"train_loss": -5.081057548522949, "global_step": 12020, "epoch": 286} {"train_loss": -5.114792823791504, "global_step": 12021, "epoch": 286} {"train_loss": -5.223664283752441, "global_step": 12022, "epoch": 286} {"train_loss": -5.178384780883789, "global_step": 12023, "epoch": 286} {"train_loss": -5.075308322906494, "global_step": 12024, "epoch": 286} {"train_loss": -5.112017631530762, "global_step": 12025, "epoch": 286} {"train_loss": -5.093387603759766, "global_step": 12026, "epoch": 286} {"train_loss": -5.17099666595459, "global_step": 12027, "epoch": 286} {"train_loss": -5.102588653564453, "global_step": 12028, "epoch": 286} {"train_loss": -5.177209854125977, "global_step": 12029, "epoch": 286} {"train_loss": -5.206055641174316, "global_step": 12030, "epoch": 286} {"train_loss": -5.17576265335083, "global_step": 12031, "epoch": 286} {"train_loss": -5.368253231048584, "global_step": 12032, "epoch": 286} {"train_loss": -5.159817218780518, "global_step": 12033, "epoch": 286} {"train_loss": -5.275399684906006, "global_step": 12034, "epoch": 286} {"train_loss": -5.111893653869629, "global_step": 12035, "epoch": 286} {"train_loss": -5.149837493896484, "global_step": 12036, "epoch": 286} {"train_loss": -5.2184247970581055, "global_step": 12037, "epoch": 286} {"train_loss": -5.234626770019531, "global_step": 12038, "epoch": 286} {"train_loss": -4.706991195678711, "global_step": 12039, "epoch": 286} {"train_loss": -5.074565887451172, "global_step": 12040, "epoch": 286} {"train_loss": -5.211973190307617, "global_step": 12041, "epoch": 286} {"train_loss": -4.936840057373047, "global_step": 12042, "epoch": 286} {"train_loss": -5.002863883972168, "global_step": 12043, "epoch": 286} {"train_loss": -4.972418785095215, "global_step": 12044, "epoch": 286} {"train_loss": -5.271379470825195, "global_step": 12045, "epoch": 286} {"train_loss": -4.945793151855469, "global_step": 12046, "epoch": 286} {"train_loss": -5.006743907928467, "global_step": 12047, "epoch": 286} {"train_loss": -4.977619171142578, "global_step": 12048, "epoch": 286} {"train_loss": -5.063205718994141, "global_step": 12049, "epoch": 286} {"train_loss": -5.187160968780518, "global_step": 12050, "epoch": 286} {"train_loss": -4.982819557189941, "global_step": 12051, "epoch": 286} {"train_loss": -5.0022501945495605, "global_step": 12052, "epoch": 286} {"train_loss": -5.125914289837792, "global_step": 12053, "epoch": 286, "val_loss": 74641.140625} {"train_loss": -5.044252395629883, "global_step": 12054, "epoch": 287} {"train_loss": -5.038574695587158, "global_step": 12055, "epoch": 287} {"train_loss": -5.175644874572754, "global_step": 12056, "epoch": 287} {"train_loss": -4.984238624572754, "global_step": 12057, "epoch": 287} {"train_loss": -5.212389945983887, "global_step": 12058, "epoch": 287} {"train_loss": -4.940698623657227, "global_step": 12059, "epoch": 287} {"train_loss": -5.052699089050293, "global_step": 12060, "epoch": 287} {"train_loss": -5.135931968688965, "global_step": 12061, "epoch": 287} {"train_loss": -4.908045291900635, "global_step": 12062, "epoch": 287} {"train_loss": -5.099587440490723, "global_step": 12063, "epoch": 287} {"train_loss": -5.030174732208252, "global_step": 12064, "epoch": 287} {"train_loss": -5.052436828613281, "global_step": 12065, "epoch": 287} {"train_loss": -5.083367347717285, "global_step": 12066, "epoch": 287} {"train_loss": -5.072542190551758, "global_step": 12067, "epoch": 287} {"train_loss": -5.144044876098633, "global_step": 12068, "epoch": 287} {"train_loss": -4.984864711761475, "global_step": 12069, "epoch": 287} {"train_loss": -5.085893630981445, "global_step": 12070, "epoch": 287} {"train_loss": -5.264379978179932, "global_step": 12071, "epoch": 287} {"train_loss": -5.054766654968262, "global_step": 12072, "epoch": 287} {"train_loss": -5.101024627685547, "global_step": 12073, "epoch": 287} {"train_loss": -5.117831230163574, "global_step": 12074, "epoch": 287} {"train_loss": -4.983558177947998, "global_step": 12075, "epoch": 287} {"train_loss": -5.071256160736084, "global_step": 12076, "epoch": 287} {"train_loss": -5.278582572937012, "global_step": 12077, "epoch": 287} {"train_loss": -5.17850399017334, "global_step": 12078, "epoch": 287} {"train_loss": -5.076590538024902, "global_step": 12079, "epoch": 287} {"train_loss": -5.079580783843994, "global_step": 12080, "epoch": 287} {"train_loss": -5.1148786544799805, "global_step": 12081, "epoch": 287} {"train_loss": -5.164746284484863, "global_step": 12082, "epoch": 287} {"train_loss": -5.194779872894287, "global_step": 12083, "epoch": 287} {"train_loss": -5.196059703826904, "global_step": 12084, "epoch": 287} {"train_loss": -5.150852203369141, "global_step": 12085, "epoch": 287} {"train_loss": -5.130825996398926, "global_step": 12086, "epoch": 287} {"train_loss": -5.071155548095703, "global_step": 12087, "epoch": 287} {"train_loss": -5.289989471435547, "global_step": 12088, "epoch": 287} {"train_loss": -5.078686714172363, "global_step": 12089, "epoch": 287} {"train_loss": -5.101829528808594, "global_step": 12090, "epoch": 287} {"train_loss": -5.136163234710693, "global_step": 12091, "epoch": 287} {"train_loss": -5.172811031341553, "global_step": 12092, "epoch": 287} {"train_loss": -5.1186933517456055, "global_step": 12093, "epoch": 287} {"train_loss": -5.203210830688477, "global_step": 12094, "epoch": 287} {"train_loss": -5.110798438390096, "global_step": 12095, "epoch": 287, "val_loss": 74412.8515625} {"train_loss": -5.014395713806152, "global_step": 12096, "epoch": 288} {"train_loss": -5.165009498596191, "global_step": 12097, "epoch": 288} {"train_loss": -5.273349761962891, "global_step": 12098, "epoch": 288} {"train_loss": -5.189703464508057, "global_step": 12099, "epoch": 288} {"train_loss": -5.22971248626709, "global_step": 12100, "epoch": 288} {"train_loss": -5.125577926635742, "global_step": 12101, "epoch": 288} {"train_loss": -5.202018737792969, "global_step": 12102, "epoch": 288} {"train_loss": -5.002499580383301, "global_step": 12103, "epoch": 288} {"train_loss": -5.035538673400879, "global_step": 12104, "epoch": 288} {"train_loss": -5.12534236907959, "global_step": 12105, "epoch": 288} {"train_loss": -5.143701553344727, "global_step": 12106, "epoch": 288} {"train_loss": -5.258882522583008, "global_step": 12107, "epoch": 288} {"train_loss": -5.047986030578613, "global_step": 12108, "epoch": 288} {"train_loss": -5.158822059631348, "global_step": 12109, "epoch": 288} {"train_loss": -4.9267072677612305, "global_step": 12110, "epoch": 288} {"train_loss": -5.09682035446167, "global_step": 12111, "epoch": 288} {"train_loss": -5.270471572875977, "global_step": 12112, "epoch": 288} {"train_loss": -5.127876281738281, "global_step": 12113, "epoch": 288} {"train_loss": -5.153897285461426, "global_step": 12114, "epoch": 288} {"train_loss": -5.1754536628723145, "global_step": 12115, "epoch": 288} {"train_loss": -5.152114391326904, "global_step": 12116, "epoch": 288} {"train_loss": -5.227909564971924, "global_step": 12117, "epoch": 288} {"train_loss": -5.206130027770996, "global_step": 12118, "epoch": 288} {"train_loss": -5.143778324127197, "global_step": 12119, "epoch": 288} {"train_loss": -5.223015785217285, "global_step": 12120, "epoch": 288} {"train_loss": -5.13072395324707, "global_step": 12121, "epoch": 288} {"train_loss": -5.144064426422119, "global_step": 12122, "epoch": 288} {"train_loss": -5.141597747802734, "global_step": 12123, "epoch": 288} {"train_loss": -5.000361442565918, "global_step": 12124, "epoch": 288} {"train_loss": -5.023305892944336, "global_step": 12125, "epoch": 288} {"train_loss": -5.171873092651367, "global_step": 12126, "epoch": 288} {"train_loss": -5.277186393737793, "global_step": 12127, "epoch": 288} {"train_loss": -5.187562465667725, "global_step": 12128, "epoch": 288} {"train_loss": -5.12067174911499, "global_step": 12129, "epoch": 288} {"train_loss": -5.354352951049805, "global_step": 12130, "epoch": 288} {"train_loss": -5.097305774688721, "global_step": 12131, "epoch": 288} {"train_loss": -5.0835771560668945, "global_step": 12132, "epoch": 288} {"train_loss": -5.148870468139648, "global_step": 12133, "epoch": 288} {"train_loss": -5.070950031280518, "global_step": 12134, "epoch": 288} {"train_loss": -5.065288543701172, "global_step": 12135, "epoch": 288} {"train_loss": -5.053397178649902, "global_step": 12136, "epoch": 288} {"train_loss": -5.141128381093343, "global_step": 12137, "epoch": 288, "val_loss": 74094.1640625} {"train_loss": -5.023830413818359, "global_step": 12138, "epoch": 289} {"train_loss": -5.148325443267822, "global_step": 12139, "epoch": 289} {"train_loss": -4.946393966674805, "global_step": 12140, "epoch": 289} {"train_loss": -5.121397018432617, "global_step": 12141, "epoch": 289} {"train_loss": -4.901547431945801, "global_step": 12142, "epoch": 289} {"train_loss": -4.995762825012207, "global_step": 12143, "epoch": 289} {"train_loss": -4.851737022399902, "global_step": 12144, "epoch": 289} {"train_loss": -4.982760906219482, "global_step": 12145, "epoch": 289} {"train_loss": -5.16513729095459, "global_step": 12146, "epoch": 289} {"train_loss": -4.866116523742676, "global_step": 12147, "epoch": 289} {"train_loss": -5.182379722595215, "global_step": 12148, "epoch": 289} {"train_loss": -5.096255302429199, "global_step": 12149, "epoch": 289} {"train_loss": -5.083237648010254, "global_step": 12150, "epoch": 289} {"train_loss": -5.22325325012207, "global_step": 12151, "epoch": 289} {"train_loss": -4.978768348693848, "global_step": 12152, "epoch": 289} {"train_loss": -5.20165491104126, "global_step": 12153, "epoch": 289} {"train_loss": -5.188899517059326, "global_step": 12154, "epoch": 289} {"train_loss": -5.108587265014648, "global_step": 12155, "epoch": 289} {"train_loss": -5.249911785125732, "global_step": 12156, "epoch": 289} {"train_loss": -5.249822616577148, "global_step": 12157, "epoch": 289} {"train_loss": -5.05136775970459, "global_step": 12158, "epoch": 289} {"train_loss": -5.123383045196533, "global_step": 12159, "epoch": 289} {"train_loss": -5.247345924377441, "global_step": 12160, "epoch": 289} {"train_loss": -5.228024005889893, "global_step": 12161, "epoch": 289} {"train_loss": -5.232479572296143, "global_step": 12162, "epoch": 289} {"train_loss": -5.274519443511963, "global_step": 12163, "epoch": 289} {"train_loss": -5.184713363647461, "global_step": 12164, "epoch": 289} {"train_loss": -5.113672256469727, "global_step": 12165, "epoch": 289} {"train_loss": -5.352110862731934, "global_step": 12166, "epoch": 289} {"train_loss": -5.127799987792969, "global_step": 12167, "epoch": 289} {"train_loss": -5.122485160827637, "global_step": 12168, "epoch": 289} {"train_loss": -5.065710067749023, "global_step": 12169, "epoch": 289} {"train_loss": -5.132966995239258, "global_step": 12170, "epoch": 289} {"train_loss": -5.185293197631836, "global_step": 12171, "epoch": 289} {"train_loss": -5.014861106872559, "global_step": 12172, "epoch": 289} {"train_loss": -5.054476737976074, "global_step": 12173, "epoch": 289} {"train_loss": -5.341566562652588, "global_step": 12174, "epoch": 289} {"train_loss": -5.028977394104004, "global_step": 12175, "epoch": 289} {"train_loss": -5.151096343994141, "global_step": 12176, "epoch": 289} {"train_loss": -5.096640586853027, "global_step": 12177, "epoch": 289} {"train_loss": -5.179444313049316, "global_step": 12178, "epoch": 289} {"train_loss": -5.120618570418585, "global_step": 12179, "epoch": 289, "val_loss": 74429.8359375} {"train_loss": -5.092436790466309, "global_step": 12180, "epoch": 290} {"train_loss": -5.2118239402771, "global_step": 12181, "epoch": 290} {"train_loss": -5.22677755355835, "global_step": 12182, "epoch": 290} {"train_loss": -5.262346267700195, "global_step": 12183, "epoch": 290} {"train_loss": -5.159378528594971, "global_step": 12184, "epoch": 290} {"train_loss": -5.168098449707031, "global_step": 12185, "epoch": 290} {"train_loss": -5.150196552276611, "global_step": 12186, "epoch": 290} {"train_loss": -5.095013618469238, "global_step": 12187, "epoch": 290} {"train_loss": -5.230395317077637, "global_step": 12188, "epoch": 290} {"train_loss": -4.999961853027344, "global_step": 12189, "epoch": 290} {"train_loss": -5.1659650802612305, "global_step": 12190, "epoch": 290} {"train_loss": -5.22799015045166, "global_step": 12191, "epoch": 290} {"train_loss": -5.2754807472229, "global_step": 12192, "epoch": 290} {"train_loss": -5.10560417175293, "global_step": 12193, "epoch": 290} {"train_loss": -5.083420753479004, "global_step": 12194, "epoch": 290} {"train_loss": -5.156482696533203, "global_step": 12195, "epoch": 290} {"train_loss": -5.032049655914307, "global_step": 12196, "epoch": 290} {"train_loss": -5.239372253417969, "global_step": 12197, "epoch": 290} {"train_loss": -5.0879998207092285, "global_step": 12198, "epoch": 290} {"train_loss": -5.056186676025391, "global_step": 12199, "epoch": 290} {"train_loss": -5.152145862579346, "global_step": 12200, "epoch": 290} {"train_loss": -5.169498443603516, "global_step": 12201, "epoch": 290} {"train_loss": -5.076572418212891, "global_step": 12202, "epoch": 290} {"train_loss": -5.0649542808532715, "global_step": 12203, "epoch": 290} {"train_loss": -4.979140281677246, "global_step": 12204, "epoch": 290} {"train_loss": -5.050512313842773, "global_step": 12205, "epoch": 290} {"train_loss": -5.003810882568359, "global_step": 12206, "epoch": 290} {"train_loss": -5.038246154785156, "global_step": 12207, "epoch": 290} {"train_loss": -5.150312423706055, "global_step": 12208, "epoch": 290} {"train_loss": -5.1068315505981445, "global_step": 12209, "epoch": 290} {"train_loss": -4.959729194641113, "global_step": 12210, "epoch": 290} {"train_loss": -5.05202579498291, "global_step": 12211, "epoch": 290} {"train_loss": -5.036819934844971, "global_step": 12212, "epoch": 290} {"train_loss": -5.149886131286621, "global_step": 12213, "epoch": 290} {"train_loss": -5.169989109039307, "global_step": 12214, "epoch": 290} {"train_loss": -5.0428667068481445, "global_step": 12215, "epoch": 290} {"train_loss": -5.077561378479004, "global_step": 12216, "epoch": 290} {"train_loss": -5.063600540161133, "global_step": 12217, "epoch": 290} {"train_loss": -5.082931995391846, "global_step": 12218, "epoch": 290} {"train_loss": -5.123182773590088, "global_step": 12219, "epoch": 290} {"train_loss": -5.198455810546875, "global_step": 12220, "epoch": 290} {"train_loss": -5.118165686016991, "global_step": 12221, "epoch": 290, "val_loss": 74938.3359375} {"train_loss": -5.1180100440979, "global_step": 12222, "epoch": 291} {"train_loss": -5.095233917236328, "global_step": 12223, "epoch": 291} {"train_loss": -5.186478614807129, "global_step": 12224, "epoch": 291} {"train_loss": -5.266984462738037, "global_step": 12225, "epoch": 291} {"train_loss": -5.217123031616211, "global_step": 12226, "epoch": 291} {"train_loss": -5.127725601196289, "global_step": 12227, "epoch": 291} {"train_loss": -5.07526159286499, "global_step": 12228, "epoch": 291} {"train_loss": -5.13848876953125, "global_step": 12229, "epoch": 291} {"train_loss": -5.208920478820801, "global_step": 12230, "epoch": 291} {"train_loss": -5.085977554321289, "global_step": 12231, "epoch": 291} {"train_loss": -4.925950050354004, "global_step": 12232, "epoch": 291} {"train_loss": -5.258321762084961, "global_step": 12233, "epoch": 291} {"train_loss": -5.178867340087891, "global_step": 12234, "epoch": 291} {"train_loss": -5.221174240112305, "global_step": 12235, "epoch": 291} {"train_loss": -5.1934895515441895, "global_step": 12236, "epoch": 291} {"train_loss": -4.892548561096191, "global_step": 12237, "epoch": 291} {"train_loss": -5.056191921234131, "global_step": 12238, "epoch": 291} {"train_loss": -5.127516746520996, "global_step": 12239, "epoch": 291} {"train_loss": -5.044266223907471, "global_step": 12240, "epoch": 291} {"train_loss": -5.183553218841553, "global_step": 12241, "epoch": 291} {"train_loss": -5.129872798919678, "global_step": 12242, "epoch": 291} {"train_loss": -5.130256652832031, "global_step": 12243, "epoch": 291} {"train_loss": -5.1730804443359375, "global_step": 12244, "epoch": 291} {"train_loss": -5.133368492126465, "global_step": 12245, "epoch": 291} {"train_loss": -5.025041103363037, "global_step": 12246, "epoch": 291} {"train_loss": -5.052524089813232, "global_step": 12247, "epoch": 291} {"train_loss": -4.928476333618164, "global_step": 12248, "epoch": 291} {"train_loss": -5.076693534851074, "global_step": 12249, "epoch": 291} {"train_loss": -5.036470890045166, "global_step": 12250, "epoch": 291} {"train_loss": -4.9623565673828125, "global_step": 12251, "epoch": 291} {"train_loss": -5.070409297943115, "global_step": 12252, "epoch": 291} {"train_loss": -5.060243606567383, "global_step": 12253, "epoch": 291} {"train_loss": -5.05897855758667, "global_step": 12254, "epoch": 291} {"train_loss": -5.044326305389404, "global_step": 12255, "epoch": 291} {"train_loss": -4.9913177490234375, "global_step": 12256, "epoch": 291} {"train_loss": -5.160305976867676, "global_step": 12257, "epoch": 291} {"train_loss": -4.870981216430664, "global_step": 12258, "epoch": 291} {"train_loss": -5.089874267578125, "global_step": 12259, "epoch": 291} {"train_loss": -5.2045979499816895, "global_step": 12260, "epoch": 291} {"train_loss": -5.1489787101745605, "global_step": 12261, "epoch": 291} {"train_loss": -5.085450172424316, "global_step": 12262, "epoch": 291} {"train_loss": -5.100423460914975, "global_step": 12263, "epoch": 291, "val_loss": 74633.0859375} {"train_loss": -4.94960880279541, "global_step": 12264, "epoch": 292} {"train_loss": -5.022737979888916, "global_step": 12265, "epoch": 292} {"train_loss": -5.024813652038574, "global_step": 12266, "epoch": 292} {"train_loss": -5.126317977905273, "global_step": 12267, "epoch": 292} {"train_loss": -5.09027099609375, "global_step": 12268, "epoch": 292} {"train_loss": -4.980542182922363, "global_step": 12269, "epoch": 292} {"train_loss": -5.143787860870361, "global_step": 12270, "epoch": 292} {"train_loss": -5.079977989196777, "global_step": 12271, "epoch": 292} {"train_loss": -5.213748455047607, "global_step": 12272, "epoch": 292} {"train_loss": -5.255918979644775, "global_step": 12273, "epoch": 292} {"train_loss": -5.014033317565918, "global_step": 12274, "epoch": 292} {"train_loss": -5.138497352600098, "global_step": 12275, "epoch": 292} {"train_loss": -5.180848121643066, "global_step": 12276, "epoch": 292} {"train_loss": -5.001623153686523, "global_step": 12277, "epoch": 292} {"train_loss": -5.186923503875732, "global_step": 12278, "epoch": 292} {"train_loss": -5.154786586761475, "global_step": 12279, "epoch": 292} {"train_loss": -4.936901569366455, "global_step": 12280, "epoch": 292} {"train_loss": -5.183228492736816, "global_step": 12281, "epoch": 292} {"train_loss": -5.198923110961914, "global_step": 12282, "epoch": 292} {"train_loss": -5.117486476898193, "global_step": 12283, "epoch": 292} {"train_loss": -5.080228805541992, "global_step": 12284, "epoch": 292} {"train_loss": -5.233697414398193, "global_step": 12285, "epoch": 292} {"train_loss": -5.05978536605835, "global_step": 12286, "epoch": 292} {"train_loss": -5.187387466430664, "global_step": 12287, "epoch": 292} {"train_loss": -5.165445327758789, "global_step": 12288, "epoch": 292} {"train_loss": -5.242682456970215, "global_step": 12289, "epoch": 292} {"train_loss": -5.145488739013672, "global_step": 12290, "epoch": 292} {"train_loss": -5.0185041427612305, "global_step": 12291, "epoch": 292} {"train_loss": -5.162619590759277, "global_step": 12292, "epoch": 292} {"train_loss": -5.130341053009033, "global_step": 12293, "epoch": 292} {"train_loss": -5.189408302307129, "global_step": 12294, "epoch": 292} {"train_loss": -5.238245964050293, "global_step": 12295, "epoch": 292} {"train_loss": -5.114380836486816, "global_step": 12296, "epoch": 292} {"train_loss": -5.158235549926758, "global_step": 12297, "epoch": 292} {"train_loss": -5.157644271850586, "global_step": 12298, "epoch": 292} {"train_loss": -5.0766777992248535, "global_step": 12299, "epoch": 292} {"train_loss": -5.2884416580200195, "global_step": 12300, "epoch": 292} {"train_loss": -4.9984259605407715, "global_step": 12301, "epoch": 292} {"train_loss": -5.030718803405762, "global_step": 12302, "epoch": 292} {"train_loss": -5.214443683624268, "global_step": 12303, "epoch": 292} {"train_loss": -5.105024337768555, "global_step": 12304, "epoch": 292} {"train_loss": -5.119020609628587, "global_step": 12305, "epoch": 292, "val_loss": 74319.890625} {"train_loss": -5.048662185668945, "global_step": 12306, "epoch": 293} {"train_loss": -5.09615421295166, "global_step": 12307, "epoch": 293} {"train_loss": -5.081037521362305, "global_step": 12308, "epoch": 293} {"train_loss": -5.169330596923828, "global_step": 12309, "epoch": 293} {"train_loss": -5.23544979095459, "global_step": 12310, "epoch": 293} {"train_loss": -5.004945755004883, "global_step": 12311, "epoch": 293} {"train_loss": -5.165655136108398, "global_step": 12312, "epoch": 293} {"train_loss": -5.0238423347473145, "global_step": 12313, "epoch": 293} {"train_loss": -5.178999900817871, "global_step": 12314, "epoch": 293} {"train_loss": -5.092253684997559, "global_step": 12315, "epoch": 293} {"train_loss": -5.111941814422607, "global_step": 12316, "epoch": 293} {"train_loss": -5.166630744934082, "global_step": 12317, "epoch": 293} {"train_loss": -5.2593512535095215, "global_step": 12318, "epoch": 293} {"train_loss": -5.096657752990723, "global_step": 12319, "epoch": 293} {"train_loss": -5.170279502868652, "global_step": 12320, "epoch": 293} {"train_loss": -5.239096164703369, "global_step": 12321, "epoch": 293} {"train_loss": -5.119533061981201, "global_step": 12322, "epoch": 293} {"train_loss": -5.21414041519165, "global_step": 12323, "epoch": 293} {"train_loss": -5.271777629852295, "global_step": 12324, "epoch": 293} {"train_loss": -5.222620964050293, "global_step": 12325, "epoch": 293} {"train_loss": -5.133881568908691, "global_step": 12326, "epoch": 293} {"train_loss": -5.201652526855469, "global_step": 12327, "epoch": 293} {"train_loss": -4.954192161560059, "global_step": 12328, "epoch": 293} {"train_loss": -5.139936923980713, "global_step": 12329, "epoch": 293} {"train_loss": -5.12877082824707, "global_step": 12330, "epoch": 293} {"train_loss": -5.111728191375732, "global_step": 12331, "epoch": 293} {"train_loss": -5.1883392333984375, "global_step": 12332, "epoch": 293} {"train_loss": -5.1116204261779785, "global_step": 12333, "epoch": 293} {"train_loss": -5.229809761047363, "global_step": 12334, "epoch": 293} {"train_loss": -5.282086372375488, "global_step": 12335, "epoch": 293} {"train_loss": -5.307676792144775, "global_step": 12336, "epoch": 293} {"train_loss": -5.227438926696777, "global_step": 12337, "epoch": 293} {"train_loss": -5.148099899291992, "global_step": 12338, "epoch": 293} {"train_loss": -5.252054214477539, "global_step": 12339, "epoch": 293} {"train_loss": -5.155275344848633, "global_step": 12340, "epoch": 293} {"train_loss": -5.19548225402832, "global_step": 12341, "epoch": 293} {"train_loss": -5.258070945739746, "global_step": 12342, "epoch": 293} {"train_loss": -5.2038373947143555, "global_step": 12343, "epoch": 293} {"train_loss": -5.242288112640381, "global_step": 12344, "epoch": 293} {"train_loss": -5.021455764770508, "global_step": 12345, "epoch": 293} {"train_loss": -5.088200092315674, "global_step": 12346, "epoch": 293} {"train_loss": -5.159909634363084, "global_step": 12347, "epoch": 293, "val_loss": 74433.5625} {"train_loss": -5.0731353759765625, "global_step": 12348, "epoch": 294} {"train_loss": -5.0132036209106445, "global_step": 12349, "epoch": 294} {"train_loss": -5.367176055908203, "global_step": 12350, "epoch": 294} {"train_loss": -5.314140319824219, "global_step": 12351, "epoch": 294} {"train_loss": -5.350732803344727, "global_step": 12352, "epoch": 294} {"train_loss": -5.173028945922852, "global_step": 12353, "epoch": 294} {"train_loss": -5.145214080810547, "global_step": 12354, "epoch": 294} {"train_loss": -5.057217597961426, "global_step": 12355, "epoch": 294} {"train_loss": -5.09388542175293, "global_step": 12356, "epoch": 294} {"train_loss": -5.089018821716309, "global_step": 12357, "epoch": 294} {"train_loss": -5.242746353149414, "global_step": 12358, "epoch": 294} {"train_loss": -5.16532039642334, "global_step": 12359, "epoch": 294} {"train_loss": -4.964456558227539, "global_step": 12360, "epoch": 294} {"train_loss": -5.320406913757324, "global_step": 12361, "epoch": 294} {"train_loss": -5.104069709777832, "global_step": 12362, "epoch": 294} {"train_loss": -5.0500688552856445, "global_step": 12363, "epoch": 294} {"train_loss": -5.081120491027832, "global_step": 12364, "epoch": 294} {"train_loss": -5.187501907348633, "global_step": 12365, "epoch": 294} {"train_loss": -5.268738746643066, "global_step": 12366, "epoch": 294} {"train_loss": -5.17996883392334, "global_step": 12367, "epoch": 294} {"train_loss": -5.189504146575928, "global_step": 12368, "epoch": 294} {"train_loss": -5.123588562011719, "global_step": 12369, "epoch": 294} {"train_loss": -5.086522579193115, "global_step": 12370, "epoch": 294} {"train_loss": -5.258266925811768, "global_step": 12371, "epoch": 294} {"train_loss": -5.074677467346191, "global_step": 12372, "epoch": 294} {"train_loss": -5.236482620239258, "global_step": 12373, "epoch": 294} {"train_loss": -5.185404300689697, "global_step": 12374, "epoch": 294} {"train_loss": -5.174257278442383, "global_step": 12375, "epoch": 294} {"train_loss": -5.053264141082764, "global_step": 12376, "epoch": 294} {"train_loss": -5.236965179443359, "global_step": 12377, "epoch": 294} {"train_loss": -5.1539998054504395, "global_step": 12378, "epoch": 294} {"train_loss": -5.160684108734131, "global_step": 12379, "epoch": 294} {"train_loss": -5.0891313552856445, "global_step": 12380, "epoch": 294} {"train_loss": -5.244953155517578, "global_step": 12381, "epoch": 294} {"train_loss": -5.288524627685547, "global_step": 12382, "epoch": 294} {"train_loss": -5.117762565612793, "global_step": 12383, "epoch": 294} {"train_loss": -5.12674617767334, "global_step": 12384, "epoch": 294} {"train_loss": -5.292827606201172, "global_step": 12385, "epoch": 294} {"train_loss": -5.082729339599609, "global_step": 12386, "epoch": 294} {"train_loss": -5.0034942626953125, "global_step": 12387, "epoch": 294} {"train_loss": -5.127003192901611, "global_step": 12388, "epoch": 294} {"train_loss": -5.156486000333514, "global_step": 12389, "epoch": 294, "val_loss": 74647.9921875} {"train_loss": -5.070408344268799, "global_step": 12390, "epoch": 295} {"train_loss": -5.135113716125488, "global_step": 12391, "epoch": 295} {"train_loss": -5.089873313903809, "global_step": 12392, "epoch": 295} {"train_loss": -5.165533065795898, "global_step": 12393, "epoch": 295} {"train_loss": -5.253816604614258, "global_step": 12394, "epoch": 295} {"train_loss": -5.086064338684082, "global_step": 12395, "epoch": 295} {"train_loss": -5.1075334548950195, "global_step": 12396, "epoch": 295} {"train_loss": -5.227259159088135, "global_step": 12397, "epoch": 295} {"train_loss": -5.098791122436523, "global_step": 12398, "epoch": 295} {"train_loss": -5.176169395446777, "global_step": 12399, "epoch": 295} {"train_loss": -5.191941261291504, "global_step": 12400, "epoch": 295} {"train_loss": -5.1122355461120605, "global_step": 12401, "epoch": 295} {"train_loss": -5.14973783493042, "global_step": 12402, "epoch": 295} {"train_loss": -5.108454704284668, "global_step": 12403, "epoch": 295} {"train_loss": -5.059473991394043, "global_step": 12404, "epoch": 295} {"train_loss": -5.090623378753662, "global_step": 12405, "epoch": 295} {"train_loss": -5.109102249145508, "global_step": 12406, "epoch": 295} {"train_loss": -4.975608825683594, "global_step": 12407, "epoch": 295} {"train_loss": -5.033018112182617, "global_step": 12408, "epoch": 295} {"train_loss": -5.22672176361084, "global_step": 12409, "epoch": 295} {"train_loss": -5.108870029449463, "global_step": 12410, "epoch": 295} {"train_loss": -5.188014030456543, "global_step": 12411, "epoch": 295} {"train_loss": -5.062948226928711, "global_step": 12412, "epoch": 295} {"train_loss": -5.028789520263672, "global_step": 12413, "epoch": 295} {"train_loss": -5.13081169128418, "global_step": 12414, "epoch": 295} {"train_loss": -4.85637092590332, "global_step": 12415, "epoch": 295} {"train_loss": -5.13637113571167, "global_step": 12416, "epoch": 295} {"train_loss": -4.978841781616211, "global_step": 12417, "epoch": 295} {"train_loss": -5.042607307434082, "global_step": 12418, "epoch": 295} {"train_loss": -5.139127731323242, "global_step": 12419, "epoch": 295} {"train_loss": -5.020322799682617, "global_step": 12420, "epoch": 295} {"train_loss": -4.924004554748535, "global_step": 12421, "epoch": 295} {"train_loss": -5.042304992675781, "global_step": 12422, "epoch": 295} {"train_loss": -4.954157829284668, "global_step": 12423, "epoch": 295} {"train_loss": -5.154315948486328, "global_step": 12424, "epoch": 295} {"train_loss": -5.019871711730957, "global_step": 12425, "epoch": 295} {"train_loss": -5.1888203620910645, "global_step": 12426, "epoch": 295} {"train_loss": -4.851885795593262, "global_step": 12427, "epoch": 295} {"train_loss": -5.192852973937988, "global_step": 12428, "epoch": 295} {"train_loss": -4.96968936920166, "global_step": 12429, "epoch": 295} {"train_loss": -5.131267547607422, "global_step": 12430, "epoch": 295} {"train_loss": -5.087074098132906, "global_step": 12431, "epoch": 295, "val_loss": 73901.09375} {"train_loss": -4.994982719421387, "global_step": 12432, "epoch": 296} {"train_loss": -5.2643327713012695, "global_step": 12433, "epoch": 296} {"train_loss": -5.101078033447266, "global_step": 12434, "epoch": 296} {"train_loss": -5.0339531898498535, "global_step": 12435, "epoch": 296} {"train_loss": -4.945323467254639, "global_step": 12436, "epoch": 296} {"train_loss": -5.126570701599121, "global_step": 12437, "epoch": 296} {"train_loss": -4.9899163246154785, "global_step": 12438, "epoch": 296} {"train_loss": -5.223715782165527, "global_step": 12439, "epoch": 296} {"train_loss": -5.025215148925781, "global_step": 12440, "epoch": 296} {"train_loss": -5.0829315185546875, "global_step": 12441, "epoch": 296} {"train_loss": -5.146580219268799, "global_step": 12442, "epoch": 296} {"train_loss": -4.987482070922852, "global_step": 12443, "epoch": 296} {"train_loss": -5.215250015258789, "global_step": 12444, "epoch": 296} {"train_loss": -5.125085830688477, "global_step": 12445, "epoch": 296} {"train_loss": -5.218977928161621, "global_step": 12446, "epoch": 296} {"train_loss": -5.067177772521973, "global_step": 12447, "epoch": 296} {"train_loss": -5.245545387268066, "global_step": 12448, "epoch": 296} {"train_loss": -5.348409175872803, "global_step": 12449, "epoch": 296} {"train_loss": -5.1226019859313965, "global_step": 12450, "epoch": 296} {"train_loss": -5.234611511230469, "global_step": 12451, "epoch": 296} {"train_loss": -5.195644378662109, "global_step": 12452, "epoch": 296} {"train_loss": -5.166744232177734, "global_step": 12453, "epoch": 296} {"train_loss": -5.037778854370117, "global_step": 12454, "epoch": 296} {"train_loss": -5.109025001525879, "global_step": 12455, "epoch": 296} {"train_loss": -5.14429235458374, "global_step": 12456, "epoch": 296} {"train_loss": -5.213898658752441, "global_step": 12457, "epoch": 296} {"train_loss": -5.137294292449951, "global_step": 12458, "epoch": 296} {"train_loss": -5.213227272033691, "global_step": 12459, "epoch": 296} {"train_loss": -5.1226019859313965, "global_step": 12460, "epoch": 296} {"train_loss": -5.385770797729492, "global_step": 12461, "epoch": 296} {"train_loss": -5.157410621643066, "global_step": 12462, "epoch": 296} {"train_loss": -5.360394477844238, "global_step": 12463, "epoch": 296} {"train_loss": -5.195374011993408, "global_step": 12464, "epoch": 296} {"train_loss": -5.059332370758057, "global_step": 12465, "epoch": 296} {"train_loss": -5.176603317260742, "global_step": 12466, "epoch": 296} {"train_loss": -5.016412734985352, "global_step": 12467, "epoch": 296} {"train_loss": -5.0228071212768555, "global_step": 12468, "epoch": 296} {"train_loss": -5.139923095703125, "global_step": 12469, "epoch": 296} {"train_loss": -5.268588542938232, "global_step": 12470, "epoch": 296} {"train_loss": -5.07971715927124, "global_step": 12471, "epoch": 296} {"train_loss": -5.053752422332764, "global_step": 12472, "epoch": 296} {"train_loss": -5.143394413448515, "global_step": 12473, "epoch": 296, "val_loss": 73985.96875} {"train_loss": -5.103177070617676, "global_step": 12474, "epoch": 297} {"train_loss": -5.1721391677856445, "global_step": 12475, "epoch": 297} {"train_loss": -5.191403388977051, "global_step": 12476, "epoch": 297} {"train_loss": -5.062648773193359, "global_step": 12477, "epoch": 297} {"train_loss": -5.046560287475586, "global_step": 12478, "epoch": 297} {"train_loss": -5.169618606567383, "global_step": 12479, "epoch": 297} {"train_loss": -5.0603532791137695, "global_step": 12480, "epoch": 297} {"train_loss": -5.098468780517578, "global_step": 12481, "epoch": 297} {"train_loss": -5.203611850738525, "global_step": 12482, "epoch": 297} {"train_loss": -5.165902137756348, "global_step": 12483, "epoch": 297} {"train_loss": -5.165571212768555, "global_step": 12484, "epoch": 297} {"train_loss": -5.222710609436035, "global_step": 12485, "epoch": 297} {"train_loss": -5.09783935546875, "global_step": 12486, "epoch": 297} {"train_loss": -5.23833703994751, "global_step": 12487, "epoch": 297} {"train_loss": -5.054329872131348, "global_step": 12488, "epoch": 297} {"train_loss": -5.001999378204346, "global_step": 12489, "epoch": 297} {"train_loss": -5.107417106628418, "global_step": 12490, "epoch": 297} {"train_loss": -5.123866558074951, "global_step": 12491, "epoch": 297} {"train_loss": -5.085622310638428, "global_step": 12492, "epoch": 297} {"train_loss": -5.166309833526611, "global_step": 12493, "epoch": 297} {"train_loss": -5.270380020141602, "global_step": 12494, "epoch": 297} {"train_loss": -5.211027145385742, "global_step": 12495, "epoch": 297} {"train_loss": -5.146495342254639, "global_step": 12496, "epoch": 297} {"train_loss": -5.175868988037109, "global_step": 12497, "epoch": 297} {"train_loss": -5.30034875869751, "global_step": 12498, "epoch": 297} {"train_loss": -5.069149971008301, "global_step": 12499, "epoch": 297} {"train_loss": -5.111258029937744, "global_step": 12500, "epoch": 297} {"train_loss": -5.172154426574707, "global_step": 12501, "epoch": 297} {"train_loss": -5.112418174743652, "global_step": 12502, "epoch": 297} {"train_loss": -5.0792083740234375, "global_step": 12503, "epoch": 297} {"train_loss": -5.27999210357666, "global_step": 12504, "epoch": 297} {"train_loss": -5.1094512939453125, "global_step": 12505, "epoch": 297} {"train_loss": -5.241019248962402, "global_step": 12506, "epoch": 297} {"train_loss": -5.23504638671875, "global_step": 12507, "epoch": 297} {"train_loss": -5.12614631652832, "global_step": 12508, "epoch": 297} {"train_loss": -5.20604133605957, "global_step": 12509, "epoch": 297} {"train_loss": -5.103853702545166, "global_step": 12510, "epoch": 297} {"train_loss": -5.158867835998535, "global_step": 12511, "epoch": 297} {"train_loss": -5.246598243713379, "global_step": 12512, "epoch": 297} {"train_loss": -5.0707316398620605, "global_step": 12513, "epoch": 297} {"train_loss": -5.291355133056641, "global_step": 12514, "epoch": 297} {"train_loss": -5.15635127112979, "global_step": 12515, "epoch": 297, "val_loss": 74165.03125} {"train_loss": -5.093012809753418, "global_step": 12516, "epoch": 298} {"train_loss": -5.098852634429932, "global_step": 12517, "epoch": 298} {"train_loss": -5.20089864730835, "global_step": 12518, "epoch": 298} {"train_loss": -5.008325576782227, "global_step": 12519, "epoch": 298} {"train_loss": -5.207272052764893, "global_step": 12520, "epoch": 298} {"train_loss": -5.215202808380127, "global_step": 12521, "epoch": 298} {"train_loss": -5.234588623046875, "global_step": 12522, "epoch": 298} {"train_loss": -5.123866558074951, "global_step": 12523, "epoch": 298} {"train_loss": -5.044631004333496, "global_step": 12524, "epoch": 298} {"train_loss": -5.206747055053711, "global_step": 12525, "epoch": 298} {"train_loss": -5.084007740020752, "global_step": 12526, "epoch": 298} {"train_loss": -4.9941725730896, "global_step": 12527, "epoch": 298} {"train_loss": -5.103964805603027, "global_step": 12528, "epoch": 298} {"train_loss": -5.235439300537109, "global_step": 12529, "epoch": 298} {"train_loss": -5.031126976013184, "global_step": 12530, "epoch": 298} {"train_loss": -5.21351432800293, "global_step": 12531, "epoch": 298} {"train_loss": -5.139130115509033, "global_step": 12532, "epoch": 298} {"train_loss": -5.0118913650512695, "global_step": 12533, "epoch": 298} {"train_loss": -5.121439456939697, "global_step": 12534, "epoch": 298} {"train_loss": -5.059823989868164, "global_step": 12535, "epoch": 298} {"train_loss": -5.167952060699463, "global_step": 12536, "epoch": 298} {"train_loss": -5.257254123687744, "global_step": 12537, "epoch": 298} {"train_loss": -5.1878437995910645, "global_step": 12538, "epoch": 298} {"train_loss": -5.192481994628906, "global_step": 12539, "epoch": 298} {"train_loss": -5.264556884765625, "global_step": 12540, "epoch": 298} {"train_loss": -5.236423969268799, "global_step": 12541, "epoch": 298} {"train_loss": -5.227217674255371, "global_step": 12542, "epoch": 298} {"train_loss": -5.122999668121338, "global_step": 12543, "epoch": 298} {"train_loss": -5.19312858581543, "global_step": 12544, "epoch": 298} {"train_loss": -5.141529083251953, "global_step": 12545, "epoch": 298} {"train_loss": -5.059667110443115, "global_step": 12546, "epoch": 298} {"train_loss": -5.24806022644043, "global_step": 12547, "epoch": 298} {"train_loss": -5.1219801902771, "global_step": 12548, "epoch": 298} {"train_loss": -5.15487813949585, "global_step": 12549, "epoch": 298} {"train_loss": -5.237911224365234, "global_step": 12550, "epoch": 298} {"train_loss": -5.121636390686035, "global_step": 12551, "epoch": 298} {"train_loss": -5.2541656494140625, "global_step": 12552, "epoch": 298} {"train_loss": -5.21974515914917, "global_step": 12553, "epoch": 298} {"train_loss": -5.2076311111450195, "global_step": 12554, "epoch": 298} {"train_loss": -5.2027482986450195, "global_step": 12555, "epoch": 298} {"train_loss": -5.13080358505249, "global_step": 12556, "epoch": 298} {"train_loss": -5.156623238608951, "global_step": 12557, "epoch": 298, "val_loss": 73989.9375} {"train_loss": -5.251148223876953, "global_step": 12558, "epoch": 299} {"train_loss": -5.196115970611572, "global_step": 12559, "epoch": 299} {"train_loss": -5.236386299133301, "global_step": 12560, "epoch": 299} {"train_loss": -5.109504699707031, "global_step": 12561, "epoch": 299} {"train_loss": -5.215723991394043, "global_step": 12562, "epoch": 299} {"train_loss": -5.122452259063721, "global_step": 12563, "epoch": 299} {"train_loss": -5.026297569274902, "global_step": 12564, "epoch": 299} {"train_loss": -5.113574504852295, "global_step": 12565, "epoch": 299} {"train_loss": -5.157944202423096, "global_step": 12566, "epoch": 299} {"train_loss": -5.293256759643555, "global_step": 12567, "epoch": 299} {"train_loss": -5.144139289855957, "global_step": 12568, "epoch": 299} {"train_loss": -5.151226997375488, "global_step": 12569, "epoch": 299} {"train_loss": -5.095335006713867, "global_step": 12570, "epoch": 299} {"train_loss": -5.077008247375488, "global_step": 12571, "epoch": 299} {"train_loss": -5.129281520843506, "global_step": 12572, "epoch": 299} {"train_loss": -5.1834001541137695, "global_step": 12573, "epoch": 299} {"train_loss": -5.1574931144714355, "global_step": 12574, "epoch": 299} {"train_loss": -5.083885192871094, "global_step": 12575, "epoch": 299} {"train_loss": -5.074553489685059, "global_step": 12576, "epoch": 299} {"train_loss": -5.1658782958984375, "global_step": 12577, "epoch": 299} {"train_loss": -5.132392406463623, "global_step": 12578, "epoch": 299} {"train_loss": -5.2843546867370605, "global_step": 12579, "epoch": 299} {"train_loss": -5.123283386230469, "global_step": 12580, "epoch": 299} {"train_loss": -5.027812957763672, "global_step": 12581, "epoch": 299} {"train_loss": -5.190740585327148, "global_step": 12582, "epoch": 299} {"train_loss": -4.987442970275879, "global_step": 12583, "epoch": 299} {"train_loss": -5.190835952758789, "global_step": 12584, "epoch": 299} {"train_loss": -5.110164642333984, "global_step": 12585, "epoch": 299} {"train_loss": -5.051015377044678, "global_step": 12586, "epoch": 299} {"train_loss": -5.165565490722656, "global_step": 12587, "epoch": 299} {"train_loss": -5.278317928314209, "global_step": 12588, "epoch": 299} {"train_loss": -5.104225158691406, "global_step": 12589, "epoch": 299} {"train_loss": -5.1564040184021, "global_step": 12590, "epoch": 299} {"train_loss": -5.14094352722168, "global_step": 12591, "epoch": 299} {"train_loss": -5.187810897827148, "global_step": 12592, "epoch": 299} {"train_loss": -5.140585899353027, "global_step": 12593, "epoch": 299} {"train_loss": -5.191765308380127, "global_step": 12594, "epoch": 299} {"train_loss": -5.037725448608398, "global_step": 12595, "epoch": 299} {"train_loss": -5.1600213050842285, "global_step": 12596, "epoch": 299} {"train_loss": -5.080511093139648, "global_step": 12597, "epoch": 299} {"train_loss": -5.160680770874023, "global_step": 12598, "epoch": 299} {"train_loss": -5.142637934003558, "global_step": 12599, "epoch": 299, "val_loss": 74586.2578125} {"train_loss": -5.040674209594727, "global_step": 12600, "epoch": 300} {"train_loss": -5.14146614074707, "global_step": 12601, "epoch": 300} {"train_loss": -5.168189525604248, "global_step": 12602, "epoch": 300} {"train_loss": -5.1423845291137695, "global_step": 12603, "epoch": 300} {"train_loss": -4.956221103668213, "global_step": 12604, "epoch": 300} {"train_loss": -5.113464832305908, "global_step": 12605, "epoch": 300} {"train_loss": -5.181490421295166, "global_step": 12606, "epoch": 300} {"train_loss": -5.200223922729492, "global_step": 12607, "epoch": 300} {"train_loss": -5.007091522216797, "global_step": 12608, "epoch": 300} {"train_loss": -5.184052467346191, "global_step": 12609, "epoch": 300} {"train_loss": -5.009418487548828, "global_step": 12610, "epoch": 300} {"train_loss": -5.130793571472168, "global_step": 12611, "epoch": 300} {"train_loss": -5.353581428527832, "global_step": 12612, "epoch": 300} {"train_loss": -5.1995768547058105, "global_step": 12613, "epoch": 300} {"train_loss": -5.249712944030762, "global_step": 12614, "epoch": 300} {"train_loss": -4.997123718261719, "global_step": 12615, "epoch": 300} {"train_loss": -5.172818183898926, "global_step": 12616, "epoch": 300} {"train_loss": -5.2502827644348145, "global_step": 12617, "epoch": 300} {"train_loss": -5.108407020568848, "global_step": 12618, "epoch": 300} {"train_loss": -5.292498588562012, "global_step": 12619, "epoch": 300} {"train_loss": -5.040731906890869, "global_step": 12620, "epoch": 300} {"train_loss": -5.199181079864502, "global_step": 12621, "epoch": 300} {"train_loss": -5.281533718109131, "global_step": 12622, "epoch": 300} {"train_loss": -5.155779838562012, "global_step": 12623, "epoch": 300} {"train_loss": -5.13216495513916, "global_step": 12624, "epoch": 300} {"train_loss": -4.984786033630371, "global_step": 12625, "epoch": 300} {"train_loss": -5.083307266235352, "global_step": 12626, "epoch": 300} {"train_loss": -5.1724324226379395, "global_step": 12627, "epoch": 300} {"train_loss": -5.244393825531006, "global_step": 12628, "epoch": 300} {"train_loss": -5.198630332946777, "global_step": 12629, "epoch": 300} {"train_loss": -5.178569316864014, "global_step": 12630, "epoch": 300} {"train_loss": -4.996831893920898, "global_step": 12631, "epoch": 300} {"train_loss": -5.229771614074707, "global_step": 12632, "epoch": 300} {"train_loss": -5.217885971069336, "global_step": 12633, "epoch": 300} {"train_loss": -4.968775749206543, "global_step": 12634, "epoch": 300} {"train_loss": -5.041942119598389, "global_step": 12635, "epoch": 300} {"train_loss": -5.1442670822143555, "global_step": 12636, "epoch": 300} {"train_loss": -5.0804948806762695, "global_step": 12637, "epoch": 300} {"train_loss": -5.010387420654297, "global_step": 12638, "epoch": 300} {"train_loss": -5.115069389343262, "global_step": 12639, "epoch": 300} {"train_loss": -5.179481029510498, "global_step": 12640, "epoch": 300} {"train_loss": -5.132479565484183, "global_step": 12641, "epoch": 300, "train/sim_max_reward_0": 0.5099811111154724, "train/sim_max_reward_1": 0.019828738216343008, "train/sim_max_reward_2": 0.1100454418581338, "train/sim_max_reward_3": 0.14319348486808597, "train/sim_max_reward_4": 0.23487056028396106, "train/sim_max_reward_5": 0.5673167381529364, "test/sim_max_reward_4400000": 0.08905318884574873, "test/sim_max_reward_4400001": 0.014021135271422376, "test/sim_max_reward_4400002": 0.1722292661585461, "test/sim_max_reward_4400003": 0.3608705790345213, "test/sim_max_reward_4400004": 0.17201862071134683, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.6283055950341597, "test/sim_max_reward_4400009": 0.3423557955726376, "test/sim_max_reward_4400010": 0.17542469364260396, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.39608605909624045, "test/sim_max_reward_4400013": 0.26060918797842514, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.42855780421655393, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.4030578830646057, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.2644449457369751, "test/sim_max_reward_4400024": 0.39304223834884944, "test/sim_max_reward_4400025": 0.26611113948840387, "test/sim_max_reward_4400026": 0.38761342215672945, "test/sim_max_reward_4400027": 0.09382079414631035, "test/sim_max_reward_4400028": 0.322174860270863, "test/sim_max_reward_4400029": 0.1578005823682385, "test/sim_max_reward_4400030": 0.19765961002286297, "test/sim_max_reward_4400031": 0.4012064996283907, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.11540846275254744, "test/sim_max_reward_4400034": 0.18478596727435365, "test/sim_max_reward_4400035": 0.46686053893510154, "test/sim_max_reward_4400036": 0.3830777704215591, "test/sim_max_reward_4400037": 0.32454961001282484, "test/sim_max_reward_4400038": 0.1506432235340239, "test/sim_max_reward_4400039": 0.5416924592821801, "test/sim_max_reward_4400040": 0.04639056985855768, "test/sim_max_reward_4400041": 0.33397335949928275, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.18083613535104967, "test/sim_max_reward_4400045": 0.24345786785074333, "test/sim_max_reward_4400046": 0.21204474601942042, "test/sim_max_reward_4400047": 0.27160869776655816, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3157745401426349, "train/mean_score": 0.2642060124158221, "test/mean_score": 0.1996367143458799, "val_loss": 73938.9375} {"train_loss": -4.997056484222412, "global_step": 12642, "epoch": 301} {"train_loss": -5.189295768737793, "global_step": 12643, "epoch": 301} {"train_loss": -4.971761226654053, "global_step": 12644, "epoch": 301} {"train_loss": -4.990270614624023, "global_step": 12645, "epoch": 301} {"train_loss": -5.188846588134766, "global_step": 12646, "epoch": 301} {"train_loss": -5.046769142150879, "global_step": 12647, "epoch": 301} {"train_loss": -5.116376876831055, "global_step": 12648, "epoch": 301} {"train_loss": -5.189922332763672, "global_step": 12649, "epoch": 301} {"train_loss": -4.927489757537842, "global_step": 12650, "epoch": 301} {"train_loss": -5.106239318847656, "global_step": 12651, "epoch": 301} {"train_loss": -5.057069301605225, "global_step": 12652, "epoch": 301} {"train_loss": -5.016149520874023, "global_step": 12653, "epoch": 301} {"train_loss": -5.18936824798584, "global_step": 12654, "epoch": 301} {"train_loss": -4.995282173156738, "global_step": 12655, "epoch": 301} {"train_loss": -5.036368370056152, "global_step": 12656, "epoch": 301} {"train_loss": -5.120701789855957, "global_step": 12657, "epoch": 301} {"train_loss": -5.150607109069824, "global_step": 12658, "epoch": 301} {"train_loss": -5.182210922241211, "global_step": 12659, "epoch": 301} {"train_loss": -5.166173934936523, "global_step": 12660, "epoch": 301} {"train_loss": -5.243556499481201, "global_step": 12661, "epoch": 301} {"train_loss": -5.142516613006592, "global_step": 12662, "epoch": 301} {"train_loss": -5.234246253967285, "global_step": 12663, "epoch": 301} {"train_loss": -5.074736595153809, "global_step": 12664, "epoch": 301} {"train_loss": -5.212815761566162, "global_step": 12665, "epoch": 301} {"train_loss": -5.279356479644775, "global_step": 12666, "epoch": 301} {"train_loss": -5.168319225311279, "global_step": 12667, "epoch": 301} {"train_loss": -5.161378383636475, "global_step": 12668, "epoch": 301} {"train_loss": -5.266012191772461, "global_step": 12669, "epoch": 301} {"train_loss": -5.02065896987915, "global_step": 12670, "epoch": 301} {"train_loss": -5.093945503234863, "global_step": 12671, "epoch": 301} {"train_loss": -5.2492876052856445, "global_step": 12672, "epoch": 301} {"train_loss": -5.239933013916016, "global_step": 12673, "epoch": 301} {"train_loss": -5.191246032714844, "global_step": 12674, "epoch": 301} {"train_loss": -5.3251953125, "global_step": 12675, "epoch": 301} {"train_loss": -5.180857181549072, "global_step": 12676, "epoch": 301} {"train_loss": -5.064064979553223, "global_step": 12677, "epoch": 301} {"train_loss": -5.199486255645752, "global_step": 12678, "epoch": 301} {"train_loss": -5.306909561157227, "global_step": 12679, "epoch": 301} {"train_loss": -4.977387428283691, "global_step": 12680, "epoch": 301} {"train_loss": -5.074918270111084, "global_step": 12681, "epoch": 301} {"train_loss": -5.186855792999268, "global_step": 12682, "epoch": 301} {"train_loss": -5.136362280164446, "global_step": 12683, "epoch": 301, "val_loss": 74289.703125} {"train_loss": -4.928893089294434, "global_step": 12684, "epoch": 302} {"train_loss": -5.170236587524414, "global_step": 12685, "epoch": 302} {"train_loss": -5.118557453155518, "global_step": 12686, "epoch": 302} {"train_loss": -4.953886032104492, "global_step": 12687, "epoch": 302} {"train_loss": -5.046254634857178, "global_step": 12688, "epoch": 302} {"train_loss": -4.845202445983887, "global_step": 12689, "epoch": 302} {"train_loss": -5.064822673797607, "global_step": 12690, "epoch": 302} {"train_loss": -4.91244649887085, "global_step": 12691, "epoch": 302} {"train_loss": -5.071197509765625, "global_step": 12692, "epoch": 302} {"train_loss": -4.995730400085449, "global_step": 12693, "epoch": 302} {"train_loss": -4.941157817840576, "global_step": 12694, "epoch": 302} {"train_loss": -5.074184417724609, "global_step": 12695, "epoch": 302} {"train_loss": -4.908000469207764, "global_step": 12696, "epoch": 302} {"train_loss": -5.025361061096191, "global_step": 12697, "epoch": 302} {"train_loss": -5.138969421386719, "global_step": 12698, "epoch": 302} {"train_loss": -5.0037946701049805, "global_step": 12699, "epoch": 302} {"train_loss": -5.207546234130859, "global_step": 12700, "epoch": 302} {"train_loss": -4.94013786315918, "global_step": 12701, "epoch": 302} {"train_loss": -5.121982574462891, "global_step": 12702, "epoch": 302} {"train_loss": -5.072162628173828, "global_step": 12703, "epoch": 302} {"train_loss": -5.087370872497559, "global_step": 12704, "epoch": 302} {"train_loss": -4.939599514007568, "global_step": 12705, "epoch": 302} {"train_loss": -4.984165191650391, "global_step": 12706, "epoch": 302} {"train_loss": -4.905444145202637, "global_step": 12707, "epoch": 302} {"train_loss": -5.237085342407227, "global_step": 12708, "epoch": 302} {"train_loss": -5.144443511962891, "global_step": 12709, "epoch": 302} {"train_loss": -5.245035171508789, "global_step": 12710, "epoch": 302} {"train_loss": -5.060612678527832, "global_step": 12711, "epoch": 302} {"train_loss": -5.066976547241211, "global_step": 12712, "epoch": 302} {"train_loss": -5.113969802856445, "global_step": 12713, "epoch": 302} {"train_loss": -5.162755966186523, "global_step": 12714, "epoch": 302} {"train_loss": -5.199082851409912, "global_step": 12715, "epoch": 302} {"train_loss": -5.195245265960693, "global_step": 12716, "epoch": 302} {"train_loss": -5.240078926086426, "global_step": 12717, "epoch": 302} {"train_loss": -5.282403945922852, "global_step": 12718, "epoch": 302} {"train_loss": -4.9895453453063965, "global_step": 12719, "epoch": 302} {"train_loss": -5.0377068519592285, "global_step": 12720, "epoch": 302} {"train_loss": -5.088801383972168, "global_step": 12721, "epoch": 302} {"train_loss": -5.241179943084717, "global_step": 12722, "epoch": 302} {"train_loss": -5.161984920501709, "global_step": 12723, "epoch": 302} {"train_loss": -5.013251304626465, "global_step": 12724, "epoch": 302} {"train_loss": -5.076720941634405, "global_step": 12725, "epoch": 302, "val_loss": 74027.6171875} {"train_loss": -5.181058883666992, "global_step": 12726, "epoch": 303} {"train_loss": -5.194180488586426, "global_step": 12727, "epoch": 303} {"train_loss": -5.2550554275512695, "global_step": 12728, "epoch": 303} {"train_loss": -5.049149990081787, "global_step": 12729, "epoch": 303} {"train_loss": -4.981766223907471, "global_step": 12730, "epoch": 303} {"train_loss": -5.233140468597412, "global_step": 12731, "epoch": 303} {"train_loss": -5.215163230895996, "global_step": 12732, "epoch": 303} {"train_loss": -5.0664448738098145, "global_step": 12733, "epoch": 303} {"train_loss": -5.008458614349365, "global_step": 12734, "epoch": 303} {"train_loss": -5.1025848388671875, "global_step": 12735, "epoch": 303} {"train_loss": -5.200267791748047, "global_step": 12736, "epoch": 303} {"train_loss": -5.044356346130371, "global_step": 12737, "epoch": 303} {"train_loss": -5.169013023376465, "global_step": 12738, "epoch": 303} {"train_loss": -5.183046340942383, "global_step": 12739, "epoch": 303} {"train_loss": -5.057461738586426, "global_step": 12740, "epoch": 303} {"train_loss": -5.095405578613281, "global_step": 12741, "epoch": 303} {"train_loss": -5.246224880218506, "global_step": 12742, "epoch": 303} {"train_loss": -4.9521989822387695, "global_step": 12743, "epoch": 303} {"train_loss": -5.118478298187256, "global_step": 12744, "epoch": 303} {"train_loss": -4.805240631103516, "global_step": 12745, "epoch": 303} {"train_loss": -5.044639587402344, "global_step": 12746, "epoch": 303} {"train_loss": -4.9183149337768555, "global_step": 12747, "epoch": 303} {"train_loss": -5.088136672973633, "global_step": 12748, "epoch": 303} {"train_loss": -5.011546611785889, "global_step": 12749, "epoch": 303} {"train_loss": -5.006106376647949, "global_step": 12750, "epoch": 303} {"train_loss": -5.005430221557617, "global_step": 12751, "epoch": 303} {"train_loss": -4.968297958374023, "global_step": 12752, "epoch": 303} {"train_loss": -5.318033695220947, "global_step": 12753, "epoch": 303} {"train_loss": -5.045046806335449, "global_step": 12754, "epoch": 303} {"train_loss": -5.103395938873291, "global_step": 12755, "epoch": 303} {"train_loss": -5.0182294845581055, "global_step": 12756, "epoch": 303} {"train_loss": -4.95474910736084, "global_step": 12757, "epoch": 303} {"train_loss": -5.093390464782715, "global_step": 12758, "epoch": 303} {"train_loss": -5.161443710327148, "global_step": 12759, "epoch": 303} {"train_loss": -4.953403472900391, "global_step": 12760, "epoch": 303} {"train_loss": -5.009036064147949, "global_step": 12761, "epoch": 303} {"train_loss": -5.2721638679504395, "global_step": 12762, "epoch": 303} {"train_loss": -5.169414043426514, "global_step": 12763, "epoch": 303} {"train_loss": -5.022934436798096, "global_step": 12764, "epoch": 303} {"train_loss": -5.143496513366699, "global_step": 12765, "epoch": 303} {"train_loss": -5.266321659088135, "global_step": 12766, "epoch": 303} {"train_loss": -5.093490452993484, "global_step": 12767, "epoch": 303, "val_loss": 74892.6015625} {"train_loss": -5.32372522354126, "global_step": 12768, "epoch": 304} {"train_loss": -5.004546165466309, "global_step": 12769, "epoch": 304} {"train_loss": -5.255311012268066, "global_step": 12770, "epoch": 304} {"train_loss": -5.123553276062012, "global_step": 12771, "epoch": 304} {"train_loss": -5.199902534484863, "global_step": 12772, "epoch": 304} {"train_loss": -5.050055980682373, "global_step": 12773, "epoch": 304} {"train_loss": -5.178170204162598, "global_step": 12774, "epoch": 304} {"train_loss": -5.109943866729736, "global_step": 12775, "epoch": 304} {"train_loss": -5.196032524108887, "global_step": 12776, "epoch": 304} {"train_loss": -5.216748237609863, "global_step": 12777, "epoch": 304} {"train_loss": -5.228503227233887, "global_step": 12778, "epoch": 304} {"train_loss": -5.171428680419922, "global_step": 12779, "epoch": 304} {"train_loss": -5.146976470947266, "global_step": 12780, "epoch": 304} {"train_loss": -5.156030654907227, "global_step": 12781, "epoch": 304} {"train_loss": -5.207843780517578, "global_step": 12782, "epoch": 304} {"train_loss": -5.17111349105835, "global_step": 12783, "epoch": 304} {"train_loss": -5.194992542266846, "global_step": 12784, "epoch": 304} {"train_loss": -5.20021915435791, "global_step": 12785, "epoch": 304} {"train_loss": -5.146477699279785, "global_step": 12786, "epoch": 304} {"train_loss": -5.201019763946533, "global_step": 12787, "epoch": 304} {"train_loss": -5.154738426208496, "global_step": 12788, "epoch": 304} {"train_loss": -5.2999773025512695, "global_step": 12789, "epoch": 304} {"train_loss": -5.075875759124756, "global_step": 12790, "epoch": 304} {"train_loss": -5.225274562835693, "global_step": 12791, "epoch": 304} {"train_loss": -5.284134387969971, "global_step": 12792, "epoch": 304} {"train_loss": -5.045957565307617, "global_step": 12793, "epoch": 304} {"train_loss": -5.267460823059082, "global_step": 12794, "epoch": 304} {"train_loss": -5.147021293640137, "global_step": 12795, "epoch": 304} {"train_loss": -5.159275054931641, "global_step": 12796, "epoch": 304} {"train_loss": -5.05525016784668, "global_step": 12797, "epoch": 304} {"train_loss": -5.201057434082031, "global_step": 12798, "epoch": 304} {"train_loss": -5.173253536224365, "global_step": 12799, "epoch": 304} {"train_loss": -5.166891098022461, "global_step": 12800, "epoch": 304} {"train_loss": -5.1728105545043945, "global_step": 12801, "epoch": 304} {"train_loss": -5.228798866271973, "global_step": 12802, "epoch": 304} {"train_loss": -5.186032772064209, "global_step": 12803, "epoch": 304} {"train_loss": -5.300969123840332, "global_step": 12804, "epoch": 304} {"train_loss": -5.15186071395874, "global_step": 12805, "epoch": 304} {"train_loss": -4.979279041290283, "global_step": 12806, "epoch": 304} {"train_loss": -5.083627700805664, "global_step": 12807, "epoch": 304} {"train_loss": -5.168350696563721, "global_step": 12808, "epoch": 304} {"train_loss": -5.167991774422782, "global_step": 12809, "epoch": 304, "val_loss": 75311.46875} {"train_loss": -4.959123611450195, "global_step": 12810, "epoch": 305} {"train_loss": -5.1735639572143555, "global_step": 12811, "epoch": 305} {"train_loss": -5.12954568862915, "global_step": 12812, "epoch": 305} {"train_loss": -5.10191535949707, "global_step": 12813, "epoch": 305} {"train_loss": -5.253289699554443, "global_step": 12814, "epoch": 305} {"train_loss": -5.1396989822387695, "global_step": 12815, "epoch": 305} {"train_loss": -5.160422325134277, "global_step": 12816, "epoch": 305} {"train_loss": -5.238433837890625, "global_step": 12817, "epoch": 305} {"train_loss": -5.055709362030029, "global_step": 12818, "epoch": 305} {"train_loss": -5.096026420593262, "global_step": 12819, "epoch": 305} {"train_loss": -4.992034435272217, "global_step": 12820, "epoch": 305} {"train_loss": -5.20427131652832, "global_step": 12821, "epoch": 305} {"train_loss": -4.985256195068359, "global_step": 12822, "epoch": 305} {"train_loss": -4.968118190765381, "global_step": 12823, "epoch": 305} {"train_loss": -5.119561195373535, "global_step": 12824, "epoch": 305} {"train_loss": -5.063385963439941, "global_step": 12825, "epoch": 305} {"train_loss": -5.196356773376465, "global_step": 12826, "epoch": 305} {"train_loss": -5.0969133377075195, "global_step": 12827, "epoch": 305} {"train_loss": -5.116344928741455, "global_step": 12828, "epoch": 305} {"train_loss": -5.144048690795898, "global_step": 12829, "epoch": 305} {"train_loss": -4.995046615600586, "global_step": 12830, "epoch": 305} {"train_loss": -5.027337551116943, "global_step": 12831, "epoch": 305} {"train_loss": -5.08094596862793, "global_step": 12832, "epoch": 305} {"train_loss": -5.171660423278809, "global_step": 12833, "epoch": 305} {"train_loss": -5.208775997161865, "global_step": 12834, "epoch": 305} {"train_loss": -5.197842121124268, "global_step": 12835, "epoch": 305} {"train_loss": -5.241770267486572, "global_step": 12836, "epoch": 305} {"train_loss": -5.130782604217529, "global_step": 12837, "epoch": 305} {"train_loss": -5.140531539916992, "global_step": 12838, "epoch": 305} {"train_loss": -5.227809429168701, "global_step": 12839, "epoch": 305} {"train_loss": -5.185750961303711, "global_step": 12840, "epoch": 305} {"train_loss": -5.045797824859619, "global_step": 12841, "epoch": 305} {"train_loss": -5.279259204864502, "global_step": 12842, "epoch": 305} {"train_loss": -5.084298133850098, "global_step": 12843, "epoch": 305} {"train_loss": -5.227133750915527, "global_step": 12844, "epoch": 305} {"train_loss": -5.2725725173950195, "global_step": 12845, "epoch": 305} {"train_loss": -5.2164692878723145, "global_step": 12846, "epoch": 305} {"train_loss": -5.149852275848389, "global_step": 12847, "epoch": 305} {"train_loss": -5.276515960693359, "global_step": 12848, "epoch": 305} {"train_loss": -5.299084663391113, "global_step": 12849, "epoch": 305} {"train_loss": -5.264527797698975, "global_step": 12850, "epoch": 305} {"train_loss": -5.1468110765729636, "global_step": 12851, "epoch": 305, "val_loss": 73685.484375} {"train_loss": -5.141251087188721, "global_step": 12852, "epoch": 306} {"train_loss": -5.124016761779785, "global_step": 12853, "epoch": 306} {"train_loss": -5.199328899383545, "global_step": 12854, "epoch": 306} {"train_loss": -5.201266288757324, "global_step": 12855, "epoch": 306} {"train_loss": -5.18173885345459, "global_step": 12856, "epoch": 306} {"train_loss": -5.219429016113281, "global_step": 12857, "epoch": 306} {"train_loss": -5.080141067504883, "global_step": 12858, "epoch": 306} {"train_loss": -5.074422359466553, "global_step": 12859, "epoch": 306} {"train_loss": -5.115964889526367, "global_step": 12860, "epoch": 306} {"train_loss": -5.0444865226745605, "global_step": 12861, "epoch": 306} {"train_loss": -5.025256156921387, "global_step": 12862, "epoch": 306} {"train_loss": -5.076482772827148, "global_step": 12863, "epoch": 306} {"train_loss": -5.017850875854492, "global_step": 12864, "epoch": 306} {"train_loss": -4.98020076751709, "global_step": 12865, "epoch": 306} {"train_loss": -5.244711875915527, "global_step": 12866, "epoch": 306} {"train_loss": -5.0605597496032715, "global_step": 12867, "epoch": 306} {"train_loss": -5.133316993713379, "global_step": 12868, "epoch": 306} {"train_loss": -5.246973991394043, "global_step": 12869, "epoch": 306} {"train_loss": -5.193000793457031, "global_step": 12870, "epoch": 306} {"train_loss": -5.00479793548584, "global_step": 12871, "epoch": 306} {"train_loss": -5.214373588562012, "global_step": 12872, "epoch": 306} {"train_loss": -4.966010093688965, "global_step": 12873, "epoch": 306} {"train_loss": -5.0999040603637695, "global_step": 12874, "epoch": 306} {"train_loss": -5.1296844482421875, "global_step": 12875, "epoch": 306} {"train_loss": -5.258021831512451, "global_step": 12876, "epoch": 306} {"train_loss": -5.1454854011535645, "global_step": 12877, "epoch": 306} {"train_loss": -5.138062000274658, "global_step": 12878, "epoch": 306} {"train_loss": -5.046988487243652, "global_step": 12879, "epoch": 306} {"train_loss": -5.098846435546875, "global_step": 12880, "epoch": 306} {"train_loss": -5.090662002563477, "global_step": 12881, "epoch": 306} {"train_loss": -5.080859184265137, "global_step": 12882, "epoch": 306} {"train_loss": -5.070744514465332, "global_step": 12883, "epoch": 306} {"train_loss": -5.106488227844238, "global_step": 12884, "epoch": 306} {"train_loss": -5.250812530517578, "global_step": 12885, "epoch": 306} {"train_loss": -5.1012163162231445, "global_step": 12886, "epoch": 306} {"train_loss": -5.104525566101074, "global_step": 12887, "epoch": 306} {"train_loss": -5.129292011260986, "global_step": 12888, "epoch": 306} {"train_loss": -5.096368789672852, "global_step": 12889, "epoch": 306} {"train_loss": -5.379364013671875, "global_step": 12890, "epoch": 306} {"train_loss": -5.140993118286133, "global_step": 12891, "epoch": 306} {"train_loss": -5.161153316497803, "global_step": 12892, "epoch": 306} {"train_loss": -5.130204336983817, "global_step": 12893, "epoch": 306, "val_loss": 73067.875} {"train_loss": -5.113243579864502, "global_step": 12894, "epoch": 307} {"train_loss": -5.017237663269043, "global_step": 12895, "epoch": 307} {"train_loss": -5.236324787139893, "global_step": 12896, "epoch": 307} {"train_loss": -5.169862270355225, "global_step": 12897, "epoch": 307} {"train_loss": -5.146749019622803, "global_step": 12898, "epoch": 307} {"train_loss": -5.305682182312012, "global_step": 12899, "epoch": 307} {"train_loss": -5.171952247619629, "global_step": 12900, "epoch": 307} {"train_loss": -5.043388366699219, "global_step": 12901, "epoch": 307} {"train_loss": -5.155189037322998, "global_step": 12902, "epoch": 307} {"train_loss": -5.135256290435791, "global_step": 12903, "epoch": 307} {"train_loss": -4.981225490570068, "global_step": 12904, "epoch": 307} {"train_loss": -5.153439044952393, "global_step": 12905, "epoch": 307} {"train_loss": -5.176492691040039, "global_step": 12906, "epoch": 307} {"train_loss": -5.275558948516846, "global_step": 12907, "epoch": 307} {"train_loss": -5.253147602081299, "global_step": 12908, "epoch": 307} {"train_loss": -5.066130638122559, "global_step": 12909, "epoch": 307} {"train_loss": -5.148297309875488, "global_step": 12910, "epoch": 307} {"train_loss": -5.11561393737793, "global_step": 12911, "epoch": 307} {"train_loss": -5.32005500793457, "global_step": 12912, "epoch": 307} {"train_loss": -5.140361785888672, "global_step": 12913, "epoch": 307} {"train_loss": -5.059299468994141, "global_step": 12914, "epoch": 307} {"train_loss": -5.373887062072754, "global_step": 12915, "epoch": 307} {"train_loss": -5.286304473876953, "global_step": 12916, "epoch": 307} {"train_loss": -5.112972736358643, "global_step": 12917, "epoch": 307} {"train_loss": -5.224277973175049, "global_step": 12918, "epoch": 307} {"train_loss": -5.165518760681152, "global_step": 12919, "epoch": 307} {"train_loss": -5.234844207763672, "global_step": 12920, "epoch": 307} {"train_loss": -5.207016468048096, "global_step": 12921, "epoch": 307} {"train_loss": -5.0494842529296875, "global_step": 12922, "epoch": 307} {"train_loss": -5.174154281616211, "global_step": 12923, "epoch": 307} {"train_loss": -5.1759562492370605, "global_step": 12924, "epoch": 307} {"train_loss": -5.062085151672363, "global_step": 12925, "epoch": 307} {"train_loss": -5.144220352172852, "global_step": 12926, "epoch": 307} {"train_loss": -5.140474319458008, "global_step": 12927, "epoch": 307} {"train_loss": -5.032641410827637, "global_step": 12928, "epoch": 307} {"train_loss": -5.212843894958496, "global_step": 12929, "epoch": 307} {"train_loss": -5.211886405944824, "global_step": 12930, "epoch": 307} {"train_loss": -5.195977210998535, "global_step": 12931, "epoch": 307} {"train_loss": -5.224856376647949, "global_step": 12932, "epoch": 307} {"train_loss": -5.148619651794434, "global_step": 12933, "epoch": 307} {"train_loss": -5.1503376960754395, "global_step": 12934, "epoch": 307} {"train_loss": -5.16393400373913, "global_step": 12935, "epoch": 307, "val_loss": 72858.265625} {"train_loss": -5.217733383178711, "global_step": 12936, "epoch": 308} {"train_loss": -5.236416816711426, "global_step": 12937, "epoch": 308} {"train_loss": -5.133069038391113, "global_step": 12938, "epoch": 308} {"train_loss": -5.338458061218262, "global_step": 12939, "epoch": 308} {"train_loss": -5.209511756896973, "global_step": 12940, "epoch": 308} {"train_loss": -5.220998764038086, "global_step": 12941, "epoch": 308} {"train_loss": -5.219267845153809, "global_step": 12942, "epoch": 308} {"train_loss": -5.303800582885742, "global_step": 12943, "epoch": 308} {"train_loss": -5.233922481536865, "global_step": 12944, "epoch": 308} {"train_loss": -5.191074371337891, "global_step": 12945, "epoch": 308} {"train_loss": -5.283176422119141, "global_step": 12946, "epoch": 308} {"train_loss": -5.268441200256348, "global_step": 12947, "epoch": 308} {"train_loss": -5.153878211975098, "global_step": 12948, "epoch": 308} {"train_loss": -5.116676330566406, "global_step": 12949, "epoch": 308} {"train_loss": -5.17303466796875, "global_step": 12950, "epoch": 308} {"train_loss": -5.266823768615723, "global_step": 12951, "epoch": 308} {"train_loss": -5.1859235763549805, "global_step": 12952, "epoch": 308} {"train_loss": -5.149226188659668, "global_step": 12953, "epoch": 308} {"train_loss": -5.1794209480285645, "global_step": 12954, "epoch": 308} {"train_loss": -5.148566246032715, "global_step": 12955, "epoch": 308} {"train_loss": -5.248523712158203, "global_step": 12956, "epoch": 308} {"train_loss": -4.8687052726745605, "global_step": 12957, "epoch": 308} {"train_loss": -5.138034820556641, "global_step": 12958, "epoch": 308} {"train_loss": -5.0595598220825195, "global_step": 12959, "epoch": 308} {"train_loss": -5.1288557052612305, "global_step": 12960, "epoch": 308} {"train_loss": -4.996842861175537, "global_step": 12961, "epoch": 308} {"train_loss": -5.113126277923584, "global_step": 12962, "epoch": 308} {"train_loss": -4.965223789215088, "global_step": 12963, "epoch": 308} {"train_loss": -5.022615909576416, "global_step": 12964, "epoch": 308} {"train_loss": -5.21893310546875, "global_step": 12965, "epoch": 308} {"train_loss": -4.963085174560547, "global_step": 12966, "epoch": 308} {"train_loss": -5.079093933105469, "global_step": 12967, "epoch": 308} {"train_loss": -4.92711877822876, "global_step": 12968, "epoch": 308} {"train_loss": -5.047858238220215, "global_step": 12969, "epoch": 308} {"train_loss": -5.022149085998535, "global_step": 12970, "epoch": 308} {"train_loss": -4.857193946838379, "global_step": 12971, "epoch": 308} {"train_loss": -5.037447452545166, "global_step": 12972, "epoch": 308} {"train_loss": -5.020901203155518, "global_step": 12973, "epoch": 308} {"train_loss": -5.149941444396973, "global_step": 12974, "epoch": 308} {"train_loss": -5.018825531005859, "global_step": 12975, "epoch": 308} {"train_loss": -4.967430591583252, "global_step": 12976, "epoch": 308} {"train_loss": -5.120726687567575, "global_step": 12977, "epoch": 308, "val_loss": 75029.09375} {"train_loss": -5.105400085449219, "global_step": 12978, "epoch": 309} {"train_loss": -5.057771682739258, "global_step": 12979, "epoch": 309} {"train_loss": -5.15247917175293, "global_step": 12980, "epoch": 309} {"train_loss": -5.0009660720825195, "global_step": 12981, "epoch": 309} {"train_loss": -5.139122009277344, "global_step": 12982, "epoch": 309} {"train_loss": -5.02427864074707, "global_step": 12983, "epoch": 309} {"train_loss": -5.137909889221191, "global_step": 12984, "epoch": 309} {"train_loss": -5.069698333740234, "global_step": 12985, "epoch": 309} {"train_loss": -5.171316146850586, "global_step": 12986, "epoch": 309} {"train_loss": -5.149099826812744, "global_step": 12987, "epoch": 309} {"train_loss": -5.14716911315918, "global_step": 12988, "epoch": 309} {"train_loss": -5.181864261627197, "global_step": 12989, "epoch": 309} {"train_loss": -5.2446088790893555, "global_step": 12990, "epoch": 309} {"train_loss": -5.069150924682617, "global_step": 12991, "epoch": 309} {"train_loss": -5.136728763580322, "global_step": 12992, "epoch": 309} {"train_loss": -5.199437618255615, "global_step": 12993, "epoch": 309} {"train_loss": -5.052868843078613, "global_step": 12994, "epoch": 309} {"train_loss": -5.227516174316406, "global_step": 12995, "epoch": 309} {"train_loss": -5.190412521362305, "global_step": 12996, "epoch": 309} {"train_loss": -5.010807037353516, "global_step": 12997, "epoch": 309} {"train_loss": -5.281883239746094, "global_step": 12998, "epoch": 309} {"train_loss": -5.157788276672363, "global_step": 12999, "epoch": 309} {"train_loss": -5.125699043273926, "global_step": 13000, "epoch": 309} {"train_loss": -5.098474502563477, "global_step": 13001, "epoch": 309} {"train_loss": -5.294713020324707, "global_step": 13002, "epoch": 309} {"train_loss": -5.224273204803467, "global_step": 13003, "epoch": 309} {"train_loss": -5.1691412925720215, "global_step": 13004, "epoch": 309} {"train_loss": -5.147109031677246, "global_step": 13005, "epoch": 309} {"train_loss": -5.153282165527344, "global_step": 13006, "epoch": 309} {"train_loss": -5.253896713256836, "global_step": 13007, "epoch": 309} {"train_loss": -5.09856653213501, "global_step": 13008, "epoch": 309} {"train_loss": -5.032242298126221, "global_step": 13009, "epoch": 309} {"train_loss": -5.114853858947754, "global_step": 13010, "epoch": 309} {"train_loss": -5.115435600280762, "global_step": 13011, "epoch": 309} {"train_loss": -5.145054817199707, "global_step": 13012, "epoch": 309} {"train_loss": -5.214600563049316, "global_step": 13013, "epoch": 309} {"train_loss": -5.190593242645264, "global_step": 13014, "epoch": 309} {"train_loss": -5.079062461853027, "global_step": 13015, "epoch": 309} {"train_loss": -5.062429428100586, "global_step": 13016, "epoch": 309} {"train_loss": -5.224068641662598, "global_step": 13017, "epoch": 309} {"train_loss": -5.025280952453613, "global_step": 13018, "epoch": 309} {"train_loss": -5.139711561657133, "global_step": 13019, "epoch": 309, "val_loss": 73209.1484375} {"train_loss": -5.038604736328125, "global_step": 13020, "epoch": 310} {"train_loss": -5.071686267852783, "global_step": 13021, "epoch": 310} {"train_loss": -5.265369415283203, "global_step": 13022, "epoch": 310} {"train_loss": -5.087215900421143, "global_step": 13023, "epoch": 310} {"train_loss": -5.029499053955078, "global_step": 13024, "epoch": 310} {"train_loss": -5.210905075073242, "global_step": 13025, "epoch": 310} {"train_loss": -4.995571613311768, "global_step": 13026, "epoch": 310} {"train_loss": -5.162919998168945, "global_step": 13027, "epoch": 310} {"train_loss": -5.203085899353027, "global_step": 13028, "epoch": 310} {"train_loss": -5.1199140548706055, "global_step": 13029, "epoch": 310} {"train_loss": -5.111321449279785, "global_step": 13030, "epoch": 310} {"train_loss": -5.114346981048584, "global_step": 13031, "epoch": 310} {"train_loss": -5.310237884521484, "global_step": 13032, "epoch": 310} {"train_loss": -5.180137634277344, "global_step": 13033, "epoch": 310} {"train_loss": -4.914751052856445, "global_step": 13034, "epoch": 310} {"train_loss": -5.208941459655762, "global_step": 13035, "epoch": 310} {"train_loss": -5.136417388916016, "global_step": 13036, "epoch": 310} {"train_loss": -5.064629077911377, "global_step": 13037, "epoch": 310} {"train_loss": -5.174261569976807, "global_step": 13038, "epoch": 310} {"train_loss": -5.071319103240967, "global_step": 13039, "epoch": 310} {"train_loss": -5.151741027832031, "global_step": 13040, "epoch": 310} {"train_loss": -5.184100151062012, "global_step": 13041, "epoch": 310} {"train_loss": -5.017144203186035, "global_step": 13042, "epoch": 310} {"train_loss": -5.122989177703857, "global_step": 13043, "epoch": 310} {"train_loss": -5.204921245574951, "global_step": 13044, "epoch": 310} {"train_loss": -5.121479034423828, "global_step": 13045, "epoch": 310} {"train_loss": -4.970478057861328, "global_step": 13046, "epoch": 310} {"train_loss": -5.155220031738281, "global_step": 13047, "epoch": 310} {"train_loss": -5.293606758117676, "global_step": 13048, "epoch": 310} {"train_loss": -5.149255752563477, "global_step": 13049, "epoch": 310} {"train_loss": -5.309954643249512, "global_step": 13050, "epoch": 310} {"train_loss": -5.1494059562683105, "global_step": 13051, "epoch": 310} {"train_loss": -5.145326137542725, "global_step": 13052, "epoch": 310} {"train_loss": -5.06867790222168, "global_step": 13053, "epoch": 310} {"train_loss": -5.060937881469727, "global_step": 13054, "epoch": 310} {"train_loss": -5.212041854858398, "global_step": 13055, "epoch": 310} {"train_loss": -5.126488208770752, "global_step": 13056, "epoch": 310} {"train_loss": -5.124340057373047, "global_step": 13057, "epoch": 310} {"train_loss": -5.031313896179199, "global_step": 13058, "epoch": 310} {"train_loss": -5.295468330383301, "global_step": 13059, "epoch": 310} {"train_loss": -5.050149440765381, "global_step": 13060, "epoch": 310} {"train_loss": -5.130273489725022, "global_step": 13061, "epoch": 310, "val_loss": 73002.9375} {"train_loss": -5.027778625488281, "global_step": 13062, "epoch": 311} {"train_loss": -4.938539981842041, "global_step": 13063, "epoch": 311} {"train_loss": -5.284330368041992, "global_step": 13064, "epoch": 311} {"train_loss": -4.955726146697998, "global_step": 13065, "epoch": 311} {"train_loss": -5.141726493835449, "global_step": 13066, "epoch": 311} {"train_loss": -5.12556266784668, "global_step": 13067, "epoch": 311} {"train_loss": -5.136799335479736, "global_step": 13068, "epoch": 311} {"train_loss": -5.091246604919434, "global_step": 13069, "epoch": 311} {"train_loss": -5.047359466552734, "global_step": 13070, "epoch": 311} {"train_loss": -5.096594333648682, "global_step": 13071, "epoch": 311} {"train_loss": -5.153345108032227, "global_step": 13072, "epoch": 311} {"train_loss": -5.083431720733643, "global_step": 13073, "epoch": 311} {"train_loss": -5.2047624588012695, "global_step": 13074, "epoch": 311} {"train_loss": -5.148772239685059, "global_step": 13075, "epoch": 311} {"train_loss": -5.201519012451172, "global_step": 13076, "epoch": 311} {"train_loss": -5.085930824279785, "global_step": 13077, "epoch": 311} {"train_loss": -5.245515823364258, "global_step": 13078, "epoch": 311} {"train_loss": -5.196743488311768, "global_step": 13079, "epoch": 311} {"train_loss": -5.141651153564453, "global_step": 13080, "epoch": 311} {"train_loss": -5.158023357391357, "global_step": 13081, "epoch": 311} {"train_loss": -5.184549331665039, "global_step": 13082, "epoch": 311} {"train_loss": -5.120309352874756, "global_step": 13083, "epoch": 311} {"train_loss": -5.150888442993164, "global_step": 13084, "epoch": 311} {"train_loss": -5.1016645431518555, "global_step": 13085, "epoch": 311} {"train_loss": -5.268313884735107, "global_step": 13086, "epoch": 311} {"train_loss": -5.142457008361816, "global_step": 13087, "epoch": 311} {"train_loss": -5.2098388671875, "global_step": 13088, "epoch": 311} {"train_loss": -5.064422607421875, "global_step": 13089, "epoch": 311} {"train_loss": -5.244834899902344, "global_step": 13090, "epoch": 311} {"train_loss": -5.010225296020508, "global_step": 13091, "epoch": 311} {"train_loss": -5.127470016479492, "global_step": 13092, "epoch": 311} {"train_loss": -5.14630126953125, "global_step": 13093, "epoch": 311} {"train_loss": -5.048676013946533, "global_step": 13094, "epoch": 311} {"train_loss": -5.098972320556641, "global_step": 13095, "epoch": 311} {"train_loss": -5.266692161560059, "global_step": 13096, "epoch": 311} {"train_loss": -5.141918182373047, "global_step": 13097, "epoch": 311} {"train_loss": -5.139243125915527, "global_step": 13098, "epoch": 311} {"train_loss": -5.122812271118164, "global_step": 13099, "epoch": 311} {"train_loss": -5.127408981323242, "global_step": 13100, "epoch": 311} {"train_loss": -5.058859348297119, "global_step": 13101, "epoch": 311} {"train_loss": -5.194159507751465, "global_step": 13102, "epoch": 311} {"train_loss": -5.1300278050558905, "global_step": 13103, "epoch": 311, "val_loss": 74808.03125} {"train_loss": -5.109501838684082, "global_step": 13104, "epoch": 312} {"train_loss": -5.1709489822387695, "global_step": 13105, "epoch": 312} {"train_loss": -5.204779624938965, "global_step": 13106, "epoch": 312} {"train_loss": -5.089038848876953, "global_step": 13107, "epoch": 312} {"train_loss": -5.228899002075195, "global_step": 13108, "epoch": 312} {"train_loss": -5.140979766845703, "global_step": 13109, "epoch": 312} {"train_loss": -5.0956220626831055, "global_step": 13110, "epoch": 312} {"train_loss": -5.225461959838867, "global_step": 13111, "epoch": 312} {"train_loss": -5.083215236663818, "global_step": 13112, "epoch": 312} {"train_loss": -5.090948104858398, "global_step": 13113, "epoch": 312} {"train_loss": -5.105637550354004, "global_step": 13114, "epoch": 312} {"train_loss": -5.233541488647461, "global_step": 13115, "epoch": 312} {"train_loss": -5.076205730438232, "global_step": 13116, "epoch": 312} {"train_loss": -5.134397506713867, "global_step": 13117, "epoch": 312} {"train_loss": -5.2989912033081055, "global_step": 13118, "epoch": 312} {"train_loss": -5.257263660430908, "global_step": 13119, "epoch": 312} {"train_loss": -5.09708833694458, "global_step": 13120, "epoch": 312} {"train_loss": -5.155539512634277, "global_step": 13121, "epoch": 312} {"train_loss": -5.2344160079956055, "global_step": 13122, "epoch": 312} {"train_loss": -5.186365127563477, "global_step": 13123, "epoch": 312} {"train_loss": -5.158434867858887, "global_step": 13124, "epoch": 312} {"train_loss": -5.101741790771484, "global_step": 13125, "epoch": 312} {"train_loss": -5.124658584594727, "global_step": 13126, "epoch": 312} {"train_loss": -5.151991844177246, "global_step": 13127, "epoch": 312} {"train_loss": -5.204244613647461, "global_step": 13128, "epoch": 312} {"train_loss": -5.111635208129883, "global_step": 13129, "epoch": 312} {"train_loss": -5.186994552612305, "global_step": 13130, "epoch": 312} {"train_loss": -5.17054557800293, "global_step": 13131, "epoch": 312} {"train_loss": -5.24964714050293, "global_step": 13132, "epoch": 312} {"train_loss": -5.24870491027832, "global_step": 13133, "epoch": 312} {"train_loss": -5.154296875, "global_step": 13134, "epoch": 312} {"train_loss": -5.058239936828613, "global_step": 13135, "epoch": 312} {"train_loss": -5.093622207641602, "global_step": 13136, "epoch": 312} {"train_loss": -4.906915664672852, "global_step": 13137, "epoch": 312} {"train_loss": -5.231187343597412, "global_step": 13138, "epoch": 312} {"train_loss": -5.022738933563232, "global_step": 13139, "epoch": 312} {"train_loss": -5.0734076499938965, "global_step": 13140, "epoch": 312} {"train_loss": -5.195892333984375, "global_step": 13141, "epoch": 312} {"train_loss": -5.086853981018066, "global_step": 13142, "epoch": 312} {"train_loss": -5.179590225219727, "global_step": 13143, "epoch": 312} {"train_loss": -5.067741870880127, "global_step": 13144, "epoch": 312} {"train_loss": -5.143694809504917, "global_step": 13145, "epoch": 312, "val_loss": 73522.5625} {"train_loss": -5.0237579345703125, "global_step": 13146, "epoch": 313} {"train_loss": -5.221714973449707, "global_step": 13147, "epoch": 313} {"train_loss": -5.075905799865723, "global_step": 13148, "epoch": 313} {"train_loss": -5.162850379943848, "global_step": 13149, "epoch": 313} {"train_loss": -5.294030666351318, "global_step": 13150, "epoch": 313} {"train_loss": -5.048856735229492, "global_step": 13151, "epoch": 313} {"train_loss": -5.242743492126465, "global_step": 13152, "epoch": 313} {"train_loss": -5.077075004577637, "global_step": 13153, "epoch": 313} {"train_loss": -5.272120475769043, "global_step": 13154, "epoch": 313} {"train_loss": -5.332646369934082, "global_step": 13155, "epoch": 313} {"train_loss": -5.2578582763671875, "global_step": 13156, "epoch": 313} {"train_loss": -5.079453468322754, "global_step": 13157, "epoch": 313} {"train_loss": -5.248106002807617, "global_step": 13158, "epoch": 313} {"train_loss": -5.107932090759277, "global_step": 13159, "epoch": 313} {"train_loss": -5.249884605407715, "global_step": 13160, "epoch": 313} {"train_loss": -5.120841026306152, "global_step": 13161, "epoch": 313} {"train_loss": -5.347799301147461, "global_step": 13162, "epoch": 313} {"train_loss": -5.327823638916016, "global_step": 13163, "epoch": 313} {"train_loss": -5.29838752746582, "global_step": 13164, "epoch": 313} {"train_loss": -5.1993727684021, "global_step": 13165, "epoch": 313} {"train_loss": -5.072225093841553, "global_step": 13166, "epoch": 313} {"train_loss": -5.270327091217041, "global_step": 13167, "epoch": 313} {"train_loss": -5.093343734741211, "global_step": 13168, "epoch": 313} {"train_loss": -5.144130706787109, "global_step": 13169, "epoch": 313} {"train_loss": -5.416695594787598, "global_step": 13170, "epoch": 313} {"train_loss": -5.092841148376465, "global_step": 13171, "epoch": 313} {"train_loss": -5.111283779144287, "global_step": 13172, "epoch": 313} {"train_loss": -5.180511474609375, "global_step": 13173, "epoch": 313} {"train_loss": -5.1602067947387695, "global_step": 13174, "epoch": 313} {"train_loss": -5.107663154602051, "global_step": 13175, "epoch": 313} {"train_loss": -5.1377763748168945, "global_step": 13176, "epoch": 313} {"train_loss": -5.325841903686523, "global_step": 13177, "epoch": 313} {"train_loss": -5.197928428649902, "global_step": 13178, "epoch": 313} {"train_loss": -5.078965187072754, "global_step": 13179, "epoch": 313} {"train_loss": -5.087002277374268, "global_step": 13180, "epoch": 313} {"train_loss": -5.061617851257324, "global_step": 13181, "epoch": 313} {"train_loss": -5.132796287536621, "global_step": 13182, "epoch": 313} {"train_loss": -5.074698448181152, "global_step": 13183, "epoch": 313} {"train_loss": -5.283858299255371, "global_step": 13184, "epoch": 313} {"train_loss": -5.044583320617676, "global_step": 13185, "epoch": 313} {"train_loss": -5.1638336181640625, "global_step": 13186, "epoch": 313} {"train_loss": -5.175062769935245, "global_step": 13187, "epoch": 313, "val_loss": 73123.4140625} {"train_loss": -5.108017444610596, "global_step": 13188, "epoch": 314} {"train_loss": -5.108991622924805, "global_step": 13189, "epoch": 314} {"train_loss": -5.084468364715576, "global_step": 13190, "epoch": 314} {"train_loss": -5.171667098999023, "global_step": 13191, "epoch": 314} {"train_loss": -5.174264907836914, "global_step": 13192, "epoch": 314} {"train_loss": -5.142968654632568, "global_step": 13193, "epoch": 314} {"train_loss": -5.250976085662842, "global_step": 13194, "epoch": 314} {"train_loss": -5.262742042541504, "global_step": 13195, "epoch": 314} {"train_loss": -5.076559543609619, "global_step": 13196, "epoch": 314} {"train_loss": -5.04077672958374, "global_step": 13197, "epoch": 314} {"train_loss": -5.052773952484131, "global_step": 13198, "epoch": 314} {"train_loss": -5.077903747558594, "global_step": 13199, "epoch": 314} {"train_loss": -5.196306228637695, "global_step": 13200, "epoch": 314} {"train_loss": -5.084604263305664, "global_step": 13201, "epoch": 314} {"train_loss": -5.09968900680542, "global_step": 13202, "epoch": 314} {"train_loss": -5.251723289489746, "global_step": 13203, "epoch": 314} {"train_loss": -5.224898338317871, "global_step": 13204, "epoch": 314} {"train_loss": -5.190453052520752, "global_step": 13205, "epoch": 314} {"train_loss": -5.274694919586182, "global_step": 13206, "epoch": 314} {"train_loss": -5.168544769287109, "global_step": 13207, "epoch": 314} {"train_loss": -5.048269271850586, "global_step": 13208, "epoch": 314} {"train_loss": -5.215545654296875, "global_step": 13209, "epoch": 314} {"train_loss": -5.2864861488342285, "global_step": 13210, "epoch": 314} {"train_loss": -5.17098331451416, "global_step": 13211, "epoch": 314} {"train_loss": -5.280684947967529, "global_step": 13212, "epoch": 314} {"train_loss": -5.362514972686768, "global_step": 13213, "epoch": 314} {"train_loss": -5.219301223754883, "global_step": 13214, "epoch": 314} {"train_loss": -5.03302001953125, "global_step": 13215, "epoch": 314} {"train_loss": -5.118832111358643, "global_step": 13216, "epoch": 314} {"train_loss": -5.04249382019043, "global_step": 13217, "epoch": 314} {"train_loss": -5.088593482971191, "global_step": 13218, "epoch": 314} {"train_loss": -5.1543965339660645, "global_step": 13219, "epoch": 314} {"train_loss": -5.182987213134766, "global_step": 13220, "epoch": 314} {"train_loss": -5.193865776062012, "global_step": 13221, "epoch": 314} {"train_loss": -5.226358413696289, "global_step": 13222, "epoch": 314} {"train_loss": -5.122157096862793, "global_step": 13223, "epoch": 314} {"train_loss": -5.091367721557617, "global_step": 13224, "epoch": 314} {"train_loss": -5.272418022155762, "global_step": 13225, "epoch": 314} {"train_loss": -5.211087226867676, "global_step": 13226, "epoch": 314} {"train_loss": -5.061610221862793, "global_step": 13227, "epoch": 314} {"train_loss": -5.232654094696045, "global_step": 13228, "epoch": 314} {"train_loss": -5.16090448697408, "global_step": 13229, "epoch": 314, "val_loss": 73273.5390625} {"train_loss": -5.325054168701172, "global_step": 13230, "epoch": 315} {"train_loss": -5.144237518310547, "global_step": 13231, "epoch": 315} {"train_loss": -5.06712007522583, "global_step": 13232, "epoch": 315} {"train_loss": -5.16393518447876, "global_step": 13233, "epoch": 315} {"train_loss": -5.2151780128479, "global_step": 13234, "epoch": 315} {"train_loss": -4.893058776855469, "global_step": 13235, "epoch": 315} {"train_loss": -5.268313407897949, "global_step": 13236, "epoch": 315} {"train_loss": -5.1780900955200195, "global_step": 13237, "epoch": 315} {"train_loss": -5.063748359680176, "global_step": 13238, "epoch": 315} {"train_loss": -5.255263328552246, "global_step": 13239, "epoch": 315} {"train_loss": -5.084531784057617, "global_step": 13240, "epoch": 315} {"train_loss": -5.254732131958008, "global_step": 13241, "epoch": 315} {"train_loss": -5.275069713592529, "global_step": 13242, "epoch": 315} {"train_loss": -5.11822509765625, "global_step": 13243, "epoch": 315} {"train_loss": -5.141100883483887, "global_step": 13244, "epoch": 315} {"train_loss": -5.136858940124512, "global_step": 13245, "epoch": 315} {"train_loss": -5.141300678253174, "global_step": 13246, "epoch": 315} {"train_loss": -4.982672691345215, "global_step": 13247, "epoch": 315} {"train_loss": -5.055839538574219, "global_step": 13248, "epoch": 315} {"train_loss": -5.091355323791504, "global_step": 13249, "epoch": 315} {"train_loss": -5.060542106628418, "global_step": 13250, "epoch": 315} {"train_loss": -5.198419570922852, "global_step": 13251, "epoch": 315} {"train_loss": -5.141048431396484, "global_step": 13252, "epoch": 315} {"train_loss": -5.011007308959961, "global_step": 13253, "epoch": 315} {"train_loss": -5.088703155517578, "global_step": 13254, "epoch": 315} {"train_loss": -5.049112319946289, "global_step": 13255, "epoch": 315} {"train_loss": -5.072686672210693, "global_step": 13256, "epoch": 315} {"train_loss": -5.3676652908325195, "global_step": 13257, "epoch": 315} {"train_loss": -4.9573211669921875, "global_step": 13258, "epoch": 315} {"train_loss": -5.076654434204102, "global_step": 13259, "epoch": 315} {"train_loss": -5.1488871574401855, "global_step": 13260, "epoch": 315} {"train_loss": -5.195240497589111, "global_step": 13261, "epoch": 315} {"train_loss": -5.102018356323242, "global_step": 13262, "epoch": 315} {"train_loss": -5.174105167388916, "global_step": 13263, "epoch": 315} {"train_loss": -5.133603572845459, "global_step": 13264, "epoch": 315} {"train_loss": -5.1374359130859375, "global_step": 13265, "epoch": 315} {"train_loss": -5.125216484069824, "global_step": 13266, "epoch": 315} {"train_loss": -5.155433654785156, "global_step": 13267, "epoch": 315} {"train_loss": -5.123064994812012, "global_step": 13268, "epoch": 315} {"train_loss": -5.080273628234863, "global_step": 13269, "epoch": 315} {"train_loss": -5.1864118576049805, "global_step": 13270, "epoch": 315} {"train_loss": -5.133113917850313, "global_step": 13271, "epoch": 315, "val_loss": 72373.109375} {"train_loss": -5.126836776733398, "global_step": 13272, "epoch": 316} {"train_loss": -5.29191255569458, "global_step": 13273, "epoch": 316} {"train_loss": -5.193231582641602, "global_step": 13274, "epoch": 316} {"train_loss": -5.070901870727539, "global_step": 13275, "epoch": 316} {"train_loss": -5.264211654663086, "global_step": 13276, "epoch": 316} {"train_loss": -5.31997013092041, "global_step": 13277, "epoch": 316} {"train_loss": -5.229883193969727, "global_step": 13278, "epoch": 316} {"train_loss": -5.138391494750977, "global_step": 13279, "epoch": 316} {"train_loss": -5.208547592163086, "global_step": 13280, "epoch": 316} {"train_loss": -5.183296203613281, "global_step": 13281, "epoch": 316} {"train_loss": -5.175810813903809, "global_step": 13282, "epoch": 316} {"train_loss": -5.078032970428467, "global_step": 13283, "epoch": 316} {"train_loss": -5.2297515869140625, "global_step": 13284, "epoch": 316} {"train_loss": -5.209761619567871, "global_step": 13285, "epoch": 316} {"train_loss": -5.272898197174072, "global_step": 13286, "epoch": 316} {"train_loss": -5.043821334838867, "global_step": 13287, "epoch": 316} {"train_loss": -5.1353631019592285, "global_step": 13288, "epoch": 316} {"train_loss": -5.181641101837158, "global_step": 13289, "epoch": 316} {"train_loss": -5.213216781616211, "global_step": 13290, "epoch": 316} {"train_loss": -5.279103755950928, "global_step": 13291, "epoch": 316} {"train_loss": -4.931158065795898, "global_step": 13292, "epoch": 316} {"train_loss": -5.225897789001465, "global_step": 13293, "epoch": 316} {"train_loss": -5.0145344734191895, "global_step": 13294, "epoch": 316} {"train_loss": -5.135660648345947, "global_step": 13295, "epoch": 316} {"train_loss": -5.271986961364746, "global_step": 13296, "epoch": 316} {"train_loss": -5.124575138092041, "global_step": 13297, "epoch": 316} {"train_loss": -5.287016868591309, "global_step": 13298, "epoch": 316} {"train_loss": -5.079898357391357, "global_step": 13299, "epoch": 316} {"train_loss": -5.131691932678223, "global_step": 13300, "epoch": 316} {"train_loss": -5.147860527038574, "global_step": 13301, "epoch": 316} {"train_loss": -5.2384819984436035, "global_step": 13302, "epoch": 316} {"train_loss": -5.234448432922363, "global_step": 13303, "epoch": 316} {"train_loss": -5.186846733093262, "global_step": 13304, "epoch": 316} {"train_loss": -5.204754829406738, "global_step": 13305, "epoch": 316} {"train_loss": -5.155300140380859, "global_step": 13306, "epoch": 316} {"train_loss": -5.299038887023926, "global_step": 13307, "epoch": 316} {"train_loss": -5.201766014099121, "global_step": 13308, "epoch": 316} {"train_loss": -5.1417083740234375, "global_step": 13309, "epoch": 316} {"train_loss": -5.32579231262207, "global_step": 13310, "epoch": 316} {"train_loss": -5.163340091705322, "global_step": 13311, "epoch": 316} {"train_loss": -5.172922134399414, "global_step": 13312, "epoch": 316} {"train_loss": -5.180710792541504, "global_step": 13313, "epoch": 316, "val_loss": 72856.3984375} {"train_loss": -5.119846343994141, "global_step": 13314, "epoch": 317} {"train_loss": -5.107507705688477, "global_step": 13315, "epoch": 317} {"train_loss": -5.168749809265137, "global_step": 13316, "epoch": 317} {"train_loss": -5.250776290893555, "global_step": 13317, "epoch": 317} {"train_loss": -5.0952301025390625, "global_step": 13318, "epoch": 317} {"train_loss": -5.2548112869262695, "global_step": 13319, "epoch": 317} {"train_loss": -5.209527015686035, "global_step": 13320, "epoch": 317} {"train_loss": -5.222598552703857, "global_step": 13321, "epoch": 317} {"train_loss": -5.0941057205200195, "global_step": 13322, "epoch": 317} {"train_loss": -5.266712665557861, "global_step": 13323, "epoch": 317} {"train_loss": -5.150984764099121, "global_step": 13324, "epoch": 317} {"train_loss": -5.089988708496094, "global_step": 13325, "epoch": 317} {"train_loss": -5.118559837341309, "global_step": 13326, "epoch": 317} {"train_loss": -5.168239593505859, "global_step": 13327, "epoch": 317} {"train_loss": -5.235612869262695, "global_step": 13328, "epoch": 317} {"train_loss": -5.110569477081299, "global_step": 13329, "epoch": 317} {"train_loss": -5.13845157623291, "global_step": 13330, "epoch": 317} {"train_loss": -5.335758209228516, "global_step": 13331, "epoch": 317} {"train_loss": -5.200314521789551, "global_step": 13332, "epoch": 317} {"train_loss": -5.013474464416504, "global_step": 13333, "epoch": 317} {"train_loss": -5.088395118713379, "global_step": 13334, "epoch": 317} {"train_loss": -5.1419148445129395, "global_step": 13335, "epoch": 317} {"train_loss": -5.029932975769043, "global_step": 13336, "epoch": 317} {"train_loss": -5.168785095214844, "global_step": 13337, "epoch": 317} {"train_loss": -5.039432525634766, "global_step": 13338, "epoch": 317} {"train_loss": -5.106278419494629, "global_step": 13339, "epoch": 317} {"train_loss": -5.100222587585449, "global_step": 13340, "epoch": 317} {"train_loss": -5.134923934936523, "global_step": 13341, "epoch": 317} {"train_loss": -5.161088943481445, "global_step": 13342, "epoch": 317} {"train_loss": -4.97418212890625, "global_step": 13343, "epoch": 317} {"train_loss": -5.215478897094727, "global_step": 13344, "epoch": 317} {"train_loss": -5.144622802734375, "global_step": 13345, "epoch": 317} {"train_loss": -5.072959899902344, "global_step": 13346, "epoch": 317} {"train_loss": -5.261307716369629, "global_step": 13347, "epoch": 317} {"train_loss": -5.189996719360352, "global_step": 13348, "epoch": 317} {"train_loss": -5.0800557136535645, "global_step": 13349, "epoch": 317} {"train_loss": -5.0714006423950195, "global_step": 13350, "epoch": 317} {"train_loss": -5.116397857666016, "global_step": 13351, "epoch": 317} {"train_loss": -4.979520797729492, "global_step": 13352, "epoch": 317} {"train_loss": -5.123201847076416, "global_step": 13353, "epoch": 317} {"train_loss": -5.120632171630859, "global_step": 13354, "epoch": 317} {"train_loss": -5.13776741709028, "global_step": 13355, "epoch": 317, "val_loss": 72910.1875} {"train_loss": -5.212822437286377, "global_step": 13356, "epoch": 318} {"train_loss": -5.206589698791504, "global_step": 13357, "epoch": 318} {"train_loss": -5.001070976257324, "global_step": 13358, "epoch": 318} {"train_loss": -5.299564838409424, "global_step": 13359, "epoch": 318} {"train_loss": -5.071317195892334, "global_step": 13360, "epoch": 318} {"train_loss": -5.2918596267700195, "global_step": 13361, "epoch": 318} {"train_loss": -5.3299994468688965, "global_step": 13362, "epoch": 318} {"train_loss": -4.981687068939209, "global_step": 13363, "epoch": 318} {"train_loss": -5.1302170753479, "global_step": 13364, "epoch": 318} {"train_loss": -5.164853096008301, "global_step": 13365, "epoch": 318} {"train_loss": -5.178654670715332, "global_step": 13366, "epoch": 318} {"train_loss": -5.132349491119385, "global_step": 13367, "epoch": 318} {"train_loss": -5.05665397644043, "global_step": 13368, "epoch": 318} {"train_loss": -5.243391036987305, "global_step": 13369, "epoch": 318} {"train_loss": -5.049567222595215, "global_step": 13370, "epoch": 318} {"train_loss": -5.259794235229492, "global_step": 13371, "epoch": 318} {"train_loss": -5.239040851593018, "global_step": 13372, "epoch": 318} {"train_loss": -5.043058395385742, "global_step": 13373, "epoch": 318} {"train_loss": -5.165483474731445, "global_step": 13374, "epoch": 318} {"train_loss": -5.245641708374023, "global_step": 13375, "epoch": 318} {"train_loss": -5.0791168212890625, "global_step": 13376, "epoch": 318} {"train_loss": -5.120057106018066, "global_step": 13377, "epoch": 318} {"train_loss": -5.046452522277832, "global_step": 13378, "epoch": 318} {"train_loss": -5.192401885986328, "global_step": 13379, "epoch": 318} {"train_loss": -5.274753570556641, "global_step": 13380, "epoch": 318} {"train_loss": -5.144282341003418, "global_step": 13381, "epoch": 318} {"train_loss": -5.153777599334717, "global_step": 13382, "epoch": 318} {"train_loss": -5.2790303230285645, "global_step": 13383, "epoch": 318} {"train_loss": -5.017533779144287, "global_step": 13384, "epoch": 318} {"train_loss": -5.2241315841674805, "global_step": 13385, "epoch": 318} {"train_loss": -5.153761386871338, "global_step": 13386, "epoch": 318} {"train_loss": -5.19754695892334, "global_step": 13387, "epoch": 318} {"train_loss": -5.262478351593018, "global_step": 13388, "epoch": 318} {"train_loss": -5.011778354644775, "global_step": 13389, "epoch": 318} {"train_loss": -5.088779449462891, "global_step": 13390, "epoch": 318} {"train_loss": -5.164008617401123, "global_step": 13391, "epoch": 318} {"train_loss": -5.249778747558594, "global_step": 13392, "epoch": 318} {"train_loss": -5.239826679229736, "global_step": 13393, "epoch": 318} {"train_loss": -5.102811813354492, "global_step": 13394, "epoch": 318} {"train_loss": -5.132089138031006, "global_step": 13395, "epoch": 318} {"train_loss": -5.007837772369385, "global_step": 13396, "epoch": 318} {"train_loss": -5.157800288427444, "global_step": 13397, "epoch": 318, "val_loss": 72551.2421875} {"train_loss": -5.179405212402344, "global_step": 13398, "epoch": 319} {"train_loss": -5.175239086151123, "global_step": 13399, "epoch": 319} {"train_loss": -5.112242221832275, "global_step": 13400, "epoch": 319} {"train_loss": -5.2308349609375, "global_step": 13401, "epoch": 319} {"train_loss": -5.065996170043945, "global_step": 13402, "epoch": 319} {"train_loss": -5.207500457763672, "global_step": 13403, "epoch": 319} {"train_loss": -5.165699481964111, "global_step": 13404, "epoch": 319} {"train_loss": -5.191650867462158, "global_step": 13405, "epoch": 319} {"train_loss": -5.1191301345825195, "global_step": 13406, "epoch": 319} {"train_loss": -5.116976737976074, "global_step": 13407, "epoch": 319} {"train_loss": -5.0479559898376465, "global_step": 13408, "epoch": 319} {"train_loss": -5.171679496765137, "global_step": 13409, "epoch": 319} {"train_loss": -5.146492004394531, "global_step": 13410, "epoch": 319} {"train_loss": -5.151350021362305, "global_step": 13411, "epoch": 319} {"train_loss": -5.301141738891602, "global_step": 13412, "epoch": 319} {"train_loss": -5.1671271324157715, "global_step": 13413, "epoch": 319} {"train_loss": -5.226093292236328, "global_step": 13414, "epoch": 319} {"train_loss": -5.286037445068359, "global_step": 13415, "epoch": 319} {"train_loss": -5.001186370849609, "global_step": 13416, "epoch": 319} {"train_loss": -5.223250389099121, "global_step": 13417, "epoch": 319} {"train_loss": -5.154455184936523, "global_step": 13418, "epoch": 319} {"train_loss": -5.1775712966918945, "global_step": 13419, "epoch": 319} {"train_loss": -5.120221138000488, "global_step": 13420, "epoch": 319} {"train_loss": -5.143528938293457, "global_step": 13421, "epoch": 319} {"train_loss": -5.312330722808838, "global_step": 13422, "epoch": 319} {"train_loss": -5.149930953979492, "global_step": 13423, "epoch": 319} {"train_loss": -5.26839017868042, "global_step": 13424, "epoch": 319} {"train_loss": -5.317357063293457, "global_step": 13425, "epoch": 319} {"train_loss": -5.268352508544922, "global_step": 13426, "epoch": 319} {"train_loss": -5.099020957946777, "global_step": 13427, "epoch": 319} {"train_loss": -5.200096607208252, "global_step": 13428, "epoch": 319} {"train_loss": -5.163129806518555, "global_step": 13429, "epoch": 319} {"train_loss": -5.148801803588867, "global_step": 13430, "epoch": 319} {"train_loss": -5.159740447998047, "global_step": 13431, "epoch": 319} {"train_loss": -5.156494617462158, "global_step": 13432, "epoch": 319} {"train_loss": -5.089568138122559, "global_step": 13433, "epoch": 319} {"train_loss": -5.028663158416748, "global_step": 13434, "epoch": 319} {"train_loss": -5.114240646362305, "global_step": 13435, "epoch": 319} {"train_loss": -5.1362810134887695, "global_step": 13436, "epoch": 319} {"train_loss": -5.024742126464844, "global_step": 13437, "epoch": 319} {"train_loss": -5.294734477996826, "global_step": 13438, "epoch": 319} {"train_loss": -5.156933546066284, "global_step": 13439, "epoch": 319, "val_loss": 75440.703125} {"train_loss": -4.9777512550354, "global_step": 13440, "epoch": 320} {"train_loss": -4.9983320236206055, "global_step": 13441, "epoch": 320} {"train_loss": -5.013223648071289, "global_step": 13442, "epoch": 320} {"train_loss": -5.277978420257568, "global_step": 13443, "epoch": 320} {"train_loss": -4.981555938720703, "global_step": 13444, "epoch": 320} {"train_loss": -5.038786888122559, "global_step": 13445, "epoch": 320} {"train_loss": -5.0113701820373535, "global_step": 13446, "epoch": 320} {"train_loss": -5.145754814147949, "global_step": 13447, "epoch": 320} {"train_loss": -5.062931060791016, "global_step": 13448, "epoch": 320} {"train_loss": -5.263019561767578, "global_step": 13449, "epoch": 320} {"train_loss": -5.085223197937012, "global_step": 13450, "epoch": 320} {"train_loss": -5.089149475097656, "global_step": 13451, "epoch": 320} {"train_loss": -5.213696479797363, "global_step": 13452, "epoch": 320} {"train_loss": -5.080403804779053, "global_step": 13453, "epoch": 320} {"train_loss": -5.1865410804748535, "global_step": 13454, "epoch": 320} {"train_loss": -4.987100124359131, "global_step": 13455, "epoch": 320} {"train_loss": -5.180776596069336, "global_step": 13456, "epoch": 320} {"train_loss": -5.181484222412109, "global_step": 13457, "epoch": 320} {"train_loss": -5.089555740356445, "global_step": 13458, "epoch": 320} {"train_loss": -5.138123035430908, "global_step": 13459, "epoch": 320} {"train_loss": -5.090717315673828, "global_step": 13460, "epoch": 320} {"train_loss": -5.171594142913818, "global_step": 13461, "epoch": 320} {"train_loss": -5.177289962768555, "global_step": 13462, "epoch": 320} {"train_loss": -5.184289932250977, "global_step": 13463, "epoch": 320} {"train_loss": -5.290276527404785, "global_step": 13464, "epoch": 320} {"train_loss": -5.106830596923828, "global_step": 13465, "epoch": 320} {"train_loss": -5.351370811462402, "global_step": 13466, "epoch": 320} {"train_loss": -5.152451515197754, "global_step": 13467, "epoch": 320} {"train_loss": -5.165637969970703, "global_step": 13468, "epoch": 320} {"train_loss": -5.257124423980713, "global_step": 13469, "epoch": 320} {"train_loss": -5.16103982925415, "global_step": 13470, "epoch": 320} {"train_loss": -5.0854949951171875, "global_step": 13471, "epoch": 320} {"train_loss": -5.223036289215088, "global_step": 13472, "epoch": 320} {"train_loss": -5.202881813049316, "global_step": 13473, "epoch": 320} {"train_loss": -5.083807468414307, "global_step": 13474, "epoch": 320} {"train_loss": -5.19190788269043, "global_step": 13475, "epoch": 320} {"train_loss": -5.18714714050293, "global_step": 13476, "epoch": 320} {"train_loss": -5.245429992675781, "global_step": 13477, "epoch": 320} {"train_loss": -5.119248390197754, "global_step": 13478, "epoch": 320} {"train_loss": -5.197142601013184, "global_step": 13479, "epoch": 320} {"train_loss": -5.233348846435547, "global_step": 13480, "epoch": 320} {"train_loss": -5.147446110135033, "global_step": 13481, "epoch": 320, "val_loss": 72748.125} {"train_loss": -5.288039207458496, "global_step": 13482, "epoch": 321} {"train_loss": -5.167882442474365, "global_step": 13483, "epoch": 321} {"train_loss": -5.1555023193359375, "global_step": 13484, "epoch": 321} {"train_loss": -5.215813636779785, "global_step": 13485, "epoch": 321} {"train_loss": -5.2040252685546875, "global_step": 13486, "epoch": 321} {"train_loss": -5.053379535675049, "global_step": 13487, "epoch": 321} {"train_loss": -5.261899948120117, "global_step": 13488, "epoch": 321} {"train_loss": -5.295003890991211, "global_step": 13489, "epoch": 321} {"train_loss": -5.20845890045166, "global_step": 13490, "epoch": 321} {"train_loss": -5.304757118225098, "global_step": 13491, "epoch": 321} {"train_loss": -5.117769241333008, "global_step": 13492, "epoch": 321} {"train_loss": -5.219785690307617, "global_step": 13493, "epoch": 321} {"train_loss": -5.066687107086182, "global_step": 13494, "epoch": 321} {"train_loss": -5.17967414855957, "global_step": 13495, "epoch": 321} {"train_loss": -5.071226596832275, "global_step": 13496, "epoch": 321} {"train_loss": -5.176542282104492, "global_step": 13497, "epoch": 321} {"train_loss": -5.182422637939453, "global_step": 13498, "epoch": 321} {"train_loss": -5.054022789001465, "global_step": 13499, "epoch": 321} {"train_loss": -5.234909534454346, "global_step": 13500, "epoch": 321} {"train_loss": -5.263148307800293, "global_step": 13501, "epoch": 321} {"train_loss": -5.066956520080566, "global_step": 13502, "epoch": 321} {"train_loss": -5.311778545379639, "global_step": 13503, "epoch": 321} {"train_loss": -5.209505081176758, "global_step": 13504, "epoch": 321} {"train_loss": -5.184476852416992, "global_step": 13505, "epoch": 321} {"train_loss": -5.04951286315918, "global_step": 13506, "epoch": 321} {"train_loss": -5.089058876037598, "global_step": 13507, "epoch": 321} {"train_loss": -5.170352935791016, "global_step": 13508, "epoch": 321} {"train_loss": -5.189551830291748, "global_step": 13509, "epoch": 321} {"train_loss": -5.139461040496826, "global_step": 13510, "epoch": 321} {"train_loss": -5.2254319190979, "global_step": 13511, "epoch": 321} {"train_loss": -5.242206573486328, "global_step": 13512, "epoch": 321} {"train_loss": -5.253119468688965, "global_step": 13513, "epoch": 321} {"train_loss": -5.171085357666016, "global_step": 13514, "epoch": 321} {"train_loss": -5.172702789306641, "global_step": 13515, "epoch": 321} {"train_loss": -5.125801086425781, "global_step": 13516, "epoch": 321} {"train_loss": -5.15791130065918, "global_step": 13517, "epoch": 321} {"train_loss": -5.169281959533691, "global_step": 13518, "epoch": 321} {"train_loss": -5.22224235534668, "global_step": 13519, "epoch": 321} {"train_loss": -5.133985996246338, "global_step": 13520, "epoch": 321} {"train_loss": -5.0884809494018555, "global_step": 13521, "epoch": 321} {"train_loss": -5.2778472900390625, "global_step": 13522, "epoch": 321} {"train_loss": -5.184699921380906, "global_step": 13523, "epoch": 321, "val_loss": 73036.671875} {"train_loss": -5.210501194000244, "global_step": 13524, "epoch": 322} {"train_loss": -5.12429141998291, "global_step": 13525, "epoch": 322} {"train_loss": -5.208613395690918, "global_step": 13526, "epoch": 322} {"train_loss": -5.253618240356445, "global_step": 13527, "epoch": 322} {"train_loss": -5.254372596740723, "global_step": 13528, "epoch": 322} {"train_loss": -5.206374168395996, "global_step": 13529, "epoch": 322} {"train_loss": -5.075717449188232, "global_step": 13530, "epoch": 322} {"train_loss": -5.211907863616943, "global_step": 13531, "epoch": 322} {"train_loss": -5.324373722076416, "global_step": 13532, "epoch": 322} {"train_loss": -5.105079650878906, "global_step": 13533, "epoch": 322} {"train_loss": -5.015008449554443, "global_step": 13534, "epoch": 322} {"train_loss": -5.282208442687988, "global_step": 13535, "epoch": 322} {"train_loss": -5.028305530548096, "global_step": 13536, "epoch": 322} {"train_loss": -5.079986572265625, "global_step": 13537, "epoch": 322} {"train_loss": -5.171576499938965, "global_step": 13538, "epoch": 322} {"train_loss": -5.131126403808594, "global_step": 13539, "epoch": 322} {"train_loss": -5.156761169433594, "global_step": 13540, "epoch": 322} {"train_loss": -5.116417407989502, "global_step": 13541, "epoch": 322} {"train_loss": -5.152035713195801, "global_step": 13542, "epoch": 322} {"train_loss": -5.061655044555664, "global_step": 13543, "epoch": 322} {"train_loss": -5.252631664276123, "global_step": 13544, "epoch": 322} {"train_loss": -5.0448808670043945, "global_step": 13545, "epoch": 322} {"train_loss": -5.000560760498047, "global_step": 13546, "epoch": 322} {"train_loss": -5.102783203125, "global_step": 13547, "epoch": 322} {"train_loss": -5.102510452270508, "global_step": 13548, "epoch": 322} {"train_loss": -5.169829368591309, "global_step": 13549, "epoch": 322} {"train_loss": -5.150551795959473, "global_step": 13550, "epoch": 322} {"train_loss": -5.172650337219238, "global_step": 13551, "epoch": 322} {"train_loss": -5.187291145324707, "global_step": 13552, "epoch": 322} {"train_loss": -5.050436496734619, "global_step": 13553, "epoch": 322} {"train_loss": -5.251147270202637, "global_step": 13554, "epoch": 322} {"train_loss": -5.161555290222168, "global_step": 13555, "epoch": 322} {"train_loss": -5.1383376121521, "global_step": 13556, "epoch": 322} {"train_loss": -5.178070068359375, "global_step": 13557, "epoch": 322} {"train_loss": -5.034296035766602, "global_step": 13558, "epoch": 322} {"train_loss": -5.212053298950195, "global_step": 13559, "epoch": 322} {"train_loss": -5.233519554138184, "global_step": 13560, "epoch": 322} {"train_loss": -5.247274875640869, "global_step": 13561, "epoch": 322} {"train_loss": -5.169637203216553, "global_step": 13562, "epoch": 322} {"train_loss": -5.009278297424316, "global_step": 13563, "epoch": 322} {"train_loss": -5.313173294067383, "global_step": 13564, "epoch": 322} {"train_loss": -5.1498000508262995, "global_step": 13565, "epoch": 322, "val_loss": 73376.3125} {"train_loss": -5.149178504943848, "global_step": 13566, "epoch": 323} {"train_loss": -5.147695541381836, "global_step": 13567, "epoch": 323} {"train_loss": -5.176220893859863, "global_step": 13568, "epoch": 323} {"train_loss": -5.031438827514648, "global_step": 13569, "epoch": 323} {"train_loss": -5.154279708862305, "global_step": 13570, "epoch": 323} {"train_loss": -4.969451904296875, "global_step": 13571, "epoch": 323} {"train_loss": -5.193329334259033, "global_step": 13572, "epoch": 323} {"train_loss": -5.193883895874023, "global_step": 13573, "epoch": 323} {"train_loss": -5.03861141204834, "global_step": 13574, "epoch": 323} {"train_loss": -5.306001663208008, "global_step": 13575, "epoch": 323} {"train_loss": -5.061474323272705, "global_step": 13576, "epoch": 323} {"train_loss": -5.215076446533203, "global_step": 13577, "epoch": 323} {"train_loss": -5.071918487548828, "global_step": 13578, "epoch": 323} {"train_loss": -5.165246963500977, "global_step": 13579, "epoch": 323} {"train_loss": -5.096035957336426, "global_step": 13580, "epoch": 323} {"train_loss": -5.173962593078613, "global_step": 13581, "epoch": 323} {"train_loss": -5.184991836547852, "global_step": 13582, "epoch": 323} {"train_loss": -5.184657096862793, "global_step": 13583, "epoch": 323} {"train_loss": -5.12092399597168, "global_step": 13584, "epoch": 323} {"train_loss": -5.3211445808410645, "global_step": 13585, "epoch": 323} {"train_loss": -5.158773422241211, "global_step": 13586, "epoch": 323} {"train_loss": -5.150547027587891, "global_step": 13587, "epoch": 323} {"train_loss": -5.126646518707275, "global_step": 13588, "epoch": 323} {"train_loss": -5.211965084075928, "global_step": 13589, "epoch": 323} {"train_loss": -5.225481986999512, "global_step": 13590, "epoch": 323} {"train_loss": -5.313717842102051, "global_step": 13591, "epoch": 323} {"train_loss": -5.163727283477783, "global_step": 13592, "epoch": 323} {"train_loss": -5.261207580566406, "global_step": 13593, "epoch": 323} {"train_loss": -5.054729461669922, "global_step": 13594, "epoch": 323} {"train_loss": -5.161924362182617, "global_step": 13595, "epoch": 323} {"train_loss": -5.022642612457275, "global_step": 13596, "epoch": 323} {"train_loss": -5.073031425476074, "global_step": 13597, "epoch": 323} {"train_loss": -5.048398017883301, "global_step": 13598, "epoch": 323} {"train_loss": -5.081752777099609, "global_step": 13599, "epoch": 323} {"train_loss": -5.155116081237793, "global_step": 13600, "epoch": 323} {"train_loss": -5.229743003845215, "global_step": 13601, "epoch": 323} {"train_loss": -5.214449405670166, "global_step": 13602, "epoch": 323} {"train_loss": -5.166618347167969, "global_step": 13603, "epoch": 323} {"train_loss": -5.096187591552734, "global_step": 13604, "epoch": 323} {"train_loss": -5.158761501312256, "global_step": 13605, "epoch": 323} {"train_loss": -5.196191787719727, "global_step": 13606, "epoch": 323} {"train_loss": -5.151553222111294, "global_step": 13607, "epoch": 323, "val_loss": 72900.4765625} {"train_loss": -5.030652046203613, "global_step": 13608, "epoch": 324} {"train_loss": -5.213489532470703, "global_step": 13609, "epoch": 324} {"train_loss": -4.965028285980225, "global_step": 13610, "epoch": 324} {"train_loss": -5.325855255126953, "global_step": 13611, "epoch": 324} {"train_loss": -5.358170986175537, "global_step": 13612, "epoch": 324} {"train_loss": -5.1887125968933105, "global_step": 13613, "epoch": 324} {"train_loss": -5.279165267944336, "global_step": 13614, "epoch": 324} {"train_loss": -5.1693010330200195, "global_step": 13615, "epoch": 324} {"train_loss": -5.255083084106445, "global_step": 13616, "epoch": 324} {"train_loss": -5.2798566818237305, "global_step": 13617, "epoch": 324} {"train_loss": -5.1430158615112305, "global_step": 13618, "epoch": 324} {"train_loss": -5.241570949554443, "global_step": 13619, "epoch": 324} {"train_loss": -5.089838981628418, "global_step": 13620, "epoch": 324} {"train_loss": -4.994141578674316, "global_step": 13621, "epoch": 324} {"train_loss": -5.218862533569336, "global_step": 13622, "epoch": 324} {"train_loss": -5.199681758880615, "global_step": 13623, "epoch": 324} {"train_loss": -5.235591888427734, "global_step": 13624, "epoch": 324} {"train_loss": -5.3741559982299805, "global_step": 13625, "epoch": 324} {"train_loss": -5.216967582702637, "global_step": 13626, "epoch": 324} {"train_loss": -5.189990997314453, "global_step": 13627, "epoch": 324} {"train_loss": -5.218358039855957, "global_step": 13628, "epoch": 324} {"train_loss": -5.240545272827148, "global_step": 13629, "epoch": 324} {"train_loss": -5.259797096252441, "global_step": 13630, "epoch": 324} {"train_loss": -5.134551048278809, "global_step": 13631, "epoch": 324} {"train_loss": -5.187707901000977, "global_step": 13632, "epoch": 324} {"train_loss": -5.258820056915283, "global_step": 13633, "epoch": 324} {"train_loss": -5.111238479614258, "global_step": 13634, "epoch": 324} {"train_loss": -5.361729621887207, "global_step": 13635, "epoch": 324} {"train_loss": -4.961885452270508, "global_step": 13636, "epoch": 324} {"train_loss": -5.092790603637695, "global_step": 13637, "epoch": 324} {"train_loss": -5.110471248626709, "global_step": 13638, "epoch": 324} {"train_loss": -5.144901275634766, "global_step": 13639, "epoch": 324} {"train_loss": -5.053890228271484, "global_step": 13640, "epoch": 324} {"train_loss": -5.187545299530029, "global_step": 13641, "epoch": 324} {"train_loss": -5.238980770111084, "global_step": 13642, "epoch": 324} {"train_loss": -5.126689910888672, "global_step": 13643, "epoch": 324} {"train_loss": -5.237781047821045, "global_step": 13644, "epoch": 324} {"train_loss": -5.143344879150391, "global_step": 13645, "epoch": 324} {"train_loss": -5.002337455749512, "global_step": 13646, "epoch": 324} {"train_loss": -5.108806133270264, "global_step": 13647, "epoch": 324} {"train_loss": -5.246517181396484, "global_step": 13648, "epoch": 324} {"train_loss": -5.180522759755452, "global_step": 13649, "epoch": 324, "val_loss": 73450.7265625} {"train_loss": -4.995635509490967, "global_step": 13650, "epoch": 325} {"train_loss": -5.187410831451416, "global_step": 13651, "epoch": 325} {"train_loss": -5.059772491455078, "global_step": 13652, "epoch": 325} {"train_loss": -5.123317718505859, "global_step": 13653, "epoch": 325} {"train_loss": -5.141822814941406, "global_step": 13654, "epoch": 325} {"train_loss": -5.022966384887695, "global_step": 13655, "epoch": 325} {"train_loss": -5.124258041381836, "global_step": 13656, "epoch": 325} {"train_loss": -5.236132621765137, "global_step": 13657, "epoch": 325} {"train_loss": -5.104411602020264, "global_step": 13658, "epoch": 325} {"train_loss": -5.20750617980957, "global_step": 13659, "epoch": 325} {"train_loss": -5.080474853515625, "global_step": 13660, "epoch": 325} {"train_loss": -5.185197353363037, "global_step": 13661, "epoch": 325} {"train_loss": -5.1552324295043945, "global_step": 13662, "epoch": 325} {"train_loss": -5.200432300567627, "global_step": 13663, "epoch": 325} {"train_loss": -5.280076026916504, "global_step": 13664, "epoch": 325} {"train_loss": -5.2764892578125, "global_step": 13665, "epoch": 325} {"train_loss": -5.297463893890381, "global_step": 13666, "epoch": 325} {"train_loss": -5.292275428771973, "global_step": 13667, "epoch": 325} {"train_loss": -5.039979934692383, "global_step": 13668, "epoch": 325} {"train_loss": -5.302319526672363, "global_step": 13669, "epoch": 325} {"train_loss": -5.038751125335693, "global_step": 13670, "epoch": 325} {"train_loss": -5.195718765258789, "global_step": 13671, "epoch": 325} {"train_loss": -5.27211856842041, "global_step": 13672, "epoch": 325} {"train_loss": -5.138864517211914, "global_step": 13673, "epoch": 325} {"train_loss": -5.171303749084473, "global_step": 13674, "epoch": 325} {"train_loss": -5.206597805023193, "global_step": 13675, "epoch": 325} {"train_loss": -5.077345848083496, "global_step": 13676, "epoch": 325} {"train_loss": -5.252261638641357, "global_step": 13677, "epoch": 325} {"train_loss": -5.241262435913086, "global_step": 13678, "epoch": 325} {"train_loss": -5.202675819396973, "global_step": 13679, "epoch": 325} {"train_loss": -5.168824195861816, "global_step": 13680, "epoch": 325} {"train_loss": -5.125617980957031, "global_step": 13681, "epoch": 325} {"train_loss": -5.125184059143066, "global_step": 13682, "epoch": 325} {"train_loss": -5.147562503814697, "global_step": 13683, "epoch": 325} {"train_loss": -5.096513748168945, "global_step": 13684, "epoch": 325} {"train_loss": -5.361238479614258, "global_step": 13685, "epoch": 325} {"train_loss": -5.191048622131348, "global_step": 13686, "epoch": 325} {"train_loss": -5.224871635437012, "global_step": 13687, "epoch": 325} {"train_loss": -5.246892929077148, "global_step": 13688, "epoch": 325} {"train_loss": -5.225566864013672, "global_step": 13689, "epoch": 325} {"train_loss": -5.182220458984375, "global_step": 13690, "epoch": 325} {"train_loss": -5.174092338198707, "global_step": 13691, "epoch": 325, "val_loss": 72508.9296875} {"train_loss": -5.157426357269287, "global_step": 13692, "epoch": 326} {"train_loss": -5.171600341796875, "global_step": 13693, "epoch": 326} {"train_loss": -5.227246284484863, "global_step": 13694, "epoch": 326} {"train_loss": -5.072912216186523, "global_step": 13695, "epoch": 326} {"train_loss": -5.209859848022461, "global_step": 13696, "epoch": 326} {"train_loss": -5.1931471824646, "global_step": 13697, "epoch": 326} {"train_loss": -5.145479202270508, "global_step": 13698, "epoch": 326} {"train_loss": -5.022713661193848, "global_step": 13699, "epoch": 326} {"train_loss": -5.171027660369873, "global_step": 13700, "epoch": 326} {"train_loss": -5.031268119812012, "global_step": 13701, "epoch": 326} {"train_loss": -5.289068222045898, "global_step": 13702, "epoch": 326} {"train_loss": -5.157849311828613, "global_step": 13703, "epoch": 326} {"train_loss": -4.975492477416992, "global_step": 13704, "epoch": 326} {"train_loss": -5.280131816864014, "global_step": 13705, "epoch": 326} {"train_loss": -5.278420925140381, "global_step": 13706, "epoch": 326} {"train_loss": -5.124176979064941, "global_step": 13707, "epoch": 326} {"train_loss": -5.288936138153076, "global_step": 13708, "epoch": 326} {"train_loss": -5.012875556945801, "global_step": 13709, "epoch": 326} {"train_loss": -5.287839889526367, "global_step": 13710, "epoch": 326} {"train_loss": -5.345642566680908, "global_step": 13711, "epoch": 326} {"train_loss": -5.276047229766846, "global_step": 13712, "epoch": 326} {"train_loss": -5.147535800933838, "global_step": 13713, "epoch": 326} {"train_loss": -5.201231002807617, "global_step": 13714, "epoch": 326} {"train_loss": -5.224768161773682, "global_step": 13715, "epoch": 326} {"train_loss": -5.186764717102051, "global_step": 13716, "epoch": 326} {"train_loss": -5.207973480224609, "global_step": 13717, "epoch": 326} {"train_loss": -5.17376708984375, "global_step": 13718, "epoch": 326} {"train_loss": -5.150424003601074, "global_step": 13719, "epoch": 326} {"train_loss": -5.329928398132324, "global_step": 13720, "epoch": 326} {"train_loss": -5.260765075683594, "global_step": 13721, "epoch": 326} {"train_loss": -5.312981605529785, "global_step": 13722, "epoch": 326} {"train_loss": -5.094749450683594, "global_step": 13723, "epoch": 326} {"train_loss": -5.195387840270996, "global_step": 13724, "epoch": 326} {"train_loss": -5.210370063781738, "global_step": 13725, "epoch": 326} {"train_loss": -5.260689735412598, "global_step": 13726, "epoch": 326} {"train_loss": -4.997032642364502, "global_step": 13727, "epoch": 326} {"train_loss": -5.096247673034668, "global_step": 13728, "epoch": 326} {"train_loss": -5.225459098815918, "global_step": 13729, "epoch": 326} {"train_loss": -5.1533918380737305, "global_step": 13730, "epoch": 326} {"train_loss": -4.859704971313477, "global_step": 13731, "epoch": 326} {"train_loss": -5.205049991607666, "global_step": 13732, "epoch": 326} {"train_loss": -5.173544531776791, "global_step": 13733, "epoch": 326, "val_loss": 74501.8515625} {"train_loss": -5.01670503616333, "global_step": 13734, "epoch": 327} {"train_loss": -5.14794921875, "global_step": 13735, "epoch": 327} {"train_loss": -4.99459171295166, "global_step": 13736, "epoch": 327} {"train_loss": -5.08807897567749, "global_step": 13737, "epoch": 327} {"train_loss": -5.087554931640625, "global_step": 13738, "epoch": 327} {"train_loss": -4.92913818359375, "global_step": 13739, "epoch": 327} {"train_loss": -5.165991306304932, "global_step": 13740, "epoch": 327} {"train_loss": -5.066040515899658, "global_step": 13741, "epoch": 327} {"train_loss": -5.057013511657715, "global_step": 13742, "epoch": 327} {"train_loss": -5.240607261657715, "global_step": 13743, "epoch": 327} {"train_loss": -5.1170759201049805, "global_step": 13744, "epoch": 327} {"train_loss": -5.098938941955566, "global_step": 13745, "epoch": 327} {"train_loss": -5.17106819152832, "global_step": 13746, "epoch": 327} {"train_loss": -5.21364688873291, "global_step": 13747, "epoch": 327} {"train_loss": -5.265519618988037, "global_step": 13748, "epoch": 327} {"train_loss": -5.161433219909668, "global_step": 13749, "epoch": 327} {"train_loss": -5.259069442749023, "global_step": 13750, "epoch": 327} {"train_loss": -5.1465373039245605, "global_step": 13751, "epoch": 327} {"train_loss": -5.096940994262695, "global_step": 13752, "epoch": 327} {"train_loss": -5.187081336975098, "global_step": 13753, "epoch": 327} {"train_loss": -5.285343170166016, "global_step": 13754, "epoch": 327} {"train_loss": -5.123766899108887, "global_step": 13755, "epoch": 327} {"train_loss": -5.0815863609313965, "global_step": 13756, "epoch": 327} {"train_loss": -5.17003870010376, "global_step": 13757, "epoch": 327} {"train_loss": -5.108151435852051, "global_step": 13758, "epoch": 327} {"train_loss": -4.986809730529785, "global_step": 13759, "epoch": 327} {"train_loss": -5.0991692543029785, "global_step": 13760, "epoch": 327} {"train_loss": -5.181012153625488, "global_step": 13761, "epoch": 327} {"train_loss": -5.023257255554199, "global_step": 13762, "epoch": 327} {"train_loss": -5.197957992553711, "global_step": 13763, "epoch": 327} {"train_loss": -5.001097202301025, "global_step": 13764, "epoch": 327} {"train_loss": -5.198566436767578, "global_step": 13765, "epoch": 327} {"train_loss": -5.145547866821289, "global_step": 13766, "epoch": 327} {"train_loss": -5.044596195220947, "global_step": 13767, "epoch": 327} {"train_loss": -5.10600471496582, "global_step": 13768, "epoch": 327} {"train_loss": -5.111908912658691, "global_step": 13769, "epoch": 327} {"train_loss": -5.201714515686035, "global_step": 13770, "epoch": 327} {"train_loss": -4.986448287963867, "global_step": 13771, "epoch": 327} {"train_loss": -5.1413655281066895, "global_step": 13772, "epoch": 327} {"train_loss": -5.220216751098633, "global_step": 13773, "epoch": 327} {"train_loss": -5.167762756347656, "global_step": 13774, "epoch": 327} {"train_loss": -5.123039574850173, "global_step": 13775, "epoch": 327, "val_loss": 73470.4140625} {"train_loss": -5.1517333984375, "global_step": 13776, "epoch": 328} {"train_loss": -5.167413234710693, "global_step": 13777, "epoch": 328} {"train_loss": -5.137686729431152, "global_step": 13778, "epoch": 328} {"train_loss": -5.0540452003479, "global_step": 13779, "epoch": 328} {"train_loss": -5.121990203857422, "global_step": 13780, "epoch": 328} {"train_loss": -5.152881622314453, "global_step": 13781, "epoch": 328} {"train_loss": -5.235212802886963, "global_step": 13782, "epoch": 328} {"train_loss": -5.202861785888672, "global_step": 13783, "epoch": 328} {"train_loss": -5.211312294006348, "global_step": 13784, "epoch": 328} {"train_loss": -5.172739505767822, "global_step": 13785, "epoch": 328} {"train_loss": -5.107430458068848, "global_step": 13786, "epoch": 328} {"train_loss": -5.283936500549316, "global_step": 13787, "epoch": 328} {"train_loss": -5.099889755249023, "global_step": 13788, "epoch": 328} {"train_loss": -5.198699951171875, "global_step": 13789, "epoch": 328} {"train_loss": -5.221848487854004, "global_step": 13790, "epoch": 328} {"train_loss": -5.109364032745361, "global_step": 13791, "epoch": 328} {"train_loss": -5.2555389404296875, "global_step": 13792, "epoch": 328} {"train_loss": -5.254471778869629, "global_step": 13793, "epoch": 328} {"train_loss": -5.211548805236816, "global_step": 13794, "epoch": 328} {"train_loss": -5.18178129196167, "global_step": 13795, "epoch": 328} {"train_loss": -5.26287841796875, "global_step": 13796, "epoch": 328} {"train_loss": -5.169748306274414, "global_step": 13797, "epoch": 328} {"train_loss": -5.2530341148376465, "global_step": 13798, "epoch": 328} {"train_loss": -5.060852527618408, "global_step": 13799, "epoch": 328} {"train_loss": -5.223653793334961, "global_step": 13800, "epoch": 328} {"train_loss": -5.2862701416015625, "global_step": 13801, "epoch": 328} {"train_loss": -5.176171779632568, "global_step": 13802, "epoch": 328} {"train_loss": -5.298763275146484, "global_step": 13803, "epoch": 328} {"train_loss": -5.140511512756348, "global_step": 13804, "epoch": 328} {"train_loss": -5.263288497924805, "global_step": 13805, "epoch": 328} {"train_loss": -5.235301971435547, "global_step": 13806, "epoch": 328} {"train_loss": -5.188117980957031, "global_step": 13807, "epoch": 328} {"train_loss": -5.078203201293945, "global_step": 13808, "epoch": 328} {"train_loss": -5.100201606750488, "global_step": 13809, "epoch": 328} {"train_loss": -5.000884056091309, "global_step": 13810, "epoch": 328} {"train_loss": -5.189764976501465, "global_step": 13811, "epoch": 328} {"train_loss": -5.173233985900879, "global_step": 13812, "epoch": 328} {"train_loss": -5.3129682540893555, "global_step": 13813, "epoch": 328} {"train_loss": -5.091248989105225, "global_step": 13814, "epoch": 328} {"train_loss": -5.248692989349365, "global_step": 13815, "epoch": 328} {"train_loss": -5.166202545166016, "global_step": 13816, "epoch": 328} {"train_loss": -5.1812660694122314, "global_step": 13817, "epoch": 328, "val_loss": 72388.09375} {"train_loss": -5.190376281738281, "global_step": 13818, "epoch": 329} {"train_loss": -5.131019592285156, "global_step": 13819, "epoch": 329} {"train_loss": -5.135298728942871, "global_step": 13820, "epoch": 329} {"train_loss": -5.2157487869262695, "global_step": 13821, "epoch": 329} {"train_loss": -5.247498512268066, "global_step": 13822, "epoch": 329} {"train_loss": -5.117310523986816, "global_step": 13823, "epoch": 329} {"train_loss": -5.2873687744140625, "global_step": 13824, "epoch": 329} {"train_loss": -5.1698317527771, "global_step": 13825, "epoch": 329} {"train_loss": -5.008112907409668, "global_step": 13826, "epoch": 329} {"train_loss": -5.124630451202393, "global_step": 13827, "epoch": 329} {"train_loss": -5.293149471282959, "global_step": 13828, "epoch": 329} {"train_loss": -5.129337310791016, "global_step": 13829, "epoch": 329} {"train_loss": -5.219357490539551, "global_step": 13830, "epoch": 329} {"train_loss": -5.208609580993652, "global_step": 13831, "epoch": 329} {"train_loss": -5.086554527282715, "global_step": 13832, "epoch": 329} {"train_loss": -5.345665454864502, "global_step": 13833, "epoch": 329} {"train_loss": -5.209851264953613, "global_step": 13834, "epoch": 329} {"train_loss": -5.1763200759887695, "global_step": 13835, "epoch": 329} {"train_loss": -5.289859771728516, "global_step": 13836, "epoch": 329} {"train_loss": -5.125788688659668, "global_step": 13837, "epoch": 329} {"train_loss": -5.165805816650391, "global_step": 13838, "epoch": 329} {"train_loss": -5.207938194274902, "global_step": 13839, "epoch": 329} {"train_loss": -5.052850723266602, "global_step": 13840, "epoch": 329} {"train_loss": -5.177736282348633, "global_step": 13841, "epoch": 329} {"train_loss": -5.253211498260498, "global_step": 13842, "epoch": 329} {"train_loss": -5.179652214050293, "global_step": 13843, "epoch": 329} {"train_loss": -5.229623317718506, "global_step": 13844, "epoch": 329} {"train_loss": -5.1837568283081055, "global_step": 13845, "epoch": 329} {"train_loss": -5.1959381103515625, "global_step": 13846, "epoch": 329} {"train_loss": -5.184015274047852, "global_step": 13847, "epoch": 329} {"train_loss": -5.156946182250977, "global_step": 13848, "epoch": 329} {"train_loss": -5.000648498535156, "global_step": 13849, "epoch": 329} {"train_loss": -5.186716079711914, "global_step": 13850, "epoch": 329} {"train_loss": -5.2675065994262695, "global_step": 13851, "epoch": 329} {"train_loss": -5.228001117706299, "global_step": 13852, "epoch": 329} {"train_loss": -5.199819087982178, "global_step": 13853, "epoch": 329} {"train_loss": -5.229532718658447, "global_step": 13854, "epoch": 329} {"train_loss": -5.04624080657959, "global_step": 13855, "epoch": 329} {"train_loss": -5.199857711791992, "global_step": 13856, "epoch": 329} {"train_loss": -5.1992902755737305, "global_step": 13857, "epoch": 329} {"train_loss": -5.201740741729736, "global_step": 13858, "epoch": 329} {"train_loss": -5.182345640091669, "global_step": 13859, "epoch": 329, "val_loss": 72488.171875} {"train_loss": -5.206417560577393, "global_step": 13860, "epoch": 330} {"train_loss": -5.171253204345703, "global_step": 13861, "epoch": 330} {"train_loss": -5.19252347946167, "global_step": 13862, "epoch": 330} {"train_loss": -5.170571327209473, "global_step": 13863, "epoch": 330} {"train_loss": -5.143069267272949, "global_step": 13864, "epoch": 330} {"train_loss": -5.133932590484619, "global_step": 13865, "epoch": 330} {"train_loss": -5.1792097091674805, "global_step": 13866, "epoch": 330} {"train_loss": -5.221796035766602, "global_step": 13867, "epoch": 330} {"train_loss": -5.2215118408203125, "global_step": 13868, "epoch": 330} {"train_loss": -5.228303909301758, "global_step": 13869, "epoch": 330} {"train_loss": -5.1641058921813965, "global_step": 13870, "epoch": 330} {"train_loss": -5.283046245574951, "global_step": 13871, "epoch": 330} {"train_loss": -5.1482415199279785, "global_step": 13872, "epoch": 330} {"train_loss": -5.1480021476745605, "global_step": 13873, "epoch": 330} {"train_loss": -5.098825931549072, "global_step": 13874, "epoch": 330} {"train_loss": -5.266916751861572, "global_step": 13875, "epoch": 330} {"train_loss": -5.317115783691406, "global_step": 13876, "epoch": 330} {"train_loss": -5.180440425872803, "global_step": 13877, "epoch": 330} {"train_loss": -5.211031436920166, "global_step": 13878, "epoch": 330} {"train_loss": -5.267587661743164, "global_step": 13879, "epoch": 330} {"train_loss": -5.182185173034668, "global_step": 13880, "epoch": 330} {"train_loss": -5.088574409484863, "global_step": 13881, "epoch": 330} {"train_loss": -5.205201625823975, "global_step": 13882, "epoch": 330} {"train_loss": -5.181454658508301, "global_step": 13883, "epoch": 330} {"train_loss": -5.153724193572998, "global_step": 13884, "epoch": 330} {"train_loss": -5.137677192687988, "global_step": 13885, "epoch": 330} {"train_loss": -5.312978744506836, "global_step": 13886, "epoch": 330} {"train_loss": -5.286226272583008, "global_step": 13887, "epoch": 330} {"train_loss": -5.245100975036621, "global_step": 13888, "epoch": 330} {"train_loss": -5.255533218383789, "global_step": 13889, "epoch": 330} {"train_loss": -5.136712074279785, "global_step": 13890, "epoch": 330} {"train_loss": -5.196111679077148, "global_step": 13891, "epoch": 330} {"train_loss": -5.176290512084961, "global_step": 13892, "epoch": 330} {"train_loss": -5.3051652908325195, "global_step": 13893, "epoch": 330} {"train_loss": -5.193906784057617, "global_step": 13894, "epoch": 330} {"train_loss": -5.174895763397217, "global_step": 13895, "epoch": 330} {"train_loss": -5.184648513793945, "global_step": 13896, "epoch": 330} {"train_loss": -5.301918029785156, "global_step": 13897, "epoch": 330} {"train_loss": -5.144496917724609, "global_step": 13898, "epoch": 330} {"train_loss": -5.322532653808594, "global_step": 13899, "epoch": 330} {"train_loss": -5.23605489730835, "global_step": 13900, "epoch": 330} {"train_loss": -5.201981737500145, "global_step": 13901, "epoch": 330, "val_loss": 72982.109375} {"train_loss": -5.229872703552246, "global_step": 13902, "epoch": 331} {"train_loss": -5.185397148132324, "global_step": 13903, "epoch": 331} {"train_loss": -5.142841339111328, "global_step": 13904, "epoch": 331} {"train_loss": -5.2479448318481445, "global_step": 13905, "epoch": 331} {"train_loss": -5.057473182678223, "global_step": 13906, "epoch": 331} {"train_loss": -5.332744598388672, "global_step": 13907, "epoch": 331} {"train_loss": -5.262766361236572, "global_step": 13908, "epoch": 331} {"train_loss": -5.006473541259766, "global_step": 13909, "epoch": 331} {"train_loss": -5.151212692260742, "global_step": 13910, "epoch": 331} {"train_loss": -5.141271591186523, "global_step": 13911, "epoch": 331} {"train_loss": -5.27885103225708, "global_step": 13912, "epoch": 331} {"train_loss": -5.309516429901123, "global_step": 13913, "epoch": 331} {"train_loss": -5.286140441894531, "global_step": 13914, "epoch": 331} {"train_loss": -5.31060791015625, "global_step": 13915, "epoch": 331} {"train_loss": -5.127091407775879, "global_step": 13916, "epoch": 331} {"train_loss": -5.129017353057861, "global_step": 13917, "epoch": 331} {"train_loss": -5.3008856773376465, "global_step": 13918, "epoch": 331} {"train_loss": -5.257643699645996, "global_step": 13919, "epoch": 331} {"train_loss": -5.234915733337402, "global_step": 13920, "epoch": 331} {"train_loss": -5.219663619995117, "global_step": 13921, "epoch": 331} {"train_loss": -5.149651527404785, "global_step": 13922, "epoch": 331} {"train_loss": -5.2331929206848145, "global_step": 13923, "epoch": 331} {"train_loss": -5.069999694824219, "global_step": 13924, "epoch": 331} {"train_loss": -5.265525817871094, "global_step": 13925, "epoch": 331} {"train_loss": -5.242703437805176, "global_step": 13926, "epoch": 331} {"train_loss": -5.113801956176758, "global_step": 13927, "epoch": 331} {"train_loss": -5.228742599487305, "global_step": 13928, "epoch": 331} {"train_loss": -5.349630355834961, "global_step": 13929, "epoch": 331} {"train_loss": -5.168585300445557, "global_step": 13930, "epoch": 331} {"train_loss": -5.362760543823242, "global_step": 13931, "epoch": 331} {"train_loss": -5.034645080566406, "global_step": 13932, "epoch": 331} {"train_loss": -5.063353538513184, "global_step": 13933, "epoch": 331} {"train_loss": -5.211613178253174, "global_step": 13934, "epoch": 331} {"train_loss": -5.057126522064209, "global_step": 13935, "epoch": 331} {"train_loss": -5.217694282531738, "global_step": 13936, "epoch": 331} {"train_loss": -5.245279312133789, "global_step": 13937, "epoch": 331} {"train_loss": -5.065055847167969, "global_step": 13938, "epoch": 331} {"train_loss": -5.145275592803955, "global_step": 13939, "epoch": 331} {"train_loss": -5.229905128479004, "global_step": 13940, "epoch": 331} {"train_loss": -5.206496238708496, "global_step": 13941, "epoch": 331} {"train_loss": -5.211245536804199, "global_step": 13942, "epoch": 331} {"train_loss": -5.196752105440412, "global_step": 13943, "epoch": 331, "val_loss": 73027.8515625} {"train_loss": -5.248380661010742, "global_step": 13944, "epoch": 332} {"train_loss": -5.186431884765625, "global_step": 13945, "epoch": 332} {"train_loss": -5.202370643615723, "global_step": 13946, "epoch": 332} {"train_loss": -5.287576675415039, "global_step": 13947, "epoch": 332} {"train_loss": -5.282227516174316, "global_step": 13948, "epoch": 332} {"train_loss": -5.123469829559326, "global_step": 13949, "epoch": 332} {"train_loss": -5.220081329345703, "global_step": 13950, "epoch": 332} {"train_loss": -5.125962257385254, "global_step": 13951, "epoch": 332} {"train_loss": -5.1457109451293945, "global_step": 13952, "epoch": 332} {"train_loss": -5.153470993041992, "global_step": 13953, "epoch": 332} {"train_loss": -5.227352142333984, "global_step": 13954, "epoch": 332} {"train_loss": -5.144172191619873, "global_step": 13955, "epoch": 332} {"train_loss": -5.085389614105225, "global_step": 13956, "epoch": 332} {"train_loss": -4.985658645629883, "global_step": 13957, "epoch": 332} {"train_loss": -4.968472957611084, "global_step": 13958, "epoch": 332} {"train_loss": -5.106194972991943, "global_step": 13959, "epoch": 332} {"train_loss": -4.920476913452148, "global_step": 13960, "epoch": 332} {"train_loss": -4.971118927001953, "global_step": 13961, "epoch": 332} {"train_loss": -5.126001358032227, "global_step": 13962, "epoch": 332} {"train_loss": -4.9480719566345215, "global_step": 13963, "epoch": 332} {"train_loss": -5.077103614807129, "global_step": 13964, "epoch": 332} {"train_loss": -5.03518009185791, "global_step": 13965, "epoch": 332} {"train_loss": -5.116187572479248, "global_step": 13966, "epoch": 332} {"train_loss": -5.097718238830566, "global_step": 13967, "epoch": 332} {"train_loss": -5.057128429412842, "global_step": 13968, "epoch": 332} {"train_loss": -5.258450031280518, "global_step": 13969, "epoch": 332} {"train_loss": -5.138814926147461, "global_step": 13970, "epoch": 332} {"train_loss": -5.151225566864014, "global_step": 13971, "epoch": 332} {"train_loss": -5.084839820861816, "global_step": 13972, "epoch": 332} {"train_loss": -5.117132663726807, "global_step": 13973, "epoch": 332} {"train_loss": -5.222592830657959, "global_step": 13974, "epoch": 332} {"train_loss": -5.122833728790283, "global_step": 13975, "epoch": 332} {"train_loss": -5.222002983093262, "global_step": 13976, "epoch": 332} {"train_loss": -5.196193695068359, "global_step": 13977, "epoch": 332} {"train_loss": -5.043233871459961, "global_step": 13978, "epoch": 332} {"train_loss": -4.983066558837891, "global_step": 13979, "epoch": 332} {"train_loss": -5.126255035400391, "global_step": 13980, "epoch": 332} {"train_loss": -5.181094169616699, "global_step": 13981, "epoch": 332} {"train_loss": -5.192934513092041, "global_step": 13982, "epoch": 332} {"train_loss": -5.059024810791016, "global_step": 13983, "epoch": 332} {"train_loss": -5.0716705322265625, "global_step": 13984, "epoch": 332} {"train_loss": -5.124783890587943, "global_step": 13985, "epoch": 332, "val_loss": 72299.03125} {"train_loss": -5.185856819152832, "global_step": 13986, "epoch": 333} {"train_loss": -5.109598159790039, "global_step": 13987, "epoch": 333} {"train_loss": -5.237768173217773, "global_step": 13988, "epoch": 333} {"train_loss": -5.125837802886963, "global_step": 13989, "epoch": 333} {"train_loss": -5.06272029876709, "global_step": 13990, "epoch": 333} {"train_loss": -5.222842693328857, "global_step": 13991, "epoch": 333} {"train_loss": -5.23239803314209, "global_step": 13992, "epoch": 333} {"train_loss": -5.264087677001953, "global_step": 13993, "epoch": 333} {"train_loss": -5.233715534210205, "global_step": 13994, "epoch": 333} {"train_loss": -5.166266441345215, "global_step": 13995, "epoch": 333} {"train_loss": -5.246096611022949, "global_step": 13996, "epoch": 333} {"train_loss": -5.150394439697266, "global_step": 13997, "epoch": 333} {"train_loss": -5.32530403137207, "global_step": 13998, "epoch": 333} {"train_loss": -5.219638824462891, "global_step": 13999, "epoch": 333} {"train_loss": -5.138298511505127, "global_step": 14000, "epoch": 333} {"train_loss": -5.156525611877441, "global_step": 14001, "epoch": 333} {"train_loss": -5.2486677169799805, "global_step": 14002, "epoch": 333} {"train_loss": -5.042268753051758, "global_step": 14003, "epoch": 333} {"train_loss": -5.307535648345947, "global_step": 14004, "epoch": 333} {"train_loss": -5.175027847290039, "global_step": 14005, "epoch": 333} {"train_loss": -5.151217460632324, "global_step": 14006, "epoch": 333} {"train_loss": -5.265547752380371, "global_step": 14007, "epoch": 333} {"train_loss": -5.292227745056152, "global_step": 14008, "epoch": 333} {"train_loss": -5.148375511169434, "global_step": 14009, "epoch": 333} {"train_loss": -5.287049770355225, "global_step": 14010, "epoch": 333} {"train_loss": -5.210979461669922, "global_step": 14011, "epoch": 333} {"train_loss": -5.145565986633301, "global_step": 14012, "epoch": 333} {"train_loss": -5.105101108551025, "global_step": 14013, "epoch": 333} {"train_loss": -5.16656494140625, "global_step": 14014, "epoch": 333} {"train_loss": -5.161568641662598, "global_step": 14015, "epoch": 333} {"train_loss": -5.23157262802124, "global_step": 14016, "epoch": 333} {"train_loss": -5.063288688659668, "global_step": 14017, "epoch": 333} {"train_loss": -5.1983819007873535, "global_step": 14018, "epoch": 333} {"train_loss": -5.12828254699707, "global_step": 14019, "epoch": 333} {"train_loss": -5.291945934295654, "global_step": 14020, "epoch": 333} {"train_loss": -5.291748523712158, "global_step": 14021, "epoch": 333} {"train_loss": -5.233941078186035, "global_step": 14022, "epoch": 333} {"train_loss": -5.161853790283203, "global_step": 14023, "epoch": 333} {"train_loss": -5.192685127258301, "global_step": 14024, "epoch": 333} {"train_loss": -5.308686256408691, "global_step": 14025, "epoch": 333} {"train_loss": -5.151190280914307, "global_step": 14026, "epoch": 333} {"train_loss": -5.195405335653396, "global_step": 14027, "epoch": 333, "val_loss": 72749.71875} {"train_loss": -5.13749885559082, "global_step": 14028, "epoch": 334} {"train_loss": -5.265631675720215, "global_step": 14029, "epoch": 334} {"train_loss": -5.131415367126465, "global_step": 14030, "epoch": 334} {"train_loss": -5.156327247619629, "global_step": 14031, "epoch": 334} {"train_loss": -5.257914066314697, "global_step": 14032, "epoch": 334} {"train_loss": -4.964892864227295, "global_step": 14033, "epoch": 334} {"train_loss": -5.144583702087402, "global_step": 14034, "epoch": 334} {"train_loss": -5.154119491577148, "global_step": 14035, "epoch": 334} {"train_loss": -5.144020080566406, "global_step": 14036, "epoch": 334} {"train_loss": -5.253442287445068, "global_step": 14037, "epoch": 334} {"train_loss": -5.2178850173950195, "global_step": 14038, "epoch": 334} {"train_loss": -5.112828254699707, "global_step": 14039, "epoch": 334} {"train_loss": -5.237046241760254, "global_step": 14040, "epoch": 334} {"train_loss": -5.322615623474121, "global_step": 14041, "epoch": 334} {"train_loss": -5.1004438400268555, "global_step": 14042, "epoch": 334} {"train_loss": -5.176546573638916, "global_step": 14043, "epoch": 334} {"train_loss": -5.108759880065918, "global_step": 14044, "epoch": 334} {"train_loss": -5.145394325256348, "global_step": 14045, "epoch": 334} {"train_loss": -5.2218523025512695, "global_step": 14046, "epoch": 334} {"train_loss": -5.221182823181152, "global_step": 14047, "epoch": 334} {"train_loss": -5.164008617401123, "global_step": 14048, "epoch": 334} {"train_loss": -5.275931358337402, "global_step": 14049, "epoch": 334} {"train_loss": -5.113718032836914, "global_step": 14050, "epoch": 334} {"train_loss": -5.218212127685547, "global_step": 14051, "epoch": 334} {"train_loss": -5.153509616851807, "global_step": 14052, "epoch": 334} {"train_loss": -5.252631187438965, "global_step": 14053, "epoch": 334} {"train_loss": -5.085700988769531, "global_step": 14054, "epoch": 334} {"train_loss": -5.275299549102783, "global_step": 14055, "epoch": 334} {"train_loss": -5.310689449310303, "global_step": 14056, "epoch": 334} {"train_loss": -5.181708335876465, "global_step": 14057, "epoch": 334} {"train_loss": -5.161081314086914, "global_step": 14058, "epoch": 334} {"train_loss": -5.248932838439941, "global_step": 14059, "epoch": 334} {"train_loss": -5.1504340171813965, "global_step": 14060, "epoch": 334} {"train_loss": -5.153012275695801, "global_step": 14061, "epoch": 334} {"train_loss": -5.204511642456055, "global_step": 14062, "epoch": 334} {"train_loss": -5.250674247741699, "global_step": 14063, "epoch": 334} {"train_loss": -5.116923809051514, "global_step": 14064, "epoch": 334} {"train_loss": -5.185184478759766, "global_step": 14065, "epoch": 334} {"train_loss": -4.993490219116211, "global_step": 14066, "epoch": 334} {"train_loss": -5.02646541595459, "global_step": 14067, "epoch": 334} {"train_loss": -5.232035160064697, "global_step": 14068, "epoch": 334} {"train_loss": -5.171342645372663, "global_step": 14069, "epoch": 334, "val_loss": 72691.8125} {"train_loss": -5.257442951202393, "global_step": 14070, "epoch": 335} {"train_loss": -5.33661413192749, "global_step": 14071, "epoch": 335} {"train_loss": -5.015424728393555, "global_step": 14072, "epoch": 335} {"train_loss": -5.079738140106201, "global_step": 14073, "epoch": 335} {"train_loss": -4.959317207336426, "global_step": 14074, "epoch": 335} {"train_loss": -5.133612632751465, "global_step": 14075, "epoch": 335} {"train_loss": -5.1351141929626465, "global_step": 14076, "epoch": 335} {"train_loss": -5.057657241821289, "global_step": 14077, "epoch": 335} {"train_loss": -4.978188991546631, "global_step": 14078, "epoch": 335} {"train_loss": -5.034882068634033, "global_step": 14079, "epoch": 335} {"train_loss": -5.168591022491455, "global_step": 14080, "epoch": 335} {"train_loss": -5.12293815612793, "global_step": 14081, "epoch": 335} {"train_loss": -5.175373077392578, "global_step": 14082, "epoch": 335} {"train_loss": -5.007122993469238, "global_step": 14083, "epoch": 335} {"train_loss": -5.03980827331543, "global_step": 14084, "epoch": 335} {"train_loss": -5.166632652282715, "global_step": 14085, "epoch": 335} {"train_loss": -4.953064918518066, "global_step": 14086, "epoch": 335} {"train_loss": -5.193758964538574, "global_step": 14087, "epoch": 335} {"train_loss": -5.042388439178467, "global_step": 14088, "epoch": 335} {"train_loss": -5.205385684967041, "global_step": 14089, "epoch": 335} {"train_loss": -5.135542869567871, "global_step": 14090, "epoch": 335} {"train_loss": -5.064889907836914, "global_step": 14091, "epoch": 335} {"train_loss": -5.0224080085754395, "global_step": 14092, "epoch": 335} {"train_loss": -5.167845726013184, "global_step": 14093, "epoch": 335} {"train_loss": -5.065298080444336, "global_step": 14094, "epoch": 335} {"train_loss": -5.125371932983398, "global_step": 14095, "epoch": 335} {"train_loss": -5.241335868835449, "global_step": 14096, "epoch": 335} {"train_loss": -5.046634674072266, "global_step": 14097, "epoch": 335} {"train_loss": -5.332612037658691, "global_step": 14098, "epoch": 335} {"train_loss": -5.05108642578125, "global_step": 14099, "epoch": 335} {"train_loss": -5.251252174377441, "global_step": 14100, "epoch": 335} {"train_loss": -5.158087730407715, "global_step": 14101, "epoch": 335} {"train_loss": -5.096719741821289, "global_step": 14102, "epoch": 335} {"train_loss": -5.175939559936523, "global_step": 14103, "epoch": 335} {"train_loss": -5.20588493347168, "global_step": 14104, "epoch": 335} {"train_loss": -5.185882568359375, "global_step": 14105, "epoch": 335} {"train_loss": -5.257309913635254, "global_step": 14106, "epoch": 335} {"train_loss": -5.075316905975342, "global_step": 14107, "epoch": 335} {"train_loss": -5.146701812744141, "global_step": 14108, "epoch": 335} {"train_loss": -5.130925178527832, "global_step": 14109, "epoch": 335} {"train_loss": -5.222919940948486, "global_step": 14110, "epoch": 335} {"train_loss": -5.125670137859526, "global_step": 14111, "epoch": 335, "val_loss": 72358.9453125} {"train_loss": -5.2313127517700195, "global_step": 14112, "epoch": 336} {"train_loss": -5.196173667907715, "global_step": 14113, "epoch": 336} {"train_loss": -5.225059509277344, "global_step": 14114, "epoch": 336} {"train_loss": -5.19671630859375, "global_step": 14115, "epoch": 336} {"train_loss": -5.303271293640137, "global_step": 14116, "epoch": 336} {"train_loss": -5.2176384925842285, "global_step": 14117, "epoch": 336} {"train_loss": -5.2287116050720215, "global_step": 14118, "epoch": 336} {"train_loss": -5.197632789611816, "global_step": 14119, "epoch": 336} {"train_loss": -5.22566556930542, "global_step": 14120, "epoch": 336} {"train_loss": -5.300412654876709, "global_step": 14121, "epoch": 336} {"train_loss": -5.222602367401123, "global_step": 14122, "epoch": 336} {"train_loss": -5.131040573120117, "global_step": 14123, "epoch": 336} {"train_loss": -5.28765344619751, "global_step": 14124, "epoch": 336} {"train_loss": -5.35414981842041, "global_step": 14125, "epoch": 336} {"train_loss": -5.19168758392334, "global_step": 14126, "epoch": 336} {"train_loss": -5.203366279602051, "global_step": 14127, "epoch": 336} {"train_loss": -5.126048564910889, "global_step": 14128, "epoch": 336} {"train_loss": -5.26010799407959, "global_step": 14129, "epoch": 336} {"train_loss": -5.196050643920898, "global_step": 14130, "epoch": 336} {"train_loss": -5.071086883544922, "global_step": 14131, "epoch": 336} {"train_loss": -5.231649398803711, "global_step": 14132, "epoch": 336} {"train_loss": -5.181486129760742, "global_step": 14133, "epoch": 336} {"train_loss": -5.205450057983398, "global_step": 14134, "epoch": 336} {"train_loss": -5.097454071044922, "global_step": 14135, "epoch": 336} {"train_loss": -5.104755401611328, "global_step": 14136, "epoch": 336} {"train_loss": -4.9981279373168945, "global_step": 14137, "epoch": 336} {"train_loss": -5.033844470977783, "global_step": 14138, "epoch": 336} {"train_loss": -5.223422527313232, "global_step": 14139, "epoch": 336} {"train_loss": -5.0785627365112305, "global_step": 14140, "epoch": 336} {"train_loss": -5.209353923797607, "global_step": 14141, "epoch": 336} {"train_loss": -5.052457809448242, "global_step": 14142, "epoch": 336} {"train_loss": -5.042794227600098, "global_step": 14143, "epoch": 336} {"train_loss": -5.0633039474487305, "global_step": 14144, "epoch": 336} {"train_loss": -5.038867950439453, "global_step": 14145, "epoch": 336} {"train_loss": -5.160009384155273, "global_step": 14146, "epoch": 336} {"train_loss": -5.10336971282959, "global_step": 14147, "epoch": 336} {"train_loss": -5.162293910980225, "global_step": 14148, "epoch": 336} {"train_loss": -5.218135833740234, "global_step": 14149, "epoch": 336} {"train_loss": -5.132515907287598, "global_step": 14150, "epoch": 336} {"train_loss": -5.156824111938477, "global_step": 14151, "epoch": 336} {"train_loss": -5.194447994232178, "global_step": 14152, "epoch": 336} {"train_loss": -5.171548377899897, "global_step": 14153, "epoch": 336, "val_loss": 72151.828125} {"train_loss": -5.091348648071289, "global_step": 14154, "epoch": 337} {"train_loss": -5.02161979675293, "global_step": 14155, "epoch": 337} {"train_loss": -5.169560432434082, "global_step": 14156, "epoch": 337} {"train_loss": -5.285978317260742, "global_step": 14157, "epoch": 337} {"train_loss": -5.191056251525879, "global_step": 14158, "epoch": 337} {"train_loss": -5.195047378540039, "global_step": 14159, "epoch": 337} {"train_loss": -5.177522659301758, "global_step": 14160, "epoch": 337} {"train_loss": -5.185946464538574, "global_step": 14161, "epoch": 337} {"train_loss": -5.185142517089844, "global_step": 14162, "epoch": 337} {"train_loss": -5.331453323364258, "global_step": 14163, "epoch": 337} {"train_loss": -5.267024517059326, "global_step": 14164, "epoch": 337} {"train_loss": -5.257339000701904, "global_step": 14165, "epoch": 337} {"train_loss": -5.174886226654053, "global_step": 14166, "epoch": 337} {"train_loss": -5.299190044403076, "global_step": 14167, "epoch": 337} {"train_loss": -5.294536590576172, "global_step": 14168, "epoch": 337} {"train_loss": -5.227099895477295, "global_step": 14169, "epoch": 337} {"train_loss": -5.174091339111328, "global_step": 14170, "epoch": 337} {"train_loss": -5.240114688873291, "global_step": 14171, "epoch": 337} {"train_loss": -5.017876625061035, "global_step": 14172, "epoch": 337} {"train_loss": -5.252584934234619, "global_step": 14173, "epoch": 337} {"train_loss": -5.318572044372559, "global_step": 14174, "epoch": 337} {"train_loss": -5.205593109130859, "global_step": 14175, "epoch": 337} {"train_loss": -5.199465274810791, "global_step": 14176, "epoch": 337} {"train_loss": -5.3865647315979, "global_step": 14177, "epoch": 337} {"train_loss": -5.029539108276367, "global_step": 14178, "epoch": 337} {"train_loss": -5.259116172790527, "global_step": 14179, "epoch": 337} {"train_loss": -5.171062469482422, "global_step": 14180, "epoch": 337} {"train_loss": -5.184057235717773, "global_step": 14181, "epoch": 337} {"train_loss": -5.131809234619141, "global_step": 14182, "epoch": 337} {"train_loss": -5.173740386962891, "global_step": 14183, "epoch": 337} {"train_loss": -5.195578098297119, "global_step": 14184, "epoch": 337} {"train_loss": -5.185747146606445, "global_step": 14185, "epoch": 337} {"train_loss": -5.307391166687012, "global_step": 14186, "epoch": 337} {"train_loss": -5.1867828369140625, "global_step": 14187, "epoch": 337} {"train_loss": -5.188416481018066, "global_step": 14188, "epoch": 337} {"train_loss": -5.17900276184082, "global_step": 14189, "epoch": 337} {"train_loss": -5.341989994049072, "global_step": 14190, "epoch": 337} {"train_loss": -5.075721740722656, "global_step": 14191, "epoch": 337} {"train_loss": -5.206225395202637, "global_step": 14192, "epoch": 337} {"train_loss": -5.212780952453613, "global_step": 14193, "epoch": 337} {"train_loss": -5.241118907928467, "global_step": 14194, "epoch": 337} {"train_loss": -5.205418075834002, "global_step": 14195, "epoch": 337, "val_loss": 72070.0859375} {"train_loss": -5.109480857849121, "global_step": 14196, "epoch": 338} {"train_loss": -5.178235054016113, "global_step": 14197, "epoch": 338} {"train_loss": -5.204005241394043, "global_step": 14198, "epoch": 338} {"train_loss": -5.131707191467285, "global_step": 14199, "epoch": 338} {"train_loss": -5.339601516723633, "global_step": 14200, "epoch": 338} {"train_loss": -5.21501350402832, "global_step": 14201, "epoch": 338} {"train_loss": -5.187753677368164, "global_step": 14202, "epoch": 338} {"train_loss": -5.228862285614014, "global_step": 14203, "epoch": 338} {"train_loss": -5.139732360839844, "global_step": 14204, "epoch": 338} {"train_loss": -5.236213684082031, "global_step": 14205, "epoch": 338} {"train_loss": -5.247057914733887, "global_step": 14206, "epoch": 338} {"train_loss": -5.211775779724121, "global_step": 14207, "epoch": 338} {"train_loss": -5.283100605010986, "global_step": 14208, "epoch": 338} {"train_loss": -5.088067054748535, "global_step": 14209, "epoch": 338} {"train_loss": -5.17794132232666, "global_step": 14210, "epoch": 338} {"train_loss": -5.3401689529418945, "global_step": 14211, "epoch": 338} {"train_loss": -5.163000106811523, "global_step": 14212, "epoch": 338} {"train_loss": -5.274394989013672, "global_step": 14213, "epoch": 338} {"train_loss": -5.190098762512207, "global_step": 14214, "epoch": 338} {"train_loss": -5.186703681945801, "global_step": 14215, "epoch": 338} {"train_loss": -5.165691375732422, "global_step": 14216, "epoch": 338} {"train_loss": -5.175467491149902, "global_step": 14217, "epoch": 338} {"train_loss": -5.097108364105225, "global_step": 14218, "epoch": 338} {"train_loss": -5.258057117462158, "global_step": 14219, "epoch": 338} {"train_loss": -5.282323837280273, "global_step": 14220, "epoch": 338} {"train_loss": -5.153712272644043, "global_step": 14221, "epoch": 338} {"train_loss": -5.184544086456299, "global_step": 14222, "epoch": 338} {"train_loss": -5.316375732421875, "global_step": 14223, "epoch": 338} {"train_loss": -5.390473365783691, "global_step": 14224, "epoch": 338} {"train_loss": -5.03267240524292, "global_step": 14225, "epoch": 338} {"train_loss": -5.253384590148926, "global_step": 14226, "epoch": 338} {"train_loss": -5.154285430908203, "global_step": 14227, "epoch": 338} {"train_loss": -5.194526672363281, "global_step": 14228, "epoch": 338} {"train_loss": -5.251270294189453, "global_step": 14229, "epoch": 338} {"train_loss": -5.196781158447266, "global_step": 14230, "epoch": 338} {"train_loss": -5.229218006134033, "global_step": 14231, "epoch": 338} {"train_loss": -5.270018100738525, "global_step": 14232, "epoch": 338} {"train_loss": -5.180995464324951, "global_step": 14233, "epoch": 338} {"train_loss": -5.227809906005859, "global_step": 14234, "epoch": 338} {"train_loss": -5.310741901397705, "global_step": 14235, "epoch": 338} {"train_loss": -5.291491508483887, "global_step": 14236, "epoch": 338} {"train_loss": -5.215738455454509, "global_step": 14237, "epoch": 338, "val_loss": 72276.4375} {"train_loss": -4.971848487854004, "global_step": 14238, "epoch": 339} {"train_loss": -5.2812180519104, "global_step": 14239, "epoch": 339} {"train_loss": -5.095790863037109, "global_step": 14240, "epoch": 339} {"train_loss": -5.252839088439941, "global_step": 14241, "epoch": 339} {"train_loss": -5.296645164489746, "global_step": 14242, "epoch": 339} {"train_loss": -5.339998245239258, "global_step": 14243, "epoch": 339} {"train_loss": -5.2047319412231445, "global_step": 14244, "epoch": 339} {"train_loss": -5.190272331237793, "global_step": 14245, "epoch": 339} {"train_loss": -5.139101982116699, "global_step": 14246, "epoch": 339} {"train_loss": -5.217039108276367, "global_step": 14247, "epoch": 339} {"train_loss": -5.078648567199707, "global_step": 14248, "epoch": 339} {"train_loss": -5.257793426513672, "global_step": 14249, "epoch": 339} {"train_loss": -5.154689788818359, "global_step": 14250, "epoch": 339} {"train_loss": -5.161115646362305, "global_step": 14251, "epoch": 339} {"train_loss": -5.003354072570801, "global_step": 14252, "epoch": 339} {"train_loss": -5.284345626831055, "global_step": 14253, "epoch": 339} {"train_loss": -5.26115083694458, "global_step": 14254, "epoch": 339} {"train_loss": -5.076930046081543, "global_step": 14255, "epoch": 339} {"train_loss": -5.09500789642334, "global_step": 14256, "epoch": 339} {"train_loss": -5.3027663230896, "global_step": 14257, "epoch": 339} {"train_loss": -5.137607097625732, "global_step": 14258, "epoch": 339} {"train_loss": -5.131860733032227, "global_step": 14259, "epoch": 339} {"train_loss": -5.205369472503662, "global_step": 14260, "epoch": 339} {"train_loss": -5.242653846740723, "global_step": 14261, "epoch": 339} {"train_loss": -5.322330951690674, "global_step": 14262, "epoch": 339} {"train_loss": -5.1537556648254395, "global_step": 14263, "epoch": 339} {"train_loss": -5.143882751464844, "global_step": 14264, "epoch": 339} {"train_loss": -5.263978004455566, "global_step": 14265, "epoch": 339} {"train_loss": -5.168820858001709, "global_step": 14266, "epoch": 339} {"train_loss": -5.168711185455322, "global_step": 14267, "epoch": 339} {"train_loss": -4.981540203094482, "global_step": 14268, "epoch": 339} {"train_loss": -5.220141410827637, "global_step": 14269, "epoch": 339} {"train_loss": -5.137271881103516, "global_step": 14270, "epoch": 339} {"train_loss": -5.136468887329102, "global_step": 14271, "epoch": 339} {"train_loss": -5.217983245849609, "global_step": 14272, "epoch": 339} {"train_loss": -5.099762916564941, "global_step": 14273, "epoch": 339} {"train_loss": -4.96186637878418, "global_step": 14274, "epoch": 339} {"train_loss": -5.1994805335998535, "global_step": 14275, "epoch": 339} {"train_loss": -5.043416500091553, "global_step": 14276, "epoch": 339} {"train_loss": -5.163957595825195, "global_step": 14277, "epoch": 339} {"train_loss": -5.2340407371521, "global_step": 14278, "epoch": 339} {"train_loss": -5.166832992008755, "global_step": 14279, "epoch": 339, "val_loss": 72276.1953125} {"train_loss": -5.10040283203125, "global_step": 14280, "epoch": 340} {"train_loss": -4.997025489807129, "global_step": 14281, "epoch": 340} {"train_loss": -5.145349979400635, "global_step": 14282, "epoch": 340} {"train_loss": -5.158655643463135, "global_step": 14283, "epoch": 340} {"train_loss": -4.947750568389893, "global_step": 14284, "epoch": 340} {"train_loss": -5.1639509201049805, "global_step": 14285, "epoch": 340} {"train_loss": -5.02745246887207, "global_step": 14286, "epoch": 340} {"train_loss": -5.163627624511719, "global_step": 14287, "epoch": 340} {"train_loss": -5.139459609985352, "global_step": 14288, "epoch": 340} {"train_loss": -5.0946044921875, "global_step": 14289, "epoch": 340} {"train_loss": -5.158121109008789, "global_step": 14290, "epoch": 340} {"train_loss": -5.1892290115356445, "global_step": 14291, "epoch": 340} {"train_loss": -5.270853042602539, "global_step": 14292, "epoch": 340} {"train_loss": -5.203644752502441, "global_step": 14293, "epoch": 340} {"train_loss": -5.172396659851074, "global_step": 14294, "epoch": 340} {"train_loss": -5.273401260375977, "global_step": 14295, "epoch": 340} {"train_loss": -5.175463676452637, "global_step": 14296, "epoch": 340} {"train_loss": -5.207076072692871, "global_step": 14297, "epoch": 340} {"train_loss": -5.207591533660889, "global_step": 14298, "epoch": 340} {"train_loss": -5.284348487854004, "global_step": 14299, "epoch": 340} {"train_loss": -5.247613906860352, "global_step": 14300, "epoch": 340} {"train_loss": -5.287419319152832, "global_step": 14301, "epoch": 340} {"train_loss": -5.340203762054443, "global_step": 14302, "epoch": 340} {"train_loss": -5.102182388305664, "global_step": 14303, "epoch": 340} {"train_loss": -5.206760883331299, "global_step": 14304, "epoch": 340} {"train_loss": -5.197776794433594, "global_step": 14305, "epoch": 340} {"train_loss": -5.199404716491699, "global_step": 14306, "epoch": 340} {"train_loss": -5.211370944976807, "global_step": 14307, "epoch": 340} {"train_loss": -5.258031368255615, "global_step": 14308, "epoch": 340} {"train_loss": -5.2190446853637695, "global_step": 14309, "epoch": 340} {"train_loss": -5.298837184906006, "global_step": 14310, "epoch": 340} {"train_loss": -5.055484294891357, "global_step": 14311, "epoch": 340} {"train_loss": -5.356107711791992, "global_step": 14312, "epoch": 340} {"train_loss": -5.329335689544678, "global_step": 14313, "epoch": 340} {"train_loss": -5.264433860778809, "global_step": 14314, "epoch": 340} {"train_loss": -5.237210273742676, "global_step": 14315, "epoch": 340} {"train_loss": -5.2345991134643555, "global_step": 14316, "epoch": 340} {"train_loss": -5.238577365875244, "global_step": 14317, "epoch": 340} {"train_loss": -5.15110969543457, "global_step": 14318, "epoch": 340} {"train_loss": -5.383532524108887, "global_step": 14319, "epoch": 340} {"train_loss": -5.211437225341797, "global_step": 14320, "epoch": 340} {"train_loss": -5.1979973543257945, "global_step": 14321, "epoch": 340, "val_loss": 71602.703125} {"train_loss": -5.227344512939453, "global_step": 14322, "epoch": 341} {"train_loss": -5.2414655685424805, "global_step": 14323, "epoch": 341} {"train_loss": -5.154445648193359, "global_step": 14324, "epoch": 341} {"train_loss": -5.194773197174072, "global_step": 14325, "epoch": 341} {"train_loss": -5.104397296905518, "global_step": 14326, "epoch": 341} {"train_loss": -5.137159824371338, "global_step": 14327, "epoch": 341} {"train_loss": -5.423684597015381, "global_step": 14328, "epoch": 341} {"train_loss": -5.364413261413574, "global_step": 14329, "epoch": 341} {"train_loss": -5.209829330444336, "global_step": 14330, "epoch": 341} {"train_loss": -5.241450309753418, "global_step": 14331, "epoch": 341} {"train_loss": -5.209674835205078, "global_step": 14332, "epoch": 341} {"train_loss": -5.233101844787598, "global_step": 14333, "epoch": 341} {"train_loss": -5.265508651733398, "global_step": 14334, "epoch": 341} {"train_loss": -5.280895709991455, "global_step": 14335, "epoch": 341} {"train_loss": -5.241060256958008, "global_step": 14336, "epoch": 341} {"train_loss": -5.296487808227539, "global_step": 14337, "epoch": 341} {"train_loss": -5.204118728637695, "global_step": 14338, "epoch": 341} {"train_loss": -5.182680606842041, "global_step": 14339, "epoch": 341} {"train_loss": -5.156196594238281, "global_step": 14340, "epoch": 341} {"train_loss": -5.057428359985352, "global_step": 14341, "epoch": 341} {"train_loss": -5.206602096557617, "global_step": 14342, "epoch": 341} {"train_loss": -5.174959182739258, "global_step": 14343, "epoch": 341} {"train_loss": -5.125972270965576, "global_step": 14344, "epoch": 341} {"train_loss": -5.144243240356445, "global_step": 14345, "epoch": 341} {"train_loss": -5.230075836181641, "global_step": 14346, "epoch": 341} {"train_loss": -5.1112470626831055, "global_step": 14347, "epoch": 341} {"train_loss": -5.1017842292785645, "global_step": 14348, "epoch": 341} {"train_loss": -5.146784782409668, "global_step": 14349, "epoch": 341} {"train_loss": -5.142653942108154, "global_step": 14350, "epoch": 341} {"train_loss": -5.244490623474121, "global_step": 14351, "epoch": 341} {"train_loss": -5.136714458465576, "global_step": 14352, "epoch": 341} {"train_loss": -4.977502346038818, "global_step": 14353, "epoch": 341} {"train_loss": -5.180422782897949, "global_step": 14354, "epoch": 341} {"train_loss": -5.211519241333008, "global_step": 14355, "epoch": 341} {"train_loss": -5.106865882873535, "global_step": 14356, "epoch": 341} {"train_loss": -5.077571868896484, "global_step": 14357, "epoch": 341} {"train_loss": -5.154977321624756, "global_step": 14358, "epoch": 341} {"train_loss": -5.223516464233398, "global_step": 14359, "epoch": 341} {"train_loss": -5.1872148513793945, "global_step": 14360, "epoch": 341} {"train_loss": -5.073697090148926, "global_step": 14361, "epoch": 341} {"train_loss": -5.085944175720215, "global_step": 14362, "epoch": 341} {"train_loss": -5.179739077885945, "global_step": 14363, "epoch": 341, "val_loss": 72694.0859375} {"train_loss": -5.273792743682861, "global_step": 14364, "epoch": 342} {"train_loss": -5.141208648681641, "global_step": 14365, "epoch": 342} {"train_loss": -5.045729637145996, "global_step": 14366, "epoch": 342} {"train_loss": -5.055287837982178, "global_step": 14367, "epoch": 342} {"train_loss": -5.073786735534668, "global_step": 14368, "epoch": 342} {"train_loss": -5.2272233963012695, "global_step": 14369, "epoch": 342} {"train_loss": -5.152083873748779, "global_step": 14370, "epoch": 342} {"train_loss": -5.234889030456543, "global_step": 14371, "epoch": 342} {"train_loss": -5.234017848968506, "global_step": 14372, "epoch": 342} {"train_loss": -5.167442321777344, "global_step": 14373, "epoch": 342} {"train_loss": -5.249514579772949, "global_step": 14374, "epoch": 342} {"train_loss": -5.149479866027832, "global_step": 14375, "epoch": 342} {"train_loss": -5.191920280456543, "global_step": 14376, "epoch": 342} {"train_loss": -5.377333641052246, "global_step": 14377, "epoch": 342} {"train_loss": -5.163665294647217, "global_step": 14378, "epoch": 342} {"train_loss": -5.199387550354004, "global_step": 14379, "epoch": 342} {"train_loss": -5.243459701538086, "global_step": 14380, "epoch": 342} {"train_loss": -5.2777299880981445, "global_step": 14381, "epoch": 342} {"train_loss": -5.248599052429199, "global_step": 14382, "epoch": 342} {"train_loss": -5.150790214538574, "global_step": 14383, "epoch": 342} {"train_loss": -5.2178754806518555, "global_step": 14384, "epoch": 342} {"train_loss": -5.343979835510254, "global_step": 14385, "epoch": 342} {"train_loss": -5.3627753257751465, "global_step": 14386, "epoch": 342} {"train_loss": -5.111654758453369, "global_step": 14387, "epoch": 342} {"train_loss": -5.338019847869873, "global_step": 14388, "epoch": 342} {"train_loss": -5.065990447998047, "global_step": 14389, "epoch": 342} {"train_loss": -5.233697891235352, "global_step": 14390, "epoch": 342} {"train_loss": -5.113168239593506, "global_step": 14391, "epoch": 342} {"train_loss": -5.100010871887207, "global_step": 14392, "epoch": 342} {"train_loss": -5.104991912841797, "global_step": 14393, "epoch": 342} {"train_loss": -5.162857532501221, "global_step": 14394, "epoch": 342} {"train_loss": -5.07426118850708, "global_step": 14395, "epoch": 342} {"train_loss": -4.999262809753418, "global_step": 14396, "epoch": 342} {"train_loss": -5.178854465484619, "global_step": 14397, "epoch": 342} {"train_loss": -5.021335601806641, "global_step": 14398, "epoch": 342} {"train_loss": -4.982262134552002, "global_step": 14399, "epoch": 342} {"train_loss": -5.144065856933594, "global_step": 14400, "epoch": 342} {"train_loss": -4.9461669921875, "global_step": 14401, "epoch": 342} {"train_loss": -5.235265731811523, "global_step": 14402, "epoch": 342} {"train_loss": -5.18571662902832, "global_step": 14403, "epoch": 342} {"train_loss": -5.123701095581055, "global_step": 14404, "epoch": 342} {"train_loss": -5.168690624691191, "global_step": 14405, "epoch": 342, "val_loss": 71984.5625} {"train_loss": -5.1251630783081055, "global_step": 14406, "epoch": 343} {"train_loss": -5.184067726135254, "global_step": 14407, "epoch": 343} {"train_loss": -5.0867815017700195, "global_step": 14408, "epoch": 343} {"train_loss": -5.190455436706543, "global_step": 14409, "epoch": 343} {"train_loss": -5.0647783279418945, "global_step": 14410, "epoch": 343} {"train_loss": -5.111147880554199, "global_step": 14411, "epoch": 343} {"train_loss": -5.160935401916504, "global_step": 14412, "epoch": 343} {"train_loss": -5.286495208740234, "global_step": 14413, "epoch": 343} {"train_loss": -5.253269672393799, "global_step": 14414, "epoch": 343} {"train_loss": -5.228096008300781, "global_step": 14415, "epoch": 343} {"train_loss": -5.262319087982178, "global_step": 14416, "epoch": 343} {"train_loss": -5.267603874206543, "global_step": 14417, "epoch": 343} {"train_loss": -5.197366714477539, "global_step": 14418, "epoch": 343} {"train_loss": -5.151769638061523, "global_step": 14419, "epoch": 343} {"train_loss": -5.208554267883301, "global_step": 14420, "epoch": 343} {"train_loss": -5.311689376831055, "global_step": 14421, "epoch": 343} {"train_loss": -5.133343696594238, "global_step": 14422, "epoch": 343} {"train_loss": -5.129363536834717, "global_step": 14423, "epoch": 343} {"train_loss": -5.270533084869385, "global_step": 14424, "epoch": 343} {"train_loss": -5.360673904418945, "global_step": 14425, "epoch": 343} {"train_loss": -5.252006530761719, "global_step": 14426, "epoch": 343} {"train_loss": -5.204791069030762, "global_step": 14427, "epoch": 343} {"train_loss": -5.257512092590332, "global_step": 14428, "epoch": 343} {"train_loss": -5.2728986740112305, "global_step": 14429, "epoch": 343} {"train_loss": -5.21589994430542, "global_step": 14430, "epoch": 343} {"train_loss": -5.1409125328063965, "global_step": 14431, "epoch": 343} {"train_loss": -5.125886917114258, "global_step": 14432, "epoch": 343} {"train_loss": -5.295156478881836, "global_step": 14433, "epoch": 343} {"train_loss": -5.092888355255127, "global_step": 14434, "epoch": 343} {"train_loss": -5.352497100830078, "global_step": 14435, "epoch": 343} {"train_loss": -5.2446184158325195, "global_step": 14436, "epoch": 343} {"train_loss": -5.1316728591918945, "global_step": 14437, "epoch": 343} {"train_loss": -5.089779853820801, "global_step": 14438, "epoch": 343} {"train_loss": -5.320052623748779, "global_step": 14439, "epoch": 343} {"train_loss": -5.178340911865234, "global_step": 14440, "epoch": 343} {"train_loss": -5.318378448486328, "global_step": 14441, "epoch": 343} {"train_loss": -5.121063232421875, "global_step": 14442, "epoch": 343} {"train_loss": -5.240610122680664, "global_step": 14443, "epoch": 343} {"train_loss": -5.2709503173828125, "global_step": 14444, "epoch": 343} {"train_loss": -4.945858955383301, "global_step": 14445, "epoch": 343} {"train_loss": -4.988433361053467, "global_step": 14446, "epoch": 343} {"train_loss": -5.195501248041789, "global_step": 14447, "epoch": 343, "val_loss": 72409.3984375} {"train_loss": -4.944091796875, "global_step": 14448, "epoch": 344} {"train_loss": -4.992441177368164, "global_step": 14449, "epoch": 344} {"train_loss": -5.067905426025391, "global_step": 14450, "epoch": 344} {"train_loss": -4.9673309326171875, "global_step": 14451, "epoch": 344} {"train_loss": -5.24353551864624, "global_step": 14452, "epoch": 344} {"train_loss": -5.177008628845215, "global_step": 14453, "epoch": 344} {"train_loss": -4.985480785369873, "global_step": 14454, "epoch": 344} {"train_loss": -5.060211658477783, "global_step": 14455, "epoch": 344} {"train_loss": -5.1472625732421875, "global_step": 14456, "epoch": 344} {"train_loss": -5.144320964813232, "global_step": 14457, "epoch": 344} {"train_loss": -5.007353782653809, "global_step": 14458, "epoch": 344} {"train_loss": -5.263730049133301, "global_step": 14459, "epoch": 344} {"train_loss": -5.049695014953613, "global_step": 14460, "epoch": 344} {"train_loss": -5.2920074462890625, "global_step": 14461, "epoch": 344} {"train_loss": -5.17236852645874, "global_step": 14462, "epoch": 344} {"train_loss": -5.189787864685059, "global_step": 14463, "epoch": 344} {"train_loss": -5.112265110015869, "global_step": 14464, "epoch": 344} {"train_loss": -5.2191691398620605, "global_step": 14465, "epoch": 344} {"train_loss": -5.201323986053467, "global_step": 14466, "epoch": 344} {"train_loss": -5.124378204345703, "global_step": 14467, "epoch": 344} {"train_loss": -5.335023880004883, "global_step": 14468, "epoch": 344} {"train_loss": -5.202454566955566, "global_step": 14469, "epoch": 344} {"train_loss": -5.108757495880127, "global_step": 14470, "epoch": 344} {"train_loss": -5.12550687789917, "global_step": 14471, "epoch": 344} {"train_loss": -5.067511558532715, "global_step": 14472, "epoch": 344} {"train_loss": -5.155192852020264, "global_step": 14473, "epoch": 344} {"train_loss": -5.322324752807617, "global_step": 14474, "epoch": 344} {"train_loss": -5.318794250488281, "global_step": 14475, "epoch": 344} {"train_loss": -5.131369113922119, "global_step": 14476, "epoch": 344} {"train_loss": -5.306916236877441, "global_step": 14477, "epoch": 344} {"train_loss": -5.2854108810424805, "global_step": 14478, "epoch": 344} {"train_loss": -5.125454425811768, "global_step": 14479, "epoch": 344} {"train_loss": -5.171573162078857, "global_step": 14480, "epoch": 344} {"train_loss": -5.114310264587402, "global_step": 14481, "epoch": 344} {"train_loss": -5.190546989440918, "global_step": 14482, "epoch": 344} {"train_loss": -5.247264862060547, "global_step": 14483, "epoch": 344} {"train_loss": -5.254679203033447, "global_step": 14484, "epoch": 344} {"train_loss": -5.214724540710449, "global_step": 14485, "epoch": 344} {"train_loss": -5.2430219650268555, "global_step": 14486, "epoch": 344} {"train_loss": -5.01002311706543, "global_step": 14487, "epoch": 344} {"train_loss": -5.052460670471191, "global_step": 14488, "epoch": 344} {"train_loss": -5.1539900075821645, "global_step": 14489, "epoch": 344, "val_loss": 71684.5234375} {"train_loss": -5.163460731506348, "global_step": 14490, "epoch": 345} {"train_loss": -5.292172431945801, "global_step": 14491, "epoch": 345} {"train_loss": -5.151778221130371, "global_step": 14492, "epoch": 345} {"train_loss": -5.284510612487793, "global_step": 14493, "epoch": 345} {"train_loss": -5.089702129364014, "global_step": 14494, "epoch": 345} {"train_loss": -5.21403169631958, "global_step": 14495, "epoch": 345} {"train_loss": -5.156706809997559, "global_step": 14496, "epoch": 345} {"train_loss": -5.249289512634277, "global_step": 14497, "epoch": 345} {"train_loss": -5.168756484985352, "global_step": 14498, "epoch": 345} {"train_loss": -5.243807792663574, "global_step": 14499, "epoch": 345} {"train_loss": -5.324006080627441, "global_step": 14500, "epoch": 345} {"train_loss": -5.180616855621338, "global_step": 14501, "epoch": 345} {"train_loss": -5.3195905685424805, "global_step": 14502, "epoch": 345} {"train_loss": -5.186127662658691, "global_step": 14503, "epoch": 345} {"train_loss": -5.048245429992676, "global_step": 14504, "epoch": 345} {"train_loss": -5.229656219482422, "global_step": 14505, "epoch": 345} {"train_loss": -4.950335502624512, "global_step": 14506, "epoch": 345} {"train_loss": -5.18411922454834, "global_step": 14507, "epoch": 345} {"train_loss": -5.196761131286621, "global_step": 14508, "epoch": 345} {"train_loss": -5.1252970695495605, "global_step": 14509, "epoch": 345} {"train_loss": -5.08975076675415, "global_step": 14510, "epoch": 345} {"train_loss": -5.168373107910156, "global_step": 14511, "epoch": 345} {"train_loss": -4.971180438995361, "global_step": 14512, "epoch": 345} {"train_loss": -5.32243537902832, "global_step": 14513, "epoch": 345} {"train_loss": -5.047104835510254, "global_step": 14514, "epoch": 345} {"train_loss": -5.153669357299805, "global_step": 14515, "epoch": 345} {"train_loss": -5.189133167266846, "global_step": 14516, "epoch": 345} {"train_loss": -5.1722517013549805, "global_step": 14517, "epoch": 345} {"train_loss": -5.282547473907471, "global_step": 14518, "epoch": 345} {"train_loss": -5.278881549835205, "global_step": 14519, "epoch": 345} {"train_loss": -5.084375381469727, "global_step": 14520, "epoch": 345} {"train_loss": -5.115813255310059, "global_step": 14521, "epoch": 345} {"train_loss": -5.137737274169922, "global_step": 14522, "epoch": 345} {"train_loss": -5.284455299377441, "global_step": 14523, "epoch": 345} {"train_loss": -5.041492462158203, "global_step": 14524, "epoch": 345} {"train_loss": -5.217471122741699, "global_step": 14525, "epoch": 345} {"train_loss": -5.223165512084961, "global_step": 14526, "epoch": 345} {"train_loss": -5.032407283782959, "global_step": 14527, "epoch": 345} {"train_loss": -5.321846961975098, "global_step": 14528, "epoch": 345} {"train_loss": -5.051688194274902, "global_step": 14529, "epoch": 345} {"train_loss": -5.110305309295654, "global_step": 14530, "epoch": 345} {"train_loss": -5.174150024141584, "global_step": 14531, "epoch": 345, "val_loss": 72144.84375} {"train_loss": -5.105617523193359, "global_step": 14532, "epoch": 346} {"train_loss": -5.181486129760742, "global_step": 14533, "epoch": 346} {"train_loss": -5.1071648597717285, "global_step": 14534, "epoch": 346} {"train_loss": -5.144367694854736, "global_step": 14535, "epoch": 346} {"train_loss": -5.294302940368652, "global_step": 14536, "epoch": 346} {"train_loss": -5.293376445770264, "global_step": 14537, "epoch": 346} {"train_loss": -5.117883205413818, "global_step": 14538, "epoch": 346} {"train_loss": -5.11533260345459, "global_step": 14539, "epoch": 346} {"train_loss": -5.04961633682251, "global_step": 14540, "epoch": 346} {"train_loss": -5.329586505889893, "global_step": 14541, "epoch": 346} {"train_loss": -5.156541347503662, "global_step": 14542, "epoch": 346} {"train_loss": -5.098453521728516, "global_step": 14543, "epoch": 346} {"train_loss": -5.210529327392578, "global_step": 14544, "epoch": 346} {"train_loss": -5.331507682800293, "global_step": 14545, "epoch": 346} {"train_loss": -5.132266521453857, "global_step": 14546, "epoch": 346} {"train_loss": -5.2137298583984375, "global_step": 14547, "epoch": 346} {"train_loss": -5.165828704833984, "global_step": 14548, "epoch": 346} {"train_loss": -5.194842338562012, "global_step": 14549, "epoch": 346} {"train_loss": -5.219440460205078, "global_step": 14550, "epoch": 346} {"train_loss": -5.295597553253174, "global_step": 14551, "epoch": 346} {"train_loss": -5.149759769439697, "global_step": 14552, "epoch": 346} {"train_loss": -5.234311580657959, "global_step": 14553, "epoch": 346} {"train_loss": -5.150018215179443, "global_step": 14554, "epoch": 346} {"train_loss": -5.0991315841674805, "global_step": 14555, "epoch": 346} {"train_loss": -5.2198872566223145, "global_step": 14556, "epoch": 346} {"train_loss": -5.165839195251465, "global_step": 14557, "epoch": 346} {"train_loss": -5.3423752784729, "global_step": 14558, "epoch": 346} {"train_loss": -5.269283294677734, "global_step": 14559, "epoch": 346} {"train_loss": -5.286757469177246, "global_step": 14560, "epoch": 346} {"train_loss": -5.1550822257995605, "global_step": 14561, "epoch": 346} {"train_loss": -5.192854881286621, "global_step": 14562, "epoch": 346} {"train_loss": -5.296045780181885, "global_step": 14563, "epoch": 346} {"train_loss": -5.177977085113525, "global_step": 14564, "epoch": 346} {"train_loss": -5.122865676879883, "global_step": 14565, "epoch": 346} {"train_loss": -5.189950942993164, "global_step": 14566, "epoch": 346} {"train_loss": -5.299063682556152, "global_step": 14567, "epoch": 346} {"train_loss": -5.112793922424316, "global_step": 14568, "epoch": 346} {"train_loss": -5.220861911773682, "global_step": 14569, "epoch": 346} {"train_loss": -5.251866340637207, "global_step": 14570, "epoch": 346} {"train_loss": -4.978104114532471, "global_step": 14571, "epoch": 346} {"train_loss": -5.122036933898926, "global_step": 14572, "epoch": 346} {"train_loss": -5.18538897378104, "global_step": 14573, "epoch": 346, "val_loss": 72081.3984375} {"train_loss": -5.0805559158325195, "global_step": 14574, "epoch": 347} {"train_loss": -5.280187129974365, "global_step": 14575, "epoch": 347} {"train_loss": -5.252473831176758, "global_step": 14576, "epoch": 347} {"train_loss": -5.085928916931152, "global_step": 14577, "epoch": 347} {"train_loss": -5.006150722503662, "global_step": 14578, "epoch": 347} {"train_loss": -5.268355369567871, "global_step": 14579, "epoch": 347} {"train_loss": -5.167395114898682, "global_step": 14580, "epoch": 347} {"train_loss": -5.240355491638184, "global_step": 14581, "epoch": 347} {"train_loss": -5.094104766845703, "global_step": 14582, "epoch": 347} {"train_loss": -5.147500991821289, "global_step": 14583, "epoch": 347} {"train_loss": -5.267960071563721, "global_step": 14584, "epoch": 347} {"train_loss": -5.046969413757324, "global_step": 14585, "epoch": 347} {"train_loss": -5.264517784118652, "global_step": 14586, "epoch": 347} {"train_loss": -5.180716037750244, "global_step": 14587, "epoch": 347} {"train_loss": -5.152462005615234, "global_step": 14588, "epoch": 347} {"train_loss": -5.121411323547363, "global_step": 14589, "epoch": 347} {"train_loss": -5.212471961975098, "global_step": 14590, "epoch": 347} {"train_loss": -5.176340103149414, "global_step": 14591, "epoch": 347} {"train_loss": -5.155085563659668, "global_step": 14592, "epoch": 347} {"train_loss": -5.133113861083984, "global_step": 14593, "epoch": 347} {"train_loss": -5.28279972076416, "global_step": 14594, "epoch": 347} {"train_loss": -5.2738752365112305, "global_step": 14595, "epoch": 347} {"train_loss": -5.200532913208008, "global_step": 14596, "epoch": 347} {"train_loss": -5.3215837478637695, "global_step": 14597, "epoch": 347} {"train_loss": -5.075499534606934, "global_step": 14598, "epoch": 347} {"train_loss": -5.227208137512207, "global_step": 14599, "epoch": 347} {"train_loss": -5.012364864349365, "global_step": 14600, "epoch": 347} {"train_loss": -5.088818550109863, "global_step": 14601, "epoch": 347} {"train_loss": -5.317207336425781, "global_step": 14602, "epoch": 347} {"train_loss": -5.099978923797607, "global_step": 14603, "epoch": 347} {"train_loss": -5.207265853881836, "global_step": 14604, "epoch": 347} {"train_loss": -5.361539840698242, "global_step": 14605, "epoch": 347} {"train_loss": -5.267384052276611, "global_step": 14606, "epoch": 347} {"train_loss": -5.281673431396484, "global_step": 14607, "epoch": 347} {"train_loss": -5.123719215393066, "global_step": 14608, "epoch": 347} {"train_loss": -5.281787872314453, "global_step": 14609, "epoch": 347} {"train_loss": -5.191329479217529, "global_step": 14610, "epoch": 347} {"train_loss": -5.210939407348633, "global_step": 14611, "epoch": 347} {"train_loss": -5.1514692306518555, "global_step": 14612, "epoch": 347} {"train_loss": -5.269620418548584, "global_step": 14613, "epoch": 347} {"train_loss": -5.291210174560547, "global_step": 14614, "epoch": 347} {"train_loss": -5.194662820725214, "global_step": 14615, "epoch": 347, "val_loss": 72221.9453125} {"train_loss": -5.129067420959473, "global_step": 14616, "epoch": 348} {"train_loss": -5.218774795532227, "global_step": 14617, "epoch": 348} {"train_loss": -5.224277496337891, "global_step": 14618, "epoch": 348} {"train_loss": -5.099345684051514, "global_step": 14619, "epoch": 348} {"train_loss": -5.218305587768555, "global_step": 14620, "epoch": 348} {"train_loss": -5.214448928833008, "global_step": 14621, "epoch": 348} {"train_loss": -5.20627498626709, "global_step": 14622, "epoch": 348} {"train_loss": -5.290632247924805, "global_step": 14623, "epoch": 348} {"train_loss": -5.298445224761963, "global_step": 14624, "epoch": 348} {"train_loss": -5.113377094268799, "global_step": 14625, "epoch": 348} {"train_loss": -5.232346534729004, "global_step": 14626, "epoch": 348} {"train_loss": -5.094328880310059, "global_step": 14627, "epoch": 348} {"train_loss": -5.21829891204834, "global_step": 14628, "epoch": 348} {"train_loss": -5.187612056732178, "global_step": 14629, "epoch": 348} {"train_loss": -5.216722011566162, "global_step": 14630, "epoch": 348} {"train_loss": -5.3186421394348145, "global_step": 14631, "epoch": 348} {"train_loss": -5.160182952880859, "global_step": 14632, "epoch": 348} {"train_loss": -5.297395706176758, "global_step": 14633, "epoch": 348} {"train_loss": -5.292608261108398, "global_step": 14634, "epoch": 348} {"train_loss": -5.2016472816467285, "global_step": 14635, "epoch": 348} {"train_loss": -5.312314033508301, "global_step": 14636, "epoch": 348} {"train_loss": -5.178249359130859, "global_step": 14637, "epoch": 348} {"train_loss": -5.055861949920654, "global_step": 14638, "epoch": 348} {"train_loss": -5.129906177520752, "global_step": 14639, "epoch": 348} {"train_loss": -5.222410678863525, "global_step": 14640, "epoch": 348} {"train_loss": -5.130487442016602, "global_step": 14641, "epoch": 348} {"train_loss": -4.945226669311523, "global_step": 14642, "epoch": 348} {"train_loss": -5.085528373718262, "global_step": 14643, "epoch": 348} {"train_loss": -4.988887310028076, "global_step": 14644, "epoch": 348} {"train_loss": -5.21945858001709, "global_step": 14645, "epoch": 348} {"train_loss": -5.312723159790039, "global_step": 14646, "epoch": 348} {"train_loss": -5.1186933517456055, "global_step": 14647, "epoch": 348} {"train_loss": -5.196798324584961, "global_step": 14648, "epoch": 348} {"train_loss": -5.293028831481934, "global_step": 14649, "epoch": 348} {"train_loss": -5.1514997482299805, "global_step": 14650, "epoch": 348} {"train_loss": -5.057528018951416, "global_step": 14651, "epoch": 348} {"train_loss": -5.096281051635742, "global_step": 14652, "epoch": 348} {"train_loss": -4.99606990814209, "global_step": 14653, "epoch": 348} {"train_loss": -5.230674743652344, "global_step": 14654, "epoch": 348} {"train_loss": -5.007565498352051, "global_step": 14655, "epoch": 348} {"train_loss": -5.271007537841797, "global_step": 14656, "epoch": 348} {"train_loss": -5.174852246329898, "global_step": 14657, "epoch": 348, "val_loss": 72633.171875} {"train_loss": -5.127497673034668, "global_step": 14658, "epoch": 349} {"train_loss": -5.145256519317627, "global_step": 14659, "epoch": 349} {"train_loss": -5.220515251159668, "global_step": 14660, "epoch": 349} {"train_loss": -5.352218151092529, "global_step": 14661, "epoch": 349} {"train_loss": -5.135497093200684, "global_step": 14662, "epoch": 349} {"train_loss": -5.166808128356934, "global_step": 14663, "epoch": 349} {"train_loss": -5.204444885253906, "global_step": 14664, "epoch": 349} {"train_loss": -5.139006614685059, "global_step": 14665, "epoch": 349} {"train_loss": -5.1235785484313965, "global_step": 14666, "epoch": 349} {"train_loss": -5.09199857711792, "global_step": 14667, "epoch": 349} {"train_loss": -5.112113952636719, "global_step": 14668, "epoch": 349} {"train_loss": -5.205076217651367, "global_step": 14669, "epoch": 349} {"train_loss": -5.178020477294922, "global_step": 14670, "epoch": 349} {"train_loss": -5.308947563171387, "global_step": 14671, "epoch": 349} {"train_loss": -5.218149662017822, "global_step": 14672, "epoch": 349} {"train_loss": -5.286075592041016, "global_step": 14673, "epoch": 349} {"train_loss": -5.278398513793945, "global_step": 14674, "epoch": 349} {"train_loss": -5.132857322692871, "global_step": 14675, "epoch": 349} {"train_loss": -5.153372764587402, "global_step": 14676, "epoch": 349} {"train_loss": -5.266222953796387, "global_step": 14677, "epoch": 349} {"train_loss": -5.248237609863281, "global_step": 14678, "epoch": 349} {"train_loss": -5.105964183807373, "global_step": 14679, "epoch": 349} {"train_loss": -5.152580738067627, "global_step": 14680, "epoch": 349} {"train_loss": -5.288149356842041, "global_step": 14681, "epoch": 349} {"train_loss": -5.324131965637207, "global_step": 14682, "epoch": 349} {"train_loss": -5.28748893737793, "global_step": 14683, "epoch": 349} {"train_loss": -5.169038772583008, "global_step": 14684, "epoch": 349} {"train_loss": -5.203766822814941, "global_step": 14685, "epoch": 349} {"train_loss": -5.262912750244141, "global_step": 14686, "epoch": 349} {"train_loss": -5.231748104095459, "global_step": 14687, "epoch": 349} {"train_loss": -5.0280022621154785, "global_step": 14688, "epoch": 349} {"train_loss": -5.145687103271484, "global_step": 14689, "epoch": 349} {"train_loss": -5.034398078918457, "global_step": 14690, "epoch": 349} {"train_loss": -5.183082103729248, "global_step": 14691, "epoch": 349} {"train_loss": -5.213687419891357, "global_step": 14692, "epoch": 349} {"train_loss": -5.303476333618164, "global_step": 14693, "epoch": 349} {"train_loss": -5.337221145629883, "global_step": 14694, "epoch": 349} {"train_loss": -5.276915550231934, "global_step": 14695, "epoch": 349} {"train_loss": -5.268098831176758, "global_step": 14696, "epoch": 349} {"train_loss": -5.221961975097656, "global_step": 14697, "epoch": 349} {"train_loss": -5.27073860168457, "global_step": 14698, "epoch": 349} {"train_loss": -5.206585895447504, "global_step": 14699, "epoch": 349, "val_loss": 71094.828125} {"train_loss": -5.304405212402344, "global_step": 14700, "epoch": 350} {"train_loss": -5.24755859375, "global_step": 14701, "epoch": 350} {"train_loss": -5.166420936584473, "global_step": 14702, "epoch": 350} {"train_loss": -5.226189136505127, "global_step": 14703, "epoch": 350} {"train_loss": -5.234215259552002, "global_step": 14704, "epoch": 350} {"train_loss": -5.171536922454834, "global_step": 14705, "epoch": 350} {"train_loss": -5.162538528442383, "global_step": 14706, "epoch": 350} {"train_loss": -5.144566059112549, "global_step": 14707, "epoch": 350} {"train_loss": -5.2050933837890625, "global_step": 14708, "epoch": 350} {"train_loss": -5.21337890625, "global_step": 14709, "epoch": 350} {"train_loss": -5.157797813415527, "global_step": 14710, "epoch": 350} {"train_loss": -5.193021297454834, "global_step": 14711, "epoch": 350} {"train_loss": -5.161962509155273, "global_step": 14712, "epoch": 350} {"train_loss": -5.0714874267578125, "global_step": 14713, "epoch": 350} {"train_loss": -5.384912490844727, "global_step": 14714, "epoch": 350} {"train_loss": -5.0403337478637695, "global_step": 14715, "epoch": 350} {"train_loss": -5.1471357345581055, "global_step": 14716, "epoch": 350} {"train_loss": -5.0261359214782715, "global_step": 14717, "epoch": 350} {"train_loss": -5.1588544845581055, "global_step": 14718, "epoch": 350} {"train_loss": -4.9322991371154785, "global_step": 14719, "epoch": 350} {"train_loss": -5.10422420501709, "global_step": 14720, "epoch": 350} {"train_loss": -5.056395053863525, "global_step": 14721, "epoch": 350} {"train_loss": -5.116010665893555, "global_step": 14722, "epoch": 350} {"train_loss": -5.114470481872559, "global_step": 14723, "epoch": 350} {"train_loss": -5.065555095672607, "global_step": 14724, "epoch": 350} {"train_loss": -5.210986137390137, "global_step": 14725, "epoch": 350} {"train_loss": -5.202273845672607, "global_step": 14726, "epoch": 350} {"train_loss": -5.086694717407227, "global_step": 14727, "epoch": 350} {"train_loss": -5.284486770629883, "global_step": 14728, "epoch": 350} {"train_loss": -5.262849807739258, "global_step": 14729, "epoch": 350} {"train_loss": -5.115657806396484, "global_step": 14730, "epoch": 350} {"train_loss": -5.16981840133667, "global_step": 14731, "epoch": 350} {"train_loss": -5.239760398864746, "global_step": 14732, "epoch": 350} {"train_loss": -5.208955764770508, "global_step": 14733, "epoch": 350} {"train_loss": -5.280251502990723, "global_step": 14734, "epoch": 350} {"train_loss": -5.361806869506836, "global_step": 14735, "epoch": 350} {"train_loss": -5.262809753417969, "global_step": 14736, "epoch": 350} {"train_loss": -5.127438545227051, "global_step": 14737, "epoch": 350} {"train_loss": -5.019786834716797, "global_step": 14738, "epoch": 350} {"train_loss": -5.271581649780273, "global_step": 14739, "epoch": 350} {"train_loss": -5.189886569976807, "global_step": 14740, "epoch": 350} {"train_loss": -5.173626956485567, "global_step": 14741, "epoch": 350, "train/sim_max_reward_0": 0.4221327418207509, "train/sim_max_reward_1": 0.4229549398632371, "train/sim_max_reward_2": 0.30035204286874956, "train/sim_max_reward_3": 0.13553606801148152, "train/sim_max_reward_4": 0.2725826998546899, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.16560437581847667, "test/sim_max_reward_4400001": 0.2733612298387847, "test/sim_max_reward_4400002": 0.24494637115457166, "test/sim_max_reward_4400003": 0.07170972924600626, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.024096306002191852, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3668855308070418, "test/sim_max_reward_4400009": 0.14036245551027735, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.3240747998499712, "test/sim_max_reward_4400012": 0.3714125683722688, "test/sim_max_reward_4400013": 0.05569209882391426, "test/sim_max_reward_4400014": 0.0045659072126957466, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2942798284794546, "test/sim_max_reward_4400019": 0.1967216768225202, "test/sim_max_reward_4400020": 0.05481353906579601, "test/sim_max_reward_4400021": 0.31929266138829165, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.17241811599301182, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.25858849715145543, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.03590942299450747, "test/sim_max_reward_4400028": 0.30333926170141123, "test/sim_max_reward_4400029": 0.40318619772990827, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 1.2890978942579066e-05, "test/sim_max_reward_4400032": 0.03474331964153611, "test/sim_max_reward_4400033": 0.12846186628297035, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.5969995676797784, "test/sim_max_reward_4400036": 0.3474359626294164, "test/sim_max_reward_4400037": 0.18534688875145539, "test/sim_max_reward_4400038": 0.35238695745466075, "test/sim_max_reward_4400039": 0.5033354934264404, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.4516520965998646, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.04991221647237323, "test/sim_max_reward_4400045": 0.2641905317016767, "test/sim_max_reward_4400046": 0.21715812438355547, "test/sim_max_reward_4400047": 0.1830305180757342, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.2910905419635161, "test/mean_score": 0.1590303430241674, "val_loss": 71786.5859375} {"train_loss": -5.137570381164551, "global_step": 14742, "epoch": 351} {"train_loss": -5.192267417907715, "global_step": 14743, "epoch": 351} {"train_loss": -5.297345161437988, "global_step": 14744, "epoch": 351} {"train_loss": -5.044658184051514, "global_step": 14745, "epoch": 351} {"train_loss": -5.216556072235107, "global_step": 14746, "epoch": 351} {"train_loss": -5.294465065002441, "global_step": 14747, "epoch": 351} {"train_loss": -5.202958106994629, "global_step": 14748, "epoch": 351} {"train_loss": -5.098022937774658, "global_step": 14749, "epoch": 351} {"train_loss": -5.143177509307861, "global_step": 14750, "epoch": 351} {"train_loss": -5.301011085510254, "global_step": 14751, "epoch": 351} {"train_loss": -5.124263286590576, "global_step": 14752, "epoch": 351} {"train_loss": -5.048913478851318, "global_step": 14753, "epoch": 351} {"train_loss": -5.261200904846191, "global_step": 14754, "epoch": 351} {"train_loss": -5.101247310638428, "global_step": 14755, "epoch": 351} {"train_loss": -5.155431270599365, "global_step": 14756, "epoch": 351} {"train_loss": -5.098852157592773, "global_step": 14757, "epoch": 351} {"train_loss": -5.308138370513916, "global_step": 14758, "epoch": 351} {"train_loss": -5.272283554077148, "global_step": 14759, "epoch": 351} {"train_loss": -5.0941667556762695, "global_step": 14760, "epoch": 351} {"train_loss": -5.201498985290527, "global_step": 14761, "epoch": 351} {"train_loss": -5.282357692718506, "global_step": 14762, "epoch": 351} {"train_loss": -5.179039478302002, "global_step": 14763, "epoch": 351} {"train_loss": -5.247930526733398, "global_step": 14764, "epoch": 351} {"train_loss": -5.138554096221924, "global_step": 14765, "epoch": 351} {"train_loss": -5.178081512451172, "global_step": 14766, "epoch": 351} {"train_loss": -5.177426338195801, "global_step": 14767, "epoch": 351} {"train_loss": -5.210683822631836, "global_step": 14768, "epoch": 351} {"train_loss": -5.21047306060791, "global_step": 14769, "epoch": 351} {"train_loss": -5.156162261962891, "global_step": 14770, "epoch": 351} {"train_loss": -5.2559404373168945, "global_step": 14771, "epoch": 351} {"train_loss": -5.194425106048584, "global_step": 14772, "epoch": 351} {"train_loss": -5.249969482421875, "global_step": 14773, "epoch": 351} {"train_loss": -5.203157901763916, "global_step": 14774, "epoch": 351} {"train_loss": -5.187429428100586, "global_step": 14775, "epoch": 351} {"train_loss": -5.037971019744873, "global_step": 14776, "epoch": 351} {"train_loss": -5.142330169677734, "global_step": 14777, "epoch": 351} {"train_loss": -5.207036018371582, "global_step": 14778, "epoch": 351} {"train_loss": -5.251510143280029, "global_step": 14779, "epoch": 351} {"train_loss": -5.227800369262695, "global_step": 14780, "epoch": 351} {"train_loss": -5.2737884521484375, "global_step": 14781, "epoch": 351} {"train_loss": -5.110740661621094, "global_step": 14782, "epoch": 351} {"train_loss": -5.189862001509893, "global_step": 14783, "epoch": 351, "val_loss": 71831.1640625} {"train_loss": -5.267441272735596, "global_step": 14784, "epoch": 352} {"train_loss": -5.148139953613281, "global_step": 14785, "epoch": 352} {"train_loss": -5.104195594787598, "global_step": 14786, "epoch": 352} {"train_loss": -5.2289276123046875, "global_step": 14787, "epoch": 352} {"train_loss": -5.121163368225098, "global_step": 14788, "epoch": 352} {"train_loss": -5.211999416351318, "global_step": 14789, "epoch": 352} {"train_loss": -5.136096000671387, "global_step": 14790, "epoch": 352} {"train_loss": -5.177186965942383, "global_step": 14791, "epoch": 352} {"train_loss": -5.167436599731445, "global_step": 14792, "epoch": 352} {"train_loss": -5.262240409851074, "global_step": 14793, "epoch": 352} {"train_loss": -5.118863105773926, "global_step": 14794, "epoch": 352} {"train_loss": -5.296313285827637, "global_step": 14795, "epoch": 352} {"train_loss": -5.155219554901123, "global_step": 14796, "epoch": 352} {"train_loss": -5.1724534034729, "global_step": 14797, "epoch": 352} {"train_loss": -5.242775917053223, "global_step": 14798, "epoch": 352} {"train_loss": -5.175570487976074, "global_step": 14799, "epoch": 352} {"train_loss": -5.26743745803833, "global_step": 14800, "epoch": 352} {"train_loss": -5.0779924392700195, "global_step": 14801, "epoch": 352} {"train_loss": -5.1125874519348145, "global_step": 14802, "epoch": 352} {"train_loss": -5.184793472290039, "global_step": 14803, "epoch": 352} {"train_loss": -5.093539237976074, "global_step": 14804, "epoch": 352} {"train_loss": -5.071493625640869, "global_step": 14805, "epoch": 352} {"train_loss": -5.257648468017578, "global_step": 14806, "epoch": 352} {"train_loss": -5.127613544464111, "global_step": 14807, "epoch": 352} {"train_loss": -5.277529239654541, "global_step": 14808, "epoch": 352} {"train_loss": -5.135741233825684, "global_step": 14809, "epoch": 352} {"train_loss": -5.291919708251953, "global_step": 14810, "epoch": 352} {"train_loss": -5.374429702758789, "global_step": 14811, "epoch": 352} {"train_loss": -5.285691261291504, "global_step": 14812, "epoch": 352} {"train_loss": -5.17850923538208, "global_step": 14813, "epoch": 352} {"train_loss": -5.162024974822998, "global_step": 14814, "epoch": 352} {"train_loss": -5.150577068328857, "global_step": 14815, "epoch": 352} {"train_loss": -5.057760238647461, "global_step": 14816, "epoch": 352} {"train_loss": -5.213337421417236, "global_step": 14817, "epoch": 352} {"train_loss": -5.098256587982178, "global_step": 14818, "epoch": 352} {"train_loss": -5.11622953414917, "global_step": 14819, "epoch": 352} {"train_loss": -5.3022074699401855, "global_step": 14820, "epoch": 352} {"train_loss": -5.212695121765137, "global_step": 14821, "epoch": 352} {"train_loss": -5.086942195892334, "global_step": 14822, "epoch": 352} {"train_loss": -5.444659233093262, "global_step": 14823, "epoch": 352} {"train_loss": -5.205136775970459, "global_step": 14824, "epoch": 352} {"train_loss": -5.1842785108657115, "global_step": 14825, "epoch": 352, "val_loss": 71695.796875} {"train_loss": -5.164112091064453, "global_step": 14826, "epoch": 353} {"train_loss": -5.165816307067871, "global_step": 14827, "epoch": 353} {"train_loss": -5.187854766845703, "global_step": 14828, "epoch": 353} {"train_loss": -5.103185653686523, "global_step": 14829, "epoch": 353} {"train_loss": -5.138328552246094, "global_step": 14830, "epoch": 353} {"train_loss": -5.37986946105957, "global_step": 14831, "epoch": 353} {"train_loss": -5.2880048751831055, "global_step": 14832, "epoch": 353} {"train_loss": -5.263584136962891, "global_step": 14833, "epoch": 353} {"train_loss": -5.241024017333984, "global_step": 14834, "epoch": 353} {"train_loss": -5.3477935791015625, "global_step": 14835, "epoch": 353} {"train_loss": -5.158871650695801, "global_step": 14836, "epoch": 353} {"train_loss": -5.280029296875, "global_step": 14837, "epoch": 353} {"train_loss": -5.127991199493408, "global_step": 14838, "epoch": 353} {"train_loss": -5.134296417236328, "global_step": 14839, "epoch": 353} {"train_loss": -5.173567771911621, "global_step": 14840, "epoch": 353} {"train_loss": -5.276876449584961, "global_step": 14841, "epoch": 353} {"train_loss": -5.179378032684326, "global_step": 14842, "epoch": 353} {"train_loss": -5.27567195892334, "global_step": 14843, "epoch": 353} {"train_loss": -5.233996868133545, "global_step": 14844, "epoch": 353} {"train_loss": -5.200898170471191, "global_step": 14845, "epoch": 353} {"train_loss": -5.095043182373047, "global_step": 14846, "epoch": 353} {"train_loss": -5.338491439819336, "global_step": 14847, "epoch": 353} {"train_loss": -5.17887020111084, "global_step": 14848, "epoch": 353} {"train_loss": -5.136688232421875, "global_step": 14849, "epoch": 353} {"train_loss": -5.301205158233643, "global_step": 14850, "epoch": 353} {"train_loss": -5.093307018280029, "global_step": 14851, "epoch": 353} {"train_loss": -5.290556907653809, "global_step": 14852, "epoch": 353} {"train_loss": -5.259640693664551, "global_step": 14853, "epoch": 353} {"train_loss": -5.175571441650391, "global_step": 14854, "epoch": 353} {"train_loss": -5.203254699707031, "global_step": 14855, "epoch": 353} {"train_loss": -5.271504878997803, "global_step": 14856, "epoch": 353} {"train_loss": -5.224764823913574, "global_step": 14857, "epoch": 353} {"train_loss": -5.210164546966553, "global_step": 14858, "epoch": 353} {"train_loss": -5.261286735534668, "global_step": 14859, "epoch": 353} {"train_loss": -5.284716606140137, "global_step": 14860, "epoch": 353} {"train_loss": -5.0136823654174805, "global_step": 14861, "epoch": 353} {"train_loss": -5.283538341522217, "global_step": 14862, "epoch": 353} {"train_loss": -5.286861896514893, "global_step": 14863, "epoch": 353} {"train_loss": -5.257888317108154, "global_step": 14864, "epoch": 353} {"train_loss": -5.1892571449279785, "global_step": 14865, "epoch": 353} {"train_loss": -5.315783500671387, "global_step": 14866, "epoch": 353} {"train_loss": -5.2143409706297374, "global_step": 14867, "epoch": 353, "val_loss": 72939.3828125} {"train_loss": -5.210156440734863, "global_step": 14868, "epoch": 354} {"train_loss": -5.241418838500977, "global_step": 14869, "epoch": 354} {"train_loss": -5.027185440063477, "global_step": 14870, "epoch": 354} {"train_loss": -4.960549354553223, "global_step": 14871, "epoch": 354} {"train_loss": -5.1132965087890625, "global_step": 14872, "epoch": 354} {"train_loss": -5.232232093811035, "global_step": 14873, "epoch": 354} {"train_loss": -5.1266069412231445, "global_step": 14874, "epoch": 354} {"train_loss": -5.29329776763916, "global_step": 14875, "epoch": 354} {"train_loss": -5.079439640045166, "global_step": 14876, "epoch": 354} {"train_loss": -5.102459907531738, "global_step": 14877, "epoch": 354} {"train_loss": -5.235212326049805, "global_step": 14878, "epoch": 354} {"train_loss": -5.062748908996582, "global_step": 14879, "epoch": 354} {"train_loss": -4.957185745239258, "global_step": 14880, "epoch": 354} {"train_loss": -5.037143707275391, "global_step": 14881, "epoch": 354} {"train_loss": -5.260135173797607, "global_step": 14882, "epoch": 354} {"train_loss": -5.261226654052734, "global_step": 14883, "epoch": 354} {"train_loss": -5.220827579498291, "global_step": 14884, "epoch": 354} {"train_loss": -5.2271318435668945, "global_step": 14885, "epoch": 354} {"train_loss": -5.339134693145752, "global_step": 14886, "epoch": 354} {"train_loss": -5.297208309173584, "global_step": 14887, "epoch": 354} {"train_loss": -5.191662788391113, "global_step": 14888, "epoch": 354} {"train_loss": -5.125499248504639, "global_step": 14889, "epoch": 354} {"train_loss": -5.213902473449707, "global_step": 14890, "epoch": 354} {"train_loss": -5.169770240783691, "global_step": 14891, "epoch": 354} {"train_loss": -5.319944381713867, "global_step": 14892, "epoch": 354} {"train_loss": -5.231748104095459, "global_step": 14893, "epoch": 354} {"train_loss": -5.065454483032227, "global_step": 14894, "epoch": 354} {"train_loss": -5.185863971710205, "global_step": 14895, "epoch": 354} {"train_loss": -5.082729339599609, "global_step": 14896, "epoch": 354} {"train_loss": -5.062701225280762, "global_step": 14897, "epoch": 354} {"train_loss": -5.1259307861328125, "global_step": 14898, "epoch": 354} {"train_loss": -4.972872734069824, "global_step": 14899, "epoch": 354} {"train_loss": -5.185844421386719, "global_step": 14900, "epoch": 354} {"train_loss": -4.935715675354004, "global_step": 14901, "epoch": 354} {"train_loss": -5.318912982940674, "global_step": 14902, "epoch": 354} {"train_loss": -5.104389667510986, "global_step": 14903, "epoch": 354} {"train_loss": -5.392341613769531, "global_step": 14904, "epoch": 354} {"train_loss": -5.2015228271484375, "global_step": 14905, "epoch": 354} {"train_loss": -5.137231826782227, "global_step": 14906, "epoch": 354} {"train_loss": -5.284370422363281, "global_step": 14907, "epoch": 354} {"train_loss": -5.211555004119873, "global_step": 14908, "epoch": 354} {"train_loss": -5.166703962144398, "global_step": 14909, "epoch": 354, "val_loss": 71786.65625} {"train_loss": -5.192850589752197, "global_step": 14910, "epoch": 355} {"train_loss": -5.1603875160217285, "global_step": 14911, "epoch": 355} {"train_loss": -5.312290668487549, "global_step": 14912, "epoch": 355} {"train_loss": -5.204843521118164, "global_step": 14913, "epoch": 355} {"train_loss": -5.123723030090332, "global_step": 14914, "epoch": 355} {"train_loss": -5.227450847625732, "global_step": 14915, "epoch": 355} {"train_loss": -5.109472274780273, "global_step": 14916, "epoch": 355} {"train_loss": -5.095617294311523, "global_step": 14917, "epoch": 355} {"train_loss": -5.232140064239502, "global_step": 14918, "epoch": 355} {"train_loss": -5.1028547286987305, "global_step": 14919, "epoch": 355} {"train_loss": -5.185373306274414, "global_step": 14920, "epoch": 355} {"train_loss": -5.255870819091797, "global_step": 14921, "epoch": 355} {"train_loss": -5.01895809173584, "global_step": 14922, "epoch": 355} {"train_loss": -5.119162559509277, "global_step": 14923, "epoch": 355} {"train_loss": -5.210824012756348, "global_step": 14924, "epoch": 355} {"train_loss": -5.156311511993408, "global_step": 14925, "epoch": 355} {"train_loss": -5.2685747146606445, "global_step": 14926, "epoch": 355} {"train_loss": -5.129914283752441, "global_step": 14927, "epoch": 355} {"train_loss": -5.140099048614502, "global_step": 14928, "epoch": 355} {"train_loss": -5.101016521453857, "global_step": 14929, "epoch": 355} {"train_loss": -5.1512908935546875, "global_step": 14930, "epoch": 355} {"train_loss": -5.211041450500488, "global_step": 14931, "epoch": 355} {"train_loss": -5.240352153778076, "global_step": 14932, "epoch": 355} {"train_loss": -5.16427755355835, "global_step": 14933, "epoch": 355} {"train_loss": -5.2398529052734375, "global_step": 14934, "epoch": 355} {"train_loss": -5.41172981262207, "global_step": 14935, "epoch": 355} {"train_loss": -4.991131782531738, "global_step": 14936, "epoch": 355} {"train_loss": -5.2455220222473145, "global_step": 14937, "epoch": 355} {"train_loss": -5.159765720367432, "global_step": 14938, "epoch": 355} {"train_loss": -5.09843635559082, "global_step": 14939, "epoch": 355} {"train_loss": -5.205843448638916, "global_step": 14940, "epoch": 355} {"train_loss": -5.037362575531006, "global_step": 14941, "epoch": 355} {"train_loss": -5.254837512969971, "global_step": 14942, "epoch": 355} {"train_loss": -5.136190414428711, "global_step": 14943, "epoch": 355} {"train_loss": -5.171301364898682, "global_step": 14944, "epoch": 355} {"train_loss": -5.209662437438965, "global_step": 14945, "epoch": 355} {"train_loss": -5.104745864868164, "global_step": 14946, "epoch": 355} {"train_loss": -5.168532848358154, "global_step": 14947, "epoch": 355} {"train_loss": -5.159150123596191, "global_step": 14948, "epoch": 355} {"train_loss": -5.241941452026367, "global_step": 14949, "epoch": 355} {"train_loss": -5.313567638397217, "global_step": 14950, "epoch": 355} {"train_loss": -5.173110995973859, "global_step": 14951, "epoch": 355, "val_loss": 71241.046875} {"train_loss": -5.08562707901001, "global_step": 14952, "epoch": 356} {"train_loss": -5.3072381019592285, "global_step": 14953, "epoch": 356} {"train_loss": -5.310700416564941, "global_step": 14954, "epoch": 356} {"train_loss": -5.257256031036377, "global_step": 14955, "epoch": 356} {"train_loss": -5.286219596862793, "global_step": 14956, "epoch": 356} {"train_loss": -5.14501953125, "global_step": 14957, "epoch": 356} {"train_loss": -5.239603042602539, "global_step": 14958, "epoch": 356} {"train_loss": -5.183061599731445, "global_step": 14959, "epoch": 356} {"train_loss": -5.188570976257324, "global_step": 14960, "epoch": 356} {"train_loss": -5.252495765686035, "global_step": 14961, "epoch": 356} {"train_loss": -5.173361778259277, "global_step": 14962, "epoch": 356} {"train_loss": -5.1798601150512695, "global_step": 14963, "epoch": 356} {"train_loss": -5.213894844055176, "global_step": 14964, "epoch": 356} {"train_loss": -5.145072937011719, "global_step": 14965, "epoch": 356} {"train_loss": -5.15078067779541, "global_step": 14966, "epoch": 356} {"train_loss": -5.2362060546875, "global_step": 14967, "epoch": 356} {"train_loss": -5.119421005249023, "global_step": 14968, "epoch": 356} {"train_loss": -5.226981163024902, "global_step": 14969, "epoch": 356} {"train_loss": -5.381311893463135, "global_step": 14970, "epoch": 356} {"train_loss": -5.226869583129883, "global_step": 14971, "epoch": 356} {"train_loss": -5.354698657989502, "global_step": 14972, "epoch": 356} {"train_loss": -5.297852516174316, "global_step": 14973, "epoch": 356} {"train_loss": -5.42495584487915, "global_step": 14974, "epoch": 356} {"train_loss": -5.063269138336182, "global_step": 14975, "epoch": 356} {"train_loss": -5.138874053955078, "global_step": 14976, "epoch": 356} {"train_loss": -5.260912895202637, "global_step": 14977, "epoch": 356} {"train_loss": -5.198520660400391, "global_step": 14978, "epoch": 356} {"train_loss": -5.281858921051025, "global_step": 14979, "epoch": 356} {"train_loss": -5.123094081878662, "global_step": 14980, "epoch": 356} {"train_loss": -5.2678680419921875, "global_step": 14981, "epoch": 356} {"train_loss": -5.092306137084961, "global_step": 14982, "epoch": 356} {"train_loss": -5.31496524810791, "global_step": 14983, "epoch": 356} {"train_loss": -5.231800079345703, "global_step": 14984, "epoch": 356} {"train_loss": -5.258279800415039, "global_step": 14985, "epoch": 356} {"train_loss": -5.280431747436523, "global_step": 14986, "epoch": 356} {"train_loss": -5.146903038024902, "global_step": 14987, "epoch": 356} {"train_loss": -5.188564300537109, "global_step": 14988, "epoch": 356} {"train_loss": -5.300724983215332, "global_step": 14989, "epoch": 356} {"train_loss": -5.280974864959717, "global_step": 14990, "epoch": 356} {"train_loss": -5.2392706871032715, "global_step": 14991, "epoch": 356} {"train_loss": -5.1911396980285645, "global_step": 14992, "epoch": 356} {"train_loss": -5.225452968052456, "global_step": 14993, "epoch": 356, "val_loss": 72119.265625} {"train_loss": -5.120409965515137, "global_step": 14994, "epoch": 357} {"train_loss": -5.233063697814941, "global_step": 14995, "epoch": 357} {"train_loss": -5.140965461730957, "global_step": 14996, "epoch": 357} {"train_loss": -5.275121688842773, "global_step": 14997, "epoch": 357} {"train_loss": -5.240482330322266, "global_step": 14998, "epoch": 357} {"train_loss": -5.226879119873047, "global_step": 14999, "epoch": 357} {"train_loss": -5.1393280029296875, "global_step": 15000, "epoch": 357} {"train_loss": -5.317774295806885, "global_step": 15001, "epoch": 357} {"train_loss": -5.328487396240234, "global_step": 15002, "epoch": 357} {"train_loss": -5.104087829589844, "global_step": 15003, "epoch": 357} {"train_loss": -5.186481952667236, "global_step": 15004, "epoch": 357} {"train_loss": -5.3492021560668945, "global_step": 15005, "epoch": 357} {"train_loss": -5.18009614944458, "global_step": 15006, "epoch": 357} {"train_loss": -5.283102989196777, "global_step": 15007, "epoch": 357} {"train_loss": -5.311767578125, "global_step": 15008, "epoch": 357} {"train_loss": -5.133356094360352, "global_step": 15009, "epoch": 357} {"train_loss": -5.24712610244751, "global_step": 15010, "epoch": 357} {"train_loss": -5.069359302520752, "global_step": 15011, "epoch": 357} {"train_loss": -5.232442855834961, "global_step": 15012, "epoch": 357} {"train_loss": -5.192890644073486, "global_step": 15013, "epoch": 357} {"train_loss": -5.212279796600342, "global_step": 15014, "epoch": 357} {"train_loss": -5.216668128967285, "global_step": 15015, "epoch": 357} {"train_loss": -5.233871936798096, "global_step": 15016, "epoch": 357} {"train_loss": -5.233005523681641, "global_step": 15017, "epoch": 357} {"train_loss": -5.150336265563965, "global_step": 15018, "epoch": 357} {"train_loss": -5.207953929901123, "global_step": 15019, "epoch": 357} {"train_loss": -5.315265655517578, "global_step": 15020, "epoch": 357} {"train_loss": -5.179877758026123, "global_step": 15021, "epoch": 357} {"train_loss": -5.183967113494873, "global_step": 15022, "epoch": 357} {"train_loss": -5.148544788360596, "global_step": 15023, "epoch": 357} {"train_loss": -5.246486663818359, "global_step": 15024, "epoch": 357} {"train_loss": -5.232600212097168, "global_step": 15025, "epoch": 357} {"train_loss": -5.338279724121094, "global_step": 15026, "epoch": 357} {"train_loss": -5.167509078979492, "global_step": 15027, "epoch": 357} {"train_loss": -5.283886909484863, "global_step": 15028, "epoch": 357} {"train_loss": -5.27619743347168, "global_step": 15029, "epoch": 357} {"train_loss": -5.235683917999268, "global_step": 15030, "epoch": 357} {"train_loss": -5.249528884887695, "global_step": 15031, "epoch": 357} {"train_loss": -5.333434104919434, "global_step": 15032, "epoch": 357} {"train_loss": -5.258694648742676, "global_step": 15033, "epoch": 357} {"train_loss": -5.116148471832275, "global_step": 15034, "epoch": 357} {"train_loss": -5.221404927117484, "global_step": 15035, "epoch": 357, "val_loss": 71686.7578125} {"train_loss": -5.388152122497559, "global_step": 15036, "epoch": 358} {"train_loss": -5.241846561431885, "global_step": 15037, "epoch": 358} {"train_loss": -5.204792499542236, "global_step": 15038, "epoch": 358} {"train_loss": -5.284564018249512, "global_step": 15039, "epoch": 358} {"train_loss": -5.112500190734863, "global_step": 15040, "epoch": 358} {"train_loss": -5.2939958572387695, "global_step": 15041, "epoch": 358} {"train_loss": -5.027937412261963, "global_step": 15042, "epoch": 358} {"train_loss": -5.214663505554199, "global_step": 15043, "epoch": 358} {"train_loss": -5.225029468536377, "global_step": 15044, "epoch": 358} {"train_loss": -5.212274551391602, "global_step": 15045, "epoch": 358} {"train_loss": -5.072695255279541, "global_step": 15046, "epoch": 358} {"train_loss": -5.214914321899414, "global_step": 15047, "epoch": 358} {"train_loss": -5.148415565490723, "global_step": 15048, "epoch": 358} {"train_loss": -5.071943283081055, "global_step": 15049, "epoch": 358} {"train_loss": -5.066742420196533, "global_step": 15050, "epoch": 358} {"train_loss": -5.160574436187744, "global_step": 15051, "epoch": 358} {"train_loss": -5.090366363525391, "global_step": 15052, "epoch": 358} {"train_loss": -5.279026031494141, "global_step": 15053, "epoch": 358} {"train_loss": -5.066857814788818, "global_step": 15054, "epoch": 358} {"train_loss": -5.188520908355713, "global_step": 15055, "epoch": 358} {"train_loss": -5.112537860870361, "global_step": 15056, "epoch": 358} {"train_loss": -5.2444987297058105, "global_step": 15057, "epoch": 358} {"train_loss": -5.109784126281738, "global_step": 15058, "epoch": 358} {"train_loss": -5.199666976928711, "global_step": 15059, "epoch": 358} {"train_loss": -5.229352951049805, "global_step": 15060, "epoch": 358} {"train_loss": -5.082458972930908, "global_step": 15061, "epoch": 358} {"train_loss": -5.323007583618164, "global_step": 15062, "epoch": 358} {"train_loss": -5.254678726196289, "global_step": 15063, "epoch": 358} {"train_loss": -5.297576904296875, "global_step": 15064, "epoch": 358} {"train_loss": -5.297129154205322, "global_step": 15065, "epoch": 358} {"train_loss": -5.2350335121154785, "global_step": 15066, "epoch": 358} {"train_loss": -5.25986909866333, "global_step": 15067, "epoch": 358} {"train_loss": -5.325445175170898, "global_step": 15068, "epoch": 358} {"train_loss": -5.2085418701171875, "global_step": 15069, "epoch": 358} {"train_loss": -5.189556121826172, "global_step": 15070, "epoch": 358} {"train_loss": -5.277095794677734, "global_step": 15071, "epoch": 358} {"train_loss": -5.233661651611328, "global_step": 15072, "epoch": 358} {"train_loss": -5.160733222961426, "global_step": 15073, "epoch": 358} {"train_loss": -5.265012264251709, "global_step": 15074, "epoch": 358} {"train_loss": -5.307839393615723, "global_step": 15075, "epoch": 358} {"train_loss": -5.110939025878906, "global_step": 15076, "epoch": 358} {"train_loss": -5.203131153469994, "global_step": 15077, "epoch": 358, "val_loss": 71364.265625} {"train_loss": -5.25957727432251, "global_step": 15078, "epoch": 359} {"train_loss": -5.10753059387207, "global_step": 15079, "epoch": 359} {"train_loss": -5.049263000488281, "global_step": 15080, "epoch": 359} {"train_loss": -5.197916030883789, "global_step": 15081, "epoch": 359} {"train_loss": -5.184569358825684, "global_step": 15082, "epoch": 359} {"train_loss": -5.150090217590332, "global_step": 15083, "epoch": 359} {"train_loss": -5.246044158935547, "global_step": 15084, "epoch": 359} {"train_loss": -5.178018093109131, "global_step": 15085, "epoch": 359} {"train_loss": -5.154091835021973, "global_step": 15086, "epoch": 359} {"train_loss": -5.157232284545898, "global_step": 15087, "epoch": 359} {"train_loss": -5.200742244720459, "global_step": 15088, "epoch": 359} {"train_loss": -5.274587631225586, "global_step": 15089, "epoch": 359} {"train_loss": -5.3343939781188965, "global_step": 15090, "epoch": 359} {"train_loss": -5.29611873626709, "global_step": 15091, "epoch": 359} {"train_loss": -5.227783203125, "global_step": 15092, "epoch": 359} {"train_loss": -5.168295860290527, "global_step": 15093, "epoch": 359} {"train_loss": -5.159157752990723, "global_step": 15094, "epoch": 359} {"train_loss": -5.2058916091918945, "global_step": 15095, "epoch": 359} {"train_loss": -5.367813587188721, "global_step": 15096, "epoch": 359} {"train_loss": -5.27862024307251, "global_step": 15097, "epoch": 359} {"train_loss": -5.133174896240234, "global_step": 15098, "epoch": 359} {"train_loss": -5.331610679626465, "global_step": 15099, "epoch": 359} {"train_loss": -5.200620651245117, "global_step": 15100, "epoch": 359} {"train_loss": -5.117979049682617, "global_step": 15101, "epoch": 359} {"train_loss": -5.0579447746276855, "global_step": 15102, "epoch": 359} {"train_loss": -5.211852550506592, "global_step": 15103, "epoch": 359} {"train_loss": -5.13199520111084, "global_step": 15104, "epoch": 359} {"train_loss": -5.248004913330078, "global_step": 15105, "epoch": 359} {"train_loss": -5.130244255065918, "global_step": 15106, "epoch": 359} {"train_loss": -5.3016357421875, "global_step": 15107, "epoch": 359} {"train_loss": -5.34036111831665, "global_step": 15108, "epoch": 359} {"train_loss": -5.236577033996582, "global_step": 15109, "epoch": 359} {"train_loss": -5.234236240386963, "global_step": 15110, "epoch": 359} {"train_loss": -5.099143981933594, "global_step": 15111, "epoch": 359} {"train_loss": -5.270930290222168, "global_step": 15112, "epoch": 359} {"train_loss": -5.2252912521362305, "global_step": 15113, "epoch": 359} {"train_loss": -5.4091105461120605, "global_step": 15114, "epoch": 359} {"train_loss": -5.070655822753906, "global_step": 15115, "epoch": 359} {"train_loss": -5.253121376037598, "global_step": 15116, "epoch": 359} {"train_loss": -5.21224308013916, "global_step": 15117, "epoch": 359} {"train_loss": -5.249207496643066, "global_step": 15118, "epoch": 359} {"train_loss": -5.209459293456304, "global_step": 15119, "epoch": 359, "val_loss": 71012.2421875} {"train_loss": -5.1379499435424805, "global_step": 15120, "epoch": 360} {"train_loss": -5.295675754547119, "global_step": 15121, "epoch": 360} {"train_loss": -5.208057403564453, "global_step": 15122, "epoch": 360} {"train_loss": -5.383025169372559, "global_step": 15123, "epoch": 360} {"train_loss": -5.185132026672363, "global_step": 15124, "epoch": 360} {"train_loss": -5.133836269378662, "global_step": 15125, "epoch": 360} {"train_loss": -5.21382999420166, "global_step": 15126, "epoch": 360} {"train_loss": -5.175127983093262, "global_step": 15127, "epoch": 360} {"train_loss": -5.315006256103516, "global_step": 15128, "epoch": 360} {"train_loss": -5.313043594360352, "global_step": 15129, "epoch": 360} {"train_loss": -5.264767169952393, "global_step": 15130, "epoch": 360} {"train_loss": -5.374979019165039, "global_step": 15131, "epoch": 360} {"train_loss": -5.1998677253723145, "global_step": 15132, "epoch": 360} {"train_loss": -5.22890567779541, "global_step": 15133, "epoch": 360} {"train_loss": -5.094244956970215, "global_step": 15134, "epoch": 360} {"train_loss": -5.30419921875, "global_step": 15135, "epoch": 360} {"train_loss": -5.242724895477295, "global_step": 15136, "epoch": 360} {"train_loss": -5.221924781799316, "global_step": 15137, "epoch": 360} {"train_loss": -5.268354892730713, "global_step": 15138, "epoch": 360} {"train_loss": -5.343090057373047, "global_step": 15139, "epoch": 360} {"train_loss": -5.291755199432373, "global_step": 15140, "epoch": 360} {"train_loss": -5.062519073486328, "global_step": 15141, "epoch": 360} {"train_loss": -5.279707908630371, "global_step": 15142, "epoch": 360} {"train_loss": -5.213202476501465, "global_step": 15143, "epoch": 360} {"train_loss": -5.143989562988281, "global_step": 15144, "epoch": 360} {"train_loss": -5.31652307510376, "global_step": 15145, "epoch": 360} {"train_loss": -5.344322204589844, "global_step": 15146, "epoch": 360} {"train_loss": -5.171913146972656, "global_step": 15147, "epoch": 360} {"train_loss": -5.176645755767822, "global_step": 15148, "epoch": 360} {"train_loss": -5.143467903137207, "global_step": 15149, "epoch": 360} {"train_loss": -5.2840657234191895, "global_step": 15150, "epoch": 360} {"train_loss": -5.059589385986328, "global_step": 15151, "epoch": 360} {"train_loss": -5.406524658203125, "global_step": 15152, "epoch": 360} {"train_loss": -5.031912803649902, "global_step": 15153, "epoch": 360} {"train_loss": -5.198980808258057, "global_step": 15154, "epoch": 360} {"train_loss": -5.235723495483398, "global_step": 15155, "epoch": 360} {"train_loss": -5.160740852355957, "global_step": 15156, "epoch": 360} {"train_loss": -5.140969276428223, "global_step": 15157, "epoch": 360} {"train_loss": -5.256309509277344, "global_step": 15158, "epoch": 360} {"train_loss": -5.17051362991333, "global_step": 15159, "epoch": 360} {"train_loss": -5.011309623718262, "global_step": 15160, "epoch": 360} {"train_loss": -5.216181493940807, "global_step": 15161, "epoch": 360, "val_loss": 71245.21875} {"train_loss": -5.149278163909912, "global_step": 15162, "epoch": 361} {"train_loss": -5.129278182983398, "global_step": 15163, "epoch": 361} {"train_loss": -5.155843734741211, "global_step": 15164, "epoch": 361} {"train_loss": -5.088491439819336, "global_step": 15165, "epoch": 361} {"train_loss": -5.253654479980469, "global_step": 15166, "epoch": 361} {"train_loss": -5.182459831237793, "global_step": 15167, "epoch": 361} {"train_loss": -5.352947235107422, "global_step": 15168, "epoch": 361} {"train_loss": -5.276955604553223, "global_step": 15169, "epoch": 361} {"train_loss": -5.128586769104004, "global_step": 15170, "epoch": 361} {"train_loss": -5.120383262634277, "global_step": 15171, "epoch": 361} {"train_loss": -5.191499710083008, "global_step": 15172, "epoch": 361} {"train_loss": -5.144804000854492, "global_step": 15173, "epoch": 361} {"train_loss": -5.219415187835693, "global_step": 15174, "epoch": 361} {"train_loss": -5.192802906036377, "global_step": 15175, "epoch": 361} {"train_loss": -5.270130634307861, "global_step": 15176, "epoch": 361} {"train_loss": -5.324728965759277, "global_step": 15177, "epoch": 361} {"train_loss": -5.232267379760742, "global_step": 15178, "epoch": 361} {"train_loss": -5.148382186889648, "global_step": 15179, "epoch": 361} {"train_loss": -5.226313591003418, "global_step": 15180, "epoch": 361} {"train_loss": -5.081510543823242, "global_step": 15181, "epoch": 361} {"train_loss": -5.184198379516602, "global_step": 15182, "epoch": 361} {"train_loss": -5.146941184997559, "global_step": 15183, "epoch": 361} {"train_loss": -5.140774726867676, "global_step": 15184, "epoch": 361} {"train_loss": -5.184697151184082, "global_step": 15185, "epoch": 361} {"train_loss": -5.258426189422607, "global_step": 15186, "epoch": 361} {"train_loss": -5.192198753356934, "global_step": 15187, "epoch": 361} {"train_loss": -5.257595062255859, "global_step": 15188, "epoch": 361} {"train_loss": -5.199456214904785, "global_step": 15189, "epoch": 361} {"train_loss": -5.2504167556762695, "global_step": 15190, "epoch": 361} {"train_loss": -5.198427200317383, "global_step": 15191, "epoch": 361} {"train_loss": -5.286759376525879, "global_step": 15192, "epoch": 361} {"train_loss": -5.116028785705566, "global_step": 15193, "epoch": 361} {"train_loss": -5.299291610717773, "global_step": 15194, "epoch": 361} {"train_loss": -5.049318313598633, "global_step": 15195, "epoch": 361} {"train_loss": -5.226524829864502, "global_step": 15196, "epoch": 361} {"train_loss": -5.059321880340576, "global_step": 15197, "epoch": 361} {"train_loss": -5.181525230407715, "global_step": 15198, "epoch": 361} {"train_loss": -5.163258075714111, "global_step": 15199, "epoch": 361} {"train_loss": -5.120038986206055, "global_step": 15200, "epoch": 361} {"train_loss": -5.0729804039001465, "global_step": 15201, "epoch": 361} {"train_loss": -5.1249871253967285, "global_step": 15202, "epoch": 361} {"train_loss": -5.178514151346116, "global_step": 15203, "epoch": 361, "val_loss": 71603.609375} {"train_loss": -4.9998884201049805, "global_step": 15204, "epoch": 362} {"train_loss": -4.981742858886719, "global_step": 15205, "epoch": 362} {"train_loss": -5.0743513107299805, "global_step": 15206, "epoch": 362} {"train_loss": -5.115176200866699, "global_step": 15207, "epoch": 362} {"train_loss": -5.204492568969727, "global_step": 15208, "epoch": 362} {"train_loss": -4.93784236907959, "global_step": 15209, "epoch": 362} {"train_loss": -5.0811686515808105, "global_step": 15210, "epoch": 362} {"train_loss": -5.134796142578125, "global_step": 15211, "epoch": 362} {"train_loss": -5.117910385131836, "global_step": 15212, "epoch": 362} {"train_loss": -5.055027961730957, "global_step": 15213, "epoch": 362} {"train_loss": -5.178441047668457, "global_step": 15214, "epoch": 362} {"train_loss": -4.9911370277404785, "global_step": 15215, "epoch": 362} {"train_loss": -5.186193943023682, "global_step": 15216, "epoch": 362} {"train_loss": -5.269631385803223, "global_step": 15217, "epoch": 362} {"train_loss": -5.166985988616943, "global_step": 15218, "epoch": 362} {"train_loss": -5.101914405822754, "global_step": 15219, "epoch": 362} {"train_loss": -5.166749477386475, "global_step": 15220, "epoch": 362} {"train_loss": -5.118654251098633, "global_step": 15221, "epoch": 362} {"train_loss": -5.210297584533691, "global_step": 15222, "epoch": 362} {"train_loss": -5.213118553161621, "global_step": 15223, "epoch": 362} {"train_loss": -5.269733905792236, "global_step": 15224, "epoch": 362} {"train_loss": -5.30393123626709, "global_step": 15225, "epoch": 362} {"train_loss": -5.2380218505859375, "global_step": 15226, "epoch": 362} {"train_loss": -5.1349968910217285, "global_step": 15227, "epoch": 362} {"train_loss": -5.29721736907959, "global_step": 15228, "epoch": 362} {"train_loss": -5.243947982788086, "global_step": 15229, "epoch": 362} {"train_loss": -5.352049827575684, "global_step": 15230, "epoch": 362} {"train_loss": -5.329716682434082, "global_step": 15231, "epoch": 362} {"train_loss": -5.134640693664551, "global_step": 15232, "epoch": 362} {"train_loss": -5.24919319152832, "global_step": 15233, "epoch": 362} {"train_loss": -5.2625627517700195, "global_step": 15234, "epoch": 362} {"train_loss": -5.287641525268555, "global_step": 15235, "epoch": 362} {"train_loss": -5.302156448364258, "global_step": 15236, "epoch": 362} {"train_loss": -5.244007110595703, "global_step": 15237, "epoch": 362} {"train_loss": -5.205485820770264, "global_step": 15238, "epoch": 362} {"train_loss": -5.291231155395508, "global_step": 15239, "epoch": 362} {"train_loss": -5.271343231201172, "global_step": 15240, "epoch": 362} {"train_loss": -5.131538391113281, "global_step": 15241, "epoch": 362} {"train_loss": -5.1961140632629395, "global_step": 15242, "epoch": 362} {"train_loss": -5.220283031463623, "global_step": 15243, "epoch": 362} {"train_loss": -5.044251441955566, "global_step": 15244, "epoch": 362} {"train_loss": -5.176196881702968, "global_step": 15245, "epoch": 362, "val_loss": 71667.9609375} {"train_loss": -5.24273681640625, "global_step": 15246, "epoch": 363} {"train_loss": -4.992339134216309, "global_step": 15247, "epoch": 363} {"train_loss": -5.155257225036621, "global_step": 15248, "epoch": 363} {"train_loss": -5.290204048156738, "global_step": 15249, "epoch": 363} {"train_loss": -4.952207565307617, "global_step": 15250, "epoch": 363} {"train_loss": -5.193434715270996, "global_step": 15251, "epoch": 363} {"train_loss": -5.1861891746521, "global_step": 15252, "epoch": 363} {"train_loss": -5.138228416442871, "global_step": 15253, "epoch": 363} {"train_loss": -5.313116073608398, "global_step": 15254, "epoch": 363} {"train_loss": -5.1413116455078125, "global_step": 15255, "epoch": 363} {"train_loss": -5.226710319519043, "global_step": 15256, "epoch": 363} {"train_loss": -5.201933860778809, "global_step": 15257, "epoch": 363} {"train_loss": -5.2572712898254395, "global_step": 15258, "epoch": 363} {"train_loss": -5.151644706726074, "global_step": 15259, "epoch": 363} {"train_loss": -5.188417434692383, "global_step": 15260, "epoch": 363} {"train_loss": -5.31392240524292, "global_step": 15261, "epoch": 363} {"train_loss": -5.260432243347168, "global_step": 15262, "epoch": 363} {"train_loss": -5.231997489929199, "global_step": 15263, "epoch": 363} {"train_loss": -5.021733283996582, "global_step": 15264, "epoch": 363} {"train_loss": -5.100381851196289, "global_step": 15265, "epoch": 363} {"train_loss": -5.350869655609131, "global_step": 15266, "epoch": 363} {"train_loss": -5.148388862609863, "global_step": 15267, "epoch": 363} {"train_loss": -5.195686340332031, "global_step": 15268, "epoch": 363} {"train_loss": -5.2361650466918945, "global_step": 15269, "epoch": 363} {"train_loss": -5.1906514167785645, "global_step": 15270, "epoch": 363} {"train_loss": -5.361207962036133, "global_step": 15271, "epoch": 363} {"train_loss": -5.35237979888916, "global_step": 15272, "epoch": 363} {"train_loss": -5.123157978057861, "global_step": 15273, "epoch": 363} {"train_loss": -5.316689491271973, "global_step": 15274, "epoch": 363} {"train_loss": -5.111730575561523, "global_step": 15275, "epoch": 363} {"train_loss": -5.23892068862915, "global_step": 15276, "epoch": 363} {"train_loss": -5.2448811531066895, "global_step": 15277, "epoch": 363} {"train_loss": -5.203500747680664, "global_step": 15278, "epoch": 363} {"train_loss": -5.1007561683654785, "global_step": 15279, "epoch": 363} {"train_loss": -5.169615745544434, "global_step": 15280, "epoch": 363} {"train_loss": -5.262129783630371, "global_step": 15281, "epoch": 363} {"train_loss": -5.239006996154785, "global_step": 15282, "epoch": 363} {"train_loss": -5.198640823364258, "global_step": 15283, "epoch": 363} {"train_loss": -5.133742332458496, "global_step": 15284, "epoch": 363} {"train_loss": -5.130154609680176, "global_step": 15285, "epoch": 363} {"train_loss": -5.178056716918945, "global_step": 15286, "epoch": 363} {"train_loss": -5.196151415506999, "global_step": 15287, "epoch": 363, "val_loss": 70699.5390625} {"train_loss": -5.301065444946289, "global_step": 15288, "epoch": 364} {"train_loss": -5.255138874053955, "global_step": 15289, "epoch": 364} {"train_loss": -5.274042129516602, "global_step": 15290, "epoch": 364} {"train_loss": -5.168235778808594, "global_step": 15291, "epoch": 364} {"train_loss": -5.226995468139648, "global_step": 15292, "epoch": 364} {"train_loss": -5.13168478012085, "global_step": 15293, "epoch": 364} {"train_loss": -5.2389912605285645, "global_step": 15294, "epoch": 364} {"train_loss": -5.254025459289551, "global_step": 15295, "epoch": 364} {"train_loss": -5.266180038452148, "global_step": 15296, "epoch": 364} {"train_loss": -5.322568893432617, "global_step": 15297, "epoch": 364} {"train_loss": -5.185583591461182, "global_step": 15298, "epoch": 364} {"train_loss": -5.2563323974609375, "global_step": 15299, "epoch": 364} {"train_loss": -5.36128568649292, "global_step": 15300, "epoch": 364} {"train_loss": -5.189550876617432, "global_step": 15301, "epoch": 364} {"train_loss": -5.205086708068848, "global_step": 15302, "epoch": 364} {"train_loss": -5.354775428771973, "global_step": 15303, "epoch": 364} {"train_loss": -5.338289260864258, "global_step": 15304, "epoch": 364} {"train_loss": -5.326988697052002, "global_step": 15305, "epoch": 364} {"train_loss": -5.214487075805664, "global_step": 15306, "epoch": 364} {"train_loss": -5.192023754119873, "global_step": 15307, "epoch": 364} {"train_loss": -5.124660491943359, "global_step": 15308, "epoch": 364} {"train_loss": -5.286336421966553, "global_step": 15309, "epoch": 364} {"train_loss": -5.260247707366943, "global_step": 15310, "epoch": 364} {"train_loss": -5.362271785736084, "global_step": 15311, "epoch": 364} {"train_loss": -5.075665473937988, "global_step": 15312, "epoch": 364} {"train_loss": -5.249862194061279, "global_step": 15313, "epoch": 364} {"train_loss": -5.276098251342773, "global_step": 15314, "epoch": 364} {"train_loss": -5.210605621337891, "global_step": 15315, "epoch": 364} {"train_loss": -5.115471839904785, "global_step": 15316, "epoch": 364} {"train_loss": -5.159560680389404, "global_step": 15317, "epoch": 364} {"train_loss": -5.112200736999512, "global_step": 15318, "epoch": 364} {"train_loss": -5.188969135284424, "global_step": 15319, "epoch": 364} {"train_loss": -5.196047306060791, "global_step": 15320, "epoch": 364} {"train_loss": -5.203561782836914, "global_step": 15321, "epoch": 364} {"train_loss": -5.367112636566162, "global_step": 15322, "epoch": 364} {"train_loss": -5.224026203155518, "global_step": 15323, "epoch": 364} {"train_loss": -5.142976760864258, "global_step": 15324, "epoch": 364} {"train_loss": -5.274629592895508, "global_step": 15325, "epoch": 364} {"train_loss": -5.0815229415893555, "global_step": 15326, "epoch": 364} {"train_loss": -5.226614952087402, "global_step": 15327, "epoch": 364} {"train_loss": -5.187056541442871, "global_step": 15328, "epoch": 364} {"train_loss": -5.229535012018113, "global_step": 15329, "epoch": 364, "val_loss": 70923.859375} {"train_loss": -5.221342086791992, "global_step": 15330, "epoch": 365} {"train_loss": -5.206051826477051, "global_step": 15331, "epoch": 365} {"train_loss": -5.187490940093994, "global_step": 15332, "epoch": 365} {"train_loss": -5.195743560791016, "global_step": 15333, "epoch": 365} {"train_loss": -5.2963104248046875, "global_step": 15334, "epoch": 365} {"train_loss": -5.195679187774658, "global_step": 15335, "epoch": 365} {"train_loss": -5.299633026123047, "global_step": 15336, "epoch": 365} {"train_loss": -5.081060409545898, "global_step": 15337, "epoch": 365} {"train_loss": -5.165326118469238, "global_step": 15338, "epoch": 365} {"train_loss": -5.283472061157227, "global_step": 15339, "epoch": 365} {"train_loss": -5.20927619934082, "global_step": 15340, "epoch": 365} {"train_loss": -5.086981773376465, "global_step": 15341, "epoch": 365} {"train_loss": -5.346066951751709, "global_step": 15342, "epoch": 365} {"train_loss": -5.251635551452637, "global_step": 15343, "epoch": 365} {"train_loss": -5.095174789428711, "global_step": 15344, "epoch": 365} {"train_loss": -5.251072883605957, "global_step": 15345, "epoch": 365} {"train_loss": -5.208355903625488, "global_step": 15346, "epoch": 365} {"train_loss": -5.283977508544922, "global_step": 15347, "epoch": 365} {"train_loss": -5.237887382507324, "global_step": 15348, "epoch": 365} {"train_loss": -5.289297103881836, "global_step": 15349, "epoch": 365} {"train_loss": -5.238440036773682, "global_step": 15350, "epoch": 365} {"train_loss": -5.342984199523926, "global_step": 15351, "epoch": 365} {"train_loss": -5.176366329193115, "global_step": 15352, "epoch": 365} {"train_loss": -5.276170253753662, "global_step": 15353, "epoch": 365} {"train_loss": -5.2522077560424805, "global_step": 15354, "epoch": 365} {"train_loss": -5.280224800109863, "global_step": 15355, "epoch": 365} {"train_loss": -5.257717132568359, "global_step": 15356, "epoch": 365} {"train_loss": -5.224593162536621, "global_step": 15357, "epoch": 365} {"train_loss": -5.231765270233154, "global_step": 15358, "epoch": 365} {"train_loss": -5.318978309631348, "global_step": 15359, "epoch": 365} {"train_loss": -5.2018723487854, "global_step": 15360, "epoch": 365} {"train_loss": -5.319777488708496, "global_step": 15361, "epoch": 365} {"train_loss": -5.257582664489746, "global_step": 15362, "epoch": 365} {"train_loss": -5.230322360992432, "global_step": 15363, "epoch": 365} {"train_loss": -5.18803071975708, "global_step": 15364, "epoch": 365} {"train_loss": -5.282200336456299, "global_step": 15365, "epoch": 365} {"train_loss": -5.261484146118164, "global_step": 15366, "epoch": 365} {"train_loss": -5.2342987060546875, "global_step": 15367, "epoch": 365} {"train_loss": -5.222808837890625, "global_step": 15368, "epoch": 365} {"train_loss": -5.296938896179199, "global_step": 15369, "epoch": 365} {"train_loss": -5.285329818725586, "global_step": 15370, "epoch": 365} {"train_loss": -5.235828569957188, "global_step": 15371, "epoch": 365, "val_loss": 70784.4140625} {"train_loss": -5.177574157714844, "global_step": 15372, "epoch": 366} {"train_loss": -5.137820243835449, "global_step": 15373, "epoch": 366} {"train_loss": -5.357143402099609, "global_step": 15374, "epoch": 366} {"train_loss": -5.159479141235352, "global_step": 15375, "epoch": 366} {"train_loss": -5.360518455505371, "global_step": 15376, "epoch": 366} {"train_loss": -5.229940414428711, "global_step": 15377, "epoch": 366} {"train_loss": -5.228421211242676, "global_step": 15378, "epoch": 366} {"train_loss": -5.302699089050293, "global_step": 15379, "epoch": 366} {"train_loss": -5.343160629272461, "global_step": 15380, "epoch": 366} {"train_loss": -5.242487907409668, "global_step": 15381, "epoch": 366} {"train_loss": -5.29808235168457, "global_step": 15382, "epoch": 366} {"train_loss": -5.292987823486328, "global_step": 15383, "epoch": 366} {"train_loss": -5.196998119354248, "global_step": 15384, "epoch": 366} {"train_loss": -5.260830402374268, "global_step": 15385, "epoch": 366} {"train_loss": -5.256929397583008, "global_step": 15386, "epoch": 366} {"train_loss": -5.22159481048584, "global_step": 15387, "epoch": 366} {"train_loss": -5.046605110168457, "global_step": 15388, "epoch": 366} {"train_loss": -5.322335243225098, "global_step": 15389, "epoch": 366} {"train_loss": -5.0972089767456055, "global_step": 15390, "epoch": 366} {"train_loss": -5.220552444458008, "global_step": 15391, "epoch": 366} {"train_loss": -5.261221885681152, "global_step": 15392, "epoch": 366} {"train_loss": -5.113076686859131, "global_step": 15393, "epoch": 366} {"train_loss": -5.232198715209961, "global_step": 15394, "epoch": 366} {"train_loss": -5.217703819274902, "global_step": 15395, "epoch": 366} {"train_loss": -5.167315483093262, "global_step": 15396, "epoch": 366} {"train_loss": -5.28084659576416, "global_step": 15397, "epoch": 366} {"train_loss": -5.129196643829346, "global_step": 15398, "epoch": 366} {"train_loss": -5.296407699584961, "global_step": 15399, "epoch": 366} {"train_loss": -5.265039443969727, "global_step": 15400, "epoch": 366} {"train_loss": -5.164850234985352, "global_step": 15401, "epoch": 366} {"train_loss": -5.314657211303711, "global_step": 15402, "epoch": 366} {"train_loss": -5.266921520233154, "global_step": 15403, "epoch": 366} {"train_loss": -5.198550224304199, "global_step": 15404, "epoch": 366} {"train_loss": -5.234548568725586, "global_step": 15405, "epoch": 366} {"train_loss": -5.210211753845215, "global_step": 15406, "epoch": 366} {"train_loss": -5.211770534515381, "global_step": 15407, "epoch": 366} {"train_loss": -5.1785359382629395, "global_step": 15408, "epoch": 366} {"train_loss": -5.279163360595703, "global_step": 15409, "epoch": 366} {"train_loss": -5.15756368637085, "global_step": 15410, "epoch": 366} {"train_loss": -5.24742317199707, "global_step": 15411, "epoch": 366} {"train_loss": -5.194246292114258, "global_step": 15412, "epoch": 366} {"train_loss": -5.229453518277123, "global_step": 15413, "epoch": 366, "val_loss": 71408.78125} {"train_loss": -5.304622173309326, "global_step": 15414, "epoch": 367} {"train_loss": -5.323232650756836, "global_step": 15415, "epoch": 367} {"train_loss": -5.366682052612305, "global_step": 15416, "epoch": 367} {"train_loss": -5.148223400115967, "global_step": 15417, "epoch": 367} {"train_loss": -5.176534652709961, "global_step": 15418, "epoch": 367} {"train_loss": -5.242986679077148, "global_step": 15419, "epoch": 367} {"train_loss": -5.150839328765869, "global_step": 15420, "epoch": 367} {"train_loss": -5.283369064331055, "global_step": 15421, "epoch": 367} {"train_loss": -5.166242599487305, "global_step": 15422, "epoch": 367} {"train_loss": -5.140186786651611, "global_step": 15423, "epoch": 367} {"train_loss": -5.300937652587891, "global_step": 15424, "epoch": 367} {"train_loss": -5.14912223815918, "global_step": 15425, "epoch": 367} {"train_loss": -5.338454246520996, "global_step": 15426, "epoch": 367} {"train_loss": -5.329986095428467, "global_step": 15427, "epoch": 367} {"train_loss": -5.212780952453613, "global_step": 15428, "epoch": 367} {"train_loss": -5.2158002853393555, "global_step": 15429, "epoch": 367} {"train_loss": -5.213746547698975, "global_step": 15430, "epoch": 367} {"train_loss": -5.391737937927246, "global_step": 15431, "epoch": 367} {"train_loss": -5.254044055938721, "global_step": 15432, "epoch": 367} {"train_loss": -5.15432596206665, "global_step": 15433, "epoch": 367} {"train_loss": -5.250256538391113, "global_step": 15434, "epoch": 367} {"train_loss": -5.117300033569336, "global_step": 15435, "epoch": 367} {"train_loss": -5.190305233001709, "global_step": 15436, "epoch": 367} {"train_loss": -5.244653701782227, "global_step": 15437, "epoch": 367} {"train_loss": -5.249032020568848, "global_step": 15438, "epoch": 367} {"train_loss": -5.230059623718262, "global_step": 15439, "epoch": 367} {"train_loss": -5.016283988952637, "global_step": 15440, "epoch": 367} {"train_loss": -5.357393264770508, "global_step": 15441, "epoch": 367} {"train_loss": -5.3274407386779785, "global_step": 15442, "epoch": 367} {"train_loss": -5.242457389831543, "global_step": 15443, "epoch": 367} {"train_loss": -5.209628105163574, "global_step": 15444, "epoch": 367} {"train_loss": -5.231149196624756, "global_step": 15445, "epoch": 367} {"train_loss": -5.199695587158203, "global_step": 15446, "epoch": 367} {"train_loss": -5.168905258178711, "global_step": 15447, "epoch": 367} {"train_loss": -5.098119258880615, "global_step": 15448, "epoch": 367} {"train_loss": -5.155922889709473, "global_step": 15449, "epoch": 367} {"train_loss": -5.091146469116211, "global_step": 15450, "epoch": 367} {"train_loss": -5.100951194763184, "global_step": 15451, "epoch": 367} {"train_loss": -4.991031646728516, "global_step": 15452, "epoch": 367} {"train_loss": -5.296700954437256, "global_step": 15453, "epoch": 367} {"train_loss": -5.153536796569824, "global_step": 15454, "epoch": 367} {"train_loss": -5.210174447014218, "global_step": 15455, "epoch": 367, "val_loss": 70866.2734375} {"train_loss": -5.331779479980469, "global_step": 15456, "epoch": 368} {"train_loss": -5.135371208190918, "global_step": 15457, "epoch": 368} {"train_loss": -5.08142614364624, "global_step": 15458, "epoch": 368} {"train_loss": -5.108941078186035, "global_step": 15459, "epoch": 368} {"train_loss": -5.078146457672119, "global_step": 15460, "epoch": 368} {"train_loss": -5.293859481811523, "global_step": 15461, "epoch": 368} {"train_loss": -5.278800964355469, "global_step": 15462, "epoch": 368} {"train_loss": -5.137557029724121, "global_step": 15463, "epoch": 368} {"train_loss": -5.266841411590576, "global_step": 15464, "epoch": 368} {"train_loss": -5.079843521118164, "global_step": 15465, "epoch": 368} {"train_loss": -4.979766845703125, "global_step": 15466, "epoch": 368} {"train_loss": -5.234158515930176, "global_step": 15467, "epoch": 368} {"train_loss": -5.1168718338012695, "global_step": 15468, "epoch": 368} {"train_loss": -5.1034016609191895, "global_step": 15469, "epoch": 368} {"train_loss": -5.216782093048096, "global_step": 15470, "epoch": 368} {"train_loss": -4.991338729858398, "global_step": 15471, "epoch": 368} {"train_loss": -5.253820419311523, "global_step": 15472, "epoch": 368} {"train_loss": -5.1401166915893555, "global_step": 15473, "epoch": 368} {"train_loss": -5.154473304748535, "global_step": 15474, "epoch": 368} {"train_loss": -5.224574089050293, "global_step": 15475, "epoch": 368} {"train_loss": -5.281047344207764, "global_step": 15476, "epoch": 368} {"train_loss": -5.284626007080078, "global_step": 15477, "epoch": 368} {"train_loss": -5.347869396209717, "global_step": 15478, "epoch": 368} {"train_loss": -5.21247673034668, "global_step": 15479, "epoch": 368} {"train_loss": -5.287717342376709, "global_step": 15480, "epoch": 368} {"train_loss": -5.389297962188721, "global_step": 15481, "epoch": 368} {"train_loss": -5.054266929626465, "global_step": 15482, "epoch": 368} {"train_loss": -5.146738529205322, "global_step": 15483, "epoch": 368} {"train_loss": -5.303046226501465, "global_step": 15484, "epoch": 368} {"train_loss": -5.085972785949707, "global_step": 15485, "epoch": 368} {"train_loss": -5.199067115783691, "global_step": 15486, "epoch": 368} {"train_loss": -5.177079200744629, "global_step": 15487, "epoch": 368} {"train_loss": -5.207560062408447, "global_step": 15488, "epoch": 368} {"train_loss": -5.249727249145508, "global_step": 15489, "epoch": 368} {"train_loss": -5.253514289855957, "global_step": 15490, "epoch": 368} {"train_loss": -5.223076820373535, "global_step": 15491, "epoch": 368} {"train_loss": -5.307149410247803, "global_step": 15492, "epoch": 368} {"train_loss": -5.256475448608398, "global_step": 15493, "epoch": 368} {"train_loss": -5.394906044006348, "global_step": 15494, "epoch": 368} {"train_loss": -5.353288650512695, "global_step": 15495, "epoch": 368} {"train_loss": -5.375493049621582, "global_step": 15496, "epoch": 368} {"train_loss": -5.210263479323614, "global_step": 15497, "epoch": 368, "val_loss": 71166.5625} {"train_loss": -5.305169105529785, "global_step": 15498, "epoch": 369} {"train_loss": -5.393765926361084, "global_step": 15499, "epoch": 369} {"train_loss": -5.167900562286377, "global_step": 15500, "epoch": 369} {"train_loss": -5.120029926300049, "global_step": 15501, "epoch": 369} {"train_loss": -5.3308515548706055, "global_step": 15502, "epoch": 369} {"train_loss": -5.217251777648926, "global_step": 15503, "epoch": 369} {"train_loss": -5.267332077026367, "global_step": 15504, "epoch": 369} {"train_loss": -5.370996475219727, "global_step": 15505, "epoch": 369} {"train_loss": -5.189101219177246, "global_step": 15506, "epoch": 369} {"train_loss": -5.207520484924316, "global_step": 15507, "epoch": 369} {"train_loss": -5.157488822937012, "global_step": 15508, "epoch": 369} {"train_loss": -5.2781572341918945, "global_step": 15509, "epoch": 369} {"train_loss": -5.336960315704346, "global_step": 15510, "epoch": 369} {"train_loss": -5.238541603088379, "global_step": 15511, "epoch": 369} {"train_loss": -5.159089088439941, "global_step": 15512, "epoch": 369} {"train_loss": -5.285155296325684, "global_step": 15513, "epoch": 369} {"train_loss": -5.105152130126953, "global_step": 15514, "epoch": 369} {"train_loss": -5.221551895141602, "global_step": 15515, "epoch": 369} {"train_loss": -5.1800994873046875, "global_step": 15516, "epoch": 369} {"train_loss": -5.148352146148682, "global_step": 15517, "epoch": 369} {"train_loss": -5.270553112030029, "global_step": 15518, "epoch": 369} {"train_loss": -5.227603912353516, "global_step": 15519, "epoch": 369} {"train_loss": -5.223298072814941, "global_step": 15520, "epoch": 369} {"train_loss": -5.225064277648926, "global_step": 15521, "epoch": 369} {"train_loss": -5.284162998199463, "global_step": 15522, "epoch": 369} {"train_loss": -5.214930534362793, "global_step": 15523, "epoch": 369} {"train_loss": -5.199861526489258, "global_step": 15524, "epoch": 369} {"train_loss": -5.2206130027771, "global_step": 15525, "epoch": 369} {"train_loss": -5.323393821716309, "global_step": 15526, "epoch": 369} {"train_loss": -5.200231552124023, "global_step": 15527, "epoch": 369} {"train_loss": -5.30161190032959, "global_step": 15528, "epoch": 369} {"train_loss": -5.173616886138916, "global_step": 15529, "epoch": 369} {"train_loss": -5.094643592834473, "global_step": 15530, "epoch": 369} {"train_loss": -5.200364112854004, "global_step": 15531, "epoch": 369} {"train_loss": -5.131470680236816, "global_step": 15532, "epoch": 369} {"train_loss": -5.264064788818359, "global_step": 15533, "epoch": 369} {"train_loss": -5.293437480926514, "global_step": 15534, "epoch": 369} {"train_loss": -5.128963470458984, "global_step": 15535, "epoch": 369} {"train_loss": -5.317946910858154, "global_step": 15536, "epoch": 369} {"train_loss": -5.186920642852783, "global_step": 15537, "epoch": 369} {"train_loss": -5.274306297302246, "global_step": 15538, "epoch": 369} {"train_loss": -5.229822760536557, "global_step": 15539, "epoch": 369, "val_loss": 70858.640625} {"train_loss": -5.194666862487793, "global_step": 15540, "epoch": 370} {"train_loss": -5.142683982849121, "global_step": 15541, "epoch": 370} {"train_loss": -5.271769046783447, "global_step": 15542, "epoch": 370} {"train_loss": -5.2621002197265625, "global_step": 15543, "epoch": 370} {"train_loss": -5.2606425285339355, "global_step": 15544, "epoch": 370} {"train_loss": -5.294027328491211, "global_step": 15545, "epoch": 370} {"train_loss": -5.253270149230957, "global_step": 15546, "epoch": 370} {"train_loss": -5.365828990936279, "global_step": 15547, "epoch": 370} {"train_loss": -5.153652191162109, "global_step": 15548, "epoch": 370} {"train_loss": -5.2401251792907715, "global_step": 15549, "epoch": 370} {"train_loss": -5.189620494842529, "global_step": 15550, "epoch": 370} {"train_loss": -5.282943248748779, "global_step": 15551, "epoch": 370} {"train_loss": -5.363679885864258, "global_step": 15552, "epoch": 370} {"train_loss": -5.353198051452637, "global_step": 15553, "epoch": 370} {"train_loss": -5.39219856262207, "global_step": 15554, "epoch": 370} {"train_loss": -5.281036376953125, "global_step": 15555, "epoch": 370} {"train_loss": -5.245626926422119, "global_step": 15556, "epoch": 370} {"train_loss": -5.413923263549805, "global_step": 15557, "epoch": 370} {"train_loss": -5.174620628356934, "global_step": 15558, "epoch": 370} {"train_loss": -5.257696151733398, "global_step": 15559, "epoch": 370} {"train_loss": -5.199246406555176, "global_step": 15560, "epoch": 370} {"train_loss": -5.250187873840332, "global_step": 15561, "epoch": 370} {"train_loss": -5.138744354248047, "global_step": 15562, "epoch": 370} {"train_loss": -5.1984148025512695, "global_step": 15563, "epoch": 370} {"train_loss": -5.308204650878906, "global_step": 15564, "epoch": 370} {"train_loss": -5.062851905822754, "global_step": 15565, "epoch": 370} {"train_loss": -5.018750190734863, "global_step": 15566, "epoch": 370} {"train_loss": -5.004469871520996, "global_step": 15567, "epoch": 370} {"train_loss": -5.099031448364258, "global_step": 15568, "epoch": 370} {"train_loss": -4.7985124588012695, "global_step": 15569, "epoch": 370} {"train_loss": -4.772348880767822, "global_step": 15570, "epoch": 370} {"train_loss": -5.173280715942383, "global_step": 15571, "epoch": 370} {"train_loss": -5.301363945007324, "global_step": 15572, "epoch": 370} {"train_loss": -4.938629150390625, "global_step": 15573, "epoch": 370} {"train_loss": -5.011323928833008, "global_step": 15574, "epoch": 370} {"train_loss": -5.0977091789245605, "global_step": 15575, "epoch": 370} {"train_loss": -5.236713886260986, "global_step": 15576, "epoch": 370} {"train_loss": -4.960278511047363, "global_step": 15577, "epoch": 370} {"train_loss": -5.028785228729248, "global_step": 15578, "epoch": 370} {"train_loss": -5.1454010009765625, "global_step": 15579, "epoch": 370} {"train_loss": -5.008683204650879, "global_step": 15580, "epoch": 370} {"train_loss": -5.1744419279552645, "global_step": 15581, "epoch": 370, "val_loss": 70744.84375} {"train_loss": -5.203956604003906, "global_step": 15582, "epoch": 371} {"train_loss": -5.214488506317139, "global_step": 15583, "epoch": 371} {"train_loss": -5.087192058563232, "global_step": 15584, "epoch": 371} {"train_loss": -5.157615661621094, "global_step": 15585, "epoch": 371} {"train_loss": -5.228487491607666, "global_step": 15586, "epoch": 371} {"train_loss": -5.094546318054199, "global_step": 15587, "epoch": 371} {"train_loss": -5.221203804016113, "global_step": 15588, "epoch": 371} {"train_loss": -5.287104606628418, "global_step": 15589, "epoch": 371} {"train_loss": -5.10469913482666, "global_step": 15590, "epoch": 371} {"train_loss": -5.153324604034424, "global_step": 15591, "epoch": 371} {"train_loss": -5.186357021331787, "global_step": 15592, "epoch": 371} {"train_loss": -5.4028730392456055, "global_step": 15593, "epoch": 371} {"train_loss": -5.055243492126465, "global_step": 15594, "epoch": 371} {"train_loss": -5.207143783569336, "global_step": 15595, "epoch": 371} {"train_loss": -5.1690192222595215, "global_step": 15596, "epoch": 371} {"train_loss": -5.084264755249023, "global_step": 15597, "epoch": 371} {"train_loss": -5.212765693664551, "global_step": 15598, "epoch": 371} {"train_loss": -5.1316237449646, "global_step": 15599, "epoch": 371} {"train_loss": -5.304267406463623, "global_step": 15600, "epoch": 371} {"train_loss": -5.161359786987305, "global_step": 15601, "epoch": 371} {"train_loss": -5.246216773986816, "global_step": 15602, "epoch": 371} {"train_loss": -5.254331588745117, "global_step": 15603, "epoch": 371} {"train_loss": -5.218120574951172, "global_step": 15604, "epoch": 371} {"train_loss": -5.236508846282959, "global_step": 15605, "epoch": 371} {"train_loss": -5.347378253936768, "global_step": 15606, "epoch": 371} {"train_loss": -5.254177570343018, "global_step": 15607, "epoch": 371} {"train_loss": -5.102177619934082, "global_step": 15608, "epoch": 371} {"train_loss": -5.177652359008789, "global_step": 15609, "epoch": 371} {"train_loss": -5.192419052124023, "global_step": 15610, "epoch": 371} {"train_loss": -5.287442684173584, "global_step": 15611, "epoch": 371} {"train_loss": -5.239165306091309, "global_step": 15612, "epoch": 371} {"train_loss": -5.289896488189697, "global_step": 15613, "epoch": 371} {"train_loss": -5.1836395263671875, "global_step": 15614, "epoch": 371} {"train_loss": -5.254393100738525, "global_step": 15615, "epoch": 371} {"train_loss": -5.307485103607178, "global_step": 15616, "epoch": 371} {"train_loss": -5.309585094451904, "global_step": 15617, "epoch": 371} {"train_loss": -5.088164329528809, "global_step": 15618, "epoch": 371} {"train_loss": -5.343446254730225, "global_step": 15619, "epoch": 371} {"train_loss": -5.093805313110352, "global_step": 15620, "epoch": 371} {"train_loss": -5.007472991943359, "global_step": 15621, "epoch": 371} {"train_loss": -5.252067565917969, "global_step": 15622, "epoch": 371} {"train_loss": -5.203374249594552, "global_step": 15623, "epoch": 371, "val_loss": 72205.65625} {"train_loss": -5.08842658996582, "global_step": 15624, "epoch": 372} {"train_loss": -5.097281455993652, "global_step": 15625, "epoch": 372} {"train_loss": -5.059722423553467, "global_step": 15626, "epoch": 372} {"train_loss": -5.0743889808654785, "global_step": 15627, "epoch": 372} {"train_loss": -5.157753944396973, "global_step": 15628, "epoch": 372} {"train_loss": -5.013580799102783, "global_step": 15629, "epoch": 372} {"train_loss": -5.0790605545043945, "global_step": 15630, "epoch": 372} {"train_loss": -4.839024543762207, "global_step": 15631, "epoch": 372} {"train_loss": -5.099524021148682, "global_step": 15632, "epoch": 372} {"train_loss": -5.026556968688965, "global_step": 15633, "epoch": 372} {"train_loss": -4.9187822341918945, "global_step": 15634, "epoch": 372} {"train_loss": -5.170351982116699, "global_step": 15635, "epoch": 372} {"train_loss": -5.023348808288574, "global_step": 15636, "epoch": 372} {"train_loss": -5.096808433532715, "global_step": 15637, "epoch": 372} {"train_loss": -4.852998733520508, "global_step": 15638, "epoch": 372} {"train_loss": -5.136836528778076, "global_step": 15639, "epoch": 372} {"train_loss": -5.095583438873291, "global_step": 15640, "epoch": 372} {"train_loss": -5.0482072830200195, "global_step": 15641, "epoch": 372} {"train_loss": -5.1496500968933105, "global_step": 15642, "epoch": 372} {"train_loss": -5.146685600280762, "global_step": 15643, "epoch": 372} {"train_loss": -5.18858528137207, "global_step": 15644, "epoch": 372} {"train_loss": -5.255043983459473, "global_step": 15645, "epoch": 372} {"train_loss": -5.126794815063477, "global_step": 15646, "epoch": 372} {"train_loss": -5.148725509643555, "global_step": 15647, "epoch": 372} {"train_loss": -5.140501499176025, "global_step": 15648, "epoch": 372} {"train_loss": -5.250566005706787, "global_step": 15649, "epoch": 372} {"train_loss": -5.229156970977783, "global_step": 15650, "epoch": 372} {"train_loss": -5.210043907165527, "global_step": 15651, "epoch": 372} {"train_loss": -5.222998142242432, "global_step": 15652, "epoch": 372} {"train_loss": -5.14564847946167, "global_step": 15653, "epoch": 372} {"train_loss": -5.330986976623535, "global_step": 15654, "epoch": 372} {"train_loss": -5.168241500854492, "global_step": 15655, "epoch": 372} {"train_loss": -5.223531723022461, "global_step": 15656, "epoch": 372} {"train_loss": -5.250052452087402, "global_step": 15657, "epoch": 372} {"train_loss": -5.144237518310547, "global_step": 15658, "epoch": 372} {"train_loss": -5.210536956787109, "global_step": 15659, "epoch": 372} {"train_loss": -5.255338191986084, "global_step": 15660, "epoch": 372} {"train_loss": -5.254689693450928, "global_step": 15661, "epoch": 372} {"train_loss": -5.263402938842773, "global_step": 15662, "epoch": 372} {"train_loss": -5.240921974182129, "global_step": 15663, "epoch": 372} {"train_loss": -5.218542098999023, "global_step": 15664, "epoch": 372} {"train_loss": -5.140127057120914, "global_step": 15665, "epoch": 372, "val_loss": 70583.2734375} {"train_loss": -5.247745513916016, "global_step": 15666, "epoch": 373} {"train_loss": -5.151512145996094, "global_step": 15667, "epoch": 373} {"train_loss": -5.200967311859131, "global_step": 15668, "epoch": 373} {"train_loss": -5.240418434143066, "global_step": 15669, "epoch": 373} {"train_loss": -5.1359357833862305, "global_step": 15670, "epoch": 373} {"train_loss": -5.122077941894531, "global_step": 15671, "epoch": 373} {"train_loss": -5.312797546386719, "global_step": 15672, "epoch": 373} {"train_loss": -5.208375453948975, "global_step": 15673, "epoch": 373} {"train_loss": -5.304264545440674, "global_step": 15674, "epoch": 373} {"train_loss": -5.314151763916016, "global_step": 15675, "epoch": 373} {"train_loss": -5.200255870819092, "global_step": 15676, "epoch": 373} {"train_loss": -5.270090103149414, "global_step": 15677, "epoch": 373} {"train_loss": -5.173235893249512, "global_step": 15678, "epoch": 373} {"train_loss": -5.327101707458496, "global_step": 15679, "epoch": 373} {"train_loss": -5.335289001464844, "global_step": 15680, "epoch": 373} {"train_loss": -5.092350482940674, "global_step": 15681, "epoch": 373} {"train_loss": -5.312723159790039, "global_step": 15682, "epoch": 373} {"train_loss": -5.189335823059082, "global_step": 15683, "epoch": 373} {"train_loss": -5.312480449676514, "global_step": 15684, "epoch": 373} {"train_loss": -5.119859218597412, "global_step": 15685, "epoch": 373} {"train_loss": -5.241098403930664, "global_step": 15686, "epoch": 373} {"train_loss": -5.249422550201416, "global_step": 15687, "epoch": 373} {"train_loss": -5.197218418121338, "global_step": 15688, "epoch": 373} {"train_loss": -5.26322603225708, "global_step": 15689, "epoch": 373} {"train_loss": -5.3121137619018555, "global_step": 15690, "epoch": 373} {"train_loss": -5.260943412780762, "global_step": 15691, "epoch": 373} {"train_loss": -5.283712387084961, "global_step": 15692, "epoch": 373} {"train_loss": -5.282662391662598, "global_step": 15693, "epoch": 373} {"train_loss": -5.110746383666992, "global_step": 15694, "epoch": 373} {"train_loss": -5.29042387008667, "global_step": 15695, "epoch": 373} {"train_loss": -5.2861247062683105, "global_step": 15696, "epoch": 373} {"train_loss": -5.261765480041504, "global_step": 15697, "epoch": 373} {"train_loss": -5.176445007324219, "global_step": 15698, "epoch": 373} {"train_loss": -5.294010162353516, "global_step": 15699, "epoch": 373} {"train_loss": -5.221404075622559, "global_step": 15700, "epoch": 373} {"train_loss": -5.3784637451171875, "global_step": 15701, "epoch": 373} {"train_loss": -5.25299072265625, "global_step": 15702, "epoch": 373} {"train_loss": -5.210626602172852, "global_step": 15703, "epoch": 373} {"train_loss": -5.24554443359375, "global_step": 15704, "epoch": 373} {"train_loss": -5.22231912612915, "global_step": 15705, "epoch": 373} {"train_loss": -5.217702865600586, "global_step": 15706, "epoch": 373} {"train_loss": -5.238433111281622, "global_step": 15707, "epoch": 373, "val_loss": 70651.5234375} {"train_loss": -5.3619489669799805, "global_step": 15708, "epoch": 374} {"train_loss": -5.267852306365967, "global_step": 15709, "epoch": 374} {"train_loss": -5.203466415405273, "global_step": 15710, "epoch": 374} {"train_loss": -5.145439147949219, "global_step": 15711, "epoch": 374} {"train_loss": -5.146047115325928, "global_step": 15712, "epoch": 374} {"train_loss": -5.20190954208374, "global_step": 15713, "epoch": 374} {"train_loss": -5.22829008102417, "global_step": 15714, "epoch": 374} {"train_loss": -5.101109981536865, "global_step": 15715, "epoch": 374} {"train_loss": -5.2148027420043945, "global_step": 15716, "epoch": 374} {"train_loss": -4.939619064331055, "global_step": 15717, "epoch": 374} {"train_loss": -4.997798919677734, "global_step": 15718, "epoch": 374} {"train_loss": -5.2605133056640625, "global_step": 15719, "epoch": 374} {"train_loss": -4.711753845214844, "global_step": 15720, "epoch": 374} {"train_loss": -5.15579080581665, "global_step": 15721, "epoch": 374} {"train_loss": -5.303781509399414, "global_step": 15722, "epoch": 374} {"train_loss": -5.0290422439575195, "global_step": 15723, "epoch": 374} {"train_loss": -5.018581390380859, "global_step": 15724, "epoch": 374} {"train_loss": -5.073387145996094, "global_step": 15725, "epoch": 374} {"train_loss": -5.114095687866211, "global_step": 15726, "epoch": 374} {"train_loss": -5.013140678405762, "global_step": 15727, "epoch": 374} {"train_loss": -5.294645309448242, "global_step": 15728, "epoch": 374} {"train_loss": -5.086629867553711, "global_step": 15729, "epoch": 374} {"train_loss": -5.025772571563721, "global_step": 15730, "epoch": 374} {"train_loss": -5.157684326171875, "global_step": 15731, "epoch": 374} {"train_loss": -5.309500694274902, "global_step": 15732, "epoch": 374} {"train_loss": -5.165951728820801, "global_step": 15733, "epoch": 374} {"train_loss": -5.131493091583252, "global_step": 15734, "epoch": 374} {"train_loss": -5.045374870300293, "global_step": 15735, "epoch": 374} {"train_loss": -5.120677947998047, "global_step": 15736, "epoch": 374} {"train_loss": -5.071864128112793, "global_step": 15737, "epoch": 374} {"train_loss": -5.183805465698242, "global_step": 15738, "epoch": 374} {"train_loss": -5.22259521484375, "global_step": 15739, "epoch": 374} {"train_loss": -5.279340744018555, "global_step": 15740, "epoch": 374} {"train_loss": -5.086315155029297, "global_step": 15741, "epoch": 374} {"train_loss": -5.217212677001953, "global_step": 15742, "epoch": 374} {"train_loss": -5.035632133483887, "global_step": 15743, "epoch": 374} {"train_loss": -5.248437881469727, "global_step": 15744, "epoch": 374} {"train_loss": -5.185935020446777, "global_step": 15745, "epoch": 374} {"train_loss": -5.027703762054443, "global_step": 15746, "epoch": 374} {"train_loss": -5.222677707672119, "global_step": 15747, "epoch": 374} {"train_loss": -5.399905681610107, "global_step": 15748, "epoch": 374} {"train_loss": -5.147807461874826, "global_step": 15749, "epoch": 374, "val_loss": 71262.390625} {"train_loss": -5.214139461517334, "global_step": 15750, "epoch": 375} {"train_loss": -5.232900619506836, "global_step": 15751, "epoch": 375} {"train_loss": -5.241349220275879, "global_step": 15752, "epoch": 375} {"train_loss": -5.021702766418457, "global_step": 15753, "epoch": 375} {"train_loss": -5.219797134399414, "global_step": 15754, "epoch": 375} {"train_loss": -5.1013288497924805, "global_step": 15755, "epoch": 375} {"train_loss": -5.301572799682617, "global_step": 15756, "epoch": 375} {"train_loss": -5.144528388977051, "global_step": 15757, "epoch": 375} {"train_loss": -4.976707458496094, "global_step": 15758, "epoch": 375} {"train_loss": -5.131217956542969, "global_step": 15759, "epoch": 375} {"train_loss": -5.104063034057617, "global_step": 15760, "epoch": 375} {"train_loss": -5.277413368225098, "global_step": 15761, "epoch": 375} {"train_loss": -5.136567115783691, "global_step": 15762, "epoch": 375} {"train_loss": -5.159515857696533, "global_step": 15763, "epoch": 375} {"train_loss": -5.215538501739502, "global_step": 15764, "epoch": 375} {"train_loss": -5.306653022766113, "global_step": 15765, "epoch": 375} {"train_loss": -5.248327732086182, "global_step": 15766, "epoch": 375} {"train_loss": -5.359360694885254, "global_step": 15767, "epoch": 375} {"train_loss": -5.2284955978393555, "global_step": 15768, "epoch": 375} {"train_loss": -5.238162040710449, "global_step": 15769, "epoch": 375} {"train_loss": -5.358960151672363, "global_step": 15770, "epoch": 375} {"train_loss": -5.184996604919434, "global_step": 15771, "epoch": 375} {"train_loss": -5.342992782592773, "global_step": 15772, "epoch": 375} {"train_loss": -5.33210563659668, "global_step": 15773, "epoch": 375} {"train_loss": -5.320564270019531, "global_step": 15774, "epoch": 375} {"train_loss": -5.255986213684082, "global_step": 15775, "epoch": 375} {"train_loss": -5.020594596862793, "global_step": 15776, "epoch": 375} {"train_loss": -5.284188270568848, "global_step": 15777, "epoch": 375} {"train_loss": -5.222006797790527, "global_step": 15778, "epoch": 375} {"train_loss": -5.252426624298096, "global_step": 15779, "epoch": 375} {"train_loss": -5.170543670654297, "global_step": 15780, "epoch": 375} {"train_loss": -5.274009704589844, "global_step": 15781, "epoch": 375} {"train_loss": -5.334727764129639, "global_step": 15782, "epoch": 375} {"train_loss": -5.269629955291748, "global_step": 15783, "epoch": 375} {"train_loss": -5.279056072235107, "global_step": 15784, "epoch": 375} {"train_loss": -5.24503231048584, "global_step": 15785, "epoch": 375} {"train_loss": -5.252321243286133, "global_step": 15786, "epoch": 375} {"train_loss": -5.352499961853027, "global_step": 15787, "epoch": 375} {"train_loss": -5.1821746826171875, "global_step": 15788, "epoch": 375} {"train_loss": -5.2706804275512695, "global_step": 15789, "epoch": 375} {"train_loss": -5.309869766235352, "global_step": 15790, "epoch": 375} {"train_loss": -5.229778119495937, "global_step": 15791, "epoch": 375, "val_loss": 70654.1484375} {"train_loss": -5.196700096130371, "global_step": 15792, "epoch": 376} {"train_loss": -5.270119667053223, "global_step": 15793, "epoch": 376} {"train_loss": -5.229160308837891, "global_step": 15794, "epoch": 376} {"train_loss": -5.273890972137451, "global_step": 15795, "epoch": 376} {"train_loss": -5.1865129470825195, "global_step": 15796, "epoch": 376} {"train_loss": -5.249467849731445, "global_step": 15797, "epoch": 376} {"train_loss": -5.1668620109558105, "global_step": 15798, "epoch": 376} {"train_loss": -5.278886318206787, "global_step": 15799, "epoch": 376} {"train_loss": -5.327336311340332, "global_step": 15800, "epoch": 376} {"train_loss": -5.295405387878418, "global_step": 15801, "epoch": 376} {"train_loss": -5.235010147094727, "global_step": 15802, "epoch": 376} {"train_loss": -5.22686767578125, "global_step": 15803, "epoch": 376} {"train_loss": -5.310704231262207, "global_step": 15804, "epoch": 376} {"train_loss": -5.222651481628418, "global_step": 15805, "epoch": 376} {"train_loss": -5.163883209228516, "global_step": 15806, "epoch": 376} {"train_loss": -5.3060760498046875, "global_step": 15807, "epoch": 376} {"train_loss": -5.134957790374756, "global_step": 15808, "epoch": 376} {"train_loss": -5.223480224609375, "global_step": 15809, "epoch": 376} {"train_loss": -5.216414928436279, "global_step": 15810, "epoch": 376} {"train_loss": -5.17894983291626, "global_step": 15811, "epoch": 376} {"train_loss": -5.202920436859131, "global_step": 15812, "epoch": 376} {"train_loss": -4.934288024902344, "global_step": 15813, "epoch": 376} {"train_loss": -5.253252029418945, "global_step": 15814, "epoch": 376} {"train_loss": -4.945603370666504, "global_step": 15815, "epoch": 376} {"train_loss": -5.11737060546875, "global_step": 15816, "epoch": 376} {"train_loss": -5.260427474975586, "global_step": 15817, "epoch": 376} {"train_loss": -5.0909223556518555, "global_step": 15818, "epoch": 376} {"train_loss": -5.227710723876953, "global_step": 15819, "epoch": 376} {"train_loss": -5.212615966796875, "global_step": 15820, "epoch": 376} {"train_loss": -5.164836883544922, "global_step": 15821, "epoch": 376} {"train_loss": -5.176230430603027, "global_step": 15822, "epoch": 376} {"train_loss": -5.194713592529297, "global_step": 15823, "epoch": 376} {"train_loss": -5.214347839355469, "global_step": 15824, "epoch": 376} {"train_loss": -5.228198528289795, "global_step": 15825, "epoch": 376} {"train_loss": -5.23549747467041, "global_step": 15826, "epoch": 376} {"train_loss": -5.2174482345581055, "global_step": 15827, "epoch": 376} {"train_loss": -5.236172676086426, "global_step": 15828, "epoch": 376} {"train_loss": -5.133543968200684, "global_step": 15829, "epoch": 376} {"train_loss": -5.276433944702148, "global_step": 15830, "epoch": 376} {"train_loss": -5.1144914627075195, "global_step": 15831, "epoch": 376} {"train_loss": -5.212095737457275, "global_step": 15832, "epoch": 376} {"train_loss": -5.204475652603876, "global_step": 15833, "epoch": 376, "val_loss": 71115.0859375} {"train_loss": -5.370108604431152, "global_step": 15834, "epoch": 377} {"train_loss": -5.3505964279174805, "global_step": 15835, "epoch": 377} {"train_loss": -5.400577545166016, "global_step": 15836, "epoch": 377} {"train_loss": -5.22335147857666, "global_step": 15837, "epoch": 377} {"train_loss": -5.231390953063965, "global_step": 15838, "epoch": 377} {"train_loss": -5.263321876525879, "global_step": 15839, "epoch": 377} {"train_loss": -5.402177333831787, "global_step": 15840, "epoch": 377} {"train_loss": -5.237382888793945, "global_step": 15841, "epoch": 377} {"train_loss": -5.357443332672119, "global_step": 15842, "epoch": 377} {"train_loss": -5.235360145568848, "global_step": 15843, "epoch": 377} {"train_loss": -5.330329895019531, "global_step": 15844, "epoch": 377} {"train_loss": -5.23182487487793, "global_step": 15845, "epoch": 377} {"train_loss": -5.017484664916992, "global_step": 15846, "epoch": 377} {"train_loss": -5.155005931854248, "global_step": 15847, "epoch": 377} {"train_loss": -5.195075988769531, "global_step": 15848, "epoch": 377} {"train_loss": -5.304844379425049, "global_step": 15849, "epoch": 377} {"train_loss": -5.060251712799072, "global_step": 15850, "epoch": 377} {"train_loss": -5.226739406585693, "global_step": 15851, "epoch": 377} {"train_loss": -5.205502033233643, "global_step": 15852, "epoch": 377} {"train_loss": -5.230267524719238, "global_step": 15853, "epoch": 377} {"train_loss": -5.203815937042236, "global_step": 15854, "epoch": 377} {"train_loss": -5.162993907928467, "global_step": 15855, "epoch": 377} {"train_loss": -5.294683933258057, "global_step": 15856, "epoch": 377} {"train_loss": -5.039020538330078, "global_step": 15857, "epoch": 377} {"train_loss": -5.27170991897583, "global_step": 15858, "epoch": 377} {"train_loss": -5.187540054321289, "global_step": 15859, "epoch": 377} {"train_loss": -5.153932571411133, "global_step": 15860, "epoch": 377} {"train_loss": -5.302438735961914, "global_step": 15861, "epoch": 377} {"train_loss": -5.2298102378845215, "global_step": 15862, "epoch": 377} {"train_loss": -5.172331809997559, "global_step": 15863, "epoch": 377} {"train_loss": -5.283043384552002, "global_step": 15864, "epoch": 377} {"train_loss": -5.269862651824951, "global_step": 15865, "epoch": 377} {"train_loss": -5.10472297668457, "global_step": 15866, "epoch": 377} {"train_loss": -5.327492713928223, "global_step": 15867, "epoch": 377} {"train_loss": -5.1957106590271, "global_step": 15868, "epoch": 377} {"train_loss": -5.071367263793945, "global_step": 15869, "epoch": 377} {"train_loss": -5.316001892089844, "global_step": 15870, "epoch": 377} {"train_loss": -5.251877307891846, "global_step": 15871, "epoch": 377} {"train_loss": -5.126431465148926, "global_step": 15872, "epoch": 377} {"train_loss": -5.3146796226501465, "global_step": 15873, "epoch": 377} {"train_loss": -5.174398899078369, "global_step": 15874, "epoch": 377} {"train_loss": -5.229822771889823, "global_step": 15875, "epoch": 377, "val_loss": 70989.921875} {"train_loss": -5.238459587097168, "global_step": 15876, "epoch": 378} {"train_loss": -5.0753278732299805, "global_step": 15877, "epoch": 378} {"train_loss": -5.209036827087402, "global_step": 15878, "epoch": 378} {"train_loss": -5.18251895904541, "global_step": 15879, "epoch": 378} {"train_loss": -5.180893898010254, "global_step": 15880, "epoch": 378} {"train_loss": -5.097036361694336, "global_step": 15881, "epoch": 378} {"train_loss": -5.143633842468262, "global_step": 15882, "epoch": 378} {"train_loss": -5.290151596069336, "global_step": 15883, "epoch": 378} {"train_loss": -5.104315280914307, "global_step": 15884, "epoch": 378} {"train_loss": -5.251265525817871, "global_step": 15885, "epoch": 378} {"train_loss": -5.228124141693115, "global_step": 15886, "epoch": 378} {"train_loss": -5.175575256347656, "global_step": 15887, "epoch": 378} {"train_loss": -5.341116905212402, "global_step": 15888, "epoch": 378} {"train_loss": -5.181189060211182, "global_step": 15889, "epoch": 378} {"train_loss": -5.204184532165527, "global_step": 15890, "epoch": 378} {"train_loss": -5.150692462921143, "global_step": 15891, "epoch": 378} {"train_loss": -5.128396034240723, "global_step": 15892, "epoch": 378} {"train_loss": -5.07747745513916, "global_step": 15893, "epoch": 378} {"train_loss": -5.171982765197754, "global_step": 15894, "epoch": 378} {"train_loss": -5.252718925476074, "global_step": 15895, "epoch": 378} {"train_loss": -5.24557638168335, "global_step": 15896, "epoch": 378} {"train_loss": -5.187644004821777, "global_step": 15897, "epoch": 378} {"train_loss": -5.3511152267456055, "global_step": 15898, "epoch": 378} {"train_loss": -5.359635829925537, "global_step": 15899, "epoch": 378} {"train_loss": -5.2728471755981445, "global_step": 15900, "epoch": 378} {"train_loss": -5.308774948120117, "global_step": 15901, "epoch": 378} {"train_loss": -5.229410171508789, "global_step": 15902, "epoch": 378} {"train_loss": -5.173174858093262, "global_step": 15903, "epoch": 378} {"train_loss": -5.225751876831055, "global_step": 15904, "epoch": 378} {"train_loss": -5.275188446044922, "global_step": 15905, "epoch": 378} {"train_loss": -5.0402021408081055, "global_step": 15906, "epoch": 378} {"train_loss": -5.264801025390625, "global_step": 15907, "epoch": 378} {"train_loss": -5.220979690551758, "global_step": 15908, "epoch": 378} {"train_loss": -5.041726112365723, "global_step": 15909, "epoch": 378} {"train_loss": -5.184208869934082, "global_step": 15910, "epoch": 378} {"train_loss": -5.267313003540039, "global_step": 15911, "epoch": 378} {"train_loss": -5.218420028686523, "global_step": 15912, "epoch": 378} {"train_loss": -5.292978763580322, "global_step": 15913, "epoch": 378} {"train_loss": -5.111667633056641, "global_step": 15914, "epoch": 378} {"train_loss": -5.296204566955566, "global_step": 15915, "epoch": 378} {"train_loss": -5.082560062408447, "global_step": 15916, "epoch": 378} {"train_loss": -5.202391488211496, "global_step": 15917, "epoch": 378, "val_loss": 70963.828125} {"train_loss": -5.233491897583008, "global_step": 15918, "epoch": 379} {"train_loss": -5.193225860595703, "global_step": 15919, "epoch": 379} {"train_loss": -5.291689872741699, "global_step": 15920, "epoch": 379} {"train_loss": -5.372861385345459, "global_step": 15921, "epoch": 379} {"train_loss": -5.283120632171631, "global_step": 15922, "epoch": 379} {"train_loss": -5.312114238739014, "global_step": 15923, "epoch": 379} {"train_loss": -5.308548450469971, "global_step": 15924, "epoch": 379} {"train_loss": -5.2970805168151855, "global_step": 15925, "epoch": 379} {"train_loss": -5.387025833129883, "global_step": 15926, "epoch": 379} {"train_loss": -5.317120552062988, "global_step": 15927, "epoch": 379} {"train_loss": -5.221338748931885, "global_step": 15928, "epoch": 379} {"train_loss": -5.240602970123291, "global_step": 15929, "epoch": 379} {"train_loss": -5.224465370178223, "global_step": 15930, "epoch": 379} {"train_loss": -5.197492599487305, "global_step": 15931, "epoch": 379} {"train_loss": -5.199470520019531, "global_step": 15932, "epoch": 379} {"train_loss": -5.303715705871582, "global_step": 15933, "epoch": 379} {"train_loss": -5.185922622680664, "global_step": 15934, "epoch": 379} {"train_loss": -5.154119491577148, "global_step": 15935, "epoch": 379} {"train_loss": -5.212668418884277, "global_step": 15936, "epoch": 379} {"train_loss": -5.251274108886719, "global_step": 15937, "epoch": 379} {"train_loss": -5.181857109069824, "global_step": 15938, "epoch": 379} {"train_loss": -5.344625473022461, "global_step": 15939, "epoch": 379} {"train_loss": -5.127087116241455, "global_step": 15940, "epoch": 379} {"train_loss": -5.145526885986328, "global_step": 15941, "epoch": 379} {"train_loss": -5.209149360656738, "global_step": 15942, "epoch": 379} {"train_loss": -5.1720709800720215, "global_step": 15943, "epoch": 379} {"train_loss": -5.2770795822143555, "global_step": 15944, "epoch": 379} {"train_loss": -5.156268119812012, "global_step": 15945, "epoch": 379} {"train_loss": -5.1199235916137695, "global_step": 15946, "epoch": 379} {"train_loss": -5.201480865478516, "global_step": 15947, "epoch": 379} {"train_loss": -5.318584442138672, "global_step": 15948, "epoch": 379} {"train_loss": -5.141120910644531, "global_step": 15949, "epoch": 379} {"train_loss": -5.24725341796875, "global_step": 15950, "epoch": 379} {"train_loss": -5.239904403686523, "global_step": 15951, "epoch": 379} {"train_loss": -5.210721492767334, "global_step": 15952, "epoch": 379} {"train_loss": -5.2851667404174805, "global_step": 15953, "epoch": 379} {"train_loss": -5.331681251525879, "global_step": 15954, "epoch": 379} {"train_loss": -5.235721588134766, "global_step": 15955, "epoch": 379} {"train_loss": -5.1086745262146, "global_step": 15956, "epoch": 379} {"train_loss": -5.257929801940918, "global_step": 15957, "epoch": 379} {"train_loss": -5.2063398361206055, "global_step": 15958, "epoch": 379} {"train_loss": -5.237912552697318, "global_step": 15959, "epoch": 379, "val_loss": 70678.1640625} {"train_loss": -5.294801235198975, "global_step": 15960, "epoch": 380} {"train_loss": -5.271991729736328, "global_step": 15961, "epoch": 380} {"train_loss": -5.269773960113525, "global_step": 15962, "epoch": 380} {"train_loss": -5.29170036315918, "global_step": 15963, "epoch": 380} {"train_loss": -5.350172519683838, "global_step": 15964, "epoch": 380} {"train_loss": -5.2279462814331055, "global_step": 15965, "epoch": 380} {"train_loss": -5.321406841278076, "global_step": 15966, "epoch": 380} {"train_loss": -5.2877655029296875, "global_step": 15967, "epoch": 380} {"train_loss": -5.247920036315918, "global_step": 15968, "epoch": 380} {"train_loss": -5.301657676696777, "global_step": 15969, "epoch": 380} {"train_loss": -5.188950538635254, "global_step": 15970, "epoch": 380} {"train_loss": -5.395651817321777, "global_step": 15971, "epoch": 380} {"train_loss": -5.127196311950684, "global_step": 15972, "epoch": 380} {"train_loss": -5.309380531311035, "global_step": 15973, "epoch": 380} {"train_loss": -5.196596145629883, "global_step": 15974, "epoch": 380} {"train_loss": -5.23917293548584, "global_step": 15975, "epoch": 380} {"train_loss": -5.125238418579102, "global_step": 15976, "epoch": 380} {"train_loss": -5.218186855316162, "global_step": 15977, "epoch": 380} {"train_loss": -5.160181999206543, "global_step": 15978, "epoch": 380} {"train_loss": -5.268293380737305, "global_step": 15979, "epoch": 380} {"train_loss": -5.2692179679870605, "global_step": 15980, "epoch": 380} {"train_loss": -5.253540992736816, "global_step": 15981, "epoch": 380} {"train_loss": -5.205466270446777, "global_step": 15982, "epoch": 380} {"train_loss": -5.310883045196533, "global_step": 15983, "epoch": 380} {"train_loss": -5.341089725494385, "global_step": 15984, "epoch": 380} {"train_loss": -5.151862621307373, "global_step": 15985, "epoch": 380} {"train_loss": -5.133997917175293, "global_step": 15986, "epoch": 380} {"train_loss": -5.302550315856934, "global_step": 15987, "epoch": 380} {"train_loss": -5.140665054321289, "global_step": 15988, "epoch": 380} {"train_loss": -5.219048500061035, "global_step": 15989, "epoch": 380} {"train_loss": -5.099414825439453, "global_step": 15990, "epoch": 380} {"train_loss": -5.270902156829834, "global_step": 15991, "epoch": 380} {"train_loss": -5.158533096313477, "global_step": 15992, "epoch": 380} {"train_loss": -5.259264945983887, "global_step": 15993, "epoch": 380} {"train_loss": -5.1612324714660645, "global_step": 15994, "epoch": 380} {"train_loss": -5.287114143371582, "global_step": 15995, "epoch": 380} {"train_loss": -5.267292022705078, "global_step": 15996, "epoch": 380} {"train_loss": -5.073105812072754, "global_step": 15997, "epoch": 380} {"train_loss": -5.33763313293457, "global_step": 15998, "epoch": 380} {"train_loss": -5.251666069030762, "global_step": 15999, "epoch": 380} {"train_loss": -5.252360820770264, "global_step": 16000, "epoch": 380} {"train_loss": -5.2381181035723, "global_step": 16001, "epoch": 380, "val_loss": 70589.328125} {"train_loss": -5.306405544281006, "global_step": 16002, "epoch": 381} {"train_loss": -5.205650329589844, "global_step": 16003, "epoch": 381} {"train_loss": -5.345726013183594, "global_step": 16004, "epoch": 381} {"train_loss": -5.227753639221191, "global_step": 16005, "epoch": 381} {"train_loss": -5.30157995223999, "global_step": 16006, "epoch": 381} {"train_loss": -5.206610202789307, "global_step": 16007, "epoch": 381} {"train_loss": -5.211686611175537, "global_step": 16008, "epoch": 381} {"train_loss": -5.355338096618652, "global_step": 16009, "epoch": 381} {"train_loss": -5.208870887756348, "global_step": 16010, "epoch": 381} {"train_loss": -5.131278991699219, "global_step": 16011, "epoch": 381} {"train_loss": -5.142564296722412, "global_step": 16012, "epoch": 381} {"train_loss": -5.138195514678955, "global_step": 16013, "epoch": 381} {"train_loss": -5.230902671813965, "global_step": 16014, "epoch": 381} {"train_loss": -5.194005966186523, "global_step": 16015, "epoch": 381} {"train_loss": -5.169671058654785, "global_step": 16016, "epoch": 381} {"train_loss": -5.122742652893066, "global_step": 16017, "epoch": 381} {"train_loss": -5.346103191375732, "global_step": 16018, "epoch": 381} {"train_loss": -5.165500640869141, "global_step": 16019, "epoch": 381} {"train_loss": -5.245050430297852, "global_step": 16020, "epoch": 381} {"train_loss": -5.252338886260986, "global_step": 16021, "epoch": 381} {"train_loss": -5.10308837890625, "global_step": 16022, "epoch": 381} {"train_loss": -5.224098205566406, "global_step": 16023, "epoch": 381} {"train_loss": -5.2932353019714355, "global_step": 16024, "epoch": 381} {"train_loss": -5.09716272354126, "global_step": 16025, "epoch": 381} {"train_loss": -5.254362106323242, "global_step": 16026, "epoch": 381} {"train_loss": -5.198356628417969, "global_step": 16027, "epoch": 381} {"train_loss": -5.260302543640137, "global_step": 16028, "epoch": 381} {"train_loss": -5.274481773376465, "global_step": 16029, "epoch": 381} {"train_loss": -5.294102668762207, "global_step": 16030, "epoch": 381} {"train_loss": -5.240470886230469, "global_step": 16031, "epoch": 381} {"train_loss": -5.171764373779297, "global_step": 16032, "epoch": 381} {"train_loss": -5.165922164916992, "global_step": 16033, "epoch": 381} {"train_loss": -5.285475254058838, "global_step": 16034, "epoch": 381} {"train_loss": -5.3124494552612305, "global_step": 16035, "epoch": 381} {"train_loss": -5.206492900848389, "global_step": 16036, "epoch": 381} {"train_loss": -5.2039313316345215, "global_step": 16037, "epoch": 381} {"train_loss": -5.253082275390625, "global_step": 16038, "epoch": 381} {"train_loss": -5.265403747558594, "global_step": 16039, "epoch": 381} {"train_loss": -5.354447841644287, "global_step": 16040, "epoch": 381} {"train_loss": -5.314793586730957, "global_step": 16041, "epoch": 381} {"train_loss": -5.379733085632324, "global_step": 16042, "epoch": 381} {"train_loss": -5.235554411297753, "global_step": 16043, "epoch": 381, "val_loss": 70955.109375} {"train_loss": -5.39974308013916, "global_step": 16044, "epoch": 382} {"train_loss": -5.275580883026123, "global_step": 16045, "epoch": 382} {"train_loss": -5.1859283447265625, "global_step": 16046, "epoch": 382} {"train_loss": -5.288248062133789, "global_step": 16047, "epoch": 382} {"train_loss": -5.3087005615234375, "global_step": 16048, "epoch": 382} {"train_loss": -5.346132278442383, "global_step": 16049, "epoch": 382} {"train_loss": -5.249755859375, "global_step": 16050, "epoch": 382} {"train_loss": -5.1796770095825195, "global_step": 16051, "epoch": 382} {"train_loss": -5.195310592651367, "global_step": 16052, "epoch": 382} {"train_loss": -5.204926490783691, "global_step": 16053, "epoch": 382} {"train_loss": -5.05313777923584, "global_step": 16054, "epoch": 382} {"train_loss": -5.251713752746582, "global_step": 16055, "epoch": 382} {"train_loss": -5.234434127807617, "global_step": 16056, "epoch": 382} {"train_loss": -5.181441783905029, "global_step": 16057, "epoch": 382} {"train_loss": -5.303860664367676, "global_step": 16058, "epoch": 382} {"train_loss": -5.2567877769470215, "global_step": 16059, "epoch": 382} {"train_loss": -5.179269313812256, "global_step": 16060, "epoch": 382} {"train_loss": -5.173698425292969, "global_step": 16061, "epoch": 382} {"train_loss": -5.302238464355469, "global_step": 16062, "epoch": 382} {"train_loss": -5.137872219085693, "global_step": 16063, "epoch": 382} {"train_loss": -5.17140007019043, "global_step": 16064, "epoch": 382} {"train_loss": -5.392195224761963, "global_step": 16065, "epoch": 382} {"train_loss": -5.194672584533691, "global_step": 16066, "epoch": 382} {"train_loss": -5.280129432678223, "global_step": 16067, "epoch": 382} {"train_loss": -5.263179779052734, "global_step": 16068, "epoch": 382} {"train_loss": -5.233415603637695, "global_step": 16069, "epoch": 382} {"train_loss": -5.194845199584961, "global_step": 16070, "epoch": 382} {"train_loss": -5.276699066162109, "global_step": 16071, "epoch": 382} {"train_loss": -5.330618858337402, "global_step": 16072, "epoch": 382} {"train_loss": -5.197489261627197, "global_step": 16073, "epoch": 382} {"train_loss": -5.188476085662842, "global_step": 16074, "epoch": 382} {"train_loss": -5.322591781616211, "global_step": 16075, "epoch": 382} {"train_loss": -5.2151384353637695, "global_step": 16076, "epoch": 382} {"train_loss": -5.293056488037109, "global_step": 16077, "epoch": 382} {"train_loss": -5.2516326904296875, "global_step": 16078, "epoch": 382} {"train_loss": -5.301353931427002, "global_step": 16079, "epoch": 382} {"train_loss": -5.324365615844727, "global_step": 16080, "epoch": 382} {"train_loss": -5.298995018005371, "global_step": 16081, "epoch": 382} {"train_loss": -5.1422319412231445, "global_step": 16082, "epoch": 382} {"train_loss": -5.096528053283691, "global_step": 16083, "epoch": 382} {"train_loss": -5.179788589477539, "global_step": 16084, "epoch": 382} {"train_loss": -5.240173986979893, "global_step": 16085, "epoch": 382, "val_loss": 70586.234375} {"train_loss": -5.284950256347656, "global_step": 16086, "epoch": 383} {"train_loss": -5.268301963806152, "global_step": 16087, "epoch": 383} {"train_loss": -5.1699371337890625, "global_step": 16088, "epoch": 383} {"train_loss": -5.086719512939453, "global_step": 16089, "epoch": 383} {"train_loss": -5.351316928863525, "global_step": 16090, "epoch": 383} {"train_loss": -5.163420677185059, "global_step": 16091, "epoch": 383} {"train_loss": -5.238696098327637, "global_step": 16092, "epoch": 383} {"train_loss": -5.273017883300781, "global_step": 16093, "epoch": 383} {"train_loss": -5.172535419464111, "global_step": 16094, "epoch": 383} {"train_loss": -5.153995990753174, "global_step": 16095, "epoch": 383} {"train_loss": -5.282726764678955, "global_step": 16096, "epoch": 383} {"train_loss": -5.2943572998046875, "global_step": 16097, "epoch": 383} {"train_loss": -5.21694278717041, "global_step": 16098, "epoch": 383} {"train_loss": -5.254812240600586, "global_step": 16099, "epoch": 383} {"train_loss": -5.268468856811523, "global_step": 16100, "epoch": 383} {"train_loss": -5.255734443664551, "global_step": 16101, "epoch": 383} {"train_loss": -5.298575401306152, "global_step": 16102, "epoch": 383} {"train_loss": -5.129708290100098, "global_step": 16103, "epoch": 383} {"train_loss": -5.058294296264648, "global_step": 16104, "epoch": 383} {"train_loss": -5.1986541748046875, "global_step": 16105, "epoch": 383} {"train_loss": -5.253866672515869, "global_step": 16106, "epoch": 383} {"train_loss": -5.305110931396484, "global_step": 16107, "epoch": 383} {"train_loss": -5.148153781890869, "global_step": 16108, "epoch": 383} {"train_loss": -5.200955390930176, "global_step": 16109, "epoch": 383} {"train_loss": -5.270478248596191, "global_step": 16110, "epoch": 383} {"train_loss": -5.321671485900879, "global_step": 16111, "epoch": 383} {"train_loss": -5.30582332611084, "global_step": 16112, "epoch": 383} {"train_loss": -5.096663951873779, "global_step": 16113, "epoch": 383} {"train_loss": -5.266407012939453, "global_step": 16114, "epoch": 383} {"train_loss": -5.120155334472656, "global_step": 16115, "epoch": 383} {"train_loss": -5.342376232147217, "global_step": 16116, "epoch": 383} {"train_loss": -5.150644302368164, "global_step": 16117, "epoch": 383} {"train_loss": -5.297865867614746, "global_step": 16118, "epoch": 383} {"train_loss": -5.190917491912842, "global_step": 16119, "epoch": 383} {"train_loss": -5.214776039123535, "global_step": 16120, "epoch": 383} {"train_loss": -5.226485252380371, "global_step": 16121, "epoch": 383} {"train_loss": -5.2638750076293945, "global_step": 16122, "epoch": 383} {"train_loss": -5.184311866760254, "global_step": 16123, "epoch": 383} {"train_loss": -5.276341438293457, "global_step": 16124, "epoch": 383} {"train_loss": -5.3490753173828125, "global_step": 16125, "epoch": 383} {"train_loss": -5.172907829284668, "global_step": 16126, "epoch": 383} {"train_loss": -5.228695460728237, "global_step": 16127, "epoch": 383, "val_loss": 71082.8359375} {"train_loss": -5.142280578613281, "global_step": 16128, "epoch": 384} {"train_loss": -5.086872100830078, "global_step": 16129, "epoch": 384} {"train_loss": -5.290799617767334, "global_step": 16130, "epoch": 384} {"train_loss": -5.2696027755737305, "global_step": 16131, "epoch": 384} {"train_loss": -5.314768314361572, "global_step": 16132, "epoch": 384} {"train_loss": -5.320342063903809, "global_step": 16133, "epoch": 384} {"train_loss": -5.219306468963623, "global_step": 16134, "epoch": 384} {"train_loss": -5.116214752197266, "global_step": 16135, "epoch": 384} {"train_loss": -5.2803425788879395, "global_step": 16136, "epoch": 384} {"train_loss": -5.351410865783691, "global_step": 16137, "epoch": 384} {"train_loss": -5.216882705688477, "global_step": 16138, "epoch": 384} {"train_loss": -5.278845310211182, "global_step": 16139, "epoch": 384} {"train_loss": -5.279632568359375, "global_step": 16140, "epoch": 384} {"train_loss": -5.177097320556641, "global_step": 16141, "epoch": 384} {"train_loss": -5.012802600860596, "global_step": 16142, "epoch": 384} {"train_loss": -5.178514003753662, "global_step": 16143, "epoch": 384} {"train_loss": -5.302496433258057, "global_step": 16144, "epoch": 384} {"train_loss": -5.127837181091309, "global_step": 16145, "epoch": 384} {"train_loss": -5.240985870361328, "global_step": 16146, "epoch": 384} {"train_loss": -5.244204521179199, "global_step": 16147, "epoch": 384} {"train_loss": -5.138034343719482, "global_step": 16148, "epoch": 384} {"train_loss": -5.200165271759033, "global_step": 16149, "epoch": 384} {"train_loss": -5.2426910400390625, "global_step": 16150, "epoch": 384} {"train_loss": -5.2725725173950195, "global_step": 16151, "epoch": 384} {"train_loss": -5.160730361938477, "global_step": 16152, "epoch": 384} {"train_loss": -5.3956685066223145, "global_step": 16153, "epoch": 384} {"train_loss": -5.20399808883667, "global_step": 16154, "epoch": 384} {"train_loss": -5.166962146759033, "global_step": 16155, "epoch": 384} {"train_loss": -5.386521339416504, "global_step": 16156, "epoch": 384} {"train_loss": -5.314267158508301, "global_step": 16157, "epoch": 384} {"train_loss": -5.193569660186768, "global_step": 16158, "epoch": 384} {"train_loss": -5.220609664916992, "global_step": 16159, "epoch": 384} {"train_loss": -5.353438377380371, "global_step": 16160, "epoch": 384} {"train_loss": -5.3380126953125, "global_step": 16161, "epoch": 384} {"train_loss": -5.142136096954346, "global_step": 16162, "epoch": 384} {"train_loss": -5.293570041656494, "global_step": 16163, "epoch": 384} {"train_loss": -5.396055221557617, "global_step": 16164, "epoch": 384} {"train_loss": -5.136338710784912, "global_step": 16165, "epoch": 384} {"train_loss": -5.251959323883057, "global_step": 16166, "epoch": 384} {"train_loss": -5.280468940734863, "global_step": 16167, "epoch": 384} {"train_loss": -5.337018966674805, "global_step": 16168, "epoch": 384} {"train_loss": -5.242384013675508, "global_step": 16169, "epoch": 384, "val_loss": 70436.140625} {"train_loss": -5.2856597900390625, "global_step": 16170, "epoch": 385} {"train_loss": -5.251566410064697, "global_step": 16171, "epoch": 385} {"train_loss": -5.367419242858887, "global_step": 16172, "epoch": 385} {"train_loss": -5.266950607299805, "global_step": 16173, "epoch": 385} {"train_loss": -5.326991558074951, "global_step": 16174, "epoch": 385} {"train_loss": -5.250551700592041, "global_step": 16175, "epoch": 385} {"train_loss": -5.371203422546387, "global_step": 16176, "epoch": 385} {"train_loss": -5.184123992919922, "global_step": 16177, "epoch": 385} {"train_loss": -5.221614837646484, "global_step": 16178, "epoch": 385} {"train_loss": -5.214278221130371, "global_step": 16179, "epoch": 385} {"train_loss": -5.184191703796387, "global_step": 16180, "epoch": 385} {"train_loss": -5.11653995513916, "global_step": 16181, "epoch": 385} {"train_loss": -5.298481464385986, "global_step": 16182, "epoch": 385} {"train_loss": -5.203730583190918, "global_step": 16183, "epoch": 385} {"train_loss": -5.135005950927734, "global_step": 16184, "epoch": 385} {"train_loss": -5.3505096435546875, "global_step": 16185, "epoch": 385} {"train_loss": -5.184372901916504, "global_step": 16186, "epoch": 385} {"train_loss": -5.075278282165527, "global_step": 16187, "epoch": 385} {"train_loss": -5.200366497039795, "global_step": 16188, "epoch": 385} {"train_loss": -5.3192362785339355, "global_step": 16189, "epoch": 385} {"train_loss": -5.067590713500977, "global_step": 16190, "epoch": 385} {"train_loss": -5.17213773727417, "global_step": 16191, "epoch": 385} {"train_loss": -5.4408087730407715, "global_step": 16192, "epoch": 385} {"train_loss": -5.312812805175781, "global_step": 16193, "epoch": 385} {"train_loss": -5.34833288192749, "global_step": 16194, "epoch": 385} {"train_loss": -5.212543487548828, "global_step": 16195, "epoch": 385} {"train_loss": -5.103029727935791, "global_step": 16196, "epoch": 385} {"train_loss": -5.133728981018066, "global_step": 16197, "epoch": 385} {"train_loss": -5.265414714813232, "global_step": 16198, "epoch": 385} {"train_loss": -5.328498840332031, "global_step": 16199, "epoch": 385} {"train_loss": -5.222559928894043, "global_step": 16200, "epoch": 385} {"train_loss": -5.262505054473877, "global_step": 16201, "epoch": 385} {"train_loss": -5.195857048034668, "global_step": 16202, "epoch": 385} {"train_loss": -5.31282377243042, "global_step": 16203, "epoch": 385} {"train_loss": -5.165717124938965, "global_step": 16204, "epoch": 385} {"train_loss": -5.246915817260742, "global_step": 16205, "epoch": 385} {"train_loss": -5.275651454925537, "global_step": 16206, "epoch": 385} {"train_loss": -5.325123310089111, "global_step": 16207, "epoch": 385} {"train_loss": -5.266356468200684, "global_step": 16208, "epoch": 385} {"train_loss": -5.282306671142578, "global_step": 16209, "epoch": 385} {"train_loss": -5.151088714599609, "global_step": 16210, "epoch": 385} {"train_loss": -5.244519903546288, "global_step": 16211, "epoch": 385, "val_loss": 70379.5703125} {"train_loss": -5.17978572845459, "global_step": 16212, "epoch": 386} {"train_loss": -5.203132152557373, "global_step": 16213, "epoch": 386} {"train_loss": -5.338305473327637, "global_step": 16214, "epoch": 386} {"train_loss": -5.209079742431641, "global_step": 16215, "epoch": 386} {"train_loss": -5.218409538269043, "global_step": 16216, "epoch": 386} {"train_loss": -5.185472011566162, "global_step": 16217, "epoch": 386} {"train_loss": -5.319272041320801, "global_step": 16218, "epoch": 386} {"train_loss": -5.320686340332031, "global_step": 16219, "epoch": 386} {"train_loss": -5.247676372528076, "global_step": 16220, "epoch": 386} {"train_loss": -4.973942756652832, "global_step": 16221, "epoch": 386} {"train_loss": -5.354467868804932, "global_step": 16222, "epoch": 386} {"train_loss": -5.350133895874023, "global_step": 16223, "epoch": 386} {"train_loss": -5.300356864929199, "global_step": 16224, "epoch": 386} {"train_loss": -5.3468122482299805, "global_step": 16225, "epoch": 386} {"train_loss": -5.220078945159912, "global_step": 16226, "epoch": 386} {"train_loss": -5.217214107513428, "global_step": 16227, "epoch": 386} {"train_loss": -5.231164455413818, "global_step": 16228, "epoch": 386} {"train_loss": -5.153526782989502, "global_step": 16229, "epoch": 386} {"train_loss": -5.35600471496582, "global_step": 16230, "epoch": 386} {"train_loss": -5.282984256744385, "global_step": 16231, "epoch": 386} {"train_loss": -5.095659255981445, "global_step": 16232, "epoch": 386} {"train_loss": -5.2568817138671875, "global_step": 16233, "epoch": 386} {"train_loss": -5.157960891723633, "global_step": 16234, "epoch": 386} {"train_loss": -5.332531929016113, "global_step": 16235, "epoch": 386} {"train_loss": -5.303297996520996, "global_step": 16236, "epoch": 386} {"train_loss": -5.205420970916748, "global_step": 16237, "epoch": 386} {"train_loss": -5.165656089782715, "global_step": 16238, "epoch": 386} {"train_loss": -5.271430969238281, "global_step": 16239, "epoch": 386} {"train_loss": -4.990349769592285, "global_step": 16240, "epoch": 386} {"train_loss": -5.242182731628418, "global_step": 16241, "epoch": 386} {"train_loss": -5.250521183013916, "global_step": 16242, "epoch": 386} {"train_loss": -5.171875, "global_step": 16243, "epoch": 386} {"train_loss": -5.074008941650391, "global_step": 16244, "epoch": 386} {"train_loss": -5.038488388061523, "global_step": 16245, "epoch": 386} {"train_loss": -5.2231364250183105, "global_step": 16246, "epoch": 386} {"train_loss": -5.195740222930908, "global_step": 16247, "epoch": 386} {"train_loss": -5.078360557556152, "global_step": 16248, "epoch": 386} {"train_loss": -5.3205108642578125, "global_step": 16249, "epoch": 386} {"train_loss": -5.084277153015137, "global_step": 16250, "epoch": 386} {"train_loss": -5.143184185028076, "global_step": 16251, "epoch": 386} {"train_loss": -5.216510772705078, "global_step": 16252, "epoch": 386} {"train_loss": -5.211652097247896, "global_step": 16253, "epoch": 386, "val_loss": 70842.53125} {"train_loss": -5.237086296081543, "global_step": 16254, "epoch": 387} {"train_loss": -5.139453887939453, "global_step": 16255, "epoch": 387} {"train_loss": -5.254833221435547, "global_step": 16256, "epoch": 387} {"train_loss": -5.154593467712402, "global_step": 16257, "epoch": 387} {"train_loss": -5.243783950805664, "global_step": 16258, "epoch": 387} {"train_loss": -5.253930568695068, "global_step": 16259, "epoch": 387} {"train_loss": -5.298329830169678, "global_step": 16260, "epoch": 387} {"train_loss": -5.377474784851074, "global_step": 16261, "epoch": 387} {"train_loss": -5.130868911743164, "global_step": 16262, "epoch": 387} {"train_loss": -5.318553924560547, "global_step": 16263, "epoch": 387} {"train_loss": -5.3266215324401855, "global_step": 16264, "epoch": 387} {"train_loss": -5.277998924255371, "global_step": 16265, "epoch": 387} {"train_loss": -5.268359184265137, "global_step": 16266, "epoch": 387} {"train_loss": -5.2213568687438965, "global_step": 16267, "epoch": 387} {"train_loss": -5.238853454589844, "global_step": 16268, "epoch": 387} {"train_loss": -5.3516130447387695, "global_step": 16269, "epoch": 387} {"train_loss": -5.2455596923828125, "global_step": 16270, "epoch": 387} {"train_loss": -5.245354652404785, "global_step": 16271, "epoch": 387} {"train_loss": -5.347079753875732, "global_step": 16272, "epoch": 387} {"train_loss": -5.183862686157227, "global_step": 16273, "epoch": 387} {"train_loss": -5.284786224365234, "global_step": 16274, "epoch": 387} {"train_loss": -5.345727443695068, "global_step": 16275, "epoch": 387} {"train_loss": -5.1424560546875, "global_step": 16276, "epoch": 387} {"train_loss": -5.111298561096191, "global_step": 16277, "epoch": 387} {"train_loss": -5.097628593444824, "global_step": 16278, "epoch": 387} {"train_loss": -5.195928573608398, "global_step": 16279, "epoch": 387} {"train_loss": -5.267434597015381, "global_step": 16280, "epoch": 387} {"train_loss": -5.153097629547119, "global_step": 16281, "epoch": 387} {"train_loss": -5.178795337677002, "global_step": 16282, "epoch": 387} {"train_loss": -5.127013683319092, "global_step": 16283, "epoch": 387} {"train_loss": -5.109635353088379, "global_step": 16284, "epoch": 387} {"train_loss": -5.203843116760254, "global_step": 16285, "epoch": 387} {"train_loss": -5.121241569519043, "global_step": 16286, "epoch": 387} {"train_loss": -5.181736946105957, "global_step": 16287, "epoch": 387} {"train_loss": -5.112124919891357, "global_step": 16288, "epoch": 387} {"train_loss": -5.191703796386719, "global_step": 16289, "epoch": 387} {"train_loss": -5.1270012855529785, "global_step": 16290, "epoch": 387} {"train_loss": -5.208242893218994, "global_step": 16291, "epoch": 387} {"train_loss": -5.209743499755859, "global_step": 16292, "epoch": 387} {"train_loss": -5.418091773986816, "global_step": 16293, "epoch": 387} {"train_loss": -5.108139991760254, "global_step": 16294, "epoch": 387} {"train_loss": -5.219878525961013, "global_step": 16295, "epoch": 387, "val_loss": 71780.0546875} {"train_loss": -5.024728298187256, "global_step": 16296, "epoch": 388} {"train_loss": -5.164427757263184, "global_step": 16297, "epoch": 388} {"train_loss": -5.125287055969238, "global_step": 16298, "epoch": 388} {"train_loss": -5.157238006591797, "global_step": 16299, "epoch": 388} {"train_loss": -5.222380638122559, "global_step": 16300, "epoch": 388} {"train_loss": -5.181302070617676, "global_step": 16301, "epoch": 388} {"train_loss": -5.134825706481934, "global_step": 16302, "epoch": 388} {"train_loss": -5.320591449737549, "global_step": 16303, "epoch": 388} {"train_loss": -5.063030242919922, "global_step": 16304, "epoch": 388} {"train_loss": -5.134294033050537, "global_step": 16305, "epoch": 388} {"train_loss": -5.066184997558594, "global_step": 16306, "epoch": 388} {"train_loss": -5.2354416847229, "global_step": 16307, "epoch": 388} {"train_loss": -5.295126914978027, "global_step": 16308, "epoch": 388} {"train_loss": -5.125472068786621, "global_step": 16309, "epoch": 388} {"train_loss": -5.249835968017578, "global_step": 16310, "epoch": 388} {"train_loss": -5.134140491485596, "global_step": 16311, "epoch": 388} {"train_loss": -5.206301689147949, "global_step": 16312, "epoch": 388} {"train_loss": -4.918962001800537, "global_step": 16313, "epoch": 388} {"train_loss": -5.2532477378845215, "global_step": 16314, "epoch": 388} {"train_loss": -5.505035400390625, "global_step": 16315, "epoch": 388} {"train_loss": -5.1201910972595215, "global_step": 16316, "epoch": 388} {"train_loss": -5.239951133728027, "global_step": 16317, "epoch": 388} {"train_loss": -5.240359306335449, "global_step": 16318, "epoch": 388} {"train_loss": -5.123726844787598, "global_step": 16319, "epoch": 388} {"train_loss": -5.260682106018066, "global_step": 16320, "epoch": 388} {"train_loss": -5.231326103210449, "global_step": 16321, "epoch": 388} {"train_loss": -5.224388122558594, "global_step": 16322, "epoch": 388} {"train_loss": -5.321548938751221, "global_step": 16323, "epoch": 388} {"train_loss": -5.230302810668945, "global_step": 16324, "epoch": 388} {"train_loss": -5.313082695007324, "global_step": 16325, "epoch": 388} {"train_loss": -5.271951675415039, "global_step": 16326, "epoch": 388} {"train_loss": -5.224157810211182, "global_step": 16327, "epoch": 388} {"train_loss": -5.065988540649414, "global_step": 16328, "epoch": 388} {"train_loss": -5.1697282791137695, "global_step": 16329, "epoch": 388} {"train_loss": -5.261533260345459, "global_step": 16330, "epoch": 388} {"train_loss": -5.106298446655273, "global_step": 16331, "epoch": 388} {"train_loss": -5.31717586517334, "global_step": 16332, "epoch": 388} {"train_loss": -5.157625675201416, "global_step": 16333, "epoch": 388} {"train_loss": -5.2995405197143555, "global_step": 16334, "epoch": 388} {"train_loss": -5.120885848999023, "global_step": 16335, "epoch": 388} {"train_loss": -5.210414886474609, "global_step": 16336, "epoch": 388} {"train_loss": -5.201499768665859, "global_step": 16337, "epoch": 388, "val_loss": 70430.2734375} {"train_loss": -5.326360702514648, "global_step": 16338, "epoch": 389} {"train_loss": -5.329846382141113, "global_step": 16339, "epoch": 389} {"train_loss": -5.374131202697754, "global_step": 16340, "epoch": 389} {"train_loss": -5.394723892211914, "global_step": 16341, "epoch": 389} {"train_loss": -5.198072910308838, "global_step": 16342, "epoch": 389} {"train_loss": -5.221303462982178, "global_step": 16343, "epoch": 389} {"train_loss": -5.259310245513916, "global_step": 16344, "epoch": 389} {"train_loss": -5.250055313110352, "global_step": 16345, "epoch": 389} {"train_loss": -5.302402496337891, "global_step": 16346, "epoch": 389} {"train_loss": -5.237160682678223, "global_step": 16347, "epoch": 389} {"train_loss": -5.205692291259766, "global_step": 16348, "epoch": 389} {"train_loss": -5.342310905456543, "global_step": 16349, "epoch": 389} {"train_loss": -5.298920154571533, "global_step": 16350, "epoch": 389} {"train_loss": -5.155460357666016, "global_step": 16351, "epoch": 389} {"train_loss": -5.304692268371582, "global_step": 16352, "epoch": 389} {"train_loss": -5.309749603271484, "global_step": 16353, "epoch": 389} {"train_loss": -5.290927886962891, "global_step": 16354, "epoch": 389} {"train_loss": -5.301634788513184, "global_step": 16355, "epoch": 389} {"train_loss": -5.195621967315674, "global_step": 16356, "epoch": 389} {"train_loss": -5.278576850891113, "global_step": 16357, "epoch": 389} {"train_loss": -5.2797956466674805, "global_step": 16358, "epoch": 389} {"train_loss": -5.15302038192749, "global_step": 16359, "epoch": 389} {"train_loss": -5.200686454772949, "global_step": 16360, "epoch": 389} {"train_loss": -5.258080959320068, "global_step": 16361, "epoch": 389} {"train_loss": -5.231670379638672, "global_step": 16362, "epoch": 389} {"train_loss": -5.2558722496032715, "global_step": 16363, "epoch": 389} {"train_loss": -5.1840620040893555, "global_step": 16364, "epoch": 389} {"train_loss": -5.1911702156066895, "global_step": 16365, "epoch": 389} {"train_loss": -5.14433479309082, "global_step": 16366, "epoch": 389} {"train_loss": -5.312256813049316, "global_step": 16367, "epoch": 389} {"train_loss": -5.2117228507995605, "global_step": 16368, "epoch": 389} {"train_loss": -5.22767972946167, "global_step": 16369, "epoch": 389} {"train_loss": -5.272684097290039, "global_step": 16370, "epoch": 389} {"train_loss": -5.184057712554932, "global_step": 16371, "epoch": 389} {"train_loss": -5.445483207702637, "global_step": 16372, "epoch": 389} {"train_loss": -5.254200458526611, "global_step": 16373, "epoch": 389} {"train_loss": -5.221343994140625, "global_step": 16374, "epoch": 389} {"train_loss": -5.269179344177246, "global_step": 16375, "epoch": 389} {"train_loss": -5.189936637878418, "global_step": 16376, "epoch": 389} {"train_loss": -5.258808135986328, "global_step": 16377, "epoch": 389} {"train_loss": -5.268740653991699, "global_step": 16378, "epoch": 389} {"train_loss": -5.258539063589914, "global_step": 16379, "epoch": 389, "val_loss": 70319.2578125} {"train_loss": -5.252730369567871, "global_step": 16380, "epoch": 390} {"train_loss": -5.224316596984863, "global_step": 16381, "epoch": 390} {"train_loss": -5.334748268127441, "global_step": 16382, "epoch": 390} {"train_loss": -5.161161422729492, "global_step": 16383, "epoch": 390} {"train_loss": -5.244662761688232, "global_step": 16384, "epoch": 390} {"train_loss": -5.112290382385254, "global_step": 16385, "epoch": 390} {"train_loss": -5.289124488830566, "global_step": 16386, "epoch": 390} {"train_loss": -5.25022029876709, "global_step": 16387, "epoch": 390} {"train_loss": -4.981963157653809, "global_step": 16388, "epoch": 390} {"train_loss": -5.439450263977051, "global_step": 16389, "epoch": 390} {"train_loss": -5.2944793701171875, "global_step": 16390, "epoch": 390} {"train_loss": -5.322795867919922, "global_step": 16391, "epoch": 390} {"train_loss": -5.150355339050293, "global_step": 16392, "epoch": 390} {"train_loss": -5.353964805603027, "global_step": 16393, "epoch": 390} {"train_loss": -5.286219120025635, "global_step": 16394, "epoch": 390} {"train_loss": -5.24626350402832, "global_step": 16395, "epoch": 390} {"train_loss": -5.054233551025391, "global_step": 16396, "epoch": 390} {"train_loss": -5.28753662109375, "global_step": 16397, "epoch": 390} {"train_loss": -5.159490585327148, "global_step": 16398, "epoch": 390} {"train_loss": -5.173144340515137, "global_step": 16399, "epoch": 390} {"train_loss": -5.329974174499512, "global_step": 16400, "epoch": 390} {"train_loss": -5.189615249633789, "global_step": 16401, "epoch": 390} {"train_loss": -5.150289535522461, "global_step": 16402, "epoch": 390} {"train_loss": -5.252821922302246, "global_step": 16403, "epoch": 390} {"train_loss": -5.401239395141602, "global_step": 16404, "epoch": 390} {"train_loss": -5.310317039489746, "global_step": 16405, "epoch": 390} {"train_loss": -5.202004432678223, "global_step": 16406, "epoch": 390} {"train_loss": -5.284206390380859, "global_step": 16407, "epoch": 390} {"train_loss": -5.251604080200195, "global_step": 16408, "epoch": 390} {"train_loss": -5.16738748550415, "global_step": 16409, "epoch": 390} {"train_loss": -5.109551429748535, "global_step": 16410, "epoch": 390} {"train_loss": -5.374163627624512, "global_step": 16411, "epoch": 390} {"train_loss": -5.322001934051514, "global_step": 16412, "epoch": 390} {"train_loss": -5.159642696380615, "global_step": 16413, "epoch": 390} {"train_loss": -5.268341064453125, "global_step": 16414, "epoch": 390} {"train_loss": -5.172264099121094, "global_step": 16415, "epoch": 390} {"train_loss": -5.348206520080566, "global_step": 16416, "epoch": 390} {"train_loss": -5.26848030090332, "global_step": 16417, "epoch": 390} {"train_loss": -5.292180061340332, "global_step": 16418, "epoch": 390} {"train_loss": -5.298871994018555, "global_step": 16419, "epoch": 390} {"train_loss": -5.211352348327637, "global_step": 16420, "epoch": 390} {"train_loss": -5.242411057154338, "global_step": 16421, "epoch": 390, "val_loss": 70390.3203125} {"train_loss": -5.257780075073242, "global_step": 16422, "epoch": 391} {"train_loss": -5.191715717315674, "global_step": 16423, "epoch": 391} {"train_loss": -5.219374656677246, "global_step": 16424, "epoch": 391} {"train_loss": -5.372351169586182, "global_step": 16425, "epoch": 391} {"train_loss": -5.16374397277832, "global_step": 16426, "epoch": 391} {"train_loss": -5.162741661071777, "global_step": 16427, "epoch": 391} {"train_loss": -5.2692131996154785, "global_step": 16428, "epoch": 391} {"train_loss": -5.045197486877441, "global_step": 16429, "epoch": 391} {"train_loss": -5.216114044189453, "global_step": 16430, "epoch": 391} {"train_loss": -5.292822360992432, "global_step": 16431, "epoch": 391} {"train_loss": -5.326395034790039, "global_step": 16432, "epoch": 391} {"train_loss": -5.166781425476074, "global_step": 16433, "epoch": 391} {"train_loss": -5.5074567794799805, "global_step": 16434, "epoch": 391} {"train_loss": -5.222880840301514, "global_step": 16435, "epoch": 391} {"train_loss": -5.253965377807617, "global_step": 16436, "epoch": 391} {"train_loss": -5.316444396972656, "global_step": 16437, "epoch": 391} {"train_loss": -5.405966758728027, "global_step": 16438, "epoch": 391} {"train_loss": -5.161201000213623, "global_step": 16439, "epoch": 391} {"train_loss": -5.420154094696045, "global_step": 16440, "epoch": 391} {"train_loss": -5.266372203826904, "global_step": 16441, "epoch": 391} {"train_loss": -5.102169990539551, "global_step": 16442, "epoch": 391} {"train_loss": -5.21961784362793, "global_step": 16443, "epoch": 391} {"train_loss": -5.305455684661865, "global_step": 16444, "epoch": 391} {"train_loss": -5.2478861808776855, "global_step": 16445, "epoch": 391} {"train_loss": -5.115275859832764, "global_step": 16446, "epoch": 391} {"train_loss": -5.257000923156738, "global_step": 16447, "epoch": 391} {"train_loss": -5.224112510681152, "global_step": 16448, "epoch": 391} {"train_loss": -5.123215675354004, "global_step": 16449, "epoch": 391} {"train_loss": -5.216996192932129, "global_step": 16450, "epoch": 391} {"train_loss": -5.209891319274902, "global_step": 16451, "epoch": 391} {"train_loss": -5.054511070251465, "global_step": 16452, "epoch": 391} {"train_loss": -5.183578014373779, "global_step": 16453, "epoch": 391} {"train_loss": -5.279869556427002, "global_step": 16454, "epoch": 391} {"train_loss": -5.22639274597168, "global_step": 16455, "epoch": 391} {"train_loss": -5.2349748611450195, "global_step": 16456, "epoch": 391} {"train_loss": -5.1397294998168945, "global_step": 16457, "epoch": 391} {"train_loss": -5.128916263580322, "global_step": 16458, "epoch": 391} {"train_loss": -5.201170921325684, "global_step": 16459, "epoch": 391} {"train_loss": -5.36612606048584, "global_step": 16460, "epoch": 391} {"train_loss": -5.435608863830566, "global_step": 16461, "epoch": 391} {"train_loss": -5.089200973510742, "global_step": 16462, "epoch": 391} {"train_loss": -5.23404335975647, "global_step": 16463, "epoch": 391, "val_loss": 71525.9765625} {"train_loss": -5.177487373352051, "global_step": 16464, "epoch": 392} {"train_loss": -5.237822532653809, "global_step": 16465, "epoch": 392} {"train_loss": -5.275671005249023, "global_step": 16466, "epoch": 392} {"train_loss": -5.086277961730957, "global_step": 16467, "epoch": 392} {"train_loss": -5.266057968139648, "global_step": 16468, "epoch": 392} {"train_loss": -5.130553245544434, "global_step": 16469, "epoch": 392} {"train_loss": -5.094047546386719, "global_step": 16470, "epoch": 392} {"train_loss": -5.270423889160156, "global_step": 16471, "epoch": 392} {"train_loss": -5.2543463706970215, "global_step": 16472, "epoch": 392} {"train_loss": -5.180543422698975, "global_step": 16473, "epoch": 392} {"train_loss": -5.197258472442627, "global_step": 16474, "epoch": 392} {"train_loss": -5.266956329345703, "global_step": 16475, "epoch": 392} {"train_loss": -5.3187408447265625, "global_step": 16476, "epoch": 392} {"train_loss": -5.2440009117126465, "global_step": 16477, "epoch": 392} {"train_loss": -5.235348701477051, "global_step": 16478, "epoch": 392} {"train_loss": -5.105358123779297, "global_step": 16479, "epoch": 392} {"train_loss": -5.254258632659912, "global_step": 16480, "epoch": 392} {"train_loss": -5.318573951721191, "global_step": 16481, "epoch": 392} {"train_loss": -5.210247039794922, "global_step": 16482, "epoch": 392} {"train_loss": -5.256813049316406, "global_step": 16483, "epoch": 392} {"train_loss": -5.192550182342529, "global_step": 16484, "epoch": 392} {"train_loss": -5.202140808105469, "global_step": 16485, "epoch": 392} {"train_loss": -5.2686662673950195, "global_step": 16486, "epoch": 392} {"train_loss": -5.318343162536621, "global_step": 16487, "epoch": 392} {"train_loss": -5.287693023681641, "global_step": 16488, "epoch": 392} {"train_loss": -5.400874137878418, "global_step": 16489, "epoch": 392} {"train_loss": -5.2442851066589355, "global_step": 16490, "epoch": 392} {"train_loss": -5.201351165771484, "global_step": 16491, "epoch": 392} {"train_loss": -5.39012336730957, "global_step": 16492, "epoch": 392} {"train_loss": -5.353707313537598, "global_step": 16493, "epoch": 392} {"train_loss": -5.235655784606934, "global_step": 16494, "epoch": 392} {"train_loss": -5.2746429443359375, "global_step": 16495, "epoch": 392} {"train_loss": -5.378420829772949, "global_step": 16496, "epoch": 392} {"train_loss": -5.218597888946533, "global_step": 16497, "epoch": 392} {"train_loss": -5.254741668701172, "global_step": 16498, "epoch": 392} {"train_loss": -5.242166996002197, "global_step": 16499, "epoch": 392} {"train_loss": -5.288065433502197, "global_step": 16500, "epoch": 392} {"train_loss": -5.193912029266357, "global_step": 16501, "epoch": 392} {"train_loss": -5.201840877532959, "global_step": 16502, "epoch": 392} {"train_loss": -5.250031471252441, "global_step": 16503, "epoch": 392} {"train_loss": -5.165169715881348, "global_step": 16504, "epoch": 392} {"train_loss": -5.241858436947777, "global_step": 16505, "epoch": 392, "val_loss": 70483.7109375} {"train_loss": -5.392887592315674, "global_step": 16506, "epoch": 393} {"train_loss": -5.3219170570373535, "global_step": 16507, "epoch": 393} {"train_loss": -5.23237419128418, "global_step": 16508, "epoch": 393} {"train_loss": -5.122608661651611, "global_step": 16509, "epoch": 393} {"train_loss": -5.2912492752075195, "global_step": 16510, "epoch": 393} {"train_loss": -5.247413158416748, "global_step": 16511, "epoch": 393} {"train_loss": -5.35093355178833, "global_step": 16512, "epoch": 393} {"train_loss": -5.224498748779297, "global_step": 16513, "epoch": 393} {"train_loss": -5.25954008102417, "global_step": 16514, "epoch": 393} {"train_loss": -5.223698616027832, "global_step": 16515, "epoch": 393} {"train_loss": -5.132672309875488, "global_step": 16516, "epoch": 393} {"train_loss": -5.297894477844238, "global_step": 16517, "epoch": 393} {"train_loss": -5.189674377441406, "global_step": 16518, "epoch": 393} {"train_loss": -5.349137306213379, "global_step": 16519, "epoch": 393} {"train_loss": -5.207613468170166, "global_step": 16520, "epoch": 393} {"train_loss": -5.285234451293945, "global_step": 16521, "epoch": 393} {"train_loss": -5.311962127685547, "global_step": 16522, "epoch": 393} {"train_loss": -5.195270538330078, "global_step": 16523, "epoch": 393} {"train_loss": -5.205452919006348, "global_step": 16524, "epoch": 393} {"train_loss": -5.098021507263184, "global_step": 16525, "epoch": 393} {"train_loss": -5.141055583953857, "global_step": 16526, "epoch": 393} {"train_loss": -5.312664031982422, "global_step": 16527, "epoch": 393} {"train_loss": -5.296675682067871, "global_step": 16528, "epoch": 393} {"train_loss": -5.1986083984375, "global_step": 16529, "epoch": 393} {"train_loss": -5.287325859069824, "global_step": 16530, "epoch": 393} {"train_loss": -5.239514350891113, "global_step": 16531, "epoch": 393} {"train_loss": -5.2092180252075195, "global_step": 16532, "epoch": 393} {"train_loss": -5.1967315673828125, "global_step": 16533, "epoch": 393} {"train_loss": -5.261660099029541, "global_step": 16534, "epoch": 393} {"train_loss": -5.081660270690918, "global_step": 16535, "epoch": 393} {"train_loss": -5.249912738800049, "global_step": 16536, "epoch": 393} {"train_loss": -5.179001808166504, "global_step": 16537, "epoch": 393} {"train_loss": -5.247226238250732, "global_step": 16538, "epoch": 393} {"train_loss": -5.266449928283691, "global_step": 16539, "epoch": 393} {"train_loss": -5.305584907531738, "global_step": 16540, "epoch": 393} {"train_loss": -5.1181535720825195, "global_step": 16541, "epoch": 393} {"train_loss": -5.394778251647949, "global_step": 16542, "epoch": 393} {"train_loss": -5.359320640563965, "global_step": 16543, "epoch": 393} {"train_loss": -5.2943572998046875, "global_step": 16544, "epoch": 393} {"train_loss": -5.32672119140625, "global_step": 16545, "epoch": 393} {"train_loss": -5.226540565490723, "global_step": 16546, "epoch": 393} {"train_loss": -5.250468606040592, "global_step": 16547, "epoch": 393, "val_loss": 70737.5078125} {"train_loss": -5.294371604919434, "global_step": 16548, "epoch": 394} {"train_loss": -5.220088005065918, "global_step": 16549, "epoch": 394} {"train_loss": -5.140406131744385, "global_step": 16550, "epoch": 394} {"train_loss": -5.275568008422852, "global_step": 16551, "epoch": 394} {"train_loss": -5.139375686645508, "global_step": 16552, "epoch": 394} {"train_loss": -5.16863489151001, "global_step": 16553, "epoch": 394} {"train_loss": -5.326817512512207, "global_step": 16554, "epoch": 394} {"train_loss": -5.324154853820801, "global_step": 16555, "epoch": 394} {"train_loss": -5.211982727050781, "global_step": 16556, "epoch": 394} {"train_loss": -5.26643180847168, "global_step": 16557, "epoch": 394} {"train_loss": -5.15471887588501, "global_step": 16558, "epoch": 394} {"train_loss": -5.406659126281738, "global_step": 16559, "epoch": 394} {"train_loss": -5.283577919006348, "global_step": 16560, "epoch": 394} {"train_loss": -5.178580284118652, "global_step": 16561, "epoch": 394} {"train_loss": -5.316926002502441, "global_step": 16562, "epoch": 394} {"train_loss": -5.297240257263184, "global_step": 16563, "epoch": 394} {"train_loss": -5.239946365356445, "global_step": 16564, "epoch": 394} {"train_loss": -5.376749038696289, "global_step": 16565, "epoch": 394} {"train_loss": -5.385933876037598, "global_step": 16566, "epoch": 394} {"train_loss": -5.160198211669922, "global_step": 16567, "epoch": 394} {"train_loss": -5.331043243408203, "global_step": 16568, "epoch": 394} {"train_loss": -5.243758201599121, "global_step": 16569, "epoch": 394} {"train_loss": -5.27634334564209, "global_step": 16570, "epoch": 394} {"train_loss": -5.148067951202393, "global_step": 16571, "epoch": 394} {"train_loss": -5.29953670501709, "global_step": 16572, "epoch": 394} {"train_loss": -5.340004920959473, "global_step": 16573, "epoch": 394} {"train_loss": -5.317949295043945, "global_step": 16574, "epoch": 394} {"train_loss": -5.227038383483887, "global_step": 16575, "epoch": 394} {"train_loss": -5.155093669891357, "global_step": 16576, "epoch": 394} {"train_loss": -5.275687217712402, "global_step": 16577, "epoch": 394} {"train_loss": -5.224238395690918, "global_step": 16578, "epoch": 394} {"train_loss": -5.130081653594971, "global_step": 16579, "epoch": 394} {"train_loss": -5.300588607788086, "global_step": 16580, "epoch": 394} {"train_loss": -5.3489580154418945, "global_step": 16581, "epoch": 394} {"train_loss": -5.179079055786133, "global_step": 16582, "epoch": 394} {"train_loss": -5.2804975509643555, "global_step": 16583, "epoch": 394} {"train_loss": -5.246888160705566, "global_step": 16584, "epoch": 394} {"train_loss": -5.299807548522949, "global_step": 16585, "epoch": 394} {"train_loss": -5.201826095581055, "global_step": 16586, "epoch": 394} {"train_loss": -5.273857116699219, "global_step": 16587, "epoch": 394} {"train_loss": -5.1628947257995605, "global_step": 16588, "epoch": 394} {"train_loss": -5.2538443974086215, "global_step": 16589, "epoch": 394, "val_loss": 70192.234375} {"train_loss": -5.243030548095703, "global_step": 16590, "epoch": 395} {"train_loss": -5.205341339111328, "global_step": 16591, "epoch": 395} {"train_loss": -5.29405403137207, "global_step": 16592, "epoch": 395} {"train_loss": -5.306134223937988, "global_step": 16593, "epoch": 395} {"train_loss": -5.277762413024902, "global_step": 16594, "epoch": 395} {"train_loss": -5.3902587890625, "global_step": 16595, "epoch": 395} {"train_loss": -5.10466194152832, "global_step": 16596, "epoch": 395} {"train_loss": -5.259368896484375, "global_step": 16597, "epoch": 395} {"train_loss": -5.263378143310547, "global_step": 16598, "epoch": 395} {"train_loss": -5.138394355773926, "global_step": 16599, "epoch": 395} {"train_loss": -5.193681240081787, "global_step": 16600, "epoch": 395} {"train_loss": -5.32977294921875, "global_step": 16601, "epoch": 395} {"train_loss": -5.323552131652832, "global_step": 16602, "epoch": 395} {"train_loss": -5.402368068695068, "global_step": 16603, "epoch": 395} {"train_loss": -5.281017303466797, "global_step": 16604, "epoch": 395} {"train_loss": -5.322306156158447, "global_step": 16605, "epoch": 395} {"train_loss": -5.194088935852051, "global_step": 16606, "epoch": 395} {"train_loss": -5.167951583862305, "global_step": 16607, "epoch": 395} {"train_loss": -5.238358497619629, "global_step": 16608, "epoch": 395} {"train_loss": -5.157073497772217, "global_step": 16609, "epoch": 395} {"train_loss": -5.249784469604492, "global_step": 16610, "epoch": 395} {"train_loss": -5.293032169342041, "global_step": 16611, "epoch": 395} {"train_loss": -5.26236629486084, "global_step": 16612, "epoch": 395} {"train_loss": -5.2393693923950195, "global_step": 16613, "epoch": 395} {"train_loss": -5.310259819030762, "global_step": 16614, "epoch": 395} {"train_loss": -5.32717752456665, "global_step": 16615, "epoch": 395} {"train_loss": -5.218592643737793, "global_step": 16616, "epoch": 395} {"train_loss": -5.290740489959717, "global_step": 16617, "epoch": 395} {"train_loss": -5.272778511047363, "global_step": 16618, "epoch": 395} {"train_loss": -5.223163604736328, "global_step": 16619, "epoch": 395} {"train_loss": -5.170513153076172, "global_step": 16620, "epoch": 395} {"train_loss": -5.140567779541016, "global_step": 16621, "epoch": 395} {"train_loss": -5.256406784057617, "global_step": 16622, "epoch": 395} {"train_loss": -5.1917314529418945, "global_step": 16623, "epoch": 395} {"train_loss": -4.804018020629883, "global_step": 16624, "epoch": 395} {"train_loss": -5.019244194030762, "global_step": 16625, "epoch": 395} {"train_loss": -4.944849967956543, "global_step": 16626, "epoch": 395} {"train_loss": -5.295257568359375, "global_step": 16627, "epoch": 395} {"train_loss": -5.022342205047607, "global_step": 16628, "epoch": 395} {"train_loss": -4.963301658630371, "global_step": 16629, "epoch": 395} {"train_loss": -4.9916791915893555, "global_step": 16630, "epoch": 395} {"train_loss": -5.203626030967349, "global_step": 16631, "epoch": 395, "val_loss": 70633.2578125} {"train_loss": -5.126556396484375, "global_step": 16632, "epoch": 396} {"train_loss": -5.104413032531738, "global_step": 16633, "epoch": 396} {"train_loss": -5.097714424133301, "global_step": 16634, "epoch": 396} {"train_loss": -5.155404090881348, "global_step": 16635, "epoch": 396} {"train_loss": -5.0854291915893555, "global_step": 16636, "epoch": 396} {"train_loss": -5.199837684631348, "global_step": 16637, "epoch": 396} {"train_loss": -5.206390380859375, "global_step": 16638, "epoch": 396} {"train_loss": -5.0970048904418945, "global_step": 16639, "epoch": 396} {"train_loss": -5.193894386291504, "global_step": 16640, "epoch": 396} {"train_loss": -5.243934631347656, "global_step": 16641, "epoch": 396} {"train_loss": -5.191976547241211, "global_step": 16642, "epoch": 396} {"train_loss": -5.146092891693115, "global_step": 16643, "epoch": 396} {"train_loss": -5.194703102111816, "global_step": 16644, "epoch": 396} {"train_loss": -5.287958145141602, "global_step": 16645, "epoch": 396} {"train_loss": -5.357910633087158, "global_step": 16646, "epoch": 396} {"train_loss": -5.254924774169922, "global_step": 16647, "epoch": 396} {"train_loss": -5.205461502075195, "global_step": 16648, "epoch": 396} {"train_loss": -5.346584320068359, "global_step": 16649, "epoch": 396} {"train_loss": -5.169992446899414, "global_step": 16650, "epoch": 396} {"train_loss": -5.333741188049316, "global_step": 16651, "epoch": 396} {"train_loss": -5.124607086181641, "global_step": 16652, "epoch": 396} {"train_loss": -5.313055038452148, "global_step": 16653, "epoch": 396} {"train_loss": -5.222458362579346, "global_step": 16654, "epoch": 396} {"train_loss": -5.305136680603027, "global_step": 16655, "epoch": 396} {"train_loss": -5.328570365905762, "global_step": 16656, "epoch": 396} {"train_loss": -5.11666202545166, "global_step": 16657, "epoch": 396} {"train_loss": -5.328211307525635, "global_step": 16658, "epoch": 396} {"train_loss": -5.184510231018066, "global_step": 16659, "epoch": 396} {"train_loss": -5.303976535797119, "global_step": 16660, "epoch": 396} {"train_loss": -5.385207176208496, "global_step": 16661, "epoch": 396} {"train_loss": -5.234914779663086, "global_step": 16662, "epoch": 396} {"train_loss": -5.206321716308594, "global_step": 16663, "epoch": 396} {"train_loss": -5.306741714477539, "global_step": 16664, "epoch": 396} {"train_loss": -5.3680524826049805, "global_step": 16665, "epoch": 396} {"train_loss": -5.145344257354736, "global_step": 16666, "epoch": 396} {"train_loss": -5.250226020812988, "global_step": 16667, "epoch": 396} {"train_loss": -5.085492134094238, "global_step": 16668, "epoch": 396} {"train_loss": -5.273139476776123, "global_step": 16669, "epoch": 396} {"train_loss": -5.2473273277282715, "global_step": 16670, "epoch": 396} {"train_loss": -5.178284645080566, "global_step": 16671, "epoch": 396} {"train_loss": -5.249993324279785, "global_step": 16672, "epoch": 396} {"train_loss": -5.2252318972633, "global_step": 16673, "epoch": 396, "val_loss": 70024.3125} {"train_loss": -5.307150363922119, "global_step": 16674, "epoch": 397} {"train_loss": -5.387504577636719, "global_step": 16675, "epoch": 397} {"train_loss": -5.336685657501221, "global_step": 16676, "epoch": 397} {"train_loss": -5.330060958862305, "global_step": 16677, "epoch": 397} {"train_loss": -5.185271739959717, "global_step": 16678, "epoch": 397} {"train_loss": -5.288393974304199, "global_step": 16679, "epoch": 397} {"train_loss": -5.279697418212891, "global_step": 16680, "epoch": 397} {"train_loss": -5.3586931228637695, "global_step": 16681, "epoch": 397} {"train_loss": -5.136420249938965, "global_step": 16682, "epoch": 397} {"train_loss": -5.285113334655762, "global_step": 16683, "epoch": 397} {"train_loss": -5.265172958374023, "global_step": 16684, "epoch": 397} {"train_loss": -5.15451717376709, "global_step": 16685, "epoch": 397} {"train_loss": -5.019847869873047, "global_step": 16686, "epoch": 397} {"train_loss": -5.172857284545898, "global_step": 16687, "epoch": 397} {"train_loss": -5.292006969451904, "global_step": 16688, "epoch": 397} {"train_loss": -5.138433456420898, "global_step": 16689, "epoch": 397} {"train_loss": -5.256204605102539, "global_step": 16690, "epoch": 397} {"train_loss": -5.222164154052734, "global_step": 16691, "epoch": 397} {"train_loss": -5.18379545211792, "global_step": 16692, "epoch": 397} {"train_loss": -5.215113639831543, "global_step": 16693, "epoch": 397} {"train_loss": -5.200138568878174, "global_step": 16694, "epoch": 397} {"train_loss": -5.20576810836792, "global_step": 16695, "epoch": 397} {"train_loss": -5.193594932556152, "global_step": 16696, "epoch": 397} {"train_loss": -5.25254487991333, "global_step": 16697, "epoch": 397} {"train_loss": -5.144960403442383, "global_step": 16698, "epoch": 397} {"train_loss": -5.103307247161865, "global_step": 16699, "epoch": 397} {"train_loss": -5.298066139221191, "global_step": 16700, "epoch": 397} {"train_loss": -5.187381744384766, "global_step": 16701, "epoch": 397} {"train_loss": -5.286200523376465, "global_step": 16702, "epoch": 397} {"train_loss": -5.25540018081665, "global_step": 16703, "epoch": 397} {"train_loss": -5.253726005554199, "global_step": 16704, "epoch": 397} {"train_loss": -5.312532901763916, "global_step": 16705, "epoch": 397} {"train_loss": -5.466198921203613, "global_step": 16706, "epoch": 397} {"train_loss": -5.133364200592041, "global_step": 16707, "epoch": 397} {"train_loss": -5.209599018096924, "global_step": 16708, "epoch": 397} {"train_loss": -5.21306848526001, "global_step": 16709, "epoch": 397} {"train_loss": -5.218029975891113, "global_step": 16710, "epoch": 397} {"train_loss": -5.299605846405029, "global_step": 16711, "epoch": 397} {"train_loss": -5.127528190612793, "global_step": 16712, "epoch": 397} {"train_loss": -5.305349349975586, "global_step": 16713, "epoch": 397} {"train_loss": -5.198937892913818, "global_step": 16714, "epoch": 397} {"train_loss": -5.235594738097418, "global_step": 16715, "epoch": 397, "val_loss": 70217.984375} {"train_loss": -5.297842502593994, "global_step": 16716, "epoch": 398} {"train_loss": -5.21997594833374, "global_step": 16717, "epoch": 398} {"train_loss": -5.216538906097412, "global_step": 16718, "epoch": 398} {"train_loss": -5.294215202331543, "global_step": 16719, "epoch": 398} {"train_loss": -5.202358722686768, "global_step": 16720, "epoch": 398} {"train_loss": -5.265536785125732, "global_step": 16721, "epoch": 398} {"train_loss": -5.228017330169678, "global_step": 16722, "epoch": 398} {"train_loss": -5.410020351409912, "global_step": 16723, "epoch": 398} {"train_loss": -5.148312568664551, "global_step": 16724, "epoch": 398} {"train_loss": -5.232618808746338, "global_step": 16725, "epoch": 398} {"train_loss": -5.327823638916016, "global_step": 16726, "epoch": 398} {"train_loss": -5.378472328186035, "global_step": 16727, "epoch": 398} {"train_loss": -5.139115810394287, "global_step": 16728, "epoch": 398} {"train_loss": -5.258321285247803, "global_step": 16729, "epoch": 398} {"train_loss": -5.213214874267578, "global_step": 16730, "epoch": 398} {"train_loss": -5.300565719604492, "global_step": 16731, "epoch": 398} {"train_loss": -5.234185218811035, "global_step": 16732, "epoch": 398} {"train_loss": -5.253052234649658, "global_step": 16733, "epoch": 398} {"train_loss": -5.317756652832031, "global_step": 16734, "epoch": 398} {"train_loss": -5.251496315002441, "global_step": 16735, "epoch": 398} {"train_loss": -5.324000835418701, "global_step": 16736, "epoch": 398} {"train_loss": -5.260480880737305, "global_step": 16737, "epoch": 398} {"train_loss": -5.255649566650391, "global_step": 16738, "epoch": 398} {"train_loss": -5.273719787597656, "global_step": 16739, "epoch": 398} {"train_loss": -5.252264976501465, "global_step": 16740, "epoch": 398} {"train_loss": -5.225577354431152, "global_step": 16741, "epoch": 398} {"train_loss": -5.158945083618164, "global_step": 16742, "epoch": 398} {"train_loss": -5.2143049240112305, "global_step": 16743, "epoch": 398} {"train_loss": -5.2399749755859375, "global_step": 16744, "epoch": 398} {"train_loss": -5.0915846824646, "global_step": 16745, "epoch": 398} {"train_loss": -5.223660469055176, "global_step": 16746, "epoch": 398} {"train_loss": -5.136506080627441, "global_step": 16747, "epoch": 398} {"train_loss": -5.276633262634277, "global_step": 16748, "epoch": 398} {"train_loss": -5.396584510803223, "global_step": 16749, "epoch": 398} {"train_loss": -5.296626091003418, "global_step": 16750, "epoch": 398} {"train_loss": -5.292754173278809, "global_step": 16751, "epoch": 398} {"train_loss": -5.145626544952393, "global_step": 16752, "epoch": 398} {"train_loss": -5.343950271606445, "global_step": 16753, "epoch": 398} {"train_loss": -5.2561259269714355, "global_step": 16754, "epoch": 398} {"train_loss": -5.25529670715332, "global_step": 16755, "epoch": 398} {"train_loss": -5.309528350830078, "global_step": 16756, "epoch": 398} {"train_loss": -5.251756929215931, "global_step": 16757, "epoch": 398, "val_loss": 70643.421875} {"train_loss": -5.321046829223633, "global_step": 16758, "epoch": 399} {"train_loss": -5.319646835327148, "global_step": 16759, "epoch": 399} {"train_loss": -5.285355567932129, "global_step": 16760, "epoch": 399} {"train_loss": -5.233495712280273, "global_step": 16761, "epoch": 399} {"train_loss": -5.205766677856445, "global_step": 16762, "epoch": 399} {"train_loss": -5.1442670822143555, "global_step": 16763, "epoch": 399} {"train_loss": -5.32249641418457, "global_step": 16764, "epoch": 399} {"train_loss": -5.28425407409668, "global_step": 16765, "epoch": 399} {"train_loss": -5.123612403869629, "global_step": 16766, "epoch": 399} {"train_loss": -5.234726905822754, "global_step": 16767, "epoch": 399} {"train_loss": -5.392864227294922, "global_step": 16768, "epoch": 399} {"train_loss": -5.41016149520874, "global_step": 16769, "epoch": 399} {"train_loss": -5.294257164001465, "global_step": 16770, "epoch": 399} {"train_loss": -5.190518379211426, "global_step": 16771, "epoch": 399} {"train_loss": -5.192748546600342, "global_step": 16772, "epoch": 399} {"train_loss": -5.235873222351074, "global_step": 16773, "epoch": 399} {"train_loss": -5.230110168457031, "global_step": 16774, "epoch": 399} {"train_loss": -5.1177825927734375, "global_step": 16775, "epoch": 399} {"train_loss": -5.280765056610107, "global_step": 16776, "epoch": 399} {"train_loss": -5.178315162658691, "global_step": 16777, "epoch": 399} {"train_loss": -4.886031627655029, "global_step": 16778, "epoch": 399} {"train_loss": -5.294461250305176, "global_step": 16779, "epoch": 399} {"train_loss": -5.3035173416137695, "global_step": 16780, "epoch": 399} {"train_loss": -5.004518508911133, "global_step": 16781, "epoch": 399} {"train_loss": -5.180137634277344, "global_step": 16782, "epoch": 399} {"train_loss": -5.072882175445557, "global_step": 16783, "epoch": 399} {"train_loss": -5.056389808654785, "global_step": 16784, "epoch": 399} {"train_loss": -5.267516613006592, "global_step": 16785, "epoch": 399} {"train_loss": -5.020456314086914, "global_step": 16786, "epoch": 399} {"train_loss": -5.208705902099609, "global_step": 16787, "epoch": 399} {"train_loss": -5.08853816986084, "global_step": 16788, "epoch": 399} {"train_loss": -5.163741588592529, "global_step": 16789, "epoch": 399} {"train_loss": -5.005743026733398, "global_step": 16790, "epoch": 399} {"train_loss": -5.287849426269531, "global_step": 16791, "epoch": 399} {"train_loss": -5.096325874328613, "global_step": 16792, "epoch": 399} {"train_loss": -5.067002296447754, "global_step": 16793, "epoch": 399} {"train_loss": -5.180070877075195, "global_step": 16794, "epoch": 399} {"train_loss": -4.929606914520264, "global_step": 16795, "epoch": 399} {"train_loss": -5.106194019317627, "global_step": 16796, "epoch": 399} {"train_loss": -5.2008957862854, "global_step": 16797, "epoch": 399} {"train_loss": -4.969886302947998, "global_step": 16798, "epoch": 399} {"train_loss": -5.182146288099743, "global_step": 16799, "epoch": 399, "val_loss": 70374.03125} {"train_loss": -5.205417156219482, "global_step": 16800, "epoch": 400} {"train_loss": -5.152620315551758, "global_step": 16801, "epoch": 400} {"train_loss": -5.104659080505371, "global_step": 16802, "epoch": 400} {"train_loss": -5.128952980041504, "global_step": 16803, "epoch": 400} {"train_loss": -5.3315229415893555, "global_step": 16804, "epoch": 400} {"train_loss": -5.143476963043213, "global_step": 16805, "epoch": 400} {"train_loss": -5.311534881591797, "global_step": 16806, "epoch": 400} {"train_loss": -5.21125602722168, "global_step": 16807, "epoch": 400} {"train_loss": -5.33698034286499, "global_step": 16808, "epoch": 400} {"train_loss": -5.274722576141357, "global_step": 16809, "epoch": 400} {"train_loss": -5.222091197967529, "global_step": 16810, "epoch": 400} {"train_loss": -5.357921600341797, "global_step": 16811, "epoch": 400} {"train_loss": -5.187865257263184, "global_step": 16812, "epoch": 400} {"train_loss": -5.2014875411987305, "global_step": 16813, "epoch": 400} {"train_loss": -5.190688133239746, "global_step": 16814, "epoch": 400} {"train_loss": -5.246078968048096, "global_step": 16815, "epoch": 400} {"train_loss": -5.300701141357422, "global_step": 16816, "epoch": 400} {"train_loss": -5.267065048217773, "global_step": 16817, "epoch": 400} {"train_loss": -5.238380432128906, "global_step": 16818, "epoch": 400} {"train_loss": -5.253538131713867, "global_step": 16819, "epoch": 400} {"train_loss": -5.104287147521973, "global_step": 16820, "epoch": 400} {"train_loss": -5.28352165222168, "global_step": 16821, "epoch": 400} {"train_loss": -5.286365032196045, "global_step": 16822, "epoch": 400} {"train_loss": -5.304045677185059, "global_step": 16823, "epoch": 400} {"train_loss": -5.1420793533325195, "global_step": 16824, "epoch": 400} {"train_loss": -5.14824104309082, "global_step": 16825, "epoch": 400} {"train_loss": -5.247987270355225, "global_step": 16826, "epoch": 400} {"train_loss": -5.065797805786133, "global_step": 16827, "epoch": 400} {"train_loss": -5.1829047203063965, "global_step": 16828, "epoch": 400} {"train_loss": -5.33782434463501, "global_step": 16829, "epoch": 400} {"train_loss": -5.050045967102051, "global_step": 16830, "epoch": 400} {"train_loss": -4.9987664222717285, "global_step": 16831, "epoch": 400} {"train_loss": -5.2040815353393555, "global_step": 16832, "epoch": 400} {"train_loss": -5.185942649841309, "global_step": 16833, "epoch": 400} {"train_loss": -5.189374923706055, "global_step": 16834, "epoch": 400} {"train_loss": -5.25761604309082, "global_step": 16835, "epoch": 400} {"train_loss": -5.242550849914551, "global_step": 16836, "epoch": 400} {"train_loss": -5.054288864135742, "global_step": 16837, "epoch": 400} {"train_loss": -5.198975563049316, "global_step": 16838, "epoch": 400} {"train_loss": -5.279543399810791, "global_step": 16839, "epoch": 400} {"train_loss": -5.1864471435546875, "global_step": 16840, "epoch": 400} {"train_loss": -5.209627628326416, "global_step": 16841, "epoch": 400, "train/sim_max_reward_0": 0.49653039911170277, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.2606447261199013, "train/sim_max_reward_3": 0.027000251875486304, "train/sim_max_reward_4": 0.3142909543409577, "train/sim_max_reward_5": 0.5419996421213568, "test/sim_max_reward_4400000": 0.42854217085786683, "test/sim_max_reward_4400001": 0.17402012026901084, "test/sim_max_reward_4400002": 0.5181028534969874, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.10402440303119044, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.21978627225958666, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.07374705819516401, "test/sim_max_reward_4400012": 0.8906618306571936, "test/sim_max_reward_4400013": 0.9081301112848581, "test/sim_max_reward_4400014": 0.3705917419862047, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.49295310851824325, "test/sim_max_reward_4400018": 0.27845041582698304, "test/sim_max_reward_4400019": 0.23630520590329643, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5714821052728916, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.04265587881680046, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.26080674905310364, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.20931202985835984, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.44764535738533123, "test/sim_max_reward_4400031": 0.13702547867945444, "test/sim_max_reward_4400032": 0.774303250781065, "test/sim_max_reward_4400033": 0.13050522050468955, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.48961137057594556, "test/sim_max_reward_4400036": 0.38262738332091417, "test/sim_max_reward_4400037": 0.5760185809566302, "test/sim_max_reward_4400038": 0.8352556124218489, "test/sim_max_reward_4400039": 0.5054623223837762, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.2725198867547432, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.0, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.9046626040577859, "test/sim_max_reward_4400047": 0.24245932516733856, "test/sim_max_reward_4400048": 0.2832134361399909, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.273523575798534, "test/mean_score": 0.25202991460180413, "val_loss": 70719.0625} {"train_loss": -5.232912063598633, "global_step": 16842, "epoch": 401} {"train_loss": -5.189319610595703, "global_step": 16843, "epoch": 401} {"train_loss": -5.08121395111084, "global_step": 16844, "epoch": 401} {"train_loss": -5.144485950469971, "global_step": 16845, "epoch": 401} {"train_loss": -5.276772499084473, "global_step": 16846, "epoch": 401} {"train_loss": -5.2743940353393555, "global_step": 16847, "epoch": 401} {"train_loss": -5.378124713897705, "global_step": 16848, "epoch": 401} {"train_loss": -5.180041313171387, "global_step": 16849, "epoch": 401} {"train_loss": -5.165725231170654, "global_step": 16850, "epoch": 401} {"train_loss": -5.37129020690918, "global_step": 16851, "epoch": 401} {"train_loss": -5.298172473907471, "global_step": 16852, "epoch": 401} {"train_loss": -5.271407127380371, "global_step": 16853, "epoch": 401} {"train_loss": -5.205409049987793, "global_step": 16854, "epoch": 401} {"train_loss": -5.313897132873535, "global_step": 16855, "epoch": 401} {"train_loss": -5.163797378540039, "global_step": 16856, "epoch": 401} {"train_loss": -5.369873523712158, "global_step": 16857, "epoch": 401} {"train_loss": -5.322173595428467, "global_step": 16858, "epoch": 401} {"train_loss": -5.186975479125977, "global_step": 16859, "epoch": 401} {"train_loss": -5.342293739318848, "global_step": 16860, "epoch": 401} {"train_loss": -5.3149638175964355, "global_step": 16861, "epoch": 401} {"train_loss": -5.188534736633301, "global_step": 16862, "epoch": 401} {"train_loss": -5.339953422546387, "global_step": 16863, "epoch": 401} {"train_loss": -5.282087802886963, "global_step": 16864, "epoch": 401} {"train_loss": -5.170322418212891, "global_step": 16865, "epoch": 401} {"train_loss": -5.360444068908691, "global_step": 16866, "epoch": 401} {"train_loss": -5.3706817626953125, "global_step": 16867, "epoch": 401} {"train_loss": -5.253719329833984, "global_step": 16868, "epoch": 401} {"train_loss": -5.1636061668396, "global_step": 16869, "epoch": 401} {"train_loss": -5.346467971801758, "global_step": 16870, "epoch": 401} {"train_loss": -5.402739524841309, "global_step": 16871, "epoch": 401} {"train_loss": -5.159531593322754, "global_step": 16872, "epoch": 401} {"train_loss": -5.268476486206055, "global_step": 16873, "epoch": 401} {"train_loss": -5.255054473876953, "global_step": 16874, "epoch": 401} {"train_loss": -5.090967178344727, "global_step": 16875, "epoch": 401} {"train_loss": -5.3600172996521, "global_step": 16876, "epoch": 401} {"train_loss": -5.241232872009277, "global_step": 16877, "epoch": 401} {"train_loss": -5.230652809143066, "global_step": 16878, "epoch": 401} {"train_loss": -5.134894371032715, "global_step": 16879, "epoch": 401} {"train_loss": -5.20245885848999, "global_step": 16880, "epoch": 401} {"train_loss": -5.0379438400268555, "global_step": 16881, "epoch": 401} {"train_loss": -5.24245548248291, "global_step": 16882, "epoch": 401} {"train_loss": -5.244981595448086, "global_step": 16883, "epoch": 401, "val_loss": 70128.0390625} {"train_loss": -5.159290790557861, "global_step": 16884, "epoch": 402} {"train_loss": -5.319465637207031, "global_step": 16885, "epoch": 402} {"train_loss": -5.2090959548950195, "global_step": 16886, "epoch": 402} {"train_loss": -5.229887008666992, "global_step": 16887, "epoch": 402} {"train_loss": -5.108627796173096, "global_step": 16888, "epoch": 402} {"train_loss": -5.2274250984191895, "global_step": 16889, "epoch": 402} {"train_loss": -5.257268905639648, "global_step": 16890, "epoch": 402} {"train_loss": -5.2331695556640625, "global_step": 16891, "epoch": 402} {"train_loss": -5.210072994232178, "global_step": 16892, "epoch": 402} {"train_loss": -5.228858947753906, "global_step": 16893, "epoch": 402} {"train_loss": -5.186266899108887, "global_step": 16894, "epoch": 402} {"train_loss": -5.2585954666137695, "global_step": 16895, "epoch": 402} {"train_loss": -5.260986804962158, "global_step": 16896, "epoch": 402} {"train_loss": -5.13661527633667, "global_step": 16897, "epoch": 402} {"train_loss": -5.1629767417907715, "global_step": 16898, "epoch": 402} {"train_loss": -5.3049116134643555, "global_step": 16899, "epoch": 402} {"train_loss": -5.243546485900879, "global_step": 16900, "epoch": 402} {"train_loss": -5.408870697021484, "global_step": 16901, "epoch": 402} {"train_loss": -5.177299499511719, "global_step": 16902, "epoch": 402} {"train_loss": -5.352256774902344, "global_step": 16903, "epoch": 402} {"train_loss": -5.4379472732543945, "global_step": 16904, "epoch": 402} {"train_loss": -5.244383335113525, "global_step": 16905, "epoch": 402} {"train_loss": -5.318539619445801, "global_step": 16906, "epoch": 402} {"train_loss": -5.150728702545166, "global_step": 16907, "epoch": 402} {"train_loss": -5.309843063354492, "global_step": 16908, "epoch": 402} {"train_loss": -5.084830284118652, "global_step": 16909, "epoch": 402} {"train_loss": -5.2361650466918945, "global_step": 16910, "epoch": 402} {"train_loss": -5.291983604431152, "global_step": 16911, "epoch": 402} {"train_loss": -5.325539588928223, "global_step": 16912, "epoch": 402} {"train_loss": -5.201319694519043, "global_step": 16913, "epoch": 402} {"train_loss": -5.320370674133301, "global_step": 16914, "epoch": 402} {"train_loss": -5.309707164764404, "global_step": 16915, "epoch": 402} {"train_loss": -5.3965582847595215, "global_step": 16916, "epoch": 402} {"train_loss": -5.199108123779297, "global_step": 16917, "epoch": 402} {"train_loss": -5.316007614135742, "global_step": 16918, "epoch": 402} {"train_loss": -5.309122085571289, "global_step": 16919, "epoch": 402} {"train_loss": -5.207964897155762, "global_step": 16920, "epoch": 402} {"train_loss": -5.301811695098877, "global_step": 16921, "epoch": 402} {"train_loss": -5.278148174285889, "global_step": 16922, "epoch": 402} {"train_loss": -5.293430805206299, "global_step": 16923, "epoch": 402} {"train_loss": -5.197936058044434, "global_step": 16924, "epoch": 402} {"train_loss": -5.256192729586647, "global_step": 16925, "epoch": 402, "val_loss": 70682.609375} {"train_loss": -5.143404006958008, "global_step": 16926, "epoch": 403} {"train_loss": -5.005028247833252, "global_step": 16927, "epoch": 403} {"train_loss": -5.207325458526611, "global_step": 16928, "epoch": 403} {"train_loss": -5.160512924194336, "global_step": 16929, "epoch": 403} {"train_loss": -5.079375267028809, "global_step": 16930, "epoch": 403} {"train_loss": -5.269169330596924, "global_step": 16931, "epoch": 403} {"train_loss": -5.179174900054932, "global_step": 16932, "epoch": 403} {"train_loss": -5.151189804077148, "global_step": 16933, "epoch": 403} {"train_loss": -5.1541748046875, "global_step": 16934, "epoch": 403} {"train_loss": -4.98558235168457, "global_step": 16935, "epoch": 403} {"train_loss": -5.213642120361328, "global_step": 16936, "epoch": 403} {"train_loss": -5.176649570465088, "global_step": 16937, "epoch": 403} {"train_loss": -5.053005695343018, "global_step": 16938, "epoch": 403} {"train_loss": -5.20276403427124, "global_step": 16939, "epoch": 403} {"train_loss": -5.233835220336914, "global_step": 16940, "epoch": 403} {"train_loss": -5.223079204559326, "global_step": 16941, "epoch": 403} {"train_loss": -5.19691801071167, "global_step": 16942, "epoch": 403} {"train_loss": -5.190265655517578, "global_step": 16943, "epoch": 403} {"train_loss": -5.226004600524902, "global_step": 16944, "epoch": 403} {"train_loss": -5.221719741821289, "global_step": 16945, "epoch": 403} {"train_loss": -5.222856521606445, "global_step": 16946, "epoch": 403} {"train_loss": -5.290134429931641, "global_step": 16947, "epoch": 403} {"train_loss": -5.239421844482422, "global_step": 16948, "epoch": 403} {"train_loss": -5.328526496887207, "global_step": 16949, "epoch": 403} {"train_loss": -5.1249847412109375, "global_step": 16950, "epoch": 403} {"train_loss": -5.259137153625488, "global_step": 16951, "epoch": 403} {"train_loss": -5.32076358795166, "global_step": 16952, "epoch": 403} {"train_loss": -5.384952545166016, "global_step": 16953, "epoch": 403} {"train_loss": -5.195125579833984, "global_step": 16954, "epoch": 403} {"train_loss": -5.2159881591796875, "global_step": 16955, "epoch": 403} {"train_loss": -5.123781204223633, "global_step": 16956, "epoch": 403} {"train_loss": -5.399827003479004, "global_step": 16957, "epoch": 403} {"train_loss": -5.233426570892334, "global_step": 16958, "epoch": 403} {"train_loss": -5.234780311584473, "global_step": 16959, "epoch": 403} {"train_loss": -5.248724937438965, "global_step": 16960, "epoch": 403} {"train_loss": -5.33599853515625, "global_step": 16961, "epoch": 403} {"train_loss": -5.230726718902588, "global_step": 16962, "epoch": 403} {"train_loss": -5.197334289550781, "global_step": 16963, "epoch": 403} {"train_loss": -5.195603847503662, "global_step": 16964, "epoch": 403} {"train_loss": -5.18693733215332, "global_step": 16965, "epoch": 403} {"train_loss": -5.275631904602051, "global_step": 16966, "epoch": 403} {"train_loss": -5.209542240415301, "global_step": 16967, "epoch": 403, "val_loss": 70244.609375} {"train_loss": -5.347448825836182, "global_step": 16968, "epoch": 404} {"train_loss": -5.227943420410156, "global_step": 16969, "epoch": 404} {"train_loss": -5.149287223815918, "global_step": 16970, "epoch": 404} {"train_loss": -5.237762928009033, "global_step": 16971, "epoch": 404} {"train_loss": -5.121789932250977, "global_step": 16972, "epoch": 404} {"train_loss": -5.390473365783691, "global_step": 16973, "epoch": 404} {"train_loss": -5.352161884307861, "global_step": 16974, "epoch": 404} {"train_loss": -5.357452392578125, "global_step": 16975, "epoch": 404} {"train_loss": -5.343753337860107, "global_step": 16976, "epoch": 404} {"train_loss": -5.248347282409668, "global_step": 16977, "epoch": 404} {"train_loss": -5.382197380065918, "global_step": 16978, "epoch": 404} {"train_loss": -5.237929821014404, "global_step": 16979, "epoch": 404} {"train_loss": -5.168874740600586, "global_step": 16980, "epoch": 404} {"train_loss": -5.3233184814453125, "global_step": 16981, "epoch": 404} {"train_loss": -5.333298683166504, "global_step": 16982, "epoch": 404} {"train_loss": -5.349961280822754, "global_step": 16983, "epoch": 404} {"train_loss": -5.3543314933776855, "global_step": 16984, "epoch": 404} {"train_loss": -5.239716529846191, "global_step": 16985, "epoch": 404} {"train_loss": -5.291691780090332, "global_step": 16986, "epoch": 404} {"train_loss": -5.293615341186523, "global_step": 16987, "epoch": 404} {"train_loss": -5.26495361328125, "global_step": 16988, "epoch": 404} {"train_loss": -5.2676544189453125, "global_step": 16989, "epoch": 404} {"train_loss": -5.238650321960449, "global_step": 16990, "epoch": 404} {"train_loss": -5.184608459472656, "global_step": 16991, "epoch": 404} {"train_loss": -5.449212074279785, "global_step": 16992, "epoch": 404} {"train_loss": -5.226787567138672, "global_step": 16993, "epoch": 404} {"train_loss": -5.149357795715332, "global_step": 16994, "epoch": 404} {"train_loss": -5.204152584075928, "global_step": 16995, "epoch": 404} {"train_loss": -5.044406414031982, "global_step": 16996, "epoch": 404} {"train_loss": -5.291347503662109, "global_step": 16997, "epoch": 404} {"train_loss": -5.245486259460449, "global_step": 16998, "epoch": 404} {"train_loss": -5.013293743133545, "global_step": 16999, "epoch": 404} {"train_loss": -5.221741676330566, "global_step": 17000, "epoch": 404} {"train_loss": -5.21651029586792, "global_step": 17001, "epoch": 404} {"train_loss": -5.099413871765137, "global_step": 17002, "epoch": 404} {"train_loss": -5.348965644836426, "global_step": 17003, "epoch": 404} {"train_loss": -5.234408855438232, "global_step": 17004, "epoch": 404} {"train_loss": -5.0973711013793945, "global_step": 17005, "epoch": 404} {"train_loss": -5.114413261413574, "global_step": 17006, "epoch": 404} {"train_loss": -4.92508602142334, "global_step": 17007, "epoch": 404} {"train_loss": -5.189070224761963, "global_step": 17008, "epoch": 404} {"train_loss": -5.233526207151867, "global_step": 17009, "epoch": 404, "val_loss": 70120.78125} {"train_loss": -5.211343765258789, "global_step": 17010, "epoch": 405} {"train_loss": -5.135931968688965, "global_step": 17011, "epoch": 405} {"train_loss": -5.190563201904297, "global_step": 17012, "epoch": 405} {"train_loss": -5.172018051147461, "global_step": 17013, "epoch": 405} {"train_loss": -5.2475738525390625, "global_step": 17014, "epoch": 405} {"train_loss": -5.219309329986572, "global_step": 17015, "epoch": 405} {"train_loss": -5.258718967437744, "global_step": 17016, "epoch": 405} {"train_loss": -5.320954322814941, "global_step": 17017, "epoch": 405} {"train_loss": -5.180948734283447, "global_step": 17018, "epoch": 405} {"train_loss": -5.089822769165039, "global_step": 17019, "epoch": 405} {"train_loss": -5.1262969970703125, "global_step": 17020, "epoch": 405} {"train_loss": -5.173473834991455, "global_step": 17021, "epoch": 405} {"train_loss": -5.267923355102539, "global_step": 17022, "epoch": 405} {"train_loss": -5.213545322418213, "global_step": 17023, "epoch": 405} {"train_loss": -5.283653259277344, "global_step": 17024, "epoch": 405} {"train_loss": -5.126646041870117, "global_step": 17025, "epoch": 405} {"train_loss": -5.165367126464844, "global_step": 17026, "epoch": 405} {"train_loss": -5.160165309906006, "global_step": 17027, "epoch": 405} {"train_loss": -5.2483015060424805, "global_step": 17028, "epoch": 405} {"train_loss": -5.263638496398926, "global_step": 17029, "epoch": 405} {"train_loss": -5.383710861206055, "global_step": 17030, "epoch": 405} {"train_loss": -5.298386096954346, "global_step": 17031, "epoch": 405} {"train_loss": -5.196502685546875, "global_step": 17032, "epoch": 405} {"train_loss": -5.365093231201172, "global_step": 17033, "epoch": 405} {"train_loss": -5.246098518371582, "global_step": 17034, "epoch": 405} {"train_loss": -5.257359504699707, "global_step": 17035, "epoch": 405} {"train_loss": -5.368657112121582, "global_step": 17036, "epoch": 405} {"train_loss": -5.131821632385254, "global_step": 17037, "epoch": 405} {"train_loss": -5.251401901245117, "global_step": 17038, "epoch": 405} {"train_loss": -5.286102294921875, "global_step": 17039, "epoch": 405} {"train_loss": -5.370891571044922, "global_step": 17040, "epoch": 405} {"train_loss": -5.056035995483398, "global_step": 17041, "epoch": 405} {"train_loss": -5.1642255783081055, "global_step": 17042, "epoch": 405} {"train_loss": -5.14067268371582, "global_step": 17043, "epoch": 405} {"train_loss": -5.071290016174316, "global_step": 17044, "epoch": 405} {"train_loss": -5.155264854431152, "global_step": 17045, "epoch": 405} {"train_loss": -5.139779090881348, "global_step": 17046, "epoch": 405} {"train_loss": -5.022033214569092, "global_step": 17047, "epoch": 405} {"train_loss": -5.2096991539001465, "global_step": 17048, "epoch": 405} {"train_loss": -5.084420204162598, "global_step": 17049, "epoch": 405} {"train_loss": -5.30388879776001, "global_step": 17050, "epoch": 405} {"train_loss": -5.205874193282354, "global_step": 17051, "epoch": 405, "val_loss": 70081.984375} {"train_loss": -5.2517900466918945, "global_step": 17052, "epoch": 406} {"train_loss": -5.320452690124512, "global_step": 17053, "epoch": 406} {"train_loss": -5.209462642669678, "global_step": 17054, "epoch": 406} {"train_loss": -5.257862091064453, "global_step": 17055, "epoch": 406} {"train_loss": -5.316132545471191, "global_step": 17056, "epoch": 406} {"train_loss": -5.293447017669678, "global_step": 17057, "epoch": 406} {"train_loss": -5.26799201965332, "global_step": 17058, "epoch": 406} {"train_loss": -5.307901382446289, "global_step": 17059, "epoch": 406} {"train_loss": -5.206284046173096, "global_step": 17060, "epoch": 406} {"train_loss": -5.306445121765137, "global_step": 17061, "epoch": 406} {"train_loss": -5.08558988571167, "global_step": 17062, "epoch": 406} {"train_loss": -5.288136959075928, "global_step": 17063, "epoch": 406} {"train_loss": -5.325567245483398, "global_step": 17064, "epoch": 406} {"train_loss": -5.274813175201416, "global_step": 17065, "epoch": 406} {"train_loss": -5.156195640563965, "global_step": 17066, "epoch": 406} {"train_loss": -5.278436183929443, "global_step": 17067, "epoch": 406} {"train_loss": -5.337506294250488, "global_step": 17068, "epoch": 406} {"train_loss": -5.201900005340576, "global_step": 17069, "epoch": 406} {"train_loss": -5.216152191162109, "global_step": 17070, "epoch": 406} {"train_loss": -5.216157913208008, "global_step": 17071, "epoch": 406} {"train_loss": -5.227231979370117, "global_step": 17072, "epoch": 406} {"train_loss": -5.199843883514404, "global_step": 17073, "epoch": 406} {"train_loss": -5.309654235839844, "global_step": 17074, "epoch": 406} {"train_loss": -5.1740875244140625, "global_step": 17075, "epoch": 406} {"train_loss": -5.253647804260254, "global_step": 17076, "epoch": 406} {"train_loss": -5.344611644744873, "global_step": 17077, "epoch": 406} {"train_loss": -5.16469669342041, "global_step": 17078, "epoch": 406} {"train_loss": -5.164960861206055, "global_step": 17079, "epoch": 406} {"train_loss": -5.32335090637207, "global_step": 17080, "epoch": 406} {"train_loss": -5.250551223754883, "global_step": 17081, "epoch": 406} {"train_loss": -5.18233060836792, "global_step": 17082, "epoch": 406} {"train_loss": -5.356906890869141, "global_step": 17083, "epoch": 406} {"train_loss": -5.191173553466797, "global_step": 17084, "epoch": 406} {"train_loss": -5.274810791015625, "global_step": 17085, "epoch": 406} {"train_loss": -5.202564239501953, "global_step": 17086, "epoch": 406} {"train_loss": -5.320108413696289, "global_step": 17087, "epoch": 406} {"train_loss": -5.349199295043945, "global_step": 17088, "epoch": 406} {"train_loss": -5.343052387237549, "global_step": 17089, "epoch": 406} {"train_loss": -5.186304092407227, "global_step": 17090, "epoch": 406} {"train_loss": -5.209002494812012, "global_step": 17091, "epoch": 406} {"train_loss": -5.235884189605713, "global_step": 17092, "epoch": 406} {"train_loss": -5.255218664805095, "global_step": 17093, "epoch": 406, "val_loss": 70302.2109375} {"train_loss": -5.255121231079102, "global_step": 17094, "epoch": 407} {"train_loss": -5.221234321594238, "global_step": 17095, "epoch": 407} {"train_loss": -5.298597812652588, "global_step": 17096, "epoch": 407} {"train_loss": -5.058145999908447, "global_step": 17097, "epoch": 407} {"train_loss": -5.346964359283447, "global_step": 17098, "epoch": 407} {"train_loss": -5.1475934982299805, "global_step": 17099, "epoch": 407} {"train_loss": -5.181423187255859, "global_step": 17100, "epoch": 407} {"train_loss": -5.343812942504883, "global_step": 17101, "epoch": 407} {"train_loss": -5.2910871505737305, "global_step": 17102, "epoch": 407} {"train_loss": -5.306822776794434, "global_step": 17103, "epoch": 407} {"train_loss": -5.362971305847168, "global_step": 17104, "epoch": 407} {"train_loss": -5.1593217849731445, "global_step": 17105, "epoch": 407} {"train_loss": -5.27025842666626, "global_step": 17106, "epoch": 407} {"train_loss": -5.403247356414795, "global_step": 17107, "epoch": 407} {"train_loss": -5.20042610168457, "global_step": 17108, "epoch": 407} {"train_loss": -5.233767509460449, "global_step": 17109, "epoch": 407} {"train_loss": -5.246879577636719, "global_step": 17110, "epoch": 407} {"train_loss": -5.359476566314697, "global_step": 17111, "epoch": 407} {"train_loss": -5.359427452087402, "global_step": 17112, "epoch": 407} {"train_loss": -5.309301376342773, "global_step": 17113, "epoch": 407} {"train_loss": -5.174378395080566, "global_step": 17114, "epoch": 407} {"train_loss": -5.10398006439209, "global_step": 17115, "epoch": 407} {"train_loss": -5.185880184173584, "global_step": 17116, "epoch": 407} {"train_loss": -5.1795549392700195, "global_step": 17117, "epoch": 407} {"train_loss": -5.211911201477051, "global_step": 17118, "epoch": 407} {"train_loss": -5.235828399658203, "global_step": 17119, "epoch": 407} {"train_loss": -5.219361305236816, "global_step": 17120, "epoch": 407} {"train_loss": -5.349428176879883, "global_step": 17121, "epoch": 407} {"train_loss": -5.362530708312988, "global_step": 17122, "epoch": 407} {"train_loss": -5.365569114685059, "global_step": 17123, "epoch": 407} {"train_loss": -5.241001129150391, "global_step": 17124, "epoch": 407} {"train_loss": -5.133011817932129, "global_step": 17125, "epoch": 407} {"train_loss": -5.3025617599487305, "global_step": 17126, "epoch": 407} {"train_loss": -5.235075950622559, "global_step": 17127, "epoch": 407} {"train_loss": -5.270654678344727, "global_step": 17128, "epoch": 407} {"train_loss": -5.286665916442871, "global_step": 17129, "epoch": 407} {"train_loss": -5.191547393798828, "global_step": 17130, "epoch": 407} {"train_loss": -5.240508556365967, "global_step": 17131, "epoch": 407} {"train_loss": -5.2357282638549805, "global_step": 17132, "epoch": 407} {"train_loss": -5.319040298461914, "global_step": 17133, "epoch": 407} {"train_loss": -5.2226362228393555, "global_step": 17134, "epoch": 407} {"train_loss": -5.256589492162068, "global_step": 17135, "epoch": 407, "val_loss": 70057.3125} {"train_loss": -5.496323108673096, "global_step": 17136, "epoch": 408} {"train_loss": -5.19542121887207, "global_step": 17137, "epoch": 408} {"train_loss": -5.239644527435303, "global_step": 17138, "epoch": 408} {"train_loss": -5.172860145568848, "global_step": 17139, "epoch": 408} {"train_loss": -5.3701090812683105, "global_step": 17140, "epoch": 408} {"train_loss": -5.139708518981934, "global_step": 17141, "epoch": 408} {"train_loss": -5.248770713806152, "global_step": 17142, "epoch": 408} {"train_loss": -5.232028961181641, "global_step": 17143, "epoch": 408} {"train_loss": -5.180712699890137, "global_step": 17144, "epoch": 408} {"train_loss": -5.243068695068359, "global_step": 17145, "epoch": 408} {"train_loss": -5.351637840270996, "global_step": 17146, "epoch": 408} {"train_loss": -5.370930194854736, "global_step": 17147, "epoch": 408} {"train_loss": -5.184944152832031, "global_step": 17148, "epoch": 408} {"train_loss": -5.284552574157715, "global_step": 17149, "epoch": 408} {"train_loss": -5.159881591796875, "global_step": 17150, "epoch": 408} {"train_loss": -5.283789157867432, "global_step": 17151, "epoch": 408} {"train_loss": -5.311798095703125, "global_step": 17152, "epoch": 408} {"train_loss": -5.258363723754883, "global_step": 17153, "epoch": 408} {"train_loss": -5.185334205627441, "global_step": 17154, "epoch": 408} {"train_loss": -5.187422275543213, "global_step": 17155, "epoch": 408} {"train_loss": -5.230738162994385, "global_step": 17156, "epoch": 408} {"train_loss": -5.173361301422119, "global_step": 17157, "epoch": 408} {"train_loss": -5.083277702331543, "global_step": 17158, "epoch": 408} {"train_loss": -5.29999303817749, "global_step": 17159, "epoch": 408} {"train_loss": -5.266598224639893, "global_step": 17160, "epoch": 408} {"train_loss": -5.23680305480957, "global_step": 17161, "epoch": 408} {"train_loss": -5.289525985717773, "global_step": 17162, "epoch": 408} {"train_loss": -5.2191572189331055, "global_step": 17163, "epoch": 408} {"train_loss": -5.154106616973877, "global_step": 17164, "epoch": 408} {"train_loss": -5.208992004394531, "global_step": 17165, "epoch": 408} {"train_loss": -5.356908798217773, "global_step": 17166, "epoch": 408} {"train_loss": -5.163060188293457, "global_step": 17167, "epoch": 408} {"train_loss": -5.252878189086914, "global_step": 17168, "epoch": 408} {"train_loss": -5.191324234008789, "global_step": 17169, "epoch": 408} {"train_loss": -5.337239742279053, "global_step": 17170, "epoch": 408} {"train_loss": -5.1866865158081055, "global_step": 17171, "epoch": 408} {"train_loss": -5.270537376403809, "global_step": 17172, "epoch": 408} {"train_loss": -5.262576103210449, "global_step": 17173, "epoch": 408} {"train_loss": -5.209167003631592, "global_step": 17174, "epoch": 408} {"train_loss": -5.204998970031738, "global_step": 17175, "epoch": 408} {"train_loss": -5.358749866485596, "global_step": 17176, "epoch": 408} {"train_loss": -5.2464720748719715, "global_step": 17177, "epoch": 408, "val_loss": 69988.765625} {"train_loss": -5.297053813934326, "global_step": 17178, "epoch": 409} {"train_loss": -5.2523651123046875, "global_step": 17179, "epoch": 409} {"train_loss": -5.260402202606201, "global_step": 17180, "epoch": 409} {"train_loss": -5.250439167022705, "global_step": 17181, "epoch": 409} {"train_loss": -5.371851921081543, "global_step": 17182, "epoch": 409} {"train_loss": -5.245290279388428, "global_step": 17183, "epoch": 409} {"train_loss": -5.229982852935791, "global_step": 17184, "epoch": 409} {"train_loss": -5.191865921020508, "global_step": 17185, "epoch": 409} {"train_loss": -5.263195991516113, "global_step": 17186, "epoch": 409} {"train_loss": -5.3487701416015625, "global_step": 17187, "epoch": 409} {"train_loss": -5.257969379425049, "global_step": 17188, "epoch": 409} {"train_loss": -5.368430137634277, "global_step": 17189, "epoch": 409} {"train_loss": -5.224833011627197, "global_step": 17190, "epoch": 409} {"train_loss": -5.295495986938477, "global_step": 17191, "epoch": 409} {"train_loss": -5.273797512054443, "global_step": 17192, "epoch": 409} {"train_loss": -5.133905410766602, "global_step": 17193, "epoch": 409} {"train_loss": -5.254913330078125, "global_step": 17194, "epoch": 409} {"train_loss": -5.298395156860352, "global_step": 17195, "epoch": 409} {"train_loss": -5.2288713455200195, "global_step": 17196, "epoch": 409} {"train_loss": -5.178893089294434, "global_step": 17197, "epoch": 409} {"train_loss": -5.327549934387207, "global_step": 17198, "epoch": 409} {"train_loss": -5.268595218658447, "global_step": 17199, "epoch": 409} {"train_loss": -5.312709808349609, "global_step": 17200, "epoch": 409} {"train_loss": -5.270014762878418, "global_step": 17201, "epoch": 409} {"train_loss": -5.400798797607422, "global_step": 17202, "epoch": 409} {"train_loss": -5.196964263916016, "global_step": 17203, "epoch": 409} {"train_loss": -5.172880172729492, "global_step": 17204, "epoch": 409} {"train_loss": -5.198534965515137, "global_step": 17205, "epoch": 409} {"train_loss": -5.291513442993164, "global_step": 17206, "epoch": 409} {"train_loss": -5.214591979980469, "global_step": 17207, "epoch": 409} {"train_loss": -5.285792350769043, "global_step": 17208, "epoch": 409} {"train_loss": -5.418033599853516, "global_step": 17209, "epoch": 409} {"train_loss": -5.280111312866211, "global_step": 17210, "epoch": 409} {"train_loss": -5.335562705993652, "global_step": 17211, "epoch": 409} {"train_loss": -5.169625759124756, "global_step": 17212, "epoch": 409} {"train_loss": -5.277261257171631, "global_step": 17213, "epoch": 409} {"train_loss": -5.412440299987793, "global_step": 17214, "epoch": 409} {"train_loss": -5.200684547424316, "global_step": 17215, "epoch": 409} {"train_loss": -5.294621467590332, "global_step": 17216, "epoch": 409} {"train_loss": -5.252871513366699, "global_step": 17217, "epoch": 409} {"train_loss": -5.198921203613281, "global_step": 17218, "epoch": 409} {"train_loss": -5.268676428567796, "global_step": 17219, "epoch": 409, "val_loss": 69792.0078125} {"train_loss": -5.193680286407471, "global_step": 17220, "epoch": 410} {"train_loss": -5.1698479652404785, "global_step": 17221, "epoch": 410} {"train_loss": -5.340123176574707, "global_step": 17222, "epoch": 410} {"train_loss": -5.232172966003418, "global_step": 17223, "epoch": 410} {"train_loss": -5.2480082511901855, "global_step": 17224, "epoch": 410} {"train_loss": -5.317028999328613, "global_step": 17225, "epoch": 410} {"train_loss": -5.3055500984191895, "global_step": 17226, "epoch": 410} {"train_loss": -5.280392646789551, "global_step": 17227, "epoch": 410} {"train_loss": -5.259871482849121, "global_step": 17228, "epoch": 410} {"train_loss": -5.332467555999756, "global_step": 17229, "epoch": 410} {"train_loss": -5.117520332336426, "global_step": 17230, "epoch": 410} {"train_loss": -5.2235307693481445, "global_step": 17231, "epoch": 410} {"train_loss": -5.308685779571533, "global_step": 17232, "epoch": 410} {"train_loss": -5.2916059494018555, "global_step": 17233, "epoch": 410} {"train_loss": -5.328945636749268, "global_step": 17234, "epoch": 410} {"train_loss": -5.296038627624512, "global_step": 17235, "epoch": 410} {"train_loss": -5.366935729980469, "global_step": 17236, "epoch": 410} {"train_loss": -5.317460060119629, "global_step": 17237, "epoch": 410} {"train_loss": -5.328456401824951, "global_step": 17238, "epoch": 410} {"train_loss": -5.355340003967285, "global_step": 17239, "epoch": 410} {"train_loss": -5.272504806518555, "global_step": 17240, "epoch": 410} {"train_loss": -5.154739856719971, "global_step": 17241, "epoch": 410} {"train_loss": -5.2866621017456055, "global_step": 17242, "epoch": 410} {"train_loss": -5.200631618499756, "global_step": 17243, "epoch": 410} {"train_loss": -5.241066932678223, "global_step": 17244, "epoch": 410} {"train_loss": -5.348766326904297, "global_step": 17245, "epoch": 410} {"train_loss": -5.220264434814453, "global_step": 17246, "epoch": 410} {"train_loss": -5.267716407775879, "global_step": 17247, "epoch": 410} {"train_loss": -5.325081825256348, "global_step": 17248, "epoch": 410} {"train_loss": -5.218656539916992, "global_step": 17249, "epoch": 410} {"train_loss": -5.207350730895996, "global_step": 17250, "epoch": 410} {"train_loss": -5.127346038818359, "global_step": 17251, "epoch": 410} {"train_loss": -5.349017143249512, "global_step": 17252, "epoch": 410} {"train_loss": -5.349102020263672, "global_step": 17253, "epoch": 410} {"train_loss": -5.257007122039795, "global_step": 17254, "epoch": 410} {"train_loss": -5.366152763366699, "global_step": 17255, "epoch": 410} {"train_loss": -5.15156364440918, "global_step": 17256, "epoch": 410} {"train_loss": -5.304756164550781, "global_step": 17257, "epoch": 410} {"train_loss": -5.406982421875, "global_step": 17258, "epoch": 410} {"train_loss": -5.329350471496582, "global_step": 17259, "epoch": 410} {"train_loss": -5.200690269470215, "global_step": 17260, "epoch": 410} {"train_loss": -5.269434599649339, "global_step": 17261, "epoch": 410, "val_loss": 70449.234375} {"train_loss": -5.190167427062988, "global_step": 17262, "epoch": 411} {"train_loss": -5.2379350662231445, "global_step": 17263, "epoch": 411} {"train_loss": -5.242915153503418, "global_step": 17264, "epoch": 411} {"train_loss": -5.141282081604004, "global_step": 17265, "epoch": 411} {"train_loss": -5.150765419006348, "global_step": 17266, "epoch": 411} {"train_loss": -5.091426849365234, "global_step": 17267, "epoch": 411} {"train_loss": -5.320796966552734, "global_step": 17268, "epoch": 411} {"train_loss": -5.262178421020508, "global_step": 17269, "epoch": 411} {"train_loss": -5.234420299530029, "global_step": 17270, "epoch": 411} {"train_loss": -5.255483627319336, "global_step": 17271, "epoch": 411} {"train_loss": -5.311030387878418, "global_step": 17272, "epoch": 411} {"train_loss": -5.294924259185791, "global_step": 17273, "epoch": 411} {"train_loss": -5.228611946105957, "global_step": 17274, "epoch": 411} {"train_loss": -5.151110649108887, "global_step": 17275, "epoch": 411} {"train_loss": -5.230110168457031, "global_step": 17276, "epoch": 411} {"train_loss": -5.284988880157471, "global_step": 17277, "epoch": 411} {"train_loss": -5.216317653656006, "global_step": 17278, "epoch": 411} {"train_loss": -5.265078544616699, "global_step": 17279, "epoch": 411} {"train_loss": -5.308722496032715, "global_step": 17280, "epoch": 411} {"train_loss": -5.197123050689697, "global_step": 17281, "epoch": 411} {"train_loss": -5.30623722076416, "global_step": 17282, "epoch": 411} {"train_loss": -5.258312702178955, "global_step": 17283, "epoch": 411} {"train_loss": -5.247520923614502, "global_step": 17284, "epoch": 411} {"train_loss": -5.284858703613281, "global_step": 17285, "epoch": 411} {"train_loss": -5.425897598266602, "global_step": 17286, "epoch": 411} {"train_loss": -5.230648994445801, "global_step": 17287, "epoch": 411} {"train_loss": -5.245794296264648, "global_step": 17288, "epoch": 411} {"train_loss": -5.348011016845703, "global_step": 17289, "epoch": 411} {"train_loss": -5.169098854064941, "global_step": 17290, "epoch": 411} {"train_loss": -5.230427265167236, "global_step": 17291, "epoch": 411} {"train_loss": -5.213451385498047, "global_step": 17292, "epoch": 411} {"train_loss": -5.330606460571289, "global_step": 17293, "epoch": 411} {"train_loss": -5.18870735168457, "global_step": 17294, "epoch": 411} {"train_loss": -5.201089859008789, "global_step": 17295, "epoch": 411} {"train_loss": -5.3968682289123535, "global_step": 17296, "epoch": 411} {"train_loss": -5.266290664672852, "global_step": 17297, "epoch": 411} {"train_loss": -5.343316555023193, "global_step": 17298, "epoch": 411} {"train_loss": -5.256983757019043, "global_step": 17299, "epoch": 411} {"train_loss": -5.279519081115723, "global_step": 17300, "epoch": 411} {"train_loss": -5.242555618286133, "global_step": 17301, "epoch": 411} {"train_loss": -5.07069730758667, "global_step": 17302, "epoch": 411} {"train_loss": -5.244294257391067, "global_step": 17303, "epoch": 411, "val_loss": 70280.8671875} {"train_loss": -5.217708110809326, "global_step": 17304, "epoch": 412} {"train_loss": -5.371450424194336, "global_step": 17305, "epoch": 412} {"train_loss": -5.021522045135498, "global_step": 17306, "epoch": 412} {"train_loss": -5.287519454956055, "global_step": 17307, "epoch": 412} {"train_loss": -5.339354515075684, "global_step": 17308, "epoch": 412} {"train_loss": -5.156033515930176, "global_step": 17309, "epoch": 412} {"train_loss": -5.23500919342041, "global_step": 17310, "epoch": 412} {"train_loss": -5.229156017303467, "global_step": 17311, "epoch": 412} {"train_loss": -5.069518089294434, "global_step": 17312, "epoch": 412} {"train_loss": -5.220794677734375, "global_step": 17313, "epoch": 412} {"train_loss": -5.398521423339844, "global_step": 17314, "epoch": 412} {"train_loss": -5.188580513000488, "global_step": 17315, "epoch": 412} {"train_loss": -5.196728706359863, "global_step": 17316, "epoch": 412} {"train_loss": -5.258984088897705, "global_step": 17317, "epoch": 412} {"train_loss": -5.294532299041748, "global_step": 17318, "epoch": 412} {"train_loss": -5.2024922370910645, "global_step": 17319, "epoch": 412} {"train_loss": -5.194845199584961, "global_step": 17320, "epoch": 412} {"train_loss": -5.204844951629639, "global_step": 17321, "epoch": 412} {"train_loss": -5.189757347106934, "global_step": 17322, "epoch": 412} {"train_loss": -5.400563716888428, "global_step": 17323, "epoch": 412} {"train_loss": -5.238801002502441, "global_step": 17324, "epoch": 412} {"train_loss": -5.225962162017822, "global_step": 17325, "epoch": 412} {"train_loss": -5.293941974639893, "global_step": 17326, "epoch": 412} {"train_loss": -5.246042728424072, "global_step": 17327, "epoch": 412} {"train_loss": -5.145909309387207, "global_step": 17328, "epoch": 412} {"train_loss": -5.292883396148682, "global_step": 17329, "epoch": 412} {"train_loss": -5.124977111816406, "global_step": 17330, "epoch": 412} {"train_loss": -5.283934593200684, "global_step": 17331, "epoch": 412} {"train_loss": -5.181682586669922, "global_step": 17332, "epoch": 412} {"train_loss": -5.294864654541016, "global_step": 17333, "epoch": 412} {"train_loss": -5.237972259521484, "global_step": 17334, "epoch": 412} {"train_loss": -5.347591876983643, "global_step": 17335, "epoch": 412} {"train_loss": -5.285109519958496, "global_step": 17336, "epoch": 412} {"train_loss": -5.307442665100098, "global_step": 17337, "epoch": 412} {"train_loss": -5.258572578430176, "global_step": 17338, "epoch": 412} {"train_loss": -5.215624809265137, "global_step": 17339, "epoch": 412} {"train_loss": -5.262175559997559, "global_step": 17340, "epoch": 412} {"train_loss": -5.303583145141602, "global_step": 17341, "epoch": 412} {"train_loss": -5.300012111663818, "global_step": 17342, "epoch": 412} {"train_loss": -5.227569580078125, "global_step": 17343, "epoch": 412} {"train_loss": -5.291123390197754, "global_step": 17344, "epoch": 412} {"train_loss": -5.2432632219223745, "global_step": 17345, "epoch": 412, "val_loss": 70141.2578125} {"train_loss": -5.21442985534668, "global_step": 17346, "epoch": 413} {"train_loss": -5.298062801361084, "global_step": 17347, "epoch": 413} {"train_loss": -5.292940139770508, "global_step": 17348, "epoch": 413} {"train_loss": -5.222720146179199, "global_step": 17349, "epoch": 413} {"train_loss": -5.3365044593811035, "global_step": 17350, "epoch": 413} {"train_loss": -5.309635639190674, "global_step": 17351, "epoch": 413} {"train_loss": -5.179110527038574, "global_step": 17352, "epoch": 413} {"train_loss": -5.255926132202148, "global_step": 17353, "epoch": 413} {"train_loss": -5.205984115600586, "global_step": 17354, "epoch": 413} {"train_loss": -5.247419357299805, "global_step": 17355, "epoch": 413} {"train_loss": -5.175826549530029, "global_step": 17356, "epoch": 413} {"train_loss": -5.2760009765625, "global_step": 17357, "epoch": 413} {"train_loss": -5.180583953857422, "global_step": 17358, "epoch": 413} {"train_loss": -5.070553779602051, "global_step": 17359, "epoch": 413} {"train_loss": -5.161763668060303, "global_step": 17360, "epoch": 413} {"train_loss": -5.18076229095459, "global_step": 17361, "epoch": 413} {"train_loss": -5.289585113525391, "global_step": 17362, "epoch": 413} {"train_loss": -5.17286491394043, "global_step": 17363, "epoch": 413} {"train_loss": -4.997435569763184, "global_step": 17364, "epoch": 413} {"train_loss": -5.194026947021484, "global_step": 17365, "epoch": 413} {"train_loss": -5.198244094848633, "global_step": 17366, "epoch": 413} {"train_loss": -5.1512579917907715, "global_step": 17367, "epoch": 413} {"train_loss": -5.2639031410217285, "global_step": 17368, "epoch": 413} {"train_loss": -5.121427536010742, "global_step": 17369, "epoch": 413} {"train_loss": -5.212660789489746, "global_step": 17370, "epoch": 413} {"train_loss": -5.146747589111328, "global_step": 17371, "epoch": 413} {"train_loss": -5.179419040679932, "global_step": 17372, "epoch": 413} {"train_loss": -5.29328727722168, "global_step": 17373, "epoch": 413} {"train_loss": -5.258172988891602, "global_step": 17374, "epoch": 413} {"train_loss": -5.353424072265625, "global_step": 17375, "epoch": 413} {"train_loss": -5.337801456451416, "global_step": 17376, "epoch": 413} {"train_loss": -5.261209011077881, "global_step": 17377, "epoch": 413} {"train_loss": -5.190907955169678, "global_step": 17378, "epoch": 413} {"train_loss": -5.288243293762207, "global_step": 17379, "epoch": 413} {"train_loss": -5.163149356842041, "global_step": 17380, "epoch": 413} {"train_loss": -5.206124305725098, "global_step": 17381, "epoch": 413} {"train_loss": -5.233978271484375, "global_step": 17382, "epoch": 413} {"train_loss": -5.185126304626465, "global_step": 17383, "epoch": 413} {"train_loss": -5.229931831359863, "global_step": 17384, "epoch": 413} {"train_loss": -5.147817611694336, "global_step": 17385, "epoch": 413} {"train_loss": -5.086601257324219, "global_step": 17386, "epoch": 413} {"train_loss": -5.212947084790184, "global_step": 17387, "epoch": 413, "val_loss": 70115.2421875} {"train_loss": -5.039978981018066, "global_step": 17388, "epoch": 414} {"train_loss": -5.1198530197143555, "global_step": 17389, "epoch": 414} {"train_loss": -5.127050399780273, "global_step": 17390, "epoch": 414} {"train_loss": -5.177277565002441, "global_step": 17391, "epoch": 414} {"train_loss": -5.290167331695557, "global_step": 17392, "epoch": 414} {"train_loss": -5.20897912979126, "global_step": 17393, "epoch": 414} {"train_loss": -5.117448329925537, "global_step": 17394, "epoch": 414} {"train_loss": -5.2658610343933105, "global_step": 17395, "epoch": 414} {"train_loss": -5.264153480529785, "global_step": 17396, "epoch": 414} {"train_loss": -5.247203350067139, "global_step": 17397, "epoch": 414} {"train_loss": -5.135541915893555, "global_step": 17398, "epoch": 414} {"train_loss": -5.2389678955078125, "global_step": 17399, "epoch": 414} {"train_loss": -5.070712566375732, "global_step": 17400, "epoch": 414} {"train_loss": -5.2241010665893555, "global_step": 17401, "epoch": 414} {"train_loss": -5.18814754486084, "global_step": 17402, "epoch": 414} {"train_loss": -5.274700164794922, "global_step": 17403, "epoch": 414} {"train_loss": -5.210218906402588, "global_step": 17404, "epoch": 414} {"train_loss": -5.249174118041992, "global_step": 17405, "epoch": 414} {"train_loss": -5.160689353942871, "global_step": 17406, "epoch": 414} {"train_loss": -5.20867395401001, "global_step": 17407, "epoch": 414} {"train_loss": -5.2800798416137695, "global_step": 17408, "epoch": 414} {"train_loss": -5.299434661865234, "global_step": 17409, "epoch": 414} {"train_loss": -5.325676918029785, "global_step": 17410, "epoch": 414} {"train_loss": -5.2441864013671875, "global_step": 17411, "epoch": 414} {"train_loss": -5.341935157775879, "global_step": 17412, "epoch": 414} {"train_loss": -5.285179615020752, "global_step": 17413, "epoch": 414} {"train_loss": -5.328209400177002, "global_step": 17414, "epoch": 414} {"train_loss": -5.1623687744140625, "global_step": 17415, "epoch": 414} {"train_loss": -5.327354907989502, "global_step": 17416, "epoch": 414} {"train_loss": -5.32247257232666, "global_step": 17417, "epoch": 414} {"train_loss": -5.224923133850098, "global_step": 17418, "epoch": 414} {"train_loss": -5.343845844268799, "global_step": 17419, "epoch": 414} {"train_loss": -5.272712707519531, "global_step": 17420, "epoch": 414} {"train_loss": -5.266805648803711, "global_step": 17421, "epoch": 414} {"train_loss": -5.298349380493164, "global_step": 17422, "epoch": 414} {"train_loss": -5.105315685272217, "global_step": 17423, "epoch": 414} {"train_loss": -5.149928569793701, "global_step": 17424, "epoch": 414} {"train_loss": -5.322002410888672, "global_step": 17425, "epoch": 414} {"train_loss": -5.28169059753418, "global_step": 17426, "epoch": 414} {"train_loss": -5.2063751220703125, "global_step": 17427, "epoch": 414} {"train_loss": -5.245466232299805, "global_step": 17428, "epoch": 414} {"train_loss": -5.226294483457293, "global_step": 17429, "epoch": 414, "val_loss": 69986.390625} {"train_loss": -5.1368489265441895, "global_step": 17430, "epoch": 415} {"train_loss": -5.273935794830322, "global_step": 17431, "epoch": 415} {"train_loss": -5.259166717529297, "global_step": 17432, "epoch": 415} {"train_loss": -5.193310737609863, "global_step": 17433, "epoch": 415} {"train_loss": -5.255275249481201, "global_step": 17434, "epoch": 415} {"train_loss": -5.221421241760254, "global_step": 17435, "epoch": 415} {"train_loss": -5.28812837600708, "global_step": 17436, "epoch": 415} {"train_loss": -5.318504333496094, "global_step": 17437, "epoch": 415} {"train_loss": -5.148609161376953, "global_step": 17438, "epoch": 415} {"train_loss": -5.533951759338379, "global_step": 17439, "epoch": 415} {"train_loss": -5.217546463012695, "global_step": 17440, "epoch": 415} {"train_loss": -5.3365678787231445, "global_step": 17441, "epoch": 415} {"train_loss": -5.265592575073242, "global_step": 17442, "epoch": 415} {"train_loss": -5.2423553466796875, "global_step": 17443, "epoch": 415} {"train_loss": -5.122437477111816, "global_step": 17444, "epoch": 415} {"train_loss": -5.202785491943359, "global_step": 17445, "epoch": 415} {"train_loss": -5.381509780883789, "global_step": 17446, "epoch": 415} {"train_loss": -5.370025634765625, "global_step": 17447, "epoch": 415} {"train_loss": -5.242944717407227, "global_step": 17448, "epoch": 415} {"train_loss": -5.385730743408203, "global_step": 17449, "epoch": 415} {"train_loss": -5.276030540466309, "global_step": 17450, "epoch": 415} {"train_loss": -5.241739273071289, "global_step": 17451, "epoch": 415} {"train_loss": -5.1356306076049805, "global_step": 17452, "epoch": 415} {"train_loss": -5.260759353637695, "global_step": 17453, "epoch": 415} {"train_loss": -5.326438903808594, "global_step": 17454, "epoch": 415} {"train_loss": -5.225246429443359, "global_step": 17455, "epoch": 415} {"train_loss": -5.199179172515869, "global_step": 17456, "epoch": 415} {"train_loss": -5.277227401733398, "global_step": 17457, "epoch": 415} {"train_loss": -5.260353088378906, "global_step": 17458, "epoch": 415} {"train_loss": -5.282107353210449, "global_step": 17459, "epoch": 415} {"train_loss": -5.296383380889893, "global_step": 17460, "epoch": 415} {"train_loss": -5.304038047790527, "global_step": 17461, "epoch": 415} {"train_loss": -5.188782691955566, "global_step": 17462, "epoch": 415} {"train_loss": -5.287999153137207, "global_step": 17463, "epoch": 415} {"train_loss": -5.349601745605469, "global_step": 17464, "epoch": 415} {"train_loss": -5.461162567138672, "global_step": 17465, "epoch": 415} {"train_loss": -5.228485584259033, "global_step": 17466, "epoch": 415} {"train_loss": -5.325612545013428, "global_step": 17467, "epoch": 415} {"train_loss": -5.335898399353027, "global_step": 17468, "epoch": 415} {"train_loss": -5.344016075134277, "global_step": 17469, "epoch": 415} {"train_loss": -5.323480606079102, "global_step": 17470, "epoch": 415} {"train_loss": -5.276917151042393, "global_step": 17471, "epoch": 415, "val_loss": 70106.7421875} {"train_loss": -5.2944841384887695, "global_step": 17472, "epoch": 416} {"train_loss": -5.103809356689453, "global_step": 17473, "epoch": 416} {"train_loss": -5.287547588348389, "global_step": 17474, "epoch": 416} {"train_loss": -5.379482269287109, "global_step": 17475, "epoch": 416} {"train_loss": -5.263667106628418, "global_step": 17476, "epoch": 416} {"train_loss": -5.282485008239746, "global_step": 17477, "epoch": 416} {"train_loss": -5.203595161437988, "global_step": 17478, "epoch": 416} {"train_loss": -5.248085021972656, "global_step": 17479, "epoch": 416} {"train_loss": -5.187606334686279, "global_step": 17480, "epoch": 416} {"train_loss": -5.271610260009766, "global_step": 17481, "epoch": 416} {"train_loss": -5.2552900314331055, "global_step": 17482, "epoch": 416} {"train_loss": -5.02884578704834, "global_step": 17483, "epoch": 416} {"train_loss": -5.390114784240723, "global_step": 17484, "epoch": 416} {"train_loss": -5.296486854553223, "global_step": 17485, "epoch": 416} {"train_loss": -5.322724342346191, "global_step": 17486, "epoch": 416} {"train_loss": -5.172358989715576, "global_step": 17487, "epoch": 416} {"train_loss": -5.1375908851623535, "global_step": 17488, "epoch": 416} {"train_loss": -5.192317008972168, "global_step": 17489, "epoch": 416} {"train_loss": -5.313257217407227, "global_step": 17490, "epoch": 416} {"train_loss": -5.109477996826172, "global_step": 17491, "epoch": 416} {"train_loss": -5.254969120025635, "global_step": 17492, "epoch": 416} {"train_loss": -5.224255561828613, "global_step": 17493, "epoch": 416} {"train_loss": -5.214790344238281, "global_step": 17494, "epoch": 416} {"train_loss": -5.1160125732421875, "global_step": 17495, "epoch": 416} {"train_loss": -5.247154712677002, "global_step": 17496, "epoch": 416} {"train_loss": -5.381802082061768, "global_step": 17497, "epoch": 416} {"train_loss": -5.224665641784668, "global_step": 17498, "epoch": 416} {"train_loss": -5.3653974533081055, "global_step": 17499, "epoch": 416} {"train_loss": -5.1549153327941895, "global_step": 17500, "epoch": 416} {"train_loss": -5.30175256729126, "global_step": 17501, "epoch": 416} {"train_loss": -5.209507465362549, "global_step": 17502, "epoch": 416} {"train_loss": -5.31056547164917, "global_step": 17503, "epoch": 416} {"train_loss": -5.308633327484131, "global_step": 17504, "epoch": 416} {"train_loss": -5.353092670440674, "global_step": 17505, "epoch": 416} {"train_loss": -5.269069671630859, "global_step": 17506, "epoch": 416} {"train_loss": -5.335047721862793, "global_step": 17507, "epoch": 416} {"train_loss": -5.30493688583374, "global_step": 17508, "epoch": 416} {"train_loss": -5.233248233795166, "global_step": 17509, "epoch": 416} {"train_loss": -5.296938419342041, "global_step": 17510, "epoch": 416} {"train_loss": -5.1345415115356445, "global_step": 17511, "epoch": 416} {"train_loss": -5.232255935668945, "global_step": 17512, "epoch": 416} {"train_loss": -5.249767144521077, "global_step": 17513, "epoch": 416, "val_loss": 70396.640625} {"train_loss": -5.3343987464904785, "global_step": 17514, "epoch": 417} {"train_loss": -5.309684753417969, "global_step": 17515, "epoch": 417} {"train_loss": -5.370781421661377, "global_step": 17516, "epoch": 417} {"train_loss": -5.343209266662598, "global_step": 17517, "epoch": 417} {"train_loss": -5.261157989501953, "global_step": 17518, "epoch": 417} {"train_loss": -5.281219005584717, "global_step": 17519, "epoch": 417} {"train_loss": -5.335858345031738, "global_step": 17520, "epoch": 417} {"train_loss": -5.4062042236328125, "global_step": 17521, "epoch": 417} {"train_loss": -5.28102970123291, "global_step": 17522, "epoch": 417} {"train_loss": -5.253714561462402, "global_step": 17523, "epoch": 417} {"train_loss": -5.317984104156494, "global_step": 17524, "epoch": 417} {"train_loss": -5.277376651763916, "global_step": 17525, "epoch": 417} {"train_loss": -5.1375041007995605, "global_step": 17526, "epoch": 417} {"train_loss": -5.123100757598877, "global_step": 17527, "epoch": 417} {"train_loss": -5.289312362670898, "global_step": 17528, "epoch": 417} {"train_loss": -5.289401054382324, "global_step": 17529, "epoch": 417} {"train_loss": -5.286569595336914, "global_step": 17530, "epoch": 417} {"train_loss": -5.165959358215332, "global_step": 17531, "epoch": 417} {"train_loss": -5.20658016204834, "global_step": 17532, "epoch": 417} {"train_loss": -5.097002029418945, "global_step": 17533, "epoch": 417} {"train_loss": -5.172460079193115, "global_step": 17534, "epoch": 417} {"train_loss": -5.101794719696045, "global_step": 17535, "epoch": 417} {"train_loss": -4.9968461990356445, "global_step": 17536, "epoch": 417} {"train_loss": -5.273873329162598, "global_step": 17537, "epoch": 417} {"train_loss": -5.125775337219238, "global_step": 17538, "epoch": 417} {"train_loss": -5.2570648193359375, "global_step": 17539, "epoch": 417} {"train_loss": -5.203942775726318, "global_step": 17540, "epoch": 417} {"train_loss": -5.207592010498047, "global_step": 17541, "epoch": 417} {"train_loss": -5.175440788269043, "global_step": 17542, "epoch": 417} {"train_loss": -5.210229396820068, "global_step": 17543, "epoch": 417} {"train_loss": -5.360241889953613, "global_step": 17544, "epoch": 417} {"train_loss": -5.313799858093262, "global_step": 17545, "epoch": 417} {"train_loss": -5.192290306091309, "global_step": 17546, "epoch": 417} {"train_loss": -5.218828201293945, "global_step": 17547, "epoch": 417} {"train_loss": -5.273134231567383, "global_step": 17548, "epoch": 417} {"train_loss": -5.1491193771362305, "global_step": 17549, "epoch": 417} {"train_loss": -5.2901458740234375, "global_step": 17550, "epoch": 417} {"train_loss": -5.25201416015625, "global_step": 17551, "epoch": 417} {"train_loss": -5.224859237670898, "global_step": 17552, "epoch": 417} {"train_loss": -5.2150702476501465, "global_step": 17553, "epoch": 417} {"train_loss": -5.210631847381592, "global_step": 17554, "epoch": 417} {"train_loss": -5.241492407662528, "global_step": 17555, "epoch": 417, "val_loss": 69738.3984375} {"train_loss": -5.278099060058594, "global_step": 17556, "epoch": 418} {"train_loss": -5.091169834136963, "global_step": 17557, "epoch": 418} {"train_loss": -5.203813552856445, "global_step": 17558, "epoch": 418} {"train_loss": -5.277698993682861, "global_step": 17559, "epoch": 418} {"train_loss": -5.134098052978516, "global_step": 17560, "epoch": 418} {"train_loss": -5.204853057861328, "global_step": 17561, "epoch": 418} {"train_loss": -5.328230857849121, "global_step": 17562, "epoch": 418} {"train_loss": -5.261280059814453, "global_step": 17563, "epoch": 418} {"train_loss": -5.278635025024414, "global_step": 17564, "epoch": 418} {"train_loss": -5.368755340576172, "global_step": 17565, "epoch": 418} {"train_loss": -5.288793563842773, "global_step": 17566, "epoch": 418} {"train_loss": -5.323816776275635, "global_step": 17567, "epoch": 418} {"train_loss": -5.356728553771973, "global_step": 17568, "epoch": 418} {"train_loss": -5.261528015136719, "global_step": 17569, "epoch": 418} {"train_loss": -5.149230003356934, "global_step": 17570, "epoch": 418} {"train_loss": -5.254674911499023, "global_step": 17571, "epoch": 418} {"train_loss": -5.228546142578125, "global_step": 17572, "epoch": 418} {"train_loss": -5.199015140533447, "global_step": 17573, "epoch": 418} {"train_loss": -5.271531105041504, "global_step": 17574, "epoch": 418} {"train_loss": -5.403780937194824, "global_step": 17575, "epoch": 418} {"train_loss": -5.265753746032715, "global_step": 17576, "epoch": 418} {"train_loss": -5.162688732147217, "global_step": 17577, "epoch": 418} {"train_loss": -5.243613243103027, "global_step": 17578, "epoch": 418} {"train_loss": -5.28515625, "global_step": 17579, "epoch": 418} {"train_loss": -5.2300825119018555, "global_step": 17580, "epoch": 418} {"train_loss": -5.214000701904297, "global_step": 17581, "epoch": 418} {"train_loss": -5.287753105163574, "global_step": 17582, "epoch": 418} {"train_loss": -5.291294097900391, "global_step": 17583, "epoch": 418} {"train_loss": -5.247291088104248, "global_step": 17584, "epoch": 418} {"train_loss": -5.218173027038574, "global_step": 17585, "epoch": 418} {"train_loss": -5.261262893676758, "global_step": 17586, "epoch": 418} {"train_loss": -5.246497631072998, "global_step": 17587, "epoch": 418} {"train_loss": -5.269187927246094, "global_step": 17588, "epoch": 418} {"train_loss": -4.99906063079834, "global_step": 17589, "epoch": 418} {"train_loss": -5.31876277923584, "global_step": 17590, "epoch": 418} {"train_loss": -5.3384857177734375, "global_step": 17591, "epoch": 418} {"train_loss": -5.26823091506958, "global_step": 17592, "epoch": 418} {"train_loss": -5.182762622833252, "global_step": 17593, "epoch": 418} {"train_loss": -5.300750732421875, "global_step": 17594, "epoch": 418} {"train_loss": -5.303506374359131, "global_step": 17595, "epoch": 418} {"train_loss": -5.180359363555908, "global_step": 17596, "epoch": 418} {"train_loss": -5.252252760387602, "global_step": 17597, "epoch": 418, "val_loss": 69849.1875} {"train_loss": -5.210892677307129, "global_step": 17598, "epoch": 419} {"train_loss": -5.284296989440918, "global_step": 17599, "epoch": 419} {"train_loss": -5.187852382659912, "global_step": 17600, "epoch": 419} {"train_loss": -5.214101314544678, "global_step": 17601, "epoch": 419} {"train_loss": -5.335831642150879, "global_step": 17602, "epoch": 419} {"train_loss": -5.174088478088379, "global_step": 17603, "epoch": 419} {"train_loss": -5.381357192993164, "global_step": 17604, "epoch": 419} {"train_loss": -5.270951271057129, "global_step": 17605, "epoch": 419} {"train_loss": -5.413759708404541, "global_step": 17606, "epoch": 419} {"train_loss": -5.301077842712402, "global_step": 17607, "epoch": 419} {"train_loss": -5.21903133392334, "global_step": 17608, "epoch": 419} {"train_loss": -5.25086784362793, "global_step": 17609, "epoch": 419} {"train_loss": -5.417856216430664, "global_step": 17610, "epoch": 419} {"train_loss": -5.291936874389648, "global_step": 17611, "epoch": 419} {"train_loss": -5.32029390335083, "global_step": 17612, "epoch": 419} {"train_loss": -5.257810592651367, "global_step": 17613, "epoch": 419} {"train_loss": -5.276339530944824, "global_step": 17614, "epoch": 419} {"train_loss": -5.290702819824219, "global_step": 17615, "epoch": 419} {"train_loss": -5.331278324127197, "global_step": 17616, "epoch": 419} {"train_loss": -5.180421829223633, "global_step": 17617, "epoch": 419} {"train_loss": -5.260937690734863, "global_step": 17618, "epoch": 419} {"train_loss": -5.18474817276001, "global_step": 17619, "epoch": 419} {"train_loss": -5.298337936401367, "global_step": 17620, "epoch": 419} {"train_loss": -5.253337860107422, "global_step": 17621, "epoch": 419} {"train_loss": -5.255692958831787, "global_step": 17622, "epoch": 419} {"train_loss": -5.303077697753906, "global_step": 17623, "epoch": 419} {"train_loss": -5.3745646476745605, "global_step": 17624, "epoch": 419} {"train_loss": -5.368966102600098, "global_step": 17625, "epoch": 419} {"train_loss": -5.381453037261963, "global_step": 17626, "epoch": 419} {"train_loss": -5.399849891662598, "global_step": 17627, "epoch": 419} {"train_loss": -5.220425605773926, "global_step": 17628, "epoch": 419} {"train_loss": -5.273031234741211, "global_step": 17629, "epoch": 419} {"train_loss": -5.319416046142578, "global_step": 17630, "epoch": 419} {"train_loss": -5.183464527130127, "global_step": 17631, "epoch": 419} {"train_loss": -5.290973663330078, "global_step": 17632, "epoch": 419} {"train_loss": -5.3155517578125, "global_step": 17633, "epoch": 419} {"train_loss": -5.252195358276367, "global_step": 17634, "epoch": 419} {"train_loss": -5.1590166091918945, "global_step": 17635, "epoch": 419} {"train_loss": -5.347715854644775, "global_step": 17636, "epoch": 419} {"train_loss": -5.308615207672119, "global_step": 17637, "epoch": 419} {"train_loss": -5.344119548797607, "global_step": 17638, "epoch": 419} {"train_loss": -5.284189110710507, "global_step": 17639, "epoch": 419, "val_loss": 69655.421875} {"train_loss": -5.249070167541504, "global_step": 17640, "epoch": 420} {"train_loss": -5.314694404602051, "global_step": 17641, "epoch": 420} {"train_loss": -5.264092922210693, "global_step": 17642, "epoch": 420} {"train_loss": -5.402593612670898, "global_step": 17643, "epoch": 420} {"train_loss": -5.368348598480225, "global_step": 17644, "epoch": 420} {"train_loss": -5.360222816467285, "global_step": 17645, "epoch": 420} {"train_loss": -5.304289817810059, "global_step": 17646, "epoch": 420} {"train_loss": -5.278944969177246, "global_step": 17647, "epoch": 420} {"train_loss": -5.222406387329102, "global_step": 17648, "epoch": 420} {"train_loss": -5.22414493560791, "global_step": 17649, "epoch": 420} {"train_loss": -5.364729881286621, "global_step": 17650, "epoch": 420} {"train_loss": -5.191810607910156, "global_step": 17651, "epoch": 420} {"train_loss": -5.337355613708496, "global_step": 17652, "epoch": 420} {"train_loss": -5.183121204376221, "global_step": 17653, "epoch": 420} {"train_loss": -5.241085052490234, "global_step": 17654, "epoch": 420} {"train_loss": -5.396039009094238, "global_step": 17655, "epoch": 420} {"train_loss": -5.221495628356934, "global_step": 17656, "epoch": 420} {"train_loss": -5.224979877471924, "global_step": 17657, "epoch": 420} {"train_loss": -5.239725112915039, "global_step": 17658, "epoch": 420} {"train_loss": -5.297876358032227, "global_step": 17659, "epoch": 420} {"train_loss": -5.234697341918945, "global_step": 17660, "epoch": 420} {"train_loss": -5.245068550109863, "global_step": 17661, "epoch": 420} {"train_loss": -5.264782428741455, "global_step": 17662, "epoch": 420} {"train_loss": -5.306171417236328, "global_step": 17663, "epoch": 420} {"train_loss": -5.222426891326904, "global_step": 17664, "epoch": 420} {"train_loss": -5.350799560546875, "global_step": 17665, "epoch": 420} {"train_loss": -5.272158622741699, "global_step": 17666, "epoch": 420} {"train_loss": -5.381528377532959, "global_step": 17667, "epoch": 420} {"train_loss": -5.396269798278809, "global_step": 17668, "epoch": 420} {"train_loss": -5.252142906188965, "global_step": 17669, "epoch": 420} {"train_loss": -5.220648765563965, "global_step": 17670, "epoch": 420} {"train_loss": -5.179424285888672, "global_step": 17671, "epoch": 420} {"train_loss": -5.318342685699463, "global_step": 17672, "epoch": 420} {"train_loss": -5.238585472106934, "global_step": 17673, "epoch": 420} {"train_loss": -5.304048538208008, "global_step": 17674, "epoch": 420} {"train_loss": -5.268213748931885, "global_step": 17675, "epoch": 420} {"train_loss": -5.391923904418945, "global_step": 17676, "epoch": 420} {"train_loss": -5.279519557952881, "global_step": 17677, "epoch": 420} {"train_loss": -5.228595733642578, "global_step": 17678, "epoch": 420} {"train_loss": -5.320061683654785, "global_step": 17679, "epoch": 420} {"train_loss": -5.388734817504883, "global_step": 17680, "epoch": 420} {"train_loss": -5.28756841023763, "global_step": 17681, "epoch": 420, "val_loss": 69685.359375} {"train_loss": -5.239754676818848, "global_step": 17682, "epoch": 421} {"train_loss": -5.286977767944336, "global_step": 17683, "epoch": 421} {"train_loss": -5.385483741760254, "global_step": 17684, "epoch": 421} {"train_loss": -5.196086883544922, "global_step": 17685, "epoch": 421} {"train_loss": -5.23458194732666, "global_step": 17686, "epoch": 421} {"train_loss": -5.158758163452148, "global_step": 17687, "epoch": 421} {"train_loss": -5.232629776000977, "global_step": 17688, "epoch": 421} {"train_loss": -5.357941627502441, "global_step": 17689, "epoch": 421} {"train_loss": -5.276065826416016, "global_step": 17690, "epoch": 421} {"train_loss": -5.307279586791992, "global_step": 17691, "epoch": 421} {"train_loss": -5.190166473388672, "global_step": 17692, "epoch": 421} {"train_loss": -5.128892421722412, "global_step": 17693, "epoch": 421} {"train_loss": -5.119497299194336, "global_step": 17694, "epoch": 421} {"train_loss": -5.232177734375, "global_step": 17695, "epoch": 421} {"train_loss": -5.181582450866699, "global_step": 17696, "epoch": 421} {"train_loss": -5.36552619934082, "global_step": 17697, "epoch": 421} {"train_loss": -5.280163764953613, "global_step": 17698, "epoch": 421} {"train_loss": -5.230944633483887, "global_step": 17699, "epoch": 421} {"train_loss": -5.329904079437256, "global_step": 17700, "epoch": 421} {"train_loss": -5.174238204956055, "global_step": 17701, "epoch": 421} {"train_loss": -5.2238240242004395, "global_step": 17702, "epoch": 421} {"train_loss": -5.253299236297607, "global_step": 17703, "epoch": 421} {"train_loss": -5.4100446701049805, "global_step": 17704, "epoch": 421} {"train_loss": -5.296274662017822, "global_step": 17705, "epoch": 421} {"train_loss": -5.180452346801758, "global_step": 17706, "epoch": 421} {"train_loss": -5.320030212402344, "global_step": 17707, "epoch": 421} {"train_loss": -5.168749809265137, "global_step": 17708, "epoch": 421} {"train_loss": -5.305157661437988, "global_step": 17709, "epoch": 421} {"train_loss": -5.154341697692871, "global_step": 17710, "epoch": 421} {"train_loss": -5.134437561035156, "global_step": 17711, "epoch": 421} {"train_loss": -5.291108131408691, "global_step": 17712, "epoch": 421} {"train_loss": -5.1919636726379395, "global_step": 17713, "epoch": 421} {"train_loss": -5.137964725494385, "global_step": 17714, "epoch": 421} {"train_loss": -5.316548824310303, "global_step": 17715, "epoch": 421} {"train_loss": -5.208771705627441, "global_step": 17716, "epoch": 421} {"train_loss": -5.132231712341309, "global_step": 17717, "epoch": 421} {"train_loss": -5.250702857971191, "global_step": 17718, "epoch": 421} {"train_loss": -5.202712059020996, "global_step": 17719, "epoch": 421} {"train_loss": -5.208247184753418, "global_step": 17720, "epoch": 421} {"train_loss": -5.3215837478637695, "global_step": 17721, "epoch": 421} {"train_loss": -4.996706485748291, "global_step": 17722, "epoch": 421} {"train_loss": -5.2363923617771695, "global_step": 17723, "epoch": 421, "val_loss": 69906.0859375} {"train_loss": -5.373659133911133, "global_step": 17724, "epoch": 422} {"train_loss": -5.049243450164795, "global_step": 17725, "epoch": 422} {"train_loss": -5.299846172332764, "global_step": 17726, "epoch": 422} {"train_loss": -5.341403007507324, "global_step": 17727, "epoch": 422} {"train_loss": -5.097576141357422, "global_step": 17728, "epoch": 422} {"train_loss": -5.254601955413818, "global_step": 17729, "epoch": 422} {"train_loss": -4.962519645690918, "global_step": 17730, "epoch": 422} {"train_loss": -4.968964099884033, "global_step": 17731, "epoch": 422} {"train_loss": -5.224318027496338, "global_step": 17732, "epoch": 422} {"train_loss": -5.067590713500977, "global_step": 17733, "epoch": 422} {"train_loss": -5.130004405975342, "global_step": 17734, "epoch": 422} {"train_loss": -5.129943370819092, "global_step": 17735, "epoch": 422} {"train_loss": -5.236797332763672, "global_step": 17736, "epoch": 422} {"train_loss": -5.027052879333496, "global_step": 17737, "epoch": 422} {"train_loss": -5.00029182434082, "global_step": 17738, "epoch": 422} {"train_loss": -5.227325439453125, "global_step": 17739, "epoch": 422} {"train_loss": -5.158054828643799, "global_step": 17740, "epoch": 422} {"train_loss": -5.336543560028076, "global_step": 17741, "epoch": 422} {"train_loss": -5.310842514038086, "global_step": 17742, "epoch": 422} {"train_loss": -5.37960147857666, "global_step": 17743, "epoch": 422} {"train_loss": -5.253557205200195, "global_step": 17744, "epoch": 422} {"train_loss": -5.316573143005371, "global_step": 17745, "epoch": 422} {"train_loss": -5.221557140350342, "global_step": 17746, "epoch": 422} {"train_loss": -5.250170707702637, "global_step": 17747, "epoch": 422} {"train_loss": -5.298556327819824, "global_step": 17748, "epoch": 422} {"train_loss": -5.245815277099609, "global_step": 17749, "epoch": 422} {"train_loss": -5.25373649597168, "global_step": 17750, "epoch": 422} {"train_loss": -5.411411285400391, "global_step": 17751, "epoch": 422} {"train_loss": -5.229825496673584, "global_step": 17752, "epoch": 422} {"train_loss": -5.324635028839111, "global_step": 17753, "epoch": 422} {"train_loss": -5.226531982421875, "global_step": 17754, "epoch": 422} {"train_loss": -5.092986106872559, "global_step": 17755, "epoch": 422} {"train_loss": -5.222635269165039, "global_step": 17756, "epoch": 422} {"train_loss": -5.359172821044922, "global_step": 17757, "epoch": 422} {"train_loss": -5.221103668212891, "global_step": 17758, "epoch": 422} {"train_loss": -5.383232116699219, "global_step": 17759, "epoch": 422} {"train_loss": -5.241816520690918, "global_step": 17760, "epoch": 422} {"train_loss": -5.257652759552002, "global_step": 17761, "epoch": 422} {"train_loss": -5.337145805358887, "global_step": 17762, "epoch": 422} {"train_loss": -5.262738227844238, "global_step": 17763, "epoch": 422} {"train_loss": -5.242949485778809, "global_step": 17764, "epoch": 422} {"train_loss": -5.223068316777547, "global_step": 17765, "epoch": 422, "val_loss": 70748.7890625} {"train_loss": -5.176932334899902, "global_step": 17766, "epoch": 423} {"train_loss": -5.0735554695129395, "global_step": 17767, "epoch": 423} {"train_loss": -5.071305751800537, "global_step": 17768, "epoch": 423} {"train_loss": -5.180693626403809, "global_step": 17769, "epoch": 423} {"train_loss": -5.080663681030273, "global_step": 17770, "epoch": 423} {"train_loss": -5.29423713684082, "global_step": 17771, "epoch": 423} {"train_loss": -4.98901891708374, "global_step": 17772, "epoch": 423} {"train_loss": -5.286626815795898, "global_step": 17773, "epoch": 423} {"train_loss": -5.156789779663086, "global_step": 17774, "epoch": 423} {"train_loss": -5.235836029052734, "global_step": 17775, "epoch": 423} {"train_loss": -5.2943010330200195, "global_step": 17776, "epoch": 423} {"train_loss": -5.291530132293701, "global_step": 17777, "epoch": 423} {"train_loss": -5.209346771240234, "global_step": 17778, "epoch": 423} {"train_loss": -5.179727554321289, "global_step": 17779, "epoch": 423} {"train_loss": -5.149231433868408, "global_step": 17780, "epoch": 423} {"train_loss": -5.423571586608887, "global_step": 17781, "epoch": 423} {"train_loss": -5.249933242797852, "global_step": 17782, "epoch": 423} {"train_loss": -5.153033256530762, "global_step": 17783, "epoch": 423} {"train_loss": -5.317904472351074, "global_step": 17784, "epoch": 423} {"train_loss": -5.165802001953125, "global_step": 17785, "epoch": 423} {"train_loss": -5.253319263458252, "global_step": 17786, "epoch": 423} {"train_loss": -5.1335530281066895, "global_step": 17787, "epoch": 423} {"train_loss": -5.282570838928223, "global_step": 17788, "epoch": 423} {"train_loss": -5.105008125305176, "global_step": 17789, "epoch": 423} {"train_loss": -5.173757553100586, "global_step": 17790, "epoch": 423} {"train_loss": -5.274683952331543, "global_step": 17791, "epoch": 423} {"train_loss": -5.120969772338867, "global_step": 17792, "epoch": 423} {"train_loss": -5.397542476654053, "global_step": 17793, "epoch": 423} {"train_loss": -5.291516304016113, "global_step": 17794, "epoch": 423} {"train_loss": -5.118568420410156, "global_step": 17795, "epoch": 423} {"train_loss": -5.318231105804443, "global_step": 17796, "epoch": 423} {"train_loss": -5.287604808807373, "global_step": 17797, "epoch": 423} {"train_loss": -5.229966163635254, "global_step": 17798, "epoch": 423} {"train_loss": -5.152314186096191, "global_step": 17799, "epoch": 423} {"train_loss": -5.296221733093262, "global_step": 17800, "epoch": 423} {"train_loss": -5.236484527587891, "global_step": 17801, "epoch": 423} {"train_loss": -5.318658828735352, "global_step": 17802, "epoch": 423} {"train_loss": -5.278275012969971, "global_step": 17803, "epoch": 423} {"train_loss": -5.471623420715332, "global_step": 17804, "epoch": 423} {"train_loss": -5.093100547790527, "global_step": 17805, "epoch": 423} {"train_loss": -5.287935256958008, "global_step": 17806, "epoch": 423} {"train_loss": -5.224969398407709, "global_step": 17807, "epoch": 423, "val_loss": 69559.96875} {"train_loss": -5.361871719360352, "global_step": 17808, "epoch": 424} {"train_loss": -5.251860618591309, "global_step": 17809, "epoch": 424} {"train_loss": -5.280473709106445, "global_step": 17810, "epoch": 424} {"train_loss": -5.182626724243164, "global_step": 17811, "epoch": 424} {"train_loss": -5.305941581726074, "global_step": 17812, "epoch": 424} {"train_loss": -5.168065547943115, "global_step": 17813, "epoch": 424} {"train_loss": -5.338078498840332, "global_step": 17814, "epoch": 424} {"train_loss": -5.180855751037598, "global_step": 17815, "epoch": 424} {"train_loss": -5.130821704864502, "global_step": 17816, "epoch": 424} {"train_loss": -5.257200241088867, "global_step": 17817, "epoch": 424} {"train_loss": -5.236074447631836, "global_step": 17818, "epoch": 424} {"train_loss": -5.243542671203613, "global_step": 17819, "epoch": 424} {"train_loss": -5.1451215744018555, "global_step": 17820, "epoch": 424} {"train_loss": -5.308492660522461, "global_step": 17821, "epoch": 424} {"train_loss": -5.2397003173828125, "global_step": 17822, "epoch": 424} {"train_loss": -5.391045570373535, "global_step": 17823, "epoch": 424} {"train_loss": -5.293428421020508, "global_step": 17824, "epoch": 424} {"train_loss": -5.246021747589111, "global_step": 17825, "epoch": 424} {"train_loss": -5.315479755401611, "global_step": 17826, "epoch": 424} {"train_loss": -5.072790145874023, "global_step": 17827, "epoch": 424} {"train_loss": -5.267316818237305, "global_step": 17828, "epoch": 424} {"train_loss": -5.375875949859619, "global_step": 17829, "epoch": 424} {"train_loss": -5.35410213470459, "global_step": 17830, "epoch": 424} {"train_loss": -5.330682754516602, "global_step": 17831, "epoch": 424} {"train_loss": -5.241116523742676, "global_step": 17832, "epoch": 424} {"train_loss": -5.274809837341309, "global_step": 17833, "epoch": 424} {"train_loss": -5.2692718505859375, "global_step": 17834, "epoch": 424} {"train_loss": -5.171306610107422, "global_step": 17835, "epoch": 424} {"train_loss": -5.164614200592041, "global_step": 17836, "epoch": 424} {"train_loss": -5.2276716232299805, "global_step": 17837, "epoch": 424} {"train_loss": -5.126428604125977, "global_step": 17838, "epoch": 424} {"train_loss": -5.383386611938477, "global_step": 17839, "epoch": 424} {"train_loss": -5.358818531036377, "global_step": 17840, "epoch": 424} {"train_loss": -5.345135688781738, "global_step": 17841, "epoch": 424} {"train_loss": -5.19316291809082, "global_step": 17842, "epoch": 424} {"train_loss": -5.370826721191406, "global_step": 17843, "epoch": 424} {"train_loss": -5.129315376281738, "global_step": 17844, "epoch": 424} {"train_loss": -5.291308403015137, "global_step": 17845, "epoch": 424} {"train_loss": -5.206836700439453, "global_step": 17846, "epoch": 424} {"train_loss": -5.193783760070801, "global_step": 17847, "epoch": 424} {"train_loss": -5.335616111755371, "global_step": 17848, "epoch": 424} {"train_loss": -5.255220027196975, "global_step": 17849, "epoch": 424, "val_loss": 69929.7890625} {"train_loss": -5.20173454284668, "global_step": 17850, "epoch": 425} {"train_loss": -5.107552528381348, "global_step": 17851, "epoch": 425} {"train_loss": -5.182124137878418, "global_step": 17852, "epoch": 425} {"train_loss": -5.258184432983398, "global_step": 17853, "epoch": 425} {"train_loss": -5.2689948081970215, "global_step": 17854, "epoch": 425} {"train_loss": -5.369797706604004, "global_step": 17855, "epoch": 425} {"train_loss": -5.246536731719971, "global_step": 17856, "epoch": 425} {"train_loss": -5.3010663986206055, "global_step": 17857, "epoch": 425} {"train_loss": -5.359262466430664, "global_step": 17858, "epoch": 425} {"train_loss": -5.257656097412109, "global_step": 17859, "epoch": 425} {"train_loss": -5.441190719604492, "global_step": 17860, "epoch": 425} {"train_loss": -5.360991954803467, "global_step": 17861, "epoch": 425} {"train_loss": -5.236168384552002, "global_step": 17862, "epoch": 425} {"train_loss": -5.293094635009766, "global_step": 17863, "epoch": 425} {"train_loss": -5.316408157348633, "global_step": 17864, "epoch": 425} {"train_loss": -5.350616455078125, "global_step": 17865, "epoch": 425} {"train_loss": -5.320648670196533, "global_step": 17866, "epoch": 425} {"train_loss": -5.309666156768799, "global_step": 17867, "epoch": 425} {"train_loss": -5.435779571533203, "global_step": 17868, "epoch": 425} {"train_loss": -5.312004089355469, "global_step": 17869, "epoch": 425} {"train_loss": -5.110846042633057, "global_step": 17870, "epoch": 425} {"train_loss": -5.338539123535156, "global_step": 17871, "epoch": 425} {"train_loss": -5.34688663482666, "global_step": 17872, "epoch": 425} {"train_loss": -5.075067520141602, "global_step": 17873, "epoch": 425} {"train_loss": -5.267134189605713, "global_step": 17874, "epoch": 425} {"train_loss": -5.33392333984375, "global_step": 17875, "epoch": 425} {"train_loss": -5.263882637023926, "global_step": 17876, "epoch": 425} {"train_loss": -5.141108512878418, "global_step": 17877, "epoch": 425} {"train_loss": -5.30618953704834, "global_step": 17878, "epoch": 425} {"train_loss": -5.214594841003418, "global_step": 17879, "epoch": 425} {"train_loss": -5.13247013092041, "global_step": 17880, "epoch": 425} {"train_loss": -5.295709133148193, "global_step": 17881, "epoch": 425} {"train_loss": -5.29884147644043, "global_step": 17882, "epoch": 425} {"train_loss": -5.260848522186279, "global_step": 17883, "epoch": 425} {"train_loss": -5.317803859710693, "global_step": 17884, "epoch": 425} {"train_loss": -5.042978763580322, "global_step": 17885, "epoch": 425} {"train_loss": -5.176945209503174, "global_step": 17886, "epoch": 425} {"train_loss": -5.273942947387695, "global_step": 17887, "epoch": 425} {"train_loss": -5.2894487380981445, "global_step": 17888, "epoch": 425} {"train_loss": -5.091456413269043, "global_step": 17889, "epoch": 425} {"train_loss": -5.208769798278809, "global_step": 17890, "epoch": 425} {"train_loss": -5.261167696544102, "global_step": 17891, "epoch": 425, "val_loss": 69806.25} {"train_loss": -5.365933418273926, "global_step": 17892, "epoch": 426} {"train_loss": -5.174615859985352, "global_step": 17893, "epoch": 426} {"train_loss": -5.126105308532715, "global_step": 17894, "epoch": 426} {"train_loss": -5.20393180847168, "global_step": 17895, "epoch": 426} {"train_loss": -5.279097557067871, "global_step": 17896, "epoch": 426} {"train_loss": -5.159383773803711, "global_step": 17897, "epoch": 426} {"train_loss": -5.3998236656188965, "global_step": 17898, "epoch": 426} {"train_loss": -5.32199764251709, "global_step": 17899, "epoch": 426} {"train_loss": -5.400763511657715, "global_step": 17900, "epoch": 426} {"train_loss": -5.396949768066406, "global_step": 17901, "epoch": 426} {"train_loss": -5.138256549835205, "global_step": 17902, "epoch": 426} {"train_loss": -5.2548370361328125, "global_step": 17903, "epoch": 426} {"train_loss": -5.340469837188721, "global_step": 17904, "epoch": 426} {"train_loss": -5.06062650680542, "global_step": 17905, "epoch": 426} {"train_loss": -5.174039840698242, "global_step": 17906, "epoch": 426} {"train_loss": -5.359776973724365, "global_step": 17907, "epoch": 426} {"train_loss": -5.460798263549805, "global_step": 17908, "epoch": 426} {"train_loss": -5.186318397521973, "global_step": 17909, "epoch": 426} {"train_loss": -5.2877068519592285, "global_step": 17910, "epoch": 426} {"train_loss": -5.214310646057129, "global_step": 17911, "epoch": 426} {"train_loss": -5.153905868530273, "global_step": 17912, "epoch": 426} {"train_loss": -5.337502479553223, "global_step": 17913, "epoch": 426} {"train_loss": -5.269957542419434, "global_step": 17914, "epoch": 426} {"train_loss": -5.185280799865723, "global_step": 17915, "epoch": 426} {"train_loss": -5.165642738342285, "global_step": 17916, "epoch": 426} {"train_loss": -5.12930965423584, "global_step": 17917, "epoch": 426} {"train_loss": -5.190939903259277, "global_step": 17918, "epoch": 426} {"train_loss": -5.279296398162842, "global_step": 17919, "epoch": 426} {"train_loss": -5.261392116546631, "global_step": 17920, "epoch": 426} {"train_loss": -5.175945281982422, "global_step": 17921, "epoch": 426} {"train_loss": -5.251743793487549, "global_step": 17922, "epoch": 426} {"train_loss": -5.349797248840332, "global_step": 17923, "epoch": 426} {"train_loss": -5.17580509185791, "global_step": 17924, "epoch": 426} {"train_loss": -5.290104866027832, "global_step": 17925, "epoch": 426} {"train_loss": -5.234841346740723, "global_step": 17926, "epoch": 426} {"train_loss": -5.307274341583252, "global_step": 17927, "epoch": 426} {"train_loss": -5.219746112823486, "global_step": 17928, "epoch": 426} {"train_loss": -5.3682451248168945, "global_step": 17929, "epoch": 426} {"train_loss": -5.284563064575195, "global_step": 17930, "epoch": 426} {"train_loss": -5.263772010803223, "global_step": 17931, "epoch": 426} {"train_loss": -5.271813869476318, "global_step": 17932, "epoch": 426} {"train_loss": -5.2569810549418134, "global_step": 17933, "epoch": 426, "val_loss": 70214.4921875} {"train_loss": -5.175244331359863, "global_step": 17934, "epoch": 427} {"train_loss": -5.285662651062012, "global_step": 17935, "epoch": 427} {"train_loss": -5.351356506347656, "global_step": 17936, "epoch": 427} {"train_loss": -5.292036533355713, "global_step": 17937, "epoch": 427} {"train_loss": -5.2143168449401855, "global_step": 17938, "epoch": 427} {"train_loss": -5.312809467315674, "global_step": 17939, "epoch": 427} {"train_loss": -5.279728412628174, "global_step": 17940, "epoch": 427} {"train_loss": -5.2028679847717285, "global_step": 17941, "epoch": 427} {"train_loss": -5.4062089920043945, "global_step": 17942, "epoch": 427} {"train_loss": -5.244546890258789, "global_step": 17943, "epoch": 427} {"train_loss": -5.239602088928223, "global_step": 17944, "epoch": 427} {"train_loss": -5.426793098449707, "global_step": 17945, "epoch": 427} {"train_loss": -5.230787754058838, "global_step": 17946, "epoch": 427} {"train_loss": -5.316771030426025, "global_step": 17947, "epoch": 427} {"train_loss": -5.336117744445801, "global_step": 17948, "epoch": 427} {"train_loss": -5.299821853637695, "global_step": 17949, "epoch": 427} {"train_loss": -5.208795547485352, "global_step": 17950, "epoch": 427} {"train_loss": -5.221977710723877, "global_step": 17951, "epoch": 427} {"train_loss": -5.188790321350098, "global_step": 17952, "epoch": 427} {"train_loss": -5.239092826843262, "global_step": 17953, "epoch": 427} {"train_loss": -5.347870826721191, "global_step": 17954, "epoch": 427} {"train_loss": -5.418157577514648, "global_step": 17955, "epoch": 427} {"train_loss": -5.24981689453125, "global_step": 17956, "epoch": 427} {"train_loss": -5.15453577041626, "global_step": 17957, "epoch": 427} {"train_loss": -5.291616916656494, "global_step": 17958, "epoch": 427} {"train_loss": -5.372086524963379, "global_step": 17959, "epoch": 427} {"train_loss": -5.271912574768066, "global_step": 17960, "epoch": 427} {"train_loss": -5.290558815002441, "global_step": 17961, "epoch": 427} {"train_loss": -5.325189113616943, "global_step": 17962, "epoch": 427} {"train_loss": -5.415719032287598, "global_step": 17963, "epoch": 427} {"train_loss": -5.202057361602783, "global_step": 17964, "epoch": 427} {"train_loss": -5.261068344116211, "global_step": 17965, "epoch": 427} {"train_loss": -5.390501499176025, "global_step": 17966, "epoch": 427} {"train_loss": -5.447998046875, "global_step": 17967, "epoch": 427} {"train_loss": -5.182891845703125, "global_step": 17968, "epoch": 427} {"train_loss": -5.211903095245361, "global_step": 17969, "epoch": 427} {"train_loss": -5.328857421875, "global_step": 17970, "epoch": 427} {"train_loss": -5.2519965171813965, "global_step": 17971, "epoch": 427} {"train_loss": -5.235980987548828, "global_step": 17972, "epoch": 427} {"train_loss": -5.3026275634765625, "global_step": 17973, "epoch": 427} {"train_loss": -5.291751861572266, "global_step": 17974, "epoch": 427} {"train_loss": -5.287544012069702, "global_step": 17975, "epoch": 427, "val_loss": 69850.3359375} {"train_loss": -5.2440104484558105, "global_step": 17976, "epoch": 428} {"train_loss": -5.4150543212890625, "global_step": 17977, "epoch": 428} {"train_loss": -5.273037910461426, "global_step": 17978, "epoch": 428} {"train_loss": -5.325493335723877, "global_step": 17979, "epoch": 428} {"train_loss": -5.208400726318359, "global_step": 17980, "epoch": 428} {"train_loss": -5.273824691772461, "global_step": 17981, "epoch": 428} {"train_loss": -5.324322700500488, "global_step": 17982, "epoch": 428} {"train_loss": -5.301868915557861, "global_step": 17983, "epoch": 428} {"train_loss": -5.319984436035156, "global_step": 17984, "epoch": 428} {"train_loss": -5.25201416015625, "global_step": 17985, "epoch": 428} {"train_loss": -5.27690315246582, "global_step": 17986, "epoch": 428} {"train_loss": -5.289809226989746, "global_step": 17987, "epoch": 428} {"train_loss": -5.247259140014648, "global_step": 17988, "epoch": 428} {"train_loss": -5.209727764129639, "global_step": 17989, "epoch": 428} {"train_loss": -5.385992050170898, "global_step": 17990, "epoch": 428} {"train_loss": -5.181320667266846, "global_step": 17991, "epoch": 428} {"train_loss": -5.437183380126953, "global_step": 17992, "epoch": 428} {"train_loss": -5.335240364074707, "global_step": 17993, "epoch": 428} {"train_loss": -5.2309699058532715, "global_step": 17994, "epoch": 428} {"train_loss": -5.160342693328857, "global_step": 17995, "epoch": 428} {"train_loss": -5.402870178222656, "global_step": 17996, "epoch": 428} {"train_loss": -5.402440071105957, "global_step": 17997, "epoch": 428} {"train_loss": -5.208300590515137, "global_step": 17998, "epoch": 428} {"train_loss": -5.232237815856934, "global_step": 17999, "epoch": 428} {"train_loss": -5.224437236785889, "global_step": 18000, "epoch": 428} {"train_loss": -5.278155326843262, "global_step": 18001, "epoch": 428} {"train_loss": -5.316188812255859, "global_step": 18002, "epoch": 428} {"train_loss": -5.343071937561035, "global_step": 18003, "epoch": 428} {"train_loss": -5.200902938842773, "global_step": 18004, "epoch": 428} {"train_loss": -5.16005802154541, "global_step": 18005, "epoch": 428} {"train_loss": -5.27649450302124, "global_step": 18006, "epoch": 428} {"train_loss": -5.286215782165527, "global_step": 18007, "epoch": 428} {"train_loss": -5.328202247619629, "global_step": 18008, "epoch": 428} {"train_loss": -5.197622776031494, "global_step": 18009, "epoch": 428} {"train_loss": -5.3969340324401855, "global_step": 18010, "epoch": 428} {"train_loss": -5.1321611404418945, "global_step": 18011, "epoch": 428} {"train_loss": -5.304834365844727, "global_step": 18012, "epoch": 428} {"train_loss": -5.295068740844727, "global_step": 18013, "epoch": 428} {"train_loss": -5.271681785583496, "global_step": 18014, "epoch": 428} {"train_loss": -5.281963348388672, "global_step": 18015, "epoch": 428} {"train_loss": -5.244198322296143, "global_step": 18016, "epoch": 428} {"train_loss": -5.279112168720791, "global_step": 18017, "epoch": 428, "val_loss": 69686.3046875} {"train_loss": -5.182343482971191, "global_step": 18018, "epoch": 429} {"train_loss": -5.325905799865723, "global_step": 18019, "epoch": 429} {"train_loss": -5.3710222244262695, "global_step": 18020, "epoch": 429} {"train_loss": -5.359098434448242, "global_step": 18021, "epoch": 429} {"train_loss": -5.249934196472168, "global_step": 18022, "epoch": 429} {"train_loss": -5.196178436279297, "global_step": 18023, "epoch": 429} {"train_loss": -5.360834121704102, "global_step": 18024, "epoch": 429} {"train_loss": -5.110648155212402, "global_step": 18025, "epoch": 429} {"train_loss": -5.239732265472412, "global_step": 18026, "epoch": 429} {"train_loss": -5.361250877380371, "global_step": 18027, "epoch": 429} {"train_loss": -5.373952865600586, "global_step": 18028, "epoch": 429} {"train_loss": -5.411022186279297, "global_step": 18029, "epoch": 429} {"train_loss": -5.300844669342041, "global_step": 18030, "epoch": 429} {"train_loss": -5.172832489013672, "global_step": 18031, "epoch": 429} {"train_loss": -5.2969512939453125, "global_step": 18032, "epoch": 429} {"train_loss": -5.297306060791016, "global_step": 18033, "epoch": 429} {"train_loss": -5.210099220275879, "global_step": 18034, "epoch": 429} {"train_loss": -5.285802841186523, "global_step": 18035, "epoch": 429} {"train_loss": -5.285186290740967, "global_step": 18036, "epoch": 429} {"train_loss": -5.17188835144043, "global_step": 18037, "epoch": 429} {"train_loss": -5.219179153442383, "global_step": 18038, "epoch": 429} {"train_loss": -5.289549350738525, "global_step": 18039, "epoch": 429} {"train_loss": -5.170925140380859, "global_step": 18040, "epoch": 429} {"train_loss": -5.403409481048584, "global_step": 18041, "epoch": 429} {"train_loss": -5.351992130279541, "global_step": 18042, "epoch": 429} {"train_loss": -5.213176727294922, "global_step": 18043, "epoch": 429} {"train_loss": -5.369457721710205, "global_step": 18044, "epoch": 429} {"train_loss": -5.304538249969482, "global_step": 18045, "epoch": 429} {"train_loss": -5.3483381271362305, "global_step": 18046, "epoch": 429} {"train_loss": -5.259904861450195, "global_step": 18047, "epoch": 429} {"train_loss": -5.101753234863281, "global_step": 18048, "epoch": 429} {"train_loss": -5.416156768798828, "global_step": 18049, "epoch": 429} {"train_loss": -5.228423118591309, "global_step": 18050, "epoch": 429} {"train_loss": -5.225264549255371, "global_step": 18051, "epoch": 429} {"train_loss": -5.153983116149902, "global_step": 18052, "epoch": 429} {"train_loss": -5.211147308349609, "global_step": 18053, "epoch": 429} {"train_loss": -5.2409820556640625, "global_step": 18054, "epoch": 429} {"train_loss": -5.06158447265625, "global_step": 18055, "epoch": 429} {"train_loss": -5.309788703918457, "global_step": 18056, "epoch": 429} {"train_loss": -5.134396076202393, "global_step": 18057, "epoch": 429} {"train_loss": -5.308126926422119, "global_step": 18058, "epoch": 429} {"train_loss": -5.26626409803118, "global_step": 18059, "epoch": 429, "val_loss": 70602.1640625} {"train_loss": -5.208127498626709, "global_step": 18060, "epoch": 430} {"train_loss": -5.350419998168945, "global_step": 18061, "epoch": 430} {"train_loss": -5.156729698181152, "global_step": 18062, "epoch": 430} {"train_loss": -5.317018985748291, "global_step": 18063, "epoch": 430} {"train_loss": -5.374493598937988, "global_step": 18064, "epoch": 430} {"train_loss": -5.1468505859375, "global_step": 18065, "epoch": 430} {"train_loss": -5.255838394165039, "global_step": 18066, "epoch": 430} {"train_loss": -5.386101722717285, "global_step": 18067, "epoch": 430} {"train_loss": -5.506076812744141, "global_step": 18068, "epoch": 430} {"train_loss": -5.384040355682373, "global_step": 18069, "epoch": 430} {"train_loss": -5.254687309265137, "global_step": 18070, "epoch": 430} {"train_loss": -5.30788516998291, "global_step": 18071, "epoch": 430} {"train_loss": -5.242548942565918, "global_step": 18072, "epoch": 430} {"train_loss": -5.271086692810059, "global_step": 18073, "epoch": 430} {"train_loss": -5.445763111114502, "global_step": 18074, "epoch": 430} {"train_loss": -5.303399085998535, "global_step": 18075, "epoch": 430} {"train_loss": -5.350737571716309, "global_step": 18076, "epoch": 430} {"train_loss": -5.347818851470947, "global_step": 18077, "epoch": 430} {"train_loss": -5.329392433166504, "global_step": 18078, "epoch": 430} {"train_loss": -5.328132152557373, "global_step": 18079, "epoch": 430} {"train_loss": -5.353006839752197, "global_step": 18080, "epoch": 430} {"train_loss": -5.247010707855225, "global_step": 18081, "epoch": 430} {"train_loss": -5.256339073181152, "global_step": 18082, "epoch": 430} {"train_loss": -5.249177932739258, "global_step": 18083, "epoch": 430} {"train_loss": -5.390827178955078, "global_step": 18084, "epoch": 430} {"train_loss": -5.279390335083008, "global_step": 18085, "epoch": 430} {"train_loss": -5.395554542541504, "global_step": 18086, "epoch": 430} {"train_loss": -5.227484703063965, "global_step": 18087, "epoch": 430} {"train_loss": -5.218974590301514, "global_step": 18088, "epoch": 430} {"train_loss": -5.322213649749756, "global_step": 18089, "epoch": 430} {"train_loss": -5.1844096183776855, "global_step": 18090, "epoch": 430} {"train_loss": -5.285520553588867, "global_step": 18091, "epoch": 430} {"train_loss": -5.212881088256836, "global_step": 18092, "epoch": 430} {"train_loss": -5.385937213897705, "global_step": 18093, "epoch": 430} {"train_loss": -5.165389537811279, "global_step": 18094, "epoch": 430} {"train_loss": -5.368255615234375, "global_step": 18095, "epoch": 430} {"train_loss": -5.237090587615967, "global_step": 18096, "epoch": 430} {"train_loss": -5.2357025146484375, "global_step": 18097, "epoch": 430} {"train_loss": -5.275946140289307, "global_step": 18098, "epoch": 430} {"train_loss": -5.22031831741333, "global_step": 18099, "epoch": 430} {"train_loss": -5.2357940673828125, "global_step": 18100, "epoch": 430} {"train_loss": -5.288024925050282, "global_step": 18101, "epoch": 430, "val_loss": 69341.6875} {"train_loss": -5.337071418762207, "global_step": 18102, "epoch": 431} {"train_loss": -5.236229419708252, "global_step": 18103, "epoch": 431} {"train_loss": -5.3144612312316895, "global_step": 18104, "epoch": 431} {"train_loss": -5.266603469848633, "global_step": 18105, "epoch": 431} {"train_loss": -5.225252151489258, "global_step": 18106, "epoch": 431} {"train_loss": -5.32529354095459, "global_step": 18107, "epoch": 431} {"train_loss": -5.313385963439941, "global_step": 18108, "epoch": 431} {"train_loss": -5.257989406585693, "global_step": 18109, "epoch": 431} {"train_loss": -5.352406024932861, "global_step": 18110, "epoch": 431} {"train_loss": -5.3332319259643555, "global_step": 18111, "epoch": 431} {"train_loss": -5.237283706665039, "global_step": 18112, "epoch": 431} {"train_loss": -5.339986324310303, "global_step": 18113, "epoch": 431} {"train_loss": -5.2702202796936035, "global_step": 18114, "epoch": 431} {"train_loss": -5.278708457946777, "global_step": 18115, "epoch": 431} {"train_loss": -5.202815055847168, "global_step": 18116, "epoch": 431} {"train_loss": -5.234276294708252, "global_step": 18117, "epoch": 431} {"train_loss": -5.161482334136963, "global_step": 18118, "epoch": 431} {"train_loss": -5.323159694671631, "global_step": 18119, "epoch": 431} {"train_loss": -5.332607269287109, "global_step": 18120, "epoch": 431} {"train_loss": -5.374702453613281, "global_step": 18121, "epoch": 431} {"train_loss": -5.294643402099609, "global_step": 18122, "epoch": 431} {"train_loss": -5.270896911621094, "global_step": 18123, "epoch": 431} {"train_loss": -5.289680480957031, "global_step": 18124, "epoch": 431} {"train_loss": -5.224168300628662, "global_step": 18125, "epoch": 431} {"train_loss": -5.379400730133057, "global_step": 18126, "epoch": 431} {"train_loss": -5.285828590393066, "global_step": 18127, "epoch": 431} {"train_loss": -5.4356842041015625, "global_step": 18128, "epoch": 431} {"train_loss": -5.217302322387695, "global_step": 18129, "epoch": 431} {"train_loss": -5.259335994720459, "global_step": 18130, "epoch": 431} {"train_loss": -5.2718186378479, "global_step": 18131, "epoch": 431} {"train_loss": -5.400081634521484, "global_step": 18132, "epoch": 431} {"train_loss": -5.300039291381836, "global_step": 18133, "epoch": 431} {"train_loss": -5.241966247558594, "global_step": 18134, "epoch": 431} {"train_loss": -5.309527397155762, "global_step": 18135, "epoch": 431} {"train_loss": -5.221996784210205, "global_step": 18136, "epoch": 431} {"train_loss": -5.485127925872803, "global_step": 18137, "epoch": 431} {"train_loss": -5.288888931274414, "global_step": 18138, "epoch": 431} {"train_loss": -5.388068199157715, "global_step": 18139, "epoch": 431} {"train_loss": -5.392719268798828, "global_step": 18140, "epoch": 431} {"train_loss": -5.294469833374023, "global_step": 18141, "epoch": 431} {"train_loss": -5.229025840759277, "global_step": 18142, "epoch": 431} {"train_loss": -5.295659894034976, "global_step": 18143, "epoch": 431, "val_loss": 69497.8984375} {"train_loss": -5.334892272949219, "global_step": 18144, "epoch": 432} {"train_loss": -5.3902082443237305, "global_step": 18145, "epoch": 432} {"train_loss": -5.287713527679443, "global_step": 18146, "epoch": 432} {"train_loss": -5.286932945251465, "global_step": 18147, "epoch": 432} {"train_loss": -5.239753723144531, "global_step": 18148, "epoch": 432} {"train_loss": -5.252643585205078, "global_step": 18149, "epoch": 432} {"train_loss": -5.222097396850586, "global_step": 18150, "epoch": 432} {"train_loss": -5.264802932739258, "global_step": 18151, "epoch": 432} {"train_loss": -5.2993574142456055, "global_step": 18152, "epoch": 432} {"train_loss": -5.312183380126953, "global_step": 18153, "epoch": 432} {"train_loss": -5.324057579040527, "global_step": 18154, "epoch": 432} {"train_loss": -5.30702018737793, "global_step": 18155, "epoch": 432} {"train_loss": -5.37519645690918, "global_step": 18156, "epoch": 432} {"train_loss": -5.336220741271973, "global_step": 18157, "epoch": 432} {"train_loss": -5.226709365844727, "global_step": 18158, "epoch": 432} {"train_loss": -5.367421627044678, "global_step": 18159, "epoch": 432} {"train_loss": -5.303504943847656, "global_step": 18160, "epoch": 432} {"train_loss": -5.250129699707031, "global_step": 18161, "epoch": 432} {"train_loss": -5.24791145324707, "global_step": 18162, "epoch": 432} {"train_loss": -5.152124404907227, "global_step": 18163, "epoch": 432} {"train_loss": -5.349244594573975, "global_step": 18164, "epoch": 432} {"train_loss": -5.2275848388671875, "global_step": 18165, "epoch": 432} {"train_loss": -5.24708366394043, "global_step": 18166, "epoch": 432} {"train_loss": -5.270440101623535, "global_step": 18167, "epoch": 432} {"train_loss": -5.212071418762207, "global_step": 18168, "epoch": 432} {"train_loss": -5.256424903869629, "global_step": 18169, "epoch": 432} {"train_loss": -5.271520137786865, "global_step": 18170, "epoch": 432} {"train_loss": -5.07031774520874, "global_step": 18171, "epoch": 432} {"train_loss": -5.221685409545898, "global_step": 18172, "epoch": 432} {"train_loss": -5.317796230316162, "global_step": 18173, "epoch": 432} {"train_loss": -5.286663055419922, "global_step": 18174, "epoch": 432} {"train_loss": -5.243070602416992, "global_step": 18175, "epoch": 432} {"train_loss": -5.31044864654541, "global_step": 18176, "epoch": 432} {"train_loss": -5.252965927124023, "global_step": 18177, "epoch": 432} {"train_loss": -5.1839094161987305, "global_step": 18178, "epoch": 432} {"train_loss": -5.2443389892578125, "global_step": 18179, "epoch": 432} {"train_loss": -4.981975555419922, "global_step": 18180, "epoch": 432} {"train_loss": -5.232837677001953, "global_step": 18181, "epoch": 432} {"train_loss": -5.216697692871094, "global_step": 18182, "epoch": 432} {"train_loss": -5.251786231994629, "global_step": 18183, "epoch": 432} {"train_loss": -5.304839611053467, "global_step": 18184, "epoch": 432} {"train_loss": -5.2588285605112715, "global_step": 18185, "epoch": 432, "val_loss": 69504.9140625} {"train_loss": -5.182042598724365, "global_step": 18186, "epoch": 433} {"train_loss": -5.227071762084961, "global_step": 18187, "epoch": 433} {"train_loss": -5.26080322265625, "global_step": 18188, "epoch": 433} {"train_loss": -5.209413528442383, "global_step": 18189, "epoch": 433} {"train_loss": -5.193002700805664, "global_step": 18190, "epoch": 433} {"train_loss": -5.085967063903809, "global_step": 18191, "epoch": 433} {"train_loss": -5.2715253829956055, "global_step": 18192, "epoch": 433} {"train_loss": -5.085943222045898, "global_step": 18193, "epoch": 433} {"train_loss": -5.276313304901123, "global_step": 18194, "epoch": 433} {"train_loss": -5.173561096191406, "global_step": 18195, "epoch": 433} {"train_loss": -5.307831287384033, "global_step": 18196, "epoch": 433} {"train_loss": -5.385471343994141, "global_step": 18197, "epoch": 433} {"train_loss": -5.2286577224731445, "global_step": 18198, "epoch": 433} {"train_loss": -5.191702365875244, "global_step": 18199, "epoch": 433} {"train_loss": -5.237284183502197, "global_step": 18200, "epoch": 433} {"train_loss": -5.20794677734375, "global_step": 18201, "epoch": 433} {"train_loss": -5.239260673522949, "global_step": 18202, "epoch": 433} {"train_loss": -5.1559343338012695, "global_step": 18203, "epoch": 433} {"train_loss": -5.396828651428223, "global_step": 18204, "epoch": 433} {"train_loss": -5.308405876159668, "global_step": 18205, "epoch": 433} {"train_loss": -5.290743827819824, "global_step": 18206, "epoch": 433} {"train_loss": -5.289766311645508, "global_step": 18207, "epoch": 433} {"train_loss": -5.127519130706787, "global_step": 18208, "epoch": 433} {"train_loss": -5.234945297241211, "global_step": 18209, "epoch": 433} {"train_loss": -5.3727707862854, "global_step": 18210, "epoch": 433} {"train_loss": -5.259479999542236, "global_step": 18211, "epoch": 433} {"train_loss": -5.26126766204834, "global_step": 18212, "epoch": 433} {"train_loss": -5.228296756744385, "global_step": 18213, "epoch": 433} {"train_loss": -5.099197864532471, "global_step": 18214, "epoch": 433} {"train_loss": -5.371920108795166, "global_step": 18215, "epoch": 433} {"train_loss": -5.174001693725586, "global_step": 18216, "epoch": 433} {"train_loss": -5.208629608154297, "global_step": 18217, "epoch": 433} {"train_loss": -5.222187042236328, "global_step": 18218, "epoch": 433} {"train_loss": -5.268754959106445, "global_step": 18219, "epoch": 433} {"train_loss": -5.29562520980835, "global_step": 18220, "epoch": 433} {"train_loss": -5.2655229568481445, "global_step": 18221, "epoch": 433} {"train_loss": -5.253481864929199, "global_step": 18222, "epoch": 433} {"train_loss": -5.318397521972656, "global_step": 18223, "epoch": 433} {"train_loss": -5.1451616287231445, "global_step": 18224, "epoch": 433} {"train_loss": -5.349245071411133, "global_step": 18225, "epoch": 433} {"train_loss": -5.186638832092285, "global_step": 18226, "epoch": 433} {"train_loss": -5.239650680905297, "global_step": 18227, "epoch": 433, "val_loss": 69457.21875} {"train_loss": -5.4041619300842285, "global_step": 18228, "epoch": 434} {"train_loss": -5.279126167297363, "global_step": 18229, "epoch": 434} {"train_loss": -5.308698654174805, "global_step": 18230, "epoch": 434} {"train_loss": -5.186308860778809, "global_step": 18231, "epoch": 434} {"train_loss": -5.166652679443359, "global_step": 18232, "epoch": 434} {"train_loss": -5.351292610168457, "global_step": 18233, "epoch": 434} {"train_loss": -5.268650531768799, "global_step": 18234, "epoch": 434} {"train_loss": -5.178412914276123, "global_step": 18235, "epoch": 434} {"train_loss": -5.29428768157959, "global_step": 18236, "epoch": 434} {"train_loss": -5.172806739807129, "global_step": 18237, "epoch": 434} {"train_loss": -5.356375694274902, "global_step": 18238, "epoch": 434} {"train_loss": -5.223150730133057, "global_step": 18239, "epoch": 434} {"train_loss": -5.213541507720947, "global_step": 18240, "epoch": 434} {"train_loss": -5.039816856384277, "global_step": 18241, "epoch": 434} {"train_loss": -5.2174482345581055, "global_step": 18242, "epoch": 434} {"train_loss": -5.252570629119873, "global_step": 18243, "epoch": 434} {"train_loss": -5.304238319396973, "global_step": 18244, "epoch": 434} {"train_loss": -5.300259590148926, "global_step": 18245, "epoch": 434} {"train_loss": -4.999964237213135, "global_step": 18246, "epoch": 434} {"train_loss": -5.272335052490234, "global_step": 18247, "epoch": 434} {"train_loss": -5.103046417236328, "global_step": 18248, "epoch": 434} {"train_loss": -5.198947906494141, "global_step": 18249, "epoch": 434} {"train_loss": -5.187832832336426, "global_step": 18250, "epoch": 434} {"train_loss": -5.127617835998535, "global_step": 18251, "epoch": 434} {"train_loss": -5.27433967590332, "global_step": 18252, "epoch": 434} {"train_loss": -5.184967041015625, "global_step": 18253, "epoch": 434} {"train_loss": -5.228079795837402, "global_step": 18254, "epoch": 434} {"train_loss": -5.203069686889648, "global_step": 18255, "epoch": 434} {"train_loss": -5.15283203125, "global_step": 18256, "epoch": 434} {"train_loss": -5.184238433837891, "global_step": 18257, "epoch": 434} {"train_loss": -5.157303810119629, "global_step": 18258, "epoch": 434} {"train_loss": -5.352240562438965, "global_step": 18259, "epoch": 434} {"train_loss": -5.231549263000488, "global_step": 18260, "epoch": 434} {"train_loss": -5.232462406158447, "global_step": 18261, "epoch": 434} {"train_loss": -5.267748832702637, "global_step": 18262, "epoch": 434} {"train_loss": -5.340631008148193, "global_step": 18263, "epoch": 434} {"train_loss": -5.312407493591309, "global_step": 18264, "epoch": 434} {"train_loss": -5.274096488952637, "global_step": 18265, "epoch": 434} {"train_loss": -5.333996295928955, "global_step": 18266, "epoch": 434} {"train_loss": -5.353241920471191, "global_step": 18267, "epoch": 434} {"train_loss": -5.2390875816345215, "global_step": 18268, "epoch": 434} {"train_loss": -5.234830549785069, "global_step": 18269, "epoch": 434, "val_loss": 69448.71875} {"train_loss": -5.238163948059082, "global_step": 18270, "epoch": 435} {"train_loss": -5.176889896392822, "global_step": 18271, "epoch": 435} {"train_loss": -5.147469520568848, "global_step": 18272, "epoch": 435} {"train_loss": -5.189043998718262, "global_step": 18273, "epoch": 435} {"train_loss": -5.265792369842529, "global_step": 18274, "epoch": 435} {"train_loss": -5.205024242401123, "global_step": 18275, "epoch": 435} {"train_loss": -5.429865837097168, "global_step": 18276, "epoch": 435} {"train_loss": -5.381945610046387, "global_step": 18277, "epoch": 435} {"train_loss": -5.272452354431152, "global_step": 18278, "epoch": 435} {"train_loss": -5.233377933502197, "global_step": 18279, "epoch": 435} {"train_loss": -5.238743782043457, "global_step": 18280, "epoch": 435} {"train_loss": -5.327018737792969, "global_step": 18281, "epoch": 435} {"train_loss": -5.2206220626831055, "global_step": 18282, "epoch": 435} {"train_loss": -5.270118713378906, "global_step": 18283, "epoch": 435} {"train_loss": -5.262367248535156, "global_step": 18284, "epoch": 435} {"train_loss": -5.253292083740234, "global_step": 18285, "epoch": 435} {"train_loss": -5.230597496032715, "global_step": 18286, "epoch": 435} {"train_loss": -5.286499500274658, "global_step": 18287, "epoch": 435} {"train_loss": -5.36942195892334, "global_step": 18288, "epoch": 435} {"train_loss": -5.165861129760742, "global_step": 18289, "epoch": 435} {"train_loss": -5.220120429992676, "global_step": 18290, "epoch": 435} {"train_loss": -5.281050682067871, "global_step": 18291, "epoch": 435} {"train_loss": -5.380346298217773, "global_step": 18292, "epoch": 435} {"train_loss": -5.363828182220459, "global_step": 18293, "epoch": 435} {"train_loss": -5.277745723724365, "global_step": 18294, "epoch": 435} {"train_loss": -5.346637725830078, "global_step": 18295, "epoch": 435} {"train_loss": -5.347044944763184, "global_step": 18296, "epoch": 435} {"train_loss": -5.402676582336426, "global_step": 18297, "epoch": 435} {"train_loss": -5.521221160888672, "global_step": 18298, "epoch": 435} {"train_loss": -5.287683486938477, "global_step": 18299, "epoch": 435} {"train_loss": -5.2986602783203125, "global_step": 18300, "epoch": 435} {"train_loss": -5.254763603210449, "global_step": 18301, "epoch": 435} {"train_loss": -5.207306861877441, "global_step": 18302, "epoch": 435} {"train_loss": -5.190011501312256, "global_step": 18303, "epoch": 435} {"train_loss": -5.391111373901367, "global_step": 18304, "epoch": 435} {"train_loss": -5.310480117797852, "global_step": 18305, "epoch": 435} {"train_loss": -5.262281894683838, "global_step": 18306, "epoch": 435} {"train_loss": -5.221645355224609, "global_step": 18307, "epoch": 435} {"train_loss": -5.288487434387207, "global_step": 18308, "epoch": 435} {"train_loss": -5.276668548583984, "global_step": 18309, "epoch": 435} {"train_loss": -5.268093109130859, "global_step": 18310, "epoch": 435} {"train_loss": -5.280084814344134, "global_step": 18311, "epoch": 435, "val_loss": 69767.4453125} {"train_loss": -5.389361381530762, "global_step": 18312, "epoch": 436} {"train_loss": -5.276358604431152, "global_step": 18313, "epoch": 436} {"train_loss": -5.277230739593506, "global_step": 18314, "epoch": 436} {"train_loss": -5.380134582519531, "global_step": 18315, "epoch": 436} {"train_loss": -5.348013877868652, "global_step": 18316, "epoch": 436} {"train_loss": -5.323246955871582, "global_step": 18317, "epoch": 436} {"train_loss": -5.441763877868652, "global_step": 18318, "epoch": 436} {"train_loss": -5.122037410736084, "global_step": 18319, "epoch": 436} {"train_loss": -5.357446670532227, "global_step": 18320, "epoch": 436} {"train_loss": -5.434634208679199, "global_step": 18321, "epoch": 436} {"train_loss": -5.286709308624268, "global_step": 18322, "epoch": 436} {"train_loss": -5.270722389221191, "global_step": 18323, "epoch": 436} {"train_loss": -5.339870452880859, "global_step": 18324, "epoch": 436} {"train_loss": -5.127250671386719, "global_step": 18325, "epoch": 436} {"train_loss": -5.466230392456055, "global_step": 18326, "epoch": 436} {"train_loss": -5.265407085418701, "global_step": 18327, "epoch": 436} {"train_loss": -5.063675880432129, "global_step": 18328, "epoch": 436} {"train_loss": -5.283158302307129, "global_step": 18329, "epoch": 436} {"train_loss": -5.226667404174805, "global_step": 18330, "epoch": 436} {"train_loss": -5.04179573059082, "global_step": 18331, "epoch": 436} {"train_loss": -5.260217189788818, "global_step": 18332, "epoch": 436} {"train_loss": -5.095576286315918, "global_step": 18333, "epoch": 436} {"train_loss": -5.182827472686768, "global_step": 18334, "epoch": 436} {"train_loss": -5.163661003112793, "global_step": 18335, "epoch": 436} {"train_loss": -5.258845806121826, "global_step": 18336, "epoch": 436} {"train_loss": -5.334402561187744, "global_step": 18337, "epoch": 436} {"train_loss": -5.276376724243164, "global_step": 18338, "epoch": 436} {"train_loss": -5.418943405151367, "global_step": 18339, "epoch": 436} {"train_loss": -5.24926233291626, "global_step": 18340, "epoch": 436} {"train_loss": -5.29973030090332, "global_step": 18341, "epoch": 436} {"train_loss": -5.278729438781738, "global_step": 18342, "epoch": 436} {"train_loss": -5.1541290283203125, "global_step": 18343, "epoch": 436} {"train_loss": -5.196562767028809, "global_step": 18344, "epoch": 436} {"train_loss": -5.229436874389648, "global_step": 18345, "epoch": 436} {"train_loss": -5.221489429473877, "global_step": 18346, "epoch": 436} {"train_loss": -5.353036880493164, "global_step": 18347, "epoch": 436} {"train_loss": -5.422064781188965, "global_step": 18348, "epoch": 436} {"train_loss": -5.200564861297607, "global_step": 18349, "epoch": 436} {"train_loss": -5.142528533935547, "global_step": 18350, "epoch": 436} {"train_loss": -5.260478973388672, "global_step": 18351, "epoch": 436} {"train_loss": -5.337621688842773, "global_step": 18352, "epoch": 436} {"train_loss": -5.270909173148019, "global_step": 18353, "epoch": 436, "val_loss": 69603.015625} {"train_loss": -5.187370300292969, "global_step": 18354, "epoch": 437} {"train_loss": -5.487800121307373, "global_step": 18355, "epoch": 437} {"train_loss": -5.24785852432251, "global_step": 18356, "epoch": 437} {"train_loss": -5.183925628662109, "global_step": 18357, "epoch": 437} {"train_loss": -5.306012153625488, "global_step": 18358, "epoch": 437} {"train_loss": -5.2664690017700195, "global_step": 18359, "epoch": 437} {"train_loss": -5.164277076721191, "global_step": 18360, "epoch": 437} {"train_loss": -5.086580276489258, "global_step": 18361, "epoch": 437} {"train_loss": -5.224871635437012, "global_step": 18362, "epoch": 437} {"train_loss": -5.270135879516602, "global_step": 18363, "epoch": 437} {"train_loss": -5.073369979858398, "global_step": 18364, "epoch": 437} {"train_loss": -5.2435736656188965, "global_step": 18365, "epoch": 437} {"train_loss": -5.099623680114746, "global_step": 18366, "epoch": 437} {"train_loss": -5.191285133361816, "global_step": 18367, "epoch": 437} {"train_loss": -5.304049015045166, "global_step": 18368, "epoch": 437} {"train_loss": -5.218042373657227, "global_step": 18369, "epoch": 437} {"train_loss": -5.17249870300293, "global_step": 18370, "epoch": 437} {"train_loss": -5.224484443664551, "global_step": 18371, "epoch": 437} {"train_loss": -5.213315010070801, "global_step": 18372, "epoch": 437} {"train_loss": -5.267512321472168, "global_step": 18373, "epoch": 437} {"train_loss": -5.032165050506592, "global_step": 18374, "epoch": 437} {"train_loss": -5.240843296051025, "global_step": 18375, "epoch": 437} {"train_loss": -5.106543064117432, "global_step": 18376, "epoch": 437} {"train_loss": -5.292331695556641, "global_step": 18377, "epoch": 437} {"train_loss": -5.121071815490723, "global_step": 18378, "epoch": 437} {"train_loss": -5.259642601013184, "global_step": 18379, "epoch": 437} {"train_loss": -5.171233654022217, "global_step": 18380, "epoch": 437} {"train_loss": -5.2409443855285645, "global_step": 18381, "epoch": 437} {"train_loss": -5.289286136627197, "global_step": 18382, "epoch": 437} {"train_loss": -5.234838485717773, "global_step": 18383, "epoch": 437} {"train_loss": -5.13348388671875, "global_step": 18384, "epoch": 437} {"train_loss": -5.240937232971191, "global_step": 18385, "epoch": 437} {"train_loss": -5.254019737243652, "global_step": 18386, "epoch": 437} {"train_loss": -5.239940643310547, "global_step": 18387, "epoch": 437} {"train_loss": -5.251731872558594, "global_step": 18388, "epoch": 437} {"train_loss": -5.296522617340088, "global_step": 18389, "epoch": 437} {"train_loss": -5.20963191986084, "global_step": 18390, "epoch": 437} {"train_loss": -5.247039318084717, "global_step": 18391, "epoch": 437} {"train_loss": -5.280999183654785, "global_step": 18392, "epoch": 437} {"train_loss": -5.249636650085449, "global_step": 18393, "epoch": 437} {"train_loss": -5.190552234649658, "global_step": 18394, "epoch": 437} {"train_loss": -5.220083554585774, "global_step": 18395, "epoch": 437, "val_loss": 69767.1015625} {"train_loss": -5.324856281280518, "global_step": 18396, "epoch": 438} {"train_loss": -5.265981197357178, "global_step": 18397, "epoch": 438} {"train_loss": -5.121181488037109, "global_step": 18398, "epoch": 438} {"train_loss": -5.200616836547852, "global_step": 18399, "epoch": 438} {"train_loss": -5.150566101074219, "global_step": 18400, "epoch": 438} {"train_loss": -5.193325996398926, "global_step": 18401, "epoch": 438} {"train_loss": -5.353977203369141, "global_step": 18402, "epoch": 438} {"train_loss": -5.275684356689453, "global_step": 18403, "epoch": 438} {"train_loss": -5.252619743347168, "global_step": 18404, "epoch": 438} {"train_loss": -5.23764705657959, "global_step": 18405, "epoch": 438} {"train_loss": -5.2539286613464355, "global_step": 18406, "epoch": 438} {"train_loss": -5.387713432312012, "global_step": 18407, "epoch": 438} {"train_loss": -5.315291404724121, "global_step": 18408, "epoch": 438} {"train_loss": -5.276532173156738, "global_step": 18409, "epoch": 438} {"train_loss": -5.436718940734863, "global_step": 18410, "epoch": 438} {"train_loss": -5.294155120849609, "global_step": 18411, "epoch": 438} {"train_loss": -5.103028297424316, "global_step": 18412, "epoch": 438} {"train_loss": -5.205167293548584, "global_step": 18413, "epoch": 438} {"train_loss": -5.2692551612854, "global_step": 18414, "epoch": 438} {"train_loss": -5.2529168128967285, "global_step": 18415, "epoch": 438} {"train_loss": -5.2856669425964355, "global_step": 18416, "epoch": 438} {"train_loss": -5.279425144195557, "global_step": 18417, "epoch": 438} {"train_loss": -5.261538028717041, "global_step": 18418, "epoch": 438} {"train_loss": -5.331895351409912, "global_step": 18419, "epoch": 438} {"train_loss": -5.246854782104492, "global_step": 18420, "epoch": 438} {"train_loss": -5.287144660949707, "global_step": 18421, "epoch": 438} {"train_loss": -5.306398391723633, "global_step": 18422, "epoch": 438} {"train_loss": -5.248892784118652, "global_step": 18423, "epoch": 438} {"train_loss": -5.293643951416016, "global_step": 18424, "epoch": 438} {"train_loss": -5.391540050506592, "global_step": 18425, "epoch": 438} {"train_loss": -5.371117115020752, "global_step": 18426, "epoch": 438} {"train_loss": -5.236448287963867, "global_step": 18427, "epoch": 438} {"train_loss": -5.290000915527344, "global_step": 18428, "epoch": 438} {"train_loss": -5.345366954803467, "global_step": 18429, "epoch": 438} {"train_loss": -5.330206871032715, "global_step": 18430, "epoch": 438} {"train_loss": -5.220552921295166, "global_step": 18431, "epoch": 438} {"train_loss": -5.314212799072266, "global_step": 18432, "epoch": 438} {"train_loss": -5.358502388000488, "global_step": 18433, "epoch": 438} {"train_loss": -5.443357944488525, "global_step": 18434, "epoch": 438} {"train_loss": -5.346397399902344, "global_step": 18435, "epoch": 438} {"train_loss": -5.329232692718506, "global_step": 18436, "epoch": 438} {"train_loss": -5.2829669543675015, "global_step": 18437, "epoch": 438, "val_loss": 69545.4453125} {"train_loss": -5.239231586456299, "global_step": 18438, "epoch": 439} {"train_loss": -5.272737979888916, "global_step": 18439, "epoch": 439} {"train_loss": -5.207117080688477, "global_step": 18440, "epoch": 439} {"train_loss": -5.182092666625977, "global_step": 18441, "epoch": 439} {"train_loss": -5.271056175231934, "global_step": 18442, "epoch": 439} {"train_loss": -5.222118854522705, "global_step": 18443, "epoch": 439} {"train_loss": -5.2570319175720215, "global_step": 18444, "epoch": 439} {"train_loss": -5.302321434020996, "global_step": 18445, "epoch": 439} {"train_loss": -5.300146579742432, "global_step": 18446, "epoch": 439} {"train_loss": -5.275710105895996, "global_step": 18447, "epoch": 439} {"train_loss": -5.21950626373291, "global_step": 18448, "epoch": 439} {"train_loss": -5.301968574523926, "global_step": 18449, "epoch": 439} {"train_loss": -5.277237892150879, "global_step": 18450, "epoch": 439} {"train_loss": -5.3357625007629395, "global_step": 18451, "epoch": 439} {"train_loss": -5.288778781890869, "global_step": 18452, "epoch": 439} {"train_loss": -5.12498664855957, "global_step": 18453, "epoch": 439} {"train_loss": -5.207732677459717, "global_step": 18454, "epoch": 439} {"train_loss": -5.351264953613281, "global_step": 18455, "epoch": 439} {"train_loss": -5.22800874710083, "global_step": 18456, "epoch": 439} {"train_loss": -5.37399435043335, "global_step": 18457, "epoch": 439} {"train_loss": -5.3380327224731445, "global_step": 18458, "epoch": 439} {"train_loss": -5.300320625305176, "global_step": 18459, "epoch": 439} {"train_loss": -5.281087875366211, "global_step": 18460, "epoch": 439} {"train_loss": -5.2496538162231445, "global_step": 18461, "epoch": 439} {"train_loss": -5.266421794891357, "global_step": 18462, "epoch": 439} {"train_loss": -5.237926959991455, "global_step": 18463, "epoch": 439} {"train_loss": -5.446981906890869, "global_step": 18464, "epoch": 439} {"train_loss": -5.273316383361816, "global_step": 18465, "epoch": 439} {"train_loss": -5.1949005126953125, "global_step": 18466, "epoch": 439} {"train_loss": -5.338088035583496, "global_step": 18467, "epoch": 439} {"train_loss": -5.380179405212402, "global_step": 18468, "epoch": 439} {"train_loss": -5.281584739685059, "global_step": 18469, "epoch": 439} {"train_loss": -5.28935432434082, "global_step": 18470, "epoch": 439} {"train_loss": -5.259958267211914, "global_step": 18471, "epoch": 439} {"train_loss": -5.422457218170166, "global_step": 18472, "epoch": 439} {"train_loss": -5.184412956237793, "global_step": 18473, "epoch": 439} {"train_loss": -5.449997901916504, "global_step": 18474, "epoch": 439} {"train_loss": -5.206577777862549, "global_step": 18475, "epoch": 439} {"train_loss": -4.911067008972168, "global_step": 18476, "epoch": 439} {"train_loss": -5.317385196685791, "global_step": 18477, "epoch": 439} {"train_loss": -4.960686683654785, "global_step": 18478, "epoch": 439} {"train_loss": -5.26377702894665, "global_step": 18479, "epoch": 439, "val_loss": 69885.375} {"train_loss": -5.215887069702148, "global_step": 18480, "epoch": 440} {"train_loss": -5.131725311279297, "global_step": 18481, "epoch": 440} {"train_loss": -5.273455619812012, "global_step": 18482, "epoch": 440} {"train_loss": -5.3089494705200195, "global_step": 18483, "epoch": 440} {"train_loss": -5.2791595458984375, "global_step": 18484, "epoch": 440} {"train_loss": -5.297676086425781, "global_step": 18485, "epoch": 440} {"train_loss": -5.187033653259277, "global_step": 18486, "epoch": 440} {"train_loss": -5.4370598793029785, "global_step": 18487, "epoch": 440} {"train_loss": -5.384336471557617, "global_step": 18488, "epoch": 440} {"train_loss": -5.193729400634766, "global_step": 18489, "epoch": 440} {"train_loss": -5.265049457550049, "global_step": 18490, "epoch": 440} {"train_loss": -5.359611511230469, "global_step": 18491, "epoch": 440} {"train_loss": -5.1627912521362305, "global_step": 18492, "epoch": 440} {"train_loss": -5.147273540496826, "global_step": 18493, "epoch": 440} {"train_loss": -5.159200191497803, "global_step": 18494, "epoch": 440} {"train_loss": -5.185360908508301, "global_step": 18495, "epoch": 440} {"train_loss": -5.203632354736328, "global_step": 18496, "epoch": 440} {"train_loss": -5.267331123352051, "global_step": 18497, "epoch": 440} {"train_loss": -5.350008487701416, "global_step": 18498, "epoch": 440} {"train_loss": -5.279940128326416, "global_step": 18499, "epoch": 440} {"train_loss": -5.274558067321777, "global_step": 18500, "epoch": 440} {"train_loss": -5.186205863952637, "global_step": 18501, "epoch": 440} {"train_loss": -5.329801559448242, "global_step": 18502, "epoch": 440} {"train_loss": -5.393459320068359, "global_step": 18503, "epoch": 440} {"train_loss": -5.253336429595947, "global_step": 18504, "epoch": 440} {"train_loss": -5.227294445037842, "global_step": 18505, "epoch": 440} {"train_loss": -5.351902484893799, "global_step": 18506, "epoch": 440} {"train_loss": -5.377044677734375, "global_step": 18507, "epoch": 440} {"train_loss": -5.354328155517578, "global_step": 18508, "epoch": 440} {"train_loss": -5.369157791137695, "global_step": 18509, "epoch": 440} {"train_loss": -5.342878341674805, "global_step": 18510, "epoch": 440} {"train_loss": -5.346563339233398, "global_step": 18511, "epoch": 440} {"train_loss": -5.266476154327393, "global_step": 18512, "epoch": 440} {"train_loss": -5.271510124206543, "global_step": 18513, "epoch": 440} {"train_loss": -5.378568649291992, "global_step": 18514, "epoch": 440} {"train_loss": -5.2989325523376465, "global_step": 18515, "epoch": 440} {"train_loss": -5.341981887817383, "global_step": 18516, "epoch": 440} {"train_loss": -5.429826259613037, "global_step": 18517, "epoch": 440} {"train_loss": -5.305431365966797, "global_step": 18518, "epoch": 440} {"train_loss": -5.261368274688721, "global_step": 18519, "epoch": 440} {"train_loss": -5.295456886291504, "global_step": 18520, "epoch": 440} {"train_loss": -5.286233788444882, "global_step": 18521, "epoch": 440, "val_loss": 69656.109375} {"train_loss": -5.29628324508667, "global_step": 18522, "epoch": 441} {"train_loss": -5.293377876281738, "global_step": 18523, "epoch": 441} {"train_loss": -5.212039947509766, "global_step": 18524, "epoch": 441} {"train_loss": -5.327025413513184, "global_step": 18525, "epoch": 441} {"train_loss": -5.236388206481934, "global_step": 18526, "epoch": 441} {"train_loss": -5.18447208404541, "global_step": 18527, "epoch": 441} {"train_loss": -5.212018966674805, "global_step": 18528, "epoch": 441} {"train_loss": -5.259209156036377, "global_step": 18529, "epoch": 441} {"train_loss": -5.174624919891357, "global_step": 18530, "epoch": 441} {"train_loss": -5.355403423309326, "global_step": 18531, "epoch": 441} {"train_loss": -5.315404891967773, "global_step": 18532, "epoch": 441} {"train_loss": -5.353337287902832, "global_step": 18533, "epoch": 441} {"train_loss": -5.191823959350586, "global_step": 18534, "epoch": 441} {"train_loss": -5.317623615264893, "global_step": 18535, "epoch": 441} {"train_loss": -5.132319927215576, "global_step": 18536, "epoch": 441} {"train_loss": -5.214347839355469, "global_step": 18537, "epoch": 441} {"train_loss": -5.258701801300049, "global_step": 18538, "epoch": 441} {"train_loss": -5.422518730163574, "global_step": 18539, "epoch": 441} {"train_loss": -5.3772101402282715, "global_step": 18540, "epoch": 441} {"train_loss": -5.397711277008057, "global_step": 18541, "epoch": 441} {"train_loss": -5.235403537750244, "global_step": 18542, "epoch": 441} {"train_loss": -5.337944030761719, "global_step": 18543, "epoch": 441} {"train_loss": -5.308018684387207, "global_step": 18544, "epoch": 441} {"train_loss": -5.253148078918457, "global_step": 18545, "epoch": 441} {"train_loss": -5.239439010620117, "global_step": 18546, "epoch": 441} {"train_loss": -5.234697341918945, "global_step": 18547, "epoch": 441} {"train_loss": -5.258465766906738, "global_step": 18548, "epoch": 441} {"train_loss": -5.357525825500488, "global_step": 18549, "epoch": 441} {"train_loss": -5.313420295715332, "global_step": 18550, "epoch": 441} {"train_loss": -5.307656764984131, "global_step": 18551, "epoch": 441} {"train_loss": -5.208065032958984, "global_step": 18552, "epoch": 441} {"train_loss": -5.145686626434326, "global_step": 18553, "epoch": 441} {"train_loss": -5.39501953125, "global_step": 18554, "epoch": 441} {"train_loss": -5.329482078552246, "global_step": 18555, "epoch": 441} {"train_loss": -5.227335453033447, "global_step": 18556, "epoch": 441} {"train_loss": -5.207045078277588, "global_step": 18557, "epoch": 441} {"train_loss": -5.137636184692383, "global_step": 18558, "epoch": 441} {"train_loss": -5.118978023529053, "global_step": 18559, "epoch": 441} {"train_loss": -5.154987812042236, "global_step": 18560, "epoch": 441} {"train_loss": -5.322744846343994, "global_step": 18561, "epoch": 441} {"train_loss": -5.093718528747559, "global_step": 18562, "epoch": 441} {"train_loss": -5.261912198293777, "global_step": 18563, "epoch": 441, "val_loss": 70170.4296875} {"train_loss": -5.133363246917725, "global_step": 18564, "epoch": 442} {"train_loss": -5.316299915313721, "global_step": 18565, "epoch": 442} {"train_loss": -5.414106369018555, "global_step": 18566, "epoch": 442} {"train_loss": -5.182579517364502, "global_step": 18567, "epoch": 442} {"train_loss": -5.238931655883789, "global_step": 18568, "epoch": 442} {"train_loss": -5.283071517944336, "global_step": 18569, "epoch": 442} {"train_loss": -5.313896179199219, "global_step": 18570, "epoch": 442} {"train_loss": -5.417995929718018, "global_step": 18571, "epoch": 442} {"train_loss": -5.297802448272705, "global_step": 18572, "epoch": 442} {"train_loss": -5.2594685554504395, "global_step": 18573, "epoch": 442} {"train_loss": -5.369959354400635, "global_step": 18574, "epoch": 442} {"train_loss": -5.176328182220459, "global_step": 18575, "epoch": 442} {"train_loss": -5.476140022277832, "global_step": 18576, "epoch": 442} {"train_loss": -5.283957481384277, "global_step": 18577, "epoch": 442} {"train_loss": -5.157486438751221, "global_step": 18578, "epoch": 442} {"train_loss": -5.196816444396973, "global_step": 18579, "epoch": 442} {"train_loss": -5.292775630950928, "global_step": 18580, "epoch": 442} {"train_loss": -5.239508628845215, "global_step": 18581, "epoch": 442} {"train_loss": -5.219508647918701, "global_step": 18582, "epoch": 442} {"train_loss": -5.215078353881836, "global_step": 18583, "epoch": 442} {"train_loss": -5.153418064117432, "global_step": 18584, "epoch": 442} {"train_loss": -5.204503059387207, "global_step": 18585, "epoch": 442} {"train_loss": -5.37313175201416, "global_step": 18586, "epoch": 442} {"train_loss": -5.320677757263184, "global_step": 18587, "epoch": 442} {"train_loss": -5.335498332977295, "global_step": 18588, "epoch": 442} {"train_loss": -5.307370185852051, "global_step": 18589, "epoch": 442} {"train_loss": -5.399398326873779, "global_step": 18590, "epoch": 442} {"train_loss": -5.285822868347168, "global_step": 18591, "epoch": 442} {"train_loss": -5.320791244506836, "global_step": 18592, "epoch": 442} {"train_loss": -5.320555686950684, "global_step": 18593, "epoch": 442} {"train_loss": -5.25313138961792, "global_step": 18594, "epoch": 442} {"train_loss": -5.233384132385254, "global_step": 18595, "epoch": 442} {"train_loss": -5.306234836578369, "global_step": 18596, "epoch": 442} {"train_loss": -5.437933444976807, "global_step": 18597, "epoch": 442} {"train_loss": -5.265318870544434, "global_step": 18598, "epoch": 442} {"train_loss": -5.2721028327941895, "global_step": 18599, "epoch": 442} {"train_loss": -5.32604455947876, "global_step": 18600, "epoch": 442} {"train_loss": -5.349175453186035, "global_step": 18601, "epoch": 442} {"train_loss": -5.387920379638672, "global_step": 18602, "epoch": 442} {"train_loss": -5.186726093292236, "global_step": 18603, "epoch": 442} {"train_loss": -5.3856024742126465, "global_step": 18604, "epoch": 442} {"train_loss": -5.290641591662452, "global_step": 18605, "epoch": 442, "val_loss": 69643.7578125} {"train_loss": -5.217486381530762, "global_step": 18606, "epoch": 443} {"train_loss": -5.374888896942139, "global_step": 18607, "epoch": 443} {"train_loss": -5.216172695159912, "global_step": 18608, "epoch": 443} {"train_loss": -5.267396450042725, "global_step": 18609, "epoch": 443} {"train_loss": -5.330009460449219, "global_step": 18610, "epoch": 443} {"train_loss": -5.2158308029174805, "global_step": 18611, "epoch": 443} {"train_loss": -5.4686784744262695, "global_step": 18612, "epoch": 443} {"train_loss": -5.378918647766113, "global_step": 18613, "epoch": 443} {"train_loss": -5.251655578613281, "global_step": 18614, "epoch": 443} {"train_loss": -5.271949768066406, "global_step": 18615, "epoch": 443} {"train_loss": -5.341076374053955, "global_step": 18616, "epoch": 443} {"train_loss": -5.195530891418457, "global_step": 18617, "epoch": 443} {"train_loss": -5.178443431854248, "global_step": 18618, "epoch": 443} {"train_loss": -5.238463878631592, "global_step": 18619, "epoch": 443} {"train_loss": -5.43747615814209, "global_step": 18620, "epoch": 443} {"train_loss": -5.245091438293457, "global_step": 18621, "epoch": 443} {"train_loss": -5.3939971923828125, "global_step": 18622, "epoch": 443} {"train_loss": -5.368288516998291, "global_step": 18623, "epoch": 443} {"train_loss": -5.164015769958496, "global_step": 18624, "epoch": 443} {"train_loss": -5.314296722412109, "global_step": 18625, "epoch": 443} {"train_loss": -5.407416820526123, "global_step": 18626, "epoch": 443} {"train_loss": -5.154681205749512, "global_step": 18627, "epoch": 443} {"train_loss": -5.221583843231201, "global_step": 18628, "epoch": 443} {"train_loss": -5.241568565368652, "global_step": 18629, "epoch": 443} {"train_loss": -5.220248222351074, "global_step": 18630, "epoch": 443} {"train_loss": -5.0998029708862305, "global_step": 18631, "epoch": 443} {"train_loss": -5.290234565734863, "global_step": 18632, "epoch": 443} {"train_loss": -5.269728660583496, "global_step": 18633, "epoch": 443} {"train_loss": -5.177216529846191, "global_step": 18634, "epoch": 443} {"train_loss": -5.315871238708496, "global_step": 18635, "epoch": 443} {"train_loss": -5.243454933166504, "global_step": 18636, "epoch": 443} {"train_loss": -5.176055908203125, "global_step": 18637, "epoch": 443} {"train_loss": -5.239368915557861, "global_step": 18638, "epoch": 443} {"train_loss": -5.169464111328125, "global_step": 18639, "epoch": 443} {"train_loss": -5.191939353942871, "global_step": 18640, "epoch": 443} {"train_loss": -5.166348934173584, "global_step": 18641, "epoch": 443} {"train_loss": -5.3410325050354, "global_step": 18642, "epoch": 443} {"train_loss": -5.27972412109375, "global_step": 18643, "epoch": 443} {"train_loss": -5.27403450012207, "global_step": 18644, "epoch": 443} {"train_loss": -5.14005184173584, "global_step": 18645, "epoch": 443} {"train_loss": -5.15249490737915, "global_step": 18646, "epoch": 443} {"train_loss": -5.260630948202951, "global_step": 18647, "epoch": 443, "val_loss": 69494.796875} {"train_loss": -5.222330093383789, "global_step": 18648, "epoch": 444} {"train_loss": -5.309417724609375, "global_step": 18649, "epoch": 444} {"train_loss": -5.163434982299805, "global_step": 18650, "epoch": 444} {"train_loss": -5.324690818786621, "global_step": 18651, "epoch": 444} {"train_loss": -5.283503532409668, "global_step": 18652, "epoch": 444} {"train_loss": -5.287018299102783, "global_step": 18653, "epoch": 444} {"train_loss": -5.217951774597168, "global_step": 18654, "epoch": 444} {"train_loss": -5.353977203369141, "global_step": 18655, "epoch": 444} {"train_loss": -5.269988059997559, "global_step": 18656, "epoch": 444} {"train_loss": -5.131809711456299, "global_step": 18657, "epoch": 444} {"train_loss": -5.088655471801758, "global_step": 18658, "epoch": 444} {"train_loss": -5.253671169281006, "global_step": 18659, "epoch": 444} {"train_loss": -5.286653518676758, "global_step": 18660, "epoch": 444} {"train_loss": -5.141143798828125, "global_step": 18661, "epoch": 444} {"train_loss": -5.162093162536621, "global_step": 18662, "epoch": 444} {"train_loss": -5.194800853729248, "global_step": 18663, "epoch": 444} {"train_loss": -5.1952805519104, "global_step": 18664, "epoch": 444} {"train_loss": -5.295411586761475, "global_step": 18665, "epoch": 444} {"train_loss": -5.360328674316406, "global_step": 18666, "epoch": 444} {"train_loss": -5.070310592651367, "global_step": 18667, "epoch": 444} {"train_loss": -5.352042198181152, "global_step": 18668, "epoch": 444} {"train_loss": -5.3020734786987305, "global_step": 18669, "epoch": 444} {"train_loss": -5.190431594848633, "global_step": 18670, "epoch": 444} {"train_loss": -5.2144975662231445, "global_step": 18671, "epoch": 444} {"train_loss": -5.148073196411133, "global_step": 18672, "epoch": 444} {"train_loss": -5.346132278442383, "global_step": 18673, "epoch": 444} {"train_loss": -5.320215225219727, "global_step": 18674, "epoch": 444} {"train_loss": -5.188512802124023, "global_step": 18675, "epoch": 444} {"train_loss": -5.2196197509765625, "global_step": 18676, "epoch": 444} {"train_loss": -5.27419376373291, "global_step": 18677, "epoch": 444} {"train_loss": -5.365878105163574, "global_step": 18678, "epoch": 444} {"train_loss": -5.204125881195068, "global_step": 18679, "epoch": 444} {"train_loss": -5.188445091247559, "global_step": 18680, "epoch": 444} {"train_loss": -5.29876708984375, "global_step": 18681, "epoch": 444} {"train_loss": -5.094160079956055, "global_step": 18682, "epoch": 444} {"train_loss": -5.437632083892822, "global_step": 18683, "epoch": 444} {"train_loss": -5.352039813995361, "global_step": 18684, "epoch": 444} {"train_loss": -5.404803276062012, "global_step": 18685, "epoch": 444} {"train_loss": -5.366790771484375, "global_step": 18686, "epoch": 444} {"train_loss": -5.287086486816406, "global_step": 18687, "epoch": 444} {"train_loss": -5.271178722381592, "global_step": 18688, "epoch": 444} {"train_loss": -5.255933420998709, "global_step": 18689, "epoch": 444, "val_loss": 69396.140625} {"train_loss": -5.168063163757324, "global_step": 18690, "epoch": 445} {"train_loss": -5.271033763885498, "global_step": 18691, "epoch": 445} {"train_loss": -5.440796852111816, "global_step": 18692, "epoch": 445} {"train_loss": -5.215799808502197, "global_step": 18693, "epoch": 445} {"train_loss": -5.360751152038574, "global_step": 18694, "epoch": 445} {"train_loss": -5.292665481567383, "global_step": 18695, "epoch": 445} {"train_loss": -5.072265625, "global_step": 18696, "epoch": 445} {"train_loss": -5.421655654907227, "global_step": 18697, "epoch": 445} {"train_loss": -5.344841480255127, "global_step": 18698, "epoch": 445} {"train_loss": -5.110982894897461, "global_step": 18699, "epoch": 445} {"train_loss": -5.296890735626221, "global_step": 18700, "epoch": 445} {"train_loss": -5.127942085266113, "global_step": 18701, "epoch": 445} {"train_loss": -5.189608097076416, "global_step": 18702, "epoch": 445} {"train_loss": -5.221994400024414, "global_step": 18703, "epoch": 445} {"train_loss": -5.306998252868652, "global_step": 18704, "epoch": 445} {"train_loss": -5.142408847808838, "global_step": 18705, "epoch": 445} {"train_loss": -5.242994785308838, "global_step": 18706, "epoch": 445} {"train_loss": -5.2943549156188965, "global_step": 18707, "epoch": 445} {"train_loss": -5.371665000915527, "global_step": 18708, "epoch": 445} {"train_loss": -5.128881454467773, "global_step": 18709, "epoch": 445} {"train_loss": -5.285818099975586, "global_step": 18710, "epoch": 445} {"train_loss": -5.229953765869141, "global_step": 18711, "epoch": 445} {"train_loss": -5.205141544342041, "global_step": 18712, "epoch": 445} {"train_loss": -5.250797271728516, "global_step": 18713, "epoch": 445} {"train_loss": -5.214158058166504, "global_step": 18714, "epoch": 445} {"train_loss": -5.1341400146484375, "global_step": 18715, "epoch": 445} {"train_loss": -5.344724655151367, "global_step": 18716, "epoch": 445} {"train_loss": -5.233972549438477, "global_step": 18717, "epoch": 445} {"train_loss": -5.055693626403809, "global_step": 18718, "epoch": 445} {"train_loss": -5.390275478363037, "global_step": 18719, "epoch": 445} {"train_loss": -5.280356407165527, "global_step": 18720, "epoch": 445} {"train_loss": -5.219821929931641, "global_step": 18721, "epoch": 445} {"train_loss": -5.3235626220703125, "global_step": 18722, "epoch": 445} {"train_loss": -5.2970991134643555, "global_step": 18723, "epoch": 445} {"train_loss": -5.4087958335876465, "global_step": 18724, "epoch": 445} {"train_loss": -5.2442097663879395, "global_step": 18725, "epoch": 445} {"train_loss": -5.229516983032227, "global_step": 18726, "epoch": 445} {"train_loss": -5.188846111297607, "global_step": 18727, "epoch": 445} {"train_loss": -5.306116104125977, "global_step": 18728, "epoch": 445} {"train_loss": -5.250482559204102, "global_step": 18729, "epoch": 445} {"train_loss": -5.400891304016113, "global_step": 18730, "epoch": 445} {"train_loss": -5.257368632725307, "global_step": 18731, "epoch": 445, "val_loss": 69319.9140625} {"train_loss": -5.272097587585449, "global_step": 18732, "epoch": 446} {"train_loss": -5.210640907287598, "global_step": 18733, "epoch": 446} {"train_loss": -5.419274806976318, "global_step": 18734, "epoch": 446} {"train_loss": -5.232231140136719, "global_step": 18735, "epoch": 446} {"train_loss": -5.261233329772949, "global_step": 18736, "epoch": 446} {"train_loss": -5.347827911376953, "global_step": 18737, "epoch": 446} {"train_loss": -5.347152233123779, "global_step": 18738, "epoch": 446} {"train_loss": -5.357479095458984, "global_step": 18739, "epoch": 446} {"train_loss": -5.207819938659668, "global_step": 18740, "epoch": 446} {"train_loss": -5.270130157470703, "global_step": 18741, "epoch": 446} {"train_loss": -5.298295021057129, "global_step": 18742, "epoch": 446} {"train_loss": -5.32122802734375, "global_step": 18743, "epoch": 446} {"train_loss": -5.345185279846191, "global_step": 18744, "epoch": 446} {"train_loss": -5.1783447265625, "global_step": 18745, "epoch": 446} {"train_loss": -5.26413631439209, "global_step": 18746, "epoch": 446} {"train_loss": -5.20456600189209, "global_step": 18747, "epoch": 446} {"train_loss": -5.24746036529541, "global_step": 18748, "epoch": 446} {"train_loss": -5.380518436431885, "global_step": 18749, "epoch": 446} {"train_loss": -5.341540336608887, "global_step": 18750, "epoch": 446} {"train_loss": -5.381532669067383, "global_step": 18751, "epoch": 446} {"train_loss": -5.317607402801514, "global_step": 18752, "epoch": 446} {"train_loss": -5.243252754211426, "global_step": 18753, "epoch": 446} {"train_loss": -5.241631031036377, "global_step": 18754, "epoch": 446} {"train_loss": -5.285655975341797, "global_step": 18755, "epoch": 446} {"train_loss": -5.3009138107299805, "global_step": 18756, "epoch": 446} {"train_loss": -5.342474937438965, "global_step": 18757, "epoch": 446} {"train_loss": -5.377813339233398, "global_step": 18758, "epoch": 446} {"train_loss": -5.110320091247559, "global_step": 18759, "epoch": 446} {"train_loss": -5.156562805175781, "global_step": 18760, "epoch": 446} {"train_loss": -5.3632707595825195, "global_step": 18761, "epoch": 446} {"train_loss": -5.462989807128906, "global_step": 18762, "epoch": 446} {"train_loss": -5.076607704162598, "global_step": 18763, "epoch": 446} {"train_loss": -5.130337715148926, "global_step": 18764, "epoch": 446} {"train_loss": -5.152671813964844, "global_step": 18765, "epoch": 446} {"train_loss": -5.063885688781738, "global_step": 18766, "epoch": 446} {"train_loss": -5.153236389160156, "global_step": 18767, "epoch": 446} {"train_loss": -5.206295013427734, "global_step": 18768, "epoch": 446} {"train_loss": -5.12531852722168, "global_step": 18769, "epoch": 446} {"train_loss": -5.103701591491699, "global_step": 18770, "epoch": 446} {"train_loss": -5.249146461486816, "global_step": 18771, "epoch": 446} {"train_loss": -5.322758674621582, "global_step": 18772, "epoch": 446} {"train_loss": -5.257293349220639, "global_step": 18773, "epoch": 446, "val_loss": 69060.7578125} {"train_loss": -5.3463287353515625, "global_step": 18774, "epoch": 447} {"train_loss": -5.122095108032227, "global_step": 18775, "epoch": 447} {"train_loss": -5.097832202911377, "global_step": 18776, "epoch": 447} {"train_loss": -5.252981185913086, "global_step": 18777, "epoch": 447} {"train_loss": -5.163110733032227, "global_step": 18778, "epoch": 447} {"train_loss": -5.323731422424316, "global_step": 18779, "epoch": 447} {"train_loss": -5.219088554382324, "global_step": 18780, "epoch": 447} {"train_loss": -5.163585662841797, "global_step": 18781, "epoch": 447} {"train_loss": -5.2094316482543945, "global_step": 18782, "epoch": 447} {"train_loss": -5.1842522621154785, "global_step": 18783, "epoch": 447} {"train_loss": -5.310390949249268, "global_step": 18784, "epoch": 447} {"train_loss": -5.169210910797119, "global_step": 18785, "epoch": 447} {"train_loss": -5.247692108154297, "global_step": 18786, "epoch": 447} {"train_loss": -5.2339768409729, "global_step": 18787, "epoch": 447} {"train_loss": -5.434145927429199, "global_step": 18788, "epoch": 447} {"train_loss": -5.167859077453613, "global_step": 18789, "epoch": 447} {"train_loss": -5.333240985870361, "global_step": 18790, "epoch": 447} {"train_loss": -5.220495223999023, "global_step": 18791, "epoch": 447} {"train_loss": -5.2588653564453125, "global_step": 18792, "epoch": 447} {"train_loss": -5.363217353820801, "global_step": 18793, "epoch": 447} {"train_loss": -5.354896545410156, "global_step": 18794, "epoch": 447} {"train_loss": -5.372183799743652, "global_step": 18795, "epoch": 447} {"train_loss": -5.175697326660156, "global_step": 18796, "epoch": 447} {"train_loss": -5.427832126617432, "global_step": 18797, "epoch": 447} {"train_loss": -5.321409225463867, "global_step": 18798, "epoch": 447} {"train_loss": -5.260699272155762, "global_step": 18799, "epoch": 447} {"train_loss": -5.458486557006836, "global_step": 18800, "epoch": 447} {"train_loss": -5.4540910720825195, "global_step": 18801, "epoch": 447} {"train_loss": -5.2748188972473145, "global_step": 18802, "epoch": 447} {"train_loss": -5.194674491882324, "global_step": 18803, "epoch": 447} {"train_loss": -5.315512657165527, "global_step": 18804, "epoch": 447} {"train_loss": -5.196565628051758, "global_step": 18805, "epoch": 447} {"train_loss": -5.320615768432617, "global_step": 18806, "epoch": 447} {"train_loss": -5.161004066467285, "global_step": 18807, "epoch": 447} {"train_loss": -5.355795860290527, "global_step": 18808, "epoch": 447} {"train_loss": -5.23748779296875, "global_step": 18809, "epoch": 447} {"train_loss": -5.294917106628418, "global_step": 18810, "epoch": 447} {"train_loss": -5.247254371643066, "global_step": 18811, "epoch": 447} {"train_loss": -5.357964515686035, "global_step": 18812, "epoch": 447} {"train_loss": -5.172424793243408, "global_step": 18813, "epoch": 447} {"train_loss": -5.451506614685059, "global_step": 18814, "epoch": 447} {"train_loss": -5.275019293739682, "global_step": 18815, "epoch": 447, "val_loss": 69067.1015625} {"train_loss": -5.273622512817383, "global_step": 18816, "epoch": 448} {"train_loss": -5.2632737159729, "global_step": 18817, "epoch": 448} {"train_loss": -5.194477558135986, "global_step": 18818, "epoch": 448} {"train_loss": -5.307921886444092, "global_step": 18819, "epoch": 448} {"train_loss": -5.239771366119385, "global_step": 18820, "epoch": 448} {"train_loss": -5.1885271072387695, "global_step": 18821, "epoch": 448} {"train_loss": -5.316600322723389, "global_step": 18822, "epoch": 448} {"train_loss": -5.296962738037109, "global_step": 18823, "epoch": 448} {"train_loss": -5.155450344085693, "global_step": 18824, "epoch": 448} {"train_loss": -5.491635322570801, "global_step": 18825, "epoch": 448} {"train_loss": -5.28371524810791, "global_step": 18826, "epoch": 448} {"train_loss": -5.376626491546631, "global_step": 18827, "epoch": 448} {"train_loss": -5.322950839996338, "global_step": 18828, "epoch": 448} {"train_loss": -5.208695411682129, "global_step": 18829, "epoch": 448} {"train_loss": -5.329298973083496, "global_step": 18830, "epoch": 448} {"train_loss": -5.306870460510254, "global_step": 18831, "epoch": 448} {"train_loss": -5.288705825805664, "global_step": 18832, "epoch": 448} {"train_loss": -5.266951560974121, "global_step": 18833, "epoch": 448} {"train_loss": -5.294987678527832, "global_step": 18834, "epoch": 448} {"train_loss": -5.282451152801514, "global_step": 18835, "epoch": 448} {"train_loss": -5.1904683113098145, "global_step": 18836, "epoch": 448} {"train_loss": -5.358684062957764, "global_step": 18837, "epoch": 448} {"train_loss": -5.232623100280762, "global_step": 18838, "epoch": 448} {"train_loss": -5.215244770050049, "global_step": 18839, "epoch": 448} {"train_loss": -5.315515518188477, "global_step": 18840, "epoch": 448} {"train_loss": -5.163087844848633, "global_step": 18841, "epoch": 448} {"train_loss": -5.23020076751709, "global_step": 18842, "epoch": 448} {"train_loss": -5.311709403991699, "global_step": 18843, "epoch": 448} {"train_loss": -5.3366193771362305, "global_step": 18844, "epoch": 448} {"train_loss": -5.244101524353027, "global_step": 18845, "epoch": 448} {"train_loss": -5.1653056144714355, "global_step": 18846, "epoch": 448} {"train_loss": -5.150433540344238, "global_step": 18847, "epoch": 448} {"train_loss": -5.360472202301025, "global_step": 18848, "epoch": 448} {"train_loss": -5.3104047775268555, "global_step": 18849, "epoch": 448} {"train_loss": -5.335508346557617, "global_step": 18850, "epoch": 448} {"train_loss": -5.409422874450684, "global_step": 18851, "epoch": 448} {"train_loss": -5.293367862701416, "global_step": 18852, "epoch": 448} {"train_loss": -5.2871222496032715, "global_step": 18853, "epoch": 448} {"train_loss": -5.372217655181885, "global_step": 18854, "epoch": 448} {"train_loss": -5.2824907302856445, "global_step": 18855, "epoch": 448} {"train_loss": -5.143364906311035, "global_step": 18856, "epoch": 448} {"train_loss": -5.276418038776943, "global_step": 18857, "epoch": 448, "val_loss": 69499.0390625} {"train_loss": -5.189305305480957, "global_step": 18858, "epoch": 449} {"train_loss": -5.402092456817627, "global_step": 18859, "epoch": 449} {"train_loss": -5.4318437576293945, "global_step": 18860, "epoch": 449} {"train_loss": -5.228352069854736, "global_step": 18861, "epoch": 449} {"train_loss": -5.419769287109375, "global_step": 18862, "epoch": 449} {"train_loss": -5.234368801116943, "global_step": 18863, "epoch": 449} {"train_loss": -5.236575126647949, "global_step": 18864, "epoch": 449} {"train_loss": -5.380224704742432, "global_step": 18865, "epoch": 449} {"train_loss": -5.234157085418701, "global_step": 18866, "epoch": 449} {"train_loss": -5.290271759033203, "global_step": 18867, "epoch": 449} {"train_loss": -5.303348064422607, "global_step": 18868, "epoch": 449} {"train_loss": -5.290698528289795, "global_step": 18869, "epoch": 449} {"train_loss": -5.365410804748535, "global_step": 18870, "epoch": 449} {"train_loss": -5.288446426391602, "global_step": 18871, "epoch": 449} {"train_loss": -5.22951602935791, "global_step": 18872, "epoch": 449} {"train_loss": -5.3690643310546875, "global_step": 18873, "epoch": 449} {"train_loss": -5.123701095581055, "global_step": 18874, "epoch": 449} {"train_loss": -5.287518501281738, "global_step": 18875, "epoch": 449} {"train_loss": -5.272172927856445, "global_step": 18876, "epoch": 449} {"train_loss": -5.335634708404541, "global_step": 18877, "epoch": 449} {"train_loss": -5.246550559997559, "global_step": 18878, "epoch": 449} {"train_loss": -5.212235450744629, "global_step": 18879, "epoch": 449} {"train_loss": -5.323193550109863, "global_step": 18880, "epoch": 449} {"train_loss": -5.210330963134766, "global_step": 18881, "epoch": 449} {"train_loss": -5.254186153411865, "global_step": 18882, "epoch": 449} {"train_loss": -5.348278999328613, "global_step": 18883, "epoch": 449} {"train_loss": -5.469334602355957, "global_step": 18884, "epoch": 449} {"train_loss": -5.263122081756592, "global_step": 18885, "epoch": 449} {"train_loss": -5.3180413246154785, "global_step": 18886, "epoch": 449} {"train_loss": -5.262706756591797, "global_step": 18887, "epoch": 449} {"train_loss": -5.383782386779785, "global_step": 18888, "epoch": 449} {"train_loss": -5.319531440734863, "global_step": 18889, "epoch": 449} {"train_loss": -5.210641860961914, "global_step": 18890, "epoch": 449} {"train_loss": -5.2615742683410645, "global_step": 18891, "epoch": 449} {"train_loss": -5.165078163146973, "global_step": 18892, "epoch": 449} {"train_loss": -5.3290557861328125, "global_step": 18893, "epoch": 449} {"train_loss": -5.364079475402832, "global_step": 18894, "epoch": 449} {"train_loss": -5.265995979309082, "global_step": 18895, "epoch": 449} {"train_loss": -5.265286922454834, "global_step": 18896, "epoch": 449} {"train_loss": -5.323554039001465, "global_step": 18897, "epoch": 449} {"train_loss": -5.374587059020996, "global_step": 18898, "epoch": 449} {"train_loss": -5.292204516274588, "global_step": 18899, "epoch": 449, "val_loss": 69385.078125} {"train_loss": -5.285675048828125, "global_step": 18900, "epoch": 450} {"train_loss": -5.236198425292969, "global_step": 18901, "epoch": 450} {"train_loss": -5.337803840637207, "global_step": 18902, "epoch": 450} {"train_loss": -5.4201250076293945, "global_step": 18903, "epoch": 450} {"train_loss": -5.266469478607178, "global_step": 18904, "epoch": 450} {"train_loss": -5.30434513092041, "global_step": 18905, "epoch": 450} {"train_loss": -5.367900371551514, "global_step": 18906, "epoch": 450} {"train_loss": -5.236093044281006, "global_step": 18907, "epoch": 450} {"train_loss": -5.162450313568115, "global_step": 18908, "epoch": 450} {"train_loss": -5.174027442932129, "global_step": 18909, "epoch": 450} {"train_loss": -5.203205108642578, "global_step": 18910, "epoch": 450} {"train_loss": -5.287424564361572, "global_step": 18911, "epoch": 450} {"train_loss": -5.148857593536377, "global_step": 18912, "epoch": 450} {"train_loss": -5.424430847167969, "global_step": 18913, "epoch": 450} {"train_loss": -5.196298599243164, "global_step": 18914, "epoch": 450} {"train_loss": -5.26285457611084, "global_step": 18915, "epoch": 450} {"train_loss": -5.3811140060424805, "global_step": 18916, "epoch": 450} {"train_loss": -5.281830310821533, "global_step": 18917, "epoch": 450} {"train_loss": -5.293593406677246, "global_step": 18918, "epoch": 450} {"train_loss": -5.168677806854248, "global_step": 18919, "epoch": 450} {"train_loss": -5.22864294052124, "global_step": 18920, "epoch": 450} {"train_loss": -5.378229141235352, "global_step": 18921, "epoch": 450} {"train_loss": -5.202005386352539, "global_step": 18922, "epoch": 450} {"train_loss": -5.307647705078125, "global_step": 18923, "epoch": 450} {"train_loss": -5.311257839202881, "global_step": 18924, "epoch": 450} {"train_loss": -5.381346702575684, "global_step": 18925, "epoch": 450} {"train_loss": -5.321146011352539, "global_step": 18926, "epoch": 450} {"train_loss": -5.425909042358398, "global_step": 18927, "epoch": 450} {"train_loss": -5.296656131744385, "global_step": 18928, "epoch": 450} {"train_loss": -5.359763145446777, "global_step": 18929, "epoch": 450} {"train_loss": -5.264081001281738, "global_step": 18930, "epoch": 450} {"train_loss": -5.299844264984131, "global_step": 18931, "epoch": 450} {"train_loss": -5.256411075592041, "global_step": 18932, "epoch": 450} {"train_loss": -5.344418525695801, "global_step": 18933, "epoch": 450} {"train_loss": -5.236869812011719, "global_step": 18934, "epoch": 450} {"train_loss": -5.344078063964844, "global_step": 18935, "epoch": 450} {"train_loss": -5.438211441040039, "global_step": 18936, "epoch": 450} {"train_loss": -5.393563270568848, "global_step": 18937, "epoch": 450} {"train_loss": -5.373044967651367, "global_step": 18938, "epoch": 450} {"train_loss": -5.239212512969971, "global_step": 18939, "epoch": 450} {"train_loss": -5.2628092765808105, "global_step": 18940, "epoch": 450} {"train_loss": -5.2950916063217885, "global_step": 18941, "epoch": 450, "train/sim_max_reward_0": 0.22623842806540242, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.09410349400649934, "train/sim_max_reward_4": 0.42104104779071233, "train/sim_max_reward_5": 0.5189598608851955, "test/sim_max_reward_4400000": 0.3565199273093855, "test/sim_max_reward_4400001": 0.2410126669463773, "test/sim_max_reward_4400002": 0.5593260789379622, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.18150710456374688, "test/sim_max_reward_4400005": 0.1864693632485471, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.8218511693005641, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.30478284743347545, "test/sim_max_reward_4400013": 0.4349476267498327, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1669743825892275, "test/sim_max_reward_4400018": 0.7928370597051039, "test/sim_max_reward_4400019": 0.7265122179340051, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.05973640412310143, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.26206647880502426, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.21083518127273346, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 0.2554018483909894, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.10750247979342091, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.3553694715663705, "test/sim_max_reward_4400036": 0.6835398511851445, "test/sim_max_reward_4400037": 0.26199803197188126, "test/sim_max_reward_4400038": 0.5566855655021231, "test/sim_max_reward_4400039": 0.502486823006607, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.3473317619859971, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.0, "test/sim_max_reward_4400045": 0.20829660720626256, "test/sim_max_reward_4400046": 0.19218025367224437, "test/sim_max_reward_4400047": 0.14149911602495555, "test/sim_max_reward_4400048": 0.3547404114813681, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.21016971866160147, "test/mean_score": 0.20696307687306206, "val_loss": 69760.9609375} {"train_loss": -5.205596923828125, "global_step": 18942, "epoch": 451} {"train_loss": -5.279038906097412, "global_step": 18943, "epoch": 451} {"train_loss": -5.330867767333984, "global_step": 18944, "epoch": 451} {"train_loss": -5.234052658081055, "global_step": 18945, "epoch": 451} {"train_loss": -5.336124420166016, "global_step": 18946, "epoch": 451} {"train_loss": -5.315374851226807, "global_step": 18947, "epoch": 451} {"train_loss": -5.388707160949707, "global_step": 18948, "epoch": 451} {"train_loss": -5.223731994628906, "global_step": 18949, "epoch": 451} {"train_loss": -5.2728681564331055, "global_step": 18950, "epoch": 451} {"train_loss": -5.195021629333496, "global_step": 18951, "epoch": 451} {"train_loss": -5.359353065490723, "global_step": 18952, "epoch": 451} {"train_loss": -5.270908832550049, "global_step": 18953, "epoch": 451} {"train_loss": -5.3427734375, "global_step": 18954, "epoch": 451} {"train_loss": -5.337810516357422, "global_step": 18955, "epoch": 451} {"train_loss": -5.367932319641113, "global_step": 18956, "epoch": 451} {"train_loss": -5.403298377990723, "global_step": 18957, "epoch": 451} {"train_loss": -5.395620346069336, "global_step": 18958, "epoch": 451} {"train_loss": -5.280074119567871, "global_step": 18959, "epoch": 451} {"train_loss": -5.330250263214111, "global_step": 18960, "epoch": 451} {"train_loss": -5.330898284912109, "global_step": 18961, "epoch": 451} {"train_loss": -5.33095645904541, "global_step": 18962, "epoch": 451} {"train_loss": -5.270169258117676, "global_step": 18963, "epoch": 451} {"train_loss": -5.241250991821289, "global_step": 18964, "epoch": 451} {"train_loss": -5.305538177490234, "global_step": 18965, "epoch": 451} {"train_loss": -5.413735389709473, "global_step": 18966, "epoch": 451} {"train_loss": -5.348007678985596, "global_step": 18967, "epoch": 451} {"train_loss": -5.411794662475586, "global_step": 18968, "epoch": 451} {"train_loss": -5.276119232177734, "global_step": 18969, "epoch": 451} {"train_loss": -5.223118782043457, "global_step": 18970, "epoch": 451} {"train_loss": -5.274327278137207, "global_step": 18971, "epoch": 451} {"train_loss": -5.247719764709473, "global_step": 18972, "epoch": 451} {"train_loss": -5.19350528717041, "global_step": 18973, "epoch": 451} {"train_loss": -5.140574932098389, "global_step": 18974, "epoch": 451} {"train_loss": -5.076749324798584, "global_step": 18975, "epoch": 451} {"train_loss": -5.415467262268066, "global_step": 18976, "epoch": 451} {"train_loss": -5.041287422180176, "global_step": 18977, "epoch": 451} {"train_loss": -5.222821235656738, "global_step": 18978, "epoch": 451} {"train_loss": -5.253145217895508, "global_step": 18979, "epoch": 451} {"train_loss": -5.369376182556152, "global_step": 18980, "epoch": 451} {"train_loss": -5.217971324920654, "global_step": 18981, "epoch": 451} {"train_loss": -5.356280326843262, "global_step": 18982, "epoch": 451} {"train_loss": -5.286273309162685, "global_step": 18983, "epoch": 451, "val_loss": 70118.3515625} {"train_loss": -5.352299690246582, "global_step": 18984, "epoch": 452} {"train_loss": -5.319110870361328, "global_step": 18985, "epoch": 452} {"train_loss": -5.177607536315918, "global_step": 18986, "epoch": 452} {"train_loss": -5.379786491394043, "global_step": 18987, "epoch": 452} {"train_loss": -5.150697708129883, "global_step": 18988, "epoch": 452} {"train_loss": -5.21217679977417, "global_step": 18989, "epoch": 452} {"train_loss": -5.417012691497803, "global_step": 18990, "epoch": 452} {"train_loss": -5.137872695922852, "global_step": 18991, "epoch": 452} {"train_loss": -5.099442005157471, "global_step": 18992, "epoch": 452} {"train_loss": -5.20879602432251, "global_step": 18993, "epoch": 452} {"train_loss": -5.217926025390625, "global_step": 18994, "epoch": 452} {"train_loss": -5.2458648681640625, "global_step": 18995, "epoch": 452} {"train_loss": -5.245760917663574, "global_step": 18996, "epoch": 452} {"train_loss": -5.260049819946289, "global_step": 18997, "epoch": 452} {"train_loss": -5.278892517089844, "global_step": 18998, "epoch": 452} {"train_loss": -5.036447525024414, "global_step": 18999, "epoch": 452} {"train_loss": -5.363727569580078, "global_step": 19000, "epoch": 452} {"train_loss": -5.316418647766113, "global_step": 19001, "epoch": 452} {"train_loss": -5.2128801345825195, "global_step": 19002, "epoch": 452} {"train_loss": -5.346092224121094, "global_step": 19003, "epoch": 452} {"train_loss": -5.281137466430664, "global_step": 19004, "epoch": 452} {"train_loss": -5.17619514465332, "global_step": 19005, "epoch": 452} {"train_loss": -5.248834133148193, "global_step": 19006, "epoch": 452} {"train_loss": -5.301032066345215, "global_step": 19007, "epoch": 452} {"train_loss": -5.248730659484863, "global_step": 19008, "epoch": 452} {"train_loss": -5.330740928649902, "global_step": 19009, "epoch": 452} {"train_loss": -5.284484386444092, "global_step": 19010, "epoch": 452} {"train_loss": -5.079977512359619, "global_step": 19011, "epoch": 452} {"train_loss": -5.235294818878174, "global_step": 19012, "epoch": 452} {"train_loss": -5.2782673835754395, "global_step": 19013, "epoch": 452} {"train_loss": -5.286319732666016, "global_step": 19014, "epoch": 452} {"train_loss": -5.189840316772461, "global_step": 19015, "epoch": 452} {"train_loss": -5.334501266479492, "global_step": 19016, "epoch": 452} {"train_loss": -5.235943794250488, "global_step": 19017, "epoch": 452} {"train_loss": -5.376955986022949, "global_step": 19018, "epoch": 452} {"train_loss": -5.269697189331055, "global_step": 19019, "epoch": 452} {"train_loss": -5.1473565101623535, "global_step": 19020, "epoch": 452} {"train_loss": -5.311961650848389, "global_step": 19021, "epoch": 452} {"train_loss": -5.252025127410889, "global_step": 19022, "epoch": 452} {"train_loss": -5.224809646606445, "global_step": 19023, "epoch": 452} {"train_loss": -5.339340686798096, "global_step": 19024, "epoch": 452} {"train_loss": -5.255099875586374, "global_step": 19025, "epoch": 452, "val_loss": 69905.0859375} {"train_loss": -5.293608665466309, "global_step": 19026, "epoch": 453} {"train_loss": -5.166418075561523, "global_step": 19027, "epoch": 453} {"train_loss": -5.382966041564941, "global_step": 19028, "epoch": 453} {"train_loss": -5.290680885314941, "global_step": 19029, "epoch": 453} {"train_loss": -5.382824897766113, "global_step": 19030, "epoch": 453} {"train_loss": -5.162740707397461, "global_step": 19031, "epoch": 453} {"train_loss": -5.257676601409912, "global_step": 19032, "epoch": 453} {"train_loss": -5.289653778076172, "global_step": 19033, "epoch": 453} {"train_loss": -5.310079574584961, "global_step": 19034, "epoch": 453} {"train_loss": -5.210940837860107, "global_step": 19035, "epoch": 453} {"train_loss": -5.33939266204834, "global_step": 19036, "epoch": 453} {"train_loss": -5.349175453186035, "global_step": 19037, "epoch": 453} {"train_loss": -5.276984214782715, "global_step": 19038, "epoch": 453} {"train_loss": -5.314889907836914, "global_step": 19039, "epoch": 453} {"train_loss": -5.294224262237549, "global_step": 19040, "epoch": 453} {"train_loss": -5.200625896453857, "global_step": 19041, "epoch": 453} {"train_loss": -5.28381872177124, "global_step": 19042, "epoch": 453} {"train_loss": -5.315734386444092, "global_step": 19043, "epoch": 453} {"train_loss": -5.357177257537842, "global_step": 19044, "epoch": 453} {"train_loss": -5.320397853851318, "global_step": 19045, "epoch": 453} {"train_loss": -5.411742687225342, "global_step": 19046, "epoch": 453} {"train_loss": -5.0712385177612305, "global_step": 19047, "epoch": 453} {"train_loss": -5.341940879821777, "global_step": 19048, "epoch": 453} {"train_loss": -5.36276388168335, "global_step": 19049, "epoch": 453} {"train_loss": -5.183012008666992, "global_step": 19050, "epoch": 453} {"train_loss": -5.431086540222168, "global_step": 19051, "epoch": 453} {"train_loss": -5.332099914550781, "global_step": 19052, "epoch": 453} {"train_loss": -5.206517219543457, "global_step": 19053, "epoch": 453} {"train_loss": -5.3436689376831055, "global_step": 19054, "epoch": 453} {"train_loss": -5.286060333251953, "global_step": 19055, "epoch": 453} {"train_loss": -5.3916168212890625, "global_step": 19056, "epoch": 453} {"train_loss": -5.353425979614258, "global_step": 19057, "epoch": 453} {"train_loss": -5.368823051452637, "global_step": 19058, "epoch": 453} {"train_loss": -5.241121292114258, "global_step": 19059, "epoch": 453} {"train_loss": -5.3456315994262695, "global_step": 19060, "epoch": 453} {"train_loss": -5.3201446533203125, "global_step": 19061, "epoch": 453} {"train_loss": -5.328494548797607, "global_step": 19062, "epoch": 453} {"train_loss": -5.334413051605225, "global_step": 19063, "epoch": 453} {"train_loss": -5.36370849609375, "global_step": 19064, "epoch": 453} {"train_loss": -5.255269527435303, "global_step": 19065, "epoch": 453} {"train_loss": -5.231571197509766, "global_step": 19066, "epoch": 453} {"train_loss": -5.299826746895199, "global_step": 19067, "epoch": 453, "val_loss": 69066.7265625} {"train_loss": -5.444858551025391, "global_step": 19068, "epoch": 454} {"train_loss": -5.361346244812012, "global_step": 19069, "epoch": 454} {"train_loss": -5.211699962615967, "global_step": 19070, "epoch": 454} {"train_loss": -5.367384910583496, "global_step": 19071, "epoch": 454} {"train_loss": -5.2221269607543945, "global_step": 19072, "epoch": 454} {"train_loss": -5.293210029602051, "global_step": 19073, "epoch": 454} {"train_loss": -5.29746675491333, "global_step": 19074, "epoch": 454} {"train_loss": -5.3845720291137695, "global_step": 19075, "epoch": 454} {"train_loss": -5.389989852905273, "global_step": 19076, "epoch": 454} {"train_loss": -5.228636264801025, "global_step": 19077, "epoch": 454} {"train_loss": -5.342331886291504, "global_step": 19078, "epoch": 454} {"train_loss": -5.222370147705078, "global_step": 19079, "epoch": 454} {"train_loss": -5.315331935882568, "global_step": 19080, "epoch": 454} {"train_loss": -5.331795692443848, "global_step": 19081, "epoch": 454} {"train_loss": -5.273307800292969, "global_step": 19082, "epoch": 454} {"train_loss": -5.318262100219727, "global_step": 19083, "epoch": 454} {"train_loss": -5.311452865600586, "global_step": 19084, "epoch": 454} {"train_loss": -5.423948287963867, "global_step": 19085, "epoch": 454} {"train_loss": -5.170948505401611, "global_step": 19086, "epoch": 454} {"train_loss": -5.352966785430908, "global_step": 19087, "epoch": 454} {"train_loss": -5.288739204406738, "global_step": 19088, "epoch": 454} {"train_loss": -5.196925163269043, "global_step": 19089, "epoch": 454} {"train_loss": -5.298354148864746, "global_step": 19090, "epoch": 454} {"train_loss": -5.284651756286621, "global_step": 19091, "epoch": 454} {"train_loss": -5.299628257751465, "global_step": 19092, "epoch": 454} {"train_loss": -5.4233174324035645, "global_step": 19093, "epoch": 454} {"train_loss": -5.065643310546875, "global_step": 19094, "epoch": 454} {"train_loss": -5.294939994812012, "global_step": 19095, "epoch": 454} {"train_loss": -5.341002464294434, "global_step": 19096, "epoch": 454} {"train_loss": -5.2666778564453125, "global_step": 19097, "epoch": 454} {"train_loss": -5.359378814697266, "global_step": 19098, "epoch": 454} {"train_loss": -5.414959907531738, "global_step": 19099, "epoch": 454} {"train_loss": -5.440657615661621, "global_step": 19100, "epoch": 454} {"train_loss": -5.381529331207275, "global_step": 19101, "epoch": 454} {"train_loss": -5.212954998016357, "global_step": 19102, "epoch": 454} {"train_loss": -5.252397060394287, "global_step": 19103, "epoch": 454} {"train_loss": -5.38240909576416, "global_step": 19104, "epoch": 454} {"train_loss": -5.2645087242126465, "global_step": 19105, "epoch": 454} {"train_loss": -5.222995758056641, "global_step": 19106, "epoch": 454} {"train_loss": -5.333683013916016, "global_step": 19107, "epoch": 454} {"train_loss": -5.46521520614624, "global_step": 19108, "epoch": 454} {"train_loss": -5.3104831491197855, "global_step": 19109, "epoch": 454, "val_loss": 69236.3984375} {"train_loss": -5.353801727294922, "global_step": 19110, "epoch": 455} {"train_loss": -5.18927001953125, "global_step": 19111, "epoch": 455} {"train_loss": -5.399736404418945, "global_step": 19112, "epoch": 455} {"train_loss": -5.229969024658203, "global_step": 19113, "epoch": 455} {"train_loss": -5.359179496765137, "global_step": 19114, "epoch": 455} {"train_loss": -5.203564643859863, "global_step": 19115, "epoch": 455} {"train_loss": -5.161581039428711, "global_step": 19116, "epoch": 455} {"train_loss": -5.400063514709473, "global_step": 19117, "epoch": 455} {"train_loss": -5.263772964477539, "global_step": 19118, "epoch": 455} {"train_loss": -5.254184722900391, "global_step": 19119, "epoch": 455} {"train_loss": -5.429548263549805, "global_step": 19120, "epoch": 455} {"train_loss": -5.181769371032715, "global_step": 19121, "epoch": 455} {"train_loss": -5.433888912200928, "global_step": 19122, "epoch": 455} {"train_loss": -5.290065765380859, "global_step": 19123, "epoch": 455} {"train_loss": -5.330081939697266, "global_step": 19124, "epoch": 455} {"train_loss": -5.474145412445068, "global_step": 19125, "epoch": 455} {"train_loss": -5.3534417152404785, "global_step": 19126, "epoch": 455} {"train_loss": -5.2354326248168945, "global_step": 19127, "epoch": 455} {"train_loss": -5.192522048950195, "global_step": 19128, "epoch": 455} {"train_loss": -5.288422107696533, "global_step": 19129, "epoch": 455} {"train_loss": -5.380817890167236, "global_step": 19130, "epoch": 455} {"train_loss": -5.2362565994262695, "global_step": 19131, "epoch": 455} {"train_loss": -5.271785736083984, "global_step": 19132, "epoch": 455} {"train_loss": -5.274883270263672, "global_step": 19133, "epoch": 455} {"train_loss": -5.261596202850342, "global_step": 19134, "epoch": 455} {"train_loss": -5.382761001586914, "global_step": 19135, "epoch": 455} {"train_loss": -5.286710739135742, "global_step": 19136, "epoch": 455} {"train_loss": -5.4059157371521, "global_step": 19137, "epoch": 455} {"train_loss": -5.384995937347412, "global_step": 19138, "epoch": 455} {"train_loss": -5.421219825744629, "global_step": 19139, "epoch": 455} {"train_loss": -5.204624176025391, "global_step": 19140, "epoch": 455} {"train_loss": -5.346726417541504, "global_step": 19141, "epoch": 455} {"train_loss": -5.421896934509277, "global_step": 19142, "epoch": 455} {"train_loss": -5.285853385925293, "global_step": 19143, "epoch": 455} {"train_loss": -5.382685661315918, "global_step": 19144, "epoch": 455} {"train_loss": -5.323006629943848, "global_step": 19145, "epoch": 455} {"train_loss": -5.271988868713379, "global_step": 19146, "epoch": 455} {"train_loss": -5.413694381713867, "global_step": 19147, "epoch": 455} {"train_loss": -5.203849792480469, "global_step": 19148, "epoch": 455} {"train_loss": -5.394338130950928, "global_step": 19149, "epoch": 455} {"train_loss": -5.239145278930664, "global_step": 19150, "epoch": 455} {"train_loss": -5.309128216334751, "global_step": 19151, "epoch": 455, "val_loss": 70013.140625} {"train_loss": -5.256028175354004, "global_step": 19152, "epoch": 456} {"train_loss": -5.241145133972168, "global_step": 19153, "epoch": 456} {"train_loss": -5.283568859100342, "global_step": 19154, "epoch": 456} {"train_loss": -5.210580348968506, "global_step": 19155, "epoch": 456} {"train_loss": -5.3610029220581055, "global_step": 19156, "epoch": 456} {"train_loss": -5.314920425415039, "global_step": 19157, "epoch": 456} {"train_loss": -5.13466215133667, "global_step": 19158, "epoch": 456} {"train_loss": -5.2671661376953125, "global_step": 19159, "epoch": 456} {"train_loss": -5.241934299468994, "global_step": 19160, "epoch": 456} {"train_loss": -5.400345802307129, "global_step": 19161, "epoch": 456} {"train_loss": -5.355368614196777, "global_step": 19162, "epoch": 456} {"train_loss": -5.323151588439941, "global_step": 19163, "epoch": 456} {"train_loss": -5.415552139282227, "global_step": 19164, "epoch": 456} {"train_loss": -5.213757038116455, "global_step": 19165, "epoch": 456} {"train_loss": -5.319814682006836, "global_step": 19166, "epoch": 456} {"train_loss": -5.235889911651611, "global_step": 19167, "epoch": 456} {"train_loss": -5.315615653991699, "global_step": 19168, "epoch": 456} {"train_loss": -5.1802568435668945, "global_step": 19169, "epoch": 456} {"train_loss": -5.3954644203186035, "global_step": 19170, "epoch": 456} {"train_loss": -5.306277275085449, "global_step": 19171, "epoch": 456} {"train_loss": -5.338656425476074, "global_step": 19172, "epoch": 456} {"train_loss": -5.375441551208496, "global_step": 19173, "epoch": 456} {"train_loss": -5.399953365325928, "global_step": 19174, "epoch": 456} {"train_loss": -5.339685440063477, "global_step": 19175, "epoch": 456} {"train_loss": -5.351700305938721, "global_step": 19176, "epoch": 456} {"train_loss": -5.28963565826416, "global_step": 19177, "epoch": 456} {"train_loss": -5.353192329406738, "global_step": 19178, "epoch": 456} {"train_loss": -5.232780456542969, "global_step": 19179, "epoch": 456} {"train_loss": -5.241393089294434, "global_step": 19180, "epoch": 456} {"train_loss": -5.206813812255859, "global_step": 19181, "epoch": 456} {"train_loss": -5.335605621337891, "global_step": 19182, "epoch": 456} {"train_loss": -5.295701026916504, "global_step": 19183, "epoch": 456} {"train_loss": -5.347379684448242, "global_step": 19184, "epoch": 456} {"train_loss": -5.288453102111816, "global_step": 19185, "epoch": 456} {"train_loss": -5.29168701171875, "global_step": 19186, "epoch": 456} {"train_loss": -5.35189151763916, "global_step": 19187, "epoch": 456} {"train_loss": -5.324069499969482, "global_step": 19188, "epoch": 456} {"train_loss": -5.182926177978516, "global_step": 19189, "epoch": 456} {"train_loss": -5.2465434074401855, "global_step": 19190, "epoch": 456} {"train_loss": -5.28028678894043, "global_step": 19191, "epoch": 456} {"train_loss": -5.273016452789307, "global_step": 19192, "epoch": 456} {"train_loss": -5.2945635205223445, "global_step": 19193, "epoch": 456, "val_loss": 68819.875} {"train_loss": -5.379815578460693, "global_step": 19194, "epoch": 457} {"train_loss": -5.316835403442383, "global_step": 19195, "epoch": 457} {"train_loss": -5.406105995178223, "global_step": 19196, "epoch": 457} {"train_loss": -5.284779071807861, "global_step": 19197, "epoch": 457} {"train_loss": -5.2033843994140625, "global_step": 19198, "epoch": 457} {"train_loss": -5.22303581237793, "global_step": 19199, "epoch": 457} {"train_loss": -5.279494762420654, "global_step": 19200, "epoch": 457} {"train_loss": -5.355341911315918, "global_step": 19201, "epoch": 457} {"train_loss": -5.108086585998535, "global_step": 19202, "epoch": 457} {"train_loss": -5.045578956604004, "global_step": 19203, "epoch": 457} {"train_loss": -5.350862503051758, "global_step": 19204, "epoch": 457} {"train_loss": -5.273745536804199, "global_step": 19205, "epoch": 457} {"train_loss": -5.304170608520508, "global_step": 19206, "epoch": 457} {"train_loss": -5.3386688232421875, "global_step": 19207, "epoch": 457} {"train_loss": -5.1196064949035645, "global_step": 19208, "epoch": 457} {"train_loss": -5.187283992767334, "global_step": 19209, "epoch": 457} {"train_loss": -5.247725486755371, "global_step": 19210, "epoch": 457} {"train_loss": -5.177723407745361, "global_step": 19211, "epoch": 457} {"train_loss": -5.375308036804199, "global_step": 19212, "epoch": 457} {"train_loss": -5.364192008972168, "global_step": 19213, "epoch": 457} {"train_loss": -5.236454963684082, "global_step": 19214, "epoch": 457} {"train_loss": -5.330072402954102, "global_step": 19215, "epoch": 457} {"train_loss": -5.291387557983398, "global_step": 19216, "epoch": 457} {"train_loss": -5.232661247253418, "global_step": 19217, "epoch": 457} {"train_loss": -5.105353355407715, "global_step": 19218, "epoch": 457} {"train_loss": -5.315765380859375, "global_step": 19219, "epoch": 457} {"train_loss": -5.31003475189209, "global_step": 19220, "epoch": 457} {"train_loss": -5.24564266204834, "global_step": 19221, "epoch": 457} {"train_loss": -5.344386577606201, "global_step": 19222, "epoch": 457} {"train_loss": -5.282886028289795, "global_step": 19223, "epoch": 457} {"train_loss": -5.353862285614014, "global_step": 19224, "epoch": 457} {"train_loss": -5.339319229125977, "global_step": 19225, "epoch": 457} {"train_loss": -5.304555416107178, "global_step": 19226, "epoch": 457} {"train_loss": -5.2568464279174805, "global_step": 19227, "epoch": 457} {"train_loss": -5.300072193145752, "global_step": 19228, "epoch": 457} {"train_loss": -5.402951240539551, "global_step": 19229, "epoch": 457} {"train_loss": -5.267306327819824, "global_step": 19230, "epoch": 457} {"train_loss": -5.070509910583496, "global_step": 19231, "epoch": 457} {"train_loss": -5.426107406616211, "global_step": 19232, "epoch": 457} {"train_loss": -5.2664079666137695, "global_step": 19233, "epoch": 457} {"train_loss": -5.207761764526367, "global_step": 19234, "epoch": 457} {"train_loss": -5.27118782770066, "global_step": 19235, "epoch": 457, "val_loss": 69087.4375} {"train_loss": -5.2784037590026855, "global_step": 19236, "epoch": 458} {"train_loss": -5.325621128082275, "global_step": 19237, "epoch": 458} {"train_loss": -5.181537628173828, "global_step": 19238, "epoch": 458} {"train_loss": -5.366535663604736, "global_step": 19239, "epoch": 458} {"train_loss": -5.288200378417969, "global_step": 19240, "epoch": 458} {"train_loss": -5.1869707107543945, "global_step": 19241, "epoch": 458} {"train_loss": -5.428616523742676, "global_step": 19242, "epoch": 458} {"train_loss": -5.392158508300781, "global_step": 19243, "epoch": 458} {"train_loss": -5.266737937927246, "global_step": 19244, "epoch": 458} {"train_loss": -5.181292533874512, "global_step": 19245, "epoch": 458} {"train_loss": -5.266058444976807, "global_step": 19246, "epoch": 458} {"train_loss": -5.111135959625244, "global_step": 19247, "epoch": 458} {"train_loss": -5.358419895172119, "global_step": 19248, "epoch": 458} {"train_loss": -5.375694274902344, "global_step": 19249, "epoch": 458} {"train_loss": -5.326691627502441, "global_step": 19250, "epoch": 458} {"train_loss": -5.214694976806641, "global_step": 19251, "epoch": 458} {"train_loss": -5.223564147949219, "global_step": 19252, "epoch": 458} {"train_loss": -5.249795913696289, "global_step": 19253, "epoch": 458} {"train_loss": -5.35526180267334, "global_step": 19254, "epoch": 458} {"train_loss": -5.332788467407227, "global_step": 19255, "epoch": 458} {"train_loss": -5.229526996612549, "global_step": 19256, "epoch": 458} {"train_loss": -5.368450164794922, "global_step": 19257, "epoch": 458} {"train_loss": -5.2686567306518555, "global_step": 19258, "epoch": 458} {"train_loss": -5.401145935058594, "global_step": 19259, "epoch": 458} {"train_loss": -5.318509101867676, "global_step": 19260, "epoch": 458} {"train_loss": -5.194188117980957, "global_step": 19261, "epoch": 458} {"train_loss": -5.236233711242676, "global_step": 19262, "epoch": 458} {"train_loss": -5.412090301513672, "global_step": 19263, "epoch": 458} {"train_loss": -5.035717010498047, "global_step": 19264, "epoch": 458} {"train_loss": -5.151958465576172, "global_step": 19265, "epoch": 458} {"train_loss": -5.349923610687256, "global_step": 19266, "epoch": 458} {"train_loss": -5.203454971313477, "global_step": 19267, "epoch": 458} {"train_loss": -5.21649169921875, "global_step": 19268, "epoch": 458} {"train_loss": -5.351881980895996, "global_step": 19269, "epoch": 458} {"train_loss": -5.066773414611816, "global_step": 19270, "epoch": 458} {"train_loss": -5.420473098754883, "global_step": 19271, "epoch": 458} {"train_loss": -5.4123382568359375, "global_step": 19272, "epoch": 458} {"train_loss": -5.409151077270508, "global_step": 19273, "epoch": 458} {"train_loss": -5.401555061340332, "global_step": 19274, "epoch": 458} {"train_loss": -5.280320167541504, "global_step": 19275, "epoch": 458} {"train_loss": -5.337850570678711, "global_step": 19276, "epoch": 458} {"train_loss": -5.289470184416998, "global_step": 19277, "epoch": 458, "val_loss": 69492.8671875} {"train_loss": -5.153881072998047, "global_step": 19278, "epoch": 459} {"train_loss": -5.418484210968018, "global_step": 19279, "epoch": 459} {"train_loss": -5.176522731781006, "global_step": 19280, "epoch": 459} {"train_loss": -5.230118751525879, "global_step": 19281, "epoch": 459} {"train_loss": -5.406079292297363, "global_step": 19282, "epoch": 459} {"train_loss": -5.345040321350098, "global_step": 19283, "epoch": 459} {"train_loss": -5.336812496185303, "global_step": 19284, "epoch": 459} {"train_loss": -5.473639488220215, "global_step": 19285, "epoch": 459} {"train_loss": -5.169610023498535, "global_step": 19286, "epoch": 459} {"train_loss": -5.253015518188477, "global_step": 19287, "epoch": 459} {"train_loss": -5.279884338378906, "global_step": 19288, "epoch": 459} {"train_loss": -5.376586437225342, "global_step": 19289, "epoch": 459} {"train_loss": -5.289973258972168, "global_step": 19290, "epoch": 459} {"train_loss": -5.265138626098633, "global_step": 19291, "epoch": 459} {"train_loss": -5.287115097045898, "global_step": 19292, "epoch": 459} {"train_loss": -5.28439998626709, "global_step": 19293, "epoch": 459} {"train_loss": -5.367660999298096, "global_step": 19294, "epoch": 459} {"train_loss": -5.397707939147949, "global_step": 19295, "epoch": 459} {"train_loss": -5.3576765060424805, "global_step": 19296, "epoch": 459} {"train_loss": -5.470180988311768, "global_step": 19297, "epoch": 459} {"train_loss": -5.320204257965088, "global_step": 19298, "epoch": 459} {"train_loss": -5.299488067626953, "global_step": 19299, "epoch": 459} {"train_loss": -5.2694807052612305, "global_step": 19300, "epoch": 459} {"train_loss": -5.347664833068848, "global_step": 19301, "epoch": 459} {"train_loss": -5.329875469207764, "global_step": 19302, "epoch": 459} {"train_loss": -5.309126853942871, "global_step": 19303, "epoch": 459} {"train_loss": -5.402338981628418, "global_step": 19304, "epoch": 459} {"train_loss": -5.32353401184082, "global_step": 19305, "epoch": 459} {"train_loss": -5.233703136444092, "global_step": 19306, "epoch": 459} {"train_loss": -5.24678373336792, "global_step": 19307, "epoch": 459} {"train_loss": -5.338109970092773, "global_step": 19308, "epoch": 459} {"train_loss": -5.215208530426025, "global_step": 19309, "epoch": 459} {"train_loss": -5.269008159637451, "global_step": 19310, "epoch": 459} {"train_loss": -5.171686172485352, "global_step": 19311, "epoch": 459} {"train_loss": -5.2631072998046875, "global_step": 19312, "epoch": 459} {"train_loss": -5.2483601570129395, "global_step": 19313, "epoch": 459} {"train_loss": -5.416738033294678, "global_step": 19314, "epoch": 459} {"train_loss": -5.09969425201416, "global_step": 19315, "epoch": 459} {"train_loss": -5.280973434448242, "global_step": 19316, "epoch": 459} {"train_loss": -5.247294902801514, "global_step": 19317, "epoch": 459} {"train_loss": -5.293063163757324, "global_step": 19318, "epoch": 459} {"train_loss": -5.295997063318889, "global_step": 19319, "epoch": 459, "val_loss": 69537.8046875} {"train_loss": -5.310667037963867, "global_step": 19320, "epoch": 460} {"train_loss": -5.178215026855469, "global_step": 19321, "epoch": 460} {"train_loss": -5.263187885284424, "global_step": 19322, "epoch": 460} {"train_loss": -5.264510154724121, "global_step": 19323, "epoch": 460} {"train_loss": -5.294462203979492, "global_step": 19324, "epoch": 460} {"train_loss": -5.309492111206055, "global_step": 19325, "epoch": 460} {"train_loss": -5.2806572914123535, "global_step": 19326, "epoch": 460} {"train_loss": -5.297606468200684, "global_step": 19327, "epoch": 460} {"train_loss": -5.338108539581299, "global_step": 19328, "epoch": 460} {"train_loss": -5.366959571838379, "global_step": 19329, "epoch": 460} {"train_loss": -5.274674415588379, "global_step": 19330, "epoch": 460} {"train_loss": -5.331804275512695, "global_step": 19331, "epoch": 460} {"train_loss": -5.2670416831970215, "global_step": 19332, "epoch": 460} {"train_loss": -5.299041748046875, "global_step": 19333, "epoch": 460} {"train_loss": -5.30649471282959, "global_step": 19334, "epoch": 460} {"train_loss": -5.335457801818848, "global_step": 19335, "epoch": 460} {"train_loss": -5.342153549194336, "global_step": 19336, "epoch": 460} {"train_loss": -5.228341579437256, "global_step": 19337, "epoch": 460} {"train_loss": -5.404544353485107, "global_step": 19338, "epoch": 460} {"train_loss": -5.425225257873535, "global_step": 19339, "epoch": 460} {"train_loss": -5.32354736328125, "global_step": 19340, "epoch": 460} {"train_loss": -5.402774333953857, "global_step": 19341, "epoch": 460} {"train_loss": -5.3352179527282715, "global_step": 19342, "epoch": 460} {"train_loss": -5.320120334625244, "global_step": 19343, "epoch": 460} {"train_loss": -5.38991117477417, "global_step": 19344, "epoch": 460} {"train_loss": -5.311946392059326, "global_step": 19345, "epoch": 460} {"train_loss": -5.324467658996582, "global_step": 19346, "epoch": 460} {"train_loss": -5.249298095703125, "global_step": 19347, "epoch": 460} {"train_loss": -5.148355007171631, "global_step": 19348, "epoch": 460} {"train_loss": -5.40134334564209, "global_step": 19349, "epoch": 460} {"train_loss": -5.340968132019043, "global_step": 19350, "epoch": 460} {"train_loss": -5.343232154846191, "global_step": 19351, "epoch": 460} {"train_loss": -5.30776309967041, "global_step": 19352, "epoch": 460} {"train_loss": -5.2525787353515625, "global_step": 19353, "epoch": 460} {"train_loss": -5.359780311584473, "global_step": 19354, "epoch": 460} {"train_loss": -5.225319862365723, "global_step": 19355, "epoch": 460} {"train_loss": -5.314675807952881, "global_step": 19356, "epoch": 460} {"train_loss": -5.400676250457764, "global_step": 19357, "epoch": 460} {"train_loss": -5.401096343994141, "global_step": 19358, "epoch": 460} {"train_loss": -5.316279888153076, "global_step": 19359, "epoch": 460} {"train_loss": -5.349583625793457, "global_step": 19360, "epoch": 460} {"train_loss": -5.312666893005371, "global_step": 19361, "epoch": 460, "val_loss": 70352.109375} {"train_loss": -5.28698205947876, "global_step": 19362, "epoch": 461} {"train_loss": -5.310170650482178, "global_step": 19363, "epoch": 461} {"train_loss": -5.181861877441406, "global_step": 19364, "epoch": 461} {"train_loss": -5.225605487823486, "global_step": 19365, "epoch": 461} {"train_loss": -5.257411003112793, "global_step": 19366, "epoch": 461} {"train_loss": -5.125988960266113, "global_step": 19367, "epoch": 461} {"train_loss": -5.245230674743652, "global_step": 19368, "epoch": 461} {"train_loss": -5.274949073791504, "global_step": 19369, "epoch": 461} {"train_loss": -5.3008012771606445, "global_step": 19370, "epoch": 461} {"train_loss": -5.349639892578125, "global_step": 19371, "epoch": 461} {"train_loss": -5.359123706817627, "global_step": 19372, "epoch": 461} {"train_loss": -5.288588523864746, "global_step": 19373, "epoch": 461} {"train_loss": -5.376201152801514, "global_step": 19374, "epoch": 461} {"train_loss": -5.350024223327637, "global_step": 19375, "epoch": 461} {"train_loss": -5.192618370056152, "global_step": 19376, "epoch": 461} {"train_loss": -5.30905818939209, "global_step": 19377, "epoch": 461} {"train_loss": -5.228362083435059, "global_step": 19378, "epoch": 461} {"train_loss": -5.218544006347656, "global_step": 19379, "epoch": 461} {"train_loss": -5.384786128997803, "global_step": 19380, "epoch": 461} {"train_loss": -5.408867835998535, "global_step": 19381, "epoch": 461} {"train_loss": -5.202768325805664, "global_step": 19382, "epoch": 461} {"train_loss": -5.339054107666016, "global_step": 19383, "epoch": 461} {"train_loss": -5.172005653381348, "global_step": 19384, "epoch": 461} {"train_loss": -5.244808197021484, "global_step": 19385, "epoch": 461} {"train_loss": -5.316987991333008, "global_step": 19386, "epoch": 461} {"train_loss": -5.103489398956299, "global_step": 19387, "epoch": 461} {"train_loss": -5.277453422546387, "global_step": 19388, "epoch": 461} {"train_loss": -5.312690258026123, "global_step": 19389, "epoch": 461} {"train_loss": -5.2744975090026855, "global_step": 19390, "epoch": 461} {"train_loss": -5.2126874923706055, "global_step": 19391, "epoch": 461} {"train_loss": -5.165551662445068, "global_step": 19392, "epoch": 461} {"train_loss": -5.229384422302246, "global_step": 19393, "epoch": 461} {"train_loss": -5.26561164855957, "global_step": 19394, "epoch": 461} {"train_loss": -5.253547668457031, "global_step": 19395, "epoch": 461} {"train_loss": -5.250180244445801, "global_step": 19396, "epoch": 461} {"train_loss": -5.241476058959961, "global_step": 19397, "epoch": 461} {"train_loss": -5.454184055328369, "global_step": 19398, "epoch": 461} {"train_loss": -5.277472019195557, "global_step": 19399, "epoch": 461} {"train_loss": -5.216732978820801, "global_step": 19400, "epoch": 461} {"train_loss": -5.358511924743652, "global_step": 19401, "epoch": 461} {"train_loss": -5.219203472137451, "global_step": 19402, "epoch": 461} {"train_loss": -5.267974353971935, "global_step": 19403, "epoch": 461, "val_loss": 69864.3984375} {"train_loss": -5.363374710083008, "global_step": 19404, "epoch": 462} {"train_loss": -5.283327102661133, "global_step": 19405, "epoch": 462} {"train_loss": -5.333311080932617, "global_step": 19406, "epoch": 462} {"train_loss": -5.167491436004639, "global_step": 19407, "epoch": 462} {"train_loss": -5.342041969299316, "global_step": 19408, "epoch": 462} {"train_loss": -5.167489051818848, "global_step": 19409, "epoch": 462} {"train_loss": -5.305467128753662, "global_step": 19410, "epoch": 462} {"train_loss": -5.289423942565918, "global_step": 19411, "epoch": 462} {"train_loss": -5.174586296081543, "global_step": 19412, "epoch": 462} {"train_loss": -5.424181938171387, "global_step": 19413, "epoch": 462} {"train_loss": -5.4035749435424805, "global_step": 19414, "epoch": 462} {"train_loss": -5.239723205566406, "global_step": 19415, "epoch": 462} {"train_loss": -5.34426736831665, "global_step": 19416, "epoch": 462} {"train_loss": -5.260417938232422, "global_step": 19417, "epoch": 462} {"train_loss": -5.134060859680176, "global_step": 19418, "epoch": 462} {"train_loss": -5.372632026672363, "global_step": 19419, "epoch": 462} {"train_loss": -5.078988075256348, "global_step": 19420, "epoch": 462} {"train_loss": -5.250724792480469, "global_step": 19421, "epoch": 462} {"train_loss": -5.2140278816223145, "global_step": 19422, "epoch": 462} {"train_loss": -5.308660507202148, "global_step": 19423, "epoch": 462} {"train_loss": -5.33540678024292, "global_step": 19424, "epoch": 462} {"train_loss": -5.346227169036865, "global_step": 19425, "epoch": 462} {"train_loss": -5.093355655670166, "global_step": 19426, "epoch": 462} {"train_loss": -5.168591499328613, "global_step": 19427, "epoch": 462} {"train_loss": -5.246050834655762, "global_step": 19428, "epoch": 462} {"train_loss": -5.252050399780273, "global_step": 19429, "epoch": 462} {"train_loss": -5.414409637451172, "global_step": 19430, "epoch": 462} {"train_loss": -5.254663467407227, "global_step": 19431, "epoch": 462} {"train_loss": -5.328614234924316, "global_step": 19432, "epoch": 462} {"train_loss": -5.2466535568237305, "global_step": 19433, "epoch": 462} {"train_loss": -5.302262306213379, "global_step": 19434, "epoch": 462} {"train_loss": -5.329049110412598, "global_step": 19435, "epoch": 462} {"train_loss": -5.096647262573242, "global_step": 19436, "epoch": 462} {"train_loss": -5.304290294647217, "global_step": 19437, "epoch": 462} {"train_loss": -5.277297496795654, "global_step": 19438, "epoch": 462} {"train_loss": -5.220620155334473, "global_step": 19439, "epoch": 462} {"train_loss": -5.120424747467041, "global_step": 19440, "epoch": 462} {"train_loss": -5.253332138061523, "global_step": 19441, "epoch": 462} {"train_loss": -5.316046237945557, "global_step": 19442, "epoch": 462} {"train_loss": -5.263920783996582, "global_step": 19443, "epoch": 462} {"train_loss": -5.367290496826172, "global_step": 19444, "epoch": 462} {"train_loss": -5.2672137305850075, "global_step": 19445, "epoch": 462, "val_loss": 69224.3125} {"train_loss": -5.335712432861328, "global_step": 19446, "epoch": 463} {"train_loss": -5.2400007247924805, "global_step": 19447, "epoch": 463} {"train_loss": -5.156471252441406, "global_step": 19448, "epoch": 463} {"train_loss": -5.276406288146973, "global_step": 19449, "epoch": 463} {"train_loss": -5.363400459289551, "global_step": 19450, "epoch": 463} {"train_loss": -5.356686115264893, "global_step": 19451, "epoch": 463} {"train_loss": -5.374795913696289, "global_step": 19452, "epoch": 463} {"train_loss": -5.290738105773926, "global_step": 19453, "epoch": 463} {"train_loss": -5.302345275878906, "global_step": 19454, "epoch": 463} {"train_loss": -5.278260231018066, "global_step": 19455, "epoch": 463} {"train_loss": -5.238354206085205, "global_step": 19456, "epoch": 463} {"train_loss": -5.25734806060791, "global_step": 19457, "epoch": 463} {"train_loss": -5.4180498123168945, "global_step": 19458, "epoch": 463} {"train_loss": -5.357249736785889, "global_step": 19459, "epoch": 463} {"train_loss": -5.275630950927734, "global_step": 19460, "epoch": 463} {"train_loss": -5.389267921447754, "global_step": 19461, "epoch": 463} {"train_loss": -5.313882827758789, "global_step": 19462, "epoch": 463} {"train_loss": -5.256101131439209, "global_step": 19463, "epoch": 463} {"train_loss": -5.452845573425293, "global_step": 19464, "epoch": 463} {"train_loss": -5.306841850280762, "global_step": 19465, "epoch": 463} {"train_loss": -5.359339237213135, "global_step": 19466, "epoch": 463} {"train_loss": -5.3528337478637695, "global_step": 19467, "epoch": 463} {"train_loss": -5.353381633758545, "global_step": 19468, "epoch": 463} {"train_loss": -5.393980979919434, "global_step": 19469, "epoch": 463} {"train_loss": -5.349303245544434, "global_step": 19470, "epoch": 463} {"train_loss": -5.356996536254883, "global_step": 19471, "epoch": 463} {"train_loss": -5.261434555053711, "global_step": 19472, "epoch": 463} {"train_loss": -5.188454627990723, "global_step": 19473, "epoch": 463} {"train_loss": -5.338262557983398, "global_step": 19474, "epoch": 463} {"train_loss": -5.244437217712402, "global_step": 19475, "epoch": 463} {"train_loss": -5.3208394050598145, "global_step": 19476, "epoch": 463} {"train_loss": -5.337159633636475, "global_step": 19477, "epoch": 463} {"train_loss": -5.508447647094727, "global_step": 19478, "epoch": 463} {"train_loss": -5.433165550231934, "global_step": 19479, "epoch": 463} {"train_loss": -5.315252304077148, "global_step": 19480, "epoch": 463} {"train_loss": -5.352764129638672, "global_step": 19481, "epoch": 463} {"train_loss": -5.227574348449707, "global_step": 19482, "epoch": 463} {"train_loss": -5.3053669929504395, "global_step": 19483, "epoch": 463} {"train_loss": -5.311046123504639, "global_step": 19484, "epoch": 463} {"train_loss": -5.320531845092773, "global_step": 19485, "epoch": 463} {"train_loss": -5.158717155456543, "global_step": 19486, "epoch": 463} {"train_loss": -5.314439478374663, "global_step": 19487, "epoch": 463, "val_loss": 69362.3203125} {"train_loss": -5.364694595336914, "global_step": 19488, "epoch": 464} {"train_loss": -5.030490875244141, "global_step": 19489, "epoch": 464} {"train_loss": -5.2747578620910645, "global_step": 19490, "epoch": 464} {"train_loss": -5.094349384307861, "global_step": 19491, "epoch": 464} {"train_loss": -5.200325965881348, "global_step": 19492, "epoch": 464} {"train_loss": -5.28713321685791, "global_step": 19493, "epoch": 464} {"train_loss": -5.2674407958984375, "global_step": 19494, "epoch": 464} {"train_loss": -5.392270088195801, "global_step": 19495, "epoch": 464} {"train_loss": -5.257333755493164, "global_step": 19496, "epoch": 464} {"train_loss": -5.16445255279541, "global_step": 19497, "epoch": 464} {"train_loss": -5.244136810302734, "global_step": 19498, "epoch": 464} {"train_loss": -5.270676136016846, "global_step": 19499, "epoch": 464} {"train_loss": -5.244379997253418, "global_step": 19500, "epoch": 464} {"train_loss": -5.367608070373535, "global_step": 19501, "epoch": 464} {"train_loss": -5.26566743850708, "global_step": 19502, "epoch": 464} {"train_loss": -5.360684394836426, "global_step": 19503, "epoch": 464} {"train_loss": -5.25109338760376, "global_step": 19504, "epoch": 464} {"train_loss": -5.317151069641113, "global_step": 19505, "epoch": 464} {"train_loss": -5.257331848144531, "global_step": 19506, "epoch": 464} {"train_loss": -5.273735046386719, "global_step": 19507, "epoch": 464} {"train_loss": -5.473895072937012, "global_step": 19508, "epoch": 464} {"train_loss": -5.325283050537109, "global_step": 19509, "epoch": 464} {"train_loss": -5.321985244750977, "global_step": 19510, "epoch": 464} {"train_loss": -5.312142372131348, "global_step": 19511, "epoch": 464} {"train_loss": -5.362527370452881, "global_step": 19512, "epoch": 464} {"train_loss": -5.3646931648254395, "global_step": 19513, "epoch": 464} {"train_loss": -5.4408278465271, "global_step": 19514, "epoch": 464} {"train_loss": -5.395821571350098, "global_step": 19515, "epoch": 464} {"train_loss": -5.361790180206299, "global_step": 19516, "epoch": 464} {"train_loss": -5.2482194900512695, "global_step": 19517, "epoch": 464} {"train_loss": -5.353621006011963, "global_step": 19518, "epoch": 464} {"train_loss": -5.230742454528809, "global_step": 19519, "epoch": 464} {"train_loss": -5.277797222137451, "global_step": 19520, "epoch": 464} {"train_loss": -5.078356742858887, "global_step": 19521, "epoch": 464} {"train_loss": -5.195886611938477, "global_step": 19522, "epoch": 464} {"train_loss": -5.222341537475586, "global_step": 19523, "epoch": 464} {"train_loss": -5.296812057495117, "global_step": 19524, "epoch": 464} {"train_loss": -5.246279716491699, "global_step": 19525, "epoch": 464} {"train_loss": -5.36805534362793, "global_step": 19526, "epoch": 464} {"train_loss": -5.067350387573242, "global_step": 19527, "epoch": 464} {"train_loss": -5.061549186706543, "global_step": 19528, "epoch": 464} {"train_loss": -5.272506305149624, "global_step": 19529, "epoch": 464, "val_loss": 69099.390625} {"train_loss": -5.282711029052734, "global_step": 19530, "epoch": 465} {"train_loss": -5.3393659591674805, "global_step": 19531, "epoch": 465} {"train_loss": -5.371837615966797, "global_step": 19532, "epoch": 465} {"train_loss": -5.125263214111328, "global_step": 19533, "epoch": 465} {"train_loss": -5.328197479248047, "global_step": 19534, "epoch": 465} {"train_loss": -5.397223949432373, "global_step": 19535, "epoch": 465} {"train_loss": -5.3703718185424805, "global_step": 19536, "epoch": 465} {"train_loss": -5.208889961242676, "global_step": 19537, "epoch": 465} {"train_loss": -5.148351669311523, "global_step": 19538, "epoch": 465} {"train_loss": -5.369451522827148, "global_step": 19539, "epoch": 465} {"train_loss": -5.32401180267334, "global_step": 19540, "epoch": 465} {"train_loss": -5.191302299499512, "global_step": 19541, "epoch": 465} {"train_loss": -5.317309856414795, "global_step": 19542, "epoch": 465} {"train_loss": -5.221546173095703, "global_step": 19543, "epoch": 465} {"train_loss": -5.465633392333984, "global_step": 19544, "epoch": 465} {"train_loss": -5.298969745635986, "global_step": 19545, "epoch": 465} {"train_loss": -5.3304595947265625, "global_step": 19546, "epoch": 465} {"train_loss": -5.377597808837891, "global_step": 19547, "epoch": 465} {"train_loss": -5.395895004272461, "global_step": 19548, "epoch": 465} {"train_loss": -5.289855003356934, "global_step": 19549, "epoch": 465} {"train_loss": -5.399980545043945, "global_step": 19550, "epoch": 465} {"train_loss": -5.2430739402771, "global_step": 19551, "epoch": 465} {"train_loss": -5.1628804206848145, "global_step": 19552, "epoch": 465} {"train_loss": -5.370438575744629, "global_step": 19553, "epoch": 465} {"train_loss": -5.278871536254883, "global_step": 19554, "epoch": 465} {"train_loss": -5.27304220199585, "global_step": 19555, "epoch": 465} {"train_loss": -5.361736297607422, "global_step": 19556, "epoch": 465} {"train_loss": -5.364317893981934, "global_step": 19557, "epoch": 465} {"train_loss": -5.402057647705078, "global_step": 19558, "epoch": 465} {"train_loss": -5.310357093811035, "global_step": 19559, "epoch": 465} {"train_loss": -5.356412410736084, "global_step": 19560, "epoch": 465} {"train_loss": -5.172001361846924, "global_step": 19561, "epoch": 465} {"train_loss": -5.341221809387207, "global_step": 19562, "epoch": 465} {"train_loss": -5.207077980041504, "global_step": 19563, "epoch": 465} {"train_loss": -5.187247276306152, "global_step": 19564, "epoch": 465} {"train_loss": -5.2417216300964355, "global_step": 19565, "epoch": 465} {"train_loss": -5.2381439208984375, "global_step": 19566, "epoch": 465} {"train_loss": -5.038054466247559, "global_step": 19567, "epoch": 465} {"train_loss": -5.142026901245117, "global_step": 19568, "epoch": 465} {"train_loss": -4.886636257171631, "global_step": 19569, "epoch": 465} {"train_loss": -5.461190223693848, "global_step": 19570, "epoch": 465} {"train_loss": -5.277886946996053, "global_step": 19571, "epoch": 465, "val_loss": 71188.078125} {"train_loss": -5.142210006713867, "global_step": 19572, "epoch": 466} {"train_loss": -5.163556098937988, "global_step": 19573, "epoch": 466} {"train_loss": -5.171032905578613, "global_step": 19574, "epoch": 466} {"train_loss": -5.213986396789551, "global_step": 19575, "epoch": 466} {"train_loss": -5.135143756866455, "global_step": 19576, "epoch": 466} {"train_loss": -5.118185043334961, "global_step": 19577, "epoch": 466} {"train_loss": -5.123523712158203, "global_step": 19578, "epoch": 466} {"train_loss": -5.22396993637085, "global_step": 19579, "epoch": 466} {"train_loss": -5.149119853973389, "global_step": 19580, "epoch": 466} {"train_loss": -5.375581741333008, "global_step": 19581, "epoch": 466} {"train_loss": -5.243740081787109, "global_step": 19582, "epoch": 466} {"train_loss": -5.2383527755737305, "global_step": 19583, "epoch": 466} {"train_loss": -5.208219528198242, "global_step": 19584, "epoch": 466} {"train_loss": -5.152215003967285, "global_step": 19585, "epoch": 466} {"train_loss": -5.162294387817383, "global_step": 19586, "epoch": 466} {"train_loss": -5.187005996704102, "global_step": 19587, "epoch": 466} {"train_loss": -5.097339630126953, "global_step": 19588, "epoch": 466} {"train_loss": -5.200527191162109, "global_step": 19589, "epoch": 466} {"train_loss": -5.319917678833008, "global_step": 19590, "epoch": 466} {"train_loss": -5.309224605560303, "global_step": 19591, "epoch": 466} {"train_loss": -5.238259315490723, "global_step": 19592, "epoch": 466} {"train_loss": -5.20249080657959, "global_step": 19593, "epoch": 466} {"train_loss": -5.228708267211914, "global_step": 19594, "epoch": 466} {"train_loss": -5.346127986907959, "global_step": 19595, "epoch": 466} {"train_loss": -5.310260772705078, "global_step": 19596, "epoch": 466} {"train_loss": -5.1857147216796875, "global_step": 19597, "epoch": 466} {"train_loss": -5.187004566192627, "global_step": 19598, "epoch": 466} {"train_loss": -5.215575218200684, "global_step": 19599, "epoch": 466} {"train_loss": -5.319021224975586, "global_step": 19600, "epoch": 466} {"train_loss": -5.279812335968018, "global_step": 19601, "epoch": 466} {"train_loss": -5.322196960449219, "global_step": 19602, "epoch": 466} {"train_loss": -5.362216949462891, "global_step": 19603, "epoch": 466} {"train_loss": -5.197574615478516, "global_step": 19604, "epoch": 466} {"train_loss": -5.383172988891602, "global_step": 19605, "epoch": 466} {"train_loss": -5.174710273742676, "global_step": 19606, "epoch": 466} {"train_loss": -5.238032817840576, "global_step": 19607, "epoch": 466} {"train_loss": -5.491324424743652, "global_step": 19608, "epoch": 466} {"train_loss": -5.339345455169678, "global_step": 19609, "epoch": 466} {"train_loss": -5.445119857788086, "global_step": 19610, "epoch": 466} {"train_loss": -5.373859882354736, "global_step": 19611, "epoch": 466} {"train_loss": -5.336886405944824, "global_step": 19612, "epoch": 466} {"train_loss": -5.247589406513033, "global_step": 19613, "epoch": 466, "val_loss": 68862.6015625} {"train_loss": -5.2800140380859375, "global_step": 19614, "epoch": 467} {"train_loss": -5.313799858093262, "global_step": 19615, "epoch": 467} {"train_loss": -5.362418174743652, "global_step": 19616, "epoch": 467} {"train_loss": -5.317789554595947, "global_step": 19617, "epoch": 467} {"train_loss": -5.466284275054932, "global_step": 19618, "epoch": 467} {"train_loss": -5.334537029266357, "global_step": 19619, "epoch": 467} {"train_loss": -5.273852348327637, "global_step": 19620, "epoch": 467} {"train_loss": -5.229377746582031, "global_step": 19621, "epoch": 467} {"train_loss": -5.427962779998779, "global_step": 19622, "epoch": 467} {"train_loss": -5.453245162963867, "global_step": 19623, "epoch": 467} {"train_loss": -5.327935218811035, "global_step": 19624, "epoch": 467} {"train_loss": -5.4513654708862305, "global_step": 19625, "epoch": 467} {"train_loss": -5.376574516296387, "global_step": 19626, "epoch": 467} {"train_loss": -5.426855564117432, "global_step": 19627, "epoch": 467} {"train_loss": -5.187891960144043, "global_step": 19628, "epoch": 467} {"train_loss": -5.253624439239502, "global_step": 19629, "epoch": 467} {"train_loss": -5.294437408447266, "global_step": 19630, "epoch": 467} {"train_loss": -5.384369850158691, "global_step": 19631, "epoch": 467} {"train_loss": -5.2238383293151855, "global_step": 19632, "epoch": 467} {"train_loss": -5.270020484924316, "global_step": 19633, "epoch": 467} {"train_loss": -5.175771713256836, "global_step": 19634, "epoch": 467} {"train_loss": -5.403992176055908, "global_step": 19635, "epoch": 467} {"train_loss": -5.33786678314209, "global_step": 19636, "epoch": 467} {"train_loss": -5.287546634674072, "global_step": 19637, "epoch": 467} {"train_loss": -5.293100833892822, "global_step": 19638, "epoch": 467} {"train_loss": -5.2936506271362305, "global_step": 19639, "epoch": 467} {"train_loss": -5.4295783042907715, "global_step": 19640, "epoch": 467} {"train_loss": -5.361823081970215, "global_step": 19641, "epoch": 467} {"train_loss": -5.365011215209961, "global_step": 19642, "epoch": 467} {"train_loss": -5.318954944610596, "global_step": 19643, "epoch": 467} {"train_loss": -5.331689834594727, "global_step": 19644, "epoch": 467} {"train_loss": -5.384363174438477, "global_step": 19645, "epoch": 467} {"train_loss": -5.24987268447876, "global_step": 19646, "epoch": 467} {"train_loss": -5.362981796264648, "global_step": 19647, "epoch": 467} {"train_loss": -5.273414134979248, "global_step": 19648, "epoch": 467} {"train_loss": -5.342696189880371, "global_step": 19649, "epoch": 467} {"train_loss": -5.316793441772461, "global_step": 19650, "epoch": 467} {"train_loss": -5.237540245056152, "global_step": 19651, "epoch": 467} {"train_loss": -5.412014007568359, "global_step": 19652, "epoch": 467} {"train_loss": -5.275657653808594, "global_step": 19653, "epoch": 467} {"train_loss": -5.442836761474609, "global_step": 19654, "epoch": 467} {"train_loss": -5.324531418936593, "global_step": 19655, "epoch": 467, "val_loss": 68923.84375} {"train_loss": -5.403578758239746, "global_step": 19656, "epoch": 468} {"train_loss": -5.32997989654541, "global_step": 19657, "epoch": 468} {"train_loss": -5.257330417633057, "global_step": 19658, "epoch": 468} {"train_loss": -5.2886247634887695, "global_step": 19659, "epoch": 468} {"train_loss": -5.211034774780273, "global_step": 19660, "epoch": 468} {"train_loss": -5.368297100067139, "global_step": 19661, "epoch": 468} {"train_loss": -5.449386119842529, "global_step": 19662, "epoch": 468} {"train_loss": -5.337976932525635, "global_step": 19663, "epoch": 468} {"train_loss": -5.304170608520508, "global_step": 19664, "epoch": 468} {"train_loss": -5.35361385345459, "global_step": 19665, "epoch": 468} {"train_loss": -5.348300933837891, "global_step": 19666, "epoch": 468} {"train_loss": -5.16641902923584, "global_step": 19667, "epoch": 468} {"train_loss": -5.410424709320068, "global_step": 19668, "epoch": 468} {"train_loss": -5.337576389312744, "global_step": 19669, "epoch": 468} {"train_loss": -5.363564968109131, "global_step": 19670, "epoch": 468} {"train_loss": -5.255277156829834, "global_step": 19671, "epoch": 468} {"train_loss": -5.278964996337891, "global_step": 19672, "epoch": 468} {"train_loss": -5.364900588989258, "global_step": 19673, "epoch": 468} {"train_loss": -5.339120864868164, "global_step": 19674, "epoch": 468} {"train_loss": -5.369965553283691, "global_step": 19675, "epoch": 468} {"train_loss": -5.262150764465332, "global_step": 19676, "epoch": 468} {"train_loss": -5.28319787979126, "global_step": 19677, "epoch": 468} {"train_loss": -5.286345481872559, "global_step": 19678, "epoch": 468} {"train_loss": -5.131280422210693, "global_step": 19679, "epoch": 468} {"train_loss": -5.353250026702881, "global_step": 19680, "epoch": 468} {"train_loss": -5.214937210083008, "global_step": 19681, "epoch": 468} {"train_loss": -5.328014373779297, "global_step": 19682, "epoch": 468} {"train_loss": -5.220530986785889, "global_step": 19683, "epoch": 468} {"train_loss": -5.243662357330322, "global_step": 19684, "epoch": 468} {"train_loss": -5.3452911376953125, "global_step": 19685, "epoch": 468} {"train_loss": -5.42259407043457, "global_step": 19686, "epoch": 468} {"train_loss": -5.225219249725342, "global_step": 19687, "epoch": 468} {"train_loss": -5.350949287414551, "global_step": 19688, "epoch": 468} {"train_loss": -5.334478378295898, "global_step": 19689, "epoch": 468} {"train_loss": -5.409372806549072, "global_step": 19690, "epoch": 468} {"train_loss": -5.419038772583008, "global_step": 19691, "epoch": 468} {"train_loss": -5.378733158111572, "global_step": 19692, "epoch": 468} {"train_loss": -5.254438400268555, "global_step": 19693, "epoch": 468} {"train_loss": -5.290079116821289, "global_step": 19694, "epoch": 468} {"train_loss": -5.291847229003906, "global_step": 19695, "epoch": 468} {"train_loss": -5.304522514343262, "global_step": 19696, "epoch": 468} {"train_loss": -5.314159211658296, "global_step": 19697, "epoch": 468, "val_loss": 69671.40625} {"train_loss": -5.252912521362305, "global_step": 19698, "epoch": 469} {"train_loss": -5.266530990600586, "global_step": 19699, "epoch": 469} {"train_loss": -5.22434139251709, "global_step": 19700, "epoch": 469} {"train_loss": -5.209637641906738, "global_step": 19701, "epoch": 469} {"train_loss": -5.2994384765625, "global_step": 19702, "epoch": 469} {"train_loss": -5.276035308837891, "global_step": 19703, "epoch": 469} {"train_loss": -5.33207893371582, "global_step": 19704, "epoch": 469} {"train_loss": -5.393719673156738, "global_step": 19705, "epoch": 469} {"train_loss": -5.385231971740723, "global_step": 19706, "epoch": 469} {"train_loss": -5.326822280883789, "global_step": 19707, "epoch": 469} {"train_loss": -5.195581912994385, "global_step": 19708, "epoch": 469} {"train_loss": -5.33455753326416, "global_step": 19709, "epoch": 469} {"train_loss": -5.303886890411377, "global_step": 19710, "epoch": 469} {"train_loss": -5.303433418273926, "global_step": 19711, "epoch": 469} {"train_loss": -5.191756248474121, "global_step": 19712, "epoch": 469} {"train_loss": -5.429622650146484, "global_step": 19713, "epoch": 469} {"train_loss": -5.125183582305908, "global_step": 19714, "epoch": 469} {"train_loss": -5.249058723449707, "global_step": 19715, "epoch": 469} {"train_loss": -5.237005233764648, "global_step": 19716, "epoch": 469} {"train_loss": -5.3184356689453125, "global_step": 19717, "epoch": 469} {"train_loss": -5.38355827331543, "global_step": 19718, "epoch": 469} {"train_loss": -5.3400092124938965, "global_step": 19719, "epoch": 469} {"train_loss": -5.240403652191162, "global_step": 19720, "epoch": 469} {"train_loss": -5.329831123352051, "global_step": 19721, "epoch": 469} {"train_loss": -5.4186248779296875, "global_step": 19722, "epoch": 469} {"train_loss": -5.292842864990234, "global_step": 19723, "epoch": 469} {"train_loss": -5.302541255950928, "global_step": 19724, "epoch": 469} {"train_loss": -5.356503963470459, "global_step": 19725, "epoch": 469} {"train_loss": -5.295880317687988, "global_step": 19726, "epoch": 469} {"train_loss": -5.305330276489258, "global_step": 19727, "epoch": 469} {"train_loss": -5.360583305358887, "global_step": 19728, "epoch": 469} {"train_loss": -5.304810047149658, "global_step": 19729, "epoch": 469} {"train_loss": -5.390905380249023, "global_step": 19730, "epoch": 469} {"train_loss": -5.286016464233398, "global_step": 19731, "epoch": 469} {"train_loss": -5.358303070068359, "global_step": 19732, "epoch": 469} {"train_loss": -5.4015913009643555, "global_step": 19733, "epoch": 469} {"train_loss": -5.362020969390869, "global_step": 19734, "epoch": 469} {"train_loss": -5.284806251525879, "global_step": 19735, "epoch": 469} {"train_loss": -5.270749092102051, "global_step": 19736, "epoch": 469} {"train_loss": -5.426092624664307, "global_step": 19737, "epoch": 469} {"train_loss": -5.337456703186035, "global_step": 19738, "epoch": 469} {"train_loss": -5.305277143205915, "global_step": 19739, "epoch": 469, "val_loss": 69007.140625} {"train_loss": -5.343380928039551, "global_step": 19740, "epoch": 470} {"train_loss": -5.277356147766113, "global_step": 19741, "epoch": 470} {"train_loss": -5.243420600891113, "global_step": 19742, "epoch": 470} {"train_loss": -5.426263809204102, "global_step": 19743, "epoch": 470} {"train_loss": -5.26046085357666, "global_step": 19744, "epoch": 470} {"train_loss": -5.271191596984863, "global_step": 19745, "epoch": 470} {"train_loss": -5.512202262878418, "global_step": 19746, "epoch": 470} {"train_loss": -5.385210037231445, "global_step": 19747, "epoch": 470} {"train_loss": -5.223519325256348, "global_step": 19748, "epoch": 470} {"train_loss": -5.290409564971924, "global_step": 19749, "epoch": 470} {"train_loss": -5.344202995300293, "global_step": 19750, "epoch": 470} {"train_loss": -5.374485969543457, "global_step": 19751, "epoch": 470} {"train_loss": -5.418540954589844, "global_step": 19752, "epoch": 470} {"train_loss": -5.3173828125, "global_step": 19753, "epoch": 470} {"train_loss": -5.2963361740112305, "global_step": 19754, "epoch": 470} {"train_loss": -5.155605316162109, "global_step": 19755, "epoch": 470} {"train_loss": -5.257431983947754, "global_step": 19756, "epoch": 470} {"train_loss": -5.152458190917969, "global_step": 19757, "epoch": 470} {"train_loss": -5.378420829772949, "global_step": 19758, "epoch": 470} {"train_loss": -5.408123970031738, "global_step": 19759, "epoch": 470} {"train_loss": -5.300200939178467, "global_step": 19760, "epoch": 470} {"train_loss": -5.354213714599609, "global_step": 19761, "epoch": 470} {"train_loss": -5.453285217285156, "global_step": 19762, "epoch": 470} {"train_loss": -5.411921977996826, "global_step": 19763, "epoch": 470} {"train_loss": -5.250358581542969, "global_step": 19764, "epoch": 470} {"train_loss": -5.305635452270508, "global_step": 19765, "epoch": 470} {"train_loss": -5.252780914306641, "global_step": 19766, "epoch": 470} {"train_loss": -5.245292663574219, "global_step": 19767, "epoch": 470} {"train_loss": -5.451586723327637, "global_step": 19768, "epoch": 470} {"train_loss": -5.4562225341796875, "global_step": 19769, "epoch": 470} {"train_loss": -5.424075603485107, "global_step": 19770, "epoch": 470} {"train_loss": -5.251889228820801, "global_step": 19771, "epoch": 470} {"train_loss": -5.403746604919434, "global_step": 19772, "epoch": 470} {"train_loss": -5.294203758239746, "global_step": 19773, "epoch": 470} {"train_loss": -5.247246742248535, "global_step": 19774, "epoch": 470} {"train_loss": -5.251948833465576, "global_step": 19775, "epoch": 470} {"train_loss": -5.2891621589660645, "global_step": 19776, "epoch": 470} {"train_loss": -5.282691955566406, "global_step": 19777, "epoch": 470} {"train_loss": -5.362492084503174, "global_step": 19778, "epoch": 470} {"train_loss": -5.302624225616455, "global_step": 19779, "epoch": 470} {"train_loss": -5.351450443267822, "global_step": 19780, "epoch": 470} {"train_loss": -5.317441179638817, "global_step": 19781, "epoch": 470, "val_loss": 68860.4375} {"train_loss": -5.358570098876953, "global_step": 19782, "epoch": 471} {"train_loss": -5.346378326416016, "global_step": 19783, "epoch": 471} {"train_loss": -5.38724422454834, "global_step": 19784, "epoch": 471} {"train_loss": -5.329773426055908, "global_step": 19785, "epoch": 471} {"train_loss": -5.419458866119385, "global_step": 19786, "epoch": 471} {"train_loss": -5.204317569732666, "global_step": 19787, "epoch": 471} {"train_loss": -5.3517045974731445, "global_step": 19788, "epoch": 471} {"train_loss": -5.30521297454834, "global_step": 19789, "epoch": 471} {"train_loss": -5.372590065002441, "global_step": 19790, "epoch": 471} {"train_loss": -5.286121368408203, "global_step": 19791, "epoch": 471} {"train_loss": -5.385618209838867, "global_step": 19792, "epoch": 471} {"train_loss": -5.471785068511963, "global_step": 19793, "epoch": 471} {"train_loss": -5.2117767333984375, "global_step": 19794, "epoch": 471} {"train_loss": -5.297701835632324, "global_step": 19795, "epoch": 471} {"train_loss": -5.302346229553223, "global_step": 19796, "epoch": 471} {"train_loss": -5.377983570098877, "global_step": 19797, "epoch": 471} {"train_loss": -5.387365341186523, "global_step": 19798, "epoch": 471} {"train_loss": -5.396035671234131, "global_step": 19799, "epoch": 471} {"train_loss": -5.357808589935303, "global_step": 19800, "epoch": 471} {"train_loss": -5.483147621154785, "global_step": 19801, "epoch": 471} {"train_loss": -5.3466997146606445, "global_step": 19802, "epoch": 471} {"train_loss": -5.20442008972168, "global_step": 19803, "epoch": 471} {"train_loss": -5.244912147521973, "global_step": 19804, "epoch": 471} {"train_loss": -5.257540702819824, "global_step": 19805, "epoch": 471} {"train_loss": -5.288823127746582, "global_step": 19806, "epoch": 471} {"train_loss": -5.293737411499023, "global_step": 19807, "epoch": 471} {"train_loss": -5.314919471740723, "global_step": 19808, "epoch": 471} {"train_loss": -5.302907943725586, "global_step": 19809, "epoch": 471} {"train_loss": -5.308773994445801, "global_step": 19810, "epoch": 471} {"train_loss": -5.347886562347412, "global_step": 19811, "epoch": 471} {"train_loss": -5.206938743591309, "global_step": 19812, "epoch": 471} {"train_loss": -5.310778617858887, "global_step": 19813, "epoch": 471} {"train_loss": -5.3590312004089355, "global_step": 19814, "epoch": 471} {"train_loss": -5.286903381347656, "global_step": 19815, "epoch": 471} {"train_loss": -5.163562297821045, "global_step": 19816, "epoch": 471} {"train_loss": -5.295570373535156, "global_step": 19817, "epoch": 471} {"train_loss": -5.32868766784668, "global_step": 19818, "epoch": 471} {"train_loss": -5.313432216644287, "global_step": 19819, "epoch": 471} {"train_loss": -5.222696304321289, "global_step": 19820, "epoch": 471} {"train_loss": -5.286579132080078, "global_step": 19821, "epoch": 471} {"train_loss": -5.180417060852051, "global_step": 19822, "epoch": 471} {"train_loss": -5.313711813517979, "global_step": 19823, "epoch": 471, "val_loss": 69142.03125} {"train_loss": -5.275873184204102, "global_step": 19824, "epoch": 472} {"train_loss": -5.076509475708008, "global_step": 19825, "epoch": 472} {"train_loss": -5.1331329345703125, "global_step": 19826, "epoch": 472} {"train_loss": -5.093231678009033, "global_step": 19827, "epoch": 472} {"train_loss": -5.266384124755859, "global_step": 19828, "epoch": 472} {"train_loss": -5.218017101287842, "global_step": 19829, "epoch": 472} {"train_loss": -5.340460300445557, "global_step": 19830, "epoch": 472} {"train_loss": -5.284707069396973, "global_step": 19831, "epoch": 472} {"train_loss": -5.210577011108398, "global_step": 19832, "epoch": 472} {"train_loss": -5.301156997680664, "global_step": 19833, "epoch": 472} {"train_loss": -5.29695463180542, "global_step": 19834, "epoch": 472} {"train_loss": -5.317310333251953, "global_step": 19835, "epoch": 472} {"train_loss": -5.434776782989502, "global_step": 19836, "epoch": 472} {"train_loss": -5.435763359069824, "global_step": 19837, "epoch": 472} {"train_loss": -5.269966125488281, "global_step": 19838, "epoch": 472} {"train_loss": -5.357815742492676, "global_step": 19839, "epoch": 472} {"train_loss": -5.217531204223633, "global_step": 19840, "epoch": 472} {"train_loss": -5.242916107177734, "global_step": 19841, "epoch": 472} {"train_loss": -5.365470886230469, "global_step": 19842, "epoch": 472} {"train_loss": -5.173893928527832, "global_step": 19843, "epoch": 472} {"train_loss": -5.147568702697754, "global_step": 19844, "epoch": 472} {"train_loss": -5.3457746505737305, "global_step": 19845, "epoch": 472} {"train_loss": -5.248652935028076, "global_step": 19846, "epoch": 472} {"train_loss": -5.209425926208496, "global_step": 19847, "epoch": 472} {"train_loss": -5.279468536376953, "global_step": 19848, "epoch": 472} {"train_loss": -5.309170722961426, "global_step": 19849, "epoch": 472} {"train_loss": -5.203308582305908, "global_step": 19850, "epoch": 472} {"train_loss": -5.417023658752441, "global_step": 19851, "epoch": 472} {"train_loss": -5.348385334014893, "global_step": 19852, "epoch": 472} {"train_loss": -5.235640048980713, "global_step": 19853, "epoch": 472} {"train_loss": -5.348838806152344, "global_step": 19854, "epoch": 472} {"train_loss": -5.218298435211182, "global_step": 19855, "epoch": 472} {"train_loss": -5.352179527282715, "global_step": 19856, "epoch": 472} {"train_loss": -5.135497093200684, "global_step": 19857, "epoch": 472} {"train_loss": -5.348914623260498, "global_step": 19858, "epoch": 472} {"train_loss": -5.222354888916016, "global_step": 19859, "epoch": 472} {"train_loss": -5.4348859786987305, "global_step": 19860, "epoch": 472} {"train_loss": -5.266482830047607, "global_step": 19861, "epoch": 472} {"train_loss": -5.306214332580566, "global_step": 19862, "epoch": 472} {"train_loss": -5.25386905670166, "global_step": 19863, "epoch": 472} {"train_loss": -5.275076866149902, "global_step": 19864, "epoch": 472} {"train_loss": -5.2777219499860495, "global_step": 19865, "epoch": 472, "val_loss": 69537.9375} {"train_loss": -5.173566818237305, "global_step": 19866, "epoch": 473} {"train_loss": -5.2620320320129395, "global_step": 19867, "epoch": 473} {"train_loss": -5.364181995391846, "global_step": 19868, "epoch": 473} {"train_loss": -5.217435359954834, "global_step": 19869, "epoch": 473} {"train_loss": -5.309103965759277, "global_step": 19870, "epoch": 473} {"train_loss": -5.406491756439209, "global_step": 19871, "epoch": 473} {"train_loss": -5.273282051086426, "global_step": 19872, "epoch": 473} {"train_loss": -5.381061553955078, "global_step": 19873, "epoch": 473} {"train_loss": -5.266706943511963, "global_step": 19874, "epoch": 473} {"train_loss": -5.237148284912109, "global_step": 19875, "epoch": 473} {"train_loss": -5.364785194396973, "global_step": 19876, "epoch": 473} {"train_loss": -5.371700763702393, "global_step": 19877, "epoch": 473} {"train_loss": -5.345178604125977, "global_step": 19878, "epoch": 473} {"train_loss": -5.383225440979004, "global_step": 19879, "epoch": 473} {"train_loss": -5.229981899261475, "global_step": 19880, "epoch": 473} {"train_loss": -5.321257591247559, "global_step": 19881, "epoch": 473} {"train_loss": -5.337100982666016, "global_step": 19882, "epoch": 473} {"train_loss": -5.201091289520264, "global_step": 19883, "epoch": 473} {"train_loss": -5.334115028381348, "global_step": 19884, "epoch": 473} {"train_loss": -5.310403823852539, "global_step": 19885, "epoch": 473} {"train_loss": -5.264410018920898, "global_step": 19886, "epoch": 473} {"train_loss": -5.2274932861328125, "global_step": 19887, "epoch": 473} {"train_loss": -5.449519634246826, "global_step": 19888, "epoch": 473} {"train_loss": -5.33088493347168, "global_step": 19889, "epoch": 473} {"train_loss": -5.342165946960449, "global_step": 19890, "epoch": 473} {"train_loss": -5.230924606323242, "global_step": 19891, "epoch": 473} {"train_loss": -5.2541279792785645, "global_step": 19892, "epoch": 473} {"train_loss": -5.2221293449401855, "global_step": 19893, "epoch": 473} {"train_loss": -5.306172847747803, "global_step": 19894, "epoch": 473} {"train_loss": -5.3721923828125, "global_step": 19895, "epoch": 473} {"train_loss": -5.250833511352539, "global_step": 19896, "epoch": 473} {"train_loss": -5.349541664123535, "global_step": 19897, "epoch": 473} {"train_loss": -5.378602027893066, "global_step": 19898, "epoch": 473} {"train_loss": -5.311832427978516, "global_step": 19899, "epoch": 473} {"train_loss": -5.325738430023193, "global_step": 19900, "epoch": 473} {"train_loss": -5.445370674133301, "global_step": 19901, "epoch": 473} {"train_loss": -5.308483123779297, "global_step": 19902, "epoch": 473} {"train_loss": -5.324678421020508, "global_step": 19903, "epoch": 473} {"train_loss": -5.3003315925598145, "global_step": 19904, "epoch": 473} {"train_loss": -5.273072242736816, "global_step": 19905, "epoch": 473} {"train_loss": -5.350472450256348, "global_step": 19906, "epoch": 473} {"train_loss": -5.3111851669493175, "global_step": 19907, "epoch": 473, "val_loss": 69206.7890625} {"train_loss": -5.307229995727539, "global_step": 19908, "epoch": 474} {"train_loss": -5.341284275054932, "global_step": 19909, "epoch": 474} {"train_loss": -5.265641689300537, "global_step": 19910, "epoch": 474} {"train_loss": -5.225828647613525, "global_step": 19911, "epoch": 474} {"train_loss": -5.2415056228637695, "global_step": 19912, "epoch": 474} {"train_loss": -5.173760890960693, "global_step": 19913, "epoch": 474} {"train_loss": -5.221725940704346, "global_step": 19914, "epoch": 474} {"train_loss": -5.10784912109375, "global_step": 19915, "epoch": 474} {"train_loss": -5.19632625579834, "global_step": 19916, "epoch": 474} {"train_loss": -5.21943998336792, "global_step": 19917, "epoch": 474} {"train_loss": -5.177530288696289, "global_step": 19918, "epoch": 474} {"train_loss": -5.387933254241943, "global_step": 19919, "epoch": 474} {"train_loss": -5.275399684906006, "global_step": 19920, "epoch": 474} {"train_loss": -5.2779388427734375, "global_step": 19921, "epoch": 474} {"train_loss": -5.3681464195251465, "global_step": 19922, "epoch": 474} {"train_loss": -5.306122779846191, "global_step": 19923, "epoch": 474} {"train_loss": -5.258993148803711, "global_step": 19924, "epoch": 474} {"train_loss": -5.33657169342041, "global_step": 19925, "epoch": 474} {"train_loss": -5.3488006591796875, "global_step": 19926, "epoch": 474} {"train_loss": -5.352646827697754, "global_step": 19927, "epoch": 474} {"train_loss": -5.292325496673584, "global_step": 19928, "epoch": 474} {"train_loss": -5.296456813812256, "global_step": 19929, "epoch": 474} {"train_loss": -5.552460193634033, "global_step": 19930, "epoch": 474} {"train_loss": -5.2736053466796875, "global_step": 19931, "epoch": 474} {"train_loss": -5.408997535705566, "global_step": 19932, "epoch": 474} {"train_loss": -5.204451084136963, "global_step": 19933, "epoch": 474} {"train_loss": -5.417034149169922, "global_step": 19934, "epoch": 474} {"train_loss": -5.305207252502441, "global_step": 19935, "epoch": 474} {"train_loss": -5.396553039550781, "global_step": 19936, "epoch": 474} {"train_loss": -5.291189193725586, "global_step": 19937, "epoch": 474} {"train_loss": -5.329634666442871, "global_step": 19938, "epoch": 474} {"train_loss": -5.446857452392578, "global_step": 19939, "epoch": 474} {"train_loss": -5.139720916748047, "global_step": 19940, "epoch": 474} {"train_loss": -5.397744178771973, "global_step": 19941, "epoch": 474} {"train_loss": -5.377649784088135, "global_step": 19942, "epoch": 474} {"train_loss": -5.252687454223633, "global_step": 19943, "epoch": 474} {"train_loss": -5.272853851318359, "global_step": 19944, "epoch": 474} {"train_loss": -5.4007110595703125, "global_step": 19945, "epoch": 474} {"train_loss": -5.378718376159668, "global_step": 19946, "epoch": 474} {"train_loss": -5.2205939292907715, "global_step": 19947, "epoch": 474} {"train_loss": -5.393781661987305, "global_step": 19948, "epoch": 474} {"train_loss": -5.303612618219285, "global_step": 19949, "epoch": 474, "val_loss": 69122.90625} {"train_loss": -5.27254581451416, "global_step": 19950, "epoch": 475} {"train_loss": -5.305058479309082, "global_step": 19951, "epoch": 475} {"train_loss": -5.254183769226074, "global_step": 19952, "epoch": 475} {"train_loss": -5.372437477111816, "global_step": 19953, "epoch": 475} {"train_loss": -5.288407325744629, "global_step": 19954, "epoch": 475} {"train_loss": -5.266470432281494, "global_step": 19955, "epoch": 475} {"train_loss": -5.190973281860352, "global_step": 19956, "epoch": 475} {"train_loss": -5.4108805656433105, "global_step": 19957, "epoch": 475} {"train_loss": -5.222496032714844, "global_step": 19958, "epoch": 475} {"train_loss": -5.459036350250244, "global_step": 19959, "epoch": 475} {"train_loss": -5.409462928771973, "global_step": 19960, "epoch": 475} {"train_loss": -5.1687164306640625, "global_step": 19961, "epoch": 475} {"train_loss": -5.1557769775390625, "global_step": 19962, "epoch": 475} {"train_loss": -5.325118541717529, "global_step": 19963, "epoch": 475} {"train_loss": -5.310487747192383, "global_step": 19964, "epoch": 475} {"train_loss": -5.463265895843506, "global_step": 19965, "epoch": 475} {"train_loss": -5.127688407897949, "global_step": 19966, "epoch": 475} {"train_loss": -5.397989749908447, "global_step": 19967, "epoch": 475} {"train_loss": -5.362079620361328, "global_step": 19968, "epoch": 475} {"train_loss": -5.182643413543701, "global_step": 19969, "epoch": 475} {"train_loss": -5.3393402099609375, "global_step": 19970, "epoch": 475} {"train_loss": -5.19708251953125, "global_step": 19971, "epoch": 475} {"train_loss": -5.387351036071777, "global_step": 19972, "epoch": 475} {"train_loss": -5.377327919006348, "global_step": 19973, "epoch": 475} {"train_loss": -5.3378448486328125, "global_step": 19974, "epoch": 475} {"train_loss": -5.420149803161621, "global_step": 19975, "epoch": 475} {"train_loss": -5.332342624664307, "global_step": 19976, "epoch": 475} {"train_loss": -5.433310508728027, "global_step": 19977, "epoch": 475} {"train_loss": -5.319158554077148, "global_step": 19978, "epoch": 475} {"train_loss": -5.367769718170166, "global_step": 19979, "epoch": 475} {"train_loss": -5.1988325119018555, "global_step": 19980, "epoch": 475} {"train_loss": -5.33377742767334, "global_step": 19981, "epoch": 475} {"train_loss": -5.4060821533203125, "global_step": 19982, "epoch": 475} {"train_loss": -5.292902946472168, "global_step": 19983, "epoch": 475} {"train_loss": -5.430250644683838, "global_step": 19984, "epoch": 475} {"train_loss": -5.34722900390625, "global_step": 19985, "epoch": 475} {"train_loss": -5.381608009338379, "global_step": 19986, "epoch": 475} {"train_loss": -5.3336920738220215, "global_step": 19987, "epoch": 475} {"train_loss": -5.054625511169434, "global_step": 19988, "epoch": 475} {"train_loss": -5.136419296264648, "global_step": 19989, "epoch": 475} {"train_loss": -5.123790264129639, "global_step": 19990, "epoch": 475} {"train_loss": -5.2993291446140836, "global_step": 19991, "epoch": 475, "val_loss": 69909.4921875} {"train_loss": -5.138803482055664, "global_step": 19992, "epoch": 476} {"train_loss": -5.1033453941345215, "global_step": 19993, "epoch": 476} {"train_loss": -5.110757827758789, "global_step": 19994, "epoch": 476} {"train_loss": -5.259111404418945, "global_step": 19995, "epoch": 476} {"train_loss": -5.178740501403809, "global_step": 19996, "epoch": 476} {"train_loss": -5.219543933868408, "global_step": 19997, "epoch": 476} {"train_loss": -5.257729530334473, "global_step": 19998, "epoch": 476} {"train_loss": -5.285134792327881, "global_step": 19999, "epoch": 476} {"train_loss": -5.228973388671875, "global_step": 20000, "epoch": 476} {"train_loss": -5.2154717445373535, "global_step": 20001, "epoch": 476} {"train_loss": -5.208350658416748, "global_step": 20002, "epoch": 476} {"train_loss": -5.305577278137207, "global_step": 20003, "epoch": 476} {"train_loss": -5.28648042678833, "global_step": 20004, "epoch": 476} {"train_loss": -5.029323101043701, "global_step": 20005, "epoch": 476} {"train_loss": -5.315727233886719, "global_step": 20006, "epoch": 476} {"train_loss": -5.01781702041626, "global_step": 20007, "epoch": 476} {"train_loss": -5.363956451416016, "global_step": 20008, "epoch": 476} {"train_loss": -5.087282180786133, "global_step": 20009, "epoch": 476} {"train_loss": -5.247286796569824, "global_step": 20010, "epoch": 476} {"train_loss": -5.319137096405029, "global_step": 20011, "epoch": 476} {"train_loss": -5.294587135314941, "global_step": 20012, "epoch": 476} {"train_loss": -5.2643914222717285, "global_step": 20013, "epoch": 476} {"train_loss": -5.179876804351807, "global_step": 20014, "epoch": 476} {"train_loss": -5.36680793762207, "global_step": 20015, "epoch": 476} {"train_loss": -5.372104644775391, "global_step": 20016, "epoch": 476} {"train_loss": -5.3379621505737305, "global_step": 20017, "epoch": 476} {"train_loss": -5.307924270629883, "global_step": 20018, "epoch": 476} {"train_loss": -5.186196327209473, "global_step": 20019, "epoch": 476} {"train_loss": -5.334624290466309, "global_step": 20020, "epoch": 476} {"train_loss": -5.318235397338867, "global_step": 20021, "epoch": 476} {"train_loss": -5.13818359375, "global_step": 20022, "epoch": 476} {"train_loss": -5.252882480621338, "global_step": 20023, "epoch": 476} {"train_loss": -5.467440605163574, "global_step": 20024, "epoch": 476} {"train_loss": -5.306802749633789, "global_step": 20025, "epoch": 476} {"train_loss": -5.373017311096191, "global_step": 20026, "epoch": 476} {"train_loss": -5.3429107666015625, "global_step": 20027, "epoch": 476} {"train_loss": -5.419322967529297, "global_step": 20028, "epoch": 476} {"train_loss": -5.325436592102051, "global_step": 20029, "epoch": 476} {"train_loss": -5.275213241577148, "global_step": 20030, "epoch": 476} {"train_loss": -5.270097732543945, "global_step": 20031, "epoch": 476} {"train_loss": -5.216121673583984, "global_step": 20032, "epoch": 476} {"train_loss": -5.260286887486775, "global_step": 20033, "epoch": 476, "val_loss": 69146.5078125} {"train_loss": -5.244264602661133, "global_step": 20034, "epoch": 477} {"train_loss": -5.304135322570801, "global_step": 20035, "epoch": 477} {"train_loss": -5.309597969055176, "global_step": 20036, "epoch": 477} {"train_loss": -5.407418251037598, "global_step": 20037, "epoch": 477} {"train_loss": -5.350247383117676, "global_step": 20038, "epoch": 477} {"train_loss": -5.47883415222168, "global_step": 20039, "epoch": 477} {"train_loss": -5.3811492919921875, "global_step": 20040, "epoch": 477} {"train_loss": -5.2388105392456055, "global_step": 20041, "epoch": 477} {"train_loss": -5.311223030090332, "global_step": 20042, "epoch": 477} {"train_loss": -5.401374816894531, "global_step": 20043, "epoch": 477} {"train_loss": -5.305215835571289, "global_step": 20044, "epoch": 477} {"train_loss": -5.288213729858398, "global_step": 20045, "epoch": 477} {"train_loss": -5.41123628616333, "global_step": 20046, "epoch": 477} {"train_loss": -5.47844123840332, "global_step": 20047, "epoch": 477} {"train_loss": -5.166833400726318, "global_step": 20048, "epoch": 477} {"train_loss": -5.302670478820801, "global_step": 20049, "epoch": 477} {"train_loss": -5.184972763061523, "global_step": 20050, "epoch": 477} {"train_loss": -5.2863969802856445, "global_step": 20051, "epoch": 477} {"train_loss": -5.194984436035156, "global_step": 20052, "epoch": 477} {"train_loss": -5.447691440582275, "global_step": 20053, "epoch": 477} {"train_loss": -5.3105950355529785, "global_step": 20054, "epoch": 477} {"train_loss": -5.219276428222656, "global_step": 20055, "epoch": 477} {"train_loss": -5.252437591552734, "global_step": 20056, "epoch": 477} {"train_loss": -5.408472061157227, "global_step": 20057, "epoch": 477} {"train_loss": -5.111081123352051, "global_step": 20058, "epoch": 477} {"train_loss": -5.192258358001709, "global_step": 20059, "epoch": 477} {"train_loss": -5.3126912117004395, "global_step": 20060, "epoch": 477} {"train_loss": -5.321667671203613, "global_step": 20061, "epoch": 477} {"train_loss": -5.123552322387695, "global_step": 20062, "epoch": 477} {"train_loss": -5.118271827697754, "global_step": 20063, "epoch": 477} {"train_loss": -5.269227027893066, "global_step": 20064, "epoch": 477} {"train_loss": -5.211525917053223, "global_step": 20065, "epoch": 477} {"train_loss": -5.197360515594482, "global_step": 20066, "epoch": 477} {"train_loss": -5.051441669464111, "global_step": 20067, "epoch": 477} {"train_loss": -5.292522430419922, "global_step": 20068, "epoch": 477} {"train_loss": -5.2780256271362305, "global_step": 20069, "epoch": 477} {"train_loss": -5.303937911987305, "global_step": 20070, "epoch": 477} {"train_loss": -5.259999752044678, "global_step": 20071, "epoch": 477} {"train_loss": -5.3913774490356445, "global_step": 20072, "epoch": 477} {"train_loss": -5.336675643920898, "global_step": 20073, "epoch": 477} {"train_loss": -5.135169982910156, "global_step": 20074, "epoch": 477} {"train_loss": -5.28330093338376, "global_step": 20075, "epoch": 477, "val_loss": 69340.9609375} {"train_loss": -5.311003684997559, "global_step": 20076, "epoch": 478} {"train_loss": -5.3213582038879395, "global_step": 20077, "epoch": 478} {"train_loss": -5.328460693359375, "global_step": 20078, "epoch": 478} {"train_loss": -5.303638458251953, "global_step": 20079, "epoch": 478} {"train_loss": -5.384626388549805, "global_step": 20080, "epoch": 478} {"train_loss": -5.311979293823242, "global_step": 20081, "epoch": 478} {"train_loss": -5.330574989318848, "global_step": 20082, "epoch": 478} {"train_loss": -5.377823829650879, "global_step": 20083, "epoch": 478} {"train_loss": -5.301581382751465, "global_step": 20084, "epoch": 478} {"train_loss": -5.263330459594727, "global_step": 20085, "epoch": 478} {"train_loss": -5.35474967956543, "global_step": 20086, "epoch": 478} {"train_loss": -5.097158432006836, "global_step": 20087, "epoch": 478} {"train_loss": -5.150469779968262, "global_step": 20088, "epoch": 478} {"train_loss": -5.300125598907471, "global_step": 20089, "epoch": 478} {"train_loss": -5.2667412757873535, "global_step": 20090, "epoch": 478} {"train_loss": -5.371973991394043, "global_step": 20091, "epoch": 478} {"train_loss": -5.35100793838501, "global_step": 20092, "epoch": 478} {"train_loss": -5.174816131591797, "global_step": 20093, "epoch": 478} {"train_loss": -5.185352325439453, "global_step": 20094, "epoch": 478} {"train_loss": -5.27504825592041, "global_step": 20095, "epoch": 478} {"train_loss": -5.12586784362793, "global_step": 20096, "epoch": 478} {"train_loss": -5.24666690826416, "global_step": 20097, "epoch": 478} {"train_loss": -5.091784954071045, "global_step": 20098, "epoch": 478} {"train_loss": -5.278942108154297, "global_step": 20099, "epoch": 478} {"train_loss": -5.299215793609619, "global_step": 20100, "epoch": 478} {"train_loss": -5.1554460525512695, "global_step": 20101, "epoch": 478} {"train_loss": -5.378023624420166, "global_step": 20102, "epoch": 478} {"train_loss": -5.08555269241333, "global_step": 20103, "epoch": 478} {"train_loss": -5.440207481384277, "global_step": 20104, "epoch": 478} {"train_loss": -5.185673713684082, "global_step": 20105, "epoch": 478} {"train_loss": -5.2888994216918945, "global_step": 20106, "epoch": 478} {"train_loss": -5.250621795654297, "global_step": 20107, "epoch": 478} {"train_loss": -5.2862772941589355, "global_step": 20108, "epoch": 478} {"train_loss": -5.161199569702148, "global_step": 20109, "epoch": 478} {"train_loss": -5.323640823364258, "global_step": 20110, "epoch": 478} {"train_loss": -5.247143268585205, "global_step": 20111, "epoch": 478} {"train_loss": -5.376491546630859, "global_step": 20112, "epoch": 478} {"train_loss": -5.45283317565918, "global_step": 20113, "epoch": 478} {"train_loss": -5.277119159698486, "global_step": 20114, "epoch": 478} {"train_loss": -5.322780609130859, "global_step": 20115, "epoch": 478} {"train_loss": -5.226943016052246, "global_step": 20116, "epoch": 478} {"train_loss": -5.274071602594285, "global_step": 20117, "epoch": 478, "val_loss": 68653.7578125} {"train_loss": -5.244682312011719, "global_step": 20118, "epoch": 479} {"train_loss": -5.230112075805664, "global_step": 20119, "epoch": 479} {"train_loss": -5.319762229919434, "global_step": 20120, "epoch": 479} {"train_loss": -5.29752254486084, "global_step": 20121, "epoch": 479} {"train_loss": -5.250887870788574, "global_step": 20122, "epoch": 479} {"train_loss": -5.356198310852051, "global_step": 20123, "epoch": 479} {"train_loss": -5.074537754058838, "global_step": 20124, "epoch": 479} {"train_loss": -5.4246368408203125, "global_step": 20125, "epoch": 479} {"train_loss": -5.293705940246582, "global_step": 20126, "epoch": 479} {"train_loss": -5.134702205657959, "global_step": 20127, "epoch": 479} {"train_loss": -5.1970295906066895, "global_step": 20128, "epoch": 479} {"train_loss": -5.159307956695557, "global_step": 20129, "epoch": 479} {"train_loss": -5.323482990264893, "global_step": 20130, "epoch": 479} {"train_loss": -5.2715044021606445, "global_step": 20131, "epoch": 479} {"train_loss": -5.269410133361816, "global_step": 20132, "epoch": 479} {"train_loss": -5.234938621520996, "global_step": 20133, "epoch": 479} {"train_loss": -5.155970573425293, "global_step": 20134, "epoch": 479} {"train_loss": -5.350289344787598, "global_step": 20135, "epoch": 479} {"train_loss": -5.195932388305664, "global_step": 20136, "epoch": 479} {"train_loss": -5.2609477043151855, "global_step": 20137, "epoch": 479} {"train_loss": -5.332530975341797, "global_step": 20138, "epoch": 479} {"train_loss": -5.3933820724487305, "global_step": 20139, "epoch": 479} {"train_loss": -5.331247329711914, "global_step": 20140, "epoch": 479} {"train_loss": -5.281578540802002, "global_step": 20141, "epoch": 479} {"train_loss": -5.315159797668457, "global_step": 20142, "epoch": 479} {"train_loss": -5.332322597503662, "global_step": 20143, "epoch": 479} {"train_loss": -5.4174604415893555, "global_step": 20144, "epoch": 479} {"train_loss": -5.244826316833496, "global_step": 20145, "epoch": 479} {"train_loss": -5.325272083282471, "global_step": 20146, "epoch": 479} {"train_loss": -5.27678108215332, "global_step": 20147, "epoch": 479} {"train_loss": -5.3701629638671875, "global_step": 20148, "epoch": 479} {"train_loss": -5.2443413734436035, "global_step": 20149, "epoch": 479} {"train_loss": -5.239621162414551, "global_step": 20150, "epoch": 479} {"train_loss": -5.305310249328613, "global_step": 20151, "epoch": 479} {"train_loss": -5.374940872192383, "global_step": 20152, "epoch": 479} {"train_loss": -5.17188835144043, "global_step": 20153, "epoch": 479} {"train_loss": -5.3265862464904785, "global_step": 20154, "epoch": 479} {"train_loss": -5.2902631759643555, "global_step": 20155, "epoch": 479} {"train_loss": -5.439510345458984, "global_step": 20156, "epoch": 479} {"train_loss": -5.206387519836426, "global_step": 20157, "epoch": 479} {"train_loss": -5.354622840881348, "global_step": 20158, "epoch": 479} {"train_loss": -5.28373570669265, "global_step": 20159, "epoch": 479, "val_loss": 69519.4609375} {"train_loss": -5.314775466918945, "global_step": 20160, "epoch": 480} {"train_loss": -5.289496898651123, "global_step": 20161, "epoch": 480} {"train_loss": -5.296127796173096, "global_step": 20162, "epoch": 480} {"train_loss": -5.378070831298828, "global_step": 20163, "epoch": 480} {"train_loss": -5.396348476409912, "global_step": 20164, "epoch": 480} {"train_loss": -5.338052272796631, "global_step": 20165, "epoch": 480} {"train_loss": -5.334671497344971, "global_step": 20166, "epoch": 480} {"train_loss": -5.326412200927734, "global_step": 20167, "epoch": 480} {"train_loss": -5.278358459472656, "global_step": 20168, "epoch": 480} {"train_loss": -5.354619979858398, "global_step": 20169, "epoch": 480} {"train_loss": -5.446048736572266, "global_step": 20170, "epoch": 480} {"train_loss": -5.407295227050781, "global_step": 20171, "epoch": 480} {"train_loss": -5.338779449462891, "global_step": 20172, "epoch": 480} {"train_loss": -5.278219223022461, "global_step": 20173, "epoch": 480} {"train_loss": -5.320308685302734, "global_step": 20174, "epoch": 480} {"train_loss": -5.393123626708984, "global_step": 20175, "epoch": 480} {"train_loss": -5.377171516418457, "global_step": 20176, "epoch": 480} {"train_loss": -5.303625583648682, "global_step": 20177, "epoch": 480} {"train_loss": -5.309607028961182, "global_step": 20178, "epoch": 480} {"train_loss": -5.354770660400391, "global_step": 20179, "epoch": 480} {"train_loss": -5.341802597045898, "global_step": 20180, "epoch": 480} {"train_loss": -5.374338150024414, "global_step": 20181, "epoch": 480} {"train_loss": -5.27561092376709, "global_step": 20182, "epoch": 480} {"train_loss": -5.388186931610107, "global_step": 20183, "epoch": 480} {"train_loss": -5.282017707824707, "global_step": 20184, "epoch": 480} {"train_loss": -5.243707656860352, "global_step": 20185, "epoch": 480} {"train_loss": -5.30793571472168, "global_step": 20186, "epoch": 480} {"train_loss": -5.24265193939209, "global_step": 20187, "epoch": 480} {"train_loss": -5.232489585876465, "global_step": 20188, "epoch": 480} {"train_loss": -5.337474822998047, "global_step": 20189, "epoch": 480} {"train_loss": -5.312247276306152, "global_step": 20190, "epoch": 480} {"train_loss": -5.2353620529174805, "global_step": 20191, "epoch": 480} {"train_loss": -5.355587959289551, "global_step": 20192, "epoch": 480} {"train_loss": -5.282924652099609, "global_step": 20193, "epoch": 480} {"train_loss": -5.416319847106934, "global_step": 20194, "epoch": 480} {"train_loss": -5.2838544845581055, "global_step": 20195, "epoch": 480} {"train_loss": -5.219612121582031, "global_step": 20196, "epoch": 480} {"train_loss": -5.242997169494629, "global_step": 20197, "epoch": 480} {"train_loss": -5.2964911460876465, "global_step": 20198, "epoch": 480} {"train_loss": -5.2644147872924805, "global_step": 20199, "epoch": 480} {"train_loss": -5.206433296203613, "global_step": 20200, "epoch": 480} {"train_loss": -5.317668574196952, "global_step": 20201, "epoch": 480, "val_loss": 69038.6640625} {"train_loss": -5.351016998291016, "global_step": 20202, "epoch": 481} {"train_loss": -5.358095169067383, "global_step": 20203, "epoch": 481} {"train_loss": -5.365142345428467, "global_step": 20204, "epoch": 481} {"train_loss": -5.2698073387146, "global_step": 20205, "epoch": 481} {"train_loss": -5.349336624145508, "global_step": 20206, "epoch": 481} {"train_loss": -5.307285785675049, "global_step": 20207, "epoch": 481} {"train_loss": -5.323054313659668, "global_step": 20208, "epoch": 481} {"train_loss": -5.249469757080078, "global_step": 20209, "epoch": 481} {"train_loss": -5.3692731857299805, "global_step": 20210, "epoch": 481} {"train_loss": -5.455503463745117, "global_step": 20211, "epoch": 481} {"train_loss": -5.341352462768555, "global_step": 20212, "epoch": 481} {"train_loss": -5.362878799438477, "global_step": 20213, "epoch": 481} {"train_loss": -5.137547969818115, "global_step": 20214, "epoch": 481} {"train_loss": -5.3772196769714355, "global_step": 20215, "epoch": 481} {"train_loss": -5.424914836883545, "global_step": 20216, "epoch": 481} {"train_loss": -5.236761569976807, "global_step": 20217, "epoch": 481} {"train_loss": -5.397494316101074, "global_step": 20218, "epoch": 481} {"train_loss": -5.299941062927246, "global_step": 20219, "epoch": 481} {"train_loss": -5.338846683502197, "global_step": 20220, "epoch": 481} {"train_loss": -5.303302764892578, "global_step": 20221, "epoch": 481} {"train_loss": -5.272812366485596, "global_step": 20222, "epoch": 481} {"train_loss": -5.282439231872559, "global_step": 20223, "epoch": 481} {"train_loss": -5.128140449523926, "global_step": 20224, "epoch": 481} {"train_loss": -5.2080979347229, "global_step": 20225, "epoch": 481} {"train_loss": -5.446779251098633, "global_step": 20226, "epoch": 481} {"train_loss": -5.226171493530273, "global_step": 20227, "epoch": 481} {"train_loss": -5.194836616516113, "global_step": 20228, "epoch": 481} {"train_loss": -5.28039026260376, "global_step": 20229, "epoch": 481} {"train_loss": -5.293974876403809, "global_step": 20230, "epoch": 481} {"train_loss": -5.330449104309082, "global_step": 20231, "epoch": 481} {"train_loss": -5.284946441650391, "global_step": 20232, "epoch": 481} {"train_loss": -5.407413005828857, "global_step": 20233, "epoch": 481} {"train_loss": -5.3819379806518555, "global_step": 20234, "epoch": 481} {"train_loss": -5.301398277282715, "global_step": 20235, "epoch": 481} {"train_loss": -5.263920783996582, "global_step": 20236, "epoch": 481} {"train_loss": -5.423417091369629, "global_step": 20237, "epoch": 481} {"train_loss": -5.3590593338012695, "global_step": 20238, "epoch": 481} {"train_loss": -5.406615257263184, "global_step": 20239, "epoch": 481} {"train_loss": -5.262123107910156, "global_step": 20240, "epoch": 481} {"train_loss": -5.372413158416748, "global_step": 20241, "epoch": 481} {"train_loss": -5.30187463760376, "global_step": 20242, "epoch": 481} {"train_loss": -5.3203683240073065, "global_step": 20243, "epoch": 481, "val_loss": 68480.7109375} {"train_loss": -5.377676486968994, "global_step": 20244, "epoch": 482} {"train_loss": -5.336391448974609, "global_step": 20245, "epoch": 482} {"train_loss": -5.203896999359131, "global_step": 20246, "epoch": 482} {"train_loss": -5.376619338989258, "global_step": 20247, "epoch": 482} {"train_loss": -5.366866111755371, "global_step": 20248, "epoch": 482} {"train_loss": -5.338983535766602, "global_step": 20249, "epoch": 482} {"train_loss": -5.335596084594727, "global_step": 20250, "epoch": 482} {"train_loss": -5.3980607986450195, "global_step": 20251, "epoch": 482} {"train_loss": -5.1691389083862305, "global_step": 20252, "epoch": 482} {"train_loss": -5.227715969085693, "global_step": 20253, "epoch": 482} {"train_loss": -5.443352222442627, "global_step": 20254, "epoch": 482} {"train_loss": -5.254310607910156, "global_step": 20255, "epoch": 482} {"train_loss": -5.323667526245117, "global_step": 20256, "epoch": 482} {"train_loss": -5.235297679901123, "global_step": 20257, "epoch": 482} {"train_loss": -5.37905216217041, "global_step": 20258, "epoch": 482} {"train_loss": -5.390748023986816, "global_step": 20259, "epoch": 482} {"train_loss": -5.361550807952881, "global_step": 20260, "epoch": 482} {"train_loss": -5.197292804718018, "global_step": 20261, "epoch": 482} {"train_loss": -5.415605545043945, "global_step": 20262, "epoch": 482} {"train_loss": -5.3577094078063965, "global_step": 20263, "epoch": 482} {"train_loss": -5.338085174560547, "global_step": 20264, "epoch": 482} {"train_loss": -5.208121299743652, "global_step": 20265, "epoch": 482} {"train_loss": -5.245392799377441, "global_step": 20266, "epoch": 482} {"train_loss": -5.199545860290527, "global_step": 20267, "epoch": 482} {"train_loss": -5.29849910736084, "global_step": 20268, "epoch": 482} {"train_loss": -5.247977256774902, "global_step": 20269, "epoch": 482} {"train_loss": -5.326011657714844, "global_step": 20270, "epoch": 482} {"train_loss": -5.355256080627441, "global_step": 20271, "epoch": 482} {"train_loss": -5.235694885253906, "global_step": 20272, "epoch": 482} {"train_loss": -5.346824645996094, "global_step": 20273, "epoch": 482} {"train_loss": -5.327149391174316, "global_step": 20274, "epoch": 482} {"train_loss": -5.437873840332031, "global_step": 20275, "epoch": 482} {"train_loss": -5.254798889160156, "global_step": 20276, "epoch": 482} {"train_loss": -5.356758117675781, "global_step": 20277, "epoch": 482} {"train_loss": -5.441493511199951, "global_step": 20278, "epoch": 482} {"train_loss": -5.180695533752441, "global_step": 20279, "epoch": 482} {"train_loss": -5.317470073699951, "global_step": 20280, "epoch": 482} {"train_loss": -5.339160919189453, "global_step": 20281, "epoch": 482} {"train_loss": -5.369327545166016, "global_step": 20282, "epoch": 482} {"train_loss": -5.397173881530762, "global_step": 20283, "epoch": 482} {"train_loss": -5.35184383392334, "global_step": 20284, "epoch": 482} {"train_loss": -5.317308607555571, "global_step": 20285, "epoch": 482, "val_loss": 69114.890625} {"train_loss": -5.437604904174805, "global_step": 20286, "epoch": 483} {"train_loss": -5.382612705230713, "global_step": 20287, "epoch": 483} {"train_loss": -5.38136100769043, "global_step": 20288, "epoch": 483} {"train_loss": -5.337063789367676, "global_step": 20289, "epoch": 483} {"train_loss": -5.252660274505615, "global_step": 20290, "epoch": 483} {"train_loss": -5.19108772277832, "global_step": 20291, "epoch": 483} {"train_loss": -5.396822929382324, "global_step": 20292, "epoch": 483} {"train_loss": -5.174743175506592, "global_step": 20293, "epoch": 483} {"train_loss": -5.346174240112305, "global_step": 20294, "epoch": 483} {"train_loss": -5.285668849945068, "global_step": 20295, "epoch": 483} {"train_loss": -5.294647693634033, "global_step": 20296, "epoch": 483} {"train_loss": -5.2613525390625, "global_step": 20297, "epoch": 483} {"train_loss": -5.393282890319824, "global_step": 20298, "epoch": 483} {"train_loss": -5.3545050621032715, "global_step": 20299, "epoch": 483} {"train_loss": -5.224164009094238, "global_step": 20300, "epoch": 483} {"train_loss": -5.352839946746826, "global_step": 20301, "epoch": 483} {"train_loss": -5.2787957191467285, "global_step": 20302, "epoch": 483} {"train_loss": -5.448455333709717, "global_step": 20303, "epoch": 483} {"train_loss": -5.367546558380127, "global_step": 20304, "epoch": 483} {"train_loss": -5.3681321144104, "global_step": 20305, "epoch": 483} {"train_loss": -5.242921829223633, "global_step": 20306, "epoch": 483} {"train_loss": -5.275007724761963, "global_step": 20307, "epoch": 483} {"train_loss": -5.389639854431152, "global_step": 20308, "epoch": 483} {"train_loss": -5.1894755363464355, "global_step": 20309, "epoch": 483} {"train_loss": -5.278357982635498, "global_step": 20310, "epoch": 483} {"train_loss": -5.401912689208984, "global_step": 20311, "epoch": 483} {"train_loss": -5.316131114959717, "global_step": 20312, "epoch": 483} {"train_loss": -5.2630414962768555, "global_step": 20313, "epoch": 483} {"train_loss": -5.157271385192871, "global_step": 20314, "epoch": 483} {"train_loss": -5.264314651489258, "global_step": 20315, "epoch": 483} {"train_loss": -5.37662410736084, "global_step": 20316, "epoch": 483} {"train_loss": -5.412976264953613, "global_step": 20317, "epoch": 483} {"train_loss": -5.157949447631836, "global_step": 20318, "epoch": 483} {"train_loss": -5.3046159744262695, "global_step": 20319, "epoch": 483} {"train_loss": -5.154283046722412, "global_step": 20320, "epoch": 483} {"train_loss": -5.286998748779297, "global_step": 20321, "epoch": 483} {"train_loss": -5.379651069641113, "global_step": 20322, "epoch": 483} {"train_loss": -5.236137390136719, "global_step": 20323, "epoch": 483} {"train_loss": -5.319989204406738, "global_step": 20324, "epoch": 483} {"train_loss": -5.26353120803833, "global_step": 20325, "epoch": 483} {"train_loss": -5.261133670806885, "global_step": 20326, "epoch": 483} {"train_loss": -5.305027405420939, "global_step": 20327, "epoch": 483, "val_loss": 68806.9921875} {"train_loss": -5.325750827789307, "global_step": 20328, "epoch": 484} {"train_loss": -5.421665668487549, "global_step": 20329, "epoch": 484} {"train_loss": -5.304690837860107, "global_step": 20330, "epoch": 484} {"train_loss": -5.379069805145264, "global_step": 20331, "epoch": 484} {"train_loss": -5.32103157043457, "global_step": 20332, "epoch": 484} {"train_loss": -5.372555732727051, "global_step": 20333, "epoch": 484} {"train_loss": -5.344935417175293, "global_step": 20334, "epoch": 484} {"train_loss": -5.411772727966309, "global_step": 20335, "epoch": 484} {"train_loss": -5.378467559814453, "global_step": 20336, "epoch": 484} {"train_loss": -5.297647953033447, "global_step": 20337, "epoch": 484} {"train_loss": -5.300063133239746, "global_step": 20338, "epoch": 484} {"train_loss": -5.30247688293457, "global_step": 20339, "epoch": 484} {"train_loss": -5.317120552062988, "global_step": 20340, "epoch": 484} {"train_loss": -5.417670249938965, "global_step": 20341, "epoch": 484} {"train_loss": -5.37406587600708, "global_step": 20342, "epoch": 484} {"train_loss": -5.435125350952148, "global_step": 20343, "epoch": 484} {"train_loss": -5.3980512619018555, "global_step": 20344, "epoch": 484} {"train_loss": -5.394290924072266, "global_step": 20345, "epoch": 484} {"train_loss": -5.346052169799805, "global_step": 20346, "epoch": 484} {"train_loss": -5.315516471862793, "global_step": 20347, "epoch": 484} {"train_loss": -5.399738311767578, "global_step": 20348, "epoch": 484} {"train_loss": -5.342658042907715, "global_step": 20349, "epoch": 484} {"train_loss": -5.272584915161133, "global_step": 20350, "epoch": 484} {"train_loss": -5.1470232009887695, "global_step": 20351, "epoch": 484} {"train_loss": -5.291709899902344, "global_step": 20352, "epoch": 484} {"train_loss": -5.141699314117432, "global_step": 20353, "epoch": 484} {"train_loss": -5.377060890197754, "global_step": 20354, "epoch": 484} {"train_loss": -5.421699523925781, "global_step": 20355, "epoch": 484} {"train_loss": -5.31088924407959, "global_step": 20356, "epoch": 484} {"train_loss": -5.246525287628174, "global_step": 20357, "epoch": 484} {"train_loss": -5.340253829956055, "global_step": 20358, "epoch": 484} {"train_loss": -5.2732696533203125, "global_step": 20359, "epoch": 484} {"train_loss": -5.2197957038879395, "global_step": 20360, "epoch": 484} {"train_loss": -5.193458557128906, "global_step": 20361, "epoch": 484} {"train_loss": -5.328888893127441, "global_step": 20362, "epoch": 484} {"train_loss": -5.236312389373779, "global_step": 20363, "epoch": 484} {"train_loss": -5.382101058959961, "global_step": 20364, "epoch": 484} {"train_loss": -5.395230293273926, "global_step": 20365, "epoch": 484} {"train_loss": -5.22504997253418, "global_step": 20366, "epoch": 484} {"train_loss": -5.254376411437988, "global_step": 20367, "epoch": 484} {"train_loss": -5.177757263183594, "global_step": 20368, "epoch": 484} {"train_loss": -5.319099426269531, "global_step": 20369, "epoch": 484, "val_loss": 68775.109375} {"train_loss": -5.415801048278809, "global_step": 20370, "epoch": 485} {"train_loss": -5.343152046203613, "global_step": 20371, "epoch": 485} {"train_loss": -5.2926106452941895, "global_step": 20372, "epoch": 485} {"train_loss": -5.375823974609375, "global_step": 20373, "epoch": 485} {"train_loss": -5.307244300842285, "global_step": 20374, "epoch": 485} {"train_loss": -5.296944618225098, "global_step": 20375, "epoch": 485} {"train_loss": -5.305915832519531, "global_step": 20376, "epoch": 485} {"train_loss": -5.1133928298950195, "global_step": 20377, "epoch": 485} {"train_loss": -5.290555953979492, "global_step": 20378, "epoch": 485} {"train_loss": -5.339871406555176, "global_step": 20379, "epoch": 485} {"train_loss": -5.154257774353027, "global_step": 20380, "epoch": 485} {"train_loss": -5.421784400939941, "global_step": 20381, "epoch": 485} {"train_loss": -5.431551933288574, "global_step": 20382, "epoch": 485} {"train_loss": -5.1066789627075195, "global_step": 20383, "epoch": 485} {"train_loss": -5.404736518859863, "global_step": 20384, "epoch": 485} {"train_loss": -5.187376499176025, "global_step": 20385, "epoch": 485} {"train_loss": -5.224166393280029, "global_step": 20386, "epoch": 485} {"train_loss": -5.214564323425293, "global_step": 20387, "epoch": 485} {"train_loss": -5.231066703796387, "global_step": 20388, "epoch": 485} {"train_loss": -5.204693794250488, "global_step": 20389, "epoch": 485} {"train_loss": -5.222336769104004, "global_step": 20390, "epoch": 485} {"train_loss": -5.462414741516113, "global_step": 20391, "epoch": 485} {"train_loss": -5.255376815795898, "global_step": 20392, "epoch": 485} {"train_loss": -5.34478759765625, "global_step": 20393, "epoch": 485} {"train_loss": -5.326510429382324, "global_step": 20394, "epoch": 485} {"train_loss": -5.263113498687744, "global_step": 20395, "epoch": 485} {"train_loss": -5.246575355529785, "global_step": 20396, "epoch": 485} {"train_loss": -5.343636512756348, "global_step": 20397, "epoch": 485} {"train_loss": -5.324956893920898, "global_step": 20398, "epoch": 485} {"train_loss": -5.403565406799316, "global_step": 20399, "epoch": 485} {"train_loss": -5.302538871765137, "global_step": 20400, "epoch": 485} {"train_loss": -5.372570991516113, "global_step": 20401, "epoch": 485} {"train_loss": -5.320498466491699, "global_step": 20402, "epoch": 485} {"train_loss": -5.2915778160095215, "global_step": 20403, "epoch": 485} {"train_loss": -5.323109149932861, "global_step": 20404, "epoch": 485} {"train_loss": -5.39272403717041, "global_step": 20405, "epoch": 485} {"train_loss": -5.465362071990967, "global_step": 20406, "epoch": 485} {"train_loss": -5.23294734954834, "global_step": 20407, "epoch": 485} {"train_loss": -5.2104902267456055, "global_step": 20408, "epoch": 485} {"train_loss": -5.34901762008667, "global_step": 20409, "epoch": 485} {"train_loss": -5.244996070861816, "global_step": 20410, "epoch": 485} {"train_loss": -5.299148457390921, "global_step": 20411, "epoch": 485, "val_loss": 70114.2265625} {"train_loss": -5.1756815910339355, "global_step": 20412, "epoch": 486} {"train_loss": -5.277524471282959, "global_step": 20413, "epoch": 486} {"train_loss": -5.398164749145508, "global_step": 20414, "epoch": 486} {"train_loss": -5.284218788146973, "global_step": 20415, "epoch": 486} {"train_loss": -5.2742109298706055, "global_step": 20416, "epoch": 486} {"train_loss": -5.3675923347473145, "global_step": 20417, "epoch": 486} {"train_loss": -5.292741775512695, "global_step": 20418, "epoch": 486} {"train_loss": -5.225083351135254, "global_step": 20419, "epoch": 486} {"train_loss": -5.408764839172363, "global_step": 20420, "epoch": 486} {"train_loss": -5.426796913146973, "global_step": 20421, "epoch": 486} {"train_loss": -5.185446739196777, "global_step": 20422, "epoch": 486} {"train_loss": -5.315958499908447, "global_step": 20423, "epoch": 486} {"train_loss": -5.1852545738220215, "global_step": 20424, "epoch": 486} {"train_loss": -5.207007884979248, "global_step": 20425, "epoch": 486} {"train_loss": -5.303378105163574, "global_step": 20426, "epoch": 486} {"train_loss": -5.2440056800842285, "global_step": 20427, "epoch": 486} {"train_loss": -5.223721027374268, "global_step": 20428, "epoch": 486} {"train_loss": -5.350324630737305, "global_step": 20429, "epoch": 486} {"train_loss": -5.331310272216797, "global_step": 20430, "epoch": 486} {"train_loss": -5.248475074768066, "global_step": 20431, "epoch": 486} {"train_loss": -5.317379951477051, "global_step": 20432, "epoch": 486} {"train_loss": -5.410428047180176, "global_step": 20433, "epoch": 486} {"train_loss": -5.357897758483887, "global_step": 20434, "epoch": 486} {"train_loss": -5.36821985244751, "global_step": 20435, "epoch": 486} {"train_loss": -5.435612678527832, "global_step": 20436, "epoch": 486} {"train_loss": -5.3910441398620605, "global_step": 20437, "epoch": 486} {"train_loss": -5.348969459533691, "global_step": 20438, "epoch": 486} {"train_loss": -5.4111247062683105, "global_step": 20439, "epoch": 486} {"train_loss": -5.300013065338135, "global_step": 20440, "epoch": 486} {"train_loss": -5.324962139129639, "global_step": 20441, "epoch": 486} {"train_loss": -5.285717010498047, "global_step": 20442, "epoch": 486} {"train_loss": -5.280950546264648, "global_step": 20443, "epoch": 486} {"train_loss": -5.316353797912598, "global_step": 20444, "epoch": 486} {"train_loss": -5.329213619232178, "global_step": 20445, "epoch": 486} {"train_loss": -5.202085494995117, "global_step": 20446, "epoch": 486} {"train_loss": -5.452325344085693, "global_step": 20447, "epoch": 486} {"train_loss": -5.444143295288086, "global_step": 20448, "epoch": 486} {"train_loss": -5.332114219665527, "global_step": 20449, "epoch": 486} {"train_loss": -5.30790376663208, "global_step": 20450, "epoch": 486} {"train_loss": -5.252219200134277, "global_step": 20451, "epoch": 486} {"train_loss": -5.285147190093994, "global_step": 20452, "epoch": 486} {"train_loss": -5.314412173770723, "global_step": 20453, "epoch": 486, "val_loss": 68438.28125} {"train_loss": -5.381443977355957, "global_step": 20454, "epoch": 487} {"train_loss": -5.260311126708984, "global_step": 20455, "epoch": 487} {"train_loss": -5.327392578125, "global_step": 20456, "epoch": 487} {"train_loss": -5.383908271789551, "global_step": 20457, "epoch": 487} {"train_loss": -5.190516948699951, "global_step": 20458, "epoch": 487} {"train_loss": -5.407805442810059, "global_step": 20459, "epoch": 487} {"train_loss": -5.445311546325684, "global_step": 20460, "epoch": 487} {"train_loss": -5.3550639152526855, "global_step": 20461, "epoch": 487} {"train_loss": -5.328333377838135, "global_step": 20462, "epoch": 487} {"train_loss": -5.379664421081543, "global_step": 20463, "epoch": 487} {"train_loss": -5.360806465148926, "global_step": 20464, "epoch": 487} {"train_loss": -5.368589401245117, "global_step": 20465, "epoch": 487} {"train_loss": -5.393391132354736, "global_step": 20466, "epoch": 487} {"train_loss": -5.374972343444824, "global_step": 20467, "epoch": 487} {"train_loss": -5.264337539672852, "global_step": 20468, "epoch": 487} {"train_loss": -5.350054740905762, "global_step": 20469, "epoch": 487} {"train_loss": -5.231090545654297, "global_step": 20470, "epoch": 487} {"train_loss": -5.3007612228393555, "global_step": 20471, "epoch": 487} {"train_loss": -5.315066337585449, "global_step": 20472, "epoch": 487} {"train_loss": -5.455658912658691, "global_step": 20473, "epoch": 487} {"train_loss": -5.303911209106445, "global_step": 20474, "epoch": 487} {"train_loss": -5.219198226928711, "global_step": 20475, "epoch": 487} {"train_loss": -5.335574150085449, "global_step": 20476, "epoch": 487} {"train_loss": -5.129680156707764, "global_step": 20477, "epoch": 487} {"train_loss": -5.344762802124023, "global_step": 20478, "epoch": 487} {"train_loss": -5.297752857208252, "global_step": 20479, "epoch": 487} {"train_loss": -5.400556564331055, "global_step": 20480, "epoch": 487} {"train_loss": -5.2742390632629395, "global_step": 20481, "epoch": 487} {"train_loss": -5.210474967956543, "global_step": 20482, "epoch": 487} {"train_loss": -5.304838180541992, "global_step": 20483, "epoch": 487} {"train_loss": -5.335268020629883, "global_step": 20484, "epoch": 487} {"train_loss": -5.3911662101745605, "global_step": 20485, "epoch": 487} {"train_loss": -5.403364181518555, "global_step": 20486, "epoch": 487} {"train_loss": -5.413095951080322, "global_step": 20487, "epoch": 487} {"train_loss": -5.574886798858643, "global_step": 20488, "epoch": 487} {"train_loss": -5.28959846496582, "global_step": 20489, "epoch": 487} {"train_loss": -5.409680366516113, "global_step": 20490, "epoch": 487} {"train_loss": -5.271675109863281, "global_step": 20491, "epoch": 487} {"train_loss": -5.344261169433594, "global_step": 20492, "epoch": 487} {"train_loss": -5.222692489624023, "global_step": 20493, "epoch": 487} {"train_loss": -5.463738441467285, "global_step": 20494, "epoch": 487} {"train_loss": -5.334427413486299, "global_step": 20495, "epoch": 487, "val_loss": 68699.1953125} {"train_loss": -5.327159404754639, "global_step": 20496, "epoch": 488} {"train_loss": -5.1601152420043945, "global_step": 20497, "epoch": 488} {"train_loss": -5.248676300048828, "global_step": 20498, "epoch": 488} {"train_loss": -5.302752494812012, "global_step": 20499, "epoch": 488} {"train_loss": -5.444093227386475, "global_step": 20500, "epoch": 488} {"train_loss": -5.487412452697754, "global_step": 20501, "epoch": 488} {"train_loss": -5.252241611480713, "global_step": 20502, "epoch": 488} {"train_loss": -5.387027740478516, "global_step": 20503, "epoch": 488} {"train_loss": -5.286409378051758, "global_step": 20504, "epoch": 488} {"train_loss": -5.242796897888184, "global_step": 20505, "epoch": 488} {"train_loss": -5.2583489418029785, "global_step": 20506, "epoch": 488} {"train_loss": -5.464144706726074, "global_step": 20507, "epoch": 488} {"train_loss": -5.271350383758545, "global_step": 20508, "epoch": 488} {"train_loss": -5.209752082824707, "global_step": 20509, "epoch": 488} {"train_loss": -5.487949371337891, "global_step": 20510, "epoch": 488} {"train_loss": -5.280779838562012, "global_step": 20511, "epoch": 488} {"train_loss": -5.4302978515625, "global_step": 20512, "epoch": 488} {"train_loss": -5.32654333114624, "global_step": 20513, "epoch": 488} {"train_loss": -5.395845890045166, "global_step": 20514, "epoch": 488} {"train_loss": -5.32711124420166, "global_step": 20515, "epoch": 488} {"train_loss": -5.254288196563721, "global_step": 20516, "epoch": 488} {"train_loss": -5.393782615661621, "global_step": 20517, "epoch": 488} {"train_loss": -5.343525409698486, "global_step": 20518, "epoch": 488} {"train_loss": -5.305934906005859, "global_step": 20519, "epoch": 488} {"train_loss": -5.325481414794922, "global_step": 20520, "epoch": 488} {"train_loss": -5.329419136047363, "global_step": 20521, "epoch": 488} {"train_loss": -5.308404922485352, "global_step": 20522, "epoch": 488} {"train_loss": -5.3553876876831055, "global_step": 20523, "epoch": 488} {"train_loss": -5.282849311828613, "global_step": 20524, "epoch": 488} {"train_loss": -5.381740570068359, "global_step": 20525, "epoch": 488} {"train_loss": -5.19822883605957, "global_step": 20526, "epoch": 488} {"train_loss": -5.396998405456543, "global_step": 20527, "epoch": 488} {"train_loss": -5.410837650299072, "global_step": 20528, "epoch": 488} {"train_loss": -5.180258750915527, "global_step": 20529, "epoch": 488} {"train_loss": -5.260663986206055, "global_step": 20530, "epoch": 488} {"train_loss": -5.444475173950195, "global_step": 20531, "epoch": 488} {"train_loss": -5.323003768920898, "global_step": 20532, "epoch": 488} {"train_loss": -5.370316028594971, "global_step": 20533, "epoch": 488} {"train_loss": -5.373115062713623, "global_step": 20534, "epoch": 488} {"train_loss": -5.29510498046875, "global_step": 20535, "epoch": 488} {"train_loss": -5.373471260070801, "global_step": 20536, "epoch": 488} {"train_loss": -5.33209965342567, "global_step": 20537, "epoch": 488, "val_loss": 68793.328125} {"train_loss": -5.4864912033081055, "global_step": 20538, "epoch": 489} {"train_loss": -5.233518600463867, "global_step": 20539, "epoch": 489} {"train_loss": -5.253155708312988, "global_step": 20540, "epoch": 489} {"train_loss": -5.31453800201416, "global_step": 20541, "epoch": 489} {"train_loss": -5.311404705047607, "global_step": 20542, "epoch": 489} {"train_loss": -5.311910152435303, "global_step": 20543, "epoch": 489} {"train_loss": -5.412270545959473, "global_step": 20544, "epoch": 489} {"train_loss": -5.373699188232422, "global_step": 20545, "epoch": 489} {"train_loss": -5.369023323059082, "global_step": 20546, "epoch": 489} {"train_loss": -5.2941083908081055, "global_step": 20547, "epoch": 489} {"train_loss": -5.241422653198242, "global_step": 20548, "epoch": 489} {"train_loss": -5.386791229248047, "global_step": 20549, "epoch": 489} {"train_loss": -5.393670082092285, "global_step": 20550, "epoch": 489} {"train_loss": -5.310800552368164, "global_step": 20551, "epoch": 489} {"train_loss": -5.459783554077148, "global_step": 20552, "epoch": 489} {"train_loss": -5.224555969238281, "global_step": 20553, "epoch": 489} {"train_loss": -5.39954137802124, "global_step": 20554, "epoch": 489} {"train_loss": -5.327004432678223, "global_step": 20555, "epoch": 489} {"train_loss": -5.323561191558838, "global_step": 20556, "epoch": 489} {"train_loss": -5.370593070983887, "global_step": 20557, "epoch": 489} {"train_loss": -5.336695194244385, "global_step": 20558, "epoch": 489} {"train_loss": -5.43437385559082, "global_step": 20559, "epoch": 489} {"train_loss": -5.352218151092529, "global_step": 20560, "epoch": 489} {"train_loss": -5.119194030761719, "global_step": 20561, "epoch": 489} {"train_loss": -5.315867900848389, "global_step": 20562, "epoch": 489} {"train_loss": -5.193732261657715, "global_step": 20563, "epoch": 489} {"train_loss": -5.26915979385376, "global_step": 20564, "epoch": 489} {"train_loss": -5.336727142333984, "global_step": 20565, "epoch": 489} {"train_loss": -5.281381607055664, "global_step": 20566, "epoch": 489} {"train_loss": -5.089974880218506, "global_step": 20567, "epoch": 489} {"train_loss": -5.285558700561523, "global_step": 20568, "epoch": 489} {"train_loss": -5.095726013183594, "global_step": 20569, "epoch": 489} {"train_loss": -5.294668197631836, "global_step": 20570, "epoch": 489} {"train_loss": -5.501453399658203, "global_step": 20571, "epoch": 489} {"train_loss": -5.352396488189697, "global_step": 20572, "epoch": 489} {"train_loss": -5.2875823974609375, "global_step": 20573, "epoch": 489} {"train_loss": -5.4486799240112305, "global_step": 20574, "epoch": 489} {"train_loss": -5.311191558837891, "global_step": 20575, "epoch": 489} {"train_loss": -5.29078483581543, "global_step": 20576, "epoch": 489} {"train_loss": -5.335407257080078, "global_step": 20577, "epoch": 489} {"train_loss": -5.252546787261963, "global_step": 20578, "epoch": 489} {"train_loss": -5.319060439155216, "global_step": 20579, "epoch": 489, "val_loss": 69467.7421875} {"train_loss": -5.3832244873046875, "global_step": 20580, "epoch": 490} {"train_loss": -5.358133792877197, "global_step": 20581, "epoch": 490} {"train_loss": -5.286408424377441, "global_step": 20582, "epoch": 490} {"train_loss": -5.338134288787842, "global_step": 20583, "epoch": 490} {"train_loss": -5.344440460205078, "global_step": 20584, "epoch": 490} {"train_loss": -5.429296493530273, "global_step": 20585, "epoch": 490} {"train_loss": -5.1692938804626465, "global_step": 20586, "epoch": 490} {"train_loss": -5.351811408996582, "global_step": 20587, "epoch": 490} {"train_loss": -5.43837833404541, "global_step": 20588, "epoch": 490} {"train_loss": -5.198089599609375, "global_step": 20589, "epoch": 490} {"train_loss": -5.414462089538574, "global_step": 20590, "epoch": 490} {"train_loss": -5.315752983093262, "global_step": 20591, "epoch": 490} {"train_loss": -5.317363262176514, "global_step": 20592, "epoch": 490} {"train_loss": -5.284829139709473, "global_step": 20593, "epoch": 490} {"train_loss": -5.28294038772583, "global_step": 20594, "epoch": 490} {"train_loss": -5.242671012878418, "global_step": 20595, "epoch": 490} {"train_loss": -5.223998069763184, "global_step": 20596, "epoch": 490} {"train_loss": -5.300136566162109, "global_step": 20597, "epoch": 490} {"train_loss": -5.336147308349609, "global_step": 20598, "epoch": 490} {"train_loss": -5.3566436767578125, "global_step": 20599, "epoch": 490} {"train_loss": -5.2731242179870605, "global_step": 20600, "epoch": 490} {"train_loss": -5.209022521972656, "global_step": 20601, "epoch": 490} {"train_loss": -5.283632278442383, "global_step": 20602, "epoch": 490} {"train_loss": -5.25860595703125, "global_step": 20603, "epoch": 490} {"train_loss": -5.218148708343506, "global_step": 20604, "epoch": 490} {"train_loss": -5.238011360168457, "global_step": 20605, "epoch": 490} {"train_loss": -5.320522308349609, "global_step": 20606, "epoch": 490} {"train_loss": -5.194853782653809, "global_step": 20607, "epoch": 490} {"train_loss": -5.305629730224609, "global_step": 20608, "epoch": 490} {"train_loss": -5.227210998535156, "global_step": 20609, "epoch": 490} {"train_loss": -5.2175164222717285, "global_step": 20610, "epoch": 490} {"train_loss": -5.138530731201172, "global_step": 20611, "epoch": 490} {"train_loss": -5.293020248413086, "global_step": 20612, "epoch": 490} {"train_loss": -5.046571254730225, "global_step": 20613, "epoch": 490} {"train_loss": -5.332563400268555, "global_step": 20614, "epoch": 490} {"train_loss": -5.197699546813965, "global_step": 20615, "epoch": 490} {"train_loss": -5.2447509765625, "global_step": 20616, "epoch": 490} {"train_loss": -5.245203495025635, "global_step": 20617, "epoch": 490} {"train_loss": -5.322772026062012, "global_step": 20618, "epoch": 490} {"train_loss": -5.202061653137207, "global_step": 20619, "epoch": 490} {"train_loss": -5.412700653076172, "global_step": 20620, "epoch": 490} {"train_loss": -5.280732586270287, "global_step": 20621, "epoch": 490, "val_loss": 68438.8515625} {"train_loss": -5.337541580200195, "global_step": 20622, "epoch": 491} {"train_loss": -5.343366622924805, "global_step": 20623, "epoch": 491} {"train_loss": -5.307183265686035, "global_step": 20624, "epoch": 491} {"train_loss": -5.301802158355713, "global_step": 20625, "epoch": 491} {"train_loss": -5.391695022583008, "global_step": 20626, "epoch": 491} {"train_loss": -5.331844806671143, "global_step": 20627, "epoch": 491} {"train_loss": -5.378554344177246, "global_step": 20628, "epoch": 491} {"train_loss": -5.317529678344727, "global_step": 20629, "epoch": 491} {"train_loss": -5.363700866699219, "global_step": 20630, "epoch": 491} {"train_loss": -5.307338714599609, "global_step": 20631, "epoch": 491} {"train_loss": -5.361576080322266, "global_step": 20632, "epoch": 491} {"train_loss": -5.243938446044922, "global_step": 20633, "epoch": 491} {"train_loss": -5.294011116027832, "global_step": 20634, "epoch": 491} {"train_loss": -5.487677097320557, "global_step": 20635, "epoch": 491} {"train_loss": -5.345391273498535, "global_step": 20636, "epoch": 491} {"train_loss": -5.408891677856445, "global_step": 20637, "epoch": 491} {"train_loss": -5.27647590637207, "global_step": 20638, "epoch": 491} {"train_loss": -5.349554061889648, "global_step": 20639, "epoch": 491} {"train_loss": -5.403955459594727, "global_step": 20640, "epoch": 491} {"train_loss": -5.3729753494262695, "global_step": 20641, "epoch": 491} {"train_loss": -5.3413896560668945, "global_step": 20642, "epoch": 491} {"train_loss": -5.2992401123046875, "global_step": 20643, "epoch": 491} {"train_loss": -5.2877726554870605, "global_step": 20644, "epoch": 491} {"train_loss": -5.173108100891113, "global_step": 20645, "epoch": 491} {"train_loss": -5.427850246429443, "global_step": 20646, "epoch": 491} {"train_loss": -5.22653865814209, "global_step": 20647, "epoch": 491} {"train_loss": -5.417219161987305, "global_step": 20648, "epoch": 491} {"train_loss": -5.416184902191162, "global_step": 20649, "epoch": 491} {"train_loss": -5.412263870239258, "global_step": 20650, "epoch": 491} {"train_loss": -5.294768333435059, "global_step": 20651, "epoch": 491} {"train_loss": -5.2608232498168945, "global_step": 20652, "epoch": 491} {"train_loss": -5.2557477951049805, "global_step": 20653, "epoch": 491} {"train_loss": -5.281123638153076, "global_step": 20654, "epoch": 491} {"train_loss": -5.077079772949219, "global_step": 20655, "epoch": 491} {"train_loss": -5.353569030761719, "global_step": 20656, "epoch": 491} {"train_loss": -5.341329574584961, "global_step": 20657, "epoch": 491} {"train_loss": -5.3635663986206055, "global_step": 20658, "epoch": 491} {"train_loss": -5.3473615646362305, "global_step": 20659, "epoch": 491} {"train_loss": -5.243551254272461, "global_step": 20660, "epoch": 491} {"train_loss": -5.2512311935424805, "global_step": 20661, "epoch": 491} {"train_loss": -5.381527423858643, "global_step": 20662, "epoch": 491} {"train_loss": -5.325253180095127, "global_step": 20663, "epoch": 491, "val_loss": 68601.4453125} {"train_loss": -5.2247633934021, "global_step": 20664, "epoch": 492} {"train_loss": -5.248920917510986, "global_step": 20665, "epoch": 492} {"train_loss": -5.313043594360352, "global_step": 20666, "epoch": 492} {"train_loss": -5.193992614746094, "global_step": 20667, "epoch": 492} {"train_loss": -5.346086502075195, "global_step": 20668, "epoch": 492} {"train_loss": -5.180635452270508, "global_step": 20669, "epoch": 492} {"train_loss": -5.337945461273193, "global_step": 20670, "epoch": 492} {"train_loss": -5.32230806350708, "global_step": 20671, "epoch": 492} {"train_loss": -5.305505275726318, "global_step": 20672, "epoch": 492} {"train_loss": -5.354848384857178, "global_step": 20673, "epoch": 492} {"train_loss": -5.28913688659668, "global_step": 20674, "epoch": 492} {"train_loss": -5.252993583679199, "global_step": 20675, "epoch": 492} {"train_loss": -5.299350261688232, "global_step": 20676, "epoch": 492} {"train_loss": -5.387036323547363, "global_step": 20677, "epoch": 492} {"train_loss": -5.359415531158447, "global_step": 20678, "epoch": 492} {"train_loss": -5.40427303314209, "global_step": 20679, "epoch": 492} {"train_loss": -5.401885509490967, "global_step": 20680, "epoch": 492} {"train_loss": -5.3044586181640625, "global_step": 20681, "epoch": 492} {"train_loss": -5.338703155517578, "global_step": 20682, "epoch": 492} {"train_loss": -5.414669036865234, "global_step": 20683, "epoch": 492} {"train_loss": -5.265474796295166, "global_step": 20684, "epoch": 492} {"train_loss": -5.16813850402832, "global_step": 20685, "epoch": 492} {"train_loss": -5.256072998046875, "global_step": 20686, "epoch": 492} {"train_loss": -5.42123556137085, "global_step": 20687, "epoch": 492} {"train_loss": -5.357431411743164, "global_step": 20688, "epoch": 492} {"train_loss": -5.359450340270996, "global_step": 20689, "epoch": 492} {"train_loss": -5.245677947998047, "global_step": 20690, "epoch": 492} {"train_loss": -5.249615669250488, "global_step": 20691, "epoch": 492} {"train_loss": -5.3113837242126465, "global_step": 20692, "epoch": 492} {"train_loss": -5.136643409729004, "global_step": 20693, "epoch": 492} {"train_loss": -5.278677463531494, "global_step": 20694, "epoch": 492} {"train_loss": -5.152188301086426, "global_step": 20695, "epoch": 492} {"train_loss": -5.2647600173950195, "global_step": 20696, "epoch": 492} {"train_loss": -5.263270378112793, "global_step": 20697, "epoch": 492} {"train_loss": -5.187333106994629, "global_step": 20698, "epoch": 492} {"train_loss": -5.403883934020996, "global_step": 20699, "epoch": 492} {"train_loss": -5.210840225219727, "global_step": 20700, "epoch": 492} {"train_loss": -5.253108024597168, "global_step": 20701, "epoch": 492} {"train_loss": -5.175691604614258, "global_step": 20702, "epoch": 492} {"train_loss": -5.421548843383789, "global_step": 20703, "epoch": 492} {"train_loss": -5.201751708984375, "global_step": 20704, "epoch": 492} {"train_loss": -5.290525538580758, "global_step": 20705, "epoch": 492, "val_loss": 68977.7890625} {"train_loss": -5.235803604125977, "global_step": 20706, "epoch": 493} {"train_loss": -5.505170822143555, "global_step": 20707, "epoch": 493} {"train_loss": -5.350222110748291, "global_step": 20708, "epoch": 493} {"train_loss": -5.2325439453125, "global_step": 20709, "epoch": 493} {"train_loss": -5.380053520202637, "global_step": 20710, "epoch": 493} {"train_loss": -5.211159706115723, "global_step": 20711, "epoch": 493} {"train_loss": -5.242766380310059, "global_step": 20712, "epoch": 493} {"train_loss": -5.387686252593994, "global_step": 20713, "epoch": 493} {"train_loss": -5.266436576843262, "global_step": 20714, "epoch": 493} {"train_loss": -5.344672203063965, "global_step": 20715, "epoch": 493} {"train_loss": -5.214202404022217, "global_step": 20716, "epoch": 493} {"train_loss": -5.266535758972168, "global_step": 20717, "epoch": 493} {"train_loss": -5.349235534667969, "global_step": 20718, "epoch": 493} {"train_loss": -5.300321102142334, "global_step": 20719, "epoch": 493} {"train_loss": -5.229133605957031, "global_step": 20720, "epoch": 493} {"train_loss": -5.315983295440674, "global_step": 20721, "epoch": 493} {"train_loss": -5.179610729217529, "global_step": 20722, "epoch": 493} {"train_loss": -5.385028839111328, "global_step": 20723, "epoch": 493} {"train_loss": -5.412589073181152, "global_step": 20724, "epoch": 493} {"train_loss": -5.162755489349365, "global_step": 20725, "epoch": 493} {"train_loss": -5.21938419342041, "global_step": 20726, "epoch": 493} {"train_loss": -5.1387529373168945, "global_step": 20727, "epoch": 493} {"train_loss": -5.184028625488281, "global_step": 20728, "epoch": 493} {"train_loss": -5.236706256866455, "global_step": 20729, "epoch": 493} {"train_loss": -5.206949234008789, "global_step": 20730, "epoch": 493} {"train_loss": -5.32949161529541, "global_step": 20731, "epoch": 493} {"train_loss": -5.2807393074035645, "global_step": 20732, "epoch": 493} {"train_loss": -5.319363594055176, "global_step": 20733, "epoch": 493} {"train_loss": -5.297934532165527, "global_step": 20734, "epoch": 493} {"train_loss": -5.181937217712402, "global_step": 20735, "epoch": 493} {"train_loss": -5.303481101989746, "global_step": 20736, "epoch": 493} {"train_loss": -5.144350051879883, "global_step": 20737, "epoch": 493} {"train_loss": -5.184086799621582, "global_step": 20738, "epoch": 493} {"train_loss": -5.30556583404541, "global_step": 20739, "epoch": 493} {"train_loss": -5.310209274291992, "global_step": 20740, "epoch": 493} {"train_loss": -5.25659704208374, "global_step": 20741, "epoch": 493} {"train_loss": -5.1887030601501465, "global_step": 20742, "epoch": 493} {"train_loss": -5.330368518829346, "global_step": 20743, "epoch": 493} {"train_loss": -5.383711338043213, "global_step": 20744, "epoch": 493} {"train_loss": -5.160244941711426, "global_step": 20745, "epoch": 493} {"train_loss": -5.369687080383301, "global_step": 20746, "epoch": 493} {"train_loss": -5.275640907741728, "global_step": 20747, "epoch": 493, "val_loss": 69568.4296875} {"train_loss": -5.284323692321777, "global_step": 20748, "epoch": 494} {"train_loss": -5.466742992401123, "global_step": 20749, "epoch": 494} {"train_loss": -5.2315802574157715, "global_step": 20750, "epoch": 494} {"train_loss": -5.214886665344238, "global_step": 20751, "epoch": 494} {"train_loss": -5.314578056335449, "global_step": 20752, "epoch": 494} {"train_loss": -5.196649551391602, "global_step": 20753, "epoch": 494} {"train_loss": -5.281805515289307, "global_step": 20754, "epoch": 494} {"train_loss": -5.209529876708984, "global_step": 20755, "epoch": 494} {"train_loss": -5.244253158569336, "global_step": 20756, "epoch": 494} {"train_loss": -5.264681339263916, "global_step": 20757, "epoch": 494} {"train_loss": -5.259686470031738, "global_step": 20758, "epoch": 494} {"train_loss": -5.379172325134277, "global_step": 20759, "epoch": 494} {"train_loss": -5.328116416931152, "global_step": 20760, "epoch": 494} {"train_loss": -5.18952751159668, "global_step": 20761, "epoch": 494} {"train_loss": -5.321966171264648, "global_step": 20762, "epoch": 494} {"train_loss": -5.263672828674316, "global_step": 20763, "epoch": 494} {"train_loss": -5.381890773773193, "global_step": 20764, "epoch": 494} {"train_loss": -5.479040622711182, "global_step": 20765, "epoch": 494} {"train_loss": -5.423614501953125, "global_step": 20766, "epoch": 494} {"train_loss": -5.3475141525268555, "global_step": 20767, "epoch": 494} {"train_loss": -5.303084373474121, "global_step": 20768, "epoch": 494} {"train_loss": -5.326173782348633, "global_step": 20769, "epoch": 494} {"train_loss": -5.459285259246826, "global_step": 20770, "epoch": 494} {"train_loss": -5.379887580871582, "global_step": 20771, "epoch": 494} {"train_loss": -5.4285759925842285, "global_step": 20772, "epoch": 494} {"train_loss": -5.229832649230957, "global_step": 20773, "epoch": 494} {"train_loss": -5.373298168182373, "global_step": 20774, "epoch": 494} {"train_loss": -5.234755516052246, "global_step": 20775, "epoch": 494} {"train_loss": -5.374997138977051, "global_step": 20776, "epoch": 494} {"train_loss": -5.149960517883301, "global_step": 20777, "epoch": 494} {"train_loss": -5.456545352935791, "global_step": 20778, "epoch": 494} {"train_loss": -5.31832218170166, "global_step": 20779, "epoch": 494} {"train_loss": -5.1824541091918945, "global_step": 20780, "epoch": 494} {"train_loss": -5.254872798919678, "global_step": 20781, "epoch": 494} {"train_loss": -5.291896820068359, "global_step": 20782, "epoch": 494} {"train_loss": -5.309474945068359, "global_step": 20783, "epoch": 494} {"train_loss": -5.415703773498535, "global_step": 20784, "epoch": 494} {"train_loss": -5.300335884094238, "global_step": 20785, "epoch": 494} {"train_loss": -5.1806745529174805, "global_step": 20786, "epoch": 494} {"train_loss": -5.378266334533691, "global_step": 20787, "epoch": 494} {"train_loss": -5.386443614959717, "global_step": 20788, "epoch": 494} {"train_loss": -5.308849947793143, "global_step": 20789, "epoch": 494, "val_loss": 68637.1015625} {"train_loss": -5.250822067260742, "global_step": 20790, "epoch": 495} {"train_loss": -5.26792049407959, "global_step": 20791, "epoch": 495} {"train_loss": -5.288361549377441, "global_step": 20792, "epoch": 495} {"train_loss": -5.306702613830566, "global_step": 20793, "epoch": 495} {"train_loss": -5.281739711761475, "global_step": 20794, "epoch": 495} {"train_loss": -5.408379077911377, "global_step": 20795, "epoch": 495} {"train_loss": -5.462705612182617, "global_step": 20796, "epoch": 495} {"train_loss": -5.172047138214111, "global_step": 20797, "epoch": 495} {"train_loss": -5.390438079833984, "global_step": 20798, "epoch": 495} {"train_loss": -5.4190216064453125, "global_step": 20799, "epoch": 495} {"train_loss": -5.301308631896973, "global_step": 20800, "epoch": 495} {"train_loss": -5.415238380432129, "global_step": 20801, "epoch": 495} {"train_loss": -5.313488006591797, "global_step": 20802, "epoch": 495} {"train_loss": -5.344977855682373, "global_step": 20803, "epoch": 495} {"train_loss": -5.291733741760254, "global_step": 20804, "epoch": 495} {"train_loss": -5.308154106140137, "global_step": 20805, "epoch": 495} {"train_loss": -5.264068603515625, "global_step": 20806, "epoch": 495} {"train_loss": -5.526064872741699, "global_step": 20807, "epoch": 495} {"train_loss": -5.325049877166748, "global_step": 20808, "epoch": 495} {"train_loss": -5.401355266571045, "global_step": 20809, "epoch": 495} {"train_loss": -5.254444122314453, "global_step": 20810, "epoch": 495} {"train_loss": -5.354680061340332, "global_step": 20811, "epoch": 495} {"train_loss": -5.369482040405273, "global_step": 20812, "epoch": 495} {"train_loss": -5.1710968017578125, "global_step": 20813, "epoch": 495} {"train_loss": -5.262113571166992, "global_step": 20814, "epoch": 495} {"train_loss": -5.328007698059082, "global_step": 20815, "epoch": 495} {"train_loss": -5.48056697845459, "global_step": 20816, "epoch": 495} {"train_loss": -5.215316295623779, "global_step": 20817, "epoch": 495} {"train_loss": -5.3466997146606445, "global_step": 20818, "epoch": 495} {"train_loss": -5.417646408081055, "global_step": 20819, "epoch": 495} {"train_loss": -5.264923095703125, "global_step": 20820, "epoch": 495} {"train_loss": -5.394567489624023, "global_step": 20821, "epoch": 495} {"train_loss": -5.34822940826416, "global_step": 20822, "epoch": 495} {"train_loss": -5.274072170257568, "global_step": 20823, "epoch": 495} {"train_loss": -5.350475788116455, "global_step": 20824, "epoch": 495} {"train_loss": -5.214808940887451, "global_step": 20825, "epoch": 495} {"train_loss": -5.243927478790283, "global_step": 20826, "epoch": 495} {"train_loss": -5.262887477874756, "global_step": 20827, "epoch": 495} {"train_loss": -5.4132866859436035, "global_step": 20828, "epoch": 495} {"train_loss": -5.304131507873535, "global_step": 20829, "epoch": 495} {"train_loss": -5.441313743591309, "global_step": 20830, "epoch": 495} {"train_loss": -5.328739540917533, "global_step": 20831, "epoch": 495, "val_loss": 68846.875} {"train_loss": -5.33167839050293, "global_step": 20832, "epoch": 496} {"train_loss": -5.409974098205566, "global_step": 20833, "epoch": 496} {"train_loss": -5.2927937507629395, "global_step": 20834, "epoch": 496} {"train_loss": -5.324151039123535, "global_step": 20835, "epoch": 496} {"train_loss": -5.448327541351318, "global_step": 20836, "epoch": 496} {"train_loss": -5.2022504806518555, "global_step": 20837, "epoch": 496} {"train_loss": -5.398225784301758, "global_step": 20838, "epoch": 496} {"train_loss": -5.3103837966918945, "global_step": 20839, "epoch": 496} {"train_loss": -5.456307411193848, "global_step": 20840, "epoch": 496} {"train_loss": -5.189218997955322, "global_step": 20841, "epoch": 496} {"train_loss": -5.338351249694824, "global_step": 20842, "epoch": 496} {"train_loss": -5.260513782501221, "global_step": 20843, "epoch": 496} {"train_loss": -5.287609100341797, "global_step": 20844, "epoch": 496} {"train_loss": -5.357242584228516, "global_step": 20845, "epoch": 496} {"train_loss": -5.23942756652832, "global_step": 20846, "epoch": 496} {"train_loss": -5.177447319030762, "global_step": 20847, "epoch": 496} {"train_loss": -5.345980644226074, "global_step": 20848, "epoch": 496} {"train_loss": -5.131760597229004, "global_step": 20849, "epoch": 496} {"train_loss": -5.351821422576904, "global_step": 20850, "epoch": 496} {"train_loss": -5.294654369354248, "global_step": 20851, "epoch": 496} {"train_loss": -5.126553535461426, "global_step": 20852, "epoch": 496} {"train_loss": -5.262579917907715, "global_step": 20853, "epoch": 496} {"train_loss": -5.364047050476074, "global_step": 20854, "epoch": 496} {"train_loss": -5.396489143371582, "global_step": 20855, "epoch": 496} {"train_loss": -5.278384685516357, "global_step": 20856, "epoch": 496} {"train_loss": -5.346301078796387, "global_step": 20857, "epoch": 496} {"train_loss": -5.323698043823242, "global_step": 20858, "epoch": 496} {"train_loss": -5.3217668533325195, "global_step": 20859, "epoch": 496} {"train_loss": -5.486588478088379, "global_step": 20860, "epoch": 496} {"train_loss": -5.218646049499512, "global_step": 20861, "epoch": 496} {"train_loss": -5.343983173370361, "global_step": 20862, "epoch": 496} {"train_loss": -5.359606742858887, "global_step": 20863, "epoch": 496} {"train_loss": -5.397356986999512, "global_step": 20864, "epoch": 496} {"train_loss": -5.213920593261719, "global_step": 20865, "epoch": 496} {"train_loss": -5.337259292602539, "global_step": 20866, "epoch": 496} {"train_loss": -5.428806304931641, "global_step": 20867, "epoch": 496} {"train_loss": -5.36155891418457, "global_step": 20868, "epoch": 496} {"train_loss": -5.366772174835205, "global_step": 20869, "epoch": 496} {"train_loss": -5.39561128616333, "global_step": 20870, "epoch": 496} {"train_loss": -5.37088680267334, "global_step": 20871, "epoch": 496} {"train_loss": -5.405604362487793, "global_step": 20872, "epoch": 496} {"train_loss": -5.3231380099341985, "global_step": 20873, "epoch": 496, "val_loss": 68817.390625} {"train_loss": -5.476790428161621, "global_step": 20874, "epoch": 497} {"train_loss": -5.342433929443359, "global_step": 20875, "epoch": 497} {"train_loss": -5.387152671813965, "global_step": 20876, "epoch": 497} {"train_loss": -5.292712211608887, "global_step": 20877, "epoch": 497} {"train_loss": -5.3205342292785645, "global_step": 20878, "epoch": 497} {"train_loss": -5.375124931335449, "global_step": 20879, "epoch": 497} {"train_loss": -5.265275955200195, "global_step": 20880, "epoch": 497} {"train_loss": -5.319058418273926, "global_step": 20881, "epoch": 497} {"train_loss": -5.302875518798828, "global_step": 20882, "epoch": 497} {"train_loss": -5.444223880767822, "global_step": 20883, "epoch": 497} {"train_loss": -5.269097328186035, "global_step": 20884, "epoch": 497} {"train_loss": -5.317929267883301, "global_step": 20885, "epoch": 497} {"train_loss": -5.318912506103516, "global_step": 20886, "epoch": 497} {"train_loss": -5.247663497924805, "global_step": 20887, "epoch": 497} {"train_loss": -5.298376083374023, "global_step": 20888, "epoch": 497} {"train_loss": -5.342905521392822, "global_step": 20889, "epoch": 497} {"train_loss": -5.359981536865234, "global_step": 20890, "epoch": 497} {"train_loss": -5.170456886291504, "global_step": 20891, "epoch": 497} {"train_loss": -5.341679096221924, "global_step": 20892, "epoch": 497} {"train_loss": -5.411366939544678, "global_step": 20893, "epoch": 497} {"train_loss": -5.245578289031982, "global_step": 20894, "epoch": 497} {"train_loss": -5.338400840759277, "global_step": 20895, "epoch": 497} {"train_loss": -5.400114059448242, "global_step": 20896, "epoch": 497} {"train_loss": -5.283088684082031, "global_step": 20897, "epoch": 497} {"train_loss": -5.407617568969727, "global_step": 20898, "epoch": 497} {"train_loss": -5.301161289215088, "global_step": 20899, "epoch": 497} {"train_loss": -5.271578788757324, "global_step": 20900, "epoch": 497} {"train_loss": -5.283074378967285, "global_step": 20901, "epoch": 497} {"train_loss": -5.287689685821533, "global_step": 20902, "epoch": 497} {"train_loss": -5.136757850646973, "global_step": 20903, "epoch": 497} {"train_loss": -5.311078071594238, "global_step": 20904, "epoch": 497} {"train_loss": -5.166138648986816, "global_step": 20905, "epoch": 497} {"train_loss": -5.321972370147705, "global_step": 20906, "epoch": 497} {"train_loss": -5.211845397949219, "global_step": 20907, "epoch": 497} {"train_loss": -5.273311614990234, "global_step": 20908, "epoch": 497} {"train_loss": -5.260002136230469, "global_step": 20909, "epoch": 497} {"train_loss": -5.202117919921875, "global_step": 20910, "epoch": 497} {"train_loss": -5.246380805969238, "global_step": 20911, "epoch": 497} {"train_loss": -5.279177665710449, "global_step": 20912, "epoch": 497} {"train_loss": -5.156133651733398, "global_step": 20913, "epoch": 497} {"train_loss": -5.540251731872559, "global_step": 20914, "epoch": 497} {"train_loss": -5.3068844590868265, "global_step": 20915, "epoch": 497, "val_loss": 68851.453125} {"train_loss": -5.344112396240234, "global_step": 20916, "epoch": 498} {"train_loss": -5.3328962326049805, "global_step": 20917, "epoch": 498} {"train_loss": -5.2431960105896, "global_step": 20918, "epoch": 498} {"train_loss": -5.349169731140137, "global_step": 20919, "epoch": 498} {"train_loss": -5.333756446838379, "global_step": 20920, "epoch": 498} {"train_loss": -5.128728866577148, "global_step": 20921, "epoch": 498} {"train_loss": -5.353546142578125, "global_step": 20922, "epoch": 498} {"train_loss": -5.305819988250732, "global_step": 20923, "epoch": 498} {"train_loss": -5.444138526916504, "global_step": 20924, "epoch": 498} {"train_loss": -5.4188313484191895, "global_step": 20925, "epoch": 498} {"train_loss": -5.363656997680664, "global_step": 20926, "epoch": 498} {"train_loss": -5.237167835235596, "global_step": 20927, "epoch": 498} {"train_loss": -5.391785621643066, "global_step": 20928, "epoch": 498} {"train_loss": -5.265669345855713, "global_step": 20929, "epoch": 498} {"train_loss": -5.255101203918457, "global_step": 20930, "epoch": 498} {"train_loss": -5.3122076988220215, "global_step": 20931, "epoch": 498} {"train_loss": -5.412779808044434, "global_step": 20932, "epoch": 498} {"train_loss": -5.353043556213379, "global_step": 20933, "epoch": 498} {"train_loss": -5.341763496398926, "global_step": 20934, "epoch": 498} {"train_loss": -5.305117607116699, "global_step": 20935, "epoch": 498} {"train_loss": -5.340133190155029, "global_step": 20936, "epoch": 498} {"train_loss": -5.345422744750977, "global_step": 20937, "epoch": 498} {"train_loss": -5.280711650848389, "global_step": 20938, "epoch": 498} {"train_loss": -5.241847038269043, "global_step": 20939, "epoch": 498} {"train_loss": -5.336170196533203, "global_step": 20940, "epoch": 498} {"train_loss": -5.318408489227295, "global_step": 20941, "epoch": 498} {"train_loss": -5.254275798797607, "global_step": 20942, "epoch": 498} {"train_loss": -5.267086029052734, "global_step": 20943, "epoch": 498} {"train_loss": -5.329668998718262, "global_step": 20944, "epoch": 498} {"train_loss": -5.371554374694824, "global_step": 20945, "epoch": 498} {"train_loss": -5.272411346435547, "global_step": 20946, "epoch": 498} {"train_loss": -5.196285247802734, "global_step": 20947, "epoch": 498} {"train_loss": -5.468055725097656, "global_step": 20948, "epoch": 498} {"train_loss": -5.290188312530518, "global_step": 20949, "epoch": 498} {"train_loss": -5.40015172958374, "global_step": 20950, "epoch": 498} {"train_loss": -5.4293928146362305, "global_step": 20951, "epoch": 498} {"train_loss": -5.367888450622559, "global_step": 20952, "epoch": 498} {"train_loss": -5.380396842956543, "global_step": 20953, "epoch": 498} {"train_loss": -5.432918548583984, "global_step": 20954, "epoch": 498} {"train_loss": -5.323826313018799, "global_step": 20955, "epoch": 498} {"train_loss": -5.331484317779541, "global_step": 20956, "epoch": 498} {"train_loss": -5.3281539508274625, "global_step": 20957, "epoch": 498, "val_loss": 68761.0390625} {"train_loss": -5.375892639160156, "global_step": 20958, "epoch": 499} {"train_loss": -5.195538520812988, "global_step": 20959, "epoch": 499} {"train_loss": -5.424736976623535, "global_step": 20960, "epoch": 499} {"train_loss": -5.375319480895996, "global_step": 20961, "epoch": 499} {"train_loss": -5.382833480834961, "global_step": 20962, "epoch": 499} {"train_loss": -5.2585954666137695, "global_step": 20963, "epoch": 499} {"train_loss": -5.328474044799805, "global_step": 20964, "epoch": 499} {"train_loss": -5.26407527923584, "global_step": 20965, "epoch": 499} {"train_loss": -5.364927291870117, "global_step": 20966, "epoch": 499} {"train_loss": -5.309861183166504, "global_step": 20967, "epoch": 499} {"train_loss": -5.3404951095581055, "global_step": 20968, "epoch": 499} {"train_loss": -5.358582019805908, "global_step": 20969, "epoch": 499} {"train_loss": -5.184842109680176, "global_step": 20970, "epoch": 499} {"train_loss": -5.314905166625977, "global_step": 20971, "epoch": 499} {"train_loss": -5.370033264160156, "global_step": 20972, "epoch": 499} {"train_loss": -5.205944538116455, "global_step": 20973, "epoch": 499} {"train_loss": -5.450080871582031, "global_step": 20974, "epoch": 499} {"train_loss": -5.385913848876953, "global_step": 20975, "epoch": 499} {"train_loss": -5.379739761352539, "global_step": 20976, "epoch": 499} {"train_loss": -5.30064582824707, "global_step": 20977, "epoch": 499} {"train_loss": -5.338778972625732, "global_step": 20978, "epoch": 499} {"train_loss": -5.354218006134033, "global_step": 20979, "epoch": 499} {"train_loss": -5.3504638671875, "global_step": 20980, "epoch": 499} {"train_loss": -5.374727249145508, "global_step": 20981, "epoch": 499} {"train_loss": -5.384139537811279, "global_step": 20982, "epoch": 499} {"train_loss": -5.27468204498291, "global_step": 20983, "epoch": 499} {"train_loss": -5.309518814086914, "global_step": 20984, "epoch": 499} {"train_loss": -5.423386573791504, "global_step": 20985, "epoch": 499} {"train_loss": -5.108345031738281, "global_step": 20986, "epoch": 499} {"train_loss": -5.210686206817627, "global_step": 20987, "epoch": 499} {"train_loss": -5.330966472625732, "global_step": 20988, "epoch": 499} {"train_loss": -5.237865447998047, "global_step": 20989, "epoch": 499} {"train_loss": -5.263219833374023, "global_step": 20990, "epoch": 499} {"train_loss": -5.375665664672852, "global_step": 20991, "epoch": 499} {"train_loss": -5.165097236633301, "global_step": 20992, "epoch": 499} {"train_loss": -5.340074062347412, "global_step": 20993, "epoch": 499} {"train_loss": -5.252036094665527, "global_step": 20994, "epoch": 499} {"train_loss": -5.283268928527832, "global_step": 20995, "epoch": 499} {"train_loss": -5.317912578582764, "global_step": 20996, "epoch": 499} {"train_loss": -5.315197944641113, "global_step": 20997, "epoch": 499} {"train_loss": -5.371350288391113, "global_step": 20998, "epoch": 499} {"train_loss": -5.3211159365517755, "global_step": 20999, "epoch": 499, "val_loss": 68739.2734375} {"train_loss": -5.386363983154297, "global_step": 21000, "epoch": 500} {"train_loss": -5.42634391784668, "global_step": 21001, "epoch": 500} {"train_loss": -5.293128490447998, "global_step": 21002, "epoch": 500} {"train_loss": -5.4231977462768555, "global_step": 21003, "epoch": 500} {"train_loss": -5.240020751953125, "global_step": 21004, "epoch": 500} {"train_loss": -5.322718620300293, "global_step": 21005, "epoch": 500} {"train_loss": -5.299776077270508, "global_step": 21006, "epoch": 500} {"train_loss": -5.247299671173096, "global_step": 21007, "epoch": 500} {"train_loss": -5.398536682128906, "global_step": 21008, "epoch": 500} {"train_loss": -5.207180023193359, "global_step": 21009, "epoch": 500} {"train_loss": -5.284280776977539, "global_step": 21010, "epoch": 500} {"train_loss": -5.287049293518066, "global_step": 21011, "epoch": 500} {"train_loss": -5.270147323608398, "global_step": 21012, "epoch": 500} {"train_loss": -5.365775108337402, "global_step": 21013, "epoch": 500} {"train_loss": -5.227892875671387, "global_step": 21014, "epoch": 500} {"train_loss": -5.239194869995117, "global_step": 21015, "epoch": 500} {"train_loss": -5.416747093200684, "global_step": 21016, "epoch": 500} {"train_loss": -5.287731170654297, "global_step": 21017, "epoch": 500} {"train_loss": -5.221171855926514, "global_step": 21018, "epoch": 500} {"train_loss": -5.287170886993408, "global_step": 21019, "epoch": 500} {"train_loss": -5.435478687286377, "global_step": 21020, "epoch": 500} {"train_loss": -5.317208290100098, "global_step": 21021, "epoch": 500} {"train_loss": -5.162950038909912, "global_step": 21022, "epoch": 500} {"train_loss": -5.142093181610107, "global_step": 21023, "epoch": 500} {"train_loss": -5.404730319976807, "global_step": 21024, "epoch": 500} {"train_loss": -5.25184440612793, "global_step": 21025, "epoch": 500} {"train_loss": -5.315178394317627, "global_step": 21026, "epoch": 500} {"train_loss": -5.174273490905762, "global_step": 21027, "epoch": 500} {"train_loss": -5.210137367248535, "global_step": 21028, "epoch": 500} {"train_loss": -5.246962547302246, "global_step": 21029, "epoch": 500} {"train_loss": -5.37308406829834, "global_step": 21030, "epoch": 500} {"train_loss": -5.288609504699707, "global_step": 21031, "epoch": 500} {"train_loss": -5.351260185241699, "global_step": 21032, "epoch": 500} {"train_loss": -5.187919616699219, "global_step": 21033, "epoch": 500} {"train_loss": -5.202966690063477, "global_step": 21034, "epoch": 500} {"train_loss": -5.2750678062438965, "global_step": 21035, "epoch": 500} {"train_loss": -5.196597576141357, "global_step": 21036, "epoch": 500} {"train_loss": -5.392367362976074, "global_step": 21037, "epoch": 500} {"train_loss": -5.279712677001953, "global_step": 21038, "epoch": 500} {"train_loss": -5.221770763397217, "global_step": 21039, "epoch": 500} {"train_loss": -5.327759742736816, "global_step": 21040, "epoch": 500} {"train_loss": -5.291297106515794, "global_step": 21041, "epoch": 500, "train/sim_max_reward_0": 0.42226851324608616, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.5736890806706957, "train/sim_max_reward_3": 0.07786114174171596, "train/sim_max_reward_4": 0.3710688780273267, "train/sim_max_reward_5": 0.5143543199888964, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.014021135271422376, "test/sim_max_reward_4400002": 0.2525913515733921, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.18823253344110857, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.022287212294118928, "test/sim_max_reward_4400007": 0.016760239484898333, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.6239977739937842, "test/sim_max_reward_4400010": 0.29219979513598776, "test/sim_max_reward_4400011": 0.2019034643458615, "test/sim_max_reward_4400012": 0.18188928415016836, "test/sim_max_reward_4400013": 0.20348552801103884, "test/sim_max_reward_4400014": 0.021647645016917436, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1955007116704784, "test/sim_max_reward_4400018": 0.2518949202866243, "test/sim_max_reward_4400019": 0.15522551318473501, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.37648216467235074, "test/sim_max_reward_4400025": 0.18010507811943077, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.048705503536953694, "test/sim_max_reward_4400028": 0.0, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.4472437246614272, "test/sim_max_reward_4400031": 1.2890978942579066e-05, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.13661774955554132, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.4497715261040434, "test/sim_max_reward_4400036": 0.38252715549548066, "test/sim_max_reward_4400037": 0.37943900431392025, "test/sim_max_reward_4400038": 0.4569656989252477, "test/sim_max_reward_4400039": 0.5011761064616976, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.36822367223450886, "test/sim_max_reward_4400042": 0.00630645754821735, "test/sim_max_reward_4400043": 0.04619435957923847, "test/sim_max_reward_4400044": 0.009138066117264846, "test/sim_max_reward_4400045": 3.5657110293289836e-05, "test/sim_max_reward_4400046": 0.17162612814912934, "test/sim_max_reward_4400047": 0.10294098563048172, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.3266529024827533, "test/mean_score": 0.15035609855493676, "val_loss": 68589.9453125} {"train_loss": -5.255785942077637, "global_step": 21042, "epoch": 501} {"train_loss": -5.318325519561768, "global_step": 21043, "epoch": 501} {"train_loss": -5.2111663818359375, "global_step": 21044, "epoch": 501} {"train_loss": -5.277858257293701, "global_step": 21045, "epoch": 501} {"train_loss": -5.3855390548706055, "global_step": 21046, "epoch": 501} {"train_loss": -5.3830461502075195, "global_step": 21047, "epoch": 501} {"train_loss": -5.227751731872559, "global_step": 21048, "epoch": 501} {"train_loss": -5.307589054107666, "global_step": 21049, "epoch": 501} {"train_loss": -5.31519889831543, "global_step": 21050, "epoch": 501} {"train_loss": -5.382938861846924, "global_step": 21051, "epoch": 501} {"train_loss": -5.182375431060791, "global_step": 21052, "epoch": 501} {"train_loss": -5.375369071960449, "global_step": 21053, "epoch": 501} {"train_loss": -5.31455659866333, "global_step": 21054, "epoch": 501} {"train_loss": -5.337748050689697, "global_step": 21055, "epoch": 501} {"train_loss": -5.314672470092773, "global_step": 21056, "epoch": 501} {"train_loss": -5.371508598327637, "global_step": 21057, "epoch": 501} {"train_loss": -5.328068733215332, "global_step": 21058, "epoch": 501} {"train_loss": -5.262781143188477, "global_step": 21059, "epoch": 501} {"train_loss": -5.261341094970703, "global_step": 21060, "epoch": 501} {"train_loss": -5.418503761291504, "global_step": 21061, "epoch": 501} {"train_loss": -5.472877502441406, "global_step": 21062, "epoch": 501} {"train_loss": -5.397092819213867, "global_step": 21063, "epoch": 501} {"train_loss": -5.405496597290039, "global_step": 21064, "epoch": 501} {"train_loss": -5.278871536254883, "global_step": 21065, "epoch": 501} {"train_loss": -5.416074275970459, "global_step": 21066, "epoch": 501} {"train_loss": -5.194828987121582, "global_step": 21067, "epoch": 501} {"train_loss": -5.309854507446289, "global_step": 21068, "epoch": 501} {"train_loss": -5.406190395355225, "global_step": 21069, "epoch": 501} {"train_loss": -5.422627925872803, "global_step": 21070, "epoch": 501} {"train_loss": -5.326016426086426, "global_step": 21071, "epoch": 501} {"train_loss": -5.348404884338379, "global_step": 21072, "epoch": 501} {"train_loss": -5.455604553222656, "global_step": 21073, "epoch": 501} {"train_loss": -5.2484588623046875, "global_step": 21074, "epoch": 501} {"train_loss": -5.241333961486816, "global_step": 21075, "epoch": 501} {"train_loss": -5.380824565887451, "global_step": 21076, "epoch": 501} {"train_loss": -5.337460517883301, "global_step": 21077, "epoch": 501} {"train_loss": -5.404633045196533, "global_step": 21078, "epoch": 501} {"train_loss": -5.429045677185059, "global_step": 21079, "epoch": 501} {"train_loss": -5.394174575805664, "global_step": 21080, "epoch": 501} {"train_loss": -5.340201377868652, "global_step": 21081, "epoch": 501} {"train_loss": -5.253891468048096, "global_step": 21082, "epoch": 501} {"train_loss": -5.332773344857352, "global_step": 21083, "epoch": 501, "val_loss": 68805.578125} {"train_loss": -5.186358451843262, "global_step": 21084, "epoch": 502} {"train_loss": -5.39381217956543, "global_step": 21085, "epoch": 502} {"train_loss": -5.4748969078063965, "global_step": 21086, "epoch": 502} {"train_loss": -5.361640930175781, "global_step": 21087, "epoch": 502} {"train_loss": -5.379663944244385, "global_step": 21088, "epoch": 502} {"train_loss": -5.355566024780273, "global_step": 21089, "epoch": 502} {"train_loss": -5.278011322021484, "global_step": 21090, "epoch": 502} {"train_loss": -5.420989513397217, "global_step": 21091, "epoch": 502} {"train_loss": -5.317574501037598, "global_step": 21092, "epoch": 502} {"train_loss": -5.323947429656982, "global_step": 21093, "epoch": 502} {"train_loss": -5.424670219421387, "global_step": 21094, "epoch": 502} {"train_loss": -5.330990791320801, "global_step": 21095, "epoch": 502} {"train_loss": -5.539517402648926, "global_step": 21096, "epoch": 502} {"train_loss": -5.301967144012451, "global_step": 21097, "epoch": 502} {"train_loss": -5.39526891708374, "global_step": 21098, "epoch": 502} {"train_loss": -5.294508457183838, "global_step": 21099, "epoch": 502} {"train_loss": -5.406904697418213, "global_step": 21100, "epoch": 502} {"train_loss": -5.326784133911133, "global_step": 21101, "epoch": 502} {"train_loss": -5.308767795562744, "global_step": 21102, "epoch": 502} {"train_loss": -5.270669937133789, "global_step": 21103, "epoch": 502} {"train_loss": -5.430380344390869, "global_step": 21104, "epoch": 502} {"train_loss": -5.2824296951293945, "global_step": 21105, "epoch": 502} {"train_loss": -5.107069969177246, "global_step": 21106, "epoch": 502} {"train_loss": -5.349051475524902, "global_step": 21107, "epoch": 502} {"train_loss": -5.121143341064453, "global_step": 21108, "epoch": 502} {"train_loss": -5.069595813751221, "global_step": 21109, "epoch": 502} {"train_loss": -5.45351505279541, "global_step": 21110, "epoch": 502} {"train_loss": -5.224379539489746, "global_step": 21111, "epoch": 502} {"train_loss": -5.252431869506836, "global_step": 21112, "epoch": 502} {"train_loss": -5.3070759773254395, "global_step": 21113, "epoch": 502} {"train_loss": -5.3315324783325195, "global_step": 21114, "epoch": 502} {"train_loss": -5.33207893371582, "global_step": 21115, "epoch": 502} {"train_loss": -5.369844436645508, "global_step": 21116, "epoch": 502} {"train_loss": -5.4582839012146, "global_step": 21117, "epoch": 502} {"train_loss": -5.317375183105469, "global_step": 21118, "epoch": 502} {"train_loss": -5.419068813323975, "global_step": 21119, "epoch": 502} {"train_loss": -5.228798866271973, "global_step": 21120, "epoch": 502} {"train_loss": -5.241620063781738, "global_step": 21121, "epoch": 502} {"train_loss": -5.250865459442139, "global_step": 21122, "epoch": 502} {"train_loss": -5.396208763122559, "global_step": 21123, "epoch": 502} {"train_loss": -5.391805648803711, "global_step": 21124, "epoch": 502} {"train_loss": -5.330260980696905, "global_step": 21125, "epoch": 502, "val_loss": 68556.3359375} {"train_loss": -5.313080787658691, "global_step": 21126, "epoch": 503} {"train_loss": -5.431061744689941, "global_step": 21127, "epoch": 503} {"train_loss": -5.425999641418457, "global_step": 21128, "epoch": 503} {"train_loss": -5.376870155334473, "global_step": 21129, "epoch": 503} {"train_loss": -5.337055683135986, "global_step": 21130, "epoch": 503} {"train_loss": -5.447643280029297, "global_step": 21131, "epoch": 503} {"train_loss": -5.379086494445801, "global_step": 21132, "epoch": 503} {"train_loss": -5.333095073699951, "global_step": 21133, "epoch": 503} {"train_loss": -5.431948184967041, "global_step": 21134, "epoch": 503} {"train_loss": -5.342368125915527, "global_step": 21135, "epoch": 503} {"train_loss": -5.3319854736328125, "global_step": 21136, "epoch": 503} {"train_loss": -5.294681549072266, "global_step": 21137, "epoch": 503} {"train_loss": -5.387697696685791, "global_step": 21138, "epoch": 503} {"train_loss": -5.368238925933838, "global_step": 21139, "epoch": 503} {"train_loss": -5.342665672302246, "global_step": 21140, "epoch": 503} {"train_loss": -5.276538372039795, "global_step": 21141, "epoch": 503} {"train_loss": -5.3788909912109375, "global_step": 21142, "epoch": 503} {"train_loss": -5.256705284118652, "global_step": 21143, "epoch": 503} {"train_loss": -5.184459209442139, "global_step": 21144, "epoch": 503} {"train_loss": -5.329667091369629, "global_step": 21145, "epoch": 503} {"train_loss": -5.205388069152832, "global_step": 21146, "epoch": 503} {"train_loss": -5.448607444763184, "global_step": 21147, "epoch": 503} {"train_loss": -5.2998151779174805, "global_step": 21148, "epoch": 503} {"train_loss": -5.207089424133301, "global_step": 21149, "epoch": 503} {"train_loss": -5.3348493576049805, "global_step": 21150, "epoch": 503} {"train_loss": -5.18783712387085, "global_step": 21151, "epoch": 503} {"train_loss": -5.273836135864258, "global_step": 21152, "epoch": 503} {"train_loss": -5.322908401489258, "global_step": 21153, "epoch": 503} {"train_loss": -5.284817695617676, "global_step": 21154, "epoch": 503} {"train_loss": -5.379772186279297, "global_step": 21155, "epoch": 503} {"train_loss": -5.2558794021606445, "global_step": 21156, "epoch": 503} {"train_loss": -5.351224899291992, "global_step": 21157, "epoch": 503} {"train_loss": -5.281904220581055, "global_step": 21158, "epoch": 503} {"train_loss": -5.280157566070557, "global_step": 21159, "epoch": 503} {"train_loss": -5.319449424743652, "global_step": 21160, "epoch": 503} {"train_loss": -5.382011413574219, "global_step": 21161, "epoch": 503} {"train_loss": -5.410260200500488, "global_step": 21162, "epoch": 503} {"train_loss": -5.328195571899414, "global_step": 21163, "epoch": 503} {"train_loss": -5.363914966583252, "global_step": 21164, "epoch": 503} {"train_loss": -5.376842021942139, "global_step": 21165, "epoch": 503} {"train_loss": -5.33680534362793, "global_step": 21166, "epoch": 503} {"train_loss": -5.330662068866548, "global_step": 21167, "epoch": 503, "val_loss": 68298.3671875} {"train_loss": -5.377554893493652, "global_step": 21168, "epoch": 504} {"train_loss": -5.300311088562012, "global_step": 21169, "epoch": 504} {"train_loss": -5.229820728302002, "global_step": 21170, "epoch": 504} {"train_loss": -5.438974380493164, "global_step": 21171, "epoch": 504} {"train_loss": -5.485466957092285, "global_step": 21172, "epoch": 504} {"train_loss": -5.154745578765869, "global_step": 21173, "epoch": 504} {"train_loss": -5.222519874572754, "global_step": 21174, "epoch": 504} {"train_loss": -5.306089401245117, "global_step": 21175, "epoch": 504} {"train_loss": -5.404914855957031, "global_step": 21176, "epoch": 504} {"train_loss": -5.079455375671387, "global_step": 21177, "epoch": 504} {"train_loss": -5.4276018142700195, "global_step": 21178, "epoch": 504} {"train_loss": -5.056922912597656, "global_step": 21179, "epoch": 504} {"train_loss": -5.264040946960449, "global_step": 21180, "epoch": 504} {"train_loss": -5.406017780303955, "global_step": 21181, "epoch": 504} {"train_loss": -5.281288146972656, "global_step": 21182, "epoch": 504} {"train_loss": -5.338658332824707, "global_step": 21183, "epoch": 504} {"train_loss": -5.265872001647949, "global_step": 21184, "epoch": 504} {"train_loss": -5.25927209854126, "global_step": 21185, "epoch": 504} {"train_loss": -5.407009601593018, "global_step": 21186, "epoch": 504} {"train_loss": -5.278515815734863, "global_step": 21187, "epoch": 504} {"train_loss": -5.3830718994140625, "global_step": 21188, "epoch": 504} {"train_loss": -5.474344253540039, "global_step": 21189, "epoch": 504} {"train_loss": -5.317485332489014, "global_step": 21190, "epoch": 504} {"train_loss": -5.360136032104492, "global_step": 21191, "epoch": 504} {"train_loss": -5.249748229980469, "global_step": 21192, "epoch": 504} {"train_loss": -5.30570650100708, "global_step": 21193, "epoch": 504} {"train_loss": -5.453173637390137, "global_step": 21194, "epoch": 504} {"train_loss": -5.309375286102295, "global_step": 21195, "epoch": 504} {"train_loss": -5.36375617980957, "global_step": 21196, "epoch": 504} {"train_loss": -5.353656768798828, "global_step": 21197, "epoch": 504} {"train_loss": -5.296543598175049, "global_step": 21198, "epoch": 504} {"train_loss": -5.367290496826172, "global_step": 21199, "epoch": 504} {"train_loss": -5.38063907623291, "global_step": 21200, "epoch": 504} {"train_loss": -5.141168594360352, "global_step": 21201, "epoch": 504} {"train_loss": -5.380090713500977, "global_step": 21202, "epoch": 504} {"train_loss": -5.309237003326416, "global_step": 21203, "epoch": 504} {"train_loss": -5.327095985412598, "global_step": 21204, "epoch": 504} {"train_loss": -5.360495090484619, "global_step": 21205, "epoch": 504} {"train_loss": -5.310702323913574, "global_step": 21206, "epoch": 504} {"train_loss": -5.2198805809021, "global_step": 21207, "epoch": 504} {"train_loss": -5.3037800788879395, "global_step": 21208, "epoch": 504} {"train_loss": -5.318720931098575, "global_step": 21209, "epoch": 504, "val_loss": 68570.171875} {"train_loss": -5.347541809082031, "global_step": 21210, "epoch": 505} {"train_loss": -5.346834182739258, "global_step": 21211, "epoch": 505} {"train_loss": -5.304315567016602, "global_step": 21212, "epoch": 505} {"train_loss": -5.375609397888184, "global_step": 21213, "epoch": 505} {"train_loss": -5.346493721008301, "global_step": 21214, "epoch": 505} {"train_loss": -5.45603084564209, "global_step": 21215, "epoch": 505} {"train_loss": -5.55610466003418, "global_step": 21216, "epoch": 505} {"train_loss": -5.264994144439697, "global_step": 21217, "epoch": 505} {"train_loss": -5.315488815307617, "global_step": 21218, "epoch": 505} {"train_loss": -5.223613739013672, "global_step": 21219, "epoch": 505} {"train_loss": -5.3561201095581055, "global_step": 21220, "epoch": 505} {"train_loss": -5.352911472320557, "global_step": 21221, "epoch": 505} {"train_loss": -5.256198883056641, "global_step": 21222, "epoch": 505} {"train_loss": -5.248492240905762, "global_step": 21223, "epoch": 505} {"train_loss": -5.330958366394043, "global_step": 21224, "epoch": 505} {"train_loss": -5.235177040100098, "global_step": 21225, "epoch": 505} {"train_loss": -5.202419757843018, "global_step": 21226, "epoch": 505} {"train_loss": -5.346749305725098, "global_step": 21227, "epoch": 505} {"train_loss": -5.31988000869751, "global_step": 21228, "epoch": 505} {"train_loss": -5.353231430053711, "global_step": 21229, "epoch": 505} {"train_loss": -5.175820350646973, "global_step": 21230, "epoch": 505} {"train_loss": -5.235766410827637, "global_step": 21231, "epoch": 505} {"train_loss": -5.2936811447143555, "global_step": 21232, "epoch": 505} {"train_loss": -5.358054161071777, "global_step": 21233, "epoch": 505} {"train_loss": -5.482538223266602, "global_step": 21234, "epoch": 505} {"train_loss": -5.42490816116333, "global_step": 21235, "epoch": 505} {"train_loss": -5.306055068969727, "global_step": 21236, "epoch": 505} {"train_loss": -5.352640151977539, "global_step": 21237, "epoch": 505} {"train_loss": -5.411375045776367, "global_step": 21238, "epoch": 505} {"train_loss": -5.2504682540893555, "global_step": 21239, "epoch": 505} {"train_loss": -5.350705623626709, "global_step": 21240, "epoch": 505} {"train_loss": -5.3036723136901855, "global_step": 21241, "epoch": 505} {"train_loss": -5.452323913574219, "global_step": 21242, "epoch": 505} {"train_loss": -5.428500175476074, "global_step": 21243, "epoch": 505} {"train_loss": -5.249007225036621, "global_step": 21244, "epoch": 505} {"train_loss": -5.325730800628662, "global_step": 21245, "epoch": 505} {"train_loss": -5.272928237915039, "global_step": 21246, "epoch": 505} {"train_loss": -5.314168930053711, "global_step": 21247, "epoch": 505} {"train_loss": -5.35642671585083, "global_step": 21248, "epoch": 505} {"train_loss": -5.314784049987793, "global_step": 21249, "epoch": 505} {"train_loss": -5.436424255371094, "global_step": 21250, "epoch": 505} {"train_loss": -5.333700702303932, "global_step": 21251, "epoch": 505, "val_loss": 68526.5625} {"train_loss": -5.334537982940674, "global_step": 21252, "epoch": 506} {"train_loss": -5.399989128112793, "global_step": 21253, "epoch": 506} {"train_loss": -5.478242874145508, "global_step": 21254, "epoch": 506} {"train_loss": -5.323941230773926, "global_step": 21255, "epoch": 506} {"train_loss": -5.405448913574219, "global_step": 21256, "epoch": 506} {"train_loss": -5.325194358825684, "global_step": 21257, "epoch": 506} {"train_loss": -5.460785388946533, "global_step": 21258, "epoch": 506} {"train_loss": -5.387913703918457, "global_step": 21259, "epoch": 506} {"train_loss": -5.364699363708496, "global_step": 21260, "epoch": 506} {"train_loss": -5.13676643371582, "global_step": 21261, "epoch": 506} {"train_loss": -5.414562702178955, "global_step": 21262, "epoch": 506} {"train_loss": -5.4948930740356445, "global_step": 21263, "epoch": 506} {"train_loss": -5.172009468078613, "global_step": 21264, "epoch": 506} {"train_loss": -5.233397006988525, "global_step": 21265, "epoch": 506} {"train_loss": -5.364662170410156, "global_step": 21266, "epoch": 506} {"train_loss": -5.3065185546875, "global_step": 21267, "epoch": 506} {"train_loss": -5.188556671142578, "global_step": 21268, "epoch": 506} {"train_loss": -5.4786834716796875, "global_step": 21269, "epoch": 506} {"train_loss": -5.372025489807129, "global_step": 21270, "epoch": 506} {"train_loss": -5.190990924835205, "global_step": 21271, "epoch": 506} {"train_loss": -5.32880973815918, "global_step": 21272, "epoch": 506} {"train_loss": -5.199553966522217, "global_step": 21273, "epoch": 506} {"train_loss": -5.177369594573975, "global_step": 21274, "epoch": 506} {"train_loss": -5.210753917694092, "global_step": 21275, "epoch": 506} {"train_loss": -5.395036697387695, "global_step": 21276, "epoch": 506} {"train_loss": -5.337013244628906, "global_step": 21277, "epoch": 506} {"train_loss": -5.305473804473877, "global_step": 21278, "epoch": 506} {"train_loss": -5.281678676605225, "global_step": 21279, "epoch": 506} {"train_loss": -5.279509544372559, "global_step": 21280, "epoch": 506} {"train_loss": -5.302865982055664, "global_step": 21281, "epoch": 506} {"train_loss": -5.324210166931152, "global_step": 21282, "epoch": 506} {"train_loss": -5.401400566101074, "global_step": 21283, "epoch": 506} {"train_loss": -5.2495551109313965, "global_step": 21284, "epoch": 506} {"train_loss": -5.2297844886779785, "global_step": 21285, "epoch": 506} {"train_loss": -5.316174507141113, "global_step": 21286, "epoch": 506} {"train_loss": -5.307035446166992, "global_step": 21287, "epoch": 506} {"train_loss": -5.309967994689941, "global_step": 21288, "epoch": 506} {"train_loss": -5.343050003051758, "global_step": 21289, "epoch": 506} {"train_loss": -5.365076541900635, "global_step": 21290, "epoch": 506} {"train_loss": -5.1488847732543945, "global_step": 21291, "epoch": 506} {"train_loss": -5.39981746673584, "global_step": 21292, "epoch": 506} {"train_loss": -5.321767625354585, "global_step": 21293, "epoch": 506, "val_loss": 69917.328125} {"train_loss": -5.224487781524658, "global_step": 21294, "epoch": 507} {"train_loss": -5.437635898590088, "global_step": 21295, "epoch": 507} {"train_loss": -5.362883567810059, "global_step": 21296, "epoch": 507} {"train_loss": -5.332492828369141, "global_step": 21297, "epoch": 507} {"train_loss": -5.347965240478516, "global_step": 21298, "epoch": 507} {"train_loss": -5.201507568359375, "global_step": 21299, "epoch": 507} {"train_loss": -5.330921173095703, "global_step": 21300, "epoch": 507} {"train_loss": -5.355996131896973, "global_step": 21301, "epoch": 507} {"train_loss": -5.398131370544434, "global_step": 21302, "epoch": 507} {"train_loss": -5.2719831466674805, "global_step": 21303, "epoch": 507} {"train_loss": -5.332886695861816, "global_step": 21304, "epoch": 507} {"train_loss": -5.27126407623291, "global_step": 21305, "epoch": 507} {"train_loss": -5.2541985511779785, "global_step": 21306, "epoch": 507} {"train_loss": -5.2382612228393555, "global_step": 21307, "epoch": 507} {"train_loss": -5.362864971160889, "global_step": 21308, "epoch": 507} {"train_loss": -5.374693870544434, "global_step": 21309, "epoch": 507} {"train_loss": -5.1894612312316895, "global_step": 21310, "epoch": 507} {"train_loss": -5.316117286682129, "global_step": 21311, "epoch": 507} {"train_loss": -5.372745513916016, "global_step": 21312, "epoch": 507} {"train_loss": -5.4053449630737305, "global_step": 21313, "epoch": 507} {"train_loss": -5.264559745788574, "global_step": 21314, "epoch": 507} {"train_loss": -5.263946533203125, "global_step": 21315, "epoch": 507} {"train_loss": -5.404511451721191, "global_step": 21316, "epoch": 507} {"train_loss": -5.360788822174072, "global_step": 21317, "epoch": 507} {"train_loss": -5.348182678222656, "global_step": 21318, "epoch": 507} {"train_loss": -5.361544132232666, "global_step": 21319, "epoch": 507} {"train_loss": -5.161124229431152, "global_step": 21320, "epoch": 507} {"train_loss": -5.389391899108887, "global_step": 21321, "epoch": 507} {"train_loss": -5.3269195556640625, "global_step": 21322, "epoch": 507} {"train_loss": -5.374936580657959, "global_step": 21323, "epoch": 507} {"train_loss": -5.44235897064209, "global_step": 21324, "epoch": 507} {"train_loss": -5.400177001953125, "global_step": 21325, "epoch": 507} {"train_loss": -5.282139301300049, "global_step": 21326, "epoch": 507} {"train_loss": -5.38311767578125, "global_step": 21327, "epoch": 507} {"train_loss": -5.240880012512207, "global_step": 21328, "epoch": 507} {"train_loss": -5.24658203125, "global_step": 21329, "epoch": 507} {"train_loss": -5.436946868896484, "global_step": 21330, "epoch": 507} {"train_loss": -5.236222743988037, "global_step": 21331, "epoch": 507} {"train_loss": -5.2013630867004395, "global_step": 21332, "epoch": 507} {"train_loss": -5.384097099304199, "global_step": 21333, "epoch": 507} {"train_loss": -5.349936485290527, "global_step": 21334, "epoch": 507} {"train_loss": -5.324240525563558, "global_step": 21335, "epoch": 507, "val_loss": 68584.765625} {"train_loss": -5.285472393035889, "global_step": 21336, "epoch": 508} {"train_loss": -5.457324028015137, "global_step": 21337, "epoch": 508} {"train_loss": -5.26729154586792, "global_step": 21338, "epoch": 508} {"train_loss": -5.271855354309082, "global_step": 21339, "epoch": 508} {"train_loss": -5.35371208190918, "global_step": 21340, "epoch": 508} {"train_loss": -5.342618942260742, "global_step": 21341, "epoch": 508} {"train_loss": -5.318641662597656, "global_step": 21342, "epoch": 508} {"train_loss": -5.291630744934082, "global_step": 21343, "epoch": 508} {"train_loss": -5.314849853515625, "global_step": 21344, "epoch": 508} {"train_loss": -5.240234375, "global_step": 21345, "epoch": 508} {"train_loss": -5.157778263092041, "global_step": 21346, "epoch": 508} {"train_loss": -5.348312854766846, "global_step": 21347, "epoch": 508} {"train_loss": -5.177922248840332, "global_step": 21348, "epoch": 508} {"train_loss": -5.3470611572265625, "global_step": 21349, "epoch": 508} {"train_loss": -5.249024391174316, "global_step": 21350, "epoch": 508} {"train_loss": -5.434943199157715, "global_step": 21351, "epoch": 508} {"train_loss": -5.284675598144531, "global_step": 21352, "epoch": 508} {"train_loss": -5.28794002532959, "global_step": 21353, "epoch": 508} {"train_loss": -5.387194633483887, "global_step": 21354, "epoch": 508} {"train_loss": -5.343728542327881, "global_step": 21355, "epoch": 508} {"train_loss": -5.278644561767578, "global_step": 21356, "epoch": 508} {"train_loss": -5.309021949768066, "global_step": 21357, "epoch": 508} {"train_loss": -5.284646034240723, "global_step": 21358, "epoch": 508} {"train_loss": -5.28037166595459, "global_step": 21359, "epoch": 508} {"train_loss": -5.315116882324219, "global_step": 21360, "epoch": 508} {"train_loss": -5.333934783935547, "global_step": 21361, "epoch": 508} {"train_loss": -5.316995143890381, "global_step": 21362, "epoch": 508} {"train_loss": -5.376270294189453, "global_step": 21363, "epoch": 508} {"train_loss": -5.361867904663086, "global_step": 21364, "epoch": 508} {"train_loss": -5.4361443519592285, "global_step": 21365, "epoch": 508} {"train_loss": -5.41002082824707, "global_step": 21366, "epoch": 508} {"train_loss": -5.309361457824707, "global_step": 21367, "epoch": 508} {"train_loss": -5.3307271003723145, "global_step": 21368, "epoch": 508} {"train_loss": -5.3585405349731445, "global_step": 21369, "epoch": 508} {"train_loss": -5.320735931396484, "global_step": 21370, "epoch": 508} {"train_loss": -5.418918132781982, "global_step": 21371, "epoch": 508} {"train_loss": -5.3270769119262695, "global_step": 21372, "epoch": 508} {"train_loss": -5.313176155090332, "global_step": 21373, "epoch": 508} {"train_loss": -5.444583415985107, "global_step": 21374, "epoch": 508} {"train_loss": -5.262051105499268, "global_step": 21375, "epoch": 508} {"train_loss": -5.25671911239624, "global_step": 21376, "epoch": 508} {"train_loss": -5.325182415190197, "global_step": 21377, "epoch": 508, "val_loss": 68575.6953125} {"train_loss": -5.348867416381836, "global_step": 21378, "epoch": 509} {"train_loss": -5.225793838500977, "global_step": 21379, "epoch": 509} {"train_loss": -5.267454147338867, "global_step": 21380, "epoch": 509} {"train_loss": -5.402653217315674, "global_step": 21381, "epoch": 509} {"train_loss": -5.360250473022461, "global_step": 21382, "epoch": 509} {"train_loss": -5.397257328033447, "global_step": 21383, "epoch": 509} {"train_loss": -5.465013027191162, "global_step": 21384, "epoch": 509} {"train_loss": -5.415280818939209, "global_step": 21385, "epoch": 509} {"train_loss": -5.288333892822266, "global_step": 21386, "epoch": 509} {"train_loss": -5.467272758483887, "global_step": 21387, "epoch": 509} {"train_loss": -5.342400550842285, "global_step": 21388, "epoch": 509} {"train_loss": -5.328200340270996, "global_step": 21389, "epoch": 509} {"train_loss": -5.272660255432129, "global_step": 21390, "epoch": 509} {"train_loss": -5.313270568847656, "global_step": 21391, "epoch": 509} {"train_loss": -5.284963607788086, "global_step": 21392, "epoch": 509} {"train_loss": -5.36189603805542, "global_step": 21393, "epoch": 509} {"train_loss": -5.3626179695129395, "global_step": 21394, "epoch": 509} {"train_loss": -5.2774248123168945, "global_step": 21395, "epoch": 509} {"train_loss": -5.342347145080566, "global_step": 21396, "epoch": 509} {"train_loss": -5.412320137023926, "global_step": 21397, "epoch": 509} {"train_loss": -5.388723373413086, "global_step": 21398, "epoch": 509} {"train_loss": -5.365933418273926, "global_step": 21399, "epoch": 509} {"train_loss": -5.316266059875488, "global_step": 21400, "epoch": 509} {"train_loss": -5.353899955749512, "global_step": 21401, "epoch": 509} {"train_loss": -5.441512584686279, "global_step": 21402, "epoch": 509} {"train_loss": -5.29018497467041, "global_step": 21403, "epoch": 509} {"train_loss": -5.191191673278809, "global_step": 21404, "epoch": 509} {"train_loss": -5.339892387390137, "global_step": 21405, "epoch": 509} {"train_loss": -5.474058151245117, "global_step": 21406, "epoch": 509} {"train_loss": -5.363199234008789, "global_step": 21407, "epoch": 509} {"train_loss": -5.44473934173584, "global_step": 21408, "epoch": 509} {"train_loss": -5.423916816711426, "global_step": 21409, "epoch": 509} {"train_loss": -5.247140884399414, "global_step": 21410, "epoch": 509} {"train_loss": -5.394296169281006, "global_step": 21411, "epoch": 509} {"train_loss": -5.416752338409424, "global_step": 21412, "epoch": 509} {"train_loss": -5.141017913818359, "global_step": 21413, "epoch": 509} {"train_loss": -5.419683456420898, "global_step": 21414, "epoch": 509} {"train_loss": -5.434999942779541, "global_step": 21415, "epoch": 509} {"train_loss": -5.302171230316162, "global_step": 21416, "epoch": 509} {"train_loss": -5.406656742095947, "global_step": 21417, "epoch": 509} {"train_loss": -5.326786041259766, "global_step": 21418, "epoch": 509} {"train_loss": -5.350538900920323, "global_step": 21419, "epoch": 509, "val_loss": 68345.828125} {"train_loss": -5.464982986450195, "global_step": 21420, "epoch": 510} {"train_loss": -5.288870811462402, "global_step": 21421, "epoch": 510} {"train_loss": -5.36453104019165, "global_step": 21422, "epoch": 510} {"train_loss": -5.365921497344971, "global_step": 21423, "epoch": 510} {"train_loss": -5.426360130310059, "global_step": 21424, "epoch": 510} {"train_loss": -5.431809425354004, "global_step": 21425, "epoch": 510} {"train_loss": -5.2884016036987305, "global_step": 21426, "epoch": 510} {"train_loss": -5.352832794189453, "global_step": 21427, "epoch": 510} {"train_loss": -5.236670970916748, "global_step": 21428, "epoch": 510} {"train_loss": -5.418852806091309, "global_step": 21429, "epoch": 510} {"train_loss": -5.316313743591309, "global_step": 21430, "epoch": 510} {"train_loss": -5.37723970413208, "global_step": 21431, "epoch": 510} {"train_loss": -5.275002956390381, "global_step": 21432, "epoch": 510} {"train_loss": -5.293741226196289, "global_step": 21433, "epoch": 510} {"train_loss": -5.290164947509766, "global_step": 21434, "epoch": 510} {"train_loss": -5.420098781585693, "global_step": 21435, "epoch": 510} {"train_loss": -5.347261428833008, "global_step": 21436, "epoch": 510} {"train_loss": -5.53424072265625, "global_step": 21437, "epoch": 510} {"train_loss": -5.157676696777344, "global_step": 21438, "epoch": 510} {"train_loss": -5.261431694030762, "global_step": 21439, "epoch": 510} {"train_loss": -5.402032852172852, "global_step": 21440, "epoch": 510} {"train_loss": -5.279013633728027, "global_step": 21441, "epoch": 510} {"train_loss": -5.242393493652344, "global_step": 21442, "epoch": 510} {"train_loss": -5.285512924194336, "global_step": 21443, "epoch": 510} {"train_loss": -5.352021217346191, "global_step": 21444, "epoch": 510} {"train_loss": -5.320298194885254, "global_step": 21445, "epoch": 510} {"train_loss": -5.231035232543945, "global_step": 21446, "epoch": 510} {"train_loss": -5.342562198638916, "global_step": 21447, "epoch": 510} {"train_loss": -5.310503959655762, "global_step": 21448, "epoch": 510} {"train_loss": -5.307658672332764, "global_step": 21449, "epoch": 510} {"train_loss": -5.210108280181885, "global_step": 21450, "epoch": 510} {"train_loss": -5.442934036254883, "global_step": 21451, "epoch": 510} {"train_loss": -5.322681903839111, "global_step": 21452, "epoch": 510} {"train_loss": -5.205166816711426, "global_step": 21453, "epoch": 510} {"train_loss": -5.352574348449707, "global_step": 21454, "epoch": 510} {"train_loss": -5.464023590087891, "global_step": 21455, "epoch": 510} {"train_loss": -5.402912139892578, "global_step": 21456, "epoch": 510} {"train_loss": -5.140089988708496, "global_step": 21457, "epoch": 510} {"train_loss": -5.25916862487793, "global_step": 21458, "epoch": 510} {"train_loss": -5.2635817527771, "global_step": 21459, "epoch": 510} {"train_loss": -5.356681823730469, "global_step": 21460, "epoch": 510} {"train_loss": -5.325611545926049, "global_step": 21461, "epoch": 510, "val_loss": 68814.4375} {"train_loss": -5.252394676208496, "global_step": 21462, "epoch": 511} {"train_loss": -5.389797210693359, "global_step": 21463, "epoch": 511} {"train_loss": -5.242414951324463, "global_step": 21464, "epoch": 511} {"train_loss": -5.402526378631592, "global_step": 21465, "epoch": 511} {"train_loss": -5.360288143157959, "global_step": 21466, "epoch": 511} {"train_loss": -5.358133792877197, "global_step": 21467, "epoch": 511} {"train_loss": -5.364813327789307, "global_step": 21468, "epoch": 511} {"train_loss": -5.279782295227051, "global_step": 21469, "epoch": 511} {"train_loss": -5.475152492523193, "global_step": 21470, "epoch": 511} {"train_loss": -5.29945182800293, "global_step": 21471, "epoch": 511} {"train_loss": -5.306917190551758, "global_step": 21472, "epoch": 511} {"train_loss": -5.375490665435791, "global_step": 21473, "epoch": 511} {"train_loss": -5.360626697540283, "global_step": 21474, "epoch": 511} {"train_loss": -5.302858352661133, "global_step": 21475, "epoch": 511} {"train_loss": -5.358309745788574, "global_step": 21476, "epoch": 511} {"train_loss": -5.296122074127197, "global_step": 21477, "epoch": 511} {"train_loss": -5.370297431945801, "global_step": 21478, "epoch": 511} {"train_loss": -5.182043075561523, "global_step": 21479, "epoch": 511} {"train_loss": -5.343303680419922, "global_step": 21480, "epoch": 511} {"train_loss": -5.397941589355469, "global_step": 21481, "epoch": 511} {"train_loss": -5.480623245239258, "global_step": 21482, "epoch": 511} {"train_loss": -5.183574199676514, "global_step": 21483, "epoch": 511} {"train_loss": -5.4954118728637695, "global_step": 21484, "epoch": 511} {"train_loss": -5.277571678161621, "global_step": 21485, "epoch": 511} {"train_loss": -5.393289089202881, "global_step": 21486, "epoch": 511} {"train_loss": -5.415402412414551, "global_step": 21487, "epoch": 511} {"train_loss": -5.361655235290527, "global_step": 21488, "epoch": 511} {"train_loss": -5.380828857421875, "global_step": 21489, "epoch": 511} {"train_loss": -5.360805511474609, "global_step": 21490, "epoch": 511} {"train_loss": -5.384429454803467, "global_step": 21491, "epoch": 511} {"train_loss": -5.393990516662598, "global_step": 21492, "epoch": 511} {"train_loss": -5.250044822692871, "global_step": 21493, "epoch": 511} {"train_loss": -5.397819519042969, "global_step": 21494, "epoch": 511} {"train_loss": -5.320141792297363, "global_step": 21495, "epoch": 511} {"train_loss": -5.40395975112915, "global_step": 21496, "epoch": 511} {"train_loss": -5.297464370727539, "global_step": 21497, "epoch": 511} {"train_loss": -5.464851379394531, "global_step": 21498, "epoch": 511} {"train_loss": -5.469883918762207, "global_step": 21499, "epoch": 511} {"train_loss": -5.131877422332764, "global_step": 21500, "epoch": 511} {"train_loss": -5.3241472244262695, "global_step": 21501, "epoch": 511} {"train_loss": -5.338818550109863, "global_step": 21502, "epoch": 511} {"train_loss": -5.346229723521641, "global_step": 21503, "epoch": 511, "val_loss": 68782.2734375} {"train_loss": -5.389834403991699, "global_step": 21504, "epoch": 512} {"train_loss": -5.1807451248168945, "global_step": 21505, "epoch": 512} {"train_loss": -5.315731048583984, "global_step": 21506, "epoch": 512} {"train_loss": -5.378168106079102, "global_step": 21507, "epoch": 512} {"train_loss": -5.333353042602539, "global_step": 21508, "epoch": 512} {"train_loss": -5.404717445373535, "global_step": 21509, "epoch": 512} {"train_loss": -5.317323684692383, "global_step": 21510, "epoch": 512} {"train_loss": -5.340437889099121, "global_step": 21511, "epoch": 512} {"train_loss": -5.376047134399414, "global_step": 21512, "epoch": 512} {"train_loss": -5.351107597351074, "global_step": 21513, "epoch": 512} {"train_loss": -5.41623592376709, "global_step": 21514, "epoch": 512} {"train_loss": -5.4043803215026855, "global_step": 21515, "epoch": 512} {"train_loss": -5.1909894943237305, "global_step": 21516, "epoch": 512} {"train_loss": -5.268031120300293, "global_step": 21517, "epoch": 512} {"train_loss": -5.4247050285339355, "global_step": 21518, "epoch": 512} {"train_loss": -5.454812526702881, "global_step": 21519, "epoch": 512} {"train_loss": -5.320964813232422, "global_step": 21520, "epoch": 512} {"train_loss": -5.414563179016113, "global_step": 21521, "epoch": 512} {"train_loss": -5.472311973571777, "global_step": 21522, "epoch": 512} {"train_loss": -5.347901344299316, "global_step": 21523, "epoch": 512} {"train_loss": -5.172970771789551, "global_step": 21524, "epoch": 512} {"train_loss": -5.2904462814331055, "global_step": 21525, "epoch": 512} {"train_loss": -5.3777756690979, "global_step": 21526, "epoch": 512} {"train_loss": -5.457780361175537, "global_step": 21527, "epoch": 512} {"train_loss": -5.370469093322754, "global_step": 21528, "epoch": 512} {"train_loss": -5.416201591491699, "global_step": 21529, "epoch": 512} {"train_loss": -5.2372002601623535, "global_step": 21530, "epoch": 512} {"train_loss": -5.460432052612305, "global_step": 21531, "epoch": 512} {"train_loss": -5.157769680023193, "global_step": 21532, "epoch": 512} {"train_loss": -5.111362934112549, "global_step": 21533, "epoch": 512} {"train_loss": -5.296756744384766, "global_step": 21534, "epoch": 512} {"train_loss": -5.253435134887695, "global_step": 21535, "epoch": 512} {"train_loss": -5.315776824951172, "global_step": 21536, "epoch": 512} {"train_loss": -5.316604137420654, "global_step": 21537, "epoch": 512} {"train_loss": -5.334415435791016, "global_step": 21538, "epoch": 512} {"train_loss": -5.363306045532227, "global_step": 21539, "epoch": 512} {"train_loss": -5.289746284484863, "global_step": 21540, "epoch": 512} {"train_loss": -5.28075647354126, "global_step": 21541, "epoch": 512} {"train_loss": -5.382596969604492, "global_step": 21542, "epoch": 512} {"train_loss": -5.328485488891602, "global_step": 21543, "epoch": 512} {"train_loss": -5.461479663848877, "global_step": 21544, "epoch": 512} {"train_loss": -5.332580305281139, "global_step": 21545, "epoch": 512, "val_loss": 68856.2265625} {"train_loss": -5.268834114074707, "global_step": 21546, "epoch": 513} {"train_loss": -5.322834491729736, "global_step": 21547, "epoch": 513} {"train_loss": -5.2534966468811035, "global_step": 21548, "epoch": 513} {"train_loss": -5.457376480102539, "global_step": 21549, "epoch": 513} {"train_loss": -5.411043167114258, "global_step": 21550, "epoch": 513} {"train_loss": -5.153087615966797, "global_step": 21551, "epoch": 513} {"train_loss": -5.23016357421875, "global_step": 21552, "epoch": 513} {"train_loss": -5.43348503112793, "global_step": 21553, "epoch": 513} {"train_loss": -5.433529853820801, "global_step": 21554, "epoch": 513} {"train_loss": -5.330006122589111, "global_step": 21555, "epoch": 513} {"train_loss": -5.395059108734131, "global_step": 21556, "epoch": 513} {"train_loss": -5.317043304443359, "global_step": 21557, "epoch": 513} {"train_loss": -5.457452774047852, "global_step": 21558, "epoch": 513} {"train_loss": -5.500441551208496, "global_step": 21559, "epoch": 513} {"train_loss": -5.3768205642700195, "global_step": 21560, "epoch": 513} {"train_loss": -5.326248645782471, "global_step": 21561, "epoch": 513} {"train_loss": -5.354267597198486, "global_step": 21562, "epoch": 513} {"train_loss": -5.17333459854126, "global_step": 21563, "epoch": 513} {"train_loss": -5.422071933746338, "global_step": 21564, "epoch": 513} {"train_loss": -5.301044940948486, "global_step": 21565, "epoch": 513} {"train_loss": -5.530531883239746, "global_step": 21566, "epoch": 513} {"train_loss": -5.448835849761963, "global_step": 21567, "epoch": 513} {"train_loss": -5.2635722160339355, "global_step": 21568, "epoch": 513} {"train_loss": -5.433385848999023, "global_step": 21569, "epoch": 513} {"train_loss": -5.3779191970825195, "global_step": 21570, "epoch": 513} {"train_loss": -5.208512783050537, "global_step": 21571, "epoch": 513} {"train_loss": -5.363707065582275, "global_step": 21572, "epoch": 513} {"train_loss": -5.468940734863281, "global_step": 21573, "epoch": 513} {"train_loss": -5.281315326690674, "global_step": 21574, "epoch": 513} {"train_loss": -5.324621677398682, "global_step": 21575, "epoch": 513} {"train_loss": -5.362668037414551, "global_step": 21576, "epoch": 513} {"train_loss": -5.258332252502441, "global_step": 21577, "epoch": 513} {"train_loss": -5.2326154708862305, "global_step": 21578, "epoch": 513} {"train_loss": -5.359045505523682, "global_step": 21579, "epoch": 513} {"train_loss": -5.294531345367432, "global_step": 21580, "epoch": 513} {"train_loss": -5.328960418701172, "global_step": 21581, "epoch": 513} {"train_loss": -5.3341474533081055, "global_step": 21582, "epoch": 513} {"train_loss": -5.367914199829102, "global_step": 21583, "epoch": 513} {"train_loss": -5.4236555099487305, "global_step": 21584, "epoch": 513} {"train_loss": -5.382760047912598, "global_step": 21585, "epoch": 513} {"train_loss": -5.435318946838379, "global_step": 21586, "epoch": 513} {"train_loss": -5.350246542976016, "global_step": 21587, "epoch": 513, "val_loss": 68440.890625} {"train_loss": -5.389996528625488, "global_step": 21588, "epoch": 514} {"train_loss": -5.571459770202637, "global_step": 21589, "epoch": 514} {"train_loss": -5.417333602905273, "global_step": 21590, "epoch": 514} {"train_loss": -5.367183208465576, "global_step": 21591, "epoch": 514} {"train_loss": -5.170419216156006, "global_step": 21592, "epoch": 514} {"train_loss": -5.316119194030762, "global_step": 21593, "epoch": 514} {"train_loss": -5.180688858032227, "global_step": 21594, "epoch": 514} {"train_loss": -5.3374528884887695, "global_step": 21595, "epoch": 514} {"train_loss": -5.333008766174316, "global_step": 21596, "epoch": 514} {"train_loss": -5.155452251434326, "global_step": 21597, "epoch": 514} {"train_loss": -5.339804172515869, "global_step": 21598, "epoch": 514} {"train_loss": -5.34608793258667, "global_step": 21599, "epoch": 514} {"train_loss": -5.395199298858643, "global_step": 21600, "epoch": 514} {"train_loss": -5.421130657196045, "global_step": 21601, "epoch": 514} {"train_loss": -5.235440731048584, "global_step": 21602, "epoch": 514} {"train_loss": -5.417956352233887, "global_step": 21603, "epoch": 514} {"train_loss": -5.418538570404053, "global_step": 21604, "epoch": 514} {"train_loss": -5.339590549468994, "global_step": 21605, "epoch": 514} {"train_loss": -5.410079002380371, "global_step": 21606, "epoch": 514} {"train_loss": -5.383315563201904, "global_step": 21607, "epoch": 514} {"train_loss": -5.315289497375488, "global_step": 21608, "epoch": 514} {"train_loss": -5.442861557006836, "global_step": 21609, "epoch": 514} {"train_loss": -5.2787675857543945, "global_step": 21610, "epoch": 514} {"train_loss": -5.348116874694824, "global_step": 21611, "epoch": 514} {"train_loss": -5.206277370452881, "global_step": 21612, "epoch": 514} {"train_loss": -5.367948532104492, "global_step": 21613, "epoch": 514} {"train_loss": -5.3998003005981445, "global_step": 21614, "epoch": 514} {"train_loss": -5.292681694030762, "global_step": 21615, "epoch": 514} {"train_loss": -5.446197509765625, "global_step": 21616, "epoch": 514} {"train_loss": -5.362882614135742, "global_step": 21617, "epoch": 514} {"train_loss": -5.362214088439941, "global_step": 21618, "epoch": 514} {"train_loss": -5.3014726638793945, "global_step": 21619, "epoch": 514} {"train_loss": -5.468352317810059, "global_step": 21620, "epoch": 514} {"train_loss": -5.328612327575684, "global_step": 21621, "epoch": 514} {"train_loss": -5.286978721618652, "global_step": 21622, "epoch": 514} {"train_loss": -5.3102617263793945, "global_step": 21623, "epoch": 514} {"train_loss": -5.243748664855957, "global_step": 21624, "epoch": 514} {"train_loss": -5.234745502471924, "global_step": 21625, "epoch": 514} {"train_loss": -5.314091682434082, "global_step": 21626, "epoch": 514} {"train_loss": -5.389181613922119, "global_step": 21627, "epoch": 514} {"train_loss": -5.279706001281738, "global_step": 21628, "epoch": 514} {"train_loss": -5.337392693474179, "global_step": 21629, "epoch": 514, "val_loss": 68395.1484375} {"train_loss": -5.42369270324707, "global_step": 21630, "epoch": 515} {"train_loss": -5.451926231384277, "global_step": 21631, "epoch": 515} {"train_loss": -5.2133026123046875, "global_step": 21632, "epoch": 515} {"train_loss": -5.3826751708984375, "global_step": 21633, "epoch": 515} {"train_loss": -5.42164421081543, "global_step": 21634, "epoch": 515} {"train_loss": -5.393721580505371, "global_step": 21635, "epoch": 515} {"train_loss": -5.376127243041992, "global_step": 21636, "epoch": 515} {"train_loss": -5.335507392883301, "global_step": 21637, "epoch": 515} {"train_loss": -5.378484725952148, "global_step": 21638, "epoch": 515} {"train_loss": -5.4598388671875, "global_step": 21639, "epoch": 515} {"train_loss": -5.323003768920898, "global_step": 21640, "epoch": 515} {"train_loss": -5.335465431213379, "global_step": 21641, "epoch": 515} {"train_loss": -5.303378582000732, "global_step": 21642, "epoch": 515} {"train_loss": -5.410333633422852, "global_step": 21643, "epoch": 515} {"train_loss": -5.360788345336914, "global_step": 21644, "epoch": 515} {"train_loss": -5.424506187438965, "global_step": 21645, "epoch": 515} {"train_loss": -5.217641830444336, "global_step": 21646, "epoch": 515} {"train_loss": -5.337569713592529, "global_step": 21647, "epoch": 515} {"train_loss": -5.4939703941345215, "global_step": 21648, "epoch": 515} {"train_loss": -5.249482154846191, "global_step": 21649, "epoch": 515} {"train_loss": -5.21645450592041, "global_step": 21650, "epoch": 515} {"train_loss": -5.294363498687744, "global_step": 21651, "epoch": 515} {"train_loss": -5.3360137939453125, "global_step": 21652, "epoch": 515} {"train_loss": -5.292977333068848, "global_step": 21653, "epoch": 515} {"train_loss": -5.462111949920654, "global_step": 21654, "epoch": 515} {"train_loss": -5.203280448913574, "global_step": 21655, "epoch": 515} {"train_loss": -5.195039749145508, "global_step": 21656, "epoch": 515} {"train_loss": -5.358822822570801, "global_step": 21657, "epoch": 515} {"train_loss": -5.380380153656006, "global_step": 21658, "epoch": 515} {"train_loss": -5.160719871520996, "global_step": 21659, "epoch": 515} {"train_loss": -5.315328598022461, "global_step": 21660, "epoch": 515} {"train_loss": -5.446855068206787, "global_step": 21661, "epoch": 515} {"train_loss": -5.39054536819458, "global_step": 21662, "epoch": 515} {"train_loss": -5.351569175720215, "global_step": 21663, "epoch": 515} {"train_loss": -5.26519250869751, "global_step": 21664, "epoch": 515} {"train_loss": -5.347391605377197, "global_step": 21665, "epoch": 515} {"train_loss": -5.267987251281738, "global_step": 21666, "epoch": 515} {"train_loss": -5.377690315246582, "global_step": 21667, "epoch": 515} {"train_loss": -5.308807373046875, "global_step": 21668, "epoch": 515} {"train_loss": -5.373645782470703, "global_step": 21669, "epoch": 515} {"train_loss": -5.512335300445557, "global_step": 21670, "epoch": 515} {"train_loss": -5.345999297641573, "global_step": 21671, "epoch": 515, "val_loss": 68530.5625} {"train_loss": -5.334444046020508, "global_step": 21672, "epoch": 516} {"train_loss": -5.379127502441406, "global_step": 21673, "epoch": 516} {"train_loss": -5.305042266845703, "global_step": 21674, "epoch": 516} {"train_loss": -5.284612655639648, "global_step": 21675, "epoch": 516} {"train_loss": -5.373113632202148, "global_step": 21676, "epoch": 516} {"train_loss": -5.426680088043213, "global_step": 21677, "epoch": 516} {"train_loss": -5.304720878601074, "global_step": 21678, "epoch": 516} {"train_loss": -5.39546012878418, "global_step": 21679, "epoch": 516} {"train_loss": -5.365070343017578, "global_step": 21680, "epoch": 516} {"train_loss": -5.366142272949219, "global_step": 21681, "epoch": 516} {"train_loss": -5.359633445739746, "global_step": 21682, "epoch": 516} {"train_loss": -5.362975120544434, "global_step": 21683, "epoch": 516} {"train_loss": -5.36834716796875, "global_step": 21684, "epoch": 516} {"train_loss": -5.328145980834961, "global_step": 21685, "epoch": 516} {"train_loss": -5.37680196762085, "global_step": 21686, "epoch": 516} {"train_loss": -5.3588361740112305, "global_step": 21687, "epoch": 516} {"train_loss": -5.3744306564331055, "global_step": 21688, "epoch": 516} {"train_loss": -5.220397472381592, "global_step": 21689, "epoch": 516} {"train_loss": -5.318446159362793, "global_step": 21690, "epoch": 516} {"train_loss": -5.467426300048828, "global_step": 21691, "epoch": 516} {"train_loss": -5.386008262634277, "global_step": 21692, "epoch": 516} {"train_loss": -5.387824058532715, "global_step": 21693, "epoch": 516} {"train_loss": -5.3474931716918945, "global_step": 21694, "epoch": 516} {"train_loss": -5.321341514587402, "global_step": 21695, "epoch": 516} {"train_loss": -5.381833076477051, "global_step": 21696, "epoch": 516} {"train_loss": -5.32009744644165, "global_step": 21697, "epoch": 516} {"train_loss": -5.408321857452393, "global_step": 21698, "epoch": 516} {"train_loss": -5.3856964111328125, "global_step": 21699, "epoch": 516} {"train_loss": -5.475584983825684, "global_step": 21700, "epoch": 516} {"train_loss": -5.262346267700195, "global_step": 21701, "epoch": 516} {"train_loss": -5.250604629516602, "global_step": 21702, "epoch": 516} {"train_loss": -5.259373188018799, "global_step": 21703, "epoch": 516} {"train_loss": -5.245699882507324, "global_step": 21704, "epoch": 516} {"train_loss": -5.208598613739014, "global_step": 21705, "epoch": 516} {"train_loss": -5.369403839111328, "global_step": 21706, "epoch": 516} {"train_loss": -5.249664306640625, "global_step": 21707, "epoch": 516} {"train_loss": -5.461361885070801, "global_step": 21708, "epoch": 516} {"train_loss": -5.226193904876709, "global_step": 21709, "epoch": 516} {"train_loss": -5.386940002441406, "global_step": 21710, "epoch": 516} {"train_loss": -5.340989112854004, "global_step": 21711, "epoch": 516} {"train_loss": -5.380500793457031, "global_step": 21712, "epoch": 516} {"train_loss": -5.346929027920678, "global_step": 21713, "epoch": 516, "val_loss": 68837.1171875} {"train_loss": -5.242064476013184, "global_step": 21714, "epoch": 517} {"train_loss": -5.229861736297607, "global_step": 21715, "epoch": 517} {"train_loss": -5.346808433532715, "global_step": 21716, "epoch": 517} {"train_loss": -5.4126176834106445, "global_step": 21717, "epoch": 517} {"train_loss": -5.338563442230225, "global_step": 21718, "epoch": 517} {"train_loss": -5.270781517028809, "global_step": 21719, "epoch": 517} {"train_loss": -5.207169532775879, "global_step": 21720, "epoch": 517} {"train_loss": -5.381059646606445, "global_step": 21721, "epoch": 517} {"train_loss": -5.345998764038086, "global_step": 21722, "epoch": 517} {"train_loss": -5.314123153686523, "global_step": 21723, "epoch": 517} {"train_loss": -5.323006629943848, "global_step": 21724, "epoch": 517} {"train_loss": -5.414033889770508, "global_step": 21725, "epoch": 517} {"train_loss": -5.386112213134766, "global_step": 21726, "epoch": 517} {"train_loss": -5.206009864807129, "global_step": 21727, "epoch": 517} {"train_loss": -5.426975250244141, "global_step": 21728, "epoch": 517} {"train_loss": -5.425275802612305, "global_step": 21729, "epoch": 517} {"train_loss": -5.476534843444824, "global_step": 21730, "epoch": 517} {"train_loss": -5.21848201751709, "global_step": 21731, "epoch": 517} {"train_loss": -5.280465126037598, "global_step": 21732, "epoch": 517} {"train_loss": -5.373459339141846, "global_step": 21733, "epoch": 517} {"train_loss": -5.251054286956787, "global_step": 21734, "epoch": 517} {"train_loss": -5.398495674133301, "global_step": 21735, "epoch": 517} {"train_loss": -5.372516632080078, "global_step": 21736, "epoch": 517} {"train_loss": -5.441021919250488, "global_step": 21737, "epoch": 517} {"train_loss": -5.403077125549316, "global_step": 21738, "epoch": 517} {"train_loss": -5.283001899719238, "global_step": 21739, "epoch": 517} {"train_loss": -5.33782958984375, "global_step": 21740, "epoch": 517} {"train_loss": -5.229267120361328, "global_step": 21741, "epoch": 517} {"train_loss": -5.4484052658081055, "global_step": 21742, "epoch": 517} {"train_loss": -5.448028087615967, "global_step": 21743, "epoch": 517} {"train_loss": -5.408761501312256, "global_step": 21744, "epoch": 517} {"train_loss": -5.507900238037109, "global_step": 21745, "epoch": 517} {"train_loss": -5.37509298324585, "global_step": 21746, "epoch": 517} {"train_loss": -5.3696370124816895, "global_step": 21747, "epoch": 517} {"train_loss": -5.387182235717773, "global_step": 21748, "epoch": 517} {"train_loss": -5.244944095611572, "global_step": 21749, "epoch": 517} {"train_loss": -5.516095161437988, "global_step": 21750, "epoch": 517} {"train_loss": -5.112326622009277, "global_step": 21751, "epoch": 517} {"train_loss": -5.30279541015625, "global_step": 21752, "epoch": 517} {"train_loss": -5.539855003356934, "global_step": 21753, "epoch": 517} {"train_loss": -5.224010467529297, "global_step": 21754, "epoch": 517} {"train_loss": -5.345128717876616, "global_step": 21755, "epoch": 517, "val_loss": 68246.2109375} {"train_loss": -5.320521354675293, "global_step": 21756, "epoch": 518} {"train_loss": -5.181781768798828, "global_step": 21757, "epoch": 518} {"train_loss": -5.192251205444336, "global_step": 21758, "epoch": 518} {"train_loss": -5.17262601852417, "global_step": 21759, "epoch": 518} {"train_loss": -5.135321140289307, "global_step": 21760, "epoch": 518} {"train_loss": -5.353781223297119, "global_step": 21761, "epoch": 518} {"train_loss": -5.267612457275391, "global_step": 21762, "epoch": 518} {"train_loss": -5.339125633239746, "global_step": 21763, "epoch": 518} {"train_loss": -5.278962135314941, "global_step": 21764, "epoch": 518} {"train_loss": -5.181997299194336, "global_step": 21765, "epoch": 518} {"train_loss": -5.22440767288208, "global_step": 21766, "epoch": 518} {"train_loss": -5.281726837158203, "global_step": 21767, "epoch": 518} {"train_loss": -5.454169750213623, "global_step": 21768, "epoch": 518} {"train_loss": -5.2406768798828125, "global_step": 21769, "epoch": 518} {"train_loss": -5.267508506774902, "global_step": 21770, "epoch": 518} {"train_loss": -5.362443923950195, "global_step": 21771, "epoch": 518} {"train_loss": -5.346017837524414, "global_step": 21772, "epoch": 518} {"train_loss": -5.414682865142822, "global_step": 21773, "epoch": 518} {"train_loss": -5.334368705749512, "global_step": 21774, "epoch": 518} {"train_loss": -5.330798149108887, "global_step": 21775, "epoch": 518} {"train_loss": -5.251097679138184, "global_step": 21776, "epoch": 518} {"train_loss": -5.454922199249268, "global_step": 21777, "epoch": 518} {"train_loss": -5.404303550720215, "global_step": 21778, "epoch": 518} {"train_loss": -5.435122489929199, "global_step": 21779, "epoch": 518} {"train_loss": -5.418518543243408, "global_step": 21780, "epoch": 518} {"train_loss": -5.269496917724609, "global_step": 21781, "epoch": 518} {"train_loss": -5.104942321777344, "global_step": 21782, "epoch": 518} {"train_loss": -5.334710121154785, "global_step": 21783, "epoch": 518} {"train_loss": -5.2865705490112305, "global_step": 21784, "epoch": 518} {"train_loss": -5.429058074951172, "global_step": 21785, "epoch": 518} {"train_loss": -5.288012504577637, "global_step": 21786, "epoch": 518} {"train_loss": -5.324062347412109, "global_step": 21787, "epoch": 518} {"train_loss": -5.357317924499512, "global_step": 21788, "epoch": 518} {"train_loss": -5.455401420593262, "global_step": 21789, "epoch": 518} {"train_loss": -5.38661003112793, "global_step": 21790, "epoch": 518} {"train_loss": -5.305685520172119, "global_step": 21791, "epoch": 518} {"train_loss": -5.281543254852295, "global_step": 21792, "epoch": 518} {"train_loss": -5.2900872230529785, "global_step": 21793, "epoch": 518} {"train_loss": -5.217936038970947, "global_step": 21794, "epoch": 518} {"train_loss": -5.194207191467285, "global_step": 21795, "epoch": 518} {"train_loss": -5.293664932250977, "global_step": 21796, "epoch": 518} {"train_loss": -5.301371540342059, "global_step": 21797, "epoch": 518, "val_loss": 68691.375} {"train_loss": -5.4146199226379395, "global_step": 21798, "epoch": 519} {"train_loss": -5.345507621765137, "global_step": 21799, "epoch": 519} {"train_loss": -5.28372859954834, "global_step": 21800, "epoch": 519} {"train_loss": -5.444492340087891, "global_step": 21801, "epoch": 519} {"train_loss": -5.3605499267578125, "global_step": 21802, "epoch": 519} {"train_loss": -5.300786018371582, "global_step": 21803, "epoch": 519} {"train_loss": -5.357749938964844, "global_step": 21804, "epoch": 519} {"train_loss": -5.294066429138184, "global_step": 21805, "epoch": 519} {"train_loss": -5.236886024475098, "global_step": 21806, "epoch": 519} {"train_loss": -5.2433695793151855, "global_step": 21807, "epoch": 519} {"train_loss": -5.151503086090088, "global_step": 21808, "epoch": 519} {"train_loss": -5.223703861236572, "global_step": 21809, "epoch": 519} {"train_loss": -5.276459693908691, "global_step": 21810, "epoch": 519} {"train_loss": -5.188814163208008, "global_step": 21811, "epoch": 519} {"train_loss": -5.319117546081543, "global_step": 21812, "epoch": 519} {"train_loss": -5.462028503417969, "global_step": 21813, "epoch": 519} {"train_loss": -5.190728187561035, "global_step": 21814, "epoch": 519} {"train_loss": -5.357818603515625, "global_step": 21815, "epoch": 519} {"train_loss": -5.340655326843262, "global_step": 21816, "epoch": 519} {"train_loss": -5.21913480758667, "global_step": 21817, "epoch": 519} {"train_loss": -5.310548782348633, "global_step": 21818, "epoch": 519} {"train_loss": -5.272323131561279, "global_step": 21819, "epoch": 519} {"train_loss": -5.278285980224609, "global_step": 21820, "epoch": 519} {"train_loss": -5.303955078125, "global_step": 21821, "epoch": 519} {"train_loss": -5.28595495223999, "global_step": 21822, "epoch": 519} {"train_loss": -5.234646320343018, "global_step": 21823, "epoch": 519} {"train_loss": -5.343194961547852, "global_step": 21824, "epoch": 519} {"train_loss": -5.222525119781494, "global_step": 21825, "epoch": 519} {"train_loss": -5.376655578613281, "global_step": 21826, "epoch": 519} {"train_loss": -5.230391502380371, "global_step": 21827, "epoch": 519} {"train_loss": -5.349710464477539, "global_step": 21828, "epoch": 519} {"train_loss": -5.3445281982421875, "global_step": 21829, "epoch": 519} {"train_loss": -5.330659866333008, "global_step": 21830, "epoch": 519} {"train_loss": -5.28240966796875, "global_step": 21831, "epoch": 519} {"train_loss": -5.401151180267334, "global_step": 21832, "epoch": 519} {"train_loss": -5.373363971710205, "global_step": 21833, "epoch": 519} {"train_loss": -5.519443511962891, "global_step": 21834, "epoch": 519} {"train_loss": -5.444280624389648, "global_step": 21835, "epoch": 519} {"train_loss": -5.391290664672852, "global_step": 21836, "epoch": 519} {"train_loss": -5.408435821533203, "global_step": 21837, "epoch": 519} {"train_loss": -5.416473388671875, "global_step": 21838, "epoch": 519} {"train_loss": -5.320951745623634, "global_step": 21839, "epoch": 519, "val_loss": 68001.6953125} {"train_loss": -5.4025983810424805, "global_step": 21840, "epoch": 520} {"train_loss": -5.422645568847656, "global_step": 21841, "epoch": 520} {"train_loss": -5.4513397216796875, "global_step": 21842, "epoch": 520} {"train_loss": -5.360342025756836, "global_step": 21843, "epoch": 520} {"train_loss": -5.344491958618164, "global_step": 21844, "epoch": 520} {"train_loss": -5.51681661605835, "global_step": 21845, "epoch": 520} {"train_loss": -5.405566215515137, "global_step": 21846, "epoch": 520} {"train_loss": -5.311896324157715, "global_step": 21847, "epoch": 520} {"train_loss": -5.357362747192383, "global_step": 21848, "epoch": 520} {"train_loss": -5.3536376953125, "global_step": 21849, "epoch": 520} {"train_loss": -5.4834465980529785, "global_step": 21850, "epoch": 520} {"train_loss": -5.427724838256836, "global_step": 21851, "epoch": 520} {"train_loss": -5.405840873718262, "global_step": 21852, "epoch": 520} {"train_loss": -5.363800048828125, "global_step": 21853, "epoch": 520} {"train_loss": -5.404311656951904, "global_step": 21854, "epoch": 520} {"train_loss": -5.403369426727295, "global_step": 21855, "epoch": 520} {"train_loss": -5.322850227355957, "global_step": 21856, "epoch": 520} {"train_loss": -5.33859395980835, "global_step": 21857, "epoch": 520} {"train_loss": -5.509929180145264, "global_step": 21858, "epoch": 520} {"train_loss": -5.403557777404785, "global_step": 21859, "epoch": 520} {"train_loss": -5.223788738250732, "global_step": 21860, "epoch": 520} {"train_loss": -5.448611259460449, "global_step": 21861, "epoch": 520} {"train_loss": -5.321262836456299, "global_step": 21862, "epoch": 520} {"train_loss": -5.345631122589111, "global_step": 21863, "epoch": 520} {"train_loss": -5.265888214111328, "global_step": 21864, "epoch": 520} {"train_loss": -5.239867210388184, "global_step": 21865, "epoch": 520} {"train_loss": -5.318071365356445, "global_step": 21866, "epoch": 520} {"train_loss": -5.384218215942383, "global_step": 21867, "epoch": 520} {"train_loss": -5.436373710632324, "global_step": 21868, "epoch": 520} {"train_loss": -5.2779645919799805, "global_step": 21869, "epoch": 520} {"train_loss": -5.239989280700684, "global_step": 21870, "epoch": 520} {"train_loss": -5.284452438354492, "global_step": 21871, "epoch": 520} {"train_loss": -5.377110004425049, "global_step": 21872, "epoch": 520} {"train_loss": -5.227835655212402, "global_step": 21873, "epoch": 520} {"train_loss": -5.291112899780273, "global_step": 21874, "epoch": 520} {"train_loss": -5.220366477966309, "global_step": 21875, "epoch": 520} {"train_loss": -5.330530643463135, "global_step": 21876, "epoch": 520} {"train_loss": -5.339473247528076, "global_step": 21877, "epoch": 520} {"train_loss": -5.339811325073242, "global_step": 21878, "epoch": 520} {"train_loss": -5.346348285675049, "global_step": 21879, "epoch": 520} {"train_loss": -5.308955192565918, "global_step": 21880, "epoch": 520} {"train_loss": -5.354669843401227, "global_step": 21881, "epoch": 520, "val_loss": 68423.328125} {"train_loss": -5.379604339599609, "global_step": 21882, "epoch": 521} {"train_loss": -5.511102676391602, "global_step": 21883, "epoch": 521} {"train_loss": -5.340784072875977, "global_step": 21884, "epoch": 521} {"train_loss": -5.2290544509887695, "global_step": 21885, "epoch": 521} {"train_loss": -5.38695764541626, "global_step": 21886, "epoch": 521} {"train_loss": -5.381247520446777, "global_step": 21887, "epoch": 521} {"train_loss": -5.299218654632568, "global_step": 21888, "epoch": 521} {"train_loss": -5.271065711975098, "global_step": 21889, "epoch": 521} {"train_loss": -5.4196672439575195, "global_step": 21890, "epoch": 521} {"train_loss": -5.245952129364014, "global_step": 21891, "epoch": 521} {"train_loss": -5.282515525817871, "global_step": 21892, "epoch": 521} {"train_loss": -5.334895133972168, "global_step": 21893, "epoch": 521} {"train_loss": -5.284097194671631, "global_step": 21894, "epoch": 521} {"train_loss": -5.375226974487305, "global_step": 21895, "epoch": 521} {"train_loss": -5.2841901779174805, "global_step": 21896, "epoch": 521} {"train_loss": -5.348278999328613, "global_step": 21897, "epoch": 521} {"train_loss": -5.401350975036621, "global_step": 21898, "epoch": 521} {"train_loss": -5.373213768005371, "global_step": 21899, "epoch": 521} {"train_loss": -5.272651195526123, "global_step": 21900, "epoch": 521} {"train_loss": -5.32173490524292, "global_step": 21901, "epoch": 521} {"train_loss": -5.3925018310546875, "global_step": 21902, "epoch": 521} {"train_loss": -5.310856819152832, "global_step": 21903, "epoch": 521} {"train_loss": -5.27503776550293, "global_step": 21904, "epoch": 521} {"train_loss": -5.306834697723389, "global_step": 21905, "epoch": 521} {"train_loss": -5.237723350524902, "global_step": 21906, "epoch": 521} {"train_loss": -5.436562538146973, "global_step": 21907, "epoch": 521} {"train_loss": -5.334004878997803, "global_step": 21908, "epoch": 521} {"train_loss": -5.370548725128174, "global_step": 21909, "epoch": 521} {"train_loss": -5.2372026443481445, "global_step": 21910, "epoch": 521} {"train_loss": -5.299557209014893, "global_step": 21911, "epoch": 521} {"train_loss": -5.257093906402588, "global_step": 21912, "epoch": 521} {"train_loss": -5.384398460388184, "global_step": 21913, "epoch": 521} {"train_loss": -5.273185729980469, "global_step": 21914, "epoch": 521} {"train_loss": -5.267213344573975, "global_step": 21915, "epoch": 521} {"train_loss": -5.407891273498535, "global_step": 21916, "epoch": 521} {"train_loss": -5.193280220031738, "global_step": 21917, "epoch": 521} {"train_loss": -5.308488845825195, "global_step": 21918, "epoch": 521} {"train_loss": -5.124320983886719, "global_step": 21919, "epoch": 521} {"train_loss": -5.338691711425781, "global_step": 21920, "epoch": 521} {"train_loss": -5.385085105895996, "global_step": 21921, "epoch": 521} {"train_loss": -5.350335121154785, "global_step": 21922, "epoch": 521} {"train_loss": -5.323742060434251, "global_step": 21923, "epoch": 521, "val_loss": 68562.875} {"train_loss": -5.2315287590026855, "global_step": 21924, "epoch": 522} {"train_loss": -5.360828399658203, "global_step": 21925, "epoch": 522} {"train_loss": -5.2170915603637695, "global_step": 21926, "epoch": 522} {"train_loss": -5.281552314758301, "global_step": 21927, "epoch": 522} {"train_loss": -5.536995887756348, "global_step": 21928, "epoch": 522} {"train_loss": -5.2543182373046875, "global_step": 21929, "epoch": 522} {"train_loss": -5.3035993576049805, "global_step": 21930, "epoch": 522} {"train_loss": -5.30933952331543, "global_step": 21931, "epoch": 522} {"train_loss": -5.337498188018799, "global_step": 21932, "epoch": 522} {"train_loss": -5.276625633239746, "global_step": 21933, "epoch": 522} {"train_loss": -5.36100435256958, "global_step": 21934, "epoch": 522} {"train_loss": -5.285053253173828, "global_step": 21935, "epoch": 522} {"train_loss": -5.2653069496154785, "global_step": 21936, "epoch": 522} {"train_loss": -5.329720973968506, "global_step": 21937, "epoch": 522} {"train_loss": -5.2934980392456055, "global_step": 21938, "epoch": 522} {"train_loss": -5.3028364181518555, "global_step": 21939, "epoch": 522} {"train_loss": -5.285772323608398, "global_step": 21940, "epoch": 522} {"train_loss": -5.253864288330078, "global_step": 21941, "epoch": 522} {"train_loss": -5.283014297485352, "global_step": 21942, "epoch": 522} {"train_loss": -5.156414985656738, "global_step": 21943, "epoch": 522} {"train_loss": -5.257392406463623, "global_step": 21944, "epoch": 522} {"train_loss": -5.395179748535156, "global_step": 21945, "epoch": 522} {"train_loss": -5.267969608306885, "global_step": 21946, "epoch": 522} {"train_loss": -5.346243858337402, "global_step": 21947, "epoch": 522} {"train_loss": -5.371722221374512, "global_step": 21948, "epoch": 522} {"train_loss": -5.4486894607543945, "global_step": 21949, "epoch": 522} {"train_loss": -5.4452433586120605, "global_step": 21950, "epoch": 522} {"train_loss": -5.353633880615234, "global_step": 21951, "epoch": 522} {"train_loss": -5.327191352844238, "global_step": 21952, "epoch": 522} {"train_loss": -5.293399810791016, "global_step": 21953, "epoch": 522} {"train_loss": -5.2221598625183105, "global_step": 21954, "epoch": 522} {"train_loss": -5.266598224639893, "global_step": 21955, "epoch": 522} {"train_loss": -5.379308700561523, "global_step": 21956, "epoch": 522} {"train_loss": -5.466200828552246, "global_step": 21957, "epoch": 522} {"train_loss": -5.401559829711914, "global_step": 21958, "epoch": 522} {"train_loss": -5.601067543029785, "global_step": 21959, "epoch": 522} {"train_loss": -5.257923126220703, "global_step": 21960, "epoch": 522} {"train_loss": -5.259115219116211, "global_step": 21961, "epoch": 522} {"train_loss": -5.443523406982422, "global_step": 21962, "epoch": 522} {"train_loss": -5.201478958129883, "global_step": 21963, "epoch": 522} {"train_loss": -5.415583610534668, "global_step": 21964, "epoch": 522} {"train_loss": -5.327752805891491, "global_step": 21965, "epoch": 522, "val_loss": 68220.6171875} {"train_loss": -5.262083053588867, "global_step": 21966, "epoch": 523} {"train_loss": -5.279922008514404, "global_step": 21967, "epoch": 523} {"train_loss": -5.320488929748535, "global_step": 21968, "epoch": 523} {"train_loss": -5.338632583618164, "global_step": 21969, "epoch": 523} {"train_loss": -5.277170658111572, "global_step": 21970, "epoch": 523} {"train_loss": -5.342350006103516, "global_step": 21971, "epoch": 523} {"train_loss": -5.3744683265686035, "global_step": 21972, "epoch": 523} {"train_loss": -5.377507209777832, "global_step": 21973, "epoch": 523} {"train_loss": -5.273395538330078, "global_step": 21974, "epoch": 523} {"train_loss": -5.378843307495117, "global_step": 21975, "epoch": 523} {"train_loss": -5.438597679138184, "global_step": 21976, "epoch": 523} {"train_loss": -5.295759677886963, "global_step": 21977, "epoch": 523} {"train_loss": -5.296099662780762, "global_step": 21978, "epoch": 523} {"train_loss": -5.296995162963867, "global_step": 21979, "epoch": 523} {"train_loss": -5.446443557739258, "global_step": 21980, "epoch": 523} {"train_loss": -5.294203758239746, "global_step": 21981, "epoch": 523} {"train_loss": -5.4415507316589355, "global_step": 21982, "epoch": 523} {"train_loss": -5.320099830627441, "global_step": 21983, "epoch": 523} {"train_loss": -5.443383693695068, "global_step": 21984, "epoch": 523} {"train_loss": -5.3961873054504395, "global_step": 21985, "epoch": 523} {"train_loss": -5.264008522033691, "global_step": 21986, "epoch": 523} {"train_loss": -5.340926170349121, "global_step": 21987, "epoch": 523} {"train_loss": -5.432826042175293, "global_step": 21988, "epoch": 523} {"train_loss": -5.295044422149658, "global_step": 21989, "epoch": 523} {"train_loss": -5.362795352935791, "global_step": 21990, "epoch": 523} {"train_loss": -5.372265338897705, "global_step": 21991, "epoch": 523} {"train_loss": -5.384641170501709, "global_step": 21992, "epoch": 523} {"train_loss": -5.374964237213135, "global_step": 21993, "epoch": 523} {"train_loss": -5.486004829406738, "global_step": 21994, "epoch": 523} {"train_loss": -5.385806083679199, "global_step": 21995, "epoch": 523} {"train_loss": -5.371730804443359, "global_step": 21996, "epoch": 523} {"train_loss": -5.2091827392578125, "global_step": 21997, "epoch": 523} {"train_loss": -5.3055949211120605, "global_step": 21998, "epoch": 523} {"train_loss": -5.26379919052124, "global_step": 21999, "epoch": 523} {"train_loss": -5.284383773803711, "global_step": 22000, "epoch": 523} {"train_loss": -5.313612937927246, "global_step": 22001, "epoch": 523} {"train_loss": -5.373414516448975, "global_step": 22002, "epoch": 523} {"train_loss": -5.339819431304932, "global_step": 22003, "epoch": 523} {"train_loss": -5.290617942810059, "global_step": 22004, "epoch": 523} {"train_loss": -5.380769729614258, "global_step": 22005, "epoch": 523} {"train_loss": -5.426916599273682, "global_step": 22006, "epoch": 523} {"train_loss": -5.343281768617176, "global_step": 22007, "epoch": 523, "val_loss": 68333.96875} {"train_loss": -5.363058090209961, "global_step": 22008, "epoch": 524} {"train_loss": -5.385143280029297, "global_step": 22009, "epoch": 524} {"train_loss": -5.428847312927246, "global_step": 22010, "epoch": 524} {"train_loss": -5.306568622589111, "global_step": 22011, "epoch": 524} {"train_loss": -5.466785907745361, "global_step": 22012, "epoch": 524} {"train_loss": -5.3815016746521, "global_step": 22013, "epoch": 524} {"train_loss": -5.266171455383301, "global_step": 22014, "epoch": 524} {"train_loss": -5.463679313659668, "global_step": 22015, "epoch": 524} {"train_loss": -5.3233842849731445, "global_step": 22016, "epoch": 524} {"train_loss": -5.384522438049316, "global_step": 22017, "epoch": 524} {"train_loss": -5.379925727844238, "global_step": 22018, "epoch": 524} {"train_loss": -5.329489707946777, "global_step": 22019, "epoch": 524} {"train_loss": -5.35408878326416, "global_step": 22020, "epoch": 524} {"train_loss": -5.414809703826904, "global_step": 22021, "epoch": 524} {"train_loss": -5.377572536468506, "global_step": 22022, "epoch": 524} {"train_loss": -5.2325263023376465, "global_step": 22023, "epoch": 524} {"train_loss": -5.3945207595825195, "global_step": 22024, "epoch": 524} {"train_loss": -5.3442463874816895, "global_step": 22025, "epoch": 524} {"train_loss": -5.345521450042725, "global_step": 22026, "epoch": 524} {"train_loss": -5.289870262145996, "global_step": 22027, "epoch": 524} {"train_loss": -5.4355788230896, "global_step": 22028, "epoch": 524} {"train_loss": -5.404802322387695, "global_step": 22029, "epoch": 524} {"train_loss": -5.237339019775391, "global_step": 22030, "epoch": 524} {"train_loss": -5.412559509277344, "global_step": 22031, "epoch": 524} {"train_loss": -5.397457122802734, "global_step": 22032, "epoch": 524} {"train_loss": -5.388605117797852, "global_step": 22033, "epoch": 524} {"train_loss": -5.415850639343262, "global_step": 22034, "epoch": 524} {"train_loss": -5.348487854003906, "global_step": 22035, "epoch": 524} {"train_loss": -5.32463264465332, "global_step": 22036, "epoch": 524} {"train_loss": -5.324078559875488, "global_step": 22037, "epoch": 524} {"train_loss": -5.535665988922119, "global_step": 22038, "epoch": 524} {"train_loss": -5.278626441955566, "global_step": 22039, "epoch": 524} {"train_loss": -5.345413684844971, "global_step": 22040, "epoch": 524} {"train_loss": -5.25518274307251, "global_step": 22041, "epoch": 524} {"train_loss": -5.192677021026611, "global_step": 22042, "epoch": 524} {"train_loss": -5.158633708953857, "global_step": 22043, "epoch": 524} {"train_loss": -5.2689127922058105, "global_step": 22044, "epoch": 524} {"train_loss": -5.128900527954102, "global_step": 22045, "epoch": 524} {"train_loss": -5.138181686401367, "global_step": 22046, "epoch": 524} {"train_loss": -5.267589092254639, "global_step": 22047, "epoch": 524} {"train_loss": -5.152165412902832, "global_step": 22048, "epoch": 524} {"train_loss": -5.330532459985642, "global_step": 22049, "epoch": 524, "val_loss": 69639.0859375} {"train_loss": -5.157818794250488, "global_step": 22050, "epoch": 525} {"train_loss": -5.391578197479248, "global_step": 22051, "epoch": 525} {"train_loss": -5.289462089538574, "global_step": 22052, "epoch": 525} {"train_loss": -5.249761581420898, "global_step": 22053, "epoch": 525} {"train_loss": -5.323332786560059, "global_step": 22054, "epoch": 525} {"train_loss": -5.3174896240234375, "global_step": 22055, "epoch": 525} {"train_loss": -5.193504810333252, "global_step": 22056, "epoch": 525} {"train_loss": -5.239125728607178, "global_step": 22057, "epoch": 525} {"train_loss": -5.259367942810059, "global_step": 22058, "epoch": 525} {"train_loss": -5.421917915344238, "global_step": 22059, "epoch": 525} {"train_loss": -5.300869941711426, "global_step": 22060, "epoch": 525} {"train_loss": -5.344002723693848, "global_step": 22061, "epoch": 525} {"train_loss": -5.162967681884766, "global_step": 22062, "epoch": 525} {"train_loss": -5.3170061111450195, "global_step": 22063, "epoch": 525} {"train_loss": -5.381471157073975, "global_step": 22064, "epoch": 525} {"train_loss": -5.31768798828125, "global_step": 22065, "epoch": 525} {"train_loss": -5.364588260650635, "global_step": 22066, "epoch": 525} {"train_loss": -5.273204326629639, "global_step": 22067, "epoch": 525} {"train_loss": -5.39030122756958, "global_step": 22068, "epoch": 525} {"train_loss": -5.3166422843933105, "global_step": 22069, "epoch": 525} {"train_loss": -5.33638858795166, "global_step": 22070, "epoch": 525} {"train_loss": -5.296687126159668, "global_step": 22071, "epoch": 525} {"train_loss": -5.329320430755615, "global_step": 22072, "epoch": 525} {"train_loss": -5.436703681945801, "global_step": 22073, "epoch": 525} {"train_loss": -5.139138221740723, "global_step": 22074, "epoch": 525} {"train_loss": -5.409553050994873, "global_step": 22075, "epoch": 525} {"train_loss": -5.368649959564209, "global_step": 22076, "epoch": 525} {"train_loss": -5.3818254470825195, "global_step": 22077, "epoch": 525} {"train_loss": -5.506731986999512, "global_step": 22078, "epoch": 525} {"train_loss": -5.355584144592285, "global_step": 22079, "epoch": 525} {"train_loss": -5.3665266036987305, "global_step": 22080, "epoch": 525} {"train_loss": -5.272250175476074, "global_step": 22081, "epoch": 525} {"train_loss": -5.347678184509277, "global_step": 22082, "epoch": 525} {"train_loss": -5.414695739746094, "global_step": 22083, "epoch": 525} {"train_loss": -5.2838454246521, "global_step": 22084, "epoch": 525} {"train_loss": -5.340909957885742, "global_step": 22085, "epoch": 525} {"train_loss": -5.353611469268799, "global_step": 22086, "epoch": 525} {"train_loss": -5.252519607543945, "global_step": 22087, "epoch": 525} {"train_loss": -5.264566421508789, "global_step": 22088, "epoch": 525} {"train_loss": -5.1971635818481445, "global_step": 22089, "epoch": 525} {"train_loss": -5.108349800109863, "global_step": 22090, "epoch": 525} {"train_loss": -5.312093712034679, "global_step": 22091, "epoch": 525, "val_loss": 69176.828125} {"train_loss": -5.303860664367676, "global_step": 22092, "epoch": 526} {"train_loss": -5.350743293762207, "global_step": 22093, "epoch": 526} {"train_loss": -5.2304487228393555, "global_step": 22094, "epoch": 526} {"train_loss": -5.499652862548828, "global_step": 22095, "epoch": 526} {"train_loss": -5.278670310974121, "global_step": 22096, "epoch": 526} {"train_loss": -5.375881195068359, "global_step": 22097, "epoch": 526} {"train_loss": -5.316918849945068, "global_step": 22098, "epoch": 526} {"train_loss": -5.300769329071045, "global_step": 22099, "epoch": 526} {"train_loss": -5.399958610534668, "global_step": 22100, "epoch": 526} {"train_loss": -5.350175857543945, "global_step": 22101, "epoch": 526} {"train_loss": -5.340834617614746, "global_step": 22102, "epoch": 526} {"train_loss": -5.216894149780273, "global_step": 22103, "epoch": 526} {"train_loss": -5.3598480224609375, "global_step": 22104, "epoch": 526} {"train_loss": -5.313818454742432, "global_step": 22105, "epoch": 526} {"train_loss": -5.451430797576904, "global_step": 22106, "epoch": 526} {"train_loss": -5.377666473388672, "global_step": 22107, "epoch": 526} {"train_loss": -5.419711112976074, "global_step": 22108, "epoch": 526} {"train_loss": -5.417581558227539, "global_step": 22109, "epoch": 526} {"train_loss": -5.338648796081543, "global_step": 22110, "epoch": 526} {"train_loss": -5.294533729553223, "global_step": 22111, "epoch": 526} {"train_loss": -5.368500709533691, "global_step": 22112, "epoch": 526} {"train_loss": -5.269433975219727, "global_step": 22113, "epoch": 526} {"train_loss": -5.294308185577393, "global_step": 22114, "epoch": 526} {"train_loss": -5.442227840423584, "global_step": 22115, "epoch": 526} {"train_loss": -5.438053131103516, "global_step": 22116, "epoch": 526} {"train_loss": -5.4634623527526855, "global_step": 22117, "epoch": 526} {"train_loss": -5.433548450469971, "global_step": 22118, "epoch": 526} {"train_loss": -5.2789788246154785, "global_step": 22119, "epoch": 526} {"train_loss": -5.128108024597168, "global_step": 22120, "epoch": 526} {"train_loss": -5.317191123962402, "global_step": 22121, "epoch": 526} {"train_loss": -5.313220977783203, "global_step": 22122, "epoch": 526} {"train_loss": -5.3620452880859375, "global_step": 22123, "epoch": 526} {"train_loss": -5.368241310119629, "global_step": 22124, "epoch": 526} {"train_loss": -5.405566215515137, "global_step": 22125, "epoch": 526} {"train_loss": -5.4290666580200195, "global_step": 22126, "epoch": 526} {"train_loss": -5.367170333862305, "global_step": 22127, "epoch": 526} {"train_loss": -5.428318977355957, "global_step": 22128, "epoch": 526} {"train_loss": -5.429538249969482, "global_step": 22129, "epoch": 526} {"train_loss": -5.436929702758789, "global_step": 22130, "epoch": 526} {"train_loss": -5.337803840637207, "global_step": 22131, "epoch": 526} {"train_loss": -5.5095977783203125, "global_step": 22132, "epoch": 526} {"train_loss": -5.361412672769456, "global_step": 22133, "epoch": 526, "val_loss": 68008.71875} {"train_loss": -5.424985885620117, "global_step": 22134, "epoch": 527} {"train_loss": -5.32131290435791, "global_step": 22135, "epoch": 527} {"train_loss": -5.2587080001831055, "global_step": 22136, "epoch": 527} {"train_loss": -5.510466575622559, "global_step": 22137, "epoch": 527} {"train_loss": -5.300127983093262, "global_step": 22138, "epoch": 527} {"train_loss": -5.362831115722656, "global_step": 22139, "epoch": 527} {"train_loss": -5.473121643066406, "global_step": 22140, "epoch": 527} {"train_loss": -5.338666915893555, "global_step": 22141, "epoch": 527} {"train_loss": -5.269166946411133, "global_step": 22142, "epoch": 527} {"train_loss": -5.293648719787598, "global_step": 22143, "epoch": 527} {"train_loss": -5.33945894241333, "global_step": 22144, "epoch": 527} {"train_loss": -5.244252681732178, "global_step": 22145, "epoch": 527} {"train_loss": -5.321239471435547, "global_step": 22146, "epoch": 527} {"train_loss": -5.411474704742432, "global_step": 22147, "epoch": 527} {"train_loss": -5.363223075866699, "global_step": 22148, "epoch": 527} {"train_loss": -5.192385196685791, "global_step": 22149, "epoch": 527} {"train_loss": -5.4228105545043945, "global_step": 22150, "epoch": 527} {"train_loss": -5.264688014984131, "global_step": 22151, "epoch": 527} {"train_loss": -5.3748931884765625, "global_step": 22152, "epoch": 527} {"train_loss": -5.389291763305664, "global_step": 22153, "epoch": 527} {"train_loss": -5.301836013793945, "global_step": 22154, "epoch": 527} {"train_loss": -5.284529685974121, "global_step": 22155, "epoch": 527} {"train_loss": -5.3733367919921875, "global_step": 22156, "epoch": 527} {"train_loss": -5.268980979919434, "global_step": 22157, "epoch": 527} {"train_loss": -5.264012813568115, "global_step": 22158, "epoch": 527} {"train_loss": -5.323491096496582, "global_step": 22159, "epoch": 527} {"train_loss": -5.131980895996094, "global_step": 22160, "epoch": 527} {"train_loss": -5.269315719604492, "global_step": 22161, "epoch": 527} {"train_loss": -5.407496452331543, "global_step": 22162, "epoch": 527} {"train_loss": -5.415820598602295, "global_step": 22163, "epoch": 527} {"train_loss": -5.38402795791626, "global_step": 22164, "epoch": 527} {"train_loss": -5.4566264152526855, "global_step": 22165, "epoch": 527} {"train_loss": -5.469788074493408, "global_step": 22166, "epoch": 527} {"train_loss": -5.400263786315918, "global_step": 22167, "epoch": 527} {"train_loss": -5.32022762298584, "global_step": 22168, "epoch": 527} {"train_loss": -5.407680988311768, "global_step": 22169, "epoch": 527} {"train_loss": -5.338136196136475, "global_step": 22170, "epoch": 527} {"train_loss": -5.359831809997559, "global_step": 22171, "epoch": 527} {"train_loss": -5.306501865386963, "global_step": 22172, "epoch": 527} {"train_loss": -5.224483489990234, "global_step": 22173, "epoch": 527} {"train_loss": -5.39979362487793, "global_step": 22174, "epoch": 527} {"train_loss": -5.338913202285767, "global_step": 22175, "epoch": 527, "val_loss": 68453.328125} {"train_loss": -5.3463826179504395, "global_step": 22176, "epoch": 528} {"train_loss": -5.478259086608887, "global_step": 22177, "epoch": 528} {"train_loss": -5.4128522872924805, "global_step": 22178, "epoch": 528} {"train_loss": -5.383704662322998, "global_step": 22179, "epoch": 528} {"train_loss": -5.478059768676758, "global_step": 22180, "epoch": 528} {"train_loss": -5.298326015472412, "global_step": 22181, "epoch": 528} {"train_loss": -5.5288848876953125, "global_step": 22182, "epoch": 528} {"train_loss": -5.3996124267578125, "global_step": 22183, "epoch": 528} {"train_loss": -5.500382423400879, "global_step": 22184, "epoch": 528} {"train_loss": -5.3918681144714355, "global_step": 22185, "epoch": 528} {"train_loss": -5.401490211486816, "global_step": 22186, "epoch": 528} {"train_loss": -5.362586975097656, "global_step": 22187, "epoch": 528} {"train_loss": -5.051424980163574, "global_step": 22188, "epoch": 528} {"train_loss": -5.311595916748047, "global_step": 22189, "epoch": 528} {"train_loss": -5.4888505935668945, "global_step": 22190, "epoch": 528} {"train_loss": -5.326781272888184, "global_step": 22191, "epoch": 528} {"train_loss": -5.398443222045898, "global_step": 22192, "epoch": 528} {"train_loss": -5.4151105880737305, "global_step": 22193, "epoch": 528} {"train_loss": -5.179798603057861, "global_step": 22194, "epoch": 528} {"train_loss": -5.418213844299316, "global_step": 22195, "epoch": 528} {"train_loss": -5.272147178649902, "global_step": 22196, "epoch": 528} {"train_loss": -5.299230575561523, "global_step": 22197, "epoch": 528} {"train_loss": -5.275130271911621, "global_step": 22198, "epoch": 528} {"train_loss": -5.336709022521973, "global_step": 22199, "epoch": 528} {"train_loss": -5.3157124519348145, "global_step": 22200, "epoch": 528} {"train_loss": -5.252108573913574, "global_step": 22201, "epoch": 528} {"train_loss": -5.309902667999268, "global_step": 22202, "epoch": 528} {"train_loss": -5.2466230392456055, "global_step": 22203, "epoch": 528} {"train_loss": -5.307421684265137, "global_step": 22204, "epoch": 528} {"train_loss": -5.242924690246582, "global_step": 22205, "epoch": 528} {"train_loss": -5.2371039390563965, "global_step": 22206, "epoch": 528} {"train_loss": -5.265766143798828, "global_step": 22207, "epoch": 528} {"train_loss": -5.236462116241455, "global_step": 22208, "epoch": 528} {"train_loss": -5.3182783126831055, "global_step": 22209, "epoch": 528} {"train_loss": -5.086552619934082, "global_step": 22210, "epoch": 528} {"train_loss": -5.269768714904785, "global_step": 22211, "epoch": 528} {"train_loss": -5.339621067047119, "global_step": 22212, "epoch": 528} {"train_loss": -5.224218368530273, "global_step": 22213, "epoch": 528} {"train_loss": -5.366766929626465, "global_step": 22214, "epoch": 528} {"train_loss": -5.353948593139648, "global_step": 22215, "epoch": 528} {"train_loss": -5.287872314453125, "global_step": 22216, "epoch": 528} {"train_loss": -5.325768765949068, "global_step": 22217, "epoch": 528, "val_loss": 68878.6171875} {"train_loss": -5.202602863311768, "global_step": 22218, "epoch": 529} {"train_loss": -5.345928192138672, "global_step": 22219, "epoch": 529} {"train_loss": -5.308750152587891, "global_step": 22220, "epoch": 529} {"train_loss": -5.365555286407471, "global_step": 22221, "epoch": 529} {"train_loss": -5.122705459594727, "global_step": 22222, "epoch": 529} {"train_loss": -5.27758264541626, "global_step": 22223, "epoch": 529} {"train_loss": -5.208495140075684, "global_step": 22224, "epoch": 529} {"train_loss": -5.254690170288086, "global_step": 22225, "epoch": 529} {"train_loss": -5.181351184844971, "global_step": 22226, "epoch": 529} {"train_loss": -5.297669410705566, "global_step": 22227, "epoch": 529} {"train_loss": -5.428319931030273, "global_step": 22228, "epoch": 529} {"train_loss": -5.2668304443359375, "global_step": 22229, "epoch": 529} {"train_loss": -5.4463934898376465, "global_step": 22230, "epoch": 529} {"train_loss": -5.306714057922363, "global_step": 22231, "epoch": 529} {"train_loss": -5.294078826904297, "global_step": 22232, "epoch": 529} {"train_loss": -5.392064094543457, "global_step": 22233, "epoch": 529} {"train_loss": -5.320222854614258, "global_step": 22234, "epoch": 529} {"train_loss": -5.3698201179504395, "global_step": 22235, "epoch": 529} {"train_loss": -5.244649887084961, "global_step": 22236, "epoch": 529} {"train_loss": -5.441633224487305, "global_step": 22237, "epoch": 529} {"train_loss": -5.352103233337402, "global_step": 22238, "epoch": 529} {"train_loss": -5.297898292541504, "global_step": 22239, "epoch": 529} {"train_loss": -5.349431037902832, "global_step": 22240, "epoch": 529} {"train_loss": -5.374878883361816, "global_step": 22241, "epoch": 529} {"train_loss": -5.228006362915039, "global_step": 22242, "epoch": 529} {"train_loss": -5.37728214263916, "global_step": 22243, "epoch": 529} {"train_loss": -5.312127113342285, "global_step": 22244, "epoch": 529} {"train_loss": -5.427412033081055, "global_step": 22245, "epoch": 529} {"train_loss": -5.380393028259277, "global_step": 22246, "epoch": 529} {"train_loss": -5.333575248718262, "global_step": 22247, "epoch": 529} {"train_loss": -5.3343610763549805, "global_step": 22248, "epoch": 529} {"train_loss": -5.567279815673828, "global_step": 22249, "epoch": 529} {"train_loss": -5.400496959686279, "global_step": 22250, "epoch": 529} {"train_loss": -5.474129676818848, "global_step": 22251, "epoch": 529} {"train_loss": -5.387975692749023, "global_step": 22252, "epoch": 529} {"train_loss": -5.393204689025879, "global_step": 22253, "epoch": 529} {"train_loss": -5.283650875091553, "global_step": 22254, "epoch": 529} {"train_loss": -5.304441452026367, "global_step": 22255, "epoch": 529} {"train_loss": -5.295327186584473, "global_step": 22256, "epoch": 529} {"train_loss": -5.3082356452941895, "global_step": 22257, "epoch": 529} {"train_loss": -5.345700263977051, "global_step": 22258, "epoch": 529} {"train_loss": -5.330874340874808, "global_step": 22259, "epoch": 529, "val_loss": 68184.171875} {"train_loss": -5.526755332946777, "global_step": 22260, "epoch": 530} {"train_loss": -5.263113498687744, "global_step": 22261, "epoch": 530} {"train_loss": -5.225086212158203, "global_step": 22262, "epoch": 530} {"train_loss": -5.346921443939209, "global_step": 22263, "epoch": 530} {"train_loss": -5.285721778869629, "global_step": 22264, "epoch": 530} {"train_loss": -5.319478988647461, "global_step": 22265, "epoch": 530} {"train_loss": -5.37175178527832, "global_step": 22266, "epoch": 530} {"train_loss": -5.326112270355225, "global_step": 22267, "epoch": 530} {"train_loss": -5.321664333343506, "global_step": 22268, "epoch": 530} {"train_loss": -5.383701801300049, "global_step": 22269, "epoch": 530} {"train_loss": -5.308812141418457, "global_step": 22270, "epoch": 530} {"train_loss": -5.288972854614258, "global_step": 22271, "epoch": 530} {"train_loss": -5.33799934387207, "global_step": 22272, "epoch": 530} {"train_loss": -5.255720138549805, "global_step": 22273, "epoch": 530} {"train_loss": -5.442030429840088, "global_step": 22274, "epoch": 530} {"train_loss": -5.3364644050598145, "global_step": 22275, "epoch": 530} {"train_loss": -5.317610740661621, "global_step": 22276, "epoch": 530} {"train_loss": -5.534418106079102, "global_step": 22277, "epoch": 530} {"train_loss": -5.347753047943115, "global_step": 22278, "epoch": 530} {"train_loss": -5.315361976623535, "global_step": 22279, "epoch": 530} {"train_loss": -5.39979362487793, "global_step": 22280, "epoch": 530} {"train_loss": -5.350607872009277, "global_step": 22281, "epoch": 530} {"train_loss": -5.517507553100586, "global_step": 22282, "epoch": 530} {"train_loss": -5.301202774047852, "global_step": 22283, "epoch": 530} {"train_loss": -5.411032676696777, "global_step": 22284, "epoch": 530} {"train_loss": -5.3921942710876465, "global_step": 22285, "epoch": 530} {"train_loss": -5.362798690795898, "global_step": 22286, "epoch": 530} {"train_loss": -5.292572021484375, "global_step": 22287, "epoch": 530} {"train_loss": -5.296205043792725, "global_step": 22288, "epoch": 530} {"train_loss": -5.427319526672363, "global_step": 22289, "epoch": 530} {"train_loss": -5.318810939788818, "global_step": 22290, "epoch": 530} {"train_loss": -5.286541938781738, "global_step": 22291, "epoch": 530} {"train_loss": -5.368484020233154, "global_step": 22292, "epoch": 530} {"train_loss": -5.34260368347168, "global_step": 22293, "epoch": 530} {"train_loss": -5.343326568603516, "global_step": 22294, "epoch": 530} {"train_loss": -5.268437385559082, "global_step": 22295, "epoch": 530} {"train_loss": -5.411836624145508, "global_step": 22296, "epoch": 530} {"train_loss": -5.3473405838012695, "global_step": 22297, "epoch": 530} {"train_loss": -5.37388277053833, "global_step": 22298, "epoch": 530} {"train_loss": -5.419520378112793, "global_step": 22299, "epoch": 530} {"train_loss": -5.3143534660339355, "global_step": 22300, "epoch": 530} {"train_loss": -5.350512515930903, "global_step": 22301, "epoch": 530, "val_loss": 68051.171875} {"train_loss": -5.372591972351074, "global_step": 22302, "epoch": 531} {"train_loss": -5.364765644073486, "global_step": 22303, "epoch": 531} {"train_loss": -5.3904805183410645, "global_step": 22304, "epoch": 531} {"train_loss": -5.284357070922852, "global_step": 22305, "epoch": 531} {"train_loss": -5.477077484130859, "global_step": 22306, "epoch": 531} {"train_loss": -5.405969619750977, "global_step": 22307, "epoch": 531} {"train_loss": -5.412680625915527, "global_step": 22308, "epoch": 531} {"train_loss": -5.499063491821289, "global_step": 22309, "epoch": 531} {"train_loss": -5.277709007263184, "global_step": 22310, "epoch": 531} {"train_loss": -5.255496025085449, "global_step": 22311, "epoch": 531} {"train_loss": -5.442713260650635, "global_step": 22312, "epoch": 531} {"train_loss": -5.369757652282715, "global_step": 22313, "epoch": 531} {"train_loss": -5.405426502227783, "global_step": 22314, "epoch": 531} {"train_loss": -5.3721513748168945, "global_step": 22315, "epoch": 531} {"train_loss": -5.312617301940918, "global_step": 22316, "epoch": 531} {"train_loss": -5.1710405349731445, "global_step": 22317, "epoch": 531} {"train_loss": -5.385983467102051, "global_step": 22318, "epoch": 531} {"train_loss": -5.343533515930176, "global_step": 22319, "epoch": 531} {"train_loss": -5.2642645835876465, "global_step": 22320, "epoch": 531} {"train_loss": -5.235057830810547, "global_step": 22321, "epoch": 531} {"train_loss": -5.378196716308594, "global_step": 22322, "epoch": 531} {"train_loss": -5.363607883453369, "global_step": 22323, "epoch": 531} {"train_loss": -5.385601043701172, "global_step": 22324, "epoch": 531} {"train_loss": -5.33013391494751, "global_step": 22325, "epoch": 531} {"train_loss": -5.328482627868652, "global_step": 22326, "epoch": 531} {"train_loss": -5.405318737030029, "global_step": 22327, "epoch": 531} {"train_loss": -5.356789588928223, "global_step": 22328, "epoch": 531} {"train_loss": -5.283232688903809, "global_step": 22329, "epoch": 531} {"train_loss": -5.413288116455078, "global_step": 22330, "epoch": 531} {"train_loss": -5.2367353439331055, "global_step": 22331, "epoch": 531} {"train_loss": -5.431634902954102, "global_step": 22332, "epoch": 531} {"train_loss": -5.255655288696289, "global_step": 22333, "epoch": 531} {"train_loss": -5.328033447265625, "global_step": 22334, "epoch": 531} {"train_loss": -5.458861351013184, "global_step": 22335, "epoch": 531} {"train_loss": -5.391241073608398, "global_step": 22336, "epoch": 531} {"train_loss": -5.325953006744385, "global_step": 22337, "epoch": 531} {"train_loss": -5.243824481964111, "global_step": 22338, "epoch": 531} {"train_loss": -5.418642997741699, "global_step": 22339, "epoch": 531} {"train_loss": -5.430285453796387, "global_step": 22340, "epoch": 531} {"train_loss": -5.292857646942139, "global_step": 22341, "epoch": 531} {"train_loss": -5.31334924697876, "global_step": 22342, "epoch": 531} {"train_loss": -5.347651413508824, "global_step": 22343, "epoch": 531, "val_loss": 68637.921875} {"train_loss": -5.162075996398926, "global_step": 22344, "epoch": 532} {"train_loss": -5.381625175476074, "global_step": 22345, "epoch": 532} {"train_loss": -5.4118452072143555, "global_step": 22346, "epoch": 532} {"train_loss": -5.4035797119140625, "global_step": 22347, "epoch": 532} {"train_loss": -5.368827819824219, "global_step": 22348, "epoch": 532} {"train_loss": -5.402543067932129, "global_step": 22349, "epoch": 532} {"train_loss": -5.357149600982666, "global_step": 22350, "epoch": 532} {"train_loss": -5.369514465332031, "global_step": 22351, "epoch": 532} {"train_loss": -5.290158271789551, "global_step": 22352, "epoch": 532} {"train_loss": -5.381219863891602, "global_step": 22353, "epoch": 532} {"train_loss": -5.218584060668945, "global_step": 22354, "epoch": 532} {"train_loss": -5.43527889251709, "global_step": 22355, "epoch": 532} {"train_loss": -5.317159175872803, "global_step": 22356, "epoch": 532} {"train_loss": -5.490767478942871, "global_step": 22357, "epoch": 532} {"train_loss": -5.282709121704102, "global_step": 22358, "epoch": 532} {"train_loss": -5.334481239318848, "global_step": 22359, "epoch": 532} {"train_loss": -5.444152355194092, "global_step": 22360, "epoch": 532} {"train_loss": -5.331533432006836, "global_step": 22361, "epoch": 532} {"train_loss": -5.190352439880371, "global_step": 22362, "epoch": 532} {"train_loss": -5.399182319641113, "global_step": 22363, "epoch": 532} {"train_loss": -5.2134552001953125, "global_step": 22364, "epoch": 532} {"train_loss": -5.233590602874756, "global_step": 22365, "epoch": 532} {"train_loss": -5.3043365478515625, "global_step": 22366, "epoch": 532} {"train_loss": -5.152369976043701, "global_step": 22367, "epoch": 532} {"train_loss": -5.344348430633545, "global_step": 22368, "epoch": 532} {"train_loss": -5.3639726638793945, "global_step": 22369, "epoch": 532} {"train_loss": -5.316449165344238, "global_step": 22370, "epoch": 532} {"train_loss": -5.1311821937561035, "global_step": 22371, "epoch": 532} {"train_loss": -5.385406494140625, "global_step": 22372, "epoch": 532} {"train_loss": -5.325750350952148, "global_step": 22373, "epoch": 532} {"train_loss": -5.392875671386719, "global_step": 22374, "epoch": 532} {"train_loss": -5.252596378326416, "global_step": 22375, "epoch": 532} {"train_loss": -5.415828227996826, "global_step": 22376, "epoch": 532} {"train_loss": -5.156031131744385, "global_step": 22377, "epoch": 532} {"train_loss": -5.316032409667969, "global_step": 22378, "epoch": 532} {"train_loss": -5.259714603424072, "global_step": 22379, "epoch": 532} {"train_loss": -5.327815055847168, "global_step": 22380, "epoch": 532} {"train_loss": -5.245011329650879, "global_step": 22381, "epoch": 532} {"train_loss": -5.313742637634277, "global_step": 22382, "epoch": 532} {"train_loss": -5.293451309204102, "global_step": 22383, "epoch": 532} {"train_loss": -5.315865516662598, "global_step": 22384, "epoch": 532} {"train_loss": -5.3187375749860495, "global_step": 22385, "epoch": 532, "val_loss": 68797.6875} {"train_loss": -5.398590087890625, "global_step": 22386, "epoch": 533} {"train_loss": -5.248510360717773, "global_step": 22387, "epoch": 533} {"train_loss": -5.3440961837768555, "global_step": 22388, "epoch": 533} {"train_loss": -5.394428253173828, "global_step": 22389, "epoch": 533} {"train_loss": -5.27925968170166, "global_step": 22390, "epoch": 533} {"train_loss": -5.51871395111084, "global_step": 22391, "epoch": 533} {"train_loss": -5.111100196838379, "global_step": 22392, "epoch": 533} {"train_loss": -5.402066707611084, "global_step": 22393, "epoch": 533} {"train_loss": -5.340204238891602, "global_step": 22394, "epoch": 533} {"train_loss": -5.290121078491211, "global_step": 22395, "epoch": 533} {"train_loss": -5.275993347167969, "global_step": 22396, "epoch": 533} {"train_loss": -5.3926849365234375, "global_step": 22397, "epoch": 533} {"train_loss": -5.294022083282471, "global_step": 22398, "epoch": 533} {"train_loss": -5.319897174835205, "global_step": 22399, "epoch": 533} {"train_loss": -5.2610931396484375, "global_step": 22400, "epoch": 533} {"train_loss": -5.415952205657959, "global_step": 22401, "epoch": 533} {"train_loss": -5.362759590148926, "global_step": 22402, "epoch": 533} {"train_loss": -5.325287342071533, "global_step": 22403, "epoch": 533} {"train_loss": -5.3328118324279785, "global_step": 22404, "epoch": 533} {"train_loss": -5.367889404296875, "global_step": 22405, "epoch": 533} {"train_loss": -5.238163471221924, "global_step": 22406, "epoch": 533} {"train_loss": -5.454944610595703, "global_step": 22407, "epoch": 533} {"train_loss": -5.3869123458862305, "global_step": 22408, "epoch": 533} {"train_loss": -5.2767252922058105, "global_step": 22409, "epoch": 533} {"train_loss": -5.301792621612549, "global_step": 22410, "epoch": 533} {"train_loss": -5.408524036407471, "global_step": 22411, "epoch": 533} {"train_loss": -5.344873905181885, "global_step": 22412, "epoch": 533} {"train_loss": -5.448276519775391, "global_step": 22413, "epoch": 533} {"train_loss": -5.233691215515137, "global_step": 22414, "epoch": 533} {"train_loss": -5.3065505027771, "global_step": 22415, "epoch": 533} {"train_loss": -5.419297695159912, "global_step": 22416, "epoch": 533} {"train_loss": -5.388882160186768, "global_step": 22417, "epoch": 533} {"train_loss": -5.4566569328308105, "global_step": 22418, "epoch": 533} {"train_loss": -5.359225273132324, "global_step": 22419, "epoch": 533} {"train_loss": -5.278573989868164, "global_step": 22420, "epoch": 533} {"train_loss": -5.250679016113281, "global_step": 22421, "epoch": 533} {"train_loss": -5.355711936950684, "global_step": 22422, "epoch": 533} {"train_loss": -5.156949996948242, "global_step": 22423, "epoch": 533} {"train_loss": -5.334358215332031, "global_step": 22424, "epoch": 533} {"train_loss": -5.195383071899414, "global_step": 22425, "epoch": 533} {"train_loss": -5.290807247161865, "global_step": 22426, "epoch": 533} {"train_loss": -5.33124642145066, "global_step": 22427, "epoch": 533, "val_loss": 68631.6953125} {"train_loss": -5.397637367248535, "global_step": 22428, "epoch": 534} {"train_loss": -5.402280807495117, "global_step": 22429, "epoch": 534} {"train_loss": -5.372539043426514, "global_step": 22430, "epoch": 534} {"train_loss": -5.198408126831055, "global_step": 22431, "epoch": 534} {"train_loss": -5.220448970794678, "global_step": 22432, "epoch": 534} {"train_loss": -5.21699333190918, "global_step": 22433, "epoch": 534} {"train_loss": -5.320809364318848, "global_step": 22434, "epoch": 534} {"train_loss": -5.289960861206055, "global_step": 22435, "epoch": 534} {"train_loss": -5.3796706199646, "global_step": 22436, "epoch": 534} {"train_loss": -5.3642578125, "global_step": 22437, "epoch": 534} {"train_loss": -5.325744152069092, "global_step": 22438, "epoch": 534} {"train_loss": -5.207548141479492, "global_step": 22439, "epoch": 534} {"train_loss": -5.2430620193481445, "global_step": 22440, "epoch": 534} {"train_loss": -5.369595050811768, "global_step": 22441, "epoch": 534} {"train_loss": -5.265605926513672, "global_step": 22442, "epoch": 534} {"train_loss": -5.198945999145508, "global_step": 22443, "epoch": 534} {"train_loss": -5.35614538192749, "global_step": 22444, "epoch": 534} {"train_loss": -5.332862854003906, "global_step": 22445, "epoch": 534} {"train_loss": -5.268104076385498, "global_step": 22446, "epoch": 534} {"train_loss": -5.3048200607299805, "global_step": 22447, "epoch": 534} {"train_loss": -5.369649410247803, "global_step": 22448, "epoch": 534} {"train_loss": -5.3123064041137695, "global_step": 22449, "epoch": 534} {"train_loss": -5.200545310974121, "global_step": 22450, "epoch": 534} {"train_loss": -5.570155143737793, "global_step": 22451, "epoch": 534} {"train_loss": -5.493991374969482, "global_step": 22452, "epoch": 534} {"train_loss": -5.386195182800293, "global_step": 22453, "epoch": 534} {"train_loss": -5.359736442565918, "global_step": 22454, "epoch": 534} {"train_loss": -5.295456409454346, "global_step": 22455, "epoch": 534} {"train_loss": -5.401985168457031, "global_step": 22456, "epoch": 534} {"train_loss": -5.476525783538818, "global_step": 22457, "epoch": 534} {"train_loss": -5.4464521408081055, "global_step": 22458, "epoch": 534} {"train_loss": -5.397076606750488, "global_step": 22459, "epoch": 534} {"train_loss": -5.355571746826172, "global_step": 22460, "epoch": 534} {"train_loss": -5.3435821533203125, "global_step": 22461, "epoch": 534} {"train_loss": -5.339710235595703, "global_step": 22462, "epoch": 534} {"train_loss": -5.406574249267578, "global_step": 22463, "epoch": 534} {"train_loss": -5.343451976776123, "global_step": 22464, "epoch": 534} {"train_loss": -5.340909481048584, "global_step": 22465, "epoch": 534} {"train_loss": -5.2973175048828125, "global_step": 22466, "epoch": 534} {"train_loss": -5.309641361236572, "global_step": 22467, "epoch": 534} {"train_loss": -5.400468826293945, "global_step": 22468, "epoch": 534} {"train_loss": -5.345567532948086, "global_step": 22469, "epoch": 534, "val_loss": 68457.578125} {"train_loss": -5.370882034301758, "global_step": 22470, "epoch": 535} {"train_loss": -5.364499092102051, "global_step": 22471, "epoch": 535} {"train_loss": -5.417884826660156, "global_step": 22472, "epoch": 535} {"train_loss": -5.317930698394775, "global_step": 22473, "epoch": 535} {"train_loss": -5.3520660400390625, "global_step": 22474, "epoch": 535} {"train_loss": -5.456357955932617, "global_step": 22475, "epoch": 535} {"train_loss": -5.465466499328613, "global_step": 22476, "epoch": 535} {"train_loss": -5.378737449645996, "global_step": 22477, "epoch": 535} {"train_loss": -5.352855205535889, "global_step": 22478, "epoch": 535} {"train_loss": -5.27816104888916, "global_step": 22479, "epoch": 535} {"train_loss": -5.274959564208984, "global_step": 22480, "epoch": 535} {"train_loss": -5.342947006225586, "global_step": 22481, "epoch": 535} {"train_loss": -5.2278642654418945, "global_step": 22482, "epoch": 535} {"train_loss": -5.1173505783081055, "global_step": 22483, "epoch": 535} {"train_loss": -5.433392524719238, "global_step": 22484, "epoch": 535} {"train_loss": -5.322859764099121, "global_step": 22485, "epoch": 535} {"train_loss": -5.255664348602295, "global_step": 22486, "epoch": 535} {"train_loss": -5.253332138061523, "global_step": 22487, "epoch": 535} {"train_loss": -5.325721740722656, "global_step": 22488, "epoch": 535} {"train_loss": -5.125837802886963, "global_step": 22489, "epoch": 535} {"train_loss": -5.44819974899292, "global_step": 22490, "epoch": 535} {"train_loss": -5.301453590393066, "global_step": 22491, "epoch": 535} {"train_loss": -5.303396701812744, "global_step": 22492, "epoch": 535} {"train_loss": -5.3332200050354, "global_step": 22493, "epoch": 535} {"train_loss": -5.267220497131348, "global_step": 22494, "epoch": 535} {"train_loss": -5.26966667175293, "global_step": 22495, "epoch": 535} {"train_loss": -5.211437702178955, "global_step": 22496, "epoch": 535} {"train_loss": -5.311345100402832, "global_step": 22497, "epoch": 535} {"train_loss": -5.293302536010742, "global_step": 22498, "epoch": 535} {"train_loss": -5.381960391998291, "global_step": 22499, "epoch": 535} {"train_loss": -5.307826995849609, "global_step": 22500, "epoch": 535} {"train_loss": -5.254514217376709, "global_step": 22501, "epoch": 535} {"train_loss": -5.433306694030762, "global_step": 22502, "epoch": 535} {"train_loss": -5.4755144119262695, "global_step": 22503, "epoch": 535} {"train_loss": -5.460946083068848, "global_step": 22504, "epoch": 535} {"train_loss": -5.354795932769775, "global_step": 22505, "epoch": 535} {"train_loss": -5.414449691772461, "global_step": 22506, "epoch": 535} {"train_loss": -5.363554954528809, "global_step": 22507, "epoch": 535} {"train_loss": -5.296390533447266, "global_step": 22508, "epoch": 535} {"train_loss": -5.1903076171875, "global_step": 22509, "epoch": 535} {"train_loss": -5.281386852264404, "global_step": 22510, "epoch": 535} {"train_loss": -5.327569984254383, "global_step": 22511, "epoch": 535, "val_loss": 68499.7734375} {"train_loss": -5.272312641143799, "global_step": 22512, "epoch": 536} {"train_loss": -5.366745948791504, "global_step": 22513, "epoch": 536} {"train_loss": -5.4016499519348145, "global_step": 22514, "epoch": 536} {"train_loss": -5.291548728942871, "global_step": 22515, "epoch": 536} {"train_loss": -5.319096565246582, "global_step": 22516, "epoch": 536} {"train_loss": -5.3879241943359375, "global_step": 22517, "epoch": 536} {"train_loss": -5.224553108215332, "global_step": 22518, "epoch": 536} {"train_loss": -5.159592628479004, "global_step": 22519, "epoch": 536} {"train_loss": -5.35463809967041, "global_step": 22520, "epoch": 536} {"train_loss": -5.288450241088867, "global_step": 22521, "epoch": 536} {"train_loss": -5.338920593261719, "global_step": 22522, "epoch": 536} {"train_loss": -5.593033790588379, "global_step": 22523, "epoch": 536} {"train_loss": -5.397725582122803, "global_step": 22524, "epoch": 536} {"train_loss": -5.43506383895874, "global_step": 22525, "epoch": 536} {"train_loss": -5.302759170532227, "global_step": 22526, "epoch": 536} {"train_loss": -5.2948317527771, "global_step": 22527, "epoch": 536} {"train_loss": -5.41895866394043, "global_step": 22528, "epoch": 536} {"train_loss": -5.318687438964844, "global_step": 22529, "epoch": 536} {"train_loss": -5.318305969238281, "global_step": 22530, "epoch": 536} {"train_loss": -5.357728004455566, "global_step": 22531, "epoch": 536} {"train_loss": -5.407313346862793, "global_step": 22532, "epoch": 536} {"train_loss": -5.429399490356445, "global_step": 22533, "epoch": 536} {"train_loss": -5.430172920227051, "global_step": 22534, "epoch": 536} {"train_loss": -5.385538578033447, "global_step": 22535, "epoch": 536} {"train_loss": -5.2826995849609375, "global_step": 22536, "epoch": 536} {"train_loss": -5.388964653015137, "global_step": 22537, "epoch": 536} {"train_loss": -5.340753555297852, "global_step": 22538, "epoch": 536} {"train_loss": -5.33070182800293, "global_step": 22539, "epoch": 536} {"train_loss": -5.375735282897949, "global_step": 22540, "epoch": 536} {"train_loss": -5.424679756164551, "global_step": 22541, "epoch": 536} {"train_loss": -5.277270317077637, "global_step": 22542, "epoch": 536} {"train_loss": -5.4001359939575195, "global_step": 22543, "epoch": 536} {"train_loss": -5.141460418701172, "global_step": 22544, "epoch": 536} {"train_loss": -5.407120704650879, "global_step": 22545, "epoch": 536} {"train_loss": -5.157112121582031, "global_step": 22546, "epoch": 536} {"train_loss": -5.282125949859619, "global_step": 22547, "epoch": 536} {"train_loss": -5.323141098022461, "global_step": 22548, "epoch": 536} {"train_loss": -5.387685775756836, "global_step": 22549, "epoch": 536} {"train_loss": -5.30082368850708, "global_step": 22550, "epoch": 536} {"train_loss": -5.313076972961426, "global_step": 22551, "epoch": 536} {"train_loss": -5.331005096435547, "global_step": 22552, "epoch": 536} {"train_loss": -5.341663803373065, "global_step": 22553, "epoch": 536, "val_loss": 68222.875} {"train_loss": -5.3250627517700195, "global_step": 22554, "epoch": 537} {"train_loss": -5.382006645202637, "global_step": 22555, "epoch": 537} {"train_loss": -5.385727405548096, "global_step": 22556, "epoch": 537} {"train_loss": -5.478188991546631, "global_step": 22557, "epoch": 537} {"train_loss": -5.335090160369873, "global_step": 22558, "epoch": 537} {"train_loss": -5.316136360168457, "global_step": 22559, "epoch": 537} {"train_loss": -5.418565273284912, "global_step": 22560, "epoch": 537} {"train_loss": -5.399031162261963, "global_step": 22561, "epoch": 537} {"train_loss": -5.318948268890381, "global_step": 22562, "epoch": 537} {"train_loss": -5.408031463623047, "global_step": 22563, "epoch": 537} {"train_loss": -5.356213569641113, "global_step": 22564, "epoch": 537} {"train_loss": -5.24113130569458, "global_step": 22565, "epoch": 537} {"train_loss": -5.22169828414917, "global_step": 22566, "epoch": 537} {"train_loss": -5.2144598960876465, "global_step": 22567, "epoch": 537} {"train_loss": -5.141522407531738, "global_step": 22568, "epoch": 537} {"train_loss": -5.476094722747803, "global_step": 22569, "epoch": 537} {"train_loss": -5.453223705291748, "global_step": 22570, "epoch": 537} {"train_loss": -5.440468788146973, "global_step": 22571, "epoch": 537} {"train_loss": -5.359620094299316, "global_step": 22572, "epoch": 537} {"train_loss": -5.3528594970703125, "global_step": 22573, "epoch": 537} {"train_loss": -5.398536205291748, "global_step": 22574, "epoch": 537} {"train_loss": -5.489559650421143, "global_step": 22575, "epoch": 537} {"train_loss": -5.34115743637085, "global_step": 22576, "epoch": 537} {"train_loss": -5.360719680786133, "global_step": 22577, "epoch": 537} {"train_loss": -5.385929107666016, "global_step": 22578, "epoch": 537} {"train_loss": -5.403090476989746, "global_step": 22579, "epoch": 537} {"train_loss": -5.267083168029785, "global_step": 22580, "epoch": 537} {"train_loss": -5.3260817527771, "global_step": 22581, "epoch": 537} {"train_loss": -5.383037567138672, "global_step": 22582, "epoch": 537} {"train_loss": -5.3022661209106445, "global_step": 22583, "epoch": 537} {"train_loss": -5.42514705657959, "global_step": 22584, "epoch": 537} {"train_loss": -5.445882320404053, "global_step": 22585, "epoch": 537} {"train_loss": -5.2423295974731445, "global_step": 22586, "epoch": 537} {"train_loss": -5.206300735473633, "global_step": 22587, "epoch": 537} {"train_loss": -5.37537145614624, "global_step": 22588, "epoch": 537} {"train_loss": -5.320738792419434, "global_step": 22589, "epoch": 537} {"train_loss": -5.249183654785156, "global_step": 22590, "epoch": 537} {"train_loss": -5.3117570877075195, "global_step": 22591, "epoch": 537} {"train_loss": -5.420382976531982, "global_step": 22592, "epoch": 537} {"train_loss": -5.348870277404785, "global_step": 22593, "epoch": 537} {"train_loss": -5.300737380981445, "global_step": 22594, "epoch": 537} {"train_loss": -5.351462318783715, "global_step": 22595, "epoch": 537, "val_loss": 68781.5859375} {"train_loss": -5.317740440368652, "global_step": 22596, "epoch": 538} {"train_loss": -5.2759809494018555, "global_step": 22597, "epoch": 538} {"train_loss": -5.365855693817139, "global_step": 22598, "epoch": 538} {"train_loss": -5.206966876983643, "global_step": 22599, "epoch": 538} {"train_loss": -5.380598068237305, "global_step": 22600, "epoch": 538} {"train_loss": -5.532320022583008, "global_step": 22601, "epoch": 538} {"train_loss": -5.352640628814697, "global_step": 22602, "epoch": 538} {"train_loss": -5.349129676818848, "global_step": 22603, "epoch": 538} {"train_loss": -5.381330490112305, "global_step": 22604, "epoch": 538} {"train_loss": -5.394492149353027, "global_step": 22605, "epoch": 538} {"train_loss": -5.366456031799316, "global_step": 22606, "epoch": 538} {"train_loss": -5.353952884674072, "global_step": 22607, "epoch": 538} {"train_loss": -5.382241725921631, "global_step": 22608, "epoch": 538} {"train_loss": -5.362410068511963, "global_step": 22609, "epoch": 538} {"train_loss": -5.32059907913208, "global_step": 22610, "epoch": 538} {"train_loss": -5.343888282775879, "global_step": 22611, "epoch": 538} {"train_loss": -5.31691837310791, "global_step": 22612, "epoch": 538} {"train_loss": -5.34002685546875, "global_step": 22613, "epoch": 538} {"train_loss": -5.305379867553711, "global_step": 22614, "epoch": 538} {"train_loss": -5.251650810241699, "global_step": 22615, "epoch": 538} {"train_loss": -5.386990547180176, "global_step": 22616, "epoch": 538} {"train_loss": -5.347530841827393, "global_step": 22617, "epoch": 538} {"train_loss": -5.267124176025391, "global_step": 22618, "epoch": 538} {"train_loss": -5.382200241088867, "global_step": 22619, "epoch": 538} {"train_loss": -5.214016437530518, "global_step": 22620, "epoch": 538} {"train_loss": -5.30308723449707, "global_step": 22621, "epoch": 538} {"train_loss": -5.276154041290283, "global_step": 22622, "epoch": 538} {"train_loss": -5.446706771850586, "global_step": 22623, "epoch": 538} {"train_loss": -5.389434337615967, "global_step": 22624, "epoch": 538} {"train_loss": -5.385017395019531, "global_step": 22625, "epoch": 538} {"train_loss": -5.311155319213867, "global_step": 22626, "epoch": 538} {"train_loss": -5.3473219871521, "global_step": 22627, "epoch": 538} {"train_loss": -5.313862323760986, "global_step": 22628, "epoch": 538} {"train_loss": -5.525691032409668, "global_step": 22629, "epoch": 538} {"train_loss": -5.291623115539551, "global_step": 22630, "epoch": 538} {"train_loss": -5.320567607879639, "global_step": 22631, "epoch": 538} {"train_loss": -5.357163429260254, "global_step": 22632, "epoch": 538} {"train_loss": -5.21755838394165, "global_step": 22633, "epoch": 538} {"train_loss": -5.35875940322876, "global_step": 22634, "epoch": 538} {"train_loss": -5.198812484741211, "global_step": 22635, "epoch": 538} {"train_loss": -5.3730268478393555, "global_step": 22636, "epoch": 538} {"train_loss": -5.340342975798107, "global_step": 22637, "epoch": 538, "val_loss": 68459.734375} {"train_loss": -5.508196830749512, "global_step": 22638, "epoch": 539} {"train_loss": -5.330647945404053, "global_step": 22639, "epoch": 539} {"train_loss": -5.313310146331787, "global_step": 22640, "epoch": 539} {"train_loss": -5.394702911376953, "global_step": 22641, "epoch": 539} {"train_loss": -5.3152666091918945, "global_step": 22642, "epoch": 539} {"train_loss": -5.32423210144043, "global_step": 22643, "epoch": 539} {"train_loss": -5.34841775894165, "global_step": 22644, "epoch": 539} {"train_loss": -5.419100284576416, "global_step": 22645, "epoch": 539} {"train_loss": -5.19874906539917, "global_step": 22646, "epoch": 539} {"train_loss": -5.359262466430664, "global_step": 22647, "epoch": 539} {"train_loss": -5.43695592880249, "global_step": 22648, "epoch": 539} {"train_loss": -5.228343963623047, "global_step": 22649, "epoch": 539} {"train_loss": -5.419277667999268, "global_step": 22650, "epoch": 539} {"train_loss": -5.32311487197876, "global_step": 22651, "epoch": 539} {"train_loss": -5.403752326965332, "global_step": 22652, "epoch": 539} {"train_loss": -5.383390426635742, "global_step": 22653, "epoch": 539} {"train_loss": -5.167890548706055, "global_step": 22654, "epoch": 539} {"train_loss": -5.3842902183532715, "global_step": 22655, "epoch": 539} {"train_loss": -5.3302459716796875, "global_step": 22656, "epoch": 539} {"train_loss": -5.237992763519287, "global_step": 22657, "epoch": 539} {"train_loss": -5.45734977722168, "global_step": 22658, "epoch": 539} {"train_loss": -5.307329177856445, "global_step": 22659, "epoch": 539} {"train_loss": -5.327833652496338, "global_step": 22660, "epoch": 539} {"train_loss": -5.501224994659424, "global_step": 22661, "epoch": 539} {"train_loss": -5.296045303344727, "global_step": 22662, "epoch": 539} {"train_loss": -5.335649490356445, "global_step": 22663, "epoch": 539} {"train_loss": -5.274188041687012, "global_step": 22664, "epoch": 539} {"train_loss": -5.309881210327148, "global_step": 22665, "epoch": 539} {"train_loss": -5.246787071228027, "global_step": 22666, "epoch": 539} {"train_loss": -5.359055519104004, "global_step": 22667, "epoch": 539} {"train_loss": -5.318512916564941, "global_step": 22668, "epoch": 539} {"train_loss": -5.317313194274902, "global_step": 22669, "epoch": 539} {"train_loss": -5.3429059982299805, "global_step": 22670, "epoch": 539} {"train_loss": -5.344265937805176, "global_step": 22671, "epoch": 539} {"train_loss": -5.328447341918945, "global_step": 22672, "epoch": 539} {"train_loss": -5.263718605041504, "global_step": 22673, "epoch": 539} {"train_loss": -5.376195907592773, "global_step": 22674, "epoch": 539} {"train_loss": -5.271115303039551, "global_step": 22675, "epoch": 539} {"train_loss": -5.397010803222656, "global_step": 22676, "epoch": 539} {"train_loss": -5.43721342086792, "global_step": 22677, "epoch": 539} {"train_loss": -5.445439338684082, "global_step": 22678, "epoch": 539} {"train_loss": -5.343452408200219, "global_step": 22679, "epoch": 539, "val_loss": 68551.6875} {"train_loss": -5.401206970214844, "global_step": 22680, "epoch": 540} {"train_loss": -5.396688461303711, "global_step": 22681, "epoch": 540} {"train_loss": -5.475543975830078, "global_step": 22682, "epoch": 540} {"train_loss": -5.31684684753418, "global_step": 22683, "epoch": 540} {"train_loss": -5.426647186279297, "global_step": 22684, "epoch": 540} {"train_loss": -5.415643692016602, "global_step": 22685, "epoch": 540} {"train_loss": -5.354484558105469, "global_step": 22686, "epoch": 540} {"train_loss": -5.191257476806641, "global_step": 22687, "epoch": 540} {"train_loss": -5.42800235748291, "global_step": 22688, "epoch": 540} {"train_loss": -5.376044273376465, "global_step": 22689, "epoch": 540} {"train_loss": -5.283899307250977, "global_step": 22690, "epoch": 540} {"train_loss": -5.389418601989746, "global_step": 22691, "epoch": 540} {"train_loss": -5.4029998779296875, "global_step": 22692, "epoch": 540} {"train_loss": -5.364501953125, "global_step": 22693, "epoch": 540} {"train_loss": -5.31450891494751, "global_step": 22694, "epoch": 540} {"train_loss": -5.373858451843262, "global_step": 22695, "epoch": 540} {"train_loss": -5.50014066696167, "global_step": 22696, "epoch": 540} {"train_loss": -5.351949691772461, "global_step": 22697, "epoch": 540} {"train_loss": -5.3138885498046875, "global_step": 22698, "epoch": 540} {"train_loss": -5.348264694213867, "global_step": 22699, "epoch": 540} {"train_loss": -5.427196979522705, "global_step": 22700, "epoch": 540} {"train_loss": -5.369437217712402, "global_step": 22701, "epoch": 540} {"train_loss": -5.341373443603516, "global_step": 22702, "epoch": 540} {"train_loss": -5.419193267822266, "global_step": 22703, "epoch": 540} {"train_loss": -5.4495625495910645, "global_step": 22704, "epoch": 540} {"train_loss": -5.428397178649902, "global_step": 22705, "epoch": 540} {"train_loss": -5.346271514892578, "global_step": 22706, "epoch": 540} {"train_loss": -5.421359062194824, "global_step": 22707, "epoch": 540} {"train_loss": -5.393119812011719, "global_step": 22708, "epoch": 540} {"train_loss": -5.442272186279297, "global_step": 22709, "epoch": 540} {"train_loss": -5.379788398742676, "global_step": 22710, "epoch": 540} {"train_loss": -5.296222686767578, "global_step": 22711, "epoch": 540} {"train_loss": -5.312158107757568, "global_step": 22712, "epoch": 540} {"train_loss": -5.418770790100098, "global_step": 22713, "epoch": 540} {"train_loss": -5.26020622253418, "global_step": 22714, "epoch": 540} {"train_loss": -5.290040969848633, "global_step": 22715, "epoch": 540} {"train_loss": -5.381657600402832, "global_step": 22716, "epoch": 540} {"train_loss": -5.390504837036133, "global_step": 22717, "epoch": 540} {"train_loss": -5.435333251953125, "global_step": 22718, "epoch": 540} {"train_loss": -5.221899032592773, "global_step": 22719, "epoch": 540} {"train_loss": -5.42725944519043, "global_step": 22720, "epoch": 540} {"train_loss": -5.372961112431118, "global_step": 22721, "epoch": 540, "val_loss": 67926.03125} {"train_loss": -5.337392807006836, "global_step": 22722, "epoch": 541} {"train_loss": -5.251175880432129, "global_step": 22723, "epoch": 541} {"train_loss": -5.443695068359375, "global_step": 22724, "epoch": 541} {"train_loss": -5.515912055969238, "global_step": 22725, "epoch": 541} {"train_loss": -5.407351493835449, "global_step": 22726, "epoch": 541} {"train_loss": -5.448749542236328, "global_step": 22727, "epoch": 541} {"train_loss": -5.516915321350098, "global_step": 22728, "epoch": 541} {"train_loss": -5.388257026672363, "global_step": 22729, "epoch": 541} {"train_loss": -5.268457412719727, "global_step": 22730, "epoch": 541} {"train_loss": -5.375520706176758, "global_step": 22731, "epoch": 541} {"train_loss": -5.339065074920654, "global_step": 22732, "epoch": 541} {"train_loss": -5.246760845184326, "global_step": 22733, "epoch": 541} {"train_loss": -5.38346529006958, "global_step": 22734, "epoch": 541} {"train_loss": -5.375149726867676, "global_step": 22735, "epoch": 541} {"train_loss": -5.225862979888916, "global_step": 22736, "epoch": 541} {"train_loss": -5.140365123748779, "global_step": 22737, "epoch": 541} {"train_loss": -5.342864036560059, "global_step": 22738, "epoch": 541} {"train_loss": -5.478960037231445, "global_step": 22739, "epoch": 541} {"train_loss": -5.364366054534912, "global_step": 22740, "epoch": 541} {"train_loss": -5.288968086242676, "global_step": 22741, "epoch": 541} {"train_loss": -5.382179260253906, "global_step": 22742, "epoch": 541} {"train_loss": -5.257471084594727, "global_step": 22743, "epoch": 541} {"train_loss": -5.212130546569824, "global_step": 22744, "epoch": 541} {"train_loss": -5.411401748657227, "global_step": 22745, "epoch": 541} {"train_loss": -5.338634490966797, "global_step": 22746, "epoch": 541} {"train_loss": -5.314267158508301, "global_step": 22747, "epoch": 541} {"train_loss": -5.30540657043457, "global_step": 22748, "epoch": 541} {"train_loss": -5.253011703491211, "global_step": 22749, "epoch": 541} {"train_loss": -5.216104030609131, "global_step": 22750, "epoch": 541} {"train_loss": -5.381282806396484, "global_step": 22751, "epoch": 541} {"train_loss": -5.349418640136719, "global_step": 22752, "epoch": 541} {"train_loss": -5.254249572753906, "global_step": 22753, "epoch": 541} {"train_loss": -5.39116907119751, "global_step": 22754, "epoch": 541} {"train_loss": -5.368309497833252, "global_step": 22755, "epoch": 541} {"train_loss": -5.3243255615234375, "global_step": 22756, "epoch": 541} {"train_loss": -5.331926345825195, "global_step": 22757, "epoch": 541} {"train_loss": -5.338324546813965, "global_step": 22758, "epoch": 541} {"train_loss": -5.43678617477417, "global_step": 22759, "epoch": 541} {"train_loss": -5.366763114929199, "global_step": 22760, "epoch": 541} {"train_loss": -5.328807830810547, "global_step": 22761, "epoch": 541} {"train_loss": -5.346004009246826, "global_step": 22762, "epoch": 541} {"train_loss": -5.34032484463283, "global_step": 22763, "epoch": 541, "val_loss": 68040.140625} {"train_loss": -5.3568620681762695, "global_step": 22764, "epoch": 542} {"train_loss": -5.432326316833496, "global_step": 22765, "epoch": 542} {"train_loss": -5.171389579772949, "global_step": 22766, "epoch": 542} {"train_loss": -5.422275543212891, "global_step": 22767, "epoch": 542} {"train_loss": -5.43245792388916, "global_step": 22768, "epoch": 542} {"train_loss": -5.303572654724121, "global_step": 22769, "epoch": 542} {"train_loss": -5.455353736877441, "global_step": 22770, "epoch": 542} {"train_loss": -5.472607612609863, "global_step": 22771, "epoch": 542} {"train_loss": -5.4247894287109375, "global_step": 22772, "epoch": 542} {"train_loss": -5.256197929382324, "global_step": 22773, "epoch": 542} {"train_loss": -5.345519542694092, "global_step": 22774, "epoch": 542} {"train_loss": -5.242437362670898, "global_step": 22775, "epoch": 542} {"train_loss": -5.411616325378418, "global_step": 22776, "epoch": 542} {"train_loss": -5.32718563079834, "global_step": 22777, "epoch": 542} {"train_loss": -5.406999588012695, "global_step": 22778, "epoch": 542} {"train_loss": -5.247073173522949, "global_step": 22779, "epoch": 542} {"train_loss": -5.211042404174805, "global_step": 22780, "epoch": 542} {"train_loss": -5.455739974975586, "global_step": 22781, "epoch": 542} {"train_loss": -5.46843147277832, "global_step": 22782, "epoch": 542} {"train_loss": -5.44284200668335, "global_step": 22783, "epoch": 542} {"train_loss": -5.390620231628418, "global_step": 22784, "epoch": 542} {"train_loss": -5.452104568481445, "global_step": 22785, "epoch": 542} {"train_loss": -5.255183219909668, "global_step": 22786, "epoch": 542} {"train_loss": -5.4618682861328125, "global_step": 22787, "epoch": 542} {"train_loss": -5.416098594665527, "global_step": 22788, "epoch": 542} {"train_loss": -5.476712226867676, "global_step": 22789, "epoch": 542} {"train_loss": -5.322048664093018, "global_step": 22790, "epoch": 542} {"train_loss": -5.3743791580200195, "global_step": 22791, "epoch": 542} {"train_loss": -5.361307621002197, "global_step": 22792, "epoch": 542} {"train_loss": -5.391907215118408, "global_step": 22793, "epoch": 542} {"train_loss": -5.305368900299072, "global_step": 22794, "epoch": 542} {"train_loss": -5.430477619171143, "global_step": 22795, "epoch": 542} {"train_loss": -5.484343528747559, "global_step": 22796, "epoch": 542} {"train_loss": -5.516772270202637, "global_step": 22797, "epoch": 542} {"train_loss": -5.3900957107543945, "global_step": 22798, "epoch": 542} {"train_loss": -5.407609939575195, "global_step": 22799, "epoch": 542} {"train_loss": -5.45147705078125, "global_step": 22800, "epoch": 542} {"train_loss": -5.373488426208496, "global_step": 22801, "epoch": 542} {"train_loss": -5.397668838500977, "global_step": 22802, "epoch": 542} {"train_loss": -5.342648029327393, "global_step": 22803, "epoch": 542} {"train_loss": -5.542022705078125, "global_step": 22804, "epoch": 542} {"train_loss": -5.38303998538426, "global_step": 22805, "epoch": 542, "val_loss": 67878.7265625} {"train_loss": -5.554179668426514, "global_step": 22806, "epoch": 543} {"train_loss": -5.294390678405762, "global_step": 22807, "epoch": 543} {"train_loss": -5.183773040771484, "global_step": 22808, "epoch": 543} {"train_loss": -5.373512268066406, "global_step": 22809, "epoch": 543} {"train_loss": -5.386181831359863, "global_step": 22810, "epoch": 543} {"train_loss": -5.445394039154053, "global_step": 22811, "epoch": 543} {"train_loss": -5.274205207824707, "global_step": 22812, "epoch": 543} {"train_loss": -5.176250457763672, "global_step": 22813, "epoch": 543} {"train_loss": -5.391506195068359, "global_step": 22814, "epoch": 543} {"train_loss": -5.384812355041504, "global_step": 22815, "epoch": 543} {"train_loss": -5.4537506103515625, "global_step": 22816, "epoch": 543} {"train_loss": -5.446536064147949, "global_step": 22817, "epoch": 543} {"train_loss": -5.39986515045166, "global_step": 22818, "epoch": 543} {"train_loss": -5.404407978057861, "global_step": 22819, "epoch": 543} {"train_loss": -5.4547600746154785, "global_step": 22820, "epoch": 543} {"train_loss": -5.453960418701172, "global_step": 22821, "epoch": 543} {"train_loss": -5.429294586181641, "global_step": 22822, "epoch": 543} {"train_loss": -5.30471134185791, "global_step": 22823, "epoch": 543} {"train_loss": -5.3084564208984375, "global_step": 22824, "epoch": 543} {"train_loss": -5.571258068084717, "global_step": 22825, "epoch": 543} {"train_loss": -5.397443771362305, "global_step": 22826, "epoch": 543} {"train_loss": -5.2775444984436035, "global_step": 22827, "epoch": 543} {"train_loss": -5.346757888793945, "global_step": 22828, "epoch": 543} {"train_loss": -5.424219131469727, "global_step": 22829, "epoch": 543} {"train_loss": -5.440998077392578, "global_step": 22830, "epoch": 543} {"train_loss": -5.425782680511475, "global_step": 22831, "epoch": 543} {"train_loss": -5.403531074523926, "global_step": 22832, "epoch": 543} {"train_loss": -5.274611949920654, "global_step": 22833, "epoch": 543} {"train_loss": -5.367948532104492, "global_step": 22834, "epoch": 543} {"train_loss": -5.243253231048584, "global_step": 22835, "epoch": 543} {"train_loss": -5.394771099090576, "global_step": 22836, "epoch": 543} {"train_loss": -5.215547561645508, "global_step": 22837, "epoch": 543} {"train_loss": -5.369272232055664, "global_step": 22838, "epoch": 543} {"train_loss": -5.382592678070068, "global_step": 22839, "epoch": 543} {"train_loss": -5.405738830566406, "global_step": 22840, "epoch": 543} {"train_loss": -5.401773452758789, "global_step": 22841, "epoch": 543} {"train_loss": -5.345712184906006, "global_step": 22842, "epoch": 543} {"train_loss": -5.313384056091309, "global_step": 22843, "epoch": 543} {"train_loss": -5.430819511413574, "global_step": 22844, "epoch": 543} {"train_loss": -5.293213844299316, "global_step": 22845, "epoch": 543} {"train_loss": -5.339332580566406, "global_step": 22846, "epoch": 543} {"train_loss": -5.374453680855887, "global_step": 22847, "epoch": 543, "val_loss": 67915.09375} {"train_loss": -5.49039888381958, "global_step": 22848, "epoch": 544} {"train_loss": -5.338796615600586, "global_step": 22849, "epoch": 544} {"train_loss": -5.332468032836914, "global_step": 22850, "epoch": 544} {"train_loss": -5.446121692657471, "global_step": 22851, "epoch": 544} {"train_loss": -5.350910186767578, "global_step": 22852, "epoch": 544} {"train_loss": -5.22606086730957, "global_step": 22853, "epoch": 544} {"train_loss": -5.403620719909668, "global_step": 22854, "epoch": 544} {"train_loss": -5.371484756469727, "global_step": 22855, "epoch": 544} {"train_loss": -5.444623947143555, "global_step": 22856, "epoch": 544} {"train_loss": -5.354919910430908, "global_step": 22857, "epoch": 544} {"train_loss": -5.426955699920654, "global_step": 22858, "epoch": 544} {"train_loss": -5.406167984008789, "global_step": 22859, "epoch": 544} {"train_loss": -5.194394111633301, "global_step": 22860, "epoch": 544} {"train_loss": -5.483311653137207, "global_step": 22861, "epoch": 544} {"train_loss": -5.372641563415527, "global_step": 22862, "epoch": 544} {"train_loss": -5.44773006439209, "global_step": 22863, "epoch": 544} {"train_loss": -5.48808479309082, "global_step": 22864, "epoch": 544} {"train_loss": -5.512747764587402, "global_step": 22865, "epoch": 544} {"train_loss": -5.270614147186279, "global_step": 22866, "epoch": 544} {"train_loss": -5.30267858505249, "global_step": 22867, "epoch": 544} {"train_loss": -5.362795829772949, "global_step": 22868, "epoch": 544} {"train_loss": -5.414621829986572, "global_step": 22869, "epoch": 544} {"train_loss": -5.419206619262695, "global_step": 22870, "epoch": 544} {"train_loss": -5.406774520874023, "global_step": 22871, "epoch": 544} {"train_loss": -5.348928928375244, "global_step": 22872, "epoch": 544} {"train_loss": -5.310029029846191, "global_step": 22873, "epoch": 544} {"train_loss": -5.4665846824646, "global_step": 22874, "epoch": 544} {"train_loss": -5.454038619995117, "global_step": 22875, "epoch": 544} {"train_loss": -5.325088024139404, "global_step": 22876, "epoch": 544} {"train_loss": -5.257899284362793, "global_step": 22877, "epoch": 544} {"train_loss": -5.481151580810547, "global_step": 22878, "epoch": 544} {"train_loss": -5.445751190185547, "global_step": 22879, "epoch": 544} {"train_loss": -5.514908313751221, "global_step": 22880, "epoch": 544} {"train_loss": -5.2926788330078125, "global_step": 22881, "epoch": 544} {"train_loss": -5.182213306427002, "global_step": 22882, "epoch": 544} {"train_loss": -5.354124069213867, "global_step": 22883, "epoch": 544} {"train_loss": -5.407070636749268, "global_step": 22884, "epoch": 544} {"train_loss": -5.151012420654297, "global_step": 22885, "epoch": 544} {"train_loss": -5.113185405731201, "global_step": 22886, "epoch": 544} {"train_loss": -5.178948402404785, "global_step": 22887, "epoch": 544} {"train_loss": -5.1160173416137695, "global_step": 22888, "epoch": 544} {"train_loss": -5.357440585181827, "global_step": 22889, "epoch": 544, "val_loss": 69542.7265625} {"train_loss": -5.2637481689453125, "global_step": 22890, "epoch": 545} {"train_loss": -5.2756428718566895, "global_step": 22891, "epoch": 545} {"train_loss": -5.231143951416016, "global_step": 22892, "epoch": 545} {"train_loss": -5.411108016967773, "global_step": 22893, "epoch": 545} {"train_loss": -5.234762668609619, "global_step": 22894, "epoch": 545} {"train_loss": -5.225731372833252, "global_step": 22895, "epoch": 545} {"train_loss": -5.266243934631348, "global_step": 22896, "epoch": 545} {"train_loss": -5.264096260070801, "global_step": 22897, "epoch": 545} {"train_loss": -5.350741386413574, "global_step": 22898, "epoch": 545} {"train_loss": -5.267267227172852, "global_step": 22899, "epoch": 545} {"train_loss": -5.331151962280273, "global_step": 22900, "epoch": 545} {"train_loss": -5.233352184295654, "global_step": 22901, "epoch": 545} {"train_loss": -5.360424995422363, "global_step": 22902, "epoch": 545} {"train_loss": -5.355327606201172, "global_step": 22903, "epoch": 545} {"train_loss": -5.364660739898682, "global_step": 22904, "epoch": 545} {"train_loss": -5.366909503936768, "global_step": 22905, "epoch": 545} {"train_loss": -5.354907035827637, "global_step": 22906, "epoch": 545} {"train_loss": -5.237542152404785, "global_step": 22907, "epoch": 545} {"train_loss": -5.50650691986084, "global_step": 22908, "epoch": 545} {"train_loss": -5.321413040161133, "global_step": 22909, "epoch": 545} {"train_loss": -5.336034774780273, "global_step": 22910, "epoch": 545} {"train_loss": -5.438426971435547, "global_step": 22911, "epoch": 545} {"train_loss": -5.189819812774658, "global_step": 22912, "epoch": 545} {"train_loss": -5.348696708679199, "global_step": 22913, "epoch": 545} {"train_loss": -5.403700351715088, "global_step": 22914, "epoch": 545} {"train_loss": -5.35133171081543, "global_step": 22915, "epoch": 545} {"train_loss": -5.374759674072266, "global_step": 22916, "epoch": 545} {"train_loss": -5.357241630554199, "global_step": 22917, "epoch": 545} {"train_loss": -5.257919788360596, "global_step": 22918, "epoch": 545} {"train_loss": -5.472173690795898, "global_step": 22919, "epoch": 545} {"train_loss": -5.41393518447876, "global_step": 22920, "epoch": 545} {"train_loss": -5.431138038635254, "global_step": 22921, "epoch": 545} {"train_loss": -5.197562217712402, "global_step": 22922, "epoch": 545} {"train_loss": -5.449868202209473, "global_step": 22923, "epoch": 545} {"train_loss": -5.382394313812256, "global_step": 22924, "epoch": 545} {"train_loss": -5.428908824920654, "global_step": 22925, "epoch": 545} {"train_loss": -5.408022880554199, "global_step": 22926, "epoch": 545} {"train_loss": -5.3955559730529785, "global_step": 22927, "epoch": 545} {"train_loss": -5.343879222869873, "global_step": 22928, "epoch": 545} {"train_loss": -5.365950584411621, "global_step": 22929, "epoch": 545} {"train_loss": -5.409719467163086, "global_step": 22930, "epoch": 545} {"train_loss": -5.341033946900141, "global_step": 22931, "epoch": 545, "val_loss": 68376.3515625} {"train_loss": -5.419521331787109, "global_step": 22932, "epoch": 546} {"train_loss": -5.424300670623779, "global_step": 22933, "epoch": 546} {"train_loss": -5.439883232116699, "global_step": 22934, "epoch": 546} {"train_loss": -5.4707207679748535, "global_step": 22935, "epoch": 546} {"train_loss": -5.313175201416016, "global_step": 22936, "epoch": 546} {"train_loss": -5.340925216674805, "global_step": 22937, "epoch": 546} {"train_loss": -5.35971736907959, "global_step": 22938, "epoch": 546} {"train_loss": -5.382879257202148, "global_step": 22939, "epoch": 546} {"train_loss": -5.427987098693848, "global_step": 22940, "epoch": 546} {"train_loss": -5.314413070678711, "global_step": 22941, "epoch": 546} {"train_loss": -5.238070487976074, "global_step": 22942, "epoch": 546} {"train_loss": -5.363890171051025, "global_step": 22943, "epoch": 546} {"train_loss": -5.1895647048950195, "global_step": 22944, "epoch": 546} {"train_loss": -5.187529563903809, "global_step": 22945, "epoch": 546} {"train_loss": -5.166922569274902, "global_step": 22946, "epoch": 546} {"train_loss": -5.343125343322754, "global_step": 22947, "epoch": 546} {"train_loss": -5.514678001403809, "global_step": 22948, "epoch": 546} {"train_loss": -5.34960412979126, "global_step": 22949, "epoch": 546} {"train_loss": -5.319049835205078, "global_step": 22950, "epoch": 546} {"train_loss": -5.391681671142578, "global_step": 22951, "epoch": 546} {"train_loss": -5.291084289550781, "global_step": 22952, "epoch": 546} {"train_loss": -5.203023910522461, "global_step": 22953, "epoch": 546} {"train_loss": -5.283982753753662, "global_step": 22954, "epoch": 546} {"train_loss": -5.403987884521484, "global_step": 22955, "epoch": 546} {"train_loss": -5.373771667480469, "global_step": 22956, "epoch": 546} {"train_loss": -5.209722995758057, "global_step": 22957, "epoch": 546} {"train_loss": -5.241497993469238, "global_step": 22958, "epoch": 546} {"train_loss": -5.331097602844238, "global_step": 22959, "epoch": 546} {"train_loss": -5.337825775146484, "global_step": 22960, "epoch": 546} {"train_loss": -5.317246437072754, "global_step": 22961, "epoch": 546} {"train_loss": -5.2684645652771, "global_step": 22962, "epoch": 546} {"train_loss": -5.345238208770752, "global_step": 22963, "epoch": 546} {"train_loss": -5.352551460266113, "global_step": 22964, "epoch": 546} {"train_loss": -5.344796180725098, "global_step": 22965, "epoch": 546} {"train_loss": -5.451866149902344, "global_step": 22966, "epoch": 546} {"train_loss": -5.468166351318359, "global_step": 22967, "epoch": 546} {"train_loss": -5.2714996337890625, "global_step": 22968, "epoch": 546} {"train_loss": -5.379786968231201, "global_step": 22969, "epoch": 546} {"train_loss": -5.413145065307617, "global_step": 22970, "epoch": 546} {"train_loss": -5.331672191619873, "global_step": 22971, "epoch": 546} {"train_loss": -5.324721336364746, "global_step": 22972, "epoch": 546} {"train_loss": -5.340111823309035, "global_step": 22973, "epoch": 546, "val_loss": 68263.0546875} {"train_loss": -5.356813907623291, "global_step": 22974, "epoch": 547} {"train_loss": -5.454796314239502, "global_step": 22975, "epoch": 547} {"train_loss": -5.456315994262695, "global_step": 22976, "epoch": 547} {"train_loss": -5.4022064208984375, "global_step": 22977, "epoch": 547} {"train_loss": -5.393036365509033, "global_step": 22978, "epoch": 547} {"train_loss": -5.421725273132324, "global_step": 22979, "epoch": 547} {"train_loss": -5.269876480102539, "global_step": 22980, "epoch": 547} {"train_loss": -5.4344682693481445, "global_step": 22981, "epoch": 547} {"train_loss": -5.395506858825684, "global_step": 22982, "epoch": 547} {"train_loss": -5.444676399230957, "global_step": 22983, "epoch": 547} {"train_loss": -5.388023376464844, "global_step": 22984, "epoch": 547} {"train_loss": -5.329743385314941, "global_step": 22985, "epoch": 547} {"train_loss": -5.299228191375732, "global_step": 22986, "epoch": 547} {"train_loss": -5.2939558029174805, "global_step": 22987, "epoch": 547} {"train_loss": -5.389170169830322, "global_step": 22988, "epoch": 547} {"train_loss": -5.308175086975098, "global_step": 22989, "epoch": 547} {"train_loss": -5.4130048751831055, "global_step": 22990, "epoch": 547} {"train_loss": -5.385216236114502, "global_step": 22991, "epoch": 547} {"train_loss": -5.349740028381348, "global_step": 22992, "epoch": 547} {"train_loss": -5.324714183807373, "global_step": 22993, "epoch": 547} {"train_loss": -5.427483558654785, "global_step": 22994, "epoch": 547} {"train_loss": -5.259655952453613, "global_step": 22995, "epoch": 547} {"train_loss": -5.480121612548828, "global_step": 22996, "epoch": 547} {"train_loss": -5.450860977172852, "global_step": 22997, "epoch": 547} {"train_loss": -5.481402397155762, "global_step": 22998, "epoch": 547} {"train_loss": -5.346189498901367, "global_step": 22999, "epoch": 547} {"train_loss": -5.386907577514648, "global_step": 23000, "epoch": 547} {"train_loss": -5.414134502410889, "global_step": 23001, "epoch": 547} {"train_loss": -5.294092178344727, "global_step": 23002, "epoch": 547} {"train_loss": -5.406698703765869, "global_step": 23003, "epoch": 547} {"train_loss": -5.331894874572754, "global_step": 23004, "epoch": 547} {"train_loss": -5.302040100097656, "global_step": 23005, "epoch": 547} {"train_loss": -5.372719764709473, "global_step": 23006, "epoch": 547} {"train_loss": -5.393481731414795, "global_step": 23007, "epoch": 547} {"train_loss": -5.414638996124268, "global_step": 23008, "epoch": 547} {"train_loss": -5.285497665405273, "global_step": 23009, "epoch": 547} {"train_loss": -5.419449806213379, "global_step": 23010, "epoch": 547} {"train_loss": -5.323221206665039, "global_step": 23011, "epoch": 547} {"train_loss": -5.28514289855957, "global_step": 23012, "epoch": 547} {"train_loss": -5.292657852172852, "global_step": 23013, "epoch": 547} {"train_loss": -5.213439464569092, "global_step": 23014, "epoch": 547} {"train_loss": -5.365754558926537, "global_step": 23015, "epoch": 547, "val_loss": 68488.28125} {"train_loss": -5.445505619049072, "global_step": 23016, "epoch": 548} {"train_loss": -5.36436128616333, "global_step": 23017, "epoch": 548} {"train_loss": -5.170915126800537, "global_step": 23018, "epoch": 548} {"train_loss": -5.282578468322754, "global_step": 23019, "epoch": 548} {"train_loss": -5.180214881896973, "global_step": 23020, "epoch": 548} {"train_loss": -5.272092342376709, "global_step": 23021, "epoch": 548} {"train_loss": -5.202415943145752, "global_step": 23022, "epoch": 548} {"train_loss": -5.2771382331848145, "global_step": 23023, "epoch": 548} {"train_loss": -5.203482627868652, "global_step": 23024, "epoch": 548} {"train_loss": -5.434546947479248, "global_step": 23025, "epoch": 548} {"train_loss": -5.306456565856934, "global_step": 23026, "epoch": 548} {"train_loss": -5.266453266143799, "global_step": 23027, "epoch": 548} {"train_loss": -5.358662128448486, "global_step": 23028, "epoch": 548} {"train_loss": -5.363675594329834, "global_step": 23029, "epoch": 548} {"train_loss": -5.3672966957092285, "global_step": 23030, "epoch": 548} {"train_loss": -5.4467973709106445, "global_step": 23031, "epoch": 548} {"train_loss": -5.30611515045166, "global_step": 23032, "epoch": 548} {"train_loss": -5.384994983673096, "global_step": 23033, "epoch": 548} {"train_loss": -5.293904781341553, "global_step": 23034, "epoch": 548} {"train_loss": -5.279786109924316, "global_step": 23035, "epoch": 548} {"train_loss": -5.3259453773498535, "global_step": 23036, "epoch": 548} {"train_loss": -5.405300617218018, "global_step": 23037, "epoch": 548} {"train_loss": -5.577077388763428, "global_step": 23038, "epoch": 548} {"train_loss": -5.295015335083008, "global_step": 23039, "epoch": 548} {"train_loss": -5.413345813751221, "global_step": 23040, "epoch": 548} {"train_loss": -5.449765682220459, "global_step": 23041, "epoch": 548} {"train_loss": -5.393933296203613, "global_step": 23042, "epoch": 548} {"train_loss": -5.449948310852051, "global_step": 23043, "epoch": 548} {"train_loss": -5.273879528045654, "global_step": 23044, "epoch": 548} {"train_loss": -5.2794880867004395, "global_step": 23045, "epoch": 548} {"train_loss": -5.475919246673584, "global_step": 23046, "epoch": 548} {"train_loss": -5.290493011474609, "global_step": 23047, "epoch": 548} {"train_loss": -5.344231128692627, "global_step": 23048, "epoch": 548} {"train_loss": -5.456051826477051, "global_step": 23049, "epoch": 548} {"train_loss": -5.443595886230469, "global_step": 23050, "epoch": 548} {"train_loss": -5.290491580963135, "global_step": 23051, "epoch": 548} {"train_loss": -5.314316749572754, "global_step": 23052, "epoch": 548} {"train_loss": -5.474010944366455, "global_step": 23053, "epoch": 548} {"train_loss": -5.147576332092285, "global_step": 23054, "epoch": 548} {"train_loss": -5.291516304016113, "global_step": 23055, "epoch": 548} {"train_loss": -5.3763651847839355, "global_step": 23056, "epoch": 548} {"train_loss": -5.3401619252704435, "global_step": 23057, "epoch": 548, "val_loss": 68376.734375} {"train_loss": -5.326553821563721, "global_step": 23058, "epoch": 549} {"train_loss": -5.329803466796875, "global_step": 23059, "epoch": 549} {"train_loss": -5.419049263000488, "global_step": 23060, "epoch": 549} {"train_loss": -5.2830400466918945, "global_step": 23061, "epoch": 549} {"train_loss": -5.454831123352051, "global_step": 23062, "epoch": 549} {"train_loss": -5.314476013183594, "global_step": 23063, "epoch": 549} {"train_loss": -5.339829444885254, "global_step": 23064, "epoch": 549} {"train_loss": -5.496591091156006, "global_step": 23065, "epoch": 549} {"train_loss": -5.317046165466309, "global_step": 23066, "epoch": 549} {"train_loss": -5.361762046813965, "global_step": 23067, "epoch": 549} {"train_loss": -5.329654693603516, "global_step": 23068, "epoch": 549} {"train_loss": -5.48620080947876, "global_step": 23069, "epoch": 549} {"train_loss": -5.387404441833496, "global_step": 23070, "epoch": 549} {"train_loss": -5.277281284332275, "global_step": 23071, "epoch": 549} {"train_loss": -5.375249862670898, "global_step": 23072, "epoch": 549} {"train_loss": -5.284480094909668, "global_step": 23073, "epoch": 549} {"train_loss": -5.338613986968994, "global_step": 23074, "epoch": 549} {"train_loss": -5.46776819229126, "global_step": 23075, "epoch": 549} {"train_loss": -5.480391502380371, "global_step": 23076, "epoch": 549} {"train_loss": -5.430166244506836, "global_step": 23077, "epoch": 549} {"train_loss": -5.35734748840332, "global_step": 23078, "epoch": 549} {"train_loss": -5.337861061096191, "global_step": 23079, "epoch": 549} {"train_loss": -5.492994785308838, "global_step": 23080, "epoch": 549} {"train_loss": -5.382046699523926, "global_step": 23081, "epoch": 549} {"train_loss": -5.399078369140625, "global_step": 23082, "epoch": 549} {"train_loss": -5.233331680297852, "global_step": 23083, "epoch": 549} {"train_loss": -5.403215408325195, "global_step": 23084, "epoch": 549} {"train_loss": -5.330506324768066, "global_step": 23085, "epoch": 549} {"train_loss": -5.264529228210449, "global_step": 23086, "epoch": 549} {"train_loss": -5.301434516906738, "global_step": 23087, "epoch": 549} {"train_loss": -5.315556526184082, "global_step": 23088, "epoch": 549} {"train_loss": -5.438035488128662, "global_step": 23089, "epoch": 549} {"train_loss": -5.377842903137207, "global_step": 23090, "epoch": 549} {"train_loss": -5.4410905838012695, "global_step": 23091, "epoch": 549} {"train_loss": -5.347373962402344, "global_step": 23092, "epoch": 549} {"train_loss": -5.385096549987793, "global_step": 23093, "epoch": 549} {"train_loss": -5.384377479553223, "global_step": 23094, "epoch": 549} {"train_loss": -5.406511306762695, "global_step": 23095, "epoch": 549} {"train_loss": -5.446188449859619, "global_step": 23096, "epoch": 549} {"train_loss": -5.495303630828857, "global_step": 23097, "epoch": 549} {"train_loss": -5.366497993469238, "global_step": 23098, "epoch": 549} {"train_loss": -5.375809737614223, "global_step": 23099, "epoch": 549, "val_loss": 68069.1328125} {"train_loss": -5.463689804077148, "global_step": 23100, "epoch": 550} {"train_loss": -5.505878448486328, "global_step": 23101, "epoch": 550} {"train_loss": -5.314082622528076, "global_step": 23102, "epoch": 550} {"train_loss": -5.44559907913208, "global_step": 23103, "epoch": 550} {"train_loss": -5.374849319458008, "global_step": 23104, "epoch": 550} {"train_loss": -5.256734848022461, "global_step": 23105, "epoch": 550} {"train_loss": -5.4825520515441895, "global_step": 23106, "epoch": 550} {"train_loss": -5.282034873962402, "global_step": 23107, "epoch": 550} {"train_loss": -5.353272438049316, "global_step": 23108, "epoch": 550} {"train_loss": -5.45672607421875, "global_step": 23109, "epoch": 550} {"train_loss": -5.2784013748168945, "global_step": 23110, "epoch": 550} {"train_loss": -5.438695907592773, "global_step": 23111, "epoch": 550} {"train_loss": -5.4069647789001465, "global_step": 23112, "epoch": 550} {"train_loss": -5.5239057540893555, "global_step": 23113, "epoch": 550} {"train_loss": -5.508464813232422, "global_step": 23114, "epoch": 550} {"train_loss": -5.43583869934082, "global_step": 23115, "epoch": 550} {"train_loss": -5.310408115386963, "global_step": 23116, "epoch": 550} {"train_loss": -5.294111251831055, "global_step": 23117, "epoch": 550} {"train_loss": -5.407842636108398, "global_step": 23118, "epoch": 550} {"train_loss": -5.4969563484191895, "global_step": 23119, "epoch": 550} {"train_loss": -5.363076686859131, "global_step": 23120, "epoch": 550} {"train_loss": -5.3615899085998535, "global_step": 23121, "epoch": 550} {"train_loss": -5.2384538650512695, "global_step": 23122, "epoch": 550} {"train_loss": -5.275781631469727, "global_step": 23123, "epoch": 550} {"train_loss": -5.273819446563721, "global_step": 23124, "epoch": 550} {"train_loss": -5.466428756713867, "global_step": 23125, "epoch": 550} {"train_loss": -5.291625022888184, "global_step": 23126, "epoch": 550} {"train_loss": -5.222163677215576, "global_step": 23127, "epoch": 550} {"train_loss": -5.465900421142578, "global_step": 23128, "epoch": 550} {"train_loss": -5.333587646484375, "global_step": 23129, "epoch": 550} {"train_loss": -5.448002815246582, "global_step": 23130, "epoch": 550} {"train_loss": -5.433815956115723, "global_step": 23131, "epoch": 550} {"train_loss": -5.393444061279297, "global_step": 23132, "epoch": 550} {"train_loss": -5.127981662750244, "global_step": 23133, "epoch": 550} {"train_loss": -5.362855911254883, "global_step": 23134, "epoch": 550} {"train_loss": -5.218130111694336, "global_step": 23135, "epoch": 550} {"train_loss": -5.280348777770996, "global_step": 23136, "epoch": 550} {"train_loss": -5.50252103805542, "global_step": 23137, "epoch": 550} {"train_loss": -5.367377281188965, "global_step": 23138, "epoch": 550} {"train_loss": -5.373661041259766, "global_step": 23139, "epoch": 550} {"train_loss": -5.376439094543457, "global_step": 23140, "epoch": 550} {"train_loss": -5.373853252047584, "global_step": 23141, "epoch": 550, "train/sim_max_reward_0": 0.22293397922949124, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.2028720242250457, "train/sim_max_reward_3": 0.14960211548063354, "train/sim_max_reward_4": 0.774314148214616, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.329151043395255, "test/sim_max_reward_4400001": 0.0776326508694431, "test/sim_max_reward_4400002": 0.40739238522178267, "test/sim_max_reward_4400003": 0.009867730245785317, "test/sim_max_reward_4400004": 0.31095419467364066, "test/sim_max_reward_4400005": 0.21473733692543115, "test/sim_max_reward_4400006": 0.23064767308819645, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.2933280757342888, "test/sim_max_reward_4400010": 0.43335810674039865, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.14257121782196724, "test/sim_max_reward_4400013": 0.39172341714567765, "test/sim_max_reward_4400014": 7.333912394314882e-05, "test/sim_max_reward_4400015": 0.3053478251631731, "test/sim_max_reward_4400016": 0.052552768506935535, "test/sim_max_reward_4400017": 0.16557108299710938, "test/sim_max_reward_4400018": 0.21246540526199528, "test/sim_max_reward_4400019": 0.5239836973364184, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.4320691277145037, "test/sim_max_reward_4400025": 0.2562497483093244, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.06748124963678735, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.3973095398367303, "test/sim_max_reward_4400031": 0.31048835975205585, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.13746065695651885, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.5630887887865939, "test/sim_max_reward_4400036": 0.6013734378649738, "test/sim_max_reward_4400037": 0.28166813880878316, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.8149049247325931, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.3438889779852677, "test/sim_max_reward_4400042": 0.007738010045769513, "test/sim_max_reward_4400043": 0.008543243910560282, "test/sim_max_reward_4400044": 0.006887451885095612, "test/sim_max_reward_4400045": 0.20637701738976522, "test/sim_max_reward_4400046": 0.23800882143420032, "test/sim_max_reward_4400047": 0.17982820646355469, "test/sim_max_reward_4400048": 0.038615799585110924, "test/sim_max_reward_4400049": 0.0038247312528684675, "train/mean_score": 0.25723041795562884, "test/mean_score": 0.19629135572394826, "val_loss": 68188.578125} {"train_loss": -5.472197532653809, "global_step": 23142, "epoch": 551} {"train_loss": -5.368293285369873, "global_step": 23143, "epoch": 551} {"train_loss": -5.476379871368408, "global_step": 23144, "epoch": 551} {"train_loss": -5.331674575805664, "global_step": 23145, "epoch": 551} {"train_loss": -5.412632942199707, "global_step": 23146, "epoch": 551} {"train_loss": -5.405611038208008, "global_step": 23147, "epoch": 551} {"train_loss": -5.367297172546387, "global_step": 23148, "epoch": 551} {"train_loss": -5.292355060577393, "global_step": 23149, "epoch": 551} {"train_loss": -5.203568458557129, "global_step": 23150, "epoch": 551} {"train_loss": -5.347735404968262, "global_step": 23151, "epoch": 551} {"train_loss": -5.4762959480285645, "global_step": 23152, "epoch": 551} {"train_loss": -5.342304706573486, "global_step": 23153, "epoch": 551} {"train_loss": -5.351538181304932, "global_step": 23154, "epoch": 551} {"train_loss": -5.4658403396606445, "global_step": 23155, "epoch": 551} {"train_loss": -5.374355316162109, "global_step": 23156, "epoch": 551} {"train_loss": -5.25400972366333, "global_step": 23157, "epoch": 551} {"train_loss": -5.410043716430664, "global_step": 23158, "epoch": 551} {"train_loss": -5.357131004333496, "global_step": 23159, "epoch": 551} {"train_loss": -5.298196315765381, "global_step": 23160, "epoch": 551} {"train_loss": -5.352329254150391, "global_step": 23161, "epoch": 551} {"train_loss": -5.33494758605957, "global_step": 23162, "epoch": 551} {"train_loss": -5.28559684753418, "global_step": 23163, "epoch": 551} {"train_loss": -5.434378623962402, "global_step": 23164, "epoch": 551} {"train_loss": -5.37824821472168, "global_step": 23165, "epoch": 551} {"train_loss": -5.28205680847168, "global_step": 23166, "epoch": 551} {"train_loss": -5.332664489746094, "global_step": 23167, "epoch": 551} {"train_loss": -5.554902076721191, "global_step": 23168, "epoch": 551} {"train_loss": -5.2849273681640625, "global_step": 23169, "epoch": 551} {"train_loss": -5.39958381652832, "global_step": 23170, "epoch": 551} {"train_loss": -5.383342742919922, "global_step": 23171, "epoch": 551} {"train_loss": -5.433311939239502, "global_step": 23172, "epoch": 551} {"train_loss": -5.2719926834106445, "global_step": 23173, "epoch": 551} {"train_loss": -5.31221342086792, "global_step": 23174, "epoch": 551} {"train_loss": -5.392174243927002, "global_step": 23175, "epoch": 551} {"train_loss": -5.356135368347168, "global_step": 23176, "epoch": 551} {"train_loss": -5.4076313972473145, "global_step": 23177, "epoch": 551} {"train_loss": -5.439446449279785, "global_step": 23178, "epoch": 551} {"train_loss": -5.248929500579834, "global_step": 23179, "epoch": 551} {"train_loss": -5.502272605895996, "global_step": 23180, "epoch": 551} {"train_loss": -5.291762351989746, "global_step": 23181, "epoch": 551} {"train_loss": -5.260819435119629, "global_step": 23182, "epoch": 551} {"train_loss": -5.362737950824556, "global_step": 23183, "epoch": 551, "val_loss": 67858.5859375} {"train_loss": -5.2896833419799805, "global_step": 23184, "epoch": 552} {"train_loss": -5.394388198852539, "global_step": 23185, "epoch": 552} {"train_loss": -5.373674392700195, "global_step": 23186, "epoch": 552} {"train_loss": -5.358589172363281, "global_step": 23187, "epoch": 552} {"train_loss": -5.3572163581848145, "global_step": 23188, "epoch": 552} {"train_loss": -5.274123191833496, "global_step": 23189, "epoch": 552} {"train_loss": -5.444784164428711, "global_step": 23190, "epoch": 552} {"train_loss": -5.250821590423584, "global_step": 23191, "epoch": 552} {"train_loss": -5.34318733215332, "global_step": 23192, "epoch": 552} {"train_loss": -5.335010528564453, "global_step": 23193, "epoch": 552} {"train_loss": -5.304935455322266, "global_step": 23194, "epoch": 552} {"train_loss": -5.2041850090026855, "global_step": 23195, "epoch": 552} {"train_loss": -5.525477409362793, "global_step": 23196, "epoch": 552} {"train_loss": -5.376338005065918, "global_step": 23197, "epoch": 552} {"train_loss": -5.405637741088867, "global_step": 23198, "epoch": 552} {"train_loss": -5.3715925216674805, "global_step": 23199, "epoch": 552} {"train_loss": -5.40183162689209, "global_step": 23200, "epoch": 552} {"train_loss": -5.408588409423828, "global_step": 23201, "epoch": 552} {"train_loss": -5.301887512207031, "global_step": 23202, "epoch": 552} {"train_loss": -5.412613868713379, "global_step": 23203, "epoch": 552} {"train_loss": -5.445459365844727, "global_step": 23204, "epoch": 552} {"train_loss": -5.3747992515563965, "global_step": 23205, "epoch": 552} {"train_loss": -5.376472473144531, "global_step": 23206, "epoch": 552} {"train_loss": -5.389060020446777, "global_step": 23207, "epoch": 552} {"train_loss": -5.210727691650391, "global_step": 23208, "epoch": 552} {"train_loss": -5.399898529052734, "global_step": 23209, "epoch": 552} {"train_loss": -5.404216289520264, "global_step": 23210, "epoch": 552} {"train_loss": -5.426772117614746, "global_step": 23211, "epoch": 552} {"train_loss": -5.357597351074219, "global_step": 23212, "epoch": 552} {"train_loss": -5.422285556793213, "global_step": 23213, "epoch": 552} {"train_loss": -5.397744178771973, "global_step": 23214, "epoch": 552} {"train_loss": -5.438544750213623, "global_step": 23215, "epoch": 552} {"train_loss": -5.348067283630371, "global_step": 23216, "epoch": 552} {"train_loss": -5.434665679931641, "global_step": 23217, "epoch": 552} {"train_loss": -5.40937614440918, "global_step": 23218, "epoch": 552} {"train_loss": -5.26379919052124, "global_step": 23219, "epoch": 552} {"train_loss": -5.429989337921143, "global_step": 23220, "epoch": 552} {"train_loss": -5.481607437133789, "global_step": 23221, "epoch": 552} {"train_loss": -5.268768310546875, "global_step": 23222, "epoch": 552} {"train_loss": -5.2579755783081055, "global_step": 23223, "epoch": 552} {"train_loss": -5.343145370483398, "global_step": 23224, "epoch": 552} {"train_loss": -5.3608504477001375, "global_step": 23225, "epoch": 552, "val_loss": 68818.2578125} {"train_loss": -5.401297569274902, "global_step": 23226, "epoch": 553} {"train_loss": -5.402477741241455, "global_step": 23227, "epoch": 553} {"train_loss": -5.280962944030762, "global_step": 23228, "epoch": 553} {"train_loss": -5.411299228668213, "global_step": 23229, "epoch": 553} {"train_loss": -5.351717948913574, "global_step": 23230, "epoch": 553} {"train_loss": -5.292607307434082, "global_step": 23231, "epoch": 553} {"train_loss": -5.429558753967285, "global_step": 23232, "epoch": 553} {"train_loss": -5.150793552398682, "global_step": 23233, "epoch": 553} {"train_loss": -5.443414688110352, "global_step": 23234, "epoch": 553} {"train_loss": -5.119633674621582, "global_step": 23235, "epoch": 553} {"train_loss": -5.2575225830078125, "global_step": 23236, "epoch": 553} {"train_loss": -5.328906059265137, "global_step": 23237, "epoch": 553} {"train_loss": -5.360172748565674, "global_step": 23238, "epoch": 553} {"train_loss": -5.322847843170166, "global_step": 23239, "epoch": 553} {"train_loss": -5.377044677734375, "global_step": 23240, "epoch": 553} {"train_loss": -5.189723968505859, "global_step": 23241, "epoch": 553} {"train_loss": -5.194392204284668, "global_step": 23242, "epoch": 553} {"train_loss": -5.395997524261475, "global_step": 23243, "epoch": 553} {"train_loss": -5.3704400062561035, "global_step": 23244, "epoch": 553} {"train_loss": -5.357729911804199, "global_step": 23245, "epoch": 553} {"train_loss": -5.447510719299316, "global_step": 23246, "epoch": 553} {"train_loss": -5.383035182952881, "global_step": 23247, "epoch": 553} {"train_loss": -5.180400371551514, "global_step": 23248, "epoch": 553} {"train_loss": -5.3896589279174805, "global_step": 23249, "epoch": 553} {"train_loss": -5.321309566497803, "global_step": 23250, "epoch": 553} {"train_loss": -5.334607124328613, "global_step": 23251, "epoch": 553} {"train_loss": -5.408087253570557, "global_step": 23252, "epoch": 553} {"train_loss": -5.354657173156738, "global_step": 23253, "epoch": 553} {"train_loss": -5.405413627624512, "global_step": 23254, "epoch": 553} {"train_loss": -5.345563888549805, "global_step": 23255, "epoch": 553} {"train_loss": -5.381590366363525, "global_step": 23256, "epoch": 553} {"train_loss": -5.424348831176758, "global_step": 23257, "epoch": 553} {"train_loss": -5.253885269165039, "global_step": 23258, "epoch": 553} {"train_loss": -5.413591384887695, "global_step": 23259, "epoch": 553} {"train_loss": -5.398574352264404, "global_step": 23260, "epoch": 553} {"train_loss": -5.366959571838379, "global_step": 23261, "epoch": 553} {"train_loss": -5.367184638977051, "global_step": 23262, "epoch": 553} {"train_loss": -5.422079086303711, "global_step": 23263, "epoch": 553} {"train_loss": -5.364588737487793, "global_step": 23264, "epoch": 553} {"train_loss": -5.287566184997559, "global_step": 23265, "epoch": 553} {"train_loss": -5.360752582550049, "global_step": 23266, "epoch": 553} {"train_loss": -5.341786055337815, "global_step": 23267, "epoch": 553, "val_loss": 67958.9140625} {"train_loss": -5.3343586921691895, "global_step": 23268, "epoch": 554} {"train_loss": -5.447423934936523, "global_step": 23269, "epoch": 554} {"train_loss": -5.419006824493408, "global_step": 23270, "epoch": 554} {"train_loss": -5.484407901763916, "global_step": 23271, "epoch": 554} {"train_loss": -5.374115467071533, "global_step": 23272, "epoch": 554} {"train_loss": -5.432301998138428, "global_step": 23273, "epoch": 554} {"train_loss": -5.5429277420043945, "global_step": 23274, "epoch": 554} {"train_loss": -5.349976539611816, "global_step": 23275, "epoch": 554} {"train_loss": -5.364900588989258, "global_step": 23276, "epoch": 554} {"train_loss": -5.3657002449035645, "global_step": 23277, "epoch": 554} {"train_loss": -5.430896759033203, "global_step": 23278, "epoch": 554} {"train_loss": -5.205970287322998, "global_step": 23279, "epoch": 554} {"train_loss": -5.361332893371582, "global_step": 23280, "epoch": 554} {"train_loss": -5.293112754821777, "global_step": 23281, "epoch": 554} {"train_loss": -5.267765522003174, "global_step": 23282, "epoch": 554} {"train_loss": -5.362091541290283, "global_step": 23283, "epoch": 554} {"train_loss": -5.404892921447754, "global_step": 23284, "epoch": 554} {"train_loss": -5.268346786499023, "global_step": 23285, "epoch": 554} {"train_loss": -5.302664279937744, "global_step": 23286, "epoch": 554} {"train_loss": -5.165434837341309, "global_step": 23287, "epoch": 554} {"train_loss": -5.333693981170654, "global_step": 23288, "epoch": 554} {"train_loss": -5.159300804138184, "global_step": 23289, "epoch": 554} {"train_loss": -5.395834922790527, "global_step": 23290, "epoch": 554} {"train_loss": -5.299861907958984, "global_step": 23291, "epoch": 554} {"train_loss": -5.136344909667969, "global_step": 23292, "epoch": 554} {"train_loss": -5.250541687011719, "global_step": 23293, "epoch": 554} {"train_loss": -5.004663467407227, "global_step": 23294, "epoch": 554} {"train_loss": -5.295577049255371, "global_step": 23295, "epoch": 554} {"train_loss": -5.289889335632324, "global_step": 23296, "epoch": 554} {"train_loss": -5.280121803283691, "global_step": 23297, "epoch": 554} {"train_loss": -5.339672565460205, "global_step": 23298, "epoch": 554} {"train_loss": -5.268948554992676, "global_step": 23299, "epoch": 554} {"train_loss": -5.41277551651001, "global_step": 23300, "epoch": 554} {"train_loss": -5.381469249725342, "global_step": 23301, "epoch": 554} {"train_loss": -5.4430155754089355, "global_step": 23302, "epoch": 554} {"train_loss": -5.241484642028809, "global_step": 23303, "epoch": 554} {"train_loss": -5.449135780334473, "global_step": 23304, "epoch": 554} {"train_loss": -5.344073295593262, "global_step": 23305, "epoch": 554} {"train_loss": -5.314377784729004, "global_step": 23306, "epoch": 554} {"train_loss": -5.3195648193359375, "global_step": 23307, "epoch": 554} {"train_loss": -5.308526039123535, "global_step": 23308, "epoch": 554} {"train_loss": -5.326414255868821, "global_step": 23309, "epoch": 554, "val_loss": 67856.765625} {"train_loss": -5.310208320617676, "global_step": 23310, "epoch": 555} {"train_loss": -5.327329158782959, "global_step": 23311, "epoch": 555} {"train_loss": -5.465071678161621, "global_step": 23312, "epoch": 555} {"train_loss": -5.344058990478516, "global_step": 23313, "epoch": 555} {"train_loss": -5.287556171417236, "global_step": 23314, "epoch": 555} {"train_loss": -5.280357837677002, "global_step": 23315, "epoch": 555} {"train_loss": -5.441922187805176, "global_step": 23316, "epoch": 555} {"train_loss": -5.319190979003906, "global_step": 23317, "epoch": 555} {"train_loss": -5.400951385498047, "global_step": 23318, "epoch": 555} {"train_loss": -5.34821891784668, "global_step": 23319, "epoch": 555} {"train_loss": -5.436356544494629, "global_step": 23320, "epoch": 555} {"train_loss": -5.214165687561035, "global_step": 23321, "epoch": 555} {"train_loss": -5.333211421966553, "global_step": 23322, "epoch": 555} {"train_loss": -5.355159282684326, "global_step": 23323, "epoch": 555} {"train_loss": -5.360354423522949, "global_step": 23324, "epoch": 555} {"train_loss": -5.467316150665283, "global_step": 23325, "epoch": 555} {"train_loss": -5.4504852294921875, "global_step": 23326, "epoch": 555} {"train_loss": -5.446168899536133, "global_step": 23327, "epoch": 555} {"train_loss": -5.5434112548828125, "global_step": 23328, "epoch": 555} {"train_loss": -5.310667991638184, "global_step": 23329, "epoch": 555} {"train_loss": -5.4440789222717285, "global_step": 23330, "epoch": 555} {"train_loss": -5.47004508972168, "global_step": 23331, "epoch": 555} {"train_loss": -5.338230133056641, "global_step": 23332, "epoch": 555} {"train_loss": -5.285578727722168, "global_step": 23333, "epoch": 555} {"train_loss": -5.496179580688477, "global_step": 23334, "epoch": 555} {"train_loss": -5.2727155685424805, "global_step": 23335, "epoch": 555} {"train_loss": -5.333319664001465, "global_step": 23336, "epoch": 555} {"train_loss": -5.44355583190918, "global_step": 23337, "epoch": 555} {"train_loss": -5.487523078918457, "global_step": 23338, "epoch": 555} {"train_loss": -5.34754753112793, "global_step": 23339, "epoch": 555} {"train_loss": -5.416454315185547, "global_step": 23340, "epoch": 555} {"train_loss": -5.294323921203613, "global_step": 23341, "epoch": 555} {"train_loss": -5.32253360748291, "global_step": 23342, "epoch": 555} {"train_loss": -5.302663803100586, "global_step": 23343, "epoch": 555} {"train_loss": -5.3459272384643555, "global_step": 23344, "epoch": 555} {"train_loss": -5.296530723571777, "global_step": 23345, "epoch": 555} {"train_loss": -5.523760795593262, "global_step": 23346, "epoch": 555} {"train_loss": -5.347885608673096, "global_step": 23347, "epoch": 555} {"train_loss": -5.518926620483398, "global_step": 23348, "epoch": 555} {"train_loss": -5.267569541931152, "global_step": 23349, "epoch": 555} {"train_loss": -5.424310684204102, "global_step": 23350, "epoch": 555} {"train_loss": -5.377190953209286, "global_step": 23351, "epoch": 555, "val_loss": 67969.234375} {"train_loss": -5.440079212188721, "global_step": 23352, "epoch": 556} {"train_loss": -5.399656295776367, "global_step": 23353, "epoch": 556} {"train_loss": -5.350917339324951, "global_step": 23354, "epoch": 556} {"train_loss": -5.469783782958984, "global_step": 23355, "epoch": 556} {"train_loss": -5.407052993774414, "global_step": 23356, "epoch": 556} {"train_loss": -5.512950420379639, "global_step": 23357, "epoch": 556} {"train_loss": -5.211267471313477, "global_step": 23358, "epoch": 556} {"train_loss": -5.285228252410889, "global_step": 23359, "epoch": 556} {"train_loss": -5.512838363647461, "global_step": 23360, "epoch": 556} {"train_loss": -5.186095237731934, "global_step": 23361, "epoch": 556} {"train_loss": -5.348183631896973, "global_step": 23362, "epoch": 556} {"train_loss": -5.540378570556641, "global_step": 23363, "epoch": 556} {"train_loss": -5.146731853485107, "global_step": 23364, "epoch": 556} {"train_loss": -5.30761194229126, "global_step": 23365, "epoch": 556} {"train_loss": -5.435957908630371, "global_step": 23366, "epoch": 556} {"train_loss": -5.039369106292725, "global_step": 23367, "epoch": 556} {"train_loss": -5.443725109100342, "global_step": 23368, "epoch": 556} {"train_loss": -5.09348201751709, "global_step": 23369, "epoch": 556} {"train_loss": -5.226814270019531, "global_step": 23370, "epoch": 556} {"train_loss": -5.226698398590088, "global_step": 23371, "epoch": 556} {"train_loss": -5.213796138763428, "global_step": 23372, "epoch": 556} {"train_loss": -5.336443901062012, "global_step": 23373, "epoch": 556} {"train_loss": -5.040993690490723, "global_step": 23374, "epoch": 556} {"train_loss": -5.2547502517700195, "global_step": 23375, "epoch": 556} {"train_loss": -5.274787902832031, "global_step": 23376, "epoch": 556} {"train_loss": -5.458738327026367, "global_step": 23377, "epoch": 556} {"train_loss": -5.242616653442383, "global_step": 23378, "epoch": 556} {"train_loss": -5.218443393707275, "global_step": 23379, "epoch": 556} {"train_loss": -5.262550354003906, "global_step": 23380, "epoch": 556} {"train_loss": -5.3023457527160645, "global_step": 23381, "epoch": 556} {"train_loss": -5.1403303146362305, "global_step": 23382, "epoch": 556} {"train_loss": -5.307958602905273, "global_step": 23383, "epoch": 556} {"train_loss": -5.1716203689575195, "global_step": 23384, "epoch": 556} {"train_loss": -5.378370761871338, "global_step": 23385, "epoch": 556} {"train_loss": -5.264700889587402, "global_step": 23386, "epoch": 556} {"train_loss": -5.311695575714111, "global_step": 23387, "epoch": 556} {"train_loss": -5.292949676513672, "global_step": 23388, "epoch": 556} {"train_loss": -5.383078575134277, "global_step": 23389, "epoch": 556} {"train_loss": -5.082605838775635, "global_step": 23390, "epoch": 556} {"train_loss": -5.383603572845459, "global_step": 23391, "epoch": 556} {"train_loss": -5.303536415100098, "global_step": 23392, "epoch": 556} {"train_loss": -5.299906696592059, "global_step": 23393, "epoch": 556, "val_loss": 68798.625} {"train_loss": -5.326356887817383, "global_step": 23394, "epoch": 557} {"train_loss": -5.2884626388549805, "global_step": 23395, "epoch": 557} {"train_loss": -5.319662570953369, "global_step": 23396, "epoch": 557} {"train_loss": -5.427109718322754, "global_step": 23397, "epoch": 557} {"train_loss": -5.371665000915527, "global_step": 23398, "epoch": 557} {"train_loss": -5.422011375427246, "global_step": 23399, "epoch": 557} {"train_loss": -5.306946754455566, "global_step": 23400, "epoch": 557} {"train_loss": -5.401686668395996, "global_step": 23401, "epoch": 557} {"train_loss": -5.329380512237549, "global_step": 23402, "epoch": 557} {"train_loss": -5.423047065734863, "global_step": 23403, "epoch": 557} {"train_loss": -5.310910224914551, "global_step": 23404, "epoch": 557} {"train_loss": -5.347841262817383, "global_step": 23405, "epoch": 557} {"train_loss": -5.343919277191162, "global_step": 23406, "epoch": 557} {"train_loss": -5.439595699310303, "global_step": 23407, "epoch": 557} {"train_loss": -5.329827308654785, "global_step": 23408, "epoch": 557} {"train_loss": -5.529017448425293, "global_step": 23409, "epoch": 557} {"train_loss": -5.390774250030518, "global_step": 23410, "epoch": 557} {"train_loss": -5.311829566955566, "global_step": 23411, "epoch": 557} {"train_loss": -5.4404706954956055, "global_step": 23412, "epoch": 557} {"train_loss": -5.335691452026367, "global_step": 23413, "epoch": 557} {"train_loss": -5.3003387451171875, "global_step": 23414, "epoch": 557} {"train_loss": -5.331070899963379, "global_step": 23415, "epoch": 557} {"train_loss": -5.300265789031982, "global_step": 23416, "epoch": 557} {"train_loss": -5.376911163330078, "global_step": 23417, "epoch": 557} {"train_loss": -5.403105735778809, "global_step": 23418, "epoch": 557} {"train_loss": -5.364797115325928, "global_step": 23419, "epoch": 557} {"train_loss": -5.447929382324219, "global_step": 23420, "epoch": 557} {"train_loss": -5.427790641784668, "global_step": 23421, "epoch": 557} {"train_loss": -5.384648323059082, "global_step": 23422, "epoch": 557} {"train_loss": -5.279065132141113, "global_step": 23423, "epoch": 557} {"train_loss": -5.480284690856934, "global_step": 23424, "epoch": 557} {"train_loss": -5.418595314025879, "global_step": 23425, "epoch": 557} {"train_loss": -5.346950531005859, "global_step": 23426, "epoch": 557} {"train_loss": -5.353357315063477, "global_step": 23427, "epoch": 557} {"train_loss": -5.50783634185791, "global_step": 23428, "epoch": 557} {"train_loss": -5.481217861175537, "global_step": 23429, "epoch": 557} {"train_loss": -5.352065086364746, "global_step": 23430, "epoch": 557} {"train_loss": -5.429961204528809, "global_step": 23431, "epoch": 557} {"train_loss": -5.3044939041137695, "global_step": 23432, "epoch": 557} {"train_loss": -5.293585777282715, "global_step": 23433, "epoch": 557} {"train_loss": -5.303987979888916, "global_step": 23434, "epoch": 557} {"train_loss": -5.3695006257011775, "global_step": 23435, "epoch": 557, "val_loss": 68029.921875} {"train_loss": -5.3284592628479, "global_step": 23436, "epoch": 558} {"train_loss": -5.343863010406494, "global_step": 23437, "epoch": 558} {"train_loss": -5.270217418670654, "global_step": 23438, "epoch": 558} {"train_loss": -5.404767036437988, "global_step": 23439, "epoch": 558} {"train_loss": -5.421412944793701, "global_step": 23440, "epoch": 558} {"train_loss": -5.475869655609131, "global_step": 23441, "epoch": 558} {"train_loss": -5.368237018585205, "global_step": 23442, "epoch": 558} {"train_loss": -5.45448112487793, "global_step": 23443, "epoch": 558} {"train_loss": -5.31134033203125, "global_step": 23444, "epoch": 558} {"train_loss": -5.4521803855896, "global_step": 23445, "epoch": 558} {"train_loss": -5.4911956787109375, "global_step": 23446, "epoch": 558} {"train_loss": -5.40620756149292, "global_step": 23447, "epoch": 558} {"train_loss": -5.2660017013549805, "global_step": 23448, "epoch": 558} {"train_loss": -5.364218711853027, "global_step": 23449, "epoch": 558} {"train_loss": -5.383919715881348, "global_step": 23450, "epoch": 558} {"train_loss": -5.444544315338135, "global_step": 23451, "epoch": 558} {"train_loss": -5.323695659637451, "global_step": 23452, "epoch": 558} {"train_loss": -5.351035118103027, "global_step": 23453, "epoch": 558} {"train_loss": -5.422418594360352, "global_step": 23454, "epoch": 558} {"train_loss": -5.266182899475098, "global_step": 23455, "epoch": 558} {"train_loss": -5.464164733886719, "global_step": 23456, "epoch": 558} {"train_loss": -5.34846305847168, "global_step": 23457, "epoch": 558} {"train_loss": -5.407541275024414, "global_step": 23458, "epoch": 558} {"train_loss": -5.276366710662842, "global_step": 23459, "epoch": 558} {"train_loss": -5.383020401000977, "global_step": 23460, "epoch": 558} {"train_loss": -5.339459419250488, "global_step": 23461, "epoch": 558} {"train_loss": -5.341219425201416, "global_step": 23462, "epoch": 558} {"train_loss": -5.330543518066406, "global_step": 23463, "epoch": 558} {"train_loss": -5.425626277923584, "global_step": 23464, "epoch": 558} {"train_loss": -5.40155553817749, "global_step": 23465, "epoch": 558} {"train_loss": -5.453483581542969, "global_step": 23466, "epoch": 558} {"train_loss": -5.369009971618652, "global_step": 23467, "epoch": 558} {"train_loss": -5.42575740814209, "global_step": 23468, "epoch": 558} {"train_loss": -5.317275047302246, "global_step": 23469, "epoch": 558} {"train_loss": -5.440306186676025, "global_step": 23470, "epoch": 558} {"train_loss": -5.392293453216553, "global_step": 23471, "epoch": 558} {"train_loss": -5.458541393280029, "global_step": 23472, "epoch": 558} {"train_loss": -5.318240165710449, "global_step": 23473, "epoch": 558} {"train_loss": -5.325405120849609, "global_step": 23474, "epoch": 558} {"train_loss": -5.419755935668945, "global_step": 23475, "epoch": 558} {"train_loss": -5.320246696472168, "global_step": 23476, "epoch": 558} {"train_loss": -5.37800779796782, "global_step": 23477, "epoch": 558, "val_loss": 68121.90625} {"train_loss": -5.338396072387695, "global_step": 23478, "epoch": 559} {"train_loss": -5.369931221008301, "global_step": 23479, "epoch": 559} {"train_loss": -5.44746208190918, "global_step": 23480, "epoch": 559} {"train_loss": -5.416750907897949, "global_step": 23481, "epoch": 559} {"train_loss": -5.437155723571777, "global_step": 23482, "epoch": 559} {"train_loss": -5.424886703491211, "global_step": 23483, "epoch": 559} {"train_loss": -5.510423183441162, "global_step": 23484, "epoch": 559} {"train_loss": -5.594277858734131, "global_step": 23485, "epoch": 559} {"train_loss": -5.385107040405273, "global_step": 23486, "epoch": 559} {"train_loss": -5.369407653808594, "global_step": 23487, "epoch": 559} {"train_loss": -5.253521919250488, "global_step": 23488, "epoch": 559} {"train_loss": -5.374248504638672, "global_step": 23489, "epoch": 559} {"train_loss": -5.382577896118164, "global_step": 23490, "epoch": 559} {"train_loss": -5.276367664337158, "global_step": 23491, "epoch": 559} {"train_loss": -5.396322727203369, "global_step": 23492, "epoch": 559} {"train_loss": -5.444979667663574, "global_step": 23493, "epoch": 559} {"train_loss": -5.327999114990234, "global_step": 23494, "epoch": 559} {"train_loss": -5.2705230712890625, "global_step": 23495, "epoch": 559} {"train_loss": -5.399644374847412, "global_step": 23496, "epoch": 559} {"train_loss": -5.291553497314453, "global_step": 23497, "epoch": 559} {"train_loss": -5.325944900512695, "global_step": 23498, "epoch": 559} {"train_loss": -5.407970905303955, "global_step": 23499, "epoch": 559} {"train_loss": -5.185842037200928, "global_step": 23500, "epoch": 559} {"train_loss": -5.33953857421875, "global_step": 23501, "epoch": 559} {"train_loss": -5.353620529174805, "global_step": 23502, "epoch": 559} {"train_loss": -5.335077285766602, "global_step": 23503, "epoch": 559} {"train_loss": -5.378032207489014, "global_step": 23504, "epoch": 559} {"train_loss": -5.282812118530273, "global_step": 23505, "epoch": 559} {"train_loss": -5.292497158050537, "global_step": 23506, "epoch": 559} {"train_loss": -5.2411909103393555, "global_step": 23507, "epoch": 559} {"train_loss": -5.383962631225586, "global_step": 23508, "epoch": 559} {"train_loss": -5.355943202972412, "global_step": 23509, "epoch": 559} {"train_loss": -5.424628257751465, "global_step": 23510, "epoch": 559} {"train_loss": -5.222227573394775, "global_step": 23511, "epoch": 559} {"train_loss": -5.33798885345459, "global_step": 23512, "epoch": 559} {"train_loss": -5.281013011932373, "global_step": 23513, "epoch": 559} {"train_loss": -5.265817642211914, "global_step": 23514, "epoch": 559} {"train_loss": -5.313572883605957, "global_step": 23515, "epoch": 559} {"train_loss": -5.263919830322266, "global_step": 23516, "epoch": 559} {"train_loss": -5.480542182922363, "global_step": 23517, "epoch": 559} {"train_loss": -5.344555377960205, "global_step": 23518, "epoch": 559} {"train_loss": -5.353051231020973, "global_step": 23519, "epoch": 559, "val_loss": 68124.828125} {"train_loss": -5.499385833740234, "global_step": 23520, "epoch": 560} {"train_loss": -5.435502052307129, "global_step": 23521, "epoch": 560} {"train_loss": -5.504669189453125, "global_step": 23522, "epoch": 560} {"train_loss": -5.3249969482421875, "global_step": 23523, "epoch": 560} {"train_loss": -5.397701263427734, "global_step": 23524, "epoch": 560} {"train_loss": -5.452310562133789, "global_step": 23525, "epoch": 560} {"train_loss": -5.268661975860596, "global_step": 23526, "epoch": 560} {"train_loss": -5.363344192504883, "global_step": 23527, "epoch": 560} {"train_loss": -5.300990104675293, "global_step": 23528, "epoch": 560} {"train_loss": -5.415292739868164, "global_step": 23529, "epoch": 560} {"train_loss": -5.389034271240234, "global_step": 23530, "epoch": 560} {"train_loss": -5.339476585388184, "global_step": 23531, "epoch": 560} {"train_loss": -5.211441516876221, "global_step": 23532, "epoch": 560} {"train_loss": -5.312456130981445, "global_step": 23533, "epoch": 560} {"train_loss": -5.223289489746094, "global_step": 23534, "epoch": 560} {"train_loss": -5.178822040557861, "global_step": 23535, "epoch": 560} {"train_loss": -5.440564155578613, "global_step": 23536, "epoch": 560} {"train_loss": -5.264403343200684, "global_step": 23537, "epoch": 560} {"train_loss": -5.3811540603637695, "global_step": 23538, "epoch": 560} {"train_loss": -5.249180793762207, "global_step": 23539, "epoch": 560} {"train_loss": -5.262910842895508, "global_step": 23540, "epoch": 560} {"train_loss": -5.230844497680664, "global_step": 23541, "epoch": 560} {"train_loss": -5.2503886222839355, "global_step": 23542, "epoch": 560} {"train_loss": -5.359119415283203, "global_step": 23543, "epoch": 560} {"train_loss": -5.363030910491943, "global_step": 23544, "epoch": 560} {"train_loss": -5.398937225341797, "global_step": 23545, "epoch": 560} {"train_loss": -5.4242963790893555, "global_step": 23546, "epoch": 560} {"train_loss": -5.355676651000977, "global_step": 23547, "epoch": 560} {"train_loss": -5.245731353759766, "global_step": 23548, "epoch": 560} {"train_loss": -5.343865871429443, "global_step": 23549, "epoch": 560} {"train_loss": -5.457180023193359, "global_step": 23550, "epoch": 560} {"train_loss": -5.336374759674072, "global_step": 23551, "epoch": 560} {"train_loss": -5.297595024108887, "global_step": 23552, "epoch": 560} {"train_loss": -5.496272087097168, "global_step": 23553, "epoch": 560} {"train_loss": -5.402984619140625, "global_step": 23554, "epoch": 560} {"train_loss": -5.456615924835205, "global_step": 23555, "epoch": 560} {"train_loss": -5.289162635803223, "global_step": 23556, "epoch": 560} {"train_loss": -5.334410667419434, "global_step": 23557, "epoch": 560} {"train_loss": -5.346746444702148, "global_step": 23558, "epoch": 560} {"train_loss": -5.393275260925293, "global_step": 23559, "epoch": 560} {"train_loss": -5.377297401428223, "global_step": 23560, "epoch": 560} {"train_loss": -5.3481271380469915, "global_step": 23561, "epoch": 560, "val_loss": 68183.234375} {"train_loss": -5.417858600616455, "global_step": 23562, "epoch": 561} {"train_loss": -5.3354010581970215, "global_step": 23563, "epoch": 561} {"train_loss": -5.283572673797607, "global_step": 23564, "epoch": 561} {"train_loss": -5.139091491699219, "global_step": 23565, "epoch": 561} {"train_loss": -5.403397083282471, "global_step": 23566, "epoch": 561} {"train_loss": -5.3321099281311035, "global_step": 23567, "epoch": 561} {"train_loss": -5.427075386047363, "global_step": 23568, "epoch": 561} {"train_loss": -5.419817924499512, "global_step": 23569, "epoch": 561} {"train_loss": -5.370882987976074, "global_step": 23570, "epoch": 561} {"train_loss": -5.313848972320557, "global_step": 23571, "epoch": 561} {"train_loss": -5.486490249633789, "global_step": 23572, "epoch": 561} {"train_loss": -5.30526065826416, "global_step": 23573, "epoch": 561} {"train_loss": -5.344160079956055, "global_step": 23574, "epoch": 561} {"train_loss": -5.3064117431640625, "global_step": 23575, "epoch": 561} {"train_loss": -5.393237113952637, "global_step": 23576, "epoch": 561} {"train_loss": -5.496427536010742, "global_step": 23577, "epoch": 561} {"train_loss": -5.4923295974731445, "global_step": 23578, "epoch": 561} {"train_loss": -5.4237260818481445, "global_step": 23579, "epoch": 561} {"train_loss": -5.419198036193848, "global_step": 23580, "epoch": 561} {"train_loss": -5.517803192138672, "global_step": 23581, "epoch": 561} {"train_loss": -5.371944904327393, "global_step": 23582, "epoch": 561} {"train_loss": -5.336926460266113, "global_step": 23583, "epoch": 561} {"train_loss": -5.410931587219238, "global_step": 23584, "epoch": 561} {"train_loss": -5.302074432373047, "global_step": 23585, "epoch": 561} {"train_loss": -5.2859296798706055, "global_step": 23586, "epoch": 561} {"train_loss": -5.33732795715332, "global_step": 23587, "epoch": 561} {"train_loss": -5.131075382232666, "global_step": 23588, "epoch": 561} {"train_loss": -5.382904529571533, "global_step": 23589, "epoch": 561} {"train_loss": -5.380099773406982, "global_step": 23590, "epoch": 561} {"train_loss": -5.261486530303955, "global_step": 23591, "epoch": 561} {"train_loss": -5.317934989929199, "global_step": 23592, "epoch": 561} {"train_loss": -5.325157165527344, "global_step": 23593, "epoch": 561} {"train_loss": -5.398561000823975, "global_step": 23594, "epoch": 561} {"train_loss": -5.356866359710693, "global_step": 23595, "epoch": 561} {"train_loss": -5.28059196472168, "global_step": 23596, "epoch": 561} {"train_loss": -5.350668907165527, "global_step": 23597, "epoch": 561} {"train_loss": -5.45450496673584, "global_step": 23598, "epoch": 561} {"train_loss": -5.391869068145752, "global_step": 23599, "epoch": 561} {"train_loss": -5.461965560913086, "global_step": 23600, "epoch": 561} {"train_loss": -5.285144329071045, "global_step": 23601, "epoch": 561} {"train_loss": -5.357806205749512, "global_step": 23602, "epoch": 561} {"train_loss": -5.358500673657372, "global_step": 23603, "epoch": 561, "val_loss": 67821.7890625} {"train_loss": -5.5108747482299805, "global_step": 23604, "epoch": 562} {"train_loss": -5.486910820007324, "global_step": 23605, "epoch": 562} {"train_loss": -5.295454978942871, "global_step": 23606, "epoch": 562} {"train_loss": -5.437932968139648, "global_step": 23607, "epoch": 562} {"train_loss": -5.296950340270996, "global_step": 23608, "epoch": 562} {"train_loss": -5.315797805786133, "global_step": 23609, "epoch": 562} {"train_loss": -5.451977252960205, "global_step": 23610, "epoch": 562} {"train_loss": -5.439208507537842, "global_step": 23611, "epoch": 562} {"train_loss": -5.488944053649902, "global_step": 23612, "epoch": 562} {"train_loss": -5.263233184814453, "global_step": 23613, "epoch": 562} {"train_loss": -5.498976707458496, "global_step": 23614, "epoch": 562} {"train_loss": -5.318002700805664, "global_step": 23615, "epoch": 562} {"train_loss": -5.130215644836426, "global_step": 23616, "epoch": 562} {"train_loss": -5.427170276641846, "global_step": 23617, "epoch": 562} {"train_loss": -5.273716926574707, "global_step": 23618, "epoch": 562} {"train_loss": -5.354730129241943, "global_step": 23619, "epoch": 562} {"train_loss": -5.234563827514648, "global_step": 23620, "epoch": 562} {"train_loss": -5.245438575744629, "global_step": 23621, "epoch": 562} {"train_loss": -5.535137176513672, "global_step": 23622, "epoch": 562} {"train_loss": -5.377779006958008, "global_step": 23623, "epoch": 562} {"train_loss": -5.312717437744141, "global_step": 23624, "epoch": 562} {"train_loss": -5.267521858215332, "global_step": 23625, "epoch": 562} {"train_loss": -5.3325018882751465, "global_step": 23626, "epoch": 562} {"train_loss": -5.340826988220215, "global_step": 23627, "epoch": 562} {"train_loss": -5.342589378356934, "global_step": 23628, "epoch": 562} {"train_loss": -5.330654621124268, "global_step": 23629, "epoch": 562} {"train_loss": -5.377425670623779, "global_step": 23630, "epoch": 562} {"train_loss": -5.282958030700684, "global_step": 23631, "epoch": 562} {"train_loss": -5.449397087097168, "global_step": 23632, "epoch": 562} {"train_loss": -5.416055202484131, "global_step": 23633, "epoch": 562} {"train_loss": -5.220627307891846, "global_step": 23634, "epoch": 562} {"train_loss": -5.519162654876709, "global_step": 23635, "epoch": 562} {"train_loss": -5.364349365234375, "global_step": 23636, "epoch": 562} {"train_loss": -5.184251308441162, "global_step": 23637, "epoch": 562} {"train_loss": -5.483312606811523, "global_step": 23638, "epoch": 562} {"train_loss": -5.188543319702148, "global_step": 23639, "epoch": 562} {"train_loss": -5.393372535705566, "global_step": 23640, "epoch": 562} {"train_loss": -5.428377628326416, "global_step": 23641, "epoch": 562} {"train_loss": -5.33648157119751, "global_step": 23642, "epoch": 562} {"train_loss": -5.40523099899292, "global_step": 23643, "epoch": 562} {"train_loss": -5.254065990447998, "global_step": 23644, "epoch": 562} {"train_loss": -5.354123047419956, "global_step": 23645, "epoch": 562, "val_loss": 68070.8515625} {"train_loss": -5.329200744628906, "global_step": 23646, "epoch": 563} {"train_loss": -5.354784965515137, "global_step": 23647, "epoch": 563} {"train_loss": -5.386127948760986, "global_step": 23648, "epoch": 563} {"train_loss": -5.360292434692383, "global_step": 23649, "epoch": 563} {"train_loss": -5.3229522705078125, "global_step": 23650, "epoch": 563} {"train_loss": -5.329655647277832, "global_step": 23651, "epoch": 563} {"train_loss": -5.334423065185547, "global_step": 23652, "epoch": 563} {"train_loss": -5.49399995803833, "global_step": 23653, "epoch": 563} {"train_loss": -5.390804290771484, "global_step": 23654, "epoch": 563} {"train_loss": -5.325094699859619, "global_step": 23655, "epoch": 563} {"train_loss": -5.439729690551758, "global_step": 23656, "epoch": 563} {"train_loss": -5.431607723236084, "global_step": 23657, "epoch": 563} {"train_loss": -5.3879876136779785, "global_step": 23658, "epoch": 563} {"train_loss": -5.401194095611572, "global_step": 23659, "epoch": 563} {"train_loss": -5.2744574546813965, "global_step": 23660, "epoch": 563} {"train_loss": -5.234335899353027, "global_step": 23661, "epoch": 563} {"train_loss": -5.29971170425415, "global_step": 23662, "epoch": 563} {"train_loss": -5.428579330444336, "global_step": 23663, "epoch": 563} {"train_loss": -5.349635124206543, "global_step": 23664, "epoch": 563} {"train_loss": -5.349738121032715, "global_step": 23665, "epoch": 563} {"train_loss": -5.318362712860107, "global_step": 23666, "epoch": 563} {"train_loss": -5.289612293243408, "global_step": 23667, "epoch": 563} {"train_loss": -5.360159397125244, "global_step": 23668, "epoch": 563} {"train_loss": -5.415596008300781, "global_step": 23669, "epoch": 563} {"train_loss": -5.343403339385986, "global_step": 23670, "epoch": 563} {"train_loss": -5.4403977394104, "global_step": 23671, "epoch": 563} {"train_loss": -5.373808860778809, "global_step": 23672, "epoch": 563} {"train_loss": -5.275645732879639, "global_step": 23673, "epoch": 563} {"train_loss": -5.465518951416016, "global_step": 23674, "epoch": 563} {"train_loss": -5.240668296813965, "global_step": 23675, "epoch": 563} {"train_loss": -5.308521270751953, "global_step": 23676, "epoch": 563} {"train_loss": -5.259288787841797, "global_step": 23677, "epoch": 563} {"train_loss": -5.225433349609375, "global_step": 23678, "epoch": 563} {"train_loss": -5.358063697814941, "global_step": 23679, "epoch": 563} {"train_loss": -5.072018146514893, "global_step": 23680, "epoch": 563} {"train_loss": -5.444518089294434, "global_step": 23681, "epoch": 563} {"train_loss": -5.2564897537231445, "global_step": 23682, "epoch": 563} {"train_loss": -5.142352104187012, "global_step": 23683, "epoch": 563} {"train_loss": -5.318111896514893, "global_step": 23684, "epoch": 563} {"train_loss": -5.175962448120117, "global_step": 23685, "epoch": 563} {"train_loss": -5.271514892578125, "global_step": 23686, "epoch": 563} {"train_loss": -5.330649954932077, "global_step": 23687, "epoch": 563, "val_loss": 68635.2890625} {"train_loss": -5.3449273109436035, "global_step": 23688, "epoch": 564} {"train_loss": -5.146773338317871, "global_step": 23689, "epoch": 564} {"train_loss": -5.28767204284668, "global_step": 23690, "epoch": 564} {"train_loss": -5.16203498840332, "global_step": 23691, "epoch": 564} {"train_loss": -5.476930141448975, "global_step": 23692, "epoch": 564} {"train_loss": -5.158452033996582, "global_step": 23693, "epoch": 564} {"train_loss": -5.506168365478516, "global_step": 23694, "epoch": 564} {"train_loss": -5.345785140991211, "global_step": 23695, "epoch": 564} {"train_loss": -5.201748847961426, "global_step": 23696, "epoch": 564} {"train_loss": -5.345465183258057, "global_step": 23697, "epoch": 564} {"train_loss": -5.184133529663086, "global_step": 23698, "epoch": 564} {"train_loss": -5.181964874267578, "global_step": 23699, "epoch": 564} {"train_loss": -5.28791618347168, "global_step": 23700, "epoch": 564} {"train_loss": -5.442197322845459, "global_step": 23701, "epoch": 564} {"train_loss": -5.436078071594238, "global_step": 23702, "epoch": 564} {"train_loss": -5.231744766235352, "global_step": 23703, "epoch": 564} {"train_loss": -5.2856245040893555, "global_step": 23704, "epoch": 564} {"train_loss": -5.23314094543457, "global_step": 23705, "epoch": 564} {"train_loss": -5.41898250579834, "global_step": 23706, "epoch": 564} {"train_loss": -5.498989105224609, "global_step": 23707, "epoch": 564} {"train_loss": -5.3571014404296875, "global_step": 23708, "epoch": 564} {"train_loss": -5.3716535568237305, "global_step": 23709, "epoch": 564} {"train_loss": -5.408470630645752, "global_step": 23710, "epoch": 564} {"train_loss": -5.403729438781738, "global_step": 23711, "epoch": 564} {"train_loss": -5.374893665313721, "global_step": 23712, "epoch": 564} {"train_loss": -5.450822830200195, "global_step": 23713, "epoch": 564} {"train_loss": -5.381284713745117, "global_step": 23714, "epoch": 564} {"train_loss": -5.199514389038086, "global_step": 23715, "epoch": 564} {"train_loss": -5.446415424346924, "global_step": 23716, "epoch": 564} {"train_loss": -5.413037300109863, "global_step": 23717, "epoch": 564} {"train_loss": -5.427709579467773, "global_step": 23718, "epoch": 564} {"train_loss": -5.406495094299316, "global_step": 23719, "epoch": 564} {"train_loss": -5.3178277015686035, "global_step": 23720, "epoch": 564} {"train_loss": -5.388733863830566, "global_step": 23721, "epoch": 564} {"train_loss": -5.3646087646484375, "global_step": 23722, "epoch": 564} {"train_loss": -5.417080879211426, "global_step": 23723, "epoch": 564} {"train_loss": -5.293368339538574, "global_step": 23724, "epoch": 564} {"train_loss": -5.373778343200684, "global_step": 23725, "epoch": 564} {"train_loss": -5.459772109985352, "global_step": 23726, "epoch": 564} {"train_loss": -5.40286922454834, "global_step": 23727, "epoch": 564} {"train_loss": -5.4468841552734375, "global_step": 23728, "epoch": 564} {"train_loss": -5.350964705149333, "global_step": 23729, "epoch": 564, "val_loss": 67995.4140625} {"train_loss": -5.376417636871338, "global_step": 23730, "epoch": 565} {"train_loss": -5.387986183166504, "global_step": 23731, "epoch": 565} {"train_loss": -5.354264736175537, "global_step": 23732, "epoch": 565} {"train_loss": -5.395242214202881, "global_step": 23733, "epoch": 565} {"train_loss": -5.414339542388916, "global_step": 23734, "epoch": 565} {"train_loss": -5.2910332679748535, "global_step": 23735, "epoch": 565} {"train_loss": -5.463006973266602, "global_step": 23736, "epoch": 565} {"train_loss": -5.3260884284973145, "global_step": 23737, "epoch": 565} {"train_loss": -5.340031623840332, "global_step": 23738, "epoch": 565} {"train_loss": -5.388821125030518, "global_step": 23739, "epoch": 565} {"train_loss": -5.39155387878418, "global_step": 23740, "epoch": 565} {"train_loss": -5.433064937591553, "global_step": 23741, "epoch": 565} {"train_loss": -5.497036933898926, "global_step": 23742, "epoch": 565} {"train_loss": -5.350638389587402, "global_step": 23743, "epoch": 565} {"train_loss": -5.405782222747803, "global_step": 23744, "epoch": 565} {"train_loss": -5.4654083251953125, "global_step": 23745, "epoch": 565} {"train_loss": -5.318102836608887, "global_step": 23746, "epoch": 565} {"train_loss": -5.416135787963867, "global_step": 23747, "epoch": 565} {"train_loss": -5.417451858520508, "global_step": 23748, "epoch": 565} {"train_loss": -5.280093669891357, "global_step": 23749, "epoch": 565} {"train_loss": -5.451594352722168, "global_step": 23750, "epoch": 565} {"train_loss": -5.518406867980957, "global_step": 23751, "epoch": 565} {"train_loss": -5.313906669616699, "global_step": 23752, "epoch": 565} {"train_loss": -5.188052654266357, "global_step": 23753, "epoch": 565} {"train_loss": -5.376919269561768, "global_step": 23754, "epoch": 565} {"train_loss": -5.5080437660217285, "global_step": 23755, "epoch": 565} {"train_loss": -5.350492477416992, "global_step": 23756, "epoch": 565} {"train_loss": -5.455996513366699, "global_step": 23757, "epoch": 565} {"train_loss": -5.303576469421387, "global_step": 23758, "epoch": 565} {"train_loss": -5.358384132385254, "global_step": 23759, "epoch": 565} {"train_loss": -5.47325325012207, "global_step": 23760, "epoch": 565} {"train_loss": -5.486568927764893, "global_step": 23761, "epoch": 565} {"train_loss": -5.346702575683594, "global_step": 23762, "epoch": 565} {"train_loss": -5.391160488128662, "global_step": 23763, "epoch": 565} {"train_loss": -5.39092493057251, "global_step": 23764, "epoch": 565} {"train_loss": -5.321684837341309, "global_step": 23765, "epoch": 565} {"train_loss": -5.340292930603027, "global_step": 23766, "epoch": 565} {"train_loss": -5.314002990722656, "global_step": 23767, "epoch": 565} {"train_loss": -5.364585876464844, "global_step": 23768, "epoch": 565} {"train_loss": -5.362782001495361, "global_step": 23769, "epoch": 565} {"train_loss": -5.3576202392578125, "global_step": 23770, "epoch": 565} {"train_loss": -5.379732881273542, "global_step": 23771, "epoch": 565, "val_loss": 68129.640625} {"train_loss": -5.2218217849731445, "global_step": 23772, "epoch": 566} {"train_loss": -5.432723045349121, "global_step": 23773, "epoch": 566} {"train_loss": -5.346076488494873, "global_step": 23774, "epoch": 566} {"train_loss": -5.393536567687988, "global_step": 23775, "epoch": 566} {"train_loss": -5.428191661834717, "global_step": 23776, "epoch": 566} {"train_loss": -5.452083587646484, "global_step": 23777, "epoch": 566} {"train_loss": -5.369961738586426, "global_step": 23778, "epoch": 566} {"train_loss": -5.350224494934082, "global_step": 23779, "epoch": 566} {"train_loss": -5.446125030517578, "global_step": 23780, "epoch": 566} {"train_loss": -5.470831871032715, "global_step": 23781, "epoch": 566} {"train_loss": -5.357969284057617, "global_step": 23782, "epoch": 566} {"train_loss": -5.4908857345581055, "global_step": 23783, "epoch": 566} {"train_loss": -5.435650825500488, "global_step": 23784, "epoch": 566} {"train_loss": -5.3899126052856445, "global_step": 23785, "epoch": 566} {"train_loss": -5.2881760597229, "global_step": 23786, "epoch": 566} {"train_loss": -5.338531017303467, "global_step": 23787, "epoch": 566} {"train_loss": -5.216264247894287, "global_step": 23788, "epoch": 566} {"train_loss": -5.54909610748291, "global_step": 23789, "epoch": 566} {"train_loss": -5.263326644897461, "global_step": 23790, "epoch": 566} {"train_loss": -5.249970436096191, "global_step": 23791, "epoch": 566} {"train_loss": -5.460794448852539, "global_step": 23792, "epoch": 566} {"train_loss": -5.27142333984375, "global_step": 23793, "epoch": 566} {"train_loss": -5.371947288513184, "global_step": 23794, "epoch": 566} {"train_loss": -5.350678443908691, "global_step": 23795, "epoch": 566} {"train_loss": -5.371776103973389, "global_step": 23796, "epoch": 566} {"train_loss": -5.421196460723877, "global_step": 23797, "epoch": 566} {"train_loss": -5.1982879638671875, "global_step": 23798, "epoch": 566} {"train_loss": -5.394049644470215, "global_step": 23799, "epoch": 566} {"train_loss": -5.465202331542969, "global_step": 23800, "epoch": 566} {"train_loss": -5.430388450622559, "global_step": 23801, "epoch": 566} {"train_loss": -5.418593406677246, "global_step": 23802, "epoch": 566} {"train_loss": -5.296900749206543, "global_step": 23803, "epoch": 566} {"train_loss": -5.385505199432373, "global_step": 23804, "epoch": 566} {"train_loss": -5.371243953704834, "global_step": 23805, "epoch": 566} {"train_loss": -5.522890090942383, "global_step": 23806, "epoch": 566} {"train_loss": -5.419435501098633, "global_step": 23807, "epoch": 566} {"train_loss": -5.291262149810791, "global_step": 23808, "epoch": 566} {"train_loss": -5.248788356781006, "global_step": 23809, "epoch": 566} {"train_loss": -5.41625452041626, "global_step": 23810, "epoch": 566} {"train_loss": -5.306939601898193, "global_step": 23811, "epoch": 566} {"train_loss": -5.269957542419434, "global_step": 23812, "epoch": 566} {"train_loss": -5.371448426019578, "global_step": 23813, "epoch": 566, "val_loss": 68677.734375} {"train_loss": -5.448051452636719, "global_step": 23814, "epoch": 567} {"train_loss": -5.271324157714844, "global_step": 23815, "epoch": 567} {"train_loss": -5.400778293609619, "global_step": 23816, "epoch": 567} {"train_loss": -5.470708847045898, "global_step": 23817, "epoch": 567} {"train_loss": -5.266604900360107, "global_step": 23818, "epoch": 567} {"train_loss": -5.383846282958984, "global_step": 23819, "epoch": 567} {"train_loss": -5.311840534210205, "global_step": 23820, "epoch": 567} {"train_loss": -5.431539058685303, "global_step": 23821, "epoch": 567} {"train_loss": -5.325994968414307, "global_step": 23822, "epoch": 567} {"train_loss": -5.369002819061279, "global_step": 23823, "epoch": 567} {"train_loss": -5.3991241455078125, "global_step": 23824, "epoch": 567} {"train_loss": -5.354948043823242, "global_step": 23825, "epoch": 567} {"train_loss": -5.389824867248535, "global_step": 23826, "epoch": 567} {"train_loss": -5.278631687164307, "global_step": 23827, "epoch": 567} {"train_loss": -5.446113586425781, "global_step": 23828, "epoch": 567} {"train_loss": -5.541380405426025, "global_step": 23829, "epoch": 567} {"train_loss": -5.389022350311279, "global_step": 23830, "epoch": 567} {"train_loss": -5.439022064208984, "global_step": 23831, "epoch": 567} {"train_loss": -5.433205604553223, "global_step": 23832, "epoch": 567} {"train_loss": -5.333232879638672, "global_step": 23833, "epoch": 567} {"train_loss": -5.375017166137695, "global_step": 23834, "epoch": 567} {"train_loss": -5.2464799880981445, "global_step": 23835, "epoch": 567} {"train_loss": -5.330297470092773, "global_step": 23836, "epoch": 567} {"train_loss": -5.465609550476074, "global_step": 23837, "epoch": 567} {"train_loss": -5.301828384399414, "global_step": 23838, "epoch": 567} {"train_loss": -5.289061546325684, "global_step": 23839, "epoch": 567} {"train_loss": -5.21607780456543, "global_step": 23840, "epoch": 567} {"train_loss": -5.297553539276123, "global_step": 23841, "epoch": 567} {"train_loss": -5.312329292297363, "global_step": 23842, "epoch": 567} {"train_loss": -5.476240634918213, "global_step": 23843, "epoch": 567} {"train_loss": -5.400546073913574, "global_step": 23844, "epoch": 567} {"train_loss": -5.521304130554199, "global_step": 23845, "epoch": 567} {"train_loss": -5.303691864013672, "global_step": 23846, "epoch": 567} {"train_loss": -5.479315757751465, "global_step": 23847, "epoch": 567} {"train_loss": -5.207770824432373, "global_step": 23848, "epoch": 567} {"train_loss": -5.489745140075684, "global_step": 23849, "epoch": 567} {"train_loss": -5.329281806945801, "global_step": 23850, "epoch": 567} {"train_loss": -5.518815040588379, "global_step": 23851, "epoch": 567} {"train_loss": -5.169288635253906, "global_step": 23852, "epoch": 567} {"train_loss": -5.404054641723633, "global_step": 23853, "epoch": 567} {"train_loss": -5.324986934661865, "global_step": 23854, "epoch": 567} {"train_loss": -5.368369181950887, "global_step": 23855, "epoch": 567, "val_loss": 68459.40625} {"train_loss": -5.144743919372559, "global_step": 23856, "epoch": 568} {"train_loss": -5.19216251373291, "global_step": 23857, "epoch": 568} {"train_loss": -5.403995513916016, "global_step": 23858, "epoch": 568} {"train_loss": -5.381074905395508, "global_step": 23859, "epoch": 568} {"train_loss": -5.392948150634766, "global_step": 23860, "epoch": 568} {"train_loss": -5.380574703216553, "global_step": 23861, "epoch": 568} {"train_loss": -5.26019811630249, "global_step": 23862, "epoch": 568} {"train_loss": -5.423007965087891, "global_step": 23863, "epoch": 568} {"train_loss": -5.4499077796936035, "global_step": 23864, "epoch": 568} {"train_loss": -5.345688343048096, "global_step": 23865, "epoch": 568} {"train_loss": -5.430154323577881, "global_step": 23866, "epoch": 568} {"train_loss": -5.476261138916016, "global_step": 23867, "epoch": 568} {"train_loss": -5.403386116027832, "global_step": 23868, "epoch": 568} {"train_loss": -5.441973686218262, "global_step": 23869, "epoch": 568} {"train_loss": -5.477875709533691, "global_step": 23870, "epoch": 568} {"train_loss": -5.503435134887695, "global_step": 23871, "epoch": 568} {"train_loss": -5.420356273651123, "global_step": 23872, "epoch": 568} {"train_loss": -5.425353050231934, "global_step": 23873, "epoch": 568} {"train_loss": -5.453246593475342, "global_step": 23874, "epoch": 568} {"train_loss": -5.477374076843262, "global_step": 23875, "epoch": 568} {"train_loss": -5.354857444763184, "global_step": 23876, "epoch": 568} {"train_loss": -5.421682357788086, "global_step": 23877, "epoch": 568} {"train_loss": -5.446053504943848, "global_step": 23878, "epoch": 568} {"train_loss": -5.473227500915527, "global_step": 23879, "epoch": 568} {"train_loss": -5.373659610748291, "global_step": 23880, "epoch": 568} {"train_loss": -5.420632839202881, "global_step": 23881, "epoch": 568} {"train_loss": -5.409391403198242, "global_step": 23882, "epoch": 568} {"train_loss": -5.450239181518555, "global_step": 23883, "epoch": 568} {"train_loss": -5.3627400398254395, "global_step": 23884, "epoch": 568} {"train_loss": -5.456786632537842, "global_step": 23885, "epoch": 568} {"train_loss": -5.354983806610107, "global_step": 23886, "epoch": 568} {"train_loss": -5.295558452606201, "global_step": 23887, "epoch": 568} {"train_loss": -5.31243896484375, "global_step": 23888, "epoch": 568} {"train_loss": -5.47499418258667, "global_step": 23889, "epoch": 568} {"train_loss": -5.403341770172119, "global_step": 23890, "epoch": 568} {"train_loss": -5.411582946777344, "global_step": 23891, "epoch": 568} {"train_loss": -5.482442855834961, "global_step": 23892, "epoch": 568} {"train_loss": -5.4446306228637695, "global_step": 23893, "epoch": 568} {"train_loss": -5.289738655090332, "global_step": 23894, "epoch": 568} {"train_loss": -5.334636688232422, "global_step": 23895, "epoch": 568} {"train_loss": -5.416877746582031, "global_step": 23896, "epoch": 568} {"train_loss": -5.398284264973232, "global_step": 23897, "epoch": 568, "val_loss": 67872.4765625} {"train_loss": -5.372561454772949, "global_step": 23898, "epoch": 569} {"train_loss": -5.4582600593566895, "global_step": 23899, "epoch": 569} {"train_loss": -5.368124008178711, "global_step": 23900, "epoch": 569} {"train_loss": -5.429529190063477, "global_step": 23901, "epoch": 569} {"train_loss": -5.324701309204102, "global_step": 23902, "epoch": 569} {"train_loss": -5.417305946350098, "global_step": 23903, "epoch": 569} {"train_loss": -5.407473564147949, "global_step": 23904, "epoch": 569} {"train_loss": -5.280622482299805, "global_step": 23905, "epoch": 569} {"train_loss": -5.372348308563232, "global_step": 23906, "epoch": 569} {"train_loss": -5.477629661560059, "global_step": 23907, "epoch": 569} {"train_loss": -5.2617082595825195, "global_step": 23908, "epoch": 569} {"train_loss": -5.560907363891602, "global_step": 23909, "epoch": 569} {"train_loss": -5.492267608642578, "global_step": 23910, "epoch": 569} {"train_loss": -5.252211570739746, "global_step": 23911, "epoch": 569} {"train_loss": -5.290401458740234, "global_step": 23912, "epoch": 569} {"train_loss": -5.391287326812744, "global_step": 23913, "epoch": 569} {"train_loss": -5.345310688018799, "global_step": 23914, "epoch": 569} {"train_loss": -5.5377678871154785, "global_step": 23915, "epoch": 569} {"train_loss": -5.303045749664307, "global_step": 23916, "epoch": 569} {"train_loss": -5.391410827636719, "global_step": 23917, "epoch": 569} {"train_loss": -5.293704509735107, "global_step": 23918, "epoch": 569} {"train_loss": -5.41334342956543, "global_step": 23919, "epoch": 569} {"train_loss": -5.477779865264893, "global_step": 23920, "epoch": 569} {"train_loss": -5.416633605957031, "global_step": 23921, "epoch": 569} {"train_loss": -5.442605018615723, "global_step": 23922, "epoch": 569} {"train_loss": -5.406719207763672, "global_step": 23923, "epoch": 569} {"train_loss": -5.4947404861450195, "global_step": 23924, "epoch": 569} {"train_loss": -5.393352508544922, "global_step": 23925, "epoch": 569} {"train_loss": -5.390669345855713, "global_step": 23926, "epoch": 569} {"train_loss": -5.46024751663208, "global_step": 23927, "epoch": 569} {"train_loss": -5.501225471496582, "global_step": 23928, "epoch": 569} {"train_loss": -5.328885078430176, "global_step": 23929, "epoch": 569} {"train_loss": -5.373287200927734, "global_step": 23930, "epoch": 569} {"train_loss": -5.314348220825195, "global_step": 23931, "epoch": 569} {"train_loss": -5.334949493408203, "global_step": 23932, "epoch": 569} {"train_loss": -5.348272323608398, "global_step": 23933, "epoch": 569} {"train_loss": -5.513927936553955, "global_step": 23934, "epoch": 569} {"train_loss": -5.4095587730407715, "global_step": 23935, "epoch": 569} {"train_loss": -5.417680740356445, "global_step": 23936, "epoch": 569} {"train_loss": -5.414361953735352, "global_step": 23937, "epoch": 569} {"train_loss": -5.37710428237915, "global_step": 23938, "epoch": 569} {"train_loss": -5.394929874510992, "global_step": 23939, "epoch": 569, "val_loss": 68117.4921875} {"train_loss": -5.421907901763916, "global_step": 23940, "epoch": 570} {"train_loss": -5.3413190841674805, "global_step": 23941, "epoch": 570} {"train_loss": -5.569694995880127, "global_step": 23942, "epoch": 570} {"train_loss": -5.51759672164917, "global_step": 23943, "epoch": 570} {"train_loss": -5.431690216064453, "global_step": 23944, "epoch": 570} {"train_loss": -5.310092449188232, "global_step": 23945, "epoch": 570} {"train_loss": -5.357516288757324, "global_step": 23946, "epoch": 570} {"train_loss": -5.44010066986084, "global_step": 23947, "epoch": 570} {"train_loss": -5.391292572021484, "global_step": 23948, "epoch": 570} {"train_loss": -5.406104564666748, "global_step": 23949, "epoch": 570} {"train_loss": -5.45119571685791, "global_step": 23950, "epoch": 570} {"train_loss": -5.435821533203125, "global_step": 23951, "epoch": 570} {"train_loss": -5.4023942947387695, "global_step": 23952, "epoch": 570} {"train_loss": -5.448537349700928, "global_step": 23953, "epoch": 570} {"train_loss": -5.460935592651367, "global_step": 23954, "epoch": 570} {"train_loss": -5.531838417053223, "global_step": 23955, "epoch": 570} {"train_loss": -5.401759624481201, "global_step": 23956, "epoch": 570} {"train_loss": -5.377102851867676, "global_step": 23957, "epoch": 570} {"train_loss": -5.336817264556885, "global_step": 23958, "epoch": 570} {"train_loss": -5.42569637298584, "global_step": 23959, "epoch": 570} {"train_loss": -5.429488182067871, "global_step": 23960, "epoch": 570} {"train_loss": -5.464169502258301, "global_step": 23961, "epoch": 570} {"train_loss": -5.391452789306641, "global_step": 23962, "epoch": 570} {"train_loss": -5.193019866943359, "global_step": 23963, "epoch": 570} {"train_loss": -5.457376480102539, "global_step": 23964, "epoch": 570} {"train_loss": -5.373466968536377, "global_step": 23965, "epoch": 570} {"train_loss": -5.316556930541992, "global_step": 23966, "epoch": 570} {"train_loss": -5.380292892456055, "global_step": 23967, "epoch": 570} {"train_loss": -5.36667537689209, "global_step": 23968, "epoch": 570} {"train_loss": -5.346590518951416, "global_step": 23969, "epoch": 570} {"train_loss": -5.301724433898926, "global_step": 23970, "epoch": 570} {"train_loss": -5.30328369140625, "global_step": 23971, "epoch": 570} {"train_loss": -5.268362522125244, "global_step": 23972, "epoch": 570} {"train_loss": -5.397976398468018, "global_step": 23973, "epoch": 570} {"train_loss": -5.348204612731934, "global_step": 23974, "epoch": 570} {"train_loss": -5.3334879875183105, "global_step": 23975, "epoch": 570} {"train_loss": -5.4030351638793945, "global_step": 23976, "epoch": 570} {"train_loss": -5.298190593719482, "global_step": 23977, "epoch": 570} {"train_loss": -5.299247741699219, "global_step": 23978, "epoch": 570} {"train_loss": -5.404846668243408, "global_step": 23979, "epoch": 570} {"train_loss": -5.3653435707092285, "global_step": 23980, "epoch": 570} {"train_loss": -5.389573937370663, "global_step": 23981, "epoch": 570, "val_loss": 67992.5859375} {"train_loss": -5.375277519226074, "global_step": 23982, "epoch": 571} {"train_loss": -5.396134853363037, "global_step": 23983, "epoch": 571} {"train_loss": -5.339095115661621, "global_step": 23984, "epoch": 571} {"train_loss": -5.359429359436035, "global_step": 23985, "epoch": 571} {"train_loss": -5.496642112731934, "global_step": 23986, "epoch": 571} {"train_loss": -5.272257328033447, "global_step": 23987, "epoch": 571} {"train_loss": -5.42056131362915, "global_step": 23988, "epoch": 571} {"train_loss": -5.326974868774414, "global_step": 23989, "epoch": 571} {"train_loss": -5.389481544494629, "global_step": 23990, "epoch": 571} {"train_loss": -5.3975725173950195, "global_step": 23991, "epoch": 571} {"train_loss": -5.3322224617004395, "global_step": 23992, "epoch": 571} {"train_loss": -5.297070503234863, "global_step": 23993, "epoch": 571} {"train_loss": -5.2754669189453125, "global_step": 23994, "epoch": 571} {"train_loss": -5.483168601989746, "global_step": 23995, "epoch": 571} {"train_loss": -5.442984580993652, "global_step": 23996, "epoch": 571} {"train_loss": -5.367891311645508, "global_step": 23997, "epoch": 571} {"train_loss": -5.299256324768066, "global_step": 23998, "epoch": 571} {"train_loss": -5.457835674285889, "global_step": 23999, "epoch": 571} {"train_loss": -5.460418701171875, "global_step": 24000, "epoch": 571} {"train_loss": -5.403939723968506, "global_step": 24001, "epoch": 571} {"train_loss": -5.421536445617676, "global_step": 24002, "epoch": 571} {"train_loss": -5.473820686340332, "global_step": 24003, "epoch": 571} {"train_loss": -5.394311904907227, "global_step": 24004, "epoch": 571} {"train_loss": -5.460481643676758, "global_step": 24005, "epoch": 571} {"train_loss": -5.371613025665283, "global_step": 24006, "epoch": 571} {"train_loss": -5.4884185791015625, "global_step": 24007, "epoch": 571} {"train_loss": -5.369152069091797, "global_step": 24008, "epoch": 571} {"train_loss": -5.435031890869141, "global_step": 24009, "epoch": 571} {"train_loss": -5.354188442230225, "global_step": 24010, "epoch": 571} {"train_loss": -5.469925880432129, "global_step": 24011, "epoch": 571} {"train_loss": -5.462501525878906, "global_step": 24012, "epoch": 571} {"train_loss": -5.369217395782471, "global_step": 24013, "epoch": 571} {"train_loss": -5.310756206512451, "global_step": 24014, "epoch": 571} {"train_loss": -5.480214595794678, "global_step": 24015, "epoch": 571} {"train_loss": -5.379336357116699, "global_step": 24016, "epoch": 571} {"train_loss": -5.465424537658691, "global_step": 24017, "epoch": 571} {"train_loss": -5.248019218444824, "global_step": 24018, "epoch": 571} {"train_loss": -5.463321685791016, "global_step": 24019, "epoch": 571} {"train_loss": -5.474027156829834, "global_step": 24020, "epoch": 571} {"train_loss": -5.414435386657715, "global_step": 24021, "epoch": 571} {"train_loss": -5.385878562927246, "global_step": 24022, "epoch": 571} {"train_loss": -5.397062119983492, "global_step": 24023, "epoch": 571, "val_loss": 68331.375} {"train_loss": -5.303215503692627, "global_step": 24024, "epoch": 572} {"train_loss": -5.268194675445557, "global_step": 24025, "epoch": 572} {"train_loss": -5.444437026977539, "global_step": 24026, "epoch": 572} {"train_loss": -5.3188276290893555, "global_step": 24027, "epoch": 572} {"train_loss": -5.394754409790039, "global_step": 24028, "epoch": 572} {"train_loss": -5.31949520111084, "global_step": 24029, "epoch": 572} {"train_loss": -5.470728874206543, "global_step": 24030, "epoch": 572} {"train_loss": -5.352076053619385, "global_step": 24031, "epoch": 572} {"train_loss": -5.432894229888916, "global_step": 24032, "epoch": 572} {"train_loss": -5.42047119140625, "global_step": 24033, "epoch": 572} {"train_loss": -5.454732894897461, "global_step": 24034, "epoch": 572} {"train_loss": -5.4125261306762695, "global_step": 24035, "epoch": 572} {"train_loss": -5.400552749633789, "global_step": 24036, "epoch": 572} {"train_loss": -5.4250922203063965, "global_step": 24037, "epoch": 572} {"train_loss": -5.3337297439575195, "global_step": 24038, "epoch": 572} {"train_loss": -5.420685291290283, "global_step": 24039, "epoch": 572} {"train_loss": -5.310737133026123, "global_step": 24040, "epoch": 572} {"train_loss": -5.304255485534668, "global_step": 24041, "epoch": 572} {"train_loss": -5.332111835479736, "global_step": 24042, "epoch": 572} {"train_loss": -5.512396812438965, "global_step": 24043, "epoch": 572} {"train_loss": -5.361597061157227, "global_step": 24044, "epoch": 572} {"train_loss": -5.377988338470459, "global_step": 24045, "epoch": 572} {"train_loss": -5.342275619506836, "global_step": 24046, "epoch": 572} {"train_loss": -5.477487564086914, "global_step": 24047, "epoch": 572} {"train_loss": -5.462281227111816, "global_step": 24048, "epoch": 572} {"train_loss": -5.463902473449707, "global_step": 24049, "epoch": 572} {"train_loss": -5.432236671447754, "global_step": 24050, "epoch": 572} {"train_loss": -5.277917861938477, "global_step": 24051, "epoch": 572} {"train_loss": -5.443966388702393, "global_step": 24052, "epoch": 572} {"train_loss": -5.399341583251953, "global_step": 24053, "epoch": 572} {"train_loss": -5.389621734619141, "global_step": 24054, "epoch": 572} {"train_loss": -5.355563640594482, "global_step": 24055, "epoch": 572} {"train_loss": -5.3734002113342285, "global_step": 24056, "epoch": 572} {"train_loss": -5.32082462310791, "global_step": 24057, "epoch": 572} {"train_loss": -5.490765571594238, "global_step": 24058, "epoch": 572} {"train_loss": -5.373702526092529, "global_step": 24059, "epoch": 572} {"train_loss": -5.330901145935059, "global_step": 24060, "epoch": 572} {"train_loss": -5.408534049987793, "global_step": 24061, "epoch": 572} {"train_loss": -5.418349266052246, "global_step": 24062, "epoch": 572} {"train_loss": -5.4888458251953125, "global_step": 24063, "epoch": 572} {"train_loss": -5.420619010925293, "global_step": 24064, "epoch": 572} {"train_loss": -5.3885815143585205, "global_step": 24065, "epoch": 572, "val_loss": 67743.0078125} {"train_loss": -5.320876121520996, "global_step": 24066, "epoch": 573} {"train_loss": -5.2913618087768555, "global_step": 24067, "epoch": 573} {"train_loss": -5.311940670013428, "global_step": 24068, "epoch": 573} {"train_loss": -5.4406232833862305, "global_step": 24069, "epoch": 573} {"train_loss": -5.246461391448975, "global_step": 24070, "epoch": 573} {"train_loss": -5.3531951904296875, "global_step": 24071, "epoch": 573} {"train_loss": -5.402912139892578, "global_step": 24072, "epoch": 573} {"train_loss": -5.349407196044922, "global_step": 24073, "epoch": 573} {"train_loss": -5.500189781188965, "global_step": 24074, "epoch": 573} {"train_loss": -5.329336166381836, "global_step": 24075, "epoch": 573} {"train_loss": -5.282125949859619, "global_step": 24076, "epoch": 573} {"train_loss": -5.462408065795898, "global_step": 24077, "epoch": 573} {"train_loss": -5.339601516723633, "global_step": 24078, "epoch": 573} {"train_loss": -5.4306817054748535, "global_step": 24079, "epoch": 573} {"train_loss": -5.417140960693359, "global_step": 24080, "epoch": 573} {"train_loss": -5.307744979858398, "global_step": 24081, "epoch": 573} {"train_loss": -5.362301826477051, "global_step": 24082, "epoch": 573} {"train_loss": -5.33631706237793, "global_step": 24083, "epoch": 573} {"train_loss": -5.162629127502441, "global_step": 24084, "epoch": 573} {"train_loss": -5.361173629760742, "global_step": 24085, "epoch": 573} {"train_loss": -5.284206867218018, "global_step": 24086, "epoch": 573} {"train_loss": -5.380892753601074, "global_step": 24087, "epoch": 573} {"train_loss": -5.205461502075195, "global_step": 24088, "epoch": 573} {"train_loss": -5.267610549926758, "global_step": 24089, "epoch": 573} {"train_loss": -5.196131229400635, "global_step": 24090, "epoch": 573} {"train_loss": -5.3596343994140625, "global_step": 24091, "epoch": 573} {"train_loss": -5.357938766479492, "global_step": 24092, "epoch": 573} {"train_loss": -5.426758766174316, "global_step": 24093, "epoch": 573} {"train_loss": -5.551804065704346, "global_step": 24094, "epoch": 573} {"train_loss": -5.368844509124756, "global_step": 24095, "epoch": 573} {"train_loss": -5.418886184692383, "global_step": 24096, "epoch": 573} {"train_loss": -5.428466320037842, "global_step": 24097, "epoch": 573} {"train_loss": -5.437646389007568, "global_step": 24098, "epoch": 573} {"train_loss": -5.535141944885254, "global_step": 24099, "epoch": 573} {"train_loss": -5.270887851715088, "global_step": 24100, "epoch": 573} {"train_loss": -5.376271724700928, "global_step": 24101, "epoch": 573} {"train_loss": -5.330718994140625, "global_step": 24102, "epoch": 573} {"train_loss": -5.3503875732421875, "global_step": 24103, "epoch": 573} {"train_loss": -5.342752933502197, "global_step": 24104, "epoch": 573} {"train_loss": -5.500707626342773, "global_step": 24105, "epoch": 573} {"train_loss": -5.309112548828125, "global_step": 24106, "epoch": 573} {"train_loss": -5.360000871476673, "global_step": 24107, "epoch": 573, "val_loss": 67705.265625} {"train_loss": -5.515419006347656, "global_step": 24108, "epoch": 574} {"train_loss": -5.438777923583984, "global_step": 24109, "epoch": 574} {"train_loss": -5.439574718475342, "global_step": 24110, "epoch": 574} {"train_loss": -5.377814292907715, "global_step": 24111, "epoch": 574} {"train_loss": -5.408953666687012, "global_step": 24112, "epoch": 574} {"train_loss": -5.276739120483398, "global_step": 24113, "epoch": 574} {"train_loss": -5.4063191413879395, "global_step": 24114, "epoch": 574} {"train_loss": -5.461056709289551, "global_step": 24115, "epoch": 574} {"train_loss": -5.513022422790527, "global_step": 24116, "epoch": 574} {"train_loss": -5.4351019859313965, "global_step": 24117, "epoch": 574} {"train_loss": -5.40889835357666, "global_step": 24118, "epoch": 574} {"train_loss": -5.384956359863281, "global_step": 24119, "epoch": 574} {"train_loss": -5.285369873046875, "global_step": 24120, "epoch": 574} {"train_loss": -5.474147796630859, "global_step": 24121, "epoch": 574} {"train_loss": -5.335615634918213, "global_step": 24122, "epoch": 574} {"train_loss": -5.389248847961426, "global_step": 24123, "epoch": 574} {"train_loss": -5.3675150871276855, "global_step": 24124, "epoch": 574} {"train_loss": -5.318233013153076, "global_step": 24125, "epoch": 574} {"train_loss": -5.4168291091918945, "global_step": 24126, "epoch": 574} {"train_loss": -5.3870038986206055, "global_step": 24127, "epoch": 574} {"train_loss": -5.46092414855957, "global_step": 24128, "epoch": 574} {"train_loss": -5.408422470092773, "global_step": 24129, "epoch": 574} {"train_loss": -5.345183372497559, "global_step": 24130, "epoch": 574} {"train_loss": -5.2524189949035645, "global_step": 24131, "epoch": 574} {"train_loss": -5.437070846557617, "global_step": 24132, "epoch": 574} {"train_loss": -5.3358540534973145, "global_step": 24133, "epoch": 574} {"train_loss": -5.429262638092041, "global_step": 24134, "epoch": 574} {"train_loss": -5.389217853546143, "global_step": 24135, "epoch": 574} {"train_loss": -5.426314353942871, "global_step": 24136, "epoch": 574} {"train_loss": -5.3065690994262695, "global_step": 24137, "epoch": 574} {"train_loss": -5.349700927734375, "global_step": 24138, "epoch": 574} {"train_loss": -5.429385185241699, "global_step": 24139, "epoch": 574} {"train_loss": -5.352544784545898, "global_step": 24140, "epoch": 574} {"train_loss": -5.324807643890381, "global_step": 24141, "epoch": 574} {"train_loss": -5.367735385894775, "global_step": 24142, "epoch": 574} {"train_loss": -5.5149078369140625, "global_step": 24143, "epoch": 574} {"train_loss": -5.39511775970459, "global_step": 24144, "epoch": 574} {"train_loss": -5.143174648284912, "global_step": 24145, "epoch": 574} {"train_loss": -5.364590644836426, "global_step": 24146, "epoch": 574} {"train_loss": -5.411218643188477, "global_step": 24147, "epoch": 574} {"train_loss": -5.301543235778809, "global_step": 24148, "epoch": 574} {"train_loss": -5.386814980279832, "global_step": 24149, "epoch": 574, "val_loss": 67823.4140625} {"train_loss": -5.454958915710449, "global_step": 24150, "epoch": 575} {"train_loss": -5.383843421936035, "global_step": 24151, "epoch": 575} {"train_loss": -5.415372848510742, "global_step": 24152, "epoch": 575} {"train_loss": -5.333191871643066, "global_step": 24153, "epoch": 575} {"train_loss": -5.301937103271484, "global_step": 24154, "epoch": 575} {"train_loss": -5.3227057456970215, "global_step": 24155, "epoch": 575} {"train_loss": -5.488346576690674, "global_step": 24156, "epoch": 575} {"train_loss": -5.273746490478516, "global_step": 24157, "epoch": 575} {"train_loss": -5.301855564117432, "global_step": 24158, "epoch": 575} {"train_loss": -5.532243728637695, "global_step": 24159, "epoch": 575} {"train_loss": -5.379913330078125, "global_step": 24160, "epoch": 575} {"train_loss": -5.445217132568359, "global_step": 24161, "epoch": 575} {"train_loss": -5.320919513702393, "global_step": 24162, "epoch": 575} {"train_loss": -5.412500381469727, "global_step": 24163, "epoch": 575} {"train_loss": -5.286137580871582, "global_step": 24164, "epoch": 575} {"train_loss": -5.361260414123535, "global_step": 24165, "epoch": 575} {"train_loss": -5.364492416381836, "global_step": 24166, "epoch": 575} {"train_loss": -5.476466178894043, "global_step": 24167, "epoch": 575} {"train_loss": -5.258449554443359, "global_step": 24168, "epoch": 575} {"train_loss": -5.382513046264648, "global_step": 24169, "epoch": 575} {"train_loss": -5.324130058288574, "global_step": 24170, "epoch": 575} {"train_loss": -5.3775954246521, "global_step": 24171, "epoch": 575} {"train_loss": -5.309277534484863, "global_step": 24172, "epoch": 575} {"train_loss": -5.4161882400512695, "global_step": 24173, "epoch": 575} {"train_loss": -5.482391357421875, "global_step": 24174, "epoch": 575} {"train_loss": -5.452188491821289, "global_step": 24175, "epoch": 575} {"train_loss": -5.436494827270508, "global_step": 24176, "epoch": 575} {"train_loss": -5.304961204528809, "global_step": 24177, "epoch": 575} {"train_loss": -5.255799293518066, "global_step": 24178, "epoch": 575} {"train_loss": -5.415872573852539, "global_step": 24179, "epoch": 575} {"train_loss": -5.4774651527404785, "global_step": 24180, "epoch": 575} {"train_loss": -5.308652877807617, "global_step": 24181, "epoch": 575} {"train_loss": -5.442082405090332, "global_step": 24182, "epoch": 575} {"train_loss": -5.379514217376709, "global_step": 24183, "epoch": 575} {"train_loss": -5.3199462890625, "global_step": 24184, "epoch": 575} {"train_loss": -5.450341701507568, "global_step": 24185, "epoch": 575} {"train_loss": -5.398198127746582, "global_step": 24186, "epoch": 575} {"train_loss": -5.341549873352051, "global_step": 24187, "epoch": 575} {"train_loss": -5.388189315795898, "global_step": 24188, "epoch": 575} {"train_loss": -5.2211432456970215, "global_step": 24189, "epoch": 575} {"train_loss": -5.272207260131836, "global_step": 24190, "epoch": 575} {"train_loss": -5.3708886078425815, "global_step": 24191, "epoch": 575, "val_loss": 68051.2421875} {"train_loss": -5.310859203338623, "global_step": 24192, "epoch": 576} {"train_loss": -5.353642463684082, "global_step": 24193, "epoch": 576} {"train_loss": -5.247725486755371, "global_step": 24194, "epoch": 576} {"train_loss": -5.416326522827148, "global_step": 24195, "epoch": 576} {"train_loss": -5.32305908203125, "global_step": 24196, "epoch": 576} {"train_loss": -5.3465094566345215, "global_step": 24197, "epoch": 576} {"train_loss": -5.3235859870910645, "global_step": 24198, "epoch": 576} {"train_loss": -5.20322322845459, "global_step": 24199, "epoch": 576} {"train_loss": -5.4063215255737305, "global_step": 24200, "epoch": 576} {"train_loss": -5.166714191436768, "global_step": 24201, "epoch": 576} {"train_loss": -5.31146240234375, "global_step": 24202, "epoch": 576} {"train_loss": -5.384518623352051, "global_step": 24203, "epoch": 576} {"train_loss": -5.39687442779541, "global_step": 24204, "epoch": 576} {"train_loss": -5.4724273681640625, "global_step": 24205, "epoch": 576} {"train_loss": -5.365111351013184, "global_step": 24206, "epoch": 576} {"train_loss": -5.357181549072266, "global_step": 24207, "epoch": 576} {"train_loss": -5.35965633392334, "global_step": 24208, "epoch": 576} {"train_loss": -5.443251609802246, "global_step": 24209, "epoch": 576} {"train_loss": -5.379065036773682, "global_step": 24210, "epoch": 576} {"train_loss": -5.507927894592285, "global_step": 24211, "epoch": 576} {"train_loss": -5.443556308746338, "global_step": 24212, "epoch": 576} {"train_loss": -5.328765869140625, "global_step": 24213, "epoch": 576} {"train_loss": -5.409746170043945, "global_step": 24214, "epoch": 576} {"train_loss": -5.4742431640625, "global_step": 24215, "epoch": 576} {"train_loss": -5.27358341217041, "global_step": 24216, "epoch": 576} {"train_loss": -5.366452693939209, "global_step": 24217, "epoch": 576} {"train_loss": -5.3272905349731445, "global_step": 24218, "epoch": 576} {"train_loss": -5.423439025878906, "global_step": 24219, "epoch": 576} {"train_loss": -5.42770528793335, "global_step": 24220, "epoch": 576} {"train_loss": -5.397131443023682, "global_step": 24221, "epoch": 576} {"train_loss": -5.2447028160095215, "global_step": 24222, "epoch": 576} {"train_loss": -5.403246879577637, "global_step": 24223, "epoch": 576} {"train_loss": -5.404776573181152, "global_step": 24224, "epoch": 576} {"train_loss": -5.198786735534668, "global_step": 24225, "epoch": 576} {"train_loss": -5.30227518081665, "global_step": 24226, "epoch": 576} {"train_loss": -5.3608784675598145, "global_step": 24227, "epoch": 576} {"train_loss": -5.194779396057129, "global_step": 24228, "epoch": 576} {"train_loss": -5.371115207672119, "global_step": 24229, "epoch": 576} {"train_loss": -5.406207084655762, "global_step": 24230, "epoch": 576} {"train_loss": -5.431116104125977, "global_step": 24231, "epoch": 576} {"train_loss": -5.432713508605957, "global_step": 24232, "epoch": 576} {"train_loss": -5.357986427488781, "global_step": 24233, "epoch": 576, "val_loss": 67970.703125} {"train_loss": -5.384462356567383, "global_step": 24234, "epoch": 577} {"train_loss": -5.3742828369140625, "global_step": 24235, "epoch": 577} {"train_loss": -5.461711883544922, "global_step": 24236, "epoch": 577} {"train_loss": -5.379667282104492, "global_step": 24237, "epoch": 577} {"train_loss": -5.3184814453125, "global_step": 24238, "epoch": 577} {"train_loss": -5.516401767730713, "global_step": 24239, "epoch": 577} {"train_loss": -5.382172584533691, "global_step": 24240, "epoch": 577} {"train_loss": -5.4275898933410645, "global_step": 24241, "epoch": 577} {"train_loss": -5.381120204925537, "global_step": 24242, "epoch": 577} {"train_loss": -5.351593017578125, "global_step": 24243, "epoch": 577} {"train_loss": -5.458345890045166, "global_step": 24244, "epoch": 577} {"train_loss": -5.431520462036133, "global_step": 24245, "epoch": 577} {"train_loss": -5.309170722961426, "global_step": 24246, "epoch": 577} {"train_loss": -5.445959091186523, "global_step": 24247, "epoch": 577} {"train_loss": -5.441749572753906, "global_step": 24248, "epoch": 577} {"train_loss": -5.4304585456848145, "global_step": 24249, "epoch": 577} {"train_loss": -5.366377353668213, "global_step": 24250, "epoch": 577} {"train_loss": -5.511421203613281, "global_step": 24251, "epoch": 577} {"train_loss": -5.479903221130371, "global_step": 24252, "epoch": 577} {"train_loss": -5.415399551391602, "global_step": 24253, "epoch": 577} {"train_loss": -5.352016448974609, "global_step": 24254, "epoch": 577} {"train_loss": -5.38640022277832, "global_step": 24255, "epoch": 577} {"train_loss": -5.440436363220215, "global_step": 24256, "epoch": 577} {"train_loss": -5.3491411209106445, "global_step": 24257, "epoch": 577} {"train_loss": -5.27485466003418, "global_step": 24258, "epoch": 577} {"train_loss": -5.394559860229492, "global_step": 24259, "epoch": 577} {"train_loss": -5.349817276000977, "global_step": 24260, "epoch": 577} {"train_loss": -5.427655220031738, "global_step": 24261, "epoch": 577} {"train_loss": -5.337096214294434, "global_step": 24262, "epoch": 577} {"train_loss": -5.410506248474121, "global_step": 24263, "epoch": 577} {"train_loss": -5.323404312133789, "global_step": 24264, "epoch": 577} {"train_loss": -5.364304065704346, "global_step": 24265, "epoch": 577} {"train_loss": -5.355482578277588, "global_step": 24266, "epoch": 577} {"train_loss": -5.411478042602539, "global_step": 24267, "epoch": 577} {"train_loss": -5.290895938873291, "global_step": 24268, "epoch": 577} {"train_loss": -5.436305522918701, "global_step": 24269, "epoch": 577} {"train_loss": -5.233072757720947, "global_step": 24270, "epoch": 577} {"train_loss": -5.289758205413818, "global_step": 24271, "epoch": 577} {"train_loss": -5.332729339599609, "global_step": 24272, "epoch": 577} {"train_loss": -5.207613945007324, "global_step": 24273, "epoch": 577} {"train_loss": -5.306587219238281, "global_step": 24274, "epoch": 577} {"train_loss": -5.377276693071638, "global_step": 24275, "epoch": 577, "val_loss": 67770.7421875} {"train_loss": -5.339613914489746, "global_step": 24276, "epoch": 578} {"train_loss": -5.3206682205200195, "global_step": 24277, "epoch": 578} {"train_loss": -5.355075836181641, "global_step": 24278, "epoch": 578} {"train_loss": -5.477164268493652, "global_step": 24279, "epoch": 578} {"train_loss": -5.414599418640137, "global_step": 24280, "epoch": 578} {"train_loss": -5.380911827087402, "global_step": 24281, "epoch": 578} {"train_loss": -5.315542221069336, "global_step": 24282, "epoch": 578} {"train_loss": -5.390788555145264, "global_step": 24283, "epoch": 578} {"train_loss": -5.37406063079834, "global_step": 24284, "epoch": 578} {"train_loss": -5.358059883117676, "global_step": 24285, "epoch": 578} {"train_loss": -5.473738193511963, "global_step": 24286, "epoch": 578} {"train_loss": -5.295737266540527, "global_step": 24287, "epoch": 578} {"train_loss": -5.331479072570801, "global_step": 24288, "epoch": 578} {"train_loss": -5.470252990722656, "global_step": 24289, "epoch": 578} {"train_loss": -5.3383402824401855, "global_step": 24290, "epoch": 578} {"train_loss": -5.396763801574707, "global_step": 24291, "epoch": 578} {"train_loss": -5.308773040771484, "global_step": 24292, "epoch": 578} {"train_loss": -5.424260139465332, "global_step": 24293, "epoch": 578} {"train_loss": -5.3992414474487305, "global_step": 24294, "epoch": 578} {"train_loss": -5.425858497619629, "global_step": 24295, "epoch": 578} {"train_loss": -5.509641647338867, "global_step": 24296, "epoch": 578} {"train_loss": -5.352362632751465, "global_step": 24297, "epoch": 578} {"train_loss": -5.4682440757751465, "global_step": 24298, "epoch": 578} {"train_loss": -5.489912033081055, "global_step": 24299, "epoch": 578} {"train_loss": -5.431690216064453, "global_step": 24300, "epoch": 578} {"train_loss": -5.601291656494141, "global_step": 24301, "epoch": 578} {"train_loss": -5.433897972106934, "global_step": 24302, "epoch": 578} {"train_loss": -5.309751033782959, "global_step": 24303, "epoch": 578} {"train_loss": -5.324361801147461, "global_step": 24304, "epoch": 578} {"train_loss": -5.4617204666137695, "global_step": 24305, "epoch": 578} {"train_loss": -5.38884162902832, "global_step": 24306, "epoch": 578} {"train_loss": -5.245692253112793, "global_step": 24307, "epoch": 578} {"train_loss": -5.505158424377441, "global_step": 24308, "epoch": 578} {"train_loss": -5.433749198913574, "global_step": 24309, "epoch": 578} {"train_loss": -5.462767601013184, "global_step": 24310, "epoch": 578} {"train_loss": -5.442610740661621, "global_step": 24311, "epoch": 578} {"train_loss": -5.511394023895264, "global_step": 24312, "epoch": 578} {"train_loss": -5.472970008850098, "global_step": 24313, "epoch": 578} {"train_loss": -5.333136558532715, "global_step": 24314, "epoch": 578} {"train_loss": -5.386714935302734, "global_step": 24315, "epoch": 578} {"train_loss": -5.318565368652344, "global_step": 24316, "epoch": 578} {"train_loss": -5.40132905188061, "global_step": 24317, "epoch": 578, "val_loss": 68540.265625} {"train_loss": -5.4705400466918945, "global_step": 24318, "epoch": 579} {"train_loss": -5.394957542419434, "global_step": 24319, "epoch": 579} {"train_loss": -5.3194708824157715, "global_step": 24320, "epoch": 579} {"train_loss": -5.463691711425781, "global_step": 24321, "epoch": 579} {"train_loss": -5.415572166442871, "global_step": 24322, "epoch": 579} {"train_loss": -5.474703788757324, "global_step": 24323, "epoch": 579} {"train_loss": -5.268674850463867, "global_step": 24324, "epoch": 579} {"train_loss": -5.532476425170898, "global_step": 24325, "epoch": 579} {"train_loss": -5.235901832580566, "global_step": 24326, "epoch": 579} {"train_loss": -5.583206653594971, "global_step": 24327, "epoch": 579} {"train_loss": -5.481103897094727, "global_step": 24328, "epoch": 579} {"train_loss": -5.406087875366211, "global_step": 24329, "epoch": 579} {"train_loss": -5.423036575317383, "global_step": 24330, "epoch": 579} {"train_loss": -5.481484413146973, "global_step": 24331, "epoch": 579} {"train_loss": -5.211648941040039, "global_step": 24332, "epoch": 579} {"train_loss": -5.380089282989502, "global_step": 24333, "epoch": 579} {"train_loss": -5.485540866851807, "global_step": 24334, "epoch": 579} {"train_loss": -5.440438270568848, "global_step": 24335, "epoch": 579} {"train_loss": -5.376208782196045, "global_step": 24336, "epoch": 579} {"train_loss": -5.408511161804199, "global_step": 24337, "epoch": 579} {"train_loss": -5.478978633880615, "global_step": 24338, "epoch": 579} {"train_loss": -5.3563385009765625, "global_step": 24339, "epoch": 579} {"train_loss": -5.410228729248047, "global_step": 24340, "epoch": 579} {"train_loss": -5.523275375366211, "global_step": 24341, "epoch": 579} {"train_loss": -5.471999168395996, "global_step": 24342, "epoch": 579} {"train_loss": -5.230874061584473, "global_step": 24343, "epoch": 579} {"train_loss": -5.413888931274414, "global_step": 24344, "epoch": 579} {"train_loss": -5.346652030944824, "global_step": 24345, "epoch": 579} {"train_loss": -5.261173725128174, "global_step": 24346, "epoch": 579} {"train_loss": -5.167505264282227, "global_step": 24347, "epoch": 579} {"train_loss": -5.192836761474609, "global_step": 24348, "epoch": 579} {"train_loss": -5.1834869384765625, "global_step": 24349, "epoch": 579} {"train_loss": -5.373404502868652, "global_step": 24350, "epoch": 579} {"train_loss": -5.22130012512207, "global_step": 24351, "epoch": 579} {"train_loss": -5.178016185760498, "global_step": 24352, "epoch": 579} {"train_loss": -5.3354082107543945, "global_step": 24353, "epoch": 579} {"train_loss": -5.272075653076172, "global_step": 24354, "epoch": 579} {"train_loss": -5.396919250488281, "global_step": 24355, "epoch": 579} {"train_loss": -5.2642717361450195, "global_step": 24356, "epoch": 579} {"train_loss": -5.3629255294799805, "global_step": 24357, "epoch": 579} {"train_loss": -5.291849136352539, "global_step": 24358, "epoch": 579} {"train_loss": -5.364651623226347, "global_step": 24359, "epoch": 579, "val_loss": 68029.265625} {"train_loss": -5.341739654541016, "global_step": 24360, "epoch": 580} {"train_loss": -5.312841415405273, "global_step": 24361, "epoch": 580} {"train_loss": -5.34223747253418, "global_step": 24362, "epoch": 580} {"train_loss": -5.20986795425415, "global_step": 24363, "epoch": 580} {"train_loss": -5.450471878051758, "global_step": 24364, "epoch": 580} {"train_loss": -5.407153129577637, "global_step": 24365, "epoch": 580} {"train_loss": -5.442757606506348, "global_step": 24366, "epoch": 580} {"train_loss": -5.284271240234375, "global_step": 24367, "epoch": 580} {"train_loss": -5.314304351806641, "global_step": 24368, "epoch": 580} {"train_loss": -5.474211692810059, "global_step": 24369, "epoch": 580} {"train_loss": -5.317791938781738, "global_step": 24370, "epoch": 580} {"train_loss": -5.440993309020996, "global_step": 24371, "epoch": 580} {"train_loss": -5.4218668937683105, "global_step": 24372, "epoch": 580} {"train_loss": -5.3167243003845215, "global_step": 24373, "epoch": 580} {"train_loss": -5.304742336273193, "global_step": 24374, "epoch": 580} {"train_loss": -5.412361145019531, "global_step": 24375, "epoch": 580} {"train_loss": -5.35847806930542, "global_step": 24376, "epoch": 580} {"train_loss": -5.375091552734375, "global_step": 24377, "epoch": 580} {"train_loss": -5.31645393371582, "global_step": 24378, "epoch": 580} {"train_loss": -5.3295087814331055, "global_step": 24379, "epoch": 580} {"train_loss": -5.233138561248779, "global_step": 24380, "epoch": 580} {"train_loss": -5.442375183105469, "global_step": 24381, "epoch": 580} {"train_loss": -5.312782287597656, "global_step": 24382, "epoch": 580} {"train_loss": -5.43060827255249, "global_step": 24383, "epoch": 580} {"train_loss": -5.451313495635986, "global_step": 24384, "epoch": 580} {"train_loss": -5.35213565826416, "global_step": 24385, "epoch": 580} {"train_loss": -5.335651397705078, "global_step": 24386, "epoch": 580} {"train_loss": -5.437119483947754, "global_step": 24387, "epoch": 580} {"train_loss": -5.368488788604736, "global_step": 24388, "epoch": 580} {"train_loss": -5.447641372680664, "global_step": 24389, "epoch": 580} {"train_loss": -5.519550323486328, "global_step": 24390, "epoch": 580} {"train_loss": -5.502223968505859, "global_step": 24391, "epoch": 580} {"train_loss": -5.3772759437561035, "global_step": 24392, "epoch": 580} {"train_loss": -5.222586631774902, "global_step": 24393, "epoch": 580} {"train_loss": -5.418056488037109, "global_step": 24394, "epoch": 580} {"train_loss": -5.340244293212891, "global_step": 24395, "epoch": 580} {"train_loss": -5.342776298522949, "global_step": 24396, "epoch": 580} {"train_loss": -5.325812816619873, "global_step": 24397, "epoch": 580} {"train_loss": -5.362703800201416, "global_step": 24398, "epoch": 580} {"train_loss": -5.284502029418945, "global_step": 24399, "epoch": 580} {"train_loss": -5.440911293029785, "global_step": 24400, "epoch": 580} {"train_loss": -5.366402841749645, "global_step": 24401, "epoch": 580, "val_loss": 67989.1875} {"train_loss": -5.3443922996521, "global_step": 24402, "epoch": 581} {"train_loss": -5.465577125549316, "global_step": 24403, "epoch": 581} {"train_loss": -5.495456695556641, "global_step": 24404, "epoch": 581} {"train_loss": -5.567734718322754, "global_step": 24405, "epoch": 581} {"train_loss": -5.253929138183594, "global_step": 24406, "epoch": 581} {"train_loss": -5.378535747528076, "global_step": 24407, "epoch": 581} {"train_loss": -5.416962623596191, "global_step": 24408, "epoch": 581} {"train_loss": -5.237079620361328, "global_step": 24409, "epoch": 581} {"train_loss": -5.548990249633789, "global_step": 24410, "epoch": 581} {"train_loss": -5.405916213989258, "global_step": 24411, "epoch": 581} {"train_loss": -5.377728462219238, "global_step": 24412, "epoch": 581} {"train_loss": -5.50972843170166, "global_step": 24413, "epoch": 581} {"train_loss": -5.331472873687744, "global_step": 24414, "epoch": 581} {"train_loss": -5.5064616203308105, "global_step": 24415, "epoch": 581} {"train_loss": -5.487389087677002, "global_step": 24416, "epoch": 581} {"train_loss": -5.335921287536621, "global_step": 24417, "epoch": 581} {"train_loss": -5.399107933044434, "global_step": 24418, "epoch": 581} {"train_loss": -5.293079376220703, "global_step": 24419, "epoch": 581} {"train_loss": -5.385332107543945, "global_step": 24420, "epoch": 581} {"train_loss": -5.440546035766602, "global_step": 24421, "epoch": 581} {"train_loss": -5.376559257507324, "global_step": 24422, "epoch": 581} {"train_loss": -5.179877758026123, "global_step": 24423, "epoch": 581} {"train_loss": -5.33934211730957, "global_step": 24424, "epoch": 581} {"train_loss": -5.3131842613220215, "global_step": 24425, "epoch": 581} {"train_loss": -5.419726371765137, "global_step": 24426, "epoch": 581} {"train_loss": -5.420182228088379, "global_step": 24427, "epoch": 581} {"train_loss": -5.34390115737915, "global_step": 24428, "epoch": 581} {"train_loss": -5.463879108428955, "global_step": 24429, "epoch": 581} {"train_loss": -5.502662181854248, "global_step": 24430, "epoch": 581} {"train_loss": -5.4122233390808105, "global_step": 24431, "epoch": 581} {"train_loss": -5.272313117980957, "global_step": 24432, "epoch": 581} {"train_loss": -5.216081142425537, "global_step": 24433, "epoch": 581} {"train_loss": -5.272763252258301, "global_step": 24434, "epoch": 581} {"train_loss": -5.293633460998535, "global_step": 24435, "epoch": 581} {"train_loss": -5.1578569412231445, "global_step": 24436, "epoch": 581} {"train_loss": -5.485786437988281, "global_step": 24437, "epoch": 581} {"train_loss": -5.336928367614746, "global_step": 24438, "epoch": 581} {"train_loss": -5.402994155883789, "global_step": 24439, "epoch": 581} {"train_loss": -5.353967666625977, "global_step": 24440, "epoch": 581} {"train_loss": -5.250608444213867, "global_step": 24441, "epoch": 581} {"train_loss": -5.333517074584961, "global_step": 24442, "epoch": 581} {"train_loss": -5.374026082810902, "global_step": 24443, "epoch": 581, "val_loss": 68044.109375} {"train_loss": -5.351953506469727, "global_step": 24444, "epoch": 582} {"train_loss": -5.267031192779541, "global_step": 24445, "epoch": 582} {"train_loss": -5.357516288757324, "global_step": 24446, "epoch": 582} {"train_loss": -5.356719017028809, "global_step": 24447, "epoch": 582} {"train_loss": -5.213251113891602, "global_step": 24448, "epoch": 582} {"train_loss": -5.469472885131836, "global_step": 24449, "epoch": 582} {"train_loss": -5.444612503051758, "global_step": 24450, "epoch": 582} {"train_loss": -5.373064994812012, "global_step": 24451, "epoch": 582} {"train_loss": -5.364195346832275, "global_step": 24452, "epoch": 582} {"train_loss": -5.382393836975098, "global_step": 24453, "epoch": 582} {"train_loss": -5.359747886657715, "global_step": 24454, "epoch": 582} {"train_loss": -5.450078010559082, "global_step": 24455, "epoch": 582} {"train_loss": -5.3918657302856445, "global_step": 24456, "epoch": 582} {"train_loss": -5.443904876708984, "global_step": 24457, "epoch": 582} {"train_loss": -5.408247470855713, "global_step": 24458, "epoch": 582} {"train_loss": -5.191717147827148, "global_step": 24459, "epoch": 582} {"train_loss": -5.373640060424805, "global_step": 24460, "epoch": 582} {"train_loss": -5.3540239334106445, "global_step": 24461, "epoch": 582} {"train_loss": -5.429387092590332, "global_step": 24462, "epoch": 582} {"train_loss": -5.415834426879883, "global_step": 24463, "epoch": 582} {"train_loss": -5.479372978210449, "global_step": 24464, "epoch": 582} {"train_loss": -5.419535160064697, "global_step": 24465, "epoch": 582} {"train_loss": -5.312772750854492, "global_step": 24466, "epoch": 582} {"train_loss": -5.476625442504883, "global_step": 24467, "epoch": 582} {"train_loss": -5.439133644104004, "global_step": 24468, "epoch": 582} {"train_loss": -5.416322708129883, "global_step": 24469, "epoch": 582} {"train_loss": -5.4835124015808105, "global_step": 24470, "epoch": 582} {"train_loss": -5.3341498374938965, "global_step": 24471, "epoch": 582} {"train_loss": -5.508368968963623, "global_step": 24472, "epoch": 582} {"train_loss": -5.294272422790527, "global_step": 24473, "epoch": 582} {"train_loss": -5.310026168823242, "global_step": 24474, "epoch": 582} {"train_loss": -5.301220893859863, "global_step": 24475, "epoch": 582} {"train_loss": -5.460047721862793, "global_step": 24476, "epoch": 582} {"train_loss": -5.3293914794921875, "global_step": 24477, "epoch": 582} {"train_loss": -5.4912590980529785, "global_step": 24478, "epoch": 582} {"train_loss": -5.441742897033691, "global_step": 24479, "epoch": 582} {"train_loss": -5.3599443435668945, "global_step": 24480, "epoch": 582} {"train_loss": -5.461272239685059, "global_step": 24481, "epoch": 582} {"train_loss": -5.27145528793335, "global_step": 24482, "epoch": 582} {"train_loss": -5.3389129638671875, "global_step": 24483, "epoch": 582} {"train_loss": -5.468849182128906, "global_step": 24484, "epoch": 582} {"train_loss": -5.3874038855234785, "global_step": 24485, "epoch": 582, "val_loss": 67755.3046875} {"train_loss": -5.450655460357666, "global_step": 24486, "epoch": 583} {"train_loss": -5.4568986892700195, "global_step": 24487, "epoch": 583} {"train_loss": -5.487459659576416, "global_step": 24488, "epoch": 583} {"train_loss": -5.451501846313477, "global_step": 24489, "epoch": 583} {"train_loss": -5.342245578765869, "global_step": 24490, "epoch": 583} {"train_loss": -5.512091636657715, "global_step": 24491, "epoch": 583} {"train_loss": -5.436710834503174, "global_step": 24492, "epoch": 583} {"train_loss": -5.374205589294434, "global_step": 24493, "epoch": 583} {"train_loss": -5.374042510986328, "global_step": 24494, "epoch": 583} {"train_loss": -5.401679992675781, "global_step": 24495, "epoch": 583} {"train_loss": -5.411480903625488, "global_step": 24496, "epoch": 583} {"train_loss": -5.345487594604492, "global_step": 24497, "epoch": 583} {"train_loss": -5.390369415283203, "global_step": 24498, "epoch": 583} {"train_loss": -5.484545707702637, "global_step": 24499, "epoch": 583} {"train_loss": -5.412819862365723, "global_step": 24500, "epoch": 583} {"train_loss": -5.425915718078613, "global_step": 24501, "epoch": 583} {"train_loss": -5.379846572875977, "global_step": 24502, "epoch": 583} {"train_loss": -5.328082084655762, "global_step": 24503, "epoch": 583} {"train_loss": -5.2413249015808105, "global_step": 24504, "epoch": 583} {"train_loss": -5.266674041748047, "global_step": 24505, "epoch": 583} {"train_loss": -5.335197925567627, "global_step": 24506, "epoch": 583} {"train_loss": -5.274201393127441, "global_step": 24507, "epoch": 583} {"train_loss": -5.499835968017578, "global_step": 24508, "epoch": 583} {"train_loss": -5.301067352294922, "global_step": 24509, "epoch": 583} {"train_loss": -5.228472709655762, "global_step": 24510, "epoch": 583} {"train_loss": -5.363606929779053, "global_step": 24511, "epoch": 583} {"train_loss": -5.32073450088501, "global_step": 24512, "epoch": 583} {"train_loss": -5.359226226806641, "global_step": 24513, "epoch": 583} {"train_loss": -5.43266487121582, "global_step": 24514, "epoch": 583} {"train_loss": -5.191112518310547, "global_step": 24515, "epoch": 583} {"train_loss": -5.417618751525879, "global_step": 24516, "epoch": 583} {"train_loss": -5.440606117248535, "global_step": 24517, "epoch": 583} {"train_loss": -5.413588523864746, "global_step": 24518, "epoch": 583} {"train_loss": -5.385010242462158, "global_step": 24519, "epoch": 583} {"train_loss": -5.327434062957764, "global_step": 24520, "epoch": 583} {"train_loss": -5.365629196166992, "global_step": 24521, "epoch": 583} {"train_loss": -5.376869201660156, "global_step": 24522, "epoch": 583} {"train_loss": -5.285482406616211, "global_step": 24523, "epoch": 583} {"train_loss": -5.489861011505127, "global_step": 24524, "epoch": 583} {"train_loss": -5.322685241699219, "global_step": 24525, "epoch": 583} {"train_loss": -5.50035285949707, "global_step": 24526, "epoch": 583} {"train_loss": -5.380128781000773, "global_step": 24527, "epoch": 583, "val_loss": 67701.5859375} {"train_loss": -5.33558988571167, "global_step": 24528, "epoch": 584} {"train_loss": -5.461387634277344, "global_step": 24529, "epoch": 584} {"train_loss": -5.374797821044922, "global_step": 24530, "epoch": 584} {"train_loss": -5.342075824737549, "global_step": 24531, "epoch": 584} {"train_loss": -5.400613784790039, "global_step": 24532, "epoch": 584} {"train_loss": -5.418376922607422, "global_step": 24533, "epoch": 584} {"train_loss": -5.360597610473633, "global_step": 24534, "epoch": 584} {"train_loss": -5.424365997314453, "global_step": 24535, "epoch": 584} {"train_loss": -5.469480514526367, "global_step": 24536, "epoch": 584} {"train_loss": -5.309013366699219, "global_step": 24537, "epoch": 584} {"train_loss": -5.367795944213867, "global_step": 24538, "epoch": 584} {"train_loss": -5.4510064125061035, "global_step": 24539, "epoch": 584} {"train_loss": -5.231082916259766, "global_step": 24540, "epoch": 584} {"train_loss": -5.441206932067871, "global_step": 24541, "epoch": 584} {"train_loss": -5.434811115264893, "global_step": 24542, "epoch": 584} {"train_loss": -5.411480903625488, "global_step": 24543, "epoch": 584} {"train_loss": -5.468938827514648, "global_step": 24544, "epoch": 584} {"train_loss": -5.30228328704834, "global_step": 24545, "epoch": 584} {"train_loss": -5.384658336639404, "global_step": 24546, "epoch": 584} {"train_loss": -5.401185989379883, "global_step": 24547, "epoch": 584} {"train_loss": -5.316740036010742, "global_step": 24548, "epoch": 584} {"train_loss": -5.271877288818359, "global_step": 24549, "epoch": 584} {"train_loss": -5.243202209472656, "global_step": 24550, "epoch": 584} {"train_loss": -5.441689491271973, "global_step": 24551, "epoch": 584} {"train_loss": -5.468265056610107, "global_step": 24552, "epoch": 584} {"train_loss": -5.46700382232666, "global_step": 24553, "epoch": 584} {"train_loss": -5.3441314697265625, "global_step": 24554, "epoch": 584} {"train_loss": -5.412026882171631, "global_step": 24555, "epoch": 584} {"train_loss": -5.298149108886719, "global_step": 24556, "epoch": 584} {"train_loss": -5.4186577796936035, "global_step": 24557, "epoch": 584} {"train_loss": -5.377427101135254, "global_step": 24558, "epoch": 584} {"train_loss": -5.380120277404785, "global_step": 24559, "epoch": 584} {"train_loss": -5.38700008392334, "global_step": 24560, "epoch": 584} {"train_loss": -5.4540510177612305, "global_step": 24561, "epoch": 584} {"train_loss": -5.464208602905273, "global_step": 24562, "epoch": 584} {"train_loss": -5.306037902832031, "global_step": 24563, "epoch": 584} {"train_loss": -5.391216278076172, "global_step": 24564, "epoch": 584} {"train_loss": -5.542810440063477, "global_step": 24565, "epoch": 584} {"train_loss": -5.34700345993042, "global_step": 24566, "epoch": 584} {"train_loss": -5.401401996612549, "global_step": 24567, "epoch": 584} {"train_loss": -5.395308017730713, "global_step": 24568, "epoch": 584} {"train_loss": -5.388661713827224, "global_step": 24569, "epoch": 584, "val_loss": 67963.6015625} {"train_loss": -5.3940582275390625, "global_step": 24570, "epoch": 585} {"train_loss": -5.542702674865723, "global_step": 24571, "epoch": 585} {"train_loss": -5.366757392883301, "global_step": 24572, "epoch": 585} {"train_loss": -5.360897064208984, "global_step": 24573, "epoch": 585} {"train_loss": -5.338481903076172, "global_step": 24574, "epoch": 585} {"train_loss": -5.496419906616211, "global_step": 24575, "epoch": 585} {"train_loss": -5.4071245193481445, "global_step": 24576, "epoch": 585} {"train_loss": -5.395398139953613, "global_step": 24577, "epoch": 585} {"train_loss": -5.224991798400879, "global_step": 24578, "epoch": 585} {"train_loss": -5.3373308181762695, "global_step": 24579, "epoch": 585} {"train_loss": -5.3412933349609375, "global_step": 24580, "epoch": 585} {"train_loss": -5.436755180358887, "global_step": 24581, "epoch": 585} {"train_loss": -5.48530912399292, "global_step": 24582, "epoch": 585} {"train_loss": -5.487504005432129, "global_step": 24583, "epoch": 585} {"train_loss": -5.362696647644043, "global_step": 24584, "epoch": 585} {"train_loss": -5.429257392883301, "global_step": 24585, "epoch": 585} {"train_loss": -5.390046119689941, "global_step": 24586, "epoch": 585} {"train_loss": -5.306387901306152, "global_step": 24587, "epoch": 585} {"train_loss": -5.467531204223633, "global_step": 24588, "epoch": 585} {"train_loss": -5.322542190551758, "global_step": 24589, "epoch": 585} {"train_loss": -5.376317024230957, "global_step": 24590, "epoch": 585} {"train_loss": -5.390750885009766, "global_step": 24591, "epoch": 585} {"train_loss": -5.433740615844727, "global_step": 24592, "epoch": 585} {"train_loss": -5.481472969055176, "global_step": 24593, "epoch": 585} {"train_loss": -5.61202335357666, "global_step": 24594, "epoch": 585} {"train_loss": -5.510568618774414, "global_step": 24595, "epoch": 585} {"train_loss": -5.481081962585449, "global_step": 24596, "epoch": 585} {"train_loss": -5.421848297119141, "global_step": 24597, "epoch": 585} {"train_loss": -5.555440902709961, "global_step": 24598, "epoch": 585} {"train_loss": -5.423932075500488, "global_step": 24599, "epoch": 585} {"train_loss": -5.310493469238281, "global_step": 24600, "epoch": 585} {"train_loss": -5.485480308532715, "global_step": 24601, "epoch": 585} {"train_loss": -5.450018405914307, "global_step": 24602, "epoch": 585} {"train_loss": -5.2853875160217285, "global_step": 24603, "epoch": 585} {"train_loss": -5.377313613891602, "global_step": 24604, "epoch": 585} {"train_loss": -5.3895673751831055, "global_step": 24605, "epoch": 585} {"train_loss": -5.346343517303467, "global_step": 24606, "epoch": 585} {"train_loss": -5.367109298706055, "global_step": 24607, "epoch": 585} {"train_loss": -5.453639984130859, "global_step": 24608, "epoch": 585} {"train_loss": -5.520112037658691, "global_step": 24609, "epoch": 585} {"train_loss": -5.344801425933838, "global_step": 24610, "epoch": 585} {"train_loss": -5.4077113810039705, "global_step": 24611, "epoch": 585, "val_loss": 68186.03125} {"train_loss": -5.449489116668701, "global_step": 24612, "epoch": 586} {"train_loss": -5.417564868927002, "global_step": 24613, "epoch": 586} {"train_loss": -5.428928852081299, "global_step": 24614, "epoch": 586} {"train_loss": -5.37148904800415, "global_step": 24615, "epoch": 586} {"train_loss": -5.348939895629883, "global_step": 24616, "epoch": 586} {"train_loss": -5.451088905334473, "global_step": 24617, "epoch": 586} {"train_loss": -5.295254707336426, "global_step": 24618, "epoch": 586} {"train_loss": -5.31806755065918, "global_step": 24619, "epoch": 586} {"train_loss": -5.429162979125977, "global_step": 24620, "epoch": 586} {"train_loss": -5.368289947509766, "global_step": 24621, "epoch": 586} {"train_loss": -5.357364654541016, "global_step": 24622, "epoch": 586} {"train_loss": -5.348825454711914, "global_step": 24623, "epoch": 586} {"train_loss": -5.348442077636719, "global_step": 24624, "epoch": 586} {"train_loss": -5.388928413391113, "global_step": 24625, "epoch": 586} {"train_loss": -5.325896263122559, "global_step": 24626, "epoch": 586} {"train_loss": -5.393555641174316, "global_step": 24627, "epoch": 586} {"train_loss": -5.499309062957764, "global_step": 24628, "epoch": 586} {"train_loss": -5.393304824829102, "global_step": 24629, "epoch": 586} {"train_loss": -5.403973579406738, "global_step": 24630, "epoch": 586} {"train_loss": -5.4144463539123535, "global_step": 24631, "epoch": 586} {"train_loss": -5.535281181335449, "global_step": 24632, "epoch": 586} {"train_loss": -5.473917484283447, "global_step": 24633, "epoch": 586} {"train_loss": -5.469353675842285, "global_step": 24634, "epoch": 586} {"train_loss": -5.467629909515381, "global_step": 24635, "epoch": 586} {"train_loss": -5.410167694091797, "global_step": 24636, "epoch": 586} {"train_loss": -5.228759765625, "global_step": 24637, "epoch": 586} {"train_loss": -5.512929916381836, "global_step": 24638, "epoch": 586} {"train_loss": -5.324103355407715, "global_step": 24639, "epoch": 586} {"train_loss": -5.387120246887207, "global_step": 24640, "epoch": 586} {"train_loss": -5.34877347946167, "global_step": 24641, "epoch": 586} {"train_loss": -5.243588447570801, "global_step": 24642, "epoch": 586} {"train_loss": -5.288323879241943, "global_step": 24643, "epoch": 586} {"train_loss": -5.291175842285156, "global_step": 24644, "epoch": 586} {"train_loss": -5.300878524780273, "global_step": 24645, "epoch": 586} {"train_loss": -5.409337997436523, "global_step": 24646, "epoch": 586} {"train_loss": -5.200967788696289, "global_step": 24647, "epoch": 586} {"train_loss": -5.292290687561035, "global_step": 24648, "epoch": 586} {"train_loss": -5.368781566619873, "global_step": 24649, "epoch": 586} {"train_loss": -5.199919700622559, "global_step": 24650, "epoch": 586} {"train_loss": -5.305835247039795, "global_step": 24651, "epoch": 586} {"train_loss": -5.317122459411621, "global_step": 24652, "epoch": 586} {"train_loss": -5.369841110138666, "global_step": 24653, "epoch": 586, "val_loss": 68524.8984375} {"train_loss": -5.39872932434082, "global_step": 24654, "epoch": 587} {"train_loss": -5.370806694030762, "global_step": 24655, "epoch": 587} {"train_loss": -5.496763229370117, "global_step": 24656, "epoch": 587} {"train_loss": -5.184919357299805, "global_step": 24657, "epoch": 587} {"train_loss": -5.50274133682251, "global_step": 24658, "epoch": 587} {"train_loss": -5.414026260375977, "global_step": 24659, "epoch": 587} {"train_loss": -5.411196708679199, "global_step": 24660, "epoch": 587} {"train_loss": -5.280281066894531, "global_step": 24661, "epoch": 587} {"train_loss": -5.387104034423828, "global_step": 24662, "epoch": 587} {"train_loss": -5.426791191101074, "global_step": 24663, "epoch": 587} {"train_loss": -5.166264533996582, "global_step": 24664, "epoch": 587} {"train_loss": -5.370182037353516, "global_step": 24665, "epoch": 587} {"train_loss": -5.341311454772949, "global_step": 24666, "epoch": 587} {"train_loss": -5.314287185668945, "global_step": 24667, "epoch": 587} {"train_loss": -5.213766098022461, "global_step": 24668, "epoch": 587} {"train_loss": -5.337614059448242, "global_step": 24669, "epoch": 587} {"train_loss": -5.41380500793457, "global_step": 24670, "epoch": 587} {"train_loss": -5.352794170379639, "global_step": 24671, "epoch": 587} {"train_loss": -5.355343341827393, "global_step": 24672, "epoch": 587} {"train_loss": -5.396021366119385, "global_step": 24673, "epoch": 587} {"train_loss": -5.304798126220703, "global_step": 24674, "epoch": 587} {"train_loss": -5.394254684448242, "global_step": 24675, "epoch": 587} {"train_loss": -5.352612018585205, "global_step": 24676, "epoch": 587} {"train_loss": -5.307407855987549, "global_step": 24677, "epoch": 587} {"train_loss": -5.539315700531006, "global_step": 24678, "epoch": 587} {"train_loss": -5.3817524909973145, "global_step": 24679, "epoch": 587} {"train_loss": -5.368424415588379, "global_step": 24680, "epoch": 587} {"train_loss": -5.295586109161377, "global_step": 24681, "epoch": 587} {"train_loss": -5.333571434020996, "global_step": 24682, "epoch": 587} {"train_loss": -5.316164016723633, "global_step": 24683, "epoch": 587} {"train_loss": -5.460224151611328, "global_step": 24684, "epoch": 587} {"train_loss": -5.453227996826172, "global_step": 24685, "epoch": 587} {"train_loss": -5.455190181732178, "global_step": 24686, "epoch": 587} {"train_loss": -5.341466903686523, "global_step": 24687, "epoch": 587} {"train_loss": -5.364079475402832, "global_step": 24688, "epoch": 587} {"train_loss": -5.549893379211426, "global_step": 24689, "epoch": 587} {"train_loss": -5.356145858764648, "global_step": 24690, "epoch": 587} {"train_loss": -5.35546875, "global_step": 24691, "epoch": 587} {"train_loss": -5.438716411590576, "global_step": 24692, "epoch": 587} {"train_loss": -5.438876152038574, "global_step": 24693, "epoch": 587} {"train_loss": -5.41762113571167, "global_step": 24694, "epoch": 587} {"train_loss": -5.376733995619274, "global_step": 24695, "epoch": 587, "val_loss": 68213.3515625} {"train_loss": -5.41566801071167, "global_step": 24696, "epoch": 588} {"train_loss": -5.39256477355957, "global_step": 24697, "epoch": 588} {"train_loss": -5.198241233825684, "global_step": 24698, "epoch": 588} {"train_loss": -5.508914470672607, "global_step": 24699, "epoch": 588} {"train_loss": -5.438989639282227, "global_step": 24700, "epoch": 588} {"train_loss": -5.424783706665039, "global_step": 24701, "epoch": 588} {"train_loss": -5.508599281311035, "global_step": 24702, "epoch": 588} {"train_loss": -5.310678482055664, "global_step": 24703, "epoch": 588} {"train_loss": -5.379744529724121, "global_step": 24704, "epoch": 588} {"train_loss": -5.350132942199707, "global_step": 24705, "epoch": 588} {"train_loss": -5.408364295959473, "global_step": 24706, "epoch": 588} {"train_loss": -5.444068431854248, "global_step": 24707, "epoch": 588} {"train_loss": -5.525965690612793, "global_step": 24708, "epoch": 588} {"train_loss": -5.379638671875, "global_step": 24709, "epoch": 588} {"train_loss": -5.335304260253906, "global_step": 24710, "epoch": 588} {"train_loss": -5.3399553298950195, "global_step": 24711, "epoch": 588} {"train_loss": -5.466307640075684, "global_step": 24712, "epoch": 588} {"train_loss": -5.405563831329346, "global_step": 24713, "epoch": 588} {"train_loss": -5.355841636657715, "global_step": 24714, "epoch": 588} {"train_loss": -5.370988845825195, "global_step": 24715, "epoch": 588} {"train_loss": -5.5076470375061035, "global_step": 24716, "epoch": 588} {"train_loss": -5.464107036590576, "global_step": 24717, "epoch": 588} {"train_loss": -5.358450889587402, "global_step": 24718, "epoch": 588} {"train_loss": -5.402579307556152, "global_step": 24719, "epoch": 588} {"train_loss": -5.428613662719727, "global_step": 24720, "epoch": 588} {"train_loss": -5.399100303649902, "global_step": 24721, "epoch": 588} {"train_loss": -5.525899887084961, "global_step": 24722, "epoch": 588} {"train_loss": -5.432735919952393, "global_step": 24723, "epoch": 588} {"train_loss": -5.434749603271484, "global_step": 24724, "epoch": 588} {"train_loss": -5.445524215698242, "global_step": 24725, "epoch": 588} {"train_loss": -5.387941837310791, "global_step": 24726, "epoch": 588} {"train_loss": -5.485145092010498, "global_step": 24727, "epoch": 588} {"train_loss": -5.143013000488281, "global_step": 24728, "epoch": 588} {"train_loss": -5.336671829223633, "global_step": 24729, "epoch": 588} {"train_loss": -5.469060897827148, "global_step": 24730, "epoch": 588} {"train_loss": -5.460107803344727, "global_step": 24731, "epoch": 588} {"train_loss": -5.4832963943481445, "global_step": 24732, "epoch": 588} {"train_loss": -5.348859786987305, "global_step": 24733, "epoch": 588} {"train_loss": -5.450339317321777, "global_step": 24734, "epoch": 588} {"train_loss": -5.294452667236328, "global_step": 24735, "epoch": 588} {"train_loss": -5.464343070983887, "global_step": 24736, "epoch": 588} {"train_loss": -5.408681460789272, "global_step": 24737, "epoch": 588, "val_loss": 67935.171875} {"train_loss": -5.495368003845215, "global_step": 24738, "epoch": 589} {"train_loss": -5.442850112915039, "global_step": 24739, "epoch": 589} {"train_loss": -5.3874030113220215, "global_step": 24740, "epoch": 589} {"train_loss": -5.427704811096191, "global_step": 24741, "epoch": 589} {"train_loss": -5.410816192626953, "global_step": 24742, "epoch": 589} {"train_loss": -5.497318744659424, "global_step": 24743, "epoch": 589} {"train_loss": -5.428801536560059, "global_step": 24744, "epoch": 589} {"train_loss": -5.378427505493164, "global_step": 24745, "epoch": 589} {"train_loss": -5.316744804382324, "global_step": 24746, "epoch": 589} {"train_loss": -5.477537155151367, "global_step": 24747, "epoch": 589} {"train_loss": -5.233349800109863, "global_step": 24748, "epoch": 589} {"train_loss": -5.3416595458984375, "global_step": 24749, "epoch": 589} {"train_loss": -5.213730812072754, "global_step": 24750, "epoch": 589} {"train_loss": -5.27407693862915, "global_step": 24751, "epoch": 589} {"train_loss": -5.578993320465088, "global_step": 24752, "epoch": 589} {"train_loss": -5.471945762634277, "global_step": 24753, "epoch": 589} {"train_loss": -5.385396480560303, "global_step": 24754, "epoch": 589} {"train_loss": -5.208111763000488, "global_step": 24755, "epoch": 589} {"train_loss": -5.3479461669921875, "global_step": 24756, "epoch": 589} {"train_loss": -5.219144821166992, "global_step": 24757, "epoch": 589} {"train_loss": -5.4904632568359375, "global_step": 24758, "epoch": 589} {"train_loss": -5.3562445640563965, "global_step": 24759, "epoch": 589} {"train_loss": -5.4366679191589355, "global_step": 24760, "epoch": 589} {"train_loss": -5.398128509521484, "global_step": 24761, "epoch": 589} {"train_loss": -5.358733177185059, "global_step": 24762, "epoch": 589} {"train_loss": -5.277242660522461, "global_step": 24763, "epoch": 589} {"train_loss": -5.505070209503174, "global_step": 24764, "epoch": 589} {"train_loss": -5.504018306732178, "global_step": 24765, "epoch": 589} {"train_loss": -5.282306671142578, "global_step": 24766, "epoch": 589} {"train_loss": -5.386049270629883, "global_step": 24767, "epoch": 589} {"train_loss": -5.376648902893066, "global_step": 24768, "epoch": 589} {"train_loss": -5.355660438537598, "global_step": 24769, "epoch": 589} {"train_loss": -5.35619592666626, "global_step": 24770, "epoch": 589} {"train_loss": -5.39499044418335, "global_step": 24771, "epoch": 589} {"train_loss": -5.40952205657959, "global_step": 24772, "epoch": 589} {"train_loss": -5.367136001586914, "global_step": 24773, "epoch": 589} {"train_loss": -5.44687557220459, "global_step": 24774, "epoch": 589} {"train_loss": -5.509242057800293, "global_step": 24775, "epoch": 589} {"train_loss": -5.207588195800781, "global_step": 24776, "epoch": 589} {"train_loss": -5.433370590209961, "global_step": 24777, "epoch": 589} {"train_loss": -5.316596031188965, "global_step": 24778, "epoch": 589} {"train_loss": -5.3816969735281805, "global_step": 24779, "epoch": 589, "val_loss": 67750.5546875} {"train_loss": -5.396340370178223, "global_step": 24780, "epoch": 590} {"train_loss": -5.3462629318237305, "global_step": 24781, "epoch": 590} {"train_loss": -5.332705497741699, "global_step": 24782, "epoch": 590} {"train_loss": -5.344971656799316, "global_step": 24783, "epoch": 590} {"train_loss": -5.454184532165527, "global_step": 24784, "epoch": 590} {"train_loss": -5.40266227722168, "global_step": 24785, "epoch": 590} {"train_loss": -5.320973873138428, "global_step": 24786, "epoch": 590} {"train_loss": -5.345376014709473, "global_step": 24787, "epoch": 590} {"train_loss": -5.44470739364624, "global_step": 24788, "epoch": 590} {"train_loss": -5.490586280822754, "global_step": 24789, "epoch": 590} {"train_loss": -5.339955806732178, "global_step": 24790, "epoch": 590} {"train_loss": -5.264467716217041, "global_step": 24791, "epoch": 590} {"train_loss": -5.563041687011719, "global_step": 24792, "epoch": 590} {"train_loss": -5.354729652404785, "global_step": 24793, "epoch": 590} {"train_loss": -5.480703830718994, "global_step": 24794, "epoch": 590} {"train_loss": -5.4569315910339355, "global_step": 24795, "epoch": 590} {"train_loss": -5.256679058074951, "global_step": 24796, "epoch": 590} {"train_loss": -5.366662502288818, "global_step": 24797, "epoch": 590} {"train_loss": -5.453527450561523, "global_step": 24798, "epoch": 590} {"train_loss": -5.353564262390137, "global_step": 24799, "epoch": 590} {"train_loss": -5.358462333679199, "global_step": 24800, "epoch": 590} {"train_loss": -5.330233097076416, "global_step": 24801, "epoch": 590} {"train_loss": -5.518041610717773, "global_step": 24802, "epoch": 590} {"train_loss": -5.407386779785156, "global_step": 24803, "epoch": 590} {"train_loss": -5.357986927032471, "global_step": 24804, "epoch": 590} {"train_loss": -5.348409652709961, "global_step": 24805, "epoch": 590} {"train_loss": -5.476600646972656, "global_step": 24806, "epoch": 590} {"train_loss": -5.518908500671387, "global_step": 24807, "epoch": 590} {"train_loss": -5.3627400398254395, "global_step": 24808, "epoch": 590} {"train_loss": -5.448843002319336, "global_step": 24809, "epoch": 590} {"train_loss": -5.48231840133667, "global_step": 24810, "epoch": 590} {"train_loss": -5.485198974609375, "global_step": 24811, "epoch": 590} {"train_loss": -5.356352806091309, "global_step": 24812, "epoch": 590} {"train_loss": -5.47607421875, "global_step": 24813, "epoch": 590} {"train_loss": -5.240184783935547, "global_step": 24814, "epoch": 590} {"train_loss": -5.3663249015808105, "global_step": 24815, "epoch": 590} {"train_loss": -5.55031681060791, "global_step": 24816, "epoch": 590} {"train_loss": -5.526717185974121, "global_step": 24817, "epoch": 590} {"train_loss": -5.192606449127197, "global_step": 24818, "epoch": 590} {"train_loss": -5.398198127746582, "global_step": 24819, "epoch": 590} {"train_loss": -5.31123161315918, "global_step": 24820, "epoch": 590} {"train_loss": -5.39572598820641, "global_step": 24821, "epoch": 590, "val_loss": 67859.4296875} {"train_loss": -5.279013633728027, "global_step": 24822, "epoch": 591} {"train_loss": -5.305060863494873, "global_step": 24823, "epoch": 591} {"train_loss": -5.412830352783203, "global_step": 24824, "epoch": 591} {"train_loss": -5.392807960510254, "global_step": 24825, "epoch": 591} {"train_loss": -5.5583343505859375, "global_step": 24826, "epoch": 591} {"train_loss": -5.488725662231445, "global_step": 24827, "epoch": 591} {"train_loss": -5.333271503448486, "global_step": 24828, "epoch": 591} {"train_loss": -5.517574310302734, "global_step": 24829, "epoch": 591} {"train_loss": -5.467312812805176, "global_step": 24830, "epoch": 591} {"train_loss": -5.355093955993652, "global_step": 24831, "epoch": 591} {"train_loss": -5.381447792053223, "global_step": 24832, "epoch": 591} {"train_loss": -5.364168167114258, "global_step": 24833, "epoch": 591} {"train_loss": -5.1874542236328125, "global_step": 24834, "epoch": 591} {"train_loss": -5.558410167694092, "global_step": 24835, "epoch": 591} {"train_loss": -5.345816135406494, "global_step": 24836, "epoch": 591} {"train_loss": -5.459875583648682, "global_step": 24837, "epoch": 591} {"train_loss": -5.438930511474609, "global_step": 24838, "epoch": 591} {"train_loss": -5.325511455535889, "global_step": 24839, "epoch": 591} {"train_loss": -5.203075408935547, "global_step": 24840, "epoch": 591} {"train_loss": -5.3601179122924805, "global_step": 24841, "epoch": 591} {"train_loss": -5.193286418914795, "global_step": 24842, "epoch": 591} {"train_loss": -5.330053806304932, "global_step": 24843, "epoch": 591} {"train_loss": -5.277063369750977, "global_step": 24844, "epoch": 591} {"train_loss": -5.255776405334473, "global_step": 24845, "epoch": 591} {"train_loss": -5.26180362701416, "global_step": 24846, "epoch": 591} {"train_loss": -5.314553260803223, "global_step": 24847, "epoch": 591} {"train_loss": -5.549259662628174, "global_step": 24848, "epoch": 591} {"train_loss": -5.298583030700684, "global_step": 24849, "epoch": 591} {"train_loss": -5.375898361206055, "global_step": 24850, "epoch": 591} {"train_loss": -5.402580261230469, "global_step": 24851, "epoch": 591} {"train_loss": -5.340456008911133, "global_step": 24852, "epoch": 591} {"train_loss": -5.353116989135742, "global_step": 24853, "epoch": 591} {"train_loss": -5.27736234664917, "global_step": 24854, "epoch": 591} {"train_loss": -5.431163787841797, "global_step": 24855, "epoch": 591} {"train_loss": -5.325451850891113, "global_step": 24856, "epoch": 591} {"train_loss": -5.330166816711426, "global_step": 24857, "epoch": 591} {"train_loss": -5.3754777908325195, "global_step": 24858, "epoch": 591} {"train_loss": -5.332622051239014, "global_step": 24859, "epoch": 591} {"train_loss": -5.451190948486328, "global_step": 24860, "epoch": 591} {"train_loss": -5.355873107910156, "global_step": 24861, "epoch": 591} {"train_loss": -5.450982570648193, "global_step": 24862, "epoch": 591} {"train_loss": -5.366425105503628, "global_step": 24863, "epoch": 591, "val_loss": 67881.9140625} {"train_loss": -5.4396514892578125, "global_step": 24864, "epoch": 592} {"train_loss": -5.447056770324707, "global_step": 24865, "epoch": 592} {"train_loss": -5.216858863830566, "global_step": 24866, "epoch": 592} {"train_loss": -5.423300743103027, "global_step": 24867, "epoch": 592} {"train_loss": -5.443658828735352, "global_step": 24868, "epoch": 592} {"train_loss": -5.358923435211182, "global_step": 24869, "epoch": 592} {"train_loss": -5.4201812744140625, "global_step": 24870, "epoch": 592} {"train_loss": -5.281344413757324, "global_step": 24871, "epoch": 592} {"train_loss": -5.358405590057373, "global_step": 24872, "epoch": 592} {"train_loss": -5.517464637756348, "global_step": 24873, "epoch": 592} {"train_loss": -5.381473541259766, "global_step": 24874, "epoch": 592} {"train_loss": -5.435118198394775, "global_step": 24875, "epoch": 592} {"train_loss": -5.411114692687988, "global_step": 24876, "epoch": 592} {"train_loss": -5.358829498291016, "global_step": 24877, "epoch": 592} {"train_loss": -5.352607727050781, "global_step": 24878, "epoch": 592} {"train_loss": -5.460050582885742, "global_step": 24879, "epoch": 592} {"train_loss": -5.441205024719238, "global_step": 24880, "epoch": 592} {"train_loss": -5.466070652008057, "global_step": 24881, "epoch": 592} {"train_loss": -5.381219863891602, "global_step": 24882, "epoch": 592} {"train_loss": -5.322995185852051, "global_step": 24883, "epoch": 592} {"train_loss": -5.613712787628174, "global_step": 24884, "epoch": 592} {"train_loss": -5.449038505554199, "global_step": 24885, "epoch": 592} {"train_loss": -5.303387641906738, "global_step": 24886, "epoch": 592} {"train_loss": -5.43270206451416, "global_step": 24887, "epoch": 592} {"train_loss": -5.364651679992676, "global_step": 24888, "epoch": 592} {"train_loss": -5.401699066162109, "global_step": 24889, "epoch": 592} {"train_loss": -5.439054489135742, "global_step": 24890, "epoch": 592} {"train_loss": -5.423714637756348, "global_step": 24891, "epoch": 592} {"train_loss": -5.444976329803467, "global_step": 24892, "epoch": 592} {"train_loss": -5.454010009765625, "global_step": 24893, "epoch": 592} {"train_loss": -5.416701316833496, "global_step": 24894, "epoch": 592} {"train_loss": -5.392577171325684, "global_step": 24895, "epoch": 592} {"train_loss": -5.400167465209961, "global_step": 24896, "epoch": 592} {"train_loss": -5.295744895935059, "global_step": 24897, "epoch": 592} {"train_loss": -5.3615570068359375, "global_step": 24898, "epoch": 592} {"train_loss": -5.317036151885986, "global_step": 24899, "epoch": 592} {"train_loss": -5.4813714027404785, "global_step": 24900, "epoch": 592} {"train_loss": -5.515311241149902, "global_step": 24901, "epoch": 592} {"train_loss": -5.489521503448486, "global_step": 24902, "epoch": 592} {"train_loss": -5.433635234832764, "global_step": 24903, "epoch": 592} {"train_loss": -5.435253143310547, "global_step": 24904, "epoch": 592} {"train_loss": -5.410966112500145, "global_step": 24905, "epoch": 592, "val_loss": 67626.9140625} {"train_loss": -5.4919657707214355, "global_step": 24906, "epoch": 593} {"train_loss": -5.343502998352051, "global_step": 24907, "epoch": 593} {"train_loss": -5.468889236450195, "global_step": 24908, "epoch": 593} {"train_loss": -5.3690900802612305, "global_step": 24909, "epoch": 593} {"train_loss": -5.507594108581543, "global_step": 24910, "epoch": 593} {"train_loss": -5.446374893188477, "global_step": 24911, "epoch": 593} {"train_loss": -5.42823600769043, "global_step": 24912, "epoch": 593} {"train_loss": -5.47464656829834, "global_step": 24913, "epoch": 593} {"train_loss": -5.281232833862305, "global_step": 24914, "epoch": 593} {"train_loss": -5.413002014160156, "global_step": 24915, "epoch": 593} {"train_loss": -5.437309265136719, "global_step": 24916, "epoch": 593} {"train_loss": -5.358522415161133, "global_step": 24917, "epoch": 593} {"train_loss": -5.395206451416016, "global_step": 24918, "epoch": 593} {"train_loss": -5.441930770874023, "global_step": 24919, "epoch": 593} {"train_loss": -5.428971290588379, "global_step": 24920, "epoch": 593} {"train_loss": -5.4894866943359375, "global_step": 24921, "epoch": 593} {"train_loss": -5.454787254333496, "global_step": 24922, "epoch": 593} {"train_loss": -5.504133224487305, "global_step": 24923, "epoch": 593} {"train_loss": -5.367090702056885, "global_step": 24924, "epoch": 593} {"train_loss": -5.377989768981934, "global_step": 24925, "epoch": 593} {"train_loss": -5.506759166717529, "global_step": 24926, "epoch": 593} {"train_loss": -5.494502544403076, "global_step": 24927, "epoch": 593} {"train_loss": -5.409153938293457, "global_step": 24928, "epoch": 593} {"train_loss": -5.460526466369629, "global_step": 24929, "epoch": 593} {"train_loss": -5.391801834106445, "global_step": 24930, "epoch": 593} {"train_loss": -5.279256820678711, "global_step": 24931, "epoch": 593} {"train_loss": -5.442751884460449, "global_step": 24932, "epoch": 593} {"train_loss": -5.547072410583496, "global_step": 24933, "epoch": 593} {"train_loss": -5.32470703125, "global_step": 24934, "epoch": 593} {"train_loss": -5.411886692047119, "global_step": 24935, "epoch": 593} {"train_loss": -5.3905029296875, "global_step": 24936, "epoch": 593} {"train_loss": -5.417911052703857, "global_step": 24937, "epoch": 593} {"train_loss": -5.353246688842773, "global_step": 24938, "epoch": 593} {"train_loss": -5.284299850463867, "global_step": 24939, "epoch": 593} {"train_loss": -5.3028411865234375, "global_step": 24940, "epoch": 593} {"train_loss": -5.34388542175293, "global_step": 24941, "epoch": 593} {"train_loss": -5.3395771980285645, "global_step": 24942, "epoch": 593} {"train_loss": -5.514018535614014, "global_step": 24943, "epoch": 593} {"train_loss": -5.390359401702881, "global_step": 24944, "epoch": 593} {"train_loss": -5.544038772583008, "global_step": 24945, "epoch": 593} {"train_loss": -5.387539863586426, "global_step": 24946, "epoch": 593} {"train_loss": -5.413858470462618, "global_step": 24947, "epoch": 593, "val_loss": 67683.7265625} {"train_loss": -5.456244945526123, "global_step": 24948, "epoch": 594} {"train_loss": -5.463752746582031, "global_step": 24949, "epoch": 594} {"train_loss": -5.397913455963135, "global_step": 24950, "epoch": 594} {"train_loss": -5.434352874755859, "global_step": 24951, "epoch": 594} {"train_loss": -5.489224433898926, "global_step": 24952, "epoch": 594} {"train_loss": -5.372013092041016, "global_step": 24953, "epoch": 594} {"train_loss": -5.3780741691589355, "global_step": 24954, "epoch": 594} {"train_loss": -5.448141098022461, "global_step": 24955, "epoch": 594} {"train_loss": -5.4468584060668945, "global_step": 24956, "epoch": 594} {"train_loss": -5.3768157958984375, "global_step": 24957, "epoch": 594} {"train_loss": -5.475053787231445, "global_step": 24958, "epoch": 594} {"train_loss": -5.48261833190918, "global_step": 24959, "epoch": 594} {"train_loss": -5.440102577209473, "global_step": 24960, "epoch": 594} {"train_loss": -5.461179733276367, "global_step": 24961, "epoch": 594} {"train_loss": -5.414915084838867, "global_step": 24962, "epoch": 594} {"train_loss": -5.332067012786865, "global_step": 24963, "epoch": 594} {"train_loss": -5.455615997314453, "global_step": 24964, "epoch": 594} {"train_loss": -5.334020137786865, "global_step": 24965, "epoch": 594} {"train_loss": -5.464277267456055, "global_step": 24966, "epoch": 594} {"train_loss": -5.473599433898926, "global_step": 24967, "epoch": 594} {"train_loss": -5.548718452453613, "global_step": 24968, "epoch": 594} {"train_loss": -5.500450134277344, "global_step": 24969, "epoch": 594} {"train_loss": -5.311397075653076, "global_step": 24970, "epoch": 594} {"train_loss": -5.431085586547852, "global_step": 24971, "epoch": 594} {"train_loss": -5.370711326599121, "global_step": 24972, "epoch": 594} {"train_loss": -5.298636436462402, "global_step": 24973, "epoch": 594} {"train_loss": -5.4801926612854, "global_step": 24974, "epoch": 594} {"train_loss": -5.346530914306641, "global_step": 24975, "epoch": 594} {"train_loss": -5.431463241577148, "global_step": 24976, "epoch": 594} {"train_loss": -5.355670928955078, "global_step": 24977, "epoch": 594} {"train_loss": -5.398101806640625, "global_step": 24978, "epoch": 594} {"train_loss": -5.292133331298828, "global_step": 24979, "epoch": 594} {"train_loss": -5.353914737701416, "global_step": 24980, "epoch": 594} {"train_loss": -5.362371444702148, "global_step": 24981, "epoch": 594} {"train_loss": -5.390915393829346, "global_step": 24982, "epoch": 594} {"train_loss": -5.304278373718262, "global_step": 24983, "epoch": 594} {"train_loss": -5.516866683959961, "global_step": 24984, "epoch": 594} {"train_loss": -5.485637664794922, "global_step": 24985, "epoch": 594} {"train_loss": -5.491422176361084, "global_step": 24986, "epoch": 594} {"train_loss": -5.365324020385742, "global_step": 24987, "epoch": 594} {"train_loss": -5.323216438293457, "global_step": 24988, "epoch": 594} {"train_loss": -5.416494085675194, "global_step": 24989, "epoch": 594, "val_loss": 67694.921875} {"train_loss": -5.445427417755127, "global_step": 24990, "epoch": 595} {"train_loss": -5.495881080627441, "global_step": 24991, "epoch": 595} {"train_loss": -5.387777328491211, "global_step": 24992, "epoch": 595} {"train_loss": -5.412778854370117, "global_step": 24993, "epoch": 595} {"train_loss": -5.454721450805664, "global_step": 24994, "epoch": 595} {"train_loss": -5.477069854736328, "global_step": 24995, "epoch": 595} {"train_loss": -5.359738349914551, "global_step": 24996, "epoch": 595} {"train_loss": -5.340628623962402, "global_step": 24997, "epoch": 595} {"train_loss": -5.251401424407959, "global_step": 24998, "epoch": 595} {"train_loss": -5.566059589385986, "global_step": 24999, "epoch": 595} {"train_loss": -5.2714080810546875, "global_step": 25000, "epoch": 595} {"train_loss": -5.317441940307617, "global_step": 25001, "epoch": 595} {"train_loss": -5.424539566040039, "global_step": 25002, "epoch": 595} {"train_loss": -5.321742057800293, "global_step": 25003, "epoch": 595} {"train_loss": -5.206305027008057, "global_step": 25004, "epoch": 595} {"train_loss": -5.404150009155273, "global_step": 25005, "epoch": 595} {"train_loss": -5.154839992523193, "global_step": 25006, "epoch": 595} {"train_loss": -5.413514614105225, "global_step": 25007, "epoch": 595} {"train_loss": -5.47952938079834, "global_step": 25008, "epoch": 595} {"train_loss": -5.235508918762207, "global_step": 25009, "epoch": 595} {"train_loss": -5.341699600219727, "global_step": 25010, "epoch": 595} {"train_loss": -5.280156135559082, "global_step": 25011, "epoch": 595} {"train_loss": -5.207184314727783, "global_step": 25012, "epoch": 595} {"train_loss": -5.325826644897461, "global_step": 25013, "epoch": 595} {"train_loss": -5.39115571975708, "global_step": 25014, "epoch": 595} {"train_loss": -5.480450630187988, "global_step": 25015, "epoch": 595} {"train_loss": -5.316010475158691, "global_step": 25016, "epoch": 595} {"train_loss": -5.322054386138916, "global_step": 25017, "epoch": 595} {"train_loss": -5.246389389038086, "global_step": 25018, "epoch": 595} {"train_loss": -5.455361366271973, "global_step": 25019, "epoch": 595} {"train_loss": -5.398839950561523, "global_step": 25020, "epoch": 595} {"train_loss": -5.392003536224365, "global_step": 25021, "epoch": 595} {"train_loss": -5.376039981842041, "global_step": 25022, "epoch": 595} {"train_loss": -5.340280532836914, "global_step": 25023, "epoch": 595} {"train_loss": -5.423820972442627, "global_step": 25024, "epoch": 595} {"train_loss": -5.287532806396484, "global_step": 25025, "epoch": 595} {"train_loss": -5.408565521240234, "global_step": 25026, "epoch": 595} {"train_loss": -5.342077732086182, "global_step": 25027, "epoch": 595} {"train_loss": -5.356668472290039, "global_step": 25028, "epoch": 595} {"train_loss": -5.346010208129883, "global_step": 25029, "epoch": 595} {"train_loss": -5.481971263885498, "global_step": 25030, "epoch": 595} {"train_loss": -5.364036230813889, "global_step": 25031, "epoch": 595, "val_loss": 68636.8359375} {"train_loss": -5.516294479370117, "global_step": 25032, "epoch": 596} {"train_loss": -5.469216346740723, "global_step": 25033, "epoch": 596} {"train_loss": -5.384552001953125, "global_step": 25034, "epoch": 596} {"train_loss": -5.252861499786377, "global_step": 25035, "epoch": 596} {"train_loss": -5.350064754486084, "global_step": 25036, "epoch": 596} {"train_loss": -5.411917686462402, "global_step": 25037, "epoch": 596} {"train_loss": -5.2674760818481445, "global_step": 25038, "epoch": 596} {"train_loss": -5.440803527832031, "global_step": 25039, "epoch": 596} {"train_loss": -5.483711242675781, "global_step": 25040, "epoch": 596} {"train_loss": -5.182960510253906, "global_step": 25041, "epoch": 596} {"train_loss": -5.289572238922119, "global_step": 25042, "epoch": 596} {"train_loss": -5.439537048339844, "global_step": 25043, "epoch": 596} {"train_loss": -5.402299880981445, "global_step": 25044, "epoch": 596} {"train_loss": -5.421892166137695, "global_step": 25045, "epoch": 596} {"train_loss": -5.423947811126709, "global_step": 25046, "epoch": 596} {"train_loss": -5.283809185028076, "global_step": 25047, "epoch": 596} {"train_loss": -5.408795356750488, "global_step": 25048, "epoch": 596} {"train_loss": -5.385231018066406, "global_step": 25049, "epoch": 596} {"train_loss": -5.336976051330566, "global_step": 25050, "epoch": 596} {"train_loss": -5.407696723937988, "global_step": 25051, "epoch": 596} {"train_loss": -5.397791862487793, "global_step": 25052, "epoch": 596} {"train_loss": -5.402700901031494, "global_step": 25053, "epoch": 596} {"train_loss": -5.454165935516357, "global_step": 25054, "epoch": 596} {"train_loss": -5.387445449829102, "global_step": 25055, "epoch": 596} {"train_loss": -5.359995365142822, "global_step": 25056, "epoch": 596} {"train_loss": -5.399466514587402, "global_step": 25057, "epoch": 596} {"train_loss": -5.366814613342285, "global_step": 25058, "epoch": 596} {"train_loss": -5.341727256774902, "global_step": 25059, "epoch": 596} {"train_loss": -5.377650737762451, "global_step": 25060, "epoch": 596} {"train_loss": -5.4516706466674805, "global_step": 25061, "epoch": 596} {"train_loss": -5.390742301940918, "global_step": 25062, "epoch": 596} {"train_loss": -5.420598983764648, "global_step": 25063, "epoch": 596} {"train_loss": -5.441914081573486, "global_step": 25064, "epoch": 596} {"train_loss": -5.430902004241943, "global_step": 25065, "epoch": 596} {"train_loss": -5.484682559967041, "global_step": 25066, "epoch": 596} {"train_loss": -5.4125871658325195, "global_step": 25067, "epoch": 596} {"train_loss": -5.470376968383789, "global_step": 25068, "epoch": 596} {"train_loss": -5.395114421844482, "global_step": 25069, "epoch": 596} {"train_loss": -5.3049397468566895, "global_step": 25070, "epoch": 596} {"train_loss": -5.313460350036621, "global_step": 25071, "epoch": 596} {"train_loss": -5.299097061157227, "global_step": 25072, "epoch": 596} {"train_loss": -5.386106945219494, "global_step": 25073, "epoch": 596, "val_loss": 67688.4453125} {"train_loss": -5.359067916870117, "global_step": 25074, "epoch": 597} {"train_loss": -5.337224006652832, "global_step": 25075, "epoch": 597} {"train_loss": -5.209788799285889, "global_step": 25076, "epoch": 597} {"train_loss": -5.398983478546143, "global_step": 25077, "epoch": 597} {"train_loss": -5.349766731262207, "global_step": 25078, "epoch": 597} {"train_loss": -5.498300075531006, "global_step": 25079, "epoch": 597} {"train_loss": -5.395102500915527, "global_step": 25080, "epoch": 597} {"train_loss": -5.257143974304199, "global_step": 25081, "epoch": 597} {"train_loss": -5.4495697021484375, "global_step": 25082, "epoch": 597} {"train_loss": -5.374009132385254, "global_step": 25083, "epoch": 597} {"train_loss": -5.338940620422363, "global_step": 25084, "epoch": 597} {"train_loss": -5.383800506591797, "global_step": 25085, "epoch": 597} {"train_loss": -5.399837493896484, "global_step": 25086, "epoch": 597} {"train_loss": -5.384438514709473, "global_step": 25087, "epoch": 597} {"train_loss": -5.376955986022949, "global_step": 25088, "epoch": 597} {"train_loss": -5.298552513122559, "global_step": 25089, "epoch": 597} {"train_loss": -5.444064140319824, "global_step": 25090, "epoch": 597} {"train_loss": -5.36531925201416, "global_step": 25091, "epoch": 597} {"train_loss": -5.395601272583008, "global_step": 25092, "epoch": 597} {"train_loss": -5.404921531677246, "global_step": 25093, "epoch": 597} {"train_loss": -5.433338165283203, "global_step": 25094, "epoch": 597} {"train_loss": -5.470036506652832, "global_step": 25095, "epoch": 597} {"train_loss": -5.430521011352539, "global_step": 25096, "epoch": 597} {"train_loss": -5.387555122375488, "global_step": 25097, "epoch": 597} {"train_loss": -5.4009904861450195, "global_step": 25098, "epoch": 597} {"train_loss": -5.523824214935303, "global_step": 25099, "epoch": 597} {"train_loss": -5.318182945251465, "global_step": 25100, "epoch": 597} {"train_loss": -5.404522895812988, "global_step": 25101, "epoch": 597} {"train_loss": -5.456859588623047, "global_step": 25102, "epoch": 597} {"train_loss": -5.484206676483154, "global_step": 25103, "epoch": 597} {"train_loss": -5.491946220397949, "global_step": 25104, "epoch": 597} {"train_loss": -5.466253280639648, "global_step": 25105, "epoch": 597} {"train_loss": -5.542871952056885, "global_step": 25106, "epoch": 597} {"train_loss": -5.424605369567871, "global_step": 25107, "epoch": 597} {"train_loss": -5.492976188659668, "global_step": 25108, "epoch": 597} {"train_loss": -5.349117279052734, "global_step": 25109, "epoch": 597} {"train_loss": -5.521616458892822, "global_step": 25110, "epoch": 597} {"train_loss": -5.283756256103516, "global_step": 25111, "epoch": 597} {"train_loss": -5.325806140899658, "global_step": 25112, "epoch": 597} {"train_loss": -5.408883094787598, "global_step": 25113, "epoch": 597} {"train_loss": -5.392992973327637, "global_step": 25114, "epoch": 597} {"train_loss": -5.399813754217965, "global_step": 25115, "epoch": 597, "val_loss": 68016.4375} {"train_loss": -5.404379367828369, "global_step": 25116, "epoch": 598} {"train_loss": -5.397963523864746, "global_step": 25117, "epoch": 598} {"train_loss": -5.386724472045898, "global_step": 25118, "epoch": 598} {"train_loss": -5.291045188903809, "global_step": 25119, "epoch": 598} {"train_loss": -5.459885120391846, "global_step": 25120, "epoch": 598} {"train_loss": -5.360771179199219, "global_step": 25121, "epoch": 598} {"train_loss": -5.559062480926514, "global_step": 25122, "epoch": 598} {"train_loss": -5.443648815155029, "global_step": 25123, "epoch": 598} {"train_loss": -5.3401899337768555, "global_step": 25124, "epoch": 598} {"train_loss": -5.390235900878906, "global_step": 25125, "epoch": 598} {"train_loss": -5.456818580627441, "global_step": 25126, "epoch": 598} {"train_loss": -5.385004043579102, "global_step": 25127, "epoch": 598} {"train_loss": -5.407373428344727, "global_step": 25128, "epoch": 598} {"train_loss": -5.377924919128418, "global_step": 25129, "epoch": 598} {"train_loss": -5.444123268127441, "global_step": 25130, "epoch": 598} {"train_loss": -5.365222930908203, "global_step": 25131, "epoch": 598} {"train_loss": -5.472437858581543, "global_step": 25132, "epoch": 598} {"train_loss": -5.295439720153809, "global_step": 25133, "epoch": 598} {"train_loss": -5.446043491363525, "global_step": 25134, "epoch": 598} {"train_loss": -5.30280876159668, "global_step": 25135, "epoch": 598} {"train_loss": -5.368401050567627, "global_step": 25136, "epoch": 598} {"train_loss": -5.375823497772217, "global_step": 25137, "epoch": 598} {"train_loss": -5.376348972320557, "global_step": 25138, "epoch": 598} {"train_loss": -5.4391889572143555, "global_step": 25139, "epoch": 598} {"train_loss": -5.385546684265137, "global_step": 25140, "epoch": 598} {"train_loss": -5.471299171447754, "global_step": 25141, "epoch": 598} {"train_loss": -5.3913373947143555, "global_step": 25142, "epoch": 598} {"train_loss": -5.256572723388672, "global_step": 25143, "epoch": 598} {"train_loss": -5.401823043823242, "global_step": 25144, "epoch": 598} {"train_loss": -5.395696640014648, "global_step": 25145, "epoch": 598} {"train_loss": -5.358917236328125, "global_step": 25146, "epoch": 598} {"train_loss": -5.426555156707764, "global_step": 25147, "epoch": 598} {"train_loss": -5.336178779602051, "global_step": 25148, "epoch": 598} {"train_loss": -5.479088306427002, "global_step": 25149, "epoch": 598} {"train_loss": -5.415728569030762, "global_step": 25150, "epoch": 598} {"train_loss": -5.252573013305664, "global_step": 25151, "epoch": 598} {"train_loss": -5.440478801727295, "global_step": 25152, "epoch": 598} {"train_loss": -5.403720855712891, "global_step": 25153, "epoch": 598} {"train_loss": -5.430896282196045, "global_step": 25154, "epoch": 598} {"train_loss": -5.506145477294922, "global_step": 25155, "epoch": 598} {"train_loss": -5.465624809265137, "global_step": 25156, "epoch": 598} {"train_loss": -5.396318935212635, "global_step": 25157, "epoch": 598, "val_loss": 67838.3125} {"train_loss": -5.375061988830566, "global_step": 25158, "epoch": 599} {"train_loss": -5.433586120605469, "global_step": 25159, "epoch": 599} {"train_loss": -5.369185447692871, "global_step": 25160, "epoch": 599} {"train_loss": -5.386893272399902, "global_step": 25161, "epoch": 599} {"train_loss": -5.354443550109863, "global_step": 25162, "epoch": 599} {"train_loss": -5.387660503387451, "global_step": 25163, "epoch": 599} {"train_loss": -5.329827785491943, "global_step": 25164, "epoch": 599} {"train_loss": -5.516843795776367, "global_step": 25165, "epoch": 599} {"train_loss": -5.101105690002441, "global_step": 25166, "epoch": 599} {"train_loss": -5.456258296966553, "global_step": 25167, "epoch": 599} {"train_loss": -5.297323703765869, "global_step": 25168, "epoch": 599} {"train_loss": -5.308469772338867, "global_step": 25169, "epoch": 599} {"train_loss": -5.409619331359863, "global_step": 25170, "epoch": 599} {"train_loss": -5.3710036277771, "global_step": 25171, "epoch": 599} {"train_loss": -5.435959815979004, "global_step": 25172, "epoch": 599} {"train_loss": -5.4560346603393555, "global_step": 25173, "epoch": 599} {"train_loss": -5.449084281921387, "global_step": 25174, "epoch": 599} {"train_loss": -5.346632480621338, "global_step": 25175, "epoch": 599} {"train_loss": -5.46297550201416, "global_step": 25176, "epoch": 599} {"train_loss": -5.358330249786377, "global_step": 25177, "epoch": 599} {"train_loss": -5.406093597412109, "global_step": 25178, "epoch": 599} {"train_loss": -5.377760887145996, "global_step": 25179, "epoch": 599} {"train_loss": -5.400516033172607, "global_step": 25180, "epoch": 599} {"train_loss": -5.412439346313477, "global_step": 25181, "epoch": 599} {"train_loss": -5.380097389221191, "global_step": 25182, "epoch": 599} {"train_loss": -5.424771308898926, "global_step": 25183, "epoch": 599} {"train_loss": -5.466172218322754, "global_step": 25184, "epoch": 599} {"train_loss": -5.417106628417969, "global_step": 25185, "epoch": 599} {"train_loss": -5.308712005615234, "global_step": 25186, "epoch": 599} {"train_loss": -5.394097328186035, "global_step": 25187, "epoch": 599} {"train_loss": -5.367669582366943, "global_step": 25188, "epoch": 599} {"train_loss": -5.433347702026367, "global_step": 25189, "epoch": 599} {"train_loss": -5.454333305358887, "global_step": 25190, "epoch": 599} {"train_loss": -5.314400672912598, "global_step": 25191, "epoch": 599} {"train_loss": -5.278564453125, "global_step": 25192, "epoch": 599} {"train_loss": -5.355042457580566, "global_step": 25193, "epoch": 599} {"train_loss": -5.396714687347412, "global_step": 25194, "epoch": 599} {"train_loss": -5.454941749572754, "global_step": 25195, "epoch": 599} {"train_loss": -5.335085868835449, "global_step": 25196, "epoch": 599} {"train_loss": -5.518157958984375, "global_step": 25197, "epoch": 599} {"train_loss": -5.47623348236084, "global_step": 25198, "epoch": 599} {"train_loss": -5.390617177599952, "global_step": 25199, "epoch": 599, "val_loss": 67621.796875} {"train_loss": -5.421181678771973, "global_step": 25200, "epoch": 600} {"train_loss": -5.537337779998779, "global_step": 25201, "epoch": 600} {"train_loss": -5.343358516693115, "global_step": 25202, "epoch": 600} {"train_loss": -5.365839958190918, "global_step": 25203, "epoch": 600} {"train_loss": -5.463678359985352, "global_step": 25204, "epoch": 600} {"train_loss": -5.359493732452393, "global_step": 25205, "epoch": 600} {"train_loss": -5.346827983856201, "global_step": 25206, "epoch": 600} {"train_loss": -5.467817306518555, "global_step": 25207, "epoch": 600} {"train_loss": -5.335657596588135, "global_step": 25208, "epoch": 600} {"train_loss": -5.35513162612915, "global_step": 25209, "epoch": 600} {"train_loss": -5.304962158203125, "global_step": 25210, "epoch": 600} {"train_loss": -5.426311492919922, "global_step": 25211, "epoch": 600} {"train_loss": -5.126626968383789, "global_step": 25212, "epoch": 600} {"train_loss": -5.229128837585449, "global_step": 25213, "epoch": 600} {"train_loss": -5.429293632507324, "global_step": 25214, "epoch": 600} {"train_loss": -5.339580059051514, "global_step": 25215, "epoch": 600} {"train_loss": -5.32295036315918, "global_step": 25216, "epoch": 600} {"train_loss": -5.3911943435668945, "global_step": 25217, "epoch": 600} {"train_loss": -5.502236366271973, "global_step": 25218, "epoch": 600} {"train_loss": -5.366723537445068, "global_step": 25219, "epoch": 600} {"train_loss": -5.366428852081299, "global_step": 25220, "epoch": 600} {"train_loss": -5.3637800216674805, "global_step": 25221, "epoch": 600} {"train_loss": -5.309064865112305, "global_step": 25222, "epoch": 600} {"train_loss": -5.4720354080200195, "global_step": 25223, "epoch": 600} {"train_loss": -5.3338775634765625, "global_step": 25224, "epoch": 600} {"train_loss": -5.475780010223389, "global_step": 25225, "epoch": 600} {"train_loss": -5.439533233642578, "global_step": 25226, "epoch": 600} {"train_loss": -5.474983215332031, "global_step": 25227, "epoch": 600} {"train_loss": -5.397059440612793, "global_step": 25228, "epoch": 600} {"train_loss": -5.414156913757324, "global_step": 25229, "epoch": 600} {"train_loss": -5.36525821685791, "global_step": 25230, "epoch": 600} {"train_loss": -5.3707475662231445, "global_step": 25231, "epoch": 600} {"train_loss": -5.392393112182617, "global_step": 25232, "epoch": 600} {"train_loss": -5.506357669830322, "global_step": 25233, "epoch": 600} {"train_loss": -5.3843841552734375, "global_step": 25234, "epoch": 600} {"train_loss": -5.189089775085449, "global_step": 25235, "epoch": 600} {"train_loss": -5.326448440551758, "global_step": 25236, "epoch": 600} {"train_loss": -5.237015724182129, "global_step": 25237, "epoch": 600} {"train_loss": -5.439272403717041, "global_step": 25238, "epoch": 600} {"train_loss": -5.396815776824951, "global_step": 25239, "epoch": 600} {"train_loss": -5.1998443603515625, "global_step": 25240, "epoch": 600} {"train_loss": -5.373394546054659, "global_step": 25241, "epoch": 600, "train/sim_max_reward_0": 0.5130369546013374, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.09686084395919983, "train/sim_max_reward_3": 0.19673535572462547, "train/sim_max_reward_4": 0.41649747461438735, "train/sim_max_reward_5": 0.9020828258881372, "test/sim_max_reward_4400000": 0.13808432357560793, "test/sim_max_reward_4400001": 0.018475972189237754, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.30128418199535084, "test/sim_max_reward_4400005": 0.13611917913216917, "test/sim_max_reward_4400006": 0.3504910670017321, "test/sim_max_reward_4400007": 0.04522482762281758, "test/sim_max_reward_4400008": 0.42111723930491335, "test/sim_max_reward_4400009": 0.4597350899639747, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.18480091992353692, "test/sim_max_reward_4400012": 0.2356498859580817, "test/sim_max_reward_4400013": 0.18888364155176235, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.2447279589944935, "test/sim_max_reward_4400017": 0.086610377014632, "test/sim_max_reward_4400018": 0.3413270704866343, "test/sim_max_reward_4400019": 0.26098744339250585, "test/sim_max_reward_4400020": 0.0002456173456467521, "test/sim_max_reward_4400021": 0.3972998064990469, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.13895065569172352, "test/sim_max_reward_4400027": 0.09737002868610871, "test/sim_max_reward_4400028": 0.015788509502182916, "test/sim_max_reward_4400029": 0.20276818213076442, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 0.3582564310306923, "test/sim_max_reward_4400032": 0.1814790936238259, "test/sim_max_reward_4400033": 0.1458759102812456, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.39242298398874165, "test/sim_max_reward_4400036": 0.3121398932790155, "test/sim_max_reward_4400037": 0.28660331566075603, "test/sim_max_reward_4400038": 0.400046984895183, "test/sim_max_reward_4400039": 0.5336799853213371, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.46029112645604436, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.05859791469126623, "test/sim_max_reward_4400044": 0.6704082926337869, "test/sim_max_reward_4400045": 0.6491778715767929, "test/sim_max_reward_4400046": 0.25320634030726125, "test/sim_max_reward_4400047": 0.23739094251349904, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 7.844443349159178e-06, "train/mean_score": 0.3543148226682477, "test/mean_score": 0.21619463726658858, "val_loss": 67697.0546875} {"train_loss": -5.496481895446777, "global_step": 25242, "epoch": 601} {"train_loss": -5.328407287597656, "global_step": 25243, "epoch": 601} {"train_loss": -5.521137237548828, "global_step": 25244, "epoch": 601} {"train_loss": -5.417067527770996, "global_step": 25245, "epoch": 601} {"train_loss": -5.483982086181641, "global_step": 25246, "epoch": 601} {"train_loss": -5.4095587730407715, "global_step": 25247, "epoch": 601} {"train_loss": -5.419095039367676, "global_step": 25248, "epoch": 601} {"train_loss": -5.525115966796875, "global_step": 25249, "epoch": 601} {"train_loss": -5.489649772644043, "global_step": 25250, "epoch": 601} {"train_loss": -5.361135482788086, "global_step": 25251, "epoch": 601} {"train_loss": -5.543680667877197, "global_step": 25252, "epoch": 601} {"train_loss": -5.393918514251709, "global_step": 25253, "epoch": 601} {"train_loss": -5.393997669219971, "global_step": 25254, "epoch": 601} {"train_loss": -5.437705039978027, "global_step": 25255, "epoch": 601} {"train_loss": -5.418422222137451, "global_step": 25256, "epoch": 601} {"train_loss": -5.411848068237305, "global_step": 25257, "epoch": 601} {"train_loss": -5.487985610961914, "global_step": 25258, "epoch": 601} {"train_loss": -5.5923380851745605, "global_step": 25259, "epoch": 601} {"train_loss": -5.378644943237305, "global_step": 25260, "epoch": 601} {"train_loss": -5.344278335571289, "global_step": 25261, "epoch": 601} {"train_loss": -5.333418846130371, "global_step": 25262, "epoch": 601} {"train_loss": -5.3195037841796875, "global_step": 25263, "epoch": 601} {"train_loss": -5.386980056762695, "global_step": 25264, "epoch": 601} {"train_loss": -5.2788472175598145, "global_step": 25265, "epoch": 601} {"train_loss": -5.1773576736450195, "global_step": 25266, "epoch": 601} {"train_loss": -5.483633041381836, "global_step": 25267, "epoch": 601} {"train_loss": -5.220814228057861, "global_step": 25268, "epoch": 601} {"train_loss": -5.313724040985107, "global_step": 25269, "epoch": 601} {"train_loss": -5.275625228881836, "global_step": 25270, "epoch": 601} {"train_loss": -5.370091438293457, "global_step": 25271, "epoch": 601} {"train_loss": -5.438360214233398, "global_step": 25272, "epoch": 601} {"train_loss": -5.3051042556762695, "global_step": 25273, "epoch": 601} {"train_loss": -5.266203880310059, "global_step": 25274, "epoch": 601} {"train_loss": -5.3418779373168945, "global_step": 25275, "epoch": 601} {"train_loss": -5.21948766708374, "global_step": 25276, "epoch": 601} {"train_loss": -5.424475193023682, "global_step": 25277, "epoch": 601} {"train_loss": -5.353425025939941, "global_step": 25278, "epoch": 601} {"train_loss": -5.302238464355469, "global_step": 25279, "epoch": 601} {"train_loss": -5.279114723205566, "global_step": 25280, "epoch": 601} {"train_loss": -5.281303405761719, "global_step": 25281, "epoch": 601} {"train_loss": -5.321216583251953, "global_step": 25282, "epoch": 601} {"train_loss": -5.3822111402239114, "global_step": 25283, "epoch": 601, "val_loss": 67776.9453125} {"train_loss": -5.301382064819336, "global_step": 25284, "epoch": 602} {"train_loss": -5.375056266784668, "global_step": 25285, "epoch": 602} {"train_loss": -5.381980895996094, "global_step": 25286, "epoch": 602} {"train_loss": -5.570171356201172, "global_step": 25287, "epoch": 602} {"train_loss": -5.387569904327393, "global_step": 25288, "epoch": 602} {"train_loss": -5.425792694091797, "global_step": 25289, "epoch": 602} {"train_loss": -5.275816440582275, "global_step": 25290, "epoch": 602} {"train_loss": -5.494467258453369, "global_step": 25291, "epoch": 602} {"train_loss": -5.388815402984619, "global_step": 25292, "epoch": 602} {"train_loss": -5.517845153808594, "global_step": 25293, "epoch": 602} {"train_loss": -5.360451698303223, "global_step": 25294, "epoch": 602} {"train_loss": -5.319886684417725, "global_step": 25295, "epoch": 602} {"train_loss": -5.519118309020996, "global_step": 25296, "epoch": 602} {"train_loss": -5.485761642456055, "global_step": 25297, "epoch": 602} {"train_loss": -5.487331867218018, "global_step": 25298, "epoch": 602} {"train_loss": -5.423274040222168, "global_step": 25299, "epoch": 602} {"train_loss": -5.563075065612793, "global_step": 25300, "epoch": 602} {"train_loss": -5.319433212280273, "global_step": 25301, "epoch": 602} {"train_loss": -5.375916481018066, "global_step": 25302, "epoch": 602} {"train_loss": -5.343513011932373, "global_step": 25303, "epoch": 602} {"train_loss": -5.500866889953613, "global_step": 25304, "epoch": 602} {"train_loss": -5.47710657119751, "global_step": 25305, "epoch": 602} {"train_loss": -5.322684288024902, "global_step": 25306, "epoch": 602} {"train_loss": -5.215826034545898, "global_step": 25307, "epoch": 602} {"train_loss": -5.568075656890869, "global_step": 25308, "epoch": 602} {"train_loss": -5.4533162117004395, "global_step": 25309, "epoch": 602} {"train_loss": -5.276885032653809, "global_step": 25310, "epoch": 602} {"train_loss": -5.365983963012695, "global_step": 25311, "epoch": 602} {"train_loss": -5.369338035583496, "global_step": 25312, "epoch": 602} {"train_loss": -5.236471176147461, "global_step": 25313, "epoch": 602} {"train_loss": -5.341017723083496, "global_step": 25314, "epoch": 602} {"train_loss": -5.419277191162109, "global_step": 25315, "epoch": 602} {"train_loss": -5.5394134521484375, "global_step": 25316, "epoch": 602} {"train_loss": -5.441953182220459, "global_step": 25317, "epoch": 602} {"train_loss": -5.459340572357178, "global_step": 25318, "epoch": 602} {"train_loss": -5.348358154296875, "global_step": 25319, "epoch": 602} {"train_loss": -5.415855407714844, "global_step": 25320, "epoch": 602} {"train_loss": -5.439657211303711, "global_step": 25321, "epoch": 602} {"train_loss": -5.344479084014893, "global_step": 25322, "epoch": 602} {"train_loss": -5.289774417877197, "global_step": 25323, "epoch": 602} {"train_loss": -5.420078277587891, "global_step": 25324, "epoch": 602} {"train_loss": -5.4068580695561, "global_step": 25325, "epoch": 602, "val_loss": 67938.828125} {"train_loss": -5.424553871154785, "global_step": 25326, "epoch": 603} {"train_loss": -5.409299850463867, "global_step": 25327, "epoch": 603} {"train_loss": -5.416882038116455, "global_step": 25328, "epoch": 603} {"train_loss": -5.5554890632629395, "global_step": 25329, "epoch": 603} {"train_loss": -5.31710958480835, "global_step": 25330, "epoch": 603} {"train_loss": -5.3127851486206055, "global_step": 25331, "epoch": 603} {"train_loss": -5.421879768371582, "global_step": 25332, "epoch": 603} {"train_loss": -5.328646659851074, "global_step": 25333, "epoch": 603} {"train_loss": -5.394841194152832, "global_step": 25334, "epoch": 603} {"train_loss": -5.557320594787598, "global_step": 25335, "epoch": 603} {"train_loss": -5.327376365661621, "global_step": 25336, "epoch": 603} {"train_loss": -5.463639259338379, "global_step": 25337, "epoch": 603} {"train_loss": -5.365825176239014, "global_step": 25338, "epoch": 603} {"train_loss": -5.319406986236572, "global_step": 25339, "epoch": 603} {"train_loss": -5.3595404624938965, "global_step": 25340, "epoch": 603} {"train_loss": -5.3523478507995605, "global_step": 25341, "epoch": 603} {"train_loss": -5.471540451049805, "global_step": 25342, "epoch": 603} {"train_loss": -5.388110637664795, "global_step": 25343, "epoch": 603} {"train_loss": -5.546133995056152, "global_step": 25344, "epoch": 603} {"train_loss": -5.341055870056152, "global_step": 25345, "epoch": 603} {"train_loss": -5.359663009643555, "global_step": 25346, "epoch": 603} {"train_loss": -5.395230293273926, "global_step": 25347, "epoch": 603} {"train_loss": -5.408865928649902, "global_step": 25348, "epoch": 603} {"train_loss": -5.409799098968506, "global_step": 25349, "epoch": 603} {"train_loss": -5.428542137145996, "global_step": 25350, "epoch": 603} {"train_loss": -5.473308086395264, "global_step": 25351, "epoch": 603} {"train_loss": -5.539925575256348, "global_step": 25352, "epoch": 603} {"train_loss": -5.436206817626953, "global_step": 25353, "epoch": 603} {"train_loss": -5.432539939880371, "global_step": 25354, "epoch": 603} {"train_loss": -5.438072204589844, "global_step": 25355, "epoch": 603} {"train_loss": -5.393730163574219, "global_step": 25356, "epoch": 603} {"train_loss": -5.480062961578369, "global_step": 25357, "epoch": 603} {"train_loss": -5.3817901611328125, "global_step": 25358, "epoch": 603} {"train_loss": -5.435155391693115, "global_step": 25359, "epoch": 603} {"train_loss": -5.418996810913086, "global_step": 25360, "epoch": 603} {"train_loss": -5.490267276763916, "global_step": 25361, "epoch": 603} {"train_loss": -5.452648162841797, "global_step": 25362, "epoch": 603} {"train_loss": -5.587015151977539, "global_step": 25363, "epoch": 603} {"train_loss": -5.385528087615967, "global_step": 25364, "epoch": 603} {"train_loss": -5.361640453338623, "global_step": 25365, "epoch": 603} {"train_loss": -5.401113510131836, "global_step": 25366, "epoch": 603} {"train_loss": -5.418451831454322, "global_step": 25367, "epoch": 603, "val_loss": 67920.140625} {"train_loss": -5.411010265350342, "global_step": 25368, "epoch": 604} {"train_loss": -5.46406364440918, "global_step": 25369, "epoch": 604} {"train_loss": -5.464620113372803, "global_step": 25370, "epoch": 604} {"train_loss": -5.394814968109131, "global_step": 25371, "epoch": 604} {"train_loss": -5.467967987060547, "global_step": 25372, "epoch": 604} {"train_loss": -5.314602851867676, "global_step": 25373, "epoch": 604} {"train_loss": -5.388497829437256, "global_step": 25374, "epoch": 604} {"train_loss": -5.471739292144775, "global_step": 25375, "epoch": 604} {"train_loss": -5.386051177978516, "global_step": 25376, "epoch": 604} {"train_loss": -5.37528657913208, "global_step": 25377, "epoch": 604} {"train_loss": -5.546526908874512, "global_step": 25378, "epoch": 604} {"train_loss": -5.364731788635254, "global_step": 25379, "epoch": 604} {"train_loss": -5.32558536529541, "global_step": 25380, "epoch": 604} {"train_loss": -5.503277778625488, "global_step": 25381, "epoch": 604} {"train_loss": -5.314539909362793, "global_step": 25382, "epoch": 604} {"train_loss": -5.396671772003174, "global_step": 25383, "epoch": 604} {"train_loss": -5.453385829925537, "global_step": 25384, "epoch": 604} {"train_loss": -5.444240570068359, "global_step": 25385, "epoch": 604} {"train_loss": -5.449012756347656, "global_step": 25386, "epoch": 604} {"train_loss": -5.451085090637207, "global_step": 25387, "epoch": 604} {"train_loss": -5.273873329162598, "global_step": 25388, "epoch": 604} {"train_loss": -5.336363792419434, "global_step": 25389, "epoch": 604} {"train_loss": -5.446046829223633, "global_step": 25390, "epoch": 604} {"train_loss": -5.434796333312988, "global_step": 25391, "epoch": 604} {"train_loss": -5.435827732086182, "global_step": 25392, "epoch": 604} {"train_loss": -5.5061445236206055, "global_step": 25393, "epoch": 604} {"train_loss": -5.438027858734131, "global_step": 25394, "epoch": 604} {"train_loss": -5.362905979156494, "global_step": 25395, "epoch": 604} {"train_loss": -5.517950534820557, "global_step": 25396, "epoch": 604} {"train_loss": -5.430599212646484, "global_step": 25397, "epoch": 604} {"train_loss": -5.23405647277832, "global_step": 25398, "epoch": 604} {"train_loss": -5.342581748962402, "global_step": 25399, "epoch": 604} {"train_loss": -5.43231725692749, "global_step": 25400, "epoch": 604} {"train_loss": -5.355497360229492, "global_step": 25401, "epoch": 604} {"train_loss": -5.311820983886719, "global_step": 25402, "epoch": 604} {"train_loss": -5.273887634277344, "global_step": 25403, "epoch": 604} {"train_loss": -5.415311813354492, "global_step": 25404, "epoch": 604} {"train_loss": -5.3973002433776855, "global_step": 25405, "epoch": 604} {"train_loss": -5.448200225830078, "global_step": 25406, "epoch": 604} {"train_loss": -5.327848434448242, "global_step": 25407, "epoch": 604} {"train_loss": -5.358709812164307, "global_step": 25408, "epoch": 604} {"train_loss": -5.4026752426510765, "global_step": 25409, "epoch": 604, "val_loss": 67999.4140625} {"train_loss": -5.5516228675842285, "global_step": 25410, "epoch": 605} {"train_loss": -5.491762161254883, "global_step": 25411, "epoch": 605} {"train_loss": -5.554657936096191, "global_step": 25412, "epoch": 605} {"train_loss": -5.44985294342041, "global_step": 25413, "epoch": 605} {"train_loss": -5.427455902099609, "global_step": 25414, "epoch": 605} {"train_loss": -5.471029281616211, "global_step": 25415, "epoch": 605} {"train_loss": -5.4562482833862305, "global_step": 25416, "epoch": 605} {"train_loss": -5.397843837738037, "global_step": 25417, "epoch": 605} {"train_loss": -5.312584400177002, "global_step": 25418, "epoch": 605} {"train_loss": -5.378276824951172, "global_step": 25419, "epoch": 605} {"train_loss": -5.307224273681641, "global_step": 25420, "epoch": 605} {"train_loss": -5.452492713928223, "global_step": 25421, "epoch": 605} {"train_loss": -5.306048393249512, "global_step": 25422, "epoch": 605} {"train_loss": -5.353002548217773, "global_step": 25423, "epoch": 605} {"train_loss": -5.2594404220581055, "global_step": 25424, "epoch": 605} {"train_loss": -5.195918560028076, "global_step": 25425, "epoch": 605} {"train_loss": -5.500918865203857, "global_step": 25426, "epoch": 605} {"train_loss": -5.2776312828063965, "global_step": 25427, "epoch": 605} {"train_loss": -5.38145637512207, "global_step": 25428, "epoch": 605} {"train_loss": -5.488720893859863, "global_step": 25429, "epoch": 605} {"train_loss": -5.370462417602539, "global_step": 25430, "epoch": 605} {"train_loss": -5.498795509338379, "global_step": 25431, "epoch": 605} {"train_loss": -5.267886161804199, "global_step": 25432, "epoch": 605} {"train_loss": -5.266963958740234, "global_step": 25433, "epoch": 605} {"train_loss": -5.298440933227539, "global_step": 25434, "epoch": 605} {"train_loss": -5.389895439147949, "global_step": 25435, "epoch": 605} {"train_loss": -5.410394668579102, "global_step": 25436, "epoch": 605} {"train_loss": -5.47585916519165, "global_step": 25437, "epoch": 605} {"train_loss": -5.441645622253418, "global_step": 25438, "epoch": 605} {"train_loss": -5.243656158447266, "global_step": 25439, "epoch": 605} {"train_loss": -5.316828727722168, "global_step": 25440, "epoch": 605} {"train_loss": -5.447544574737549, "global_step": 25441, "epoch": 605} {"train_loss": -5.408013343811035, "global_step": 25442, "epoch": 605} {"train_loss": -5.306012153625488, "global_step": 25443, "epoch": 605} {"train_loss": -5.405983924865723, "global_step": 25444, "epoch": 605} {"train_loss": -5.351095676422119, "global_step": 25445, "epoch": 605} {"train_loss": -5.410760879516602, "global_step": 25446, "epoch": 605} {"train_loss": -5.430887699127197, "global_step": 25447, "epoch": 605} {"train_loss": -5.40680456161499, "global_step": 25448, "epoch": 605} {"train_loss": -5.50968074798584, "global_step": 25449, "epoch": 605} {"train_loss": -5.482270240783691, "global_step": 25450, "epoch": 605} {"train_loss": -5.394243739900135, "global_step": 25451, "epoch": 605, "val_loss": 68009.234375} {"train_loss": -5.393488883972168, "global_step": 25452, "epoch": 606} {"train_loss": -5.621852397918701, "global_step": 25453, "epoch": 606} {"train_loss": -5.500231742858887, "global_step": 25454, "epoch": 606} {"train_loss": -5.432405471801758, "global_step": 25455, "epoch": 606} {"train_loss": -5.364672660827637, "global_step": 25456, "epoch": 606} {"train_loss": -5.375485420227051, "global_step": 25457, "epoch": 606} {"train_loss": -5.304254531860352, "global_step": 25458, "epoch": 606} {"train_loss": -5.441333770751953, "global_step": 25459, "epoch": 606} {"train_loss": -5.411586284637451, "global_step": 25460, "epoch": 606} {"train_loss": -5.242584228515625, "global_step": 25461, "epoch": 606} {"train_loss": -5.4754533767700195, "global_step": 25462, "epoch": 606} {"train_loss": -5.449647426605225, "global_step": 25463, "epoch": 606} {"train_loss": -5.479365825653076, "global_step": 25464, "epoch": 606} {"train_loss": -5.396254539489746, "global_step": 25465, "epoch": 606} {"train_loss": -5.332978248596191, "global_step": 25466, "epoch": 606} {"train_loss": -5.380837440490723, "global_step": 25467, "epoch": 606} {"train_loss": -5.419132232666016, "global_step": 25468, "epoch": 606} {"train_loss": -5.444381237030029, "global_step": 25469, "epoch": 606} {"train_loss": -5.372183799743652, "global_step": 25470, "epoch": 606} {"train_loss": -5.514866828918457, "global_step": 25471, "epoch": 606} {"train_loss": -5.421976089477539, "global_step": 25472, "epoch": 606} {"train_loss": -5.421735763549805, "global_step": 25473, "epoch": 606} {"train_loss": -5.508089065551758, "global_step": 25474, "epoch": 606} {"train_loss": -5.540214538574219, "global_step": 25475, "epoch": 606} {"train_loss": -5.520520210266113, "global_step": 25476, "epoch": 606} {"train_loss": -5.413445472717285, "global_step": 25477, "epoch": 606} {"train_loss": -5.472902297973633, "global_step": 25478, "epoch": 606} {"train_loss": -5.488244533538818, "global_step": 25479, "epoch": 606} {"train_loss": -5.395949363708496, "global_step": 25480, "epoch": 606} {"train_loss": -5.370317459106445, "global_step": 25481, "epoch": 606} {"train_loss": -5.434313774108887, "global_step": 25482, "epoch": 606} {"train_loss": -5.373014450073242, "global_step": 25483, "epoch": 606} {"train_loss": -5.205482482910156, "global_step": 25484, "epoch": 606} {"train_loss": -5.441214084625244, "global_step": 25485, "epoch": 606} {"train_loss": -5.420433521270752, "global_step": 25486, "epoch": 606} {"train_loss": -5.4285736083984375, "global_step": 25487, "epoch": 606} {"train_loss": -5.395606994628906, "global_step": 25488, "epoch": 606} {"train_loss": -5.363699913024902, "global_step": 25489, "epoch": 606} {"train_loss": -5.475588321685791, "global_step": 25490, "epoch": 606} {"train_loss": -5.42744255065918, "global_step": 25491, "epoch": 606} {"train_loss": -5.353100776672363, "global_step": 25492, "epoch": 606} {"train_loss": -5.422235840842838, "global_step": 25493, "epoch": 606, "val_loss": 67445.359375} {"train_loss": -5.509308815002441, "global_step": 25494, "epoch": 607} {"train_loss": -5.430845260620117, "global_step": 25495, "epoch": 607} {"train_loss": -5.464707374572754, "global_step": 25496, "epoch": 607} {"train_loss": -5.376350402832031, "global_step": 25497, "epoch": 607} {"train_loss": -5.393113136291504, "global_step": 25498, "epoch": 607} {"train_loss": -5.4132080078125, "global_step": 25499, "epoch": 607} {"train_loss": -5.558762550354004, "global_step": 25500, "epoch": 607} {"train_loss": -5.398182392120361, "global_step": 25501, "epoch": 607} {"train_loss": -5.509538650512695, "global_step": 25502, "epoch": 607} {"train_loss": -5.530105113983154, "global_step": 25503, "epoch": 607} {"train_loss": -5.3380303382873535, "global_step": 25504, "epoch": 607} {"train_loss": -5.315083026885986, "global_step": 25505, "epoch": 607} {"train_loss": -5.29875373840332, "global_step": 25506, "epoch": 607} {"train_loss": -5.395984649658203, "global_step": 25507, "epoch": 607} {"train_loss": -5.389414310455322, "global_step": 25508, "epoch": 607} {"train_loss": -5.303677558898926, "global_step": 25509, "epoch": 607} {"train_loss": -5.370994567871094, "global_step": 25510, "epoch": 607} {"train_loss": -5.344850063323975, "global_step": 25511, "epoch": 607} {"train_loss": -5.427797317504883, "global_step": 25512, "epoch": 607} {"train_loss": -5.224056243896484, "global_step": 25513, "epoch": 607} {"train_loss": -5.461530685424805, "global_step": 25514, "epoch": 607} {"train_loss": -5.371417999267578, "global_step": 25515, "epoch": 607} {"train_loss": -5.234003067016602, "global_step": 25516, "epoch": 607} {"train_loss": -5.370416641235352, "global_step": 25517, "epoch": 607} {"train_loss": -5.49550724029541, "global_step": 25518, "epoch": 607} {"train_loss": -5.285516738891602, "global_step": 25519, "epoch": 607} {"train_loss": -5.455329895019531, "global_step": 25520, "epoch": 607} {"train_loss": -5.385310173034668, "global_step": 25521, "epoch": 607} {"train_loss": -5.295682907104492, "global_step": 25522, "epoch": 607} {"train_loss": -5.320343971252441, "global_step": 25523, "epoch": 607} {"train_loss": -5.475412845611572, "global_step": 25524, "epoch": 607} {"train_loss": -5.406229496002197, "global_step": 25525, "epoch": 607} {"train_loss": -5.305841445922852, "global_step": 25526, "epoch": 607} {"train_loss": -5.385343551635742, "global_step": 25527, "epoch": 607} {"train_loss": -5.469907760620117, "global_step": 25528, "epoch": 607} {"train_loss": -5.341808319091797, "global_step": 25529, "epoch": 607} {"train_loss": -5.406749725341797, "global_step": 25530, "epoch": 607} {"train_loss": -5.354888916015625, "global_step": 25531, "epoch": 607} {"train_loss": -5.3597636222839355, "global_step": 25532, "epoch": 607} {"train_loss": -5.419492721557617, "global_step": 25533, "epoch": 607} {"train_loss": -5.260857582092285, "global_step": 25534, "epoch": 607} {"train_loss": -5.383548566273281, "global_step": 25535, "epoch": 607, "val_loss": 67710.6875} {"train_loss": -5.50718879699707, "global_step": 25536, "epoch": 608} {"train_loss": -5.366359710693359, "global_step": 25537, "epoch": 608} {"train_loss": -5.576668739318848, "global_step": 25538, "epoch": 608} {"train_loss": -5.363927364349365, "global_step": 25539, "epoch": 608} {"train_loss": -5.467126369476318, "global_step": 25540, "epoch": 608} {"train_loss": -5.389238357543945, "global_step": 25541, "epoch": 608} {"train_loss": -5.469091415405273, "global_step": 25542, "epoch": 608} {"train_loss": -5.3198676109313965, "global_step": 25543, "epoch": 608} {"train_loss": -5.448281288146973, "global_step": 25544, "epoch": 608} {"train_loss": -5.317142963409424, "global_step": 25545, "epoch": 608} {"train_loss": -5.337954044342041, "global_step": 25546, "epoch": 608} {"train_loss": -5.353292465209961, "global_step": 25547, "epoch": 608} {"train_loss": -5.158558368682861, "global_step": 25548, "epoch": 608} {"train_loss": -5.3807525634765625, "global_step": 25549, "epoch": 608} {"train_loss": -5.156538963317871, "global_step": 25550, "epoch": 608} {"train_loss": -5.495779037475586, "global_step": 25551, "epoch": 608} {"train_loss": -5.2506608963012695, "global_step": 25552, "epoch": 608} {"train_loss": -5.2754926681518555, "global_step": 25553, "epoch": 608} {"train_loss": -5.366913795471191, "global_step": 25554, "epoch": 608} {"train_loss": -5.382803916931152, "global_step": 25555, "epoch": 608} {"train_loss": -5.386927604675293, "global_step": 25556, "epoch": 608} {"train_loss": -5.367142677307129, "global_step": 25557, "epoch": 608} {"train_loss": -5.288152694702148, "global_step": 25558, "epoch": 608} {"train_loss": -5.459704399108887, "global_step": 25559, "epoch": 608} {"train_loss": -5.2869110107421875, "global_step": 25560, "epoch": 608} {"train_loss": -5.487860679626465, "global_step": 25561, "epoch": 608} {"train_loss": -5.300230026245117, "global_step": 25562, "epoch": 608} {"train_loss": -5.368303298950195, "global_step": 25563, "epoch": 608} {"train_loss": -5.255826473236084, "global_step": 25564, "epoch": 608} {"train_loss": -5.3303022384643555, "global_step": 25565, "epoch": 608} {"train_loss": -5.340242385864258, "global_step": 25566, "epoch": 608} {"train_loss": -5.257293701171875, "global_step": 25567, "epoch": 608} {"train_loss": -5.430405616760254, "global_step": 25568, "epoch": 608} {"train_loss": -5.322793483734131, "global_step": 25569, "epoch": 608} {"train_loss": -5.290579795837402, "global_step": 25570, "epoch": 608} {"train_loss": -5.24370813369751, "global_step": 25571, "epoch": 608} {"train_loss": -5.316644668579102, "global_step": 25572, "epoch": 608} {"train_loss": -5.40096378326416, "global_step": 25573, "epoch": 608} {"train_loss": -5.29094123840332, "global_step": 25574, "epoch": 608} {"train_loss": -5.475231170654297, "global_step": 25575, "epoch": 608} {"train_loss": -5.222646713256836, "global_step": 25576, "epoch": 608} {"train_loss": -5.356936863490513, "global_step": 25577, "epoch": 608, "val_loss": 67499.90625} {"train_loss": -5.393304824829102, "global_step": 25578, "epoch": 609} {"train_loss": -5.4228105545043945, "global_step": 25579, "epoch": 609} {"train_loss": -5.307072639465332, "global_step": 25580, "epoch": 609} {"train_loss": -5.4127302169799805, "global_step": 25581, "epoch": 609} {"train_loss": -5.410891056060791, "global_step": 25582, "epoch": 609} {"train_loss": -5.422791004180908, "global_step": 25583, "epoch": 609} {"train_loss": -5.341231822967529, "global_step": 25584, "epoch": 609} {"train_loss": -5.483460903167725, "global_step": 25585, "epoch": 609} {"train_loss": -5.452841758728027, "global_step": 25586, "epoch": 609} {"train_loss": -5.642889022827148, "global_step": 25587, "epoch": 609} {"train_loss": -5.313165664672852, "global_step": 25588, "epoch": 609} {"train_loss": -5.408228397369385, "global_step": 25589, "epoch": 609} {"train_loss": -5.433842658996582, "global_step": 25590, "epoch": 609} {"train_loss": -5.410698890686035, "global_step": 25591, "epoch": 609} {"train_loss": -5.2513508796691895, "global_step": 25592, "epoch": 609} {"train_loss": -5.433112144470215, "global_step": 25593, "epoch": 609} {"train_loss": -5.434693336486816, "global_step": 25594, "epoch": 609} {"train_loss": -5.247580528259277, "global_step": 25595, "epoch": 609} {"train_loss": -5.388789176940918, "global_step": 25596, "epoch": 609} {"train_loss": -5.488752365112305, "global_step": 25597, "epoch": 609} {"train_loss": -5.383004665374756, "global_step": 25598, "epoch": 609} {"train_loss": -5.295584678649902, "global_step": 25599, "epoch": 609} {"train_loss": -5.397055149078369, "global_step": 25600, "epoch": 609} {"train_loss": -5.532705307006836, "global_step": 25601, "epoch": 609} {"train_loss": -5.112401485443115, "global_step": 25602, "epoch": 609} {"train_loss": -5.398698806762695, "global_step": 25603, "epoch": 609} {"train_loss": -5.3454999923706055, "global_step": 25604, "epoch": 609} {"train_loss": -5.437602519989014, "global_step": 25605, "epoch": 609} {"train_loss": -5.496730804443359, "global_step": 25606, "epoch": 609} {"train_loss": -5.3256330490112305, "global_step": 25607, "epoch": 609} {"train_loss": -5.343462944030762, "global_step": 25608, "epoch": 609} {"train_loss": -5.471316337585449, "global_step": 25609, "epoch": 609} {"train_loss": -5.305050849914551, "global_step": 25610, "epoch": 609} {"train_loss": -5.482697486877441, "global_step": 25611, "epoch": 609} {"train_loss": -5.464961051940918, "global_step": 25612, "epoch": 609} {"train_loss": -5.335395336151123, "global_step": 25613, "epoch": 609} {"train_loss": -5.337835311889648, "global_step": 25614, "epoch": 609} {"train_loss": -5.287487506866455, "global_step": 25615, "epoch": 609} {"train_loss": -5.334756374359131, "global_step": 25616, "epoch": 609} {"train_loss": -5.352777481079102, "global_step": 25617, "epoch": 609} {"train_loss": -5.286455154418945, "global_step": 25618, "epoch": 609} {"train_loss": -5.3896688506716774, "global_step": 25619, "epoch": 609, "val_loss": 67789.140625} {"train_loss": -5.575137138366699, "global_step": 25620, "epoch": 610} {"train_loss": -5.464554786682129, "global_step": 25621, "epoch": 610} {"train_loss": -5.294873237609863, "global_step": 25622, "epoch": 610} {"train_loss": -5.443586349487305, "global_step": 25623, "epoch": 610} {"train_loss": -5.342002868652344, "global_step": 25624, "epoch": 610} {"train_loss": -5.357937812805176, "global_step": 25625, "epoch": 610} {"train_loss": -5.426580905914307, "global_step": 25626, "epoch": 610} {"train_loss": -5.404338836669922, "global_step": 25627, "epoch": 610} {"train_loss": -5.445538520812988, "global_step": 25628, "epoch": 610} {"train_loss": -5.340782642364502, "global_step": 25629, "epoch": 610} {"train_loss": -5.4471940994262695, "global_step": 25630, "epoch": 610} {"train_loss": -5.475757598876953, "global_step": 25631, "epoch": 610} {"train_loss": -5.468289375305176, "global_step": 25632, "epoch": 610} {"train_loss": -5.3139777183532715, "global_step": 25633, "epoch": 610} {"train_loss": -5.463675498962402, "global_step": 25634, "epoch": 610} {"train_loss": -5.386540412902832, "global_step": 25635, "epoch": 610} {"train_loss": -5.360412120819092, "global_step": 25636, "epoch": 610} {"train_loss": -5.280529022216797, "global_step": 25637, "epoch": 610} {"train_loss": -5.525703430175781, "global_step": 25638, "epoch": 610} {"train_loss": -5.41490364074707, "global_step": 25639, "epoch": 610} {"train_loss": -5.181004524230957, "global_step": 25640, "epoch": 610} {"train_loss": -5.552897930145264, "global_step": 25641, "epoch": 610} {"train_loss": -5.4535932540893555, "global_step": 25642, "epoch": 610} {"train_loss": -5.362145900726318, "global_step": 25643, "epoch": 610} {"train_loss": -5.361163139343262, "global_step": 25644, "epoch": 610} {"train_loss": -5.345902919769287, "global_step": 25645, "epoch": 610} {"train_loss": -5.342051029205322, "global_step": 25646, "epoch": 610} {"train_loss": -5.542166709899902, "global_step": 25647, "epoch": 610} {"train_loss": -5.308742046356201, "global_step": 25648, "epoch": 610} {"train_loss": -5.489979267120361, "global_step": 25649, "epoch": 610} {"train_loss": -5.458126068115234, "global_step": 25650, "epoch": 610} {"train_loss": -5.300466537475586, "global_step": 25651, "epoch": 610} {"train_loss": -5.34535026550293, "global_step": 25652, "epoch": 610} {"train_loss": -5.430783271789551, "global_step": 25653, "epoch": 610} {"train_loss": -5.284862518310547, "global_step": 25654, "epoch": 610} {"train_loss": -5.434273719787598, "global_step": 25655, "epoch": 610} {"train_loss": -5.470914840698242, "global_step": 25656, "epoch": 610} {"train_loss": -5.468727111816406, "global_step": 25657, "epoch": 610} {"train_loss": -5.271624565124512, "global_step": 25658, "epoch": 610} {"train_loss": -5.363585472106934, "global_step": 25659, "epoch": 610} {"train_loss": -5.345795154571533, "global_step": 25660, "epoch": 610} {"train_loss": -5.400073516936529, "global_step": 25661, "epoch": 610, "val_loss": 67500.3515625} {"train_loss": -5.45835542678833, "global_step": 25662, "epoch": 611} {"train_loss": -5.3570709228515625, "global_step": 25663, "epoch": 611} {"train_loss": -5.435424327850342, "global_step": 25664, "epoch": 611} {"train_loss": -5.258515357971191, "global_step": 25665, "epoch": 611} {"train_loss": -5.4978485107421875, "global_step": 25666, "epoch": 611} {"train_loss": -5.531154632568359, "global_step": 25667, "epoch": 611} {"train_loss": -5.430665493011475, "global_step": 25668, "epoch": 611} {"train_loss": -5.261768341064453, "global_step": 25669, "epoch": 611} {"train_loss": -5.339893341064453, "global_step": 25670, "epoch": 611} {"train_loss": -5.489014625549316, "global_step": 25671, "epoch": 611} {"train_loss": -5.476782321929932, "global_step": 25672, "epoch": 611} {"train_loss": -5.520027160644531, "global_step": 25673, "epoch": 611} {"train_loss": -5.330253601074219, "global_step": 25674, "epoch": 611} {"train_loss": -5.427451133728027, "global_step": 25675, "epoch": 611} {"train_loss": -5.524796485900879, "global_step": 25676, "epoch": 611} {"train_loss": -5.423252105712891, "global_step": 25677, "epoch": 611} {"train_loss": -5.2942352294921875, "global_step": 25678, "epoch": 611} {"train_loss": -5.361923694610596, "global_step": 25679, "epoch": 611} {"train_loss": -5.471444129943848, "global_step": 25680, "epoch": 611} {"train_loss": -5.450677871704102, "global_step": 25681, "epoch": 611} {"train_loss": -5.420705795288086, "global_step": 25682, "epoch": 611} {"train_loss": -5.363115310668945, "global_step": 25683, "epoch": 611} {"train_loss": -5.327872276306152, "global_step": 25684, "epoch": 611} {"train_loss": -5.364833831787109, "global_step": 25685, "epoch": 611} {"train_loss": -5.299206733703613, "global_step": 25686, "epoch": 611} {"train_loss": -5.30756950378418, "global_step": 25687, "epoch": 611} {"train_loss": -5.5091633796691895, "global_step": 25688, "epoch": 611} {"train_loss": -5.394403457641602, "global_step": 25689, "epoch": 611} {"train_loss": -5.4136962890625, "global_step": 25690, "epoch": 611} {"train_loss": -5.370255470275879, "global_step": 25691, "epoch": 611} {"train_loss": -5.388179779052734, "global_step": 25692, "epoch": 611} {"train_loss": -5.339190483093262, "global_step": 25693, "epoch": 611} {"train_loss": -5.393097877502441, "global_step": 25694, "epoch": 611} {"train_loss": -5.377774238586426, "global_step": 25695, "epoch": 611} {"train_loss": -5.405834197998047, "global_step": 25696, "epoch": 611} {"train_loss": -5.457703113555908, "global_step": 25697, "epoch": 611} {"train_loss": -5.439227104187012, "global_step": 25698, "epoch": 611} {"train_loss": -5.3797101974487305, "global_step": 25699, "epoch": 611} {"train_loss": -5.419866561889648, "global_step": 25700, "epoch": 611} {"train_loss": -5.487110137939453, "global_step": 25701, "epoch": 611} {"train_loss": -5.272859573364258, "global_step": 25702, "epoch": 611} {"train_loss": -5.405050641014462, "global_step": 25703, "epoch": 611, "val_loss": 67903.125} {"train_loss": -5.377574443817139, "global_step": 25704, "epoch": 612} {"train_loss": -5.2876996994018555, "global_step": 25705, "epoch": 612} {"train_loss": -5.4510297775268555, "global_step": 25706, "epoch": 612} {"train_loss": -5.447846412658691, "global_step": 25707, "epoch": 612} {"train_loss": -5.450427055358887, "global_step": 25708, "epoch": 612} {"train_loss": -5.3124895095825195, "global_step": 25709, "epoch": 612} {"train_loss": -5.504509925842285, "global_step": 25710, "epoch": 612} {"train_loss": -5.418497085571289, "global_step": 25711, "epoch": 612} {"train_loss": -5.425461292266846, "global_step": 25712, "epoch": 612} {"train_loss": -5.311397075653076, "global_step": 25713, "epoch": 612} {"train_loss": -5.409523010253906, "global_step": 25714, "epoch": 612} {"train_loss": -5.4693121910095215, "global_step": 25715, "epoch": 612} {"train_loss": -5.41532564163208, "global_step": 25716, "epoch": 612} {"train_loss": -5.437748432159424, "global_step": 25717, "epoch": 612} {"train_loss": -5.332510948181152, "global_step": 25718, "epoch": 612} {"train_loss": -5.347069263458252, "global_step": 25719, "epoch": 612} {"train_loss": -5.44029426574707, "global_step": 25720, "epoch": 612} {"train_loss": -5.3477983474731445, "global_step": 25721, "epoch": 612} {"train_loss": -5.311352729797363, "global_step": 25722, "epoch": 612} {"train_loss": -5.446315288543701, "global_step": 25723, "epoch": 612} {"train_loss": -5.405427932739258, "global_step": 25724, "epoch": 612} {"train_loss": -5.466228008270264, "global_step": 25725, "epoch": 612} {"train_loss": -5.304878234863281, "global_step": 25726, "epoch": 612} {"train_loss": -5.465420722961426, "global_step": 25727, "epoch": 612} {"train_loss": -5.461057662963867, "global_step": 25728, "epoch": 612} {"train_loss": -5.39306640625, "global_step": 25729, "epoch": 612} {"train_loss": -5.4237284660339355, "global_step": 25730, "epoch": 612} {"train_loss": -5.396139621734619, "global_step": 25731, "epoch": 612} {"train_loss": -5.505040645599365, "global_step": 25732, "epoch": 612} {"train_loss": -5.329789161682129, "global_step": 25733, "epoch": 612} {"train_loss": -5.3003387451171875, "global_step": 25734, "epoch": 612} {"train_loss": -5.366137504577637, "global_step": 25735, "epoch": 612} {"train_loss": -5.424692153930664, "global_step": 25736, "epoch": 612} {"train_loss": -5.380931854248047, "global_step": 25737, "epoch": 612} {"train_loss": -5.3823347091674805, "global_step": 25738, "epoch": 612} {"train_loss": -5.469135761260986, "global_step": 25739, "epoch": 612} {"train_loss": -5.414073467254639, "global_step": 25740, "epoch": 612} {"train_loss": -5.305508613586426, "global_step": 25741, "epoch": 612} {"train_loss": -5.407095909118652, "global_step": 25742, "epoch": 612} {"train_loss": -5.374600410461426, "global_step": 25743, "epoch": 612} {"train_loss": -5.299155235290527, "global_step": 25744, "epoch": 612} {"train_loss": -5.392745812733968, "global_step": 25745, "epoch": 612, "val_loss": 67689.4375} {"train_loss": -5.370048522949219, "global_step": 25746, "epoch": 613} {"train_loss": -5.3729143142700195, "global_step": 25747, "epoch": 613} {"train_loss": -5.397319793701172, "global_step": 25748, "epoch": 613} {"train_loss": -5.405712127685547, "global_step": 25749, "epoch": 613} {"train_loss": -5.410552978515625, "global_step": 25750, "epoch": 613} {"train_loss": -5.409284591674805, "global_step": 25751, "epoch": 613} {"train_loss": -5.416189193725586, "global_step": 25752, "epoch": 613} {"train_loss": -5.243671417236328, "global_step": 25753, "epoch": 613} {"train_loss": -5.384812355041504, "global_step": 25754, "epoch": 613} {"train_loss": -5.443279266357422, "global_step": 25755, "epoch": 613} {"train_loss": -5.314929962158203, "global_step": 25756, "epoch": 613} {"train_loss": -5.466756343841553, "global_step": 25757, "epoch": 613} {"train_loss": -5.476648330688477, "global_step": 25758, "epoch": 613} {"train_loss": -5.282909393310547, "global_step": 25759, "epoch": 613} {"train_loss": -5.356523513793945, "global_step": 25760, "epoch": 613} {"train_loss": -5.562808036804199, "global_step": 25761, "epoch": 613} {"train_loss": -5.460163116455078, "global_step": 25762, "epoch": 613} {"train_loss": -5.2829508781433105, "global_step": 25763, "epoch": 613} {"train_loss": -5.517848014831543, "global_step": 25764, "epoch": 613} {"train_loss": -5.335360050201416, "global_step": 25765, "epoch": 613} {"train_loss": -5.344324111938477, "global_step": 25766, "epoch": 613} {"train_loss": -5.58030891418457, "global_step": 25767, "epoch": 613} {"train_loss": -5.41654109954834, "global_step": 25768, "epoch": 613} {"train_loss": -5.493793487548828, "global_step": 25769, "epoch": 613} {"train_loss": -5.417623043060303, "global_step": 25770, "epoch": 613} {"train_loss": -5.385907173156738, "global_step": 25771, "epoch": 613} {"train_loss": -5.592955589294434, "global_step": 25772, "epoch": 613} {"train_loss": -5.330679893493652, "global_step": 25773, "epoch": 613} {"train_loss": -5.348430156707764, "global_step": 25774, "epoch": 613} {"train_loss": -5.44483757019043, "global_step": 25775, "epoch": 613} {"train_loss": -5.427999019622803, "global_step": 25776, "epoch": 613} {"train_loss": -5.485074996948242, "global_step": 25777, "epoch": 613} {"train_loss": -5.355277061462402, "global_step": 25778, "epoch": 613} {"train_loss": -5.398691177368164, "global_step": 25779, "epoch": 613} {"train_loss": -5.3396477699279785, "global_step": 25780, "epoch": 613} {"train_loss": -5.57210636138916, "global_step": 25781, "epoch": 613} {"train_loss": -5.349346160888672, "global_step": 25782, "epoch": 613} {"train_loss": -5.324371337890625, "global_step": 25783, "epoch": 613} {"train_loss": -5.504606246948242, "global_step": 25784, "epoch": 613} {"train_loss": -5.416189193725586, "global_step": 25785, "epoch": 613} {"train_loss": -5.415970325469971, "global_step": 25786, "epoch": 613} {"train_loss": -5.410384859357562, "global_step": 25787, "epoch": 613, "val_loss": 67535.9765625} {"train_loss": -5.511025905609131, "global_step": 25788, "epoch": 614} {"train_loss": -5.313584327697754, "global_step": 25789, "epoch": 614} {"train_loss": -5.474764823913574, "global_step": 25790, "epoch": 614} {"train_loss": -5.4753265380859375, "global_step": 25791, "epoch": 614} {"train_loss": -5.532802581787109, "global_step": 25792, "epoch": 614} {"train_loss": -5.43940544128418, "global_step": 25793, "epoch": 614} {"train_loss": -5.432899475097656, "global_step": 25794, "epoch": 614} {"train_loss": -5.317220687866211, "global_step": 25795, "epoch": 614} {"train_loss": -5.443045616149902, "global_step": 25796, "epoch": 614} {"train_loss": -5.265605926513672, "global_step": 25797, "epoch": 614} {"train_loss": -5.512304782867432, "global_step": 25798, "epoch": 614} {"train_loss": -5.297159194946289, "global_step": 25799, "epoch": 614} {"train_loss": -5.3122358322143555, "global_step": 25800, "epoch": 614} {"train_loss": -5.3482537269592285, "global_step": 25801, "epoch": 614} {"train_loss": -5.408459663391113, "global_step": 25802, "epoch": 614} {"train_loss": -5.449751853942871, "global_step": 25803, "epoch": 614} {"train_loss": -5.364260673522949, "global_step": 25804, "epoch": 614} {"train_loss": -5.466083526611328, "global_step": 25805, "epoch": 614} {"train_loss": -5.449698448181152, "global_step": 25806, "epoch": 614} {"train_loss": -5.2335100173950195, "global_step": 25807, "epoch": 614} {"train_loss": -5.559643745422363, "global_step": 25808, "epoch": 614} {"train_loss": -5.409448146820068, "global_step": 25809, "epoch": 614} {"train_loss": -5.409175395965576, "global_step": 25810, "epoch": 614} {"train_loss": -5.482763290405273, "global_step": 25811, "epoch": 614} {"train_loss": -5.481436729431152, "global_step": 25812, "epoch": 614} {"train_loss": -5.385702133178711, "global_step": 25813, "epoch": 614} {"train_loss": -5.339035987854004, "global_step": 25814, "epoch": 614} {"train_loss": -5.4483723640441895, "global_step": 25815, "epoch": 614} {"train_loss": -5.546124458312988, "global_step": 25816, "epoch": 614} {"train_loss": -5.482912063598633, "global_step": 25817, "epoch": 614} {"train_loss": -5.4098968505859375, "global_step": 25818, "epoch": 614} {"train_loss": -5.47886848449707, "global_step": 25819, "epoch": 614} {"train_loss": -5.439381122589111, "global_step": 25820, "epoch": 614} {"train_loss": -5.516838550567627, "global_step": 25821, "epoch": 614} {"train_loss": -5.445063591003418, "global_step": 25822, "epoch": 614} {"train_loss": -5.287036895751953, "global_step": 25823, "epoch": 614} {"train_loss": -5.301815986633301, "global_step": 25824, "epoch": 614} {"train_loss": -5.429190635681152, "global_step": 25825, "epoch": 614} {"train_loss": -5.337775707244873, "global_step": 25826, "epoch": 614} {"train_loss": -5.382565021514893, "global_step": 25827, "epoch": 614} {"train_loss": -5.514369010925293, "global_step": 25828, "epoch": 614} {"train_loss": -5.4152776173182895, "global_step": 25829, "epoch": 614, "val_loss": 67625.6484375} {"train_loss": -5.40517520904541, "global_step": 25830, "epoch": 615} {"train_loss": -5.412618637084961, "global_step": 25831, "epoch": 615} {"train_loss": -5.41436767578125, "global_step": 25832, "epoch": 615} {"train_loss": -5.4197516441345215, "global_step": 25833, "epoch": 615} {"train_loss": -5.344149589538574, "global_step": 25834, "epoch": 615} {"train_loss": -5.4696149826049805, "global_step": 25835, "epoch": 615} {"train_loss": -5.3888139724731445, "global_step": 25836, "epoch": 615} {"train_loss": -5.44133186340332, "global_step": 25837, "epoch": 615} {"train_loss": -5.2947492599487305, "global_step": 25838, "epoch": 615} {"train_loss": -5.322333335876465, "global_step": 25839, "epoch": 615} {"train_loss": -5.443802833557129, "global_step": 25840, "epoch": 615} {"train_loss": -5.446099758148193, "global_step": 25841, "epoch": 615} {"train_loss": -5.418858528137207, "global_step": 25842, "epoch": 615} {"train_loss": -5.44147253036499, "global_step": 25843, "epoch": 615} {"train_loss": -5.516506195068359, "global_step": 25844, "epoch": 615} {"train_loss": -5.54724645614624, "global_step": 25845, "epoch": 615} {"train_loss": -5.444061279296875, "global_step": 25846, "epoch": 615} {"train_loss": -5.37283992767334, "global_step": 25847, "epoch": 615} {"train_loss": -5.366069316864014, "global_step": 25848, "epoch": 615} {"train_loss": -5.491805076599121, "global_step": 25849, "epoch": 615} {"train_loss": -5.391222953796387, "global_step": 25850, "epoch": 615} {"train_loss": -5.525722503662109, "global_step": 25851, "epoch": 615} {"train_loss": -5.404790878295898, "global_step": 25852, "epoch": 615} {"train_loss": -5.3684282302856445, "global_step": 25853, "epoch": 615} {"train_loss": -5.35557746887207, "global_step": 25854, "epoch": 615} {"train_loss": -5.3383588790893555, "global_step": 25855, "epoch": 615} {"train_loss": -5.369062423706055, "global_step": 25856, "epoch": 615} {"train_loss": -5.261418342590332, "global_step": 25857, "epoch": 615} {"train_loss": -5.384599208831787, "global_step": 25858, "epoch": 615} {"train_loss": -5.4611077308654785, "global_step": 25859, "epoch": 615} {"train_loss": -5.301994323730469, "global_step": 25860, "epoch": 615} {"train_loss": -5.480016708374023, "global_step": 25861, "epoch": 615} {"train_loss": -5.515004634857178, "global_step": 25862, "epoch": 615} {"train_loss": -5.577339172363281, "global_step": 25863, "epoch": 615} {"train_loss": -5.52046012878418, "global_step": 25864, "epoch": 615} {"train_loss": -5.45754861831665, "global_step": 25865, "epoch": 615} {"train_loss": -5.493558883666992, "global_step": 25866, "epoch": 615} {"train_loss": -5.432523250579834, "global_step": 25867, "epoch": 615} {"train_loss": -5.36652946472168, "global_step": 25868, "epoch": 615} {"train_loss": -5.396384239196777, "global_step": 25869, "epoch": 615} {"train_loss": -5.488944053649902, "global_step": 25870, "epoch": 615} {"train_loss": -5.420763787769136, "global_step": 25871, "epoch": 615, "val_loss": 67721.109375} {"train_loss": -5.349034786224365, "global_step": 25872, "epoch": 616} {"train_loss": -5.486093044281006, "global_step": 25873, "epoch": 616} {"train_loss": -5.465420722961426, "global_step": 25874, "epoch": 616} {"train_loss": -5.393640518188477, "global_step": 25875, "epoch": 616} {"train_loss": -5.478241443634033, "global_step": 25876, "epoch": 616} {"train_loss": -5.389145374298096, "global_step": 25877, "epoch": 616} {"train_loss": -5.593592643737793, "global_step": 25878, "epoch": 616} {"train_loss": -5.425209045410156, "global_step": 25879, "epoch": 616} {"train_loss": -5.292271614074707, "global_step": 25880, "epoch": 616} {"train_loss": -5.366883754730225, "global_step": 25881, "epoch": 616} {"train_loss": -5.399670600891113, "global_step": 25882, "epoch": 616} {"train_loss": -5.422942161560059, "global_step": 25883, "epoch": 616} {"train_loss": -5.301515102386475, "global_step": 25884, "epoch": 616} {"train_loss": -5.339210510253906, "global_step": 25885, "epoch": 616} {"train_loss": -5.436640739440918, "global_step": 25886, "epoch": 616} {"train_loss": -5.415103912353516, "global_step": 25887, "epoch": 616} {"train_loss": -5.320782661437988, "global_step": 25888, "epoch": 616} {"train_loss": -5.450170516967773, "global_step": 25889, "epoch": 616} {"train_loss": -5.347546577453613, "global_step": 25890, "epoch": 616} {"train_loss": -5.286396503448486, "global_step": 25891, "epoch": 616} {"train_loss": -5.311159133911133, "global_step": 25892, "epoch": 616} {"train_loss": -5.251520156860352, "global_step": 25893, "epoch": 616} {"train_loss": -5.45916748046875, "global_step": 25894, "epoch": 616} {"train_loss": -5.313171863555908, "global_step": 25895, "epoch": 616} {"train_loss": -5.3384246826171875, "global_step": 25896, "epoch": 616} {"train_loss": -5.358315467834473, "global_step": 25897, "epoch": 616} {"train_loss": -5.544219017028809, "global_step": 25898, "epoch": 616} {"train_loss": -5.348746299743652, "global_step": 25899, "epoch": 616} {"train_loss": -5.357556343078613, "global_step": 25900, "epoch": 616} {"train_loss": -5.327199935913086, "global_step": 25901, "epoch": 616} {"train_loss": -5.562500953674316, "global_step": 25902, "epoch": 616} {"train_loss": -5.37960147857666, "global_step": 25903, "epoch": 616} {"train_loss": -5.385459899902344, "global_step": 25904, "epoch": 616} {"train_loss": -5.349344253540039, "global_step": 25905, "epoch": 616} {"train_loss": -5.416027069091797, "global_step": 25906, "epoch": 616} {"train_loss": -5.358852386474609, "global_step": 25907, "epoch": 616} {"train_loss": -5.379205703735352, "global_step": 25908, "epoch": 616} {"train_loss": -5.44327449798584, "global_step": 25909, "epoch": 616} {"train_loss": -5.521451950073242, "global_step": 25910, "epoch": 616} {"train_loss": -5.472769737243652, "global_step": 25911, "epoch": 616} {"train_loss": -5.472356796264648, "global_step": 25912, "epoch": 616} {"train_loss": -5.400705019632976, "global_step": 25913, "epoch": 616, "val_loss": 67686.328125} {"train_loss": -5.449006080627441, "global_step": 25914, "epoch": 617} {"train_loss": -5.512640476226807, "global_step": 25915, "epoch": 617} {"train_loss": -5.471786022186279, "global_step": 25916, "epoch": 617} {"train_loss": -5.351545810699463, "global_step": 25917, "epoch": 617} {"train_loss": -5.42380952835083, "global_step": 25918, "epoch": 617} {"train_loss": -5.614470958709717, "global_step": 25919, "epoch": 617} {"train_loss": -5.3238115310668945, "global_step": 25920, "epoch": 617} {"train_loss": -5.3032755851745605, "global_step": 25921, "epoch": 617} {"train_loss": -5.463624954223633, "global_step": 25922, "epoch": 617} {"train_loss": -5.3665008544921875, "global_step": 25923, "epoch": 617} {"train_loss": -5.306938648223877, "global_step": 25924, "epoch": 617} {"train_loss": -5.325826644897461, "global_step": 25925, "epoch": 617} {"train_loss": -5.292006969451904, "global_step": 25926, "epoch": 617} {"train_loss": -5.46683406829834, "global_step": 25927, "epoch": 617} {"train_loss": -5.276452541351318, "global_step": 25928, "epoch": 617} {"train_loss": -5.362038612365723, "global_step": 25929, "epoch": 617} {"train_loss": -5.404869556427002, "global_step": 25930, "epoch": 617} {"train_loss": -5.328109264373779, "global_step": 25931, "epoch": 617} {"train_loss": -5.372970104217529, "global_step": 25932, "epoch": 617} {"train_loss": -5.407651901245117, "global_step": 25933, "epoch": 617} {"train_loss": -5.352206707000732, "global_step": 25934, "epoch": 617} {"train_loss": -5.495945930480957, "global_step": 25935, "epoch": 617} {"train_loss": -5.388011932373047, "global_step": 25936, "epoch": 617} {"train_loss": -5.462274551391602, "global_step": 25937, "epoch": 617} {"train_loss": -5.5650739669799805, "global_step": 25938, "epoch": 617} {"train_loss": -5.485373497009277, "global_step": 25939, "epoch": 617} {"train_loss": -5.388406276702881, "global_step": 25940, "epoch": 617} {"train_loss": -5.422824859619141, "global_step": 25941, "epoch": 617} {"train_loss": -5.392222881317139, "global_step": 25942, "epoch": 617} {"train_loss": -5.432730197906494, "global_step": 25943, "epoch": 617} {"train_loss": -5.433523654937744, "global_step": 25944, "epoch": 617} {"train_loss": -5.536226272583008, "global_step": 25945, "epoch": 617} {"train_loss": -5.434826374053955, "global_step": 25946, "epoch": 617} {"train_loss": -5.486250877380371, "global_step": 25947, "epoch": 617} {"train_loss": -5.415088653564453, "global_step": 25948, "epoch": 617} {"train_loss": -5.382163047790527, "global_step": 25949, "epoch": 617} {"train_loss": -5.34475040435791, "global_step": 25950, "epoch": 617} {"train_loss": -5.406293869018555, "global_step": 25951, "epoch": 617} {"train_loss": -5.383033752441406, "global_step": 25952, "epoch": 617} {"train_loss": -5.411883354187012, "global_step": 25953, "epoch": 617} {"train_loss": -5.355428695678711, "global_step": 25954, "epoch": 617} {"train_loss": -5.412282693953741, "global_step": 25955, "epoch": 617, "val_loss": 67671.3046875} {"train_loss": -5.555252552032471, "global_step": 25956, "epoch": 618} {"train_loss": -5.332728385925293, "global_step": 25957, "epoch": 618} {"train_loss": -5.352369785308838, "global_step": 25958, "epoch": 618} {"train_loss": -5.357880592346191, "global_step": 25959, "epoch": 618} {"train_loss": -5.366761207580566, "global_step": 25960, "epoch": 618} {"train_loss": -5.328244686126709, "global_step": 25961, "epoch": 618} {"train_loss": -5.494791507720947, "global_step": 25962, "epoch": 618} {"train_loss": -5.4831438064575195, "global_step": 25963, "epoch": 618} {"train_loss": -5.391176700592041, "global_step": 25964, "epoch": 618} {"train_loss": -5.389167785644531, "global_step": 25965, "epoch": 618} {"train_loss": -5.515079975128174, "global_step": 25966, "epoch": 618} {"train_loss": -5.564802169799805, "global_step": 25967, "epoch": 618} {"train_loss": -5.391936779022217, "global_step": 25968, "epoch": 618} {"train_loss": -5.411421775817871, "global_step": 25969, "epoch": 618} {"train_loss": -5.325156211853027, "global_step": 25970, "epoch": 618} {"train_loss": -5.353216648101807, "global_step": 25971, "epoch": 618} {"train_loss": -5.430610656738281, "global_step": 25972, "epoch": 618} {"train_loss": -5.234541893005371, "global_step": 25973, "epoch": 618} {"train_loss": -5.486752033233643, "global_step": 25974, "epoch": 618} {"train_loss": -5.2889862060546875, "global_step": 25975, "epoch": 618} {"train_loss": -5.182363510131836, "global_step": 25976, "epoch": 618} {"train_loss": -5.422427177429199, "global_step": 25977, "epoch": 618} {"train_loss": -5.340503215789795, "global_step": 25978, "epoch": 618} {"train_loss": -5.4453887939453125, "global_step": 25979, "epoch": 618} {"train_loss": -5.189115524291992, "global_step": 25980, "epoch": 618} {"train_loss": -5.46330451965332, "global_step": 25981, "epoch": 618} {"train_loss": -5.342312812805176, "global_step": 25982, "epoch": 618} {"train_loss": -5.402966499328613, "global_step": 25983, "epoch": 618} {"train_loss": -5.42378568649292, "global_step": 25984, "epoch": 618} {"train_loss": -5.398473739624023, "global_step": 25985, "epoch": 618} {"train_loss": -5.362766265869141, "global_step": 25986, "epoch": 618} {"train_loss": -5.44924783706665, "global_step": 25987, "epoch": 618} {"train_loss": -5.326269149780273, "global_step": 25988, "epoch": 618} {"train_loss": -5.422905921936035, "global_step": 25989, "epoch": 618} {"train_loss": -5.429032325744629, "global_step": 25990, "epoch": 618} {"train_loss": -5.4049882888793945, "global_step": 25991, "epoch": 618} {"train_loss": -5.386309623718262, "global_step": 25992, "epoch": 618} {"train_loss": -5.341800689697266, "global_step": 25993, "epoch": 618} {"train_loss": -5.404224395751953, "global_step": 25994, "epoch": 618} {"train_loss": -5.332311153411865, "global_step": 25995, "epoch": 618} {"train_loss": -5.463819980621338, "global_step": 25996, "epoch": 618} {"train_loss": -5.391015540985834, "global_step": 25997, "epoch": 618, "val_loss": 67653.171875} {"train_loss": -5.634593963623047, "global_step": 25998, "epoch": 619} {"train_loss": -5.402904510498047, "global_step": 25999, "epoch": 619} {"train_loss": -5.351346969604492, "global_step": 26000, "epoch": 619} {"train_loss": -5.454477310180664, "global_step": 26001, "epoch": 619} {"train_loss": -5.373895645141602, "global_step": 26002, "epoch": 619} {"train_loss": -5.39019775390625, "global_step": 26003, "epoch": 619} {"train_loss": -5.531763076782227, "global_step": 26004, "epoch": 619} {"train_loss": -5.275707244873047, "global_step": 26005, "epoch": 619} {"train_loss": -5.518806457519531, "global_step": 26006, "epoch": 619} {"train_loss": -5.46467924118042, "global_step": 26007, "epoch": 619} {"train_loss": -5.362125396728516, "global_step": 26008, "epoch": 619} {"train_loss": -5.428290367126465, "global_step": 26009, "epoch": 619} {"train_loss": -5.436489105224609, "global_step": 26010, "epoch": 619} {"train_loss": -5.361464500427246, "global_step": 26011, "epoch": 619} {"train_loss": -5.543704032897949, "global_step": 26012, "epoch": 619} {"train_loss": -5.241029739379883, "global_step": 26013, "epoch": 619} {"train_loss": -5.397465229034424, "global_step": 26014, "epoch": 619} {"train_loss": -5.456620693206787, "global_step": 26015, "epoch": 619} {"train_loss": -5.3900465965271, "global_step": 26016, "epoch": 619} {"train_loss": -5.444669723510742, "global_step": 26017, "epoch": 619} {"train_loss": -5.464616298675537, "global_step": 26018, "epoch": 619} {"train_loss": -5.30525016784668, "global_step": 26019, "epoch": 619} {"train_loss": -5.516846656799316, "global_step": 26020, "epoch": 619} {"train_loss": -5.339271068572998, "global_step": 26021, "epoch": 619} {"train_loss": -5.414432525634766, "global_step": 26022, "epoch": 619} {"train_loss": -5.56740665435791, "global_step": 26023, "epoch": 619} {"train_loss": -5.434686660766602, "global_step": 26024, "epoch": 619} {"train_loss": -5.485124588012695, "global_step": 26025, "epoch": 619} {"train_loss": -5.382457256317139, "global_step": 26026, "epoch": 619} {"train_loss": -5.276281833648682, "global_step": 26027, "epoch": 619} {"train_loss": -5.315446853637695, "global_step": 26028, "epoch": 619} {"train_loss": -5.529733180999756, "global_step": 26029, "epoch": 619} {"train_loss": -5.520610809326172, "global_step": 26030, "epoch": 619} {"train_loss": -5.426039695739746, "global_step": 26031, "epoch": 619} {"train_loss": -5.445798397064209, "global_step": 26032, "epoch": 619} {"train_loss": -5.350064277648926, "global_step": 26033, "epoch": 619} {"train_loss": -5.461021423339844, "global_step": 26034, "epoch": 619} {"train_loss": -5.555525779724121, "global_step": 26035, "epoch": 619} {"train_loss": -5.360414505004883, "global_step": 26036, "epoch": 619} {"train_loss": -5.466897964477539, "global_step": 26037, "epoch": 619} {"train_loss": -5.437596321105957, "global_step": 26038, "epoch": 619} {"train_loss": -5.428291127795265, "global_step": 26039, "epoch": 619, "val_loss": 67671.6328125} {"train_loss": -5.533207893371582, "global_step": 26040, "epoch": 620} {"train_loss": -5.516822814941406, "global_step": 26041, "epoch": 620} {"train_loss": -5.185014247894287, "global_step": 26042, "epoch": 620} {"train_loss": -5.445286750793457, "global_step": 26043, "epoch": 620} {"train_loss": -5.4451141357421875, "global_step": 26044, "epoch": 620} {"train_loss": -5.372670650482178, "global_step": 26045, "epoch": 620} {"train_loss": -5.6328229904174805, "global_step": 26046, "epoch": 620} {"train_loss": -5.361930847167969, "global_step": 26047, "epoch": 620} {"train_loss": -5.282840728759766, "global_step": 26048, "epoch": 620} {"train_loss": -5.465357303619385, "global_step": 26049, "epoch": 620} {"train_loss": -5.443039894104004, "global_step": 26050, "epoch": 620} {"train_loss": -5.272120952606201, "global_step": 26051, "epoch": 620} {"train_loss": -5.43809700012207, "global_step": 26052, "epoch": 620} {"train_loss": -5.3716959953308105, "global_step": 26053, "epoch": 620} {"train_loss": -5.2885284423828125, "global_step": 26054, "epoch": 620} {"train_loss": -5.295046806335449, "global_step": 26055, "epoch": 620} {"train_loss": -5.48628044128418, "global_step": 26056, "epoch": 620} {"train_loss": -5.388965129852295, "global_step": 26057, "epoch": 620} {"train_loss": -5.456686973571777, "global_step": 26058, "epoch": 620} {"train_loss": -5.520092010498047, "global_step": 26059, "epoch": 620} {"train_loss": -5.568092346191406, "global_step": 26060, "epoch": 620} {"train_loss": -5.437180519104004, "global_step": 26061, "epoch": 620} {"train_loss": -5.386754035949707, "global_step": 26062, "epoch": 620} {"train_loss": -5.386970520019531, "global_step": 26063, "epoch": 620} {"train_loss": -5.433586597442627, "global_step": 26064, "epoch": 620} {"train_loss": -5.480161666870117, "global_step": 26065, "epoch": 620} {"train_loss": -5.322605133056641, "global_step": 26066, "epoch": 620} {"train_loss": -5.508795261383057, "global_step": 26067, "epoch": 620} {"train_loss": -5.527928352355957, "global_step": 26068, "epoch": 620} {"train_loss": -5.440746307373047, "global_step": 26069, "epoch": 620} {"train_loss": -5.340134143829346, "global_step": 26070, "epoch": 620} {"train_loss": -5.3904290199279785, "global_step": 26071, "epoch": 620} {"train_loss": -5.445636749267578, "global_step": 26072, "epoch": 620} {"train_loss": -5.480101585388184, "global_step": 26073, "epoch": 620} {"train_loss": -5.472280502319336, "global_step": 26074, "epoch": 620} {"train_loss": -5.537360668182373, "global_step": 26075, "epoch": 620} {"train_loss": -5.380214691162109, "global_step": 26076, "epoch": 620} {"train_loss": -5.397775650024414, "global_step": 26077, "epoch": 620} {"train_loss": -5.3393096923828125, "global_step": 26078, "epoch": 620} {"train_loss": -5.394722938537598, "global_step": 26079, "epoch": 620} {"train_loss": -5.2587738037109375, "global_step": 26080, "epoch": 620} {"train_loss": -5.416714554741269, "global_step": 26081, "epoch": 620, "val_loss": 68152.7421875} {"train_loss": -5.542632579803467, "global_step": 26082, "epoch": 621} {"train_loss": -5.471014022827148, "global_step": 26083, "epoch": 621} {"train_loss": -5.550230503082275, "global_step": 26084, "epoch": 621} {"train_loss": -5.436825275421143, "global_step": 26085, "epoch": 621} {"train_loss": -5.412880897521973, "global_step": 26086, "epoch": 621} {"train_loss": -5.46915340423584, "global_step": 26087, "epoch": 621} {"train_loss": -5.179660797119141, "global_step": 26088, "epoch": 621} {"train_loss": -5.394349098205566, "global_step": 26089, "epoch": 621} {"train_loss": -5.499812126159668, "global_step": 26090, "epoch": 621} {"train_loss": -5.300983905792236, "global_step": 26091, "epoch": 621} {"train_loss": -5.324583530426025, "global_step": 26092, "epoch": 621} {"train_loss": -5.4711456298828125, "global_step": 26093, "epoch": 621} {"train_loss": -5.257256031036377, "global_step": 26094, "epoch": 621} {"train_loss": -5.426454067230225, "global_step": 26095, "epoch": 621} {"train_loss": -5.312527656555176, "global_step": 26096, "epoch": 621} {"train_loss": -5.518758773803711, "global_step": 26097, "epoch": 621} {"train_loss": -5.447482109069824, "global_step": 26098, "epoch": 621} {"train_loss": -5.376348495483398, "global_step": 26099, "epoch": 621} {"train_loss": -5.386509418487549, "global_step": 26100, "epoch": 621} {"train_loss": -5.413098335266113, "global_step": 26101, "epoch": 621} {"train_loss": -5.444465637207031, "global_step": 26102, "epoch": 621} {"train_loss": -5.358778953552246, "global_step": 26103, "epoch": 621} {"train_loss": -5.473005294799805, "global_step": 26104, "epoch": 621} {"train_loss": -5.4960174560546875, "global_step": 26105, "epoch": 621} {"train_loss": -5.362397193908691, "global_step": 26106, "epoch": 621} {"train_loss": -5.401885032653809, "global_step": 26107, "epoch": 621} {"train_loss": -5.360805511474609, "global_step": 26108, "epoch": 621} {"train_loss": -5.446393966674805, "global_step": 26109, "epoch": 621} {"train_loss": -5.388180732727051, "global_step": 26110, "epoch": 621} {"train_loss": -5.253213405609131, "global_step": 26111, "epoch": 621} {"train_loss": -5.380413055419922, "global_step": 26112, "epoch": 621} {"train_loss": -5.568624973297119, "global_step": 26113, "epoch": 621} {"train_loss": -5.3085856437683105, "global_step": 26114, "epoch": 621} {"train_loss": -5.48641300201416, "global_step": 26115, "epoch": 621} {"train_loss": -5.296988487243652, "global_step": 26116, "epoch": 621} {"train_loss": -5.375617980957031, "global_step": 26117, "epoch": 621} {"train_loss": -5.411236763000488, "global_step": 26118, "epoch": 621} {"train_loss": -5.4014081954956055, "global_step": 26119, "epoch": 621} {"train_loss": -5.444591522216797, "global_step": 26120, "epoch": 621} {"train_loss": -5.290338039398193, "global_step": 26121, "epoch": 621} {"train_loss": -5.309079170227051, "global_step": 26122, "epoch": 621} {"train_loss": -5.400212446848552, "global_step": 26123, "epoch": 621, "val_loss": 68237.0} {"train_loss": -5.30714750289917, "global_step": 26124, "epoch": 622} {"train_loss": -5.403058052062988, "global_step": 26125, "epoch": 622} {"train_loss": -5.438797950744629, "global_step": 26126, "epoch": 622} {"train_loss": -5.332963466644287, "global_step": 26127, "epoch": 622} {"train_loss": -5.505193710327148, "global_step": 26128, "epoch": 622} {"train_loss": -5.435696125030518, "global_step": 26129, "epoch": 622} {"train_loss": -5.3453474044799805, "global_step": 26130, "epoch": 622} {"train_loss": -5.4592437744140625, "global_step": 26131, "epoch": 622} {"train_loss": -5.454442977905273, "global_step": 26132, "epoch": 622} {"train_loss": -5.414153575897217, "global_step": 26133, "epoch": 622} {"train_loss": -5.367408752441406, "global_step": 26134, "epoch": 622} {"train_loss": -5.42935848236084, "global_step": 26135, "epoch": 622} {"train_loss": -5.486262321472168, "global_step": 26136, "epoch": 622} {"train_loss": -5.412726402282715, "global_step": 26137, "epoch": 622} {"train_loss": -5.217878341674805, "global_step": 26138, "epoch": 622} {"train_loss": -5.418728828430176, "global_step": 26139, "epoch": 622} {"train_loss": -5.525465488433838, "global_step": 26140, "epoch": 622} {"train_loss": -5.340582370758057, "global_step": 26141, "epoch": 622} {"train_loss": -5.635933876037598, "global_step": 26142, "epoch": 622} {"train_loss": -5.417810440063477, "global_step": 26143, "epoch": 622} {"train_loss": -5.401215553283691, "global_step": 26144, "epoch": 622} {"train_loss": -5.418234825134277, "global_step": 26145, "epoch": 622} {"train_loss": -5.4819488525390625, "global_step": 26146, "epoch": 622} {"train_loss": -5.3945207595825195, "global_step": 26147, "epoch": 622} {"train_loss": -5.410879135131836, "global_step": 26148, "epoch": 622} {"train_loss": -5.21832275390625, "global_step": 26149, "epoch": 622} {"train_loss": -5.50787353515625, "global_step": 26150, "epoch": 622} {"train_loss": -5.463559150695801, "global_step": 26151, "epoch": 622} {"train_loss": -5.457077980041504, "global_step": 26152, "epoch": 622} {"train_loss": -5.41940975189209, "global_step": 26153, "epoch": 622} {"train_loss": -5.358987808227539, "global_step": 26154, "epoch": 622} {"train_loss": -5.489497184753418, "global_step": 26155, "epoch": 622} {"train_loss": -5.358070373535156, "global_step": 26156, "epoch": 622} {"train_loss": -5.408378601074219, "global_step": 26157, "epoch": 622} {"train_loss": -5.397195816040039, "global_step": 26158, "epoch": 622} {"train_loss": -5.309917449951172, "global_step": 26159, "epoch": 622} {"train_loss": -5.316660404205322, "global_step": 26160, "epoch": 622} {"train_loss": -5.421245574951172, "global_step": 26161, "epoch": 622} {"train_loss": -5.359354019165039, "global_step": 26162, "epoch": 622} {"train_loss": -5.487860202789307, "global_step": 26163, "epoch": 622} {"train_loss": -5.324166297912598, "global_step": 26164, "epoch": 622} {"train_loss": -5.405524106252761, "global_step": 26165, "epoch": 622, "val_loss": 67540.1796875} {"train_loss": -5.4295172691345215, "global_step": 26166, "epoch": 623} {"train_loss": -5.548398494720459, "global_step": 26167, "epoch": 623} {"train_loss": -5.288826942443848, "global_step": 26168, "epoch": 623} {"train_loss": -5.303782939910889, "global_step": 26169, "epoch": 623} {"train_loss": -5.537206649780273, "global_step": 26170, "epoch": 623} {"train_loss": -5.287178039550781, "global_step": 26171, "epoch": 623} {"train_loss": -5.552587032318115, "global_step": 26172, "epoch": 623} {"train_loss": -5.399257659912109, "global_step": 26173, "epoch": 623} {"train_loss": -5.379565238952637, "global_step": 26174, "epoch": 623} {"train_loss": -5.3643951416015625, "global_step": 26175, "epoch": 623} {"train_loss": -5.537449359893799, "global_step": 26176, "epoch": 623} {"train_loss": -5.394223213195801, "global_step": 26177, "epoch": 623} {"train_loss": -5.412834167480469, "global_step": 26178, "epoch": 623} {"train_loss": -5.433135986328125, "global_step": 26179, "epoch": 623} {"train_loss": -5.483537673950195, "global_step": 26180, "epoch": 623} {"train_loss": -5.256120681762695, "global_step": 26181, "epoch": 623} {"train_loss": -5.484450340270996, "global_step": 26182, "epoch": 623} {"train_loss": -5.453664302825928, "global_step": 26183, "epoch": 623} {"train_loss": -5.554654121398926, "global_step": 26184, "epoch": 623} {"train_loss": -5.398491859436035, "global_step": 26185, "epoch": 623} {"train_loss": -5.483747482299805, "global_step": 26186, "epoch": 623} {"train_loss": -5.572627067565918, "global_step": 26187, "epoch": 623} {"train_loss": -5.484511375427246, "global_step": 26188, "epoch": 623} {"train_loss": -5.470681190490723, "global_step": 26189, "epoch": 623} {"train_loss": -5.477079391479492, "global_step": 26190, "epoch": 623} {"train_loss": -5.402589797973633, "global_step": 26191, "epoch": 623} {"train_loss": -5.44883394241333, "global_step": 26192, "epoch": 623} {"train_loss": -5.5040788650512695, "global_step": 26193, "epoch": 623} {"train_loss": -5.465122699737549, "global_step": 26194, "epoch": 623} {"train_loss": -5.440128803253174, "global_step": 26195, "epoch": 623} {"train_loss": -5.52088737487793, "global_step": 26196, "epoch": 623} {"train_loss": -5.408736228942871, "global_step": 26197, "epoch": 623} {"train_loss": -5.495988368988037, "global_step": 26198, "epoch": 623} {"train_loss": -5.381839275360107, "global_step": 26199, "epoch": 623} {"train_loss": -5.33857536315918, "global_step": 26200, "epoch": 623} {"train_loss": -5.411015510559082, "global_step": 26201, "epoch": 623} {"train_loss": -5.440080642700195, "global_step": 26202, "epoch": 623} {"train_loss": -5.353236675262451, "global_step": 26203, "epoch": 623} {"train_loss": -5.384321689605713, "global_step": 26204, "epoch": 623} {"train_loss": -5.437928199768066, "global_step": 26205, "epoch": 623} {"train_loss": -5.371517181396484, "global_step": 26206, "epoch": 623} {"train_loss": -5.434191612970261, "global_step": 26207, "epoch": 623, "val_loss": 67378.671875} {"train_loss": -5.402902126312256, "global_step": 26208, "epoch": 624} {"train_loss": -5.397668838500977, "global_step": 26209, "epoch": 624} {"train_loss": -5.460090160369873, "global_step": 26210, "epoch": 624} {"train_loss": -5.380270957946777, "global_step": 26211, "epoch": 624} {"train_loss": -5.45012903213501, "global_step": 26212, "epoch": 624} {"train_loss": -5.388355255126953, "global_step": 26213, "epoch": 624} {"train_loss": -5.366832733154297, "global_step": 26214, "epoch": 624} {"train_loss": -5.439021587371826, "global_step": 26215, "epoch": 624} {"train_loss": -5.364883899688721, "global_step": 26216, "epoch": 624} {"train_loss": -5.312914848327637, "global_step": 26217, "epoch": 624} {"train_loss": -5.444055080413818, "global_step": 26218, "epoch": 624} {"train_loss": -5.4340057373046875, "global_step": 26219, "epoch": 624} {"train_loss": -5.421133041381836, "global_step": 26220, "epoch": 624} {"train_loss": -5.416437149047852, "global_step": 26221, "epoch": 624} {"train_loss": -5.423670768737793, "global_step": 26222, "epoch": 624} {"train_loss": -5.252087116241455, "global_step": 26223, "epoch": 624} {"train_loss": -5.416826248168945, "global_step": 26224, "epoch": 624} {"train_loss": -5.482418060302734, "global_step": 26225, "epoch": 624} {"train_loss": -5.4282732009887695, "global_step": 26226, "epoch": 624} {"train_loss": -5.47445011138916, "global_step": 26227, "epoch": 624} {"train_loss": -5.335169315338135, "global_step": 26228, "epoch": 624} {"train_loss": -5.438157558441162, "global_step": 26229, "epoch": 624} {"train_loss": -5.49134635925293, "global_step": 26230, "epoch": 624} {"train_loss": -5.397869110107422, "global_step": 26231, "epoch": 624} {"train_loss": -5.437804222106934, "global_step": 26232, "epoch": 624} {"train_loss": -5.476072311401367, "global_step": 26233, "epoch": 624} {"train_loss": -5.443274974822998, "global_step": 26234, "epoch": 624} {"train_loss": -5.499469757080078, "global_step": 26235, "epoch": 624} {"train_loss": -5.490881443023682, "global_step": 26236, "epoch": 624} {"train_loss": -5.421131134033203, "global_step": 26237, "epoch": 624} {"train_loss": -5.347959041595459, "global_step": 26238, "epoch": 624} {"train_loss": -5.496606826782227, "global_step": 26239, "epoch": 624} {"train_loss": -5.460363388061523, "global_step": 26240, "epoch": 624} {"train_loss": -5.396413803100586, "global_step": 26241, "epoch": 624} {"train_loss": -5.444181442260742, "global_step": 26242, "epoch": 624} {"train_loss": -5.374265670776367, "global_step": 26243, "epoch": 624} {"train_loss": -5.437321186065674, "global_step": 26244, "epoch": 624} {"train_loss": -5.501023292541504, "global_step": 26245, "epoch": 624} {"train_loss": -5.401823997497559, "global_step": 26246, "epoch": 624} {"train_loss": -5.547550678253174, "global_step": 26247, "epoch": 624} {"train_loss": -5.530005931854248, "global_step": 26248, "epoch": 624} {"train_loss": -5.427553903488886, "global_step": 26249, "epoch": 624, "val_loss": 67224.9609375} {"train_loss": -5.423117637634277, "global_step": 26250, "epoch": 625} {"train_loss": -5.405807018280029, "global_step": 26251, "epoch": 625} {"train_loss": -5.537992477416992, "global_step": 26252, "epoch": 625} {"train_loss": -5.461240768432617, "global_step": 26253, "epoch": 625} {"train_loss": -5.435347080230713, "global_step": 26254, "epoch": 625} {"train_loss": -5.40412712097168, "global_step": 26255, "epoch": 625} {"train_loss": -5.442773818969727, "global_step": 26256, "epoch": 625} {"train_loss": -5.365199089050293, "global_step": 26257, "epoch": 625} {"train_loss": -5.429208755493164, "global_step": 26258, "epoch": 625} {"train_loss": -5.54342794418335, "global_step": 26259, "epoch": 625} {"train_loss": -5.474360466003418, "global_step": 26260, "epoch": 625} {"train_loss": -5.274772644042969, "global_step": 26261, "epoch": 625} {"train_loss": -5.544739723205566, "global_step": 26262, "epoch": 625} {"train_loss": -5.380941390991211, "global_step": 26263, "epoch": 625} {"train_loss": -5.368380546569824, "global_step": 26264, "epoch": 625} {"train_loss": -5.471411228179932, "global_step": 26265, "epoch": 625} {"train_loss": -5.327518463134766, "global_step": 26266, "epoch": 625} {"train_loss": -5.301131248474121, "global_step": 26267, "epoch": 625} {"train_loss": -5.485836029052734, "global_step": 26268, "epoch": 625} {"train_loss": -5.365218639373779, "global_step": 26269, "epoch": 625} {"train_loss": -5.391345024108887, "global_step": 26270, "epoch": 625} {"train_loss": -5.407940864562988, "global_step": 26271, "epoch": 625} {"train_loss": -5.437014579772949, "global_step": 26272, "epoch": 625} {"train_loss": -5.4709367752075195, "global_step": 26273, "epoch": 625} {"train_loss": -5.41165828704834, "global_step": 26274, "epoch": 625} {"train_loss": -5.419118881225586, "global_step": 26275, "epoch": 625} {"train_loss": -5.3037919998168945, "global_step": 26276, "epoch": 625} {"train_loss": -5.418177604675293, "global_step": 26277, "epoch": 625} {"train_loss": -5.395465850830078, "global_step": 26278, "epoch": 625} {"train_loss": -5.461705684661865, "global_step": 26279, "epoch": 625} {"train_loss": -5.4869771003723145, "global_step": 26280, "epoch": 625} {"train_loss": -5.301449775695801, "global_step": 26281, "epoch": 625} {"train_loss": -5.421924591064453, "global_step": 26282, "epoch": 625} {"train_loss": -5.350274085998535, "global_step": 26283, "epoch": 625} {"train_loss": -5.410933017730713, "global_step": 26284, "epoch": 625} {"train_loss": -5.348085880279541, "global_step": 26285, "epoch": 625} {"train_loss": -5.477481842041016, "global_step": 26286, "epoch": 625} {"train_loss": -5.359031677246094, "global_step": 26287, "epoch": 625} {"train_loss": -5.441221237182617, "global_step": 26288, "epoch": 625} {"train_loss": -5.453675746917725, "global_step": 26289, "epoch": 625} {"train_loss": -5.401494979858398, "global_step": 26290, "epoch": 625} {"train_loss": -5.41559574717567, "global_step": 26291, "epoch": 625, "val_loss": 67325.9609375} {"train_loss": -5.386053085327148, "global_step": 26292, "epoch": 626} {"train_loss": -5.402242660522461, "global_step": 26293, "epoch": 626} {"train_loss": -5.537379264831543, "global_step": 26294, "epoch": 626} {"train_loss": -5.421387672424316, "global_step": 26295, "epoch": 626} {"train_loss": -5.2685980796813965, "global_step": 26296, "epoch": 626} {"train_loss": -5.517017841339111, "global_step": 26297, "epoch": 626} {"train_loss": -5.361911296844482, "global_step": 26298, "epoch": 626} {"train_loss": -5.434447765350342, "global_step": 26299, "epoch": 626} {"train_loss": -5.290300369262695, "global_step": 26300, "epoch": 626} {"train_loss": -5.438078880310059, "global_step": 26301, "epoch": 626} {"train_loss": -5.462371826171875, "global_step": 26302, "epoch": 626} {"train_loss": -5.382771015167236, "global_step": 26303, "epoch": 626} {"train_loss": -5.573502540588379, "global_step": 26304, "epoch": 626} {"train_loss": -5.369349479675293, "global_step": 26305, "epoch": 626} {"train_loss": -5.464951515197754, "global_step": 26306, "epoch": 626} {"train_loss": -5.461397647857666, "global_step": 26307, "epoch": 626} {"train_loss": -5.419641017913818, "global_step": 26308, "epoch": 626} {"train_loss": -5.516269207000732, "global_step": 26309, "epoch": 626} {"train_loss": -5.330301284790039, "global_step": 26310, "epoch": 626} {"train_loss": -5.351075649261475, "global_step": 26311, "epoch": 626} {"train_loss": -5.377649784088135, "global_step": 26312, "epoch": 626} {"train_loss": -5.455777168273926, "global_step": 26313, "epoch": 626} {"train_loss": -5.396740436553955, "global_step": 26314, "epoch": 626} {"train_loss": -5.438714981079102, "global_step": 26315, "epoch": 626} {"train_loss": -5.456210613250732, "global_step": 26316, "epoch": 626} {"train_loss": -5.540383338928223, "global_step": 26317, "epoch": 626} {"train_loss": -5.37265682220459, "global_step": 26318, "epoch": 626} {"train_loss": -5.382917881011963, "global_step": 26319, "epoch": 626} {"train_loss": -5.5050554275512695, "global_step": 26320, "epoch": 626} {"train_loss": -5.386105537414551, "global_step": 26321, "epoch": 626} {"train_loss": -5.512967109680176, "global_step": 26322, "epoch": 626} {"train_loss": -5.366508483886719, "global_step": 26323, "epoch": 626} {"train_loss": -5.296786308288574, "global_step": 26324, "epoch": 626} {"train_loss": -5.489116668701172, "global_step": 26325, "epoch": 626} {"train_loss": -5.461916923522949, "global_step": 26326, "epoch": 626} {"train_loss": -5.505697250366211, "global_step": 26327, "epoch": 626} {"train_loss": -5.440520286560059, "global_step": 26328, "epoch": 626} {"train_loss": -5.458658218383789, "global_step": 26329, "epoch": 626} {"train_loss": -5.387324333190918, "global_step": 26330, "epoch": 626} {"train_loss": -5.350612163543701, "global_step": 26331, "epoch": 626} {"train_loss": -5.4599080085754395, "global_step": 26332, "epoch": 626} {"train_loss": -5.425032706487746, "global_step": 26333, "epoch": 626, "val_loss": 67752.3359375} {"train_loss": -5.5607590675354, "global_step": 26334, "epoch": 627} {"train_loss": -5.3877105712890625, "global_step": 26335, "epoch": 627} {"train_loss": -5.157401084899902, "global_step": 26336, "epoch": 627} {"train_loss": -5.437760353088379, "global_step": 26337, "epoch": 627} {"train_loss": -5.332327365875244, "global_step": 26338, "epoch": 627} {"train_loss": -5.366991996765137, "global_step": 26339, "epoch": 627} {"train_loss": -5.393303871154785, "global_step": 26340, "epoch": 627} {"train_loss": -5.472528457641602, "global_step": 26341, "epoch": 627} {"train_loss": -5.501567363739014, "global_step": 26342, "epoch": 627} {"train_loss": -5.312062740325928, "global_step": 26343, "epoch": 627} {"train_loss": -5.331361770629883, "global_step": 26344, "epoch": 627} {"train_loss": -5.370815277099609, "global_step": 26345, "epoch": 627} {"train_loss": -5.412295341491699, "global_step": 26346, "epoch": 627} {"train_loss": -5.40020227432251, "global_step": 26347, "epoch": 627} {"train_loss": -5.6700310707092285, "global_step": 26348, "epoch": 627} {"train_loss": -5.352781772613525, "global_step": 26349, "epoch": 627} {"train_loss": -5.488735675811768, "global_step": 26350, "epoch": 627} {"train_loss": -5.395804405212402, "global_step": 26351, "epoch": 627} {"train_loss": -5.4059529304504395, "global_step": 26352, "epoch": 627} {"train_loss": -5.483401775360107, "global_step": 26353, "epoch": 627} {"train_loss": -5.367588043212891, "global_step": 26354, "epoch": 627} {"train_loss": -5.314608573913574, "global_step": 26355, "epoch": 627} {"train_loss": -5.4907426834106445, "global_step": 26356, "epoch": 627} {"train_loss": -5.436064720153809, "global_step": 26357, "epoch": 627} {"train_loss": -5.5132737159729, "global_step": 26358, "epoch": 627} {"train_loss": -5.402107238769531, "global_step": 26359, "epoch": 627} {"train_loss": -5.461422920227051, "global_step": 26360, "epoch": 627} {"train_loss": -5.446579933166504, "global_step": 26361, "epoch": 627} {"train_loss": -5.323644161224365, "global_step": 26362, "epoch": 627} {"train_loss": -5.332569599151611, "global_step": 26363, "epoch": 627} {"train_loss": -5.5172295570373535, "global_step": 26364, "epoch": 627} {"train_loss": -5.477269172668457, "global_step": 26365, "epoch": 627} {"train_loss": -5.411092758178711, "global_step": 26366, "epoch": 627} {"train_loss": -5.431811332702637, "global_step": 26367, "epoch": 627} {"train_loss": -5.589829444885254, "global_step": 26368, "epoch": 627} {"train_loss": -5.360391616821289, "global_step": 26369, "epoch": 627} {"train_loss": -5.354359149932861, "global_step": 26370, "epoch": 627} {"train_loss": -5.48496150970459, "global_step": 26371, "epoch": 627} {"train_loss": -5.495565891265869, "global_step": 26372, "epoch": 627} {"train_loss": -5.419819355010986, "global_step": 26373, "epoch": 627} {"train_loss": -5.478906631469727, "global_step": 26374, "epoch": 627} {"train_loss": -5.423281908035278, "global_step": 26375, "epoch": 627, "val_loss": 67813.7109375} {"train_loss": -5.462871074676514, "global_step": 26376, "epoch": 628} {"train_loss": -5.311586380004883, "global_step": 26377, "epoch": 628} {"train_loss": -5.488030433654785, "global_step": 26378, "epoch": 628} {"train_loss": -5.386061668395996, "global_step": 26379, "epoch": 628} {"train_loss": -5.5276031494140625, "global_step": 26380, "epoch": 628} {"train_loss": -5.458540916442871, "global_step": 26381, "epoch": 628} {"train_loss": -5.501962184906006, "global_step": 26382, "epoch": 628} {"train_loss": -5.391902446746826, "global_step": 26383, "epoch": 628} {"train_loss": -5.494814872741699, "global_step": 26384, "epoch": 628} {"train_loss": -5.465200424194336, "global_step": 26385, "epoch": 628} {"train_loss": -5.412459373474121, "global_step": 26386, "epoch": 628} {"train_loss": -5.396182060241699, "global_step": 26387, "epoch": 628} {"train_loss": -5.392212867736816, "global_step": 26388, "epoch": 628} {"train_loss": -5.559020042419434, "global_step": 26389, "epoch": 628} {"train_loss": -5.447475910186768, "global_step": 26390, "epoch": 628} {"train_loss": -5.45179557800293, "global_step": 26391, "epoch": 628} {"train_loss": -5.396623611450195, "global_step": 26392, "epoch": 628} {"train_loss": -5.463884353637695, "global_step": 26393, "epoch": 628} {"train_loss": -5.487579345703125, "global_step": 26394, "epoch": 628} {"train_loss": -5.455572128295898, "global_step": 26395, "epoch": 628} {"train_loss": -5.4225006103515625, "global_step": 26396, "epoch": 628} {"train_loss": -5.47693395614624, "global_step": 26397, "epoch": 628} {"train_loss": -5.343116760253906, "global_step": 26398, "epoch": 628} {"train_loss": -5.547274112701416, "global_step": 26399, "epoch": 628} {"train_loss": -5.367403984069824, "global_step": 26400, "epoch": 628} {"train_loss": -5.500502586364746, "global_step": 26401, "epoch": 628} {"train_loss": -5.449020862579346, "global_step": 26402, "epoch": 628} {"train_loss": -5.471327304840088, "global_step": 26403, "epoch": 628} {"train_loss": -5.383034706115723, "global_step": 26404, "epoch": 628} {"train_loss": -5.308407306671143, "global_step": 26405, "epoch": 628} {"train_loss": -5.4679107666015625, "global_step": 26406, "epoch": 628} {"train_loss": -5.494718074798584, "global_step": 26407, "epoch": 628} {"train_loss": -5.489880084991455, "global_step": 26408, "epoch": 628} {"train_loss": -5.413814544677734, "global_step": 26409, "epoch": 628} {"train_loss": -5.419052600860596, "global_step": 26410, "epoch": 628} {"train_loss": -5.441492080688477, "global_step": 26411, "epoch": 628} {"train_loss": -5.377797603607178, "global_step": 26412, "epoch": 628} {"train_loss": -5.479352951049805, "global_step": 26413, "epoch": 628} {"train_loss": -5.472522735595703, "global_step": 26414, "epoch": 628} {"train_loss": -5.513267517089844, "global_step": 26415, "epoch": 628} {"train_loss": -5.55748987197876, "global_step": 26416, "epoch": 628} {"train_loss": -5.444091331391108, "global_step": 26417, "epoch": 628, "val_loss": 67410.3671875} {"train_loss": -5.3699846267700195, "global_step": 26418, "epoch": 629} {"train_loss": -5.516175270080566, "global_step": 26419, "epoch": 629} {"train_loss": -5.410348415374756, "global_step": 26420, "epoch": 629} {"train_loss": -5.437586784362793, "global_step": 26421, "epoch": 629} {"train_loss": -5.5552473068237305, "global_step": 26422, "epoch": 629} {"train_loss": -5.30513858795166, "global_step": 26423, "epoch": 629} {"train_loss": -5.323999404907227, "global_step": 26424, "epoch": 629} {"train_loss": -5.483530044555664, "global_step": 26425, "epoch": 629} {"train_loss": -5.461129188537598, "global_step": 26426, "epoch": 629} {"train_loss": -5.519408702850342, "global_step": 26427, "epoch": 629} {"train_loss": -5.358247756958008, "global_step": 26428, "epoch": 629} {"train_loss": -5.251647472381592, "global_step": 26429, "epoch": 629} {"train_loss": -5.285055160522461, "global_step": 26430, "epoch": 629} {"train_loss": -5.373156547546387, "global_step": 26431, "epoch": 629} {"train_loss": -5.371245861053467, "global_step": 26432, "epoch": 629} {"train_loss": -5.290031433105469, "global_step": 26433, "epoch": 629} {"train_loss": -5.37569522857666, "global_step": 26434, "epoch": 629} {"train_loss": -5.451871395111084, "global_step": 26435, "epoch": 629} {"train_loss": -5.455480575561523, "global_step": 26436, "epoch": 629} {"train_loss": -5.4756178855896, "global_step": 26437, "epoch": 629} {"train_loss": -5.502910614013672, "global_step": 26438, "epoch": 629} {"train_loss": -5.333196640014648, "global_step": 26439, "epoch": 629} {"train_loss": -5.392757415771484, "global_step": 26440, "epoch": 629} {"train_loss": -5.373743057250977, "global_step": 26441, "epoch": 629} {"train_loss": -5.487370014190674, "global_step": 26442, "epoch": 629} {"train_loss": -5.524779319763184, "global_step": 26443, "epoch": 629} {"train_loss": -5.55893087387085, "global_step": 26444, "epoch": 629} {"train_loss": -5.338098049163818, "global_step": 26445, "epoch": 629} {"train_loss": -5.353950023651123, "global_step": 26446, "epoch": 629} {"train_loss": -5.542788982391357, "global_step": 26447, "epoch": 629} {"train_loss": -5.462209224700928, "global_step": 26448, "epoch": 629} {"train_loss": -5.408111572265625, "global_step": 26449, "epoch": 629} {"train_loss": -5.389906883239746, "global_step": 26450, "epoch": 629} {"train_loss": -5.443431854248047, "global_step": 26451, "epoch": 629} {"train_loss": -5.61189603805542, "global_step": 26452, "epoch": 629} {"train_loss": -5.408326625823975, "global_step": 26453, "epoch": 629} {"train_loss": -5.4597697257995605, "global_step": 26454, "epoch": 629} {"train_loss": -5.370650768280029, "global_step": 26455, "epoch": 629} {"train_loss": -5.459755897521973, "global_step": 26456, "epoch": 629} {"train_loss": -5.534882068634033, "global_step": 26457, "epoch": 629} {"train_loss": -5.575759410858154, "global_step": 26458, "epoch": 629} {"train_loss": -5.4284890946887785, "global_step": 26459, "epoch": 629, "val_loss": 67402.140625} {"train_loss": -5.5359344482421875, "global_step": 26460, "epoch": 630} {"train_loss": -5.385322570800781, "global_step": 26461, "epoch": 630} {"train_loss": -5.394250392913818, "global_step": 26462, "epoch": 630} {"train_loss": -5.4773969650268555, "global_step": 26463, "epoch": 630} {"train_loss": -5.326787948608398, "global_step": 26464, "epoch": 630} {"train_loss": -5.393453598022461, "global_step": 26465, "epoch": 630} {"train_loss": -5.266462326049805, "global_step": 26466, "epoch": 630} {"train_loss": -5.400211334228516, "global_step": 26467, "epoch": 630} {"train_loss": -5.462456703186035, "global_step": 26468, "epoch": 630} {"train_loss": -5.456663131713867, "global_step": 26469, "epoch": 630} {"train_loss": -5.424119472503662, "global_step": 26470, "epoch": 630} {"train_loss": -5.463757514953613, "global_step": 26471, "epoch": 630} {"train_loss": -5.342953681945801, "global_step": 26472, "epoch": 630} {"train_loss": -5.5386810302734375, "global_step": 26473, "epoch": 630} {"train_loss": -5.488924980163574, "global_step": 26474, "epoch": 630} {"train_loss": -5.4464006423950195, "global_step": 26475, "epoch": 630} {"train_loss": -5.320953369140625, "global_step": 26476, "epoch": 630} {"train_loss": -5.45246696472168, "global_step": 26477, "epoch": 630} {"train_loss": -5.264110565185547, "global_step": 26478, "epoch": 630} {"train_loss": -5.488112449645996, "global_step": 26479, "epoch": 630} {"train_loss": -5.384313583374023, "global_step": 26480, "epoch": 630} {"train_loss": -5.337735176086426, "global_step": 26481, "epoch": 630} {"train_loss": -5.425560474395752, "global_step": 26482, "epoch": 630} {"train_loss": -5.43947172164917, "global_step": 26483, "epoch": 630} {"train_loss": -5.356416702270508, "global_step": 26484, "epoch": 630} {"train_loss": -5.292801380157471, "global_step": 26485, "epoch": 630} {"train_loss": -5.611577987670898, "global_step": 26486, "epoch": 630} {"train_loss": -5.295958042144775, "global_step": 26487, "epoch": 630} {"train_loss": -5.417362213134766, "global_step": 26488, "epoch": 630} {"train_loss": -5.489137172698975, "global_step": 26489, "epoch": 630} {"train_loss": -5.4606828689575195, "global_step": 26490, "epoch": 630} {"train_loss": -5.455536842346191, "global_step": 26491, "epoch": 630} {"train_loss": -5.362654685974121, "global_step": 26492, "epoch": 630} {"train_loss": -5.472451210021973, "global_step": 26493, "epoch": 630} {"train_loss": -5.355772018432617, "global_step": 26494, "epoch": 630} {"train_loss": -5.408980369567871, "global_step": 26495, "epoch": 630} {"train_loss": -5.329793930053711, "global_step": 26496, "epoch": 630} {"train_loss": -5.413698673248291, "global_step": 26497, "epoch": 630} {"train_loss": -5.450418949127197, "global_step": 26498, "epoch": 630} {"train_loss": -5.432955265045166, "global_step": 26499, "epoch": 630} {"train_loss": -5.416621208190918, "global_step": 26500, "epoch": 630} {"train_loss": -5.412330945332845, "global_step": 26501, "epoch": 630, "val_loss": 67710.171875} {"train_loss": -5.338612079620361, "global_step": 26502, "epoch": 631} {"train_loss": -5.419065475463867, "global_step": 26503, "epoch": 631} {"train_loss": -5.471408843994141, "global_step": 26504, "epoch": 631} {"train_loss": -5.447144508361816, "global_step": 26505, "epoch": 631} {"train_loss": -5.317777633666992, "global_step": 26506, "epoch": 631} {"train_loss": -5.355523109436035, "global_step": 26507, "epoch": 631} {"train_loss": -5.445881366729736, "global_step": 26508, "epoch": 631} {"train_loss": -5.478697299957275, "global_step": 26509, "epoch": 631} {"train_loss": -5.381765365600586, "global_step": 26510, "epoch": 631} {"train_loss": -5.292514801025391, "global_step": 26511, "epoch": 631} {"train_loss": -5.534701347351074, "global_step": 26512, "epoch": 631} {"train_loss": -5.443450927734375, "global_step": 26513, "epoch": 631} {"train_loss": -5.463387489318848, "global_step": 26514, "epoch": 631} {"train_loss": -5.435807228088379, "global_step": 26515, "epoch": 631} {"train_loss": -5.243436813354492, "global_step": 26516, "epoch": 631} {"train_loss": -5.436160087585449, "global_step": 26517, "epoch": 631} {"train_loss": -5.4139580726623535, "global_step": 26518, "epoch": 631} {"train_loss": -5.493980407714844, "global_step": 26519, "epoch": 631} {"train_loss": -5.591346740722656, "global_step": 26520, "epoch": 631} {"train_loss": -5.447388172149658, "global_step": 26521, "epoch": 631} {"train_loss": -5.403805732727051, "global_step": 26522, "epoch": 631} {"train_loss": -5.432086944580078, "global_step": 26523, "epoch": 631} {"train_loss": -5.448220252990723, "global_step": 26524, "epoch": 631} {"train_loss": -5.361347675323486, "global_step": 26525, "epoch": 631} {"train_loss": -5.513026237487793, "global_step": 26526, "epoch": 631} {"train_loss": -5.453490257263184, "global_step": 26527, "epoch": 631} {"train_loss": -5.346413612365723, "global_step": 26528, "epoch": 631} {"train_loss": -5.325657367706299, "global_step": 26529, "epoch": 631} {"train_loss": -5.325125694274902, "global_step": 26530, "epoch": 631} {"train_loss": -5.507839202880859, "global_step": 26531, "epoch": 631} {"train_loss": -5.384468078613281, "global_step": 26532, "epoch": 631} {"train_loss": -5.33818244934082, "global_step": 26533, "epoch": 631} {"train_loss": -5.449972152709961, "global_step": 26534, "epoch": 631} {"train_loss": -5.3855085372924805, "global_step": 26535, "epoch": 631} {"train_loss": -5.469603538513184, "global_step": 26536, "epoch": 631} {"train_loss": -5.503472328186035, "global_step": 26537, "epoch": 631} {"train_loss": -5.537708282470703, "global_step": 26538, "epoch": 631} {"train_loss": -5.473855495452881, "global_step": 26539, "epoch": 631} {"train_loss": -5.544350624084473, "global_step": 26540, "epoch": 631} {"train_loss": -5.549704551696777, "global_step": 26541, "epoch": 631} {"train_loss": -5.480471134185791, "global_step": 26542, "epoch": 631} {"train_loss": -5.430843375978016, "global_step": 26543, "epoch": 631, "val_loss": 67926.5703125} {"train_loss": -5.393115043640137, "global_step": 26544, "epoch": 632} {"train_loss": -5.308268070220947, "global_step": 26545, "epoch": 632} {"train_loss": -5.421086311340332, "global_step": 26546, "epoch": 632} {"train_loss": -5.554380893707275, "global_step": 26547, "epoch": 632} {"train_loss": -5.527248382568359, "global_step": 26548, "epoch": 632} {"train_loss": -5.403194427490234, "global_step": 26549, "epoch": 632} {"train_loss": -5.543612480163574, "global_step": 26550, "epoch": 632} {"train_loss": -5.314043045043945, "global_step": 26551, "epoch": 632} {"train_loss": -5.450266361236572, "global_step": 26552, "epoch": 632} {"train_loss": -5.472904682159424, "global_step": 26553, "epoch": 632} {"train_loss": -5.346053123474121, "global_step": 26554, "epoch": 632} {"train_loss": -5.306860446929932, "global_step": 26555, "epoch": 632} {"train_loss": -5.374231338500977, "global_step": 26556, "epoch": 632} {"train_loss": -5.352265357971191, "global_step": 26557, "epoch": 632} {"train_loss": -5.397939205169678, "global_step": 26558, "epoch": 632} {"train_loss": -5.305973052978516, "global_step": 26559, "epoch": 632} {"train_loss": -5.328276634216309, "global_step": 26560, "epoch": 632} {"train_loss": -5.496361255645752, "global_step": 26561, "epoch": 632} {"train_loss": -5.416775226593018, "global_step": 26562, "epoch": 632} {"train_loss": -5.394753456115723, "global_step": 26563, "epoch": 632} {"train_loss": -5.353675842285156, "global_step": 26564, "epoch": 632} {"train_loss": -5.564263820648193, "global_step": 26565, "epoch": 632} {"train_loss": -5.437222003936768, "global_step": 26566, "epoch": 632} {"train_loss": -5.3646745681762695, "global_step": 26567, "epoch": 632} {"train_loss": -5.381841659545898, "global_step": 26568, "epoch": 632} {"train_loss": -5.521516799926758, "global_step": 26569, "epoch": 632} {"train_loss": -5.324584007263184, "global_step": 26570, "epoch": 632} {"train_loss": -5.413945198059082, "global_step": 26571, "epoch": 632} {"train_loss": -5.463381767272949, "global_step": 26572, "epoch": 632} {"train_loss": -5.372928619384766, "global_step": 26573, "epoch": 632} {"train_loss": -5.415294647216797, "global_step": 26574, "epoch": 632} {"train_loss": -5.316746711730957, "global_step": 26575, "epoch": 632} {"train_loss": -5.537981033325195, "global_step": 26576, "epoch": 632} {"train_loss": -5.51179838180542, "global_step": 26577, "epoch": 632} {"train_loss": -5.4068603515625, "global_step": 26578, "epoch": 632} {"train_loss": -5.215271472930908, "global_step": 26579, "epoch": 632} {"train_loss": -5.330033302307129, "global_step": 26580, "epoch": 632} {"train_loss": -5.356823444366455, "global_step": 26581, "epoch": 632} {"train_loss": -5.374059677124023, "global_step": 26582, "epoch": 632} {"train_loss": -5.29323673248291, "global_step": 26583, "epoch": 632} {"train_loss": -5.375203609466553, "global_step": 26584, "epoch": 632} {"train_loss": -5.397469634101505, "global_step": 26585, "epoch": 632, "val_loss": 67688.2421875} {"train_loss": -5.4219770431518555, "global_step": 26586, "epoch": 633} {"train_loss": -5.395077705383301, "global_step": 26587, "epoch": 633} {"train_loss": -5.521699905395508, "global_step": 26588, "epoch": 633} {"train_loss": -5.3767194747924805, "global_step": 26589, "epoch": 633} {"train_loss": -5.414576053619385, "global_step": 26590, "epoch": 633} {"train_loss": -5.413877487182617, "global_step": 26591, "epoch": 633} {"train_loss": -5.427807807922363, "global_step": 26592, "epoch": 633} {"train_loss": -5.369304656982422, "global_step": 26593, "epoch": 633} {"train_loss": -5.469090461730957, "global_step": 26594, "epoch": 633} {"train_loss": -5.36052942276001, "global_step": 26595, "epoch": 633} {"train_loss": -5.474717140197754, "global_step": 26596, "epoch": 633} {"train_loss": -5.3326568603515625, "global_step": 26597, "epoch": 633} {"train_loss": -5.406871795654297, "global_step": 26598, "epoch": 633} {"train_loss": -5.544119358062744, "global_step": 26599, "epoch": 633} {"train_loss": -5.409802436828613, "global_step": 26600, "epoch": 633} {"train_loss": -5.330508232116699, "global_step": 26601, "epoch": 633} {"train_loss": -5.416618347167969, "global_step": 26602, "epoch": 633} {"train_loss": -5.392462730407715, "global_step": 26603, "epoch": 633} {"train_loss": -5.431978225708008, "global_step": 26604, "epoch": 633} {"train_loss": -5.387218475341797, "global_step": 26605, "epoch": 633} {"train_loss": -5.381959438323975, "global_step": 26606, "epoch": 633} {"train_loss": -5.318453788757324, "global_step": 26607, "epoch": 633} {"train_loss": -5.349732398986816, "global_step": 26608, "epoch": 633} {"train_loss": -5.392996788024902, "global_step": 26609, "epoch": 633} {"train_loss": -5.487378120422363, "global_step": 26610, "epoch": 633} {"train_loss": -5.447995662689209, "global_step": 26611, "epoch": 633} {"train_loss": -5.377512454986572, "global_step": 26612, "epoch": 633} {"train_loss": -5.3820600509643555, "global_step": 26613, "epoch": 633} {"train_loss": -5.439056396484375, "global_step": 26614, "epoch": 633} {"train_loss": -5.4124321937561035, "global_step": 26615, "epoch": 633} {"train_loss": -5.459418773651123, "global_step": 26616, "epoch": 633} {"train_loss": -5.597194671630859, "global_step": 26617, "epoch": 633} {"train_loss": -5.352421760559082, "global_step": 26618, "epoch": 633} {"train_loss": -5.420899391174316, "global_step": 26619, "epoch": 633} {"train_loss": -5.489958763122559, "global_step": 26620, "epoch": 633} {"train_loss": -5.252937316894531, "global_step": 26621, "epoch": 633} {"train_loss": -5.313340187072754, "global_step": 26622, "epoch": 633} {"train_loss": -5.413582801818848, "global_step": 26623, "epoch": 633} {"train_loss": -5.30610466003418, "global_step": 26624, "epoch": 633} {"train_loss": -5.375748157501221, "global_step": 26625, "epoch": 633} {"train_loss": -5.279373645782471, "global_step": 26626, "epoch": 633} {"train_loss": -5.401198432559059, "global_step": 26627, "epoch": 633, "val_loss": 67354.1640625} {"train_loss": -5.332724571228027, "global_step": 26628, "epoch": 634} {"train_loss": -5.327249050140381, "global_step": 26629, "epoch": 634} {"train_loss": -5.464641571044922, "global_step": 26630, "epoch": 634} {"train_loss": -5.476728439331055, "global_step": 26631, "epoch": 634} {"train_loss": -5.414632320404053, "global_step": 26632, "epoch": 634} {"train_loss": -5.420610427856445, "global_step": 26633, "epoch": 634} {"train_loss": -5.461207866668701, "global_step": 26634, "epoch": 634} {"train_loss": -5.296645164489746, "global_step": 26635, "epoch": 634} {"train_loss": -5.434170722961426, "global_step": 26636, "epoch": 634} {"train_loss": -5.467150688171387, "global_step": 26637, "epoch": 634} {"train_loss": -5.340532302856445, "global_step": 26638, "epoch": 634} {"train_loss": -5.2774152755737305, "global_step": 26639, "epoch": 634} {"train_loss": -5.394574165344238, "global_step": 26640, "epoch": 634} {"train_loss": -5.317456245422363, "global_step": 26641, "epoch": 634} {"train_loss": -5.238620758056641, "global_step": 26642, "epoch": 634} {"train_loss": -5.416709899902344, "global_step": 26643, "epoch": 634} {"train_loss": -5.308058738708496, "global_step": 26644, "epoch": 634} {"train_loss": -5.471356391906738, "global_step": 26645, "epoch": 634} {"train_loss": -5.31677770614624, "global_step": 26646, "epoch": 634} {"train_loss": -5.322900772094727, "global_step": 26647, "epoch": 634} {"train_loss": -5.33436393737793, "global_step": 26648, "epoch": 634} {"train_loss": -5.383444786071777, "global_step": 26649, "epoch": 634} {"train_loss": -5.35483455657959, "global_step": 26650, "epoch": 634} {"train_loss": -5.348818778991699, "global_step": 26651, "epoch": 634} {"train_loss": -5.365832328796387, "global_step": 26652, "epoch": 634} {"train_loss": -5.4559173583984375, "global_step": 26653, "epoch": 634} {"train_loss": -5.37945556640625, "global_step": 26654, "epoch": 634} {"train_loss": -5.362411975860596, "global_step": 26655, "epoch": 634} {"train_loss": -5.470416069030762, "global_step": 26656, "epoch": 634} {"train_loss": -5.481739044189453, "global_step": 26657, "epoch": 634} {"train_loss": -5.44070291519165, "global_step": 26658, "epoch": 634} {"train_loss": -5.3988447189331055, "global_step": 26659, "epoch": 634} {"train_loss": -5.41438102722168, "global_step": 26660, "epoch": 634} {"train_loss": -5.520186424255371, "global_step": 26661, "epoch": 634} {"train_loss": -5.382180213928223, "global_step": 26662, "epoch": 634} {"train_loss": -5.4379377365112305, "global_step": 26663, "epoch": 634} {"train_loss": -5.330166339874268, "global_step": 26664, "epoch": 634} {"train_loss": -5.499480247497559, "global_step": 26665, "epoch": 634} {"train_loss": -5.48399543762207, "global_step": 26666, "epoch": 634} {"train_loss": -5.339625358581543, "global_step": 26667, "epoch": 634} {"train_loss": -5.59458589553833, "global_step": 26668, "epoch": 634} {"train_loss": -5.397343919390724, "global_step": 26669, "epoch": 634, "val_loss": 67680.71875} {"train_loss": -5.502120018005371, "global_step": 26670, "epoch": 635} {"train_loss": -5.382228374481201, "global_step": 26671, "epoch": 635} {"train_loss": -5.328911304473877, "global_step": 26672, "epoch": 635} {"train_loss": -5.4978861808776855, "global_step": 26673, "epoch": 635} {"train_loss": -5.4896440505981445, "global_step": 26674, "epoch": 635} {"train_loss": -5.401421070098877, "global_step": 26675, "epoch": 635} {"train_loss": -5.515539169311523, "global_step": 26676, "epoch": 635} {"train_loss": -5.3945817947387695, "global_step": 26677, "epoch": 635} {"train_loss": -5.406322002410889, "global_step": 26678, "epoch": 635} {"train_loss": -5.465760231018066, "global_step": 26679, "epoch": 635} {"train_loss": -5.373124122619629, "global_step": 26680, "epoch": 635} {"train_loss": -5.381588935852051, "global_step": 26681, "epoch": 635} {"train_loss": -5.396326065063477, "global_step": 26682, "epoch": 635} {"train_loss": -5.477880954742432, "global_step": 26683, "epoch": 635} {"train_loss": -5.465673446655273, "global_step": 26684, "epoch": 635} {"train_loss": -5.512682914733887, "global_step": 26685, "epoch": 635} {"train_loss": -5.47447395324707, "global_step": 26686, "epoch": 635} {"train_loss": -5.482234954833984, "global_step": 26687, "epoch": 635} {"train_loss": -5.44000244140625, "global_step": 26688, "epoch": 635} {"train_loss": -5.549589157104492, "global_step": 26689, "epoch": 635} {"train_loss": -5.444540977478027, "global_step": 26690, "epoch": 635} {"train_loss": -5.565107345581055, "global_step": 26691, "epoch": 635} {"train_loss": -5.395076751708984, "global_step": 26692, "epoch": 635} {"train_loss": -5.426366806030273, "global_step": 26693, "epoch": 635} {"train_loss": -5.520321369171143, "global_step": 26694, "epoch": 635} {"train_loss": -5.349631309509277, "global_step": 26695, "epoch": 635} {"train_loss": -5.416428565979004, "global_step": 26696, "epoch": 635} {"train_loss": -5.318012237548828, "global_step": 26697, "epoch": 635} {"train_loss": -5.489415168762207, "global_step": 26698, "epoch": 635} {"train_loss": -5.430014610290527, "global_step": 26699, "epoch": 635} {"train_loss": -5.46600866317749, "global_step": 26700, "epoch": 635} {"train_loss": -5.4168291091918945, "global_step": 26701, "epoch": 635} {"train_loss": -5.431446075439453, "global_step": 26702, "epoch": 635} {"train_loss": -5.412365913391113, "global_step": 26703, "epoch": 635} {"train_loss": -5.471781253814697, "global_step": 26704, "epoch": 635} {"train_loss": -5.3291730880737305, "global_step": 26705, "epoch": 635} {"train_loss": -5.532628059387207, "global_step": 26706, "epoch": 635} {"train_loss": -5.454668045043945, "global_step": 26707, "epoch": 635} {"train_loss": -5.4880828857421875, "global_step": 26708, "epoch": 635} {"train_loss": -5.34812593460083, "global_step": 26709, "epoch": 635} {"train_loss": -5.321938991546631, "global_step": 26710, "epoch": 635} {"train_loss": -5.442379701705206, "global_step": 26711, "epoch": 635, "val_loss": 67490.28125} {"train_loss": -5.401324272155762, "global_step": 26712, "epoch": 636} {"train_loss": -5.454990386962891, "global_step": 26713, "epoch": 636} {"train_loss": -5.4180588722229, "global_step": 26714, "epoch": 636} {"train_loss": -5.453688621520996, "global_step": 26715, "epoch": 636} {"train_loss": -5.49725341796875, "global_step": 26716, "epoch": 636} {"train_loss": -5.506858825683594, "global_step": 26717, "epoch": 636} {"train_loss": -5.396188735961914, "global_step": 26718, "epoch": 636} {"train_loss": -5.499563217163086, "global_step": 26719, "epoch": 636} {"train_loss": -5.447763442993164, "global_step": 26720, "epoch": 636} {"train_loss": -5.476078033447266, "global_step": 26721, "epoch": 636} {"train_loss": -5.543994426727295, "global_step": 26722, "epoch": 636} {"train_loss": -5.448136329650879, "global_step": 26723, "epoch": 636} {"train_loss": -5.474506378173828, "global_step": 26724, "epoch": 636} {"train_loss": -5.469883918762207, "global_step": 26725, "epoch": 636} {"train_loss": -5.454909324645996, "global_step": 26726, "epoch": 636} {"train_loss": -5.504703521728516, "global_step": 26727, "epoch": 636} {"train_loss": -5.381159782409668, "global_step": 26728, "epoch": 636} {"train_loss": -5.428797721862793, "global_step": 26729, "epoch": 636} {"train_loss": -5.406114101409912, "global_step": 26730, "epoch": 636} {"train_loss": -5.392826080322266, "global_step": 26731, "epoch": 636} {"train_loss": -5.34841775894165, "global_step": 26732, "epoch": 636} {"train_loss": -5.382465362548828, "global_step": 26733, "epoch": 636} {"train_loss": -5.366257667541504, "global_step": 26734, "epoch": 636} {"train_loss": -5.284716606140137, "global_step": 26735, "epoch": 636} {"train_loss": -5.283164024353027, "global_step": 26736, "epoch": 636} {"train_loss": -5.44008731842041, "global_step": 26737, "epoch": 636} {"train_loss": -5.419412136077881, "global_step": 26738, "epoch": 636} {"train_loss": -5.378345489501953, "global_step": 26739, "epoch": 636} {"train_loss": -5.438706398010254, "global_step": 26740, "epoch": 636} {"train_loss": -5.492430686950684, "global_step": 26741, "epoch": 636} {"train_loss": -5.3173980712890625, "global_step": 26742, "epoch": 636} {"train_loss": -5.383300304412842, "global_step": 26743, "epoch": 636} {"train_loss": -5.432503700256348, "global_step": 26744, "epoch": 636} {"train_loss": -5.44584846496582, "global_step": 26745, "epoch": 636} {"train_loss": -5.302931785583496, "global_step": 26746, "epoch": 636} {"train_loss": -5.524226665496826, "global_step": 26747, "epoch": 636} {"train_loss": -5.519308090209961, "global_step": 26748, "epoch": 636} {"train_loss": -5.412569046020508, "global_step": 26749, "epoch": 636} {"train_loss": -5.388244152069092, "global_step": 26750, "epoch": 636} {"train_loss": -5.395737171173096, "global_step": 26751, "epoch": 636} {"train_loss": -5.423482894897461, "global_step": 26752, "epoch": 636} {"train_loss": -5.427725542159307, "global_step": 26753, "epoch": 636, "val_loss": 67477.6953125} {"train_loss": -5.440040588378906, "global_step": 26754, "epoch": 637} {"train_loss": -5.594683647155762, "global_step": 26755, "epoch": 637} {"train_loss": -5.503949165344238, "global_step": 26756, "epoch": 637} {"train_loss": -5.419000625610352, "global_step": 26757, "epoch": 637} {"train_loss": -5.48127555847168, "global_step": 26758, "epoch": 637} {"train_loss": -5.426305770874023, "global_step": 26759, "epoch": 637} {"train_loss": -5.46784782409668, "global_step": 26760, "epoch": 637} {"train_loss": -5.315890312194824, "global_step": 26761, "epoch": 637} {"train_loss": -5.4479899406433105, "global_step": 26762, "epoch": 637} {"train_loss": -5.307335376739502, "global_step": 26763, "epoch": 637} {"train_loss": -5.268770217895508, "global_step": 26764, "epoch": 637} {"train_loss": -5.541935920715332, "global_step": 26765, "epoch": 637} {"train_loss": -5.2031450271606445, "global_step": 26766, "epoch": 637} {"train_loss": -5.35245418548584, "global_step": 26767, "epoch": 637} {"train_loss": -5.4315643310546875, "global_step": 26768, "epoch": 637} {"train_loss": -5.439986228942871, "global_step": 26769, "epoch": 637} {"train_loss": -5.445030212402344, "global_step": 26770, "epoch": 637} {"train_loss": -5.266801357269287, "global_step": 26771, "epoch": 637} {"train_loss": -5.547336101531982, "global_step": 26772, "epoch": 637} {"train_loss": -5.339354515075684, "global_step": 26773, "epoch": 637} {"train_loss": -5.3992414474487305, "global_step": 26774, "epoch": 637} {"train_loss": -5.575311660766602, "global_step": 26775, "epoch": 637} {"train_loss": -5.458087921142578, "global_step": 26776, "epoch": 637} {"train_loss": -5.521256923675537, "global_step": 26777, "epoch": 637} {"train_loss": -5.324132919311523, "global_step": 26778, "epoch": 637} {"train_loss": -5.5865912437438965, "global_step": 26779, "epoch": 637} {"train_loss": -5.546212196350098, "global_step": 26780, "epoch": 637} {"train_loss": -5.533968925476074, "global_step": 26781, "epoch": 637} {"train_loss": -5.467433452606201, "global_step": 26782, "epoch": 637} {"train_loss": -5.379263877868652, "global_step": 26783, "epoch": 637} {"train_loss": -5.425055503845215, "global_step": 26784, "epoch": 637} {"train_loss": -5.387299537658691, "global_step": 26785, "epoch": 637} {"train_loss": -5.454303741455078, "global_step": 26786, "epoch": 637} {"train_loss": -5.429472923278809, "global_step": 26787, "epoch": 637} {"train_loss": -5.244414329528809, "global_step": 26788, "epoch": 637} {"train_loss": -5.445509910583496, "global_step": 26789, "epoch": 637} {"train_loss": -5.352524280548096, "global_step": 26790, "epoch": 637} {"train_loss": -5.366034507751465, "global_step": 26791, "epoch": 637} {"train_loss": -5.327552318572998, "global_step": 26792, "epoch": 637} {"train_loss": -5.335302352905273, "global_step": 26793, "epoch": 637} {"train_loss": -5.301666736602783, "global_step": 26794, "epoch": 637} {"train_loss": -5.41668423016866, "global_step": 26795, "epoch": 637, "val_loss": 67721.3046875} {"train_loss": -5.389955043792725, "global_step": 26796, "epoch": 638} {"train_loss": -5.43763542175293, "global_step": 26797, "epoch": 638} {"train_loss": -5.509188175201416, "global_step": 26798, "epoch": 638} {"train_loss": -5.485974311828613, "global_step": 26799, "epoch": 638} {"train_loss": -5.52978515625, "global_step": 26800, "epoch": 638} {"train_loss": -5.402340888977051, "global_step": 26801, "epoch": 638} {"train_loss": -5.369054794311523, "global_step": 26802, "epoch": 638} {"train_loss": -5.58354377746582, "global_step": 26803, "epoch": 638} {"train_loss": -5.315384864807129, "global_step": 26804, "epoch": 638} {"train_loss": -5.4803547859191895, "global_step": 26805, "epoch": 638} {"train_loss": -5.4044389724731445, "global_step": 26806, "epoch": 638} {"train_loss": -5.382848739624023, "global_step": 26807, "epoch": 638} {"train_loss": -5.332457065582275, "global_step": 26808, "epoch": 638} {"train_loss": -5.240914821624756, "global_step": 26809, "epoch": 638} {"train_loss": -5.421191215515137, "global_step": 26810, "epoch": 638} {"train_loss": -5.3808746337890625, "global_step": 26811, "epoch": 638} {"train_loss": -5.403694152832031, "global_step": 26812, "epoch": 638} {"train_loss": -5.400918006896973, "global_step": 26813, "epoch": 638} {"train_loss": -5.437465667724609, "global_step": 26814, "epoch": 638} {"train_loss": -5.266628742218018, "global_step": 26815, "epoch": 638} {"train_loss": -5.297233581542969, "global_step": 26816, "epoch": 638} {"train_loss": -5.417172431945801, "global_step": 26817, "epoch": 638} {"train_loss": -5.477075099945068, "global_step": 26818, "epoch": 638} {"train_loss": -5.554368495941162, "global_step": 26819, "epoch": 638} {"train_loss": -5.2605061531066895, "global_step": 26820, "epoch": 638} {"train_loss": -5.346636772155762, "global_step": 26821, "epoch": 638} {"train_loss": -5.409392356872559, "global_step": 26822, "epoch": 638} {"train_loss": -5.437709808349609, "global_step": 26823, "epoch": 638} {"train_loss": -5.502307891845703, "global_step": 26824, "epoch": 638} {"train_loss": -5.416575908660889, "global_step": 26825, "epoch": 638} {"train_loss": -5.346567153930664, "global_step": 26826, "epoch": 638} {"train_loss": -5.410794258117676, "global_step": 26827, "epoch": 638} {"train_loss": -5.289675235748291, "global_step": 26828, "epoch": 638} {"train_loss": -5.248003959655762, "global_step": 26829, "epoch": 638} {"train_loss": -5.346470832824707, "global_step": 26830, "epoch": 638} {"train_loss": -5.504578590393066, "global_step": 26831, "epoch": 638} {"train_loss": -5.48204231262207, "global_step": 26832, "epoch": 638} {"train_loss": -5.448841571807861, "global_step": 26833, "epoch": 638} {"train_loss": -5.390882968902588, "global_step": 26834, "epoch": 638} {"train_loss": -5.477858543395996, "global_step": 26835, "epoch": 638} {"train_loss": -5.522791862487793, "global_step": 26836, "epoch": 638} {"train_loss": -5.407802547727313, "global_step": 26837, "epoch": 638, "val_loss": 67885.234375} {"train_loss": -5.474092960357666, "global_step": 26838, "epoch": 639} {"train_loss": -5.400335311889648, "global_step": 26839, "epoch": 639} {"train_loss": -5.395021915435791, "global_step": 26840, "epoch": 639} {"train_loss": -5.334111213684082, "global_step": 26841, "epoch": 639} {"train_loss": -5.401064872741699, "global_step": 26842, "epoch": 639} {"train_loss": -5.435257911682129, "global_step": 26843, "epoch": 639} {"train_loss": -5.3918232917785645, "global_step": 26844, "epoch": 639} {"train_loss": -5.39591121673584, "global_step": 26845, "epoch": 639} {"train_loss": -5.2977399826049805, "global_step": 26846, "epoch": 639} {"train_loss": -5.572437286376953, "global_step": 26847, "epoch": 639} {"train_loss": -5.470150947570801, "global_step": 26848, "epoch": 639} {"train_loss": -5.428770542144775, "global_step": 26849, "epoch": 639} {"train_loss": -5.408260345458984, "global_step": 26850, "epoch": 639} {"train_loss": -5.391300201416016, "global_step": 26851, "epoch": 639} {"train_loss": -5.549797058105469, "global_step": 26852, "epoch": 639} {"train_loss": -5.214756011962891, "global_step": 26853, "epoch": 639} {"train_loss": -5.535409450531006, "global_step": 26854, "epoch": 639} {"train_loss": -5.4292497634887695, "global_step": 26855, "epoch": 639} {"train_loss": -5.30377721786499, "global_step": 26856, "epoch": 639} {"train_loss": -5.408113479614258, "global_step": 26857, "epoch": 639} {"train_loss": -5.476165771484375, "global_step": 26858, "epoch": 639} {"train_loss": -5.317502975463867, "global_step": 26859, "epoch": 639} {"train_loss": -5.380060195922852, "global_step": 26860, "epoch": 639} {"train_loss": -5.455450057983398, "global_step": 26861, "epoch": 639} {"train_loss": -5.377849578857422, "global_step": 26862, "epoch": 639} {"train_loss": -5.2803635597229, "global_step": 26863, "epoch": 639} {"train_loss": -5.525514602661133, "global_step": 26864, "epoch": 639} {"train_loss": -5.394008636474609, "global_step": 26865, "epoch": 639} {"train_loss": -5.525608062744141, "global_step": 26866, "epoch": 639} {"train_loss": -5.500252723693848, "global_step": 26867, "epoch": 639} {"train_loss": -5.3338623046875, "global_step": 26868, "epoch": 639} {"train_loss": -5.693514823913574, "global_step": 26869, "epoch": 639} {"train_loss": -5.524587631225586, "global_step": 26870, "epoch": 639} {"train_loss": -5.400567054748535, "global_step": 26871, "epoch": 639} {"train_loss": -5.374022483825684, "global_step": 26872, "epoch": 639} {"train_loss": -5.378576278686523, "global_step": 26873, "epoch": 639} {"train_loss": -5.31511116027832, "global_step": 26874, "epoch": 639} {"train_loss": -5.394443511962891, "global_step": 26875, "epoch": 639} {"train_loss": -5.400041580200195, "global_step": 26876, "epoch": 639} {"train_loss": -5.516164779663086, "global_step": 26877, "epoch": 639} {"train_loss": -5.366707801818848, "global_step": 26878, "epoch": 639} {"train_loss": -5.42033508845738, "global_step": 26879, "epoch": 639, "val_loss": 67528.2109375} {"train_loss": -5.515675067901611, "global_step": 26880, "epoch": 640} {"train_loss": -5.473015785217285, "global_step": 26881, "epoch": 640} {"train_loss": -5.338860511779785, "global_step": 26882, "epoch": 640} {"train_loss": -5.530524253845215, "global_step": 26883, "epoch": 640} {"train_loss": -5.391390800476074, "global_step": 26884, "epoch": 640} {"train_loss": -5.462538719177246, "global_step": 26885, "epoch": 640} {"train_loss": -5.3907318115234375, "global_step": 26886, "epoch": 640} {"train_loss": -5.569803237915039, "global_step": 26887, "epoch": 640} {"train_loss": -5.531815528869629, "global_step": 26888, "epoch": 640} {"train_loss": -5.506590843200684, "global_step": 26889, "epoch": 640} {"train_loss": -5.45157527923584, "global_step": 26890, "epoch": 640} {"train_loss": -5.444085121154785, "global_step": 26891, "epoch": 640} {"train_loss": -5.344768524169922, "global_step": 26892, "epoch": 640} {"train_loss": -5.471035003662109, "global_step": 26893, "epoch": 640} {"train_loss": -5.453573226928711, "global_step": 26894, "epoch": 640} {"train_loss": -5.319481372833252, "global_step": 26895, "epoch": 640} {"train_loss": -5.42874813079834, "global_step": 26896, "epoch": 640} {"train_loss": -5.3672075271606445, "global_step": 26897, "epoch": 640} {"train_loss": -5.317441940307617, "global_step": 26898, "epoch": 640} {"train_loss": -5.544281005859375, "global_step": 26899, "epoch": 640} {"train_loss": -5.370540618896484, "global_step": 26900, "epoch": 640} {"train_loss": -5.331088542938232, "global_step": 26901, "epoch": 640} {"train_loss": -5.392166614532471, "global_step": 26902, "epoch": 640} {"train_loss": -5.384772777557373, "global_step": 26903, "epoch": 640} {"train_loss": -5.440774917602539, "global_step": 26904, "epoch": 640} {"train_loss": -5.475498199462891, "global_step": 26905, "epoch": 640} {"train_loss": -5.359385013580322, "global_step": 26906, "epoch": 640} {"train_loss": -5.499424457550049, "global_step": 26907, "epoch": 640} {"train_loss": -5.430159568786621, "global_step": 26908, "epoch": 640} {"train_loss": -5.50777006149292, "global_step": 26909, "epoch": 640} {"train_loss": -5.405448913574219, "global_step": 26910, "epoch": 640} {"train_loss": -5.309374809265137, "global_step": 26911, "epoch": 640} {"train_loss": -5.48909854888916, "global_step": 26912, "epoch": 640} {"train_loss": -5.271630764007568, "global_step": 26913, "epoch": 640} {"train_loss": -5.300752639770508, "global_step": 26914, "epoch": 640} {"train_loss": -5.322464942932129, "global_step": 26915, "epoch": 640} {"train_loss": -5.521890163421631, "global_step": 26916, "epoch": 640} {"train_loss": -5.229904651641846, "global_step": 26917, "epoch": 640} {"train_loss": -5.416857719421387, "global_step": 26918, "epoch": 640} {"train_loss": -5.410927772521973, "global_step": 26919, "epoch": 640} {"train_loss": -5.355243682861328, "global_step": 26920, "epoch": 640} {"train_loss": -5.415474959782192, "global_step": 26921, "epoch": 640, "val_loss": 67886.5390625} {"train_loss": -5.441479682922363, "global_step": 26922, "epoch": 641} {"train_loss": -5.359895706176758, "global_step": 26923, "epoch": 641} {"train_loss": -5.370486736297607, "global_step": 26924, "epoch": 641} {"train_loss": -5.358762741088867, "global_step": 26925, "epoch": 641} {"train_loss": -5.351410388946533, "global_step": 26926, "epoch": 641} {"train_loss": -5.348165035247803, "global_step": 26927, "epoch": 641} {"train_loss": -5.328632354736328, "global_step": 26928, "epoch": 641} {"train_loss": -5.3946380615234375, "global_step": 26929, "epoch": 641} {"train_loss": -5.3950347900390625, "global_step": 26930, "epoch": 641} {"train_loss": -5.456943511962891, "global_step": 26931, "epoch": 641} {"train_loss": -5.345779895782471, "global_step": 26932, "epoch": 641} {"train_loss": -5.473147392272949, "global_step": 26933, "epoch": 641} {"train_loss": -5.498575210571289, "global_step": 26934, "epoch": 641} {"train_loss": -5.369589328765869, "global_step": 26935, "epoch": 641} {"train_loss": -5.439129829406738, "global_step": 26936, "epoch": 641} {"train_loss": -5.490952968597412, "global_step": 26937, "epoch": 641} {"train_loss": -5.338000297546387, "global_step": 26938, "epoch": 641} {"train_loss": -5.376437187194824, "global_step": 26939, "epoch": 641} {"train_loss": -5.37595796585083, "global_step": 26940, "epoch": 641} {"train_loss": -5.382589340209961, "global_step": 26941, "epoch": 641} {"train_loss": -5.420279502868652, "global_step": 26942, "epoch": 641} {"train_loss": -5.3784990310668945, "global_step": 26943, "epoch": 641} {"train_loss": -5.343128204345703, "global_step": 26944, "epoch": 641} {"train_loss": -5.560196876525879, "global_step": 26945, "epoch": 641} {"train_loss": -5.318543910980225, "global_step": 26946, "epoch": 641} {"train_loss": -5.5229644775390625, "global_step": 26947, "epoch": 641} {"train_loss": -5.357063293457031, "global_step": 26948, "epoch": 641} {"train_loss": -5.385270118713379, "global_step": 26949, "epoch": 641} {"train_loss": -5.438497066497803, "global_step": 26950, "epoch": 641} {"train_loss": -5.386038780212402, "global_step": 26951, "epoch": 641} {"train_loss": -5.485897064208984, "global_step": 26952, "epoch": 641} {"train_loss": -5.384919166564941, "global_step": 26953, "epoch": 641} {"train_loss": -5.448897361755371, "global_step": 26954, "epoch": 641} {"train_loss": -5.520107269287109, "global_step": 26955, "epoch": 641} {"train_loss": -5.4517340660095215, "global_step": 26956, "epoch": 641} {"train_loss": -5.4106526374816895, "global_step": 26957, "epoch": 641} {"train_loss": -5.457681179046631, "global_step": 26958, "epoch": 641} {"train_loss": -5.477311134338379, "global_step": 26959, "epoch": 641} {"train_loss": -5.475064277648926, "global_step": 26960, "epoch": 641} {"train_loss": -5.330923557281494, "global_step": 26961, "epoch": 641} {"train_loss": -5.4525604248046875, "global_step": 26962, "epoch": 641} {"train_loss": -5.41112866855803, "global_step": 26963, "epoch": 641, "val_loss": 68852.6875} {"train_loss": -5.267184257507324, "global_step": 26964, "epoch": 642} {"train_loss": -5.391589164733887, "global_step": 26965, "epoch": 642} {"train_loss": -5.424020290374756, "global_step": 26966, "epoch": 642} {"train_loss": -5.189189910888672, "global_step": 26967, "epoch": 642} {"train_loss": -5.374918460845947, "global_step": 26968, "epoch": 642} {"train_loss": -5.237915992736816, "global_step": 26969, "epoch": 642} {"train_loss": -5.263474941253662, "global_step": 26970, "epoch": 642} {"train_loss": -5.4352617263793945, "global_step": 26971, "epoch": 642} {"train_loss": -5.301727294921875, "global_step": 26972, "epoch": 642} {"train_loss": -5.399222373962402, "global_step": 26973, "epoch": 642} {"train_loss": -5.251771450042725, "global_step": 26974, "epoch": 642} {"train_loss": -5.276508331298828, "global_step": 26975, "epoch": 642} {"train_loss": -5.310039520263672, "global_step": 26976, "epoch": 642} {"train_loss": -5.40932559967041, "global_step": 26977, "epoch": 642} {"train_loss": -5.429587364196777, "global_step": 26978, "epoch": 642} {"train_loss": -5.407411098480225, "global_step": 26979, "epoch": 642} {"train_loss": -5.429699897766113, "global_step": 26980, "epoch": 642} {"train_loss": -5.598178386688232, "global_step": 26981, "epoch": 642} {"train_loss": -5.409895420074463, "global_step": 26982, "epoch": 642} {"train_loss": -5.518745422363281, "global_step": 26983, "epoch": 642} {"train_loss": -5.514199256896973, "global_step": 26984, "epoch": 642} {"train_loss": -5.4692606925964355, "global_step": 26985, "epoch": 642} {"train_loss": -5.343654155731201, "global_step": 26986, "epoch": 642} {"train_loss": -5.390222549438477, "global_step": 26987, "epoch": 642} {"train_loss": -5.411125659942627, "global_step": 26988, "epoch": 642} {"train_loss": -5.473371982574463, "global_step": 26989, "epoch": 642} {"train_loss": -5.487952709197998, "global_step": 26990, "epoch": 642} {"train_loss": -5.279024124145508, "global_step": 26991, "epoch": 642} {"train_loss": -5.432409286499023, "global_step": 26992, "epoch": 642} {"train_loss": -5.3788251876831055, "global_step": 26993, "epoch": 642} {"train_loss": -5.365970611572266, "global_step": 26994, "epoch": 642} {"train_loss": -5.541597366333008, "global_step": 26995, "epoch": 642} {"train_loss": -5.45253849029541, "global_step": 26996, "epoch": 642} {"train_loss": -5.305904388427734, "global_step": 26997, "epoch": 642} {"train_loss": -5.461263179779053, "global_step": 26998, "epoch": 642} {"train_loss": -5.416133880615234, "global_step": 26999, "epoch": 642} {"train_loss": -5.484981060028076, "global_step": 27000, "epoch": 642} {"train_loss": -5.407742977142334, "global_step": 27001, "epoch": 642} {"train_loss": -5.445619583129883, "global_step": 27002, "epoch": 642} {"train_loss": -5.3481645584106445, "global_step": 27003, "epoch": 642} {"train_loss": -5.325503349304199, "global_step": 27004, "epoch": 642} {"train_loss": -5.390392133167812, "global_step": 27005, "epoch": 642, "val_loss": 67310.640625} {"train_loss": -5.45037841796875, "global_step": 27006, "epoch": 643} {"train_loss": -5.358148097991943, "global_step": 27007, "epoch": 643} {"train_loss": -5.41248893737793, "global_step": 27008, "epoch": 643} {"train_loss": -5.470578193664551, "global_step": 27009, "epoch": 643} {"train_loss": -5.462745189666748, "global_step": 27010, "epoch": 643} {"train_loss": -5.3923444747924805, "global_step": 27011, "epoch": 643} {"train_loss": -5.417601585388184, "global_step": 27012, "epoch": 643} {"train_loss": -5.377938747406006, "global_step": 27013, "epoch": 643} {"train_loss": -5.396932601928711, "global_step": 27014, "epoch": 643} {"train_loss": -5.348483562469482, "global_step": 27015, "epoch": 643} {"train_loss": -5.320145606994629, "global_step": 27016, "epoch": 643} {"train_loss": -5.433754920959473, "global_step": 27017, "epoch": 643} {"train_loss": -5.321539878845215, "global_step": 27018, "epoch": 643} {"train_loss": -5.403449058532715, "global_step": 27019, "epoch": 643} {"train_loss": -5.52642822265625, "global_step": 27020, "epoch": 643} {"train_loss": -5.4703850746154785, "global_step": 27021, "epoch": 643} {"train_loss": -5.320096969604492, "global_step": 27022, "epoch": 643} {"train_loss": -5.466063499450684, "global_step": 27023, "epoch": 643} {"train_loss": -5.391684532165527, "global_step": 27024, "epoch": 643} {"train_loss": -5.434427261352539, "global_step": 27025, "epoch": 643} {"train_loss": -5.3548173904418945, "global_step": 27026, "epoch": 643} {"train_loss": -5.497287750244141, "global_step": 27027, "epoch": 643} {"train_loss": -5.539976119995117, "global_step": 27028, "epoch": 643} {"train_loss": -5.439654350280762, "global_step": 27029, "epoch": 643} {"train_loss": -5.624472141265869, "global_step": 27030, "epoch": 643} {"train_loss": -5.480536460876465, "global_step": 27031, "epoch": 643} {"train_loss": -5.430782318115234, "global_step": 27032, "epoch": 643} {"train_loss": -5.437835693359375, "global_step": 27033, "epoch": 643} {"train_loss": -5.3840742111206055, "global_step": 27034, "epoch": 643} {"train_loss": -5.509746074676514, "global_step": 27035, "epoch": 643} {"train_loss": -5.437708854675293, "global_step": 27036, "epoch": 643} {"train_loss": -5.534965515136719, "global_step": 27037, "epoch": 643} {"train_loss": -5.392974853515625, "global_step": 27038, "epoch": 643} {"train_loss": -5.385349273681641, "global_step": 27039, "epoch": 643} {"train_loss": -5.518944263458252, "global_step": 27040, "epoch": 643} {"train_loss": -5.452230930328369, "global_step": 27041, "epoch": 643} {"train_loss": -5.46391487121582, "global_step": 27042, "epoch": 643} {"train_loss": -5.488705635070801, "global_step": 27043, "epoch": 643} {"train_loss": -5.355287551879883, "global_step": 27044, "epoch": 643} {"train_loss": -5.436764717102051, "global_step": 27045, "epoch": 643} {"train_loss": -5.505748748779297, "global_step": 27046, "epoch": 643} {"train_loss": -5.438699302219209, "global_step": 27047, "epoch": 643, "val_loss": 67502.765625} {"train_loss": -5.4380388259887695, "global_step": 27048, "epoch": 644} {"train_loss": -5.550312042236328, "global_step": 27049, "epoch": 644} {"train_loss": -5.413967609405518, "global_step": 27050, "epoch": 644} {"train_loss": -5.3470611572265625, "global_step": 27051, "epoch": 644} {"train_loss": -5.508675575256348, "global_step": 27052, "epoch": 644} {"train_loss": -5.439903736114502, "global_step": 27053, "epoch": 644} {"train_loss": -5.460296630859375, "global_step": 27054, "epoch": 644} {"train_loss": -5.424510955810547, "global_step": 27055, "epoch": 644} {"train_loss": -5.490971565246582, "global_step": 27056, "epoch": 644} {"train_loss": -5.511188507080078, "global_step": 27057, "epoch": 644} {"train_loss": -5.36781120300293, "global_step": 27058, "epoch": 644} {"train_loss": -5.526035308837891, "global_step": 27059, "epoch": 644} {"train_loss": -5.4359331130981445, "global_step": 27060, "epoch": 644} {"train_loss": -5.555665016174316, "global_step": 27061, "epoch": 644} {"train_loss": -5.33478307723999, "global_step": 27062, "epoch": 644} {"train_loss": -5.543272018432617, "global_step": 27063, "epoch": 644} {"train_loss": -5.491683006286621, "global_step": 27064, "epoch": 644} {"train_loss": -5.3448052406311035, "global_step": 27065, "epoch": 644} {"train_loss": -5.53549861907959, "global_step": 27066, "epoch": 644} {"train_loss": -5.492129325866699, "global_step": 27067, "epoch": 644} {"train_loss": -5.562760829925537, "global_step": 27068, "epoch": 644} {"train_loss": -5.358438014984131, "global_step": 27069, "epoch": 644} {"train_loss": -5.499391078948975, "global_step": 27070, "epoch": 644} {"train_loss": -5.333614349365234, "global_step": 27071, "epoch": 644} {"train_loss": -5.45860481262207, "global_step": 27072, "epoch": 644} {"train_loss": -5.483801364898682, "global_step": 27073, "epoch": 644} {"train_loss": -5.380891799926758, "global_step": 27074, "epoch": 644} {"train_loss": -5.535589694976807, "global_step": 27075, "epoch": 644} {"train_loss": -5.400310516357422, "global_step": 27076, "epoch": 644} {"train_loss": -5.474767208099365, "global_step": 27077, "epoch": 644} {"train_loss": -5.624052047729492, "global_step": 27078, "epoch": 644} {"train_loss": -5.527745246887207, "global_step": 27079, "epoch": 644} {"train_loss": -5.381032943725586, "global_step": 27080, "epoch": 644} {"train_loss": -5.336755752563477, "global_step": 27081, "epoch": 644} {"train_loss": -5.365169525146484, "global_step": 27082, "epoch": 644} {"train_loss": -5.367208480834961, "global_step": 27083, "epoch": 644} {"train_loss": -5.377945899963379, "global_step": 27084, "epoch": 644} {"train_loss": -5.5360212326049805, "global_step": 27085, "epoch": 644} {"train_loss": -5.398049354553223, "global_step": 27086, "epoch": 644} {"train_loss": -5.206748962402344, "global_step": 27087, "epoch": 644} {"train_loss": -5.379409313201904, "global_step": 27088, "epoch": 644} {"train_loss": -5.440165167763119, "global_step": 27089, "epoch": 644, "val_loss": 67586.6953125} {"train_loss": -5.416806697845459, "global_step": 27090, "epoch": 645} {"train_loss": -5.384557247161865, "global_step": 27091, "epoch": 645} {"train_loss": -5.374115943908691, "global_step": 27092, "epoch": 645} {"train_loss": -5.512625217437744, "global_step": 27093, "epoch": 645} {"train_loss": -5.253668785095215, "global_step": 27094, "epoch": 645} {"train_loss": -5.3056640625, "global_step": 27095, "epoch": 645} {"train_loss": -5.470911502838135, "global_step": 27096, "epoch": 645} {"train_loss": -5.453550338745117, "global_step": 27097, "epoch": 645} {"train_loss": -5.420809268951416, "global_step": 27098, "epoch": 645} {"train_loss": -5.286572456359863, "global_step": 27099, "epoch": 645} {"train_loss": -5.39966344833374, "global_step": 27100, "epoch": 645} {"train_loss": -5.347102165222168, "global_step": 27101, "epoch": 645} {"train_loss": -5.562994003295898, "global_step": 27102, "epoch": 645} {"train_loss": -5.502359390258789, "global_step": 27103, "epoch": 645} {"train_loss": -5.363889694213867, "global_step": 27104, "epoch": 645} {"train_loss": -5.407745361328125, "global_step": 27105, "epoch": 645} {"train_loss": -5.524567604064941, "global_step": 27106, "epoch": 645} {"train_loss": -5.342657089233398, "global_step": 27107, "epoch": 645} {"train_loss": -5.3719706535339355, "global_step": 27108, "epoch": 645} {"train_loss": -5.473302841186523, "global_step": 27109, "epoch": 645} {"train_loss": -5.559598922729492, "global_step": 27110, "epoch": 645} {"train_loss": -5.379589080810547, "global_step": 27111, "epoch": 645} {"train_loss": -5.512578964233398, "global_step": 27112, "epoch": 645} {"train_loss": -5.159855365753174, "global_step": 27113, "epoch": 645} {"train_loss": -5.347236633300781, "global_step": 27114, "epoch": 645} {"train_loss": -5.456597328186035, "global_step": 27115, "epoch": 645} {"train_loss": -5.350767612457275, "global_step": 27116, "epoch": 645} {"train_loss": -5.455712795257568, "global_step": 27117, "epoch": 645} {"train_loss": -5.486146926879883, "global_step": 27118, "epoch": 645} {"train_loss": -5.345405101776123, "global_step": 27119, "epoch": 645} {"train_loss": -5.416189193725586, "global_step": 27120, "epoch": 645} {"train_loss": -5.419371128082275, "global_step": 27121, "epoch": 645} {"train_loss": -5.417451858520508, "global_step": 27122, "epoch": 645} {"train_loss": -5.570884704589844, "global_step": 27123, "epoch": 645} {"train_loss": -5.528378963470459, "global_step": 27124, "epoch": 645} {"train_loss": -5.467219829559326, "global_step": 27125, "epoch": 645} {"train_loss": -5.3636040687561035, "global_step": 27126, "epoch": 645} {"train_loss": -5.490767478942871, "global_step": 27127, "epoch": 645} {"train_loss": -5.4404120445251465, "global_step": 27128, "epoch": 645} {"train_loss": -5.397050380706787, "global_step": 27129, "epoch": 645} {"train_loss": -5.540008544921875, "global_step": 27130, "epoch": 645} {"train_loss": -5.424754699071248, "global_step": 27131, "epoch": 645, "val_loss": 68007.6796875} {"train_loss": -5.436689853668213, "global_step": 27132, "epoch": 646} {"train_loss": -5.295534133911133, "global_step": 27133, "epoch": 646} {"train_loss": -5.422016620635986, "global_step": 27134, "epoch": 646} {"train_loss": -5.453573226928711, "global_step": 27135, "epoch": 646} {"train_loss": -5.347555160522461, "global_step": 27136, "epoch": 646} {"train_loss": -5.380875587463379, "global_step": 27137, "epoch": 646} {"train_loss": -5.302396297454834, "global_step": 27138, "epoch": 646} {"train_loss": -5.410277366638184, "global_step": 27139, "epoch": 646} {"train_loss": -5.381908893585205, "global_step": 27140, "epoch": 646} {"train_loss": -5.367137908935547, "global_step": 27141, "epoch": 646} {"train_loss": -5.495473861694336, "global_step": 27142, "epoch": 646} {"train_loss": -5.497823715209961, "global_step": 27143, "epoch": 646} {"train_loss": -5.424046516418457, "global_step": 27144, "epoch": 646} {"train_loss": -5.455348968505859, "global_step": 27145, "epoch": 646} {"train_loss": -5.47012996673584, "global_step": 27146, "epoch": 646} {"train_loss": -5.5316948890686035, "global_step": 27147, "epoch": 646} {"train_loss": -5.38657283782959, "global_step": 27148, "epoch": 646} {"train_loss": -5.419398307800293, "global_step": 27149, "epoch": 646} {"train_loss": -5.404865741729736, "global_step": 27150, "epoch": 646} {"train_loss": -5.399141311645508, "global_step": 27151, "epoch": 646} {"train_loss": -5.417168140411377, "global_step": 27152, "epoch": 646} {"train_loss": -5.370214462280273, "global_step": 27153, "epoch": 646} {"train_loss": -5.385024070739746, "global_step": 27154, "epoch": 646} {"train_loss": -5.405275344848633, "global_step": 27155, "epoch": 646} {"train_loss": -5.478248596191406, "global_step": 27156, "epoch": 646} {"train_loss": -5.454620838165283, "global_step": 27157, "epoch": 646} {"train_loss": -5.372236251831055, "global_step": 27158, "epoch": 646} {"train_loss": -5.588841915130615, "global_step": 27159, "epoch": 646} {"train_loss": -5.38053035736084, "global_step": 27160, "epoch": 646} {"train_loss": -5.500710487365723, "global_step": 27161, "epoch": 646} {"train_loss": -5.389424800872803, "global_step": 27162, "epoch": 646} {"train_loss": -5.609504699707031, "global_step": 27163, "epoch": 646} {"train_loss": -5.426344871520996, "global_step": 27164, "epoch": 646} {"train_loss": -5.492146968841553, "global_step": 27165, "epoch": 646} {"train_loss": -5.564459323883057, "global_step": 27166, "epoch": 646} {"train_loss": -5.486077785491943, "global_step": 27167, "epoch": 646} {"train_loss": -5.495213985443115, "global_step": 27168, "epoch": 646} {"train_loss": -5.532878875732422, "global_step": 27169, "epoch": 646} {"train_loss": -5.4827470779418945, "global_step": 27170, "epoch": 646} {"train_loss": -5.418671607971191, "global_step": 27171, "epoch": 646} {"train_loss": -5.416797637939453, "global_step": 27172, "epoch": 646} {"train_loss": -5.437621945426578, "global_step": 27173, "epoch": 646, "val_loss": 67510.734375} {"train_loss": -5.342361927032471, "global_step": 27174, "epoch": 647} {"train_loss": -5.484396934509277, "global_step": 27175, "epoch": 647} {"train_loss": -5.4823503494262695, "global_step": 27176, "epoch": 647} {"train_loss": -5.481781005859375, "global_step": 27177, "epoch": 647} {"train_loss": -5.462037086486816, "global_step": 27178, "epoch": 647} {"train_loss": -5.514901638031006, "global_step": 27179, "epoch": 647} {"train_loss": -5.538061618804932, "global_step": 27180, "epoch": 647} {"train_loss": -5.436609268188477, "global_step": 27181, "epoch": 647} {"train_loss": -5.457586288452148, "global_step": 27182, "epoch": 647} {"train_loss": -5.4435038566589355, "global_step": 27183, "epoch": 647} {"train_loss": -5.479304313659668, "global_step": 27184, "epoch": 647} {"train_loss": -5.391822814941406, "global_step": 27185, "epoch": 647} {"train_loss": -5.484204292297363, "global_step": 27186, "epoch": 647} {"train_loss": -5.408110618591309, "global_step": 27187, "epoch": 647} {"train_loss": -5.605405807495117, "global_step": 27188, "epoch": 647} {"train_loss": -5.483009338378906, "global_step": 27189, "epoch": 647} {"train_loss": -5.483733177185059, "global_step": 27190, "epoch": 647} {"train_loss": -5.508114337921143, "global_step": 27191, "epoch": 647} {"train_loss": -5.423846244812012, "global_step": 27192, "epoch": 647} {"train_loss": -5.40466833114624, "global_step": 27193, "epoch": 647} {"train_loss": -5.460148811340332, "global_step": 27194, "epoch": 647} {"train_loss": -5.545587539672852, "global_step": 27195, "epoch": 647} {"train_loss": -5.47801399230957, "global_step": 27196, "epoch": 647} {"train_loss": -5.491657257080078, "global_step": 27197, "epoch": 647} {"train_loss": -5.601926803588867, "global_step": 27198, "epoch": 647} {"train_loss": -5.527354717254639, "global_step": 27199, "epoch": 647} {"train_loss": -5.398787498474121, "global_step": 27200, "epoch": 647} {"train_loss": -5.5219526290893555, "global_step": 27201, "epoch": 647} {"train_loss": -5.430306434631348, "global_step": 27202, "epoch": 647} {"train_loss": -5.360990524291992, "global_step": 27203, "epoch": 647} {"train_loss": -5.533880233764648, "global_step": 27204, "epoch": 647} {"train_loss": -5.469932556152344, "global_step": 27205, "epoch": 647} {"train_loss": -5.499994277954102, "global_step": 27206, "epoch": 647} {"train_loss": -5.348524570465088, "global_step": 27207, "epoch": 647} {"train_loss": -5.415098190307617, "global_step": 27208, "epoch": 647} {"train_loss": -5.376645088195801, "global_step": 27209, "epoch": 647} {"train_loss": -5.295944690704346, "global_step": 27210, "epoch": 647} {"train_loss": -5.362100601196289, "global_step": 27211, "epoch": 647} {"train_loss": -5.337462425231934, "global_step": 27212, "epoch": 647} {"train_loss": -5.27347469329834, "global_step": 27213, "epoch": 647} {"train_loss": -5.593418121337891, "global_step": 27214, "epoch": 647} {"train_loss": -5.453203473772321, "global_step": 27215, "epoch": 647, "val_loss": 68355.2734375} {"train_loss": -5.418735504150391, "global_step": 27216, "epoch": 648} {"train_loss": -5.4569268226623535, "global_step": 27217, "epoch": 648} {"train_loss": -5.49508810043335, "global_step": 27218, "epoch": 648} {"train_loss": -5.5024518966674805, "global_step": 27219, "epoch": 648} {"train_loss": -5.322564125061035, "global_step": 27220, "epoch": 648} {"train_loss": -5.503071308135986, "global_step": 27221, "epoch": 648} {"train_loss": -5.40122127532959, "global_step": 27222, "epoch": 648} {"train_loss": -5.432074546813965, "global_step": 27223, "epoch": 648} {"train_loss": -5.372227668762207, "global_step": 27224, "epoch": 648} {"train_loss": -5.536397933959961, "global_step": 27225, "epoch": 648} {"train_loss": -5.492678642272949, "global_step": 27226, "epoch": 648} {"train_loss": -5.474252700805664, "global_step": 27227, "epoch": 648} {"train_loss": -5.418082237243652, "global_step": 27228, "epoch": 648} {"train_loss": -5.423248291015625, "global_step": 27229, "epoch": 648} {"train_loss": -5.431086540222168, "global_step": 27230, "epoch": 648} {"train_loss": -5.504210472106934, "global_step": 27231, "epoch": 648} {"train_loss": -5.467663764953613, "global_step": 27232, "epoch": 648} {"train_loss": -5.52972412109375, "global_step": 27233, "epoch": 648} {"train_loss": -5.425325393676758, "global_step": 27234, "epoch": 648} {"train_loss": -5.391693115234375, "global_step": 27235, "epoch": 648} {"train_loss": -5.450201511383057, "global_step": 27236, "epoch": 648} {"train_loss": -5.4411211013793945, "global_step": 27237, "epoch": 648} {"train_loss": -5.518271446228027, "global_step": 27238, "epoch": 648} {"train_loss": -5.481892108917236, "global_step": 27239, "epoch": 648} {"train_loss": -5.454875946044922, "global_step": 27240, "epoch": 648} {"train_loss": -5.521781921386719, "global_step": 27241, "epoch": 648} {"train_loss": -5.370912551879883, "global_step": 27242, "epoch": 648} {"train_loss": -5.291069984436035, "global_step": 27243, "epoch": 648} {"train_loss": -5.521392822265625, "global_step": 27244, "epoch": 648} {"train_loss": -5.4437255859375, "global_step": 27245, "epoch": 648} {"train_loss": -5.357021808624268, "global_step": 27246, "epoch": 648} {"train_loss": -5.6354875564575195, "global_step": 27247, "epoch": 648} {"train_loss": -5.378454208374023, "global_step": 27248, "epoch": 648} {"train_loss": -5.411074638366699, "global_step": 27249, "epoch": 648} {"train_loss": -5.489177703857422, "global_step": 27250, "epoch": 648} {"train_loss": -5.3396806716918945, "global_step": 27251, "epoch": 648} {"train_loss": -5.438436508178711, "global_step": 27252, "epoch": 648} {"train_loss": -5.3878984451293945, "global_step": 27253, "epoch": 648} {"train_loss": -5.388985633850098, "global_step": 27254, "epoch": 648} {"train_loss": -5.401486396789551, "global_step": 27255, "epoch": 648} {"train_loss": -5.513068199157715, "global_step": 27256, "epoch": 648} {"train_loss": -5.439151128133138, "global_step": 27257, "epoch": 648, "val_loss": 67542.4609375} {"train_loss": -5.4967145919799805, "global_step": 27258, "epoch": 649} {"train_loss": -5.403526782989502, "global_step": 27259, "epoch": 649} {"train_loss": -5.326940536499023, "global_step": 27260, "epoch": 649} {"train_loss": -5.472677707672119, "global_step": 27261, "epoch": 649} {"train_loss": -5.451727867126465, "global_step": 27262, "epoch": 649} {"train_loss": -5.545302867889404, "global_step": 27263, "epoch": 649} {"train_loss": -5.396947383880615, "global_step": 27264, "epoch": 649} {"train_loss": -5.262145042419434, "global_step": 27265, "epoch": 649} {"train_loss": -5.5361456871032715, "global_step": 27266, "epoch": 649} {"train_loss": -5.401277542114258, "global_step": 27267, "epoch": 649} {"train_loss": -5.358936309814453, "global_step": 27268, "epoch": 649} {"train_loss": -5.511317729949951, "global_step": 27269, "epoch": 649} {"train_loss": -5.377089977264404, "global_step": 27270, "epoch": 649} {"train_loss": -5.453990936279297, "global_step": 27271, "epoch": 649} {"train_loss": -5.310921669006348, "global_step": 27272, "epoch": 649} {"train_loss": -5.43446159362793, "global_step": 27273, "epoch": 649} {"train_loss": -5.299898624420166, "global_step": 27274, "epoch": 649} {"train_loss": -5.457284927368164, "global_step": 27275, "epoch": 649} {"train_loss": -5.280755996704102, "global_step": 27276, "epoch": 649} {"train_loss": -5.401219367980957, "global_step": 27277, "epoch": 649} {"train_loss": -5.3589863777160645, "global_step": 27278, "epoch": 649} {"train_loss": -5.395081043243408, "global_step": 27279, "epoch": 649} {"train_loss": -5.375720977783203, "global_step": 27280, "epoch": 649} {"train_loss": -5.357485771179199, "global_step": 27281, "epoch": 649} {"train_loss": -5.399067401885986, "global_step": 27282, "epoch": 649} {"train_loss": -5.439545154571533, "global_step": 27283, "epoch": 649} {"train_loss": -5.315645217895508, "global_step": 27284, "epoch": 649} {"train_loss": -5.515575885772705, "global_step": 27285, "epoch": 649} {"train_loss": -5.3222856521606445, "global_step": 27286, "epoch": 649} {"train_loss": -5.352845668792725, "global_step": 27287, "epoch": 649} {"train_loss": -5.358695983886719, "global_step": 27288, "epoch": 649} {"train_loss": -5.385690212249756, "global_step": 27289, "epoch": 649} {"train_loss": -5.394946098327637, "global_step": 27290, "epoch": 649} {"train_loss": -5.371148586273193, "global_step": 27291, "epoch": 649} {"train_loss": -5.398152828216553, "global_step": 27292, "epoch": 649} {"train_loss": -5.391262531280518, "global_step": 27293, "epoch": 649} {"train_loss": -5.33490514755249, "global_step": 27294, "epoch": 649} {"train_loss": -5.483656883239746, "global_step": 27295, "epoch": 649} {"train_loss": -5.3732709884643555, "global_step": 27296, "epoch": 649} {"train_loss": -5.327263832092285, "global_step": 27297, "epoch": 649} {"train_loss": -5.334673881530762, "global_step": 27298, "epoch": 649} {"train_loss": -5.394177845546177, "global_step": 27299, "epoch": 649, "val_loss": 67489.1640625} {"train_loss": -5.361110687255859, "global_step": 27300, "epoch": 650} {"train_loss": -5.474555015563965, "global_step": 27301, "epoch": 650} {"train_loss": -5.444798469543457, "global_step": 27302, "epoch": 650} {"train_loss": -5.45198392868042, "global_step": 27303, "epoch": 650} {"train_loss": -5.439371109008789, "global_step": 27304, "epoch": 650} {"train_loss": -5.482856750488281, "global_step": 27305, "epoch": 650} {"train_loss": -5.503469467163086, "global_step": 27306, "epoch": 650} {"train_loss": -5.3705668449401855, "global_step": 27307, "epoch": 650} {"train_loss": -5.398624420166016, "global_step": 27308, "epoch": 650} {"train_loss": -5.37020206451416, "global_step": 27309, "epoch": 650} {"train_loss": -5.3832478523254395, "global_step": 27310, "epoch": 650} {"train_loss": -5.439018249511719, "global_step": 27311, "epoch": 650} {"train_loss": -5.300942420959473, "global_step": 27312, "epoch": 650} {"train_loss": -5.625907897949219, "global_step": 27313, "epoch": 650} {"train_loss": -5.316667556762695, "global_step": 27314, "epoch": 650} {"train_loss": -5.379417896270752, "global_step": 27315, "epoch": 650} {"train_loss": -5.337314128875732, "global_step": 27316, "epoch": 650} {"train_loss": -5.406993865966797, "global_step": 27317, "epoch": 650} {"train_loss": -5.5022478103637695, "global_step": 27318, "epoch": 650} {"train_loss": -5.45103120803833, "global_step": 27319, "epoch": 650} {"train_loss": -5.435388088226318, "global_step": 27320, "epoch": 650} {"train_loss": -5.390673637390137, "global_step": 27321, "epoch": 650} {"train_loss": -5.3242692947387695, "global_step": 27322, "epoch": 650} {"train_loss": -5.522009372711182, "global_step": 27323, "epoch": 650} {"train_loss": -5.432326316833496, "global_step": 27324, "epoch": 650} {"train_loss": -5.469987869262695, "global_step": 27325, "epoch": 650} {"train_loss": -5.585484981536865, "global_step": 27326, "epoch": 650} {"train_loss": -5.488182067871094, "global_step": 27327, "epoch": 650} {"train_loss": -5.423525810241699, "global_step": 27328, "epoch": 650} {"train_loss": -5.524857044219971, "global_step": 27329, "epoch": 650} {"train_loss": -5.442812919616699, "global_step": 27330, "epoch": 650} {"train_loss": -5.436678886413574, "global_step": 27331, "epoch": 650} {"train_loss": -5.477356910705566, "global_step": 27332, "epoch": 650} {"train_loss": -5.479142189025879, "global_step": 27333, "epoch": 650} {"train_loss": -5.3969645500183105, "global_step": 27334, "epoch": 650} {"train_loss": -5.391969680786133, "global_step": 27335, "epoch": 650} {"train_loss": -5.513872146606445, "global_step": 27336, "epoch": 650} {"train_loss": -5.49321174621582, "global_step": 27337, "epoch": 650} {"train_loss": -5.3806071281433105, "global_step": 27338, "epoch": 650} {"train_loss": -5.468721389770508, "global_step": 27339, "epoch": 650} {"train_loss": -5.424972057342529, "global_step": 27340, "epoch": 650} {"train_loss": -5.435693354833694, "global_step": 27341, "epoch": 650, "train/sim_max_reward_0": 0.4082151558950274, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.30740693414214854, "train/sim_max_reward_3": 0.24901078691828918, "train/sim_max_reward_4": 0.31486720459059103, "train/sim_max_reward_5": 0.573283479437789, "test/sim_max_reward_4400000": 0.4234067604085958, "test/sim_max_reward_4400001": 0.7606707763145252, "test/sim_max_reward_4400002": 0.057247533401550595, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.26870910219357824, "test/sim_max_reward_4400005": 0.21676692654583807, "test/sim_max_reward_4400006": 0.19686569237031307, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.4802836305675615, "test/sim_max_reward_4400009": 0.3760991679694713, "test/sim_max_reward_4400010": 0.3962623472886552, "test/sim_max_reward_4400011": 0.29292882103963525, "test/sim_max_reward_4400012": 0.3814782371352737, "test/sim_max_reward_4400013": 0.37988425278794713, "test/sim_max_reward_4400014": 0.15130848375599118, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.3802264696344418, "test/sim_max_reward_4400017": 0.28110321908337116, "test/sim_max_reward_4400018": 0.2997557043182203, "test/sim_max_reward_4400019": 0.3439847818612123, "test/sim_max_reward_4400020": 0.024279676540731952, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.006839557223044938, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.03781151435992362, "test/sim_max_reward_4400027": 0.1151287863092671, "test/sim_max_reward_4400028": 0.2903998622150821, "test/sim_max_reward_4400029": 0.23361534900097194, "test/sim_max_reward_4400030": 0.14329475333442884, "test/sim_max_reward_4400031": 0.39625082934312167, "test/sim_max_reward_4400032": 0.560175198524702, "test/sim_max_reward_4400033": 0.10974396181140587, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.472451549473532, "test/sim_max_reward_4400036": 0.5391799762645246, "test/sim_max_reward_4400037": 0.12496237831165845, "test/sim_max_reward_4400038": 0.15154655579884554, "test/sim_max_reward_4400039": 0.46902236056254293, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6175584779033727, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.059490468925328055, "test/sim_max_reward_4400044": 0.018128436922096376, "test/sim_max_reward_4400045": 0.7151880401585969, "test/sim_max_reward_4400046": 0.1771328070986132, "test/sim_max_reward_4400047": 0.14006560137960855, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.05416053585564581, "train/mean_score": 0.3089098403676074, "test/mean_score": 0.23726839173806952, "val_loss": 67489.0390625} {"train_loss": -5.417291164398193, "global_step": 27342, "epoch": 651} {"train_loss": -5.470928192138672, "global_step": 27343, "epoch": 651} {"train_loss": -5.401767730712891, "global_step": 27344, "epoch": 651} {"train_loss": -5.448905944824219, "global_step": 27345, "epoch": 651} {"train_loss": -5.370009422302246, "global_step": 27346, "epoch": 651} {"train_loss": -5.407413005828857, "global_step": 27347, "epoch": 651} {"train_loss": -5.431763172149658, "global_step": 27348, "epoch": 651} {"train_loss": -5.4655537605285645, "global_step": 27349, "epoch": 651} {"train_loss": -5.461664199829102, "global_step": 27350, "epoch": 651} {"train_loss": -5.441561222076416, "global_step": 27351, "epoch": 651} {"train_loss": -5.387936592102051, "global_step": 27352, "epoch": 651} {"train_loss": -5.6037373542785645, "global_step": 27353, "epoch": 651} {"train_loss": -5.363526344299316, "global_step": 27354, "epoch": 651} {"train_loss": -5.535180568695068, "global_step": 27355, "epoch": 651} {"train_loss": -5.508213520050049, "global_step": 27356, "epoch": 651} {"train_loss": -5.380192756652832, "global_step": 27357, "epoch": 651} {"train_loss": -5.355701446533203, "global_step": 27358, "epoch": 651} {"train_loss": -5.521219253540039, "global_step": 27359, "epoch": 651} {"train_loss": -5.4512481689453125, "global_step": 27360, "epoch": 651} {"train_loss": -5.369529724121094, "global_step": 27361, "epoch": 651} {"train_loss": -5.454437255859375, "global_step": 27362, "epoch": 651} {"train_loss": -5.40915060043335, "global_step": 27363, "epoch": 651} {"train_loss": -5.376952171325684, "global_step": 27364, "epoch": 651} {"train_loss": -5.338681221008301, "global_step": 27365, "epoch": 651} {"train_loss": -5.435660362243652, "global_step": 27366, "epoch": 651} {"train_loss": -5.300386905670166, "global_step": 27367, "epoch": 651} {"train_loss": -5.480816841125488, "global_step": 27368, "epoch": 651} {"train_loss": -5.318667411804199, "global_step": 27369, "epoch": 651} {"train_loss": -5.505598068237305, "global_step": 27370, "epoch": 651} {"train_loss": -5.359015464782715, "global_step": 27371, "epoch": 651} {"train_loss": -5.4365057945251465, "global_step": 27372, "epoch": 651} {"train_loss": -5.4480109214782715, "global_step": 27373, "epoch": 651} {"train_loss": -5.30755615234375, "global_step": 27374, "epoch": 651} {"train_loss": -5.329716682434082, "global_step": 27375, "epoch": 651} {"train_loss": -5.409577369689941, "global_step": 27376, "epoch": 651} {"train_loss": -5.586205005645752, "global_step": 27377, "epoch": 651} {"train_loss": -5.431506156921387, "global_step": 27378, "epoch": 651} {"train_loss": -5.5098066329956055, "global_step": 27379, "epoch": 651} {"train_loss": -5.4600019454956055, "global_step": 27380, "epoch": 651} {"train_loss": -5.467680931091309, "global_step": 27381, "epoch": 651} {"train_loss": -5.459439754486084, "global_step": 27382, "epoch": 651} {"train_loss": -5.429420176006499, "global_step": 27383, "epoch": 651, "val_loss": 67628.296875} {"train_loss": -5.52291202545166, "global_step": 27384, "epoch": 652} {"train_loss": -5.44988489151001, "global_step": 27385, "epoch": 652} {"train_loss": -5.461365222930908, "global_step": 27386, "epoch": 652} {"train_loss": -5.466739654541016, "global_step": 27387, "epoch": 652} {"train_loss": -5.427136421203613, "global_step": 27388, "epoch": 652} {"train_loss": -5.375173568725586, "global_step": 27389, "epoch": 652} {"train_loss": -5.48513126373291, "global_step": 27390, "epoch": 652} {"train_loss": -5.410567760467529, "global_step": 27391, "epoch": 652} {"train_loss": -5.475640296936035, "global_step": 27392, "epoch": 652} {"train_loss": -5.529844284057617, "global_step": 27393, "epoch": 652} {"train_loss": -5.469666957855225, "global_step": 27394, "epoch": 652} {"train_loss": -5.486610412597656, "global_step": 27395, "epoch": 652} {"train_loss": -5.585808277130127, "global_step": 27396, "epoch": 652} {"train_loss": -5.505134582519531, "global_step": 27397, "epoch": 652} {"train_loss": -5.507242679595947, "global_step": 27398, "epoch": 652} {"train_loss": -5.224992752075195, "global_step": 27399, "epoch": 652} {"train_loss": -5.263368606567383, "global_step": 27400, "epoch": 652} {"train_loss": -5.453838348388672, "global_step": 27401, "epoch": 652} {"train_loss": -5.289255142211914, "global_step": 27402, "epoch": 652} {"train_loss": -5.510473251342773, "global_step": 27403, "epoch": 652} {"train_loss": -5.413311958312988, "global_step": 27404, "epoch": 652} {"train_loss": -5.383055686950684, "global_step": 27405, "epoch": 652} {"train_loss": -5.3822221755981445, "global_step": 27406, "epoch": 652} {"train_loss": -5.328952789306641, "global_step": 27407, "epoch": 652} {"train_loss": -5.375638484954834, "global_step": 27408, "epoch": 652} {"train_loss": -5.414802551269531, "global_step": 27409, "epoch": 652} {"train_loss": -5.580810546875, "global_step": 27410, "epoch": 652} {"train_loss": -5.373085021972656, "global_step": 27411, "epoch": 652} {"train_loss": -5.507257461547852, "global_step": 27412, "epoch": 652} {"train_loss": -5.404294967651367, "global_step": 27413, "epoch": 652} {"train_loss": -5.3439788818359375, "global_step": 27414, "epoch": 652} {"train_loss": -5.503757476806641, "global_step": 27415, "epoch": 652} {"train_loss": -5.332569599151611, "global_step": 27416, "epoch": 652} {"train_loss": -5.46207332611084, "global_step": 27417, "epoch": 652} {"train_loss": -5.497966289520264, "global_step": 27418, "epoch": 652} {"train_loss": -5.440549850463867, "global_step": 27419, "epoch": 652} {"train_loss": -5.364265441894531, "global_step": 27420, "epoch": 652} {"train_loss": -5.4675397872924805, "global_step": 27421, "epoch": 652} {"train_loss": -5.469654560089111, "global_step": 27422, "epoch": 652} {"train_loss": -5.357308387756348, "global_step": 27423, "epoch": 652} {"train_loss": -5.450655937194824, "global_step": 27424, "epoch": 652} {"train_loss": -5.429076932725453, "global_step": 27425, "epoch": 652, "val_loss": 68136.828125} {"train_loss": -5.280344486236572, "global_step": 27426, "epoch": 653} {"train_loss": -5.378917694091797, "global_step": 27427, "epoch": 653} {"train_loss": -5.2499895095825195, "global_step": 27428, "epoch": 653} {"train_loss": -5.427970886230469, "global_step": 27429, "epoch": 653} {"train_loss": -5.437939643859863, "global_step": 27430, "epoch": 653} {"train_loss": -5.4301652908325195, "global_step": 27431, "epoch": 653} {"train_loss": -5.433663368225098, "global_step": 27432, "epoch": 653} {"train_loss": -5.289389610290527, "global_step": 27433, "epoch": 653} {"train_loss": -5.42286491394043, "global_step": 27434, "epoch": 653} {"train_loss": -5.324188232421875, "global_step": 27435, "epoch": 653} {"train_loss": -5.418709754943848, "global_step": 27436, "epoch": 653} {"train_loss": -5.511697769165039, "global_step": 27437, "epoch": 653} {"train_loss": -5.287346363067627, "global_step": 27438, "epoch": 653} {"train_loss": -5.410684108734131, "global_step": 27439, "epoch": 653} {"train_loss": -5.542442321777344, "global_step": 27440, "epoch": 653} {"train_loss": -5.504940509796143, "global_step": 27441, "epoch": 653} {"train_loss": -5.432588577270508, "global_step": 27442, "epoch": 653} {"train_loss": -5.4120635986328125, "global_step": 27443, "epoch": 653} {"train_loss": -5.451915740966797, "global_step": 27444, "epoch": 653} {"train_loss": -5.41158390045166, "global_step": 27445, "epoch": 653} {"train_loss": -5.503924369812012, "global_step": 27446, "epoch": 653} {"train_loss": -5.4288458824157715, "global_step": 27447, "epoch": 653} {"train_loss": -5.461860179901123, "global_step": 27448, "epoch": 653} {"train_loss": -5.326789379119873, "global_step": 27449, "epoch": 653} {"train_loss": -5.53714656829834, "global_step": 27450, "epoch": 653} {"train_loss": -5.35178804397583, "global_step": 27451, "epoch": 653} {"train_loss": -5.450192451477051, "global_step": 27452, "epoch": 653} {"train_loss": -5.387592315673828, "global_step": 27453, "epoch": 653} {"train_loss": -5.386077880859375, "global_step": 27454, "epoch": 653} {"train_loss": -5.364373207092285, "global_step": 27455, "epoch": 653} {"train_loss": -5.450329303741455, "global_step": 27456, "epoch": 653} {"train_loss": -5.2562575340271, "global_step": 27457, "epoch": 653} {"train_loss": -5.498464584350586, "global_step": 27458, "epoch": 653} {"train_loss": -5.480005264282227, "global_step": 27459, "epoch": 653} {"train_loss": -5.462747097015381, "global_step": 27460, "epoch": 653} {"train_loss": -5.402629852294922, "global_step": 27461, "epoch": 653} {"train_loss": -5.462776184082031, "global_step": 27462, "epoch": 653} {"train_loss": -5.544134140014648, "global_step": 27463, "epoch": 653} {"train_loss": -5.457204818725586, "global_step": 27464, "epoch": 653} {"train_loss": -5.334164619445801, "global_step": 27465, "epoch": 653} {"train_loss": -5.611017227172852, "global_step": 27466, "epoch": 653} {"train_loss": -5.4210831097194125, "global_step": 27467, "epoch": 653, "val_loss": 67427.5390625} {"train_loss": -5.5352630615234375, "global_step": 27468, "epoch": 654} {"train_loss": -5.543844699859619, "global_step": 27469, "epoch": 654} {"train_loss": -5.429981231689453, "global_step": 27470, "epoch": 654} {"train_loss": -5.3991851806640625, "global_step": 27471, "epoch": 654} {"train_loss": -5.521527290344238, "global_step": 27472, "epoch": 654} {"train_loss": -5.341531753540039, "global_step": 27473, "epoch": 654} {"train_loss": -5.600735664367676, "global_step": 27474, "epoch": 654} {"train_loss": -5.447906970977783, "global_step": 27475, "epoch": 654} {"train_loss": -5.513446807861328, "global_step": 27476, "epoch": 654} {"train_loss": -5.444597244262695, "global_step": 27477, "epoch": 654} {"train_loss": -5.237667083740234, "global_step": 27478, "epoch": 654} {"train_loss": -5.419837474822998, "global_step": 27479, "epoch": 654} {"train_loss": -5.43671989440918, "global_step": 27480, "epoch": 654} {"train_loss": -5.316235542297363, "global_step": 27481, "epoch": 654} {"train_loss": -5.37225341796875, "global_step": 27482, "epoch": 654} {"train_loss": -5.434232711791992, "global_step": 27483, "epoch": 654} {"train_loss": -5.5244035720825195, "global_step": 27484, "epoch": 654} {"train_loss": -5.436062812805176, "global_step": 27485, "epoch": 654} {"train_loss": -5.492002010345459, "global_step": 27486, "epoch": 654} {"train_loss": -5.488496780395508, "global_step": 27487, "epoch": 654} {"train_loss": -5.622607231140137, "global_step": 27488, "epoch": 654} {"train_loss": -5.521188259124756, "global_step": 27489, "epoch": 654} {"train_loss": -5.354520320892334, "global_step": 27490, "epoch": 654} {"train_loss": -5.498917579650879, "global_step": 27491, "epoch": 654} {"train_loss": -5.448270797729492, "global_step": 27492, "epoch": 654} {"train_loss": -5.378100395202637, "global_step": 27493, "epoch": 654} {"train_loss": -5.3845601081848145, "global_step": 27494, "epoch": 654} {"train_loss": -5.539140701293945, "global_step": 27495, "epoch": 654} {"train_loss": -5.597329139709473, "global_step": 27496, "epoch": 654} {"train_loss": -5.437448501586914, "global_step": 27497, "epoch": 654} {"train_loss": -5.480729103088379, "global_step": 27498, "epoch": 654} {"train_loss": -5.502334117889404, "global_step": 27499, "epoch": 654} {"train_loss": -5.481625556945801, "global_step": 27500, "epoch": 654} {"train_loss": -5.486133575439453, "global_step": 27501, "epoch": 654} {"train_loss": -5.500494956970215, "global_step": 27502, "epoch": 654} {"train_loss": -5.438941955566406, "global_step": 27503, "epoch": 654} {"train_loss": -5.396727561950684, "global_step": 27504, "epoch": 654} {"train_loss": -5.499922275543213, "global_step": 27505, "epoch": 654} {"train_loss": -5.493055820465088, "global_step": 27506, "epoch": 654} {"train_loss": -5.290809631347656, "global_step": 27507, "epoch": 654} {"train_loss": -5.40421199798584, "global_step": 27508, "epoch": 654} {"train_loss": -5.452339603787377, "global_step": 27509, "epoch": 654, "val_loss": 68828.4140625} {"train_loss": -5.280352592468262, "global_step": 27510, "epoch": 655} {"train_loss": -5.508056640625, "global_step": 27511, "epoch": 655} {"train_loss": -5.440727233886719, "global_step": 27512, "epoch": 655} {"train_loss": -5.268800735473633, "global_step": 27513, "epoch": 655} {"train_loss": -5.392284870147705, "global_step": 27514, "epoch": 655} {"train_loss": -5.279485702514648, "global_step": 27515, "epoch": 655} {"train_loss": -5.40278434753418, "global_step": 27516, "epoch": 655} {"train_loss": -5.365700721740723, "global_step": 27517, "epoch": 655} {"train_loss": -5.288522720336914, "global_step": 27518, "epoch": 655} {"train_loss": -5.43211555480957, "global_step": 27519, "epoch": 655} {"train_loss": -5.287419319152832, "global_step": 27520, "epoch": 655} {"train_loss": -5.395181655883789, "global_step": 27521, "epoch": 655} {"train_loss": -5.480405330657959, "global_step": 27522, "epoch": 655} {"train_loss": -5.11640739440918, "global_step": 27523, "epoch": 655} {"train_loss": -5.383939743041992, "global_step": 27524, "epoch": 655} {"train_loss": -5.261656284332275, "global_step": 27525, "epoch": 655} {"train_loss": -5.395444869995117, "global_step": 27526, "epoch": 655} {"train_loss": -5.309957027435303, "global_step": 27527, "epoch": 655} {"train_loss": -5.345298767089844, "global_step": 27528, "epoch": 655} {"train_loss": -5.271579742431641, "global_step": 27529, "epoch": 655} {"train_loss": -5.286397933959961, "global_step": 27530, "epoch": 655} {"train_loss": -5.509965419769287, "global_step": 27531, "epoch": 655} {"train_loss": -5.517841815948486, "global_step": 27532, "epoch": 655} {"train_loss": -5.5591607093811035, "global_step": 27533, "epoch": 655} {"train_loss": -5.508960723876953, "global_step": 27534, "epoch": 655} {"train_loss": -5.5916547775268555, "global_step": 27535, "epoch": 655} {"train_loss": -5.429286003112793, "global_step": 27536, "epoch": 655} {"train_loss": -5.471789360046387, "global_step": 27537, "epoch": 655} {"train_loss": -5.425684452056885, "global_step": 27538, "epoch": 655} {"train_loss": -5.325281143188477, "global_step": 27539, "epoch": 655} {"train_loss": -5.542055130004883, "global_step": 27540, "epoch": 655} {"train_loss": -5.372817039489746, "global_step": 27541, "epoch": 655} {"train_loss": -5.4221391677856445, "global_step": 27542, "epoch": 655} {"train_loss": -5.5366363525390625, "global_step": 27543, "epoch": 655} {"train_loss": -5.548605918884277, "global_step": 27544, "epoch": 655} {"train_loss": -5.426181793212891, "global_step": 27545, "epoch": 655} {"train_loss": -5.451159477233887, "global_step": 27546, "epoch": 655} {"train_loss": -5.391861438751221, "global_step": 27547, "epoch": 655} {"train_loss": -5.424069404602051, "global_step": 27548, "epoch": 655} {"train_loss": -5.40140438079834, "global_step": 27549, "epoch": 655} {"train_loss": -5.404573917388916, "global_step": 27550, "epoch": 655} {"train_loss": -5.405997923442295, "global_step": 27551, "epoch": 655, "val_loss": 67106.5625} {"train_loss": -5.368049621582031, "global_step": 27552, "epoch": 656} {"train_loss": -5.454737663269043, "global_step": 27553, "epoch": 656} {"train_loss": -5.512202739715576, "global_step": 27554, "epoch": 656} {"train_loss": -5.47269868850708, "global_step": 27555, "epoch": 656} {"train_loss": -5.437491416931152, "global_step": 27556, "epoch": 656} {"train_loss": -5.598523139953613, "global_step": 27557, "epoch": 656} {"train_loss": -5.486586570739746, "global_step": 27558, "epoch": 656} {"train_loss": -5.407094478607178, "global_step": 27559, "epoch": 656} {"train_loss": -5.42959451675415, "global_step": 27560, "epoch": 656} {"train_loss": -5.358964920043945, "global_step": 27561, "epoch": 656} {"train_loss": -5.460000991821289, "global_step": 27562, "epoch": 656} {"train_loss": -5.420805931091309, "global_step": 27563, "epoch": 656} {"train_loss": -5.436386585235596, "global_step": 27564, "epoch": 656} {"train_loss": -5.559571266174316, "global_step": 27565, "epoch": 656} {"train_loss": -5.5931477546691895, "global_step": 27566, "epoch": 656} {"train_loss": -5.5772504806518555, "global_step": 27567, "epoch": 656} {"train_loss": -5.491912841796875, "global_step": 27568, "epoch": 656} {"train_loss": -5.476820945739746, "global_step": 27569, "epoch": 656} {"train_loss": -5.373918533325195, "global_step": 27570, "epoch": 656} {"train_loss": -5.438199996948242, "global_step": 27571, "epoch": 656} {"train_loss": -5.475922584533691, "global_step": 27572, "epoch": 656} {"train_loss": -5.49884033203125, "global_step": 27573, "epoch": 656} {"train_loss": -5.39304256439209, "global_step": 27574, "epoch": 656} {"train_loss": -5.374125957489014, "global_step": 27575, "epoch": 656} {"train_loss": -5.578988075256348, "global_step": 27576, "epoch": 656} {"train_loss": -5.4621381759643555, "global_step": 27577, "epoch": 656} {"train_loss": -5.477752208709717, "global_step": 27578, "epoch": 656} {"train_loss": -5.365725994110107, "global_step": 27579, "epoch": 656} {"train_loss": -5.4982404708862305, "global_step": 27580, "epoch": 656} {"train_loss": -5.449591636657715, "global_step": 27581, "epoch": 656} {"train_loss": -5.3499579429626465, "global_step": 27582, "epoch": 656} {"train_loss": -5.350771427154541, "global_step": 27583, "epoch": 656} {"train_loss": -5.490823745727539, "global_step": 27584, "epoch": 656} {"train_loss": -5.449559688568115, "global_step": 27585, "epoch": 656} {"train_loss": -5.385142803192139, "global_step": 27586, "epoch": 656} {"train_loss": -5.397168159484863, "global_step": 27587, "epoch": 656} {"train_loss": -5.388740539550781, "global_step": 27588, "epoch": 656} {"train_loss": -5.419730186462402, "global_step": 27589, "epoch": 656} {"train_loss": -5.542584419250488, "global_step": 27590, "epoch": 656} {"train_loss": -5.433640956878662, "global_step": 27591, "epoch": 656} {"train_loss": -5.436398506164551, "global_step": 27592, "epoch": 656} {"train_loss": -5.45439388638451, "global_step": 27593, "epoch": 656, "val_loss": 67727.28125} {"train_loss": -5.486968040466309, "global_step": 27594, "epoch": 657} {"train_loss": -5.479950904846191, "global_step": 27595, "epoch": 657} {"train_loss": -5.354635238647461, "global_step": 27596, "epoch": 657} {"train_loss": -5.438108444213867, "global_step": 27597, "epoch": 657} {"train_loss": -5.470263481140137, "global_step": 27598, "epoch": 657} {"train_loss": -5.491485595703125, "global_step": 27599, "epoch": 657} {"train_loss": -5.450780391693115, "global_step": 27600, "epoch": 657} {"train_loss": -5.545427322387695, "global_step": 27601, "epoch": 657} {"train_loss": -5.319639205932617, "global_step": 27602, "epoch": 657} {"train_loss": -5.428403377532959, "global_step": 27603, "epoch": 657} {"train_loss": -5.363699436187744, "global_step": 27604, "epoch": 657} {"train_loss": -5.3501811027526855, "global_step": 27605, "epoch": 657} {"train_loss": -5.532114028930664, "global_step": 27606, "epoch": 657} {"train_loss": -5.516017436981201, "global_step": 27607, "epoch": 657} {"train_loss": -5.404339790344238, "global_step": 27608, "epoch": 657} {"train_loss": -5.429812908172607, "global_step": 27609, "epoch": 657} {"train_loss": -5.583730697631836, "global_step": 27610, "epoch": 657} {"train_loss": -5.402956008911133, "global_step": 27611, "epoch": 657} {"train_loss": -5.472440242767334, "global_step": 27612, "epoch": 657} {"train_loss": -5.468990325927734, "global_step": 27613, "epoch": 657} {"train_loss": -5.492743492126465, "global_step": 27614, "epoch": 657} {"train_loss": -5.3638811111450195, "global_step": 27615, "epoch": 657} {"train_loss": -5.569509506225586, "global_step": 27616, "epoch": 657} {"train_loss": -5.451866626739502, "global_step": 27617, "epoch": 657} {"train_loss": -5.276792526245117, "global_step": 27618, "epoch": 657} {"train_loss": -5.411481857299805, "global_step": 27619, "epoch": 657} {"train_loss": -5.375183582305908, "global_step": 27620, "epoch": 657} {"train_loss": -5.588545322418213, "global_step": 27621, "epoch": 657} {"train_loss": -5.470953941345215, "global_step": 27622, "epoch": 657} {"train_loss": -5.324013710021973, "global_step": 27623, "epoch": 657} {"train_loss": -5.362278461456299, "global_step": 27624, "epoch": 657} {"train_loss": -5.2476701736450195, "global_step": 27625, "epoch": 657} {"train_loss": -5.39090633392334, "global_step": 27626, "epoch": 657} {"train_loss": -5.502764701843262, "global_step": 27627, "epoch": 657} {"train_loss": -5.333414554595947, "global_step": 27628, "epoch": 657} {"train_loss": -5.539819717407227, "global_step": 27629, "epoch": 657} {"train_loss": -5.377974510192871, "global_step": 27630, "epoch": 657} {"train_loss": -5.549853324890137, "global_step": 27631, "epoch": 657} {"train_loss": -5.423759460449219, "global_step": 27632, "epoch": 657} {"train_loss": -5.536970138549805, "global_step": 27633, "epoch": 657} {"train_loss": -5.341640472412109, "global_step": 27634, "epoch": 657} {"train_loss": -5.437047379357474, "global_step": 27635, "epoch": 657, "val_loss": 67642.2421875} {"train_loss": -5.641862869262695, "global_step": 27636, "epoch": 658} {"train_loss": -5.332596778869629, "global_step": 27637, "epoch": 658} {"train_loss": -5.386771202087402, "global_step": 27638, "epoch": 658} {"train_loss": -5.382841110229492, "global_step": 27639, "epoch": 658} {"train_loss": -5.419536590576172, "global_step": 27640, "epoch": 658} {"train_loss": -5.452846527099609, "global_step": 27641, "epoch": 658} {"train_loss": -5.491815567016602, "global_step": 27642, "epoch": 658} {"train_loss": -5.431726455688477, "global_step": 27643, "epoch": 658} {"train_loss": -5.338689804077148, "global_step": 27644, "epoch": 658} {"train_loss": -5.487283229827881, "global_step": 27645, "epoch": 658} {"train_loss": -5.365840911865234, "global_step": 27646, "epoch": 658} {"train_loss": -5.454402446746826, "global_step": 27647, "epoch": 658} {"train_loss": -5.418250560760498, "global_step": 27648, "epoch": 658} {"train_loss": -5.477051258087158, "global_step": 27649, "epoch": 658} {"train_loss": -5.401332855224609, "global_step": 27650, "epoch": 658} {"train_loss": -5.405045509338379, "global_step": 27651, "epoch": 658} {"train_loss": -5.424571990966797, "global_step": 27652, "epoch": 658} {"train_loss": -5.378500938415527, "global_step": 27653, "epoch": 658} {"train_loss": -5.458776473999023, "global_step": 27654, "epoch": 658} {"train_loss": -5.475348472595215, "global_step": 27655, "epoch": 658} {"train_loss": -5.445042133331299, "global_step": 27656, "epoch": 658} {"train_loss": -5.3287553787231445, "global_step": 27657, "epoch": 658} {"train_loss": -5.361855506896973, "global_step": 27658, "epoch": 658} {"train_loss": -5.575261116027832, "global_step": 27659, "epoch": 658} {"train_loss": -5.407060623168945, "global_step": 27660, "epoch": 658} {"train_loss": -5.520748138427734, "global_step": 27661, "epoch": 658} {"train_loss": -5.478737831115723, "global_step": 27662, "epoch": 658} {"train_loss": -5.421989440917969, "global_step": 27663, "epoch": 658} {"train_loss": -5.596462249755859, "global_step": 27664, "epoch": 658} {"train_loss": -5.4495673179626465, "global_step": 27665, "epoch": 658} {"train_loss": -5.614559173583984, "global_step": 27666, "epoch": 658} {"train_loss": -5.336764335632324, "global_step": 27667, "epoch": 658} {"train_loss": -5.479826927185059, "global_step": 27668, "epoch": 658} {"train_loss": -5.46589469909668, "global_step": 27669, "epoch": 658} {"train_loss": -5.5792694091796875, "global_step": 27670, "epoch": 658} {"train_loss": -5.420257568359375, "global_step": 27671, "epoch": 658} {"train_loss": -5.39841365814209, "global_step": 27672, "epoch": 658} {"train_loss": -5.508963108062744, "global_step": 27673, "epoch": 658} {"train_loss": -5.4539289474487305, "global_step": 27674, "epoch": 658} {"train_loss": -5.484915733337402, "global_step": 27675, "epoch": 658} {"train_loss": -5.413817405700684, "global_step": 27676, "epoch": 658} {"train_loss": -5.453410716283889, "global_step": 27677, "epoch": 658, "val_loss": 67544.8203125} {"train_loss": -5.449275970458984, "global_step": 27678, "epoch": 659} {"train_loss": -5.471675872802734, "global_step": 27679, "epoch": 659} {"train_loss": -5.544186115264893, "global_step": 27680, "epoch": 659} {"train_loss": -5.483482360839844, "global_step": 27681, "epoch": 659} {"train_loss": -5.5967116355896, "global_step": 27682, "epoch": 659} {"train_loss": -5.378964900970459, "global_step": 27683, "epoch": 659} {"train_loss": -5.533021926879883, "global_step": 27684, "epoch": 659} {"train_loss": -5.576074600219727, "global_step": 27685, "epoch": 659} {"train_loss": -5.466114521026611, "global_step": 27686, "epoch": 659} {"train_loss": -5.425119400024414, "global_step": 27687, "epoch": 659} {"train_loss": -5.469369888305664, "global_step": 27688, "epoch": 659} {"train_loss": -5.505349159240723, "global_step": 27689, "epoch": 659} {"train_loss": -5.443689346313477, "global_step": 27690, "epoch": 659} {"train_loss": -5.363864898681641, "global_step": 27691, "epoch": 659} {"train_loss": -5.53753137588501, "global_step": 27692, "epoch": 659} {"train_loss": -5.441020965576172, "global_step": 27693, "epoch": 659} {"train_loss": -5.381356239318848, "global_step": 27694, "epoch": 659} {"train_loss": -5.369492530822754, "global_step": 27695, "epoch": 659} {"train_loss": -5.513582229614258, "global_step": 27696, "epoch": 659} {"train_loss": -5.342137336730957, "global_step": 27697, "epoch": 659} {"train_loss": -5.417649745941162, "global_step": 27698, "epoch": 659} {"train_loss": -5.5071492195129395, "global_step": 27699, "epoch": 659} {"train_loss": -5.459113121032715, "global_step": 27700, "epoch": 659} {"train_loss": -5.30514669418335, "global_step": 27701, "epoch": 659} {"train_loss": -5.45841121673584, "global_step": 27702, "epoch": 659} {"train_loss": -5.563534736633301, "global_step": 27703, "epoch": 659} {"train_loss": -5.5421833992004395, "global_step": 27704, "epoch": 659} {"train_loss": -5.310866355895996, "global_step": 27705, "epoch": 659} {"train_loss": -5.383357048034668, "global_step": 27706, "epoch": 659} {"train_loss": -5.525976181030273, "global_step": 27707, "epoch": 659} {"train_loss": -5.3254899978637695, "global_step": 27708, "epoch": 659} {"train_loss": -5.602323532104492, "global_step": 27709, "epoch": 659} {"train_loss": -5.4530181884765625, "global_step": 27710, "epoch": 659} {"train_loss": -5.453968048095703, "global_step": 27711, "epoch": 659} {"train_loss": -5.442747116088867, "global_step": 27712, "epoch": 659} {"train_loss": -5.460655212402344, "global_step": 27713, "epoch": 659} {"train_loss": -5.440338134765625, "global_step": 27714, "epoch": 659} {"train_loss": -5.485474586486816, "global_step": 27715, "epoch": 659} {"train_loss": -5.462869167327881, "global_step": 27716, "epoch": 659} {"train_loss": -5.434681415557861, "global_step": 27717, "epoch": 659} {"train_loss": -5.466525554656982, "global_step": 27718, "epoch": 659} {"train_loss": -5.456555763880412, "global_step": 27719, "epoch": 659, "val_loss": 67570.7421875} {"train_loss": -5.415337562561035, "global_step": 27720, "epoch": 660} {"train_loss": -5.447940826416016, "global_step": 27721, "epoch": 660} {"train_loss": -5.393679618835449, "global_step": 27722, "epoch": 660} {"train_loss": -5.514528751373291, "global_step": 27723, "epoch": 660} {"train_loss": -5.36086893081665, "global_step": 27724, "epoch": 660} {"train_loss": -5.495131492614746, "global_step": 27725, "epoch": 660} {"train_loss": -5.538689136505127, "global_step": 27726, "epoch": 660} {"train_loss": -5.408504486083984, "global_step": 27727, "epoch": 660} {"train_loss": -5.566158294677734, "global_step": 27728, "epoch": 660} {"train_loss": -5.532550811767578, "global_step": 27729, "epoch": 660} {"train_loss": -5.353268623352051, "global_step": 27730, "epoch": 660} {"train_loss": -5.496055603027344, "global_step": 27731, "epoch": 660} {"train_loss": -5.453789234161377, "global_step": 27732, "epoch": 660} {"train_loss": -5.2296223640441895, "global_step": 27733, "epoch": 660} {"train_loss": -5.439605712890625, "global_step": 27734, "epoch": 660} {"train_loss": -5.434493064880371, "global_step": 27735, "epoch": 660} {"train_loss": -5.4728193283081055, "global_step": 27736, "epoch": 660} {"train_loss": -5.399043083190918, "global_step": 27737, "epoch": 660} {"train_loss": -5.522066116333008, "global_step": 27738, "epoch": 660} {"train_loss": -5.401564121246338, "global_step": 27739, "epoch": 660} {"train_loss": -5.4061126708984375, "global_step": 27740, "epoch": 660} {"train_loss": -5.500103950500488, "global_step": 27741, "epoch": 660} {"train_loss": -5.409196853637695, "global_step": 27742, "epoch": 660} {"train_loss": -5.413210868835449, "global_step": 27743, "epoch": 660} {"train_loss": -5.430660247802734, "global_step": 27744, "epoch": 660} {"train_loss": -5.415256500244141, "global_step": 27745, "epoch": 660} {"train_loss": -5.545283317565918, "global_step": 27746, "epoch": 660} {"train_loss": -5.463864326477051, "global_step": 27747, "epoch": 660} {"train_loss": -5.409102916717529, "global_step": 27748, "epoch": 660} {"train_loss": -5.357086181640625, "global_step": 27749, "epoch": 660} {"train_loss": -5.60122537612915, "global_step": 27750, "epoch": 660} {"train_loss": -5.437875270843506, "global_step": 27751, "epoch": 660} {"train_loss": -5.60513973236084, "global_step": 27752, "epoch": 660} {"train_loss": -5.448624610900879, "global_step": 27753, "epoch": 660} {"train_loss": -5.356001377105713, "global_step": 27754, "epoch": 660} {"train_loss": -5.58721399307251, "global_step": 27755, "epoch": 660} {"train_loss": -5.46608829498291, "global_step": 27756, "epoch": 660} {"train_loss": -5.592432975769043, "global_step": 27757, "epoch": 660} {"train_loss": -5.381783485412598, "global_step": 27758, "epoch": 660} {"train_loss": -5.501312732696533, "global_step": 27759, "epoch": 660} {"train_loss": -5.486602783203125, "global_step": 27760, "epoch": 660} {"train_loss": -5.454145908355713, "global_step": 27761, "epoch": 660, "val_loss": 67331.6875} {"train_loss": -5.480935096740723, "global_step": 27762, "epoch": 661} {"train_loss": -5.5297932624816895, "global_step": 27763, "epoch": 661} {"train_loss": -5.447428226470947, "global_step": 27764, "epoch": 661} {"train_loss": -5.396319389343262, "global_step": 27765, "epoch": 661} {"train_loss": -5.43367862701416, "global_step": 27766, "epoch": 661} {"train_loss": -5.28796911239624, "global_step": 27767, "epoch": 661} {"train_loss": -5.493376731872559, "global_step": 27768, "epoch": 661} {"train_loss": -5.411614418029785, "global_step": 27769, "epoch": 661} {"train_loss": -5.513957500457764, "global_step": 27770, "epoch": 661} {"train_loss": -5.328150272369385, "global_step": 27771, "epoch": 661} {"train_loss": -5.411118507385254, "global_step": 27772, "epoch": 661} {"train_loss": -5.52026891708374, "global_step": 27773, "epoch": 661} {"train_loss": -5.327707290649414, "global_step": 27774, "epoch": 661} {"train_loss": -5.474879264831543, "global_step": 27775, "epoch": 661} {"train_loss": -5.407336235046387, "global_step": 27776, "epoch": 661} {"train_loss": -5.431387901306152, "global_step": 27777, "epoch": 661} {"train_loss": -5.486721992492676, "global_step": 27778, "epoch": 661} {"train_loss": -5.285770416259766, "global_step": 27779, "epoch": 661} {"train_loss": -5.567417144775391, "global_step": 27780, "epoch": 661} {"train_loss": -5.355607509613037, "global_step": 27781, "epoch": 661} {"train_loss": -5.398041725158691, "global_step": 27782, "epoch": 661} {"train_loss": -5.408086776733398, "global_step": 27783, "epoch": 661} {"train_loss": -5.221784591674805, "global_step": 27784, "epoch": 661} {"train_loss": -5.373314380645752, "global_step": 27785, "epoch": 661} {"train_loss": -5.449223518371582, "global_step": 27786, "epoch": 661} {"train_loss": -5.462591171264648, "global_step": 27787, "epoch": 661} {"train_loss": -5.460803985595703, "global_step": 27788, "epoch": 661} {"train_loss": -5.5347065925598145, "global_step": 27789, "epoch": 661} {"train_loss": -5.321999549865723, "global_step": 27790, "epoch": 661} {"train_loss": -5.428053855895996, "global_step": 27791, "epoch": 661} {"train_loss": -5.303464412689209, "global_step": 27792, "epoch": 661} {"train_loss": -5.380965232849121, "global_step": 27793, "epoch": 661} {"train_loss": -5.553254127502441, "global_step": 27794, "epoch": 661} {"train_loss": -5.4606781005859375, "global_step": 27795, "epoch": 661} {"train_loss": -5.420102596282959, "global_step": 27796, "epoch": 661} {"train_loss": -5.415449142456055, "global_step": 27797, "epoch": 661} {"train_loss": -5.641610145568848, "global_step": 27798, "epoch": 661} {"train_loss": -5.578805923461914, "global_step": 27799, "epoch": 661} {"train_loss": -5.324623107910156, "global_step": 27800, "epoch": 661} {"train_loss": -5.4658098220825195, "global_step": 27801, "epoch": 661} {"train_loss": -5.318663597106934, "global_step": 27802, "epoch": 661} {"train_loss": -5.425136702401297, "global_step": 27803, "epoch": 661, "val_loss": 67410.8359375} {"train_loss": -5.4960103034973145, "global_step": 27804, "epoch": 662} {"train_loss": -5.390947341918945, "global_step": 27805, "epoch": 662} {"train_loss": -5.367551326751709, "global_step": 27806, "epoch": 662} {"train_loss": -5.49826192855835, "global_step": 27807, "epoch": 662} {"train_loss": -5.318041801452637, "global_step": 27808, "epoch": 662} {"train_loss": -5.5305914878845215, "global_step": 27809, "epoch": 662} {"train_loss": -5.354836463928223, "global_step": 27810, "epoch": 662} {"train_loss": -5.422098636627197, "global_step": 27811, "epoch": 662} {"train_loss": -5.530683517456055, "global_step": 27812, "epoch": 662} {"train_loss": -5.488165855407715, "global_step": 27813, "epoch": 662} {"train_loss": -5.4399824142456055, "global_step": 27814, "epoch": 662} {"train_loss": -5.396422863006592, "global_step": 27815, "epoch": 662} {"train_loss": -5.4683966636657715, "global_step": 27816, "epoch": 662} {"train_loss": -5.528393745422363, "global_step": 27817, "epoch": 662} {"train_loss": -5.379750728607178, "global_step": 27818, "epoch": 662} {"train_loss": -5.372712135314941, "global_step": 27819, "epoch": 662} {"train_loss": -5.46916389465332, "global_step": 27820, "epoch": 662} {"train_loss": -5.4579901695251465, "global_step": 27821, "epoch": 662} {"train_loss": -5.394568920135498, "global_step": 27822, "epoch": 662} {"train_loss": -5.413066864013672, "global_step": 27823, "epoch": 662} {"train_loss": -5.445920944213867, "global_step": 27824, "epoch": 662} {"train_loss": -5.307093143463135, "global_step": 27825, "epoch": 662} {"train_loss": -5.483759880065918, "global_step": 27826, "epoch": 662} {"train_loss": -5.403715133666992, "global_step": 27827, "epoch": 662} {"train_loss": -5.409060955047607, "global_step": 27828, "epoch": 662} {"train_loss": -5.41148567199707, "global_step": 27829, "epoch": 662} {"train_loss": -5.1446027755737305, "global_step": 27830, "epoch": 662} {"train_loss": -5.307625770568848, "global_step": 27831, "epoch": 662} {"train_loss": -5.259291648864746, "global_step": 27832, "epoch": 662} {"train_loss": -5.276553630828857, "global_step": 27833, "epoch": 662} {"train_loss": -5.5155229568481445, "global_step": 27834, "epoch": 662} {"train_loss": -5.301761150360107, "global_step": 27835, "epoch": 662} {"train_loss": -5.323938846588135, "global_step": 27836, "epoch": 662} {"train_loss": -5.373499870300293, "global_step": 27837, "epoch": 662} {"train_loss": -5.460375785827637, "global_step": 27838, "epoch": 662} {"train_loss": -5.529720306396484, "global_step": 27839, "epoch": 662} {"train_loss": -5.391690731048584, "global_step": 27840, "epoch": 662} {"train_loss": -5.528017520904541, "global_step": 27841, "epoch": 662} {"train_loss": -5.289222717285156, "global_step": 27842, "epoch": 662} {"train_loss": -5.413684844970703, "global_step": 27843, "epoch": 662} {"train_loss": -5.425317764282227, "global_step": 27844, "epoch": 662} {"train_loss": -5.4095323994046165, "global_step": 27845, "epoch": 662, "val_loss": 67426.6953125} {"train_loss": -5.502528190612793, "global_step": 27846, "epoch": 663} {"train_loss": -5.407393932342529, "global_step": 27847, "epoch": 663} {"train_loss": -5.421401023864746, "global_step": 27848, "epoch": 663} {"train_loss": -5.405896186828613, "global_step": 27849, "epoch": 663} {"train_loss": -5.363507270812988, "global_step": 27850, "epoch": 663} {"train_loss": -5.24008321762085, "global_step": 27851, "epoch": 663} {"train_loss": -5.445364952087402, "global_step": 27852, "epoch": 663} {"train_loss": -5.329916954040527, "global_step": 27853, "epoch": 663} {"train_loss": -5.3073883056640625, "global_step": 27854, "epoch": 663} {"train_loss": -5.444323539733887, "global_step": 27855, "epoch": 663} {"train_loss": -5.284863471984863, "global_step": 27856, "epoch": 663} {"train_loss": -5.490827560424805, "global_step": 27857, "epoch": 663} {"train_loss": -5.484966278076172, "global_step": 27858, "epoch": 663} {"train_loss": -5.481025695800781, "global_step": 27859, "epoch": 663} {"train_loss": -5.474360466003418, "global_step": 27860, "epoch": 663} {"train_loss": -5.303316116333008, "global_step": 27861, "epoch": 663} {"train_loss": -5.396846771240234, "global_step": 27862, "epoch": 663} {"train_loss": -5.470863342285156, "global_step": 27863, "epoch": 663} {"train_loss": -5.325223922729492, "global_step": 27864, "epoch": 663} {"train_loss": -5.551265239715576, "global_step": 27865, "epoch": 663} {"train_loss": -5.489938735961914, "global_step": 27866, "epoch": 663} {"train_loss": -5.43239688873291, "global_step": 27867, "epoch": 663} {"train_loss": -5.610658645629883, "global_step": 27868, "epoch": 663} {"train_loss": -5.374678611755371, "global_step": 27869, "epoch": 663} {"train_loss": -5.4694085121154785, "global_step": 27870, "epoch": 663} {"train_loss": -5.431812763214111, "global_step": 27871, "epoch": 663} {"train_loss": -5.342012405395508, "global_step": 27872, "epoch": 663} {"train_loss": -5.412404537200928, "global_step": 27873, "epoch": 663} {"train_loss": -5.451979637145996, "global_step": 27874, "epoch": 663} {"train_loss": -5.591376304626465, "global_step": 27875, "epoch": 663} {"train_loss": -5.5714545249938965, "global_step": 27876, "epoch": 663} {"train_loss": -5.566895008087158, "global_step": 27877, "epoch": 663} {"train_loss": -5.50340461730957, "global_step": 27878, "epoch": 663} {"train_loss": -5.503267765045166, "global_step": 27879, "epoch": 663} {"train_loss": -5.35609245300293, "global_step": 27880, "epoch": 663} {"train_loss": -5.496063709259033, "global_step": 27881, "epoch": 663} {"train_loss": -5.562237739562988, "global_step": 27882, "epoch": 663} {"train_loss": -5.39894962310791, "global_step": 27883, "epoch": 663} {"train_loss": -5.452016830444336, "global_step": 27884, "epoch": 663} {"train_loss": -5.452029228210449, "global_step": 27885, "epoch": 663} {"train_loss": -5.4008283615112305, "global_step": 27886, "epoch": 663} {"train_loss": -5.440345071610951, "global_step": 27887, "epoch": 663, "val_loss": 67588.53125} {"train_loss": -5.403810501098633, "global_step": 27888, "epoch": 664} {"train_loss": -5.339601516723633, "global_step": 27889, "epoch": 664} {"train_loss": -5.497387886047363, "global_step": 27890, "epoch": 664} {"train_loss": -5.369232177734375, "global_step": 27891, "epoch": 664} {"train_loss": -5.247611045837402, "global_step": 27892, "epoch": 664} {"train_loss": -5.501858711242676, "global_step": 27893, "epoch": 664} {"train_loss": -5.218013763427734, "global_step": 27894, "epoch": 664} {"train_loss": -5.335433006286621, "global_step": 27895, "epoch": 664} {"train_loss": -5.3077287673950195, "global_step": 27896, "epoch": 664} {"train_loss": -5.343417644500732, "global_step": 27897, "epoch": 664} {"train_loss": -5.419717788696289, "global_step": 27898, "epoch": 664} {"train_loss": -5.405294895172119, "global_step": 27899, "epoch": 664} {"train_loss": -5.492405891418457, "global_step": 27900, "epoch": 664} {"train_loss": -5.560280799865723, "global_step": 27901, "epoch": 664} {"train_loss": -5.303744316101074, "global_step": 27902, "epoch": 664} {"train_loss": -5.466591835021973, "global_step": 27903, "epoch": 664} {"train_loss": -5.4527997970581055, "global_step": 27904, "epoch": 664} {"train_loss": -5.364334583282471, "global_step": 27905, "epoch": 664} {"train_loss": -5.484063148498535, "global_step": 27906, "epoch": 664} {"train_loss": -5.428427219390869, "global_step": 27907, "epoch": 664} {"train_loss": -5.531721115112305, "global_step": 27908, "epoch": 664} {"train_loss": -5.249172687530518, "global_step": 27909, "epoch": 664} {"train_loss": -5.445804119110107, "global_step": 27910, "epoch": 664} {"train_loss": -5.472115516662598, "global_step": 27911, "epoch": 664} {"train_loss": -5.337629318237305, "global_step": 27912, "epoch": 664} {"train_loss": -5.353959083557129, "global_step": 27913, "epoch": 664} {"train_loss": -5.48232364654541, "global_step": 27914, "epoch": 664} {"train_loss": -5.531593322753906, "global_step": 27915, "epoch": 664} {"train_loss": -5.493112564086914, "global_step": 27916, "epoch": 664} {"train_loss": -5.302685737609863, "global_step": 27917, "epoch": 664} {"train_loss": -5.54014778137207, "global_step": 27918, "epoch": 664} {"train_loss": -5.355437278747559, "global_step": 27919, "epoch": 664} {"train_loss": -5.421487331390381, "global_step": 27920, "epoch": 664} {"train_loss": -5.498603820800781, "global_step": 27921, "epoch": 664} {"train_loss": -5.448625564575195, "global_step": 27922, "epoch": 664} {"train_loss": -5.448785781860352, "global_step": 27923, "epoch": 664} {"train_loss": -5.392151832580566, "global_step": 27924, "epoch": 664} {"train_loss": -5.495600700378418, "global_step": 27925, "epoch": 664} {"train_loss": -5.419827938079834, "global_step": 27926, "epoch": 664} {"train_loss": -5.542126655578613, "global_step": 27927, "epoch": 664} {"train_loss": -5.700937271118164, "global_step": 27928, "epoch": 664} {"train_loss": -5.426301672345116, "global_step": 27929, "epoch": 664, "val_loss": 67142.8046875} {"train_loss": -5.415848731994629, "global_step": 27930, "epoch": 665} {"train_loss": -5.564139366149902, "global_step": 27931, "epoch": 665} {"train_loss": -5.544335842132568, "global_step": 27932, "epoch": 665} {"train_loss": -5.529218673706055, "global_step": 27933, "epoch": 665} {"train_loss": -5.426008701324463, "global_step": 27934, "epoch": 665} {"train_loss": -5.351640224456787, "global_step": 27935, "epoch": 665} {"train_loss": -5.347884654998779, "global_step": 27936, "epoch": 665} {"train_loss": -5.394413948059082, "global_step": 27937, "epoch": 665} {"train_loss": -5.469694137573242, "global_step": 27938, "epoch": 665} {"train_loss": -5.3968000411987305, "global_step": 27939, "epoch": 665} {"train_loss": -5.419072151184082, "global_step": 27940, "epoch": 665} {"train_loss": -5.296436309814453, "global_step": 27941, "epoch": 665} {"train_loss": -5.494100570678711, "global_step": 27942, "epoch": 665} {"train_loss": -5.304850101470947, "global_step": 27943, "epoch": 665} {"train_loss": -5.373959541320801, "global_step": 27944, "epoch": 665} {"train_loss": -5.458115100860596, "global_step": 27945, "epoch": 665} {"train_loss": -5.432075500488281, "global_step": 27946, "epoch": 665} {"train_loss": -5.490352630615234, "global_step": 27947, "epoch": 665} {"train_loss": -5.3645806312561035, "global_step": 27948, "epoch": 665} {"train_loss": -5.4516472816467285, "global_step": 27949, "epoch": 665} {"train_loss": -5.445645809173584, "global_step": 27950, "epoch": 665} {"train_loss": -5.307710647583008, "global_step": 27951, "epoch": 665} {"train_loss": -5.371982097625732, "global_step": 27952, "epoch": 665} {"train_loss": -5.426938056945801, "global_step": 27953, "epoch": 665} {"train_loss": -5.39543342590332, "global_step": 27954, "epoch": 665} {"train_loss": -5.438282012939453, "global_step": 27955, "epoch": 665} {"train_loss": -5.38370418548584, "global_step": 27956, "epoch": 665} {"train_loss": -5.544272422790527, "global_step": 27957, "epoch": 665} {"train_loss": -5.31357479095459, "global_step": 27958, "epoch": 665} {"train_loss": -5.481950283050537, "global_step": 27959, "epoch": 665} {"train_loss": -5.551281452178955, "global_step": 27960, "epoch": 665} {"train_loss": -5.5606842041015625, "global_step": 27961, "epoch": 665} {"train_loss": -5.453658580780029, "global_step": 27962, "epoch": 665} {"train_loss": -5.4341139793396, "global_step": 27963, "epoch": 665} {"train_loss": -5.462467193603516, "global_step": 27964, "epoch": 665} {"train_loss": -5.422754764556885, "global_step": 27965, "epoch": 665} {"train_loss": -5.492353916168213, "global_step": 27966, "epoch": 665} {"train_loss": -5.59654426574707, "global_step": 27967, "epoch": 665} {"train_loss": -5.372438430786133, "global_step": 27968, "epoch": 665} {"train_loss": -5.577749729156494, "global_step": 27969, "epoch": 665} {"train_loss": -5.464989185333252, "global_step": 27970, "epoch": 665} {"train_loss": -5.439722526641119, "global_step": 27971, "epoch": 665, "val_loss": 67217.1640625} {"train_loss": -5.56392765045166, "global_step": 27972, "epoch": 666} {"train_loss": -5.6365461349487305, "global_step": 27973, "epoch": 666} {"train_loss": -5.557511329650879, "global_step": 27974, "epoch": 666} {"train_loss": -5.418807029724121, "global_step": 27975, "epoch": 666} {"train_loss": -5.446815490722656, "global_step": 27976, "epoch": 666} {"train_loss": -5.495489120483398, "global_step": 27977, "epoch": 666} {"train_loss": -5.508526802062988, "global_step": 27978, "epoch": 666} {"train_loss": -5.36348819732666, "global_step": 27979, "epoch": 666} {"train_loss": -5.466253757476807, "global_step": 27980, "epoch": 666} {"train_loss": -5.348499774932861, "global_step": 27981, "epoch": 666} {"train_loss": -5.275851726531982, "global_step": 27982, "epoch": 666} {"train_loss": -5.455041408538818, "global_step": 27983, "epoch": 666} {"train_loss": -5.453436851501465, "global_step": 27984, "epoch": 666} {"train_loss": -5.361908912658691, "global_step": 27985, "epoch": 666} {"train_loss": -5.466722011566162, "global_step": 27986, "epoch": 666} {"train_loss": -5.45159912109375, "global_step": 27987, "epoch": 666} {"train_loss": -5.510952949523926, "global_step": 27988, "epoch": 666} {"train_loss": -5.490930557250977, "global_step": 27989, "epoch": 666} {"train_loss": -5.346334457397461, "global_step": 27990, "epoch": 666} {"train_loss": -5.447266578674316, "global_step": 27991, "epoch": 666} {"train_loss": -5.407994270324707, "global_step": 27992, "epoch": 666} {"train_loss": -5.538640022277832, "global_step": 27993, "epoch": 666} {"train_loss": -5.438628196716309, "global_step": 27994, "epoch": 666} {"train_loss": -5.35983943939209, "global_step": 27995, "epoch": 666} {"train_loss": -5.482860565185547, "global_step": 27996, "epoch": 666} {"train_loss": -5.5120344161987305, "global_step": 27997, "epoch": 666} {"train_loss": -5.5005645751953125, "global_step": 27998, "epoch": 666} {"train_loss": -5.337935924530029, "global_step": 27999, "epoch": 666} {"train_loss": -5.405411720275879, "global_step": 28000, "epoch": 666} {"train_loss": -5.475158214569092, "global_step": 28001, "epoch": 666} {"train_loss": -5.467297554016113, "global_step": 28002, "epoch": 666} {"train_loss": -5.526142120361328, "global_step": 28003, "epoch": 666} {"train_loss": -5.5563740730285645, "global_step": 28004, "epoch": 666} {"train_loss": -5.341691970825195, "global_step": 28005, "epoch": 666} {"train_loss": -5.46274471282959, "global_step": 28006, "epoch": 666} {"train_loss": -5.491377353668213, "global_step": 28007, "epoch": 666} {"train_loss": -5.4605712890625, "global_step": 28008, "epoch": 666} {"train_loss": -5.4585041999816895, "global_step": 28009, "epoch": 666} {"train_loss": -5.489134788513184, "global_step": 28010, "epoch": 666} {"train_loss": -5.537195205688477, "global_step": 28011, "epoch": 666} {"train_loss": -5.502218723297119, "global_step": 28012, "epoch": 666} {"train_loss": -5.456587904975528, "global_step": 28013, "epoch": 666, "val_loss": 67351.8203125} {"train_loss": -5.555342674255371, "global_step": 28014, "epoch": 667} {"train_loss": -5.337612628936768, "global_step": 28015, "epoch": 667} {"train_loss": -5.496767997741699, "global_step": 28016, "epoch": 667} {"train_loss": -5.604910850524902, "global_step": 28017, "epoch": 667} {"train_loss": -5.413361549377441, "global_step": 28018, "epoch": 667} {"train_loss": -5.461946487426758, "global_step": 28019, "epoch": 667} {"train_loss": -5.501760005950928, "global_step": 28020, "epoch": 667} {"train_loss": -5.463399887084961, "global_step": 28021, "epoch": 667} {"train_loss": -5.434556007385254, "global_step": 28022, "epoch": 667} {"train_loss": -5.529444217681885, "global_step": 28023, "epoch": 667} {"train_loss": -5.581789970397949, "global_step": 28024, "epoch": 667} {"train_loss": -5.483129978179932, "global_step": 28025, "epoch": 667} {"train_loss": -5.510270118713379, "global_step": 28026, "epoch": 667} {"train_loss": -5.4867753982543945, "global_step": 28027, "epoch": 667} {"train_loss": -5.540301322937012, "global_step": 28028, "epoch": 667} {"train_loss": -5.5977582931518555, "global_step": 28029, "epoch": 667} {"train_loss": -5.501636981964111, "global_step": 28030, "epoch": 667} {"train_loss": -5.395285606384277, "global_step": 28031, "epoch": 667} {"train_loss": -5.625886917114258, "global_step": 28032, "epoch": 667} {"train_loss": -5.251405715942383, "global_step": 28033, "epoch": 667} {"train_loss": -5.350603103637695, "global_step": 28034, "epoch": 667} {"train_loss": -5.549775123596191, "global_step": 28035, "epoch": 667} {"train_loss": -5.31660270690918, "global_step": 28036, "epoch": 667} {"train_loss": -5.496674537658691, "global_step": 28037, "epoch": 667} {"train_loss": -5.388854503631592, "global_step": 28038, "epoch": 667} {"train_loss": -5.550361633300781, "global_step": 28039, "epoch": 667} {"train_loss": -5.618594169616699, "global_step": 28040, "epoch": 667} {"train_loss": -5.441606521606445, "global_step": 28041, "epoch": 667} {"train_loss": -5.424290657043457, "global_step": 28042, "epoch": 667} {"train_loss": -5.436961650848389, "global_step": 28043, "epoch": 667} {"train_loss": -5.4858503341674805, "global_step": 28044, "epoch": 667} {"train_loss": -5.478215217590332, "global_step": 28045, "epoch": 667} {"train_loss": -5.451693534851074, "global_step": 28046, "epoch": 667} {"train_loss": -5.483325004577637, "global_step": 28047, "epoch": 667} {"train_loss": -5.430089473724365, "global_step": 28048, "epoch": 667} {"train_loss": -5.654388904571533, "global_step": 28049, "epoch": 667} {"train_loss": -5.502407073974609, "global_step": 28050, "epoch": 667} {"train_loss": -5.337038040161133, "global_step": 28051, "epoch": 667} {"train_loss": -5.3945159912109375, "global_step": 28052, "epoch": 667} {"train_loss": -5.510599136352539, "global_step": 28053, "epoch": 667} {"train_loss": -5.3931498527526855, "global_step": 28054, "epoch": 667} {"train_loss": -5.471831412542434, "global_step": 28055, "epoch": 667, "val_loss": 67444.2890625} {"train_loss": -5.5790205001831055, "global_step": 28056, "epoch": 668} {"train_loss": -5.500336647033691, "global_step": 28057, "epoch": 668} {"train_loss": -5.374521732330322, "global_step": 28058, "epoch": 668} {"train_loss": -5.399450302124023, "global_step": 28059, "epoch": 668} {"train_loss": -5.444981098175049, "global_step": 28060, "epoch": 668} {"train_loss": -5.368014812469482, "global_step": 28061, "epoch": 668} {"train_loss": -5.533991813659668, "global_step": 28062, "epoch": 668} {"train_loss": -5.454002380371094, "global_step": 28063, "epoch": 668} {"train_loss": -5.308344841003418, "global_step": 28064, "epoch": 668} {"train_loss": -5.559844017028809, "global_step": 28065, "epoch": 668} {"train_loss": -5.346541404724121, "global_step": 28066, "epoch": 668} {"train_loss": -5.543881416320801, "global_step": 28067, "epoch": 668} {"train_loss": -5.473361968994141, "global_step": 28068, "epoch": 668} {"train_loss": -5.540324687957764, "global_step": 28069, "epoch": 668} {"train_loss": -5.387720108032227, "global_step": 28070, "epoch": 668} {"train_loss": -5.567994594573975, "global_step": 28071, "epoch": 668} {"train_loss": -5.440634250640869, "global_step": 28072, "epoch": 668} {"train_loss": -5.4799933433532715, "global_step": 28073, "epoch": 668} {"train_loss": -5.5955352783203125, "global_step": 28074, "epoch": 668} {"train_loss": -5.424487590789795, "global_step": 28075, "epoch": 668} {"train_loss": -5.4196882247924805, "global_step": 28076, "epoch": 668} {"train_loss": -5.401060581207275, "global_step": 28077, "epoch": 668} {"train_loss": -5.543888092041016, "global_step": 28078, "epoch": 668} {"train_loss": -5.624392509460449, "global_step": 28079, "epoch": 668} {"train_loss": -5.5100226402282715, "global_step": 28080, "epoch": 668} {"train_loss": -5.559852123260498, "global_step": 28081, "epoch": 668} {"train_loss": -5.582904815673828, "global_step": 28082, "epoch": 668} {"train_loss": -5.392634391784668, "global_step": 28083, "epoch": 668} {"train_loss": -5.443204879760742, "global_step": 28084, "epoch": 668} {"train_loss": -5.395569324493408, "global_step": 28085, "epoch": 668} {"train_loss": -5.499195098876953, "global_step": 28086, "epoch": 668} {"train_loss": -5.466108798980713, "global_step": 28087, "epoch": 668} {"train_loss": -5.556101322174072, "global_step": 28088, "epoch": 668} {"train_loss": -5.479848861694336, "global_step": 28089, "epoch": 668} {"train_loss": -5.4344892501831055, "global_step": 28090, "epoch": 668} {"train_loss": -5.334339618682861, "global_step": 28091, "epoch": 668} {"train_loss": -5.3860321044921875, "global_step": 28092, "epoch": 668} {"train_loss": -5.516951560974121, "global_step": 28093, "epoch": 668} {"train_loss": -5.407310485839844, "global_step": 28094, "epoch": 668} {"train_loss": -5.511979103088379, "global_step": 28095, "epoch": 668} {"train_loss": -5.3710784912109375, "global_step": 28096, "epoch": 668} {"train_loss": -5.466029871077764, "global_step": 28097, "epoch": 668, "val_loss": 67171.046875} {"train_loss": -5.443452835083008, "global_step": 28098, "epoch": 669} {"train_loss": -5.453556060791016, "global_step": 28099, "epoch": 669} {"train_loss": -5.44011116027832, "global_step": 28100, "epoch": 669} {"train_loss": -5.42122745513916, "global_step": 28101, "epoch": 669} {"train_loss": -5.431400775909424, "global_step": 28102, "epoch": 669} {"train_loss": -5.49891996383667, "global_step": 28103, "epoch": 669} {"train_loss": -5.611427307128906, "global_step": 28104, "epoch": 669} {"train_loss": -5.410974502563477, "global_step": 28105, "epoch": 669} {"train_loss": -5.514369010925293, "global_step": 28106, "epoch": 669} {"train_loss": -5.464903831481934, "global_step": 28107, "epoch": 669} {"train_loss": -5.346972942352295, "global_step": 28108, "epoch": 669} {"train_loss": -5.467909336090088, "global_step": 28109, "epoch": 669} {"train_loss": -5.498790740966797, "global_step": 28110, "epoch": 669} {"train_loss": -5.510934352874756, "global_step": 28111, "epoch": 669} {"train_loss": -5.543450832366943, "global_step": 28112, "epoch": 669} {"train_loss": -5.490207672119141, "global_step": 28113, "epoch": 669} {"train_loss": -5.487708568572998, "global_step": 28114, "epoch": 669} {"train_loss": -5.352211952209473, "global_step": 28115, "epoch": 669} {"train_loss": -5.552657127380371, "global_step": 28116, "epoch": 669} {"train_loss": -5.545748710632324, "global_step": 28117, "epoch": 669} {"train_loss": -5.469026565551758, "global_step": 28118, "epoch": 669} {"train_loss": -5.454639434814453, "global_step": 28119, "epoch": 669} {"train_loss": -5.358434200286865, "global_step": 28120, "epoch": 669} {"train_loss": -5.551187992095947, "global_step": 28121, "epoch": 669} {"train_loss": -5.496094703674316, "global_step": 28122, "epoch": 669} {"train_loss": -5.391297340393066, "global_step": 28123, "epoch": 669} {"train_loss": -5.391200065612793, "global_step": 28124, "epoch": 669} {"train_loss": -5.4124755859375, "global_step": 28125, "epoch": 669} {"train_loss": -5.471480369567871, "global_step": 28126, "epoch": 669} {"train_loss": -5.585360527038574, "global_step": 28127, "epoch": 669} {"train_loss": -5.348227024078369, "global_step": 28128, "epoch": 669} {"train_loss": -5.534740447998047, "global_step": 28129, "epoch": 669} {"train_loss": -5.347886085510254, "global_step": 28130, "epoch": 669} {"train_loss": -5.46223258972168, "global_step": 28131, "epoch": 669} {"train_loss": -5.4399871826171875, "global_step": 28132, "epoch": 669} {"train_loss": -5.498992919921875, "global_step": 28133, "epoch": 669} {"train_loss": -5.314382553100586, "global_step": 28134, "epoch": 669} {"train_loss": -5.576581954956055, "global_step": 28135, "epoch": 669} {"train_loss": -5.3364458084106445, "global_step": 28136, "epoch": 669} {"train_loss": -5.366292953491211, "global_step": 28137, "epoch": 669} {"train_loss": -5.501943588256836, "global_step": 28138, "epoch": 669} {"train_loss": -5.45743803750901, "global_step": 28139, "epoch": 669, "val_loss": 67382.3984375} {"train_loss": -5.396024703979492, "global_step": 28140, "epoch": 670} {"train_loss": -5.422702789306641, "global_step": 28141, "epoch": 670} {"train_loss": -5.443108558654785, "global_step": 28142, "epoch": 670} {"train_loss": -5.391208171844482, "global_step": 28143, "epoch": 670} {"train_loss": -5.467419147491455, "global_step": 28144, "epoch": 670} {"train_loss": -5.433577537536621, "global_step": 28145, "epoch": 670} {"train_loss": -5.411830902099609, "global_step": 28146, "epoch": 670} {"train_loss": -5.461240291595459, "global_step": 28147, "epoch": 670} {"train_loss": -5.419142246246338, "global_step": 28148, "epoch": 670} {"train_loss": -5.3477020263671875, "global_step": 28149, "epoch": 670} {"train_loss": -5.456292152404785, "global_step": 28150, "epoch": 670} {"train_loss": -5.456423759460449, "global_step": 28151, "epoch": 670} {"train_loss": -5.55278205871582, "global_step": 28152, "epoch": 670} {"train_loss": -5.307234287261963, "global_step": 28153, "epoch": 670} {"train_loss": -5.376045227050781, "global_step": 28154, "epoch": 670} {"train_loss": -5.439389228820801, "global_step": 28155, "epoch": 670} {"train_loss": -5.356180191040039, "global_step": 28156, "epoch": 670} {"train_loss": -5.286458969116211, "global_step": 28157, "epoch": 670} {"train_loss": -5.420457363128662, "global_step": 28158, "epoch": 670} {"train_loss": -5.5420331954956055, "global_step": 28159, "epoch": 670} {"train_loss": -5.432864189147949, "global_step": 28160, "epoch": 670} {"train_loss": -5.463150978088379, "global_step": 28161, "epoch": 670} {"train_loss": -5.368217945098877, "global_step": 28162, "epoch": 670} {"train_loss": -5.492690563201904, "global_step": 28163, "epoch": 670} {"train_loss": -5.4234819412231445, "global_step": 28164, "epoch": 670} {"train_loss": -5.482210636138916, "global_step": 28165, "epoch": 670} {"train_loss": -5.387235641479492, "global_step": 28166, "epoch": 670} {"train_loss": -5.305572509765625, "global_step": 28167, "epoch": 670} {"train_loss": -5.40449333190918, "global_step": 28168, "epoch": 670} {"train_loss": -5.463296890258789, "global_step": 28169, "epoch": 670} {"train_loss": -5.444328308105469, "global_step": 28170, "epoch": 670} {"train_loss": -5.405104637145996, "global_step": 28171, "epoch": 670} {"train_loss": -5.476499557495117, "global_step": 28172, "epoch": 670} {"train_loss": -5.456076145172119, "global_step": 28173, "epoch": 670} {"train_loss": -5.434896945953369, "global_step": 28174, "epoch": 670} {"train_loss": -5.559821128845215, "global_step": 28175, "epoch": 670} {"train_loss": -5.514891624450684, "global_step": 28176, "epoch": 670} {"train_loss": -5.419849395751953, "global_step": 28177, "epoch": 670} {"train_loss": -5.422286033630371, "global_step": 28178, "epoch": 670} {"train_loss": -5.431994438171387, "global_step": 28179, "epoch": 670} {"train_loss": -5.537264823913574, "global_step": 28180, "epoch": 670} {"train_loss": -5.434894550414312, "global_step": 28181, "epoch": 670, "val_loss": 67082.9921875} {"train_loss": -5.418886184692383, "global_step": 28182, "epoch": 671} {"train_loss": -5.466054916381836, "global_step": 28183, "epoch": 671} {"train_loss": -5.586841583251953, "global_step": 28184, "epoch": 671} {"train_loss": -5.462579727172852, "global_step": 28185, "epoch": 671} {"train_loss": -5.659109115600586, "global_step": 28186, "epoch": 671} {"train_loss": -5.402822494506836, "global_step": 28187, "epoch": 671} {"train_loss": -5.447169303894043, "global_step": 28188, "epoch": 671} {"train_loss": -5.5062665939331055, "global_step": 28189, "epoch": 671} {"train_loss": -5.4328813552856445, "global_step": 28190, "epoch": 671} {"train_loss": -5.339090347290039, "global_step": 28191, "epoch": 671} {"train_loss": -5.259721279144287, "global_step": 28192, "epoch": 671} {"train_loss": -5.431052207946777, "global_step": 28193, "epoch": 671} {"train_loss": -5.436636924743652, "global_step": 28194, "epoch": 671} {"train_loss": -5.484776496887207, "global_step": 28195, "epoch": 671} {"train_loss": -5.5622758865356445, "global_step": 28196, "epoch": 671} {"train_loss": -5.4393744468688965, "global_step": 28197, "epoch": 671} {"train_loss": -5.32148551940918, "global_step": 28198, "epoch": 671} {"train_loss": -5.553943634033203, "global_step": 28199, "epoch": 671} {"train_loss": -5.34190559387207, "global_step": 28200, "epoch": 671} {"train_loss": -5.57395076751709, "global_step": 28201, "epoch": 671} {"train_loss": -5.460021018981934, "global_step": 28202, "epoch": 671} {"train_loss": -5.421422481536865, "global_step": 28203, "epoch": 671} {"train_loss": -5.461789131164551, "global_step": 28204, "epoch": 671} {"train_loss": -5.408176898956299, "global_step": 28205, "epoch": 671} {"train_loss": -5.443665027618408, "global_step": 28206, "epoch": 671} {"train_loss": -5.3228631019592285, "global_step": 28207, "epoch": 671} {"train_loss": -5.410207271575928, "global_step": 28208, "epoch": 671} {"train_loss": -5.4225263595581055, "global_step": 28209, "epoch": 671} {"train_loss": -5.386263847351074, "global_step": 28210, "epoch": 671} {"train_loss": -5.554216384887695, "global_step": 28211, "epoch": 671} {"train_loss": -5.470514297485352, "global_step": 28212, "epoch": 671} {"train_loss": -5.453803062438965, "global_step": 28213, "epoch": 671} {"train_loss": -5.3482232093811035, "global_step": 28214, "epoch": 671} {"train_loss": -5.443828582763672, "global_step": 28215, "epoch": 671} {"train_loss": -5.605123519897461, "global_step": 28216, "epoch": 671} {"train_loss": -5.436271667480469, "global_step": 28217, "epoch": 671} {"train_loss": -5.477247714996338, "global_step": 28218, "epoch": 671} {"train_loss": -5.479198455810547, "global_step": 28219, "epoch": 671} {"train_loss": -5.643083572387695, "global_step": 28220, "epoch": 671} {"train_loss": -5.564901351928711, "global_step": 28221, "epoch": 671} {"train_loss": -5.5445356369018555, "global_step": 28222, "epoch": 671} {"train_loss": -5.459194716953096, "global_step": 28223, "epoch": 671, "val_loss": 67531.984375} {"train_loss": -5.6223225593566895, "global_step": 28224, "epoch": 672} {"train_loss": -5.359522819519043, "global_step": 28225, "epoch": 672} {"train_loss": -5.2993974685668945, "global_step": 28226, "epoch": 672} {"train_loss": -5.422032356262207, "global_step": 28227, "epoch": 672} {"train_loss": -5.491130828857422, "global_step": 28228, "epoch": 672} {"train_loss": -5.4529571533203125, "global_step": 28229, "epoch": 672} {"train_loss": -5.457710266113281, "global_step": 28230, "epoch": 672} {"train_loss": -5.417761325836182, "global_step": 28231, "epoch": 672} {"train_loss": -5.410552501678467, "global_step": 28232, "epoch": 672} {"train_loss": -5.316608905792236, "global_step": 28233, "epoch": 672} {"train_loss": -5.4103193283081055, "global_step": 28234, "epoch": 672} {"train_loss": -5.412950038909912, "global_step": 28235, "epoch": 672} {"train_loss": -5.329076290130615, "global_step": 28236, "epoch": 672} {"train_loss": -5.349917411804199, "global_step": 28237, "epoch": 672} {"train_loss": -5.343520164489746, "global_step": 28238, "epoch": 672} {"train_loss": -5.438384056091309, "global_step": 28239, "epoch": 672} {"train_loss": -5.513666152954102, "global_step": 28240, "epoch": 672} {"train_loss": -5.4625139236450195, "global_step": 28241, "epoch": 672} {"train_loss": -5.466983318328857, "global_step": 28242, "epoch": 672} {"train_loss": -5.537356376647949, "global_step": 28243, "epoch": 672} {"train_loss": -5.436341285705566, "global_step": 28244, "epoch": 672} {"train_loss": -5.487211227416992, "global_step": 28245, "epoch": 672} {"train_loss": -5.367661476135254, "global_step": 28246, "epoch": 672} {"train_loss": -5.430427551269531, "global_step": 28247, "epoch": 672} {"train_loss": -5.338641166687012, "global_step": 28248, "epoch": 672} {"train_loss": -5.509905815124512, "global_step": 28249, "epoch": 672} {"train_loss": -5.404923439025879, "global_step": 28250, "epoch": 672} {"train_loss": -5.4262189865112305, "global_step": 28251, "epoch": 672} {"train_loss": -5.57394552230835, "global_step": 28252, "epoch": 672} {"train_loss": -5.495743751525879, "global_step": 28253, "epoch": 672} {"train_loss": -5.3797407150268555, "global_step": 28254, "epoch": 672} {"train_loss": -5.4726104736328125, "global_step": 28255, "epoch": 672} {"train_loss": -5.534965991973877, "global_step": 28256, "epoch": 672} {"train_loss": -5.314674377441406, "global_step": 28257, "epoch": 672} {"train_loss": -5.41193962097168, "global_step": 28258, "epoch": 672} {"train_loss": -5.307270050048828, "global_step": 28259, "epoch": 672} {"train_loss": -5.39020299911499, "global_step": 28260, "epoch": 672} {"train_loss": -5.399496555328369, "global_step": 28261, "epoch": 672} {"train_loss": -5.495574951171875, "global_step": 28262, "epoch": 672} {"train_loss": -5.5604248046875, "global_step": 28263, "epoch": 672} {"train_loss": -5.524632453918457, "global_step": 28264, "epoch": 672} {"train_loss": -5.438379832676479, "global_step": 28265, "epoch": 672, "val_loss": 67577.984375} {"train_loss": -5.590606689453125, "global_step": 28266, "epoch": 673} {"train_loss": -5.512825965881348, "global_step": 28267, "epoch": 673} {"train_loss": -5.402674674987793, "global_step": 28268, "epoch": 673} {"train_loss": -5.399336814880371, "global_step": 28269, "epoch": 673} {"train_loss": -5.447005748748779, "global_step": 28270, "epoch": 673} {"train_loss": -5.427507400512695, "global_step": 28271, "epoch": 673} {"train_loss": -5.474286079406738, "global_step": 28272, "epoch": 673} {"train_loss": -5.484994888305664, "global_step": 28273, "epoch": 673} {"train_loss": -5.3570556640625, "global_step": 28274, "epoch": 673} {"train_loss": -5.438155174255371, "global_step": 28275, "epoch": 673} {"train_loss": -5.469402313232422, "global_step": 28276, "epoch": 673} {"train_loss": -5.533329010009766, "global_step": 28277, "epoch": 673} {"train_loss": -5.385037899017334, "global_step": 28278, "epoch": 673} {"train_loss": -5.540359020233154, "global_step": 28279, "epoch": 673} {"train_loss": -5.501126289367676, "global_step": 28280, "epoch": 673} {"train_loss": -5.466723442077637, "global_step": 28281, "epoch": 673} {"train_loss": -5.312521934509277, "global_step": 28282, "epoch": 673} {"train_loss": -5.409987449645996, "global_step": 28283, "epoch": 673} {"train_loss": -5.46182918548584, "global_step": 28284, "epoch": 673} {"train_loss": -5.550893783569336, "global_step": 28285, "epoch": 673} {"train_loss": -5.583429336547852, "global_step": 28286, "epoch": 673} {"train_loss": -5.404984474182129, "global_step": 28287, "epoch": 673} {"train_loss": -5.465015888214111, "global_step": 28288, "epoch": 673} {"train_loss": -5.366186141967773, "global_step": 28289, "epoch": 673} {"train_loss": -5.548001289367676, "global_step": 28290, "epoch": 673} {"train_loss": -5.363783836364746, "global_step": 28291, "epoch": 673} {"train_loss": -5.333556175231934, "global_step": 28292, "epoch": 673} {"train_loss": -5.499053478240967, "global_step": 28293, "epoch": 673} {"train_loss": -5.50276517868042, "global_step": 28294, "epoch": 673} {"train_loss": -5.349410057067871, "global_step": 28295, "epoch": 673} {"train_loss": -5.5942816734313965, "global_step": 28296, "epoch": 673} {"train_loss": -5.437180042266846, "global_step": 28297, "epoch": 673} {"train_loss": -5.424962520599365, "global_step": 28298, "epoch": 673} {"train_loss": -5.429039001464844, "global_step": 28299, "epoch": 673} {"train_loss": -5.3755574226379395, "global_step": 28300, "epoch": 673} {"train_loss": -5.353992462158203, "global_step": 28301, "epoch": 673} {"train_loss": -5.485949993133545, "global_step": 28302, "epoch": 673} {"train_loss": -5.348978519439697, "global_step": 28303, "epoch": 673} {"train_loss": -5.54343843460083, "global_step": 28304, "epoch": 673} {"train_loss": -5.4292402267456055, "global_step": 28305, "epoch": 673} {"train_loss": -5.465936183929443, "global_step": 28306, "epoch": 673} {"train_loss": -5.448855138960338, "global_step": 28307, "epoch": 673, "val_loss": 67807.6015625} {"train_loss": -5.376244068145752, "global_step": 28308, "epoch": 674} {"train_loss": -5.39365291595459, "global_step": 28309, "epoch": 674} {"train_loss": -5.403966426849365, "global_step": 28310, "epoch": 674} {"train_loss": -5.371405124664307, "global_step": 28311, "epoch": 674} {"train_loss": -5.599606513977051, "global_step": 28312, "epoch": 674} {"train_loss": -5.351279258728027, "global_step": 28313, "epoch": 674} {"train_loss": -5.61376953125, "global_step": 28314, "epoch": 674} {"train_loss": -5.286511421203613, "global_step": 28315, "epoch": 674} {"train_loss": -5.3007354736328125, "global_step": 28316, "epoch": 674} {"train_loss": -5.3900322914123535, "global_step": 28317, "epoch": 674} {"train_loss": -5.608460903167725, "global_step": 28318, "epoch": 674} {"train_loss": -5.351543426513672, "global_step": 28319, "epoch": 674} {"train_loss": -5.450787544250488, "global_step": 28320, "epoch": 674} {"train_loss": -5.425119400024414, "global_step": 28321, "epoch": 674} {"train_loss": -5.292807579040527, "global_step": 28322, "epoch": 674} {"train_loss": -5.541839599609375, "global_step": 28323, "epoch": 674} {"train_loss": -5.518246173858643, "global_step": 28324, "epoch": 674} {"train_loss": -5.451999664306641, "global_step": 28325, "epoch": 674} {"train_loss": -5.515379905700684, "global_step": 28326, "epoch": 674} {"train_loss": -5.511501312255859, "global_step": 28327, "epoch": 674} {"train_loss": -5.280351161956787, "global_step": 28328, "epoch": 674} {"train_loss": -5.527029514312744, "global_step": 28329, "epoch": 674} {"train_loss": -5.360170841217041, "global_step": 28330, "epoch": 674} {"train_loss": -5.428199768066406, "global_step": 28331, "epoch": 674} {"train_loss": -5.470123767852783, "global_step": 28332, "epoch": 674} {"train_loss": -5.544458389282227, "global_step": 28333, "epoch": 674} {"train_loss": -5.344267845153809, "global_step": 28334, "epoch": 674} {"train_loss": -5.53220796585083, "global_step": 28335, "epoch": 674} {"train_loss": -5.530703544616699, "global_step": 28336, "epoch": 674} {"train_loss": -5.402613639831543, "global_step": 28337, "epoch": 674} {"train_loss": -5.490114688873291, "global_step": 28338, "epoch": 674} {"train_loss": -5.621095657348633, "global_step": 28339, "epoch": 674} {"train_loss": -5.483306884765625, "global_step": 28340, "epoch": 674} {"train_loss": -5.534178733825684, "global_step": 28341, "epoch": 674} {"train_loss": -5.511355400085449, "global_step": 28342, "epoch": 674} {"train_loss": -5.411465644836426, "global_step": 28343, "epoch": 674} {"train_loss": -5.515637397766113, "global_step": 28344, "epoch": 674} {"train_loss": -5.424655914306641, "global_step": 28345, "epoch": 674} {"train_loss": -5.503880500793457, "global_step": 28346, "epoch": 674} {"train_loss": -5.4529032707214355, "global_step": 28347, "epoch": 674} {"train_loss": -5.413599014282227, "global_step": 28348, "epoch": 674} {"train_loss": -5.450096811567034, "global_step": 28349, "epoch": 674, "val_loss": 67144.875} {"train_loss": -5.40852165222168, "global_step": 28350, "epoch": 675} {"train_loss": -5.339836597442627, "global_step": 28351, "epoch": 675} {"train_loss": -5.445958137512207, "global_step": 28352, "epoch": 675} {"train_loss": -5.393301010131836, "global_step": 28353, "epoch": 675} {"train_loss": -5.4817304611206055, "global_step": 28354, "epoch": 675} {"train_loss": -5.499391078948975, "global_step": 28355, "epoch": 675} {"train_loss": -5.478967189788818, "global_step": 28356, "epoch": 675} {"train_loss": -5.429444313049316, "global_step": 28357, "epoch": 675} {"train_loss": -5.492061614990234, "global_step": 28358, "epoch": 675} {"train_loss": -5.502292633056641, "global_step": 28359, "epoch": 675} {"train_loss": -5.600546836853027, "global_step": 28360, "epoch": 675} {"train_loss": -5.4365949630737305, "global_step": 28361, "epoch": 675} {"train_loss": -5.522946357727051, "global_step": 28362, "epoch": 675} {"train_loss": -5.494075775146484, "global_step": 28363, "epoch": 675} {"train_loss": -5.473282814025879, "global_step": 28364, "epoch": 675} {"train_loss": -5.531271934509277, "global_step": 28365, "epoch": 675} {"train_loss": -5.514307022094727, "global_step": 28366, "epoch": 675} {"train_loss": -5.5391130447387695, "global_step": 28367, "epoch": 675} {"train_loss": -5.519036293029785, "global_step": 28368, "epoch": 675} {"train_loss": -5.466196060180664, "global_step": 28369, "epoch": 675} {"train_loss": -5.3842315673828125, "global_step": 28370, "epoch": 675} {"train_loss": -5.452826023101807, "global_step": 28371, "epoch": 675} {"train_loss": -5.489326000213623, "global_step": 28372, "epoch": 675} {"train_loss": -5.4890336990356445, "global_step": 28373, "epoch": 675} {"train_loss": -5.401595115661621, "global_step": 28374, "epoch": 675} {"train_loss": -5.363929748535156, "global_step": 28375, "epoch": 675} {"train_loss": -5.480691909790039, "global_step": 28376, "epoch": 675} {"train_loss": -5.348503112792969, "global_step": 28377, "epoch": 675} {"train_loss": -5.354761123657227, "global_step": 28378, "epoch": 675} {"train_loss": -5.446784019470215, "global_step": 28379, "epoch": 675} {"train_loss": -5.362243175506592, "global_step": 28380, "epoch": 675} {"train_loss": -5.481139659881592, "global_step": 28381, "epoch": 675} {"train_loss": -5.534381866455078, "global_step": 28382, "epoch": 675} {"train_loss": -5.2384185791015625, "global_step": 28383, "epoch": 675} {"train_loss": -5.473941802978516, "global_step": 28384, "epoch": 675} {"train_loss": -5.360621452331543, "global_step": 28385, "epoch": 675} {"train_loss": -5.443572044372559, "global_step": 28386, "epoch": 675} {"train_loss": -5.371457099914551, "global_step": 28387, "epoch": 675} {"train_loss": -5.403214454650879, "global_step": 28388, "epoch": 675} {"train_loss": -5.368318557739258, "global_step": 28389, "epoch": 675} {"train_loss": -5.320246696472168, "global_step": 28390, "epoch": 675} {"train_loss": -5.443487019765945, "global_step": 28391, "epoch": 675, "val_loss": 67239.8515625} {"train_loss": -5.427083492279053, "global_step": 28392, "epoch": 676} {"train_loss": -5.382211685180664, "global_step": 28393, "epoch": 676} {"train_loss": -5.421327114105225, "global_step": 28394, "epoch": 676} {"train_loss": -5.412812232971191, "global_step": 28395, "epoch": 676} {"train_loss": -5.5368452072143555, "global_step": 28396, "epoch": 676} {"train_loss": -5.467717170715332, "global_step": 28397, "epoch": 676} {"train_loss": -5.486515045166016, "global_step": 28398, "epoch": 676} {"train_loss": -5.467504978179932, "global_step": 28399, "epoch": 676} {"train_loss": -5.382296562194824, "global_step": 28400, "epoch": 676} {"train_loss": -5.453373908996582, "global_step": 28401, "epoch": 676} {"train_loss": -5.3080549240112305, "global_step": 28402, "epoch": 676} {"train_loss": -5.478699684143066, "global_step": 28403, "epoch": 676} {"train_loss": -5.561850070953369, "global_step": 28404, "epoch": 676} {"train_loss": -5.471311092376709, "global_step": 28405, "epoch": 676} {"train_loss": -5.543447494506836, "global_step": 28406, "epoch": 676} {"train_loss": -5.397423267364502, "global_step": 28407, "epoch": 676} {"train_loss": -5.545825004577637, "global_step": 28408, "epoch": 676} {"train_loss": -5.533257484436035, "global_step": 28409, "epoch": 676} {"train_loss": -5.407983779907227, "global_step": 28410, "epoch": 676} {"train_loss": -5.32555627822876, "global_step": 28411, "epoch": 676} {"train_loss": -5.396327495574951, "global_step": 28412, "epoch": 676} {"train_loss": -5.56696891784668, "global_step": 28413, "epoch": 676} {"train_loss": -5.471697807312012, "global_step": 28414, "epoch": 676} {"train_loss": -5.473038673400879, "global_step": 28415, "epoch": 676} {"train_loss": -5.499191761016846, "global_step": 28416, "epoch": 676} {"train_loss": -5.517864227294922, "global_step": 28417, "epoch": 676} {"train_loss": -5.383561134338379, "global_step": 28418, "epoch": 676} {"train_loss": -5.544034481048584, "global_step": 28419, "epoch": 676} {"train_loss": -5.519255638122559, "global_step": 28420, "epoch": 676} {"train_loss": -5.400157928466797, "global_step": 28421, "epoch": 676} {"train_loss": -5.489500045776367, "global_step": 28422, "epoch": 676} {"train_loss": -5.4298481941223145, "global_step": 28423, "epoch": 676} {"train_loss": -5.428297996520996, "global_step": 28424, "epoch": 676} {"train_loss": -5.443728446960449, "global_step": 28425, "epoch": 676} {"train_loss": -5.533299446105957, "global_step": 28426, "epoch": 676} {"train_loss": -5.504852294921875, "global_step": 28427, "epoch": 676} {"train_loss": -5.4581828117370605, "global_step": 28428, "epoch": 676} {"train_loss": -5.406427383422852, "global_step": 28429, "epoch": 676} {"train_loss": -5.5745134353637695, "global_step": 28430, "epoch": 676} {"train_loss": -5.40219259262085, "global_step": 28431, "epoch": 676} {"train_loss": -5.511427879333496, "global_step": 28432, "epoch": 676} {"train_loss": -5.462163436980474, "global_step": 28433, "epoch": 676, "val_loss": 67198.8359375} {"train_loss": -5.49919319152832, "global_step": 28434, "epoch": 677} {"train_loss": -5.413862705230713, "global_step": 28435, "epoch": 677} {"train_loss": -5.522640228271484, "global_step": 28436, "epoch": 677} {"train_loss": -5.522327899932861, "global_step": 28437, "epoch": 677} {"train_loss": -5.565779685974121, "global_step": 28438, "epoch": 677} {"train_loss": -5.396993637084961, "global_step": 28439, "epoch": 677} {"train_loss": -5.571217060089111, "global_step": 28440, "epoch": 677} {"train_loss": -5.435380935668945, "global_step": 28441, "epoch": 677} {"train_loss": -5.344459533691406, "global_step": 28442, "epoch": 677} {"train_loss": -5.340346813201904, "global_step": 28443, "epoch": 677} {"train_loss": -5.525935173034668, "global_step": 28444, "epoch": 677} {"train_loss": -5.4428253173828125, "global_step": 28445, "epoch": 677} {"train_loss": -5.513278961181641, "global_step": 28446, "epoch": 677} {"train_loss": -5.508128643035889, "global_step": 28447, "epoch": 677} {"train_loss": -5.513069152832031, "global_step": 28448, "epoch": 677} {"train_loss": -5.43755578994751, "global_step": 28449, "epoch": 677} {"train_loss": -5.482142448425293, "global_step": 28450, "epoch": 677} {"train_loss": -5.559233665466309, "global_step": 28451, "epoch": 677} {"train_loss": -5.442410469055176, "global_step": 28452, "epoch": 677} {"train_loss": -5.524356842041016, "global_step": 28453, "epoch": 677} {"train_loss": -5.45523738861084, "global_step": 28454, "epoch": 677} {"train_loss": -5.643696308135986, "global_step": 28455, "epoch": 677} {"train_loss": -5.484623432159424, "global_step": 28456, "epoch": 677} {"train_loss": -5.326282501220703, "global_step": 28457, "epoch": 677} {"train_loss": -5.629612922668457, "global_step": 28458, "epoch": 677} {"train_loss": -5.405306816101074, "global_step": 28459, "epoch": 677} {"train_loss": -5.47007942199707, "global_step": 28460, "epoch": 677} {"train_loss": -5.287704944610596, "global_step": 28461, "epoch": 677} {"train_loss": -5.426972389221191, "global_step": 28462, "epoch": 677} {"train_loss": -5.378469944000244, "global_step": 28463, "epoch": 677} {"train_loss": -5.314083099365234, "global_step": 28464, "epoch": 677} {"train_loss": -5.454352855682373, "global_step": 28465, "epoch": 677} {"train_loss": -5.503817558288574, "global_step": 28466, "epoch": 677} {"train_loss": -5.317061901092529, "global_step": 28467, "epoch": 677} {"train_loss": -5.5436692237854, "global_step": 28468, "epoch": 677} {"train_loss": -5.537550926208496, "global_step": 28469, "epoch": 677} {"train_loss": -5.441139221191406, "global_step": 28470, "epoch": 677} {"train_loss": -5.379558563232422, "global_step": 28471, "epoch": 677} {"train_loss": -5.551467418670654, "global_step": 28472, "epoch": 677} {"train_loss": -5.400416374206543, "global_step": 28473, "epoch": 677} {"train_loss": -5.435083389282227, "global_step": 28474, "epoch": 677} {"train_loss": -5.460702952884493, "global_step": 28475, "epoch": 677, "val_loss": 67234.1328125} {"train_loss": -5.391587257385254, "global_step": 28476, "epoch": 678} {"train_loss": -5.474214553833008, "global_step": 28477, "epoch": 678} {"train_loss": -5.429060935974121, "global_step": 28478, "epoch": 678} {"train_loss": -5.443698883056641, "global_step": 28479, "epoch": 678} {"train_loss": -5.442840576171875, "global_step": 28480, "epoch": 678} {"train_loss": -5.4964399337768555, "global_step": 28481, "epoch": 678} {"train_loss": -5.438668727874756, "global_step": 28482, "epoch": 678} {"train_loss": -5.60674524307251, "global_step": 28483, "epoch": 678} {"train_loss": -5.439853191375732, "global_step": 28484, "epoch": 678} {"train_loss": -5.419931411743164, "global_step": 28485, "epoch": 678} {"train_loss": -5.536038398742676, "global_step": 28486, "epoch": 678} {"train_loss": -5.547091007232666, "global_step": 28487, "epoch": 678} {"train_loss": -5.5224151611328125, "global_step": 28488, "epoch": 678} {"train_loss": -5.417407035827637, "global_step": 28489, "epoch": 678} {"train_loss": -5.492781162261963, "global_step": 28490, "epoch": 678} {"train_loss": -5.4519782066345215, "global_step": 28491, "epoch": 678} {"train_loss": -5.459222793579102, "global_step": 28492, "epoch": 678} {"train_loss": -5.346470355987549, "global_step": 28493, "epoch": 678} {"train_loss": -5.351604461669922, "global_step": 28494, "epoch": 678} {"train_loss": -5.51979398727417, "global_step": 28495, "epoch": 678} {"train_loss": -5.420562744140625, "global_step": 28496, "epoch": 678} {"train_loss": -5.402375221252441, "global_step": 28497, "epoch": 678} {"train_loss": -5.457523822784424, "global_step": 28498, "epoch": 678} {"train_loss": -5.372636318206787, "global_step": 28499, "epoch": 678} {"train_loss": -5.422976493835449, "global_step": 28500, "epoch": 678} {"train_loss": -5.412191390991211, "global_step": 28501, "epoch": 678} {"train_loss": -5.381475448608398, "global_step": 28502, "epoch": 678} {"train_loss": -5.459268569946289, "global_step": 28503, "epoch": 678} {"train_loss": -5.516060829162598, "global_step": 28504, "epoch": 678} {"train_loss": -5.492903232574463, "global_step": 28505, "epoch": 678} {"train_loss": -5.521998405456543, "global_step": 28506, "epoch": 678} {"train_loss": -5.323093414306641, "global_step": 28507, "epoch": 678} {"train_loss": -5.447378635406494, "global_step": 28508, "epoch": 678} {"train_loss": -5.415248870849609, "global_step": 28509, "epoch": 678} {"train_loss": -5.502814292907715, "global_step": 28510, "epoch": 678} {"train_loss": -5.452854156494141, "global_step": 28511, "epoch": 678} {"train_loss": -5.36629581451416, "global_step": 28512, "epoch": 678} {"train_loss": -5.456343650817871, "global_step": 28513, "epoch": 678} {"train_loss": -5.439197540283203, "global_step": 28514, "epoch": 678} {"train_loss": -5.455901145935059, "global_step": 28515, "epoch": 678} {"train_loss": -5.526874542236328, "global_step": 28516, "epoch": 678} {"train_loss": -5.4480949356442405, "global_step": 28517, "epoch": 678, "val_loss": 67125.8046875} {"train_loss": -5.591483116149902, "global_step": 28518, "epoch": 679} {"train_loss": -5.265148639678955, "global_step": 28519, "epoch": 679} {"train_loss": -5.564556121826172, "global_step": 28520, "epoch": 679} {"train_loss": -5.640186786651611, "global_step": 28521, "epoch": 679} {"train_loss": -5.530182361602783, "global_step": 28522, "epoch": 679} {"train_loss": -5.4158830642700195, "global_step": 28523, "epoch": 679} {"train_loss": -5.476388454437256, "global_step": 28524, "epoch": 679} {"train_loss": -5.458667755126953, "global_step": 28525, "epoch": 679} {"train_loss": -5.510859489440918, "global_step": 28526, "epoch": 679} {"train_loss": -5.456857204437256, "global_step": 28527, "epoch": 679} {"train_loss": -5.525955677032471, "global_step": 28528, "epoch": 679} {"train_loss": -5.440200328826904, "global_step": 28529, "epoch": 679} {"train_loss": -5.479206562042236, "global_step": 28530, "epoch": 679} {"train_loss": -5.474879264831543, "global_step": 28531, "epoch": 679} {"train_loss": -5.479065895080566, "global_step": 28532, "epoch": 679} {"train_loss": -5.413820743560791, "global_step": 28533, "epoch": 679} {"train_loss": -5.445697784423828, "global_step": 28534, "epoch": 679} {"train_loss": -5.497323036193848, "global_step": 28535, "epoch": 679} {"train_loss": -5.543327808380127, "global_step": 28536, "epoch": 679} {"train_loss": -5.510345458984375, "global_step": 28537, "epoch": 679} {"train_loss": -5.3921308517456055, "global_step": 28538, "epoch": 679} {"train_loss": -5.455686569213867, "global_step": 28539, "epoch": 679} {"train_loss": -5.539289474487305, "global_step": 28540, "epoch": 679} {"train_loss": -5.412224292755127, "global_step": 28541, "epoch": 679} {"train_loss": -5.564413070678711, "global_step": 28542, "epoch": 679} {"train_loss": -5.54262113571167, "global_step": 28543, "epoch": 679} {"train_loss": -5.490511417388916, "global_step": 28544, "epoch": 679} {"train_loss": -5.501572608947754, "global_step": 28545, "epoch": 679} {"train_loss": -5.405753135681152, "global_step": 28546, "epoch": 679} {"train_loss": -5.543790817260742, "global_step": 28547, "epoch": 679} {"train_loss": -5.5518903732299805, "global_step": 28548, "epoch": 679} {"train_loss": -5.471841812133789, "global_step": 28549, "epoch": 679} {"train_loss": -5.529784202575684, "global_step": 28550, "epoch": 679} {"train_loss": -5.4437127113342285, "global_step": 28551, "epoch": 679} {"train_loss": -5.375805854797363, "global_step": 28552, "epoch": 679} {"train_loss": -5.4230780601501465, "global_step": 28553, "epoch": 679} {"train_loss": -5.353273868560791, "global_step": 28554, "epoch": 679} {"train_loss": -5.46343469619751, "global_step": 28555, "epoch": 679} {"train_loss": -5.406036376953125, "global_step": 28556, "epoch": 679} {"train_loss": -5.395912170410156, "global_step": 28557, "epoch": 679} {"train_loss": -5.394118785858154, "global_step": 28558, "epoch": 679} {"train_loss": -5.472432363600958, "global_step": 28559, "epoch": 679, "val_loss": 67859.75} {"train_loss": -5.462972164154053, "global_step": 28560, "epoch": 680} {"train_loss": -5.438325881958008, "global_step": 28561, "epoch": 680} {"train_loss": -5.4980621337890625, "global_step": 28562, "epoch": 680} {"train_loss": -5.336989402770996, "global_step": 28563, "epoch": 680} {"train_loss": -5.439478874206543, "global_step": 28564, "epoch": 680} {"train_loss": -5.478281497955322, "global_step": 28565, "epoch": 680} {"train_loss": -5.486886978149414, "global_step": 28566, "epoch": 680} {"train_loss": -5.498762130737305, "global_step": 28567, "epoch": 680} {"train_loss": -5.530209541320801, "global_step": 28568, "epoch": 680} {"train_loss": -5.479033946990967, "global_step": 28569, "epoch": 680} {"train_loss": -5.345229625701904, "global_step": 28570, "epoch": 680} {"train_loss": -5.4918718338012695, "global_step": 28571, "epoch": 680} {"train_loss": -5.478379249572754, "global_step": 28572, "epoch": 680} {"train_loss": -5.336883544921875, "global_step": 28573, "epoch": 680} {"train_loss": -5.4032979011535645, "global_step": 28574, "epoch": 680} {"train_loss": -5.4542236328125, "global_step": 28575, "epoch": 680} {"train_loss": -5.445144176483154, "global_step": 28576, "epoch": 680} {"train_loss": -5.474735736846924, "global_step": 28577, "epoch": 680} {"train_loss": -5.387633800506592, "global_step": 28578, "epoch": 680} {"train_loss": -5.385772705078125, "global_step": 28579, "epoch": 680} {"train_loss": -5.380708694458008, "global_step": 28580, "epoch": 680} {"train_loss": -5.373610019683838, "global_step": 28581, "epoch": 680} {"train_loss": -5.430324554443359, "global_step": 28582, "epoch": 680} {"train_loss": -5.441498279571533, "global_step": 28583, "epoch": 680} {"train_loss": -5.388452529907227, "global_step": 28584, "epoch": 680} {"train_loss": -5.396353721618652, "global_step": 28585, "epoch": 680} {"train_loss": -5.420443058013916, "global_step": 28586, "epoch": 680} {"train_loss": -5.42126989364624, "global_step": 28587, "epoch": 680} {"train_loss": -5.555819988250732, "global_step": 28588, "epoch": 680} {"train_loss": -5.54781436920166, "global_step": 28589, "epoch": 680} {"train_loss": -5.475985050201416, "global_step": 28590, "epoch": 680} {"train_loss": -5.501186370849609, "global_step": 28591, "epoch": 680} {"train_loss": -5.611423015594482, "global_step": 28592, "epoch": 680} {"train_loss": -5.373088359832764, "global_step": 28593, "epoch": 680} {"train_loss": -5.489824295043945, "global_step": 28594, "epoch": 680} {"train_loss": -5.614872932434082, "global_step": 28595, "epoch": 680} {"train_loss": -5.497878074645996, "global_step": 28596, "epoch": 680} {"train_loss": -5.438821792602539, "global_step": 28597, "epoch": 680} {"train_loss": -5.4457173347473145, "global_step": 28598, "epoch": 680} {"train_loss": -5.344757556915283, "global_step": 28599, "epoch": 680} {"train_loss": -5.453210353851318, "global_step": 28600, "epoch": 680} {"train_loss": -5.454175143014817, "global_step": 28601, "epoch": 680, "val_loss": 67473.6015625} {"train_loss": -5.471127510070801, "global_step": 28602, "epoch": 681} {"train_loss": -5.395752429962158, "global_step": 28603, "epoch": 681} {"train_loss": -5.4418840408325195, "global_step": 28604, "epoch": 681} {"train_loss": -5.411628723144531, "global_step": 28605, "epoch": 681} {"train_loss": -5.446610450744629, "global_step": 28606, "epoch": 681} {"train_loss": -5.41249942779541, "global_step": 28607, "epoch": 681} {"train_loss": -5.494678497314453, "global_step": 28608, "epoch": 681} {"train_loss": -5.548449516296387, "global_step": 28609, "epoch": 681} {"train_loss": -5.511992454528809, "global_step": 28610, "epoch": 681} {"train_loss": -5.337648868560791, "global_step": 28611, "epoch": 681} {"train_loss": -5.51920223236084, "global_step": 28612, "epoch": 681} {"train_loss": -5.324261665344238, "global_step": 28613, "epoch": 681} {"train_loss": -5.486814975738525, "global_step": 28614, "epoch": 681} {"train_loss": -5.30576753616333, "global_step": 28615, "epoch": 681} {"train_loss": -5.50921630859375, "global_step": 28616, "epoch": 681} {"train_loss": -5.448273658752441, "global_step": 28617, "epoch": 681} {"train_loss": -5.476417541503906, "global_step": 28618, "epoch": 681} {"train_loss": -5.420975685119629, "global_step": 28619, "epoch": 681} {"train_loss": -5.386078357696533, "global_step": 28620, "epoch": 681} {"train_loss": -5.462296485900879, "global_step": 28621, "epoch": 681} {"train_loss": -5.421180248260498, "global_step": 28622, "epoch": 681} {"train_loss": -5.517398357391357, "global_step": 28623, "epoch": 681} {"train_loss": -5.3788042068481445, "global_step": 28624, "epoch": 681} {"train_loss": -5.379434585571289, "global_step": 28625, "epoch": 681} {"train_loss": -5.392241477966309, "global_step": 28626, "epoch": 681} {"train_loss": -5.410512924194336, "global_step": 28627, "epoch": 681} {"train_loss": -5.493989944458008, "global_step": 28628, "epoch": 681} {"train_loss": -5.249631404876709, "global_step": 28629, "epoch": 681} {"train_loss": -5.508735179901123, "global_step": 28630, "epoch": 681} {"train_loss": -5.4030985832214355, "global_step": 28631, "epoch": 681} {"train_loss": -5.504502773284912, "global_step": 28632, "epoch": 681} {"train_loss": -5.3864898681640625, "global_step": 28633, "epoch": 681} {"train_loss": -5.263490676879883, "global_step": 28634, "epoch": 681} {"train_loss": -5.456976890563965, "global_step": 28635, "epoch": 681} {"train_loss": -5.316656589508057, "global_step": 28636, "epoch": 681} {"train_loss": -5.499871253967285, "global_step": 28637, "epoch": 681} {"train_loss": -5.435737609863281, "global_step": 28638, "epoch": 681} {"train_loss": -5.403858661651611, "global_step": 28639, "epoch": 681} {"train_loss": -5.39793586730957, "global_step": 28640, "epoch": 681} {"train_loss": -5.484624862670898, "global_step": 28641, "epoch": 681} {"train_loss": -5.39981746673584, "global_step": 28642, "epoch": 681} {"train_loss": -5.428409985133579, "global_step": 28643, "epoch": 681, "val_loss": 67224.9453125} {"train_loss": -5.5107011795043945, "global_step": 28644, "epoch": 682} {"train_loss": -5.442485809326172, "global_step": 28645, "epoch": 682} {"train_loss": -5.482576370239258, "global_step": 28646, "epoch": 682} {"train_loss": -5.45704460144043, "global_step": 28647, "epoch": 682} {"train_loss": -5.386532783508301, "global_step": 28648, "epoch": 682} {"train_loss": -5.504124641418457, "global_step": 28649, "epoch": 682} {"train_loss": -5.419633388519287, "global_step": 28650, "epoch": 682} {"train_loss": -5.4830756187438965, "global_step": 28651, "epoch": 682} {"train_loss": -5.43434476852417, "global_step": 28652, "epoch": 682} {"train_loss": -5.309586048126221, "global_step": 28653, "epoch": 682} {"train_loss": -5.4771952629089355, "global_step": 28654, "epoch": 682} {"train_loss": -5.535261631011963, "global_step": 28655, "epoch": 682} {"train_loss": -5.582533836364746, "global_step": 28656, "epoch": 682} {"train_loss": -5.464180946350098, "global_step": 28657, "epoch": 682} {"train_loss": -5.433384418487549, "global_step": 28658, "epoch": 682} {"train_loss": -5.236738204956055, "global_step": 28659, "epoch": 682} {"train_loss": -5.408239841461182, "global_step": 28660, "epoch": 682} {"train_loss": -5.1322760581970215, "global_step": 28661, "epoch": 682} {"train_loss": -5.451312065124512, "global_step": 28662, "epoch": 682} {"train_loss": -5.484614372253418, "global_step": 28663, "epoch": 682} {"train_loss": -5.4552412033081055, "global_step": 28664, "epoch": 682} {"train_loss": -5.4843854904174805, "global_step": 28665, "epoch": 682} {"train_loss": -5.472710132598877, "global_step": 28666, "epoch": 682} {"train_loss": -5.361728668212891, "global_step": 28667, "epoch": 682} {"train_loss": -5.491984844207764, "global_step": 28668, "epoch": 682} {"train_loss": -5.359580993652344, "global_step": 28669, "epoch": 682} {"train_loss": -5.283914566040039, "global_step": 28670, "epoch": 682} {"train_loss": -5.474488258361816, "global_step": 28671, "epoch": 682} {"train_loss": -5.439657211303711, "global_step": 28672, "epoch": 682} {"train_loss": -5.402748107910156, "global_step": 28673, "epoch": 682} {"train_loss": -5.520719528198242, "global_step": 28674, "epoch": 682} {"train_loss": -5.393943786621094, "global_step": 28675, "epoch": 682} {"train_loss": -5.286599159240723, "global_step": 28676, "epoch": 682} {"train_loss": -5.499454021453857, "global_step": 28677, "epoch": 682} {"train_loss": -5.472422122955322, "global_step": 28678, "epoch": 682} {"train_loss": -5.468910217285156, "global_step": 28679, "epoch": 682} {"train_loss": -5.506034851074219, "global_step": 28680, "epoch": 682} {"train_loss": -5.480982780456543, "global_step": 28681, "epoch": 682} {"train_loss": -5.4358320236206055, "global_step": 28682, "epoch": 682} {"train_loss": -5.498871803283691, "global_step": 28683, "epoch": 682} {"train_loss": -5.303274631500244, "global_step": 28684, "epoch": 682} {"train_loss": -5.431774752480643, "global_step": 28685, "epoch": 682, "val_loss": 68051.46875} {"train_loss": -5.450584411621094, "global_step": 28686, "epoch": 683} {"train_loss": -5.443965911865234, "global_step": 28687, "epoch": 683} {"train_loss": -5.5148820877075195, "global_step": 28688, "epoch": 683} {"train_loss": -5.37583065032959, "global_step": 28689, "epoch": 683} {"train_loss": -5.495293617248535, "global_step": 28690, "epoch": 683} {"train_loss": -5.35029935836792, "global_step": 28691, "epoch": 683} {"train_loss": -5.4773268699646, "global_step": 28692, "epoch": 683} {"train_loss": -5.449837684631348, "global_step": 28693, "epoch": 683} {"train_loss": -5.496502876281738, "global_step": 28694, "epoch": 683} {"train_loss": -5.424150466918945, "global_step": 28695, "epoch": 683} {"train_loss": -5.489634037017822, "global_step": 28696, "epoch": 683} {"train_loss": -5.509384632110596, "global_step": 28697, "epoch": 683} {"train_loss": -5.5746870040893555, "global_step": 28698, "epoch": 683} {"train_loss": -5.616125583648682, "global_step": 28699, "epoch": 683} {"train_loss": -5.438044548034668, "global_step": 28700, "epoch": 683} {"train_loss": -5.484350204467773, "global_step": 28701, "epoch": 683} {"train_loss": -5.403870582580566, "global_step": 28702, "epoch": 683} {"train_loss": -5.584492206573486, "global_step": 28703, "epoch": 683} {"train_loss": -5.356228828430176, "global_step": 28704, "epoch": 683} {"train_loss": -5.534430503845215, "global_step": 28705, "epoch": 683} {"train_loss": -5.357206344604492, "global_step": 28706, "epoch": 683} {"train_loss": -5.302243709564209, "global_step": 28707, "epoch": 683} {"train_loss": -5.3653459548950195, "global_step": 28708, "epoch": 683} {"train_loss": -5.461061954498291, "global_step": 28709, "epoch": 683} {"train_loss": -5.109546661376953, "global_step": 28710, "epoch": 683} {"train_loss": -5.368536949157715, "global_step": 28711, "epoch": 683} {"train_loss": -5.300179481506348, "global_step": 28712, "epoch": 683} {"train_loss": -5.24267578125, "global_step": 28713, "epoch": 683} {"train_loss": -5.262310981750488, "global_step": 28714, "epoch": 683} {"train_loss": -5.329861640930176, "global_step": 28715, "epoch": 683} {"train_loss": -5.387773513793945, "global_step": 28716, "epoch": 683} {"train_loss": -5.316025733947754, "global_step": 28717, "epoch": 683} {"train_loss": -5.477619171142578, "global_step": 28718, "epoch": 683} {"train_loss": -5.465888500213623, "global_step": 28719, "epoch": 683} {"train_loss": -5.531513690948486, "global_step": 28720, "epoch": 683} {"train_loss": -5.455358505249023, "global_step": 28721, "epoch": 683} {"train_loss": -5.298572063446045, "global_step": 28722, "epoch": 683} {"train_loss": -5.470915794372559, "global_step": 28723, "epoch": 683} {"train_loss": -5.412683010101318, "global_step": 28724, "epoch": 683} {"train_loss": -5.541558265686035, "global_step": 28725, "epoch": 683} {"train_loss": -5.372707843780518, "global_step": 28726, "epoch": 683} {"train_loss": -5.424747444334484, "global_step": 28727, "epoch": 683, "val_loss": 67502.1015625} {"train_loss": -5.571256637573242, "global_step": 28728, "epoch": 684} {"train_loss": -5.43974494934082, "global_step": 28729, "epoch": 684} {"train_loss": -5.54398775100708, "global_step": 28730, "epoch": 684} {"train_loss": -5.408303737640381, "global_step": 28731, "epoch": 684} {"train_loss": -5.569051265716553, "global_step": 28732, "epoch": 684} {"train_loss": -5.487987995147705, "global_step": 28733, "epoch": 684} {"train_loss": -5.6721906661987305, "global_step": 28734, "epoch": 684} {"train_loss": -5.535517692565918, "global_step": 28735, "epoch": 684} {"train_loss": -5.476656913757324, "global_step": 28736, "epoch": 684} {"train_loss": -5.400278091430664, "global_step": 28737, "epoch": 684} {"train_loss": -5.4633612632751465, "global_step": 28738, "epoch": 684} {"train_loss": -5.539304733276367, "global_step": 28739, "epoch": 684} {"train_loss": -5.391232967376709, "global_step": 28740, "epoch": 684} {"train_loss": -5.428667068481445, "global_step": 28741, "epoch": 684} {"train_loss": -5.539173126220703, "global_step": 28742, "epoch": 684} {"train_loss": -5.385053634643555, "global_step": 28743, "epoch": 684} {"train_loss": -5.4565277099609375, "global_step": 28744, "epoch": 684} {"train_loss": -5.507166862487793, "global_step": 28745, "epoch": 684} {"train_loss": -5.377468109130859, "global_step": 28746, "epoch": 684} {"train_loss": -5.47579288482666, "global_step": 28747, "epoch": 684} {"train_loss": -5.357316017150879, "global_step": 28748, "epoch": 684} {"train_loss": -5.502235412597656, "global_step": 28749, "epoch": 684} {"train_loss": -5.391932010650635, "global_step": 28750, "epoch": 684} {"train_loss": -5.446247100830078, "global_step": 28751, "epoch": 684} {"train_loss": -5.522881031036377, "global_step": 28752, "epoch": 684} {"train_loss": -5.54000997543335, "global_step": 28753, "epoch": 684} {"train_loss": -5.453917980194092, "global_step": 28754, "epoch": 684} {"train_loss": -5.310227870941162, "global_step": 28755, "epoch": 684} {"train_loss": -5.472352027893066, "global_step": 28756, "epoch": 684} {"train_loss": -5.5727972984313965, "global_step": 28757, "epoch": 684} {"train_loss": -5.418741226196289, "global_step": 28758, "epoch": 684} {"train_loss": -5.447556972503662, "global_step": 28759, "epoch": 684} {"train_loss": -5.345612049102783, "global_step": 28760, "epoch": 684} {"train_loss": -5.2866010665893555, "global_step": 28761, "epoch": 684} {"train_loss": -5.35568904876709, "global_step": 28762, "epoch": 684} {"train_loss": -5.518586158752441, "global_step": 28763, "epoch": 684} {"train_loss": -5.3527326583862305, "global_step": 28764, "epoch": 684} {"train_loss": -5.542364120483398, "global_step": 28765, "epoch": 684} {"train_loss": -5.441563606262207, "global_step": 28766, "epoch": 684} {"train_loss": -5.505184173583984, "global_step": 28767, "epoch": 684} {"train_loss": -5.492257118225098, "global_step": 28768, "epoch": 684} {"train_loss": -5.463227862403507, "global_step": 28769, "epoch": 684, "val_loss": 67092.984375} {"train_loss": -5.4418253898620605, "global_step": 28770, "epoch": 685} {"train_loss": -5.408642292022705, "global_step": 28771, "epoch": 685} {"train_loss": -5.4619903564453125, "global_step": 28772, "epoch": 685} {"train_loss": -5.467755317687988, "global_step": 28773, "epoch": 685} {"train_loss": -5.631132125854492, "global_step": 28774, "epoch": 685} {"train_loss": -5.389784812927246, "global_step": 28775, "epoch": 685} {"train_loss": -5.5489888191223145, "global_step": 28776, "epoch": 685} {"train_loss": -5.416087627410889, "global_step": 28777, "epoch": 685} {"train_loss": -5.523339748382568, "global_step": 28778, "epoch": 685} {"train_loss": -5.526808261871338, "global_step": 28779, "epoch": 685} {"train_loss": -5.442901611328125, "global_step": 28780, "epoch": 685} {"train_loss": -5.495279788970947, "global_step": 28781, "epoch": 685} {"train_loss": -5.410986423492432, "global_step": 28782, "epoch": 685} {"train_loss": -5.4389801025390625, "global_step": 28783, "epoch": 685} {"train_loss": -5.424773216247559, "global_step": 28784, "epoch": 685} {"train_loss": -5.526900291442871, "global_step": 28785, "epoch": 685} {"train_loss": -5.413468360900879, "global_step": 28786, "epoch": 685} {"train_loss": -5.40718936920166, "global_step": 28787, "epoch": 685} {"train_loss": -5.4953742027282715, "global_step": 28788, "epoch": 685} {"train_loss": -5.493403911590576, "global_step": 28789, "epoch": 685} {"train_loss": -5.387019157409668, "global_step": 28790, "epoch": 685} {"train_loss": -5.497560501098633, "global_step": 28791, "epoch": 685} {"train_loss": -5.434518814086914, "global_step": 28792, "epoch": 685} {"train_loss": -5.4779582023620605, "global_step": 28793, "epoch": 685} {"train_loss": -5.402170181274414, "global_step": 28794, "epoch": 685} {"train_loss": -5.374170303344727, "global_step": 28795, "epoch": 685} {"train_loss": -5.6049113273620605, "global_step": 28796, "epoch": 685} {"train_loss": -5.550059795379639, "global_step": 28797, "epoch": 685} {"train_loss": -5.47585391998291, "global_step": 28798, "epoch": 685} {"train_loss": -5.458901405334473, "global_step": 28799, "epoch": 685} {"train_loss": -5.5693464279174805, "global_step": 28800, "epoch": 685} {"train_loss": -5.557546138763428, "global_step": 28801, "epoch": 685} {"train_loss": -5.370545387268066, "global_step": 28802, "epoch": 685} {"train_loss": -5.308907985687256, "global_step": 28803, "epoch": 685} {"train_loss": -5.38794469833374, "global_step": 28804, "epoch": 685} {"train_loss": -5.399446487426758, "global_step": 28805, "epoch": 685} {"train_loss": -5.563847541809082, "global_step": 28806, "epoch": 685} {"train_loss": -5.538516044616699, "global_step": 28807, "epoch": 685} {"train_loss": -5.448266983032227, "global_step": 28808, "epoch": 685} {"train_loss": -5.386748313903809, "global_step": 28809, "epoch": 685} {"train_loss": -5.580170154571533, "global_step": 28810, "epoch": 685} {"train_loss": -5.46321025348845, "global_step": 28811, "epoch": 685, "val_loss": 67430.4375} {"train_loss": -5.4598069190979, "global_step": 28812, "epoch": 686} {"train_loss": -5.44144344329834, "global_step": 28813, "epoch": 686} {"train_loss": -5.4059906005859375, "global_step": 28814, "epoch": 686} {"train_loss": -5.534446716308594, "global_step": 28815, "epoch": 686} {"train_loss": -5.553993225097656, "global_step": 28816, "epoch": 686} {"train_loss": -5.342803001403809, "global_step": 28817, "epoch": 686} {"train_loss": -5.478983402252197, "global_step": 28818, "epoch": 686} {"train_loss": -5.425982475280762, "global_step": 28819, "epoch": 686} {"train_loss": -5.507628440856934, "global_step": 28820, "epoch": 686} {"train_loss": -5.562380790710449, "global_step": 28821, "epoch": 686} {"train_loss": -5.352928161621094, "global_step": 28822, "epoch": 686} {"train_loss": -5.353848457336426, "global_step": 28823, "epoch": 686} {"train_loss": -5.526655673980713, "global_step": 28824, "epoch": 686} {"train_loss": -5.3342084884643555, "global_step": 28825, "epoch": 686} {"train_loss": -5.514243125915527, "global_step": 28826, "epoch": 686} {"train_loss": -5.496547698974609, "global_step": 28827, "epoch": 686} {"train_loss": -5.356095314025879, "global_step": 28828, "epoch": 686} {"train_loss": -5.517271518707275, "global_step": 28829, "epoch": 686} {"train_loss": -5.425337314605713, "global_step": 28830, "epoch": 686} {"train_loss": -5.36783504486084, "global_step": 28831, "epoch": 686} {"train_loss": -5.449231147766113, "global_step": 28832, "epoch": 686} {"train_loss": -5.542168617248535, "global_step": 28833, "epoch": 686} {"train_loss": -5.516881942749023, "global_step": 28834, "epoch": 686} {"train_loss": -5.454553604125977, "global_step": 28835, "epoch": 686} {"train_loss": -5.276242256164551, "global_step": 28836, "epoch": 686} {"train_loss": -5.422375679016113, "global_step": 28837, "epoch": 686} {"train_loss": -5.484751224517822, "global_step": 28838, "epoch": 686} {"train_loss": -5.474941253662109, "global_step": 28839, "epoch": 686} {"train_loss": -5.4444379806518555, "global_step": 28840, "epoch": 686} {"train_loss": -5.359892845153809, "global_step": 28841, "epoch": 686} {"train_loss": -5.431816101074219, "global_step": 28842, "epoch": 686} {"train_loss": -5.357336521148682, "global_step": 28843, "epoch": 686} {"train_loss": -5.426578521728516, "global_step": 28844, "epoch": 686} {"train_loss": -5.362183570861816, "global_step": 28845, "epoch": 686} {"train_loss": -5.4777631759643555, "global_step": 28846, "epoch": 686} {"train_loss": -5.437933444976807, "global_step": 28847, "epoch": 686} {"train_loss": -5.5121989250183105, "global_step": 28848, "epoch": 686} {"train_loss": -5.403187274932861, "global_step": 28849, "epoch": 686} {"train_loss": -5.419711112976074, "global_step": 28850, "epoch": 686} {"train_loss": -5.488865375518799, "global_step": 28851, "epoch": 686} {"train_loss": -5.334406852722168, "global_step": 28852, "epoch": 686} {"train_loss": -5.438825482413883, "global_step": 28853, "epoch": 686, "val_loss": 66877.90625} {"train_loss": -5.362853050231934, "global_step": 28854, "epoch": 687} {"train_loss": -5.335415840148926, "global_step": 28855, "epoch": 687} {"train_loss": -5.43064546585083, "global_step": 28856, "epoch": 687} {"train_loss": -5.435779571533203, "global_step": 28857, "epoch": 687} {"train_loss": -5.402151107788086, "global_step": 28858, "epoch": 687} {"train_loss": -5.4173736572265625, "global_step": 28859, "epoch": 687} {"train_loss": -5.381129264831543, "global_step": 28860, "epoch": 687} {"train_loss": -5.477753639221191, "global_step": 28861, "epoch": 687} {"train_loss": -5.422379970550537, "global_step": 28862, "epoch": 687} {"train_loss": -5.474947929382324, "global_step": 28863, "epoch": 687} {"train_loss": -5.493216514587402, "global_step": 28864, "epoch": 687} {"train_loss": -5.436310768127441, "global_step": 28865, "epoch": 687} {"train_loss": -5.515866279602051, "global_step": 28866, "epoch": 687} {"train_loss": -5.496000289916992, "global_step": 28867, "epoch": 687} {"train_loss": -5.326916694641113, "global_step": 28868, "epoch": 687} {"train_loss": -5.419002056121826, "global_step": 28869, "epoch": 687} {"train_loss": -5.420535087585449, "global_step": 28870, "epoch": 687} {"train_loss": -5.438405513763428, "global_step": 28871, "epoch": 687} {"train_loss": -5.472049236297607, "global_step": 28872, "epoch": 687} {"train_loss": -5.4327073097229, "global_step": 28873, "epoch": 687} {"train_loss": -5.36824369430542, "global_step": 28874, "epoch": 687} {"train_loss": -5.440459251403809, "global_step": 28875, "epoch": 687} {"train_loss": -5.427423477172852, "global_step": 28876, "epoch": 687} {"train_loss": -5.430019378662109, "global_step": 28877, "epoch": 687} {"train_loss": -5.450477600097656, "global_step": 28878, "epoch": 687} {"train_loss": -5.690068244934082, "global_step": 28879, "epoch": 687} {"train_loss": -5.302640914916992, "global_step": 28880, "epoch": 687} {"train_loss": -5.327299118041992, "global_step": 28881, "epoch": 687} {"train_loss": -5.493334770202637, "global_step": 28882, "epoch": 687} {"train_loss": -5.2794952392578125, "global_step": 28883, "epoch": 687} {"train_loss": -5.441438674926758, "global_step": 28884, "epoch": 687} {"train_loss": -5.4692559242248535, "global_step": 28885, "epoch": 687} {"train_loss": -5.601428031921387, "global_step": 28886, "epoch": 687} {"train_loss": -5.429701805114746, "global_step": 28887, "epoch": 687} {"train_loss": -5.535545349121094, "global_step": 28888, "epoch": 687} {"train_loss": -5.532803535461426, "global_step": 28889, "epoch": 687} {"train_loss": -5.416041851043701, "global_step": 28890, "epoch": 687} {"train_loss": -5.490537643432617, "global_step": 28891, "epoch": 687} {"train_loss": -5.333521842956543, "global_step": 28892, "epoch": 687} {"train_loss": -5.4056010246276855, "global_step": 28893, "epoch": 687} {"train_loss": -5.334620952606201, "global_step": 28894, "epoch": 687} {"train_loss": -5.437197185698009, "global_step": 28895, "epoch": 687, "val_loss": 67370.8515625} {"train_loss": -5.466135501861572, "global_step": 28896, "epoch": 688} {"train_loss": -5.4666643142700195, "global_step": 28897, "epoch": 688} {"train_loss": -5.392251014709473, "global_step": 28898, "epoch": 688} {"train_loss": -5.462621688842773, "global_step": 28899, "epoch": 688} {"train_loss": -5.452373504638672, "global_step": 28900, "epoch": 688} {"train_loss": -5.481240749359131, "global_step": 28901, "epoch": 688} {"train_loss": -5.4822998046875, "global_step": 28902, "epoch": 688} {"train_loss": -5.434823036193848, "global_step": 28903, "epoch": 688} {"train_loss": -5.47773551940918, "global_step": 28904, "epoch": 688} {"train_loss": -5.470340728759766, "global_step": 28905, "epoch": 688} {"train_loss": -5.399123668670654, "global_step": 28906, "epoch": 688} {"train_loss": -5.440271854400635, "global_step": 28907, "epoch": 688} {"train_loss": -5.428858757019043, "global_step": 28908, "epoch": 688} {"train_loss": -5.43833589553833, "global_step": 28909, "epoch": 688} {"train_loss": -5.620954513549805, "global_step": 28910, "epoch": 688} {"train_loss": -5.448174476623535, "global_step": 28911, "epoch": 688} {"train_loss": -5.561241626739502, "global_step": 28912, "epoch": 688} {"train_loss": -5.542513847351074, "global_step": 28913, "epoch": 688} {"train_loss": -5.654362678527832, "global_step": 28914, "epoch": 688} {"train_loss": -5.599359035491943, "global_step": 28915, "epoch": 688} {"train_loss": -5.453761100769043, "global_step": 28916, "epoch": 688} {"train_loss": -5.468973636627197, "global_step": 28917, "epoch": 688} {"train_loss": -5.479007720947266, "global_step": 28918, "epoch": 688} {"train_loss": -5.566246032714844, "global_step": 28919, "epoch": 688} {"train_loss": -5.416267395019531, "global_step": 28920, "epoch": 688} {"train_loss": -5.517178058624268, "global_step": 28921, "epoch": 688} {"train_loss": -5.496364593505859, "global_step": 28922, "epoch": 688} {"train_loss": -5.306139945983887, "global_step": 28923, "epoch": 688} {"train_loss": -5.434546947479248, "global_step": 28924, "epoch": 688} {"train_loss": -5.496882438659668, "global_step": 28925, "epoch": 688} {"train_loss": -5.475900650024414, "global_step": 28926, "epoch": 688} {"train_loss": -5.600135326385498, "global_step": 28927, "epoch": 688} {"train_loss": -5.377655506134033, "global_step": 28928, "epoch": 688} {"train_loss": -5.45744514465332, "global_step": 28929, "epoch": 688} {"train_loss": -5.50167179107666, "global_step": 28930, "epoch": 688} {"train_loss": -5.38789176940918, "global_step": 28931, "epoch": 688} {"train_loss": -5.519479751586914, "global_step": 28932, "epoch": 688} {"train_loss": -5.4266557693481445, "global_step": 28933, "epoch": 688} {"train_loss": -5.501001358032227, "global_step": 28934, "epoch": 688} {"train_loss": -5.630222320556641, "global_step": 28935, "epoch": 688} {"train_loss": -5.188549041748047, "global_step": 28936, "epoch": 688} {"train_loss": -5.470752307346889, "global_step": 28937, "epoch": 688, "val_loss": 67096.765625} {"train_loss": -5.511557579040527, "global_step": 28938, "epoch": 689} {"train_loss": -5.336721420288086, "global_step": 28939, "epoch": 689} {"train_loss": -5.572592258453369, "global_step": 28940, "epoch": 689} {"train_loss": -5.325507164001465, "global_step": 28941, "epoch": 689} {"train_loss": -5.553683757781982, "global_step": 28942, "epoch": 689} {"train_loss": -5.227571487426758, "global_step": 28943, "epoch": 689} {"train_loss": -5.3854780197143555, "global_step": 28944, "epoch": 689} {"train_loss": -5.302201271057129, "global_step": 28945, "epoch": 689} {"train_loss": -5.432926654815674, "global_step": 28946, "epoch": 689} {"train_loss": -5.414886951446533, "global_step": 28947, "epoch": 689} {"train_loss": -5.453644752502441, "global_step": 28948, "epoch": 689} {"train_loss": -5.421939849853516, "global_step": 28949, "epoch": 689} {"train_loss": -5.39215087890625, "global_step": 28950, "epoch": 689} {"train_loss": -5.368842601776123, "global_step": 28951, "epoch": 689} {"train_loss": -5.367783069610596, "global_step": 28952, "epoch": 689} {"train_loss": -5.3961358070373535, "global_step": 28953, "epoch": 689} {"train_loss": -5.414185523986816, "global_step": 28954, "epoch": 689} {"train_loss": -5.417019844055176, "global_step": 28955, "epoch": 689} {"train_loss": -5.347203731536865, "global_step": 28956, "epoch": 689} {"train_loss": -5.52940559387207, "global_step": 28957, "epoch": 689} {"train_loss": -5.366924285888672, "global_step": 28958, "epoch": 689} {"train_loss": -5.471278190612793, "global_step": 28959, "epoch": 689} {"train_loss": -5.622801780700684, "global_step": 28960, "epoch": 689} {"train_loss": -5.453683853149414, "global_step": 28961, "epoch": 689} {"train_loss": -5.486943244934082, "global_step": 28962, "epoch": 689} {"train_loss": -5.431487083435059, "global_step": 28963, "epoch": 689} {"train_loss": -5.46873140335083, "global_step": 28964, "epoch": 689} {"train_loss": -5.513258457183838, "global_step": 28965, "epoch": 689} {"train_loss": -5.411864757537842, "global_step": 28966, "epoch": 689} {"train_loss": -5.477835655212402, "global_step": 28967, "epoch": 689} {"train_loss": -5.338873386383057, "global_step": 28968, "epoch": 689} {"train_loss": -5.598524570465088, "global_step": 28969, "epoch": 689} {"train_loss": -5.355022430419922, "global_step": 28970, "epoch": 689} {"train_loss": -5.564509391784668, "global_step": 28971, "epoch": 689} {"train_loss": -5.655256271362305, "global_step": 28972, "epoch": 689} {"train_loss": -5.607990264892578, "global_step": 28973, "epoch": 689} {"train_loss": -5.346165657043457, "global_step": 28974, "epoch": 689} {"train_loss": -5.541474342346191, "global_step": 28975, "epoch": 689} {"train_loss": -5.500061988830566, "global_step": 28976, "epoch": 689} {"train_loss": -5.401983737945557, "global_step": 28977, "epoch": 689} {"train_loss": -5.599830627441406, "global_step": 28978, "epoch": 689} {"train_loss": -5.447176706223261, "global_step": 28979, "epoch": 689, "val_loss": 66641.21875} {"train_loss": -5.42881965637207, "global_step": 28980, "epoch": 690} {"train_loss": -5.304386138916016, "global_step": 28981, "epoch": 690} {"train_loss": -5.475600242614746, "global_step": 28982, "epoch": 690} {"train_loss": -5.437502861022949, "global_step": 28983, "epoch": 690} {"train_loss": -5.428239822387695, "global_step": 28984, "epoch": 690} {"train_loss": -5.531249046325684, "global_step": 28985, "epoch": 690} {"train_loss": -5.574803352355957, "global_step": 28986, "epoch": 690} {"train_loss": -5.6562700271606445, "global_step": 28987, "epoch": 690} {"train_loss": -5.349588871002197, "global_step": 28988, "epoch": 690} {"train_loss": -5.472914695739746, "global_step": 28989, "epoch": 690} {"train_loss": -5.445438385009766, "global_step": 28990, "epoch": 690} {"train_loss": -5.600362777709961, "global_step": 28991, "epoch": 690} {"train_loss": -5.5257086753845215, "global_step": 28992, "epoch": 690} {"train_loss": -5.446812629699707, "global_step": 28993, "epoch": 690} {"train_loss": -5.483399391174316, "global_step": 28994, "epoch": 690} {"train_loss": -5.448451995849609, "global_step": 28995, "epoch": 690} {"train_loss": -5.516397476196289, "global_step": 28996, "epoch": 690} {"train_loss": -5.440120697021484, "global_step": 28997, "epoch": 690} {"train_loss": -5.327624320983887, "global_step": 28998, "epoch": 690} {"train_loss": -5.441283226013184, "global_step": 28999, "epoch": 690} {"train_loss": -5.466064453125, "global_step": 29000, "epoch": 690} {"train_loss": -5.4043660163879395, "global_step": 29001, "epoch": 690} {"train_loss": -5.532078266143799, "global_step": 29002, "epoch": 690} {"train_loss": -5.592470169067383, "global_step": 29003, "epoch": 690} {"train_loss": -5.476276397705078, "global_step": 29004, "epoch": 690} {"train_loss": -5.6480488777160645, "global_step": 29005, "epoch": 690} {"train_loss": -5.499429225921631, "global_step": 29006, "epoch": 690} {"train_loss": -5.473201751708984, "global_step": 29007, "epoch": 690} {"train_loss": -5.5786285400390625, "global_step": 29008, "epoch": 690} {"train_loss": -5.402949333190918, "global_step": 29009, "epoch": 690} {"train_loss": -5.4464921951293945, "global_step": 29010, "epoch": 690} {"train_loss": -5.451032638549805, "global_step": 29011, "epoch": 690} {"train_loss": -5.538536071777344, "global_step": 29012, "epoch": 690} {"train_loss": -5.5389909744262695, "global_step": 29013, "epoch": 690} {"train_loss": -5.431188583374023, "global_step": 29014, "epoch": 690} {"train_loss": -5.526429176330566, "global_step": 29015, "epoch": 690} {"train_loss": -5.568212509155273, "global_step": 29016, "epoch": 690} {"train_loss": -5.553916931152344, "global_step": 29017, "epoch": 690} {"train_loss": -5.553114414215088, "global_step": 29018, "epoch": 690} {"train_loss": -5.529987335205078, "global_step": 29019, "epoch": 690} {"train_loss": -5.4692254066467285, "global_step": 29020, "epoch": 690} {"train_loss": -5.484940040679205, "global_step": 29021, "epoch": 690, "val_loss": 67340.9453125} {"train_loss": -5.402370452880859, "global_step": 29022, "epoch": 691} {"train_loss": -5.423765182495117, "global_step": 29023, "epoch": 691} {"train_loss": -5.458059787750244, "global_step": 29024, "epoch": 691} {"train_loss": -5.352800369262695, "global_step": 29025, "epoch": 691} {"train_loss": -5.496201515197754, "global_step": 29026, "epoch": 691} {"train_loss": -5.443551063537598, "global_step": 29027, "epoch": 691} {"train_loss": -5.472829818725586, "global_step": 29028, "epoch": 691} {"train_loss": -5.386477947235107, "global_step": 29029, "epoch": 691} {"train_loss": -5.5236992835998535, "global_step": 29030, "epoch": 691} {"train_loss": -5.333701133728027, "global_step": 29031, "epoch": 691} {"train_loss": -5.621098518371582, "global_step": 29032, "epoch": 691} {"train_loss": -5.497550010681152, "global_step": 29033, "epoch": 691} {"train_loss": -5.427026271820068, "global_step": 29034, "epoch": 691} {"train_loss": -5.477372646331787, "global_step": 29035, "epoch": 691} {"train_loss": -5.483491897583008, "global_step": 29036, "epoch": 691} {"train_loss": -5.431051254272461, "global_step": 29037, "epoch": 691} {"train_loss": -5.411409378051758, "global_step": 29038, "epoch": 691} {"train_loss": -5.572071075439453, "global_step": 29039, "epoch": 691} {"train_loss": -5.576201438903809, "global_step": 29040, "epoch": 691} {"train_loss": -5.404561519622803, "global_step": 29041, "epoch": 691} {"train_loss": -5.534194469451904, "global_step": 29042, "epoch": 691} {"train_loss": -5.561781883239746, "global_step": 29043, "epoch": 691} {"train_loss": -5.502213478088379, "global_step": 29044, "epoch": 691} {"train_loss": -5.444546699523926, "global_step": 29045, "epoch": 691} {"train_loss": -5.402592658996582, "global_step": 29046, "epoch": 691} {"train_loss": -5.443150520324707, "global_step": 29047, "epoch": 691} {"train_loss": -5.529129981994629, "global_step": 29048, "epoch": 691} {"train_loss": -5.481538772583008, "global_step": 29049, "epoch": 691} {"train_loss": -5.459347248077393, "global_step": 29050, "epoch": 691} {"train_loss": -5.407218933105469, "global_step": 29051, "epoch": 691} {"train_loss": -5.446329116821289, "global_step": 29052, "epoch": 691} {"train_loss": -5.427104949951172, "global_step": 29053, "epoch": 691} {"train_loss": -5.569573402404785, "global_step": 29054, "epoch": 691} {"train_loss": -5.387564659118652, "global_step": 29055, "epoch": 691} {"train_loss": -5.458056449890137, "global_step": 29056, "epoch": 691} {"train_loss": -5.4825944900512695, "global_step": 29057, "epoch": 691} {"train_loss": -5.556400299072266, "global_step": 29058, "epoch": 691} {"train_loss": -5.325495719909668, "global_step": 29059, "epoch": 691} {"train_loss": -5.510402679443359, "global_step": 29060, "epoch": 691} {"train_loss": -5.419632911682129, "global_step": 29061, "epoch": 691} {"train_loss": -5.394418716430664, "global_step": 29062, "epoch": 691} {"train_loss": -5.459087644304548, "global_step": 29063, "epoch": 691, "val_loss": 67023.890625} {"train_loss": -5.444099426269531, "global_step": 29064, "epoch": 692} {"train_loss": -5.310610294342041, "global_step": 29065, "epoch": 692} {"train_loss": -5.4534711837768555, "global_step": 29066, "epoch": 692} {"train_loss": -5.455694198608398, "global_step": 29067, "epoch": 692} {"train_loss": -5.475961208343506, "global_step": 29068, "epoch": 692} {"train_loss": -5.539560317993164, "global_step": 29069, "epoch": 692} {"train_loss": -5.499417781829834, "global_step": 29070, "epoch": 692} {"train_loss": -5.5629072189331055, "global_step": 29071, "epoch": 692} {"train_loss": -5.536317348480225, "global_step": 29072, "epoch": 692} {"train_loss": -5.545226573944092, "global_step": 29073, "epoch": 692} {"train_loss": -5.485682487487793, "global_step": 29074, "epoch": 692} {"train_loss": -5.35406494140625, "global_step": 29075, "epoch": 692} {"train_loss": -5.5145134925842285, "global_step": 29076, "epoch": 692} {"train_loss": -5.432419776916504, "global_step": 29077, "epoch": 692} {"train_loss": -5.556713104248047, "global_step": 29078, "epoch": 692} {"train_loss": -5.583230018615723, "global_step": 29079, "epoch": 692} {"train_loss": -5.535712242126465, "global_step": 29080, "epoch": 692} {"train_loss": -5.340119361877441, "global_step": 29081, "epoch": 692} {"train_loss": -5.393880844116211, "global_step": 29082, "epoch": 692} {"train_loss": -5.43287992477417, "global_step": 29083, "epoch": 692} {"train_loss": -5.471339225769043, "global_step": 29084, "epoch": 692} {"train_loss": -5.334013938903809, "global_step": 29085, "epoch": 692} {"train_loss": -5.4397101402282715, "global_step": 29086, "epoch": 692} {"train_loss": -5.377801418304443, "global_step": 29087, "epoch": 692} {"train_loss": -5.363984107971191, "global_step": 29088, "epoch": 692} {"train_loss": -5.444286823272705, "global_step": 29089, "epoch": 692} {"train_loss": -5.560582160949707, "global_step": 29090, "epoch": 692} {"train_loss": -5.455312728881836, "global_step": 29091, "epoch": 692} {"train_loss": -5.503515243530273, "global_step": 29092, "epoch": 692} {"train_loss": -5.439309120178223, "global_step": 29093, "epoch": 692} {"train_loss": -5.513378143310547, "global_step": 29094, "epoch": 692} {"train_loss": -5.491781234741211, "global_step": 29095, "epoch": 692} {"train_loss": -5.459552764892578, "global_step": 29096, "epoch": 692} {"train_loss": -5.427124500274658, "global_step": 29097, "epoch": 692} {"train_loss": -5.457080841064453, "global_step": 29098, "epoch": 692} {"train_loss": -5.5230712890625, "global_step": 29099, "epoch": 692} {"train_loss": -5.434409141540527, "global_step": 29100, "epoch": 692} {"train_loss": -5.335012435913086, "global_step": 29101, "epoch": 692} {"train_loss": -5.365317344665527, "global_step": 29102, "epoch": 692} {"train_loss": -5.423183441162109, "global_step": 29103, "epoch": 692} {"train_loss": -5.430871963500977, "global_step": 29104, "epoch": 692} {"train_loss": -5.457633529390607, "global_step": 29105, "epoch": 692, "val_loss": 67760.4609375} {"train_loss": -5.342658042907715, "global_step": 29106, "epoch": 693} {"train_loss": -5.350668907165527, "global_step": 29107, "epoch": 693} {"train_loss": -5.438509941101074, "global_step": 29108, "epoch": 693} {"train_loss": -5.511715888977051, "global_step": 29109, "epoch": 693} {"train_loss": -5.384834289550781, "global_step": 29110, "epoch": 693} {"train_loss": -5.508933067321777, "global_step": 29111, "epoch": 693} {"train_loss": -5.42833137512207, "global_step": 29112, "epoch": 693} {"train_loss": -5.477313995361328, "global_step": 29113, "epoch": 693} {"train_loss": -5.43453311920166, "global_step": 29114, "epoch": 693} {"train_loss": -5.28420352935791, "global_step": 29115, "epoch": 693} {"train_loss": -5.589533805847168, "global_step": 29116, "epoch": 693} {"train_loss": -5.371509075164795, "global_step": 29117, "epoch": 693} {"train_loss": -5.5389509201049805, "global_step": 29118, "epoch": 693} {"train_loss": -5.453042507171631, "global_step": 29119, "epoch": 693} {"train_loss": -5.5491132736206055, "global_step": 29120, "epoch": 693} {"train_loss": -5.357351303100586, "global_step": 29121, "epoch": 693} {"train_loss": -5.480766296386719, "global_step": 29122, "epoch": 693} {"train_loss": -5.316414833068848, "global_step": 29123, "epoch": 693} {"train_loss": -5.4435715675354, "global_step": 29124, "epoch": 693} {"train_loss": -5.538562774658203, "global_step": 29125, "epoch": 693} {"train_loss": -5.2950119972229, "global_step": 29126, "epoch": 693} {"train_loss": -5.287999153137207, "global_step": 29127, "epoch": 693} {"train_loss": -5.519853591918945, "global_step": 29128, "epoch": 693} {"train_loss": -5.336335182189941, "global_step": 29129, "epoch": 693} {"train_loss": -5.506417274475098, "global_step": 29130, "epoch": 693} {"train_loss": -5.573038101196289, "global_step": 29131, "epoch": 693} {"train_loss": -5.36872673034668, "global_step": 29132, "epoch": 693} {"train_loss": -5.514931678771973, "global_step": 29133, "epoch": 693} {"train_loss": -5.434028625488281, "global_step": 29134, "epoch": 693} {"train_loss": -5.572998046875, "global_step": 29135, "epoch": 693} {"train_loss": -5.404486179351807, "global_step": 29136, "epoch": 693} {"train_loss": -5.406057357788086, "global_step": 29137, "epoch": 693} {"train_loss": -5.543951034545898, "global_step": 29138, "epoch": 693} {"train_loss": -5.428841590881348, "global_step": 29139, "epoch": 693} {"train_loss": -5.323472023010254, "global_step": 29140, "epoch": 693} {"train_loss": -5.5580220222473145, "global_step": 29141, "epoch": 693} {"train_loss": -5.3786940574646, "global_step": 29142, "epoch": 693} {"train_loss": -5.462225914001465, "global_step": 29143, "epoch": 693} {"train_loss": -5.47227668762207, "global_step": 29144, "epoch": 693} {"train_loss": -5.491925239562988, "global_step": 29145, "epoch": 693} {"train_loss": -5.455778121948242, "global_step": 29146, "epoch": 693} {"train_loss": -5.443965003603981, "global_step": 29147, "epoch": 693, "val_loss": 67679.609375} {"train_loss": -5.483908653259277, "global_step": 29148, "epoch": 694} {"train_loss": -5.47703742980957, "global_step": 29149, "epoch": 694} {"train_loss": -5.442216396331787, "global_step": 29150, "epoch": 694} {"train_loss": -5.355132102966309, "global_step": 29151, "epoch": 694} {"train_loss": -5.585566520690918, "global_step": 29152, "epoch": 694} {"train_loss": -5.48464298248291, "global_step": 29153, "epoch": 694} {"train_loss": -5.372194290161133, "global_step": 29154, "epoch": 694} {"train_loss": -5.460805416107178, "global_step": 29155, "epoch": 694} {"train_loss": -5.397528648376465, "global_step": 29156, "epoch": 694} {"train_loss": -5.349460124969482, "global_step": 29157, "epoch": 694} {"train_loss": -5.417719841003418, "global_step": 29158, "epoch": 694} {"train_loss": -5.530012130737305, "global_step": 29159, "epoch": 694} {"train_loss": -5.480956077575684, "global_step": 29160, "epoch": 694} {"train_loss": -5.418415069580078, "global_step": 29161, "epoch": 694} {"train_loss": -5.389132499694824, "global_step": 29162, "epoch": 694} {"train_loss": -5.433896064758301, "global_step": 29163, "epoch": 694} {"train_loss": -5.5259599685668945, "global_step": 29164, "epoch": 694} {"train_loss": -5.420273303985596, "global_step": 29165, "epoch": 694} {"train_loss": -5.478110313415527, "global_step": 29166, "epoch": 694} {"train_loss": -5.532594680786133, "global_step": 29167, "epoch": 694} {"train_loss": -5.555984973907471, "global_step": 29168, "epoch": 694} {"train_loss": -5.4154205322265625, "global_step": 29169, "epoch": 694} {"train_loss": -5.534669876098633, "global_step": 29170, "epoch": 694} {"train_loss": -5.572881698608398, "global_step": 29171, "epoch": 694} {"train_loss": -5.3992815017700195, "global_step": 29172, "epoch": 694} {"train_loss": -5.4439849853515625, "global_step": 29173, "epoch": 694} {"train_loss": -5.421058177947998, "global_step": 29174, "epoch": 694} {"train_loss": -5.324471473693848, "global_step": 29175, "epoch": 694} {"train_loss": -5.512294769287109, "global_step": 29176, "epoch": 694} {"train_loss": -5.480412483215332, "global_step": 29177, "epoch": 694} {"train_loss": -5.36521053314209, "global_step": 29178, "epoch": 694} {"train_loss": -5.47968053817749, "global_step": 29179, "epoch": 694} {"train_loss": -5.410874843597412, "global_step": 29180, "epoch": 694} {"train_loss": -5.326704502105713, "global_step": 29181, "epoch": 694} {"train_loss": -5.345431327819824, "global_step": 29182, "epoch": 694} {"train_loss": -5.517704010009766, "global_step": 29183, "epoch": 694} {"train_loss": -5.44627571105957, "global_step": 29184, "epoch": 694} {"train_loss": -5.321127891540527, "global_step": 29185, "epoch": 694} {"train_loss": -5.41703462600708, "global_step": 29186, "epoch": 694} {"train_loss": -5.541179656982422, "global_step": 29187, "epoch": 694} {"train_loss": -5.462834358215332, "global_step": 29188, "epoch": 694} {"train_loss": -5.447715498152233, "global_step": 29189, "epoch": 694, "val_loss": 67072.1640625} {"train_loss": -5.500336647033691, "global_step": 29190, "epoch": 695} {"train_loss": -5.558151721954346, "global_step": 29191, "epoch": 695} {"train_loss": -5.373256206512451, "global_step": 29192, "epoch": 695} {"train_loss": -5.503323078155518, "global_step": 29193, "epoch": 695} {"train_loss": -5.304776191711426, "global_step": 29194, "epoch": 695} {"train_loss": -5.533824920654297, "global_step": 29195, "epoch": 695} {"train_loss": -5.35611629486084, "global_step": 29196, "epoch": 695} {"train_loss": -5.4263715744018555, "global_step": 29197, "epoch": 695} {"train_loss": -5.392078399658203, "global_step": 29198, "epoch": 695} {"train_loss": -5.319665431976318, "global_step": 29199, "epoch": 695} {"train_loss": -5.531746864318848, "global_step": 29200, "epoch": 695} {"train_loss": -5.424949645996094, "global_step": 29201, "epoch": 695} {"train_loss": -5.430628776550293, "global_step": 29202, "epoch": 695} {"train_loss": -5.461038589477539, "global_step": 29203, "epoch": 695} {"train_loss": -5.4346747398376465, "global_step": 29204, "epoch": 695} {"train_loss": -5.332372665405273, "global_step": 29205, "epoch": 695} {"train_loss": -5.501333713531494, "global_step": 29206, "epoch": 695} {"train_loss": -5.353711128234863, "global_step": 29207, "epoch": 695} {"train_loss": -5.576797962188721, "global_step": 29208, "epoch": 695} {"train_loss": -5.546870231628418, "global_step": 29209, "epoch": 695} {"train_loss": -5.552753448486328, "global_step": 29210, "epoch": 695} {"train_loss": -5.500662803649902, "global_step": 29211, "epoch": 695} {"train_loss": -5.416399955749512, "global_step": 29212, "epoch": 695} {"train_loss": -5.408806324005127, "global_step": 29213, "epoch": 695} {"train_loss": -5.541539192199707, "global_step": 29214, "epoch": 695} {"train_loss": -5.618186950683594, "global_step": 29215, "epoch": 695} {"train_loss": -5.348804473876953, "global_step": 29216, "epoch": 695} {"train_loss": -5.549301624298096, "global_step": 29217, "epoch": 695} {"train_loss": -5.37516975402832, "global_step": 29218, "epoch": 695} {"train_loss": -5.510348796844482, "global_step": 29219, "epoch": 695} {"train_loss": -5.44393253326416, "global_step": 29220, "epoch": 695} {"train_loss": -5.537391185760498, "global_step": 29221, "epoch": 695} {"train_loss": -5.374214172363281, "global_step": 29222, "epoch": 695} {"train_loss": -5.345473289489746, "global_step": 29223, "epoch": 695} {"train_loss": -5.5225324630737305, "global_step": 29224, "epoch": 695} {"train_loss": -5.475183486938477, "global_step": 29225, "epoch": 695} {"train_loss": -5.4330363273620605, "global_step": 29226, "epoch": 695} {"train_loss": -5.547519683837891, "global_step": 29227, "epoch": 695} {"train_loss": -5.441789150238037, "global_step": 29228, "epoch": 695} {"train_loss": -5.512028694152832, "global_step": 29229, "epoch": 695} {"train_loss": -5.449615955352783, "global_step": 29230, "epoch": 695} {"train_loss": -5.458654369626727, "global_step": 29231, "epoch": 695, "val_loss": 67086.21875} {"train_loss": -5.466651916503906, "global_step": 29232, "epoch": 696} {"train_loss": -5.3551483154296875, "global_step": 29233, "epoch": 696} {"train_loss": -5.472553253173828, "global_step": 29234, "epoch": 696} {"train_loss": -5.4718427658081055, "global_step": 29235, "epoch": 696} {"train_loss": -5.310844421386719, "global_step": 29236, "epoch": 696} {"train_loss": -5.599982738494873, "global_step": 29237, "epoch": 696} {"train_loss": -5.457187652587891, "global_step": 29238, "epoch": 696} {"train_loss": -5.475796699523926, "global_step": 29239, "epoch": 696} {"train_loss": -5.614443778991699, "global_step": 29240, "epoch": 696} {"train_loss": -5.489492416381836, "global_step": 29241, "epoch": 696} {"train_loss": -5.350701808929443, "global_step": 29242, "epoch": 696} {"train_loss": -5.4561614990234375, "global_step": 29243, "epoch": 696} {"train_loss": -5.608752250671387, "global_step": 29244, "epoch": 696} {"train_loss": -5.410966396331787, "global_step": 29245, "epoch": 696} {"train_loss": -5.497073650360107, "global_step": 29246, "epoch": 696} {"train_loss": -5.4101152420043945, "global_step": 29247, "epoch": 696} {"train_loss": -5.370560646057129, "global_step": 29248, "epoch": 696} {"train_loss": -5.567904472351074, "global_step": 29249, "epoch": 696} {"train_loss": -5.424696922302246, "global_step": 29250, "epoch": 696} {"train_loss": -5.384951591491699, "global_step": 29251, "epoch": 696} {"train_loss": -5.445496082305908, "global_step": 29252, "epoch": 696} {"train_loss": -5.597734451293945, "global_step": 29253, "epoch": 696} {"train_loss": -5.461262226104736, "global_step": 29254, "epoch": 696} {"train_loss": -5.434272766113281, "global_step": 29255, "epoch": 696} {"train_loss": -5.435630798339844, "global_step": 29256, "epoch": 696} {"train_loss": -5.559781074523926, "global_step": 29257, "epoch": 696} {"train_loss": -5.373569011688232, "global_step": 29258, "epoch": 696} {"train_loss": -5.556771755218506, "global_step": 29259, "epoch": 696} {"train_loss": -5.47118616104126, "global_step": 29260, "epoch": 696} {"train_loss": -5.4834794998168945, "global_step": 29261, "epoch": 696} {"train_loss": -5.314263343811035, "global_step": 29262, "epoch": 696} {"train_loss": -5.582454204559326, "global_step": 29263, "epoch": 696} {"train_loss": -5.347214221954346, "global_step": 29264, "epoch": 696} {"train_loss": -5.374732971191406, "global_step": 29265, "epoch": 696} {"train_loss": -5.454811096191406, "global_step": 29266, "epoch": 696} {"train_loss": -5.384099960327148, "global_step": 29267, "epoch": 696} {"train_loss": -5.49208927154541, "global_step": 29268, "epoch": 696} {"train_loss": -5.537024974822998, "global_step": 29269, "epoch": 696} {"train_loss": -5.419780731201172, "global_step": 29270, "epoch": 696} {"train_loss": -5.561557292938232, "global_step": 29271, "epoch": 696} {"train_loss": -5.364889144897461, "global_step": 29272, "epoch": 696} {"train_loss": -5.460385050092425, "global_step": 29273, "epoch": 696, "val_loss": 67036.046875} {"train_loss": -5.521763801574707, "global_step": 29274, "epoch": 697} {"train_loss": -5.4213104248046875, "global_step": 29275, "epoch": 697} {"train_loss": -5.540045738220215, "global_step": 29276, "epoch": 697} {"train_loss": -5.446731090545654, "global_step": 29277, "epoch": 697} {"train_loss": -5.475165843963623, "global_step": 29278, "epoch": 697} {"train_loss": -5.437188148498535, "global_step": 29279, "epoch": 697} {"train_loss": -5.418710708618164, "global_step": 29280, "epoch": 697} {"train_loss": -5.413583755493164, "global_step": 29281, "epoch": 697} {"train_loss": -5.483144760131836, "global_step": 29282, "epoch": 697} {"train_loss": -5.525306701660156, "global_step": 29283, "epoch": 697} {"train_loss": -5.282166004180908, "global_step": 29284, "epoch": 697} {"train_loss": -5.567997932434082, "global_step": 29285, "epoch": 697} {"train_loss": -5.415984153747559, "global_step": 29286, "epoch": 697} {"train_loss": -5.4230241775512695, "global_step": 29287, "epoch": 697} {"train_loss": -5.4469146728515625, "global_step": 29288, "epoch": 697} {"train_loss": -5.4516825675964355, "global_step": 29289, "epoch": 697} {"train_loss": -5.457765579223633, "global_step": 29290, "epoch": 697} {"train_loss": -5.423978328704834, "global_step": 29291, "epoch": 697} {"train_loss": -5.551755428314209, "global_step": 29292, "epoch": 697} {"train_loss": -5.273138046264648, "global_step": 29293, "epoch": 697} {"train_loss": -5.450252532958984, "global_step": 29294, "epoch": 697} {"train_loss": -5.355229377746582, "global_step": 29295, "epoch": 697} {"train_loss": -5.382092475891113, "global_step": 29296, "epoch": 697} {"train_loss": -5.309133529663086, "global_step": 29297, "epoch": 697} {"train_loss": -5.265782356262207, "global_step": 29298, "epoch": 697} {"train_loss": -5.5168962478637695, "global_step": 29299, "epoch": 697} {"train_loss": -5.4080400466918945, "global_step": 29300, "epoch": 697} {"train_loss": -5.417579174041748, "global_step": 29301, "epoch": 697} {"train_loss": -5.455183982849121, "global_step": 29302, "epoch": 697} {"train_loss": -5.338777542114258, "global_step": 29303, "epoch": 697} {"train_loss": -5.448324680328369, "global_step": 29304, "epoch": 697} {"train_loss": -5.443716049194336, "global_step": 29305, "epoch": 697} {"train_loss": -5.32347297668457, "global_step": 29306, "epoch": 697} {"train_loss": -5.455780029296875, "global_step": 29307, "epoch": 697} {"train_loss": -5.60482931137085, "global_step": 29308, "epoch": 697} {"train_loss": -5.626212120056152, "global_step": 29309, "epoch": 697} {"train_loss": -5.53776741027832, "global_step": 29310, "epoch": 697} {"train_loss": -5.564270496368408, "global_step": 29311, "epoch": 697} {"train_loss": -5.397574424743652, "global_step": 29312, "epoch": 697} {"train_loss": -5.480249404907227, "global_step": 29313, "epoch": 697} {"train_loss": -5.508340358734131, "global_step": 29314, "epoch": 697} {"train_loss": -5.447497799282982, "global_step": 29315, "epoch": 697, "val_loss": 67221.046875} {"train_loss": -5.4867143630981445, "global_step": 29316, "epoch": 698} {"train_loss": -5.481225967407227, "global_step": 29317, "epoch": 698} {"train_loss": -5.396871089935303, "global_step": 29318, "epoch": 698} {"train_loss": -5.475455284118652, "global_step": 29319, "epoch": 698} {"train_loss": -5.4679951667785645, "global_step": 29320, "epoch": 698} {"train_loss": -5.617850303649902, "global_step": 29321, "epoch": 698} {"train_loss": -5.435263633728027, "global_step": 29322, "epoch": 698} {"train_loss": -5.609941005706787, "global_step": 29323, "epoch": 698} {"train_loss": -5.558996677398682, "global_step": 29324, "epoch": 698} {"train_loss": -5.44984245300293, "global_step": 29325, "epoch": 698} {"train_loss": -5.427356243133545, "global_step": 29326, "epoch": 698} {"train_loss": -5.485457897186279, "global_step": 29327, "epoch": 698} {"train_loss": -5.424988746643066, "global_step": 29328, "epoch": 698} {"train_loss": -5.496945381164551, "global_step": 29329, "epoch": 698} {"train_loss": -5.480910301208496, "global_step": 29330, "epoch": 698} {"train_loss": -5.519249439239502, "global_step": 29331, "epoch": 698} {"train_loss": -5.440919876098633, "global_step": 29332, "epoch": 698} {"train_loss": -5.486952781677246, "global_step": 29333, "epoch": 698} {"train_loss": -5.462799549102783, "global_step": 29334, "epoch": 698} {"train_loss": -5.446303367614746, "global_step": 29335, "epoch": 698} {"train_loss": -5.663643836975098, "global_step": 29336, "epoch": 698} {"train_loss": -5.442262649536133, "global_step": 29337, "epoch": 698} {"train_loss": -5.577035903930664, "global_step": 29338, "epoch": 698} {"train_loss": -5.6304402351379395, "global_step": 29339, "epoch": 698} {"train_loss": -5.477801322937012, "global_step": 29340, "epoch": 698} {"train_loss": -5.511771202087402, "global_step": 29341, "epoch": 698} {"train_loss": -5.502384185791016, "global_step": 29342, "epoch": 698} {"train_loss": -5.5764570236206055, "global_step": 29343, "epoch": 698} {"train_loss": -5.28753662109375, "global_step": 29344, "epoch": 698} {"train_loss": -5.547804832458496, "global_step": 29345, "epoch": 698} {"train_loss": -5.556303024291992, "global_step": 29346, "epoch": 698} {"train_loss": -5.319494247436523, "global_step": 29347, "epoch": 698} {"train_loss": -5.385390758514404, "global_step": 29348, "epoch": 698} {"train_loss": -5.625553131103516, "global_step": 29349, "epoch": 698} {"train_loss": -5.37382173538208, "global_step": 29350, "epoch": 698} {"train_loss": -5.473545551300049, "global_step": 29351, "epoch": 698} {"train_loss": -5.345229148864746, "global_step": 29352, "epoch": 698} {"train_loss": -5.540994167327881, "global_step": 29353, "epoch": 698} {"train_loss": -5.492124557495117, "global_step": 29354, "epoch": 698} {"train_loss": -5.428277969360352, "global_step": 29355, "epoch": 698} {"train_loss": -5.294972896575928, "global_step": 29356, "epoch": 698} {"train_loss": -5.484556777136667, "global_step": 29357, "epoch": 698, "val_loss": 67698.6484375} {"train_loss": -5.45231294631958, "global_step": 29358, "epoch": 699} {"train_loss": -5.315145492553711, "global_step": 29359, "epoch": 699} {"train_loss": -5.531493186950684, "global_step": 29360, "epoch": 699} {"train_loss": -5.395550727844238, "global_step": 29361, "epoch": 699} {"train_loss": -5.2219319343566895, "global_step": 29362, "epoch": 699} {"train_loss": -5.574828147888184, "global_step": 29363, "epoch": 699} {"train_loss": -5.373190879821777, "global_step": 29364, "epoch": 699} {"train_loss": -5.488447666168213, "global_step": 29365, "epoch": 699} {"train_loss": -5.707841396331787, "global_step": 29366, "epoch": 699} {"train_loss": -5.376618385314941, "global_step": 29367, "epoch": 699} {"train_loss": -5.432214736938477, "global_step": 29368, "epoch": 699} {"train_loss": -5.4168596267700195, "global_step": 29369, "epoch": 699} {"train_loss": -5.359683990478516, "global_step": 29370, "epoch": 699} {"train_loss": -5.348597526550293, "global_step": 29371, "epoch": 699} {"train_loss": -5.541840553283691, "global_step": 29372, "epoch": 699} {"train_loss": -5.473666191101074, "global_step": 29373, "epoch": 699} {"train_loss": -5.453643798828125, "global_step": 29374, "epoch": 699} {"train_loss": -5.455991744995117, "global_step": 29375, "epoch": 699} {"train_loss": -5.338464736938477, "global_step": 29376, "epoch": 699} {"train_loss": -5.443865776062012, "global_step": 29377, "epoch": 699} {"train_loss": -5.567753791809082, "global_step": 29378, "epoch": 699} {"train_loss": -5.529548645019531, "global_step": 29379, "epoch": 699} {"train_loss": -5.580920219421387, "global_step": 29380, "epoch": 699} {"train_loss": -5.609630107879639, "global_step": 29381, "epoch": 699} {"train_loss": -5.539559841156006, "global_step": 29382, "epoch": 699} {"train_loss": -5.456717491149902, "global_step": 29383, "epoch": 699} {"train_loss": -5.427305221557617, "global_step": 29384, "epoch": 699} {"train_loss": -5.494838714599609, "global_step": 29385, "epoch": 699} {"train_loss": -5.680943012237549, "global_step": 29386, "epoch": 699} {"train_loss": -5.473793983459473, "global_step": 29387, "epoch": 699} {"train_loss": -5.367133140563965, "global_step": 29388, "epoch": 699} {"train_loss": -5.468496322631836, "global_step": 29389, "epoch": 699} {"train_loss": -5.5329389572143555, "global_step": 29390, "epoch": 699} {"train_loss": -5.551025390625, "global_step": 29391, "epoch": 699} {"train_loss": -5.510583877563477, "global_step": 29392, "epoch": 699} {"train_loss": -5.435457706451416, "global_step": 29393, "epoch": 699} {"train_loss": -5.374622821807861, "global_step": 29394, "epoch": 699} {"train_loss": -5.519424915313721, "global_step": 29395, "epoch": 699} {"train_loss": -5.418479919433594, "global_step": 29396, "epoch": 699} {"train_loss": -5.483194828033447, "global_step": 29397, "epoch": 699} {"train_loss": -5.556056022644043, "global_step": 29398, "epoch": 699} {"train_loss": -5.472592331114269, "global_step": 29399, "epoch": 699, "val_loss": 66822.6796875} {"train_loss": -5.532301902770996, "global_step": 29400, "epoch": 700} {"train_loss": -5.423565864562988, "global_step": 29401, "epoch": 700} {"train_loss": -5.446715354919434, "global_step": 29402, "epoch": 700} {"train_loss": -5.486412048339844, "global_step": 29403, "epoch": 700} {"train_loss": -5.530467510223389, "global_step": 29404, "epoch": 700} {"train_loss": -5.4506988525390625, "global_step": 29405, "epoch": 700} {"train_loss": -5.51821231842041, "global_step": 29406, "epoch": 700} {"train_loss": -5.4837141036987305, "global_step": 29407, "epoch": 700} {"train_loss": -5.559062957763672, "global_step": 29408, "epoch": 700} {"train_loss": -5.501643180847168, "global_step": 29409, "epoch": 700} {"train_loss": -5.4149627685546875, "global_step": 29410, "epoch": 700} {"train_loss": -5.388411998748779, "global_step": 29411, "epoch": 700} {"train_loss": -5.519594669342041, "global_step": 29412, "epoch": 700} {"train_loss": -5.455000877380371, "global_step": 29413, "epoch": 700} {"train_loss": -5.522158622741699, "global_step": 29414, "epoch": 700} {"train_loss": -5.584098815917969, "global_step": 29415, "epoch": 700} {"train_loss": -5.522355079650879, "global_step": 29416, "epoch": 700} {"train_loss": -5.572263717651367, "global_step": 29417, "epoch": 700} {"train_loss": -5.479958534240723, "global_step": 29418, "epoch": 700} {"train_loss": -5.442731857299805, "global_step": 29419, "epoch": 700} {"train_loss": -5.522963523864746, "global_step": 29420, "epoch": 700} {"train_loss": -5.379639625549316, "global_step": 29421, "epoch": 700} {"train_loss": -5.328375816345215, "global_step": 29422, "epoch": 700} {"train_loss": -5.548126220703125, "global_step": 29423, "epoch": 700} {"train_loss": -5.4305219650268555, "global_step": 29424, "epoch": 700} {"train_loss": -5.544246673583984, "global_step": 29425, "epoch": 700} {"train_loss": -5.3519792556762695, "global_step": 29426, "epoch": 700} {"train_loss": -5.504711151123047, "global_step": 29427, "epoch": 700} {"train_loss": -5.392318248748779, "global_step": 29428, "epoch": 700} {"train_loss": -5.365625858306885, "global_step": 29429, "epoch": 700} {"train_loss": -5.3773651123046875, "global_step": 29430, "epoch": 700} {"train_loss": -5.466134071350098, "global_step": 29431, "epoch": 700} {"train_loss": -5.532740592956543, "global_step": 29432, "epoch": 700} {"train_loss": -5.4878973960876465, "global_step": 29433, "epoch": 700} {"train_loss": -5.3592753410339355, "global_step": 29434, "epoch": 700} {"train_loss": -5.352100849151611, "global_step": 29435, "epoch": 700} {"train_loss": -5.376816749572754, "global_step": 29436, "epoch": 700} {"train_loss": -5.468533515930176, "global_step": 29437, "epoch": 700} {"train_loss": -5.3840179443359375, "global_step": 29438, "epoch": 700} {"train_loss": -5.558767318725586, "global_step": 29439, "epoch": 700} {"train_loss": -5.441590785980225, "global_step": 29440, "epoch": 700} {"train_loss": -5.465270133245559, "global_step": 29441, "epoch": 700, "train/sim_max_reward_0": 0.9671528971725626, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.6632147476517539, "train/sim_max_reward_3": 0.1684786647170538, "train/sim_max_reward_4": 0.3994127231965418, "train/sim_max_reward_5": 0.5476570281270577, "test/sim_max_reward_4400000": 0.17610382935697763, "test/sim_max_reward_4400001": 0.2906337410282143, "test/sim_max_reward_4400002": 0.3434561376730912, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.5087566436881995, "test/sim_max_reward_4400005": 0.16713048838004904, "test/sim_max_reward_4400006": 0.3381698637137593, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.8986658953090509, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.1651111783899076, "test/sim_max_reward_4400012": 0.35450279674082774, "test/sim_max_reward_4400013": 0.8826058956054756, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.14052195435174683, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.374224851469076, "test/sim_max_reward_4400019": 0.4586347538350885, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.025085055794885142, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 4.1610210036222625e-07, "test/sim_max_reward_4400028": 0.0440868411545048, "test/sim_max_reward_4400029": 0.9262048305959869, "test/sim_max_reward_4400030": 0.650390972431504, "test/sim_max_reward_4400031": 0.6140868301835042, "test/sim_max_reward_4400032": 0.43827528830368856, "test/sim_max_reward_4400033": 0.1388355013391034, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.34382175678134064, "test/sim_max_reward_4400036": 0.460583119843114, "test/sim_max_reward_4400037": 0.2877385239284327, "test/sim_max_reward_4400038": 0.4645039448599121, "test/sim_max_reward_4400039": 0.7242638902591922, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7525910466481539, "test/sim_max_reward_4400042": 0.007227341673994632, "test/sim_max_reward_4400043": 0.4625635381752513, "test/sim_max_reward_4400044": 0.0012902502696087986, "test/sim_max_reward_4400045": 0.7306998562353247, "test/sim_max_reward_4400046": 0.8138136573082528, "test/sim_max_reward_4400047": 0.18000856215466324, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.45776525701446147, "test/mean_score": 0.2858179782735383, "val_loss": 67351.234375} {"train_loss": -5.427119255065918, "global_step": 29442, "epoch": 701} {"train_loss": -5.477668762207031, "global_step": 29443, "epoch": 701} {"train_loss": -5.459657669067383, "global_step": 29444, "epoch": 701} {"train_loss": -5.356624603271484, "global_step": 29445, "epoch": 701} {"train_loss": -5.336666107177734, "global_step": 29446, "epoch": 701} {"train_loss": -5.486323356628418, "global_step": 29447, "epoch": 701} {"train_loss": -5.33250093460083, "global_step": 29448, "epoch": 701} {"train_loss": -5.454700946807861, "global_step": 29449, "epoch": 701} {"train_loss": -5.4223856925964355, "global_step": 29450, "epoch": 701} {"train_loss": -5.486225128173828, "global_step": 29451, "epoch": 701} {"train_loss": -5.494115829467773, "global_step": 29452, "epoch": 701} {"train_loss": -5.476917266845703, "global_step": 29453, "epoch": 701} {"train_loss": -5.447296619415283, "global_step": 29454, "epoch": 701} {"train_loss": -5.40595817565918, "global_step": 29455, "epoch": 701} {"train_loss": -5.494351387023926, "global_step": 29456, "epoch": 701} {"train_loss": -5.2714104652404785, "global_step": 29457, "epoch": 701} {"train_loss": -5.458861827850342, "global_step": 29458, "epoch": 701} {"train_loss": -5.422772407531738, "global_step": 29459, "epoch": 701} {"train_loss": -5.375044345855713, "global_step": 29460, "epoch": 701} {"train_loss": -5.599271774291992, "global_step": 29461, "epoch": 701} {"train_loss": -5.582217216491699, "global_step": 29462, "epoch": 701} {"train_loss": -5.362208366394043, "global_step": 29463, "epoch": 701} {"train_loss": -5.55595588684082, "global_step": 29464, "epoch": 701} {"train_loss": -5.5176849365234375, "global_step": 29465, "epoch": 701} {"train_loss": -5.463796615600586, "global_step": 29466, "epoch": 701} {"train_loss": -5.657166004180908, "global_step": 29467, "epoch": 701} {"train_loss": -5.401925563812256, "global_step": 29468, "epoch": 701} {"train_loss": -5.524929523468018, "global_step": 29469, "epoch": 701} {"train_loss": -5.385427474975586, "global_step": 29470, "epoch": 701} {"train_loss": -5.404182434082031, "global_step": 29471, "epoch": 701} {"train_loss": -5.558206081390381, "global_step": 29472, "epoch": 701} {"train_loss": -5.4681477546691895, "global_step": 29473, "epoch": 701} {"train_loss": -5.545920372009277, "global_step": 29474, "epoch": 701} {"train_loss": -5.412720203399658, "global_step": 29475, "epoch": 701} {"train_loss": -5.308881759643555, "global_step": 29476, "epoch": 701} {"train_loss": -5.391970157623291, "global_step": 29477, "epoch": 701} {"train_loss": -5.475222110748291, "global_step": 29478, "epoch": 701} {"train_loss": -5.373417854309082, "global_step": 29479, "epoch": 701} {"train_loss": -5.485535621643066, "global_step": 29480, "epoch": 701} {"train_loss": -5.416276454925537, "global_step": 29481, "epoch": 701} {"train_loss": -5.4898200035095215, "global_step": 29482, "epoch": 701} {"train_loss": -5.448878787812733, "global_step": 29483, "epoch": 701, "val_loss": 67045.0546875} {"train_loss": -5.3427228927612305, "global_step": 29484, "epoch": 702} {"train_loss": -5.35715389251709, "global_step": 29485, "epoch": 702} {"train_loss": -5.502195358276367, "global_step": 29486, "epoch": 702} {"train_loss": -5.305442810058594, "global_step": 29487, "epoch": 702} {"train_loss": -5.525676727294922, "global_step": 29488, "epoch": 702} {"train_loss": -5.438096523284912, "global_step": 29489, "epoch": 702} {"train_loss": -5.464221477508545, "global_step": 29490, "epoch": 702} {"train_loss": -5.335894584655762, "global_step": 29491, "epoch": 702} {"train_loss": -5.405708312988281, "global_step": 29492, "epoch": 702} {"train_loss": -5.477910995483398, "global_step": 29493, "epoch": 702} {"train_loss": -5.505274772644043, "global_step": 29494, "epoch": 702} {"train_loss": -5.591736316680908, "global_step": 29495, "epoch": 702} {"train_loss": -5.600762367248535, "global_step": 29496, "epoch": 702} {"train_loss": -5.378233432769775, "global_step": 29497, "epoch": 702} {"train_loss": -5.477643966674805, "global_step": 29498, "epoch": 702} {"train_loss": -5.604401588439941, "global_step": 29499, "epoch": 702} {"train_loss": -5.535590171813965, "global_step": 29500, "epoch": 702} {"train_loss": -5.637311935424805, "global_step": 29501, "epoch": 702} {"train_loss": -5.435704231262207, "global_step": 29502, "epoch": 702} {"train_loss": -5.441980361938477, "global_step": 29503, "epoch": 702} {"train_loss": -5.558310508728027, "global_step": 29504, "epoch": 702} {"train_loss": -5.330532073974609, "global_step": 29505, "epoch": 702} {"train_loss": -5.373988151550293, "global_step": 29506, "epoch": 702} {"train_loss": -5.5770792961120605, "global_step": 29507, "epoch": 702} {"train_loss": -5.319708824157715, "global_step": 29508, "epoch": 702} {"train_loss": -5.33025598526001, "global_step": 29509, "epoch": 702} {"train_loss": -5.7026801109313965, "global_step": 29510, "epoch": 702} {"train_loss": -5.542087078094482, "global_step": 29511, "epoch": 702} {"train_loss": -5.351466655731201, "global_step": 29512, "epoch": 702} {"train_loss": -5.588672637939453, "global_step": 29513, "epoch": 702} {"train_loss": -5.386854648590088, "global_step": 29514, "epoch": 702} {"train_loss": -5.424844741821289, "global_step": 29515, "epoch": 702} {"train_loss": -5.526885986328125, "global_step": 29516, "epoch": 702} {"train_loss": -5.30322790145874, "global_step": 29517, "epoch": 702} {"train_loss": -5.406313896179199, "global_step": 29518, "epoch": 702} {"train_loss": -5.463469505310059, "global_step": 29519, "epoch": 702} {"train_loss": -5.54256534576416, "global_step": 29520, "epoch": 702} {"train_loss": -5.446811676025391, "global_step": 29521, "epoch": 702} {"train_loss": -5.384888648986816, "global_step": 29522, "epoch": 702} {"train_loss": -5.475089073181152, "global_step": 29523, "epoch": 702} {"train_loss": -5.502871036529541, "global_step": 29524, "epoch": 702} {"train_loss": -5.462593464624314, "global_step": 29525, "epoch": 702, "val_loss": 66835.8125} {"train_loss": -5.434237957000732, "global_step": 29526, "epoch": 703} {"train_loss": -5.322141647338867, "global_step": 29527, "epoch": 703} {"train_loss": -5.391916751861572, "global_step": 29528, "epoch": 703} {"train_loss": -5.377376556396484, "global_step": 29529, "epoch": 703} {"train_loss": -5.549527168273926, "global_step": 29530, "epoch": 703} {"train_loss": -5.488558769226074, "global_step": 29531, "epoch": 703} {"train_loss": -5.556084632873535, "global_step": 29532, "epoch": 703} {"train_loss": -5.377623558044434, "global_step": 29533, "epoch": 703} {"train_loss": -5.243948936462402, "global_step": 29534, "epoch": 703} {"train_loss": -5.412728309631348, "global_step": 29535, "epoch": 703} {"train_loss": -5.430922031402588, "global_step": 29536, "epoch": 703} {"train_loss": -5.428993225097656, "global_step": 29537, "epoch": 703} {"train_loss": -5.444916725158691, "global_step": 29538, "epoch": 703} {"train_loss": -5.600743293762207, "global_step": 29539, "epoch": 703} {"train_loss": -5.367597579956055, "global_step": 29540, "epoch": 703} {"train_loss": -5.452422142028809, "global_step": 29541, "epoch": 703} {"train_loss": -5.5028910636901855, "global_step": 29542, "epoch": 703} {"train_loss": -5.376039505004883, "global_step": 29543, "epoch": 703} {"train_loss": -5.371127128601074, "global_step": 29544, "epoch": 703} {"train_loss": -5.405721187591553, "global_step": 29545, "epoch": 703} {"train_loss": -5.426305294036865, "global_step": 29546, "epoch": 703} {"train_loss": -5.448247909545898, "global_step": 29547, "epoch": 703} {"train_loss": -5.487359523773193, "global_step": 29548, "epoch": 703} {"train_loss": -5.364292144775391, "global_step": 29549, "epoch": 703} {"train_loss": -5.487119674682617, "global_step": 29550, "epoch": 703} {"train_loss": -5.475162506103516, "global_step": 29551, "epoch": 703} {"train_loss": -5.532366752624512, "global_step": 29552, "epoch": 703} {"train_loss": -5.4649810791015625, "global_step": 29553, "epoch": 703} {"train_loss": -5.580077171325684, "global_step": 29554, "epoch": 703} {"train_loss": -5.471900939941406, "global_step": 29555, "epoch": 703} {"train_loss": -5.505322456359863, "global_step": 29556, "epoch": 703} {"train_loss": -5.330454349517822, "global_step": 29557, "epoch": 703} {"train_loss": -5.441484451293945, "global_step": 29558, "epoch": 703} {"train_loss": -5.545565605163574, "global_step": 29559, "epoch": 703} {"train_loss": -5.493293762207031, "global_step": 29560, "epoch": 703} {"train_loss": -5.363320350646973, "global_step": 29561, "epoch": 703} {"train_loss": -5.6460466384887695, "global_step": 29562, "epoch": 703} {"train_loss": -5.503451347351074, "global_step": 29563, "epoch": 703} {"train_loss": -5.448564052581787, "global_step": 29564, "epoch": 703} {"train_loss": -5.594366073608398, "global_step": 29565, "epoch": 703} {"train_loss": -5.533656120300293, "global_step": 29566, "epoch": 703} {"train_loss": -5.457849457150414, "global_step": 29567, "epoch": 703, "val_loss": 67107.3359375} {"train_loss": -5.361751556396484, "global_step": 29568, "epoch": 704} {"train_loss": -5.467487335205078, "global_step": 29569, "epoch": 704} {"train_loss": -5.510236740112305, "global_step": 29570, "epoch": 704} {"train_loss": -5.384078502655029, "global_step": 29571, "epoch": 704} {"train_loss": -5.297465801239014, "global_step": 29572, "epoch": 704} {"train_loss": -5.636020660400391, "global_step": 29573, "epoch": 704} {"train_loss": -5.679872989654541, "global_step": 29574, "epoch": 704} {"train_loss": -5.592851638793945, "global_step": 29575, "epoch": 704} {"train_loss": -5.483551979064941, "global_step": 29576, "epoch": 704} {"train_loss": -5.371149063110352, "global_step": 29577, "epoch": 704} {"train_loss": -5.492116451263428, "global_step": 29578, "epoch": 704} {"train_loss": -5.501315116882324, "global_step": 29579, "epoch": 704} {"train_loss": -5.399765968322754, "global_step": 29580, "epoch": 704} {"train_loss": -5.546392917633057, "global_step": 29581, "epoch": 704} {"train_loss": -5.297621726989746, "global_step": 29582, "epoch": 704} {"train_loss": -5.348586082458496, "global_step": 29583, "epoch": 704} {"train_loss": -5.407923698425293, "global_step": 29584, "epoch": 704} {"train_loss": -5.452608108520508, "global_step": 29585, "epoch": 704} {"train_loss": -5.554035663604736, "global_step": 29586, "epoch": 704} {"train_loss": -5.496219635009766, "global_step": 29587, "epoch": 704} {"train_loss": -5.483088493347168, "global_step": 29588, "epoch": 704} {"train_loss": -5.564297676086426, "global_step": 29589, "epoch": 704} {"train_loss": -5.429636001586914, "global_step": 29590, "epoch": 704} {"train_loss": -5.456715106964111, "global_step": 29591, "epoch": 704} {"train_loss": -5.590113639831543, "global_step": 29592, "epoch": 704} {"train_loss": -5.478232383728027, "global_step": 29593, "epoch": 704} {"train_loss": -5.415283203125, "global_step": 29594, "epoch": 704} {"train_loss": -5.532424449920654, "global_step": 29595, "epoch": 704} {"train_loss": -5.5329742431640625, "global_step": 29596, "epoch": 704} {"train_loss": -5.428335189819336, "global_step": 29597, "epoch": 704} {"train_loss": -5.620386600494385, "global_step": 29598, "epoch": 704} {"train_loss": -5.471262454986572, "global_step": 29599, "epoch": 704} {"train_loss": -5.524129867553711, "global_step": 29600, "epoch": 704} {"train_loss": -5.544526100158691, "global_step": 29601, "epoch": 704} {"train_loss": -5.474601745605469, "global_step": 29602, "epoch": 704} {"train_loss": -5.506965160369873, "global_step": 29603, "epoch": 704} {"train_loss": -5.424591541290283, "global_step": 29604, "epoch": 704} {"train_loss": -5.471231460571289, "global_step": 29605, "epoch": 704} {"train_loss": -5.350512504577637, "global_step": 29606, "epoch": 704} {"train_loss": -5.572720527648926, "global_step": 29607, "epoch": 704} {"train_loss": -5.567593574523926, "global_step": 29608, "epoch": 704} {"train_loss": -5.481336718513852, "global_step": 29609, "epoch": 704, "val_loss": 67819.640625} {"train_loss": -5.521060943603516, "global_step": 29610, "epoch": 705} {"train_loss": -5.343852996826172, "global_step": 29611, "epoch": 705} {"train_loss": -5.495786190032959, "global_step": 29612, "epoch": 705} {"train_loss": -5.51375675201416, "global_step": 29613, "epoch": 705} {"train_loss": -5.5007004737854, "global_step": 29614, "epoch": 705} {"train_loss": -5.521475315093994, "global_step": 29615, "epoch": 705} {"train_loss": -5.417104244232178, "global_step": 29616, "epoch": 705} {"train_loss": -5.547018051147461, "global_step": 29617, "epoch": 705} {"train_loss": -5.533894062042236, "global_step": 29618, "epoch": 705} {"train_loss": -5.580750942230225, "global_step": 29619, "epoch": 705} {"train_loss": -5.5157647132873535, "global_step": 29620, "epoch": 705} {"train_loss": -5.444540500640869, "global_step": 29621, "epoch": 705} {"train_loss": -5.4621076583862305, "global_step": 29622, "epoch": 705} {"train_loss": -5.232047080993652, "global_step": 29623, "epoch": 705} {"train_loss": -5.496002197265625, "global_step": 29624, "epoch": 705} {"train_loss": -5.503778457641602, "global_step": 29625, "epoch": 705} {"train_loss": -5.544252872467041, "global_step": 29626, "epoch": 705} {"train_loss": -5.467265605926514, "global_step": 29627, "epoch": 705} {"train_loss": -5.494577407836914, "global_step": 29628, "epoch": 705} {"train_loss": -5.33767032623291, "global_step": 29629, "epoch": 705} {"train_loss": -5.485799789428711, "global_step": 29630, "epoch": 705} {"train_loss": -5.490033149719238, "global_step": 29631, "epoch": 705} {"train_loss": -5.265941619873047, "global_step": 29632, "epoch": 705} {"train_loss": -5.40013313293457, "global_step": 29633, "epoch": 705} {"train_loss": -5.376021385192871, "global_step": 29634, "epoch": 705} {"train_loss": -5.5086565017700195, "global_step": 29635, "epoch": 705} {"train_loss": -5.4826178550720215, "global_step": 29636, "epoch": 705} {"train_loss": -5.544897079467773, "global_step": 29637, "epoch": 705} {"train_loss": -5.594961643218994, "global_step": 29638, "epoch": 705} {"train_loss": -5.357363700866699, "global_step": 29639, "epoch": 705} {"train_loss": -5.528064727783203, "global_step": 29640, "epoch": 705} {"train_loss": -5.313137531280518, "global_step": 29641, "epoch": 705} {"train_loss": -5.487800598144531, "global_step": 29642, "epoch": 705} {"train_loss": -5.321441173553467, "global_step": 29643, "epoch": 705} {"train_loss": -5.417349815368652, "global_step": 29644, "epoch": 705} {"train_loss": -5.468731880187988, "global_step": 29645, "epoch": 705} {"train_loss": -5.517378807067871, "global_step": 29646, "epoch": 705} {"train_loss": -5.433717727661133, "global_step": 29647, "epoch": 705} {"train_loss": -5.429931640625, "global_step": 29648, "epoch": 705} {"train_loss": -5.369166851043701, "global_step": 29649, "epoch": 705} {"train_loss": -5.413697719573975, "global_step": 29650, "epoch": 705} {"train_loss": -5.456824177787418, "global_step": 29651, "epoch": 705, "val_loss": 67049.25} {"train_loss": -5.39946985244751, "global_step": 29652, "epoch": 706} {"train_loss": -5.432934761047363, "global_step": 29653, "epoch": 706} {"train_loss": -5.617470741271973, "global_step": 29654, "epoch": 706} {"train_loss": -5.525252342224121, "global_step": 29655, "epoch": 706} {"train_loss": -5.410853862762451, "global_step": 29656, "epoch": 706} {"train_loss": -5.494762420654297, "global_step": 29657, "epoch": 706} {"train_loss": -5.453521728515625, "global_step": 29658, "epoch": 706} {"train_loss": -5.531015872955322, "global_step": 29659, "epoch": 706} {"train_loss": -5.475368499755859, "global_step": 29660, "epoch": 706} {"train_loss": -5.464113235473633, "global_step": 29661, "epoch": 706} {"train_loss": -5.562647819519043, "global_step": 29662, "epoch": 706} {"train_loss": -5.458892345428467, "global_step": 29663, "epoch": 706} {"train_loss": -5.468388557434082, "global_step": 29664, "epoch": 706} {"train_loss": -5.449094772338867, "global_step": 29665, "epoch": 706} {"train_loss": -5.656020641326904, "global_step": 29666, "epoch": 706} {"train_loss": -5.462981224060059, "global_step": 29667, "epoch": 706} {"train_loss": -5.5213117599487305, "global_step": 29668, "epoch": 706} {"train_loss": -5.453044891357422, "global_step": 29669, "epoch": 706} {"train_loss": -5.367692947387695, "global_step": 29670, "epoch": 706} {"train_loss": -5.494182586669922, "global_step": 29671, "epoch": 706} {"train_loss": -5.3891119956970215, "global_step": 29672, "epoch": 706} {"train_loss": -5.362090110778809, "global_step": 29673, "epoch": 706} {"train_loss": -5.515842437744141, "global_step": 29674, "epoch": 706} {"train_loss": -5.425025939941406, "global_step": 29675, "epoch": 706} {"train_loss": -5.470427513122559, "global_step": 29676, "epoch": 706} {"train_loss": -5.510885715484619, "global_step": 29677, "epoch": 706} {"train_loss": -5.516303062438965, "global_step": 29678, "epoch": 706} {"train_loss": -5.426590919494629, "global_step": 29679, "epoch": 706} {"train_loss": -5.490997314453125, "global_step": 29680, "epoch": 706} {"train_loss": -5.551805019378662, "global_step": 29681, "epoch": 706} {"train_loss": -5.396902561187744, "global_step": 29682, "epoch": 706} {"train_loss": -5.613056182861328, "global_step": 29683, "epoch": 706} {"train_loss": -5.493921279907227, "global_step": 29684, "epoch": 706} {"train_loss": -5.465798377990723, "global_step": 29685, "epoch": 706} {"train_loss": -5.450405597686768, "global_step": 29686, "epoch": 706} {"train_loss": -5.410216331481934, "global_step": 29687, "epoch": 706} {"train_loss": -5.521299362182617, "global_step": 29688, "epoch": 706} {"train_loss": -5.454012870788574, "global_step": 29689, "epoch": 706} {"train_loss": -5.468749523162842, "global_step": 29690, "epoch": 706} {"train_loss": -5.476202964782715, "global_step": 29691, "epoch": 706} {"train_loss": -5.6416521072387695, "global_step": 29692, "epoch": 706} {"train_loss": -5.481529871622722, "global_step": 29693, "epoch": 706, "val_loss": 67111.5625} {"train_loss": -5.478927135467529, "global_step": 29694, "epoch": 707} {"train_loss": -5.553891181945801, "global_step": 29695, "epoch": 707} {"train_loss": -5.367696285247803, "global_step": 29696, "epoch": 707} {"train_loss": -5.529833793640137, "global_step": 29697, "epoch": 707} {"train_loss": -5.381320476531982, "global_step": 29698, "epoch": 707} {"train_loss": -5.4672346115112305, "global_step": 29699, "epoch": 707} {"train_loss": -5.47225284576416, "global_step": 29700, "epoch": 707} {"train_loss": -5.516779899597168, "global_step": 29701, "epoch": 707} {"train_loss": -5.497923851013184, "global_step": 29702, "epoch": 707} {"train_loss": -5.503542900085449, "global_step": 29703, "epoch": 707} {"train_loss": -5.556211471557617, "global_step": 29704, "epoch": 707} {"train_loss": -5.535674571990967, "global_step": 29705, "epoch": 707} {"train_loss": -5.277891159057617, "global_step": 29706, "epoch": 707} {"train_loss": -5.425920009613037, "global_step": 29707, "epoch": 707} {"train_loss": -5.442193031311035, "global_step": 29708, "epoch": 707} {"train_loss": -5.402311325073242, "global_step": 29709, "epoch": 707} {"train_loss": -5.526468753814697, "global_step": 29710, "epoch": 707} {"train_loss": -5.535134315490723, "global_step": 29711, "epoch": 707} {"train_loss": -5.373302459716797, "global_step": 29712, "epoch": 707} {"train_loss": -5.407710075378418, "global_step": 29713, "epoch": 707} {"train_loss": -5.4497880935668945, "global_step": 29714, "epoch": 707} {"train_loss": -5.3959059715271, "global_step": 29715, "epoch": 707} {"train_loss": -5.418737411499023, "global_step": 29716, "epoch": 707} {"train_loss": -5.523370742797852, "global_step": 29717, "epoch": 707} {"train_loss": -5.48853874206543, "global_step": 29718, "epoch": 707} {"train_loss": -5.4135212898254395, "global_step": 29719, "epoch": 707} {"train_loss": -5.472308158874512, "global_step": 29720, "epoch": 707} {"train_loss": -5.488275051116943, "global_step": 29721, "epoch": 707} {"train_loss": -5.440406322479248, "global_step": 29722, "epoch": 707} {"train_loss": -5.453402042388916, "global_step": 29723, "epoch": 707} {"train_loss": -5.390471458435059, "global_step": 29724, "epoch": 707} {"train_loss": -5.458333969116211, "global_step": 29725, "epoch": 707} {"train_loss": -5.498549461364746, "global_step": 29726, "epoch": 707} {"train_loss": -5.372357368469238, "global_step": 29727, "epoch": 707} {"train_loss": -5.406400680541992, "global_step": 29728, "epoch": 707} {"train_loss": -5.501101493835449, "global_step": 29729, "epoch": 707} {"train_loss": -5.41363525390625, "global_step": 29730, "epoch": 707} {"train_loss": -5.500141143798828, "global_step": 29731, "epoch": 707} {"train_loss": -5.369431495666504, "global_step": 29732, "epoch": 707} {"train_loss": -5.38482666015625, "global_step": 29733, "epoch": 707} {"train_loss": -5.482303619384766, "global_step": 29734, "epoch": 707} {"train_loss": -5.453467346373058, "global_step": 29735, "epoch": 707, "val_loss": 66900.4140625} {"train_loss": -5.445436477661133, "global_step": 29736, "epoch": 708} {"train_loss": -5.474621772766113, "global_step": 29737, "epoch": 708} {"train_loss": -5.461299896240234, "global_step": 29738, "epoch": 708} {"train_loss": -5.406034469604492, "global_step": 29739, "epoch": 708} {"train_loss": -5.485989570617676, "global_step": 29740, "epoch": 708} {"train_loss": -5.356956481933594, "global_step": 29741, "epoch": 708} {"train_loss": -5.535382270812988, "global_step": 29742, "epoch": 708} {"train_loss": -5.381801605224609, "global_step": 29743, "epoch": 708} {"train_loss": -5.562224864959717, "global_step": 29744, "epoch": 708} {"train_loss": -5.413184642791748, "global_step": 29745, "epoch": 708} {"train_loss": -5.467463493347168, "global_step": 29746, "epoch": 708} {"train_loss": -5.434633731842041, "global_step": 29747, "epoch": 708} {"train_loss": -5.526399612426758, "global_step": 29748, "epoch": 708} {"train_loss": -5.508923530578613, "global_step": 29749, "epoch": 708} {"train_loss": -5.293027877807617, "global_step": 29750, "epoch": 708} {"train_loss": -5.4971771240234375, "global_step": 29751, "epoch": 708} {"train_loss": -5.318017959594727, "global_step": 29752, "epoch": 708} {"train_loss": -5.5272979736328125, "global_step": 29753, "epoch": 708} {"train_loss": -5.3526716232299805, "global_step": 29754, "epoch": 708} {"train_loss": -5.191341400146484, "global_step": 29755, "epoch": 708} {"train_loss": -5.381466865539551, "global_step": 29756, "epoch": 708} {"train_loss": -5.477089881896973, "global_step": 29757, "epoch": 708} {"train_loss": -5.383633613586426, "global_step": 29758, "epoch": 708} {"train_loss": -5.403350353240967, "global_step": 29759, "epoch": 708} {"train_loss": -5.474697589874268, "global_step": 29760, "epoch": 708} {"train_loss": -5.364930152893066, "global_step": 29761, "epoch": 708} {"train_loss": -5.467170715332031, "global_step": 29762, "epoch": 708} {"train_loss": -5.348254203796387, "global_step": 29763, "epoch": 708} {"train_loss": -5.525030136108398, "global_step": 29764, "epoch": 708} {"train_loss": -5.435793399810791, "global_step": 29765, "epoch": 708} {"train_loss": -5.395356178283691, "global_step": 29766, "epoch": 708} {"train_loss": -5.516741752624512, "global_step": 29767, "epoch": 708} {"train_loss": -5.407758712768555, "global_step": 29768, "epoch": 708} {"train_loss": -5.425999641418457, "global_step": 29769, "epoch": 708} {"train_loss": -5.457845687866211, "global_step": 29770, "epoch": 708} {"train_loss": -5.505471229553223, "global_step": 29771, "epoch": 708} {"train_loss": -5.492964744567871, "global_step": 29772, "epoch": 708} {"train_loss": -5.539097785949707, "global_step": 29773, "epoch": 708} {"train_loss": -5.320747375488281, "global_step": 29774, "epoch": 708} {"train_loss": -5.569366931915283, "global_step": 29775, "epoch": 708} {"train_loss": -5.517253398895264, "global_step": 29776, "epoch": 708} {"train_loss": -5.440392278489613, "global_step": 29777, "epoch": 708, "val_loss": 66906.78125} {"train_loss": -5.519609451293945, "global_step": 29778, "epoch": 709} {"train_loss": -5.499354362487793, "global_step": 29779, "epoch": 709} {"train_loss": -5.501278877258301, "global_step": 29780, "epoch": 709} {"train_loss": -5.436753273010254, "global_step": 29781, "epoch": 709} {"train_loss": -5.57503080368042, "global_step": 29782, "epoch": 709} {"train_loss": -5.577591896057129, "global_step": 29783, "epoch": 709} {"train_loss": -5.519379615783691, "global_step": 29784, "epoch": 709} {"train_loss": -5.521662712097168, "global_step": 29785, "epoch": 709} {"train_loss": -5.502462387084961, "global_step": 29786, "epoch": 709} {"train_loss": -5.42086935043335, "global_step": 29787, "epoch": 709} {"train_loss": -5.470462322235107, "global_step": 29788, "epoch": 709} {"train_loss": -5.5325093269348145, "global_step": 29789, "epoch": 709} {"train_loss": -5.499246597290039, "global_step": 29790, "epoch": 709} {"train_loss": -5.493433952331543, "global_step": 29791, "epoch": 709} {"train_loss": -5.452096462249756, "global_step": 29792, "epoch": 709} {"train_loss": -5.536708831787109, "global_step": 29793, "epoch": 709} {"train_loss": -5.461214065551758, "global_step": 29794, "epoch": 709} {"train_loss": -5.36660099029541, "global_step": 29795, "epoch": 709} {"train_loss": -5.430902481079102, "global_step": 29796, "epoch": 709} {"train_loss": -5.629354476928711, "global_step": 29797, "epoch": 709} {"train_loss": -5.18876838684082, "global_step": 29798, "epoch": 709} {"train_loss": -5.3567728996276855, "global_step": 29799, "epoch": 709} {"train_loss": -5.388454437255859, "global_step": 29800, "epoch": 709} {"train_loss": -5.426643371582031, "global_step": 29801, "epoch": 709} {"train_loss": -5.417649745941162, "global_step": 29802, "epoch": 709} {"train_loss": -5.46992826461792, "global_step": 29803, "epoch": 709} {"train_loss": -5.3938493728637695, "global_step": 29804, "epoch": 709} {"train_loss": -5.506339073181152, "global_step": 29805, "epoch": 709} {"train_loss": -5.3623456954956055, "global_step": 29806, "epoch": 709} {"train_loss": -5.485531806945801, "global_step": 29807, "epoch": 709} {"train_loss": -5.534873008728027, "global_step": 29808, "epoch": 709} {"train_loss": -5.519182205200195, "global_step": 29809, "epoch": 709} {"train_loss": -5.383254528045654, "global_step": 29810, "epoch": 709} {"train_loss": -5.54953670501709, "global_step": 29811, "epoch": 709} {"train_loss": -5.525661468505859, "global_step": 29812, "epoch": 709} {"train_loss": -5.55871057510376, "global_step": 29813, "epoch": 709} {"train_loss": -5.51693058013916, "global_step": 29814, "epoch": 709} {"train_loss": -5.492415428161621, "global_step": 29815, "epoch": 709} {"train_loss": -5.615024089813232, "global_step": 29816, "epoch": 709} {"train_loss": -5.485386371612549, "global_step": 29817, "epoch": 709} {"train_loss": -5.489060401916504, "global_step": 29818, "epoch": 709} {"train_loss": -5.4786537147703624, "global_step": 29819, "epoch": 709, "val_loss": 66989.53125} {"train_loss": -5.434587478637695, "global_step": 29820, "epoch": 710} {"train_loss": -5.5708112716674805, "global_step": 29821, "epoch": 710} {"train_loss": -5.472076416015625, "global_step": 29822, "epoch": 710} {"train_loss": -5.382977485656738, "global_step": 29823, "epoch": 710} {"train_loss": -5.492066383361816, "global_step": 29824, "epoch": 710} {"train_loss": -5.466869354248047, "global_step": 29825, "epoch": 710} {"train_loss": -5.416619300842285, "global_step": 29826, "epoch": 710} {"train_loss": -5.401937007904053, "global_step": 29827, "epoch": 710} {"train_loss": -5.550957202911377, "global_step": 29828, "epoch": 710} {"train_loss": -5.618266582489014, "global_step": 29829, "epoch": 710} {"train_loss": -5.611429214477539, "global_step": 29830, "epoch": 710} {"train_loss": -5.570722579956055, "global_step": 29831, "epoch": 710} {"train_loss": -5.4337592124938965, "global_step": 29832, "epoch": 710} {"train_loss": -5.57042121887207, "global_step": 29833, "epoch": 710} {"train_loss": -5.437019348144531, "global_step": 29834, "epoch": 710} {"train_loss": -5.362180233001709, "global_step": 29835, "epoch": 710} {"train_loss": -5.413994789123535, "global_step": 29836, "epoch": 710} {"train_loss": -5.402974605560303, "global_step": 29837, "epoch": 710} {"train_loss": -5.581201553344727, "global_step": 29838, "epoch": 710} {"train_loss": -5.42111873626709, "global_step": 29839, "epoch": 710} {"train_loss": -5.384200572967529, "global_step": 29840, "epoch": 710} {"train_loss": -5.452920436859131, "global_step": 29841, "epoch": 710} {"train_loss": -5.535806655883789, "global_step": 29842, "epoch": 710} {"train_loss": -5.388080596923828, "global_step": 29843, "epoch": 710} {"train_loss": -5.4554643630981445, "global_step": 29844, "epoch": 710} {"train_loss": -5.3436737060546875, "global_step": 29845, "epoch": 710} {"train_loss": -5.588671684265137, "global_step": 29846, "epoch": 710} {"train_loss": -5.4493489265441895, "global_step": 29847, "epoch": 710} {"train_loss": -5.575094223022461, "global_step": 29848, "epoch": 710} {"train_loss": -5.471878528594971, "global_step": 29849, "epoch": 710} {"train_loss": -5.508459568023682, "global_step": 29850, "epoch": 710} {"train_loss": -5.418264865875244, "global_step": 29851, "epoch": 710} {"train_loss": -5.570499420166016, "global_step": 29852, "epoch": 710} {"train_loss": -5.486204147338867, "global_step": 29853, "epoch": 710} {"train_loss": -5.529533386230469, "global_step": 29854, "epoch": 710} {"train_loss": -5.488554954528809, "global_step": 29855, "epoch": 710} {"train_loss": -5.551570892333984, "global_step": 29856, "epoch": 710} {"train_loss": -5.490314960479736, "global_step": 29857, "epoch": 710} {"train_loss": -5.44286584854126, "global_step": 29858, "epoch": 710} {"train_loss": -5.521537780761719, "global_step": 29859, "epoch": 710} {"train_loss": -5.440563201904297, "global_step": 29860, "epoch": 710} {"train_loss": -5.481521129608154, "global_step": 29861, "epoch": 710, "val_loss": 66996.859375} {"train_loss": -5.466164588928223, "global_step": 29862, "epoch": 711} {"train_loss": -5.3311614990234375, "global_step": 29863, "epoch": 711} {"train_loss": -5.510289669036865, "global_step": 29864, "epoch": 711} {"train_loss": -5.479139804840088, "global_step": 29865, "epoch": 711} {"train_loss": -5.411027908325195, "global_step": 29866, "epoch": 711} {"train_loss": -5.522769927978516, "global_step": 29867, "epoch": 711} {"train_loss": -5.474241256713867, "global_step": 29868, "epoch": 711} {"train_loss": -5.6157546043396, "global_step": 29869, "epoch": 711} {"train_loss": -5.512143135070801, "global_step": 29870, "epoch": 711} {"train_loss": -5.478037357330322, "global_step": 29871, "epoch": 711} {"train_loss": -5.478055000305176, "global_step": 29872, "epoch": 711} {"train_loss": -5.4580183029174805, "global_step": 29873, "epoch": 711} {"train_loss": -5.474628925323486, "global_step": 29874, "epoch": 711} {"train_loss": -5.630238056182861, "global_step": 29875, "epoch": 711} {"train_loss": -5.503689289093018, "global_step": 29876, "epoch": 711} {"train_loss": -5.437602996826172, "global_step": 29877, "epoch": 711} {"train_loss": -5.46933650970459, "global_step": 29878, "epoch": 711} {"train_loss": -5.537436485290527, "global_step": 29879, "epoch": 711} {"train_loss": -5.424319744110107, "global_step": 29880, "epoch": 711} {"train_loss": -5.450658798217773, "global_step": 29881, "epoch": 711} {"train_loss": -5.43917989730835, "global_step": 29882, "epoch": 711} {"train_loss": -5.450066566467285, "global_step": 29883, "epoch": 711} {"train_loss": -5.339114665985107, "global_step": 29884, "epoch": 711} {"train_loss": -5.476606845855713, "global_step": 29885, "epoch": 711} {"train_loss": -5.466709136962891, "global_step": 29886, "epoch": 711} {"train_loss": -5.4703264236450195, "global_step": 29887, "epoch": 711} {"train_loss": -5.325387001037598, "global_step": 29888, "epoch": 711} {"train_loss": -5.426871299743652, "global_step": 29889, "epoch": 711} {"train_loss": -5.46237850189209, "global_step": 29890, "epoch": 711} {"train_loss": -5.574848175048828, "global_step": 29891, "epoch": 711} {"train_loss": -5.607875823974609, "global_step": 29892, "epoch": 711} {"train_loss": -5.443117618560791, "global_step": 29893, "epoch": 711} {"train_loss": -5.386622428894043, "global_step": 29894, "epoch": 711} {"train_loss": -5.570278167724609, "global_step": 29895, "epoch": 711} {"train_loss": -5.407231330871582, "global_step": 29896, "epoch": 711} {"train_loss": -5.426285743713379, "global_step": 29897, "epoch": 711} {"train_loss": -5.4591450691223145, "global_step": 29898, "epoch": 711} {"train_loss": -5.579159736633301, "global_step": 29899, "epoch": 711} {"train_loss": -5.370288848876953, "global_step": 29900, "epoch": 711} {"train_loss": -5.411040782928467, "global_step": 29901, "epoch": 711} {"train_loss": -5.4193220138549805, "global_step": 29902, "epoch": 711} {"train_loss": -5.465586832591465, "global_step": 29903, "epoch": 711, "val_loss": 67027.078125} {"train_loss": -5.554746627807617, "global_step": 29904, "epoch": 712} {"train_loss": -5.624180793762207, "global_step": 29905, "epoch": 712} {"train_loss": -5.487805366516113, "global_step": 29906, "epoch": 712} {"train_loss": -5.423601150512695, "global_step": 29907, "epoch": 712} {"train_loss": -5.612491607666016, "global_step": 29908, "epoch": 712} {"train_loss": -5.389397621154785, "global_step": 29909, "epoch": 712} {"train_loss": -5.524258136749268, "global_step": 29910, "epoch": 712} {"train_loss": -5.523221492767334, "global_step": 29911, "epoch": 712} {"train_loss": -5.466556549072266, "global_step": 29912, "epoch": 712} {"train_loss": -5.573128700256348, "global_step": 29913, "epoch": 712} {"train_loss": -5.284408092498779, "global_step": 29914, "epoch": 712} {"train_loss": -5.562425136566162, "global_step": 29915, "epoch": 712} {"train_loss": -5.643307685852051, "global_step": 29916, "epoch": 712} {"train_loss": -5.306401252746582, "global_step": 29917, "epoch": 712} {"train_loss": -5.505221366882324, "global_step": 29918, "epoch": 712} {"train_loss": -5.578603267669678, "global_step": 29919, "epoch": 712} {"train_loss": -5.518385887145996, "global_step": 29920, "epoch": 712} {"train_loss": -5.384929656982422, "global_step": 29921, "epoch": 712} {"train_loss": -5.414118766784668, "global_step": 29922, "epoch": 712} {"train_loss": -5.648237705230713, "global_step": 29923, "epoch": 712} {"train_loss": -5.336199760437012, "global_step": 29924, "epoch": 712} {"train_loss": -5.239200592041016, "global_step": 29925, "epoch": 712} {"train_loss": -5.491951942443848, "global_step": 29926, "epoch": 712} {"train_loss": -5.414356231689453, "global_step": 29927, "epoch": 712} {"train_loss": -5.607187747955322, "global_step": 29928, "epoch": 712} {"train_loss": -5.330125331878662, "global_step": 29929, "epoch": 712} {"train_loss": -5.380518913269043, "global_step": 29930, "epoch": 712} {"train_loss": -5.266468524932861, "global_step": 29931, "epoch": 712} {"train_loss": -5.3530473709106445, "global_step": 29932, "epoch": 712} {"train_loss": -5.444334030151367, "global_step": 29933, "epoch": 712} {"train_loss": -5.441981315612793, "global_step": 29934, "epoch": 712} {"train_loss": -5.461810111999512, "global_step": 29935, "epoch": 712} {"train_loss": -5.541738986968994, "global_step": 29936, "epoch": 712} {"train_loss": -5.479403972625732, "global_step": 29937, "epoch": 712} {"train_loss": -5.41628885269165, "global_step": 29938, "epoch": 712} {"train_loss": -5.332179069519043, "global_step": 29939, "epoch": 712} {"train_loss": -5.501394271850586, "global_step": 29940, "epoch": 712} {"train_loss": -5.510768890380859, "global_step": 29941, "epoch": 712} {"train_loss": -5.359654426574707, "global_step": 29942, "epoch": 712} {"train_loss": -5.645033836364746, "global_step": 29943, "epoch": 712} {"train_loss": -5.273885726928711, "global_step": 29944, "epoch": 712} {"train_loss": -5.45956369808742, "global_step": 29945, "epoch": 712, "val_loss": 67399.6640625} {"train_loss": -5.44802188873291, "global_step": 29946, "epoch": 713} {"train_loss": -5.4627532958984375, "global_step": 29947, "epoch": 713} {"train_loss": -5.418246269226074, "global_step": 29948, "epoch": 713} {"train_loss": -5.464718818664551, "global_step": 29949, "epoch": 713} {"train_loss": -5.500849723815918, "global_step": 29950, "epoch": 713} {"train_loss": -5.5380096435546875, "global_step": 29951, "epoch": 713} {"train_loss": -5.447195053100586, "global_step": 29952, "epoch": 713} {"train_loss": -5.491950988769531, "global_step": 29953, "epoch": 713} {"train_loss": -5.567906379699707, "global_step": 29954, "epoch": 713} {"train_loss": -5.43174934387207, "global_step": 29955, "epoch": 713} {"train_loss": -5.517394065856934, "global_step": 29956, "epoch": 713} {"train_loss": -5.484714031219482, "global_step": 29957, "epoch": 713} {"train_loss": -5.522108554840088, "global_step": 29958, "epoch": 713} {"train_loss": -5.280117988586426, "global_step": 29959, "epoch": 713} {"train_loss": -5.467739105224609, "global_step": 29960, "epoch": 713} {"train_loss": -5.685373306274414, "global_step": 29961, "epoch": 713} {"train_loss": -5.4503278732299805, "global_step": 29962, "epoch": 713} {"train_loss": -5.530216217041016, "global_step": 29963, "epoch": 713} {"train_loss": -5.522735595703125, "global_step": 29964, "epoch": 713} {"train_loss": -5.433887481689453, "global_step": 29965, "epoch": 713} {"train_loss": -5.522365093231201, "global_step": 29966, "epoch": 713} {"train_loss": -5.4262189865112305, "global_step": 29967, "epoch": 713} {"train_loss": -5.615689277648926, "global_step": 29968, "epoch": 713} {"train_loss": -5.475404739379883, "global_step": 29969, "epoch": 713} {"train_loss": -5.485773086547852, "global_step": 29970, "epoch": 713} {"train_loss": -5.446688652038574, "global_step": 29971, "epoch": 713} {"train_loss": -5.42165994644165, "global_step": 29972, "epoch": 713} {"train_loss": -5.617615699768066, "global_step": 29973, "epoch": 713} {"train_loss": -5.329927921295166, "global_step": 29974, "epoch": 713} {"train_loss": -5.460357666015625, "global_step": 29975, "epoch": 713} {"train_loss": -5.5610761642456055, "global_step": 29976, "epoch": 713} {"train_loss": -5.509529113769531, "global_step": 29977, "epoch": 713} {"train_loss": -5.513978958129883, "global_step": 29978, "epoch": 713} {"train_loss": -5.418755054473877, "global_step": 29979, "epoch": 713} {"train_loss": -5.543499946594238, "global_step": 29980, "epoch": 713} {"train_loss": -5.497373580932617, "global_step": 29981, "epoch": 713} {"train_loss": -5.557622909545898, "global_step": 29982, "epoch": 713} {"train_loss": -5.55835485458374, "global_step": 29983, "epoch": 713} {"train_loss": -5.423659324645996, "global_step": 29984, "epoch": 713} {"train_loss": -5.430335521697998, "global_step": 29985, "epoch": 713} {"train_loss": -5.452469825744629, "global_step": 29986, "epoch": 713} {"train_loss": -5.4877553553808305, "global_step": 29987, "epoch": 713, "val_loss": 67137.15625} {"train_loss": -5.574751853942871, "global_step": 29988, "epoch": 714} {"train_loss": -5.434043884277344, "global_step": 29989, "epoch": 714} {"train_loss": -5.487031936645508, "global_step": 29990, "epoch": 714} {"train_loss": -5.454086780548096, "global_step": 29991, "epoch": 714} {"train_loss": -5.446707725524902, "global_step": 29992, "epoch": 714} {"train_loss": -5.495541572570801, "global_step": 29993, "epoch": 714} {"train_loss": -5.569436550140381, "global_step": 29994, "epoch": 714} {"train_loss": -5.540678977966309, "global_step": 29995, "epoch": 714} {"train_loss": -5.438377380371094, "global_step": 29996, "epoch": 714} {"train_loss": -5.527740478515625, "global_step": 29997, "epoch": 714} {"train_loss": -5.531170845031738, "global_step": 29998, "epoch": 714} {"train_loss": -5.487013339996338, "global_step": 29999, "epoch": 714} {"train_loss": -5.4292144775390625, "global_step": 30000, "epoch": 714} {"train_loss": -5.441375732421875, "global_step": 30001, "epoch": 714} {"train_loss": -5.442529201507568, "global_step": 30002, "epoch": 714} {"train_loss": -5.557893753051758, "global_step": 30003, "epoch": 714} {"train_loss": -5.461099624633789, "global_step": 30004, "epoch": 714} {"train_loss": -5.413539886474609, "global_step": 30005, "epoch": 714} {"train_loss": -5.501964092254639, "global_step": 30006, "epoch": 714} {"train_loss": -5.3812432289123535, "global_step": 30007, "epoch": 714} {"train_loss": -5.576163291931152, "global_step": 30008, "epoch": 714} {"train_loss": -5.474504470825195, "global_step": 30009, "epoch": 714} {"train_loss": -5.420051097869873, "global_step": 30010, "epoch": 714} {"train_loss": -5.538731575012207, "global_step": 30011, "epoch": 714} {"train_loss": -5.378033638000488, "global_step": 30012, "epoch": 714} {"train_loss": -5.511803150177002, "global_step": 30013, "epoch": 714} {"train_loss": -5.608223915100098, "global_step": 30014, "epoch": 714} {"train_loss": -5.46137809753418, "global_step": 30015, "epoch": 714} {"train_loss": -5.573382377624512, "global_step": 30016, "epoch": 714} {"train_loss": -5.507242202758789, "global_step": 30017, "epoch": 714} {"train_loss": -5.49779748916626, "global_step": 30018, "epoch": 714} {"train_loss": -5.569470405578613, "global_step": 30019, "epoch": 714} {"train_loss": -5.453481197357178, "global_step": 30020, "epoch": 714} {"train_loss": -5.5211639404296875, "global_step": 30021, "epoch": 714} {"train_loss": -5.403905391693115, "global_step": 30022, "epoch": 714} {"train_loss": -5.4852447509765625, "global_step": 30023, "epoch": 714} {"train_loss": -5.499086856842041, "global_step": 30024, "epoch": 714} {"train_loss": -5.440219402313232, "global_step": 30025, "epoch": 714} {"train_loss": -5.5669779777526855, "global_step": 30026, "epoch": 714} {"train_loss": -5.575131416320801, "global_step": 30027, "epoch": 714} {"train_loss": -5.368961334228516, "global_step": 30028, "epoch": 714} {"train_loss": -5.4904541742234, "global_step": 30029, "epoch": 714, "val_loss": 67422.609375} {"train_loss": -5.374268054962158, "global_step": 30030, "epoch": 715} {"train_loss": -5.556928634643555, "global_step": 30031, "epoch": 715} {"train_loss": -5.422384262084961, "global_step": 30032, "epoch": 715} {"train_loss": -5.563045501708984, "global_step": 30033, "epoch": 715} {"train_loss": -5.643616676330566, "global_step": 30034, "epoch": 715} {"train_loss": -5.599618434906006, "global_step": 30035, "epoch": 715} {"train_loss": -5.627840042114258, "global_step": 30036, "epoch": 715} {"train_loss": -5.486611366271973, "global_step": 30037, "epoch": 715} {"train_loss": -5.640584945678711, "global_step": 30038, "epoch": 715} {"train_loss": -5.618687152862549, "global_step": 30039, "epoch": 715} {"train_loss": -5.429730415344238, "global_step": 30040, "epoch": 715} {"train_loss": -5.427445411682129, "global_step": 30041, "epoch": 715} {"train_loss": -5.448470115661621, "global_step": 30042, "epoch": 715} {"train_loss": -5.518420219421387, "global_step": 30043, "epoch": 715} {"train_loss": -5.507912635803223, "global_step": 30044, "epoch": 715} {"train_loss": -5.553896903991699, "global_step": 30045, "epoch": 715} {"train_loss": -5.43550443649292, "global_step": 30046, "epoch": 715} {"train_loss": -5.496339321136475, "global_step": 30047, "epoch": 715} {"train_loss": -5.530470848083496, "global_step": 30048, "epoch": 715} {"train_loss": -5.511649131774902, "global_step": 30049, "epoch": 715} {"train_loss": -5.4530181884765625, "global_step": 30050, "epoch": 715} {"train_loss": -5.612706184387207, "global_step": 30051, "epoch": 715} {"train_loss": -5.480607986450195, "global_step": 30052, "epoch": 715} {"train_loss": -5.418221950531006, "global_step": 30053, "epoch": 715} {"train_loss": -5.474905014038086, "global_step": 30054, "epoch": 715} {"train_loss": -5.512835502624512, "global_step": 30055, "epoch": 715} {"train_loss": -5.555816650390625, "global_step": 30056, "epoch": 715} {"train_loss": -5.467205047607422, "global_step": 30057, "epoch": 715} {"train_loss": -5.526301383972168, "global_step": 30058, "epoch": 715} {"train_loss": -5.2800984382629395, "global_step": 30059, "epoch": 715} {"train_loss": -5.366279125213623, "global_step": 30060, "epoch": 715} {"train_loss": -5.651705741882324, "global_step": 30061, "epoch": 715} {"train_loss": -5.427485466003418, "global_step": 30062, "epoch": 715} {"train_loss": -5.301473617553711, "global_step": 30063, "epoch": 715} {"train_loss": -5.597936630249023, "global_step": 30064, "epoch": 715} {"train_loss": -5.3154377937316895, "global_step": 30065, "epoch": 715} {"train_loss": -5.476285934448242, "global_step": 30066, "epoch": 715} {"train_loss": -5.560225486755371, "global_step": 30067, "epoch": 715} {"train_loss": -5.156763076782227, "global_step": 30068, "epoch": 715} {"train_loss": -5.532253742218018, "global_step": 30069, "epoch": 715} {"train_loss": -5.336789608001709, "global_step": 30070, "epoch": 715} {"train_loss": -5.477642524810064, "global_step": 30071, "epoch": 715, "val_loss": 67352.171875} {"train_loss": -5.44014310836792, "global_step": 30072, "epoch": 716} {"train_loss": -5.338831424713135, "global_step": 30073, "epoch": 716} {"train_loss": -5.444756507873535, "global_step": 30074, "epoch": 716} {"train_loss": -5.423213958740234, "global_step": 30075, "epoch": 716} {"train_loss": -5.521149158477783, "global_step": 30076, "epoch": 716} {"train_loss": -5.376405715942383, "global_step": 30077, "epoch": 716} {"train_loss": -5.46553373336792, "global_step": 30078, "epoch": 716} {"train_loss": -5.5854291915893555, "global_step": 30079, "epoch": 716} {"train_loss": -5.5176310539245605, "global_step": 30080, "epoch": 716} {"train_loss": -5.4096598625183105, "global_step": 30081, "epoch": 716} {"train_loss": -5.386232376098633, "global_step": 30082, "epoch": 716} {"train_loss": -5.41757869720459, "global_step": 30083, "epoch": 716} {"train_loss": -5.493378162384033, "global_step": 30084, "epoch": 716} {"train_loss": -5.247525691986084, "global_step": 30085, "epoch": 716} {"train_loss": -5.499270439147949, "global_step": 30086, "epoch": 716} {"train_loss": -5.508170127868652, "global_step": 30087, "epoch": 716} {"train_loss": -5.426810264587402, "global_step": 30088, "epoch": 716} {"train_loss": -5.502434730529785, "global_step": 30089, "epoch": 716} {"train_loss": -5.394305229187012, "global_step": 30090, "epoch": 716} {"train_loss": -5.446957111358643, "global_step": 30091, "epoch": 716} {"train_loss": -5.354734420776367, "global_step": 30092, "epoch": 716} {"train_loss": -5.569559574127197, "global_step": 30093, "epoch": 716} {"train_loss": -5.468706130981445, "global_step": 30094, "epoch": 716} {"train_loss": -5.490447044372559, "global_step": 30095, "epoch": 716} {"train_loss": -5.547044277191162, "global_step": 30096, "epoch": 716} {"train_loss": -5.497842311859131, "global_step": 30097, "epoch": 716} {"train_loss": -5.463367938995361, "global_step": 30098, "epoch": 716} {"train_loss": -5.379209518432617, "global_step": 30099, "epoch": 716} {"train_loss": -5.500401496887207, "global_step": 30100, "epoch": 716} {"train_loss": -5.488119125366211, "global_step": 30101, "epoch": 716} {"train_loss": -5.61051082611084, "global_step": 30102, "epoch": 716} {"train_loss": -5.509149551391602, "global_step": 30103, "epoch": 716} {"train_loss": -5.472290992736816, "global_step": 30104, "epoch": 716} {"train_loss": -5.496767520904541, "global_step": 30105, "epoch": 716} {"train_loss": -5.607848644256592, "global_step": 30106, "epoch": 716} {"train_loss": -5.641996383666992, "global_step": 30107, "epoch": 716} {"train_loss": -5.520428657531738, "global_step": 30108, "epoch": 716} {"train_loss": -5.555766582489014, "global_step": 30109, "epoch": 716} {"train_loss": -5.437008857727051, "global_step": 30110, "epoch": 716} {"train_loss": -5.397774696350098, "global_step": 30111, "epoch": 716} {"train_loss": -5.418593883514404, "global_step": 30112, "epoch": 716} {"train_loss": -5.472222214653378, "global_step": 30113, "epoch": 716, "val_loss": 67119.265625} {"train_loss": -5.441919326782227, "global_step": 30114, "epoch": 717} {"train_loss": -5.511172294616699, "global_step": 30115, "epoch": 717} {"train_loss": -5.549479007720947, "global_step": 30116, "epoch": 717} {"train_loss": -5.487325668334961, "global_step": 30117, "epoch": 717} {"train_loss": -5.448081970214844, "global_step": 30118, "epoch": 717} {"train_loss": -5.46274471282959, "global_step": 30119, "epoch": 717} {"train_loss": -5.4940385818481445, "global_step": 30120, "epoch": 717} {"train_loss": -5.4367475509643555, "global_step": 30121, "epoch": 717} {"train_loss": -5.484268665313721, "global_step": 30122, "epoch": 717} {"train_loss": -5.395689010620117, "global_step": 30123, "epoch": 717} {"train_loss": -5.51924991607666, "global_step": 30124, "epoch": 717} {"train_loss": -5.437553405761719, "global_step": 30125, "epoch": 717} {"train_loss": -5.330263137817383, "global_step": 30126, "epoch": 717} {"train_loss": -5.590370178222656, "global_step": 30127, "epoch": 717} {"train_loss": -5.391622543334961, "global_step": 30128, "epoch": 717} {"train_loss": -5.429410457611084, "global_step": 30129, "epoch": 717} {"train_loss": -5.504255294799805, "global_step": 30130, "epoch": 717} {"train_loss": -5.57858943939209, "global_step": 30131, "epoch": 717} {"train_loss": -5.484704971313477, "global_step": 30132, "epoch": 717} {"train_loss": -5.454631328582764, "global_step": 30133, "epoch": 717} {"train_loss": -5.474582672119141, "global_step": 30134, "epoch": 717} {"train_loss": -5.510547637939453, "global_step": 30135, "epoch": 717} {"train_loss": -5.4389848709106445, "global_step": 30136, "epoch": 717} {"train_loss": -5.461236000061035, "global_step": 30137, "epoch": 717} {"train_loss": -5.596673965454102, "global_step": 30138, "epoch": 717} {"train_loss": -5.405087471008301, "global_step": 30139, "epoch": 717} {"train_loss": -5.374203205108643, "global_step": 30140, "epoch": 717} {"train_loss": -5.382428169250488, "global_step": 30141, "epoch": 717} {"train_loss": -5.36208438873291, "global_step": 30142, "epoch": 717} {"train_loss": -5.550029277801514, "global_step": 30143, "epoch": 717} {"train_loss": -5.493311882019043, "global_step": 30144, "epoch": 717} {"train_loss": -5.414211273193359, "global_step": 30145, "epoch": 717} {"train_loss": -5.5651679039001465, "global_step": 30146, "epoch": 717} {"train_loss": -5.452125549316406, "global_step": 30147, "epoch": 717} {"train_loss": -5.471592426300049, "global_step": 30148, "epoch": 717} {"train_loss": -5.499701499938965, "global_step": 30149, "epoch": 717} {"train_loss": -5.319104194641113, "global_step": 30150, "epoch": 717} {"train_loss": -5.503949165344238, "global_step": 30151, "epoch": 717} {"train_loss": -5.485509872436523, "global_step": 30152, "epoch": 717} {"train_loss": -5.557462215423584, "global_step": 30153, "epoch": 717} {"train_loss": -5.367405891418457, "global_step": 30154, "epoch": 717} {"train_loss": -5.470446302777245, "global_step": 30155, "epoch": 717, "val_loss": 67216.515625} {"train_loss": -5.430671691894531, "global_step": 30156, "epoch": 718} {"train_loss": -5.557249069213867, "global_step": 30157, "epoch": 718} {"train_loss": -5.507949352264404, "global_step": 30158, "epoch": 718} {"train_loss": -5.3839240074157715, "global_step": 30159, "epoch": 718} {"train_loss": -5.560507774353027, "global_step": 30160, "epoch": 718} {"train_loss": -5.464468002319336, "global_step": 30161, "epoch": 718} {"train_loss": -5.4930949211120605, "global_step": 30162, "epoch": 718} {"train_loss": -5.451944351196289, "global_step": 30163, "epoch": 718} {"train_loss": -5.349946022033691, "global_step": 30164, "epoch": 718} {"train_loss": -5.405586242675781, "global_step": 30165, "epoch": 718} {"train_loss": -5.281806468963623, "global_step": 30166, "epoch": 718} {"train_loss": -5.435321807861328, "global_step": 30167, "epoch": 718} {"train_loss": -5.4398908615112305, "global_step": 30168, "epoch": 718} {"train_loss": -5.461831092834473, "global_step": 30169, "epoch": 718} {"train_loss": -5.387537002563477, "global_step": 30170, "epoch": 718} {"train_loss": -5.473367691040039, "global_step": 30171, "epoch": 718} {"train_loss": -5.456217288970947, "global_step": 30172, "epoch": 718} {"train_loss": -5.485823631286621, "global_step": 30173, "epoch": 718} {"train_loss": -5.502818584442139, "global_step": 30174, "epoch": 718} {"train_loss": -5.461500644683838, "global_step": 30175, "epoch": 718} {"train_loss": -5.4284772872924805, "global_step": 30176, "epoch": 718} {"train_loss": -5.495997428894043, "global_step": 30177, "epoch": 718} {"train_loss": -5.344034671783447, "global_step": 30178, "epoch": 718} {"train_loss": -5.4580278396606445, "global_step": 30179, "epoch": 718} {"train_loss": -5.589399337768555, "global_step": 30180, "epoch": 718} {"train_loss": -5.489547252655029, "global_step": 30181, "epoch": 718} {"train_loss": -5.506608009338379, "global_step": 30182, "epoch": 718} {"train_loss": -5.549642086029053, "global_step": 30183, "epoch": 718} {"train_loss": -5.452637672424316, "global_step": 30184, "epoch": 718} {"train_loss": -5.583770751953125, "global_step": 30185, "epoch": 718} {"train_loss": -5.40887975692749, "global_step": 30186, "epoch": 718} {"train_loss": -5.533639907836914, "global_step": 30187, "epoch": 718} {"train_loss": -5.445403575897217, "global_step": 30188, "epoch": 718} {"train_loss": -5.551998138427734, "global_step": 30189, "epoch": 718} {"train_loss": -5.374537944793701, "global_step": 30190, "epoch": 718} {"train_loss": -5.5226593017578125, "global_step": 30191, "epoch": 718} {"train_loss": -5.474722862243652, "global_step": 30192, "epoch": 718} {"train_loss": -5.545832633972168, "global_step": 30193, "epoch": 718} {"train_loss": -5.456695556640625, "global_step": 30194, "epoch": 718} {"train_loss": -5.440271377563477, "global_step": 30195, "epoch": 718} {"train_loss": -5.524494171142578, "global_step": 30196, "epoch": 718} {"train_loss": -5.468093656358265, "global_step": 30197, "epoch": 718, "val_loss": 67093.8125} {"train_loss": -5.619372844696045, "global_step": 30198, "epoch": 719} {"train_loss": -5.5186262130737305, "global_step": 30199, "epoch": 719} {"train_loss": -5.481438636779785, "global_step": 30200, "epoch": 719} {"train_loss": -5.568825721740723, "global_step": 30201, "epoch": 719} {"train_loss": -5.567052841186523, "global_step": 30202, "epoch": 719} {"train_loss": -5.580137729644775, "global_step": 30203, "epoch": 719} {"train_loss": -5.482714653015137, "global_step": 30204, "epoch": 719} {"train_loss": -5.5278520584106445, "global_step": 30205, "epoch": 719} {"train_loss": -5.408114433288574, "global_step": 30206, "epoch": 719} {"train_loss": -5.466510772705078, "global_step": 30207, "epoch": 719} {"train_loss": -5.651902198791504, "global_step": 30208, "epoch": 719} {"train_loss": -5.566220283508301, "global_step": 30209, "epoch": 719} {"train_loss": -5.411481857299805, "global_step": 30210, "epoch": 719} {"train_loss": -5.5015950202941895, "global_step": 30211, "epoch": 719} {"train_loss": -5.544774055480957, "global_step": 30212, "epoch": 719} {"train_loss": -5.513680934906006, "global_step": 30213, "epoch": 719} {"train_loss": -5.5033979415893555, "global_step": 30214, "epoch": 719} {"train_loss": -5.532493591308594, "global_step": 30215, "epoch": 719} {"train_loss": -5.538604736328125, "global_step": 30216, "epoch": 719} {"train_loss": -5.534950256347656, "global_step": 30217, "epoch": 719} {"train_loss": -5.491975784301758, "global_step": 30218, "epoch": 719} {"train_loss": -5.50889778137207, "global_step": 30219, "epoch": 719} {"train_loss": -5.529252052307129, "global_step": 30220, "epoch": 719} {"train_loss": -5.316746711730957, "global_step": 30221, "epoch": 719} {"train_loss": -5.328042984008789, "global_step": 30222, "epoch": 719} {"train_loss": -5.4903364181518555, "global_step": 30223, "epoch": 719} {"train_loss": -5.459073543548584, "global_step": 30224, "epoch": 719} {"train_loss": -5.370044231414795, "global_step": 30225, "epoch": 719} {"train_loss": -5.4003825187683105, "global_step": 30226, "epoch": 719} {"train_loss": -5.50272274017334, "global_step": 30227, "epoch": 719} {"train_loss": -5.440983295440674, "global_step": 30228, "epoch": 719} {"train_loss": -5.642909049987793, "global_step": 30229, "epoch": 719} {"train_loss": -5.470112323760986, "global_step": 30230, "epoch": 719} {"train_loss": -5.3891282081604, "global_step": 30231, "epoch": 719} {"train_loss": -5.645776748657227, "global_step": 30232, "epoch": 719} {"train_loss": -5.3669586181640625, "global_step": 30233, "epoch": 719} {"train_loss": -5.339045524597168, "global_step": 30234, "epoch": 719} {"train_loss": -5.415233612060547, "global_step": 30235, "epoch": 719} {"train_loss": -5.2902984619140625, "global_step": 30236, "epoch": 719} {"train_loss": -5.519600868225098, "global_step": 30237, "epoch": 719} {"train_loss": -5.464207649230957, "global_step": 30238, "epoch": 719} {"train_loss": -5.48575530733381, "global_step": 30239, "epoch": 719, "val_loss": 67121.3984375} {"train_loss": -5.350464820861816, "global_step": 30240, "epoch": 720} {"train_loss": -5.527721405029297, "global_step": 30241, "epoch": 720} {"train_loss": -5.5518412590026855, "global_step": 30242, "epoch": 720} {"train_loss": -5.596767902374268, "global_step": 30243, "epoch": 720} {"train_loss": -5.488531112670898, "global_step": 30244, "epoch": 720} {"train_loss": -5.485329627990723, "global_step": 30245, "epoch": 720} {"train_loss": -5.560116767883301, "global_step": 30246, "epoch": 720} {"train_loss": -5.516102313995361, "global_step": 30247, "epoch": 720} {"train_loss": -5.3803181648254395, "global_step": 30248, "epoch": 720} {"train_loss": -5.527981758117676, "global_step": 30249, "epoch": 720} {"train_loss": -5.527707099914551, "global_step": 30250, "epoch": 720} {"train_loss": -5.6280412673950195, "global_step": 30251, "epoch": 720} {"train_loss": -5.457574844360352, "global_step": 30252, "epoch": 720} {"train_loss": -5.583921432495117, "global_step": 30253, "epoch": 720} {"train_loss": -5.395549774169922, "global_step": 30254, "epoch": 720} {"train_loss": -5.57616662979126, "global_step": 30255, "epoch": 720} {"train_loss": -5.557242393493652, "global_step": 30256, "epoch": 720} {"train_loss": -5.522977352142334, "global_step": 30257, "epoch": 720} {"train_loss": -5.520827293395996, "global_step": 30258, "epoch": 720} {"train_loss": -5.417486667633057, "global_step": 30259, "epoch": 720} {"train_loss": -5.532232761383057, "global_step": 30260, "epoch": 720} {"train_loss": -5.394911766052246, "global_step": 30261, "epoch": 720} {"train_loss": -5.599218368530273, "global_step": 30262, "epoch": 720} {"train_loss": -5.346877574920654, "global_step": 30263, "epoch": 720} {"train_loss": -5.478463172912598, "global_step": 30264, "epoch": 720} {"train_loss": -5.315831184387207, "global_step": 30265, "epoch": 720} {"train_loss": -5.468869686126709, "global_step": 30266, "epoch": 720} {"train_loss": -5.540645122528076, "global_step": 30267, "epoch": 720} {"train_loss": -5.377470016479492, "global_step": 30268, "epoch": 720} {"train_loss": -5.417932510375977, "global_step": 30269, "epoch": 720} {"train_loss": -5.422181606292725, "global_step": 30270, "epoch": 720} {"train_loss": -5.459508895874023, "global_step": 30271, "epoch": 720} {"train_loss": -5.448945999145508, "global_step": 30272, "epoch": 720} {"train_loss": -5.57343864440918, "global_step": 30273, "epoch": 720} {"train_loss": -5.509479999542236, "global_step": 30274, "epoch": 720} {"train_loss": -5.396678447723389, "global_step": 30275, "epoch": 720} {"train_loss": -5.51576042175293, "global_step": 30276, "epoch": 720} {"train_loss": -5.509222030639648, "global_step": 30277, "epoch": 720} {"train_loss": -5.489276885986328, "global_step": 30278, "epoch": 720} {"train_loss": -5.552742958068848, "global_step": 30279, "epoch": 720} {"train_loss": -5.501008033752441, "global_step": 30280, "epoch": 720} {"train_loss": -5.488806940260387, "global_step": 30281, "epoch": 720, "val_loss": 66797.796875} {"train_loss": -5.655447006225586, "global_step": 30282, "epoch": 721} {"train_loss": -5.525963306427002, "global_step": 30283, "epoch": 721} {"train_loss": -5.620554447174072, "global_step": 30284, "epoch": 721} {"train_loss": -5.595232009887695, "global_step": 30285, "epoch": 721} {"train_loss": -5.626906871795654, "global_step": 30286, "epoch": 721} {"train_loss": -5.483366012573242, "global_step": 30287, "epoch": 721} {"train_loss": -5.42064094543457, "global_step": 30288, "epoch": 721} {"train_loss": -5.429099082946777, "global_step": 30289, "epoch": 721} {"train_loss": -5.36164665222168, "global_step": 30290, "epoch": 721} {"train_loss": -5.453234672546387, "global_step": 30291, "epoch": 721} {"train_loss": -5.499997138977051, "global_step": 30292, "epoch": 721} {"train_loss": -5.534534931182861, "global_step": 30293, "epoch": 721} {"train_loss": -5.466802597045898, "global_step": 30294, "epoch": 721} {"train_loss": -5.450836181640625, "global_step": 30295, "epoch": 721} {"train_loss": -5.439292907714844, "global_step": 30296, "epoch": 721} {"train_loss": -5.4525604248046875, "global_step": 30297, "epoch": 721} {"train_loss": -5.469938278198242, "global_step": 30298, "epoch": 721} {"train_loss": -5.613766670227051, "global_step": 30299, "epoch": 721} {"train_loss": -5.593005657196045, "global_step": 30300, "epoch": 721} {"train_loss": -5.613136291503906, "global_step": 30301, "epoch": 721} {"train_loss": -5.426495552062988, "global_step": 30302, "epoch": 721} {"train_loss": -5.530525207519531, "global_step": 30303, "epoch": 721} {"train_loss": -5.487288475036621, "global_step": 30304, "epoch": 721} {"train_loss": -5.548111915588379, "global_step": 30305, "epoch": 721} {"train_loss": -5.489705562591553, "global_step": 30306, "epoch": 721} {"train_loss": -5.494957447052002, "global_step": 30307, "epoch": 721} {"train_loss": -5.526656150817871, "global_step": 30308, "epoch": 721} {"train_loss": -5.4884185791015625, "global_step": 30309, "epoch": 721} {"train_loss": -5.494289398193359, "global_step": 30310, "epoch": 721} {"train_loss": -5.52217960357666, "global_step": 30311, "epoch": 721} {"train_loss": -5.525205612182617, "global_step": 30312, "epoch": 721} {"train_loss": -5.579130172729492, "global_step": 30313, "epoch": 721} {"train_loss": -5.4724225997924805, "global_step": 30314, "epoch": 721} {"train_loss": -5.526472568511963, "global_step": 30315, "epoch": 721} {"train_loss": -5.517701625823975, "global_step": 30316, "epoch": 721} {"train_loss": -5.311723709106445, "global_step": 30317, "epoch": 721} {"train_loss": -5.5277252197265625, "global_step": 30318, "epoch": 721} {"train_loss": -5.444364547729492, "global_step": 30319, "epoch": 721} {"train_loss": -5.612072944641113, "global_step": 30320, "epoch": 721} {"train_loss": -5.531472206115723, "global_step": 30321, "epoch": 721} {"train_loss": -5.3928542137146, "global_step": 30322, "epoch": 721} {"train_loss": -5.507002489907401, "global_step": 30323, "epoch": 721, "val_loss": 66607.8984375} {"train_loss": -5.624454021453857, "global_step": 30324, "epoch": 722} {"train_loss": -5.354980945587158, "global_step": 30325, "epoch": 722} {"train_loss": -5.48447847366333, "global_step": 30326, "epoch": 722} {"train_loss": -5.545914649963379, "global_step": 30327, "epoch": 722} {"train_loss": -5.4429521560668945, "global_step": 30328, "epoch": 722} {"train_loss": -5.446009159088135, "global_step": 30329, "epoch": 722} {"train_loss": -5.515658378601074, "global_step": 30330, "epoch": 722} {"train_loss": -5.354936599731445, "global_step": 30331, "epoch": 722} {"train_loss": -5.4161763191223145, "global_step": 30332, "epoch": 722} {"train_loss": -5.524395942687988, "global_step": 30333, "epoch": 722} {"train_loss": -5.421869277954102, "global_step": 30334, "epoch": 722} {"train_loss": -5.527630805969238, "global_step": 30335, "epoch": 722} {"train_loss": -5.4718427658081055, "global_step": 30336, "epoch": 722} {"train_loss": -5.458331108093262, "global_step": 30337, "epoch": 722} {"train_loss": -5.449287414550781, "global_step": 30338, "epoch": 722} {"train_loss": -5.432218074798584, "global_step": 30339, "epoch": 722} {"train_loss": -5.4783172607421875, "global_step": 30340, "epoch": 722} {"train_loss": -5.597925186157227, "global_step": 30341, "epoch": 722} {"train_loss": -5.514404296875, "global_step": 30342, "epoch": 722} {"train_loss": -5.57831335067749, "global_step": 30343, "epoch": 722} {"train_loss": -5.442368030548096, "global_step": 30344, "epoch": 722} {"train_loss": -5.5394511222839355, "global_step": 30345, "epoch": 722} {"train_loss": -5.4010539054870605, "global_step": 30346, "epoch": 722} {"train_loss": -5.564763069152832, "global_step": 30347, "epoch": 722} {"train_loss": -5.467679500579834, "global_step": 30348, "epoch": 722} {"train_loss": -5.392902851104736, "global_step": 30349, "epoch": 722} {"train_loss": -5.586475372314453, "global_step": 30350, "epoch": 722} {"train_loss": -5.564877510070801, "global_step": 30351, "epoch": 722} {"train_loss": -5.383565902709961, "global_step": 30352, "epoch": 722} {"train_loss": -5.492173671722412, "global_step": 30353, "epoch": 722} {"train_loss": -5.549437522888184, "global_step": 30354, "epoch": 722} {"train_loss": -5.445860862731934, "global_step": 30355, "epoch": 722} {"train_loss": -5.346090793609619, "global_step": 30356, "epoch": 722} {"train_loss": -5.469475269317627, "global_step": 30357, "epoch": 722} {"train_loss": -5.530518531799316, "global_step": 30358, "epoch": 722} {"train_loss": -5.521422386169434, "global_step": 30359, "epoch": 722} {"train_loss": -5.521000385284424, "global_step": 30360, "epoch": 722} {"train_loss": -5.503582954406738, "global_step": 30361, "epoch": 722} {"train_loss": -5.480080604553223, "global_step": 30362, "epoch": 722} {"train_loss": -5.623381614685059, "global_step": 30363, "epoch": 722} {"train_loss": -5.505899906158447, "global_step": 30364, "epoch": 722} {"train_loss": -5.489063262939453, "global_step": 30365, "epoch": 722, "val_loss": 66964.1484375} {"train_loss": -5.450549602508545, "global_step": 30366, "epoch": 723} {"train_loss": -5.42458438873291, "global_step": 30367, "epoch": 723} {"train_loss": -5.478578567504883, "global_step": 30368, "epoch": 723} {"train_loss": -5.4335222244262695, "global_step": 30369, "epoch": 723} {"train_loss": -5.427128314971924, "global_step": 30370, "epoch": 723} {"train_loss": -5.488974571228027, "global_step": 30371, "epoch": 723} {"train_loss": -5.599211692810059, "global_step": 30372, "epoch": 723} {"train_loss": -5.635530471801758, "global_step": 30373, "epoch": 723} {"train_loss": -5.552162170410156, "global_step": 30374, "epoch": 723} {"train_loss": -5.427607536315918, "global_step": 30375, "epoch": 723} {"train_loss": -5.651213645935059, "global_step": 30376, "epoch": 723} {"train_loss": -5.570262908935547, "global_step": 30377, "epoch": 723} {"train_loss": -5.580923080444336, "global_step": 30378, "epoch": 723} {"train_loss": -5.503380298614502, "global_step": 30379, "epoch": 723} {"train_loss": -5.444238662719727, "global_step": 30380, "epoch": 723} {"train_loss": -5.355617046356201, "global_step": 30381, "epoch": 723} {"train_loss": -5.409467697143555, "global_step": 30382, "epoch": 723} {"train_loss": -5.5089006423950195, "global_step": 30383, "epoch": 723} {"train_loss": -5.5003767013549805, "global_step": 30384, "epoch": 723} {"train_loss": -5.411156177520752, "global_step": 30385, "epoch": 723} {"train_loss": -5.467037200927734, "global_step": 30386, "epoch": 723} {"train_loss": -5.4856462478637695, "global_step": 30387, "epoch": 723} {"train_loss": -5.449585914611816, "global_step": 30388, "epoch": 723} {"train_loss": -5.358870983123779, "global_step": 30389, "epoch": 723} {"train_loss": -5.471070766448975, "global_step": 30390, "epoch": 723} {"train_loss": -5.559993267059326, "global_step": 30391, "epoch": 723} {"train_loss": -5.472624778747559, "global_step": 30392, "epoch": 723} {"train_loss": -5.3420209884643555, "global_step": 30393, "epoch": 723} {"train_loss": -5.4921770095825195, "global_step": 30394, "epoch": 723} {"train_loss": -5.610762596130371, "global_step": 30395, "epoch": 723} {"train_loss": -5.421480655670166, "global_step": 30396, "epoch": 723} {"train_loss": -5.504227161407471, "global_step": 30397, "epoch": 723} {"train_loss": -5.481006622314453, "global_step": 30398, "epoch": 723} {"train_loss": -5.450791358947754, "global_step": 30399, "epoch": 723} {"train_loss": -5.421428203582764, "global_step": 30400, "epoch": 723} {"train_loss": -5.599401473999023, "global_step": 30401, "epoch": 723} {"train_loss": -5.494487762451172, "global_step": 30402, "epoch": 723} {"train_loss": -5.333700180053711, "global_step": 30403, "epoch": 723} {"train_loss": -5.377777576446533, "global_step": 30404, "epoch": 723} {"train_loss": -5.478021621704102, "global_step": 30405, "epoch": 723} {"train_loss": -5.476332664489746, "global_step": 30406, "epoch": 723} {"train_loss": -5.476912441707793, "global_step": 30407, "epoch": 723, "val_loss": 68070.4375} {"train_loss": -5.344964504241943, "global_step": 30408, "epoch": 724} {"train_loss": -5.382325172424316, "global_step": 30409, "epoch": 724} {"train_loss": -5.627571105957031, "global_step": 30410, "epoch": 724} {"train_loss": -5.476614952087402, "global_step": 30411, "epoch": 724} {"train_loss": -5.505016326904297, "global_step": 30412, "epoch": 724} {"train_loss": -5.509356498718262, "global_step": 30413, "epoch": 724} {"train_loss": -5.483310699462891, "global_step": 30414, "epoch": 724} {"train_loss": -5.470325469970703, "global_step": 30415, "epoch": 724} {"train_loss": -5.481138229370117, "global_step": 30416, "epoch": 724} {"train_loss": -5.599748611450195, "global_step": 30417, "epoch": 724} {"train_loss": -5.62729549407959, "global_step": 30418, "epoch": 724} {"train_loss": -5.4280900955200195, "global_step": 30419, "epoch": 724} {"train_loss": -5.296283721923828, "global_step": 30420, "epoch": 724} {"train_loss": -5.511627197265625, "global_step": 30421, "epoch": 724} {"train_loss": -5.400865077972412, "global_step": 30422, "epoch": 724} {"train_loss": -5.4460673332214355, "global_step": 30423, "epoch": 724} {"train_loss": -5.4256157875061035, "global_step": 30424, "epoch": 724} {"train_loss": -5.467948913574219, "global_step": 30425, "epoch": 724} {"train_loss": -5.5143232345581055, "global_step": 30426, "epoch": 724} {"train_loss": -5.601109504699707, "global_step": 30427, "epoch": 724} {"train_loss": -5.480580806732178, "global_step": 30428, "epoch": 724} {"train_loss": -5.259220600128174, "global_step": 30429, "epoch": 724} {"train_loss": -5.431395530700684, "global_step": 30430, "epoch": 724} {"train_loss": -5.450148105621338, "global_step": 30431, "epoch": 724} {"train_loss": -5.366840839385986, "global_step": 30432, "epoch": 724} {"train_loss": -5.369157791137695, "global_step": 30433, "epoch": 724} {"train_loss": -5.371896743774414, "global_step": 30434, "epoch": 724} {"train_loss": -5.526673316955566, "global_step": 30435, "epoch": 724} {"train_loss": -5.330525875091553, "global_step": 30436, "epoch": 724} {"train_loss": -5.5443010330200195, "global_step": 30437, "epoch": 724} {"train_loss": -5.458805084228516, "global_step": 30438, "epoch": 724} {"train_loss": -5.502510070800781, "global_step": 30439, "epoch": 724} {"train_loss": -5.3086371421813965, "global_step": 30440, "epoch": 724} {"train_loss": -5.431794166564941, "global_step": 30441, "epoch": 724} {"train_loss": -5.506909370422363, "global_step": 30442, "epoch": 724} {"train_loss": -5.410647869110107, "global_step": 30443, "epoch": 724} {"train_loss": -5.392336845397949, "global_step": 30444, "epoch": 724} {"train_loss": -5.295945167541504, "global_step": 30445, "epoch": 724} {"train_loss": -5.424820899963379, "global_step": 30446, "epoch": 724} {"train_loss": -5.45250129699707, "global_step": 30447, "epoch": 724} {"train_loss": -5.418140411376953, "global_step": 30448, "epoch": 724} {"train_loss": -5.448699485687983, "global_step": 30449, "epoch": 724, "val_loss": 67007.671875} {"train_loss": -5.490257263183594, "global_step": 30450, "epoch": 725} {"train_loss": -5.57967472076416, "global_step": 30451, "epoch": 725} {"train_loss": -5.4261274337768555, "global_step": 30452, "epoch": 725} {"train_loss": -5.447903633117676, "global_step": 30453, "epoch": 725} {"train_loss": -5.534232139587402, "global_step": 30454, "epoch": 725} {"train_loss": -5.544475078582764, "global_step": 30455, "epoch": 725} {"train_loss": -5.5666351318359375, "global_step": 30456, "epoch": 725} {"train_loss": -5.452740669250488, "global_step": 30457, "epoch": 725} {"train_loss": -5.539427757263184, "global_step": 30458, "epoch": 725} {"train_loss": -5.3801703453063965, "global_step": 30459, "epoch": 725} {"train_loss": -5.361998081207275, "global_step": 30460, "epoch": 725} {"train_loss": -5.425452709197998, "global_step": 30461, "epoch": 725} {"train_loss": -5.4153947830200195, "global_step": 30462, "epoch": 725} {"train_loss": -5.471714973449707, "global_step": 30463, "epoch": 725} {"train_loss": -5.49912166595459, "global_step": 30464, "epoch": 725} {"train_loss": -5.627354621887207, "global_step": 30465, "epoch": 725} {"train_loss": -5.287012577056885, "global_step": 30466, "epoch": 725} {"train_loss": -5.448349952697754, "global_step": 30467, "epoch": 725} {"train_loss": -5.446049690246582, "global_step": 30468, "epoch": 725} {"train_loss": -5.442998886108398, "global_step": 30469, "epoch": 725} {"train_loss": -5.593764305114746, "global_step": 30470, "epoch": 725} {"train_loss": -5.462880611419678, "global_step": 30471, "epoch": 725} {"train_loss": -5.408679008483887, "global_step": 30472, "epoch": 725} {"train_loss": -5.50373649597168, "global_step": 30473, "epoch": 725} {"train_loss": -5.406671524047852, "global_step": 30474, "epoch": 725} {"train_loss": -5.356528282165527, "global_step": 30475, "epoch": 725} {"train_loss": -5.398463249206543, "global_step": 30476, "epoch": 725} {"train_loss": -5.577298641204834, "global_step": 30477, "epoch": 725} {"train_loss": -5.45269775390625, "global_step": 30478, "epoch": 725} {"train_loss": -5.53606653213501, "global_step": 30479, "epoch": 725} {"train_loss": -5.451826095581055, "global_step": 30480, "epoch": 725} {"train_loss": -5.529669761657715, "global_step": 30481, "epoch": 725} {"train_loss": -5.502533912658691, "global_step": 30482, "epoch": 725} {"train_loss": -5.50874137878418, "global_step": 30483, "epoch": 725} {"train_loss": -5.569684028625488, "global_step": 30484, "epoch": 725} {"train_loss": -5.58895206451416, "global_step": 30485, "epoch": 725} {"train_loss": -5.375247001647949, "global_step": 30486, "epoch": 725} {"train_loss": -5.395807266235352, "global_step": 30487, "epoch": 725} {"train_loss": -5.614625930786133, "global_step": 30488, "epoch": 725} {"train_loss": -5.55122184753418, "global_step": 30489, "epoch": 725} {"train_loss": -5.398964881896973, "global_step": 30490, "epoch": 725} {"train_loss": -5.476597944895427, "global_step": 30491, "epoch": 725, "val_loss": 66854.515625} {"train_loss": -5.5156450271606445, "global_step": 30492, "epoch": 726} {"train_loss": -5.394587516784668, "global_step": 30493, "epoch": 726} {"train_loss": -5.3699774742126465, "global_step": 30494, "epoch": 726} {"train_loss": -5.516902923583984, "global_step": 30495, "epoch": 726} {"train_loss": -5.550182819366455, "global_step": 30496, "epoch": 726} {"train_loss": -5.480740070343018, "global_step": 30497, "epoch": 726} {"train_loss": -5.692504405975342, "global_step": 30498, "epoch": 726} {"train_loss": -5.497416973114014, "global_step": 30499, "epoch": 726} {"train_loss": -5.483158111572266, "global_step": 30500, "epoch": 726} {"train_loss": -5.42330265045166, "global_step": 30501, "epoch": 726} {"train_loss": -5.410917282104492, "global_step": 30502, "epoch": 726} {"train_loss": -5.404409885406494, "global_step": 30503, "epoch": 726} {"train_loss": -5.435617446899414, "global_step": 30504, "epoch": 726} {"train_loss": -5.492250442504883, "global_step": 30505, "epoch": 726} {"train_loss": -5.635056972503662, "global_step": 30506, "epoch": 726} {"train_loss": -5.6171793937683105, "global_step": 30507, "epoch": 726} {"train_loss": -5.5208611488342285, "global_step": 30508, "epoch": 726} {"train_loss": -5.5140156745910645, "global_step": 30509, "epoch": 726} {"train_loss": -5.554989337921143, "global_step": 30510, "epoch": 726} {"train_loss": -5.624495506286621, "global_step": 30511, "epoch": 726} {"train_loss": -5.351151466369629, "global_step": 30512, "epoch": 726} {"train_loss": -5.422883987426758, "global_step": 30513, "epoch": 726} {"train_loss": -5.517579078674316, "global_step": 30514, "epoch": 726} {"train_loss": -5.491001129150391, "global_step": 30515, "epoch": 726} {"train_loss": -5.554320335388184, "global_step": 30516, "epoch": 726} {"train_loss": -5.4133076667785645, "global_step": 30517, "epoch": 726} {"train_loss": -5.527116298675537, "global_step": 30518, "epoch": 726} {"train_loss": -5.4952073097229, "global_step": 30519, "epoch": 726} {"train_loss": -5.441027641296387, "global_step": 30520, "epoch": 726} {"train_loss": -5.605051040649414, "global_step": 30521, "epoch": 726} {"train_loss": -5.338502407073975, "global_step": 30522, "epoch": 726} {"train_loss": -5.46153450012207, "global_step": 30523, "epoch": 726} {"train_loss": -5.448451995849609, "global_step": 30524, "epoch": 726} {"train_loss": -5.4311017990112305, "global_step": 30525, "epoch": 726} {"train_loss": -5.469540596008301, "global_step": 30526, "epoch": 726} {"train_loss": -5.500669479370117, "global_step": 30527, "epoch": 726} {"train_loss": -5.64887809753418, "global_step": 30528, "epoch": 726} {"train_loss": -5.540554046630859, "global_step": 30529, "epoch": 726} {"train_loss": -5.498849391937256, "global_step": 30530, "epoch": 726} {"train_loss": -5.52428674697876, "global_step": 30531, "epoch": 726} {"train_loss": -5.520411491394043, "global_step": 30532, "epoch": 726} {"train_loss": -5.495821634928386, "global_step": 30533, "epoch": 726, "val_loss": 66574.875} {"train_loss": -5.494672775268555, "global_step": 30534, "epoch": 727} {"train_loss": -5.446883201599121, "global_step": 30535, "epoch": 727} {"train_loss": -5.566009521484375, "global_step": 30536, "epoch": 727} {"train_loss": -5.618247032165527, "global_step": 30537, "epoch": 727} {"train_loss": -5.436440467834473, "global_step": 30538, "epoch": 727} {"train_loss": -5.5387091636657715, "global_step": 30539, "epoch": 727} {"train_loss": -5.536111831665039, "global_step": 30540, "epoch": 727} {"train_loss": -5.446418285369873, "global_step": 30541, "epoch": 727} {"train_loss": -5.550412654876709, "global_step": 30542, "epoch": 727} {"train_loss": -5.58713436126709, "global_step": 30543, "epoch": 727} {"train_loss": -5.393943786621094, "global_step": 30544, "epoch": 727} {"train_loss": -5.534714698791504, "global_step": 30545, "epoch": 727} {"train_loss": -5.598272323608398, "global_step": 30546, "epoch": 727} {"train_loss": -5.420346260070801, "global_step": 30547, "epoch": 727} {"train_loss": -5.550942420959473, "global_step": 30548, "epoch": 727} {"train_loss": -5.575942039489746, "global_step": 30549, "epoch": 727} {"train_loss": -5.538329124450684, "global_step": 30550, "epoch": 727} {"train_loss": -5.413474082946777, "global_step": 30551, "epoch": 727} {"train_loss": -5.646703243255615, "global_step": 30552, "epoch": 727} {"train_loss": -5.475495338439941, "global_step": 30553, "epoch": 727} {"train_loss": -5.3752641677856445, "global_step": 30554, "epoch": 727} {"train_loss": -5.425539016723633, "global_step": 30555, "epoch": 727} {"train_loss": -5.476848602294922, "global_step": 30556, "epoch": 727} {"train_loss": -5.571737289428711, "global_step": 30557, "epoch": 727} {"train_loss": -5.253752708435059, "global_step": 30558, "epoch": 727} {"train_loss": -5.466015815734863, "global_step": 30559, "epoch": 727} {"train_loss": -5.547811508178711, "global_step": 30560, "epoch": 727} {"train_loss": -5.543623924255371, "global_step": 30561, "epoch": 727} {"train_loss": -5.499638080596924, "global_step": 30562, "epoch": 727} {"train_loss": -5.3293070793151855, "global_step": 30563, "epoch": 727} {"train_loss": -5.433974266052246, "global_step": 30564, "epoch": 727} {"train_loss": -5.344360828399658, "global_step": 30565, "epoch": 727} {"train_loss": -5.436971664428711, "global_step": 30566, "epoch": 727} {"train_loss": -5.29209041595459, "global_step": 30567, "epoch": 727} {"train_loss": -5.324840545654297, "global_step": 30568, "epoch": 727} {"train_loss": -5.529598712921143, "global_step": 30569, "epoch": 727} {"train_loss": -5.426613807678223, "global_step": 30570, "epoch": 727} {"train_loss": -5.670919418334961, "global_step": 30571, "epoch": 727} {"train_loss": -5.507894515991211, "global_step": 30572, "epoch": 727} {"train_loss": -5.404120445251465, "global_step": 30573, "epoch": 727} {"train_loss": -5.4155168533325195, "global_step": 30574, "epoch": 727} {"train_loss": -5.4770021211533315, "global_step": 30575, "epoch": 727, "val_loss": 67060.46875} {"train_loss": -5.5394182205200195, "global_step": 30576, "epoch": 728} {"train_loss": -5.412256240844727, "global_step": 30577, "epoch": 728} {"train_loss": -5.502251148223877, "global_step": 30578, "epoch": 728} {"train_loss": -5.568964004516602, "global_step": 30579, "epoch": 728} {"train_loss": -5.440512657165527, "global_step": 30580, "epoch": 728} {"train_loss": -5.550999641418457, "global_step": 30581, "epoch": 728} {"train_loss": -5.5194196701049805, "global_step": 30582, "epoch": 728} {"train_loss": -5.503701210021973, "global_step": 30583, "epoch": 728} {"train_loss": -5.563002586364746, "global_step": 30584, "epoch": 728} {"train_loss": -5.466461658477783, "global_step": 30585, "epoch": 728} {"train_loss": -5.5805344581604, "global_step": 30586, "epoch": 728} {"train_loss": -5.416708946228027, "global_step": 30587, "epoch": 728} {"train_loss": -5.437819480895996, "global_step": 30588, "epoch": 728} {"train_loss": -5.568759918212891, "global_step": 30589, "epoch": 728} {"train_loss": -5.33347225189209, "global_step": 30590, "epoch": 728} {"train_loss": -5.485480308532715, "global_step": 30591, "epoch": 728} {"train_loss": -5.358201026916504, "global_step": 30592, "epoch": 728} {"train_loss": -5.467812538146973, "global_step": 30593, "epoch": 728} {"train_loss": -5.456059455871582, "global_step": 30594, "epoch": 728} {"train_loss": -5.404977321624756, "global_step": 30595, "epoch": 728} {"train_loss": -5.55574893951416, "global_step": 30596, "epoch": 728} {"train_loss": -5.397556304931641, "global_step": 30597, "epoch": 728} {"train_loss": -5.490682125091553, "global_step": 30598, "epoch": 728} {"train_loss": -5.417728424072266, "global_step": 30599, "epoch": 728} {"train_loss": -5.447291374206543, "global_step": 30600, "epoch": 728} {"train_loss": -5.5512542724609375, "global_step": 30601, "epoch": 728} {"train_loss": -5.41378116607666, "global_step": 30602, "epoch": 728} {"train_loss": -5.359613418579102, "global_step": 30603, "epoch": 728} {"train_loss": -5.590909004211426, "global_step": 30604, "epoch": 728} {"train_loss": -5.485037326812744, "global_step": 30605, "epoch": 728} {"train_loss": -5.538211345672607, "global_step": 30606, "epoch": 728} {"train_loss": -5.360626220703125, "global_step": 30607, "epoch": 728} {"train_loss": -5.387698173522949, "global_step": 30608, "epoch": 728} {"train_loss": -5.551408290863037, "global_step": 30609, "epoch": 728} {"train_loss": -5.480037689208984, "global_step": 30610, "epoch": 728} {"train_loss": -5.449498176574707, "global_step": 30611, "epoch": 728} {"train_loss": -5.5262298583984375, "global_step": 30612, "epoch": 728} {"train_loss": -5.485112190246582, "global_step": 30613, "epoch": 728} {"train_loss": -5.549333572387695, "global_step": 30614, "epoch": 728} {"train_loss": -5.462759971618652, "global_step": 30615, "epoch": 728} {"train_loss": -5.458086013793945, "global_step": 30616, "epoch": 728} {"train_loss": -5.4763023853302, "global_step": 30617, "epoch": 728, "val_loss": 67044.3125} {"train_loss": -5.543863296508789, "global_step": 30618, "epoch": 729} {"train_loss": -5.558483123779297, "global_step": 30619, "epoch": 729} {"train_loss": -5.489651679992676, "global_step": 30620, "epoch": 729} {"train_loss": -5.366774559020996, "global_step": 30621, "epoch": 729} {"train_loss": -5.6226396560668945, "global_step": 30622, "epoch": 729} {"train_loss": -5.431848526000977, "global_step": 30623, "epoch": 729} {"train_loss": -5.476073265075684, "global_step": 30624, "epoch": 729} {"train_loss": -5.446538925170898, "global_step": 30625, "epoch": 729} {"train_loss": -5.468685150146484, "global_step": 30626, "epoch": 729} {"train_loss": -5.654447078704834, "global_step": 30627, "epoch": 729} {"train_loss": -5.518346309661865, "global_step": 30628, "epoch": 729} {"train_loss": -5.443922996520996, "global_step": 30629, "epoch": 729} {"train_loss": -5.461988925933838, "global_step": 30630, "epoch": 729} {"train_loss": -5.423302173614502, "global_step": 30631, "epoch": 729} {"train_loss": -5.535322189331055, "global_step": 30632, "epoch": 729} {"train_loss": -5.6978607177734375, "global_step": 30633, "epoch": 729} {"train_loss": -5.466814994812012, "global_step": 30634, "epoch": 729} {"train_loss": -5.396237850189209, "global_step": 30635, "epoch": 729} {"train_loss": -5.4147844314575195, "global_step": 30636, "epoch": 729} {"train_loss": -5.6057844161987305, "global_step": 30637, "epoch": 729} {"train_loss": -5.524308681488037, "global_step": 30638, "epoch": 729} {"train_loss": -5.43969202041626, "global_step": 30639, "epoch": 729} {"train_loss": -5.4745774269104, "global_step": 30640, "epoch": 729} {"train_loss": -5.54542350769043, "global_step": 30641, "epoch": 729} {"train_loss": -5.5578155517578125, "global_step": 30642, "epoch": 729} {"train_loss": -5.4972429275512695, "global_step": 30643, "epoch": 729} {"train_loss": -5.368087291717529, "global_step": 30644, "epoch": 729} {"train_loss": -5.519194602966309, "global_step": 30645, "epoch": 729} {"train_loss": -5.340768814086914, "global_step": 30646, "epoch": 729} {"train_loss": -5.407994747161865, "global_step": 30647, "epoch": 729} {"train_loss": -5.563165187835693, "global_step": 30648, "epoch": 729} {"train_loss": -5.582953929901123, "global_step": 30649, "epoch": 729} {"train_loss": -5.520363807678223, "global_step": 30650, "epoch": 729} {"train_loss": -5.480952262878418, "global_step": 30651, "epoch": 729} {"train_loss": -5.382404327392578, "global_step": 30652, "epoch": 729} {"train_loss": -5.443671226501465, "global_step": 30653, "epoch": 729} {"train_loss": -5.426904678344727, "global_step": 30654, "epoch": 729} {"train_loss": -5.462515830993652, "global_step": 30655, "epoch": 729} {"train_loss": -5.431921005249023, "global_step": 30656, "epoch": 729} {"train_loss": -5.4421892166137695, "global_step": 30657, "epoch": 729} {"train_loss": -5.39076042175293, "global_step": 30658, "epoch": 729} {"train_loss": -5.483456327801659, "global_step": 30659, "epoch": 729, "val_loss": 66724.6484375} {"train_loss": -5.419814586639404, "global_step": 30660, "epoch": 730} {"train_loss": -5.527745246887207, "global_step": 30661, "epoch": 730} {"train_loss": -5.405755519866943, "global_step": 30662, "epoch": 730} {"train_loss": -5.476309299468994, "global_step": 30663, "epoch": 730} {"train_loss": -5.519184112548828, "global_step": 30664, "epoch": 730} {"train_loss": -5.391086101531982, "global_step": 30665, "epoch": 730} {"train_loss": -5.503803730010986, "global_step": 30666, "epoch": 730} {"train_loss": -5.48003625869751, "global_step": 30667, "epoch": 730} {"train_loss": -5.419978141784668, "global_step": 30668, "epoch": 730} {"train_loss": -5.3789215087890625, "global_step": 30669, "epoch": 730} {"train_loss": -5.289667129516602, "global_step": 30670, "epoch": 730} {"train_loss": -5.478882312774658, "global_step": 30671, "epoch": 730} {"train_loss": -5.614225387573242, "global_step": 30672, "epoch": 730} {"train_loss": -5.487150192260742, "global_step": 30673, "epoch": 730} {"train_loss": -5.510439872741699, "global_step": 30674, "epoch": 730} {"train_loss": -5.502309799194336, "global_step": 30675, "epoch": 730} {"train_loss": -5.575541019439697, "global_step": 30676, "epoch": 730} {"train_loss": -5.538444519042969, "global_step": 30677, "epoch": 730} {"train_loss": -5.48441743850708, "global_step": 30678, "epoch": 730} {"train_loss": -5.460703372955322, "global_step": 30679, "epoch": 730} {"train_loss": -5.5040717124938965, "global_step": 30680, "epoch": 730} {"train_loss": -5.448780536651611, "global_step": 30681, "epoch": 730} {"train_loss": -5.547800540924072, "global_step": 30682, "epoch": 730} {"train_loss": -5.556405544281006, "global_step": 30683, "epoch": 730} {"train_loss": -5.666424751281738, "global_step": 30684, "epoch": 730} {"train_loss": -5.448026657104492, "global_step": 30685, "epoch": 730} {"train_loss": -5.559979438781738, "global_step": 30686, "epoch": 730} {"train_loss": -5.494033336639404, "global_step": 30687, "epoch": 730} {"train_loss": -5.465662956237793, "global_step": 30688, "epoch": 730} {"train_loss": -5.5055084228515625, "global_step": 30689, "epoch": 730} {"train_loss": -5.518812656402588, "global_step": 30690, "epoch": 730} {"train_loss": -5.504913806915283, "global_step": 30691, "epoch": 730} {"train_loss": -5.405575752258301, "global_step": 30692, "epoch": 730} {"train_loss": -5.43498420715332, "global_step": 30693, "epoch": 730} {"train_loss": -5.435683250427246, "global_step": 30694, "epoch": 730} {"train_loss": -5.371784210205078, "global_step": 30695, "epoch": 730} {"train_loss": -5.518745422363281, "global_step": 30696, "epoch": 730} {"train_loss": -5.561290740966797, "global_step": 30697, "epoch": 730} {"train_loss": -5.4682793617248535, "global_step": 30698, "epoch": 730} {"train_loss": -5.545802116394043, "global_step": 30699, "epoch": 730} {"train_loss": -5.406253814697266, "global_step": 30700, "epoch": 730} {"train_loss": -5.483944938296363, "global_step": 30701, "epoch": 730, "val_loss": 66557.5859375} {"train_loss": -5.541092872619629, "global_step": 30702, "epoch": 731} {"train_loss": -5.512056350708008, "global_step": 30703, "epoch": 731} {"train_loss": -5.544964790344238, "global_step": 30704, "epoch": 731} {"train_loss": -5.400496482849121, "global_step": 30705, "epoch": 731} {"train_loss": -5.646125793457031, "global_step": 30706, "epoch": 731} {"train_loss": -5.429404258728027, "global_step": 30707, "epoch": 731} {"train_loss": -5.529122352600098, "global_step": 30708, "epoch": 731} {"train_loss": -5.369797706604004, "global_step": 30709, "epoch": 731} {"train_loss": -5.60699462890625, "global_step": 30710, "epoch": 731} {"train_loss": -5.5523247718811035, "global_step": 30711, "epoch": 731} {"train_loss": -5.505749702453613, "global_step": 30712, "epoch": 731} {"train_loss": -5.555841445922852, "global_step": 30713, "epoch": 731} {"train_loss": -5.450536727905273, "global_step": 30714, "epoch": 731} {"train_loss": -5.501679420471191, "global_step": 30715, "epoch": 731} {"train_loss": -5.514370918273926, "global_step": 30716, "epoch": 731} {"train_loss": -5.386219024658203, "global_step": 30717, "epoch": 731} {"train_loss": -5.556962490081787, "global_step": 30718, "epoch": 731} {"train_loss": -5.417581558227539, "global_step": 30719, "epoch": 731} {"train_loss": -5.518383979797363, "global_step": 30720, "epoch": 731} {"train_loss": -5.534061431884766, "global_step": 30721, "epoch": 731} {"train_loss": -5.484946250915527, "global_step": 30722, "epoch": 731} {"train_loss": -5.565298557281494, "global_step": 30723, "epoch": 731} {"train_loss": -5.599399566650391, "global_step": 30724, "epoch": 731} {"train_loss": -5.428473472595215, "global_step": 30725, "epoch": 731} {"train_loss": -5.374150276184082, "global_step": 30726, "epoch": 731} {"train_loss": -5.553191661834717, "global_step": 30727, "epoch": 731} {"train_loss": -5.357169151306152, "global_step": 30728, "epoch": 731} {"train_loss": -5.311212539672852, "global_step": 30729, "epoch": 731} {"train_loss": -5.428502082824707, "global_step": 30730, "epoch": 731} {"train_loss": -5.351138591766357, "global_step": 30731, "epoch": 731} {"train_loss": -5.405837059020996, "global_step": 30732, "epoch": 731} {"train_loss": -5.253069877624512, "global_step": 30733, "epoch": 731} {"train_loss": -5.477504253387451, "global_step": 30734, "epoch": 731} {"train_loss": -5.326749324798584, "global_step": 30735, "epoch": 731} {"train_loss": -5.4318742752075195, "global_step": 30736, "epoch": 731} {"train_loss": -5.447742462158203, "global_step": 30737, "epoch": 731} {"train_loss": -5.431123733520508, "global_step": 30738, "epoch": 731} {"train_loss": -5.465564727783203, "global_step": 30739, "epoch": 731} {"train_loss": -5.525012493133545, "global_step": 30740, "epoch": 731} {"train_loss": -5.495458126068115, "global_step": 30741, "epoch": 731} {"train_loss": -5.361879348754883, "global_step": 30742, "epoch": 731} {"train_loss": -5.466834000178745, "global_step": 30743, "epoch": 731, "val_loss": 67265.765625} {"train_loss": -5.540014743804932, "global_step": 30744, "epoch": 732} {"train_loss": -5.371330261230469, "global_step": 30745, "epoch": 732} {"train_loss": -5.507802963256836, "global_step": 30746, "epoch": 732} {"train_loss": -5.51620626449585, "global_step": 30747, "epoch": 732} {"train_loss": -5.490319728851318, "global_step": 30748, "epoch": 732} {"train_loss": -5.364208221435547, "global_step": 30749, "epoch": 732} {"train_loss": -5.479495525360107, "global_step": 30750, "epoch": 732} {"train_loss": -5.5802717208862305, "global_step": 30751, "epoch": 732} {"train_loss": -5.440083026885986, "global_step": 30752, "epoch": 732} {"train_loss": -5.550448417663574, "global_step": 30753, "epoch": 732} {"train_loss": -5.323359489440918, "global_step": 30754, "epoch": 732} {"train_loss": -5.522580146789551, "global_step": 30755, "epoch": 732} {"train_loss": -5.48419189453125, "global_step": 30756, "epoch": 732} {"train_loss": -5.530742645263672, "global_step": 30757, "epoch": 732} {"train_loss": -5.4310712814331055, "global_step": 30758, "epoch": 732} {"train_loss": -5.458907127380371, "global_step": 30759, "epoch": 732} {"train_loss": -5.524183750152588, "global_step": 30760, "epoch": 732} {"train_loss": -5.381596565246582, "global_step": 30761, "epoch": 732} {"train_loss": -5.402570724487305, "global_step": 30762, "epoch": 732} {"train_loss": -5.3747663497924805, "global_step": 30763, "epoch": 732} {"train_loss": -5.394229888916016, "global_step": 30764, "epoch": 732} {"train_loss": -5.5310587882995605, "global_step": 30765, "epoch": 732} {"train_loss": -5.2774553298950195, "global_step": 30766, "epoch": 732} {"train_loss": -5.477174758911133, "global_step": 30767, "epoch": 732} {"train_loss": -5.461583614349365, "global_step": 30768, "epoch": 732} {"train_loss": -5.411220073699951, "global_step": 30769, "epoch": 732} {"train_loss": -5.448176383972168, "global_step": 30770, "epoch": 732} {"train_loss": -5.407718658447266, "global_step": 30771, "epoch": 732} {"train_loss": -5.400121688842773, "global_step": 30772, "epoch": 732} {"train_loss": -5.448099136352539, "global_step": 30773, "epoch": 732} {"train_loss": -5.520364284515381, "global_step": 30774, "epoch": 732} {"train_loss": -5.4087677001953125, "global_step": 30775, "epoch": 732} {"train_loss": -5.328708648681641, "global_step": 30776, "epoch": 732} {"train_loss": -5.609340667724609, "global_step": 30777, "epoch": 732} {"train_loss": -5.501369476318359, "global_step": 30778, "epoch": 732} {"train_loss": -5.552210807800293, "global_step": 30779, "epoch": 732} {"train_loss": -5.563413619995117, "global_step": 30780, "epoch": 732} {"train_loss": -5.502085208892822, "global_step": 30781, "epoch": 732} {"train_loss": -5.455528259277344, "global_step": 30782, "epoch": 732} {"train_loss": -5.397616863250732, "global_step": 30783, "epoch": 732} {"train_loss": -5.495323181152344, "global_step": 30784, "epoch": 732} {"train_loss": -5.461433104106358, "global_step": 30785, "epoch": 732, "val_loss": 66777.734375} {"train_loss": -5.501941680908203, "global_step": 30786, "epoch": 733} {"train_loss": -5.5298237800598145, "global_step": 30787, "epoch": 733} {"train_loss": -5.56610107421875, "global_step": 30788, "epoch": 733} {"train_loss": -5.666149139404297, "global_step": 30789, "epoch": 733} {"train_loss": -5.5564751625061035, "global_step": 30790, "epoch": 733} {"train_loss": -5.509353160858154, "global_step": 30791, "epoch": 733} {"train_loss": -5.438655853271484, "global_step": 30792, "epoch": 733} {"train_loss": -5.491333961486816, "global_step": 30793, "epoch": 733} {"train_loss": -5.374814987182617, "global_step": 30794, "epoch": 733} {"train_loss": -5.469557285308838, "global_step": 30795, "epoch": 733} {"train_loss": -5.680176734924316, "global_step": 30796, "epoch": 733} {"train_loss": -5.3934173583984375, "global_step": 30797, "epoch": 733} {"train_loss": -5.454331398010254, "global_step": 30798, "epoch": 733} {"train_loss": -5.427700996398926, "global_step": 30799, "epoch": 733} {"train_loss": -5.527309417724609, "global_step": 30800, "epoch": 733} {"train_loss": -5.570749759674072, "global_step": 30801, "epoch": 733} {"train_loss": -5.52829647064209, "global_step": 30802, "epoch": 733} {"train_loss": -5.391340255737305, "global_step": 30803, "epoch": 733} {"train_loss": -5.359393119812012, "global_step": 30804, "epoch": 733} {"train_loss": -5.441611289978027, "global_step": 30805, "epoch": 733} {"train_loss": -5.296151161193848, "global_step": 30806, "epoch": 733} {"train_loss": -5.413896560668945, "global_step": 30807, "epoch": 733} {"train_loss": -5.504706382751465, "global_step": 30808, "epoch": 733} {"train_loss": -5.4165358543396, "global_step": 30809, "epoch": 733} {"train_loss": -5.494551658630371, "global_step": 30810, "epoch": 733} {"train_loss": -5.532831192016602, "global_step": 30811, "epoch": 733} {"train_loss": -5.565661430358887, "global_step": 30812, "epoch": 733} {"train_loss": -5.4575605392456055, "global_step": 30813, "epoch": 733} {"train_loss": -5.582210540771484, "global_step": 30814, "epoch": 733} {"train_loss": -5.506272315979004, "global_step": 30815, "epoch": 733} {"train_loss": -5.479629993438721, "global_step": 30816, "epoch": 733} {"train_loss": -5.475940704345703, "global_step": 30817, "epoch": 733} {"train_loss": -5.52415657043457, "global_step": 30818, "epoch": 733} {"train_loss": -5.571242332458496, "global_step": 30819, "epoch": 733} {"train_loss": -5.44508171081543, "global_step": 30820, "epoch": 733} {"train_loss": -5.487743377685547, "global_step": 30821, "epoch": 733} {"train_loss": -5.585914611816406, "global_step": 30822, "epoch": 733} {"train_loss": -5.396117210388184, "global_step": 30823, "epoch": 733} {"train_loss": -5.481592178344727, "global_step": 30824, "epoch": 733} {"train_loss": -5.513998031616211, "global_step": 30825, "epoch": 733} {"train_loss": -5.53037691116333, "global_step": 30826, "epoch": 733} {"train_loss": -5.489404735111055, "global_step": 30827, "epoch": 733, "val_loss": 66989.03125} {"train_loss": -5.507317543029785, "global_step": 30828, "epoch": 734} {"train_loss": -5.504062175750732, "global_step": 30829, "epoch": 734} {"train_loss": -5.477435111999512, "global_step": 30830, "epoch": 734} {"train_loss": -5.447251319885254, "global_step": 30831, "epoch": 734} {"train_loss": -5.516008377075195, "global_step": 30832, "epoch": 734} {"train_loss": -5.652321815490723, "global_step": 30833, "epoch": 734} {"train_loss": -5.458959579467773, "global_step": 30834, "epoch": 734} {"train_loss": -5.49166202545166, "global_step": 30835, "epoch": 734} {"train_loss": -5.587055206298828, "global_step": 30836, "epoch": 734} {"train_loss": -5.477555274963379, "global_step": 30837, "epoch": 734} {"train_loss": -5.48495626449585, "global_step": 30838, "epoch": 734} {"train_loss": -5.442788600921631, "global_step": 30839, "epoch": 734} {"train_loss": -5.429604530334473, "global_step": 30840, "epoch": 734} {"train_loss": -5.5319671630859375, "global_step": 30841, "epoch": 734} {"train_loss": -5.466582298278809, "global_step": 30842, "epoch": 734} {"train_loss": -5.61324405670166, "global_step": 30843, "epoch": 734} {"train_loss": -5.592194557189941, "global_step": 30844, "epoch": 734} {"train_loss": -5.513799667358398, "global_step": 30845, "epoch": 734} {"train_loss": -5.60377311706543, "global_step": 30846, "epoch": 734} {"train_loss": -5.429192543029785, "global_step": 30847, "epoch": 734} {"train_loss": -5.467177867889404, "global_step": 30848, "epoch": 734} {"train_loss": -5.415467739105225, "global_step": 30849, "epoch": 734} {"train_loss": -5.419824600219727, "global_step": 30850, "epoch": 734} {"train_loss": -5.455326080322266, "global_step": 30851, "epoch": 734} {"train_loss": -5.541530609130859, "global_step": 30852, "epoch": 734} {"train_loss": -5.481804847717285, "global_step": 30853, "epoch": 734} {"train_loss": -5.581242561340332, "global_step": 30854, "epoch": 734} {"train_loss": -5.486640930175781, "global_step": 30855, "epoch": 734} {"train_loss": -5.404687404632568, "global_step": 30856, "epoch": 734} {"train_loss": -5.539849281311035, "global_step": 30857, "epoch": 734} {"train_loss": -5.587332725524902, "global_step": 30858, "epoch": 734} {"train_loss": -5.500258922576904, "global_step": 30859, "epoch": 734} {"train_loss": -5.441228866577148, "global_step": 30860, "epoch": 734} {"train_loss": -5.526828765869141, "global_step": 30861, "epoch": 734} {"train_loss": -5.462208271026611, "global_step": 30862, "epoch": 734} {"train_loss": -5.65816593170166, "global_step": 30863, "epoch": 734} {"train_loss": -5.46071720123291, "global_step": 30864, "epoch": 734} {"train_loss": -5.424769401550293, "global_step": 30865, "epoch": 734} {"train_loss": -5.544283866882324, "global_step": 30866, "epoch": 734} {"train_loss": -5.532417297363281, "global_step": 30867, "epoch": 734} {"train_loss": -5.434797763824463, "global_step": 30868, "epoch": 734} {"train_loss": -5.503746918269566, "global_step": 30869, "epoch": 734, "val_loss": 66637.6484375} {"train_loss": -5.568760871887207, "global_step": 30870, "epoch": 735} {"train_loss": -5.416841506958008, "global_step": 30871, "epoch": 735} {"train_loss": -5.57121467590332, "global_step": 30872, "epoch": 735} {"train_loss": -5.498773574829102, "global_step": 30873, "epoch": 735} {"train_loss": -5.4803571701049805, "global_step": 30874, "epoch": 735} {"train_loss": -5.5159735679626465, "global_step": 30875, "epoch": 735} {"train_loss": -5.439416885375977, "global_step": 30876, "epoch": 735} {"train_loss": -5.412154674530029, "global_step": 30877, "epoch": 735} {"train_loss": -5.3896942138671875, "global_step": 30878, "epoch": 735} {"train_loss": -5.374398708343506, "global_step": 30879, "epoch": 735} {"train_loss": -5.534585952758789, "global_step": 30880, "epoch": 735} {"train_loss": -5.509392261505127, "global_step": 30881, "epoch": 735} {"train_loss": -5.732005596160889, "global_step": 30882, "epoch": 735} {"train_loss": -5.511935710906982, "global_step": 30883, "epoch": 735} {"train_loss": -5.5614423751831055, "global_step": 30884, "epoch": 735} {"train_loss": -5.4954071044921875, "global_step": 30885, "epoch": 735} {"train_loss": -5.583469867706299, "global_step": 30886, "epoch": 735} {"train_loss": -5.576726913452148, "global_step": 30887, "epoch": 735} {"train_loss": -5.516593933105469, "global_step": 30888, "epoch": 735} {"train_loss": -5.493881702423096, "global_step": 30889, "epoch": 735} {"train_loss": -5.527667999267578, "global_step": 30890, "epoch": 735} {"train_loss": -5.444322109222412, "global_step": 30891, "epoch": 735} {"train_loss": -5.375504493713379, "global_step": 30892, "epoch": 735} {"train_loss": -5.561788082122803, "global_step": 30893, "epoch": 735} {"train_loss": -5.507680892944336, "global_step": 30894, "epoch": 735} {"train_loss": -5.516646385192871, "global_step": 30895, "epoch": 735} {"train_loss": -5.401564598083496, "global_step": 30896, "epoch": 735} {"train_loss": -5.550276756286621, "global_step": 30897, "epoch": 735} {"train_loss": -5.390149116516113, "global_step": 30898, "epoch": 735} {"train_loss": -5.363447666168213, "global_step": 30899, "epoch": 735} {"train_loss": -5.488436698913574, "global_step": 30900, "epoch": 735} {"train_loss": -5.4390716552734375, "global_step": 30901, "epoch": 735} {"train_loss": -5.2862138748168945, "global_step": 30902, "epoch": 735} {"train_loss": -5.479803085327148, "global_step": 30903, "epoch": 735} {"train_loss": -5.569710731506348, "global_step": 30904, "epoch": 735} {"train_loss": -5.460172176361084, "global_step": 30905, "epoch": 735} {"train_loss": -5.522593021392822, "global_step": 30906, "epoch": 735} {"train_loss": -5.562039375305176, "global_step": 30907, "epoch": 735} {"train_loss": -5.498223781585693, "global_step": 30908, "epoch": 735} {"train_loss": -5.460098743438721, "global_step": 30909, "epoch": 735} {"train_loss": -5.40980863571167, "global_step": 30910, "epoch": 735} {"train_loss": -5.4869063922337125, "global_step": 30911, "epoch": 735, "val_loss": 67003.2421875} {"train_loss": -5.415764331817627, "global_step": 30912, "epoch": 736} {"train_loss": -5.521225452423096, "global_step": 30913, "epoch": 736} {"train_loss": -5.5441670417785645, "global_step": 30914, "epoch": 736} {"train_loss": -5.454611778259277, "global_step": 30915, "epoch": 736} {"train_loss": -5.496977806091309, "global_step": 30916, "epoch": 736} {"train_loss": -5.422482490539551, "global_step": 30917, "epoch": 736} {"train_loss": -5.5882110595703125, "global_step": 30918, "epoch": 736} {"train_loss": -5.471745014190674, "global_step": 30919, "epoch": 736} {"train_loss": -5.609442710876465, "global_step": 30920, "epoch": 736} {"train_loss": -5.6347856521606445, "global_step": 30921, "epoch": 736} {"train_loss": -5.470851421356201, "global_step": 30922, "epoch": 736} {"train_loss": -5.5941009521484375, "global_step": 30923, "epoch": 736} {"train_loss": -5.46083927154541, "global_step": 30924, "epoch": 736} {"train_loss": -5.459162712097168, "global_step": 30925, "epoch": 736} {"train_loss": -5.515340328216553, "global_step": 30926, "epoch": 736} {"train_loss": -5.333471298217773, "global_step": 30927, "epoch": 736} {"train_loss": -5.613922119140625, "global_step": 30928, "epoch": 736} {"train_loss": -5.390298843383789, "global_step": 30929, "epoch": 736} {"train_loss": -5.488327980041504, "global_step": 30930, "epoch": 736} {"train_loss": -5.480998516082764, "global_step": 30931, "epoch": 736} {"train_loss": -5.569947719573975, "global_step": 30932, "epoch": 736} {"train_loss": -5.536610126495361, "global_step": 30933, "epoch": 736} {"train_loss": -5.4349045753479, "global_step": 30934, "epoch": 736} {"train_loss": -5.660063743591309, "global_step": 30935, "epoch": 736} {"train_loss": -5.268344879150391, "global_step": 30936, "epoch": 736} {"train_loss": -5.534942626953125, "global_step": 30937, "epoch": 736} {"train_loss": -5.463537693023682, "global_step": 30938, "epoch": 736} {"train_loss": -5.55081844329834, "global_step": 30939, "epoch": 736} {"train_loss": -5.427158355712891, "global_step": 30940, "epoch": 736} {"train_loss": -5.469582557678223, "global_step": 30941, "epoch": 736} {"train_loss": -5.391618251800537, "global_step": 30942, "epoch": 736} {"train_loss": -5.5039143562316895, "global_step": 30943, "epoch": 736} {"train_loss": -5.408902645111084, "global_step": 30944, "epoch": 736} {"train_loss": -5.364070892333984, "global_step": 30945, "epoch": 736} {"train_loss": -5.24760627746582, "global_step": 30946, "epoch": 736} {"train_loss": -5.361016750335693, "global_step": 30947, "epoch": 736} {"train_loss": -5.383842468261719, "global_step": 30948, "epoch": 736} {"train_loss": -5.537383079528809, "global_step": 30949, "epoch": 736} {"train_loss": -5.415074825286865, "global_step": 30950, "epoch": 736} {"train_loss": -5.318549156188965, "global_step": 30951, "epoch": 736} {"train_loss": -5.420316219329834, "global_step": 30952, "epoch": 736} {"train_loss": -5.467458009719849, "global_step": 30953, "epoch": 736, "val_loss": 66845.6328125} {"train_loss": -5.503212928771973, "global_step": 30954, "epoch": 737} {"train_loss": -5.577277183532715, "global_step": 30955, "epoch": 737} {"train_loss": -5.461906909942627, "global_step": 30956, "epoch": 737} {"train_loss": -5.5231733322143555, "global_step": 30957, "epoch": 737} {"train_loss": -5.487438678741455, "global_step": 30958, "epoch": 737} {"train_loss": -5.3599700927734375, "global_step": 30959, "epoch": 737} {"train_loss": -5.6073408126831055, "global_step": 30960, "epoch": 737} {"train_loss": -5.436771392822266, "global_step": 30961, "epoch": 737} {"train_loss": -5.513486862182617, "global_step": 30962, "epoch": 737} {"train_loss": -5.460367202758789, "global_step": 30963, "epoch": 737} {"train_loss": -5.4460625648498535, "global_step": 30964, "epoch": 737} {"train_loss": -5.50450325012207, "global_step": 30965, "epoch": 737} {"train_loss": -5.501183986663818, "global_step": 30966, "epoch": 737} {"train_loss": -5.551257133483887, "global_step": 30967, "epoch": 737} {"train_loss": -5.424496650695801, "global_step": 30968, "epoch": 737} {"train_loss": -5.61357307434082, "global_step": 30969, "epoch": 737} {"train_loss": -5.4921875, "global_step": 30970, "epoch": 737} {"train_loss": -5.445568084716797, "global_step": 30971, "epoch": 737} {"train_loss": -5.3125691413879395, "global_step": 30972, "epoch": 737} {"train_loss": -5.438316822052002, "global_step": 30973, "epoch": 737} {"train_loss": -5.4801154136657715, "global_step": 30974, "epoch": 737} {"train_loss": -5.453275680541992, "global_step": 30975, "epoch": 737} {"train_loss": -5.4948835372924805, "global_step": 30976, "epoch": 737} {"train_loss": -5.401597023010254, "global_step": 30977, "epoch": 737} {"train_loss": -5.545872211456299, "global_step": 30978, "epoch": 737} {"train_loss": -5.507543563842773, "global_step": 30979, "epoch": 737} {"train_loss": -5.303666114807129, "global_step": 30980, "epoch": 737} {"train_loss": -5.566310882568359, "global_step": 30981, "epoch": 737} {"train_loss": -5.292666435241699, "global_step": 30982, "epoch": 737} {"train_loss": -5.3021135330200195, "global_step": 30983, "epoch": 737} {"train_loss": -5.6228861808776855, "global_step": 30984, "epoch": 737} {"train_loss": -5.464991569519043, "global_step": 30985, "epoch": 737} {"train_loss": -5.512765884399414, "global_step": 30986, "epoch": 737} {"train_loss": -5.413290500640869, "global_step": 30987, "epoch": 737} {"train_loss": -5.494386196136475, "global_step": 30988, "epoch": 737} {"train_loss": -5.471290588378906, "global_step": 30989, "epoch": 737} {"train_loss": -5.594150543212891, "global_step": 30990, "epoch": 737} {"train_loss": -5.519503593444824, "global_step": 30991, "epoch": 737} {"train_loss": -5.365151882171631, "global_step": 30992, "epoch": 737} {"train_loss": -5.5294599533081055, "global_step": 30993, "epoch": 737} {"train_loss": -5.475750923156738, "global_step": 30994, "epoch": 737} {"train_loss": -5.475083067303612, "global_step": 30995, "epoch": 737, "val_loss": 66986.0078125} {"train_loss": -5.614624977111816, "global_step": 30996, "epoch": 738} {"train_loss": -5.466978073120117, "global_step": 30997, "epoch": 738} {"train_loss": -5.458247184753418, "global_step": 30998, "epoch": 738} {"train_loss": -5.514154434204102, "global_step": 30999, "epoch": 738} {"train_loss": -5.391961574554443, "global_step": 31000, "epoch": 738} {"train_loss": -5.430783748626709, "global_step": 31001, "epoch": 738} {"train_loss": -5.525509834289551, "global_step": 31002, "epoch": 738} {"train_loss": -5.423857688903809, "global_step": 31003, "epoch": 738} {"train_loss": -5.493544578552246, "global_step": 31004, "epoch": 738} {"train_loss": -5.573878288269043, "global_step": 31005, "epoch": 738} {"train_loss": -5.5375776290893555, "global_step": 31006, "epoch": 738} {"train_loss": -5.476903915405273, "global_step": 31007, "epoch": 738} {"train_loss": -5.593286514282227, "global_step": 31008, "epoch": 738} {"train_loss": -5.392309188842773, "global_step": 31009, "epoch": 738} {"train_loss": -5.653861045837402, "global_step": 31010, "epoch": 738} {"train_loss": -5.600772857666016, "global_step": 31011, "epoch": 738} {"train_loss": -5.487864971160889, "global_step": 31012, "epoch": 738} {"train_loss": -5.513876438140869, "global_step": 31013, "epoch": 738} {"train_loss": -5.683388710021973, "global_step": 31014, "epoch": 738} {"train_loss": -5.564846038818359, "global_step": 31015, "epoch": 738} {"train_loss": -5.599089622497559, "global_step": 31016, "epoch": 738} {"train_loss": -5.359323501586914, "global_step": 31017, "epoch": 738} {"train_loss": -5.532862663269043, "global_step": 31018, "epoch": 738} {"train_loss": -5.442203998565674, "global_step": 31019, "epoch": 738} {"train_loss": -5.572381973266602, "global_step": 31020, "epoch": 738} {"train_loss": -5.4962663650512695, "global_step": 31021, "epoch": 738} {"train_loss": -5.606894493103027, "global_step": 31022, "epoch": 738} {"train_loss": -5.447187900543213, "global_step": 31023, "epoch": 738} {"train_loss": -5.388628005981445, "global_step": 31024, "epoch": 738} {"train_loss": -5.581789970397949, "global_step": 31025, "epoch": 738} {"train_loss": -5.5305891036987305, "global_step": 31026, "epoch": 738} {"train_loss": -5.499105930328369, "global_step": 31027, "epoch": 738} {"train_loss": -5.463217258453369, "global_step": 31028, "epoch": 738} {"train_loss": -5.525856971740723, "global_step": 31029, "epoch": 738} {"train_loss": -5.56483268737793, "global_step": 31030, "epoch": 738} {"train_loss": -5.613432884216309, "global_step": 31031, "epoch": 738} {"train_loss": -5.566258907318115, "global_step": 31032, "epoch": 738} {"train_loss": -5.441448211669922, "global_step": 31033, "epoch": 738} {"train_loss": -5.475082874298096, "global_step": 31034, "epoch": 738} {"train_loss": -5.382521152496338, "global_step": 31035, "epoch": 738} {"train_loss": -5.486196517944336, "global_step": 31036, "epoch": 738} {"train_loss": -5.509977147692726, "global_step": 31037, "epoch": 738, "val_loss": 66724.4453125} {"train_loss": -5.579808235168457, "global_step": 31038, "epoch": 739} {"train_loss": -5.513570785522461, "global_step": 31039, "epoch": 739} {"train_loss": -5.595485687255859, "global_step": 31040, "epoch": 739} {"train_loss": -5.531735420227051, "global_step": 31041, "epoch": 739} {"train_loss": -5.534764289855957, "global_step": 31042, "epoch": 739} {"train_loss": -5.481915473937988, "global_step": 31043, "epoch": 739} {"train_loss": -5.602221488952637, "global_step": 31044, "epoch": 739} {"train_loss": -5.514276027679443, "global_step": 31045, "epoch": 739} {"train_loss": -5.4280619621276855, "global_step": 31046, "epoch": 739} {"train_loss": -5.402843952178955, "global_step": 31047, "epoch": 739} {"train_loss": -5.5313720703125, "global_step": 31048, "epoch": 739} {"train_loss": -5.396157264709473, "global_step": 31049, "epoch": 739} {"train_loss": -5.474925518035889, "global_step": 31050, "epoch": 739} {"train_loss": -5.5428571701049805, "global_step": 31051, "epoch": 739} {"train_loss": -5.391285419464111, "global_step": 31052, "epoch": 739} {"train_loss": -5.583582401275635, "global_step": 31053, "epoch": 739} {"train_loss": -5.491999626159668, "global_step": 31054, "epoch": 739} {"train_loss": -5.536882400512695, "global_step": 31055, "epoch": 739} {"train_loss": -5.470696449279785, "global_step": 31056, "epoch": 739} {"train_loss": -5.550076484680176, "global_step": 31057, "epoch": 739} {"train_loss": -5.475159645080566, "global_step": 31058, "epoch": 739} {"train_loss": -5.49302864074707, "global_step": 31059, "epoch": 739} {"train_loss": -5.599453449249268, "global_step": 31060, "epoch": 739} {"train_loss": -5.509748458862305, "global_step": 31061, "epoch": 739} {"train_loss": -5.568717002868652, "global_step": 31062, "epoch": 739} {"train_loss": -5.426152229309082, "global_step": 31063, "epoch": 739} {"train_loss": -5.570170879364014, "global_step": 31064, "epoch": 739} {"train_loss": -5.546465873718262, "global_step": 31065, "epoch": 739} {"train_loss": -5.409811496734619, "global_step": 31066, "epoch": 739} {"train_loss": -5.6201324462890625, "global_step": 31067, "epoch": 739} {"train_loss": -5.486747741699219, "global_step": 31068, "epoch": 739} {"train_loss": -5.550232410430908, "global_step": 31069, "epoch": 739} {"train_loss": -5.449259281158447, "global_step": 31070, "epoch": 739} {"train_loss": -5.602687358856201, "global_step": 31071, "epoch": 739} {"train_loss": -5.47141695022583, "global_step": 31072, "epoch": 739} {"train_loss": -5.512868881225586, "global_step": 31073, "epoch": 739} {"train_loss": -5.591005325317383, "global_step": 31074, "epoch": 739} {"train_loss": -5.58232307434082, "global_step": 31075, "epoch": 739} {"train_loss": -5.5429534912109375, "global_step": 31076, "epoch": 739} {"train_loss": -5.581426620483398, "global_step": 31077, "epoch": 739} {"train_loss": -5.510461330413818, "global_step": 31078, "epoch": 739} {"train_loss": -5.51643028713408, "global_step": 31079, "epoch": 739, "val_loss": 66541.265625} {"train_loss": -5.611934185028076, "global_step": 31080, "epoch": 740} {"train_loss": -5.486721038818359, "global_step": 31081, "epoch": 740} {"train_loss": -5.534159183502197, "global_step": 31082, "epoch": 740} {"train_loss": -5.534936904907227, "global_step": 31083, "epoch": 740} {"train_loss": -5.501241683959961, "global_step": 31084, "epoch": 740} {"train_loss": -5.498649597167969, "global_step": 31085, "epoch": 740} {"train_loss": -5.507200241088867, "global_step": 31086, "epoch": 740} {"train_loss": -5.4077067375183105, "global_step": 31087, "epoch": 740} {"train_loss": -5.4081597328186035, "global_step": 31088, "epoch": 740} {"train_loss": -5.457789897918701, "global_step": 31089, "epoch": 740} {"train_loss": -5.429644584655762, "global_step": 31090, "epoch": 740} {"train_loss": -5.644519329071045, "global_step": 31091, "epoch": 740} {"train_loss": -5.326255798339844, "global_step": 31092, "epoch": 740} {"train_loss": -5.496239185333252, "global_step": 31093, "epoch": 740} {"train_loss": -5.510075569152832, "global_step": 31094, "epoch": 740} {"train_loss": -5.397130012512207, "global_step": 31095, "epoch": 740} {"train_loss": -5.555517196655273, "global_step": 31096, "epoch": 740} {"train_loss": -5.48801326751709, "global_step": 31097, "epoch": 740} {"train_loss": -5.380178451538086, "global_step": 31098, "epoch": 740} {"train_loss": -5.57451057434082, "global_step": 31099, "epoch": 740} {"train_loss": -5.419466018676758, "global_step": 31100, "epoch": 740} {"train_loss": -5.468283653259277, "global_step": 31101, "epoch": 740} {"train_loss": -5.5023345947265625, "global_step": 31102, "epoch": 740} {"train_loss": -5.510733127593994, "global_step": 31103, "epoch": 740} {"train_loss": -5.499207019805908, "global_step": 31104, "epoch": 740} {"train_loss": -5.402288436889648, "global_step": 31105, "epoch": 740} {"train_loss": -5.51383113861084, "global_step": 31106, "epoch": 740} {"train_loss": -5.468600273132324, "global_step": 31107, "epoch": 740} {"train_loss": -5.55010986328125, "global_step": 31108, "epoch": 740} {"train_loss": -5.462413787841797, "global_step": 31109, "epoch": 740} {"train_loss": -5.396639823913574, "global_step": 31110, "epoch": 740} {"train_loss": -5.480108261108398, "global_step": 31111, "epoch": 740} {"train_loss": -5.353185653686523, "global_step": 31112, "epoch": 740} {"train_loss": -5.457647323608398, "global_step": 31113, "epoch": 740} {"train_loss": -5.54964542388916, "global_step": 31114, "epoch": 740} {"train_loss": -5.493940353393555, "global_step": 31115, "epoch": 740} {"train_loss": -5.480263710021973, "global_step": 31116, "epoch": 740} {"train_loss": -5.465525150299072, "global_step": 31117, "epoch": 740} {"train_loss": -5.483417510986328, "global_step": 31118, "epoch": 740} {"train_loss": -5.463952541351318, "global_step": 31119, "epoch": 740} {"train_loss": -5.554078102111816, "global_step": 31120, "epoch": 740} {"train_loss": -5.483773061207363, "global_step": 31121, "epoch": 740, "val_loss": 66993.03125} {"train_loss": -5.4802165031433105, "global_step": 31122, "epoch": 741} {"train_loss": -5.393709659576416, "global_step": 31123, "epoch": 741} {"train_loss": -5.394957542419434, "global_step": 31124, "epoch": 741} {"train_loss": -5.356447219848633, "global_step": 31125, "epoch": 741} {"train_loss": -5.479784965515137, "global_step": 31126, "epoch": 741} {"train_loss": -5.542604446411133, "global_step": 31127, "epoch": 741} {"train_loss": -5.5711870193481445, "global_step": 31128, "epoch": 741} {"train_loss": -5.519659042358398, "global_step": 31129, "epoch": 741} {"train_loss": -5.479578971862793, "global_step": 31130, "epoch": 741} {"train_loss": -5.492290496826172, "global_step": 31131, "epoch": 741} {"train_loss": -5.407228469848633, "global_step": 31132, "epoch": 741} {"train_loss": -5.516139507293701, "global_step": 31133, "epoch": 741} {"train_loss": -5.538778305053711, "global_step": 31134, "epoch": 741} {"train_loss": -5.591969013214111, "global_step": 31135, "epoch": 741} {"train_loss": -5.334253311157227, "global_step": 31136, "epoch": 741} {"train_loss": -5.429350852966309, "global_step": 31137, "epoch": 741} {"train_loss": -5.5561604499816895, "global_step": 31138, "epoch": 741} {"train_loss": -5.475351333618164, "global_step": 31139, "epoch": 741} {"train_loss": -5.556090354919434, "global_step": 31140, "epoch": 741} {"train_loss": -5.621788024902344, "global_step": 31141, "epoch": 741} {"train_loss": -5.512334823608398, "global_step": 31142, "epoch": 741} {"train_loss": -5.540606498718262, "global_step": 31143, "epoch": 741} {"train_loss": -5.393215179443359, "global_step": 31144, "epoch": 741} {"train_loss": -5.535411834716797, "global_step": 31145, "epoch": 741} {"train_loss": -5.583971977233887, "global_step": 31146, "epoch": 741} {"train_loss": -5.630080223083496, "global_step": 31147, "epoch": 741} {"train_loss": -5.375204563140869, "global_step": 31148, "epoch": 741} {"train_loss": -5.474116325378418, "global_step": 31149, "epoch": 741} {"train_loss": -5.397113800048828, "global_step": 31150, "epoch": 741} {"train_loss": -5.520168304443359, "global_step": 31151, "epoch": 741} {"train_loss": -5.576745510101318, "global_step": 31152, "epoch": 741} {"train_loss": -5.3887939453125, "global_step": 31153, "epoch": 741} {"train_loss": -5.422746181488037, "global_step": 31154, "epoch": 741} {"train_loss": -5.438600540161133, "global_step": 31155, "epoch": 741} {"train_loss": -5.37281608581543, "global_step": 31156, "epoch": 741} {"train_loss": -5.606323719024658, "global_step": 31157, "epoch": 741} {"train_loss": -5.495574474334717, "global_step": 31158, "epoch": 741} {"train_loss": -5.503718376159668, "global_step": 31159, "epoch": 741} {"train_loss": -5.505461692810059, "global_step": 31160, "epoch": 741} {"train_loss": -5.435369491577148, "global_step": 31161, "epoch": 741} {"train_loss": -5.546511173248291, "global_step": 31162, "epoch": 741} {"train_loss": -5.487022195543561, "global_step": 31163, "epoch": 741, "val_loss": 66813.140625} {"train_loss": -5.383488178253174, "global_step": 31164, "epoch": 742} {"train_loss": -5.576160430908203, "global_step": 31165, "epoch": 742} {"train_loss": -5.36570405960083, "global_step": 31166, "epoch": 742} {"train_loss": -5.395082473754883, "global_step": 31167, "epoch": 742} {"train_loss": -5.415348052978516, "global_step": 31168, "epoch": 742} {"train_loss": -5.448306083679199, "global_step": 31169, "epoch": 742} {"train_loss": -5.56407356262207, "global_step": 31170, "epoch": 742} {"train_loss": -5.384758949279785, "global_step": 31171, "epoch": 742} {"train_loss": -5.594752311706543, "global_step": 31172, "epoch": 742} {"train_loss": -5.351179599761963, "global_step": 31173, "epoch": 742} {"train_loss": -5.530122756958008, "global_step": 31174, "epoch": 742} {"train_loss": -5.356985092163086, "global_step": 31175, "epoch": 742} {"train_loss": -5.32707405090332, "global_step": 31176, "epoch": 742} {"train_loss": -5.517477035522461, "global_step": 31177, "epoch": 742} {"train_loss": -5.40778923034668, "global_step": 31178, "epoch": 742} {"train_loss": -5.423496246337891, "global_step": 31179, "epoch": 742} {"train_loss": -5.391558647155762, "global_step": 31180, "epoch": 742} {"train_loss": -5.387200355529785, "global_step": 31181, "epoch": 742} {"train_loss": -5.370909214019775, "global_step": 31182, "epoch": 742} {"train_loss": -5.467074394226074, "global_step": 31183, "epoch": 742} {"train_loss": -5.487751007080078, "global_step": 31184, "epoch": 742} {"train_loss": -5.464397430419922, "global_step": 31185, "epoch": 742} {"train_loss": -5.400234222412109, "global_step": 31186, "epoch": 742} {"train_loss": -5.521860122680664, "global_step": 31187, "epoch": 742} {"train_loss": -5.369771957397461, "global_step": 31188, "epoch": 742} {"train_loss": -5.539708137512207, "global_step": 31189, "epoch": 742} {"train_loss": -5.4576215744018555, "global_step": 31190, "epoch": 742} {"train_loss": -5.482007026672363, "global_step": 31191, "epoch": 742} {"train_loss": -5.481863021850586, "global_step": 31192, "epoch": 742} {"train_loss": -5.370220184326172, "global_step": 31193, "epoch": 742} {"train_loss": -5.505754470825195, "global_step": 31194, "epoch": 742} {"train_loss": -5.579427719116211, "global_step": 31195, "epoch": 742} {"train_loss": -5.540698051452637, "global_step": 31196, "epoch": 742} {"train_loss": -5.498200416564941, "global_step": 31197, "epoch": 742} {"train_loss": -5.554265022277832, "global_step": 31198, "epoch": 742} {"train_loss": -5.416711807250977, "global_step": 31199, "epoch": 742} {"train_loss": -5.446832656860352, "global_step": 31200, "epoch": 742} {"train_loss": -5.669830322265625, "global_step": 31201, "epoch": 742} {"train_loss": -5.563078880310059, "global_step": 31202, "epoch": 742} {"train_loss": -5.549892425537109, "global_step": 31203, "epoch": 742} {"train_loss": -5.395074844360352, "global_step": 31204, "epoch": 742} {"train_loss": -5.463938906079247, "global_step": 31205, "epoch": 742, "val_loss": 66686.3984375} {"train_loss": -5.587728023529053, "global_step": 31206, "epoch": 743} {"train_loss": -5.52588415145874, "global_step": 31207, "epoch": 743} {"train_loss": -5.537478923797607, "global_step": 31208, "epoch": 743} {"train_loss": -5.513177871704102, "global_step": 31209, "epoch": 743} {"train_loss": -5.435708999633789, "global_step": 31210, "epoch": 743} {"train_loss": -5.471523761749268, "global_step": 31211, "epoch": 743} {"train_loss": -5.3738603591918945, "global_step": 31212, "epoch": 743} {"train_loss": -5.4813337326049805, "global_step": 31213, "epoch": 743} {"train_loss": -5.525935649871826, "global_step": 31214, "epoch": 743} {"train_loss": -5.516276836395264, "global_step": 31215, "epoch": 743} {"train_loss": -5.477700233459473, "global_step": 31216, "epoch": 743} {"train_loss": -5.715001106262207, "global_step": 31217, "epoch": 743} {"train_loss": -5.499754428863525, "global_step": 31218, "epoch": 743} {"train_loss": -5.490812301635742, "global_step": 31219, "epoch": 743} {"train_loss": -5.603334903717041, "global_step": 31220, "epoch": 743} {"train_loss": -5.5413126945495605, "global_step": 31221, "epoch": 743} {"train_loss": -5.607697486877441, "global_step": 31222, "epoch": 743} {"train_loss": -5.472146034240723, "global_step": 31223, "epoch": 743} {"train_loss": -5.500313758850098, "global_step": 31224, "epoch": 743} {"train_loss": -5.4644670486450195, "global_step": 31225, "epoch": 743} {"train_loss": -5.385713577270508, "global_step": 31226, "epoch": 743} {"train_loss": -5.490262031555176, "global_step": 31227, "epoch": 743} {"train_loss": -5.4687819480896, "global_step": 31228, "epoch": 743} {"train_loss": -5.52939510345459, "global_step": 31229, "epoch": 743} {"train_loss": -5.559940338134766, "global_step": 31230, "epoch": 743} {"train_loss": -5.485078811645508, "global_step": 31231, "epoch": 743} {"train_loss": -5.5010223388671875, "global_step": 31232, "epoch": 743} {"train_loss": -5.515179634094238, "global_step": 31233, "epoch": 743} {"train_loss": -5.58156681060791, "global_step": 31234, "epoch": 743} {"train_loss": -5.57938289642334, "global_step": 31235, "epoch": 743} {"train_loss": -5.357102394104004, "global_step": 31236, "epoch": 743} {"train_loss": -5.388909339904785, "global_step": 31237, "epoch": 743} {"train_loss": -5.475428581237793, "global_step": 31238, "epoch": 743} {"train_loss": -5.473504066467285, "global_step": 31239, "epoch": 743} {"train_loss": -5.315923690795898, "global_step": 31240, "epoch": 743} {"train_loss": -5.504513740539551, "global_step": 31241, "epoch": 743} {"train_loss": -5.473223686218262, "global_step": 31242, "epoch": 743} {"train_loss": -5.3871917724609375, "global_step": 31243, "epoch": 743} {"train_loss": -5.385723114013672, "global_step": 31244, "epoch": 743} {"train_loss": -5.413874626159668, "global_step": 31245, "epoch": 743} {"train_loss": -5.570740699768066, "global_step": 31246, "epoch": 743} {"train_loss": -5.491074289594378, "global_step": 31247, "epoch": 743, "val_loss": 67157.3671875} {"train_loss": -5.53025484085083, "global_step": 31248, "epoch": 744} {"train_loss": -5.655854225158691, "global_step": 31249, "epoch": 744} {"train_loss": -5.377608299255371, "global_step": 31250, "epoch": 744} {"train_loss": -5.594234466552734, "global_step": 31251, "epoch": 744} {"train_loss": -5.434185028076172, "global_step": 31252, "epoch": 744} {"train_loss": -5.475688934326172, "global_step": 31253, "epoch": 744} {"train_loss": -5.465124607086182, "global_step": 31254, "epoch": 744} {"train_loss": -5.435385227203369, "global_step": 31255, "epoch": 744} {"train_loss": -5.475962162017822, "global_step": 31256, "epoch": 744} {"train_loss": -5.4734039306640625, "global_step": 31257, "epoch": 744} {"train_loss": -5.539063453674316, "global_step": 31258, "epoch": 744} {"train_loss": -5.434174537658691, "global_step": 31259, "epoch": 744} {"train_loss": -5.496595859527588, "global_step": 31260, "epoch": 744} {"train_loss": -5.340561866760254, "global_step": 31261, "epoch": 744} {"train_loss": -5.494835376739502, "global_step": 31262, "epoch": 744} {"train_loss": -5.439514636993408, "global_step": 31263, "epoch": 744} {"train_loss": -5.324857711791992, "global_step": 31264, "epoch": 744} {"train_loss": -5.329739570617676, "global_step": 31265, "epoch": 744} {"train_loss": -5.48021125793457, "global_step": 31266, "epoch": 744} {"train_loss": -5.50050163269043, "global_step": 31267, "epoch": 744} {"train_loss": -5.414974212646484, "global_step": 31268, "epoch": 744} {"train_loss": -5.425491809844971, "global_step": 31269, "epoch": 744} {"train_loss": -5.493978977203369, "global_step": 31270, "epoch": 744} {"train_loss": -5.273087501525879, "global_step": 31271, "epoch": 744} {"train_loss": -5.586945533752441, "global_step": 31272, "epoch": 744} {"train_loss": -5.483111381530762, "global_step": 31273, "epoch": 744} {"train_loss": -5.5068678855896, "global_step": 31274, "epoch": 744} {"train_loss": -5.493520736694336, "global_step": 31275, "epoch": 744} {"train_loss": -5.466704845428467, "global_step": 31276, "epoch": 744} {"train_loss": -5.441301345825195, "global_step": 31277, "epoch": 744} {"train_loss": -5.630577087402344, "global_step": 31278, "epoch": 744} {"train_loss": -5.444509029388428, "global_step": 31279, "epoch": 744} {"train_loss": -5.420750617980957, "global_step": 31280, "epoch": 744} {"train_loss": -5.501330852508545, "global_step": 31281, "epoch": 744} {"train_loss": -5.4569902420043945, "global_step": 31282, "epoch": 744} {"train_loss": -5.523545742034912, "global_step": 31283, "epoch": 744} {"train_loss": -5.505795001983643, "global_step": 31284, "epoch": 744} {"train_loss": -5.553800582885742, "global_step": 31285, "epoch": 744} {"train_loss": -5.4937744140625, "global_step": 31286, "epoch": 744} {"train_loss": -5.472405433654785, "global_step": 31287, "epoch": 744} {"train_loss": -5.584379196166992, "global_step": 31288, "epoch": 744} {"train_loss": -5.475175062815349, "global_step": 31289, "epoch": 744, "val_loss": 67086.78125} {"train_loss": -5.574868202209473, "global_step": 31290, "epoch": 745} {"train_loss": -5.555598258972168, "global_step": 31291, "epoch": 745} {"train_loss": -5.571084976196289, "global_step": 31292, "epoch": 745} {"train_loss": -5.530203819274902, "global_step": 31293, "epoch": 745} {"train_loss": -5.537539482116699, "global_step": 31294, "epoch": 745} {"train_loss": -5.379793167114258, "global_step": 31295, "epoch": 745} {"train_loss": -5.394773006439209, "global_step": 31296, "epoch": 745} {"train_loss": -5.460381507873535, "global_step": 31297, "epoch": 745} {"train_loss": -5.348147869110107, "global_step": 31298, "epoch": 745} {"train_loss": -5.511434555053711, "global_step": 31299, "epoch": 745} {"train_loss": -5.473999977111816, "global_step": 31300, "epoch": 745} {"train_loss": -5.524333953857422, "global_step": 31301, "epoch": 745} {"train_loss": -5.347066879272461, "global_step": 31302, "epoch": 745} {"train_loss": -5.368109226226807, "global_step": 31303, "epoch": 745} {"train_loss": -5.358500957489014, "global_step": 31304, "epoch": 745} {"train_loss": -5.215549945831299, "global_step": 31305, "epoch": 745} {"train_loss": -5.493968963623047, "global_step": 31306, "epoch": 745} {"train_loss": -5.358244895935059, "global_step": 31307, "epoch": 745} {"train_loss": -5.444608688354492, "global_step": 31308, "epoch": 745} {"train_loss": -5.468315124511719, "global_step": 31309, "epoch": 745} {"train_loss": -5.44675350189209, "global_step": 31310, "epoch": 745} {"train_loss": -5.473012924194336, "global_step": 31311, "epoch": 745} {"train_loss": -5.358675479888916, "global_step": 31312, "epoch": 745} {"train_loss": -5.542019844055176, "global_step": 31313, "epoch": 745} {"train_loss": -5.350407600402832, "global_step": 31314, "epoch": 745} {"train_loss": -5.468650817871094, "global_step": 31315, "epoch": 745} {"train_loss": -5.320094108581543, "global_step": 31316, "epoch": 745} {"train_loss": -5.429619789123535, "global_step": 31317, "epoch": 745} {"train_loss": -5.534976959228516, "global_step": 31318, "epoch": 745} {"train_loss": -5.486459732055664, "global_step": 31319, "epoch": 745} {"train_loss": -5.556735038757324, "global_step": 31320, "epoch": 745} {"train_loss": -5.311408042907715, "global_step": 31321, "epoch": 745} {"train_loss": -5.418910503387451, "global_step": 31322, "epoch": 745} {"train_loss": -5.412525177001953, "global_step": 31323, "epoch": 745} {"train_loss": -5.380620002746582, "global_step": 31324, "epoch": 745} {"train_loss": -5.5074615478515625, "global_step": 31325, "epoch": 745} {"train_loss": -5.469078063964844, "global_step": 31326, "epoch": 745} {"train_loss": -5.397855758666992, "global_step": 31327, "epoch": 745} {"train_loss": -5.469645023345947, "global_step": 31328, "epoch": 745} {"train_loss": -5.380389213562012, "global_step": 31329, "epoch": 745} {"train_loss": -5.618232727050781, "global_step": 31330, "epoch": 745} {"train_loss": -5.448001975104923, "global_step": 31331, "epoch": 745, "val_loss": 67224.375} {"train_loss": -5.462352752685547, "global_step": 31332, "epoch": 746} {"train_loss": -5.566856861114502, "global_step": 31333, "epoch": 746} {"train_loss": -5.467716217041016, "global_step": 31334, "epoch": 746} {"train_loss": -5.432733535766602, "global_step": 31335, "epoch": 746} {"train_loss": -5.5127668380737305, "global_step": 31336, "epoch": 746} {"train_loss": -5.449653625488281, "global_step": 31337, "epoch": 746} {"train_loss": -5.536330223083496, "global_step": 31338, "epoch": 746} {"train_loss": -5.540851593017578, "global_step": 31339, "epoch": 746} {"train_loss": -5.488115310668945, "global_step": 31340, "epoch": 746} {"train_loss": -5.51630163192749, "global_step": 31341, "epoch": 746} {"train_loss": -5.4614410400390625, "global_step": 31342, "epoch": 746} {"train_loss": -5.596354961395264, "global_step": 31343, "epoch": 746} {"train_loss": -5.498405456542969, "global_step": 31344, "epoch": 746} {"train_loss": -5.561128616333008, "global_step": 31345, "epoch": 746} {"train_loss": -5.510499954223633, "global_step": 31346, "epoch": 746} {"train_loss": -5.529270172119141, "global_step": 31347, "epoch": 746} {"train_loss": -5.4978837966918945, "global_step": 31348, "epoch": 746} {"train_loss": -5.507813453674316, "global_step": 31349, "epoch": 746} {"train_loss": -5.639072418212891, "global_step": 31350, "epoch": 746} {"train_loss": -5.574291229248047, "global_step": 31351, "epoch": 746} {"train_loss": -5.572079181671143, "global_step": 31352, "epoch": 746} {"train_loss": -5.618349075317383, "global_step": 31353, "epoch": 746} {"train_loss": -5.533695220947266, "global_step": 31354, "epoch": 746} {"train_loss": -5.44766902923584, "global_step": 31355, "epoch": 746} {"train_loss": -5.448687553405762, "global_step": 31356, "epoch": 746} {"train_loss": -5.6405839920043945, "global_step": 31357, "epoch": 746} {"train_loss": -5.3905348777771, "global_step": 31358, "epoch": 746} {"train_loss": -5.581571578979492, "global_step": 31359, "epoch": 746} {"train_loss": -5.517464637756348, "global_step": 31360, "epoch": 746} {"train_loss": -5.482110023498535, "global_step": 31361, "epoch": 746} {"train_loss": -5.48742151260376, "global_step": 31362, "epoch": 746} {"train_loss": -5.534547805786133, "global_step": 31363, "epoch": 746} {"train_loss": -5.4810709953308105, "global_step": 31364, "epoch": 746} {"train_loss": -5.524010181427002, "global_step": 31365, "epoch": 746} {"train_loss": -5.431277275085449, "global_step": 31366, "epoch": 746} {"train_loss": -5.585978031158447, "global_step": 31367, "epoch": 746} {"train_loss": -5.500584602355957, "global_step": 31368, "epoch": 746} {"train_loss": -5.416210174560547, "global_step": 31369, "epoch": 746} {"train_loss": -5.50755500793457, "global_step": 31370, "epoch": 746} {"train_loss": -5.51918888092041, "global_step": 31371, "epoch": 746} {"train_loss": -5.484950065612793, "global_step": 31372, "epoch": 746} {"train_loss": -5.513603857585362, "global_step": 31373, "epoch": 746, "val_loss": 67273.4921875} {"train_loss": -5.482144355773926, "global_step": 31374, "epoch": 747} {"train_loss": -5.409168720245361, "global_step": 31375, "epoch": 747} {"train_loss": -5.429283142089844, "global_step": 31376, "epoch": 747} {"train_loss": -5.469488143920898, "global_step": 31377, "epoch": 747} {"train_loss": -5.509866237640381, "global_step": 31378, "epoch": 747} {"train_loss": -5.489335060119629, "global_step": 31379, "epoch": 747} {"train_loss": -5.495846748352051, "global_step": 31380, "epoch": 747} {"train_loss": -5.453456878662109, "global_step": 31381, "epoch": 747} {"train_loss": -5.498342514038086, "global_step": 31382, "epoch": 747} {"train_loss": -5.505643844604492, "global_step": 31383, "epoch": 747} {"train_loss": -5.495854377746582, "global_step": 31384, "epoch": 747} {"train_loss": -5.467978477478027, "global_step": 31385, "epoch": 747} {"train_loss": -5.348104000091553, "global_step": 31386, "epoch": 747} {"train_loss": -5.526313781738281, "global_step": 31387, "epoch": 747} {"train_loss": -5.525050163269043, "global_step": 31388, "epoch": 747} {"train_loss": -5.645766258239746, "global_step": 31389, "epoch": 747} {"train_loss": -5.616782188415527, "global_step": 31390, "epoch": 747} {"train_loss": -5.529184341430664, "global_step": 31391, "epoch": 747} {"train_loss": -5.535750389099121, "global_step": 31392, "epoch": 747} {"train_loss": -5.601127624511719, "global_step": 31393, "epoch": 747} {"train_loss": -5.529638290405273, "global_step": 31394, "epoch": 747} {"train_loss": -5.483634948730469, "global_step": 31395, "epoch": 747} {"train_loss": -5.515973091125488, "global_step": 31396, "epoch": 747} {"train_loss": -5.534309387207031, "global_step": 31397, "epoch": 747} {"train_loss": -5.5142974853515625, "global_step": 31398, "epoch": 747} {"train_loss": -5.632801055908203, "global_step": 31399, "epoch": 747} {"train_loss": -5.429265022277832, "global_step": 31400, "epoch": 747} {"train_loss": -5.505382537841797, "global_step": 31401, "epoch": 747} {"train_loss": -5.408902645111084, "global_step": 31402, "epoch": 747} {"train_loss": -5.402704238891602, "global_step": 31403, "epoch": 747} {"train_loss": -5.426660060882568, "global_step": 31404, "epoch": 747} {"train_loss": -5.5959320068359375, "global_step": 31405, "epoch": 747} {"train_loss": -5.5738525390625, "global_step": 31406, "epoch": 747} {"train_loss": -5.466585159301758, "global_step": 31407, "epoch": 747} {"train_loss": -5.574206352233887, "global_step": 31408, "epoch": 747} {"train_loss": -5.517393112182617, "global_step": 31409, "epoch": 747} {"train_loss": -5.485235214233398, "global_step": 31410, "epoch": 747} {"train_loss": -5.554381370544434, "global_step": 31411, "epoch": 747} {"train_loss": -5.471916198730469, "global_step": 31412, "epoch": 747} {"train_loss": -5.496404647827148, "global_step": 31413, "epoch": 747} {"train_loss": -5.559452056884766, "global_step": 31414, "epoch": 747} {"train_loss": -5.5044642970675515, "global_step": 31415, "epoch": 747, "val_loss": 66959.5234375} {"train_loss": -5.534553050994873, "global_step": 31416, "epoch": 748} {"train_loss": -5.309193134307861, "global_step": 31417, "epoch": 748} {"train_loss": -5.432850360870361, "global_step": 31418, "epoch": 748} {"train_loss": -5.467386245727539, "global_step": 31419, "epoch": 748} {"train_loss": -5.509549140930176, "global_step": 31420, "epoch": 748} {"train_loss": -5.412275314331055, "global_step": 31421, "epoch": 748} {"train_loss": -5.443722724914551, "global_step": 31422, "epoch": 748} {"train_loss": -5.453274726867676, "global_step": 31423, "epoch": 748} {"train_loss": -5.343618392944336, "global_step": 31424, "epoch": 748} {"train_loss": -5.4549126625061035, "global_step": 31425, "epoch": 748} {"train_loss": -5.309234619140625, "global_step": 31426, "epoch": 748} {"train_loss": -5.624526500701904, "global_step": 31427, "epoch": 748} {"train_loss": -5.543726444244385, "global_step": 31428, "epoch": 748} {"train_loss": -5.36203670501709, "global_step": 31429, "epoch": 748} {"train_loss": -5.594193458557129, "global_step": 31430, "epoch": 748} {"train_loss": -5.528158187866211, "global_step": 31431, "epoch": 748} {"train_loss": -5.573841571807861, "global_step": 31432, "epoch": 748} {"train_loss": -5.495007514953613, "global_step": 31433, "epoch": 748} {"train_loss": -5.444690704345703, "global_step": 31434, "epoch": 748} {"train_loss": -5.564334392547607, "global_step": 31435, "epoch": 748} {"train_loss": -5.359575271606445, "global_step": 31436, "epoch": 748} {"train_loss": -5.509133815765381, "global_step": 31437, "epoch": 748} {"train_loss": -5.5609846115112305, "global_step": 31438, "epoch": 748} {"train_loss": -5.5756683349609375, "global_step": 31439, "epoch": 748} {"train_loss": -5.507861137390137, "global_step": 31440, "epoch": 748} {"train_loss": -5.50241756439209, "global_step": 31441, "epoch": 748} {"train_loss": -5.4173808097839355, "global_step": 31442, "epoch": 748} {"train_loss": -5.506587028503418, "global_step": 31443, "epoch": 748} {"train_loss": -5.503571510314941, "global_step": 31444, "epoch": 748} {"train_loss": -5.466423034667969, "global_step": 31445, "epoch": 748} {"train_loss": -5.488621711730957, "global_step": 31446, "epoch": 748} {"train_loss": -5.501656532287598, "global_step": 31447, "epoch": 748} {"train_loss": -5.545307636260986, "global_step": 31448, "epoch": 748} {"train_loss": -5.452649116516113, "global_step": 31449, "epoch": 748} {"train_loss": -5.431722164154053, "global_step": 31450, "epoch": 748} {"train_loss": -5.543571472167969, "global_step": 31451, "epoch": 748} {"train_loss": -5.579931259155273, "global_step": 31452, "epoch": 748} {"train_loss": -5.59367561340332, "global_step": 31453, "epoch": 748} {"train_loss": -5.495018005371094, "global_step": 31454, "epoch": 748} {"train_loss": -5.45100212097168, "global_step": 31455, "epoch": 748} {"train_loss": -5.5214996337890625, "global_step": 31456, "epoch": 748} {"train_loss": -5.489788225718907, "global_step": 31457, "epoch": 748, "val_loss": 66966.6015625} {"train_loss": -5.4664177894592285, "global_step": 31458, "epoch": 749} {"train_loss": -5.483060359954834, "global_step": 31459, "epoch": 749} {"train_loss": -5.484429359436035, "global_step": 31460, "epoch": 749} {"train_loss": -5.5954999923706055, "global_step": 31461, "epoch": 749} {"train_loss": -5.516315460205078, "global_step": 31462, "epoch": 749} {"train_loss": -5.539433479309082, "global_step": 31463, "epoch": 749} {"train_loss": -5.522740840911865, "global_step": 31464, "epoch": 749} {"train_loss": -5.452537536621094, "global_step": 31465, "epoch": 749} {"train_loss": -5.399710655212402, "global_step": 31466, "epoch": 749} {"train_loss": -5.538227081298828, "global_step": 31467, "epoch": 749} {"train_loss": -5.366240501403809, "global_step": 31468, "epoch": 749} {"train_loss": -5.5485148429870605, "global_step": 31469, "epoch": 749} {"train_loss": -5.507293701171875, "global_step": 31470, "epoch": 749} {"train_loss": -5.541769027709961, "global_step": 31471, "epoch": 749} {"train_loss": -5.556388854980469, "global_step": 31472, "epoch": 749} {"train_loss": -5.539520263671875, "global_step": 31473, "epoch": 749} {"train_loss": -5.59033203125, "global_step": 31474, "epoch": 749} {"train_loss": -5.549764633178711, "global_step": 31475, "epoch": 749} {"train_loss": -5.5582275390625, "global_step": 31476, "epoch": 749} {"train_loss": -5.525713920593262, "global_step": 31477, "epoch": 749} {"train_loss": -5.572896957397461, "global_step": 31478, "epoch": 749} {"train_loss": -5.496877670288086, "global_step": 31479, "epoch": 749} {"train_loss": -5.519916534423828, "global_step": 31480, "epoch": 749} {"train_loss": -5.526524543762207, "global_step": 31481, "epoch": 749} {"train_loss": -5.593260288238525, "global_step": 31482, "epoch": 749} {"train_loss": -5.333386421203613, "global_step": 31483, "epoch": 749} {"train_loss": -5.608798980712891, "global_step": 31484, "epoch": 749} {"train_loss": -5.619801044464111, "global_step": 31485, "epoch": 749} {"train_loss": -5.442500114440918, "global_step": 31486, "epoch": 749} {"train_loss": -5.496694564819336, "global_step": 31487, "epoch": 749} {"train_loss": -5.557762145996094, "global_step": 31488, "epoch": 749} {"train_loss": -5.508227825164795, "global_step": 31489, "epoch": 749} {"train_loss": -5.425580024719238, "global_step": 31490, "epoch": 749} {"train_loss": -5.523702621459961, "global_step": 31491, "epoch": 749} {"train_loss": -5.475291728973389, "global_step": 31492, "epoch": 749} {"train_loss": -5.460477828979492, "global_step": 31493, "epoch": 749} {"train_loss": -5.435904502868652, "global_step": 31494, "epoch": 749} {"train_loss": -5.539941787719727, "global_step": 31495, "epoch": 749} {"train_loss": -5.380256652832031, "global_step": 31496, "epoch": 749} {"train_loss": -5.52095890045166, "global_step": 31497, "epoch": 749} {"train_loss": -5.519717216491699, "global_step": 31498, "epoch": 749} {"train_loss": -5.50739540372576, "global_step": 31499, "epoch": 749, "val_loss": 67041.4375} {"train_loss": -5.490549087524414, "global_step": 31500, "epoch": 750} {"train_loss": -5.577070236206055, "global_step": 31501, "epoch": 750} {"train_loss": -5.530435562133789, "global_step": 31502, "epoch": 750} {"train_loss": -5.41276741027832, "global_step": 31503, "epoch": 750} {"train_loss": -5.587291717529297, "global_step": 31504, "epoch": 750} {"train_loss": -5.51170539855957, "global_step": 31505, "epoch": 750} {"train_loss": -5.53418493270874, "global_step": 31506, "epoch": 750} {"train_loss": -5.5259857177734375, "global_step": 31507, "epoch": 750} {"train_loss": -5.431845188140869, "global_step": 31508, "epoch": 750} {"train_loss": -5.534676551818848, "global_step": 31509, "epoch": 750} {"train_loss": -5.470898628234863, "global_step": 31510, "epoch": 750} {"train_loss": -5.576909065246582, "global_step": 31511, "epoch": 750} {"train_loss": -5.5684332847595215, "global_step": 31512, "epoch": 750} {"train_loss": -5.484502792358398, "global_step": 31513, "epoch": 750} {"train_loss": -5.565741539001465, "global_step": 31514, "epoch": 750} {"train_loss": -5.446249008178711, "global_step": 31515, "epoch": 750} {"train_loss": -5.574031829833984, "global_step": 31516, "epoch": 750} {"train_loss": -5.480808258056641, "global_step": 31517, "epoch": 750} {"train_loss": -5.460906982421875, "global_step": 31518, "epoch": 750} {"train_loss": -5.496883392333984, "global_step": 31519, "epoch": 750} {"train_loss": -5.640250205993652, "global_step": 31520, "epoch": 750} {"train_loss": -5.552840232849121, "global_step": 31521, "epoch": 750} {"train_loss": -5.432126522064209, "global_step": 31522, "epoch": 750} {"train_loss": -5.543872356414795, "global_step": 31523, "epoch": 750} {"train_loss": -5.560484409332275, "global_step": 31524, "epoch": 750} {"train_loss": -5.4929962158203125, "global_step": 31525, "epoch": 750} {"train_loss": -5.455559730529785, "global_step": 31526, "epoch": 750} {"train_loss": -5.601970672607422, "global_step": 31527, "epoch": 750} {"train_loss": -5.64201545715332, "global_step": 31528, "epoch": 750} {"train_loss": -5.4425225257873535, "global_step": 31529, "epoch": 750} {"train_loss": -5.512564659118652, "global_step": 31530, "epoch": 750} {"train_loss": -5.586686134338379, "global_step": 31531, "epoch": 750} {"train_loss": -5.521007061004639, "global_step": 31532, "epoch": 750} {"train_loss": -5.524060249328613, "global_step": 31533, "epoch": 750} {"train_loss": -5.494393348693848, "global_step": 31534, "epoch": 750} {"train_loss": -5.461006164550781, "global_step": 31535, "epoch": 750} {"train_loss": -5.462438583374023, "global_step": 31536, "epoch": 750} {"train_loss": -5.538236618041992, "global_step": 31537, "epoch": 750} {"train_loss": -5.385416030883789, "global_step": 31538, "epoch": 750} {"train_loss": -5.558130264282227, "global_step": 31539, "epoch": 750} {"train_loss": -5.435589790344238, "global_step": 31540, "epoch": 750} {"train_loss": -5.513960054942539, "global_step": 31541, "epoch": 750, "train/sim_max_reward_0": 0.41987990087850746, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.48537381275466773, "train/sim_max_reward_3": 0.1305285004575785, "train/sim_max_reward_4": 0.47489714632161095, "train/sim_max_reward_5": 0.8068053848333013, "test/sim_max_reward_4400000": 0.15641647857671895, "test/sim_max_reward_4400001": 0.512700054458175, "test/sim_max_reward_4400002": 0.2718975777716969, "test/sim_max_reward_4400003": 0.1107507704996224, "test/sim_max_reward_4400004": 0.1993864467625205, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.13321280796125773, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3382343860462125, "test/sim_max_reward_4400009": 0.4818694194296195, "test/sim_max_reward_4400010": 0.30546376870473085, "test/sim_max_reward_4400011": 0.18872160003938612, "test/sim_max_reward_4400012": 0.6464833829793557, "test/sim_max_reward_4400013": 0.5253381049919306, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.29266801089547834, "test/sim_max_reward_4400016": 0.16152033495145543, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.350175144148896, "test/sim_max_reward_4400019": 0.21919637838190992, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.30536591846581485, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.332880346917265, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.25088906558727675, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.024827155636263847, "test/sim_max_reward_4400028": 0.21769183736107978, "test/sim_max_reward_4400029": 0.5299559704280152, "test/sim_max_reward_4400030": 0.3201262381230792, "test/sim_max_reward_4400031": 0.02267480417533296, "test/sim_max_reward_4400032": 0.2362305093753071, "test/sim_max_reward_4400033": 0.1512510993960716, "test/sim_max_reward_4400034": 0.8923355625248598, "test/sim_max_reward_4400035": 0.4723316540667915, "test/sim_max_reward_4400036": 0.3726408676480675, "test/sim_max_reward_4400037": 0.7537882415119599, "test/sim_max_reward_4400038": 0.307333346349161, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6006899141369931, "test/sim_max_reward_4400042": 0.029857454617049275, "test/sim_max_reward_4400043": 0.08667174184744732, "test/sim_max_reward_4400044": 0.02574715646017168, "test/sim_max_reward_4400045": 0.8735788927977949, "test/sim_max_reward_4400046": 0.26417985211786194, "test/sim_max_reward_4400047": 0.238678193778015, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.31864046303086824, "train/mean_score": 0.3863600377445775, "test/mean_score": 0.27241415199546315, "val_loss": 66572.7421875} {"train_loss": -5.600214958190918, "global_step": 31542, "epoch": 751} {"train_loss": -5.465281963348389, "global_step": 31543, "epoch": 751} {"train_loss": -5.519217491149902, "global_step": 31544, "epoch": 751} {"train_loss": -5.448620796203613, "global_step": 31545, "epoch": 751} {"train_loss": -5.433401107788086, "global_step": 31546, "epoch": 751} {"train_loss": -5.590563774108887, "global_step": 31547, "epoch": 751} {"train_loss": -5.520172119140625, "global_step": 31548, "epoch": 751} {"train_loss": -5.382073402404785, "global_step": 31549, "epoch": 751} {"train_loss": -5.595050811767578, "global_step": 31550, "epoch": 751} {"train_loss": -5.547604560852051, "global_step": 31551, "epoch": 751} {"train_loss": -5.333727836608887, "global_step": 31552, "epoch": 751} {"train_loss": -5.5979509353637695, "global_step": 31553, "epoch": 751} {"train_loss": -5.4480438232421875, "global_step": 31554, "epoch": 751} {"train_loss": -5.519567012786865, "global_step": 31555, "epoch": 751} {"train_loss": -5.437867164611816, "global_step": 31556, "epoch": 751} {"train_loss": -5.344449996948242, "global_step": 31557, "epoch": 751} {"train_loss": -5.577109336853027, "global_step": 31558, "epoch": 751} {"train_loss": -5.520289897918701, "global_step": 31559, "epoch": 751} {"train_loss": -5.545368194580078, "global_step": 31560, "epoch": 751} {"train_loss": -5.503010272979736, "global_step": 31561, "epoch": 751} {"train_loss": -5.54904317855835, "global_step": 31562, "epoch": 751} {"train_loss": -5.456337928771973, "global_step": 31563, "epoch": 751} {"train_loss": -5.373565196990967, "global_step": 31564, "epoch": 751} {"train_loss": -5.565127372741699, "global_step": 31565, "epoch": 751} {"train_loss": -5.642333984375, "global_step": 31566, "epoch": 751} {"train_loss": -5.530121803283691, "global_step": 31567, "epoch": 751} {"train_loss": -5.579623222351074, "global_step": 31568, "epoch": 751} {"train_loss": -5.393558502197266, "global_step": 31569, "epoch": 751} {"train_loss": -5.6666717529296875, "global_step": 31570, "epoch": 751} {"train_loss": -5.460186958312988, "global_step": 31571, "epoch": 751} {"train_loss": -5.4656081199646, "global_step": 31572, "epoch": 751} {"train_loss": -5.56311559677124, "global_step": 31573, "epoch": 751} {"train_loss": -5.541201591491699, "global_step": 31574, "epoch": 751} {"train_loss": -5.423521995544434, "global_step": 31575, "epoch": 751} {"train_loss": -5.54335880279541, "global_step": 31576, "epoch": 751} {"train_loss": -5.6282572746276855, "global_step": 31577, "epoch": 751} {"train_loss": -5.551743507385254, "global_step": 31578, "epoch": 751} {"train_loss": -5.536611557006836, "global_step": 31579, "epoch": 751} {"train_loss": -5.486786365509033, "global_step": 31580, "epoch": 751} {"train_loss": -5.503972053527832, "global_step": 31581, "epoch": 751} {"train_loss": -5.569957733154297, "global_step": 31582, "epoch": 751} {"train_loss": -5.514183010373797, "global_step": 31583, "epoch": 751, "val_loss": 66585.125} {"train_loss": -5.600491523742676, "global_step": 31584, "epoch": 752} {"train_loss": -5.536302089691162, "global_step": 31585, "epoch": 752} {"train_loss": -5.4648332595825195, "global_step": 31586, "epoch": 752} {"train_loss": -5.54380989074707, "global_step": 31587, "epoch": 752} {"train_loss": -5.397678375244141, "global_step": 31588, "epoch": 752} {"train_loss": -5.463063716888428, "global_step": 31589, "epoch": 752} {"train_loss": -5.512279510498047, "global_step": 31590, "epoch": 752} {"train_loss": -5.504493713378906, "global_step": 31591, "epoch": 752} {"train_loss": -5.521078109741211, "global_step": 31592, "epoch": 752} {"train_loss": -5.611349582672119, "global_step": 31593, "epoch": 752} {"train_loss": -5.492851257324219, "global_step": 31594, "epoch": 752} {"train_loss": -5.502495765686035, "global_step": 31595, "epoch": 752} {"train_loss": -5.548532485961914, "global_step": 31596, "epoch": 752} {"train_loss": -5.576239585876465, "global_step": 31597, "epoch": 752} {"train_loss": -5.417654514312744, "global_step": 31598, "epoch": 752} {"train_loss": -5.469942092895508, "global_step": 31599, "epoch": 752} {"train_loss": -5.534550189971924, "global_step": 31600, "epoch": 752} {"train_loss": -5.4904279708862305, "global_step": 31601, "epoch": 752} {"train_loss": -5.53166389465332, "global_step": 31602, "epoch": 752} {"train_loss": -5.508720874786377, "global_step": 31603, "epoch": 752} {"train_loss": -5.570828914642334, "global_step": 31604, "epoch": 752} {"train_loss": -5.4299774169921875, "global_step": 31605, "epoch": 752} {"train_loss": -5.474908351898193, "global_step": 31606, "epoch": 752} {"train_loss": -5.555202484130859, "global_step": 31607, "epoch": 752} {"train_loss": -5.559694290161133, "global_step": 31608, "epoch": 752} {"train_loss": -5.513160705566406, "global_step": 31609, "epoch": 752} {"train_loss": -5.56561279296875, "global_step": 31610, "epoch": 752} {"train_loss": -5.539363384246826, "global_step": 31611, "epoch": 752} {"train_loss": -5.547430038452148, "global_step": 31612, "epoch": 752} {"train_loss": -5.439053535461426, "global_step": 31613, "epoch": 752} {"train_loss": -5.454137802124023, "global_step": 31614, "epoch": 752} {"train_loss": -5.572372913360596, "global_step": 31615, "epoch": 752} {"train_loss": -5.63637638092041, "global_step": 31616, "epoch": 752} {"train_loss": -5.537274360656738, "global_step": 31617, "epoch": 752} {"train_loss": -5.445806503295898, "global_step": 31618, "epoch": 752} {"train_loss": -5.423656463623047, "global_step": 31619, "epoch": 752} {"train_loss": -5.387395858764648, "global_step": 31620, "epoch": 752} {"train_loss": -5.536014080047607, "global_step": 31621, "epoch": 752} {"train_loss": -5.418976783752441, "global_step": 31622, "epoch": 752} {"train_loss": -5.548007965087891, "global_step": 31623, "epoch": 752} {"train_loss": -5.4966511726379395, "global_step": 31624, "epoch": 752} {"train_loss": -5.508972088495891, "global_step": 31625, "epoch": 752, "val_loss": 66918.0546875} {"train_loss": -5.537130355834961, "global_step": 31626, "epoch": 753} {"train_loss": -5.537336349487305, "global_step": 31627, "epoch": 753} {"train_loss": -5.472543716430664, "global_step": 31628, "epoch": 753} {"train_loss": -5.578310966491699, "global_step": 31629, "epoch": 753} {"train_loss": -5.352232933044434, "global_step": 31630, "epoch": 753} {"train_loss": -5.4488372802734375, "global_step": 31631, "epoch": 753} {"train_loss": -5.6421613693237305, "global_step": 31632, "epoch": 753} {"train_loss": -5.46232795715332, "global_step": 31633, "epoch": 753} {"train_loss": -5.537961483001709, "global_step": 31634, "epoch": 753} {"train_loss": -5.410314083099365, "global_step": 31635, "epoch": 753} {"train_loss": -5.597204208374023, "global_step": 31636, "epoch": 753} {"train_loss": -5.337996482849121, "global_step": 31637, "epoch": 753} {"train_loss": -5.40831184387207, "global_step": 31638, "epoch": 753} {"train_loss": -5.314634323120117, "global_step": 31639, "epoch": 753} {"train_loss": -5.500845909118652, "global_step": 31640, "epoch": 753} {"train_loss": -5.466052055358887, "global_step": 31641, "epoch": 753} {"train_loss": -5.547435760498047, "global_step": 31642, "epoch": 753} {"train_loss": -5.501547813415527, "global_step": 31643, "epoch": 753} {"train_loss": -5.544971942901611, "global_step": 31644, "epoch": 753} {"train_loss": -5.521661758422852, "global_step": 31645, "epoch": 753} {"train_loss": -5.55806827545166, "global_step": 31646, "epoch": 753} {"train_loss": -5.531092166900635, "global_step": 31647, "epoch": 753} {"train_loss": -5.429464340209961, "global_step": 31648, "epoch": 753} {"train_loss": -5.471232891082764, "global_step": 31649, "epoch": 753} {"train_loss": -5.7004194259643555, "global_step": 31650, "epoch": 753} {"train_loss": -5.5599212646484375, "global_step": 31651, "epoch": 753} {"train_loss": -5.430480003356934, "global_step": 31652, "epoch": 753} {"train_loss": -5.477573394775391, "global_step": 31653, "epoch": 753} {"train_loss": -5.433477401733398, "global_step": 31654, "epoch": 753} {"train_loss": -5.581145286560059, "global_step": 31655, "epoch": 753} {"train_loss": -5.435723304748535, "global_step": 31656, "epoch": 753} {"train_loss": -5.576668739318848, "global_step": 31657, "epoch": 753} {"train_loss": -5.520867347717285, "global_step": 31658, "epoch": 753} {"train_loss": -5.520578861236572, "global_step": 31659, "epoch": 753} {"train_loss": -5.463281631469727, "global_step": 31660, "epoch": 753} {"train_loss": -5.533170700073242, "global_step": 31661, "epoch": 753} {"train_loss": -5.421843528747559, "global_step": 31662, "epoch": 753} {"train_loss": -5.409835338592529, "global_step": 31663, "epoch": 753} {"train_loss": -5.568349838256836, "global_step": 31664, "epoch": 753} {"train_loss": -5.47585391998291, "global_step": 31665, "epoch": 753} {"train_loss": -5.523928642272949, "global_step": 31666, "epoch": 753} {"train_loss": -5.49550705864316, "global_step": 31667, "epoch": 753, "val_loss": 66843.4375} {"train_loss": -5.3687334060668945, "global_step": 31668, "epoch": 754} {"train_loss": -5.64311408996582, "global_step": 31669, "epoch": 754} {"train_loss": -5.405746936798096, "global_step": 31670, "epoch": 754} {"train_loss": -5.480957508087158, "global_step": 31671, "epoch": 754} {"train_loss": -5.470615386962891, "global_step": 31672, "epoch": 754} {"train_loss": -5.45232629776001, "global_step": 31673, "epoch": 754} {"train_loss": -5.542169570922852, "global_step": 31674, "epoch": 754} {"train_loss": -5.530075550079346, "global_step": 31675, "epoch": 754} {"train_loss": -5.488661766052246, "global_step": 31676, "epoch": 754} {"train_loss": -5.463860034942627, "global_step": 31677, "epoch": 754} {"train_loss": -5.506631374359131, "global_step": 31678, "epoch": 754} {"train_loss": -5.6057448387146, "global_step": 31679, "epoch": 754} {"train_loss": -5.455394268035889, "global_step": 31680, "epoch": 754} {"train_loss": -5.516484260559082, "global_step": 31681, "epoch": 754} {"train_loss": -5.591231822967529, "global_step": 31682, "epoch": 754} {"train_loss": -5.549901008605957, "global_step": 31683, "epoch": 754} {"train_loss": -5.561605930328369, "global_step": 31684, "epoch": 754} {"train_loss": -5.524274826049805, "global_step": 31685, "epoch": 754} {"train_loss": -5.50540828704834, "global_step": 31686, "epoch": 754} {"train_loss": -5.540215492248535, "global_step": 31687, "epoch": 754} {"train_loss": -5.563836097717285, "global_step": 31688, "epoch": 754} {"train_loss": -5.3901777267456055, "global_step": 31689, "epoch": 754} {"train_loss": -5.319707870483398, "global_step": 31690, "epoch": 754} {"train_loss": -5.462233543395996, "global_step": 31691, "epoch": 754} {"train_loss": -5.4609375, "global_step": 31692, "epoch": 754} {"train_loss": -5.4544677734375, "global_step": 31693, "epoch": 754} {"train_loss": -5.463605880737305, "global_step": 31694, "epoch": 754} {"train_loss": -5.626197814941406, "global_step": 31695, "epoch": 754} {"train_loss": -5.547671318054199, "global_step": 31696, "epoch": 754} {"train_loss": -5.500180721282959, "global_step": 31697, "epoch": 754} {"train_loss": -5.429931163787842, "global_step": 31698, "epoch": 754} {"train_loss": -5.5406270027160645, "global_step": 31699, "epoch": 754} {"train_loss": -5.428615570068359, "global_step": 31700, "epoch": 754} {"train_loss": -5.563514709472656, "global_step": 31701, "epoch": 754} {"train_loss": -5.558347225189209, "global_step": 31702, "epoch": 754} {"train_loss": -5.328954696655273, "global_step": 31703, "epoch": 754} {"train_loss": -5.612668991088867, "global_step": 31704, "epoch": 754} {"train_loss": -5.5038557052612305, "global_step": 31705, "epoch": 754} {"train_loss": -5.633421897888184, "global_step": 31706, "epoch": 754} {"train_loss": -5.545772552490234, "global_step": 31707, "epoch": 754} {"train_loss": -5.425615310668945, "global_step": 31708, "epoch": 754} {"train_loss": -5.500764744622367, "global_step": 31709, "epoch": 754, "val_loss": 66707.921875} {"train_loss": -5.4817728996276855, "global_step": 31710, "epoch": 755} {"train_loss": -5.21713399887085, "global_step": 31711, "epoch": 755} {"train_loss": -5.593339443206787, "global_step": 31712, "epoch": 755} {"train_loss": -5.619913101196289, "global_step": 31713, "epoch": 755} {"train_loss": -5.382937431335449, "global_step": 31714, "epoch": 755} {"train_loss": -5.4918012619018555, "global_step": 31715, "epoch": 755} {"train_loss": -5.4924468994140625, "global_step": 31716, "epoch": 755} {"train_loss": -5.528629302978516, "global_step": 31717, "epoch": 755} {"train_loss": -5.3131256103515625, "global_step": 31718, "epoch": 755} {"train_loss": -5.309202194213867, "global_step": 31719, "epoch": 755} {"train_loss": -5.532474040985107, "global_step": 31720, "epoch": 755} {"train_loss": -5.280884742736816, "global_step": 31721, "epoch": 755} {"train_loss": -5.541670799255371, "global_step": 31722, "epoch": 755} {"train_loss": -5.518426418304443, "global_step": 31723, "epoch": 755} {"train_loss": -5.362481594085693, "global_step": 31724, "epoch": 755} {"train_loss": -5.4588704109191895, "global_step": 31725, "epoch": 755} {"train_loss": -5.390102386474609, "global_step": 31726, "epoch": 755} {"train_loss": -5.477933883666992, "global_step": 31727, "epoch": 755} {"train_loss": -5.474429130554199, "global_step": 31728, "epoch": 755} {"train_loss": -5.550670146942139, "global_step": 31729, "epoch": 755} {"train_loss": -5.613668441772461, "global_step": 31730, "epoch": 755} {"train_loss": -5.500180721282959, "global_step": 31731, "epoch": 755} {"train_loss": -5.375469207763672, "global_step": 31732, "epoch": 755} {"train_loss": -5.529389381408691, "global_step": 31733, "epoch": 755} {"train_loss": -5.628565788269043, "global_step": 31734, "epoch": 755} {"train_loss": -5.430222988128662, "global_step": 31735, "epoch": 755} {"train_loss": -5.386606216430664, "global_step": 31736, "epoch": 755} {"train_loss": -5.622541904449463, "global_step": 31737, "epoch": 755} {"train_loss": -5.437664985656738, "global_step": 31738, "epoch": 755} {"train_loss": -5.496309280395508, "global_step": 31739, "epoch": 755} {"train_loss": -5.606836318969727, "global_step": 31740, "epoch": 755} {"train_loss": -5.435606956481934, "global_step": 31741, "epoch": 755} {"train_loss": -5.245579719543457, "global_step": 31742, "epoch": 755} {"train_loss": -5.526047706604004, "global_step": 31743, "epoch": 755} {"train_loss": -5.474712371826172, "global_step": 31744, "epoch": 755} {"train_loss": -5.385252952575684, "global_step": 31745, "epoch": 755} {"train_loss": -5.54817533493042, "global_step": 31746, "epoch": 755} {"train_loss": -5.477986812591553, "global_step": 31747, "epoch": 755} {"train_loss": -5.507771015167236, "global_step": 31748, "epoch": 755} {"train_loss": -5.390040397644043, "global_step": 31749, "epoch": 755} {"train_loss": -5.583593368530273, "global_step": 31750, "epoch": 755} {"train_loss": -5.465004410062518, "global_step": 31751, "epoch": 755, "val_loss": 66448.1015625} {"train_loss": -5.419430732727051, "global_step": 31752, "epoch": 756} {"train_loss": -5.446662425994873, "global_step": 31753, "epoch": 756} {"train_loss": -5.451684951782227, "global_step": 31754, "epoch": 756} {"train_loss": -5.594383716583252, "global_step": 31755, "epoch": 756} {"train_loss": -5.456912994384766, "global_step": 31756, "epoch": 756} {"train_loss": -5.459603786468506, "global_step": 31757, "epoch": 756} {"train_loss": -5.543342113494873, "global_step": 31758, "epoch": 756} {"train_loss": -5.438294410705566, "global_step": 31759, "epoch": 756} {"train_loss": -5.572026252746582, "global_step": 31760, "epoch": 756} {"train_loss": -5.493285179138184, "global_step": 31761, "epoch": 756} {"train_loss": -5.407576560974121, "global_step": 31762, "epoch": 756} {"train_loss": -5.518429279327393, "global_step": 31763, "epoch": 756} {"train_loss": -5.41070556640625, "global_step": 31764, "epoch": 756} {"train_loss": -5.5142822265625, "global_step": 31765, "epoch": 756} {"train_loss": -5.61307430267334, "global_step": 31766, "epoch": 756} {"train_loss": -5.450250625610352, "global_step": 31767, "epoch": 756} {"train_loss": -5.6366047859191895, "global_step": 31768, "epoch": 756} {"train_loss": -5.503730773925781, "global_step": 31769, "epoch": 756} {"train_loss": -5.635062217712402, "global_step": 31770, "epoch": 756} {"train_loss": -5.614548683166504, "global_step": 31771, "epoch": 756} {"train_loss": -5.468945503234863, "global_step": 31772, "epoch": 756} {"train_loss": -5.584589958190918, "global_step": 31773, "epoch": 756} {"train_loss": -5.504016876220703, "global_step": 31774, "epoch": 756} {"train_loss": -5.436842441558838, "global_step": 31775, "epoch": 756} {"train_loss": -5.466721534729004, "global_step": 31776, "epoch": 756} {"train_loss": -5.437725067138672, "global_step": 31777, "epoch": 756} {"train_loss": -5.578896522521973, "global_step": 31778, "epoch": 756} {"train_loss": -5.481818675994873, "global_step": 31779, "epoch": 756} {"train_loss": -5.497085094451904, "global_step": 31780, "epoch": 756} {"train_loss": -5.5367817878723145, "global_step": 31781, "epoch": 756} {"train_loss": -5.570202827453613, "global_step": 31782, "epoch": 756} {"train_loss": -5.546896934509277, "global_step": 31783, "epoch": 756} {"train_loss": -5.459965705871582, "global_step": 31784, "epoch": 756} {"train_loss": -5.491698741912842, "global_step": 31785, "epoch": 756} {"train_loss": -5.52635383605957, "global_step": 31786, "epoch": 756} {"train_loss": -5.475291728973389, "global_step": 31787, "epoch": 756} {"train_loss": -5.386430740356445, "global_step": 31788, "epoch": 756} {"train_loss": -5.540557384490967, "global_step": 31789, "epoch": 756} {"train_loss": -5.576510429382324, "global_step": 31790, "epoch": 756} {"train_loss": -5.624253273010254, "global_step": 31791, "epoch": 756} {"train_loss": -5.5316691398620605, "global_step": 31792, "epoch": 756} {"train_loss": -5.508050725573585, "global_step": 31793, "epoch": 756, "val_loss": 67376.71875} {"train_loss": -5.497939109802246, "global_step": 31794, "epoch": 757} {"train_loss": -5.4067230224609375, "global_step": 31795, "epoch": 757} {"train_loss": -5.539584159851074, "global_step": 31796, "epoch": 757} {"train_loss": -5.381258964538574, "global_step": 31797, "epoch": 757} {"train_loss": -5.542491912841797, "global_step": 31798, "epoch": 757} {"train_loss": -5.4381608963012695, "global_step": 31799, "epoch": 757} {"train_loss": -5.4397969245910645, "global_step": 31800, "epoch": 757} {"train_loss": -5.606497287750244, "global_step": 31801, "epoch": 757} {"train_loss": -5.541032791137695, "global_step": 31802, "epoch": 757} {"train_loss": -5.474674701690674, "global_step": 31803, "epoch": 757} {"train_loss": -5.43836784362793, "global_step": 31804, "epoch": 757} {"train_loss": -5.441586494445801, "global_step": 31805, "epoch": 757} {"train_loss": -5.4887471199035645, "global_step": 31806, "epoch": 757} {"train_loss": -5.475922584533691, "global_step": 31807, "epoch": 757} {"train_loss": -5.400278091430664, "global_step": 31808, "epoch": 757} {"train_loss": -5.499233722686768, "global_step": 31809, "epoch": 757} {"train_loss": -5.459568500518799, "global_step": 31810, "epoch": 757} {"train_loss": -5.544498920440674, "global_step": 31811, "epoch": 757} {"train_loss": -5.41342830657959, "global_step": 31812, "epoch": 757} {"train_loss": -5.418990612030029, "global_step": 31813, "epoch": 757} {"train_loss": -5.621934413909912, "global_step": 31814, "epoch": 757} {"train_loss": -5.493932723999023, "global_step": 31815, "epoch": 757} {"train_loss": -5.6128644943237305, "global_step": 31816, "epoch": 757} {"train_loss": -5.5139031410217285, "global_step": 31817, "epoch": 757} {"train_loss": -5.5460286140441895, "global_step": 31818, "epoch": 757} {"train_loss": -5.419032096862793, "global_step": 31819, "epoch": 757} {"train_loss": -5.458266258239746, "global_step": 31820, "epoch": 757} {"train_loss": -5.338825225830078, "global_step": 31821, "epoch": 757} {"train_loss": -5.440297603607178, "global_step": 31822, "epoch": 757} {"train_loss": -5.473697662353516, "global_step": 31823, "epoch": 757} {"train_loss": -5.636573791503906, "global_step": 31824, "epoch": 757} {"train_loss": -5.488795280456543, "global_step": 31825, "epoch": 757} {"train_loss": -5.378965854644775, "global_step": 31826, "epoch": 757} {"train_loss": -5.526435852050781, "global_step": 31827, "epoch": 757} {"train_loss": -5.349956035614014, "global_step": 31828, "epoch": 757} {"train_loss": -5.577386379241943, "global_step": 31829, "epoch": 757} {"train_loss": -5.305781364440918, "global_step": 31830, "epoch": 757} {"train_loss": -5.445721626281738, "global_step": 31831, "epoch": 757} {"train_loss": -5.5689167976379395, "global_step": 31832, "epoch": 757} {"train_loss": -5.3566694259643555, "global_step": 31833, "epoch": 757} {"train_loss": -5.431737422943115, "global_step": 31834, "epoch": 757} {"train_loss": -5.475109951836722, "global_step": 31835, "epoch": 757, "val_loss": 66604.1953125} {"train_loss": -5.435525417327881, "global_step": 31836, "epoch": 758} {"train_loss": -5.437772274017334, "global_step": 31837, "epoch": 758} {"train_loss": -5.53994083404541, "global_step": 31838, "epoch": 758} {"train_loss": -5.449496269226074, "global_step": 31839, "epoch": 758} {"train_loss": -5.496929168701172, "global_step": 31840, "epoch": 758} {"train_loss": -5.582925319671631, "global_step": 31841, "epoch": 758} {"train_loss": -5.61852502822876, "global_step": 31842, "epoch": 758} {"train_loss": -5.516578197479248, "global_step": 31843, "epoch": 758} {"train_loss": -5.607525825500488, "global_step": 31844, "epoch": 758} {"train_loss": -5.5951008796691895, "global_step": 31845, "epoch": 758} {"train_loss": -5.48325252532959, "global_step": 31846, "epoch": 758} {"train_loss": -5.611232757568359, "global_step": 31847, "epoch": 758} {"train_loss": -5.492420196533203, "global_step": 31848, "epoch": 758} {"train_loss": -5.57271671295166, "global_step": 31849, "epoch": 758} {"train_loss": -5.504655838012695, "global_step": 31850, "epoch": 758} {"train_loss": -5.484725475311279, "global_step": 31851, "epoch": 758} {"train_loss": -5.449845314025879, "global_step": 31852, "epoch": 758} {"train_loss": -5.410505294799805, "global_step": 31853, "epoch": 758} {"train_loss": -5.257429122924805, "global_step": 31854, "epoch": 758} {"train_loss": -5.4342522621154785, "global_step": 31855, "epoch": 758} {"train_loss": -5.553993225097656, "global_step": 31856, "epoch": 758} {"train_loss": -5.422710418701172, "global_step": 31857, "epoch": 758} {"train_loss": -5.548985481262207, "global_step": 31858, "epoch": 758} {"train_loss": -5.492782115936279, "global_step": 31859, "epoch": 758} {"train_loss": -5.451904296875, "global_step": 31860, "epoch": 758} {"train_loss": -5.420300483703613, "global_step": 31861, "epoch": 758} {"train_loss": -5.472831726074219, "global_step": 31862, "epoch": 758} {"train_loss": -5.580226898193359, "global_step": 31863, "epoch": 758} {"train_loss": -5.556329250335693, "global_step": 31864, "epoch": 758} {"train_loss": -5.3839192390441895, "global_step": 31865, "epoch": 758} {"train_loss": -5.554837226867676, "global_step": 31866, "epoch": 758} {"train_loss": -5.579345226287842, "global_step": 31867, "epoch": 758} {"train_loss": -5.4884490966796875, "global_step": 31868, "epoch": 758} {"train_loss": -5.472965717315674, "global_step": 31869, "epoch": 758} {"train_loss": -5.654294013977051, "global_step": 31870, "epoch": 758} {"train_loss": -5.499895095825195, "global_step": 31871, "epoch": 758} {"train_loss": -5.387250900268555, "global_step": 31872, "epoch": 758} {"train_loss": -5.573489189147949, "global_step": 31873, "epoch": 758} {"train_loss": -5.567654132843018, "global_step": 31874, "epoch": 758} {"train_loss": -5.33713436126709, "global_step": 31875, "epoch": 758} {"train_loss": -5.552210807800293, "global_step": 31876, "epoch": 758} {"train_loss": -5.499532540639241, "global_step": 31877, "epoch": 758, "val_loss": 67326.5078125} {"train_loss": -5.489527702331543, "global_step": 31878, "epoch": 759} {"train_loss": -5.561860084533691, "global_step": 31879, "epoch": 759} {"train_loss": -5.554838180541992, "global_step": 31880, "epoch": 759} {"train_loss": -5.38034200668335, "global_step": 31881, "epoch": 759} {"train_loss": -5.471837043762207, "global_step": 31882, "epoch": 759} {"train_loss": -5.53959321975708, "global_step": 31883, "epoch": 759} {"train_loss": -5.534547805786133, "global_step": 31884, "epoch": 759} {"train_loss": -5.462328910827637, "global_step": 31885, "epoch": 759} {"train_loss": -5.520481109619141, "global_step": 31886, "epoch": 759} {"train_loss": -5.556792259216309, "global_step": 31887, "epoch": 759} {"train_loss": -5.503873825073242, "global_step": 31888, "epoch": 759} {"train_loss": -5.599081993103027, "global_step": 31889, "epoch": 759} {"train_loss": -5.503403663635254, "global_step": 31890, "epoch": 759} {"train_loss": -5.598492622375488, "global_step": 31891, "epoch": 759} {"train_loss": -5.46120023727417, "global_step": 31892, "epoch": 759} {"train_loss": -5.507570266723633, "global_step": 31893, "epoch": 759} {"train_loss": -5.43397331237793, "global_step": 31894, "epoch": 759} {"train_loss": -5.544254779815674, "global_step": 31895, "epoch": 759} {"train_loss": -5.513803482055664, "global_step": 31896, "epoch": 759} {"train_loss": -5.473348617553711, "global_step": 31897, "epoch": 759} {"train_loss": -5.6874284744262695, "global_step": 31898, "epoch": 759} {"train_loss": -5.472358703613281, "global_step": 31899, "epoch": 759} {"train_loss": -5.4887003898620605, "global_step": 31900, "epoch": 759} {"train_loss": -5.591001033782959, "global_step": 31901, "epoch": 759} {"train_loss": -5.37524938583374, "global_step": 31902, "epoch": 759} {"train_loss": -5.586897850036621, "global_step": 31903, "epoch": 759} {"train_loss": -5.439718723297119, "global_step": 31904, "epoch": 759} {"train_loss": -5.580431938171387, "global_step": 31905, "epoch": 759} {"train_loss": -5.672475814819336, "global_step": 31906, "epoch": 759} {"train_loss": -5.424236297607422, "global_step": 31907, "epoch": 759} {"train_loss": -5.4043779373168945, "global_step": 31908, "epoch": 759} {"train_loss": -5.470751762390137, "global_step": 31909, "epoch": 759} {"train_loss": -5.514023303985596, "global_step": 31910, "epoch": 759} {"train_loss": -5.370199680328369, "global_step": 31911, "epoch": 759} {"train_loss": -5.625463008880615, "global_step": 31912, "epoch": 759} {"train_loss": -5.599309921264648, "global_step": 31913, "epoch": 759} {"train_loss": -5.466588973999023, "global_step": 31914, "epoch": 759} {"train_loss": -5.539762496948242, "global_step": 31915, "epoch": 759} {"train_loss": -5.693119525909424, "global_step": 31916, "epoch": 759} {"train_loss": -5.564079761505127, "global_step": 31917, "epoch": 759} {"train_loss": -5.576048374176025, "global_step": 31918, "epoch": 759} {"train_loss": -5.522659279051281, "global_step": 31919, "epoch": 759, "val_loss": 66774.9921875} {"train_loss": -5.394249439239502, "global_step": 31920, "epoch": 760} {"train_loss": -5.563526153564453, "global_step": 31921, "epoch": 760} {"train_loss": -5.4924540519714355, "global_step": 31922, "epoch": 760} {"train_loss": -5.471158027648926, "global_step": 31923, "epoch": 760} {"train_loss": -5.4923200607299805, "global_step": 31924, "epoch": 760} {"train_loss": -5.563349723815918, "global_step": 31925, "epoch": 760} {"train_loss": -5.543001174926758, "global_step": 31926, "epoch": 760} {"train_loss": -5.507989883422852, "global_step": 31927, "epoch": 760} {"train_loss": -5.544390678405762, "global_step": 31928, "epoch": 760} {"train_loss": -5.487400054931641, "global_step": 31929, "epoch": 760} {"train_loss": -5.484828948974609, "global_step": 31930, "epoch": 760} {"train_loss": -5.455610275268555, "global_step": 31931, "epoch": 760} {"train_loss": -5.426554203033447, "global_step": 31932, "epoch": 760} {"train_loss": -5.566495895385742, "global_step": 31933, "epoch": 760} {"train_loss": -5.360561370849609, "global_step": 31934, "epoch": 760} {"train_loss": -5.575621604919434, "global_step": 31935, "epoch": 760} {"train_loss": -5.489537239074707, "global_step": 31936, "epoch": 760} {"train_loss": -5.4241180419921875, "global_step": 31937, "epoch": 760} {"train_loss": -5.558294296264648, "global_step": 31938, "epoch": 760} {"train_loss": -5.411166667938232, "global_step": 31939, "epoch": 760} {"train_loss": -5.6204633712768555, "global_step": 31940, "epoch": 760} {"train_loss": -5.348246097564697, "global_step": 31941, "epoch": 760} {"train_loss": -5.576385498046875, "global_step": 31942, "epoch": 760} {"train_loss": -5.595617294311523, "global_step": 31943, "epoch": 760} {"train_loss": -5.459043025970459, "global_step": 31944, "epoch": 760} {"train_loss": -5.670596122741699, "global_step": 31945, "epoch": 760} {"train_loss": -5.626060962677002, "global_step": 31946, "epoch": 760} {"train_loss": -5.554996013641357, "global_step": 31947, "epoch": 760} {"train_loss": -5.517196178436279, "global_step": 31948, "epoch": 760} {"train_loss": -5.49965763092041, "global_step": 31949, "epoch": 760} {"train_loss": -5.488100051879883, "global_step": 31950, "epoch": 760} {"train_loss": -5.607694149017334, "global_step": 31951, "epoch": 760} {"train_loss": -5.351806640625, "global_step": 31952, "epoch": 760} {"train_loss": -5.543545722961426, "global_step": 31953, "epoch": 760} {"train_loss": -5.4794697761535645, "global_step": 31954, "epoch": 760} {"train_loss": -5.416285514831543, "global_step": 31955, "epoch": 760} {"train_loss": -5.483022689819336, "global_step": 31956, "epoch": 760} {"train_loss": -5.56423282623291, "global_step": 31957, "epoch": 760} {"train_loss": -5.616946697235107, "global_step": 31958, "epoch": 760} {"train_loss": -5.373250961303711, "global_step": 31959, "epoch": 760} {"train_loss": -5.434392929077148, "global_step": 31960, "epoch": 760} {"train_loss": -5.506227504639399, "global_step": 31961, "epoch": 760, "val_loss": 66671.375} {"train_loss": -5.414785861968994, "global_step": 31962, "epoch": 761} {"train_loss": -5.508520126342773, "global_step": 31963, "epoch": 761} {"train_loss": -5.498414993286133, "global_step": 31964, "epoch": 761} {"train_loss": -5.465378761291504, "global_step": 31965, "epoch": 761} {"train_loss": -5.413052082061768, "global_step": 31966, "epoch": 761} {"train_loss": -5.545422077178955, "global_step": 31967, "epoch": 761} {"train_loss": -5.472879409790039, "global_step": 31968, "epoch": 761} {"train_loss": -5.507347106933594, "global_step": 31969, "epoch": 761} {"train_loss": -5.479440212249756, "global_step": 31970, "epoch": 761} {"train_loss": -5.447737693786621, "global_step": 31971, "epoch": 761} {"train_loss": -5.516095161437988, "global_step": 31972, "epoch": 761} {"train_loss": -5.558780193328857, "global_step": 31973, "epoch": 761} {"train_loss": -5.460862636566162, "global_step": 31974, "epoch": 761} {"train_loss": -5.452300548553467, "global_step": 31975, "epoch": 761} {"train_loss": -5.575479984283447, "global_step": 31976, "epoch": 761} {"train_loss": -5.472037315368652, "global_step": 31977, "epoch": 761} {"train_loss": -5.497348785400391, "global_step": 31978, "epoch": 761} {"train_loss": -5.448549747467041, "global_step": 31979, "epoch": 761} {"train_loss": -5.497211456298828, "global_step": 31980, "epoch": 761} {"train_loss": -5.53409481048584, "global_step": 31981, "epoch": 761} {"train_loss": -5.516188621520996, "global_step": 31982, "epoch": 761} {"train_loss": -5.377819061279297, "global_step": 31983, "epoch": 761} {"train_loss": -5.564122676849365, "global_step": 31984, "epoch": 761} {"train_loss": -5.674739837646484, "global_step": 31985, "epoch": 761} {"train_loss": -5.427550315856934, "global_step": 31986, "epoch": 761} {"train_loss": -5.50797176361084, "global_step": 31987, "epoch": 761} {"train_loss": -5.567553520202637, "global_step": 31988, "epoch": 761} {"train_loss": -5.5421247482299805, "global_step": 31989, "epoch": 761} {"train_loss": -5.492990493774414, "global_step": 31990, "epoch": 761} {"train_loss": -5.479616165161133, "global_step": 31991, "epoch": 761} {"train_loss": -5.52579927444458, "global_step": 31992, "epoch": 761} {"train_loss": -5.50022554397583, "global_step": 31993, "epoch": 761} {"train_loss": -5.435922622680664, "global_step": 31994, "epoch": 761} {"train_loss": -5.4662065505981445, "global_step": 31995, "epoch": 761} {"train_loss": -5.575653076171875, "global_step": 31996, "epoch": 761} {"train_loss": -5.49062442779541, "global_step": 31997, "epoch": 761} {"train_loss": -5.430882930755615, "global_step": 31998, "epoch": 761} {"train_loss": -5.408821105957031, "global_step": 31999, "epoch": 761} {"train_loss": -5.544936180114746, "global_step": 32000, "epoch": 761} {"train_loss": -5.473850727081299, "global_step": 32001, "epoch": 761} {"train_loss": -5.426116943359375, "global_step": 32002, "epoch": 761} {"train_loss": -5.495458648318336, "global_step": 32003, "epoch": 761, "val_loss": 66578.015625} {"train_loss": -5.457885265350342, "global_step": 32004, "epoch": 762} {"train_loss": -5.424898147583008, "global_step": 32005, "epoch": 762} {"train_loss": -5.451383590698242, "global_step": 32006, "epoch": 762} {"train_loss": -5.39597225189209, "global_step": 32007, "epoch": 762} {"train_loss": -5.507166862487793, "global_step": 32008, "epoch": 762} {"train_loss": -5.649012088775635, "global_step": 32009, "epoch": 762} {"train_loss": -5.674252033233643, "global_step": 32010, "epoch": 762} {"train_loss": -5.371605396270752, "global_step": 32011, "epoch": 762} {"train_loss": -5.607294082641602, "global_step": 32012, "epoch": 762} {"train_loss": -5.595897674560547, "global_step": 32013, "epoch": 762} {"train_loss": -5.489641189575195, "global_step": 32014, "epoch": 762} {"train_loss": -5.409852027893066, "global_step": 32015, "epoch": 762} {"train_loss": -5.516399383544922, "global_step": 32016, "epoch": 762} {"train_loss": -5.38604736328125, "global_step": 32017, "epoch": 762} {"train_loss": -5.527369022369385, "global_step": 32018, "epoch": 762} {"train_loss": -5.560534954071045, "global_step": 32019, "epoch": 762} {"train_loss": -5.36899995803833, "global_step": 32020, "epoch": 762} {"train_loss": -5.423118591308594, "global_step": 32021, "epoch": 762} {"train_loss": -5.401159286499023, "global_step": 32022, "epoch": 762} {"train_loss": -5.497612953186035, "global_step": 32023, "epoch": 762} {"train_loss": -5.555830001831055, "global_step": 32024, "epoch": 762} {"train_loss": -5.556142330169678, "global_step": 32025, "epoch": 762} {"train_loss": -5.394300937652588, "global_step": 32026, "epoch": 762} {"train_loss": -5.527929306030273, "global_step": 32027, "epoch": 762} {"train_loss": -5.397721290588379, "global_step": 32028, "epoch": 762} {"train_loss": -5.412261009216309, "global_step": 32029, "epoch": 762} {"train_loss": -5.489534378051758, "global_step": 32030, "epoch": 762} {"train_loss": -5.571422576904297, "global_step": 32031, "epoch": 762} {"train_loss": -5.423615455627441, "global_step": 32032, "epoch": 762} {"train_loss": -5.536564350128174, "global_step": 32033, "epoch": 762} {"train_loss": -5.650467872619629, "global_step": 32034, "epoch": 762} {"train_loss": -5.587686538696289, "global_step": 32035, "epoch": 762} {"train_loss": -5.4817214012146, "global_step": 32036, "epoch": 762} {"train_loss": -5.62495231628418, "global_step": 32037, "epoch": 762} {"train_loss": -5.481123924255371, "global_step": 32038, "epoch": 762} {"train_loss": -5.491737365722656, "global_step": 32039, "epoch": 762} {"train_loss": -5.575265884399414, "global_step": 32040, "epoch": 762} {"train_loss": -5.580273628234863, "global_step": 32041, "epoch": 762} {"train_loss": -5.464542388916016, "global_step": 32042, "epoch": 762} {"train_loss": -5.432006359100342, "global_step": 32043, "epoch": 762} {"train_loss": -5.532815933227539, "global_step": 32044, "epoch": 762} {"train_loss": -5.4965624922797796, "global_step": 32045, "epoch": 762, "val_loss": 66724.6953125} {"train_loss": -5.594542503356934, "global_step": 32046, "epoch": 763} {"train_loss": -5.4825944900512695, "global_step": 32047, "epoch": 763} {"train_loss": -5.583453178405762, "global_step": 32048, "epoch": 763} {"train_loss": -5.41115665435791, "global_step": 32049, "epoch": 763} {"train_loss": -5.560579299926758, "global_step": 32050, "epoch": 763} {"train_loss": -5.631422519683838, "global_step": 32051, "epoch": 763} {"train_loss": -5.380234718322754, "global_step": 32052, "epoch": 763} {"train_loss": -5.600857734680176, "global_step": 32053, "epoch": 763} {"train_loss": -5.524191856384277, "global_step": 32054, "epoch": 763} {"train_loss": -5.3499979972839355, "global_step": 32055, "epoch": 763} {"train_loss": -5.562112808227539, "global_step": 32056, "epoch": 763} {"train_loss": -5.441188335418701, "global_step": 32057, "epoch": 763} {"train_loss": -5.484394073486328, "global_step": 32058, "epoch": 763} {"train_loss": -5.460428714752197, "global_step": 32059, "epoch": 763} {"train_loss": -5.473966598510742, "global_step": 32060, "epoch": 763} {"train_loss": -5.512311935424805, "global_step": 32061, "epoch": 763} {"train_loss": -5.381059646606445, "global_step": 32062, "epoch": 763} {"train_loss": -5.461538791656494, "global_step": 32063, "epoch": 763} {"train_loss": -5.55509090423584, "global_step": 32064, "epoch": 763} {"train_loss": -5.719089031219482, "global_step": 32065, "epoch": 763} {"train_loss": -5.468583106994629, "global_step": 32066, "epoch": 763} {"train_loss": -5.381621837615967, "global_step": 32067, "epoch": 763} {"train_loss": -5.662396430969238, "global_step": 32068, "epoch": 763} {"train_loss": -5.509742736816406, "global_step": 32069, "epoch": 763} {"train_loss": -5.455528259277344, "global_step": 32070, "epoch": 763} {"train_loss": -5.486844062805176, "global_step": 32071, "epoch": 763} {"train_loss": -5.494647979736328, "global_step": 32072, "epoch": 763} {"train_loss": -5.587369441986084, "global_step": 32073, "epoch": 763} {"train_loss": -5.5196533203125, "global_step": 32074, "epoch": 763} {"train_loss": -5.484220504760742, "global_step": 32075, "epoch": 763} {"train_loss": -5.604338645935059, "global_step": 32076, "epoch": 763} {"train_loss": -5.389222621917725, "global_step": 32077, "epoch": 763} {"train_loss": -5.478693008422852, "global_step": 32078, "epoch": 763} {"train_loss": -5.464456081390381, "global_step": 32079, "epoch": 763} {"train_loss": -5.525480270385742, "global_step": 32080, "epoch": 763} {"train_loss": -5.552757263183594, "global_step": 32081, "epoch": 763} {"train_loss": -5.480136871337891, "global_step": 32082, "epoch": 763} {"train_loss": -5.424132347106934, "global_step": 32083, "epoch": 763} {"train_loss": -5.584747314453125, "global_step": 32084, "epoch": 763} {"train_loss": -5.4686126708984375, "global_step": 32085, "epoch": 763} {"train_loss": -5.615324020385742, "global_step": 32086, "epoch": 763} {"train_loss": -5.50436350277492, "global_step": 32087, "epoch": 763, "val_loss": 66598.921875} {"train_loss": -5.543567180633545, "global_step": 32088, "epoch": 764} {"train_loss": -5.5982842445373535, "global_step": 32089, "epoch": 764} {"train_loss": -5.589766979217529, "global_step": 32090, "epoch": 764} {"train_loss": -5.554515838623047, "global_step": 32091, "epoch": 764} {"train_loss": -5.499085426330566, "global_step": 32092, "epoch": 764} {"train_loss": -5.546339988708496, "global_step": 32093, "epoch": 764} {"train_loss": -5.518730163574219, "global_step": 32094, "epoch": 764} {"train_loss": -5.563960075378418, "global_step": 32095, "epoch": 764} {"train_loss": -5.4377288818359375, "global_step": 32096, "epoch": 764} {"train_loss": -5.550745487213135, "global_step": 32097, "epoch": 764} {"train_loss": -5.519880294799805, "global_step": 32098, "epoch": 764} {"train_loss": -5.574247360229492, "global_step": 32099, "epoch": 764} {"train_loss": -5.508767604827881, "global_step": 32100, "epoch": 764} {"train_loss": -5.674997329711914, "global_step": 32101, "epoch": 764} {"train_loss": -5.536273956298828, "global_step": 32102, "epoch": 764} {"train_loss": -5.44096565246582, "global_step": 32103, "epoch": 764} {"train_loss": -5.544467926025391, "global_step": 32104, "epoch": 764} {"train_loss": -5.480582237243652, "global_step": 32105, "epoch": 764} {"train_loss": -5.482483863830566, "global_step": 32106, "epoch": 764} {"train_loss": -5.525881767272949, "global_step": 32107, "epoch": 764} {"train_loss": -5.536170959472656, "global_step": 32108, "epoch": 764} {"train_loss": -5.464101791381836, "global_step": 32109, "epoch": 764} {"train_loss": -5.520069122314453, "global_step": 32110, "epoch": 764} {"train_loss": -5.464447021484375, "global_step": 32111, "epoch": 764} {"train_loss": -5.507761001586914, "global_step": 32112, "epoch": 764} {"train_loss": -5.54591178894043, "global_step": 32113, "epoch": 764} {"train_loss": -5.5257248878479, "global_step": 32114, "epoch": 764} {"train_loss": -5.540470600128174, "global_step": 32115, "epoch": 764} {"train_loss": -5.3528923988342285, "global_step": 32116, "epoch": 764} {"train_loss": -5.472338676452637, "global_step": 32117, "epoch": 764} {"train_loss": -5.4536213874816895, "global_step": 32118, "epoch": 764} {"train_loss": -5.572939872741699, "global_step": 32119, "epoch": 764} {"train_loss": -5.63577127456665, "global_step": 32120, "epoch": 764} {"train_loss": -5.380694389343262, "global_step": 32121, "epoch": 764} {"train_loss": -5.5385966300964355, "global_step": 32122, "epoch": 764} {"train_loss": -5.510634899139404, "global_step": 32123, "epoch": 764} {"train_loss": -5.483826637268066, "global_step": 32124, "epoch": 764} {"train_loss": -5.6125993728637695, "global_step": 32125, "epoch": 764} {"train_loss": -5.420785903930664, "global_step": 32126, "epoch": 764} {"train_loss": -5.551013946533203, "global_step": 32127, "epoch": 764} {"train_loss": -5.5861735343933105, "global_step": 32128, "epoch": 764} {"train_loss": -5.5191750185830255, "global_step": 32129, "epoch": 764, "val_loss": 66651.96875} {"train_loss": -5.538995265960693, "global_step": 32130, "epoch": 765} {"train_loss": -5.615739822387695, "global_step": 32131, "epoch": 765} {"train_loss": -5.532998561859131, "global_step": 32132, "epoch": 765} {"train_loss": -5.395083427429199, "global_step": 32133, "epoch": 765} {"train_loss": -5.586137294769287, "global_step": 32134, "epoch": 765} {"train_loss": -5.533999443054199, "global_step": 32135, "epoch": 765} {"train_loss": -5.721510887145996, "global_step": 32136, "epoch": 765} {"train_loss": -5.478548049926758, "global_step": 32137, "epoch": 765} {"train_loss": -5.4594950675964355, "global_step": 32138, "epoch": 765} {"train_loss": -5.444210052490234, "global_step": 32139, "epoch": 765} {"train_loss": -5.345037460327148, "global_step": 32140, "epoch": 765} {"train_loss": -5.549641132354736, "global_step": 32141, "epoch": 765} {"train_loss": -5.580186367034912, "global_step": 32142, "epoch": 765} {"train_loss": -5.606746673583984, "global_step": 32143, "epoch": 765} {"train_loss": -5.499022483825684, "global_step": 32144, "epoch": 765} {"train_loss": -5.493727684020996, "global_step": 32145, "epoch": 765} {"train_loss": -5.583172798156738, "global_step": 32146, "epoch": 765} {"train_loss": -5.609755516052246, "global_step": 32147, "epoch": 765} {"train_loss": -5.448617935180664, "global_step": 32148, "epoch": 765} {"train_loss": -5.512180328369141, "global_step": 32149, "epoch": 765} {"train_loss": -5.510786056518555, "global_step": 32150, "epoch": 765} {"train_loss": -5.586885452270508, "global_step": 32151, "epoch": 765} {"train_loss": -5.427708625793457, "global_step": 32152, "epoch": 765} {"train_loss": -5.634304046630859, "global_step": 32153, "epoch": 765} {"train_loss": -5.516656398773193, "global_step": 32154, "epoch": 765} {"train_loss": -5.641113758087158, "global_step": 32155, "epoch": 765} {"train_loss": -5.470218658447266, "global_step": 32156, "epoch": 765} {"train_loss": -5.482600212097168, "global_step": 32157, "epoch": 765} {"train_loss": -5.3740129470825195, "global_step": 32158, "epoch": 765} {"train_loss": -5.423015117645264, "global_step": 32159, "epoch": 765} {"train_loss": -5.605104446411133, "global_step": 32160, "epoch": 765} {"train_loss": -5.4529218673706055, "global_step": 32161, "epoch": 765} {"train_loss": -5.636573791503906, "global_step": 32162, "epoch": 765} {"train_loss": -5.299445629119873, "global_step": 32163, "epoch": 765} {"train_loss": -5.518902778625488, "global_step": 32164, "epoch": 765} {"train_loss": -5.512997627258301, "global_step": 32165, "epoch": 765} {"train_loss": -5.463344573974609, "global_step": 32166, "epoch": 765} {"train_loss": -5.4380598068237305, "global_step": 32167, "epoch": 765} {"train_loss": -5.523428916931152, "global_step": 32168, "epoch": 765} {"train_loss": -5.616676330566406, "global_step": 32169, "epoch": 765} {"train_loss": -5.504777908325195, "global_step": 32170, "epoch": 765} {"train_loss": -5.516288711911156, "global_step": 32171, "epoch": 765, "val_loss": 66601.4609375} {"train_loss": -5.587205410003662, "global_step": 32172, "epoch": 766} {"train_loss": -5.480513572692871, "global_step": 32173, "epoch": 766} {"train_loss": -5.442784786224365, "global_step": 32174, "epoch": 766} {"train_loss": -5.512618064880371, "global_step": 32175, "epoch": 766} {"train_loss": -5.559991836547852, "global_step": 32176, "epoch": 766} {"train_loss": -5.629036903381348, "global_step": 32177, "epoch": 766} {"train_loss": -5.590712547302246, "global_step": 32178, "epoch": 766} {"train_loss": -5.410312652587891, "global_step": 32179, "epoch": 766} {"train_loss": -5.460748672485352, "global_step": 32180, "epoch": 766} {"train_loss": -5.52630615234375, "global_step": 32181, "epoch": 766} {"train_loss": -5.620699405670166, "global_step": 32182, "epoch": 766} {"train_loss": -5.629702091217041, "global_step": 32183, "epoch": 766} {"train_loss": -5.490474700927734, "global_step": 32184, "epoch": 766} {"train_loss": -5.50787353515625, "global_step": 32185, "epoch": 766} {"train_loss": -5.624317646026611, "global_step": 32186, "epoch": 766} {"train_loss": -5.537594318389893, "global_step": 32187, "epoch": 766} {"train_loss": -5.64407205581665, "global_step": 32188, "epoch": 766} {"train_loss": -5.662169933319092, "global_step": 32189, "epoch": 766} {"train_loss": -5.507046699523926, "global_step": 32190, "epoch": 766} {"train_loss": -5.495131969451904, "global_step": 32191, "epoch": 766} {"train_loss": -5.587890625, "global_step": 32192, "epoch": 766} {"train_loss": -5.387807846069336, "global_step": 32193, "epoch": 766} {"train_loss": -5.473027229309082, "global_step": 32194, "epoch": 766} {"train_loss": -5.472410202026367, "global_step": 32195, "epoch": 766} {"train_loss": -5.504748821258545, "global_step": 32196, "epoch": 766} {"train_loss": -5.51318359375, "global_step": 32197, "epoch": 766} {"train_loss": -5.528036117553711, "global_step": 32198, "epoch": 766} {"train_loss": -5.377621173858643, "global_step": 32199, "epoch": 766} {"train_loss": -5.535139083862305, "global_step": 32200, "epoch": 766} {"train_loss": -5.464532852172852, "global_step": 32201, "epoch": 766} {"train_loss": -5.412001609802246, "global_step": 32202, "epoch": 766} {"train_loss": -5.429862022399902, "global_step": 32203, "epoch": 766} {"train_loss": -5.624824047088623, "global_step": 32204, "epoch": 766} {"train_loss": -5.623337745666504, "global_step": 32205, "epoch": 766} {"train_loss": -5.321732521057129, "global_step": 32206, "epoch": 766} {"train_loss": -5.5475263595581055, "global_step": 32207, "epoch": 766} {"train_loss": -5.685604572296143, "global_step": 32208, "epoch": 766} {"train_loss": -5.617256164550781, "global_step": 32209, "epoch": 766} {"train_loss": -5.651464462280273, "global_step": 32210, "epoch": 766} {"train_loss": -5.528017997741699, "global_step": 32211, "epoch": 766} {"train_loss": -5.540358066558838, "global_step": 32212, "epoch": 766} {"train_loss": -5.529019548779442, "global_step": 32213, "epoch": 766, "val_loss": 66467.3828125} {"train_loss": -5.545295715332031, "global_step": 32214, "epoch": 767} {"train_loss": -5.547957897186279, "global_step": 32215, "epoch": 767} {"train_loss": -5.396547317504883, "global_step": 32216, "epoch": 767} {"train_loss": -5.539987564086914, "global_step": 32217, "epoch": 767} {"train_loss": -5.665068626403809, "global_step": 32218, "epoch": 767} {"train_loss": -5.479754447937012, "global_step": 32219, "epoch": 767} {"train_loss": -5.591948509216309, "global_step": 32220, "epoch": 767} {"train_loss": -5.605461597442627, "global_step": 32221, "epoch": 767} {"train_loss": -5.556027412414551, "global_step": 32222, "epoch": 767} {"train_loss": -5.515050411224365, "global_step": 32223, "epoch": 767} {"train_loss": -5.420070648193359, "global_step": 32224, "epoch": 767} {"train_loss": -5.585031986236572, "global_step": 32225, "epoch": 767} {"train_loss": -5.592902183532715, "global_step": 32226, "epoch": 767} {"train_loss": -5.381265163421631, "global_step": 32227, "epoch": 767} {"train_loss": -5.4871931076049805, "global_step": 32228, "epoch": 767} {"train_loss": -5.381806373596191, "global_step": 32229, "epoch": 767} {"train_loss": -5.440421104431152, "global_step": 32230, "epoch": 767} {"train_loss": -5.537948131561279, "global_step": 32231, "epoch": 767} {"train_loss": -5.452210426330566, "global_step": 32232, "epoch": 767} {"train_loss": -5.480186462402344, "global_step": 32233, "epoch": 767} {"train_loss": -5.60306453704834, "global_step": 32234, "epoch": 767} {"train_loss": -5.446238994598389, "global_step": 32235, "epoch": 767} {"train_loss": -5.521913528442383, "global_step": 32236, "epoch": 767} {"train_loss": -5.5113205909729, "global_step": 32237, "epoch": 767} {"train_loss": -5.636119365692139, "global_step": 32238, "epoch": 767} {"train_loss": -5.481319427490234, "global_step": 32239, "epoch": 767} {"train_loss": -5.443594932556152, "global_step": 32240, "epoch": 767} {"train_loss": -5.611184597015381, "global_step": 32241, "epoch": 767} {"train_loss": -5.596124172210693, "global_step": 32242, "epoch": 767} {"train_loss": -5.536375999450684, "global_step": 32243, "epoch": 767} {"train_loss": -5.633427619934082, "global_step": 32244, "epoch": 767} {"train_loss": -5.561042785644531, "global_step": 32245, "epoch": 767} {"train_loss": -5.523567199707031, "global_step": 32246, "epoch": 767} {"train_loss": -5.551644325256348, "global_step": 32247, "epoch": 767} {"train_loss": -5.44312047958374, "global_step": 32248, "epoch": 767} {"train_loss": -5.452304363250732, "global_step": 32249, "epoch": 767} {"train_loss": -5.45694637298584, "global_step": 32250, "epoch": 767} {"train_loss": -5.529914379119873, "global_step": 32251, "epoch": 767} {"train_loss": -5.612226486206055, "global_step": 32252, "epoch": 767} {"train_loss": -5.595207691192627, "global_step": 32253, "epoch": 767} {"train_loss": -5.462345600128174, "global_step": 32254, "epoch": 767} {"train_loss": -5.520967517580305, "global_step": 32255, "epoch": 767, "val_loss": 66726.2421875} {"train_loss": -5.489688873291016, "global_step": 32256, "epoch": 768} {"train_loss": -5.5416646003723145, "global_step": 32257, "epoch": 768} {"train_loss": -5.303750514984131, "global_step": 32258, "epoch": 768} {"train_loss": -5.416546821594238, "global_step": 32259, "epoch": 768} {"train_loss": -5.450930118560791, "global_step": 32260, "epoch": 768} {"train_loss": -5.473569869995117, "global_step": 32261, "epoch": 768} {"train_loss": -5.49519157409668, "global_step": 32262, "epoch": 768} {"train_loss": -5.5416364669799805, "global_step": 32263, "epoch": 768} {"train_loss": -5.583645820617676, "global_step": 32264, "epoch": 768} {"train_loss": -5.48920202255249, "global_step": 32265, "epoch": 768} {"train_loss": -5.441338539123535, "global_step": 32266, "epoch": 768} {"train_loss": -5.419193744659424, "global_step": 32267, "epoch": 768} {"train_loss": -5.5198469161987305, "global_step": 32268, "epoch": 768} {"train_loss": -5.413605690002441, "global_step": 32269, "epoch": 768} {"train_loss": -5.573519706726074, "global_step": 32270, "epoch": 768} {"train_loss": -5.623612403869629, "global_step": 32271, "epoch": 768} {"train_loss": -5.5706305503845215, "global_step": 32272, "epoch": 768} {"train_loss": -5.506570816040039, "global_step": 32273, "epoch": 768} {"train_loss": -5.608428001403809, "global_step": 32274, "epoch": 768} {"train_loss": -5.4735002517700195, "global_step": 32275, "epoch": 768} {"train_loss": -5.626160621643066, "global_step": 32276, "epoch": 768} {"train_loss": -5.48487663269043, "global_step": 32277, "epoch": 768} {"train_loss": -5.4312639236450195, "global_step": 32278, "epoch": 768} {"train_loss": -5.5539093017578125, "global_step": 32279, "epoch": 768} {"train_loss": -5.347888469696045, "global_step": 32280, "epoch": 768} {"train_loss": -5.470843315124512, "global_step": 32281, "epoch": 768} {"train_loss": -5.639595031738281, "global_step": 32282, "epoch": 768} {"train_loss": -5.497530937194824, "global_step": 32283, "epoch": 768} {"train_loss": -5.462477684020996, "global_step": 32284, "epoch": 768} {"train_loss": -5.457462310791016, "global_step": 32285, "epoch": 768} {"train_loss": -5.5491838455200195, "global_step": 32286, "epoch": 768} {"train_loss": -5.596275329589844, "global_step": 32287, "epoch": 768} {"train_loss": -5.486876010894775, "global_step": 32288, "epoch": 768} {"train_loss": -5.604702949523926, "global_step": 32289, "epoch": 768} {"train_loss": -5.383288383483887, "global_step": 32290, "epoch": 768} {"train_loss": -5.622563362121582, "global_step": 32291, "epoch": 768} {"train_loss": -5.55136775970459, "global_step": 32292, "epoch": 768} {"train_loss": -5.448004722595215, "global_step": 32293, "epoch": 768} {"train_loss": -5.4704484939575195, "global_step": 32294, "epoch": 768} {"train_loss": -5.549010753631592, "global_step": 32295, "epoch": 768} {"train_loss": -5.662890434265137, "global_step": 32296, "epoch": 768} {"train_loss": -5.512612660725911, "global_step": 32297, "epoch": 768, "val_loss": 66494.265625} {"train_loss": -5.498762130737305, "global_step": 32298, "epoch": 769} {"train_loss": -5.5124406814575195, "global_step": 32299, "epoch": 769} {"train_loss": -5.6210503578186035, "global_step": 32300, "epoch": 769} {"train_loss": -5.426143646240234, "global_step": 32301, "epoch": 769} {"train_loss": -5.520727157592773, "global_step": 32302, "epoch": 769} {"train_loss": -5.634819030761719, "global_step": 32303, "epoch": 769} {"train_loss": -5.50819730758667, "global_step": 32304, "epoch": 769} {"train_loss": -5.621919631958008, "global_step": 32305, "epoch": 769} {"train_loss": -5.655664920806885, "global_step": 32306, "epoch": 769} {"train_loss": -5.4690775871276855, "global_step": 32307, "epoch": 769} {"train_loss": -5.619638919830322, "global_step": 32308, "epoch": 769} {"train_loss": -5.510634422302246, "global_step": 32309, "epoch": 769} {"train_loss": -5.513949871063232, "global_step": 32310, "epoch": 769} {"train_loss": -5.527182102203369, "global_step": 32311, "epoch": 769} {"train_loss": -5.378321647644043, "global_step": 32312, "epoch": 769} {"train_loss": -5.456623554229736, "global_step": 32313, "epoch": 769} {"train_loss": -5.495555877685547, "global_step": 32314, "epoch": 769} {"train_loss": -5.604029178619385, "global_step": 32315, "epoch": 769} {"train_loss": -5.526463508605957, "global_step": 32316, "epoch": 769} {"train_loss": -5.672863960266113, "global_step": 32317, "epoch": 769} {"train_loss": -5.690930366516113, "global_step": 32318, "epoch": 769} {"train_loss": -5.430785655975342, "global_step": 32319, "epoch": 769} {"train_loss": -5.5956268310546875, "global_step": 32320, "epoch": 769} {"train_loss": -5.420769214630127, "global_step": 32321, "epoch": 769} {"train_loss": -5.467040538787842, "global_step": 32322, "epoch": 769} {"train_loss": -5.545723915100098, "global_step": 32323, "epoch": 769} {"train_loss": -5.516266822814941, "global_step": 32324, "epoch": 769} {"train_loss": -5.43808126449585, "global_step": 32325, "epoch": 769} {"train_loss": -5.542908668518066, "global_step": 32326, "epoch": 769} {"train_loss": -5.62872314453125, "global_step": 32327, "epoch": 769} {"train_loss": -5.443605422973633, "global_step": 32328, "epoch": 769} {"train_loss": -5.426133155822754, "global_step": 32329, "epoch": 769} {"train_loss": -5.569779396057129, "global_step": 32330, "epoch": 769} {"train_loss": -5.355775356292725, "global_step": 32331, "epoch": 769} {"train_loss": -5.455850601196289, "global_step": 32332, "epoch": 769} {"train_loss": -5.400036811828613, "global_step": 32333, "epoch": 769} {"train_loss": -5.597978591918945, "global_step": 32334, "epoch": 769} {"train_loss": -5.415523529052734, "global_step": 32335, "epoch": 769} {"train_loss": -5.474987983703613, "global_step": 32336, "epoch": 769} {"train_loss": -5.443324089050293, "global_step": 32337, "epoch": 769} {"train_loss": -5.495911121368408, "global_step": 32338, "epoch": 769} {"train_loss": -5.512615362803142, "global_step": 32339, "epoch": 769, "val_loss": 67250.5078125} {"train_loss": -5.560850620269775, "global_step": 32340, "epoch": 770} {"train_loss": -5.533421516418457, "global_step": 32341, "epoch": 770} {"train_loss": -5.531469821929932, "global_step": 32342, "epoch": 770} {"train_loss": -5.467031002044678, "global_step": 32343, "epoch": 770} {"train_loss": -5.50759220123291, "global_step": 32344, "epoch": 770} {"train_loss": -5.330077171325684, "global_step": 32345, "epoch": 770} {"train_loss": -5.419809341430664, "global_step": 32346, "epoch": 770} {"train_loss": -5.5090179443359375, "global_step": 32347, "epoch": 770} {"train_loss": -5.339495658874512, "global_step": 32348, "epoch": 770} {"train_loss": -5.5326313972473145, "global_step": 32349, "epoch": 770} {"train_loss": -5.420892238616943, "global_step": 32350, "epoch": 770} {"train_loss": -5.55500602722168, "global_step": 32351, "epoch": 770} {"train_loss": -5.57929801940918, "global_step": 32352, "epoch": 770} {"train_loss": -5.5132341384887695, "global_step": 32353, "epoch": 770} {"train_loss": -5.436086177825928, "global_step": 32354, "epoch": 770} {"train_loss": -5.42857551574707, "global_step": 32355, "epoch": 770} {"train_loss": -5.385010719299316, "global_step": 32356, "epoch": 770} {"train_loss": -5.484171390533447, "global_step": 32357, "epoch": 770} {"train_loss": -5.544318199157715, "global_step": 32358, "epoch": 770} {"train_loss": -5.506764888763428, "global_step": 32359, "epoch": 770} {"train_loss": -5.376424789428711, "global_step": 32360, "epoch": 770} {"train_loss": -5.44992733001709, "global_step": 32361, "epoch": 770} {"train_loss": -5.487677097320557, "global_step": 32362, "epoch": 770} {"train_loss": -5.569746017456055, "global_step": 32363, "epoch": 770} {"train_loss": -5.358190059661865, "global_step": 32364, "epoch": 770} {"train_loss": -5.652354717254639, "global_step": 32365, "epoch": 770} {"train_loss": -5.658212661743164, "global_step": 32366, "epoch": 770} {"train_loss": -5.612653732299805, "global_step": 32367, "epoch": 770} {"train_loss": -5.651701927185059, "global_step": 32368, "epoch": 770} {"train_loss": -5.523085117340088, "global_step": 32369, "epoch": 770} {"train_loss": -5.624683380126953, "global_step": 32370, "epoch": 770} {"train_loss": -5.425041198730469, "global_step": 32371, "epoch": 770} {"train_loss": -5.552191734313965, "global_step": 32372, "epoch": 770} {"train_loss": -5.465686798095703, "global_step": 32373, "epoch": 770} {"train_loss": -5.551747798919678, "global_step": 32374, "epoch": 770} {"train_loss": -5.451346397399902, "global_step": 32375, "epoch": 770} {"train_loss": -5.597689628601074, "global_step": 32376, "epoch": 770} {"train_loss": -5.505850315093994, "global_step": 32377, "epoch": 770} {"train_loss": -5.674417495727539, "global_step": 32378, "epoch": 770} {"train_loss": -5.486761093139648, "global_step": 32379, "epoch": 770} {"train_loss": -5.453711032867432, "global_step": 32380, "epoch": 770} {"train_loss": -5.507292917796543, "global_step": 32381, "epoch": 770, "val_loss": 67216.28125} {"train_loss": -5.511604309082031, "global_step": 32382, "epoch": 771} {"train_loss": -5.550018310546875, "global_step": 32383, "epoch": 771} {"train_loss": -5.458701133728027, "global_step": 32384, "epoch": 771} {"train_loss": -5.417325019836426, "global_step": 32385, "epoch": 771} {"train_loss": -5.49809455871582, "global_step": 32386, "epoch": 771} {"train_loss": -5.610554218292236, "global_step": 32387, "epoch": 771} {"train_loss": -5.463174343109131, "global_step": 32388, "epoch": 771} {"train_loss": -5.56008243560791, "global_step": 32389, "epoch": 771} {"train_loss": -5.454664707183838, "global_step": 32390, "epoch": 771} {"train_loss": -5.533143043518066, "global_step": 32391, "epoch": 771} {"train_loss": -5.530439376831055, "global_step": 32392, "epoch": 771} {"train_loss": -5.570355415344238, "global_step": 32393, "epoch": 771} {"train_loss": -5.513888359069824, "global_step": 32394, "epoch": 771} {"train_loss": -5.457486152648926, "global_step": 32395, "epoch": 771} {"train_loss": -5.5072431564331055, "global_step": 32396, "epoch": 771} {"train_loss": -5.518500804901123, "global_step": 32397, "epoch": 771} {"train_loss": -5.721523284912109, "global_step": 32398, "epoch": 771} {"train_loss": -5.57203483581543, "global_step": 32399, "epoch": 771} {"train_loss": -5.58152961730957, "global_step": 32400, "epoch": 771} {"train_loss": -5.548619270324707, "global_step": 32401, "epoch": 771} {"train_loss": -5.36921501159668, "global_step": 32402, "epoch": 771} {"train_loss": -5.604288578033447, "global_step": 32403, "epoch": 771} {"train_loss": -5.585439205169678, "global_step": 32404, "epoch": 771} {"train_loss": -5.505288124084473, "global_step": 32405, "epoch": 771} {"train_loss": -5.46568489074707, "global_step": 32406, "epoch": 771} {"train_loss": -5.48094367980957, "global_step": 32407, "epoch": 771} {"train_loss": -5.463441371917725, "global_step": 32408, "epoch": 771} {"train_loss": -5.537505149841309, "global_step": 32409, "epoch": 771} {"train_loss": -5.496313095092773, "global_step": 32410, "epoch": 771} {"train_loss": -5.524649620056152, "global_step": 32411, "epoch": 771} {"train_loss": -5.590580940246582, "global_step": 32412, "epoch": 771} {"train_loss": -5.650749206542969, "global_step": 32413, "epoch": 771} {"train_loss": -5.624144554138184, "global_step": 32414, "epoch": 771} {"train_loss": -5.448630332946777, "global_step": 32415, "epoch": 771} {"train_loss": -5.418747901916504, "global_step": 32416, "epoch": 771} {"train_loss": -5.534696578979492, "global_step": 32417, "epoch": 771} {"train_loss": -5.46820068359375, "global_step": 32418, "epoch": 771} {"train_loss": -5.5134172439575195, "global_step": 32419, "epoch": 771} {"train_loss": -5.581233978271484, "global_step": 32420, "epoch": 771} {"train_loss": -5.406881809234619, "global_step": 32421, "epoch": 771} {"train_loss": -5.606379508972168, "global_step": 32422, "epoch": 771} {"train_loss": -5.522975365320842, "global_step": 32423, "epoch": 771, "val_loss": 66591.3046875} {"train_loss": -5.637172698974609, "global_step": 32424, "epoch": 772} {"train_loss": -5.426280975341797, "global_step": 32425, "epoch": 772} {"train_loss": -5.447813510894775, "global_step": 32426, "epoch": 772} {"train_loss": -5.468661785125732, "global_step": 32427, "epoch": 772} {"train_loss": -5.384507179260254, "global_step": 32428, "epoch": 772} {"train_loss": -5.438783645629883, "global_step": 32429, "epoch": 772} {"train_loss": -5.553657054901123, "global_step": 32430, "epoch": 772} {"train_loss": -5.493973731994629, "global_step": 32431, "epoch": 772} {"train_loss": -5.461515426635742, "global_step": 32432, "epoch": 772} {"train_loss": -5.412762641906738, "global_step": 32433, "epoch": 772} {"train_loss": -5.584145545959473, "global_step": 32434, "epoch": 772} {"train_loss": -5.5568952560424805, "global_step": 32435, "epoch": 772} {"train_loss": -5.432075500488281, "global_step": 32436, "epoch": 772} {"train_loss": -5.485315322875977, "global_step": 32437, "epoch": 772} {"train_loss": -5.4629011154174805, "global_step": 32438, "epoch": 772} {"train_loss": -5.554021835327148, "global_step": 32439, "epoch": 772} {"train_loss": -5.4988813400268555, "global_step": 32440, "epoch": 772} {"train_loss": -5.610698699951172, "global_step": 32441, "epoch": 772} {"train_loss": -5.540858268737793, "global_step": 32442, "epoch": 772} {"train_loss": -5.635922431945801, "global_step": 32443, "epoch": 772} {"train_loss": -5.550530433654785, "global_step": 32444, "epoch": 772} {"train_loss": -5.578023910522461, "global_step": 32445, "epoch": 772} {"train_loss": -5.447420120239258, "global_step": 32446, "epoch": 772} {"train_loss": -5.391755104064941, "global_step": 32447, "epoch": 772} {"train_loss": -5.573781490325928, "global_step": 32448, "epoch": 772} {"train_loss": -5.546023845672607, "global_step": 32449, "epoch": 772} {"train_loss": -5.499850273132324, "global_step": 32450, "epoch": 772} {"train_loss": -5.520294189453125, "global_step": 32451, "epoch": 772} {"train_loss": -5.6974029541015625, "global_step": 32452, "epoch": 772} {"train_loss": -5.509255409240723, "global_step": 32453, "epoch": 772} {"train_loss": -5.574794292449951, "global_step": 32454, "epoch": 772} {"train_loss": -5.577757835388184, "global_step": 32455, "epoch": 772} {"train_loss": -5.549185276031494, "global_step": 32456, "epoch": 772} {"train_loss": -5.594601154327393, "global_step": 32457, "epoch": 772} {"train_loss": -5.531713962554932, "global_step": 32458, "epoch": 772} {"train_loss": -5.501487731933594, "global_step": 32459, "epoch": 772} {"train_loss": -5.460700511932373, "global_step": 32460, "epoch": 772} {"train_loss": -5.427913665771484, "global_step": 32461, "epoch": 772} {"train_loss": -5.518736839294434, "global_step": 32462, "epoch": 772} {"train_loss": -5.501425743103027, "global_step": 32463, "epoch": 772} {"train_loss": -5.466726779937744, "global_step": 32464, "epoch": 772} {"train_loss": -5.518675894964309, "global_step": 32465, "epoch": 772, "val_loss": 66582.2109375} {"train_loss": -5.528135776519775, "global_step": 32466, "epoch": 773} {"train_loss": -5.51656436920166, "global_step": 32467, "epoch": 773} {"train_loss": -5.532556533813477, "global_step": 32468, "epoch": 773} {"train_loss": -5.585440635681152, "global_step": 32469, "epoch": 773} {"train_loss": -5.396329879760742, "global_step": 32470, "epoch": 773} {"train_loss": -5.414608955383301, "global_step": 32471, "epoch": 773} {"train_loss": -5.431449890136719, "global_step": 32472, "epoch": 773} {"train_loss": -5.481529235839844, "global_step": 32473, "epoch": 773} {"train_loss": -5.64710807800293, "global_step": 32474, "epoch": 773} {"train_loss": -5.553606033325195, "global_step": 32475, "epoch": 773} {"train_loss": -5.438623428344727, "global_step": 32476, "epoch": 773} {"train_loss": -5.475922107696533, "global_step": 32477, "epoch": 773} {"train_loss": -5.523283958435059, "global_step": 32478, "epoch": 773} {"train_loss": -5.458504676818848, "global_step": 32479, "epoch": 773} {"train_loss": -5.55136775970459, "global_step": 32480, "epoch": 773} {"train_loss": -5.640565872192383, "global_step": 32481, "epoch": 773} {"train_loss": -5.521091461181641, "global_step": 32482, "epoch": 773} {"train_loss": -5.643082141876221, "global_step": 32483, "epoch": 773} {"train_loss": -5.683619499206543, "global_step": 32484, "epoch": 773} {"train_loss": -5.469606876373291, "global_step": 32485, "epoch": 773} {"train_loss": -5.578127384185791, "global_step": 32486, "epoch": 773} {"train_loss": -5.519667625427246, "global_step": 32487, "epoch": 773} {"train_loss": -5.4399871826171875, "global_step": 32488, "epoch": 773} {"train_loss": -5.585012912750244, "global_step": 32489, "epoch": 773} {"train_loss": -5.454891681671143, "global_step": 32490, "epoch": 773} {"train_loss": -5.472019195556641, "global_step": 32491, "epoch": 773} {"train_loss": -5.603943824768066, "global_step": 32492, "epoch": 773} {"train_loss": -5.4806318283081055, "global_step": 32493, "epoch": 773} {"train_loss": -5.54020357131958, "global_step": 32494, "epoch": 773} {"train_loss": -5.566953659057617, "global_step": 32495, "epoch": 773} {"train_loss": -5.514718055725098, "global_step": 32496, "epoch": 773} {"train_loss": -5.538670539855957, "global_step": 32497, "epoch": 773} {"train_loss": -5.506491661071777, "global_step": 32498, "epoch": 773} {"train_loss": -5.61550760269165, "global_step": 32499, "epoch": 773} {"train_loss": -5.4766526222229, "global_step": 32500, "epoch": 773} {"train_loss": -5.558586120605469, "global_step": 32501, "epoch": 773} {"train_loss": -5.563258647918701, "global_step": 32502, "epoch": 773} {"train_loss": -5.471506595611572, "global_step": 32503, "epoch": 773} {"train_loss": -5.468058109283447, "global_step": 32504, "epoch": 773} {"train_loss": -5.624556541442871, "global_step": 32505, "epoch": 773} {"train_loss": -5.638406753540039, "global_step": 32506, "epoch": 773} {"train_loss": -5.523877268745785, "global_step": 32507, "epoch": 773, "val_loss": 66752.5546875} {"train_loss": -5.573654651641846, "global_step": 32508, "epoch": 774} {"train_loss": -5.613739490509033, "global_step": 32509, "epoch": 774} {"train_loss": -5.44196891784668, "global_step": 32510, "epoch": 774} {"train_loss": -5.60623836517334, "global_step": 32511, "epoch": 774} {"train_loss": -5.493865966796875, "global_step": 32512, "epoch": 774} {"train_loss": -5.433685302734375, "global_step": 32513, "epoch": 774} {"train_loss": -5.519802093505859, "global_step": 32514, "epoch": 774} {"train_loss": -5.4950408935546875, "global_step": 32515, "epoch": 774} {"train_loss": -5.568631172180176, "global_step": 32516, "epoch": 774} {"train_loss": -5.509422302246094, "global_step": 32517, "epoch": 774} {"train_loss": -5.383920669555664, "global_step": 32518, "epoch": 774} {"train_loss": -5.5462117195129395, "global_step": 32519, "epoch": 774} {"train_loss": -5.580772399902344, "global_step": 32520, "epoch": 774} {"train_loss": -5.439748764038086, "global_step": 32521, "epoch": 774} {"train_loss": -5.612181663513184, "global_step": 32522, "epoch": 774} {"train_loss": -5.4079766273498535, "global_step": 32523, "epoch": 774} {"train_loss": -5.562542915344238, "global_step": 32524, "epoch": 774} {"train_loss": -5.561816215515137, "global_step": 32525, "epoch": 774} {"train_loss": -5.453707695007324, "global_step": 32526, "epoch": 774} {"train_loss": -5.509037971496582, "global_step": 32527, "epoch": 774} {"train_loss": -5.460305690765381, "global_step": 32528, "epoch": 774} {"train_loss": -5.572658538818359, "global_step": 32529, "epoch": 774} {"train_loss": -5.531922340393066, "global_step": 32530, "epoch": 774} {"train_loss": -5.5081868171691895, "global_step": 32531, "epoch": 774} {"train_loss": -5.529411315917969, "global_step": 32532, "epoch": 774} {"train_loss": -5.465853691101074, "global_step": 32533, "epoch": 774} {"train_loss": -5.4366583824157715, "global_step": 32534, "epoch": 774} {"train_loss": -5.5392866134643555, "global_step": 32535, "epoch": 774} {"train_loss": -5.592902660369873, "global_step": 32536, "epoch": 774} {"train_loss": -5.395735740661621, "global_step": 32537, "epoch": 774} {"train_loss": -5.406140327453613, "global_step": 32538, "epoch": 774} {"train_loss": -5.472354888916016, "global_step": 32539, "epoch": 774} {"train_loss": -5.516483306884766, "global_step": 32540, "epoch": 774} {"train_loss": -5.4334001541137695, "global_step": 32541, "epoch": 774} {"train_loss": -5.477672100067139, "global_step": 32542, "epoch": 774} {"train_loss": -5.479766368865967, "global_step": 32543, "epoch": 774} {"train_loss": -5.408028602600098, "global_step": 32544, "epoch": 774} {"train_loss": -5.500425338745117, "global_step": 32545, "epoch": 774} {"train_loss": -5.540777683258057, "global_step": 32546, "epoch": 774} {"train_loss": -5.520538330078125, "global_step": 32547, "epoch": 774} {"train_loss": -5.465371608734131, "global_step": 32548, "epoch": 774} {"train_loss": -5.5025213332403276, "global_step": 32549, "epoch": 774, "val_loss": 66626.21875} {"train_loss": -5.538639545440674, "global_step": 32550, "epoch": 775} {"train_loss": -5.579422473907471, "global_step": 32551, "epoch": 775} {"train_loss": -5.426098823547363, "global_step": 32552, "epoch": 775} {"train_loss": -5.440182685852051, "global_step": 32553, "epoch": 775} {"train_loss": -5.6230669021606445, "global_step": 32554, "epoch": 775} {"train_loss": -5.550296783447266, "global_step": 32555, "epoch": 775} {"train_loss": -5.560026168823242, "global_step": 32556, "epoch": 775} {"train_loss": -5.530733108520508, "global_step": 32557, "epoch": 775} {"train_loss": -5.661375522613525, "global_step": 32558, "epoch": 775} {"train_loss": -5.508486270904541, "global_step": 32559, "epoch": 775} {"train_loss": -5.43994665145874, "global_step": 32560, "epoch": 775} {"train_loss": -5.598893165588379, "global_step": 32561, "epoch": 775} {"train_loss": -5.510968208312988, "global_step": 32562, "epoch": 775} {"train_loss": -5.516844749450684, "global_step": 32563, "epoch": 775} {"train_loss": -5.46824312210083, "global_step": 32564, "epoch": 775} {"train_loss": -5.543363571166992, "global_step": 32565, "epoch": 775} {"train_loss": -5.583394527435303, "global_step": 32566, "epoch": 775} {"train_loss": -5.454368591308594, "global_step": 32567, "epoch": 775} {"train_loss": -5.658512592315674, "global_step": 32568, "epoch": 775} {"train_loss": -5.5150909423828125, "global_step": 32569, "epoch": 775} {"train_loss": -5.529997825622559, "global_step": 32570, "epoch": 775} {"train_loss": -5.6155219078063965, "global_step": 32571, "epoch": 775} {"train_loss": -5.659915447235107, "global_step": 32572, "epoch": 775} {"train_loss": -5.536836624145508, "global_step": 32573, "epoch": 775} {"train_loss": -5.504631042480469, "global_step": 32574, "epoch": 775} {"train_loss": -5.467294216156006, "global_step": 32575, "epoch": 775} {"train_loss": -5.620316028594971, "global_step": 32576, "epoch": 775} {"train_loss": -5.356769561767578, "global_step": 32577, "epoch": 775} {"train_loss": -5.527003288269043, "global_step": 32578, "epoch": 775} {"train_loss": -5.702110290527344, "global_step": 32579, "epoch": 775} {"train_loss": -5.4559478759765625, "global_step": 32580, "epoch": 775} {"train_loss": -5.623835563659668, "global_step": 32581, "epoch": 775} {"train_loss": -5.620730400085449, "global_step": 32582, "epoch": 775} {"train_loss": -5.431356430053711, "global_step": 32583, "epoch": 775} {"train_loss": -5.607156276702881, "global_step": 32584, "epoch": 775} {"train_loss": -5.569873809814453, "global_step": 32585, "epoch": 775} {"train_loss": -5.461383819580078, "global_step": 32586, "epoch": 775} {"train_loss": -5.425025939941406, "global_step": 32587, "epoch": 775} {"train_loss": -5.483853340148926, "global_step": 32588, "epoch": 775} {"train_loss": -5.539671897888184, "global_step": 32589, "epoch": 775} {"train_loss": -5.5667572021484375, "global_step": 32590, "epoch": 775} {"train_loss": -5.533843880607968, "global_step": 32591, "epoch": 775, "val_loss": 66476.9140625} {"train_loss": -5.5421929359436035, "global_step": 32592, "epoch": 776} {"train_loss": -5.542436599731445, "global_step": 32593, "epoch": 776} {"train_loss": -5.428021430969238, "global_step": 32594, "epoch": 776} {"train_loss": -5.391602516174316, "global_step": 32595, "epoch": 776} {"train_loss": -5.551759719848633, "global_step": 32596, "epoch": 776} {"train_loss": -5.433557033538818, "global_step": 32597, "epoch": 776} {"train_loss": -5.590638160705566, "global_step": 32598, "epoch": 776} {"train_loss": -5.532676696777344, "global_step": 32599, "epoch": 776} {"train_loss": -5.468352794647217, "global_step": 32600, "epoch": 776} {"train_loss": -5.446010112762451, "global_step": 32601, "epoch": 776} {"train_loss": -5.550536155700684, "global_step": 32602, "epoch": 776} {"train_loss": -5.589963436126709, "global_step": 32603, "epoch": 776} {"train_loss": -5.462888240814209, "global_step": 32604, "epoch": 776} {"train_loss": -5.51788330078125, "global_step": 32605, "epoch": 776} {"train_loss": -5.3951802253723145, "global_step": 32606, "epoch": 776} {"train_loss": -5.7502217292785645, "global_step": 32607, "epoch": 776} {"train_loss": -5.607211112976074, "global_step": 32608, "epoch": 776} {"train_loss": -5.456696510314941, "global_step": 32609, "epoch": 776} {"train_loss": -5.585988998413086, "global_step": 32610, "epoch": 776} {"train_loss": -5.464612007141113, "global_step": 32611, "epoch": 776} {"train_loss": -5.348094940185547, "global_step": 32612, "epoch": 776} {"train_loss": -5.650352478027344, "global_step": 32613, "epoch": 776} {"train_loss": -5.540663719177246, "global_step": 32614, "epoch": 776} {"train_loss": -5.619390487670898, "global_step": 32615, "epoch": 776} {"train_loss": -5.567292213439941, "global_step": 32616, "epoch": 776} {"train_loss": -5.506112098693848, "global_step": 32617, "epoch": 776} {"train_loss": -5.474701881408691, "global_step": 32618, "epoch": 776} {"train_loss": -5.454789161682129, "global_step": 32619, "epoch": 776} {"train_loss": -5.381328582763672, "global_step": 32620, "epoch": 776} {"train_loss": -5.553289413452148, "global_step": 32621, "epoch": 776} {"train_loss": -5.435870170593262, "global_step": 32622, "epoch": 776} {"train_loss": -5.3690080642700195, "global_step": 32623, "epoch": 776} {"train_loss": -5.656914710998535, "global_step": 32624, "epoch": 776} {"train_loss": -5.514409065246582, "global_step": 32625, "epoch": 776} {"train_loss": -5.4198408126831055, "global_step": 32626, "epoch": 776} {"train_loss": -5.458711624145508, "global_step": 32627, "epoch": 776} {"train_loss": -5.527495384216309, "global_step": 32628, "epoch": 776} {"train_loss": -5.498449325561523, "global_step": 32629, "epoch": 776} {"train_loss": -5.350732803344727, "global_step": 32630, "epoch": 776} {"train_loss": -5.5044145584106445, "global_step": 32631, "epoch": 776} {"train_loss": -5.631542205810547, "global_step": 32632, "epoch": 776} {"train_loss": -5.506419976552327, "global_step": 32633, "epoch": 776, "val_loss": 66757.53125} {"train_loss": -5.4829020500183105, "global_step": 32634, "epoch": 777} {"train_loss": -5.519225597381592, "global_step": 32635, "epoch": 777} {"train_loss": -5.403102874755859, "global_step": 32636, "epoch": 777} {"train_loss": -5.61605167388916, "global_step": 32637, "epoch": 777} {"train_loss": -5.555568695068359, "global_step": 32638, "epoch": 777} {"train_loss": -5.623540878295898, "global_step": 32639, "epoch": 777} {"train_loss": -5.557042121887207, "global_step": 32640, "epoch": 777} {"train_loss": -5.601097583770752, "global_step": 32641, "epoch": 777} {"train_loss": -5.556484222412109, "global_step": 32642, "epoch": 777} {"train_loss": -5.4648942947387695, "global_step": 32643, "epoch": 777} {"train_loss": -5.485428333282471, "global_step": 32644, "epoch": 777} {"train_loss": -5.453120231628418, "global_step": 32645, "epoch": 777} {"train_loss": -5.50733757019043, "global_step": 32646, "epoch": 777} {"train_loss": -5.523651123046875, "global_step": 32647, "epoch": 777} {"train_loss": -5.6315388679504395, "global_step": 32648, "epoch": 777} {"train_loss": -5.548645973205566, "global_step": 32649, "epoch": 777} {"train_loss": -5.548346042633057, "global_step": 32650, "epoch": 777} {"train_loss": -5.450787544250488, "global_step": 32651, "epoch": 777} {"train_loss": -5.478606224060059, "global_step": 32652, "epoch": 777} {"train_loss": -5.466940402984619, "global_step": 32653, "epoch": 777} {"train_loss": -5.513719081878662, "global_step": 32654, "epoch": 777} {"train_loss": -5.598782539367676, "global_step": 32655, "epoch": 777} {"train_loss": -5.51852560043335, "global_step": 32656, "epoch": 777} {"train_loss": -5.360734939575195, "global_step": 32657, "epoch": 777} {"train_loss": -5.528815269470215, "global_step": 32658, "epoch": 777} {"train_loss": -5.512001037597656, "global_step": 32659, "epoch": 777} {"train_loss": -5.5602264404296875, "global_step": 32660, "epoch": 777} {"train_loss": -5.5792555809021, "global_step": 32661, "epoch": 777} {"train_loss": -5.637036323547363, "global_step": 32662, "epoch": 777} {"train_loss": -5.586555004119873, "global_step": 32663, "epoch": 777} {"train_loss": -5.539706230163574, "global_step": 32664, "epoch": 777} {"train_loss": -5.4539713859558105, "global_step": 32665, "epoch": 777} {"train_loss": -5.570112228393555, "global_step": 32666, "epoch": 777} {"train_loss": -5.417782783508301, "global_step": 32667, "epoch": 777} {"train_loss": -5.564724922180176, "global_step": 32668, "epoch": 777} {"train_loss": -5.489072799682617, "global_step": 32669, "epoch": 777} {"train_loss": -5.574416160583496, "global_step": 32670, "epoch": 777} {"train_loss": -5.570908546447754, "global_step": 32671, "epoch": 777} {"train_loss": -5.399203300476074, "global_step": 32672, "epoch": 777} {"train_loss": -5.585594177246094, "global_step": 32673, "epoch": 777} {"train_loss": -5.486227989196777, "global_step": 32674, "epoch": 777} {"train_loss": -5.524688925061907, "global_step": 32675, "epoch": 777, "val_loss": 66465.4296875} {"train_loss": -5.399609565734863, "global_step": 32676, "epoch": 778} {"train_loss": -5.5753984451293945, "global_step": 32677, "epoch": 778} {"train_loss": -5.38183069229126, "global_step": 32678, "epoch": 778} {"train_loss": -5.430268287658691, "global_step": 32679, "epoch": 778} {"train_loss": -5.494907855987549, "global_step": 32680, "epoch": 778} {"train_loss": -5.449967384338379, "global_step": 32681, "epoch": 778} {"train_loss": -5.635312080383301, "global_step": 32682, "epoch": 778} {"train_loss": -5.601127624511719, "global_step": 32683, "epoch": 778} {"train_loss": -5.47125244140625, "global_step": 32684, "epoch": 778} {"train_loss": -5.575101852416992, "global_step": 32685, "epoch": 778} {"train_loss": -5.448097229003906, "global_step": 32686, "epoch": 778} {"train_loss": -5.244400978088379, "global_step": 32687, "epoch": 778} {"train_loss": -5.479063987731934, "global_step": 32688, "epoch": 778} {"train_loss": -5.5035247802734375, "global_step": 32689, "epoch": 778} {"train_loss": -5.517601013183594, "global_step": 32690, "epoch": 778} {"train_loss": -5.304303169250488, "global_step": 32691, "epoch": 778} {"train_loss": -5.482691287994385, "global_step": 32692, "epoch": 778} {"train_loss": -5.351624488830566, "global_step": 32693, "epoch": 778} {"train_loss": -5.574919700622559, "global_step": 32694, "epoch": 778} {"train_loss": -5.390937805175781, "global_step": 32695, "epoch": 778} {"train_loss": -5.476222991943359, "global_step": 32696, "epoch": 778} {"train_loss": -5.475752353668213, "global_step": 32697, "epoch": 778} {"train_loss": -5.500265598297119, "global_step": 32698, "epoch": 778} {"train_loss": -5.391161918640137, "global_step": 32699, "epoch": 778} {"train_loss": -5.394889831542969, "global_step": 32700, "epoch": 778} {"train_loss": -5.441683769226074, "global_step": 32701, "epoch": 778} {"train_loss": -5.498016357421875, "global_step": 32702, "epoch": 778} {"train_loss": -5.347113609313965, "global_step": 32703, "epoch": 778} {"train_loss": -5.430280685424805, "global_step": 32704, "epoch": 778} {"train_loss": -5.420506000518799, "global_step": 32705, "epoch": 778} {"train_loss": -5.4994425773620605, "global_step": 32706, "epoch": 778} {"train_loss": -5.564169883728027, "global_step": 32707, "epoch": 778} {"train_loss": -5.623433589935303, "global_step": 32708, "epoch": 778} {"train_loss": -5.5986785888671875, "global_step": 32709, "epoch": 778} {"train_loss": -5.5166120529174805, "global_step": 32710, "epoch": 778} {"train_loss": -5.487789154052734, "global_step": 32711, "epoch": 778} {"train_loss": -5.42549467086792, "global_step": 32712, "epoch": 778} {"train_loss": -5.415275573730469, "global_step": 32713, "epoch": 778} {"train_loss": -5.523706912994385, "global_step": 32714, "epoch": 778} {"train_loss": -5.519277095794678, "global_step": 32715, "epoch": 778} {"train_loss": -5.465523719787598, "global_step": 32716, "epoch": 778} {"train_loss": -5.474320286796207, "global_step": 32717, "epoch": 778, "val_loss": 67620.8671875} {"train_loss": -5.400272846221924, "global_step": 32718, "epoch": 779} {"train_loss": -5.46042013168335, "global_step": 32719, "epoch": 779} {"train_loss": -5.364223957061768, "global_step": 32720, "epoch": 779} {"train_loss": -5.443463325500488, "global_step": 32721, "epoch": 779} {"train_loss": -5.563844680786133, "global_step": 32722, "epoch": 779} {"train_loss": -5.412347793579102, "global_step": 32723, "epoch": 779} {"train_loss": -5.545083999633789, "global_step": 32724, "epoch": 779} {"train_loss": -5.526081085205078, "global_step": 32725, "epoch": 779} {"train_loss": -5.639963626861572, "global_step": 32726, "epoch": 779} {"train_loss": -5.536655902862549, "global_step": 32727, "epoch": 779} {"train_loss": -5.547360897064209, "global_step": 32728, "epoch": 779} {"train_loss": -5.548470973968506, "global_step": 32729, "epoch": 779} {"train_loss": -5.566108703613281, "global_step": 32730, "epoch": 779} {"train_loss": -5.5649871826171875, "global_step": 32731, "epoch": 779} {"train_loss": -5.557894706726074, "global_step": 32732, "epoch": 779} {"train_loss": -5.5133748054504395, "global_step": 32733, "epoch": 779} {"train_loss": -5.496369361877441, "global_step": 32734, "epoch": 779} {"train_loss": -5.526515007019043, "global_step": 32735, "epoch": 779} {"train_loss": -5.435272216796875, "global_step": 32736, "epoch": 779} {"train_loss": -5.5017194747924805, "global_step": 32737, "epoch": 779} {"train_loss": -5.441814422607422, "global_step": 32738, "epoch": 779} {"train_loss": -5.469367027282715, "global_step": 32739, "epoch": 779} {"train_loss": -5.5814619064331055, "global_step": 32740, "epoch": 779} {"train_loss": -5.5253400802612305, "global_step": 32741, "epoch": 779} {"train_loss": -5.499015808105469, "global_step": 32742, "epoch": 779} {"train_loss": -5.580978870391846, "global_step": 32743, "epoch": 779} {"train_loss": -5.538680076599121, "global_step": 32744, "epoch": 779} {"train_loss": -5.66510009765625, "global_step": 32745, "epoch": 779} {"train_loss": -5.609498023986816, "global_step": 32746, "epoch": 779} {"train_loss": -5.420366287231445, "global_step": 32747, "epoch": 779} {"train_loss": -5.473719596862793, "global_step": 32748, "epoch": 779} {"train_loss": -5.4946417808532715, "global_step": 32749, "epoch": 779} {"train_loss": -5.477777481079102, "global_step": 32750, "epoch": 779} {"train_loss": -5.430042743682861, "global_step": 32751, "epoch": 779} {"train_loss": -5.551414966583252, "global_step": 32752, "epoch": 779} {"train_loss": -5.563651084899902, "global_step": 32753, "epoch": 779} {"train_loss": -5.511671543121338, "global_step": 32754, "epoch": 779} {"train_loss": -5.571069717407227, "global_step": 32755, "epoch": 779} {"train_loss": -5.547577857971191, "global_step": 32756, "epoch": 779} {"train_loss": -5.379794597625732, "global_step": 32757, "epoch": 779} {"train_loss": -5.512589931488037, "global_step": 32758, "epoch": 779} {"train_loss": -5.511307330358596, "global_step": 32759, "epoch": 779, "val_loss": 66409.6875} {"train_loss": -5.455750465393066, "global_step": 32760, "epoch": 780} {"train_loss": -5.690485954284668, "global_step": 32761, "epoch": 780} {"train_loss": -5.513582229614258, "global_step": 32762, "epoch": 780} {"train_loss": -5.5619893074035645, "global_step": 32763, "epoch": 780} {"train_loss": -5.577716827392578, "global_step": 32764, "epoch": 780} {"train_loss": -5.63173246383667, "global_step": 32765, "epoch": 780} {"train_loss": -5.6491923332214355, "global_step": 32766, "epoch": 780} {"train_loss": -5.601238250732422, "global_step": 32767, "epoch": 780} {"train_loss": -5.549807548522949, "global_step": 32768, "epoch": 780} {"train_loss": -5.632851600646973, "global_step": 32769, "epoch": 780} {"train_loss": -5.429819107055664, "global_step": 32770, "epoch": 780} {"train_loss": -5.532896041870117, "global_step": 32771, "epoch": 780} {"train_loss": -5.490668296813965, "global_step": 32772, "epoch": 780} {"train_loss": -5.684391021728516, "global_step": 32773, "epoch": 780} {"train_loss": -5.598231315612793, "global_step": 32774, "epoch": 780} {"train_loss": -5.560619354248047, "global_step": 32775, "epoch": 780} {"train_loss": -5.374581336975098, "global_step": 32776, "epoch": 780} {"train_loss": -5.398143291473389, "global_step": 32777, "epoch": 780} {"train_loss": -5.486087322235107, "global_step": 32778, "epoch": 780} {"train_loss": -5.567165374755859, "global_step": 32779, "epoch": 780} {"train_loss": -5.411857604980469, "global_step": 32780, "epoch": 780} {"train_loss": -5.553292274475098, "global_step": 32781, "epoch": 780} {"train_loss": -5.493577003479004, "global_step": 32782, "epoch": 780} {"train_loss": -5.448807716369629, "global_step": 32783, "epoch": 780} {"train_loss": -5.598704814910889, "global_step": 32784, "epoch": 780} {"train_loss": -5.418235778808594, "global_step": 32785, "epoch": 780} {"train_loss": -5.418083667755127, "global_step": 32786, "epoch": 780} {"train_loss": -5.476067543029785, "global_step": 32787, "epoch": 780} {"train_loss": -5.341639518737793, "global_step": 32788, "epoch": 780} {"train_loss": -5.344734191894531, "global_step": 32789, "epoch": 780} {"train_loss": -5.516777038574219, "global_step": 32790, "epoch": 780} {"train_loss": -5.479840278625488, "global_step": 32791, "epoch": 780} {"train_loss": -5.571290969848633, "global_step": 32792, "epoch": 780} {"train_loss": -5.558974742889404, "global_step": 32793, "epoch": 780} {"train_loss": -5.488183975219727, "global_step": 32794, "epoch": 780} {"train_loss": -5.6107354164123535, "global_step": 32795, "epoch": 780} {"train_loss": -5.517607688903809, "global_step": 32796, "epoch": 780} {"train_loss": -5.586095809936523, "global_step": 32797, "epoch": 780} {"train_loss": -5.44670295715332, "global_step": 32798, "epoch": 780} {"train_loss": -5.565279006958008, "global_step": 32799, "epoch": 780} {"train_loss": -5.5159101486206055, "global_step": 32800, "epoch": 780} {"train_loss": -5.52162260100955, "global_step": 32801, "epoch": 780, "val_loss": 66464.8046875} {"train_loss": -5.533000469207764, "global_step": 32802, "epoch": 781} {"train_loss": -5.576346397399902, "global_step": 32803, "epoch": 781} {"train_loss": -5.633967399597168, "global_step": 32804, "epoch": 781} {"train_loss": -5.521994113922119, "global_step": 32805, "epoch": 781} {"train_loss": -5.5403289794921875, "global_step": 32806, "epoch": 781} {"train_loss": -5.653956890106201, "global_step": 32807, "epoch": 781} {"train_loss": -5.536263465881348, "global_step": 32808, "epoch": 781} {"train_loss": -5.638550758361816, "global_step": 32809, "epoch": 781} {"train_loss": -5.617932319641113, "global_step": 32810, "epoch": 781} {"train_loss": -5.550758361816406, "global_step": 32811, "epoch": 781} {"train_loss": -5.568258285522461, "global_step": 32812, "epoch": 781} {"train_loss": -5.542259216308594, "global_step": 32813, "epoch": 781} {"train_loss": -5.638410568237305, "global_step": 32814, "epoch": 781} {"train_loss": -5.476152420043945, "global_step": 32815, "epoch": 781} {"train_loss": -5.662936210632324, "global_step": 32816, "epoch": 781} {"train_loss": -5.54752254486084, "global_step": 32817, "epoch": 781} {"train_loss": -5.519351959228516, "global_step": 32818, "epoch": 781} {"train_loss": -5.504016876220703, "global_step": 32819, "epoch": 781} {"train_loss": -5.4719953536987305, "global_step": 32820, "epoch": 781} {"train_loss": -5.501492023468018, "global_step": 32821, "epoch": 781} {"train_loss": -5.550275802612305, "global_step": 32822, "epoch": 781} {"train_loss": -5.50972843170166, "global_step": 32823, "epoch": 781} {"train_loss": -5.352304458618164, "global_step": 32824, "epoch": 781} {"train_loss": -5.504714488983154, "global_step": 32825, "epoch": 781} {"train_loss": -5.483553886413574, "global_step": 32826, "epoch": 781} {"train_loss": -5.523597240447998, "global_step": 32827, "epoch": 781} {"train_loss": -5.484063148498535, "global_step": 32828, "epoch": 781} {"train_loss": -5.514134883880615, "global_step": 32829, "epoch": 781} {"train_loss": -5.461973190307617, "global_step": 32830, "epoch": 781} {"train_loss": -5.45101261138916, "global_step": 32831, "epoch": 781} {"train_loss": -5.519761085510254, "global_step": 32832, "epoch": 781} {"train_loss": -5.423707962036133, "global_step": 32833, "epoch": 781} {"train_loss": -5.602730751037598, "global_step": 32834, "epoch": 781} {"train_loss": -5.528659343719482, "global_step": 32835, "epoch": 781} {"train_loss": -5.577234745025635, "global_step": 32836, "epoch": 781} {"train_loss": -5.477081775665283, "global_step": 32837, "epoch": 781} {"train_loss": -5.327263355255127, "global_step": 32838, "epoch": 781} {"train_loss": -5.587832450866699, "global_step": 32839, "epoch": 781} {"train_loss": -5.610675811767578, "global_step": 32840, "epoch": 781} {"train_loss": -5.539173126220703, "global_step": 32841, "epoch": 781} {"train_loss": -5.454812049865723, "global_step": 32842, "epoch": 781} {"train_loss": -5.530265785398937, "global_step": 32843, "epoch": 781, "val_loss": 66593.734375} {"train_loss": -5.583671569824219, "global_step": 32844, "epoch": 782} {"train_loss": -5.471277236938477, "global_step": 32845, "epoch": 782} {"train_loss": -5.667109966278076, "global_step": 32846, "epoch": 782} {"train_loss": -5.574510097503662, "global_step": 32847, "epoch": 782} {"train_loss": -5.600109100341797, "global_step": 32848, "epoch": 782} {"train_loss": -5.385457992553711, "global_step": 32849, "epoch": 782} {"train_loss": -5.4700422286987305, "global_step": 32850, "epoch": 782} {"train_loss": -5.522675037384033, "global_step": 32851, "epoch": 782} {"train_loss": -5.430528163909912, "global_step": 32852, "epoch": 782} {"train_loss": -5.629125595092773, "global_step": 32853, "epoch": 782} {"train_loss": -5.487781524658203, "global_step": 32854, "epoch": 782} {"train_loss": -5.521230697631836, "global_step": 32855, "epoch": 782} {"train_loss": -5.539648056030273, "global_step": 32856, "epoch": 782} {"train_loss": -5.488803863525391, "global_step": 32857, "epoch": 782} {"train_loss": -5.364182949066162, "global_step": 32858, "epoch": 782} {"train_loss": -5.562250137329102, "global_step": 32859, "epoch": 782} {"train_loss": -5.473715782165527, "global_step": 32860, "epoch": 782} {"train_loss": -5.532106399536133, "global_step": 32861, "epoch": 782} {"train_loss": -5.475839614868164, "global_step": 32862, "epoch": 782} {"train_loss": -5.427375793457031, "global_step": 32863, "epoch": 782} {"train_loss": -5.47175407409668, "global_step": 32864, "epoch": 782} {"train_loss": -5.506331443786621, "global_step": 32865, "epoch": 782} {"train_loss": -5.457400798797607, "global_step": 32866, "epoch": 782} {"train_loss": -5.488590240478516, "global_step": 32867, "epoch": 782} {"train_loss": -5.567837238311768, "global_step": 32868, "epoch": 782} {"train_loss": -5.537016868591309, "global_step": 32869, "epoch": 782} {"train_loss": -5.6070756912231445, "global_step": 32870, "epoch": 782} {"train_loss": -5.621770858764648, "global_step": 32871, "epoch": 782} {"train_loss": -5.576543807983398, "global_step": 32872, "epoch": 782} {"train_loss": -5.479828834533691, "global_step": 32873, "epoch": 782} {"train_loss": -5.488440036773682, "global_step": 32874, "epoch": 782} {"train_loss": -5.539461135864258, "global_step": 32875, "epoch": 782} {"train_loss": -5.444731712341309, "global_step": 32876, "epoch": 782} {"train_loss": -5.62149715423584, "global_step": 32877, "epoch": 782} {"train_loss": -5.549560546875, "global_step": 32878, "epoch": 782} {"train_loss": -5.470136642456055, "global_step": 32879, "epoch": 782} {"train_loss": -5.445990562438965, "global_step": 32880, "epoch": 782} {"train_loss": -5.443117618560791, "global_step": 32881, "epoch": 782} {"train_loss": -5.653675556182861, "global_step": 32882, "epoch": 782} {"train_loss": -5.5141096115112305, "global_step": 32883, "epoch": 782} {"train_loss": -5.585735321044922, "global_step": 32884, "epoch": 782} {"train_loss": -5.519936152866909, "global_step": 32885, "epoch": 782, "val_loss": 67204.0859375} {"train_loss": -5.417356967926025, "global_step": 32886, "epoch": 783} {"train_loss": -5.518583297729492, "global_step": 32887, "epoch": 783} {"train_loss": -5.586153030395508, "global_step": 32888, "epoch": 783} {"train_loss": -5.504103660583496, "global_step": 32889, "epoch": 783} {"train_loss": -5.643683433532715, "global_step": 32890, "epoch": 783} {"train_loss": -5.62691068649292, "global_step": 32891, "epoch": 783} {"train_loss": -5.643301486968994, "global_step": 32892, "epoch": 783} {"train_loss": -5.518198013305664, "global_step": 32893, "epoch": 783} {"train_loss": -5.437530517578125, "global_step": 32894, "epoch": 783} {"train_loss": -5.64042854309082, "global_step": 32895, "epoch": 783} {"train_loss": -5.535996913909912, "global_step": 32896, "epoch": 783} {"train_loss": -5.5606584548950195, "global_step": 32897, "epoch": 783} {"train_loss": -5.5993547439575195, "global_step": 32898, "epoch": 783} {"train_loss": -5.474505424499512, "global_step": 32899, "epoch": 783} {"train_loss": -5.571293354034424, "global_step": 32900, "epoch": 783} {"train_loss": -5.529665946960449, "global_step": 32901, "epoch": 783} {"train_loss": -5.470639228820801, "global_step": 32902, "epoch": 783} {"train_loss": -5.601848602294922, "global_step": 32903, "epoch": 783} {"train_loss": -5.557551383972168, "global_step": 32904, "epoch": 783} {"train_loss": -5.456301212310791, "global_step": 32905, "epoch": 783} {"train_loss": -5.405248641967773, "global_step": 32906, "epoch": 783} {"train_loss": -5.461695671081543, "global_step": 32907, "epoch": 783} {"train_loss": -5.504725456237793, "global_step": 32908, "epoch": 783} {"train_loss": -5.4277191162109375, "global_step": 32909, "epoch": 783} {"train_loss": -5.5544114112854, "global_step": 32910, "epoch": 783} {"train_loss": -5.536110877990723, "global_step": 32911, "epoch": 783} {"train_loss": -5.523980617523193, "global_step": 32912, "epoch": 783} {"train_loss": -5.525732040405273, "global_step": 32913, "epoch": 783} {"train_loss": -5.50161075592041, "global_step": 32914, "epoch": 783} {"train_loss": -5.5444135665893555, "global_step": 32915, "epoch": 783} {"train_loss": -5.508655071258545, "global_step": 32916, "epoch": 783} {"train_loss": -5.4608049392700195, "global_step": 32917, "epoch": 783} {"train_loss": -5.506553649902344, "global_step": 32918, "epoch": 783} {"train_loss": -5.429591655731201, "global_step": 32919, "epoch": 783} {"train_loss": -5.5246357917785645, "global_step": 32920, "epoch": 783} {"train_loss": -5.446826457977295, "global_step": 32921, "epoch": 783} {"train_loss": -5.5736188888549805, "global_step": 32922, "epoch": 783} {"train_loss": -5.4182329177856445, "global_step": 32923, "epoch": 783} {"train_loss": -5.5021586418151855, "global_step": 32924, "epoch": 783} {"train_loss": -5.542670726776123, "global_step": 32925, "epoch": 783} {"train_loss": -5.549210071563721, "global_step": 32926, "epoch": 783} {"train_loss": -5.516342208499, "global_step": 32927, "epoch": 783, "val_loss": 66773.3984375} {"train_loss": -5.4496541023254395, "global_step": 32928, "epoch": 784} {"train_loss": -5.642637729644775, "global_step": 32929, "epoch": 784} {"train_loss": -5.514847755432129, "global_step": 32930, "epoch": 784} {"train_loss": -5.436971187591553, "global_step": 32931, "epoch": 784} {"train_loss": -5.495052337646484, "global_step": 32932, "epoch": 784} {"train_loss": -5.591575622558594, "global_step": 32933, "epoch": 784} {"train_loss": -5.432819366455078, "global_step": 32934, "epoch": 784} {"train_loss": -5.561720848083496, "global_step": 32935, "epoch": 784} {"train_loss": -5.480196952819824, "global_step": 32936, "epoch": 784} {"train_loss": -5.630374908447266, "global_step": 32937, "epoch": 784} {"train_loss": -5.51039981842041, "global_step": 32938, "epoch": 784} {"train_loss": -5.443511962890625, "global_step": 32939, "epoch": 784} {"train_loss": -5.495983123779297, "global_step": 32940, "epoch": 784} {"train_loss": -5.535365104675293, "global_step": 32941, "epoch": 784} {"train_loss": -5.579100608825684, "global_step": 32942, "epoch": 784} {"train_loss": -5.491671562194824, "global_step": 32943, "epoch": 784} {"train_loss": -5.465825080871582, "global_step": 32944, "epoch": 784} {"train_loss": -5.371089935302734, "global_step": 32945, "epoch": 784} {"train_loss": -5.473886966705322, "global_step": 32946, "epoch": 784} {"train_loss": -5.442438125610352, "global_step": 32947, "epoch": 784} {"train_loss": -5.532771110534668, "global_step": 32948, "epoch": 784} {"train_loss": -5.473028659820557, "global_step": 32949, "epoch": 784} {"train_loss": -5.5292439460754395, "global_step": 32950, "epoch": 784} {"train_loss": -5.547279357910156, "global_step": 32951, "epoch": 784} {"train_loss": -5.619407653808594, "global_step": 32952, "epoch": 784} {"train_loss": -5.469865798950195, "global_step": 32953, "epoch": 784} {"train_loss": -5.4126152992248535, "global_step": 32954, "epoch": 784} {"train_loss": -5.6227126121521, "global_step": 32955, "epoch": 784} {"train_loss": -5.537574768066406, "global_step": 32956, "epoch": 784} {"train_loss": -5.434470176696777, "global_step": 32957, "epoch": 784} {"train_loss": -5.729458808898926, "global_step": 32958, "epoch": 784} {"train_loss": -5.499383926391602, "global_step": 32959, "epoch": 784} {"train_loss": -5.454928874969482, "global_step": 32960, "epoch": 784} {"train_loss": -5.550618648529053, "global_step": 32961, "epoch": 784} {"train_loss": -5.481740951538086, "global_step": 32962, "epoch": 784} {"train_loss": -5.655910015106201, "global_step": 32963, "epoch": 784} {"train_loss": -5.517236709594727, "global_step": 32964, "epoch": 784} {"train_loss": -5.45809268951416, "global_step": 32965, "epoch": 784} {"train_loss": -5.642327308654785, "global_step": 32966, "epoch": 784} {"train_loss": -5.472474575042725, "global_step": 32967, "epoch": 784} {"train_loss": -5.471307754516602, "global_step": 32968, "epoch": 784} {"train_loss": -5.517230033874512, "global_step": 32969, "epoch": 784, "val_loss": 66525.328125} {"train_loss": -5.388671875, "global_step": 32970, "epoch": 785} {"train_loss": -5.617691993713379, "global_step": 32971, "epoch": 785} {"train_loss": -5.505123138427734, "global_step": 32972, "epoch": 785} {"train_loss": -5.520482063293457, "global_step": 32973, "epoch": 785} {"train_loss": -5.4675750732421875, "global_step": 32974, "epoch": 785} {"train_loss": -5.506292819976807, "global_step": 32975, "epoch": 785} {"train_loss": -5.458854675292969, "global_step": 32976, "epoch": 785} {"train_loss": -5.541971683502197, "global_step": 32977, "epoch": 785} {"train_loss": -5.6260986328125, "global_step": 32978, "epoch": 785} {"train_loss": -5.559488296508789, "global_step": 32979, "epoch": 785} {"train_loss": -5.5361433029174805, "global_step": 32980, "epoch": 785} {"train_loss": -5.476616859436035, "global_step": 32981, "epoch": 785} {"train_loss": -5.604327201843262, "global_step": 32982, "epoch": 785} {"train_loss": -5.542422294616699, "global_step": 32983, "epoch": 785} {"train_loss": -5.604037761688232, "global_step": 32984, "epoch": 785} {"train_loss": -5.522756576538086, "global_step": 32985, "epoch": 785} {"train_loss": -5.392745018005371, "global_step": 32986, "epoch": 785} {"train_loss": -5.337518692016602, "global_step": 32987, "epoch": 785} {"train_loss": -5.479537487030029, "global_step": 32988, "epoch": 785} {"train_loss": -5.49509859085083, "global_step": 32989, "epoch": 785} {"train_loss": -5.48248291015625, "global_step": 32990, "epoch": 785} {"train_loss": -5.513456344604492, "global_step": 32991, "epoch": 785} {"train_loss": -5.358199596405029, "global_step": 32992, "epoch": 785} {"train_loss": -5.471928596496582, "global_step": 32993, "epoch": 785} {"train_loss": -5.411214828491211, "global_step": 32994, "epoch": 785} {"train_loss": -5.585760593414307, "global_step": 32995, "epoch": 785} {"train_loss": -5.45340633392334, "global_step": 32996, "epoch": 785} {"train_loss": -5.406214714050293, "global_step": 32997, "epoch": 785} {"train_loss": -5.586766242980957, "global_step": 32998, "epoch": 785} {"train_loss": -5.372782230377197, "global_step": 32999, "epoch": 785} {"train_loss": -5.520699501037598, "global_step": 33000, "epoch": 785} {"train_loss": -5.421853065490723, "global_step": 33001, "epoch": 785} {"train_loss": -5.50529670715332, "global_step": 33002, "epoch": 785} {"train_loss": -5.430337905883789, "global_step": 33003, "epoch": 785} {"train_loss": -5.440796375274658, "global_step": 33004, "epoch": 785} {"train_loss": -5.567564010620117, "global_step": 33005, "epoch": 785} {"train_loss": -5.484661102294922, "global_step": 33006, "epoch": 785} {"train_loss": -5.510515213012695, "global_step": 33007, "epoch": 785} {"train_loss": -5.583714485168457, "global_step": 33008, "epoch": 785} {"train_loss": -5.440439224243164, "global_step": 33009, "epoch": 785} {"train_loss": -5.459444999694824, "global_step": 33010, "epoch": 785} {"train_loss": -5.490668796357655, "global_step": 33011, "epoch": 785, "val_loss": 66613.109375} {"train_loss": -5.547475814819336, "global_step": 33012, "epoch": 786} {"train_loss": -5.468532562255859, "global_step": 33013, "epoch": 786} {"train_loss": -5.535483360290527, "global_step": 33014, "epoch": 786} {"train_loss": -5.505936622619629, "global_step": 33015, "epoch": 786} {"train_loss": -5.415278434753418, "global_step": 33016, "epoch": 786} {"train_loss": -5.505841255187988, "global_step": 33017, "epoch": 786} {"train_loss": -5.47219705581665, "global_step": 33018, "epoch": 786} {"train_loss": -5.579026222229004, "global_step": 33019, "epoch": 786} {"train_loss": -5.572629451751709, "global_step": 33020, "epoch": 786} {"train_loss": -5.488332748413086, "global_step": 33021, "epoch": 786} {"train_loss": -5.73194694519043, "global_step": 33022, "epoch": 786} {"train_loss": -5.4841718673706055, "global_step": 33023, "epoch": 786} {"train_loss": -5.472777366638184, "global_step": 33024, "epoch": 786} {"train_loss": -5.53459358215332, "global_step": 33025, "epoch": 786} {"train_loss": -5.631052017211914, "global_step": 33026, "epoch": 786} {"train_loss": -5.555551052093506, "global_step": 33027, "epoch": 786} {"train_loss": -5.522408962249756, "global_step": 33028, "epoch": 786} {"train_loss": -5.426120758056641, "global_step": 33029, "epoch": 786} {"train_loss": -5.518373966217041, "global_step": 33030, "epoch": 786} {"train_loss": -5.431928634643555, "global_step": 33031, "epoch": 786} {"train_loss": -5.56957483291626, "global_step": 33032, "epoch": 786} {"train_loss": -5.490897178649902, "global_step": 33033, "epoch": 786} {"train_loss": -5.56187105178833, "global_step": 33034, "epoch": 786} {"train_loss": -5.511386871337891, "global_step": 33035, "epoch": 786} {"train_loss": -5.395173072814941, "global_step": 33036, "epoch": 786} {"train_loss": -5.507229804992676, "global_step": 33037, "epoch": 786} {"train_loss": -5.505534648895264, "global_step": 33038, "epoch": 786} {"train_loss": -5.607168674468994, "global_step": 33039, "epoch": 786} {"train_loss": -5.534929275512695, "global_step": 33040, "epoch": 786} {"train_loss": -5.426717281341553, "global_step": 33041, "epoch": 786} {"train_loss": -5.560525417327881, "global_step": 33042, "epoch": 786} {"train_loss": -5.57900857925415, "global_step": 33043, "epoch": 786} {"train_loss": -5.515066623687744, "global_step": 33044, "epoch": 786} {"train_loss": -5.60610818862915, "global_step": 33045, "epoch": 786} {"train_loss": -5.603769302368164, "global_step": 33046, "epoch": 786} {"train_loss": -5.572563171386719, "global_step": 33047, "epoch": 786} {"train_loss": -5.579281330108643, "global_step": 33048, "epoch": 786} {"train_loss": -5.530210494995117, "global_step": 33049, "epoch": 786} {"train_loss": -5.635965347290039, "global_step": 33050, "epoch": 786} {"train_loss": -5.4599409103393555, "global_step": 33051, "epoch": 786} {"train_loss": -5.389608860015869, "global_step": 33052, "epoch": 786} {"train_loss": -5.524860030128842, "global_step": 33053, "epoch": 786, "val_loss": 66749.953125} {"train_loss": -5.364175319671631, "global_step": 33054, "epoch": 787} {"train_loss": -5.429888725280762, "global_step": 33055, "epoch": 787} {"train_loss": -5.451902389526367, "global_step": 33056, "epoch": 787} {"train_loss": -5.553814888000488, "global_step": 33057, "epoch": 787} {"train_loss": -5.477490425109863, "global_step": 33058, "epoch": 787} {"train_loss": -5.357388496398926, "global_step": 33059, "epoch": 787} {"train_loss": -5.352945327758789, "global_step": 33060, "epoch": 787} {"train_loss": -5.399440288543701, "global_step": 33061, "epoch": 787} {"train_loss": -5.410358428955078, "global_step": 33062, "epoch": 787} {"train_loss": -5.437716484069824, "global_step": 33063, "epoch": 787} {"train_loss": -5.356596946716309, "global_step": 33064, "epoch": 787} {"train_loss": -5.479964256286621, "global_step": 33065, "epoch": 787} {"train_loss": -5.493006706237793, "global_step": 33066, "epoch": 787} {"train_loss": -5.451314449310303, "global_step": 33067, "epoch": 787} {"train_loss": -5.422402381896973, "global_step": 33068, "epoch": 787} {"train_loss": -5.441336631774902, "global_step": 33069, "epoch": 787} {"train_loss": -5.495975971221924, "global_step": 33070, "epoch": 787} {"train_loss": -5.546755313873291, "global_step": 33071, "epoch": 787} {"train_loss": -5.4327592849731445, "global_step": 33072, "epoch": 787} {"train_loss": -5.5475850105285645, "global_step": 33073, "epoch": 787} {"train_loss": -5.579638481140137, "global_step": 33074, "epoch": 787} {"train_loss": -5.496004104614258, "global_step": 33075, "epoch": 787} {"train_loss": -5.4882941246032715, "global_step": 33076, "epoch": 787} {"train_loss": -5.468149662017822, "global_step": 33077, "epoch": 787} {"train_loss": -5.425797462463379, "global_step": 33078, "epoch": 787} {"train_loss": -5.5272908210754395, "global_step": 33079, "epoch": 787} {"train_loss": -5.512363910675049, "global_step": 33080, "epoch": 787} {"train_loss": -5.502697944641113, "global_step": 33081, "epoch": 787} {"train_loss": -5.618435859680176, "global_step": 33082, "epoch": 787} {"train_loss": -5.3876142501831055, "global_step": 33083, "epoch": 787} {"train_loss": -5.603355884552002, "global_step": 33084, "epoch": 787} {"train_loss": -5.400524139404297, "global_step": 33085, "epoch": 787} {"train_loss": -5.509400367736816, "global_step": 33086, "epoch": 787} {"train_loss": -5.541265964508057, "global_step": 33087, "epoch": 787} {"train_loss": -5.527293682098389, "global_step": 33088, "epoch": 787} {"train_loss": -5.6390533447265625, "global_step": 33089, "epoch": 787} {"train_loss": -5.550112724304199, "global_step": 33090, "epoch": 787} {"train_loss": -5.4694976806640625, "global_step": 33091, "epoch": 787} {"train_loss": -5.482203483581543, "global_step": 33092, "epoch": 787} {"train_loss": -5.4708123207092285, "global_step": 33093, "epoch": 787} {"train_loss": -5.645303726196289, "global_step": 33094, "epoch": 787} {"train_loss": -5.481637580054147, "global_step": 33095, "epoch": 787, "val_loss": 66843.875} {"train_loss": -5.493631362915039, "global_step": 33096, "epoch": 788} {"train_loss": -5.566686630249023, "global_step": 33097, "epoch": 788} {"train_loss": -5.478808403015137, "global_step": 33098, "epoch": 788} {"train_loss": -5.504859447479248, "global_step": 33099, "epoch": 788} {"train_loss": -5.499556541442871, "global_step": 33100, "epoch": 788} {"train_loss": -5.585439682006836, "global_step": 33101, "epoch": 788} {"train_loss": -5.463499069213867, "global_step": 33102, "epoch": 788} {"train_loss": -5.5472612380981445, "global_step": 33103, "epoch": 788} {"train_loss": -5.576745986938477, "global_step": 33104, "epoch": 788} {"train_loss": -5.522197723388672, "global_step": 33105, "epoch": 788} {"train_loss": -5.5237650871276855, "global_step": 33106, "epoch": 788} {"train_loss": -5.526922225952148, "global_step": 33107, "epoch": 788} {"train_loss": -5.455203056335449, "global_step": 33108, "epoch": 788} {"train_loss": -5.493790626525879, "global_step": 33109, "epoch": 788} {"train_loss": -5.51059627532959, "global_step": 33110, "epoch": 788} {"train_loss": -5.5407257080078125, "global_step": 33111, "epoch": 788} {"train_loss": -5.490181922912598, "global_step": 33112, "epoch": 788} {"train_loss": -5.460594654083252, "global_step": 33113, "epoch": 788} {"train_loss": -5.562835216522217, "global_step": 33114, "epoch": 788} {"train_loss": -5.340723037719727, "global_step": 33115, "epoch": 788} {"train_loss": -5.572707176208496, "global_step": 33116, "epoch": 788} {"train_loss": -5.426364898681641, "global_step": 33117, "epoch": 788} {"train_loss": -5.472582817077637, "global_step": 33118, "epoch": 788} {"train_loss": -5.512886047363281, "global_step": 33119, "epoch": 788} {"train_loss": -5.551517486572266, "global_step": 33120, "epoch": 788} {"train_loss": -5.597796440124512, "global_step": 33121, "epoch": 788} {"train_loss": -5.604393482208252, "global_step": 33122, "epoch": 788} {"train_loss": -5.590867042541504, "global_step": 33123, "epoch": 788} {"train_loss": -5.563010215759277, "global_step": 33124, "epoch": 788} {"train_loss": -5.429784774780273, "global_step": 33125, "epoch": 788} {"train_loss": -5.561785697937012, "global_step": 33126, "epoch": 788} {"train_loss": -5.527471542358398, "global_step": 33127, "epoch": 788} {"train_loss": -5.530410289764404, "global_step": 33128, "epoch": 788} {"train_loss": -5.427127361297607, "global_step": 33129, "epoch": 788} {"train_loss": -5.501808166503906, "global_step": 33130, "epoch": 788} {"train_loss": -5.610406398773193, "global_step": 33131, "epoch": 788} {"train_loss": -5.579115867614746, "global_step": 33132, "epoch": 788} {"train_loss": -5.505342483520508, "global_step": 33133, "epoch": 788} {"train_loss": -5.447845458984375, "global_step": 33134, "epoch": 788} {"train_loss": -5.603744983673096, "global_step": 33135, "epoch": 788} {"train_loss": -5.534876823425293, "global_step": 33136, "epoch": 788} {"train_loss": -5.520518836520967, "global_step": 33137, "epoch": 788, "val_loss": 66394.2890625} {"train_loss": -5.571837425231934, "global_step": 33138, "epoch": 789} {"train_loss": -5.494198799133301, "global_step": 33139, "epoch": 789} {"train_loss": -5.572579860687256, "global_step": 33140, "epoch": 789} {"train_loss": -5.560788154602051, "global_step": 33141, "epoch": 789} {"train_loss": -5.508615493774414, "global_step": 33142, "epoch": 789} {"train_loss": -5.550570964813232, "global_step": 33143, "epoch": 789} {"train_loss": -5.694395065307617, "global_step": 33144, "epoch": 789} {"train_loss": -5.516609191894531, "global_step": 33145, "epoch": 789} {"train_loss": -5.554216384887695, "global_step": 33146, "epoch": 789} {"train_loss": -5.559305191040039, "global_step": 33147, "epoch": 789} {"train_loss": -5.63592004776001, "global_step": 33148, "epoch": 789} {"train_loss": -5.390376567840576, "global_step": 33149, "epoch": 789} {"train_loss": -5.599662780761719, "global_step": 33150, "epoch": 789} {"train_loss": -5.506795883178711, "global_step": 33151, "epoch": 789} {"train_loss": -5.366000175476074, "global_step": 33152, "epoch": 789} {"train_loss": -5.583957672119141, "global_step": 33153, "epoch": 789} {"train_loss": -5.576959609985352, "global_step": 33154, "epoch": 789} {"train_loss": -5.557422161102295, "global_step": 33155, "epoch": 789} {"train_loss": -5.494318962097168, "global_step": 33156, "epoch": 789} {"train_loss": -5.667346000671387, "global_step": 33157, "epoch": 789} {"train_loss": -5.4992828369140625, "global_step": 33158, "epoch": 789} {"train_loss": -5.5210418701171875, "global_step": 33159, "epoch": 789} {"train_loss": -5.571531772613525, "global_step": 33160, "epoch": 789} {"train_loss": -5.586032390594482, "global_step": 33161, "epoch": 789} {"train_loss": -5.5425872802734375, "global_step": 33162, "epoch": 789} {"train_loss": -5.435527324676514, "global_step": 33163, "epoch": 789} {"train_loss": -5.435051441192627, "global_step": 33164, "epoch": 789} {"train_loss": -5.509987831115723, "global_step": 33165, "epoch": 789} {"train_loss": -5.6136980056762695, "global_step": 33166, "epoch": 789} {"train_loss": -5.492654323577881, "global_step": 33167, "epoch": 789} {"train_loss": -5.4712653160095215, "global_step": 33168, "epoch": 789} {"train_loss": -5.524589538574219, "global_step": 33169, "epoch": 789} {"train_loss": -5.4640793800354, "global_step": 33170, "epoch": 789} {"train_loss": -5.471676826477051, "global_step": 33171, "epoch": 789} {"train_loss": -5.570462226867676, "global_step": 33172, "epoch": 789} {"train_loss": -5.34272575378418, "global_step": 33173, "epoch": 789} {"train_loss": -5.504410743713379, "global_step": 33174, "epoch": 789} {"train_loss": -5.678894996643066, "global_step": 33175, "epoch": 789} {"train_loss": -5.425595760345459, "global_step": 33176, "epoch": 789} {"train_loss": -5.5059428215026855, "global_step": 33177, "epoch": 789} {"train_loss": -5.507990837097168, "global_step": 33178, "epoch": 789} {"train_loss": -5.525540465400333, "global_step": 33179, "epoch": 789, "val_loss": 66569.15625} {"train_loss": -5.440725803375244, "global_step": 33180, "epoch": 790} {"train_loss": -5.442890167236328, "global_step": 33181, "epoch": 790} {"train_loss": -5.494680881500244, "global_step": 33182, "epoch": 790} {"train_loss": -5.428066253662109, "global_step": 33183, "epoch": 790} {"train_loss": -5.590518951416016, "global_step": 33184, "epoch": 790} {"train_loss": -5.470242500305176, "global_step": 33185, "epoch": 790} {"train_loss": -5.409659385681152, "global_step": 33186, "epoch": 790} {"train_loss": -5.433305740356445, "global_step": 33187, "epoch": 790} {"train_loss": -5.482219696044922, "global_step": 33188, "epoch": 790} {"train_loss": -5.455813407897949, "global_step": 33189, "epoch": 790} {"train_loss": -5.4817094802856445, "global_step": 33190, "epoch": 790} {"train_loss": -5.438758850097656, "global_step": 33191, "epoch": 790} {"train_loss": -5.500341415405273, "global_step": 33192, "epoch": 790} {"train_loss": -5.411947250366211, "global_step": 33193, "epoch": 790} {"train_loss": -5.425176620483398, "global_step": 33194, "epoch": 790} {"train_loss": -5.545101165771484, "global_step": 33195, "epoch": 790} {"train_loss": -5.45414924621582, "global_step": 33196, "epoch": 790} {"train_loss": -5.69268798828125, "global_step": 33197, "epoch": 790} {"train_loss": -5.555682182312012, "global_step": 33198, "epoch": 790} {"train_loss": -5.524844169616699, "global_step": 33199, "epoch": 790} {"train_loss": -5.579399108886719, "global_step": 33200, "epoch": 790} {"train_loss": -5.492631912231445, "global_step": 33201, "epoch": 790} {"train_loss": -5.487379550933838, "global_step": 33202, "epoch": 790} {"train_loss": -5.5449419021606445, "global_step": 33203, "epoch": 790} {"train_loss": -5.4375152587890625, "global_step": 33204, "epoch": 790} {"train_loss": -5.46751594543457, "global_step": 33205, "epoch": 790} {"train_loss": -5.506291389465332, "global_step": 33206, "epoch": 790} {"train_loss": -5.669467926025391, "global_step": 33207, "epoch": 790} {"train_loss": -5.498812198638916, "global_step": 33208, "epoch": 790} {"train_loss": -5.432001113891602, "global_step": 33209, "epoch": 790} {"train_loss": -5.601828575134277, "global_step": 33210, "epoch": 790} {"train_loss": -5.620336532592773, "global_step": 33211, "epoch": 790} {"train_loss": -5.5793962478637695, "global_step": 33212, "epoch": 790} {"train_loss": -5.391897201538086, "global_step": 33213, "epoch": 790} {"train_loss": -5.497761249542236, "global_step": 33214, "epoch": 790} {"train_loss": -5.400300979614258, "global_step": 33215, "epoch": 790} {"train_loss": -5.58595085144043, "global_step": 33216, "epoch": 790} {"train_loss": -5.64933967590332, "global_step": 33217, "epoch": 790} {"train_loss": -5.567431449890137, "global_step": 33218, "epoch": 790} {"train_loss": -5.655875205993652, "global_step": 33219, "epoch": 790} {"train_loss": -5.4991655349731445, "global_step": 33220, "epoch": 790} {"train_loss": -5.509034202212379, "global_step": 33221, "epoch": 790, "val_loss": 66292.5} {"train_loss": -5.5826520919799805, "global_step": 33222, "epoch": 791} {"train_loss": -5.504214286804199, "global_step": 33223, "epoch": 791} {"train_loss": -5.510678291320801, "global_step": 33224, "epoch": 791} {"train_loss": -5.497244834899902, "global_step": 33225, "epoch": 791} {"train_loss": -5.581790924072266, "global_step": 33226, "epoch": 791} {"train_loss": -5.535511016845703, "global_step": 33227, "epoch": 791} {"train_loss": -5.614261627197266, "global_step": 33228, "epoch": 791} {"train_loss": -5.605772495269775, "global_step": 33229, "epoch": 791} {"train_loss": -5.6265668869018555, "global_step": 33230, "epoch": 791} {"train_loss": -5.580752849578857, "global_step": 33231, "epoch": 791} {"train_loss": -5.735208511352539, "global_step": 33232, "epoch": 791} {"train_loss": -5.510065078735352, "global_step": 33233, "epoch": 791} {"train_loss": -5.555128574371338, "global_step": 33234, "epoch": 791} {"train_loss": -5.511533737182617, "global_step": 33235, "epoch": 791} {"train_loss": -5.5777692794799805, "global_step": 33236, "epoch": 791} {"train_loss": -5.363049030303955, "global_step": 33237, "epoch": 791} {"train_loss": -5.617034435272217, "global_step": 33238, "epoch": 791} {"train_loss": -5.452534198760986, "global_step": 33239, "epoch": 791} {"train_loss": -5.476999282836914, "global_step": 33240, "epoch": 791} {"train_loss": -5.294449806213379, "global_step": 33241, "epoch": 791} {"train_loss": -5.558194637298584, "global_step": 33242, "epoch": 791} {"train_loss": -5.466426849365234, "global_step": 33243, "epoch": 791} {"train_loss": -5.413623809814453, "global_step": 33244, "epoch": 791} {"train_loss": -5.650579452514648, "global_step": 33245, "epoch": 791} {"train_loss": -5.616089344024658, "global_step": 33246, "epoch": 791} {"train_loss": -5.513408660888672, "global_step": 33247, "epoch": 791} {"train_loss": -5.6061482429504395, "global_step": 33248, "epoch": 791} {"train_loss": -5.479650020599365, "global_step": 33249, "epoch": 791} {"train_loss": -5.525378227233887, "global_step": 33250, "epoch": 791} {"train_loss": -5.5225605964660645, "global_step": 33251, "epoch": 791} {"train_loss": -5.531255722045898, "global_step": 33252, "epoch": 791} {"train_loss": -5.568395614624023, "global_step": 33253, "epoch": 791} {"train_loss": -5.375811576843262, "global_step": 33254, "epoch": 791} {"train_loss": -5.499540328979492, "global_step": 33255, "epoch": 791} {"train_loss": -5.484174728393555, "global_step": 33256, "epoch": 791} {"train_loss": -5.557574272155762, "global_step": 33257, "epoch": 791} {"train_loss": -5.554007053375244, "global_step": 33258, "epoch": 791} {"train_loss": -5.535640716552734, "global_step": 33259, "epoch": 791} {"train_loss": -5.48402214050293, "global_step": 33260, "epoch": 791} {"train_loss": -5.433262348175049, "global_step": 33261, "epoch": 791} {"train_loss": -5.528594017028809, "global_step": 33262, "epoch": 791} {"train_loss": -5.526304108755929, "global_step": 33263, "epoch": 791, "val_loss": 66693.8828125} {"train_loss": -5.512195110321045, "global_step": 33264, "epoch": 792} {"train_loss": -5.476820468902588, "global_step": 33265, "epoch": 792} {"train_loss": -5.500182628631592, "global_step": 33266, "epoch": 792} {"train_loss": -5.531435966491699, "global_step": 33267, "epoch": 792} {"train_loss": -5.508762359619141, "global_step": 33268, "epoch": 792} {"train_loss": -5.75684928894043, "global_step": 33269, "epoch": 792} {"train_loss": -5.605473041534424, "global_step": 33270, "epoch": 792} {"train_loss": -5.611507415771484, "global_step": 33271, "epoch": 792} {"train_loss": -5.648036003112793, "global_step": 33272, "epoch": 792} {"train_loss": -5.57652473449707, "global_step": 33273, "epoch": 792} {"train_loss": -5.5064520835876465, "global_step": 33274, "epoch": 792} {"train_loss": -5.578242301940918, "global_step": 33275, "epoch": 792} {"train_loss": -5.434261322021484, "global_step": 33276, "epoch": 792} {"train_loss": -5.583907127380371, "global_step": 33277, "epoch": 792} {"train_loss": -5.545841217041016, "global_step": 33278, "epoch": 792} {"train_loss": -5.636569023132324, "global_step": 33279, "epoch": 792} {"train_loss": -5.607829570770264, "global_step": 33280, "epoch": 792} {"train_loss": -5.570749759674072, "global_step": 33281, "epoch": 792} {"train_loss": -5.520382404327393, "global_step": 33282, "epoch": 792} {"train_loss": -5.467774868011475, "global_step": 33283, "epoch": 792} {"train_loss": -5.494440078735352, "global_step": 33284, "epoch": 792} {"train_loss": -5.5480756759643555, "global_step": 33285, "epoch": 792} {"train_loss": -5.523002624511719, "global_step": 33286, "epoch": 792} {"train_loss": -5.412270545959473, "global_step": 33287, "epoch": 792} {"train_loss": -5.483243942260742, "global_step": 33288, "epoch": 792} {"train_loss": -5.612874507904053, "global_step": 33289, "epoch": 792} {"train_loss": -5.392363548278809, "global_step": 33290, "epoch": 792} {"train_loss": -5.441018581390381, "global_step": 33291, "epoch": 792} {"train_loss": -5.445339679718018, "global_step": 33292, "epoch": 792} {"train_loss": -5.506977081298828, "global_step": 33293, "epoch": 792} {"train_loss": -5.413394451141357, "global_step": 33294, "epoch": 792} {"train_loss": -5.453606605529785, "global_step": 33295, "epoch": 792} {"train_loss": -5.539474964141846, "global_step": 33296, "epoch": 792} {"train_loss": -5.4445672035217285, "global_step": 33297, "epoch": 792} {"train_loss": -5.4567670822143555, "global_step": 33298, "epoch": 792} {"train_loss": -5.6020097732543945, "global_step": 33299, "epoch": 792} {"train_loss": -5.615510940551758, "global_step": 33300, "epoch": 792} {"train_loss": -5.613698959350586, "global_step": 33301, "epoch": 792} {"train_loss": -5.4629597663879395, "global_step": 33302, "epoch": 792} {"train_loss": -5.450202941894531, "global_step": 33303, "epoch": 792} {"train_loss": -5.524723529815674, "global_step": 33304, "epoch": 792} {"train_loss": -5.525858810969761, "global_step": 33305, "epoch": 792, "val_loss": 66475.9609375} {"train_loss": -5.417425632476807, "global_step": 33306, "epoch": 793} {"train_loss": -5.541523456573486, "global_step": 33307, "epoch": 793} {"train_loss": -5.439286231994629, "global_step": 33308, "epoch": 793} {"train_loss": -5.466494560241699, "global_step": 33309, "epoch": 793} {"train_loss": -5.559450149536133, "global_step": 33310, "epoch": 793} {"train_loss": -5.539562702178955, "global_step": 33311, "epoch": 793} {"train_loss": -5.604944229125977, "global_step": 33312, "epoch": 793} {"train_loss": -5.564493179321289, "global_step": 33313, "epoch": 793} {"train_loss": -5.475132465362549, "global_step": 33314, "epoch": 793} {"train_loss": -5.699759483337402, "global_step": 33315, "epoch": 793} {"train_loss": -5.410129070281982, "global_step": 33316, "epoch": 793} {"train_loss": -5.426067352294922, "global_step": 33317, "epoch": 793} {"train_loss": -5.501049995422363, "global_step": 33318, "epoch": 793} {"train_loss": -5.516360282897949, "global_step": 33319, "epoch": 793} {"train_loss": -5.701943874359131, "global_step": 33320, "epoch": 793} {"train_loss": -5.405671119689941, "global_step": 33321, "epoch": 793} {"train_loss": -5.545496463775635, "global_step": 33322, "epoch": 793} {"train_loss": -5.660674095153809, "global_step": 33323, "epoch": 793} {"train_loss": -5.373204708099365, "global_step": 33324, "epoch": 793} {"train_loss": -5.5053486824035645, "global_step": 33325, "epoch": 793} {"train_loss": -5.636731147766113, "global_step": 33326, "epoch": 793} {"train_loss": -5.340514659881592, "global_step": 33327, "epoch": 793} {"train_loss": -5.560832977294922, "global_step": 33328, "epoch": 793} {"train_loss": -5.457639217376709, "global_step": 33329, "epoch": 793} {"train_loss": -5.553473472595215, "global_step": 33330, "epoch": 793} {"train_loss": -5.523772716522217, "global_step": 33331, "epoch": 793} {"train_loss": -5.538459777832031, "global_step": 33332, "epoch": 793} {"train_loss": -5.483453273773193, "global_step": 33333, "epoch": 793} {"train_loss": -5.539135456085205, "global_step": 33334, "epoch": 793} {"train_loss": -5.55394172668457, "global_step": 33335, "epoch": 793} {"train_loss": -5.558998107910156, "global_step": 33336, "epoch": 793} {"train_loss": -5.433859825134277, "global_step": 33337, "epoch": 793} {"train_loss": -5.590081214904785, "global_step": 33338, "epoch": 793} {"train_loss": -5.540268898010254, "global_step": 33339, "epoch": 793} {"train_loss": -5.665804386138916, "global_step": 33340, "epoch": 793} {"train_loss": -5.5948967933654785, "global_step": 33341, "epoch": 793} {"train_loss": -5.42346715927124, "global_step": 33342, "epoch": 793} {"train_loss": -5.57044792175293, "global_step": 33343, "epoch": 793} {"train_loss": -5.544563293457031, "global_step": 33344, "epoch": 793} {"train_loss": -5.576042175292969, "global_step": 33345, "epoch": 793} {"train_loss": -5.547464370727539, "global_step": 33346, "epoch": 793} {"train_loss": -5.52655367624192, "global_step": 33347, "epoch": 793, "val_loss": 66567.4375} {"train_loss": -5.587686538696289, "global_step": 33348, "epoch": 794} {"train_loss": -5.594448089599609, "global_step": 33349, "epoch": 794} {"train_loss": -5.566128730773926, "global_step": 33350, "epoch": 794} {"train_loss": -5.52581262588501, "global_step": 33351, "epoch": 794} {"train_loss": -5.572253227233887, "global_step": 33352, "epoch": 794} {"train_loss": -5.569016456604004, "global_step": 33353, "epoch": 794} {"train_loss": -5.455447196960449, "global_step": 33354, "epoch": 794} {"train_loss": -5.543238162994385, "global_step": 33355, "epoch": 794} {"train_loss": -5.541255474090576, "global_step": 33356, "epoch": 794} {"train_loss": -5.469295501708984, "global_step": 33357, "epoch": 794} {"train_loss": -5.613940715789795, "global_step": 33358, "epoch": 794} {"train_loss": -5.478276252746582, "global_step": 33359, "epoch": 794} {"train_loss": -5.539175987243652, "global_step": 33360, "epoch": 794} {"train_loss": -5.531660079956055, "global_step": 33361, "epoch": 794} {"train_loss": -5.450575828552246, "global_step": 33362, "epoch": 794} {"train_loss": -5.550348281860352, "global_step": 33363, "epoch": 794} {"train_loss": -5.441957473754883, "global_step": 33364, "epoch": 794} {"train_loss": -5.421578407287598, "global_step": 33365, "epoch": 794} {"train_loss": -5.493197917938232, "global_step": 33366, "epoch": 794} {"train_loss": -5.5720391273498535, "global_step": 33367, "epoch": 794} {"train_loss": -5.482693672180176, "global_step": 33368, "epoch": 794} {"train_loss": -5.543435573577881, "global_step": 33369, "epoch": 794} {"train_loss": -5.549509048461914, "global_step": 33370, "epoch": 794} {"train_loss": -5.564792156219482, "global_step": 33371, "epoch": 794} {"train_loss": -5.544486045837402, "global_step": 33372, "epoch": 794} {"train_loss": -5.524532318115234, "global_step": 33373, "epoch": 794} {"train_loss": -5.561823844909668, "global_step": 33374, "epoch": 794} {"train_loss": -5.621943473815918, "global_step": 33375, "epoch": 794} {"train_loss": -5.603566646575928, "global_step": 33376, "epoch": 794} {"train_loss": -5.559056282043457, "global_step": 33377, "epoch": 794} {"train_loss": -5.496068954467773, "global_step": 33378, "epoch": 794} {"train_loss": -5.529101371765137, "global_step": 33379, "epoch": 794} {"train_loss": -5.534351825714111, "global_step": 33380, "epoch": 794} {"train_loss": -5.55176305770874, "global_step": 33381, "epoch": 794} {"train_loss": -5.518222808837891, "global_step": 33382, "epoch": 794} {"train_loss": -5.508504867553711, "global_step": 33383, "epoch": 794} {"train_loss": -5.557129859924316, "global_step": 33384, "epoch": 794} {"train_loss": -5.526183128356934, "global_step": 33385, "epoch": 794} {"train_loss": -5.530900001525879, "global_step": 33386, "epoch": 794} {"train_loss": -5.56721830368042, "global_step": 33387, "epoch": 794} {"train_loss": -5.484585762023926, "global_step": 33388, "epoch": 794} {"train_loss": -5.536887078058152, "global_step": 33389, "epoch": 794, "val_loss": 66386.046875} {"train_loss": -5.568385601043701, "global_step": 33390, "epoch": 795} {"train_loss": -5.59283971786499, "global_step": 33391, "epoch": 795} {"train_loss": -5.53034782409668, "global_step": 33392, "epoch": 795} {"train_loss": -5.519571304321289, "global_step": 33393, "epoch": 795} {"train_loss": -5.566945552825928, "global_step": 33394, "epoch": 795} {"train_loss": -5.506416320800781, "global_step": 33395, "epoch": 795} {"train_loss": -5.582334041595459, "global_step": 33396, "epoch": 795} {"train_loss": -5.527729034423828, "global_step": 33397, "epoch": 795} {"train_loss": -5.6011643409729, "global_step": 33398, "epoch": 795} {"train_loss": -5.542923927307129, "global_step": 33399, "epoch": 795} {"train_loss": -5.484181880950928, "global_step": 33400, "epoch": 795} {"train_loss": -5.4512529373168945, "global_step": 33401, "epoch": 795} {"train_loss": -5.405393600463867, "global_step": 33402, "epoch": 795} {"train_loss": -5.569348335266113, "global_step": 33403, "epoch": 795} {"train_loss": -5.463933944702148, "global_step": 33404, "epoch": 795} {"train_loss": -5.6468071937561035, "global_step": 33405, "epoch": 795} {"train_loss": -5.446012496948242, "global_step": 33406, "epoch": 795} {"train_loss": -5.426593780517578, "global_step": 33407, "epoch": 795} {"train_loss": -5.497262954711914, "global_step": 33408, "epoch": 795} {"train_loss": -5.44667387008667, "global_step": 33409, "epoch": 795} {"train_loss": -5.589588642120361, "global_step": 33410, "epoch": 795} {"train_loss": -5.376943588256836, "global_step": 33411, "epoch": 795} {"train_loss": -5.491236686706543, "global_step": 33412, "epoch": 795} {"train_loss": -5.4853644371032715, "global_step": 33413, "epoch": 795} {"train_loss": -5.5819902420043945, "global_step": 33414, "epoch": 795} {"train_loss": -5.500017166137695, "global_step": 33415, "epoch": 795} {"train_loss": -5.536001205444336, "global_step": 33416, "epoch": 795} {"train_loss": -5.604417324066162, "global_step": 33417, "epoch": 795} {"train_loss": -5.669421195983887, "global_step": 33418, "epoch": 795} {"train_loss": -5.265817642211914, "global_step": 33419, "epoch": 795} {"train_loss": -5.6361260414123535, "global_step": 33420, "epoch": 795} {"train_loss": -5.680904388427734, "global_step": 33421, "epoch": 795} {"train_loss": -5.482513427734375, "global_step": 33422, "epoch": 795} {"train_loss": -5.554211616516113, "global_step": 33423, "epoch": 795} {"train_loss": -5.479309558868408, "global_step": 33424, "epoch": 795} {"train_loss": -5.668392181396484, "global_step": 33425, "epoch": 795} {"train_loss": -5.435904502868652, "global_step": 33426, "epoch": 795} {"train_loss": -5.454988479614258, "global_step": 33427, "epoch": 795} {"train_loss": -5.546570301055908, "global_step": 33428, "epoch": 795} {"train_loss": -5.574678897857666, "global_step": 33429, "epoch": 795} {"train_loss": -5.4169206619262695, "global_step": 33430, "epoch": 795} {"train_loss": -5.5224556014651345, "global_step": 33431, "epoch": 795, "val_loss": 66548.40625} {"train_loss": -5.47700309753418, "global_step": 33432, "epoch": 796} {"train_loss": -5.614674091339111, "global_step": 33433, "epoch": 796} {"train_loss": -5.531794548034668, "global_step": 33434, "epoch": 796} {"train_loss": -5.407401084899902, "global_step": 33435, "epoch": 796} {"train_loss": -5.525996685028076, "global_step": 33436, "epoch": 796} {"train_loss": -5.588055610656738, "global_step": 33437, "epoch": 796} {"train_loss": -5.62351131439209, "global_step": 33438, "epoch": 796} {"train_loss": -5.533792972564697, "global_step": 33439, "epoch": 796} {"train_loss": -5.603166103363037, "global_step": 33440, "epoch": 796} {"train_loss": -5.554981231689453, "global_step": 33441, "epoch": 796} {"train_loss": -5.465318202972412, "global_step": 33442, "epoch": 796} {"train_loss": -5.492201328277588, "global_step": 33443, "epoch": 796} {"train_loss": -5.539652347564697, "global_step": 33444, "epoch": 796} {"train_loss": -5.528224945068359, "global_step": 33445, "epoch": 796} {"train_loss": -5.541965484619141, "global_step": 33446, "epoch": 796} {"train_loss": -5.499690055847168, "global_step": 33447, "epoch": 796} {"train_loss": -5.488812446594238, "global_step": 33448, "epoch": 796} {"train_loss": -5.5150532722473145, "global_step": 33449, "epoch": 796} {"train_loss": -5.56503963470459, "global_step": 33450, "epoch": 796} {"train_loss": -5.422874450683594, "global_step": 33451, "epoch": 796} {"train_loss": -5.514996528625488, "global_step": 33452, "epoch": 796} {"train_loss": -5.562894344329834, "global_step": 33453, "epoch": 796} {"train_loss": -5.481557846069336, "global_step": 33454, "epoch": 796} {"train_loss": -5.502560615539551, "global_step": 33455, "epoch": 796} {"train_loss": -5.404181003570557, "global_step": 33456, "epoch": 796} {"train_loss": -5.506369590759277, "global_step": 33457, "epoch": 796} {"train_loss": -5.556283950805664, "global_step": 33458, "epoch": 796} {"train_loss": -5.4289093017578125, "global_step": 33459, "epoch": 796} {"train_loss": -5.560831546783447, "global_step": 33460, "epoch": 796} {"train_loss": -5.546753406524658, "global_step": 33461, "epoch": 796} {"train_loss": -5.4114766120910645, "global_step": 33462, "epoch": 796} {"train_loss": -5.727351188659668, "global_step": 33463, "epoch": 796} {"train_loss": -5.509701728820801, "global_step": 33464, "epoch": 796} {"train_loss": -5.529951095581055, "global_step": 33465, "epoch": 796} {"train_loss": -5.357659816741943, "global_step": 33466, "epoch": 796} {"train_loss": -5.568913459777832, "global_step": 33467, "epoch": 796} {"train_loss": -5.43295955657959, "global_step": 33468, "epoch": 796} {"train_loss": -5.532201766967773, "global_step": 33469, "epoch": 796} {"train_loss": -5.632242202758789, "global_step": 33470, "epoch": 796} {"train_loss": -5.512027740478516, "global_step": 33471, "epoch": 796} {"train_loss": -5.471530914306641, "global_step": 33472, "epoch": 796} {"train_loss": -5.518345072155907, "global_step": 33473, "epoch": 796, "val_loss": 66738.984375} {"train_loss": -5.585476875305176, "global_step": 33474, "epoch": 797} {"train_loss": -5.608847618103027, "global_step": 33475, "epoch": 797} {"train_loss": -5.5624003410339355, "global_step": 33476, "epoch": 797} {"train_loss": -5.43792724609375, "global_step": 33477, "epoch": 797} {"train_loss": -5.5370073318481445, "global_step": 33478, "epoch": 797} {"train_loss": -5.462366104125977, "global_step": 33479, "epoch": 797} {"train_loss": -5.621070861816406, "global_step": 33480, "epoch": 797} {"train_loss": -5.51987886428833, "global_step": 33481, "epoch": 797} {"train_loss": -5.4094624519348145, "global_step": 33482, "epoch": 797} {"train_loss": -5.32034969329834, "global_step": 33483, "epoch": 797} {"train_loss": -5.57710075378418, "global_step": 33484, "epoch": 797} {"train_loss": -5.416157245635986, "global_step": 33485, "epoch": 797} {"train_loss": -5.587457656860352, "global_step": 33486, "epoch": 797} {"train_loss": -5.410191059112549, "global_step": 33487, "epoch": 797} {"train_loss": -5.548444747924805, "global_step": 33488, "epoch": 797} {"train_loss": -5.501037120819092, "global_step": 33489, "epoch": 797} {"train_loss": -5.4655537605285645, "global_step": 33490, "epoch": 797} {"train_loss": -5.436223983764648, "global_step": 33491, "epoch": 797} {"train_loss": -5.479443550109863, "global_step": 33492, "epoch": 797} {"train_loss": -5.467245101928711, "global_step": 33493, "epoch": 797} {"train_loss": -5.370139122009277, "global_step": 33494, "epoch": 797} {"train_loss": -5.586927890777588, "global_step": 33495, "epoch": 797} {"train_loss": -5.419628143310547, "global_step": 33496, "epoch": 797} {"train_loss": -5.581449508666992, "global_step": 33497, "epoch": 797} {"train_loss": -5.535567760467529, "global_step": 33498, "epoch": 797} {"train_loss": -5.416741371154785, "global_step": 33499, "epoch": 797} {"train_loss": -5.541227340698242, "global_step": 33500, "epoch": 797} {"train_loss": -5.4976725578308105, "global_step": 33501, "epoch": 797} {"train_loss": -5.539459228515625, "global_step": 33502, "epoch": 797} {"train_loss": -5.381636619567871, "global_step": 33503, "epoch": 797} {"train_loss": -5.6439008712768555, "global_step": 33504, "epoch": 797} {"train_loss": -5.524925231933594, "global_step": 33505, "epoch": 797} {"train_loss": -5.56655740737915, "global_step": 33506, "epoch": 797} {"train_loss": -5.473202228546143, "global_step": 33507, "epoch": 797} {"train_loss": -5.572856903076172, "global_step": 33508, "epoch": 797} {"train_loss": -5.520441055297852, "global_step": 33509, "epoch": 797} {"train_loss": -5.486029624938965, "global_step": 33510, "epoch": 797} {"train_loss": -5.637495994567871, "global_step": 33511, "epoch": 797} {"train_loss": -5.460221290588379, "global_step": 33512, "epoch": 797} {"train_loss": -5.5015740394592285, "global_step": 33513, "epoch": 797} {"train_loss": -5.427196979522705, "global_step": 33514, "epoch": 797} {"train_loss": -5.502526657921927, "global_step": 33515, "epoch": 797, "val_loss": 66541.890625} {"train_loss": -5.445805549621582, "global_step": 33516, "epoch": 798} {"train_loss": -5.561845779418945, "global_step": 33517, "epoch": 798} {"train_loss": -5.550295829772949, "global_step": 33518, "epoch": 798} {"train_loss": -5.6266188621521, "global_step": 33519, "epoch": 798} {"train_loss": -5.5134782791137695, "global_step": 33520, "epoch": 798} {"train_loss": -5.460122585296631, "global_step": 33521, "epoch": 798} {"train_loss": -5.651544094085693, "global_step": 33522, "epoch": 798} {"train_loss": -5.541173934936523, "global_step": 33523, "epoch": 798} {"train_loss": -5.637921333312988, "global_step": 33524, "epoch": 798} {"train_loss": -5.627035140991211, "global_step": 33525, "epoch": 798} {"train_loss": -5.444515228271484, "global_step": 33526, "epoch": 798} {"train_loss": -5.474045276641846, "global_step": 33527, "epoch": 798} {"train_loss": -5.616189956665039, "global_step": 33528, "epoch": 798} {"train_loss": -5.47425651550293, "global_step": 33529, "epoch": 798} {"train_loss": -5.6077985763549805, "global_step": 33530, "epoch": 798} {"train_loss": -5.381592750549316, "global_step": 33531, "epoch": 798} {"train_loss": -5.620459079742432, "global_step": 33532, "epoch": 798} {"train_loss": -5.607733249664307, "global_step": 33533, "epoch": 798} {"train_loss": -5.6939592361450195, "global_step": 33534, "epoch": 798} {"train_loss": -5.649783611297607, "global_step": 33535, "epoch": 798} {"train_loss": -5.594317436218262, "global_step": 33536, "epoch": 798} {"train_loss": -5.55263614654541, "global_step": 33537, "epoch": 798} {"train_loss": -5.5846452713012695, "global_step": 33538, "epoch": 798} {"train_loss": -5.3857197761535645, "global_step": 33539, "epoch": 798} {"train_loss": -5.6002726554870605, "global_step": 33540, "epoch": 798} {"train_loss": -5.449373722076416, "global_step": 33541, "epoch": 798} {"train_loss": -5.4751482009887695, "global_step": 33542, "epoch": 798} {"train_loss": -5.515003681182861, "global_step": 33543, "epoch": 798} {"train_loss": -5.529562950134277, "global_step": 33544, "epoch": 798} {"train_loss": -5.452314376831055, "global_step": 33545, "epoch": 798} {"train_loss": -5.520874977111816, "global_step": 33546, "epoch": 798} {"train_loss": -5.431946754455566, "global_step": 33547, "epoch": 798} {"train_loss": -5.490670204162598, "global_step": 33548, "epoch": 798} {"train_loss": -5.451603889465332, "global_step": 33549, "epoch": 798} {"train_loss": -5.549535751342773, "global_step": 33550, "epoch": 798} {"train_loss": -5.365844249725342, "global_step": 33551, "epoch": 798} {"train_loss": -5.548864841461182, "global_step": 33552, "epoch": 798} {"train_loss": -5.488788604736328, "global_step": 33553, "epoch": 798} {"train_loss": -5.419175148010254, "global_step": 33554, "epoch": 798} {"train_loss": -5.482725143432617, "global_step": 33555, "epoch": 798} {"train_loss": -5.548774719238281, "global_step": 33556, "epoch": 798} {"train_loss": -5.5289062431880405, "global_step": 33557, "epoch": 798, "val_loss": 66950.0} {"train_loss": -5.471774578094482, "global_step": 33558, "epoch": 799} {"train_loss": -5.541098117828369, "global_step": 33559, "epoch": 799} {"train_loss": -5.562981605529785, "global_step": 33560, "epoch": 799} {"train_loss": -5.5024309158325195, "global_step": 33561, "epoch": 799} {"train_loss": -5.506778717041016, "global_step": 33562, "epoch": 799} {"train_loss": -5.498978137969971, "global_step": 33563, "epoch": 799} {"train_loss": -5.441403388977051, "global_step": 33564, "epoch": 799} {"train_loss": -5.424602508544922, "global_step": 33565, "epoch": 799} {"train_loss": -5.516841888427734, "global_step": 33566, "epoch": 799} {"train_loss": -5.434572219848633, "global_step": 33567, "epoch": 799} {"train_loss": -5.561868667602539, "global_step": 33568, "epoch": 799} {"train_loss": -5.572094440460205, "global_step": 33569, "epoch": 799} {"train_loss": -5.615816116333008, "global_step": 33570, "epoch": 799} {"train_loss": -5.536067485809326, "global_step": 33571, "epoch": 799} {"train_loss": -5.53199577331543, "global_step": 33572, "epoch": 799} {"train_loss": -5.527928352355957, "global_step": 33573, "epoch": 799} {"train_loss": -5.621135711669922, "global_step": 33574, "epoch": 799} {"train_loss": -5.580630302429199, "global_step": 33575, "epoch": 799} {"train_loss": -5.667993068695068, "global_step": 33576, "epoch": 799} {"train_loss": -5.654839515686035, "global_step": 33577, "epoch": 799} {"train_loss": -5.521645545959473, "global_step": 33578, "epoch": 799} {"train_loss": -5.429466247558594, "global_step": 33579, "epoch": 799} {"train_loss": -5.452976226806641, "global_step": 33580, "epoch": 799} {"train_loss": -5.529401779174805, "global_step": 33581, "epoch": 799} {"train_loss": -5.636453628540039, "global_step": 33582, "epoch": 799} {"train_loss": -5.626663684844971, "global_step": 33583, "epoch": 799} {"train_loss": -5.481424331665039, "global_step": 33584, "epoch": 799} {"train_loss": -5.496340751647949, "global_step": 33585, "epoch": 799} {"train_loss": -5.651684284210205, "global_step": 33586, "epoch": 799} {"train_loss": -5.518857955932617, "global_step": 33587, "epoch": 799} {"train_loss": -5.649313926696777, "global_step": 33588, "epoch": 799} {"train_loss": -5.50431489944458, "global_step": 33589, "epoch": 799} {"train_loss": -5.490390300750732, "global_step": 33590, "epoch": 799} {"train_loss": -5.476828575134277, "global_step": 33591, "epoch": 799} {"train_loss": -5.39123010635376, "global_step": 33592, "epoch": 799} {"train_loss": -5.510037422180176, "global_step": 33593, "epoch": 799} {"train_loss": -5.549227714538574, "global_step": 33594, "epoch": 799} {"train_loss": -5.533137321472168, "global_step": 33595, "epoch": 799} {"train_loss": -5.5439019203186035, "global_step": 33596, "epoch": 799} {"train_loss": -5.459715843200684, "global_step": 33597, "epoch": 799} {"train_loss": -5.515730857849121, "global_step": 33598, "epoch": 799} {"train_loss": -5.5301448958260675, "global_step": 33599, "epoch": 799, "val_loss": 66793.140625} {"train_loss": -5.55087423324585, "global_step": 33600, "epoch": 800} {"train_loss": -5.622506141662598, "global_step": 33601, "epoch": 800} {"train_loss": -5.594951629638672, "global_step": 33602, "epoch": 800} {"train_loss": -5.612793922424316, "global_step": 33603, "epoch": 800} {"train_loss": -5.5393548011779785, "global_step": 33604, "epoch": 800} {"train_loss": -5.676763534545898, "global_step": 33605, "epoch": 800} {"train_loss": -5.518415451049805, "global_step": 33606, "epoch": 800} {"train_loss": -5.559398651123047, "global_step": 33607, "epoch": 800} {"train_loss": -5.598237991333008, "global_step": 33608, "epoch": 800} {"train_loss": -5.557725429534912, "global_step": 33609, "epoch": 800} {"train_loss": -5.412546634674072, "global_step": 33610, "epoch": 800} {"train_loss": -5.575468063354492, "global_step": 33611, "epoch": 800} {"train_loss": -5.631865501403809, "global_step": 33612, "epoch": 800} {"train_loss": -5.402918815612793, "global_step": 33613, "epoch": 800} {"train_loss": -5.557491302490234, "global_step": 33614, "epoch": 800} {"train_loss": -5.609091281890869, "global_step": 33615, "epoch": 800} {"train_loss": -5.656152725219727, "global_step": 33616, "epoch": 800} {"train_loss": -5.496278762817383, "global_step": 33617, "epoch": 800} {"train_loss": -5.572468280792236, "global_step": 33618, "epoch": 800} {"train_loss": -5.564542770385742, "global_step": 33619, "epoch": 800} {"train_loss": -5.516735076904297, "global_step": 33620, "epoch": 800} {"train_loss": -5.611027717590332, "global_step": 33621, "epoch": 800} {"train_loss": -5.483985900878906, "global_step": 33622, "epoch": 800} {"train_loss": -5.3471174240112305, "global_step": 33623, "epoch": 800} {"train_loss": -5.531270980834961, "global_step": 33624, "epoch": 800} {"train_loss": -5.488624572753906, "global_step": 33625, "epoch": 800} {"train_loss": -5.708503723144531, "global_step": 33626, "epoch": 800} {"train_loss": -5.501897811889648, "global_step": 33627, "epoch": 800} {"train_loss": -5.525223731994629, "global_step": 33628, "epoch": 800} {"train_loss": -5.510632514953613, "global_step": 33629, "epoch": 800} {"train_loss": -5.623844146728516, "global_step": 33630, "epoch": 800} {"train_loss": -5.544553756713867, "global_step": 33631, "epoch": 800} {"train_loss": -5.524035453796387, "global_step": 33632, "epoch": 800} {"train_loss": -5.447645664215088, "global_step": 33633, "epoch": 800} {"train_loss": -5.481011867523193, "global_step": 33634, "epoch": 800} {"train_loss": -5.449341773986816, "global_step": 33635, "epoch": 800} {"train_loss": -5.454859256744385, "global_step": 33636, "epoch": 800} {"train_loss": -5.524857044219971, "global_step": 33637, "epoch": 800} {"train_loss": -5.591423034667969, "global_step": 33638, "epoch": 800} {"train_loss": -5.47763204574585, "global_step": 33639, "epoch": 800} {"train_loss": -5.4197187423706055, "global_step": 33640, "epoch": 800} {"train_loss": -5.538914214997065, "global_step": 33641, "epoch": 800, "train/sim_max_reward_0": 0.7934279112238063, "train/sim_max_reward_1": 0.003267693979881022, "train/sim_max_reward_2": 0.2304630391634523, "train/sim_max_reward_3": 0.1773041864322928, "train/sim_max_reward_4": 0.5416649541088293, "train/sim_max_reward_5": 0.549932601337875, "test/sim_max_reward_4400000": 0.17546121143634125, "test/sim_max_reward_4400001": 0.16790088627112756, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.8308011974089677, "test/sim_max_reward_4400004": 0.2197279137857015, "test/sim_max_reward_4400005": 0.20781047866963281, "test/sim_max_reward_4400006": 0.37854996141883646, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.8115622054160898, "test/sim_max_reward_4400010": 0.16022552350808594, "test/sim_max_reward_4400011": 0.20679176478220865, "test/sim_max_reward_4400012": 0.38838431366792875, "test/sim_max_reward_4400013": 0.3664829815809575, "test/sim_max_reward_4400014": 0.3870154120462209, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.7128645145894936, "test/sim_max_reward_4400017": 0.029598996734554874, "test/sim_max_reward_4400018": 0.3471852205007499, "test/sim_max_reward_4400019": 0.17166124814684897, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.20525871715657168, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.20138037593014163, "test/sim_max_reward_4400026": 0.07287160612887805, "test/sim_max_reward_4400027": 0.022998386263558632, "test/sim_max_reward_4400028": 0.2544764458394795, "test/sim_max_reward_4400029": 0.43319628792279286, "test/sim_max_reward_4400030": 0.48159633900865584, "test/sim_max_reward_4400031": 0.3004249049569049, "test/sim_max_reward_4400032": 0.36407141019753114, "test/sim_max_reward_4400033": 0.6635295746530606, "test/sim_max_reward_4400034": 0.867653648119393, "test/sim_max_reward_4400035": 0.433777114140868, "test/sim_max_reward_4400036": 0.32326008892862135, "test/sim_max_reward_4400037": 0.28090494986926867, "test/sim_max_reward_4400038": 0.33468006943948764, "test/sim_max_reward_4400039": 0.8441517378356026, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.757531098914715, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.5478253956990484, "test/sim_max_reward_4400044": 0.038153313964790006, "test/sim_max_reward_4400045": 0.6779590254605833, "test/sim_max_reward_4400046": 0.2611197965970283, "test/sim_max_reward_4400047": 0.20489272915769385, "test/sim_max_reward_4400048": 0.3442012759445227, "test/sim_max_reward_4400049": 0.21774956029541187, "train/mean_score": 0.38267673104102284, "test/mean_score": 0.30877146136858996, "val_loss": 66381.375} {"train_loss": -5.613036155700684, "global_step": 33642, "epoch": 801} {"train_loss": -5.535976886749268, "global_step": 33643, "epoch": 801} {"train_loss": -5.573455810546875, "global_step": 33644, "epoch": 801} {"train_loss": -5.422354221343994, "global_step": 33645, "epoch": 801} {"train_loss": -5.472384452819824, "global_step": 33646, "epoch": 801} {"train_loss": -5.601280212402344, "global_step": 33647, "epoch": 801} {"train_loss": -5.476459503173828, "global_step": 33648, "epoch": 801} {"train_loss": -5.4917192459106445, "global_step": 33649, "epoch": 801} {"train_loss": -5.5290117263793945, "global_step": 33650, "epoch": 801} {"train_loss": -5.464621543884277, "global_step": 33651, "epoch": 801} {"train_loss": -5.509943962097168, "global_step": 33652, "epoch": 801} {"train_loss": -5.654559135437012, "global_step": 33653, "epoch": 801} {"train_loss": -5.581902980804443, "global_step": 33654, "epoch": 801} {"train_loss": -5.7147064208984375, "global_step": 33655, "epoch": 801} {"train_loss": -5.504185199737549, "global_step": 33656, "epoch": 801} {"train_loss": -5.622763156890869, "global_step": 33657, "epoch": 801} {"train_loss": -5.711816787719727, "global_step": 33658, "epoch": 801} {"train_loss": -5.441274166107178, "global_step": 33659, "epoch": 801} {"train_loss": -5.505011558532715, "global_step": 33660, "epoch": 801} {"train_loss": -5.598297119140625, "global_step": 33661, "epoch": 801} {"train_loss": -5.405892372131348, "global_step": 33662, "epoch": 801} {"train_loss": -5.593146324157715, "global_step": 33663, "epoch": 801} {"train_loss": -5.511534690856934, "global_step": 33664, "epoch": 801} {"train_loss": -5.575320720672607, "global_step": 33665, "epoch": 801} {"train_loss": -5.5947346687316895, "global_step": 33666, "epoch": 801} {"train_loss": -5.538084030151367, "global_step": 33667, "epoch": 801} {"train_loss": -5.624332427978516, "global_step": 33668, "epoch": 801} {"train_loss": -5.569192886352539, "global_step": 33669, "epoch": 801} {"train_loss": -5.567598342895508, "global_step": 33670, "epoch": 801} {"train_loss": -5.655214309692383, "global_step": 33671, "epoch": 801} {"train_loss": -5.4672017097473145, "global_step": 33672, "epoch": 801} {"train_loss": -5.50187873840332, "global_step": 33673, "epoch": 801} {"train_loss": -5.5640106201171875, "global_step": 33674, "epoch": 801} {"train_loss": -5.575568199157715, "global_step": 33675, "epoch": 801} {"train_loss": -5.498550891876221, "global_step": 33676, "epoch": 801} {"train_loss": -5.504960536956787, "global_step": 33677, "epoch": 801} {"train_loss": -5.3928704261779785, "global_step": 33678, "epoch": 801} {"train_loss": -5.458117485046387, "global_step": 33679, "epoch": 801} {"train_loss": -5.377362251281738, "global_step": 33680, "epoch": 801} {"train_loss": -5.4654340744018555, "global_step": 33681, "epoch": 801} {"train_loss": -5.436519622802734, "global_step": 33682, "epoch": 801} {"train_loss": -5.535227991285778, "global_step": 33683, "epoch": 801, "val_loss": 66515.1015625} {"train_loss": -5.46550989151001, "global_step": 33684, "epoch": 802} {"train_loss": -5.4768290519714355, "global_step": 33685, "epoch": 802} {"train_loss": -5.505622863769531, "global_step": 33686, "epoch": 802} {"train_loss": -5.475408554077148, "global_step": 33687, "epoch": 802} {"train_loss": -5.592038154602051, "global_step": 33688, "epoch": 802} {"train_loss": -5.585497856140137, "global_step": 33689, "epoch": 802} {"train_loss": -5.450127601623535, "global_step": 33690, "epoch": 802} {"train_loss": -5.5953593254089355, "global_step": 33691, "epoch": 802} {"train_loss": -5.666840076446533, "global_step": 33692, "epoch": 802} {"train_loss": -5.365288734436035, "global_step": 33693, "epoch": 802} {"train_loss": -5.456831932067871, "global_step": 33694, "epoch": 802} {"train_loss": -5.69977331161499, "global_step": 33695, "epoch": 802} {"train_loss": -5.4457550048828125, "global_step": 33696, "epoch": 802} {"train_loss": -5.574573516845703, "global_step": 33697, "epoch": 802} {"train_loss": -5.608336448669434, "global_step": 33698, "epoch": 802} {"train_loss": -5.276971340179443, "global_step": 33699, "epoch": 802} {"train_loss": -5.652346611022949, "global_step": 33700, "epoch": 802} {"train_loss": -5.440559387207031, "global_step": 33701, "epoch": 802} {"train_loss": -5.499349594116211, "global_step": 33702, "epoch": 802} {"train_loss": -5.662350177764893, "global_step": 33703, "epoch": 802} {"train_loss": -5.427196502685547, "global_step": 33704, "epoch": 802} {"train_loss": -5.5125813484191895, "global_step": 33705, "epoch": 802} {"train_loss": -5.4541521072387695, "global_step": 33706, "epoch": 802} {"train_loss": -5.477235317230225, "global_step": 33707, "epoch": 802} {"train_loss": -5.4760966300964355, "global_step": 33708, "epoch": 802} {"train_loss": -5.537008762359619, "global_step": 33709, "epoch": 802} {"train_loss": -5.563453674316406, "global_step": 33710, "epoch": 802} {"train_loss": -5.409684181213379, "global_step": 33711, "epoch": 802} {"train_loss": -5.440071105957031, "global_step": 33712, "epoch": 802} {"train_loss": -5.5632004737854, "global_step": 33713, "epoch": 802} {"train_loss": -5.517701148986816, "global_step": 33714, "epoch": 802} {"train_loss": -5.649872779846191, "global_step": 33715, "epoch": 802} {"train_loss": -5.514043807983398, "global_step": 33716, "epoch": 802} {"train_loss": -5.550138473510742, "global_step": 33717, "epoch": 802} {"train_loss": -5.5637431144714355, "global_step": 33718, "epoch": 802} {"train_loss": -5.552816867828369, "global_step": 33719, "epoch": 802} {"train_loss": -5.580085754394531, "global_step": 33720, "epoch": 802} {"train_loss": -5.564540863037109, "global_step": 33721, "epoch": 802} {"train_loss": -5.36794376373291, "global_step": 33722, "epoch": 802} {"train_loss": -5.514342784881592, "global_step": 33723, "epoch": 802} {"train_loss": -5.425069808959961, "global_step": 33724, "epoch": 802} {"train_loss": -5.51726526305789, "global_step": 33725, "epoch": 802, "val_loss": 66202.671875} {"train_loss": -5.57923698425293, "global_step": 33726, "epoch": 803} {"train_loss": -5.455075263977051, "global_step": 33727, "epoch": 803} {"train_loss": -5.526079177856445, "global_step": 33728, "epoch": 803} {"train_loss": -5.452366828918457, "global_step": 33729, "epoch": 803} {"train_loss": -5.4469451904296875, "global_step": 33730, "epoch": 803} {"train_loss": -5.541041851043701, "global_step": 33731, "epoch": 803} {"train_loss": -5.595392227172852, "global_step": 33732, "epoch": 803} {"train_loss": -5.448459625244141, "global_step": 33733, "epoch": 803} {"train_loss": -5.5634026527404785, "global_step": 33734, "epoch": 803} {"train_loss": -5.423321723937988, "global_step": 33735, "epoch": 803} {"train_loss": -5.55596923828125, "global_step": 33736, "epoch": 803} {"train_loss": -5.561704635620117, "global_step": 33737, "epoch": 803} {"train_loss": -5.585161209106445, "global_step": 33738, "epoch": 803} {"train_loss": -5.615105628967285, "global_step": 33739, "epoch": 803} {"train_loss": -5.346437454223633, "global_step": 33740, "epoch": 803} {"train_loss": -5.555352210998535, "global_step": 33741, "epoch": 803} {"train_loss": -5.413992881774902, "global_step": 33742, "epoch": 803} {"train_loss": -5.481067657470703, "global_step": 33743, "epoch": 803} {"train_loss": -5.695623397827148, "global_step": 33744, "epoch": 803} {"train_loss": -5.365869045257568, "global_step": 33745, "epoch": 803} {"train_loss": -5.593741416931152, "global_step": 33746, "epoch": 803} {"train_loss": -5.573151588439941, "global_step": 33747, "epoch": 803} {"train_loss": -5.4945454597473145, "global_step": 33748, "epoch": 803} {"train_loss": -5.590041160583496, "global_step": 33749, "epoch": 803} {"train_loss": -5.61356258392334, "global_step": 33750, "epoch": 803} {"train_loss": -5.530459403991699, "global_step": 33751, "epoch": 803} {"train_loss": -5.529738426208496, "global_step": 33752, "epoch": 803} {"train_loss": -5.571774482727051, "global_step": 33753, "epoch": 803} {"train_loss": -5.588342666625977, "global_step": 33754, "epoch": 803} {"train_loss": -5.4855217933654785, "global_step": 33755, "epoch": 803} {"train_loss": -5.584955215454102, "global_step": 33756, "epoch": 803} {"train_loss": -5.394212245941162, "global_step": 33757, "epoch": 803} {"train_loss": -5.522430419921875, "global_step": 33758, "epoch": 803} {"train_loss": -5.536241054534912, "global_step": 33759, "epoch": 803} {"train_loss": -5.422685623168945, "global_step": 33760, "epoch": 803} {"train_loss": -5.59408712387085, "global_step": 33761, "epoch": 803} {"train_loss": -5.572256088256836, "global_step": 33762, "epoch": 803} {"train_loss": -5.3977460861206055, "global_step": 33763, "epoch": 803} {"train_loss": -5.469904899597168, "global_step": 33764, "epoch": 803} {"train_loss": -5.610492706298828, "global_step": 33765, "epoch": 803} {"train_loss": -5.434482574462891, "global_step": 33766, "epoch": 803} {"train_loss": -5.522530226480393, "global_step": 33767, "epoch": 803, "val_loss": 66762.71875} {"train_loss": -5.503773212432861, "global_step": 33768, "epoch": 804} {"train_loss": -5.5431952476501465, "global_step": 33769, "epoch": 804} {"train_loss": -5.521033763885498, "global_step": 33770, "epoch": 804} {"train_loss": -5.585345268249512, "global_step": 33771, "epoch": 804} {"train_loss": -5.529992580413818, "global_step": 33772, "epoch": 804} {"train_loss": -5.61657190322876, "global_step": 33773, "epoch": 804} {"train_loss": -5.570547103881836, "global_step": 33774, "epoch": 804} {"train_loss": -5.468588829040527, "global_step": 33775, "epoch": 804} {"train_loss": -5.476686477661133, "global_step": 33776, "epoch": 804} {"train_loss": -5.589029788970947, "global_step": 33777, "epoch": 804} {"train_loss": -5.416395664215088, "global_step": 33778, "epoch": 804} {"train_loss": -5.632278919219971, "global_step": 33779, "epoch": 804} {"train_loss": -5.570072650909424, "global_step": 33780, "epoch": 804} {"train_loss": -5.513430118560791, "global_step": 33781, "epoch": 804} {"train_loss": -5.4193115234375, "global_step": 33782, "epoch": 804} {"train_loss": -5.493094444274902, "global_step": 33783, "epoch": 804} {"train_loss": -5.537322998046875, "global_step": 33784, "epoch": 804} {"train_loss": -5.582913875579834, "global_step": 33785, "epoch": 804} {"train_loss": -5.531994819641113, "global_step": 33786, "epoch": 804} {"train_loss": -5.614480018615723, "global_step": 33787, "epoch": 804} {"train_loss": -5.563125133514404, "global_step": 33788, "epoch": 804} {"train_loss": -5.532393932342529, "global_step": 33789, "epoch": 804} {"train_loss": -5.515930652618408, "global_step": 33790, "epoch": 804} {"train_loss": -5.589601516723633, "global_step": 33791, "epoch": 804} {"train_loss": -5.555693626403809, "global_step": 33792, "epoch": 804} {"train_loss": -5.442994117736816, "global_step": 33793, "epoch": 804} {"train_loss": -5.5438032150268555, "global_step": 33794, "epoch": 804} {"train_loss": -5.424884796142578, "global_step": 33795, "epoch": 804} {"train_loss": -5.566911697387695, "global_step": 33796, "epoch": 804} {"train_loss": -5.4885358810424805, "global_step": 33797, "epoch": 804} {"train_loss": -5.540900230407715, "global_step": 33798, "epoch": 804} {"train_loss": -5.579626560211182, "global_step": 33799, "epoch": 804} {"train_loss": -5.499384880065918, "global_step": 33800, "epoch": 804} {"train_loss": -5.569854259490967, "global_step": 33801, "epoch": 804} {"train_loss": -5.636507987976074, "global_step": 33802, "epoch": 804} {"train_loss": -5.439877510070801, "global_step": 33803, "epoch": 804} {"train_loss": -5.576542377471924, "global_step": 33804, "epoch": 804} {"train_loss": -5.530332565307617, "global_step": 33805, "epoch": 804} {"train_loss": -5.5717692375183105, "global_step": 33806, "epoch": 804} {"train_loss": -5.4944610595703125, "global_step": 33807, "epoch": 804} {"train_loss": -5.516515731811523, "global_step": 33808, "epoch": 804} {"train_loss": -5.533785922186715, "global_step": 33809, "epoch": 804, "val_loss": 66372.1953125} {"train_loss": -5.370944976806641, "global_step": 33810, "epoch": 805} {"train_loss": -5.612015724182129, "global_step": 33811, "epoch": 805} {"train_loss": -5.454606533050537, "global_step": 33812, "epoch": 805} {"train_loss": -5.413733005523682, "global_step": 33813, "epoch": 805} {"train_loss": -5.694218158721924, "global_step": 33814, "epoch": 805} {"train_loss": -5.528171539306641, "global_step": 33815, "epoch": 805} {"train_loss": -5.573332786560059, "global_step": 33816, "epoch": 805} {"train_loss": -5.523847579956055, "global_step": 33817, "epoch": 805} {"train_loss": -5.603212833404541, "global_step": 33818, "epoch": 805} {"train_loss": -5.566495895385742, "global_step": 33819, "epoch": 805} {"train_loss": -5.475179672241211, "global_step": 33820, "epoch": 805} {"train_loss": -5.497067451477051, "global_step": 33821, "epoch": 805} {"train_loss": -5.639130592346191, "global_step": 33822, "epoch": 805} {"train_loss": -5.517518997192383, "global_step": 33823, "epoch": 805} {"train_loss": -5.432216167449951, "global_step": 33824, "epoch": 805} {"train_loss": -5.573369026184082, "global_step": 33825, "epoch": 805} {"train_loss": -5.3820672035217285, "global_step": 33826, "epoch": 805} {"train_loss": -5.514418601989746, "global_step": 33827, "epoch": 805} {"train_loss": -5.5613603591918945, "global_step": 33828, "epoch": 805} {"train_loss": -5.484644889831543, "global_step": 33829, "epoch": 805} {"train_loss": -5.440253257751465, "global_step": 33830, "epoch": 805} {"train_loss": -5.471891403198242, "global_step": 33831, "epoch": 805} {"train_loss": -5.515814304351807, "global_step": 33832, "epoch": 805} {"train_loss": -5.640174865722656, "global_step": 33833, "epoch": 805} {"train_loss": -5.537646293640137, "global_step": 33834, "epoch": 805} {"train_loss": -5.609212875366211, "global_step": 33835, "epoch": 805} {"train_loss": -5.50527286529541, "global_step": 33836, "epoch": 805} {"train_loss": -5.46504020690918, "global_step": 33837, "epoch": 805} {"train_loss": -5.3728437423706055, "global_step": 33838, "epoch": 805} {"train_loss": -5.60341739654541, "global_step": 33839, "epoch": 805} {"train_loss": -5.5492777824401855, "global_step": 33840, "epoch": 805} {"train_loss": -5.432610034942627, "global_step": 33841, "epoch": 805} {"train_loss": -5.587101459503174, "global_step": 33842, "epoch": 805} {"train_loss": -5.5865302085876465, "global_step": 33843, "epoch": 805} {"train_loss": -5.600374221801758, "global_step": 33844, "epoch": 805} {"train_loss": -5.68585205078125, "global_step": 33845, "epoch": 805} {"train_loss": -5.693168640136719, "global_step": 33846, "epoch": 805} {"train_loss": -5.658060073852539, "global_step": 33847, "epoch": 805} {"train_loss": -5.501190662384033, "global_step": 33848, "epoch": 805} {"train_loss": -5.608040809631348, "global_step": 33849, "epoch": 805} {"train_loss": -5.544853210449219, "global_step": 33850, "epoch": 805} {"train_loss": -5.538783016658964, "global_step": 33851, "epoch": 805, "val_loss": 66740.5078125} {"train_loss": -5.5949602127075195, "global_step": 33852, "epoch": 806} {"train_loss": -5.607109069824219, "global_step": 33853, "epoch": 806} {"train_loss": -5.547002792358398, "global_step": 33854, "epoch": 806} {"train_loss": -5.486545085906982, "global_step": 33855, "epoch": 806} {"train_loss": -5.536614418029785, "global_step": 33856, "epoch": 806} {"train_loss": -5.6107330322265625, "global_step": 33857, "epoch": 806} {"train_loss": -5.382245063781738, "global_step": 33858, "epoch": 806} {"train_loss": -5.606027603149414, "global_step": 33859, "epoch": 806} {"train_loss": -5.4741530418396, "global_step": 33860, "epoch": 806} {"train_loss": -5.379952430725098, "global_step": 33861, "epoch": 806} {"train_loss": -5.6224870681762695, "global_step": 33862, "epoch": 806} {"train_loss": -5.571414947509766, "global_step": 33863, "epoch": 806} {"train_loss": -5.567816257476807, "global_step": 33864, "epoch": 806} {"train_loss": -5.627245903015137, "global_step": 33865, "epoch": 806} {"train_loss": -5.605637550354004, "global_step": 33866, "epoch": 806} {"train_loss": -5.569385051727295, "global_step": 33867, "epoch": 806} {"train_loss": -5.49747371673584, "global_step": 33868, "epoch": 806} {"train_loss": -5.516398906707764, "global_step": 33869, "epoch": 806} {"train_loss": -5.545547008514404, "global_step": 33870, "epoch": 806} {"train_loss": -5.561446666717529, "global_step": 33871, "epoch": 806} {"train_loss": -5.431623458862305, "global_step": 33872, "epoch": 806} {"train_loss": -5.679584980010986, "global_step": 33873, "epoch": 806} {"train_loss": -5.400433540344238, "global_step": 33874, "epoch": 806} {"train_loss": -5.494747161865234, "global_step": 33875, "epoch": 806} {"train_loss": -5.551206111907959, "global_step": 33876, "epoch": 806} {"train_loss": -5.5769171714782715, "global_step": 33877, "epoch": 806} {"train_loss": -5.530786037445068, "global_step": 33878, "epoch": 806} {"train_loss": -5.5299482345581055, "global_step": 33879, "epoch": 806} {"train_loss": -5.438755035400391, "global_step": 33880, "epoch": 806} {"train_loss": -5.472389221191406, "global_step": 33881, "epoch": 806} {"train_loss": -5.559764862060547, "global_step": 33882, "epoch": 806} {"train_loss": -5.52321195602417, "global_step": 33883, "epoch": 806} {"train_loss": -5.491117477416992, "global_step": 33884, "epoch": 806} {"train_loss": -5.72513484954834, "global_step": 33885, "epoch": 806} {"train_loss": -5.586193084716797, "global_step": 33886, "epoch": 806} {"train_loss": -5.407757759094238, "global_step": 33887, "epoch": 806} {"train_loss": -5.4806671142578125, "global_step": 33888, "epoch": 806} {"train_loss": -5.534316062927246, "global_step": 33889, "epoch": 806} {"train_loss": -5.497991561889648, "global_step": 33890, "epoch": 806} {"train_loss": -5.576662063598633, "global_step": 33891, "epoch": 806} {"train_loss": -5.41219425201416, "global_step": 33892, "epoch": 806} {"train_loss": -5.531712747755504, "global_step": 33893, "epoch": 806, "val_loss": 66458.8359375} {"train_loss": -5.532840251922607, "global_step": 33894, "epoch": 807} {"train_loss": -5.490926742553711, "global_step": 33895, "epoch": 807} {"train_loss": -5.565017223358154, "global_step": 33896, "epoch": 807} {"train_loss": -5.738192558288574, "global_step": 33897, "epoch": 807} {"train_loss": -5.485773086547852, "global_step": 33898, "epoch": 807} {"train_loss": -5.5961713790893555, "global_step": 33899, "epoch": 807} {"train_loss": -5.563909530639648, "global_step": 33900, "epoch": 807} {"train_loss": -5.503692626953125, "global_step": 33901, "epoch": 807} {"train_loss": -5.524450302124023, "global_step": 33902, "epoch": 807} {"train_loss": -5.498626708984375, "global_step": 33903, "epoch": 807} {"train_loss": -5.595386505126953, "global_step": 33904, "epoch": 807} {"train_loss": -5.51917839050293, "global_step": 33905, "epoch": 807} {"train_loss": -5.543929576873779, "global_step": 33906, "epoch": 807} {"train_loss": -5.433154106140137, "global_step": 33907, "epoch": 807} {"train_loss": -5.546567440032959, "global_step": 33908, "epoch": 807} {"train_loss": -5.556406021118164, "global_step": 33909, "epoch": 807} {"train_loss": -5.530345916748047, "global_step": 33910, "epoch": 807} {"train_loss": -5.554337501525879, "global_step": 33911, "epoch": 807} {"train_loss": -5.496589660644531, "global_step": 33912, "epoch": 807} {"train_loss": -5.616708755493164, "global_step": 33913, "epoch": 807} {"train_loss": -5.3823323249816895, "global_step": 33914, "epoch": 807} {"train_loss": -5.468934059143066, "global_step": 33915, "epoch": 807} {"train_loss": -5.63095235824585, "global_step": 33916, "epoch": 807} {"train_loss": -5.643651008605957, "global_step": 33917, "epoch": 807} {"train_loss": -5.596708297729492, "global_step": 33918, "epoch": 807} {"train_loss": -5.534359931945801, "global_step": 33919, "epoch": 807} {"train_loss": -5.569300174713135, "global_step": 33920, "epoch": 807} {"train_loss": -5.682239055633545, "global_step": 33921, "epoch": 807} {"train_loss": -5.6905198097229, "global_step": 33922, "epoch": 807} {"train_loss": -5.450016975402832, "global_step": 33923, "epoch": 807} {"train_loss": -5.471784591674805, "global_step": 33924, "epoch": 807} {"train_loss": -5.457424640655518, "global_step": 33925, "epoch": 807} {"train_loss": -5.489861488342285, "global_step": 33926, "epoch": 807} {"train_loss": -5.460514068603516, "global_step": 33927, "epoch": 807} {"train_loss": -5.58134651184082, "global_step": 33928, "epoch": 807} {"train_loss": -5.527214527130127, "global_step": 33929, "epoch": 807} {"train_loss": -5.391226768493652, "global_step": 33930, "epoch": 807} {"train_loss": -5.577446937561035, "global_step": 33931, "epoch": 807} {"train_loss": -5.290562629699707, "global_step": 33932, "epoch": 807} {"train_loss": -5.546055793762207, "global_step": 33933, "epoch": 807} {"train_loss": -5.435122966766357, "global_step": 33934, "epoch": 807} {"train_loss": -5.529862858000255, "global_step": 33935, "epoch": 807, "val_loss": 66401.3046875} {"train_loss": -5.577530860900879, "global_step": 33936, "epoch": 808} {"train_loss": -5.48126220703125, "global_step": 33937, "epoch": 808} {"train_loss": -5.655416488647461, "global_step": 33938, "epoch": 808} {"train_loss": -5.57501220703125, "global_step": 33939, "epoch": 808} {"train_loss": -5.61289119720459, "global_step": 33940, "epoch": 808} {"train_loss": -5.535922050476074, "global_step": 33941, "epoch": 808} {"train_loss": -5.535392761230469, "global_step": 33942, "epoch": 808} {"train_loss": -5.556849479675293, "global_step": 33943, "epoch": 808} {"train_loss": -5.6303253173828125, "global_step": 33944, "epoch": 808} {"train_loss": -5.664363861083984, "global_step": 33945, "epoch": 808} {"train_loss": -5.616186141967773, "global_step": 33946, "epoch": 808} {"train_loss": -5.603626251220703, "global_step": 33947, "epoch": 808} {"train_loss": -5.614394664764404, "global_step": 33948, "epoch": 808} {"train_loss": -5.451862335205078, "global_step": 33949, "epoch": 808} {"train_loss": -5.611790657043457, "global_step": 33950, "epoch": 808} {"train_loss": -5.681943893432617, "global_step": 33951, "epoch": 808} {"train_loss": -5.598313808441162, "global_step": 33952, "epoch": 808} {"train_loss": -5.644093990325928, "global_step": 33953, "epoch": 808} {"train_loss": -5.487510681152344, "global_step": 33954, "epoch": 808} {"train_loss": -5.5725202560424805, "global_step": 33955, "epoch": 808} {"train_loss": -5.613770961761475, "global_step": 33956, "epoch": 808} {"train_loss": -5.593916416168213, "global_step": 33957, "epoch": 808} {"train_loss": -5.583665370941162, "global_step": 33958, "epoch": 808} {"train_loss": -5.537940979003906, "global_step": 33959, "epoch": 808} {"train_loss": -5.463020324707031, "global_step": 33960, "epoch": 808} {"train_loss": -5.589310646057129, "global_step": 33961, "epoch": 808} {"train_loss": -5.421350479125977, "global_step": 33962, "epoch": 808} {"train_loss": -5.346395969390869, "global_step": 33963, "epoch": 808} {"train_loss": -5.568563938140869, "global_step": 33964, "epoch": 808} {"train_loss": -5.555520534515381, "global_step": 33965, "epoch": 808} {"train_loss": -5.641725540161133, "global_step": 33966, "epoch": 808} {"train_loss": -5.451449394226074, "global_step": 33967, "epoch": 808} {"train_loss": -5.503870487213135, "global_step": 33968, "epoch": 808} {"train_loss": -5.654674053192139, "global_step": 33969, "epoch": 808} {"train_loss": -5.595822334289551, "global_step": 33970, "epoch": 808} {"train_loss": -5.638274192810059, "global_step": 33971, "epoch": 808} {"train_loss": -5.529983997344971, "global_step": 33972, "epoch": 808} {"train_loss": -5.524597644805908, "global_step": 33973, "epoch": 808} {"train_loss": -5.601869583129883, "global_step": 33974, "epoch": 808} {"train_loss": -5.50168514251709, "global_step": 33975, "epoch": 808} {"train_loss": -5.604914665222168, "global_step": 33976, "epoch": 808} {"train_loss": -5.566679000854492, "global_step": 33977, "epoch": 808, "val_loss": 66201.671875} {"train_loss": -5.467740058898926, "global_step": 33978, "epoch": 809} {"train_loss": -5.547199249267578, "global_step": 33979, "epoch": 809} {"train_loss": -5.551013469696045, "global_step": 33980, "epoch": 809} {"train_loss": -5.700151443481445, "global_step": 33981, "epoch": 809} {"train_loss": -5.6200971603393555, "global_step": 33982, "epoch": 809} {"train_loss": -5.515782356262207, "global_step": 33983, "epoch": 809} {"train_loss": -5.597236156463623, "global_step": 33984, "epoch": 809} {"train_loss": -5.645989418029785, "global_step": 33985, "epoch": 809} {"train_loss": -5.5853071212768555, "global_step": 33986, "epoch": 809} {"train_loss": -5.530398368835449, "global_step": 33987, "epoch": 809} {"train_loss": -5.4593000411987305, "global_step": 33988, "epoch": 809} {"train_loss": -5.472928047180176, "global_step": 33989, "epoch": 809} {"train_loss": -5.275141716003418, "global_step": 33990, "epoch": 809} {"train_loss": -5.502315521240234, "global_step": 33991, "epoch": 809} {"train_loss": -5.586658477783203, "global_step": 33992, "epoch": 809} {"train_loss": -5.446483135223389, "global_step": 33993, "epoch": 809} {"train_loss": -5.515504360198975, "global_step": 33994, "epoch": 809} {"train_loss": -5.462725639343262, "global_step": 33995, "epoch": 809} {"train_loss": -5.520491600036621, "global_step": 33996, "epoch": 809} {"train_loss": -5.454968452453613, "global_step": 33997, "epoch": 809} {"train_loss": -5.442893981933594, "global_step": 33998, "epoch": 809} {"train_loss": -5.535717487335205, "global_step": 33999, "epoch": 809} {"train_loss": -5.47230339050293, "global_step": 34000, "epoch": 809} {"train_loss": -5.551031589508057, "global_step": 34001, "epoch": 809} {"train_loss": -5.437748908996582, "global_step": 34002, "epoch": 809} {"train_loss": -5.500245571136475, "global_step": 34003, "epoch": 809} {"train_loss": -5.330302715301514, "global_step": 34004, "epoch": 809} {"train_loss": -5.549532890319824, "global_step": 34005, "epoch": 809} {"train_loss": -5.4150896072387695, "global_step": 34006, "epoch": 809} {"train_loss": -5.402902603149414, "global_step": 34007, "epoch": 809} {"train_loss": -5.416074275970459, "global_step": 34008, "epoch": 809} {"train_loss": -5.387884140014648, "global_step": 34009, "epoch": 809} {"train_loss": -5.411750316619873, "global_step": 34010, "epoch": 809} {"train_loss": -5.420958518981934, "global_step": 34011, "epoch": 809} {"train_loss": -5.4470391273498535, "global_step": 34012, "epoch": 809} {"train_loss": -5.315207481384277, "global_step": 34013, "epoch": 809} {"train_loss": -5.455754280090332, "global_step": 34014, "epoch": 809} {"train_loss": -5.388250350952148, "global_step": 34015, "epoch": 809} {"train_loss": -5.311485767364502, "global_step": 34016, "epoch": 809} {"train_loss": -5.38398551940918, "global_step": 34017, "epoch": 809} {"train_loss": -5.518819332122803, "global_step": 34018, "epoch": 809} {"train_loss": -5.474847838992164, "global_step": 34019, "epoch": 809, "val_loss": 67368.4453125} {"train_loss": -5.473361015319824, "global_step": 34020, "epoch": 810} {"train_loss": -5.487371444702148, "global_step": 34021, "epoch": 810} {"train_loss": -5.58209753036499, "global_step": 34022, "epoch": 810} {"train_loss": -5.51464319229126, "global_step": 34023, "epoch": 810} {"train_loss": -5.392919540405273, "global_step": 34024, "epoch": 810} {"train_loss": -5.335134983062744, "global_step": 34025, "epoch": 810} {"train_loss": -5.6005401611328125, "global_step": 34026, "epoch": 810} {"train_loss": -5.366555213928223, "global_step": 34027, "epoch": 810} {"train_loss": -5.481236457824707, "global_step": 34028, "epoch": 810} {"train_loss": -5.414700031280518, "global_step": 34029, "epoch": 810} {"train_loss": -5.645318031311035, "global_step": 34030, "epoch": 810} {"train_loss": -5.424223899841309, "global_step": 34031, "epoch": 810} {"train_loss": -5.534791469573975, "global_step": 34032, "epoch": 810} {"train_loss": -5.555943965911865, "global_step": 34033, "epoch": 810} {"train_loss": -5.635837554931641, "global_step": 34034, "epoch": 810} {"train_loss": -5.425004005432129, "global_step": 34035, "epoch": 810} {"train_loss": -5.510167598724365, "global_step": 34036, "epoch": 810} {"train_loss": -5.506839752197266, "global_step": 34037, "epoch": 810} {"train_loss": -5.45553731918335, "global_step": 34038, "epoch": 810} {"train_loss": -5.472372531890869, "global_step": 34039, "epoch": 810} {"train_loss": -5.510744094848633, "global_step": 34040, "epoch": 810} {"train_loss": -5.627130031585693, "global_step": 34041, "epoch": 810} {"train_loss": -5.436141014099121, "global_step": 34042, "epoch": 810} {"train_loss": -5.4753499031066895, "global_step": 34043, "epoch": 810} {"train_loss": -5.417255401611328, "global_step": 34044, "epoch": 810} {"train_loss": -5.391666412353516, "global_step": 34045, "epoch": 810} {"train_loss": -5.532037258148193, "global_step": 34046, "epoch": 810} {"train_loss": -5.467756271362305, "global_step": 34047, "epoch": 810} {"train_loss": -5.516915798187256, "global_step": 34048, "epoch": 810} {"train_loss": -5.583982467651367, "global_step": 34049, "epoch": 810} {"train_loss": -5.492489337921143, "global_step": 34050, "epoch": 810} {"train_loss": -5.441945552825928, "global_step": 34051, "epoch": 810} {"train_loss": -5.6116862297058105, "global_step": 34052, "epoch": 810} {"train_loss": -5.565617561340332, "global_step": 34053, "epoch": 810} {"train_loss": -5.533267021179199, "global_step": 34054, "epoch": 810} {"train_loss": -5.637847900390625, "global_step": 34055, "epoch": 810} {"train_loss": -5.5231404304504395, "global_step": 34056, "epoch": 810} {"train_loss": -5.598341464996338, "global_step": 34057, "epoch": 810} {"train_loss": -5.589273452758789, "global_step": 34058, "epoch": 810} {"train_loss": -5.615724563598633, "global_step": 34059, "epoch": 810} {"train_loss": -5.6158671379089355, "global_step": 34060, "epoch": 810} {"train_loss": -5.511183852241153, "global_step": 34061, "epoch": 810, "val_loss": 66745.3828125} {"train_loss": -5.610357761383057, "global_step": 34062, "epoch": 811} {"train_loss": -5.551792144775391, "global_step": 34063, "epoch": 811} {"train_loss": -5.510654449462891, "global_step": 34064, "epoch": 811} {"train_loss": -5.780223846435547, "global_step": 34065, "epoch": 811} {"train_loss": -5.529598236083984, "global_step": 34066, "epoch": 811} {"train_loss": -5.454775810241699, "global_step": 34067, "epoch": 811} {"train_loss": -5.5515971183776855, "global_step": 34068, "epoch": 811} {"train_loss": -5.546704292297363, "global_step": 34069, "epoch": 811} {"train_loss": -5.522703170776367, "global_step": 34070, "epoch": 811} {"train_loss": -5.515743255615234, "global_step": 34071, "epoch": 811} {"train_loss": -5.531418800354004, "global_step": 34072, "epoch": 811} {"train_loss": -5.500439643859863, "global_step": 34073, "epoch": 811} {"train_loss": -5.589198589324951, "global_step": 34074, "epoch": 811} {"train_loss": -5.562564849853516, "global_step": 34075, "epoch": 811} {"train_loss": -5.405441761016846, "global_step": 34076, "epoch": 811} {"train_loss": -5.6198296546936035, "global_step": 34077, "epoch": 811} {"train_loss": -5.5348052978515625, "global_step": 34078, "epoch": 811} {"train_loss": -5.636085510253906, "global_step": 34079, "epoch": 811} {"train_loss": -5.500292778015137, "global_step": 34080, "epoch": 811} {"train_loss": -5.433537483215332, "global_step": 34081, "epoch": 811} {"train_loss": -5.658356666564941, "global_step": 34082, "epoch": 811} {"train_loss": -5.61154317855835, "global_step": 34083, "epoch": 811} {"train_loss": -5.6032609939575195, "global_step": 34084, "epoch": 811} {"train_loss": -5.518023490905762, "global_step": 34085, "epoch": 811} {"train_loss": -5.529026985168457, "global_step": 34086, "epoch": 811} {"train_loss": -5.434971809387207, "global_step": 34087, "epoch": 811} {"train_loss": -5.470786094665527, "global_step": 34088, "epoch": 811} {"train_loss": -5.450557708740234, "global_step": 34089, "epoch": 811} {"train_loss": -5.634666919708252, "global_step": 34090, "epoch": 811} {"train_loss": -5.521764278411865, "global_step": 34091, "epoch": 811} {"train_loss": -5.553889274597168, "global_step": 34092, "epoch": 811} {"train_loss": -5.379161834716797, "global_step": 34093, "epoch": 811} {"train_loss": -5.402097702026367, "global_step": 34094, "epoch": 811} {"train_loss": -5.434210777282715, "global_step": 34095, "epoch": 811} {"train_loss": -5.489104270935059, "global_step": 34096, "epoch": 811} {"train_loss": -5.615224838256836, "global_step": 34097, "epoch": 811} {"train_loss": -5.575331211090088, "global_step": 34098, "epoch": 811} {"train_loss": -5.388527870178223, "global_step": 34099, "epoch": 811} {"train_loss": -5.457858085632324, "global_step": 34100, "epoch": 811} {"train_loss": -5.599387168884277, "global_step": 34101, "epoch": 811} {"train_loss": -5.471485137939453, "global_step": 34102, "epoch": 811} {"train_loss": -5.526189713251023, "global_step": 34103, "epoch": 811, "val_loss": 66753.1328125} {"train_loss": -5.5643768310546875, "global_step": 34104, "epoch": 812} {"train_loss": -5.433259963989258, "global_step": 34105, "epoch": 812} {"train_loss": -5.5252485275268555, "global_step": 34106, "epoch": 812} {"train_loss": -5.497479438781738, "global_step": 34107, "epoch": 812} {"train_loss": -5.576744079589844, "global_step": 34108, "epoch": 812} {"train_loss": -5.548438549041748, "global_step": 34109, "epoch": 812} {"train_loss": -5.500628471374512, "global_step": 34110, "epoch": 812} {"train_loss": -5.479634761810303, "global_step": 34111, "epoch": 812} {"train_loss": -5.383233070373535, "global_step": 34112, "epoch": 812} {"train_loss": -5.507989883422852, "global_step": 34113, "epoch": 812} {"train_loss": -5.6040239334106445, "global_step": 34114, "epoch": 812} {"train_loss": -5.517606258392334, "global_step": 34115, "epoch": 812} {"train_loss": -5.482156276702881, "global_step": 34116, "epoch": 812} {"train_loss": -5.615478515625, "global_step": 34117, "epoch": 812} {"train_loss": -5.520434379577637, "global_step": 34118, "epoch": 812} {"train_loss": -5.520595550537109, "global_step": 34119, "epoch": 812} {"train_loss": -5.586667537689209, "global_step": 34120, "epoch": 812} {"train_loss": -5.511073112487793, "global_step": 34121, "epoch": 812} {"train_loss": -5.670288562774658, "global_step": 34122, "epoch": 812} {"train_loss": -5.5188493728637695, "global_step": 34123, "epoch": 812} {"train_loss": -5.534615516662598, "global_step": 34124, "epoch": 812} {"train_loss": -5.577350616455078, "global_step": 34125, "epoch": 812} {"train_loss": -5.5273823738098145, "global_step": 34126, "epoch": 812} {"train_loss": -5.55694580078125, "global_step": 34127, "epoch": 812} {"train_loss": -5.552333354949951, "global_step": 34128, "epoch": 812} {"train_loss": -5.490139007568359, "global_step": 34129, "epoch": 812} {"train_loss": -5.526957988739014, "global_step": 34130, "epoch": 812} {"train_loss": -5.61170768737793, "global_step": 34131, "epoch": 812} {"train_loss": -5.4400410652160645, "global_step": 34132, "epoch": 812} {"train_loss": -5.572419166564941, "global_step": 34133, "epoch": 812} {"train_loss": -5.499210357666016, "global_step": 34134, "epoch": 812} {"train_loss": -5.567914009094238, "global_step": 34135, "epoch": 812} {"train_loss": -5.508835315704346, "global_step": 34136, "epoch": 812} {"train_loss": -5.484480857849121, "global_step": 34137, "epoch": 812} {"train_loss": -5.546915531158447, "global_step": 34138, "epoch": 812} {"train_loss": -5.625368118286133, "global_step": 34139, "epoch": 812} {"train_loss": -5.611358642578125, "global_step": 34140, "epoch": 812} {"train_loss": -5.518139839172363, "global_step": 34141, "epoch": 812} {"train_loss": -5.594305038452148, "global_step": 34142, "epoch": 812} {"train_loss": -5.409407615661621, "global_step": 34143, "epoch": 812} {"train_loss": -5.695365905761719, "global_step": 34144, "epoch": 812} {"train_loss": -5.536791880925496, "global_step": 34145, "epoch": 812, "val_loss": 66264.6875} {"train_loss": -5.58144474029541, "global_step": 34146, "epoch": 813} {"train_loss": -5.676541805267334, "global_step": 34147, "epoch": 813} {"train_loss": -5.804137706756592, "global_step": 34148, "epoch": 813} {"train_loss": -5.560370922088623, "global_step": 34149, "epoch": 813} {"train_loss": -5.470701694488525, "global_step": 34150, "epoch": 813} {"train_loss": -5.589016437530518, "global_step": 34151, "epoch": 813} {"train_loss": -5.573651313781738, "global_step": 34152, "epoch": 813} {"train_loss": -5.633604049682617, "global_step": 34153, "epoch": 813} {"train_loss": -5.681291103363037, "global_step": 34154, "epoch": 813} {"train_loss": -5.5946831703186035, "global_step": 34155, "epoch": 813} {"train_loss": -5.578073501586914, "global_step": 34156, "epoch": 813} {"train_loss": -5.423150062561035, "global_step": 34157, "epoch": 813} {"train_loss": -5.432612419128418, "global_step": 34158, "epoch": 813} {"train_loss": -5.531181335449219, "global_step": 34159, "epoch": 813} {"train_loss": -5.550200939178467, "global_step": 34160, "epoch": 813} {"train_loss": -5.433587074279785, "global_step": 34161, "epoch": 813} {"train_loss": -5.574295520782471, "global_step": 34162, "epoch": 813} {"train_loss": -5.42943000793457, "global_step": 34163, "epoch": 813} {"train_loss": -5.6129584312438965, "global_step": 34164, "epoch": 813} {"train_loss": -5.517873764038086, "global_step": 34165, "epoch": 813} {"train_loss": -5.548285007476807, "global_step": 34166, "epoch": 813} {"train_loss": -5.665888786315918, "global_step": 34167, "epoch": 813} {"train_loss": -5.559638023376465, "global_step": 34168, "epoch": 813} {"train_loss": -5.467365264892578, "global_step": 34169, "epoch": 813} {"train_loss": -5.601207733154297, "global_step": 34170, "epoch": 813} {"train_loss": -5.516707420349121, "global_step": 34171, "epoch": 813} {"train_loss": -5.486871719360352, "global_step": 34172, "epoch": 813} {"train_loss": -5.521963119506836, "global_step": 34173, "epoch": 813} {"train_loss": -5.5477447509765625, "global_step": 34174, "epoch": 813} {"train_loss": -5.47462272644043, "global_step": 34175, "epoch": 813} {"train_loss": -5.4969987869262695, "global_step": 34176, "epoch": 813} {"train_loss": -5.563191890716553, "global_step": 34177, "epoch": 813} {"train_loss": -5.6096296310424805, "global_step": 34178, "epoch": 813} {"train_loss": -5.443958282470703, "global_step": 34179, "epoch": 813} {"train_loss": -5.535547256469727, "global_step": 34180, "epoch": 813} {"train_loss": -5.480030059814453, "global_step": 34181, "epoch": 813} {"train_loss": -5.573570251464844, "global_step": 34182, "epoch": 813} {"train_loss": -5.5923752784729, "global_step": 34183, "epoch": 813} {"train_loss": -5.385556697845459, "global_step": 34184, "epoch": 813} {"train_loss": -5.747046947479248, "global_step": 34185, "epoch": 813} {"train_loss": -5.4904255867004395, "global_step": 34186, "epoch": 813} {"train_loss": -5.548098246256511, "global_step": 34187, "epoch": 813, "val_loss": 66443.6015625} {"train_loss": -5.66716194152832, "global_step": 34188, "epoch": 814} {"train_loss": -5.4356818199157715, "global_step": 34189, "epoch": 814} {"train_loss": -5.48614501953125, "global_step": 34190, "epoch": 814} {"train_loss": -5.477389812469482, "global_step": 34191, "epoch": 814} {"train_loss": -5.593020439147949, "global_step": 34192, "epoch": 814} {"train_loss": -5.565661907196045, "global_step": 34193, "epoch": 814} {"train_loss": -5.543104648590088, "global_step": 34194, "epoch": 814} {"train_loss": -5.5904364585876465, "global_step": 34195, "epoch": 814} {"train_loss": -5.497740745544434, "global_step": 34196, "epoch": 814} {"train_loss": -5.484311580657959, "global_step": 34197, "epoch": 814} {"train_loss": -5.65041446685791, "global_step": 34198, "epoch": 814} {"train_loss": -5.5117387771606445, "global_step": 34199, "epoch": 814} {"train_loss": -5.627350330352783, "global_step": 34200, "epoch": 814} {"train_loss": -5.457040786743164, "global_step": 34201, "epoch": 814} {"train_loss": -5.551922798156738, "global_step": 34202, "epoch": 814} {"train_loss": -5.53546142578125, "global_step": 34203, "epoch": 814} {"train_loss": -5.4563164710998535, "global_step": 34204, "epoch": 814} {"train_loss": -5.500570297241211, "global_step": 34205, "epoch": 814} {"train_loss": -5.597843170166016, "global_step": 34206, "epoch": 814} {"train_loss": -5.433722496032715, "global_step": 34207, "epoch": 814} {"train_loss": -5.633985996246338, "global_step": 34208, "epoch": 814} {"train_loss": -5.518224716186523, "global_step": 34209, "epoch": 814} {"train_loss": -5.517734050750732, "global_step": 34210, "epoch": 814} {"train_loss": -5.6096415519714355, "global_step": 34211, "epoch": 814} {"train_loss": -5.449163436889648, "global_step": 34212, "epoch": 814} {"train_loss": -5.618365287780762, "global_step": 34213, "epoch": 814} {"train_loss": -5.431872367858887, "global_step": 34214, "epoch": 814} {"train_loss": -5.47955322265625, "global_step": 34215, "epoch": 814} {"train_loss": -5.540514945983887, "global_step": 34216, "epoch": 814} {"train_loss": -5.564190864562988, "global_step": 34217, "epoch": 814} {"train_loss": -5.518543243408203, "global_step": 34218, "epoch": 814} {"train_loss": -5.4125800132751465, "global_step": 34219, "epoch": 814} {"train_loss": -5.379509925842285, "global_step": 34220, "epoch": 814} {"train_loss": -5.644672870635986, "global_step": 34221, "epoch": 814} {"train_loss": -5.482840061187744, "global_step": 34222, "epoch": 814} {"train_loss": -5.446613788604736, "global_step": 34223, "epoch": 814} {"train_loss": -5.553043842315674, "global_step": 34224, "epoch": 814} {"train_loss": -5.449638366699219, "global_step": 34225, "epoch": 814} {"train_loss": -5.428680419921875, "global_step": 34226, "epoch": 814} {"train_loss": -5.573239326477051, "global_step": 34227, "epoch": 814} {"train_loss": -5.645153045654297, "global_step": 34228, "epoch": 814} {"train_loss": -5.526806036631267, "global_step": 34229, "epoch": 814, "val_loss": 66265.3125} {"train_loss": -5.588211536407471, "global_step": 34230, "epoch": 815} {"train_loss": -5.448761940002441, "global_step": 34231, "epoch": 815} {"train_loss": -5.559099197387695, "global_step": 34232, "epoch": 815} {"train_loss": -5.502168655395508, "global_step": 34233, "epoch": 815} {"train_loss": -5.538936614990234, "global_step": 34234, "epoch": 815} {"train_loss": -5.687426567077637, "global_step": 34235, "epoch": 815} {"train_loss": -5.470817565917969, "global_step": 34236, "epoch": 815} {"train_loss": -5.617837429046631, "global_step": 34237, "epoch": 815} {"train_loss": -5.563085556030273, "global_step": 34238, "epoch": 815} {"train_loss": -5.4708075523376465, "global_step": 34239, "epoch": 815} {"train_loss": -5.497336387634277, "global_step": 34240, "epoch": 815} {"train_loss": -5.552462100982666, "global_step": 34241, "epoch": 815} {"train_loss": -5.527727127075195, "global_step": 34242, "epoch": 815} {"train_loss": -5.582824230194092, "global_step": 34243, "epoch": 815} {"train_loss": -5.563106060028076, "global_step": 34244, "epoch": 815} {"train_loss": -5.511889457702637, "global_step": 34245, "epoch": 815} {"train_loss": -5.5585618019104, "global_step": 34246, "epoch": 815} {"train_loss": -5.835258960723877, "global_step": 34247, "epoch": 815} {"train_loss": -5.608246803283691, "global_step": 34248, "epoch": 815} {"train_loss": -5.534146308898926, "global_step": 34249, "epoch": 815} {"train_loss": -5.5312299728393555, "global_step": 34250, "epoch": 815} {"train_loss": -5.542702674865723, "global_step": 34251, "epoch": 815} {"train_loss": -5.560047149658203, "global_step": 34252, "epoch": 815} {"train_loss": -5.529762268066406, "global_step": 34253, "epoch": 815} {"train_loss": -5.616418838500977, "global_step": 34254, "epoch": 815} {"train_loss": -5.629681587219238, "global_step": 34255, "epoch": 815} {"train_loss": -5.377542018890381, "global_step": 34256, "epoch": 815} {"train_loss": -5.4203290939331055, "global_step": 34257, "epoch": 815} {"train_loss": -5.438727855682373, "global_step": 34258, "epoch": 815} {"train_loss": -5.481925010681152, "global_step": 34259, "epoch": 815} {"train_loss": -5.423343658447266, "global_step": 34260, "epoch": 815} {"train_loss": -5.469345569610596, "global_step": 34261, "epoch": 815} {"train_loss": -5.462153434753418, "global_step": 34262, "epoch": 815} {"train_loss": -5.516107082366943, "global_step": 34263, "epoch": 815} {"train_loss": -5.428647994995117, "global_step": 34264, "epoch": 815} {"train_loss": -5.440121650695801, "global_step": 34265, "epoch": 815} {"train_loss": -5.457768440246582, "global_step": 34266, "epoch": 815} {"train_loss": -5.544553756713867, "global_step": 34267, "epoch": 815} {"train_loss": -5.621715068817139, "global_step": 34268, "epoch": 815} {"train_loss": -5.57819938659668, "global_step": 34269, "epoch": 815} {"train_loss": -5.541926860809326, "global_step": 34270, "epoch": 815} {"train_loss": -5.532879261743455, "global_step": 34271, "epoch": 815, "val_loss": 66323.765625} {"train_loss": -5.494598388671875, "global_step": 34272, "epoch": 816} {"train_loss": -5.592979431152344, "global_step": 34273, "epoch": 816} {"train_loss": -5.6163225173950195, "global_step": 34274, "epoch": 816} {"train_loss": -5.502636432647705, "global_step": 34275, "epoch": 816} {"train_loss": -5.494367599487305, "global_step": 34276, "epoch": 816} {"train_loss": -5.514854907989502, "global_step": 34277, "epoch": 816} {"train_loss": -5.535665035247803, "global_step": 34278, "epoch": 816} {"train_loss": -5.58380126953125, "global_step": 34279, "epoch": 816} {"train_loss": -5.496554374694824, "global_step": 34280, "epoch": 816} {"train_loss": -5.549503326416016, "global_step": 34281, "epoch": 816} {"train_loss": -5.535049915313721, "global_step": 34282, "epoch": 816} {"train_loss": -5.60595703125, "global_step": 34283, "epoch": 816} {"train_loss": -5.357179641723633, "global_step": 34284, "epoch": 816} {"train_loss": -5.549144268035889, "global_step": 34285, "epoch": 816} {"train_loss": -5.423279762268066, "global_step": 34286, "epoch": 816} {"train_loss": -5.570273399353027, "global_step": 34287, "epoch": 816} {"train_loss": -5.488160610198975, "global_step": 34288, "epoch": 816} {"train_loss": -5.597712993621826, "global_step": 34289, "epoch": 816} {"train_loss": -5.468498706817627, "global_step": 34290, "epoch": 816} {"train_loss": -5.61466121673584, "global_step": 34291, "epoch": 816} {"train_loss": -5.673186302185059, "global_step": 34292, "epoch": 816} {"train_loss": -5.649544715881348, "global_step": 34293, "epoch": 816} {"train_loss": -5.514758586883545, "global_step": 34294, "epoch": 816} {"train_loss": -5.54624605178833, "global_step": 34295, "epoch": 816} {"train_loss": -5.468418121337891, "global_step": 34296, "epoch": 816} {"train_loss": -5.6529541015625, "global_step": 34297, "epoch": 816} {"train_loss": -5.794568061828613, "global_step": 34298, "epoch": 816} {"train_loss": -5.566839218139648, "global_step": 34299, "epoch": 816} {"train_loss": -5.466115951538086, "global_step": 34300, "epoch": 816} {"train_loss": -5.676957130432129, "global_step": 34301, "epoch": 816} {"train_loss": -5.563750267028809, "global_step": 34302, "epoch": 816} {"train_loss": -5.460843086242676, "global_step": 34303, "epoch": 816} {"train_loss": -5.347022533416748, "global_step": 34304, "epoch": 816} {"train_loss": -5.593816757202148, "global_step": 34305, "epoch": 816} {"train_loss": -5.591739654541016, "global_step": 34306, "epoch": 816} {"train_loss": -5.472407341003418, "global_step": 34307, "epoch": 816} {"train_loss": -5.626955986022949, "global_step": 34308, "epoch": 816} {"train_loss": -5.594013690948486, "global_step": 34309, "epoch": 816} {"train_loss": -5.636040687561035, "global_step": 34310, "epoch": 816} {"train_loss": -5.506171703338623, "global_step": 34311, "epoch": 816} {"train_loss": -5.476556777954102, "global_step": 34312, "epoch": 816} {"train_loss": -5.5501737254006525, "global_step": 34313, "epoch": 816, "val_loss": 66519.2578125} {"train_loss": -5.422512054443359, "global_step": 34314, "epoch": 817} {"train_loss": -5.582886695861816, "global_step": 34315, "epoch": 817} {"train_loss": -5.533712387084961, "global_step": 34316, "epoch": 817} {"train_loss": -5.644798278808594, "global_step": 34317, "epoch": 817} {"train_loss": -5.613585472106934, "global_step": 34318, "epoch": 817} {"train_loss": -5.537057876586914, "global_step": 34319, "epoch": 817} {"train_loss": -5.618940353393555, "global_step": 34320, "epoch": 817} {"train_loss": -5.497426509857178, "global_step": 34321, "epoch": 817} {"train_loss": -5.487339973449707, "global_step": 34322, "epoch": 817} {"train_loss": -5.548577785491943, "global_step": 34323, "epoch": 817} {"train_loss": -5.505661964416504, "global_step": 34324, "epoch": 817} {"train_loss": -5.428068161010742, "global_step": 34325, "epoch": 817} {"train_loss": -5.453643321990967, "global_step": 34326, "epoch": 817} {"train_loss": -5.602572441101074, "global_step": 34327, "epoch": 817} {"train_loss": -5.565006256103516, "global_step": 34328, "epoch": 817} {"train_loss": -5.505455017089844, "global_step": 34329, "epoch": 817} {"train_loss": -5.4021148681640625, "global_step": 34330, "epoch": 817} {"train_loss": -5.49515962600708, "global_step": 34331, "epoch": 817} {"train_loss": -5.619218826293945, "global_step": 34332, "epoch": 817} {"train_loss": -5.566683769226074, "global_step": 34333, "epoch": 817} {"train_loss": -5.561185836791992, "global_step": 34334, "epoch": 817} {"train_loss": -5.499509811401367, "global_step": 34335, "epoch": 817} {"train_loss": -5.553937911987305, "global_step": 34336, "epoch": 817} {"train_loss": -5.683438301086426, "global_step": 34337, "epoch": 817} {"train_loss": -5.553967475891113, "global_step": 34338, "epoch": 817} {"train_loss": -5.609819412231445, "global_step": 34339, "epoch": 817} {"train_loss": -5.556938171386719, "global_step": 34340, "epoch": 817} {"train_loss": -5.5947160720825195, "global_step": 34341, "epoch": 817} {"train_loss": -5.459386825561523, "global_step": 34342, "epoch": 817} {"train_loss": -5.535606384277344, "global_step": 34343, "epoch": 817} {"train_loss": -5.547850608825684, "global_step": 34344, "epoch": 817} {"train_loss": -5.58497428894043, "global_step": 34345, "epoch": 817} {"train_loss": -5.542553901672363, "global_step": 34346, "epoch": 817} {"train_loss": -5.598490238189697, "global_step": 34347, "epoch": 817} {"train_loss": -5.549843788146973, "global_step": 34348, "epoch": 817} {"train_loss": -5.52168083190918, "global_step": 34349, "epoch": 817} {"train_loss": -5.554013252258301, "global_step": 34350, "epoch": 817} {"train_loss": -5.648643493652344, "global_step": 34351, "epoch": 817} {"train_loss": -5.5106000900268555, "global_step": 34352, "epoch": 817} {"train_loss": -5.560432434082031, "global_step": 34353, "epoch": 817} {"train_loss": -5.604063987731934, "global_step": 34354, "epoch": 817} {"train_loss": -5.5515948704310825, "global_step": 34355, "epoch": 817, "val_loss": 66489.015625} {"train_loss": -5.5147294998168945, "global_step": 34356, "epoch": 818} {"train_loss": -5.489282131195068, "global_step": 34357, "epoch": 818} {"train_loss": -5.595765113830566, "global_step": 34358, "epoch": 818} {"train_loss": -5.61585807800293, "global_step": 34359, "epoch": 818} {"train_loss": -5.634235858917236, "global_step": 34360, "epoch": 818} {"train_loss": -5.655736446380615, "global_step": 34361, "epoch": 818} {"train_loss": -5.492327690124512, "global_step": 34362, "epoch": 818} {"train_loss": -5.51529598236084, "global_step": 34363, "epoch": 818} {"train_loss": -5.584406852722168, "global_step": 34364, "epoch": 818} {"train_loss": -5.497556686401367, "global_step": 34365, "epoch": 818} {"train_loss": -5.643750190734863, "global_step": 34366, "epoch": 818} {"train_loss": -5.6410417556762695, "global_step": 34367, "epoch": 818} {"train_loss": -5.562016487121582, "global_step": 34368, "epoch": 818} {"train_loss": -5.5472917556762695, "global_step": 34369, "epoch": 818} {"train_loss": -5.708144187927246, "global_step": 34370, "epoch": 818} {"train_loss": -5.646332740783691, "global_step": 34371, "epoch": 818} {"train_loss": -5.471475601196289, "global_step": 34372, "epoch": 818} {"train_loss": -5.54619836807251, "global_step": 34373, "epoch": 818} {"train_loss": -5.373112678527832, "global_step": 34374, "epoch": 818} {"train_loss": -5.5637617111206055, "global_step": 34375, "epoch": 818} {"train_loss": -5.5409464836120605, "global_step": 34376, "epoch": 818} {"train_loss": -5.372381210327148, "global_step": 34377, "epoch": 818} {"train_loss": -5.560643196105957, "global_step": 34378, "epoch": 818} {"train_loss": -5.513940811157227, "global_step": 34379, "epoch": 818} {"train_loss": -5.401140213012695, "global_step": 34380, "epoch": 818} {"train_loss": -5.6684160232543945, "global_step": 34381, "epoch": 818} {"train_loss": -5.4159932136535645, "global_step": 34382, "epoch": 818} {"train_loss": -5.669536590576172, "global_step": 34383, "epoch": 818} {"train_loss": -5.638040542602539, "global_step": 34384, "epoch": 818} {"train_loss": -5.459819793701172, "global_step": 34385, "epoch": 818} {"train_loss": -5.515432834625244, "global_step": 34386, "epoch": 818} {"train_loss": -5.504135608673096, "global_step": 34387, "epoch": 818} {"train_loss": -5.562840461730957, "global_step": 34388, "epoch": 818} {"train_loss": -5.524365425109863, "global_step": 34389, "epoch": 818} {"train_loss": -5.456090450286865, "global_step": 34390, "epoch": 818} {"train_loss": -5.3972063064575195, "global_step": 34391, "epoch": 818} {"train_loss": -5.424655914306641, "global_step": 34392, "epoch": 818} {"train_loss": -5.4200286865234375, "global_step": 34393, "epoch": 818} {"train_loss": -5.442789077758789, "global_step": 34394, "epoch": 818} {"train_loss": -5.530879974365234, "global_step": 34395, "epoch": 818} {"train_loss": -5.548229217529297, "global_step": 34396, "epoch": 818} {"train_loss": -5.535760334559849, "global_step": 34397, "epoch": 818, "val_loss": 66645.3046875} {"train_loss": -5.589914798736572, "global_step": 34398, "epoch": 819} {"train_loss": -5.567742347717285, "global_step": 34399, "epoch": 819} {"train_loss": -5.596812725067139, "global_step": 34400, "epoch": 819} {"train_loss": -5.536312103271484, "global_step": 34401, "epoch": 819} {"train_loss": -5.688933849334717, "global_step": 34402, "epoch": 819} {"train_loss": -5.583270072937012, "global_step": 34403, "epoch": 819} {"train_loss": -5.569717884063721, "global_step": 34404, "epoch": 819} {"train_loss": -5.551778316497803, "global_step": 34405, "epoch": 819} {"train_loss": -5.558706283569336, "global_step": 34406, "epoch": 819} {"train_loss": -5.508116245269775, "global_step": 34407, "epoch": 819} {"train_loss": -5.447541236877441, "global_step": 34408, "epoch": 819} {"train_loss": -5.558899879455566, "global_step": 34409, "epoch": 819} {"train_loss": -5.561180114746094, "global_step": 34410, "epoch": 819} {"train_loss": -5.490867614746094, "global_step": 34411, "epoch": 819} {"train_loss": -5.634940147399902, "global_step": 34412, "epoch": 819} {"train_loss": -5.629066467285156, "global_step": 34413, "epoch": 819} {"train_loss": -5.553470611572266, "global_step": 34414, "epoch": 819} {"train_loss": -5.4631476402282715, "global_step": 34415, "epoch": 819} {"train_loss": -5.613251686096191, "global_step": 34416, "epoch": 819} {"train_loss": -5.615873336791992, "global_step": 34417, "epoch": 819} {"train_loss": -5.50086784362793, "global_step": 34418, "epoch": 819} {"train_loss": -5.559494972229004, "global_step": 34419, "epoch": 819} {"train_loss": -5.6682820320129395, "global_step": 34420, "epoch": 819} {"train_loss": -5.64616060256958, "global_step": 34421, "epoch": 819} {"train_loss": -5.490986347198486, "global_step": 34422, "epoch": 819} {"train_loss": -5.587827682495117, "global_step": 34423, "epoch": 819} {"train_loss": -5.4616594314575195, "global_step": 34424, "epoch": 819} {"train_loss": -5.469635963439941, "global_step": 34425, "epoch": 819} {"train_loss": -5.569778919219971, "global_step": 34426, "epoch": 819} {"train_loss": -5.607865333557129, "global_step": 34427, "epoch": 819} {"train_loss": -5.600818634033203, "global_step": 34428, "epoch": 819} {"train_loss": -5.482834815979004, "global_step": 34429, "epoch": 819} {"train_loss": -5.46073055267334, "global_step": 34430, "epoch": 819} {"train_loss": -5.516088485717773, "global_step": 34431, "epoch": 819} {"train_loss": -5.595761299133301, "global_step": 34432, "epoch": 819} {"train_loss": -5.639688968658447, "global_step": 34433, "epoch": 819} {"train_loss": -5.485860347747803, "global_step": 34434, "epoch": 819} {"train_loss": -5.527673721313477, "global_step": 34435, "epoch": 819} {"train_loss": -5.467645168304443, "global_step": 34436, "epoch": 819} {"train_loss": -5.497998237609863, "global_step": 34437, "epoch": 819} {"train_loss": -5.55333137512207, "global_step": 34438, "epoch": 819} {"train_loss": -5.5519691081274125, "global_step": 34439, "epoch": 819, "val_loss": 66931.6015625} {"train_loss": -5.706821441650391, "global_step": 34440, "epoch": 820} {"train_loss": -5.50666618347168, "global_step": 34441, "epoch": 820} {"train_loss": -5.580653190612793, "global_step": 34442, "epoch": 820} {"train_loss": -5.514997482299805, "global_step": 34443, "epoch": 820} {"train_loss": -5.565151214599609, "global_step": 34444, "epoch": 820} {"train_loss": -5.631458759307861, "global_step": 34445, "epoch": 820} {"train_loss": -5.525490760803223, "global_step": 34446, "epoch": 820} {"train_loss": -5.6115007400512695, "global_step": 34447, "epoch": 820} {"train_loss": -5.45733642578125, "global_step": 34448, "epoch": 820} {"train_loss": -5.608851432800293, "global_step": 34449, "epoch": 820} {"train_loss": -5.411661624908447, "global_step": 34450, "epoch": 820} {"train_loss": -5.708861827850342, "global_step": 34451, "epoch": 820} {"train_loss": -5.497074127197266, "global_step": 34452, "epoch": 820} {"train_loss": -5.597915172576904, "global_step": 34453, "epoch": 820} {"train_loss": -5.483821868896484, "global_step": 34454, "epoch": 820} {"train_loss": -5.536451816558838, "global_step": 34455, "epoch": 820} {"train_loss": -5.612071514129639, "global_step": 34456, "epoch": 820} {"train_loss": -5.546313285827637, "global_step": 34457, "epoch": 820} {"train_loss": -5.578326225280762, "global_step": 34458, "epoch": 820} {"train_loss": -5.615163803100586, "global_step": 34459, "epoch": 820} {"train_loss": -5.510083198547363, "global_step": 34460, "epoch": 820} {"train_loss": -5.521337032318115, "global_step": 34461, "epoch": 820} {"train_loss": -5.5799055099487305, "global_step": 34462, "epoch": 820} {"train_loss": -5.451346397399902, "global_step": 34463, "epoch": 820} {"train_loss": -5.608216285705566, "global_step": 34464, "epoch": 820} {"train_loss": -5.484584808349609, "global_step": 34465, "epoch": 820} {"train_loss": -5.467661380767822, "global_step": 34466, "epoch": 820} {"train_loss": -5.507670879364014, "global_step": 34467, "epoch": 820} {"train_loss": -5.5464887619018555, "global_step": 34468, "epoch": 820} {"train_loss": -5.604829788208008, "global_step": 34469, "epoch": 820} {"train_loss": -5.55136775970459, "global_step": 34470, "epoch": 820} {"train_loss": -5.521803855895996, "global_step": 34471, "epoch": 820} {"train_loss": -5.52922248840332, "global_step": 34472, "epoch": 820} {"train_loss": -5.344115257263184, "global_step": 34473, "epoch": 820} {"train_loss": -5.525843143463135, "global_step": 34474, "epoch": 820} {"train_loss": -5.585983753204346, "global_step": 34475, "epoch": 820} {"train_loss": -5.531159400939941, "global_step": 34476, "epoch": 820} {"train_loss": -5.505853652954102, "global_step": 34477, "epoch": 820} {"train_loss": -5.539399147033691, "global_step": 34478, "epoch": 820} {"train_loss": -5.564300537109375, "global_step": 34479, "epoch": 820} {"train_loss": -5.570868015289307, "global_step": 34480, "epoch": 820} {"train_loss": -5.547240631920951, "global_step": 34481, "epoch": 820, "val_loss": 67045.484375} {"train_loss": -5.536940097808838, "global_step": 34482, "epoch": 821} {"train_loss": -5.396844387054443, "global_step": 34483, "epoch": 821} {"train_loss": -5.681031703948975, "global_step": 34484, "epoch": 821} {"train_loss": -5.605661392211914, "global_step": 34485, "epoch": 821} {"train_loss": -5.442269325256348, "global_step": 34486, "epoch": 821} {"train_loss": -5.488741874694824, "global_step": 34487, "epoch": 821} {"train_loss": -5.5465779304504395, "global_step": 34488, "epoch": 821} {"train_loss": -5.533007621765137, "global_step": 34489, "epoch": 821} {"train_loss": -5.651717185974121, "global_step": 34490, "epoch": 821} {"train_loss": -5.548761367797852, "global_step": 34491, "epoch": 821} {"train_loss": -5.372402191162109, "global_step": 34492, "epoch": 821} {"train_loss": -5.543416976928711, "global_step": 34493, "epoch": 821} {"train_loss": -5.643644332885742, "global_step": 34494, "epoch": 821} {"train_loss": -5.539571762084961, "global_step": 34495, "epoch": 821} {"train_loss": -5.463413238525391, "global_step": 34496, "epoch": 821} {"train_loss": -5.502321243286133, "global_step": 34497, "epoch": 821} {"train_loss": -5.462940692901611, "global_step": 34498, "epoch": 821} {"train_loss": -5.507857799530029, "global_step": 34499, "epoch": 821} {"train_loss": -5.465080261230469, "global_step": 34500, "epoch": 821} {"train_loss": -5.431616306304932, "global_step": 34501, "epoch": 821} {"train_loss": -5.438859939575195, "global_step": 34502, "epoch": 821} {"train_loss": -5.375997066497803, "global_step": 34503, "epoch": 821} {"train_loss": -5.55823278427124, "global_step": 34504, "epoch": 821} {"train_loss": -5.574031829833984, "global_step": 34505, "epoch": 821} {"train_loss": -5.710322380065918, "global_step": 34506, "epoch": 821} {"train_loss": -5.527846336364746, "global_step": 34507, "epoch": 821} {"train_loss": -5.398176193237305, "global_step": 34508, "epoch": 821} {"train_loss": -5.544243812561035, "global_step": 34509, "epoch": 821} {"train_loss": -5.636683464050293, "global_step": 34510, "epoch": 821} {"train_loss": -5.465756416320801, "global_step": 34511, "epoch": 821} {"train_loss": -5.460716724395752, "global_step": 34512, "epoch": 821} {"train_loss": -5.53042459487915, "global_step": 34513, "epoch": 821} {"train_loss": -5.536777973175049, "global_step": 34514, "epoch": 821} {"train_loss": -5.5521111488342285, "global_step": 34515, "epoch": 821} {"train_loss": -5.569401741027832, "global_step": 34516, "epoch": 821} {"train_loss": -5.565907955169678, "global_step": 34517, "epoch": 821} {"train_loss": -5.48505973815918, "global_step": 34518, "epoch": 821} {"train_loss": -5.505544185638428, "global_step": 34519, "epoch": 821} {"train_loss": -5.542121887207031, "global_step": 34520, "epoch": 821} {"train_loss": -5.487933158874512, "global_step": 34521, "epoch": 821} {"train_loss": -5.572861671447754, "global_step": 34522, "epoch": 821} {"train_loss": -5.5207408382779075, "global_step": 34523, "epoch": 821, "val_loss": 66622.296875} {"train_loss": -5.626922607421875, "global_step": 34524, "epoch": 822} {"train_loss": -5.527966499328613, "global_step": 34525, "epoch": 822} {"train_loss": -5.515212535858154, "global_step": 34526, "epoch": 822} {"train_loss": -5.535963535308838, "global_step": 34527, "epoch": 822} {"train_loss": -5.491708755493164, "global_step": 34528, "epoch": 822} {"train_loss": -5.612400054931641, "global_step": 34529, "epoch": 822} {"train_loss": -5.549609184265137, "global_step": 34530, "epoch": 822} {"train_loss": -5.456124305725098, "global_step": 34531, "epoch": 822} {"train_loss": -5.57051944732666, "global_step": 34532, "epoch": 822} {"train_loss": -5.528841972351074, "global_step": 34533, "epoch": 822} {"train_loss": -5.640053749084473, "global_step": 34534, "epoch": 822} {"train_loss": -5.694913864135742, "global_step": 34535, "epoch": 822} {"train_loss": -5.535628318786621, "global_step": 34536, "epoch": 822} {"train_loss": -5.519167900085449, "global_step": 34537, "epoch": 822} {"train_loss": -5.619857311248779, "global_step": 34538, "epoch": 822} {"train_loss": -5.566052436828613, "global_step": 34539, "epoch": 822} {"train_loss": -5.457127094268799, "global_step": 34540, "epoch": 822} {"train_loss": -5.460039138793945, "global_step": 34541, "epoch": 822} {"train_loss": -5.5284318923950195, "global_step": 34542, "epoch": 822} {"train_loss": -5.62048864364624, "global_step": 34543, "epoch": 822} {"train_loss": -5.531923770904541, "global_step": 34544, "epoch": 822} {"train_loss": -5.573816299438477, "global_step": 34545, "epoch": 822} {"train_loss": -5.628592491149902, "global_step": 34546, "epoch": 822} {"train_loss": -5.623467922210693, "global_step": 34547, "epoch": 822} {"train_loss": -5.501666069030762, "global_step": 34548, "epoch": 822} {"train_loss": -5.547636985778809, "global_step": 34549, "epoch": 822} {"train_loss": -5.567880630493164, "global_step": 34550, "epoch": 822} {"train_loss": -5.580202579498291, "global_step": 34551, "epoch": 822} {"train_loss": -5.478726387023926, "global_step": 34552, "epoch": 822} {"train_loss": -5.698829650878906, "global_step": 34553, "epoch": 822} {"train_loss": -5.441262245178223, "global_step": 34554, "epoch": 822} {"train_loss": -5.584364414215088, "global_step": 34555, "epoch": 822} {"train_loss": -5.554302215576172, "global_step": 34556, "epoch": 822} {"train_loss": -5.612848281860352, "global_step": 34557, "epoch": 822} {"train_loss": -5.456141471862793, "global_step": 34558, "epoch": 822} {"train_loss": -5.55864143371582, "global_step": 34559, "epoch": 822} {"train_loss": -5.571523666381836, "global_step": 34560, "epoch": 822} {"train_loss": -5.606507778167725, "global_step": 34561, "epoch": 822} {"train_loss": -5.520203590393066, "global_step": 34562, "epoch": 822} {"train_loss": -5.600353717803955, "global_step": 34563, "epoch": 822} {"train_loss": -5.599826335906982, "global_step": 34564, "epoch": 822} {"train_loss": -5.5561851887475875, "global_step": 34565, "epoch": 822, "val_loss": 66580.6953125} {"train_loss": -5.571897506713867, "global_step": 34566, "epoch": 823} {"train_loss": -5.672056198120117, "global_step": 34567, "epoch": 823} {"train_loss": -5.686017990112305, "global_step": 34568, "epoch": 823} {"train_loss": -5.602019309997559, "global_step": 34569, "epoch": 823} {"train_loss": -5.552794456481934, "global_step": 34570, "epoch": 823} {"train_loss": -5.567420959472656, "global_step": 34571, "epoch": 823} {"train_loss": -5.608672142028809, "global_step": 34572, "epoch": 823} {"train_loss": -5.489086151123047, "global_step": 34573, "epoch": 823} {"train_loss": -5.469915390014648, "global_step": 34574, "epoch": 823} {"train_loss": -5.507834434509277, "global_step": 34575, "epoch": 823} {"train_loss": -5.576656818389893, "global_step": 34576, "epoch": 823} {"train_loss": -5.5535688400268555, "global_step": 34577, "epoch": 823} {"train_loss": -5.603168487548828, "global_step": 34578, "epoch": 823} {"train_loss": -5.5675554275512695, "global_step": 34579, "epoch": 823} {"train_loss": -5.5311503410339355, "global_step": 34580, "epoch": 823} {"train_loss": -5.563817024230957, "global_step": 34581, "epoch": 823} {"train_loss": -5.436912536621094, "global_step": 34582, "epoch": 823} {"train_loss": -5.377684593200684, "global_step": 34583, "epoch": 823} {"train_loss": -5.554868221282959, "global_step": 34584, "epoch": 823} {"train_loss": -5.327528953552246, "global_step": 34585, "epoch": 823} {"train_loss": -5.666360855102539, "global_step": 34586, "epoch": 823} {"train_loss": -5.490654945373535, "global_step": 34587, "epoch": 823} {"train_loss": -5.5428466796875, "global_step": 34588, "epoch": 823} {"train_loss": -5.5640950202941895, "global_step": 34589, "epoch": 823} {"train_loss": -5.492748260498047, "global_step": 34590, "epoch": 823} {"train_loss": -5.583258628845215, "global_step": 34591, "epoch": 823} {"train_loss": -5.581910133361816, "global_step": 34592, "epoch": 823} {"train_loss": -5.5265045166015625, "global_step": 34593, "epoch": 823} {"train_loss": -5.641504287719727, "global_step": 34594, "epoch": 823} {"train_loss": -5.567641258239746, "global_step": 34595, "epoch": 823} {"train_loss": -5.48443603515625, "global_step": 34596, "epoch": 823} {"train_loss": -5.494902610778809, "global_step": 34597, "epoch": 823} {"train_loss": -5.510464191436768, "global_step": 34598, "epoch": 823} {"train_loss": -5.505302429199219, "global_step": 34599, "epoch": 823} {"train_loss": -5.66322135925293, "global_step": 34600, "epoch": 823} {"train_loss": -5.725855827331543, "global_step": 34601, "epoch": 823} {"train_loss": -5.568471908569336, "global_step": 34602, "epoch": 823} {"train_loss": -5.603314399719238, "global_step": 34603, "epoch": 823} {"train_loss": -5.554231643676758, "global_step": 34604, "epoch": 823} {"train_loss": -5.520101070404053, "global_step": 34605, "epoch": 823} {"train_loss": -5.6211838722229, "global_step": 34606, "epoch": 823} {"train_loss": -5.554608186086019, "global_step": 34607, "epoch": 823, "val_loss": 66486.1484375} {"train_loss": -5.552841663360596, "global_step": 34608, "epoch": 824} {"train_loss": -5.643649578094482, "global_step": 34609, "epoch": 824} {"train_loss": -5.565878868103027, "global_step": 34610, "epoch": 824} {"train_loss": -5.400257110595703, "global_step": 34611, "epoch": 824} {"train_loss": -5.548890590667725, "global_step": 34612, "epoch": 824} {"train_loss": -5.575204849243164, "global_step": 34613, "epoch": 824} {"train_loss": -5.606379508972168, "global_step": 34614, "epoch": 824} {"train_loss": -5.5966339111328125, "global_step": 34615, "epoch": 824} {"train_loss": -5.508460998535156, "global_step": 34616, "epoch": 824} {"train_loss": -5.656732082366943, "global_step": 34617, "epoch": 824} {"train_loss": -5.399569034576416, "global_step": 34618, "epoch": 824} {"train_loss": -5.477874279022217, "global_step": 34619, "epoch": 824} {"train_loss": -5.543286323547363, "global_step": 34620, "epoch": 824} {"train_loss": -5.625655174255371, "global_step": 34621, "epoch": 824} {"train_loss": -5.589890003204346, "global_step": 34622, "epoch": 824} {"train_loss": -5.444395065307617, "global_step": 34623, "epoch": 824} {"train_loss": -5.444193363189697, "global_step": 34624, "epoch": 824} {"train_loss": -5.561333656311035, "global_step": 34625, "epoch": 824} {"train_loss": -5.492858409881592, "global_step": 34626, "epoch": 824} {"train_loss": -5.619161605834961, "global_step": 34627, "epoch": 824} {"train_loss": -5.482263565063477, "global_step": 34628, "epoch": 824} {"train_loss": -5.651283264160156, "global_step": 34629, "epoch": 824} {"train_loss": -5.452940464019775, "global_step": 34630, "epoch": 824} {"train_loss": -5.6071295738220215, "global_step": 34631, "epoch": 824} {"train_loss": -5.59106969833374, "global_step": 34632, "epoch": 824} {"train_loss": -5.397518634796143, "global_step": 34633, "epoch": 824} {"train_loss": -5.58507776260376, "global_step": 34634, "epoch": 824} {"train_loss": -5.590763568878174, "global_step": 34635, "epoch": 824} {"train_loss": -5.544144630432129, "global_step": 34636, "epoch": 824} {"train_loss": -5.516202926635742, "global_step": 34637, "epoch": 824} {"train_loss": -5.685625076293945, "global_step": 34638, "epoch": 824} {"train_loss": -5.543612480163574, "global_step": 34639, "epoch": 824} {"train_loss": -5.5116868019104, "global_step": 34640, "epoch": 824} {"train_loss": -5.60727071762085, "global_step": 34641, "epoch": 824} {"train_loss": -5.571791648864746, "global_step": 34642, "epoch": 824} {"train_loss": -5.621697425842285, "global_step": 34643, "epoch": 824} {"train_loss": -5.590429782867432, "global_step": 34644, "epoch": 824} {"train_loss": -5.651557445526123, "global_step": 34645, "epoch": 824} {"train_loss": -5.510576248168945, "global_step": 34646, "epoch": 824} {"train_loss": -5.669193267822266, "global_step": 34647, "epoch": 824} {"train_loss": -5.639201641082764, "global_step": 34648, "epoch": 824} {"train_loss": -5.559654110953922, "global_step": 34649, "epoch": 824, "val_loss": 66211.3984375} {"train_loss": -5.636661052703857, "global_step": 34650, "epoch": 825} {"train_loss": -5.494550704956055, "global_step": 34651, "epoch": 825} {"train_loss": -5.636382579803467, "global_step": 34652, "epoch": 825} {"train_loss": -5.543081283569336, "global_step": 34653, "epoch": 825} {"train_loss": -5.502936840057373, "global_step": 34654, "epoch": 825} {"train_loss": -5.689230918884277, "global_step": 34655, "epoch": 825} {"train_loss": -5.737534046173096, "global_step": 34656, "epoch": 825} {"train_loss": -5.4643144607543945, "global_step": 34657, "epoch": 825} {"train_loss": -5.561147689819336, "global_step": 34658, "epoch": 825} {"train_loss": -5.525702476501465, "global_step": 34659, "epoch": 825} {"train_loss": -5.619700908660889, "global_step": 34660, "epoch": 825} {"train_loss": -5.473188877105713, "global_step": 34661, "epoch": 825} {"train_loss": -5.5444183349609375, "global_step": 34662, "epoch": 825} {"train_loss": -5.344322204589844, "global_step": 34663, "epoch": 825} {"train_loss": -5.508001327514648, "global_step": 34664, "epoch": 825} {"train_loss": -5.622097015380859, "global_step": 34665, "epoch": 825} {"train_loss": -5.543891906738281, "global_step": 34666, "epoch": 825} {"train_loss": -5.6336822509765625, "global_step": 34667, "epoch": 825} {"train_loss": -5.621694564819336, "global_step": 34668, "epoch": 825} {"train_loss": -5.458793640136719, "global_step": 34669, "epoch": 825} {"train_loss": -5.463188171386719, "global_step": 34670, "epoch": 825} {"train_loss": -5.576576232910156, "global_step": 34671, "epoch": 825} {"train_loss": -5.583523750305176, "global_step": 34672, "epoch": 825} {"train_loss": -5.538714408874512, "global_step": 34673, "epoch": 825} {"train_loss": -5.593419075012207, "global_step": 34674, "epoch": 825} {"train_loss": -5.454207420349121, "global_step": 34675, "epoch": 825} {"train_loss": -5.444714546203613, "global_step": 34676, "epoch": 825} {"train_loss": -5.468947410583496, "global_step": 34677, "epoch": 825} {"train_loss": -5.4701948165893555, "global_step": 34678, "epoch": 825} {"train_loss": -5.560210227966309, "global_step": 34679, "epoch": 825} {"train_loss": -5.5154523849487305, "global_step": 34680, "epoch": 825} {"train_loss": -5.698217391967773, "global_step": 34681, "epoch": 825} {"train_loss": -5.538604259490967, "global_step": 34682, "epoch": 825} {"train_loss": -5.468022346496582, "global_step": 34683, "epoch": 825} {"train_loss": -5.649014472961426, "global_step": 34684, "epoch": 825} {"train_loss": -5.552296161651611, "global_step": 34685, "epoch": 825} {"train_loss": -5.418344020843506, "global_step": 34686, "epoch": 825} {"train_loss": -5.496441841125488, "global_step": 34687, "epoch": 825} {"train_loss": -5.488219261169434, "global_step": 34688, "epoch": 825} {"train_loss": -5.671035289764404, "global_step": 34689, "epoch": 825} {"train_loss": -5.403881072998047, "global_step": 34690, "epoch": 825} {"train_loss": -5.541580586206345, "global_step": 34691, "epoch": 825, "val_loss": 66359.1640625} {"train_loss": -5.665721893310547, "global_step": 34692, "epoch": 826} {"train_loss": -5.509912014007568, "global_step": 34693, "epoch": 826} {"train_loss": -5.594679832458496, "global_step": 34694, "epoch": 826} {"train_loss": -5.425205230712891, "global_step": 34695, "epoch": 826} {"train_loss": -5.58022403717041, "global_step": 34696, "epoch": 826} {"train_loss": -5.44962215423584, "global_step": 34697, "epoch": 826} {"train_loss": -5.4740519523620605, "global_step": 34698, "epoch": 826} {"train_loss": -5.269630432128906, "global_step": 34699, "epoch": 826} {"train_loss": -5.525710582733154, "global_step": 34700, "epoch": 826} {"train_loss": -5.46799373626709, "global_step": 34701, "epoch": 826} {"train_loss": -5.305522918701172, "global_step": 34702, "epoch": 826} {"train_loss": -5.460633277893066, "global_step": 34703, "epoch": 826} {"train_loss": -5.490996837615967, "global_step": 34704, "epoch": 826} {"train_loss": -5.550797462463379, "global_step": 34705, "epoch": 826} {"train_loss": -5.497812271118164, "global_step": 34706, "epoch": 826} {"train_loss": -5.511157035827637, "global_step": 34707, "epoch": 826} {"train_loss": -5.680138111114502, "global_step": 34708, "epoch": 826} {"train_loss": -5.340366363525391, "global_step": 34709, "epoch": 826} {"train_loss": -5.54745626449585, "global_step": 34710, "epoch": 826} {"train_loss": -5.466821193695068, "global_step": 34711, "epoch": 826} {"train_loss": -5.549471855163574, "global_step": 34712, "epoch": 826} {"train_loss": -5.662721633911133, "global_step": 34713, "epoch": 826} {"train_loss": -5.588386535644531, "global_step": 34714, "epoch": 826} {"train_loss": -5.519906044006348, "global_step": 34715, "epoch": 826} {"train_loss": -5.4905805587768555, "global_step": 34716, "epoch": 826} {"train_loss": -5.695806503295898, "global_step": 34717, "epoch": 826} {"train_loss": -5.55593204498291, "global_step": 34718, "epoch": 826} {"train_loss": -5.55185604095459, "global_step": 34719, "epoch": 826} {"train_loss": -5.555325508117676, "global_step": 34720, "epoch": 826} {"train_loss": -5.587752819061279, "global_step": 34721, "epoch": 826} {"train_loss": -5.589937686920166, "global_step": 34722, "epoch": 826} {"train_loss": -5.528172016143799, "global_step": 34723, "epoch": 826} {"train_loss": -5.60235595703125, "global_step": 34724, "epoch": 826} {"train_loss": -5.452688217163086, "global_step": 34725, "epoch": 826} {"train_loss": -5.4724531173706055, "global_step": 34726, "epoch": 826} {"train_loss": -5.469615936279297, "global_step": 34727, "epoch": 826} {"train_loss": -5.567563056945801, "global_step": 34728, "epoch": 826} {"train_loss": -5.574031829833984, "global_step": 34729, "epoch": 826} {"train_loss": -5.5030412673950195, "global_step": 34730, "epoch": 826} {"train_loss": -5.5892109870910645, "global_step": 34731, "epoch": 826} {"train_loss": -5.620125770568848, "global_step": 34732, "epoch": 826} {"train_loss": -5.525276365734282, "global_step": 34733, "epoch": 826, "val_loss": 66203.265625} {"train_loss": -5.551227569580078, "global_step": 34734, "epoch": 827} {"train_loss": -5.526561260223389, "global_step": 34735, "epoch": 827} {"train_loss": -5.520190238952637, "global_step": 34736, "epoch": 827} {"train_loss": -5.474140644073486, "global_step": 34737, "epoch": 827} {"train_loss": -5.600491523742676, "global_step": 34738, "epoch": 827} {"train_loss": -5.630127906799316, "global_step": 34739, "epoch": 827} {"train_loss": -5.6789445877075195, "global_step": 34740, "epoch": 827} {"train_loss": -5.613042831420898, "global_step": 34741, "epoch": 827} {"train_loss": -5.473406791687012, "global_step": 34742, "epoch": 827} {"train_loss": -5.455781936645508, "global_step": 34743, "epoch": 827} {"train_loss": -5.597879409790039, "global_step": 34744, "epoch": 827} {"train_loss": -5.57822847366333, "global_step": 34745, "epoch": 827} {"train_loss": -5.458979606628418, "global_step": 34746, "epoch": 827} {"train_loss": -5.513232231140137, "global_step": 34747, "epoch": 827} {"train_loss": -5.561211585998535, "global_step": 34748, "epoch": 827} {"train_loss": -5.493240833282471, "global_step": 34749, "epoch": 827} {"train_loss": -5.52174711227417, "global_step": 34750, "epoch": 827} {"train_loss": -5.486954689025879, "global_step": 34751, "epoch": 827} {"train_loss": -5.620523452758789, "global_step": 34752, "epoch": 827} {"train_loss": -5.422391891479492, "global_step": 34753, "epoch": 827} {"train_loss": -5.603608131408691, "global_step": 34754, "epoch": 827} {"train_loss": -5.441976547241211, "global_step": 34755, "epoch": 827} {"train_loss": -5.483470916748047, "global_step": 34756, "epoch": 827} {"train_loss": -5.488870620727539, "global_step": 34757, "epoch": 827} {"train_loss": -5.596789360046387, "global_step": 34758, "epoch": 827} {"train_loss": -5.501049041748047, "global_step": 34759, "epoch": 827} {"train_loss": -5.557540416717529, "global_step": 34760, "epoch": 827} {"train_loss": -5.495107650756836, "global_step": 34761, "epoch": 827} {"train_loss": -5.5314836502075195, "global_step": 34762, "epoch": 827} {"train_loss": -5.6108293533325195, "global_step": 34763, "epoch": 827} {"train_loss": -5.60420036315918, "global_step": 34764, "epoch": 827} {"train_loss": -5.5936479568481445, "global_step": 34765, "epoch": 827} {"train_loss": -5.539736270904541, "global_step": 34766, "epoch": 827} {"train_loss": -5.593005657196045, "global_step": 34767, "epoch": 827} {"train_loss": -5.638820171356201, "global_step": 34768, "epoch": 827} {"train_loss": -5.629619121551514, "global_step": 34769, "epoch": 827} {"train_loss": -5.483619213104248, "global_step": 34770, "epoch": 827} {"train_loss": -5.594559669494629, "global_step": 34771, "epoch": 827} {"train_loss": -5.571495056152344, "global_step": 34772, "epoch": 827} {"train_loss": -5.613615989685059, "global_step": 34773, "epoch": 827} {"train_loss": -5.573946952819824, "global_step": 34774, "epoch": 827} {"train_loss": -5.5509686924162365, "global_step": 34775, "epoch": 827, "val_loss": 66227.4921875} {"train_loss": -5.610231399536133, "global_step": 34776, "epoch": 828} {"train_loss": -5.646434307098389, "global_step": 34777, "epoch": 828} {"train_loss": -5.5615434646606445, "global_step": 34778, "epoch": 828} {"train_loss": -5.6412248611450195, "global_step": 34779, "epoch": 828} {"train_loss": -5.5785417556762695, "global_step": 34780, "epoch": 828} {"train_loss": -5.516216278076172, "global_step": 34781, "epoch": 828} {"train_loss": -5.641489028930664, "global_step": 34782, "epoch": 828} {"train_loss": -5.564064025878906, "global_step": 34783, "epoch": 828} {"train_loss": -5.577324867248535, "global_step": 34784, "epoch": 828} {"train_loss": -5.465076446533203, "global_step": 34785, "epoch": 828} {"train_loss": -5.464022636413574, "global_step": 34786, "epoch": 828} {"train_loss": -5.573670864105225, "global_step": 34787, "epoch": 828} {"train_loss": -5.601361274719238, "global_step": 34788, "epoch": 828} {"train_loss": -5.426759243011475, "global_step": 34789, "epoch": 828} {"train_loss": -5.619040489196777, "global_step": 34790, "epoch": 828} {"train_loss": -5.490860939025879, "global_step": 34791, "epoch": 828} {"train_loss": -5.666486740112305, "global_step": 34792, "epoch": 828} {"train_loss": -5.6465935707092285, "global_step": 34793, "epoch": 828} {"train_loss": -5.431091785430908, "global_step": 34794, "epoch": 828} {"train_loss": -5.622122287750244, "global_step": 34795, "epoch": 828} {"train_loss": -5.653802871704102, "global_step": 34796, "epoch": 828} {"train_loss": -5.6017351150512695, "global_step": 34797, "epoch": 828} {"train_loss": -5.622664451599121, "global_step": 34798, "epoch": 828} {"train_loss": -5.6089324951171875, "global_step": 34799, "epoch": 828} {"train_loss": -5.521839141845703, "global_step": 34800, "epoch": 828} {"train_loss": -5.490074157714844, "global_step": 34801, "epoch": 828} {"train_loss": -5.584585189819336, "global_step": 34802, "epoch": 828} {"train_loss": -5.667995452880859, "global_step": 34803, "epoch": 828} {"train_loss": -5.475174903869629, "global_step": 34804, "epoch": 828} {"train_loss": -5.486954689025879, "global_step": 34805, "epoch": 828} {"train_loss": -5.487181663513184, "global_step": 34806, "epoch": 828} {"train_loss": -5.587936878204346, "global_step": 34807, "epoch": 828} {"train_loss": -5.529458045959473, "global_step": 34808, "epoch": 828} {"train_loss": -5.679571628570557, "global_step": 34809, "epoch": 828} {"train_loss": -5.5113115310668945, "global_step": 34810, "epoch": 828} {"train_loss": -5.4633331298828125, "global_step": 34811, "epoch": 828} {"train_loss": -5.713129043579102, "global_step": 34812, "epoch": 828} {"train_loss": -5.611248016357422, "global_step": 34813, "epoch": 828} {"train_loss": -5.443094253540039, "global_step": 34814, "epoch": 828} {"train_loss": -5.452664375305176, "global_step": 34815, "epoch": 828} {"train_loss": -5.474900722503662, "global_step": 34816, "epoch": 828} {"train_loss": -5.557760374886649, "global_step": 34817, "epoch": 828, "val_loss": 66515.7890625} {"train_loss": -5.591131210327148, "global_step": 34818, "epoch": 829} {"train_loss": -5.712343692779541, "global_step": 34819, "epoch": 829} {"train_loss": -5.467466354370117, "global_step": 34820, "epoch": 829} {"train_loss": -5.54598331451416, "global_step": 34821, "epoch": 829} {"train_loss": -5.602972984313965, "global_step": 34822, "epoch": 829} {"train_loss": -5.595820426940918, "global_step": 34823, "epoch": 829} {"train_loss": -5.436433792114258, "global_step": 34824, "epoch": 829} {"train_loss": -5.651246070861816, "global_step": 34825, "epoch": 829} {"train_loss": -5.499099254608154, "global_step": 34826, "epoch": 829} {"train_loss": -5.487563133239746, "global_step": 34827, "epoch": 829} {"train_loss": -5.561550140380859, "global_step": 34828, "epoch": 829} {"train_loss": -5.455212116241455, "global_step": 34829, "epoch": 829} {"train_loss": -5.488217830657959, "global_step": 34830, "epoch": 829} {"train_loss": -5.3661088943481445, "global_step": 34831, "epoch": 829} {"train_loss": -5.524744033813477, "global_step": 34832, "epoch": 829} {"train_loss": -5.459201335906982, "global_step": 34833, "epoch": 829} {"train_loss": -5.638691425323486, "global_step": 34834, "epoch": 829} {"train_loss": -5.5584821701049805, "global_step": 34835, "epoch": 829} {"train_loss": -5.592196464538574, "global_step": 34836, "epoch": 829} {"train_loss": -5.507491111755371, "global_step": 34837, "epoch": 829} {"train_loss": -5.447915077209473, "global_step": 34838, "epoch": 829} {"train_loss": -5.495043754577637, "global_step": 34839, "epoch": 829} {"train_loss": -5.402039527893066, "global_step": 34840, "epoch": 829} {"train_loss": -5.645054817199707, "global_step": 34841, "epoch": 829} {"train_loss": -5.574906826019287, "global_step": 34842, "epoch": 829} {"train_loss": -5.492341041564941, "global_step": 34843, "epoch": 829} {"train_loss": -5.5361223220825195, "global_step": 34844, "epoch": 829} {"train_loss": -5.472712516784668, "global_step": 34845, "epoch": 829} {"train_loss": -5.478585243225098, "global_step": 34846, "epoch": 829} {"train_loss": -5.566144943237305, "global_step": 34847, "epoch": 829} {"train_loss": -5.652432441711426, "global_step": 34848, "epoch": 829} {"train_loss": -5.494973182678223, "global_step": 34849, "epoch": 829} {"train_loss": -5.414397239685059, "global_step": 34850, "epoch": 829} {"train_loss": -5.469582557678223, "global_step": 34851, "epoch": 829} {"train_loss": -5.630698204040527, "global_step": 34852, "epoch": 829} {"train_loss": -5.563056945800781, "global_step": 34853, "epoch": 829} {"train_loss": -5.560876846313477, "global_step": 34854, "epoch": 829} {"train_loss": -5.4950270652771, "global_step": 34855, "epoch": 829} {"train_loss": -5.567840576171875, "global_step": 34856, "epoch": 829} {"train_loss": -5.507293224334717, "global_step": 34857, "epoch": 829} {"train_loss": -5.598336219787598, "global_step": 34858, "epoch": 829} {"train_loss": -5.5313844453720815, "global_step": 34859, "epoch": 829, "val_loss": 66619.53125} {"train_loss": -5.628190040588379, "global_step": 34860, "epoch": 830} {"train_loss": -5.670419692993164, "global_step": 34861, "epoch": 830} {"train_loss": -5.470357894897461, "global_step": 34862, "epoch": 830} {"train_loss": -5.481606960296631, "global_step": 34863, "epoch": 830} {"train_loss": -5.487068176269531, "global_step": 34864, "epoch": 830} {"train_loss": -5.454967498779297, "global_step": 34865, "epoch": 830} {"train_loss": -5.725776672363281, "global_step": 34866, "epoch": 830} {"train_loss": -5.71898078918457, "global_step": 34867, "epoch": 830} {"train_loss": -5.689209938049316, "global_step": 34868, "epoch": 830} {"train_loss": -5.60604190826416, "global_step": 34869, "epoch": 830} {"train_loss": -5.537496089935303, "global_step": 34870, "epoch": 830} {"train_loss": -5.530077934265137, "global_step": 34871, "epoch": 830} {"train_loss": -5.73569393157959, "global_step": 34872, "epoch": 830} {"train_loss": -5.563279151916504, "global_step": 34873, "epoch": 830} {"train_loss": -5.679399013519287, "global_step": 34874, "epoch": 830} {"train_loss": -5.637771129608154, "global_step": 34875, "epoch": 830} {"train_loss": -5.460329055786133, "global_step": 34876, "epoch": 830} {"train_loss": -5.518911361694336, "global_step": 34877, "epoch": 830} {"train_loss": -5.532052993774414, "global_step": 34878, "epoch": 830} {"train_loss": -5.572048187255859, "global_step": 34879, "epoch": 830} {"train_loss": -5.619797706604004, "global_step": 34880, "epoch": 830} {"train_loss": -5.583342552185059, "global_step": 34881, "epoch": 830} {"train_loss": -5.690908432006836, "global_step": 34882, "epoch": 830} {"train_loss": -5.575780868530273, "global_step": 34883, "epoch": 830} {"train_loss": -5.5464911460876465, "global_step": 34884, "epoch": 830} {"train_loss": -5.537801265716553, "global_step": 34885, "epoch": 830} {"train_loss": -5.460061073303223, "global_step": 34886, "epoch": 830} {"train_loss": -5.448907852172852, "global_step": 34887, "epoch": 830} {"train_loss": -5.617120742797852, "global_step": 34888, "epoch": 830} {"train_loss": -5.441924095153809, "global_step": 34889, "epoch": 830} {"train_loss": -5.337626934051514, "global_step": 34890, "epoch": 830} {"train_loss": -5.546660900115967, "global_step": 34891, "epoch": 830} {"train_loss": -5.50234842300415, "global_step": 34892, "epoch": 830} {"train_loss": -5.6153082847595215, "global_step": 34893, "epoch": 830} {"train_loss": -5.558516502380371, "global_step": 34894, "epoch": 830} {"train_loss": -5.475070476531982, "global_step": 34895, "epoch": 830} {"train_loss": -5.604154109954834, "global_step": 34896, "epoch": 830} {"train_loss": -5.681262493133545, "global_step": 34897, "epoch": 830} {"train_loss": -5.521915912628174, "global_step": 34898, "epoch": 830} {"train_loss": -5.602562427520752, "global_step": 34899, "epoch": 830} {"train_loss": -5.612405300140381, "global_step": 34900, "epoch": 830} {"train_loss": -5.56942571912493, "global_step": 34901, "epoch": 830, "val_loss": 66058.0390625} {"train_loss": -5.64540958404541, "global_step": 34902, "epoch": 831} {"train_loss": -5.581843376159668, "global_step": 34903, "epoch": 831} {"train_loss": -5.45706844329834, "global_step": 34904, "epoch": 831} {"train_loss": -5.543375015258789, "global_step": 34905, "epoch": 831} {"train_loss": -5.489935874938965, "global_step": 34906, "epoch": 831} {"train_loss": -5.593050956726074, "global_step": 34907, "epoch": 831} {"train_loss": -5.619602203369141, "global_step": 34908, "epoch": 831} {"train_loss": -5.574666976928711, "global_step": 34909, "epoch": 831} {"train_loss": -5.506223678588867, "global_step": 34910, "epoch": 831} {"train_loss": -5.636773109436035, "global_step": 34911, "epoch": 831} {"train_loss": -5.501700401306152, "global_step": 34912, "epoch": 831} {"train_loss": -5.532740592956543, "global_step": 34913, "epoch": 831} {"train_loss": -5.6564788818359375, "global_step": 34914, "epoch": 831} {"train_loss": -5.550620079040527, "global_step": 34915, "epoch": 831} {"train_loss": -5.490302562713623, "global_step": 34916, "epoch": 831} {"train_loss": -5.565499782562256, "global_step": 34917, "epoch": 831} {"train_loss": -5.492245197296143, "global_step": 34918, "epoch": 831} {"train_loss": -5.57385778427124, "global_step": 34919, "epoch": 831} {"train_loss": -5.596857070922852, "global_step": 34920, "epoch": 831} {"train_loss": -5.548625946044922, "global_step": 34921, "epoch": 831} {"train_loss": -5.5165019035339355, "global_step": 34922, "epoch": 831} {"train_loss": -5.427438259124756, "global_step": 34923, "epoch": 831} {"train_loss": -5.619134902954102, "global_step": 34924, "epoch": 831} {"train_loss": -5.505695343017578, "global_step": 34925, "epoch": 831} {"train_loss": -5.33614444732666, "global_step": 34926, "epoch": 831} {"train_loss": -5.663724899291992, "global_step": 34927, "epoch": 831} {"train_loss": -5.398914337158203, "global_step": 34928, "epoch": 831} {"train_loss": -5.5573954582214355, "global_step": 34929, "epoch": 831} {"train_loss": -5.497502326965332, "global_step": 34930, "epoch": 831} {"train_loss": -5.550278663635254, "global_step": 34931, "epoch": 831} {"train_loss": -5.567023754119873, "global_step": 34932, "epoch": 831} {"train_loss": -5.55850887298584, "global_step": 34933, "epoch": 831} {"train_loss": -5.585047721862793, "global_step": 34934, "epoch": 831} {"train_loss": -5.4419074058532715, "global_step": 34935, "epoch": 831} {"train_loss": -5.532462120056152, "global_step": 34936, "epoch": 831} {"train_loss": -5.596081733703613, "global_step": 34937, "epoch": 831} {"train_loss": -5.6022772789001465, "global_step": 34938, "epoch": 831} {"train_loss": -5.539999008178711, "global_step": 34939, "epoch": 831} {"train_loss": -5.470393180847168, "global_step": 34940, "epoch": 831} {"train_loss": -5.400209903717041, "global_step": 34941, "epoch": 831} {"train_loss": -5.4870123863220215, "global_step": 34942, "epoch": 831} {"train_loss": -5.535254455748058, "global_step": 34943, "epoch": 831, "val_loss": 66427.5859375} {"train_loss": -5.583559036254883, "global_step": 34944, "epoch": 832} {"train_loss": -5.549893856048584, "global_step": 34945, "epoch": 832} {"train_loss": -5.57625675201416, "global_step": 34946, "epoch": 832} {"train_loss": -5.538552284240723, "global_step": 34947, "epoch": 832} {"train_loss": -5.676207542419434, "global_step": 34948, "epoch": 832} {"train_loss": -5.621695518493652, "global_step": 34949, "epoch": 832} {"train_loss": -5.540188789367676, "global_step": 34950, "epoch": 832} {"train_loss": -5.623821258544922, "global_step": 34951, "epoch": 832} {"train_loss": -5.575233459472656, "global_step": 34952, "epoch": 832} {"train_loss": -5.649141311645508, "global_step": 34953, "epoch": 832} {"train_loss": -5.431291103363037, "global_step": 34954, "epoch": 832} {"train_loss": -5.51786470413208, "global_step": 34955, "epoch": 832} {"train_loss": -5.610428810119629, "global_step": 34956, "epoch": 832} {"train_loss": -5.500555038452148, "global_step": 34957, "epoch": 832} {"train_loss": -5.582850933074951, "global_step": 34958, "epoch": 832} {"train_loss": -5.503500461578369, "global_step": 34959, "epoch": 832} {"train_loss": -5.7028889656066895, "global_step": 34960, "epoch": 832} {"train_loss": -5.5736260414123535, "global_step": 34961, "epoch": 832} {"train_loss": -5.550790309906006, "global_step": 34962, "epoch": 832} {"train_loss": -5.590350151062012, "global_step": 34963, "epoch": 832} {"train_loss": -5.5717644691467285, "global_step": 34964, "epoch": 832} {"train_loss": -5.518063068389893, "global_step": 34965, "epoch": 832} {"train_loss": -5.540287971496582, "global_step": 34966, "epoch": 832} {"train_loss": -5.504220962524414, "global_step": 34967, "epoch": 832} {"train_loss": -5.559752941131592, "global_step": 34968, "epoch": 832} {"train_loss": -5.514316558837891, "global_step": 34969, "epoch": 832} {"train_loss": -5.607571601867676, "global_step": 34970, "epoch": 832} {"train_loss": -5.659002304077148, "global_step": 34971, "epoch": 832} {"train_loss": -5.525830268859863, "global_step": 34972, "epoch": 832} {"train_loss": -5.507393836975098, "global_step": 34973, "epoch": 832} {"train_loss": -5.49641227722168, "global_step": 34974, "epoch": 832} {"train_loss": -5.586080551147461, "global_step": 34975, "epoch": 832} {"train_loss": -5.668089389801025, "global_step": 34976, "epoch": 832} {"train_loss": -5.5986528396606445, "global_step": 34977, "epoch": 832} {"train_loss": -5.613466739654541, "global_step": 34978, "epoch": 832} {"train_loss": -5.569716930389404, "global_step": 34979, "epoch": 832} {"train_loss": -5.687314987182617, "global_step": 34980, "epoch": 832} {"train_loss": -5.619663238525391, "global_step": 34981, "epoch": 832} {"train_loss": -5.577108383178711, "global_step": 34982, "epoch": 832} {"train_loss": -5.53587007522583, "global_step": 34983, "epoch": 832} {"train_loss": -5.512333869934082, "global_step": 34984, "epoch": 832} {"train_loss": -5.572350433894566, "global_step": 34985, "epoch": 832, "val_loss": 66448.4609375} {"train_loss": -5.609905242919922, "global_step": 34986, "epoch": 833} {"train_loss": -5.5142083168029785, "global_step": 34987, "epoch": 833} {"train_loss": -5.570754051208496, "global_step": 34988, "epoch": 833} {"train_loss": -5.635073661804199, "global_step": 34989, "epoch": 833} {"train_loss": -5.57523250579834, "global_step": 34990, "epoch": 833} {"train_loss": -5.441485404968262, "global_step": 34991, "epoch": 833} {"train_loss": -5.523558616638184, "global_step": 34992, "epoch": 833} {"train_loss": -5.5925188064575195, "global_step": 34993, "epoch": 833} {"train_loss": -5.570345401763916, "global_step": 34994, "epoch": 833} {"train_loss": -5.543127059936523, "global_step": 34995, "epoch": 833} {"train_loss": -5.6334228515625, "global_step": 34996, "epoch": 833} {"train_loss": -5.512136459350586, "global_step": 34997, "epoch": 833} {"train_loss": -5.616857528686523, "global_step": 34998, "epoch": 833} {"train_loss": -5.534282684326172, "global_step": 34999, "epoch": 833} {"train_loss": -5.507390022277832, "global_step": 35000, "epoch": 833} {"train_loss": -5.50658655166626, "global_step": 35001, "epoch": 833} {"train_loss": -5.489527702331543, "global_step": 35002, "epoch": 833} {"train_loss": -5.55704402923584, "global_step": 35003, "epoch": 833} {"train_loss": -5.641949653625488, "global_step": 35004, "epoch": 833} {"train_loss": -5.612285614013672, "global_step": 35005, "epoch": 833} {"train_loss": -5.477128982543945, "global_step": 35006, "epoch": 833} {"train_loss": -5.6015825271606445, "global_step": 35007, "epoch": 833} {"train_loss": -5.505557060241699, "global_step": 35008, "epoch": 833} {"train_loss": -5.534296989440918, "global_step": 35009, "epoch": 833} {"train_loss": -5.612664222717285, "global_step": 35010, "epoch": 833} {"train_loss": -5.535984516143799, "global_step": 35011, "epoch": 833} {"train_loss": -5.487200736999512, "global_step": 35012, "epoch": 833} {"train_loss": -5.61070442199707, "global_step": 35013, "epoch": 833} {"train_loss": -5.400155067443848, "global_step": 35014, "epoch": 833} {"train_loss": -5.4627861976623535, "global_step": 35015, "epoch": 833} {"train_loss": -5.354549407958984, "global_step": 35016, "epoch": 833} {"train_loss": -5.5116801261901855, "global_step": 35017, "epoch": 833} {"train_loss": -5.502321243286133, "global_step": 35018, "epoch": 833} {"train_loss": -5.495458602905273, "global_step": 35019, "epoch": 833} {"train_loss": -5.518184661865234, "global_step": 35020, "epoch": 833} {"train_loss": -5.433704376220703, "global_step": 35021, "epoch": 833} {"train_loss": -5.440752029418945, "global_step": 35022, "epoch": 833} {"train_loss": -5.483686447143555, "global_step": 35023, "epoch": 833} {"train_loss": -5.492408752441406, "global_step": 35024, "epoch": 833} {"train_loss": -5.487397193908691, "global_step": 35025, "epoch": 833} {"train_loss": -5.479803085327148, "global_step": 35026, "epoch": 833} {"train_loss": -5.525677556083316, "global_step": 35027, "epoch": 833, "val_loss": 66134.28125} {"train_loss": -5.534056663513184, "global_step": 35028, "epoch": 834} {"train_loss": -5.50528621673584, "global_step": 35029, "epoch": 834} {"train_loss": -5.562929153442383, "global_step": 35030, "epoch": 834} {"train_loss": -5.605759143829346, "global_step": 35031, "epoch": 834} {"train_loss": -5.4441819190979, "global_step": 35032, "epoch": 834} {"train_loss": -5.614795207977295, "global_step": 35033, "epoch": 834} {"train_loss": -5.596583366394043, "global_step": 35034, "epoch": 834} {"train_loss": -5.574328422546387, "global_step": 35035, "epoch": 834} {"train_loss": -5.586943626403809, "global_step": 35036, "epoch": 834} {"train_loss": -5.3874640464782715, "global_step": 35037, "epoch": 834} {"train_loss": -5.584448337554932, "global_step": 35038, "epoch": 834} {"train_loss": -5.62672233581543, "global_step": 35039, "epoch": 834} {"train_loss": -5.426465034484863, "global_step": 35040, "epoch": 834} {"train_loss": -5.52388334274292, "global_step": 35041, "epoch": 834} {"train_loss": -5.562807083129883, "global_step": 35042, "epoch": 834} {"train_loss": -5.570186614990234, "global_step": 35043, "epoch": 834} {"train_loss": -5.559178829193115, "global_step": 35044, "epoch": 834} {"train_loss": -5.528598785400391, "global_step": 35045, "epoch": 834} {"train_loss": -5.6106719970703125, "global_step": 35046, "epoch": 834} {"train_loss": -5.710316181182861, "global_step": 35047, "epoch": 834} {"train_loss": -5.371874809265137, "global_step": 35048, "epoch": 834} {"train_loss": -5.397327423095703, "global_step": 35049, "epoch": 834} {"train_loss": -5.539556503295898, "global_step": 35050, "epoch": 834} {"train_loss": -5.415498733520508, "global_step": 35051, "epoch": 834} {"train_loss": -5.423994541168213, "global_step": 35052, "epoch": 834} {"train_loss": -5.5633344650268555, "global_step": 35053, "epoch": 834} {"train_loss": -5.469584941864014, "global_step": 35054, "epoch": 834} {"train_loss": -5.5464186668396, "global_step": 35055, "epoch": 834} {"train_loss": -5.576683044433594, "global_step": 35056, "epoch": 834} {"train_loss": -5.461519718170166, "global_step": 35057, "epoch": 834} {"train_loss": -5.572772979736328, "global_step": 35058, "epoch": 834} {"train_loss": -5.617066383361816, "global_step": 35059, "epoch": 834} {"train_loss": -5.564952850341797, "global_step": 35060, "epoch": 834} {"train_loss": -5.46888542175293, "global_step": 35061, "epoch": 834} {"train_loss": -5.637091159820557, "global_step": 35062, "epoch": 834} {"train_loss": -5.658367156982422, "global_step": 35063, "epoch": 834} {"train_loss": -5.519165992736816, "global_step": 35064, "epoch": 834} {"train_loss": -5.509766101837158, "global_step": 35065, "epoch": 834} {"train_loss": -5.481916904449463, "global_step": 35066, "epoch": 834} {"train_loss": -5.538427829742432, "global_step": 35067, "epoch": 834} {"train_loss": -5.543203353881836, "global_step": 35068, "epoch": 834} {"train_loss": -5.533976520810809, "global_step": 35069, "epoch": 834, "val_loss": 66875.5546875} {"train_loss": -5.555194854736328, "global_step": 35070, "epoch": 835} {"train_loss": -5.48604154586792, "global_step": 35071, "epoch": 835} {"train_loss": -5.5156965255737305, "global_step": 35072, "epoch": 835} {"train_loss": -5.5174713134765625, "global_step": 35073, "epoch": 835} {"train_loss": -5.63496208190918, "global_step": 35074, "epoch": 835} {"train_loss": -5.525876522064209, "global_step": 35075, "epoch": 835} {"train_loss": -5.567482948303223, "global_step": 35076, "epoch": 835} {"train_loss": -5.56516695022583, "global_step": 35077, "epoch": 835} {"train_loss": -5.532505989074707, "global_step": 35078, "epoch": 835} {"train_loss": -5.6114630699157715, "global_step": 35079, "epoch": 835} {"train_loss": -5.651725769042969, "global_step": 35080, "epoch": 835} {"train_loss": -5.580672264099121, "global_step": 35081, "epoch": 835} {"train_loss": -5.644832134246826, "global_step": 35082, "epoch": 835} {"train_loss": -5.610523223876953, "global_step": 35083, "epoch": 835} {"train_loss": -5.496942520141602, "global_step": 35084, "epoch": 835} {"train_loss": -5.583260536193848, "global_step": 35085, "epoch": 835} {"train_loss": -5.539944648742676, "global_step": 35086, "epoch": 835} {"train_loss": -5.528665542602539, "global_step": 35087, "epoch": 835} {"train_loss": -5.5541791915893555, "global_step": 35088, "epoch": 835} {"train_loss": -5.6102705001831055, "global_step": 35089, "epoch": 835} {"train_loss": -5.530485153198242, "global_step": 35090, "epoch": 835} {"train_loss": -5.564543724060059, "global_step": 35091, "epoch": 835} {"train_loss": -5.4995646476745605, "global_step": 35092, "epoch": 835} {"train_loss": -5.4437150955200195, "global_step": 35093, "epoch": 835} {"train_loss": -5.557758331298828, "global_step": 35094, "epoch": 835} {"train_loss": -5.709979057312012, "global_step": 35095, "epoch": 835} {"train_loss": -5.504383087158203, "global_step": 35096, "epoch": 835} {"train_loss": -5.451045513153076, "global_step": 35097, "epoch": 835} {"train_loss": -5.6090288162231445, "global_step": 35098, "epoch": 835} {"train_loss": -5.646546363830566, "global_step": 35099, "epoch": 835} {"train_loss": -5.599160194396973, "global_step": 35100, "epoch": 835} {"train_loss": -5.610556602478027, "global_step": 35101, "epoch": 835} {"train_loss": -5.550957679748535, "global_step": 35102, "epoch": 835} {"train_loss": -5.486567497253418, "global_step": 35103, "epoch": 835} {"train_loss": -5.54229736328125, "global_step": 35104, "epoch": 835} {"train_loss": -5.546843528747559, "global_step": 35105, "epoch": 835} {"train_loss": -5.687551021575928, "global_step": 35106, "epoch": 835} {"train_loss": -5.6161346435546875, "global_step": 35107, "epoch": 835} {"train_loss": -5.40570068359375, "global_step": 35108, "epoch": 835} {"train_loss": -5.622377872467041, "global_step": 35109, "epoch": 835} {"train_loss": -5.68356990814209, "global_step": 35110, "epoch": 835} {"train_loss": -5.563769397281465, "global_step": 35111, "epoch": 835, "val_loss": 66041.375} {"train_loss": -5.57432746887207, "global_step": 35112, "epoch": 836} {"train_loss": -5.599938869476318, "global_step": 35113, "epoch": 836} {"train_loss": -5.489465713500977, "global_step": 35114, "epoch": 836} {"train_loss": -5.545565605163574, "global_step": 35115, "epoch": 836} {"train_loss": -5.502111434936523, "global_step": 35116, "epoch": 836} {"train_loss": -5.546997547149658, "global_step": 35117, "epoch": 836} {"train_loss": -5.665897369384766, "global_step": 35118, "epoch": 836} {"train_loss": -5.701169013977051, "global_step": 35119, "epoch": 836} {"train_loss": -5.623003005981445, "global_step": 35120, "epoch": 836} {"train_loss": -5.60207462310791, "global_step": 35121, "epoch": 836} {"train_loss": -5.610832214355469, "global_step": 35122, "epoch": 836} {"train_loss": -5.638928413391113, "global_step": 35123, "epoch": 836} {"train_loss": -5.542514801025391, "global_step": 35124, "epoch": 836} {"train_loss": -5.569669723510742, "global_step": 35125, "epoch": 836} {"train_loss": -5.590251922607422, "global_step": 35126, "epoch": 836} {"train_loss": -5.616403579711914, "global_step": 35127, "epoch": 836} {"train_loss": -5.575109004974365, "global_step": 35128, "epoch": 836} {"train_loss": -5.386250972747803, "global_step": 35129, "epoch": 836} {"train_loss": -5.473735809326172, "global_step": 35130, "epoch": 836} {"train_loss": -5.487531661987305, "global_step": 35131, "epoch": 836} {"train_loss": -5.488961219787598, "global_step": 35132, "epoch": 836} {"train_loss": -5.46612548828125, "global_step": 35133, "epoch": 836} {"train_loss": -5.404621601104736, "global_step": 35134, "epoch": 836} {"train_loss": -5.588204383850098, "global_step": 35135, "epoch": 836} {"train_loss": -5.63137149810791, "global_step": 35136, "epoch": 836} {"train_loss": -5.622130393981934, "global_step": 35137, "epoch": 836} {"train_loss": -5.629227161407471, "global_step": 35138, "epoch": 836} {"train_loss": -5.52249002456665, "global_step": 35139, "epoch": 836} {"train_loss": -5.4811248779296875, "global_step": 35140, "epoch": 836} {"train_loss": -5.4935994148254395, "global_step": 35141, "epoch": 836} {"train_loss": -5.495965957641602, "global_step": 35142, "epoch": 836} {"train_loss": -5.547992706298828, "global_step": 35143, "epoch": 836} {"train_loss": -5.678143501281738, "global_step": 35144, "epoch": 836} {"train_loss": -5.512960433959961, "global_step": 35145, "epoch": 836} {"train_loss": -5.529595375061035, "global_step": 35146, "epoch": 836} {"train_loss": -5.440058708190918, "global_step": 35147, "epoch": 836} {"train_loss": -5.612689971923828, "global_step": 35148, "epoch": 836} {"train_loss": -5.3896918296813965, "global_step": 35149, "epoch": 836} {"train_loss": -5.480706214904785, "global_step": 35150, "epoch": 836} {"train_loss": -5.52322244644165, "global_step": 35151, "epoch": 836} {"train_loss": -5.486377239227295, "global_step": 35152, "epoch": 836} {"train_loss": -5.541985307421003, "global_step": 35153, "epoch": 836, "val_loss": 66287.046875} {"train_loss": -5.517164707183838, "global_step": 35154, "epoch": 837} {"train_loss": -5.468978404998779, "global_step": 35155, "epoch": 837} {"train_loss": -5.564784049987793, "global_step": 35156, "epoch": 837} {"train_loss": -5.387369632720947, "global_step": 35157, "epoch": 837} {"train_loss": -5.503256797790527, "global_step": 35158, "epoch": 837} {"train_loss": -5.498660087585449, "global_step": 35159, "epoch": 837} {"train_loss": -5.454007148742676, "global_step": 35160, "epoch": 837} {"train_loss": -5.626102447509766, "global_step": 35161, "epoch": 837} {"train_loss": -5.52142333984375, "global_step": 35162, "epoch": 837} {"train_loss": -5.50767183303833, "global_step": 35163, "epoch": 837} {"train_loss": -5.664137840270996, "global_step": 35164, "epoch": 837} {"train_loss": -5.541681289672852, "global_step": 35165, "epoch": 837} {"train_loss": -5.559103965759277, "global_step": 35166, "epoch": 837} {"train_loss": -5.498751163482666, "global_step": 35167, "epoch": 837} {"train_loss": -5.529960632324219, "global_step": 35168, "epoch": 837} {"train_loss": -5.667326927185059, "global_step": 35169, "epoch": 837} {"train_loss": -5.615207672119141, "global_step": 35170, "epoch": 837} {"train_loss": -5.485713481903076, "global_step": 35171, "epoch": 837} {"train_loss": -5.674324989318848, "global_step": 35172, "epoch": 837} {"train_loss": -5.427870750427246, "global_step": 35173, "epoch": 837} {"train_loss": -5.399868011474609, "global_step": 35174, "epoch": 837} {"train_loss": -5.546510696411133, "global_step": 35175, "epoch": 837} {"train_loss": -5.522186279296875, "global_step": 35176, "epoch": 837} {"train_loss": -5.593348503112793, "global_step": 35177, "epoch": 837} {"train_loss": -5.434428691864014, "global_step": 35178, "epoch": 837} {"train_loss": -5.516184329986572, "global_step": 35179, "epoch": 837} {"train_loss": -5.6348772048950195, "global_step": 35180, "epoch": 837} {"train_loss": -5.425501346588135, "global_step": 35181, "epoch": 837} {"train_loss": -5.594389915466309, "global_step": 35182, "epoch": 837} {"train_loss": -5.601607322692871, "global_step": 35183, "epoch": 837} {"train_loss": -5.517488479614258, "global_step": 35184, "epoch": 837} {"train_loss": -5.57273530960083, "global_step": 35185, "epoch": 837} {"train_loss": -5.624992370605469, "global_step": 35186, "epoch": 837} {"train_loss": -5.527017593383789, "global_step": 35187, "epoch": 837} {"train_loss": -5.706914901733398, "global_step": 35188, "epoch": 837} {"train_loss": -5.559130668640137, "global_step": 35189, "epoch": 837} {"train_loss": -5.617362022399902, "global_step": 35190, "epoch": 837} {"train_loss": -5.537453651428223, "global_step": 35191, "epoch": 837} {"train_loss": -5.563930511474609, "global_step": 35192, "epoch": 837} {"train_loss": -5.609174728393555, "global_step": 35193, "epoch": 837} {"train_loss": -5.589812278747559, "global_step": 35194, "epoch": 837} {"train_loss": -5.547053007852464, "global_step": 35195, "epoch": 837, "val_loss": 66154.375} {"train_loss": -5.4748125076293945, "global_step": 35196, "epoch": 838} {"train_loss": -5.4948883056640625, "global_step": 35197, "epoch": 838} {"train_loss": -5.649202346801758, "global_step": 35198, "epoch": 838} {"train_loss": -5.508543491363525, "global_step": 35199, "epoch": 838} {"train_loss": -5.576325416564941, "global_step": 35200, "epoch": 838} {"train_loss": -5.605840682983398, "global_step": 35201, "epoch": 838} {"train_loss": -5.518319606781006, "global_step": 35202, "epoch": 838} {"train_loss": -5.4405741691589355, "global_step": 35203, "epoch": 838} {"train_loss": -5.4269585609436035, "global_step": 35204, "epoch": 838} {"train_loss": -5.654760360717773, "global_step": 35205, "epoch": 838} {"train_loss": -5.392286777496338, "global_step": 35206, "epoch": 838} {"train_loss": -5.527255535125732, "global_step": 35207, "epoch": 838} {"train_loss": -5.61063814163208, "global_step": 35208, "epoch": 838} {"train_loss": -5.61862850189209, "global_step": 35209, "epoch": 838} {"train_loss": -5.519474029541016, "global_step": 35210, "epoch": 838} {"train_loss": -5.438865661621094, "global_step": 35211, "epoch": 838} {"train_loss": -5.510397911071777, "global_step": 35212, "epoch": 838} {"train_loss": -5.554035186767578, "global_step": 35213, "epoch": 838} {"train_loss": -5.472675323486328, "global_step": 35214, "epoch": 838} {"train_loss": -5.509535312652588, "global_step": 35215, "epoch": 838} {"train_loss": -5.403933525085449, "global_step": 35216, "epoch": 838} {"train_loss": -5.560175895690918, "global_step": 35217, "epoch": 838} {"train_loss": -5.4857330322265625, "global_step": 35218, "epoch": 838} {"train_loss": -5.590658664703369, "global_step": 35219, "epoch": 838} {"train_loss": -5.571805953979492, "global_step": 35220, "epoch": 838} {"train_loss": -5.459005355834961, "global_step": 35221, "epoch": 838} {"train_loss": -5.515848159790039, "global_step": 35222, "epoch": 838} {"train_loss": -5.600464820861816, "global_step": 35223, "epoch": 838} {"train_loss": -5.595425605773926, "global_step": 35224, "epoch": 838} {"train_loss": -5.447600364685059, "global_step": 35225, "epoch": 838} {"train_loss": -5.612607955932617, "global_step": 35226, "epoch": 838} {"train_loss": -5.625538349151611, "global_step": 35227, "epoch": 838} {"train_loss": -5.618996620178223, "global_step": 35228, "epoch": 838} {"train_loss": -5.599350929260254, "global_step": 35229, "epoch": 838} {"train_loss": -5.674245834350586, "global_step": 35230, "epoch": 838} {"train_loss": -5.453372955322266, "global_step": 35231, "epoch": 838} {"train_loss": -5.514402866363525, "global_step": 35232, "epoch": 838} {"train_loss": -5.656674861907959, "global_step": 35233, "epoch": 838} {"train_loss": -5.5400567054748535, "global_step": 35234, "epoch": 838} {"train_loss": -5.606642723083496, "global_step": 35235, "epoch": 838} {"train_loss": -5.6050872802734375, "global_step": 35236, "epoch": 838} {"train_loss": -5.542877265385219, "global_step": 35237, "epoch": 838, "val_loss": 66477.2265625} {"train_loss": -5.599311828613281, "global_step": 35238, "epoch": 839} {"train_loss": -5.575557708740234, "global_step": 35239, "epoch": 839} {"train_loss": -5.64012336730957, "global_step": 35240, "epoch": 839} {"train_loss": -5.576257705688477, "global_step": 35241, "epoch": 839} {"train_loss": -5.547992706298828, "global_step": 35242, "epoch": 839} {"train_loss": -5.706864356994629, "global_step": 35243, "epoch": 839} {"train_loss": -5.488033294677734, "global_step": 35244, "epoch": 839} {"train_loss": -5.451608180999756, "global_step": 35245, "epoch": 839} {"train_loss": -5.583284378051758, "global_step": 35246, "epoch": 839} {"train_loss": -5.564626693725586, "global_step": 35247, "epoch": 839} {"train_loss": -5.554288387298584, "global_step": 35248, "epoch": 839} {"train_loss": -5.551510810852051, "global_step": 35249, "epoch": 839} {"train_loss": -5.558095455169678, "global_step": 35250, "epoch": 839} {"train_loss": -5.587780475616455, "global_step": 35251, "epoch": 839} {"train_loss": -5.704066753387451, "global_step": 35252, "epoch": 839} {"train_loss": -5.509125709533691, "global_step": 35253, "epoch": 839} {"train_loss": -5.523209571838379, "global_step": 35254, "epoch": 839} {"train_loss": -5.5831804275512695, "global_step": 35255, "epoch": 839} {"train_loss": -5.613333702087402, "global_step": 35256, "epoch": 839} {"train_loss": -5.562670707702637, "global_step": 35257, "epoch": 839} {"train_loss": -5.524235725402832, "global_step": 35258, "epoch": 839} {"train_loss": -5.702220916748047, "global_step": 35259, "epoch": 839} {"train_loss": -5.4958953857421875, "global_step": 35260, "epoch": 839} {"train_loss": -5.588560104370117, "global_step": 35261, "epoch": 839} {"train_loss": -5.491240978240967, "global_step": 35262, "epoch": 839} {"train_loss": -5.475506782531738, "global_step": 35263, "epoch": 839} {"train_loss": -5.630271911621094, "global_step": 35264, "epoch": 839} {"train_loss": -5.5747761726379395, "global_step": 35265, "epoch": 839} {"train_loss": -5.550775527954102, "global_step": 35266, "epoch": 839} {"train_loss": -5.49337100982666, "global_step": 35267, "epoch": 839} {"train_loss": -5.543673992156982, "global_step": 35268, "epoch": 839} {"train_loss": -5.368908882141113, "global_step": 35269, "epoch": 839} {"train_loss": -5.478660583496094, "global_step": 35270, "epoch": 839} {"train_loss": -5.494086265563965, "global_step": 35271, "epoch": 839} {"train_loss": -5.573671817779541, "global_step": 35272, "epoch": 839} {"train_loss": -5.6286725997924805, "global_step": 35273, "epoch": 839} {"train_loss": -5.674617767333984, "global_step": 35274, "epoch": 839} {"train_loss": -5.5688982009887695, "global_step": 35275, "epoch": 839} {"train_loss": -5.520754814147949, "global_step": 35276, "epoch": 839} {"train_loss": -5.534213542938232, "global_step": 35277, "epoch": 839} {"train_loss": -5.643500328063965, "global_step": 35278, "epoch": 839} {"train_loss": -5.5616352671668645, "global_step": 35279, "epoch": 839, "val_loss": 66415.484375} {"train_loss": -5.454216957092285, "global_step": 35280, "epoch": 840} {"train_loss": -5.62383508682251, "global_step": 35281, "epoch": 840} {"train_loss": -5.475468635559082, "global_step": 35282, "epoch": 840} {"train_loss": -5.587078094482422, "global_step": 35283, "epoch": 840} {"train_loss": -5.502567768096924, "global_step": 35284, "epoch": 840} {"train_loss": -5.462649345397949, "global_step": 35285, "epoch": 840} {"train_loss": -5.552741050720215, "global_step": 35286, "epoch": 840} {"train_loss": -5.506435871124268, "global_step": 35287, "epoch": 840} {"train_loss": -5.37584924697876, "global_step": 35288, "epoch": 840} {"train_loss": -5.57211446762085, "global_step": 35289, "epoch": 840} {"train_loss": -5.551987648010254, "global_step": 35290, "epoch": 840} {"train_loss": -5.552420616149902, "global_step": 35291, "epoch": 840} {"train_loss": -5.541135787963867, "global_step": 35292, "epoch": 840} {"train_loss": -5.476937294006348, "global_step": 35293, "epoch": 840} {"train_loss": -5.509018898010254, "global_step": 35294, "epoch": 840} {"train_loss": -5.487668037414551, "global_step": 35295, "epoch": 840} {"train_loss": -5.3672285079956055, "global_step": 35296, "epoch": 840} {"train_loss": -5.570949554443359, "global_step": 35297, "epoch": 840} {"train_loss": -5.505622863769531, "global_step": 35298, "epoch": 840} {"train_loss": -5.593941688537598, "global_step": 35299, "epoch": 840} {"train_loss": -5.353724002838135, "global_step": 35300, "epoch": 840} {"train_loss": -5.521698951721191, "global_step": 35301, "epoch": 840} {"train_loss": -5.524562358856201, "global_step": 35302, "epoch": 840} {"train_loss": -5.611388206481934, "global_step": 35303, "epoch": 840} {"train_loss": -5.519737243652344, "global_step": 35304, "epoch": 840} {"train_loss": -5.54302978515625, "global_step": 35305, "epoch": 840} {"train_loss": -5.588140487670898, "global_step": 35306, "epoch": 840} {"train_loss": -5.3925347328186035, "global_step": 35307, "epoch": 840} {"train_loss": -5.612653732299805, "global_step": 35308, "epoch": 840} {"train_loss": -5.607361316680908, "global_step": 35309, "epoch": 840} {"train_loss": -5.472905158996582, "global_step": 35310, "epoch": 840} {"train_loss": -5.634498596191406, "global_step": 35311, "epoch": 840} {"train_loss": -5.514836311340332, "global_step": 35312, "epoch": 840} {"train_loss": -5.485446929931641, "global_step": 35313, "epoch": 840} {"train_loss": -5.631344795227051, "global_step": 35314, "epoch": 840} {"train_loss": -5.422995567321777, "global_step": 35315, "epoch": 840} {"train_loss": -5.444892883300781, "global_step": 35316, "epoch": 840} {"train_loss": -5.607682228088379, "global_step": 35317, "epoch": 840} {"train_loss": -5.493969917297363, "global_step": 35318, "epoch": 840} {"train_loss": -5.442209720611572, "global_step": 35319, "epoch": 840} {"train_loss": -5.5135979652404785, "global_step": 35320, "epoch": 840} {"train_loss": -5.5192932060786655, "global_step": 35321, "epoch": 840, "val_loss": 67084.8359375} {"train_loss": -5.517716407775879, "global_step": 35322, "epoch": 841} {"train_loss": -5.576552391052246, "global_step": 35323, "epoch": 841} {"train_loss": -5.567378044128418, "global_step": 35324, "epoch": 841} {"train_loss": -5.462823390960693, "global_step": 35325, "epoch": 841} {"train_loss": -5.578202247619629, "global_step": 35326, "epoch": 841} {"train_loss": -5.530943870544434, "global_step": 35327, "epoch": 841} {"train_loss": -5.553793907165527, "global_step": 35328, "epoch": 841} {"train_loss": -5.665301322937012, "global_step": 35329, "epoch": 841} {"train_loss": -5.622369766235352, "global_step": 35330, "epoch": 841} {"train_loss": -5.593194484710693, "global_step": 35331, "epoch": 841} {"train_loss": -5.505135536193848, "global_step": 35332, "epoch": 841} {"train_loss": -5.518540382385254, "global_step": 35333, "epoch": 841} {"train_loss": -5.558114528656006, "global_step": 35334, "epoch": 841} {"train_loss": -5.552372932434082, "global_step": 35335, "epoch": 841} {"train_loss": -5.585912227630615, "global_step": 35336, "epoch": 841} {"train_loss": -5.719761371612549, "global_step": 35337, "epoch": 841} {"train_loss": -5.512862205505371, "global_step": 35338, "epoch": 841} {"train_loss": -5.655942440032959, "global_step": 35339, "epoch": 841} {"train_loss": -5.547725677490234, "global_step": 35340, "epoch": 841} {"train_loss": -5.575379371643066, "global_step": 35341, "epoch": 841} {"train_loss": -5.487353801727295, "global_step": 35342, "epoch": 841} {"train_loss": -5.506612777709961, "global_step": 35343, "epoch": 841} {"train_loss": -5.543226718902588, "global_step": 35344, "epoch": 841} {"train_loss": -5.423023223876953, "global_step": 35345, "epoch": 841} {"train_loss": -5.640442848205566, "global_step": 35346, "epoch": 841} {"train_loss": -5.5808424949646, "global_step": 35347, "epoch": 841} {"train_loss": -5.473155975341797, "global_step": 35348, "epoch": 841} {"train_loss": -5.541408538818359, "global_step": 35349, "epoch": 841} {"train_loss": -5.486945152282715, "global_step": 35350, "epoch": 841} {"train_loss": -5.440849304199219, "global_step": 35351, "epoch": 841} {"train_loss": -5.4633989334106445, "global_step": 35352, "epoch": 841} {"train_loss": -5.508563995361328, "global_step": 35353, "epoch": 841} {"train_loss": -5.699216365814209, "global_step": 35354, "epoch": 841} {"train_loss": -5.651597023010254, "global_step": 35355, "epoch": 841} {"train_loss": -5.628135681152344, "global_step": 35356, "epoch": 841} {"train_loss": -5.747534275054932, "global_step": 35357, "epoch": 841} {"train_loss": -5.5312089920043945, "global_step": 35358, "epoch": 841} {"train_loss": -5.567098617553711, "global_step": 35359, "epoch": 841} {"train_loss": -5.607334136962891, "global_step": 35360, "epoch": 841} {"train_loss": -5.533251762390137, "global_step": 35361, "epoch": 841} {"train_loss": -5.550683975219727, "global_step": 35362, "epoch": 841} {"train_loss": -5.559772003264654, "global_step": 35363, "epoch": 841, "val_loss": 66300.375} {"train_loss": -5.605927467346191, "global_step": 35364, "epoch": 842} {"train_loss": -5.571377277374268, "global_step": 35365, "epoch": 842} {"train_loss": -5.655508995056152, "global_step": 35366, "epoch": 842} {"train_loss": -5.544364929199219, "global_step": 35367, "epoch": 842} {"train_loss": -5.746681213378906, "global_step": 35368, "epoch": 842} {"train_loss": -5.526281356811523, "global_step": 35369, "epoch": 842} {"train_loss": -5.547898292541504, "global_step": 35370, "epoch": 842} {"train_loss": -5.556491851806641, "global_step": 35371, "epoch": 842} {"train_loss": -5.575995445251465, "global_step": 35372, "epoch": 842} {"train_loss": -5.623251914978027, "global_step": 35373, "epoch": 842} {"train_loss": -5.697504997253418, "global_step": 35374, "epoch": 842} {"train_loss": -5.534186363220215, "global_step": 35375, "epoch": 842} {"train_loss": -5.673612594604492, "global_step": 35376, "epoch": 842} {"train_loss": -5.5136308670043945, "global_step": 35377, "epoch": 842} {"train_loss": -5.580378532409668, "global_step": 35378, "epoch": 842} {"train_loss": -5.469658851623535, "global_step": 35379, "epoch": 842} {"train_loss": -5.529092788696289, "global_step": 35380, "epoch": 842} {"train_loss": -5.6435089111328125, "global_step": 35381, "epoch": 842} {"train_loss": -5.486119270324707, "global_step": 35382, "epoch": 842} {"train_loss": -5.586230278015137, "global_step": 35383, "epoch": 842} {"train_loss": -5.711363792419434, "global_step": 35384, "epoch": 842} {"train_loss": -5.545310020446777, "global_step": 35385, "epoch": 842} {"train_loss": -5.681136608123779, "global_step": 35386, "epoch": 842} {"train_loss": -5.568650722503662, "global_step": 35387, "epoch": 842} {"train_loss": -5.439503192901611, "global_step": 35388, "epoch": 842} {"train_loss": -5.517538070678711, "global_step": 35389, "epoch": 842} {"train_loss": -5.567966461181641, "global_step": 35390, "epoch": 842} {"train_loss": -5.635185241699219, "global_step": 35391, "epoch": 842} {"train_loss": -5.657179832458496, "global_step": 35392, "epoch": 842} {"train_loss": -5.556994438171387, "global_step": 35393, "epoch": 842} {"train_loss": -5.606013298034668, "global_step": 35394, "epoch": 842} {"train_loss": -5.5512495040893555, "global_step": 35395, "epoch": 842} {"train_loss": -5.477130889892578, "global_step": 35396, "epoch": 842} {"train_loss": -5.505789756774902, "global_step": 35397, "epoch": 842} {"train_loss": -5.700888633728027, "global_step": 35398, "epoch": 842} {"train_loss": -5.584639072418213, "global_step": 35399, "epoch": 842} {"train_loss": -5.711984157562256, "global_step": 35400, "epoch": 842} {"train_loss": -5.529624938964844, "global_step": 35401, "epoch": 842} {"train_loss": -5.525539398193359, "global_step": 35402, "epoch": 842} {"train_loss": -5.480828285217285, "global_step": 35403, "epoch": 842} {"train_loss": -5.462686538696289, "global_step": 35404, "epoch": 842} {"train_loss": -5.576578798748198, "global_step": 35405, "epoch": 842, "val_loss": 66343.203125} {"train_loss": -5.596055507659912, "global_step": 35406, "epoch": 843} {"train_loss": -5.690017223358154, "global_step": 35407, "epoch": 843} {"train_loss": -5.749683380126953, "global_step": 35408, "epoch": 843} {"train_loss": -5.565705299377441, "global_step": 35409, "epoch": 843} {"train_loss": -5.484975814819336, "global_step": 35410, "epoch": 843} {"train_loss": -5.606915473937988, "global_step": 35411, "epoch": 843} {"train_loss": -5.446479320526123, "global_step": 35412, "epoch": 843} {"train_loss": -5.509123802185059, "global_step": 35413, "epoch": 843} {"train_loss": -5.555745601654053, "global_step": 35414, "epoch": 843} {"train_loss": -5.432972431182861, "global_step": 35415, "epoch": 843} {"train_loss": -5.4890522956848145, "global_step": 35416, "epoch": 843} {"train_loss": -5.43999719619751, "global_step": 35417, "epoch": 843} {"train_loss": -5.4506707191467285, "global_step": 35418, "epoch": 843} {"train_loss": -5.511496067047119, "global_step": 35419, "epoch": 843} {"train_loss": -5.5437726974487305, "global_step": 35420, "epoch": 843} {"train_loss": -5.672085762023926, "global_step": 35421, "epoch": 843} {"train_loss": -5.48948860168457, "global_step": 35422, "epoch": 843} {"train_loss": -5.3481125831604, "global_step": 35423, "epoch": 843} {"train_loss": -5.505429267883301, "global_step": 35424, "epoch": 843} {"train_loss": -5.617458343505859, "global_step": 35425, "epoch": 843} {"train_loss": -5.608371734619141, "global_step": 35426, "epoch": 843} {"train_loss": -5.550943374633789, "global_step": 35427, "epoch": 843} {"train_loss": -5.406623840332031, "global_step": 35428, "epoch": 843} {"train_loss": -5.477613925933838, "global_step": 35429, "epoch": 843} {"train_loss": -5.491253852844238, "global_step": 35430, "epoch": 843} {"train_loss": -5.55042028427124, "global_step": 35431, "epoch": 843} {"train_loss": -5.529337406158447, "global_step": 35432, "epoch": 843} {"train_loss": -5.575008392333984, "global_step": 35433, "epoch": 843} {"train_loss": -5.602269172668457, "global_step": 35434, "epoch": 843} {"train_loss": -5.544182777404785, "global_step": 35435, "epoch": 843} {"train_loss": -5.612955093383789, "global_step": 35436, "epoch": 843} {"train_loss": -5.587159156799316, "global_step": 35437, "epoch": 843} {"train_loss": -5.668440818786621, "global_step": 35438, "epoch": 843} {"train_loss": -5.54288387298584, "global_step": 35439, "epoch": 843} {"train_loss": -5.599027156829834, "global_step": 35440, "epoch": 843} {"train_loss": -5.625576019287109, "global_step": 35441, "epoch": 843} {"train_loss": -5.749118804931641, "global_step": 35442, "epoch": 843} {"train_loss": -5.636543273925781, "global_step": 35443, "epoch": 843} {"train_loss": -5.59416389465332, "global_step": 35444, "epoch": 843} {"train_loss": -5.4885334968566895, "global_step": 35445, "epoch": 843} {"train_loss": -5.648471832275391, "global_step": 35446, "epoch": 843} {"train_loss": -5.555480150949387, "global_step": 35447, "epoch": 843, "val_loss": 66199.71875} {"train_loss": -5.556488513946533, "global_step": 35448, "epoch": 844} {"train_loss": -5.629199981689453, "global_step": 35449, "epoch": 844} {"train_loss": -5.530993461608887, "global_step": 35450, "epoch": 844} {"train_loss": -5.5580644607543945, "global_step": 35451, "epoch": 844} {"train_loss": -5.601378440856934, "global_step": 35452, "epoch": 844} {"train_loss": -5.418513298034668, "global_step": 35453, "epoch": 844} {"train_loss": -5.571172714233398, "global_step": 35454, "epoch": 844} {"train_loss": -5.571300983428955, "global_step": 35455, "epoch": 844} {"train_loss": -5.442516326904297, "global_step": 35456, "epoch": 844} {"train_loss": -5.566883087158203, "global_step": 35457, "epoch": 844} {"train_loss": -5.508535861968994, "global_step": 35458, "epoch": 844} {"train_loss": -5.688377380371094, "global_step": 35459, "epoch": 844} {"train_loss": -5.534411430358887, "global_step": 35460, "epoch": 844} {"train_loss": -5.578003883361816, "global_step": 35461, "epoch": 844} {"train_loss": -5.539661407470703, "global_step": 35462, "epoch": 844} {"train_loss": -5.5395097732543945, "global_step": 35463, "epoch": 844} {"train_loss": -5.6297831535339355, "global_step": 35464, "epoch": 844} {"train_loss": -5.610795974731445, "global_step": 35465, "epoch": 844} {"train_loss": -5.571004867553711, "global_step": 35466, "epoch": 844} {"train_loss": -5.626077651977539, "global_step": 35467, "epoch": 844} {"train_loss": -5.408422946929932, "global_step": 35468, "epoch": 844} {"train_loss": -5.542716026306152, "global_step": 35469, "epoch": 844} {"train_loss": -5.612164497375488, "global_step": 35470, "epoch": 844} {"train_loss": -5.561953544616699, "global_step": 35471, "epoch": 844} {"train_loss": -5.664515972137451, "global_step": 35472, "epoch": 844} {"train_loss": -5.601364612579346, "global_step": 35473, "epoch": 844} {"train_loss": -5.631158828735352, "global_step": 35474, "epoch": 844} {"train_loss": -5.701920509338379, "global_step": 35475, "epoch": 844} {"train_loss": -5.640258312225342, "global_step": 35476, "epoch": 844} {"train_loss": -5.600344657897949, "global_step": 35477, "epoch": 844} {"train_loss": -5.589698791503906, "global_step": 35478, "epoch": 844} {"train_loss": -5.532172203063965, "global_step": 35479, "epoch": 844} {"train_loss": -5.623222351074219, "global_step": 35480, "epoch": 844} {"train_loss": -5.428891181945801, "global_step": 35481, "epoch": 844} {"train_loss": -5.5164384841918945, "global_step": 35482, "epoch": 844} {"train_loss": -5.572547912597656, "global_step": 35483, "epoch": 844} {"train_loss": -5.490444660186768, "global_step": 35484, "epoch": 844} {"train_loss": -5.489130020141602, "global_step": 35485, "epoch": 844} {"train_loss": -5.572773456573486, "global_step": 35486, "epoch": 844} {"train_loss": -5.5539655685424805, "global_step": 35487, "epoch": 844} {"train_loss": -5.4541425704956055, "global_step": 35488, "epoch": 844} {"train_loss": -5.56243406023298, "global_step": 35489, "epoch": 844, "val_loss": 66335.890625} {"train_loss": -5.453846454620361, "global_step": 35490, "epoch": 845} {"train_loss": -5.594348430633545, "global_step": 35491, "epoch": 845} {"train_loss": -5.624605655670166, "global_step": 35492, "epoch": 845} {"train_loss": -5.495872497558594, "global_step": 35493, "epoch": 845} {"train_loss": -5.610778331756592, "global_step": 35494, "epoch": 845} {"train_loss": -5.568358421325684, "global_step": 35495, "epoch": 845} {"train_loss": -5.473169326782227, "global_step": 35496, "epoch": 845} {"train_loss": -5.505209922790527, "global_step": 35497, "epoch": 845} {"train_loss": -5.55800199508667, "global_step": 35498, "epoch": 845} {"train_loss": -5.503020286560059, "global_step": 35499, "epoch": 845} {"train_loss": -5.545658111572266, "global_step": 35500, "epoch": 845} {"train_loss": -5.508209228515625, "global_step": 35501, "epoch": 845} {"train_loss": -5.58919620513916, "global_step": 35502, "epoch": 845} {"train_loss": -5.568122863769531, "global_step": 35503, "epoch": 845} {"train_loss": -5.653936386108398, "global_step": 35504, "epoch": 845} {"train_loss": -5.553408622741699, "global_step": 35505, "epoch": 845} {"train_loss": -5.637642860412598, "global_step": 35506, "epoch": 845} {"train_loss": -5.540951728820801, "global_step": 35507, "epoch": 845} {"train_loss": -5.605344772338867, "global_step": 35508, "epoch": 845} {"train_loss": -5.569851875305176, "global_step": 35509, "epoch": 845} {"train_loss": -5.699615478515625, "global_step": 35510, "epoch": 845} {"train_loss": -5.516496658325195, "global_step": 35511, "epoch": 845} {"train_loss": -5.568273067474365, "global_step": 35512, "epoch": 845} {"train_loss": -5.5967254638671875, "global_step": 35513, "epoch": 845} {"train_loss": -5.510195255279541, "global_step": 35514, "epoch": 845} {"train_loss": -5.56577205657959, "global_step": 35515, "epoch": 845} {"train_loss": -5.678738594055176, "global_step": 35516, "epoch": 845} {"train_loss": -5.404860973358154, "global_step": 35517, "epoch": 845} {"train_loss": -5.542412281036377, "global_step": 35518, "epoch": 845} {"train_loss": -5.508218288421631, "global_step": 35519, "epoch": 845} {"train_loss": -5.4063568115234375, "global_step": 35520, "epoch": 845} {"train_loss": -5.552194595336914, "global_step": 35521, "epoch": 845} {"train_loss": -5.566689968109131, "global_step": 35522, "epoch": 845} {"train_loss": -5.52852201461792, "global_step": 35523, "epoch": 845} {"train_loss": -5.497682571411133, "global_step": 35524, "epoch": 845} {"train_loss": -5.522279739379883, "global_step": 35525, "epoch": 845} {"train_loss": -5.681655406951904, "global_step": 35526, "epoch": 845} {"train_loss": -5.607407093048096, "global_step": 35527, "epoch": 845} {"train_loss": -5.49720573425293, "global_step": 35528, "epoch": 845} {"train_loss": -5.622171401977539, "global_step": 35529, "epoch": 845} {"train_loss": -5.535884857177734, "global_step": 35530, "epoch": 845} {"train_loss": -5.554293496268136, "global_step": 35531, "epoch": 845, "val_loss": 66868.5} {"train_loss": -5.473814010620117, "global_step": 35532, "epoch": 846} {"train_loss": -5.495354652404785, "global_step": 35533, "epoch": 846} {"train_loss": -5.5173749923706055, "global_step": 35534, "epoch": 846} {"train_loss": -5.478789806365967, "global_step": 35535, "epoch": 846} {"train_loss": -5.703856468200684, "global_step": 35536, "epoch": 846} {"train_loss": -5.559803009033203, "global_step": 35537, "epoch": 846} {"train_loss": -5.519658088684082, "global_step": 35538, "epoch": 846} {"train_loss": -5.596446514129639, "global_step": 35539, "epoch": 846} {"train_loss": -5.417397499084473, "global_step": 35540, "epoch": 846} {"train_loss": -5.49790096282959, "global_step": 35541, "epoch": 846} {"train_loss": -5.57359504699707, "global_step": 35542, "epoch": 846} {"train_loss": -5.517251968383789, "global_step": 35543, "epoch": 846} {"train_loss": -5.639565467834473, "global_step": 35544, "epoch": 846} {"train_loss": -5.448798656463623, "global_step": 35545, "epoch": 846} {"train_loss": -5.537226676940918, "global_step": 35546, "epoch": 846} {"train_loss": -5.685619354248047, "global_step": 35547, "epoch": 846} {"train_loss": -5.561665058135986, "global_step": 35548, "epoch": 846} {"train_loss": -5.507445335388184, "global_step": 35549, "epoch": 846} {"train_loss": -5.485969543457031, "global_step": 35550, "epoch": 846} {"train_loss": -5.4885406494140625, "global_step": 35551, "epoch": 846} {"train_loss": -5.415755748748779, "global_step": 35552, "epoch": 846} {"train_loss": -5.52579402923584, "global_step": 35553, "epoch": 846} {"train_loss": -5.644133567810059, "global_step": 35554, "epoch": 846} {"train_loss": -5.407052040100098, "global_step": 35555, "epoch": 846} {"train_loss": -5.508765697479248, "global_step": 35556, "epoch": 846} {"train_loss": -5.613839149475098, "global_step": 35557, "epoch": 846} {"train_loss": -5.392006874084473, "global_step": 35558, "epoch": 846} {"train_loss": -5.699894905090332, "global_step": 35559, "epoch": 846} {"train_loss": -5.474136829376221, "global_step": 35560, "epoch": 846} {"train_loss": -5.576898574829102, "global_step": 35561, "epoch": 846} {"train_loss": -5.434935569763184, "global_step": 35562, "epoch": 846} {"train_loss": -5.551509857177734, "global_step": 35563, "epoch": 846} {"train_loss": -5.567876815795898, "global_step": 35564, "epoch": 846} {"train_loss": -5.714535713195801, "global_step": 35565, "epoch": 846} {"train_loss": -5.579864978790283, "global_step": 35566, "epoch": 846} {"train_loss": -5.4752655029296875, "global_step": 35567, "epoch": 846} {"train_loss": -5.664289474487305, "global_step": 35568, "epoch": 846} {"train_loss": -5.523975372314453, "global_step": 35569, "epoch": 846} {"train_loss": -5.621209144592285, "global_step": 35570, "epoch": 846} {"train_loss": -5.562474727630615, "global_step": 35571, "epoch": 846} {"train_loss": -5.519618034362793, "global_step": 35572, "epoch": 846} {"train_loss": -5.540121555328369, "global_step": 35573, "epoch": 846, "val_loss": 66425.4921875} {"train_loss": -5.5265045166015625, "global_step": 35574, "epoch": 847} {"train_loss": -5.436310291290283, "global_step": 35575, "epoch": 847} {"train_loss": -5.5318121910095215, "global_step": 35576, "epoch": 847} {"train_loss": -5.646859169006348, "global_step": 35577, "epoch": 847} {"train_loss": -5.444180488586426, "global_step": 35578, "epoch": 847} {"train_loss": -5.504062175750732, "global_step": 35579, "epoch": 847} {"train_loss": -5.486813545227051, "global_step": 35580, "epoch": 847} {"train_loss": -5.675073146820068, "global_step": 35581, "epoch": 847} {"train_loss": -5.628829479217529, "global_step": 35582, "epoch": 847} {"train_loss": -5.536215305328369, "global_step": 35583, "epoch": 847} {"train_loss": -5.600255966186523, "global_step": 35584, "epoch": 847} {"train_loss": -5.670821189880371, "global_step": 35585, "epoch": 847} {"train_loss": -5.654983043670654, "global_step": 35586, "epoch": 847} {"train_loss": -5.6483235359191895, "global_step": 35587, "epoch": 847} {"train_loss": -5.566351890563965, "global_step": 35588, "epoch": 847} {"train_loss": -5.562369346618652, "global_step": 35589, "epoch": 847} {"train_loss": -5.569949150085449, "global_step": 35590, "epoch": 847} {"train_loss": -5.4814605712890625, "global_step": 35591, "epoch": 847} {"train_loss": -5.495909214019775, "global_step": 35592, "epoch": 847} {"train_loss": -5.568744659423828, "global_step": 35593, "epoch": 847} {"train_loss": -5.5521111488342285, "global_step": 35594, "epoch": 847} {"train_loss": -5.5294084548950195, "global_step": 35595, "epoch": 847} {"train_loss": -5.630839824676514, "global_step": 35596, "epoch": 847} {"train_loss": -5.546230792999268, "global_step": 35597, "epoch": 847} {"train_loss": -5.566224098205566, "global_step": 35598, "epoch": 847} {"train_loss": -5.624665260314941, "global_step": 35599, "epoch": 847} {"train_loss": -5.438939571380615, "global_step": 35600, "epoch": 847} {"train_loss": -5.511672496795654, "global_step": 35601, "epoch": 847} {"train_loss": -5.555601596832275, "global_step": 35602, "epoch": 847} {"train_loss": -5.579110145568848, "global_step": 35603, "epoch": 847} {"train_loss": -5.567218780517578, "global_step": 35604, "epoch": 847} {"train_loss": -5.5143818855285645, "global_step": 35605, "epoch": 847} {"train_loss": -5.6174516677856445, "global_step": 35606, "epoch": 847} {"train_loss": -5.6203131675720215, "global_step": 35607, "epoch": 847} {"train_loss": -5.518068313598633, "global_step": 35608, "epoch": 847} {"train_loss": -5.5076584815979, "global_step": 35609, "epoch": 847} {"train_loss": -5.6169209480285645, "global_step": 35610, "epoch": 847} {"train_loss": -5.722683429718018, "global_step": 35611, "epoch": 847} {"train_loss": -5.4689483642578125, "global_step": 35612, "epoch": 847} {"train_loss": -5.651364326477051, "global_step": 35613, "epoch": 847} {"train_loss": -5.6588850021362305, "global_step": 35614, "epoch": 847} {"train_loss": -5.568846021379743, "global_step": 35615, "epoch": 847, "val_loss": 66287.53125} {"train_loss": -5.65659236907959, "global_step": 35616, "epoch": 848} {"train_loss": -5.580252647399902, "global_step": 35617, "epoch": 848} {"train_loss": -5.6617913246154785, "global_step": 35618, "epoch": 848} {"train_loss": -5.611317157745361, "global_step": 35619, "epoch": 848} {"train_loss": -5.570343017578125, "global_step": 35620, "epoch": 848} {"train_loss": -5.601371765136719, "global_step": 35621, "epoch": 848} {"train_loss": -5.606235027313232, "global_step": 35622, "epoch": 848} {"train_loss": -5.579699516296387, "global_step": 35623, "epoch": 848} {"train_loss": -5.445350646972656, "global_step": 35624, "epoch": 848} {"train_loss": -5.625668048858643, "global_step": 35625, "epoch": 848} {"train_loss": -5.445291519165039, "global_step": 35626, "epoch": 848} {"train_loss": -5.526476860046387, "global_step": 35627, "epoch": 848} {"train_loss": -5.568216800689697, "global_step": 35628, "epoch": 848} {"train_loss": -5.496456146240234, "global_step": 35629, "epoch": 848} {"train_loss": -5.529634475708008, "global_step": 35630, "epoch": 848} {"train_loss": -5.469600200653076, "global_step": 35631, "epoch": 848} {"train_loss": -5.513880729675293, "global_step": 35632, "epoch": 848} {"train_loss": -5.594968795776367, "global_step": 35633, "epoch": 848} {"train_loss": -5.625343322753906, "global_step": 35634, "epoch": 848} {"train_loss": -5.5075297355651855, "global_step": 35635, "epoch": 848} {"train_loss": -5.50369930267334, "global_step": 35636, "epoch": 848} {"train_loss": -5.585184574127197, "global_step": 35637, "epoch": 848} {"train_loss": -5.5989484786987305, "global_step": 35638, "epoch": 848} {"train_loss": -5.5715227127075195, "global_step": 35639, "epoch": 848} {"train_loss": -5.6174492835998535, "global_step": 35640, "epoch": 848} {"train_loss": -5.590465545654297, "global_step": 35641, "epoch": 848} {"train_loss": -5.680278778076172, "global_step": 35642, "epoch": 848} {"train_loss": -5.502683639526367, "global_step": 35643, "epoch": 848} {"train_loss": -5.548545837402344, "global_step": 35644, "epoch": 848} {"train_loss": -5.551802635192871, "global_step": 35645, "epoch": 848} {"train_loss": -5.7046661376953125, "global_step": 35646, "epoch": 848} {"train_loss": -5.480349540710449, "global_step": 35647, "epoch": 848} {"train_loss": -5.671234607696533, "global_step": 35648, "epoch": 848} {"train_loss": -5.504660606384277, "global_step": 35649, "epoch": 848} {"train_loss": -5.498549461364746, "global_step": 35650, "epoch": 848} {"train_loss": -5.56835412979126, "global_step": 35651, "epoch": 848} {"train_loss": -5.478935718536377, "global_step": 35652, "epoch": 848} {"train_loss": -5.499792575836182, "global_step": 35653, "epoch": 848} {"train_loss": -5.583405017852783, "global_step": 35654, "epoch": 848} {"train_loss": -5.649140357971191, "global_step": 35655, "epoch": 848} {"train_loss": -5.646730422973633, "global_step": 35656, "epoch": 848} {"train_loss": -5.5662857464381625, "global_step": 35657, "epoch": 848, "val_loss": 65847.421875} {"train_loss": -5.563968658447266, "global_step": 35658, "epoch": 849} {"train_loss": -5.494260311126709, "global_step": 35659, "epoch": 849} {"train_loss": -5.5467000007629395, "global_step": 35660, "epoch": 849} {"train_loss": -5.5642781257629395, "global_step": 35661, "epoch": 849} {"train_loss": -5.556575775146484, "global_step": 35662, "epoch": 849} {"train_loss": -5.599057197570801, "global_step": 35663, "epoch": 849} {"train_loss": -5.561409950256348, "global_step": 35664, "epoch": 849} {"train_loss": -5.619161605834961, "global_step": 35665, "epoch": 849} {"train_loss": -5.672626972198486, "global_step": 35666, "epoch": 849} {"train_loss": -5.6475348472595215, "global_step": 35667, "epoch": 849} {"train_loss": -5.535358428955078, "global_step": 35668, "epoch": 849} {"train_loss": -5.471895694732666, "global_step": 35669, "epoch": 849} {"train_loss": -5.676142692565918, "global_step": 35670, "epoch": 849} {"train_loss": -5.377772808074951, "global_step": 35671, "epoch": 849} {"train_loss": -5.587760925292969, "global_step": 35672, "epoch": 849} {"train_loss": -5.622780799865723, "global_step": 35673, "epoch": 849} {"train_loss": -5.600367546081543, "global_step": 35674, "epoch": 849} {"train_loss": -5.43162727355957, "global_step": 35675, "epoch": 849} {"train_loss": -5.566315174102783, "global_step": 35676, "epoch": 849} {"train_loss": -5.590588569641113, "global_step": 35677, "epoch": 849} {"train_loss": -5.485811233520508, "global_step": 35678, "epoch": 849} {"train_loss": -5.651623725891113, "global_step": 35679, "epoch": 849} {"train_loss": -5.552360534667969, "global_step": 35680, "epoch": 849} {"train_loss": -5.605632305145264, "global_step": 35681, "epoch": 849} {"train_loss": -5.583904266357422, "global_step": 35682, "epoch": 849} {"train_loss": -5.521535396575928, "global_step": 35683, "epoch": 849} {"train_loss": -5.631478309631348, "global_step": 35684, "epoch": 849} {"train_loss": -5.557034492492676, "global_step": 35685, "epoch": 849} {"train_loss": -5.511467456817627, "global_step": 35686, "epoch": 849} {"train_loss": -5.5778703689575195, "global_step": 35687, "epoch": 849} {"train_loss": -5.419781684875488, "global_step": 35688, "epoch": 849} {"train_loss": -5.520866394042969, "global_step": 35689, "epoch": 849} {"train_loss": -5.626104354858398, "global_step": 35690, "epoch": 849} {"train_loss": -5.560346603393555, "global_step": 35691, "epoch": 849} {"train_loss": -5.532341957092285, "global_step": 35692, "epoch": 849} {"train_loss": -5.471723556518555, "global_step": 35693, "epoch": 849} {"train_loss": -5.513674736022949, "global_step": 35694, "epoch": 849} {"train_loss": -5.668222427368164, "global_step": 35695, "epoch": 849} {"train_loss": -5.462739944458008, "global_step": 35696, "epoch": 849} {"train_loss": -5.500679969787598, "global_step": 35697, "epoch": 849} {"train_loss": -5.567331790924072, "global_step": 35698, "epoch": 849} {"train_loss": -5.553963116237095, "global_step": 35699, "epoch": 849, "val_loss": 66341.484375} {"train_loss": -5.678816795349121, "global_step": 35700, "epoch": 850} {"train_loss": -5.527342796325684, "global_step": 35701, "epoch": 850} {"train_loss": -5.449037551879883, "global_step": 35702, "epoch": 850} {"train_loss": -5.625124931335449, "global_step": 35703, "epoch": 850} {"train_loss": -5.687953948974609, "global_step": 35704, "epoch": 850} {"train_loss": -5.561272144317627, "global_step": 35705, "epoch": 850} {"train_loss": -5.6102375984191895, "global_step": 35706, "epoch": 850} {"train_loss": -5.6933274269104, "global_step": 35707, "epoch": 850} {"train_loss": -5.603725910186768, "global_step": 35708, "epoch": 850} {"train_loss": -5.592690467834473, "global_step": 35709, "epoch": 850} {"train_loss": -5.633007049560547, "global_step": 35710, "epoch": 850} {"train_loss": -5.600586414337158, "global_step": 35711, "epoch": 850} {"train_loss": -5.499903678894043, "global_step": 35712, "epoch": 850} {"train_loss": -5.67671012878418, "global_step": 35713, "epoch": 850} {"train_loss": -5.632421970367432, "global_step": 35714, "epoch": 850} {"train_loss": -5.330809593200684, "global_step": 35715, "epoch": 850} {"train_loss": -5.536417484283447, "global_step": 35716, "epoch": 850} {"train_loss": -5.450023651123047, "global_step": 35717, "epoch": 850} {"train_loss": -5.53092098236084, "global_step": 35718, "epoch": 850} {"train_loss": -5.681003570556641, "global_step": 35719, "epoch": 850} {"train_loss": -5.409539699554443, "global_step": 35720, "epoch": 850} {"train_loss": -5.359394550323486, "global_step": 35721, "epoch": 850} {"train_loss": -5.580294609069824, "global_step": 35722, "epoch": 850} {"train_loss": -5.467289924621582, "global_step": 35723, "epoch": 850} {"train_loss": -5.673699378967285, "global_step": 35724, "epoch": 850} {"train_loss": -5.362874984741211, "global_step": 35725, "epoch": 850} {"train_loss": -5.553411960601807, "global_step": 35726, "epoch": 850} {"train_loss": -5.640044689178467, "global_step": 35727, "epoch": 850} {"train_loss": -5.454261779785156, "global_step": 35728, "epoch": 850} {"train_loss": -5.567741870880127, "global_step": 35729, "epoch": 850} {"train_loss": -5.45166015625, "global_step": 35730, "epoch": 850} {"train_loss": -5.494711399078369, "global_step": 35731, "epoch": 850} {"train_loss": -5.595546722412109, "global_step": 35732, "epoch": 850} {"train_loss": -5.400913238525391, "global_step": 35733, "epoch": 850} {"train_loss": -5.510004997253418, "global_step": 35734, "epoch": 850} {"train_loss": -5.461390495300293, "global_step": 35735, "epoch": 850} {"train_loss": -5.479554176330566, "global_step": 35736, "epoch": 850} {"train_loss": -5.324141025543213, "global_step": 35737, "epoch": 850} {"train_loss": -5.581783294677734, "global_step": 35738, "epoch": 850} {"train_loss": -5.498122215270996, "global_step": 35739, "epoch": 850} {"train_loss": -5.594520568847656, "global_step": 35740, "epoch": 850} {"train_loss": -5.5430677731831866, "global_step": 35741, "epoch": 850, "train/sim_max_reward_0": 0.564830336767482, "train/sim_max_reward_1": 0.06500088140306147, "train/sim_max_reward_2": 0.41598054802680207, "train/sim_max_reward_3": 0.16395280102195423, "train/sim_max_reward_4": 0.9763522523240207, "train/sim_max_reward_5": 0.7545428076720976, "test/sim_max_reward_4400000": 0.14779655660940397, "test/sim_max_reward_4400001": 0.15392968198044013, "test/sim_max_reward_4400002": 0.7932952616153278, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.34837262704026495, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.44397993127449636, "test/sim_max_reward_4400007": 0.1847136974304617, "test/sim_max_reward_4400008": 0.4855644436895308, "test/sim_max_reward_4400009": 0.30523838143127985, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.2343277042112997, "test/sim_max_reward_4400012": 0.41311537816813626, "test/sim_max_reward_4400013": 0.40492384779132645, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.6180974216797267, "test/sim_max_reward_4400016": 0.08328774083955136, "test/sim_max_reward_4400017": 0.3355199017544798, "test/sim_max_reward_4400018": 0.332891429918457, "test/sim_max_reward_4400019": 0.41837372347536994, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.7233514270217639, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.3947469334482843, "test/sim_max_reward_4400027": 0.10967534385379688, "test/sim_max_reward_4400028": 0.3821259668318443, "test/sim_max_reward_4400029": 0.4037047827731908, "test/sim_max_reward_4400030": 0.4785114073922216, "test/sim_max_reward_4400031": 0.4111502447437176, "test/sim_max_reward_4400032": 0.266465688558694, "test/sim_max_reward_4400033": 0.13871465675694902, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.47335308332701587, "test/sim_max_reward_4400036": 0.31117464825815394, "test/sim_max_reward_4400037": 0.24821438005057644, "test/sim_max_reward_4400038": 0.14940591669451883, "test/sim_max_reward_4400039": 0.44710278304862494, "test/sim_max_reward_4400040": 0.061343557905042936, "test/sim_max_reward_4400041": 0.5885529064684969, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.04857145345112297, "test/sim_max_reward_4400044": 0.19329322398643375, "test/sim_max_reward_4400045": 0.32894695146294334, "test/sim_max_reward_4400046": 0.27968716245250275, "test/sim_max_reward_4400047": 0.9297554725232483, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.015478105314310773, "train/mean_score": 0.49010993786923635, "test/mean_score": 0.2783237827912738, "val_loss": 66380.8515625} {"train_loss": -5.450316429138184, "global_step": 35742, "epoch": 851} {"train_loss": -5.62901496887207, "global_step": 35743, "epoch": 851} {"train_loss": -5.584115505218506, "global_step": 35744, "epoch": 851} {"train_loss": -5.46082878112793, "global_step": 35745, "epoch": 851} {"train_loss": -5.547009468078613, "global_step": 35746, "epoch": 851} {"train_loss": -5.7024736404418945, "global_step": 35747, "epoch": 851} {"train_loss": -5.425100803375244, "global_step": 35748, "epoch": 851} {"train_loss": -5.634193420410156, "global_step": 35749, "epoch": 851} {"train_loss": -5.647704124450684, "global_step": 35750, "epoch": 851} {"train_loss": -5.5400214195251465, "global_step": 35751, "epoch": 851} {"train_loss": -5.6045613288879395, "global_step": 35752, "epoch": 851} {"train_loss": -5.528038501739502, "global_step": 35753, "epoch": 851} {"train_loss": -5.652675628662109, "global_step": 35754, "epoch": 851} {"train_loss": -5.542486190795898, "global_step": 35755, "epoch": 851} {"train_loss": -5.574483871459961, "global_step": 35756, "epoch": 851} {"train_loss": -5.572002410888672, "global_step": 35757, "epoch": 851} {"train_loss": -5.5889201164245605, "global_step": 35758, "epoch": 851} {"train_loss": -5.556803226470947, "global_step": 35759, "epoch": 851} {"train_loss": -5.653845310211182, "global_step": 35760, "epoch": 851} {"train_loss": -5.414484977722168, "global_step": 35761, "epoch": 851} {"train_loss": -5.541421413421631, "global_step": 35762, "epoch": 851} {"train_loss": -5.556429862976074, "global_step": 35763, "epoch": 851} {"train_loss": -5.478399753570557, "global_step": 35764, "epoch": 851} {"train_loss": -5.577088356018066, "global_step": 35765, "epoch": 851} {"train_loss": -5.4497480392456055, "global_step": 35766, "epoch": 851} {"train_loss": -5.560410022735596, "global_step": 35767, "epoch": 851} {"train_loss": -5.616689682006836, "global_step": 35768, "epoch": 851} {"train_loss": -5.453302383422852, "global_step": 35769, "epoch": 851} {"train_loss": -5.427530765533447, "global_step": 35770, "epoch": 851} {"train_loss": -5.665719509124756, "global_step": 35771, "epoch": 851} {"train_loss": -5.588008880615234, "global_step": 35772, "epoch": 851} {"train_loss": -5.578763484954834, "global_step": 35773, "epoch": 851} {"train_loss": -5.404343128204346, "global_step": 35774, "epoch": 851} {"train_loss": -5.590154647827148, "global_step": 35775, "epoch": 851} {"train_loss": -5.567264556884766, "global_step": 35776, "epoch": 851} {"train_loss": -5.538746356964111, "global_step": 35777, "epoch": 851} {"train_loss": -5.627930164337158, "global_step": 35778, "epoch": 851} {"train_loss": -5.637517929077148, "global_step": 35779, "epoch": 851} {"train_loss": -5.638671875, "global_step": 35780, "epoch": 851} {"train_loss": -5.521461486816406, "global_step": 35781, "epoch": 851} {"train_loss": -5.621051788330078, "global_step": 35782, "epoch": 851} {"train_loss": -5.560046752293904, "global_step": 35783, "epoch": 851, "val_loss": 66091.9296875} {"train_loss": -5.499815940856934, "global_step": 35784, "epoch": 852} {"train_loss": -5.59821081161499, "global_step": 35785, "epoch": 852} {"train_loss": -5.47005558013916, "global_step": 35786, "epoch": 852} {"train_loss": -5.535691261291504, "global_step": 35787, "epoch": 852} {"train_loss": -5.4999237060546875, "global_step": 35788, "epoch": 852} {"train_loss": -5.561276912689209, "global_step": 35789, "epoch": 852} {"train_loss": -5.653550624847412, "global_step": 35790, "epoch": 852} {"train_loss": -5.646389961242676, "global_step": 35791, "epoch": 852} {"train_loss": -5.6322526931762695, "global_step": 35792, "epoch": 852} {"train_loss": -5.734275817871094, "global_step": 35793, "epoch": 852} {"train_loss": -5.570934295654297, "global_step": 35794, "epoch": 852} {"train_loss": -5.6118011474609375, "global_step": 35795, "epoch": 852} {"train_loss": -5.7068891525268555, "global_step": 35796, "epoch": 852} {"train_loss": -5.5264997482299805, "global_step": 35797, "epoch": 852} {"train_loss": -5.40164041519165, "global_step": 35798, "epoch": 852} {"train_loss": -5.5348615646362305, "global_step": 35799, "epoch": 852} {"train_loss": -5.626941680908203, "global_step": 35800, "epoch": 852} {"train_loss": -5.457207202911377, "global_step": 35801, "epoch": 852} {"train_loss": -5.575090408325195, "global_step": 35802, "epoch": 852} {"train_loss": -5.5557355880737305, "global_step": 35803, "epoch": 852} {"train_loss": -5.399477958679199, "global_step": 35804, "epoch": 852} {"train_loss": -5.583335876464844, "global_step": 35805, "epoch": 852} {"train_loss": -5.446524620056152, "global_step": 35806, "epoch": 852} {"train_loss": -5.409657955169678, "global_step": 35807, "epoch": 852} {"train_loss": -5.63083553314209, "global_step": 35808, "epoch": 852} {"train_loss": -5.4382123947143555, "global_step": 35809, "epoch": 852} {"train_loss": -5.429732322692871, "global_step": 35810, "epoch": 852} {"train_loss": -5.539191246032715, "global_step": 35811, "epoch": 852} {"train_loss": -5.430950164794922, "global_step": 35812, "epoch": 852} {"train_loss": -5.552857875823975, "global_step": 35813, "epoch": 852} {"train_loss": -5.585074424743652, "global_step": 35814, "epoch": 852} {"train_loss": -5.587690353393555, "global_step": 35815, "epoch": 852} {"train_loss": -5.498950481414795, "global_step": 35816, "epoch": 852} {"train_loss": -5.424142837524414, "global_step": 35817, "epoch": 852} {"train_loss": -5.476166725158691, "global_step": 35818, "epoch": 852} {"train_loss": -5.5523881912231445, "global_step": 35819, "epoch": 852} {"train_loss": -5.427234649658203, "global_step": 35820, "epoch": 852} {"train_loss": -5.601098537445068, "global_step": 35821, "epoch": 852} {"train_loss": -5.527410984039307, "global_step": 35822, "epoch": 852} {"train_loss": -5.658519744873047, "global_step": 35823, "epoch": 852} {"train_loss": -5.39814567565918, "global_step": 35824, "epoch": 852} {"train_loss": -5.537809417361305, "global_step": 35825, "epoch": 852, "val_loss": 66805.625} {"train_loss": -5.609558582305908, "global_step": 35826, "epoch": 853} {"train_loss": -5.56574010848999, "global_step": 35827, "epoch": 853} {"train_loss": -5.336943626403809, "global_step": 35828, "epoch": 853} {"train_loss": -5.584916114807129, "global_step": 35829, "epoch": 853} {"train_loss": -5.731515407562256, "global_step": 35830, "epoch": 853} {"train_loss": -5.563900947570801, "global_step": 35831, "epoch": 853} {"train_loss": -5.54583215713501, "global_step": 35832, "epoch": 853} {"train_loss": -5.543211936950684, "global_step": 35833, "epoch": 853} {"train_loss": -5.54942512512207, "global_step": 35834, "epoch": 853} {"train_loss": -5.579266548156738, "global_step": 35835, "epoch": 853} {"train_loss": -5.678798675537109, "global_step": 35836, "epoch": 853} {"train_loss": -5.578492164611816, "global_step": 35837, "epoch": 853} {"train_loss": -5.718083381652832, "global_step": 35838, "epoch": 853} {"train_loss": -5.6356201171875, "global_step": 35839, "epoch": 853} {"train_loss": -5.410794734954834, "global_step": 35840, "epoch": 853} {"train_loss": -5.460649490356445, "global_step": 35841, "epoch": 853} {"train_loss": -5.625388145446777, "global_step": 35842, "epoch": 853} {"train_loss": -5.463717460632324, "global_step": 35843, "epoch": 853} {"train_loss": -5.584177017211914, "global_step": 35844, "epoch": 853} {"train_loss": -5.489225387573242, "global_step": 35845, "epoch": 853} {"train_loss": -5.575621604919434, "global_step": 35846, "epoch": 853} {"train_loss": -5.4316840171813965, "global_step": 35847, "epoch": 853} {"train_loss": -5.661179542541504, "global_step": 35848, "epoch": 853} {"train_loss": -5.5209808349609375, "global_step": 35849, "epoch": 853} {"train_loss": -5.555051803588867, "global_step": 35850, "epoch": 853} {"train_loss": -5.587576866149902, "global_step": 35851, "epoch": 853} {"train_loss": -5.619697570800781, "global_step": 35852, "epoch": 853} {"train_loss": -5.476426124572754, "global_step": 35853, "epoch": 853} {"train_loss": -5.525354385375977, "global_step": 35854, "epoch": 853} {"train_loss": -5.619103908538818, "global_step": 35855, "epoch": 853} {"train_loss": -5.660954475402832, "global_step": 35856, "epoch": 853} {"train_loss": -5.573901176452637, "global_step": 35857, "epoch": 853} {"train_loss": -5.631818771362305, "global_step": 35858, "epoch": 853} {"train_loss": -5.519662857055664, "global_step": 35859, "epoch": 853} {"train_loss": -5.551115989685059, "global_step": 35860, "epoch": 853} {"train_loss": -5.343976020812988, "global_step": 35861, "epoch": 853} {"train_loss": -5.632290363311768, "global_step": 35862, "epoch": 853} {"train_loss": -5.414607048034668, "global_step": 35863, "epoch": 853} {"train_loss": -5.561606407165527, "global_step": 35864, "epoch": 853} {"train_loss": -5.527087688446045, "global_step": 35865, "epoch": 853} {"train_loss": -5.45423698425293, "global_step": 35866, "epoch": 853} {"train_loss": -5.555185408819289, "global_step": 35867, "epoch": 853, "val_loss": 66328.5078125} {"train_loss": -5.513533592224121, "global_step": 35868, "epoch": 854} {"train_loss": -5.5057854652404785, "global_step": 35869, "epoch": 854} {"train_loss": -5.531594276428223, "global_step": 35870, "epoch": 854} {"train_loss": -5.523310661315918, "global_step": 35871, "epoch": 854} {"train_loss": -5.6157426834106445, "global_step": 35872, "epoch": 854} {"train_loss": -5.5637311935424805, "global_step": 35873, "epoch": 854} {"train_loss": -5.623857498168945, "global_step": 35874, "epoch": 854} {"train_loss": -5.580501556396484, "global_step": 35875, "epoch": 854} {"train_loss": -5.585493087768555, "global_step": 35876, "epoch": 854} {"train_loss": -5.606440544128418, "global_step": 35877, "epoch": 854} {"train_loss": -5.520627975463867, "global_step": 35878, "epoch": 854} {"train_loss": -5.57368803024292, "global_step": 35879, "epoch": 854} {"train_loss": -5.60648250579834, "global_step": 35880, "epoch": 854} {"train_loss": -5.498706340789795, "global_step": 35881, "epoch": 854} {"train_loss": -5.557738304138184, "global_step": 35882, "epoch": 854} {"train_loss": -5.4934492111206055, "global_step": 35883, "epoch": 854} {"train_loss": -5.476129055023193, "global_step": 35884, "epoch": 854} {"train_loss": -5.583677768707275, "global_step": 35885, "epoch": 854} {"train_loss": -5.502262115478516, "global_step": 35886, "epoch": 854} {"train_loss": -5.633573532104492, "global_step": 35887, "epoch": 854} {"train_loss": -5.486386775970459, "global_step": 35888, "epoch": 854} {"train_loss": -5.468956470489502, "global_step": 35889, "epoch": 854} {"train_loss": -5.5784807205200195, "global_step": 35890, "epoch": 854} {"train_loss": -5.536679267883301, "global_step": 35891, "epoch": 854} {"train_loss": -5.536428451538086, "global_step": 35892, "epoch": 854} {"train_loss": -5.4963483810424805, "global_step": 35893, "epoch": 854} {"train_loss": -5.5250396728515625, "global_step": 35894, "epoch": 854} {"train_loss": -5.444479465484619, "global_step": 35895, "epoch": 854} {"train_loss": -5.351787567138672, "global_step": 35896, "epoch": 854} {"train_loss": -5.511676788330078, "global_step": 35897, "epoch": 854} {"train_loss": -5.505977630615234, "global_step": 35898, "epoch": 854} {"train_loss": -5.516520023345947, "global_step": 35899, "epoch": 854} {"train_loss": -5.58034610748291, "global_step": 35900, "epoch": 854} {"train_loss": -5.512751579284668, "global_step": 35901, "epoch": 854} {"train_loss": -5.679385185241699, "global_step": 35902, "epoch": 854} {"train_loss": -5.373859405517578, "global_step": 35903, "epoch": 854} {"train_loss": -5.544137001037598, "global_step": 35904, "epoch": 854} {"train_loss": -5.4123334884643555, "global_step": 35905, "epoch": 854} {"train_loss": -5.600417613983154, "global_step": 35906, "epoch": 854} {"train_loss": -5.49268102645874, "global_step": 35907, "epoch": 854} {"train_loss": -5.516587734222412, "global_step": 35908, "epoch": 854} {"train_loss": -5.5300437495822, "global_step": 35909, "epoch": 854, "val_loss": 66389.3515625} {"train_loss": -5.439031600952148, "global_step": 35910, "epoch": 855} {"train_loss": -5.589856147766113, "global_step": 35911, "epoch": 855} {"train_loss": -5.541329383850098, "global_step": 35912, "epoch": 855} {"train_loss": -5.556956768035889, "global_step": 35913, "epoch": 855} {"train_loss": -5.524771690368652, "global_step": 35914, "epoch": 855} {"train_loss": -5.709381103515625, "global_step": 35915, "epoch": 855} {"train_loss": -5.674271583557129, "global_step": 35916, "epoch": 855} {"train_loss": -5.534742832183838, "global_step": 35917, "epoch": 855} {"train_loss": -5.561499118804932, "global_step": 35918, "epoch": 855} {"train_loss": -5.489076614379883, "global_step": 35919, "epoch": 855} {"train_loss": -5.491606712341309, "global_step": 35920, "epoch": 855} {"train_loss": -5.620972156524658, "global_step": 35921, "epoch": 855} {"train_loss": -5.614154815673828, "global_step": 35922, "epoch": 855} {"train_loss": -5.564629554748535, "global_step": 35923, "epoch": 855} {"train_loss": -5.543028831481934, "global_step": 35924, "epoch": 855} {"train_loss": -5.437924385070801, "global_step": 35925, "epoch": 855} {"train_loss": -5.6479692459106445, "global_step": 35926, "epoch": 855} {"train_loss": -5.556780815124512, "global_step": 35927, "epoch": 855} {"train_loss": -5.706718921661377, "global_step": 35928, "epoch": 855} {"train_loss": -5.5532989501953125, "global_step": 35929, "epoch": 855} {"train_loss": -5.554485321044922, "global_step": 35930, "epoch": 855} {"train_loss": -5.590975761413574, "global_step": 35931, "epoch": 855} {"train_loss": -5.529323577880859, "global_step": 35932, "epoch": 855} {"train_loss": -5.6340436935424805, "global_step": 35933, "epoch": 855} {"train_loss": -5.429780960083008, "global_step": 35934, "epoch": 855} {"train_loss": -5.514426231384277, "global_step": 35935, "epoch": 855} {"train_loss": -5.571567058563232, "global_step": 35936, "epoch": 855} {"train_loss": -5.604034423828125, "global_step": 35937, "epoch": 855} {"train_loss": -5.428396701812744, "global_step": 35938, "epoch": 855} {"train_loss": -5.614527225494385, "global_step": 35939, "epoch": 855} {"train_loss": -5.539502143859863, "global_step": 35940, "epoch": 855} {"train_loss": -5.596968650817871, "global_step": 35941, "epoch": 855} {"train_loss": -5.4782609939575195, "global_step": 35942, "epoch": 855} {"train_loss": -5.580569744110107, "global_step": 35943, "epoch": 855} {"train_loss": -5.556933403015137, "global_step": 35944, "epoch": 855} {"train_loss": -5.5577712059021, "global_step": 35945, "epoch": 855} {"train_loss": -5.480479717254639, "global_step": 35946, "epoch": 855} {"train_loss": -5.570357322692871, "global_step": 35947, "epoch": 855} {"train_loss": -5.491540908813477, "global_step": 35948, "epoch": 855} {"train_loss": -5.580703258514404, "global_step": 35949, "epoch": 855} {"train_loss": -5.575883865356445, "global_step": 35950, "epoch": 855} {"train_loss": -5.557487567265828, "global_step": 35951, "epoch": 855, "val_loss": 66097.515625} {"train_loss": -5.592243194580078, "global_step": 35952, "epoch": 856} {"train_loss": -5.386136054992676, "global_step": 35953, "epoch": 856} {"train_loss": -5.555418014526367, "global_step": 35954, "epoch": 856} {"train_loss": -5.682116985321045, "global_step": 35955, "epoch": 856} {"train_loss": -5.425437927246094, "global_step": 35956, "epoch": 856} {"train_loss": -5.545072555541992, "global_step": 35957, "epoch": 856} {"train_loss": -5.4882426261901855, "global_step": 35958, "epoch": 856} {"train_loss": -5.546520233154297, "global_step": 35959, "epoch": 856} {"train_loss": -5.68296480178833, "global_step": 35960, "epoch": 856} {"train_loss": -5.588273048400879, "global_step": 35961, "epoch": 856} {"train_loss": -5.676794052124023, "global_step": 35962, "epoch": 856} {"train_loss": -5.530174255371094, "global_step": 35963, "epoch": 856} {"train_loss": -5.712858200073242, "global_step": 35964, "epoch": 856} {"train_loss": -5.630613327026367, "global_step": 35965, "epoch": 856} {"train_loss": -5.51908016204834, "global_step": 35966, "epoch": 856} {"train_loss": -5.590770721435547, "global_step": 35967, "epoch": 856} {"train_loss": -5.559791564941406, "global_step": 35968, "epoch": 856} {"train_loss": -5.567038536071777, "global_step": 35969, "epoch": 856} {"train_loss": -5.42073392868042, "global_step": 35970, "epoch": 856} {"train_loss": -5.577312469482422, "global_step": 35971, "epoch": 856} {"train_loss": -5.556302070617676, "global_step": 35972, "epoch": 856} {"train_loss": -5.4264349937438965, "global_step": 35973, "epoch": 856} {"train_loss": -5.5957112312316895, "global_step": 35974, "epoch": 856} {"train_loss": -5.5535454750061035, "global_step": 35975, "epoch": 856} {"train_loss": -5.636317253112793, "global_step": 35976, "epoch": 856} {"train_loss": -5.675331115722656, "global_step": 35977, "epoch": 856} {"train_loss": -5.540966987609863, "global_step": 35978, "epoch": 856} {"train_loss": -5.689447402954102, "global_step": 35979, "epoch": 856} {"train_loss": -5.5910115242004395, "global_step": 35980, "epoch": 856} {"train_loss": -5.605445861816406, "global_step": 35981, "epoch": 856} {"train_loss": -5.792844772338867, "global_step": 35982, "epoch": 856} {"train_loss": -5.514294624328613, "global_step": 35983, "epoch": 856} {"train_loss": -5.640733242034912, "global_step": 35984, "epoch": 856} {"train_loss": -5.548618316650391, "global_step": 35985, "epoch": 856} {"train_loss": -5.503237724304199, "global_step": 35986, "epoch": 856} {"train_loss": -5.55515193939209, "global_step": 35987, "epoch": 856} {"train_loss": -5.558772087097168, "global_step": 35988, "epoch": 856} {"train_loss": -5.420558929443359, "global_step": 35989, "epoch": 856} {"train_loss": -5.510679721832275, "global_step": 35990, "epoch": 856} {"train_loss": -5.438934326171875, "global_step": 35991, "epoch": 856} {"train_loss": -5.623775482177734, "global_step": 35992, "epoch": 856} {"train_loss": -5.563310169038319, "global_step": 35993, "epoch": 856, "val_loss": 66256.859375} {"train_loss": -5.548610687255859, "global_step": 35994, "epoch": 857} {"train_loss": -5.539130687713623, "global_step": 35995, "epoch": 857} {"train_loss": -5.535192012786865, "global_step": 35996, "epoch": 857} {"train_loss": -5.608262538909912, "global_step": 35997, "epoch": 857} {"train_loss": -5.5810346603393555, "global_step": 35998, "epoch": 857} {"train_loss": -5.539505958557129, "global_step": 35999, "epoch": 857} {"train_loss": -5.602695465087891, "global_step": 36000, "epoch": 857} {"train_loss": -5.647851943969727, "global_step": 36001, "epoch": 857} {"train_loss": -5.513025283813477, "global_step": 36002, "epoch": 857} {"train_loss": -5.561030387878418, "global_step": 36003, "epoch": 857} {"train_loss": -5.4862284660339355, "global_step": 36004, "epoch": 857} {"train_loss": -5.591588020324707, "global_step": 36005, "epoch": 857} {"train_loss": -5.615686416625977, "global_step": 36006, "epoch": 857} {"train_loss": -5.655706882476807, "global_step": 36007, "epoch": 857} {"train_loss": -5.693323135375977, "global_step": 36008, "epoch": 857} {"train_loss": -5.600177764892578, "global_step": 36009, "epoch": 857} {"train_loss": -5.584549903869629, "global_step": 36010, "epoch": 857} {"train_loss": -5.6849260330200195, "global_step": 36011, "epoch": 857} {"train_loss": -5.539149761199951, "global_step": 36012, "epoch": 857} {"train_loss": -5.641593933105469, "global_step": 36013, "epoch": 857} {"train_loss": -5.665103912353516, "global_step": 36014, "epoch": 857} {"train_loss": -5.577294826507568, "global_step": 36015, "epoch": 857} {"train_loss": -5.518832206726074, "global_step": 36016, "epoch": 857} {"train_loss": -5.462627410888672, "global_step": 36017, "epoch": 857} {"train_loss": -5.56897497177124, "global_step": 36018, "epoch": 857} {"train_loss": -5.72504997253418, "global_step": 36019, "epoch": 857} {"train_loss": -5.588798522949219, "global_step": 36020, "epoch": 857} {"train_loss": -5.398331165313721, "global_step": 36021, "epoch": 857} {"train_loss": -5.521640300750732, "global_step": 36022, "epoch": 857} {"train_loss": -5.490407943725586, "global_step": 36023, "epoch": 857} {"train_loss": -5.536711692810059, "global_step": 36024, "epoch": 857} {"train_loss": -5.485270023345947, "global_step": 36025, "epoch": 857} {"train_loss": -5.542430877685547, "global_step": 36026, "epoch": 857} {"train_loss": -5.4552741050720215, "global_step": 36027, "epoch": 857} {"train_loss": -5.550774574279785, "global_step": 36028, "epoch": 857} {"train_loss": -5.58740234375, "global_step": 36029, "epoch": 857} {"train_loss": -5.464334487915039, "global_step": 36030, "epoch": 857} {"train_loss": -5.524510383605957, "global_step": 36031, "epoch": 857} {"train_loss": -5.526660919189453, "global_step": 36032, "epoch": 857} {"train_loss": -5.598848819732666, "global_step": 36033, "epoch": 857} {"train_loss": -5.605560302734375, "global_step": 36034, "epoch": 857} {"train_loss": -5.563593512489682, "global_step": 36035, "epoch": 857, "val_loss": 66039.4375} {"train_loss": -5.551303863525391, "global_step": 36036, "epoch": 858} {"train_loss": -5.441689491271973, "global_step": 36037, "epoch": 858} {"train_loss": -5.492907524108887, "global_step": 36038, "epoch": 858} {"train_loss": -5.542095184326172, "global_step": 36039, "epoch": 858} {"train_loss": -5.493159294128418, "global_step": 36040, "epoch": 858} {"train_loss": -5.6863603591918945, "global_step": 36041, "epoch": 858} {"train_loss": -5.474650859832764, "global_step": 36042, "epoch": 858} {"train_loss": -5.597235202789307, "global_step": 36043, "epoch": 858} {"train_loss": -5.674225807189941, "global_step": 36044, "epoch": 858} {"train_loss": -5.482783794403076, "global_step": 36045, "epoch": 858} {"train_loss": -5.596563339233398, "global_step": 36046, "epoch": 858} {"train_loss": -5.582101345062256, "global_step": 36047, "epoch": 858} {"train_loss": -5.519938945770264, "global_step": 36048, "epoch": 858} {"train_loss": -5.615558624267578, "global_step": 36049, "epoch": 858} {"train_loss": -5.52862548828125, "global_step": 36050, "epoch": 858} {"train_loss": -5.458386421203613, "global_step": 36051, "epoch": 858} {"train_loss": -5.4596452713012695, "global_step": 36052, "epoch": 858} {"train_loss": -5.485749244689941, "global_step": 36053, "epoch": 858} {"train_loss": -5.5292277336120605, "global_step": 36054, "epoch": 858} {"train_loss": -5.55714750289917, "global_step": 36055, "epoch": 858} {"train_loss": -5.4050612449646, "global_step": 36056, "epoch": 858} {"train_loss": -5.431542873382568, "global_step": 36057, "epoch": 858} {"train_loss": -5.487112998962402, "global_step": 36058, "epoch": 858} {"train_loss": -5.541806221008301, "global_step": 36059, "epoch": 858} {"train_loss": -5.623443603515625, "global_step": 36060, "epoch": 858} {"train_loss": -5.536775588989258, "global_step": 36061, "epoch": 858} {"train_loss": -5.536325454711914, "global_step": 36062, "epoch": 858} {"train_loss": -5.477088928222656, "global_step": 36063, "epoch": 858} {"train_loss": -5.492090225219727, "global_step": 36064, "epoch": 858} {"train_loss": -5.4944658279418945, "global_step": 36065, "epoch": 858} {"train_loss": -5.520508289337158, "global_step": 36066, "epoch": 858} {"train_loss": -5.559613227844238, "global_step": 36067, "epoch": 858} {"train_loss": -5.558522701263428, "global_step": 36068, "epoch": 858} {"train_loss": -5.585515975952148, "global_step": 36069, "epoch": 858} {"train_loss": -5.526684284210205, "global_step": 36070, "epoch": 858} {"train_loss": -5.525171279907227, "global_step": 36071, "epoch": 858} {"train_loss": -5.608762264251709, "global_step": 36072, "epoch": 858} {"train_loss": -5.547802448272705, "global_step": 36073, "epoch": 858} {"train_loss": -5.491825103759766, "global_step": 36074, "epoch": 858} {"train_loss": -5.53170108795166, "global_step": 36075, "epoch": 858} {"train_loss": -5.428071022033691, "global_step": 36076, "epoch": 858} {"train_loss": -5.528892142432077, "global_step": 36077, "epoch": 858, "val_loss": 65960.03125} {"train_loss": -5.395414352416992, "global_step": 36078, "epoch": 859} {"train_loss": -5.450135231018066, "global_step": 36079, "epoch": 859} {"train_loss": -5.590455055236816, "global_step": 36080, "epoch": 859} {"train_loss": -5.6068949699401855, "global_step": 36081, "epoch": 859} {"train_loss": -5.455289363861084, "global_step": 36082, "epoch": 859} {"train_loss": -5.586015701293945, "global_step": 36083, "epoch": 859} {"train_loss": -5.56627893447876, "global_step": 36084, "epoch": 859} {"train_loss": -5.645951747894287, "global_step": 36085, "epoch": 859} {"train_loss": -5.574457168579102, "global_step": 36086, "epoch": 859} {"train_loss": -5.449317455291748, "global_step": 36087, "epoch": 859} {"train_loss": -5.624171257019043, "global_step": 36088, "epoch": 859} {"train_loss": -5.560080051422119, "global_step": 36089, "epoch": 859} {"train_loss": -5.547982215881348, "global_step": 36090, "epoch": 859} {"train_loss": -5.537650108337402, "global_step": 36091, "epoch": 859} {"train_loss": -5.664668083190918, "global_step": 36092, "epoch": 859} {"train_loss": -5.486795425415039, "global_step": 36093, "epoch": 859} {"train_loss": -5.676115989685059, "global_step": 36094, "epoch": 859} {"train_loss": -5.561642646789551, "global_step": 36095, "epoch": 859} {"train_loss": -5.60897970199585, "global_step": 36096, "epoch": 859} {"train_loss": -5.575767517089844, "global_step": 36097, "epoch": 859} {"train_loss": -5.5755615234375, "global_step": 36098, "epoch": 859} {"train_loss": -5.542695045471191, "global_step": 36099, "epoch": 859} {"train_loss": -5.579492092132568, "global_step": 36100, "epoch": 859} {"train_loss": -5.568094253540039, "global_step": 36101, "epoch": 859} {"train_loss": -5.713982582092285, "global_step": 36102, "epoch": 859} {"train_loss": -5.582952499389648, "global_step": 36103, "epoch": 859} {"train_loss": -5.529851913452148, "global_step": 36104, "epoch": 859} {"train_loss": -5.533990859985352, "global_step": 36105, "epoch": 859} {"train_loss": -5.531400680541992, "global_step": 36106, "epoch": 859} {"train_loss": -5.475761890411377, "global_step": 36107, "epoch": 859} {"train_loss": -5.468430519104004, "global_step": 36108, "epoch": 859} {"train_loss": -5.58735990524292, "global_step": 36109, "epoch": 859} {"train_loss": -5.544532775878906, "global_step": 36110, "epoch": 859} {"train_loss": -5.468757629394531, "global_step": 36111, "epoch": 859} {"train_loss": -5.760543346405029, "global_step": 36112, "epoch": 859} {"train_loss": -5.512584209442139, "global_step": 36113, "epoch": 859} {"train_loss": -5.572830677032471, "global_step": 36114, "epoch": 859} {"train_loss": -5.597841262817383, "global_step": 36115, "epoch": 859} {"train_loss": -5.568513870239258, "global_step": 36116, "epoch": 859} {"train_loss": -5.710166931152344, "global_step": 36117, "epoch": 859} {"train_loss": -5.636116027832031, "global_step": 36118, "epoch": 859} {"train_loss": -5.565869501658848, "global_step": 36119, "epoch": 859, "val_loss": 66216.8125} {"train_loss": -5.492867469787598, "global_step": 36120, "epoch": 860} {"train_loss": -5.5503010749816895, "global_step": 36121, "epoch": 860} {"train_loss": -5.648017883300781, "global_step": 36122, "epoch": 860} {"train_loss": -5.593583106994629, "global_step": 36123, "epoch": 860} {"train_loss": -5.4763641357421875, "global_step": 36124, "epoch": 860} {"train_loss": -5.548022747039795, "global_step": 36125, "epoch": 860} {"train_loss": -5.6268229484558105, "global_step": 36126, "epoch": 860} {"train_loss": -5.615927696228027, "global_step": 36127, "epoch": 860} {"train_loss": -5.5103254318237305, "global_step": 36128, "epoch": 860} {"train_loss": -5.644570350646973, "global_step": 36129, "epoch": 860} {"train_loss": -5.73948335647583, "global_step": 36130, "epoch": 860} {"train_loss": -5.6575398445129395, "global_step": 36131, "epoch": 860} {"train_loss": -5.615948677062988, "global_step": 36132, "epoch": 860} {"train_loss": -5.467087745666504, "global_step": 36133, "epoch": 860} {"train_loss": -5.509872913360596, "global_step": 36134, "epoch": 860} {"train_loss": -5.647818088531494, "global_step": 36135, "epoch": 860} {"train_loss": -5.6391777992248535, "global_step": 36136, "epoch": 860} {"train_loss": -5.638840675354004, "global_step": 36137, "epoch": 860} {"train_loss": -5.473690509796143, "global_step": 36138, "epoch": 860} {"train_loss": -5.6238179206848145, "global_step": 36139, "epoch": 860} {"train_loss": -5.570087909698486, "global_step": 36140, "epoch": 860} {"train_loss": -5.457455158233643, "global_step": 36141, "epoch": 860} {"train_loss": -5.663219451904297, "global_step": 36142, "epoch": 860} {"train_loss": -5.564512729644775, "global_step": 36143, "epoch": 860} {"train_loss": -5.642129898071289, "global_step": 36144, "epoch": 860} {"train_loss": -5.717220306396484, "global_step": 36145, "epoch": 860} {"train_loss": -5.516635894775391, "global_step": 36146, "epoch": 860} {"train_loss": -5.478542804718018, "global_step": 36147, "epoch": 860} {"train_loss": -5.649164199829102, "global_step": 36148, "epoch": 860} {"train_loss": -5.548285484313965, "global_step": 36149, "epoch": 860} {"train_loss": -5.635923385620117, "global_step": 36150, "epoch": 860} {"train_loss": -5.501242637634277, "global_step": 36151, "epoch": 860} {"train_loss": -5.4931745529174805, "global_step": 36152, "epoch": 860} {"train_loss": -5.48259162902832, "global_step": 36153, "epoch": 860} {"train_loss": -5.619463920593262, "global_step": 36154, "epoch": 860} {"train_loss": -5.592644691467285, "global_step": 36155, "epoch": 860} {"train_loss": -5.676326274871826, "global_step": 36156, "epoch": 860} {"train_loss": -5.567255020141602, "global_step": 36157, "epoch": 860} {"train_loss": -5.683507919311523, "global_step": 36158, "epoch": 860} {"train_loss": -5.536106586456299, "global_step": 36159, "epoch": 860} {"train_loss": -5.551969051361084, "global_step": 36160, "epoch": 860} {"train_loss": -5.579481420062837, "global_step": 36161, "epoch": 860, "val_loss": 66307.8359375} {"train_loss": -5.555927753448486, "global_step": 36162, "epoch": 861} {"train_loss": -5.539350986480713, "global_step": 36163, "epoch": 861} {"train_loss": -5.583370685577393, "global_step": 36164, "epoch": 861} {"train_loss": -5.389830589294434, "global_step": 36165, "epoch": 861} {"train_loss": -5.577966690063477, "global_step": 36166, "epoch": 861} {"train_loss": -5.489027976989746, "global_step": 36167, "epoch": 861} {"train_loss": -5.67189884185791, "global_step": 36168, "epoch": 861} {"train_loss": -5.613002300262451, "global_step": 36169, "epoch": 861} {"train_loss": -5.475605010986328, "global_step": 36170, "epoch": 861} {"train_loss": -5.676382541656494, "global_step": 36171, "epoch": 861} {"train_loss": -5.576045989990234, "global_step": 36172, "epoch": 861} {"train_loss": -5.556777000427246, "global_step": 36173, "epoch": 861} {"train_loss": -5.464341163635254, "global_step": 36174, "epoch": 861} {"train_loss": -5.383526802062988, "global_step": 36175, "epoch": 861} {"train_loss": -5.564175128936768, "global_step": 36176, "epoch": 861} {"train_loss": -5.401754379272461, "global_step": 36177, "epoch": 861} {"train_loss": -5.581063270568848, "global_step": 36178, "epoch": 861} {"train_loss": -5.563002586364746, "global_step": 36179, "epoch": 861} {"train_loss": -5.50705623626709, "global_step": 36180, "epoch": 861} {"train_loss": -5.504021167755127, "global_step": 36181, "epoch": 861} {"train_loss": -5.3942790031433105, "global_step": 36182, "epoch": 861} {"train_loss": -5.489289283752441, "global_step": 36183, "epoch": 861} {"train_loss": -5.514695167541504, "global_step": 36184, "epoch": 861} {"train_loss": -5.500725746154785, "global_step": 36185, "epoch": 861} {"train_loss": -5.5481462478637695, "global_step": 36186, "epoch": 861} {"train_loss": -5.499587535858154, "global_step": 36187, "epoch": 861} {"train_loss": -5.615356922149658, "global_step": 36188, "epoch": 861} {"train_loss": -5.635218620300293, "global_step": 36189, "epoch": 861} {"train_loss": -5.521462440490723, "global_step": 36190, "epoch": 861} {"train_loss": -5.508896827697754, "global_step": 36191, "epoch": 861} {"train_loss": -5.594346523284912, "global_step": 36192, "epoch": 861} {"train_loss": -5.446168899536133, "global_step": 36193, "epoch": 861} {"train_loss": -5.768942832946777, "global_step": 36194, "epoch": 861} {"train_loss": -5.444507598876953, "global_step": 36195, "epoch": 861} {"train_loss": -5.7048749923706055, "global_step": 36196, "epoch": 861} {"train_loss": -5.447356224060059, "global_step": 36197, "epoch": 861} {"train_loss": -5.458967208862305, "global_step": 36198, "epoch": 861} {"train_loss": -5.4985222816467285, "global_step": 36199, "epoch": 861} {"train_loss": -5.698094367980957, "global_step": 36200, "epoch": 861} {"train_loss": -5.4696478843688965, "global_step": 36201, "epoch": 861} {"train_loss": -5.514245986938477, "global_step": 36202, "epoch": 861} {"train_loss": -5.533967653910319, "global_step": 36203, "epoch": 861, "val_loss": 66035.0} {"train_loss": -5.568011283874512, "global_step": 36204, "epoch": 862} {"train_loss": -5.553266525268555, "global_step": 36205, "epoch": 862} {"train_loss": -5.594039440155029, "global_step": 36206, "epoch": 862} {"train_loss": -5.517953395843506, "global_step": 36207, "epoch": 862} {"train_loss": -5.364462852478027, "global_step": 36208, "epoch": 862} {"train_loss": -5.555241584777832, "global_step": 36209, "epoch": 862} {"train_loss": -5.621020317077637, "global_step": 36210, "epoch": 862} {"train_loss": -5.587795734405518, "global_step": 36211, "epoch": 862} {"train_loss": -5.532113075256348, "global_step": 36212, "epoch": 862} {"train_loss": -5.707878112792969, "global_step": 36213, "epoch": 862} {"train_loss": -5.760384559631348, "global_step": 36214, "epoch": 862} {"train_loss": -5.576574325561523, "global_step": 36215, "epoch": 862} {"train_loss": -5.541647434234619, "global_step": 36216, "epoch": 862} {"train_loss": -5.501171112060547, "global_step": 36217, "epoch": 862} {"train_loss": -5.519025802612305, "global_step": 36218, "epoch": 862} {"train_loss": -5.477845668792725, "global_step": 36219, "epoch": 862} {"train_loss": -5.537512302398682, "global_step": 36220, "epoch": 862} {"train_loss": -5.717754364013672, "global_step": 36221, "epoch": 862} {"train_loss": -5.557727813720703, "global_step": 36222, "epoch": 862} {"train_loss": -5.603955268859863, "global_step": 36223, "epoch": 862} {"train_loss": -5.578178405761719, "global_step": 36224, "epoch": 862} {"train_loss": -5.663572311401367, "global_step": 36225, "epoch": 862} {"train_loss": -5.5875115394592285, "global_step": 36226, "epoch": 862} {"train_loss": -5.603100776672363, "global_step": 36227, "epoch": 862} {"train_loss": -5.498726844787598, "global_step": 36228, "epoch": 862} {"train_loss": -5.519574165344238, "global_step": 36229, "epoch": 862} {"train_loss": -5.642939567565918, "global_step": 36230, "epoch": 862} {"train_loss": -5.442403793334961, "global_step": 36231, "epoch": 862} {"train_loss": -5.485367774963379, "global_step": 36232, "epoch": 862} {"train_loss": -5.572142601013184, "global_step": 36233, "epoch": 862} {"train_loss": -5.542796611785889, "global_step": 36234, "epoch": 862} {"train_loss": -5.590554237365723, "global_step": 36235, "epoch": 862} {"train_loss": -5.614623546600342, "global_step": 36236, "epoch": 862} {"train_loss": -5.57309103012085, "global_step": 36237, "epoch": 862} {"train_loss": -5.582510471343994, "global_step": 36238, "epoch": 862} {"train_loss": -5.658007621765137, "global_step": 36239, "epoch": 862} {"train_loss": -5.522221565246582, "global_step": 36240, "epoch": 862} {"train_loss": -5.513165473937988, "global_step": 36241, "epoch": 862} {"train_loss": -5.462470054626465, "global_step": 36242, "epoch": 862} {"train_loss": -5.5878729820251465, "global_step": 36243, "epoch": 862} {"train_loss": -5.508979320526123, "global_step": 36244, "epoch": 862} {"train_loss": -5.56388657433646, "global_step": 36245, "epoch": 862, "val_loss": 66217.515625} {"train_loss": -5.750988960266113, "global_step": 36246, "epoch": 863} {"train_loss": -5.461291313171387, "global_step": 36247, "epoch": 863} {"train_loss": -5.657098770141602, "global_step": 36248, "epoch": 863} {"train_loss": -5.529351234436035, "global_step": 36249, "epoch": 863} {"train_loss": -5.513096809387207, "global_step": 36250, "epoch": 863} {"train_loss": -5.591683387756348, "global_step": 36251, "epoch": 863} {"train_loss": -5.438329219818115, "global_step": 36252, "epoch": 863} {"train_loss": -5.645506381988525, "global_step": 36253, "epoch": 863} {"train_loss": -5.5109543800354, "global_step": 36254, "epoch": 863} {"train_loss": -5.585536479949951, "global_step": 36255, "epoch": 863} {"train_loss": -5.551045894622803, "global_step": 36256, "epoch": 863} {"train_loss": -5.500114440917969, "global_step": 36257, "epoch": 863} {"train_loss": -5.493921279907227, "global_step": 36258, "epoch": 863} {"train_loss": -5.476743221282959, "global_step": 36259, "epoch": 863} {"train_loss": -5.392600059509277, "global_step": 36260, "epoch": 863} {"train_loss": -5.668862342834473, "global_step": 36261, "epoch": 863} {"train_loss": -5.539918899536133, "global_step": 36262, "epoch": 863} {"train_loss": -5.611042022705078, "global_step": 36263, "epoch": 863} {"train_loss": -5.518488883972168, "global_step": 36264, "epoch": 863} {"train_loss": -5.6446380615234375, "global_step": 36265, "epoch": 863} {"train_loss": -5.6753082275390625, "global_step": 36266, "epoch": 863} {"train_loss": -5.529719352722168, "global_step": 36267, "epoch": 863} {"train_loss": -5.456384181976318, "global_step": 36268, "epoch": 863} {"train_loss": -5.609760761260986, "global_step": 36269, "epoch": 863} {"train_loss": -5.462505340576172, "global_step": 36270, "epoch": 863} {"train_loss": -5.562614440917969, "global_step": 36271, "epoch": 863} {"train_loss": -5.416377544403076, "global_step": 36272, "epoch": 863} {"train_loss": -5.571969032287598, "global_step": 36273, "epoch": 863} {"train_loss": -5.616937637329102, "global_step": 36274, "epoch": 863} {"train_loss": -5.501205921173096, "global_step": 36275, "epoch": 863} {"train_loss": -5.643497467041016, "global_step": 36276, "epoch": 863} {"train_loss": -5.660093307495117, "global_step": 36277, "epoch": 863} {"train_loss": -5.549624443054199, "global_step": 36278, "epoch": 863} {"train_loss": -5.376674175262451, "global_step": 36279, "epoch": 863} {"train_loss": -5.419151306152344, "global_step": 36280, "epoch": 863} {"train_loss": -5.597057819366455, "global_step": 36281, "epoch": 863} {"train_loss": -5.682869911193848, "global_step": 36282, "epoch": 863} {"train_loss": -5.466368675231934, "global_step": 36283, "epoch": 863} {"train_loss": -5.518111228942871, "global_step": 36284, "epoch": 863} {"train_loss": -5.509111404418945, "global_step": 36285, "epoch": 863} {"train_loss": -5.575244903564453, "global_step": 36286, "epoch": 863} {"train_loss": -5.5501787548973445, "global_step": 36287, "epoch": 863, "val_loss": 66439.0546875} {"train_loss": -5.594252109527588, "global_step": 36288, "epoch": 864} {"train_loss": -5.540211200714111, "global_step": 36289, "epoch": 864} {"train_loss": -5.380309581756592, "global_step": 36290, "epoch": 864} {"train_loss": -5.513818740844727, "global_step": 36291, "epoch": 864} {"train_loss": -5.606226921081543, "global_step": 36292, "epoch": 864} {"train_loss": -5.600536346435547, "global_step": 36293, "epoch": 864} {"train_loss": -5.620297908782959, "global_step": 36294, "epoch": 864} {"train_loss": -5.531886100769043, "global_step": 36295, "epoch": 864} {"train_loss": -5.460320472717285, "global_step": 36296, "epoch": 864} {"train_loss": -5.51033878326416, "global_step": 36297, "epoch": 864} {"train_loss": -5.683981895446777, "global_step": 36298, "epoch": 864} {"train_loss": -5.607909202575684, "global_step": 36299, "epoch": 864} {"train_loss": -5.569343566894531, "global_step": 36300, "epoch": 864} {"train_loss": -5.604619026184082, "global_step": 36301, "epoch": 864} {"train_loss": -5.70684814453125, "global_step": 36302, "epoch": 864} {"train_loss": -5.547674179077148, "global_step": 36303, "epoch": 864} {"train_loss": -5.6586833000183105, "global_step": 36304, "epoch": 864} {"train_loss": -5.5791425704956055, "global_step": 36305, "epoch": 864} {"train_loss": -5.4936909675598145, "global_step": 36306, "epoch": 864} {"train_loss": -5.482038974761963, "global_step": 36307, "epoch": 864} {"train_loss": -5.648368835449219, "global_step": 36308, "epoch": 864} {"train_loss": -5.627781867980957, "global_step": 36309, "epoch": 864} {"train_loss": -5.565685272216797, "global_step": 36310, "epoch": 864} {"train_loss": -5.604640483856201, "global_step": 36311, "epoch": 864} {"train_loss": -5.581828594207764, "global_step": 36312, "epoch": 864} {"train_loss": -5.639468193054199, "global_step": 36313, "epoch": 864} {"train_loss": -5.632622718811035, "global_step": 36314, "epoch": 864} {"train_loss": -5.575098037719727, "global_step": 36315, "epoch": 864} {"train_loss": -5.515331268310547, "global_step": 36316, "epoch": 864} {"train_loss": -5.667902946472168, "global_step": 36317, "epoch": 864} {"train_loss": -5.606834888458252, "global_step": 36318, "epoch": 864} {"train_loss": -5.62968111038208, "global_step": 36319, "epoch": 864} {"train_loss": -5.6830153465271, "global_step": 36320, "epoch": 864} {"train_loss": -5.541870594024658, "global_step": 36321, "epoch": 864} {"train_loss": -5.639030456542969, "global_step": 36322, "epoch": 864} {"train_loss": -5.482768535614014, "global_step": 36323, "epoch": 864} {"train_loss": -5.649575233459473, "global_step": 36324, "epoch": 864} {"train_loss": -5.49611234664917, "global_step": 36325, "epoch": 864} {"train_loss": -5.640651702880859, "global_step": 36326, "epoch": 864} {"train_loss": -5.58909273147583, "global_step": 36327, "epoch": 864} {"train_loss": -5.504751205444336, "global_step": 36328, "epoch": 864} {"train_loss": -5.5781222979227705, "global_step": 36329, "epoch": 864, "val_loss": 66284.609375} {"train_loss": -5.585627555847168, "global_step": 36330, "epoch": 865} {"train_loss": -5.666195869445801, "global_step": 36331, "epoch": 865} {"train_loss": -5.484687805175781, "global_step": 36332, "epoch": 865} {"train_loss": -5.721090316772461, "global_step": 36333, "epoch": 865} {"train_loss": -5.413325309753418, "global_step": 36334, "epoch": 865} {"train_loss": -5.521857261657715, "global_step": 36335, "epoch": 865} {"train_loss": -5.545792579650879, "global_step": 36336, "epoch": 865} {"train_loss": -5.63829231262207, "global_step": 36337, "epoch": 865} {"train_loss": -5.344144821166992, "global_step": 36338, "epoch": 865} {"train_loss": -5.4045610427856445, "global_step": 36339, "epoch": 865} {"train_loss": -5.5794548988342285, "global_step": 36340, "epoch": 865} {"train_loss": -5.5092267990112305, "global_step": 36341, "epoch": 865} {"train_loss": -5.545055866241455, "global_step": 36342, "epoch": 865} {"train_loss": -5.653270721435547, "global_step": 36343, "epoch": 865} {"train_loss": -5.653148174285889, "global_step": 36344, "epoch": 865} {"train_loss": -5.463233470916748, "global_step": 36345, "epoch": 865} {"train_loss": -5.557277679443359, "global_step": 36346, "epoch": 865} {"train_loss": -5.499429702758789, "global_step": 36347, "epoch": 865} {"train_loss": -5.471062183380127, "global_step": 36348, "epoch": 865} {"train_loss": -5.486065864562988, "global_step": 36349, "epoch": 865} {"train_loss": -5.5333476066589355, "global_step": 36350, "epoch": 865} {"train_loss": -5.65524959564209, "global_step": 36351, "epoch": 865} {"train_loss": -5.449944019317627, "global_step": 36352, "epoch": 865} {"train_loss": -5.499161243438721, "global_step": 36353, "epoch": 865} {"train_loss": -5.545084476470947, "global_step": 36354, "epoch": 865} {"train_loss": -5.458827972412109, "global_step": 36355, "epoch": 865} {"train_loss": -5.533522605895996, "global_step": 36356, "epoch": 865} {"train_loss": -5.522507190704346, "global_step": 36357, "epoch": 865} {"train_loss": -5.486220359802246, "global_step": 36358, "epoch": 865} {"train_loss": -5.473094463348389, "global_step": 36359, "epoch": 865} {"train_loss": -5.55587100982666, "global_step": 36360, "epoch": 865} {"train_loss": -5.4601149559021, "global_step": 36361, "epoch": 865} {"train_loss": -5.636679649353027, "global_step": 36362, "epoch": 865} {"train_loss": -5.543851852416992, "global_step": 36363, "epoch": 865} {"train_loss": -5.599719524383545, "global_step": 36364, "epoch": 865} {"train_loss": -5.558642387390137, "global_step": 36365, "epoch": 865} {"train_loss": -5.509513854980469, "global_step": 36366, "epoch": 865} {"train_loss": -5.625256538391113, "global_step": 36367, "epoch": 865} {"train_loss": -5.7182936668396, "global_step": 36368, "epoch": 865} {"train_loss": -5.389527320861816, "global_step": 36369, "epoch": 865} {"train_loss": -5.529007911682129, "global_step": 36370, "epoch": 865} {"train_loss": -5.537914798373268, "global_step": 36371, "epoch": 865, "val_loss": 66186.6875} {"train_loss": -5.524904251098633, "global_step": 36372, "epoch": 866} {"train_loss": -5.550224304199219, "global_step": 36373, "epoch": 866} {"train_loss": -5.6485185623168945, "global_step": 36374, "epoch": 866} {"train_loss": -5.633849143981934, "global_step": 36375, "epoch": 866} {"train_loss": -5.658875942230225, "global_step": 36376, "epoch": 866} {"train_loss": -5.622797966003418, "global_step": 36377, "epoch": 866} {"train_loss": -5.45533561706543, "global_step": 36378, "epoch": 866} {"train_loss": -5.612375259399414, "global_step": 36379, "epoch": 866} {"train_loss": -5.56438684463501, "global_step": 36380, "epoch": 866} {"train_loss": -5.545607566833496, "global_step": 36381, "epoch": 866} {"train_loss": -5.575322151184082, "global_step": 36382, "epoch": 866} {"train_loss": -5.5902814865112305, "global_step": 36383, "epoch": 866} {"train_loss": -5.612209320068359, "global_step": 36384, "epoch": 866} {"train_loss": -5.671246528625488, "global_step": 36385, "epoch": 866} {"train_loss": -5.604885101318359, "global_step": 36386, "epoch": 866} {"train_loss": -5.480619430541992, "global_step": 36387, "epoch": 866} {"train_loss": -5.682332515716553, "global_step": 36388, "epoch": 866} {"train_loss": -5.4732794761657715, "global_step": 36389, "epoch": 866} {"train_loss": -5.458847522735596, "global_step": 36390, "epoch": 866} {"train_loss": -5.591707706451416, "global_step": 36391, "epoch": 866} {"train_loss": -5.539577484130859, "global_step": 36392, "epoch": 866} {"train_loss": -5.646988868713379, "global_step": 36393, "epoch": 866} {"train_loss": -5.483743190765381, "global_step": 36394, "epoch": 866} {"train_loss": -5.521985054016113, "global_step": 36395, "epoch": 866} {"train_loss": -5.626775741577148, "global_step": 36396, "epoch": 866} {"train_loss": -5.617727279663086, "global_step": 36397, "epoch": 866} {"train_loss": -5.5642900466918945, "global_step": 36398, "epoch": 866} {"train_loss": -5.552098274230957, "global_step": 36399, "epoch": 866} {"train_loss": -5.516292095184326, "global_step": 36400, "epoch": 866} {"train_loss": -5.616813659667969, "global_step": 36401, "epoch": 866} {"train_loss": -5.456186771392822, "global_step": 36402, "epoch": 866} {"train_loss": -5.475014686584473, "global_step": 36403, "epoch": 866} {"train_loss": -5.639891624450684, "global_step": 36404, "epoch": 866} {"train_loss": -5.508654594421387, "global_step": 36405, "epoch": 866} {"train_loss": -5.547368049621582, "global_step": 36406, "epoch": 866} {"train_loss": -5.64286994934082, "global_step": 36407, "epoch": 866} {"train_loss": -5.484925270080566, "global_step": 36408, "epoch": 866} {"train_loss": -5.705798625946045, "global_step": 36409, "epoch": 866} {"train_loss": -5.6115570068359375, "global_step": 36410, "epoch": 866} {"train_loss": -5.520216464996338, "global_step": 36411, "epoch": 866} {"train_loss": -5.5351409912109375, "global_step": 36412, "epoch": 866} {"train_loss": -5.572106009437924, "global_step": 36413, "epoch": 866, "val_loss": 66374.5} {"train_loss": -5.429591178894043, "global_step": 36414, "epoch": 867} {"train_loss": -5.665310382843018, "global_step": 36415, "epoch": 867} {"train_loss": -5.683286666870117, "global_step": 36416, "epoch": 867} {"train_loss": -5.4982147216796875, "global_step": 36417, "epoch": 867} {"train_loss": -5.705992698669434, "global_step": 36418, "epoch": 867} {"train_loss": -5.721867084503174, "global_step": 36419, "epoch": 867} {"train_loss": -5.575326919555664, "global_step": 36420, "epoch": 867} {"train_loss": -5.619235992431641, "global_step": 36421, "epoch": 867} {"train_loss": -5.541906356811523, "global_step": 36422, "epoch": 867} {"train_loss": -5.5666704177856445, "global_step": 36423, "epoch": 867} {"train_loss": -5.4972124099731445, "global_step": 36424, "epoch": 867} {"train_loss": -5.562155723571777, "global_step": 36425, "epoch": 867} {"train_loss": -5.711519718170166, "global_step": 36426, "epoch": 867} {"train_loss": -5.465564727783203, "global_step": 36427, "epoch": 867} {"train_loss": -5.65013313293457, "global_step": 36428, "epoch": 867} {"train_loss": -5.646889686584473, "global_step": 36429, "epoch": 867} {"train_loss": -5.390677452087402, "global_step": 36430, "epoch": 867} {"train_loss": -5.554190158843994, "global_step": 36431, "epoch": 867} {"train_loss": -5.293227195739746, "global_step": 36432, "epoch": 867} {"train_loss": -5.577507495880127, "global_step": 36433, "epoch": 867} {"train_loss": -5.458070278167725, "global_step": 36434, "epoch": 867} {"train_loss": -5.36400842666626, "global_step": 36435, "epoch": 867} {"train_loss": -5.462807655334473, "global_step": 36436, "epoch": 867} {"train_loss": -5.332087516784668, "global_step": 36437, "epoch": 867} {"train_loss": -5.4751877784729, "global_step": 36438, "epoch": 867} {"train_loss": -5.473299980163574, "global_step": 36439, "epoch": 867} {"train_loss": -5.663814544677734, "global_step": 36440, "epoch": 867} {"train_loss": -5.516261577606201, "global_step": 36441, "epoch": 867} {"train_loss": -5.5399861335754395, "global_step": 36442, "epoch": 867} {"train_loss": -5.574016571044922, "global_step": 36443, "epoch": 867} {"train_loss": -5.574136734008789, "global_step": 36444, "epoch": 867} {"train_loss": -5.589474678039551, "global_step": 36445, "epoch": 867} {"train_loss": -5.622745513916016, "global_step": 36446, "epoch": 867} {"train_loss": -5.633829116821289, "global_step": 36447, "epoch": 867} {"train_loss": -5.591669082641602, "global_step": 36448, "epoch": 867} {"train_loss": -5.432112216949463, "global_step": 36449, "epoch": 867} {"train_loss": -5.602517127990723, "global_step": 36450, "epoch": 867} {"train_loss": -5.632585525512695, "global_step": 36451, "epoch": 867} {"train_loss": -5.576642990112305, "global_step": 36452, "epoch": 867} {"train_loss": -5.57048225402832, "global_step": 36453, "epoch": 867} {"train_loss": -5.524969100952148, "global_step": 36454, "epoch": 867} {"train_loss": -5.551965055011568, "global_step": 36455, "epoch": 867, "val_loss": 66144.4140625} {"train_loss": -5.693271636962891, "global_step": 36456, "epoch": 868} {"train_loss": -5.641093730926514, "global_step": 36457, "epoch": 868} {"train_loss": -5.622901916503906, "global_step": 36458, "epoch": 868} {"train_loss": -5.574275493621826, "global_step": 36459, "epoch": 868} {"train_loss": -5.445485591888428, "global_step": 36460, "epoch": 868} {"train_loss": -5.579181671142578, "global_step": 36461, "epoch": 868} {"train_loss": -5.487621784210205, "global_step": 36462, "epoch": 868} {"train_loss": -5.545703887939453, "global_step": 36463, "epoch": 868} {"train_loss": -5.644030570983887, "global_step": 36464, "epoch": 868} {"train_loss": -5.636120319366455, "global_step": 36465, "epoch": 868} {"train_loss": -5.393083572387695, "global_step": 36466, "epoch": 868} {"train_loss": -5.619449138641357, "global_step": 36467, "epoch": 868} {"train_loss": -5.532854080200195, "global_step": 36468, "epoch": 868} {"train_loss": -5.574529647827148, "global_step": 36469, "epoch": 868} {"train_loss": -5.467441558837891, "global_step": 36470, "epoch": 868} {"train_loss": -5.557981014251709, "global_step": 36471, "epoch": 868} {"train_loss": -5.629938125610352, "global_step": 36472, "epoch": 868} {"train_loss": -5.6782636642456055, "global_step": 36473, "epoch": 868} {"train_loss": -5.525382995605469, "global_step": 36474, "epoch": 868} {"train_loss": -5.645784378051758, "global_step": 36475, "epoch": 868} {"train_loss": -5.449498653411865, "global_step": 36476, "epoch": 868} {"train_loss": -5.475887298583984, "global_step": 36477, "epoch": 868} {"train_loss": -5.5482330322265625, "global_step": 36478, "epoch": 868} {"train_loss": -5.6105475425720215, "global_step": 36479, "epoch": 868} {"train_loss": -5.542931079864502, "global_step": 36480, "epoch": 868} {"train_loss": -5.616429328918457, "global_step": 36481, "epoch": 868} {"train_loss": -5.652162551879883, "global_step": 36482, "epoch": 868} {"train_loss": -5.655944347381592, "global_step": 36483, "epoch": 868} {"train_loss": -5.485942840576172, "global_step": 36484, "epoch": 868} {"train_loss": -5.493244171142578, "global_step": 36485, "epoch": 868} {"train_loss": -5.674816131591797, "global_step": 36486, "epoch": 868} {"train_loss": -5.5942583084106445, "global_step": 36487, "epoch": 868} {"train_loss": -5.561963081359863, "global_step": 36488, "epoch": 868} {"train_loss": -5.6478681564331055, "global_step": 36489, "epoch": 868} {"train_loss": -5.589999675750732, "global_step": 36490, "epoch": 868} {"train_loss": -5.667104244232178, "global_step": 36491, "epoch": 868} {"train_loss": -5.453768730163574, "global_step": 36492, "epoch": 868} {"train_loss": -5.510303497314453, "global_step": 36493, "epoch": 868} {"train_loss": -5.543868541717529, "global_step": 36494, "epoch": 868} {"train_loss": -5.536737442016602, "global_step": 36495, "epoch": 868} {"train_loss": -5.4845194816589355, "global_step": 36496, "epoch": 868} {"train_loss": -5.567221618833996, "global_step": 36497, "epoch": 868, "val_loss": 66677.796875} {"train_loss": -5.502987861633301, "global_step": 36498, "epoch": 869} {"train_loss": -5.603841304779053, "global_step": 36499, "epoch": 869} {"train_loss": -5.545722007751465, "global_step": 36500, "epoch": 869} {"train_loss": -5.552646160125732, "global_step": 36501, "epoch": 869} {"train_loss": -5.544370651245117, "global_step": 36502, "epoch": 869} {"train_loss": -5.540286064147949, "global_step": 36503, "epoch": 869} {"train_loss": -5.541304111480713, "global_step": 36504, "epoch": 869} {"train_loss": -5.469053268432617, "global_step": 36505, "epoch": 869} {"train_loss": -5.556050777435303, "global_step": 36506, "epoch": 869} {"train_loss": -5.578988075256348, "global_step": 36507, "epoch": 869} {"train_loss": -5.539909839630127, "global_step": 36508, "epoch": 869} {"train_loss": -5.625982284545898, "global_step": 36509, "epoch": 869} {"train_loss": -5.560731887817383, "global_step": 36510, "epoch": 869} {"train_loss": -5.674643516540527, "global_step": 36511, "epoch": 869} {"train_loss": -5.550952434539795, "global_step": 36512, "epoch": 869} {"train_loss": -5.576367378234863, "global_step": 36513, "epoch": 869} {"train_loss": -5.625250816345215, "global_step": 36514, "epoch": 869} {"train_loss": -5.58000373840332, "global_step": 36515, "epoch": 869} {"train_loss": -5.583264350891113, "global_step": 36516, "epoch": 869} {"train_loss": -5.733865737915039, "global_step": 36517, "epoch": 869} {"train_loss": -5.525554656982422, "global_step": 36518, "epoch": 869} {"train_loss": -5.634167671203613, "global_step": 36519, "epoch": 869} {"train_loss": -5.541342735290527, "global_step": 36520, "epoch": 869} {"train_loss": -5.593207359313965, "global_step": 36521, "epoch": 869} {"train_loss": -5.629140853881836, "global_step": 36522, "epoch": 869} {"train_loss": -5.534196853637695, "global_step": 36523, "epoch": 869} {"train_loss": -5.6122283935546875, "global_step": 36524, "epoch": 869} {"train_loss": -5.574813365936279, "global_step": 36525, "epoch": 869} {"train_loss": -5.608925819396973, "global_step": 36526, "epoch": 869} {"train_loss": -5.526096343994141, "global_step": 36527, "epoch": 869} {"train_loss": -5.653735637664795, "global_step": 36528, "epoch": 869} {"train_loss": -5.599620819091797, "global_step": 36529, "epoch": 869} {"train_loss": -5.577178001403809, "global_step": 36530, "epoch": 869} {"train_loss": -5.558054447174072, "global_step": 36531, "epoch": 869} {"train_loss": -5.598158836364746, "global_step": 36532, "epoch": 869} {"train_loss": -5.545847415924072, "global_step": 36533, "epoch": 869} {"train_loss": -5.38572359085083, "global_step": 36534, "epoch": 869} {"train_loss": -5.506099700927734, "global_step": 36535, "epoch": 869} {"train_loss": -5.489500522613525, "global_step": 36536, "epoch": 869} {"train_loss": -5.500807762145996, "global_step": 36537, "epoch": 869} {"train_loss": -5.526522159576416, "global_step": 36538, "epoch": 869} {"train_loss": -5.562126852217174, "global_step": 36539, "epoch": 869, "val_loss": 65828.46875} {"train_loss": -5.631432056427002, "global_step": 36540, "epoch": 870} {"train_loss": -5.5135321617126465, "global_step": 36541, "epoch": 870} {"train_loss": -5.732036113739014, "global_step": 36542, "epoch": 870} {"train_loss": -5.613948822021484, "global_step": 36543, "epoch": 870} {"train_loss": -5.5403289794921875, "global_step": 36544, "epoch": 870} {"train_loss": -5.5790114402771, "global_step": 36545, "epoch": 870} {"train_loss": -5.637322425842285, "global_step": 36546, "epoch": 870} {"train_loss": -5.510112762451172, "global_step": 36547, "epoch": 870} {"train_loss": -5.578483581542969, "global_step": 36548, "epoch": 870} {"train_loss": -5.45323371887207, "global_step": 36549, "epoch": 870} {"train_loss": -5.426105499267578, "global_step": 36550, "epoch": 870} {"train_loss": -5.65476655960083, "global_step": 36551, "epoch": 870} {"train_loss": -5.5053324699401855, "global_step": 36552, "epoch": 870} {"train_loss": -5.605701923370361, "global_step": 36553, "epoch": 870} {"train_loss": -5.627949237823486, "global_step": 36554, "epoch": 870} {"train_loss": -5.498964309692383, "global_step": 36555, "epoch": 870} {"train_loss": -5.5419921875, "global_step": 36556, "epoch": 870} {"train_loss": -5.524988174438477, "global_step": 36557, "epoch": 870} {"train_loss": -5.621445178985596, "global_step": 36558, "epoch": 870} {"train_loss": -5.546034812927246, "global_step": 36559, "epoch": 870} {"train_loss": -5.538137435913086, "global_step": 36560, "epoch": 870} {"train_loss": -5.516598224639893, "global_step": 36561, "epoch": 870} {"train_loss": -5.667348861694336, "global_step": 36562, "epoch": 870} {"train_loss": -5.527098178863525, "global_step": 36563, "epoch": 870} {"train_loss": -5.669282913208008, "global_step": 36564, "epoch": 870} {"train_loss": -5.482367038726807, "global_step": 36565, "epoch": 870} {"train_loss": -5.641997814178467, "global_step": 36566, "epoch": 870} {"train_loss": -5.555351734161377, "global_step": 36567, "epoch": 870} {"train_loss": -5.539996147155762, "global_step": 36568, "epoch": 870} {"train_loss": -5.561954975128174, "global_step": 36569, "epoch": 870} {"train_loss": -5.7012553215026855, "global_step": 36570, "epoch": 870} {"train_loss": -5.610580921173096, "global_step": 36571, "epoch": 870} {"train_loss": -5.518420696258545, "global_step": 36572, "epoch": 870} {"train_loss": -5.594649314880371, "global_step": 36573, "epoch": 870} {"train_loss": -5.525454521179199, "global_step": 36574, "epoch": 870} {"train_loss": -5.491783618927002, "global_step": 36575, "epoch": 870} {"train_loss": -5.568648338317871, "global_step": 36576, "epoch": 870} {"train_loss": -5.577959060668945, "global_step": 36577, "epoch": 870} {"train_loss": -5.530898094177246, "global_step": 36578, "epoch": 870} {"train_loss": -5.640227794647217, "global_step": 36579, "epoch": 870} {"train_loss": -5.414859771728516, "global_step": 36580, "epoch": 870} {"train_loss": -5.564480668022519, "global_step": 36581, "epoch": 870, "val_loss": 65848.1015625} {"train_loss": -5.558988094329834, "global_step": 36582, "epoch": 871} {"train_loss": -5.361723899841309, "global_step": 36583, "epoch": 871} {"train_loss": -5.380366325378418, "global_step": 36584, "epoch": 871} {"train_loss": -5.524284839630127, "global_step": 36585, "epoch": 871} {"train_loss": -5.515033721923828, "global_step": 36586, "epoch": 871} {"train_loss": -5.450220108032227, "global_step": 36587, "epoch": 871} {"train_loss": -5.506568908691406, "global_step": 36588, "epoch": 871} {"train_loss": -5.543395042419434, "global_step": 36589, "epoch": 871} {"train_loss": -5.518202781677246, "global_step": 36590, "epoch": 871} {"train_loss": -5.645415782928467, "global_step": 36591, "epoch": 871} {"train_loss": -5.489389419555664, "global_step": 36592, "epoch": 871} {"train_loss": -5.580122470855713, "global_step": 36593, "epoch": 871} {"train_loss": -5.4116973876953125, "global_step": 36594, "epoch": 871} {"train_loss": -5.534246921539307, "global_step": 36595, "epoch": 871} {"train_loss": -5.712021827697754, "global_step": 36596, "epoch": 871} {"train_loss": -5.477080821990967, "global_step": 36597, "epoch": 871} {"train_loss": -5.508741855621338, "global_step": 36598, "epoch": 871} {"train_loss": -5.454813003540039, "global_step": 36599, "epoch": 871} {"train_loss": -5.7062225341796875, "global_step": 36600, "epoch": 871} {"train_loss": -5.6216535568237305, "global_step": 36601, "epoch": 871} {"train_loss": -5.564647674560547, "global_step": 36602, "epoch": 871} {"train_loss": -5.673089027404785, "global_step": 36603, "epoch": 871} {"train_loss": -5.612642288208008, "global_step": 36604, "epoch": 871} {"train_loss": -5.729223251342773, "global_step": 36605, "epoch": 871} {"train_loss": -5.64802885055542, "global_step": 36606, "epoch": 871} {"train_loss": -5.501608848571777, "global_step": 36607, "epoch": 871} {"train_loss": -5.526175498962402, "global_step": 36608, "epoch": 871} {"train_loss": -5.606600284576416, "global_step": 36609, "epoch": 871} {"train_loss": -5.568159103393555, "global_step": 36610, "epoch": 871} {"train_loss": -5.693297863006592, "global_step": 36611, "epoch": 871} {"train_loss": -5.626269340515137, "global_step": 36612, "epoch": 871} {"train_loss": -5.475401401519775, "global_step": 36613, "epoch": 871} {"train_loss": -5.617271900177002, "global_step": 36614, "epoch": 871} {"train_loss": -5.6276350021362305, "global_step": 36615, "epoch": 871} {"train_loss": -5.577574253082275, "global_step": 36616, "epoch": 871} {"train_loss": -5.649570465087891, "global_step": 36617, "epoch": 871} {"train_loss": -5.69189453125, "global_step": 36618, "epoch": 871} {"train_loss": -5.421536445617676, "global_step": 36619, "epoch": 871} {"train_loss": -5.563429355621338, "global_step": 36620, "epoch": 871} {"train_loss": -5.501797676086426, "global_step": 36621, "epoch": 871} {"train_loss": -5.573066711425781, "global_step": 36622, "epoch": 871} {"train_loss": -5.562207914534069, "global_step": 36623, "epoch": 871, "val_loss": 66059.5703125} {"train_loss": -5.474420547485352, "global_step": 36624, "epoch": 872} {"train_loss": -5.536406993865967, "global_step": 36625, "epoch": 872} {"train_loss": -5.406991004943848, "global_step": 36626, "epoch": 872} {"train_loss": -5.655672073364258, "global_step": 36627, "epoch": 872} {"train_loss": -5.601550579071045, "global_step": 36628, "epoch": 872} {"train_loss": -5.592061519622803, "global_step": 36629, "epoch": 872} {"train_loss": -5.613682270050049, "global_step": 36630, "epoch": 872} {"train_loss": -5.584281921386719, "global_step": 36631, "epoch": 872} {"train_loss": -5.6225385665893555, "global_step": 36632, "epoch": 872} {"train_loss": -5.4985575675964355, "global_step": 36633, "epoch": 872} {"train_loss": -5.602296829223633, "global_step": 36634, "epoch": 872} {"train_loss": -5.72823429107666, "global_step": 36635, "epoch": 872} {"train_loss": -5.5091552734375, "global_step": 36636, "epoch": 872} {"train_loss": -5.51077127456665, "global_step": 36637, "epoch": 872} {"train_loss": -5.547592639923096, "global_step": 36638, "epoch": 872} {"train_loss": -5.466207504272461, "global_step": 36639, "epoch": 872} {"train_loss": -5.549032211303711, "global_step": 36640, "epoch": 872} {"train_loss": -5.641510486602783, "global_step": 36641, "epoch": 872} {"train_loss": -5.351967811584473, "global_step": 36642, "epoch": 872} {"train_loss": -5.694286346435547, "global_step": 36643, "epoch": 872} {"train_loss": -5.5086164474487305, "global_step": 36644, "epoch": 872} {"train_loss": -5.572983741760254, "global_step": 36645, "epoch": 872} {"train_loss": -5.407503128051758, "global_step": 36646, "epoch": 872} {"train_loss": -5.568840026855469, "global_step": 36647, "epoch": 872} {"train_loss": -5.416663646697998, "global_step": 36648, "epoch": 872} {"train_loss": -5.492977142333984, "global_step": 36649, "epoch": 872} {"train_loss": -5.654315948486328, "global_step": 36650, "epoch": 872} {"train_loss": -5.472053050994873, "global_step": 36651, "epoch": 872} {"train_loss": -5.6690449714660645, "global_step": 36652, "epoch": 872} {"train_loss": -5.503143310546875, "global_step": 36653, "epoch": 872} {"train_loss": -5.676743507385254, "global_step": 36654, "epoch": 872} {"train_loss": -5.48962926864624, "global_step": 36655, "epoch": 872} {"train_loss": -5.635382652282715, "global_step": 36656, "epoch": 872} {"train_loss": -5.489969253540039, "global_step": 36657, "epoch": 872} {"train_loss": -5.525368690490723, "global_step": 36658, "epoch": 872} {"train_loss": -5.507811546325684, "global_step": 36659, "epoch": 872} {"train_loss": -5.496072769165039, "global_step": 36660, "epoch": 872} {"train_loss": -5.618508815765381, "global_step": 36661, "epoch": 872} {"train_loss": -5.430192947387695, "global_step": 36662, "epoch": 872} {"train_loss": -5.528811454772949, "global_step": 36663, "epoch": 872} {"train_loss": -5.556417942047119, "global_step": 36664, "epoch": 872} {"train_loss": -5.546955267588298, "global_step": 36665, "epoch": 872, "val_loss": 65989.6171875} {"train_loss": -5.68043851852417, "global_step": 36666, "epoch": 873} {"train_loss": -5.60367488861084, "global_step": 36667, "epoch": 873} {"train_loss": -5.60249137878418, "global_step": 36668, "epoch": 873} {"train_loss": -5.579843997955322, "global_step": 36669, "epoch": 873} {"train_loss": -5.706147193908691, "global_step": 36670, "epoch": 873} {"train_loss": -5.481489181518555, "global_step": 36671, "epoch": 873} {"train_loss": -5.552581787109375, "global_step": 36672, "epoch": 873} {"train_loss": -5.611299991607666, "global_step": 36673, "epoch": 873} {"train_loss": -5.633767604827881, "global_step": 36674, "epoch": 873} {"train_loss": -5.446667671203613, "global_step": 36675, "epoch": 873} {"train_loss": -5.6602630615234375, "global_step": 36676, "epoch": 873} {"train_loss": -5.638792037963867, "global_step": 36677, "epoch": 873} {"train_loss": -5.562938690185547, "global_step": 36678, "epoch": 873} {"train_loss": -5.720467567443848, "global_step": 36679, "epoch": 873} {"train_loss": -5.598781585693359, "global_step": 36680, "epoch": 873} {"train_loss": -5.584834098815918, "global_step": 36681, "epoch": 873} {"train_loss": -5.4920806884765625, "global_step": 36682, "epoch": 873} {"train_loss": -5.551434516906738, "global_step": 36683, "epoch": 873} {"train_loss": -5.612232685089111, "global_step": 36684, "epoch": 873} {"train_loss": -5.419581890106201, "global_step": 36685, "epoch": 873} {"train_loss": -5.5771260261535645, "global_step": 36686, "epoch": 873} {"train_loss": -5.586781024932861, "global_step": 36687, "epoch": 873} {"train_loss": -5.453690528869629, "global_step": 36688, "epoch": 873} {"train_loss": -5.632776260375977, "global_step": 36689, "epoch": 873} {"train_loss": -5.510868072509766, "global_step": 36690, "epoch": 873} {"train_loss": -5.744565963745117, "global_step": 36691, "epoch": 873} {"train_loss": -5.488234519958496, "global_step": 36692, "epoch": 873} {"train_loss": -5.540626525878906, "global_step": 36693, "epoch": 873} {"train_loss": -5.607448101043701, "global_step": 36694, "epoch": 873} {"train_loss": -5.475054740905762, "global_step": 36695, "epoch": 873} {"train_loss": -5.5666327476501465, "global_step": 36696, "epoch": 873} {"train_loss": -5.529693126678467, "global_step": 36697, "epoch": 873} {"train_loss": -5.600090503692627, "global_step": 36698, "epoch": 873} {"train_loss": -5.50949764251709, "global_step": 36699, "epoch": 873} {"train_loss": -5.514956951141357, "global_step": 36700, "epoch": 873} {"train_loss": -5.57935905456543, "global_step": 36701, "epoch": 873} {"train_loss": -5.574075698852539, "global_step": 36702, "epoch": 873} {"train_loss": -5.689586639404297, "global_step": 36703, "epoch": 873} {"train_loss": -5.642765045166016, "global_step": 36704, "epoch": 873} {"train_loss": -5.5621819496154785, "global_step": 36705, "epoch": 873} {"train_loss": -5.551970958709717, "global_step": 36706, "epoch": 873} {"train_loss": -5.577726727440243, "global_step": 36707, "epoch": 873, "val_loss": 66128.359375} {"train_loss": -5.669892311096191, "global_step": 36708, "epoch": 874} {"train_loss": -5.68543815612793, "global_step": 36709, "epoch": 874} {"train_loss": -5.6825361251831055, "global_step": 36710, "epoch": 874} {"train_loss": -5.612589359283447, "global_step": 36711, "epoch": 874} {"train_loss": -5.570878028869629, "global_step": 36712, "epoch": 874} {"train_loss": -5.5162224769592285, "global_step": 36713, "epoch": 874} {"train_loss": -5.750580787658691, "global_step": 36714, "epoch": 874} {"train_loss": -5.681344985961914, "global_step": 36715, "epoch": 874} {"train_loss": -5.578062534332275, "global_step": 36716, "epoch": 874} {"train_loss": -5.5632643699646, "global_step": 36717, "epoch": 874} {"train_loss": -5.577817916870117, "global_step": 36718, "epoch": 874} {"train_loss": -5.685198783874512, "global_step": 36719, "epoch": 874} {"train_loss": -5.723772048950195, "global_step": 36720, "epoch": 874} {"train_loss": -5.53857421875, "global_step": 36721, "epoch": 874} {"train_loss": -5.6676411628723145, "global_step": 36722, "epoch": 874} {"train_loss": -5.59254264831543, "global_step": 36723, "epoch": 874} {"train_loss": -5.601863861083984, "global_step": 36724, "epoch": 874} {"train_loss": -5.565863132476807, "global_step": 36725, "epoch": 874} {"train_loss": -5.537966728210449, "global_step": 36726, "epoch": 874} {"train_loss": -5.547079563140869, "global_step": 36727, "epoch": 874} {"train_loss": -5.589494228363037, "global_step": 36728, "epoch": 874} {"train_loss": -5.674739837646484, "global_step": 36729, "epoch": 874} {"train_loss": -5.426117420196533, "global_step": 36730, "epoch": 874} {"train_loss": -5.6103105545043945, "global_step": 36731, "epoch": 874} {"train_loss": -5.465940475463867, "global_step": 36732, "epoch": 874} {"train_loss": -5.536491394042969, "global_step": 36733, "epoch": 874} {"train_loss": -5.493566036224365, "global_step": 36734, "epoch": 874} {"train_loss": -5.431858539581299, "global_step": 36735, "epoch": 874} {"train_loss": -5.421501159667969, "global_step": 36736, "epoch": 874} {"train_loss": -5.472354888916016, "global_step": 36737, "epoch": 874} {"train_loss": -5.6322479248046875, "global_step": 36738, "epoch": 874} {"train_loss": -5.618691444396973, "global_step": 36739, "epoch": 874} {"train_loss": -5.568522930145264, "global_step": 36740, "epoch": 874} {"train_loss": -5.623132228851318, "global_step": 36741, "epoch": 874} {"train_loss": -5.5359625816345215, "global_step": 36742, "epoch": 874} {"train_loss": -5.616006851196289, "global_step": 36743, "epoch": 874} {"train_loss": -5.636976718902588, "global_step": 36744, "epoch": 874} {"train_loss": -5.574622631072998, "global_step": 36745, "epoch": 874} {"train_loss": -5.59268045425415, "global_step": 36746, "epoch": 874} {"train_loss": -5.553028106689453, "global_step": 36747, "epoch": 874} {"train_loss": -5.496550559997559, "global_step": 36748, "epoch": 874} {"train_loss": -5.58467241695949, "global_step": 36749, "epoch": 874, "val_loss": 66111.203125} {"train_loss": -5.505772113800049, "global_step": 36750, "epoch": 875} {"train_loss": -5.7861008644104, "global_step": 36751, "epoch": 875} {"train_loss": -5.706531524658203, "global_step": 36752, "epoch": 875} {"train_loss": -5.632454872131348, "global_step": 36753, "epoch": 875} {"train_loss": -5.561057090759277, "global_step": 36754, "epoch": 875} {"train_loss": -5.6557207107543945, "global_step": 36755, "epoch": 875} {"train_loss": -5.544476509094238, "global_step": 36756, "epoch": 875} {"train_loss": -5.53410005569458, "global_step": 36757, "epoch": 875} {"train_loss": -5.478020668029785, "global_step": 36758, "epoch": 875} {"train_loss": -5.419567108154297, "global_step": 36759, "epoch": 875} {"train_loss": -5.507883071899414, "global_step": 36760, "epoch": 875} {"train_loss": -5.665680885314941, "global_step": 36761, "epoch": 875} {"train_loss": -5.548576354980469, "global_step": 36762, "epoch": 875} {"train_loss": -5.637619972229004, "global_step": 36763, "epoch": 875} {"train_loss": -5.594325065612793, "global_step": 36764, "epoch": 875} {"train_loss": -5.563360214233398, "global_step": 36765, "epoch": 875} {"train_loss": -5.596521377563477, "global_step": 36766, "epoch": 875} {"train_loss": -5.578073024749756, "global_step": 36767, "epoch": 875} {"train_loss": -5.653367042541504, "global_step": 36768, "epoch": 875} {"train_loss": -5.576714992523193, "global_step": 36769, "epoch": 875} {"train_loss": -5.621435165405273, "global_step": 36770, "epoch": 875} {"train_loss": -5.6190080642700195, "global_step": 36771, "epoch": 875} {"train_loss": -5.707485675811768, "global_step": 36772, "epoch": 875} {"train_loss": -5.649333477020264, "global_step": 36773, "epoch": 875} {"train_loss": -5.567795276641846, "global_step": 36774, "epoch": 875} {"train_loss": -5.663855075836182, "global_step": 36775, "epoch": 875} {"train_loss": -5.626904487609863, "global_step": 36776, "epoch": 875} {"train_loss": -5.593352317810059, "global_step": 36777, "epoch": 875} {"train_loss": -5.648806571960449, "global_step": 36778, "epoch": 875} {"train_loss": -5.613767623901367, "global_step": 36779, "epoch": 875} {"train_loss": -5.624762535095215, "global_step": 36780, "epoch": 875} {"train_loss": -5.466671943664551, "global_step": 36781, "epoch": 875} {"train_loss": -5.538388252258301, "global_step": 36782, "epoch": 875} {"train_loss": -5.579334259033203, "global_step": 36783, "epoch": 875} {"train_loss": -5.344806671142578, "global_step": 36784, "epoch": 875} {"train_loss": -5.511816501617432, "global_step": 36785, "epoch": 875} {"train_loss": -5.577326774597168, "global_step": 36786, "epoch": 875} {"train_loss": -5.457927703857422, "global_step": 36787, "epoch": 875} {"train_loss": -5.532378196716309, "global_step": 36788, "epoch": 875} {"train_loss": -5.637595176696777, "global_step": 36789, "epoch": 875} {"train_loss": -5.445493698120117, "global_step": 36790, "epoch": 875} {"train_loss": -5.579978011903309, "global_step": 36791, "epoch": 875, "val_loss": 66707.4921875} {"train_loss": -5.548471450805664, "global_step": 36792, "epoch": 876} {"train_loss": -5.616743087768555, "global_step": 36793, "epoch": 876} {"train_loss": -5.646086692810059, "global_step": 36794, "epoch": 876} {"train_loss": -5.606929779052734, "global_step": 36795, "epoch": 876} {"train_loss": -5.614960193634033, "global_step": 36796, "epoch": 876} {"train_loss": -5.608649253845215, "global_step": 36797, "epoch": 876} {"train_loss": -5.436176300048828, "global_step": 36798, "epoch": 876} {"train_loss": -5.649033546447754, "global_step": 36799, "epoch": 876} {"train_loss": -5.448936462402344, "global_step": 36800, "epoch": 876} {"train_loss": -5.534676551818848, "global_step": 36801, "epoch": 876} {"train_loss": -5.660312175750732, "global_step": 36802, "epoch": 876} {"train_loss": -5.594876766204834, "global_step": 36803, "epoch": 876} {"train_loss": -5.528599739074707, "global_step": 36804, "epoch": 876} {"train_loss": -5.543344497680664, "global_step": 36805, "epoch": 876} {"train_loss": -5.639618873596191, "global_step": 36806, "epoch": 876} {"train_loss": -5.589540004730225, "global_step": 36807, "epoch": 876} {"train_loss": -5.4239983558654785, "global_step": 36808, "epoch": 876} {"train_loss": -5.579276084899902, "global_step": 36809, "epoch": 876} {"train_loss": -5.639317512512207, "global_step": 36810, "epoch": 876} {"train_loss": -5.561779499053955, "global_step": 36811, "epoch": 876} {"train_loss": -5.747431755065918, "global_step": 36812, "epoch": 876} {"train_loss": -5.647844314575195, "global_step": 36813, "epoch": 876} {"train_loss": -5.661290168762207, "global_step": 36814, "epoch": 876} {"train_loss": -5.570317268371582, "global_step": 36815, "epoch": 876} {"train_loss": -5.607083797454834, "global_step": 36816, "epoch": 876} {"train_loss": -5.642671585083008, "global_step": 36817, "epoch": 876} {"train_loss": -5.398256301879883, "global_step": 36818, "epoch": 876} {"train_loss": -5.639831066131592, "global_step": 36819, "epoch": 876} {"train_loss": -5.538218021392822, "global_step": 36820, "epoch": 876} {"train_loss": -5.538778305053711, "global_step": 36821, "epoch": 876} {"train_loss": -5.519399642944336, "global_step": 36822, "epoch": 876} {"train_loss": -5.554265022277832, "global_step": 36823, "epoch": 876} {"train_loss": -5.536375045776367, "global_step": 36824, "epoch": 876} {"train_loss": -5.551181793212891, "global_step": 36825, "epoch": 876} {"train_loss": -5.5799102783203125, "global_step": 36826, "epoch": 876} {"train_loss": -5.601678371429443, "global_step": 36827, "epoch": 876} {"train_loss": -5.545478820800781, "global_step": 36828, "epoch": 876} {"train_loss": -5.535405158996582, "global_step": 36829, "epoch": 876} {"train_loss": -5.59982967376709, "global_step": 36830, "epoch": 876} {"train_loss": -5.53934383392334, "global_step": 36831, "epoch": 876} {"train_loss": -5.553102970123291, "global_step": 36832, "epoch": 876} {"train_loss": -5.575038512547811, "global_step": 36833, "epoch": 876, "val_loss": 66087.8671875} {"train_loss": -5.578177452087402, "global_step": 36834, "epoch": 877} {"train_loss": -5.6164751052856445, "global_step": 36835, "epoch": 877} {"train_loss": -5.5899858474731445, "global_step": 36836, "epoch": 877} {"train_loss": -5.697574615478516, "global_step": 36837, "epoch": 877} {"train_loss": -5.690274238586426, "global_step": 36838, "epoch": 877} {"train_loss": -5.5567240715026855, "global_step": 36839, "epoch": 877} {"train_loss": -5.5168609619140625, "global_step": 36840, "epoch": 877} {"train_loss": -5.490482330322266, "global_step": 36841, "epoch": 877} {"train_loss": -5.407430648803711, "global_step": 36842, "epoch": 877} {"train_loss": -5.708870887756348, "global_step": 36843, "epoch": 877} {"train_loss": -5.482755661010742, "global_step": 36844, "epoch": 877} {"train_loss": -5.5496392250061035, "global_step": 36845, "epoch": 877} {"train_loss": -5.586301803588867, "global_step": 36846, "epoch": 877} {"train_loss": -5.639134407043457, "global_step": 36847, "epoch": 877} {"train_loss": -5.599237442016602, "global_step": 36848, "epoch": 877} {"train_loss": -5.590909481048584, "global_step": 36849, "epoch": 877} {"train_loss": -5.506066799163818, "global_step": 36850, "epoch": 877} {"train_loss": -5.593039512634277, "global_step": 36851, "epoch": 877} {"train_loss": -5.651695251464844, "global_step": 36852, "epoch": 877} {"train_loss": -5.667350769042969, "global_step": 36853, "epoch": 877} {"train_loss": -5.648441314697266, "global_step": 36854, "epoch": 877} {"train_loss": -5.560883522033691, "global_step": 36855, "epoch": 877} {"train_loss": -5.477292060852051, "global_step": 36856, "epoch": 877} {"train_loss": -5.602316856384277, "global_step": 36857, "epoch": 877} {"train_loss": -5.664890766143799, "global_step": 36858, "epoch": 877} {"train_loss": -5.612188339233398, "global_step": 36859, "epoch": 877} {"train_loss": -5.649596214294434, "global_step": 36860, "epoch": 877} {"train_loss": -5.631994247436523, "global_step": 36861, "epoch": 877} {"train_loss": -5.6028594970703125, "global_step": 36862, "epoch": 877} {"train_loss": -5.637686729431152, "global_step": 36863, "epoch": 877} {"train_loss": -5.5790300369262695, "global_step": 36864, "epoch": 877} {"train_loss": -5.58302116394043, "global_step": 36865, "epoch": 877} {"train_loss": -5.702256202697754, "global_step": 36866, "epoch": 877} {"train_loss": -5.5473313331604, "global_step": 36867, "epoch": 877} {"train_loss": -5.606537818908691, "global_step": 36868, "epoch": 877} {"train_loss": -5.610104560852051, "global_step": 36869, "epoch": 877} {"train_loss": -5.623379707336426, "global_step": 36870, "epoch": 877} {"train_loss": -5.581274032592773, "global_step": 36871, "epoch": 877} {"train_loss": -5.463984489440918, "global_step": 36872, "epoch": 877} {"train_loss": -5.560032844543457, "global_step": 36873, "epoch": 877} {"train_loss": -5.571011066436768, "global_step": 36874, "epoch": 877} {"train_loss": -5.587880872544789, "global_step": 36875, "epoch": 877, "val_loss": 66362.546875} {"train_loss": -5.443272113800049, "global_step": 36876, "epoch": 878} {"train_loss": -5.578397274017334, "global_step": 36877, "epoch": 878} {"train_loss": -5.463644504547119, "global_step": 36878, "epoch": 878} {"train_loss": -5.666505336761475, "global_step": 36879, "epoch": 878} {"train_loss": -5.584784507751465, "global_step": 36880, "epoch": 878} {"train_loss": -5.613827228546143, "global_step": 36881, "epoch": 878} {"train_loss": -5.515686988830566, "global_step": 36882, "epoch": 878} {"train_loss": -5.668664932250977, "global_step": 36883, "epoch": 878} {"train_loss": -5.567258834838867, "global_step": 36884, "epoch": 878} {"train_loss": -5.620003700256348, "global_step": 36885, "epoch": 878} {"train_loss": -5.599011421203613, "global_step": 36886, "epoch": 878} {"train_loss": -5.6486496925354, "global_step": 36887, "epoch": 878} {"train_loss": -5.52283239364624, "global_step": 36888, "epoch": 878} {"train_loss": -5.580033302307129, "global_step": 36889, "epoch": 878} {"train_loss": -5.618241310119629, "global_step": 36890, "epoch": 878} {"train_loss": -5.548442363739014, "global_step": 36891, "epoch": 878} {"train_loss": -5.597860336303711, "global_step": 36892, "epoch": 878} {"train_loss": -5.678208827972412, "global_step": 36893, "epoch": 878} {"train_loss": -5.680764675140381, "global_step": 36894, "epoch": 878} {"train_loss": -5.547035217285156, "global_step": 36895, "epoch": 878} {"train_loss": -5.631796836853027, "global_step": 36896, "epoch": 878} {"train_loss": -5.449623107910156, "global_step": 36897, "epoch": 878} {"train_loss": -5.554218769073486, "global_step": 36898, "epoch": 878} {"train_loss": -5.6771240234375, "global_step": 36899, "epoch": 878} {"train_loss": -5.339117050170898, "global_step": 36900, "epoch": 878} {"train_loss": -5.4796905517578125, "global_step": 36901, "epoch": 878} {"train_loss": -5.487695693969727, "global_step": 36902, "epoch": 878} {"train_loss": -5.390787124633789, "global_step": 36903, "epoch": 878} {"train_loss": -5.496997356414795, "global_step": 36904, "epoch": 878} {"train_loss": -5.487744331359863, "global_step": 36905, "epoch": 878} {"train_loss": -5.446926116943359, "global_step": 36906, "epoch": 878} {"train_loss": -5.6403679847717285, "global_step": 36907, "epoch": 878} {"train_loss": -5.508607864379883, "global_step": 36908, "epoch": 878} {"train_loss": -5.486907482147217, "global_step": 36909, "epoch": 878} {"train_loss": -5.519696235656738, "global_step": 36910, "epoch": 878} {"train_loss": -5.5045576095581055, "global_step": 36911, "epoch": 878} {"train_loss": -5.594178676605225, "global_step": 36912, "epoch": 878} {"train_loss": -5.536478042602539, "global_step": 36913, "epoch": 878} {"train_loss": -5.5071868896484375, "global_step": 36914, "epoch": 878} {"train_loss": -5.588863849639893, "global_step": 36915, "epoch": 878} {"train_loss": -5.6202521324157715, "global_step": 36916, "epoch": 878} {"train_loss": -5.550072794868832, "global_step": 36917, "epoch": 878, "val_loss": 66052.0} {"train_loss": -5.574202060699463, "global_step": 36918, "epoch": 879} {"train_loss": -5.638443470001221, "global_step": 36919, "epoch": 879} {"train_loss": -5.599770545959473, "global_step": 36920, "epoch": 879} {"train_loss": -5.6587934494018555, "global_step": 36921, "epoch": 879} {"train_loss": -5.602179050445557, "global_step": 36922, "epoch": 879} {"train_loss": -5.603531837463379, "global_step": 36923, "epoch": 879} {"train_loss": -5.669083595275879, "global_step": 36924, "epoch": 879} {"train_loss": -5.69797945022583, "global_step": 36925, "epoch": 879} {"train_loss": -5.564519882202148, "global_step": 36926, "epoch": 879} {"train_loss": -5.567745208740234, "global_step": 36927, "epoch": 879} {"train_loss": -5.504756927490234, "global_step": 36928, "epoch": 879} {"train_loss": -5.486722946166992, "global_step": 36929, "epoch": 879} {"train_loss": -5.64976692199707, "global_step": 36930, "epoch": 879} {"train_loss": -5.624467849731445, "global_step": 36931, "epoch": 879} {"train_loss": -5.6501851081848145, "global_step": 36932, "epoch": 879} {"train_loss": -5.513997554779053, "global_step": 36933, "epoch": 879} {"train_loss": -5.496656894683838, "global_step": 36934, "epoch": 879} {"train_loss": -5.592489242553711, "global_step": 36935, "epoch": 879} {"train_loss": -5.6637749671936035, "global_step": 36936, "epoch": 879} {"train_loss": -5.626496315002441, "global_step": 36937, "epoch": 879} {"train_loss": -5.4989776611328125, "global_step": 36938, "epoch": 879} {"train_loss": -5.543348789215088, "global_step": 36939, "epoch": 879} {"train_loss": -5.500425338745117, "global_step": 36940, "epoch": 879} {"train_loss": -5.545773029327393, "global_step": 36941, "epoch": 879} {"train_loss": -5.5019450187683105, "global_step": 36942, "epoch": 879} {"train_loss": -5.4730119705200195, "global_step": 36943, "epoch": 879} {"train_loss": -5.575477600097656, "global_step": 36944, "epoch": 879} {"train_loss": -5.587030410766602, "global_step": 36945, "epoch": 879} {"train_loss": -5.615527153015137, "global_step": 36946, "epoch": 879} {"train_loss": -5.553058624267578, "global_step": 36947, "epoch": 879} {"train_loss": -5.5587921142578125, "global_step": 36948, "epoch": 879} {"train_loss": -5.531999588012695, "global_step": 36949, "epoch": 879} {"train_loss": -5.51521110534668, "global_step": 36950, "epoch": 879} {"train_loss": -5.579998016357422, "global_step": 36951, "epoch": 879} {"train_loss": -5.5544281005859375, "global_step": 36952, "epoch": 879} {"train_loss": -5.4738664627075195, "global_step": 36953, "epoch": 879} {"train_loss": -5.597843170166016, "global_step": 36954, "epoch": 879} {"train_loss": -5.513344764709473, "global_step": 36955, "epoch": 879} {"train_loss": -5.445810794830322, "global_step": 36956, "epoch": 879} {"train_loss": -5.642580032348633, "global_step": 36957, "epoch": 879} {"train_loss": -5.46115779876709, "global_step": 36958, "epoch": 879} {"train_loss": -5.568820294879732, "global_step": 36959, "epoch": 879, "val_loss": 66223.03125} {"train_loss": -5.592917442321777, "global_step": 36960, "epoch": 880} {"train_loss": -5.457743167877197, "global_step": 36961, "epoch": 880} {"train_loss": -5.571014404296875, "global_step": 36962, "epoch": 880} {"train_loss": -5.628352165222168, "global_step": 36963, "epoch": 880} {"train_loss": -5.53255558013916, "global_step": 36964, "epoch": 880} {"train_loss": -5.62775993347168, "global_step": 36965, "epoch": 880} {"train_loss": -5.520723342895508, "global_step": 36966, "epoch": 880} {"train_loss": -5.607146263122559, "global_step": 36967, "epoch": 880} {"train_loss": -5.486832618713379, "global_step": 36968, "epoch": 880} {"train_loss": -5.617507457733154, "global_step": 36969, "epoch": 880} {"train_loss": -5.528661727905273, "global_step": 36970, "epoch": 880} {"train_loss": -5.59173583984375, "global_step": 36971, "epoch": 880} {"train_loss": -5.520513534545898, "global_step": 36972, "epoch": 880} {"train_loss": -5.526633262634277, "global_step": 36973, "epoch": 880} {"train_loss": -5.665596961975098, "global_step": 36974, "epoch": 880} {"train_loss": -5.480011940002441, "global_step": 36975, "epoch": 880} {"train_loss": -5.676471710205078, "global_step": 36976, "epoch": 880} {"train_loss": -5.508999347686768, "global_step": 36977, "epoch": 880} {"train_loss": -5.5002970695495605, "global_step": 36978, "epoch": 880} {"train_loss": -5.669651031494141, "global_step": 36979, "epoch": 880} {"train_loss": -5.465359687805176, "global_step": 36980, "epoch": 880} {"train_loss": -5.510157585144043, "global_step": 36981, "epoch": 880} {"train_loss": -5.571944236755371, "global_step": 36982, "epoch": 880} {"train_loss": -5.564843654632568, "global_step": 36983, "epoch": 880} {"train_loss": -5.4807209968566895, "global_step": 36984, "epoch": 880} {"train_loss": -5.56123161315918, "global_step": 36985, "epoch": 880} {"train_loss": -5.584907054901123, "global_step": 36986, "epoch": 880} {"train_loss": -5.614837646484375, "global_step": 36987, "epoch": 880} {"train_loss": -5.517066478729248, "global_step": 36988, "epoch": 880} {"train_loss": -5.449501037597656, "global_step": 36989, "epoch": 880} {"train_loss": -5.66259765625, "global_step": 36990, "epoch": 880} {"train_loss": -5.610952377319336, "global_step": 36991, "epoch": 880} {"train_loss": -5.485185623168945, "global_step": 36992, "epoch": 880} {"train_loss": -5.611955642700195, "global_step": 36993, "epoch": 880} {"train_loss": -5.50465202331543, "global_step": 36994, "epoch": 880} {"train_loss": -5.367713928222656, "global_step": 36995, "epoch": 880} {"train_loss": -5.494171142578125, "global_step": 36996, "epoch": 880} {"train_loss": -5.404591083526611, "global_step": 36997, "epoch": 880} {"train_loss": -5.7117462158203125, "global_step": 36998, "epoch": 880} {"train_loss": -5.537745475769043, "global_step": 36999, "epoch": 880} {"train_loss": -5.6637678146362305, "global_step": 37000, "epoch": 880} {"train_loss": -5.55360426221575, "global_step": 37001, "epoch": 880, "val_loss": 66267.96875} {"train_loss": -5.561624526977539, "global_step": 37002, "epoch": 881} {"train_loss": -5.6239013671875, "global_step": 37003, "epoch": 881} {"train_loss": -5.752137184143066, "global_step": 37004, "epoch": 881} {"train_loss": -5.492218971252441, "global_step": 37005, "epoch": 881} {"train_loss": -5.525618076324463, "global_step": 37006, "epoch": 881} {"train_loss": -5.511251449584961, "global_step": 37007, "epoch": 881} {"train_loss": -5.663051605224609, "global_step": 37008, "epoch": 881} {"train_loss": -5.684044361114502, "global_step": 37009, "epoch": 881} {"train_loss": -5.592238903045654, "global_step": 37010, "epoch": 881} {"train_loss": -5.6877031326293945, "global_step": 37011, "epoch": 881} {"train_loss": -5.46504020690918, "global_step": 37012, "epoch": 881} {"train_loss": -5.469549179077148, "global_step": 37013, "epoch": 881} {"train_loss": -5.486955642700195, "global_step": 37014, "epoch": 881} {"train_loss": -5.649899005889893, "global_step": 37015, "epoch": 881} {"train_loss": -5.6277079582214355, "global_step": 37016, "epoch": 881} {"train_loss": -5.580455780029297, "global_step": 37017, "epoch": 881} {"train_loss": -5.637526035308838, "global_step": 37018, "epoch": 881} {"train_loss": -5.530219078063965, "global_step": 37019, "epoch": 881} {"train_loss": -5.592673301696777, "global_step": 37020, "epoch": 881} {"train_loss": -5.465706825256348, "global_step": 37021, "epoch": 881} {"train_loss": -5.502938270568848, "global_step": 37022, "epoch": 881} {"train_loss": -5.587547779083252, "global_step": 37023, "epoch": 881} {"train_loss": -5.418440818786621, "global_step": 37024, "epoch": 881} {"train_loss": -5.459949970245361, "global_step": 37025, "epoch": 881} {"train_loss": -5.496187210083008, "global_step": 37026, "epoch": 881} {"train_loss": -5.562625885009766, "global_step": 37027, "epoch": 881} {"train_loss": -5.6057329177856445, "global_step": 37028, "epoch": 881} {"train_loss": -5.631050109863281, "global_step": 37029, "epoch": 881} {"train_loss": -5.668487071990967, "global_step": 37030, "epoch": 881} {"train_loss": -5.492424011230469, "global_step": 37031, "epoch": 881} {"train_loss": -5.5077619552612305, "global_step": 37032, "epoch": 881} {"train_loss": -5.545672416687012, "global_step": 37033, "epoch": 881} {"train_loss": -5.527642726898193, "global_step": 37034, "epoch": 881} {"train_loss": -5.413395404815674, "global_step": 37035, "epoch": 881} {"train_loss": -5.601526260375977, "global_step": 37036, "epoch": 881} {"train_loss": -5.57466983795166, "global_step": 37037, "epoch": 881} {"train_loss": -5.631841659545898, "global_step": 37038, "epoch": 881} {"train_loss": -5.6869001388549805, "global_step": 37039, "epoch": 881} {"train_loss": -5.526092529296875, "global_step": 37040, "epoch": 881} {"train_loss": -5.579429626464844, "global_step": 37041, "epoch": 881} {"train_loss": -5.614099502563477, "global_step": 37042, "epoch": 881} {"train_loss": -5.565909397034418, "global_step": 37043, "epoch": 881, "val_loss": 66289.46875} {"train_loss": -5.623663425445557, "global_step": 37044, "epoch": 882} {"train_loss": -5.632704257965088, "global_step": 37045, "epoch": 882} {"train_loss": -5.673067569732666, "global_step": 37046, "epoch": 882} {"train_loss": -5.560239791870117, "global_step": 37047, "epoch": 882} {"train_loss": -5.676175594329834, "global_step": 37048, "epoch": 882} {"train_loss": -5.519904136657715, "global_step": 37049, "epoch": 882} {"train_loss": -5.499551773071289, "global_step": 37050, "epoch": 882} {"train_loss": -5.631246566772461, "global_step": 37051, "epoch": 882} {"train_loss": -5.435004234313965, "global_step": 37052, "epoch": 882} {"train_loss": -5.635499000549316, "global_step": 37053, "epoch": 882} {"train_loss": -5.6466875076293945, "global_step": 37054, "epoch": 882} {"train_loss": -5.562803268432617, "global_step": 37055, "epoch": 882} {"train_loss": -5.616418838500977, "global_step": 37056, "epoch": 882} {"train_loss": -5.58839750289917, "global_step": 37057, "epoch": 882} {"train_loss": -5.599368095397949, "global_step": 37058, "epoch": 882} {"train_loss": -5.501744270324707, "global_step": 37059, "epoch": 882} {"train_loss": -5.575286865234375, "global_step": 37060, "epoch": 882} {"train_loss": -5.5714569091796875, "global_step": 37061, "epoch": 882} {"train_loss": -5.547744274139404, "global_step": 37062, "epoch": 882} {"train_loss": -5.576813697814941, "global_step": 37063, "epoch": 882} {"train_loss": -5.511197090148926, "global_step": 37064, "epoch": 882} {"train_loss": -5.464056968688965, "global_step": 37065, "epoch": 882} {"train_loss": -5.547063827514648, "global_step": 37066, "epoch": 882} {"train_loss": -5.598079204559326, "global_step": 37067, "epoch": 882} {"train_loss": -5.537289142608643, "global_step": 37068, "epoch": 882} {"train_loss": -5.496403694152832, "global_step": 37069, "epoch": 882} {"train_loss": -5.577919960021973, "global_step": 37070, "epoch": 882} {"train_loss": -5.612288475036621, "global_step": 37071, "epoch": 882} {"train_loss": -5.594168186187744, "global_step": 37072, "epoch": 882} {"train_loss": -5.620205879211426, "global_step": 37073, "epoch": 882} {"train_loss": -5.571591854095459, "global_step": 37074, "epoch": 882} {"train_loss": -5.664958953857422, "global_step": 37075, "epoch": 882} {"train_loss": -5.565028190612793, "global_step": 37076, "epoch": 882} {"train_loss": -5.680545330047607, "global_step": 37077, "epoch": 882} {"train_loss": -5.599653720855713, "global_step": 37078, "epoch": 882} {"train_loss": -5.531993865966797, "global_step": 37079, "epoch": 882} {"train_loss": -5.650323867797852, "global_step": 37080, "epoch": 882} {"train_loss": -5.637063980102539, "global_step": 37081, "epoch": 882} {"train_loss": -5.512524604797363, "global_step": 37082, "epoch": 882} {"train_loss": -5.627967834472656, "global_step": 37083, "epoch": 882} {"train_loss": -5.594649314880371, "global_step": 37084, "epoch": 882} {"train_loss": -5.5803946767534525, "global_step": 37085, "epoch": 882, "val_loss": 65858.515625} {"train_loss": -5.618090629577637, "global_step": 37086, "epoch": 883} {"train_loss": -5.535253047943115, "global_step": 37087, "epoch": 883} {"train_loss": -5.485833168029785, "global_step": 37088, "epoch": 883} {"train_loss": -5.602407932281494, "global_step": 37089, "epoch": 883} {"train_loss": -5.646811008453369, "global_step": 37090, "epoch": 883} {"train_loss": -5.585092544555664, "global_step": 37091, "epoch": 883} {"train_loss": -5.570990085601807, "global_step": 37092, "epoch": 883} {"train_loss": -5.448184013366699, "global_step": 37093, "epoch": 883} {"train_loss": -5.700141906738281, "global_step": 37094, "epoch": 883} {"train_loss": -5.646943092346191, "global_step": 37095, "epoch": 883} {"train_loss": -5.457383155822754, "global_step": 37096, "epoch": 883} {"train_loss": -5.54164981842041, "global_step": 37097, "epoch": 883} {"train_loss": -5.578858375549316, "global_step": 37098, "epoch": 883} {"train_loss": -5.463381767272949, "global_step": 37099, "epoch": 883} {"train_loss": -5.5524139404296875, "global_step": 37100, "epoch": 883} {"train_loss": -5.587679862976074, "global_step": 37101, "epoch": 883} {"train_loss": -5.4626545906066895, "global_step": 37102, "epoch": 883} {"train_loss": -5.599502086639404, "global_step": 37103, "epoch": 883} {"train_loss": -5.574678897857666, "global_step": 37104, "epoch": 883} {"train_loss": -5.366489410400391, "global_step": 37105, "epoch": 883} {"train_loss": -5.532321929931641, "global_step": 37106, "epoch": 883} {"train_loss": -5.42113733291626, "global_step": 37107, "epoch": 883} {"train_loss": -5.556297779083252, "global_step": 37108, "epoch": 883} {"train_loss": -5.438660621643066, "global_step": 37109, "epoch": 883} {"train_loss": -5.601030349731445, "global_step": 37110, "epoch": 883} {"train_loss": -5.677929878234863, "global_step": 37111, "epoch": 883} {"train_loss": -5.487344264984131, "global_step": 37112, "epoch": 883} {"train_loss": -5.482649803161621, "global_step": 37113, "epoch": 883} {"train_loss": -5.593433856964111, "global_step": 37114, "epoch": 883} {"train_loss": -5.566423416137695, "global_step": 37115, "epoch": 883} {"train_loss": -5.479638576507568, "global_step": 37116, "epoch": 883} {"train_loss": -5.672342300415039, "global_step": 37117, "epoch": 883} {"train_loss": -5.670283317565918, "global_step": 37118, "epoch": 883} {"train_loss": -5.572111129760742, "global_step": 37119, "epoch": 883} {"train_loss": -5.5927324295043945, "global_step": 37120, "epoch": 883} {"train_loss": -5.537233352661133, "global_step": 37121, "epoch": 883} {"train_loss": -5.553777694702148, "global_step": 37122, "epoch": 883} {"train_loss": -5.598123073577881, "global_step": 37123, "epoch": 883} {"train_loss": -5.674134254455566, "global_step": 37124, "epoch": 883} {"train_loss": -5.655264377593994, "global_step": 37125, "epoch": 883} {"train_loss": -5.428073883056641, "global_step": 37126, "epoch": 883} {"train_loss": -5.555636394591558, "global_step": 37127, "epoch": 883, "val_loss": 66209.46875} {"train_loss": -5.667544364929199, "global_step": 37128, "epoch": 884} {"train_loss": -5.681301116943359, "global_step": 37129, "epoch": 884} {"train_loss": -5.674327850341797, "global_step": 37130, "epoch": 884} {"train_loss": -5.56353235244751, "global_step": 37131, "epoch": 884} {"train_loss": -5.687321662902832, "global_step": 37132, "epoch": 884} {"train_loss": -5.638762474060059, "global_step": 37133, "epoch": 884} {"train_loss": -5.676768779754639, "global_step": 37134, "epoch": 884} {"train_loss": -5.646892547607422, "global_step": 37135, "epoch": 884} {"train_loss": -5.4433746337890625, "global_step": 37136, "epoch": 884} {"train_loss": -5.626307964324951, "global_step": 37137, "epoch": 884} {"train_loss": -5.570194721221924, "global_step": 37138, "epoch": 884} {"train_loss": -5.529979705810547, "global_step": 37139, "epoch": 884} {"train_loss": -5.618439674377441, "global_step": 37140, "epoch": 884} {"train_loss": -5.678876876831055, "global_step": 37141, "epoch": 884} {"train_loss": -5.546833038330078, "global_step": 37142, "epoch": 884} {"train_loss": -5.5634307861328125, "global_step": 37143, "epoch": 884} {"train_loss": -5.613735198974609, "global_step": 37144, "epoch": 884} {"train_loss": -5.669791221618652, "global_step": 37145, "epoch": 884} {"train_loss": -5.669435501098633, "global_step": 37146, "epoch": 884} {"train_loss": -5.583736896514893, "global_step": 37147, "epoch": 884} {"train_loss": -5.559769630432129, "global_step": 37148, "epoch": 884} {"train_loss": -5.565122604370117, "global_step": 37149, "epoch": 884} {"train_loss": -5.68766975402832, "global_step": 37150, "epoch": 884} {"train_loss": -5.569355010986328, "global_step": 37151, "epoch": 884} {"train_loss": -5.6396708488464355, "global_step": 37152, "epoch": 884} {"train_loss": -5.642374038696289, "global_step": 37153, "epoch": 884} {"train_loss": -5.57404088973999, "global_step": 37154, "epoch": 884} {"train_loss": -5.495335578918457, "global_step": 37155, "epoch": 884} {"train_loss": -5.596149444580078, "global_step": 37156, "epoch": 884} {"train_loss": -5.620486736297607, "global_step": 37157, "epoch": 884} {"train_loss": -5.49683952331543, "global_step": 37158, "epoch": 884} {"train_loss": -5.665071487426758, "global_step": 37159, "epoch": 884} {"train_loss": -5.504121780395508, "global_step": 37160, "epoch": 884} {"train_loss": -5.538472652435303, "global_step": 37161, "epoch": 884} {"train_loss": -5.620224475860596, "global_step": 37162, "epoch": 884} {"train_loss": -5.608803749084473, "global_step": 37163, "epoch": 884} {"train_loss": -5.620777130126953, "global_step": 37164, "epoch": 884} {"train_loss": -5.606113433837891, "global_step": 37165, "epoch": 884} {"train_loss": -5.524219512939453, "global_step": 37166, "epoch": 884} {"train_loss": -5.544760227203369, "global_step": 37167, "epoch": 884} {"train_loss": -5.692151069641113, "global_step": 37168, "epoch": 884} {"train_loss": -5.60301247097197, "global_step": 37169, "epoch": 884, "val_loss": 65877.0546875} {"train_loss": -5.621923923492432, "global_step": 37170, "epoch": 885} {"train_loss": -5.603626728057861, "global_step": 37171, "epoch": 885} {"train_loss": -5.714369773864746, "global_step": 37172, "epoch": 885} {"train_loss": -5.581172943115234, "global_step": 37173, "epoch": 885} {"train_loss": -5.645089149475098, "global_step": 37174, "epoch": 885} {"train_loss": -5.637470245361328, "global_step": 37175, "epoch": 885} {"train_loss": -5.632278919219971, "global_step": 37176, "epoch": 885} {"train_loss": -5.707918167114258, "global_step": 37177, "epoch": 885} {"train_loss": -5.5960187911987305, "global_step": 37178, "epoch": 885} {"train_loss": -5.611854076385498, "global_step": 37179, "epoch": 885} {"train_loss": -5.641932487487793, "global_step": 37180, "epoch": 885} {"train_loss": -5.54640007019043, "global_step": 37181, "epoch": 885} {"train_loss": -5.6077656745910645, "global_step": 37182, "epoch": 885} {"train_loss": -5.619646072387695, "global_step": 37183, "epoch": 885} {"train_loss": -5.454656600952148, "global_step": 37184, "epoch": 885} {"train_loss": -5.494595527648926, "global_step": 37185, "epoch": 885} {"train_loss": -5.558075904846191, "global_step": 37186, "epoch": 885} {"train_loss": -5.646748065948486, "global_step": 37187, "epoch": 885} {"train_loss": -5.536734580993652, "global_step": 37188, "epoch": 885} {"train_loss": -5.632009506225586, "global_step": 37189, "epoch": 885} {"train_loss": -5.5267486572265625, "global_step": 37190, "epoch": 885} {"train_loss": -5.5875773429870605, "global_step": 37191, "epoch": 885} {"train_loss": -5.6524763107299805, "global_step": 37192, "epoch": 885} {"train_loss": -5.556739807128906, "global_step": 37193, "epoch": 885} {"train_loss": -5.630087852478027, "global_step": 37194, "epoch": 885} {"train_loss": -5.504734992980957, "global_step": 37195, "epoch": 885} {"train_loss": -5.5717082023620605, "global_step": 37196, "epoch": 885} {"train_loss": -5.5844879150390625, "global_step": 37197, "epoch": 885} {"train_loss": -5.6532793045043945, "global_step": 37198, "epoch": 885} {"train_loss": -5.429670333862305, "global_step": 37199, "epoch": 885} {"train_loss": -5.653768539428711, "global_step": 37200, "epoch": 885} {"train_loss": -5.455719947814941, "global_step": 37201, "epoch": 885} {"train_loss": -5.6783270835876465, "global_step": 37202, "epoch": 885} {"train_loss": -5.616214275360107, "global_step": 37203, "epoch": 885} {"train_loss": -5.543173313140869, "global_step": 37204, "epoch": 885} {"train_loss": -5.551372528076172, "global_step": 37205, "epoch": 885} {"train_loss": -5.630624771118164, "global_step": 37206, "epoch": 885} {"train_loss": -5.468866348266602, "global_step": 37207, "epoch": 885} {"train_loss": -5.610078811645508, "global_step": 37208, "epoch": 885} {"train_loss": -5.49911642074585, "global_step": 37209, "epoch": 885} {"train_loss": -5.551584243774414, "global_step": 37210, "epoch": 885} {"train_loss": -5.585364727746873, "global_step": 37211, "epoch": 885, "val_loss": 65778.0} {"train_loss": -5.55301570892334, "global_step": 37212, "epoch": 886} {"train_loss": -5.563767433166504, "global_step": 37213, "epoch": 886} {"train_loss": -5.428510665893555, "global_step": 37214, "epoch": 886} {"train_loss": -5.60404634475708, "global_step": 37215, "epoch": 886} {"train_loss": -5.567806720733643, "global_step": 37216, "epoch": 886} {"train_loss": -5.705674171447754, "global_step": 37217, "epoch": 886} {"train_loss": -5.618767738342285, "global_step": 37218, "epoch": 886} {"train_loss": -5.596699237823486, "global_step": 37219, "epoch": 886} {"train_loss": -5.600583076477051, "global_step": 37220, "epoch": 886} {"train_loss": -5.614679336547852, "global_step": 37221, "epoch": 886} {"train_loss": -5.551435947418213, "global_step": 37222, "epoch": 886} {"train_loss": -5.583864212036133, "global_step": 37223, "epoch": 886} {"train_loss": -5.683727264404297, "global_step": 37224, "epoch": 886} {"train_loss": -5.6948113441467285, "global_step": 37225, "epoch": 886} {"train_loss": -5.657731056213379, "global_step": 37226, "epoch": 886} {"train_loss": -5.611798286437988, "global_step": 37227, "epoch": 886} {"train_loss": -5.543773651123047, "global_step": 37228, "epoch": 886} {"train_loss": -5.515317916870117, "global_step": 37229, "epoch": 886} {"train_loss": -5.657954216003418, "global_step": 37230, "epoch": 886} {"train_loss": -5.601716041564941, "global_step": 37231, "epoch": 886} {"train_loss": -5.608651161193848, "global_step": 37232, "epoch": 886} {"train_loss": -5.704729080200195, "global_step": 37233, "epoch": 886} {"train_loss": -5.626741886138916, "global_step": 37234, "epoch": 886} {"train_loss": -5.466242790222168, "global_step": 37235, "epoch": 886} {"train_loss": -5.456321716308594, "global_step": 37236, "epoch": 886} {"train_loss": -5.592715263366699, "global_step": 37237, "epoch": 886} {"train_loss": -5.678362846374512, "global_step": 37238, "epoch": 886} {"train_loss": -5.407326698303223, "global_step": 37239, "epoch": 886} {"train_loss": -5.475805282592773, "global_step": 37240, "epoch": 886} {"train_loss": -5.57002067565918, "global_step": 37241, "epoch": 886} {"train_loss": -5.51383638381958, "global_step": 37242, "epoch": 886} {"train_loss": -5.584211349487305, "global_step": 37243, "epoch": 886} {"train_loss": -5.5969038009643555, "global_step": 37244, "epoch": 886} {"train_loss": -5.472873687744141, "global_step": 37245, "epoch": 886} {"train_loss": -5.615607261657715, "global_step": 37246, "epoch": 886} {"train_loss": -5.641580104827881, "global_step": 37247, "epoch": 886} {"train_loss": -5.553609371185303, "global_step": 37248, "epoch": 886} {"train_loss": -5.602828502655029, "global_step": 37249, "epoch": 886} {"train_loss": -5.673654556274414, "global_step": 37250, "epoch": 886} {"train_loss": -5.650908470153809, "global_step": 37251, "epoch": 886} {"train_loss": -5.583583831787109, "global_step": 37252, "epoch": 886} {"train_loss": -5.586350781576974, "global_step": 37253, "epoch": 886, "val_loss": 65894.9375} {"train_loss": -5.62108850479126, "global_step": 37254, "epoch": 887} {"train_loss": -5.66826868057251, "global_step": 37255, "epoch": 887} {"train_loss": -5.594185829162598, "global_step": 37256, "epoch": 887} {"train_loss": -5.572840690612793, "global_step": 37257, "epoch": 887} {"train_loss": -5.630813121795654, "global_step": 37258, "epoch": 887} {"train_loss": -5.726768493652344, "global_step": 37259, "epoch": 887} {"train_loss": -5.481227874755859, "global_step": 37260, "epoch": 887} {"train_loss": -5.577235221862793, "global_step": 37261, "epoch": 887} {"train_loss": -5.748967170715332, "global_step": 37262, "epoch": 887} {"train_loss": -5.568452835083008, "global_step": 37263, "epoch": 887} {"train_loss": -5.741451740264893, "global_step": 37264, "epoch": 887} {"train_loss": -5.580935001373291, "global_step": 37265, "epoch": 887} {"train_loss": -5.625465393066406, "global_step": 37266, "epoch": 887} {"train_loss": -5.570261001586914, "global_step": 37267, "epoch": 887} {"train_loss": -5.52552604675293, "global_step": 37268, "epoch": 887} {"train_loss": -5.474031448364258, "global_step": 37269, "epoch": 887} {"train_loss": -5.663171768188477, "global_step": 37270, "epoch": 887} {"train_loss": -5.454216957092285, "global_step": 37271, "epoch": 887} {"train_loss": -5.636991500854492, "global_step": 37272, "epoch": 887} {"train_loss": -5.607166290283203, "global_step": 37273, "epoch": 887} {"train_loss": -5.570721626281738, "global_step": 37274, "epoch": 887} {"train_loss": -5.5062360763549805, "global_step": 37275, "epoch": 887} {"train_loss": -5.513958930969238, "global_step": 37276, "epoch": 887} {"train_loss": -5.497394561767578, "global_step": 37277, "epoch": 887} {"train_loss": -5.715778350830078, "global_step": 37278, "epoch": 887} {"train_loss": -5.4764909744262695, "global_step": 37279, "epoch": 887} {"train_loss": -5.514625549316406, "global_step": 37280, "epoch": 887} {"train_loss": -5.52671480178833, "global_step": 37281, "epoch": 887} {"train_loss": -5.531882286071777, "global_step": 37282, "epoch": 887} {"train_loss": -5.587638854980469, "global_step": 37283, "epoch": 887} {"train_loss": -5.699455261230469, "global_step": 37284, "epoch": 887} {"train_loss": -5.484187126159668, "global_step": 37285, "epoch": 887} {"train_loss": -5.543394088745117, "global_step": 37286, "epoch": 887} {"train_loss": -5.413815498352051, "global_step": 37287, "epoch": 887} {"train_loss": -5.48974609375, "global_step": 37288, "epoch": 887} {"train_loss": -5.515219688415527, "global_step": 37289, "epoch": 887} {"train_loss": -5.579124450683594, "global_step": 37290, "epoch": 887} {"train_loss": -5.680643081665039, "global_step": 37291, "epoch": 887} {"train_loss": -5.507232189178467, "global_step": 37292, "epoch": 887} {"train_loss": -5.621025085449219, "global_step": 37293, "epoch": 887} {"train_loss": -5.648698806762695, "global_step": 37294, "epoch": 887} {"train_loss": -5.575160492034185, "global_step": 37295, "epoch": 887, "val_loss": 66305.3203125} {"train_loss": -5.651869773864746, "global_step": 37296, "epoch": 888} {"train_loss": -5.596691131591797, "global_step": 37297, "epoch": 888} {"train_loss": -5.618919372558594, "global_step": 37298, "epoch": 888} {"train_loss": -5.590355396270752, "global_step": 37299, "epoch": 888} {"train_loss": -5.62660026550293, "global_step": 37300, "epoch": 888} {"train_loss": -5.592342376708984, "global_step": 37301, "epoch": 888} {"train_loss": -5.637948989868164, "global_step": 37302, "epoch": 888} {"train_loss": -5.5673346519470215, "global_step": 37303, "epoch": 888} {"train_loss": -5.560300827026367, "global_step": 37304, "epoch": 888} {"train_loss": -5.588987827301025, "global_step": 37305, "epoch": 888} {"train_loss": -5.55131196975708, "global_step": 37306, "epoch": 888} {"train_loss": -5.557964324951172, "global_step": 37307, "epoch": 888} {"train_loss": -5.6070709228515625, "global_step": 37308, "epoch": 888} {"train_loss": -5.630061149597168, "global_step": 37309, "epoch": 888} {"train_loss": -5.522987365722656, "global_step": 37310, "epoch": 888} {"train_loss": -5.436664581298828, "global_step": 37311, "epoch": 888} {"train_loss": -5.575597763061523, "global_step": 37312, "epoch": 888} {"train_loss": -5.557258129119873, "global_step": 37313, "epoch": 888} {"train_loss": -5.462451457977295, "global_step": 37314, "epoch": 888} {"train_loss": -5.7117509841918945, "global_step": 37315, "epoch": 888} {"train_loss": -5.405235290527344, "global_step": 37316, "epoch": 888} {"train_loss": -5.7081217765808105, "global_step": 37317, "epoch": 888} {"train_loss": -5.588878631591797, "global_step": 37318, "epoch": 888} {"train_loss": -5.573939323425293, "global_step": 37319, "epoch": 888} {"train_loss": -5.544615745544434, "global_step": 37320, "epoch": 888} {"train_loss": -5.523512363433838, "global_step": 37321, "epoch": 888} {"train_loss": -5.540940284729004, "global_step": 37322, "epoch": 888} {"train_loss": -5.626763343811035, "global_step": 37323, "epoch": 888} {"train_loss": -5.433889865875244, "global_step": 37324, "epoch": 888} {"train_loss": -5.770268440246582, "global_step": 37325, "epoch": 888} {"train_loss": -5.585318088531494, "global_step": 37326, "epoch": 888} {"train_loss": -5.579094886779785, "global_step": 37327, "epoch": 888} {"train_loss": -5.575920104980469, "global_step": 37328, "epoch": 888} {"train_loss": -5.6451826095581055, "global_step": 37329, "epoch": 888} {"train_loss": -5.4037580490112305, "global_step": 37330, "epoch": 888} {"train_loss": -5.722519874572754, "global_step": 37331, "epoch": 888} {"train_loss": -5.619106769561768, "global_step": 37332, "epoch": 888} {"train_loss": -5.553170204162598, "global_step": 37333, "epoch": 888} {"train_loss": -5.639537811279297, "global_step": 37334, "epoch": 888} {"train_loss": -5.627345085144043, "global_step": 37335, "epoch": 888} {"train_loss": -5.578379154205322, "global_step": 37336, "epoch": 888} {"train_loss": -5.584287132535662, "global_step": 37337, "epoch": 888, "val_loss": 66041.640625} {"train_loss": -5.596095085144043, "global_step": 37338, "epoch": 889} {"train_loss": -5.507882595062256, "global_step": 37339, "epoch": 889} {"train_loss": -5.696294784545898, "global_step": 37340, "epoch": 889} {"train_loss": -5.597650051116943, "global_step": 37341, "epoch": 889} {"train_loss": -5.655172348022461, "global_step": 37342, "epoch": 889} {"train_loss": -5.619748115539551, "global_step": 37343, "epoch": 889} {"train_loss": -5.611250877380371, "global_step": 37344, "epoch": 889} {"train_loss": -5.6176042556762695, "global_step": 37345, "epoch": 889} {"train_loss": -5.5302934646606445, "global_step": 37346, "epoch": 889} {"train_loss": -5.577057361602783, "global_step": 37347, "epoch": 889} {"train_loss": -5.718338489532471, "global_step": 37348, "epoch": 889} {"train_loss": -5.678840160369873, "global_step": 37349, "epoch": 889} {"train_loss": -5.5718584060668945, "global_step": 37350, "epoch": 889} {"train_loss": -5.568711757659912, "global_step": 37351, "epoch": 889} {"train_loss": -5.526708602905273, "global_step": 37352, "epoch": 889} {"train_loss": -5.593476295471191, "global_step": 37353, "epoch": 889} {"train_loss": -5.70600700378418, "global_step": 37354, "epoch": 889} {"train_loss": -5.455142021179199, "global_step": 37355, "epoch": 889} {"train_loss": -5.687747955322266, "global_step": 37356, "epoch": 889} {"train_loss": -5.559140682220459, "global_step": 37357, "epoch": 889} {"train_loss": -5.75765323638916, "global_step": 37358, "epoch": 889} {"train_loss": -5.597382545471191, "global_step": 37359, "epoch": 889} {"train_loss": -5.619290351867676, "global_step": 37360, "epoch": 889} {"train_loss": -5.635476112365723, "global_step": 37361, "epoch": 889} {"train_loss": -5.534666061401367, "global_step": 37362, "epoch": 889} {"train_loss": -5.5582194328308105, "global_step": 37363, "epoch": 889} {"train_loss": -5.605254650115967, "global_step": 37364, "epoch": 889} {"train_loss": -5.585839748382568, "global_step": 37365, "epoch": 889} {"train_loss": -5.628970146179199, "global_step": 37366, "epoch": 889} {"train_loss": -5.525672912597656, "global_step": 37367, "epoch": 889} {"train_loss": -5.638075828552246, "global_step": 37368, "epoch": 889} {"train_loss": -5.5427961349487305, "global_step": 37369, "epoch": 889} {"train_loss": -5.623384475708008, "global_step": 37370, "epoch": 889} {"train_loss": -5.660841941833496, "global_step": 37371, "epoch": 889} {"train_loss": -5.676849842071533, "global_step": 37372, "epoch": 889} {"train_loss": -5.512456893920898, "global_step": 37373, "epoch": 889} {"train_loss": -5.521098613739014, "global_step": 37374, "epoch": 889} {"train_loss": -5.584245681762695, "global_step": 37375, "epoch": 889} {"train_loss": -5.588911056518555, "global_step": 37376, "epoch": 889} {"train_loss": -5.642458915710449, "global_step": 37377, "epoch": 889} {"train_loss": -5.517611503601074, "global_step": 37378, "epoch": 889} {"train_loss": -5.601079940795898, "global_step": 37379, "epoch": 889, "val_loss": 65980.09375} {"train_loss": -5.660550117492676, "global_step": 37380, "epoch": 890} {"train_loss": -5.6240739822387695, "global_step": 37381, "epoch": 890} {"train_loss": -5.520495414733887, "global_step": 37382, "epoch": 890} {"train_loss": -5.556463241577148, "global_step": 37383, "epoch": 890} {"train_loss": -5.592743873596191, "global_step": 37384, "epoch": 890} {"train_loss": -5.611837863922119, "global_step": 37385, "epoch": 890} {"train_loss": -5.507708549499512, "global_step": 37386, "epoch": 890} {"train_loss": -5.417959213256836, "global_step": 37387, "epoch": 890} {"train_loss": -5.673346996307373, "global_step": 37388, "epoch": 890} {"train_loss": -5.526313781738281, "global_step": 37389, "epoch": 890} {"train_loss": -5.56623649597168, "global_step": 37390, "epoch": 890} {"train_loss": -5.5969061851501465, "global_step": 37391, "epoch": 890} {"train_loss": -5.492998123168945, "global_step": 37392, "epoch": 890} {"train_loss": -5.56802225112915, "global_step": 37393, "epoch": 890} {"train_loss": -5.536919593811035, "global_step": 37394, "epoch": 890} {"train_loss": -5.637029647827148, "global_step": 37395, "epoch": 890} {"train_loss": -5.510125637054443, "global_step": 37396, "epoch": 890} {"train_loss": -5.5733113288879395, "global_step": 37397, "epoch": 890} {"train_loss": -5.403229236602783, "global_step": 37398, "epoch": 890} {"train_loss": -5.578871250152588, "global_step": 37399, "epoch": 890} {"train_loss": -5.558547496795654, "global_step": 37400, "epoch": 890} {"train_loss": -5.516975402832031, "global_step": 37401, "epoch": 890} {"train_loss": -5.699857711791992, "global_step": 37402, "epoch": 890} {"train_loss": -5.583089351654053, "global_step": 37403, "epoch": 890} {"train_loss": -5.594020843505859, "global_step": 37404, "epoch": 890} {"train_loss": -5.552924633026123, "global_step": 37405, "epoch": 890} {"train_loss": -5.6569414138793945, "global_step": 37406, "epoch": 890} {"train_loss": -5.643484115600586, "global_step": 37407, "epoch": 890} {"train_loss": -5.572187900543213, "global_step": 37408, "epoch": 890} {"train_loss": -5.587118625640869, "global_step": 37409, "epoch": 890} {"train_loss": -5.592409133911133, "global_step": 37410, "epoch": 890} {"train_loss": -5.604947090148926, "global_step": 37411, "epoch": 890} {"train_loss": -5.460134029388428, "global_step": 37412, "epoch": 890} {"train_loss": -5.447951316833496, "global_step": 37413, "epoch": 890} {"train_loss": -5.534140586853027, "global_step": 37414, "epoch": 890} {"train_loss": -5.667645454406738, "global_step": 37415, "epoch": 890} {"train_loss": -5.5527567863464355, "global_step": 37416, "epoch": 890} {"train_loss": -5.701093673706055, "global_step": 37417, "epoch": 890} {"train_loss": -5.635922908782959, "global_step": 37418, "epoch": 890} {"train_loss": -5.513881683349609, "global_step": 37419, "epoch": 890} {"train_loss": -5.607327461242676, "global_step": 37420, "epoch": 890} {"train_loss": -5.569300572077434, "global_step": 37421, "epoch": 890, "val_loss": 65833.15625} {"train_loss": -5.621157169342041, "global_step": 37422, "epoch": 891} {"train_loss": -5.6714677810668945, "global_step": 37423, "epoch": 891} {"train_loss": -5.529263496398926, "global_step": 37424, "epoch": 891} {"train_loss": -5.567770957946777, "global_step": 37425, "epoch": 891} {"train_loss": -5.63173246383667, "global_step": 37426, "epoch": 891} {"train_loss": -5.5193891525268555, "global_step": 37427, "epoch": 891} {"train_loss": -5.592440128326416, "global_step": 37428, "epoch": 891} {"train_loss": -5.6274566650390625, "global_step": 37429, "epoch": 891} {"train_loss": -5.514540672302246, "global_step": 37430, "epoch": 891} {"train_loss": -5.731161117553711, "global_step": 37431, "epoch": 891} {"train_loss": -5.736404895782471, "global_step": 37432, "epoch": 891} {"train_loss": -5.624118804931641, "global_step": 37433, "epoch": 891} {"train_loss": -5.624859809875488, "global_step": 37434, "epoch": 891} {"train_loss": -5.674686431884766, "global_step": 37435, "epoch": 891} {"train_loss": -5.525101661682129, "global_step": 37436, "epoch": 891} {"train_loss": -5.62118673324585, "global_step": 37437, "epoch": 891} {"train_loss": -5.622018814086914, "global_step": 37438, "epoch": 891} {"train_loss": -5.657029628753662, "global_step": 37439, "epoch": 891} {"train_loss": -5.558454513549805, "global_step": 37440, "epoch": 891} {"train_loss": -5.59849214553833, "global_step": 37441, "epoch": 891} {"train_loss": -5.589912414550781, "global_step": 37442, "epoch": 891} {"train_loss": -5.64417839050293, "global_step": 37443, "epoch": 891} {"train_loss": -5.5442118644714355, "global_step": 37444, "epoch": 891} {"train_loss": -5.552811145782471, "global_step": 37445, "epoch": 891} {"train_loss": -5.597321510314941, "global_step": 37446, "epoch": 891} {"train_loss": -5.5718302726745605, "global_step": 37447, "epoch": 891} {"train_loss": -5.559876441955566, "global_step": 37448, "epoch": 891} {"train_loss": -5.654661178588867, "global_step": 37449, "epoch": 891} {"train_loss": -5.552370071411133, "global_step": 37450, "epoch": 891} {"train_loss": -5.594424247741699, "global_step": 37451, "epoch": 891} {"train_loss": -5.509554386138916, "global_step": 37452, "epoch": 891} {"train_loss": -5.619142532348633, "global_step": 37453, "epoch": 891} {"train_loss": -5.623513221740723, "global_step": 37454, "epoch": 891} {"train_loss": -5.5810089111328125, "global_step": 37455, "epoch": 891} {"train_loss": -5.585052490234375, "global_step": 37456, "epoch": 891} {"train_loss": -5.467301368713379, "global_step": 37457, "epoch": 891} {"train_loss": -5.557224273681641, "global_step": 37458, "epoch": 891} {"train_loss": -5.502476692199707, "global_step": 37459, "epoch": 891} {"train_loss": -5.763205528259277, "global_step": 37460, "epoch": 891} {"train_loss": -5.492897987365723, "global_step": 37461, "epoch": 891} {"train_loss": -5.462881088256836, "global_step": 37462, "epoch": 891} {"train_loss": -5.593430008207049, "global_step": 37463, "epoch": 891, "val_loss": 65862.09375} {"train_loss": -5.458706855773926, "global_step": 37464, "epoch": 892} {"train_loss": -5.6173014640808105, "global_step": 37465, "epoch": 892} {"train_loss": -5.633607864379883, "global_step": 37466, "epoch": 892} {"train_loss": -5.539405822753906, "global_step": 37467, "epoch": 892} {"train_loss": -5.7418622970581055, "global_step": 37468, "epoch": 892} {"train_loss": -5.670692443847656, "global_step": 37469, "epoch": 892} {"train_loss": -5.695828437805176, "global_step": 37470, "epoch": 892} {"train_loss": -5.530241966247559, "global_step": 37471, "epoch": 892} {"train_loss": -5.652530670166016, "global_step": 37472, "epoch": 892} {"train_loss": -5.549307823181152, "global_step": 37473, "epoch": 892} {"train_loss": -5.501431941986084, "global_step": 37474, "epoch": 892} {"train_loss": -5.494894504547119, "global_step": 37475, "epoch": 892} {"train_loss": -5.688185691833496, "global_step": 37476, "epoch": 892} {"train_loss": -5.602900505065918, "global_step": 37477, "epoch": 892} {"train_loss": -5.506743907928467, "global_step": 37478, "epoch": 892} {"train_loss": -5.645565986633301, "global_step": 37479, "epoch": 892} {"train_loss": -5.696021556854248, "global_step": 37480, "epoch": 892} {"train_loss": -5.609225273132324, "global_step": 37481, "epoch": 892} {"train_loss": -5.5886125564575195, "global_step": 37482, "epoch": 892} {"train_loss": -5.479570388793945, "global_step": 37483, "epoch": 892} {"train_loss": -5.608542442321777, "global_step": 37484, "epoch": 892} {"train_loss": -5.68287467956543, "global_step": 37485, "epoch": 892} {"train_loss": -5.5850629806518555, "global_step": 37486, "epoch": 892} {"train_loss": -5.655572414398193, "global_step": 37487, "epoch": 892} {"train_loss": -5.631339073181152, "global_step": 37488, "epoch": 892} {"train_loss": -5.5378828048706055, "global_step": 37489, "epoch": 892} {"train_loss": -5.702192306518555, "global_step": 37490, "epoch": 892} {"train_loss": -5.624502182006836, "global_step": 37491, "epoch": 892} {"train_loss": -5.625180721282959, "global_step": 37492, "epoch": 892} {"train_loss": -5.562921047210693, "global_step": 37493, "epoch": 892} {"train_loss": -5.627391815185547, "global_step": 37494, "epoch": 892} {"train_loss": -5.552848815917969, "global_step": 37495, "epoch": 892} {"train_loss": -5.580845832824707, "global_step": 37496, "epoch": 892} {"train_loss": -5.638971328735352, "global_step": 37497, "epoch": 892} {"train_loss": -5.715972423553467, "global_step": 37498, "epoch": 892} {"train_loss": -5.567326545715332, "global_step": 37499, "epoch": 892} {"train_loss": -5.593975067138672, "global_step": 37500, "epoch": 892} {"train_loss": -5.652306079864502, "global_step": 37501, "epoch": 892} {"train_loss": -5.6605963706970215, "global_step": 37502, "epoch": 892} {"train_loss": -5.624942779541016, "global_step": 37503, "epoch": 892} {"train_loss": -5.634186744689941, "global_step": 37504, "epoch": 892} {"train_loss": -5.607676142737979, "global_step": 37505, "epoch": 892, "val_loss": 65968.203125} {"train_loss": -5.573575019836426, "global_step": 37506, "epoch": 893} {"train_loss": -5.600527286529541, "global_step": 37507, "epoch": 893} {"train_loss": -5.507691383361816, "global_step": 37508, "epoch": 893} {"train_loss": -5.746285915374756, "global_step": 37509, "epoch": 893} {"train_loss": -5.672035217285156, "global_step": 37510, "epoch": 893} {"train_loss": -5.539577484130859, "global_step": 37511, "epoch": 893} {"train_loss": -5.7513227462768555, "global_step": 37512, "epoch": 893} {"train_loss": -5.634479522705078, "global_step": 37513, "epoch": 893} {"train_loss": -5.604500770568848, "global_step": 37514, "epoch": 893} {"train_loss": -5.659717559814453, "global_step": 37515, "epoch": 893} {"train_loss": -5.455071449279785, "global_step": 37516, "epoch": 893} {"train_loss": -5.563660621643066, "global_step": 37517, "epoch": 893} {"train_loss": -5.650685787200928, "global_step": 37518, "epoch": 893} {"train_loss": -5.593677043914795, "global_step": 37519, "epoch": 893} {"train_loss": -5.620609760284424, "global_step": 37520, "epoch": 893} {"train_loss": -5.631560325622559, "global_step": 37521, "epoch": 893} {"train_loss": -5.6002020835876465, "global_step": 37522, "epoch": 893} {"train_loss": -5.563168525695801, "global_step": 37523, "epoch": 893} {"train_loss": -5.562439918518066, "global_step": 37524, "epoch": 893} {"train_loss": -5.535778045654297, "global_step": 37525, "epoch": 893} {"train_loss": -5.544528007507324, "global_step": 37526, "epoch": 893} {"train_loss": -5.643798828125, "global_step": 37527, "epoch": 893} {"train_loss": -5.644930839538574, "global_step": 37528, "epoch": 893} {"train_loss": -5.704398155212402, "global_step": 37529, "epoch": 893} {"train_loss": -5.456486701965332, "global_step": 37530, "epoch": 893} {"train_loss": -5.6473894119262695, "global_step": 37531, "epoch": 893} {"train_loss": -5.6713972091674805, "global_step": 37532, "epoch": 893} {"train_loss": -5.594051837921143, "global_step": 37533, "epoch": 893} {"train_loss": -5.664459228515625, "global_step": 37534, "epoch": 893} {"train_loss": -5.565968036651611, "global_step": 37535, "epoch": 893} {"train_loss": -5.629944801330566, "global_step": 37536, "epoch": 893} {"train_loss": -5.597821235656738, "global_step": 37537, "epoch": 893} {"train_loss": -5.552844047546387, "global_step": 37538, "epoch": 893} {"train_loss": -5.469210624694824, "global_step": 37539, "epoch": 893} {"train_loss": -5.576454162597656, "global_step": 37540, "epoch": 893} {"train_loss": -5.757369518280029, "global_step": 37541, "epoch": 893} {"train_loss": -5.432685852050781, "global_step": 37542, "epoch": 893} {"train_loss": -5.51737117767334, "global_step": 37543, "epoch": 893} {"train_loss": -5.70772647857666, "global_step": 37544, "epoch": 893} {"train_loss": -5.668392658233643, "global_step": 37545, "epoch": 893} {"train_loss": -5.616482257843018, "global_step": 37546, "epoch": 893} {"train_loss": -5.605956577119374, "global_step": 37547, "epoch": 893, "val_loss": 66374.9921875} {"train_loss": -5.504568099975586, "global_step": 37548, "epoch": 894} {"train_loss": -5.576539516448975, "global_step": 37549, "epoch": 894} {"train_loss": -5.682918548583984, "global_step": 37550, "epoch": 894} {"train_loss": -5.758665561676025, "global_step": 37551, "epoch": 894} {"train_loss": -5.586820602416992, "global_step": 37552, "epoch": 894} {"train_loss": -5.618240833282471, "global_step": 37553, "epoch": 894} {"train_loss": -5.49630069732666, "global_step": 37554, "epoch": 894} {"train_loss": -5.719156265258789, "global_step": 37555, "epoch": 894} {"train_loss": -5.634613037109375, "global_step": 37556, "epoch": 894} {"train_loss": -5.469130992889404, "global_step": 37557, "epoch": 894} {"train_loss": -5.54228401184082, "global_step": 37558, "epoch": 894} {"train_loss": -5.459794044494629, "global_step": 37559, "epoch": 894} {"train_loss": -5.548727035522461, "global_step": 37560, "epoch": 894} {"train_loss": -5.643581390380859, "global_step": 37561, "epoch": 894} {"train_loss": -5.465904235839844, "global_step": 37562, "epoch": 894} {"train_loss": -5.543276786804199, "global_step": 37563, "epoch": 894} {"train_loss": -5.401432037353516, "global_step": 37564, "epoch": 894} {"train_loss": -5.619503498077393, "global_step": 37565, "epoch": 894} {"train_loss": -5.550460338592529, "global_step": 37566, "epoch": 894} {"train_loss": -5.522367477416992, "global_step": 37567, "epoch": 894} {"train_loss": -5.606777191162109, "global_step": 37568, "epoch": 894} {"train_loss": -5.565619945526123, "global_step": 37569, "epoch": 894} {"train_loss": -5.629106521606445, "global_step": 37570, "epoch": 894} {"train_loss": -5.552890777587891, "global_step": 37571, "epoch": 894} {"train_loss": -5.628982067108154, "global_step": 37572, "epoch": 894} {"train_loss": -5.550891399383545, "global_step": 37573, "epoch": 894} {"train_loss": -5.691119194030762, "global_step": 37574, "epoch": 894} {"train_loss": -5.599432945251465, "global_step": 37575, "epoch": 894} {"train_loss": -5.632295608520508, "global_step": 37576, "epoch": 894} {"train_loss": -5.507895469665527, "global_step": 37577, "epoch": 894} {"train_loss": -5.482123851776123, "global_step": 37578, "epoch": 894} {"train_loss": -5.586415767669678, "global_step": 37579, "epoch": 894} {"train_loss": -5.478854179382324, "global_step": 37580, "epoch": 894} {"train_loss": -5.611678600311279, "global_step": 37581, "epoch": 894} {"train_loss": -5.613137245178223, "global_step": 37582, "epoch": 894} {"train_loss": -5.613708972930908, "global_step": 37583, "epoch": 894} {"train_loss": -5.648531913757324, "global_step": 37584, "epoch": 894} {"train_loss": -5.603923320770264, "global_step": 37585, "epoch": 894} {"train_loss": -5.457475662231445, "global_step": 37586, "epoch": 894} {"train_loss": -5.615176200866699, "global_step": 37587, "epoch": 894} {"train_loss": -5.563017845153809, "global_step": 37588, "epoch": 894} {"train_loss": -5.572141624632335, "global_step": 37589, "epoch": 894, "val_loss": 66020.4609375} {"train_loss": -5.6037092208862305, "global_step": 37590, "epoch": 895} {"train_loss": -5.570186614990234, "global_step": 37591, "epoch": 895} {"train_loss": -5.660943984985352, "global_step": 37592, "epoch": 895} {"train_loss": -5.5773725509643555, "global_step": 37593, "epoch": 895} {"train_loss": -5.6222004890441895, "global_step": 37594, "epoch": 895} {"train_loss": -5.580209732055664, "global_step": 37595, "epoch": 895} {"train_loss": -5.540750503540039, "global_step": 37596, "epoch": 895} {"train_loss": -5.568169116973877, "global_step": 37597, "epoch": 895} {"train_loss": -5.632184028625488, "global_step": 37598, "epoch": 895} {"train_loss": -5.688755035400391, "global_step": 37599, "epoch": 895} {"train_loss": -5.604769706726074, "global_step": 37600, "epoch": 895} {"train_loss": -5.720064163208008, "global_step": 37601, "epoch": 895} {"train_loss": -5.487178802490234, "global_step": 37602, "epoch": 895} {"train_loss": -5.583154678344727, "global_step": 37603, "epoch": 895} {"train_loss": -5.572855472564697, "global_step": 37604, "epoch": 895} {"train_loss": -5.480349540710449, "global_step": 37605, "epoch": 895} {"train_loss": -5.5771026611328125, "global_step": 37606, "epoch": 895} {"train_loss": -5.5185041427612305, "global_step": 37607, "epoch": 895} {"train_loss": -5.603948593139648, "global_step": 37608, "epoch": 895} {"train_loss": -5.4366865158081055, "global_step": 37609, "epoch": 895} {"train_loss": -5.7207536697387695, "global_step": 37610, "epoch": 895} {"train_loss": -5.694579601287842, "global_step": 37611, "epoch": 895} {"train_loss": -5.617843151092529, "global_step": 37612, "epoch": 895} {"train_loss": -5.415350914001465, "global_step": 37613, "epoch": 895} {"train_loss": -5.567135810852051, "global_step": 37614, "epoch": 895} {"train_loss": -5.612072944641113, "global_step": 37615, "epoch": 895} {"train_loss": -5.562623023986816, "global_step": 37616, "epoch": 895} {"train_loss": -5.587263584136963, "global_step": 37617, "epoch": 895} {"train_loss": -5.671255111694336, "global_step": 37618, "epoch": 895} {"train_loss": -5.587926387786865, "global_step": 37619, "epoch": 895} {"train_loss": -5.645052909851074, "global_step": 37620, "epoch": 895} {"train_loss": -5.540363311767578, "global_step": 37621, "epoch": 895} {"train_loss": -5.663322925567627, "global_step": 37622, "epoch": 895} {"train_loss": -5.638561248779297, "global_step": 37623, "epoch": 895} {"train_loss": -5.700613975524902, "global_step": 37624, "epoch": 895} {"train_loss": -5.570168495178223, "global_step": 37625, "epoch": 895} {"train_loss": -5.595434188842773, "global_step": 37626, "epoch": 895} {"train_loss": -5.603484153747559, "global_step": 37627, "epoch": 895} {"train_loss": -5.530446529388428, "global_step": 37628, "epoch": 895} {"train_loss": -5.630558967590332, "global_step": 37629, "epoch": 895} {"train_loss": -5.659801483154297, "global_step": 37630, "epoch": 895} {"train_loss": -5.597905147643316, "global_step": 37631, "epoch": 895, "val_loss": 65906.671875} {"train_loss": -5.64856481552124, "global_step": 37632, "epoch": 896} {"train_loss": -5.614754676818848, "global_step": 37633, "epoch": 896} {"train_loss": -5.646139144897461, "global_step": 37634, "epoch": 896} {"train_loss": -5.638362884521484, "global_step": 37635, "epoch": 896} {"train_loss": -5.628713607788086, "global_step": 37636, "epoch": 896} {"train_loss": -5.730245590209961, "global_step": 37637, "epoch": 896} {"train_loss": -5.67098331451416, "global_step": 37638, "epoch": 896} {"train_loss": -5.632413387298584, "global_step": 37639, "epoch": 896} {"train_loss": -5.504924774169922, "global_step": 37640, "epoch": 896} {"train_loss": -5.62135124206543, "global_step": 37641, "epoch": 896} {"train_loss": -5.573211669921875, "global_step": 37642, "epoch": 896} {"train_loss": -5.617233753204346, "global_step": 37643, "epoch": 896} {"train_loss": -5.59897518157959, "global_step": 37644, "epoch": 896} {"train_loss": -5.5850982666015625, "global_step": 37645, "epoch": 896} {"train_loss": -5.554162979125977, "global_step": 37646, "epoch": 896} {"train_loss": -5.645723342895508, "global_step": 37647, "epoch": 896} {"train_loss": -5.573214530944824, "global_step": 37648, "epoch": 896} {"train_loss": -5.585829257965088, "global_step": 37649, "epoch": 896} {"train_loss": -5.51406192779541, "global_step": 37650, "epoch": 896} {"train_loss": -5.512866973876953, "global_step": 37651, "epoch": 896} {"train_loss": -5.511621952056885, "global_step": 37652, "epoch": 896} {"train_loss": -5.645147323608398, "global_step": 37653, "epoch": 896} {"train_loss": -5.5566020011901855, "global_step": 37654, "epoch": 896} {"train_loss": -5.670912742614746, "global_step": 37655, "epoch": 896} {"train_loss": -5.611156463623047, "global_step": 37656, "epoch": 896} {"train_loss": -5.708474159240723, "global_step": 37657, "epoch": 896} {"train_loss": -5.4644670486450195, "global_step": 37658, "epoch": 896} {"train_loss": -5.633266925811768, "global_step": 37659, "epoch": 896} {"train_loss": -5.618279457092285, "global_step": 37660, "epoch": 896} {"train_loss": -5.583981990814209, "global_step": 37661, "epoch": 896} {"train_loss": -5.520694255828857, "global_step": 37662, "epoch": 896} {"train_loss": -5.5408172607421875, "global_step": 37663, "epoch": 896} {"train_loss": -5.70517635345459, "global_step": 37664, "epoch": 896} {"train_loss": -5.492372512817383, "global_step": 37665, "epoch": 896} {"train_loss": -5.50889778137207, "global_step": 37666, "epoch": 896} {"train_loss": -5.598348617553711, "global_step": 37667, "epoch": 896} {"train_loss": -5.469417572021484, "global_step": 37668, "epoch": 896} {"train_loss": -5.694576263427734, "global_step": 37669, "epoch": 896} {"train_loss": -5.38919734954834, "global_step": 37670, "epoch": 896} {"train_loss": -5.546246528625488, "global_step": 37671, "epoch": 896} {"train_loss": -5.623526573181152, "global_step": 37672, "epoch": 896} {"train_loss": -5.590220621653965, "global_step": 37673, "epoch": 896, "val_loss": 65920.359375} {"train_loss": -5.583730220794678, "global_step": 37674, "epoch": 897} {"train_loss": -5.51290225982666, "global_step": 37675, "epoch": 897} {"train_loss": -5.548801898956299, "global_step": 37676, "epoch": 897} {"train_loss": -5.579465866088867, "global_step": 37677, "epoch": 897} {"train_loss": -5.594675540924072, "global_step": 37678, "epoch": 897} {"train_loss": -5.558953285217285, "global_step": 37679, "epoch": 897} {"train_loss": -5.565650939941406, "global_step": 37680, "epoch": 897} {"train_loss": -5.705060958862305, "global_step": 37681, "epoch": 897} {"train_loss": -5.615986347198486, "global_step": 37682, "epoch": 897} {"train_loss": -5.618696689605713, "global_step": 37683, "epoch": 897} {"train_loss": -5.465471267700195, "global_step": 37684, "epoch": 897} {"train_loss": -5.587525367736816, "global_step": 37685, "epoch": 897} {"train_loss": -5.604671001434326, "global_step": 37686, "epoch": 897} {"train_loss": -5.589770317077637, "global_step": 37687, "epoch": 897} {"train_loss": -5.694427967071533, "global_step": 37688, "epoch": 897} {"train_loss": -5.64698600769043, "global_step": 37689, "epoch": 897} {"train_loss": -5.601919174194336, "global_step": 37690, "epoch": 897} {"train_loss": -5.5275678634643555, "global_step": 37691, "epoch": 897} {"train_loss": -5.515576362609863, "global_step": 37692, "epoch": 897} {"train_loss": -5.534607410430908, "global_step": 37693, "epoch": 897} {"train_loss": -5.5100297927856445, "global_step": 37694, "epoch": 897} {"train_loss": -5.599513530731201, "global_step": 37695, "epoch": 897} {"train_loss": -5.603977680206299, "global_step": 37696, "epoch": 897} {"train_loss": -5.569463729858398, "global_step": 37697, "epoch": 897} {"train_loss": -5.591130256652832, "global_step": 37698, "epoch": 897} {"train_loss": -5.594141960144043, "global_step": 37699, "epoch": 897} {"train_loss": -5.559521675109863, "global_step": 37700, "epoch": 897} {"train_loss": -5.50144100189209, "global_step": 37701, "epoch": 897} {"train_loss": -5.649681091308594, "global_step": 37702, "epoch": 897} {"train_loss": -5.535951614379883, "global_step": 37703, "epoch": 897} {"train_loss": -5.677181720733643, "global_step": 37704, "epoch": 897} {"train_loss": -5.538885116577148, "global_step": 37705, "epoch": 897} {"train_loss": -5.46834659576416, "global_step": 37706, "epoch": 897} {"train_loss": -5.6192851066589355, "global_step": 37707, "epoch": 897} {"train_loss": -5.531578063964844, "global_step": 37708, "epoch": 897} {"train_loss": -5.481014251708984, "global_step": 37709, "epoch": 897} {"train_loss": -5.58202600479126, "global_step": 37710, "epoch": 897} {"train_loss": -5.57883358001709, "global_step": 37711, "epoch": 897} {"train_loss": -5.564368724822998, "global_step": 37712, "epoch": 897} {"train_loss": -5.492483139038086, "global_step": 37713, "epoch": 897} {"train_loss": -5.469564914703369, "global_step": 37714, "epoch": 897} {"train_loss": -5.574193261918568, "global_step": 37715, "epoch": 897, "val_loss": 66536.8515625} {"train_loss": -5.5723772048950195, "global_step": 37716, "epoch": 898} {"train_loss": -5.546253204345703, "global_step": 37717, "epoch": 898} {"train_loss": -5.634438991546631, "global_step": 37718, "epoch": 898} {"train_loss": -5.425744533538818, "global_step": 37719, "epoch": 898} {"train_loss": -5.5762715339660645, "global_step": 37720, "epoch": 898} {"train_loss": -5.618424415588379, "global_step": 37721, "epoch": 898} {"train_loss": -5.450925827026367, "global_step": 37722, "epoch": 898} {"train_loss": -5.71597957611084, "global_step": 37723, "epoch": 898} {"train_loss": -5.663564682006836, "global_step": 37724, "epoch": 898} {"train_loss": -5.554625511169434, "global_step": 37725, "epoch": 898} {"train_loss": -5.53619384765625, "global_step": 37726, "epoch": 898} {"train_loss": -5.606382369995117, "global_step": 37727, "epoch": 898} {"train_loss": -5.527950286865234, "global_step": 37728, "epoch": 898} {"train_loss": -5.592097282409668, "global_step": 37729, "epoch": 898} {"train_loss": -5.493051528930664, "global_step": 37730, "epoch": 898} {"train_loss": -5.6375226974487305, "global_step": 37731, "epoch": 898} {"train_loss": -5.668658256530762, "global_step": 37732, "epoch": 898} {"train_loss": -5.649965286254883, "global_step": 37733, "epoch": 898} {"train_loss": -5.615849494934082, "global_step": 37734, "epoch": 898} {"train_loss": -5.58802604675293, "global_step": 37735, "epoch": 898} {"train_loss": -5.640663146972656, "global_step": 37736, "epoch": 898} {"train_loss": -5.658193588256836, "global_step": 37737, "epoch": 898} {"train_loss": -5.645552635192871, "global_step": 37738, "epoch": 898} {"train_loss": -5.562029838562012, "global_step": 37739, "epoch": 898} {"train_loss": -5.573067665100098, "global_step": 37740, "epoch": 898} {"train_loss": -5.628220081329346, "global_step": 37741, "epoch": 898} {"train_loss": -5.603794097900391, "global_step": 37742, "epoch": 898} {"train_loss": -5.562450408935547, "global_step": 37743, "epoch": 898} {"train_loss": -5.514729022979736, "global_step": 37744, "epoch": 898} {"train_loss": -5.652094841003418, "global_step": 37745, "epoch": 898} {"train_loss": -5.66853141784668, "global_step": 37746, "epoch": 898} {"train_loss": -5.627649307250977, "global_step": 37747, "epoch": 898} {"train_loss": -5.645997047424316, "global_step": 37748, "epoch": 898} {"train_loss": -5.716064453125, "global_step": 37749, "epoch": 898} {"train_loss": -5.4684014320373535, "global_step": 37750, "epoch": 898} {"train_loss": -5.605303764343262, "global_step": 37751, "epoch": 898} {"train_loss": -5.692177772521973, "global_step": 37752, "epoch": 898} {"train_loss": -5.643224716186523, "global_step": 37753, "epoch": 898} {"train_loss": -5.473773956298828, "global_step": 37754, "epoch": 898} {"train_loss": -5.592865943908691, "global_step": 37755, "epoch": 898} {"train_loss": -5.5865936279296875, "global_step": 37756, "epoch": 898} {"train_loss": -5.596137353352138, "global_step": 37757, "epoch": 898, "val_loss": 66086.703125} {"train_loss": -5.5020880699157715, "global_step": 37758, "epoch": 899} {"train_loss": -5.597476482391357, "global_step": 37759, "epoch": 899} {"train_loss": -5.5473527908325195, "global_step": 37760, "epoch": 899} {"train_loss": -5.581437110900879, "global_step": 37761, "epoch": 899} {"train_loss": -5.630001544952393, "global_step": 37762, "epoch": 899} {"train_loss": -5.660542011260986, "global_step": 37763, "epoch": 899} {"train_loss": -5.4053497314453125, "global_step": 37764, "epoch": 899} {"train_loss": -5.599010944366455, "global_step": 37765, "epoch": 899} {"train_loss": -5.578503131866455, "global_step": 37766, "epoch": 899} {"train_loss": -5.467220306396484, "global_step": 37767, "epoch": 899} {"train_loss": -5.619349479675293, "global_step": 37768, "epoch": 899} {"train_loss": -5.562811851501465, "global_step": 37769, "epoch": 899} {"train_loss": -5.7434306144714355, "global_step": 37770, "epoch": 899} {"train_loss": -5.654936790466309, "global_step": 37771, "epoch": 899} {"train_loss": -5.540675640106201, "global_step": 37772, "epoch": 899} {"train_loss": -5.611956596374512, "global_step": 37773, "epoch": 899} {"train_loss": -5.663236618041992, "global_step": 37774, "epoch": 899} {"train_loss": -5.674921035766602, "global_step": 37775, "epoch": 899} {"train_loss": -5.649164199829102, "global_step": 37776, "epoch": 899} {"train_loss": -5.536804676055908, "global_step": 37777, "epoch": 899} {"train_loss": -5.590305328369141, "global_step": 37778, "epoch": 899} {"train_loss": -5.534558296203613, "global_step": 37779, "epoch": 899} {"train_loss": -5.516657829284668, "global_step": 37780, "epoch": 899} {"train_loss": -5.745355129241943, "global_step": 37781, "epoch": 899} {"train_loss": -5.729143142700195, "global_step": 37782, "epoch": 899} {"train_loss": -5.50189208984375, "global_step": 37783, "epoch": 899} {"train_loss": -5.625284194946289, "global_step": 37784, "epoch": 899} {"train_loss": -5.606804847717285, "global_step": 37785, "epoch": 899} {"train_loss": -5.584712028503418, "global_step": 37786, "epoch": 899} {"train_loss": -5.691799640655518, "global_step": 37787, "epoch": 899} {"train_loss": -5.64752197265625, "global_step": 37788, "epoch": 899} {"train_loss": -5.724593162536621, "global_step": 37789, "epoch": 899} {"train_loss": -5.591648101806641, "global_step": 37790, "epoch": 899} {"train_loss": -5.5767340660095215, "global_step": 37791, "epoch": 899} {"train_loss": -5.669808864593506, "global_step": 37792, "epoch": 899} {"train_loss": -5.5728607177734375, "global_step": 37793, "epoch": 899} {"train_loss": -5.622289657592773, "global_step": 37794, "epoch": 899} {"train_loss": -5.635720729827881, "global_step": 37795, "epoch": 899} {"train_loss": -5.625751495361328, "global_step": 37796, "epoch": 899} {"train_loss": -5.578951835632324, "global_step": 37797, "epoch": 899} {"train_loss": -5.635660171508789, "global_step": 37798, "epoch": 899} {"train_loss": -5.602316027595883, "global_step": 37799, "epoch": 899, "val_loss": 66094.375} {"train_loss": -5.528019905090332, "global_step": 37800, "epoch": 900} {"train_loss": -5.582204818725586, "global_step": 37801, "epoch": 900} {"train_loss": -5.543859481811523, "global_step": 37802, "epoch": 900} {"train_loss": -5.624642372131348, "global_step": 37803, "epoch": 900} {"train_loss": -5.601375579833984, "global_step": 37804, "epoch": 900} {"train_loss": -5.643560409545898, "global_step": 37805, "epoch": 900} {"train_loss": -5.664324760437012, "global_step": 37806, "epoch": 900} {"train_loss": -5.550354957580566, "global_step": 37807, "epoch": 900} {"train_loss": -5.6048407554626465, "global_step": 37808, "epoch": 900} {"train_loss": -5.591102123260498, "global_step": 37809, "epoch": 900} {"train_loss": -5.499836444854736, "global_step": 37810, "epoch": 900} {"train_loss": -5.544554233551025, "global_step": 37811, "epoch": 900} {"train_loss": -5.596279144287109, "global_step": 37812, "epoch": 900} {"train_loss": -5.494658946990967, "global_step": 37813, "epoch": 900} {"train_loss": -5.66703987121582, "global_step": 37814, "epoch": 900} {"train_loss": -5.4423828125, "global_step": 37815, "epoch": 900} {"train_loss": -5.5979413986206055, "global_step": 37816, "epoch": 900} {"train_loss": -5.561334609985352, "global_step": 37817, "epoch": 900} {"train_loss": -5.53240442276001, "global_step": 37818, "epoch": 900} {"train_loss": -5.699432849884033, "global_step": 37819, "epoch": 900} {"train_loss": -5.56648588180542, "global_step": 37820, "epoch": 900} {"train_loss": -5.524267196655273, "global_step": 37821, "epoch": 900} {"train_loss": -5.611660003662109, "global_step": 37822, "epoch": 900} {"train_loss": -5.62471866607666, "global_step": 37823, "epoch": 900} {"train_loss": -5.539113998413086, "global_step": 37824, "epoch": 900} {"train_loss": -5.666531562805176, "global_step": 37825, "epoch": 900} {"train_loss": -5.555793762207031, "global_step": 37826, "epoch": 900} {"train_loss": -5.74528169631958, "global_step": 37827, "epoch": 900} {"train_loss": -5.703766822814941, "global_step": 37828, "epoch": 900} {"train_loss": -5.724311351776123, "global_step": 37829, "epoch": 900} {"train_loss": -5.559381484985352, "global_step": 37830, "epoch": 900} {"train_loss": -5.750494003295898, "global_step": 37831, "epoch": 900} {"train_loss": -5.585203647613525, "global_step": 37832, "epoch": 900} {"train_loss": -5.58527135848999, "global_step": 37833, "epoch": 900} {"train_loss": -5.579147815704346, "global_step": 37834, "epoch": 900} {"train_loss": -5.630797863006592, "global_step": 37835, "epoch": 900} {"train_loss": -5.728762626647949, "global_step": 37836, "epoch": 900} {"train_loss": -5.60390043258667, "global_step": 37837, "epoch": 900} {"train_loss": -5.603074073791504, "global_step": 37838, "epoch": 900} {"train_loss": -5.453995704650879, "global_step": 37839, "epoch": 900} {"train_loss": -5.720217227935791, "global_step": 37840, "epoch": 900} {"train_loss": -5.600626457305181, "global_step": 37841, "epoch": 900, "train/sim_max_reward_0": 0.4340081346960789, "train/sim_max_reward_1": 0.5870328529842381, "train/sim_max_reward_2": 0.5711921449617972, "train/sim_max_reward_3": 0.17357329847355363, "train/sim_max_reward_4": 0.5199227355081056, "train/sim_max_reward_5": 0.7025658404819686, "test/sim_max_reward_4400000": 0.2240891526472715, "test/sim_max_reward_4400001": 0.4611235724233168, "test/sim_max_reward_4400002": 0.319998553868091, "test/sim_max_reward_4400003": 0.007114492317506092, "test/sim_max_reward_4400004": 0.1830352194776119, "test/sim_max_reward_4400005": 0.13748302695332398, "test/sim_max_reward_4400006": 0.02051438767448489, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.4651138924048999, "test/sim_max_reward_4400009": 0.5839283861567914, "test/sim_max_reward_4400010": 0.2874179448084291, "test/sim_max_reward_4400011": 0.1979502398188337, "test/sim_max_reward_4400012": 0.37596977803179404, "test/sim_max_reward_4400013": 0.8502158917311036, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3270774020338197, "test/sim_max_reward_4400019": 0.46683761633397075, "test/sim_max_reward_4400020": 0.0002801417278551616, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.07730770849818305, "test/sim_max_reward_4400023": 0.12111810522248377, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.19413411034438977, "test/sim_max_reward_4400026": 0.09482508078091204, "test/sim_max_reward_4400027": 0.0063484486194079785, "test/sim_max_reward_4400028": 0.2803223653943145, "test/sim_max_reward_4400029": 0.15977268403996014, "test/sim_max_reward_4400030": 0.4059221859259544, "test/sim_max_reward_4400031": 0.3966773136937326, "test/sim_max_reward_4400032": 0.31792614700342264, "test/sim_max_reward_4400033": 0.6940726487942531, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.4653593589462684, "test/sim_max_reward_4400036": 0.33864250225242554, "test/sim_max_reward_4400037": 0.2934528478217335, "test/sim_max_reward_4400038": 0.1498458193880794, "test/sim_max_reward_4400039": 0.7042676100213039, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.3248090485052725, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.13212817396801405, "test/sim_max_reward_4400044": 0.7485165719842002, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.2828926130462366, "test/sim_max_reward_4400047": 0.4605097911693041, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.12768670460416987, "train/mean_score": 0.49804916785095693, "test/mean_score": 0.24461116585860868, "val_loss": 65953.453125} {"train_loss": -5.517674922943115, "global_step": 37842, "epoch": 901} {"train_loss": -5.77194881439209, "global_step": 37843, "epoch": 901} {"train_loss": -5.751943588256836, "global_step": 37844, "epoch": 901} {"train_loss": -5.567065238952637, "global_step": 37845, "epoch": 901} {"train_loss": -5.646685600280762, "global_step": 37846, "epoch": 901} {"train_loss": -5.646927833557129, "global_step": 37847, "epoch": 901} {"train_loss": -5.637803077697754, "global_step": 37848, "epoch": 901} {"train_loss": -5.558358192443848, "global_step": 37849, "epoch": 901} {"train_loss": -5.724501609802246, "global_step": 37850, "epoch": 901} {"train_loss": -5.549571990966797, "global_step": 37851, "epoch": 901} {"train_loss": -5.710908889770508, "global_step": 37852, "epoch": 901} {"train_loss": -5.575959205627441, "global_step": 37853, "epoch": 901} {"train_loss": -5.700346946716309, "global_step": 37854, "epoch": 901} {"train_loss": -5.415287017822266, "global_step": 37855, "epoch": 901} {"train_loss": -5.565186023712158, "global_step": 37856, "epoch": 901} {"train_loss": -5.670260429382324, "global_step": 37857, "epoch": 901} {"train_loss": -5.632505416870117, "global_step": 37858, "epoch": 901} {"train_loss": -5.574423789978027, "global_step": 37859, "epoch": 901} {"train_loss": -5.615598678588867, "global_step": 37860, "epoch": 901} {"train_loss": -5.6699676513671875, "global_step": 37861, "epoch": 901} {"train_loss": -5.669497966766357, "global_step": 37862, "epoch": 901} {"train_loss": -5.723584175109863, "global_step": 37863, "epoch": 901} {"train_loss": -5.517935752868652, "global_step": 37864, "epoch": 901} {"train_loss": -5.650284767150879, "global_step": 37865, "epoch": 901} {"train_loss": -5.583703994750977, "global_step": 37866, "epoch": 901} {"train_loss": -5.658277988433838, "global_step": 37867, "epoch": 901} {"train_loss": -5.556745529174805, "global_step": 37868, "epoch": 901} {"train_loss": -5.6873555183410645, "global_step": 37869, "epoch": 901} {"train_loss": -5.622873306274414, "global_step": 37870, "epoch": 901} {"train_loss": -5.581807613372803, "global_step": 37871, "epoch": 901} {"train_loss": -5.650205612182617, "global_step": 37872, "epoch": 901} {"train_loss": -5.6272969245910645, "global_step": 37873, "epoch": 901} {"train_loss": -5.658633232116699, "global_step": 37874, "epoch": 901} {"train_loss": -5.665134429931641, "global_step": 37875, "epoch": 901} {"train_loss": -5.482191562652588, "global_step": 37876, "epoch": 901} {"train_loss": -5.665322303771973, "global_step": 37877, "epoch": 901} {"train_loss": -5.594145774841309, "global_step": 37878, "epoch": 901} {"train_loss": -5.4758758544921875, "global_step": 37879, "epoch": 901} {"train_loss": -5.672532081604004, "global_step": 37880, "epoch": 901} {"train_loss": -5.529884338378906, "global_step": 37881, "epoch": 901} {"train_loss": -5.640714645385742, "global_step": 37882, "epoch": 901} {"train_loss": -5.6195610364278155, "global_step": 37883, "epoch": 901, "val_loss": 65831.5390625} {"train_loss": -5.745151519775391, "global_step": 37884, "epoch": 902} {"train_loss": -5.509738922119141, "global_step": 37885, "epoch": 902} {"train_loss": -5.59372615814209, "global_step": 37886, "epoch": 902} {"train_loss": -5.604520797729492, "global_step": 37887, "epoch": 902} {"train_loss": -5.524454116821289, "global_step": 37888, "epoch": 902} {"train_loss": -5.601512908935547, "global_step": 37889, "epoch": 902} {"train_loss": -5.522538661956787, "global_step": 37890, "epoch": 902} {"train_loss": -5.728443145751953, "global_step": 37891, "epoch": 902} {"train_loss": -5.592045783996582, "global_step": 37892, "epoch": 902} {"train_loss": -5.6657562255859375, "global_step": 37893, "epoch": 902} {"train_loss": -5.731607437133789, "global_step": 37894, "epoch": 902} {"train_loss": -5.531096458435059, "global_step": 37895, "epoch": 902} {"train_loss": -5.692166328430176, "global_step": 37896, "epoch": 902} {"train_loss": -5.540810585021973, "global_step": 37897, "epoch": 902} {"train_loss": -5.602665901184082, "global_step": 37898, "epoch": 902} {"train_loss": -5.5225043296813965, "global_step": 37899, "epoch": 902} {"train_loss": -5.676244735717773, "global_step": 37900, "epoch": 902} {"train_loss": -5.61485481262207, "global_step": 37901, "epoch": 902} {"train_loss": -5.595355987548828, "global_step": 37902, "epoch": 902} {"train_loss": -5.524636268615723, "global_step": 37903, "epoch": 902} {"train_loss": -5.644314289093018, "global_step": 37904, "epoch": 902} {"train_loss": -5.586158752441406, "global_step": 37905, "epoch": 902} {"train_loss": -5.634885787963867, "global_step": 37906, "epoch": 902} {"train_loss": -5.6889567375183105, "global_step": 37907, "epoch": 902} {"train_loss": -5.695852279663086, "global_step": 37908, "epoch": 902} {"train_loss": -5.769576072692871, "global_step": 37909, "epoch": 902} {"train_loss": -5.584651470184326, "global_step": 37910, "epoch": 902} {"train_loss": -5.665440082550049, "global_step": 37911, "epoch": 902} {"train_loss": -5.517865180969238, "global_step": 37912, "epoch": 902} {"train_loss": -5.575127601623535, "global_step": 37913, "epoch": 902} {"train_loss": -5.698030948638916, "global_step": 37914, "epoch": 902} {"train_loss": -5.489688873291016, "global_step": 37915, "epoch": 902} {"train_loss": -5.542533874511719, "global_step": 37916, "epoch": 902} {"train_loss": -5.558000564575195, "global_step": 37917, "epoch": 902} {"train_loss": -5.532808303833008, "global_step": 37918, "epoch": 902} {"train_loss": -5.585690975189209, "global_step": 37919, "epoch": 902} {"train_loss": -5.552075386047363, "global_step": 37920, "epoch": 902} {"train_loss": -5.5727996826171875, "global_step": 37921, "epoch": 902} {"train_loss": -5.593055248260498, "global_step": 37922, "epoch": 902} {"train_loss": -5.381345272064209, "global_step": 37923, "epoch": 902} {"train_loss": -5.557199001312256, "global_step": 37924, "epoch": 902} {"train_loss": -5.598278443018596, "global_step": 37925, "epoch": 902, "val_loss": 66005.609375} {"train_loss": -5.57847261428833, "global_step": 37926, "epoch": 903} {"train_loss": -5.55185604095459, "global_step": 37927, "epoch": 903} {"train_loss": -5.569261074066162, "global_step": 37928, "epoch": 903} {"train_loss": -5.716717720031738, "global_step": 37929, "epoch": 903} {"train_loss": -5.61613655090332, "global_step": 37930, "epoch": 903} {"train_loss": -5.578422546386719, "global_step": 37931, "epoch": 903} {"train_loss": -5.7038798332214355, "global_step": 37932, "epoch": 903} {"train_loss": -5.585722923278809, "global_step": 37933, "epoch": 903} {"train_loss": -5.597530364990234, "global_step": 37934, "epoch": 903} {"train_loss": -5.615235328674316, "global_step": 37935, "epoch": 903} {"train_loss": -5.667280673980713, "global_step": 37936, "epoch": 903} {"train_loss": -5.595940589904785, "global_step": 37937, "epoch": 903} {"train_loss": -5.574267387390137, "global_step": 37938, "epoch": 903} {"train_loss": -5.588817596435547, "global_step": 37939, "epoch": 903} {"train_loss": -5.5485687255859375, "global_step": 37940, "epoch": 903} {"train_loss": -5.489392280578613, "global_step": 37941, "epoch": 903} {"train_loss": -5.5289411544799805, "global_step": 37942, "epoch": 903} {"train_loss": -5.527225494384766, "global_step": 37943, "epoch": 903} {"train_loss": -5.583723068237305, "global_step": 37944, "epoch": 903} {"train_loss": -5.573224067687988, "global_step": 37945, "epoch": 903} {"train_loss": -5.620925426483154, "global_step": 37946, "epoch": 903} {"train_loss": -5.4329752922058105, "global_step": 37947, "epoch": 903} {"train_loss": -5.6307783126831055, "global_step": 37948, "epoch": 903} {"train_loss": -5.588929176330566, "global_step": 37949, "epoch": 903} {"train_loss": -5.614965438842773, "global_step": 37950, "epoch": 903} {"train_loss": -5.5429277420043945, "global_step": 37951, "epoch": 903} {"train_loss": -5.525107383728027, "global_step": 37952, "epoch": 903} {"train_loss": -5.59124755859375, "global_step": 37953, "epoch": 903} {"train_loss": -5.479137420654297, "global_step": 37954, "epoch": 903} {"train_loss": -5.4842000007629395, "global_step": 37955, "epoch": 903} {"train_loss": -5.438539981842041, "global_step": 37956, "epoch": 903} {"train_loss": -5.452942371368408, "global_step": 37957, "epoch": 903} {"train_loss": -5.650110244750977, "global_step": 37958, "epoch": 903} {"train_loss": -5.467080116271973, "global_step": 37959, "epoch": 903} {"train_loss": -5.4984822273254395, "global_step": 37960, "epoch": 903} {"train_loss": -5.466306209564209, "global_step": 37961, "epoch": 903} {"train_loss": -5.337561130523682, "global_step": 37962, "epoch": 903} {"train_loss": -5.515467643737793, "global_step": 37963, "epoch": 903} {"train_loss": -5.310882091522217, "global_step": 37964, "epoch": 903} {"train_loss": -5.7665863037109375, "global_step": 37965, "epoch": 903} {"train_loss": -5.468162536621094, "global_step": 37966, "epoch": 903} {"train_loss": -5.553885482606434, "global_step": 37967, "epoch": 903, "val_loss": 66806.2890625} {"train_loss": -5.5058159828186035, "global_step": 37968, "epoch": 904} {"train_loss": -5.509334087371826, "global_step": 37969, "epoch": 904} {"train_loss": -5.577446937561035, "global_step": 37970, "epoch": 904} {"train_loss": -5.447697639465332, "global_step": 37971, "epoch": 904} {"train_loss": -5.5707855224609375, "global_step": 37972, "epoch": 904} {"train_loss": -5.483858585357666, "global_step": 37973, "epoch": 904} {"train_loss": -5.516395568847656, "global_step": 37974, "epoch": 904} {"train_loss": -5.647809028625488, "global_step": 37975, "epoch": 904} {"train_loss": -5.597260475158691, "global_step": 37976, "epoch": 904} {"train_loss": -5.563899040222168, "global_step": 37977, "epoch": 904} {"train_loss": -5.686275482177734, "global_step": 37978, "epoch": 904} {"train_loss": -5.620804786682129, "global_step": 37979, "epoch": 904} {"train_loss": -5.5310211181640625, "global_step": 37980, "epoch": 904} {"train_loss": -5.687183380126953, "global_step": 37981, "epoch": 904} {"train_loss": -5.758216857910156, "global_step": 37982, "epoch": 904} {"train_loss": -5.532650470733643, "global_step": 37983, "epoch": 904} {"train_loss": -5.502631187438965, "global_step": 37984, "epoch": 904} {"train_loss": -5.562591075897217, "global_step": 37985, "epoch": 904} {"train_loss": -5.643770217895508, "global_step": 37986, "epoch": 904} {"train_loss": -5.630313873291016, "global_step": 37987, "epoch": 904} {"train_loss": -5.510447025299072, "global_step": 37988, "epoch": 904} {"train_loss": -5.564813613891602, "global_step": 37989, "epoch": 904} {"train_loss": -5.640617370605469, "global_step": 37990, "epoch": 904} {"train_loss": -5.578511714935303, "global_step": 37991, "epoch": 904} {"train_loss": -5.491597652435303, "global_step": 37992, "epoch": 904} {"train_loss": -5.748630046844482, "global_step": 37993, "epoch": 904} {"train_loss": -5.597336769104004, "global_step": 37994, "epoch": 904} {"train_loss": -5.611819744110107, "global_step": 37995, "epoch": 904} {"train_loss": -5.685399055480957, "global_step": 37996, "epoch": 904} {"train_loss": -5.599093437194824, "global_step": 37997, "epoch": 904} {"train_loss": -5.508686065673828, "global_step": 37998, "epoch": 904} {"train_loss": -5.587606430053711, "global_step": 37999, "epoch": 904} {"train_loss": -5.532179355621338, "global_step": 38000, "epoch": 904} {"train_loss": -5.603784084320068, "global_step": 38001, "epoch": 904} {"train_loss": -5.7119035720825195, "global_step": 38002, "epoch": 904} {"train_loss": -5.519678115844727, "global_step": 38003, "epoch": 904} {"train_loss": -5.654266357421875, "global_step": 38004, "epoch": 904} {"train_loss": -5.521018028259277, "global_step": 38005, "epoch": 904} {"train_loss": -5.557997703552246, "global_step": 38006, "epoch": 904} {"train_loss": -5.5900983810424805, "global_step": 38007, "epoch": 904} {"train_loss": -5.549633502960205, "global_step": 38008, "epoch": 904} {"train_loss": -5.584199485324678, "global_step": 38009, "epoch": 904, "val_loss": 66022.09375} {"train_loss": -5.611357688903809, "global_step": 38010, "epoch": 905} {"train_loss": -5.459103584289551, "global_step": 38011, "epoch": 905} {"train_loss": -5.568957328796387, "global_step": 38012, "epoch": 905} {"train_loss": -5.573025226593018, "global_step": 38013, "epoch": 905} {"train_loss": -5.529389381408691, "global_step": 38014, "epoch": 905} {"train_loss": -5.609926700592041, "global_step": 38015, "epoch": 905} {"train_loss": -5.643729209899902, "global_step": 38016, "epoch": 905} {"train_loss": -5.654770374298096, "global_step": 38017, "epoch": 905} {"train_loss": -5.658540725708008, "global_step": 38018, "epoch": 905} {"train_loss": -5.6826887130737305, "global_step": 38019, "epoch": 905} {"train_loss": -5.561862468719482, "global_step": 38020, "epoch": 905} {"train_loss": -5.537754535675049, "global_step": 38021, "epoch": 905} {"train_loss": -5.6669230461120605, "global_step": 38022, "epoch": 905} {"train_loss": -5.568416118621826, "global_step": 38023, "epoch": 905} {"train_loss": -5.3921589851379395, "global_step": 38024, "epoch": 905} {"train_loss": -5.7650017738342285, "global_step": 38025, "epoch": 905} {"train_loss": -5.67962646484375, "global_step": 38026, "epoch": 905} {"train_loss": -5.556452751159668, "global_step": 38027, "epoch": 905} {"train_loss": -5.501530170440674, "global_step": 38028, "epoch": 905} {"train_loss": -5.564326763153076, "global_step": 38029, "epoch": 905} {"train_loss": -5.411151885986328, "global_step": 38030, "epoch": 905} {"train_loss": -5.600729942321777, "global_step": 38031, "epoch": 905} {"train_loss": -5.700286865234375, "global_step": 38032, "epoch": 905} {"train_loss": -5.718659400939941, "global_step": 38033, "epoch": 905} {"train_loss": -5.6140336990356445, "global_step": 38034, "epoch": 905} {"train_loss": -5.631778240203857, "global_step": 38035, "epoch": 905} {"train_loss": -5.542220115661621, "global_step": 38036, "epoch": 905} {"train_loss": -5.635763168334961, "global_step": 38037, "epoch": 905} {"train_loss": -5.648639678955078, "global_step": 38038, "epoch": 905} {"train_loss": -5.634429931640625, "global_step": 38039, "epoch": 905} {"train_loss": -5.589400291442871, "global_step": 38040, "epoch": 905} {"train_loss": -5.72849178314209, "global_step": 38041, "epoch": 905} {"train_loss": -5.642184257507324, "global_step": 38042, "epoch": 905} {"train_loss": -5.668783187866211, "global_step": 38043, "epoch": 905} {"train_loss": -5.576348781585693, "global_step": 38044, "epoch": 905} {"train_loss": -5.54084587097168, "global_step": 38045, "epoch": 905} {"train_loss": -5.592494010925293, "global_step": 38046, "epoch": 905} {"train_loss": -5.754110336303711, "global_step": 38047, "epoch": 905} {"train_loss": -5.5860395431518555, "global_step": 38048, "epoch": 905} {"train_loss": -5.594796180725098, "global_step": 38049, "epoch": 905} {"train_loss": -5.703266143798828, "global_step": 38050, "epoch": 905} {"train_loss": -5.607602471397037, "global_step": 38051, "epoch": 905, "val_loss": 66049.5390625} {"train_loss": -5.539124488830566, "global_step": 38052, "epoch": 906} {"train_loss": -5.55997371673584, "global_step": 38053, "epoch": 906} {"train_loss": -5.619277000427246, "global_step": 38054, "epoch": 906} {"train_loss": -5.588563442230225, "global_step": 38055, "epoch": 906} {"train_loss": -5.42961311340332, "global_step": 38056, "epoch": 906} {"train_loss": -5.57880973815918, "global_step": 38057, "epoch": 906} {"train_loss": -5.417130470275879, "global_step": 38058, "epoch": 906} {"train_loss": -5.413516998291016, "global_step": 38059, "epoch": 906} {"train_loss": -5.498055458068848, "global_step": 38060, "epoch": 906} {"train_loss": -5.424744606018066, "global_step": 38061, "epoch": 906} {"train_loss": -5.537372589111328, "global_step": 38062, "epoch": 906} {"train_loss": -5.419369697570801, "global_step": 38063, "epoch": 906} {"train_loss": -5.611001014709473, "global_step": 38064, "epoch": 906} {"train_loss": -5.539150238037109, "global_step": 38065, "epoch": 906} {"train_loss": -5.451302528381348, "global_step": 38066, "epoch": 906} {"train_loss": -5.577310562133789, "global_step": 38067, "epoch": 906} {"train_loss": -5.479039192199707, "global_step": 38068, "epoch": 906} {"train_loss": -5.617214679718018, "global_step": 38069, "epoch": 906} {"train_loss": -5.528430938720703, "global_step": 38070, "epoch": 906} {"train_loss": -5.547039031982422, "global_step": 38071, "epoch": 906} {"train_loss": -5.700565338134766, "global_step": 38072, "epoch": 906} {"train_loss": -5.551090717315674, "global_step": 38073, "epoch": 906} {"train_loss": -5.527137279510498, "global_step": 38074, "epoch": 906} {"train_loss": -5.609062194824219, "global_step": 38075, "epoch": 906} {"train_loss": -5.602405548095703, "global_step": 38076, "epoch": 906} {"train_loss": -5.515254497528076, "global_step": 38077, "epoch": 906} {"train_loss": -5.601382255554199, "global_step": 38078, "epoch": 906} {"train_loss": -5.600101947784424, "global_step": 38079, "epoch": 906} {"train_loss": -5.58988094329834, "global_step": 38080, "epoch": 906} {"train_loss": -5.557103157043457, "global_step": 38081, "epoch": 906} {"train_loss": -5.646706581115723, "global_step": 38082, "epoch": 906} {"train_loss": -5.534793376922607, "global_step": 38083, "epoch": 906} {"train_loss": -5.618078231811523, "global_step": 38084, "epoch": 906} {"train_loss": -5.624166965484619, "global_step": 38085, "epoch": 906} {"train_loss": -5.601698398590088, "global_step": 38086, "epoch": 906} {"train_loss": -5.683460235595703, "global_step": 38087, "epoch": 906} {"train_loss": -5.4074859619140625, "global_step": 38088, "epoch": 906} {"train_loss": -5.569497108459473, "global_step": 38089, "epoch": 906} {"train_loss": -5.5400896072387695, "global_step": 38090, "epoch": 906} {"train_loss": -5.650646686553955, "global_step": 38091, "epoch": 906} {"train_loss": -5.631084442138672, "global_step": 38092, "epoch": 906} {"train_loss": -5.555673031579881, "global_step": 38093, "epoch": 906, "val_loss": 66451.4453125} {"train_loss": -5.591050148010254, "global_step": 38094, "epoch": 907} {"train_loss": -5.652585029602051, "global_step": 38095, "epoch": 907} {"train_loss": -5.432577133178711, "global_step": 38096, "epoch": 907} {"train_loss": -5.582123279571533, "global_step": 38097, "epoch": 907} {"train_loss": -5.660040855407715, "global_step": 38098, "epoch": 907} {"train_loss": -5.527985095977783, "global_step": 38099, "epoch": 907} {"train_loss": -5.564730167388916, "global_step": 38100, "epoch": 907} {"train_loss": -5.48171329498291, "global_step": 38101, "epoch": 907} {"train_loss": -5.665101051330566, "global_step": 38102, "epoch": 907} {"train_loss": -5.550228595733643, "global_step": 38103, "epoch": 907} {"train_loss": -5.521825313568115, "global_step": 38104, "epoch": 907} {"train_loss": -5.636312961578369, "global_step": 38105, "epoch": 907} {"train_loss": -5.48500919342041, "global_step": 38106, "epoch": 907} {"train_loss": -5.515191078186035, "global_step": 38107, "epoch": 907} {"train_loss": -5.501266956329346, "global_step": 38108, "epoch": 907} {"train_loss": -5.545261859893799, "global_step": 38109, "epoch": 907} {"train_loss": -5.597049713134766, "global_step": 38110, "epoch": 907} {"train_loss": -5.542873382568359, "global_step": 38111, "epoch": 907} {"train_loss": -5.693422317504883, "global_step": 38112, "epoch": 907} {"train_loss": -5.4906158447265625, "global_step": 38113, "epoch": 907} {"train_loss": -5.596718788146973, "global_step": 38114, "epoch": 907} {"train_loss": -5.599731922149658, "global_step": 38115, "epoch": 907} {"train_loss": -5.643484115600586, "global_step": 38116, "epoch": 907} {"train_loss": -5.6441650390625, "global_step": 38117, "epoch": 907} {"train_loss": -5.503461837768555, "global_step": 38118, "epoch": 907} {"train_loss": -5.556244850158691, "global_step": 38119, "epoch": 907} {"train_loss": -5.600833892822266, "global_step": 38120, "epoch": 907} {"train_loss": -5.670884132385254, "global_step": 38121, "epoch": 907} {"train_loss": -5.572903633117676, "global_step": 38122, "epoch": 907} {"train_loss": -5.572195053100586, "global_step": 38123, "epoch": 907} {"train_loss": -5.566796779632568, "global_step": 38124, "epoch": 907} {"train_loss": -5.51757287979126, "global_step": 38125, "epoch": 907} {"train_loss": -5.574188232421875, "global_step": 38126, "epoch": 907} {"train_loss": -5.558899879455566, "global_step": 38127, "epoch": 907} {"train_loss": -5.668938636779785, "global_step": 38128, "epoch": 907} {"train_loss": -5.619677543640137, "global_step": 38129, "epoch": 907} {"train_loss": -5.645462989807129, "global_step": 38130, "epoch": 907} {"train_loss": -5.63671350479126, "global_step": 38131, "epoch": 907} {"train_loss": -5.721622467041016, "global_step": 38132, "epoch": 907} {"train_loss": -5.492227077484131, "global_step": 38133, "epoch": 907} {"train_loss": -5.600550651550293, "global_step": 38134, "epoch": 907} {"train_loss": -5.581685361408052, "global_step": 38135, "epoch": 907, "val_loss": 66144.8984375} {"train_loss": -5.617999076843262, "global_step": 38136, "epoch": 908} {"train_loss": -5.574863433837891, "global_step": 38137, "epoch": 908} {"train_loss": -5.507748126983643, "global_step": 38138, "epoch": 908} {"train_loss": -5.608020782470703, "global_step": 38139, "epoch": 908} {"train_loss": -5.429795742034912, "global_step": 38140, "epoch": 908} {"train_loss": -5.5253448486328125, "global_step": 38141, "epoch": 908} {"train_loss": -5.68068265914917, "global_step": 38142, "epoch": 908} {"train_loss": -5.492693901062012, "global_step": 38143, "epoch": 908} {"train_loss": -5.564807891845703, "global_step": 38144, "epoch": 908} {"train_loss": -5.483478546142578, "global_step": 38145, "epoch": 908} {"train_loss": -5.526165008544922, "global_step": 38146, "epoch": 908} {"train_loss": -5.556373596191406, "global_step": 38147, "epoch": 908} {"train_loss": -5.549291133880615, "global_step": 38148, "epoch": 908} {"train_loss": -5.584230422973633, "global_step": 38149, "epoch": 908} {"train_loss": -5.6596174240112305, "global_step": 38150, "epoch": 908} {"train_loss": -5.670256614685059, "global_step": 38151, "epoch": 908} {"train_loss": -5.581294059753418, "global_step": 38152, "epoch": 908} {"train_loss": -5.565682411193848, "global_step": 38153, "epoch": 908} {"train_loss": -5.559278964996338, "global_step": 38154, "epoch": 908} {"train_loss": -5.669299125671387, "global_step": 38155, "epoch": 908} {"train_loss": -5.6316680908203125, "global_step": 38156, "epoch": 908} {"train_loss": -5.675929546356201, "global_step": 38157, "epoch": 908} {"train_loss": -5.542889595031738, "global_step": 38158, "epoch": 908} {"train_loss": -5.629129409790039, "global_step": 38159, "epoch": 908} {"train_loss": -5.540965557098389, "global_step": 38160, "epoch": 908} {"train_loss": -5.579399585723877, "global_step": 38161, "epoch": 908} {"train_loss": -5.570674896240234, "global_step": 38162, "epoch": 908} {"train_loss": -5.489863872528076, "global_step": 38163, "epoch": 908} {"train_loss": -5.587516784667969, "global_step": 38164, "epoch": 908} {"train_loss": -5.713489532470703, "global_step": 38165, "epoch": 908} {"train_loss": -5.637904644012451, "global_step": 38166, "epoch": 908} {"train_loss": -5.562722206115723, "global_step": 38167, "epoch": 908} {"train_loss": -5.636801719665527, "global_step": 38168, "epoch": 908} {"train_loss": -5.474991798400879, "global_step": 38169, "epoch": 908} {"train_loss": -5.639000415802002, "global_step": 38170, "epoch": 908} {"train_loss": -5.603025436401367, "global_step": 38171, "epoch": 908} {"train_loss": -5.651595115661621, "global_step": 38172, "epoch": 908} {"train_loss": -5.536938190460205, "global_step": 38173, "epoch": 908} {"train_loss": -5.518632411956787, "global_step": 38174, "epoch": 908} {"train_loss": -5.530714988708496, "global_step": 38175, "epoch": 908} {"train_loss": -5.601661682128906, "global_step": 38176, "epoch": 908} {"train_loss": -5.580503202620006, "global_step": 38177, "epoch": 908, "val_loss": 66071.53125} {"train_loss": -5.503952980041504, "global_step": 38178, "epoch": 909} {"train_loss": -5.605555534362793, "global_step": 38179, "epoch": 909} {"train_loss": -5.594971656799316, "global_step": 38180, "epoch": 909} {"train_loss": -5.670248031616211, "global_step": 38181, "epoch": 909} {"train_loss": -5.604449272155762, "global_step": 38182, "epoch": 909} {"train_loss": -5.686107635498047, "global_step": 38183, "epoch": 909} {"train_loss": -5.6557159423828125, "global_step": 38184, "epoch": 909} {"train_loss": -5.6741414070129395, "global_step": 38185, "epoch": 909} {"train_loss": -5.5574541091918945, "global_step": 38186, "epoch": 909} {"train_loss": -5.526185989379883, "global_step": 38187, "epoch": 909} {"train_loss": -5.529036521911621, "global_step": 38188, "epoch": 909} {"train_loss": -5.611748695373535, "global_step": 38189, "epoch": 909} {"train_loss": -5.508615493774414, "global_step": 38190, "epoch": 909} {"train_loss": -5.665470600128174, "global_step": 38191, "epoch": 909} {"train_loss": -5.498660087585449, "global_step": 38192, "epoch": 909} {"train_loss": -5.549126625061035, "global_step": 38193, "epoch": 909} {"train_loss": -5.587894439697266, "global_step": 38194, "epoch": 909} {"train_loss": -5.6436004638671875, "global_step": 38195, "epoch": 909} {"train_loss": -5.52408504486084, "global_step": 38196, "epoch": 909} {"train_loss": -5.677553176879883, "global_step": 38197, "epoch": 909} {"train_loss": -5.7107038497924805, "global_step": 38198, "epoch": 909} {"train_loss": -5.783703804016113, "global_step": 38199, "epoch": 909} {"train_loss": -5.528593063354492, "global_step": 38200, "epoch": 909} {"train_loss": -5.565173149108887, "global_step": 38201, "epoch": 909} {"train_loss": -5.571503639221191, "global_step": 38202, "epoch": 909} {"train_loss": -5.538121223449707, "global_step": 38203, "epoch": 909} {"train_loss": -5.495189666748047, "global_step": 38204, "epoch": 909} {"train_loss": -5.654511451721191, "global_step": 38205, "epoch": 909} {"train_loss": -5.598572731018066, "global_step": 38206, "epoch": 909} {"train_loss": -5.560187339782715, "global_step": 38207, "epoch": 909} {"train_loss": -5.701739311218262, "global_step": 38208, "epoch": 909} {"train_loss": -5.615571022033691, "global_step": 38209, "epoch": 909} {"train_loss": -5.632469177246094, "global_step": 38210, "epoch": 909} {"train_loss": -5.613243579864502, "global_step": 38211, "epoch": 909} {"train_loss": -5.597474098205566, "global_step": 38212, "epoch": 909} {"train_loss": -5.622124671936035, "global_step": 38213, "epoch": 909} {"train_loss": -5.610284805297852, "global_step": 38214, "epoch": 909} {"train_loss": -5.68055534362793, "global_step": 38215, "epoch": 909} {"train_loss": -5.669614791870117, "global_step": 38216, "epoch": 909} {"train_loss": -5.635242938995361, "global_step": 38217, "epoch": 909} {"train_loss": -5.619800567626953, "global_step": 38218, "epoch": 909} {"train_loss": -5.606999794642131, "global_step": 38219, "epoch": 909, "val_loss": 65984.234375} {"train_loss": -5.683500289916992, "global_step": 38220, "epoch": 910} {"train_loss": -5.633988857269287, "global_step": 38221, "epoch": 910} {"train_loss": -5.736074447631836, "global_step": 38222, "epoch": 910} {"train_loss": -5.607307434082031, "global_step": 38223, "epoch": 910} {"train_loss": -5.530129432678223, "global_step": 38224, "epoch": 910} {"train_loss": -5.678001880645752, "global_step": 38225, "epoch": 910} {"train_loss": -5.443463325500488, "global_step": 38226, "epoch": 910} {"train_loss": -5.48514986038208, "global_step": 38227, "epoch": 910} {"train_loss": -5.583342552185059, "global_step": 38228, "epoch": 910} {"train_loss": -5.563146591186523, "global_step": 38229, "epoch": 910} {"train_loss": -5.564585208892822, "global_step": 38230, "epoch": 910} {"train_loss": -5.658107757568359, "global_step": 38231, "epoch": 910} {"train_loss": -5.485347747802734, "global_step": 38232, "epoch": 910} {"train_loss": -5.602121353149414, "global_step": 38233, "epoch": 910} {"train_loss": -5.539652347564697, "global_step": 38234, "epoch": 910} {"train_loss": -5.6871418952941895, "global_step": 38235, "epoch": 910} {"train_loss": -5.5715227127075195, "global_step": 38236, "epoch": 910} {"train_loss": -5.4333343505859375, "global_step": 38237, "epoch": 910} {"train_loss": -5.59124755859375, "global_step": 38238, "epoch": 910} {"train_loss": -5.64768648147583, "global_step": 38239, "epoch": 910} {"train_loss": -5.538704872131348, "global_step": 38240, "epoch": 910} {"train_loss": -5.621045112609863, "global_step": 38241, "epoch": 910} {"train_loss": -5.680156230926514, "global_step": 38242, "epoch": 910} {"train_loss": -5.509586334228516, "global_step": 38243, "epoch": 910} {"train_loss": -5.5464019775390625, "global_step": 38244, "epoch": 910} {"train_loss": -5.553483009338379, "global_step": 38245, "epoch": 910} {"train_loss": -5.496942520141602, "global_step": 38246, "epoch": 910} {"train_loss": -5.546906471252441, "global_step": 38247, "epoch": 910} {"train_loss": -5.6013031005859375, "global_step": 38248, "epoch": 910} {"train_loss": -5.7381086349487305, "global_step": 38249, "epoch": 910} {"train_loss": -5.6328125, "global_step": 38250, "epoch": 910} {"train_loss": -5.606493949890137, "global_step": 38251, "epoch": 910} {"train_loss": -5.634029388427734, "global_step": 38252, "epoch": 910} {"train_loss": -5.625870704650879, "global_step": 38253, "epoch": 910} {"train_loss": -5.545156478881836, "global_step": 38254, "epoch": 910} {"train_loss": -5.667677879333496, "global_step": 38255, "epoch": 910} {"train_loss": -5.567111492156982, "global_step": 38256, "epoch": 910} {"train_loss": -5.609501838684082, "global_step": 38257, "epoch": 910} {"train_loss": -5.4934515953063965, "global_step": 38258, "epoch": 910} {"train_loss": -5.643288612365723, "global_step": 38259, "epoch": 910} {"train_loss": -5.674447059631348, "global_step": 38260, "epoch": 910} {"train_loss": -5.5945299579983665, "global_step": 38261, "epoch": 910, "val_loss": 66060.625} {"train_loss": -5.5061211585998535, "global_step": 38262, "epoch": 911} {"train_loss": -5.611058712005615, "global_step": 38263, "epoch": 911} {"train_loss": -5.720592498779297, "global_step": 38264, "epoch": 911} {"train_loss": -5.596158981323242, "global_step": 38265, "epoch": 911} {"train_loss": -5.57313871383667, "global_step": 38266, "epoch": 911} {"train_loss": -5.596901893615723, "global_step": 38267, "epoch": 911} {"train_loss": -5.626300811767578, "global_step": 38268, "epoch": 911} {"train_loss": -5.6586785316467285, "global_step": 38269, "epoch": 911} {"train_loss": -5.583749771118164, "global_step": 38270, "epoch": 911} {"train_loss": -5.720643520355225, "global_step": 38271, "epoch": 911} {"train_loss": -5.639132022857666, "global_step": 38272, "epoch": 911} {"train_loss": -5.467207908630371, "global_step": 38273, "epoch": 911} {"train_loss": -5.6955742835998535, "global_step": 38274, "epoch": 911} {"train_loss": -5.716276168823242, "global_step": 38275, "epoch": 911} {"train_loss": -5.747748374938965, "global_step": 38276, "epoch": 911} {"train_loss": -5.604837894439697, "global_step": 38277, "epoch": 911} {"train_loss": -5.670955181121826, "global_step": 38278, "epoch": 911} {"train_loss": -5.5967793464660645, "global_step": 38279, "epoch": 911} {"train_loss": -5.591840744018555, "global_step": 38280, "epoch": 911} {"train_loss": -5.578240394592285, "global_step": 38281, "epoch": 911} {"train_loss": -5.662275314331055, "global_step": 38282, "epoch": 911} {"train_loss": -5.694432258605957, "global_step": 38283, "epoch": 911} {"train_loss": -5.567374229431152, "global_step": 38284, "epoch": 911} {"train_loss": -5.700096607208252, "global_step": 38285, "epoch": 911} {"train_loss": -5.7115325927734375, "global_step": 38286, "epoch": 911} {"train_loss": -5.516327857971191, "global_step": 38287, "epoch": 911} {"train_loss": -5.739148139953613, "global_step": 38288, "epoch": 911} {"train_loss": -5.518760681152344, "global_step": 38289, "epoch": 911} {"train_loss": -5.5761895179748535, "global_step": 38290, "epoch": 911} {"train_loss": -5.518625259399414, "global_step": 38291, "epoch": 911} {"train_loss": -5.528526306152344, "global_step": 38292, "epoch": 911} {"train_loss": -5.5109686851501465, "global_step": 38293, "epoch": 911} {"train_loss": -5.5345540046691895, "global_step": 38294, "epoch": 911} {"train_loss": -5.520033836364746, "global_step": 38295, "epoch": 911} {"train_loss": -5.499083042144775, "global_step": 38296, "epoch": 911} {"train_loss": -5.5659332275390625, "global_step": 38297, "epoch": 911} {"train_loss": -5.4604949951171875, "global_step": 38298, "epoch": 911} {"train_loss": -5.36372184753418, "global_step": 38299, "epoch": 911} {"train_loss": -5.5771074295043945, "global_step": 38300, "epoch": 911} {"train_loss": -5.323283672332764, "global_step": 38301, "epoch": 911} {"train_loss": -5.6239166259765625, "global_step": 38302, "epoch": 911} {"train_loss": -5.586905116126651, "global_step": 38303, "epoch": 911, "val_loss": 66205.4140625} {"train_loss": -5.704701900482178, "global_step": 38304, "epoch": 912} {"train_loss": -5.47206974029541, "global_step": 38305, "epoch": 912} {"train_loss": -5.4476518630981445, "global_step": 38306, "epoch": 912} {"train_loss": -5.535496711730957, "global_step": 38307, "epoch": 912} {"train_loss": -5.661746025085449, "global_step": 38308, "epoch": 912} {"train_loss": -5.516817092895508, "global_step": 38309, "epoch": 912} {"train_loss": -5.638111114501953, "global_step": 38310, "epoch": 912} {"train_loss": -5.549948215484619, "global_step": 38311, "epoch": 912} {"train_loss": -5.465846061706543, "global_step": 38312, "epoch": 912} {"train_loss": -5.551931381225586, "global_step": 38313, "epoch": 912} {"train_loss": -5.708627700805664, "global_step": 38314, "epoch": 912} {"train_loss": -5.593441009521484, "global_step": 38315, "epoch": 912} {"train_loss": -5.5268235206604, "global_step": 38316, "epoch": 912} {"train_loss": -5.585432052612305, "global_step": 38317, "epoch": 912} {"train_loss": -5.491122245788574, "global_step": 38318, "epoch": 912} {"train_loss": -5.595149993896484, "global_step": 38319, "epoch": 912} {"train_loss": -5.589578628540039, "global_step": 38320, "epoch": 912} {"train_loss": -5.425029754638672, "global_step": 38321, "epoch": 912} {"train_loss": -5.567190647125244, "global_step": 38322, "epoch": 912} {"train_loss": -5.450042247772217, "global_step": 38323, "epoch": 912} {"train_loss": -5.461726188659668, "global_step": 38324, "epoch": 912} {"train_loss": -5.553767204284668, "global_step": 38325, "epoch": 912} {"train_loss": -5.623500347137451, "global_step": 38326, "epoch": 912} {"train_loss": -5.4832611083984375, "global_step": 38327, "epoch": 912} {"train_loss": -5.533209800720215, "global_step": 38328, "epoch": 912} {"train_loss": -5.562419891357422, "global_step": 38329, "epoch": 912} {"train_loss": -5.629602909088135, "global_step": 38330, "epoch": 912} {"train_loss": -5.692426681518555, "global_step": 38331, "epoch": 912} {"train_loss": -5.675589561462402, "global_step": 38332, "epoch": 912} {"train_loss": -5.556088924407959, "global_step": 38333, "epoch": 912} {"train_loss": -5.549004554748535, "global_step": 38334, "epoch": 912} {"train_loss": -5.667577266693115, "global_step": 38335, "epoch": 912} {"train_loss": -5.599689960479736, "global_step": 38336, "epoch": 912} {"train_loss": -5.618361473083496, "global_step": 38337, "epoch": 912} {"train_loss": -5.646379470825195, "global_step": 38338, "epoch": 912} {"train_loss": -5.632603168487549, "global_step": 38339, "epoch": 912} {"train_loss": -5.6830339431762695, "global_step": 38340, "epoch": 912} {"train_loss": -5.577265739440918, "global_step": 38341, "epoch": 912} {"train_loss": -5.679601669311523, "global_step": 38342, "epoch": 912} {"train_loss": -5.558707237243652, "global_step": 38343, "epoch": 912} {"train_loss": -5.586830139160156, "global_step": 38344, "epoch": 912} {"train_loss": -5.579251414253598, "global_step": 38345, "epoch": 912, "val_loss": 65717.3671875} {"train_loss": -5.580536842346191, "global_step": 38346, "epoch": 913} {"train_loss": -5.478184223175049, "global_step": 38347, "epoch": 913} {"train_loss": -5.7754621505737305, "global_step": 38348, "epoch": 913} {"train_loss": -5.589003562927246, "global_step": 38349, "epoch": 913} {"train_loss": -5.601292610168457, "global_step": 38350, "epoch": 913} {"train_loss": -5.678282737731934, "global_step": 38351, "epoch": 913} {"train_loss": -5.514400482177734, "global_step": 38352, "epoch": 913} {"train_loss": -5.714225769042969, "global_step": 38353, "epoch": 913} {"train_loss": -5.684183120727539, "global_step": 38354, "epoch": 913} {"train_loss": -5.549078941345215, "global_step": 38355, "epoch": 913} {"train_loss": -5.620804786682129, "global_step": 38356, "epoch": 913} {"train_loss": -5.664139747619629, "global_step": 38357, "epoch": 913} {"train_loss": -5.628007888793945, "global_step": 38358, "epoch": 913} {"train_loss": -5.620065689086914, "global_step": 38359, "epoch": 913} {"train_loss": -5.72176456451416, "global_step": 38360, "epoch": 913} {"train_loss": -5.609875202178955, "global_step": 38361, "epoch": 913} {"train_loss": -5.552518844604492, "global_step": 38362, "epoch": 913} {"train_loss": -5.606107711791992, "global_step": 38363, "epoch": 913} {"train_loss": -5.617525100708008, "global_step": 38364, "epoch": 913} {"train_loss": -5.526398658752441, "global_step": 38365, "epoch": 913} {"train_loss": -5.500227928161621, "global_step": 38366, "epoch": 913} {"train_loss": -5.7361040115356445, "global_step": 38367, "epoch": 913} {"train_loss": -5.703328609466553, "global_step": 38368, "epoch": 913} {"train_loss": -5.496990203857422, "global_step": 38369, "epoch": 913} {"train_loss": -5.749789237976074, "global_step": 38370, "epoch": 913} {"train_loss": -5.6574506759643555, "global_step": 38371, "epoch": 913} {"train_loss": -5.642460346221924, "global_step": 38372, "epoch": 913} {"train_loss": -5.566514015197754, "global_step": 38373, "epoch": 913} {"train_loss": -5.569870948791504, "global_step": 38374, "epoch": 913} {"train_loss": -5.492679119110107, "global_step": 38375, "epoch": 913} {"train_loss": -5.55063533782959, "global_step": 38376, "epoch": 913} {"train_loss": -5.645867824554443, "global_step": 38377, "epoch": 913} {"train_loss": -5.560006141662598, "global_step": 38378, "epoch": 913} {"train_loss": -5.509587287902832, "global_step": 38379, "epoch": 913} {"train_loss": -5.640253067016602, "global_step": 38380, "epoch": 913} {"train_loss": -5.535977840423584, "global_step": 38381, "epoch": 913} {"train_loss": -5.588685989379883, "global_step": 38382, "epoch": 913} {"train_loss": -5.604018211364746, "global_step": 38383, "epoch": 913} {"train_loss": -5.435940742492676, "global_step": 38384, "epoch": 913} {"train_loss": -5.465930938720703, "global_step": 38385, "epoch": 913} {"train_loss": -5.566084384918213, "global_step": 38386, "epoch": 913} {"train_loss": -5.596728165944417, "global_step": 38387, "epoch": 913, "val_loss": 65954.828125} {"train_loss": -5.603623867034912, "global_step": 38388, "epoch": 914} {"train_loss": -5.645855903625488, "global_step": 38389, "epoch": 914} {"train_loss": -5.442511081695557, "global_step": 38390, "epoch": 914} {"train_loss": -5.657723426818848, "global_step": 38391, "epoch": 914} {"train_loss": -5.693472862243652, "global_step": 38392, "epoch": 914} {"train_loss": -5.630922794342041, "global_step": 38393, "epoch": 914} {"train_loss": -5.723333358764648, "global_step": 38394, "epoch": 914} {"train_loss": -5.730312347412109, "global_step": 38395, "epoch": 914} {"train_loss": -5.475532054901123, "global_step": 38396, "epoch": 914} {"train_loss": -5.674806594848633, "global_step": 38397, "epoch": 914} {"train_loss": -5.662076950073242, "global_step": 38398, "epoch": 914} {"train_loss": -5.580181121826172, "global_step": 38399, "epoch": 914} {"train_loss": -5.843921661376953, "global_step": 38400, "epoch": 914} {"train_loss": -5.462420463562012, "global_step": 38401, "epoch": 914} {"train_loss": -5.645400524139404, "global_step": 38402, "epoch": 914} {"train_loss": -5.5964674949646, "global_step": 38403, "epoch": 914} {"train_loss": -5.439940929412842, "global_step": 38404, "epoch": 914} {"train_loss": -5.622483253479004, "global_step": 38405, "epoch": 914} {"train_loss": -5.595459938049316, "global_step": 38406, "epoch": 914} {"train_loss": -5.66226053237915, "global_step": 38407, "epoch": 914} {"train_loss": -5.646677017211914, "global_step": 38408, "epoch": 914} {"train_loss": -5.732654571533203, "global_step": 38409, "epoch": 914} {"train_loss": -5.498021125793457, "global_step": 38410, "epoch": 914} {"train_loss": -5.558185577392578, "global_step": 38411, "epoch": 914} {"train_loss": -5.6286725997924805, "global_step": 38412, "epoch": 914} {"train_loss": -5.544225215911865, "global_step": 38413, "epoch": 914} {"train_loss": -5.575482368469238, "global_step": 38414, "epoch": 914} {"train_loss": -5.532716751098633, "global_step": 38415, "epoch": 914} {"train_loss": -5.603580474853516, "global_step": 38416, "epoch": 914} {"train_loss": -5.537270545959473, "global_step": 38417, "epoch": 914} {"train_loss": -5.625123023986816, "global_step": 38418, "epoch": 914} {"train_loss": -5.524751663208008, "global_step": 38419, "epoch": 914} {"train_loss": -5.521551132202148, "global_step": 38420, "epoch": 914} {"train_loss": -5.701545238494873, "global_step": 38421, "epoch": 914} {"train_loss": -5.389117240905762, "global_step": 38422, "epoch": 914} {"train_loss": -5.468469142913818, "global_step": 38423, "epoch": 914} {"train_loss": -5.523354530334473, "global_step": 38424, "epoch": 914} {"train_loss": -5.645260810852051, "global_step": 38425, "epoch": 914} {"train_loss": -5.597993850708008, "global_step": 38426, "epoch": 914} {"train_loss": -5.485036849975586, "global_step": 38427, "epoch": 914} {"train_loss": -5.50554084777832, "global_step": 38428, "epoch": 914} {"train_loss": -5.593037559872582, "global_step": 38429, "epoch": 914, "val_loss": 66709.09375} {"train_loss": -5.570246696472168, "global_step": 38430, "epoch": 915} {"train_loss": -5.633440017700195, "global_step": 38431, "epoch": 915} {"train_loss": -5.6042399406433105, "global_step": 38432, "epoch": 915} {"train_loss": -5.535932540893555, "global_step": 38433, "epoch": 915} {"train_loss": -5.663610458374023, "global_step": 38434, "epoch": 915} {"train_loss": -5.646790504455566, "global_step": 38435, "epoch": 915} {"train_loss": -5.693137168884277, "global_step": 38436, "epoch": 915} {"train_loss": -5.472222805023193, "global_step": 38437, "epoch": 915} {"train_loss": -5.609505653381348, "global_step": 38438, "epoch": 915} {"train_loss": -5.561272621154785, "global_step": 38439, "epoch": 915} {"train_loss": -5.660634994506836, "global_step": 38440, "epoch": 915} {"train_loss": -5.685609817504883, "global_step": 38441, "epoch": 915} {"train_loss": -5.702672481536865, "global_step": 38442, "epoch": 915} {"train_loss": -5.67262077331543, "global_step": 38443, "epoch": 915} {"train_loss": -5.496157646179199, "global_step": 38444, "epoch": 915} {"train_loss": -5.689570426940918, "global_step": 38445, "epoch": 915} {"train_loss": -5.580896854400635, "global_step": 38446, "epoch": 915} {"train_loss": -5.50272274017334, "global_step": 38447, "epoch": 915} {"train_loss": -5.532061576843262, "global_step": 38448, "epoch": 915} {"train_loss": -5.591174125671387, "global_step": 38449, "epoch": 915} {"train_loss": -5.589316368103027, "global_step": 38450, "epoch": 915} {"train_loss": -5.604020595550537, "global_step": 38451, "epoch": 915} {"train_loss": -5.671216011047363, "global_step": 38452, "epoch": 915} {"train_loss": -5.67609977722168, "global_step": 38453, "epoch": 915} {"train_loss": -5.650134563446045, "global_step": 38454, "epoch": 915} {"train_loss": -5.654955863952637, "global_step": 38455, "epoch": 915} {"train_loss": -5.492494583129883, "global_step": 38456, "epoch": 915} {"train_loss": -5.621949195861816, "global_step": 38457, "epoch": 915} {"train_loss": -5.709568023681641, "global_step": 38458, "epoch": 915} {"train_loss": -5.455789566040039, "global_step": 38459, "epoch": 915} {"train_loss": -5.5968017578125, "global_step": 38460, "epoch": 915} {"train_loss": -5.673942565917969, "global_step": 38461, "epoch": 915} {"train_loss": -5.651246070861816, "global_step": 38462, "epoch": 915} {"train_loss": -5.710379600524902, "global_step": 38463, "epoch": 915} {"train_loss": -5.684421539306641, "global_step": 38464, "epoch": 915} {"train_loss": -5.519128799438477, "global_step": 38465, "epoch": 915} {"train_loss": -5.594059467315674, "global_step": 38466, "epoch": 915} {"train_loss": -5.697562217712402, "global_step": 38467, "epoch": 915} {"train_loss": -5.7535247802734375, "global_step": 38468, "epoch": 915} {"train_loss": -5.711307525634766, "global_step": 38469, "epoch": 915} {"train_loss": -5.544564247131348, "global_step": 38470, "epoch": 915} {"train_loss": -5.619017896198091, "global_step": 38471, "epoch": 915, "val_loss": 66048.2421875} {"train_loss": -5.554230213165283, "global_step": 38472, "epoch": 916} {"train_loss": -5.656330108642578, "global_step": 38473, "epoch": 916} {"train_loss": -5.489489555358887, "global_step": 38474, "epoch": 916} {"train_loss": -5.490207195281982, "global_step": 38475, "epoch": 916} {"train_loss": -5.540588855743408, "global_step": 38476, "epoch": 916} {"train_loss": -5.67273473739624, "global_step": 38477, "epoch": 916} {"train_loss": -5.695869445800781, "global_step": 38478, "epoch": 916} {"train_loss": -5.583317279815674, "global_step": 38479, "epoch": 916} {"train_loss": -5.5805792808532715, "global_step": 38480, "epoch": 916} {"train_loss": -5.560465335845947, "global_step": 38481, "epoch": 916} {"train_loss": -5.495582580566406, "global_step": 38482, "epoch": 916} {"train_loss": -5.740176200866699, "global_step": 38483, "epoch": 916} {"train_loss": -5.62220573425293, "global_step": 38484, "epoch": 916} {"train_loss": -5.618334770202637, "global_step": 38485, "epoch": 916} {"train_loss": -5.605716228485107, "global_step": 38486, "epoch": 916} {"train_loss": -5.628008842468262, "global_step": 38487, "epoch": 916} {"train_loss": -5.400368690490723, "global_step": 38488, "epoch": 916} {"train_loss": -5.532223701477051, "global_step": 38489, "epoch": 916} {"train_loss": -5.648066520690918, "global_step": 38490, "epoch": 916} {"train_loss": -5.582806587219238, "global_step": 38491, "epoch": 916} {"train_loss": -5.628146171569824, "global_step": 38492, "epoch": 916} {"train_loss": -5.544008255004883, "global_step": 38493, "epoch": 916} {"train_loss": -5.55976676940918, "global_step": 38494, "epoch": 916} {"train_loss": -5.641502857208252, "global_step": 38495, "epoch": 916} {"train_loss": -5.582071781158447, "global_step": 38496, "epoch": 916} {"train_loss": -5.588101863861084, "global_step": 38497, "epoch": 916} {"train_loss": -5.645382404327393, "global_step": 38498, "epoch": 916} {"train_loss": -5.523189544677734, "global_step": 38499, "epoch": 916} {"train_loss": -5.472687721252441, "global_step": 38500, "epoch": 916} {"train_loss": -5.755346298217773, "global_step": 38501, "epoch": 916} {"train_loss": -5.561294078826904, "global_step": 38502, "epoch": 916} {"train_loss": -5.585160732269287, "global_step": 38503, "epoch": 916} {"train_loss": -5.6524224281311035, "global_step": 38504, "epoch": 916} {"train_loss": -5.5575103759765625, "global_step": 38505, "epoch": 916} {"train_loss": -5.542268753051758, "global_step": 38506, "epoch": 916} {"train_loss": -5.720083236694336, "global_step": 38507, "epoch": 916} {"train_loss": -5.546477317810059, "global_step": 38508, "epoch": 916} {"train_loss": -5.532423973083496, "global_step": 38509, "epoch": 916} {"train_loss": -5.4318766593933105, "global_step": 38510, "epoch": 916} {"train_loss": -5.511239051818848, "global_step": 38511, "epoch": 916} {"train_loss": -5.648798942565918, "global_step": 38512, "epoch": 916} {"train_loss": -5.580425012679327, "global_step": 38513, "epoch": 916, "val_loss": 66279.8125} {"train_loss": -5.682116508483887, "global_step": 38514, "epoch": 917} {"train_loss": -5.5246477127075195, "global_step": 38515, "epoch": 917} {"train_loss": -5.612060546875, "global_step": 38516, "epoch": 917} {"train_loss": -5.562395095825195, "global_step": 38517, "epoch": 917} {"train_loss": -5.566411972045898, "global_step": 38518, "epoch": 917} {"train_loss": -5.634482383728027, "global_step": 38519, "epoch": 917} {"train_loss": -5.798895835876465, "global_step": 38520, "epoch": 917} {"train_loss": -5.480914115905762, "global_step": 38521, "epoch": 917} {"train_loss": -5.615958213806152, "global_step": 38522, "epoch": 917} {"train_loss": -5.547657012939453, "global_step": 38523, "epoch": 917} {"train_loss": -5.534625053405762, "global_step": 38524, "epoch": 917} {"train_loss": -5.678322792053223, "global_step": 38525, "epoch": 917} {"train_loss": -5.519232273101807, "global_step": 38526, "epoch": 917} {"train_loss": -5.483242988586426, "global_step": 38527, "epoch": 917} {"train_loss": -5.540175437927246, "global_step": 38528, "epoch": 917} {"train_loss": -5.579563140869141, "global_step": 38529, "epoch": 917} {"train_loss": -5.548348903656006, "global_step": 38530, "epoch": 917} {"train_loss": -5.547831058502197, "global_step": 38531, "epoch": 917} {"train_loss": -5.655242919921875, "global_step": 38532, "epoch": 917} {"train_loss": -5.625934600830078, "global_step": 38533, "epoch": 917} {"train_loss": -5.484021186828613, "global_step": 38534, "epoch": 917} {"train_loss": -5.684432029724121, "global_step": 38535, "epoch": 917} {"train_loss": -5.586696147918701, "global_step": 38536, "epoch": 917} {"train_loss": -5.595554351806641, "global_step": 38537, "epoch": 917} {"train_loss": -5.682159423828125, "global_step": 38538, "epoch": 917} {"train_loss": -5.655979156494141, "global_step": 38539, "epoch": 917} {"train_loss": -5.5291290283203125, "global_step": 38540, "epoch": 917} {"train_loss": -5.553205490112305, "global_step": 38541, "epoch": 917} {"train_loss": -5.540013313293457, "global_step": 38542, "epoch": 917} {"train_loss": -5.610706329345703, "global_step": 38543, "epoch": 917} {"train_loss": -5.420914649963379, "global_step": 38544, "epoch": 917} {"train_loss": -5.631683349609375, "global_step": 38545, "epoch": 917} {"train_loss": -5.615205764770508, "global_step": 38546, "epoch": 917} {"train_loss": -5.722128868103027, "global_step": 38547, "epoch": 917} {"train_loss": -5.4349212646484375, "global_step": 38548, "epoch": 917} {"train_loss": -5.578264236450195, "global_step": 38549, "epoch": 917} {"train_loss": -5.624596118927002, "global_step": 38550, "epoch": 917} {"train_loss": -5.511116027832031, "global_step": 38551, "epoch": 917} {"train_loss": -5.571938514709473, "global_step": 38552, "epoch": 917} {"train_loss": -5.587368011474609, "global_step": 38553, "epoch": 917} {"train_loss": -5.611124038696289, "global_step": 38554, "epoch": 917} {"train_loss": -5.590230703353882, "global_step": 38555, "epoch": 917, "val_loss": 66416.8046875} {"train_loss": -5.463430404663086, "global_step": 38556, "epoch": 918} {"train_loss": -5.599587917327881, "global_step": 38557, "epoch": 918} {"train_loss": -5.422172546386719, "global_step": 38558, "epoch": 918} {"train_loss": -5.425758361816406, "global_step": 38559, "epoch": 918} {"train_loss": -5.605403900146484, "global_step": 38560, "epoch": 918} {"train_loss": -5.449113845825195, "global_step": 38561, "epoch": 918} {"train_loss": -5.617000102996826, "global_step": 38562, "epoch": 918} {"train_loss": -5.637307643890381, "global_step": 38563, "epoch": 918} {"train_loss": -5.477957725524902, "global_step": 38564, "epoch": 918} {"train_loss": -5.587650299072266, "global_step": 38565, "epoch": 918} {"train_loss": -5.502588272094727, "global_step": 38566, "epoch": 918} {"train_loss": -5.6396660804748535, "global_step": 38567, "epoch": 918} {"train_loss": -5.719944953918457, "global_step": 38568, "epoch": 918} {"train_loss": -5.512152194976807, "global_step": 38569, "epoch": 918} {"train_loss": -5.411194801330566, "global_step": 38570, "epoch": 918} {"train_loss": -5.587791442871094, "global_step": 38571, "epoch": 918} {"train_loss": -5.495162487030029, "global_step": 38572, "epoch": 918} {"train_loss": -5.547823905944824, "global_step": 38573, "epoch": 918} {"train_loss": -5.752471923828125, "global_step": 38574, "epoch": 918} {"train_loss": -5.468548774719238, "global_step": 38575, "epoch": 918} {"train_loss": -5.638058662414551, "global_step": 38576, "epoch": 918} {"train_loss": -5.624311447143555, "global_step": 38577, "epoch": 918} {"train_loss": -5.548356056213379, "global_step": 38578, "epoch": 918} {"train_loss": -5.379816055297852, "global_step": 38579, "epoch": 918} {"train_loss": -5.632698059082031, "global_step": 38580, "epoch": 918} {"train_loss": -5.674816131591797, "global_step": 38581, "epoch": 918} {"train_loss": -5.486064910888672, "global_step": 38582, "epoch": 918} {"train_loss": -5.560718059539795, "global_step": 38583, "epoch": 918} {"train_loss": -5.725255012512207, "global_step": 38584, "epoch": 918} {"train_loss": -5.566276550292969, "global_step": 38585, "epoch": 918} {"train_loss": -5.528176307678223, "global_step": 38586, "epoch": 918} {"train_loss": -5.680445194244385, "global_step": 38587, "epoch": 918} {"train_loss": -5.507550239562988, "global_step": 38588, "epoch": 918} {"train_loss": -5.3901567459106445, "global_step": 38589, "epoch": 918} {"train_loss": -5.609827041625977, "global_step": 38590, "epoch": 918} {"train_loss": -5.6455078125, "global_step": 38591, "epoch": 918} {"train_loss": -5.618659973144531, "global_step": 38592, "epoch": 918} {"train_loss": -5.599926948547363, "global_step": 38593, "epoch": 918} {"train_loss": -5.573696613311768, "global_step": 38594, "epoch": 918} {"train_loss": -5.541172981262207, "global_step": 38595, "epoch": 918} {"train_loss": -5.707954406738281, "global_step": 38596, "epoch": 918} {"train_loss": -5.563369512557983, "global_step": 38597, "epoch": 918, "val_loss": 66005.6875} {"train_loss": -5.584090232849121, "global_step": 38598, "epoch": 919} {"train_loss": -5.637645721435547, "global_step": 38599, "epoch": 919} {"train_loss": -5.559070110321045, "global_step": 38600, "epoch": 919} {"train_loss": -5.5909576416015625, "global_step": 38601, "epoch": 919} {"train_loss": -5.550061225891113, "global_step": 38602, "epoch": 919} {"train_loss": -5.5965189933776855, "global_step": 38603, "epoch": 919} {"train_loss": -5.449087142944336, "global_step": 38604, "epoch": 919} {"train_loss": -5.503366470336914, "global_step": 38605, "epoch": 919} {"train_loss": -5.453583240509033, "global_step": 38606, "epoch": 919} {"train_loss": -5.616049766540527, "global_step": 38607, "epoch": 919} {"train_loss": -5.491832733154297, "global_step": 38608, "epoch": 919} {"train_loss": -5.500691890716553, "global_step": 38609, "epoch": 919} {"train_loss": -5.497165679931641, "global_step": 38610, "epoch": 919} {"train_loss": -5.563600540161133, "global_step": 38611, "epoch": 919} {"train_loss": -5.521519184112549, "global_step": 38612, "epoch": 919} {"train_loss": -5.590968132019043, "global_step": 38613, "epoch": 919} {"train_loss": -5.750141143798828, "global_step": 38614, "epoch": 919} {"train_loss": -5.627863883972168, "global_step": 38615, "epoch": 919} {"train_loss": -5.610478401184082, "global_step": 38616, "epoch": 919} {"train_loss": -5.523954391479492, "global_step": 38617, "epoch": 919} {"train_loss": -5.589985370635986, "global_step": 38618, "epoch": 919} {"train_loss": -5.506558418273926, "global_step": 38619, "epoch": 919} {"train_loss": -5.683165550231934, "global_step": 38620, "epoch": 919} {"train_loss": -5.606574058532715, "global_step": 38621, "epoch": 919} {"train_loss": -5.632000923156738, "global_step": 38622, "epoch": 919} {"train_loss": -5.5433855056762695, "global_step": 38623, "epoch": 919} {"train_loss": -5.497381210327148, "global_step": 38624, "epoch": 919} {"train_loss": -5.673214912414551, "global_step": 38625, "epoch": 919} {"train_loss": -5.639034271240234, "global_step": 38626, "epoch": 919} {"train_loss": -5.591868877410889, "global_step": 38627, "epoch": 919} {"train_loss": -5.507339000701904, "global_step": 38628, "epoch": 919} {"train_loss": -5.715190410614014, "global_step": 38629, "epoch": 919} {"train_loss": -5.726606369018555, "global_step": 38630, "epoch": 919} {"train_loss": -5.559054374694824, "global_step": 38631, "epoch": 919} {"train_loss": -5.519069671630859, "global_step": 38632, "epoch": 919} {"train_loss": -5.634347438812256, "global_step": 38633, "epoch": 919} {"train_loss": -5.619571685791016, "global_step": 38634, "epoch": 919} {"train_loss": -5.714959144592285, "global_step": 38635, "epoch": 919} {"train_loss": -5.602107048034668, "global_step": 38636, "epoch": 919} {"train_loss": -5.533041000366211, "global_step": 38637, "epoch": 919} {"train_loss": -5.668123245239258, "global_step": 38638, "epoch": 919} {"train_loss": -5.584834995723906, "global_step": 38639, "epoch": 919, "val_loss": 66002.515625} {"train_loss": -5.5829362869262695, "global_step": 38640, "epoch": 920} {"train_loss": -5.5786590576171875, "global_step": 38641, "epoch": 920} {"train_loss": -5.54741907119751, "global_step": 38642, "epoch": 920} {"train_loss": -5.6543192863464355, "global_step": 38643, "epoch": 920} {"train_loss": -5.550957679748535, "global_step": 38644, "epoch": 920} {"train_loss": -5.5601911544799805, "global_step": 38645, "epoch": 920} {"train_loss": -5.685282230377197, "global_step": 38646, "epoch": 920} {"train_loss": -5.721832275390625, "global_step": 38647, "epoch": 920} {"train_loss": -5.85801887512207, "global_step": 38648, "epoch": 920} {"train_loss": -5.634331226348877, "global_step": 38649, "epoch": 920} {"train_loss": -5.586164474487305, "global_step": 38650, "epoch": 920} {"train_loss": -5.632094383239746, "global_step": 38651, "epoch": 920} {"train_loss": -5.601243019104004, "global_step": 38652, "epoch": 920} {"train_loss": -5.56522274017334, "global_step": 38653, "epoch": 920} {"train_loss": -5.594805717468262, "global_step": 38654, "epoch": 920} {"train_loss": -5.63165283203125, "global_step": 38655, "epoch": 920} {"train_loss": -5.544257164001465, "global_step": 38656, "epoch": 920} {"train_loss": -5.589691162109375, "global_step": 38657, "epoch": 920} {"train_loss": -5.597139358520508, "global_step": 38658, "epoch": 920} {"train_loss": -5.765179634094238, "global_step": 38659, "epoch": 920} {"train_loss": -5.562717914581299, "global_step": 38660, "epoch": 920} {"train_loss": -5.590561866760254, "global_step": 38661, "epoch": 920} {"train_loss": -5.695248603820801, "global_step": 38662, "epoch": 920} {"train_loss": -5.586804389953613, "global_step": 38663, "epoch": 920} {"train_loss": -5.586009979248047, "global_step": 38664, "epoch": 920} {"train_loss": -5.617849349975586, "global_step": 38665, "epoch": 920} {"train_loss": -5.690913200378418, "global_step": 38666, "epoch": 920} {"train_loss": -5.623804092407227, "global_step": 38667, "epoch": 920} {"train_loss": -5.734874725341797, "global_step": 38668, "epoch": 920} {"train_loss": -5.576470851898193, "global_step": 38669, "epoch": 920} {"train_loss": -5.55518913269043, "global_step": 38670, "epoch": 920} {"train_loss": -5.61773157119751, "global_step": 38671, "epoch": 920} {"train_loss": -5.5810394287109375, "global_step": 38672, "epoch": 920} {"train_loss": -5.532673358917236, "global_step": 38673, "epoch": 920} {"train_loss": -5.609577178955078, "global_step": 38674, "epoch": 920} {"train_loss": -5.73261833190918, "global_step": 38675, "epoch": 920} {"train_loss": -5.601134300231934, "global_step": 38676, "epoch": 920} {"train_loss": -5.691906929016113, "global_step": 38677, "epoch": 920} {"train_loss": -5.618313312530518, "global_step": 38678, "epoch": 920} {"train_loss": -5.510502815246582, "global_step": 38679, "epoch": 920} {"train_loss": -5.652729034423828, "global_step": 38680, "epoch": 920} {"train_loss": -5.6168953123546785, "global_step": 38681, "epoch": 920, "val_loss": 66158.046875} {"train_loss": -5.630259037017822, "global_step": 38682, "epoch": 921} {"train_loss": -5.587000846862793, "global_step": 38683, "epoch": 921} {"train_loss": -5.537559509277344, "global_step": 38684, "epoch": 921} {"train_loss": -5.587322235107422, "global_step": 38685, "epoch": 921} {"train_loss": -5.549129486083984, "global_step": 38686, "epoch": 921} {"train_loss": -5.617783546447754, "global_step": 38687, "epoch": 921} {"train_loss": -5.344321250915527, "global_step": 38688, "epoch": 921} {"train_loss": -5.530056953430176, "global_step": 38689, "epoch": 921} {"train_loss": -5.5596923828125, "global_step": 38690, "epoch": 921} {"train_loss": -5.556090354919434, "global_step": 38691, "epoch": 921} {"train_loss": -5.534317970275879, "global_step": 38692, "epoch": 921} {"train_loss": -5.676575660705566, "global_step": 38693, "epoch": 921} {"train_loss": -5.638920307159424, "global_step": 38694, "epoch": 921} {"train_loss": -5.485340118408203, "global_step": 38695, "epoch": 921} {"train_loss": -5.645243167877197, "global_step": 38696, "epoch": 921} {"train_loss": -5.283329963684082, "global_step": 38697, "epoch": 921} {"train_loss": -5.7093281745910645, "global_step": 38698, "epoch": 921} {"train_loss": -5.4438910484313965, "global_step": 38699, "epoch": 921} {"train_loss": -5.615188121795654, "global_step": 38700, "epoch": 921} {"train_loss": -5.466248035430908, "global_step": 38701, "epoch": 921} {"train_loss": -5.634042739868164, "global_step": 38702, "epoch": 921} {"train_loss": -5.47225284576416, "global_step": 38703, "epoch": 921} {"train_loss": -5.517270088195801, "global_step": 38704, "epoch": 921} {"train_loss": -5.599091529846191, "global_step": 38705, "epoch": 921} {"train_loss": -5.6380438804626465, "global_step": 38706, "epoch": 921} {"train_loss": -5.469975471496582, "global_step": 38707, "epoch": 921} {"train_loss": -5.516920566558838, "global_step": 38708, "epoch": 921} {"train_loss": -5.575441837310791, "global_step": 38709, "epoch": 921} {"train_loss": -5.5413713455200195, "global_step": 38710, "epoch": 921} {"train_loss": -5.574580192565918, "global_step": 38711, "epoch": 921} {"train_loss": -5.508246898651123, "global_step": 38712, "epoch": 921} {"train_loss": -5.469514846801758, "global_step": 38713, "epoch": 921} {"train_loss": -5.760377883911133, "global_step": 38714, "epoch": 921} {"train_loss": -5.41035270690918, "global_step": 38715, "epoch": 921} {"train_loss": -5.655951499938965, "global_step": 38716, "epoch": 921} {"train_loss": -5.490584373474121, "global_step": 38717, "epoch": 921} {"train_loss": -5.555088043212891, "global_step": 38718, "epoch": 921} {"train_loss": -5.623481750488281, "global_step": 38719, "epoch": 921} {"train_loss": -5.708494663238525, "global_step": 38720, "epoch": 921} {"train_loss": -5.482938766479492, "global_step": 38721, "epoch": 921} {"train_loss": -5.599308013916016, "global_step": 38722, "epoch": 921} {"train_loss": -5.556518350328718, "global_step": 38723, "epoch": 921, "val_loss": 66557.1328125} {"train_loss": -5.595425605773926, "global_step": 38724, "epoch": 922} {"train_loss": -5.582893371582031, "global_step": 38725, "epoch": 922} {"train_loss": -5.49678373336792, "global_step": 38726, "epoch": 922} {"train_loss": -5.721785545349121, "global_step": 38727, "epoch": 922} {"train_loss": -5.683767318725586, "global_step": 38728, "epoch": 922} {"train_loss": -5.53117036819458, "global_step": 38729, "epoch": 922} {"train_loss": -5.544520854949951, "global_step": 38730, "epoch": 922} {"train_loss": -5.613030910491943, "global_step": 38731, "epoch": 922} {"train_loss": -5.648575782775879, "global_step": 38732, "epoch": 922} {"train_loss": -5.443619251251221, "global_step": 38733, "epoch": 922} {"train_loss": -5.618191242218018, "global_step": 38734, "epoch": 922} {"train_loss": -5.599842071533203, "global_step": 38735, "epoch": 922} {"train_loss": -5.51329231262207, "global_step": 38736, "epoch": 922} {"train_loss": -5.558528900146484, "global_step": 38737, "epoch": 922} {"train_loss": -5.62393856048584, "global_step": 38738, "epoch": 922} {"train_loss": -5.811112403869629, "global_step": 38739, "epoch": 922} {"train_loss": -5.684395790100098, "global_step": 38740, "epoch": 922} {"train_loss": -5.560736656188965, "global_step": 38741, "epoch": 922} {"train_loss": -5.647594451904297, "global_step": 38742, "epoch": 922} {"train_loss": -5.573175430297852, "global_step": 38743, "epoch": 922} {"train_loss": -5.687685966491699, "global_step": 38744, "epoch": 922} {"train_loss": -5.701499938964844, "global_step": 38745, "epoch": 922} {"train_loss": -5.57883358001709, "global_step": 38746, "epoch": 922} {"train_loss": -5.543312072753906, "global_step": 38747, "epoch": 922} {"train_loss": -5.61128044128418, "global_step": 38748, "epoch": 922} {"train_loss": -5.58952522277832, "global_step": 38749, "epoch": 922} {"train_loss": -5.478432655334473, "global_step": 38750, "epoch": 922} {"train_loss": -5.568016529083252, "global_step": 38751, "epoch": 922} {"train_loss": -5.550799369812012, "global_step": 38752, "epoch": 922} {"train_loss": -5.518355369567871, "global_step": 38753, "epoch": 922} {"train_loss": -5.519292831420898, "global_step": 38754, "epoch": 922} {"train_loss": -5.542769432067871, "global_step": 38755, "epoch": 922} {"train_loss": -5.495011329650879, "global_step": 38756, "epoch": 922} {"train_loss": -5.603654861450195, "global_step": 38757, "epoch": 922} {"train_loss": -5.626294136047363, "global_step": 38758, "epoch": 922} {"train_loss": -5.505897521972656, "global_step": 38759, "epoch": 922} {"train_loss": -5.587194442749023, "global_step": 38760, "epoch": 922} {"train_loss": -5.356032371520996, "global_step": 38761, "epoch": 922} {"train_loss": -5.621262073516846, "global_step": 38762, "epoch": 922} {"train_loss": -5.658914089202881, "global_step": 38763, "epoch": 922} {"train_loss": -5.670596122741699, "global_step": 38764, "epoch": 922} {"train_loss": -5.590210051763625, "global_step": 38765, "epoch": 922, "val_loss": 65753.6640625} {"train_loss": -5.685962677001953, "global_step": 38766, "epoch": 923} {"train_loss": -5.568823337554932, "global_step": 38767, "epoch": 923} {"train_loss": -5.544563293457031, "global_step": 38768, "epoch": 923} {"train_loss": -5.70999813079834, "global_step": 38769, "epoch": 923} {"train_loss": -5.611227512359619, "global_step": 38770, "epoch": 923} {"train_loss": -5.599961280822754, "global_step": 38771, "epoch": 923} {"train_loss": -5.672739028930664, "global_step": 38772, "epoch": 923} {"train_loss": -5.556457996368408, "global_step": 38773, "epoch": 923} {"train_loss": -5.523867607116699, "global_step": 38774, "epoch": 923} {"train_loss": -5.741600036621094, "global_step": 38775, "epoch": 923} {"train_loss": -5.707755088806152, "global_step": 38776, "epoch": 923} {"train_loss": -5.726943492889404, "global_step": 38777, "epoch": 923} {"train_loss": -5.601673126220703, "global_step": 38778, "epoch": 923} {"train_loss": -5.672428131103516, "global_step": 38779, "epoch": 923} {"train_loss": -5.529729843139648, "global_step": 38780, "epoch": 923} {"train_loss": -5.676241874694824, "global_step": 38781, "epoch": 923} {"train_loss": -5.510329246520996, "global_step": 38782, "epoch": 923} {"train_loss": -5.57525110244751, "global_step": 38783, "epoch": 923} {"train_loss": -5.616507530212402, "global_step": 38784, "epoch": 923} {"train_loss": -5.683066368103027, "global_step": 38785, "epoch": 923} {"train_loss": -5.647337913513184, "global_step": 38786, "epoch": 923} {"train_loss": -5.583194732666016, "global_step": 38787, "epoch": 923} {"train_loss": -5.588304042816162, "global_step": 38788, "epoch": 923} {"train_loss": -5.552609920501709, "global_step": 38789, "epoch": 923} {"train_loss": -5.530215740203857, "global_step": 38790, "epoch": 923} {"train_loss": -5.572718143463135, "global_step": 38791, "epoch": 923} {"train_loss": -5.577898979187012, "global_step": 38792, "epoch": 923} {"train_loss": -5.66663932800293, "global_step": 38793, "epoch": 923} {"train_loss": -5.649203777313232, "global_step": 38794, "epoch": 923} {"train_loss": -5.664305686950684, "global_step": 38795, "epoch": 923} {"train_loss": -5.528659820556641, "global_step": 38796, "epoch": 923} {"train_loss": -5.683225154876709, "global_step": 38797, "epoch": 923} {"train_loss": -5.634279251098633, "global_step": 38798, "epoch": 923} {"train_loss": -5.608675956726074, "global_step": 38799, "epoch": 923} {"train_loss": -5.548135757446289, "global_step": 38800, "epoch": 923} {"train_loss": -5.6490936279296875, "global_step": 38801, "epoch": 923} {"train_loss": -5.72942590713501, "global_step": 38802, "epoch": 923} {"train_loss": -5.652736663818359, "global_step": 38803, "epoch": 923} {"train_loss": -5.609958648681641, "global_step": 38804, "epoch": 923} {"train_loss": -5.677128791809082, "global_step": 38805, "epoch": 923} {"train_loss": -5.620683670043945, "global_step": 38806, "epoch": 923} {"train_loss": -5.620134751001994, "global_step": 38807, "epoch": 923, "val_loss": 65860.1953125} {"train_loss": -5.629555702209473, "global_step": 38808, "epoch": 924} {"train_loss": -5.622851371765137, "global_step": 38809, "epoch": 924} {"train_loss": -5.714051246643066, "global_step": 38810, "epoch": 924} {"train_loss": -5.726007461547852, "global_step": 38811, "epoch": 924} {"train_loss": -5.691748142242432, "global_step": 38812, "epoch": 924} {"train_loss": -5.664834022521973, "global_step": 38813, "epoch": 924} {"train_loss": -5.714158058166504, "global_step": 38814, "epoch": 924} {"train_loss": -5.7279863357543945, "global_step": 38815, "epoch": 924} {"train_loss": -5.795243263244629, "global_step": 38816, "epoch": 924} {"train_loss": -5.639392375946045, "global_step": 38817, "epoch": 924} {"train_loss": -5.674992084503174, "global_step": 38818, "epoch": 924} {"train_loss": -5.427151679992676, "global_step": 38819, "epoch": 924} {"train_loss": -5.577502250671387, "global_step": 38820, "epoch": 924} {"train_loss": -5.641733169555664, "global_step": 38821, "epoch": 924} {"train_loss": -5.755571365356445, "global_step": 38822, "epoch": 924} {"train_loss": -5.450600624084473, "global_step": 38823, "epoch": 924} {"train_loss": -5.668517112731934, "global_step": 38824, "epoch": 924} {"train_loss": -5.524427890777588, "global_step": 38825, "epoch": 924} {"train_loss": -5.5626630783081055, "global_step": 38826, "epoch": 924} {"train_loss": -5.673027992248535, "global_step": 38827, "epoch": 924} {"train_loss": -5.4233598709106445, "global_step": 38828, "epoch": 924} {"train_loss": -5.587804794311523, "global_step": 38829, "epoch": 924} {"train_loss": -5.608956336975098, "global_step": 38830, "epoch": 924} {"train_loss": -5.568859100341797, "global_step": 38831, "epoch": 924} {"train_loss": -5.701722145080566, "global_step": 38832, "epoch": 924} {"train_loss": -5.647970199584961, "global_step": 38833, "epoch": 924} {"train_loss": -5.568648815155029, "global_step": 38834, "epoch": 924} {"train_loss": -5.655967712402344, "global_step": 38835, "epoch": 924} {"train_loss": -5.587569236755371, "global_step": 38836, "epoch": 924} {"train_loss": -5.5484113693237305, "global_step": 38837, "epoch": 924} {"train_loss": -5.616225242614746, "global_step": 38838, "epoch": 924} {"train_loss": -5.571516990661621, "global_step": 38839, "epoch": 924} {"train_loss": -5.653586387634277, "global_step": 38840, "epoch": 924} {"train_loss": -5.557636737823486, "global_step": 38841, "epoch": 924} {"train_loss": -5.678840160369873, "global_step": 38842, "epoch": 924} {"train_loss": -5.649715423583984, "global_step": 38843, "epoch": 924} {"train_loss": -5.465099811553955, "global_step": 38844, "epoch": 924} {"train_loss": -5.626489639282227, "global_step": 38845, "epoch": 924} {"train_loss": -5.418768882751465, "global_step": 38846, "epoch": 924} {"train_loss": -5.407700538635254, "global_step": 38847, "epoch": 924} {"train_loss": -5.446504592895508, "global_step": 38848, "epoch": 924} {"train_loss": -5.603813886642456, "global_step": 38849, "epoch": 924, "val_loss": 66367.921875} {"train_loss": -5.583305835723877, "global_step": 38850, "epoch": 925} {"train_loss": -5.45514440536499, "global_step": 38851, "epoch": 925} {"train_loss": -5.6079607009887695, "global_step": 38852, "epoch": 925} {"train_loss": -5.442227840423584, "global_step": 38853, "epoch": 925} {"train_loss": -5.594437122344971, "global_step": 38854, "epoch": 925} {"train_loss": -5.6353302001953125, "global_step": 38855, "epoch": 925} {"train_loss": -5.630699157714844, "global_step": 38856, "epoch": 925} {"train_loss": -5.582996368408203, "global_step": 38857, "epoch": 925} {"train_loss": -5.569666862487793, "global_step": 38858, "epoch": 925} {"train_loss": -5.536213397979736, "global_step": 38859, "epoch": 925} {"train_loss": -5.6710968017578125, "global_step": 38860, "epoch": 925} {"train_loss": -5.553596019744873, "global_step": 38861, "epoch": 925} {"train_loss": -5.563961029052734, "global_step": 38862, "epoch": 925} {"train_loss": -5.661494255065918, "global_step": 38863, "epoch": 925} {"train_loss": -5.711941719055176, "global_step": 38864, "epoch": 925} {"train_loss": -5.678532600402832, "global_step": 38865, "epoch": 925} {"train_loss": -5.627988815307617, "global_step": 38866, "epoch": 925} {"train_loss": -5.543322563171387, "global_step": 38867, "epoch": 925} {"train_loss": -5.5514984130859375, "global_step": 38868, "epoch": 925} {"train_loss": -5.560759544372559, "global_step": 38869, "epoch": 925} {"train_loss": -5.614964008331299, "global_step": 38870, "epoch": 925} {"train_loss": -5.533573627471924, "global_step": 38871, "epoch": 925} {"train_loss": -5.624698162078857, "global_step": 38872, "epoch": 925} {"train_loss": -5.5806965827941895, "global_step": 38873, "epoch": 925} {"train_loss": -5.546082496643066, "global_step": 38874, "epoch": 925} {"train_loss": -5.69439697265625, "global_step": 38875, "epoch": 925} {"train_loss": -5.654279708862305, "global_step": 38876, "epoch": 925} {"train_loss": -5.575282573699951, "global_step": 38877, "epoch": 925} {"train_loss": -5.641210556030273, "global_step": 38878, "epoch": 925} {"train_loss": -5.539501190185547, "global_step": 38879, "epoch": 925} {"train_loss": -5.601382255554199, "global_step": 38880, "epoch": 925} {"train_loss": -5.49672794342041, "global_step": 38881, "epoch": 925} {"train_loss": -5.581458568572998, "global_step": 38882, "epoch": 925} {"train_loss": -5.6092000007629395, "global_step": 38883, "epoch": 925} {"train_loss": -5.654484748840332, "global_step": 38884, "epoch": 925} {"train_loss": -5.582873344421387, "global_step": 38885, "epoch": 925} {"train_loss": -5.676119804382324, "global_step": 38886, "epoch": 925} {"train_loss": -5.724916458129883, "global_step": 38887, "epoch": 925} {"train_loss": -5.542852401733398, "global_step": 38888, "epoch": 925} {"train_loss": -5.732554912567139, "global_step": 38889, "epoch": 925} {"train_loss": -5.690820693969727, "global_step": 38890, "epoch": 925} {"train_loss": -5.599628993443081, "global_step": 38891, "epoch": 925, "val_loss": 65880.9921875} {"train_loss": -5.720721244812012, "global_step": 38892, "epoch": 926} {"train_loss": -5.660708427429199, "global_step": 38893, "epoch": 926} {"train_loss": -5.565295219421387, "global_step": 38894, "epoch": 926} {"train_loss": -5.792672157287598, "global_step": 38895, "epoch": 926} {"train_loss": -5.51663064956665, "global_step": 38896, "epoch": 926} {"train_loss": -5.6224846839904785, "global_step": 38897, "epoch": 926} {"train_loss": -5.597538471221924, "global_step": 38898, "epoch": 926} {"train_loss": -5.497313499450684, "global_step": 38899, "epoch": 926} {"train_loss": -5.652865886688232, "global_step": 38900, "epoch": 926} {"train_loss": -5.62972354888916, "global_step": 38901, "epoch": 926} {"train_loss": -5.515542984008789, "global_step": 38902, "epoch": 926} {"train_loss": -5.519366264343262, "global_step": 38903, "epoch": 926} {"train_loss": -5.63462495803833, "global_step": 38904, "epoch": 926} {"train_loss": -5.5824995040893555, "global_step": 38905, "epoch": 926} {"train_loss": -5.536373138427734, "global_step": 38906, "epoch": 926} {"train_loss": -5.592110633850098, "global_step": 38907, "epoch": 926} {"train_loss": -5.678253173828125, "global_step": 38908, "epoch": 926} {"train_loss": -5.585817337036133, "global_step": 38909, "epoch": 926} {"train_loss": -5.627286911010742, "global_step": 38910, "epoch": 926} {"train_loss": -5.671479225158691, "global_step": 38911, "epoch": 926} {"train_loss": -5.681360721588135, "global_step": 38912, "epoch": 926} {"train_loss": -5.56889533996582, "global_step": 38913, "epoch": 926} {"train_loss": -5.629130840301514, "global_step": 38914, "epoch": 926} {"train_loss": -5.720972061157227, "global_step": 38915, "epoch": 926} {"train_loss": -5.650015830993652, "global_step": 38916, "epoch": 926} {"train_loss": -5.611645698547363, "global_step": 38917, "epoch": 926} {"train_loss": -5.668929100036621, "global_step": 38918, "epoch": 926} {"train_loss": -5.638570308685303, "global_step": 38919, "epoch": 926} {"train_loss": -5.653126239776611, "global_step": 38920, "epoch": 926} {"train_loss": -5.697336673736572, "global_step": 38921, "epoch": 926} {"train_loss": -5.635986804962158, "global_step": 38922, "epoch": 926} {"train_loss": -5.563973426818848, "global_step": 38923, "epoch": 926} {"train_loss": -5.483697414398193, "global_step": 38924, "epoch": 926} {"train_loss": -5.740442276000977, "global_step": 38925, "epoch": 926} {"train_loss": -5.567355155944824, "global_step": 38926, "epoch": 926} {"train_loss": -5.685380935668945, "global_step": 38927, "epoch": 926} {"train_loss": -5.712312698364258, "global_step": 38928, "epoch": 926} {"train_loss": -5.517389297485352, "global_step": 38929, "epoch": 926} {"train_loss": -5.596206188201904, "global_step": 38930, "epoch": 926} {"train_loss": -5.697031021118164, "global_step": 38931, "epoch": 926} {"train_loss": -5.655163288116455, "global_step": 38932, "epoch": 926} {"train_loss": -5.621667203449068, "global_step": 38933, "epoch": 926, "val_loss": 65844.1953125} {"train_loss": -5.607174873352051, "global_step": 38934, "epoch": 927} {"train_loss": -5.668135643005371, "global_step": 38935, "epoch": 927} {"train_loss": -5.621009826660156, "global_step": 38936, "epoch": 927} {"train_loss": -5.54036808013916, "global_step": 38937, "epoch": 927} {"train_loss": -5.609832286834717, "global_step": 38938, "epoch": 927} {"train_loss": -5.567183494567871, "global_step": 38939, "epoch": 927} {"train_loss": -5.642692565917969, "global_step": 38940, "epoch": 927} {"train_loss": -5.5837602615356445, "global_step": 38941, "epoch": 927} {"train_loss": -5.540809154510498, "global_step": 38942, "epoch": 927} {"train_loss": -5.584850311279297, "global_step": 38943, "epoch": 927} {"train_loss": -5.730320930480957, "global_step": 38944, "epoch": 927} {"train_loss": -5.6820831298828125, "global_step": 38945, "epoch": 927} {"train_loss": -5.570830821990967, "global_step": 38946, "epoch": 927} {"train_loss": -5.481109619140625, "global_step": 38947, "epoch": 927} {"train_loss": -5.637748718261719, "global_step": 38948, "epoch": 927} {"train_loss": -5.5666913986206055, "global_step": 38949, "epoch": 927} {"train_loss": -5.646063327789307, "global_step": 38950, "epoch": 927} {"train_loss": -5.477944850921631, "global_step": 38951, "epoch": 927} {"train_loss": -5.651404857635498, "global_step": 38952, "epoch": 927} {"train_loss": -5.452014923095703, "global_step": 38953, "epoch": 927} {"train_loss": -5.6312665939331055, "global_step": 38954, "epoch": 927} {"train_loss": -5.595580577850342, "global_step": 38955, "epoch": 927} {"train_loss": -5.70458984375, "global_step": 38956, "epoch": 927} {"train_loss": -5.731534004211426, "global_step": 38957, "epoch": 927} {"train_loss": -5.679351806640625, "global_step": 38958, "epoch": 927} {"train_loss": -5.505388259887695, "global_step": 38959, "epoch": 927} {"train_loss": -5.683351039886475, "global_step": 38960, "epoch": 927} {"train_loss": -5.641921520233154, "global_step": 38961, "epoch": 927} {"train_loss": -5.4656195640563965, "global_step": 38962, "epoch": 927} {"train_loss": -5.665732383728027, "global_step": 38963, "epoch": 927} {"train_loss": -5.596553802490234, "global_step": 38964, "epoch": 927} {"train_loss": -5.491890907287598, "global_step": 38965, "epoch": 927} {"train_loss": -5.64454984664917, "global_step": 38966, "epoch": 927} {"train_loss": -5.56618595123291, "global_step": 38967, "epoch": 927} {"train_loss": -5.596979141235352, "global_step": 38968, "epoch": 927} {"train_loss": -5.7258148193359375, "global_step": 38969, "epoch": 927} {"train_loss": -5.592170715332031, "global_step": 38970, "epoch": 927} {"train_loss": -5.58383846282959, "global_step": 38971, "epoch": 927} {"train_loss": -5.730945110321045, "global_step": 38972, "epoch": 927} {"train_loss": -5.605825424194336, "global_step": 38973, "epoch": 927} {"train_loss": -5.530710697174072, "global_step": 38974, "epoch": 927} {"train_loss": -5.606839566003709, "global_step": 38975, "epoch": 927, "val_loss": 66318.6640625} {"train_loss": -5.547729015350342, "global_step": 38976, "epoch": 928} {"train_loss": -5.6049957275390625, "global_step": 38977, "epoch": 928} {"train_loss": -5.591691493988037, "global_step": 38978, "epoch": 928} {"train_loss": -5.717011451721191, "global_step": 38979, "epoch": 928} {"train_loss": -5.707388877868652, "global_step": 38980, "epoch": 928} {"train_loss": -5.635407447814941, "global_step": 38981, "epoch": 928} {"train_loss": -5.696455001831055, "global_step": 38982, "epoch": 928} {"train_loss": -5.732521057128906, "global_step": 38983, "epoch": 928} {"train_loss": -5.602083206176758, "global_step": 38984, "epoch": 928} {"train_loss": -5.632551193237305, "global_step": 38985, "epoch": 928} {"train_loss": -5.735997200012207, "global_step": 38986, "epoch": 928} {"train_loss": -5.625547409057617, "global_step": 38987, "epoch": 928} {"train_loss": -5.532411575317383, "global_step": 38988, "epoch": 928} {"train_loss": -5.612195014953613, "global_step": 38989, "epoch": 928} {"train_loss": -5.582437038421631, "global_step": 38990, "epoch": 928} {"train_loss": -5.488099575042725, "global_step": 38991, "epoch": 928} {"train_loss": -5.668568134307861, "global_step": 38992, "epoch": 928} {"train_loss": -5.565515518188477, "global_step": 38993, "epoch": 928} {"train_loss": -5.707981109619141, "global_step": 38994, "epoch": 928} {"train_loss": -5.684428691864014, "global_step": 38995, "epoch": 928} {"train_loss": -5.559910774230957, "global_step": 38996, "epoch": 928} {"train_loss": -5.513314247131348, "global_step": 38997, "epoch": 928} {"train_loss": -5.546810150146484, "global_step": 38998, "epoch": 928} {"train_loss": -5.523130416870117, "global_step": 38999, "epoch": 928} {"train_loss": -5.599270343780518, "global_step": 39000, "epoch": 928} {"train_loss": -5.670642375946045, "global_step": 39001, "epoch": 928} {"train_loss": -5.588550090789795, "global_step": 39002, "epoch": 928} {"train_loss": -5.6691789627075195, "global_step": 39003, "epoch": 928} {"train_loss": -5.524068832397461, "global_step": 39004, "epoch": 928} {"train_loss": -5.620030403137207, "global_step": 39005, "epoch": 928} {"train_loss": -5.699393272399902, "global_step": 39006, "epoch": 928} {"train_loss": -5.580263137817383, "global_step": 39007, "epoch": 928} {"train_loss": -5.706789970397949, "global_step": 39008, "epoch": 928} {"train_loss": -5.698483467102051, "global_step": 39009, "epoch": 928} {"train_loss": -5.613568305969238, "global_step": 39010, "epoch": 928} {"train_loss": -5.666144847869873, "global_step": 39011, "epoch": 928} {"train_loss": -5.4722113609313965, "global_step": 39012, "epoch": 928} {"train_loss": -5.460484981536865, "global_step": 39013, "epoch": 928} {"train_loss": -5.633552074432373, "global_step": 39014, "epoch": 928} {"train_loss": -5.795340061187744, "global_step": 39015, "epoch": 928} {"train_loss": -5.637591361999512, "global_step": 39016, "epoch": 928} {"train_loss": -5.618513970147996, "global_step": 39017, "epoch": 928, "val_loss": 66507.8828125} {"train_loss": -5.600441932678223, "global_step": 39018, "epoch": 929} {"train_loss": -5.693636894226074, "global_step": 39019, "epoch": 929} {"train_loss": -5.539763450622559, "global_step": 39020, "epoch": 929} {"train_loss": -5.636545658111572, "global_step": 39021, "epoch": 929} {"train_loss": -5.661371231079102, "global_step": 39022, "epoch": 929} {"train_loss": -5.631379127502441, "global_step": 39023, "epoch": 929} {"train_loss": -5.672186851501465, "global_step": 39024, "epoch": 929} {"train_loss": -5.643163681030273, "global_step": 39025, "epoch": 929} {"train_loss": -5.460764408111572, "global_step": 39026, "epoch": 929} {"train_loss": -5.551527976989746, "global_step": 39027, "epoch": 929} {"train_loss": -5.623740196228027, "global_step": 39028, "epoch": 929} {"train_loss": -5.572147369384766, "global_step": 39029, "epoch": 929} {"train_loss": -5.62359619140625, "global_step": 39030, "epoch": 929} {"train_loss": -5.5288543701171875, "global_step": 39031, "epoch": 929} {"train_loss": -5.503934383392334, "global_step": 39032, "epoch": 929} {"train_loss": -5.532077789306641, "global_step": 39033, "epoch": 929} {"train_loss": -5.573493003845215, "global_step": 39034, "epoch": 929} {"train_loss": -5.617794036865234, "global_step": 39035, "epoch": 929} {"train_loss": -5.454930305480957, "global_step": 39036, "epoch": 929} {"train_loss": -5.566756248474121, "global_step": 39037, "epoch": 929} {"train_loss": -5.694952487945557, "global_step": 39038, "epoch": 929} {"train_loss": -5.580623626708984, "global_step": 39039, "epoch": 929} {"train_loss": -5.671403884887695, "global_step": 39040, "epoch": 929} {"train_loss": -5.429930686950684, "global_step": 39041, "epoch": 929} {"train_loss": -5.5506720542907715, "global_step": 39042, "epoch": 929} {"train_loss": -5.618592262268066, "global_step": 39043, "epoch": 929} {"train_loss": -5.4373860359191895, "global_step": 39044, "epoch": 929} {"train_loss": -5.634336948394775, "global_step": 39045, "epoch": 929} {"train_loss": -5.453499794006348, "global_step": 39046, "epoch": 929} {"train_loss": -5.584958553314209, "global_step": 39047, "epoch": 929} {"train_loss": -5.745589256286621, "global_step": 39048, "epoch": 929} {"train_loss": -5.6890106201171875, "global_step": 39049, "epoch": 929} {"train_loss": -5.558555603027344, "global_step": 39050, "epoch": 929} {"train_loss": -5.544345855712891, "global_step": 39051, "epoch": 929} {"train_loss": -5.620384216308594, "global_step": 39052, "epoch": 929} {"train_loss": -5.6576008796691895, "global_step": 39053, "epoch": 929} {"train_loss": -5.676056385040283, "global_step": 39054, "epoch": 929} {"train_loss": -5.647268772125244, "global_step": 39055, "epoch": 929} {"train_loss": -5.501177787780762, "global_step": 39056, "epoch": 929} {"train_loss": -5.658795356750488, "global_step": 39057, "epoch": 929} {"train_loss": -5.582176685333252, "global_step": 39058, "epoch": 929} {"train_loss": -5.589884156272525, "global_step": 39059, "epoch": 929, "val_loss": 65799.1953125} {"train_loss": -5.773259162902832, "global_step": 39060, "epoch": 930} {"train_loss": -5.603401184082031, "global_step": 39061, "epoch": 930} {"train_loss": -5.547795295715332, "global_step": 39062, "epoch": 930} {"train_loss": -5.61317253112793, "global_step": 39063, "epoch": 930} {"train_loss": -5.624446392059326, "global_step": 39064, "epoch": 930} {"train_loss": -5.6743268966674805, "global_step": 39065, "epoch": 930} {"train_loss": -5.646613121032715, "global_step": 39066, "epoch": 930} {"train_loss": -5.587345123291016, "global_step": 39067, "epoch": 930} {"train_loss": -5.488185405731201, "global_step": 39068, "epoch": 930} {"train_loss": -5.533902645111084, "global_step": 39069, "epoch": 930} {"train_loss": -5.596273422241211, "global_step": 39070, "epoch": 930} {"train_loss": -5.589084625244141, "global_step": 39071, "epoch": 930} {"train_loss": -5.663333415985107, "global_step": 39072, "epoch": 930} {"train_loss": -5.604660511016846, "global_step": 39073, "epoch": 930} {"train_loss": -5.640256404876709, "global_step": 39074, "epoch": 930} {"train_loss": -5.6325836181640625, "global_step": 39075, "epoch": 930} {"train_loss": -5.706160545349121, "global_step": 39076, "epoch": 930} {"train_loss": -5.694669723510742, "global_step": 39077, "epoch": 930} {"train_loss": -5.622714996337891, "global_step": 39078, "epoch": 930} {"train_loss": -5.519504547119141, "global_step": 39079, "epoch": 930} {"train_loss": -5.4861578941345215, "global_step": 39080, "epoch": 930} {"train_loss": -5.557276248931885, "global_step": 39081, "epoch": 930} {"train_loss": -5.683450222015381, "global_step": 39082, "epoch": 930} {"train_loss": -5.646154403686523, "global_step": 39083, "epoch": 930} {"train_loss": -5.643084526062012, "global_step": 39084, "epoch": 930} {"train_loss": -5.714783668518066, "global_step": 39085, "epoch": 930} {"train_loss": -5.613249778747559, "global_step": 39086, "epoch": 930} {"train_loss": -5.725383758544922, "global_step": 39087, "epoch": 930} {"train_loss": -5.77644157409668, "global_step": 39088, "epoch": 930} {"train_loss": -5.7403035163879395, "global_step": 39089, "epoch": 930} {"train_loss": -5.607486724853516, "global_step": 39090, "epoch": 930} {"train_loss": -5.588937759399414, "global_step": 39091, "epoch": 930} {"train_loss": -5.587343215942383, "global_step": 39092, "epoch": 930} {"train_loss": -5.708583831787109, "global_step": 39093, "epoch": 930} {"train_loss": -5.555221080780029, "global_step": 39094, "epoch": 930} {"train_loss": -5.515974044799805, "global_step": 39095, "epoch": 930} {"train_loss": -5.671399116516113, "global_step": 39096, "epoch": 930} {"train_loss": -5.560434818267822, "global_step": 39097, "epoch": 930} {"train_loss": -5.624911785125732, "global_step": 39098, "epoch": 930} {"train_loss": -5.6728901863098145, "global_step": 39099, "epoch": 930} {"train_loss": -5.496433258056641, "global_step": 39100, "epoch": 930} {"train_loss": -5.62170071828933, "global_step": 39101, "epoch": 930, "val_loss": 66149.3046875} {"train_loss": -5.50960636138916, "global_step": 39102, "epoch": 931} {"train_loss": -5.593663692474365, "global_step": 39103, "epoch": 931} {"train_loss": -5.588629722595215, "global_step": 39104, "epoch": 931} {"train_loss": -5.5353102684021, "global_step": 39105, "epoch": 931} {"train_loss": -5.520193576812744, "global_step": 39106, "epoch": 931} {"train_loss": -5.556118011474609, "global_step": 39107, "epoch": 931} {"train_loss": -5.595652103424072, "global_step": 39108, "epoch": 931} {"train_loss": -5.524601936340332, "global_step": 39109, "epoch": 931} {"train_loss": -5.5820841789245605, "global_step": 39110, "epoch": 931} {"train_loss": -5.693935871124268, "global_step": 39111, "epoch": 931} {"train_loss": -5.5213518142700195, "global_step": 39112, "epoch": 931} {"train_loss": -5.673708915710449, "global_step": 39113, "epoch": 931} {"train_loss": -5.608114242553711, "global_step": 39114, "epoch": 931} {"train_loss": -5.621466159820557, "global_step": 39115, "epoch": 931} {"train_loss": -5.693232536315918, "global_step": 39116, "epoch": 931} {"train_loss": -5.642892837524414, "global_step": 39117, "epoch": 931} {"train_loss": -5.588450908660889, "global_step": 39118, "epoch": 931} {"train_loss": -5.593105316162109, "global_step": 39119, "epoch": 931} {"train_loss": -5.541313171386719, "global_step": 39120, "epoch": 931} {"train_loss": -5.668026924133301, "global_step": 39121, "epoch": 931} {"train_loss": -5.545240879058838, "global_step": 39122, "epoch": 931} {"train_loss": -5.56048583984375, "global_step": 39123, "epoch": 931} {"train_loss": -5.604353904724121, "global_step": 39124, "epoch": 931} {"train_loss": -5.633819580078125, "global_step": 39125, "epoch": 931} {"train_loss": -5.4649248123168945, "global_step": 39126, "epoch": 931} {"train_loss": -5.701810836791992, "global_step": 39127, "epoch": 931} {"train_loss": -5.592777729034424, "global_step": 39128, "epoch": 931} {"train_loss": -5.720362663269043, "global_step": 39129, "epoch": 931} {"train_loss": -5.679826259613037, "global_step": 39130, "epoch": 931} {"train_loss": -5.61586332321167, "global_step": 39131, "epoch": 931} {"train_loss": -5.531755447387695, "global_step": 39132, "epoch": 931} {"train_loss": -5.616618633270264, "global_step": 39133, "epoch": 931} {"train_loss": -5.574999809265137, "global_step": 39134, "epoch": 931} {"train_loss": -5.728433132171631, "global_step": 39135, "epoch": 931} {"train_loss": -5.585921764373779, "global_step": 39136, "epoch": 931} {"train_loss": -5.688286781311035, "global_step": 39137, "epoch": 931} {"train_loss": -5.634213924407959, "global_step": 39138, "epoch": 931} {"train_loss": -5.572261810302734, "global_step": 39139, "epoch": 931} {"train_loss": -5.668767929077148, "global_step": 39140, "epoch": 931} {"train_loss": -5.628172874450684, "global_step": 39141, "epoch": 931} {"train_loss": -5.613876819610596, "global_step": 39142, "epoch": 931} {"train_loss": -5.609044313430786, "global_step": 39143, "epoch": 931, "val_loss": 65990.640625} {"train_loss": -5.66536808013916, "global_step": 39144, "epoch": 932} {"train_loss": -5.58934211730957, "global_step": 39145, "epoch": 932} {"train_loss": -5.565400123596191, "global_step": 39146, "epoch": 932} {"train_loss": -5.736973762512207, "global_step": 39147, "epoch": 932} {"train_loss": -5.556020736694336, "global_step": 39148, "epoch": 932} {"train_loss": -5.629611968994141, "global_step": 39149, "epoch": 932} {"train_loss": -5.652084827423096, "global_step": 39150, "epoch": 932} {"train_loss": -5.701125144958496, "global_step": 39151, "epoch": 932} {"train_loss": -5.728618621826172, "global_step": 39152, "epoch": 932} {"train_loss": -5.625186920166016, "global_step": 39153, "epoch": 932} {"train_loss": -5.7017436027526855, "global_step": 39154, "epoch": 932} {"train_loss": -5.6991424560546875, "global_step": 39155, "epoch": 932} {"train_loss": -5.463111877441406, "global_step": 39156, "epoch": 932} {"train_loss": -5.619785785675049, "global_step": 39157, "epoch": 932} {"train_loss": -5.657571315765381, "global_step": 39158, "epoch": 932} {"train_loss": -5.691738128662109, "global_step": 39159, "epoch": 932} {"train_loss": -5.467522621154785, "global_step": 39160, "epoch": 932} {"train_loss": -5.495070934295654, "global_step": 39161, "epoch": 932} {"train_loss": -5.728022575378418, "global_step": 39162, "epoch": 932} {"train_loss": -5.529825210571289, "global_step": 39163, "epoch": 932} {"train_loss": -5.5264105796813965, "global_step": 39164, "epoch": 932} {"train_loss": -5.5714335441589355, "global_step": 39165, "epoch": 932} {"train_loss": -5.5743255615234375, "global_step": 39166, "epoch": 932} {"train_loss": -5.598526954650879, "global_step": 39167, "epoch": 932} {"train_loss": -5.600038051605225, "global_step": 39168, "epoch": 932} {"train_loss": -5.657215595245361, "global_step": 39169, "epoch": 932} {"train_loss": -5.694705963134766, "global_step": 39170, "epoch": 932} {"train_loss": -5.448125839233398, "global_step": 39171, "epoch": 932} {"train_loss": -5.562821865081787, "global_step": 39172, "epoch": 932} {"train_loss": -5.730949401855469, "global_step": 39173, "epoch": 932} {"train_loss": -5.652786731719971, "global_step": 39174, "epoch": 932} {"train_loss": -5.648400783538818, "global_step": 39175, "epoch": 932} {"train_loss": -5.659660816192627, "global_step": 39176, "epoch": 932} {"train_loss": -5.577345371246338, "global_step": 39177, "epoch": 932} {"train_loss": -5.531683921813965, "global_step": 39178, "epoch": 932} {"train_loss": -5.560357570648193, "global_step": 39179, "epoch": 932} {"train_loss": -5.603948593139648, "global_step": 39180, "epoch": 932} {"train_loss": -5.643742561340332, "global_step": 39181, "epoch": 932} {"train_loss": -5.6367082595825195, "global_step": 39182, "epoch": 932} {"train_loss": -5.770304203033447, "global_step": 39183, "epoch": 932} {"train_loss": -5.61068058013916, "global_step": 39184, "epoch": 932} {"train_loss": -5.615549587068104, "global_step": 39185, "epoch": 932, "val_loss": 66289.4140625} {"train_loss": -5.634371757507324, "global_step": 39186, "epoch": 933} {"train_loss": -5.518364429473877, "global_step": 39187, "epoch": 933} {"train_loss": -5.656332015991211, "global_step": 39188, "epoch": 933} {"train_loss": -5.56804895401001, "global_step": 39189, "epoch": 933} {"train_loss": -5.539920806884766, "global_step": 39190, "epoch": 933} {"train_loss": -5.534402847290039, "global_step": 39191, "epoch": 933} {"train_loss": -5.734947681427002, "global_step": 39192, "epoch": 933} {"train_loss": -5.541377067565918, "global_step": 39193, "epoch": 933} {"train_loss": -5.548452377319336, "global_step": 39194, "epoch": 933} {"train_loss": -5.730532169342041, "global_step": 39195, "epoch": 933} {"train_loss": -5.594442367553711, "global_step": 39196, "epoch": 933} {"train_loss": -5.544456481933594, "global_step": 39197, "epoch": 933} {"train_loss": -5.54144811630249, "global_step": 39198, "epoch": 933} {"train_loss": -5.625449180603027, "global_step": 39199, "epoch": 933} {"train_loss": -5.523468017578125, "global_step": 39200, "epoch": 933} {"train_loss": -5.626460075378418, "global_step": 39201, "epoch": 933} {"train_loss": -5.531098365783691, "global_step": 39202, "epoch": 933} {"train_loss": -5.670132637023926, "global_step": 39203, "epoch": 933} {"train_loss": -5.538525581359863, "global_step": 39204, "epoch": 933} {"train_loss": -5.623112678527832, "global_step": 39205, "epoch": 933} {"train_loss": -5.747490406036377, "global_step": 39206, "epoch": 933} {"train_loss": -5.636318683624268, "global_step": 39207, "epoch": 933} {"train_loss": -5.643877983093262, "global_step": 39208, "epoch": 933} {"train_loss": -5.630125999450684, "global_step": 39209, "epoch": 933} {"train_loss": -5.578415870666504, "global_step": 39210, "epoch": 933} {"train_loss": -5.641776084899902, "global_step": 39211, "epoch": 933} {"train_loss": -5.68021297454834, "global_step": 39212, "epoch": 933} {"train_loss": -5.560548305511475, "global_step": 39213, "epoch": 933} {"train_loss": -5.482959747314453, "global_step": 39214, "epoch": 933} {"train_loss": -5.624804496765137, "global_step": 39215, "epoch": 933} {"train_loss": -5.491592884063721, "global_step": 39216, "epoch": 933} {"train_loss": -5.592442512512207, "global_step": 39217, "epoch": 933} {"train_loss": -5.693878173828125, "global_step": 39218, "epoch": 933} {"train_loss": -5.5743536949157715, "global_step": 39219, "epoch": 933} {"train_loss": -5.601762294769287, "global_step": 39220, "epoch": 933} {"train_loss": -5.585596084594727, "global_step": 39221, "epoch": 933} {"train_loss": -5.637173652648926, "global_step": 39222, "epoch": 933} {"train_loss": -5.6465277671813965, "global_step": 39223, "epoch": 933} {"train_loss": -5.508292198181152, "global_step": 39224, "epoch": 933} {"train_loss": -5.413037300109863, "global_step": 39225, "epoch": 933} {"train_loss": -5.610304832458496, "global_step": 39226, "epoch": 933} {"train_loss": -5.59270361491612, "global_step": 39227, "epoch": 933, "val_loss": 66461.7578125} {"train_loss": -5.618123531341553, "global_step": 39228, "epoch": 934} {"train_loss": -5.620810031890869, "global_step": 39229, "epoch": 934} {"train_loss": -5.624794960021973, "global_step": 39230, "epoch": 934} {"train_loss": -5.607593536376953, "global_step": 39231, "epoch": 934} {"train_loss": -5.545319080352783, "global_step": 39232, "epoch": 934} {"train_loss": -5.6076273918151855, "global_step": 39233, "epoch": 934} {"train_loss": -5.648008346557617, "global_step": 39234, "epoch": 934} {"train_loss": -5.5822858810424805, "global_step": 39235, "epoch": 934} {"train_loss": -5.654606342315674, "global_step": 39236, "epoch": 934} {"train_loss": -5.547061920166016, "global_step": 39237, "epoch": 934} {"train_loss": -5.5371503829956055, "global_step": 39238, "epoch": 934} {"train_loss": -5.72458028793335, "global_step": 39239, "epoch": 934} {"train_loss": -5.433206081390381, "global_step": 39240, "epoch": 934} {"train_loss": -5.69488525390625, "global_step": 39241, "epoch": 934} {"train_loss": -5.570739269256592, "global_step": 39242, "epoch": 934} {"train_loss": -5.58869743347168, "global_step": 39243, "epoch": 934} {"train_loss": -5.615949630737305, "global_step": 39244, "epoch": 934} {"train_loss": -5.654450416564941, "global_step": 39245, "epoch": 934} {"train_loss": -5.4282402992248535, "global_step": 39246, "epoch": 934} {"train_loss": -5.5645751953125, "global_step": 39247, "epoch": 934} {"train_loss": -5.555865287780762, "global_step": 39248, "epoch": 934} {"train_loss": -5.497926712036133, "global_step": 39249, "epoch": 934} {"train_loss": -5.563042163848877, "global_step": 39250, "epoch": 934} {"train_loss": -5.774946212768555, "global_step": 39251, "epoch": 934} {"train_loss": -5.629975318908691, "global_step": 39252, "epoch": 934} {"train_loss": -5.6558990478515625, "global_step": 39253, "epoch": 934} {"train_loss": -5.575031280517578, "global_step": 39254, "epoch": 934} {"train_loss": -5.543551445007324, "global_step": 39255, "epoch": 934} {"train_loss": -5.617149353027344, "global_step": 39256, "epoch": 934} {"train_loss": -5.6139726638793945, "global_step": 39257, "epoch": 934} {"train_loss": -5.609551429748535, "global_step": 39258, "epoch": 934} {"train_loss": -5.7423553466796875, "global_step": 39259, "epoch": 934} {"train_loss": -5.609882354736328, "global_step": 39260, "epoch": 934} {"train_loss": -5.675259590148926, "global_step": 39261, "epoch": 934} {"train_loss": -5.548446178436279, "global_step": 39262, "epoch": 934} {"train_loss": -5.492659568786621, "global_step": 39263, "epoch": 934} {"train_loss": -5.6503753662109375, "global_step": 39264, "epoch": 934} {"train_loss": -5.673966884613037, "global_step": 39265, "epoch": 934} {"train_loss": -5.583992004394531, "global_step": 39266, "epoch": 934} {"train_loss": -5.520684719085693, "global_step": 39267, "epoch": 934} {"train_loss": -5.506958961486816, "global_step": 39268, "epoch": 934} {"train_loss": -5.599467493238903, "global_step": 39269, "epoch": 934, "val_loss": 66433.859375} {"train_loss": -5.529738426208496, "global_step": 39270, "epoch": 935} {"train_loss": -5.684233665466309, "global_step": 39271, "epoch": 935} {"train_loss": -5.491904258728027, "global_step": 39272, "epoch": 935} {"train_loss": -5.6042585372924805, "global_step": 39273, "epoch": 935} {"train_loss": -5.549004554748535, "global_step": 39274, "epoch": 935} {"train_loss": -5.586426258087158, "global_step": 39275, "epoch": 935} {"train_loss": -5.596278190612793, "global_step": 39276, "epoch": 935} {"train_loss": -5.506686210632324, "global_step": 39277, "epoch": 935} {"train_loss": -5.651500701904297, "global_step": 39278, "epoch": 935} {"train_loss": -5.6186113357543945, "global_step": 39279, "epoch": 935} {"train_loss": -5.46270751953125, "global_step": 39280, "epoch": 935} {"train_loss": -5.5627946853637695, "global_step": 39281, "epoch": 935} {"train_loss": -5.523443222045898, "global_step": 39282, "epoch": 935} {"train_loss": -5.689444065093994, "global_step": 39283, "epoch": 935} {"train_loss": -5.58341121673584, "global_step": 39284, "epoch": 935} {"train_loss": -5.560056686401367, "global_step": 39285, "epoch": 935} {"train_loss": -5.469089508056641, "global_step": 39286, "epoch": 935} {"train_loss": -5.526547431945801, "global_step": 39287, "epoch": 935} {"train_loss": -5.5944294929504395, "global_step": 39288, "epoch": 935} {"train_loss": -5.554605484008789, "global_step": 39289, "epoch": 935} {"train_loss": -5.65351676940918, "global_step": 39290, "epoch": 935} {"train_loss": -5.535857200622559, "global_step": 39291, "epoch": 935} {"train_loss": -5.563870429992676, "global_step": 39292, "epoch": 935} {"train_loss": -5.818760871887207, "global_step": 39293, "epoch": 935} {"train_loss": -5.585574626922607, "global_step": 39294, "epoch": 935} {"train_loss": -5.516115188598633, "global_step": 39295, "epoch": 935} {"train_loss": -5.621190547943115, "global_step": 39296, "epoch": 935} {"train_loss": -5.568136692047119, "global_step": 39297, "epoch": 935} {"train_loss": -5.511997222900391, "global_step": 39298, "epoch": 935} {"train_loss": -5.655074119567871, "global_step": 39299, "epoch": 935} {"train_loss": -5.522136688232422, "global_step": 39300, "epoch": 935} {"train_loss": -5.579171180725098, "global_step": 39301, "epoch": 935} {"train_loss": -5.5943922996521, "global_step": 39302, "epoch": 935} {"train_loss": -5.580914497375488, "global_step": 39303, "epoch": 935} {"train_loss": -5.659856796264648, "global_step": 39304, "epoch": 935} {"train_loss": -5.4846954345703125, "global_step": 39305, "epoch": 935} {"train_loss": -5.559455394744873, "global_step": 39306, "epoch": 935} {"train_loss": -5.651477813720703, "global_step": 39307, "epoch": 935} {"train_loss": -5.61518669128418, "global_step": 39308, "epoch": 935} {"train_loss": -5.672150611877441, "global_step": 39309, "epoch": 935} {"train_loss": -5.726085662841797, "global_step": 39310, "epoch": 935} {"train_loss": -5.583744457789829, "global_step": 39311, "epoch": 935, "val_loss": 66176.109375} {"train_loss": -5.719479560852051, "global_step": 39312, "epoch": 936} {"train_loss": -5.724571704864502, "global_step": 39313, "epoch": 936} {"train_loss": -5.704875946044922, "global_step": 39314, "epoch": 936} {"train_loss": -5.623053550720215, "global_step": 39315, "epoch": 936} {"train_loss": -5.689349174499512, "global_step": 39316, "epoch": 936} {"train_loss": -5.670401573181152, "global_step": 39317, "epoch": 936} {"train_loss": -5.5881218910217285, "global_step": 39318, "epoch": 936} {"train_loss": -5.602936744689941, "global_step": 39319, "epoch": 936} {"train_loss": -5.534174919128418, "global_step": 39320, "epoch": 936} {"train_loss": -5.657613754272461, "global_step": 39321, "epoch": 936} {"train_loss": -5.574926376342773, "global_step": 39322, "epoch": 936} {"train_loss": -5.564843654632568, "global_step": 39323, "epoch": 936} {"train_loss": -5.630748748779297, "global_step": 39324, "epoch": 936} {"train_loss": -5.6135149002075195, "global_step": 39325, "epoch": 936} {"train_loss": -5.598859786987305, "global_step": 39326, "epoch": 936} {"train_loss": -5.746713638305664, "global_step": 39327, "epoch": 936} {"train_loss": -5.768797874450684, "global_step": 39328, "epoch": 936} {"train_loss": -5.596421241760254, "global_step": 39329, "epoch": 936} {"train_loss": -5.634634017944336, "global_step": 39330, "epoch": 936} {"train_loss": -5.589752674102783, "global_step": 39331, "epoch": 936} {"train_loss": -5.539343357086182, "global_step": 39332, "epoch": 936} {"train_loss": -5.6690826416015625, "global_step": 39333, "epoch": 936} {"train_loss": -5.607155799865723, "global_step": 39334, "epoch": 936} {"train_loss": -5.608916759490967, "global_step": 39335, "epoch": 936} {"train_loss": -5.589860916137695, "global_step": 39336, "epoch": 936} {"train_loss": -5.620546340942383, "global_step": 39337, "epoch": 936} {"train_loss": -5.593202114105225, "global_step": 39338, "epoch": 936} {"train_loss": -5.787378311157227, "global_step": 39339, "epoch": 936} {"train_loss": -5.4435577392578125, "global_step": 39340, "epoch": 936} {"train_loss": -5.610905170440674, "global_step": 39341, "epoch": 936} {"train_loss": -5.576553821563721, "global_step": 39342, "epoch": 936} {"train_loss": -5.680242538452148, "global_step": 39343, "epoch": 936} {"train_loss": -5.619978904724121, "global_step": 39344, "epoch": 936} {"train_loss": -5.531466484069824, "global_step": 39345, "epoch": 936} {"train_loss": -5.50377893447876, "global_step": 39346, "epoch": 936} {"train_loss": -5.4893903732299805, "global_step": 39347, "epoch": 936} {"train_loss": -5.563365936279297, "global_step": 39348, "epoch": 936} {"train_loss": -5.566315650939941, "global_step": 39349, "epoch": 936} {"train_loss": -5.6242899894714355, "global_step": 39350, "epoch": 936} {"train_loss": -5.516716003417969, "global_step": 39351, "epoch": 936} {"train_loss": -5.64556884765625, "global_step": 39352, "epoch": 936} {"train_loss": -5.615106026331584, "global_step": 39353, "epoch": 936, "val_loss": 66064.21875} {"train_loss": -5.548945426940918, "global_step": 39354, "epoch": 937} {"train_loss": -5.6797895431518555, "global_step": 39355, "epoch": 937} {"train_loss": -5.620954513549805, "global_step": 39356, "epoch": 937} {"train_loss": -5.655907154083252, "global_step": 39357, "epoch": 937} {"train_loss": -5.621865272521973, "global_step": 39358, "epoch": 937} {"train_loss": -5.651508808135986, "global_step": 39359, "epoch": 937} {"train_loss": -5.730181694030762, "global_step": 39360, "epoch": 937} {"train_loss": -5.714198112487793, "global_step": 39361, "epoch": 937} {"train_loss": -5.6745924949646, "global_step": 39362, "epoch": 937} {"train_loss": -5.573980331420898, "global_step": 39363, "epoch": 937} {"train_loss": -5.70695161819458, "global_step": 39364, "epoch": 937} {"train_loss": -5.537277698516846, "global_step": 39365, "epoch": 937} {"train_loss": -5.613585948944092, "global_step": 39366, "epoch": 937} {"train_loss": -5.69843864440918, "global_step": 39367, "epoch": 937} {"train_loss": -5.587389945983887, "global_step": 39368, "epoch": 937} {"train_loss": -5.570357322692871, "global_step": 39369, "epoch": 937} {"train_loss": -5.633667945861816, "global_step": 39370, "epoch": 937} {"train_loss": -5.58416748046875, "global_step": 39371, "epoch": 937} {"train_loss": -5.740032196044922, "global_step": 39372, "epoch": 937} {"train_loss": -5.60205078125, "global_step": 39373, "epoch": 937} {"train_loss": -5.643381595611572, "global_step": 39374, "epoch": 937} {"train_loss": -5.728569030761719, "global_step": 39375, "epoch": 937} {"train_loss": -5.646664619445801, "global_step": 39376, "epoch": 937} {"train_loss": -5.545168876647949, "global_step": 39377, "epoch": 937} {"train_loss": -5.6568145751953125, "global_step": 39378, "epoch": 937} {"train_loss": -5.630121231079102, "global_step": 39379, "epoch": 937} {"train_loss": -5.481209754943848, "global_step": 39380, "epoch": 937} {"train_loss": -5.5595622062683105, "global_step": 39381, "epoch": 937} {"train_loss": -5.597785949707031, "global_step": 39382, "epoch": 937} {"train_loss": -5.586105823516846, "global_step": 39383, "epoch": 937} {"train_loss": -5.5559492111206055, "global_step": 39384, "epoch": 937} {"train_loss": -5.406211853027344, "global_step": 39385, "epoch": 937} {"train_loss": -5.641749382019043, "global_step": 39386, "epoch": 937} {"train_loss": -5.429605484008789, "global_step": 39387, "epoch": 937} {"train_loss": -5.431729316711426, "global_step": 39388, "epoch": 937} {"train_loss": -5.455996036529541, "global_step": 39389, "epoch": 937} {"train_loss": -5.570313930511475, "global_step": 39390, "epoch": 937} {"train_loss": -5.719099044799805, "global_step": 39391, "epoch": 937} {"train_loss": -5.419994354248047, "global_step": 39392, "epoch": 937} {"train_loss": -5.594794273376465, "global_step": 39393, "epoch": 937} {"train_loss": -5.485637664794922, "global_step": 39394, "epoch": 937} {"train_loss": -5.598492156891596, "global_step": 39395, "epoch": 937, "val_loss": 66371.609375} {"train_loss": -5.499703407287598, "global_step": 39396, "epoch": 938} {"train_loss": -5.595159530639648, "global_step": 39397, "epoch": 938} {"train_loss": -5.598859786987305, "global_step": 39398, "epoch": 938} {"train_loss": -5.656224250793457, "global_step": 39399, "epoch": 938} {"train_loss": -5.546772003173828, "global_step": 39400, "epoch": 938} {"train_loss": -5.603629112243652, "global_step": 39401, "epoch": 938} {"train_loss": -5.70740270614624, "global_step": 39402, "epoch": 938} {"train_loss": -5.671087741851807, "global_step": 39403, "epoch": 938} {"train_loss": -5.681768417358398, "global_step": 39404, "epoch": 938} {"train_loss": -5.538795471191406, "global_step": 39405, "epoch": 938} {"train_loss": -5.739463806152344, "global_step": 39406, "epoch": 938} {"train_loss": -5.449559211730957, "global_step": 39407, "epoch": 938} {"train_loss": -5.569318771362305, "global_step": 39408, "epoch": 938} {"train_loss": -5.800166130065918, "global_step": 39409, "epoch": 938} {"train_loss": -5.54528284072876, "global_step": 39410, "epoch": 938} {"train_loss": -5.545158386230469, "global_step": 39411, "epoch": 938} {"train_loss": -5.649799346923828, "global_step": 39412, "epoch": 938} {"train_loss": -5.6750664710998535, "global_step": 39413, "epoch": 938} {"train_loss": -5.592371940612793, "global_step": 39414, "epoch": 938} {"train_loss": -5.56232213973999, "global_step": 39415, "epoch": 938} {"train_loss": -5.470345973968506, "global_step": 39416, "epoch": 938} {"train_loss": -5.614784240722656, "global_step": 39417, "epoch": 938} {"train_loss": -5.667242527008057, "global_step": 39418, "epoch": 938} {"train_loss": -5.5961995124816895, "global_step": 39419, "epoch": 938} {"train_loss": -5.636045455932617, "global_step": 39420, "epoch": 938} {"train_loss": -5.612377643585205, "global_step": 39421, "epoch": 938} {"train_loss": -5.706356048583984, "global_step": 39422, "epoch": 938} {"train_loss": -5.519580364227295, "global_step": 39423, "epoch": 938} {"train_loss": -5.560583591461182, "global_step": 39424, "epoch": 938} {"train_loss": -5.656798362731934, "global_step": 39425, "epoch": 938} {"train_loss": -5.575493812561035, "global_step": 39426, "epoch": 938} {"train_loss": -5.71541690826416, "global_step": 39427, "epoch": 938} {"train_loss": -5.704962730407715, "global_step": 39428, "epoch": 938} {"train_loss": -5.484201431274414, "global_step": 39429, "epoch": 938} {"train_loss": -5.666252613067627, "global_step": 39430, "epoch": 938} {"train_loss": -5.570530891418457, "global_step": 39431, "epoch": 938} {"train_loss": -5.6720685958862305, "global_step": 39432, "epoch": 938} {"train_loss": -5.594295501708984, "global_step": 39433, "epoch": 938} {"train_loss": -5.749070167541504, "global_step": 39434, "epoch": 938} {"train_loss": -5.668089389801025, "global_step": 39435, "epoch": 938} {"train_loss": -5.479488372802734, "global_step": 39436, "epoch": 938} {"train_loss": -5.614162728900001, "global_step": 39437, "epoch": 938, "val_loss": 66044.3359375} {"train_loss": -5.727888107299805, "global_step": 39438, "epoch": 939} {"train_loss": -5.670145034790039, "global_step": 39439, "epoch": 939} {"train_loss": -5.632709503173828, "global_step": 39440, "epoch": 939} {"train_loss": -5.6347551345825195, "global_step": 39441, "epoch": 939} {"train_loss": -5.573486328125, "global_step": 39442, "epoch": 939} {"train_loss": -5.619007110595703, "global_step": 39443, "epoch": 939} {"train_loss": -5.5468363761901855, "global_step": 39444, "epoch": 939} {"train_loss": -5.615179061889648, "global_step": 39445, "epoch": 939} {"train_loss": -5.670840740203857, "global_step": 39446, "epoch": 939} {"train_loss": -5.608837127685547, "global_step": 39447, "epoch": 939} {"train_loss": -5.642168045043945, "global_step": 39448, "epoch": 939} {"train_loss": -5.576594829559326, "global_step": 39449, "epoch": 939} {"train_loss": -5.555029392242432, "global_step": 39450, "epoch": 939} {"train_loss": -5.641334533691406, "global_step": 39451, "epoch": 939} {"train_loss": -5.6498517990112305, "global_step": 39452, "epoch": 939} {"train_loss": -5.710999011993408, "global_step": 39453, "epoch": 939} {"train_loss": -5.672928333282471, "global_step": 39454, "epoch": 939} {"train_loss": -5.624027252197266, "global_step": 39455, "epoch": 939} {"train_loss": -5.631427764892578, "global_step": 39456, "epoch": 939} {"train_loss": -5.704051971435547, "global_step": 39457, "epoch": 939} {"train_loss": -5.619336128234863, "global_step": 39458, "epoch": 939} {"train_loss": -5.516724586486816, "global_step": 39459, "epoch": 939} {"train_loss": -5.584320068359375, "global_step": 39460, "epoch": 939} {"train_loss": -5.530897617340088, "global_step": 39461, "epoch": 939} {"train_loss": -5.674941062927246, "global_step": 39462, "epoch": 939} {"train_loss": -5.7052717208862305, "global_step": 39463, "epoch": 939} {"train_loss": -5.426307201385498, "global_step": 39464, "epoch": 939} {"train_loss": -5.5416107177734375, "global_step": 39465, "epoch": 939} {"train_loss": -5.580906867980957, "global_step": 39466, "epoch": 939} {"train_loss": -5.647968292236328, "global_step": 39467, "epoch": 939} {"train_loss": -5.506563663482666, "global_step": 39468, "epoch": 939} {"train_loss": -5.6156816482543945, "global_step": 39469, "epoch": 939} {"train_loss": -5.414933204650879, "global_step": 39470, "epoch": 939} {"train_loss": -5.527924537658691, "global_step": 39471, "epoch": 939} {"train_loss": -5.638363361358643, "global_step": 39472, "epoch": 939} {"train_loss": -5.493170738220215, "global_step": 39473, "epoch": 939} {"train_loss": -5.441347122192383, "global_step": 39474, "epoch": 939} {"train_loss": -5.523429870605469, "global_step": 39475, "epoch": 939} {"train_loss": -5.6067728996276855, "global_step": 39476, "epoch": 939} {"train_loss": -5.583792686462402, "global_step": 39477, "epoch": 939} {"train_loss": -5.651111602783203, "global_step": 39478, "epoch": 939} {"train_loss": -5.5982521488553, "global_step": 39479, "epoch": 939, "val_loss": 66263.0078125} {"train_loss": -5.533929347991943, "global_step": 39480, "epoch": 940} {"train_loss": -5.578094959259033, "global_step": 39481, "epoch": 940} {"train_loss": -5.514758586883545, "global_step": 39482, "epoch": 940} {"train_loss": -5.610109329223633, "global_step": 39483, "epoch": 940} {"train_loss": -5.485548973083496, "global_step": 39484, "epoch": 940} {"train_loss": -5.522353172302246, "global_step": 39485, "epoch": 940} {"train_loss": -5.558286666870117, "global_step": 39486, "epoch": 940} {"train_loss": -5.524188041687012, "global_step": 39487, "epoch": 940} {"train_loss": -5.579570770263672, "global_step": 39488, "epoch": 940} {"train_loss": -5.492047309875488, "global_step": 39489, "epoch": 940} {"train_loss": -5.7502593994140625, "global_step": 39490, "epoch": 940} {"train_loss": -5.5824294090271, "global_step": 39491, "epoch": 940} {"train_loss": -5.614453315734863, "global_step": 39492, "epoch": 940} {"train_loss": -5.604841232299805, "global_step": 39493, "epoch": 940} {"train_loss": -5.578184127807617, "global_step": 39494, "epoch": 940} {"train_loss": -5.654020309448242, "global_step": 39495, "epoch": 940} {"train_loss": -5.64122200012207, "global_step": 39496, "epoch": 940} {"train_loss": -5.59744930267334, "global_step": 39497, "epoch": 940} {"train_loss": -5.631403923034668, "global_step": 39498, "epoch": 940} {"train_loss": -5.5532755851745605, "global_step": 39499, "epoch": 940} {"train_loss": -5.620410919189453, "global_step": 39500, "epoch": 940} {"train_loss": -5.663643836975098, "global_step": 39501, "epoch": 940} {"train_loss": -5.632262706756592, "global_step": 39502, "epoch": 940} {"train_loss": -5.6509809494018555, "global_step": 39503, "epoch": 940} {"train_loss": -5.69644832611084, "global_step": 39504, "epoch": 940} {"train_loss": -5.719869613647461, "global_step": 39505, "epoch": 940} {"train_loss": -5.635420322418213, "global_step": 39506, "epoch": 940} {"train_loss": -5.696340084075928, "global_step": 39507, "epoch": 940} {"train_loss": -5.508321762084961, "global_step": 39508, "epoch": 940} {"train_loss": -5.6270976066589355, "global_step": 39509, "epoch": 940} {"train_loss": -5.646285057067871, "global_step": 39510, "epoch": 940} {"train_loss": -5.646130561828613, "global_step": 39511, "epoch": 940} {"train_loss": -5.656347274780273, "global_step": 39512, "epoch": 940} {"train_loss": -5.628633499145508, "global_step": 39513, "epoch": 940} {"train_loss": -5.609078884124756, "global_step": 39514, "epoch": 940} {"train_loss": -5.716604232788086, "global_step": 39515, "epoch": 940} {"train_loss": -5.614747524261475, "global_step": 39516, "epoch": 940} {"train_loss": -5.575998306274414, "global_step": 39517, "epoch": 940} {"train_loss": -5.595058441162109, "global_step": 39518, "epoch": 940} {"train_loss": -5.4533162117004395, "global_step": 39519, "epoch": 940} {"train_loss": -5.659005165100098, "global_step": 39520, "epoch": 940} {"train_loss": -5.60872068859282, "global_step": 39521, "epoch": 940, "val_loss": 66102.140625} {"train_loss": -5.696645259857178, "global_step": 39522, "epoch": 941} {"train_loss": -5.532309532165527, "global_step": 39523, "epoch": 941} {"train_loss": -5.62548828125, "global_step": 39524, "epoch": 941} {"train_loss": -5.656397819519043, "global_step": 39525, "epoch": 941} {"train_loss": -5.510822772979736, "global_step": 39526, "epoch": 941} {"train_loss": -5.6074604988098145, "global_step": 39527, "epoch": 941} {"train_loss": -5.754087448120117, "global_step": 39528, "epoch": 941} {"train_loss": -5.543662071228027, "global_step": 39529, "epoch": 941} {"train_loss": -5.521007537841797, "global_step": 39530, "epoch": 941} {"train_loss": -5.783504486083984, "global_step": 39531, "epoch": 941} {"train_loss": -5.559761047363281, "global_step": 39532, "epoch": 941} {"train_loss": -5.561565399169922, "global_step": 39533, "epoch": 941} {"train_loss": -5.719696998596191, "global_step": 39534, "epoch": 941} {"train_loss": -5.576231002807617, "global_step": 39535, "epoch": 941} {"train_loss": -5.556362152099609, "global_step": 39536, "epoch": 941} {"train_loss": -5.624507904052734, "global_step": 39537, "epoch": 941} {"train_loss": -5.50852108001709, "global_step": 39538, "epoch": 941} {"train_loss": -5.546483039855957, "global_step": 39539, "epoch": 941} {"train_loss": -5.547817707061768, "global_step": 39540, "epoch": 941} {"train_loss": -5.523653030395508, "global_step": 39541, "epoch": 941} {"train_loss": -5.662362098693848, "global_step": 39542, "epoch": 941} {"train_loss": -5.6446428298950195, "global_step": 39543, "epoch": 941} {"train_loss": -5.600114822387695, "global_step": 39544, "epoch": 941} {"train_loss": -5.562651634216309, "global_step": 39545, "epoch": 941} {"train_loss": -5.615983963012695, "global_step": 39546, "epoch": 941} {"train_loss": -5.574938774108887, "global_step": 39547, "epoch": 941} {"train_loss": -5.708093643188477, "global_step": 39548, "epoch": 941} {"train_loss": -5.542391300201416, "global_step": 39549, "epoch": 941} {"train_loss": -5.648319244384766, "global_step": 39550, "epoch": 941} {"train_loss": -5.558166027069092, "global_step": 39551, "epoch": 941} {"train_loss": -5.53731107711792, "global_step": 39552, "epoch": 941} {"train_loss": -5.614989757537842, "global_step": 39553, "epoch": 941} {"train_loss": -5.642230033874512, "global_step": 39554, "epoch": 941} {"train_loss": -5.603611469268799, "global_step": 39555, "epoch": 941} {"train_loss": -5.689301490783691, "global_step": 39556, "epoch": 941} {"train_loss": -5.629483222961426, "global_step": 39557, "epoch": 941} {"train_loss": -5.614466190338135, "global_step": 39558, "epoch": 941} {"train_loss": -5.620185852050781, "global_step": 39559, "epoch": 941} {"train_loss": -5.686850547790527, "global_step": 39560, "epoch": 941} {"train_loss": -5.583835124969482, "global_step": 39561, "epoch": 941} {"train_loss": -5.612475395202637, "global_step": 39562, "epoch": 941} {"train_loss": -5.609158459163847, "global_step": 39563, "epoch": 941, "val_loss": 66057.5078125} {"train_loss": -5.734071731567383, "global_step": 39564, "epoch": 942} {"train_loss": -5.701181888580322, "global_step": 39565, "epoch": 942} {"train_loss": -5.550650596618652, "global_step": 39566, "epoch": 942} {"train_loss": -5.633492946624756, "global_step": 39567, "epoch": 942} {"train_loss": -5.65018892288208, "global_step": 39568, "epoch": 942} {"train_loss": -5.703228950500488, "global_step": 39569, "epoch": 942} {"train_loss": -5.603920936584473, "global_step": 39570, "epoch": 942} {"train_loss": -5.599942207336426, "global_step": 39571, "epoch": 942} {"train_loss": -5.571610450744629, "global_step": 39572, "epoch": 942} {"train_loss": -5.61544132232666, "global_step": 39573, "epoch": 942} {"train_loss": -5.658946514129639, "global_step": 39574, "epoch": 942} {"train_loss": -5.6107611656188965, "global_step": 39575, "epoch": 942} {"train_loss": -5.494297981262207, "global_step": 39576, "epoch": 942} {"train_loss": -5.630328178405762, "global_step": 39577, "epoch": 942} {"train_loss": -5.718260288238525, "global_step": 39578, "epoch": 942} {"train_loss": -5.414281845092773, "global_step": 39579, "epoch": 942} {"train_loss": -5.453641891479492, "global_step": 39580, "epoch": 942} {"train_loss": -5.7201738357543945, "global_step": 39581, "epoch": 942} {"train_loss": -5.579310417175293, "global_step": 39582, "epoch": 942} {"train_loss": -5.658339023590088, "global_step": 39583, "epoch": 942} {"train_loss": -5.587107181549072, "global_step": 39584, "epoch": 942} {"train_loss": -5.584115982055664, "global_step": 39585, "epoch": 942} {"train_loss": -5.637080192565918, "global_step": 39586, "epoch": 942} {"train_loss": -5.667472839355469, "global_step": 39587, "epoch": 942} {"train_loss": -5.624886512756348, "global_step": 39588, "epoch": 942} {"train_loss": -5.728018760681152, "global_step": 39589, "epoch": 942} {"train_loss": -5.732560634613037, "global_step": 39590, "epoch": 942} {"train_loss": -5.8010663986206055, "global_step": 39591, "epoch": 942} {"train_loss": -5.6604509353637695, "global_step": 39592, "epoch": 942} {"train_loss": -5.673888683319092, "global_step": 39593, "epoch": 942} {"train_loss": -5.53078556060791, "global_step": 39594, "epoch": 942} {"train_loss": -5.70414924621582, "global_step": 39595, "epoch": 942} {"train_loss": -5.587529182434082, "global_step": 39596, "epoch": 942} {"train_loss": -5.585729598999023, "global_step": 39597, "epoch": 942} {"train_loss": -5.57688045501709, "global_step": 39598, "epoch": 942} {"train_loss": -5.635853290557861, "global_step": 39599, "epoch": 942} {"train_loss": -5.601017475128174, "global_step": 39600, "epoch": 942} {"train_loss": -5.68365478515625, "global_step": 39601, "epoch": 942} {"train_loss": -5.635828971862793, "global_step": 39602, "epoch": 942} {"train_loss": -5.49289083480835, "global_step": 39603, "epoch": 942} {"train_loss": -5.656639099121094, "global_step": 39604, "epoch": 942} {"train_loss": -5.629564126332601, "global_step": 39605, "epoch": 942, "val_loss": 66065.640625} {"train_loss": -5.687376976013184, "global_step": 39606, "epoch": 943} {"train_loss": -5.554102897644043, "global_step": 39607, "epoch": 943} {"train_loss": -5.764176368713379, "global_step": 39608, "epoch": 943} {"train_loss": -5.54901123046875, "global_step": 39609, "epoch": 943} {"train_loss": -5.718424320220947, "global_step": 39610, "epoch": 943} {"train_loss": -5.775594711303711, "global_step": 39611, "epoch": 943} {"train_loss": -5.6517109870910645, "global_step": 39612, "epoch": 943} {"train_loss": -5.5471601486206055, "global_step": 39613, "epoch": 943} {"train_loss": -5.571730613708496, "global_step": 39614, "epoch": 943} {"train_loss": -5.737523078918457, "global_step": 39615, "epoch": 943} {"train_loss": -5.638935089111328, "global_step": 39616, "epoch": 943} {"train_loss": -5.67913818359375, "global_step": 39617, "epoch": 943} {"train_loss": -5.589077949523926, "global_step": 39618, "epoch": 943} {"train_loss": -5.633419990539551, "global_step": 39619, "epoch": 943} {"train_loss": -5.625759124755859, "global_step": 39620, "epoch": 943} {"train_loss": -5.416242599487305, "global_step": 39621, "epoch": 943} {"train_loss": -5.559979438781738, "global_step": 39622, "epoch": 943} {"train_loss": -5.602655410766602, "global_step": 39623, "epoch": 943} {"train_loss": -5.583000183105469, "global_step": 39624, "epoch": 943} {"train_loss": -5.628052711486816, "global_step": 39625, "epoch": 943} {"train_loss": -5.536318778991699, "global_step": 39626, "epoch": 943} {"train_loss": -5.6175150871276855, "global_step": 39627, "epoch": 943} {"train_loss": -5.5500898361206055, "global_step": 39628, "epoch": 943} {"train_loss": -5.549689292907715, "global_step": 39629, "epoch": 943} {"train_loss": -5.515733242034912, "global_step": 39630, "epoch": 943} {"train_loss": -5.473847389221191, "global_step": 39631, "epoch": 943} {"train_loss": -5.490816116333008, "global_step": 39632, "epoch": 943} {"train_loss": -5.623598098754883, "global_step": 39633, "epoch": 943} {"train_loss": -5.524388313293457, "global_step": 39634, "epoch": 943} {"train_loss": -5.581280708312988, "global_step": 39635, "epoch": 943} {"train_loss": -5.541042327880859, "global_step": 39636, "epoch": 943} {"train_loss": -5.456667423248291, "global_step": 39637, "epoch": 943} {"train_loss": -5.692852973937988, "global_step": 39638, "epoch": 943} {"train_loss": -5.576240539550781, "global_step": 39639, "epoch": 943} {"train_loss": -5.685466766357422, "global_step": 39640, "epoch": 943} {"train_loss": -5.648314952850342, "global_step": 39641, "epoch": 943} {"train_loss": -5.7096099853515625, "global_step": 39642, "epoch": 943} {"train_loss": -5.67384147644043, "global_step": 39643, "epoch": 943} {"train_loss": -5.700745582580566, "global_step": 39644, "epoch": 943} {"train_loss": -5.604432106018066, "global_step": 39645, "epoch": 943} {"train_loss": -5.577922821044922, "global_step": 39646, "epoch": 943} {"train_loss": -5.607084796542213, "global_step": 39647, "epoch": 943, "val_loss": 66009.1640625} {"train_loss": -5.6516194343566895, "global_step": 39648, "epoch": 944} {"train_loss": -5.566714763641357, "global_step": 39649, "epoch": 944} {"train_loss": -5.745209693908691, "global_step": 39650, "epoch": 944} {"train_loss": -5.62652587890625, "global_step": 39651, "epoch": 944} {"train_loss": -5.593513011932373, "global_step": 39652, "epoch": 944} {"train_loss": -5.571256637573242, "global_step": 39653, "epoch": 944} {"train_loss": -5.629809379577637, "global_step": 39654, "epoch": 944} {"train_loss": -5.698333263397217, "global_step": 39655, "epoch": 944} {"train_loss": -5.668105125427246, "global_step": 39656, "epoch": 944} {"train_loss": -5.623740196228027, "global_step": 39657, "epoch": 944} {"train_loss": -5.775849342346191, "global_step": 39658, "epoch": 944} {"train_loss": -5.612984657287598, "global_step": 39659, "epoch": 944} {"train_loss": -5.602347373962402, "global_step": 39660, "epoch": 944} {"train_loss": -5.615959167480469, "global_step": 39661, "epoch": 944} {"train_loss": -5.59291934967041, "global_step": 39662, "epoch": 944} {"train_loss": -5.639698505401611, "global_step": 39663, "epoch": 944} {"train_loss": -5.701995372772217, "global_step": 39664, "epoch": 944} {"train_loss": -5.663172721862793, "global_step": 39665, "epoch": 944} {"train_loss": -5.559488773345947, "global_step": 39666, "epoch": 944} {"train_loss": -5.7027106285095215, "global_step": 39667, "epoch": 944} {"train_loss": -5.70698356628418, "global_step": 39668, "epoch": 944} {"train_loss": -5.663880825042725, "global_step": 39669, "epoch": 944} {"train_loss": -5.751378059387207, "global_step": 39670, "epoch": 944} {"train_loss": -5.620277404785156, "global_step": 39671, "epoch": 944} {"train_loss": -5.657126426696777, "global_step": 39672, "epoch": 944} {"train_loss": -5.593738555908203, "global_step": 39673, "epoch": 944} {"train_loss": -5.64377498626709, "global_step": 39674, "epoch": 944} {"train_loss": -5.67056941986084, "global_step": 39675, "epoch": 944} {"train_loss": -5.512530326843262, "global_step": 39676, "epoch": 944} {"train_loss": -5.608291149139404, "global_step": 39677, "epoch": 944} {"train_loss": -5.727112770080566, "global_step": 39678, "epoch": 944} {"train_loss": -5.536656379699707, "global_step": 39679, "epoch": 944} {"train_loss": -5.6261491775512695, "global_step": 39680, "epoch": 944} {"train_loss": -5.521342754364014, "global_step": 39681, "epoch": 944} {"train_loss": -5.591986179351807, "global_step": 39682, "epoch": 944} {"train_loss": -5.616191864013672, "global_step": 39683, "epoch": 944} {"train_loss": -5.701714038848877, "global_step": 39684, "epoch": 944} {"train_loss": -5.683043956756592, "global_step": 39685, "epoch": 944} {"train_loss": -5.627813816070557, "global_step": 39686, "epoch": 944} {"train_loss": -5.773632049560547, "global_step": 39687, "epoch": 944} {"train_loss": -5.539154052734375, "global_step": 39688, "epoch": 944} {"train_loss": -5.6363581248692105, "global_step": 39689, "epoch": 944, "val_loss": 65959.921875} {"train_loss": -5.7698259353637695, "global_step": 39690, "epoch": 945} {"train_loss": -5.616070747375488, "global_step": 39691, "epoch": 945} {"train_loss": -5.5155816078186035, "global_step": 39692, "epoch": 945} {"train_loss": -5.629996299743652, "global_step": 39693, "epoch": 945} {"train_loss": -5.6397600173950195, "global_step": 39694, "epoch": 945} {"train_loss": -5.817199230194092, "global_step": 39695, "epoch": 945} {"train_loss": -5.570526123046875, "global_step": 39696, "epoch": 945} {"train_loss": -5.574113368988037, "global_step": 39697, "epoch": 945} {"train_loss": -5.611771106719971, "global_step": 39698, "epoch": 945} {"train_loss": -5.699344635009766, "global_step": 39699, "epoch": 945} {"train_loss": -5.4764404296875, "global_step": 39700, "epoch": 945} {"train_loss": -5.53669548034668, "global_step": 39701, "epoch": 945} {"train_loss": -5.51292610168457, "global_step": 39702, "epoch": 945} {"train_loss": -5.483140468597412, "global_step": 39703, "epoch": 945} {"train_loss": -5.690610408782959, "global_step": 39704, "epoch": 945} {"train_loss": -5.566073417663574, "global_step": 39705, "epoch": 945} {"train_loss": -5.552706718444824, "global_step": 39706, "epoch": 945} {"train_loss": -5.684685707092285, "global_step": 39707, "epoch": 945} {"train_loss": -5.506336212158203, "global_step": 39708, "epoch": 945} {"train_loss": -5.6072540283203125, "global_step": 39709, "epoch": 945} {"train_loss": -5.496123313903809, "global_step": 39710, "epoch": 945} {"train_loss": -5.63575553894043, "global_step": 39711, "epoch": 945} {"train_loss": -5.553799629211426, "global_step": 39712, "epoch": 945} {"train_loss": -5.6555681228637695, "global_step": 39713, "epoch": 945} {"train_loss": -5.586838722229004, "global_step": 39714, "epoch": 945} {"train_loss": -5.5828704833984375, "global_step": 39715, "epoch": 945} {"train_loss": -5.603295803070068, "global_step": 39716, "epoch": 945} {"train_loss": -5.569726467132568, "global_step": 39717, "epoch": 945} {"train_loss": -5.578359127044678, "global_step": 39718, "epoch": 945} {"train_loss": -5.62777042388916, "global_step": 39719, "epoch": 945} {"train_loss": -5.624490737915039, "global_step": 39720, "epoch": 945} {"train_loss": -5.5999369621276855, "global_step": 39721, "epoch": 945} {"train_loss": -5.632698059082031, "global_step": 39722, "epoch": 945} {"train_loss": -5.808989524841309, "global_step": 39723, "epoch": 945} {"train_loss": -5.656675338745117, "global_step": 39724, "epoch": 945} {"train_loss": -5.776458740234375, "global_step": 39725, "epoch": 945} {"train_loss": -5.519427299499512, "global_step": 39726, "epoch": 945} {"train_loss": -5.66411018371582, "global_step": 39727, "epoch": 945} {"train_loss": -5.612209320068359, "global_step": 39728, "epoch": 945} {"train_loss": -5.604510307312012, "global_step": 39729, "epoch": 945} {"train_loss": -5.588959217071533, "global_step": 39730, "epoch": 945} {"train_loss": -5.608994801839192, "global_step": 39731, "epoch": 945, "val_loss": 65999.3515625} {"train_loss": -5.58900785446167, "global_step": 39732, "epoch": 946} {"train_loss": -5.674901008605957, "global_step": 39733, "epoch": 946} {"train_loss": -5.66408634185791, "global_step": 39734, "epoch": 946} {"train_loss": -5.646228313446045, "global_step": 39735, "epoch": 946} {"train_loss": -5.603266716003418, "global_step": 39736, "epoch": 946} {"train_loss": -5.718585968017578, "global_step": 39737, "epoch": 946} {"train_loss": -5.678979873657227, "global_step": 39738, "epoch": 946} {"train_loss": -5.543614387512207, "global_step": 39739, "epoch": 946} {"train_loss": -5.72305965423584, "global_step": 39740, "epoch": 946} {"train_loss": -5.609349727630615, "global_step": 39741, "epoch": 946} {"train_loss": -5.756443500518799, "global_step": 39742, "epoch": 946} {"train_loss": -5.579493522644043, "global_step": 39743, "epoch": 946} {"train_loss": -5.583053112030029, "global_step": 39744, "epoch": 946} {"train_loss": -5.683444023132324, "global_step": 39745, "epoch": 946} {"train_loss": -5.608325958251953, "global_step": 39746, "epoch": 946} {"train_loss": -5.598988056182861, "global_step": 39747, "epoch": 946} {"train_loss": -5.649688720703125, "global_step": 39748, "epoch": 946} {"train_loss": -5.537928581237793, "global_step": 39749, "epoch": 946} {"train_loss": -5.701378345489502, "global_step": 39750, "epoch": 946} {"train_loss": -5.576234817504883, "global_step": 39751, "epoch": 946} {"train_loss": -5.552853107452393, "global_step": 39752, "epoch": 946} {"train_loss": -5.667992115020752, "global_step": 39753, "epoch": 946} {"train_loss": -5.677499771118164, "global_step": 39754, "epoch": 946} {"train_loss": -5.605595111846924, "global_step": 39755, "epoch": 946} {"train_loss": -5.59547233581543, "global_step": 39756, "epoch": 946} {"train_loss": -5.608892440795898, "global_step": 39757, "epoch": 946} {"train_loss": -5.621595859527588, "global_step": 39758, "epoch": 946} {"train_loss": -5.602250099182129, "global_step": 39759, "epoch": 946} {"train_loss": -5.641882419586182, "global_step": 39760, "epoch": 946} {"train_loss": -5.586307525634766, "global_step": 39761, "epoch": 946} {"train_loss": -5.534885406494141, "global_step": 39762, "epoch": 946} {"train_loss": -5.608760356903076, "global_step": 39763, "epoch": 946} {"train_loss": -5.610064506530762, "global_step": 39764, "epoch": 946} {"train_loss": -5.560976982116699, "global_step": 39765, "epoch": 946} {"train_loss": -5.602249622344971, "global_step": 39766, "epoch": 946} {"train_loss": -5.630690574645996, "global_step": 39767, "epoch": 946} {"train_loss": -5.613183975219727, "global_step": 39768, "epoch": 946} {"train_loss": -5.592937469482422, "global_step": 39769, "epoch": 946} {"train_loss": -5.49009895324707, "global_step": 39770, "epoch": 946} {"train_loss": -5.536785125732422, "global_step": 39771, "epoch": 946} {"train_loss": -5.540349960327148, "global_step": 39772, "epoch": 946} {"train_loss": -5.615674677349272, "global_step": 39773, "epoch": 946, "val_loss": 66096.3046875} {"train_loss": -5.632611274719238, "global_step": 39774, "epoch": 947} {"train_loss": -5.546132564544678, "global_step": 39775, "epoch": 947} {"train_loss": -5.51824951171875, "global_step": 39776, "epoch": 947} {"train_loss": -5.646816253662109, "global_step": 39777, "epoch": 947} {"train_loss": -5.6049485206604, "global_step": 39778, "epoch": 947} {"train_loss": -5.581827163696289, "global_step": 39779, "epoch": 947} {"train_loss": -5.677075386047363, "global_step": 39780, "epoch": 947} {"train_loss": -5.5227766036987305, "global_step": 39781, "epoch": 947} {"train_loss": -5.711148262023926, "global_step": 39782, "epoch": 947} {"train_loss": -5.618745803833008, "global_step": 39783, "epoch": 947} {"train_loss": -5.675618648529053, "global_step": 39784, "epoch": 947} {"train_loss": -5.484766006469727, "global_step": 39785, "epoch": 947} {"train_loss": -5.662407875061035, "global_step": 39786, "epoch": 947} {"train_loss": -5.618167877197266, "global_step": 39787, "epoch": 947} {"train_loss": -5.648680210113525, "global_step": 39788, "epoch": 947} {"train_loss": -5.6989030838012695, "global_step": 39789, "epoch": 947} {"train_loss": -5.496138572692871, "global_step": 39790, "epoch": 947} {"train_loss": -5.626743793487549, "global_step": 39791, "epoch": 947} {"train_loss": -5.616705894470215, "global_step": 39792, "epoch": 947} {"train_loss": -5.769973278045654, "global_step": 39793, "epoch": 947} {"train_loss": -5.714322090148926, "global_step": 39794, "epoch": 947} {"train_loss": -5.613055229187012, "global_step": 39795, "epoch": 947} {"train_loss": -5.637282371520996, "global_step": 39796, "epoch": 947} {"train_loss": -5.660805702209473, "global_step": 39797, "epoch": 947} {"train_loss": -5.718055725097656, "global_step": 39798, "epoch": 947} {"train_loss": -5.559237480163574, "global_step": 39799, "epoch": 947} {"train_loss": -5.717583656311035, "global_step": 39800, "epoch": 947} {"train_loss": -5.5424275398254395, "global_step": 39801, "epoch": 947} {"train_loss": -5.6907196044921875, "global_step": 39802, "epoch": 947} {"train_loss": -5.54626989364624, "global_step": 39803, "epoch": 947} {"train_loss": -5.7527618408203125, "global_step": 39804, "epoch": 947} {"train_loss": -5.623775482177734, "global_step": 39805, "epoch": 947} {"train_loss": -5.634128570556641, "global_step": 39806, "epoch": 947} {"train_loss": -5.548771858215332, "global_step": 39807, "epoch": 947} {"train_loss": -5.601110458374023, "global_step": 39808, "epoch": 947} {"train_loss": -5.780853271484375, "global_step": 39809, "epoch": 947} {"train_loss": -5.578856468200684, "global_step": 39810, "epoch": 947} {"train_loss": -5.736231803894043, "global_step": 39811, "epoch": 947} {"train_loss": -5.577281951904297, "global_step": 39812, "epoch": 947} {"train_loss": -5.642122268676758, "global_step": 39813, "epoch": 947} {"train_loss": -5.684040546417236, "global_step": 39814, "epoch": 947} {"train_loss": -5.633713222685314, "global_step": 39815, "epoch": 947, "val_loss": 66000.5546875} {"train_loss": -5.66994571685791, "global_step": 39816, "epoch": 948} {"train_loss": -5.534642219543457, "global_step": 39817, "epoch": 948} {"train_loss": -5.578630447387695, "global_step": 39818, "epoch": 948} {"train_loss": -5.5375471115112305, "global_step": 39819, "epoch": 948} {"train_loss": -5.694949150085449, "global_step": 39820, "epoch": 948} {"train_loss": -5.658609390258789, "global_step": 39821, "epoch": 948} {"train_loss": -5.6008477210998535, "global_step": 39822, "epoch": 948} {"train_loss": -5.610124588012695, "global_step": 39823, "epoch": 948} {"train_loss": -5.598054885864258, "global_step": 39824, "epoch": 948} {"train_loss": -5.749089241027832, "global_step": 39825, "epoch": 948} {"train_loss": -5.64592170715332, "global_step": 39826, "epoch": 948} {"train_loss": -5.629292011260986, "global_step": 39827, "epoch": 948} {"train_loss": -5.627350807189941, "global_step": 39828, "epoch": 948} {"train_loss": -5.696715354919434, "global_step": 39829, "epoch": 948} {"train_loss": -5.622490406036377, "global_step": 39830, "epoch": 948} {"train_loss": -5.630650520324707, "global_step": 39831, "epoch": 948} {"train_loss": -5.666266441345215, "global_step": 39832, "epoch": 948} {"train_loss": -5.559784889221191, "global_step": 39833, "epoch": 948} {"train_loss": -5.591931343078613, "global_step": 39834, "epoch": 948} {"train_loss": -5.594581604003906, "global_step": 39835, "epoch": 948} {"train_loss": -5.528682231903076, "global_step": 39836, "epoch": 948} {"train_loss": -5.57377290725708, "global_step": 39837, "epoch": 948} {"train_loss": -5.585609436035156, "global_step": 39838, "epoch": 948} {"train_loss": -5.710407733917236, "global_step": 39839, "epoch": 948} {"train_loss": -5.691348075866699, "global_step": 39840, "epoch": 948} {"train_loss": -5.610300540924072, "global_step": 39841, "epoch": 948} {"train_loss": -5.6870574951171875, "global_step": 39842, "epoch": 948} {"train_loss": -5.677097320556641, "global_step": 39843, "epoch": 948} {"train_loss": -5.5698747634887695, "global_step": 39844, "epoch": 948} {"train_loss": -5.574586868286133, "global_step": 39845, "epoch": 948} {"train_loss": -5.702880382537842, "global_step": 39846, "epoch": 948} {"train_loss": -5.670324325561523, "global_step": 39847, "epoch": 948} {"train_loss": -5.658952713012695, "global_step": 39848, "epoch": 948} {"train_loss": -5.656147480010986, "global_step": 39849, "epoch": 948} {"train_loss": -5.614171028137207, "global_step": 39850, "epoch": 948} {"train_loss": -5.482064247131348, "global_step": 39851, "epoch": 948} {"train_loss": -5.624792575836182, "global_step": 39852, "epoch": 948} {"train_loss": -5.428469657897949, "global_step": 39853, "epoch": 948} {"train_loss": -5.691662788391113, "global_step": 39854, "epoch": 948} {"train_loss": -5.524357318878174, "global_step": 39855, "epoch": 948} {"train_loss": -5.575847625732422, "global_step": 39856, "epoch": 948} {"train_loss": -5.621265842801049, "global_step": 39857, "epoch": 948, "val_loss": 65987.140625} {"train_loss": -5.493411064147949, "global_step": 39858, "epoch": 949} {"train_loss": -5.686890602111816, "global_step": 39859, "epoch": 949} {"train_loss": -5.570651054382324, "global_step": 39860, "epoch": 949} {"train_loss": -5.699733257293701, "global_step": 39861, "epoch": 949} {"train_loss": -5.539284706115723, "global_step": 39862, "epoch": 949} {"train_loss": -5.499824523925781, "global_step": 39863, "epoch": 949} {"train_loss": -5.562307357788086, "global_step": 39864, "epoch": 949} {"train_loss": -5.4880523681640625, "global_step": 39865, "epoch": 949} {"train_loss": -5.661654472351074, "global_step": 39866, "epoch": 949} {"train_loss": -5.43753719329834, "global_step": 39867, "epoch": 949} {"train_loss": -5.589588642120361, "global_step": 39868, "epoch": 949} {"train_loss": -5.6261138916015625, "global_step": 39869, "epoch": 949} {"train_loss": -5.43537712097168, "global_step": 39870, "epoch": 949} {"train_loss": -5.70427131652832, "global_step": 39871, "epoch": 949} {"train_loss": -5.494452953338623, "global_step": 39872, "epoch": 949} {"train_loss": -5.567019462585449, "global_step": 39873, "epoch": 949} {"train_loss": -5.692584037780762, "global_step": 39874, "epoch": 949} {"train_loss": -5.436641693115234, "global_step": 39875, "epoch": 949} {"train_loss": -5.738807678222656, "global_step": 39876, "epoch": 949} {"train_loss": -5.500733852386475, "global_step": 39877, "epoch": 949} {"train_loss": -5.48109245300293, "global_step": 39878, "epoch": 949} {"train_loss": -5.5333356857299805, "global_step": 39879, "epoch": 949} {"train_loss": -5.488118648529053, "global_step": 39880, "epoch": 949} {"train_loss": -5.7180280685424805, "global_step": 39881, "epoch": 949} {"train_loss": -5.7027435302734375, "global_step": 39882, "epoch": 949} {"train_loss": -5.592517852783203, "global_step": 39883, "epoch": 949} {"train_loss": -5.548563003540039, "global_step": 39884, "epoch": 949} {"train_loss": -5.556182861328125, "global_step": 39885, "epoch": 949} {"train_loss": -5.6441755294799805, "global_step": 39886, "epoch": 949} {"train_loss": -5.455246925354004, "global_step": 39887, "epoch": 949} {"train_loss": -5.629541397094727, "global_step": 39888, "epoch": 949} {"train_loss": -5.650796413421631, "global_step": 39889, "epoch": 949} {"train_loss": -5.470935821533203, "global_step": 39890, "epoch": 949} {"train_loss": -5.684103965759277, "global_step": 39891, "epoch": 949} {"train_loss": -5.5902419090271, "global_step": 39892, "epoch": 949} {"train_loss": -5.601889133453369, "global_step": 39893, "epoch": 949} {"train_loss": -5.677014350891113, "global_step": 39894, "epoch": 949} {"train_loss": -5.549764156341553, "global_step": 39895, "epoch": 949} {"train_loss": -5.648031234741211, "global_step": 39896, "epoch": 949} {"train_loss": -5.589336395263672, "global_step": 39897, "epoch": 949} {"train_loss": -5.513976097106934, "global_step": 39898, "epoch": 949} {"train_loss": -5.582942837760562, "global_step": 39899, "epoch": 949, "val_loss": 66331.6015625} {"train_loss": -5.475067615509033, "global_step": 39900, "epoch": 950} {"train_loss": -5.649658679962158, "global_step": 39901, "epoch": 950} {"train_loss": -5.550943374633789, "global_step": 39902, "epoch": 950} {"train_loss": -5.479744911193848, "global_step": 39903, "epoch": 950} {"train_loss": -5.706360816955566, "global_step": 39904, "epoch": 950} {"train_loss": -5.544221878051758, "global_step": 39905, "epoch": 950} {"train_loss": -5.739924907684326, "global_step": 39906, "epoch": 950} {"train_loss": -5.630034446716309, "global_step": 39907, "epoch": 950} {"train_loss": -5.500473976135254, "global_step": 39908, "epoch": 950} {"train_loss": -5.779221057891846, "global_step": 39909, "epoch": 950} {"train_loss": -5.57321834564209, "global_step": 39910, "epoch": 950} {"train_loss": -5.60125732421875, "global_step": 39911, "epoch": 950} {"train_loss": -5.7200422286987305, "global_step": 39912, "epoch": 950} {"train_loss": -5.682212829589844, "global_step": 39913, "epoch": 950} {"train_loss": -5.662708282470703, "global_step": 39914, "epoch": 950} {"train_loss": -5.48660945892334, "global_step": 39915, "epoch": 950} {"train_loss": -5.69857120513916, "global_step": 39916, "epoch": 950} {"train_loss": -5.713926315307617, "global_step": 39917, "epoch": 950} {"train_loss": -5.562624931335449, "global_step": 39918, "epoch": 950} {"train_loss": -5.6409101486206055, "global_step": 39919, "epoch": 950} {"train_loss": -5.736844062805176, "global_step": 39920, "epoch": 950} {"train_loss": -5.643500328063965, "global_step": 39921, "epoch": 950} {"train_loss": -5.633821964263916, "global_step": 39922, "epoch": 950} {"train_loss": -5.7288923263549805, "global_step": 39923, "epoch": 950} {"train_loss": -5.722201347351074, "global_step": 39924, "epoch": 950} {"train_loss": -5.503140449523926, "global_step": 39925, "epoch": 950} {"train_loss": -5.776711940765381, "global_step": 39926, "epoch": 950} {"train_loss": -5.610254764556885, "global_step": 39927, "epoch": 950} {"train_loss": -5.582823753356934, "global_step": 39928, "epoch": 950} {"train_loss": -5.593646049499512, "global_step": 39929, "epoch": 950} {"train_loss": -5.715461730957031, "global_step": 39930, "epoch": 950} {"train_loss": -5.59652853012085, "global_step": 39931, "epoch": 950} {"train_loss": -5.666928291320801, "global_step": 39932, "epoch": 950} {"train_loss": -5.7235212326049805, "global_step": 39933, "epoch": 950} {"train_loss": -5.617197036743164, "global_step": 39934, "epoch": 950} {"train_loss": -5.739240646362305, "global_step": 39935, "epoch": 950} {"train_loss": -5.694952487945557, "global_step": 39936, "epoch": 950} {"train_loss": -5.581916809082031, "global_step": 39937, "epoch": 950} {"train_loss": -5.594708442687988, "global_step": 39938, "epoch": 950} {"train_loss": -5.61317253112793, "global_step": 39939, "epoch": 950} {"train_loss": -5.62263298034668, "global_step": 39940, "epoch": 950} {"train_loss": -5.637348402114141, "global_step": 39941, "epoch": 950, "train/sim_max_reward_0": 0.4309446518950438, "train/sim_max_reward_1": 0.001147971476521298, "train/sim_max_reward_2": 0.49202521349543554, "train/sim_max_reward_3": 0.16153321101825568, "train/sim_max_reward_4": 0.4542806832631274, "train/sim_max_reward_5": 0.5480485062137426, "test/sim_max_reward_4400000": 0.1613087107767035, "test/sim_max_reward_4400001": 0.12495639403190094, "test/sim_max_reward_4400002": 0.1783199966412781, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17334790230477, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.4829831907970814, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.5899256615028404, "test/sim_max_reward_4400009": 0.5097510876273056, "test/sim_max_reward_4400010": 0.1622481220924242, "test/sim_max_reward_4400011": 0.30414412919097306, "test/sim_max_reward_4400012": 0.381233683579035, "test/sim_max_reward_4400013": 0.9014379384879757, "test/sim_max_reward_4400014": 0.09217218130689218, "test/sim_max_reward_4400015": 0.22155380358045695, "test/sim_max_reward_4400016": 0.268646921935863, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.291907655031693, "test/sim_max_reward_4400019": 0.0948652885871483, "test/sim_max_reward_4400020": 0.00039858378559703175, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.5794219839976643, "test/sim_max_reward_4400023": 0.13381469758177697, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.8640443928192143, "test/sim_max_reward_4400027": 0.13506178132596056, "test/sim_max_reward_4400028": 0.3192892314367053, "test/sim_max_reward_4400029": 0.19044672507137894, "test/sim_max_reward_4400030": 0.7545759504543892, "test/sim_max_reward_4400031": 0.23275054818003987, "test/sim_max_reward_4400032": 1.0, "test/sim_max_reward_4400033": 0.47112228632035735, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.46815639290179706, "test/sim_max_reward_4400036": 0.415981805144776, "test/sim_max_reward_4400037": 0.3042433685494449, "test/sim_max_reward_4400038": 0.15802768752003252, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.47174409850321, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.01886189446086715, "test/sim_max_reward_4400044": 0.9280486608189533, "test/sim_max_reward_4400045": 0.49373697624123075, "test/sim_max_reward_4400046": 0.2800966642793783, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.40129904067771316, "test/sim_max_reward_4400049": 0.0009426071190695369, "train/mean_score": 0.34799670622702106, "test/mean_score": 0.3256175809514829, "val_loss": 65943.1171875} {"train_loss": -5.562703609466553, "global_step": 39942, "epoch": 951} {"train_loss": -5.600139617919922, "global_step": 39943, "epoch": 951} {"train_loss": -5.467776298522949, "global_step": 39944, "epoch": 951} {"train_loss": -5.726027011871338, "global_step": 39945, "epoch": 951} {"train_loss": -5.7061944007873535, "global_step": 39946, "epoch": 951} {"train_loss": -5.479389667510986, "global_step": 39947, "epoch": 951} {"train_loss": -5.671870231628418, "global_step": 39948, "epoch": 951} {"train_loss": -5.603257179260254, "global_step": 39949, "epoch": 951} {"train_loss": -5.562758922576904, "global_step": 39950, "epoch": 951} {"train_loss": -5.635519981384277, "global_step": 39951, "epoch": 951} {"train_loss": -5.605131149291992, "global_step": 39952, "epoch": 951} {"train_loss": -5.730665683746338, "global_step": 39953, "epoch": 951} {"train_loss": -5.645631790161133, "global_step": 39954, "epoch": 951} {"train_loss": -5.647397041320801, "global_step": 39955, "epoch": 951} {"train_loss": -5.729772567749023, "global_step": 39956, "epoch": 951} {"train_loss": -5.729537010192871, "global_step": 39957, "epoch": 951} {"train_loss": -5.683647155761719, "global_step": 39958, "epoch": 951} {"train_loss": -5.689740180969238, "global_step": 39959, "epoch": 951} {"train_loss": -5.524872779846191, "global_step": 39960, "epoch": 951} {"train_loss": -5.660985946655273, "global_step": 39961, "epoch": 951} {"train_loss": -5.682682991027832, "global_step": 39962, "epoch": 951} {"train_loss": -5.496442794799805, "global_step": 39963, "epoch": 951} {"train_loss": -5.651005268096924, "global_step": 39964, "epoch": 951} {"train_loss": -5.6787309646606445, "global_step": 39965, "epoch": 951} {"train_loss": -5.584258556365967, "global_step": 39966, "epoch": 951} {"train_loss": -5.447650909423828, "global_step": 39967, "epoch": 951} {"train_loss": -5.592362403869629, "global_step": 39968, "epoch": 951} {"train_loss": -5.67619514465332, "global_step": 39969, "epoch": 951} {"train_loss": -5.65013313293457, "global_step": 39970, "epoch": 951} {"train_loss": -5.649303436279297, "global_step": 39971, "epoch": 951} {"train_loss": -5.59342098236084, "global_step": 39972, "epoch": 951} {"train_loss": -5.6798930168151855, "global_step": 39973, "epoch": 951} {"train_loss": -5.559648036956787, "global_step": 39974, "epoch": 951} {"train_loss": -5.698920249938965, "global_step": 39975, "epoch": 951} {"train_loss": -5.6074018478393555, "global_step": 39976, "epoch": 951} {"train_loss": -5.5502028465271, "global_step": 39977, "epoch": 951} {"train_loss": -5.403805732727051, "global_step": 39978, "epoch": 951} {"train_loss": -5.610262393951416, "global_step": 39979, "epoch": 951} {"train_loss": -5.381880283355713, "global_step": 39980, "epoch": 951} {"train_loss": -5.695547580718994, "global_step": 39981, "epoch": 951} {"train_loss": -5.598455429077148, "global_step": 39982, "epoch": 951} {"train_loss": -5.6142706871032715, "global_step": 39983, "epoch": 951, "val_loss": 65936.96875} {"train_loss": -5.599147796630859, "global_step": 39984, "epoch": 952} {"train_loss": -5.6532416343688965, "global_step": 39985, "epoch": 952} {"train_loss": -5.679945468902588, "global_step": 39986, "epoch": 952} {"train_loss": -5.724478721618652, "global_step": 39987, "epoch": 952} {"train_loss": -5.586946487426758, "global_step": 39988, "epoch": 952} {"train_loss": -5.676775932312012, "global_step": 39989, "epoch": 952} {"train_loss": -5.659333229064941, "global_step": 39990, "epoch": 952} {"train_loss": -5.621798515319824, "global_step": 39991, "epoch": 952} {"train_loss": -5.730536460876465, "global_step": 39992, "epoch": 952} {"train_loss": -5.631962299346924, "global_step": 39993, "epoch": 952} {"train_loss": -5.775189399719238, "global_step": 39994, "epoch": 952} {"train_loss": -5.641734600067139, "global_step": 39995, "epoch": 952} {"train_loss": -5.6148481369018555, "global_step": 39996, "epoch": 952} {"train_loss": -5.5727715492248535, "global_step": 39997, "epoch": 952} {"train_loss": -5.679603576660156, "global_step": 39998, "epoch": 952} {"train_loss": -5.617132663726807, "global_step": 39999, "epoch": 952} {"train_loss": -5.660821914672852, "global_step": 40000, "epoch": 952} {"train_loss": -5.573893070220947, "global_step": 40001, "epoch": 952} {"train_loss": -5.7784423828125, "global_step": 40002, "epoch": 952} {"train_loss": -5.615568161010742, "global_step": 40003, "epoch": 952} {"train_loss": -5.679142951965332, "global_step": 40004, "epoch": 952} {"train_loss": -5.627261638641357, "global_step": 40005, "epoch": 952} {"train_loss": -5.597452163696289, "global_step": 40006, "epoch": 952} {"train_loss": -5.716670036315918, "global_step": 40007, "epoch": 952} {"train_loss": -5.725137710571289, "global_step": 40008, "epoch": 952} {"train_loss": -5.741698265075684, "global_step": 40009, "epoch": 952} {"train_loss": -5.610485076904297, "global_step": 40010, "epoch": 952} {"train_loss": -5.643779754638672, "global_step": 40011, "epoch": 952} {"train_loss": -5.657698631286621, "global_step": 40012, "epoch": 952} {"train_loss": -5.541535377502441, "global_step": 40013, "epoch": 952} {"train_loss": -5.584415435791016, "global_step": 40014, "epoch": 952} {"train_loss": -5.592681884765625, "global_step": 40015, "epoch": 952} {"train_loss": -5.5947723388671875, "global_step": 40016, "epoch": 952} {"train_loss": -5.654966354370117, "global_step": 40017, "epoch": 952} {"train_loss": -5.5697150230407715, "global_step": 40018, "epoch": 952} {"train_loss": -5.46884822845459, "global_step": 40019, "epoch": 952} {"train_loss": -5.606189727783203, "global_step": 40020, "epoch": 952} {"train_loss": -5.6270036697387695, "global_step": 40021, "epoch": 952} {"train_loss": -5.478564262390137, "global_step": 40022, "epoch": 952} {"train_loss": -5.60318660736084, "global_step": 40023, "epoch": 952} {"train_loss": -5.53746223449707, "global_step": 40024, "epoch": 952} {"train_loss": -5.632374445597331, "global_step": 40025, "epoch": 952, "val_loss": 65906.71875} {"train_loss": -5.577362060546875, "global_step": 40026, "epoch": 953} {"train_loss": -5.535260200500488, "global_step": 40027, "epoch": 953} {"train_loss": -5.574233055114746, "global_step": 40028, "epoch": 953} {"train_loss": -5.698247909545898, "global_step": 40029, "epoch": 953} {"train_loss": -5.652630805969238, "global_step": 40030, "epoch": 953} {"train_loss": -5.635944843292236, "global_step": 40031, "epoch": 953} {"train_loss": -5.6088738441467285, "global_step": 40032, "epoch": 953} {"train_loss": -5.611144065856934, "global_step": 40033, "epoch": 953} {"train_loss": -5.602316856384277, "global_step": 40034, "epoch": 953} {"train_loss": -5.588955879211426, "global_step": 40035, "epoch": 953} {"train_loss": -5.7277021408081055, "global_step": 40036, "epoch": 953} {"train_loss": -5.490826606750488, "global_step": 40037, "epoch": 953} {"train_loss": -5.460202693939209, "global_step": 40038, "epoch": 953} {"train_loss": -5.627809524536133, "global_step": 40039, "epoch": 953} {"train_loss": -5.618386268615723, "global_step": 40040, "epoch": 953} {"train_loss": -5.647998332977295, "global_step": 40041, "epoch": 953} {"train_loss": -5.526195526123047, "global_step": 40042, "epoch": 953} {"train_loss": -5.61651086807251, "global_step": 40043, "epoch": 953} {"train_loss": -5.671267509460449, "global_step": 40044, "epoch": 953} {"train_loss": -5.532162189483643, "global_step": 40045, "epoch": 953} {"train_loss": -5.509241580963135, "global_step": 40046, "epoch": 953} {"train_loss": -5.665408134460449, "global_step": 40047, "epoch": 953} {"train_loss": -5.669059753417969, "global_step": 40048, "epoch": 953} {"train_loss": -5.64937686920166, "global_step": 40049, "epoch": 953} {"train_loss": -5.634098052978516, "global_step": 40050, "epoch": 953} {"train_loss": -5.672454357147217, "global_step": 40051, "epoch": 953} {"train_loss": -5.697240829467773, "global_step": 40052, "epoch": 953} {"train_loss": -5.586349010467529, "global_step": 40053, "epoch": 953} {"train_loss": -5.659143924713135, "global_step": 40054, "epoch": 953} {"train_loss": -5.670990467071533, "global_step": 40055, "epoch": 953} {"train_loss": -5.550307273864746, "global_step": 40056, "epoch": 953} {"train_loss": -5.66955041885376, "global_step": 40057, "epoch": 953} {"train_loss": -5.66090726852417, "global_step": 40058, "epoch": 953} {"train_loss": -5.586658000946045, "global_step": 40059, "epoch": 953} {"train_loss": -5.579023361206055, "global_step": 40060, "epoch": 953} {"train_loss": -5.642592906951904, "global_step": 40061, "epoch": 953} {"train_loss": -5.666240692138672, "global_step": 40062, "epoch": 953} {"train_loss": -5.657780647277832, "global_step": 40063, "epoch": 953} {"train_loss": -5.6257781982421875, "global_step": 40064, "epoch": 953} {"train_loss": -5.717766761779785, "global_step": 40065, "epoch": 953} {"train_loss": -5.720708847045898, "global_step": 40066, "epoch": 953} {"train_loss": -5.61894280569894, "global_step": 40067, "epoch": 953, "val_loss": 65969.421875} {"train_loss": -5.82003116607666, "global_step": 40068, "epoch": 954} {"train_loss": -5.614836692810059, "global_step": 40069, "epoch": 954} {"train_loss": -5.596519470214844, "global_step": 40070, "epoch": 954} {"train_loss": -5.598146438598633, "global_step": 40071, "epoch": 954} {"train_loss": -5.61429500579834, "global_step": 40072, "epoch": 954} {"train_loss": -5.65047550201416, "global_step": 40073, "epoch": 954} {"train_loss": -5.630911827087402, "global_step": 40074, "epoch": 954} {"train_loss": -5.5987229347229, "global_step": 40075, "epoch": 954} {"train_loss": -5.612950325012207, "global_step": 40076, "epoch": 954} {"train_loss": -5.541408061981201, "global_step": 40077, "epoch": 954} {"train_loss": -5.60189151763916, "global_step": 40078, "epoch": 954} {"train_loss": -5.568990707397461, "global_step": 40079, "epoch": 954} {"train_loss": -5.563403129577637, "global_step": 40080, "epoch": 954} {"train_loss": -5.589086532592773, "global_step": 40081, "epoch": 954} {"train_loss": -5.631955623626709, "global_step": 40082, "epoch": 954} {"train_loss": -5.74704122543335, "global_step": 40083, "epoch": 954} {"train_loss": -5.556815147399902, "global_step": 40084, "epoch": 954} {"train_loss": -5.605694770812988, "global_step": 40085, "epoch": 954} {"train_loss": -5.712365627288818, "global_step": 40086, "epoch": 954} {"train_loss": -5.6115922927856445, "global_step": 40087, "epoch": 954} {"train_loss": -5.526854038238525, "global_step": 40088, "epoch": 954} {"train_loss": -5.595038414001465, "global_step": 40089, "epoch": 954} {"train_loss": -5.629380702972412, "global_step": 40090, "epoch": 954} {"train_loss": -5.530266284942627, "global_step": 40091, "epoch": 954} {"train_loss": -5.548946380615234, "global_step": 40092, "epoch": 954} {"train_loss": -5.648366928100586, "global_step": 40093, "epoch": 954} {"train_loss": -5.578078746795654, "global_step": 40094, "epoch": 954} {"train_loss": -5.604467391967773, "global_step": 40095, "epoch": 954} {"train_loss": -5.636200904846191, "global_step": 40096, "epoch": 954} {"train_loss": -5.528806686401367, "global_step": 40097, "epoch": 954} {"train_loss": -5.616422653198242, "global_step": 40098, "epoch": 954} {"train_loss": -5.593400001525879, "global_step": 40099, "epoch": 954} {"train_loss": -5.555678844451904, "global_step": 40100, "epoch": 954} {"train_loss": -5.599677085876465, "global_step": 40101, "epoch": 954} {"train_loss": -5.642230987548828, "global_step": 40102, "epoch": 954} {"train_loss": -5.6121063232421875, "global_step": 40103, "epoch": 954} {"train_loss": -5.648402214050293, "global_step": 40104, "epoch": 954} {"train_loss": -5.685426712036133, "global_step": 40105, "epoch": 954} {"train_loss": -5.6547417640686035, "global_step": 40106, "epoch": 954} {"train_loss": -5.610021114349365, "global_step": 40107, "epoch": 954} {"train_loss": -5.468017578125, "global_step": 40108, "epoch": 954} {"train_loss": -5.608914318538847, "global_step": 40109, "epoch": 954, "val_loss": 65705.828125} {"train_loss": -5.759072303771973, "global_step": 40110, "epoch": 955} {"train_loss": -5.6619343757629395, "global_step": 40111, "epoch": 955} {"train_loss": -5.627204895019531, "global_step": 40112, "epoch": 955} {"train_loss": -5.713759422302246, "global_step": 40113, "epoch": 955} {"train_loss": -5.708591461181641, "global_step": 40114, "epoch": 955} {"train_loss": -5.574889183044434, "global_step": 40115, "epoch": 955} {"train_loss": -5.563300132751465, "global_step": 40116, "epoch": 955} {"train_loss": -5.707578659057617, "global_step": 40117, "epoch": 955} {"train_loss": -5.569359302520752, "global_step": 40118, "epoch": 955} {"train_loss": -5.64402961730957, "global_step": 40119, "epoch": 955} {"train_loss": -5.559379577636719, "global_step": 40120, "epoch": 955} {"train_loss": -5.647979259490967, "global_step": 40121, "epoch": 955} {"train_loss": -5.489193439483643, "global_step": 40122, "epoch": 955} {"train_loss": -5.760464668273926, "global_step": 40123, "epoch": 955} {"train_loss": -5.699810981750488, "global_step": 40124, "epoch": 955} {"train_loss": -5.583751201629639, "global_step": 40125, "epoch": 955} {"train_loss": -5.7396745681762695, "global_step": 40126, "epoch": 955} {"train_loss": -5.5799174308776855, "global_step": 40127, "epoch": 955} {"train_loss": -5.529696464538574, "global_step": 40128, "epoch": 955} {"train_loss": -5.791223049163818, "global_step": 40129, "epoch": 955} {"train_loss": -5.448981285095215, "global_step": 40130, "epoch": 955} {"train_loss": -5.659154891967773, "global_step": 40131, "epoch": 955} {"train_loss": -5.70143985748291, "global_step": 40132, "epoch": 955} {"train_loss": -5.575724124908447, "global_step": 40133, "epoch": 955} {"train_loss": -5.621997833251953, "global_step": 40134, "epoch": 955} {"train_loss": -5.53652811050415, "global_step": 40135, "epoch": 955} {"train_loss": -5.63313102722168, "global_step": 40136, "epoch": 955} {"train_loss": -5.76133918762207, "global_step": 40137, "epoch": 955} {"train_loss": -5.580039978027344, "global_step": 40138, "epoch": 955} {"train_loss": -5.610740661621094, "global_step": 40139, "epoch": 955} {"train_loss": -5.641275405883789, "global_step": 40140, "epoch": 955} {"train_loss": -5.632301330566406, "global_step": 40141, "epoch": 955} {"train_loss": -5.666983604431152, "global_step": 40142, "epoch": 955} {"train_loss": -5.652979850769043, "global_step": 40143, "epoch": 955} {"train_loss": -5.736516952514648, "global_step": 40144, "epoch": 955} {"train_loss": -5.615738868713379, "global_step": 40145, "epoch": 955} {"train_loss": -5.7265944480896, "global_step": 40146, "epoch": 955} {"train_loss": -5.702725410461426, "global_step": 40147, "epoch": 955} {"train_loss": -5.641526222229004, "global_step": 40148, "epoch": 955} {"train_loss": -5.592887878417969, "global_step": 40149, "epoch": 955} {"train_loss": -5.6502180099487305, "global_step": 40150, "epoch": 955} {"train_loss": -5.640041464851016, "global_step": 40151, "epoch": 955, "val_loss": 66179.9609375} {"train_loss": -5.700891494750977, "global_step": 40152, "epoch": 956} {"train_loss": -5.6591291427612305, "global_step": 40153, "epoch": 956} {"train_loss": -5.624770164489746, "global_step": 40154, "epoch": 956} {"train_loss": -5.561075687408447, "global_step": 40155, "epoch": 956} {"train_loss": -5.801929473876953, "global_step": 40156, "epoch": 956} {"train_loss": -5.516522407531738, "global_step": 40157, "epoch": 956} {"train_loss": -5.628722667694092, "global_step": 40158, "epoch": 956} {"train_loss": -5.585999488830566, "global_step": 40159, "epoch": 956} {"train_loss": -5.641798496246338, "global_step": 40160, "epoch": 956} {"train_loss": -5.718970775604248, "global_step": 40161, "epoch": 956} {"train_loss": -5.585077285766602, "global_step": 40162, "epoch": 956} {"train_loss": -5.772724151611328, "global_step": 40163, "epoch": 956} {"train_loss": -5.476747035980225, "global_step": 40164, "epoch": 956} {"train_loss": -5.55256462097168, "global_step": 40165, "epoch": 956} {"train_loss": -5.638091564178467, "global_step": 40166, "epoch": 956} {"train_loss": -5.456387519836426, "global_step": 40167, "epoch": 956} {"train_loss": -5.7221479415893555, "global_step": 40168, "epoch": 956} {"train_loss": -5.554157733917236, "global_step": 40169, "epoch": 956} {"train_loss": -5.610271453857422, "global_step": 40170, "epoch": 956} {"train_loss": -5.62180233001709, "global_step": 40171, "epoch": 956} {"train_loss": -5.602782249450684, "global_step": 40172, "epoch": 956} {"train_loss": -5.540843486785889, "global_step": 40173, "epoch": 956} {"train_loss": -5.575798988342285, "global_step": 40174, "epoch": 956} {"train_loss": -5.531312942504883, "global_step": 40175, "epoch": 956} {"train_loss": -5.549981117248535, "global_step": 40176, "epoch": 956} {"train_loss": -5.558257102966309, "global_step": 40177, "epoch": 956} {"train_loss": -5.648619174957275, "global_step": 40178, "epoch": 956} {"train_loss": -5.516236305236816, "global_step": 40179, "epoch": 956} {"train_loss": -5.609745025634766, "global_step": 40180, "epoch": 956} {"train_loss": -5.662492752075195, "global_step": 40181, "epoch": 956} {"train_loss": -5.625748157501221, "global_step": 40182, "epoch": 956} {"train_loss": -5.504556179046631, "global_step": 40183, "epoch": 956} {"train_loss": -5.478909015655518, "global_step": 40184, "epoch": 956} {"train_loss": -5.562560081481934, "global_step": 40185, "epoch": 956} {"train_loss": -5.592157363891602, "global_step": 40186, "epoch": 956} {"train_loss": -5.593990802764893, "global_step": 40187, "epoch": 956} {"train_loss": -5.558674335479736, "global_step": 40188, "epoch": 956} {"train_loss": -5.5671610832214355, "global_step": 40189, "epoch": 956} {"train_loss": -5.4994940757751465, "global_step": 40190, "epoch": 956} {"train_loss": -5.657873630523682, "global_step": 40191, "epoch": 956} {"train_loss": -5.748020172119141, "global_step": 40192, "epoch": 956} {"train_loss": -5.598105657668341, "global_step": 40193, "epoch": 956, "val_loss": 66534.53125} {"train_loss": -5.671855449676514, "global_step": 40194, "epoch": 957} {"train_loss": -5.694942474365234, "global_step": 40195, "epoch": 957} {"train_loss": -5.7346086502075195, "global_step": 40196, "epoch": 957} {"train_loss": -5.582873821258545, "global_step": 40197, "epoch": 957} {"train_loss": -5.6418375968933105, "global_step": 40198, "epoch": 957} {"train_loss": -5.687315940856934, "global_step": 40199, "epoch": 957} {"train_loss": -5.528140544891357, "global_step": 40200, "epoch": 957} {"train_loss": -5.533546447753906, "global_step": 40201, "epoch": 957} {"train_loss": -5.478305816650391, "global_step": 40202, "epoch": 957} {"train_loss": -5.716826915740967, "global_step": 40203, "epoch": 957} {"train_loss": -5.634389400482178, "global_step": 40204, "epoch": 957} {"train_loss": -5.540882110595703, "global_step": 40205, "epoch": 957} {"train_loss": -5.595993995666504, "global_step": 40206, "epoch": 957} {"train_loss": -5.660482406616211, "global_step": 40207, "epoch": 957} {"train_loss": -5.552709579467773, "global_step": 40208, "epoch": 957} {"train_loss": -5.7305908203125, "global_step": 40209, "epoch": 957} {"train_loss": -5.5432047843933105, "global_step": 40210, "epoch": 957} {"train_loss": -5.654627799987793, "global_step": 40211, "epoch": 957} {"train_loss": -5.52078104019165, "global_step": 40212, "epoch": 957} {"train_loss": -5.561120510101318, "global_step": 40213, "epoch": 957} {"train_loss": -5.580225944519043, "global_step": 40214, "epoch": 957} {"train_loss": -5.550901412963867, "global_step": 40215, "epoch": 957} {"train_loss": -5.70029354095459, "global_step": 40216, "epoch": 957} {"train_loss": -5.645397186279297, "global_step": 40217, "epoch": 957} {"train_loss": -5.560695171356201, "global_step": 40218, "epoch": 957} {"train_loss": -5.590883255004883, "global_step": 40219, "epoch": 957} {"train_loss": -5.618805885314941, "global_step": 40220, "epoch": 957} {"train_loss": -5.5507588386535645, "global_step": 40221, "epoch": 957} {"train_loss": -5.575260162353516, "global_step": 40222, "epoch": 957} {"train_loss": -5.668951988220215, "global_step": 40223, "epoch": 957} {"train_loss": -5.724564552307129, "global_step": 40224, "epoch": 957} {"train_loss": -5.5610198974609375, "global_step": 40225, "epoch": 957} {"train_loss": -5.669353485107422, "global_step": 40226, "epoch": 957} {"train_loss": -5.547746658325195, "global_step": 40227, "epoch": 957} {"train_loss": -5.587043762207031, "global_step": 40228, "epoch": 957} {"train_loss": -5.756772994995117, "global_step": 40229, "epoch": 957} {"train_loss": -5.617897987365723, "global_step": 40230, "epoch": 957} {"train_loss": -5.606977462768555, "global_step": 40231, "epoch": 957} {"train_loss": -5.60557222366333, "global_step": 40232, "epoch": 957} {"train_loss": -5.498899936676025, "global_step": 40233, "epoch": 957} {"train_loss": -5.650904655456543, "global_step": 40234, "epoch": 957} {"train_loss": -5.611201172783261, "global_step": 40235, "epoch": 957, "val_loss": 66394.21875} {"train_loss": -5.510235786437988, "global_step": 40236, "epoch": 958} {"train_loss": -5.590424537658691, "global_step": 40237, "epoch": 958} {"train_loss": -5.5806989669799805, "global_step": 40238, "epoch": 958} {"train_loss": -5.530294895172119, "global_step": 40239, "epoch": 958} {"train_loss": -5.591360569000244, "global_step": 40240, "epoch": 958} {"train_loss": -5.480891227722168, "global_step": 40241, "epoch": 958} {"train_loss": -5.684141159057617, "global_step": 40242, "epoch": 958} {"train_loss": -5.646076202392578, "global_step": 40243, "epoch": 958} {"train_loss": -5.49317741394043, "global_step": 40244, "epoch": 958} {"train_loss": -5.606383323669434, "global_step": 40245, "epoch": 958} {"train_loss": -5.618101119995117, "global_step": 40246, "epoch": 958} {"train_loss": -5.529766082763672, "global_step": 40247, "epoch": 958} {"train_loss": -5.654713153839111, "global_step": 40248, "epoch": 958} {"train_loss": -5.708017826080322, "global_step": 40249, "epoch": 958} {"train_loss": -5.582254886627197, "global_step": 40250, "epoch": 958} {"train_loss": -5.686222076416016, "global_step": 40251, "epoch": 958} {"train_loss": -5.499584674835205, "global_step": 40252, "epoch": 958} {"train_loss": -5.685480117797852, "global_step": 40253, "epoch": 958} {"train_loss": -5.508429527282715, "global_step": 40254, "epoch": 958} {"train_loss": -5.522322654724121, "global_step": 40255, "epoch": 958} {"train_loss": -5.6478190422058105, "global_step": 40256, "epoch": 958} {"train_loss": -5.638175964355469, "global_step": 40257, "epoch": 958} {"train_loss": -5.619182586669922, "global_step": 40258, "epoch": 958} {"train_loss": -5.517274856567383, "global_step": 40259, "epoch": 958} {"train_loss": -5.642586708068848, "global_step": 40260, "epoch": 958} {"train_loss": -5.5973052978515625, "global_step": 40261, "epoch": 958} {"train_loss": -5.662243843078613, "global_step": 40262, "epoch": 958} {"train_loss": -5.590048789978027, "global_step": 40263, "epoch": 958} {"train_loss": -5.664453983306885, "global_step": 40264, "epoch": 958} {"train_loss": -5.579022407531738, "global_step": 40265, "epoch": 958} {"train_loss": -5.6308393478393555, "global_step": 40266, "epoch": 958} {"train_loss": -5.628002643585205, "global_step": 40267, "epoch": 958} {"train_loss": -5.683264255523682, "global_step": 40268, "epoch": 958} {"train_loss": -5.614070892333984, "global_step": 40269, "epoch": 958} {"train_loss": -5.742493152618408, "global_step": 40270, "epoch": 958} {"train_loss": -5.744537353515625, "global_step": 40271, "epoch": 958} {"train_loss": -5.562711715698242, "global_step": 40272, "epoch": 958} {"train_loss": -5.569425582885742, "global_step": 40273, "epoch": 958} {"train_loss": -5.5595598220825195, "global_step": 40274, "epoch": 958} {"train_loss": -5.652803421020508, "global_step": 40275, "epoch": 958} {"train_loss": -5.666196823120117, "global_step": 40276, "epoch": 958} {"train_loss": -5.606310901187715, "global_step": 40277, "epoch": 958, "val_loss": 65980.9140625} {"train_loss": -5.515777111053467, "global_step": 40278, "epoch": 959} {"train_loss": -5.733859062194824, "global_step": 40279, "epoch": 959} {"train_loss": -5.64145565032959, "global_step": 40280, "epoch": 959} {"train_loss": -5.648997783660889, "global_step": 40281, "epoch": 959} {"train_loss": -5.551792144775391, "global_step": 40282, "epoch": 959} {"train_loss": -5.7377519607543945, "global_step": 40283, "epoch": 959} {"train_loss": -5.599799156188965, "global_step": 40284, "epoch": 959} {"train_loss": -5.599855899810791, "global_step": 40285, "epoch": 959} {"train_loss": -5.557480812072754, "global_step": 40286, "epoch": 959} {"train_loss": -5.709357261657715, "global_step": 40287, "epoch": 959} {"train_loss": -5.653939247131348, "global_step": 40288, "epoch": 959} {"train_loss": -5.4806718826293945, "global_step": 40289, "epoch": 959} {"train_loss": -5.635562896728516, "global_step": 40290, "epoch": 959} {"train_loss": -5.603151798248291, "global_step": 40291, "epoch": 959} {"train_loss": -5.478855133056641, "global_step": 40292, "epoch": 959} {"train_loss": -5.677157878875732, "global_step": 40293, "epoch": 959} {"train_loss": -5.37786865234375, "global_step": 40294, "epoch": 959} {"train_loss": -5.57615852355957, "global_step": 40295, "epoch": 959} {"train_loss": -5.495277404785156, "global_step": 40296, "epoch": 959} {"train_loss": -5.605535984039307, "global_step": 40297, "epoch": 959} {"train_loss": -5.642289161682129, "global_step": 40298, "epoch": 959} {"train_loss": -5.559990882873535, "global_step": 40299, "epoch": 959} {"train_loss": -5.566557884216309, "global_step": 40300, "epoch": 959} {"train_loss": -5.5823822021484375, "global_step": 40301, "epoch": 959} {"train_loss": -5.5991291999816895, "global_step": 40302, "epoch": 959} {"train_loss": -5.634439945220947, "global_step": 40303, "epoch": 959} {"train_loss": -5.521611213684082, "global_step": 40304, "epoch": 959} {"train_loss": -5.621960639953613, "global_step": 40305, "epoch": 959} {"train_loss": -5.667012691497803, "global_step": 40306, "epoch": 959} {"train_loss": -5.530057907104492, "global_step": 40307, "epoch": 959} {"train_loss": -5.663087844848633, "global_step": 40308, "epoch": 959} {"train_loss": -5.778596878051758, "global_step": 40309, "epoch": 959} {"train_loss": -5.484758377075195, "global_step": 40310, "epoch": 959} {"train_loss": -5.636066913604736, "global_step": 40311, "epoch": 959} {"train_loss": -5.675610065460205, "global_step": 40312, "epoch": 959} {"train_loss": -5.692687034606934, "global_step": 40313, "epoch": 959} {"train_loss": -5.652547359466553, "global_step": 40314, "epoch": 959} {"train_loss": -5.7392168045043945, "global_step": 40315, "epoch": 959} {"train_loss": -5.6111063957214355, "global_step": 40316, "epoch": 959} {"train_loss": -5.692939758300781, "global_step": 40317, "epoch": 959} {"train_loss": -5.6407599449157715, "global_step": 40318, "epoch": 959} {"train_loss": -5.6112527052561445, "global_step": 40319, "epoch": 959, "val_loss": 65997.1875} {"train_loss": -5.649571895599365, "global_step": 40320, "epoch": 960} {"train_loss": -5.720612525939941, "global_step": 40321, "epoch": 960} {"train_loss": -5.670178413391113, "global_step": 40322, "epoch": 960} {"train_loss": -5.581901550292969, "global_step": 40323, "epoch": 960} {"train_loss": -5.784379959106445, "global_step": 40324, "epoch": 960} {"train_loss": -5.718354225158691, "global_step": 40325, "epoch": 960} {"train_loss": -5.578946113586426, "global_step": 40326, "epoch": 960} {"train_loss": -5.624488830566406, "global_step": 40327, "epoch": 960} {"train_loss": -5.794818878173828, "global_step": 40328, "epoch": 960} {"train_loss": -5.615195274353027, "global_step": 40329, "epoch": 960} {"train_loss": -5.657873153686523, "global_step": 40330, "epoch": 960} {"train_loss": -5.504683494567871, "global_step": 40331, "epoch": 960} {"train_loss": -5.557945728302002, "global_step": 40332, "epoch": 960} {"train_loss": -5.669323921203613, "global_step": 40333, "epoch": 960} {"train_loss": -5.604469299316406, "global_step": 40334, "epoch": 960} {"train_loss": -5.6400909423828125, "global_step": 40335, "epoch": 960} {"train_loss": -5.573182106018066, "global_step": 40336, "epoch": 960} {"train_loss": -5.604315280914307, "global_step": 40337, "epoch": 960} {"train_loss": -5.672920227050781, "global_step": 40338, "epoch": 960} {"train_loss": -5.807764053344727, "global_step": 40339, "epoch": 960} {"train_loss": -5.611297607421875, "global_step": 40340, "epoch": 960} {"train_loss": -5.571688652038574, "global_step": 40341, "epoch": 960} {"train_loss": -5.751195907592773, "global_step": 40342, "epoch": 960} {"train_loss": -5.7608723640441895, "global_step": 40343, "epoch": 960} {"train_loss": -5.6892781257629395, "global_step": 40344, "epoch": 960} {"train_loss": -5.548290252685547, "global_step": 40345, "epoch": 960} {"train_loss": -5.557373523712158, "global_step": 40346, "epoch": 960} {"train_loss": -5.641799449920654, "global_step": 40347, "epoch": 960} {"train_loss": -5.6952056884765625, "global_step": 40348, "epoch": 960} {"train_loss": -5.7610931396484375, "global_step": 40349, "epoch": 960} {"train_loss": -5.638298511505127, "global_step": 40350, "epoch": 960} {"train_loss": -5.696566104888916, "global_step": 40351, "epoch": 960} {"train_loss": -5.684627532958984, "global_step": 40352, "epoch": 960} {"train_loss": -5.632342338562012, "global_step": 40353, "epoch": 960} {"train_loss": -5.480258941650391, "global_step": 40354, "epoch": 960} {"train_loss": -5.658629894256592, "global_step": 40355, "epoch": 960} {"train_loss": -5.669187545776367, "global_step": 40356, "epoch": 960} {"train_loss": -5.620823860168457, "global_step": 40357, "epoch": 960} {"train_loss": -5.467555046081543, "global_step": 40358, "epoch": 960} {"train_loss": -5.626510143280029, "global_step": 40359, "epoch": 960} {"train_loss": -5.557357311248779, "global_step": 40360, "epoch": 960} {"train_loss": -5.640987566539219, "global_step": 40361, "epoch": 960, "val_loss": 66002.1640625} {"train_loss": -5.542984485626221, "global_step": 40362, "epoch": 961} {"train_loss": -5.552884101867676, "global_step": 40363, "epoch": 961} {"train_loss": -5.546029567718506, "global_step": 40364, "epoch": 961} {"train_loss": -5.688302040100098, "global_step": 40365, "epoch": 961} {"train_loss": -5.564937591552734, "global_step": 40366, "epoch": 961} {"train_loss": -5.637152671813965, "global_step": 40367, "epoch": 961} {"train_loss": -5.593832492828369, "global_step": 40368, "epoch": 961} {"train_loss": -5.640610694885254, "global_step": 40369, "epoch": 961} {"train_loss": -5.528332233428955, "global_step": 40370, "epoch": 961} {"train_loss": -5.776854991912842, "global_step": 40371, "epoch": 961} {"train_loss": -5.625214576721191, "global_step": 40372, "epoch": 961} {"train_loss": -5.591561317443848, "global_step": 40373, "epoch": 961} {"train_loss": -5.662339210510254, "global_step": 40374, "epoch": 961} {"train_loss": -5.625585556030273, "global_step": 40375, "epoch": 961} {"train_loss": -5.654274940490723, "global_step": 40376, "epoch": 961} {"train_loss": -5.571364402770996, "global_step": 40377, "epoch": 961} {"train_loss": -5.564697265625, "global_step": 40378, "epoch": 961} {"train_loss": -5.604736804962158, "global_step": 40379, "epoch": 961} {"train_loss": -5.52410888671875, "global_step": 40380, "epoch": 961} {"train_loss": -5.655787467956543, "global_step": 40381, "epoch": 961} {"train_loss": -5.738501071929932, "global_step": 40382, "epoch": 961} {"train_loss": -5.701098442077637, "global_step": 40383, "epoch": 961} {"train_loss": -5.6125617027282715, "global_step": 40384, "epoch": 961} {"train_loss": -5.7226972579956055, "global_step": 40385, "epoch": 961} {"train_loss": -5.667637825012207, "global_step": 40386, "epoch": 961} {"train_loss": -5.622689723968506, "global_step": 40387, "epoch": 961} {"train_loss": -5.644514083862305, "global_step": 40388, "epoch": 961} {"train_loss": -5.719145774841309, "global_step": 40389, "epoch": 961} {"train_loss": -5.52912712097168, "global_step": 40390, "epoch": 961} {"train_loss": -5.573858737945557, "global_step": 40391, "epoch": 961} {"train_loss": -5.611922264099121, "global_step": 40392, "epoch": 961} {"train_loss": -5.5807976722717285, "global_step": 40393, "epoch": 961} {"train_loss": -5.573879718780518, "global_step": 40394, "epoch": 961} {"train_loss": -5.6309099197387695, "global_step": 40395, "epoch": 961} {"train_loss": -5.601423263549805, "global_step": 40396, "epoch": 961} {"train_loss": -5.633639335632324, "global_step": 40397, "epoch": 961} {"train_loss": -5.631956100463867, "global_step": 40398, "epoch": 961} {"train_loss": -5.648947715759277, "global_step": 40399, "epoch": 961} {"train_loss": -5.6702141761779785, "global_step": 40400, "epoch": 961} {"train_loss": -5.516076564788818, "global_step": 40401, "epoch": 961} {"train_loss": -5.607892990112305, "global_step": 40402, "epoch": 961} {"train_loss": -5.619714839117868, "global_step": 40403, "epoch": 961, "val_loss": 66072.2890625} {"train_loss": -5.564387798309326, "global_step": 40404, "epoch": 962} {"train_loss": -5.662457466125488, "global_step": 40405, "epoch": 962} {"train_loss": -5.469354629516602, "global_step": 40406, "epoch": 962} {"train_loss": -5.758133888244629, "global_step": 40407, "epoch": 962} {"train_loss": -5.754306793212891, "global_step": 40408, "epoch": 962} {"train_loss": -5.674638748168945, "global_step": 40409, "epoch": 962} {"train_loss": -5.677196025848389, "global_step": 40410, "epoch": 962} {"train_loss": -5.661012172698975, "global_step": 40411, "epoch": 962} {"train_loss": -5.585695266723633, "global_step": 40412, "epoch": 962} {"train_loss": -5.601652145385742, "global_step": 40413, "epoch": 962} {"train_loss": -5.588523864746094, "global_step": 40414, "epoch": 962} {"train_loss": -5.819056510925293, "global_step": 40415, "epoch": 962} {"train_loss": -5.719510078430176, "global_step": 40416, "epoch": 962} {"train_loss": -5.577383518218994, "global_step": 40417, "epoch": 962} {"train_loss": -5.5669169425964355, "global_step": 40418, "epoch": 962} {"train_loss": -5.781835556030273, "global_step": 40419, "epoch": 962} {"train_loss": -5.760876178741455, "global_step": 40420, "epoch": 962} {"train_loss": -5.682892799377441, "global_step": 40421, "epoch": 962} {"train_loss": -5.6419477462768555, "global_step": 40422, "epoch": 962} {"train_loss": -5.566984176635742, "global_step": 40423, "epoch": 962} {"train_loss": -5.681095123291016, "global_step": 40424, "epoch": 962} {"train_loss": -5.594120979309082, "global_step": 40425, "epoch": 962} {"train_loss": -5.617476940155029, "global_step": 40426, "epoch": 962} {"train_loss": -5.741708278656006, "global_step": 40427, "epoch": 962} {"train_loss": -5.479608535766602, "global_step": 40428, "epoch": 962} {"train_loss": -5.561529636383057, "global_step": 40429, "epoch": 962} {"train_loss": -5.567666053771973, "global_step": 40430, "epoch": 962} {"train_loss": -5.710567474365234, "global_step": 40431, "epoch": 962} {"train_loss": -5.774165153503418, "global_step": 40432, "epoch": 962} {"train_loss": -5.481804847717285, "global_step": 40433, "epoch": 962} {"train_loss": -5.598974227905273, "global_step": 40434, "epoch": 962} {"train_loss": -5.601826190948486, "global_step": 40435, "epoch": 962} {"train_loss": -5.521635055541992, "global_step": 40436, "epoch": 962} {"train_loss": -5.708680152893066, "global_step": 40437, "epoch": 962} {"train_loss": -5.585141181945801, "global_step": 40438, "epoch": 962} {"train_loss": -5.592276573181152, "global_step": 40439, "epoch": 962} {"train_loss": -5.42565393447876, "global_step": 40440, "epoch": 962} {"train_loss": -5.60841178894043, "global_step": 40441, "epoch": 962} {"train_loss": -5.502325057983398, "global_step": 40442, "epoch": 962} {"train_loss": -5.650707244873047, "global_step": 40443, "epoch": 962} {"train_loss": -5.582952499389648, "global_step": 40444, "epoch": 962} {"train_loss": -5.62542910802932, "global_step": 40445, "epoch": 962, "val_loss": 66763.78125} {"train_loss": -5.687374114990234, "global_step": 40446, "epoch": 963} {"train_loss": -5.526376724243164, "global_step": 40447, "epoch": 963} {"train_loss": -5.707940101623535, "global_step": 40448, "epoch": 963} {"train_loss": -5.635128021240234, "global_step": 40449, "epoch": 963} {"train_loss": -5.506685256958008, "global_step": 40450, "epoch": 963} {"train_loss": -5.622763156890869, "global_step": 40451, "epoch": 963} {"train_loss": -5.679618835449219, "global_step": 40452, "epoch": 963} {"train_loss": -5.606447696685791, "global_step": 40453, "epoch": 963} {"train_loss": -5.704990386962891, "global_step": 40454, "epoch": 963} {"train_loss": -5.600691795349121, "global_step": 40455, "epoch": 963} {"train_loss": -5.763461112976074, "global_step": 40456, "epoch": 963} {"train_loss": -5.723291397094727, "global_step": 40457, "epoch": 963} {"train_loss": -5.6514892578125, "global_step": 40458, "epoch": 963} {"train_loss": -5.659246921539307, "global_step": 40459, "epoch": 963} {"train_loss": -5.505904197692871, "global_step": 40460, "epoch": 963} {"train_loss": -5.664527893066406, "global_step": 40461, "epoch": 963} {"train_loss": -5.696928024291992, "global_step": 40462, "epoch": 963} {"train_loss": -5.683244705200195, "global_step": 40463, "epoch": 963} {"train_loss": -5.61064338684082, "global_step": 40464, "epoch": 963} {"train_loss": -5.6302900314331055, "global_step": 40465, "epoch": 963} {"train_loss": -5.6259965896606445, "global_step": 40466, "epoch": 963} {"train_loss": -5.644329071044922, "global_step": 40467, "epoch": 963} {"train_loss": -5.692079544067383, "global_step": 40468, "epoch": 963} {"train_loss": -5.742194652557373, "global_step": 40469, "epoch": 963} {"train_loss": -5.6663737297058105, "global_step": 40470, "epoch": 963} {"train_loss": -5.709217071533203, "global_step": 40471, "epoch": 963} {"train_loss": -5.760928630828857, "global_step": 40472, "epoch": 963} {"train_loss": -5.6998419761657715, "global_step": 40473, "epoch": 963} {"train_loss": -5.666657447814941, "global_step": 40474, "epoch": 963} {"train_loss": -5.644748687744141, "global_step": 40475, "epoch": 963} {"train_loss": -5.542689323425293, "global_step": 40476, "epoch": 963} {"train_loss": -5.645386695861816, "global_step": 40477, "epoch": 963} {"train_loss": -5.535454750061035, "global_step": 40478, "epoch": 963} {"train_loss": -5.68307638168335, "global_step": 40479, "epoch": 963} {"train_loss": -5.651667594909668, "global_step": 40480, "epoch": 963} {"train_loss": -5.697811126708984, "global_step": 40481, "epoch": 963} {"train_loss": -5.88395881652832, "global_step": 40482, "epoch": 963} {"train_loss": -5.704551696777344, "global_step": 40483, "epoch": 963} {"train_loss": -5.5425028800964355, "global_step": 40484, "epoch": 963} {"train_loss": -5.706060886383057, "global_step": 40485, "epoch": 963} {"train_loss": -5.650824546813965, "global_step": 40486, "epoch": 963} {"train_loss": -5.657200029918125, "global_step": 40487, "epoch": 963, "val_loss": 66022.53125} {"train_loss": -5.606164932250977, "global_step": 40488, "epoch": 964} {"train_loss": -5.597171306610107, "global_step": 40489, "epoch": 964} {"train_loss": -5.585657119750977, "global_step": 40490, "epoch": 964} {"train_loss": -5.739767551422119, "global_step": 40491, "epoch": 964} {"train_loss": -5.616100311279297, "global_step": 40492, "epoch": 964} {"train_loss": -5.614600658416748, "global_step": 40493, "epoch": 964} {"train_loss": -5.676015853881836, "global_step": 40494, "epoch": 964} {"train_loss": -5.734268665313721, "global_step": 40495, "epoch": 964} {"train_loss": -5.747307777404785, "global_step": 40496, "epoch": 964} {"train_loss": -5.535409927368164, "global_step": 40497, "epoch": 964} {"train_loss": -5.535635471343994, "global_step": 40498, "epoch": 964} {"train_loss": -5.644484519958496, "global_step": 40499, "epoch": 964} {"train_loss": -5.672811508178711, "global_step": 40500, "epoch": 964} {"train_loss": -5.654717445373535, "global_step": 40501, "epoch": 964} {"train_loss": -5.67451286315918, "global_step": 40502, "epoch": 964} {"train_loss": -5.705835819244385, "global_step": 40503, "epoch": 964} {"train_loss": -5.473931312561035, "global_step": 40504, "epoch": 964} {"train_loss": -5.608936309814453, "global_step": 40505, "epoch": 964} {"train_loss": -5.543148994445801, "global_step": 40506, "epoch": 964} {"train_loss": -5.664463996887207, "global_step": 40507, "epoch": 964} {"train_loss": -5.5950727462768555, "global_step": 40508, "epoch": 964} {"train_loss": -5.586809158325195, "global_step": 40509, "epoch": 964} {"train_loss": -5.730186462402344, "global_step": 40510, "epoch": 964} {"train_loss": -5.69180965423584, "global_step": 40511, "epoch": 964} {"train_loss": -5.666583061218262, "global_step": 40512, "epoch": 964} {"train_loss": -5.682887554168701, "global_step": 40513, "epoch": 964} {"train_loss": -5.749752998352051, "global_step": 40514, "epoch": 964} {"train_loss": -5.6529130935668945, "global_step": 40515, "epoch": 964} {"train_loss": -5.603327751159668, "global_step": 40516, "epoch": 964} {"train_loss": -5.557836532592773, "global_step": 40517, "epoch": 964} {"train_loss": -5.619715690612793, "global_step": 40518, "epoch": 964} {"train_loss": -5.625766754150391, "global_step": 40519, "epoch": 964} {"train_loss": -5.7652082443237305, "global_step": 40520, "epoch": 964} {"train_loss": -5.56280517578125, "global_step": 40521, "epoch": 964} {"train_loss": -5.522128582000732, "global_step": 40522, "epoch": 964} {"train_loss": -5.754788398742676, "global_step": 40523, "epoch": 964} {"train_loss": -5.553927421569824, "global_step": 40524, "epoch": 964} {"train_loss": -5.535269737243652, "global_step": 40525, "epoch": 964} {"train_loss": -5.649654388427734, "global_step": 40526, "epoch": 964} {"train_loss": -5.6211066246032715, "global_step": 40527, "epoch": 964} {"train_loss": -5.7071533203125, "global_step": 40528, "epoch": 964} {"train_loss": -5.635892720449538, "global_step": 40529, "epoch": 964, "val_loss": 65882.625} {"train_loss": -5.620697021484375, "global_step": 40530, "epoch": 965} {"train_loss": -5.578175067901611, "global_step": 40531, "epoch": 965} {"train_loss": -5.4603071212768555, "global_step": 40532, "epoch": 965} {"train_loss": -5.6635236740112305, "global_step": 40533, "epoch": 965} {"train_loss": -5.671520233154297, "global_step": 40534, "epoch": 965} {"train_loss": -5.670661926269531, "global_step": 40535, "epoch": 965} {"train_loss": -5.739391326904297, "global_step": 40536, "epoch": 965} {"train_loss": -5.624358654022217, "global_step": 40537, "epoch": 965} {"train_loss": -5.568892478942871, "global_step": 40538, "epoch": 965} {"train_loss": -5.611774921417236, "global_step": 40539, "epoch": 965} {"train_loss": -5.5845112800598145, "global_step": 40540, "epoch": 965} {"train_loss": -5.639369964599609, "global_step": 40541, "epoch": 965} {"train_loss": -5.654750347137451, "global_step": 40542, "epoch": 965} {"train_loss": -5.6461076736450195, "global_step": 40543, "epoch": 965} {"train_loss": -5.583624839782715, "global_step": 40544, "epoch": 965} {"train_loss": -5.590785980224609, "global_step": 40545, "epoch": 965} {"train_loss": -5.762504577636719, "global_step": 40546, "epoch": 965} {"train_loss": -5.655631065368652, "global_step": 40547, "epoch": 965} {"train_loss": -5.616949558258057, "global_step": 40548, "epoch": 965} {"train_loss": -5.63115119934082, "global_step": 40549, "epoch": 965} {"train_loss": -5.579039573669434, "global_step": 40550, "epoch": 965} {"train_loss": -5.746708869934082, "global_step": 40551, "epoch": 965} {"train_loss": -5.648406982421875, "global_step": 40552, "epoch": 965} {"train_loss": -5.458437442779541, "global_step": 40553, "epoch": 965} {"train_loss": -5.53095817565918, "global_step": 40554, "epoch": 965} {"train_loss": -5.8100738525390625, "global_step": 40555, "epoch": 965} {"train_loss": -5.361984729766846, "global_step": 40556, "epoch": 965} {"train_loss": -5.606513023376465, "global_step": 40557, "epoch": 965} {"train_loss": -5.485886573791504, "global_step": 40558, "epoch": 965} {"train_loss": -5.52392053604126, "global_step": 40559, "epoch": 965} {"train_loss": -5.471894264221191, "global_step": 40560, "epoch": 965} {"train_loss": -5.581546783447266, "global_step": 40561, "epoch": 965} {"train_loss": -5.582830429077148, "global_step": 40562, "epoch": 965} {"train_loss": -5.610512733459473, "global_step": 40563, "epoch": 965} {"train_loss": -5.624255657196045, "global_step": 40564, "epoch": 965} {"train_loss": -5.656905174255371, "global_step": 40565, "epoch": 965} {"train_loss": -5.536004543304443, "global_step": 40566, "epoch": 965} {"train_loss": -5.6184916496276855, "global_step": 40567, "epoch": 965} {"train_loss": -5.583909511566162, "global_step": 40568, "epoch": 965} {"train_loss": -5.587961673736572, "global_step": 40569, "epoch": 965} {"train_loss": -5.572994709014893, "global_step": 40570, "epoch": 965} {"train_loss": -5.603791622888474, "global_step": 40571, "epoch": 965, "val_loss": 66560.3515625} {"train_loss": -5.629787445068359, "global_step": 40572, "epoch": 966} {"train_loss": -5.570122241973877, "global_step": 40573, "epoch": 966} {"train_loss": -5.577436447143555, "global_step": 40574, "epoch": 966} {"train_loss": -5.578969478607178, "global_step": 40575, "epoch": 966} {"train_loss": -5.502847671508789, "global_step": 40576, "epoch": 966} {"train_loss": -5.618931770324707, "global_step": 40577, "epoch": 966} {"train_loss": -5.512101173400879, "global_step": 40578, "epoch": 966} {"train_loss": -5.6138787269592285, "global_step": 40579, "epoch": 966} {"train_loss": -5.531261920928955, "global_step": 40580, "epoch": 966} {"train_loss": -5.582236289978027, "global_step": 40581, "epoch": 966} {"train_loss": -5.622351169586182, "global_step": 40582, "epoch": 966} {"train_loss": -5.492671012878418, "global_step": 40583, "epoch": 966} {"train_loss": -5.684578895568848, "global_step": 40584, "epoch": 966} {"train_loss": -5.524750232696533, "global_step": 40585, "epoch": 966} {"train_loss": -5.622165203094482, "global_step": 40586, "epoch": 966} {"train_loss": -5.620573043823242, "global_step": 40587, "epoch": 966} {"train_loss": -5.595736503601074, "global_step": 40588, "epoch": 966} {"train_loss": -5.502182483673096, "global_step": 40589, "epoch": 966} {"train_loss": -5.569445610046387, "global_step": 40590, "epoch": 966} {"train_loss": -5.5421905517578125, "global_step": 40591, "epoch": 966} {"train_loss": -5.558144569396973, "global_step": 40592, "epoch": 966} {"train_loss": -5.707084655761719, "global_step": 40593, "epoch": 966} {"train_loss": -5.5461955070495605, "global_step": 40594, "epoch": 966} {"train_loss": -5.5337629318237305, "global_step": 40595, "epoch": 966} {"train_loss": -5.618376731872559, "global_step": 40596, "epoch": 966} {"train_loss": -5.519484996795654, "global_step": 40597, "epoch": 966} {"train_loss": -5.650254249572754, "global_step": 40598, "epoch": 966} {"train_loss": -5.530711650848389, "global_step": 40599, "epoch": 966} {"train_loss": -5.669162750244141, "global_step": 40600, "epoch": 966} {"train_loss": -5.590915203094482, "global_step": 40601, "epoch": 966} {"train_loss": -5.633023262023926, "global_step": 40602, "epoch": 966} {"train_loss": -5.725176811218262, "global_step": 40603, "epoch": 966} {"train_loss": -5.613318920135498, "global_step": 40604, "epoch": 966} {"train_loss": -5.749970436096191, "global_step": 40605, "epoch": 966} {"train_loss": -5.690670013427734, "global_step": 40606, "epoch": 966} {"train_loss": -5.565410614013672, "global_step": 40607, "epoch": 966} {"train_loss": -5.4854559898376465, "global_step": 40608, "epoch": 966} {"train_loss": -5.6353840827941895, "global_step": 40609, "epoch": 966} {"train_loss": -5.609346389770508, "global_step": 40610, "epoch": 966} {"train_loss": -5.661341667175293, "global_step": 40611, "epoch": 966} {"train_loss": -5.523205757141113, "global_step": 40612, "epoch": 966} {"train_loss": -5.5937743414016, "global_step": 40613, "epoch": 966, "val_loss": 65984.8359375} {"train_loss": -5.684688568115234, "global_step": 40614, "epoch": 967} {"train_loss": -5.714068412780762, "global_step": 40615, "epoch": 967} {"train_loss": -5.567641735076904, "global_step": 40616, "epoch": 967} {"train_loss": -5.562332630157471, "global_step": 40617, "epoch": 967} {"train_loss": -5.60347843170166, "global_step": 40618, "epoch": 967} {"train_loss": -5.630064010620117, "global_step": 40619, "epoch": 967} {"train_loss": -5.554948806762695, "global_step": 40620, "epoch": 967} {"train_loss": -5.589053153991699, "global_step": 40621, "epoch": 967} {"train_loss": -5.6334638595581055, "global_step": 40622, "epoch": 967} {"train_loss": -5.555855751037598, "global_step": 40623, "epoch": 967} {"train_loss": -5.650118827819824, "global_step": 40624, "epoch": 967} {"train_loss": -5.638455390930176, "global_step": 40625, "epoch": 967} {"train_loss": -5.701028823852539, "global_step": 40626, "epoch": 967} {"train_loss": -5.606449127197266, "global_step": 40627, "epoch": 967} {"train_loss": -5.773294448852539, "global_step": 40628, "epoch": 967} {"train_loss": -5.631290435791016, "global_step": 40629, "epoch": 967} {"train_loss": -5.551534175872803, "global_step": 40630, "epoch": 967} {"train_loss": -5.58222770690918, "global_step": 40631, "epoch": 967} {"train_loss": -5.629199028015137, "global_step": 40632, "epoch": 967} {"train_loss": -5.656652927398682, "global_step": 40633, "epoch": 967} {"train_loss": -5.699413776397705, "global_step": 40634, "epoch": 967} {"train_loss": -5.689604759216309, "global_step": 40635, "epoch": 967} {"train_loss": -5.758187294006348, "global_step": 40636, "epoch": 967} {"train_loss": -5.689734935760498, "global_step": 40637, "epoch": 967} {"train_loss": -5.68501091003418, "global_step": 40638, "epoch": 967} {"train_loss": -5.723684787750244, "global_step": 40639, "epoch": 967} {"train_loss": -5.699062347412109, "global_step": 40640, "epoch": 967} {"train_loss": -5.646816253662109, "global_step": 40641, "epoch": 967} {"train_loss": -5.54538631439209, "global_step": 40642, "epoch": 967} {"train_loss": -5.612032890319824, "global_step": 40643, "epoch": 967} {"train_loss": -5.573891639709473, "global_step": 40644, "epoch": 967} {"train_loss": -5.673013687133789, "global_step": 40645, "epoch": 967} {"train_loss": -5.758030414581299, "global_step": 40646, "epoch": 967} {"train_loss": -5.623686790466309, "global_step": 40647, "epoch": 967} {"train_loss": -5.549165725708008, "global_step": 40648, "epoch": 967} {"train_loss": -5.614201068878174, "global_step": 40649, "epoch": 967} {"train_loss": -5.568719863891602, "global_step": 40650, "epoch": 967} {"train_loss": -5.642982482910156, "global_step": 40651, "epoch": 967} {"train_loss": -5.6524553298950195, "global_step": 40652, "epoch": 967} {"train_loss": -5.604611873626709, "global_step": 40653, "epoch": 967} {"train_loss": -5.696679592132568, "global_step": 40654, "epoch": 967} {"train_loss": -5.638601836704073, "global_step": 40655, "epoch": 967, "val_loss": 65821.171875} {"train_loss": -5.701270580291748, "global_step": 40656, "epoch": 968} {"train_loss": -5.684709548950195, "global_step": 40657, "epoch": 968} {"train_loss": -5.640589714050293, "global_step": 40658, "epoch": 968} {"train_loss": -5.582271099090576, "global_step": 40659, "epoch": 968} {"train_loss": -5.723982810974121, "global_step": 40660, "epoch": 968} {"train_loss": -5.568051815032959, "global_step": 40661, "epoch": 968} {"train_loss": -5.556130409240723, "global_step": 40662, "epoch": 968} {"train_loss": -5.572944164276123, "global_step": 40663, "epoch": 968} {"train_loss": -5.645730495452881, "global_step": 40664, "epoch": 968} {"train_loss": -5.637457847595215, "global_step": 40665, "epoch": 968} {"train_loss": -5.631190299987793, "global_step": 40666, "epoch": 968} {"train_loss": -5.6312689781188965, "global_step": 40667, "epoch": 968} {"train_loss": -5.646994113922119, "global_step": 40668, "epoch": 968} {"train_loss": -5.632137298583984, "global_step": 40669, "epoch": 968} {"train_loss": -5.614644527435303, "global_step": 40670, "epoch": 968} {"train_loss": -5.480256080627441, "global_step": 40671, "epoch": 968} {"train_loss": -5.544949531555176, "global_step": 40672, "epoch": 968} {"train_loss": -5.6721343994140625, "global_step": 40673, "epoch": 968} {"train_loss": -5.6256208419799805, "global_step": 40674, "epoch": 968} {"train_loss": -5.608432769775391, "global_step": 40675, "epoch": 968} {"train_loss": -5.697274684906006, "global_step": 40676, "epoch": 968} {"train_loss": -5.558272361755371, "global_step": 40677, "epoch": 968} {"train_loss": -5.688665390014648, "global_step": 40678, "epoch": 968} {"train_loss": -5.636320114135742, "global_step": 40679, "epoch": 968} {"train_loss": -5.459966659545898, "global_step": 40680, "epoch": 968} {"train_loss": -5.616293907165527, "global_step": 40681, "epoch": 968} {"train_loss": -5.721468925476074, "global_step": 40682, "epoch": 968} {"train_loss": -5.5276055335998535, "global_step": 40683, "epoch": 968} {"train_loss": -5.690774917602539, "global_step": 40684, "epoch": 968} {"train_loss": -5.635519981384277, "global_step": 40685, "epoch": 968} {"train_loss": -5.659604072570801, "global_step": 40686, "epoch": 968} {"train_loss": -5.612800598144531, "global_step": 40687, "epoch": 968} {"train_loss": -5.4181318283081055, "global_step": 40688, "epoch": 968} {"train_loss": -5.580159664154053, "global_step": 40689, "epoch": 968} {"train_loss": -5.6262736320495605, "global_step": 40690, "epoch": 968} {"train_loss": -5.619412422180176, "global_step": 40691, "epoch": 968} {"train_loss": -5.607706069946289, "global_step": 40692, "epoch": 968} {"train_loss": -5.603283882141113, "global_step": 40693, "epoch": 968} {"train_loss": -5.664438247680664, "global_step": 40694, "epoch": 968} {"train_loss": -5.5677170753479, "global_step": 40695, "epoch": 968} {"train_loss": -5.723344326019287, "global_step": 40696, "epoch": 968} {"train_loss": -5.620230583917527, "global_step": 40697, "epoch": 968, "val_loss": 66639.2734375} {"train_loss": -5.63559627532959, "global_step": 40698, "epoch": 969} {"train_loss": -5.64572811126709, "global_step": 40699, "epoch": 969} {"train_loss": -5.679745674133301, "global_step": 40700, "epoch": 969} {"train_loss": -5.642838954925537, "global_step": 40701, "epoch": 969} {"train_loss": -5.667139053344727, "global_step": 40702, "epoch": 969} {"train_loss": -5.67453670501709, "global_step": 40703, "epoch": 969} {"train_loss": -5.649731636047363, "global_step": 40704, "epoch": 969} {"train_loss": -5.7770490646362305, "global_step": 40705, "epoch": 969} {"train_loss": -5.507377624511719, "global_step": 40706, "epoch": 969} {"train_loss": -5.644619941711426, "global_step": 40707, "epoch": 969} {"train_loss": -5.726273536682129, "global_step": 40708, "epoch": 969} {"train_loss": -5.703341007232666, "global_step": 40709, "epoch": 969} {"train_loss": -5.614169597625732, "global_step": 40710, "epoch": 969} {"train_loss": -5.650632858276367, "global_step": 40711, "epoch": 969} {"train_loss": -5.655982971191406, "global_step": 40712, "epoch": 969} {"train_loss": -5.781528472900391, "global_step": 40713, "epoch": 969} {"train_loss": -5.691789627075195, "global_step": 40714, "epoch": 969} {"train_loss": -5.759990215301514, "global_step": 40715, "epoch": 969} {"train_loss": -5.675698757171631, "global_step": 40716, "epoch": 969} {"train_loss": -5.56252908706665, "global_step": 40717, "epoch": 969} {"train_loss": -5.619410514831543, "global_step": 40718, "epoch": 969} {"train_loss": -5.594352722167969, "global_step": 40719, "epoch": 969} {"train_loss": -5.567602157592773, "global_step": 40720, "epoch": 969} {"train_loss": -5.791450500488281, "global_step": 40721, "epoch": 969} {"train_loss": -5.648916721343994, "global_step": 40722, "epoch": 969} {"train_loss": -5.652838230133057, "global_step": 40723, "epoch": 969} {"train_loss": -5.6239423751831055, "global_step": 40724, "epoch": 969} {"train_loss": -5.6702494621276855, "global_step": 40725, "epoch": 969} {"train_loss": -5.552772521972656, "global_step": 40726, "epoch": 969} {"train_loss": -5.527651786804199, "global_step": 40727, "epoch": 969} {"train_loss": -5.631671905517578, "global_step": 40728, "epoch": 969} {"train_loss": -5.634891510009766, "global_step": 40729, "epoch": 969} {"train_loss": -5.6641998291015625, "global_step": 40730, "epoch": 969} {"train_loss": -5.500235557556152, "global_step": 40731, "epoch": 969} {"train_loss": -5.641620635986328, "global_step": 40732, "epoch": 969} {"train_loss": -5.563693046569824, "global_step": 40733, "epoch": 969} {"train_loss": -5.636491775512695, "global_step": 40734, "epoch": 969} {"train_loss": -5.636279106140137, "global_step": 40735, "epoch": 969} {"train_loss": -5.49329137802124, "global_step": 40736, "epoch": 969} {"train_loss": -5.547957420349121, "global_step": 40737, "epoch": 969} {"train_loss": -5.653934955596924, "global_step": 40738, "epoch": 969} {"train_loss": -5.641076632908413, "global_step": 40739, "epoch": 969, "val_loss": 65955.234375} {"train_loss": -5.755327224731445, "global_step": 40740, "epoch": 970} {"train_loss": -5.698862075805664, "global_step": 40741, "epoch": 970} {"train_loss": -5.64339542388916, "global_step": 40742, "epoch": 970} {"train_loss": -5.659729957580566, "global_step": 40743, "epoch": 970} {"train_loss": -5.679807662963867, "global_step": 40744, "epoch": 970} {"train_loss": -5.7589263916015625, "global_step": 40745, "epoch": 970} {"train_loss": -5.59767484664917, "global_step": 40746, "epoch": 970} {"train_loss": -5.683030128479004, "global_step": 40747, "epoch": 970} {"train_loss": -5.658382892608643, "global_step": 40748, "epoch": 970} {"train_loss": -5.6251325607299805, "global_step": 40749, "epoch": 970} {"train_loss": -5.741486549377441, "global_step": 40750, "epoch": 970} {"train_loss": -5.629899024963379, "global_step": 40751, "epoch": 970} {"train_loss": -5.706130027770996, "global_step": 40752, "epoch": 970} {"train_loss": -5.638986110687256, "global_step": 40753, "epoch": 970} {"train_loss": -5.627696990966797, "global_step": 40754, "epoch": 970} {"train_loss": -5.562595367431641, "global_step": 40755, "epoch": 970} {"train_loss": -5.559812068939209, "global_step": 40756, "epoch": 970} {"train_loss": -5.636653900146484, "global_step": 40757, "epoch": 970} {"train_loss": -5.643614768981934, "global_step": 40758, "epoch": 970} {"train_loss": -5.659916877746582, "global_step": 40759, "epoch": 970} {"train_loss": -5.667606353759766, "global_step": 40760, "epoch": 970} {"train_loss": -5.628171920776367, "global_step": 40761, "epoch": 970} {"train_loss": -5.650464057922363, "global_step": 40762, "epoch": 970} {"train_loss": -5.696895599365234, "global_step": 40763, "epoch": 970} {"train_loss": -5.729898929595947, "global_step": 40764, "epoch": 970} {"train_loss": -5.541017532348633, "global_step": 40765, "epoch": 970} {"train_loss": -5.616802215576172, "global_step": 40766, "epoch": 970} {"train_loss": -5.612973213195801, "global_step": 40767, "epoch": 970} {"train_loss": -5.57051944732666, "global_step": 40768, "epoch": 970} {"train_loss": -5.677535057067871, "global_step": 40769, "epoch": 970} {"train_loss": -5.68095588684082, "global_step": 40770, "epoch": 970} {"train_loss": -5.631818771362305, "global_step": 40771, "epoch": 970} {"train_loss": -5.658625602722168, "global_step": 40772, "epoch": 970} {"train_loss": -5.780107021331787, "global_step": 40773, "epoch": 970} {"train_loss": -5.699933052062988, "global_step": 40774, "epoch": 970} {"train_loss": -5.600322246551514, "global_step": 40775, "epoch": 970} {"train_loss": -5.487295150756836, "global_step": 40776, "epoch": 970} {"train_loss": -5.562897682189941, "global_step": 40777, "epoch": 970} {"train_loss": -5.596705436706543, "global_step": 40778, "epoch": 970} {"train_loss": -5.630501747131348, "global_step": 40779, "epoch": 970} {"train_loss": -5.580334663391113, "global_step": 40780, "epoch": 970} {"train_loss": -5.641748201279413, "global_step": 40781, "epoch": 970, "val_loss": 66259.59375} {"train_loss": -5.56035852432251, "global_step": 40782, "epoch": 971} {"train_loss": -5.574515342712402, "global_step": 40783, "epoch": 971} {"train_loss": -5.5738725662231445, "global_step": 40784, "epoch": 971} {"train_loss": -5.678323745727539, "global_step": 40785, "epoch": 971} {"train_loss": -5.570690155029297, "global_step": 40786, "epoch": 971} {"train_loss": -5.516219139099121, "global_step": 40787, "epoch": 971} {"train_loss": -5.6419477462768555, "global_step": 40788, "epoch": 971} {"train_loss": -5.726052761077881, "global_step": 40789, "epoch": 971} {"train_loss": -5.672957420349121, "global_step": 40790, "epoch": 971} {"train_loss": -5.586499214172363, "global_step": 40791, "epoch": 971} {"train_loss": -5.82415246963501, "global_step": 40792, "epoch": 971} {"train_loss": -5.5461955070495605, "global_step": 40793, "epoch": 971} {"train_loss": -5.613844871520996, "global_step": 40794, "epoch": 971} {"train_loss": -5.554922103881836, "global_step": 40795, "epoch": 971} {"train_loss": -5.5920820236206055, "global_step": 40796, "epoch": 971} {"train_loss": -5.719232082366943, "global_step": 40797, "epoch": 971} {"train_loss": -5.623785018920898, "global_step": 40798, "epoch": 971} {"train_loss": -5.692325115203857, "global_step": 40799, "epoch": 971} {"train_loss": -5.669849395751953, "global_step": 40800, "epoch": 971} {"train_loss": -5.716037750244141, "global_step": 40801, "epoch": 971} {"train_loss": -5.580101490020752, "global_step": 40802, "epoch": 971} {"train_loss": -5.572556495666504, "global_step": 40803, "epoch": 971} {"train_loss": -5.532469749450684, "global_step": 40804, "epoch": 971} {"train_loss": -5.565676689147949, "global_step": 40805, "epoch": 971} {"train_loss": -5.669899940490723, "global_step": 40806, "epoch": 971} {"train_loss": -5.49250602722168, "global_step": 40807, "epoch": 971} {"train_loss": -5.496274948120117, "global_step": 40808, "epoch": 971} {"train_loss": -5.776165008544922, "global_step": 40809, "epoch": 971} {"train_loss": -5.633443832397461, "global_step": 40810, "epoch": 971} {"train_loss": -5.64768123626709, "global_step": 40811, "epoch": 971} {"train_loss": -5.674856185913086, "global_step": 40812, "epoch": 971} {"train_loss": -5.8597846031188965, "global_step": 40813, "epoch": 971} {"train_loss": -5.6375041007995605, "global_step": 40814, "epoch": 971} {"train_loss": -5.608912467956543, "global_step": 40815, "epoch": 971} {"train_loss": -5.623082160949707, "global_step": 40816, "epoch": 971} {"train_loss": -5.57121467590332, "global_step": 40817, "epoch": 971} {"train_loss": -5.558637619018555, "global_step": 40818, "epoch": 971} {"train_loss": -5.667394638061523, "global_step": 40819, "epoch": 971} {"train_loss": -5.644161224365234, "global_step": 40820, "epoch": 971} {"train_loss": -5.654730319976807, "global_step": 40821, "epoch": 971} {"train_loss": -5.619451522827148, "global_step": 40822, "epoch": 971} {"train_loss": -5.630002112615676, "global_step": 40823, "epoch": 971, "val_loss": 66343.2265625} {"train_loss": -5.597766876220703, "global_step": 40824, "epoch": 972} {"train_loss": -5.727597236633301, "global_step": 40825, "epoch": 972} {"train_loss": -5.545339584350586, "global_step": 40826, "epoch": 972} {"train_loss": -5.546742916107178, "global_step": 40827, "epoch": 972} {"train_loss": -5.688119888305664, "global_step": 40828, "epoch": 972} {"train_loss": -5.656078338623047, "global_step": 40829, "epoch": 972} {"train_loss": -5.714840888977051, "global_step": 40830, "epoch": 972} {"train_loss": -5.594665050506592, "global_step": 40831, "epoch": 972} {"train_loss": -5.678559303283691, "global_step": 40832, "epoch": 972} {"train_loss": -5.741274356842041, "global_step": 40833, "epoch": 972} {"train_loss": -5.69998836517334, "global_step": 40834, "epoch": 972} {"train_loss": -5.645116329193115, "global_step": 40835, "epoch": 972} {"train_loss": -5.735713005065918, "global_step": 40836, "epoch": 972} {"train_loss": -5.725167751312256, "global_step": 40837, "epoch": 972} {"train_loss": -5.639573574066162, "global_step": 40838, "epoch": 972} {"train_loss": -5.533995628356934, "global_step": 40839, "epoch": 972} {"train_loss": -5.555360794067383, "global_step": 40840, "epoch": 972} {"train_loss": -5.615789413452148, "global_step": 40841, "epoch": 972} {"train_loss": -5.626162528991699, "global_step": 40842, "epoch": 972} {"train_loss": -5.606689453125, "global_step": 40843, "epoch": 972} {"train_loss": -5.61032247543335, "global_step": 40844, "epoch": 972} {"train_loss": -5.573265552520752, "global_step": 40845, "epoch": 972} {"train_loss": -5.55937385559082, "global_step": 40846, "epoch": 972} {"train_loss": -5.488450527191162, "global_step": 40847, "epoch": 972} {"train_loss": -5.635116100311279, "global_step": 40848, "epoch": 972} {"train_loss": -5.566385269165039, "global_step": 40849, "epoch": 972} {"train_loss": -5.684108734130859, "global_step": 40850, "epoch": 972} {"train_loss": -5.585007667541504, "global_step": 40851, "epoch": 972} {"train_loss": -5.562840938568115, "global_step": 40852, "epoch": 972} {"train_loss": -5.739851951599121, "global_step": 40853, "epoch": 972} {"train_loss": -5.5241546630859375, "global_step": 40854, "epoch": 972} {"train_loss": -5.652927398681641, "global_step": 40855, "epoch": 972} {"train_loss": -5.533262729644775, "global_step": 40856, "epoch": 972} {"train_loss": -5.614832878112793, "global_step": 40857, "epoch": 972} {"train_loss": -5.544964790344238, "global_step": 40858, "epoch": 972} {"train_loss": -5.667757034301758, "global_step": 40859, "epoch": 972} {"train_loss": -5.720914840698242, "global_step": 40860, "epoch": 972} {"train_loss": -5.649408340454102, "global_step": 40861, "epoch": 972} {"train_loss": -5.622671127319336, "global_step": 40862, "epoch": 972} {"train_loss": -5.568283557891846, "global_step": 40863, "epoch": 972} {"train_loss": -5.654565334320068, "global_step": 40864, "epoch": 972} {"train_loss": -5.625323795136952, "global_step": 40865, "epoch": 972, "val_loss": 66519.5859375} {"train_loss": -5.580033779144287, "global_step": 40866, "epoch": 973} {"train_loss": -5.662779331207275, "global_step": 40867, "epoch": 973} {"train_loss": -5.598681926727295, "global_step": 40868, "epoch": 973} {"train_loss": -5.486642837524414, "global_step": 40869, "epoch": 973} {"train_loss": -5.619741439819336, "global_step": 40870, "epoch": 973} {"train_loss": -5.7450056076049805, "global_step": 40871, "epoch": 973} {"train_loss": -5.553086757659912, "global_step": 40872, "epoch": 973} {"train_loss": -5.431122779846191, "global_step": 40873, "epoch": 973} {"train_loss": -5.583158493041992, "global_step": 40874, "epoch": 973} {"train_loss": -5.566069602966309, "global_step": 40875, "epoch": 973} {"train_loss": -5.659204483032227, "global_step": 40876, "epoch": 973} {"train_loss": -5.562877655029297, "global_step": 40877, "epoch": 973} {"train_loss": -5.703272819519043, "global_step": 40878, "epoch": 973} {"train_loss": -5.724002838134766, "global_step": 40879, "epoch": 973} {"train_loss": -5.571833610534668, "global_step": 40880, "epoch": 973} {"train_loss": -5.6906328201293945, "global_step": 40881, "epoch": 973} {"train_loss": -5.6825666427612305, "global_step": 40882, "epoch": 973} {"train_loss": -5.64376163482666, "global_step": 40883, "epoch": 973} {"train_loss": -5.611295700073242, "global_step": 40884, "epoch": 973} {"train_loss": -5.618289470672607, "global_step": 40885, "epoch": 973} {"train_loss": -5.660083770751953, "global_step": 40886, "epoch": 973} {"train_loss": -5.751132965087891, "global_step": 40887, "epoch": 973} {"train_loss": -5.647964954376221, "global_step": 40888, "epoch": 973} {"train_loss": -5.657217502593994, "global_step": 40889, "epoch": 973} {"train_loss": -5.660259246826172, "global_step": 40890, "epoch": 973} {"train_loss": -5.560342788696289, "global_step": 40891, "epoch": 973} {"train_loss": -5.619566917419434, "global_step": 40892, "epoch": 973} {"train_loss": -5.569492340087891, "global_step": 40893, "epoch": 973} {"train_loss": -5.576616287231445, "global_step": 40894, "epoch": 973} {"train_loss": -5.66786527633667, "global_step": 40895, "epoch": 973} {"train_loss": -5.575116157531738, "global_step": 40896, "epoch": 973} {"train_loss": -5.664064884185791, "global_step": 40897, "epoch": 973} {"train_loss": -5.624986171722412, "global_step": 40898, "epoch": 973} {"train_loss": -5.679042816162109, "global_step": 40899, "epoch": 973} {"train_loss": -5.591688632965088, "global_step": 40900, "epoch": 973} {"train_loss": -5.589903831481934, "global_step": 40901, "epoch": 973} {"train_loss": -5.6083784103393555, "global_step": 40902, "epoch": 973} {"train_loss": -5.576061248779297, "global_step": 40903, "epoch": 973} {"train_loss": -5.757532119750977, "global_step": 40904, "epoch": 973} {"train_loss": -5.698559761047363, "global_step": 40905, "epoch": 973} {"train_loss": -5.5594563484191895, "global_step": 40906, "epoch": 973} {"train_loss": -5.622811294737316, "global_step": 40907, "epoch": 973, "val_loss": 65836.34375} {"train_loss": -5.50382137298584, "global_step": 40908, "epoch": 974} {"train_loss": -5.684678077697754, "global_step": 40909, "epoch": 974} {"train_loss": -5.712450981140137, "global_step": 40910, "epoch": 974} {"train_loss": -5.659232139587402, "global_step": 40911, "epoch": 974} {"train_loss": -5.67997932434082, "global_step": 40912, "epoch": 974} {"train_loss": -5.609752178192139, "global_step": 40913, "epoch": 974} {"train_loss": -5.625919342041016, "global_step": 40914, "epoch": 974} {"train_loss": -5.651308536529541, "global_step": 40915, "epoch": 974} {"train_loss": -5.5622477531433105, "global_step": 40916, "epoch": 974} {"train_loss": -5.677738189697266, "global_step": 40917, "epoch": 974} {"train_loss": -5.658123970031738, "global_step": 40918, "epoch": 974} {"train_loss": -5.598513126373291, "global_step": 40919, "epoch": 974} {"train_loss": -5.621295928955078, "global_step": 40920, "epoch": 974} {"train_loss": -5.4912824630737305, "global_step": 40921, "epoch": 974} {"train_loss": -5.613614559173584, "global_step": 40922, "epoch": 974} {"train_loss": -5.743887424468994, "global_step": 40923, "epoch": 974} {"train_loss": -5.520207405090332, "global_step": 40924, "epoch": 974} {"train_loss": -5.604263782501221, "global_step": 40925, "epoch": 974} {"train_loss": -5.559970855712891, "global_step": 40926, "epoch": 974} {"train_loss": -5.586590766906738, "global_step": 40927, "epoch": 974} {"train_loss": -5.447274684906006, "global_step": 40928, "epoch": 974} {"train_loss": -5.704803943634033, "global_step": 40929, "epoch": 974} {"train_loss": -5.659854888916016, "global_step": 40930, "epoch": 974} {"train_loss": -5.545351982116699, "global_step": 40931, "epoch": 974} {"train_loss": -5.62790584564209, "global_step": 40932, "epoch": 974} {"train_loss": -5.598344326019287, "global_step": 40933, "epoch": 974} {"train_loss": -5.648344993591309, "global_step": 40934, "epoch": 974} {"train_loss": -5.629983425140381, "global_step": 40935, "epoch": 974} {"train_loss": -5.61246395111084, "global_step": 40936, "epoch": 974} {"train_loss": -5.612300395965576, "global_step": 40937, "epoch": 974} {"train_loss": -5.75544548034668, "global_step": 40938, "epoch": 974} {"train_loss": -5.64759635925293, "global_step": 40939, "epoch": 974} {"train_loss": -5.576111793518066, "global_step": 40940, "epoch": 974} {"train_loss": -5.657413959503174, "global_step": 40941, "epoch": 974} {"train_loss": -5.78797721862793, "global_step": 40942, "epoch": 974} {"train_loss": -5.586426734924316, "global_step": 40943, "epoch": 974} {"train_loss": -5.594376564025879, "global_step": 40944, "epoch": 974} {"train_loss": -5.507562160491943, "global_step": 40945, "epoch": 974} {"train_loss": -5.663415908813477, "global_step": 40946, "epoch": 974} {"train_loss": -5.686605453491211, "global_step": 40947, "epoch": 974} {"train_loss": -5.532082557678223, "global_step": 40948, "epoch": 974} {"train_loss": -5.620943625768025, "global_step": 40949, "epoch": 974, "val_loss": 65729.7109375} {"train_loss": -5.684286594390869, "global_step": 40950, "epoch": 975} {"train_loss": -5.639906883239746, "global_step": 40951, "epoch": 975} {"train_loss": -5.698503494262695, "global_step": 40952, "epoch": 975} {"train_loss": -5.617098331451416, "global_step": 40953, "epoch": 975} {"train_loss": -5.552948951721191, "global_step": 40954, "epoch": 975} {"train_loss": -5.4974260330200195, "global_step": 40955, "epoch": 975} {"train_loss": -5.648182392120361, "global_step": 40956, "epoch": 975} {"train_loss": -5.542356967926025, "global_step": 40957, "epoch": 975} {"train_loss": -5.646718502044678, "global_step": 40958, "epoch": 975} {"train_loss": -5.6360273361206055, "global_step": 40959, "epoch": 975} {"train_loss": -5.650922775268555, "global_step": 40960, "epoch": 975} {"train_loss": -5.537406921386719, "global_step": 40961, "epoch": 975} {"train_loss": -5.6784772872924805, "global_step": 40962, "epoch": 975} {"train_loss": -5.589698791503906, "global_step": 40963, "epoch": 975} {"train_loss": -5.637715816497803, "global_step": 40964, "epoch": 975} {"train_loss": -5.523562431335449, "global_step": 40965, "epoch": 975} {"train_loss": -5.797438621520996, "global_step": 40966, "epoch": 975} {"train_loss": -5.4850754737854, "global_step": 40967, "epoch": 975} {"train_loss": -5.552438735961914, "global_step": 40968, "epoch": 975} {"train_loss": -5.601357460021973, "global_step": 40969, "epoch": 975} {"train_loss": -5.5665788650512695, "global_step": 40970, "epoch": 975} {"train_loss": -5.719997882843018, "global_step": 40971, "epoch": 975} {"train_loss": -5.471108436584473, "global_step": 40972, "epoch": 975} {"train_loss": -5.498884201049805, "global_step": 40973, "epoch": 975} {"train_loss": -5.6815690994262695, "global_step": 40974, "epoch": 975} {"train_loss": -5.706338882446289, "global_step": 40975, "epoch": 975} {"train_loss": -5.430231094360352, "global_step": 40976, "epoch": 975} {"train_loss": -5.789843559265137, "global_step": 40977, "epoch": 975} {"train_loss": -5.58112907409668, "global_step": 40978, "epoch": 975} {"train_loss": -5.588356971740723, "global_step": 40979, "epoch": 975} {"train_loss": -5.674267768859863, "global_step": 40980, "epoch": 975} {"train_loss": -5.644358158111572, "global_step": 40981, "epoch": 975} {"train_loss": -5.590188026428223, "global_step": 40982, "epoch": 975} {"train_loss": -5.684515476226807, "global_step": 40983, "epoch": 975} {"train_loss": -5.527901649475098, "global_step": 40984, "epoch": 975} {"train_loss": -5.504491806030273, "global_step": 40985, "epoch": 975} {"train_loss": -5.631538391113281, "global_step": 40986, "epoch": 975} {"train_loss": -5.6195878982543945, "global_step": 40987, "epoch": 975} {"train_loss": -5.657533645629883, "global_step": 40988, "epoch": 975} {"train_loss": -5.517269134521484, "global_step": 40989, "epoch": 975} {"train_loss": -5.7165398597717285, "global_step": 40990, "epoch": 975} {"train_loss": -5.610001268840971, "global_step": 40991, "epoch": 975, "val_loss": 66221.6015625} {"train_loss": -5.638668060302734, "global_step": 40992, "epoch": 976} {"train_loss": -5.577755928039551, "global_step": 40993, "epoch": 976} {"train_loss": -5.5678391456604, "global_step": 40994, "epoch": 976} {"train_loss": -5.612481117248535, "global_step": 40995, "epoch": 976} {"train_loss": -5.553702354431152, "global_step": 40996, "epoch": 976} {"train_loss": -5.613628387451172, "global_step": 40997, "epoch": 976} {"train_loss": -5.59104061126709, "global_step": 40998, "epoch": 976} {"train_loss": -5.565936088562012, "global_step": 40999, "epoch": 976} {"train_loss": -5.752463340759277, "global_step": 41000, "epoch": 976} {"train_loss": -5.434664726257324, "global_step": 41001, "epoch": 976} {"train_loss": -5.698451519012451, "global_step": 41002, "epoch": 976} {"train_loss": -5.471735954284668, "global_step": 41003, "epoch": 976} {"train_loss": -5.629729747772217, "global_step": 41004, "epoch": 976} {"train_loss": -5.50679874420166, "global_step": 41005, "epoch": 976} {"train_loss": -5.692819595336914, "global_step": 41006, "epoch": 976} {"train_loss": -5.55534029006958, "global_step": 41007, "epoch": 976} {"train_loss": -5.626297950744629, "global_step": 41008, "epoch": 976} {"train_loss": -5.753239631652832, "global_step": 41009, "epoch": 976} {"train_loss": -5.5704345703125, "global_step": 41010, "epoch": 976} {"train_loss": -5.722498893737793, "global_step": 41011, "epoch": 976} {"train_loss": -5.695723533630371, "global_step": 41012, "epoch": 976} {"train_loss": -5.746177673339844, "global_step": 41013, "epoch": 976} {"train_loss": -5.721287250518799, "global_step": 41014, "epoch": 976} {"train_loss": -5.810847282409668, "global_step": 41015, "epoch": 976} {"train_loss": -5.652909278869629, "global_step": 41016, "epoch": 976} {"train_loss": -5.580632209777832, "global_step": 41017, "epoch": 976} {"train_loss": -5.580897331237793, "global_step": 41018, "epoch": 976} {"train_loss": -5.601204872131348, "global_step": 41019, "epoch": 976} {"train_loss": -5.6656060218811035, "global_step": 41020, "epoch": 976} {"train_loss": -5.531500816345215, "global_step": 41021, "epoch": 976} {"train_loss": -5.572364807128906, "global_step": 41022, "epoch": 976} {"train_loss": -5.654600143432617, "global_step": 41023, "epoch": 976} {"train_loss": -5.385072708129883, "global_step": 41024, "epoch": 976} {"train_loss": -5.4431610107421875, "global_step": 41025, "epoch": 976} {"train_loss": -5.557323932647705, "global_step": 41026, "epoch": 976} {"train_loss": -5.602382659912109, "global_step": 41027, "epoch": 976} {"train_loss": -5.735348701477051, "global_step": 41028, "epoch": 976} {"train_loss": -5.500494003295898, "global_step": 41029, "epoch": 976} {"train_loss": -5.52297306060791, "global_step": 41030, "epoch": 976} {"train_loss": -5.679825782775879, "global_step": 41031, "epoch": 976} {"train_loss": -5.645700931549072, "global_step": 41032, "epoch": 976} {"train_loss": -5.612225941249302, "global_step": 41033, "epoch": 976, "val_loss": 66470.84375} {"train_loss": -5.642921447753906, "global_step": 41034, "epoch": 977} {"train_loss": -5.591272354125977, "global_step": 41035, "epoch": 977} {"train_loss": -5.635428428649902, "global_step": 41036, "epoch": 977} {"train_loss": -5.705049514770508, "global_step": 41037, "epoch": 977} {"train_loss": -5.540711402893066, "global_step": 41038, "epoch": 977} {"train_loss": -5.544050693511963, "global_step": 41039, "epoch": 977} {"train_loss": -5.746575355529785, "global_step": 41040, "epoch": 977} {"train_loss": -5.667125701904297, "global_step": 41041, "epoch": 977} {"train_loss": -5.651534080505371, "global_step": 41042, "epoch": 977} {"train_loss": -5.518970489501953, "global_step": 41043, "epoch": 977} {"train_loss": -5.537446022033691, "global_step": 41044, "epoch": 977} {"train_loss": -5.668057441711426, "global_step": 41045, "epoch": 977} {"train_loss": -5.647731781005859, "global_step": 41046, "epoch": 977} {"train_loss": -5.608868598937988, "global_step": 41047, "epoch": 977} {"train_loss": -5.649558067321777, "global_step": 41048, "epoch": 977} {"train_loss": -5.698716640472412, "global_step": 41049, "epoch": 977} {"train_loss": -5.69674015045166, "global_step": 41050, "epoch": 977} {"train_loss": -5.6398820877075195, "global_step": 41051, "epoch": 977} {"train_loss": -5.718921184539795, "global_step": 41052, "epoch": 977} {"train_loss": -5.634631633758545, "global_step": 41053, "epoch": 977} {"train_loss": -5.7319488525390625, "global_step": 41054, "epoch": 977} {"train_loss": -5.721661567687988, "global_step": 41055, "epoch": 977} {"train_loss": -5.633000373840332, "global_step": 41056, "epoch": 977} {"train_loss": -5.644718170166016, "global_step": 41057, "epoch": 977} {"train_loss": -5.803484916687012, "global_step": 41058, "epoch": 977} {"train_loss": -5.5021796226501465, "global_step": 41059, "epoch": 977} {"train_loss": -5.7448225021362305, "global_step": 41060, "epoch": 977} {"train_loss": -5.633799076080322, "global_step": 41061, "epoch": 977} {"train_loss": -5.6179094314575195, "global_step": 41062, "epoch": 977} {"train_loss": -5.511725425720215, "global_step": 41063, "epoch": 977} {"train_loss": -5.760823726654053, "global_step": 41064, "epoch": 977} {"train_loss": -5.511098861694336, "global_step": 41065, "epoch": 977} {"train_loss": -5.421854019165039, "global_step": 41066, "epoch": 977} {"train_loss": -5.640094757080078, "global_step": 41067, "epoch": 977} {"train_loss": -5.64815616607666, "global_step": 41068, "epoch": 977} {"train_loss": -5.448368549346924, "global_step": 41069, "epoch": 977} {"train_loss": -5.590694427490234, "global_step": 41070, "epoch": 977} {"train_loss": -5.520787715911865, "global_step": 41071, "epoch": 977} {"train_loss": -5.649933815002441, "global_step": 41072, "epoch": 977} {"train_loss": -5.6293110847473145, "global_step": 41073, "epoch": 977} {"train_loss": -5.718884468078613, "global_step": 41074, "epoch": 977} {"train_loss": -5.629376831508818, "global_step": 41075, "epoch": 977, "val_loss": 66284.359375} {"train_loss": -5.632102966308594, "global_step": 41076, "epoch": 978} {"train_loss": -5.570899486541748, "global_step": 41077, "epoch": 978} {"train_loss": -5.537903308868408, "global_step": 41078, "epoch": 978} {"train_loss": -5.664228439331055, "global_step": 41079, "epoch": 978} {"train_loss": -5.496460914611816, "global_step": 41080, "epoch": 978} {"train_loss": -5.661317825317383, "global_step": 41081, "epoch": 978} {"train_loss": -5.549049377441406, "global_step": 41082, "epoch": 978} {"train_loss": -5.570343971252441, "global_step": 41083, "epoch": 978} {"train_loss": -5.657006740570068, "global_step": 41084, "epoch": 978} {"train_loss": -5.652683258056641, "global_step": 41085, "epoch": 978} {"train_loss": -5.632228851318359, "global_step": 41086, "epoch": 978} {"train_loss": -5.609824180603027, "global_step": 41087, "epoch": 978} {"train_loss": -5.556265354156494, "global_step": 41088, "epoch": 978} {"train_loss": -5.678159236907959, "global_step": 41089, "epoch": 978} {"train_loss": -5.700991630554199, "global_step": 41090, "epoch": 978} {"train_loss": -5.717318534851074, "global_step": 41091, "epoch": 978} {"train_loss": -5.653159141540527, "global_step": 41092, "epoch": 978} {"train_loss": -5.647169589996338, "global_step": 41093, "epoch": 978} {"train_loss": -5.639070987701416, "global_step": 41094, "epoch": 978} {"train_loss": -5.7052531242370605, "global_step": 41095, "epoch": 978} {"train_loss": -5.646031856536865, "global_step": 41096, "epoch": 978} {"train_loss": -5.683578014373779, "global_step": 41097, "epoch": 978} {"train_loss": -5.686758041381836, "global_step": 41098, "epoch": 978} {"train_loss": -5.596851348876953, "global_step": 41099, "epoch": 978} {"train_loss": -5.665966987609863, "global_step": 41100, "epoch": 978} {"train_loss": -5.672496318817139, "global_step": 41101, "epoch": 978} {"train_loss": -5.801578521728516, "global_step": 41102, "epoch": 978} {"train_loss": -5.532528877258301, "global_step": 41103, "epoch": 978} {"train_loss": -5.722710609436035, "global_step": 41104, "epoch": 978} {"train_loss": -5.749934196472168, "global_step": 41105, "epoch": 978} {"train_loss": -5.619963645935059, "global_step": 41106, "epoch": 978} {"train_loss": -5.659158706665039, "global_step": 41107, "epoch": 978} {"train_loss": -5.761378765106201, "global_step": 41108, "epoch": 978} {"train_loss": -5.564556121826172, "global_step": 41109, "epoch": 978} {"train_loss": -5.6063971519470215, "global_step": 41110, "epoch": 978} {"train_loss": -5.664650917053223, "global_step": 41111, "epoch": 978} {"train_loss": -5.693315505981445, "global_step": 41112, "epoch": 978} {"train_loss": -5.579733848571777, "global_step": 41113, "epoch": 978} {"train_loss": -5.670131683349609, "global_step": 41114, "epoch": 978} {"train_loss": -5.701788425445557, "global_step": 41115, "epoch": 978} {"train_loss": -5.658107280731201, "global_step": 41116, "epoch": 978} {"train_loss": -5.644759439286732, "global_step": 41117, "epoch": 978, "val_loss": 66063.9140625} {"train_loss": -5.69651985168457, "global_step": 41118, "epoch": 979} {"train_loss": -5.7196455001831055, "global_step": 41119, "epoch": 979} {"train_loss": -5.664470672607422, "global_step": 41120, "epoch": 979} {"train_loss": -5.632061958312988, "global_step": 41121, "epoch": 979} {"train_loss": -5.69423246383667, "global_step": 41122, "epoch": 979} {"train_loss": -5.736937999725342, "global_step": 41123, "epoch": 979} {"train_loss": -5.578316688537598, "global_step": 41124, "epoch": 979} {"train_loss": -5.55239200592041, "global_step": 41125, "epoch": 979} {"train_loss": -5.618451118469238, "global_step": 41126, "epoch": 979} {"train_loss": -5.702231407165527, "global_step": 41127, "epoch": 979} {"train_loss": -5.47861909866333, "global_step": 41128, "epoch": 979} {"train_loss": -5.687376976013184, "global_step": 41129, "epoch": 979} {"train_loss": -5.725302219390869, "global_step": 41130, "epoch": 979} {"train_loss": -5.705606460571289, "global_step": 41131, "epoch": 979} {"train_loss": -5.578508377075195, "global_step": 41132, "epoch": 979} {"train_loss": -5.616220474243164, "global_step": 41133, "epoch": 979} {"train_loss": -5.557668209075928, "global_step": 41134, "epoch": 979} {"train_loss": -5.537546157836914, "global_step": 41135, "epoch": 979} {"train_loss": -5.685769081115723, "global_step": 41136, "epoch": 979} {"train_loss": -5.700984477996826, "global_step": 41137, "epoch": 979} {"train_loss": -5.654832363128662, "global_step": 41138, "epoch": 979} {"train_loss": -5.671454429626465, "global_step": 41139, "epoch": 979} {"train_loss": -5.545098781585693, "global_step": 41140, "epoch": 979} {"train_loss": -5.643126010894775, "global_step": 41141, "epoch": 979} {"train_loss": -5.514652729034424, "global_step": 41142, "epoch": 979} {"train_loss": -5.695126533508301, "global_step": 41143, "epoch": 979} {"train_loss": -5.618589878082275, "global_step": 41144, "epoch": 979} {"train_loss": -5.733904838562012, "global_step": 41145, "epoch": 979} {"train_loss": -5.502102851867676, "global_step": 41146, "epoch": 979} {"train_loss": -5.607377529144287, "global_step": 41147, "epoch": 979} {"train_loss": -5.693515777587891, "global_step": 41148, "epoch": 979} {"train_loss": -5.663690567016602, "global_step": 41149, "epoch": 979} {"train_loss": -5.509133338928223, "global_step": 41150, "epoch": 979} {"train_loss": -5.676050186157227, "global_step": 41151, "epoch": 979} {"train_loss": -5.635268211364746, "global_step": 41152, "epoch": 979} {"train_loss": -5.627470970153809, "global_step": 41153, "epoch": 979} {"train_loss": -5.727618217468262, "global_step": 41154, "epoch": 979} {"train_loss": -5.599193572998047, "global_step": 41155, "epoch": 979} {"train_loss": -5.6595869064331055, "global_step": 41156, "epoch": 979} {"train_loss": -5.6694207191467285, "global_step": 41157, "epoch": 979} {"train_loss": -5.635180473327637, "global_step": 41158, "epoch": 979} {"train_loss": -5.634398937225342, "global_step": 41159, "epoch": 979, "val_loss": 65947.28125} {"train_loss": -5.69135856628418, "global_step": 41160, "epoch": 980} {"train_loss": -5.65234899520874, "global_step": 41161, "epoch": 980} {"train_loss": -5.624905109405518, "global_step": 41162, "epoch": 980} {"train_loss": -5.639458179473877, "global_step": 41163, "epoch": 980} {"train_loss": -5.711342811584473, "global_step": 41164, "epoch": 980} {"train_loss": -5.514279365539551, "global_step": 41165, "epoch": 980} {"train_loss": -5.72652530670166, "global_step": 41166, "epoch": 980} {"train_loss": -5.652058124542236, "global_step": 41167, "epoch": 980} {"train_loss": -5.803321838378906, "global_step": 41168, "epoch": 980} {"train_loss": -5.682516574859619, "global_step": 41169, "epoch": 980} {"train_loss": -5.596279144287109, "global_step": 41170, "epoch": 980} {"train_loss": -5.6538286209106445, "global_step": 41171, "epoch": 980} {"train_loss": -5.673392295837402, "global_step": 41172, "epoch": 980} {"train_loss": -5.655641555786133, "global_step": 41173, "epoch": 980} {"train_loss": -5.725673198699951, "global_step": 41174, "epoch": 980} {"train_loss": -5.645735263824463, "global_step": 41175, "epoch": 980} {"train_loss": -5.560821056365967, "global_step": 41176, "epoch": 980} {"train_loss": -5.584921360015869, "global_step": 41177, "epoch": 980} {"train_loss": -5.664261341094971, "global_step": 41178, "epoch": 980} {"train_loss": -5.706556797027588, "global_step": 41179, "epoch": 980} {"train_loss": -5.633358955383301, "global_step": 41180, "epoch": 980} {"train_loss": -5.7360687255859375, "global_step": 41181, "epoch": 980} {"train_loss": -5.5885844230651855, "global_step": 41182, "epoch": 980} {"train_loss": -5.6396894454956055, "global_step": 41183, "epoch": 980} {"train_loss": -5.711392402648926, "global_step": 41184, "epoch": 980} {"train_loss": -5.670287132263184, "global_step": 41185, "epoch": 980} {"train_loss": -5.550745010375977, "global_step": 41186, "epoch": 980} {"train_loss": -5.738800048828125, "global_step": 41187, "epoch": 980} {"train_loss": -5.6311492919921875, "global_step": 41188, "epoch": 980} {"train_loss": -5.682126522064209, "global_step": 41189, "epoch": 980} {"train_loss": -5.631019115447998, "global_step": 41190, "epoch": 980} {"train_loss": -5.638710021972656, "global_step": 41191, "epoch": 980} {"train_loss": -5.642411231994629, "global_step": 41192, "epoch": 980} {"train_loss": -5.517738342285156, "global_step": 41193, "epoch": 980} {"train_loss": -5.681589126586914, "global_step": 41194, "epoch": 980} {"train_loss": -5.603270053863525, "global_step": 41195, "epoch": 980} {"train_loss": -5.628078460693359, "global_step": 41196, "epoch": 980} {"train_loss": -5.458582878112793, "global_step": 41197, "epoch": 980} {"train_loss": -5.682605743408203, "global_step": 41198, "epoch": 980} {"train_loss": -5.600323677062988, "global_step": 41199, "epoch": 980} {"train_loss": -5.498039245605469, "global_step": 41200, "epoch": 980} {"train_loss": -5.64179127556937, "global_step": 41201, "epoch": 980, "val_loss": 66879.671875} {"train_loss": -5.431816101074219, "global_step": 41202, "epoch": 981} {"train_loss": -5.634686470031738, "global_step": 41203, "epoch": 981} {"train_loss": -5.669553756713867, "global_step": 41204, "epoch": 981} {"train_loss": -5.5823822021484375, "global_step": 41205, "epoch": 981} {"train_loss": -5.676602363586426, "global_step": 41206, "epoch": 981} {"train_loss": -5.646998405456543, "global_step": 41207, "epoch": 981} {"train_loss": -5.577686786651611, "global_step": 41208, "epoch": 981} {"train_loss": -5.658060073852539, "global_step": 41209, "epoch": 981} {"train_loss": -5.616560935974121, "global_step": 41210, "epoch": 981} {"train_loss": -5.600762367248535, "global_step": 41211, "epoch": 981} {"train_loss": -5.694077968597412, "global_step": 41212, "epoch": 981} {"train_loss": -5.580078125, "global_step": 41213, "epoch": 981} {"train_loss": -5.505764007568359, "global_step": 41214, "epoch": 981} {"train_loss": -5.704091548919678, "global_step": 41215, "epoch": 981} {"train_loss": -5.621911525726318, "global_step": 41216, "epoch": 981} {"train_loss": -5.560116767883301, "global_step": 41217, "epoch": 981} {"train_loss": -5.909252166748047, "global_step": 41218, "epoch": 981} {"train_loss": -5.571315765380859, "global_step": 41219, "epoch": 981} {"train_loss": -5.709238052368164, "global_step": 41220, "epoch": 981} {"train_loss": -5.641633033752441, "global_step": 41221, "epoch": 981} {"train_loss": -5.615350246429443, "global_step": 41222, "epoch": 981} {"train_loss": -5.789588451385498, "global_step": 41223, "epoch": 981} {"train_loss": -5.511562347412109, "global_step": 41224, "epoch": 981} {"train_loss": -5.566867828369141, "global_step": 41225, "epoch": 981} {"train_loss": -5.663616180419922, "global_step": 41226, "epoch": 981} {"train_loss": -5.606112957000732, "global_step": 41227, "epoch": 981} {"train_loss": -5.486268997192383, "global_step": 41228, "epoch": 981} {"train_loss": -5.683274269104004, "global_step": 41229, "epoch": 981} {"train_loss": -5.660799980163574, "global_step": 41230, "epoch": 981} {"train_loss": -5.703608989715576, "global_step": 41231, "epoch": 981} {"train_loss": -5.611999988555908, "global_step": 41232, "epoch": 981} {"train_loss": -5.728610038757324, "global_step": 41233, "epoch": 981} {"train_loss": -5.600370407104492, "global_step": 41234, "epoch": 981} {"train_loss": -5.68531608581543, "global_step": 41235, "epoch": 981} {"train_loss": -5.707787990570068, "global_step": 41236, "epoch": 981} {"train_loss": -5.712458610534668, "global_step": 41237, "epoch": 981} {"train_loss": -5.619584083557129, "global_step": 41238, "epoch": 981} {"train_loss": -5.6374030113220215, "global_step": 41239, "epoch": 981} {"train_loss": -5.711757659912109, "global_step": 41240, "epoch": 981} {"train_loss": -5.646291255950928, "global_step": 41241, "epoch": 981} {"train_loss": -5.620553970336914, "global_step": 41242, "epoch": 981} {"train_loss": -5.637426853179932, "global_step": 41243, "epoch": 981, "val_loss": 65942.6015625} {"train_loss": -5.759333610534668, "global_step": 41244, "epoch": 982} {"train_loss": -5.681942462921143, "global_step": 41245, "epoch": 982} {"train_loss": -5.681149482727051, "global_step": 41246, "epoch": 982} {"train_loss": -5.664481163024902, "global_step": 41247, "epoch": 982} {"train_loss": -5.702050685882568, "global_step": 41248, "epoch": 982} {"train_loss": -5.818683624267578, "global_step": 41249, "epoch": 982} {"train_loss": -5.477535247802734, "global_step": 41250, "epoch": 982} {"train_loss": -5.655854225158691, "global_step": 41251, "epoch": 982} {"train_loss": -5.5644659996032715, "global_step": 41252, "epoch": 982} {"train_loss": -5.585488319396973, "global_step": 41253, "epoch": 982} {"train_loss": -5.667987823486328, "global_step": 41254, "epoch": 982} {"train_loss": -5.6407470703125, "global_step": 41255, "epoch": 982} {"train_loss": -5.487674236297607, "global_step": 41256, "epoch": 982} {"train_loss": -5.544591903686523, "global_step": 41257, "epoch": 982} {"train_loss": -5.526287078857422, "global_step": 41258, "epoch": 982} {"train_loss": -5.659666538238525, "global_step": 41259, "epoch": 982} {"train_loss": -5.567931175231934, "global_step": 41260, "epoch": 982} {"train_loss": -5.531529903411865, "global_step": 41261, "epoch": 982} {"train_loss": -5.553247451782227, "global_step": 41262, "epoch": 982} {"train_loss": -5.65065860748291, "global_step": 41263, "epoch": 982} {"train_loss": -5.671897888183594, "global_step": 41264, "epoch": 982} {"train_loss": -5.492715835571289, "global_step": 41265, "epoch": 982} {"train_loss": -5.719172477722168, "global_step": 41266, "epoch": 982} {"train_loss": -5.614545822143555, "global_step": 41267, "epoch": 982} {"train_loss": -5.640366554260254, "global_step": 41268, "epoch": 982} {"train_loss": -5.624789237976074, "global_step": 41269, "epoch": 982} {"train_loss": -5.587385177612305, "global_step": 41270, "epoch": 982} {"train_loss": -5.531357288360596, "global_step": 41271, "epoch": 982} {"train_loss": -5.656393051147461, "global_step": 41272, "epoch": 982} {"train_loss": -5.608408451080322, "global_step": 41273, "epoch": 982} {"train_loss": -5.570201873779297, "global_step": 41274, "epoch": 982} {"train_loss": -5.6106767654418945, "global_step": 41275, "epoch": 982} {"train_loss": -5.554048538208008, "global_step": 41276, "epoch": 982} {"train_loss": -5.506827354431152, "global_step": 41277, "epoch": 982} {"train_loss": -5.710570335388184, "global_step": 41278, "epoch": 982} {"train_loss": -5.554044723510742, "global_step": 41279, "epoch": 982} {"train_loss": -5.639510631561279, "global_step": 41280, "epoch": 982} {"train_loss": -5.738809585571289, "global_step": 41281, "epoch": 982} {"train_loss": -5.71975564956665, "global_step": 41282, "epoch": 982} {"train_loss": -5.713882923126221, "global_step": 41283, "epoch": 982} {"train_loss": -5.764054775238037, "global_step": 41284, "epoch": 982} {"train_loss": -5.621049381437755, "global_step": 41285, "epoch": 982, "val_loss": 65979.9375} {"train_loss": -5.770332336425781, "global_step": 41286, "epoch": 983} {"train_loss": -5.698134899139404, "global_step": 41287, "epoch": 983} {"train_loss": -5.6930036544799805, "global_step": 41288, "epoch": 983} {"train_loss": -5.631711959838867, "global_step": 41289, "epoch": 983} {"train_loss": -5.577583312988281, "global_step": 41290, "epoch": 983} {"train_loss": -5.677217960357666, "global_step": 41291, "epoch": 983} {"train_loss": -5.6955766677856445, "global_step": 41292, "epoch": 983} {"train_loss": -5.73663330078125, "global_step": 41293, "epoch": 983} {"train_loss": -5.681591033935547, "global_step": 41294, "epoch": 983} {"train_loss": -5.747702598571777, "global_step": 41295, "epoch": 983} {"train_loss": -5.65031099319458, "global_step": 41296, "epoch": 983} {"train_loss": -5.675955772399902, "global_step": 41297, "epoch": 983} {"train_loss": -5.662707805633545, "global_step": 41298, "epoch": 983} {"train_loss": -5.6721086502075195, "global_step": 41299, "epoch": 983} {"train_loss": -5.63686990737915, "global_step": 41300, "epoch": 983} {"train_loss": -5.708552360534668, "global_step": 41301, "epoch": 983} {"train_loss": -5.647030830383301, "global_step": 41302, "epoch": 983} {"train_loss": -5.624391555786133, "global_step": 41303, "epoch": 983} {"train_loss": -5.625435829162598, "global_step": 41304, "epoch": 983} {"train_loss": -5.658079624176025, "global_step": 41305, "epoch": 983} {"train_loss": -5.752961158752441, "global_step": 41306, "epoch": 983} {"train_loss": -5.590095520019531, "global_step": 41307, "epoch": 983} {"train_loss": -5.588768005371094, "global_step": 41308, "epoch": 983} {"train_loss": -5.705835342407227, "global_step": 41309, "epoch": 983} {"train_loss": -5.565843105316162, "global_step": 41310, "epoch": 983} {"train_loss": -5.663578033447266, "global_step": 41311, "epoch": 983} {"train_loss": -5.611943244934082, "global_step": 41312, "epoch": 983} {"train_loss": -5.641374588012695, "global_step": 41313, "epoch": 983} {"train_loss": -5.538404941558838, "global_step": 41314, "epoch": 983} {"train_loss": -5.717079162597656, "global_step": 41315, "epoch": 983} {"train_loss": -5.565170764923096, "global_step": 41316, "epoch": 983} {"train_loss": -5.540814399719238, "global_step": 41317, "epoch": 983} {"train_loss": -5.779004096984863, "global_step": 41318, "epoch": 983} {"train_loss": -5.581830978393555, "global_step": 41319, "epoch": 983} {"train_loss": -5.628045082092285, "global_step": 41320, "epoch": 983} {"train_loss": -5.601655960083008, "global_step": 41321, "epoch": 983} {"train_loss": -5.620809555053711, "global_step": 41322, "epoch": 983} {"train_loss": -5.650356292724609, "global_step": 41323, "epoch": 983} {"train_loss": -5.603446006774902, "global_step": 41324, "epoch": 983} {"train_loss": -5.54149055480957, "global_step": 41325, "epoch": 983} {"train_loss": -5.6609296798706055, "global_step": 41326, "epoch": 983} {"train_loss": -5.649867205392747, "global_step": 41327, "epoch": 983, "val_loss": 66175.671875} {"train_loss": -5.658768653869629, "global_step": 41328, "epoch": 984} {"train_loss": -5.5582733154296875, "global_step": 41329, "epoch": 984} {"train_loss": -5.6409735679626465, "global_step": 41330, "epoch": 984} {"train_loss": -5.718742370605469, "global_step": 41331, "epoch": 984} {"train_loss": -5.556412696838379, "global_step": 41332, "epoch": 984} {"train_loss": -5.630739212036133, "global_step": 41333, "epoch": 984} {"train_loss": -5.680390357971191, "global_step": 41334, "epoch": 984} {"train_loss": -5.6456618309021, "global_step": 41335, "epoch": 984} {"train_loss": -5.506958961486816, "global_step": 41336, "epoch": 984} {"train_loss": -5.628139495849609, "global_step": 41337, "epoch": 984} {"train_loss": -5.669178009033203, "global_step": 41338, "epoch": 984} {"train_loss": -5.661865234375, "global_step": 41339, "epoch": 984} {"train_loss": -5.7356462478637695, "global_step": 41340, "epoch": 984} {"train_loss": -5.689275741577148, "global_step": 41341, "epoch": 984} {"train_loss": -5.529749870300293, "global_step": 41342, "epoch": 984} {"train_loss": -5.659271240234375, "global_step": 41343, "epoch": 984} {"train_loss": -5.720586776733398, "global_step": 41344, "epoch": 984} {"train_loss": -5.660399913787842, "global_step": 41345, "epoch": 984} {"train_loss": -5.694140434265137, "global_step": 41346, "epoch": 984} {"train_loss": -5.7689948081970215, "global_step": 41347, "epoch": 984} {"train_loss": -5.6535844802856445, "global_step": 41348, "epoch": 984} {"train_loss": -5.546852111816406, "global_step": 41349, "epoch": 984} {"train_loss": -5.655942916870117, "global_step": 41350, "epoch": 984} {"train_loss": -5.601494312286377, "global_step": 41351, "epoch": 984} {"train_loss": -5.56932258605957, "global_step": 41352, "epoch": 984} {"train_loss": -5.587963581085205, "global_step": 41353, "epoch": 984} {"train_loss": -5.535191535949707, "global_step": 41354, "epoch": 984} {"train_loss": -5.73068904876709, "global_step": 41355, "epoch": 984} {"train_loss": -5.588167190551758, "global_step": 41356, "epoch": 984} {"train_loss": -5.602781295776367, "global_step": 41357, "epoch": 984} {"train_loss": -5.643047332763672, "global_step": 41358, "epoch": 984} {"train_loss": -5.706142902374268, "global_step": 41359, "epoch": 984} {"train_loss": -5.636239051818848, "global_step": 41360, "epoch": 984} {"train_loss": -5.518523216247559, "global_step": 41361, "epoch": 984} {"train_loss": -5.599612236022949, "global_step": 41362, "epoch": 984} {"train_loss": -5.667092323303223, "global_step": 41363, "epoch": 984} {"train_loss": -5.778199195861816, "global_step": 41364, "epoch": 984} {"train_loss": -5.607100486755371, "global_step": 41365, "epoch": 984} {"train_loss": -5.711431503295898, "global_step": 41366, "epoch": 984} {"train_loss": -5.54355001449585, "global_step": 41367, "epoch": 984} {"train_loss": -5.826781272888184, "global_step": 41368, "epoch": 984} {"train_loss": -5.637449287232899, "global_step": 41369, "epoch": 984, "val_loss": 65962.15625} {"train_loss": -5.626369476318359, "global_step": 41370, "epoch": 985} {"train_loss": -5.585323810577393, "global_step": 41371, "epoch": 985} {"train_loss": -5.777074813842773, "global_step": 41372, "epoch": 985} {"train_loss": -5.599180698394775, "global_step": 41373, "epoch": 985} {"train_loss": -5.732000350952148, "global_step": 41374, "epoch": 985} {"train_loss": -5.624876022338867, "global_step": 41375, "epoch": 985} {"train_loss": -5.603176116943359, "global_step": 41376, "epoch": 985} {"train_loss": -5.675201892852783, "global_step": 41377, "epoch": 985} {"train_loss": -5.585756778717041, "global_step": 41378, "epoch": 985} {"train_loss": -5.5501508712768555, "global_step": 41379, "epoch": 985} {"train_loss": -5.6870598793029785, "global_step": 41380, "epoch": 985} {"train_loss": -5.665616989135742, "global_step": 41381, "epoch": 985} {"train_loss": -5.546074867248535, "global_step": 41382, "epoch": 985} {"train_loss": -5.628207206726074, "global_step": 41383, "epoch": 985} {"train_loss": -5.589507102966309, "global_step": 41384, "epoch": 985} {"train_loss": -5.643154144287109, "global_step": 41385, "epoch": 985} {"train_loss": -5.634549140930176, "global_step": 41386, "epoch": 985} {"train_loss": -5.581094741821289, "global_step": 41387, "epoch": 985} {"train_loss": -5.679982662200928, "global_step": 41388, "epoch": 985} {"train_loss": -5.623946666717529, "global_step": 41389, "epoch": 985} {"train_loss": -5.515729904174805, "global_step": 41390, "epoch": 985} {"train_loss": -5.569396018981934, "global_step": 41391, "epoch": 985} {"train_loss": -5.688638210296631, "global_step": 41392, "epoch": 985} {"train_loss": -5.614681243896484, "global_step": 41393, "epoch": 985} {"train_loss": -5.738719463348389, "global_step": 41394, "epoch": 985} {"train_loss": -5.620450019836426, "global_step": 41395, "epoch": 985} {"train_loss": -5.550121784210205, "global_step": 41396, "epoch": 985} {"train_loss": -5.629059791564941, "global_step": 41397, "epoch": 985} {"train_loss": -5.595961570739746, "global_step": 41398, "epoch": 985} {"train_loss": -5.539146900177002, "global_step": 41399, "epoch": 985} {"train_loss": -5.34413480758667, "global_step": 41400, "epoch": 985} {"train_loss": -5.581271648406982, "global_step": 41401, "epoch": 985} {"train_loss": -5.4899702072143555, "global_step": 41402, "epoch": 985} {"train_loss": -5.5869574546813965, "global_step": 41403, "epoch": 985} {"train_loss": -5.614030838012695, "global_step": 41404, "epoch": 985} {"train_loss": -5.712960720062256, "global_step": 41405, "epoch": 985} {"train_loss": -5.715779781341553, "global_step": 41406, "epoch": 985} {"train_loss": -5.6305084228515625, "global_step": 41407, "epoch": 985} {"train_loss": -5.595976829528809, "global_step": 41408, "epoch": 985} {"train_loss": -5.546505928039551, "global_step": 41409, "epoch": 985} {"train_loss": -5.555307865142822, "global_step": 41410, "epoch": 985} {"train_loss": -5.608194192250569, "global_step": 41411, "epoch": 985, "val_loss": 66293.2890625} {"train_loss": -5.68409538269043, "global_step": 41412, "epoch": 986} {"train_loss": -5.603419303894043, "global_step": 41413, "epoch": 986} {"train_loss": -5.5306715965271, "global_step": 41414, "epoch": 986} {"train_loss": -5.7084197998046875, "global_step": 41415, "epoch": 986} {"train_loss": -5.456125736236572, "global_step": 41416, "epoch": 986} {"train_loss": -5.646306991577148, "global_step": 41417, "epoch": 986} {"train_loss": -5.452213287353516, "global_step": 41418, "epoch": 986} {"train_loss": -5.6615891456604, "global_step": 41419, "epoch": 986} {"train_loss": -5.645020484924316, "global_step": 41420, "epoch": 986} {"train_loss": -5.610024929046631, "global_step": 41421, "epoch": 986} {"train_loss": -5.714193344116211, "global_step": 41422, "epoch": 986} {"train_loss": -5.604689121246338, "global_step": 41423, "epoch": 986} {"train_loss": -5.758767127990723, "global_step": 41424, "epoch": 986} {"train_loss": -5.473716735839844, "global_step": 41425, "epoch": 986} {"train_loss": -5.506366729736328, "global_step": 41426, "epoch": 986} {"train_loss": -5.497555732727051, "global_step": 41427, "epoch": 986} {"train_loss": -5.359254837036133, "global_step": 41428, "epoch": 986} {"train_loss": -5.680042266845703, "global_step": 41429, "epoch": 986} {"train_loss": -5.568033695220947, "global_step": 41430, "epoch": 986} {"train_loss": -5.605149745941162, "global_step": 41431, "epoch": 986} {"train_loss": -5.387749671936035, "global_step": 41432, "epoch": 986} {"train_loss": -5.6500701904296875, "global_step": 41433, "epoch": 986} {"train_loss": -5.526040554046631, "global_step": 41434, "epoch": 986} {"train_loss": -5.72114896774292, "global_step": 41435, "epoch": 986} {"train_loss": -5.459857940673828, "global_step": 41436, "epoch": 986} {"train_loss": -5.667645454406738, "global_step": 41437, "epoch": 986} {"train_loss": -5.537663459777832, "global_step": 41438, "epoch": 986} {"train_loss": -5.632671356201172, "global_step": 41439, "epoch": 986} {"train_loss": -5.694333076477051, "global_step": 41440, "epoch": 986} {"train_loss": -5.608786582946777, "global_step": 41441, "epoch": 986} {"train_loss": -5.670760154724121, "global_step": 41442, "epoch": 986} {"train_loss": -5.609938144683838, "global_step": 41443, "epoch": 986} {"train_loss": -5.6853790283203125, "global_step": 41444, "epoch": 986} {"train_loss": -5.551285743713379, "global_step": 41445, "epoch": 986} {"train_loss": -5.5929975509643555, "global_step": 41446, "epoch": 986} {"train_loss": -5.666000843048096, "global_step": 41447, "epoch": 986} {"train_loss": -5.561947822570801, "global_step": 41448, "epoch": 986} {"train_loss": -5.647424697875977, "global_step": 41449, "epoch": 986} {"train_loss": -5.5607476234436035, "global_step": 41450, "epoch": 986} {"train_loss": -5.8022141456604, "global_step": 41451, "epoch": 986} {"train_loss": -5.684995651245117, "global_step": 41452, "epoch": 986} {"train_loss": -5.603314399719238, "global_step": 41453, "epoch": 986, "val_loss": 66510.0} {"train_loss": -5.544975757598877, "global_step": 41454, "epoch": 987} {"train_loss": -5.647500991821289, "global_step": 41455, "epoch": 987} {"train_loss": -5.74124813079834, "global_step": 41456, "epoch": 987} {"train_loss": -5.678620338439941, "global_step": 41457, "epoch": 987} {"train_loss": -5.661129951477051, "global_step": 41458, "epoch": 987} {"train_loss": -5.757521629333496, "global_step": 41459, "epoch": 987} {"train_loss": -5.58338737487793, "global_step": 41460, "epoch": 987} {"train_loss": -5.603932857513428, "global_step": 41461, "epoch": 987} {"train_loss": -5.8047943115234375, "global_step": 41462, "epoch": 987} {"train_loss": -5.587294578552246, "global_step": 41463, "epoch": 987} {"train_loss": -5.7648210525512695, "global_step": 41464, "epoch": 987} {"train_loss": -5.654253005981445, "global_step": 41465, "epoch": 987} {"train_loss": -5.637471675872803, "global_step": 41466, "epoch": 987} {"train_loss": -5.735175132751465, "global_step": 41467, "epoch": 987} {"train_loss": -5.5322346687316895, "global_step": 41468, "epoch": 987} {"train_loss": -5.68101167678833, "global_step": 41469, "epoch": 987} {"train_loss": -5.67282772064209, "global_step": 41470, "epoch": 987} {"train_loss": -5.708636283874512, "global_step": 41471, "epoch": 987} {"train_loss": -5.716057777404785, "global_step": 41472, "epoch": 987} {"train_loss": -5.730840682983398, "global_step": 41473, "epoch": 987} {"train_loss": -5.6736297607421875, "global_step": 41474, "epoch": 987} {"train_loss": -5.692224025726318, "global_step": 41475, "epoch": 987} {"train_loss": -5.760437488555908, "global_step": 41476, "epoch": 987} {"train_loss": -5.680103302001953, "global_step": 41477, "epoch": 987} {"train_loss": -5.730062484741211, "global_step": 41478, "epoch": 987} {"train_loss": -5.664686679840088, "global_step": 41479, "epoch": 987} {"train_loss": -5.514227867126465, "global_step": 41480, "epoch": 987} {"train_loss": -5.660569667816162, "global_step": 41481, "epoch": 987} {"train_loss": -5.756009101867676, "global_step": 41482, "epoch": 987} {"train_loss": -5.684660911560059, "global_step": 41483, "epoch": 987} {"train_loss": -5.558711528778076, "global_step": 41484, "epoch": 987} {"train_loss": -5.648497581481934, "global_step": 41485, "epoch": 987} {"train_loss": -5.607129096984863, "global_step": 41486, "epoch": 987} {"train_loss": -5.710630416870117, "global_step": 41487, "epoch": 987} {"train_loss": -5.674612522125244, "global_step": 41488, "epoch": 987} {"train_loss": -5.733477592468262, "global_step": 41489, "epoch": 987} {"train_loss": -5.642358303070068, "global_step": 41490, "epoch": 987} {"train_loss": -5.626178741455078, "global_step": 41491, "epoch": 987} {"train_loss": -5.647920608520508, "global_step": 41492, "epoch": 987} {"train_loss": -5.675872802734375, "global_step": 41493, "epoch": 987} {"train_loss": -5.678472518920898, "global_step": 41494, "epoch": 987} {"train_loss": -5.667226257778349, "global_step": 41495, "epoch": 987, "val_loss": 66051.03125} {"train_loss": -5.594634532928467, "global_step": 41496, "epoch": 988} {"train_loss": -5.688287734985352, "global_step": 41497, "epoch": 988} {"train_loss": -5.578120231628418, "global_step": 41498, "epoch": 988} {"train_loss": -5.708866119384766, "global_step": 41499, "epoch": 988} {"train_loss": -5.561234474182129, "global_step": 41500, "epoch": 988} {"train_loss": -5.693680286407471, "global_step": 41501, "epoch": 988} {"train_loss": -5.608885765075684, "global_step": 41502, "epoch": 988} {"train_loss": -5.6184210777282715, "global_step": 41503, "epoch": 988} {"train_loss": -5.527220726013184, "global_step": 41504, "epoch": 988} {"train_loss": -5.7179765701293945, "global_step": 41505, "epoch": 988} {"train_loss": -5.520090103149414, "global_step": 41506, "epoch": 988} {"train_loss": -5.692742347717285, "global_step": 41507, "epoch": 988} {"train_loss": -5.651223182678223, "global_step": 41508, "epoch": 988} {"train_loss": -5.5044426918029785, "global_step": 41509, "epoch": 988} {"train_loss": -5.578188896179199, "global_step": 41510, "epoch": 988} {"train_loss": -5.604855060577393, "global_step": 41511, "epoch": 988} {"train_loss": -5.551422119140625, "global_step": 41512, "epoch": 988} {"train_loss": -5.664223670959473, "global_step": 41513, "epoch": 988} {"train_loss": -5.642776012420654, "global_step": 41514, "epoch": 988} {"train_loss": -5.629021644592285, "global_step": 41515, "epoch": 988} {"train_loss": -5.767949104309082, "global_step": 41516, "epoch": 988} {"train_loss": -5.709477424621582, "global_step": 41517, "epoch": 988} {"train_loss": -5.6373610496521, "global_step": 41518, "epoch": 988} {"train_loss": -5.684001922607422, "global_step": 41519, "epoch": 988} {"train_loss": -5.732348442077637, "global_step": 41520, "epoch": 988} {"train_loss": -5.724028587341309, "global_step": 41521, "epoch": 988} {"train_loss": -5.636090278625488, "global_step": 41522, "epoch": 988} {"train_loss": -5.662257194519043, "global_step": 41523, "epoch": 988} {"train_loss": -5.530529499053955, "global_step": 41524, "epoch": 988} {"train_loss": -5.537303924560547, "global_step": 41525, "epoch": 988} {"train_loss": -5.774328708648682, "global_step": 41526, "epoch": 988} {"train_loss": -5.630888938903809, "global_step": 41527, "epoch": 988} {"train_loss": -5.83421516418457, "global_step": 41528, "epoch": 988} {"train_loss": -5.769228935241699, "global_step": 41529, "epoch": 988} {"train_loss": -5.6565704345703125, "global_step": 41530, "epoch": 988} {"train_loss": -5.7013139724731445, "global_step": 41531, "epoch": 988} {"train_loss": -5.714930534362793, "global_step": 41532, "epoch": 988} {"train_loss": -5.544785499572754, "global_step": 41533, "epoch": 988} {"train_loss": -5.620674133300781, "global_step": 41534, "epoch": 988} {"train_loss": -5.758337020874023, "global_step": 41535, "epoch": 988} {"train_loss": -5.574041843414307, "global_step": 41536, "epoch": 988} {"train_loss": -5.646350156693232, "global_step": 41537, "epoch": 988, "val_loss": 65958.96875} {"train_loss": -5.724666118621826, "global_step": 41538, "epoch": 989} {"train_loss": -5.557497978210449, "global_step": 41539, "epoch": 989} {"train_loss": -5.650049209594727, "global_step": 41540, "epoch": 989} {"train_loss": -5.693141937255859, "global_step": 41541, "epoch": 989} {"train_loss": -5.600937843322754, "global_step": 41542, "epoch": 989} {"train_loss": -5.5258283615112305, "global_step": 41543, "epoch": 989} {"train_loss": -5.5033793449401855, "global_step": 41544, "epoch": 989} {"train_loss": -5.646434783935547, "global_step": 41545, "epoch": 989} {"train_loss": -5.698210716247559, "global_step": 41546, "epoch": 989} {"train_loss": -5.655149936676025, "global_step": 41547, "epoch": 989} {"train_loss": -5.636608123779297, "global_step": 41548, "epoch": 989} {"train_loss": -5.535860061645508, "global_step": 41549, "epoch": 989} {"train_loss": -5.686056137084961, "global_step": 41550, "epoch": 989} {"train_loss": -5.647974967956543, "global_step": 41551, "epoch": 989} {"train_loss": -5.594810485839844, "global_step": 41552, "epoch": 989} {"train_loss": -5.65208625793457, "global_step": 41553, "epoch": 989} {"train_loss": -5.611645698547363, "global_step": 41554, "epoch": 989} {"train_loss": -5.599420547485352, "global_step": 41555, "epoch": 989} {"train_loss": -5.679502487182617, "global_step": 41556, "epoch": 989} {"train_loss": -5.652351379394531, "global_step": 41557, "epoch": 989} {"train_loss": -5.6201653480529785, "global_step": 41558, "epoch": 989} {"train_loss": -5.661847114562988, "global_step": 41559, "epoch": 989} {"train_loss": -5.758828163146973, "global_step": 41560, "epoch": 989} {"train_loss": -5.616079330444336, "global_step": 41561, "epoch": 989} {"train_loss": -5.66558837890625, "global_step": 41562, "epoch": 989} {"train_loss": -5.727613925933838, "global_step": 41563, "epoch": 989} {"train_loss": -5.726984024047852, "global_step": 41564, "epoch": 989} {"train_loss": -5.711919784545898, "global_step": 41565, "epoch": 989} {"train_loss": -5.6729736328125, "global_step": 41566, "epoch": 989} {"train_loss": -5.594000816345215, "global_step": 41567, "epoch": 989} {"train_loss": -5.678079128265381, "global_step": 41568, "epoch": 989} {"train_loss": -5.583108901977539, "global_step": 41569, "epoch": 989} {"train_loss": -5.648187637329102, "global_step": 41570, "epoch": 989} {"train_loss": -5.658652305603027, "global_step": 41571, "epoch": 989} {"train_loss": -5.567844390869141, "global_step": 41572, "epoch": 989} {"train_loss": -5.700277328491211, "global_step": 41573, "epoch": 989} {"train_loss": -5.768547058105469, "global_step": 41574, "epoch": 989} {"train_loss": -5.732396602630615, "global_step": 41575, "epoch": 989} {"train_loss": -5.675404071807861, "global_step": 41576, "epoch": 989} {"train_loss": -5.6808247566223145, "global_step": 41577, "epoch": 989} {"train_loss": -5.795331954956055, "global_step": 41578, "epoch": 989} {"train_loss": -5.655901091439383, "global_step": 41579, "epoch": 989, "val_loss": 66274.390625} {"train_loss": -5.746164321899414, "global_step": 41580, "epoch": 990} {"train_loss": -5.684119701385498, "global_step": 41581, "epoch": 990} {"train_loss": -5.6119489669799805, "global_step": 41582, "epoch": 990} {"train_loss": -5.63197135925293, "global_step": 41583, "epoch": 990} {"train_loss": -5.5874409675598145, "global_step": 41584, "epoch": 990} {"train_loss": -5.6330342292785645, "global_step": 41585, "epoch": 990} {"train_loss": -5.663970947265625, "global_step": 41586, "epoch": 990} {"train_loss": -5.659735679626465, "global_step": 41587, "epoch": 990} {"train_loss": -5.470102787017822, "global_step": 41588, "epoch": 990} {"train_loss": -5.754506587982178, "global_step": 41589, "epoch": 990} {"train_loss": -5.587457656860352, "global_step": 41590, "epoch": 990} {"train_loss": -5.657308578491211, "global_step": 41591, "epoch": 990} {"train_loss": -5.771594047546387, "global_step": 41592, "epoch": 990} {"train_loss": -5.68906831741333, "global_step": 41593, "epoch": 990} {"train_loss": -5.643350124359131, "global_step": 41594, "epoch": 990} {"train_loss": -5.726795673370361, "global_step": 41595, "epoch": 990} {"train_loss": -5.626809120178223, "global_step": 41596, "epoch": 990} {"train_loss": -5.601572513580322, "global_step": 41597, "epoch": 990} {"train_loss": -5.572232246398926, "global_step": 41598, "epoch": 990} {"train_loss": -5.539229393005371, "global_step": 41599, "epoch": 990} {"train_loss": -5.7663254737854, "global_step": 41600, "epoch": 990} {"train_loss": -5.684209823608398, "global_step": 41601, "epoch": 990} {"train_loss": -5.61435604095459, "global_step": 41602, "epoch": 990} {"train_loss": -5.599963188171387, "global_step": 41603, "epoch": 990} {"train_loss": -5.688139915466309, "global_step": 41604, "epoch": 990} {"train_loss": -5.625792503356934, "global_step": 41605, "epoch": 990} {"train_loss": -5.6100544929504395, "global_step": 41606, "epoch": 990} {"train_loss": -5.6691179275512695, "global_step": 41607, "epoch": 990} {"train_loss": -5.563825607299805, "global_step": 41608, "epoch": 990} {"train_loss": -5.630707263946533, "global_step": 41609, "epoch": 990} {"train_loss": -5.719371795654297, "global_step": 41610, "epoch": 990} {"train_loss": -5.599020004272461, "global_step": 41611, "epoch": 990} {"train_loss": -5.717918395996094, "global_step": 41612, "epoch": 990} {"train_loss": -5.61472225189209, "global_step": 41613, "epoch": 990} {"train_loss": -5.516966819763184, "global_step": 41614, "epoch": 990} {"train_loss": -5.722782135009766, "global_step": 41615, "epoch": 990} {"train_loss": -5.598169326782227, "global_step": 41616, "epoch": 990} {"train_loss": -5.692996501922607, "global_step": 41617, "epoch": 990} {"train_loss": -5.571533203125, "global_step": 41618, "epoch": 990} {"train_loss": -5.598690032958984, "global_step": 41619, "epoch": 990} {"train_loss": -5.566765785217285, "global_step": 41620, "epoch": 990} {"train_loss": -5.635268551962716, "global_step": 41621, "epoch": 990, "val_loss": 66263.859375} {"train_loss": -5.655081748962402, "global_step": 41622, "epoch": 991} {"train_loss": -5.46619987487793, "global_step": 41623, "epoch": 991} {"train_loss": -5.485685348510742, "global_step": 41624, "epoch": 991} {"train_loss": -5.545627593994141, "global_step": 41625, "epoch": 991} {"train_loss": -5.413801193237305, "global_step": 41626, "epoch": 991} {"train_loss": -5.724483489990234, "global_step": 41627, "epoch": 991} {"train_loss": -5.381094932556152, "global_step": 41628, "epoch": 991} {"train_loss": -5.5540056228637695, "global_step": 41629, "epoch": 991} {"train_loss": -5.362024307250977, "global_step": 41630, "epoch": 991} {"train_loss": -5.652263641357422, "global_step": 41631, "epoch": 991} {"train_loss": -5.612203121185303, "global_step": 41632, "epoch": 991} {"train_loss": -5.63401985168457, "global_step": 41633, "epoch": 991} {"train_loss": -5.607288360595703, "global_step": 41634, "epoch": 991} {"train_loss": -5.5781402587890625, "global_step": 41635, "epoch": 991} {"train_loss": -5.505054473876953, "global_step": 41636, "epoch": 991} {"train_loss": -5.483696937561035, "global_step": 41637, "epoch": 991} {"train_loss": -5.615662574768066, "global_step": 41638, "epoch": 991} {"train_loss": -5.529402732849121, "global_step": 41639, "epoch": 991} {"train_loss": -5.617552757263184, "global_step": 41640, "epoch": 991} {"train_loss": -5.654860496520996, "global_step": 41641, "epoch": 991} {"train_loss": -5.643948554992676, "global_step": 41642, "epoch": 991} {"train_loss": -5.608463287353516, "global_step": 41643, "epoch": 991} {"train_loss": -5.6896209716796875, "global_step": 41644, "epoch": 991} {"train_loss": -5.715183258056641, "global_step": 41645, "epoch": 991} {"train_loss": -5.653614521026611, "global_step": 41646, "epoch": 991} {"train_loss": -5.695134162902832, "global_step": 41647, "epoch": 991} {"train_loss": -5.702526569366455, "global_step": 41648, "epoch": 991} {"train_loss": -5.738476753234863, "global_step": 41649, "epoch": 991} {"train_loss": -5.672423362731934, "global_step": 41650, "epoch": 991} {"train_loss": -5.625647068023682, "global_step": 41651, "epoch": 991} {"train_loss": -5.642316818237305, "global_step": 41652, "epoch": 991} {"train_loss": -5.6870880126953125, "global_step": 41653, "epoch": 991} {"train_loss": -5.650718688964844, "global_step": 41654, "epoch": 991} {"train_loss": -5.730865478515625, "global_step": 41655, "epoch": 991} {"train_loss": -5.538507461547852, "global_step": 41656, "epoch": 991} {"train_loss": -5.6070332527160645, "global_step": 41657, "epoch": 991} {"train_loss": -5.532256126403809, "global_step": 41658, "epoch": 991} {"train_loss": -5.6698899269104, "global_step": 41659, "epoch": 991} {"train_loss": -5.714260101318359, "global_step": 41660, "epoch": 991} {"train_loss": -5.651174068450928, "global_step": 41661, "epoch": 991} {"train_loss": -5.682895183563232, "global_step": 41662, "epoch": 991} {"train_loss": -5.611567542666481, "global_step": 41663, "epoch": 991, "val_loss": 65966.609375} {"train_loss": -5.698166847229004, "global_step": 41664, "epoch": 992} {"train_loss": -5.72941780090332, "global_step": 41665, "epoch": 992} {"train_loss": -5.580877304077148, "global_step": 41666, "epoch": 992} {"train_loss": -5.694790840148926, "global_step": 41667, "epoch": 992} {"train_loss": -5.586235046386719, "global_step": 41668, "epoch": 992} {"train_loss": -5.556146621704102, "global_step": 41669, "epoch": 992} {"train_loss": -5.521116256713867, "global_step": 41670, "epoch": 992} {"train_loss": -5.618788719177246, "global_step": 41671, "epoch": 992} {"train_loss": -5.698774814605713, "global_step": 41672, "epoch": 992} {"train_loss": -5.620527267456055, "global_step": 41673, "epoch": 992} {"train_loss": -5.675428867340088, "global_step": 41674, "epoch": 992} {"train_loss": -5.619483947753906, "global_step": 41675, "epoch": 992} {"train_loss": -5.704868316650391, "global_step": 41676, "epoch": 992} {"train_loss": -5.699930191040039, "global_step": 41677, "epoch": 992} {"train_loss": -5.700417518615723, "global_step": 41678, "epoch": 992} {"train_loss": -5.538873672485352, "global_step": 41679, "epoch": 992} {"train_loss": -5.705609321594238, "global_step": 41680, "epoch": 992} {"train_loss": -5.64368200302124, "global_step": 41681, "epoch": 992} {"train_loss": -5.711699962615967, "global_step": 41682, "epoch": 992} {"train_loss": -5.706141471862793, "global_step": 41683, "epoch": 992} {"train_loss": -5.721374034881592, "global_step": 41684, "epoch": 992} {"train_loss": -5.6959147453308105, "global_step": 41685, "epoch": 992} {"train_loss": -5.663697242736816, "global_step": 41686, "epoch": 992} {"train_loss": -5.587308883666992, "global_step": 41687, "epoch": 992} {"train_loss": -5.635223388671875, "global_step": 41688, "epoch": 992} {"train_loss": -5.664340972900391, "global_step": 41689, "epoch": 992} {"train_loss": -5.611804008483887, "global_step": 41690, "epoch": 992} {"train_loss": -5.713799476623535, "global_step": 41691, "epoch": 992} {"train_loss": -5.703436374664307, "global_step": 41692, "epoch": 992} {"train_loss": -5.824586868286133, "global_step": 41693, "epoch": 992} {"train_loss": -5.6361284255981445, "global_step": 41694, "epoch": 992} {"train_loss": -5.762719631195068, "global_step": 41695, "epoch": 992} {"train_loss": -5.579869270324707, "global_step": 41696, "epoch": 992} {"train_loss": -5.68257474899292, "global_step": 41697, "epoch": 992} {"train_loss": -5.604991912841797, "global_step": 41698, "epoch": 992} {"train_loss": -5.652712821960449, "global_step": 41699, "epoch": 992} {"train_loss": -5.6560492515563965, "global_step": 41700, "epoch": 992} {"train_loss": -5.694687843322754, "global_step": 41701, "epoch": 992} {"train_loss": -5.673948764801025, "global_step": 41702, "epoch": 992} {"train_loss": -5.7623701095581055, "global_step": 41703, "epoch": 992} {"train_loss": -5.705261707305908, "global_step": 41704, "epoch": 992} {"train_loss": -5.664199851808094, "global_step": 41705, "epoch": 992, "val_loss": 65894.8046875} {"train_loss": -5.633670330047607, "global_step": 41706, "epoch": 993} {"train_loss": -5.658195495605469, "global_step": 41707, "epoch": 993} {"train_loss": -5.650553226470947, "global_step": 41708, "epoch": 993} {"train_loss": -5.709246635437012, "global_step": 41709, "epoch": 993} {"train_loss": -5.5671186447143555, "global_step": 41710, "epoch": 993} {"train_loss": -5.611080169677734, "global_step": 41711, "epoch": 993} {"train_loss": -5.553653717041016, "global_step": 41712, "epoch": 993} {"train_loss": -5.671047210693359, "global_step": 41713, "epoch": 993} {"train_loss": -5.789769172668457, "global_step": 41714, "epoch": 993} {"train_loss": -5.640839576721191, "global_step": 41715, "epoch": 993} {"train_loss": -5.642351150512695, "global_step": 41716, "epoch": 993} {"train_loss": -5.726287841796875, "global_step": 41717, "epoch": 993} {"train_loss": -5.638713836669922, "global_step": 41718, "epoch": 993} {"train_loss": -5.66757869720459, "global_step": 41719, "epoch": 993} {"train_loss": -5.716910362243652, "global_step": 41720, "epoch": 993} {"train_loss": -5.623464107513428, "global_step": 41721, "epoch": 993} {"train_loss": -5.790848731994629, "global_step": 41722, "epoch": 993} {"train_loss": -5.7601165771484375, "global_step": 41723, "epoch": 993} {"train_loss": -5.683636665344238, "global_step": 41724, "epoch": 993} {"train_loss": -5.740323066711426, "global_step": 41725, "epoch": 993} {"train_loss": -5.736782073974609, "global_step": 41726, "epoch": 993} {"train_loss": -5.743905067443848, "global_step": 41727, "epoch": 993} {"train_loss": -5.734177589416504, "global_step": 41728, "epoch": 993} {"train_loss": -5.612211227416992, "global_step": 41729, "epoch": 993} {"train_loss": -5.803328514099121, "global_step": 41730, "epoch": 993} {"train_loss": -5.587637901306152, "global_step": 41731, "epoch": 993} {"train_loss": -5.624693870544434, "global_step": 41732, "epoch": 993} {"train_loss": -5.7237443923950195, "global_step": 41733, "epoch": 993} {"train_loss": -5.519852638244629, "global_step": 41734, "epoch": 993} {"train_loss": -5.551699638366699, "global_step": 41735, "epoch": 993} {"train_loss": -5.558858871459961, "global_step": 41736, "epoch": 993} {"train_loss": -5.729281425476074, "global_step": 41737, "epoch": 993} {"train_loss": -5.69106388092041, "global_step": 41738, "epoch": 993} {"train_loss": -5.67877197265625, "global_step": 41739, "epoch": 993} {"train_loss": -5.80693244934082, "global_step": 41740, "epoch": 993} {"train_loss": -5.567490100860596, "global_step": 41741, "epoch": 993} {"train_loss": -5.7616682052612305, "global_step": 41742, "epoch": 993} {"train_loss": -5.472734451293945, "global_step": 41743, "epoch": 993} {"train_loss": -5.801338195800781, "global_step": 41744, "epoch": 993} {"train_loss": -5.692305564880371, "global_step": 41745, "epoch": 993} {"train_loss": -5.698938846588135, "global_step": 41746, "epoch": 993} {"train_loss": -5.67088186173212, "global_step": 41747, "epoch": 993, "val_loss": 66184.90625} {"train_loss": -5.647286891937256, "global_step": 41748, "epoch": 994} {"train_loss": -5.6414079666137695, "global_step": 41749, "epoch": 994} {"train_loss": -5.487421989440918, "global_step": 41750, "epoch": 994} {"train_loss": -5.594612121582031, "global_step": 41751, "epoch": 994} {"train_loss": -5.690084457397461, "global_step": 41752, "epoch": 994} {"train_loss": -5.713693618774414, "global_step": 41753, "epoch": 994} {"train_loss": -5.526925086975098, "global_step": 41754, "epoch": 994} {"train_loss": -5.7454118728637695, "global_step": 41755, "epoch": 994} {"train_loss": -5.586269378662109, "global_step": 41756, "epoch": 994} {"train_loss": -5.7058916091918945, "global_step": 41757, "epoch": 994} {"train_loss": -5.703967094421387, "global_step": 41758, "epoch": 994} {"train_loss": -5.51353120803833, "global_step": 41759, "epoch": 994} {"train_loss": -5.637355804443359, "global_step": 41760, "epoch": 994} {"train_loss": -5.681195259094238, "global_step": 41761, "epoch": 994} {"train_loss": -5.555010795593262, "global_step": 41762, "epoch": 994} {"train_loss": -5.596687316894531, "global_step": 41763, "epoch": 994} {"train_loss": -5.551158428192139, "global_step": 41764, "epoch": 994} {"train_loss": -5.715689659118652, "global_step": 41765, "epoch": 994} {"train_loss": -5.531716346740723, "global_step": 41766, "epoch": 994} {"train_loss": -5.546294212341309, "global_step": 41767, "epoch": 994} {"train_loss": -5.682182312011719, "global_step": 41768, "epoch": 994} {"train_loss": -5.695060729980469, "global_step": 41769, "epoch": 994} {"train_loss": -5.698173999786377, "global_step": 41770, "epoch": 994} {"train_loss": -5.624824523925781, "global_step": 41771, "epoch": 994} {"train_loss": -5.732913970947266, "global_step": 41772, "epoch": 994} {"train_loss": -5.7580060958862305, "global_step": 41773, "epoch": 994} {"train_loss": -5.6570329666137695, "global_step": 41774, "epoch": 994} {"train_loss": -5.794627666473389, "global_step": 41775, "epoch": 994} {"train_loss": -5.783947944641113, "global_step": 41776, "epoch": 994} {"train_loss": -5.7142744064331055, "global_step": 41777, "epoch": 994} {"train_loss": -5.652500152587891, "global_step": 41778, "epoch": 994} {"train_loss": -5.671049118041992, "global_step": 41779, "epoch": 994} {"train_loss": -5.778002738952637, "global_step": 41780, "epoch": 994} {"train_loss": -5.571557998657227, "global_step": 41781, "epoch": 994} {"train_loss": -5.7046403884887695, "global_step": 41782, "epoch": 994} {"train_loss": -5.532143592834473, "global_step": 41783, "epoch": 994} {"train_loss": -5.639251708984375, "global_step": 41784, "epoch": 994} {"train_loss": -5.53678560256958, "global_step": 41785, "epoch": 994} {"train_loss": -5.56929874420166, "global_step": 41786, "epoch": 994} {"train_loss": -5.586185455322266, "global_step": 41787, "epoch": 994} {"train_loss": -5.718451976776123, "global_step": 41788, "epoch": 994} {"train_loss": -5.64653518086388, "global_step": 41789, "epoch": 994, "val_loss": 66399.0390625} {"train_loss": -5.622884273529053, "global_step": 41790, "epoch": 995} {"train_loss": -5.622201919555664, "global_step": 41791, "epoch": 995} {"train_loss": -5.596225261688232, "global_step": 41792, "epoch": 995} {"train_loss": -5.555488586425781, "global_step": 41793, "epoch": 995} {"train_loss": -5.564774513244629, "global_step": 41794, "epoch": 995} {"train_loss": -5.6378960609436035, "global_step": 41795, "epoch": 995} {"train_loss": -5.577826023101807, "global_step": 41796, "epoch": 995} {"train_loss": -5.560582160949707, "global_step": 41797, "epoch": 995} {"train_loss": -5.613945007324219, "global_step": 41798, "epoch": 995} {"train_loss": -5.677587509155273, "global_step": 41799, "epoch": 995} {"train_loss": -5.739847183227539, "global_step": 41800, "epoch": 995} {"train_loss": -5.735411167144775, "global_step": 41801, "epoch": 995} {"train_loss": -5.623055934906006, "global_step": 41802, "epoch": 995} {"train_loss": -5.760010719299316, "global_step": 41803, "epoch": 995} {"train_loss": -5.78262186050415, "global_step": 41804, "epoch": 995} {"train_loss": -5.668662071228027, "global_step": 41805, "epoch": 995} {"train_loss": -5.608181476593018, "global_step": 41806, "epoch": 995} {"train_loss": -5.699023246765137, "global_step": 41807, "epoch": 995} {"train_loss": -5.585930824279785, "global_step": 41808, "epoch": 995} {"train_loss": -5.5144195556640625, "global_step": 41809, "epoch": 995} {"train_loss": -5.657731056213379, "global_step": 41810, "epoch": 995} {"train_loss": -5.631366729736328, "global_step": 41811, "epoch": 995} {"train_loss": -5.584170341491699, "global_step": 41812, "epoch": 995} {"train_loss": -5.715707778930664, "global_step": 41813, "epoch": 995} {"train_loss": -5.655255317687988, "global_step": 41814, "epoch": 995} {"train_loss": -5.63348913192749, "global_step": 41815, "epoch": 995} {"train_loss": -5.822956085205078, "global_step": 41816, "epoch": 995} {"train_loss": -5.45960807800293, "global_step": 41817, "epoch": 995} {"train_loss": -5.567296981811523, "global_step": 41818, "epoch": 995} {"train_loss": -5.508326530456543, "global_step": 41819, "epoch": 995} {"train_loss": -5.716065406799316, "global_step": 41820, "epoch": 995} {"train_loss": -5.6873321533203125, "global_step": 41821, "epoch": 995} {"train_loss": -5.525942802429199, "global_step": 41822, "epoch": 995} {"train_loss": -5.508425712585449, "global_step": 41823, "epoch": 995} {"train_loss": -5.719091415405273, "global_step": 41824, "epoch": 995} {"train_loss": -5.610783576965332, "global_step": 41825, "epoch": 995} {"train_loss": -5.601014137268066, "global_step": 41826, "epoch": 995} {"train_loss": -5.6660966873168945, "global_step": 41827, "epoch": 995} {"train_loss": -5.612254619598389, "global_step": 41828, "epoch": 995} {"train_loss": -5.628202438354492, "global_step": 41829, "epoch": 995} {"train_loss": -5.569473743438721, "global_step": 41830, "epoch": 995} {"train_loss": -5.631049417314076, "global_step": 41831, "epoch": 995, "val_loss": 67081.28125} {"train_loss": -5.546623706817627, "global_step": 41832, "epoch": 996} {"train_loss": -5.6288933753967285, "global_step": 41833, "epoch": 996} {"train_loss": -5.5672526359558105, "global_step": 41834, "epoch": 996} {"train_loss": -5.483707427978516, "global_step": 41835, "epoch": 996} {"train_loss": -5.600481033325195, "global_step": 41836, "epoch": 996} {"train_loss": -5.5950469970703125, "global_step": 41837, "epoch": 996} {"train_loss": -5.622729301452637, "global_step": 41838, "epoch": 996} {"train_loss": -5.61549186706543, "global_step": 41839, "epoch": 996} {"train_loss": -5.6677141189575195, "global_step": 41840, "epoch": 996} {"train_loss": -5.726714134216309, "global_step": 41841, "epoch": 996} {"train_loss": -5.605067253112793, "global_step": 41842, "epoch": 996} {"train_loss": -5.7161030769348145, "global_step": 41843, "epoch": 996} {"train_loss": -5.625628471374512, "global_step": 41844, "epoch": 996} {"train_loss": -5.687750816345215, "global_step": 41845, "epoch": 996} {"train_loss": -5.634709358215332, "global_step": 41846, "epoch": 996} {"train_loss": -5.643959999084473, "global_step": 41847, "epoch": 996} {"train_loss": -5.574049949645996, "global_step": 41848, "epoch": 996} {"train_loss": -5.666009902954102, "global_step": 41849, "epoch": 996} {"train_loss": -5.667281150817871, "global_step": 41850, "epoch": 996} {"train_loss": -5.544105529785156, "global_step": 41851, "epoch": 996} {"train_loss": -5.722372055053711, "global_step": 41852, "epoch": 996} {"train_loss": -5.634322643280029, "global_step": 41853, "epoch": 996} {"train_loss": -5.635496139526367, "global_step": 41854, "epoch": 996} {"train_loss": -5.669855117797852, "global_step": 41855, "epoch": 996} {"train_loss": -5.610958576202393, "global_step": 41856, "epoch": 996} {"train_loss": -5.590394020080566, "global_step": 41857, "epoch": 996} {"train_loss": -5.578380584716797, "global_step": 41858, "epoch": 996} {"train_loss": -5.513652324676514, "global_step": 41859, "epoch": 996} {"train_loss": -5.610385417938232, "global_step": 41860, "epoch": 996} {"train_loss": -5.663262367248535, "global_step": 41861, "epoch": 996} {"train_loss": -5.512211799621582, "global_step": 41862, "epoch": 996} {"train_loss": -5.6292243003845215, "global_step": 41863, "epoch": 996} {"train_loss": -5.673211097717285, "global_step": 41864, "epoch": 996} {"train_loss": -5.710905075073242, "global_step": 41865, "epoch": 996} {"train_loss": -5.660652160644531, "global_step": 41866, "epoch": 996} {"train_loss": -5.5660080909729, "global_step": 41867, "epoch": 996} {"train_loss": -5.738517761230469, "global_step": 41868, "epoch": 996} {"train_loss": -5.603743553161621, "global_step": 41869, "epoch": 996} {"train_loss": -5.754545211791992, "global_step": 41870, "epoch": 996} {"train_loss": -5.683140277862549, "global_step": 41871, "epoch": 996} {"train_loss": -5.701010704040527, "global_step": 41872, "epoch": 996} {"train_loss": -5.631300585610526, "global_step": 41873, "epoch": 996, "val_loss": 66165.3046875} {"train_loss": -5.56728458404541, "global_step": 41874, "epoch": 997} {"train_loss": -5.576169013977051, "global_step": 41875, "epoch": 997} {"train_loss": -5.687829971313477, "global_step": 41876, "epoch": 997} {"train_loss": -5.695125579833984, "global_step": 41877, "epoch": 997} {"train_loss": -5.751827716827393, "global_step": 41878, "epoch": 997} {"train_loss": -5.653491973876953, "global_step": 41879, "epoch": 997} {"train_loss": -5.662628173828125, "global_step": 41880, "epoch": 997} {"train_loss": -5.657506942749023, "global_step": 41881, "epoch": 997} {"train_loss": -5.674018859863281, "global_step": 41882, "epoch": 997} {"train_loss": -5.69491720199585, "global_step": 41883, "epoch": 997} {"train_loss": -5.701501846313477, "global_step": 41884, "epoch": 997} {"train_loss": -5.650134086608887, "global_step": 41885, "epoch": 997} {"train_loss": -5.5630083084106445, "global_step": 41886, "epoch": 997} {"train_loss": -5.807927131652832, "global_step": 41887, "epoch": 997} {"train_loss": -5.696562767028809, "global_step": 41888, "epoch": 997} {"train_loss": -5.602212905883789, "global_step": 41889, "epoch": 997} {"train_loss": -5.56996488571167, "global_step": 41890, "epoch": 997} {"train_loss": -5.6488800048828125, "global_step": 41891, "epoch": 997} {"train_loss": -5.614290237426758, "global_step": 41892, "epoch": 997} {"train_loss": -5.620026588439941, "global_step": 41893, "epoch": 997} {"train_loss": -5.616997241973877, "global_step": 41894, "epoch": 997} {"train_loss": -5.601363658905029, "global_step": 41895, "epoch": 997} {"train_loss": -5.503574371337891, "global_step": 41896, "epoch": 997} {"train_loss": -5.691360950469971, "global_step": 41897, "epoch": 997} {"train_loss": -5.620368957519531, "global_step": 41898, "epoch": 997} {"train_loss": -5.547048568725586, "global_step": 41899, "epoch": 997} {"train_loss": -5.789122581481934, "global_step": 41900, "epoch": 997} {"train_loss": -5.5337090492248535, "global_step": 41901, "epoch": 997} {"train_loss": -5.668304443359375, "global_step": 41902, "epoch": 997} {"train_loss": -5.526890277862549, "global_step": 41903, "epoch": 997} {"train_loss": -5.554033279418945, "global_step": 41904, "epoch": 997} {"train_loss": -5.472047328948975, "global_step": 41905, "epoch": 997} {"train_loss": -5.674358367919922, "global_step": 41906, "epoch": 997} {"train_loss": -5.670208930969238, "global_step": 41907, "epoch": 997} {"train_loss": -5.613422393798828, "global_step": 41908, "epoch": 997} {"train_loss": -5.432060241699219, "global_step": 41909, "epoch": 997} {"train_loss": -5.500910758972168, "global_step": 41910, "epoch": 997} {"train_loss": -5.574026107788086, "global_step": 41911, "epoch": 997} {"train_loss": -5.549130916595459, "global_step": 41912, "epoch": 997} {"train_loss": -5.7136616706848145, "global_step": 41913, "epoch": 997} {"train_loss": -5.488795757293701, "global_step": 41914, "epoch": 997} {"train_loss": -5.619357835678827, "global_step": 41915, "epoch": 997, "val_loss": 66196.203125} {"train_loss": -5.625669479370117, "global_step": 41916, "epoch": 998} {"train_loss": -5.741628646850586, "global_step": 41917, "epoch": 998} {"train_loss": -5.598729610443115, "global_step": 41918, "epoch": 998} {"train_loss": -5.625359058380127, "global_step": 41919, "epoch": 998} {"train_loss": -5.692230224609375, "global_step": 41920, "epoch": 998} {"train_loss": -5.557221412658691, "global_step": 41921, "epoch": 998} {"train_loss": -5.503849983215332, "global_step": 41922, "epoch": 998} {"train_loss": -5.642183780670166, "global_step": 41923, "epoch": 998} {"train_loss": -5.595775127410889, "global_step": 41924, "epoch": 998} {"train_loss": -5.572736740112305, "global_step": 41925, "epoch": 998} {"train_loss": -5.696339130401611, "global_step": 41926, "epoch": 998} {"train_loss": -5.600667476654053, "global_step": 41927, "epoch": 998} {"train_loss": -5.638650894165039, "global_step": 41928, "epoch": 998} {"train_loss": -5.6749348640441895, "global_step": 41929, "epoch": 998} {"train_loss": -5.4873127937316895, "global_step": 41930, "epoch": 998} {"train_loss": -5.702936172485352, "global_step": 41931, "epoch": 998} {"train_loss": -5.6944427490234375, "global_step": 41932, "epoch": 998} {"train_loss": -5.6316962242126465, "global_step": 41933, "epoch": 998} {"train_loss": -5.632916450500488, "global_step": 41934, "epoch": 998} {"train_loss": -5.639423370361328, "global_step": 41935, "epoch": 998} {"train_loss": -5.608182430267334, "global_step": 41936, "epoch": 998} {"train_loss": -5.605863094329834, "global_step": 41937, "epoch": 998} {"train_loss": -5.589320659637451, "global_step": 41938, "epoch": 998} {"train_loss": -5.59611701965332, "global_step": 41939, "epoch": 998} {"train_loss": -5.564010143280029, "global_step": 41940, "epoch": 998} {"train_loss": -5.70054292678833, "global_step": 41941, "epoch": 998} {"train_loss": -5.543107032775879, "global_step": 41942, "epoch": 998} {"train_loss": -5.739273548126221, "global_step": 41943, "epoch": 998} {"train_loss": -5.721985816955566, "global_step": 41944, "epoch": 998} {"train_loss": -5.631783485412598, "global_step": 41945, "epoch": 998} {"train_loss": -5.569755554199219, "global_step": 41946, "epoch": 998} {"train_loss": -5.633572578430176, "global_step": 41947, "epoch": 998} {"train_loss": -5.693272113800049, "global_step": 41948, "epoch": 998} {"train_loss": -5.550710678100586, "global_step": 41949, "epoch": 998} {"train_loss": -5.60219144821167, "global_step": 41950, "epoch": 998} {"train_loss": -5.681387424468994, "global_step": 41951, "epoch": 998} {"train_loss": -5.595448017120361, "global_step": 41952, "epoch": 998} {"train_loss": -5.6330718994140625, "global_step": 41953, "epoch": 998} {"train_loss": -5.703577041625977, "global_step": 41954, "epoch": 998} {"train_loss": -5.6240315437316895, "global_step": 41955, "epoch": 998} {"train_loss": -5.663589954376221, "global_step": 41956, "epoch": 998} {"train_loss": -5.631523972465878, "global_step": 41957, "epoch": 998, "val_loss": 66052.125} {"train_loss": -5.671879768371582, "global_step": 41958, "epoch": 999} {"train_loss": -5.612658500671387, "global_step": 41959, "epoch": 999} {"train_loss": -5.571769714355469, "global_step": 41960, "epoch": 999} {"train_loss": -5.69721794128418, "global_step": 41961, "epoch": 999} {"train_loss": -5.66797399520874, "global_step": 41962, "epoch": 999} {"train_loss": -5.63215446472168, "global_step": 41963, "epoch": 999} {"train_loss": -5.631415367126465, "global_step": 41964, "epoch": 999} {"train_loss": -5.675936222076416, "global_step": 41965, "epoch": 999} {"train_loss": -5.641158103942871, "global_step": 41966, "epoch": 999} {"train_loss": -5.662724494934082, "global_step": 41967, "epoch": 999} {"train_loss": -5.667370796203613, "global_step": 41968, "epoch": 999} {"train_loss": -5.565019607543945, "global_step": 41969, "epoch": 999} {"train_loss": -5.712579250335693, "global_step": 41970, "epoch": 999} {"train_loss": -5.840129375457764, "global_step": 41971, "epoch": 999} {"train_loss": -5.601284027099609, "global_step": 41972, "epoch": 999} {"train_loss": -5.650673866271973, "global_step": 41973, "epoch": 999} {"train_loss": -5.546743392944336, "global_step": 41974, "epoch": 999} {"train_loss": -5.611383438110352, "global_step": 41975, "epoch": 999} {"train_loss": -5.746620178222656, "global_step": 41976, "epoch": 999} {"train_loss": -5.655104160308838, "global_step": 41977, "epoch": 999} {"train_loss": -5.6877360343933105, "global_step": 41978, "epoch": 999} {"train_loss": -5.710118293762207, "global_step": 41979, "epoch": 999} {"train_loss": -5.663741111755371, "global_step": 41980, "epoch": 999} {"train_loss": -5.555586814880371, "global_step": 41981, "epoch": 999} {"train_loss": -5.612378120422363, "global_step": 41982, "epoch": 999} {"train_loss": -5.633432388305664, "global_step": 41983, "epoch": 999} {"train_loss": -5.774604320526123, "global_step": 41984, "epoch": 999} {"train_loss": -5.645747184753418, "global_step": 41985, "epoch": 999} {"train_loss": -5.598549842834473, "global_step": 41986, "epoch": 999} {"train_loss": -5.7030348777771, "global_step": 41987, "epoch": 999} {"train_loss": -5.653313636779785, "global_step": 41988, "epoch": 999} {"train_loss": -5.573427200317383, "global_step": 41989, "epoch": 999} {"train_loss": -5.428976058959961, "global_step": 41990, "epoch": 999} {"train_loss": -5.600879192352295, "global_step": 41991, "epoch": 999} {"train_loss": -5.600013732910156, "global_step": 41992, "epoch": 999} {"train_loss": -5.514521598815918, "global_step": 41993, "epoch": 999} {"train_loss": -5.4131574630737305, "global_step": 41994, "epoch": 999} {"train_loss": -5.603611469268799, "global_step": 41995, "epoch": 999} {"train_loss": -5.369790077209473, "global_step": 41996, "epoch": 999} {"train_loss": -5.498211860656738, "global_step": 41997, "epoch": 999} {"train_loss": -5.471722602844238, "global_step": 41998, "epoch": 999} {"train_loss": -5.61629969733102, "global_step": 41999, "epoch": 999, "val_loss": 66885.0859375} {"train_loss": -5.57214879989624, "global_step": 42000, "epoch": 1000} {"train_loss": -5.571628570556641, "global_step": 42001, "epoch": 1000} {"train_loss": -5.503711700439453, "global_step": 42002, "epoch": 1000} {"train_loss": -5.734126567840576, "global_step": 42003, "epoch": 1000} {"train_loss": -5.668548583984375, "global_step": 42004, "epoch": 1000} {"train_loss": -5.549800872802734, "global_step": 42005, "epoch": 1000} {"train_loss": -5.614109516143799, "global_step": 42006, "epoch": 1000} {"train_loss": -5.793137073516846, "global_step": 42007, "epoch": 1000} {"train_loss": -5.683224201202393, "global_step": 42008, "epoch": 1000} {"train_loss": -5.7149529457092285, "global_step": 42009, "epoch": 1000} {"train_loss": -5.678748607635498, "global_step": 42010, "epoch": 1000} {"train_loss": -5.581836700439453, "global_step": 42011, "epoch": 1000} {"train_loss": -5.418096542358398, "global_step": 42012, "epoch": 1000} {"train_loss": -5.508195877075195, "global_step": 42013, "epoch": 1000} {"train_loss": -5.538099765777588, "global_step": 42014, "epoch": 1000} {"train_loss": -5.638447284698486, "global_step": 42015, "epoch": 1000} {"train_loss": -5.561581611633301, "global_step": 42016, "epoch": 1000} {"train_loss": -5.577864646911621, "global_step": 42017, "epoch": 1000} {"train_loss": -5.582242012023926, "global_step": 42018, "epoch": 1000} {"train_loss": -5.559394836425781, "global_step": 42019, "epoch": 1000} {"train_loss": -5.63330078125, "global_step": 42020, "epoch": 1000} {"train_loss": -5.551115989685059, "global_step": 42021, "epoch": 1000} {"train_loss": -5.622275352478027, "global_step": 42022, "epoch": 1000} {"train_loss": -5.555582046508789, "global_step": 42023, "epoch": 1000} {"train_loss": -5.63004207611084, "global_step": 42024, "epoch": 1000} {"train_loss": -5.630096435546875, "global_step": 42025, "epoch": 1000} {"train_loss": -5.655087471008301, "global_step": 42026, "epoch": 1000} {"train_loss": -5.696043968200684, "global_step": 42027, "epoch": 1000} {"train_loss": -5.686095237731934, "global_step": 42028, "epoch": 1000} {"train_loss": -5.7336578369140625, "global_step": 42029, "epoch": 1000} {"train_loss": -5.658209800720215, "global_step": 42030, "epoch": 1000} {"train_loss": -5.621466636657715, "global_step": 42031, "epoch": 1000} {"train_loss": -5.825878620147705, "global_step": 42032, "epoch": 1000} {"train_loss": -5.591448783874512, "global_step": 42033, "epoch": 1000} {"train_loss": -5.61134672164917, "global_step": 42034, "epoch": 1000} {"train_loss": -5.583535194396973, "global_step": 42035, "epoch": 1000} {"train_loss": -5.667490482330322, "global_step": 42036, "epoch": 1000} {"train_loss": -5.634070873260498, "global_step": 42037, "epoch": 1000} {"train_loss": -5.713666915893555, "global_step": 42038, "epoch": 1000} {"train_loss": -5.631422996520996, "global_step": 42039, "epoch": 1000} {"train_loss": -5.639187812805176, "global_step": 42040, "epoch": 1000} {"train_loss": -5.622869026093256, "global_step": 42041, "epoch": 1000, "train/sim_max_reward_0": 0.7501529609888488, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.7050160238601118, "train/sim_max_reward_3": 0.45579064823237775, "train/sim_max_reward_4": 0.41639245106263095, "train/sim_max_reward_5": 0.9028656832082388, "test/sim_max_reward_4400000": 0.356632199248939, "test/sim_max_reward_4400001": 0.7829248089235461, "test/sim_max_reward_4400002": 0.40945880727407485, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.18743850778584933, "test/sim_max_reward_4400005": 0.15972855863526864, "test/sim_max_reward_4400006": 0.33490761287371046, "test/sim_max_reward_4400007": 0.12821632467891955, "test/sim_max_reward_4400008": 0.31758433942237646, "test/sim_max_reward_4400009": 0.8992319945402828, "test/sim_max_reward_4400010": 0.781315646931383, "test/sim_max_reward_4400011": 0.22049559824301648, "test/sim_max_reward_4400012": 0.14520530304279894, "test/sim_max_reward_4400013": 0.7219872955352375, "test/sim_max_reward_4400014": 0.15470785496220776, "test/sim_max_reward_4400015": 0.3293224204335161, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.37485237901713875, "test/sim_max_reward_4400019": 0.0009749247068106374, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.33719052994629517, "test/sim_max_reward_4400023": 0.2575014902023243, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.19228633464567474, "test/sim_max_reward_4400026": 0.10692786151496465, "test/sim_max_reward_4400027": 0.032216258345217824, "test/sim_max_reward_4400028": 0.44946334750700095, "test/sim_max_reward_4400029": 0.4671489864687221, "test/sim_max_reward_4400030": 0.3227867006356216, "test/sim_max_reward_4400031": 0.24512245389903006, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.19618912118613593, "test/sim_max_reward_4400034": 0.37443131462128904, "test/sim_max_reward_4400035": 0.36391940202226736, "test/sim_max_reward_4400036": 0.7099384040520915, "test/sim_max_reward_4400037": 0.35027392909456057, "test/sim_max_reward_4400038": 0.4702342820235371, "test/sim_max_reward_4400039": 0.7181184067617008, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.3662281751842475, "test/sim_max_reward_4400042": 0.01414383563883493, "test/sim_max_reward_4400043": 0.01961272717522902, "test/sim_max_reward_4400044": 0.34511113121486897, "test/sim_max_reward_4400045": 0.6983301011242604, "test/sim_max_reward_4400046": 0.7746151116999763, "test/sim_max_reward_4400047": 0.9088492153837551, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.23841769151674838, "train/mean_score": 0.5384822080956678, "test/mean_score": 0.31329281271402204, "val_loss": 66422.4609375} {"train_loss": -5.562565326690674, "global_step": 42042, "epoch": 1001} {"train_loss": -5.663076400756836, "global_step": 42043, "epoch": 1001} {"train_loss": -5.689709663391113, "global_step": 42044, "epoch": 1001} {"train_loss": -5.629955291748047, "global_step": 42045, "epoch": 1001} {"train_loss": -5.702389717102051, "global_step": 42046, "epoch": 1001} {"train_loss": -5.529590606689453, "global_step": 42047, "epoch": 1001} {"train_loss": -5.717675685882568, "global_step": 42048, "epoch": 1001} {"train_loss": -5.748427391052246, "global_step": 42049, "epoch": 1001} {"train_loss": -5.55897331237793, "global_step": 42050, "epoch": 1001} {"train_loss": -5.6384687423706055, "global_step": 42051, "epoch": 1001} {"train_loss": -5.704977512359619, "global_step": 42052, "epoch": 1001} {"train_loss": -5.755795955657959, "global_step": 42053, "epoch": 1001} {"train_loss": -5.6973419189453125, "global_step": 42054, "epoch": 1001} {"train_loss": -5.643269062042236, "global_step": 42055, "epoch": 1001} {"train_loss": -5.70503044128418, "global_step": 42056, "epoch": 1001} {"train_loss": -5.524035930633545, "global_step": 42057, "epoch": 1001} {"train_loss": -5.624512195587158, "global_step": 42058, "epoch": 1001} {"train_loss": -5.817122459411621, "global_step": 42059, "epoch": 1001} {"train_loss": -5.690756797790527, "global_step": 42060, "epoch": 1001} {"train_loss": -5.612737655639648, "global_step": 42061, "epoch": 1001} {"train_loss": -5.741222381591797, "global_step": 42062, "epoch": 1001} {"train_loss": -5.550443172454834, "global_step": 42063, "epoch": 1001} {"train_loss": -5.579477310180664, "global_step": 42064, "epoch": 1001} {"train_loss": -5.624900817871094, "global_step": 42065, "epoch": 1001} {"train_loss": -5.725923538208008, "global_step": 42066, "epoch": 1001} {"train_loss": -5.5956621170043945, "global_step": 42067, "epoch": 1001} {"train_loss": -5.634674072265625, "global_step": 42068, "epoch": 1001} {"train_loss": -5.7014479637146, "global_step": 42069, "epoch": 1001} {"train_loss": -5.618127822875977, "global_step": 42070, "epoch": 1001} {"train_loss": -5.666360855102539, "global_step": 42071, "epoch": 1001} {"train_loss": -5.7300872802734375, "global_step": 42072, "epoch": 1001} {"train_loss": -5.56864070892334, "global_step": 42073, "epoch": 1001} {"train_loss": -5.664344310760498, "global_step": 42074, "epoch": 1001} {"train_loss": -5.646514415740967, "global_step": 42075, "epoch": 1001} {"train_loss": -5.684662818908691, "global_step": 42076, "epoch": 1001} {"train_loss": -5.730957984924316, "global_step": 42077, "epoch": 1001} {"train_loss": -5.591517925262451, "global_step": 42078, "epoch": 1001} {"train_loss": -5.6282639503479, "global_step": 42079, "epoch": 1001} {"train_loss": -5.706355094909668, "global_step": 42080, "epoch": 1001} {"train_loss": -5.569068908691406, "global_step": 42081, "epoch": 1001} {"train_loss": -5.564013957977295, "global_step": 42082, "epoch": 1001} {"train_loss": -5.653184425263178, "global_step": 42083, "epoch": 1001, "val_loss": 66152.8828125} {"train_loss": -5.401551723480225, "global_step": 42084, "epoch": 1002} {"train_loss": -5.705476760864258, "global_step": 42085, "epoch": 1002} {"train_loss": -5.650016784667969, "global_step": 42086, "epoch": 1002} {"train_loss": -5.664099216461182, "global_step": 42087, "epoch": 1002} {"train_loss": -5.699307918548584, "global_step": 42088, "epoch": 1002} {"train_loss": -5.579928398132324, "global_step": 42089, "epoch": 1002} {"train_loss": -5.645015716552734, "global_step": 42090, "epoch": 1002} {"train_loss": -5.748296737670898, "global_step": 42091, "epoch": 1002} {"train_loss": -5.655661582946777, "global_step": 42092, "epoch": 1002} {"train_loss": -5.630197525024414, "global_step": 42093, "epoch": 1002} {"train_loss": -5.646277904510498, "global_step": 42094, "epoch": 1002} {"train_loss": -5.589086532592773, "global_step": 42095, "epoch": 1002} {"train_loss": -5.5834832191467285, "global_step": 42096, "epoch": 1002} {"train_loss": -5.5990095138549805, "global_step": 42097, "epoch": 1002} {"train_loss": -5.7731218338012695, "global_step": 42098, "epoch": 1002} {"train_loss": -5.6439642906188965, "global_step": 42099, "epoch": 1002} {"train_loss": -5.649237632751465, "global_step": 42100, "epoch": 1002} {"train_loss": -5.617988586425781, "global_step": 42101, "epoch": 1002} {"train_loss": -5.664383888244629, "global_step": 42102, "epoch": 1002} {"train_loss": -5.5762505531311035, "global_step": 42103, "epoch": 1002} {"train_loss": -5.603369235992432, "global_step": 42104, "epoch": 1002} {"train_loss": -5.651257514953613, "global_step": 42105, "epoch": 1002} {"train_loss": -5.754391670227051, "global_step": 42106, "epoch": 1002} {"train_loss": -5.742661952972412, "global_step": 42107, "epoch": 1002} {"train_loss": -5.709489345550537, "global_step": 42108, "epoch": 1002} {"train_loss": -5.711038589477539, "global_step": 42109, "epoch": 1002} {"train_loss": -5.741779327392578, "global_step": 42110, "epoch": 1002} {"train_loss": -5.627346038818359, "global_step": 42111, "epoch": 1002} {"train_loss": -5.721401214599609, "global_step": 42112, "epoch": 1002} {"train_loss": -5.662753105163574, "global_step": 42113, "epoch": 1002} {"train_loss": -5.589902877807617, "global_step": 42114, "epoch": 1002} {"train_loss": -5.633386611938477, "global_step": 42115, "epoch": 1002} {"train_loss": -5.681482315063477, "global_step": 42116, "epoch": 1002} {"train_loss": -5.633351802825928, "global_step": 42117, "epoch": 1002} {"train_loss": -5.745033264160156, "global_step": 42118, "epoch": 1002} {"train_loss": -5.721245765686035, "global_step": 42119, "epoch": 1002} {"train_loss": -5.701651573181152, "global_step": 42120, "epoch": 1002} {"train_loss": -5.632712364196777, "global_step": 42121, "epoch": 1002} {"train_loss": -5.487576961517334, "global_step": 42122, "epoch": 1002} {"train_loss": -5.7246479988098145, "global_step": 42123, "epoch": 1002} {"train_loss": -5.61553955078125, "global_step": 42124, "epoch": 1002} {"train_loss": -5.653029475893293, "global_step": 42125, "epoch": 1002, "val_loss": 66447.734375} {"train_loss": -5.650094985961914, "global_step": 42126, "epoch": 1003} {"train_loss": -5.655580043792725, "global_step": 42127, "epoch": 1003} {"train_loss": -5.758599281311035, "global_step": 42128, "epoch": 1003} {"train_loss": -5.631389617919922, "global_step": 42129, "epoch": 1003} {"train_loss": -5.730608940124512, "global_step": 42130, "epoch": 1003} {"train_loss": -5.624506950378418, "global_step": 42131, "epoch": 1003} {"train_loss": -5.628417491912842, "global_step": 42132, "epoch": 1003} {"train_loss": -5.760767936706543, "global_step": 42133, "epoch": 1003} {"train_loss": -5.649722099304199, "global_step": 42134, "epoch": 1003} {"train_loss": -5.65149450302124, "global_step": 42135, "epoch": 1003} {"train_loss": -5.794312000274658, "global_step": 42136, "epoch": 1003} {"train_loss": -5.6398701667785645, "global_step": 42137, "epoch": 1003} {"train_loss": -5.509612083435059, "global_step": 42138, "epoch": 1003} {"train_loss": -5.731873512268066, "global_step": 42139, "epoch": 1003} {"train_loss": -5.696203708648682, "global_step": 42140, "epoch": 1003} {"train_loss": -5.64302921295166, "global_step": 42141, "epoch": 1003} {"train_loss": -5.6068115234375, "global_step": 42142, "epoch": 1003} {"train_loss": -5.718050956726074, "global_step": 42143, "epoch": 1003} {"train_loss": -5.7087178230285645, "global_step": 42144, "epoch": 1003} {"train_loss": -5.627960681915283, "global_step": 42145, "epoch": 1003} {"train_loss": -5.701553821563721, "global_step": 42146, "epoch": 1003} {"train_loss": -5.674166679382324, "global_step": 42147, "epoch": 1003} {"train_loss": -5.724898815155029, "global_step": 42148, "epoch": 1003} {"train_loss": -5.688587188720703, "global_step": 42149, "epoch": 1003} {"train_loss": -5.591605186462402, "global_step": 42150, "epoch": 1003} {"train_loss": -5.684372901916504, "global_step": 42151, "epoch": 1003} {"train_loss": -5.736397743225098, "global_step": 42152, "epoch": 1003} {"train_loss": -5.588289260864258, "global_step": 42153, "epoch": 1003} {"train_loss": -5.690906524658203, "global_step": 42154, "epoch": 1003} {"train_loss": -5.646710395812988, "global_step": 42155, "epoch": 1003} {"train_loss": -5.720273017883301, "global_step": 42156, "epoch": 1003} {"train_loss": -5.6677021980285645, "global_step": 42157, "epoch": 1003} {"train_loss": -5.700167655944824, "global_step": 42158, "epoch": 1003} {"train_loss": -5.652729034423828, "global_step": 42159, "epoch": 1003} {"train_loss": -5.637490749359131, "global_step": 42160, "epoch": 1003} {"train_loss": -5.6721391677856445, "global_step": 42161, "epoch": 1003} {"train_loss": -5.612006187438965, "global_step": 42162, "epoch": 1003} {"train_loss": -5.634215831756592, "global_step": 42163, "epoch": 1003} {"train_loss": -5.530969619750977, "global_step": 42164, "epoch": 1003} {"train_loss": -5.674969673156738, "global_step": 42165, "epoch": 1003} {"train_loss": -5.7154083251953125, "global_step": 42166, "epoch": 1003} {"train_loss": -5.664552211761475, "global_step": 42167, "epoch": 1003, "val_loss": 66167.7109375} {"train_loss": -5.688047885894775, "global_step": 42168, "epoch": 1004} {"train_loss": -5.590954780578613, "global_step": 42169, "epoch": 1004} {"train_loss": -5.589178085327148, "global_step": 42170, "epoch": 1004} {"train_loss": -5.718143463134766, "global_step": 42171, "epoch": 1004} {"train_loss": -5.792187690734863, "global_step": 42172, "epoch": 1004} {"train_loss": -5.738001346588135, "global_step": 42173, "epoch": 1004} {"train_loss": -5.6622443199157715, "global_step": 42174, "epoch": 1004} {"train_loss": -5.675316333770752, "global_step": 42175, "epoch": 1004} {"train_loss": -5.727154731750488, "global_step": 42176, "epoch": 1004} {"train_loss": -5.761633396148682, "global_step": 42177, "epoch": 1004} {"train_loss": -5.744696140289307, "global_step": 42178, "epoch": 1004} {"train_loss": -5.5679216384887695, "global_step": 42179, "epoch": 1004} {"train_loss": -5.709005355834961, "global_step": 42180, "epoch": 1004} {"train_loss": -5.654165267944336, "global_step": 42181, "epoch": 1004} {"train_loss": -5.573873043060303, "global_step": 42182, "epoch": 1004} {"train_loss": -5.566422462463379, "global_step": 42183, "epoch": 1004} {"train_loss": -5.618653297424316, "global_step": 42184, "epoch": 1004} {"train_loss": -5.644783973693848, "global_step": 42185, "epoch": 1004} {"train_loss": -5.602283477783203, "global_step": 42186, "epoch": 1004} {"train_loss": -5.746686935424805, "global_step": 42187, "epoch": 1004} {"train_loss": -5.709524154663086, "global_step": 42188, "epoch": 1004} {"train_loss": -5.695132255554199, "global_step": 42189, "epoch": 1004} {"train_loss": -5.57740592956543, "global_step": 42190, "epoch": 1004} {"train_loss": -5.659226417541504, "global_step": 42191, "epoch": 1004} {"train_loss": -5.652204513549805, "global_step": 42192, "epoch": 1004} {"train_loss": -5.7330803871154785, "global_step": 42193, "epoch": 1004} {"train_loss": -5.623597621917725, "global_step": 42194, "epoch": 1004} {"train_loss": -5.685832977294922, "global_step": 42195, "epoch": 1004} {"train_loss": -5.706912040710449, "global_step": 42196, "epoch": 1004} {"train_loss": -5.537823677062988, "global_step": 42197, "epoch": 1004} {"train_loss": -5.655877113342285, "global_step": 42198, "epoch": 1004} {"train_loss": -5.763581275939941, "global_step": 42199, "epoch": 1004} {"train_loss": -5.734346866607666, "global_step": 42200, "epoch": 1004} {"train_loss": -5.892246723175049, "global_step": 42201, "epoch": 1004} {"train_loss": -5.621094226837158, "global_step": 42202, "epoch": 1004} {"train_loss": -5.746347427368164, "global_step": 42203, "epoch": 1004} {"train_loss": -5.801621913909912, "global_step": 42204, "epoch": 1004} {"train_loss": -5.641292572021484, "global_step": 42205, "epoch": 1004} {"train_loss": -5.491654396057129, "global_step": 42206, "epoch": 1004} {"train_loss": -5.603509902954102, "global_step": 42207, "epoch": 1004} {"train_loss": -5.742243766784668, "global_step": 42208, "epoch": 1004} {"train_loss": -5.6742011819566995, "global_step": 42209, "epoch": 1004, "val_loss": 66111.0390625} {"train_loss": -5.670392036437988, "global_step": 42210, "epoch": 1005} {"train_loss": -5.726306438446045, "global_step": 42211, "epoch": 1005} {"train_loss": -5.7076497077941895, "global_step": 42212, "epoch": 1005} {"train_loss": -5.772001266479492, "global_step": 42213, "epoch": 1005} {"train_loss": -5.7684645652771, "global_step": 42214, "epoch": 1005} {"train_loss": -5.6822190284729, "global_step": 42215, "epoch": 1005} {"train_loss": -5.66296911239624, "global_step": 42216, "epoch": 1005} {"train_loss": -5.539555072784424, "global_step": 42217, "epoch": 1005} {"train_loss": -5.68904447555542, "global_step": 42218, "epoch": 1005} {"train_loss": -5.667166709899902, "global_step": 42219, "epoch": 1005} {"train_loss": -5.615102291107178, "global_step": 42220, "epoch": 1005} {"train_loss": -5.68634557723999, "global_step": 42221, "epoch": 1005} {"train_loss": -5.683480262756348, "global_step": 42222, "epoch": 1005} {"train_loss": -5.570953845977783, "global_step": 42223, "epoch": 1005} {"train_loss": -5.588274002075195, "global_step": 42224, "epoch": 1005} {"train_loss": -5.466747283935547, "global_step": 42225, "epoch": 1005} {"train_loss": -5.5650315284729, "global_step": 42226, "epoch": 1005} {"train_loss": -5.528465270996094, "global_step": 42227, "epoch": 1005} {"train_loss": -5.466561317443848, "global_step": 42228, "epoch": 1005} {"train_loss": -5.72020149230957, "global_step": 42229, "epoch": 1005} {"train_loss": -5.654365062713623, "global_step": 42230, "epoch": 1005} {"train_loss": -5.624614715576172, "global_step": 42231, "epoch": 1005} {"train_loss": -5.7188401222229, "global_step": 42232, "epoch": 1005} {"train_loss": -5.663776397705078, "global_step": 42233, "epoch": 1005} {"train_loss": -5.5323944091796875, "global_step": 42234, "epoch": 1005} {"train_loss": -5.631185531616211, "global_step": 42235, "epoch": 1005} {"train_loss": -5.632376670837402, "global_step": 42236, "epoch": 1005} {"train_loss": -5.654863357543945, "global_step": 42237, "epoch": 1005} {"train_loss": -5.731966018676758, "global_step": 42238, "epoch": 1005} {"train_loss": -5.506741523742676, "global_step": 42239, "epoch": 1005} {"train_loss": -5.679450511932373, "global_step": 42240, "epoch": 1005} {"train_loss": -5.663944721221924, "global_step": 42241, "epoch": 1005} {"train_loss": -5.795003890991211, "global_step": 42242, "epoch": 1005} {"train_loss": -5.626089096069336, "global_step": 42243, "epoch": 1005} {"train_loss": -5.654306888580322, "global_step": 42244, "epoch": 1005} {"train_loss": -5.649062156677246, "global_step": 42245, "epoch": 1005} {"train_loss": -5.668333530426025, "global_step": 42246, "epoch": 1005} {"train_loss": -5.601333141326904, "global_step": 42247, "epoch": 1005} {"train_loss": -5.650566101074219, "global_step": 42248, "epoch": 1005} {"train_loss": -5.63498592376709, "global_step": 42249, "epoch": 1005} {"train_loss": -5.766854763031006, "global_step": 42250, "epoch": 1005} {"train_loss": -5.645959570294335, "global_step": 42251, "epoch": 1005, "val_loss": 65874.5625} {"train_loss": -5.713290691375732, "global_step": 42252, "epoch": 1006} {"train_loss": -5.708529472351074, "global_step": 42253, "epoch": 1006} {"train_loss": -5.668026924133301, "global_step": 42254, "epoch": 1006} {"train_loss": -5.743128299713135, "global_step": 42255, "epoch": 1006} {"train_loss": -5.608698844909668, "global_step": 42256, "epoch": 1006} {"train_loss": -5.773372173309326, "global_step": 42257, "epoch": 1006} {"train_loss": -5.652359485626221, "global_step": 42258, "epoch": 1006} {"train_loss": -5.538018226623535, "global_step": 42259, "epoch": 1006} {"train_loss": -5.697854042053223, "global_step": 42260, "epoch": 1006} {"train_loss": -5.786928176879883, "global_step": 42261, "epoch": 1006} {"train_loss": -5.844120979309082, "global_step": 42262, "epoch": 1006} {"train_loss": -5.644784927368164, "global_step": 42263, "epoch": 1006} {"train_loss": -5.664132118225098, "global_step": 42264, "epoch": 1006} {"train_loss": -5.575727462768555, "global_step": 42265, "epoch": 1006} {"train_loss": -5.687784194946289, "global_step": 42266, "epoch": 1006} {"train_loss": -5.615175247192383, "global_step": 42267, "epoch": 1006} {"train_loss": -5.589750289916992, "global_step": 42268, "epoch": 1006} {"train_loss": -5.7404465675354, "global_step": 42269, "epoch": 1006} {"train_loss": -5.611963748931885, "global_step": 42270, "epoch": 1006} {"train_loss": -5.511525630950928, "global_step": 42271, "epoch": 1006} {"train_loss": -5.601746082305908, "global_step": 42272, "epoch": 1006} {"train_loss": -5.653529167175293, "global_step": 42273, "epoch": 1006} {"train_loss": -5.467113494873047, "global_step": 42274, "epoch": 1006} {"train_loss": -5.756565093994141, "global_step": 42275, "epoch": 1006} {"train_loss": -5.680018424987793, "global_step": 42276, "epoch": 1006} {"train_loss": -5.636536598205566, "global_step": 42277, "epoch": 1006} {"train_loss": -5.644105434417725, "global_step": 42278, "epoch": 1006} {"train_loss": -5.61754846572876, "global_step": 42279, "epoch": 1006} {"train_loss": -5.5583977699279785, "global_step": 42280, "epoch": 1006} {"train_loss": -5.716896057128906, "global_step": 42281, "epoch": 1006} {"train_loss": -5.66380500793457, "global_step": 42282, "epoch": 1006} {"train_loss": -5.536531448364258, "global_step": 42283, "epoch": 1006} {"train_loss": -5.615042686462402, "global_step": 42284, "epoch": 1006} {"train_loss": -5.6575775146484375, "global_step": 42285, "epoch": 1006} {"train_loss": -5.587000846862793, "global_step": 42286, "epoch": 1006} {"train_loss": -5.677727699279785, "global_step": 42287, "epoch": 1006} {"train_loss": -5.49936056137085, "global_step": 42288, "epoch": 1006} {"train_loss": -5.584886074066162, "global_step": 42289, "epoch": 1006} {"train_loss": -5.717296600341797, "global_step": 42290, "epoch": 1006} {"train_loss": -5.694378852844238, "global_step": 42291, "epoch": 1006} {"train_loss": -5.649224758148193, "global_step": 42292, "epoch": 1006} {"train_loss": -5.648756617591495, "global_step": 42293, "epoch": 1006, "val_loss": 66194.1015625} {"train_loss": -5.766084671020508, "global_step": 42294, "epoch": 1007} {"train_loss": -5.6678385734558105, "global_step": 42295, "epoch": 1007} {"train_loss": -5.674830436706543, "global_step": 42296, "epoch": 1007} {"train_loss": -5.710023880004883, "global_step": 42297, "epoch": 1007} {"train_loss": -5.642516136169434, "global_step": 42298, "epoch": 1007} {"train_loss": -5.619362831115723, "global_step": 42299, "epoch": 1007} {"train_loss": -5.560033321380615, "global_step": 42300, "epoch": 1007} {"train_loss": -5.614421844482422, "global_step": 42301, "epoch": 1007} {"train_loss": -5.702935218811035, "global_step": 42302, "epoch": 1007} {"train_loss": -5.541230201721191, "global_step": 42303, "epoch": 1007} {"train_loss": -5.603848457336426, "global_step": 42304, "epoch": 1007} {"train_loss": -5.544492721557617, "global_step": 42305, "epoch": 1007} {"train_loss": -5.648782730102539, "global_step": 42306, "epoch": 1007} {"train_loss": -5.614209175109863, "global_step": 42307, "epoch": 1007} {"train_loss": -5.680469036102295, "global_step": 42308, "epoch": 1007} {"train_loss": -5.815256118774414, "global_step": 42309, "epoch": 1007} {"train_loss": -5.7188568115234375, "global_step": 42310, "epoch": 1007} {"train_loss": -5.688612937927246, "global_step": 42311, "epoch": 1007} {"train_loss": -5.653297424316406, "global_step": 42312, "epoch": 1007} {"train_loss": -5.70689582824707, "global_step": 42313, "epoch": 1007} {"train_loss": -5.694363594055176, "global_step": 42314, "epoch": 1007} {"train_loss": -5.529389381408691, "global_step": 42315, "epoch": 1007} {"train_loss": -5.652341842651367, "global_step": 42316, "epoch": 1007} {"train_loss": -5.614897727966309, "global_step": 42317, "epoch": 1007} {"train_loss": -5.600295066833496, "global_step": 42318, "epoch": 1007} {"train_loss": -5.723817825317383, "global_step": 42319, "epoch": 1007} {"train_loss": -5.769445419311523, "global_step": 42320, "epoch": 1007} {"train_loss": -5.715970039367676, "global_step": 42321, "epoch": 1007} {"train_loss": -5.666512489318848, "global_step": 42322, "epoch": 1007} {"train_loss": -5.655599594116211, "global_step": 42323, "epoch": 1007} {"train_loss": -5.719747543334961, "global_step": 42324, "epoch": 1007} {"train_loss": -5.676905155181885, "global_step": 42325, "epoch": 1007} {"train_loss": -5.5055928230285645, "global_step": 42326, "epoch": 1007} {"train_loss": -5.6303815841674805, "global_step": 42327, "epoch": 1007} {"train_loss": -5.590703964233398, "global_step": 42328, "epoch": 1007} {"train_loss": -5.556705474853516, "global_step": 42329, "epoch": 1007} {"train_loss": -5.628286838531494, "global_step": 42330, "epoch": 1007} {"train_loss": -5.553576469421387, "global_step": 42331, "epoch": 1007} {"train_loss": -5.6260151863098145, "global_step": 42332, "epoch": 1007} {"train_loss": -5.715386867523193, "global_step": 42333, "epoch": 1007} {"train_loss": -5.5458879470825195, "global_step": 42334, "epoch": 1007} {"train_loss": -5.6480967317308695, "global_step": 42335, "epoch": 1007, "val_loss": 66227.515625} {"train_loss": -5.713077545166016, "global_step": 42336, "epoch": 1008} {"train_loss": -5.588471412658691, "global_step": 42337, "epoch": 1008} {"train_loss": -5.664885520935059, "global_step": 42338, "epoch": 1008} {"train_loss": -5.664727210998535, "global_step": 42339, "epoch": 1008} {"train_loss": -5.756829738616943, "global_step": 42340, "epoch": 1008} {"train_loss": -5.538183212280273, "global_step": 42341, "epoch": 1008} {"train_loss": -5.637439727783203, "global_step": 42342, "epoch": 1008} {"train_loss": -5.576241970062256, "global_step": 42343, "epoch": 1008} {"train_loss": -5.656651020050049, "global_step": 42344, "epoch": 1008} {"train_loss": -5.781130790710449, "global_step": 42345, "epoch": 1008} {"train_loss": -5.665775775909424, "global_step": 42346, "epoch": 1008} {"train_loss": -5.524587154388428, "global_step": 42347, "epoch": 1008} {"train_loss": -5.59567928314209, "global_step": 42348, "epoch": 1008} {"train_loss": -5.709303855895996, "global_step": 42349, "epoch": 1008} {"train_loss": -5.706145286560059, "global_step": 42350, "epoch": 1008} {"train_loss": -5.558104991912842, "global_step": 42351, "epoch": 1008} {"train_loss": -5.525050163269043, "global_step": 42352, "epoch": 1008} {"train_loss": -5.620365142822266, "global_step": 42353, "epoch": 1008} {"train_loss": -5.513579368591309, "global_step": 42354, "epoch": 1008} {"train_loss": -5.732240676879883, "global_step": 42355, "epoch": 1008} {"train_loss": -5.641678333282471, "global_step": 42356, "epoch": 1008} {"train_loss": -5.702946662902832, "global_step": 42357, "epoch": 1008} {"train_loss": -5.654510974884033, "global_step": 42358, "epoch": 1008} {"train_loss": -5.657144546508789, "global_step": 42359, "epoch": 1008} {"train_loss": -5.681875228881836, "global_step": 42360, "epoch": 1008} {"train_loss": -5.629974365234375, "global_step": 42361, "epoch": 1008} {"train_loss": -5.771677017211914, "global_step": 42362, "epoch": 1008} {"train_loss": -5.649916648864746, "global_step": 42363, "epoch": 1008} {"train_loss": -5.739337921142578, "global_step": 42364, "epoch": 1008} {"train_loss": -5.758861541748047, "global_step": 42365, "epoch": 1008} {"train_loss": -5.557579517364502, "global_step": 42366, "epoch": 1008} {"train_loss": -5.698747634887695, "global_step": 42367, "epoch": 1008} {"train_loss": -5.611879348754883, "global_step": 42368, "epoch": 1008} {"train_loss": -5.574043273925781, "global_step": 42369, "epoch": 1008} {"train_loss": -5.632478713989258, "global_step": 42370, "epoch": 1008} {"train_loss": -5.4947428703308105, "global_step": 42371, "epoch": 1008} {"train_loss": -5.726336479187012, "global_step": 42372, "epoch": 1008} {"train_loss": -5.672379493713379, "global_step": 42373, "epoch": 1008} {"train_loss": -5.715147018432617, "global_step": 42374, "epoch": 1008} {"train_loss": -5.737117767333984, "global_step": 42375, "epoch": 1008} {"train_loss": -5.44612455368042, "global_step": 42376, "epoch": 1008} {"train_loss": -5.64625746863229, "global_step": 42377, "epoch": 1008, "val_loss": 66125.5234375} {"train_loss": -5.709619045257568, "global_step": 42378, "epoch": 1009} {"train_loss": -5.601699352264404, "global_step": 42379, "epoch": 1009} {"train_loss": -5.640966415405273, "global_step": 42380, "epoch": 1009} {"train_loss": -5.753742218017578, "global_step": 42381, "epoch": 1009} {"train_loss": -5.592048645019531, "global_step": 42382, "epoch": 1009} {"train_loss": -5.53956413269043, "global_step": 42383, "epoch": 1009} {"train_loss": -5.6378173828125, "global_step": 42384, "epoch": 1009} {"train_loss": -5.651005744934082, "global_step": 42385, "epoch": 1009} {"train_loss": -5.649909019470215, "global_step": 42386, "epoch": 1009} {"train_loss": -5.631692886352539, "global_step": 42387, "epoch": 1009} {"train_loss": -5.6472578048706055, "global_step": 42388, "epoch": 1009} {"train_loss": -5.560225009918213, "global_step": 42389, "epoch": 1009} {"train_loss": -5.7550811767578125, "global_step": 42390, "epoch": 1009} {"train_loss": -5.737684726715088, "global_step": 42391, "epoch": 1009} {"train_loss": -5.539471626281738, "global_step": 42392, "epoch": 1009} {"train_loss": -5.747003555297852, "global_step": 42393, "epoch": 1009} {"train_loss": -5.618882179260254, "global_step": 42394, "epoch": 1009} {"train_loss": -5.648010730743408, "global_step": 42395, "epoch": 1009} {"train_loss": -5.642519950866699, "global_step": 42396, "epoch": 1009} {"train_loss": -5.711263656616211, "global_step": 42397, "epoch": 1009} {"train_loss": -5.731342315673828, "global_step": 42398, "epoch": 1009} {"train_loss": -5.665368556976318, "global_step": 42399, "epoch": 1009} {"train_loss": -5.75050163269043, "global_step": 42400, "epoch": 1009} {"train_loss": -5.642923355102539, "global_step": 42401, "epoch": 1009} {"train_loss": -5.649213790893555, "global_step": 42402, "epoch": 1009} {"train_loss": -5.629463195800781, "global_step": 42403, "epoch": 1009} {"train_loss": -5.613682746887207, "global_step": 42404, "epoch": 1009} {"train_loss": -5.757790565490723, "global_step": 42405, "epoch": 1009} {"train_loss": -5.641722679138184, "global_step": 42406, "epoch": 1009} {"train_loss": -5.668142318725586, "global_step": 42407, "epoch": 1009} {"train_loss": -5.570796012878418, "global_step": 42408, "epoch": 1009} {"train_loss": -5.544434547424316, "global_step": 42409, "epoch": 1009} {"train_loss": -5.512364387512207, "global_step": 42410, "epoch": 1009} {"train_loss": -5.666501045227051, "global_step": 42411, "epoch": 1009} {"train_loss": -5.71150016784668, "global_step": 42412, "epoch": 1009} {"train_loss": -5.587258338928223, "global_step": 42413, "epoch": 1009} {"train_loss": -5.553600311279297, "global_step": 42414, "epoch": 1009} {"train_loss": -5.438203811645508, "global_step": 42415, "epoch": 1009} {"train_loss": -5.628139019012451, "global_step": 42416, "epoch": 1009} {"train_loss": -5.587273597717285, "global_step": 42417, "epoch": 1009} {"train_loss": -5.505529403686523, "global_step": 42418, "epoch": 1009} {"train_loss": -5.638010342915853, "global_step": 42419, "epoch": 1009, "val_loss": 66395.5625} {"train_loss": -5.451362609863281, "global_step": 42420, "epoch": 1010} {"train_loss": -5.680760383605957, "global_step": 42421, "epoch": 1010} {"train_loss": -5.51820707321167, "global_step": 42422, "epoch": 1010} {"train_loss": -5.5487165451049805, "global_step": 42423, "epoch": 1010} {"train_loss": -5.701798439025879, "global_step": 42424, "epoch": 1010} {"train_loss": -5.611375331878662, "global_step": 42425, "epoch": 1010} {"train_loss": -5.683900356292725, "global_step": 42426, "epoch": 1010} {"train_loss": -5.644550800323486, "global_step": 42427, "epoch": 1010} {"train_loss": -5.773406505584717, "global_step": 42428, "epoch": 1010} {"train_loss": -5.585982322692871, "global_step": 42429, "epoch": 1010} {"train_loss": -5.613131523132324, "global_step": 42430, "epoch": 1010} {"train_loss": -5.727798938751221, "global_step": 42431, "epoch": 1010} {"train_loss": -5.461715221405029, "global_step": 42432, "epoch": 1010} {"train_loss": -5.710780143737793, "global_step": 42433, "epoch": 1010} {"train_loss": -5.509044170379639, "global_step": 42434, "epoch": 1010} {"train_loss": -5.683754920959473, "global_step": 42435, "epoch": 1010} {"train_loss": -5.607564926147461, "global_step": 42436, "epoch": 1010} {"train_loss": -5.553534507751465, "global_step": 42437, "epoch": 1010} {"train_loss": -5.559442043304443, "global_step": 42438, "epoch": 1010} {"train_loss": -5.60036563873291, "global_step": 42439, "epoch": 1010} {"train_loss": -5.7305450439453125, "global_step": 42440, "epoch": 1010} {"train_loss": -5.576906204223633, "global_step": 42441, "epoch": 1010} {"train_loss": -5.613319396972656, "global_step": 42442, "epoch": 1010} {"train_loss": -5.4416608810424805, "global_step": 42443, "epoch": 1010} {"train_loss": -5.542847633361816, "global_step": 42444, "epoch": 1010} {"train_loss": -5.658164024353027, "global_step": 42445, "epoch": 1010} {"train_loss": -5.679535388946533, "global_step": 42446, "epoch": 1010} {"train_loss": -5.555245876312256, "global_step": 42447, "epoch": 1010} {"train_loss": -5.716738700866699, "global_step": 42448, "epoch": 1010} {"train_loss": -5.724968910217285, "global_step": 42449, "epoch": 1010} {"train_loss": -5.657217025756836, "global_step": 42450, "epoch": 1010} {"train_loss": -5.701716423034668, "global_step": 42451, "epoch": 1010} {"train_loss": -5.570044040679932, "global_step": 42452, "epoch": 1010} {"train_loss": -5.593238830566406, "global_step": 42453, "epoch": 1010} {"train_loss": -5.606930255889893, "global_step": 42454, "epoch": 1010} {"train_loss": -5.542215347290039, "global_step": 42455, "epoch": 1010} {"train_loss": -5.547896385192871, "global_step": 42456, "epoch": 1010} {"train_loss": -5.539241790771484, "global_step": 42457, "epoch": 1010} {"train_loss": -5.817543029785156, "global_step": 42458, "epoch": 1010} {"train_loss": -5.701494216918945, "global_step": 42459, "epoch": 1010} {"train_loss": -5.53963565826416, "global_step": 42460, "epoch": 1010} {"train_loss": -5.613002322968983, "global_step": 42461, "epoch": 1010, "val_loss": 66145.734375} {"train_loss": -5.5327467918396, "global_step": 42462, "epoch": 1011} {"train_loss": -5.728189945220947, "global_step": 42463, "epoch": 1011} {"train_loss": -5.60836935043335, "global_step": 42464, "epoch": 1011} {"train_loss": -5.4726667404174805, "global_step": 42465, "epoch": 1011} {"train_loss": -5.6617302894592285, "global_step": 42466, "epoch": 1011} {"train_loss": -5.621569633483887, "global_step": 42467, "epoch": 1011} {"train_loss": -5.682631492614746, "global_step": 42468, "epoch": 1011} {"train_loss": -5.627856254577637, "global_step": 42469, "epoch": 1011} {"train_loss": -5.613889694213867, "global_step": 42470, "epoch": 1011} {"train_loss": -5.662693500518799, "global_step": 42471, "epoch": 1011} {"train_loss": -5.749533653259277, "global_step": 42472, "epoch": 1011} {"train_loss": -5.788409233093262, "global_step": 42473, "epoch": 1011} {"train_loss": -5.607573509216309, "global_step": 42474, "epoch": 1011} {"train_loss": -5.679460525512695, "global_step": 42475, "epoch": 1011} {"train_loss": -5.6827216148376465, "global_step": 42476, "epoch": 1011} {"train_loss": -5.537367820739746, "global_step": 42477, "epoch": 1011} {"train_loss": -5.5904998779296875, "global_step": 42478, "epoch": 1011} {"train_loss": -5.666721343994141, "global_step": 42479, "epoch": 1011} {"train_loss": -5.6599860191345215, "global_step": 42480, "epoch": 1011} {"train_loss": -5.722201347351074, "global_step": 42481, "epoch": 1011} {"train_loss": -5.6271538734436035, "global_step": 42482, "epoch": 1011} {"train_loss": -5.694571495056152, "global_step": 42483, "epoch": 1011} {"train_loss": -5.646770477294922, "global_step": 42484, "epoch": 1011} {"train_loss": -5.615571022033691, "global_step": 42485, "epoch": 1011} {"train_loss": -5.667498588562012, "global_step": 42486, "epoch": 1011} {"train_loss": -5.629641056060791, "global_step": 42487, "epoch": 1011} {"train_loss": -5.602686882019043, "global_step": 42488, "epoch": 1011} {"train_loss": -5.68592643737793, "global_step": 42489, "epoch": 1011} {"train_loss": -5.603152275085449, "global_step": 42490, "epoch": 1011} {"train_loss": -5.667119979858398, "global_step": 42491, "epoch": 1011} {"train_loss": -5.665125846862793, "global_step": 42492, "epoch": 1011} {"train_loss": -5.802224159240723, "global_step": 42493, "epoch": 1011} {"train_loss": -5.654756546020508, "global_step": 42494, "epoch": 1011} {"train_loss": -5.756988525390625, "global_step": 42495, "epoch": 1011} {"train_loss": -5.746050834655762, "global_step": 42496, "epoch": 1011} {"train_loss": -5.610652923583984, "global_step": 42497, "epoch": 1011} {"train_loss": -5.657912731170654, "global_step": 42498, "epoch": 1011} {"train_loss": -5.730612754821777, "global_step": 42499, "epoch": 1011} {"train_loss": -5.621835708618164, "global_step": 42500, "epoch": 1011} {"train_loss": -5.645960330963135, "global_step": 42501, "epoch": 1011} {"train_loss": -5.622188568115234, "global_step": 42502, "epoch": 1011} {"train_loss": -5.656965812047322, "global_step": 42503, "epoch": 1011, "val_loss": 66005.734375} {"train_loss": -5.519344329833984, "global_step": 42504, "epoch": 1012} {"train_loss": -5.678062438964844, "global_step": 42505, "epoch": 1012} {"train_loss": -5.5893754959106445, "global_step": 42506, "epoch": 1012} {"train_loss": -5.666384220123291, "global_step": 42507, "epoch": 1012} {"train_loss": -5.6725263595581055, "global_step": 42508, "epoch": 1012} {"train_loss": -5.681448936462402, "global_step": 42509, "epoch": 1012} {"train_loss": -5.687267780303955, "global_step": 42510, "epoch": 1012} {"train_loss": -5.624610424041748, "global_step": 42511, "epoch": 1012} {"train_loss": -5.5026750564575195, "global_step": 42512, "epoch": 1012} {"train_loss": -5.698554992675781, "global_step": 42513, "epoch": 1012} {"train_loss": -5.667930603027344, "global_step": 42514, "epoch": 1012} {"train_loss": -5.698280334472656, "global_step": 42515, "epoch": 1012} {"train_loss": -5.641384124755859, "global_step": 42516, "epoch": 1012} {"train_loss": -5.759677886962891, "global_step": 42517, "epoch": 1012} {"train_loss": -5.731418132781982, "global_step": 42518, "epoch": 1012} {"train_loss": -5.641939163208008, "global_step": 42519, "epoch": 1012} {"train_loss": -5.615379810333252, "global_step": 42520, "epoch": 1012} {"train_loss": -5.655640125274658, "global_step": 42521, "epoch": 1012} {"train_loss": -5.670257091522217, "global_step": 42522, "epoch": 1012} {"train_loss": -5.757392406463623, "global_step": 42523, "epoch": 1012} {"train_loss": -5.665938377380371, "global_step": 42524, "epoch": 1012} {"train_loss": -5.611518859863281, "global_step": 42525, "epoch": 1012} {"train_loss": -5.6847243309021, "global_step": 42526, "epoch": 1012} {"train_loss": -5.6526079177856445, "global_step": 42527, "epoch": 1012} {"train_loss": -5.551054954528809, "global_step": 42528, "epoch": 1012} {"train_loss": -5.563415050506592, "global_step": 42529, "epoch": 1012} {"train_loss": -5.682218551635742, "global_step": 42530, "epoch": 1012} {"train_loss": -5.712019920349121, "global_step": 42531, "epoch": 1012} {"train_loss": -5.605526924133301, "global_step": 42532, "epoch": 1012} {"train_loss": -5.792950630187988, "global_step": 42533, "epoch": 1012} {"train_loss": -5.803454399108887, "global_step": 42534, "epoch": 1012} {"train_loss": -5.735739231109619, "global_step": 42535, "epoch": 1012} {"train_loss": -5.720068454742432, "global_step": 42536, "epoch": 1012} {"train_loss": -5.54939079284668, "global_step": 42537, "epoch": 1012} {"train_loss": -5.675746917724609, "global_step": 42538, "epoch": 1012} {"train_loss": -5.633920669555664, "global_step": 42539, "epoch": 1012} {"train_loss": -5.795671463012695, "global_step": 42540, "epoch": 1012} {"train_loss": -5.658940315246582, "global_step": 42541, "epoch": 1012} {"train_loss": -5.512631416320801, "global_step": 42542, "epoch": 1012} {"train_loss": -5.656388282775879, "global_step": 42543, "epoch": 1012} {"train_loss": -5.508726596832275, "global_step": 42544, "epoch": 1012} {"train_loss": -5.656534319832211, "global_step": 42545, "epoch": 1012, "val_loss": 66212.046875} {"train_loss": -5.633784294128418, "global_step": 42546, "epoch": 1013} {"train_loss": -5.575125694274902, "global_step": 42547, "epoch": 1013} {"train_loss": -5.672560691833496, "global_step": 42548, "epoch": 1013} {"train_loss": -5.588931083679199, "global_step": 42549, "epoch": 1013} {"train_loss": -5.7005109786987305, "global_step": 42550, "epoch": 1013} {"train_loss": -5.57828950881958, "global_step": 42551, "epoch": 1013} {"train_loss": -5.671879291534424, "global_step": 42552, "epoch": 1013} {"train_loss": -5.673664093017578, "global_step": 42553, "epoch": 1013} {"train_loss": -5.634881973266602, "global_step": 42554, "epoch": 1013} {"train_loss": -5.654197692871094, "global_step": 42555, "epoch": 1013} {"train_loss": -5.710901260375977, "global_step": 42556, "epoch": 1013} {"train_loss": -5.481616020202637, "global_step": 42557, "epoch": 1013} {"train_loss": -5.576466083526611, "global_step": 42558, "epoch": 1013} {"train_loss": -5.746329307556152, "global_step": 42559, "epoch": 1013} {"train_loss": -5.610472679138184, "global_step": 42560, "epoch": 1013} {"train_loss": -5.665197372436523, "global_step": 42561, "epoch": 1013} {"train_loss": -5.66181755065918, "global_step": 42562, "epoch": 1013} {"train_loss": -5.748894691467285, "global_step": 42563, "epoch": 1013} {"train_loss": -5.778918743133545, "global_step": 42564, "epoch": 1013} {"train_loss": -5.602666854858398, "global_step": 42565, "epoch": 1013} {"train_loss": -5.6047468185424805, "global_step": 42566, "epoch": 1013} {"train_loss": -5.656267166137695, "global_step": 42567, "epoch": 1013} {"train_loss": -5.707967758178711, "global_step": 42568, "epoch": 1013} {"train_loss": -5.753124713897705, "global_step": 42569, "epoch": 1013} {"train_loss": -5.748680114746094, "global_step": 42570, "epoch": 1013} {"train_loss": -5.653348445892334, "global_step": 42571, "epoch": 1013} {"train_loss": -5.8513922691345215, "global_step": 42572, "epoch": 1013} {"train_loss": -5.649649620056152, "global_step": 42573, "epoch": 1013} {"train_loss": -5.60429573059082, "global_step": 42574, "epoch": 1013} {"train_loss": -5.689022064208984, "global_step": 42575, "epoch": 1013} {"train_loss": -5.534233570098877, "global_step": 42576, "epoch": 1013} {"train_loss": -5.626556396484375, "global_step": 42577, "epoch": 1013} {"train_loss": -5.65079402923584, "global_step": 42578, "epoch": 1013} {"train_loss": -5.6595683097839355, "global_step": 42579, "epoch": 1013} {"train_loss": -5.602848052978516, "global_step": 42580, "epoch": 1013} {"train_loss": -5.673853397369385, "global_step": 42581, "epoch": 1013} {"train_loss": -5.705629348754883, "global_step": 42582, "epoch": 1013} {"train_loss": -5.666515350341797, "global_step": 42583, "epoch": 1013} {"train_loss": -5.678868293762207, "global_step": 42584, "epoch": 1013} {"train_loss": -5.6349358558654785, "global_step": 42585, "epoch": 1013} {"train_loss": -5.608171463012695, "global_step": 42586, "epoch": 1013} {"train_loss": -5.6544710000356035, "global_step": 42587, "epoch": 1013, "val_loss": 66024.234375} {"train_loss": -5.602294921875, "global_step": 42588, "epoch": 1014} {"train_loss": -5.707722187042236, "global_step": 42589, "epoch": 1014} {"train_loss": -5.697309494018555, "global_step": 42590, "epoch": 1014} {"train_loss": -5.682900905609131, "global_step": 42591, "epoch": 1014} {"train_loss": -5.718758583068848, "global_step": 42592, "epoch": 1014} {"train_loss": -5.636933326721191, "global_step": 42593, "epoch": 1014} {"train_loss": -5.694544792175293, "global_step": 42594, "epoch": 1014} {"train_loss": -5.765443325042725, "global_step": 42595, "epoch": 1014} {"train_loss": -5.741610527038574, "global_step": 42596, "epoch": 1014} {"train_loss": -5.657290458679199, "global_step": 42597, "epoch": 1014} {"train_loss": -5.562308311462402, "global_step": 42598, "epoch": 1014} {"train_loss": -5.672008514404297, "global_step": 42599, "epoch": 1014} {"train_loss": -5.739803314208984, "global_step": 42600, "epoch": 1014} {"train_loss": -5.8044657707214355, "global_step": 42601, "epoch": 1014} {"train_loss": -5.56180477142334, "global_step": 42602, "epoch": 1014} {"train_loss": -5.551280498504639, "global_step": 42603, "epoch": 1014} {"train_loss": -5.637784004211426, "global_step": 42604, "epoch": 1014} {"train_loss": -5.672074317932129, "global_step": 42605, "epoch": 1014} {"train_loss": -5.681979179382324, "global_step": 42606, "epoch": 1014} {"train_loss": -5.721132278442383, "global_step": 42607, "epoch": 1014} {"train_loss": -5.492326736450195, "global_step": 42608, "epoch": 1014} {"train_loss": -5.7435712814331055, "global_step": 42609, "epoch": 1014} {"train_loss": -5.503691673278809, "global_step": 42610, "epoch": 1014} {"train_loss": -5.751883506774902, "global_step": 42611, "epoch": 1014} {"train_loss": -5.771142482757568, "global_step": 42612, "epoch": 1014} {"train_loss": -5.787627220153809, "global_step": 42613, "epoch": 1014} {"train_loss": -5.658555507659912, "global_step": 42614, "epoch": 1014} {"train_loss": -5.535883903503418, "global_step": 42615, "epoch": 1014} {"train_loss": -5.535763740539551, "global_step": 42616, "epoch": 1014} {"train_loss": -5.690350532531738, "global_step": 42617, "epoch": 1014} {"train_loss": -5.719113826751709, "global_step": 42618, "epoch": 1014} {"train_loss": -5.689135551452637, "global_step": 42619, "epoch": 1014} {"train_loss": -5.730057239532471, "global_step": 42620, "epoch": 1014} {"train_loss": -5.605498313903809, "global_step": 42621, "epoch": 1014} {"train_loss": -5.5777788162231445, "global_step": 42622, "epoch": 1014} {"train_loss": -5.760957717895508, "global_step": 42623, "epoch": 1014} {"train_loss": -5.714728355407715, "global_step": 42624, "epoch": 1014} {"train_loss": -5.691001892089844, "global_step": 42625, "epoch": 1014} {"train_loss": -5.576190948486328, "global_step": 42626, "epoch": 1014} {"train_loss": -5.621366500854492, "global_step": 42627, "epoch": 1014} {"train_loss": -5.668441295623779, "global_step": 42628, "epoch": 1014} {"train_loss": -5.667082752500262, "global_step": 42629, "epoch": 1014, "val_loss": 66147.65625} {"train_loss": -5.643102645874023, "global_step": 42630, "epoch": 1015} {"train_loss": -5.638193130493164, "global_step": 42631, "epoch": 1015} {"train_loss": -5.635708332061768, "global_step": 42632, "epoch": 1015} {"train_loss": -5.778271675109863, "global_step": 42633, "epoch": 1015} {"train_loss": -5.6406450271606445, "global_step": 42634, "epoch": 1015} {"train_loss": -5.726933479309082, "global_step": 42635, "epoch": 1015} {"train_loss": -5.749107360839844, "global_step": 42636, "epoch": 1015} {"train_loss": -5.653406143188477, "global_step": 42637, "epoch": 1015} {"train_loss": -5.707312107086182, "global_step": 42638, "epoch": 1015} {"train_loss": -5.686126232147217, "global_step": 42639, "epoch": 1015} {"train_loss": -5.670014381408691, "global_step": 42640, "epoch": 1015} {"train_loss": -5.595833778381348, "global_step": 42641, "epoch": 1015} {"train_loss": -5.509681701660156, "global_step": 42642, "epoch": 1015} {"train_loss": -5.750165939331055, "global_step": 42643, "epoch": 1015} {"train_loss": -5.672802448272705, "global_step": 42644, "epoch": 1015} {"train_loss": -5.631945610046387, "global_step": 42645, "epoch": 1015} {"train_loss": -5.669881820678711, "global_step": 42646, "epoch": 1015} {"train_loss": -5.672489166259766, "global_step": 42647, "epoch": 1015} {"train_loss": -5.7313032150268555, "global_step": 42648, "epoch": 1015} {"train_loss": -5.604644775390625, "global_step": 42649, "epoch": 1015} {"train_loss": -5.636039733886719, "global_step": 42650, "epoch": 1015} {"train_loss": -5.540582656860352, "global_step": 42651, "epoch": 1015} {"train_loss": -5.633670806884766, "global_step": 42652, "epoch": 1015} {"train_loss": -5.585500717163086, "global_step": 42653, "epoch": 1015} {"train_loss": -5.530669212341309, "global_step": 42654, "epoch": 1015} {"train_loss": -5.777709007263184, "global_step": 42655, "epoch": 1015} {"train_loss": -5.598845481872559, "global_step": 42656, "epoch": 1015} {"train_loss": -5.459636688232422, "global_step": 42657, "epoch": 1015} {"train_loss": -5.628609657287598, "global_step": 42658, "epoch": 1015} {"train_loss": -5.53678035736084, "global_step": 42659, "epoch": 1015} {"train_loss": -5.624281883239746, "global_step": 42660, "epoch": 1015} {"train_loss": -5.537829875946045, "global_step": 42661, "epoch": 1015} {"train_loss": -5.6507134437561035, "global_step": 42662, "epoch": 1015} {"train_loss": -5.617619514465332, "global_step": 42663, "epoch": 1015} {"train_loss": -5.704130172729492, "global_step": 42664, "epoch": 1015} {"train_loss": -5.664995193481445, "global_step": 42665, "epoch": 1015} {"train_loss": -5.7259440422058105, "global_step": 42666, "epoch": 1015} {"train_loss": -5.7253522872924805, "global_step": 42667, "epoch": 1015} {"train_loss": -5.60598087310791, "global_step": 42668, "epoch": 1015} {"train_loss": -5.668542385101318, "global_step": 42669, "epoch": 1015} {"train_loss": -5.642776012420654, "global_step": 42670, "epoch": 1015} {"train_loss": -5.64790145556132, "global_step": 42671, "epoch": 1015, "val_loss": 66098.453125} {"train_loss": -5.648263931274414, "global_step": 42672, "epoch": 1016} {"train_loss": -5.556937217712402, "global_step": 42673, "epoch": 1016} {"train_loss": -5.657692909240723, "global_step": 42674, "epoch": 1016} {"train_loss": -5.83171272277832, "global_step": 42675, "epoch": 1016} {"train_loss": -5.666876792907715, "global_step": 42676, "epoch": 1016} {"train_loss": -5.7106828689575195, "global_step": 42677, "epoch": 1016} {"train_loss": -5.656676769256592, "global_step": 42678, "epoch": 1016} {"train_loss": -5.551822662353516, "global_step": 42679, "epoch": 1016} {"train_loss": -5.803884506225586, "global_step": 42680, "epoch": 1016} {"train_loss": -5.752720832824707, "global_step": 42681, "epoch": 1016} {"train_loss": -5.736886024475098, "global_step": 42682, "epoch": 1016} {"train_loss": -5.710309982299805, "global_step": 42683, "epoch": 1016} {"train_loss": -5.7527313232421875, "global_step": 42684, "epoch": 1016} {"train_loss": -5.5043044090271, "global_step": 42685, "epoch": 1016} {"train_loss": -5.632514953613281, "global_step": 42686, "epoch": 1016} {"train_loss": -5.682705402374268, "global_step": 42687, "epoch": 1016} {"train_loss": -5.582944869995117, "global_step": 42688, "epoch": 1016} {"train_loss": -5.601700782775879, "global_step": 42689, "epoch": 1016} {"train_loss": -5.707179069519043, "global_step": 42690, "epoch": 1016} {"train_loss": -5.632190704345703, "global_step": 42691, "epoch": 1016} {"train_loss": -5.656599044799805, "global_step": 42692, "epoch": 1016} {"train_loss": -5.686197280883789, "global_step": 42693, "epoch": 1016} {"train_loss": -5.760443687438965, "global_step": 42694, "epoch": 1016} {"train_loss": -5.812198162078857, "global_step": 42695, "epoch": 1016} {"train_loss": -5.65640926361084, "global_step": 42696, "epoch": 1016} {"train_loss": -5.744549751281738, "global_step": 42697, "epoch": 1016} {"train_loss": -5.803793907165527, "global_step": 42698, "epoch": 1016} {"train_loss": -5.645712852478027, "global_step": 42699, "epoch": 1016} {"train_loss": -5.700873851776123, "global_step": 42700, "epoch": 1016} {"train_loss": -5.672123908996582, "global_step": 42701, "epoch": 1016} {"train_loss": -5.82874870300293, "global_step": 42702, "epoch": 1016} {"train_loss": -5.611104488372803, "global_step": 42703, "epoch": 1016} {"train_loss": -5.604030609130859, "global_step": 42704, "epoch": 1016} {"train_loss": -5.777627944946289, "global_step": 42705, "epoch": 1016} {"train_loss": -5.63816499710083, "global_step": 42706, "epoch": 1016} {"train_loss": -5.647700786590576, "global_step": 42707, "epoch": 1016} {"train_loss": -5.623697757720947, "global_step": 42708, "epoch": 1016} {"train_loss": -5.609824180603027, "global_step": 42709, "epoch": 1016} {"train_loss": -5.741690158843994, "global_step": 42710, "epoch": 1016} {"train_loss": -5.7397589683532715, "global_step": 42711, "epoch": 1016} {"train_loss": -5.681829452514648, "global_step": 42712, "epoch": 1016} {"train_loss": -5.684667541867211, "global_step": 42713, "epoch": 1016, "val_loss": 66110.8203125} {"train_loss": -5.718434810638428, "global_step": 42714, "epoch": 1017} {"train_loss": -5.804083347320557, "global_step": 42715, "epoch": 1017} {"train_loss": -5.775277137756348, "global_step": 42716, "epoch": 1017} {"train_loss": -5.49143123626709, "global_step": 42717, "epoch": 1017} {"train_loss": -5.67333984375, "global_step": 42718, "epoch": 1017} {"train_loss": -5.654293060302734, "global_step": 42719, "epoch": 1017} {"train_loss": -5.577862739562988, "global_step": 42720, "epoch": 1017} {"train_loss": -5.725590705871582, "global_step": 42721, "epoch": 1017} {"train_loss": -5.576316833496094, "global_step": 42722, "epoch": 1017} {"train_loss": -5.6432976722717285, "global_step": 42723, "epoch": 1017} {"train_loss": -5.684080123901367, "global_step": 42724, "epoch": 1017} {"train_loss": -5.6661834716796875, "global_step": 42725, "epoch": 1017} {"train_loss": -5.635566711425781, "global_step": 42726, "epoch": 1017} {"train_loss": -5.7540178298950195, "global_step": 42727, "epoch": 1017} {"train_loss": -5.604865074157715, "global_step": 42728, "epoch": 1017} {"train_loss": -5.479586601257324, "global_step": 42729, "epoch": 1017} {"train_loss": -5.485499858856201, "global_step": 42730, "epoch": 1017} {"train_loss": -5.711104393005371, "global_step": 42731, "epoch": 1017} {"train_loss": -5.488526821136475, "global_step": 42732, "epoch": 1017} {"train_loss": -5.564422607421875, "global_step": 42733, "epoch": 1017} {"train_loss": -5.696831226348877, "global_step": 42734, "epoch": 1017} {"train_loss": -5.510296821594238, "global_step": 42735, "epoch": 1017} {"train_loss": -5.676950454711914, "global_step": 42736, "epoch": 1017} {"train_loss": -5.621629238128662, "global_step": 42737, "epoch": 1017} {"train_loss": -5.659825801849365, "global_step": 42738, "epoch": 1017} {"train_loss": -5.615023612976074, "global_step": 42739, "epoch": 1017} {"train_loss": -5.646977424621582, "global_step": 42740, "epoch": 1017} {"train_loss": -5.8099799156188965, "global_step": 42741, "epoch": 1017} {"train_loss": -5.556975364685059, "global_step": 42742, "epoch": 1017} {"train_loss": -5.703236103057861, "global_step": 42743, "epoch": 1017} {"train_loss": -5.62733268737793, "global_step": 42744, "epoch": 1017} {"train_loss": -5.904007434844971, "global_step": 42745, "epoch": 1017} {"train_loss": -5.574045658111572, "global_step": 42746, "epoch": 1017} {"train_loss": -5.678193092346191, "global_step": 42747, "epoch": 1017} {"train_loss": -5.592060089111328, "global_step": 42748, "epoch": 1017} {"train_loss": -5.698756217956543, "global_step": 42749, "epoch": 1017} {"train_loss": -5.6286821365356445, "global_step": 42750, "epoch": 1017} {"train_loss": -5.65008544921875, "global_step": 42751, "epoch": 1017} {"train_loss": -5.676003456115723, "global_step": 42752, "epoch": 1017} {"train_loss": -5.700758934020996, "global_step": 42753, "epoch": 1017} {"train_loss": -5.831648826599121, "global_step": 42754, "epoch": 1017} {"train_loss": -5.652492398307437, "global_step": 42755, "epoch": 1017, "val_loss": 66203.3359375} {"train_loss": -5.651864051818848, "global_step": 42756, "epoch": 1018} {"train_loss": -5.789650917053223, "global_step": 42757, "epoch": 1018} {"train_loss": -5.704649925231934, "global_step": 42758, "epoch": 1018} {"train_loss": -5.750709533691406, "global_step": 42759, "epoch": 1018} {"train_loss": -5.7165727615356445, "global_step": 42760, "epoch": 1018} {"train_loss": -5.719436168670654, "global_step": 42761, "epoch": 1018} {"train_loss": -5.713213920593262, "global_step": 42762, "epoch": 1018} {"train_loss": -5.836133003234863, "global_step": 42763, "epoch": 1018} {"train_loss": -5.659885406494141, "global_step": 42764, "epoch": 1018} {"train_loss": -5.555266380310059, "global_step": 42765, "epoch": 1018} {"train_loss": -5.602731227874756, "global_step": 42766, "epoch": 1018} {"train_loss": -5.611196994781494, "global_step": 42767, "epoch": 1018} {"train_loss": -5.672540664672852, "global_step": 42768, "epoch": 1018} {"train_loss": -5.8205180168151855, "global_step": 42769, "epoch": 1018} {"train_loss": -5.605422019958496, "global_step": 42770, "epoch": 1018} {"train_loss": -5.736428260803223, "global_step": 42771, "epoch": 1018} {"train_loss": -5.738040924072266, "global_step": 42772, "epoch": 1018} {"train_loss": -5.602983474731445, "global_step": 42773, "epoch": 1018} {"train_loss": -5.694774627685547, "global_step": 42774, "epoch": 1018} {"train_loss": -5.643651962280273, "global_step": 42775, "epoch": 1018} {"train_loss": -5.597453594207764, "global_step": 42776, "epoch": 1018} {"train_loss": -5.790242671966553, "global_step": 42777, "epoch": 1018} {"train_loss": -5.604794979095459, "global_step": 42778, "epoch": 1018} {"train_loss": -5.535877227783203, "global_step": 42779, "epoch": 1018} {"train_loss": -5.613736629486084, "global_step": 42780, "epoch": 1018} {"train_loss": -5.62493896484375, "global_step": 42781, "epoch": 1018} {"train_loss": -5.552882194519043, "global_step": 42782, "epoch": 1018} {"train_loss": -5.806085586547852, "global_step": 42783, "epoch": 1018} {"train_loss": -5.603583335876465, "global_step": 42784, "epoch": 1018} {"train_loss": -5.711095809936523, "global_step": 42785, "epoch": 1018} {"train_loss": -5.639021873474121, "global_step": 42786, "epoch": 1018} {"train_loss": -5.74828577041626, "global_step": 42787, "epoch": 1018} {"train_loss": -5.7443695068359375, "global_step": 42788, "epoch": 1018} {"train_loss": -5.678518295288086, "global_step": 42789, "epoch": 1018} {"train_loss": -5.587501525878906, "global_step": 42790, "epoch": 1018} {"train_loss": -5.647002696990967, "global_step": 42791, "epoch": 1018} {"train_loss": -5.608439922332764, "global_step": 42792, "epoch": 1018} {"train_loss": -5.6999735832214355, "global_step": 42793, "epoch": 1018} {"train_loss": -5.599740982055664, "global_step": 42794, "epoch": 1018} {"train_loss": -5.720891952514648, "global_step": 42795, "epoch": 1018} {"train_loss": -5.678408145904541, "global_step": 42796, "epoch": 1018} {"train_loss": -5.671507824034918, "global_step": 42797, "epoch": 1018, "val_loss": 66167.0} {"train_loss": -5.687521934509277, "global_step": 42798, "epoch": 1019} {"train_loss": -5.5977783203125, "global_step": 42799, "epoch": 1019} {"train_loss": -5.733256816864014, "global_step": 42800, "epoch": 1019} {"train_loss": -5.777145862579346, "global_step": 42801, "epoch": 1019} {"train_loss": -5.727703094482422, "global_step": 42802, "epoch": 1019} {"train_loss": -5.62367057800293, "global_step": 42803, "epoch": 1019} {"train_loss": -5.7293381690979, "global_step": 42804, "epoch": 1019} {"train_loss": -5.707881927490234, "global_step": 42805, "epoch": 1019} {"train_loss": -5.59120512008667, "global_step": 42806, "epoch": 1019} {"train_loss": -5.615902423858643, "global_step": 42807, "epoch": 1019} {"train_loss": -5.731947422027588, "global_step": 42808, "epoch": 1019} {"train_loss": -5.754764080047607, "global_step": 42809, "epoch": 1019} {"train_loss": -5.761648178100586, "global_step": 42810, "epoch": 1019} {"train_loss": -5.603903770446777, "global_step": 42811, "epoch": 1019} {"train_loss": -5.707653045654297, "global_step": 42812, "epoch": 1019} {"train_loss": -5.632408618927002, "global_step": 42813, "epoch": 1019} {"train_loss": -5.744872570037842, "global_step": 42814, "epoch": 1019} {"train_loss": -5.703764915466309, "global_step": 42815, "epoch": 1019} {"train_loss": -5.7895684242248535, "global_step": 42816, "epoch": 1019} {"train_loss": -5.741399765014648, "global_step": 42817, "epoch": 1019} {"train_loss": -5.751558303833008, "global_step": 42818, "epoch": 1019} {"train_loss": -5.657357215881348, "global_step": 42819, "epoch": 1019} {"train_loss": -5.614669322967529, "global_step": 42820, "epoch": 1019} {"train_loss": -5.678056716918945, "global_step": 42821, "epoch": 1019} {"train_loss": -5.649217128753662, "global_step": 42822, "epoch": 1019} {"train_loss": -5.629586219787598, "global_step": 42823, "epoch": 1019} {"train_loss": -5.688926696777344, "global_step": 42824, "epoch": 1019} {"train_loss": -5.583428382873535, "global_step": 42825, "epoch": 1019} {"train_loss": -5.722826957702637, "global_step": 42826, "epoch": 1019} {"train_loss": -5.660262584686279, "global_step": 42827, "epoch": 1019} {"train_loss": -5.732396125793457, "global_step": 42828, "epoch": 1019} {"train_loss": -5.737379550933838, "global_step": 42829, "epoch": 1019} {"train_loss": -5.600767612457275, "global_step": 42830, "epoch": 1019} {"train_loss": -5.819308280944824, "global_step": 42831, "epoch": 1019} {"train_loss": -5.733179092407227, "global_step": 42832, "epoch": 1019} {"train_loss": -5.705674171447754, "global_step": 42833, "epoch": 1019} {"train_loss": -5.666099548339844, "global_step": 42834, "epoch": 1019} {"train_loss": -5.675478935241699, "global_step": 42835, "epoch": 1019} {"train_loss": -5.555175304412842, "global_step": 42836, "epoch": 1019} {"train_loss": -5.696403980255127, "global_step": 42837, "epoch": 1019} {"train_loss": -5.891045570373535, "global_step": 42838, "epoch": 1019} {"train_loss": -5.689489444096883, "global_step": 42839, "epoch": 1019, "val_loss": 66110.9453125} {"train_loss": -5.69550085067749, "global_step": 42840, "epoch": 1020} {"train_loss": -5.729635715484619, "global_step": 42841, "epoch": 1020} {"train_loss": -5.595752716064453, "global_step": 42842, "epoch": 1020} {"train_loss": -5.7376484870910645, "global_step": 42843, "epoch": 1020} {"train_loss": -5.7786455154418945, "global_step": 42844, "epoch": 1020} {"train_loss": -5.581299781799316, "global_step": 42845, "epoch": 1020} {"train_loss": -5.688857078552246, "global_step": 42846, "epoch": 1020} {"train_loss": -5.702343940734863, "global_step": 42847, "epoch": 1020} {"train_loss": -5.764404296875, "global_step": 42848, "epoch": 1020} {"train_loss": -5.7613983154296875, "global_step": 42849, "epoch": 1020} {"train_loss": -5.704853057861328, "global_step": 42850, "epoch": 1020} {"train_loss": -5.667021751403809, "global_step": 42851, "epoch": 1020} {"train_loss": -5.566631317138672, "global_step": 42852, "epoch": 1020} {"train_loss": -5.614055633544922, "global_step": 42853, "epoch": 1020} {"train_loss": -5.639542102813721, "global_step": 42854, "epoch": 1020} {"train_loss": -5.7572503089904785, "global_step": 42855, "epoch": 1020} {"train_loss": -5.71527099609375, "global_step": 42856, "epoch": 1020} {"train_loss": -5.811863899230957, "global_step": 42857, "epoch": 1020} {"train_loss": -5.793144226074219, "global_step": 42858, "epoch": 1020} {"train_loss": -5.526329517364502, "global_step": 42859, "epoch": 1020} {"train_loss": -5.613523960113525, "global_step": 42860, "epoch": 1020} {"train_loss": -5.659671783447266, "global_step": 42861, "epoch": 1020} {"train_loss": -5.692431449890137, "global_step": 42862, "epoch": 1020} {"train_loss": -5.730990409851074, "global_step": 42863, "epoch": 1020} {"train_loss": -5.747181415557861, "global_step": 42864, "epoch": 1020} {"train_loss": -5.731281280517578, "global_step": 42865, "epoch": 1020} {"train_loss": -5.661516189575195, "global_step": 42866, "epoch": 1020} {"train_loss": -5.550699234008789, "global_step": 42867, "epoch": 1020} {"train_loss": -5.713300704956055, "global_step": 42868, "epoch": 1020} {"train_loss": -5.707370758056641, "global_step": 42869, "epoch": 1020} {"train_loss": -5.716904640197754, "global_step": 42870, "epoch": 1020} {"train_loss": -5.589715003967285, "global_step": 42871, "epoch": 1020} {"train_loss": -5.694688320159912, "global_step": 42872, "epoch": 1020} {"train_loss": -5.641141891479492, "global_step": 42873, "epoch": 1020} {"train_loss": -5.562646389007568, "global_step": 42874, "epoch": 1020} {"train_loss": -5.754812717437744, "global_step": 42875, "epoch": 1020} {"train_loss": -5.6960978507995605, "global_step": 42876, "epoch": 1020} {"train_loss": -5.591249465942383, "global_step": 42877, "epoch": 1020} {"train_loss": -5.698637962341309, "global_step": 42878, "epoch": 1020} {"train_loss": -5.6799421310424805, "global_step": 42879, "epoch": 1020} {"train_loss": -5.540895938873291, "global_step": 42880, "epoch": 1020} {"train_loss": -5.674743243626186, "global_step": 42881, "epoch": 1020, "val_loss": 65860.4609375} {"train_loss": -5.664578437805176, "global_step": 42882, "epoch": 1021} {"train_loss": -5.689202308654785, "global_step": 42883, "epoch": 1021} {"train_loss": -5.721464157104492, "global_step": 42884, "epoch": 1021} {"train_loss": -5.7269439697265625, "global_step": 42885, "epoch": 1021} {"train_loss": -5.51399040222168, "global_step": 42886, "epoch": 1021} {"train_loss": -5.69019889831543, "global_step": 42887, "epoch": 1021} {"train_loss": -5.699188232421875, "global_step": 42888, "epoch": 1021} {"train_loss": -5.735569953918457, "global_step": 42889, "epoch": 1021} {"train_loss": -5.709880828857422, "global_step": 42890, "epoch": 1021} {"train_loss": -5.712776184082031, "global_step": 42891, "epoch": 1021} {"train_loss": -5.51063346862793, "global_step": 42892, "epoch": 1021} {"train_loss": -5.71486234664917, "global_step": 42893, "epoch": 1021} {"train_loss": -5.64176607131958, "global_step": 42894, "epoch": 1021} {"train_loss": -5.706690311431885, "global_step": 42895, "epoch": 1021} {"train_loss": -5.718184471130371, "global_step": 42896, "epoch": 1021} {"train_loss": -5.7167863845825195, "global_step": 42897, "epoch": 1021} {"train_loss": -5.722434997558594, "global_step": 42898, "epoch": 1021} {"train_loss": -5.691956520080566, "global_step": 42899, "epoch": 1021} {"train_loss": -5.510288238525391, "global_step": 42900, "epoch": 1021} {"train_loss": -5.657927513122559, "global_step": 42901, "epoch": 1021} {"train_loss": -5.727564811706543, "global_step": 42902, "epoch": 1021} {"train_loss": -5.661472320556641, "global_step": 42903, "epoch": 1021} {"train_loss": -5.589556694030762, "global_step": 42904, "epoch": 1021} {"train_loss": -5.658619403839111, "global_step": 42905, "epoch": 1021} {"train_loss": -5.671159267425537, "global_step": 42906, "epoch": 1021} {"train_loss": -5.703894138336182, "global_step": 42907, "epoch": 1021} {"train_loss": -5.700667381286621, "global_step": 42908, "epoch": 1021} {"train_loss": -5.60930061340332, "global_step": 42909, "epoch": 1021} {"train_loss": -5.672939300537109, "global_step": 42910, "epoch": 1021} {"train_loss": -5.584411144256592, "global_step": 42911, "epoch": 1021} {"train_loss": -5.639137268066406, "global_step": 42912, "epoch": 1021} {"train_loss": -5.644086837768555, "global_step": 42913, "epoch": 1021} {"train_loss": -5.725193023681641, "global_step": 42914, "epoch": 1021} {"train_loss": -5.581534385681152, "global_step": 42915, "epoch": 1021} {"train_loss": -5.586733818054199, "global_step": 42916, "epoch": 1021} {"train_loss": -5.708225727081299, "global_step": 42917, "epoch": 1021} {"train_loss": -5.761722564697266, "global_step": 42918, "epoch": 1021} {"train_loss": -5.6278276443481445, "global_step": 42919, "epoch": 1021} {"train_loss": -5.589054584503174, "global_step": 42920, "epoch": 1021} {"train_loss": -5.520637512207031, "global_step": 42921, "epoch": 1021} {"train_loss": -5.731799602508545, "global_step": 42922, "epoch": 1021} {"train_loss": -5.664667277109055, "global_step": 42923, "epoch": 1021, "val_loss": 66191.171875} {"train_loss": -5.5718255043029785, "global_step": 42924, "epoch": 1022} {"train_loss": -5.672942638397217, "global_step": 42925, "epoch": 1022} {"train_loss": -5.706254005432129, "global_step": 42926, "epoch": 1022} {"train_loss": -5.700867652893066, "global_step": 42927, "epoch": 1022} {"train_loss": -5.667498588562012, "global_step": 42928, "epoch": 1022} {"train_loss": -5.706584453582764, "global_step": 42929, "epoch": 1022} {"train_loss": -5.780022621154785, "global_step": 42930, "epoch": 1022} {"train_loss": -5.746877670288086, "global_step": 42931, "epoch": 1022} {"train_loss": -5.74333381652832, "global_step": 42932, "epoch": 1022} {"train_loss": -5.787621974945068, "global_step": 42933, "epoch": 1022} {"train_loss": -5.694870948791504, "global_step": 42934, "epoch": 1022} {"train_loss": -5.7409772872924805, "global_step": 42935, "epoch": 1022} {"train_loss": -5.671797752380371, "global_step": 42936, "epoch": 1022} {"train_loss": -5.790881156921387, "global_step": 42937, "epoch": 1022} {"train_loss": -5.699433326721191, "global_step": 42938, "epoch": 1022} {"train_loss": -5.6233930587768555, "global_step": 42939, "epoch": 1022} {"train_loss": -5.59750509262085, "global_step": 42940, "epoch": 1022} {"train_loss": -5.691089630126953, "global_step": 42941, "epoch": 1022} {"train_loss": -5.583876609802246, "global_step": 42942, "epoch": 1022} {"train_loss": -5.623431205749512, "global_step": 42943, "epoch": 1022} {"train_loss": -5.5994720458984375, "global_step": 42944, "epoch": 1022} {"train_loss": -5.730368137359619, "global_step": 42945, "epoch": 1022} {"train_loss": -5.56383752822876, "global_step": 42946, "epoch": 1022} {"train_loss": -5.639150619506836, "global_step": 42947, "epoch": 1022} {"train_loss": -5.754146575927734, "global_step": 42948, "epoch": 1022} {"train_loss": -5.654356002807617, "global_step": 42949, "epoch": 1022} {"train_loss": -5.7058258056640625, "global_step": 42950, "epoch": 1022} {"train_loss": -5.656251907348633, "global_step": 42951, "epoch": 1022} {"train_loss": -5.618890285491943, "global_step": 42952, "epoch": 1022} {"train_loss": -5.750809669494629, "global_step": 42953, "epoch": 1022} {"train_loss": -5.758064270019531, "global_step": 42954, "epoch": 1022} {"train_loss": -5.612297058105469, "global_step": 42955, "epoch": 1022} {"train_loss": -5.632359981536865, "global_step": 42956, "epoch": 1022} {"train_loss": -5.6668243408203125, "global_step": 42957, "epoch": 1022} {"train_loss": -5.769581317901611, "global_step": 42958, "epoch": 1022} {"train_loss": -5.743696689605713, "global_step": 42959, "epoch": 1022} {"train_loss": -5.720469951629639, "global_step": 42960, "epoch": 1022} {"train_loss": -5.66220760345459, "global_step": 42961, "epoch": 1022} {"train_loss": -5.747328758239746, "global_step": 42962, "epoch": 1022} {"train_loss": -5.7066731452941895, "global_step": 42963, "epoch": 1022} {"train_loss": -5.657942771911621, "global_step": 42964, "epoch": 1022} {"train_loss": -5.689357348850796, "global_step": 42965, "epoch": 1022, "val_loss": 65973.765625} {"train_loss": -5.749942779541016, "global_step": 42966, "epoch": 1023} {"train_loss": -5.696281433105469, "global_step": 42967, "epoch": 1023} {"train_loss": -5.559149742126465, "global_step": 42968, "epoch": 1023} {"train_loss": -5.677162170410156, "global_step": 42969, "epoch": 1023} {"train_loss": -5.73189115524292, "global_step": 42970, "epoch": 1023} {"train_loss": -5.683638572692871, "global_step": 42971, "epoch": 1023} {"train_loss": -5.773093223571777, "global_step": 42972, "epoch": 1023} {"train_loss": -5.599705696105957, "global_step": 42973, "epoch": 1023} {"train_loss": -5.680102348327637, "global_step": 42974, "epoch": 1023} {"train_loss": -5.692460060119629, "global_step": 42975, "epoch": 1023} {"train_loss": -5.721582412719727, "global_step": 42976, "epoch": 1023} {"train_loss": -5.673891067504883, "global_step": 42977, "epoch": 1023} {"train_loss": -5.7645392417907715, "global_step": 42978, "epoch": 1023} {"train_loss": -5.7279744148254395, "global_step": 42979, "epoch": 1023} {"train_loss": -5.75959587097168, "global_step": 42980, "epoch": 1023} {"train_loss": -5.6764726638793945, "global_step": 42981, "epoch": 1023} {"train_loss": -5.743797779083252, "global_step": 42982, "epoch": 1023} {"train_loss": -5.667436599731445, "global_step": 42983, "epoch": 1023} {"train_loss": -5.634616851806641, "global_step": 42984, "epoch": 1023} {"train_loss": -5.67331600189209, "global_step": 42985, "epoch": 1023} {"train_loss": -5.785732269287109, "global_step": 42986, "epoch": 1023} {"train_loss": -5.674291610717773, "global_step": 42987, "epoch": 1023} {"train_loss": -5.5152082443237305, "global_step": 42988, "epoch": 1023} {"train_loss": -5.680604457855225, "global_step": 42989, "epoch": 1023} {"train_loss": -5.665120601654053, "global_step": 42990, "epoch": 1023} {"train_loss": -5.617654800415039, "global_step": 42991, "epoch": 1023} {"train_loss": -5.550783157348633, "global_step": 42992, "epoch": 1023} {"train_loss": -5.7532639503479, "global_step": 42993, "epoch": 1023} {"train_loss": -5.610185623168945, "global_step": 42994, "epoch": 1023} {"train_loss": -5.757120132446289, "global_step": 42995, "epoch": 1023} {"train_loss": -5.777585029602051, "global_step": 42996, "epoch": 1023} {"train_loss": -5.645004749298096, "global_step": 42997, "epoch": 1023} {"train_loss": -5.5582451820373535, "global_step": 42998, "epoch": 1023} {"train_loss": -5.604335784912109, "global_step": 42999, "epoch": 1023} {"train_loss": -5.7215681076049805, "global_step": 43000, "epoch": 1023} {"train_loss": -5.617264270782471, "global_step": 43001, "epoch": 1023} {"train_loss": -5.662526607513428, "global_step": 43002, "epoch": 1023} {"train_loss": -5.677615165710449, "global_step": 43003, "epoch": 1023} {"train_loss": -5.698819160461426, "global_step": 43004, "epoch": 1023} {"train_loss": -5.686570167541504, "global_step": 43005, "epoch": 1023} {"train_loss": -5.711347579956055, "global_step": 43006, "epoch": 1023} {"train_loss": -5.678942691712153, "global_step": 43007, "epoch": 1023, "val_loss": 66035.1015625} {"train_loss": -5.6989617347717285, "global_step": 43008, "epoch": 1024} {"train_loss": -5.702340126037598, "global_step": 43009, "epoch": 1024} {"train_loss": -5.600024223327637, "global_step": 43010, "epoch": 1024} {"train_loss": -5.8095245361328125, "global_step": 43011, "epoch": 1024} {"train_loss": -5.742874622344971, "global_step": 43012, "epoch": 1024} {"train_loss": -5.711280822753906, "global_step": 43013, "epoch": 1024} {"train_loss": -5.648717880249023, "global_step": 43014, "epoch": 1024} {"train_loss": -5.544351577758789, "global_step": 43015, "epoch": 1024} {"train_loss": -5.6264472007751465, "global_step": 43016, "epoch": 1024} {"train_loss": -5.57504415512085, "global_step": 43017, "epoch": 1024} {"train_loss": -5.564690589904785, "global_step": 43018, "epoch": 1024} {"train_loss": -5.579941749572754, "global_step": 43019, "epoch": 1024} {"train_loss": -5.5557661056518555, "global_step": 43020, "epoch": 1024} {"train_loss": -5.786311149597168, "global_step": 43021, "epoch": 1024} {"train_loss": -5.600258827209473, "global_step": 43022, "epoch": 1024} {"train_loss": -5.622779846191406, "global_step": 43023, "epoch": 1024} {"train_loss": -5.676785945892334, "global_step": 43024, "epoch": 1024} {"train_loss": -5.428865909576416, "global_step": 43025, "epoch": 1024} {"train_loss": -5.651285171508789, "global_step": 43026, "epoch": 1024} {"train_loss": -5.532252788543701, "global_step": 43027, "epoch": 1024} {"train_loss": -5.714821815490723, "global_step": 43028, "epoch": 1024} {"train_loss": -5.567358493804932, "global_step": 43029, "epoch": 1024} {"train_loss": -5.63316535949707, "global_step": 43030, "epoch": 1024} {"train_loss": -5.801329612731934, "global_step": 43031, "epoch": 1024} {"train_loss": -5.730727195739746, "global_step": 43032, "epoch": 1024} {"train_loss": -5.56194543838501, "global_step": 43033, "epoch": 1024} {"train_loss": -5.785038948059082, "global_step": 43034, "epoch": 1024} {"train_loss": -5.6381635665893555, "global_step": 43035, "epoch": 1024} {"train_loss": -5.698970317840576, "global_step": 43036, "epoch": 1024} {"train_loss": -5.746787071228027, "global_step": 43037, "epoch": 1024} {"train_loss": -5.679594039916992, "global_step": 43038, "epoch": 1024} {"train_loss": -5.722411155700684, "global_step": 43039, "epoch": 1024} {"train_loss": -5.711375713348389, "global_step": 43040, "epoch": 1024} {"train_loss": -5.804544448852539, "global_step": 43041, "epoch": 1024} {"train_loss": -5.569405555725098, "global_step": 43042, "epoch": 1024} {"train_loss": -5.672257423400879, "global_step": 43043, "epoch": 1024} {"train_loss": -5.750680923461914, "global_step": 43044, "epoch": 1024} {"train_loss": -5.629467010498047, "global_step": 43045, "epoch": 1024} {"train_loss": -5.570608139038086, "global_step": 43046, "epoch": 1024} {"train_loss": -5.600433349609375, "global_step": 43047, "epoch": 1024} {"train_loss": -5.574796199798584, "global_step": 43048, "epoch": 1024} {"train_loss": -5.656105938411894, "global_step": 43049, "epoch": 1024, "val_loss": 66370.6015625} {"train_loss": -5.709182262420654, "global_step": 43050, "epoch": 1025} {"train_loss": -5.614799499511719, "global_step": 43051, "epoch": 1025} {"train_loss": -5.55159854888916, "global_step": 43052, "epoch": 1025} {"train_loss": -5.667111396789551, "global_step": 43053, "epoch": 1025} {"train_loss": -5.69346809387207, "global_step": 43054, "epoch": 1025} {"train_loss": -5.571586608886719, "global_step": 43055, "epoch": 1025} {"train_loss": -5.54033088684082, "global_step": 43056, "epoch": 1025} {"train_loss": -5.590629577636719, "global_step": 43057, "epoch": 1025} {"train_loss": -5.747347831726074, "global_step": 43058, "epoch": 1025} {"train_loss": -5.819212913513184, "global_step": 43059, "epoch": 1025} {"train_loss": -5.703620910644531, "global_step": 43060, "epoch": 1025} {"train_loss": -5.60272216796875, "global_step": 43061, "epoch": 1025} {"train_loss": -5.6688642501831055, "global_step": 43062, "epoch": 1025} {"train_loss": -5.589734077453613, "global_step": 43063, "epoch": 1025} {"train_loss": -5.668788433074951, "global_step": 43064, "epoch": 1025} {"train_loss": -5.835165977478027, "global_step": 43065, "epoch": 1025} {"train_loss": -5.7050371170043945, "global_step": 43066, "epoch": 1025} {"train_loss": -5.914057731628418, "global_step": 43067, "epoch": 1025} {"train_loss": -5.709917068481445, "global_step": 43068, "epoch": 1025} {"train_loss": -5.730757713317871, "global_step": 43069, "epoch": 1025} {"train_loss": -5.677260875701904, "global_step": 43070, "epoch": 1025} {"train_loss": -5.6145453453063965, "global_step": 43071, "epoch": 1025} {"train_loss": -5.6027326583862305, "global_step": 43072, "epoch": 1025} {"train_loss": -5.631068706512451, "global_step": 43073, "epoch": 1025} {"train_loss": -5.7571563720703125, "global_step": 43074, "epoch": 1025} {"train_loss": -5.743842124938965, "global_step": 43075, "epoch": 1025} {"train_loss": -5.701224327087402, "global_step": 43076, "epoch": 1025} {"train_loss": -5.62497615814209, "global_step": 43077, "epoch": 1025} {"train_loss": -5.656663417816162, "global_step": 43078, "epoch": 1025} {"train_loss": -5.632436752319336, "global_step": 43079, "epoch": 1025} {"train_loss": -5.756467342376709, "global_step": 43080, "epoch": 1025} {"train_loss": -5.7390546798706055, "global_step": 43081, "epoch": 1025} {"train_loss": -5.697139739990234, "global_step": 43082, "epoch": 1025} {"train_loss": -5.824959754943848, "global_step": 43083, "epoch": 1025} {"train_loss": -5.622761249542236, "global_step": 43084, "epoch": 1025} {"train_loss": -5.798885345458984, "global_step": 43085, "epoch": 1025} {"train_loss": -5.738617897033691, "global_step": 43086, "epoch": 1025} {"train_loss": -5.7512359619140625, "global_step": 43087, "epoch": 1025} {"train_loss": -5.699353218078613, "global_step": 43088, "epoch": 1025} {"train_loss": -5.6075520515441895, "global_step": 43089, "epoch": 1025} {"train_loss": -5.696082592010498, "global_step": 43090, "epoch": 1025} {"train_loss": -5.684066931406657, "global_step": 43091, "epoch": 1025, "val_loss": 66543.2890625} {"train_loss": -5.657552719116211, "global_step": 43092, "epoch": 1026} {"train_loss": -5.6947174072265625, "global_step": 43093, "epoch": 1026} {"train_loss": -5.6597900390625, "global_step": 43094, "epoch": 1026} {"train_loss": -5.626031875610352, "global_step": 43095, "epoch": 1026} {"train_loss": -5.5645856857299805, "global_step": 43096, "epoch": 1026} {"train_loss": -5.592896461486816, "global_step": 43097, "epoch": 1026} {"train_loss": -5.552995204925537, "global_step": 43098, "epoch": 1026} {"train_loss": -5.621440410614014, "global_step": 43099, "epoch": 1026} {"train_loss": -5.552630424499512, "global_step": 43100, "epoch": 1026} {"train_loss": -5.674675941467285, "global_step": 43101, "epoch": 1026} {"train_loss": -5.680346965789795, "global_step": 43102, "epoch": 1026} {"train_loss": -5.5934367179870605, "global_step": 43103, "epoch": 1026} {"train_loss": -5.749402046203613, "global_step": 43104, "epoch": 1026} {"train_loss": -5.669755458831787, "global_step": 43105, "epoch": 1026} {"train_loss": -5.605860710144043, "global_step": 43106, "epoch": 1026} {"train_loss": -5.602171897888184, "global_step": 43107, "epoch": 1026} {"train_loss": -5.653800964355469, "global_step": 43108, "epoch": 1026} {"train_loss": -5.628904342651367, "global_step": 43109, "epoch": 1026} {"train_loss": -5.556816101074219, "global_step": 43110, "epoch": 1026} {"train_loss": -5.682115077972412, "global_step": 43111, "epoch": 1026} {"train_loss": -5.4808759689331055, "global_step": 43112, "epoch": 1026} {"train_loss": -5.574889183044434, "global_step": 43113, "epoch": 1026} {"train_loss": -5.755035400390625, "global_step": 43114, "epoch": 1026} {"train_loss": -5.621710777282715, "global_step": 43115, "epoch": 1026} {"train_loss": -5.786471843719482, "global_step": 43116, "epoch": 1026} {"train_loss": -5.6130828857421875, "global_step": 43117, "epoch": 1026} {"train_loss": -5.640222549438477, "global_step": 43118, "epoch": 1026} {"train_loss": -5.767645835876465, "global_step": 43119, "epoch": 1026} {"train_loss": -5.552557468414307, "global_step": 43120, "epoch": 1026} {"train_loss": -5.62852668762207, "global_step": 43121, "epoch": 1026} {"train_loss": -5.661687850952148, "global_step": 43122, "epoch": 1026} {"train_loss": -5.553832530975342, "global_step": 43123, "epoch": 1026} {"train_loss": -5.622419834136963, "global_step": 43124, "epoch": 1026} {"train_loss": -5.651555061340332, "global_step": 43125, "epoch": 1026} {"train_loss": -5.727447509765625, "global_step": 43126, "epoch": 1026} {"train_loss": -5.742660999298096, "global_step": 43127, "epoch": 1026} {"train_loss": -5.526723861694336, "global_step": 43128, "epoch": 1026} {"train_loss": -5.676032543182373, "global_step": 43129, "epoch": 1026} {"train_loss": -5.602272033691406, "global_step": 43130, "epoch": 1026} {"train_loss": -5.5875139236450195, "global_step": 43131, "epoch": 1026} {"train_loss": -5.685547828674316, "global_step": 43132, "epoch": 1026} {"train_loss": -5.6377316770099455, "global_step": 43133, "epoch": 1026, "val_loss": 66073.28125} {"train_loss": -5.610182762145996, "global_step": 43134, "epoch": 1027} {"train_loss": -5.69729471206665, "global_step": 43135, "epoch": 1027} {"train_loss": -5.735611915588379, "global_step": 43136, "epoch": 1027} {"train_loss": -5.688309669494629, "global_step": 43137, "epoch": 1027} {"train_loss": -5.720317363739014, "global_step": 43138, "epoch": 1027} {"train_loss": -5.614191055297852, "global_step": 43139, "epoch": 1027} {"train_loss": -5.641096115112305, "global_step": 43140, "epoch": 1027} {"train_loss": -5.6329569816589355, "global_step": 43141, "epoch": 1027} {"train_loss": -5.603764533996582, "global_step": 43142, "epoch": 1027} {"train_loss": -5.509640693664551, "global_step": 43143, "epoch": 1027} {"train_loss": -5.701077938079834, "global_step": 43144, "epoch": 1027} {"train_loss": -5.74037504196167, "global_step": 43145, "epoch": 1027} {"train_loss": -5.598994255065918, "global_step": 43146, "epoch": 1027} {"train_loss": -5.677907943725586, "global_step": 43147, "epoch": 1027} {"train_loss": -5.573991775512695, "global_step": 43148, "epoch": 1027} {"train_loss": -5.617278099060059, "global_step": 43149, "epoch": 1027} {"train_loss": -5.611576080322266, "global_step": 43150, "epoch": 1027} {"train_loss": -5.512076377868652, "global_step": 43151, "epoch": 1027} {"train_loss": -5.645652770996094, "global_step": 43152, "epoch": 1027} {"train_loss": -5.546051025390625, "global_step": 43153, "epoch": 1027} {"train_loss": -5.6437883377075195, "global_step": 43154, "epoch": 1027} {"train_loss": -5.672687530517578, "global_step": 43155, "epoch": 1027} {"train_loss": -5.653907775878906, "global_step": 43156, "epoch": 1027} {"train_loss": -5.6902971267700195, "global_step": 43157, "epoch": 1027} {"train_loss": -5.646262168884277, "global_step": 43158, "epoch": 1027} {"train_loss": -5.660138130187988, "global_step": 43159, "epoch": 1027} {"train_loss": -5.755345344543457, "global_step": 43160, "epoch": 1027} {"train_loss": -5.748190402984619, "global_step": 43161, "epoch": 1027} {"train_loss": -5.667452812194824, "global_step": 43162, "epoch": 1027} {"train_loss": -5.825796127319336, "global_step": 43163, "epoch": 1027} {"train_loss": -5.600498676300049, "global_step": 43164, "epoch": 1027} {"train_loss": -5.710807800292969, "global_step": 43165, "epoch": 1027} {"train_loss": -5.6891913414001465, "global_step": 43166, "epoch": 1027} {"train_loss": -5.598165512084961, "global_step": 43167, "epoch": 1027} {"train_loss": -5.805077075958252, "global_step": 43168, "epoch": 1027} {"train_loss": -5.67963981628418, "global_step": 43169, "epoch": 1027} {"train_loss": -5.51646614074707, "global_step": 43170, "epoch": 1027} {"train_loss": -5.660045623779297, "global_step": 43171, "epoch": 1027} {"train_loss": -5.790186882019043, "global_step": 43172, "epoch": 1027} {"train_loss": -5.540966033935547, "global_step": 43173, "epoch": 1027} {"train_loss": -5.640826225280762, "global_step": 43174, "epoch": 1027} {"train_loss": -5.655893234979539, "global_step": 43175, "epoch": 1027, "val_loss": 66400.5} {"train_loss": -5.616508483886719, "global_step": 43176, "epoch": 1028} {"train_loss": -5.7469329833984375, "global_step": 43177, "epoch": 1028} {"train_loss": -5.536243915557861, "global_step": 43178, "epoch": 1028} {"train_loss": -5.601531028747559, "global_step": 43179, "epoch": 1028} {"train_loss": -5.714378833770752, "global_step": 43180, "epoch": 1028} {"train_loss": -5.63607931137085, "global_step": 43181, "epoch": 1028} {"train_loss": -5.786057472229004, "global_step": 43182, "epoch": 1028} {"train_loss": -5.65672492980957, "global_step": 43183, "epoch": 1028} {"train_loss": -5.802031517028809, "global_step": 43184, "epoch": 1028} {"train_loss": -5.648329734802246, "global_step": 43185, "epoch": 1028} {"train_loss": -5.691288471221924, "global_step": 43186, "epoch": 1028} {"train_loss": -5.589200019836426, "global_step": 43187, "epoch": 1028} {"train_loss": -5.551720142364502, "global_step": 43188, "epoch": 1028} {"train_loss": -5.597182273864746, "global_step": 43189, "epoch": 1028} {"train_loss": -5.597143650054932, "global_step": 43190, "epoch": 1028} {"train_loss": -5.417293548583984, "global_step": 43191, "epoch": 1028} {"train_loss": -5.603274345397949, "global_step": 43192, "epoch": 1028} {"train_loss": -5.651483535766602, "global_step": 43193, "epoch": 1028} {"train_loss": -5.605088233947754, "global_step": 43194, "epoch": 1028} {"train_loss": -5.61033296585083, "global_step": 43195, "epoch": 1028} {"train_loss": -5.59604549407959, "global_step": 43196, "epoch": 1028} {"train_loss": -5.742586135864258, "global_step": 43197, "epoch": 1028} {"train_loss": -5.638587951660156, "global_step": 43198, "epoch": 1028} {"train_loss": -5.623440742492676, "global_step": 43199, "epoch": 1028} {"train_loss": -5.576064586639404, "global_step": 43200, "epoch": 1028} {"train_loss": -5.709842681884766, "global_step": 43201, "epoch": 1028} {"train_loss": -5.652836799621582, "global_step": 43202, "epoch": 1028} {"train_loss": -5.583175182342529, "global_step": 43203, "epoch": 1028} {"train_loss": -5.738293647766113, "global_step": 43204, "epoch": 1028} {"train_loss": -5.594179630279541, "global_step": 43205, "epoch": 1028} {"train_loss": -5.606827735900879, "global_step": 43206, "epoch": 1028} {"train_loss": -5.6399736404418945, "global_step": 43207, "epoch": 1028} {"train_loss": -5.676711082458496, "global_step": 43208, "epoch": 1028} {"train_loss": -5.74946403503418, "global_step": 43209, "epoch": 1028} {"train_loss": -5.65351676940918, "global_step": 43210, "epoch": 1028} {"train_loss": -5.6338677406311035, "global_step": 43211, "epoch": 1028} {"train_loss": -5.505331039428711, "global_step": 43212, "epoch": 1028} {"train_loss": -5.515368461608887, "global_step": 43213, "epoch": 1028} {"train_loss": -5.693942070007324, "global_step": 43214, "epoch": 1028} {"train_loss": -5.720211982727051, "global_step": 43215, "epoch": 1028} {"train_loss": -5.607496738433838, "global_step": 43216, "epoch": 1028} {"train_loss": -5.6371161597115655, "global_step": 43217, "epoch": 1028, "val_loss": 65843.75} {"train_loss": -5.718878746032715, "global_step": 43218, "epoch": 1029} {"train_loss": -5.574189186096191, "global_step": 43219, "epoch": 1029} {"train_loss": -5.642518997192383, "global_step": 43220, "epoch": 1029} {"train_loss": -5.798047065734863, "global_step": 43221, "epoch": 1029} {"train_loss": -5.688440799713135, "global_step": 43222, "epoch": 1029} {"train_loss": -5.663688659667969, "global_step": 43223, "epoch": 1029} {"train_loss": -5.583797454833984, "global_step": 43224, "epoch": 1029} {"train_loss": -5.5372772216796875, "global_step": 43225, "epoch": 1029} {"train_loss": -5.579655170440674, "global_step": 43226, "epoch": 1029} {"train_loss": -5.612802505493164, "global_step": 43227, "epoch": 1029} {"train_loss": -5.598971366882324, "global_step": 43228, "epoch": 1029} {"train_loss": -5.627021312713623, "global_step": 43229, "epoch": 1029} {"train_loss": -5.4498677253723145, "global_step": 43230, "epoch": 1029} {"train_loss": -5.619124412536621, "global_step": 43231, "epoch": 1029} {"train_loss": -5.696864604949951, "global_step": 43232, "epoch": 1029} {"train_loss": -5.591116905212402, "global_step": 43233, "epoch": 1029} {"train_loss": -5.647347450256348, "global_step": 43234, "epoch": 1029} {"train_loss": -5.724486351013184, "global_step": 43235, "epoch": 1029} {"train_loss": -5.729369163513184, "global_step": 43236, "epoch": 1029} {"train_loss": -5.579439163208008, "global_step": 43237, "epoch": 1029} {"train_loss": -5.540347099304199, "global_step": 43238, "epoch": 1029} {"train_loss": -5.668553352355957, "global_step": 43239, "epoch": 1029} {"train_loss": -5.7632527351379395, "global_step": 43240, "epoch": 1029} {"train_loss": -5.770430088043213, "global_step": 43241, "epoch": 1029} {"train_loss": -5.614404678344727, "global_step": 43242, "epoch": 1029} {"train_loss": -5.737071990966797, "global_step": 43243, "epoch": 1029} {"train_loss": -5.625331878662109, "global_step": 43244, "epoch": 1029} {"train_loss": -5.870163917541504, "global_step": 43245, "epoch": 1029} {"train_loss": -5.711582183837891, "global_step": 43246, "epoch": 1029} {"train_loss": -5.754193305969238, "global_step": 43247, "epoch": 1029} {"train_loss": -5.723135948181152, "global_step": 43248, "epoch": 1029} {"train_loss": -5.707571983337402, "global_step": 43249, "epoch": 1029} {"train_loss": -5.788487434387207, "global_step": 43250, "epoch": 1029} {"train_loss": -5.600238800048828, "global_step": 43251, "epoch": 1029} {"train_loss": -5.52275276184082, "global_step": 43252, "epoch": 1029} {"train_loss": -5.704775810241699, "global_step": 43253, "epoch": 1029} {"train_loss": -5.6257123947143555, "global_step": 43254, "epoch": 1029} {"train_loss": -5.7436652183532715, "global_step": 43255, "epoch": 1029} {"train_loss": -5.666826248168945, "global_step": 43256, "epoch": 1029} {"train_loss": -5.752297878265381, "global_step": 43257, "epoch": 1029} {"train_loss": -5.788646221160889, "global_step": 43258, "epoch": 1029} {"train_loss": -5.666376329603649, "global_step": 43259, "epoch": 1029, "val_loss": 65865.859375} {"train_loss": -5.8276686668396, "global_step": 43260, "epoch": 1030} {"train_loss": -5.587128162384033, "global_step": 43261, "epoch": 1030} {"train_loss": -5.801352500915527, "global_step": 43262, "epoch": 1030} {"train_loss": -5.679491996765137, "global_step": 43263, "epoch": 1030} {"train_loss": -5.685385704040527, "global_step": 43264, "epoch": 1030} {"train_loss": -5.753340721130371, "global_step": 43265, "epoch": 1030} {"train_loss": -5.5589599609375, "global_step": 43266, "epoch": 1030} {"train_loss": -5.57982873916626, "global_step": 43267, "epoch": 1030} {"train_loss": -5.661225318908691, "global_step": 43268, "epoch": 1030} {"train_loss": -5.667030334472656, "global_step": 43269, "epoch": 1030} {"train_loss": -5.730066776275635, "global_step": 43270, "epoch": 1030} {"train_loss": -5.608168601989746, "global_step": 43271, "epoch": 1030} {"train_loss": -5.7979960441589355, "global_step": 43272, "epoch": 1030} {"train_loss": -5.7217206954956055, "global_step": 43273, "epoch": 1030} {"train_loss": -5.531441688537598, "global_step": 43274, "epoch": 1030} {"train_loss": -5.569587707519531, "global_step": 43275, "epoch": 1030} {"train_loss": -5.500401020050049, "global_step": 43276, "epoch": 1030} {"train_loss": -5.6285400390625, "global_step": 43277, "epoch": 1030} {"train_loss": -5.696573257446289, "global_step": 43278, "epoch": 1030} {"train_loss": -5.589908599853516, "global_step": 43279, "epoch": 1030} {"train_loss": -5.713341236114502, "global_step": 43280, "epoch": 1030} {"train_loss": -5.662693977355957, "global_step": 43281, "epoch": 1030} {"train_loss": -5.627047538757324, "global_step": 43282, "epoch": 1030} {"train_loss": -5.7520246505737305, "global_step": 43283, "epoch": 1030} {"train_loss": -5.634311676025391, "global_step": 43284, "epoch": 1030} {"train_loss": -5.607251167297363, "global_step": 43285, "epoch": 1030} {"train_loss": -5.582221508026123, "global_step": 43286, "epoch": 1030} {"train_loss": -5.547454833984375, "global_step": 43287, "epoch": 1030} {"train_loss": -5.733072757720947, "global_step": 43288, "epoch": 1030} {"train_loss": -5.575126647949219, "global_step": 43289, "epoch": 1030} {"train_loss": -5.506560325622559, "global_step": 43290, "epoch": 1030} {"train_loss": -5.670591354370117, "global_step": 43291, "epoch": 1030} {"train_loss": -5.622979164123535, "global_step": 43292, "epoch": 1030} {"train_loss": -5.586133003234863, "global_step": 43293, "epoch": 1030} {"train_loss": -5.707256317138672, "global_step": 43294, "epoch": 1030} {"train_loss": -5.584998607635498, "global_step": 43295, "epoch": 1030} {"train_loss": -5.643853187561035, "global_step": 43296, "epoch": 1030} {"train_loss": -5.740732669830322, "global_step": 43297, "epoch": 1030} {"train_loss": -5.781815528869629, "global_step": 43298, "epoch": 1030} {"train_loss": -5.630331993103027, "global_step": 43299, "epoch": 1030} {"train_loss": -5.844876766204834, "global_step": 43300, "epoch": 1030} {"train_loss": -5.657722348258609, "global_step": 43301, "epoch": 1030, "val_loss": 66100.59375} {"train_loss": -5.630200386047363, "global_step": 43302, "epoch": 1031} {"train_loss": -5.59940242767334, "global_step": 43303, "epoch": 1031} {"train_loss": -5.776852607727051, "global_step": 43304, "epoch": 1031} {"train_loss": -5.829640865325928, "global_step": 43305, "epoch": 1031} {"train_loss": -5.522468566894531, "global_step": 43306, "epoch": 1031} {"train_loss": -5.6754326820373535, "global_step": 43307, "epoch": 1031} {"train_loss": -5.634860515594482, "global_step": 43308, "epoch": 1031} {"train_loss": -5.698568820953369, "global_step": 43309, "epoch": 1031} {"train_loss": -5.705679893493652, "global_step": 43310, "epoch": 1031} {"train_loss": -5.555668354034424, "global_step": 43311, "epoch": 1031} {"train_loss": -5.627081871032715, "global_step": 43312, "epoch": 1031} {"train_loss": -5.706308841705322, "global_step": 43313, "epoch": 1031} {"train_loss": -5.6278839111328125, "global_step": 43314, "epoch": 1031} {"train_loss": -5.669964790344238, "global_step": 43315, "epoch": 1031} {"train_loss": -5.781164169311523, "global_step": 43316, "epoch": 1031} {"train_loss": -5.711063385009766, "global_step": 43317, "epoch": 1031} {"train_loss": -5.709249496459961, "global_step": 43318, "epoch": 1031} {"train_loss": -5.690402030944824, "global_step": 43319, "epoch": 1031} {"train_loss": -5.655383586883545, "global_step": 43320, "epoch": 1031} {"train_loss": -5.730973720550537, "global_step": 43321, "epoch": 1031} {"train_loss": -5.698911190032959, "global_step": 43322, "epoch": 1031} {"train_loss": -5.654376029968262, "global_step": 43323, "epoch": 1031} {"train_loss": -5.846663475036621, "global_step": 43324, "epoch": 1031} {"train_loss": -5.771875381469727, "global_step": 43325, "epoch": 1031} {"train_loss": -5.7550249099731445, "global_step": 43326, "epoch": 1031} {"train_loss": -5.776895523071289, "global_step": 43327, "epoch": 1031} {"train_loss": -5.792251110076904, "global_step": 43328, "epoch": 1031} {"train_loss": -5.691699504852295, "global_step": 43329, "epoch": 1031} {"train_loss": -5.680843830108643, "global_step": 43330, "epoch": 1031} {"train_loss": -5.66019344329834, "global_step": 43331, "epoch": 1031} {"train_loss": -5.6508331298828125, "global_step": 43332, "epoch": 1031} {"train_loss": -5.738775253295898, "global_step": 43333, "epoch": 1031} {"train_loss": -5.679241180419922, "global_step": 43334, "epoch": 1031} {"train_loss": -5.666966438293457, "global_step": 43335, "epoch": 1031} {"train_loss": -5.6649274826049805, "global_step": 43336, "epoch": 1031} {"train_loss": -5.627240180969238, "global_step": 43337, "epoch": 1031} {"train_loss": -5.578657150268555, "global_step": 43338, "epoch": 1031} {"train_loss": -5.6823201179504395, "global_step": 43339, "epoch": 1031} {"train_loss": -5.761646270751953, "global_step": 43340, "epoch": 1031} {"train_loss": -5.546327590942383, "global_step": 43341, "epoch": 1031} {"train_loss": -5.571890830993652, "global_step": 43342, "epoch": 1031} {"train_loss": -5.684373923710415, "global_step": 43343, "epoch": 1031, "val_loss": 66055.53125} {"train_loss": -5.7469892501831055, "global_step": 43344, "epoch": 1032} {"train_loss": -5.704273223876953, "global_step": 43345, "epoch": 1032} {"train_loss": -5.5609307289123535, "global_step": 43346, "epoch": 1032} {"train_loss": -5.717578887939453, "global_step": 43347, "epoch": 1032} {"train_loss": -5.844714641571045, "global_step": 43348, "epoch": 1032} {"train_loss": -5.6764936447143555, "global_step": 43349, "epoch": 1032} {"train_loss": -5.739020824432373, "global_step": 43350, "epoch": 1032} {"train_loss": -5.60812520980835, "global_step": 43351, "epoch": 1032} {"train_loss": -5.639324188232422, "global_step": 43352, "epoch": 1032} {"train_loss": -5.7135467529296875, "global_step": 43353, "epoch": 1032} {"train_loss": -5.622479438781738, "global_step": 43354, "epoch": 1032} {"train_loss": -5.572265148162842, "global_step": 43355, "epoch": 1032} {"train_loss": -5.646522045135498, "global_step": 43356, "epoch": 1032} {"train_loss": -5.698348522186279, "global_step": 43357, "epoch": 1032} {"train_loss": -5.692144393920898, "global_step": 43358, "epoch": 1032} {"train_loss": -5.720574378967285, "global_step": 43359, "epoch": 1032} {"train_loss": -5.614383697509766, "global_step": 43360, "epoch": 1032} {"train_loss": -5.718031883239746, "global_step": 43361, "epoch": 1032} {"train_loss": -5.637185573577881, "global_step": 43362, "epoch": 1032} {"train_loss": -5.736407279968262, "global_step": 43363, "epoch": 1032} {"train_loss": -5.66111421585083, "global_step": 43364, "epoch": 1032} {"train_loss": -5.707244873046875, "global_step": 43365, "epoch": 1032} {"train_loss": -5.670163154602051, "global_step": 43366, "epoch": 1032} {"train_loss": -5.609652042388916, "global_step": 43367, "epoch": 1032} {"train_loss": -5.741596221923828, "global_step": 43368, "epoch": 1032} {"train_loss": -5.717761993408203, "global_step": 43369, "epoch": 1032} {"train_loss": -5.464990615844727, "global_step": 43370, "epoch": 1032} {"train_loss": -5.743206024169922, "global_step": 43371, "epoch": 1032} {"train_loss": -5.653658866882324, "global_step": 43372, "epoch": 1032} {"train_loss": -5.748720169067383, "global_step": 43373, "epoch": 1032} {"train_loss": -5.557831764221191, "global_step": 43374, "epoch": 1032} {"train_loss": -5.7412519454956055, "global_step": 43375, "epoch": 1032} {"train_loss": -5.837939262390137, "global_step": 43376, "epoch": 1032} {"train_loss": -5.593359470367432, "global_step": 43377, "epoch": 1032} {"train_loss": -5.648813724517822, "global_step": 43378, "epoch": 1032} {"train_loss": -5.738228797912598, "global_step": 43379, "epoch": 1032} {"train_loss": -5.743147850036621, "global_step": 43380, "epoch": 1032} {"train_loss": -5.5444722175598145, "global_step": 43381, "epoch": 1032} {"train_loss": -5.6400041580200195, "global_step": 43382, "epoch": 1032} {"train_loss": -5.679686546325684, "global_step": 43383, "epoch": 1032} {"train_loss": -5.514528751373291, "global_step": 43384, "epoch": 1032} {"train_loss": -5.672775824864705, "global_step": 43385, "epoch": 1032, "val_loss": 66418.921875} {"train_loss": -5.612509250640869, "global_step": 43386, "epoch": 1033} {"train_loss": -5.61959171295166, "global_step": 43387, "epoch": 1033} {"train_loss": -5.722134113311768, "global_step": 43388, "epoch": 1033} {"train_loss": -5.601795673370361, "global_step": 43389, "epoch": 1033} {"train_loss": -5.674768447875977, "global_step": 43390, "epoch": 1033} {"train_loss": -5.746598243713379, "global_step": 43391, "epoch": 1033} {"train_loss": -5.455214500427246, "global_step": 43392, "epoch": 1033} {"train_loss": -5.7057600021362305, "global_step": 43393, "epoch": 1033} {"train_loss": -5.549250602722168, "global_step": 43394, "epoch": 1033} {"train_loss": -5.626245498657227, "global_step": 43395, "epoch": 1033} {"train_loss": -5.659815788269043, "global_step": 43396, "epoch": 1033} {"train_loss": -5.512217998504639, "global_step": 43397, "epoch": 1033} {"train_loss": -5.679348468780518, "global_step": 43398, "epoch": 1033} {"train_loss": -5.598793029785156, "global_step": 43399, "epoch": 1033} {"train_loss": -5.661513328552246, "global_step": 43400, "epoch": 1033} {"train_loss": -5.67378044128418, "global_step": 43401, "epoch": 1033} {"train_loss": -5.632175922393799, "global_step": 43402, "epoch": 1033} {"train_loss": -5.551548480987549, "global_step": 43403, "epoch": 1033} {"train_loss": -5.595327854156494, "global_step": 43404, "epoch": 1033} {"train_loss": -5.518021583557129, "global_step": 43405, "epoch": 1033} {"train_loss": -5.7883453369140625, "global_step": 43406, "epoch": 1033} {"train_loss": -5.6373186111450195, "global_step": 43407, "epoch": 1033} {"train_loss": -5.6571197509765625, "global_step": 43408, "epoch": 1033} {"train_loss": -5.5550432205200195, "global_step": 43409, "epoch": 1033} {"train_loss": -5.733915328979492, "global_step": 43410, "epoch": 1033} {"train_loss": -5.660486698150635, "global_step": 43411, "epoch": 1033} {"train_loss": -5.581707000732422, "global_step": 43412, "epoch": 1033} {"train_loss": -5.663137435913086, "global_step": 43413, "epoch": 1033} {"train_loss": -5.672881126403809, "global_step": 43414, "epoch": 1033} {"train_loss": -5.748000621795654, "global_step": 43415, "epoch": 1033} {"train_loss": -5.7554216384887695, "global_step": 43416, "epoch": 1033} {"train_loss": -5.691080093383789, "global_step": 43417, "epoch": 1033} {"train_loss": -5.812413215637207, "global_step": 43418, "epoch": 1033} {"train_loss": -5.7015533447265625, "global_step": 43419, "epoch": 1033} {"train_loss": -5.701767921447754, "global_step": 43420, "epoch": 1033} {"train_loss": -5.777410507202148, "global_step": 43421, "epoch": 1033} {"train_loss": -5.690205097198486, "global_step": 43422, "epoch": 1033} {"train_loss": -5.543169975280762, "global_step": 43423, "epoch": 1033} {"train_loss": -5.662105560302734, "global_step": 43424, "epoch": 1033} {"train_loss": -5.520316123962402, "global_step": 43425, "epoch": 1033} {"train_loss": -5.542819976806641, "global_step": 43426, "epoch": 1033} {"train_loss": -5.65155241602943, "global_step": 43427, "epoch": 1033, "val_loss": 65793.015625} {"train_loss": -5.654184341430664, "global_step": 43428, "epoch": 1034} {"train_loss": -5.74207067489624, "global_step": 43429, "epoch": 1034} {"train_loss": -5.636752128601074, "global_step": 43430, "epoch": 1034} {"train_loss": -5.786089897155762, "global_step": 43431, "epoch": 1034} {"train_loss": -5.66798210144043, "global_step": 43432, "epoch": 1034} {"train_loss": -5.6462554931640625, "global_step": 43433, "epoch": 1034} {"train_loss": -5.670627593994141, "global_step": 43434, "epoch": 1034} {"train_loss": -5.682807445526123, "global_step": 43435, "epoch": 1034} {"train_loss": -5.632847785949707, "global_step": 43436, "epoch": 1034} {"train_loss": -5.803740501403809, "global_step": 43437, "epoch": 1034} {"train_loss": -5.6919965744018555, "global_step": 43438, "epoch": 1034} {"train_loss": -5.554101943969727, "global_step": 43439, "epoch": 1034} {"train_loss": -5.7065043449401855, "global_step": 43440, "epoch": 1034} {"train_loss": -5.835667610168457, "global_step": 43441, "epoch": 1034} {"train_loss": -5.606232643127441, "global_step": 43442, "epoch": 1034} {"train_loss": -5.566284656524658, "global_step": 43443, "epoch": 1034} {"train_loss": -5.620258331298828, "global_step": 43444, "epoch": 1034} {"train_loss": -5.7074995040893555, "global_step": 43445, "epoch": 1034} {"train_loss": -5.680560111999512, "global_step": 43446, "epoch": 1034} {"train_loss": -5.762113094329834, "global_step": 43447, "epoch": 1034} {"train_loss": -5.6146135330200195, "global_step": 43448, "epoch": 1034} {"train_loss": -5.695737838745117, "global_step": 43449, "epoch": 1034} {"train_loss": -5.59189510345459, "global_step": 43450, "epoch": 1034} {"train_loss": -5.535652160644531, "global_step": 43451, "epoch": 1034} {"train_loss": -5.781915664672852, "global_step": 43452, "epoch": 1034} {"train_loss": -5.623706817626953, "global_step": 43453, "epoch": 1034} {"train_loss": -5.628345489501953, "global_step": 43454, "epoch": 1034} {"train_loss": -5.679224967956543, "global_step": 43455, "epoch": 1034} {"train_loss": -5.674605369567871, "global_step": 43456, "epoch": 1034} {"train_loss": -5.655037879943848, "global_step": 43457, "epoch": 1034} {"train_loss": -5.435843467712402, "global_step": 43458, "epoch": 1034} {"train_loss": -5.700636386871338, "global_step": 43459, "epoch": 1034} {"train_loss": -5.728931427001953, "global_step": 43460, "epoch": 1034} {"train_loss": -5.611317157745361, "global_step": 43461, "epoch": 1034} {"train_loss": -5.673968315124512, "global_step": 43462, "epoch": 1034} {"train_loss": -5.680397033691406, "global_step": 43463, "epoch": 1034} {"train_loss": -5.66045618057251, "global_step": 43464, "epoch": 1034} {"train_loss": -5.678050994873047, "global_step": 43465, "epoch": 1034} {"train_loss": -5.496020317077637, "global_step": 43466, "epoch": 1034} {"train_loss": -5.618734836578369, "global_step": 43467, "epoch": 1034} {"train_loss": -5.612781524658203, "global_step": 43468, "epoch": 1034} {"train_loss": -5.662279060908726, "global_step": 43469, "epoch": 1034, "val_loss": 66194.4296875} {"train_loss": -5.7740631103515625, "global_step": 43470, "epoch": 1035} {"train_loss": -5.682404041290283, "global_step": 43471, "epoch": 1035} {"train_loss": -5.655302047729492, "global_step": 43472, "epoch": 1035} {"train_loss": -5.617135047912598, "global_step": 43473, "epoch": 1035} {"train_loss": -5.704665660858154, "global_step": 43474, "epoch": 1035} {"train_loss": -5.632297039031982, "global_step": 43475, "epoch": 1035} {"train_loss": -5.689831733703613, "global_step": 43476, "epoch": 1035} {"train_loss": -5.659520626068115, "global_step": 43477, "epoch": 1035} {"train_loss": -5.7205400466918945, "global_step": 43478, "epoch": 1035} {"train_loss": -5.822073936462402, "global_step": 43479, "epoch": 1035} {"train_loss": -5.638511657714844, "global_step": 43480, "epoch": 1035} {"train_loss": -5.675105094909668, "global_step": 43481, "epoch": 1035} {"train_loss": -5.627684593200684, "global_step": 43482, "epoch": 1035} {"train_loss": -5.724944114685059, "global_step": 43483, "epoch": 1035} {"train_loss": -5.692041397094727, "global_step": 43484, "epoch": 1035} {"train_loss": -5.535777568817139, "global_step": 43485, "epoch": 1035} {"train_loss": -5.650607109069824, "global_step": 43486, "epoch": 1035} {"train_loss": -5.671772003173828, "global_step": 43487, "epoch": 1035} {"train_loss": -5.671103477478027, "global_step": 43488, "epoch": 1035} {"train_loss": -5.71704626083374, "global_step": 43489, "epoch": 1035} {"train_loss": -5.679788589477539, "global_step": 43490, "epoch": 1035} {"train_loss": -5.643105983734131, "global_step": 43491, "epoch": 1035} {"train_loss": -5.747533321380615, "global_step": 43492, "epoch": 1035} {"train_loss": -5.6251983642578125, "global_step": 43493, "epoch": 1035} {"train_loss": -5.709587097167969, "global_step": 43494, "epoch": 1035} {"train_loss": -5.647329330444336, "global_step": 43495, "epoch": 1035} {"train_loss": -5.782361030578613, "global_step": 43496, "epoch": 1035} {"train_loss": -5.846440315246582, "global_step": 43497, "epoch": 1035} {"train_loss": -5.656233787536621, "global_step": 43498, "epoch": 1035} {"train_loss": -5.710970401763916, "global_step": 43499, "epoch": 1035} {"train_loss": -5.592555999755859, "global_step": 43500, "epoch": 1035} {"train_loss": -5.642327785491943, "global_step": 43501, "epoch": 1035} {"train_loss": -5.624240875244141, "global_step": 43502, "epoch": 1035} {"train_loss": -5.6206583976745605, "global_step": 43503, "epoch": 1035} {"train_loss": -5.763903617858887, "global_step": 43504, "epoch": 1035} {"train_loss": -5.604310989379883, "global_step": 43505, "epoch": 1035} {"train_loss": -5.48910665512085, "global_step": 43506, "epoch": 1035} {"train_loss": -5.656412124633789, "global_step": 43507, "epoch": 1035} {"train_loss": -5.656376361846924, "global_step": 43508, "epoch": 1035} {"train_loss": -5.506319522857666, "global_step": 43509, "epoch": 1035} {"train_loss": -5.462488174438477, "global_step": 43510, "epoch": 1035} {"train_loss": -5.663641225723993, "global_step": 43511, "epoch": 1035, "val_loss": 66226.46875} {"train_loss": -5.500618934631348, "global_step": 43512, "epoch": 1036} {"train_loss": -5.665151596069336, "global_step": 43513, "epoch": 1036} {"train_loss": -5.697109222412109, "global_step": 43514, "epoch": 1036} {"train_loss": -5.735605239868164, "global_step": 43515, "epoch": 1036} {"train_loss": -5.581610202789307, "global_step": 43516, "epoch": 1036} {"train_loss": -5.651721477508545, "global_step": 43517, "epoch": 1036} {"train_loss": -5.715620994567871, "global_step": 43518, "epoch": 1036} {"train_loss": -5.5891499519348145, "global_step": 43519, "epoch": 1036} {"train_loss": -5.586413383483887, "global_step": 43520, "epoch": 1036} {"train_loss": -5.735978126525879, "global_step": 43521, "epoch": 1036} {"train_loss": -5.706376075744629, "global_step": 43522, "epoch": 1036} {"train_loss": -5.662773132324219, "global_step": 43523, "epoch": 1036} {"train_loss": -5.7495880126953125, "global_step": 43524, "epoch": 1036} {"train_loss": -5.544827461242676, "global_step": 43525, "epoch": 1036} {"train_loss": -5.710797309875488, "global_step": 43526, "epoch": 1036} {"train_loss": -5.665153503417969, "global_step": 43527, "epoch": 1036} {"train_loss": -5.786497116088867, "global_step": 43528, "epoch": 1036} {"train_loss": -5.628657341003418, "global_step": 43529, "epoch": 1036} {"train_loss": -5.652441501617432, "global_step": 43530, "epoch": 1036} {"train_loss": -5.792993545532227, "global_step": 43531, "epoch": 1036} {"train_loss": -5.7527570724487305, "global_step": 43532, "epoch": 1036} {"train_loss": -5.736594200134277, "global_step": 43533, "epoch": 1036} {"train_loss": -5.692291259765625, "global_step": 43534, "epoch": 1036} {"train_loss": -5.623448371887207, "global_step": 43535, "epoch": 1036} {"train_loss": -5.758910179138184, "global_step": 43536, "epoch": 1036} {"train_loss": -5.591822624206543, "global_step": 43537, "epoch": 1036} {"train_loss": -5.672487735748291, "global_step": 43538, "epoch": 1036} {"train_loss": -5.686573028564453, "global_step": 43539, "epoch": 1036} {"train_loss": -5.8055644035339355, "global_step": 43540, "epoch": 1036} {"train_loss": -5.601040363311768, "global_step": 43541, "epoch": 1036} {"train_loss": -5.5201520919799805, "global_step": 43542, "epoch": 1036} {"train_loss": -5.6337738037109375, "global_step": 43543, "epoch": 1036} {"train_loss": -5.690396308898926, "global_step": 43544, "epoch": 1036} {"train_loss": -5.558716297149658, "global_step": 43545, "epoch": 1036} {"train_loss": -5.692351341247559, "global_step": 43546, "epoch": 1036} {"train_loss": -5.764164924621582, "global_step": 43547, "epoch": 1036} {"train_loss": -5.542536735534668, "global_step": 43548, "epoch": 1036} {"train_loss": -5.728606224060059, "global_step": 43549, "epoch": 1036} {"train_loss": -5.596860408782959, "global_step": 43550, "epoch": 1036} {"train_loss": -5.538564682006836, "global_step": 43551, "epoch": 1036} {"train_loss": -5.712002277374268, "global_step": 43552, "epoch": 1036} {"train_loss": -5.662712403706142, "global_step": 43553, "epoch": 1036, "val_loss": 66309.1875} {"train_loss": -5.697634696960449, "global_step": 43554, "epoch": 1037} {"train_loss": -5.756707191467285, "global_step": 43555, "epoch": 1037} {"train_loss": -5.51957893371582, "global_step": 43556, "epoch": 1037} {"train_loss": -5.544887065887451, "global_step": 43557, "epoch": 1037} {"train_loss": -5.610137939453125, "global_step": 43558, "epoch": 1037} {"train_loss": -5.577218055725098, "global_step": 43559, "epoch": 1037} {"train_loss": -5.790276050567627, "global_step": 43560, "epoch": 1037} {"train_loss": -5.472370147705078, "global_step": 43561, "epoch": 1037} {"train_loss": -5.6974592208862305, "global_step": 43562, "epoch": 1037} {"train_loss": -5.695598125457764, "global_step": 43563, "epoch": 1037} {"train_loss": -5.622344493865967, "global_step": 43564, "epoch": 1037} {"train_loss": -5.618340969085693, "global_step": 43565, "epoch": 1037} {"train_loss": -5.7278618812561035, "global_step": 43566, "epoch": 1037} {"train_loss": -5.638676643371582, "global_step": 43567, "epoch": 1037} {"train_loss": -5.695128440856934, "global_step": 43568, "epoch": 1037} {"train_loss": -5.678252220153809, "global_step": 43569, "epoch": 1037} {"train_loss": -5.62497615814209, "global_step": 43570, "epoch": 1037} {"train_loss": -5.694042205810547, "global_step": 43571, "epoch": 1037} {"train_loss": -5.65846061706543, "global_step": 43572, "epoch": 1037} {"train_loss": -5.725068092346191, "global_step": 43573, "epoch": 1037} {"train_loss": -5.613653659820557, "global_step": 43574, "epoch": 1037} {"train_loss": -5.640256881713867, "global_step": 43575, "epoch": 1037} {"train_loss": -5.746747970581055, "global_step": 43576, "epoch": 1037} {"train_loss": -5.737736701965332, "global_step": 43577, "epoch": 1037} {"train_loss": -5.777758598327637, "global_step": 43578, "epoch": 1037} {"train_loss": -5.605374813079834, "global_step": 43579, "epoch": 1037} {"train_loss": -5.688875675201416, "global_step": 43580, "epoch": 1037} {"train_loss": -5.6882123947143555, "global_step": 43581, "epoch": 1037} {"train_loss": -5.702308654785156, "global_step": 43582, "epoch": 1037} {"train_loss": -5.688667297363281, "global_step": 43583, "epoch": 1037} {"train_loss": -5.690497398376465, "global_step": 43584, "epoch": 1037} {"train_loss": -5.593790054321289, "global_step": 43585, "epoch": 1037} {"train_loss": -5.701826095581055, "global_step": 43586, "epoch": 1037} {"train_loss": -5.670350074768066, "global_step": 43587, "epoch": 1037} {"train_loss": -5.752530097961426, "global_step": 43588, "epoch": 1037} {"train_loss": -5.646581172943115, "global_step": 43589, "epoch": 1037} {"train_loss": -5.505987167358398, "global_step": 43590, "epoch": 1037} {"train_loss": -5.715580940246582, "global_step": 43591, "epoch": 1037} {"train_loss": -5.688220024108887, "global_step": 43592, "epoch": 1037} {"train_loss": -5.685096740722656, "global_step": 43593, "epoch": 1037} {"train_loss": -5.6916704177856445, "global_step": 43594, "epoch": 1037} {"train_loss": -5.66537880897522, "global_step": 43595, "epoch": 1037, "val_loss": 65772.734375} {"train_loss": -5.562039375305176, "global_step": 43596, "epoch": 1038} {"train_loss": -5.756804466247559, "global_step": 43597, "epoch": 1038} {"train_loss": -5.633532524108887, "global_step": 43598, "epoch": 1038} {"train_loss": -5.690511226654053, "global_step": 43599, "epoch": 1038} {"train_loss": -5.490484714508057, "global_step": 43600, "epoch": 1038} {"train_loss": -5.663675308227539, "global_step": 43601, "epoch": 1038} {"train_loss": -5.6711745262146, "global_step": 43602, "epoch": 1038} {"train_loss": -5.618727684020996, "global_step": 43603, "epoch": 1038} {"train_loss": -5.607813835144043, "global_step": 43604, "epoch": 1038} {"train_loss": -5.712401390075684, "global_step": 43605, "epoch": 1038} {"train_loss": -5.823888778686523, "global_step": 43606, "epoch": 1038} {"train_loss": -5.739920139312744, "global_step": 43607, "epoch": 1038} {"train_loss": -5.657420635223389, "global_step": 43608, "epoch": 1038} {"train_loss": -5.6521806716918945, "global_step": 43609, "epoch": 1038} {"train_loss": -5.603076934814453, "global_step": 43610, "epoch": 1038} {"train_loss": -5.749079704284668, "global_step": 43611, "epoch": 1038} {"train_loss": -5.684691429138184, "global_step": 43612, "epoch": 1038} {"train_loss": -5.733172416687012, "global_step": 43613, "epoch": 1038} {"train_loss": -5.7662672996521, "global_step": 43614, "epoch": 1038} {"train_loss": -5.6177191734313965, "global_step": 43615, "epoch": 1038} {"train_loss": -5.730473518371582, "global_step": 43616, "epoch": 1038} {"train_loss": -5.626033782958984, "global_step": 43617, "epoch": 1038} {"train_loss": -5.465320587158203, "global_step": 43618, "epoch": 1038} {"train_loss": -5.604769229888916, "global_step": 43619, "epoch": 1038} {"train_loss": -5.683794021606445, "global_step": 43620, "epoch": 1038} {"train_loss": -5.684337615966797, "global_step": 43621, "epoch": 1038} {"train_loss": -5.674652576446533, "global_step": 43622, "epoch": 1038} {"train_loss": -5.718985557556152, "global_step": 43623, "epoch": 1038} {"train_loss": -5.664412498474121, "global_step": 43624, "epoch": 1038} {"train_loss": -5.702802658081055, "global_step": 43625, "epoch": 1038} {"train_loss": -5.632138252258301, "global_step": 43626, "epoch": 1038} {"train_loss": -5.673879146575928, "global_step": 43627, "epoch": 1038} {"train_loss": -5.665865421295166, "global_step": 43628, "epoch": 1038} {"train_loss": -5.772040843963623, "global_step": 43629, "epoch": 1038} {"train_loss": -5.728821277618408, "global_step": 43630, "epoch": 1038} {"train_loss": -5.728476524353027, "global_step": 43631, "epoch": 1038} {"train_loss": -5.654299736022949, "global_step": 43632, "epoch": 1038} {"train_loss": -5.705879211425781, "global_step": 43633, "epoch": 1038} {"train_loss": -5.719472885131836, "global_step": 43634, "epoch": 1038} {"train_loss": -5.616855621337891, "global_step": 43635, "epoch": 1038} {"train_loss": -5.720492839813232, "global_step": 43636, "epoch": 1038} {"train_loss": -5.676000016076224, "global_step": 43637, "epoch": 1038, "val_loss": 66246.5859375} {"train_loss": -5.725022315979004, "global_step": 43638, "epoch": 1039} {"train_loss": -5.8102288246154785, "global_step": 43639, "epoch": 1039} {"train_loss": -5.672590255737305, "global_step": 43640, "epoch": 1039} {"train_loss": -5.8450164794921875, "global_step": 43641, "epoch": 1039} {"train_loss": -5.519800186157227, "global_step": 43642, "epoch": 1039} {"train_loss": -5.740433692932129, "global_step": 43643, "epoch": 1039} {"train_loss": -5.804541110992432, "global_step": 43644, "epoch": 1039} {"train_loss": -5.690375804901123, "global_step": 43645, "epoch": 1039} {"train_loss": -5.803894519805908, "global_step": 43646, "epoch": 1039} {"train_loss": -5.79428768157959, "global_step": 43647, "epoch": 1039} {"train_loss": -5.658836841583252, "global_step": 43648, "epoch": 1039} {"train_loss": -5.773674011230469, "global_step": 43649, "epoch": 1039} {"train_loss": -5.665104389190674, "global_step": 43650, "epoch": 1039} {"train_loss": -5.699710845947266, "global_step": 43651, "epoch": 1039} {"train_loss": -5.768239974975586, "global_step": 43652, "epoch": 1039} {"train_loss": -5.656362056732178, "global_step": 43653, "epoch": 1039} {"train_loss": -5.623500347137451, "global_step": 43654, "epoch": 1039} {"train_loss": -5.61843204498291, "global_step": 43655, "epoch": 1039} {"train_loss": -5.712366580963135, "global_step": 43656, "epoch": 1039} {"train_loss": -5.550523281097412, "global_step": 43657, "epoch": 1039} {"train_loss": -5.610527992248535, "global_step": 43658, "epoch": 1039} {"train_loss": -5.717291831970215, "global_step": 43659, "epoch": 1039} {"train_loss": -5.616072654724121, "global_step": 43660, "epoch": 1039} {"train_loss": -5.552883148193359, "global_step": 43661, "epoch": 1039} {"train_loss": -5.601691246032715, "global_step": 43662, "epoch": 1039} {"train_loss": -5.610727310180664, "global_step": 43663, "epoch": 1039} {"train_loss": -5.718345642089844, "global_step": 43664, "epoch": 1039} {"train_loss": -5.520735740661621, "global_step": 43665, "epoch": 1039} {"train_loss": -5.5922088623046875, "global_step": 43666, "epoch": 1039} {"train_loss": -5.670424938201904, "global_step": 43667, "epoch": 1039} {"train_loss": -5.638477325439453, "global_step": 43668, "epoch": 1039} {"train_loss": -5.723254203796387, "global_step": 43669, "epoch": 1039} {"train_loss": -5.657039642333984, "global_step": 43670, "epoch": 1039} {"train_loss": -5.547904014587402, "global_step": 43671, "epoch": 1039} {"train_loss": -5.6172285079956055, "global_step": 43672, "epoch": 1039} {"train_loss": -5.499377727508545, "global_step": 43673, "epoch": 1039} {"train_loss": -5.708161354064941, "global_step": 43674, "epoch": 1039} {"train_loss": -5.627469539642334, "global_step": 43675, "epoch": 1039} {"train_loss": -5.703026294708252, "global_step": 43676, "epoch": 1039} {"train_loss": -5.7229413986206055, "global_step": 43677, "epoch": 1039} {"train_loss": -5.585782051086426, "global_step": 43678, "epoch": 1039} {"train_loss": -5.667476086389451, "global_step": 43679, "epoch": 1039, "val_loss": 66059.1875} {"train_loss": -5.700962543487549, "global_step": 43680, "epoch": 1040} {"train_loss": -5.654277801513672, "global_step": 43681, "epoch": 1040} {"train_loss": -5.660429000854492, "global_step": 43682, "epoch": 1040} {"train_loss": -5.728860378265381, "global_step": 43683, "epoch": 1040} {"train_loss": -5.708666801452637, "global_step": 43684, "epoch": 1040} {"train_loss": -5.510622978210449, "global_step": 43685, "epoch": 1040} {"train_loss": -5.707361221313477, "global_step": 43686, "epoch": 1040} {"train_loss": -5.544841766357422, "global_step": 43687, "epoch": 1040} {"train_loss": -5.608453750610352, "global_step": 43688, "epoch": 1040} {"train_loss": -5.750306129455566, "global_step": 43689, "epoch": 1040} {"train_loss": -5.575522422790527, "global_step": 43690, "epoch": 1040} {"train_loss": -5.685177326202393, "global_step": 43691, "epoch": 1040} {"train_loss": -5.555501461029053, "global_step": 43692, "epoch": 1040} {"train_loss": -5.525699615478516, "global_step": 43693, "epoch": 1040} {"train_loss": -5.62320613861084, "global_step": 43694, "epoch": 1040} {"train_loss": -5.5110578536987305, "global_step": 43695, "epoch": 1040} {"train_loss": -5.695092678070068, "global_step": 43696, "epoch": 1040} {"train_loss": -5.705295085906982, "global_step": 43697, "epoch": 1040} {"train_loss": -5.622466087341309, "global_step": 43698, "epoch": 1040} {"train_loss": -5.729884147644043, "global_step": 43699, "epoch": 1040} {"train_loss": -5.408990859985352, "global_step": 43700, "epoch": 1040} {"train_loss": -5.608823776245117, "global_step": 43701, "epoch": 1040} {"train_loss": -5.763514518737793, "global_step": 43702, "epoch": 1040} {"train_loss": -5.7371368408203125, "global_step": 43703, "epoch": 1040} {"train_loss": -5.617746353149414, "global_step": 43704, "epoch": 1040} {"train_loss": -5.5981597900390625, "global_step": 43705, "epoch": 1040} {"train_loss": -5.70108699798584, "global_step": 43706, "epoch": 1040} {"train_loss": -5.711097717285156, "global_step": 43707, "epoch": 1040} {"train_loss": -5.683794021606445, "global_step": 43708, "epoch": 1040} {"train_loss": -5.533103942871094, "global_step": 43709, "epoch": 1040} {"train_loss": -5.706780910491943, "global_step": 43710, "epoch": 1040} {"train_loss": -5.637726783752441, "global_step": 43711, "epoch": 1040} {"train_loss": -5.6745195388793945, "global_step": 43712, "epoch": 1040} {"train_loss": -5.667975425720215, "global_step": 43713, "epoch": 1040} {"train_loss": -5.687549591064453, "global_step": 43714, "epoch": 1040} {"train_loss": -5.676536560058594, "global_step": 43715, "epoch": 1040} {"train_loss": -5.644407272338867, "global_step": 43716, "epoch": 1040} {"train_loss": -5.585515975952148, "global_step": 43717, "epoch": 1040} {"train_loss": -5.658325672149658, "global_step": 43718, "epoch": 1040} {"train_loss": -5.560616970062256, "global_step": 43719, "epoch": 1040} {"train_loss": -5.69047737121582, "global_step": 43720, "epoch": 1040} {"train_loss": -5.643266961688087, "global_step": 43721, "epoch": 1040, "val_loss": 66260.890625} {"train_loss": -5.677104473114014, "global_step": 43722, "epoch": 1041} {"train_loss": -5.693763256072998, "global_step": 43723, "epoch": 1041} {"train_loss": -5.6195173263549805, "global_step": 43724, "epoch": 1041} {"train_loss": -5.614333152770996, "global_step": 43725, "epoch": 1041} {"train_loss": -5.694988250732422, "global_step": 43726, "epoch": 1041} {"train_loss": -5.513786792755127, "global_step": 43727, "epoch": 1041} {"train_loss": -5.5742316246032715, "global_step": 43728, "epoch": 1041} {"train_loss": -5.58192253112793, "global_step": 43729, "epoch": 1041} {"train_loss": -5.79099702835083, "global_step": 43730, "epoch": 1041} {"train_loss": -5.4917683601379395, "global_step": 43731, "epoch": 1041} {"train_loss": -5.679345607757568, "global_step": 43732, "epoch": 1041} {"train_loss": -5.639978408813477, "global_step": 43733, "epoch": 1041} {"train_loss": -5.730084419250488, "global_step": 43734, "epoch": 1041} {"train_loss": -5.624893665313721, "global_step": 43735, "epoch": 1041} {"train_loss": -5.5728840827941895, "global_step": 43736, "epoch": 1041} {"train_loss": -5.765440940856934, "global_step": 43737, "epoch": 1041} {"train_loss": -5.693899154663086, "global_step": 43738, "epoch": 1041} {"train_loss": -5.708005905151367, "global_step": 43739, "epoch": 1041} {"train_loss": -5.557072162628174, "global_step": 43740, "epoch": 1041} {"train_loss": -5.588040351867676, "global_step": 43741, "epoch": 1041} {"train_loss": -5.661604404449463, "global_step": 43742, "epoch": 1041} {"train_loss": -5.5290727615356445, "global_step": 43743, "epoch": 1041} {"train_loss": -5.691542148590088, "global_step": 43744, "epoch": 1041} {"train_loss": -5.551629066467285, "global_step": 43745, "epoch": 1041} {"train_loss": -5.620669364929199, "global_step": 43746, "epoch": 1041} {"train_loss": -5.587487697601318, "global_step": 43747, "epoch": 1041} {"train_loss": -5.672855854034424, "global_step": 43748, "epoch": 1041} {"train_loss": -5.659523010253906, "global_step": 43749, "epoch": 1041} {"train_loss": -5.721129894256592, "global_step": 43750, "epoch": 1041} {"train_loss": -5.691402435302734, "global_step": 43751, "epoch": 1041} {"train_loss": -5.649791717529297, "global_step": 43752, "epoch": 1041} {"train_loss": -5.742715358734131, "global_step": 43753, "epoch": 1041} {"train_loss": -5.66117000579834, "global_step": 43754, "epoch": 1041} {"train_loss": -5.636238098144531, "global_step": 43755, "epoch": 1041} {"train_loss": -5.680301666259766, "global_step": 43756, "epoch": 1041} {"train_loss": -5.666512489318848, "global_step": 43757, "epoch": 1041} {"train_loss": -5.743898391723633, "global_step": 43758, "epoch": 1041} {"train_loss": -5.723557949066162, "global_step": 43759, "epoch": 1041} {"train_loss": -5.5692572593688965, "global_step": 43760, "epoch": 1041} {"train_loss": -5.649272918701172, "global_step": 43761, "epoch": 1041} {"train_loss": -5.65456485748291, "global_step": 43762, "epoch": 1041} {"train_loss": -5.65073375474839, "global_step": 43763, "epoch": 1041, "val_loss": 66615.1953125} {"train_loss": -5.576595306396484, "global_step": 43764, "epoch": 1042} {"train_loss": -5.613348007202148, "global_step": 43765, "epoch": 1042} {"train_loss": -5.577664375305176, "global_step": 43766, "epoch": 1042} {"train_loss": -5.80668830871582, "global_step": 43767, "epoch": 1042} {"train_loss": -5.583293437957764, "global_step": 43768, "epoch": 1042} {"train_loss": -5.818357467651367, "global_step": 43769, "epoch": 1042} {"train_loss": -5.691937446594238, "global_step": 43770, "epoch": 1042} {"train_loss": -5.6766767501831055, "global_step": 43771, "epoch": 1042} {"train_loss": -5.607314109802246, "global_step": 43772, "epoch": 1042} {"train_loss": -5.696767807006836, "global_step": 43773, "epoch": 1042} {"train_loss": -5.777234077453613, "global_step": 43774, "epoch": 1042} {"train_loss": -5.622044563293457, "global_step": 43775, "epoch": 1042} {"train_loss": -5.787784099578857, "global_step": 43776, "epoch": 1042} {"train_loss": -5.716203689575195, "global_step": 43777, "epoch": 1042} {"train_loss": -5.624817848205566, "global_step": 43778, "epoch": 1042} {"train_loss": -5.5304718017578125, "global_step": 43779, "epoch": 1042} {"train_loss": -5.62327766418457, "global_step": 43780, "epoch": 1042} {"train_loss": -5.720261573791504, "global_step": 43781, "epoch": 1042} {"train_loss": -5.6664838790893555, "global_step": 43782, "epoch": 1042} {"train_loss": -5.646308898925781, "global_step": 43783, "epoch": 1042} {"train_loss": -5.735279083251953, "global_step": 43784, "epoch": 1042} {"train_loss": -5.739128589630127, "global_step": 43785, "epoch": 1042} {"train_loss": -5.717442512512207, "global_step": 43786, "epoch": 1042} {"train_loss": -5.774168968200684, "global_step": 43787, "epoch": 1042} {"train_loss": -5.774190902709961, "global_step": 43788, "epoch": 1042} {"train_loss": -5.633886337280273, "global_step": 43789, "epoch": 1042} {"train_loss": -5.703153610229492, "global_step": 43790, "epoch": 1042} {"train_loss": -5.663083553314209, "global_step": 43791, "epoch": 1042} {"train_loss": -5.711645603179932, "global_step": 43792, "epoch": 1042} {"train_loss": -5.785836219787598, "global_step": 43793, "epoch": 1042} {"train_loss": -5.790163993835449, "global_step": 43794, "epoch": 1042} {"train_loss": -5.700634002685547, "global_step": 43795, "epoch": 1042} {"train_loss": -5.840205192565918, "global_step": 43796, "epoch": 1042} {"train_loss": -5.700100898742676, "global_step": 43797, "epoch": 1042} {"train_loss": -5.644737720489502, "global_step": 43798, "epoch": 1042} {"train_loss": -5.649887561798096, "global_step": 43799, "epoch": 1042} {"train_loss": -5.631518363952637, "global_step": 43800, "epoch": 1042} {"train_loss": -5.6546220779418945, "global_step": 43801, "epoch": 1042} {"train_loss": -5.6029863357543945, "global_step": 43802, "epoch": 1042} {"train_loss": -5.626167297363281, "global_step": 43803, "epoch": 1042} {"train_loss": -5.7052106857299805, "global_step": 43804, "epoch": 1042} {"train_loss": -5.6879136221749445, "global_step": 43805, "epoch": 1042, "val_loss": 66009.484375} {"train_loss": -5.6878509521484375, "global_step": 43806, "epoch": 1043} {"train_loss": -5.822734355926514, "global_step": 43807, "epoch": 1043} {"train_loss": -5.595889568328857, "global_step": 43808, "epoch": 1043} {"train_loss": -5.706647872924805, "global_step": 43809, "epoch": 1043} {"train_loss": -5.657456398010254, "global_step": 43810, "epoch": 1043} {"train_loss": -5.685671329498291, "global_step": 43811, "epoch": 1043} {"train_loss": -5.7104082107543945, "global_step": 43812, "epoch": 1043} {"train_loss": -5.644874572753906, "global_step": 43813, "epoch": 1043} {"train_loss": -5.854218006134033, "global_step": 43814, "epoch": 1043} {"train_loss": -5.568809509277344, "global_step": 43815, "epoch": 1043} {"train_loss": -5.603842735290527, "global_step": 43816, "epoch": 1043} {"train_loss": -5.694558143615723, "global_step": 43817, "epoch": 1043} {"train_loss": -5.517123222351074, "global_step": 43818, "epoch": 1043} {"train_loss": -5.674396991729736, "global_step": 43819, "epoch": 1043} {"train_loss": -5.681375503540039, "global_step": 43820, "epoch": 1043} {"train_loss": -5.639824867248535, "global_step": 43821, "epoch": 1043} {"train_loss": -5.682300090789795, "global_step": 43822, "epoch": 1043} {"train_loss": -5.635615825653076, "global_step": 43823, "epoch": 1043} {"train_loss": -5.608098030090332, "global_step": 43824, "epoch": 1043} {"train_loss": -5.598701000213623, "global_step": 43825, "epoch": 1043} {"train_loss": -5.594513893127441, "global_step": 43826, "epoch": 1043} {"train_loss": -5.654664039611816, "global_step": 43827, "epoch": 1043} {"train_loss": -5.503528118133545, "global_step": 43828, "epoch": 1043} {"train_loss": -5.5272111892700195, "global_step": 43829, "epoch": 1043} {"train_loss": -5.595964431762695, "global_step": 43830, "epoch": 1043} {"train_loss": -5.7332234382629395, "global_step": 43831, "epoch": 1043} {"train_loss": -5.592616558074951, "global_step": 43832, "epoch": 1043} {"train_loss": -5.705566883087158, "global_step": 43833, "epoch": 1043} {"train_loss": -5.7303643226623535, "global_step": 43834, "epoch": 1043} {"train_loss": -5.678230285644531, "global_step": 43835, "epoch": 1043} {"train_loss": -5.56252384185791, "global_step": 43836, "epoch": 1043} {"train_loss": -5.651436805725098, "global_step": 43837, "epoch": 1043} {"train_loss": -5.609601974487305, "global_step": 43838, "epoch": 1043} {"train_loss": -5.631391525268555, "global_step": 43839, "epoch": 1043} {"train_loss": -5.637335777282715, "global_step": 43840, "epoch": 1043} {"train_loss": -5.775940895080566, "global_step": 43841, "epoch": 1043} {"train_loss": -5.719832420349121, "global_step": 43842, "epoch": 1043} {"train_loss": -5.502820014953613, "global_step": 43843, "epoch": 1043} {"train_loss": -5.6987385749816895, "global_step": 43844, "epoch": 1043} {"train_loss": -5.688445568084717, "global_step": 43845, "epoch": 1043} {"train_loss": -5.710247993469238, "global_step": 43846, "epoch": 1043} {"train_loss": -5.654667309352329, "global_step": 43847, "epoch": 1043, "val_loss": 66455.59375} {"train_loss": -5.597535610198975, "global_step": 43848, "epoch": 1044} {"train_loss": -5.670186996459961, "global_step": 43849, "epoch": 1044} {"train_loss": -5.543539524078369, "global_step": 43850, "epoch": 1044} {"train_loss": -5.5952043533325195, "global_step": 43851, "epoch": 1044} {"train_loss": -5.547929286956787, "global_step": 43852, "epoch": 1044} {"train_loss": -5.71206521987915, "global_step": 43853, "epoch": 1044} {"train_loss": -5.588075160980225, "global_step": 43854, "epoch": 1044} {"train_loss": -5.6408305168151855, "global_step": 43855, "epoch": 1044} {"train_loss": -5.706131935119629, "global_step": 43856, "epoch": 1044} {"train_loss": -5.601290702819824, "global_step": 43857, "epoch": 1044} {"train_loss": -5.649796009063721, "global_step": 43858, "epoch": 1044} {"train_loss": -5.726963996887207, "global_step": 43859, "epoch": 1044} {"train_loss": -5.74688720703125, "global_step": 43860, "epoch": 1044} {"train_loss": -5.705876350402832, "global_step": 43861, "epoch": 1044} {"train_loss": -5.6580810546875, "global_step": 43862, "epoch": 1044} {"train_loss": -5.70443058013916, "global_step": 43863, "epoch": 1044} {"train_loss": -5.656847953796387, "global_step": 43864, "epoch": 1044} {"train_loss": -5.793292045593262, "global_step": 43865, "epoch": 1044} {"train_loss": -5.794382572174072, "global_step": 43866, "epoch": 1044} {"train_loss": -5.7020063400268555, "global_step": 43867, "epoch": 1044} {"train_loss": -5.745131015777588, "global_step": 43868, "epoch": 1044} {"train_loss": -5.6533660888671875, "global_step": 43869, "epoch": 1044} {"train_loss": -5.731561183929443, "global_step": 43870, "epoch": 1044} {"train_loss": -5.672615051269531, "global_step": 43871, "epoch": 1044} {"train_loss": -5.767529487609863, "global_step": 43872, "epoch": 1044} {"train_loss": -5.6802191734313965, "global_step": 43873, "epoch": 1044} {"train_loss": -5.790207386016846, "global_step": 43874, "epoch": 1044} {"train_loss": -5.755918502807617, "global_step": 43875, "epoch": 1044} {"train_loss": -5.687859535217285, "global_step": 43876, "epoch": 1044} {"train_loss": -5.682345390319824, "global_step": 43877, "epoch": 1044} {"train_loss": -5.700153827667236, "global_step": 43878, "epoch": 1044} {"train_loss": -5.669767379760742, "global_step": 43879, "epoch": 1044} {"train_loss": -5.645332336425781, "global_step": 43880, "epoch": 1044} {"train_loss": -5.461099147796631, "global_step": 43881, "epoch": 1044} {"train_loss": -5.589482307434082, "global_step": 43882, "epoch": 1044} {"train_loss": -5.747318267822266, "global_step": 43883, "epoch": 1044} {"train_loss": -5.689327716827393, "global_step": 43884, "epoch": 1044} {"train_loss": -5.716949939727783, "global_step": 43885, "epoch": 1044} {"train_loss": -5.749014854431152, "global_step": 43886, "epoch": 1044} {"train_loss": -5.643506050109863, "global_step": 43887, "epoch": 1044} {"train_loss": -5.719837665557861, "global_step": 43888, "epoch": 1044} {"train_loss": -5.676947207677932, "global_step": 43889, "epoch": 1044, "val_loss": 65902.984375} {"train_loss": -5.740217685699463, "global_step": 43890, "epoch": 1045} {"train_loss": -5.640702247619629, "global_step": 43891, "epoch": 1045} {"train_loss": -5.631422996520996, "global_step": 43892, "epoch": 1045} {"train_loss": -5.631691932678223, "global_step": 43893, "epoch": 1045} {"train_loss": -5.6870903968811035, "global_step": 43894, "epoch": 1045} {"train_loss": -5.725793361663818, "global_step": 43895, "epoch": 1045} {"train_loss": -5.648247718811035, "global_step": 43896, "epoch": 1045} {"train_loss": -5.588420867919922, "global_step": 43897, "epoch": 1045} {"train_loss": -5.745146751403809, "global_step": 43898, "epoch": 1045} {"train_loss": -5.604907989501953, "global_step": 43899, "epoch": 1045} {"train_loss": -5.884642601013184, "global_step": 43900, "epoch": 1045} {"train_loss": -5.532086372375488, "global_step": 43901, "epoch": 1045} {"train_loss": -5.66373348236084, "global_step": 43902, "epoch": 1045} {"train_loss": -5.620925426483154, "global_step": 43903, "epoch": 1045} {"train_loss": -5.6346540451049805, "global_step": 43904, "epoch": 1045} {"train_loss": -5.662445068359375, "global_step": 43905, "epoch": 1045} {"train_loss": -5.676156044006348, "global_step": 43906, "epoch": 1045} {"train_loss": -5.697867393493652, "global_step": 43907, "epoch": 1045} {"train_loss": -5.68210506439209, "global_step": 43908, "epoch": 1045} {"train_loss": -5.760052680969238, "global_step": 43909, "epoch": 1045} {"train_loss": -5.7000274658203125, "global_step": 43910, "epoch": 1045} {"train_loss": -5.714356422424316, "global_step": 43911, "epoch": 1045} {"train_loss": -5.736928939819336, "global_step": 43912, "epoch": 1045} {"train_loss": -5.751595973968506, "global_step": 43913, "epoch": 1045} {"train_loss": -5.712322235107422, "global_step": 43914, "epoch": 1045} {"train_loss": -5.785698890686035, "global_step": 43915, "epoch": 1045} {"train_loss": -5.689903736114502, "global_step": 43916, "epoch": 1045} {"train_loss": -5.696514129638672, "global_step": 43917, "epoch": 1045} {"train_loss": -5.566137790679932, "global_step": 43918, "epoch": 1045} {"train_loss": -5.663613319396973, "global_step": 43919, "epoch": 1045} {"train_loss": -5.7386016845703125, "global_step": 43920, "epoch": 1045} {"train_loss": -5.750028133392334, "global_step": 43921, "epoch": 1045} {"train_loss": -5.654271125793457, "global_step": 43922, "epoch": 1045} {"train_loss": -5.390172004699707, "global_step": 43923, "epoch": 1045} {"train_loss": -5.583676338195801, "global_step": 43924, "epoch": 1045} {"train_loss": -5.374510765075684, "global_step": 43925, "epoch": 1045} {"train_loss": -5.706375598907471, "global_step": 43926, "epoch": 1045} {"train_loss": -5.604287624359131, "global_step": 43927, "epoch": 1045} {"train_loss": -5.616273880004883, "global_step": 43928, "epoch": 1045} {"train_loss": -5.641041278839111, "global_step": 43929, "epoch": 1045} {"train_loss": -5.6600542068481445, "global_step": 43930, "epoch": 1045} {"train_loss": -5.661017372494652, "global_step": 43931, "epoch": 1045, "val_loss": 66362.34375} {"train_loss": -5.536770820617676, "global_step": 43932, "epoch": 1046} {"train_loss": -5.748658180236816, "global_step": 43933, "epoch": 1046} {"train_loss": -5.585941314697266, "global_step": 43934, "epoch": 1046} {"train_loss": -5.722747802734375, "global_step": 43935, "epoch": 1046} {"train_loss": -5.572064399719238, "global_step": 43936, "epoch": 1046} {"train_loss": -5.515741348266602, "global_step": 43937, "epoch": 1046} {"train_loss": -5.663812637329102, "global_step": 43938, "epoch": 1046} {"train_loss": -5.686784267425537, "global_step": 43939, "epoch": 1046} {"train_loss": -5.762036323547363, "global_step": 43940, "epoch": 1046} {"train_loss": -5.616130352020264, "global_step": 43941, "epoch": 1046} {"train_loss": -5.604494094848633, "global_step": 43942, "epoch": 1046} {"train_loss": -5.57933235168457, "global_step": 43943, "epoch": 1046} {"train_loss": -5.594667434692383, "global_step": 43944, "epoch": 1046} {"train_loss": -5.728372573852539, "global_step": 43945, "epoch": 1046} {"train_loss": -5.63700008392334, "global_step": 43946, "epoch": 1046} {"train_loss": -5.756241798400879, "global_step": 43947, "epoch": 1046} {"train_loss": -5.665790557861328, "global_step": 43948, "epoch": 1046} {"train_loss": -5.610332489013672, "global_step": 43949, "epoch": 1046} {"train_loss": -5.7345476150512695, "global_step": 43950, "epoch": 1046} {"train_loss": -5.666644096374512, "global_step": 43951, "epoch": 1046} {"train_loss": -5.63150691986084, "global_step": 43952, "epoch": 1046} {"train_loss": -5.773041248321533, "global_step": 43953, "epoch": 1046} {"train_loss": -5.567083358764648, "global_step": 43954, "epoch": 1046} {"train_loss": -5.60877799987793, "global_step": 43955, "epoch": 1046} {"train_loss": -5.820892333984375, "global_step": 43956, "epoch": 1046} {"train_loss": -5.709951400756836, "global_step": 43957, "epoch": 1046} {"train_loss": -5.561859130859375, "global_step": 43958, "epoch": 1046} {"train_loss": -5.7690629959106445, "global_step": 43959, "epoch": 1046} {"train_loss": -5.745211124420166, "global_step": 43960, "epoch": 1046} {"train_loss": -5.523882865905762, "global_step": 43961, "epoch": 1046} {"train_loss": -5.640940189361572, "global_step": 43962, "epoch": 1046} {"train_loss": -5.718347072601318, "global_step": 43963, "epoch": 1046} {"train_loss": -5.6883769035339355, "global_step": 43964, "epoch": 1046} {"train_loss": -5.740875244140625, "global_step": 43965, "epoch": 1046} {"train_loss": -5.604722023010254, "global_step": 43966, "epoch": 1046} {"train_loss": -5.624795913696289, "global_step": 43967, "epoch": 1046} {"train_loss": -5.539182662963867, "global_step": 43968, "epoch": 1046} {"train_loss": -5.580497741699219, "global_step": 43969, "epoch": 1046} {"train_loss": -5.632091999053955, "global_step": 43970, "epoch": 1046} {"train_loss": -5.666463851928711, "global_step": 43971, "epoch": 1046} {"train_loss": -5.576284408569336, "global_step": 43972, "epoch": 1046} {"train_loss": -5.652798391523815, "global_step": 43973, "epoch": 1046, "val_loss": 66101.0625} {"train_loss": -5.740898132324219, "global_step": 43974, "epoch": 1047} {"train_loss": -5.610753059387207, "global_step": 43975, "epoch": 1047} {"train_loss": -5.6467180252075195, "global_step": 43976, "epoch": 1047} {"train_loss": -5.611257553100586, "global_step": 43977, "epoch": 1047} {"train_loss": -5.579824447631836, "global_step": 43978, "epoch": 1047} {"train_loss": -5.853055000305176, "global_step": 43979, "epoch": 1047} {"train_loss": -5.6800031661987305, "global_step": 43980, "epoch": 1047} {"train_loss": -5.669442653656006, "global_step": 43981, "epoch": 1047} {"train_loss": -5.706348419189453, "global_step": 43982, "epoch": 1047} {"train_loss": -5.579229354858398, "global_step": 43983, "epoch": 1047} {"train_loss": -5.6623640060424805, "global_step": 43984, "epoch": 1047} {"train_loss": -5.654364585876465, "global_step": 43985, "epoch": 1047} {"train_loss": -5.758126735687256, "global_step": 43986, "epoch": 1047} {"train_loss": -5.70388126373291, "global_step": 43987, "epoch": 1047} {"train_loss": -5.727648735046387, "global_step": 43988, "epoch": 1047} {"train_loss": -5.674834251403809, "global_step": 43989, "epoch": 1047} {"train_loss": -5.760348796844482, "global_step": 43990, "epoch": 1047} {"train_loss": -5.732649803161621, "global_step": 43991, "epoch": 1047} {"train_loss": -5.789020538330078, "global_step": 43992, "epoch": 1047} {"train_loss": -5.673715591430664, "global_step": 43993, "epoch": 1047} {"train_loss": -5.813138961791992, "global_step": 43994, "epoch": 1047} {"train_loss": -5.565231800079346, "global_step": 43995, "epoch": 1047} {"train_loss": -5.570616722106934, "global_step": 43996, "epoch": 1047} {"train_loss": -5.627337455749512, "global_step": 43997, "epoch": 1047} {"train_loss": -5.665055274963379, "global_step": 43998, "epoch": 1047} {"train_loss": -5.726984024047852, "global_step": 43999, "epoch": 1047} {"train_loss": -5.758087158203125, "global_step": 44000, "epoch": 1047} {"train_loss": -5.706462860107422, "global_step": 44001, "epoch": 1047} {"train_loss": -5.766447067260742, "global_step": 44002, "epoch": 1047} {"train_loss": -5.772665977478027, "global_step": 44003, "epoch": 1047} {"train_loss": -5.741397857666016, "global_step": 44004, "epoch": 1047} {"train_loss": -5.66001558303833, "global_step": 44005, "epoch": 1047} {"train_loss": -5.653799057006836, "global_step": 44006, "epoch": 1047} {"train_loss": -5.6573710441589355, "global_step": 44007, "epoch": 1047} {"train_loss": -5.72158145904541, "global_step": 44008, "epoch": 1047} {"train_loss": -5.578691482543945, "global_step": 44009, "epoch": 1047} {"train_loss": -5.641702651977539, "global_step": 44010, "epoch": 1047} {"train_loss": -5.6703643798828125, "global_step": 44011, "epoch": 1047} {"train_loss": -5.698086738586426, "global_step": 44012, "epoch": 1047} {"train_loss": -5.594160556793213, "global_step": 44013, "epoch": 1047} {"train_loss": -5.64418888092041, "global_step": 44014, "epoch": 1047} {"train_loss": -5.681649957384382, "global_step": 44015, "epoch": 1047, "val_loss": 66396.875} {"train_loss": -5.617668151855469, "global_step": 44016, "epoch": 1048} {"train_loss": -5.511213302612305, "global_step": 44017, "epoch": 1048} {"train_loss": -5.644900321960449, "global_step": 44018, "epoch": 1048} {"train_loss": -5.635887145996094, "global_step": 44019, "epoch": 1048} {"train_loss": -5.672283172607422, "global_step": 44020, "epoch": 1048} {"train_loss": -5.6820220947265625, "global_step": 44021, "epoch": 1048} {"train_loss": -5.583817481994629, "global_step": 44022, "epoch": 1048} {"train_loss": -5.58383846282959, "global_step": 44023, "epoch": 1048} {"train_loss": -5.673521041870117, "global_step": 44024, "epoch": 1048} {"train_loss": -5.546881675720215, "global_step": 44025, "epoch": 1048} {"train_loss": -5.6921539306640625, "global_step": 44026, "epoch": 1048} {"train_loss": -5.729957103729248, "global_step": 44027, "epoch": 1048} {"train_loss": -5.672997951507568, "global_step": 44028, "epoch": 1048} {"train_loss": -5.649387836456299, "global_step": 44029, "epoch": 1048} {"train_loss": -5.617422580718994, "global_step": 44030, "epoch": 1048} {"train_loss": -5.735812664031982, "global_step": 44031, "epoch": 1048} {"train_loss": -5.7158050537109375, "global_step": 44032, "epoch": 1048} {"train_loss": -5.600523948669434, "global_step": 44033, "epoch": 1048} {"train_loss": -5.60715913772583, "global_step": 44034, "epoch": 1048} {"train_loss": -5.667017936706543, "global_step": 44035, "epoch": 1048} {"train_loss": -5.575416564941406, "global_step": 44036, "epoch": 1048} {"train_loss": -5.578058242797852, "global_step": 44037, "epoch": 1048} {"train_loss": -5.614417552947998, "global_step": 44038, "epoch": 1048} {"train_loss": -5.793784141540527, "global_step": 44039, "epoch": 1048} {"train_loss": -5.640345573425293, "global_step": 44040, "epoch": 1048} {"train_loss": -5.6803879737854, "global_step": 44041, "epoch": 1048} {"train_loss": -5.534456729888916, "global_step": 44042, "epoch": 1048} {"train_loss": -5.656902313232422, "global_step": 44043, "epoch": 1048} {"train_loss": -5.817388534545898, "global_step": 44044, "epoch": 1048} {"train_loss": -5.850557804107666, "global_step": 44045, "epoch": 1048} {"train_loss": -5.71144962310791, "global_step": 44046, "epoch": 1048} {"train_loss": -5.768985748291016, "global_step": 44047, "epoch": 1048} {"train_loss": -5.577587604522705, "global_step": 44048, "epoch": 1048} {"train_loss": -5.725861549377441, "global_step": 44049, "epoch": 1048} {"train_loss": -5.737404823303223, "global_step": 44050, "epoch": 1048} {"train_loss": -5.572504043579102, "global_step": 44051, "epoch": 1048} {"train_loss": -5.614343643188477, "global_step": 44052, "epoch": 1048} {"train_loss": -5.557428359985352, "global_step": 44053, "epoch": 1048} {"train_loss": -5.781364440917969, "global_step": 44054, "epoch": 1048} {"train_loss": -5.587569236755371, "global_step": 44055, "epoch": 1048} {"train_loss": -5.749310493469238, "global_step": 44056, "epoch": 1048} {"train_loss": -5.659008457547142, "global_step": 44057, "epoch": 1048, "val_loss": 66261.0390625} {"train_loss": -5.678884983062744, "global_step": 44058, "epoch": 1049} {"train_loss": -5.623349189758301, "global_step": 44059, "epoch": 1049} {"train_loss": -5.658957004547119, "global_step": 44060, "epoch": 1049} {"train_loss": -5.491575241088867, "global_step": 44061, "epoch": 1049} {"train_loss": -5.728243350982666, "global_step": 44062, "epoch": 1049} {"train_loss": -5.665772438049316, "global_step": 44063, "epoch": 1049} {"train_loss": -5.686276435852051, "global_step": 44064, "epoch": 1049} {"train_loss": -5.6046576499938965, "global_step": 44065, "epoch": 1049} {"train_loss": -5.662447452545166, "global_step": 44066, "epoch": 1049} {"train_loss": -5.600813865661621, "global_step": 44067, "epoch": 1049} {"train_loss": -5.551725387573242, "global_step": 44068, "epoch": 1049} {"train_loss": -5.739920616149902, "global_step": 44069, "epoch": 1049} {"train_loss": -5.628095626831055, "global_step": 44070, "epoch": 1049} {"train_loss": -5.6853532791137695, "global_step": 44071, "epoch": 1049} {"train_loss": -5.773316860198975, "global_step": 44072, "epoch": 1049} {"train_loss": -5.618453502655029, "global_step": 44073, "epoch": 1049} {"train_loss": -5.712947845458984, "global_step": 44074, "epoch": 1049} {"train_loss": -5.654973030090332, "global_step": 44075, "epoch": 1049} {"train_loss": -5.610849380493164, "global_step": 44076, "epoch": 1049} {"train_loss": -5.634218692779541, "global_step": 44077, "epoch": 1049} {"train_loss": -5.652052879333496, "global_step": 44078, "epoch": 1049} {"train_loss": -5.54079008102417, "global_step": 44079, "epoch": 1049} {"train_loss": -5.618901252746582, "global_step": 44080, "epoch": 1049} {"train_loss": -5.724853515625, "global_step": 44081, "epoch": 1049} {"train_loss": -5.707005500793457, "global_step": 44082, "epoch": 1049} {"train_loss": -5.630422115325928, "global_step": 44083, "epoch": 1049} {"train_loss": -5.73599100112915, "global_step": 44084, "epoch": 1049} {"train_loss": -5.622478485107422, "global_step": 44085, "epoch": 1049} {"train_loss": -5.732046127319336, "global_step": 44086, "epoch": 1049} {"train_loss": -5.71996545791626, "global_step": 44087, "epoch": 1049} {"train_loss": -5.723349571228027, "global_step": 44088, "epoch": 1049} {"train_loss": -5.814592361450195, "global_step": 44089, "epoch": 1049} {"train_loss": -5.742159843444824, "global_step": 44090, "epoch": 1049} {"train_loss": -5.545961856842041, "global_step": 44091, "epoch": 1049} {"train_loss": -5.679152965545654, "global_step": 44092, "epoch": 1049} {"train_loss": -5.6954345703125, "global_step": 44093, "epoch": 1049} {"train_loss": -5.79718017578125, "global_step": 44094, "epoch": 1049} {"train_loss": -5.763007164001465, "global_step": 44095, "epoch": 1049} {"train_loss": -5.681993007659912, "global_step": 44096, "epoch": 1049} {"train_loss": -5.631218433380127, "global_step": 44097, "epoch": 1049} {"train_loss": -5.642378330230713, "global_step": 44098, "epoch": 1049} {"train_loss": -5.6714330060141425, "global_step": 44099, "epoch": 1049, "val_loss": 66240.1328125} {"train_loss": -5.877213478088379, "global_step": 44100, "epoch": 1050} {"train_loss": -5.752189636230469, "global_step": 44101, "epoch": 1050} {"train_loss": -5.7334184646606445, "global_step": 44102, "epoch": 1050} {"train_loss": -5.760059356689453, "global_step": 44103, "epoch": 1050} {"train_loss": -5.877695560455322, "global_step": 44104, "epoch": 1050} {"train_loss": -5.700013160705566, "global_step": 44105, "epoch": 1050} {"train_loss": -5.733582019805908, "global_step": 44106, "epoch": 1050} {"train_loss": -5.68250846862793, "global_step": 44107, "epoch": 1050} {"train_loss": -5.673376083374023, "global_step": 44108, "epoch": 1050} {"train_loss": -5.705695152282715, "global_step": 44109, "epoch": 1050} {"train_loss": -5.720852851867676, "global_step": 44110, "epoch": 1050} {"train_loss": -5.7496747970581055, "global_step": 44111, "epoch": 1050} {"train_loss": -5.628864288330078, "global_step": 44112, "epoch": 1050} {"train_loss": -5.642917633056641, "global_step": 44113, "epoch": 1050} {"train_loss": -5.529110908508301, "global_step": 44114, "epoch": 1050} {"train_loss": -5.573996067047119, "global_step": 44115, "epoch": 1050} {"train_loss": -5.672387599945068, "global_step": 44116, "epoch": 1050} {"train_loss": -5.571262359619141, "global_step": 44117, "epoch": 1050} {"train_loss": -5.621451377868652, "global_step": 44118, "epoch": 1050} {"train_loss": -5.564756870269775, "global_step": 44119, "epoch": 1050} {"train_loss": -5.58814001083374, "global_step": 44120, "epoch": 1050} {"train_loss": -5.53885555267334, "global_step": 44121, "epoch": 1050} {"train_loss": -5.672609329223633, "global_step": 44122, "epoch": 1050} {"train_loss": -5.719642639160156, "global_step": 44123, "epoch": 1050} {"train_loss": -5.719306468963623, "global_step": 44124, "epoch": 1050} {"train_loss": -5.724597930908203, "global_step": 44125, "epoch": 1050} {"train_loss": -5.732416152954102, "global_step": 44126, "epoch": 1050} {"train_loss": -5.688058853149414, "global_step": 44127, "epoch": 1050} {"train_loss": -5.776496887207031, "global_step": 44128, "epoch": 1050} {"train_loss": -5.691120147705078, "global_step": 44129, "epoch": 1050} {"train_loss": -5.775128364562988, "global_step": 44130, "epoch": 1050} {"train_loss": -5.641822814941406, "global_step": 44131, "epoch": 1050} {"train_loss": -5.680981636047363, "global_step": 44132, "epoch": 1050} {"train_loss": -5.845054626464844, "global_step": 44133, "epoch": 1050} {"train_loss": -5.680934906005859, "global_step": 44134, "epoch": 1050} {"train_loss": -5.687459945678711, "global_step": 44135, "epoch": 1050} {"train_loss": -5.632226467132568, "global_step": 44136, "epoch": 1050} {"train_loss": -5.595900535583496, "global_step": 44137, "epoch": 1050} {"train_loss": -5.703963756561279, "global_step": 44138, "epoch": 1050} {"train_loss": -5.69378137588501, "global_step": 44139, "epoch": 1050} {"train_loss": -5.683383464813232, "global_step": 44140, "epoch": 1050} {"train_loss": -5.687536319096883, "global_step": 44141, "epoch": 1050, "train/sim_max_reward_0": 0.6788450708377006, "train/sim_max_reward_1": 0.1431846784830326, "train/sim_max_reward_2": 0.4350743410025218, "train/sim_max_reward_3": 0.17659087149945468, "train/sim_max_reward_4": 0.5585325562612522, "train/sim_max_reward_5": 0.8236945148026764, "test/sim_max_reward_4400000": 0.15445970394332162, "test/sim_max_reward_4400001": 0.35647557474911046, "test/sim_max_reward_4400002": 0.05643902194472198, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.21079189915040397, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.07877411151721417, "test/sim_max_reward_4400008": 0.5644918183116967, "test/sim_max_reward_4400009": 0.4135048710681539, "test/sim_max_reward_4400010": 0.25283903225415844, "test/sim_max_reward_4400011": 0.07394220976996922, "test/sim_max_reward_4400012": 0.2772852036006211, "test/sim_max_reward_4400013": 0.9117666221241001, "test/sim_max_reward_4400014": 0.2570526085005111, "test/sim_max_reward_4400015": 0.18869305402302353, "test/sim_max_reward_4400016": 0.06889110576219681, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.36706641247669697, "test/sim_max_reward_4400019": 0.17449500687856084, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5795113315517243, "test/sim_max_reward_4400022": 0.24277360074059093, "test/sim_max_reward_4400023": 0.08779411411690283, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.38006866212730483, "test/sim_max_reward_4400027": 0.07525635131594402, "test/sim_max_reward_4400028": 0.3032989978213586, "test/sim_max_reward_4400029": 0.07987556607830011, "test/sim_max_reward_4400030": 0.6174217361058877, "test/sim_max_reward_4400031": 0.43221754849213395, "test/sim_max_reward_4400032": 0.12448701641722072, "test/sim_max_reward_4400033": 0.17724182101083483, "test/sim_max_reward_4400034": 0.1538314032831831, "test/sim_max_reward_4400035": 0.5052279365242118, "test/sim_max_reward_4400036": 0.6309411136573848, "test/sim_max_reward_4400037": 0.30487812832608324, "test/sim_max_reward_4400038": 0.27686627902575245, "test/sim_max_reward_4400039": 0.6360132237834231, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9066227246193189, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.7979799294952133, "test/sim_max_reward_4400045": 0.23418164734627117, "test/sim_max_reward_4400046": 0.2984495419394041, "test/sim_max_reward_4400047": 0.6946269273775364, "test/sim_max_reward_4400048": 0.9166745623945234, "test/sim_max_reward_4400049": 0.6119330750770848, "train/mean_score": 0.46932033881443974, "test/mean_score": 0.2987665084937925, "val_loss": 66078.4453125} {"train_loss": -5.770079612731934, "global_step": 44142, "epoch": 1051} {"train_loss": -5.599189758300781, "global_step": 44143, "epoch": 1051} {"train_loss": -5.713659286499023, "global_step": 44144, "epoch": 1051} {"train_loss": -5.591950416564941, "global_step": 44145, "epoch": 1051} {"train_loss": -5.566190719604492, "global_step": 44146, "epoch": 1051} {"train_loss": -5.678689479827881, "global_step": 44147, "epoch": 1051} {"train_loss": -5.786218643188477, "global_step": 44148, "epoch": 1051} {"train_loss": -5.819540977478027, "global_step": 44149, "epoch": 1051} {"train_loss": -5.657740592956543, "global_step": 44150, "epoch": 1051} {"train_loss": -5.722955703735352, "global_step": 44151, "epoch": 1051} {"train_loss": -5.732036590576172, "global_step": 44152, "epoch": 1051} {"train_loss": -5.678962707519531, "global_step": 44153, "epoch": 1051} {"train_loss": -5.7191877365112305, "global_step": 44154, "epoch": 1051} {"train_loss": -5.561490058898926, "global_step": 44155, "epoch": 1051} {"train_loss": -5.793277740478516, "global_step": 44156, "epoch": 1051} {"train_loss": -5.685503005981445, "global_step": 44157, "epoch": 1051} {"train_loss": -5.7504682540893555, "global_step": 44158, "epoch": 1051} {"train_loss": -5.543603897094727, "global_step": 44159, "epoch": 1051} {"train_loss": -5.647385597229004, "global_step": 44160, "epoch": 1051} {"train_loss": -5.667868614196777, "global_step": 44161, "epoch": 1051} {"train_loss": -5.667407989501953, "global_step": 44162, "epoch": 1051} {"train_loss": -5.775577068328857, "global_step": 44163, "epoch": 1051} {"train_loss": -5.694782257080078, "global_step": 44164, "epoch": 1051} {"train_loss": -5.576201438903809, "global_step": 44165, "epoch": 1051} {"train_loss": -5.580462455749512, "global_step": 44166, "epoch": 1051} {"train_loss": -5.576214790344238, "global_step": 44167, "epoch": 1051} {"train_loss": -5.584880352020264, "global_step": 44168, "epoch": 1051} {"train_loss": -5.632395267486572, "global_step": 44169, "epoch": 1051} {"train_loss": -5.684321403503418, "global_step": 44170, "epoch": 1051} {"train_loss": -5.665327548980713, "global_step": 44171, "epoch": 1051} {"train_loss": -5.706456661224365, "global_step": 44172, "epoch": 1051} {"train_loss": -5.791860580444336, "global_step": 44173, "epoch": 1051} {"train_loss": -5.680041313171387, "global_step": 44174, "epoch": 1051} {"train_loss": -5.772269248962402, "global_step": 44175, "epoch": 1051} {"train_loss": -5.745151519775391, "global_step": 44176, "epoch": 1051} {"train_loss": -5.636676788330078, "global_step": 44177, "epoch": 1051} {"train_loss": -5.666519641876221, "global_step": 44178, "epoch": 1051} {"train_loss": -5.8157501220703125, "global_step": 44179, "epoch": 1051} {"train_loss": -5.645374298095703, "global_step": 44180, "epoch": 1051} {"train_loss": -5.75678825378418, "global_step": 44181, "epoch": 1051} {"train_loss": -5.734335422515869, "global_step": 44182, "epoch": 1051} {"train_loss": -5.683233806065151, "global_step": 44183, "epoch": 1051, "val_loss": 66174.5390625} {"train_loss": -5.688672065734863, "global_step": 44184, "epoch": 1052} {"train_loss": -5.845963478088379, "global_step": 44185, "epoch": 1052} {"train_loss": -5.687856674194336, "global_step": 44186, "epoch": 1052} {"train_loss": -5.552841663360596, "global_step": 44187, "epoch": 1052} {"train_loss": -5.647513389587402, "global_step": 44188, "epoch": 1052} {"train_loss": -5.754944324493408, "global_step": 44189, "epoch": 1052} {"train_loss": -5.699939727783203, "global_step": 44190, "epoch": 1052} {"train_loss": -5.608102321624756, "global_step": 44191, "epoch": 1052} {"train_loss": -5.761055946350098, "global_step": 44192, "epoch": 1052} {"train_loss": -5.66875696182251, "global_step": 44193, "epoch": 1052} {"train_loss": -5.665355205535889, "global_step": 44194, "epoch": 1052} {"train_loss": -5.690727233886719, "global_step": 44195, "epoch": 1052} {"train_loss": -5.593931674957275, "global_step": 44196, "epoch": 1052} {"train_loss": -5.670773506164551, "global_step": 44197, "epoch": 1052} {"train_loss": -5.6908674240112305, "global_step": 44198, "epoch": 1052} {"train_loss": -5.578608989715576, "global_step": 44199, "epoch": 1052} {"train_loss": -5.682132720947266, "global_step": 44200, "epoch": 1052} {"train_loss": -5.66923189163208, "global_step": 44201, "epoch": 1052} {"train_loss": -5.723601818084717, "global_step": 44202, "epoch": 1052} {"train_loss": -5.706487655639648, "global_step": 44203, "epoch": 1052} {"train_loss": -5.771420955657959, "global_step": 44204, "epoch": 1052} {"train_loss": -5.644744396209717, "global_step": 44205, "epoch": 1052} {"train_loss": -5.680293083190918, "global_step": 44206, "epoch": 1052} {"train_loss": -5.742218017578125, "global_step": 44207, "epoch": 1052} {"train_loss": -5.746898651123047, "global_step": 44208, "epoch": 1052} {"train_loss": -5.680942535400391, "global_step": 44209, "epoch": 1052} {"train_loss": -5.688469886779785, "global_step": 44210, "epoch": 1052} {"train_loss": -5.665985107421875, "global_step": 44211, "epoch": 1052} {"train_loss": -5.683795928955078, "global_step": 44212, "epoch": 1052} {"train_loss": -5.609265327453613, "global_step": 44213, "epoch": 1052} {"train_loss": -5.639451026916504, "global_step": 44214, "epoch": 1052} {"train_loss": -5.636374473571777, "global_step": 44215, "epoch": 1052} {"train_loss": -5.68668270111084, "global_step": 44216, "epoch": 1052} {"train_loss": -5.680864334106445, "global_step": 44217, "epoch": 1052} {"train_loss": -5.733125686645508, "global_step": 44218, "epoch": 1052} {"train_loss": -5.744623184204102, "global_step": 44219, "epoch": 1052} {"train_loss": -5.596411228179932, "global_step": 44220, "epoch": 1052} {"train_loss": -5.735904693603516, "global_step": 44221, "epoch": 1052} {"train_loss": -5.610431671142578, "global_step": 44222, "epoch": 1052} {"train_loss": -5.658185958862305, "global_step": 44223, "epoch": 1052} {"train_loss": -5.8360090255737305, "global_step": 44224, "epoch": 1052} {"train_loss": -5.686426015127273, "global_step": 44225, "epoch": 1052, "val_loss": 66012.2421875} {"train_loss": -5.7352375984191895, "global_step": 44226, "epoch": 1053} {"train_loss": -5.718796730041504, "global_step": 44227, "epoch": 1053} {"train_loss": -5.652460098266602, "global_step": 44228, "epoch": 1053} {"train_loss": -5.641110420227051, "global_step": 44229, "epoch": 1053} {"train_loss": -5.64954948425293, "global_step": 44230, "epoch": 1053} {"train_loss": -5.730502128601074, "global_step": 44231, "epoch": 1053} {"train_loss": -5.832262992858887, "global_step": 44232, "epoch": 1053} {"train_loss": -5.64605188369751, "global_step": 44233, "epoch": 1053} {"train_loss": -5.748438835144043, "global_step": 44234, "epoch": 1053} {"train_loss": -5.612536907196045, "global_step": 44235, "epoch": 1053} {"train_loss": -5.855885028839111, "global_step": 44236, "epoch": 1053} {"train_loss": -5.605042934417725, "global_step": 44237, "epoch": 1053} {"train_loss": -5.710611820220947, "global_step": 44238, "epoch": 1053} {"train_loss": -5.590804100036621, "global_step": 44239, "epoch": 1053} {"train_loss": -5.582518100738525, "global_step": 44240, "epoch": 1053} {"train_loss": -5.609697341918945, "global_step": 44241, "epoch": 1053} {"train_loss": -5.663141250610352, "global_step": 44242, "epoch": 1053} {"train_loss": -5.58992862701416, "global_step": 44243, "epoch": 1053} {"train_loss": -5.666041374206543, "global_step": 44244, "epoch": 1053} {"train_loss": -5.814746379852295, "global_step": 44245, "epoch": 1053} {"train_loss": -5.803777694702148, "global_step": 44246, "epoch": 1053} {"train_loss": -5.569025993347168, "global_step": 44247, "epoch": 1053} {"train_loss": -5.707760810852051, "global_step": 44248, "epoch": 1053} {"train_loss": -5.602146625518799, "global_step": 44249, "epoch": 1053} {"train_loss": -5.586185455322266, "global_step": 44250, "epoch": 1053} {"train_loss": -5.740937232971191, "global_step": 44251, "epoch": 1053} {"train_loss": -5.6348347663879395, "global_step": 44252, "epoch": 1053} {"train_loss": -5.557073593139648, "global_step": 44253, "epoch": 1053} {"train_loss": -5.530997276306152, "global_step": 44254, "epoch": 1053} {"train_loss": -5.70260763168335, "global_step": 44255, "epoch": 1053} {"train_loss": -5.576436996459961, "global_step": 44256, "epoch": 1053} {"train_loss": -5.5765790939331055, "global_step": 44257, "epoch": 1053} {"train_loss": -5.645610332489014, "global_step": 44258, "epoch": 1053} {"train_loss": -5.524000644683838, "global_step": 44259, "epoch": 1053} {"train_loss": -5.634799003601074, "global_step": 44260, "epoch": 1053} {"train_loss": -5.555298805236816, "global_step": 44261, "epoch": 1053} {"train_loss": -5.692867755889893, "global_step": 44262, "epoch": 1053} {"train_loss": -5.599151611328125, "global_step": 44263, "epoch": 1053} {"train_loss": -5.777444839477539, "global_step": 44264, "epoch": 1053} {"train_loss": -5.575368881225586, "global_step": 44265, "epoch": 1053} {"train_loss": -5.6798248291015625, "global_step": 44266, "epoch": 1053} {"train_loss": -5.656124137696766, "global_step": 44267, "epoch": 1053, "val_loss": 66044.2734375} {"train_loss": -5.7370781898498535, "global_step": 44268, "epoch": 1054} {"train_loss": -5.665065765380859, "global_step": 44269, "epoch": 1054} {"train_loss": -5.634891033172607, "global_step": 44270, "epoch": 1054} {"train_loss": -5.64198112487793, "global_step": 44271, "epoch": 1054} {"train_loss": -5.700838088989258, "global_step": 44272, "epoch": 1054} {"train_loss": -5.699970245361328, "global_step": 44273, "epoch": 1054} {"train_loss": -5.778711318969727, "global_step": 44274, "epoch": 1054} {"train_loss": -5.716136932373047, "global_step": 44275, "epoch": 1054} {"train_loss": -5.6421356201171875, "global_step": 44276, "epoch": 1054} {"train_loss": -5.666454315185547, "global_step": 44277, "epoch": 1054} {"train_loss": -5.825239658355713, "global_step": 44278, "epoch": 1054} {"train_loss": -5.608119964599609, "global_step": 44279, "epoch": 1054} {"train_loss": -5.758506774902344, "global_step": 44280, "epoch": 1054} {"train_loss": -5.656339645385742, "global_step": 44281, "epoch": 1054} {"train_loss": -5.8130269050598145, "global_step": 44282, "epoch": 1054} {"train_loss": -5.657313346862793, "global_step": 44283, "epoch": 1054} {"train_loss": -5.648194313049316, "global_step": 44284, "epoch": 1054} {"train_loss": -5.783570289611816, "global_step": 44285, "epoch": 1054} {"train_loss": -5.6852521896362305, "global_step": 44286, "epoch": 1054} {"train_loss": -5.667211532592773, "global_step": 44287, "epoch": 1054} {"train_loss": -5.536314964294434, "global_step": 44288, "epoch": 1054} {"train_loss": -5.612970352172852, "global_step": 44289, "epoch": 1054} {"train_loss": -5.809316635131836, "global_step": 44290, "epoch": 1054} {"train_loss": -5.7689409255981445, "global_step": 44291, "epoch": 1054} {"train_loss": -5.798583507537842, "global_step": 44292, "epoch": 1054} {"train_loss": -5.799846172332764, "global_step": 44293, "epoch": 1054} {"train_loss": -5.66339111328125, "global_step": 44294, "epoch": 1054} {"train_loss": -5.705689430236816, "global_step": 44295, "epoch": 1054} {"train_loss": -5.754745960235596, "global_step": 44296, "epoch": 1054} {"train_loss": -5.653740882873535, "global_step": 44297, "epoch": 1054} {"train_loss": -5.710911750793457, "global_step": 44298, "epoch": 1054} {"train_loss": -5.535819053649902, "global_step": 44299, "epoch": 1054} {"train_loss": -5.543848037719727, "global_step": 44300, "epoch": 1054} {"train_loss": -5.648149490356445, "global_step": 44301, "epoch": 1054} {"train_loss": -5.559366703033447, "global_step": 44302, "epoch": 1054} {"train_loss": -5.6706743240356445, "global_step": 44303, "epoch": 1054} {"train_loss": -5.601642608642578, "global_step": 44304, "epoch": 1054} {"train_loss": -5.692334175109863, "global_step": 44305, "epoch": 1054} {"train_loss": -5.756406784057617, "global_step": 44306, "epoch": 1054} {"train_loss": -5.792295455932617, "global_step": 44307, "epoch": 1054} {"train_loss": -5.572201728820801, "global_step": 44308, "epoch": 1054} {"train_loss": -5.689805178415208, "global_step": 44309, "epoch": 1054, "val_loss": 66263.078125} {"train_loss": -5.530884742736816, "global_step": 44310, "epoch": 1055} {"train_loss": -5.591401100158691, "global_step": 44311, "epoch": 1055} {"train_loss": -5.744077682495117, "global_step": 44312, "epoch": 1055} {"train_loss": -5.604720115661621, "global_step": 44313, "epoch": 1055} {"train_loss": -5.591756820678711, "global_step": 44314, "epoch": 1055} {"train_loss": -5.657177448272705, "global_step": 44315, "epoch": 1055} {"train_loss": -5.66837215423584, "global_step": 44316, "epoch": 1055} {"train_loss": -5.712854862213135, "global_step": 44317, "epoch": 1055} {"train_loss": -5.653912544250488, "global_step": 44318, "epoch": 1055} {"train_loss": -5.647983074188232, "global_step": 44319, "epoch": 1055} {"train_loss": -5.601370811462402, "global_step": 44320, "epoch": 1055} {"train_loss": -5.683640480041504, "global_step": 44321, "epoch": 1055} {"train_loss": -5.6776862144470215, "global_step": 44322, "epoch": 1055} {"train_loss": -5.79386043548584, "global_step": 44323, "epoch": 1055} {"train_loss": -5.52927827835083, "global_step": 44324, "epoch": 1055} {"train_loss": -5.681947708129883, "global_step": 44325, "epoch": 1055} {"train_loss": -5.616847991943359, "global_step": 44326, "epoch": 1055} {"train_loss": -5.7067108154296875, "global_step": 44327, "epoch": 1055} {"train_loss": -5.558840274810791, "global_step": 44328, "epoch": 1055} {"train_loss": -5.767931938171387, "global_step": 44329, "epoch": 1055} {"train_loss": -5.588179588317871, "global_step": 44330, "epoch": 1055} {"train_loss": -5.715635299682617, "global_step": 44331, "epoch": 1055} {"train_loss": -5.601583480834961, "global_step": 44332, "epoch": 1055} {"train_loss": -5.7216267585754395, "global_step": 44333, "epoch": 1055} {"train_loss": -5.667398452758789, "global_step": 44334, "epoch": 1055} {"train_loss": -5.731122970581055, "global_step": 44335, "epoch": 1055} {"train_loss": -5.679677486419678, "global_step": 44336, "epoch": 1055} {"train_loss": -5.621128559112549, "global_step": 44337, "epoch": 1055} {"train_loss": -5.588566780090332, "global_step": 44338, "epoch": 1055} {"train_loss": -5.747387409210205, "global_step": 44339, "epoch": 1055} {"train_loss": -5.618222236633301, "global_step": 44340, "epoch": 1055} {"train_loss": -5.746055603027344, "global_step": 44341, "epoch": 1055} {"train_loss": -5.626428604125977, "global_step": 44342, "epoch": 1055} {"train_loss": -5.733109951019287, "global_step": 44343, "epoch": 1055} {"train_loss": -5.695961952209473, "global_step": 44344, "epoch": 1055} {"train_loss": -5.672198295593262, "global_step": 44345, "epoch": 1055} {"train_loss": -5.677862167358398, "global_step": 44346, "epoch": 1055} {"train_loss": -5.5823893547058105, "global_step": 44347, "epoch": 1055} {"train_loss": -5.704442024230957, "global_step": 44348, "epoch": 1055} {"train_loss": -5.602981090545654, "global_step": 44349, "epoch": 1055} {"train_loss": -5.594036102294922, "global_step": 44350, "epoch": 1055} {"train_loss": -5.658665395918346, "global_step": 44351, "epoch": 1055, "val_loss": 66299.171875} {"train_loss": -5.614065647125244, "global_step": 44352, "epoch": 1056} {"train_loss": -5.71389102935791, "global_step": 44353, "epoch": 1056} {"train_loss": -5.562263011932373, "global_step": 44354, "epoch": 1056} {"train_loss": -5.599822998046875, "global_step": 44355, "epoch": 1056} {"train_loss": -5.688772201538086, "global_step": 44356, "epoch": 1056} {"train_loss": -5.607893466949463, "global_step": 44357, "epoch": 1056} {"train_loss": -5.692420959472656, "global_step": 44358, "epoch": 1056} {"train_loss": -5.7448530197143555, "global_step": 44359, "epoch": 1056} {"train_loss": -5.551536560058594, "global_step": 44360, "epoch": 1056} {"train_loss": -5.549345970153809, "global_step": 44361, "epoch": 1056} {"train_loss": -5.624659538269043, "global_step": 44362, "epoch": 1056} {"train_loss": -5.602017402648926, "global_step": 44363, "epoch": 1056} {"train_loss": -5.464648723602295, "global_step": 44364, "epoch": 1056} {"train_loss": -5.668784141540527, "global_step": 44365, "epoch": 1056} {"train_loss": -5.543392181396484, "global_step": 44366, "epoch": 1056} {"train_loss": -5.608823776245117, "global_step": 44367, "epoch": 1056} {"train_loss": -5.678840160369873, "global_step": 44368, "epoch": 1056} {"train_loss": -5.79368782043457, "global_step": 44369, "epoch": 1056} {"train_loss": -5.626928329467773, "global_step": 44370, "epoch": 1056} {"train_loss": -5.676353454589844, "global_step": 44371, "epoch": 1056} {"train_loss": -5.657309532165527, "global_step": 44372, "epoch": 1056} {"train_loss": -5.591045379638672, "global_step": 44373, "epoch": 1056} {"train_loss": -5.69937801361084, "global_step": 44374, "epoch": 1056} {"train_loss": -5.637962341308594, "global_step": 44375, "epoch": 1056} {"train_loss": -5.623830318450928, "global_step": 44376, "epoch": 1056} {"train_loss": -5.677586555480957, "global_step": 44377, "epoch": 1056} {"train_loss": -5.680774688720703, "global_step": 44378, "epoch": 1056} {"train_loss": -5.6549577713012695, "global_step": 44379, "epoch": 1056} {"train_loss": -5.794135093688965, "global_step": 44380, "epoch": 1056} {"train_loss": -5.618834018707275, "global_step": 44381, "epoch": 1056} {"train_loss": -5.771356582641602, "global_step": 44382, "epoch": 1056} {"train_loss": -5.82814884185791, "global_step": 44383, "epoch": 1056} {"train_loss": -5.710297107696533, "global_step": 44384, "epoch": 1056} {"train_loss": -5.695335388183594, "global_step": 44385, "epoch": 1056} {"train_loss": -5.520902633666992, "global_step": 44386, "epoch": 1056} {"train_loss": -5.674463272094727, "global_step": 44387, "epoch": 1056} {"train_loss": -5.643826007843018, "global_step": 44388, "epoch": 1056} {"train_loss": -5.69734001159668, "global_step": 44389, "epoch": 1056} {"train_loss": -5.6045989990234375, "global_step": 44390, "epoch": 1056} {"train_loss": -5.6550703048706055, "global_step": 44391, "epoch": 1056} {"train_loss": -5.699004173278809, "global_step": 44392, "epoch": 1056} {"train_loss": -5.650116034916469, "global_step": 44393, "epoch": 1056, "val_loss": 66095.453125} {"train_loss": -5.665821552276611, "global_step": 44394, "epoch": 1057} {"train_loss": -5.709448337554932, "global_step": 44395, "epoch": 1057} {"train_loss": -5.628496170043945, "global_step": 44396, "epoch": 1057} {"train_loss": -5.621401786804199, "global_step": 44397, "epoch": 1057} {"train_loss": -5.685528755187988, "global_step": 44398, "epoch": 1057} {"train_loss": -5.679865837097168, "global_step": 44399, "epoch": 1057} {"train_loss": -5.671200752258301, "global_step": 44400, "epoch": 1057} {"train_loss": -5.758389472961426, "global_step": 44401, "epoch": 1057} {"train_loss": -5.614273548126221, "global_step": 44402, "epoch": 1057} {"train_loss": -5.756796836853027, "global_step": 44403, "epoch": 1057} {"train_loss": -5.841228485107422, "global_step": 44404, "epoch": 1057} {"train_loss": -5.74722146987915, "global_step": 44405, "epoch": 1057} {"train_loss": -5.752339839935303, "global_step": 44406, "epoch": 1057} {"train_loss": -5.7397661209106445, "global_step": 44407, "epoch": 1057} {"train_loss": -5.7466607093811035, "global_step": 44408, "epoch": 1057} {"train_loss": -5.783476829528809, "global_step": 44409, "epoch": 1057} {"train_loss": -5.662443161010742, "global_step": 44410, "epoch": 1057} {"train_loss": -5.835646629333496, "global_step": 44411, "epoch": 1057} {"train_loss": -5.765764236450195, "global_step": 44412, "epoch": 1057} {"train_loss": -5.690986633300781, "global_step": 44413, "epoch": 1057} {"train_loss": -5.682251930236816, "global_step": 44414, "epoch": 1057} {"train_loss": -5.82042121887207, "global_step": 44415, "epoch": 1057} {"train_loss": -5.722289562225342, "global_step": 44416, "epoch": 1057} {"train_loss": -5.70346736907959, "global_step": 44417, "epoch": 1057} {"train_loss": -5.661253929138184, "global_step": 44418, "epoch": 1057} {"train_loss": -5.693291187286377, "global_step": 44419, "epoch": 1057} {"train_loss": -5.79477071762085, "global_step": 44420, "epoch": 1057} {"train_loss": -5.653780937194824, "global_step": 44421, "epoch": 1057} {"train_loss": -5.767886161804199, "global_step": 44422, "epoch": 1057} {"train_loss": -5.77405309677124, "global_step": 44423, "epoch": 1057} {"train_loss": -5.7068376541137695, "global_step": 44424, "epoch": 1057} {"train_loss": -5.656451225280762, "global_step": 44425, "epoch": 1057} {"train_loss": -5.692473888397217, "global_step": 44426, "epoch": 1057} {"train_loss": -5.577823162078857, "global_step": 44427, "epoch": 1057} {"train_loss": -5.785739421844482, "global_step": 44428, "epoch": 1057} {"train_loss": -5.6745405197143555, "global_step": 44429, "epoch": 1057} {"train_loss": -5.589138507843018, "global_step": 44430, "epoch": 1057} {"train_loss": -5.6350250244140625, "global_step": 44431, "epoch": 1057} {"train_loss": -5.661377906799316, "global_step": 44432, "epoch": 1057} {"train_loss": -5.737100601196289, "global_step": 44433, "epoch": 1057} {"train_loss": -5.555625915527344, "global_step": 44434, "epoch": 1057} {"train_loss": -5.699747721354167, "global_step": 44435, "epoch": 1057, "val_loss": 66101.921875} {"train_loss": -5.676465034484863, "global_step": 44436, "epoch": 1058} {"train_loss": -5.800393104553223, "global_step": 44437, "epoch": 1058} {"train_loss": -5.841271877288818, "global_step": 44438, "epoch": 1058} {"train_loss": -5.76603889465332, "global_step": 44439, "epoch": 1058} {"train_loss": -5.744790077209473, "global_step": 44440, "epoch": 1058} {"train_loss": -5.706164360046387, "global_step": 44441, "epoch": 1058} {"train_loss": -5.550046920776367, "global_step": 44442, "epoch": 1058} {"train_loss": -5.6904449462890625, "global_step": 44443, "epoch": 1058} {"train_loss": -5.573067665100098, "global_step": 44444, "epoch": 1058} {"train_loss": -5.630078315734863, "global_step": 44445, "epoch": 1058} {"train_loss": -5.622590065002441, "global_step": 44446, "epoch": 1058} {"train_loss": -5.763985633850098, "global_step": 44447, "epoch": 1058} {"train_loss": -5.758060455322266, "global_step": 44448, "epoch": 1058} {"train_loss": -5.810812950134277, "global_step": 44449, "epoch": 1058} {"train_loss": -5.682466506958008, "global_step": 44450, "epoch": 1058} {"train_loss": -5.736945152282715, "global_step": 44451, "epoch": 1058} {"train_loss": -5.744894981384277, "global_step": 44452, "epoch": 1058} {"train_loss": -5.806296348571777, "global_step": 44453, "epoch": 1058} {"train_loss": -5.709943771362305, "global_step": 44454, "epoch": 1058} {"train_loss": -5.69407844543457, "global_step": 44455, "epoch": 1058} {"train_loss": -5.786766052246094, "global_step": 44456, "epoch": 1058} {"train_loss": -5.607049942016602, "global_step": 44457, "epoch": 1058} {"train_loss": -5.700366020202637, "global_step": 44458, "epoch": 1058} {"train_loss": -5.607569694519043, "global_step": 44459, "epoch": 1058} {"train_loss": -5.585421085357666, "global_step": 44460, "epoch": 1058} {"train_loss": -5.627182960510254, "global_step": 44461, "epoch": 1058} {"train_loss": -5.733711242675781, "global_step": 44462, "epoch": 1058} {"train_loss": -5.73819637298584, "global_step": 44463, "epoch": 1058} {"train_loss": -5.601949691772461, "global_step": 44464, "epoch": 1058} {"train_loss": -5.742213726043701, "global_step": 44465, "epoch": 1058} {"train_loss": -5.658617973327637, "global_step": 44466, "epoch": 1058} {"train_loss": -5.652842998504639, "global_step": 44467, "epoch": 1058} {"train_loss": -5.826240539550781, "global_step": 44468, "epoch": 1058} {"train_loss": -5.694444179534912, "global_step": 44469, "epoch": 1058} {"train_loss": -5.597665309906006, "global_step": 44470, "epoch": 1058} {"train_loss": -5.697589874267578, "global_step": 44471, "epoch": 1058} {"train_loss": -5.636301040649414, "global_step": 44472, "epoch": 1058} {"train_loss": -5.609434127807617, "global_step": 44473, "epoch": 1058} {"train_loss": -5.732361793518066, "global_step": 44474, "epoch": 1058} {"train_loss": -5.708025932312012, "global_step": 44475, "epoch": 1058} {"train_loss": -5.590491771697998, "global_step": 44476, "epoch": 1058} {"train_loss": -5.6932505539485385, "global_step": 44477, "epoch": 1058, "val_loss": 66006.4765625} {"train_loss": -5.770923614501953, "global_step": 44478, "epoch": 1059} {"train_loss": -5.725069522857666, "global_step": 44479, "epoch": 1059} {"train_loss": -5.698369979858398, "global_step": 44480, "epoch": 1059} {"train_loss": -5.738142967224121, "global_step": 44481, "epoch": 1059} {"train_loss": -5.650382041931152, "global_step": 44482, "epoch": 1059} {"train_loss": -5.748935699462891, "global_step": 44483, "epoch": 1059} {"train_loss": -5.669829368591309, "global_step": 44484, "epoch": 1059} {"train_loss": -5.538172245025635, "global_step": 44485, "epoch": 1059} {"train_loss": -5.781857490539551, "global_step": 44486, "epoch": 1059} {"train_loss": -5.5243964195251465, "global_step": 44487, "epoch": 1059} {"train_loss": -5.585494041442871, "global_step": 44488, "epoch": 1059} {"train_loss": -5.647133827209473, "global_step": 44489, "epoch": 1059} {"train_loss": -5.561257839202881, "global_step": 44490, "epoch": 1059} {"train_loss": -5.621301174163818, "global_step": 44491, "epoch": 1059} {"train_loss": -5.628520488739014, "global_step": 44492, "epoch": 1059} {"train_loss": -5.60036039352417, "global_step": 44493, "epoch": 1059} {"train_loss": -5.671342372894287, "global_step": 44494, "epoch": 1059} {"train_loss": -5.613903999328613, "global_step": 44495, "epoch": 1059} {"train_loss": -5.565464019775391, "global_step": 44496, "epoch": 1059} {"train_loss": -5.670979022979736, "global_step": 44497, "epoch": 1059} {"train_loss": -5.643984794616699, "global_step": 44498, "epoch": 1059} {"train_loss": -5.702692985534668, "global_step": 44499, "epoch": 1059} {"train_loss": -5.698612213134766, "global_step": 44500, "epoch": 1059} {"train_loss": -5.627379417419434, "global_step": 44501, "epoch": 1059} {"train_loss": -5.645552635192871, "global_step": 44502, "epoch": 1059} {"train_loss": -5.7025957107543945, "global_step": 44503, "epoch": 1059} {"train_loss": -5.6908464431762695, "global_step": 44504, "epoch": 1059} {"train_loss": -5.685510635375977, "global_step": 44505, "epoch": 1059} {"train_loss": -5.729463577270508, "global_step": 44506, "epoch": 1059} {"train_loss": -5.669098854064941, "global_step": 44507, "epoch": 1059} {"train_loss": -5.724615097045898, "global_step": 44508, "epoch": 1059} {"train_loss": -5.660471439361572, "global_step": 44509, "epoch": 1059} {"train_loss": -5.642043113708496, "global_step": 44510, "epoch": 1059} {"train_loss": -5.677918910980225, "global_step": 44511, "epoch": 1059} {"train_loss": -5.708211898803711, "global_step": 44512, "epoch": 1059} {"train_loss": -5.677618503570557, "global_step": 44513, "epoch": 1059} {"train_loss": -5.735655307769775, "global_step": 44514, "epoch": 1059} {"train_loss": -5.734146595001221, "global_step": 44515, "epoch": 1059} {"train_loss": -5.720159530639648, "global_step": 44516, "epoch": 1059} {"train_loss": -5.725454330444336, "global_step": 44517, "epoch": 1059} {"train_loss": -5.667736053466797, "global_step": 44518, "epoch": 1059} {"train_loss": -5.670825890132359, "global_step": 44519, "epoch": 1059, "val_loss": 66431.1171875} {"train_loss": -5.6632843017578125, "global_step": 44520, "epoch": 1060} {"train_loss": -5.712342262268066, "global_step": 44521, "epoch": 1060} {"train_loss": -5.6145758628845215, "global_step": 44522, "epoch": 1060} {"train_loss": -5.7462921142578125, "global_step": 44523, "epoch": 1060} {"train_loss": -5.481110095977783, "global_step": 44524, "epoch": 1060} {"train_loss": -5.57330846786499, "global_step": 44525, "epoch": 1060} {"train_loss": -5.637282371520996, "global_step": 44526, "epoch": 1060} {"train_loss": -5.494383811950684, "global_step": 44527, "epoch": 1060} {"train_loss": -5.763489723205566, "global_step": 44528, "epoch": 1060} {"train_loss": -5.52871036529541, "global_step": 44529, "epoch": 1060} {"train_loss": -5.820961952209473, "global_step": 44530, "epoch": 1060} {"train_loss": -5.633334159851074, "global_step": 44531, "epoch": 1060} {"train_loss": -5.664324760437012, "global_step": 44532, "epoch": 1060} {"train_loss": -5.718051910400391, "global_step": 44533, "epoch": 1060} {"train_loss": -5.491952896118164, "global_step": 44534, "epoch": 1060} {"train_loss": -5.582065582275391, "global_step": 44535, "epoch": 1060} {"train_loss": -5.752150535583496, "global_step": 44536, "epoch": 1060} {"train_loss": -5.664009094238281, "global_step": 44537, "epoch": 1060} {"train_loss": -5.624638080596924, "global_step": 44538, "epoch": 1060} {"train_loss": -5.636028289794922, "global_step": 44539, "epoch": 1060} {"train_loss": -5.527875900268555, "global_step": 44540, "epoch": 1060} {"train_loss": -5.642396926879883, "global_step": 44541, "epoch": 1060} {"train_loss": -5.61207389831543, "global_step": 44542, "epoch": 1060} {"train_loss": -5.831688404083252, "global_step": 44543, "epoch": 1060} {"train_loss": -5.538943290710449, "global_step": 44544, "epoch": 1060} {"train_loss": -5.6352338790893555, "global_step": 44545, "epoch": 1060} {"train_loss": -5.772995471954346, "global_step": 44546, "epoch": 1060} {"train_loss": -5.598628997802734, "global_step": 44547, "epoch": 1060} {"train_loss": -5.642101287841797, "global_step": 44548, "epoch": 1060} {"train_loss": -5.5717267990112305, "global_step": 44549, "epoch": 1060} {"train_loss": -5.716730117797852, "global_step": 44550, "epoch": 1060} {"train_loss": -5.646665573120117, "global_step": 44551, "epoch": 1060} {"train_loss": -5.589716911315918, "global_step": 44552, "epoch": 1060} {"train_loss": -5.872694969177246, "global_step": 44553, "epoch": 1060} {"train_loss": -5.684439659118652, "global_step": 44554, "epoch": 1060} {"train_loss": -5.696786880493164, "global_step": 44555, "epoch": 1060} {"train_loss": -5.688149452209473, "global_step": 44556, "epoch": 1060} {"train_loss": -5.79627799987793, "global_step": 44557, "epoch": 1060} {"train_loss": -5.658602714538574, "global_step": 44558, "epoch": 1060} {"train_loss": -5.722633361816406, "global_step": 44559, "epoch": 1060} {"train_loss": -5.641397476196289, "global_step": 44560, "epoch": 1060} {"train_loss": -5.65600475810823, "global_step": 44561, "epoch": 1060, "val_loss": 66296.828125} {"train_loss": -5.773564338684082, "global_step": 44562, "epoch": 1061} {"train_loss": -5.62031888961792, "global_step": 44563, "epoch": 1061} {"train_loss": -5.724521636962891, "global_step": 44564, "epoch": 1061} {"train_loss": -5.68411111831665, "global_step": 44565, "epoch": 1061} {"train_loss": -5.7052154541015625, "global_step": 44566, "epoch": 1061} {"train_loss": -5.693784713745117, "global_step": 44567, "epoch": 1061} {"train_loss": -5.743345737457275, "global_step": 44568, "epoch": 1061} {"train_loss": -5.589727401733398, "global_step": 44569, "epoch": 1061} {"train_loss": -5.636259078979492, "global_step": 44570, "epoch": 1061} {"train_loss": -5.682604789733887, "global_step": 44571, "epoch": 1061} {"train_loss": -5.756561279296875, "global_step": 44572, "epoch": 1061} {"train_loss": -5.772621154785156, "global_step": 44573, "epoch": 1061} {"train_loss": -5.669231414794922, "global_step": 44574, "epoch": 1061} {"train_loss": -5.592247009277344, "global_step": 44575, "epoch": 1061} {"train_loss": -5.585440158843994, "global_step": 44576, "epoch": 1061} {"train_loss": -5.689399719238281, "global_step": 44577, "epoch": 1061} {"train_loss": -5.585229396820068, "global_step": 44578, "epoch": 1061} {"train_loss": -5.646782875061035, "global_step": 44579, "epoch": 1061} {"train_loss": -5.672275543212891, "global_step": 44580, "epoch": 1061} {"train_loss": -5.632842063903809, "global_step": 44581, "epoch": 1061} {"train_loss": -5.639243125915527, "global_step": 44582, "epoch": 1061} {"train_loss": -5.675692558288574, "global_step": 44583, "epoch": 1061} {"train_loss": -5.645150184631348, "global_step": 44584, "epoch": 1061} {"train_loss": -5.6956377029418945, "global_step": 44585, "epoch": 1061} {"train_loss": -5.696554183959961, "global_step": 44586, "epoch": 1061} {"train_loss": -5.617369651794434, "global_step": 44587, "epoch": 1061} {"train_loss": -5.690591812133789, "global_step": 44588, "epoch": 1061} {"train_loss": -5.677000045776367, "global_step": 44589, "epoch": 1061} {"train_loss": -5.6148271560668945, "global_step": 44590, "epoch": 1061} {"train_loss": -5.753952980041504, "global_step": 44591, "epoch": 1061} {"train_loss": -5.761780738830566, "global_step": 44592, "epoch": 1061} {"train_loss": -5.760834217071533, "global_step": 44593, "epoch": 1061} {"train_loss": -5.630031585693359, "global_step": 44594, "epoch": 1061} {"train_loss": -5.604628562927246, "global_step": 44595, "epoch": 1061} {"train_loss": -5.688090801239014, "global_step": 44596, "epoch": 1061} {"train_loss": -5.561720848083496, "global_step": 44597, "epoch": 1061} {"train_loss": -5.708278656005859, "global_step": 44598, "epoch": 1061} {"train_loss": -5.559623718261719, "global_step": 44599, "epoch": 1061} {"train_loss": -5.740331172943115, "global_step": 44600, "epoch": 1061} {"train_loss": -5.615464210510254, "global_step": 44601, "epoch": 1061} {"train_loss": -5.751341819763184, "global_step": 44602, "epoch": 1061} {"train_loss": -5.668543395541963, "global_step": 44603, "epoch": 1061, "val_loss": 66045.859375} {"train_loss": -5.578996658325195, "global_step": 44604, "epoch": 1062} {"train_loss": -5.704989433288574, "global_step": 44605, "epoch": 1062} {"train_loss": -5.655246734619141, "global_step": 44606, "epoch": 1062} {"train_loss": -5.6055145263671875, "global_step": 44607, "epoch": 1062} {"train_loss": -5.643420696258545, "global_step": 44608, "epoch": 1062} {"train_loss": -5.626197814941406, "global_step": 44609, "epoch": 1062} {"train_loss": -5.713638782501221, "global_step": 44610, "epoch": 1062} {"train_loss": -5.543652534484863, "global_step": 44611, "epoch": 1062} {"train_loss": -5.698873519897461, "global_step": 44612, "epoch": 1062} {"train_loss": -5.745354652404785, "global_step": 44613, "epoch": 1062} {"train_loss": -5.715673446655273, "global_step": 44614, "epoch": 1062} {"train_loss": -5.736437797546387, "global_step": 44615, "epoch": 1062} {"train_loss": -5.592146396636963, "global_step": 44616, "epoch": 1062} {"train_loss": -5.680726051330566, "global_step": 44617, "epoch": 1062} {"train_loss": -5.682803153991699, "global_step": 44618, "epoch": 1062} {"train_loss": -5.561745643615723, "global_step": 44619, "epoch": 1062} {"train_loss": -5.889220714569092, "global_step": 44620, "epoch": 1062} {"train_loss": -5.754451274871826, "global_step": 44621, "epoch": 1062} {"train_loss": -5.669472694396973, "global_step": 44622, "epoch": 1062} {"train_loss": -5.736522197723389, "global_step": 44623, "epoch": 1062} {"train_loss": -5.682187080383301, "global_step": 44624, "epoch": 1062} {"train_loss": -5.685929775238037, "global_step": 44625, "epoch": 1062} {"train_loss": -5.635917663574219, "global_step": 44626, "epoch": 1062} {"train_loss": -5.682100772857666, "global_step": 44627, "epoch": 1062} {"train_loss": -5.7001447677612305, "global_step": 44628, "epoch": 1062} {"train_loss": -5.4769487380981445, "global_step": 44629, "epoch": 1062} {"train_loss": -5.7680816650390625, "global_step": 44630, "epoch": 1062} {"train_loss": -5.691694736480713, "global_step": 44631, "epoch": 1062} {"train_loss": -5.7525634765625, "global_step": 44632, "epoch": 1062} {"train_loss": -5.606909275054932, "global_step": 44633, "epoch": 1062} {"train_loss": -5.7535576820373535, "global_step": 44634, "epoch": 1062} {"train_loss": -5.525012969970703, "global_step": 44635, "epoch": 1062} {"train_loss": -5.6297149658203125, "global_step": 44636, "epoch": 1062} {"train_loss": -5.531611919403076, "global_step": 44637, "epoch": 1062} {"train_loss": -5.71100378036499, "global_step": 44638, "epoch": 1062} {"train_loss": -5.498808860778809, "global_step": 44639, "epoch": 1062} {"train_loss": -5.719634056091309, "global_step": 44640, "epoch": 1062} {"train_loss": -5.652233123779297, "global_step": 44641, "epoch": 1062} {"train_loss": -5.698862552642822, "global_step": 44642, "epoch": 1062} {"train_loss": -5.614792823791504, "global_step": 44643, "epoch": 1062} {"train_loss": -5.589688301086426, "global_step": 44644, "epoch": 1062} {"train_loss": -5.662967261813936, "global_step": 44645, "epoch": 1062, "val_loss": 66449.2421875} {"train_loss": -5.7505645751953125, "global_step": 44646, "epoch": 1063} {"train_loss": -5.6313652992248535, "global_step": 44647, "epoch": 1063} {"train_loss": -5.620720863342285, "global_step": 44648, "epoch": 1063} {"train_loss": -5.558305740356445, "global_step": 44649, "epoch": 1063} {"train_loss": -5.711317539215088, "global_step": 44650, "epoch": 1063} {"train_loss": -5.6929612159729, "global_step": 44651, "epoch": 1063} {"train_loss": -5.6088361740112305, "global_step": 44652, "epoch": 1063} {"train_loss": -5.694852828979492, "global_step": 44653, "epoch": 1063} {"train_loss": -5.629955291748047, "global_step": 44654, "epoch": 1063} {"train_loss": -5.7279438972473145, "global_step": 44655, "epoch": 1063} {"train_loss": -5.671018600463867, "global_step": 44656, "epoch": 1063} {"train_loss": -5.685850143432617, "global_step": 44657, "epoch": 1063} {"train_loss": -5.824200630187988, "global_step": 44658, "epoch": 1063} {"train_loss": -5.796224594116211, "global_step": 44659, "epoch": 1063} {"train_loss": -5.549280166625977, "global_step": 44660, "epoch": 1063} {"train_loss": -5.631836891174316, "global_step": 44661, "epoch": 1063} {"train_loss": -5.702981948852539, "global_step": 44662, "epoch": 1063} {"train_loss": -5.501598358154297, "global_step": 44663, "epoch": 1063} {"train_loss": -5.677939414978027, "global_step": 44664, "epoch": 1063} {"train_loss": -5.683025360107422, "global_step": 44665, "epoch": 1063} {"train_loss": -5.653993606567383, "global_step": 44666, "epoch": 1063} {"train_loss": -5.764277458190918, "global_step": 44667, "epoch": 1063} {"train_loss": -5.759430885314941, "global_step": 44668, "epoch": 1063} {"train_loss": -5.791989326477051, "global_step": 44669, "epoch": 1063} {"train_loss": -5.597718238830566, "global_step": 44670, "epoch": 1063} {"train_loss": -5.696510314941406, "global_step": 44671, "epoch": 1063} {"train_loss": -5.6728363037109375, "global_step": 44672, "epoch": 1063} {"train_loss": -5.726095199584961, "global_step": 44673, "epoch": 1063} {"train_loss": -5.789096832275391, "global_step": 44674, "epoch": 1063} {"train_loss": -5.70920467376709, "global_step": 44675, "epoch": 1063} {"train_loss": -5.637493133544922, "global_step": 44676, "epoch": 1063} {"train_loss": -5.729698181152344, "global_step": 44677, "epoch": 1063} {"train_loss": -5.653406143188477, "global_step": 44678, "epoch": 1063} {"train_loss": -5.653491973876953, "global_step": 44679, "epoch": 1063} {"train_loss": -5.807209491729736, "global_step": 44680, "epoch": 1063} {"train_loss": -5.680319786071777, "global_step": 44681, "epoch": 1063} {"train_loss": -5.692925930023193, "global_step": 44682, "epoch": 1063} {"train_loss": -5.602286338806152, "global_step": 44683, "epoch": 1063} {"train_loss": -5.759340286254883, "global_step": 44684, "epoch": 1063} {"train_loss": -5.767581462860107, "global_step": 44685, "epoch": 1063} {"train_loss": -5.664752960205078, "global_step": 44686, "epoch": 1063} {"train_loss": -5.685726120358422, "global_step": 44687, "epoch": 1063, "val_loss": 65988.1484375} {"train_loss": -5.717410087585449, "global_step": 44688, "epoch": 1064} {"train_loss": -5.646407127380371, "global_step": 44689, "epoch": 1064} {"train_loss": -5.788827419281006, "global_step": 44690, "epoch": 1064} {"train_loss": -5.721794128417969, "global_step": 44691, "epoch": 1064} {"train_loss": -5.671074390411377, "global_step": 44692, "epoch": 1064} {"train_loss": -5.734254360198975, "global_step": 44693, "epoch": 1064} {"train_loss": -5.672901153564453, "global_step": 44694, "epoch": 1064} {"train_loss": -5.571224689483643, "global_step": 44695, "epoch": 1064} {"train_loss": -5.799097061157227, "global_step": 44696, "epoch": 1064} {"train_loss": -5.726119518280029, "global_step": 44697, "epoch": 1064} {"train_loss": -5.530679225921631, "global_step": 44698, "epoch": 1064} {"train_loss": -5.792941093444824, "global_step": 44699, "epoch": 1064} {"train_loss": -5.743888854980469, "global_step": 44700, "epoch": 1064} {"train_loss": -5.589690208435059, "global_step": 44701, "epoch": 1064} {"train_loss": -5.771227836608887, "global_step": 44702, "epoch": 1064} {"train_loss": -5.527707099914551, "global_step": 44703, "epoch": 1064} {"train_loss": -5.584084510803223, "global_step": 44704, "epoch": 1064} {"train_loss": -5.621509075164795, "global_step": 44705, "epoch": 1064} {"train_loss": -5.79033899307251, "global_step": 44706, "epoch": 1064} {"train_loss": -5.70571231842041, "global_step": 44707, "epoch": 1064} {"train_loss": -5.725927829742432, "global_step": 44708, "epoch": 1064} {"train_loss": -5.748342037200928, "global_step": 44709, "epoch": 1064} {"train_loss": -5.7622575759887695, "global_step": 44710, "epoch": 1064} {"train_loss": -5.64965295791626, "global_step": 44711, "epoch": 1064} {"train_loss": -5.768507957458496, "global_step": 44712, "epoch": 1064} {"train_loss": -5.664268970489502, "global_step": 44713, "epoch": 1064} {"train_loss": -5.7606635093688965, "global_step": 44714, "epoch": 1064} {"train_loss": -5.596678733825684, "global_step": 44715, "epoch": 1064} {"train_loss": -5.722393989562988, "global_step": 44716, "epoch": 1064} {"train_loss": -5.652103900909424, "global_step": 44717, "epoch": 1064} {"train_loss": -5.638385772705078, "global_step": 44718, "epoch": 1064} {"train_loss": -5.735063552856445, "global_step": 44719, "epoch": 1064} {"train_loss": -5.643669128417969, "global_step": 44720, "epoch": 1064} {"train_loss": -5.697265625, "global_step": 44721, "epoch": 1064} {"train_loss": -5.703275680541992, "global_step": 44722, "epoch": 1064} {"train_loss": -5.6876068115234375, "global_step": 44723, "epoch": 1064} {"train_loss": -5.7619099617004395, "global_step": 44724, "epoch": 1064} {"train_loss": -5.7709221839904785, "global_step": 44725, "epoch": 1064} {"train_loss": -5.687994956970215, "global_step": 44726, "epoch": 1064} {"train_loss": -5.601932048797607, "global_step": 44727, "epoch": 1064} {"train_loss": -5.706641674041748, "global_step": 44728, "epoch": 1064} {"train_loss": -5.6945770354498, "global_step": 44729, "epoch": 1064, "val_loss": 66288.359375} {"train_loss": -5.731228828430176, "global_step": 44730, "epoch": 1065} {"train_loss": -5.856374740600586, "global_step": 44731, "epoch": 1065} {"train_loss": -5.660641670227051, "global_step": 44732, "epoch": 1065} {"train_loss": -5.585429668426514, "global_step": 44733, "epoch": 1065} {"train_loss": -5.755189895629883, "global_step": 44734, "epoch": 1065} {"train_loss": -5.775676727294922, "global_step": 44735, "epoch": 1065} {"train_loss": -5.655459403991699, "global_step": 44736, "epoch": 1065} {"train_loss": -5.601846694946289, "global_step": 44737, "epoch": 1065} {"train_loss": -5.625670433044434, "global_step": 44738, "epoch": 1065} {"train_loss": -5.849782943725586, "global_step": 44739, "epoch": 1065} {"train_loss": -5.68205451965332, "global_step": 44740, "epoch": 1065} {"train_loss": -5.711373329162598, "global_step": 44741, "epoch": 1065} {"train_loss": -5.726966857910156, "global_step": 44742, "epoch": 1065} {"train_loss": -5.635201454162598, "global_step": 44743, "epoch": 1065} {"train_loss": -5.607275485992432, "global_step": 44744, "epoch": 1065} {"train_loss": -5.6973185539245605, "global_step": 44745, "epoch": 1065} {"train_loss": -5.637510299682617, "global_step": 44746, "epoch": 1065} {"train_loss": -5.60445499420166, "global_step": 44747, "epoch": 1065} {"train_loss": -5.636026382446289, "global_step": 44748, "epoch": 1065} {"train_loss": -5.625575065612793, "global_step": 44749, "epoch": 1065} {"train_loss": -5.824186325073242, "global_step": 44750, "epoch": 1065} {"train_loss": -5.639748573303223, "global_step": 44751, "epoch": 1065} {"train_loss": -5.662868499755859, "global_step": 44752, "epoch": 1065} {"train_loss": -5.797916412353516, "global_step": 44753, "epoch": 1065} {"train_loss": -5.75251579284668, "global_step": 44754, "epoch": 1065} {"train_loss": -5.634246826171875, "global_step": 44755, "epoch": 1065} {"train_loss": -5.611334323883057, "global_step": 44756, "epoch": 1065} {"train_loss": -5.651264667510986, "global_step": 44757, "epoch": 1065} {"train_loss": -5.62652587890625, "global_step": 44758, "epoch": 1065} {"train_loss": -5.669015884399414, "global_step": 44759, "epoch": 1065} {"train_loss": -5.831979751586914, "global_step": 44760, "epoch": 1065} {"train_loss": -5.655428886413574, "global_step": 44761, "epoch": 1065} {"train_loss": -5.53520393371582, "global_step": 44762, "epoch": 1065} {"train_loss": -5.605068206787109, "global_step": 44763, "epoch": 1065} {"train_loss": -5.618109226226807, "global_step": 44764, "epoch": 1065} {"train_loss": -5.586817264556885, "global_step": 44765, "epoch": 1065} {"train_loss": -5.605772018432617, "global_step": 44766, "epoch": 1065} {"train_loss": -5.661677837371826, "global_step": 44767, "epoch": 1065} {"train_loss": -5.656843185424805, "global_step": 44768, "epoch": 1065} {"train_loss": -5.680820465087891, "global_step": 44769, "epoch": 1065} {"train_loss": -5.813632965087891, "global_step": 44770, "epoch": 1065} {"train_loss": -5.675748450415475, "global_step": 44771, "epoch": 1065, "val_loss": 65982.1328125} {"train_loss": -5.631738185882568, "global_step": 44772, "epoch": 1066} {"train_loss": -5.690865516662598, "global_step": 44773, "epoch": 1066} {"train_loss": -5.738101482391357, "global_step": 44774, "epoch": 1066} {"train_loss": -5.754612922668457, "global_step": 44775, "epoch": 1066} {"train_loss": -5.791892051696777, "global_step": 44776, "epoch": 1066} {"train_loss": -5.699489593505859, "global_step": 44777, "epoch": 1066} {"train_loss": -5.7144622802734375, "global_step": 44778, "epoch": 1066} {"train_loss": -5.650172233581543, "global_step": 44779, "epoch": 1066} {"train_loss": -5.761344909667969, "global_step": 44780, "epoch": 1066} {"train_loss": -5.756266117095947, "global_step": 44781, "epoch": 1066} {"train_loss": -5.581885814666748, "global_step": 44782, "epoch": 1066} {"train_loss": -5.727771759033203, "global_step": 44783, "epoch": 1066} {"train_loss": -5.63227653503418, "global_step": 44784, "epoch": 1066} {"train_loss": -5.7222137451171875, "global_step": 44785, "epoch": 1066} {"train_loss": -5.681550979614258, "global_step": 44786, "epoch": 1066} {"train_loss": -5.518796920776367, "global_step": 44787, "epoch": 1066} {"train_loss": -5.7411322593688965, "global_step": 44788, "epoch": 1066} {"train_loss": -5.616002082824707, "global_step": 44789, "epoch": 1066} {"train_loss": -5.681107521057129, "global_step": 44790, "epoch": 1066} {"train_loss": -5.688458442687988, "global_step": 44791, "epoch": 1066} {"train_loss": -5.538020610809326, "global_step": 44792, "epoch": 1066} {"train_loss": -5.679994583129883, "global_step": 44793, "epoch": 1066} {"train_loss": -5.628740310668945, "global_step": 44794, "epoch": 1066} {"train_loss": -5.6469926834106445, "global_step": 44795, "epoch": 1066} {"train_loss": -5.62534236907959, "global_step": 44796, "epoch": 1066} {"train_loss": -5.631633758544922, "global_step": 44797, "epoch": 1066} {"train_loss": -5.705766677856445, "global_step": 44798, "epoch": 1066} {"train_loss": -5.727128028869629, "global_step": 44799, "epoch": 1066} {"train_loss": -5.696081161499023, "global_step": 44800, "epoch": 1066} {"train_loss": -5.706016540527344, "global_step": 44801, "epoch": 1066} {"train_loss": -5.659882068634033, "global_step": 44802, "epoch": 1066} {"train_loss": -5.667464256286621, "global_step": 44803, "epoch": 1066} {"train_loss": -5.717615604400635, "global_step": 44804, "epoch": 1066} {"train_loss": -5.767433166503906, "global_step": 44805, "epoch": 1066} {"train_loss": -5.695930004119873, "global_step": 44806, "epoch": 1066} {"train_loss": -5.647890090942383, "global_step": 44807, "epoch": 1066} {"train_loss": -5.7833099365234375, "global_step": 44808, "epoch": 1066} {"train_loss": -5.657256126403809, "global_step": 44809, "epoch": 1066} {"train_loss": -5.833629608154297, "global_step": 44810, "epoch": 1066} {"train_loss": -5.671135902404785, "global_step": 44811, "epoch": 1066} {"train_loss": -5.657736301422119, "global_step": 44812, "epoch": 1066} {"train_loss": -5.683488085156395, "global_step": 44813, "epoch": 1066, "val_loss": 66609.421875} {"train_loss": -5.584717750549316, "global_step": 44814, "epoch": 1067} {"train_loss": -5.757306098937988, "global_step": 44815, "epoch": 1067} {"train_loss": -5.6585845947265625, "global_step": 44816, "epoch": 1067} {"train_loss": -5.664000511169434, "global_step": 44817, "epoch": 1067} {"train_loss": -5.728937149047852, "global_step": 44818, "epoch": 1067} {"train_loss": -5.667946815490723, "global_step": 44819, "epoch": 1067} {"train_loss": -5.798873424530029, "global_step": 44820, "epoch": 1067} {"train_loss": -5.686868667602539, "global_step": 44821, "epoch": 1067} {"train_loss": -5.812556266784668, "global_step": 44822, "epoch": 1067} {"train_loss": -5.577036380767822, "global_step": 44823, "epoch": 1067} {"train_loss": -5.564725875854492, "global_step": 44824, "epoch": 1067} {"train_loss": -5.791845321655273, "global_step": 44825, "epoch": 1067} {"train_loss": -5.876012802124023, "global_step": 44826, "epoch": 1067} {"train_loss": -5.7596917152404785, "global_step": 44827, "epoch": 1067} {"train_loss": -5.755790710449219, "global_step": 44828, "epoch": 1067} {"train_loss": -5.735036849975586, "global_step": 44829, "epoch": 1067} {"train_loss": -5.6064653396606445, "global_step": 44830, "epoch": 1067} {"train_loss": -5.734328269958496, "global_step": 44831, "epoch": 1067} {"train_loss": -5.709316253662109, "global_step": 44832, "epoch": 1067} {"train_loss": -5.784035682678223, "global_step": 44833, "epoch": 1067} {"train_loss": -5.670212745666504, "global_step": 44834, "epoch": 1067} {"train_loss": -5.820313453674316, "global_step": 44835, "epoch": 1067} {"train_loss": -5.62611198425293, "global_step": 44836, "epoch": 1067} {"train_loss": -5.63327693939209, "global_step": 44837, "epoch": 1067} {"train_loss": -5.713920593261719, "global_step": 44838, "epoch": 1067} {"train_loss": -5.609101295471191, "global_step": 44839, "epoch": 1067} {"train_loss": -5.626834392547607, "global_step": 44840, "epoch": 1067} {"train_loss": -5.720820426940918, "global_step": 44841, "epoch": 1067} {"train_loss": -5.574306488037109, "global_step": 44842, "epoch": 1067} {"train_loss": -5.731168746948242, "global_step": 44843, "epoch": 1067} {"train_loss": -5.67912483215332, "global_step": 44844, "epoch": 1067} {"train_loss": -5.670026779174805, "global_step": 44845, "epoch": 1067} {"train_loss": -5.648067474365234, "global_step": 44846, "epoch": 1067} {"train_loss": -5.757504463195801, "global_step": 44847, "epoch": 1067} {"train_loss": -5.615159034729004, "global_step": 44848, "epoch": 1067} {"train_loss": -5.583036422729492, "global_step": 44849, "epoch": 1067} {"train_loss": -5.63990592956543, "global_step": 44850, "epoch": 1067} {"train_loss": -5.675080299377441, "global_step": 44851, "epoch": 1067} {"train_loss": -5.783687591552734, "global_step": 44852, "epoch": 1067} {"train_loss": -5.6817216873168945, "global_step": 44853, "epoch": 1067} {"train_loss": -5.567218780517578, "global_step": 44854, "epoch": 1067} {"train_loss": -5.687663997922625, "global_step": 44855, "epoch": 1067, "val_loss": 66353.7109375} {"train_loss": -5.698297500610352, "global_step": 44856, "epoch": 1068} {"train_loss": -5.6874918937683105, "global_step": 44857, "epoch": 1068} {"train_loss": -5.8533477783203125, "global_step": 44858, "epoch": 1068} {"train_loss": -5.699952125549316, "global_step": 44859, "epoch": 1068} {"train_loss": -5.672240257263184, "global_step": 44860, "epoch": 1068} {"train_loss": -5.630903244018555, "global_step": 44861, "epoch": 1068} {"train_loss": -5.650064945220947, "global_step": 44862, "epoch": 1068} {"train_loss": -5.683880805969238, "global_step": 44863, "epoch": 1068} {"train_loss": -5.711907386779785, "global_step": 44864, "epoch": 1068} {"train_loss": -5.755914211273193, "global_step": 44865, "epoch": 1068} {"train_loss": -5.780001640319824, "global_step": 44866, "epoch": 1068} {"train_loss": -5.699030876159668, "global_step": 44867, "epoch": 1068} {"train_loss": -5.68182373046875, "global_step": 44868, "epoch": 1068} {"train_loss": -5.659437656402588, "global_step": 44869, "epoch": 1068} {"train_loss": -5.726490020751953, "global_step": 44870, "epoch": 1068} {"train_loss": -5.790801048278809, "global_step": 44871, "epoch": 1068} {"train_loss": -5.660203456878662, "global_step": 44872, "epoch": 1068} {"train_loss": -5.67008113861084, "global_step": 44873, "epoch": 1068} {"train_loss": -5.72562313079834, "global_step": 44874, "epoch": 1068} {"train_loss": -5.731405258178711, "global_step": 44875, "epoch": 1068} {"train_loss": -5.772263526916504, "global_step": 44876, "epoch": 1068} {"train_loss": -5.6885223388671875, "global_step": 44877, "epoch": 1068} {"train_loss": -5.5864105224609375, "global_step": 44878, "epoch": 1068} {"train_loss": -5.714704990386963, "global_step": 44879, "epoch": 1068} {"train_loss": -5.729957580566406, "global_step": 44880, "epoch": 1068} {"train_loss": -5.6700825691223145, "global_step": 44881, "epoch": 1068} {"train_loss": -5.5426411628723145, "global_step": 44882, "epoch": 1068} {"train_loss": -5.779154300689697, "global_step": 44883, "epoch": 1068} {"train_loss": -5.594295978546143, "global_step": 44884, "epoch": 1068} {"train_loss": -5.7517900466918945, "global_step": 44885, "epoch": 1068} {"train_loss": -5.812492370605469, "global_step": 44886, "epoch": 1068} {"train_loss": -5.734926700592041, "global_step": 44887, "epoch": 1068} {"train_loss": -5.6020660400390625, "global_step": 44888, "epoch": 1068} {"train_loss": -5.770667552947998, "global_step": 44889, "epoch": 1068} {"train_loss": -5.696062088012695, "global_step": 44890, "epoch": 1068} {"train_loss": -5.681928634643555, "global_step": 44891, "epoch": 1068} {"train_loss": -5.712536334991455, "global_step": 44892, "epoch": 1068} {"train_loss": -5.751513481140137, "global_step": 44893, "epoch": 1068} {"train_loss": -5.748575210571289, "global_step": 44894, "epoch": 1068} {"train_loss": -5.659828186035156, "global_step": 44895, "epoch": 1068} {"train_loss": -5.71536111831665, "global_step": 44896, "epoch": 1068} {"train_loss": -5.704894894645328, "global_step": 44897, "epoch": 1068, "val_loss": 66295.4453125} {"train_loss": -5.669707775115967, "global_step": 44898, "epoch": 1069} {"train_loss": -5.595034599304199, "global_step": 44899, "epoch": 1069} {"train_loss": -5.655673027038574, "global_step": 44900, "epoch": 1069} {"train_loss": -5.641222953796387, "global_step": 44901, "epoch": 1069} {"train_loss": -5.634193420410156, "global_step": 44902, "epoch": 1069} {"train_loss": -5.738180637359619, "global_step": 44903, "epoch": 1069} {"train_loss": -5.839261531829834, "global_step": 44904, "epoch": 1069} {"train_loss": -5.7866973876953125, "global_step": 44905, "epoch": 1069} {"train_loss": -5.747064590454102, "global_step": 44906, "epoch": 1069} {"train_loss": -5.692276954650879, "global_step": 44907, "epoch": 1069} {"train_loss": -5.6680755615234375, "global_step": 44908, "epoch": 1069} {"train_loss": -5.631956577301025, "global_step": 44909, "epoch": 1069} {"train_loss": -5.687330722808838, "global_step": 44910, "epoch": 1069} {"train_loss": -5.702624320983887, "global_step": 44911, "epoch": 1069} {"train_loss": -5.827577590942383, "global_step": 44912, "epoch": 1069} {"train_loss": -5.690692901611328, "global_step": 44913, "epoch": 1069} {"train_loss": -5.689915657043457, "global_step": 44914, "epoch": 1069} {"train_loss": -5.646040439605713, "global_step": 44915, "epoch": 1069} {"train_loss": -5.637829303741455, "global_step": 44916, "epoch": 1069} {"train_loss": -5.590253829956055, "global_step": 44917, "epoch": 1069} {"train_loss": -5.803773880004883, "global_step": 44918, "epoch": 1069} {"train_loss": -5.653387546539307, "global_step": 44919, "epoch": 1069} {"train_loss": -5.588769912719727, "global_step": 44920, "epoch": 1069} {"train_loss": -5.590290069580078, "global_step": 44921, "epoch": 1069} {"train_loss": -5.7851972579956055, "global_step": 44922, "epoch": 1069} {"train_loss": -5.592136859893799, "global_step": 44923, "epoch": 1069} {"train_loss": -5.602029800415039, "global_step": 44924, "epoch": 1069} {"train_loss": -5.76817512512207, "global_step": 44925, "epoch": 1069} {"train_loss": -5.678023338317871, "global_step": 44926, "epoch": 1069} {"train_loss": -5.651750087738037, "global_step": 44927, "epoch": 1069} {"train_loss": -5.775683403015137, "global_step": 44928, "epoch": 1069} {"train_loss": -5.700927257537842, "global_step": 44929, "epoch": 1069} {"train_loss": -5.771612167358398, "global_step": 44930, "epoch": 1069} {"train_loss": -5.58983039855957, "global_step": 44931, "epoch": 1069} {"train_loss": -5.695930004119873, "global_step": 44932, "epoch": 1069} {"train_loss": -5.761399269104004, "global_step": 44933, "epoch": 1069} {"train_loss": -5.575160980224609, "global_step": 44934, "epoch": 1069} {"train_loss": -5.889806747436523, "global_step": 44935, "epoch": 1069} {"train_loss": -5.642364501953125, "global_step": 44936, "epoch": 1069} {"train_loss": -5.643624305725098, "global_step": 44937, "epoch": 1069} {"train_loss": -5.732901573181152, "global_step": 44938, "epoch": 1069} {"train_loss": -5.688342582611811, "global_step": 44939, "epoch": 1069, "val_loss": 66082.5859375} {"train_loss": -5.6129865646362305, "global_step": 44940, "epoch": 1070} {"train_loss": -5.764127731323242, "global_step": 44941, "epoch": 1070} {"train_loss": -5.724947929382324, "global_step": 44942, "epoch": 1070} {"train_loss": -5.6409912109375, "global_step": 44943, "epoch": 1070} {"train_loss": -5.728657245635986, "global_step": 44944, "epoch": 1070} {"train_loss": -5.593688488006592, "global_step": 44945, "epoch": 1070} {"train_loss": -5.624577522277832, "global_step": 44946, "epoch": 1070} {"train_loss": -5.733006477355957, "global_step": 44947, "epoch": 1070} {"train_loss": -5.7522430419921875, "global_step": 44948, "epoch": 1070} {"train_loss": -5.665422439575195, "global_step": 44949, "epoch": 1070} {"train_loss": -5.5852203369140625, "global_step": 44950, "epoch": 1070} {"train_loss": -5.7155280113220215, "global_step": 44951, "epoch": 1070} {"train_loss": -5.686638832092285, "global_step": 44952, "epoch": 1070} {"train_loss": -5.822389602661133, "global_step": 44953, "epoch": 1070} {"train_loss": -5.751880168914795, "global_step": 44954, "epoch": 1070} {"train_loss": -5.708378791809082, "global_step": 44955, "epoch": 1070} {"train_loss": -5.6334099769592285, "global_step": 44956, "epoch": 1070} {"train_loss": -5.753839492797852, "global_step": 44957, "epoch": 1070} {"train_loss": -5.639662742614746, "global_step": 44958, "epoch": 1070} {"train_loss": -5.7305755615234375, "global_step": 44959, "epoch": 1070} {"train_loss": -5.78175687789917, "global_step": 44960, "epoch": 1070} {"train_loss": -5.749233722686768, "global_step": 44961, "epoch": 1070} {"train_loss": -5.726024627685547, "global_step": 44962, "epoch": 1070} {"train_loss": -5.7908549308776855, "global_step": 44963, "epoch": 1070} {"train_loss": -5.731786727905273, "global_step": 44964, "epoch": 1070} {"train_loss": -5.772614002227783, "global_step": 44965, "epoch": 1070} {"train_loss": -5.7508864402771, "global_step": 44966, "epoch": 1070} {"train_loss": -5.656315803527832, "global_step": 44967, "epoch": 1070} {"train_loss": -5.7965312004089355, "global_step": 44968, "epoch": 1070} {"train_loss": -5.604710102081299, "global_step": 44969, "epoch": 1070} {"train_loss": -5.648221969604492, "global_step": 44970, "epoch": 1070} {"train_loss": -5.575730323791504, "global_step": 44971, "epoch": 1070} {"train_loss": -5.578671455383301, "global_step": 44972, "epoch": 1070} {"train_loss": -5.7057647705078125, "global_step": 44973, "epoch": 1070} {"train_loss": -5.649489402770996, "global_step": 44974, "epoch": 1070} {"train_loss": -5.639676094055176, "global_step": 44975, "epoch": 1070} {"train_loss": -5.628445625305176, "global_step": 44976, "epoch": 1070} {"train_loss": -5.67282772064209, "global_step": 44977, "epoch": 1070} {"train_loss": -5.624245643615723, "global_step": 44978, "epoch": 1070} {"train_loss": -5.737978935241699, "global_step": 44979, "epoch": 1070} {"train_loss": -5.695014953613281, "global_step": 44980, "epoch": 1070} {"train_loss": -5.690755003974552, "global_step": 44981, "epoch": 1070, "val_loss": 66201.8046875} {"train_loss": -5.854372024536133, "global_step": 44982, "epoch": 1071} {"train_loss": -5.547126770019531, "global_step": 44983, "epoch": 1071} {"train_loss": -5.5763678550720215, "global_step": 44984, "epoch": 1071} {"train_loss": -5.664183616638184, "global_step": 44985, "epoch": 1071} {"train_loss": -5.643087387084961, "global_step": 44986, "epoch": 1071} {"train_loss": -5.671098709106445, "global_step": 44987, "epoch": 1071} {"train_loss": -5.540340423583984, "global_step": 44988, "epoch": 1071} {"train_loss": -5.704774856567383, "global_step": 44989, "epoch": 1071} {"train_loss": -5.669034957885742, "global_step": 44990, "epoch": 1071} {"train_loss": -5.7159342765808105, "global_step": 44991, "epoch": 1071} {"train_loss": -5.782292366027832, "global_step": 44992, "epoch": 1071} {"train_loss": -5.651805877685547, "global_step": 44993, "epoch": 1071} {"train_loss": -5.65727424621582, "global_step": 44994, "epoch": 1071} {"train_loss": -5.600100517272949, "global_step": 44995, "epoch": 1071} {"train_loss": -5.641778469085693, "global_step": 44996, "epoch": 1071} {"train_loss": -5.6544575691223145, "global_step": 44997, "epoch": 1071} {"train_loss": -5.664193153381348, "global_step": 44998, "epoch": 1071} {"train_loss": -5.69131326675415, "global_step": 44999, "epoch": 1071} {"train_loss": -5.555665969848633, "global_step": 45000, "epoch": 1071} {"train_loss": -5.640880107879639, "global_step": 45001, "epoch": 1071} {"train_loss": -5.707083225250244, "global_step": 45002, "epoch": 1071} {"train_loss": -5.58607292175293, "global_step": 45003, "epoch": 1071} {"train_loss": -5.698481559753418, "global_step": 45004, "epoch": 1071} {"train_loss": -5.6232733726501465, "global_step": 45005, "epoch": 1071} {"train_loss": -5.6287055015563965, "global_step": 45006, "epoch": 1071} {"train_loss": -5.731821060180664, "global_step": 45007, "epoch": 1071} {"train_loss": -5.770839691162109, "global_step": 45008, "epoch": 1071} {"train_loss": -5.703846454620361, "global_step": 45009, "epoch": 1071} {"train_loss": -5.565279006958008, "global_step": 45010, "epoch": 1071} {"train_loss": -5.731202602386475, "global_step": 45011, "epoch": 1071} {"train_loss": -5.805489540100098, "global_step": 45012, "epoch": 1071} {"train_loss": -5.716835021972656, "global_step": 45013, "epoch": 1071} {"train_loss": -5.7707037925720215, "global_step": 45014, "epoch": 1071} {"train_loss": -5.804245471954346, "global_step": 45015, "epoch": 1071} {"train_loss": -5.5221052169799805, "global_step": 45016, "epoch": 1071} {"train_loss": -5.5929155349731445, "global_step": 45017, "epoch": 1071} {"train_loss": -5.728586196899414, "global_step": 45018, "epoch": 1071} {"train_loss": -5.645137786865234, "global_step": 45019, "epoch": 1071} {"train_loss": -5.755678176879883, "global_step": 45020, "epoch": 1071} {"train_loss": -5.774489879608154, "global_step": 45021, "epoch": 1071} {"train_loss": -5.7319488525390625, "global_step": 45022, "epoch": 1071} {"train_loss": -5.674236490612938, "global_step": 45023, "epoch": 1071, "val_loss": 65936.078125} {"train_loss": -5.686448097229004, "global_step": 45024, "epoch": 1072} {"train_loss": -5.833630561828613, "global_step": 45025, "epoch": 1072} {"train_loss": -5.78741455078125, "global_step": 45026, "epoch": 1072} {"train_loss": -5.7713494300842285, "global_step": 45027, "epoch": 1072} {"train_loss": -5.781133651733398, "global_step": 45028, "epoch": 1072} {"train_loss": -5.745774745941162, "global_step": 45029, "epoch": 1072} {"train_loss": -5.806267261505127, "global_step": 45030, "epoch": 1072} {"train_loss": -5.769580364227295, "global_step": 45031, "epoch": 1072} {"train_loss": -5.532433986663818, "global_step": 45032, "epoch": 1072} {"train_loss": -5.7881598472595215, "global_step": 45033, "epoch": 1072} {"train_loss": -5.951376914978027, "global_step": 45034, "epoch": 1072} {"train_loss": -5.802544116973877, "global_step": 45035, "epoch": 1072} {"train_loss": -5.663750171661377, "global_step": 45036, "epoch": 1072} {"train_loss": -5.679439544677734, "global_step": 45037, "epoch": 1072} {"train_loss": -5.6238789558410645, "global_step": 45038, "epoch": 1072} {"train_loss": -5.681468963623047, "global_step": 45039, "epoch": 1072} {"train_loss": -5.69164514541626, "global_step": 45040, "epoch": 1072} {"train_loss": -5.718472480773926, "global_step": 45041, "epoch": 1072} {"train_loss": -5.641374111175537, "global_step": 45042, "epoch": 1072} {"train_loss": -5.73679256439209, "global_step": 45043, "epoch": 1072} {"train_loss": -5.70208740234375, "global_step": 45044, "epoch": 1072} {"train_loss": -5.748270034790039, "global_step": 45045, "epoch": 1072} {"train_loss": -5.7948126792907715, "global_step": 45046, "epoch": 1072} {"train_loss": -5.543275833129883, "global_step": 45047, "epoch": 1072} {"train_loss": -5.884435653686523, "global_step": 45048, "epoch": 1072} {"train_loss": -5.7110795974731445, "global_step": 45049, "epoch": 1072} {"train_loss": -5.749536514282227, "global_step": 45050, "epoch": 1072} {"train_loss": -5.665257453918457, "global_step": 45051, "epoch": 1072} {"train_loss": -5.650989532470703, "global_step": 45052, "epoch": 1072} {"train_loss": -5.546003341674805, "global_step": 45053, "epoch": 1072} {"train_loss": -5.717267036437988, "global_step": 45054, "epoch": 1072} {"train_loss": -5.758393287658691, "global_step": 45055, "epoch": 1072} {"train_loss": -5.628411293029785, "global_step": 45056, "epoch": 1072} {"train_loss": -5.75691556930542, "global_step": 45057, "epoch": 1072} {"train_loss": -5.59792423248291, "global_step": 45058, "epoch": 1072} {"train_loss": -5.694832801818848, "global_step": 45059, "epoch": 1072} {"train_loss": -5.641919136047363, "global_step": 45060, "epoch": 1072} {"train_loss": -5.617502212524414, "global_step": 45061, "epoch": 1072} {"train_loss": -5.546292304992676, "global_step": 45062, "epoch": 1072} {"train_loss": -5.614309787750244, "global_step": 45063, "epoch": 1072} {"train_loss": -5.665271282196045, "global_step": 45064, "epoch": 1072} {"train_loss": -5.702726443608602, "global_step": 45065, "epoch": 1072, "val_loss": 66302.7734375} {"train_loss": -5.606645584106445, "global_step": 45066, "epoch": 1073} {"train_loss": -5.648961067199707, "global_step": 45067, "epoch": 1073} {"train_loss": -5.68109130859375, "global_step": 45068, "epoch": 1073} {"train_loss": -5.715412616729736, "global_step": 45069, "epoch": 1073} {"train_loss": -5.764029502868652, "global_step": 45070, "epoch": 1073} {"train_loss": -5.495224475860596, "global_step": 45071, "epoch": 1073} {"train_loss": -5.704806327819824, "global_step": 45072, "epoch": 1073} {"train_loss": -5.645942687988281, "global_step": 45073, "epoch": 1073} {"train_loss": -5.708513259887695, "global_step": 45074, "epoch": 1073} {"train_loss": -5.551854133605957, "global_step": 45075, "epoch": 1073} {"train_loss": -5.593958377838135, "global_step": 45076, "epoch": 1073} {"train_loss": -5.701511859893799, "global_step": 45077, "epoch": 1073} {"train_loss": -5.747213363647461, "global_step": 45078, "epoch": 1073} {"train_loss": -5.8838701248168945, "global_step": 45079, "epoch": 1073} {"train_loss": -5.693351745605469, "global_step": 45080, "epoch": 1073} {"train_loss": -5.849953651428223, "global_step": 45081, "epoch": 1073} {"train_loss": -5.7882914543151855, "global_step": 45082, "epoch": 1073} {"train_loss": -5.659371376037598, "global_step": 45083, "epoch": 1073} {"train_loss": -5.820015907287598, "global_step": 45084, "epoch": 1073} {"train_loss": -5.583127021789551, "global_step": 45085, "epoch": 1073} {"train_loss": -5.769256591796875, "global_step": 45086, "epoch": 1073} {"train_loss": -5.694408416748047, "global_step": 45087, "epoch": 1073} {"train_loss": -5.661647796630859, "global_step": 45088, "epoch": 1073} {"train_loss": -5.601539611816406, "global_step": 45089, "epoch": 1073} {"train_loss": -5.64200496673584, "global_step": 45090, "epoch": 1073} {"train_loss": -5.681023597717285, "global_step": 45091, "epoch": 1073} {"train_loss": -5.682222843170166, "global_step": 45092, "epoch": 1073} {"train_loss": -5.688754081726074, "global_step": 45093, "epoch": 1073} {"train_loss": -5.6979851722717285, "global_step": 45094, "epoch": 1073} {"train_loss": -5.729516983032227, "global_step": 45095, "epoch": 1073} {"train_loss": -5.727911949157715, "global_step": 45096, "epoch": 1073} {"train_loss": -5.653205394744873, "global_step": 45097, "epoch": 1073} {"train_loss": -5.679656982421875, "global_step": 45098, "epoch": 1073} {"train_loss": -5.841217994689941, "global_step": 45099, "epoch": 1073} {"train_loss": -5.750177383422852, "global_step": 45100, "epoch": 1073} {"train_loss": -5.76913595199585, "global_step": 45101, "epoch": 1073} {"train_loss": -5.535797119140625, "global_step": 45102, "epoch": 1073} {"train_loss": -5.65650749206543, "global_step": 45103, "epoch": 1073} {"train_loss": -5.587008953094482, "global_step": 45104, "epoch": 1073} {"train_loss": -5.759685516357422, "global_step": 45105, "epoch": 1073} {"train_loss": -5.787533760070801, "global_step": 45106, "epoch": 1073} {"train_loss": -5.695332754225958, "global_step": 45107, "epoch": 1073, "val_loss": 65964.9140625} {"train_loss": -5.691611289978027, "global_step": 45108, "epoch": 1074} {"train_loss": -5.725013732910156, "global_step": 45109, "epoch": 1074} {"train_loss": -5.806082725524902, "global_step": 45110, "epoch": 1074} {"train_loss": -5.703357696533203, "global_step": 45111, "epoch": 1074} {"train_loss": -5.797693729400635, "global_step": 45112, "epoch": 1074} {"train_loss": -5.649299621582031, "global_step": 45113, "epoch": 1074} {"train_loss": -5.647841453552246, "global_step": 45114, "epoch": 1074} {"train_loss": -5.659135818481445, "global_step": 45115, "epoch": 1074} {"train_loss": -5.670071125030518, "global_step": 45116, "epoch": 1074} {"train_loss": -5.639151573181152, "global_step": 45117, "epoch": 1074} {"train_loss": -5.73124361038208, "global_step": 45118, "epoch": 1074} {"train_loss": -5.662313461303711, "global_step": 45119, "epoch": 1074} {"train_loss": -5.792843341827393, "global_step": 45120, "epoch": 1074} {"train_loss": -5.7821364402771, "global_step": 45121, "epoch": 1074} {"train_loss": -5.7479400634765625, "global_step": 45122, "epoch": 1074} {"train_loss": -5.73316764831543, "global_step": 45123, "epoch": 1074} {"train_loss": -5.733609199523926, "global_step": 45124, "epoch": 1074} {"train_loss": -5.715080261230469, "global_step": 45125, "epoch": 1074} {"train_loss": -5.694173336029053, "global_step": 45126, "epoch": 1074} {"train_loss": -5.592662811279297, "global_step": 45127, "epoch": 1074} {"train_loss": -5.6323466300964355, "global_step": 45128, "epoch": 1074} {"train_loss": -5.625707626342773, "global_step": 45129, "epoch": 1074} {"train_loss": -5.843480587005615, "global_step": 45130, "epoch": 1074} {"train_loss": -5.665007591247559, "global_step": 45131, "epoch": 1074} {"train_loss": -5.731062889099121, "global_step": 45132, "epoch": 1074} {"train_loss": -5.605790138244629, "global_step": 45133, "epoch": 1074} {"train_loss": -5.771458148956299, "global_step": 45134, "epoch": 1074} {"train_loss": -5.551558494567871, "global_step": 45135, "epoch": 1074} {"train_loss": -5.657547950744629, "global_step": 45136, "epoch": 1074} {"train_loss": -5.676595687866211, "global_step": 45137, "epoch": 1074} {"train_loss": -5.622777938842773, "global_step": 45138, "epoch": 1074} {"train_loss": -5.811573028564453, "global_step": 45139, "epoch": 1074} {"train_loss": -5.691189289093018, "global_step": 45140, "epoch": 1074} {"train_loss": -5.64488410949707, "global_step": 45141, "epoch": 1074} {"train_loss": -5.634596824645996, "global_step": 45142, "epoch": 1074} {"train_loss": -5.764687538146973, "global_step": 45143, "epoch": 1074} {"train_loss": -5.682153701782227, "global_step": 45144, "epoch": 1074} {"train_loss": -5.625631332397461, "global_step": 45145, "epoch": 1074} {"train_loss": -5.687740325927734, "global_step": 45146, "epoch": 1074} {"train_loss": -5.633360385894775, "global_step": 45147, "epoch": 1074} {"train_loss": -5.727384567260742, "global_step": 45148, "epoch": 1074} {"train_loss": -5.693566719690959, "global_step": 45149, "epoch": 1074, "val_loss": 66003.9140625} {"train_loss": -5.638667106628418, "global_step": 45150, "epoch": 1075} {"train_loss": -5.728232383728027, "global_step": 45151, "epoch": 1075} {"train_loss": -5.573549747467041, "global_step": 45152, "epoch": 1075} {"train_loss": -5.647674083709717, "global_step": 45153, "epoch": 1075} {"train_loss": -5.798239707946777, "global_step": 45154, "epoch": 1075} {"train_loss": -5.603082656860352, "global_step": 45155, "epoch": 1075} {"train_loss": -5.798736572265625, "global_step": 45156, "epoch": 1075} {"train_loss": -5.626224517822266, "global_step": 45157, "epoch": 1075} {"train_loss": -5.8003435134887695, "global_step": 45158, "epoch": 1075} {"train_loss": -5.8335771560668945, "global_step": 45159, "epoch": 1075} {"train_loss": -5.700182914733887, "global_step": 45160, "epoch": 1075} {"train_loss": -5.757643222808838, "global_step": 45161, "epoch": 1075} {"train_loss": -5.760846138000488, "global_step": 45162, "epoch": 1075} {"train_loss": -5.646358013153076, "global_step": 45163, "epoch": 1075} {"train_loss": -5.703974723815918, "global_step": 45164, "epoch": 1075} {"train_loss": -5.698409080505371, "global_step": 45165, "epoch": 1075} {"train_loss": -5.639810562133789, "global_step": 45166, "epoch": 1075} {"train_loss": -5.673295021057129, "global_step": 45167, "epoch": 1075} {"train_loss": -5.641178131103516, "global_step": 45168, "epoch": 1075} {"train_loss": -5.686581611633301, "global_step": 45169, "epoch": 1075} {"train_loss": -5.6748762130737305, "global_step": 45170, "epoch": 1075} {"train_loss": -5.515322685241699, "global_step": 45171, "epoch": 1075} {"train_loss": -5.738180637359619, "global_step": 45172, "epoch": 1075} {"train_loss": -5.723244667053223, "global_step": 45173, "epoch": 1075} {"train_loss": -5.582718849182129, "global_step": 45174, "epoch": 1075} {"train_loss": -5.748344421386719, "global_step": 45175, "epoch": 1075} {"train_loss": -5.607829570770264, "global_step": 45176, "epoch": 1075} {"train_loss": -5.6690473556518555, "global_step": 45177, "epoch": 1075} {"train_loss": -5.640081405639648, "global_step": 45178, "epoch": 1075} {"train_loss": -5.649460792541504, "global_step": 45179, "epoch": 1075} {"train_loss": -5.605457305908203, "global_step": 45180, "epoch": 1075} {"train_loss": -5.697901248931885, "global_step": 45181, "epoch": 1075} {"train_loss": -5.705272674560547, "global_step": 45182, "epoch": 1075} {"train_loss": -5.6360392570495605, "global_step": 45183, "epoch": 1075} {"train_loss": -5.560290336608887, "global_step": 45184, "epoch": 1075} {"train_loss": -5.837335586547852, "global_step": 45185, "epoch": 1075} {"train_loss": -5.707955360412598, "global_step": 45186, "epoch": 1075} {"train_loss": -5.6431884765625, "global_step": 45187, "epoch": 1075} {"train_loss": -5.736819267272949, "global_step": 45188, "epoch": 1075} {"train_loss": -5.894954681396484, "global_step": 45189, "epoch": 1075} {"train_loss": -5.690169811248779, "global_step": 45190, "epoch": 1075} {"train_loss": -5.688367945807321, "global_step": 45191, "epoch": 1075, "val_loss": 66382.8125} {"train_loss": -5.6640625, "global_step": 45192, "epoch": 1076} {"train_loss": -5.628547668457031, "global_step": 45193, "epoch": 1076} {"train_loss": -5.811968803405762, "global_step": 45194, "epoch": 1076} {"train_loss": -5.586730003356934, "global_step": 45195, "epoch": 1076} {"train_loss": -5.605391979217529, "global_step": 45196, "epoch": 1076} {"train_loss": -5.697036266326904, "global_step": 45197, "epoch": 1076} {"train_loss": -5.7519211769104, "global_step": 45198, "epoch": 1076} {"train_loss": -5.685004234313965, "global_step": 45199, "epoch": 1076} {"train_loss": -5.634158611297607, "global_step": 45200, "epoch": 1076} {"train_loss": -5.651752471923828, "global_step": 45201, "epoch": 1076} {"train_loss": -5.733132839202881, "global_step": 45202, "epoch": 1076} {"train_loss": -5.627991676330566, "global_step": 45203, "epoch": 1076} {"train_loss": -5.661521911621094, "global_step": 45204, "epoch": 1076} {"train_loss": -5.727468967437744, "global_step": 45205, "epoch": 1076} {"train_loss": -5.680246353149414, "global_step": 45206, "epoch": 1076} {"train_loss": -5.7579240798950195, "global_step": 45207, "epoch": 1076} {"train_loss": -5.723628044128418, "global_step": 45208, "epoch": 1076} {"train_loss": -5.578213691711426, "global_step": 45209, "epoch": 1076} {"train_loss": -5.6688642501831055, "global_step": 45210, "epoch": 1076} {"train_loss": -5.798378944396973, "global_step": 45211, "epoch": 1076} {"train_loss": -5.634191989898682, "global_step": 45212, "epoch": 1076} {"train_loss": -5.777711868286133, "global_step": 45213, "epoch": 1076} {"train_loss": -5.716974258422852, "global_step": 45214, "epoch": 1076} {"train_loss": -5.715790748596191, "global_step": 45215, "epoch": 1076} {"train_loss": -5.730599880218506, "global_step": 45216, "epoch": 1076} {"train_loss": -5.651693820953369, "global_step": 45217, "epoch": 1076} {"train_loss": -5.7497172355651855, "global_step": 45218, "epoch": 1076} {"train_loss": -5.664328575134277, "global_step": 45219, "epoch": 1076} {"train_loss": -5.743288040161133, "global_step": 45220, "epoch": 1076} {"train_loss": -5.681818962097168, "global_step": 45221, "epoch": 1076} {"train_loss": -5.764681816101074, "global_step": 45222, "epoch": 1076} {"train_loss": -5.6482133865356445, "global_step": 45223, "epoch": 1076} {"train_loss": -5.727066993713379, "global_step": 45224, "epoch": 1076} {"train_loss": -5.735528945922852, "global_step": 45225, "epoch": 1076} {"train_loss": -5.705565452575684, "global_step": 45226, "epoch": 1076} {"train_loss": -5.748112201690674, "global_step": 45227, "epoch": 1076} {"train_loss": -5.704829216003418, "global_step": 45228, "epoch": 1076} {"train_loss": -5.732952117919922, "global_step": 45229, "epoch": 1076} {"train_loss": -5.724401473999023, "global_step": 45230, "epoch": 1076} {"train_loss": -5.474923133850098, "global_step": 45231, "epoch": 1076} {"train_loss": -5.758401870727539, "global_step": 45232, "epoch": 1076} {"train_loss": -5.6928230580829435, "global_step": 45233, "epoch": 1076, "val_loss": 65797.4453125} {"train_loss": -5.657950401306152, "global_step": 45234, "epoch": 1077} {"train_loss": -5.763731956481934, "global_step": 45235, "epoch": 1077} {"train_loss": -5.57255744934082, "global_step": 45236, "epoch": 1077} {"train_loss": -5.612098693847656, "global_step": 45237, "epoch": 1077} {"train_loss": -5.730100631713867, "global_step": 45238, "epoch": 1077} {"train_loss": -5.646158695220947, "global_step": 45239, "epoch": 1077} {"train_loss": -5.764552593231201, "global_step": 45240, "epoch": 1077} {"train_loss": -5.601799488067627, "global_step": 45241, "epoch": 1077} {"train_loss": -5.702112674713135, "global_step": 45242, "epoch": 1077} {"train_loss": -5.790288925170898, "global_step": 45243, "epoch": 1077} {"train_loss": -5.7029218673706055, "global_step": 45244, "epoch": 1077} {"train_loss": -5.639281272888184, "global_step": 45245, "epoch": 1077} {"train_loss": -5.589358329772949, "global_step": 45246, "epoch": 1077} {"train_loss": -5.669322967529297, "global_step": 45247, "epoch": 1077} {"train_loss": -5.685917854309082, "global_step": 45248, "epoch": 1077} {"train_loss": -5.669476509094238, "global_step": 45249, "epoch": 1077} {"train_loss": -5.815055847167969, "global_step": 45250, "epoch": 1077} {"train_loss": -5.625307083129883, "global_step": 45251, "epoch": 1077} {"train_loss": -5.7760725021362305, "global_step": 45252, "epoch": 1077} {"train_loss": -5.6365509033203125, "global_step": 45253, "epoch": 1077} {"train_loss": -5.723476886749268, "global_step": 45254, "epoch": 1077} {"train_loss": -5.6686296463012695, "global_step": 45255, "epoch": 1077} {"train_loss": -5.802594184875488, "global_step": 45256, "epoch": 1077} {"train_loss": -5.696079254150391, "global_step": 45257, "epoch": 1077} {"train_loss": -5.755197525024414, "global_step": 45258, "epoch": 1077} {"train_loss": -5.628552436828613, "global_step": 45259, "epoch": 1077} {"train_loss": -5.576913356781006, "global_step": 45260, "epoch": 1077} {"train_loss": -5.722953796386719, "global_step": 45261, "epoch": 1077} {"train_loss": -5.634099960327148, "global_step": 45262, "epoch": 1077} {"train_loss": -5.771243095397949, "global_step": 45263, "epoch": 1077} {"train_loss": -5.530324935913086, "global_step": 45264, "epoch": 1077} {"train_loss": -5.656161785125732, "global_step": 45265, "epoch": 1077} {"train_loss": -5.535002708435059, "global_step": 45266, "epoch": 1077} {"train_loss": -5.534309387207031, "global_step": 45267, "epoch": 1077} {"train_loss": -5.737567901611328, "global_step": 45268, "epoch": 1077} {"train_loss": -5.542331695556641, "global_step": 45269, "epoch": 1077} {"train_loss": -5.631504535675049, "global_step": 45270, "epoch": 1077} {"train_loss": -5.521878242492676, "global_step": 45271, "epoch": 1077} {"train_loss": -5.519980430603027, "global_step": 45272, "epoch": 1077} {"train_loss": -5.516029357910156, "global_step": 45273, "epoch": 1077} {"train_loss": -5.661548137664795, "global_step": 45274, "epoch": 1077} {"train_loss": -5.658594619660151, "global_step": 45275, "epoch": 1077, "val_loss": 66314.96875} {"train_loss": -5.723735809326172, "global_step": 45276, "epoch": 1078} {"train_loss": -5.666982173919678, "global_step": 45277, "epoch": 1078} {"train_loss": -5.587445259094238, "global_step": 45278, "epoch": 1078} {"train_loss": -5.633023262023926, "global_step": 45279, "epoch": 1078} {"train_loss": -5.639774799346924, "global_step": 45280, "epoch": 1078} {"train_loss": -5.6794586181640625, "global_step": 45281, "epoch": 1078} {"train_loss": -5.707573890686035, "global_step": 45282, "epoch": 1078} {"train_loss": -5.626621246337891, "global_step": 45283, "epoch": 1078} {"train_loss": -5.689690113067627, "global_step": 45284, "epoch": 1078} {"train_loss": -5.62739372253418, "global_step": 45285, "epoch": 1078} {"train_loss": -5.726871490478516, "global_step": 45286, "epoch": 1078} {"train_loss": -5.540509223937988, "global_step": 45287, "epoch": 1078} {"train_loss": -5.703265190124512, "global_step": 45288, "epoch": 1078} {"train_loss": -5.620415210723877, "global_step": 45289, "epoch": 1078} {"train_loss": -5.662184715270996, "global_step": 45290, "epoch": 1078} {"train_loss": -5.810805320739746, "global_step": 45291, "epoch": 1078} {"train_loss": -5.678892135620117, "global_step": 45292, "epoch": 1078} {"train_loss": -5.626184463500977, "global_step": 45293, "epoch": 1078} {"train_loss": -5.637963771820068, "global_step": 45294, "epoch": 1078} {"train_loss": -5.746883869171143, "global_step": 45295, "epoch": 1078} {"train_loss": -5.860091209411621, "global_step": 45296, "epoch": 1078} {"train_loss": -5.670401096343994, "global_step": 45297, "epoch": 1078} {"train_loss": -5.725541114807129, "global_step": 45298, "epoch": 1078} {"train_loss": -5.73406982421875, "global_step": 45299, "epoch": 1078} {"train_loss": -5.63092565536499, "global_step": 45300, "epoch": 1078} {"train_loss": -5.719278335571289, "global_step": 45301, "epoch": 1078} {"train_loss": -5.775634288787842, "global_step": 45302, "epoch": 1078} {"train_loss": -5.864538192749023, "global_step": 45303, "epoch": 1078} {"train_loss": -5.651088714599609, "global_step": 45304, "epoch": 1078} {"train_loss": -5.657257080078125, "global_step": 45305, "epoch": 1078} {"train_loss": -5.656982421875, "global_step": 45306, "epoch": 1078} {"train_loss": -5.6822896003723145, "global_step": 45307, "epoch": 1078} {"train_loss": -5.64363956451416, "global_step": 45308, "epoch": 1078} {"train_loss": -5.630712032318115, "global_step": 45309, "epoch": 1078} {"train_loss": -5.626100540161133, "global_step": 45310, "epoch": 1078} {"train_loss": -5.75209903717041, "global_step": 45311, "epoch": 1078} {"train_loss": -5.688037872314453, "global_step": 45312, "epoch": 1078} {"train_loss": -5.651348114013672, "global_step": 45313, "epoch": 1078} {"train_loss": -5.771120071411133, "global_step": 45314, "epoch": 1078} {"train_loss": -5.786311626434326, "global_step": 45315, "epoch": 1078} {"train_loss": -5.7523884773254395, "global_step": 45316, "epoch": 1078} {"train_loss": -5.688765446345012, "global_step": 45317, "epoch": 1078, "val_loss": 66316.421875} {"train_loss": -5.696088790893555, "global_step": 45318, "epoch": 1079} {"train_loss": -5.652543544769287, "global_step": 45319, "epoch": 1079} {"train_loss": -5.694818496704102, "global_step": 45320, "epoch": 1079} {"train_loss": -5.6141510009765625, "global_step": 45321, "epoch": 1079} {"train_loss": -5.642384052276611, "global_step": 45322, "epoch": 1079} {"train_loss": -5.778013229370117, "global_step": 45323, "epoch": 1079} {"train_loss": -5.774192810058594, "global_step": 45324, "epoch": 1079} {"train_loss": -5.682271957397461, "global_step": 45325, "epoch": 1079} {"train_loss": -5.690532207489014, "global_step": 45326, "epoch": 1079} {"train_loss": -5.705676078796387, "global_step": 45327, "epoch": 1079} {"train_loss": -5.734641075134277, "global_step": 45328, "epoch": 1079} {"train_loss": -5.615941524505615, "global_step": 45329, "epoch": 1079} {"train_loss": -5.813969612121582, "global_step": 45330, "epoch": 1079} {"train_loss": -5.662402153015137, "global_step": 45331, "epoch": 1079} {"train_loss": -5.793707847595215, "global_step": 45332, "epoch": 1079} {"train_loss": -5.663353443145752, "global_step": 45333, "epoch": 1079} {"train_loss": -5.617781639099121, "global_step": 45334, "epoch": 1079} {"train_loss": -5.845332145690918, "global_step": 45335, "epoch": 1079} {"train_loss": -5.697910308837891, "global_step": 45336, "epoch": 1079} {"train_loss": -5.601131916046143, "global_step": 45337, "epoch": 1079} {"train_loss": -5.6787109375, "global_step": 45338, "epoch": 1079} {"train_loss": -5.703876972198486, "global_step": 45339, "epoch": 1079} {"train_loss": -5.673613548278809, "global_step": 45340, "epoch": 1079} {"train_loss": -5.821807861328125, "global_step": 45341, "epoch": 1079} {"train_loss": -5.790946960449219, "global_step": 45342, "epoch": 1079} {"train_loss": -5.774839401245117, "global_step": 45343, "epoch": 1079} {"train_loss": -5.664485931396484, "global_step": 45344, "epoch": 1079} {"train_loss": -5.638843536376953, "global_step": 45345, "epoch": 1079} {"train_loss": -5.674725532531738, "global_step": 45346, "epoch": 1079} {"train_loss": -5.814797401428223, "global_step": 45347, "epoch": 1079} {"train_loss": -5.689355850219727, "global_step": 45348, "epoch": 1079} {"train_loss": -5.59765100479126, "global_step": 45349, "epoch": 1079} {"train_loss": -5.74677038192749, "global_step": 45350, "epoch": 1079} {"train_loss": -5.667721748352051, "global_step": 45351, "epoch": 1079} {"train_loss": -5.70216703414917, "global_step": 45352, "epoch": 1079} {"train_loss": -5.798101425170898, "global_step": 45353, "epoch": 1079} {"train_loss": -5.737751007080078, "global_step": 45354, "epoch": 1079} {"train_loss": -5.667929649353027, "global_step": 45355, "epoch": 1079} {"train_loss": -5.778262615203857, "global_step": 45356, "epoch": 1079} {"train_loss": -5.6175384521484375, "global_step": 45357, "epoch": 1079} {"train_loss": -5.607200622558594, "global_step": 45358, "epoch": 1079} {"train_loss": -5.7049080190204435, "global_step": 45359, "epoch": 1079, "val_loss": 65969.9375} {"train_loss": -5.791996002197266, "global_step": 45360, "epoch": 1080} {"train_loss": -5.691075325012207, "global_step": 45361, "epoch": 1080} {"train_loss": -5.817022323608398, "global_step": 45362, "epoch": 1080} {"train_loss": -5.740442276000977, "global_step": 45363, "epoch": 1080} {"train_loss": -5.744556427001953, "global_step": 45364, "epoch": 1080} {"train_loss": -5.638134956359863, "global_step": 45365, "epoch": 1080} {"train_loss": -5.7885565757751465, "global_step": 45366, "epoch": 1080} {"train_loss": -5.692903518676758, "global_step": 45367, "epoch": 1080} {"train_loss": -5.600616931915283, "global_step": 45368, "epoch": 1080} {"train_loss": -5.607171058654785, "global_step": 45369, "epoch": 1080} {"train_loss": -5.719204902648926, "global_step": 45370, "epoch": 1080} {"train_loss": -5.679823398590088, "global_step": 45371, "epoch": 1080} {"train_loss": -5.547095775604248, "global_step": 45372, "epoch": 1080} {"train_loss": -5.738438606262207, "global_step": 45373, "epoch": 1080} {"train_loss": -5.6394147872924805, "global_step": 45374, "epoch": 1080} {"train_loss": -5.718207359313965, "global_step": 45375, "epoch": 1080} {"train_loss": -5.677247047424316, "global_step": 45376, "epoch": 1080} {"train_loss": -5.691384792327881, "global_step": 45377, "epoch": 1080} {"train_loss": -5.702437400817871, "global_step": 45378, "epoch": 1080} {"train_loss": -5.681026935577393, "global_step": 45379, "epoch": 1080} {"train_loss": -5.740222930908203, "global_step": 45380, "epoch": 1080} {"train_loss": -5.740400791168213, "global_step": 45381, "epoch": 1080} {"train_loss": -5.687111854553223, "global_step": 45382, "epoch": 1080} {"train_loss": -5.684800148010254, "global_step": 45383, "epoch": 1080} {"train_loss": -5.624226093292236, "global_step": 45384, "epoch": 1080} {"train_loss": -5.719770431518555, "global_step": 45385, "epoch": 1080} {"train_loss": -5.724035263061523, "global_step": 45386, "epoch": 1080} {"train_loss": -5.565430641174316, "global_step": 45387, "epoch": 1080} {"train_loss": -5.703639984130859, "global_step": 45388, "epoch": 1080} {"train_loss": -5.795931816101074, "global_step": 45389, "epoch": 1080} {"train_loss": -5.8686909675598145, "global_step": 45390, "epoch": 1080} {"train_loss": -5.694193363189697, "global_step": 45391, "epoch": 1080} {"train_loss": -5.723741054534912, "global_step": 45392, "epoch": 1080} {"train_loss": -5.735827922821045, "global_step": 45393, "epoch": 1080} {"train_loss": -5.641390800476074, "global_step": 45394, "epoch": 1080} {"train_loss": -5.686202526092529, "global_step": 45395, "epoch": 1080} {"train_loss": -5.680306434631348, "global_step": 45396, "epoch": 1080} {"train_loss": -5.675410747528076, "global_step": 45397, "epoch": 1080} {"train_loss": -5.6265482902526855, "global_step": 45398, "epoch": 1080} {"train_loss": -5.7489423751831055, "global_step": 45399, "epoch": 1080} {"train_loss": -5.665755271911621, "global_step": 45400, "epoch": 1080} {"train_loss": -5.701444784800212, "global_step": 45401, "epoch": 1080, "val_loss": 66319.015625} {"train_loss": -5.7186431884765625, "global_step": 45402, "epoch": 1081} {"train_loss": -5.73784875869751, "global_step": 45403, "epoch": 1081} {"train_loss": -5.574054718017578, "global_step": 45404, "epoch": 1081} {"train_loss": -5.8107099533081055, "global_step": 45405, "epoch": 1081} {"train_loss": -5.7502593994140625, "global_step": 45406, "epoch": 1081} {"train_loss": -5.716977119445801, "global_step": 45407, "epoch": 1081} {"train_loss": -5.701949596405029, "global_step": 45408, "epoch": 1081} {"train_loss": -5.7008819580078125, "global_step": 45409, "epoch": 1081} {"train_loss": -5.466184616088867, "global_step": 45410, "epoch": 1081} {"train_loss": -5.6861186027526855, "global_step": 45411, "epoch": 1081} {"train_loss": -5.712144374847412, "global_step": 45412, "epoch": 1081} {"train_loss": -5.713151931762695, "global_step": 45413, "epoch": 1081} {"train_loss": -5.806338310241699, "global_step": 45414, "epoch": 1081} {"train_loss": -5.694339752197266, "global_step": 45415, "epoch": 1081} {"train_loss": -5.7126054763793945, "global_step": 45416, "epoch": 1081} {"train_loss": -5.758937835693359, "global_step": 45417, "epoch": 1081} {"train_loss": -5.570985794067383, "global_step": 45418, "epoch": 1081} {"train_loss": -5.709767818450928, "global_step": 45419, "epoch": 1081} {"train_loss": -5.683178424835205, "global_step": 45420, "epoch": 1081} {"train_loss": -5.749790191650391, "global_step": 45421, "epoch": 1081} {"train_loss": -5.664921760559082, "global_step": 45422, "epoch": 1081} {"train_loss": -5.668033599853516, "global_step": 45423, "epoch": 1081} {"train_loss": -5.667116165161133, "global_step": 45424, "epoch": 1081} {"train_loss": -5.699065208435059, "global_step": 45425, "epoch": 1081} {"train_loss": -5.703083515167236, "global_step": 45426, "epoch": 1081} {"train_loss": -5.774478912353516, "global_step": 45427, "epoch": 1081} {"train_loss": -5.599830627441406, "global_step": 45428, "epoch": 1081} {"train_loss": -5.630999565124512, "global_step": 45429, "epoch": 1081} {"train_loss": -5.623843193054199, "global_step": 45430, "epoch": 1081} {"train_loss": -5.675170421600342, "global_step": 45431, "epoch": 1081} {"train_loss": -5.781832218170166, "global_step": 45432, "epoch": 1081} {"train_loss": -5.675179481506348, "global_step": 45433, "epoch": 1081} {"train_loss": -5.568614482879639, "global_step": 45434, "epoch": 1081} {"train_loss": -5.791867733001709, "global_step": 45435, "epoch": 1081} {"train_loss": -5.632868766784668, "global_step": 45436, "epoch": 1081} {"train_loss": -5.643821716308594, "global_step": 45437, "epoch": 1081} {"train_loss": -5.755487442016602, "global_step": 45438, "epoch": 1081} {"train_loss": -5.662319183349609, "global_step": 45439, "epoch": 1081} {"train_loss": -5.723278999328613, "global_step": 45440, "epoch": 1081} {"train_loss": -5.648674964904785, "global_step": 45441, "epoch": 1081} {"train_loss": -5.708413124084473, "global_step": 45442, "epoch": 1081} {"train_loss": -5.691896325065976, "global_step": 45443, "epoch": 1081, "val_loss": 66099.96875} {"train_loss": -5.713738441467285, "global_step": 45444, "epoch": 1082} {"train_loss": -5.76898717880249, "global_step": 45445, "epoch": 1082} {"train_loss": -5.66628360748291, "global_step": 45446, "epoch": 1082} {"train_loss": -5.802923202514648, "global_step": 45447, "epoch": 1082} {"train_loss": -5.793120384216309, "global_step": 45448, "epoch": 1082} {"train_loss": -5.763155937194824, "global_step": 45449, "epoch": 1082} {"train_loss": -5.786840438842773, "global_step": 45450, "epoch": 1082} {"train_loss": -5.646418571472168, "global_step": 45451, "epoch": 1082} {"train_loss": -5.664509296417236, "global_step": 45452, "epoch": 1082} {"train_loss": -5.678351402282715, "global_step": 45453, "epoch": 1082} {"train_loss": -5.799615859985352, "global_step": 45454, "epoch": 1082} {"train_loss": -5.737419605255127, "global_step": 45455, "epoch": 1082} {"train_loss": -5.819921493530273, "global_step": 45456, "epoch": 1082} {"train_loss": -5.747528076171875, "global_step": 45457, "epoch": 1082} {"train_loss": -5.861544609069824, "global_step": 45458, "epoch": 1082} {"train_loss": -5.617498397827148, "global_step": 45459, "epoch": 1082} {"train_loss": -5.700052261352539, "global_step": 45460, "epoch": 1082} {"train_loss": -5.828178405761719, "global_step": 45461, "epoch": 1082} {"train_loss": -5.469746112823486, "global_step": 45462, "epoch": 1082} {"train_loss": -5.712000370025635, "global_step": 45463, "epoch": 1082} {"train_loss": -5.74625301361084, "global_step": 45464, "epoch": 1082} {"train_loss": -5.617856979370117, "global_step": 45465, "epoch": 1082} {"train_loss": -5.697880744934082, "global_step": 45466, "epoch": 1082} {"train_loss": -5.748299598693848, "global_step": 45467, "epoch": 1082} {"train_loss": -5.502571105957031, "global_step": 45468, "epoch": 1082} {"train_loss": -5.643017768859863, "global_step": 45469, "epoch": 1082} {"train_loss": -5.536102771759033, "global_step": 45470, "epoch": 1082} {"train_loss": -5.57089900970459, "global_step": 45471, "epoch": 1082} {"train_loss": -5.7859368324279785, "global_step": 45472, "epoch": 1082} {"train_loss": -5.466849327087402, "global_step": 45473, "epoch": 1082} {"train_loss": -5.593479156494141, "global_step": 45474, "epoch": 1082} {"train_loss": -5.562740325927734, "global_step": 45475, "epoch": 1082} {"train_loss": -5.639368057250977, "global_step": 45476, "epoch": 1082} {"train_loss": -5.626657485961914, "global_step": 45477, "epoch": 1082} {"train_loss": -5.575390815734863, "global_step": 45478, "epoch": 1082} {"train_loss": -5.71041202545166, "global_step": 45479, "epoch": 1082} {"train_loss": -5.736196041107178, "global_step": 45480, "epoch": 1082} {"train_loss": -5.820210933685303, "global_step": 45481, "epoch": 1082} {"train_loss": -5.666952610015869, "global_step": 45482, "epoch": 1082} {"train_loss": -5.608829498291016, "global_step": 45483, "epoch": 1082} {"train_loss": -5.5302910804748535, "global_step": 45484, "epoch": 1082} {"train_loss": -5.679775805700393, "global_step": 45485, "epoch": 1082, "val_loss": 66161.7578125} {"train_loss": -5.706607818603516, "global_step": 45486, "epoch": 1083} {"train_loss": -5.557539939880371, "global_step": 45487, "epoch": 1083} {"train_loss": -5.7719407081604, "global_step": 45488, "epoch": 1083} {"train_loss": -5.592276573181152, "global_step": 45489, "epoch": 1083} {"train_loss": -5.603798866271973, "global_step": 45490, "epoch": 1083} {"train_loss": -5.590579509735107, "global_step": 45491, "epoch": 1083} {"train_loss": -5.60994815826416, "global_step": 45492, "epoch": 1083} {"train_loss": -5.829301357269287, "global_step": 45493, "epoch": 1083} {"train_loss": -5.651473045349121, "global_step": 45494, "epoch": 1083} {"train_loss": -5.577513217926025, "global_step": 45495, "epoch": 1083} {"train_loss": -5.599981784820557, "global_step": 45496, "epoch": 1083} {"train_loss": -5.637266159057617, "global_step": 45497, "epoch": 1083} {"train_loss": -5.638059616088867, "global_step": 45498, "epoch": 1083} {"train_loss": -5.611757278442383, "global_step": 45499, "epoch": 1083} {"train_loss": -5.753931999206543, "global_step": 45500, "epoch": 1083} {"train_loss": -5.508186340332031, "global_step": 45501, "epoch": 1083} {"train_loss": -5.709620475769043, "global_step": 45502, "epoch": 1083} {"train_loss": -5.673277854919434, "global_step": 45503, "epoch": 1083} {"train_loss": -5.699767112731934, "global_step": 45504, "epoch": 1083} {"train_loss": -5.50371789932251, "global_step": 45505, "epoch": 1083} {"train_loss": -5.786654472351074, "global_step": 45506, "epoch": 1083} {"train_loss": -5.681697845458984, "global_step": 45507, "epoch": 1083} {"train_loss": -5.517608642578125, "global_step": 45508, "epoch": 1083} {"train_loss": -5.742565155029297, "global_step": 45509, "epoch": 1083} {"train_loss": -5.466252326965332, "global_step": 45510, "epoch": 1083} {"train_loss": -5.646034240722656, "global_step": 45511, "epoch": 1083} {"train_loss": -5.665921211242676, "global_step": 45512, "epoch": 1083} {"train_loss": -5.608903884887695, "global_step": 45513, "epoch": 1083} {"train_loss": -5.475893497467041, "global_step": 45514, "epoch": 1083} {"train_loss": -5.780760288238525, "global_step": 45515, "epoch": 1083} {"train_loss": -5.675944805145264, "global_step": 45516, "epoch": 1083} {"train_loss": -5.627019882202148, "global_step": 45517, "epoch": 1083} {"train_loss": -5.616155624389648, "global_step": 45518, "epoch": 1083} {"train_loss": -5.6613078117370605, "global_step": 45519, "epoch": 1083} {"train_loss": -5.630122184753418, "global_step": 45520, "epoch": 1083} {"train_loss": -5.708580017089844, "global_step": 45521, "epoch": 1083} {"train_loss": -5.669356822967529, "global_step": 45522, "epoch": 1083} {"train_loss": -5.674060821533203, "global_step": 45523, "epoch": 1083} {"train_loss": -5.573861122131348, "global_step": 45524, "epoch": 1083} {"train_loss": -5.600219249725342, "global_step": 45525, "epoch": 1083} {"train_loss": -5.476116180419922, "global_step": 45526, "epoch": 1083} {"train_loss": -5.636167889549618, "global_step": 45527, "epoch": 1083, "val_loss": 66486.2734375} {"train_loss": -5.519129753112793, "global_step": 45528, "epoch": 1084} {"train_loss": -5.658079624176025, "global_step": 45529, "epoch": 1084} {"train_loss": -5.783976078033447, "global_step": 45530, "epoch": 1084} {"train_loss": -5.558483123779297, "global_step": 45531, "epoch": 1084} {"train_loss": -5.5320634841918945, "global_step": 45532, "epoch": 1084} {"train_loss": -5.5775322914123535, "global_step": 45533, "epoch": 1084} {"train_loss": -5.651735305786133, "global_step": 45534, "epoch": 1084} {"train_loss": -5.7099833488464355, "global_step": 45535, "epoch": 1084} {"train_loss": -5.656704902648926, "global_step": 45536, "epoch": 1084} {"train_loss": -5.475133895874023, "global_step": 45537, "epoch": 1084} {"train_loss": -5.73831844329834, "global_step": 45538, "epoch": 1084} {"train_loss": -5.678526878356934, "global_step": 45539, "epoch": 1084} {"train_loss": -5.712004661560059, "global_step": 45540, "epoch": 1084} {"train_loss": -5.677095890045166, "global_step": 45541, "epoch": 1084} {"train_loss": -5.682185173034668, "global_step": 45542, "epoch": 1084} {"train_loss": -5.648982048034668, "global_step": 45543, "epoch": 1084} {"train_loss": -5.60288143157959, "global_step": 45544, "epoch": 1084} {"train_loss": -5.803294658660889, "global_step": 45545, "epoch": 1084} {"train_loss": -5.701348781585693, "global_step": 45546, "epoch": 1084} {"train_loss": -5.754931449890137, "global_step": 45547, "epoch": 1084} {"train_loss": -5.6755595207214355, "global_step": 45548, "epoch": 1084} {"train_loss": -5.7083659172058105, "global_step": 45549, "epoch": 1084} {"train_loss": -5.70089054107666, "global_step": 45550, "epoch": 1084} {"train_loss": -5.707015037536621, "global_step": 45551, "epoch": 1084} {"train_loss": -5.70540189743042, "global_step": 45552, "epoch": 1084} {"train_loss": -5.586650371551514, "global_step": 45553, "epoch": 1084} {"train_loss": -5.710582733154297, "global_step": 45554, "epoch": 1084} {"train_loss": -5.841022491455078, "global_step": 45555, "epoch": 1084} {"train_loss": -5.80492639541626, "global_step": 45556, "epoch": 1084} {"train_loss": -5.826199531555176, "global_step": 45557, "epoch": 1084} {"train_loss": -5.755277633666992, "global_step": 45558, "epoch": 1084} {"train_loss": -5.7381110191345215, "global_step": 45559, "epoch": 1084} {"train_loss": -5.811611175537109, "global_step": 45560, "epoch": 1084} {"train_loss": -5.665902614593506, "global_step": 45561, "epoch": 1084} {"train_loss": -5.759237766265869, "global_step": 45562, "epoch": 1084} {"train_loss": -5.684569358825684, "global_step": 45563, "epoch": 1084} {"train_loss": -5.634713649749756, "global_step": 45564, "epoch": 1084} {"train_loss": -5.640347480773926, "global_step": 45565, "epoch": 1084} {"train_loss": -5.7068586349487305, "global_step": 45566, "epoch": 1084} {"train_loss": -5.588067531585693, "global_step": 45567, "epoch": 1084} {"train_loss": -5.70020866394043, "global_step": 45568, "epoch": 1084} {"train_loss": -5.6872049286251976, "global_step": 45569, "epoch": 1084, "val_loss": 66062.09375} {"train_loss": -5.807356834411621, "global_step": 45570, "epoch": 1085} {"train_loss": -5.651968955993652, "global_step": 45571, "epoch": 1085} {"train_loss": -5.842562675476074, "global_step": 45572, "epoch": 1085} {"train_loss": -5.694730758666992, "global_step": 45573, "epoch": 1085} {"train_loss": -5.749988555908203, "global_step": 45574, "epoch": 1085} {"train_loss": -5.7340593338012695, "global_step": 45575, "epoch": 1085} {"train_loss": -5.882196426391602, "global_step": 45576, "epoch": 1085} {"train_loss": -5.568909645080566, "global_step": 45577, "epoch": 1085} {"train_loss": -5.716862678527832, "global_step": 45578, "epoch": 1085} {"train_loss": -5.650119304656982, "global_step": 45579, "epoch": 1085} {"train_loss": -5.672800064086914, "global_step": 45580, "epoch": 1085} {"train_loss": -5.750244617462158, "global_step": 45581, "epoch": 1085} {"train_loss": -5.599748134613037, "global_step": 45582, "epoch": 1085} {"train_loss": -5.655782699584961, "global_step": 45583, "epoch": 1085} {"train_loss": -5.7042036056518555, "global_step": 45584, "epoch": 1085} {"train_loss": -5.715713024139404, "global_step": 45585, "epoch": 1085} {"train_loss": -5.5798468589782715, "global_step": 45586, "epoch": 1085} {"train_loss": -5.696769714355469, "global_step": 45587, "epoch": 1085} {"train_loss": -5.630300045013428, "global_step": 45588, "epoch": 1085} {"train_loss": -5.694251537322998, "global_step": 45589, "epoch": 1085} {"train_loss": -5.712928771972656, "global_step": 45590, "epoch": 1085} {"train_loss": -5.760615348815918, "global_step": 45591, "epoch": 1085} {"train_loss": -5.696292877197266, "global_step": 45592, "epoch": 1085} {"train_loss": -5.667769432067871, "global_step": 45593, "epoch": 1085} {"train_loss": -5.718583106994629, "global_step": 45594, "epoch": 1085} {"train_loss": -5.748523712158203, "global_step": 45595, "epoch": 1085} {"train_loss": -5.776558876037598, "global_step": 45596, "epoch": 1085} {"train_loss": -5.748374938964844, "global_step": 45597, "epoch": 1085} {"train_loss": -5.672821998596191, "global_step": 45598, "epoch": 1085} {"train_loss": -5.662738800048828, "global_step": 45599, "epoch": 1085} {"train_loss": -5.677995681762695, "global_step": 45600, "epoch": 1085} {"train_loss": -5.642633438110352, "global_step": 45601, "epoch": 1085} {"train_loss": -5.740546226501465, "global_step": 45602, "epoch": 1085} {"train_loss": -5.649694919586182, "global_step": 45603, "epoch": 1085} {"train_loss": -5.733785152435303, "global_step": 45604, "epoch": 1085} {"train_loss": -5.677553176879883, "global_step": 45605, "epoch": 1085} {"train_loss": -5.522121429443359, "global_step": 45606, "epoch": 1085} {"train_loss": -5.792563438415527, "global_step": 45607, "epoch": 1085} {"train_loss": -5.723113536834717, "global_step": 45608, "epoch": 1085} {"train_loss": -5.677178382873535, "global_step": 45609, "epoch": 1085} {"train_loss": -5.697565078735352, "global_step": 45610, "epoch": 1085} {"train_loss": -5.697979416166033, "global_step": 45611, "epoch": 1085, "val_loss": 66361.375} {"train_loss": -5.651543617248535, "global_step": 45612, "epoch": 1086} {"train_loss": -5.6730146408081055, "global_step": 45613, "epoch": 1086} {"train_loss": -5.692163467407227, "global_step": 45614, "epoch": 1086} {"train_loss": -5.696532249450684, "global_step": 45615, "epoch": 1086} {"train_loss": -5.837884902954102, "global_step": 45616, "epoch": 1086} {"train_loss": -5.8615522384643555, "global_step": 45617, "epoch": 1086} {"train_loss": -5.7064738273620605, "global_step": 45618, "epoch": 1086} {"train_loss": -5.6774492263793945, "global_step": 45619, "epoch": 1086} {"train_loss": -5.837400436401367, "global_step": 45620, "epoch": 1086} {"train_loss": -5.7497239112854, "global_step": 45621, "epoch": 1086} {"train_loss": -5.824859619140625, "global_step": 45622, "epoch": 1086} {"train_loss": -5.626091003417969, "global_step": 45623, "epoch": 1086} {"train_loss": -5.837531089782715, "global_step": 45624, "epoch": 1086} {"train_loss": -5.686450004577637, "global_step": 45625, "epoch": 1086} {"train_loss": -5.8138837814331055, "global_step": 45626, "epoch": 1086} {"train_loss": -5.779130935668945, "global_step": 45627, "epoch": 1086} {"train_loss": -5.832386016845703, "global_step": 45628, "epoch": 1086} {"train_loss": -5.8561296463012695, "global_step": 45629, "epoch": 1086} {"train_loss": -5.706543445587158, "global_step": 45630, "epoch": 1086} {"train_loss": -5.729430198669434, "global_step": 45631, "epoch": 1086} {"train_loss": -5.700968265533447, "global_step": 45632, "epoch": 1086} {"train_loss": -5.697228908538818, "global_step": 45633, "epoch": 1086} {"train_loss": -5.72825813293457, "global_step": 45634, "epoch": 1086} {"train_loss": -5.7604570388793945, "global_step": 45635, "epoch": 1086} {"train_loss": -5.670347213745117, "global_step": 45636, "epoch": 1086} {"train_loss": -5.552363395690918, "global_step": 45637, "epoch": 1086} {"train_loss": -5.7433881759643555, "global_step": 45638, "epoch": 1086} {"train_loss": -5.730936527252197, "global_step": 45639, "epoch": 1086} {"train_loss": -5.701924800872803, "global_step": 45640, "epoch": 1086} {"train_loss": -5.654683589935303, "global_step": 45641, "epoch": 1086} {"train_loss": -5.65318489074707, "global_step": 45642, "epoch": 1086} {"train_loss": -5.630444526672363, "global_step": 45643, "epoch": 1086} {"train_loss": -5.774224281311035, "global_step": 45644, "epoch": 1086} {"train_loss": -5.596399307250977, "global_step": 45645, "epoch": 1086} {"train_loss": -5.723294258117676, "global_step": 45646, "epoch": 1086} {"train_loss": -5.8325042724609375, "global_step": 45647, "epoch": 1086} {"train_loss": -5.5799031257629395, "global_step": 45648, "epoch": 1086} {"train_loss": -5.809345245361328, "global_step": 45649, "epoch": 1086} {"train_loss": -5.7682600021362305, "global_step": 45650, "epoch": 1086} {"train_loss": -5.74359655380249, "global_step": 45651, "epoch": 1086} {"train_loss": -5.710458278656006, "global_step": 45652, "epoch": 1086} {"train_loss": -5.726023571831839, "global_step": 45653, "epoch": 1086, "val_loss": 66470.171875} {"train_loss": -5.657061576843262, "global_step": 45654, "epoch": 1087} {"train_loss": -5.793943405151367, "global_step": 45655, "epoch": 1087} {"train_loss": -5.747498035430908, "global_step": 45656, "epoch": 1087} {"train_loss": -5.701058387756348, "global_step": 45657, "epoch": 1087} {"train_loss": -5.754276275634766, "global_step": 45658, "epoch": 1087} {"train_loss": -5.6671624183654785, "global_step": 45659, "epoch": 1087} {"train_loss": -5.769411087036133, "global_step": 45660, "epoch": 1087} {"train_loss": -5.673518180847168, "global_step": 45661, "epoch": 1087} {"train_loss": -5.661240100860596, "global_step": 45662, "epoch": 1087} {"train_loss": -5.558518409729004, "global_step": 45663, "epoch": 1087} {"train_loss": -5.81134033203125, "global_step": 45664, "epoch": 1087} {"train_loss": -5.927453994750977, "global_step": 45665, "epoch": 1087} {"train_loss": -5.855969429016113, "global_step": 45666, "epoch": 1087} {"train_loss": -5.653400421142578, "global_step": 45667, "epoch": 1087} {"train_loss": -5.600474834442139, "global_step": 45668, "epoch": 1087} {"train_loss": -5.610506057739258, "global_step": 45669, "epoch": 1087} {"train_loss": -5.6903605461120605, "global_step": 45670, "epoch": 1087} {"train_loss": -5.667129039764404, "global_step": 45671, "epoch": 1087} {"train_loss": -5.6942973136901855, "global_step": 45672, "epoch": 1087} {"train_loss": -5.742094993591309, "global_step": 45673, "epoch": 1087} {"train_loss": -5.72349739074707, "global_step": 45674, "epoch": 1087} {"train_loss": -5.705685138702393, "global_step": 45675, "epoch": 1087} {"train_loss": -5.659867286682129, "global_step": 45676, "epoch": 1087} {"train_loss": -5.767156600952148, "global_step": 45677, "epoch": 1087} {"train_loss": -5.639508247375488, "global_step": 45678, "epoch": 1087} {"train_loss": -5.729183197021484, "global_step": 45679, "epoch": 1087} {"train_loss": -5.713936805725098, "global_step": 45680, "epoch": 1087} {"train_loss": -5.755618572235107, "global_step": 45681, "epoch": 1087} {"train_loss": -5.540137767791748, "global_step": 45682, "epoch": 1087} {"train_loss": -5.7134599685668945, "global_step": 45683, "epoch": 1087} {"train_loss": -5.698760509490967, "global_step": 45684, "epoch": 1087} {"train_loss": -5.774744033813477, "global_step": 45685, "epoch": 1087} {"train_loss": -5.637964725494385, "global_step": 45686, "epoch": 1087} {"train_loss": -5.704275608062744, "global_step": 45687, "epoch": 1087} {"train_loss": -5.558694362640381, "global_step": 45688, "epoch": 1087} {"train_loss": -5.625980377197266, "global_step": 45689, "epoch": 1087} {"train_loss": -5.72002649307251, "global_step": 45690, "epoch": 1087} {"train_loss": -5.575644493103027, "global_step": 45691, "epoch": 1087} {"train_loss": -5.692870140075684, "global_step": 45692, "epoch": 1087} {"train_loss": -5.721684455871582, "global_step": 45693, "epoch": 1087} {"train_loss": -5.726422309875488, "global_step": 45694, "epoch": 1087} {"train_loss": -5.693816139584496, "global_step": 45695, "epoch": 1087, "val_loss": 66046.640625} {"train_loss": -5.678527355194092, "global_step": 45696, "epoch": 1088} {"train_loss": -5.702661514282227, "global_step": 45697, "epoch": 1088} {"train_loss": -5.72031831741333, "global_step": 45698, "epoch": 1088} {"train_loss": -5.710616111755371, "global_step": 45699, "epoch": 1088} {"train_loss": -5.699217796325684, "global_step": 45700, "epoch": 1088} {"train_loss": -5.744428634643555, "global_step": 45701, "epoch": 1088} {"train_loss": -5.720775604248047, "global_step": 45702, "epoch": 1088} {"train_loss": -5.5960774421691895, "global_step": 45703, "epoch": 1088} {"train_loss": -5.647736549377441, "global_step": 45704, "epoch": 1088} {"train_loss": -5.563979148864746, "global_step": 45705, "epoch": 1088} {"train_loss": -5.5902180671691895, "global_step": 45706, "epoch": 1088} {"train_loss": -5.777939796447754, "global_step": 45707, "epoch": 1088} {"train_loss": -5.642868518829346, "global_step": 45708, "epoch": 1088} {"train_loss": -5.739779472351074, "global_step": 45709, "epoch": 1088} {"train_loss": -5.576440811157227, "global_step": 45710, "epoch": 1088} {"train_loss": -5.803620338439941, "global_step": 45711, "epoch": 1088} {"train_loss": -5.794881343841553, "global_step": 45712, "epoch": 1088} {"train_loss": -5.621938705444336, "global_step": 45713, "epoch": 1088} {"train_loss": -5.767838001251221, "global_step": 45714, "epoch": 1088} {"train_loss": -5.737026691436768, "global_step": 45715, "epoch": 1088} {"train_loss": -5.75577449798584, "global_step": 45716, "epoch": 1088} {"train_loss": -5.72597599029541, "global_step": 45717, "epoch": 1088} {"train_loss": -5.631403923034668, "global_step": 45718, "epoch": 1088} {"train_loss": -5.871702671051025, "global_step": 45719, "epoch": 1088} {"train_loss": -5.748673915863037, "global_step": 45720, "epoch": 1088} {"train_loss": -5.6534013748168945, "global_step": 45721, "epoch": 1088} {"train_loss": -5.715212821960449, "global_step": 45722, "epoch": 1088} {"train_loss": -5.694587707519531, "global_step": 45723, "epoch": 1088} {"train_loss": -5.57136344909668, "global_step": 45724, "epoch": 1088} {"train_loss": -5.593929290771484, "global_step": 45725, "epoch": 1088} {"train_loss": -5.7768402099609375, "global_step": 45726, "epoch": 1088} {"train_loss": -5.849705219268799, "global_step": 45727, "epoch": 1088} {"train_loss": -5.6941986083984375, "global_step": 45728, "epoch": 1088} {"train_loss": -5.685977935791016, "global_step": 45729, "epoch": 1088} {"train_loss": -5.670543670654297, "global_step": 45730, "epoch": 1088} {"train_loss": -5.6830949783325195, "global_step": 45731, "epoch": 1088} {"train_loss": -5.667893409729004, "global_step": 45732, "epoch": 1088} {"train_loss": -5.793087959289551, "global_step": 45733, "epoch": 1088} {"train_loss": -5.651764869689941, "global_step": 45734, "epoch": 1088} {"train_loss": -5.530810356140137, "global_step": 45735, "epoch": 1088} {"train_loss": -5.793475151062012, "global_step": 45736, "epoch": 1088} {"train_loss": -5.694690624872844, "global_step": 45737, "epoch": 1088, "val_loss": 66063.9453125} {"train_loss": -5.833008766174316, "global_step": 45738, "epoch": 1089} {"train_loss": -5.611541748046875, "global_step": 45739, "epoch": 1089} {"train_loss": -5.728512287139893, "global_step": 45740, "epoch": 1089} {"train_loss": -5.801957130432129, "global_step": 45741, "epoch": 1089} {"train_loss": -5.628757953643799, "global_step": 45742, "epoch": 1089} {"train_loss": -5.676945686340332, "global_step": 45743, "epoch": 1089} {"train_loss": -5.604875564575195, "global_step": 45744, "epoch": 1089} {"train_loss": -5.813169002532959, "global_step": 45745, "epoch": 1089} {"train_loss": -5.753012657165527, "global_step": 45746, "epoch": 1089} {"train_loss": -5.735638618469238, "global_step": 45747, "epoch": 1089} {"train_loss": -5.787501335144043, "global_step": 45748, "epoch": 1089} {"train_loss": -5.815024375915527, "global_step": 45749, "epoch": 1089} {"train_loss": -5.787930488586426, "global_step": 45750, "epoch": 1089} {"train_loss": -5.812226295471191, "global_step": 45751, "epoch": 1089} {"train_loss": -5.675365447998047, "global_step": 45752, "epoch": 1089} {"train_loss": -5.677096843719482, "global_step": 45753, "epoch": 1089} {"train_loss": -5.546536445617676, "global_step": 45754, "epoch": 1089} {"train_loss": -5.608489513397217, "global_step": 45755, "epoch": 1089} {"train_loss": -5.720987319946289, "global_step": 45756, "epoch": 1089} {"train_loss": -5.60848331451416, "global_step": 45757, "epoch": 1089} {"train_loss": -5.80792236328125, "global_step": 45758, "epoch": 1089} {"train_loss": -5.7823920249938965, "global_step": 45759, "epoch": 1089} {"train_loss": -5.597307205200195, "global_step": 45760, "epoch": 1089} {"train_loss": -5.739792823791504, "global_step": 45761, "epoch": 1089} {"train_loss": -5.432930946350098, "global_step": 45762, "epoch": 1089} {"train_loss": -5.521434307098389, "global_step": 45763, "epoch": 1089} {"train_loss": -5.6059112548828125, "global_step": 45764, "epoch": 1089} {"train_loss": -5.484784126281738, "global_step": 45765, "epoch": 1089} {"train_loss": -5.743452072143555, "global_step": 45766, "epoch": 1089} {"train_loss": -5.6275954246521, "global_step": 45767, "epoch": 1089} {"train_loss": -5.763214111328125, "global_step": 45768, "epoch": 1089} {"train_loss": -5.644561767578125, "global_step": 45769, "epoch": 1089} {"train_loss": -5.749240398406982, "global_step": 45770, "epoch": 1089} {"train_loss": -5.629100322723389, "global_step": 45771, "epoch": 1089} {"train_loss": -5.694470405578613, "global_step": 45772, "epoch": 1089} {"train_loss": -5.667374610900879, "global_step": 45773, "epoch": 1089} {"train_loss": -5.63827657699585, "global_step": 45774, "epoch": 1089} {"train_loss": -5.742273330688477, "global_step": 45775, "epoch": 1089} {"train_loss": -5.840572834014893, "global_step": 45776, "epoch": 1089} {"train_loss": -5.835145950317383, "global_step": 45777, "epoch": 1089} {"train_loss": -5.73493766784668, "global_step": 45778, "epoch": 1089} {"train_loss": -5.693679616564796, "global_step": 45779, "epoch": 1089, "val_loss": 66216.9453125} {"train_loss": -5.823984146118164, "global_step": 45780, "epoch": 1090} {"train_loss": -5.650908946990967, "global_step": 45781, "epoch": 1090} {"train_loss": -5.59820556640625, "global_step": 45782, "epoch": 1090} {"train_loss": -5.6954145431518555, "global_step": 45783, "epoch": 1090} {"train_loss": -5.662505149841309, "global_step": 45784, "epoch": 1090} {"train_loss": -5.63627290725708, "global_step": 45785, "epoch": 1090} {"train_loss": -5.824726104736328, "global_step": 45786, "epoch": 1090} {"train_loss": -5.607161045074463, "global_step": 45787, "epoch": 1090} {"train_loss": -5.721758842468262, "global_step": 45788, "epoch": 1090} {"train_loss": -5.814203262329102, "global_step": 45789, "epoch": 1090} {"train_loss": -5.580881595611572, "global_step": 45790, "epoch": 1090} {"train_loss": -5.724776268005371, "global_step": 45791, "epoch": 1090} {"train_loss": -5.765419006347656, "global_step": 45792, "epoch": 1090} {"train_loss": -5.798772811889648, "global_step": 45793, "epoch": 1090} {"train_loss": -5.566833972930908, "global_step": 45794, "epoch": 1090} {"train_loss": -5.787070274353027, "global_step": 45795, "epoch": 1090} {"train_loss": -5.852746963500977, "global_step": 45796, "epoch": 1090} {"train_loss": -5.536876678466797, "global_step": 45797, "epoch": 1090} {"train_loss": -5.686902046203613, "global_step": 45798, "epoch": 1090} {"train_loss": -5.8621907234191895, "global_step": 45799, "epoch": 1090} {"train_loss": -5.564266204833984, "global_step": 45800, "epoch": 1090} {"train_loss": -5.73090124130249, "global_step": 45801, "epoch": 1090} {"train_loss": -5.764154434204102, "global_step": 45802, "epoch": 1090} {"train_loss": -5.686775207519531, "global_step": 45803, "epoch": 1090} {"train_loss": -5.611934661865234, "global_step": 45804, "epoch": 1090} {"train_loss": -5.836663722991943, "global_step": 45805, "epoch": 1090} {"train_loss": -5.771121978759766, "global_step": 45806, "epoch": 1090} {"train_loss": -5.734617233276367, "global_step": 45807, "epoch": 1090} {"train_loss": -5.704505920410156, "global_step": 45808, "epoch": 1090} {"train_loss": -5.724617004394531, "global_step": 45809, "epoch": 1090} {"train_loss": -5.7260026931762695, "global_step": 45810, "epoch": 1090} {"train_loss": -5.692943096160889, "global_step": 45811, "epoch": 1090} {"train_loss": -5.6452484130859375, "global_step": 45812, "epoch": 1090} {"train_loss": -5.75372838973999, "global_step": 45813, "epoch": 1090} {"train_loss": -5.724977970123291, "global_step": 45814, "epoch": 1090} {"train_loss": -5.802524566650391, "global_step": 45815, "epoch": 1090} {"train_loss": -5.742717742919922, "global_step": 45816, "epoch": 1090} {"train_loss": -5.666484832763672, "global_step": 45817, "epoch": 1090} {"train_loss": -5.630724906921387, "global_step": 45818, "epoch": 1090} {"train_loss": -5.715007305145264, "global_step": 45819, "epoch": 1090} {"train_loss": -5.605717182159424, "global_step": 45820, "epoch": 1090} {"train_loss": -5.710729496819632, "global_step": 45821, "epoch": 1090, "val_loss": 66003.5546875} {"train_loss": -5.647409915924072, "global_step": 45822, "epoch": 1091} {"train_loss": -5.7559099197387695, "global_step": 45823, "epoch": 1091} {"train_loss": -5.571023464202881, "global_step": 45824, "epoch": 1091} {"train_loss": -5.770596504211426, "global_step": 45825, "epoch": 1091} {"train_loss": -5.586118221282959, "global_step": 45826, "epoch": 1091} {"train_loss": -5.70165491104126, "global_step": 45827, "epoch": 1091} {"train_loss": -5.628584861755371, "global_step": 45828, "epoch": 1091} {"train_loss": -5.60589599609375, "global_step": 45829, "epoch": 1091} {"train_loss": -5.617547035217285, "global_step": 45830, "epoch": 1091} {"train_loss": -5.641904354095459, "global_step": 45831, "epoch": 1091} {"train_loss": -5.670879364013672, "global_step": 45832, "epoch": 1091} {"train_loss": -5.5518646240234375, "global_step": 45833, "epoch": 1091} {"train_loss": -5.713711738586426, "global_step": 45834, "epoch": 1091} {"train_loss": -5.491276741027832, "global_step": 45835, "epoch": 1091} {"train_loss": -5.779849052429199, "global_step": 45836, "epoch": 1091} {"train_loss": -5.657472610473633, "global_step": 45837, "epoch": 1091} {"train_loss": -5.5336809158325195, "global_step": 45838, "epoch": 1091} {"train_loss": -5.619607448577881, "global_step": 45839, "epoch": 1091} {"train_loss": -5.608128547668457, "global_step": 45840, "epoch": 1091} {"train_loss": -5.61052942276001, "global_step": 45841, "epoch": 1091} {"train_loss": -5.734094619750977, "global_step": 45842, "epoch": 1091} {"train_loss": -5.595696449279785, "global_step": 45843, "epoch": 1091} {"train_loss": -5.720834732055664, "global_step": 45844, "epoch": 1091} {"train_loss": -5.6573944091796875, "global_step": 45845, "epoch": 1091} {"train_loss": -5.615342617034912, "global_step": 45846, "epoch": 1091} {"train_loss": -5.648515224456787, "global_step": 45847, "epoch": 1091} {"train_loss": -5.557880878448486, "global_step": 45848, "epoch": 1091} {"train_loss": -5.682161331176758, "global_step": 45849, "epoch": 1091} {"train_loss": -5.611072063446045, "global_step": 45850, "epoch": 1091} {"train_loss": -5.66140604019165, "global_step": 45851, "epoch": 1091} {"train_loss": -5.705551624298096, "global_step": 45852, "epoch": 1091} {"train_loss": -5.56233024597168, "global_step": 45853, "epoch": 1091} {"train_loss": -5.693608283996582, "global_step": 45854, "epoch": 1091} {"train_loss": -5.556687831878662, "global_step": 45855, "epoch": 1091} {"train_loss": -5.716156959533691, "global_step": 45856, "epoch": 1091} {"train_loss": -5.6839399337768555, "global_step": 45857, "epoch": 1091} {"train_loss": -5.653223037719727, "global_step": 45858, "epoch": 1091} {"train_loss": -5.679305076599121, "global_step": 45859, "epoch": 1091} {"train_loss": -5.653895378112793, "global_step": 45860, "epoch": 1091} {"train_loss": -5.794189453125, "global_step": 45861, "epoch": 1091} {"train_loss": -5.541624546051025, "global_step": 45862, "epoch": 1091} {"train_loss": -5.65038259824117, "global_step": 45863, "epoch": 1091, "val_loss": 66762.75} {"train_loss": -5.580615520477295, "global_step": 45864, "epoch": 1092} {"train_loss": -5.820305824279785, "global_step": 45865, "epoch": 1092} {"train_loss": -5.6414384841918945, "global_step": 45866, "epoch": 1092} {"train_loss": -5.648397922515869, "global_step": 45867, "epoch": 1092} {"train_loss": -5.745135307312012, "global_step": 45868, "epoch": 1092} {"train_loss": -5.614304542541504, "global_step": 45869, "epoch": 1092} {"train_loss": -5.798636436462402, "global_step": 45870, "epoch": 1092} {"train_loss": -5.650700569152832, "global_step": 45871, "epoch": 1092} {"train_loss": -5.631756782531738, "global_step": 45872, "epoch": 1092} {"train_loss": -5.57081937789917, "global_step": 45873, "epoch": 1092} {"train_loss": -5.629948139190674, "global_step": 45874, "epoch": 1092} {"train_loss": -5.724313259124756, "global_step": 45875, "epoch": 1092} {"train_loss": -5.753909587860107, "global_step": 45876, "epoch": 1092} {"train_loss": -5.678957462310791, "global_step": 45877, "epoch": 1092} {"train_loss": -5.696634292602539, "global_step": 45878, "epoch": 1092} {"train_loss": -5.837142467498779, "global_step": 45879, "epoch": 1092} {"train_loss": -5.797696113586426, "global_step": 45880, "epoch": 1092} {"train_loss": -5.787684917449951, "global_step": 45881, "epoch": 1092} {"train_loss": -5.750530242919922, "global_step": 45882, "epoch": 1092} {"train_loss": -5.804723262786865, "global_step": 45883, "epoch": 1092} {"train_loss": -5.611907958984375, "global_step": 45884, "epoch": 1092} {"train_loss": -5.658411026000977, "global_step": 45885, "epoch": 1092} {"train_loss": -5.732779502868652, "global_step": 45886, "epoch": 1092} {"train_loss": -5.560683250427246, "global_step": 45887, "epoch": 1092} {"train_loss": -5.666165351867676, "global_step": 45888, "epoch": 1092} {"train_loss": -5.712615013122559, "global_step": 45889, "epoch": 1092} {"train_loss": -5.725316047668457, "global_step": 45890, "epoch": 1092} {"train_loss": -5.766345977783203, "global_step": 45891, "epoch": 1092} {"train_loss": -5.764679431915283, "global_step": 45892, "epoch": 1092} {"train_loss": -5.797006607055664, "global_step": 45893, "epoch": 1092} {"train_loss": -5.667506217956543, "global_step": 45894, "epoch": 1092} {"train_loss": -5.792721748352051, "global_step": 45895, "epoch": 1092} {"train_loss": -5.6431684494018555, "global_step": 45896, "epoch": 1092} {"train_loss": -5.690718650817871, "global_step": 45897, "epoch": 1092} {"train_loss": -5.692221641540527, "global_step": 45898, "epoch": 1092} {"train_loss": -5.518599510192871, "global_step": 45899, "epoch": 1092} {"train_loss": -5.7780561447143555, "global_step": 45900, "epoch": 1092} {"train_loss": -5.559123992919922, "global_step": 45901, "epoch": 1092} {"train_loss": -5.699979305267334, "global_step": 45902, "epoch": 1092} {"train_loss": -5.631639003753662, "global_step": 45903, "epoch": 1092} {"train_loss": -5.6458940505981445, "global_step": 45904, "epoch": 1092} {"train_loss": -5.695947919573102, "global_step": 45905, "epoch": 1092, "val_loss": 66347.578125} {"train_loss": -5.741144180297852, "global_step": 45906, "epoch": 1093} {"train_loss": -5.728149890899658, "global_step": 45907, "epoch": 1093} {"train_loss": -5.9105377197265625, "global_step": 45908, "epoch": 1093} {"train_loss": -5.718577861785889, "global_step": 45909, "epoch": 1093} {"train_loss": -5.741715431213379, "global_step": 45910, "epoch": 1093} {"train_loss": -5.694668292999268, "global_step": 45911, "epoch": 1093} {"train_loss": -5.63261079788208, "global_step": 45912, "epoch": 1093} {"train_loss": -5.700418949127197, "global_step": 45913, "epoch": 1093} {"train_loss": -5.598728179931641, "global_step": 45914, "epoch": 1093} {"train_loss": -5.676693916320801, "global_step": 45915, "epoch": 1093} {"train_loss": -5.677933692932129, "global_step": 45916, "epoch": 1093} {"train_loss": -5.781439304351807, "global_step": 45917, "epoch": 1093} {"train_loss": -5.808689594268799, "global_step": 45918, "epoch": 1093} {"train_loss": -5.631442070007324, "global_step": 45919, "epoch": 1093} {"train_loss": -5.750900745391846, "global_step": 45920, "epoch": 1093} {"train_loss": -5.646004676818848, "global_step": 45921, "epoch": 1093} {"train_loss": -5.758077621459961, "global_step": 45922, "epoch": 1093} {"train_loss": -5.597576141357422, "global_step": 45923, "epoch": 1093} {"train_loss": -5.549400329589844, "global_step": 45924, "epoch": 1093} {"train_loss": -5.664331912994385, "global_step": 45925, "epoch": 1093} {"train_loss": -5.559609413146973, "global_step": 45926, "epoch": 1093} {"train_loss": -5.555521011352539, "global_step": 45927, "epoch": 1093} {"train_loss": -5.743087291717529, "global_step": 45928, "epoch": 1093} {"train_loss": -5.720763683319092, "global_step": 45929, "epoch": 1093} {"train_loss": -5.705036163330078, "global_step": 45930, "epoch": 1093} {"train_loss": -5.638392448425293, "global_step": 45931, "epoch": 1093} {"train_loss": -5.6170430183410645, "global_step": 45932, "epoch": 1093} {"train_loss": -5.726629257202148, "global_step": 45933, "epoch": 1093} {"train_loss": -5.745403289794922, "global_step": 45934, "epoch": 1093} {"train_loss": -5.791264533996582, "global_step": 45935, "epoch": 1093} {"train_loss": -5.80332088470459, "global_step": 45936, "epoch": 1093} {"train_loss": -5.726783275604248, "global_step": 45937, "epoch": 1093} {"train_loss": -5.843810081481934, "global_step": 45938, "epoch": 1093} {"train_loss": -5.663417339324951, "global_step": 45939, "epoch": 1093} {"train_loss": -5.722068786621094, "global_step": 45940, "epoch": 1093} {"train_loss": -5.667391777038574, "global_step": 45941, "epoch": 1093} {"train_loss": -5.663138389587402, "global_step": 45942, "epoch": 1093} {"train_loss": -5.6208882331848145, "global_step": 45943, "epoch": 1093} {"train_loss": -5.734894752502441, "global_step": 45944, "epoch": 1093} {"train_loss": -5.793241500854492, "global_step": 45945, "epoch": 1093} {"train_loss": -5.7562689781188965, "global_step": 45946, "epoch": 1093} {"train_loss": -5.702007282347906, "global_step": 45947, "epoch": 1093, "val_loss": 66040.8359375} {"train_loss": -5.8350396156311035, "global_step": 45948, "epoch": 1094} {"train_loss": -5.711367607116699, "global_step": 45949, "epoch": 1094} {"train_loss": -5.774237632751465, "global_step": 45950, "epoch": 1094} {"train_loss": -5.743997097015381, "global_step": 45951, "epoch": 1094} {"train_loss": -5.8602142333984375, "global_step": 45952, "epoch": 1094} {"train_loss": -5.8263444900512695, "global_step": 45953, "epoch": 1094} {"train_loss": -5.684159278869629, "global_step": 45954, "epoch": 1094} {"train_loss": -5.7980241775512695, "global_step": 45955, "epoch": 1094} {"train_loss": -5.7681379318237305, "global_step": 45956, "epoch": 1094} {"train_loss": -5.791408061981201, "global_step": 45957, "epoch": 1094} {"train_loss": -5.687029838562012, "global_step": 45958, "epoch": 1094} {"train_loss": -5.757462024688721, "global_step": 45959, "epoch": 1094} {"train_loss": -5.685342788696289, "global_step": 45960, "epoch": 1094} {"train_loss": -5.7154035568237305, "global_step": 45961, "epoch": 1094} {"train_loss": -5.654413223266602, "global_step": 45962, "epoch": 1094} {"train_loss": -5.695677280426025, "global_step": 45963, "epoch": 1094} {"train_loss": -5.6874918937683105, "global_step": 45964, "epoch": 1094} {"train_loss": -5.63468599319458, "global_step": 45965, "epoch": 1094} {"train_loss": -5.698166370391846, "global_step": 45966, "epoch": 1094} {"train_loss": -5.7240309715271, "global_step": 45967, "epoch": 1094} {"train_loss": -5.642082214355469, "global_step": 45968, "epoch": 1094} {"train_loss": -5.795828342437744, "global_step": 45969, "epoch": 1094} {"train_loss": -5.604013919830322, "global_step": 45970, "epoch": 1094} {"train_loss": -5.69720458984375, "global_step": 45971, "epoch": 1094} {"train_loss": -5.754118919372559, "global_step": 45972, "epoch": 1094} {"train_loss": -5.605159282684326, "global_step": 45973, "epoch": 1094} {"train_loss": -5.7528910636901855, "global_step": 45974, "epoch": 1094} {"train_loss": -5.56594705581665, "global_step": 45975, "epoch": 1094} {"train_loss": -5.661262512207031, "global_step": 45976, "epoch": 1094} {"train_loss": -5.740212440490723, "global_step": 45977, "epoch": 1094} {"train_loss": -5.767061710357666, "global_step": 45978, "epoch": 1094} {"train_loss": -5.652561187744141, "global_step": 45979, "epoch": 1094} {"train_loss": -5.778580665588379, "global_step": 45980, "epoch": 1094} {"train_loss": -5.609535217285156, "global_step": 45981, "epoch": 1094} {"train_loss": -5.682619571685791, "global_step": 45982, "epoch": 1094} {"train_loss": -5.707102298736572, "global_step": 45983, "epoch": 1094} {"train_loss": -5.821739673614502, "global_step": 45984, "epoch": 1094} {"train_loss": -5.677921772003174, "global_step": 45985, "epoch": 1094} {"train_loss": -5.78950834274292, "global_step": 45986, "epoch": 1094} {"train_loss": -5.755044937133789, "global_step": 45987, "epoch": 1094} {"train_loss": -5.673709869384766, "global_step": 45988, "epoch": 1094} {"train_loss": -5.718032496316092, "global_step": 45989, "epoch": 1094, "val_loss": 66092.1875} {"train_loss": -5.825965881347656, "global_step": 45990, "epoch": 1095} {"train_loss": -5.658451080322266, "global_step": 45991, "epoch": 1095} {"train_loss": -5.829526901245117, "global_step": 45992, "epoch": 1095} {"train_loss": -5.74532413482666, "global_step": 45993, "epoch": 1095} {"train_loss": -5.754701614379883, "global_step": 45994, "epoch": 1095} {"train_loss": -5.920113563537598, "global_step": 45995, "epoch": 1095} {"train_loss": -5.688879013061523, "global_step": 45996, "epoch": 1095} {"train_loss": -5.691869258880615, "global_step": 45997, "epoch": 1095} {"train_loss": -5.5694780349731445, "global_step": 45998, "epoch": 1095} {"train_loss": -5.671906471252441, "global_step": 45999, "epoch": 1095} {"train_loss": -5.648182392120361, "global_step": 46000, "epoch": 1095} {"train_loss": -5.653696060180664, "global_step": 46001, "epoch": 1095} {"train_loss": -5.733173370361328, "global_step": 46002, "epoch": 1095} {"train_loss": -5.698462963104248, "global_step": 46003, "epoch": 1095} {"train_loss": -5.754148006439209, "global_step": 46004, "epoch": 1095} {"train_loss": -5.604097366333008, "global_step": 46005, "epoch": 1095} {"train_loss": -5.731794357299805, "global_step": 46006, "epoch": 1095} {"train_loss": -5.550434112548828, "global_step": 46007, "epoch": 1095} {"train_loss": -5.694940567016602, "global_step": 46008, "epoch": 1095} {"train_loss": -5.795044898986816, "global_step": 46009, "epoch": 1095} {"train_loss": -5.685473442077637, "global_step": 46010, "epoch": 1095} {"train_loss": -5.671369552612305, "global_step": 46011, "epoch": 1095} {"train_loss": -5.6109161376953125, "global_step": 46012, "epoch": 1095} {"train_loss": -5.685024261474609, "global_step": 46013, "epoch": 1095} {"train_loss": -5.6997456550598145, "global_step": 46014, "epoch": 1095} {"train_loss": -5.667116165161133, "global_step": 46015, "epoch": 1095} {"train_loss": -5.84332799911499, "global_step": 46016, "epoch": 1095} {"train_loss": -5.6045331954956055, "global_step": 46017, "epoch": 1095} {"train_loss": -5.704802989959717, "global_step": 46018, "epoch": 1095} {"train_loss": -5.71694278717041, "global_step": 46019, "epoch": 1095} {"train_loss": -5.758544921875, "global_step": 46020, "epoch": 1095} {"train_loss": -5.6600141525268555, "global_step": 46021, "epoch": 1095} {"train_loss": -5.690972328186035, "global_step": 46022, "epoch": 1095} {"train_loss": -5.720226287841797, "global_step": 46023, "epoch": 1095} {"train_loss": -5.752307415008545, "global_step": 46024, "epoch": 1095} {"train_loss": -5.7261834144592285, "global_step": 46025, "epoch": 1095} {"train_loss": -5.757040023803711, "global_step": 46026, "epoch": 1095} {"train_loss": -5.657100677490234, "global_step": 46027, "epoch": 1095} {"train_loss": -5.700130462646484, "global_step": 46028, "epoch": 1095} {"train_loss": -5.805201530456543, "global_step": 46029, "epoch": 1095} {"train_loss": -5.71442174911499, "global_step": 46030, "epoch": 1095} {"train_loss": -5.709250098183041, "global_step": 46031, "epoch": 1095, "val_loss": 66100.7890625} {"train_loss": -5.7095441818237305, "global_step": 46032, "epoch": 1096} {"train_loss": -5.690304756164551, "global_step": 46033, "epoch": 1096} {"train_loss": -5.6754150390625, "global_step": 46034, "epoch": 1096} {"train_loss": -5.679961204528809, "global_step": 46035, "epoch": 1096} {"train_loss": -5.798303127288818, "global_step": 46036, "epoch": 1096} {"train_loss": -5.744332790374756, "global_step": 46037, "epoch": 1096} {"train_loss": -5.5969953536987305, "global_step": 46038, "epoch": 1096} {"train_loss": -5.7475996017456055, "global_step": 46039, "epoch": 1096} {"train_loss": -5.68013858795166, "global_step": 46040, "epoch": 1096} {"train_loss": -5.571513652801514, "global_step": 46041, "epoch": 1096} {"train_loss": -5.693604469299316, "global_step": 46042, "epoch": 1096} {"train_loss": -5.838156700134277, "global_step": 46043, "epoch": 1096} {"train_loss": -5.628854274749756, "global_step": 46044, "epoch": 1096} {"train_loss": -5.811161041259766, "global_step": 46045, "epoch": 1096} {"train_loss": -5.694892406463623, "global_step": 46046, "epoch": 1096} {"train_loss": -5.657139778137207, "global_step": 46047, "epoch": 1096} {"train_loss": -5.690426349639893, "global_step": 46048, "epoch": 1096} {"train_loss": -5.614182472229004, "global_step": 46049, "epoch": 1096} {"train_loss": -5.707961082458496, "global_step": 46050, "epoch": 1096} {"train_loss": -5.718226909637451, "global_step": 46051, "epoch": 1096} {"train_loss": -5.574121475219727, "global_step": 46052, "epoch": 1096} {"train_loss": -5.830262184143066, "global_step": 46053, "epoch": 1096} {"train_loss": -5.66960334777832, "global_step": 46054, "epoch": 1096} {"train_loss": -5.800031661987305, "global_step": 46055, "epoch": 1096} {"train_loss": -5.670045852661133, "global_step": 46056, "epoch": 1096} {"train_loss": -5.716489315032959, "global_step": 46057, "epoch": 1096} {"train_loss": -5.774078369140625, "global_step": 46058, "epoch": 1096} {"train_loss": -5.629951477050781, "global_step": 46059, "epoch": 1096} {"train_loss": -5.582348823547363, "global_step": 46060, "epoch": 1096} {"train_loss": -5.72730827331543, "global_step": 46061, "epoch": 1096} {"train_loss": -5.674270153045654, "global_step": 46062, "epoch": 1096} {"train_loss": -5.737555503845215, "global_step": 46063, "epoch": 1096} {"train_loss": -5.745247840881348, "global_step": 46064, "epoch": 1096} {"train_loss": -5.64506196975708, "global_step": 46065, "epoch": 1096} {"train_loss": -5.679898262023926, "global_step": 46066, "epoch": 1096} {"train_loss": -5.730988502502441, "global_step": 46067, "epoch": 1096} {"train_loss": -5.749682426452637, "global_step": 46068, "epoch": 1096} {"train_loss": -5.871937274932861, "global_step": 46069, "epoch": 1096} {"train_loss": -5.718935966491699, "global_step": 46070, "epoch": 1096} {"train_loss": -5.629411697387695, "global_step": 46071, "epoch": 1096} {"train_loss": -5.787716865539551, "global_step": 46072, "epoch": 1096} {"train_loss": -5.704121203649612, "global_step": 46073, "epoch": 1096, "val_loss": 66063.6171875} {"train_loss": -5.786111831665039, "global_step": 46074, "epoch": 1097} {"train_loss": -5.761999130249023, "global_step": 46075, "epoch": 1097} {"train_loss": -5.82981014251709, "global_step": 46076, "epoch": 1097} {"train_loss": -5.720276832580566, "global_step": 46077, "epoch": 1097} {"train_loss": -5.778967380523682, "global_step": 46078, "epoch": 1097} {"train_loss": -5.8454179763793945, "global_step": 46079, "epoch": 1097} {"train_loss": -5.6850996017456055, "global_step": 46080, "epoch": 1097} {"train_loss": -5.701879501342773, "global_step": 46081, "epoch": 1097} {"train_loss": -5.712563991546631, "global_step": 46082, "epoch": 1097} {"train_loss": -5.67795467376709, "global_step": 46083, "epoch": 1097} {"train_loss": -5.7118425369262695, "global_step": 46084, "epoch": 1097} {"train_loss": -5.601721286773682, "global_step": 46085, "epoch": 1097} {"train_loss": -5.636422157287598, "global_step": 46086, "epoch": 1097} {"train_loss": -5.669939994812012, "global_step": 46087, "epoch": 1097} {"train_loss": -5.714922904968262, "global_step": 46088, "epoch": 1097} {"train_loss": -5.679736137390137, "global_step": 46089, "epoch": 1097} {"train_loss": -5.566887378692627, "global_step": 46090, "epoch": 1097} {"train_loss": -5.718194961547852, "global_step": 46091, "epoch": 1097} {"train_loss": -5.739119052886963, "global_step": 46092, "epoch": 1097} {"train_loss": -5.629753112792969, "global_step": 46093, "epoch": 1097} {"train_loss": -5.688750267028809, "global_step": 46094, "epoch": 1097} {"train_loss": -5.695056915283203, "global_step": 46095, "epoch": 1097} {"train_loss": -5.683050632476807, "global_step": 46096, "epoch": 1097} {"train_loss": -5.709476470947266, "global_step": 46097, "epoch": 1097} {"train_loss": -5.632683753967285, "global_step": 46098, "epoch": 1097} {"train_loss": -5.670988082885742, "global_step": 46099, "epoch": 1097} {"train_loss": -5.640973091125488, "global_step": 46100, "epoch": 1097} {"train_loss": -5.731870174407959, "global_step": 46101, "epoch": 1097} {"train_loss": -5.736406326293945, "global_step": 46102, "epoch": 1097} {"train_loss": -5.763644218444824, "global_step": 46103, "epoch": 1097} {"train_loss": -5.734783172607422, "global_step": 46104, "epoch": 1097} {"train_loss": -5.747170925140381, "global_step": 46105, "epoch": 1097} {"train_loss": -5.651642799377441, "global_step": 46106, "epoch": 1097} {"train_loss": -5.67009973526001, "global_step": 46107, "epoch": 1097} {"train_loss": -5.686122417449951, "global_step": 46108, "epoch": 1097} {"train_loss": -5.707533836364746, "global_step": 46109, "epoch": 1097} {"train_loss": -5.593014717102051, "global_step": 46110, "epoch": 1097} {"train_loss": -5.584288597106934, "global_step": 46111, "epoch": 1097} {"train_loss": -5.663991928100586, "global_step": 46112, "epoch": 1097} {"train_loss": -5.677175045013428, "global_step": 46113, "epoch": 1097} {"train_loss": -5.530418872833252, "global_step": 46114, "epoch": 1097} {"train_loss": -5.689631314504714, "global_step": 46115, "epoch": 1097, "val_loss": 66270.125} {"train_loss": -5.5313334465026855, "global_step": 46116, "epoch": 1098} {"train_loss": -5.590319633483887, "global_step": 46117, "epoch": 1098} {"train_loss": -5.553513050079346, "global_step": 46118, "epoch": 1098} {"train_loss": -5.552541732788086, "global_step": 46119, "epoch": 1098} {"train_loss": -5.634187698364258, "global_step": 46120, "epoch": 1098} {"train_loss": -5.489437103271484, "global_step": 46121, "epoch": 1098} {"train_loss": -5.74157190322876, "global_step": 46122, "epoch": 1098} {"train_loss": -5.600594520568848, "global_step": 46123, "epoch": 1098} {"train_loss": -5.613611221313477, "global_step": 46124, "epoch": 1098} {"train_loss": -5.58198881149292, "global_step": 46125, "epoch": 1098} {"train_loss": -5.675837993621826, "global_step": 46126, "epoch": 1098} {"train_loss": -5.646193027496338, "global_step": 46127, "epoch": 1098} {"train_loss": -5.8052215576171875, "global_step": 46128, "epoch": 1098} {"train_loss": -5.781676769256592, "global_step": 46129, "epoch": 1098} {"train_loss": -5.764374732971191, "global_step": 46130, "epoch": 1098} {"train_loss": -5.715129852294922, "global_step": 46131, "epoch": 1098} {"train_loss": -5.783883571624756, "global_step": 46132, "epoch": 1098} {"train_loss": -5.659417152404785, "global_step": 46133, "epoch": 1098} {"train_loss": -5.567683219909668, "global_step": 46134, "epoch": 1098} {"train_loss": -5.614343643188477, "global_step": 46135, "epoch": 1098} {"train_loss": -5.640233039855957, "global_step": 46136, "epoch": 1098} {"train_loss": -5.551925182342529, "global_step": 46137, "epoch": 1098} {"train_loss": -5.848260879516602, "global_step": 46138, "epoch": 1098} {"train_loss": -5.677538871765137, "global_step": 46139, "epoch": 1098} {"train_loss": -5.5132927894592285, "global_step": 46140, "epoch": 1098} {"train_loss": -5.857583999633789, "global_step": 46141, "epoch": 1098} {"train_loss": -5.4678635597229, "global_step": 46142, "epoch": 1098} {"train_loss": -5.703256607055664, "global_step": 46143, "epoch": 1098} {"train_loss": -5.655272483825684, "global_step": 46144, "epoch": 1098} {"train_loss": -5.602969646453857, "global_step": 46145, "epoch": 1098} {"train_loss": -5.655488967895508, "global_step": 46146, "epoch": 1098} {"train_loss": -5.5609893798828125, "global_step": 46147, "epoch": 1098} {"train_loss": -5.726997375488281, "global_step": 46148, "epoch": 1098} {"train_loss": -5.675058364868164, "global_step": 46149, "epoch": 1098} {"train_loss": -5.799301624298096, "global_step": 46150, "epoch": 1098} {"train_loss": -5.670929908752441, "global_step": 46151, "epoch": 1098} {"train_loss": -5.715543746948242, "global_step": 46152, "epoch": 1098} {"train_loss": -5.656528949737549, "global_step": 46153, "epoch": 1098} {"train_loss": -5.722645282745361, "global_step": 46154, "epoch": 1098} {"train_loss": -5.691990852355957, "global_step": 46155, "epoch": 1098} {"train_loss": -5.701642036437988, "global_step": 46156, "epoch": 1098} {"train_loss": -5.662628310067313, "global_step": 46157, "epoch": 1098, "val_loss": 65980.7421875} {"train_loss": -5.779532432556152, "global_step": 46158, "epoch": 1099} {"train_loss": -5.740192890167236, "global_step": 46159, "epoch": 1099} {"train_loss": -5.804078102111816, "global_step": 46160, "epoch": 1099} {"train_loss": -5.666088104248047, "global_step": 46161, "epoch": 1099} {"train_loss": -5.847879409790039, "global_step": 46162, "epoch": 1099} {"train_loss": -5.583927154541016, "global_step": 46163, "epoch": 1099} {"train_loss": -5.696033477783203, "global_step": 46164, "epoch": 1099} {"train_loss": -5.617868900299072, "global_step": 46165, "epoch": 1099} {"train_loss": -5.726376056671143, "global_step": 46166, "epoch": 1099} {"train_loss": -5.571352005004883, "global_step": 46167, "epoch": 1099} {"train_loss": -5.623252868652344, "global_step": 46168, "epoch": 1099} {"train_loss": -5.696871757507324, "global_step": 46169, "epoch": 1099} {"train_loss": -5.779237747192383, "global_step": 46170, "epoch": 1099} {"train_loss": -5.653510570526123, "global_step": 46171, "epoch": 1099} {"train_loss": -5.734319686889648, "global_step": 46172, "epoch": 1099} {"train_loss": -5.734270095825195, "global_step": 46173, "epoch": 1099} {"train_loss": -5.709495544433594, "global_step": 46174, "epoch": 1099} {"train_loss": -5.710601806640625, "global_step": 46175, "epoch": 1099} {"train_loss": -5.669007778167725, "global_step": 46176, "epoch": 1099} {"train_loss": -5.7570037841796875, "global_step": 46177, "epoch": 1099} {"train_loss": -5.721682548522949, "global_step": 46178, "epoch": 1099} {"train_loss": -5.735221862792969, "global_step": 46179, "epoch": 1099} {"train_loss": -5.549858093261719, "global_step": 46180, "epoch": 1099} {"train_loss": -5.748749732971191, "global_step": 46181, "epoch": 1099} {"train_loss": -5.683881759643555, "global_step": 46182, "epoch": 1099} {"train_loss": -5.594503402709961, "global_step": 46183, "epoch": 1099} {"train_loss": -5.725857734680176, "global_step": 46184, "epoch": 1099} {"train_loss": -5.7083740234375, "global_step": 46185, "epoch": 1099} {"train_loss": -5.611135482788086, "global_step": 46186, "epoch": 1099} {"train_loss": -5.802177429199219, "global_step": 46187, "epoch": 1099} {"train_loss": -5.731332778930664, "global_step": 46188, "epoch": 1099} {"train_loss": -5.717238426208496, "global_step": 46189, "epoch": 1099} {"train_loss": -5.641112327575684, "global_step": 46190, "epoch": 1099} {"train_loss": -5.826438903808594, "global_step": 46191, "epoch": 1099} {"train_loss": -5.630308628082275, "global_step": 46192, "epoch": 1099} {"train_loss": -5.743736267089844, "global_step": 46193, "epoch": 1099} {"train_loss": -5.7068891525268555, "global_step": 46194, "epoch": 1099} {"train_loss": -5.789695739746094, "global_step": 46195, "epoch": 1099} {"train_loss": -5.68963623046875, "global_step": 46196, "epoch": 1099} {"train_loss": -5.707073211669922, "global_step": 46197, "epoch": 1099} {"train_loss": -5.735750198364258, "global_step": 46198, "epoch": 1099} {"train_loss": -5.704754409335909, "global_step": 46199, "epoch": 1099, "val_loss": 65575.71875} {"train_loss": -5.668485164642334, "global_step": 46200, "epoch": 1100} {"train_loss": -5.714766502380371, "global_step": 46201, "epoch": 1100} {"train_loss": -5.746334075927734, "global_step": 46202, "epoch": 1100} {"train_loss": -5.6937665939331055, "global_step": 46203, "epoch": 1100} {"train_loss": -5.722881317138672, "global_step": 46204, "epoch": 1100} {"train_loss": -5.751494407653809, "global_step": 46205, "epoch": 1100} {"train_loss": -5.716139793395996, "global_step": 46206, "epoch": 1100} {"train_loss": -5.717367172241211, "global_step": 46207, "epoch": 1100} {"train_loss": -5.819813251495361, "global_step": 46208, "epoch": 1100} {"train_loss": -5.7652716636657715, "global_step": 46209, "epoch": 1100} {"train_loss": -5.654764652252197, "global_step": 46210, "epoch": 1100} {"train_loss": -5.700044631958008, "global_step": 46211, "epoch": 1100} {"train_loss": -5.704187393188477, "global_step": 46212, "epoch": 1100} {"train_loss": -5.724828720092773, "global_step": 46213, "epoch": 1100} {"train_loss": -5.660879611968994, "global_step": 46214, "epoch": 1100} {"train_loss": -5.639494895935059, "global_step": 46215, "epoch": 1100} {"train_loss": -5.765695571899414, "global_step": 46216, "epoch": 1100} {"train_loss": -5.688372611999512, "global_step": 46217, "epoch": 1100} {"train_loss": -5.607423782348633, "global_step": 46218, "epoch": 1100} {"train_loss": -5.552964210510254, "global_step": 46219, "epoch": 1100} {"train_loss": -5.736750602722168, "global_step": 46220, "epoch": 1100} {"train_loss": -5.643174171447754, "global_step": 46221, "epoch": 1100} {"train_loss": -5.668810844421387, "global_step": 46222, "epoch": 1100} {"train_loss": -5.742021560668945, "global_step": 46223, "epoch": 1100} {"train_loss": -5.6267852783203125, "global_step": 46224, "epoch": 1100} {"train_loss": -5.761543273925781, "global_step": 46225, "epoch": 1100} {"train_loss": -5.744812965393066, "global_step": 46226, "epoch": 1100} {"train_loss": -5.725435256958008, "global_step": 46227, "epoch": 1100} {"train_loss": -5.560652732849121, "global_step": 46228, "epoch": 1100} {"train_loss": -5.741013050079346, "global_step": 46229, "epoch": 1100} {"train_loss": -5.649742126464844, "global_step": 46230, "epoch": 1100} {"train_loss": -5.68769645690918, "global_step": 46231, "epoch": 1100} {"train_loss": -5.581464767456055, "global_step": 46232, "epoch": 1100} {"train_loss": -5.646014213562012, "global_step": 46233, "epoch": 1100} {"train_loss": -5.737519264221191, "global_step": 46234, "epoch": 1100} {"train_loss": -5.584853172302246, "global_step": 46235, "epoch": 1100} {"train_loss": -5.505336284637451, "global_step": 46236, "epoch": 1100} {"train_loss": -5.6954240798950195, "global_step": 46237, "epoch": 1100} {"train_loss": -5.666092872619629, "global_step": 46238, "epoch": 1100} {"train_loss": -5.836059093475342, "global_step": 46239, "epoch": 1100} {"train_loss": -5.715450286865234, "global_step": 46240, "epoch": 1100} {"train_loss": -5.688615571884882, "global_step": 46241, "epoch": 1100, "train/sim_max_reward_0": 0.781012710863941, "train/sim_max_reward_1": 0.721825569163793, "train/sim_max_reward_2": 0.615976929268992, "train/sim_max_reward_3": 0.17214051756407506, "train/sim_max_reward_4": 0.3603174728513977, "train/sim_max_reward_5": 0.5742875002050686, "test/sim_max_reward_4400000": 0.3816582639020822, "test/sim_max_reward_4400001": 0.9578062375777308, "test/sim_max_reward_4400002": 0.05586643948976491, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.33731965798692526, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.4585430416961332, "test/sim_max_reward_4400009": 0.5433232333851744, "test/sim_max_reward_4400010": 0.2040368518331075, "test/sim_max_reward_4400011": 0.14364923467733606, "test/sim_max_reward_4400012": 0.4803562557568566, "test/sim_max_reward_4400013": 0.05569209882391426, "test/sim_max_reward_4400014": 0.3299482521486073, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.30879445944398803, "test/sim_max_reward_4400019": 0.09352402975411146, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.2806421844437937, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2190156841955961, "test/sim_max_reward_4400026": 0.028246454608266674, "test/sim_max_reward_4400027": 0.022288859986033232, "test/sim_max_reward_4400028": 0.36588360881828713, "test/sim_max_reward_4400029": 0.5305751567813215, "test/sim_max_reward_4400030": 0.34688423215286596, "test/sim_max_reward_4400031": 0.8398113903049343, "test/sim_max_reward_4400032": 0.129249901899667, "test/sim_max_reward_4400033": 0.1871019528808424, "test/sim_max_reward_4400034": 0.15240740407497663, "test/sim_max_reward_4400035": 0.9362837008994036, "test/sim_max_reward_4400036": 0.35491950240235565, "test/sim_max_reward_4400037": 0.8540460299241968, "test/sim_max_reward_4400038": 0.22232473020811866, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7239150768059357, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.033112613389544625, "test/sim_max_reward_4400044": 0.017920773642776142, "test/sim_max_reward_4400045": 0.5000833875339543, "test/sim_max_reward_4400046": 0.2867394463939894, "test/sim_max_reward_4400047": 0.7327625327797649, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.06433555668872559, "train/mean_score": 0.5375934499862112, "test/mean_score": 0.2632471875668135, "val_loss": 66127.5859375} {"train_loss": -5.636219024658203, "global_step": 46242, "epoch": 1101} {"train_loss": -5.638476371765137, "global_step": 46243, "epoch": 1101} {"train_loss": -5.670734882354736, "global_step": 46244, "epoch": 1101} {"train_loss": -5.744218826293945, "global_step": 46245, "epoch": 1101} {"train_loss": -5.6785888671875, "global_step": 46246, "epoch": 1101} {"train_loss": -5.700923919677734, "global_step": 46247, "epoch": 1101} {"train_loss": -5.742162227630615, "global_step": 46248, "epoch": 1101} {"train_loss": -5.620419502258301, "global_step": 46249, "epoch": 1101} {"train_loss": -5.649433135986328, "global_step": 46250, "epoch": 1101} {"train_loss": -5.730919361114502, "global_step": 46251, "epoch": 1101} {"train_loss": -5.723553657531738, "global_step": 46252, "epoch": 1101} {"train_loss": -5.818052291870117, "global_step": 46253, "epoch": 1101} {"train_loss": -5.587160110473633, "global_step": 46254, "epoch": 1101} {"train_loss": -5.681798934936523, "global_step": 46255, "epoch": 1101} {"train_loss": -5.744486331939697, "global_step": 46256, "epoch": 1101} {"train_loss": -5.691380500793457, "global_step": 46257, "epoch": 1101} {"train_loss": -5.669595718383789, "global_step": 46258, "epoch": 1101} {"train_loss": -5.701474189758301, "global_step": 46259, "epoch": 1101} {"train_loss": -5.796064376831055, "global_step": 46260, "epoch": 1101} {"train_loss": -5.618252754211426, "global_step": 46261, "epoch": 1101} {"train_loss": -5.654191970825195, "global_step": 46262, "epoch": 1101} {"train_loss": -5.655473709106445, "global_step": 46263, "epoch": 1101} {"train_loss": -5.668139457702637, "global_step": 46264, "epoch": 1101} {"train_loss": -5.6306047439575195, "global_step": 46265, "epoch": 1101} {"train_loss": -5.857479572296143, "global_step": 46266, "epoch": 1101} {"train_loss": -5.643779754638672, "global_step": 46267, "epoch": 1101} {"train_loss": -5.629493713378906, "global_step": 46268, "epoch": 1101} {"train_loss": -5.676163673400879, "global_step": 46269, "epoch": 1101} {"train_loss": -5.6160430908203125, "global_step": 46270, "epoch": 1101} {"train_loss": -5.748669624328613, "global_step": 46271, "epoch": 1101} {"train_loss": -5.642706871032715, "global_step": 46272, "epoch": 1101} {"train_loss": -5.6433563232421875, "global_step": 46273, "epoch": 1101} {"train_loss": -5.7209858894348145, "global_step": 46274, "epoch": 1101} {"train_loss": -5.523176193237305, "global_step": 46275, "epoch": 1101} {"train_loss": -5.805385112762451, "global_step": 46276, "epoch": 1101} {"train_loss": -5.832568168640137, "global_step": 46277, "epoch": 1101} {"train_loss": -5.691558837890625, "global_step": 46278, "epoch": 1101} {"train_loss": -5.681024551391602, "global_step": 46279, "epoch": 1101} {"train_loss": -5.796213150024414, "global_step": 46280, "epoch": 1101} {"train_loss": -5.7809858322143555, "global_step": 46281, "epoch": 1101} {"train_loss": -5.704801559448242, "global_step": 46282, "epoch": 1101} {"train_loss": -5.69728558404105, "global_step": 46283, "epoch": 1101, "val_loss": 66379.7890625} {"train_loss": -5.775845050811768, "global_step": 46284, "epoch": 1102} {"train_loss": -5.555764198303223, "global_step": 46285, "epoch": 1102} {"train_loss": -5.719602108001709, "global_step": 46286, "epoch": 1102} {"train_loss": -5.82330322265625, "global_step": 46287, "epoch": 1102} {"train_loss": -5.694039821624756, "global_step": 46288, "epoch": 1102} {"train_loss": -5.715060234069824, "global_step": 46289, "epoch": 1102} {"train_loss": -5.752020835876465, "global_step": 46290, "epoch": 1102} {"train_loss": -5.716516017913818, "global_step": 46291, "epoch": 1102} {"train_loss": -5.824958801269531, "global_step": 46292, "epoch": 1102} {"train_loss": -5.70547342300415, "global_step": 46293, "epoch": 1102} {"train_loss": -5.669676780700684, "global_step": 46294, "epoch": 1102} {"train_loss": -5.784567356109619, "global_step": 46295, "epoch": 1102} {"train_loss": -5.648290634155273, "global_step": 46296, "epoch": 1102} {"train_loss": -5.687066078186035, "global_step": 46297, "epoch": 1102} {"train_loss": -5.643930435180664, "global_step": 46298, "epoch": 1102} {"train_loss": -5.666565895080566, "global_step": 46299, "epoch": 1102} {"train_loss": -5.751530647277832, "global_step": 46300, "epoch": 1102} {"train_loss": -5.615880012512207, "global_step": 46301, "epoch": 1102} {"train_loss": -5.8644938468933105, "global_step": 46302, "epoch": 1102} {"train_loss": -5.801884651184082, "global_step": 46303, "epoch": 1102} {"train_loss": -5.696150779724121, "global_step": 46304, "epoch": 1102} {"train_loss": -5.663559913635254, "global_step": 46305, "epoch": 1102} {"train_loss": -5.617808818817139, "global_step": 46306, "epoch": 1102} {"train_loss": -5.767913341522217, "global_step": 46307, "epoch": 1102} {"train_loss": -5.788422584533691, "global_step": 46308, "epoch": 1102} {"train_loss": -5.646196365356445, "global_step": 46309, "epoch": 1102} {"train_loss": -5.7732157707214355, "global_step": 46310, "epoch": 1102} {"train_loss": -5.758367538452148, "global_step": 46311, "epoch": 1102} {"train_loss": -5.739879131317139, "global_step": 46312, "epoch": 1102} {"train_loss": -5.693676948547363, "global_step": 46313, "epoch": 1102} {"train_loss": -5.736076354980469, "global_step": 46314, "epoch": 1102} {"train_loss": -5.809763431549072, "global_step": 46315, "epoch": 1102} {"train_loss": -5.839038848876953, "global_step": 46316, "epoch": 1102} {"train_loss": -5.743978977203369, "global_step": 46317, "epoch": 1102} {"train_loss": -5.752532482147217, "global_step": 46318, "epoch": 1102} {"train_loss": -5.633259296417236, "global_step": 46319, "epoch": 1102} {"train_loss": -5.754343032836914, "global_step": 46320, "epoch": 1102} {"train_loss": -5.631929397583008, "global_step": 46321, "epoch": 1102} {"train_loss": -5.733343124389648, "global_step": 46322, "epoch": 1102} {"train_loss": -5.689016342163086, "global_step": 46323, "epoch": 1102} {"train_loss": -5.654407024383545, "global_step": 46324, "epoch": 1102} {"train_loss": -5.7201323963346935, "global_step": 46325, "epoch": 1102, "val_loss": 66115.4453125} {"train_loss": -5.798089027404785, "global_step": 46326, "epoch": 1103} {"train_loss": -5.697470664978027, "global_step": 46327, "epoch": 1103} {"train_loss": -5.63442325592041, "global_step": 46328, "epoch": 1103} {"train_loss": -5.605868339538574, "global_step": 46329, "epoch": 1103} {"train_loss": -5.7133097648620605, "global_step": 46330, "epoch": 1103} {"train_loss": -5.749431610107422, "global_step": 46331, "epoch": 1103} {"train_loss": -5.683404922485352, "global_step": 46332, "epoch": 1103} {"train_loss": -5.736889839172363, "global_step": 46333, "epoch": 1103} {"train_loss": -5.49717378616333, "global_step": 46334, "epoch": 1103} {"train_loss": -5.873769760131836, "global_step": 46335, "epoch": 1103} {"train_loss": -5.724721908569336, "global_step": 46336, "epoch": 1103} {"train_loss": -5.634525299072266, "global_step": 46337, "epoch": 1103} {"train_loss": -5.73695182800293, "global_step": 46338, "epoch": 1103} {"train_loss": -5.7342000007629395, "global_step": 46339, "epoch": 1103} {"train_loss": -5.705986976623535, "global_step": 46340, "epoch": 1103} {"train_loss": -5.801342010498047, "global_step": 46341, "epoch": 1103} {"train_loss": -5.676181793212891, "global_step": 46342, "epoch": 1103} {"train_loss": -5.672672748565674, "global_step": 46343, "epoch": 1103} {"train_loss": -5.80570125579834, "global_step": 46344, "epoch": 1103} {"train_loss": -5.681740760803223, "global_step": 46345, "epoch": 1103} {"train_loss": -5.648038864135742, "global_step": 46346, "epoch": 1103} {"train_loss": -5.843905925750732, "global_step": 46347, "epoch": 1103} {"train_loss": -5.732959747314453, "global_step": 46348, "epoch": 1103} {"train_loss": -5.639925956726074, "global_step": 46349, "epoch": 1103} {"train_loss": -5.654417514801025, "global_step": 46350, "epoch": 1103} {"train_loss": -5.720973968505859, "global_step": 46351, "epoch": 1103} {"train_loss": -5.825572967529297, "global_step": 46352, "epoch": 1103} {"train_loss": -5.537200927734375, "global_step": 46353, "epoch": 1103} {"train_loss": -5.782517433166504, "global_step": 46354, "epoch": 1103} {"train_loss": -5.629513263702393, "global_step": 46355, "epoch": 1103} {"train_loss": -5.684695720672607, "global_step": 46356, "epoch": 1103} {"train_loss": -5.688885688781738, "global_step": 46357, "epoch": 1103} {"train_loss": -5.771205902099609, "global_step": 46358, "epoch": 1103} {"train_loss": -5.763625144958496, "global_step": 46359, "epoch": 1103} {"train_loss": -5.786440849304199, "global_step": 46360, "epoch": 1103} {"train_loss": -5.647554397583008, "global_step": 46361, "epoch": 1103} {"train_loss": -5.76523494720459, "global_step": 46362, "epoch": 1103} {"train_loss": -5.7185959815979, "global_step": 46363, "epoch": 1103} {"train_loss": -5.86242151260376, "global_step": 46364, "epoch": 1103} {"train_loss": -5.586103916168213, "global_step": 46365, "epoch": 1103} {"train_loss": -5.628864288330078, "global_step": 46366, "epoch": 1103} {"train_loss": -5.71160938626244, "global_step": 46367, "epoch": 1103, "val_loss": 66107.3515625} {"train_loss": -5.756465911865234, "global_step": 46368, "epoch": 1104} {"train_loss": -5.78914737701416, "global_step": 46369, "epoch": 1104} {"train_loss": -5.728915691375732, "global_step": 46370, "epoch": 1104} {"train_loss": -5.894184112548828, "global_step": 46371, "epoch": 1104} {"train_loss": -5.739289283752441, "global_step": 46372, "epoch": 1104} {"train_loss": -5.686524391174316, "global_step": 46373, "epoch": 1104} {"train_loss": -5.7429094314575195, "global_step": 46374, "epoch": 1104} {"train_loss": -5.737003326416016, "global_step": 46375, "epoch": 1104} {"train_loss": -5.750954627990723, "global_step": 46376, "epoch": 1104} {"train_loss": -5.729050636291504, "global_step": 46377, "epoch": 1104} {"train_loss": -5.763004302978516, "global_step": 46378, "epoch": 1104} {"train_loss": -5.836014270782471, "global_step": 46379, "epoch": 1104} {"train_loss": -5.833364486694336, "global_step": 46380, "epoch": 1104} {"train_loss": -5.710687637329102, "global_step": 46381, "epoch": 1104} {"train_loss": -5.718601703643799, "global_step": 46382, "epoch": 1104} {"train_loss": -5.67000675201416, "global_step": 46383, "epoch": 1104} {"train_loss": -5.609109878540039, "global_step": 46384, "epoch": 1104} {"train_loss": -5.672959327697754, "global_step": 46385, "epoch": 1104} {"train_loss": -5.769438743591309, "global_step": 46386, "epoch": 1104} {"train_loss": -5.705541610717773, "global_step": 46387, "epoch": 1104} {"train_loss": -5.70343017578125, "global_step": 46388, "epoch": 1104} {"train_loss": -5.738483905792236, "global_step": 46389, "epoch": 1104} {"train_loss": -5.7326273918151855, "global_step": 46390, "epoch": 1104} {"train_loss": -5.682342052459717, "global_step": 46391, "epoch": 1104} {"train_loss": -5.763284206390381, "global_step": 46392, "epoch": 1104} {"train_loss": -5.688878536224365, "global_step": 46393, "epoch": 1104} {"train_loss": -5.662525177001953, "global_step": 46394, "epoch": 1104} {"train_loss": -5.674216270446777, "global_step": 46395, "epoch": 1104} {"train_loss": -5.621647357940674, "global_step": 46396, "epoch": 1104} {"train_loss": -5.7100653648376465, "global_step": 46397, "epoch": 1104} {"train_loss": -5.658518314361572, "global_step": 46398, "epoch": 1104} {"train_loss": -5.789630889892578, "global_step": 46399, "epoch": 1104} {"train_loss": -5.7934675216674805, "global_step": 46400, "epoch": 1104} {"train_loss": -5.736878395080566, "global_step": 46401, "epoch": 1104} {"train_loss": -5.775608062744141, "global_step": 46402, "epoch": 1104} {"train_loss": -5.6225996017456055, "global_step": 46403, "epoch": 1104} {"train_loss": -5.695581912994385, "global_step": 46404, "epoch": 1104} {"train_loss": -5.801344871520996, "global_step": 46405, "epoch": 1104} {"train_loss": -5.682590007781982, "global_step": 46406, "epoch": 1104} {"train_loss": -5.746771812438965, "global_step": 46407, "epoch": 1104} {"train_loss": -5.777420997619629, "global_step": 46408, "epoch": 1104} {"train_loss": -5.727469205856323, "global_step": 46409, "epoch": 1104, "val_loss": 66001.0078125} {"train_loss": -5.681084632873535, "global_step": 46410, "epoch": 1105} {"train_loss": -5.670828342437744, "global_step": 46411, "epoch": 1105} {"train_loss": -5.762994289398193, "global_step": 46412, "epoch": 1105} {"train_loss": -5.782742977142334, "global_step": 46413, "epoch": 1105} {"train_loss": -5.616922378540039, "global_step": 46414, "epoch": 1105} {"train_loss": -5.770063877105713, "global_step": 46415, "epoch": 1105} {"train_loss": -5.660364151000977, "global_step": 46416, "epoch": 1105} {"train_loss": -5.661929130554199, "global_step": 46417, "epoch": 1105} {"train_loss": -5.717048168182373, "global_step": 46418, "epoch": 1105} {"train_loss": -5.657713890075684, "global_step": 46419, "epoch": 1105} {"train_loss": -5.7066802978515625, "global_step": 46420, "epoch": 1105} {"train_loss": -5.670229434967041, "global_step": 46421, "epoch": 1105} {"train_loss": -5.695513725280762, "global_step": 46422, "epoch": 1105} {"train_loss": -5.696020126342773, "global_step": 46423, "epoch": 1105} {"train_loss": -5.658785820007324, "global_step": 46424, "epoch": 1105} {"train_loss": -5.716512680053711, "global_step": 46425, "epoch": 1105} {"train_loss": -5.798038959503174, "global_step": 46426, "epoch": 1105} {"train_loss": -5.707460403442383, "global_step": 46427, "epoch": 1105} {"train_loss": -5.825498580932617, "global_step": 46428, "epoch": 1105} {"train_loss": -5.688506126403809, "global_step": 46429, "epoch": 1105} {"train_loss": -5.735203742980957, "global_step": 46430, "epoch": 1105} {"train_loss": -5.680308818817139, "global_step": 46431, "epoch": 1105} {"train_loss": -5.654114723205566, "global_step": 46432, "epoch": 1105} {"train_loss": -5.7435808181762695, "global_step": 46433, "epoch": 1105} {"train_loss": -5.699977397918701, "global_step": 46434, "epoch": 1105} {"train_loss": -5.641707420349121, "global_step": 46435, "epoch": 1105} {"train_loss": -5.716533660888672, "global_step": 46436, "epoch": 1105} {"train_loss": -5.725481986999512, "global_step": 46437, "epoch": 1105} {"train_loss": -5.649178504943848, "global_step": 46438, "epoch": 1105} {"train_loss": -5.628597736358643, "global_step": 46439, "epoch": 1105} {"train_loss": -5.606425762176514, "global_step": 46440, "epoch": 1105} {"train_loss": -5.693044185638428, "global_step": 46441, "epoch": 1105} {"train_loss": -5.6959404945373535, "global_step": 46442, "epoch": 1105} {"train_loss": -5.649348258972168, "global_step": 46443, "epoch": 1105} {"train_loss": -5.681580066680908, "global_step": 46444, "epoch": 1105} {"train_loss": -5.70785665512085, "global_step": 46445, "epoch": 1105} {"train_loss": -5.721432685852051, "global_step": 46446, "epoch": 1105} {"train_loss": -5.729511260986328, "global_step": 46447, "epoch": 1105} {"train_loss": -5.744262218475342, "global_step": 46448, "epoch": 1105} {"train_loss": -5.685192584991455, "global_step": 46449, "epoch": 1105} {"train_loss": -5.669663906097412, "global_step": 46450, "epoch": 1105} {"train_loss": -5.697100582576933, "global_step": 46451, "epoch": 1105, "val_loss": 66244.2421875} {"train_loss": -5.795468330383301, "global_step": 46452, "epoch": 1106} {"train_loss": -5.612138271331787, "global_step": 46453, "epoch": 1106} {"train_loss": -5.712309837341309, "global_step": 46454, "epoch": 1106} {"train_loss": -5.601424217224121, "global_step": 46455, "epoch": 1106} {"train_loss": -5.544284343719482, "global_step": 46456, "epoch": 1106} {"train_loss": -5.664118766784668, "global_step": 46457, "epoch": 1106} {"train_loss": -5.588219165802002, "global_step": 46458, "epoch": 1106} {"train_loss": -5.626959800720215, "global_step": 46459, "epoch": 1106} {"train_loss": -5.670222759246826, "global_step": 46460, "epoch": 1106} {"train_loss": -5.637846946716309, "global_step": 46461, "epoch": 1106} {"train_loss": -5.683868408203125, "global_step": 46462, "epoch": 1106} {"train_loss": -5.758480072021484, "global_step": 46463, "epoch": 1106} {"train_loss": -5.632867813110352, "global_step": 46464, "epoch": 1106} {"train_loss": -5.551970958709717, "global_step": 46465, "epoch": 1106} {"train_loss": -5.667471885681152, "global_step": 46466, "epoch": 1106} {"train_loss": -5.755600929260254, "global_step": 46467, "epoch": 1106} {"train_loss": -5.720968246459961, "global_step": 46468, "epoch": 1106} {"train_loss": -5.656824111938477, "global_step": 46469, "epoch": 1106} {"train_loss": -5.771247863769531, "global_step": 46470, "epoch": 1106} {"train_loss": -5.7509765625, "global_step": 46471, "epoch": 1106} {"train_loss": -5.7457427978515625, "global_step": 46472, "epoch": 1106} {"train_loss": -5.676572322845459, "global_step": 46473, "epoch": 1106} {"train_loss": -5.763106346130371, "global_step": 46474, "epoch": 1106} {"train_loss": -5.781924247741699, "global_step": 46475, "epoch": 1106} {"train_loss": -5.747132778167725, "global_step": 46476, "epoch": 1106} {"train_loss": -5.695350646972656, "global_step": 46477, "epoch": 1106} {"train_loss": -5.701364517211914, "global_step": 46478, "epoch": 1106} {"train_loss": -5.816518783569336, "global_step": 46479, "epoch": 1106} {"train_loss": -5.698854446411133, "global_step": 46480, "epoch": 1106} {"train_loss": -5.610050201416016, "global_step": 46481, "epoch": 1106} {"train_loss": -5.738833427429199, "global_step": 46482, "epoch": 1106} {"train_loss": -5.769268035888672, "global_step": 46483, "epoch": 1106} {"train_loss": -5.735596656799316, "global_step": 46484, "epoch": 1106} {"train_loss": -5.649173736572266, "global_step": 46485, "epoch": 1106} {"train_loss": -5.715162754058838, "global_step": 46486, "epoch": 1106} {"train_loss": -5.695585250854492, "global_step": 46487, "epoch": 1106} {"train_loss": -5.536104202270508, "global_step": 46488, "epoch": 1106} {"train_loss": -5.595964431762695, "global_step": 46489, "epoch": 1106} {"train_loss": -5.721735954284668, "global_step": 46490, "epoch": 1106} {"train_loss": -5.633628845214844, "global_step": 46491, "epoch": 1106} {"train_loss": -5.713955402374268, "global_step": 46492, "epoch": 1106} {"train_loss": -5.685630423682077, "global_step": 46493, "epoch": 1106, "val_loss": 66216.3046875} {"train_loss": -5.754421234130859, "global_step": 46494, "epoch": 1107} {"train_loss": -5.677732467651367, "global_step": 46495, "epoch": 1107} {"train_loss": -5.484496593475342, "global_step": 46496, "epoch": 1107} {"train_loss": -5.622960090637207, "global_step": 46497, "epoch": 1107} {"train_loss": -5.71687126159668, "global_step": 46498, "epoch": 1107} {"train_loss": -5.682056427001953, "global_step": 46499, "epoch": 1107} {"train_loss": -5.718603610992432, "global_step": 46500, "epoch": 1107} {"train_loss": -5.688152313232422, "global_step": 46501, "epoch": 1107} {"train_loss": -5.59724760055542, "global_step": 46502, "epoch": 1107} {"train_loss": -5.568145751953125, "global_step": 46503, "epoch": 1107} {"train_loss": -5.725176811218262, "global_step": 46504, "epoch": 1107} {"train_loss": -5.717836380004883, "global_step": 46505, "epoch": 1107} {"train_loss": -5.610755920410156, "global_step": 46506, "epoch": 1107} {"train_loss": -5.637147426605225, "global_step": 46507, "epoch": 1107} {"train_loss": -5.7479705810546875, "global_step": 46508, "epoch": 1107} {"train_loss": -5.7637481689453125, "global_step": 46509, "epoch": 1107} {"train_loss": -5.627933502197266, "global_step": 46510, "epoch": 1107} {"train_loss": -5.692080974578857, "global_step": 46511, "epoch": 1107} {"train_loss": -5.678658485412598, "global_step": 46512, "epoch": 1107} {"train_loss": -5.509873867034912, "global_step": 46513, "epoch": 1107} {"train_loss": -5.799106597900391, "global_step": 46514, "epoch": 1107} {"train_loss": -5.671225547790527, "global_step": 46515, "epoch": 1107} {"train_loss": -5.750074863433838, "global_step": 46516, "epoch": 1107} {"train_loss": -5.773690700531006, "global_step": 46517, "epoch": 1107} {"train_loss": -5.819625377655029, "global_step": 46518, "epoch": 1107} {"train_loss": -5.891650199890137, "global_step": 46519, "epoch": 1107} {"train_loss": -5.656482696533203, "global_step": 46520, "epoch": 1107} {"train_loss": -5.8069562911987305, "global_step": 46521, "epoch": 1107} {"train_loss": -5.706974029541016, "global_step": 46522, "epoch": 1107} {"train_loss": -5.618529796600342, "global_step": 46523, "epoch": 1107} {"train_loss": -5.703179359436035, "global_step": 46524, "epoch": 1107} {"train_loss": -5.630627632141113, "global_step": 46525, "epoch": 1107} {"train_loss": -5.761950969696045, "global_step": 46526, "epoch": 1107} {"train_loss": -5.690384864807129, "global_step": 46527, "epoch": 1107} {"train_loss": -5.775592803955078, "global_step": 46528, "epoch": 1107} {"train_loss": -5.841536521911621, "global_step": 46529, "epoch": 1107} {"train_loss": -5.679187774658203, "global_step": 46530, "epoch": 1107} {"train_loss": -5.6867218017578125, "global_step": 46531, "epoch": 1107} {"train_loss": -5.675199031829834, "global_step": 46532, "epoch": 1107} {"train_loss": -5.693295001983643, "global_step": 46533, "epoch": 1107} {"train_loss": -5.727304458618164, "global_step": 46534, "epoch": 1107} {"train_loss": -5.701708169210525, "global_step": 46535, "epoch": 1107, "val_loss": 66095.8671875} {"train_loss": -5.634615421295166, "global_step": 46536, "epoch": 1108} {"train_loss": -5.625578880310059, "global_step": 46537, "epoch": 1108} {"train_loss": -5.639890670776367, "global_step": 46538, "epoch": 1108} {"train_loss": -5.7141923904418945, "global_step": 46539, "epoch": 1108} {"train_loss": -5.8586907386779785, "global_step": 46540, "epoch": 1108} {"train_loss": -5.7327494621276855, "global_step": 46541, "epoch": 1108} {"train_loss": -5.753007888793945, "global_step": 46542, "epoch": 1108} {"train_loss": -5.616395950317383, "global_step": 46543, "epoch": 1108} {"train_loss": -5.6781229972839355, "global_step": 46544, "epoch": 1108} {"train_loss": -5.748680591583252, "global_step": 46545, "epoch": 1108} {"train_loss": -5.714573860168457, "global_step": 46546, "epoch": 1108} {"train_loss": -5.740046501159668, "global_step": 46547, "epoch": 1108} {"train_loss": -5.843006134033203, "global_step": 46548, "epoch": 1108} {"train_loss": -5.794947624206543, "global_step": 46549, "epoch": 1108} {"train_loss": -5.876688003540039, "global_step": 46550, "epoch": 1108} {"train_loss": -5.687580108642578, "global_step": 46551, "epoch": 1108} {"train_loss": -5.846133232116699, "global_step": 46552, "epoch": 1108} {"train_loss": -5.790785789489746, "global_step": 46553, "epoch": 1108} {"train_loss": -5.627527236938477, "global_step": 46554, "epoch": 1108} {"train_loss": -5.76686954498291, "global_step": 46555, "epoch": 1108} {"train_loss": -5.744171142578125, "global_step": 46556, "epoch": 1108} {"train_loss": -5.7998151779174805, "global_step": 46557, "epoch": 1108} {"train_loss": -5.893240451812744, "global_step": 46558, "epoch": 1108} {"train_loss": -5.704292297363281, "global_step": 46559, "epoch": 1108} {"train_loss": -5.701451301574707, "global_step": 46560, "epoch": 1108} {"train_loss": -5.752516269683838, "global_step": 46561, "epoch": 1108} {"train_loss": -5.701725006103516, "global_step": 46562, "epoch": 1108} {"train_loss": -5.599565029144287, "global_step": 46563, "epoch": 1108} {"train_loss": -5.9260125160217285, "global_step": 46564, "epoch": 1108} {"train_loss": -5.6374831199646, "global_step": 46565, "epoch": 1108} {"train_loss": -5.5865936279296875, "global_step": 46566, "epoch": 1108} {"train_loss": -5.65552282333374, "global_step": 46567, "epoch": 1108} {"train_loss": -5.621255397796631, "global_step": 46568, "epoch": 1108} {"train_loss": -5.7484965324401855, "global_step": 46569, "epoch": 1108} {"train_loss": -5.713586330413818, "global_step": 46570, "epoch": 1108} {"train_loss": -5.6499342918396, "global_step": 46571, "epoch": 1108} {"train_loss": -5.716371536254883, "global_step": 46572, "epoch": 1108} {"train_loss": -5.6682891845703125, "global_step": 46573, "epoch": 1108} {"train_loss": -5.629246234893799, "global_step": 46574, "epoch": 1108} {"train_loss": -5.7618560791015625, "global_step": 46575, "epoch": 1108} {"train_loss": -5.624739646911621, "global_step": 46576, "epoch": 1108} {"train_loss": -5.720916634514218, "global_step": 46577, "epoch": 1108, "val_loss": 66213.984375} {"train_loss": -5.604011535644531, "global_step": 46578, "epoch": 1109} {"train_loss": -5.745392322540283, "global_step": 46579, "epoch": 1109} {"train_loss": -5.706706523895264, "global_step": 46580, "epoch": 1109} {"train_loss": -5.797632694244385, "global_step": 46581, "epoch": 1109} {"train_loss": -5.6911725997924805, "global_step": 46582, "epoch": 1109} {"train_loss": -5.826016902923584, "global_step": 46583, "epoch": 1109} {"train_loss": -5.733569622039795, "global_step": 46584, "epoch": 1109} {"train_loss": -5.675630569458008, "global_step": 46585, "epoch": 1109} {"train_loss": -5.801092624664307, "global_step": 46586, "epoch": 1109} {"train_loss": -5.631697654724121, "global_step": 46587, "epoch": 1109} {"train_loss": -5.745853424072266, "global_step": 46588, "epoch": 1109} {"train_loss": -5.658316612243652, "global_step": 46589, "epoch": 1109} {"train_loss": -5.661198616027832, "global_step": 46590, "epoch": 1109} {"train_loss": -5.641838550567627, "global_step": 46591, "epoch": 1109} {"train_loss": -5.618697166442871, "global_step": 46592, "epoch": 1109} {"train_loss": -5.693624496459961, "global_step": 46593, "epoch": 1109} {"train_loss": -5.791813850402832, "global_step": 46594, "epoch": 1109} {"train_loss": -5.728580474853516, "global_step": 46595, "epoch": 1109} {"train_loss": -5.603845596313477, "global_step": 46596, "epoch": 1109} {"train_loss": -5.681659698486328, "global_step": 46597, "epoch": 1109} {"train_loss": -5.866154193878174, "global_step": 46598, "epoch": 1109} {"train_loss": -5.706418991088867, "global_step": 46599, "epoch": 1109} {"train_loss": -5.735452651977539, "global_step": 46600, "epoch": 1109} {"train_loss": -5.765622138977051, "global_step": 46601, "epoch": 1109} {"train_loss": -5.736855983734131, "global_step": 46602, "epoch": 1109} {"train_loss": -5.668601036071777, "global_step": 46603, "epoch": 1109} {"train_loss": -5.7626543045043945, "global_step": 46604, "epoch": 1109} {"train_loss": -5.684784889221191, "global_step": 46605, "epoch": 1109} {"train_loss": -5.779065132141113, "global_step": 46606, "epoch": 1109} {"train_loss": -5.804180145263672, "global_step": 46607, "epoch": 1109} {"train_loss": -5.778260231018066, "global_step": 46608, "epoch": 1109} {"train_loss": -5.677191257476807, "global_step": 46609, "epoch": 1109} {"train_loss": -5.709328651428223, "global_step": 46610, "epoch": 1109} {"train_loss": -5.680010795593262, "global_step": 46611, "epoch": 1109} {"train_loss": -5.541463851928711, "global_step": 46612, "epoch": 1109} {"train_loss": -5.828822612762451, "global_step": 46613, "epoch": 1109} {"train_loss": -5.812985420227051, "global_step": 46614, "epoch": 1109} {"train_loss": -5.841066360473633, "global_step": 46615, "epoch": 1109} {"train_loss": -5.896063804626465, "global_step": 46616, "epoch": 1109} {"train_loss": -5.693246364593506, "global_step": 46617, "epoch": 1109} {"train_loss": -5.7264299392700195, "global_step": 46618, "epoch": 1109} {"train_loss": -5.724861349378314, "global_step": 46619, "epoch": 1109, "val_loss": 66013.5234375} {"train_loss": -5.779852867126465, "global_step": 46620, "epoch": 1110} {"train_loss": -5.756699562072754, "global_step": 46621, "epoch": 1110} {"train_loss": -5.656656265258789, "global_step": 46622, "epoch": 1110} {"train_loss": -5.559659481048584, "global_step": 46623, "epoch": 1110} {"train_loss": -5.815007209777832, "global_step": 46624, "epoch": 1110} {"train_loss": -5.632430553436279, "global_step": 46625, "epoch": 1110} {"train_loss": -5.638401031494141, "global_step": 46626, "epoch": 1110} {"train_loss": -5.728367805480957, "global_step": 46627, "epoch": 1110} {"train_loss": -5.70162296295166, "global_step": 46628, "epoch": 1110} {"train_loss": -5.801406383514404, "global_step": 46629, "epoch": 1110} {"train_loss": -5.659697532653809, "global_step": 46630, "epoch": 1110} {"train_loss": -5.6544189453125, "global_step": 46631, "epoch": 1110} {"train_loss": -5.8296709060668945, "global_step": 46632, "epoch": 1110} {"train_loss": -5.668806076049805, "global_step": 46633, "epoch": 1110} {"train_loss": -5.673984527587891, "global_step": 46634, "epoch": 1110} {"train_loss": -5.660273551940918, "global_step": 46635, "epoch": 1110} {"train_loss": -5.625400543212891, "global_step": 46636, "epoch": 1110} {"train_loss": -5.662182807922363, "global_step": 46637, "epoch": 1110} {"train_loss": -5.576547622680664, "global_step": 46638, "epoch": 1110} {"train_loss": -5.657625198364258, "global_step": 46639, "epoch": 1110} {"train_loss": -5.66783332824707, "global_step": 46640, "epoch": 1110} {"train_loss": -5.631405830383301, "global_step": 46641, "epoch": 1110} {"train_loss": -5.752063274383545, "global_step": 46642, "epoch": 1110} {"train_loss": -5.67047119140625, "global_step": 46643, "epoch": 1110} {"train_loss": -5.704566955566406, "global_step": 46644, "epoch": 1110} {"train_loss": -5.666860580444336, "global_step": 46645, "epoch": 1110} {"train_loss": -5.665325164794922, "global_step": 46646, "epoch": 1110} {"train_loss": -5.702832221984863, "global_step": 46647, "epoch": 1110} {"train_loss": -5.727136611938477, "global_step": 46648, "epoch": 1110} {"train_loss": -5.672616004943848, "global_step": 46649, "epoch": 1110} {"train_loss": -5.560796737670898, "global_step": 46650, "epoch": 1110} {"train_loss": -5.5312347412109375, "global_step": 46651, "epoch": 1110} {"train_loss": -5.576101779937744, "global_step": 46652, "epoch": 1110} {"train_loss": -5.56749153137207, "global_step": 46653, "epoch": 1110} {"train_loss": -5.674661636352539, "global_step": 46654, "epoch": 1110} {"train_loss": -5.725415229797363, "global_step": 46655, "epoch": 1110} {"train_loss": -5.637192726135254, "global_step": 46656, "epoch": 1110} {"train_loss": -5.663981914520264, "global_step": 46657, "epoch": 1110} {"train_loss": -5.710233688354492, "global_step": 46658, "epoch": 1110} {"train_loss": -5.698297500610352, "global_step": 46659, "epoch": 1110} {"train_loss": -5.606163024902344, "global_step": 46660, "epoch": 1110} {"train_loss": -5.674758695420765, "global_step": 46661, "epoch": 1110, "val_loss": 66078.640625} {"train_loss": -5.5976972579956055, "global_step": 46662, "epoch": 1111} {"train_loss": -5.664280891418457, "global_step": 46663, "epoch": 1111} {"train_loss": -5.603603363037109, "global_step": 46664, "epoch": 1111} {"train_loss": -5.788667678833008, "global_step": 46665, "epoch": 1111} {"train_loss": -5.707374572753906, "global_step": 46666, "epoch": 1111} {"train_loss": -5.671076774597168, "global_step": 46667, "epoch": 1111} {"train_loss": -5.900467872619629, "global_step": 46668, "epoch": 1111} {"train_loss": -5.667712688446045, "global_step": 46669, "epoch": 1111} {"train_loss": -5.8400726318359375, "global_step": 46670, "epoch": 1111} {"train_loss": -5.559029579162598, "global_step": 46671, "epoch": 1111} {"train_loss": -5.78304386138916, "global_step": 46672, "epoch": 1111} {"train_loss": -5.800138473510742, "global_step": 46673, "epoch": 1111} {"train_loss": -5.672739505767822, "global_step": 46674, "epoch": 1111} {"train_loss": -5.576615333557129, "global_step": 46675, "epoch": 1111} {"train_loss": -5.815329551696777, "global_step": 46676, "epoch": 1111} {"train_loss": -5.631263732910156, "global_step": 46677, "epoch": 1111} {"train_loss": -5.6439619064331055, "global_step": 46678, "epoch": 1111} {"train_loss": -5.64107608795166, "global_step": 46679, "epoch": 1111} {"train_loss": -5.757597923278809, "global_step": 46680, "epoch": 1111} {"train_loss": -5.627498626708984, "global_step": 46681, "epoch": 1111} {"train_loss": -5.715872764587402, "global_step": 46682, "epoch": 1111} {"train_loss": -5.823381423950195, "global_step": 46683, "epoch": 1111} {"train_loss": -5.725447654724121, "global_step": 46684, "epoch": 1111} {"train_loss": -5.730828285217285, "global_step": 46685, "epoch": 1111} {"train_loss": -5.814121246337891, "global_step": 46686, "epoch": 1111} {"train_loss": -5.719966888427734, "global_step": 46687, "epoch": 1111} {"train_loss": -5.783276557922363, "global_step": 46688, "epoch": 1111} {"train_loss": -5.672394752502441, "global_step": 46689, "epoch": 1111} {"train_loss": -5.656000137329102, "global_step": 46690, "epoch": 1111} {"train_loss": -5.651729583740234, "global_step": 46691, "epoch": 1111} {"train_loss": -5.619659423828125, "global_step": 46692, "epoch": 1111} {"train_loss": -5.672473430633545, "global_step": 46693, "epoch": 1111} {"train_loss": -5.75262975692749, "global_step": 46694, "epoch": 1111} {"train_loss": -5.671591281890869, "global_step": 46695, "epoch": 1111} {"train_loss": -5.587985992431641, "global_step": 46696, "epoch": 1111} {"train_loss": -5.714558124542236, "global_step": 46697, "epoch": 1111} {"train_loss": -5.731929302215576, "global_step": 46698, "epoch": 1111} {"train_loss": -5.675803184509277, "global_step": 46699, "epoch": 1111} {"train_loss": -5.743860244750977, "global_step": 46700, "epoch": 1111} {"train_loss": -5.657382488250732, "global_step": 46701, "epoch": 1111} {"train_loss": -5.591132164001465, "global_step": 46702, "epoch": 1111} {"train_loss": -5.69903412319365, "global_step": 46703, "epoch": 1111, "val_loss": 67044.203125} {"train_loss": -5.603783130645752, "global_step": 46704, "epoch": 1112} {"train_loss": -5.830534934997559, "global_step": 46705, "epoch": 1112} {"train_loss": -5.827086925506592, "global_step": 46706, "epoch": 1112} {"train_loss": -5.547937870025635, "global_step": 46707, "epoch": 1112} {"train_loss": -5.673516273498535, "global_step": 46708, "epoch": 1112} {"train_loss": -5.555412292480469, "global_step": 46709, "epoch": 1112} {"train_loss": -5.754611968994141, "global_step": 46710, "epoch": 1112} {"train_loss": -5.642046928405762, "global_step": 46711, "epoch": 1112} {"train_loss": -5.593249320983887, "global_step": 46712, "epoch": 1112} {"train_loss": -5.626428604125977, "global_step": 46713, "epoch": 1112} {"train_loss": -5.451408386230469, "global_step": 46714, "epoch": 1112} {"train_loss": -5.548696517944336, "global_step": 46715, "epoch": 1112} {"train_loss": -5.521505355834961, "global_step": 46716, "epoch": 1112} {"train_loss": -5.5482282638549805, "global_step": 46717, "epoch": 1112} {"train_loss": -5.6851606369018555, "global_step": 46718, "epoch": 1112} {"train_loss": -5.724884986877441, "global_step": 46719, "epoch": 1112} {"train_loss": -5.6786603927612305, "global_step": 46720, "epoch": 1112} {"train_loss": -5.635138034820557, "global_step": 46721, "epoch": 1112} {"train_loss": -5.6060967445373535, "global_step": 46722, "epoch": 1112} {"train_loss": -5.563716888427734, "global_step": 46723, "epoch": 1112} {"train_loss": -5.621431827545166, "global_step": 46724, "epoch": 1112} {"train_loss": -5.545029640197754, "global_step": 46725, "epoch": 1112} {"train_loss": -5.5754780769348145, "global_step": 46726, "epoch": 1112} {"train_loss": -5.62277889251709, "global_step": 46727, "epoch": 1112} {"train_loss": -5.800906181335449, "global_step": 46728, "epoch": 1112} {"train_loss": -5.514618873596191, "global_step": 46729, "epoch": 1112} {"train_loss": -5.550187110900879, "global_step": 46730, "epoch": 1112} {"train_loss": -5.690344333648682, "global_step": 46731, "epoch": 1112} {"train_loss": -5.6544647216796875, "global_step": 46732, "epoch": 1112} {"train_loss": -5.663161754608154, "global_step": 46733, "epoch": 1112} {"train_loss": -5.625080108642578, "global_step": 46734, "epoch": 1112} {"train_loss": -5.752889156341553, "global_step": 46735, "epoch": 1112} {"train_loss": -5.563482284545898, "global_step": 46736, "epoch": 1112} {"train_loss": -5.637601852416992, "global_step": 46737, "epoch": 1112} {"train_loss": -5.627945899963379, "global_step": 46738, "epoch": 1112} {"train_loss": -5.795961380004883, "global_step": 46739, "epoch": 1112} {"train_loss": -5.641326904296875, "global_step": 46740, "epoch": 1112} {"train_loss": -5.593080520629883, "global_step": 46741, "epoch": 1112} {"train_loss": -5.691573619842529, "global_step": 46742, "epoch": 1112} {"train_loss": -5.695728302001953, "global_step": 46743, "epoch": 1112} {"train_loss": -5.773792743682861, "global_step": 46744, "epoch": 1112} {"train_loss": -5.63988318897429, "global_step": 46745, "epoch": 1112, "val_loss": 65979.7578125} {"train_loss": -5.746744155883789, "global_step": 46746, "epoch": 1113} {"train_loss": -5.474118232727051, "global_step": 46747, "epoch": 1113} {"train_loss": -5.716327667236328, "global_step": 46748, "epoch": 1113} {"train_loss": -5.634919166564941, "global_step": 46749, "epoch": 1113} {"train_loss": -5.644808292388916, "global_step": 46750, "epoch": 1113} {"train_loss": -5.709329605102539, "global_step": 46751, "epoch": 1113} {"train_loss": -5.585099220275879, "global_step": 46752, "epoch": 1113} {"train_loss": -5.7153401374816895, "global_step": 46753, "epoch": 1113} {"train_loss": -5.831595420837402, "global_step": 46754, "epoch": 1113} {"train_loss": -5.613382339477539, "global_step": 46755, "epoch": 1113} {"train_loss": -5.72579288482666, "global_step": 46756, "epoch": 1113} {"train_loss": -5.896895408630371, "global_step": 46757, "epoch": 1113} {"train_loss": -5.72364616394043, "global_step": 46758, "epoch": 1113} {"train_loss": -5.692209243774414, "global_step": 46759, "epoch": 1113} {"train_loss": -5.845721244812012, "global_step": 46760, "epoch": 1113} {"train_loss": -5.679683208465576, "global_step": 46761, "epoch": 1113} {"train_loss": -5.763848304748535, "global_step": 46762, "epoch": 1113} {"train_loss": -5.709329605102539, "global_step": 46763, "epoch": 1113} {"train_loss": -5.757210731506348, "global_step": 46764, "epoch": 1113} {"train_loss": -5.799232482910156, "global_step": 46765, "epoch": 1113} {"train_loss": -5.751330852508545, "global_step": 46766, "epoch": 1113} {"train_loss": -5.756280899047852, "global_step": 46767, "epoch": 1113} {"train_loss": -5.662895202636719, "global_step": 46768, "epoch": 1113} {"train_loss": -5.725634574890137, "global_step": 46769, "epoch": 1113} {"train_loss": -5.662838935852051, "global_step": 46770, "epoch": 1113} {"train_loss": -5.623187065124512, "global_step": 46771, "epoch": 1113} {"train_loss": -5.786606788635254, "global_step": 46772, "epoch": 1113} {"train_loss": -5.672631740570068, "global_step": 46773, "epoch": 1113} {"train_loss": -5.763749122619629, "global_step": 46774, "epoch": 1113} {"train_loss": -5.5816521644592285, "global_step": 46775, "epoch": 1113} {"train_loss": -5.7113752365112305, "global_step": 46776, "epoch": 1113} {"train_loss": -5.704501152038574, "global_step": 46777, "epoch": 1113} {"train_loss": -5.721766471862793, "global_step": 46778, "epoch": 1113} {"train_loss": -5.6516218185424805, "global_step": 46779, "epoch": 1113} {"train_loss": -5.680127143859863, "global_step": 46780, "epoch": 1113} {"train_loss": -5.629491806030273, "global_step": 46781, "epoch": 1113} {"train_loss": -5.763378143310547, "global_step": 46782, "epoch": 1113} {"train_loss": -5.803693771362305, "global_step": 46783, "epoch": 1113} {"train_loss": -5.67088508605957, "global_step": 46784, "epoch": 1113} {"train_loss": -5.684928894042969, "global_step": 46785, "epoch": 1113} {"train_loss": -5.673348426818848, "global_step": 46786, "epoch": 1113} {"train_loss": -5.706054721559797, "global_step": 46787, "epoch": 1113, "val_loss": 65970.7421875} {"train_loss": -5.756286144256592, "global_step": 46788, "epoch": 1114} {"train_loss": -5.652129650115967, "global_step": 46789, "epoch": 1114} {"train_loss": -5.810953140258789, "global_step": 46790, "epoch": 1114} {"train_loss": -5.669920444488525, "global_step": 46791, "epoch": 1114} {"train_loss": -5.623289585113525, "global_step": 46792, "epoch": 1114} {"train_loss": -5.807333946228027, "global_step": 46793, "epoch": 1114} {"train_loss": -5.663311958312988, "global_step": 46794, "epoch": 1114} {"train_loss": -5.620235443115234, "global_step": 46795, "epoch": 1114} {"train_loss": -5.736635208129883, "global_step": 46796, "epoch": 1114} {"train_loss": -5.805464744567871, "global_step": 46797, "epoch": 1114} {"train_loss": -5.898013591766357, "global_step": 46798, "epoch": 1114} {"train_loss": -5.724735260009766, "global_step": 46799, "epoch": 1114} {"train_loss": -5.633179664611816, "global_step": 46800, "epoch": 1114} {"train_loss": -5.590273380279541, "global_step": 46801, "epoch": 1114} {"train_loss": -5.78779411315918, "global_step": 46802, "epoch": 1114} {"train_loss": -5.624019145965576, "global_step": 46803, "epoch": 1114} {"train_loss": -5.716183185577393, "global_step": 46804, "epoch": 1114} {"train_loss": -5.6621503829956055, "global_step": 46805, "epoch": 1114} {"train_loss": -5.807028770446777, "global_step": 46806, "epoch": 1114} {"train_loss": -5.726465702056885, "global_step": 46807, "epoch": 1114} {"train_loss": -5.77303409576416, "global_step": 46808, "epoch": 1114} {"train_loss": -5.734562397003174, "global_step": 46809, "epoch": 1114} {"train_loss": -5.788852691650391, "global_step": 46810, "epoch": 1114} {"train_loss": -5.78303861618042, "global_step": 46811, "epoch": 1114} {"train_loss": -5.7088236808776855, "global_step": 46812, "epoch": 1114} {"train_loss": -5.618195533752441, "global_step": 46813, "epoch": 1114} {"train_loss": -5.704103946685791, "global_step": 46814, "epoch": 1114} {"train_loss": -5.762173652648926, "global_step": 46815, "epoch": 1114} {"train_loss": -5.792972564697266, "global_step": 46816, "epoch": 1114} {"train_loss": -5.672837734222412, "global_step": 46817, "epoch": 1114} {"train_loss": -5.7142486572265625, "global_step": 46818, "epoch": 1114} {"train_loss": -5.783691883087158, "global_step": 46819, "epoch": 1114} {"train_loss": -5.673559188842773, "global_step": 46820, "epoch": 1114} {"train_loss": -5.8010406494140625, "global_step": 46821, "epoch": 1114} {"train_loss": -5.625406265258789, "global_step": 46822, "epoch": 1114} {"train_loss": -5.741374969482422, "global_step": 46823, "epoch": 1114} {"train_loss": -5.650104999542236, "global_step": 46824, "epoch": 1114} {"train_loss": -5.673155307769775, "global_step": 46825, "epoch": 1114} {"train_loss": -5.741562843322754, "global_step": 46826, "epoch": 1114} {"train_loss": -5.802084922790527, "global_step": 46827, "epoch": 1114} {"train_loss": -5.70911979675293, "global_step": 46828, "epoch": 1114} {"train_loss": -5.720911605017526, "global_step": 46829, "epoch": 1114, "val_loss": 66061.5390625} {"train_loss": -5.871279716491699, "global_step": 46830, "epoch": 1115} {"train_loss": -5.803179740905762, "global_step": 46831, "epoch": 1115} {"train_loss": -5.677360534667969, "global_step": 46832, "epoch": 1115} {"train_loss": -5.736181735992432, "global_step": 46833, "epoch": 1115} {"train_loss": -5.771466255187988, "global_step": 46834, "epoch": 1115} {"train_loss": -5.7734479904174805, "global_step": 46835, "epoch": 1115} {"train_loss": -5.766691207885742, "global_step": 46836, "epoch": 1115} {"train_loss": -5.716359615325928, "global_step": 46837, "epoch": 1115} {"train_loss": -5.802859783172607, "global_step": 46838, "epoch": 1115} {"train_loss": -5.754574775695801, "global_step": 46839, "epoch": 1115} {"train_loss": -5.67236852645874, "global_step": 46840, "epoch": 1115} {"train_loss": -5.567143440246582, "global_step": 46841, "epoch": 1115} {"train_loss": -5.6822190284729, "global_step": 46842, "epoch": 1115} {"train_loss": -5.672365188598633, "global_step": 46843, "epoch": 1115} {"train_loss": -5.731757164001465, "global_step": 46844, "epoch": 1115} {"train_loss": -5.613633155822754, "global_step": 46845, "epoch": 1115} {"train_loss": -5.631711959838867, "global_step": 46846, "epoch": 1115} {"train_loss": -5.760008811950684, "global_step": 46847, "epoch": 1115} {"train_loss": -5.740001201629639, "global_step": 46848, "epoch": 1115} {"train_loss": -5.787827014923096, "global_step": 46849, "epoch": 1115} {"train_loss": -5.728856086730957, "global_step": 46850, "epoch": 1115} {"train_loss": -5.648524284362793, "global_step": 46851, "epoch": 1115} {"train_loss": -5.772252559661865, "global_step": 46852, "epoch": 1115} {"train_loss": -5.645585536956787, "global_step": 46853, "epoch": 1115} {"train_loss": -5.667190074920654, "global_step": 46854, "epoch": 1115} {"train_loss": -5.77911376953125, "global_step": 46855, "epoch": 1115} {"train_loss": -5.6783647537231445, "global_step": 46856, "epoch": 1115} {"train_loss": -5.718233108520508, "global_step": 46857, "epoch": 1115} {"train_loss": -5.60308837890625, "global_step": 46858, "epoch": 1115} {"train_loss": -5.671751976013184, "global_step": 46859, "epoch": 1115} {"train_loss": -5.7581939697265625, "global_step": 46860, "epoch": 1115} {"train_loss": -5.743323802947998, "global_step": 46861, "epoch": 1115} {"train_loss": -5.722945213317871, "global_step": 46862, "epoch": 1115} {"train_loss": -5.6717915534973145, "global_step": 46863, "epoch": 1115} {"train_loss": -5.786371231079102, "global_step": 46864, "epoch": 1115} {"train_loss": -5.630521774291992, "global_step": 46865, "epoch": 1115} {"train_loss": -5.612490177154541, "global_step": 46866, "epoch": 1115} {"train_loss": -5.738733768463135, "global_step": 46867, "epoch": 1115} {"train_loss": -5.851007461547852, "global_step": 46868, "epoch": 1115} {"train_loss": -5.844561576843262, "global_step": 46869, "epoch": 1115} {"train_loss": -5.741613388061523, "global_step": 46870, "epoch": 1115} {"train_loss": -5.72090204556783, "global_step": 46871, "epoch": 1115, "val_loss": 66395.7578125} {"train_loss": -5.685517311096191, "global_step": 46872, "epoch": 1116} {"train_loss": -5.7076497077941895, "global_step": 46873, "epoch": 1116} {"train_loss": -5.802488803863525, "global_step": 46874, "epoch": 1116} {"train_loss": -5.785229206085205, "global_step": 46875, "epoch": 1116} {"train_loss": -5.640820026397705, "global_step": 46876, "epoch": 1116} {"train_loss": -5.680579662322998, "global_step": 46877, "epoch": 1116} {"train_loss": -5.589103698730469, "global_step": 46878, "epoch": 1116} {"train_loss": -5.6388373374938965, "global_step": 46879, "epoch": 1116} {"train_loss": -5.615084648132324, "global_step": 46880, "epoch": 1116} {"train_loss": -5.632328033447266, "global_step": 46881, "epoch": 1116} {"train_loss": -5.7235517501831055, "global_step": 46882, "epoch": 1116} {"train_loss": -5.5887770652771, "global_step": 46883, "epoch": 1116} {"train_loss": -5.661388397216797, "global_step": 46884, "epoch": 1116} {"train_loss": -5.694543361663818, "global_step": 46885, "epoch": 1116} {"train_loss": -5.5652923583984375, "global_step": 46886, "epoch": 1116} {"train_loss": -5.775795936584473, "global_step": 46887, "epoch": 1116} {"train_loss": -5.646903038024902, "global_step": 46888, "epoch": 1116} {"train_loss": -5.750875473022461, "global_step": 46889, "epoch": 1116} {"train_loss": -5.556600093841553, "global_step": 46890, "epoch": 1116} {"train_loss": -5.639151573181152, "global_step": 46891, "epoch": 1116} {"train_loss": -5.675288200378418, "global_step": 46892, "epoch": 1116} {"train_loss": -5.755252838134766, "global_step": 46893, "epoch": 1116} {"train_loss": -5.7749834060668945, "global_step": 46894, "epoch": 1116} {"train_loss": -5.640316963195801, "global_step": 46895, "epoch": 1116} {"train_loss": -5.691758632659912, "global_step": 46896, "epoch": 1116} {"train_loss": -5.706274509429932, "global_step": 46897, "epoch": 1116} {"train_loss": -5.7785749435424805, "global_step": 46898, "epoch": 1116} {"train_loss": -5.6156816482543945, "global_step": 46899, "epoch": 1116} {"train_loss": -5.83635950088501, "global_step": 46900, "epoch": 1116} {"train_loss": -5.59969425201416, "global_step": 46901, "epoch": 1116} {"train_loss": -5.657928943634033, "global_step": 46902, "epoch": 1116} {"train_loss": -5.716938018798828, "global_step": 46903, "epoch": 1116} {"train_loss": -5.656622409820557, "global_step": 46904, "epoch": 1116} {"train_loss": -5.7535247802734375, "global_step": 46905, "epoch": 1116} {"train_loss": -5.712991714477539, "global_step": 46906, "epoch": 1116} {"train_loss": -5.7650957107543945, "global_step": 46907, "epoch": 1116} {"train_loss": -5.6142354011535645, "global_step": 46908, "epoch": 1116} {"train_loss": -5.761059761047363, "global_step": 46909, "epoch": 1116} {"train_loss": -5.736425876617432, "global_step": 46910, "epoch": 1116} {"train_loss": -5.7422990798950195, "global_step": 46911, "epoch": 1116} {"train_loss": -5.59871768951416, "global_step": 46912, "epoch": 1116} {"train_loss": -5.689231475194295, "global_step": 46913, "epoch": 1116, "val_loss": 66202.53125} {"train_loss": -5.738397598266602, "global_step": 46914, "epoch": 1117} {"train_loss": -5.690682411193848, "global_step": 46915, "epoch": 1117} {"train_loss": -5.701612949371338, "global_step": 46916, "epoch": 1117} {"train_loss": -5.728982925415039, "global_step": 46917, "epoch": 1117} {"train_loss": -5.72153902053833, "global_step": 46918, "epoch": 1117} {"train_loss": -5.75468635559082, "global_step": 46919, "epoch": 1117} {"train_loss": -5.658106803894043, "global_step": 46920, "epoch": 1117} {"train_loss": -5.830849647521973, "global_step": 46921, "epoch": 1117} {"train_loss": -5.747935771942139, "global_step": 46922, "epoch": 1117} {"train_loss": -5.686473846435547, "global_step": 46923, "epoch": 1117} {"train_loss": -5.789069175720215, "global_step": 46924, "epoch": 1117} {"train_loss": -5.656877517700195, "global_step": 46925, "epoch": 1117} {"train_loss": -5.80409049987793, "global_step": 46926, "epoch": 1117} {"train_loss": -5.679431438446045, "global_step": 46927, "epoch": 1117} {"train_loss": -5.747969627380371, "global_step": 46928, "epoch": 1117} {"train_loss": -5.684069633483887, "global_step": 46929, "epoch": 1117} {"train_loss": -5.858851432800293, "global_step": 46930, "epoch": 1117} {"train_loss": -5.714132308959961, "global_step": 46931, "epoch": 1117} {"train_loss": -5.591527938842773, "global_step": 46932, "epoch": 1117} {"train_loss": -5.699845314025879, "global_step": 46933, "epoch": 1117} {"train_loss": -5.7840776443481445, "global_step": 46934, "epoch": 1117} {"train_loss": -5.687702655792236, "global_step": 46935, "epoch": 1117} {"train_loss": -5.864866256713867, "global_step": 46936, "epoch": 1117} {"train_loss": -5.856707572937012, "global_step": 46937, "epoch": 1117} {"train_loss": -5.8029375076293945, "global_step": 46938, "epoch": 1117} {"train_loss": -5.675905704498291, "global_step": 46939, "epoch": 1117} {"train_loss": -5.8862762451171875, "global_step": 46940, "epoch": 1117} {"train_loss": -5.672723770141602, "global_step": 46941, "epoch": 1117} {"train_loss": -5.629282474517822, "global_step": 46942, "epoch": 1117} {"train_loss": -5.6470561027526855, "global_step": 46943, "epoch": 1117} {"train_loss": -5.771063804626465, "global_step": 46944, "epoch": 1117} {"train_loss": -5.750810146331787, "global_step": 46945, "epoch": 1117} {"train_loss": -5.686942100524902, "global_step": 46946, "epoch": 1117} {"train_loss": -5.8112688064575195, "global_step": 46947, "epoch": 1117} {"train_loss": -5.7199482917785645, "global_step": 46948, "epoch": 1117} {"train_loss": -5.8060736656188965, "global_step": 46949, "epoch": 1117} {"train_loss": -5.751061916351318, "global_step": 46950, "epoch": 1117} {"train_loss": -5.63580322265625, "global_step": 46951, "epoch": 1117} {"train_loss": -5.6844868659973145, "global_step": 46952, "epoch": 1117} {"train_loss": -5.820866107940674, "global_step": 46953, "epoch": 1117} {"train_loss": -5.6460418701171875, "global_step": 46954, "epoch": 1117} {"train_loss": -5.735053391683669, "global_step": 46955, "epoch": 1117, "val_loss": 66180.3046875} {"train_loss": -5.7358479499816895, "global_step": 46956, "epoch": 1118} {"train_loss": -5.687895774841309, "global_step": 46957, "epoch": 1118} {"train_loss": -5.770781517028809, "global_step": 46958, "epoch": 1118} {"train_loss": -5.880698204040527, "global_step": 46959, "epoch": 1118} {"train_loss": -5.701091766357422, "global_step": 46960, "epoch": 1118} {"train_loss": -5.61845064163208, "global_step": 46961, "epoch": 1118} {"train_loss": -5.663797378540039, "global_step": 46962, "epoch": 1118} {"train_loss": -5.78293514251709, "global_step": 46963, "epoch": 1118} {"train_loss": -5.623015880584717, "global_step": 46964, "epoch": 1118} {"train_loss": -5.788298606872559, "global_step": 46965, "epoch": 1118} {"train_loss": -5.779836654663086, "global_step": 46966, "epoch": 1118} {"train_loss": -5.7713141441345215, "global_step": 46967, "epoch": 1118} {"train_loss": -5.760904788970947, "global_step": 46968, "epoch": 1118} {"train_loss": -5.7447919845581055, "global_step": 46969, "epoch": 1118} {"train_loss": -5.835081100463867, "global_step": 46970, "epoch": 1118} {"train_loss": -5.716363906860352, "global_step": 46971, "epoch": 1118} {"train_loss": -5.687941551208496, "global_step": 46972, "epoch": 1118} {"train_loss": -5.809144020080566, "global_step": 46973, "epoch": 1118} {"train_loss": -5.690436363220215, "global_step": 46974, "epoch": 1118} {"train_loss": -5.756202697753906, "global_step": 46975, "epoch": 1118} {"train_loss": -5.695108413696289, "global_step": 46976, "epoch": 1118} {"train_loss": -5.583515644073486, "global_step": 46977, "epoch": 1118} {"train_loss": -5.753495693206787, "global_step": 46978, "epoch": 1118} {"train_loss": -5.720993995666504, "global_step": 46979, "epoch": 1118} {"train_loss": -5.769153118133545, "global_step": 46980, "epoch": 1118} {"train_loss": -5.683654308319092, "global_step": 46981, "epoch": 1118} {"train_loss": -5.701504707336426, "global_step": 46982, "epoch": 1118} {"train_loss": -5.626861572265625, "global_step": 46983, "epoch": 1118} {"train_loss": -5.606825828552246, "global_step": 46984, "epoch": 1118} {"train_loss": -5.720879554748535, "global_step": 46985, "epoch": 1118} {"train_loss": -5.775496482849121, "global_step": 46986, "epoch": 1118} {"train_loss": -5.7338151931762695, "global_step": 46987, "epoch": 1118} {"train_loss": -5.680521488189697, "global_step": 46988, "epoch": 1118} {"train_loss": -5.6345367431640625, "global_step": 46989, "epoch": 1118} {"train_loss": -5.747988700866699, "global_step": 46990, "epoch": 1118} {"train_loss": -5.607908248901367, "global_step": 46991, "epoch": 1118} {"train_loss": -5.745545387268066, "global_step": 46992, "epoch": 1118} {"train_loss": -5.645373344421387, "global_step": 46993, "epoch": 1118} {"train_loss": -5.726754188537598, "global_step": 46994, "epoch": 1118} {"train_loss": -5.787181854248047, "global_step": 46995, "epoch": 1118} {"train_loss": -5.663824081420898, "global_step": 46996, "epoch": 1118} {"train_loss": -5.71814657392956, "global_step": 46997, "epoch": 1118, "val_loss": 66171.9140625} {"train_loss": -5.651672840118408, "global_step": 46998, "epoch": 1119} {"train_loss": -5.778407096862793, "global_step": 46999, "epoch": 1119} {"train_loss": -5.704202175140381, "global_step": 47000, "epoch": 1119} {"train_loss": -5.769431114196777, "global_step": 47001, "epoch": 1119} {"train_loss": -5.841433525085449, "global_step": 47002, "epoch": 1119} {"train_loss": -5.769689559936523, "global_step": 47003, "epoch": 1119} {"train_loss": -5.746884822845459, "global_step": 47004, "epoch": 1119} {"train_loss": -5.666250228881836, "global_step": 47005, "epoch": 1119} {"train_loss": -5.682075500488281, "global_step": 47006, "epoch": 1119} {"train_loss": -5.695878982543945, "global_step": 47007, "epoch": 1119} {"train_loss": -5.759398460388184, "global_step": 47008, "epoch": 1119} {"train_loss": -5.75996208190918, "global_step": 47009, "epoch": 1119} {"train_loss": -5.592089653015137, "global_step": 47010, "epoch": 1119} {"train_loss": -5.71782922744751, "global_step": 47011, "epoch": 1119} {"train_loss": -5.786286354064941, "global_step": 47012, "epoch": 1119} {"train_loss": -5.767781734466553, "global_step": 47013, "epoch": 1119} {"train_loss": -5.621009826660156, "global_step": 47014, "epoch": 1119} {"train_loss": -5.807621955871582, "global_step": 47015, "epoch": 1119} {"train_loss": -5.797520637512207, "global_step": 47016, "epoch": 1119} {"train_loss": -5.81362771987915, "global_step": 47017, "epoch": 1119} {"train_loss": -5.742043495178223, "global_step": 47018, "epoch": 1119} {"train_loss": -5.826047897338867, "global_step": 47019, "epoch": 1119} {"train_loss": -5.846826076507568, "global_step": 47020, "epoch": 1119} {"train_loss": -5.75642204284668, "global_step": 47021, "epoch": 1119} {"train_loss": -5.792072296142578, "global_step": 47022, "epoch": 1119} {"train_loss": -5.737299919128418, "global_step": 47023, "epoch": 1119} {"train_loss": -5.781805992126465, "global_step": 47024, "epoch": 1119} {"train_loss": -5.798248291015625, "global_step": 47025, "epoch": 1119} {"train_loss": -5.799464702606201, "global_step": 47026, "epoch": 1119} {"train_loss": -5.825674057006836, "global_step": 47027, "epoch": 1119} {"train_loss": -5.795925140380859, "global_step": 47028, "epoch": 1119} {"train_loss": -5.676322937011719, "global_step": 47029, "epoch": 1119} {"train_loss": -5.817204475402832, "global_step": 47030, "epoch": 1119} {"train_loss": -5.693875312805176, "global_step": 47031, "epoch": 1119} {"train_loss": -5.79701566696167, "global_step": 47032, "epoch": 1119} {"train_loss": -5.658631324768066, "global_step": 47033, "epoch": 1119} {"train_loss": -5.708569526672363, "global_step": 47034, "epoch": 1119} {"train_loss": -5.656241416931152, "global_step": 47035, "epoch": 1119} {"train_loss": -5.660726547241211, "global_step": 47036, "epoch": 1119} {"train_loss": -5.687532424926758, "global_step": 47037, "epoch": 1119} {"train_loss": -5.6646833419799805, "global_step": 47038, "epoch": 1119} {"train_loss": -5.741701988946824, "global_step": 47039, "epoch": 1119, "val_loss": 65854.7734375} {"train_loss": -5.723189353942871, "global_step": 47040, "epoch": 1120} {"train_loss": -5.765009880065918, "global_step": 47041, "epoch": 1120} {"train_loss": -5.730119705200195, "global_step": 47042, "epoch": 1120} {"train_loss": -5.8192853927612305, "global_step": 47043, "epoch": 1120} {"train_loss": -5.651130676269531, "global_step": 47044, "epoch": 1120} {"train_loss": -5.79266357421875, "global_step": 47045, "epoch": 1120} {"train_loss": -5.706125259399414, "global_step": 47046, "epoch": 1120} {"train_loss": -5.796850204467773, "global_step": 47047, "epoch": 1120} {"train_loss": -5.871431350708008, "global_step": 47048, "epoch": 1120} {"train_loss": -5.7078399658203125, "global_step": 47049, "epoch": 1120} {"train_loss": -5.784755706787109, "global_step": 47050, "epoch": 1120} {"train_loss": -5.785280227661133, "global_step": 47051, "epoch": 1120} {"train_loss": -5.797484874725342, "global_step": 47052, "epoch": 1120} {"train_loss": -5.690310478210449, "global_step": 47053, "epoch": 1120} {"train_loss": -5.708730697631836, "global_step": 47054, "epoch": 1120} {"train_loss": -5.874416828155518, "global_step": 47055, "epoch": 1120} {"train_loss": -5.635880470275879, "global_step": 47056, "epoch": 1120} {"train_loss": -5.519023418426514, "global_step": 47057, "epoch": 1120} {"train_loss": -5.690650939941406, "global_step": 47058, "epoch": 1120} {"train_loss": -5.604951858520508, "global_step": 47059, "epoch": 1120} {"train_loss": -5.765654563903809, "global_step": 47060, "epoch": 1120} {"train_loss": -5.569287300109863, "global_step": 47061, "epoch": 1120} {"train_loss": -5.720418930053711, "global_step": 47062, "epoch": 1120} {"train_loss": -5.688022613525391, "global_step": 47063, "epoch": 1120} {"train_loss": -5.732429504394531, "global_step": 47064, "epoch": 1120} {"train_loss": -5.685531139373779, "global_step": 47065, "epoch": 1120} {"train_loss": -5.7389020919799805, "global_step": 47066, "epoch": 1120} {"train_loss": -5.589362144470215, "global_step": 47067, "epoch": 1120} {"train_loss": -5.747629165649414, "global_step": 47068, "epoch": 1120} {"train_loss": -5.7154741287231445, "global_step": 47069, "epoch": 1120} {"train_loss": -5.726265907287598, "global_step": 47070, "epoch": 1120} {"train_loss": -5.718133926391602, "global_step": 47071, "epoch": 1120} {"train_loss": -5.727615833282471, "global_step": 47072, "epoch": 1120} {"train_loss": -5.7473907470703125, "global_step": 47073, "epoch": 1120} {"train_loss": -5.73509407043457, "global_step": 47074, "epoch": 1120} {"train_loss": -5.818392276763916, "global_step": 47075, "epoch": 1120} {"train_loss": -5.598067283630371, "global_step": 47076, "epoch": 1120} {"train_loss": -5.703788757324219, "global_step": 47077, "epoch": 1120} {"train_loss": -5.770769119262695, "global_step": 47078, "epoch": 1120} {"train_loss": -5.778694152832031, "global_step": 47079, "epoch": 1120} {"train_loss": -5.668093681335449, "global_step": 47080, "epoch": 1120} {"train_loss": -5.718937465122768, "global_step": 47081, "epoch": 1120, "val_loss": 65877.2890625} {"train_loss": -5.652938365936279, "global_step": 47082, "epoch": 1121} {"train_loss": -5.742085933685303, "global_step": 47083, "epoch": 1121} {"train_loss": -5.634219169616699, "global_step": 47084, "epoch": 1121} {"train_loss": -5.689752578735352, "global_step": 47085, "epoch": 1121} {"train_loss": -5.7555012702941895, "global_step": 47086, "epoch": 1121} {"train_loss": -5.696585655212402, "global_step": 47087, "epoch": 1121} {"train_loss": -5.657263278961182, "global_step": 47088, "epoch": 1121} {"train_loss": -5.734794616699219, "global_step": 47089, "epoch": 1121} {"train_loss": -5.6317901611328125, "global_step": 47090, "epoch": 1121} {"train_loss": -5.620791435241699, "global_step": 47091, "epoch": 1121} {"train_loss": -5.834322452545166, "global_step": 47092, "epoch": 1121} {"train_loss": -5.678915977478027, "global_step": 47093, "epoch": 1121} {"train_loss": -5.672407150268555, "global_step": 47094, "epoch": 1121} {"train_loss": -5.698766231536865, "global_step": 47095, "epoch": 1121} {"train_loss": -5.643693447113037, "global_step": 47096, "epoch": 1121} {"train_loss": -5.723780632019043, "global_step": 47097, "epoch": 1121} {"train_loss": -5.693321228027344, "global_step": 47098, "epoch": 1121} {"train_loss": -5.750417232513428, "global_step": 47099, "epoch": 1121} {"train_loss": -5.709722995758057, "global_step": 47100, "epoch": 1121} {"train_loss": -5.50620698928833, "global_step": 47101, "epoch": 1121} {"train_loss": -5.76907205581665, "global_step": 47102, "epoch": 1121} {"train_loss": -5.452092170715332, "global_step": 47103, "epoch": 1121} {"train_loss": -5.616959571838379, "global_step": 47104, "epoch": 1121} {"train_loss": -5.491689205169678, "global_step": 47105, "epoch": 1121} {"train_loss": -5.592299461364746, "global_step": 47106, "epoch": 1121} {"train_loss": -5.722591400146484, "global_step": 47107, "epoch": 1121} {"train_loss": -5.6010847091674805, "global_step": 47108, "epoch": 1121} {"train_loss": -5.620901584625244, "global_step": 47109, "epoch": 1121} {"train_loss": -5.605265140533447, "global_step": 47110, "epoch": 1121} {"train_loss": -5.501338958740234, "global_step": 47111, "epoch": 1121} {"train_loss": -5.703843116760254, "global_step": 47112, "epoch": 1121} {"train_loss": -5.781059741973877, "global_step": 47113, "epoch": 1121} {"train_loss": -5.576010704040527, "global_step": 47114, "epoch": 1121} {"train_loss": -5.694563865661621, "global_step": 47115, "epoch": 1121} {"train_loss": -5.5950117111206055, "global_step": 47116, "epoch": 1121} {"train_loss": -5.671380996704102, "global_step": 47117, "epoch": 1121} {"train_loss": -5.800926208496094, "global_step": 47118, "epoch": 1121} {"train_loss": -5.6884765625, "global_step": 47119, "epoch": 1121} {"train_loss": -5.736109733581543, "global_step": 47120, "epoch": 1121} {"train_loss": -5.696047782897949, "global_step": 47121, "epoch": 1121} {"train_loss": -5.825482368469238, "global_step": 47122, "epoch": 1121} {"train_loss": -5.671729405721028, "global_step": 47123, "epoch": 1121, "val_loss": 66180.078125} {"train_loss": -5.715943336486816, "global_step": 47124, "epoch": 1122} {"train_loss": -5.726996421813965, "global_step": 47125, "epoch": 1122} {"train_loss": -5.721042633056641, "global_step": 47126, "epoch": 1122} {"train_loss": -5.6978654861450195, "global_step": 47127, "epoch": 1122} {"train_loss": -5.783875465393066, "global_step": 47128, "epoch": 1122} {"train_loss": -5.625943183898926, "global_step": 47129, "epoch": 1122} {"train_loss": -5.707388401031494, "global_step": 47130, "epoch": 1122} {"train_loss": -5.868031024932861, "global_step": 47131, "epoch": 1122} {"train_loss": -5.849220275878906, "global_step": 47132, "epoch": 1122} {"train_loss": -5.801117897033691, "global_step": 47133, "epoch": 1122} {"train_loss": -5.801340579986572, "global_step": 47134, "epoch": 1122} {"train_loss": -5.778082847595215, "global_step": 47135, "epoch": 1122} {"train_loss": -5.790923595428467, "global_step": 47136, "epoch": 1122} {"train_loss": -5.784259796142578, "global_step": 47137, "epoch": 1122} {"train_loss": -5.764579772949219, "global_step": 47138, "epoch": 1122} {"train_loss": -5.744400501251221, "global_step": 47139, "epoch": 1122} {"train_loss": -5.669238567352295, "global_step": 47140, "epoch": 1122} {"train_loss": -5.769993782043457, "global_step": 47141, "epoch": 1122} {"train_loss": -5.7333455085754395, "global_step": 47142, "epoch": 1122} {"train_loss": -5.569748878479004, "global_step": 47143, "epoch": 1122} {"train_loss": -5.776810169219971, "global_step": 47144, "epoch": 1122} {"train_loss": -5.614956855773926, "global_step": 47145, "epoch": 1122} {"train_loss": -5.822132110595703, "global_step": 47146, "epoch": 1122} {"train_loss": -5.739772319793701, "global_step": 47147, "epoch": 1122} {"train_loss": -5.70599365234375, "global_step": 47148, "epoch": 1122} {"train_loss": -5.734508037567139, "global_step": 47149, "epoch": 1122} {"train_loss": -5.667758464813232, "global_step": 47150, "epoch": 1122} {"train_loss": -5.671054363250732, "global_step": 47151, "epoch": 1122} {"train_loss": -5.698553085327148, "global_step": 47152, "epoch": 1122} {"train_loss": -5.657182693481445, "global_step": 47153, "epoch": 1122} {"train_loss": -5.746681213378906, "global_step": 47154, "epoch": 1122} {"train_loss": -5.651803970336914, "global_step": 47155, "epoch": 1122} {"train_loss": -5.609983444213867, "global_step": 47156, "epoch": 1122} {"train_loss": -5.636890411376953, "global_step": 47157, "epoch": 1122} {"train_loss": -5.745847225189209, "global_step": 47158, "epoch": 1122} {"train_loss": -5.789083003997803, "global_step": 47159, "epoch": 1122} {"train_loss": -5.739108562469482, "global_step": 47160, "epoch": 1122} {"train_loss": -5.75949764251709, "global_step": 47161, "epoch": 1122} {"train_loss": -5.7166876792907715, "global_step": 47162, "epoch": 1122} {"train_loss": -5.623219966888428, "global_step": 47163, "epoch": 1122} {"train_loss": -5.6924896240234375, "global_step": 47164, "epoch": 1122} {"train_loss": -5.722587596802485, "global_step": 47165, "epoch": 1122, "val_loss": 66043.609375} {"train_loss": -5.711214065551758, "global_step": 47166, "epoch": 1123} {"train_loss": -5.784199237823486, "global_step": 47167, "epoch": 1123} {"train_loss": -5.681853294372559, "global_step": 47168, "epoch": 1123} {"train_loss": -5.7388916015625, "global_step": 47169, "epoch": 1123} {"train_loss": -5.836007118225098, "global_step": 47170, "epoch": 1123} {"train_loss": -5.681514263153076, "global_step": 47171, "epoch": 1123} {"train_loss": -5.631309986114502, "global_step": 47172, "epoch": 1123} {"train_loss": -5.658523082733154, "global_step": 47173, "epoch": 1123} {"train_loss": -5.801623344421387, "global_step": 47174, "epoch": 1123} {"train_loss": -5.793886661529541, "global_step": 47175, "epoch": 1123} {"train_loss": -5.7765092849731445, "global_step": 47176, "epoch": 1123} {"train_loss": -5.786123752593994, "global_step": 47177, "epoch": 1123} {"train_loss": -5.719085693359375, "global_step": 47178, "epoch": 1123} {"train_loss": -5.7261199951171875, "global_step": 47179, "epoch": 1123} {"train_loss": -5.789436340332031, "global_step": 47180, "epoch": 1123} {"train_loss": -5.664103031158447, "global_step": 47181, "epoch": 1123} {"train_loss": -5.865443229675293, "global_step": 47182, "epoch": 1123} {"train_loss": -5.613661766052246, "global_step": 47183, "epoch": 1123} {"train_loss": -5.678255081176758, "global_step": 47184, "epoch": 1123} {"train_loss": -5.684149742126465, "global_step": 47185, "epoch": 1123} {"train_loss": -5.765177249908447, "global_step": 47186, "epoch": 1123} {"train_loss": -5.706184387207031, "global_step": 47187, "epoch": 1123} {"train_loss": -5.716456413269043, "global_step": 47188, "epoch": 1123} {"train_loss": -5.687026023864746, "global_step": 47189, "epoch": 1123} {"train_loss": -5.689450263977051, "global_step": 47190, "epoch": 1123} {"train_loss": -5.757316589355469, "global_step": 47191, "epoch": 1123} {"train_loss": -5.741355895996094, "global_step": 47192, "epoch": 1123} {"train_loss": -5.700103759765625, "global_step": 47193, "epoch": 1123} {"train_loss": -5.754769325256348, "global_step": 47194, "epoch": 1123} {"train_loss": -5.73818302154541, "global_step": 47195, "epoch": 1123} {"train_loss": -5.750307083129883, "global_step": 47196, "epoch": 1123} {"train_loss": -5.7651143074035645, "global_step": 47197, "epoch": 1123} {"train_loss": -5.835742950439453, "global_step": 47198, "epoch": 1123} {"train_loss": -5.637434959411621, "global_step": 47199, "epoch": 1123} {"train_loss": -5.818814754486084, "global_step": 47200, "epoch": 1123} {"train_loss": -5.766366004943848, "global_step": 47201, "epoch": 1123} {"train_loss": -5.877551078796387, "global_step": 47202, "epoch": 1123} {"train_loss": -5.677162170410156, "global_step": 47203, "epoch": 1123} {"train_loss": -5.734903335571289, "global_step": 47204, "epoch": 1123} {"train_loss": -5.715208053588867, "global_step": 47205, "epoch": 1123} {"train_loss": -5.81118106842041, "global_step": 47206, "epoch": 1123} {"train_loss": -5.736254419599261, "global_step": 47207, "epoch": 1123, "val_loss": 66442.25} {"train_loss": -5.732443332672119, "global_step": 47208, "epoch": 1124} {"train_loss": -5.846426010131836, "global_step": 47209, "epoch": 1124} {"train_loss": -5.636889457702637, "global_step": 47210, "epoch": 1124} {"train_loss": -5.726491928100586, "global_step": 47211, "epoch": 1124} {"train_loss": -5.799596309661865, "global_step": 47212, "epoch": 1124} {"train_loss": -5.717385292053223, "global_step": 47213, "epoch": 1124} {"train_loss": -5.747077465057373, "global_step": 47214, "epoch": 1124} {"train_loss": -5.786408424377441, "global_step": 47215, "epoch": 1124} {"train_loss": -5.756210803985596, "global_step": 47216, "epoch": 1124} {"train_loss": -5.681969165802002, "global_step": 47217, "epoch": 1124} {"train_loss": -5.689314842224121, "global_step": 47218, "epoch": 1124} {"train_loss": -5.734665870666504, "global_step": 47219, "epoch": 1124} {"train_loss": -5.735429763793945, "global_step": 47220, "epoch": 1124} {"train_loss": -5.6473493576049805, "global_step": 47221, "epoch": 1124} {"train_loss": -5.66292142868042, "global_step": 47222, "epoch": 1124} {"train_loss": -5.707344055175781, "global_step": 47223, "epoch": 1124} {"train_loss": -5.799761772155762, "global_step": 47224, "epoch": 1124} {"train_loss": -5.644460678100586, "global_step": 47225, "epoch": 1124} {"train_loss": -5.838266372680664, "global_step": 47226, "epoch": 1124} {"train_loss": -5.715386390686035, "global_step": 47227, "epoch": 1124} {"train_loss": -5.714634895324707, "global_step": 47228, "epoch": 1124} {"train_loss": -5.670262813568115, "global_step": 47229, "epoch": 1124} {"train_loss": -5.598688125610352, "global_step": 47230, "epoch": 1124} {"train_loss": -5.696732521057129, "global_step": 47231, "epoch": 1124} {"train_loss": -5.745272636413574, "global_step": 47232, "epoch": 1124} {"train_loss": -5.807290077209473, "global_step": 47233, "epoch": 1124} {"train_loss": -5.759243011474609, "global_step": 47234, "epoch": 1124} {"train_loss": -5.665814399719238, "global_step": 47235, "epoch": 1124} {"train_loss": -5.831792831420898, "global_step": 47236, "epoch": 1124} {"train_loss": -5.676535129547119, "global_step": 47237, "epoch": 1124} {"train_loss": -5.734363079071045, "global_step": 47238, "epoch": 1124} {"train_loss": -5.724795341491699, "global_step": 47239, "epoch": 1124} {"train_loss": -5.748533248901367, "global_step": 47240, "epoch": 1124} {"train_loss": -5.76313591003418, "global_step": 47241, "epoch": 1124} {"train_loss": -5.660585403442383, "global_step": 47242, "epoch": 1124} {"train_loss": -5.802677631378174, "global_step": 47243, "epoch": 1124} {"train_loss": -5.778630256652832, "global_step": 47244, "epoch": 1124} {"train_loss": -5.64829158782959, "global_step": 47245, "epoch": 1124} {"train_loss": -5.694790840148926, "global_step": 47246, "epoch": 1124} {"train_loss": -5.726195812225342, "global_step": 47247, "epoch": 1124} {"train_loss": -5.761119842529297, "global_step": 47248, "epoch": 1124} {"train_loss": -5.728132361457462, "global_step": 47249, "epoch": 1124, "val_loss": 65939.1328125} {"train_loss": -5.767809867858887, "global_step": 47250, "epoch": 1125} {"train_loss": -5.815285682678223, "global_step": 47251, "epoch": 1125} {"train_loss": -5.739160060882568, "global_step": 47252, "epoch": 1125} {"train_loss": -5.920599460601807, "global_step": 47253, "epoch": 1125} {"train_loss": -5.72930908203125, "global_step": 47254, "epoch": 1125} {"train_loss": -5.796064853668213, "global_step": 47255, "epoch": 1125} {"train_loss": -5.781278610229492, "global_step": 47256, "epoch": 1125} {"train_loss": -5.7511820793151855, "global_step": 47257, "epoch": 1125} {"train_loss": -5.771402359008789, "global_step": 47258, "epoch": 1125} {"train_loss": -5.84006404876709, "global_step": 47259, "epoch": 1125} {"train_loss": -5.829316139221191, "global_step": 47260, "epoch": 1125} {"train_loss": -5.783054351806641, "global_step": 47261, "epoch": 1125} {"train_loss": -5.697404861450195, "global_step": 47262, "epoch": 1125} {"train_loss": -5.7050371170043945, "global_step": 47263, "epoch": 1125} {"train_loss": -5.788773536682129, "global_step": 47264, "epoch": 1125} {"train_loss": -5.7122273445129395, "global_step": 47265, "epoch": 1125} {"train_loss": -5.792840957641602, "global_step": 47266, "epoch": 1125} {"train_loss": -5.925473213195801, "global_step": 47267, "epoch": 1125} {"train_loss": -5.7631683349609375, "global_step": 47268, "epoch": 1125} {"train_loss": -5.739632606506348, "global_step": 47269, "epoch": 1125} {"train_loss": -5.672114372253418, "global_step": 47270, "epoch": 1125} {"train_loss": -5.80702018737793, "global_step": 47271, "epoch": 1125} {"train_loss": -5.771129608154297, "global_step": 47272, "epoch": 1125} {"train_loss": -5.651617050170898, "global_step": 47273, "epoch": 1125} {"train_loss": -5.791535377502441, "global_step": 47274, "epoch": 1125} {"train_loss": -5.861317157745361, "global_step": 47275, "epoch": 1125} {"train_loss": -5.649641990661621, "global_step": 47276, "epoch": 1125} {"train_loss": -5.6876912117004395, "global_step": 47277, "epoch": 1125} {"train_loss": -5.836209297180176, "global_step": 47278, "epoch": 1125} {"train_loss": -5.676029205322266, "global_step": 47279, "epoch": 1125} {"train_loss": -5.732556343078613, "global_step": 47280, "epoch": 1125} {"train_loss": -5.665813446044922, "global_step": 47281, "epoch": 1125} {"train_loss": -5.790708541870117, "global_step": 47282, "epoch": 1125} {"train_loss": -5.7625532150268555, "global_step": 47283, "epoch": 1125} {"train_loss": -5.688444137573242, "global_step": 47284, "epoch": 1125} {"train_loss": -5.717564105987549, "global_step": 47285, "epoch": 1125} {"train_loss": -5.698248386383057, "global_step": 47286, "epoch": 1125} {"train_loss": -5.608049392700195, "global_step": 47287, "epoch": 1125} {"train_loss": -5.787578582763672, "global_step": 47288, "epoch": 1125} {"train_loss": -5.749617576599121, "global_step": 47289, "epoch": 1125} {"train_loss": -5.665984630584717, "global_step": 47290, "epoch": 1125} {"train_loss": -5.751201073328654, "global_step": 47291, "epoch": 1125, "val_loss": 66008.671875} {"train_loss": -5.753196716308594, "global_step": 47292, "epoch": 1126} {"train_loss": -5.731475830078125, "global_step": 47293, "epoch": 1126} {"train_loss": -5.777303695678711, "global_step": 47294, "epoch": 1126} {"train_loss": -5.651304721832275, "global_step": 47295, "epoch": 1126} {"train_loss": -5.726219177246094, "global_step": 47296, "epoch": 1126} {"train_loss": -5.787405490875244, "global_step": 47297, "epoch": 1126} {"train_loss": -5.733090400695801, "global_step": 47298, "epoch": 1126} {"train_loss": -5.661272048950195, "global_step": 47299, "epoch": 1126} {"train_loss": -5.6390814781188965, "global_step": 47300, "epoch": 1126} {"train_loss": -5.760262966156006, "global_step": 47301, "epoch": 1126} {"train_loss": -5.76397180557251, "global_step": 47302, "epoch": 1126} {"train_loss": -5.790223121643066, "global_step": 47303, "epoch": 1126} {"train_loss": -5.872681140899658, "global_step": 47304, "epoch": 1126} {"train_loss": -5.844443321228027, "global_step": 47305, "epoch": 1126} {"train_loss": -5.820640563964844, "global_step": 47306, "epoch": 1126} {"train_loss": -5.807986259460449, "global_step": 47307, "epoch": 1126} {"train_loss": -5.67384147644043, "global_step": 47308, "epoch": 1126} {"train_loss": -5.675284385681152, "global_step": 47309, "epoch": 1126} {"train_loss": -5.746969223022461, "global_step": 47310, "epoch": 1126} {"train_loss": -5.749917030334473, "global_step": 47311, "epoch": 1126} {"train_loss": -5.834910869598389, "global_step": 47312, "epoch": 1126} {"train_loss": -5.689472675323486, "global_step": 47313, "epoch": 1126} {"train_loss": -5.767587184906006, "global_step": 47314, "epoch": 1126} {"train_loss": -5.786746025085449, "global_step": 47315, "epoch": 1126} {"train_loss": -5.7471795082092285, "global_step": 47316, "epoch": 1126} {"train_loss": -5.730307102203369, "global_step": 47317, "epoch": 1126} {"train_loss": -5.694901466369629, "global_step": 47318, "epoch": 1126} {"train_loss": -5.734030246734619, "global_step": 47319, "epoch": 1126} {"train_loss": -5.710940837860107, "global_step": 47320, "epoch": 1126} {"train_loss": -5.805597305297852, "global_step": 47321, "epoch": 1126} {"train_loss": -5.699684143066406, "global_step": 47322, "epoch": 1126} {"train_loss": -5.757685661315918, "global_step": 47323, "epoch": 1126} {"train_loss": -5.607020378112793, "global_step": 47324, "epoch": 1126} {"train_loss": -5.73758602142334, "global_step": 47325, "epoch": 1126} {"train_loss": -5.654447555541992, "global_step": 47326, "epoch": 1126} {"train_loss": -5.5027008056640625, "global_step": 47327, "epoch": 1126} {"train_loss": -5.787625312805176, "global_step": 47328, "epoch": 1126} {"train_loss": -5.65330696105957, "global_step": 47329, "epoch": 1126} {"train_loss": -5.627257347106934, "global_step": 47330, "epoch": 1126} {"train_loss": -5.579957962036133, "global_step": 47331, "epoch": 1126} {"train_loss": -5.75634765625, "global_step": 47332, "epoch": 1126} {"train_loss": -5.724262419201079, "global_step": 47333, "epoch": 1126, "val_loss": 66643.3359375} {"train_loss": -5.705008506774902, "global_step": 47334, "epoch": 1127} {"train_loss": -5.639798164367676, "global_step": 47335, "epoch": 1127} {"train_loss": -5.613202095031738, "global_step": 47336, "epoch": 1127} {"train_loss": -5.58357048034668, "global_step": 47337, "epoch": 1127} {"train_loss": -5.748717308044434, "global_step": 47338, "epoch": 1127} {"train_loss": -5.800191402435303, "global_step": 47339, "epoch": 1127} {"train_loss": -5.712051868438721, "global_step": 47340, "epoch": 1127} {"train_loss": -5.638561725616455, "global_step": 47341, "epoch": 1127} {"train_loss": -5.623757839202881, "global_step": 47342, "epoch": 1127} {"train_loss": -5.6631011962890625, "global_step": 47343, "epoch": 1127} {"train_loss": -5.647583484649658, "global_step": 47344, "epoch": 1127} {"train_loss": -5.8243231773376465, "global_step": 47345, "epoch": 1127} {"train_loss": -5.669544219970703, "global_step": 47346, "epoch": 1127} {"train_loss": -5.69891357421875, "global_step": 47347, "epoch": 1127} {"train_loss": -5.766144752502441, "global_step": 47348, "epoch": 1127} {"train_loss": -5.839399814605713, "global_step": 47349, "epoch": 1127} {"train_loss": -5.681070327758789, "global_step": 47350, "epoch": 1127} {"train_loss": -5.705348014831543, "global_step": 47351, "epoch": 1127} {"train_loss": -5.733822822570801, "global_step": 47352, "epoch": 1127} {"train_loss": -5.719420433044434, "global_step": 47353, "epoch": 1127} {"train_loss": -5.816939830780029, "global_step": 47354, "epoch": 1127} {"train_loss": -5.750612258911133, "global_step": 47355, "epoch": 1127} {"train_loss": -5.79262638092041, "global_step": 47356, "epoch": 1127} {"train_loss": -5.739588737487793, "global_step": 47357, "epoch": 1127} {"train_loss": -5.821005344390869, "global_step": 47358, "epoch": 1127} {"train_loss": -5.675162315368652, "global_step": 47359, "epoch": 1127} {"train_loss": -5.743932723999023, "global_step": 47360, "epoch": 1127} {"train_loss": -5.717132091522217, "global_step": 47361, "epoch": 1127} {"train_loss": -5.707822322845459, "global_step": 47362, "epoch": 1127} {"train_loss": -5.605233192443848, "global_step": 47363, "epoch": 1127} {"train_loss": -5.737209320068359, "global_step": 47364, "epoch": 1127} {"train_loss": -5.787382125854492, "global_step": 47365, "epoch": 1127} {"train_loss": -5.828178405761719, "global_step": 47366, "epoch": 1127} {"train_loss": -5.679295539855957, "global_step": 47367, "epoch": 1127} {"train_loss": -5.662468910217285, "global_step": 47368, "epoch": 1127} {"train_loss": -5.706782341003418, "global_step": 47369, "epoch": 1127} {"train_loss": -5.791169166564941, "global_step": 47370, "epoch": 1127} {"train_loss": -5.6913228034973145, "global_step": 47371, "epoch": 1127} {"train_loss": -5.579639911651611, "global_step": 47372, "epoch": 1127} {"train_loss": -5.689343452453613, "global_step": 47373, "epoch": 1127} {"train_loss": -5.7549543380737305, "global_step": 47374, "epoch": 1127} {"train_loss": -5.710547095253354, "global_step": 47375, "epoch": 1127, "val_loss": 66104.015625} {"train_loss": -5.671566963195801, "global_step": 47376, "epoch": 1128} {"train_loss": -5.678916931152344, "global_step": 47377, "epoch": 1128} {"train_loss": -5.676835060119629, "global_step": 47378, "epoch": 1128} {"train_loss": -5.5699028968811035, "global_step": 47379, "epoch": 1128} {"train_loss": -5.669144630432129, "global_step": 47380, "epoch": 1128} {"train_loss": -5.6770219802856445, "global_step": 47381, "epoch": 1128} {"train_loss": -5.715950965881348, "global_step": 47382, "epoch": 1128} {"train_loss": -5.7017107009887695, "global_step": 47383, "epoch": 1128} {"train_loss": -5.614981651306152, "global_step": 47384, "epoch": 1128} {"train_loss": -5.6624274253845215, "global_step": 47385, "epoch": 1128} {"train_loss": -5.656620025634766, "global_step": 47386, "epoch": 1128} {"train_loss": -5.670139312744141, "global_step": 47387, "epoch": 1128} {"train_loss": -5.749054431915283, "global_step": 47388, "epoch": 1128} {"train_loss": -5.600184440612793, "global_step": 47389, "epoch": 1128} {"train_loss": -5.7577056884765625, "global_step": 47390, "epoch": 1128} {"train_loss": -5.6467084884643555, "global_step": 47391, "epoch": 1128} {"train_loss": -5.563509941101074, "global_step": 47392, "epoch": 1128} {"train_loss": -5.6704206466674805, "global_step": 47393, "epoch": 1128} {"train_loss": -5.586604118347168, "global_step": 47394, "epoch": 1128} {"train_loss": -5.626819610595703, "global_step": 47395, "epoch": 1128} {"train_loss": -5.61652946472168, "global_step": 47396, "epoch": 1128} {"train_loss": -5.761350154876709, "global_step": 47397, "epoch": 1128} {"train_loss": -5.471651077270508, "global_step": 47398, "epoch": 1128} {"train_loss": -5.632491111755371, "global_step": 47399, "epoch": 1128} {"train_loss": -5.667085647583008, "global_step": 47400, "epoch": 1128} {"train_loss": -5.583261013031006, "global_step": 47401, "epoch": 1128} {"train_loss": -5.425267219543457, "global_step": 47402, "epoch": 1128} {"train_loss": -5.771491050720215, "global_step": 47403, "epoch": 1128} {"train_loss": -5.62650203704834, "global_step": 47404, "epoch": 1128} {"train_loss": -5.61319637298584, "global_step": 47405, "epoch": 1128} {"train_loss": -5.753176689147949, "global_step": 47406, "epoch": 1128} {"train_loss": -5.6465253829956055, "global_step": 47407, "epoch": 1128} {"train_loss": -5.6664042472839355, "global_step": 47408, "epoch": 1128} {"train_loss": -5.739995956420898, "global_step": 47409, "epoch": 1128} {"train_loss": -5.6592326164245605, "global_step": 47410, "epoch": 1128} {"train_loss": -5.614485740661621, "global_step": 47411, "epoch": 1128} {"train_loss": -5.630222320556641, "global_step": 47412, "epoch": 1128} {"train_loss": -5.674638271331787, "global_step": 47413, "epoch": 1128} {"train_loss": -5.7122626304626465, "global_step": 47414, "epoch": 1128} {"train_loss": -5.732264518737793, "global_step": 47415, "epoch": 1128} {"train_loss": -5.730047225952148, "global_step": 47416, "epoch": 1128} {"train_loss": -5.656538055056617, "global_step": 47417, "epoch": 1128, "val_loss": 66161.46875} {"train_loss": -5.7180304527282715, "global_step": 47418, "epoch": 1129} {"train_loss": -5.737038612365723, "global_step": 47419, "epoch": 1129} {"train_loss": -5.767469882965088, "global_step": 47420, "epoch": 1129} {"train_loss": -5.7187299728393555, "global_step": 47421, "epoch": 1129} {"train_loss": -5.7316999435424805, "global_step": 47422, "epoch": 1129} {"train_loss": -5.836353302001953, "global_step": 47423, "epoch": 1129} {"train_loss": -5.643890380859375, "global_step": 47424, "epoch": 1129} {"train_loss": -5.643240928649902, "global_step": 47425, "epoch": 1129} {"train_loss": -5.702917098999023, "global_step": 47426, "epoch": 1129} {"train_loss": -5.851414680480957, "global_step": 47427, "epoch": 1129} {"train_loss": -5.633317947387695, "global_step": 47428, "epoch": 1129} {"train_loss": -5.704891204833984, "global_step": 47429, "epoch": 1129} {"train_loss": -5.7012248039245605, "global_step": 47430, "epoch": 1129} {"train_loss": -5.7135443687438965, "global_step": 47431, "epoch": 1129} {"train_loss": -5.72320032119751, "global_step": 47432, "epoch": 1129} {"train_loss": -5.740838050842285, "global_step": 47433, "epoch": 1129} {"train_loss": -5.725827693939209, "global_step": 47434, "epoch": 1129} {"train_loss": -5.878207206726074, "global_step": 47435, "epoch": 1129} {"train_loss": -5.56832218170166, "global_step": 47436, "epoch": 1129} {"train_loss": -5.6886162757873535, "global_step": 47437, "epoch": 1129} {"train_loss": -5.672405242919922, "global_step": 47438, "epoch": 1129} {"train_loss": -5.616602897644043, "global_step": 47439, "epoch": 1129} {"train_loss": -5.789356708526611, "global_step": 47440, "epoch": 1129} {"train_loss": -5.603967189788818, "global_step": 47441, "epoch": 1129} {"train_loss": -5.760459899902344, "global_step": 47442, "epoch": 1129} {"train_loss": -5.729131698608398, "global_step": 47443, "epoch": 1129} {"train_loss": -5.698750972747803, "global_step": 47444, "epoch": 1129} {"train_loss": -5.762863636016846, "global_step": 47445, "epoch": 1129} {"train_loss": -5.7409162521362305, "global_step": 47446, "epoch": 1129} {"train_loss": -5.653758525848389, "global_step": 47447, "epoch": 1129} {"train_loss": -5.717869758605957, "global_step": 47448, "epoch": 1129} {"train_loss": -5.514477729797363, "global_step": 47449, "epoch": 1129} {"train_loss": -5.725766181945801, "global_step": 47450, "epoch": 1129} {"train_loss": -5.55281925201416, "global_step": 47451, "epoch": 1129} {"train_loss": -5.683371067047119, "global_step": 47452, "epoch": 1129} {"train_loss": -5.749712944030762, "global_step": 47453, "epoch": 1129} {"train_loss": -5.675076007843018, "global_step": 47454, "epoch": 1129} {"train_loss": -5.730566501617432, "global_step": 47455, "epoch": 1129} {"train_loss": -5.691056251525879, "global_step": 47456, "epoch": 1129} {"train_loss": -5.861472129821777, "global_step": 47457, "epoch": 1129} {"train_loss": -5.748141288757324, "global_step": 47458, "epoch": 1129} {"train_loss": -5.709303787776402, "global_step": 47459, "epoch": 1129, "val_loss": 66026.515625} {"train_loss": -5.834966659545898, "global_step": 47460, "epoch": 1130} {"train_loss": -5.71820592880249, "global_step": 47461, "epoch": 1130} {"train_loss": -5.810711860656738, "global_step": 47462, "epoch": 1130} {"train_loss": -5.655123710632324, "global_step": 47463, "epoch": 1130} {"train_loss": -5.698541164398193, "global_step": 47464, "epoch": 1130} {"train_loss": -5.883631706237793, "global_step": 47465, "epoch": 1130} {"train_loss": -5.757735252380371, "global_step": 47466, "epoch": 1130} {"train_loss": -5.707767009735107, "global_step": 47467, "epoch": 1130} {"train_loss": -5.688175201416016, "global_step": 47468, "epoch": 1130} {"train_loss": -5.7318315505981445, "global_step": 47469, "epoch": 1130} {"train_loss": -5.713939666748047, "global_step": 47470, "epoch": 1130} {"train_loss": -5.590971946716309, "global_step": 47471, "epoch": 1130} {"train_loss": -5.821937561035156, "global_step": 47472, "epoch": 1130} {"train_loss": -5.815891742706299, "global_step": 47473, "epoch": 1130} {"train_loss": -5.547215461730957, "global_step": 47474, "epoch": 1130} {"train_loss": -5.754058837890625, "global_step": 47475, "epoch": 1130} {"train_loss": -5.676167011260986, "global_step": 47476, "epoch": 1130} {"train_loss": -5.731393814086914, "global_step": 47477, "epoch": 1130} {"train_loss": -5.7291412353515625, "global_step": 47478, "epoch": 1130} {"train_loss": -5.659635066986084, "global_step": 47479, "epoch": 1130} {"train_loss": -5.825414180755615, "global_step": 47480, "epoch": 1130} {"train_loss": -5.826859474182129, "global_step": 47481, "epoch": 1130} {"train_loss": -5.710402011871338, "global_step": 47482, "epoch": 1130} {"train_loss": -5.829692840576172, "global_step": 47483, "epoch": 1130} {"train_loss": -5.743374824523926, "global_step": 47484, "epoch": 1130} {"train_loss": -5.79298210144043, "global_step": 47485, "epoch": 1130} {"train_loss": -5.6069254875183105, "global_step": 47486, "epoch": 1130} {"train_loss": -5.778851509094238, "global_step": 47487, "epoch": 1130} {"train_loss": -5.692766189575195, "global_step": 47488, "epoch": 1130} {"train_loss": -5.583791732788086, "global_step": 47489, "epoch": 1130} {"train_loss": -5.753445625305176, "global_step": 47490, "epoch": 1130} {"train_loss": -5.525253772735596, "global_step": 47491, "epoch": 1130} {"train_loss": -5.595423698425293, "global_step": 47492, "epoch": 1130} {"train_loss": -5.7664079666137695, "global_step": 47493, "epoch": 1130} {"train_loss": -5.606317520141602, "global_step": 47494, "epoch": 1130} {"train_loss": -5.619240760803223, "global_step": 47495, "epoch": 1130} {"train_loss": -5.676584243774414, "global_step": 47496, "epoch": 1130} {"train_loss": -5.69285774230957, "global_step": 47497, "epoch": 1130} {"train_loss": -5.5863237380981445, "global_step": 47498, "epoch": 1130} {"train_loss": -5.73312520980835, "global_step": 47499, "epoch": 1130} {"train_loss": -5.740689277648926, "global_step": 47500, "epoch": 1130} {"train_loss": -5.71283179237729, "global_step": 47501, "epoch": 1130, "val_loss": 66108.015625} {"train_loss": -5.725650310516357, "global_step": 47502, "epoch": 1131} {"train_loss": -5.871554851531982, "global_step": 47503, "epoch": 1131} {"train_loss": -5.7158684730529785, "global_step": 47504, "epoch": 1131} {"train_loss": -5.84188985824585, "global_step": 47505, "epoch": 1131} {"train_loss": -5.694147109985352, "global_step": 47506, "epoch": 1131} {"train_loss": -5.684595584869385, "global_step": 47507, "epoch": 1131} {"train_loss": -5.741964340209961, "global_step": 47508, "epoch": 1131} {"train_loss": -5.7000412940979, "global_step": 47509, "epoch": 1131} {"train_loss": -5.794129371643066, "global_step": 47510, "epoch": 1131} {"train_loss": -5.80446195602417, "global_step": 47511, "epoch": 1131} {"train_loss": -5.689475059509277, "global_step": 47512, "epoch": 1131} {"train_loss": -5.74513053894043, "global_step": 47513, "epoch": 1131} {"train_loss": -5.812788963317871, "global_step": 47514, "epoch": 1131} {"train_loss": -5.674000263214111, "global_step": 47515, "epoch": 1131} {"train_loss": -5.696860313415527, "global_step": 47516, "epoch": 1131} {"train_loss": -5.713700771331787, "global_step": 47517, "epoch": 1131} {"train_loss": -5.768383026123047, "global_step": 47518, "epoch": 1131} {"train_loss": -5.708284378051758, "global_step": 47519, "epoch": 1131} {"train_loss": -5.706018924713135, "global_step": 47520, "epoch": 1131} {"train_loss": -5.821996212005615, "global_step": 47521, "epoch": 1131} {"train_loss": -5.6942644119262695, "global_step": 47522, "epoch": 1131} {"train_loss": -5.573728084564209, "global_step": 47523, "epoch": 1131} {"train_loss": -5.771546363830566, "global_step": 47524, "epoch": 1131} {"train_loss": -5.642298698425293, "global_step": 47525, "epoch": 1131} {"train_loss": -5.67722225189209, "global_step": 47526, "epoch": 1131} {"train_loss": -5.633164405822754, "global_step": 47527, "epoch": 1131} {"train_loss": -5.752367973327637, "global_step": 47528, "epoch": 1131} {"train_loss": -5.642881870269775, "global_step": 47529, "epoch": 1131} {"train_loss": -5.722967624664307, "global_step": 47530, "epoch": 1131} {"train_loss": -5.766296863555908, "global_step": 47531, "epoch": 1131} {"train_loss": -5.685482501983643, "global_step": 47532, "epoch": 1131} {"train_loss": -5.784883975982666, "global_step": 47533, "epoch": 1131} {"train_loss": -5.772580146789551, "global_step": 47534, "epoch": 1131} {"train_loss": -5.631749629974365, "global_step": 47535, "epoch": 1131} {"train_loss": -5.798477649688721, "global_step": 47536, "epoch": 1131} {"train_loss": -5.643743991851807, "global_step": 47537, "epoch": 1131} {"train_loss": -5.661818027496338, "global_step": 47538, "epoch": 1131} {"train_loss": -5.87225866317749, "global_step": 47539, "epoch": 1131} {"train_loss": -5.739460468292236, "global_step": 47540, "epoch": 1131} {"train_loss": -5.74842643737793, "global_step": 47541, "epoch": 1131} {"train_loss": -5.664023399353027, "global_step": 47542, "epoch": 1131} {"train_loss": -5.727217583429246, "global_step": 47543, "epoch": 1131, "val_loss": 66102.2890625} {"train_loss": -5.706166744232178, "global_step": 47544, "epoch": 1132} {"train_loss": -5.662137985229492, "global_step": 47545, "epoch": 1132} {"train_loss": -5.795818328857422, "global_step": 47546, "epoch": 1132} {"train_loss": -5.696511268615723, "global_step": 47547, "epoch": 1132} {"train_loss": -5.689204216003418, "global_step": 47548, "epoch": 1132} {"train_loss": -5.718969821929932, "global_step": 47549, "epoch": 1132} {"train_loss": -5.505908012390137, "global_step": 47550, "epoch": 1132} {"train_loss": -5.742903709411621, "global_step": 47551, "epoch": 1132} {"train_loss": -5.640627384185791, "global_step": 47552, "epoch": 1132} {"train_loss": -5.753008842468262, "global_step": 47553, "epoch": 1132} {"train_loss": -5.667425632476807, "global_step": 47554, "epoch": 1132} {"train_loss": -5.774904251098633, "global_step": 47555, "epoch": 1132} {"train_loss": -5.757079601287842, "global_step": 47556, "epoch": 1132} {"train_loss": -5.584262847900391, "global_step": 47557, "epoch": 1132} {"train_loss": -5.817461013793945, "global_step": 47558, "epoch": 1132} {"train_loss": -5.576819896697998, "global_step": 47559, "epoch": 1132} {"train_loss": -5.670201778411865, "global_step": 47560, "epoch": 1132} {"train_loss": -5.740675449371338, "global_step": 47561, "epoch": 1132} {"train_loss": -5.6989970207214355, "global_step": 47562, "epoch": 1132} {"train_loss": -5.763570785522461, "global_step": 47563, "epoch": 1132} {"train_loss": -5.710495948791504, "global_step": 47564, "epoch": 1132} {"train_loss": -5.727495193481445, "global_step": 47565, "epoch": 1132} {"train_loss": -5.7797064781188965, "global_step": 47566, "epoch": 1132} {"train_loss": -5.823432922363281, "global_step": 47567, "epoch": 1132} {"train_loss": -5.807343482971191, "global_step": 47568, "epoch": 1132} {"train_loss": -5.694064617156982, "global_step": 47569, "epoch": 1132} {"train_loss": -5.766909599304199, "global_step": 47570, "epoch": 1132} {"train_loss": -5.721126556396484, "global_step": 47571, "epoch": 1132} {"train_loss": -5.65625524520874, "global_step": 47572, "epoch": 1132} {"train_loss": -5.753875255584717, "global_step": 47573, "epoch": 1132} {"train_loss": -5.689842700958252, "global_step": 47574, "epoch": 1132} {"train_loss": -5.807279109954834, "global_step": 47575, "epoch": 1132} {"train_loss": -5.718925952911377, "global_step": 47576, "epoch": 1132} {"train_loss": -5.795905113220215, "global_step": 47577, "epoch": 1132} {"train_loss": -5.691346168518066, "global_step": 47578, "epoch": 1132} {"train_loss": -5.621996879577637, "global_step": 47579, "epoch": 1132} {"train_loss": -5.634890079498291, "global_step": 47580, "epoch": 1132} {"train_loss": -5.825057029724121, "global_step": 47581, "epoch": 1132} {"train_loss": -5.651416778564453, "global_step": 47582, "epoch": 1132} {"train_loss": -5.711965084075928, "global_step": 47583, "epoch": 1132} {"train_loss": -5.659292221069336, "global_step": 47584, "epoch": 1132} {"train_loss": -5.715095054535639, "global_step": 47585, "epoch": 1132, "val_loss": 66171.015625} {"train_loss": -5.709568977355957, "global_step": 47586, "epoch": 1133} {"train_loss": -5.724244117736816, "global_step": 47587, "epoch": 1133} {"train_loss": -5.82125997543335, "global_step": 47588, "epoch": 1133} {"train_loss": -5.752323627471924, "global_step": 47589, "epoch": 1133} {"train_loss": -5.730345249176025, "global_step": 47590, "epoch": 1133} {"train_loss": -5.700725555419922, "global_step": 47591, "epoch": 1133} {"train_loss": -5.656499862670898, "global_step": 47592, "epoch": 1133} {"train_loss": -5.827465057373047, "global_step": 47593, "epoch": 1133} {"train_loss": -5.653365135192871, "global_step": 47594, "epoch": 1133} {"train_loss": -5.7438859939575195, "global_step": 47595, "epoch": 1133} {"train_loss": -5.761567115783691, "global_step": 47596, "epoch": 1133} {"train_loss": -5.745547294616699, "global_step": 47597, "epoch": 1133} {"train_loss": -5.787659168243408, "global_step": 47598, "epoch": 1133} {"train_loss": -5.67555046081543, "global_step": 47599, "epoch": 1133} {"train_loss": -5.757308006286621, "global_step": 47600, "epoch": 1133} {"train_loss": -5.807798385620117, "global_step": 47601, "epoch": 1133} {"train_loss": -5.759934425354004, "global_step": 47602, "epoch": 1133} {"train_loss": -5.674731254577637, "global_step": 47603, "epoch": 1133} {"train_loss": -5.751429557800293, "global_step": 47604, "epoch": 1133} {"train_loss": -5.758254051208496, "global_step": 47605, "epoch": 1133} {"train_loss": -5.641359806060791, "global_step": 47606, "epoch": 1133} {"train_loss": -5.692104339599609, "global_step": 47607, "epoch": 1133} {"train_loss": -5.643704891204834, "global_step": 47608, "epoch": 1133} {"train_loss": -5.8094072341918945, "global_step": 47609, "epoch": 1133} {"train_loss": -5.580788612365723, "global_step": 47610, "epoch": 1133} {"train_loss": -5.656182289123535, "global_step": 47611, "epoch": 1133} {"train_loss": -5.564101219177246, "global_step": 47612, "epoch": 1133} {"train_loss": -5.884610176086426, "global_step": 47613, "epoch": 1133} {"train_loss": -5.723906517028809, "global_step": 47614, "epoch": 1133} {"train_loss": -5.714514255523682, "global_step": 47615, "epoch": 1133} {"train_loss": -5.671104431152344, "global_step": 47616, "epoch": 1133} {"train_loss": -5.705338954925537, "global_step": 47617, "epoch": 1133} {"train_loss": -5.586252212524414, "global_step": 47618, "epoch": 1133} {"train_loss": -5.7843241691589355, "global_step": 47619, "epoch": 1133} {"train_loss": -5.8998942375183105, "global_step": 47620, "epoch": 1133} {"train_loss": -5.763029098510742, "global_step": 47621, "epoch": 1133} {"train_loss": -5.697420120239258, "global_step": 47622, "epoch": 1133} {"train_loss": -5.604609489440918, "global_step": 47623, "epoch": 1133} {"train_loss": -5.81385612487793, "global_step": 47624, "epoch": 1133} {"train_loss": -5.674182891845703, "global_step": 47625, "epoch": 1133} {"train_loss": -5.649805068969727, "global_step": 47626, "epoch": 1133} {"train_loss": -5.7214240573701405, "global_step": 47627, "epoch": 1133, "val_loss": 65961.1640625} {"train_loss": -5.682404518127441, "global_step": 47628, "epoch": 1134} {"train_loss": -5.639760494232178, "global_step": 47629, "epoch": 1134} {"train_loss": -5.77046012878418, "global_step": 47630, "epoch": 1134} {"train_loss": -5.763686656951904, "global_step": 47631, "epoch": 1134} {"train_loss": -5.726450443267822, "global_step": 47632, "epoch": 1134} {"train_loss": -5.754746437072754, "global_step": 47633, "epoch": 1134} {"train_loss": -5.687500953674316, "global_step": 47634, "epoch": 1134} {"train_loss": -5.796145439147949, "global_step": 47635, "epoch": 1134} {"train_loss": -5.662858009338379, "global_step": 47636, "epoch": 1134} {"train_loss": -5.676663398742676, "global_step": 47637, "epoch": 1134} {"train_loss": -5.7872819900512695, "global_step": 47638, "epoch": 1134} {"train_loss": -5.7486066818237305, "global_step": 47639, "epoch": 1134} {"train_loss": -5.828251361846924, "global_step": 47640, "epoch": 1134} {"train_loss": -5.7899065017700195, "global_step": 47641, "epoch": 1134} {"train_loss": -5.762737274169922, "global_step": 47642, "epoch": 1134} {"train_loss": -5.749168872833252, "global_step": 47643, "epoch": 1134} {"train_loss": -5.719512939453125, "global_step": 47644, "epoch": 1134} {"train_loss": -5.631957054138184, "global_step": 47645, "epoch": 1134} {"train_loss": -5.685832500457764, "global_step": 47646, "epoch": 1134} {"train_loss": -5.687816619873047, "global_step": 47647, "epoch": 1134} {"train_loss": -5.788240432739258, "global_step": 47648, "epoch": 1134} {"train_loss": -5.778498649597168, "global_step": 47649, "epoch": 1134} {"train_loss": -5.797000885009766, "global_step": 47650, "epoch": 1134} {"train_loss": -5.794503211975098, "global_step": 47651, "epoch": 1134} {"train_loss": -5.635376930236816, "global_step": 47652, "epoch": 1134} {"train_loss": -5.731480121612549, "global_step": 47653, "epoch": 1134} {"train_loss": -5.681841850280762, "global_step": 47654, "epoch": 1134} {"train_loss": -5.703155040740967, "global_step": 47655, "epoch": 1134} {"train_loss": -5.660140037536621, "global_step": 47656, "epoch": 1134} {"train_loss": -5.728337287902832, "global_step": 47657, "epoch": 1134} {"train_loss": -5.699122428894043, "global_step": 47658, "epoch": 1134} {"train_loss": -5.710845947265625, "global_step": 47659, "epoch": 1134} {"train_loss": -5.634354591369629, "global_step": 47660, "epoch": 1134} {"train_loss": -5.7089691162109375, "global_step": 47661, "epoch": 1134} {"train_loss": -5.734696388244629, "global_step": 47662, "epoch": 1134} {"train_loss": -5.904110431671143, "global_step": 47663, "epoch": 1134} {"train_loss": -5.7667012214660645, "global_step": 47664, "epoch": 1134} {"train_loss": -5.640126705169678, "global_step": 47665, "epoch": 1134} {"train_loss": -5.684823036193848, "global_step": 47666, "epoch": 1134} {"train_loss": -5.781071662902832, "global_step": 47667, "epoch": 1134} {"train_loss": -5.683201789855957, "global_step": 47668, "epoch": 1134} {"train_loss": -5.72556749979655, "global_step": 47669, "epoch": 1134, "val_loss": 66128.9140625} {"train_loss": -5.651749610900879, "global_step": 47670, "epoch": 1135} {"train_loss": -5.724886417388916, "global_step": 47671, "epoch": 1135} {"train_loss": -5.508609771728516, "global_step": 47672, "epoch": 1135} {"train_loss": -5.649845123291016, "global_step": 47673, "epoch": 1135} {"train_loss": -5.739898681640625, "global_step": 47674, "epoch": 1135} {"train_loss": -5.764721393585205, "global_step": 47675, "epoch": 1135} {"train_loss": -5.770847797393799, "global_step": 47676, "epoch": 1135} {"train_loss": -5.825031280517578, "global_step": 47677, "epoch": 1135} {"train_loss": -5.832956314086914, "global_step": 47678, "epoch": 1135} {"train_loss": -5.816812515258789, "global_step": 47679, "epoch": 1135} {"train_loss": -5.732287406921387, "global_step": 47680, "epoch": 1135} {"train_loss": -5.795332908630371, "global_step": 47681, "epoch": 1135} {"train_loss": -5.871677875518799, "global_step": 47682, "epoch": 1135} {"train_loss": -5.600522994995117, "global_step": 47683, "epoch": 1135} {"train_loss": -5.658504009246826, "global_step": 47684, "epoch": 1135} {"train_loss": -5.7015061378479, "global_step": 47685, "epoch": 1135} {"train_loss": -5.825375556945801, "global_step": 47686, "epoch": 1135} {"train_loss": -5.647609710693359, "global_step": 47687, "epoch": 1135} {"train_loss": -5.726799488067627, "global_step": 47688, "epoch": 1135} {"train_loss": -5.782029151916504, "global_step": 47689, "epoch": 1135} {"train_loss": -5.80501127243042, "global_step": 47690, "epoch": 1135} {"train_loss": -5.762234687805176, "global_step": 47691, "epoch": 1135} {"train_loss": -5.6633453369140625, "global_step": 47692, "epoch": 1135} {"train_loss": -5.570116996765137, "global_step": 47693, "epoch": 1135} {"train_loss": -5.78734827041626, "global_step": 47694, "epoch": 1135} {"train_loss": -5.610327243804932, "global_step": 47695, "epoch": 1135} {"train_loss": -5.64024543762207, "global_step": 47696, "epoch": 1135} {"train_loss": -5.616939067840576, "global_step": 47697, "epoch": 1135} {"train_loss": -5.504591941833496, "global_step": 47698, "epoch": 1135} {"train_loss": -5.782895088195801, "global_step": 47699, "epoch": 1135} {"train_loss": -5.512690544128418, "global_step": 47700, "epoch": 1135} {"train_loss": -5.738138198852539, "global_step": 47701, "epoch": 1135} {"train_loss": -5.731550216674805, "global_step": 47702, "epoch": 1135} {"train_loss": -5.786541938781738, "global_step": 47703, "epoch": 1135} {"train_loss": -5.744311332702637, "global_step": 47704, "epoch": 1135} {"train_loss": -5.791560173034668, "global_step": 47705, "epoch": 1135} {"train_loss": -5.6762895584106445, "global_step": 47706, "epoch": 1135} {"train_loss": -5.835389137268066, "global_step": 47707, "epoch": 1135} {"train_loss": -5.705516815185547, "global_step": 47708, "epoch": 1135} {"train_loss": -5.721985340118408, "global_step": 47709, "epoch": 1135} {"train_loss": -5.663448333740234, "global_step": 47710, "epoch": 1135} {"train_loss": -5.71444144703093, "global_step": 47711, "epoch": 1135, "val_loss": 66053.4921875} {"train_loss": -5.75798225402832, "global_step": 47712, "epoch": 1136} {"train_loss": -5.7530364990234375, "global_step": 47713, "epoch": 1136} {"train_loss": -5.783139705657959, "global_step": 47714, "epoch": 1136} {"train_loss": -5.771634578704834, "global_step": 47715, "epoch": 1136} {"train_loss": -5.820913314819336, "global_step": 47716, "epoch": 1136} {"train_loss": -5.683534622192383, "global_step": 47717, "epoch": 1136} {"train_loss": -5.775887966156006, "global_step": 47718, "epoch": 1136} {"train_loss": -5.650425910949707, "global_step": 47719, "epoch": 1136} {"train_loss": -5.751949310302734, "global_step": 47720, "epoch": 1136} {"train_loss": -5.862922191619873, "global_step": 47721, "epoch": 1136} {"train_loss": -5.719770431518555, "global_step": 47722, "epoch": 1136} {"train_loss": -5.759583950042725, "global_step": 47723, "epoch": 1136} {"train_loss": -5.686720848083496, "global_step": 47724, "epoch": 1136} {"train_loss": -5.6769633293151855, "global_step": 47725, "epoch": 1136} {"train_loss": -5.653299808502197, "global_step": 47726, "epoch": 1136} {"train_loss": -5.700342655181885, "global_step": 47727, "epoch": 1136} {"train_loss": -5.740628242492676, "global_step": 47728, "epoch": 1136} {"train_loss": -5.744734764099121, "global_step": 47729, "epoch": 1136} {"train_loss": -5.70053243637085, "global_step": 47730, "epoch": 1136} {"train_loss": -5.714452743530273, "global_step": 47731, "epoch": 1136} {"train_loss": -5.693826675415039, "global_step": 47732, "epoch": 1136} {"train_loss": -5.6446661949157715, "global_step": 47733, "epoch": 1136} {"train_loss": -5.846137046813965, "global_step": 47734, "epoch": 1136} {"train_loss": -5.7644429206848145, "global_step": 47735, "epoch": 1136} {"train_loss": -5.749175071716309, "global_step": 47736, "epoch": 1136} {"train_loss": -5.695422172546387, "global_step": 47737, "epoch": 1136} {"train_loss": -5.755862712860107, "global_step": 47738, "epoch": 1136} {"train_loss": -5.788899898529053, "global_step": 47739, "epoch": 1136} {"train_loss": -5.75811767578125, "global_step": 47740, "epoch": 1136} {"train_loss": -5.631688117980957, "global_step": 47741, "epoch": 1136} {"train_loss": -5.946722030639648, "global_step": 47742, "epoch": 1136} {"train_loss": -5.775134086608887, "global_step": 47743, "epoch": 1136} {"train_loss": -5.762381076812744, "global_step": 47744, "epoch": 1136} {"train_loss": -5.741454124450684, "global_step": 47745, "epoch": 1136} {"train_loss": -5.699183464050293, "global_step": 47746, "epoch": 1136} {"train_loss": -5.775424003601074, "global_step": 47747, "epoch": 1136} {"train_loss": -5.770075798034668, "global_step": 47748, "epoch": 1136} {"train_loss": -5.636845588684082, "global_step": 47749, "epoch": 1136} {"train_loss": -5.7064995765686035, "global_step": 47750, "epoch": 1136} {"train_loss": -5.800043106079102, "global_step": 47751, "epoch": 1136} {"train_loss": -5.769738674163818, "global_step": 47752, "epoch": 1136} {"train_loss": -5.739140533265614, "global_step": 47753, "epoch": 1136, "val_loss": 65964.5859375} {"train_loss": -5.657876014709473, "global_step": 47754, "epoch": 1137} {"train_loss": -5.885444164276123, "global_step": 47755, "epoch": 1137} {"train_loss": -5.750299453735352, "global_step": 47756, "epoch": 1137} {"train_loss": -5.7263665199279785, "global_step": 47757, "epoch": 1137} {"train_loss": -5.730729103088379, "global_step": 47758, "epoch": 1137} {"train_loss": -5.730729103088379, "global_step": 47759, "epoch": 1137} {"train_loss": -5.636549472808838, "global_step": 47760, "epoch": 1137} {"train_loss": -5.647533416748047, "global_step": 47761, "epoch": 1137} {"train_loss": -5.696386337280273, "global_step": 47762, "epoch": 1137} {"train_loss": -5.769315242767334, "global_step": 47763, "epoch": 1137} {"train_loss": -5.714537620544434, "global_step": 47764, "epoch": 1137} {"train_loss": -5.666528224945068, "global_step": 47765, "epoch": 1137} {"train_loss": -5.812101364135742, "global_step": 47766, "epoch": 1137} {"train_loss": -5.71402645111084, "global_step": 47767, "epoch": 1137} {"train_loss": -5.829390048980713, "global_step": 47768, "epoch": 1137} {"train_loss": -5.719903469085693, "global_step": 47769, "epoch": 1137} {"train_loss": -5.720214366912842, "global_step": 47770, "epoch": 1137} {"train_loss": -5.7266950607299805, "global_step": 47771, "epoch": 1137} {"train_loss": -5.677578926086426, "global_step": 47772, "epoch": 1137} {"train_loss": -5.850916862487793, "global_step": 47773, "epoch": 1137} {"train_loss": -5.528099536895752, "global_step": 47774, "epoch": 1137} {"train_loss": -5.7315673828125, "global_step": 47775, "epoch": 1137} {"train_loss": -5.696063041687012, "global_step": 47776, "epoch": 1137} {"train_loss": -5.740144729614258, "global_step": 47777, "epoch": 1137} {"train_loss": -5.797161102294922, "global_step": 47778, "epoch": 1137} {"train_loss": -5.623376369476318, "global_step": 47779, "epoch": 1137} {"train_loss": -5.82878303527832, "global_step": 47780, "epoch": 1137} {"train_loss": -5.77133321762085, "global_step": 47781, "epoch": 1137} {"train_loss": -5.681671142578125, "global_step": 47782, "epoch": 1137} {"train_loss": -5.614176273345947, "global_step": 47783, "epoch": 1137} {"train_loss": -5.806239604949951, "global_step": 47784, "epoch": 1137} {"train_loss": -5.652368545532227, "global_step": 47785, "epoch": 1137} {"train_loss": -5.64979362487793, "global_step": 47786, "epoch": 1137} {"train_loss": -5.76561164855957, "global_step": 47787, "epoch": 1137} {"train_loss": -5.66607666015625, "global_step": 47788, "epoch": 1137} {"train_loss": -5.777732849121094, "global_step": 47789, "epoch": 1137} {"train_loss": -5.756985187530518, "global_step": 47790, "epoch": 1137} {"train_loss": -5.72100830078125, "global_step": 47791, "epoch": 1137} {"train_loss": -5.778348445892334, "global_step": 47792, "epoch": 1137} {"train_loss": -5.789083480834961, "global_step": 47793, "epoch": 1137} {"train_loss": -5.793580055236816, "global_step": 47794, "epoch": 1137} {"train_loss": -5.730220635732015, "global_step": 47795, "epoch": 1137, "val_loss": 65978.609375} {"train_loss": -5.606568336486816, "global_step": 47796, "epoch": 1138} {"train_loss": -5.800887584686279, "global_step": 47797, "epoch": 1138} {"train_loss": -5.612126350402832, "global_step": 47798, "epoch": 1138} {"train_loss": -5.611966609954834, "global_step": 47799, "epoch": 1138} {"train_loss": -5.8351216316223145, "global_step": 47800, "epoch": 1138} {"train_loss": -5.67130708694458, "global_step": 47801, "epoch": 1138} {"train_loss": -5.798484802246094, "global_step": 47802, "epoch": 1138} {"train_loss": -5.8516340255737305, "global_step": 47803, "epoch": 1138} {"train_loss": -5.711644172668457, "global_step": 47804, "epoch": 1138} {"train_loss": -5.700702667236328, "global_step": 47805, "epoch": 1138} {"train_loss": -5.774423599243164, "global_step": 47806, "epoch": 1138} {"train_loss": -5.639989376068115, "global_step": 47807, "epoch": 1138} {"train_loss": -5.8960795402526855, "global_step": 47808, "epoch": 1138} {"train_loss": -5.7544426918029785, "global_step": 47809, "epoch": 1138} {"train_loss": -5.781398296356201, "global_step": 47810, "epoch": 1138} {"train_loss": -5.776972770690918, "global_step": 47811, "epoch": 1138} {"train_loss": -5.524864196777344, "global_step": 47812, "epoch": 1138} {"train_loss": -5.711675643920898, "global_step": 47813, "epoch": 1138} {"train_loss": -5.664121150970459, "global_step": 47814, "epoch": 1138} {"train_loss": -5.680584907531738, "global_step": 47815, "epoch": 1138} {"train_loss": -5.695387840270996, "global_step": 47816, "epoch": 1138} {"train_loss": -5.760184288024902, "global_step": 47817, "epoch": 1138} {"train_loss": -5.7668232917785645, "global_step": 47818, "epoch": 1138} {"train_loss": -5.746695518493652, "global_step": 47819, "epoch": 1138} {"train_loss": -5.677896022796631, "global_step": 47820, "epoch": 1138} {"train_loss": -5.879487991333008, "global_step": 47821, "epoch": 1138} {"train_loss": -5.829468727111816, "global_step": 47822, "epoch": 1138} {"train_loss": -5.818001747131348, "global_step": 47823, "epoch": 1138} {"train_loss": -5.706912040710449, "global_step": 47824, "epoch": 1138} {"train_loss": -5.731380462646484, "global_step": 47825, "epoch": 1138} {"train_loss": -5.692137718200684, "global_step": 47826, "epoch": 1138} {"train_loss": -5.718421936035156, "global_step": 47827, "epoch": 1138} {"train_loss": -5.682192802429199, "global_step": 47828, "epoch": 1138} {"train_loss": -5.7839508056640625, "global_step": 47829, "epoch": 1138} {"train_loss": -5.712180137634277, "global_step": 47830, "epoch": 1138} {"train_loss": -5.670160293579102, "global_step": 47831, "epoch": 1138} {"train_loss": -5.889790058135986, "global_step": 47832, "epoch": 1138} {"train_loss": -5.8625946044921875, "global_step": 47833, "epoch": 1138} {"train_loss": -5.675230503082275, "global_step": 47834, "epoch": 1138} {"train_loss": -5.88775110244751, "global_step": 47835, "epoch": 1138} {"train_loss": -5.713588714599609, "global_step": 47836, "epoch": 1138} {"train_loss": -5.739951917103359, "global_step": 47837, "epoch": 1138, "val_loss": 65923.4453125} {"train_loss": -5.872953414916992, "global_step": 47838, "epoch": 1139} {"train_loss": -5.728268623352051, "global_step": 47839, "epoch": 1139} {"train_loss": -5.754570007324219, "global_step": 47840, "epoch": 1139} {"train_loss": -5.757735729217529, "global_step": 47841, "epoch": 1139} {"train_loss": -5.759714126586914, "global_step": 47842, "epoch": 1139} {"train_loss": -5.807845115661621, "global_step": 47843, "epoch": 1139} {"train_loss": -5.815762519836426, "global_step": 47844, "epoch": 1139} {"train_loss": -5.712743759155273, "global_step": 47845, "epoch": 1139} {"train_loss": -5.731529235839844, "global_step": 47846, "epoch": 1139} {"train_loss": -5.636561393737793, "global_step": 47847, "epoch": 1139} {"train_loss": -5.765100002288818, "global_step": 47848, "epoch": 1139} {"train_loss": -5.752328872680664, "global_step": 47849, "epoch": 1139} {"train_loss": -5.770233154296875, "global_step": 47850, "epoch": 1139} {"train_loss": -5.768436431884766, "global_step": 47851, "epoch": 1139} {"train_loss": -5.737051486968994, "global_step": 47852, "epoch": 1139} {"train_loss": -5.757236957550049, "global_step": 47853, "epoch": 1139} {"train_loss": -5.85651159286499, "global_step": 47854, "epoch": 1139} {"train_loss": -5.713665008544922, "global_step": 47855, "epoch": 1139} {"train_loss": -5.831177711486816, "global_step": 47856, "epoch": 1139} {"train_loss": -5.626035690307617, "global_step": 47857, "epoch": 1139} {"train_loss": -5.844613552093506, "global_step": 47858, "epoch": 1139} {"train_loss": -5.732198715209961, "global_step": 47859, "epoch": 1139} {"train_loss": -5.743656158447266, "global_step": 47860, "epoch": 1139} {"train_loss": -5.63637638092041, "global_step": 47861, "epoch": 1139} {"train_loss": -5.783357620239258, "global_step": 47862, "epoch": 1139} {"train_loss": -5.623108386993408, "global_step": 47863, "epoch": 1139} {"train_loss": -5.582250595092773, "global_step": 47864, "epoch": 1139} {"train_loss": -5.819753170013428, "global_step": 47865, "epoch": 1139} {"train_loss": -5.8464813232421875, "global_step": 47866, "epoch": 1139} {"train_loss": -5.848008155822754, "global_step": 47867, "epoch": 1139} {"train_loss": -5.633993625640869, "global_step": 47868, "epoch": 1139} {"train_loss": -5.617527961730957, "global_step": 47869, "epoch": 1139} {"train_loss": -5.771549701690674, "global_step": 47870, "epoch": 1139} {"train_loss": -5.647241592407227, "global_step": 47871, "epoch": 1139} {"train_loss": -5.7110395431518555, "global_step": 47872, "epoch": 1139} {"train_loss": -5.723963737487793, "global_step": 47873, "epoch": 1139} {"train_loss": -5.666114330291748, "global_step": 47874, "epoch": 1139} {"train_loss": -5.670378684997559, "global_step": 47875, "epoch": 1139} {"train_loss": -5.708568572998047, "global_step": 47876, "epoch": 1139} {"train_loss": -5.686356544494629, "global_step": 47877, "epoch": 1139} {"train_loss": -5.724390506744385, "global_step": 47878, "epoch": 1139} {"train_loss": -5.73617130234128, "global_step": 47879, "epoch": 1139, "val_loss": 66235.1640625} {"train_loss": -5.791842460632324, "global_step": 47880, "epoch": 1140} {"train_loss": -5.660508632659912, "global_step": 47881, "epoch": 1140} {"train_loss": -5.659888744354248, "global_step": 47882, "epoch": 1140} {"train_loss": -5.801492691040039, "global_step": 47883, "epoch": 1140} {"train_loss": -5.761033058166504, "global_step": 47884, "epoch": 1140} {"train_loss": -5.795418739318848, "global_step": 47885, "epoch": 1140} {"train_loss": -5.687668323516846, "global_step": 47886, "epoch": 1140} {"train_loss": -5.687243938446045, "global_step": 47887, "epoch": 1140} {"train_loss": -5.747730255126953, "global_step": 47888, "epoch": 1140} {"train_loss": -5.817534923553467, "global_step": 47889, "epoch": 1140} {"train_loss": -5.651371002197266, "global_step": 47890, "epoch": 1140} {"train_loss": -5.6619110107421875, "global_step": 47891, "epoch": 1140} {"train_loss": -5.766266345977783, "global_step": 47892, "epoch": 1140} {"train_loss": -5.680337905883789, "global_step": 47893, "epoch": 1140} {"train_loss": -5.818540096282959, "global_step": 47894, "epoch": 1140} {"train_loss": -5.77757453918457, "global_step": 47895, "epoch": 1140} {"train_loss": -5.7022199630737305, "global_step": 47896, "epoch": 1140} {"train_loss": -5.694289684295654, "global_step": 47897, "epoch": 1140} {"train_loss": -5.7778449058532715, "global_step": 47898, "epoch": 1140} {"train_loss": -5.683725357055664, "global_step": 47899, "epoch": 1140} {"train_loss": -5.626028060913086, "global_step": 47900, "epoch": 1140} {"train_loss": -5.743424892425537, "global_step": 47901, "epoch": 1140} {"train_loss": -5.804684638977051, "global_step": 47902, "epoch": 1140} {"train_loss": -5.737701416015625, "global_step": 47903, "epoch": 1140} {"train_loss": -5.813414096832275, "global_step": 47904, "epoch": 1140} {"train_loss": -5.7418904304504395, "global_step": 47905, "epoch": 1140} {"train_loss": -5.672171592712402, "global_step": 47906, "epoch": 1140} {"train_loss": -5.681357383728027, "global_step": 47907, "epoch": 1140} {"train_loss": -5.609264373779297, "global_step": 47908, "epoch": 1140} {"train_loss": -5.716750144958496, "global_step": 47909, "epoch": 1140} {"train_loss": -5.756094932556152, "global_step": 47910, "epoch": 1140} {"train_loss": -5.577834606170654, "global_step": 47911, "epoch": 1140} {"train_loss": -5.598882675170898, "global_step": 47912, "epoch": 1140} {"train_loss": -5.651062965393066, "global_step": 47913, "epoch": 1140} {"train_loss": -5.869522571563721, "global_step": 47914, "epoch": 1140} {"train_loss": -5.784963130950928, "global_step": 47915, "epoch": 1140} {"train_loss": -5.608828067779541, "global_step": 47916, "epoch": 1140} {"train_loss": -5.616273403167725, "global_step": 47917, "epoch": 1140} {"train_loss": -5.69696569442749, "global_step": 47918, "epoch": 1140} {"train_loss": -5.719920635223389, "global_step": 47919, "epoch": 1140} {"train_loss": -5.763689994812012, "global_step": 47920, "epoch": 1140} {"train_loss": -5.716340451013474, "global_step": 47921, "epoch": 1140, "val_loss": 66094.796875} {"train_loss": -5.799734115600586, "global_step": 47922, "epoch": 1141} {"train_loss": -5.645501136779785, "global_step": 47923, "epoch": 1141} {"train_loss": -5.732156753540039, "global_step": 47924, "epoch": 1141} {"train_loss": -5.738779544830322, "global_step": 47925, "epoch": 1141} {"train_loss": -5.804144859313965, "global_step": 47926, "epoch": 1141} {"train_loss": -5.679266929626465, "global_step": 47927, "epoch": 1141} {"train_loss": -5.751363754272461, "global_step": 47928, "epoch": 1141} {"train_loss": -5.748851776123047, "global_step": 47929, "epoch": 1141} {"train_loss": -5.656281471252441, "global_step": 47930, "epoch": 1141} {"train_loss": -5.761536598205566, "global_step": 47931, "epoch": 1141} {"train_loss": -5.773740768432617, "global_step": 47932, "epoch": 1141} {"train_loss": -5.798207759857178, "global_step": 47933, "epoch": 1141} {"train_loss": -5.770166873931885, "global_step": 47934, "epoch": 1141} {"train_loss": -5.726843357086182, "global_step": 47935, "epoch": 1141} {"train_loss": -5.724480628967285, "global_step": 47936, "epoch": 1141} {"train_loss": -5.697604179382324, "global_step": 47937, "epoch": 1141} {"train_loss": -5.736516952514648, "global_step": 47938, "epoch": 1141} {"train_loss": -5.833310127258301, "global_step": 47939, "epoch": 1141} {"train_loss": -5.716790199279785, "global_step": 47940, "epoch": 1141} {"train_loss": -5.685389518737793, "global_step": 47941, "epoch": 1141} {"train_loss": -5.840375900268555, "global_step": 47942, "epoch": 1141} {"train_loss": -5.656537055969238, "global_step": 47943, "epoch": 1141} {"train_loss": -5.78298282623291, "global_step": 47944, "epoch": 1141} {"train_loss": -5.79329776763916, "global_step": 47945, "epoch": 1141} {"train_loss": -5.782082557678223, "global_step": 47946, "epoch": 1141} {"train_loss": -5.777467250823975, "global_step": 47947, "epoch": 1141} {"train_loss": -5.7552289962768555, "global_step": 47948, "epoch": 1141} {"train_loss": -5.656915187835693, "global_step": 47949, "epoch": 1141} {"train_loss": -5.886878967285156, "global_step": 47950, "epoch": 1141} {"train_loss": -5.676469802856445, "global_step": 47951, "epoch": 1141} {"train_loss": -5.751260757446289, "global_step": 47952, "epoch": 1141} {"train_loss": -5.799382209777832, "global_step": 47953, "epoch": 1141} {"train_loss": -5.804483413696289, "global_step": 47954, "epoch": 1141} {"train_loss": -5.632185459136963, "global_step": 47955, "epoch": 1141} {"train_loss": -5.757048606872559, "global_step": 47956, "epoch": 1141} {"train_loss": -5.855954170227051, "global_step": 47957, "epoch": 1141} {"train_loss": -5.929995536804199, "global_step": 47958, "epoch": 1141} {"train_loss": -5.8277177810668945, "global_step": 47959, "epoch": 1141} {"train_loss": -5.644146919250488, "global_step": 47960, "epoch": 1141} {"train_loss": -5.789202690124512, "global_step": 47961, "epoch": 1141} {"train_loss": -5.628870010375977, "global_step": 47962, "epoch": 1141} {"train_loss": -5.751797346841721, "global_step": 47963, "epoch": 1141, "val_loss": 66076.953125} {"train_loss": -5.873902320861816, "global_step": 47964, "epoch": 1142} {"train_loss": -5.685340881347656, "global_step": 47965, "epoch": 1142} {"train_loss": -5.570084095001221, "global_step": 47966, "epoch": 1142} {"train_loss": -5.591907024383545, "global_step": 47967, "epoch": 1142} {"train_loss": -5.7202606201171875, "global_step": 47968, "epoch": 1142} {"train_loss": -5.622923851013184, "global_step": 47969, "epoch": 1142} {"train_loss": -5.7884111404418945, "global_step": 47970, "epoch": 1142} {"train_loss": -5.763637542724609, "global_step": 47971, "epoch": 1142} {"train_loss": -5.56773567199707, "global_step": 47972, "epoch": 1142} {"train_loss": -5.794681549072266, "global_step": 47973, "epoch": 1142} {"train_loss": -5.813168048858643, "global_step": 47974, "epoch": 1142} {"train_loss": -5.741886138916016, "global_step": 47975, "epoch": 1142} {"train_loss": -5.736145973205566, "global_step": 47976, "epoch": 1142} {"train_loss": -5.87032413482666, "global_step": 47977, "epoch": 1142} {"train_loss": -5.752226829528809, "global_step": 47978, "epoch": 1142} {"train_loss": -5.735528945922852, "global_step": 47979, "epoch": 1142} {"train_loss": -5.589321136474609, "global_step": 47980, "epoch": 1142} {"train_loss": -5.630812644958496, "global_step": 47981, "epoch": 1142} {"train_loss": -5.684467315673828, "global_step": 47982, "epoch": 1142} {"train_loss": -5.777864456176758, "global_step": 47983, "epoch": 1142} {"train_loss": -5.503822326660156, "global_step": 47984, "epoch": 1142} {"train_loss": -5.715739727020264, "global_step": 47985, "epoch": 1142} {"train_loss": -5.754572868347168, "global_step": 47986, "epoch": 1142} {"train_loss": -5.6280717849731445, "global_step": 47987, "epoch": 1142} {"train_loss": -5.770178318023682, "global_step": 47988, "epoch": 1142} {"train_loss": -5.701772689819336, "global_step": 47989, "epoch": 1142} {"train_loss": -5.65256404876709, "global_step": 47990, "epoch": 1142} {"train_loss": -5.712627410888672, "global_step": 47991, "epoch": 1142} {"train_loss": -5.676661491394043, "global_step": 47992, "epoch": 1142} {"train_loss": -5.791972637176514, "global_step": 47993, "epoch": 1142} {"train_loss": -5.749028205871582, "global_step": 47994, "epoch": 1142} {"train_loss": -5.794852256774902, "global_step": 47995, "epoch": 1142} {"train_loss": -5.702759742736816, "global_step": 47996, "epoch": 1142} {"train_loss": -5.751708984375, "global_step": 47997, "epoch": 1142} {"train_loss": -5.677400588989258, "global_step": 47998, "epoch": 1142} {"train_loss": -5.841475963592529, "global_step": 47999, "epoch": 1142} {"train_loss": -5.777992248535156, "global_step": 48000, "epoch": 1142} {"train_loss": -5.6524553298950195, "global_step": 48001, "epoch": 1142} {"train_loss": -5.7527289390563965, "global_step": 48002, "epoch": 1142} {"train_loss": -5.70161771774292, "global_step": 48003, "epoch": 1142} {"train_loss": -5.592989444732666, "global_step": 48004, "epoch": 1142} {"train_loss": -5.713062706447783, "global_step": 48005, "epoch": 1142, "val_loss": 65917.03125} {"train_loss": -5.712827205657959, "global_step": 48006, "epoch": 1143} {"train_loss": -5.737635135650635, "global_step": 48007, "epoch": 1143} {"train_loss": -5.707623481750488, "global_step": 48008, "epoch": 1143} {"train_loss": -5.6279706954956055, "global_step": 48009, "epoch": 1143} {"train_loss": -5.60511589050293, "global_step": 48010, "epoch": 1143} {"train_loss": -5.590731620788574, "global_step": 48011, "epoch": 1143} {"train_loss": -5.8186845779418945, "global_step": 48012, "epoch": 1143} {"train_loss": -5.6202073097229, "global_step": 48013, "epoch": 1143} {"train_loss": -5.586666107177734, "global_step": 48014, "epoch": 1143} {"train_loss": -5.656182289123535, "global_step": 48015, "epoch": 1143} {"train_loss": -5.477347373962402, "global_step": 48016, "epoch": 1143} {"train_loss": -5.586325645446777, "global_step": 48017, "epoch": 1143} {"train_loss": -5.450870037078857, "global_step": 48018, "epoch": 1143} {"train_loss": -5.646820068359375, "global_step": 48019, "epoch": 1143} {"train_loss": -5.675804138183594, "global_step": 48020, "epoch": 1143} {"train_loss": -5.559725761413574, "global_step": 48021, "epoch": 1143} {"train_loss": -5.611727714538574, "global_step": 48022, "epoch": 1143} {"train_loss": -5.722329616546631, "global_step": 48023, "epoch": 1143} {"train_loss": -5.489343643188477, "global_step": 48024, "epoch": 1143} {"train_loss": -5.596602439880371, "global_step": 48025, "epoch": 1143} {"train_loss": -5.609226226806641, "global_step": 48026, "epoch": 1143} {"train_loss": -5.693819999694824, "global_step": 48027, "epoch": 1143} {"train_loss": -5.633584976196289, "global_step": 48028, "epoch": 1143} {"train_loss": -5.624307155609131, "global_step": 48029, "epoch": 1143} {"train_loss": -5.648427963256836, "global_step": 48030, "epoch": 1143} {"train_loss": -5.750429153442383, "global_step": 48031, "epoch": 1143} {"train_loss": -5.624477386474609, "global_step": 48032, "epoch": 1143} {"train_loss": -5.762197017669678, "global_step": 48033, "epoch": 1143} {"train_loss": -5.666851043701172, "global_step": 48034, "epoch": 1143} {"train_loss": -5.728265762329102, "global_step": 48035, "epoch": 1143} {"train_loss": -5.605737209320068, "global_step": 48036, "epoch": 1143} {"train_loss": -5.873333930969238, "global_step": 48037, "epoch": 1143} {"train_loss": -5.731748580932617, "global_step": 48038, "epoch": 1143} {"train_loss": -5.655643463134766, "global_step": 48039, "epoch": 1143} {"train_loss": -5.651081562042236, "global_step": 48040, "epoch": 1143} {"train_loss": -5.600127696990967, "global_step": 48041, "epoch": 1143} {"train_loss": -5.791919708251953, "global_step": 48042, "epoch": 1143} {"train_loss": -5.7082366943359375, "global_step": 48043, "epoch": 1143} {"train_loss": -5.737476348876953, "global_step": 48044, "epoch": 1143} {"train_loss": -5.6772847175598145, "global_step": 48045, "epoch": 1143} {"train_loss": -5.651562690734863, "global_step": 48046, "epoch": 1143} {"train_loss": -5.659712757383074, "global_step": 48047, "epoch": 1143, "val_loss": 66155.03125} {"train_loss": -5.777814865112305, "global_step": 48048, "epoch": 1144} {"train_loss": -5.681650161743164, "global_step": 48049, "epoch": 1144} {"train_loss": -5.632307052612305, "global_step": 48050, "epoch": 1144} {"train_loss": -5.802338123321533, "global_step": 48051, "epoch": 1144} {"train_loss": -5.800457000732422, "global_step": 48052, "epoch": 1144} {"train_loss": -5.650644302368164, "global_step": 48053, "epoch": 1144} {"train_loss": -5.747621059417725, "global_step": 48054, "epoch": 1144} {"train_loss": -5.803436279296875, "global_step": 48055, "epoch": 1144} {"train_loss": -5.761845588684082, "global_step": 48056, "epoch": 1144} {"train_loss": -5.688442230224609, "global_step": 48057, "epoch": 1144} {"train_loss": -5.838042736053467, "global_step": 48058, "epoch": 1144} {"train_loss": -5.807392597198486, "global_step": 48059, "epoch": 1144} {"train_loss": -5.656405448913574, "global_step": 48060, "epoch": 1144} {"train_loss": -5.733554363250732, "global_step": 48061, "epoch": 1144} {"train_loss": -5.815553188323975, "global_step": 48062, "epoch": 1144} {"train_loss": -5.76470422744751, "global_step": 48063, "epoch": 1144} {"train_loss": -5.749385833740234, "global_step": 48064, "epoch": 1144} {"train_loss": -5.79246711730957, "global_step": 48065, "epoch": 1144} {"train_loss": -5.847165107727051, "global_step": 48066, "epoch": 1144} {"train_loss": -5.9166579246521, "global_step": 48067, "epoch": 1144} {"train_loss": -5.695772647857666, "global_step": 48068, "epoch": 1144} {"train_loss": -5.753302574157715, "global_step": 48069, "epoch": 1144} {"train_loss": -5.7736968994140625, "global_step": 48070, "epoch": 1144} {"train_loss": -5.700860023498535, "global_step": 48071, "epoch": 1144} {"train_loss": -5.669567108154297, "global_step": 48072, "epoch": 1144} {"train_loss": -5.755773067474365, "global_step": 48073, "epoch": 1144} {"train_loss": -5.641785621643066, "global_step": 48074, "epoch": 1144} {"train_loss": -5.6880784034729, "global_step": 48075, "epoch": 1144} {"train_loss": -5.768655776977539, "global_step": 48076, "epoch": 1144} {"train_loss": -5.716817855834961, "global_step": 48077, "epoch": 1144} {"train_loss": -5.678744316101074, "global_step": 48078, "epoch": 1144} {"train_loss": -5.828271865844727, "global_step": 48079, "epoch": 1144} {"train_loss": -5.692061424255371, "global_step": 48080, "epoch": 1144} {"train_loss": -5.654346466064453, "global_step": 48081, "epoch": 1144} {"train_loss": -5.496997833251953, "global_step": 48082, "epoch": 1144} {"train_loss": -5.795731067657471, "global_step": 48083, "epoch": 1144} {"train_loss": -5.581567764282227, "global_step": 48084, "epoch": 1144} {"train_loss": -5.695666790008545, "global_step": 48085, "epoch": 1144} {"train_loss": -5.758807182312012, "global_step": 48086, "epoch": 1144} {"train_loss": -5.727786540985107, "global_step": 48087, "epoch": 1144} {"train_loss": -5.811586380004883, "global_step": 48088, "epoch": 1144} {"train_loss": -5.734246776217506, "global_step": 48089, "epoch": 1144, "val_loss": 65809.828125} {"train_loss": -5.747869491577148, "global_step": 48090, "epoch": 1145} {"train_loss": -5.6533203125, "global_step": 48091, "epoch": 1145} {"train_loss": -5.80092716217041, "global_step": 48092, "epoch": 1145} {"train_loss": -5.679834365844727, "global_step": 48093, "epoch": 1145} {"train_loss": -5.67028284072876, "global_step": 48094, "epoch": 1145} {"train_loss": -5.718042373657227, "global_step": 48095, "epoch": 1145} {"train_loss": -5.69002103805542, "global_step": 48096, "epoch": 1145} {"train_loss": -5.780947685241699, "global_step": 48097, "epoch": 1145} {"train_loss": -5.743711471557617, "global_step": 48098, "epoch": 1145} {"train_loss": -5.798097133636475, "global_step": 48099, "epoch": 1145} {"train_loss": -5.687363147735596, "global_step": 48100, "epoch": 1145} {"train_loss": -5.689279556274414, "global_step": 48101, "epoch": 1145} {"train_loss": -5.694632053375244, "global_step": 48102, "epoch": 1145} {"train_loss": -5.832892894744873, "global_step": 48103, "epoch": 1145} {"train_loss": -5.704998016357422, "global_step": 48104, "epoch": 1145} {"train_loss": -5.6416096687316895, "global_step": 48105, "epoch": 1145} {"train_loss": -5.797633647918701, "global_step": 48106, "epoch": 1145} {"train_loss": -5.709355354309082, "global_step": 48107, "epoch": 1145} {"train_loss": -5.660731792449951, "global_step": 48108, "epoch": 1145} {"train_loss": -5.708253383636475, "global_step": 48109, "epoch": 1145} {"train_loss": -5.858285427093506, "global_step": 48110, "epoch": 1145} {"train_loss": -5.886527061462402, "global_step": 48111, "epoch": 1145} {"train_loss": -5.683239936828613, "global_step": 48112, "epoch": 1145} {"train_loss": -5.571537017822266, "global_step": 48113, "epoch": 1145} {"train_loss": -5.513024806976318, "global_step": 48114, "epoch": 1145} {"train_loss": -5.673133850097656, "global_step": 48115, "epoch": 1145} {"train_loss": -5.596787929534912, "global_step": 48116, "epoch": 1145} {"train_loss": -5.724515914916992, "global_step": 48117, "epoch": 1145} {"train_loss": -5.583755016326904, "global_step": 48118, "epoch": 1145} {"train_loss": -5.622487545013428, "global_step": 48119, "epoch": 1145} {"train_loss": -5.657493591308594, "global_step": 48120, "epoch": 1145} {"train_loss": -5.69635009765625, "global_step": 48121, "epoch": 1145} {"train_loss": -5.625331878662109, "global_step": 48122, "epoch": 1145} {"train_loss": -5.65070915222168, "global_step": 48123, "epoch": 1145} {"train_loss": -5.599233627319336, "global_step": 48124, "epoch": 1145} {"train_loss": -5.859524250030518, "global_step": 48125, "epoch": 1145} {"train_loss": -5.711554527282715, "global_step": 48126, "epoch": 1145} {"train_loss": -5.761120796203613, "global_step": 48127, "epoch": 1145} {"train_loss": -5.75039529800415, "global_step": 48128, "epoch": 1145} {"train_loss": -5.740286827087402, "global_step": 48129, "epoch": 1145} {"train_loss": -5.6238813400268555, "global_step": 48130, "epoch": 1145} {"train_loss": -5.702353227706182, "global_step": 48131, "epoch": 1145, "val_loss": 66364.328125} {"train_loss": -5.8328118324279785, "global_step": 48132, "epoch": 1146} {"train_loss": -5.673250198364258, "global_step": 48133, "epoch": 1146} {"train_loss": -5.706420421600342, "global_step": 48134, "epoch": 1146} {"train_loss": -5.786357879638672, "global_step": 48135, "epoch": 1146} {"train_loss": -5.659303665161133, "global_step": 48136, "epoch": 1146} {"train_loss": -5.851451873779297, "global_step": 48137, "epoch": 1146} {"train_loss": -5.552911758422852, "global_step": 48138, "epoch": 1146} {"train_loss": -5.697142124176025, "global_step": 48139, "epoch": 1146} {"train_loss": -5.553526401519775, "global_step": 48140, "epoch": 1146} {"train_loss": -5.7099103927612305, "global_step": 48141, "epoch": 1146} {"train_loss": -5.604608535766602, "global_step": 48142, "epoch": 1146} {"train_loss": -5.675100326538086, "global_step": 48143, "epoch": 1146} {"train_loss": -5.683737277984619, "global_step": 48144, "epoch": 1146} {"train_loss": -5.775771141052246, "global_step": 48145, "epoch": 1146} {"train_loss": -5.53049373626709, "global_step": 48146, "epoch": 1146} {"train_loss": -5.652430057525635, "global_step": 48147, "epoch": 1146} {"train_loss": -5.676310062408447, "global_step": 48148, "epoch": 1146} {"train_loss": -5.745200157165527, "global_step": 48149, "epoch": 1146} {"train_loss": -5.735816478729248, "global_step": 48150, "epoch": 1146} {"train_loss": -5.657509803771973, "global_step": 48151, "epoch": 1146} {"train_loss": -5.5854387283325195, "global_step": 48152, "epoch": 1146} {"train_loss": -5.688016414642334, "global_step": 48153, "epoch": 1146} {"train_loss": -5.696045875549316, "global_step": 48154, "epoch": 1146} {"train_loss": -5.745336055755615, "global_step": 48155, "epoch": 1146} {"train_loss": -5.71649169921875, "global_step": 48156, "epoch": 1146} {"train_loss": -5.743322372436523, "global_step": 48157, "epoch": 1146} {"train_loss": -5.713843822479248, "global_step": 48158, "epoch": 1146} {"train_loss": -5.7353925704956055, "global_step": 48159, "epoch": 1146} {"train_loss": -5.761256694793701, "global_step": 48160, "epoch": 1146} {"train_loss": -5.613298416137695, "global_step": 48161, "epoch": 1146} {"train_loss": -5.74176025390625, "global_step": 48162, "epoch": 1146} {"train_loss": -5.56107759475708, "global_step": 48163, "epoch": 1146} {"train_loss": -5.700449466705322, "global_step": 48164, "epoch": 1146} {"train_loss": -5.6911540031433105, "global_step": 48165, "epoch": 1146} {"train_loss": -5.678276062011719, "global_step": 48166, "epoch": 1146} {"train_loss": -5.719122886657715, "global_step": 48167, "epoch": 1146} {"train_loss": -5.73524284362793, "global_step": 48168, "epoch": 1146} {"train_loss": -5.655287265777588, "global_step": 48169, "epoch": 1146} {"train_loss": -5.847741603851318, "global_step": 48170, "epoch": 1146} {"train_loss": -5.709985733032227, "global_step": 48171, "epoch": 1146} {"train_loss": -5.793449401855469, "global_step": 48172, "epoch": 1146} {"train_loss": -5.697583141781035, "global_step": 48173, "epoch": 1146, "val_loss": 66331.328125} {"train_loss": -5.661866188049316, "global_step": 48174, "epoch": 1147} {"train_loss": -5.807873725891113, "global_step": 48175, "epoch": 1147} {"train_loss": -5.687257289886475, "global_step": 48176, "epoch": 1147} {"train_loss": -5.692930221557617, "global_step": 48177, "epoch": 1147} {"train_loss": -5.661454200744629, "global_step": 48178, "epoch": 1147} {"train_loss": -5.6551690101623535, "global_step": 48179, "epoch": 1147} {"train_loss": -5.779213905334473, "global_step": 48180, "epoch": 1147} {"train_loss": -5.711105823516846, "global_step": 48181, "epoch": 1147} {"train_loss": -5.732233047485352, "global_step": 48182, "epoch": 1147} {"train_loss": -5.677123069763184, "global_step": 48183, "epoch": 1147} {"train_loss": -5.716876029968262, "global_step": 48184, "epoch": 1147} {"train_loss": -5.777110576629639, "global_step": 48185, "epoch": 1147} {"train_loss": -5.781919479370117, "global_step": 48186, "epoch": 1147} {"train_loss": -5.648076057434082, "global_step": 48187, "epoch": 1147} {"train_loss": -5.6546549797058105, "global_step": 48188, "epoch": 1147} {"train_loss": -5.8535990715026855, "global_step": 48189, "epoch": 1147} {"train_loss": -5.750636100769043, "global_step": 48190, "epoch": 1147} {"train_loss": -5.636533260345459, "global_step": 48191, "epoch": 1147} {"train_loss": -5.7929816246032715, "global_step": 48192, "epoch": 1147} {"train_loss": -5.633582592010498, "global_step": 48193, "epoch": 1147} {"train_loss": -5.628612041473389, "global_step": 48194, "epoch": 1147} {"train_loss": -5.720901966094971, "global_step": 48195, "epoch": 1147} {"train_loss": -5.78350830078125, "global_step": 48196, "epoch": 1147} {"train_loss": -5.735168933868408, "global_step": 48197, "epoch": 1147} {"train_loss": -5.6763129234313965, "global_step": 48198, "epoch": 1147} {"train_loss": -5.755353927612305, "global_step": 48199, "epoch": 1147} {"train_loss": -5.86658239364624, "global_step": 48200, "epoch": 1147} {"train_loss": -5.61829948425293, "global_step": 48201, "epoch": 1147} {"train_loss": -5.720374584197998, "global_step": 48202, "epoch": 1147} {"train_loss": -5.6963701248168945, "global_step": 48203, "epoch": 1147} {"train_loss": -5.767529487609863, "global_step": 48204, "epoch": 1147} {"train_loss": -5.874870300292969, "global_step": 48205, "epoch": 1147} {"train_loss": -5.651911735534668, "global_step": 48206, "epoch": 1147} {"train_loss": -5.779011249542236, "global_step": 48207, "epoch": 1147} {"train_loss": -5.813337326049805, "global_step": 48208, "epoch": 1147} {"train_loss": -5.748558044433594, "global_step": 48209, "epoch": 1147} {"train_loss": -5.790649890899658, "global_step": 48210, "epoch": 1147} {"train_loss": -5.718225002288818, "global_step": 48211, "epoch": 1147} {"train_loss": -5.776786804199219, "global_step": 48212, "epoch": 1147} {"train_loss": -5.739926815032959, "global_step": 48213, "epoch": 1147} {"train_loss": -5.738290786743164, "global_step": 48214, "epoch": 1147} {"train_loss": -5.730725447336833, "global_step": 48215, "epoch": 1147, "val_loss": 66051.34375} {"train_loss": -5.691449165344238, "global_step": 48216, "epoch": 1148} {"train_loss": -5.747716903686523, "global_step": 48217, "epoch": 1148} {"train_loss": -5.712216377258301, "global_step": 48218, "epoch": 1148} {"train_loss": -5.893904685974121, "global_step": 48219, "epoch": 1148} {"train_loss": -5.684317588806152, "global_step": 48220, "epoch": 1148} {"train_loss": -5.749373435974121, "global_step": 48221, "epoch": 1148} {"train_loss": -5.746187210083008, "global_step": 48222, "epoch": 1148} {"train_loss": -5.643807411193848, "global_step": 48223, "epoch": 1148} {"train_loss": -5.711002349853516, "global_step": 48224, "epoch": 1148} {"train_loss": -5.719837665557861, "global_step": 48225, "epoch": 1148} {"train_loss": -5.716193199157715, "global_step": 48226, "epoch": 1148} {"train_loss": -5.759861946105957, "global_step": 48227, "epoch": 1148} {"train_loss": -5.671842098236084, "global_step": 48228, "epoch": 1148} {"train_loss": -5.633390426635742, "global_step": 48229, "epoch": 1148} {"train_loss": -5.727851390838623, "global_step": 48230, "epoch": 1148} {"train_loss": -5.748598575592041, "global_step": 48231, "epoch": 1148} {"train_loss": -5.820126533508301, "global_step": 48232, "epoch": 1148} {"train_loss": -5.770274639129639, "global_step": 48233, "epoch": 1148} {"train_loss": -5.649584770202637, "global_step": 48234, "epoch": 1148} {"train_loss": -5.812027931213379, "global_step": 48235, "epoch": 1148} {"train_loss": -5.727081298828125, "global_step": 48236, "epoch": 1148} {"train_loss": -5.905572414398193, "global_step": 48237, "epoch": 1148} {"train_loss": -5.732140064239502, "global_step": 48238, "epoch": 1148} {"train_loss": -5.681535720825195, "global_step": 48239, "epoch": 1148} {"train_loss": -5.704300403594971, "global_step": 48240, "epoch": 1148} {"train_loss": -5.777802467346191, "global_step": 48241, "epoch": 1148} {"train_loss": -5.705887794494629, "global_step": 48242, "epoch": 1148} {"train_loss": -5.7418646812438965, "global_step": 48243, "epoch": 1148} {"train_loss": -5.700127601623535, "global_step": 48244, "epoch": 1148} {"train_loss": -5.724738121032715, "global_step": 48245, "epoch": 1148} {"train_loss": -5.628392219543457, "global_step": 48246, "epoch": 1148} {"train_loss": -5.73854398727417, "global_step": 48247, "epoch": 1148} {"train_loss": -5.585417747497559, "global_step": 48248, "epoch": 1148} {"train_loss": -5.711794853210449, "global_step": 48249, "epoch": 1148} {"train_loss": -5.619171142578125, "global_step": 48250, "epoch": 1148} {"train_loss": -5.770030975341797, "global_step": 48251, "epoch": 1148} {"train_loss": -5.72320032119751, "global_step": 48252, "epoch": 1148} {"train_loss": -5.710405349731445, "global_step": 48253, "epoch": 1148} {"train_loss": -5.706305027008057, "global_step": 48254, "epoch": 1148} {"train_loss": -5.79102897644043, "global_step": 48255, "epoch": 1148} {"train_loss": -5.802216053009033, "global_step": 48256, "epoch": 1148} {"train_loss": -5.730371429806664, "global_step": 48257, "epoch": 1148, "val_loss": 66233.3515625} {"train_loss": -5.89778995513916, "global_step": 48258, "epoch": 1149} {"train_loss": -5.7464599609375, "global_step": 48259, "epoch": 1149} {"train_loss": -5.916781902313232, "global_step": 48260, "epoch": 1149} {"train_loss": -5.747045993804932, "global_step": 48261, "epoch": 1149} {"train_loss": -5.8653411865234375, "global_step": 48262, "epoch": 1149} {"train_loss": -5.764747142791748, "global_step": 48263, "epoch": 1149} {"train_loss": -5.686556816101074, "global_step": 48264, "epoch": 1149} {"train_loss": -5.762720108032227, "global_step": 48265, "epoch": 1149} {"train_loss": -5.746848106384277, "global_step": 48266, "epoch": 1149} {"train_loss": -5.698858261108398, "global_step": 48267, "epoch": 1149} {"train_loss": -5.715482234954834, "global_step": 48268, "epoch": 1149} {"train_loss": -5.709990501403809, "global_step": 48269, "epoch": 1149} {"train_loss": -5.786667346954346, "global_step": 48270, "epoch": 1149} {"train_loss": -5.725711345672607, "global_step": 48271, "epoch": 1149} {"train_loss": -5.768832206726074, "global_step": 48272, "epoch": 1149} {"train_loss": -5.7354350090026855, "global_step": 48273, "epoch": 1149} {"train_loss": -5.700430870056152, "global_step": 48274, "epoch": 1149} {"train_loss": -5.570226669311523, "global_step": 48275, "epoch": 1149} {"train_loss": -5.594164848327637, "global_step": 48276, "epoch": 1149} {"train_loss": -5.798648357391357, "global_step": 48277, "epoch": 1149} {"train_loss": -5.521081924438477, "global_step": 48278, "epoch": 1149} {"train_loss": -5.68608283996582, "global_step": 48279, "epoch": 1149} {"train_loss": -5.666119575500488, "global_step": 48280, "epoch": 1149} {"train_loss": -5.775229454040527, "global_step": 48281, "epoch": 1149} {"train_loss": -5.597378730773926, "global_step": 48282, "epoch": 1149} {"train_loss": -5.634232044219971, "global_step": 48283, "epoch": 1149} {"train_loss": -5.770015239715576, "global_step": 48284, "epoch": 1149} {"train_loss": -5.636862754821777, "global_step": 48285, "epoch": 1149} {"train_loss": -5.711721420288086, "global_step": 48286, "epoch": 1149} {"train_loss": -5.7222900390625, "global_step": 48287, "epoch": 1149} {"train_loss": -5.794551849365234, "global_step": 48288, "epoch": 1149} {"train_loss": -5.586700916290283, "global_step": 48289, "epoch": 1149} {"train_loss": -5.746610641479492, "global_step": 48290, "epoch": 1149} {"train_loss": -5.722240447998047, "global_step": 48291, "epoch": 1149} {"train_loss": -5.69387674331665, "global_step": 48292, "epoch": 1149} {"train_loss": -5.658084392547607, "global_step": 48293, "epoch": 1149} {"train_loss": -5.7715253829956055, "global_step": 48294, "epoch": 1149} {"train_loss": -5.884732723236084, "global_step": 48295, "epoch": 1149} {"train_loss": -5.7572736740112305, "global_step": 48296, "epoch": 1149} {"train_loss": -5.770505428314209, "global_step": 48297, "epoch": 1149} {"train_loss": -5.695096015930176, "global_step": 48298, "epoch": 1149} {"train_loss": -5.7262858890351795, "global_step": 48299, "epoch": 1149, "val_loss": 66270.5390625} {"train_loss": -5.785141944885254, "global_step": 48300, "epoch": 1150} {"train_loss": -5.791938781738281, "global_step": 48301, "epoch": 1150} {"train_loss": -5.728141784667969, "global_step": 48302, "epoch": 1150} {"train_loss": -5.7422685623168945, "global_step": 48303, "epoch": 1150} {"train_loss": -5.678680419921875, "global_step": 48304, "epoch": 1150} {"train_loss": -5.632641792297363, "global_step": 48305, "epoch": 1150} {"train_loss": -5.699912071228027, "global_step": 48306, "epoch": 1150} {"train_loss": -5.80577278137207, "global_step": 48307, "epoch": 1150} {"train_loss": -5.685090065002441, "global_step": 48308, "epoch": 1150} {"train_loss": -5.8242011070251465, "global_step": 48309, "epoch": 1150} {"train_loss": -5.644555568695068, "global_step": 48310, "epoch": 1150} {"train_loss": -5.736336708068848, "global_step": 48311, "epoch": 1150} {"train_loss": -5.595444679260254, "global_step": 48312, "epoch": 1150} {"train_loss": -5.753864765167236, "global_step": 48313, "epoch": 1150} {"train_loss": -5.679754734039307, "global_step": 48314, "epoch": 1150} {"train_loss": -5.7019853591918945, "global_step": 48315, "epoch": 1150} {"train_loss": -5.783644676208496, "global_step": 48316, "epoch": 1150} {"train_loss": -5.716058731079102, "global_step": 48317, "epoch": 1150} {"train_loss": -5.761993408203125, "global_step": 48318, "epoch": 1150} {"train_loss": -5.795136451721191, "global_step": 48319, "epoch": 1150} {"train_loss": -5.813418865203857, "global_step": 48320, "epoch": 1150} {"train_loss": -5.696375846862793, "global_step": 48321, "epoch": 1150} {"train_loss": -5.721447944641113, "global_step": 48322, "epoch": 1150} {"train_loss": -5.725905418395996, "global_step": 48323, "epoch": 1150} {"train_loss": -5.722522258758545, "global_step": 48324, "epoch": 1150} {"train_loss": -5.870915412902832, "global_step": 48325, "epoch": 1150} {"train_loss": -5.661747932434082, "global_step": 48326, "epoch": 1150} {"train_loss": -5.8033599853515625, "global_step": 48327, "epoch": 1150} {"train_loss": -5.8325605392456055, "global_step": 48328, "epoch": 1150} {"train_loss": -5.706051826477051, "global_step": 48329, "epoch": 1150} {"train_loss": -5.787301540374756, "global_step": 48330, "epoch": 1150} {"train_loss": -5.7439470291137695, "global_step": 48331, "epoch": 1150} {"train_loss": -5.6707987785339355, "global_step": 48332, "epoch": 1150} {"train_loss": -5.8063740730285645, "global_step": 48333, "epoch": 1150} {"train_loss": -5.7323503494262695, "global_step": 48334, "epoch": 1150} {"train_loss": -5.697057723999023, "global_step": 48335, "epoch": 1150} {"train_loss": -5.78993034362793, "global_step": 48336, "epoch": 1150} {"train_loss": -5.679772853851318, "global_step": 48337, "epoch": 1150} {"train_loss": -5.687421798706055, "global_step": 48338, "epoch": 1150} {"train_loss": -5.653785228729248, "global_step": 48339, "epoch": 1150} {"train_loss": -5.768690586090088, "global_step": 48340, "epoch": 1150} {"train_loss": -5.736184597015381, "global_step": 48341, "epoch": 1150, "train/sim_max_reward_0": 0.35127809910842506, "train/sim_max_reward_1": 0.9122358876479986, "train/sim_max_reward_2": 0.5754163237434986, "train/sim_max_reward_3": 0.16015540279025542, "train/sim_max_reward_4": 0.4250313164024884, "train/sim_max_reward_5": 0.7269279979282544, "test/sim_max_reward_4400000": 0.7621948226452121, "test/sim_max_reward_4400001": 0.17669941371147382, "test/sim_max_reward_4400002": 0.5144768820603632, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.3797036954990397, "test/sim_max_reward_4400007": 0.28623868543965825, "test/sim_max_reward_4400008": 0.5754778612531983, "test/sim_max_reward_4400009": 0.3679014781454586, "test/sim_max_reward_4400010": 0.2751044539890837, "test/sim_max_reward_4400011": 0.20796477426299226, "test/sim_max_reward_4400012": 0.2979965283282726, "test/sim_max_reward_4400013": 0.4480271233632642, "test/sim_max_reward_4400014": 0.4895592190102454, "test/sim_max_reward_4400015": 0.6204811415467647, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.29169477101249275, "test/sim_max_reward_4400019": 0.3918503869007012, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5624547757792494, "test/sim_max_reward_4400022": 0.162118304217415, "test/sim_max_reward_4400023": 0.6068531693836067, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.22706851479953385, "test/sim_max_reward_4400026": 0.9697574288578382, "test/sim_max_reward_4400027": 0.04296285317193991, "test/sim_max_reward_4400028": 0.915972371699169, "test/sim_max_reward_4400029": 0.19607740693319936, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 0.8399686333972117, "test/sim_max_reward_4400032": 0.2180100277860872, "test/sim_max_reward_4400033": 0.19112047207239058, "test/sim_max_reward_4400034": 0.821726620205514, "test/sim_max_reward_4400035": 0.47939890790306544, "test/sim_max_reward_4400036": 0.4199619763839177, "test/sim_max_reward_4400037": 0.6657709020394323, "test/sim_max_reward_4400038": 0.15300133262932653, "test/sim_max_reward_4400039": 0.7624093137783738, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.989630804483362, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.805638244307094, "test/sim_max_reward_4400044": 0.40232383842675007, "test/sim_max_reward_4400045": 0.3246380469357392, "test/sim_max_reward_4400046": 0.39536106054901043, "test/sim_max_reward_4400047": 0.8657816214241539, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.20068108185110825, "train/mean_score": 0.5251741712701534, "test/mean_score": 0.37209906542028093, "val_loss": 66077.046875} {"train_loss": -5.7245893478393555, "global_step": 48342, "epoch": 1151} {"train_loss": -5.748294830322266, "global_step": 48343, "epoch": 1151} {"train_loss": -5.78140926361084, "global_step": 48344, "epoch": 1151} {"train_loss": -5.699921607971191, "global_step": 48345, "epoch": 1151} {"train_loss": -5.844923973083496, "global_step": 48346, "epoch": 1151} {"train_loss": -5.854803085327148, "global_step": 48347, "epoch": 1151} {"train_loss": -5.8058905601501465, "global_step": 48348, "epoch": 1151} {"train_loss": -5.634191513061523, "global_step": 48349, "epoch": 1151} {"train_loss": -5.696203708648682, "global_step": 48350, "epoch": 1151} {"train_loss": -5.726563453674316, "global_step": 48351, "epoch": 1151} {"train_loss": -5.81843900680542, "global_step": 48352, "epoch": 1151} {"train_loss": -5.687742233276367, "global_step": 48353, "epoch": 1151} {"train_loss": -5.782017707824707, "global_step": 48354, "epoch": 1151} {"train_loss": -5.85164737701416, "global_step": 48355, "epoch": 1151} {"train_loss": -5.8371262550354, "global_step": 48356, "epoch": 1151} {"train_loss": -5.688025951385498, "global_step": 48357, "epoch": 1151} {"train_loss": -5.772810459136963, "global_step": 48358, "epoch": 1151} {"train_loss": -5.816789627075195, "global_step": 48359, "epoch": 1151} {"train_loss": -5.801024913787842, "global_step": 48360, "epoch": 1151} {"train_loss": -5.935153961181641, "global_step": 48361, "epoch": 1151} {"train_loss": -5.656416893005371, "global_step": 48362, "epoch": 1151} {"train_loss": -5.7961106300354, "global_step": 48363, "epoch": 1151} {"train_loss": -5.8748297691345215, "global_step": 48364, "epoch": 1151} {"train_loss": -5.523167610168457, "global_step": 48365, "epoch": 1151} {"train_loss": -5.731906890869141, "global_step": 48366, "epoch": 1151} {"train_loss": -5.679200172424316, "global_step": 48367, "epoch": 1151} {"train_loss": -5.638343334197998, "global_step": 48368, "epoch": 1151} {"train_loss": -5.6229352951049805, "global_step": 48369, "epoch": 1151} {"train_loss": -5.756383419036865, "global_step": 48370, "epoch": 1151} {"train_loss": -5.6112189292907715, "global_step": 48371, "epoch": 1151} {"train_loss": -5.791298866271973, "global_step": 48372, "epoch": 1151} {"train_loss": -5.755260467529297, "global_step": 48373, "epoch": 1151} {"train_loss": -5.602246284484863, "global_step": 48374, "epoch": 1151} {"train_loss": -5.728660583496094, "global_step": 48375, "epoch": 1151} {"train_loss": -5.884302616119385, "global_step": 48376, "epoch": 1151} {"train_loss": -5.791855812072754, "global_step": 48377, "epoch": 1151} {"train_loss": -5.766796112060547, "global_step": 48378, "epoch": 1151} {"train_loss": -5.771351337432861, "global_step": 48379, "epoch": 1151} {"train_loss": -5.722536087036133, "global_step": 48380, "epoch": 1151} {"train_loss": -5.84420919418335, "global_step": 48381, "epoch": 1151} {"train_loss": -5.627775192260742, "global_step": 48382, "epoch": 1151} {"train_loss": -5.749568382898967, "global_step": 48383, "epoch": 1151, "val_loss": 66050.5625} {"train_loss": -5.810856819152832, "global_step": 48384, "epoch": 1152} {"train_loss": -5.810698986053467, "global_step": 48385, "epoch": 1152} {"train_loss": -5.903429985046387, "global_step": 48386, "epoch": 1152} {"train_loss": -5.814885139465332, "global_step": 48387, "epoch": 1152} {"train_loss": -5.668864727020264, "global_step": 48388, "epoch": 1152} {"train_loss": -5.775245666503906, "global_step": 48389, "epoch": 1152} {"train_loss": -5.757905960083008, "global_step": 48390, "epoch": 1152} {"train_loss": -5.763946533203125, "global_step": 48391, "epoch": 1152} {"train_loss": -5.884493350982666, "global_step": 48392, "epoch": 1152} {"train_loss": -5.778604984283447, "global_step": 48393, "epoch": 1152} {"train_loss": -5.689464569091797, "global_step": 48394, "epoch": 1152} {"train_loss": -5.72978401184082, "global_step": 48395, "epoch": 1152} {"train_loss": -5.8270673751831055, "global_step": 48396, "epoch": 1152} {"train_loss": -5.664882183074951, "global_step": 48397, "epoch": 1152} {"train_loss": -5.760822296142578, "global_step": 48398, "epoch": 1152} {"train_loss": -5.749912738800049, "global_step": 48399, "epoch": 1152} {"train_loss": -5.696412086486816, "global_step": 48400, "epoch": 1152} {"train_loss": -5.75007963180542, "global_step": 48401, "epoch": 1152} {"train_loss": -5.7480316162109375, "global_step": 48402, "epoch": 1152} {"train_loss": -5.773397922515869, "global_step": 48403, "epoch": 1152} {"train_loss": -5.7895097732543945, "global_step": 48404, "epoch": 1152} {"train_loss": -5.745421886444092, "global_step": 48405, "epoch": 1152} {"train_loss": -5.81210994720459, "global_step": 48406, "epoch": 1152} {"train_loss": -5.651873588562012, "global_step": 48407, "epoch": 1152} {"train_loss": -5.642482757568359, "global_step": 48408, "epoch": 1152} {"train_loss": -5.814806938171387, "global_step": 48409, "epoch": 1152} {"train_loss": -5.647241592407227, "global_step": 48410, "epoch": 1152} {"train_loss": -5.722871780395508, "global_step": 48411, "epoch": 1152} {"train_loss": -5.721914768218994, "global_step": 48412, "epoch": 1152} {"train_loss": -5.700169086456299, "global_step": 48413, "epoch": 1152} {"train_loss": -5.7194390296936035, "global_step": 48414, "epoch": 1152} {"train_loss": -5.701627731323242, "global_step": 48415, "epoch": 1152} {"train_loss": -5.677087783813477, "global_step": 48416, "epoch": 1152} {"train_loss": -5.651656627655029, "global_step": 48417, "epoch": 1152} {"train_loss": -5.704482078552246, "global_step": 48418, "epoch": 1152} {"train_loss": -5.689903259277344, "global_step": 48419, "epoch": 1152} {"train_loss": -5.725627899169922, "global_step": 48420, "epoch": 1152} {"train_loss": -5.767243385314941, "global_step": 48421, "epoch": 1152} {"train_loss": -5.808104515075684, "global_step": 48422, "epoch": 1152} {"train_loss": -5.737015247344971, "global_step": 48423, "epoch": 1152} {"train_loss": -5.686123847961426, "global_step": 48424, "epoch": 1152} {"train_loss": -5.743385632832845, "global_step": 48425, "epoch": 1152, "val_loss": 65982.578125} {"train_loss": -5.692539215087891, "global_step": 48426, "epoch": 1153} {"train_loss": -5.795943260192871, "global_step": 48427, "epoch": 1153} {"train_loss": -5.7320356369018555, "global_step": 48428, "epoch": 1153} {"train_loss": -5.847569465637207, "global_step": 48429, "epoch": 1153} {"train_loss": -5.810201644897461, "global_step": 48430, "epoch": 1153} {"train_loss": -5.8208208084106445, "global_step": 48431, "epoch": 1153} {"train_loss": -5.806943416595459, "global_step": 48432, "epoch": 1153} {"train_loss": -5.809749603271484, "global_step": 48433, "epoch": 1153} {"train_loss": -5.799546241760254, "global_step": 48434, "epoch": 1153} {"train_loss": -5.684304237365723, "global_step": 48435, "epoch": 1153} {"train_loss": -5.575207710266113, "global_step": 48436, "epoch": 1153} {"train_loss": -5.5178022384643555, "global_step": 48437, "epoch": 1153} {"train_loss": -5.828834533691406, "global_step": 48438, "epoch": 1153} {"train_loss": -5.668505668640137, "global_step": 48439, "epoch": 1153} {"train_loss": -5.74925422668457, "global_step": 48440, "epoch": 1153} {"train_loss": -5.796258926391602, "global_step": 48441, "epoch": 1153} {"train_loss": -5.7876787185668945, "global_step": 48442, "epoch": 1153} {"train_loss": -5.785337448120117, "global_step": 48443, "epoch": 1153} {"train_loss": -5.766427040100098, "global_step": 48444, "epoch": 1153} {"train_loss": -5.6864213943481445, "global_step": 48445, "epoch": 1153} {"train_loss": -5.762438774108887, "global_step": 48446, "epoch": 1153} {"train_loss": -5.70259952545166, "global_step": 48447, "epoch": 1153} {"train_loss": -5.819436073303223, "global_step": 48448, "epoch": 1153} {"train_loss": -5.6494646072387695, "global_step": 48449, "epoch": 1153} {"train_loss": -5.849884033203125, "global_step": 48450, "epoch": 1153} {"train_loss": -5.736447811126709, "global_step": 48451, "epoch": 1153} {"train_loss": -5.827268600463867, "global_step": 48452, "epoch": 1153} {"train_loss": -5.6259260177612305, "global_step": 48453, "epoch": 1153} {"train_loss": -5.8124542236328125, "global_step": 48454, "epoch": 1153} {"train_loss": -5.606782913208008, "global_step": 48455, "epoch": 1153} {"train_loss": -5.760820388793945, "global_step": 48456, "epoch": 1153} {"train_loss": -5.790173053741455, "global_step": 48457, "epoch": 1153} {"train_loss": -5.732027053833008, "global_step": 48458, "epoch": 1153} {"train_loss": -5.901315689086914, "global_step": 48459, "epoch": 1153} {"train_loss": -5.730283737182617, "global_step": 48460, "epoch": 1153} {"train_loss": -5.66355037689209, "global_step": 48461, "epoch": 1153} {"train_loss": -5.804299354553223, "global_step": 48462, "epoch": 1153} {"train_loss": -5.713005542755127, "global_step": 48463, "epoch": 1153} {"train_loss": -5.629767417907715, "global_step": 48464, "epoch": 1153} {"train_loss": -5.793310165405273, "global_step": 48465, "epoch": 1153} {"train_loss": -5.7828168869018555, "global_step": 48466, "epoch": 1153} {"train_loss": -5.748885915392921, "global_step": 48467, "epoch": 1153, "val_loss": 65976.5859375} {"train_loss": -5.725319862365723, "global_step": 48468, "epoch": 1154} {"train_loss": -5.833562850952148, "global_step": 48469, "epoch": 1154} {"train_loss": -5.783595561981201, "global_step": 48470, "epoch": 1154} {"train_loss": -5.758861064910889, "global_step": 48471, "epoch": 1154} {"train_loss": -5.673495769500732, "global_step": 48472, "epoch": 1154} {"train_loss": -5.713847637176514, "global_step": 48473, "epoch": 1154} {"train_loss": -5.618453025817871, "global_step": 48474, "epoch": 1154} {"train_loss": -5.890634536743164, "global_step": 48475, "epoch": 1154} {"train_loss": -5.691796779632568, "global_step": 48476, "epoch": 1154} {"train_loss": -5.724200248718262, "global_step": 48477, "epoch": 1154} {"train_loss": -5.797911643981934, "global_step": 48478, "epoch": 1154} {"train_loss": -5.81365966796875, "global_step": 48479, "epoch": 1154} {"train_loss": -5.7254815101623535, "global_step": 48480, "epoch": 1154} {"train_loss": -5.803369522094727, "global_step": 48481, "epoch": 1154} {"train_loss": -5.664762496948242, "global_step": 48482, "epoch": 1154} {"train_loss": -5.783510684967041, "global_step": 48483, "epoch": 1154} {"train_loss": -5.702826499938965, "global_step": 48484, "epoch": 1154} {"train_loss": -5.652479648590088, "global_step": 48485, "epoch": 1154} {"train_loss": -5.64156436920166, "global_step": 48486, "epoch": 1154} {"train_loss": -5.796691417694092, "global_step": 48487, "epoch": 1154} {"train_loss": -5.832317352294922, "global_step": 48488, "epoch": 1154} {"train_loss": -5.659677505493164, "global_step": 48489, "epoch": 1154} {"train_loss": -5.827615737915039, "global_step": 48490, "epoch": 1154} {"train_loss": -5.661569595336914, "global_step": 48491, "epoch": 1154} {"train_loss": -5.847369194030762, "global_step": 48492, "epoch": 1154} {"train_loss": -5.726717948913574, "global_step": 48493, "epoch": 1154} {"train_loss": -5.6754255294799805, "global_step": 48494, "epoch": 1154} {"train_loss": -5.820559501647949, "global_step": 48495, "epoch": 1154} {"train_loss": -5.786201000213623, "global_step": 48496, "epoch": 1154} {"train_loss": -5.688606262207031, "global_step": 48497, "epoch": 1154} {"train_loss": -5.873969078063965, "global_step": 48498, "epoch": 1154} {"train_loss": -5.725094318389893, "global_step": 48499, "epoch": 1154} {"train_loss": -5.757123947143555, "global_step": 48500, "epoch": 1154} {"train_loss": -5.774935245513916, "global_step": 48501, "epoch": 1154} {"train_loss": -5.713170528411865, "global_step": 48502, "epoch": 1154} {"train_loss": -5.800278663635254, "global_step": 48503, "epoch": 1154} {"train_loss": -5.788255214691162, "global_step": 48504, "epoch": 1154} {"train_loss": -5.737830638885498, "global_step": 48505, "epoch": 1154} {"train_loss": -5.718195915222168, "global_step": 48506, "epoch": 1154} {"train_loss": -5.713205337524414, "global_step": 48507, "epoch": 1154} {"train_loss": -5.705478668212891, "global_step": 48508, "epoch": 1154} {"train_loss": -5.7489684990474155, "global_step": 48509, "epoch": 1154, "val_loss": 66074.71875} {"train_loss": -5.81115198135376, "global_step": 48510, "epoch": 1155} {"train_loss": -5.676568984985352, "global_step": 48511, "epoch": 1155} {"train_loss": -5.7375664710998535, "global_step": 48512, "epoch": 1155} {"train_loss": -5.585087776184082, "global_step": 48513, "epoch": 1155} {"train_loss": -5.692749977111816, "global_step": 48514, "epoch": 1155} {"train_loss": -5.686764717102051, "global_step": 48515, "epoch": 1155} {"train_loss": -5.62941837310791, "global_step": 48516, "epoch": 1155} {"train_loss": -5.727697849273682, "global_step": 48517, "epoch": 1155} {"train_loss": -5.634329319000244, "global_step": 48518, "epoch": 1155} {"train_loss": -5.504833221435547, "global_step": 48519, "epoch": 1155} {"train_loss": -5.728675842285156, "global_step": 48520, "epoch": 1155} {"train_loss": -5.701838493347168, "global_step": 48521, "epoch": 1155} {"train_loss": -5.8591790199279785, "global_step": 48522, "epoch": 1155} {"train_loss": -5.72532320022583, "global_step": 48523, "epoch": 1155} {"train_loss": -5.7433929443359375, "global_step": 48524, "epoch": 1155} {"train_loss": -5.692730903625488, "global_step": 48525, "epoch": 1155} {"train_loss": -5.766429901123047, "global_step": 48526, "epoch": 1155} {"train_loss": -5.682607650756836, "global_step": 48527, "epoch": 1155} {"train_loss": -5.746763706207275, "global_step": 48528, "epoch": 1155} {"train_loss": -5.6155781745910645, "global_step": 48529, "epoch": 1155} {"train_loss": -5.734884262084961, "global_step": 48530, "epoch": 1155} {"train_loss": -5.643327713012695, "global_step": 48531, "epoch": 1155} {"train_loss": -5.686138153076172, "global_step": 48532, "epoch": 1155} {"train_loss": -5.801347732543945, "global_step": 48533, "epoch": 1155} {"train_loss": -5.677818298339844, "global_step": 48534, "epoch": 1155} {"train_loss": -5.723549842834473, "global_step": 48535, "epoch": 1155} {"train_loss": -5.857426643371582, "global_step": 48536, "epoch": 1155} {"train_loss": -5.7870988845825195, "global_step": 48537, "epoch": 1155} {"train_loss": -5.685943126678467, "global_step": 48538, "epoch": 1155} {"train_loss": -5.725851058959961, "global_step": 48539, "epoch": 1155} {"train_loss": -5.739919662475586, "global_step": 48540, "epoch": 1155} {"train_loss": -5.871721267700195, "global_step": 48541, "epoch": 1155} {"train_loss": -5.742934226989746, "global_step": 48542, "epoch": 1155} {"train_loss": -5.810186862945557, "global_step": 48543, "epoch": 1155} {"train_loss": -5.750109672546387, "global_step": 48544, "epoch": 1155} {"train_loss": -5.735515594482422, "global_step": 48545, "epoch": 1155} {"train_loss": -5.675728797912598, "global_step": 48546, "epoch": 1155} {"train_loss": -5.761716842651367, "global_step": 48547, "epoch": 1155} {"train_loss": -5.648123264312744, "global_step": 48548, "epoch": 1155} {"train_loss": -5.682785511016846, "global_step": 48549, "epoch": 1155} {"train_loss": -5.821475028991699, "global_step": 48550, "epoch": 1155} {"train_loss": -5.718614703132992, "global_step": 48551, "epoch": 1155, "val_loss": 66086.9921875} {"train_loss": -5.855998516082764, "global_step": 48552, "epoch": 1156} {"train_loss": -5.552355766296387, "global_step": 48553, "epoch": 1156} {"train_loss": -5.678436756134033, "global_step": 48554, "epoch": 1156} {"train_loss": -5.605130195617676, "global_step": 48555, "epoch": 1156} {"train_loss": -5.769442558288574, "global_step": 48556, "epoch": 1156} {"train_loss": -5.700490474700928, "global_step": 48557, "epoch": 1156} {"train_loss": -5.627841949462891, "global_step": 48558, "epoch": 1156} {"train_loss": -5.70023250579834, "global_step": 48559, "epoch": 1156} {"train_loss": -5.565611362457275, "global_step": 48560, "epoch": 1156} {"train_loss": -5.681386947631836, "global_step": 48561, "epoch": 1156} {"train_loss": -5.606015682220459, "global_step": 48562, "epoch": 1156} {"train_loss": -5.669771194458008, "global_step": 48563, "epoch": 1156} {"train_loss": -5.689644813537598, "global_step": 48564, "epoch": 1156} {"train_loss": -5.673104286193848, "global_step": 48565, "epoch": 1156} {"train_loss": -5.713905334472656, "global_step": 48566, "epoch": 1156} {"train_loss": -5.875076770782471, "global_step": 48567, "epoch": 1156} {"train_loss": -5.563904762268066, "global_step": 48568, "epoch": 1156} {"train_loss": -5.725553035736084, "global_step": 48569, "epoch": 1156} {"train_loss": -5.708942890167236, "global_step": 48570, "epoch": 1156} {"train_loss": -5.707671165466309, "global_step": 48571, "epoch": 1156} {"train_loss": -5.716859817504883, "global_step": 48572, "epoch": 1156} {"train_loss": -5.698461532592773, "global_step": 48573, "epoch": 1156} {"train_loss": -5.644752025604248, "global_step": 48574, "epoch": 1156} {"train_loss": -5.662587642669678, "global_step": 48575, "epoch": 1156} {"train_loss": -5.744373321533203, "global_step": 48576, "epoch": 1156} {"train_loss": -5.8226213455200195, "global_step": 48577, "epoch": 1156} {"train_loss": -5.833078861236572, "global_step": 48578, "epoch": 1156} {"train_loss": -5.731973648071289, "global_step": 48579, "epoch": 1156} {"train_loss": -5.717507839202881, "global_step": 48580, "epoch": 1156} {"train_loss": -5.8023834228515625, "global_step": 48581, "epoch": 1156} {"train_loss": -5.8220534324646, "global_step": 48582, "epoch": 1156} {"train_loss": -5.732579708099365, "global_step": 48583, "epoch": 1156} {"train_loss": -5.647985935211182, "global_step": 48584, "epoch": 1156} {"train_loss": -5.739292621612549, "global_step": 48585, "epoch": 1156} {"train_loss": -5.776782989501953, "global_step": 48586, "epoch": 1156} {"train_loss": -5.7072577476501465, "global_step": 48587, "epoch": 1156} {"train_loss": -5.677218437194824, "global_step": 48588, "epoch": 1156} {"train_loss": -5.778782844543457, "global_step": 48589, "epoch": 1156} {"train_loss": -5.678127288818359, "global_step": 48590, "epoch": 1156} {"train_loss": -5.745697021484375, "global_step": 48591, "epoch": 1156} {"train_loss": -5.696392059326172, "global_step": 48592, "epoch": 1156} {"train_loss": -5.706770874205089, "global_step": 48593, "epoch": 1156, "val_loss": 66021.4921875} {"train_loss": -5.803804397583008, "global_step": 48594, "epoch": 1157} {"train_loss": -5.682352066040039, "global_step": 48595, "epoch": 1157} {"train_loss": -5.660749435424805, "global_step": 48596, "epoch": 1157} {"train_loss": -5.854985237121582, "global_step": 48597, "epoch": 1157} {"train_loss": -5.734458923339844, "global_step": 48598, "epoch": 1157} {"train_loss": -5.80787992477417, "global_step": 48599, "epoch": 1157} {"train_loss": -5.609869003295898, "global_step": 48600, "epoch": 1157} {"train_loss": -5.707140922546387, "global_step": 48601, "epoch": 1157} {"train_loss": -5.733412265777588, "global_step": 48602, "epoch": 1157} {"train_loss": -5.805968284606934, "global_step": 48603, "epoch": 1157} {"train_loss": -5.719127655029297, "global_step": 48604, "epoch": 1157} {"train_loss": -5.806843280792236, "global_step": 48605, "epoch": 1157} {"train_loss": -5.768177032470703, "global_step": 48606, "epoch": 1157} {"train_loss": -5.757463455200195, "global_step": 48607, "epoch": 1157} {"train_loss": -5.729432106018066, "global_step": 48608, "epoch": 1157} {"train_loss": -5.602056980133057, "global_step": 48609, "epoch": 1157} {"train_loss": -5.600802421569824, "global_step": 48610, "epoch": 1157} {"train_loss": -5.799015045166016, "global_step": 48611, "epoch": 1157} {"train_loss": -5.8583784103393555, "global_step": 48612, "epoch": 1157} {"train_loss": -5.6893792152404785, "global_step": 48613, "epoch": 1157} {"train_loss": -5.760908126831055, "global_step": 48614, "epoch": 1157} {"train_loss": -5.795093536376953, "global_step": 48615, "epoch": 1157} {"train_loss": -5.799271583557129, "global_step": 48616, "epoch": 1157} {"train_loss": -5.841115951538086, "global_step": 48617, "epoch": 1157} {"train_loss": -5.774944305419922, "global_step": 48618, "epoch": 1157} {"train_loss": -5.820015907287598, "global_step": 48619, "epoch": 1157} {"train_loss": -5.663269996643066, "global_step": 48620, "epoch": 1157} {"train_loss": -5.8330864906311035, "global_step": 48621, "epoch": 1157} {"train_loss": -5.6570515632629395, "global_step": 48622, "epoch": 1157} {"train_loss": -5.584906101226807, "global_step": 48623, "epoch": 1157} {"train_loss": -5.631107330322266, "global_step": 48624, "epoch": 1157} {"train_loss": -5.64036750793457, "global_step": 48625, "epoch": 1157} {"train_loss": -5.655426979064941, "global_step": 48626, "epoch": 1157} {"train_loss": -5.673308372497559, "global_step": 48627, "epoch": 1157} {"train_loss": -5.678221702575684, "global_step": 48628, "epoch": 1157} {"train_loss": -5.725109100341797, "global_step": 48629, "epoch": 1157} {"train_loss": -5.7912702560424805, "global_step": 48630, "epoch": 1157} {"train_loss": -5.879708290100098, "global_step": 48631, "epoch": 1157} {"train_loss": -5.722113609313965, "global_step": 48632, "epoch": 1157} {"train_loss": -5.6797685623168945, "global_step": 48633, "epoch": 1157} {"train_loss": -5.79963493347168, "global_step": 48634, "epoch": 1157} {"train_loss": -5.736013151350475, "global_step": 48635, "epoch": 1157, "val_loss": 66186.40625} {"train_loss": -5.6848602294921875, "global_step": 48636, "epoch": 1158} {"train_loss": -5.7476701736450195, "global_step": 48637, "epoch": 1158} {"train_loss": -5.673347473144531, "global_step": 48638, "epoch": 1158} {"train_loss": -5.765643119812012, "global_step": 48639, "epoch": 1158} {"train_loss": -5.697259426116943, "global_step": 48640, "epoch": 1158} {"train_loss": -5.80241584777832, "global_step": 48641, "epoch": 1158} {"train_loss": -5.740694999694824, "global_step": 48642, "epoch": 1158} {"train_loss": -5.722179889678955, "global_step": 48643, "epoch": 1158} {"train_loss": -5.763879776000977, "global_step": 48644, "epoch": 1158} {"train_loss": -5.75473165512085, "global_step": 48645, "epoch": 1158} {"train_loss": -5.741486072540283, "global_step": 48646, "epoch": 1158} {"train_loss": -5.7565436363220215, "global_step": 48647, "epoch": 1158} {"train_loss": -5.7091803550720215, "global_step": 48648, "epoch": 1158} {"train_loss": -5.734311103820801, "global_step": 48649, "epoch": 1158} {"train_loss": -5.669701099395752, "global_step": 48650, "epoch": 1158} {"train_loss": -5.737437725067139, "global_step": 48651, "epoch": 1158} {"train_loss": -5.743555068969727, "global_step": 48652, "epoch": 1158} {"train_loss": -5.728966236114502, "global_step": 48653, "epoch": 1158} {"train_loss": -5.714172840118408, "global_step": 48654, "epoch": 1158} {"train_loss": -5.723565101623535, "global_step": 48655, "epoch": 1158} {"train_loss": -5.652731895446777, "global_step": 48656, "epoch": 1158} {"train_loss": -5.8594536781311035, "global_step": 48657, "epoch": 1158} {"train_loss": -5.660856246948242, "global_step": 48658, "epoch": 1158} {"train_loss": -5.7277631759643555, "global_step": 48659, "epoch": 1158} {"train_loss": -5.778536796569824, "global_step": 48660, "epoch": 1158} {"train_loss": -5.849300384521484, "global_step": 48661, "epoch": 1158} {"train_loss": -5.805578708648682, "global_step": 48662, "epoch": 1158} {"train_loss": -5.872541427612305, "global_step": 48663, "epoch": 1158} {"train_loss": -5.766829490661621, "global_step": 48664, "epoch": 1158} {"train_loss": -5.664307594299316, "global_step": 48665, "epoch": 1158} {"train_loss": -5.687830448150635, "global_step": 48666, "epoch": 1158} {"train_loss": -5.770333290100098, "global_step": 48667, "epoch": 1158} {"train_loss": -5.637266159057617, "global_step": 48668, "epoch": 1158} {"train_loss": -5.743942737579346, "global_step": 48669, "epoch": 1158} {"train_loss": -5.696600914001465, "global_step": 48670, "epoch": 1158} {"train_loss": -5.700527191162109, "global_step": 48671, "epoch": 1158} {"train_loss": -5.794219493865967, "global_step": 48672, "epoch": 1158} {"train_loss": -5.883045196533203, "global_step": 48673, "epoch": 1158} {"train_loss": -5.822596549987793, "global_step": 48674, "epoch": 1158} {"train_loss": -5.8183488845825195, "global_step": 48675, "epoch": 1158} {"train_loss": -5.680501937866211, "global_step": 48676, "epoch": 1158} {"train_loss": -5.743208658127558, "global_step": 48677, "epoch": 1158, "val_loss": 66169.15625} {"train_loss": -5.777639389038086, "global_step": 48678, "epoch": 1159} {"train_loss": -5.708237648010254, "global_step": 48679, "epoch": 1159} {"train_loss": -5.803627014160156, "global_step": 48680, "epoch": 1159} {"train_loss": -5.763375759124756, "global_step": 48681, "epoch": 1159} {"train_loss": -5.6951704025268555, "global_step": 48682, "epoch": 1159} {"train_loss": -5.757747650146484, "global_step": 48683, "epoch": 1159} {"train_loss": -5.792082786560059, "global_step": 48684, "epoch": 1159} {"train_loss": -5.748315811157227, "global_step": 48685, "epoch": 1159} {"train_loss": -5.778936862945557, "global_step": 48686, "epoch": 1159} {"train_loss": -5.810096740722656, "global_step": 48687, "epoch": 1159} {"train_loss": -5.843474388122559, "global_step": 48688, "epoch": 1159} {"train_loss": -5.77071475982666, "global_step": 48689, "epoch": 1159} {"train_loss": -5.7548956871032715, "global_step": 48690, "epoch": 1159} {"train_loss": -5.798657417297363, "global_step": 48691, "epoch": 1159} {"train_loss": -5.727100372314453, "global_step": 48692, "epoch": 1159} {"train_loss": -5.800165176391602, "global_step": 48693, "epoch": 1159} {"train_loss": -5.678133964538574, "global_step": 48694, "epoch": 1159} {"train_loss": -5.756052017211914, "global_step": 48695, "epoch": 1159} {"train_loss": -5.726348876953125, "global_step": 48696, "epoch": 1159} {"train_loss": -5.670970916748047, "global_step": 48697, "epoch": 1159} {"train_loss": -5.707823276519775, "global_step": 48698, "epoch": 1159} {"train_loss": -5.640371322631836, "global_step": 48699, "epoch": 1159} {"train_loss": -5.864624977111816, "global_step": 48700, "epoch": 1159} {"train_loss": -5.743846893310547, "global_step": 48701, "epoch": 1159} {"train_loss": -5.82916784286499, "global_step": 48702, "epoch": 1159} {"train_loss": -5.8020477294921875, "global_step": 48703, "epoch": 1159} {"train_loss": -5.921593189239502, "global_step": 48704, "epoch": 1159} {"train_loss": -5.650118350982666, "global_step": 48705, "epoch": 1159} {"train_loss": -5.716195106506348, "global_step": 48706, "epoch": 1159} {"train_loss": -5.782194137573242, "global_step": 48707, "epoch": 1159} {"train_loss": -5.758340835571289, "global_step": 48708, "epoch": 1159} {"train_loss": -5.547372817993164, "global_step": 48709, "epoch": 1159} {"train_loss": -5.846318244934082, "global_step": 48710, "epoch": 1159} {"train_loss": -5.589285850524902, "global_step": 48711, "epoch": 1159} {"train_loss": -5.669103145599365, "global_step": 48712, "epoch": 1159} {"train_loss": -5.701722145080566, "global_step": 48713, "epoch": 1159} {"train_loss": -5.729121208190918, "global_step": 48714, "epoch": 1159} {"train_loss": -5.847268581390381, "global_step": 48715, "epoch": 1159} {"train_loss": -5.595655918121338, "global_step": 48716, "epoch": 1159} {"train_loss": -5.602819442749023, "global_step": 48717, "epoch": 1159} {"train_loss": -5.750494956970215, "global_step": 48718, "epoch": 1159} {"train_loss": -5.740110578991118, "global_step": 48719, "epoch": 1159, "val_loss": 66274.0703125} {"train_loss": -5.796698570251465, "global_step": 48720, "epoch": 1160} {"train_loss": -5.612898826599121, "global_step": 48721, "epoch": 1160} {"train_loss": -5.851137638092041, "global_step": 48722, "epoch": 1160} {"train_loss": -5.8506035804748535, "global_step": 48723, "epoch": 1160} {"train_loss": -5.592271327972412, "global_step": 48724, "epoch": 1160} {"train_loss": -5.605754375457764, "global_step": 48725, "epoch": 1160} {"train_loss": -5.801039695739746, "global_step": 48726, "epoch": 1160} {"train_loss": -5.742417335510254, "global_step": 48727, "epoch": 1160} {"train_loss": -5.621342182159424, "global_step": 48728, "epoch": 1160} {"train_loss": -5.782907485961914, "global_step": 48729, "epoch": 1160} {"train_loss": -5.693478584289551, "global_step": 48730, "epoch": 1160} {"train_loss": -5.743587493896484, "global_step": 48731, "epoch": 1160} {"train_loss": -5.680323123931885, "global_step": 48732, "epoch": 1160} {"train_loss": -5.689218521118164, "global_step": 48733, "epoch": 1160} {"train_loss": -5.792905330657959, "global_step": 48734, "epoch": 1160} {"train_loss": -5.77255916595459, "global_step": 48735, "epoch": 1160} {"train_loss": -5.855559349060059, "global_step": 48736, "epoch": 1160} {"train_loss": -5.742475986480713, "global_step": 48737, "epoch": 1160} {"train_loss": -5.742188453674316, "global_step": 48738, "epoch": 1160} {"train_loss": -5.765223979949951, "global_step": 48739, "epoch": 1160} {"train_loss": -5.790245056152344, "global_step": 48740, "epoch": 1160} {"train_loss": -5.830246448516846, "global_step": 48741, "epoch": 1160} {"train_loss": -5.671200275421143, "global_step": 48742, "epoch": 1160} {"train_loss": -5.794502258300781, "global_step": 48743, "epoch": 1160} {"train_loss": -5.711721420288086, "global_step": 48744, "epoch": 1160} {"train_loss": -5.662757873535156, "global_step": 48745, "epoch": 1160} {"train_loss": -5.663473129272461, "global_step": 48746, "epoch": 1160} {"train_loss": -5.715879440307617, "global_step": 48747, "epoch": 1160} {"train_loss": -5.777674674987793, "global_step": 48748, "epoch": 1160} {"train_loss": -5.661715507507324, "global_step": 48749, "epoch": 1160} {"train_loss": -5.73140811920166, "global_step": 48750, "epoch": 1160} {"train_loss": -5.595060348510742, "global_step": 48751, "epoch": 1160} {"train_loss": -5.824987411499023, "global_step": 48752, "epoch": 1160} {"train_loss": -5.774374008178711, "global_step": 48753, "epoch": 1160} {"train_loss": -5.757655143737793, "global_step": 48754, "epoch": 1160} {"train_loss": -5.8027801513671875, "global_step": 48755, "epoch": 1160} {"train_loss": -5.67716121673584, "global_step": 48756, "epoch": 1160} {"train_loss": -5.7560625076293945, "global_step": 48757, "epoch": 1160} {"train_loss": -5.747503280639648, "global_step": 48758, "epoch": 1160} {"train_loss": -5.680203914642334, "global_step": 48759, "epoch": 1160} {"train_loss": -5.762152671813965, "global_step": 48760, "epoch": 1160} {"train_loss": -5.732877436138335, "global_step": 48761, "epoch": 1160, "val_loss": 66007.9453125} {"train_loss": -5.682740688323975, "global_step": 48762, "epoch": 1161} {"train_loss": -5.8273820877075195, "global_step": 48763, "epoch": 1161} {"train_loss": -5.676363945007324, "global_step": 48764, "epoch": 1161} {"train_loss": -5.759537696838379, "global_step": 48765, "epoch": 1161} {"train_loss": -5.711287021636963, "global_step": 48766, "epoch": 1161} {"train_loss": -5.715445518493652, "global_step": 48767, "epoch": 1161} {"train_loss": -5.721214294433594, "global_step": 48768, "epoch": 1161} {"train_loss": -5.803603172302246, "global_step": 48769, "epoch": 1161} {"train_loss": -5.718796730041504, "global_step": 48770, "epoch": 1161} {"train_loss": -5.774528503417969, "global_step": 48771, "epoch": 1161} {"train_loss": -5.618722915649414, "global_step": 48772, "epoch": 1161} {"train_loss": -5.73009729385376, "global_step": 48773, "epoch": 1161} {"train_loss": -5.720470905303955, "global_step": 48774, "epoch": 1161} {"train_loss": -5.745882034301758, "global_step": 48775, "epoch": 1161} {"train_loss": -5.747431755065918, "global_step": 48776, "epoch": 1161} {"train_loss": -5.789384365081787, "global_step": 48777, "epoch": 1161} {"train_loss": -5.829079627990723, "global_step": 48778, "epoch": 1161} {"train_loss": -5.805495738983154, "global_step": 48779, "epoch": 1161} {"train_loss": -5.743897438049316, "global_step": 48780, "epoch": 1161} {"train_loss": -5.697511672973633, "global_step": 48781, "epoch": 1161} {"train_loss": -5.808626174926758, "global_step": 48782, "epoch": 1161} {"train_loss": -5.707831382751465, "global_step": 48783, "epoch": 1161} {"train_loss": -5.87949275970459, "global_step": 48784, "epoch": 1161} {"train_loss": -5.673422336578369, "global_step": 48785, "epoch": 1161} {"train_loss": -5.696113586425781, "global_step": 48786, "epoch": 1161} {"train_loss": -5.698563575744629, "global_step": 48787, "epoch": 1161} {"train_loss": -5.72758674621582, "global_step": 48788, "epoch": 1161} {"train_loss": -5.646709442138672, "global_step": 48789, "epoch": 1161} {"train_loss": -5.680821418762207, "global_step": 48790, "epoch": 1161} {"train_loss": -5.588261604309082, "global_step": 48791, "epoch": 1161} {"train_loss": -5.682608604431152, "global_step": 48792, "epoch": 1161} {"train_loss": -5.902993202209473, "global_step": 48793, "epoch": 1161} {"train_loss": -5.7228102684021, "global_step": 48794, "epoch": 1161} {"train_loss": -5.717289447784424, "global_step": 48795, "epoch": 1161} {"train_loss": -5.777677059173584, "global_step": 48796, "epoch": 1161} {"train_loss": -5.666480541229248, "global_step": 48797, "epoch": 1161} {"train_loss": -5.854063034057617, "global_step": 48798, "epoch": 1161} {"train_loss": -5.855334758758545, "global_step": 48799, "epoch": 1161} {"train_loss": -5.793335914611816, "global_step": 48800, "epoch": 1161} {"train_loss": -5.8051910400390625, "global_step": 48801, "epoch": 1161} {"train_loss": -5.8438239097595215, "global_step": 48802, "epoch": 1161} {"train_loss": -5.746292091551281, "global_step": 48803, "epoch": 1161, "val_loss": 66398.40625} {"train_loss": -5.787176609039307, "global_step": 48804, "epoch": 1162} {"train_loss": -5.705452919006348, "global_step": 48805, "epoch": 1162} {"train_loss": -5.680057048797607, "global_step": 48806, "epoch": 1162} {"train_loss": -5.680655479431152, "global_step": 48807, "epoch": 1162} {"train_loss": -5.772322177886963, "global_step": 48808, "epoch": 1162} {"train_loss": -5.702927112579346, "global_step": 48809, "epoch": 1162} {"train_loss": -5.693450927734375, "global_step": 48810, "epoch": 1162} {"train_loss": -5.820107460021973, "global_step": 48811, "epoch": 1162} {"train_loss": -5.713014602661133, "global_step": 48812, "epoch": 1162} {"train_loss": -5.717103481292725, "global_step": 48813, "epoch": 1162} {"train_loss": -5.684121608734131, "global_step": 48814, "epoch": 1162} {"train_loss": -5.663924694061279, "global_step": 48815, "epoch": 1162} {"train_loss": -5.80595588684082, "global_step": 48816, "epoch": 1162} {"train_loss": -5.62593936920166, "global_step": 48817, "epoch": 1162} {"train_loss": -5.789411544799805, "global_step": 48818, "epoch": 1162} {"train_loss": -5.736740589141846, "global_step": 48819, "epoch": 1162} {"train_loss": -5.759703636169434, "global_step": 48820, "epoch": 1162} {"train_loss": -5.687184810638428, "global_step": 48821, "epoch": 1162} {"train_loss": -5.813460350036621, "global_step": 48822, "epoch": 1162} {"train_loss": -5.7537312507629395, "global_step": 48823, "epoch": 1162} {"train_loss": -5.600799083709717, "global_step": 48824, "epoch": 1162} {"train_loss": -5.66823673248291, "global_step": 48825, "epoch": 1162} {"train_loss": -5.713966369628906, "global_step": 48826, "epoch": 1162} {"train_loss": -5.845400333404541, "global_step": 48827, "epoch": 1162} {"train_loss": -5.756898403167725, "global_step": 48828, "epoch": 1162} {"train_loss": -5.790624618530273, "global_step": 48829, "epoch": 1162} {"train_loss": -5.798170566558838, "global_step": 48830, "epoch": 1162} {"train_loss": -5.679435729980469, "global_step": 48831, "epoch": 1162} {"train_loss": -5.679384231567383, "global_step": 48832, "epoch": 1162} {"train_loss": -5.812511444091797, "global_step": 48833, "epoch": 1162} {"train_loss": -5.789848327636719, "global_step": 48834, "epoch": 1162} {"train_loss": -5.569899559020996, "global_step": 48835, "epoch": 1162} {"train_loss": -5.731621265411377, "global_step": 48836, "epoch": 1162} {"train_loss": -5.7948760986328125, "global_step": 48837, "epoch": 1162} {"train_loss": -5.740692615509033, "global_step": 48838, "epoch": 1162} {"train_loss": -5.916658401489258, "global_step": 48839, "epoch": 1162} {"train_loss": -5.683206558227539, "global_step": 48840, "epoch": 1162} {"train_loss": -5.738718032836914, "global_step": 48841, "epoch": 1162} {"train_loss": -5.711663246154785, "global_step": 48842, "epoch": 1162} {"train_loss": -5.726508140563965, "global_step": 48843, "epoch": 1162} {"train_loss": -5.704204082489014, "global_step": 48844, "epoch": 1162} {"train_loss": -5.733128025418236, "global_step": 48845, "epoch": 1162, "val_loss": 65943.2578125} {"train_loss": -5.72686767578125, "global_step": 48846, "epoch": 1163} {"train_loss": -5.730299472808838, "global_step": 48847, "epoch": 1163} {"train_loss": -5.767765522003174, "global_step": 48848, "epoch": 1163} {"train_loss": -5.815446853637695, "global_step": 48849, "epoch": 1163} {"train_loss": -5.788032531738281, "global_step": 48850, "epoch": 1163} {"train_loss": -5.728457450866699, "global_step": 48851, "epoch": 1163} {"train_loss": -5.678983688354492, "global_step": 48852, "epoch": 1163} {"train_loss": -5.707967758178711, "global_step": 48853, "epoch": 1163} {"train_loss": -5.711936950683594, "global_step": 48854, "epoch": 1163} {"train_loss": -5.716461181640625, "global_step": 48855, "epoch": 1163} {"train_loss": -5.752476692199707, "global_step": 48856, "epoch": 1163} {"train_loss": -5.79001522064209, "global_step": 48857, "epoch": 1163} {"train_loss": -5.773005485534668, "global_step": 48858, "epoch": 1163} {"train_loss": -5.656831741333008, "global_step": 48859, "epoch": 1163} {"train_loss": -5.68746280670166, "global_step": 48860, "epoch": 1163} {"train_loss": -5.711321830749512, "global_step": 48861, "epoch": 1163} {"train_loss": -5.823042392730713, "global_step": 48862, "epoch": 1163} {"train_loss": -5.748236656188965, "global_step": 48863, "epoch": 1163} {"train_loss": -5.618837356567383, "global_step": 48864, "epoch": 1163} {"train_loss": -5.669665336608887, "global_step": 48865, "epoch": 1163} {"train_loss": -5.71946907043457, "global_step": 48866, "epoch": 1163} {"train_loss": -5.76114559173584, "global_step": 48867, "epoch": 1163} {"train_loss": -5.582842826843262, "global_step": 48868, "epoch": 1163} {"train_loss": -5.693668365478516, "global_step": 48869, "epoch": 1163} {"train_loss": -5.6362738609313965, "global_step": 48870, "epoch": 1163} {"train_loss": -5.680361270904541, "global_step": 48871, "epoch": 1163} {"train_loss": -5.7682061195373535, "global_step": 48872, "epoch": 1163} {"train_loss": -5.766471862792969, "global_step": 48873, "epoch": 1163} {"train_loss": -5.781837463378906, "global_step": 48874, "epoch": 1163} {"train_loss": -5.726187229156494, "global_step": 48875, "epoch": 1163} {"train_loss": -5.707436561584473, "global_step": 48876, "epoch": 1163} {"train_loss": -5.785556793212891, "global_step": 48877, "epoch": 1163} {"train_loss": -5.733193397521973, "global_step": 48878, "epoch": 1163} {"train_loss": -5.827134132385254, "global_step": 48879, "epoch": 1163} {"train_loss": -5.728145599365234, "global_step": 48880, "epoch": 1163} {"train_loss": -5.756103038787842, "global_step": 48881, "epoch": 1163} {"train_loss": -5.823250770568848, "global_step": 48882, "epoch": 1163} {"train_loss": -5.68524169921875, "global_step": 48883, "epoch": 1163} {"train_loss": -5.724046230316162, "global_step": 48884, "epoch": 1163} {"train_loss": -5.858524322509766, "global_step": 48885, "epoch": 1163} {"train_loss": -5.770560264587402, "global_step": 48886, "epoch": 1163} {"train_loss": -5.736408994311378, "global_step": 48887, "epoch": 1163, "val_loss": 66208.109375} {"train_loss": -5.701807022094727, "global_step": 48888, "epoch": 1164} {"train_loss": -5.801555633544922, "global_step": 48889, "epoch": 1164} {"train_loss": -5.7327561378479, "global_step": 48890, "epoch": 1164} {"train_loss": -5.734381675720215, "global_step": 48891, "epoch": 1164} {"train_loss": -5.949054718017578, "global_step": 48892, "epoch": 1164} {"train_loss": -5.749372482299805, "global_step": 48893, "epoch": 1164} {"train_loss": -5.625194549560547, "global_step": 48894, "epoch": 1164} {"train_loss": -5.802248954772949, "global_step": 48895, "epoch": 1164} {"train_loss": -5.7000732421875, "global_step": 48896, "epoch": 1164} {"train_loss": -5.728483200073242, "global_step": 48897, "epoch": 1164} {"train_loss": -5.78790283203125, "global_step": 48898, "epoch": 1164} {"train_loss": -5.713034629821777, "global_step": 48899, "epoch": 1164} {"train_loss": -5.718692302703857, "global_step": 48900, "epoch": 1164} {"train_loss": -5.852710247039795, "global_step": 48901, "epoch": 1164} {"train_loss": -5.729079723358154, "global_step": 48902, "epoch": 1164} {"train_loss": -5.793106555938721, "global_step": 48903, "epoch": 1164} {"train_loss": -5.737116813659668, "global_step": 48904, "epoch": 1164} {"train_loss": -5.662687301635742, "global_step": 48905, "epoch": 1164} {"train_loss": -5.745319366455078, "global_step": 48906, "epoch": 1164} {"train_loss": -5.670568466186523, "global_step": 48907, "epoch": 1164} {"train_loss": -5.730095863342285, "global_step": 48908, "epoch": 1164} {"train_loss": -5.701253890991211, "global_step": 48909, "epoch": 1164} {"train_loss": -5.722177028656006, "global_step": 48910, "epoch": 1164} {"train_loss": -5.655023097991943, "global_step": 48911, "epoch": 1164} {"train_loss": -5.790707588195801, "global_step": 48912, "epoch": 1164} {"train_loss": -5.713019371032715, "global_step": 48913, "epoch": 1164} {"train_loss": -5.548440933227539, "global_step": 48914, "epoch": 1164} {"train_loss": -5.832106590270996, "global_step": 48915, "epoch": 1164} {"train_loss": -5.66666841506958, "global_step": 48916, "epoch": 1164} {"train_loss": -5.622942924499512, "global_step": 48917, "epoch": 1164} {"train_loss": -5.731948375701904, "global_step": 48918, "epoch": 1164} {"train_loss": -5.451850414276123, "global_step": 48919, "epoch": 1164} {"train_loss": -5.614190101623535, "global_step": 48920, "epoch": 1164} {"train_loss": -5.608956336975098, "global_step": 48921, "epoch": 1164} {"train_loss": -5.78238582611084, "global_step": 48922, "epoch": 1164} {"train_loss": -5.629735946655273, "global_step": 48923, "epoch": 1164} {"train_loss": -5.629289627075195, "global_step": 48924, "epoch": 1164} {"train_loss": -5.822059631347656, "global_step": 48925, "epoch": 1164} {"train_loss": -5.733302593231201, "global_step": 48926, "epoch": 1164} {"train_loss": -5.638389587402344, "global_step": 48927, "epoch": 1164} {"train_loss": -5.67038631439209, "global_step": 48928, "epoch": 1164} {"train_loss": -5.711459216617403, "global_step": 48929, "epoch": 1164, "val_loss": 66103.640625} {"train_loss": -5.842953681945801, "global_step": 48930, "epoch": 1165} {"train_loss": -5.903036117553711, "global_step": 48931, "epoch": 1165} {"train_loss": -5.63007926940918, "global_step": 48932, "epoch": 1165} {"train_loss": -5.736681938171387, "global_step": 48933, "epoch": 1165} {"train_loss": -5.753582000732422, "global_step": 48934, "epoch": 1165} {"train_loss": -5.6911091804504395, "global_step": 48935, "epoch": 1165} {"train_loss": -5.765256404876709, "global_step": 48936, "epoch": 1165} {"train_loss": -5.752424716949463, "global_step": 48937, "epoch": 1165} {"train_loss": -5.475376605987549, "global_step": 48938, "epoch": 1165} {"train_loss": -5.789193630218506, "global_step": 48939, "epoch": 1165} {"train_loss": -5.746971130371094, "global_step": 48940, "epoch": 1165} {"train_loss": -5.6460418701171875, "global_step": 48941, "epoch": 1165} {"train_loss": -5.778965473175049, "global_step": 48942, "epoch": 1165} {"train_loss": -5.574855804443359, "global_step": 48943, "epoch": 1165} {"train_loss": -5.755683422088623, "global_step": 48944, "epoch": 1165} {"train_loss": -5.738791465759277, "global_step": 48945, "epoch": 1165} {"train_loss": -5.792065620422363, "global_step": 48946, "epoch": 1165} {"train_loss": -5.743456840515137, "global_step": 48947, "epoch": 1165} {"train_loss": -5.6935319900512695, "global_step": 48948, "epoch": 1165} {"train_loss": -5.679116725921631, "global_step": 48949, "epoch": 1165} {"train_loss": -5.748220920562744, "global_step": 48950, "epoch": 1165} {"train_loss": -5.594388961791992, "global_step": 48951, "epoch": 1165} {"train_loss": -5.609747409820557, "global_step": 48952, "epoch": 1165} {"train_loss": -5.633398056030273, "global_step": 48953, "epoch": 1165} {"train_loss": -5.679143905639648, "global_step": 48954, "epoch": 1165} {"train_loss": -5.728496074676514, "global_step": 48955, "epoch": 1165} {"train_loss": -5.723352432250977, "global_step": 48956, "epoch": 1165} {"train_loss": -5.753624439239502, "global_step": 48957, "epoch": 1165} {"train_loss": -5.668871879577637, "global_step": 48958, "epoch": 1165} {"train_loss": -5.804570198059082, "global_step": 48959, "epoch": 1165} {"train_loss": -5.757190227508545, "global_step": 48960, "epoch": 1165} {"train_loss": -5.779997825622559, "global_step": 48961, "epoch": 1165} {"train_loss": -5.7120513916015625, "global_step": 48962, "epoch": 1165} {"train_loss": -5.707690715789795, "global_step": 48963, "epoch": 1165} {"train_loss": -5.71038293838501, "global_step": 48964, "epoch": 1165} {"train_loss": -5.8216657638549805, "global_step": 48965, "epoch": 1165} {"train_loss": -5.671228885650635, "global_step": 48966, "epoch": 1165} {"train_loss": -5.7804412841796875, "global_step": 48967, "epoch": 1165} {"train_loss": -5.837858200073242, "global_step": 48968, "epoch": 1165} {"train_loss": -5.651097297668457, "global_step": 48969, "epoch": 1165} {"train_loss": -5.686481475830078, "global_step": 48970, "epoch": 1165} {"train_loss": -5.724266426903861, "global_step": 48971, "epoch": 1165, "val_loss": 66356.4921875} {"train_loss": -5.615006446838379, "global_step": 48972, "epoch": 1166} {"train_loss": -5.674619197845459, "global_step": 48973, "epoch": 1166} {"train_loss": -5.754847526550293, "global_step": 48974, "epoch": 1166} {"train_loss": -5.72966194152832, "global_step": 48975, "epoch": 1166} {"train_loss": -5.740574836730957, "global_step": 48976, "epoch": 1166} {"train_loss": -5.619376182556152, "global_step": 48977, "epoch": 1166} {"train_loss": -5.871711254119873, "global_step": 48978, "epoch": 1166} {"train_loss": -5.664393901824951, "global_step": 48979, "epoch": 1166} {"train_loss": -5.648202896118164, "global_step": 48980, "epoch": 1166} {"train_loss": -5.83359432220459, "global_step": 48981, "epoch": 1166} {"train_loss": -5.693274021148682, "global_step": 48982, "epoch": 1166} {"train_loss": -5.727189064025879, "global_step": 48983, "epoch": 1166} {"train_loss": -5.619524955749512, "global_step": 48984, "epoch": 1166} {"train_loss": -5.752711296081543, "global_step": 48985, "epoch": 1166} {"train_loss": -5.730852127075195, "global_step": 48986, "epoch": 1166} {"train_loss": -5.716894626617432, "global_step": 48987, "epoch": 1166} {"train_loss": -5.754091262817383, "global_step": 48988, "epoch": 1166} {"train_loss": -5.809233665466309, "global_step": 48989, "epoch": 1166} {"train_loss": -5.802012920379639, "global_step": 48990, "epoch": 1166} {"train_loss": -5.669865131378174, "global_step": 48991, "epoch": 1166} {"train_loss": -5.862978935241699, "global_step": 48992, "epoch": 1166} {"train_loss": -5.63765287399292, "global_step": 48993, "epoch": 1166} {"train_loss": -5.837902069091797, "global_step": 48994, "epoch": 1166} {"train_loss": -5.695796966552734, "global_step": 48995, "epoch": 1166} {"train_loss": -5.654935359954834, "global_step": 48996, "epoch": 1166} {"train_loss": -5.740081787109375, "global_step": 48997, "epoch": 1166} {"train_loss": -5.64194393157959, "global_step": 48998, "epoch": 1166} {"train_loss": -5.781014442443848, "global_step": 48999, "epoch": 1166} {"train_loss": -5.883746147155762, "global_step": 49000, "epoch": 1166} {"train_loss": -5.729607582092285, "global_step": 49001, "epoch": 1166} {"train_loss": -5.765056610107422, "global_step": 49002, "epoch": 1166} {"train_loss": -5.69462776184082, "global_step": 49003, "epoch": 1166} {"train_loss": -5.750388145446777, "global_step": 49004, "epoch": 1166} {"train_loss": -5.805066108703613, "global_step": 49005, "epoch": 1166} {"train_loss": -5.739675521850586, "global_step": 49006, "epoch": 1166} {"train_loss": -5.687954902648926, "global_step": 49007, "epoch": 1166} {"train_loss": -5.769258499145508, "global_step": 49008, "epoch": 1166} {"train_loss": -5.805558681488037, "global_step": 49009, "epoch": 1166} {"train_loss": -5.73583984375, "global_step": 49010, "epoch": 1166} {"train_loss": -5.708288192749023, "global_step": 49011, "epoch": 1166} {"train_loss": -5.816769123077393, "global_step": 49012, "epoch": 1166} {"train_loss": -5.732569410687401, "global_step": 49013, "epoch": 1166, "val_loss": 66087.2734375} {"train_loss": -5.682454586029053, "global_step": 49014, "epoch": 1167} {"train_loss": -5.752642631530762, "global_step": 49015, "epoch": 1167} {"train_loss": -5.69575834274292, "global_step": 49016, "epoch": 1167} {"train_loss": -5.648751258850098, "global_step": 49017, "epoch": 1167} {"train_loss": -5.795261383056641, "global_step": 49018, "epoch": 1167} {"train_loss": -5.5824384689331055, "global_step": 49019, "epoch": 1167} {"train_loss": -5.760473728179932, "global_step": 49020, "epoch": 1167} {"train_loss": -5.700249671936035, "global_step": 49021, "epoch": 1167} {"train_loss": -5.604724884033203, "global_step": 49022, "epoch": 1167} {"train_loss": -5.7102861404418945, "global_step": 49023, "epoch": 1167} {"train_loss": -5.60584020614624, "global_step": 49024, "epoch": 1167} {"train_loss": -5.7012834548950195, "global_step": 49025, "epoch": 1167} {"train_loss": -5.841491222381592, "global_step": 49026, "epoch": 1167} {"train_loss": -5.69581413269043, "global_step": 49027, "epoch": 1167} {"train_loss": -5.647400856018066, "global_step": 49028, "epoch": 1167} {"train_loss": -5.735119819641113, "global_step": 49029, "epoch": 1167} {"train_loss": -5.726500511169434, "global_step": 49030, "epoch": 1167} {"train_loss": -5.697815895080566, "global_step": 49031, "epoch": 1167} {"train_loss": -5.7701592445373535, "global_step": 49032, "epoch": 1167} {"train_loss": -5.690181732177734, "global_step": 49033, "epoch": 1167} {"train_loss": -5.673357009887695, "global_step": 49034, "epoch": 1167} {"train_loss": -5.6601057052612305, "global_step": 49035, "epoch": 1167} {"train_loss": -5.804293632507324, "global_step": 49036, "epoch": 1167} {"train_loss": -5.718784332275391, "global_step": 49037, "epoch": 1167} {"train_loss": -5.591287612915039, "global_step": 49038, "epoch": 1167} {"train_loss": -5.635676383972168, "global_step": 49039, "epoch": 1167} {"train_loss": -5.586179733276367, "global_step": 49040, "epoch": 1167} {"train_loss": -5.529618740081787, "global_step": 49041, "epoch": 1167} {"train_loss": -5.715882301330566, "global_step": 49042, "epoch": 1167} {"train_loss": -5.698156356811523, "global_step": 49043, "epoch": 1167} {"train_loss": -5.732184410095215, "global_step": 49044, "epoch": 1167} {"train_loss": -5.73336935043335, "global_step": 49045, "epoch": 1167} {"train_loss": -5.670698165893555, "global_step": 49046, "epoch": 1167} {"train_loss": -5.7076921463012695, "global_step": 49047, "epoch": 1167} {"train_loss": -5.759805679321289, "global_step": 49048, "epoch": 1167} {"train_loss": -5.774085998535156, "global_step": 49049, "epoch": 1167} {"train_loss": -5.803284168243408, "global_step": 49050, "epoch": 1167} {"train_loss": -5.864083290100098, "global_step": 49051, "epoch": 1167} {"train_loss": -5.692936897277832, "global_step": 49052, "epoch": 1167} {"train_loss": -5.7087578773498535, "global_step": 49053, "epoch": 1167} {"train_loss": -5.761822700500488, "global_step": 49054, "epoch": 1167} {"train_loss": -5.704899186179752, "global_step": 49055, "epoch": 1167, "val_loss": 66279.3671875} {"train_loss": -5.656747817993164, "global_step": 49056, "epoch": 1168} {"train_loss": -5.675518035888672, "global_step": 49057, "epoch": 1168} {"train_loss": -5.799983978271484, "global_step": 49058, "epoch": 1168} {"train_loss": -5.783999443054199, "global_step": 49059, "epoch": 1168} {"train_loss": -5.745214462280273, "global_step": 49060, "epoch": 1168} {"train_loss": -5.7868523597717285, "global_step": 49061, "epoch": 1168} {"train_loss": -5.855639934539795, "global_step": 49062, "epoch": 1168} {"train_loss": -5.732881546020508, "global_step": 49063, "epoch": 1168} {"train_loss": -5.859708786010742, "global_step": 49064, "epoch": 1168} {"train_loss": -5.705315589904785, "global_step": 49065, "epoch": 1168} {"train_loss": -5.770046234130859, "global_step": 49066, "epoch": 1168} {"train_loss": -5.8616485595703125, "global_step": 49067, "epoch": 1168} {"train_loss": -5.654162406921387, "global_step": 49068, "epoch": 1168} {"train_loss": -5.82065486907959, "global_step": 49069, "epoch": 1168} {"train_loss": -5.812570571899414, "global_step": 49070, "epoch": 1168} {"train_loss": -5.642390727996826, "global_step": 49071, "epoch": 1168} {"train_loss": -5.743365287780762, "global_step": 49072, "epoch": 1168} {"train_loss": -5.796986103057861, "global_step": 49073, "epoch": 1168} {"train_loss": -5.687636375427246, "global_step": 49074, "epoch": 1168} {"train_loss": -5.805436611175537, "global_step": 49075, "epoch": 1168} {"train_loss": -5.823737621307373, "global_step": 49076, "epoch": 1168} {"train_loss": -5.808012008666992, "global_step": 49077, "epoch": 1168} {"train_loss": -5.623599052429199, "global_step": 49078, "epoch": 1168} {"train_loss": -5.881319999694824, "global_step": 49079, "epoch": 1168} {"train_loss": -5.816632270812988, "global_step": 49080, "epoch": 1168} {"train_loss": -5.597268581390381, "global_step": 49081, "epoch": 1168} {"train_loss": -5.715515613555908, "global_step": 49082, "epoch": 1168} {"train_loss": -5.8288254737854, "global_step": 49083, "epoch": 1168} {"train_loss": -5.706055641174316, "global_step": 49084, "epoch": 1168} {"train_loss": -5.779897689819336, "global_step": 49085, "epoch": 1168} {"train_loss": -5.775729179382324, "global_step": 49086, "epoch": 1168} {"train_loss": -5.731757164001465, "global_step": 49087, "epoch": 1168} {"train_loss": -5.758284568786621, "global_step": 49088, "epoch": 1168} {"train_loss": -5.543094635009766, "global_step": 49089, "epoch": 1168} {"train_loss": -5.782214164733887, "global_step": 49090, "epoch": 1168} {"train_loss": -5.71262264251709, "global_step": 49091, "epoch": 1168} {"train_loss": -5.715648174285889, "global_step": 49092, "epoch": 1168} {"train_loss": -5.820338249206543, "global_step": 49093, "epoch": 1168} {"train_loss": -5.868886947631836, "global_step": 49094, "epoch": 1168} {"train_loss": -5.889150619506836, "global_step": 49095, "epoch": 1168} {"train_loss": -5.738236427307129, "global_step": 49096, "epoch": 1168} {"train_loss": -5.758673543021793, "global_step": 49097, "epoch": 1168, "val_loss": 66314.3359375} {"train_loss": -5.825613498687744, "global_step": 49098, "epoch": 1169} {"train_loss": -5.6748552322387695, "global_step": 49099, "epoch": 1169} {"train_loss": -5.840075492858887, "global_step": 49100, "epoch": 1169} {"train_loss": -5.742058753967285, "global_step": 49101, "epoch": 1169} {"train_loss": -5.7073750495910645, "global_step": 49102, "epoch": 1169} {"train_loss": -5.8489227294921875, "global_step": 49103, "epoch": 1169} {"train_loss": -5.821809768676758, "global_step": 49104, "epoch": 1169} {"train_loss": -5.698299884796143, "global_step": 49105, "epoch": 1169} {"train_loss": -5.805942535400391, "global_step": 49106, "epoch": 1169} {"train_loss": -5.924635887145996, "global_step": 49107, "epoch": 1169} {"train_loss": -5.8944902420043945, "global_step": 49108, "epoch": 1169} {"train_loss": -5.735552787780762, "global_step": 49109, "epoch": 1169} {"train_loss": -5.829707622528076, "global_step": 49110, "epoch": 1169} {"train_loss": -5.814820289611816, "global_step": 49111, "epoch": 1169} {"train_loss": -5.747413635253906, "global_step": 49112, "epoch": 1169} {"train_loss": -5.670459747314453, "global_step": 49113, "epoch": 1169} {"train_loss": -5.726938247680664, "global_step": 49114, "epoch": 1169} {"train_loss": -5.691188812255859, "global_step": 49115, "epoch": 1169} {"train_loss": -5.6881256103515625, "global_step": 49116, "epoch": 1169} {"train_loss": -5.7403364181518555, "global_step": 49117, "epoch": 1169} {"train_loss": -5.641292572021484, "global_step": 49118, "epoch": 1169} {"train_loss": -5.8086652755737305, "global_step": 49119, "epoch": 1169} {"train_loss": -5.750218868255615, "global_step": 49120, "epoch": 1169} {"train_loss": -5.68577766418457, "global_step": 49121, "epoch": 1169} {"train_loss": -5.655582427978516, "global_step": 49122, "epoch": 1169} {"train_loss": -5.734508037567139, "global_step": 49123, "epoch": 1169} {"train_loss": -5.745021820068359, "global_step": 49124, "epoch": 1169} {"train_loss": -5.759381294250488, "global_step": 49125, "epoch": 1169} {"train_loss": -5.856890678405762, "global_step": 49126, "epoch": 1169} {"train_loss": -5.839294910430908, "global_step": 49127, "epoch": 1169} {"train_loss": -5.799544811248779, "global_step": 49128, "epoch": 1169} {"train_loss": -5.689265251159668, "global_step": 49129, "epoch": 1169} {"train_loss": -5.682796955108643, "global_step": 49130, "epoch": 1169} {"train_loss": -5.605034351348877, "global_step": 49131, "epoch": 1169} {"train_loss": -5.67666482925415, "global_step": 49132, "epoch": 1169} {"train_loss": -5.743559837341309, "global_step": 49133, "epoch": 1169} {"train_loss": -5.700602054595947, "global_step": 49134, "epoch": 1169} {"train_loss": -5.761115074157715, "global_step": 49135, "epoch": 1169} {"train_loss": -5.6537017822265625, "global_step": 49136, "epoch": 1169} {"train_loss": -5.707663536071777, "global_step": 49137, "epoch": 1169} {"train_loss": -5.539727210998535, "global_step": 49138, "epoch": 1169} {"train_loss": -5.7416357199351, "global_step": 49139, "epoch": 1169, "val_loss": 65997.9609375} {"train_loss": -5.828537940979004, "global_step": 49140, "epoch": 1170} {"train_loss": -5.799416542053223, "global_step": 49141, "epoch": 1170} {"train_loss": -5.6926164627075195, "global_step": 49142, "epoch": 1170} {"train_loss": -5.7258148193359375, "global_step": 49143, "epoch": 1170} {"train_loss": -5.765961647033691, "global_step": 49144, "epoch": 1170} {"train_loss": -5.812394142150879, "global_step": 49145, "epoch": 1170} {"train_loss": -5.730058670043945, "global_step": 49146, "epoch": 1170} {"train_loss": -5.799970626831055, "global_step": 49147, "epoch": 1170} {"train_loss": -5.75193977355957, "global_step": 49148, "epoch": 1170} {"train_loss": -5.829926490783691, "global_step": 49149, "epoch": 1170} {"train_loss": -5.705350875854492, "global_step": 49150, "epoch": 1170} {"train_loss": -5.749718189239502, "global_step": 49151, "epoch": 1170} {"train_loss": -5.6618523597717285, "global_step": 49152, "epoch": 1170} {"train_loss": -5.814352035522461, "global_step": 49153, "epoch": 1170} {"train_loss": -5.677942276000977, "global_step": 49154, "epoch": 1170} {"train_loss": -5.757991790771484, "global_step": 49155, "epoch": 1170} {"train_loss": -5.821268081665039, "global_step": 49156, "epoch": 1170} {"train_loss": -5.665295124053955, "global_step": 49157, "epoch": 1170} {"train_loss": -5.654068946838379, "global_step": 49158, "epoch": 1170} {"train_loss": -5.748422622680664, "global_step": 49159, "epoch": 1170} {"train_loss": -5.762001991271973, "global_step": 49160, "epoch": 1170} {"train_loss": -5.696554183959961, "global_step": 49161, "epoch": 1170} {"train_loss": -5.834076881408691, "global_step": 49162, "epoch": 1170} {"train_loss": -5.7062668800354, "global_step": 49163, "epoch": 1170} {"train_loss": -5.778976917266846, "global_step": 49164, "epoch": 1170} {"train_loss": -5.737589359283447, "global_step": 49165, "epoch": 1170} {"train_loss": -5.682030200958252, "global_step": 49166, "epoch": 1170} {"train_loss": -5.736411094665527, "global_step": 49167, "epoch": 1170} {"train_loss": -5.616460800170898, "global_step": 49168, "epoch": 1170} {"train_loss": -5.714735984802246, "global_step": 49169, "epoch": 1170} {"train_loss": -5.737922191619873, "global_step": 49170, "epoch": 1170} {"train_loss": -5.684380531311035, "global_step": 49171, "epoch": 1170} {"train_loss": -5.820085048675537, "global_step": 49172, "epoch": 1170} {"train_loss": -5.654087543487549, "global_step": 49173, "epoch": 1170} {"train_loss": -5.698148727416992, "global_step": 49174, "epoch": 1170} {"train_loss": -5.815719127655029, "global_step": 49175, "epoch": 1170} {"train_loss": -5.726062774658203, "global_step": 49176, "epoch": 1170} {"train_loss": -5.78630256652832, "global_step": 49177, "epoch": 1170} {"train_loss": -5.80073356628418, "global_step": 49178, "epoch": 1170} {"train_loss": -5.699039459228516, "global_step": 49179, "epoch": 1170} {"train_loss": -5.683352947235107, "global_step": 49180, "epoch": 1170} {"train_loss": -5.739473569960821, "global_step": 49181, "epoch": 1170, "val_loss": 66302.609375} {"train_loss": -5.740799903869629, "global_step": 49182, "epoch": 1171} {"train_loss": -5.728696823120117, "global_step": 49183, "epoch": 1171} {"train_loss": -5.8192901611328125, "global_step": 49184, "epoch": 1171} {"train_loss": -5.814791679382324, "global_step": 49185, "epoch": 1171} {"train_loss": -5.791323661804199, "global_step": 49186, "epoch": 1171} {"train_loss": -5.818777561187744, "global_step": 49187, "epoch": 1171} {"train_loss": -5.68718147277832, "global_step": 49188, "epoch": 1171} {"train_loss": -5.873229503631592, "global_step": 49189, "epoch": 1171} {"train_loss": -5.784762382507324, "global_step": 49190, "epoch": 1171} {"train_loss": -5.873538970947266, "global_step": 49191, "epoch": 1171} {"train_loss": -5.849400520324707, "global_step": 49192, "epoch": 1171} {"train_loss": -5.750040531158447, "global_step": 49193, "epoch": 1171} {"train_loss": -5.845530986785889, "global_step": 49194, "epoch": 1171} {"train_loss": -5.828373908996582, "global_step": 49195, "epoch": 1171} {"train_loss": -5.659628391265869, "global_step": 49196, "epoch": 1171} {"train_loss": -5.806936264038086, "global_step": 49197, "epoch": 1171} {"train_loss": -5.695920467376709, "global_step": 49198, "epoch": 1171} {"train_loss": -5.780913829803467, "global_step": 49199, "epoch": 1171} {"train_loss": -5.731932163238525, "global_step": 49200, "epoch": 1171} {"train_loss": -5.670507431030273, "global_step": 49201, "epoch": 1171} {"train_loss": -5.6271796226501465, "global_step": 49202, "epoch": 1171} {"train_loss": -5.732087135314941, "global_step": 49203, "epoch": 1171} {"train_loss": -5.875545024871826, "global_step": 49204, "epoch": 1171} {"train_loss": -5.805776596069336, "global_step": 49205, "epoch": 1171} {"train_loss": -5.786737442016602, "global_step": 49206, "epoch": 1171} {"train_loss": -5.824182510375977, "global_step": 49207, "epoch": 1171} {"train_loss": -5.8642449378967285, "global_step": 49208, "epoch": 1171} {"train_loss": -5.7392377853393555, "global_step": 49209, "epoch": 1171} {"train_loss": -5.721838474273682, "global_step": 49210, "epoch": 1171} {"train_loss": -5.750744819641113, "global_step": 49211, "epoch": 1171} {"train_loss": -5.849672317504883, "global_step": 49212, "epoch": 1171} {"train_loss": -5.692433834075928, "global_step": 49213, "epoch": 1171} {"train_loss": -5.671677589416504, "global_step": 49214, "epoch": 1171} {"train_loss": -5.721172332763672, "global_step": 49215, "epoch": 1171} {"train_loss": -5.655037879943848, "global_step": 49216, "epoch": 1171} {"train_loss": -5.697203159332275, "global_step": 49217, "epoch": 1171} {"train_loss": -5.768564224243164, "global_step": 49218, "epoch": 1171} {"train_loss": -5.637166976928711, "global_step": 49219, "epoch": 1171} {"train_loss": -5.8093976974487305, "global_step": 49220, "epoch": 1171} {"train_loss": -5.769012451171875, "global_step": 49221, "epoch": 1171} {"train_loss": -5.648383617401123, "global_step": 49222, "epoch": 1171} {"train_loss": -5.760833751587641, "global_step": 49223, "epoch": 1171, "val_loss": 66346.3984375} {"train_loss": -5.7369585037231445, "global_step": 49224, "epoch": 1172} {"train_loss": -5.8230767250061035, "global_step": 49225, "epoch": 1172} {"train_loss": -5.727274417877197, "global_step": 49226, "epoch": 1172} {"train_loss": -5.796291828155518, "global_step": 49227, "epoch": 1172} {"train_loss": -5.668880462646484, "global_step": 49228, "epoch": 1172} {"train_loss": -5.7527594566345215, "global_step": 49229, "epoch": 1172} {"train_loss": -5.701674461364746, "global_step": 49230, "epoch": 1172} {"train_loss": -5.680764198303223, "global_step": 49231, "epoch": 1172} {"train_loss": -5.826378345489502, "global_step": 49232, "epoch": 1172} {"train_loss": -5.681787967681885, "global_step": 49233, "epoch": 1172} {"train_loss": -5.798130989074707, "global_step": 49234, "epoch": 1172} {"train_loss": -5.812808990478516, "global_step": 49235, "epoch": 1172} {"train_loss": -5.593420028686523, "global_step": 49236, "epoch": 1172} {"train_loss": -5.7855000495910645, "global_step": 49237, "epoch": 1172} {"train_loss": -5.7939958572387695, "global_step": 49238, "epoch": 1172} {"train_loss": -5.718530654907227, "global_step": 49239, "epoch": 1172} {"train_loss": -5.698115825653076, "global_step": 49240, "epoch": 1172} {"train_loss": -5.627266883850098, "global_step": 49241, "epoch": 1172} {"train_loss": -5.820412635803223, "global_step": 49242, "epoch": 1172} {"train_loss": -5.8275957107543945, "global_step": 49243, "epoch": 1172} {"train_loss": -5.689821720123291, "global_step": 49244, "epoch": 1172} {"train_loss": -5.804989814758301, "global_step": 49245, "epoch": 1172} {"train_loss": -5.753966808319092, "global_step": 49246, "epoch": 1172} {"train_loss": -5.589620590209961, "global_step": 49247, "epoch": 1172} {"train_loss": -5.632603645324707, "global_step": 49248, "epoch": 1172} {"train_loss": -5.727718353271484, "global_step": 49249, "epoch": 1172} {"train_loss": -5.718781471252441, "global_step": 49250, "epoch": 1172} {"train_loss": -5.866987228393555, "global_step": 49251, "epoch": 1172} {"train_loss": -5.566014289855957, "global_step": 49252, "epoch": 1172} {"train_loss": -5.786726951599121, "global_step": 49253, "epoch": 1172} {"train_loss": -5.766299247741699, "global_step": 49254, "epoch": 1172} {"train_loss": -5.683422088623047, "global_step": 49255, "epoch": 1172} {"train_loss": -5.739686489105225, "global_step": 49256, "epoch": 1172} {"train_loss": -5.760689735412598, "global_step": 49257, "epoch": 1172} {"train_loss": -5.67940616607666, "global_step": 49258, "epoch": 1172} {"train_loss": -5.720370292663574, "global_step": 49259, "epoch": 1172} {"train_loss": -5.778589725494385, "global_step": 49260, "epoch": 1172} {"train_loss": -5.76455020904541, "global_step": 49261, "epoch": 1172} {"train_loss": -5.701443672180176, "global_step": 49262, "epoch": 1172} {"train_loss": -5.924151420593262, "global_step": 49263, "epoch": 1172} {"train_loss": -5.529996395111084, "global_step": 49264, "epoch": 1172} {"train_loss": -5.731618404388428, "global_step": 49265, "epoch": 1172, "val_loss": 66006.3359375} {"train_loss": -5.743332862854004, "global_step": 49266, "epoch": 1173} {"train_loss": -5.721783638000488, "global_step": 49267, "epoch": 1173} {"train_loss": -5.735637664794922, "global_step": 49268, "epoch": 1173} {"train_loss": -5.746726036071777, "global_step": 49269, "epoch": 1173} {"train_loss": -5.760800361633301, "global_step": 49270, "epoch": 1173} {"train_loss": -5.7518391609191895, "global_step": 49271, "epoch": 1173} {"train_loss": -5.706598281860352, "global_step": 49272, "epoch": 1173} {"train_loss": -5.72783088684082, "global_step": 49273, "epoch": 1173} {"train_loss": -5.7693634033203125, "global_step": 49274, "epoch": 1173} {"train_loss": -5.753847599029541, "global_step": 49275, "epoch": 1173} {"train_loss": -5.723918914794922, "global_step": 49276, "epoch": 1173} {"train_loss": -5.711190223693848, "global_step": 49277, "epoch": 1173} {"train_loss": -5.791367530822754, "global_step": 49278, "epoch": 1173} {"train_loss": -5.834280490875244, "global_step": 49279, "epoch": 1173} {"train_loss": -5.805209636688232, "global_step": 49280, "epoch": 1173} {"train_loss": -5.937554359436035, "global_step": 49281, "epoch": 1173} {"train_loss": -5.837444305419922, "global_step": 49282, "epoch": 1173} {"train_loss": -5.620807647705078, "global_step": 49283, "epoch": 1173} {"train_loss": -5.6470184326171875, "global_step": 49284, "epoch": 1173} {"train_loss": -5.858208656311035, "global_step": 49285, "epoch": 1173} {"train_loss": -5.716911315917969, "global_step": 49286, "epoch": 1173} {"train_loss": -5.7200775146484375, "global_step": 49287, "epoch": 1173} {"train_loss": -5.7395920753479, "global_step": 49288, "epoch": 1173} {"train_loss": -5.83079719543457, "global_step": 49289, "epoch": 1173} {"train_loss": -5.711472511291504, "global_step": 49290, "epoch": 1173} {"train_loss": -5.54484748840332, "global_step": 49291, "epoch": 1173} {"train_loss": -5.815478324890137, "global_step": 49292, "epoch": 1173} {"train_loss": -5.548514366149902, "global_step": 49293, "epoch": 1173} {"train_loss": -5.670802116394043, "global_step": 49294, "epoch": 1173} {"train_loss": -5.750115871429443, "global_step": 49295, "epoch": 1173} {"train_loss": -5.797657489776611, "global_step": 49296, "epoch": 1173} {"train_loss": -5.6354827880859375, "global_step": 49297, "epoch": 1173} {"train_loss": -5.818892478942871, "global_step": 49298, "epoch": 1173} {"train_loss": -5.719148635864258, "global_step": 49299, "epoch": 1173} {"train_loss": -5.692897796630859, "global_step": 49300, "epoch": 1173} {"train_loss": -5.9266815185546875, "global_step": 49301, "epoch": 1173} {"train_loss": -5.818775177001953, "global_step": 49302, "epoch": 1173} {"train_loss": -5.836404323577881, "global_step": 49303, "epoch": 1173} {"train_loss": -5.688955307006836, "global_step": 49304, "epoch": 1173} {"train_loss": -5.681380748748779, "global_step": 49305, "epoch": 1173} {"train_loss": -5.79496955871582, "global_step": 49306, "epoch": 1173} {"train_loss": -5.750335568473453, "global_step": 49307, "epoch": 1173, "val_loss": 66149.1640625} {"train_loss": -5.798846244812012, "global_step": 49308, "epoch": 1174} {"train_loss": -5.681756973266602, "global_step": 49309, "epoch": 1174} {"train_loss": -5.744836807250977, "global_step": 49310, "epoch": 1174} {"train_loss": -5.8752288818359375, "global_step": 49311, "epoch": 1174} {"train_loss": -5.801023483276367, "global_step": 49312, "epoch": 1174} {"train_loss": -5.829185485839844, "global_step": 49313, "epoch": 1174} {"train_loss": -5.818244934082031, "global_step": 49314, "epoch": 1174} {"train_loss": -5.7873053550720215, "global_step": 49315, "epoch": 1174} {"train_loss": -5.779831409454346, "global_step": 49316, "epoch": 1174} {"train_loss": -5.767085552215576, "global_step": 49317, "epoch": 1174} {"train_loss": -5.789142608642578, "global_step": 49318, "epoch": 1174} {"train_loss": -5.624580383300781, "global_step": 49319, "epoch": 1174} {"train_loss": -5.731087684631348, "global_step": 49320, "epoch": 1174} {"train_loss": -5.687475681304932, "global_step": 49321, "epoch": 1174} {"train_loss": -5.711764812469482, "global_step": 49322, "epoch": 1174} {"train_loss": -5.8294243812561035, "global_step": 49323, "epoch": 1174} {"train_loss": -5.645143508911133, "global_step": 49324, "epoch": 1174} {"train_loss": -5.834347248077393, "global_step": 49325, "epoch": 1174} {"train_loss": -5.715494155883789, "global_step": 49326, "epoch": 1174} {"train_loss": -5.825323104858398, "global_step": 49327, "epoch": 1174} {"train_loss": -5.803906440734863, "global_step": 49328, "epoch": 1174} {"train_loss": -5.622779369354248, "global_step": 49329, "epoch": 1174} {"train_loss": -5.76679801940918, "global_step": 49330, "epoch": 1174} {"train_loss": -5.6241679191589355, "global_step": 49331, "epoch": 1174} {"train_loss": -5.740691661834717, "global_step": 49332, "epoch": 1174} {"train_loss": -5.892121315002441, "global_step": 49333, "epoch": 1174} {"train_loss": -5.593507766723633, "global_step": 49334, "epoch": 1174} {"train_loss": -5.73099422454834, "global_step": 49335, "epoch": 1174} {"train_loss": -5.741757392883301, "global_step": 49336, "epoch": 1174} {"train_loss": -5.723858833312988, "global_step": 49337, "epoch": 1174} {"train_loss": -5.684498310089111, "global_step": 49338, "epoch": 1174} {"train_loss": -5.765069007873535, "global_step": 49339, "epoch": 1174} {"train_loss": -5.81606388092041, "global_step": 49340, "epoch": 1174} {"train_loss": -5.687930107116699, "global_step": 49341, "epoch": 1174} {"train_loss": -5.645729064941406, "global_step": 49342, "epoch": 1174} {"train_loss": -5.798867225646973, "global_step": 49343, "epoch": 1174} {"train_loss": -5.791778087615967, "global_step": 49344, "epoch": 1174} {"train_loss": -5.74846887588501, "global_step": 49345, "epoch": 1174} {"train_loss": -5.775666236877441, "global_step": 49346, "epoch": 1174} {"train_loss": -5.849120140075684, "global_step": 49347, "epoch": 1174} {"train_loss": -5.582606315612793, "global_step": 49348, "epoch": 1174} {"train_loss": -5.750216098058791, "global_step": 49349, "epoch": 1174, "val_loss": 66280.03125} {"train_loss": -5.745090961456299, "global_step": 49350, "epoch": 1175} {"train_loss": -5.830950736999512, "global_step": 49351, "epoch": 1175} {"train_loss": -5.7978692054748535, "global_step": 49352, "epoch": 1175} {"train_loss": -5.800022602081299, "global_step": 49353, "epoch": 1175} {"train_loss": -5.743312835693359, "global_step": 49354, "epoch": 1175} {"train_loss": -5.808492183685303, "global_step": 49355, "epoch": 1175} {"train_loss": -5.838918685913086, "global_step": 49356, "epoch": 1175} {"train_loss": -5.691774368286133, "global_step": 49357, "epoch": 1175} {"train_loss": -5.839956283569336, "global_step": 49358, "epoch": 1175} {"train_loss": -5.772228717803955, "global_step": 49359, "epoch": 1175} {"train_loss": -5.693317413330078, "global_step": 49360, "epoch": 1175} {"train_loss": -5.888254165649414, "global_step": 49361, "epoch": 1175} {"train_loss": -5.897833347320557, "global_step": 49362, "epoch": 1175} {"train_loss": -5.777594566345215, "global_step": 49363, "epoch": 1175} {"train_loss": -5.722742080688477, "global_step": 49364, "epoch": 1175} {"train_loss": -5.6810102462768555, "global_step": 49365, "epoch": 1175} {"train_loss": -5.737549781799316, "global_step": 49366, "epoch": 1175} {"train_loss": -5.664753437042236, "global_step": 49367, "epoch": 1175} {"train_loss": -5.6555352210998535, "global_step": 49368, "epoch": 1175} {"train_loss": -5.867831230163574, "global_step": 49369, "epoch": 1175} {"train_loss": -5.818078517913818, "global_step": 49370, "epoch": 1175} {"train_loss": -5.796643257141113, "global_step": 49371, "epoch": 1175} {"train_loss": -5.7290143966674805, "global_step": 49372, "epoch": 1175} {"train_loss": -5.681682586669922, "global_step": 49373, "epoch": 1175} {"train_loss": -5.7671356201171875, "global_step": 49374, "epoch": 1175} {"train_loss": -5.705759525299072, "global_step": 49375, "epoch": 1175} {"train_loss": -5.8414459228515625, "global_step": 49376, "epoch": 1175} {"train_loss": -5.732974052429199, "global_step": 49377, "epoch": 1175} {"train_loss": -5.725785732269287, "global_step": 49378, "epoch": 1175} {"train_loss": -5.872393608093262, "global_step": 49379, "epoch": 1175} {"train_loss": -5.860119342803955, "global_step": 49380, "epoch": 1175} {"train_loss": -5.801775932312012, "global_step": 49381, "epoch": 1175} {"train_loss": -5.639591217041016, "global_step": 49382, "epoch": 1175} {"train_loss": -5.689013481140137, "global_step": 49383, "epoch": 1175} {"train_loss": -5.729250431060791, "global_step": 49384, "epoch": 1175} {"train_loss": -5.747135639190674, "global_step": 49385, "epoch": 1175} {"train_loss": -5.879292011260986, "global_step": 49386, "epoch": 1175} {"train_loss": -5.846814155578613, "global_step": 49387, "epoch": 1175} {"train_loss": -5.776728630065918, "global_step": 49388, "epoch": 1175} {"train_loss": -5.921835422515869, "global_step": 49389, "epoch": 1175} {"train_loss": -5.805140495300293, "global_step": 49390, "epoch": 1175} {"train_loss": -5.778495720454624, "global_step": 49391, "epoch": 1175, "val_loss": 66076.7578125} {"train_loss": -5.66646146774292, "global_step": 49392, "epoch": 1176} {"train_loss": -5.692630767822266, "global_step": 49393, "epoch": 1176} {"train_loss": -5.760122299194336, "global_step": 49394, "epoch": 1176} {"train_loss": -5.856610298156738, "global_step": 49395, "epoch": 1176} {"train_loss": -5.939949035644531, "global_step": 49396, "epoch": 1176} {"train_loss": -5.677151679992676, "global_step": 49397, "epoch": 1176} {"train_loss": -5.668373107910156, "global_step": 49398, "epoch": 1176} {"train_loss": -5.73292350769043, "global_step": 49399, "epoch": 1176} {"train_loss": -5.7512006759643555, "global_step": 49400, "epoch": 1176} {"train_loss": -5.776242256164551, "global_step": 49401, "epoch": 1176} {"train_loss": -5.774764537811279, "global_step": 49402, "epoch": 1176} {"train_loss": -5.698406219482422, "global_step": 49403, "epoch": 1176} {"train_loss": -5.707086563110352, "global_step": 49404, "epoch": 1176} {"train_loss": -5.76448917388916, "global_step": 49405, "epoch": 1176} {"train_loss": -5.735630035400391, "global_step": 49406, "epoch": 1176} {"train_loss": -5.786857604980469, "global_step": 49407, "epoch": 1176} {"train_loss": -5.791114807128906, "global_step": 49408, "epoch": 1176} {"train_loss": -5.767134189605713, "global_step": 49409, "epoch": 1176} {"train_loss": -5.759181976318359, "global_step": 49410, "epoch": 1176} {"train_loss": -5.704117298126221, "global_step": 49411, "epoch": 1176} {"train_loss": -5.722714424133301, "global_step": 49412, "epoch": 1176} {"train_loss": -5.790273666381836, "global_step": 49413, "epoch": 1176} {"train_loss": -5.792987823486328, "global_step": 49414, "epoch": 1176} {"train_loss": -5.693978309631348, "global_step": 49415, "epoch": 1176} {"train_loss": -5.74462366104126, "global_step": 49416, "epoch": 1176} {"train_loss": -5.796076774597168, "global_step": 49417, "epoch": 1176} {"train_loss": -5.688689231872559, "global_step": 49418, "epoch": 1176} {"train_loss": -5.766037940979004, "global_step": 49419, "epoch": 1176} {"train_loss": -5.73857307434082, "global_step": 49420, "epoch": 1176} {"train_loss": -5.784852027893066, "global_step": 49421, "epoch": 1176} {"train_loss": -5.79783821105957, "global_step": 49422, "epoch": 1176} {"train_loss": -5.712039470672607, "global_step": 49423, "epoch": 1176} {"train_loss": -5.799805164337158, "global_step": 49424, "epoch": 1176} {"train_loss": -5.621001243591309, "global_step": 49425, "epoch": 1176} {"train_loss": -5.7240824699401855, "global_step": 49426, "epoch": 1176} {"train_loss": -5.9204864501953125, "global_step": 49427, "epoch": 1176} {"train_loss": -5.71272611618042, "global_step": 49428, "epoch": 1176} {"train_loss": -5.785280227661133, "global_step": 49429, "epoch": 1176} {"train_loss": -5.9068450927734375, "global_step": 49430, "epoch": 1176} {"train_loss": -5.75792121887207, "global_step": 49431, "epoch": 1176} {"train_loss": -5.783144950866699, "global_step": 49432, "epoch": 1176} {"train_loss": -5.7579740796770364, "global_step": 49433, "epoch": 1176, "val_loss": 66178.515625} {"train_loss": -5.828897953033447, "global_step": 49434, "epoch": 1177} {"train_loss": -5.885336875915527, "global_step": 49435, "epoch": 1177} {"train_loss": -5.801704406738281, "global_step": 49436, "epoch": 1177} {"train_loss": -5.718828201293945, "global_step": 49437, "epoch": 1177} {"train_loss": -5.850471019744873, "global_step": 49438, "epoch": 1177} {"train_loss": -5.7041425704956055, "global_step": 49439, "epoch": 1177} {"train_loss": -5.811519145965576, "global_step": 49440, "epoch": 1177} {"train_loss": -5.685669898986816, "global_step": 49441, "epoch": 1177} {"train_loss": -5.754607200622559, "global_step": 49442, "epoch": 1177} {"train_loss": -5.765023231506348, "global_step": 49443, "epoch": 1177} {"train_loss": -5.694055557250977, "global_step": 49444, "epoch": 1177} {"train_loss": -5.830510139465332, "global_step": 49445, "epoch": 1177} {"train_loss": -5.709612846374512, "global_step": 49446, "epoch": 1177} {"train_loss": -5.702671527862549, "global_step": 49447, "epoch": 1177} {"train_loss": -5.721743583679199, "global_step": 49448, "epoch": 1177} {"train_loss": -5.728227615356445, "global_step": 49449, "epoch": 1177} {"train_loss": -5.686949729919434, "global_step": 49450, "epoch": 1177} {"train_loss": -5.6923017501831055, "global_step": 49451, "epoch": 1177} {"train_loss": -5.870064735412598, "global_step": 49452, "epoch": 1177} {"train_loss": -5.655256271362305, "global_step": 49453, "epoch": 1177} {"train_loss": -5.799164772033691, "global_step": 49454, "epoch": 1177} {"train_loss": -5.674700736999512, "global_step": 49455, "epoch": 1177} {"train_loss": -5.754627704620361, "global_step": 49456, "epoch": 1177} {"train_loss": -5.758814334869385, "global_step": 49457, "epoch": 1177} {"train_loss": -5.6895527839660645, "global_step": 49458, "epoch": 1177} {"train_loss": -5.847417831420898, "global_step": 49459, "epoch": 1177} {"train_loss": -5.648650169372559, "global_step": 49460, "epoch": 1177} {"train_loss": -5.740141868591309, "global_step": 49461, "epoch": 1177} {"train_loss": -5.678310394287109, "global_step": 49462, "epoch": 1177} {"train_loss": -5.7134552001953125, "global_step": 49463, "epoch": 1177} {"train_loss": -5.73433780670166, "global_step": 49464, "epoch": 1177} {"train_loss": -5.685137748718262, "global_step": 49465, "epoch": 1177} {"train_loss": -5.755218505859375, "global_step": 49466, "epoch": 1177} {"train_loss": -5.671209335327148, "global_step": 49467, "epoch": 1177} {"train_loss": -5.753975868225098, "global_step": 49468, "epoch": 1177} {"train_loss": -5.648683547973633, "global_step": 49469, "epoch": 1177} {"train_loss": -5.782240867614746, "global_step": 49470, "epoch": 1177} {"train_loss": -5.630664825439453, "global_step": 49471, "epoch": 1177} {"train_loss": -5.720739841461182, "global_step": 49472, "epoch": 1177} {"train_loss": -5.679262161254883, "global_step": 49473, "epoch": 1177} {"train_loss": -5.724631309509277, "global_step": 49474, "epoch": 1177} {"train_loss": -5.739656164532616, "global_step": 49475, "epoch": 1177, "val_loss": 66261.515625} {"train_loss": -5.836919784545898, "global_step": 49476, "epoch": 1178} {"train_loss": -5.846051216125488, "global_step": 49477, "epoch": 1178} {"train_loss": -5.629795074462891, "global_step": 49478, "epoch": 1178} {"train_loss": -5.781739234924316, "global_step": 49479, "epoch": 1178} {"train_loss": -5.717187881469727, "global_step": 49480, "epoch": 1178} {"train_loss": -5.719381809234619, "global_step": 49481, "epoch": 1178} {"train_loss": -5.733506202697754, "global_step": 49482, "epoch": 1178} {"train_loss": -5.686213970184326, "global_step": 49483, "epoch": 1178} {"train_loss": -5.750542640686035, "global_step": 49484, "epoch": 1178} {"train_loss": -5.76105260848999, "global_step": 49485, "epoch": 1178} {"train_loss": -5.82253360748291, "global_step": 49486, "epoch": 1178} {"train_loss": -5.773479461669922, "global_step": 49487, "epoch": 1178} {"train_loss": -5.888028621673584, "global_step": 49488, "epoch": 1178} {"train_loss": -5.711389541625977, "global_step": 49489, "epoch": 1178} {"train_loss": -5.777837753295898, "global_step": 49490, "epoch": 1178} {"train_loss": -5.740005970001221, "global_step": 49491, "epoch": 1178} {"train_loss": -5.780864715576172, "global_step": 49492, "epoch": 1178} {"train_loss": -5.748434066772461, "global_step": 49493, "epoch": 1178} {"train_loss": -5.7075934410095215, "global_step": 49494, "epoch": 1178} {"train_loss": -5.7974700927734375, "global_step": 49495, "epoch": 1178} {"train_loss": -5.70306396484375, "global_step": 49496, "epoch": 1178} {"train_loss": -5.69419002532959, "global_step": 49497, "epoch": 1178} {"train_loss": -5.844914436340332, "global_step": 49498, "epoch": 1178} {"train_loss": -5.680197238922119, "global_step": 49499, "epoch": 1178} {"train_loss": -5.623685359954834, "global_step": 49500, "epoch": 1178} {"train_loss": -5.738960266113281, "global_step": 49501, "epoch": 1178} {"train_loss": -5.7911176681518555, "global_step": 49502, "epoch": 1178} {"train_loss": -5.720897197723389, "global_step": 49503, "epoch": 1178} {"train_loss": -5.771481513977051, "global_step": 49504, "epoch": 1178} {"train_loss": -5.816555500030518, "global_step": 49505, "epoch": 1178} {"train_loss": -5.81889533996582, "global_step": 49506, "epoch": 1178} {"train_loss": -5.669518947601318, "global_step": 49507, "epoch": 1178} {"train_loss": -5.83464241027832, "global_step": 49508, "epoch": 1178} {"train_loss": -5.769754886627197, "global_step": 49509, "epoch": 1178} {"train_loss": -5.800271034240723, "global_step": 49510, "epoch": 1178} {"train_loss": -5.8169355392456055, "global_step": 49511, "epoch": 1178} {"train_loss": -5.751759052276611, "global_step": 49512, "epoch": 1178} {"train_loss": -5.748411178588867, "global_step": 49513, "epoch": 1178} {"train_loss": -5.680410385131836, "global_step": 49514, "epoch": 1178} {"train_loss": -5.633010387420654, "global_step": 49515, "epoch": 1178} {"train_loss": -5.71592378616333, "global_step": 49516, "epoch": 1178} {"train_loss": -5.751733053298223, "global_step": 49517, "epoch": 1178, "val_loss": 66206.375} {"train_loss": -5.818470001220703, "global_step": 49518, "epoch": 1179} {"train_loss": -5.641269683837891, "global_step": 49519, "epoch": 1179} {"train_loss": -5.664492130279541, "global_step": 49520, "epoch": 1179} {"train_loss": -5.807271957397461, "global_step": 49521, "epoch": 1179} {"train_loss": -5.706991195678711, "global_step": 49522, "epoch": 1179} {"train_loss": -5.753802299499512, "global_step": 49523, "epoch": 1179} {"train_loss": -5.736540794372559, "global_step": 49524, "epoch": 1179} {"train_loss": -5.727394104003906, "global_step": 49525, "epoch": 1179} {"train_loss": -5.811587333679199, "global_step": 49526, "epoch": 1179} {"train_loss": -5.716219902038574, "global_step": 49527, "epoch": 1179} {"train_loss": -5.57470178604126, "global_step": 49528, "epoch": 1179} {"train_loss": -5.6888909339904785, "global_step": 49529, "epoch": 1179} {"train_loss": -5.743441104888916, "global_step": 49530, "epoch": 1179} {"train_loss": -5.760028839111328, "global_step": 49531, "epoch": 1179} {"train_loss": -5.781490325927734, "global_step": 49532, "epoch": 1179} {"train_loss": -5.733948707580566, "global_step": 49533, "epoch": 1179} {"train_loss": -5.768878936767578, "global_step": 49534, "epoch": 1179} {"train_loss": -5.673460960388184, "global_step": 49535, "epoch": 1179} {"train_loss": -5.675121784210205, "global_step": 49536, "epoch": 1179} {"train_loss": -5.736497402191162, "global_step": 49537, "epoch": 1179} {"train_loss": -5.710303783416748, "global_step": 49538, "epoch": 1179} {"train_loss": -5.56063175201416, "global_step": 49539, "epoch": 1179} {"train_loss": -5.738201141357422, "global_step": 49540, "epoch": 1179} {"train_loss": -5.702924728393555, "global_step": 49541, "epoch": 1179} {"train_loss": -5.736784934997559, "global_step": 49542, "epoch": 1179} {"train_loss": -5.7816572189331055, "global_step": 49543, "epoch": 1179} {"train_loss": -5.826683044433594, "global_step": 49544, "epoch": 1179} {"train_loss": -5.687130451202393, "global_step": 49545, "epoch": 1179} {"train_loss": -5.65887451171875, "global_step": 49546, "epoch": 1179} {"train_loss": -5.784651756286621, "global_step": 49547, "epoch": 1179} {"train_loss": -5.792153358459473, "global_step": 49548, "epoch": 1179} {"train_loss": -5.719395637512207, "global_step": 49549, "epoch": 1179} {"train_loss": -5.855961799621582, "global_step": 49550, "epoch": 1179} {"train_loss": -5.676884651184082, "global_step": 49551, "epoch": 1179} {"train_loss": -5.793035507202148, "global_step": 49552, "epoch": 1179} {"train_loss": -5.787753105163574, "global_step": 49553, "epoch": 1179} {"train_loss": -5.840347766876221, "global_step": 49554, "epoch": 1179} {"train_loss": -5.7276716232299805, "global_step": 49555, "epoch": 1179} {"train_loss": -5.714437484741211, "global_step": 49556, "epoch": 1179} {"train_loss": -5.8088603019714355, "global_step": 49557, "epoch": 1179} {"train_loss": -5.807784557342529, "global_step": 49558, "epoch": 1179} {"train_loss": -5.737018006188529, "global_step": 49559, "epoch": 1179, "val_loss": 66414.078125} {"train_loss": -5.775574684143066, "global_step": 49560, "epoch": 1180} {"train_loss": -5.911716938018799, "global_step": 49561, "epoch": 1180} {"train_loss": -5.755558967590332, "global_step": 49562, "epoch": 1180} {"train_loss": -5.694037437438965, "global_step": 49563, "epoch": 1180} {"train_loss": -5.782172203063965, "global_step": 49564, "epoch": 1180} {"train_loss": -5.770806789398193, "global_step": 49565, "epoch": 1180} {"train_loss": -5.777937889099121, "global_step": 49566, "epoch": 1180} {"train_loss": -5.638935565948486, "global_step": 49567, "epoch": 1180} {"train_loss": -5.807258605957031, "global_step": 49568, "epoch": 1180} {"train_loss": -5.654008388519287, "global_step": 49569, "epoch": 1180} {"train_loss": -5.756363391876221, "global_step": 49570, "epoch": 1180} {"train_loss": -5.781227111816406, "global_step": 49571, "epoch": 1180} {"train_loss": -5.832368850708008, "global_step": 49572, "epoch": 1180} {"train_loss": -5.833388328552246, "global_step": 49573, "epoch": 1180} {"train_loss": -5.828979015350342, "global_step": 49574, "epoch": 1180} {"train_loss": -5.936264991760254, "global_step": 49575, "epoch": 1180} {"train_loss": -5.725653648376465, "global_step": 49576, "epoch": 1180} {"train_loss": -5.791876316070557, "global_step": 49577, "epoch": 1180} {"train_loss": -5.938298225402832, "global_step": 49578, "epoch": 1180} {"train_loss": -5.770766258239746, "global_step": 49579, "epoch": 1180} {"train_loss": -5.810384750366211, "global_step": 49580, "epoch": 1180} {"train_loss": -5.821985244750977, "global_step": 49581, "epoch": 1180} {"train_loss": -5.784613609313965, "global_step": 49582, "epoch": 1180} {"train_loss": -5.708283424377441, "global_step": 49583, "epoch": 1180} {"train_loss": -5.747698783874512, "global_step": 49584, "epoch": 1180} {"train_loss": -5.772211074829102, "global_step": 49585, "epoch": 1180} {"train_loss": -5.765220642089844, "global_step": 49586, "epoch": 1180} {"train_loss": -5.753931045532227, "global_step": 49587, "epoch": 1180} {"train_loss": -5.898459434509277, "global_step": 49588, "epoch": 1180} {"train_loss": -5.828892230987549, "global_step": 49589, "epoch": 1180} {"train_loss": -5.759506702423096, "global_step": 49590, "epoch": 1180} {"train_loss": -5.726208686828613, "global_step": 49591, "epoch": 1180} {"train_loss": -5.756738662719727, "global_step": 49592, "epoch": 1180} {"train_loss": -5.6914381980896, "global_step": 49593, "epoch": 1180} {"train_loss": -5.715786933898926, "global_step": 49594, "epoch": 1180} {"train_loss": -5.584770679473877, "global_step": 49595, "epoch": 1180} {"train_loss": -5.641770362854004, "global_step": 49596, "epoch": 1180} {"train_loss": -5.64139461517334, "global_step": 49597, "epoch": 1180} {"train_loss": -5.733480453491211, "global_step": 49598, "epoch": 1180} {"train_loss": -5.915295600891113, "global_step": 49599, "epoch": 1180} {"train_loss": -5.769232749938965, "global_step": 49600, "epoch": 1180} {"train_loss": -5.769512562524705, "global_step": 49601, "epoch": 1180, "val_loss": 66200.515625} {"train_loss": -5.786015510559082, "global_step": 49602, "epoch": 1181} {"train_loss": -5.757635593414307, "global_step": 49603, "epoch": 1181} {"train_loss": -5.805474281311035, "global_step": 49604, "epoch": 1181} {"train_loss": -5.690479278564453, "global_step": 49605, "epoch": 1181} {"train_loss": -5.769288063049316, "global_step": 49606, "epoch": 1181} {"train_loss": -5.804184436798096, "global_step": 49607, "epoch": 1181} {"train_loss": -5.709906578063965, "global_step": 49608, "epoch": 1181} {"train_loss": -5.6099677085876465, "global_step": 49609, "epoch": 1181} {"train_loss": -5.7987775802612305, "global_step": 49610, "epoch": 1181} {"train_loss": -5.806371688842773, "global_step": 49611, "epoch": 1181} {"train_loss": -5.741684913635254, "global_step": 49612, "epoch": 1181} {"train_loss": -5.826184272766113, "global_step": 49613, "epoch": 1181} {"train_loss": -5.690598487854004, "global_step": 49614, "epoch": 1181} {"train_loss": -5.731052875518799, "global_step": 49615, "epoch": 1181} {"train_loss": -5.75302267074585, "global_step": 49616, "epoch": 1181} {"train_loss": -5.754015922546387, "global_step": 49617, "epoch": 1181} {"train_loss": -5.721742630004883, "global_step": 49618, "epoch": 1181} {"train_loss": -5.8618597984313965, "global_step": 49619, "epoch": 1181} {"train_loss": -5.602116584777832, "global_step": 49620, "epoch": 1181} {"train_loss": -5.801599025726318, "global_step": 49621, "epoch": 1181} {"train_loss": -5.787304878234863, "global_step": 49622, "epoch": 1181} {"train_loss": -5.78501558303833, "global_step": 49623, "epoch": 1181} {"train_loss": -5.799014091491699, "global_step": 49624, "epoch": 1181} {"train_loss": -5.7704548835754395, "global_step": 49625, "epoch": 1181} {"train_loss": -5.729306221008301, "global_step": 49626, "epoch": 1181} {"train_loss": -5.791765213012695, "global_step": 49627, "epoch": 1181} {"train_loss": -5.68300199508667, "global_step": 49628, "epoch": 1181} {"train_loss": -5.693472862243652, "global_step": 49629, "epoch": 1181} {"train_loss": -5.663741111755371, "global_step": 49630, "epoch": 1181} {"train_loss": -5.756113052368164, "global_step": 49631, "epoch": 1181} {"train_loss": -5.790722846984863, "global_step": 49632, "epoch": 1181} {"train_loss": -5.724357604980469, "global_step": 49633, "epoch": 1181} {"train_loss": -5.712527751922607, "global_step": 49634, "epoch": 1181} {"train_loss": -5.732781887054443, "global_step": 49635, "epoch": 1181} {"train_loss": -5.695638179779053, "global_step": 49636, "epoch": 1181} {"train_loss": -5.820362091064453, "global_step": 49637, "epoch": 1181} {"train_loss": -5.789754390716553, "global_step": 49638, "epoch": 1181} {"train_loss": -5.670804977416992, "global_step": 49639, "epoch": 1181} {"train_loss": -5.6203532218933105, "global_step": 49640, "epoch": 1181} {"train_loss": -5.734490394592285, "global_step": 49641, "epoch": 1181} {"train_loss": -5.46744966506958, "global_step": 49642, "epoch": 1181} {"train_loss": -5.73483259337289, "global_step": 49643, "epoch": 1181, "val_loss": 66422.2578125} {"train_loss": -5.594246864318848, "global_step": 49644, "epoch": 1182} {"train_loss": -5.633377552032471, "global_step": 49645, "epoch": 1182} {"train_loss": -5.537080764770508, "global_step": 49646, "epoch": 1182} {"train_loss": -5.72438907623291, "global_step": 49647, "epoch": 1182} {"train_loss": -5.6367340087890625, "global_step": 49648, "epoch": 1182} {"train_loss": -5.748411178588867, "global_step": 49649, "epoch": 1182} {"train_loss": -5.742647171020508, "global_step": 49650, "epoch": 1182} {"train_loss": -5.700170516967773, "global_step": 49651, "epoch": 1182} {"train_loss": -5.772809982299805, "global_step": 49652, "epoch": 1182} {"train_loss": -5.659109592437744, "global_step": 49653, "epoch": 1182} {"train_loss": -5.731601715087891, "global_step": 49654, "epoch": 1182} {"train_loss": -5.773775100708008, "global_step": 49655, "epoch": 1182} {"train_loss": -5.853376865386963, "global_step": 49656, "epoch": 1182} {"train_loss": -5.853591442108154, "global_step": 49657, "epoch": 1182} {"train_loss": -5.67460823059082, "global_step": 49658, "epoch": 1182} {"train_loss": -5.606496810913086, "global_step": 49659, "epoch": 1182} {"train_loss": -5.658981800079346, "global_step": 49660, "epoch": 1182} {"train_loss": -5.752720832824707, "global_step": 49661, "epoch": 1182} {"train_loss": -5.659340858459473, "global_step": 49662, "epoch": 1182} {"train_loss": -5.647913932800293, "global_step": 49663, "epoch": 1182} {"train_loss": -5.691037178039551, "global_step": 49664, "epoch": 1182} {"train_loss": -5.646086692810059, "global_step": 49665, "epoch": 1182} {"train_loss": -5.7026686668396, "global_step": 49666, "epoch": 1182} {"train_loss": -5.7198710441589355, "global_step": 49667, "epoch": 1182} {"train_loss": -5.842379570007324, "global_step": 49668, "epoch": 1182} {"train_loss": -5.65211296081543, "global_step": 49669, "epoch": 1182} {"train_loss": -5.764840126037598, "global_step": 49670, "epoch": 1182} {"train_loss": -5.772169589996338, "global_step": 49671, "epoch": 1182} {"train_loss": -5.665691375732422, "global_step": 49672, "epoch": 1182} {"train_loss": -5.771783828735352, "global_step": 49673, "epoch": 1182} {"train_loss": -5.628798484802246, "global_step": 49674, "epoch": 1182} {"train_loss": -5.713387966156006, "global_step": 49675, "epoch": 1182} {"train_loss": -5.817929267883301, "global_step": 49676, "epoch": 1182} {"train_loss": -5.723398208618164, "global_step": 49677, "epoch": 1182} {"train_loss": -5.786472320556641, "global_step": 49678, "epoch": 1182} {"train_loss": -5.8105268478393555, "global_step": 49679, "epoch": 1182} {"train_loss": -5.592050552368164, "global_step": 49680, "epoch": 1182} {"train_loss": -5.726963043212891, "global_step": 49681, "epoch": 1182} {"train_loss": -5.6726393699646, "global_step": 49682, "epoch": 1182} {"train_loss": -5.754604339599609, "global_step": 49683, "epoch": 1182} {"train_loss": -5.693624019622803, "global_step": 49684, "epoch": 1182} {"train_loss": -5.708769752865746, "global_step": 49685, "epoch": 1182, "val_loss": 66234.328125} {"train_loss": -5.819279670715332, "global_step": 49686, "epoch": 1183} {"train_loss": -5.713054656982422, "global_step": 49687, "epoch": 1183} {"train_loss": -5.672893524169922, "global_step": 49688, "epoch": 1183} {"train_loss": -5.733193874359131, "global_step": 49689, "epoch": 1183} {"train_loss": -5.693997383117676, "global_step": 49690, "epoch": 1183} {"train_loss": -5.651226997375488, "global_step": 49691, "epoch": 1183} {"train_loss": -5.642963409423828, "global_step": 49692, "epoch": 1183} {"train_loss": -5.604331016540527, "global_step": 49693, "epoch": 1183} {"train_loss": -5.838509559631348, "global_step": 49694, "epoch": 1183} {"train_loss": -5.739157199859619, "global_step": 49695, "epoch": 1183} {"train_loss": -5.699366569519043, "global_step": 49696, "epoch": 1183} {"train_loss": -5.716125011444092, "global_step": 49697, "epoch": 1183} {"train_loss": -5.88004732131958, "global_step": 49698, "epoch": 1183} {"train_loss": -5.694127082824707, "global_step": 49699, "epoch": 1183} {"train_loss": -5.776007652282715, "global_step": 49700, "epoch": 1183} {"train_loss": -5.821651935577393, "global_step": 49701, "epoch": 1183} {"train_loss": -5.764894008636475, "global_step": 49702, "epoch": 1183} {"train_loss": -5.876993179321289, "global_step": 49703, "epoch": 1183} {"train_loss": -5.822665691375732, "global_step": 49704, "epoch": 1183} {"train_loss": -5.769336700439453, "global_step": 49705, "epoch": 1183} {"train_loss": -5.805436611175537, "global_step": 49706, "epoch": 1183} {"train_loss": -5.756711959838867, "global_step": 49707, "epoch": 1183} {"train_loss": -5.765865325927734, "global_step": 49708, "epoch": 1183} {"train_loss": -5.700423717498779, "global_step": 49709, "epoch": 1183} {"train_loss": -5.783949851989746, "global_step": 49710, "epoch": 1183} {"train_loss": -5.664422512054443, "global_step": 49711, "epoch": 1183} {"train_loss": -5.806850433349609, "global_step": 49712, "epoch": 1183} {"train_loss": -5.751924514770508, "global_step": 49713, "epoch": 1183} {"train_loss": -5.837135314941406, "global_step": 49714, "epoch": 1183} {"train_loss": -5.8254170417785645, "global_step": 49715, "epoch": 1183} {"train_loss": -5.76080322265625, "global_step": 49716, "epoch": 1183} {"train_loss": -5.758797645568848, "global_step": 49717, "epoch": 1183} {"train_loss": -5.751492500305176, "global_step": 49718, "epoch": 1183} {"train_loss": -5.886466026306152, "global_step": 49719, "epoch": 1183} {"train_loss": -5.7691650390625, "global_step": 49720, "epoch": 1183} {"train_loss": -5.843897819519043, "global_step": 49721, "epoch": 1183} {"train_loss": -5.8549299240112305, "global_step": 49722, "epoch": 1183} {"train_loss": -5.766841411590576, "global_step": 49723, "epoch": 1183} {"train_loss": -5.709039688110352, "global_step": 49724, "epoch": 1183} {"train_loss": -5.764801979064941, "global_step": 49725, "epoch": 1183} {"train_loss": -5.809749603271484, "global_step": 49726, "epoch": 1183} {"train_loss": -5.762013492130098, "global_step": 49727, "epoch": 1183, "val_loss": 66059.890625} {"train_loss": -5.8009562492370605, "global_step": 49728, "epoch": 1184} {"train_loss": -5.791589260101318, "global_step": 49729, "epoch": 1184} {"train_loss": -5.641419410705566, "global_step": 49730, "epoch": 1184} {"train_loss": -5.765307903289795, "global_step": 49731, "epoch": 1184} {"train_loss": -5.791252136230469, "global_step": 49732, "epoch": 1184} {"train_loss": -5.721606254577637, "global_step": 49733, "epoch": 1184} {"train_loss": -5.6666975021362305, "global_step": 49734, "epoch": 1184} {"train_loss": -5.673789024353027, "global_step": 49735, "epoch": 1184} {"train_loss": -5.716437339782715, "global_step": 49736, "epoch": 1184} {"train_loss": -5.877224922180176, "global_step": 49737, "epoch": 1184} {"train_loss": -5.832571983337402, "global_step": 49738, "epoch": 1184} {"train_loss": -5.736074447631836, "global_step": 49739, "epoch": 1184} {"train_loss": -5.592148780822754, "global_step": 49740, "epoch": 1184} {"train_loss": -5.856377124786377, "global_step": 49741, "epoch": 1184} {"train_loss": -5.6604533195495605, "global_step": 49742, "epoch": 1184} {"train_loss": -5.71627950668335, "global_step": 49743, "epoch": 1184} {"train_loss": -5.720879554748535, "global_step": 49744, "epoch": 1184} {"train_loss": -5.667701721191406, "global_step": 49745, "epoch": 1184} {"train_loss": -5.65671443939209, "global_step": 49746, "epoch": 1184} {"train_loss": -5.818639755249023, "global_step": 49747, "epoch": 1184} {"train_loss": -5.762728691101074, "global_step": 49748, "epoch": 1184} {"train_loss": -5.754316329956055, "global_step": 49749, "epoch": 1184} {"train_loss": -5.673358917236328, "global_step": 49750, "epoch": 1184} {"train_loss": -5.779397964477539, "global_step": 49751, "epoch": 1184} {"train_loss": -5.656746864318848, "global_step": 49752, "epoch": 1184} {"train_loss": -5.701566696166992, "global_step": 49753, "epoch": 1184} {"train_loss": -5.802581310272217, "global_step": 49754, "epoch": 1184} {"train_loss": -5.74617338180542, "global_step": 49755, "epoch": 1184} {"train_loss": -5.777961730957031, "global_step": 49756, "epoch": 1184} {"train_loss": -5.727447032928467, "global_step": 49757, "epoch": 1184} {"train_loss": -5.743213653564453, "global_step": 49758, "epoch": 1184} {"train_loss": -5.727222919464111, "global_step": 49759, "epoch": 1184} {"train_loss": -5.806198596954346, "global_step": 49760, "epoch": 1184} {"train_loss": -5.6707258224487305, "global_step": 49761, "epoch": 1184} {"train_loss": -5.741206169128418, "global_step": 49762, "epoch": 1184} {"train_loss": -5.773735046386719, "global_step": 49763, "epoch": 1184} {"train_loss": -5.655247688293457, "global_step": 49764, "epoch": 1184} {"train_loss": -5.761763572692871, "global_step": 49765, "epoch": 1184} {"train_loss": -5.799144744873047, "global_step": 49766, "epoch": 1184} {"train_loss": -5.663133144378662, "global_step": 49767, "epoch": 1184} {"train_loss": -5.690126419067383, "global_step": 49768, "epoch": 1184} {"train_loss": -5.735392649968465, "global_step": 49769, "epoch": 1184, "val_loss": 66354.5546875} {"train_loss": -5.758586883544922, "global_step": 49770, "epoch": 1185} {"train_loss": -5.723738670349121, "global_step": 49771, "epoch": 1185} {"train_loss": -5.789368152618408, "global_step": 49772, "epoch": 1185} {"train_loss": -5.7021708488464355, "global_step": 49773, "epoch": 1185} {"train_loss": -5.655844211578369, "global_step": 49774, "epoch": 1185} {"train_loss": -5.673009395599365, "global_step": 49775, "epoch": 1185} {"train_loss": -5.578224182128906, "global_step": 49776, "epoch": 1185} {"train_loss": -5.707275867462158, "global_step": 49777, "epoch": 1185} {"train_loss": -5.65164041519165, "global_step": 49778, "epoch": 1185} {"train_loss": -5.543100357055664, "global_step": 49779, "epoch": 1185} {"train_loss": -5.781823635101318, "global_step": 49780, "epoch": 1185} {"train_loss": -5.61290168762207, "global_step": 49781, "epoch": 1185} {"train_loss": -5.571597099304199, "global_step": 49782, "epoch": 1185} {"train_loss": -5.824006080627441, "global_step": 49783, "epoch": 1185} {"train_loss": -5.695315837860107, "global_step": 49784, "epoch": 1185} {"train_loss": -5.674903869628906, "global_step": 49785, "epoch": 1185} {"train_loss": -5.7554850578308105, "global_step": 49786, "epoch": 1185} {"train_loss": -5.785775184631348, "global_step": 49787, "epoch": 1185} {"train_loss": -5.810457229614258, "global_step": 49788, "epoch": 1185} {"train_loss": -5.833815574645996, "global_step": 49789, "epoch": 1185} {"train_loss": -5.690064907073975, "global_step": 49790, "epoch": 1185} {"train_loss": -5.790761947631836, "global_step": 49791, "epoch": 1185} {"train_loss": -5.733335494995117, "global_step": 49792, "epoch": 1185} {"train_loss": -5.686318874359131, "global_step": 49793, "epoch": 1185} {"train_loss": -5.787741661071777, "global_step": 49794, "epoch": 1185} {"train_loss": -5.738640785217285, "global_step": 49795, "epoch": 1185} {"train_loss": -5.713715553283691, "global_step": 49796, "epoch": 1185} {"train_loss": -5.718832969665527, "global_step": 49797, "epoch": 1185} {"train_loss": -5.712945461273193, "global_step": 49798, "epoch": 1185} {"train_loss": -5.849992752075195, "global_step": 49799, "epoch": 1185} {"train_loss": -5.800198554992676, "global_step": 49800, "epoch": 1185} {"train_loss": -5.719601631164551, "global_step": 49801, "epoch": 1185} {"train_loss": -5.725093841552734, "global_step": 49802, "epoch": 1185} {"train_loss": -5.8630876541137695, "global_step": 49803, "epoch": 1185} {"train_loss": -5.749185085296631, "global_step": 49804, "epoch": 1185} {"train_loss": -5.768594741821289, "global_step": 49805, "epoch": 1185} {"train_loss": -5.706391334533691, "global_step": 49806, "epoch": 1185} {"train_loss": -5.7056732177734375, "global_step": 49807, "epoch": 1185} {"train_loss": -5.706664085388184, "global_step": 49808, "epoch": 1185} {"train_loss": -5.848540306091309, "global_step": 49809, "epoch": 1185} {"train_loss": -5.759464263916016, "global_step": 49810, "epoch": 1185} {"train_loss": -5.7279796827407115, "global_step": 49811, "epoch": 1185, "val_loss": 66065.390625} {"train_loss": -5.762636661529541, "global_step": 49812, "epoch": 1186} {"train_loss": -5.744704246520996, "global_step": 49813, "epoch": 1186} {"train_loss": -5.69724178314209, "global_step": 49814, "epoch": 1186} {"train_loss": -5.774359703063965, "global_step": 49815, "epoch": 1186} {"train_loss": -5.694490432739258, "global_step": 49816, "epoch": 1186} {"train_loss": -5.711001396179199, "global_step": 49817, "epoch": 1186} {"train_loss": -5.791467666625977, "global_step": 49818, "epoch": 1186} {"train_loss": -5.772810935974121, "global_step": 49819, "epoch": 1186} {"train_loss": -5.692567348480225, "global_step": 49820, "epoch": 1186} {"train_loss": -5.782839775085449, "global_step": 49821, "epoch": 1186} {"train_loss": -5.807314872741699, "global_step": 49822, "epoch": 1186} {"train_loss": -5.867450714111328, "global_step": 49823, "epoch": 1186} {"train_loss": -5.869448661804199, "global_step": 49824, "epoch": 1186} {"train_loss": -5.741568565368652, "global_step": 49825, "epoch": 1186} {"train_loss": -5.786031723022461, "global_step": 49826, "epoch": 1186} {"train_loss": -5.774055480957031, "global_step": 49827, "epoch": 1186} {"train_loss": -5.800384521484375, "global_step": 49828, "epoch": 1186} {"train_loss": -5.76910400390625, "global_step": 49829, "epoch": 1186} {"train_loss": -5.766723155975342, "global_step": 49830, "epoch": 1186} {"train_loss": -5.762761116027832, "global_step": 49831, "epoch": 1186} {"train_loss": -5.631570339202881, "global_step": 49832, "epoch": 1186} {"train_loss": -5.721015930175781, "global_step": 49833, "epoch": 1186} {"train_loss": -5.809421539306641, "global_step": 49834, "epoch": 1186} {"train_loss": -5.728273391723633, "global_step": 49835, "epoch": 1186} {"train_loss": -5.819344520568848, "global_step": 49836, "epoch": 1186} {"train_loss": -5.773293495178223, "global_step": 49837, "epoch": 1186} {"train_loss": -5.651556015014648, "global_step": 49838, "epoch": 1186} {"train_loss": -5.766223907470703, "global_step": 49839, "epoch": 1186} {"train_loss": -5.713791847229004, "global_step": 49840, "epoch": 1186} {"train_loss": -5.698419570922852, "global_step": 49841, "epoch": 1186} {"train_loss": -5.589829444885254, "global_step": 49842, "epoch": 1186} {"train_loss": -5.706965923309326, "global_step": 49843, "epoch": 1186} {"train_loss": -5.707313060760498, "global_step": 49844, "epoch": 1186} {"train_loss": -5.689530372619629, "global_step": 49845, "epoch": 1186} {"train_loss": -5.676931858062744, "global_step": 49846, "epoch": 1186} {"train_loss": -5.598785877227783, "global_step": 49847, "epoch": 1186} {"train_loss": -5.899596691131592, "global_step": 49848, "epoch": 1186} {"train_loss": -5.672446250915527, "global_step": 49849, "epoch": 1186} {"train_loss": -5.808992385864258, "global_step": 49850, "epoch": 1186} {"train_loss": -5.706277847290039, "global_step": 49851, "epoch": 1186} {"train_loss": -5.779250144958496, "global_step": 49852, "epoch": 1186} {"train_loss": -5.74422413962228, "global_step": 49853, "epoch": 1186, "val_loss": 66718.1953125} {"train_loss": -5.7680768966674805, "global_step": 49854, "epoch": 1187} {"train_loss": -5.731696128845215, "global_step": 49855, "epoch": 1187} {"train_loss": -5.719661712646484, "global_step": 49856, "epoch": 1187} {"train_loss": -5.82545280456543, "global_step": 49857, "epoch": 1187} {"train_loss": -5.724867820739746, "global_step": 49858, "epoch": 1187} {"train_loss": -5.761666297912598, "global_step": 49859, "epoch": 1187} {"train_loss": -5.726994037628174, "global_step": 49860, "epoch": 1187} {"train_loss": -5.754480361938477, "global_step": 49861, "epoch": 1187} {"train_loss": -5.750922203063965, "global_step": 49862, "epoch": 1187} {"train_loss": -5.745648384094238, "global_step": 49863, "epoch": 1187} {"train_loss": -5.7111406326293945, "global_step": 49864, "epoch": 1187} {"train_loss": -5.786272048950195, "global_step": 49865, "epoch": 1187} {"train_loss": -5.770864009857178, "global_step": 49866, "epoch": 1187} {"train_loss": -5.734273910522461, "global_step": 49867, "epoch": 1187} {"train_loss": -5.779757499694824, "global_step": 49868, "epoch": 1187} {"train_loss": -5.570864677429199, "global_step": 49869, "epoch": 1187} {"train_loss": -5.824113368988037, "global_step": 49870, "epoch": 1187} {"train_loss": -5.705783367156982, "global_step": 49871, "epoch": 1187} {"train_loss": -5.6911115646362305, "global_step": 49872, "epoch": 1187} {"train_loss": -5.8025007247924805, "global_step": 49873, "epoch": 1187} {"train_loss": -5.612900257110596, "global_step": 49874, "epoch": 1187} {"train_loss": -5.749988079071045, "global_step": 49875, "epoch": 1187} {"train_loss": -5.849837303161621, "global_step": 49876, "epoch": 1187} {"train_loss": -5.693992614746094, "global_step": 49877, "epoch": 1187} {"train_loss": -5.7240471839904785, "global_step": 49878, "epoch": 1187} {"train_loss": -5.728962421417236, "global_step": 49879, "epoch": 1187} {"train_loss": -5.75742769241333, "global_step": 49880, "epoch": 1187} {"train_loss": -5.792890548706055, "global_step": 49881, "epoch": 1187} {"train_loss": -5.664064407348633, "global_step": 49882, "epoch": 1187} {"train_loss": -5.757503986358643, "global_step": 49883, "epoch": 1187} {"train_loss": -5.713648796081543, "global_step": 49884, "epoch": 1187} {"train_loss": -5.708483695983887, "global_step": 49885, "epoch": 1187} {"train_loss": -5.65163516998291, "global_step": 49886, "epoch": 1187} {"train_loss": -5.840575218200684, "global_step": 49887, "epoch": 1187} {"train_loss": -5.725935459136963, "global_step": 49888, "epoch": 1187} {"train_loss": -5.758711814880371, "global_step": 49889, "epoch": 1187} {"train_loss": -5.776269912719727, "global_step": 49890, "epoch": 1187} {"train_loss": -5.672346115112305, "global_step": 49891, "epoch": 1187} {"train_loss": -5.706437587738037, "global_step": 49892, "epoch": 1187} {"train_loss": -5.722644805908203, "global_step": 49893, "epoch": 1187} {"train_loss": -5.6747918128967285, "global_step": 49894, "epoch": 1187} {"train_loss": -5.736455690293085, "global_step": 49895, "epoch": 1187, "val_loss": 66142.734375} {"train_loss": -5.821749687194824, "global_step": 49896, "epoch": 1188} {"train_loss": -5.766035079956055, "global_step": 49897, "epoch": 1188} {"train_loss": -5.763863563537598, "global_step": 49898, "epoch": 1188} {"train_loss": -5.54948616027832, "global_step": 49899, "epoch": 1188} {"train_loss": -5.783600330352783, "global_step": 49900, "epoch": 1188} {"train_loss": -5.81207275390625, "global_step": 49901, "epoch": 1188} {"train_loss": -5.777851104736328, "global_step": 49902, "epoch": 1188} {"train_loss": -5.787520408630371, "global_step": 49903, "epoch": 1188} {"train_loss": -5.708978652954102, "global_step": 49904, "epoch": 1188} {"train_loss": -5.832245349884033, "global_step": 49905, "epoch": 1188} {"train_loss": -5.658864974975586, "global_step": 49906, "epoch": 1188} {"train_loss": -5.764312267303467, "global_step": 49907, "epoch": 1188} {"train_loss": -5.820711612701416, "global_step": 49908, "epoch": 1188} {"train_loss": -5.559026718139648, "global_step": 49909, "epoch": 1188} {"train_loss": -5.894837379455566, "global_step": 49910, "epoch": 1188} {"train_loss": -5.860664367675781, "global_step": 49911, "epoch": 1188} {"train_loss": -5.748226165771484, "global_step": 49912, "epoch": 1188} {"train_loss": -5.773303031921387, "global_step": 49913, "epoch": 1188} {"train_loss": -5.614398002624512, "global_step": 49914, "epoch": 1188} {"train_loss": -5.773682594299316, "global_step": 49915, "epoch": 1188} {"train_loss": -5.811641693115234, "global_step": 49916, "epoch": 1188} {"train_loss": -5.838778495788574, "global_step": 49917, "epoch": 1188} {"train_loss": -5.864153861999512, "global_step": 49918, "epoch": 1188} {"train_loss": -5.723634243011475, "global_step": 49919, "epoch": 1188} {"train_loss": -5.839611530303955, "global_step": 49920, "epoch": 1188} {"train_loss": -5.72149133682251, "global_step": 49921, "epoch": 1188} {"train_loss": -5.679647445678711, "global_step": 49922, "epoch": 1188} {"train_loss": -5.779991626739502, "global_step": 49923, "epoch": 1188} {"train_loss": -5.743829727172852, "global_step": 49924, "epoch": 1188} {"train_loss": -5.690258026123047, "global_step": 49925, "epoch": 1188} {"train_loss": -5.7157392501831055, "global_step": 49926, "epoch": 1188} {"train_loss": -5.623497009277344, "global_step": 49927, "epoch": 1188} {"train_loss": -5.82703161239624, "global_step": 49928, "epoch": 1188} {"train_loss": -5.660408020019531, "global_step": 49929, "epoch": 1188} {"train_loss": -5.765591144561768, "global_step": 49930, "epoch": 1188} {"train_loss": -5.7725019454956055, "global_step": 49931, "epoch": 1188} {"train_loss": -5.8686723709106445, "global_step": 49932, "epoch": 1188} {"train_loss": -5.696035861968994, "global_step": 49933, "epoch": 1188} {"train_loss": -5.762620449066162, "global_step": 49934, "epoch": 1188} {"train_loss": -5.774277687072754, "global_step": 49935, "epoch": 1188} {"train_loss": -5.768251419067383, "global_step": 49936, "epoch": 1188} {"train_loss": -5.756252504530407, "global_step": 49937, "epoch": 1188, "val_loss": 66345.6796875} {"train_loss": -5.834336757659912, "global_step": 49938, "epoch": 1189} {"train_loss": -5.71561861038208, "global_step": 49939, "epoch": 1189} {"train_loss": -5.811094284057617, "global_step": 49940, "epoch": 1189} {"train_loss": -5.83446741104126, "global_step": 49941, "epoch": 1189} {"train_loss": -5.831596374511719, "global_step": 49942, "epoch": 1189} {"train_loss": -5.785552024841309, "global_step": 49943, "epoch": 1189} {"train_loss": -5.752460479736328, "global_step": 49944, "epoch": 1189} {"train_loss": -5.734946250915527, "global_step": 49945, "epoch": 1189} {"train_loss": -5.805837154388428, "global_step": 49946, "epoch": 1189} {"train_loss": -5.738918304443359, "global_step": 49947, "epoch": 1189} {"train_loss": -5.8074750900268555, "global_step": 49948, "epoch": 1189} {"train_loss": -5.7373151779174805, "global_step": 49949, "epoch": 1189} {"train_loss": -5.787821292877197, "global_step": 49950, "epoch": 1189} {"train_loss": -5.764729976654053, "global_step": 49951, "epoch": 1189} {"train_loss": -5.752975940704346, "global_step": 49952, "epoch": 1189} {"train_loss": -5.7757954597473145, "global_step": 49953, "epoch": 1189} {"train_loss": -5.838149070739746, "global_step": 49954, "epoch": 1189} {"train_loss": -5.697319030761719, "global_step": 49955, "epoch": 1189} {"train_loss": -5.748116493225098, "global_step": 49956, "epoch": 1189} {"train_loss": -5.69059944152832, "global_step": 49957, "epoch": 1189} {"train_loss": -5.863020896911621, "global_step": 49958, "epoch": 1189} {"train_loss": -5.795831203460693, "global_step": 49959, "epoch": 1189} {"train_loss": -5.690433502197266, "global_step": 49960, "epoch": 1189} {"train_loss": -5.745128631591797, "global_step": 49961, "epoch": 1189} {"train_loss": -5.808154106140137, "global_step": 49962, "epoch": 1189} {"train_loss": -5.873166561126709, "global_step": 49963, "epoch": 1189} {"train_loss": -5.782740592956543, "global_step": 49964, "epoch": 1189} {"train_loss": -5.759311199188232, "global_step": 49965, "epoch": 1189} {"train_loss": -5.759810924530029, "global_step": 49966, "epoch": 1189} {"train_loss": -5.738885402679443, "global_step": 49967, "epoch": 1189} {"train_loss": -5.791470527648926, "global_step": 49968, "epoch": 1189} {"train_loss": -5.7847137451171875, "global_step": 49969, "epoch": 1189} {"train_loss": -5.717999458312988, "global_step": 49970, "epoch": 1189} {"train_loss": -5.812647819519043, "global_step": 49971, "epoch": 1189} {"train_loss": -5.707694053649902, "global_step": 49972, "epoch": 1189} {"train_loss": -5.773978233337402, "global_step": 49973, "epoch": 1189} {"train_loss": -5.641193866729736, "global_step": 49974, "epoch": 1189} {"train_loss": -5.7918596267700195, "global_step": 49975, "epoch": 1189} {"train_loss": -5.746106147766113, "global_step": 49976, "epoch": 1189} {"train_loss": -5.757240295410156, "global_step": 49977, "epoch": 1189} {"train_loss": -5.699702262878418, "global_step": 49978, "epoch": 1189} {"train_loss": -5.768694366727557, "global_step": 49979, "epoch": 1189, "val_loss": 66067.875} {"train_loss": -5.814742088317871, "global_step": 49980, "epoch": 1190} {"train_loss": -5.803601264953613, "global_step": 49981, "epoch": 1190} {"train_loss": -5.780434608459473, "global_step": 49982, "epoch": 1190} {"train_loss": -5.7204365730285645, "global_step": 49983, "epoch": 1190} {"train_loss": -5.763137340545654, "global_step": 49984, "epoch": 1190} {"train_loss": -5.6940083503723145, "global_step": 49985, "epoch": 1190} {"train_loss": -5.736299991607666, "global_step": 49986, "epoch": 1190} {"train_loss": -5.786725044250488, "global_step": 49987, "epoch": 1190} {"train_loss": -5.748699188232422, "global_step": 49988, "epoch": 1190} {"train_loss": -5.7028069496154785, "global_step": 49989, "epoch": 1190} {"train_loss": -5.805872917175293, "global_step": 49990, "epoch": 1190} {"train_loss": -5.744534492492676, "global_step": 49991, "epoch": 1190} {"train_loss": -5.718818664550781, "global_step": 49992, "epoch": 1190} {"train_loss": -5.6528544425964355, "global_step": 49993, "epoch": 1190} {"train_loss": -5.663084983825684, "global_step": 49994, "epoch": 1190} {"train_loss": -5.811476707458496, "global_step": 49995, "epoch": 1190} {"train_loss": -5.714997291564941, "global_step": 49996, "epoch": 1190} {"train_loss": -5.724376201629639, "global_step": 49997, "epoch": 1190} {"train_loss": -5.938631534576416, "global_step": 49998, "epoch": 1190} {"train_loss": -5.572909355163574, "global_step": 49999, "epoch": 1190} {"train_loss": -5.78187370300293, "global_step": 50000, "epoch": 1190} {"train_loss": -5.76028299331665, "global_step": 50001, "epoch": 1190} {"train_loss": -5.735491752624512, "global_step": 50002, "epoch": 1190} {"train_loss": -5.825197219848633, "global_step": 50003, "epoch": 1190} {"train_loss": -5.659050941467285, "global_step": 50004, "epoch": 1190} {"train_loss": -5.717085838317871, "global_step": 50005, "epoch": 1190} {"train_loss": -5.778801441192627, "global_step": 50006, "epoch": 1190} {"train_loss": -5.873438835144043, "global_step": 50007, "epoch": 1190} {"train_loss": -5.78798246383667, "global_step": 50008, "epoch": 1190} {"train_loss": -5.577861785888672, "global_step": 50009, "epoch": 1190} {"train_loss": -5.839446067810059, "global_step": 50010, "epoch": 1190} {"train_loss": -5.728795051574707, "global_step": 50011, "epoch": 1190} {"train_loss": -5.7242021560668945, "global_step": 50012, "epoch": 1190} {"train_loss": -5.778908729553223, "global_step": 50013, "epoch": 1190} {"train_loss": -5.746577262878418, "global_step": 50014, "epoch": 1190} {"train_loss": -5.770203590393066, "global_step": 50015, "epoch": 1190} {"train_loss": -5.7609357833862305, "global_step": 50016, "epoch": 1190} {"train_loss": -5.897655963897705, "global_step": 50017, "epoch": 1190} {"train_loss": -5.703677654266357, "global_step": 50018, "epoch": 1190} {"train_loss": -5.710855007171631, "global_step": 50019, "epoch": 1190} {"train_loss": -5.6214141845703125, "global_step": 50020, "epoch": 1190} {"train_loss": -5.748202392033169, "global_step": 50021, "epoch": 1190, "val_loss": 66115.375} {"train_loss": -5.746097087860107, "global_step": 50022, "epoch": 1191} {"train_loss": -5.572202682495117, "global_step": 50023, "epoch": 1191} {"train_loss": -5.71722412109375, "global_step": 50024, "epoch": 1191} {"train_loss": -5.724175453186035, "global_step": 50025, "epoch": 1191} {"train_loss": -5.634909152984619, "global_step": 50026, "epoch": 1191} {"train_loss": -5.802964210510254, "global_step": 50027, "epoch": 1191} {"train_loss": -5.746644020080566, "global_step": 50028, "epoch": 1191} {"train_loss": -5.7840986251831055, "global_step": 50029, "epoch": 1191} {"train_loss": -5.8563947677612305, "global_step": 50030, "epoch": 1191} {"train_loss": -5.780275344848633, "global_step": 50031, "epoch": 1191} {"train_loss": -5.764322280883789, "global_step": 50032, "epoch": 1191} {"train_loss": -5.843360424041748, "global_step": 50033, "epoch": 1191} {"train_loss": -5.7203874588012695, "global_step": 50034, "epoch": 1191} {"train_loss": -5.788215160369873, "global_step": 50035, "epoch": 1191} {"train_loss": -5.838695526123047, "global_step": 50036, "epoch": 1191} {"train_loss": -5.618770599365234, "global_step": 50037, "epoch": 1191} {"train_loss": -5.713133811950684, "global_step": 50038, "epoch": 1191} {"train_loss": -5.865530490875244, "global_step": 50039, "epoch": 1191} {"train_loss": -5.553553581237793, "global_step": 50040, "epoch": 1191} {"train_loss": -5.6013898849487305, "global_step": 50041, "epoch": 1191} {"train_loss": -5.654875755310059, "global_step": 50042, "epoch": 1191} {"train_loss": -5.639082908630371, "global_step": 50043, "epoch": 1191} {"train_loss": -5.738689422607422, "global_step": 50044, "epoch": 1191} {"train_loss": -5.636809349060059, "global_step": 50045, "epoch": 1191} {"train_loss": -5.736921310424805, "global_step": 50046, "epoch": 1191} {"train_loss": -5.726268768310547, "global_step": 50047, "epoch": 1191} {"train_loss": -5.598386764526367, "global_step": 50048, "epoch": 1191} {"train_loss": -5.780242919921875, "global_step": 50049, "epoch": 1191} {"train_loss": -5.675594329833984, "global_step": 50050, "epoch": 1191} {"train_loss": -5.717704772949219, "global_step": 50051, "epoch": 1191} {"train_loss": -5.68198823928833, "global_step": 50052, "epoch": 1191} {"train_loss": -5.894323348999023, "global_step": 50053, "epoch": 1191} {"train_loss": -5.729185104370117, "global_step": 50054, "epoch": 1191} {"train_loss": -5.681607246398926, "global_step": 50055, "epoch": 1191} {"train_loss": -5.698142051696777, "global_step": 50056, "epoch": 1191} {"train_loss": -5.6215057373046875, "global_step": 50057, "epoch": 1191} {"train_loss": -5.705175399780273, "global_step": 50058, "epoch": 1191} {"train_loss": -5.672571659088135, "global_step": 50059, "epoch": 1191} {"train_loss": -5.898714065551758, "global_step": 50060, "epoch": 1191} {"train_loss": -5.644529342651367, "global_step": 50061, "epoch": 1191} {"train_loss": -5.673059463500977, "global_step": 50062, "epoch": 1191} {"train_loss": -5.717181421461559, "global_step": 50063, "epoch": 1191, "val_loss": 66211.1796875} {"train_loss": -5.720174789428711, "global_step": 50064, "epoch": 1192} {"train_loss": -5.785219192504883, "global_step": 50065, "epoch": 1192} {"train_loss": -5.711056709289551, "global_step": 50066, "epoch": 1192} {"train_loss": -5.687681674957275, "global_step": 50067, "epoch": 1192} {"train_loss": -5.614227294921875, "global_step": 50068, "epoch": 1192} {"train_loss": -5.755143642425537, "global_step": 50069, "epoch": 1192} {"train_loss": -5.902268886566162, "global_step": 50070, "epoch": 1192} {"train_loss": -5.721011161804199, "global_step": 50071, "epoch": 1192} {"train_loss": -5.675116539001465, "global_step": 50072, "epoch": 1192} {"train_loss": -5.786037445068359, "global_step": 50073, "epoch": 1192} {"train_loss": -5.786863327026367, "global_step": 50074, "epoch": 1192} {"train_loss": -5.79705810546875, "global_step": 50075, "epoch": 1192} {"train_loss": -5.839097023010254, "global_step": 50076, "epoch": 1192} {"train_loss": -5.783884525299072, "global_step": 50077, "epoch": 1192} {"train_loss": -5.875360012054443, "global_step": 50078, "epoch": 1192} {"train_loss": -5.750858783721924, "global_step": 50079, "epoch": 1192} {"train_loss": -5.697540283203125, "global_step": 50080, "epoch": 1192} {"train_loss": -5.754807472229004, "global_step": 50081, "epoch": 1192} {"train_loss": -5.707494735717773, "global_step": 50082, "epoch": 1192} {"train_loss": -5.7952494621276855, "global_step": 50083, "epoch": 1192} {"train_loss": -5.743260383605957, "global_step": 50084, "epoch": 1192} {"train_loss": -5.751803398132324, "global_step": 50085, "epoch": 1192} {"train_loss": -5.743154048919678, "global_step": 50086, "epoch": 1192} {"train_loss": -5.705942153930664, "global_step": 50087, "epoch": 1192} {"train_loss": -5.870037078857422, "global_step": 50088, "epoch": 1192} {"train_loss": -5.779642581939697, "global_step": 50089, "epoch": 1192} {"train_loss": -5.759320259094238, "global_step": 50090, "epoch": 1192} {"train_loss": -5.845457077026367, "global_step": 50091, "epoch": 1192} {"train_loss": -5.750720024108887, "global_step": 50092, "epoch": 1192} {"train_loss": -5.782963752746582, "global_step": 50093, "epoch": 1192} {"train_loss": -5.8039045333862305, "global_step": 50094, "epoch": 1192} {"train_loss": -5.764401912689209, "global_step": 50095, "epoch": 1192} {"train_loss": -5.7166361808776855, "global_step": 50096, "epoch": 1192} {"train_loss": -5.829036712646484, "global_step": 50097, "epoch": 1192} {"train_loss": -5.7569756507873535, "global_step": 50098, "epoch": 1192} {"train_loss": -5.774298191070557, "global_step": 50099, "epoch": 1192} {"train_loss": -5.86317777633667, "global_step": 50100, "epoch": 1192} {"train_loss": -5.734438896179199, "global_step": 50101, "epoch": 1192} {"train_loss": -5.650400638580322, "global_step": 50102, "epoch": 1192} {"train_loss": -5.768790245056152, "global_step": 50103, "epoch": 1192} {"train_loss": -5.606087684631348, "global_step": 50104, "epoch": 1192} {"train_loss": -5.759025267192295, "global_step": 50105, "epoch": 1192, "val_loss": 66418.0859375} {"train_loss": -5.78221321105957, "global_step": 50106, "epoch": 1193} {"train_loss": -5.821107864379883, "global_step": 50107, "epoch": 1193} {"train_loss": -5.835129737854004, "global_step": 50108, "epoch": 1193} {"train_loss": -5.678925514221191, "global_step": 50109, "epoch": 1193} {"train_loss": -5.840031623840332, "global_step": 50110, "epoch": 1193} {"train_loss": -5.8115105628967285, "global_step": 50111, "epoch": 1193} {"train_loss": -5.75334358215332, "global_step": 50112, "epoch": 1193} {"train_loss": -5.793687343597412, "global_step": 50113, "epoch": 1193} {"train_loss": -5.758439064025879, "global_step": 50114, "epoch": 1193} {"train_loss": -5.746718406677246, "global_step": 50115, "epoch": 1193} {"train_loss": -5.75111722946167, "global_step": 50116, "epoch": 1193} {"train_loss": -5.683812618255615, "global_step": 50117, "epoch": 1193} {"train_loss": -5.644706726074219, "global_step": 50118, "epoch": 1193} {"train_loss": -5.701803207397461, "global_step": 50119, "epoch": 1193} {"train_loss": -5.714511871337891, "global_step": 50120, "epoch": 1193} {"train_loss": -5.6876606941223145, "global_step": 50121, "epoch": 1193} {"train_loss": -5.896184921264648, "global_step": 50122, "epoch": 1193} {"train_loss": -5.7410078048706055, "global_step": 50123, "epoch": 1193} {"train_loss": -5.871903419494629, "global_step": 50124, "epoch": 1193} {"train_loss": -5.666333198547363, "global_step": 50125, "epoch": 1193} {"train_loss": -5.84274959564209, "global_step": 50126, "epoch": 1193} {"train_loss": -5.831952095031738, "global_step": 50127, "epoch": 1193} {"train_loss": -5.616334915161133, "global_step": 50128, "epoch": 1193} {"train_loss": -5.655512809753418, "global_step": 50129, "epoch": 1193} {"train_loss": -5.68137788772583, "global_step": 50130, "epoch": 1193} {"train_loss": -5.597686767578125, "global_step": 50131, "epoch": 1193} {"train_loss": -5.7955522537231445, "global_step": 50132, "epoch": 1193} {"train_loss": -5.609516143798828, "global_step": 50133, "epoch": 1193} {"train_loss": -5.748588562011719, "global_step": 50134, "epoch": 1193} {"train_loss": -5.761441230773926, "global_step": 50135, "epoch": 1193} {"train_loss": -5.654425621032715, "global_step": 50136, "epoch": 1193} {"train_loss": -5.732778549194336, "global_step": 50137, "epoch": 1193} {"train_loss": -5.60106086730957, "global_step": 50138, "epoch": 1193} {"train_loss": -5.711871147155762, "global_step": 50139, "epoch": 1193} {"train_loss": -5.773810863494873, "global_step": 50140, "epoch": 1193} {"train_loss": -5.701570510864258, "global_step": 50141, "epoch": 1193} {"train_loss": -5.810677528381348, "global_step": 50142, "epoch": 1193} {"train_loss": -5.711467742919922, "global_step": 50143, "epoch": 1193} {"train_loss": -5.73570442199707, "global_step": 50144, "epoch": 1193} {"train_loss": -5.854670524597168, "global_step": 50145, "epoch": 1193} {"train_loss": -5.828386306762695, "global_step": 50146, "epoch": 1193} {"train_loss": -5.739682742527553, "global_step": 50147, "epoch": 1193, "val_loss": 66237.015625} {"train_loss": -5.8407087326049805, "global_step": 50148, "epoch": 1194} {"train_loss": -5.908101558685303, "global_step": 50149, "epoch": 1194} {"train_loss": -5.716764450073242, "global_step": 50150, "epoch": 1194} {"train_loss": -5.9268717765808105, "global_step": 50151, "epoch": 1194} {"train_loss": -5.695291519165039, "global_step": 50152, "epoch": 1194} {"train_loss": -5.792397499084473, "global_step": 50153, "epoch": 1194} {"train_loss": -5.7942705154418945, "global_step": 50154, "epoch": 1194} {"train_loss": -5.761019229888916, "global_step": 50155, "epoch": 1194} {"train_loss": -5.821343898773193, "global_step": 50156, "epoch": 1194} {"train_loss": -5.642340660095215, "global_step": 50157, "epoch": 1194} {"train_loss": -5.755836486816406, "global_step": 50158, "epoch": 1194} {"train_loss": -5.694397926330566, "global_step": 50159, "epoch": 1194} {"train_loss": -5.618640899658203, "global_step": 50160, "epoch": 1194} {"train_loss": -5.729123115539551, "global_step": 50161, "epoch": 1194} {"train_loss": -5.608009338378906, "global_step": 50162, "epoch": 1194} {"train_loss": -5.807445049285889, "global_step": 50163, "epoch": 1194} {"train_loss": -5.817543029785156, "global_step": 50164, "epoch": 1194} {"train_loss": -5.724640846252441, "global_step": 50165, "epoch": 1194} {"train_loss": -5.740691184997559, "global_step": 50166, "epoch": 1194} {"train_loss": -5.816136837005615, "global_step": 50167, "epoch": 1194} {"train_loss": -5.7088847160339355, "global_step": 50168, "epoch": 1194} {"train_loss": -5.756814002990723, "global_step": 50169, "epoch": 1194} {"train_loss": -5.7265625, "global_step": 50170, "epoch": 1194} {"train_loss": -5.7609124183654785, "global_step": 50171, "epoch": 1194} {"train_loss": -5.6590576171875, "global_step": 50172, "epoch": 1194} {"train_loss": -5.691119194030762, "global_step": 50173, "epoch": 1194} {"train_loss": -5.821227550506592, "global_step": 50174, "epoch": 1194} {"train_loss": -5.785438537597656, "global_step": 50175, "epoch": 1194} {"train_loss": -5.675239086151123, "global_step": 50176, "epoch": 1194} {"train_loss": -5.75673770904541, "global_step": 50177, "epoch": 1194} {"train_loss": -5.866078853607178, "global_step": 50178, "epoch": 1194} {"train_loss": -5.626646995544434, "global_step": 50179, "epoch": 1194} {"train_loss": -5.735692977905273, "global_step": 50180, "epoch": 1194} {"train_loss": -5.724100589752197, "global_step": 50181, "epoch": 1194} {"train_loss": -5.671182632446289, "global_step": 50182, "epoch": 1194} {"train_loss": -5.834742546081543, "global_step": 50183, "epoch": 1194} {"train_loss": -5.723430633544922, "global_step": 50184, "epoch": 1194} {"train_loss": -5.770296096801758, "global_step": 50185, "epoch": 1194} {"train_loss": -5.8537421226501465, "global_step": 50186, "epoch": 1194} {"train_loss": -5.8734636306762695, "global_step": 50187, "epoch": 1194} {"train_loss": -5.79444694519043, "global_step": 50188, "epoch": 1194} {"train_loss": -5.756941886175246, "global_step": 50189, "epoch": 1194, "val_loss": 66336.8984375} {"train_loss": -5.787944316864014, "global_step": 50190, "epoch": 1195} {"train_loss": -5.723010063171387, "global_step": 50191, "epoch": 1195} {"train_loss": -5.791752338409424, "global_step": 50192, "epoch": 1195} {"train_loss": -5.7410383224487305, "global_step": 50193, "epoch": 1195} {"train_loss": -5.713009357452393, "global_step": 50194, "epoch": 1195} {"train_loss": -5.761674404144287, "global_step": 50195, "epoch": 1195} {"train_loss": -5.618487358093262, "global_step": 50196, "epoch": 1195} {"train_loss": -5.747485637664795, "global_step": 50197, "epoch": 1195} {"train_loss": -5.737448692321777, "global_step": 50198, "epoch": 1195} {"train_loss": -5.632380485534668, "global_step": 50199, "epoch": 1195} {"train_loss": -5.854148864746094, "global_step": 50200, "epoch": 1195} {"train_loss": -5.796894073486328, "global_step": 50201, "epoch": 1195} {"train_loss": -5.81352424621582, "global_step": 50202, "epoch": 1195} {"train_loss": -5.688989639282227, "global_step": 50203, "epoch": 1195} {"train_loss": -5.680527687072754, "global_step": 50204, "epoch": 1195} {"train_loss": -5.811674118041992, "global_step": 50205, "epoch": 1195} {"train_loss": -5.758456230163574, "global_step": 50206, "epoch": 1195} {"train_loss": -5.671587944030762, "global_step": 50207, "epoch": 1195} {"train_loss": -5.70740270614624, "global_step": 50208, "epoch": 1195} {"train_loss": -5.70986270904541, "global_step": 50209, "epoch": 1195} {"train_loss": -5.696037292480469, "global_step": 50210, "epoch": 1195} {"train_loss": -5.787750244140625, "global_step": 50211, "epoch": 1195} {"train_loss": -5.595487594604492, "global_step": 50212, "epoch": 1195} {"train_loss": -5.772724151611328, "global_step": 50213, "epoch": 1195} {"train_loss": -5.570504188537598, "global_step": 50214, "epoch": 1195} {"train_loss": -5.840072154998779, "global_step": 50215, "epoch": 1195} {"train_loss": -5.824263095855713, "global_step": 50216, "epoch": 1195} {"train_loss": -5.794328212738037, "global_step": 50217, "epoch": 1195} {"train_loss": -5.7280073165893555, "global_step": 50218, "epoch": 1195} {"train_loss": -5.796702861785889, "global_step": 50219, "epoch": 1195} {"train_loss": -5.829224109649658, "global_step": 50220, "epoch": 1195} {"train_loss": -5.80023193359375, "global_step": 50221, "epoch": 1195} {"train_loss": -5.739366054534912, "global_step": 50222, "epoch": 1195} {"train_loss": -5.79551887512207, "global_step": 50223, "epoch": 1195} {"train_loss": -5.656488418579102, "global_step": 50224, "epoch": 1195} {"train_loss": -5.791346073150635, "global_step": 50225, "epoch": 1195} {"train_loss": -5.568716049194336, "global_step": 50226, "epoch": 1195} {"train_loss": -5.605534553527832, "global_step": 50227, "epoch": 1195} {"train_loss": -5.914583206176758, "global_step": 50228, "epoch": 1195} {"train_loss": -5.635581016540527, "global_step": 50229, "epoch": 1195} {"train_loss": -5.857566833496094, "global_step": 50230, "epoch": 1195} {"train_loss": -5.740923972356887, "global_step": 50231, "epoch": 1195, "val_loss": 66056.78125} {"train_loss": -5.686181545257568, "global_step": 50232, "epoch": 1196} {"train_loss": -5.773423194885254, "global_step": 50233, "epoch": 1196} {"train_loss": -5.778948783874512, "global_step": 50234, "epoch": 1196} {"train_loss": -5.811595916748047, "global_step": 50235, "epoch": 1196} {"train_loss": -5.6324143409729, "global_step": 50236, "epoch": 1196} {"train_loss": -5.833532333374023, "global_step": 50237, "epoch": 1196} {"train_loss": -5.828543663024902, "global_step": 50238, "epoch": 1196} {"train_loss": -5.733833312988281, "global_step": 50239, "epoch": 1196} {"train_loss": -5.7807111740112305, "global_step": 50240, "epoch": 1196} {"train_loss": -5.844322204589844, "global_step": 50241, "epoch": 1196} {"train_loss": -5.694781303405762, "global_step": 50242, "epoch": 1196} {"train_loss": -5.760880947113037, "global_step": 50243, "epoch": 1196} {"train_loss": -5.7178144454956055, "global_step": 50244, "epoch": 1196} {"train_loss": -5.716156482696533, "global_step": 50245, "epoch": 1196} {"train_loss": -5.808980941772461, "global_step": 50246, "epoch": 1196} {"train_loss": -5.749927520751953, "global_step": 50247, "epoch": 1196} {"train_loss": -5.809605121612549, "global_step": 50248, "epoch": 1196} {"train_loss": -5.848628520965576, "global_step": 50249, "epoch": 1196} {"train_loss": -5.818883419036865, "global_step": 50250, "epoch": 1196} {"train_loss": -5.723689556121826, "global_step": 50251, "epoch": 1196} {"train_loss": -5.810514450073242, "global_step": 50252, "epoch": 1196} {"train_loss": -5.851395606994629, "global_step": 50253, "epoch": 1196} {"train_loss": -5.7669782638549805, "global_step": 50254, "epoch": 1196} {"train_loss": -5.859276294708252, "global_step": 50255, "epoch": 1196} {"train_loss": -5.848865032196045, "global_step": 50256, "epoch": 1196} {"train_loss": -5.756656646728516, "global_step": 50257, "epoch": 1196} {"train_loss": -5.8914923667907715, "global_step": 50258, "epoch": 1196} {"train_loss": -5.760286331176758, "global_step": 50259, "epoch": 1196} {"train_loss": -5.830698013305664, "global_step": 50260, "epoch": 1196} {"train_loss": -5.81503438949585, "global_step": 50261, "epoch": 1196} {"train_loss": -5.863492965698242, "global_step": 50262, "epoch": 1196} {"train_loss": -5.785518646240234, "global_step": 50263, "epoch": 1196} {"train_loss": -5.681614875793457, "global_step": 50264, "epoch": 1196} {"train_loss": -5.877979278564453, "global_step": 50265, "epoch": 1196} {"train_loss": -5.915260314941406, "global_step": 50266, "epoch": 1196} {"train_loss": -5.732913017272949, "global_step": 50267, "epoch": 1196} {"train_loss": -5.795565605163574, "global_step": 50268, "epoch": 1196} {"train_loss": -5.758152008056641, "global_step": 50269, "epoch": 1196} {"train_loss": -5.868915557861328, "global_step": 50270, "epoch": 1196} {"train_loss": -5.745741844177246, "global_step": 50271, "epoch": 1196} {"train_loss": -5.71992826461792, "global_step": 50272, "epoch": 1196} {"train_loss": -5.785006318773542, "global_step": 50273, "epoch": 1196, "val_loss": 66322.78125} {"train_loss": -5.785393714904785, "global_step": 50274, "epoch": 1197} {"train_loss": -5.819890975952148, "global_step": 50275, "epoch": 1197} {"train_loss": -5.72796630859375, "global_step": 50276, "epoch": 1197} {"train_loss": -5.892017841339111, "global_step": 50277, "epoch": 1197} {"train_loss": -5.744918346405029, "global_step": 50278, "epoch": 1197} {"train_loss": -5.905704498291016, "global_step": 50279, "epoch": 1197} {"train_loss": -5.887631893157959, "global_step": 50280, "epoch": 1197} {"train_loss": -5.7922892570495605, "global_step": 50281, "epoch": 1197} {"train_loss": -5.761200904846191, "global_step": 50282, "epoch": 1197} {"train_loss": -5.798739910125732, "global_step": 50283, "epoch": 1197} {"train_loss": -5.755317687988281, "global_step": 50284, "epoch": 1197} {"train_loss": -5.885624408721924, "global_step": 50285, "epoch": 1197} {"train_loss": -5.731206893920898, "global_step": 50286, "epoch": 1197} {"train_loss": -5.668845176696777, "global_step": 50287, "epoch": 1197} {"train_loss": -5.8390984535217285, "global_step": 50288, "epoch": 1197} {"train_loss": -5.7470526695251465, "global_step": 50289, "epoch": 1197} {"train_loss": -5.762498378753662, "global_step": 50290, "epoch": 1197} {"train_loss": -5.6708221435546875, "global_step": 50291, "epoch": 1197} {"train_loss": -5.81915807723999, "global_step": 50292, "epoch": 1197} {"train_loss": -5.711231231689453, "global_step": 50293, "epoch": 1197} {"train_loss": -5.676775932312012, "global_step": 50294, "epoch": 1197} {"train_loss": -5.710881233215332, "global_step": 50295, "epoch": 1197} {"train_loss": -5.858842849731445, "global_step": 50296, "epoch": 1197} {"train_loss": -5.7540202140808105, "global_step": 50297, "epoch": 1197} {"train_loss": -5.71613883972168, "global_step": 50298, "epoch": 1197} {"train_loss": -5.697040557861328, "global_step": 50299, "epoch": 1197} {"train_loss": -5.787550449371338, "global_step": 50300, "epoch": 1197} {"train_loss": -5.7150468826293945, "global_step": 50301, "epoch": 1197} {"train_loss": -5.734713554382324, "global_step": 50302, "epoch": 1197} {"train_loss": -5.750804901123047, "global_step": 50303, "epoch": 1197} {"train_loss": -5.714719295501709, "global_step": 50304, "epoch": 1197} {"train_loss": -5.696699142456055, "global_step": 50305, "epoch": 1197} {"train_loss": -5.743495941162109, "global_step": 50306, "epoch": 1197} {"train_loss": -5.729007720947266, "global_step": 50307, "epoch": 1197} {"train_loss": -5.753366470336914, "global_step": 50308, "epoch": 1197} {"train_loss": -5.611271858215332, "global_step": 50309, "epoch": 1197} {"train_loss": -5.725114822387695, "global_step": 50310, "epoch": 1197} {"train_loss": -5.775221824645996, "global_step": 50311, "epoch": 1197} {"train_loss": -5.795498371124268, "global_step": 50312, "epoch": 1197} {"train_loss": -5.723208904266357, "global_step": 50313, "epoch": 1197} {"train_loss": -5.800171852111816, "global_step": 50314, "epoch": 1197} {"train_loss": -5.761298418045044, "global_step": 50315, "epoch": 1197, "val_loss": 66261.578125} {"train_loss": -5.774462699890137, "global_step": 50316, "epoch": 1198} {"train_loss": -5.77647590637207, "global_step": 50317, "epoch": 1198} {"train_loss": -5.820635795593262, "global_step": 50318, "epoch": 1198} {"train_loss": -5.704496383666992, "global_step": 50319, "epoch": 1198} {"train_loss": -5.836845397949219, "global_step": 50320, "epoch": 1198} {"train_loss": -5.732568264007568, "global_step": 50321, "epoch": 1198} {"train_loss": -5.83528995513916, "global_step": 50322, "epoch": 1198} {"train_loss": -5.671902179718018, "global_step": 50323, "epoch": 1198} {"train_loss": -5.808600425720215, "global_step": 50324, "epoch": 1198} {"train_loss": -5.895069122314453, "global_step": 50325, "epoch": 1198} {"train_loss": -5.792518615722656, "global_step": 50326, "epoch": 1198} {"train_loss": -5.757709980010986, "global_step": 50327, "epoch": 1198} {"train_loss": -5.797061920166016, "global_step": 50328, "epoch": 1198} {"train_loss": -5.727683067321777, "global_step": 50329, "epoch": 1198} {"train_loss": -5.79327392578125, "global_step": 50330, "epoch": 1198} {"train_loss": -5.722380638122559, "global_step": 50331, "epoch": 1198} {"train_loss": -5.733845233917236, "global_step": 50332, "epoch": 1198} {"train_loss": -5.748117446899414, "global_step": 50333, "epoch": 1198} {"train_loss": -5.8721771240234375, "global_step": 50334, "epoch": 1198} {"train_loss": -5.77391242980957, "global_step": 50335, "epoch": 1198} {"train_loss": -5.84085750579834, "global_step": 50336, "epoch": 1198} {"train_loss": -5.7469282150268555, "global_step": 50337, "epoch": 1198} {"train_loss": -5.7752838134765625, "global_step": 50338, "epoch": 1198} {"train_loss": -5.778451442718506, "global_step": 50339, "epoch": 1198} {"train_loss": -5.733424186706543, "global_step": 50340, "epoch": 1198} {"train_loss": -5.7356061935424805, "global_step": 50341, "epoch": 1198} {"train_loss": -5.841557025909424, "global_step": 50342, "epoch": 1198} {"train_loss": -5.713809013366699, "global_step": 50343, "epoch": 1198} {"train_loss": -5.817130088806152, "global_step": 50344, "epoch": 1198} {"train_loss": -5.746877193450928, "global_step": 50345, "epoch": 1198} {"train_loss": -5.808420658111572, "global_step": 50346, "epoch": 1198} {"train_loss": -5.778451442718506, "global_step": 50347, "epoch": 1198} {"train_loss": -5.854851722717285, "global_step": 50348, "epoch": 1198} {"train_loss": -5.835664749145508, "global_step": 50349, "epoch": 1198} {"train_loss": -5.792304992675781, "global_step": 50350, "epoch": 1198} {"train_loss": -5.892086029052734, "global_step": 50351, "epoch": 1198} {"train_loss": -5.759692668914795, "global_step": 50352, "epoch": 1198} {"train_loss": -5.726813316345215, "global_step": 50353, "epoch": 1198} {"train_loss": -5.712262153625488, "global_step": 50354, "epoch": 1198} {"train_loss": -5.824816703796387, "global_step": 50355, "epoch": 1198} {"train_loss": -5.767500877380371, "global_step": 50356, "epoch": 1198} {"train_loss": -5.78031341234843, "global_step": 50357, "epoch": 1198, "val_loss": 66123.2890625} {"train_loss": -5.741129398345947, "global_step": 50358, "epoch": 1199} {"train_loss": -5.83060359954834, "global_step": 50359, "epoch": 1199} {"train_loss": -5.7859206199646, "global_step": 50360, "epoch": 1199} {"train_loss": -5.741333961486816, "global_step": 50361, "epoch": 1199} {"train_loss": -5.843644142150879, "global_step": 50362, "epoch": 1199} {"train_loss": -5.891232490539551, "global_step": 50363, "epoch": 1199} {"train_loss": -5.875265121459961, "global_step": 50364, "epoch": 1199} {"train_loss": -5.759603500366211, "global_step": 50365, "epoch": 1199} {"train_loss": -5.787923812866211, "global_step": 50366, "epoch": 1199} {"train_loss": -5.814420700073242, "global_step": 50367, "epoch": 1199} {"train_loss": -5.7676777839660645, "global_step": 50368, "epoch": 1199} {"train_loss": -5.748083591461182, "global_step": 50369, "epoch": 1199} {"train_loss": -5.766253471374512, "global_step": 50370, "epoch": 1199} {"train_loss": -5.8235273361206055, "global_step": 50371, "epoch": 1199} {"train_loss": -5.769767761230469, "global_step": 50372, "epoch": 1199} {"train_loss": -5.714859485626221, "global_step": 50373, "epoch": 1199} {"train_loss": -5.682526588439941, "global_step": 50374, "epoch": 1199} {"train_loss": -5.734853744506836, "global_step": 50375, "epoch": 1199} {"train_loss": -5.732645034790039, "global_step": 50376, "epoch": 1199} {"train_loss": -5.865706443786621, "global_step": 50377, "epoch": 1199} {"train_loss": -5.79293155670166, "global_step": 50378, "epoch": 1199} {"train_loss": -5.754124641418457, "global_step": 50379, "epoch": 1199} {"train_loss": -5.784246444702148, "global_step": 50380, "epoch": 1199} {"train_loss": -5.854458332061768, "global_step": 50381, "epoch": 1199} {"train_loss": -5.7689104080200195, "global_step": 50382, "epoch": 1199} {"train_loss": -5.728699207305908, "global_step": 50383, "epoch": 1199} {"train_loss": -5.782653331756592, "global_step": 50384, "epoch": 1199} {"train_loss": -5.845590114593506, "global_step": 50385, "epoch": 1199} {"train_loss": -5.656731605529785, "global_step": 50386, "epoch": 1199} {"train_loss": -5.819916725158691, "global_step": 50387, "epoch": 1199} {"train_loss": -5.679396152496338, "global_step": 50388, "epoch": 1199} {"train_loss": -5.687967777252197, "global_step": 50389, "epoch": 1199} {"train_loss": -5.7856125831604, "global_step": 50390, "epoch": 1199} {"train_loss": -5.6722211837768555, "global_step": 50391, "epoch": 1199} {"train_loss": -5.736953258514404, "global_step": 50392, "epoch": 1199} {"train_loss": -5.700475692749023, "global_step": 50393, "epoch": 1199} {"train_loss": -5.705908298492432, "global_step": 50394, "epoch": 1199} {"train_loss": -5.761944770812988, "global_step": 50395, "epoch": 1199} {"train_loss": -5.858641147613525, "global_step": 50396, "epoch": 1199} {"train_loss": -5.869308948516846, "global_step": 50397, "epoch": 1199} {"train_loss": -5.760141372680664, "global_step": 50398, "epoch": 1199} {"train_loss": -5.773619050071353, "global_step": 50399, "epoch": 1199, "val_loss": 66241.984375} {"train_loss": -5.730247974395752, "global_step": 50400, "epoch": 1200} {"train_loss": -5.790098667144775, "global_step": 50401, "epoch": 1200} {"train_loss": -5.801058769226074, "global_step": 50402, "epoch": 1200} {"train_loss": -5.659142017364502, "global_step": 50403, "epoch": 1200} {"train_loss": -5.8001933097839355, "global_step": 50404, "epoch": 1200} {"train_loss": -5.771069526672363, "global_step": 50405, "epoch": 1200} {"train_loss": -5.654913902282715, "global_step": 50406, "epoch": 1200} {"train_loss": -5.859268665313721, "global_step": 50407, "epoch": 1200} {"train_loss": -5.666530132293701, "global_step": 50408, "epoch": 1200} {"train_loss": -5.935422897338867, "global_step": 50409, "epoch": 1200} {"train_loss": -5.710054397583008, "global_step": 50410, "epoch": 1200} {"train_loss": -5.764708518981934, "global_step": 50411, "epoch": 1200} {"train_loss": -5.790013790130615, "global_step": 50412, "epoch": 1200} {"train_loss": -5.8020782470703125, "global_step": 50413, "epoch": 1200} {"train_loss": -5.798398971557617, "global_step": 50414, "epoch": 1200} {"train_loss": -5.783219814300537, "global_step": 50415, "epoch": 1200} {"train_loss": -5.721916675567627, "global_step": 50416, "epoch": 1200} {"train_loss": -5.871390342712402, "global_step": 50417, "epoch": 1200} {"train_loss": -5.761788845062256, "global_step": 50418, "epoch": 1200} {"train_loss": -5.755013942718506, "global_step": 50419, "epoch": 1200} {"train_loss": -5.789611339569092, "global_step": 50420, "epoch": 1200} {"train_loss": -5.744264125823975, "global_step": 50421, "epoch": 1200} {"train_loss": -5.837289810180664, "global_step": 50422, "epoch": 1200} {"train_loss": -5.719196319580078, "global_step": 50423, "epoch": 1200} {"train_loss": -5.795557975769043, "global_step": 50424, "epoch": 1200} {"train_loss": -5.76506233215332, "global_step": 50425, "epoch": 1200} {"train_loss": -5.850759029388428, "global_step": 50426, "epoch": 1200} {"train_loss": -5.72576379776001, "global_step": 50427, "epoch": 1200} {"train_loss": -5.794781684875488, "global_step": 50428, "epoch": 1200} {"train_loss": -5.73193359375, "global_step": 50429, "epoch": 1200} {"train_loss": -5.845643043518066, "global_step": 50430, "epoch": 1200} {"train_loss": -5.800383567810059, "global_step": 50431, "epoch": 1200} {"train_loss": -5.889153480529785, "global_step": 50432, "epoch": 1200} {"train_loss": -5.705286502838135, "global_step": 50433, "epoch": 1200} {"train_loss": -5.704641342163086, "global_step": 50434, "epoch": 1200} {"train_loss": -5.761363983154297, "global_step": 50435, "epoch": 1200} {"train_loss": -5.693756103515625, "global_step": 50436, "epoch": 1200} {"train_loss": -5.8296966552734375, "global_step": 50437, "epoch": 1200} {"train_loss": -5.709970951080322, "global_step": 50438, "epoch": 1200} {"train_loss": -5.710763454437256, "global_step": 50439, "epoch": 1200} {"train_loss": -5.807259559631348, "global_step": 50440, "epoch": 1200} {"train_loss": -5.7714033126831055, "global_step": 50441, "epoch": 1200, "train/sim_max_reward_0": 0.4226401274528654, "train/sim_max_reward_1": 0.09059443174170007, "train/sim_max_reward_2": 0.5411459854504336, "train/sim_max_reward_3": 0.165902105941985, "train/sim_max_reward_4": 0.9625709686251088, "train/sim_max_reward_5": 0.5632833719283391, "test/sim_max_reward_4400000": 0.289709067621725, "test/sim_max_reward_4400001": 0.7694499714547083, "test/sim_max_reward_4400002": 0.06162358249066209, "test/sim_max_reward_4400003": 0.5816957563104403, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.2119357040349598, "test/sim_max_reward_4400006": 0.33541134767134806, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.5079724907412191, "test/sim_max_reward_4400009": 0.42560924825265356, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.23598362524395614, "test/sim_max_reward_4400012": 0.6322701519080639, "test/sim_max_reward_4400013": 0.3518000663430836, "test/sim_max_reward_4400014": 0.3037854548789058, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.393365910382999, "test/sim_max_reward_4400019": 0.043209922198856165, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.8408256637713759, "test/sim_max_reward_4400022": 0.9195940789275396, "test/sim_max_reward_4400023": 0.47783506703113404, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.11553442849791236, "test/sim_max_reward_4400027": 0.011390123669875293, "test/sim_max_reward_4400028": 0.419536341199062, "test/sim_max_reward_4400029": 0.47721084908037764, "test/sim_max_reward_4400030": 0.3803555527299556, "test/sim_max_reward_4400031": 0.8041617344726083, "test/sim_max_reward_4400032": 0.127526287599278, "test/sim_max_reward_4400033": 0.19347769274320695, "test/sim_max_reward_4400034": 0.7889847385794687, "test/sim_max_reward_4400035": 0.4677669445949415, "test/sim_max_reward_4400036": 0.8764416896579555, "test/sim_max_reward_4400037": 0.9258668934069602, "test/sim_max_reward_4400038": 0.13657331054721272, "test/sim_max_reward_4400039": 0.852282626823331, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5563825425955593, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.7598504368146013, "test/sim_max_reward_4400044": 0.3609579544093562, "test/sim_max_reward_4400045": 0.8918806554742805, "test/sim_max_reward_4400046": 0.5729155787239774, "test/sim_max_reward_4400047": 0.7438056309016677, "test/sim_max_reward_4400048": 0.3339486899480841, "test/sim_max_reward_4400049": 0.18837277399439672, "train/mean_score": 0.4576894985234053, "test/mean_score": 0.3784063889520581, "val_loss": 66368.5859375} {"train_loss": -5.835638523101807, "global_step": 50442, "epoch": 1201} {"train_loss": -5.812248229980469, "global_step": 50443, "epoch": 1201} {"train_loss": -5.811497688293457, "global_step": 50444, "epoch": 1201} {"train_loss": -5.651450157165527, "global_step": 50445, "epoch": 1201} {"train_loss": -5.856222152709961, "global_step": 50446, "epoch": 1201} {"train_loss": -5.689109802246094, "global_step": 50447, "epoch": 1201} {"train_loss": -5.782562732696533, "global_step": 50448, "epoch": 1201} {"train_loss": -5.682554721832275, "global_step": 50449, "epoch": 1201} {"train_loss": -5.758096694946289, "global_step": 50450, "epoch": 1201} {"train_loss": -5.705538749694824, "global_step": 50451, "epoch": 1201} {"train_loss": -5.825915336608887, "global_step": 50452, "epoch": 1201} {"train_loss": -5.6818389892578125, "global_step": 50453, "epoch": 1201} {"train_loss": -5.690195083618164, "global_step": 50454, "epoch": 1201} {"train_loss": -5.791745185852051, "global_step": 50455, "epoch": 1201} {"train_loss": -5.711201190948486, "global_step": 50456, "epoch": 1201} {"train_loss": -5.752532958984375, "global_step": 50457, "epoch": 1201} {"train_loss": -5.786845684051514, "global_step": 50458, "epoch": 1201} {"train_loss": -5.7814788818359375, "global_step": 50459, "epoch": 1201} {"train_loss": -5.650975704193115, "global_step": 50460, "epoch": 1201} {"train_loss": -5.782665729522705, "global_step": 50461, "epoch": 1201} {"train_loss": -5.611516952514648, "global_step": 50462, "epoch": 1201} {"train_loss": -5.710033893585205, "global_step": 50463, "epoch": 1201} {"train_loss": -5.723053932189941, "global_step": 50464, "epoch": 1201} {"train_loss": -5.815650939941406, "global_step": 50465, "epoch": 1201} {"train_loss": -5.834470748901367, "global_step": 50466, "epoch": 1201} {"train_loss": -5.897268295288086, "global_step": 50467, "epoch": 1201} {"train_loss": -5.730526447296143, "global_step": 50468, "epoch": 1201} {"train_loss": -5.761988639831543, "global_step": 50469, "epoch": 1201} {"train_loss": -5.657309532165527, "global_step": 50470, "epoch": 1201} {"train_loss": -5.724577903747559, "global_step": 50471, "epoch": 1201} {"train_loss": -5.799227714538574, "global_step": 50472, "epoch": 1201} {"train_loss": -5.851317405700684, "global_step": 50473, "epoch": 1201} {"train_loss": -5.823967933654785, "global_step": 50474, "epoch": 1201} {"train_loss": -5.656539440155029, "global_step": 50475, "epoch": 1201} {"train_loss": -5.765280723571777, "global_step": 50476, "epoch": 1201} {"train_loss": -5.710219383239746, "global_step": 50477, "epoch": 1201} {"train_loss": -5.660499572753906, "global_step": 50478, "epoch": 1201} {"train_loss": -5.74643087387085, "global_step": 50479, "epoch": 1201} {"train_loss": -5.576084136962891, "global_step": 50480, "epoch": 1201} {"train_loss": -5.627769470214844, "global_step": 50481, "epoch": 1201} {"train_loss": -5.677672863006592, "global_step": 50482, "epoch": 1201} {"train_loss": -5.738540547234671, "global_step": 50483, "epoch": 1201, "val_loss": 66409.7109375} {"train_loss": -5.628558158874512, "global_step": 50484, "epoch": 1202} {"train_loss": -5.759612083435059, "global_step": 50485, "epoch": 1202} {"train_loss": -5.842304706573486, "global_step": 50486, "epoch": 1202} {"train_loss": -5.701970100402832, "global_step": 50487, "epoch": 1202} {"train_loss": -5.817996025085449, "global_step": 50488, "epoch": 1202} {"train_loss": -5.822493553161621, "global_step": 50489, "epoch": 1202} {"train_loss": -5.869868278503418, "global_step": 50490, "epoch": 1202} {"train_loss": -5.750732898712158, "global_step": 50491, "epoch": 1202} {"train_loss": -5.928997039794922, "global_step": 50492, "epoch": 1202} {"train_loss": -5.6606855392456055, "global_step": 50493, "epoch": 1202} {"train_loss": -5.623520851135254, "global_step": 50494, "epoch": 1202} {"train_loss": -5.784308433532715, "global_step": 50495, "epoch": 1202} {"train_loss": -5.712693214416504, "global_step": 50496, "epoch": 1202} {"train_loss": -5.683307647705078, "global_step": 50497, "epoch": 1202} {"train_loss": -5.812793731689453, "global_step": 50498, "epoch": 1202} {"train_loss": -5.8936262130737305, "global_step": 50499, "epoch": 1202} {"train_loss": -5.748569488525391, "global_step": 50500, "epoch": 1202} {"train_loss": -5.737011909484863, "global_step": 50501, "epoch": 1202} {"train_loss": -5.648340225219727, "global_step": 50502, "epoch": 1202} {"train_loss": -5.695317268371582, "global_step": 50503, "epoch": 1202} {"train_loss": -5.641881942749023, "global_step": 50504, "epoch": 1202} {"train_loss": -5.7138800621032715, "global_step": 50505, "epoch": 1202} {"train_loss": -5.7222580909729, "global_step": 50506, "epoch": 1202} {"train_loss": -5.816210746765137, "global_step": 50507, "epoch": 1202} {"train_loss": -5.892780303955078, "global_step": 50508, "epoch": 1202} {"train_loss": -5.7226762771606445, "global_step": 50509, "epoch": 1202} {"train_loss": -5.760821342468262, "global_step": 50510, "epoch": 1202} {"train_loss": -5.791111469268799, "global_step": 50511, "epoch": 1202} {"train_loss": -5.766951560974121, "global_step": 50512, "epoch": 1202} {"train_loss": -5.721929550170898, "global_step": 50513, "epoch": 1202} {"train_loss": -5.820154190063477, "global_step": 50514, "epoch": 1202} {"train_loss": -5.8235368728637695, "global_step": 50515, "epoch": 1202} {"train_loss": -5.811123371124268, "global_step": 50516, "epoch": 1202} {"train_loss": -5.762089729309082, "global_step": 50517, "epoch": 1202} {"train_loss": -5.856784820556641, "global_step": 50518, "epoch": 1202} {"train_loss": -5.888222694396973, "global_step": 50519, "epoch": 1202} {"train_loss": -5.886258125305176, "global_step": 50520, "epoch": 1202} {"train_loss": -5.8443098068237305, "global_step": 50521, "epoch": 1202} {"train_loss": -5.722471714019775, "global_step": 50522, "epoch": 1202} {"train_loss": -5.640898704528809, "global_step": 50523, "epoch": 1202} {"train_loss": -5.6832427978515625, "global_step": 50524, "epoch": 1202} {"train_loss": -5.765664793196178, "global_step": 50525, "epoch": 1202, "val_loss": 66452.7578125} {"train_loss": -5.765241622924805, "global_step": 50526, "epoch": 1203} {"train_loss": -5.79770040512085, "global_step": 50527, "epoch": 1203} {"train_loss": -5.624192237854004, "global_step": 50528, "epoch": 1203} {"train_loss": -5.772859573364258, "global_step": 50529, "epoch": 1203} {"train_loss": -5.777600288391113, "global_step": 50530, "epoch": 1203} {"train_loss": -5.845183372497559, "global_step": 50531, "epoch": 1203} {"train_loss": -5.879479885101318, "global_step": 50532, "epoch": 1203} {"train_loss": -5.6521148681640625, "global_step": 50533, "epoch": 1203} {"train_loss": -5.823167324066162, "global_step": 50534, "epoch": 1203} {"train_loss": -5.7895002365112305, "global_step": 50535, "epoch": 1203} {"train_loss": -5.817348480224609, "global_step": 50536, "epoch": 1203} {"train_loss": -5.729965686798096, "global_step": 50537, "epoch": 1203} {"train_loss": -5.806269645690918, "global_step": 50538, "epoch": 1203} {"train_loss": -5.710660934448242, "global_step": 50539, "epoch": 1203} {"train_loss": -5.715753555297852, "global_step": 50540, "epoch": 1203} {"train_loss": -5.730356216430664, "global_step": 50541, "epoch": 1203} {"train_loss": -5.658722400665283, "global_step": 50542, "epoch": 1203} {"train_loss": -5.776912689208984, "global_step": 50543, "epoch": 1203} {"train_loss": -5.986502647399902, "global_step": 50544, "epoch": 1203} {"train_loss": -5.775367736816406, "global_step": 50545, "epoch": 1203} {"train_loss": -5.839937686920166, "global_step": 50546, "epoch": 1203} {"train_loss": -5.596429347991943, "global_step": 50547, "epoch": 1203} {"train_loss": -5.782257080078125, "global_step": 50548, "epoch": 1203} {"train_loss": -5.665070533752441, "global_step": 50549, "epoch": 1203} {"train_loss": -5.806950569152832, "global_step": 50550, "epoch": 1203} {"train_loss": -5.70497989654541, "global_step": 50551, "epoch": 1203} {"train_loss": -5.641390800476074, "global_step": 50552, "epoch": 1203} {"train_loss": -5.77644681930542, "global_step": 50553, "epoch": 1203} {"train_loss": -5.740415573120117, "global_step": 50554, "epoch": 1203} {"train_loss": -5.739451885223389, "global_step": 50555, "epoch": 1203} {"train_loss": -5.77596378326416, "global_step": 50556, "epoch": 1203} {"train_loss": -5.743283271789551, "global_step": 50557, "epoch": 1203} {"train_loss": -5.7142438888549805, "global_step": 50558, "epoch": 1203} {"train_loss": -5.625451564788818, "global_step": 50559, "epoch": 1203} {"train_loss": -5.745190620422363, "global_step": 50560, "epoch": 1203} {"train_loss": -5.701385498046875, "global_step": 50561, "epoch": 1203} {"train_loss": -5.685205459594727, "global_step": 50562, "epoch": 1203} {"train_loss": -5.706757545471191, "global_step": 50563, "epoch": 1203} {"train_loss": -5.82921028137207, "global_step": 50564, "epoch": 1203} {"train_loss": -5.759222507476807, "global_step": 50565, "epoch": 1203} {"train_loss": -5.780606746673584, "global_step": 50566, "epoch": 1203} {"train_loss": -5.7515040919894265, "global_step": 50567, "epoch": 1203, "val_loss": 66073.28125} {"train_loss": -5.639031410217285, "global_step": 50568, "epoch": 1204} {"train_loss": -5.695432186126709, "global_step": 50569, "epoch": 1204} {"train_loss": -5.754269599914551, "global_step": 50570, "epoch": 1204} {"train_loss": -5.681012153625488, "global_step": 50571, "epoch": 1204} {"train_loss": -5.689263343811035, "global_step": 50572, "epoch": 1204} {"train_loss": -5.734567642211914, "global_step": 50573, "epoch": 1204} {"train_loss": -5.660400390625, "global_step": 50574, "epoch": 1204} {"train_loss": -5.797965049743652, "global_step": 50575, "epoch": 1204} {"train_loss": -5.7821455001831055, "global_step": 50576, "epoch": 1204} {"train_loss": -5.7698869705200195, "global_step": 50577, "epoch": 1204} {"train_loss": -5.733384132385254, "global_step": 50578, "epoch": 1204} {"train_loss": -5.781564712524414, "global_step": 50579, "epoch": 1204} {"train_loss": -5.866554260253906, "global_step": 50580, "epoch": 1204} {"train_loss": -5.857903480529785, "global_step": 50581, "epoch": 1204} {"train_loss": -5.634488105773926, "global_step": 50582, "epoch": 1204} {"train_loss": -5.926875114440918, "global_step": 50583, "epoch": 1204} {"train_loss": -5.7423858642578125, "global_step": 50584, "epoch": 1204} {"train_loss": -5.784581661224365, "global_step": 50585, "epoch": 1204} {"train_loss": -5.811296463012695, "global_step": 50586, "epoch": 1204} {"train_loss": -5.790983200073242, "global_step": 50587, "epoch": 1204} {"train_loss": -5.792102813720703, "global_step": 50588, "epoch": 1204} {"train_loss": -5.811619281768799, "global_step": 50589, "epoch": 1204} {"train_loss": -5.715010643005371, "global_step": 50590, "epoch": 1204} {"train_loss": -5.749775409698486, "global_step": 50591, "epoch": 1204} {"train_loss": -5.820749759674072, "global_step": 50592, "epoch": 1204} {"train_loss": -5.697872638702393, "global_step": 50593, "epoch": 1204} {"train_loss": -5.840610504150391, "global_step": 50594, "epoch": 1204} {"train_loss": -5.670874118804932, "global_step": 50595, "epoch": 1204} {"train_loss": -5.810802459716797, "global_step": 50596, "epoch": 1204} {"train_loss": -5.721646308898926, "global_step": 50597, "epoch": 1204} {"train_loss": -5.840120315551758, "global_step": 50598, "epoch": 1204} {"train_loss": -5.782072067260742, "global_step": 50599, "epoch": 1204} {"train_loss": -5.670395851135254, "global_step": 50600, "epoch": 1204} {"train_loss": -5.7753071784973145, "global_step": 50601, "epoch": 1204} {"train_loss": -5.592764377593994, "global_step": 50602, "epoch": 1204} {"train_loss": -5.641989707946777, "global_step": 50603, "epoch": 1204} {"train_loss": -5.773189544677734, "global_step": 50604, "epoch": 1204} {"train_loss": -5.738476276397705, "global_step": 50605, "epoch": 1204} {"train_loss": -5.743325710296631, "global_step": 50606, "epoch": 1204} {"train_loss": -5.877111911773682, "global_step": 50607, "epoch": 1204} {"train_loss": -5.688589572906494, "global_step": 50608, "epoch": 1204} {"train_loss": -5.751070998963856, "global_step": 50609, "epoch": 1204, "val_loss": 66191.5234375} {"train_loss": -5.798439979553223, "global_step": 50610, "epoch": 1205} {"train_loss": -5.577394485473633, "global_step": 50611, "epoch": 1205} {"train_loss": -5.753081321716309, "global_step": 50612, "epoch": 1205} {"train_loss": -5.710347652435303, "global_step": 50613, "epoch": 1205} {"train_loss": -5.773255348205566, "global_step": 50614, "epoch": 1205} {"train_loss": -5.793239116668701, "global_step": 50615, "epoch": 1205} {"train_loss": -5.819433212280273, "global_step": 50616, "epoch": 1205} {"train_loss": -5.726513862609863, "global_step": 50617, "epoch": 1205} {"train_loss": -5.666136741638184, "global_step": 50618, "epoch": 1205} {"train_loss": -5.688432216644287, "global_step": 50619, "epoch": 1205} {"train_loss": -5.691327095031738, "global_step": 50620, "epoch": 1205} {"train_loss": -5.724773406982422, "global_step": 50621, "epoch": 1205} {"train_loss": -5.565232276916504, "global_step": 50622, "epoch": 1205} {"train_loss": -5.769596099853516, "global_step": 50623, "epoch": 1205} {"train_loss": -5.682088851928711, "global_step": 50624, "epoch": 1205} {"train_loss": -5.687442302703857, "global_step": 50625, "epoch": 1205} {"train_loss": -5.700117111206055, "global_step": 50626, "epoch": 1205} {"train_loss": -5.714221000671387, "global_step": 50627, "epoch": 1205} {"train_loss": -5.679067611694336, "global_step": 50628, "epoch": 1205} {"train_loss": -5.825780391693115, "global_step": 50629, "epoch": 1205} {"train_loss": -5.759971618652344, "global_step": 50630, "epoch": 1205} {"train_loss": -5.818863868713379, "global_step": 50631, "epoch": 1205} {"train_loss": -5.847659111022949, "global_step": 50632, "epoch": 1205} {"train_loss": -5.685694217681885, "global_step": 50633, "epoch": 1205} {"train_loss": -5.757287979125977, "global_step": 50634, "epoch": 1205} {"train_loss": -5.795205116271973, "global_step": 50635, "epoch": 1205} {"train_loss": -5.845312118530273, "global_step": 50636, "epoch": 1205} {"train_loss": -5.708626747131348, "global_step": 50637, "epoch": 1205} {"train_loss": -5.725593090057373, "global_step": 50638, "epoch": 1205} {"train_loss": -5.898348808288574, "global_step": 50639, "epoch": 1205} {"train_loss": -5.720516204833984, "global_step": 50640, "epoch": 1205} {"train_loss": -5.8058247566223145, "global_step": 50641, "epoch": 1205} {"train_loss": -5.769146919250488, "global_step": 50642, "epoch": 1205} {"train_loss": -5.840721130371094, "global_step": 50643, "epoch": 1205} {"train_loss": -5.761354446411133, "global_step": 50644, "epoch": 1205} {"train_loss": -5.763926982879639, "global_step": 50645, "epoch": 1205} {"train_loss": -5.727005481719971, "global_step": 50646, "epoch": 1205} {"train_loss": -5.681952476501465, "global_step": 50647, "epoch": 1205} {"train_loss": -5.81374979019165, "global_step": 50648, "epoch": 1205} {"train_loss": -5.815462112426758, "global_step": 50649, "epoch": 1205} {"train_loss": -5.860015869140625, "global_step": 50650, "epoch": 1205} {"train_loss": -5.752240703219459, "global_step": 50651, "epoch": 1205, "val_loss": 66228.3046875} {"train_loss": -5.855797290802002, "global_step": 50652, "epoch": 1206} {"train_loss": -5.72308349609375, "global_step": 50653, "epoch": 1206} {"train_loss": -5.802002906799316, "global_step": 50654, "epoch": 1206} {"train_loss": -5.815585136413574, "global_step": 50655, "epoch": 1206} {"train_loss": -5.821550369262695, "global_step": 50656, "epoch": 1206} {"train_loss": -5.685897350311279, "global_step": 50657, "epoch": 1206} {"train_loss": -5.856990337371826, "global_step": 50658, "epoch": 1206} {"train_loss": -5.871516227722168, "global_step": 50659, "epoch": 1206} {"train_loss": -5.791589260101318, "global_step": 50660, "epoch": 1206} {"train_loss": -5.719006538391113, "global_step": 50661, "epoch": 1206} {"train_loss": -5.825839996337891, "global_step": 50662, "epoch": 1206} {"train_loss": -5.8513994216918945, "global_step": 50663, "epoch": 1206} {"train_loss": -5.611245155334473, "global_step": 50664, "epoch": 1206} {"train_loss": -5.740999221801758, "global_step": 50665, "epoch": 1206} {"train_loss": -5.79290771484375, "global_step": 50666, "epoch": 1206} {"train_loss": -5.714177131652832, "global_step": 50667, "epoch": 1206} {"train_loss": -5.78931999206543, "global_step": 50668, "epoch": 1206} {"train_loss": -5.763431549072266, "global_step": 50669, "epoch": 1206} {"train_loss": -5.922440528869629, "global_step": 50670, "epoch": 1206} {"train_loss": -5.808014392852783, "global_step": 50671, "epoch": 1206} {"train_loss": -5.7964582443237305, "global_step": 50672, "epoch": 1206} {"train_loss": -5.742010116577148, "global_step": 50673, "epoch": 1206} {"train_loss": -5.919107437133789, "global_step": 50674, "epoch": 1206} {"train_loss": -5.777044773101807, "global_step": 50675, "epoch": 1206} {"train_loss": -5.730248928070068, "global_step": 50676, "epoch": 1206} {"train_loss": -5.854955196380615, "global_step": 50677, "epoch": 1206} {"train_loss": -5.792036056518555, "global_step": 50678, "epoch": 1206} {"train_loss": -5.8712615966796875, "global_step": 50679, "epoch": 1206} {"train_loss": -5.557633399963379, "global_step": 50680, "epoch": 1206} {"train_loss": -5.835723876953125, "global_step": 50681, "epoch": 1206} {"train_loss": -5.783580780029297, "global_step": 50682, "epoch": 1206} {"train_loss": -5.816242218017578, "global_step": 50683, "epoch": 1206} {"train_loss": -5.719264030456543, "global_step": 50684, "epoch": 1206} {"train_loss": -5.715215682983398, "global_step": 50685, "epoch": 1206} {"train_loss": -5.681179046630859, "global_step": 50686, "epoch": 1206} {"train_loss": -5.786746025085449, "global_step": 50687, "epoch": 1206} {"train_loss": -5.748961448669434, "global_step": 50688, "epoch": 1206} {"train_loss": -5.87109375, "global_step": 50689, "epoch": 1206} {"train_loss": -5.863603591918945, "global_step": 50690, "epoch": 1206} {"train_loss": -5.819159030914307, "global_step": 50691, "epoch": 1206} {"train_loss": -5.802483558654785, "global_step": 50692, "epoch": 1206} {"train_loss": -5.78718900680542, "global_step": 50693, "epoch": 1206, "val_loss": 66167.171875} {"train_loss": -5.79168176651001, "global_step": 50694, "epoch": 1207} {"train_loss": -5.858110427856445, "global_step": 50695, "epoch": 1207} {"train_loss": -5.752967834472656, "global_step": 50696, "epoch": 1207} {"train_loss": -5.738986015319824, "global_step": 50697, "epoch": 1207} {"train_loss": -5.89546012878418, "global_step": 50698, "epoch": 1207} {"train_loss": -5.776440620422363, "global_step": 50699, "epoch": 1207} {"train_loss": -5.703191757202148, "global_step": 50700, "epoch": 1207} {"train_loss": -5.736295223236084, "global_step": 50701, "epoch": 1207} {"train_loss": -5.82598876953125, "global_step": 50702, "epoch": 1207} {"train_loss": -5.819160461425781, "global_step": 50703, "epoch": 1207} {"train_loss": -5.834320068359375, "global_step": 50704, "epoch": 1207} {"train_loss": -5.7544450759887695, "global_step": 50705, "epoch": 1207} {"train_loss": -5.739959239959717, "global_step": 50706, "epoch": 1207} {"train_loss": -5.758559703826904, "global_step": 50707, "epoch": 1207} {"train_loss": -5.702721118927002, "global_step": 50708, "epoch": 1207} {"train_loss": -5.701143741607666, "global_step": 50709, "epoch": 1207} {"train_loss": -5.704054832458496, "global_step": 50710, "epoch": 1207} {"train_loss": -5.842197895050049, "global_step": 50711, "epoch": 1207} {"train_loss": -5.653547286987305, "global_step": 50712, "epoch": 1207} {"train_loss": -5.770717620849609, "global_step": 50713, "epoch": 1207} {"train_loss": -5.793254375457764, "global_step": 50714, "epoch": 1207} {"train_loss": -5.817699432373047, "global_step": 50715, "epoch": 1207} {"train_loss": -5.791644096374512, "global_step": 50716, "epoch": 1207} {"train_loss": -5.653818130493164, "global_step": 50717, "epoch": 1207} {"train_loss": -5.738883972167969, "global_step": 50718, "epoch": 1207} {"train_loss": -5.703579902648926, "global_step": 50719, "epoch": 1207} {"train_loss": -5.776932716369629, "global_step": 50720, "epoch": 1207} {"train_loss": -5.883848667144775, "global_step": 50721, "epoch": 1207} {"train_loss": -5.599822998046875, "global_step": 50722, "epoch": 1207} {"train_loss": -5.741179466247559, "global_step": 50723, "epoch": 1207} {"train_loss": -5.6792473793029785, "global_step": 50724, "epoch": 1207} {"train_loss": -5.808847427368164, "global_step": 50725, "epoch": 1207} {"train_loss": -5.748427391052246, "global_step": 50726, "epoch": 1207} {"train_loss": -5.642128944396973, "global_step": 50727, "epoch": 1207} {"train_loss": -5.753584861755371, "global_step": 50728, "epoch": 1207} {"train_loss": -5.8080339431762695, "global_step": 50729, "epoch": 1207} {"train_loss": -5.774237155914307, "global_step": 50730, "epoch": 1207} {"train_loss": -5.773641109466553, "global_step": 50731, "epoch": 1207} {"train_loss": -5.785470008850098, "global_step": 50732, "epoch": 1207} {"train_loss": -5.734086990356445, "global_step": 50733, "epoch": 1207} {"train_loss": -5.815622806549072, "global_step": 50734, "epoch": 1207} {"train_loss": -5.760057914824713, "global_step": 50735, "epoch": 1207, "val_loss": 66197.109375} {"train_loss": -5.76353645324707, "global_step": 50736, "epoch": 1208} {"train_loss": -5.750720977783203, "global_step": 50737, "epoch": 1208} {"train_loss": -5.668875217437744, "global_step": 50738, "epoch": 1208} {"train_loss": -5.856534481048584, "global_step": 50739, "epoch": 1208} {"train_loss": -5.77874231338501, "global_step": 50740, "epoch": 1208} {"train_loss": -5.808843612670898, "global_step": 50741, "epoch": 1208} {"train_loss": -5.751954078674316, "global_step": 50742, "epoch": 1208} {"train_loss": -5.8234639167785645, "global_step": 50743, "epoch": 1208} {"train_loss": -5.708844184875488, "global_step": 50744, "epoch": 1208} {"train_loss": -5.641294479370117, "global_step": 50745, "epoch": 1208} {"train_loss": -5.905434608459473, "global_step": 50746, "epoch": 1208} {"train_loss": -5.776460647583008, "global_step": 50747, "epoch": 1208} {"train_loss": -5.708401679992676, "global_step": 50748, "epoch": 1208} {"train_loss": -5.943411827087402, "global_step": 50749, "epoch": 1208} {"train_loss": -5.764958381652832, "global_step": 50750, "epoch": 1208} {"train_loss": -5.751290321350098, "global_step": 50751, "epoch": 1208} {"train_loss": -5.805685043334961, "global_step": 50752, "epoch": 1208} {"train_loss": -5.777649402618408, "global_step": 50753, "epoch": 1208} {"train_loss": -5.864151477813721, "global_step": 50754, "epoch": 1208} {"train_loss": -5.8270978927612305, "global_step": 50755, "epoch": 1208} {"train_loss": -5.784375190734863, "global_step": 50756, "epoch": 1208} {"train_loss": -5.7814178466796875, "global_step": 50757, "epoch": 1208} {"train_loss": -5.716368198394775, "global_step": 50758, "epoch": 1208} {"train_loss": -5.766056537628174, "global_step": 50759, "epoch": 1208} {"train_loss": -5.723408222198486, "global_step": 50760, "epoch": 1208} {"train_loss": -5.751635551452637, "global_step": 50761, "epoch": 1208} {"train_loss": -5.770826816558838, "global_step": 50762, "epoch": 1208} {"train_loss": -5.6522369384765625, "global_step": 50763, "epoch": 1208} {"train_loss": -5.7464704513549805, "global_step": 50764, "epoch": 1208} {"train_loss": -5.841466426849365, "global_step": 50765, "epoch": 1208} {"train_loss": -5.653263092041016, "global_step": 50766, "epoch": 1208} {"train_loss": -5.720333099365234, "global_step": 50767, "epoch": 1208} {"train_loss": -5.6838483810424805, "global_step": 50768, "epoch": 1208} {"train_loss": -5.82996940612793, "global_step": 50769, "epoch": 1208} {"train_loss": -5.795241355895996, "global_step": 50770, "epoch": 1208} {"train_loss": -5.682262897491455, "global_step": 50771, "epoch": 1208} {"train_loss": -5.752668380737305, "global_step": 50772, "epoch": 1208} {"train_loss": -5.7546491622924805, "global_step": 50773, "epoch": 1208} {"train_loss": -5.7914719581604, "global_step": 50774, "epoch": 1208} {"train_loss": -5.555269241333008, "global_step": 50775, "epoch": 1208} {"train_loss": -5.790056228637695, "global_step": 50776, "epoch": 1208} {"train_loss": -5.761445851553054, "global_step": 50777, "epoch": 1208, "val_loss": 66319.359375} {"train_loss": -5.76660680770874, "global_step": 50778, "epoch": 1209} {"train_loss": -5.8946709632873535, "global_step": 50779, "epoch": 1209} {"train_loss": -5.907630920410156, "global_step": 50780, "epoch": 1209} {"train_loss": -5.647344589233398, "global_step": 50781, "epoch": 1209} {"train_loss": -5.753407955169678, "global_step": 50782, "epoch": 1209} {"train_loss": -5.733822822570801, "global_step": 50783, "epoch": 1209} {"train_loss": -5.724229335784912, "global_step": 50784, "epoch": 1209} {"train_loss": -5.73154354095459, "global_step": 50785, "epoch": 1209} {"train_loss": -5.780128479003906, "global_step": 50786, "epoch": 1209} {"train_loss": -5.549764633178711, "global_step": 50787, "epoch": 1209} {"train_loss": -5.86769962310791, "global_step": 50788, "epoch": 1209} {"train_loss": -5.8438615798950195, "global_step": 50789, "epoch": 1209} {"train_loss": -5.733614921569824, "global_step": 50790, "epoch": 1209} {"train_loss": -5.718142032623291, "global_step": 50791, "epoch": 1209} {"train_loss": -5.681129455566406, "global_step": 50792, "epoch": 1209} {"train_loss": -5.649593353271484, "global_step": 50793, "epoch": 1209} {"train_loss": -5.65656852722168, "global_step": 50794, "epoch": 1209} {"train_loss": -5.828734397888184, "global_step": 50795, "epoch": 1209} {"train_loss": -5.635714530944824, "global_step": 50796, "epoch": 1209} {"train_loss": -5.61617374420166, "global_step": 50797, "epoch": 1209} {"train_loss": -5.516267776489258, "global_step": 50798, "epoch": 1209} {"train_loss": -5.6260480880737305, "global_step": 50799, "epoch": 1209} {"train_loss": -5.605181694030762, "global_step": 50800, "epoch": 1209} {"train_loss": -5.701284885406494, "global_step": 50801, "epoch": 1209} {"train_loss": -5.637300491333008, "global_step": 50802, "epoch": 1209} {"train_loss": -5.650298118591309, "global_step": 50803, "epoch": 1209} {"train_loss": -5.702861309051514, "global_step": 50804, "epoch": 1209} {"train_loss": -5.5083465576171875, "global_step": 50805, "epoch": 1209} {"train_loss": -5.660465240478516, "global_step": 50806, "epoch": 1209} {"train_loss": -5.770369052886963, "global_step": 50807, "epoch": 1209} {"train_loss": -5.7352495193481445, "global_step": 50808, "epoch": 1209} {"train_loss": -5.736118316650391, "global_step": 50809, "epoch": 1209} {"train_loss": -5.745822906494141, "global_step": 50810, "epoch": 1209} {"train_loss": -5.691516399383545, "global_step": 50811, "epoch": 1209} {"train_loss": -5.721672058105469, "global_step": 50812, "epoch": 1209} {"train_loss": -5.754429340362549, "global_step": 50813, "epoch": 1209} {"train_loss": -5.766313552856445, "global_step": 50814, "epoch": 1209} {"train_loss": -5.622846603393555, "global_step": 50815, "epoch": 1209} {"train_loss": -5.630917549133301, "global_step": 50816, "epoch": 1209} {"train_loss": -5.804974555969238, "global_step": 50817, "epoch": 1209} {"train_loss": -5.663752555847168, "global_step": 50818, "epoch": 1209} {"train_loss": -5.70768388112386, "global_step": 50819, "epoch": 1209, "val_loss": 66081.3046875} {"train_loss": -5.783110618591309, "global_step": 50820, "epoch": 1210} {"train_loss": -5.64786434173584, "global_step": 50821, "epoch": 1210} {"train_loss": -5.78982400894165, "global_step": 50822, "epoch": 1210} {"train_loss": -5.798525810241699, "global_step": 50823, "epoch": 1210} {"train_loss": -5.70283317565918, "global_step": 50824, "epoch": 1210} {"train_loss": -5.774470329284668, "global_step": 50825, "epoch": 1210} {"train_loss": -5.743309497833252, "global_step": 50826, "epoch": 1210} {"train_loss": -5.752740859985352, "global_step": 50827, "epoch": 1210} {"train_loss": -5.664656162261963, "global_step": 50828, "epoch": 1210} {"train_loss": -5.744918346405029, "global_step": 50829, "epoch": 1210} {"train_loss": -5.617787837982178, "global_step": 50830, "epoch": 1210} {"train_loss": -5.8651275634765625, "global_step": 50831, "epoch": 1210} {"train_loss": -5.628763198852539, "global_step": 50832, "epoch": 1210} {"train_loss": -5.670975208282471, "global_step": 50833, "epoch": 1210} {"train_loss": -5.815030097961426, "global_step": 50834, "epoch": 1210} {"train_loss": -5.777214527130127, "global_step": 50835, "epoch": 1210} {"train_loss": -5.718493938446045, "global_step": 50836, "epoch": 1210} {"train_loss": -5.710680961608887, "global_step": 50837, "epoch": 1210} {"train_loss": -5.7877936363220215, "global_step": 50838, "epoch": 1210} {"train_loss": -5.708756446838379, "global_step": 50839, "epoch": 1210} {"train_loss": -5.685283184051514, "global_step": 50840, "epoch": 1210} {"train_loss": -5.794093132019043, "global_step": 50841, "epoch": 1210} {"train_loss": -5.75618314743042, "global_step": 50842, "epoch": 1210} {"train_loss": -5.834758758544922, "global_step": 50843, "epoch": 1210} {"train_loss": -5.750627517700195, "global_step": 50844, "epoch": 1210} {"train_loss": -5.801963806152344, "global_step": 50845, "epoch": 1210} {"train_loss": -5.698958873748779, "global_step": 50846, "epoch": 1210} {"train_loss": -5.788638114929199, "global_step": 50847, "epoch": 1210} {"train_loss": -5.74162483215332, "global_step": 50848, "epoch": 1210} {"train_loss": -5.702086448669434, "global_step": 50849, "epoch": 1210} {"train_loss": -5.68193244934082, "global_step": 50850, "epoch": 1210} {"train_loss": -5.73015832901001, "global_step": 50851, "epoch": 1210} {"train_loss": -5.716757774353027, "global_step": 50852, "epoch": 1210} {"train_loss": -5.7898736000061035, "global_step": 50853, "epoch": 1210} {"train_loss": -5.775198459625244, "global_step": 50854, "epoch": 1210} {"train_loss": -5.548632621765137, "global_step": 50855, "epoch": 1210} {"train_loss": -5.763698577880859, "global_step": 50856, "epoch": 1210} {"train_loss": -5.749361515045166, "global_step": 50857, "epoch": 1210} {"train_loss": -5.777319431304932, "global_step": 50858, "epoch": 1210} {"train_loss": -5.678126335144043, "global_step": 50859, "epoch": 1210} {"train_loss": -5.659819602966309, "global_step": 50860, "epoch": 1210} {"train_loss": -5.73447661172776, "global_step": 50861, "epoch": 1210, "val_loss": 66237.7109375} {"train_loss": -5.732186794281006, "global_step": 50862, "epoch": 1211} {"train_loss": -5.847873687744141, "global_step": 50863, "epoch": 1211} {"train_loss": -5.7619123458862305, "global_step": 50864, "epoch": 1211} {"train_loss": -5.842163562774658, "global_step": 50865, "epoch": 1211} {"train_loss": -5.686100959777832, "global_step": 50866, "epoch": 1211} {"train_loss": -5.807097911834717, "global_step": 50867, "epoch": 1211} {"train_loss": -5.801911354064941, "global_step": 50868, "epoch": 1211} {"train_loss": -5.781700134277344, "global_step": 50869, "epoch": 1211} {"train_loss": -5.865728855133057, "global_step": 50870, "epoch": 1211} {"train_loss": -5.813690185546875, "global_step": 50871, "epoch": 1211} {"train_loss": -5.744722366333008, "global_step": 50872, "epoch": 1211} {"train_loss": -5.615059852600098, "global_step": 50873, "epoch": 1211} {"train_loss": -5.754133224487305, "global_step": 50874, "epoch": 1211} {"train_loss": -5.930004119873047, "global_step": 50875, "epoch": 1211} {"train_loss": -5.852643966674805, "global_step": 50876, "epoch": 1211} {"train_loss": -5.74520206451416, "global_step": 50877, "epoch": 1211} {"train_loss": -5.767478942871094, "global_step": 50878, "epoch": 1211} {"train_loss": -5.761623859405518, "global_step": 50879, "epoch": 1211} {"train_loss": -5.722865104675293, "global_step": 50880, "epoch": 1211} {"train_loss": -5.794012069702148, "global_step": 50881, "epoch": 1211} {"train_loss": -5.767560958862305, "global_step": 50882, "epoch": 1211} {"train_loss": -5.701417446136475, "global_step": 50883, "epoch": 1211} {"train_loss": -5.753374099731445, "global_step": 50884, "epoch": 1211} {"train_loss": -5.725978851318359, "global_step": 50885, "epoch": 1211} {"train_loss": -5.917008399963379, "global_step": 50886, "epoch": 1211} {"train_loss": -5.696990489959717, "global_step": 50887, "epoch": 1211} {"train_loss": -5.7937541007995605, "global_step": 50888, "epoch": 1211} {"train_loss": -5.7232465744018555, "global_step": 50889, "epoch": 1211} {"train_loss": -5.7725677490234375, "global_step": 50890, "epoch": 1211} {"train_loss": -5.730767250061035, "global_step": 50891, "epoch": 1211} {"train_loss": -5.836141586303711, "global_step": 50892, "epoch": 1211} {"train_loss": -5.807487487792969, "global_step": 50893, "epoch": 1211} {"train_loss": -5.742123603820801, "global_step": 50894, "epoch": 1211} {"train_loss": -5.692044734954834, "global_step": 50895, "epoch": 1211} {"train_loss": -5.688610076904297, "global_step": 50896, "epoch": 1211} {"train_loss": -5.680657386779785, "global_step": 50897, "epoch": 1211} {"train_loss": -5.789671421051025, "global_step": 50898, "epoch": 1211} {"train_loss": -5.784511089324951, "global_step": 50899, "epoch": 1211} {"train_loss": -5.717803478240967, "global_step": 50900, "epoch": 1211} {"train_loss": -5.785337448120117, "global_step": 50901, "epoch": 1211} {"train_loss": -5.8877668380737305, "global_step": 50902, "epoch": 1211} {"train_loss": -5.771793444951375, "global_step": 50903, "epoch": 1211, "val_loss": 66147.375} {"train_loss": -5.751644134521484, "global_step": 50904, "epoch": 1212} {"train_loss": -5.723172187805176, "global_step": 50905, "epoch": 1212} {"train_loss": -5.898315906524658, "global_step": 50906, "epoch": 1212} {"train_loss": -5.6860246658325195, "global_step": 50907, "epoch": 1212} {"train_loss": -5.88327693939209, "global_step": 50908, "epoch": 1212} {"train_loss": -5.7777581214904785, "global_step": 50909, "epoch": 1212} {"train_loss": -5.7790069580078125, "global_step": 50910, "epoch": 1212} {"train_loss": -5.984122276306152, "global_step": 50911, "epoch": 1212} {"train_loss": -5.808540344238281, "global_step": 50912, "epoch": 1212} {"train_loss": -5.758027076721191, "global_step": 50913, "epoch": 1212} {"train_loss": -5.71879768371582, "global_step": 50914, "epoch": 1212} {"train_loss": -5.856224060058594, "global_step": 50915, "epoch": 1212} {"train_loss": -5.72462272644043, "global_step": 50916, "epoch": 1212} {"train_loss": -5.7647809982299805, "global_step": 50917, "epoch": 1212} {"train_loss": -5.792041778564453, "global_step": 50918, "epoch": 1212} {"train_loss": -5.914516448974609, "global_step": 50919, "epoch": 1212} {"train_loss": -5.861719131469727, "global_step": 50920, "epoch": 1212} {"train_loss": -5.7092695236206055, "global_step": 50921, "epoch": 1212} {"train_loss": -5.844252109527588, "global_step": 50922, "epoch": 1212} {"train_loss": -5.756189346313477, "global_step": 50923, "epoch": 1212} {"train_loss": -5.833464622497559, "global_step": 50924, "epoch": 1212} {"train_loss": -5.881879806518555, "global_step": 50925, "epoch": 1212} {"train_loss": -5.750966548919678, "global_step": 50926, "epoch": 1212} {"train_loss": -5.695033550262451, "global_step": 50927, "epoch": 1212} {"train_loss": -5.772505760192871, "global_step": 50928, "epoch": 1212} {"train_loss": -5.920680522918701, "global_step": 50929, "epoch": 1212} {"train_loss": -5.858611106872559, "global_step": 50930, "epoch": 1212} {"train_loss": -5.785987377166748, "global_step": 50931, "epoch": 1212} {"train_loss": -5.74533748626709, "global_step": 50932, "epoch": 1212} {"train_loss": -5.744661808013916, "global_step": 50933, "epoch": 1212} {"train_loss": -5.772893905639648, "global_step": 50934, "epoch": 1212} {"train_loss": -5.645906925201416, "global_step": 50935, "epoch": 1212} {"train_loss": -5.7725324630737305, "global_step": 50936, "epoch": 1212} {"train_loss": -5.8028564453125, "global_step": 50937, "epoch": 1212} {"train_loss": -5.730282306671143, "global_step": 50938, "epoch": 1212} {"train_loss": -5.784160137176514, "global_step": 50939, "epoch": 1212} {"train_loss": -5.670821666717529, "global_step": 50940, "epoch": 1212} {"train_loss": -5.755099296569824, "global_step": 50941, "epoch": 1212} {"train_loss": -5.634294509887695, "global_step": 50942, "epoch": 1212} {"train_loss": -5.750634670257568, "global_step": 50943, "epoch": 1212} {"train_loss": -5.801483154296875, "global_step": 50944, "epoch": 1212} {"train_loss": -5.7815431867327005, "global_step": 50945, "epoch": 1212, "val_loss": 66166.453125} {"train_loss": -5.6860761642456055, "global_step": 50946, "epoch": 1213} {"train_loss": -5.677118301391602, "global_step": 50947, "epoch": 1213} {"train_loss": -5.652301788330078, "global_step": 50948, "epoch": 1213} {"train_loss": -5.7389302253723145, "global_step": 50949, "epoch": 1213} {"train_loss": -5.808480262756348, "global_step": 50950, "epoch": 1213} {"train_loss": -5.791272163391113, "global_step": 50951, "epoch": 1213} {"train_loss": -5.639093399047852, "global_step": 50952, "epoch": 1213} {"train_loss": -5.735342025756836, "global_step": 50953, "epoch": 1213} {"train_loss": -5.7694902420043945, "global_step": 50954, "epoch": 1213} {"train_loss": -5.725349426269531, "global_step": 50955, "epoch": 1213} {"train_loss": -5.813480377197266, "global_step": 50956, "epoch": 1213} {"train_loss": -5.67949104309082, "global_step": 50957, "epoch": 1213} {"train_loss": -5.876650810241699, "global_step": 50958, "epoch": 1213} {"train_loss": -5.83474588394165, "global_step": 50959, "epoch": 1213} {"train_loss": -5.831608772277832, "global_step": 50960, "epoch": 1213} {"train_loss": -5.814059734344482, "global_step": 50961, "epoch": 1213} {"train_loss": -5.7952423095703125, "global_step": 50962, "epoch": 1213} {"train_loss": -5.749383926391602, "global_step": 50963, "epoch": 1213} {"train_loss": -5.847595691680908, "global_step": 50964, "epoch": 1213} {"train_loss": -5.789847373962402, "global_step": 50965, "epoch": 1213} {"train_loss": -5.6568603515625, "global_step": 50966, "epoch": 1213} {"train_loss": -5.847496509552002, "global_step": 50967, "epoch": 1213} {"train_loss": -5.797337532043457, "global_step": 50968, "epoch": 1213} {"train_loss": -5.764107704162598, "global_step": 50969, "epoch": 1213} {"train_loss": -5.872340202331543, "global_step": 50970, "epoch": 1213} {"train_loss": -5.771230697631836, "global_step": 50971, "epoch": 1213} {"train_loss": -5.742486476898193, "global_step": 50972, "epoch": 1213} {"train_loss": -5.715766906738281, "global_step": 50973, "epoch": 1213} {"train_loss": -5.77049446105957, "global_step": 50974, "epoch": 1213} {"train_loss": -5.662507057189941, "global_step": 50975, "epoch": 1213} {"train_loss": -5.786454200744629, "global_step": 50976, "epoch": 1213} {"train_loss": -5.772397994995117, "global_step": 50977, "epoch": 1213} {"train_loss": -5.738238334655762, "global_step": 50978, "epoch": 1213} {"train_loss": -5.810098648071289, "global_step": 50979, "epoch": 1213} {"train_loss": -5.769540786743164, "global_step": 50980, "epoch": 1213} {"train_loss": -5.723357677459717, "global_step": 50981, "epoch": 1213} {"train_loss": -5.755344867706299, "global_step": 50982, "epoch": 1213} {"train_loss": -5.652924060821533, "global_step": 50983, "epoch": 1213} {"train_loss": -5.697066307067871, "global_step": 50984, "epoch": 1213} {"train_loss": -5.741959571838379, "global_step": 50985, "epoch": 1213} {"train_loss": -5.760451793670654, "global_step": 50986, "epoch": 1213} {"train_loss": -5.758300826663063, "global_step": 50987, "epoch": 1213, "val_loss": 66534.09375} {"train_loss": -5.776302814483643, "global_step": 50988, "epoch": 1214} {"train_loss": -5.796205043792725, "global_step": 50989, "epoch": 1214} {"train_loss": -5.803536415100098, "global_step": 50990, "epoch": 1214} {"train_loss": -5.792022705078125, "global_step": 50991, "epoch": 1214} {"train_loss": -5.759286403656006, "global_step": 50992, "epoch": 1214} {"train_loss": -5.788055419921875, "global_step": 50993, "epoch": 1214} {"train_loss": -5.846946716308594, "global_step": 50994, "epoch": 1214} {"train_loss": -5.6966552734375, "global_step": 50995, "epoch": 1214} {"train_loss": -5.744112968444824, "global_step": 50996, "epoch": 1214} {"train_loss": -5.742480278015137, "global_step": 50997, "epoch": 1214} {"train_loss": -5.74077033996582, "global_step": 50998, "epoch": 1214} {"train_loss": -5.748093605041504, "global_step": 50999, "epoch": 1214} {"train_loss": -5.623027801513672, "global_step": 51000, "epoch": 1214} {"train_loss": -5.679088115692139, "global_step": 51001, "epoch": 1214} {"train_loss": -5.834764003753662, "global_step": 51002, "epoch": 1214} {"train_loss": -5.855545997619629, "global_step": 51003, "epoch": 1214} {"train_loss": -5.715214729309082, "global_step": 51004, "epoch": 1214} {"train_loss": -5.7410078048706055, "global_step": 51005, "epoch": 1214} {"train_loss": -5.7712016105651855, "global_step": 51006, "epoch": 1214} {"train_loss": -5.76114559173584, "global_step": 51007, "epoch": 1214} {"train_loss": -5.719579696655273, "global_step": 51008, "epoch": 1214} {"train_loss": -5.889217853546143, "global_step": 51009, "epoch": 1214} {"train_loss": -5.780725479125977, "global_step": 51010, "epoch": 1214} {"train_loss": -5.85569429397583, "global_step": 51011, "epoch": 1214} {"train_loss": -5.727433204650879, "global_step": 51012, "epoch": 1214} {"train_loss": -5.76095724105835, "global_step": 51013, "epoch": 1214} {"train_loss": -5.757448196411133, "global_step": 51014, "epoch": 1214} {"train_loss": -5.629649639129639, "global_step": 51015, "epoch": 1214} {"train_loss": -5.631583213806152, "global_step": 51016, "epoch": 1214} {"train_loss": -5.722573757171631, "global_step": 51017, "epoch": 1214} {"train_loss": -5.820644378662109, "global_step": 51018, "epoch": 1214} {"train_loss": -5.718013763427734, "global_step": 51019, "epoch": 1214} {"train_loss": -5.826215744018555, "global_step": 51020, "epoch": 1214} {"train_loss": -5.765739440917969, "global_step": 51021, "epoch": 1214} {"train_loss": -5.835566520690918, "global_step": 51022, "epoch": 1214} {"train_loss": -5.760563850402832, "global_step": 51023, "epoch": 1214} {"train_loss": -5.775726795196533, "global_step": 51024, "epoch": 1214} {"train_loss": -5.857946395874023, "global_step": 51025, "epoch": 1214} {"train_loss": -5.729033470153809, "global_step": 51026, "epoch": 1214} {"train_loss": -5.682766437530518, "global_step": 51027, "epoch": 1214} {"train_loss": -5.8018341064453125, "global_step": 51028, "epoch": 1214} {"train_loss": -5.760494345710391, "global_step": 51029, "epoch": 1214, "val_loss": 66079.375} {"train_loss": -5.712352752685547, "global_step": 51030, "epoch": 1215} {"train_loss": -5.714818000793457, "global_step": 51031, "epoch": 1215} {"train_loss": -5.817249298095703, "global_step": 51032, "epoch": 1215} {"train_loss": -5.682926177978516, "global_step": 51033, "epoch": 1215} {"train_loss": -5.80279541015625, "global_step": 51034, "epoch": 1215} {"train_loss": -5.802148818969727, "global_step": 51035, "epoch": 1215} {"train_loss": -5.8277716636657715, "global_step": 51036, "epoch": 1215} {"train_loss": -5.815817356109619, "global_step": 51037, "epoch": 1215} {"train_loss": -5.7488298416137695, "global_step": 51038, "epoch": 1215} {"train_loss": -5.8669352531433105, "global_step": 51039, "epoch": 1215} {"train_loss": -5.7029523849487305, "global_step": 51040, "epoch": 1215} {"train_loss": -5.770474433898926, "global_step": 51041, "epoch": 1215} {"train_loss": -5.878815650939941, "global_step": 51042, "epoch": 1215} {"train_loss": -5.683543682098389, "global_step": 51043, "epoch": 1215} {"train_loss": -5.8298845291137695, "global_step": 51044, "epoch": 1215} {"train_loss": -5.801985263824463, "global_step": 51045, "epoch": 1215} {"train_loss": -5.861602306365967, "global_step": 51046, "epoch": 1215} {"train_loss": -5.79072380065918, "global_step": 51047, "epoch": 1215} {"train_loss": -5.757889270782471, "global_step": 51048, "epoch": 1215} {"train_loss": -5.797337532043457, "global_step": 51049, "epoch": 1215} {"train_loss": -5.743412017822266, "global_step": 51050, "epoch": 1215} {"train_loss": -5.652102470397949, "global_step": 51051, "epoch": 1215} {"train_loss": -5.754918098449707, "global_step": 51052, "epoch": 1215} {"train_loss": -5.908327102661133, "global_step": 51053, "epoch": 1215} {"train_loss": -5.784893035888672, "global_step": 51054, "epoch": 1215} {"train_loss": -5.789813041687012, "global_step": 51055, "epoch": 1215} {"train_loss": -5.83479118347168, "global_step": 51056, "epoch": 1215} {"train_loss": -5.776130199432373, "global_step": 51057, "epoch": 1215} {"train_loss": -5.86146354675293, "global_step": 51058, "epoch": 1215} {"train_loss": -5.794183731079102, "global_step": 51059, "epoch": 1215} {"train_loss": -5.680551528930664, "global_step": 51060, "epoch": 1215} {"train_loss": -5.748052597045898, "global_step": 51061, "epoch": 1215} {"train_loss": -5.668770790100098, "global_step": 51062, "epoch": 1215} {"train_loss": -5.665476322174072, "global_step": 51063, "epoch": 1215} {"train_loss": -5.81995153427124, "global_step": 51064, "epoch": 1215} {"train_loss": -5.750515937805176, "global_step": 51065, "epoch": 1215} {"train_loss": -5.676807403564453, "global_step": 51066, "epoch": 1215} {"train_loss": -5.699654579162598, "global_step": 51067, "epoch": 1215} {"train_loss": -5.837647914886475, "global_step": 51068, "epoch": 1215} {"train_loss": -5.810459136962891, "global_step": 51069, "epoch": 1215} {"train_loss": -5.757938385009766, "global_step": 51070, "epoch": 1215} {"train_loss": -5.7748749596732, "global_step": 51071, "epoch": 1215, "val_loss": 66187.2734375} {"train_loss": -5.845348358154297, "global_step": 51072, "epoch": 1216} {"train_loss": -5.7863078117370605, "global_step": 51073, "epoch": 1216} {"train_loss": -5.769252777099609, "global_step": 51074, "epoch": 1216} {"train_loss": -5.797213554382324, "global_step": 51075, "epoch": 1216} {"train_loss": -5.832115173339844, "global_step": 51076, "epoch": 1216} {"train_loss": -5.809548377990723, "global_step": 51077, "epoch": 1216} {"train_loss": -5.777231693267822, "global_step": 51078, "epoch": 1216} {"train_loss": -5.829571723937988, "global_step": 51079, "epoch": 1216} {"train_loss": -5.8421125411987305, "global_step": 51080, "epoch": 1216} {"train_loss": -5.846057891845703, "global_step": 51081, "epoch": 1216} {"train_loss": -5.819169998168945, "global_step": 51082, "epoch": 1216} {"train_loss": -5.902593612670898, "global_step": 51083, "epoch": 1216} {"train_loss": -5.8923869132995605, "global_step": 51084, "epoch": 1216} {"train_loss": -5.846918106079102, "global_step": 51085, "epoch": 1216} {"train_loss": -5.842308044433594, "global_step": 51086, "epoch": 1216} {"train_loss": -5.885485649108887, "global_step": 51087, "epoch": 1216} {"train_loss": -5.846043109893799, "global_step": 51088, "epoch": 1216} {"train_loss": -5.799252510070801, "global_step": 51089, "epoch": 1216} {"train_loss": -5.744353294372559, "global_step": 51090, "epoch": 1216} {"train_loss": -5.695138931274414, "global_step": 51091, "epoch": 1216} {"train_loss": -5.782329559326172, "global_step": 51092, "epoch": 1216} {"train_loss": -5.83531379699707, "global_step": 51093, "epoch": 1216} {"train_loss": -5.748084545135498, "global_step": 51094, "epoch": 1216} {"train_loss": -5.7943572998046875, "global_step": 51095, "epoch": 1216} {"train_loss": -5.677559852600098, "global_step": 51096, "epoch": 1216} {"train_loss": -5.721383094787598, "global_step": 51097, "epoch": 1216} {"train_loss": -5.722012042999268, "global_step": 51098, "epoch": 1216} {"train_loss": -5.590322971343994, "global_step": 51099, "epoch": 1216} {"train_loss": -5.74074125289917, "global_step": 51100, "epoch": 1216} {"train_loss": -5.676501750946045, "global_step": 51101, "epoch": 1216} {"train_loss": -5.593791961669922, "global_step": 51102, "epoch": 1216} {"train_loss": -5.845460891723633, "global_step": 51103, "epoch": 1216} {"train_loss": -5.818397045135498, "global_step": 51104, "epoch": 1216} {"train_loss": -5.620349884033203, "global_step": 51105, "epoch": 1216} {"train_loss": -5.7626752853393555, "global_step": 51106, "epoch": 1216} {"train_loss": -5.823205947875977, "global_step": 51107, "epoch": 1216} {"train_loss": -5.727518081665039, "global_step": 51108, "epoch": 1216} {"train_loss": -5.716487884521484, "global_step": 51109, "epoch": 1216} {"train_loss": -5.778658390045166, "global_step": 51110, "epoch": 1216} {"train_loss": -5.730385780334473, "global_step": 51111, "epoch": 1216} {"train_loss": -5.816372871398926, "global_step": 51112, "epoch": 1216} {"train_loss": -5.780235097521827, "global_step": 51113, "epoch": 1216, "val_loss": 66388.8359375} {"train_loss": -5.741580486297607, "global_step": 51114, "epoch": 1217} {"train_loss": -5.770249366760254, "global_step": 51115, "epoch": 1217} {"train_loss": -5.742616653442383, "global_step": 51116, "epoch": 1217} {"train_loss": -5.785706996917725, "global_step": 51117, "epoch": 1217} {"train_loss": -5.705552577972412, "global_step": 51118, "epoch": 1217} {"train_loss": -5.888099193572998, "global_step": 51119, "epoch": 1217} {"train_loss": -5.760054111480713, "global_step": 51120, "epoch": 1217} {"train_loss": -5.858310699462891, "global_step": 51121, "epoch": 1217} {"train_loss": -5.773784160614014, "global_step": 51122, "epoch": 1217} {"train_loss": -5.741263389587402, "global_step": 51123, "epoch": 1217} {"train_loss": -5.767758369445801, "global_step": 51124, "epoch": 1217} {"train_loss": -5.712491512298584, "global_step": 51125, "epoch": 1217} {"train_loss": -5.797545909881592, "global_step": 51126, "epoch": 1217} {"train_loss": -5.659961223602295, "global_step": 51127, "epoch": 1217} {"train_loss": -5.867012023925781, "global_step": 51128, "epoch": 1217} {"train_loss": -5.738286972045898, "global_step": 51129, "epoch": 1217} {"train_loss": -5.79575777053833, "global_step": 51130, "epoch": 1217} {"train_loss": -5.765721321105957, "global_step": 51131, "epoch": 1217} {"train_loss": -5.769145488739014, "global_step": 51132, "epoch": 1217} {"train_loss": -5.76691198348999, "global_step": 51133, "epoch": 1217} {"train_loss": -5.748456001281738, "global_step": 51134, "epoch": 1217} {"train_loss": -5.730978012084961, "global_step": 51135, "epoch": 1217} {"train_loss": -5.826208114624023, "global_step": 51136, "epoch": 1217} {"train_loss": -5.684930801391602, "global_step": 51137, "epoch": 1217} {"train_loss": -5.7801513671875, "global_step": 51138, "epoch": 1217} {"train_loss": -5.720521926879883, "global_step": 51139, "epoch": 1217} {"train_loss": -5.6898193359375, "global_step": 51140, "epoch": 1217} {"train_loss": -5.7875165939331055, "global_step": 51141, "epoch": 1217} {"train_loss": -5.700047492980957, "global_step": 51142, "epoch": 1217} {"train_loss": -5.66717529296875, "global_step": 51143, "epoch": 1217} {"train_loss": -5.742181777954102, "global_step": 51144, "epoch": 1217} {"train_loss": -5.671568393707275, "global_step": 51145, "epoch": 1217} {"train_loss": -5.670529842376709, "global_step": 51146, "epoch": 1217} {"train_loss": -5.788122653961182, "global_step": 51147, "epoch": 1217} {"train_loss": -5.85552978515625, "global_step": 51148, "epoch": 1217} {"train_loss": -5.918947219848633, "global_step": 51149, "epoch": 1217} {"train_loss": -5.687931060791016, "global_step": 51150, "epoch": 1217} {"train_loss": -5.820248126983643, "global_step": 51151, "epoch": 1217} {"train_loss": -5.7551774978637695, "global_step": 51152, "epoch": 1217} {"train_loss": -5.786250114440918, "global_step": 51153, "epoch": 1217} {"train_loss": -5.651103496551514, "global_step": 51154, "epoch": 1217} {"train_loss": -5.759454011917114, "global_step": 51155, "epoch": 1217, "val_loss": 66367.328125} {"train_loss": -5.813081741333008, "global_step": 51156, "epoch": 1218} {"train_loss": -5.806732177734375, "global_step": 51157, "epoch": 1218} {"train_loss": -5.798806190490723, "global_step": 51158, "epoch": 1218} {"train_loss": -5.797704696655273, "global_step": 51159, "epoch": 1218} {"train_loss": -5.655646800994873, "global_step": 51160, "epoch": 1218} {"train_loss": -5.865451335906982, "global_step": 51161, "epoch": 1218} {"train_loss": -5.667680740356445, "global_step": 51162, "epoch": 1218} {"train_loss": -5.7788286209106445, "global_step": 51163, "epoch": 1218} {"train_loss": -5.7689690589904785, "global_step": 51164, "epoch": 1218} {"train_loss": -5.731532096862793, "global_step": 51165, "epoch": 1218} {"train_loss": -5.742433071136475, "global_step": 51166, "epoch": 1218} {"train_loss": -5.796478748321533, "global_step": 51167, "epoch": 1218} {"train_loss": -5.659916877746582, "global_step": 51168, "epoch": 1218} {"train_loss": -5.740509033203125, "global_step": 51169, "epoch": 1218} {"train_loss": -5.669821739196777, "global_step": 51170, "epoch": 1218} {"train_loss": -5.709391117095947, "global_step": 51171, "epoch": 1218} {"train_loss": -5.7756876945495605, "global_step": 51172, "epoch": 1218} {"train_loss": -5.798555374145508, "global_step": 51173, "epoch": 1218} {"train_loss": -5.781942367553711, "global_step": 51174, "epoch": 1218} {"train_loss": -5.808931350708008, "global_step": 51175, "epoch": 1218} {"train_loss": -5.900174140930176, "global_step": 51176, "epoch": 1218} {"train_loss": -5.876091480255127, "global_step": 51177, "epoch": 1218} {"train_loss": -5.817302703857422, "global_step": 51178, "epoch": 1218} {"train_loss": -5.701467037200928, "global_step": 51179, "epoch": 1218} {"train_loss": -5.774101734161377, "global_step": 51180, "epoch": 1218} {"train_loss": -5.775753974914551, "global_step": 51181, "epoch": 1218} {"train_loss": -5.6996355056762695, "global_step": 51182, "epoch": 1218} {"train_loss": -5.683130264282227, "global_step": 51183, "epoch": 1218} {"train_loss": -5.829853057861328, "global_step": 51184, "epoch": 1218} {"train_loss": -5.788802623748779, "global_step": 51185, "epoch": 1218} {"train_loss": -5.80739164352417, "global_step": 51186, "epoch": 1218} {"train_loss": -5.704152584075928, "global_step": 51187, "epoch": 1218} {"train_loss": -5.714754104614258, "global_step": 51188, "epoch": 1218} {"train_loss": -5.7477569580078125, "global_step": 51189, "epoch": 1218} {"train_loss": -5.557361125946045, "global_step": 51190, "epoch": 1218} {"train_loss": -5.63344669342041, "global_step": 51191, "epoch": 1218} {"train_loss": -5.715034008026123, "global_step": 51192, "epoch": 1218} {"train_loss": -5.725510597229004, "global_step": 51193, "epoch": 1218} {"train_loss": -5.71773099899292, "global_step": 51194, "epoch": 1218} {"train_loss": -5.744457244873047, "global_step": 51195, "epoch": 1218} {"train_loss": -5.6320719718933105, "global_step": 51196, "epoch": 1218} {"train_loss": -5.745771601086571, "global_step": 51197, "epoch": 1218, "val_loss": 66103.5} {"train_loss": -5.748919486999512, "global_step": 51198, "epoch": 1219} {"train_loss": -5.619150638580322, "global_step": 51199, "epoch": 1219} {"train_loss": -5.734724044799805, "global_step": 51200, "epoch": 1219} {"train_loss": -5.699331283569336, "global_step": 51201, "epoch": 1219} {"train_loss": -5.858076572418213, "global_step": 51202, "epoch": 1219} {"train_loss": -5.809428691864014, "global_step": 51203, "epoch": 1219} {"train_loss": -5.884589195251465, "global_step": 51204, "epoch": 1219} {"train_loss": -5.742124080657959, "global_step": 51205, "epoch": 1219} {"train_loss": -5.829298496246338, "global_step": 51206, "epoch": 1219} {"train_loss": -5.7760772705078125, "global_step": 51207, "epoch": 1219} {"train_loss": -5.765105247497559, "global_step": 51208, "epoch": 1219} {"train_loss": -5.827136039733887, "global_step": 51209, "epoch": 1219} {"train_loss": -5.670838356018066, "global_step": 51210, "epoch": 1219} {"train_loss": -5.772549629211426, "global_step": 51211, "epoch": 1219} {"train_loss": -5.855459213256836, "global_step": 51212, "epoch": 1219} {"train_loss": -5.821390151977539, "global_step": 51213, "epoch": 1219} {"train_loss": -5.752967834472656, "global_step": 51214, "epoch": 1219} {"train_loss": -5.688248634338379, "global_step": 51215, "epoch": 1219} {"train_loss": -5.704678058624268, "global_step": 51216, "epoch": 1219} {"train_loss": -5.750838756561279, "global_step": 51217, "epoch": 1219} {"train_loss": -5.812823295593262, "global_step": 51218, "epoch": 1219} {"train_loss": -5.734253883361816, "global_step": 51219, "epoch": 1219} {"train_loss": -5.835163116455078, "global_step": 51220, "epoch": 1219} {"train_loss": -5.729034423828125, "global_step": 51221, "epoch": 1219} {"train_loss": -5.8685736656188965, "global_step": 51222, "epoch": 1219} {"train_loss": -5.719829082489014, "global_step": 51223, "epoch": 1219} {"train_loss": -5.7031755447387695, "global_step": 51224, "epoch": 1219} {"train_loss": -5.857889175415039, "global_step": 51225, "epoch": 1219} {"train_loss": -5.738645553588867, "global_step": 51226, "epoch": 1219} {"train_loss": -5.781833648681641, "global_step": 51227, "epoch": 1219} {"train_loss": -5.853139400482178, "global_step": 51228, "epoch": 1219} {"train_loss": -5.853952407836914, "global_step": 51229, "epoch": 1219} {"train_loss": -5.849601745605469, "global_step": 51230, "epoch": 1219} {"train_loss": -5.822055339813232, "global_step": 51231, "epoch": 1219} {"train_loss": -5.755289077758789, "global_step": 51232, "epoch": 1219} {"train_loss": -5.662318229675293, "global_step": 51233, "epoch": 1219} {"train_loss": -5.761263847351074, "global_step": 51234, "epoch": 1219} {"train_loss": -5.850853443145752, "global_step": 51235, "epoch": 1219} {"train_loss": -5.616455078125, "global_step": 51236, "epoch": 1219} {"train_loss": -5.718263626098633, "global_step": 51237, "epoch": 1219} {"train_loss": -5.917426109313965, "global_step": 51238, "epoch": 1219} {"train_loss": -5.770967426754179, "global_step": 51239, "epoch": 1219, "val_loss": 66225.2265625} {"train_loss": -5.80314826965332, "global_step": 51240, "epoch": 1220} {"train_loss": -5.997343063354492, "global_step": 51241, "epoch": 1220} {"train_loss": -5.799015998840332, "global_step": 51242, "epoch": 1220} {"train_loss": -5.817477703094482, "global_step": 51243, "epoch": 1220} {"train_loss": -5.832481384277344, "global_step": 51244, "epoch": 1220} {"train_loss": -5.784168243408203, "global_step": 51245, "epoch": 1220} {"train_loss": -5.745028495788574, "global_step": 51246, "epoch": 1220} {"train_loss": -5.745107173919678, "global_step": 51247, "epoch": 1220} {"train_loss": -5.733729839324951, "global_step": 51248, "epoch": 1220} {"train_loss": -5.754936218261719, "global_step": 51249, "epoch": 1220} {"train_loss": -5.726961135864258, "global_step": 51250, "epoch": 1220} {"train_loss": -5.745675086975098, "global_step": 51251, "epoch": 1220} {"train_loss": -5.77606725692749, "global_step": 51252, "epoch": 1220} {"train_loss": -5.838959693908691, "global_step": 51253, "epoch": 1220} {"train_loss": -5.812161445617676, "global_step": 51254, "epoch": 1220} {"train_loss": -5.773991584777832, "global_step": 51255, "epoch": 1220} {"train_loss": -5.810939788818359, "global_step": 51256, "epoch": 1220} {"train_loss": -5.766809463500977, "global_step": 51257, "epoch": 1220} {"train_loss": -5.879358291625977, "global_step": 51258, "epoch": 1220} {"train_loss": -5.785430908203125, "global_step": 51259, "epoch": 1220} {"train_loss": -5.769522666931152, "global_step": 51260, "epoch": 1220} {"train_loss": -5.876358985900879, "global_step": 51261, "epoch": 1220} {"train_loss": -5.819573402404785, "global_step": 51262, "epoch": 1220} {"train_loss": -5.841672897338867, "global_step": 51263, "epoch": 1220} {"train_loss": -5.748140335083008, "global_step": 51264, "epoch": 1220} {"train_loss": -5.770421504974365, "global_step": 51265, "epoch": 1220} {"train_loss": -5.7759552001953125, "global_step": 51266, "epoch": 1220} {"train_loss": -5.860569000244141, "global_step": 51267, "epoch": 1220} {"train_loss": -5.659939289093018, "global_step": 51268, "epoch": 1220} {"train_loss": -5.781498908996582, "global_step": 51269, "epoch": 1220} {"train_loss": -5.801630973815918, "global_step": 51270, "epoch": 1220} {"train_loss": -5.675403594970703, "global_step": 51271, "epoch": 1220} {"train_loss": -5.79221248626709, "global_step": 51272, "epoch": 1220} {"train_loss": -5.7947235107421875, "global_step": 51273, "epoch": 1220} {"train_loss": -5.611038684844971, "global_step": 51274, "epoch": 1220} {"train_loss": -5.712705135345459, "global_step": 51275, "epoch": 1220} {"train_loss": -5.80265998840332, "global_step": 51276, "epoch": 1220} {"train_loss": -5.859525203704834, "global_step": 51277, "epoch": 1220} {"train_loss": -5.6973371505737305, "global_step": 51278, "epoch": 1220} {"train_loss": -5.655391693115234, "global_step": 51279, "epoch": 1220} {"train_loss": -5.774572372436523, "global_step": 51280, "epoch": 1220} {"train_loss": -5.779085658845448, "global_step": 51281, "epoch": 1220, "val_loss": 66102.9609375} {"train_loss": -5.726020336151123, "global_step": 51282, "epoch": 1221} {"train_loss": -5.660240173339844, "global_step": 51283, "epoch": 1221} {"train_loss": -5.612129211425781, "global_step": 51284, "epoch": 1221} {"train_loss": -5.8794355392456055, "global_step": 51285, "epoch": 1221} {"train_loss": -5.684584617614746, "global_step": 51286, "epoch": 1221} {"train_loss": -5.726419925689697, "global_step": 51287, "epoch": 1221} {"train_loss": -5.718385696411133, "global_step": 51288, "epoch": 1221} {"train_loss": -5.654382705688477, "global_step": 51289, "epoch": 1221} {"train_loss": -5.708196640014648, "global_step": 51290, "epoch": 1221} {"train_loss": -5.782315731048584, "global_step": 51291, "epoch": 1221} {"train_loss": -5.785529136657715, "global_step": 51292, "epoch": 1221} {"train_loss": -5.84098482131958, "global_step": 51293, "epoch": 1221} {"train_loss": -5.758548736572266, "global_step": 51294, "epoch": 1221} {"train_loss": -5.769576549530029, "global_step": 51295, "epoch": 1221} {"train_loss": -5.645374774932861, "global_step": 51296, "epoch": 1221} {"train_loss": -5.805332660675049, "global_step": 51297, "epoch": 1221} {"train_loss": -5.819381237030029, "global_step": 51298, "epoch": 1221} {"train_loss": -5.941303730010986, "global_step": 51299, "epoch": 1221} {"train_loss": -5.726784706115723, "global_step": 51300, "epoch": 1221} {"train_loss": -5.686521530151367, "global_step": 51301, "epoch": 1221} {"train_loss": -5.688261985778809, "global_step": 51302, "epoch": 1221} {"train_loss": -5.704957485198975, "global_step": 51303, "epoch": 1221} {"train_loss": -5.679008483886719, "global_step": 51304, "epoch": 1221} {"train_loss": -5.804712772369385, "global_step": 51305, "epoch": 1221} {"train_loss": -5.761155128479004, "global_step": 51306, "epoch": 1221} {"train_loss": -5.815608024597168, "global_step": 51307, "epoch": 1221} {"train_loss": -5.714360237121582, "global_step": 51308, "epoch": 1221} {"train_loss": -5.679891586303711, "global_step": 51309, "epoch": 1221} {"train_loss": -5.747387886047363, "global_step": 51310, "epoch": 1221} {"train_loss": -5.866142272949219, "global_step": 51311, "epoch": 1221} {"train_loss": -5.72664737701416, "global_step": 51312, "epoch": 1221} {"train_loss": -5.534669876098633, "global_step": 51313, "epoch": 1221} {"train_loss": -5.669368267059326, "global_step": 51314, "epoch": 1221} {"train_loss": -5.913246154785156, "global_step": 51315, "epoch": 1221} {"train_loss": -5.778798580169678, "global_step": 51316, "epoch": 1221} {"train_loss": -5.68997859954834, "global_step": 51317, "epoch": 1221} {"train_loss": -5.771793365478516, "global_step": 51318, "epoch": 1221} {"train_loss": -5.763871192932129, "global_step": 51319, "epoch": 1221} {"train_loss": -5.715806484222412, "global_step": 51320, "epoch": 1221} {"train_loss": -5.866802215576172, "global_step": 51321, "epoch": 1221} {"train_loss": -5.745478630065918, "global_step": 51322, "epoch": 1221} {"train_loss": -5.749518280937558, "global_step": 51323, "epoch": 1221, "val_loss": 66109.484375} {"train_loss": -5.735841751098633, "global_step": 51324, "epoch": 1222} {"train_loss": -5.805562973022461, "global_step": 51325, "epoch": 1222} {"train_loss": -5.765097618103027, "global_step": 51326, "epoch": 1222} {"train_loss": -5.851762294769287, "global_step": 51327, "epoch": 1222} {"train_loss": -5.889508247375488, "global_step": 51328, "epoch": 1222} {"train_loss": -5.6879425048828125, "global_step": 51329, "epoch": 1222} {"train_loss": -5.667121887207031, "global_step": 51330, "epoch": 1222} {"train_loss": -5.722743988037109, "global_step": 51331, "epoch": 1222} {"train_loss": -5.70682954788208, "global_step": 51332, "epoch": 1222} {"train_loss": -5.773711204528809, "global_step": 51333, "epoch": 1222} {"train_loss": -5.791288375854492, "global_step": 51334, "epoch": 1222} {"train_loss": -5.824601173400879, "global_step": 51335, "epoch": 1222} {"train_loss": -5.789357662200928, "global_step": 51336, "epoch": 1222} {"train_loss": -5.757713794708252, "global_step": 51337, "epoch": 1222} {"train_loss": -5.833397388458252, "global_step": 51338, "epoch": 1222} {"train_loss": -5.824268341064453, "global_step": 51339, "epoch": 1222} {"train_loss": -5.761188983917236, "global_step": 51340, "epoch": 1222} {"train_loss": -5.829013347625732, "global_step": 51341, "epoch": 1222} {"train_loss": -5.7215471267700195, "global_step": 51342, "epoch": 1222} {"train_loss": -5.740394592285156, "global_step": 51343, "epoch": 1222} {"train_loss": -5.631748676300049, "global_step": 51344, "epoch": 1222} {"train_loss": -5.742769718170166, "global_step": 51345, "epoch": 1222} {"train_loss": -5.755087852478027, "global_step": 51346, "epoch": 1222} {"train_loss": -5.688803672790527, "global_step": 51347, "epoch": 1222} {"train_loss": -5.7360944747924805, "global_step": 51348, "epoch": 1222} {"train_loss": -5.738467216491699, "global_step": 51349, "epoch": 1222} {"train_loss": -5.761602401733398, "global_step": 51350, "epoch": 1222} {"train_loss": -5.571718215942383, "global_step": 51351, "epoch": 1222} {"train_loss": -5.717796802520752, "global_step": 51352, "epoch": 1222} {"train_loss": -5.819801330566406, "global_step": 51353, "epoch": 1222} {"train_loss": -5.762956619262695, "global_step": 51354, "epoch": 1222} {"train_loss": -5.55313777923584, "global_step": 51355, "epoch": 1222} {"train_loss": -5.807483196258545, "global_step": 51356, "epoch": 1222} {"train_loss": -5.707021713256836, "global_step": 51357, "epoch": 1222} {"train_loss": -5.798634052276611, "global_step": 51358, "epoch": 1222} {"train_loss": -5.774828910827637, "global_step": 51359, "epoch": 1222} {"train_loss": -5.783358097076416, "global_step": 51360, "epoch": 1222} {"train_loss": -5.879161834716797, "global_step": 51361, "epoch": 1222} {"train_loss": -5.8938889503479, "global_step": 51362, "epoch": 1222} {"train_loss": -5.750703811645508, "global_step": 51363, "epoch": 1222} {"train_loss": -5.702795505523682, "global_step": 51364, "epoch": 1222} {"train_loss": -5.75739236105056, "global_step": 51365, "epoch": 1222, "val_loss": 66160.03125} {"train_loss": -5.726520538330078, "global_step": 51366, "epoch": 1223} {"train_loss": -5.685873985290527, "global_step": 51367, "epoch": 1223} {"train_loss": -5.654450416564941, "global_step": 51368, "epoch": 1223} {"train_loss": -5.794954776763916, "global_step": 51369, "epoch": 1223} {"train_loss": -5.801205635070801, "global_step": 51370, "epoch": 1223} {"train_loss": -5.871573448181152, "global_step": 51371, "epoch": 1223} {"train_loss": -5.699643135070801, "global_step": 51372, "epoch": 1223} {"train_loss": -5.807755470275879, "global_step": 51373, "epoch": 1223} {"train_loss": -5.825531005859375, "global_step": 51374, "epoch": 1223} {"train_loss": -5.767577171325684, "global_step": 51375, "epoch": 1223} {"train_loss": -5.7827911376953125, "global_step": 51376, "epoch": 1223} {"train_loss": -5.609043121337891, "global_step": 51377, "epoch": 1223} {"train_loss": -5.805237293243408, "global_step": 51378, "epoch": 1223} {"train_loss": -5.801094055175781, "global_step": 51379, "epoch": 1223} {"train_loss": -5.758666038513184, "global_step": 51380, "epoch": 1223} {"train_loss": -5.819085121154785, "global_step": 51381, "epoch": 1223} {"train_loss": -5.634424686431885, "global_step": 51382, "epoch": 1223} {"train_loss": -5.902227878570557, "global_step": 51383, "epoch": 1223} {"train_loss": -5.643045425415039, "global_step": 51384, "epoch": 1223} {"train_loss": -5.7519659996032715, "global_step": 51385, "epoch": 1223} {"train_loss": -5.728280067443848, "global_step": 51386, "epoch": 1223} {"train_loss": -5.7649736404418945, "global_step": 51387, "epoch": 1223} {"train_loss": -5.757636070251465, "global_step": 51388, "epoch": 1223} {"train_loss": -5.742286682128906, "global_step": 51389, "epoch": 1223} {"train_loss": -5.819672584533691, "global_step": 51390, "epoch": 1223} {"train_loss": -5.836752891540527, "global_step": 51391, "epoch": 1223} {"train_loss": -5.73370361328125, "global_step": 51392, "epoch": 1223} {"train_loss": -5.814515113830566, "global_step": 51393, "epoch": 1223} {"train_loss": -5.844327449798584, "global_step": 51394, "epoch": 1223} {"train_loss": -5.692379951477051, "global_step": 51395, "epoch": 1223} {"train_loss": -5.830284595489502, "global_step": 51396, "epoch": 1223} {"train_loss": -5.847090721130371, "global_step": 51397, "epoch": 1223} {"train_loss": -5.733719348907471, "global_step": 51398, "epoch": 1223} {"train_loss": -5.727874755859375, "global_step": 51399, "epoch": 1223} {"train_loss": -5.787548065185547, "global_step": 51400, "epoch": 1223} {"train_loss": -5.770294189453125, "global_step": 51401, "epoch": 1223} {"train_loss": -5.75178861618042, "global_step": 51402, "epoch": 1223} {"train_loss": -5.685466289520264, "global_step": 51403, "epoch": 1223} {"train_loss": -5.735500335693359, "global_step": 51404, "epoch": 1223} {"train_loss": -5.655772686004639, "global_step": 51405, "epoch": 1223} {"train_loss": -5.653536319732666, "global_step": 51406, "epoch": 1223} {"train_loss": -5.75859302566165, "global_step": 51407, "epoch": 1223, "val_loss": 66309.21875} {"train_loss": -5.880987167358398, "global_step": 51408, "epoch": 1224} {"train_loss": -5.658135414123535, "global_step": 51409, "epoch": 1224} {"train_loss": -5.725507736206055, "global_step": 51410, "epoch": 1224} {"train_loss": -5.724976539611816, "global_step": 51411, "epoch": 1224} {"train_loss": -5.6805100440979, "global_step": 51412, "epoch": 1224} {"train_loss": -5.913754463195801, "global_step": 51413, "epoch": 1224} {"train_loss": -5.599765777587891, "global_step": 51414, "epoch": 1224} {"train_loss": -5.78720235824585, "global_step": 51415, "epoch": 1224} {"train_loss": -5.653463840484619, "global_step": 51416, "epoch": 1224} {"train_loss": -5.677179336547852, "global_step": 51417, "epoch": 1224} {"train_loss": -5.756455898284912, "global_step": 51418, "epoch": 1224} {"train_loss": -5.699130535125732, "global_step": 51419, "epoch": 1224} {"train_loss": -5.762500762939453, "global_step": 51420, "epoch": 1224} {"train_loss": -5.697526931762695, "global_step": 51421, "epoch": 1224} {"train_loss": -5.675422668457031, "global_step": 51422, "epoch": 1224} {"train_loss": -5.81199312210083, "global_step": 51423, "epoch": 1224} {"train_loss": -5.76448917388916, "global_step": 51424, "epoch": 1224} {"train_loss": -5.614097595214844, "global_step": 51425, "epoch": 1224} {"train_loss": -5.617020606994629, "global_step": 51426, "epoch": 1224} {"train_loss": -5.689029693603516, "global_step": 51427, "epoch": 1224} {"train_loss": -5.628087997436523, "global_step": 51428, "epoch": 1224} {"train_loss": -5.795529365539551, "global_step": 51429, "epoch": 1224} {"train_loss": -5.6143646240234375, "global_step": 51430, "epoch": 1224} {"train_loss": -5.8368821144104, "global_step": 51431, "epoch": 1224} {"train_loss": -5.720287322998047, "global_step": 51432, "epoch": 1224} {"train_loss": -5.710944652557373, "global_step": 51433, "epoch": 1224} {"train_loss": -5.787667274475098, "global_step": 51434, "epoch": 1224} {"train_loss": -5.728046417236328, "global_step": 51435, "epoch": 1224} {"train_loss": -5.662186145782471, "global_step": 51436, "epoch": 1224} {"train_loss": -5.764019966125488, "global_step": 51437, "epoch": 1224} {"train_loss": -5.858221530914307, "global_step": 51438, "epoch": 1224} {"train_loss": -5.6329169273376465, "global_step": 51439, "epoch": 1224} {"train_loss": -5.6962571144104, "global_step": 51440, "epoch": 1224} {"train_loss": -5.711613655090332, "global_step": 51441, "epoch": 1224} {"train_loss": -5.567561626434326, "global_step": 51442, "epoch": 1224} {"train_loss": -5.693279266357422, "global_step": 51443, "epoch": 1224} {"train_loss": -5.699683666229248, "global_step": 51444, "epoch": 1224} {"train_loss": -5.752285957336426, "global_step": 51445, "epoch": 1224} {"train_loss": -5.663902282714844, "global_step": 51446, "epoch": 1224} {"train_loss": -5.85727071762085, "global_step": 51447, "epoch": 1224} {"train_loss": -5.649794101715088, "global_step": 51448, "epoch": 1224} {"train_loss": -5.718064342226301, "global_step": 51449, "epoch": 1224, "val_loss": 66371.7421875} {"train_loss": -5.783957481384277, "global_step": 51450, "epoch": 1225} {"train_loss": -5.758229732513428, "global_step": 51451, "epoch": 1225} {"train_loss": -5.628790855407715, "global_step": 51452, "epoch": 1225} {"train_loss": -5.624879837036133, "global_step": 51453, "epoch": 1225} {"train_loss": -5.741156578063965, "global_step": 51454, "epoch": 1225} {"train_loss": -5.697601318359375, "global_step": 51455, "epoch": 1225} {"train_loss": -5.7879228591918945, "global_step": 51456, "epoch": 1225} {"train_loss": -5.7610883712768555, "global_step": 51457, "epoch": 1225} {"train_loss": -5.806787490844727, "global_step": 51458, "epoch": 1225} {"train_loss": -5.783186912536621, "global_step": 51459, "epoch": 1225} {"train_loss": -5.655265808105469, "global_step": 51460, "epoch": 1225} {"train_loss": -5.812154769897461, "global_step": 51461, "epoch": 1225} {"train_loss": -5.848062515258789, "global_step": 51462, "epoch": 1225} {"train_loss": -5.797831058502197, "global_step": 51463, "epoch": 1225} {"train_loss": -5.77923583984375, "global_step": 51464, "epoch": 1225} {"train_loss": -5.715358734130859, "global_step": 51465, "epoch": 1225} {"train_loss": -5.697835922241211, "global_step": 51466, "epoch": 1225} {"train_loss": -5.676074028015137, "global_step": 51467, "epoch": 1225} {"train_loss": -5.845719814300537, "global_step": 51468, "epoch": 1225} {"train_loss": -5.755061626434326, "global_step": 51469, "epoch": 1225} {"train_loss": -5.755456924438477, "global_step": 51470, "epoch": 1225} {"train_loss": -5.719600677490234, "global_step": 51471, "epoch": 1225} {"train_loss": -5.752634525299072, "global_step": 51472, "epoch": 1225} {"train_loss": -5.8021039962768555, "global_step": 51473, "epoch": 1225} {"train_loss": -5.6578216552734375, "global_step": 51474, "epoch": 1225} {"train_loss": -5.702433109283447, "global_step": 51475, "epoch": 1225} {"train_loss": -5.871284484863281, "global_step": 51476, "epoch": 1225} {"train_loss": -5.685671806335449, "global_step": 51477, "epoch": 1225} {"train_loss": -5.774048328399658, "global_step": 51478, "epoch": 1225} {"train_loss": -5.754169940948486, "global_step": 51479, "epoch": 1225} {"train_loss": -5.817615509033203, "global_step": 51480, "epoch": 1225} {"train_loss": -5.879168510437012, "global_step": 51481, "epoch": 1225} {"train_loss": -5.8278350830078125, "global_step": 51482, "epoch": 1225} {"train_loss": -5.810297966003418, "global_step": 51483, "epoch": 1225} {"train_loss": -5.825044631958008, "global_step": 51484, "epoch": 1225} {"train_loss": -5.813918113708496, "global_step": 51485, "epoch": 1225} {"train_loss": -5.80879020690918, "global_step": 51486, "epoch": 1225} {"train_loss": -5.719758987426758, "global_step": 51487, "epoch": 1225} {"train_loss": -5.720818519592285, "global_step": 51488, "epoch": 1225} {"train_loss": -5.781503677368164, "global_step": 51489, "epoch": 1225} {"train_loss": -5.819642543792725, "global_step": 51490, "epoch": 1225} {"train_loss": -5.759534302211943, "global_step": 51491, "epoch": 1225, "val_loss": 66201.6875} {"train_loss": -5.931252479553223, "global_step": 51492, "epoch": 1226} {"train_loss": -5.741528034210205, "global_step": 51493, "epoch": 1226} {"train_loss": -5.913908958435059, "global_step": 51494, "epoch": 1226} {"train_loss": -5.7206830978393555, "global_step": 51495, "epoch": 1226} {"train_loss": -5.811759948730469, "global_step": 51496, "epoch": 1226} {"train_loss": -5.781466960906982, "global_step": 51497, "epoch": 1226} {"train_loss": -5.8035125732421875, "global_step": 51498, "epoch": 1226} {"train_loss": -5.979534149169922, "global_step": 51499, "epoch": 1226} {"train_loss": -5.853243827819824, "global_step": 51500, "epoch": 1226} {"train_loss": -5.7182817459106445, "global_step": 51501, "epoch": 1226} {"train_loss": -5.754342079162598, "global_step": 51502, "epoch": 1226} {"train_loss": -5.814452648162842, "global_step": 51503, "epoch": 1226} {"train_loss": -5.887485980987549, "global_step": 51504, "epoch": 1226} {"train_loss": -5.841005325317383, "global_step": 51505, "epoch": 1226} {"train_loss": -5.799141883850098, "global_step": 51506, "epoch": 1226} {"train_loss": -5.77479887008667, "global_step": 51507, "epoch": 1226} {"train_loss": -5.771947860717773, "global_step": 51508, "epoch": 1226} {"train_loss": -5.778953552246094, "global_step": 51509, "epoch": 1226} {"train_loss": -5.852819919586182, "global_step": 51510, "epoch": 1226} {"train_loss": -5.86207389831543, "global_step": 51511, "epoch": 1226} {"train_loss": -5.83551025390625, "global_step": 51512, "epoch": 1226} {"train_loss": -5.7013092041015625, "global_step": 51513, "epoch": 1226} {"train_loss": -5.7646260261535645, "global_step": 51514, "epoch": 1226} {"train_loss": -5.817322731018066, "global_step": 51515, "epoch": 1226} {"train_loss": -5.63276481628418, "global_step": 51516, "epoch": 1226} {"train_loss": -5.658235549926758, "global_step": 51517, "epoch": 1226} {"train_loss": -5.7046942710876465, "global_step": 51518, "epoch": 1226} {"train_loss": -5.74528694152832, "global_step": 51519, "epoch": 1226} {"train_loss": -5.755794048309326, "global_step": 51520, "epoch": 1226} {"train_loss": -5.744881629943848, "global_step": 51521, "epoch": 1226} {"train_loss": -5.817037582397461, "global_step": 51522, "epoch": 1226} {"train_loss": -5.770124435424805, "global_step": 51523, "epoch": 1226} {"train_loss": -5.765226364135742, "global_step": 51524, "epoch": 1226} {"train_loss": -5.842247009277344, "global_step": 51525, "epoch": 1226} {"train_loss": -5.881083965301514, "global_step": 51526, "epoch": 1226} {"train_loss": -5.7713727951049805, "global_step": 51527, "epoch": 1226} {"train_loss": -5.8092570304870605, "global_step": 51528, "epoch": 1226} {"train_loss": -5.695765495300293, "global_step": 51529, "epoch": 1226} {"train_loss": -5.740545749664307, "global_step": 51530, "epoch": 1226} {"train_loss": -5.751416206359863, "global_step": 51531, "epoch": 1226} {"train_loss": -5.775897979736328, "global_step": 51532, "epoch": 1226} {"train_loss": -5.789292131151472, "global_step": 51533, "epoch": 1226, "val_loss": 66315.0390625} {"train_loss": -5.770265579223633, "global_step": 51534, "epoch": 1227} {"train_loss": -5.686200141906738, "global_step": 51535, "epoch": 1227} {"train_loss": -5.760261535644531, "global_step": 51536, "epoch": 1227} {"train_loss": -5.711264133453369, "global_step": 51537, "epoch": 1227} {"train_loss": -5.754729747772217, "global_step": 51538, "epoch": 1227} {"train_loss": -5.75002384185791, "global_step": 51539, "epoch": 1227} {"train_loss": -5.88958740234375, "global_step": 51540, "epoch": 1227} {"train_loss": -5.885677337646484, "global_step": 51541, "epoch": 1227} {"train_loss": -5.847524642944336, "global_step": 51542, "epoch": 1227} {"train_loss": -5.712777614593506, "global_step": 51543, "epoch": 1227} {"train_loss": -5.814365863800049, "global_step": 51544, "epoch": 1227} {"train_loss": -5.781741619110107, "global_step": 51545, "epoch": 1227} {"train_loss": -5.7850165367126465, "global_step": 51546, "epoch": 1227} {"train_loss": -5.811924934387207, "global_step": 51547, "epoch": 1227} {"train_loss": -5.77289342880249, "global_step": 51548, "epoch": 1227} {"train_loss": -5.6595072746276855, "global_step": 51549, "epoch": 1227} {"train_loss": -5.79506254196167, "global_step": 51550, "epoch": 1227} {"train_loss": -5.679844856262207, "global_step": 51551, "epoch": 1227} {"train_loss": -5.832730293273926, "global_step": 51552, "epoch": 1227} {"train_loss": -5.799798011779785, "global_step": 51553, "epoch": 1227} {"train_loss": -5.861817359924316, "global_step": 51554, "epoch": 1227} {"train_loss": -5.816701889038086, "global_step": 51555, "epoch": 1227} {"train_loss": -5.760350227355957, "global_step": 51556, "epoch": 1227} {"train_loss": -5.817198753356934, "global_step": 51557, "epoch": 1227} {"train_loss": -5.744016647338867, "global_step": 51558, "epoch": 1227} {"train_loss": -5.880437850952148, "global_step": 51559, "epoch": 1227} {"train_loss": -5.742755889892578, "global_step": 51560, "epoch": 1227} {"train_loss": -5.77347993850708, "global_step": 51561, "epoch": 1227} {"train_loss": -5.751937389373779, "global_step": 51562, "epoch": 1227} {"train_loss": -5.708470344543457, "global_step": 51563, "epoch": 1227} {"train_loss": -5.705209732055664, "global_step": 51564, "epoch": 1227} {"train_loss": -5.704226016998291, "global_step": 51565, "epoch": 1227} {"train_loss": -5.7231364250183105, "global_step": 51566, "epoch": 1227} {"train_loss": -5.797553062438965, "global_step": 51567, "epoch": 1227} {"train_loss": -5.683224201202393, "global_step": 51568, "epoch": 1227} {"train_loss": -5.811389923095703, "global_step": 51569, "epoch": 1227} {"train_loss": -5.91237735748291, "global_step": 51570, "epoch": 1227} {"train_loss": -5.834782600402832, "global_step": 51571, "epoch": 1227} {"train_loss": -5.745208263397217, "global_step": 51572, "epoch": 1227} {"train_loss": -5.762893199920654, "global_step": 51573, "epoch": 1227} {"train_loss": -5.90328311920166, "global_step": 51574, "epoch": 1227} {"train_loss": -5.7746822606949575, "global_step": 51575, "epoch": 1227, "val_loss": 66106.390625} {"train_loss": -5.923635482788086, "global_step": 51576, "epoch": 1228} {"train_loss": -5.758038520812988, "global_step": 51577, "epoch": 1228} {"train_loss": -5.615375518798828, "global_step": 51578, "epoch": 1228} {"train_loss": -5.7117600440979, "global_step": 51579, "epoch": 1228} {"train_loss": -5.7250776290893555, "global_step": 51580, "epoch": 1228} {"train_loss": -5.79866361618042, "global_step": 51581, "epoch": 1228} {"train_loss": -5.764814853668213, "global_step": 51582, "epoch": 1228} {"train_loss": -5.80008602142334, "global_step": 51583, "epoch": 1228} {"train_loss": -5.823042869567871, "global_step": 51584, "epoch": 1228} {"train_loss": -5.763368606567383, "global_step": 51585, "epoch": 1228} {"train_loss": -5.819732666015625, "global_step": 51586, "epoch": 1228} {"train_loss": -5.732213497161865, "global_step": 51587, "epoch": 1228} {"train_loss": -5.868255615234375, "global_step": 51588, "epoch": 1228} {"train_loss": -5.789035320281982, "global_step": 51589, "epoch": 1228} {"train_loss": -5.721639156341553, "global_step": 51590, "epoch": 1228} {"train_loss": -5.827954292297363, "global_step": 51591, "epoch": 1228} {"train_loss": -5.817954063415527, "global_step": 51592, "epoch": 1228} {"train_loss": -5.840958595275879, "global_step": 51593, "epoch": 1228} {"train_loss": -5.543460845947266, "global_step": 51594, "epoch": 1228} {"train_loss": -5.750934600830078, "global_step": 51595, "epoch": 1228} {"train_loss": -5.731345176696777, "global_step": 51596, "epoch": 1228} {"train_loss": -5.759422302246094, "global_step": 51597, "epoch": 1228} {"train_loss": -5.8022260665893555, "global_step": 51598, "epoch": 1228} {"train_loss": -5.64434814453125, "global_step": 51599, "epoch": 1228} {"train_loss": -5.72533655166626, "global_step": 51600, "epoch": 1228} {"train_loss": -5.755545616149902, "global_step": 51601, "epoch": 1228} {"train_loss": -5.707849502563477, "global_step": 51602, "epoch": 1228} {"train_loss": -5.63234281539917, "global_step": 51603, "epoch": 1228} {"train_loss": -5.6377668380737305, "global_step": 51604, "epoch": 1228} {"train_loss": -5.578079700469971, "global_step": 51605, "epoch": 1228} {"train_loss": -5.678716659545898, "global_step": 51606, "epoch": 1228} {"train_loss": -5.740384101867676, "global_step": 51607, "epoch": 1228} {"train_loss": -5.81588077545166, "global_step": 51608, "epoch": 1228} {"train_loss": -5.775173187255859, "global_step": 51609, "epoch": 1228} {"train_loss": -5.72884464263916, "global_step": 51610, "epoch": 1228} {"train_loss": -5.712430000305176, "global_step": 51611, "epoch": 1228} {"train_loss": -5.750402927398682, "global_step": 51612, "epoch": 1228} {"train_loss": -5.792625904083252, "global_step": 51613, "epoch": 1228} {"train_loss": -5.944375038146973, "global_step": 51614, "epoch": 1228} {"train_loss": -5.860008239746094, "global_step": 51615, "epoch": 1228} {"train_loss": -5.781206130981445, "global_step": 51616, "epoch": 1228} {"train_loss": -5.7553452877771285, "global_step": 51617, "epoch": 1228, "val_loss": 66336.0625} {"train_loss": -5.762447357177734, "global_step": 51618, "epoch": 1229} {"train_loss": -5.674306869506836, "global_step": 51619, "epoch": 1229} {"train_loss": -5.683224201202393, "global_step": 51620, "epoch": 1229} {"train_loss": -5.705401420593262, "global_step": 51621, "epoch": 1229} {"train_loss": -5.723740577697754, "global_step": 51622, "epoch": 1229} {"train_loss": -5.678717136383057, "global_step": 51623, "epoch": 1229} {"train_loss": -5.719291687011719, "global_step": 51624, "epoch": 1229} {"train_loss": -5.825844764709473, "global_step": 51625, "epoch": 1229} {"train_loss": -5.688819885253906, "global_step": 51626, "epoch": 1229} {"train_loss": -5.751924514770508, "global_step": 51627, "epoch": 1229} {"train_loss": -5.763555526733398, "global_step": 51628, "epoch": 1229} {"train_loss": -5.806050777435303, "global_step": 51629, "epoch": 1229} {"train_loss": -5.798532962799072, "global_step": 51630, "epoch": 1229} {"train_loss": -5.762308120727539, "global_step": 51631, "epoch": 1229} {"train_loss": -5.813560485839844, "global_step": 51632, "epoch": 1229} {"train_loss": -5.874905586242676, "global_step": 51633, "epoch": 1229} {"train_loss": -5.752994060516357, "global_step": 51634, "epoch": 1229} {"train_loss": -5.721020698547363, "global_step": 51635, "epoch": 1229} {"train_loss": -5.800711631774902, "global_step": 51636, "epoch": 1229} {"train_loss": -5.880918502807617, "global_step": 51637, "epoch": 1229} {"train_loss": -5.810403823852539, "global_step": 51638, "epoch": 1229} {"train_loss": -5.894075393676758, "global_step": 51639, "epoch": 1229} {"train_loss": -5.768415451049805, "global_step": 51640, "epoch": 1229} {"train_loss": -5.76960563659668, "global_step": 51641, "epoch": 1229} {"train_loss": -5.7863311767578125, "global_step": 51642, "epoch": 1229} {"train_loss": -5.82098388671875, "global_step": 51643, "epoch": 1229} {"train_loss": -5.7864460945129395, "global_step": 51644, "epoch": 1229} {"train_loss": -5.887460708618164, "global_step": 51645, "epoch": 1229} {"train_loss": -5.741835117340088, "global_step": 51646, "epoch": 1229} {"train_loss": -5.726842880249023, "global_step": 51647, "epoch": 1229} {"train_loss": -5.819544315338135, "global_step": 51648, "epoch": 1229} {"train_loss": -5.705024719238281, "global_step": 51649, "epoch": 1229} {"train_loss": -5.782411575317383, "global_step": 51650, "epoch": 1229} {"train_loss": -5.809750556945801, "global_step": 51651, "epoch": 1229} {"train_loss": -5.818390846252441, "global_step": 51652, "epoch": 1229} {"train_loss": -5.866842746734619, "global_step": 51653, "epoch": 1229} {"train_loss": -5.788668632507324, "global_step": 51654, "epoch": 1229} {"train_loss": -5.70587158203125, "global_step": 51655, "epoch": 1229} {"train_loss": -5.772177219390869, "global_step": 51656, "epoch": 1229} {"train_loss": -5.865944862365723, "global_step": 51657, "epoch": 1229} {"train_loss": -5.790295124053955, "global_step": 51658, "epoch": 1229} {"train_loss": -5.778938145864577, "global_step": 51659, "epoch": 1229, "val_loss": 66219.1015625} {"train_loss": -5.862152099609375, "global_step": 51660, "epoch": 1230} {"train_loss": -5.778070449829102, "global_step": 51661, "epoch": 1230} {"train_loss": -5.7586469650268555, "global_step": 51662, "epoch": 1230} {"train_loss": -5.69029426574707, "global_step": 51663, "epoch": 1230} {"train_loss": -5.809393882751465, "global_step": 51664, "epoch": 1230} {"train_loss": -5.794740676879883, "global_step": 51665, "epoch": 1230} {"train_loss": -5.752963542938232, "global_step": 51666, "epoch": 1230} {"train_loss": -5.724967956542969, "global_step": 51667, "epoch": 1230} {"train_loss": -5.765289306640625, "global_step": 51668, "epoch": 1230} {"train_loss": -5.889769554138184, "global_step": 51669, "epoch": 1230} {"train_loss": -5.796290397644043, "global_step": 51670, "epoch": 1230} {"train_loss": -5.8518524169921875, "global_step": 51671, "epoch": 1230} {"train_loss": -5.682315826416016, "global_step": 51672, "epoch": 1230} {"train_loss": -5.845181465148926, "global_step": 51673, "epoch": 1230} {"train_loss": -5.78158712387085, "global_step": 51674, "epoch": 1230} {"train_loss": -5.796152114868164, "global_step": 51675, "epoch": 1230} {"train_loss": -5.79827880859375, "global_step": 51676, "epoch": 1230} {"train_loss": -5.787515640258789, "global_step": 51677, "epoch": 1230} {"train_loss": -5.689456939697266, "global_step": 51678, "epoch": 1230} {"train_loss": -5.772536754608154, "global_step": 51679, "epoch": 1230} {"train_loss": -5.822731018066406, "global_step": 51680, "epoch": 1230} {"train_loss": -5.816131591796875, "global_step": 51681, "epoch": 1230} {"train_loss": -5.800764083862305, "global_step": 51682, "epoch": 1230} {"train_loss": -5.817211151123047, "global_step": 51683, "epoch": 1230} {"train_loss": -5.9349365234375, "global_step": 51684, "epoch": 1230} {"train_loss": -5.842035293579102, "global_step": 51685, "epoch": 1230} {"train_loss": -5.690217018127441, "global_step": 51686, "epoch": 1230} {"train_loss": -5.735853672027588, "global_step": 51687, "epoch": 1230} {"train_loss": -5.701287746429443, "global_step": 51688, "epoch": 1230} {"train_loss": -5.739937782287598, "global_step": 51689, "epoch": 1230} {"train_loss": -5.872457027435303, "global_step": 51690, "epoch": 1230} {"train_loss": -5.903301239013672, "global_step": 51691, "epoch": 1230} {"train_loss": -5.742549896240234, "global_step": 51692, "epoch": 1230} {"train_loss": -5.821110248565674, "global_step": 51693, "epoch": 1230} {"train_loss": -5.685198783874512, "global_step": 51694, "epoch": 1230} {"train_loss": -5.756933689117432, "global_step": 51695, "epoch": 1230} {"train_loss": -5.935081481933594, "global_step": 51696, "epoch": 1230} {"train_loss": -5.692281246185303, "global_step": 51697, "epoch": 1230} {"train_loss": -5.740735054016113, "global_step": 51698, "epoch": 1230} {"train_loss": -5.752323627471924, "global_step": 51699, "epoch": 1230} {"train_loss": -5.728287696838379, "global_step": 51700, "epoch": 1230} {"train_loss": -5.784380742481777, "global_step": 51701, "epoch": 1230, "val_loss": 66332.8515625} {"train_loss": -5.771283149719238, "global_step": 51702, "epoch": 1231} {"train_loss": -5.6329169273376465, "global_step": 51703, "epoch": 1231} {"train_loss": -5.781744003295898, "global_step": 51704, "epoch": 1231} {"train_loss": -5.745849609375, "global_step": 51705, "epoch": 1231} {"train_loss": -5.772938251495361, "global_step": 51706, "epoch": 1231} {"train_loss": -5.711309432983398, "global_step": 51707, "epoch": 1231} {"train_loss": -5.777324676513672, "global_step": 51708, "epoch": 1231} {"train_loss": -5.7592668533325195, "global_step": 51709, "epoch": 1231} {"train_loss": -5.696369647979736, "global_step": 51710, "epoch": 1231} {"train_loss": -5.689033508300781, "global_step": 51711, "epoch": 1231} {"train_loss": -5.671793460845947, "global_step": 51712, "epoch": 1231} {"train_loss": -5.856316566467285, "global_step": 51713, "epoch": 1231} {"train_loss": -5.7657575607299805, "global_step": 51714, "epoch": 1231} {"train_loss": -5.728765964508057, "global_step": 51715, "epoch": 1231} {"train_loss": -5.97013521194458, "global_step": 51716, "epoch": 1231} {"train_loss": -5.726529121398926, "global_step": 51717, "epoch": 1231} {"train_loss": -5.789813995361328, "global_step": 51718, "epoch": 1231} {"train_loss": -5.747856140136719, "global_step": 51719, "epoch": 1231} {"train_loss": -5.714838027954102, "global_step": 51720, "epoch": 1231} {"train_loss": -5.7859344482421875, "global_step": 51721, "epoch": 1231} {"train_loss": -5.713379383087158, "global_step": 51722, "epoch": 1231} {"train_loss": -5.7901105880737305, "global_step": 51723, "epoch": 1231} {"train_loss": -5.834253311157227, "global_step": 51724, "epoch": 1231} {"train_loss": -5.656874179840088, "global_step": 51725, "epoch": 1231} {"train_loss": -5.849259376525879, "global_step": 51726, "epoch": 1231} {"train_loss": -5.678836822509766, "global_step": 51727, "epoch": 1231} {"train_loss": -5.803098678588867, "global_step": 51728, "epoch": 1231} {"train_loss": -5.596412658691406, "global_step": 51729, "epoch": 1231} {"train_loss": -5.76456356048584, "global_step": 51730, "epoch": 1231} {"train_loss": -5.801097869873047, "global_step": 51731, "epoch": 1231} {"train_loss": -5.73875617980957, "global_step": 51732, "epoch": 1231} {"train_loss": -5.714834213256836, "global_step": 51733, "epoch": 1231} {"train_loss": -5.913880348205566, "global_step": 51734, "epoch": 1231} {"train_loss": -5.910792827606201, "global_step": 51735, "epoch": 1231} {"train_loss": -5.773090362548828, "global_step": 51736, "epoch": 1231} {"train_loss": -5.927116394042969, "global_step": 51737, "epoch": 1231} {"train_loss": -5.789023399353027, "global_step": 51738, "epoch": 1231} {"train_loss": -5.872382164001465, "global_step": 51739, "epoch": 1231} {"train_loss": -5.859863758087158, "global_step": 51740, "epoch": 1231} {"train_loss": -5.714892387390137, "global_step": 51741, "epoch": 1231} {"train_loss": -5.6837310791015625, "global_step": 51742, "epoch": 1231} {"train_loss": -5.76633654321943, "global_step": 51743, "epoch": 1231, "val_loss": 66492.21875} {"train_loss": -5.911299228668213, "global_step": 51744, "epoch": 1232} {"train_loss": -5.831687927246094, "global_step": 51745, "epoch": 1232} {"train_loss": -5.844598770141602, "global_step": 51746, "epoch": 1232} {"train_loss": -5.859058380126953, "global_step": 51747, "epoch": 1232} {"train_loss": -5.91898250579834, "global_step": 51748, "epoch": 1232} {"train_loss": -5.922412395477295, "global_step": 51749, "epoch": 1232} {"train_loss": -5.774179458618164, "global_step": 51750, "epoch": 1232} {"train_loss": -5.715301990509033, "global_step": 51751, "epoch": 1232} {"train_loss": -5.813071250915527, "global_step": 51752, "epoch": 1232} {"train_loss": -5.766008377075195, "global_step": 51753, "epoch": 1232} {"train_loss": -5.765523910522461, "global_step": 51754, "epoch": 1232} {"train_loss": -5.818236351013184, "global_step": 51755, "epoch": 1232} {"train_loss": -5.850786209106445, "global_step": 51756, "epoch": 1232} {"train_loss": -5.791119575500488, "global_step": 51757, "epoch": 1232} {"train_loss": -5.776320457458496, "global_step": 51758, "epoch": 1232} {"train_loss": -5.725651741027832, "global_step": 51759, "epoch": 1232} {"train_loss": -5.931330680847168, "global_step": 51760, "epoch": 1232} {"train_loss": -5.63957405090332, "global_step": 51761, "epoch": 1232} {"train_loss": -5.87949275970459, "global_step": 51762, "epoch": 1232} {"train_loss": -5.634555816650391, "global_step": 51763, "epoch": 1232} {"train_loss": -5.757718086242676, "global_step": 51764, "epoch": 1232} {"train_loss": -5.829046726226807, "global_step": 51765, "epoch": 1232} {"train_loss": -5.798921585083008, "global_step": 51766, "epoch": 1232} {"train_loss": -5.726833343505859, "global_step": 51767, "epoch": 1232} {"train_loss": -5.757508754730225, "global_step": 51768, "epoch": 1232} {"train_loss": -5.5702948570251465, "global_step": 51769, "epoch": 1232} {"train_loss": -5.731755256652832, "global_step": 51770, "epoch": 1232} {"train_loss": -5.766091346740723, "global_step": 51771, "epoch": 1232} {"train_loss": -5.774290084838867, "global_step": 51772, "epoch": 1232} {"train_loss": -5.766922473907471, "global_step": 51773, "epoch": 1232} {"train_loss": -5.7740797996521, "global_step": 51774, "epoch": 1232} {"train_loss": -5.704387664794922, "global_step": 51775, "epoch": 1232} {"train_loss": -5.8774542808532715, "global_step": 51776, "epoch": 1232} {"train_loss": -5.8219218254089355, "global_step": 51777, "epoch": 1232} {"train_loss": -5.802194595336914, "global_step": 51778, "epoch": 1232} {"train_loss": -5.908383846282959, "global_step": 51779, "epoch": 1232} {"train_loss": -5.8558759689331055, "global_step": 51780, "epoch": 1232} {"train_loss": -5.763280868530273, "global_step": 51781, "epoch": 1232} {"train_loss": -5.740513801574707, "global_step": 51782, "epoch": 1232} {"train_loss": -5.821078300476074, "global_step": 51783, "epoch": 1232} {"train_loss": -5.747516632080078, "global_step": 51784, "epoch": 1232} {"train_loss": -5.792197352363949, "global_step": 51785, "epoch": 1232, "val_loss": 66226.5234375} {"train_loss": -5.8766937255859375, "global_step": 51786, "epoch": 1233} {"train_loss": -5.810667991638184, "global_step": 51787, "epoch": 1233} {"train_loss": -5.846295356750488, "global_step": 51788, "epoch": 1233} {"train_loss": -5.868151664733887, "global_step": 51789, "epoch": 1233} {"train_loss": -5.933465480804443, "global_step": 51790, "epoch": 1233} {"train_loss": -5.8384199142456055, "global_step": 51791, "epoch": 1233} {"train_loss": -5.789702415466309, "global_step": 51792, "epoch": 1233} {"train_loss": -5.726809501647949, "global_step": 51793, "epoch": 1233} {"train_loss": -5.887819290161133, "global_step": 51794, "epoch": 1233} {"train_loss": -5.891409873962402, "global_step": 51795, "epoch": 1233} {"train_loss": -5.814042091369629, "global_step": 51796, "epoch": 1233} {"train_loss": -5.731474876403809, "global_step": 51797, "epoch": 1233} {"train_loss": -5.703990936279297, "global_step": 51798, "epoch": 1233} {"train_loss": -5.731192111968994, "global_step": 51799, "epoch": 1233} {"train_loss": -5.787844181060791, "global_step": 51800, "epoch": 1233} {"train_loss": -5.626872539520264, "global_step": 51801, "epoch": 1233} {"train_loss": -5.794959545135498, "global_step": 51802, "epoch": 1233} {"train_loss": -5.781979084014893, "global_step": 51803, "epoch": 1233} {"train_loss": -5.746445655822754, "global_step": 51804, "epoch": 1233} {"train_loss": -5.720765113830566, "global_step": 51805, "epoch": 1233} {"train_loss": -5.63505220413208, "global_step": 51806, "epoch": 1233} {"train_loss": -5.759699821472168, "global_step": 51807, "epoch": 1233} {"train_loss": -5.885168075561523, "global_step": 51808, "epoch": 1233} {"train_loss": -5.714638710021973, "global_step": 51809, "epoch": 1233} {"train_loss": -5.766741752624512, "global_step": 51810, "epoch": 1233} {"train_loss": -5.721841812133789, "global_step": 51811, "epoch": 1233} {"train_loss": -5.772761344909668, "global_step": 51812, "epoch": 1233} {"train_loss": -5.867071151733398, "global_step": 51813, "epoch": 1233} {"train_loss": -5.803915977478027, "global_step": 51814, "epoch": 1233} {"train_loss": -5.801661491394043, "global_step": 51815, "epoch": 1233} {"train_loss": -5.851823329925537, "global_step": 51816, "epoch": 1233} {"train_loss": -5.734244346618652, "global_step": 51817, "epoch": 1233} {"train_loss": -5.545253276824951, "global_step": 51818, "epoch": 1233} {"train_loss": -5.857362747192383, "global_step": 51819, "epoch": 1233} {"train_loss": -5.6462202072143555, "global_step": 51820, "epoch": 1233} {"train_loss": -5.733493328094482, "global_step": 51821, "epoch": 1233} {"train_loss": -5.892380237579346, "global_step": 51822, "epoch": 1233} {"train_loss": -5.66580057144165, "global_step": 51823, "epoch": 1233} {"train_loss": -5.7111334800720215, "global_step": 51824, "epoch": 1233} {"train_loss": -5.747688293457031, "global_step": 51825, "epoch": 1233} {"train_loss": -5.600846290588379, "global_step": 51826, "epoch": 1233} {"train_loss": -5.770654757817586, "global_step": 51827, "epoch": 1233, "val_loss": 66278.125} {"train_loss": -5.706460952758789, "global_step": 51828, "epoch": 1234} {"train_loss": -5.750767707824707, "global_step": 51829, "epoch": 1234} {"train_loss": -5.748678684234619, "global_step": 51830, "epoch": 1234} {"train_loss": -5.766333103179932, "global_step": 51831, "epoch": 1234} {"train_loss": -5.653261184692383, "global_step": 51832, "epoch": 1234} {"train_loss": -5.741832733154297, "global_step": 51833, "epoch": 1234} {"train_loss": -5.791770935058594, "global_step": 51834, "epoch": 1234} {"train_loss": -5.868223190307617, "global_step": 51835, "epoch": 1234} {"train_loss": -5.812110900878906, "global_step": 51836, "epoch": 1234} {"train_loss": -5.816388130187988, "global_step": 51837, "epoch": 1234} {"train_loss": -5.841513633728027, "global_step": 51838, "epoch": 1234} {"train_loss": -5.846524238586426, "global_step": 51839, "epoch": 1234} {"train_loss": -5.8096160888671875, "global_step": 51840, "epoch": 1234} {"train_loss": -5.758870601654053, "global_step": 51841, "epoch": 1234} {"train_loss": -5.736423492431641, "global_step": 51842, "epoch": 1234} {"train_loss": -5.791012287139893, "global_step": 51843, "epoch": 1234} {"train_loss": -5.812993049621582, "global_step": 51844, "epoch": 1234} {"train_loss": -5.766781806945801, "global_step": 51845, "epoch": 1234} {"train_loss": -5.768402099609375, "global_step": 51846, "epoch": 1234} {"train_loss": -5.840940475463867, "global_step": 51847, "epoch": 1234} {"train_loss": -5.854287147521973, "global_step": 51848, "epoch": 1234} {"train_loss": -5.930727005004883, "global_step": 51849, "epoch": 1234} {"train_loss": -5.674825668334961, "global_step": 51850, "epoch": 1234} {"train_loss": -5.759242057800293, "global_step": 51851, "epoch": 1234} {"train_loss": -5.721630096435547, "global_step": 51852, "epoch": 1234} {"train_loss": -5.863674640655518, "global_step": 51853, "epoch": 1234} {"train_loss": -5.754371643066406, "global_step": 51854, "epoch": 1234} {"train_loss": -5.704413414001465, "global_step": 51855, "epoch": 1234} {"train_loss": -5.847285747528076, "global_step": 51856, "epoch": 1234} {"train_loss": -5.780060768127441, "global_step": 51857, "epoch": 1234} {"train_loss": -5.842429161071777, "global_step": 51858, "epoch": 1234} {"train_loss": -5.750753402709961, "global_step": 51859, "epoch": 1234} {"train_loss": -5.743828296661377, "global_step": 51860, "epoch": 1234} {"train_loss": -5.811526775360107, "global_step": 51861, "epoch": 1234} {"train_loss": -5.7521491050720215, "global_step": 51862, "epoch": 1234} {"train_loss": -5.654257297515869, "global_step": 51863, "epoch": 1234} {"train_loss": -5.905282020568848, "global_step": 51864, "epoch": 1234} {"train_loss": -5.734451770782471, "global_step": 51865, "epoch": 1234} {"train_loss": -5.772520065307617, "global_step": 51866, "epoch": 1234} {"train_loss": -5.880600929260254, "global_step": 51867, "epoch": 1234} {"train_loss": -5.8262810707092285, "global_step": 51868, "epoch": 1234} {"train_loss": -5.786272571200416, "global_step": 51869, "epoch": 1234, "val_loss": 66342.3515625} {"train_loss": -5.69828987121582, "global_step": 51870, "epoch": 1235} {"train_loss": -5.747654914855957, "global_step": 51871, "epoch": 1235} {"train_loss": -5.789689540863037, "global_step": 51872, "epoch": 1235} {"train_loss": -5.726229667663574, "global_step": 51873, "epoch": 1235} {"train_loss": -5.84220027923584, "global_step": 51874, "epoch": 1235} {"train_loss": -5.81909704208374, "global_step": 51875, "epoch": 1235} {"train_loss": -5.833992004394531, "global_step": 51876, "epoch": 1235} {"train_loss": -5.901230812072754, "global_step": 51877, "epoch": 1235} {"train_loss": -5.765987873077393, "global_step": 51878, "epoch": 1235} {"train_loss": -5.645378112792969, "global_step": 51879, "epoch": 1235} {"train_loss": -5.869542121887207, "global_step": 51880, "epoch": 1235} {"train_loss": -5.6514081954956055, "global_step": 51881, "epoch": 1235} {"train_loss": -5.874611854553223, "global_step": 51882, "epoch": 1235} {"train_loss": -5.855067253112793, "global_step": 51883, "epoch": 1235} {"train_loss": -5.7245192527771, "global_step": 51884, "epoch": 1235} {"train_loss": -5.9991455078125, "global_step": 51885, "epoch": 1235} {"train_loss": -5.857172012329102, "global_step": 51886, "epoch": 1235} {"train_loss": -5.696847915649414, "global_step": 51887, "epoch": 1235} {"train_loss": -5.91074275970459, "global_step": 51888, "epoch": 1235} {"train_loss": -5.851881980895996, "global_step": 51889, "epoch": 1235} {"train_loss": -5.784977912902832, "global_step": 51890, "epoch": 1235} {"train_loss": -5.804548740386963, "global_step": 51891, "epoch": 1235} {"train_loss": -5.807925224304199, "global_step": 51892, "epoch": 1235} {"train_loss": -5.712957382202148, "global_step": 51893, "epoch": 1235} {"train_loss": -5.82069206237793, "global_step": 51894, "epoch": 1235} {"train_loss": -5.804586887359619, "global_step": 51895, "epoch": 1235} {"train_loss": -5.8236894607543945, "global_step": 51896, "epoch": 1235} {"train_loss": -5.6639509201049805, "global_step": 51897, "epoch": 1235} {"train_loss": -5.677589416503906, "global_step": 51898, "epoch": 1235} {"train_loss": -5.702182292938232, "global_step": 51899, "epoch": 1235} {"train_loss": -5.7765913009643555, "global_step": 51900, "epoch": 1235} {"train_loss": -5.7042236328125, "global_step": 51901, "epoch": 1235} {"train_loss": -5.737825393676758, "global_step": 51902, "epoch": 1235} {"train_loss": -5.850272178649902, "global_step": 51903, "epoch": 1235} {"train_loss": -5.662715911865234, "global_step": 51904, "epoch": 1235} {"train_loss": -5.80739164352417, "global_step": 51905, "epoch": 1235} {"train_loss": -5.764772415161133, "global_step": 51906, "epoch": 1235} {"train_loss": -5.7446489334106445, "global_step": 51907, "epoch": 1235} {"train_loss": -5.838125705718994, "global_step": 51908, "epoch": 1235} {"train_loss": -5.743396759033203, "global_step": 51909, "epoch": 1235} {"train_loss": -5.834983825683594, "global_step": 51910, "epoch": 1235} {"train_loss": -5.784886155809675, "global_step": 51911, "epoch": 1235, "val_loss": 66127.875} {"train_loss": -5.774334907531738, "global_step": 51912, "epoch": 1236} {"train_loss": -5.891475677490234, "global_step": 51913, "epoch": 1236} {"train_loss": -5.879295349121094, "global_step": 51914, "epoch": 1236} {"train_loss": -5.822619438171387, "global_step": 51915, "epoch": 1236} {"train_loss": -5.883969783782959, "global_step": 51916, "epoch": 1236} {"train_loss": -5.738680839538574, "global_step": 51917, "epoch": 1236} {"train_loss": -5.828123092651367, "global_step": 51918, "epoch": 1236} {"train_loss": -5.829309463500977, "global_step": 51919, "epoch": 1236} {"train_loss": -5.86879825592041, "global_step": 51920, "epoch": 1236} {"train_loss": -5.699377059936523, "global_step": 51921, "epoch": 1236} {"train_loss": -5.869314193725586, "global_step": 51922, "epoch": 1236} {"train_loss": -5.808715343475342, "global_step": 51923, "epoch": 1236} {"train_loss": -5.857847213745117, "global_step": 51924, "epoch": 1236} {"train_loss": -5.675864219665527, "global_step": 51925, "epoch": 1236} {"train_loss": -5.863973617553711, "global_step": 51926, "epoch": 1236} {"train_loss": -5.589731216430664, "global_step": 51927, "epoch": 1236} {"train_loss": -5.791797637939453, "global_step": 51928, "epoch": 1236} {"train_loss": -5.8382368087768555, "global_step": 51929, "epoch": 1236} {"train_loss": -5.811122894287109, "global_step": 51930, "epoch": 1236} {"train_loss": -5.83765983581543, "global_step": 51931, "epoch": 1236} {"train_loss": -5.858817100524902, "global_step": 51932, "epoch": 1236} {"train_loss": -5.752917289733887, "global_step": 51933, "epoch": 1236} {"train_loss": -5.810606479644775, "global_step": 51934, "epoch": 1236} {"train_loss": -5.750587463378906, "global_step": 51935, "epoch": 1236} {"train_loss": -5.7027082443237305, "global_step": 51936, "epoch": 1236} {"train_loss": -5.780116081237793, "global_step": 51937, "epoch": 1236} {"train_loss": -5.860823154449463, "global_step": 51938, "epoch": 1236} {"train_loss": -5.799168586730957, "global_step": 51939, "epoch": 1236} {"train_loss": -5.742029190063477, "global_step": 51940, "epoch": 1236} {"train_loss": -5.781404495239258, "global_step": 51941, "epoch": 1236} {"train_loss": -5.76397180557251, "global_step": 51942, "epoch": 1236} {"train_loss": -5.845083713531494, "global_step": 51943, "epoch": 1236} {"train_loss": -5.623773574829102, "global_step": 51944, "epoch": 1236} {"train_loss": -5.788483619689941, "global_step": 51945, "epoch": 1236} {"train_loss": -5.770143985748291, "global_step": 51946, "epoch": 1236} {"train_loss": -5.8030829429626465, "global_step": 51947, "epoch": 1236} {"train_loss": -5.770084857940674, "global_step": 51948, "epoch": 1236} {"train_loss": -5.767614841461182, "global_step": 51949, "epoch": 1236} {"train_loss": -5.966569900512695, "global_step": 51950, "epoch": 1236} {"train_loss": -5.759560585021973, "global_step": 51951, "epoch": 1236} {"train_loss": -5.69876766204834, "global_step": 51952, "epoch": 1236} {"train_loss": -5.793737468265352, "global_step": 51953, "epoch": 1236, "val_loss": 66496.828125} {"train_loss": -5.746978759765625, "global_step": 51954, "epoch": 1237} {"train_loss": -5.8565673828125, "global_step": 51955, "epoch": 1237} {"train_loss": -5.697013854980469, "global_step": 51956, "epoch": 1237} {"train_loss": -5.731361389160156, "global_step": 51957, "epoch": 1237} {"train_loss": -5.820146560668945, "global_step": 51958, "epoch": 1237} {"train_loss": -5.742732048034668, "global_step": 51959, "epoch": 1237} {"train_loss": -5.889832496643066, "global_step": 51960, "epoch": 1237} {"train_loss": -5.918257713317871, "global_step": 51961, "epoch": 1237} {"train_loss": -5.745830535888672, "global_step": 51962, "epoch": 1237} {"train_loss": -5.823922157287598, "global_step": 51963, "epoch": 1237} {"train_loss": -5.71466064453125, "global_step": 51964, "epoch": 1237} {"train_loss": -5.7045087814331055, "global_step": 51965, "epoch": 1237} {"train_loss": -5.815013408660889, "global_step": 51966, "epoch": 1237} {"train_loss": -5.71984338760376, "global_step": 51967, "epoch": 1237} {"train_loss": -5.782131195068359, "global_step": 51968, "epoch": 1237} {"train_loss": -5.676626682281494, "global_step": 51969, "epoch": 1237} {"train_loss": -5.74663782119751, "global_step": 51970, "epoch": 1237} {"train_loss": -5.694447040557861, "global_step": 51971, "epoch": 1237} {"train_loss": -5.718350410461426, "global_step": 51972, "epoch": 1237} {"train_loss": -5.704805374145508, "global_step": 51973, "epoch": 1237} {"train_loss": -5.7486772537231445, "global_step": 51974, "epoch": 1237} {"train_loss": -5.756189346313477, "global_step": 51975, "epoch": 1237} {"train_loss": -5.635946750640869, "global_step": 51976, "epoch": 1237} {"train_loss": -5.773948669433594, "global_step": 51977, "epoch": 1237} {"train_loss": -5.736498832702637, "global_step": 51978, "epoch": 1237} {"train_loss": -5.624700546264648, "global_step": 51979, "epoch": 1237} {"train_loss": -5.747056007385254, "global_step": 51980, "epoch": 1237} {"train_loss": -5.745488166809082, "global_step": 51981, "epoch": 1237} {"train_loss": -5.8575897216796875, "global_step": 51982, "epoch": 1237} {"train_loss": -5.7172088623046875, "global_step": 51983, "epoch": 1237} {"train_loss": -5.740209579467773, "global_step": 51984, "epoch": 1237} {"train_loss": -5.723422050476074, "global_step": 51985, "epoch": 1237} {"train_loss": -5.727913856506348, "global_step": 51986, "epoch": 1237} {"train_loss": -5.7552690505981445, "global_step": 51987, "epoch": 1237} {"train_loss": -5.7284932136535645, "global_step": 51988, "epoch": 1237} {"train_loss": -5.824222087860107, "global_step": 51989, "epoch": 1237} {"train_loss": -5.808284282684326, "global_step": 51990, "epoch": 1237} {"train_loss": -5.85457181930542, "global_step": 51991, "epoch": 1237} {"train_loss": -5.801638603210449, "global_step": 51992, "epoch": 1237} {"train_loss": -5.8333024978637695, "global_step": 51993, "epoch": 1237} {"train_loss": -5.8204026222229, "global_step": 51994, "epoch": 1237} {"train_loss": -5.762263400214059, "global_step": 51995, "epoch": 1237, "val_loss": 66142.28125} {"train_loss": -5.784780025482178, "global_step": 51996, "epoch": 1238} {"train_loss": -5.794768333435059, "global_step": 51997, "epoch": 1238} {"train_loss": -5.800936222076416, "global_step": 51998, "epoch": 1238} {"train_loss": -5.817035675048828, "global_step": 51999, "epoch": 1238} {"train_loss": -5.888796329498291, "global_step": 52000, "epoch": 1238} {"train_loss": -5.854741096496582, "global_step": 52001, "epoch": 1238} {"train_loss": -5.790029048919678, "global_step": 52002, "epoch": 1238} {"train_loss": -5.77481746673584, "global_step": 52003, "epoch": 1238} {"train_loss": -5.713373184204102, "global_step": 52004, "epoch": 1238} {"train_loss": -5.837392807006836, "global_step": 52005, "epoch": 1238} {"train_loss": -5.720699310302734, "global_step": 52006, "epoch": 1238} {"train_loss": -5.811712265014648, "global_step": 52007, "epoch": 1238} {"train_loss": -5.816390037536621, "global_step": 52008, "epoch": 1238} {"train_loss": -5.72913932800293, "global_step": 52009, "epoch": 1238} {"train_loss": -5.775627136230469, "global_step": 52010, "epoch": 1238} {"train_loss": -5.80533504486084, "global_step": 52011, "epoch": 1238} {"train_loss": -5.828864097595215, "global_step": 52012, "epoch": 1238} {"train_loss": -5.721127986907959, "global_step": 52013, "epoch": 1238} {"train_loss": -5.764796733856201, "global_step": 52014, "epoch": 1238} {"train_loss": -5.851728439331055, "global_step": 52015, "epoch": 1238} {"train_loss": -5.598484516143799, "global_step": 52016, "epoch": 1238} {"train_loss": -5.819355010986328, "global_step": 52017, "epoch": 1238} {"train_loss": -5.815227508544922, "global_step": 52018, "epoch": 1238} {"train_loss": -5.690362453460693, "global_step": 52019, "epoch": 1238} {"train_loss": -5.8393354415893555, "global_step": 52020, "epoch": 1238} {"train_loss": -5.675603866577148, "global_step": 52021, "epoch": 1238} {"train_loss": -5.775318145751953, "global_step": 52022, "epoch": 1238} {"train_loss": -5.714812278747559, "global_step": 52023, "epoch": 1238} {"train_loss": -5.7206878662109375, "global_step": 52024, "epoch": 1238} {"train_loss": -5.699180603027344, "global_step": 52025, "epoch": 1238} {"train_loss": -5.799370765686035, "global_step": 52026, "epoch": 1238} {"train_loss": -5.696070671081543, "global_step": 52027, "epoch": 1238} {"train_loss": -5.893681526184082, "global_step": 52028, "epoch": 1238} {"train_loss": -5.747546672821045, "global_step": 52029, "epoch": 1238} {"train_loss": -5.767273902893066, "global_step": 52030, "epoch": 1238} {"train_loss": -5.815381050109863, "global_step": 52031, "epoch": 1238} {"train_loss": -5.68440055847168, "global_step": 52032, "epoch": 1238} {"train_loss": -5.776158332824707, "global_step": 52033, "epoch": 1238} {"train_loss": -5.645345687866211, "global_step": 52034, "epoch": 1238} {"train_loss": -5.787615776062012, "global_step": 52035, "epoch": 1238} {"train_loss": -5.749228000640869, "global_step": 52036, "epoch": 1238} {"train_loss": -5.767500877380371, "global_step": 52037, "epoch": 1238, "val_loss": 66149.734375} {"train_loss": -5.7967448234558105, "global_step": 52038, "epoch": 1239} {"train_loss": -5.713289260864258, "global_step": 52039, "epoch": 1239} {"train_loss": -5.784334659576416, "global_step": 52040, "epoch": 1239} {"train_loss": -5.713377952575684, "global_step": 52041, "epoch": 1239} {"train_loss": -5.750870704650879, "global_step": 52042, "epoch": 1239} {"train_loss": -5.7790632247924805, "global_step": 52043, "epoch": 1239} {"train_loss": -5.728268146514893, "global_step": 52044, "epoch": 1239} {"train_loss": -5.7121429443359375, "global_step": 52045, "epoch": 1239} {"train_loss": -5.746613502502441, "global_step": 52046, "epoch": 1239} {"train_loss": -5.756442546844482, "global_step": 52047, "epoch": 1239} {"train_loss": -5.842237949371338, "global_step": 52048, "epoch": 1239} {"train_loss": -5.8087334632873535, "global_step": 52049, "epoch": 1239} {"train_loss": -5.799651622772217, "global_step": 52050, "epoch": 1239} {"train_loss": -5.714925765991211, "global_step": 52051, "epoch": 1239} {"train_loss": -5.806056499481201, "global_step": 52052, "epoch": 1239} {"train_loss": -5.761247158050537, "global_step": 52053, "epoch": 1239} {"train_loss": -5.776935577392578, "global_step": 52054, "epoch": 1239} {"train_loss": -5.710350513458252, "global_step": 52055, "epoch": 1239} {"train_loss": -5.844078063964844, "global_step": 52056, "epoch": 1239} {"train_loss": -5.783176422119141, "global_step": 52057, "epoch": 1239} {"train_loss": -5.795079231262207, "global_step": 52058, "epoch": 1239} {"train_loss": -5.726019382476807, "global_step": 52059, "epoch": 1239} {"train_loss": -5.827553749084473, "global_step": 52060, "epoch": 1239} {"train_loss": -5.709117412567139, "global_step": 52061, "epoch": 1239} {"train_loss": -5.718484401702881, "global_step": 52062, "epoch": 1239} {"train_loss": -5.69302225112915, "global_step": 52063, "epoch": 1239} {"train_loss": -5.915675163269043, "global_step": 52064, "epoch": 1239} {"train_loss": -5.8675761222839355, "global_step": 52065, "epoch": 1239} {"train_loss": -5.734987258911133, "global_step": 52066, "epoch": 1239} {"train_loss": -5.927306652069092, "global_step": 52067, "epoch": 1239} {"train_loss": -5.823107719421387, "global_step": 52068, "epoch": 1239} {"train_loss": -5.689896583557129, "global_step": 52069, "epoch": 1239} {"train_loss": -5.694452285766602, "global_step": 52070, "epoch": 1239} {"train_loss": -5.726256370544434, "global_step": 52071, "epoch": 1239} {"train_loss": -5.81561803817749, "global_step": 52072, "epoch": 1239} {"train_loss": -5.728770732879639, "global_step": 52073, "epoch": 1239} {"train_loss": -5.694396018981934, "global_step": 52074, "epoch": 1239} {"train_loss": -5.800936698913574, "global_step": 52075, "epoch": 1239} {"train_loss": -5.626946449279785, "global_step": 52076, "epoch": 1239} {"train_loss": -5.869521141052246, "global_step": 52077, "epoch": 1239} {"train_loss": -5.958073139190674, "global_step": 52078, "epoch": 1239} {"train_loss": -5.7742320355914885, "global_step": 52079, "epoch": 1239, "val_loss": 66300.9375} {"train_loss": -5.834202766418457, "global_step": 52080, "epoch": 1240} {"train_loss": -5.865751266479492, "global_step": 52081, "epoch": 1240} {"train_loss": -5.686504364013672, "global_step": 52082, "epoch": 1240} {"train_loss": -5.787332534790039, "global_step": 52083, "epoch": 1240} {"train_loss": -5.741231441497803, "global_step": 52084, "epoch": 1240} {"train_loss": -5.763494491577148, "global_step": 52085, "epoch": 1240} {"train_loss": -5.685158729553223, "global_step": 52086, "epoch": 1240} {"train_loss": -5.877368927001953, "global_step": 52087, "epoch": 1240} {"train_loss": -5.795869827270508, "global_step": 52088, "epoch": 1240} {"train_loss": -5.847153663635254, "global_step": 52089, "epoch": 1240} {"train_loss": -5.84329080581665, "global_step": 52090, "epoch": 1240} {"train_loss": -5.761850357055664, "global_step": 52091, "epoch": 1240} {"train_loss": -5.715115547180176, "global_step": 52092, "epoch": 1240} {"train_loss": -5.715606689453125, "global_step": 52093, "epoch": 1240} {"train_loss": -5.843222618103027, "global_step": 52094, "epoch": 1240} {"train_loss": -5.733839988708496, "global_step": 52095, "epoch": 1240} {"train_loss": -5.813757419586182, "global_step": 52096, "epoch": 1240} {"train_loss": -5.799809455871582, "global_step": 52097, "epoch": 1240} {"train_loss": -5.759798526763916, "global_step": 52098, "epoch": 1240} {"train_loss": -5.772488594055176, "global_step": 52099, "epoch": 1240} {"train_loss": -5.576109886169434, "global_step": 52100, "epoch": 1240} {"train_loss": -5.719717025756836, "global_step": 52101, "epoch": 1240} {"train_loss": -5.808619976043701, "global_step": 52102, "epoch": 1240} {"train_loss": -5.757838249206543, "global_step": 52103, "epoch": 1240} {"train_loss": -5.569606781005859, "global_step": 52104, "epoch": 1240} {"train_loss": -5.79509162902832, "global_step": 52105, "epoch": 1240} {"train_loss": -5.695443153381348, "global_step": 52106, "epoch": 1240} {"train_loss": -5.721660614013672, "global_step": 52107, "epoch": 1240} {"train_loss": -5.727004051208496, "global_step": 52108, "epoch": 1240} {"train_loss": -5.701945781707764, "global_step": 52109, "epoch": 1240} {"train_loss": -5.74847936630249, "global_step": 52110, "epoch": 1240} {"train_loss": -5.658576011657715, "global_step": 52111, "epoch": 1240} {"train_loss": -5.73198127746582, "global_step": 52112, "epoch": 1240} {"train_loss": -5.719974040985107, "global_step": 52113, "epoch": 1240} {"train_loss": -5.851505279541016, "global_step": 52114, "epoch": 1240} {"train_loss": -5.773642063140869, "global_step": 52115, "epoch": 1240} {"train_loss": -5.7771148681640625, "global_step": 52116, "epoch": 1240} {"train_loss": -5.674450874328613, "global_step": 52117, "epoch": 1240} {"train_loss": -5.761542320251465, "global_step": 52118, "epoch": 1240} {"train_loss": -5.708319664001465, "global_step": 52119, "epoch": 1240} {"train_loss": -5.7741289138793945, "global_step": 52120, "epoch": 1240} {"train_loss": -5.75716267313276, "global_step": 52121, "epoch": 1240, "val_loss": 66225.53125} {"train_loss": -5.7009100914001465, "global_step": 52122, "epoch": 1241} {"train_loss": -5.729125499725342, "global_step": 52123, "epoch": 1241} {"train_loss": -5.750906467437744, "global_step": 52124, "epoch": 1241} {"train_loss": -5.727119445800781, "global_step": 52125, "epoch": 1241} {"train_loss": -5.734189510345459, "global_step": 52126, "epoch": 1241} {"train_loss": -5.671852111816406, "global_step": 52127, "epoch": 1241} {"train_loss": -5.765242576599121, "global_step": 52128, "epoch": 1241} {"train_loss": -5.746542453765869, "global_step": 52129, "epoch": 1241} {"train_loss": -5.827915668487549, "global_step": 52130, "epoch": 1241} {"train_loss": -5.8280110359191895, "global_step": 52131, "epoch": 1241} {"train_loss": -5.773916721343994, "global_step": 52132, "epoch": 1241} {"train_loss": -5.699548244476318, "global_step": 52133, "epoch": 1241} {"train_loss": -5.71712589263916, "global_step": 52134, "epoch": 1241} {"train_loss": -5.788408279418945, "global_step": 52135, "epoch": 1241} {"train_loss": -5.689382076263428, "global_step": 52136, "epoch": 1241} {"train_loss": -5.7902116775512695, "global_step": 52137, "epoch": 1241} {"train_loss": -5.788670063018799, "global_step": 52138, "epoch": 1241} {"train_loss": -5.770920753479004, "global_step": 52139, "epoch": 1241} {"train_loss": -5.7624101638793945, "global_step": 52140, "epoch": 1241} {"train_loss": -5.631957054138184, "global_step": 52141, "epoch": 1241} {"train_loss": -5.912237644195557, "global_step": 52142, "epoch": 1241} {"train_loss": -5.794680595397949, "global_step": 52143, "epoch": 1241} {"train_loss": -5.679641246795654, "global_step": 52144, "epoch": 1241} {"train_loss": -5.745392799377441, "global_step": 52145, "epoch": 1241} {"train_loss": -5.7291059494018555, "global_step": 52146, "epoch": 1241} {"train_loss": -5.746335029602051, "global_step": 52147, "epoch": 1241} {"train_loss": -5.810175895690918, "global_step": 52148, "epoch": 1241} {"train_loss": -5.876680374145508, "global_step": 52149, "epoch": 1241} {"train_loss": -5.788504600524902, "global_step": 52150, "epoch": 1241} {"train_loss": -5.717381954193115, "global_step": 52151, "epoch": 1241} {"train_loss": -5.6509246826171875, "global_step": 52152, "epoch": 1241} {"train_loss": -5.870017051696777, "global_step": 52153, "epoch": 1241} {"train_loss": -5.753969192504883, "global_step": 52154, "epoch": 1241} {"train_loss": -5.9826860427856445, "global_step": 52155, "epoch": 1241} {"train_loss": -5.75762939453125, "global_step": 52156, "epoch": 1241} {"train_loss": -5.707089424133301, "global_step": 52157, "epoch": 1241} {"train_loss": -5.722651481628418, "global_step": 52158, "epoch": 1241} {"train_loss": -5.784420967102051, "global_step": 52159, "epoch": 1241} {"train_loss": -5.766946792602539, "global_step": 52160, "epoch": 1241} {"train_loss": -5.706943511962891, "global_step": 52161, "epoch": 1241} {"train_loss": -5.813209533691406, "global_step": 52162, "epoch": 1241} {"train_loss": -5.762944607507615, "global_step": 52163, "epoch": 1241, "val_loss": 66347.0390625} {"train_loss": -5.806239128112793, "global_step": 52164, "epoch": 1242} {"train_loss": -5.8284406661987305, "global_step": 52165, "epoch": 1242} {"train_loss": -5.911525726318359, "global_step": 52166, "epoch": 1242} {"train_loss": -5.7965803146362305, "global_step": 52167, "epoch": 1242} {"train_loss": -5.7032575607299805, "global_step": 52168, "epoch": 1242} {"train_loss": -5.710373878479004, "global_step": 52169, "epoch": 1242} {"train_loss": -5.879741668701172, "global_step": 52170, "epoch": 1242} {"train_loss": -5.698375701904297, "global_step": 52171, "epoch": 1242} {"train_loss": -5.902627944946289, "global_step": 52172, "epoch": 1242} {"train_loss": -5.9193902015686035, "global_step": 52173, "epoch": 1242} {"train_loss": -5.773016929626465, "global_step": 52174, "epoch": 1242} {"train_loss": -5.7515869140625, "global_step": 52175, "epoch": 1242} {"train_loss": -5.87836217880249, "global_step": 52176, "epoch": 1242} {"train_loss": -5.834656715393066, "global_step": 52177, "epoch": 1242} {"train_loss": -5.852420806884766, "global_step": 52178, "epoch": 1242} {"train_loss": -5.834031105041504, "global_step": 52179, "epoch": 1242} {"train_loss": -5.769967079162598, "global_step": 52180, "epoch": 1242} {"train_loss": -5.812997341156006, "global_step": 52181, "epoch": 1242} {"train_loss": -5.71594762802124, "global_step": 52182, "epoch": 1242} {"train_loss": -5.819637775421143, "global_step": 52183, "epoch": 1242} {"train_loss": -5.793303489685059, "global_step": 52184, "epoch": 1242} {"train_loss": -5.78577184677124, "global_step": 52185, "epoch": 1242} {"train_loss": -5.68625545501709, "global_step": 52186, "epoch": 1242} {"train_loss": -5.962109565734863, "global_step": 52187, "epoch": 1242} {"train_loss": -5.726162910461426, "global_step": 52188, "epoch": 1242} {"train_loss": -5.757809162139893, "global_step": 52189, "epoch": 1242} {"train_loss": -5.764675140380859, "global_step": 52190, "epoch": 1242} {"train_loss": -5.784791469573975, "global_step": 52191, "epoch": 1242} {"train_loss": -5.660717010498047, "global_step": 52192, "epoch": 1242} {"train_loss": -5.779705047607422, "global_step": 52193, "epoch": 1242} {"train_loss": -5.700905799865723, "global_step": 52194, "epoch": 1242} {"train_loss": -5.677361488342285, "global_step": 52195, "epoch": 1242} {"train_loss": -5.813899040222168, "global_step": 52196, "epoch": 1242} {"train_loss": -5.787456512451172, "global_step": 52197, "epoch": 1242} {"train_loss": -5.7945756912231445, "global_step": 52198, "epoch": 1242} {"train_loss": -5.804501533508301, "global_step": 52199, "epoch": 1242} {"train_loss": -5.7637939453125, "global_step": 52200, "epoch": 1242} {"train_loss": -5.805237293243408, "global_step": 52201, "epoch": 1242} {"train_loss": -5.815789699554443, "global_step": 52202, "epoch": 1242} {"train_loss": -5.734302520751953, "global_step": 52203, "epoch": 1242} {"train_loss": -5.721033096313477, "global_step": 52204, "epoch": 1242} {"train_loss": -5.7844885757991245, "global_step": 52205, "epoch": 1242, "val_loss": 66467.453125} {"train_loss": -5.73366641998291, "global_step": 52206, "epoch": 1243} {"train_loss": -5.74246072769165, "global_step": 52207, "epoch": 1243} {"train_loss": -5.680465221405029, "global_step": 52208, "epoch": 1243} {"train_loss": -5.812477111816406, "global_step": 52209, "epoch": 1243} {"train_loss": -5.694849967956543, "global_step": 52210, "epoch": 1243} {"train_loss": -5.653782844543457, "global_step": 52211, "epoch": 1243} {"train_loss": -5.908936500549316, "global_step": 52212, "epoch": 1243} {"train_loss": -5.8004045486450195, "global_step": 52213, "epoch": 1243} {"train_loss": -5.805329322814941, "global_step": 52214, "epoch": 1243} {"train_loss": -5.79096794128418, "global_step": 52215, "epoch": 1243} {"train_loss": -5.800429344177246, "global_step": 52216, "epoch": 1243} {"train_loss": -5.815855979919434, "global_step": 52217, "epoch": 1243} {"train_loss": -5.7937331199646, "global_step": 52218, "epoch": 1243} {"train_loss": -5.779669284820557, "global_step": 52219, "epoch": 1243} {"train_loss": -5.723903656005859, "global_step": 52220, "epoch": 1243} {"train_loss": -5.755800247192383, "global_step": 52221, "epoch": 1243} {"train_loss": -5.660285949707031, "global_step": 52222, "epoch": 1243} {"train_loss": -5.7830729484558105, "global_step": 52223, "epoch": 1243} {"train_loss": -5.779282093048096, "global_step": 52224, "epoch": 1243} {"train_loss": -5.741080284118652, "global_step": 52225, "epoch": 1243} {"train_loss": -5.693562030792236, "global_step": 52226, "epoch": 1243} {"train_loss": -5.699283599853516, "global_step": 52227, "epoch": 1243} {"train_loss": -5.841514587402344, "global_step": 52228, "epoch": 1243} {"train_loss": -5.807377815246582, "global_step": 52229, "epoch": 1243} {"train_loss": -5.852015018463135, "global_step": 52230, "epoch": 1243} {"train_loss": -5.87943172454834, "global_step": 52231, "epoch": 1243} {"train_loss": -5.850888252258301, "global_step": 52232, "epoch": 1243} {"train_loss": -5.834376811981201, "global_step": 52233, "epoch": 1243} {"train_loss": -5.892346382141113, "global_step": 52234, "epoch": 1243} {"train_loss": -5.672647953033447, "global_step": 52235, "epoch": 1243} {"train_loss": -5.734099388122559, "global_step": 52236, "epoch": 1243} {"train_loss": -5.896707534790039, "global_step": 52237, "epoch": 1243} {"train_loss": -5.859287738800049, "global_step": 52238, "epoch": 1243} {"train_loss": -5.792490482330322, "global_step": 52239, "epoch": 1243} {"train_loss": -5.7167487144470215, "global_step": 52240, "epoch": 1243} {"train_loss": -5.733484745025635, "global_step": 52241, "epoch": 1243} {"train_loss": -5.778280258178711, "global_step": 52242, "epoch": 1243} {"train_loss": -5.743377685546875, "global_step": 52243, "epoch": 1243} {"train_loss": -5.79617977142334, "global_step": 52244, "epoch": 1243} {"train_loss": -5.808100700378418, "global_step": 52245, "epoch": 1243} {"train_loss": -5.719729423522949, "global_step": 52246, "epoch": 1243} {"train_loss": -5.777323666073027, "global_step": 52247, "epoch": 1243, "val_loss": 66715.3515625} {"train_loss": -5.7369842529296875, "global_step": 52248, "epoch": 1244} {"train_loss": -5.788898468017578, "global_step": 52249, "epoch": 1244} {"train_loss": -5.8667144775390625, "global_step": 52250, "epoch": 1244} {"train_loss": -5.740516185760498, "global_step": 52251, "epoch": 1244} {"train_loss": -5.730233192443848, "global_step": 52252, "epoch": 1244} {"train_loss": -5.623779296875, "global_step": 52253, "epoch": 1244} {"train_loss": -5.740324974060059, "global_step": 52254, "epoch": 1244} {"train_loss": -5.726093292236328, "global_step": 52255, "epoch": 1244} {"train_loss": -5.736007213592529, "global_step": 52256, "epoch": 1244} {"train_loss": -5.821744918823242, "global_step": 52257, "epoch": 1244} {"train_loss": -5.726088523864746, "global_step": 52258, "epoch": 1244} {"train_loss": -5.7489848136901855, "global_step": 52259, "epoch": 1244} {"train_loss": -5.872715950012207, "global_step": 52260, "epoch": 1244} {"train_loss": -5.763175010681152, "global_step": 52261, "epoch": 1244} {"train_loss": -5.692925453186035, "global_step": 52262, "epoch": 1244} {"train_loss": -5.822422504425049, "global_step": 52263, "epoch": 1244} {"train_loss": -5.67618465423584, "global_step": 52264, "epoch": 1244} {"train_loss": -5.781594276428223, "global_step": 52265, "epoch": 1244} {"train_loss": -5.755947113037109, "global_step": 52266, "epoch": 1244} {"train_loss": -5.75815486907959, "global_step": 52267, "epoch": 1244} {"train_loss": -5.724484920501709, "global_step": 52268, "epoch": 1244} {"train_loss": -5.75644063949585, "global_step": 52269, "epoch": 1244} {"train_loss": -5.674779891967773, "global_step": 52270, "epoch": 1244} {"train_loss": -5.887298107147217, "global_step": 52271, "epoch": 1244} {"train_loss": -5.725031852722168, "global_step": 52272, "epoch": 1244} {"train_loss": -5.848533630371094, "global_step": 52273, "epoch": 1244} {"train_loss": -5.7110795974731445, "global_step": 52274, "epoch": 1244} {"train_loss": -5.77659797668457, "global_step": 52275, "epoch": 1244} {"train_loss": -5.814544200897217, "global_step": 52276, "epoch": 1244} {"train_loss": -5.86926794052124, "global_step": 52277, "epoch": 1244} {"train_loss": -5.700355529785156, "global_step": 52278, "epoch": 1244} {"train_loss": -5.856836318969727, "global_step": 52279, "epoch": 1244} {"train_loss": -5.920522212982178, "global_step": 52280, "epoch": 1244} {"train_loss": -5.781322956085205, "global_step": 52281, "epoch": 1244} {"train_loss": -5.840994834899902, "global_step": 52282, "epoch": 1244} {"train_loss": -5.717392921447754, "global_step": 52283, "epoch": 1244} {"train_loss": -5.887453079223633, "global_step": 52284, "epoch": 1244} {"train_loss": -5.796785354614258, "global_step": 52285, "epoch": 1244} {"train_loss": -5.867522716522217, "global_step": 52286, "epoch": 1244} {"train_loss": -5.831637382507324, "global_step": 52287, "epoch": 1244} {"train_loss": -5.8042988777160645, "global_step": 52288, "epoch": 1244} {"train_loss": -5.775393599555606, "global_step": 52289, "epoch": 1244, "val_loss": 66322.6875} {"train_loss": -5.6268768310546875, "global_step": 52290, "epoch": 1245} {"train_loss": -5.818586349487305, "global_step": 52291, "epoch": 1245} {"train_loss": -5.827420711517334, "global_step": 52292, "epoch": 1245} {"train_loss": -5.839357376098633, "global_step": 52293, "epoch": 1245} {"train_loss": -5.742145538330078, "global_step": 52294, "epoch": 1245} {"train_loss": -5.822330474853516, "global_step": 52295, "epoch": 1245} {"train_loss": -5.85307502746582, "global_step": 52296, "epoch": 1245} {"train_loss": -5.874547004699707, "global_step": 52297, "epoch": 1245} {"train_loss": -5.819967746734619, "global_step": 52298, "epoch": 1245} {"train_loss": -5.696031093597412, "global_step": 52299, "epoch": 1245} {"train_loss": -5.7749433517456055, "global_step": 52300, "epoch": 1245} {"train_loss": -5.8148980140686035, "global_step": 52301, "epoch": 1245} {"train_loss": -5.783461093902588, "global_step": 52302, "epoch": 1245} {"train_loss": -5.7521796226501465, "global_step": 52303, "epoch": 1245} {"train_loss": -5.866394996643066, "global_step": 52304, "epoch": 1245} {"train_loss": -5.804625034332275, "global_step": 52305, "epoch": 1245} {"train_loss": -5.765852928161621, "global_step": 52306, "epoch": 1245} {"train_loss": -5.784259796142578, "global_step": 52307, "epoch": 1245} {"train_loss": -5.855879306793213, "global_step": 52308, "epoch": 1245} {"train_loss": -5.807025909423828, "global_step": 52309, "epoch": 1245} {"train_loss": -5.767467498779297, "global_step": 52310, "epoch": 1245} {"train_loss": -5.689120292663574, "global_step": 52311, "epoch": 1245} {"train_loss": -5.739954471588135, "global_step": 52312, "epoch": 1245} {"train_loss": -5.798725605010986, "global_step": 52313, "epoch": 1245} {"train_loss": -5.800885200500488, "global_step": 52314, "epoch": 1245} {"train_loss": -5.692041397094727, "global_step": 52315, "epoch": 1245} {"train_loss": -5.749660491943359, "global_step": 52316, "epoch": 1245} {"train_loss": -5.708327293395996, "global_step": 52317, "epoch": 1245} {"train_loss": -5.82790470123291, "global_step": 52318, "epoch": 1245} {"train_loss": -5.735260009765625, "global_step": 52319, "epoch": 1245} {"train_loss": -5.741605281829834, "global_step": 52320, "epoch": 1245} {"train_loss": -5.817469596862793, "global_step": 52321, "epoch": 1245} {"train_loss": -5.637258052825928, "global_step": 52322, "epoch": 1245} {"train_loss": -5.844960689544678, "global_step": 52323, "epoch": 1245} {"train_loss": -5.754522800445557, "global_step": 52324, "epoch": 1245} {"train_loss": -5.8876566886901855, "global_step": 52325, "epoch": 1245} {"train_loss": -5.7806291580200195, "global_step": 52326, "epoch": 1245} {"train_loss": -5.88533878326416, "global_step": 52327, "epoch": 1245} {"train_loss": -5.849543571472168, "global_step": 52328, "epoch": 1245} {"train_loss": -5.683899879455566, "global_step": 52329, "epoch": 1245} {"train_loss": -5.785688400268555, "global_step": 52330, "epoch": 1245} {"train_loss": -5.782880521955944, "global_step": 52331, "epoch": 1245, "val_loss": 66215.0390625} {"train_loss": -5.828910827636719, "global_step": 52332, "epoch": 1246} {"train_loss": -5.791214466094971, "global_step": 52333, "epoch": 1246} {"train_loss": -5.832357406616211, "global_step": 52334, "epoch": 1246} {"train_loss": -5.807707786560059, "global_step": 52335, "epoch": 1246} {"train_loss": -5.740785598754883, "global_step": 52336, "epoch": 1246} {"train_loss": -5.698432922363281, "global_step": 52337, "epoch": 1246} {"train_loss": -5.856409072875977, "global_step": 52338, "epoch": 1246} {"train_loss": -5.683405876159668, "global_step": 52339, "epoch": 1246} {"train_loss": -5.964554786682129, "global_step": 52340, "epoch": 1246} {"train_loss": -5.7176103591918945, "global_step": 52341, "epoch": 1246} {"train_loss": -5.7431640625, "global_step": 52342, "epoch": 1246} {"train_loss": -5.9177703857421875, "global_step": 52343, "epoch": 1246} {"train_loss": -5.681073188781738, "global_step": 52344, "epoch": 1246} {"train_loss": -5.862532615661621, "global_step": 52345, "epoch": 1246} {"train_loss": -5.96232271194458, "global_step": 52346, "epoch": 1246} {"train_loss": -5.737536907196045, "global_step": 52347, "epoch": 1246} {"train_loss": -5.643412113189697, "global_step": 52348, "epoch": 1246} {"train_loss": -5.865941047668457, "global_step": 52349, "epoch": 1246} {"train_loss": -5.843145370483398, "global_step": 52350, "epoch": 1246} {"train_loss": -5.678134918212891, "global_step": 52351, "epoch": 1246} {"train_loss": -5.635573387145996, "global_step": 52352, "epoch": 1246} {"train_loss": -5.864789009094238, "global_step": 52353, "epoch": 1246} {"train_loss": -5.800726890563965, "global_step": 52354, "epoch": 1246} {"train_loss": -5.783231735229492, "global_step": 52355, "epoch": 1246} {"train_loss": -5.814202785491943, "global_step": 52356, "epoch": 1246} {"train_loss": -5.839394569396973, "global_step": 52357, "epoch": 1246} {"train_loss": -5.951675891876221, "global_step": 52358, "epoch": 1246} {"train_loss": -5.746551990509033, "global_step": 52359, "epoch": 1246} {"train_loss": -5.8941731452941895, "global_step": 52360, "epoch": 1246} {"train_loss": -5.809183120727539, "global_step": 52361, "epoch": 1246} {"train_loss": -5.716821670532227, "global_step": 52362, "epoch": 1246} {"train_loss": -5.778826713562012, "global_step": 52363, "epoch": 1246} {"train_loss": -5.740536689758301, "global_step": 52364, "epoch": 1246} {"train_loss": -5.8422322273254395, "global_step": 52365, "epoch": 1246} {"train_loss": -5.812217712402344, "global_step": 52366, "epoch": 1246} {"train_loss": -5.596174240112305, "global_step": 52367, "epoch": 1246} {"train_loss": -5.576114654541016, "global_step": 52368, "epoch": 1246} {"train_loss": -5.825253009796143, "global_step": 52369, "epoch": 1246} {"train_loss": -5.774359703063965, "global_step": 52370, "epoch": 1246} {"train_loss": -5.737443923950195, "global_step": 52371, "epoch": 1246} {"train_loss": -5.667375564575195, "global_step": 52372, "epoch": 1246} {"train_loss": -5.780188117708478, "global_step": 52373, "epoch": 1246, "val_loss": 66181.2890625} {"train_loss": -5.7246904373168945, "global_step": 52374, "epoch": 1247} {"train_loss": -5.816680431365967, "global_step": 52375, "epoch": 1247} {"train_loss": -5.820190906524658, "global_step": 52376, "epoch": 1247} {"train_loss": -5.794672966003418, "global_step": 52377, "epoch": 1247} {"train_loss": -5.7323994636535645, "global_step": 52378, "epoch": 1247} {"train_loss": -5.715635299682617, "global_step": 52379, "epoch": 1247} {"train_loss": -5.887094974517822, "global_step": 52380, "epoch": 1247} {"train_loss": -5.6726274490356445, "global_step": 52381, "epoch": 1247} {"train_loss": -5.818268775939941, "global_step": 52382, "epoch": 1247} {"train_loss": -5.853304862976074, "global_step": 52383, "epoch": 1247} {"train_loss": -5.7930006980896, "global_step": 52384, "epoch": 1247} {"train_loss": -5.637053489685059, "global_step": 52385, "epoch": 1247} {"train_loss": -5.862025737762451, "global_step": 52386, "epoch": 1247} {"train_loss": -5.764977931976318, "global_step": 52387, "epoch": 1247} {"train_loss": -5.827980041503906, "global_step": 52388, "epoch": 1247} {"train_loss": -5.781888961791992, "global_step": 52389, "epoch": 1247} {"train_loss": -5.7832489013671875, "global_step": 52390, "epoch": 1247} {"train_loss": -5.8442769050598145, "global_step": 52391, "epoch": 1247} {"train_loss": -5.858911037445068, "global_step": 52392, "epoch": 1247} {"train_loss": -5.783313751220703, "global_step": 52393, "epoch": 1247} {"train_loss": -5.687694549560547, "global_step": 52394, "epoch": 1247} {"train_loss": -5.8610429763793945, "global_step": 52395, "epoch": 1247} {"train_loss": -5.7888383865356445, "global_step": 52396, "epoch": 1247} {"train_loss": -5.640944957733154, "global_step": 52397, "epoch": 1247} {"train_loss": -5.8346405029296875, "global_step": 52398, "epoch": 1247} {"train_loss": -5.890039920806885, "global_step": 52399, "epoch": 1247} {"train_loss": -5.8566083908081055, "global_step": 52400, "epoch": 1247} {"train_loss": -5.756114959716797, "global_step": 52401, "epoch": 1247} {"train_loss": -5.836917877197266, "global_step": 52402, "epoch": 1247} {"train_loss": -5.727701663970947, "global_step": 52403, "epoch": 1247} {"train_loss": -5.877937316894531, "global_step": 52404, "epoch": 1247} {"train_loss": -5.927265167236328, "global_step": 52405, "epoch": 1247} {"train_loss": -5.780901908874512, "global_step": 52406, "epoch": 1247} {"train_loss": -5.850947380065918, "global_step": 52407, "epoch": 1247} {"train_loss": -5.9434919357299805, "global_step": 52408, "epoch": 1247} {"train_loss": -5.709536075592041, "global_step": 52409, "epoch": 1247} {"train_loss": -5.821011066436768, "global_step": 52410, "epoch": 1247} {"train_loss": -5.694978713989258, "global_step": 52411, "epoch": 1247} {"train_loss": -5.783548831939697, "global_step": 52412, "epoch": 1247} {"train_loss": -5.740551471710205, "global_step": 52413, "epoch": 1247} {"train_loss": -5.768037796020508, "global_step": 52414, "epoch": 1247} {"train_loss": -5.792827980858939, "global_step": 52415, "epoch": 1247, "val_loss": 66421.3671875} {"train_loss": -5.8774824142456055, "global_step": 52416, "epoch": 1248} {"train_loss": -5.782110214233398, "global_step": 52417, "epoch": 1248} {"train_loss": -5.788132190704346, "global_step": 52418, "epoch": 1248} {"train_loss": -5.818381309509277, "global_step": 52419, "epoch": 1248} {"train_loss": -5.740683555603027, "global_step": 52420, "epoch": 1248} {"train_loss": -5.869635581970215, "global_step": 52421, "epoch": 1248} {"train_loss": -5.841801643371582, "global_step": 52422, "epoch": 1248} {"train_loss": -5.795904159545898, "global_step": 52423, "epoch": 1248} {"train_loss": -5.745543479919434, "global_step": 52424, "epoch": 1248} {"train_loss": -5.785367012023926, "global_step": 52425, "epoch": 1248} {"train_loss": -5.7266845703125, "global_step": 52426, "epoch": 1248} {"train_loss": -5.900280952453613, "global_step": 52427, "epoch": 1248} {"train_loss": -5.76904296875, "global_step": 52428, "epoch": 1248} {"train_loss": -5.746311187744141, "global_step": 52429, "epoch": 1248} {"train_loss": -5.860355854034424, "global_step": 52430, "epoch": 1248} {"train_loss": -5.734424591064453, "global_step": 52431, "epoch": 1248} {"train_loss": -5.766218662261963, "global_step": 52432, "epoch": 1248} {"train_loss": -5.673005104064941, "global_step": 52433, "epoch": 1248} {"train_loss": -5.831083297729492, "global_step": 52434, "epoch": 1248} {"train_loss": -5.758209228515625, "global_step": 52435, "epoch": 1248} {"train_loss": -5.88438606262207, "global_step": 52436, "epoch": 1248} {"train_loss": -5.906435966491699, "global_step": 52437, "epoch": 1248} {"train_loss": -5.756381034851074, "global_step": 52438, "epoch": 1248} {"train_loss": -5.740602016448975, "global_step": 52439, "epoch": 1248} {"train_loss": -5.832797050476074, "global_step": 52440, "epoch": 1248} {"train_loss": -5.813309669494629, "global_step": 52441, "epoch": 1248} {"train_loss": -5.810555934906006, "global_step": 52442, "epoch": 1248} {"train_loss": -5.84978723526001, "global_step": 52443, "epoch": 1248} {"train_loss": -5.831958770751953, "global_step": 52444, "epoch": 1248} {"train_loss": -5.809673309326172, "global_step": 52445, "epoch": 1248} {"train_loss": -5.850849628448486, "global_step": 52446, "epoch": 1248} {"train_loss": -5.844461441040039, "global_step": 52447, "epoch": 1248} {"train_loss": -5.759880542755127, "global_step": 52448, "epoch": 1248} {"train_loss": -5.791419982910156, "global_step": 52449, "epoch": 1248} {"train_loss": -5.719498634338379, "global_step": 52450, "epoch": 1248} {"train_loss": -5.688718795776367, "global_step": 52451, "epoch": 1248} {"train_loss": -5.80271053314209, "global_step": 52452, "epoch": 1248} {"train_loss": -5.8689141273498535, "global_step": 52453, "epoch": 1248} {"train_loss": -5.762407302856445, "global_step": 52454, "epoch": 1248} {"train_loss": -5.805939197540283, "global_step": 52455, "epoch": 1248} {"train_loss": -5.7133989334106445, "global_step": 52456, "epoch": 1248} {"train_loss": -5.797606763385591, "global_step": 52457, "epoch": 1248, "val_loss": 66269.765625} {"train_loss": -5.894157409667969, "global_step": 52458, "epoch": 1249} {"train_loss": -5.776512622833252, "global_step": 52459, "epoch": 1249} {"train_loss": -5.753269195556641, "global_step": 52460, "epoch": 1249} {"train_loss": -5.87769889831543, "global_step": 52461, "epoch": 1249} {"train_loss": -5.708599090576172, "global_step": 52462, "epoch": 1249} {"train_loss": -5.63079833984375, "global_step": 52463, "epoch": 1249} {"train_loss": -5.800841331481934, "global_step": 52464, "epoch": 1249} {"train_loss": -5.904018878936768, "global_step": 52465, "epoch": 1249} {"train_loss": -5.87876033782959, "global_step": 52466, "epoch": 1249} {"train_loss": -5.838254451751709, "global_step": 52467, "epoch": 1249} {"train_loss": -5.795102119445801, "global_step": 52468, "epoch": 1249} {"train_loss": -5.928523063659668, "global_step": 52469, "epoch": 1249} {"train_loss": -5.776848316192627, "global_step": 52470, "epoch": 1249} {"train_loss": -5.768348693847656, "global_step": 52471, "epoch": 1249} {"train_loss": -5.81965970993042, "global_step": 52472, "epoch": 1249} {"train_loss": -5.848594665527344, "global_step": 52473, "epoch": 1249} {"train_loss": -5.89620304107666, "global_step": 52474, "epoch": 1249} {"train_loss": -5.710590839385986, "global_step": 52475, "epoch": 1249} {"train_loss": -5.692129611968994, "global_step": 52476, "epoch": 1249} {"train_loss": -5.787407875061035, "global_step": 52477, "epoch": 1249} {"train_loss": -5.765900611877441, "global_step": 52478, "epoch": 1249} {"train_loss": -5.853045463562012, "global_step": 52479, "epoch": 1249} {"train_loss": -5.651629447937012, "global_step": 52480, "epoch": 1249} {"train_loss": -5.705859184265137, "global_step": 52481, "epoch": 1249} {"train_loss": -5.776570796966553, "global_step": 52482, "epoch": 1249} {"train_loss": -5.8178019523620605, "global_step": 52483, "epoch": 1249} {"train_loss": -5.7826457023620605, "global_step": 52484, "epoch": 1249} {"train_loss": -5.792510986328125, "global_step": 52485, "epoch": 1249} {"train_loss": -5.769084930419922, "global_step": 52486, "epoch": 1249} {"train_loss": -5.781886100769043, "global_step": 52487, "epoch": 1249} {"train_loss": -5.937398433685303, "global_step": 52488, "epoch": 1249} {"train_loss": -5.754913330078125, "global_step": 52489, "epoch": 1249} {"train_loss": -5.666165351867676, "global_step": 52490, "epoch": 1249} {"train_loss": -5.766099452972412, "global_step": 52491, "epoch": 1249} {"train_loss": -5.771503925323486, "global_step": 52492, "epoch": 1249} {"train_loss": -5.855513572692871, "global_step": 52493, "epoch": 1249} {"train_loss": -5.752261161804199, "global_step": 52494, "epoch": 1249} {"train_loss": -5.842491149902344, "global_step": 52495, "epoch": 1249} {"train_loss": -5.674954414367676, "global_step": 52496, "epoch": 1249} {"train_loss": -5.829118728637695, "global_step": 52497, "epoch": 1249} {"train_loss": -5.840374946594238, "global_step": 52498, "epoch": 1249} {"train_loss": -5.793296269008091, "global_step": 52499, "epoch": 1249, "val_loss": 66251.4921875} {"train_loss": -5.875165939331055, "global_step": 52500, "epoch": 1250} {"train_loss": -5.751572608947754, "global_step": 52501, "epoch": 1250} {"train_loss": -5.825260162353516, "global_step": 52502, "epoch": 1250} {"train_loss": -5.735304832458496, "global_step": 52503, "epoch": 1250} {"train_loss": -5.77789306640625, "global_step": 52504, "epoch": 1250} {"train_loss": -5.781833648681641, "global_step": 52505, "epoch": 1250} {"train_loss": -5.8423919677734375, "global_step": 52506, "epoch": 1250} {"train_loss": -5.651669502258301, "global_step": 52507, "epoch": 1250} {"train_loss": -5.709901332855225, "global_step": 52508, "epoch": 1250} {"train_loss": -5.904419898986816, "global_step": 52509, "epoch": 1250} {"train_loss": -5.699767112731934, "global_step": 52510, "epoch": 1250} {"train_loss": -5.783403396606445, "global_step": 52511, "epoch": 1250} {"train_loss": -5.8373260498046875, "global_step": 52512, "epoch": 1250} {"train_loss": -5.71071195602417, "global_step": 52513, "epoch": 1250} {"train_loss": -5.881872653961182, "global_step": 52514, "epoch": 1250} {"train_loss": -5.802447319030762, "global_step": 52515, "epoch": 1250} {"train_loss": -5.690337181091309, "global_step": 52516, "epoch": 1250} {"train_loss": -5.79223108291626, "global_step": 52517, "epoch": 1250} {"train_loss": -5.795714378356934, "global_step": 52518, "epoch": 1250} {"train_loss": -5.653352737426758, "global_step": 52519, "epoch": 1250} {"train_loss": -5.666404724121094, "global_step": 52520, "epoch": 1250} {"train_loss": -5.840508937835693, "global_step": 52521, "epoch": 1250} {"train_loss": -5.788202285766602, "global_step": 52522, "epoch": 1250} {"train_loss": -5.726775169372559, "global_step": 52523, "epoch": 1250} {"train_loss": -5.8227338790893555, "global_step": 52524, "epoch": 1250} {"train_loss": -5.813262462615967, "global_step": 52525, "epoch": 1250} {"train_loss": -5.871971130371094, "global_step": 52526, "epoch": 1250} {"train_loss": -5.711539268493652, "global_step": 52527, "epoch": 1250} {"train_loss": -5.885320663452148, "global_step": 52528, "epoch": 1250} {"train_loss": -5.734365940093994, "global_step": 52529, "epoch": 1250} {"train_loss": -5.782085418701172, "global_step": 52530, "epoch": 1250} {"train_loss": -5.790462017059326, "global_step": 52531, "epoch": 1250} {"train_loss": -5.754622459411621, "global_step": 52532, "epoch": 1250} {"train_loss": -5.753552436828613, "global_step": 52533, "epoch": 1250} {"train_loss": -5.728496551513672, "global_step": 52534, "epoch": 1250} {"train_loss": -5.719791889190674, "global_step": 52535, "epoch": 1250} {"train_loss": -5.805424690246582, "global_step": 52536, "epoch": 1250} {"train_loss": -5.758985996246338, "global_step": 52537, "epoch": 1250} {"train_loss": -5.84129524230957, "global_step": 52538, "epoch": 1250} {"train_loss": -5.768532752990723, "global_step": 52539, "epoch": 1250} {"train_loss": -5.839017868041992, "global_step": 52540, "epoch": 1250} {"train_loss": -5.78033234959557, "global_step": 52541, "epoch": 1250, "train/sim_max_reward_0": 0.35453871186726377, "train/sim_max_reward_1": 0.6925442704647207, "train/sim_max_reward_2": 0.5910171665324633, "train/sim_max_reward_3": 0.15557195061331122, "train/sim_max_reward_4": 0.7193999144492667, "train/sim_max_reward_5": 0.7772489433923425, "test/sim_max_reward_4400000": 0.16853551656667592, "test/sim_max_reward_4400001": 0.9858891407634507, "test/sim_max_reward_4400002": 0.059451365610438525, "test/sim_max_reward_4400003": 0.3390474051105468, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.3910331466782555, "test/sim_max_reward_4400007": 0.03498330996265413, "test/sim_max_reward_4400008": 0.4442722676540384, "test/sim_max_reward_4400009": 0.8459583971401916, "test/sim_max_reward_4400010": 0.330732489704575, "test/sim_max_reward_4400011": 0.6456453907579311, "test/sim_max_reward_4400012": 0.5875470789169269, "test/sim_max_reward_4400013": 0.9261489761374847, "test/sim_max_reward_4400014": 0.35705673938693283, "test/sim_max_reward_4400015": 0.04070016707503623, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.25246228681781846, "test/sim_max_reward_4400019": 0.23903933423800855, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5635955369855662, "test/sim_max_reward_4400022": 0.32837301495773563, "test/sim_max_reward_4400023": 0.8156682232093764, "test/sim_max_reward_4400024": 0.7952705822527263, "test/sim_max_reward_4400025": 0.18858331624988606, "test/sim_max_reward_4400026": 0.8724594184414425, "test/sim_max_reward_4400027": 0.05599891194786263, "test/sim_max_reward_4400028": 0.3367554981515191, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.8569497726845409, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.14196012997700613, "test/sim_max_reward_4400033": 0.21117149297352053, "test/sim_max_reward_4400034": 0.7043053244976262, "test/sim_max_reward_4400035": 0.5156512962890539, "test/sim_max_reward_4400036": 0.8342372546984788, "test/sim_max_reward_4400037": 0.9629495343033793, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9605500291754725, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9903678782675042, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.018484777889960603, "test/sim_max_reward_4400044": 0.9250403042149902, "test/sim_max_reward_4400045": 0.8659822335818002, "test/sim_max_reward_4400046": 0.2206009670142948, "test/sim_max_reward_4400047": 0.9292169100865028, "test/sim_max_reward_4400048": 0.12424750580898904, "test/sim_max_reward_4400049": 0.9423918127842549, "train/mean_score": 0.5483868262198948, "test/mean_score": 0.4596134563958193, "val_loss": 66351.0546875} {"train_loss": -5.8374223709106445, "global_step": 52542, "epoch": 1251} {"train_loss": -5.736663818359375, "global_step": 52543, "epoch": 1251} {"train_loss": -5.905117988586426, "global_step": 52544, "epoch": 1251} {"train_loss": -5.866556644439697, "global_step": 52545, "epoch": 1251} {"train_loss": -5.827583312988281, "global_step": 52546, "epoch": 1251} {"train_loss": -5.791624546051025, "global_step": 52547, "epoch": 1251} {"train_loss": -5.762117385864258, "global_step": 52548, "epoch": 1251} {"train_loss": -5.82387638092041, "global_step": 52549, "epoch": 1251} {"train_loss": -5.876029014587402, "global_step": 52550, "epoch": 1251} {"train_loss": -5.772368907928467, "global_step": 52551, "epoch": 1251} {"train_loss": -5.702567100524902, "global_step": 52552, "epoch": 1251} {"train_loss": -5.776875972747803, "global_step": 52553, "epoch": 1251} {"train_loss": -5.713577747344971, "global_step": 52554, "epoch": 1251} {"train_loss": -5.715086936950684, "global_step": 52555, "epoch": 1251} {"train_loss": -5.550658226013184, "global_step": 52556, "epoch": 1251} {"train_loss": -5.807755470275879, "global_step": 52557, "epoch": 1251} {"train_loss": -5.757858753204346, "global_step": 52558, "epoch": 1251} {"train_loss": -5.727930068969727, "global_step": 52559, "epoch": 1251} {"train_loss": -5.852306365966797, "global_step": 52560, "epoch": 1251} {"train_loss": -5.758588790893555, "global_step": 52561, "epoch": 1251} {"train_loss": -5.804821014404297, "global_step": 52562, "epoch": 1251} {"train_loss": -5.828909397125244, "global_step": 52563, "epoch": 1251} {"train_loss": -5.709100723266602, "global_step": 52564, "epoch": 1251} {"train_loss": -5.79200553894043, "global_step": 52565, "epoch": 1251} {"train_loss": -5.759486198425293, "global_step": 52566, "epoch": 1251} {"train_loss": -5.797760963439941, "global_step": 52567, "epoch": 1251} {"train_loss": -5.775003433227539, "global_step": 52568, "epoch": 1251} {"train_loss": -5.8181633949279785, "global_step": 52569, "epoch": 1251} {"train_loss": -5.819553375244141, "global_step": 52570, "epoch": 1251} {"train_loss": -5.742456436157227, "global_step": 52571, "epoch": 1251} {"train_loss": -5.952398777008057, "global_step": 52572, "epoch": 1251} {"train_loss": -5.912837982177734, "global_step": 52573, "epoch": 1251} {"train_loss": -5.915073394775391, "global_step": 52574, "epoch": 1251} {"train_loss": -5.809536933898926, "global_step": 52575, "epoch": 1251} {"train_loss": -5.815060615539551, "global_step": 52576, "epoch": 1251} {"train_loss": -5.868215560913086, "global_step": 52577, "epoch": 1251} {"train_loss": -5.811964988708496, "global_step": 52578, "epoch": 1251} {"train_loss": -5.791750907897949, "global_step": 52579, "epoch": 1251} {"train_loss": -5.81581974029541, "global_step": 52580, "epoch": 1251} {"train_loss": -5.7506914138793945, "global_step": 52581, "epoch": 1251} {"train_loss": -5.769224166870117, "global_step": 52582, "epoch": 1251} {"train_loss": -5.799065589904785, "global_step": 52583, "epoch": 1251, "val_loss": 66490.7265625} {"train_loss": -5.708245754241943, "global_step": 52584, "epoch": 1252} {"train_loss": -5.805828094482422, "global_step": 52585, "epoch": 1252} {"train_loss": -5.726700782775879, "global_step": 52586, "epoch": 1252} {"train_loss": -5.807123184204102, "global_step": 52587, "epoch": 1252} {"train_loss": -5.7615885734558105, "global_step": 52588, "epoch": 1252} {"train_loss": -5.596269607543945, "global_step": 52589, "epoch": 1252} {"train_loss": -5.728965759277344, "global_step": 52590, "epoch": 1252} {"train_loss": -5.819217681884766, "global_step": 52591, "epoch": 1252} {"train_loss": -5.802585124969482, "global_step": 52592, "epoch": 1252} {"train_loss": -5.765839576721191, "global_step": 52593, "epoch": 1252} {"train_loss": -5.7923264503479, "global_step": 52594, "epoch": 1252} {"train_loss": -5.855686664581299, "global_step": 52595, "epoch": 1252} {"train_loss": -5.86747932434082, "global_step": 52596, "epoch": 1252} {"train_loss": -5.75869083404541, "global_step": 52597, "epoch": 1252} {"train_loss": -5.870046615600586, "global_step": 52598, "epoch": 1252} {"train_loss": -5.811171054840088, "global_step": 52599, "epoch": 1252} {"train_loss": -5.639848232269287, "global_step": 52600, "epoch": 1252} {"train_loss": -5.6737565994262695, "global_step": 52601, "epoch": 1252} {"train_loss": -5.577070236206055, "global_step": 52602, "epoch": 1252} {"train_loss": -5.823835849761963, "global_step": 52603, "epoch": 1252} {"train_loss": -5.793902397155762, "global_step": 52604, "epoch": 1252} {"train_loss": -5.837185859680176, "global_step": 52605, "epoch": 1252} {"train_loss": -5.861359596252441, "global_step": 52606, "epoch": 1252} {"train_loss": -5.716373443603516, "global_step": 52607, "epoch": 1252} {"train_loss": -5.712615013122559, "global_step": 52608, "epoch": 1252} {"train_loss": -5.794760704040527, "global_step": 52609, "epoch": 1252} {"train_loss": -5.736055850982666, "global_step": 52610, "epoch": 1252} {"train_loss": -5.766523361206055, "global_step": 52611, "epoch": 1252} {"train_loss": -5.830671787261963, "global_step": 52612, "epoch": 1252} {"train_loss": -5.88800048828125, "global_step": 52613, "epoch": 1252} {"train_loss": -5.840404510498047, "global_step": 52614, "epoch": 1252} {"train_loss": -5.953574180603027, "global_step": 52615, "epoch": 1252} {"train_loss": -5.826225280761719, "global_step": 52616, "epoch": 1252} {"train_loss": -5.833798408508301, "global_step": 52617, "epoch": 1252} {"train_loss": -5.85332727432251, "global_step": 52618, "epoch": 1252} {"train_loss": -5.768371105194092, "global_step": 52619, "epoch": 1252} {"train_loss": -5.7333083152771, "global_step": 52620, "epoch": 1252} {"train_loss": -5.739192962646484, "global_step": 52621, "epoch": 1252} {"train_loss": -5.583625793457031, "global_step": 52622, "epoch": 1252} {"train_loss": -5.773434638977051, "global_step": 52623, "epoch": 1252} {"train_loss": -5.6576080322265625, "global_step": 52624, "epoch": 1252} {"train_loss": -5.771191506158738, "global_step": 52625, "epoch": 1252, "val_loss": 66470.8984375} {"train_loss": -5.797574996948242, "global_step": 52626, "epoch": 1253} {"train_loss": -5.708898067474365, "global_step": 52627, "epoch": 1253} {"train_loss": -5.643677711486816, "global_step": 52628, "epoch": 1253} {"train_loss": -5.67262601852417, "global_step": 52629, "epoch": 1253} {"train_loss": -5.702000617980957, "global_step": 52630, "epoch": 1253} {"train_loss": -5.762038707733154, "global_step": 52631, "epoch": 1253} {"train_loss": -5.811042785644531, "global_step": 52632, "epoch": 1253} {"train_loss": -5.784380912780762, "global_step": 52633, "epoch": 1253} {"train_loss": -5.853372573852539, "global_step": 52634, "epoch": 1253} {"train_loss": -5.788548469543457, "global_step": 52635, "epoch": 1253} {"train_loss": -5.889304161071777, "global_step": 52636, "epoch": 1253} {"train_loss": -5.823337554931641, "global_step": 52637, "epoch": 1253} {"train_loss": -5.749988555908203, "global_step": 52638, "epoch": 1253} {"train_loss": -5.849458694458008, "global_step": 52639, "epoch": 1253} {"train_loss": -5.687309741973877, "global_step": 52640, "epoch": 1253} {"train_loss": -5.802708625793457, "global_step": 52641, "epoch": 1253} {"train_loss": -5.733258247375488, "global_step": 52642, "epoch": 1253} {"train_loss": -5.838580131530762, "global_step": 52643, "epoch": 1253} {"train_loss": -5.797292709350586, "global_step": 52644, "epoch": 1253} {"train_loss": -5.710297584533691, "global_step": 52645, "epoch": 1253} {"train_loss": -5.778521537780762, "global_step": 52646, "epoch": 1253} {"train_loss": -5.833295822143555, "global_step": 52647, "epoch": 1253} {"train_loss": -5.864673614501953, "global_step": 52648, "epoch": 1253} {"train_loss": -5.67466926574707, "global_step": 52649, "epoch": 1253} {"train_loss": -5.737794876098633, "global_step": 52650, "epoch": 1253} {"train_loss": -5.691267967224121, "global_step": 52651, "epoch": 1253} {"train_loss": -5.82338809967041, "global_step": 52652, "epoch": 1253} {"train_loss": -5.88068962097168, "global_step": 52653, "epoch": 1253} {"train_loss": -5.691867828369141, "global_step": 52654, "epoch": 1253} {"train_loss": -5.91880464553833, "global_step": 52655, "epoch": 1253} {"train_loss": -5.792860507965088, "global_step": 52656, "epoch": 1253} {"train_loss": -5.797222137451172, "global_step": 52657, "epoch": 1253} {"train_loss": -5.736682415008545, "global_step": 52658, "epoch": 1253} {"train_loss": -5.794186115264893, "global_step": 52659, "epoch": 1253} {"train_loss": -5.7697906494140625, "global_step": 52660, "epoch": 1253} {"train_loss": -5.796490669250488, "global_step": 52661, "epoch": 1253} {"train_loss": -5.81178092956543, "global_step": 52662, "epoch": 1253} {"train_loss": -5.8815765380859375, "global_step": 52663, "epoch": 1253} {"train_loss": -5.805905818939209, "global_step": 52664, "epoch": 1253} {"train_loss": -5.747296333312988, "global_step": 52665, "epoch": 1253} {"train_loss": -5.809926986694336, "global_step": 52666, "epoch": 1253} {"train_loss": -5.780454919451759, "global_step": 52667, "epoch": 1253, "val_loss": 66642.5078125} {"train_loss": -5.82204532623291, "global_step": 52668, "epoch": 1254} {"train_loss": -5.668649196624756, "global_step": 52669, "epoch": 1254} {"train_loss": -5.744586944580078, "global_step": 52670, "epoch": 1254} {"train_loss": -5.870049476623535, "global_step": 52671, "epoch": 1254} {"train_loss": -5.847262382507324, "global_step": 52672, "epoch": 1254} {"train_loss": -5.832726955413818, "global_step": 52673, "epoch": 1254} {"train_loss": -5.836174964904785, "global_step": 52674, "epoch": 1254} {"train_loss": -5.732335090637207, "global_step": 52675, "epoch": 1254} {"train_loss": -5.867208957672119, "global_step": 52676, "epoch": 1254} {"train_loss": -5.665234565734863, "global_step": 52677, "epoch": 1254} {"train_loss": -5.674226760864258, "global_step": 52678, "epoch": 1254} {"train_loss": -5.861484527587891, "global_step": 52679, "epoch": 1254} {"train_loss": -5.672848701477051, "global_step": 52680, "epoch": 1254} {"train_loss": -5.641563415527344, "global_step": 52681, "epoch": 1254} {"train_loss": -5.801565170288086, "global_step": 52682, "epoch": 1254} {"train_loss": -5.616586685180664, "global_step": 52683, "epoch": 1254} {"train_loss": -5.737921714782715, "global_step": 52684, "epoch": 1254} {"train_loss": -5.836978435516357, "global_step": 52685, "epoch": 1254} {"train_loss": -5.7551350593566895, "global_step": 52686, "epoch": 1254} {"train_loss": -5.857756614685059, "global_step": 52687, "epoch": 1254} {"train_loss": -5.77474308013916, "global_step": 52688, "epoch": 1254} {"train_loss": -5.750041961669922, "global_step": 52689, "epoch": 1254} {"train_loss": -5.785172939300537, "global_step": 52690, "epoch": 1254} {"train_loss": -5.844901084899902, "global_step": 52691, "epoch": 1254} {"train_loss": -5.642455577850342, "global_step": 52692, "epoch": 1254} {"train_loss": -5.8563690185546875, "global_step": 52693, "epoch": 1254} {"train_loss": -5.724311351776123, "global_step": 52694, "epoch": 1254} {"train_loss": -5.7749128341674805, "global_step": 52695, "epoch": 1254} {"train_loss": -5.755537986755371, "global_step": 52696, "epoch": 1254} {"train_loss": -5.7823686599731445, "global_step": 52697, "epoch": 1254} {"train_loss": -5.7835588455200195, "global_step": 52698, "epoch": 1254} {"train_loss": -5.873380661010742, "global_step": 52699, "epoch": 1254} {"train_loss": -5.803940773010254, "global_step": 52700, "epoch": 1254} {"train_loss": -5.754517078399658, "global_step": 52701, "epoch": 1254} {"train_loss": -5.824288845062256, "global_step": 52702, "epoch": 1254} {"train_loss": -5.805675506591797, "global_step": 52703, "epoch": 1254} {"train_loss": -5.939038276672363, "global_step": 52704, "epoch": 1254} {"train_loss": -5.848296642303467, "global_step": 52705, "epoch": 1254} {"train_loss": -5.8909406661987305, "global_step": 52706, "epoch": 1254} {"train_loss": -5.736781120300293, "global_step": 52707, "epoch": 1254} {"train_loss": -5.779471397399902, "global_step": 52708, "epoch": 1254} {"train_loss": -5.783226580846877, "global_step": 52709, "epoch": 1254, "val_loss": 66255.6484375} {"train_loss": -5.757046222686768, "global_step": 52710, "epoch": 1255} {"train_loss": -5.830511093139648, "global_step": 52711, "epoch": 1255} {"train_loss": -5.8872575759887695, "global_step": 52712, "epoch": 1255} {"train_loss": -5.816871643066406, "global_step": 52713, "epoch": 1255} {"train_loss": -5.738553047180176, "global_step": 52714, "epoch": 1255} {"train_loss": -5.721837997436523, "global_step": 52715, "epoch": 1255} {"train_loss": -5.679952621459961, "global_step": 52716, "epoch": 1255} {"train_loss": -5.719344139099121, "global_step": 52717, "epoch": 1255} {"train_loss": -5.654215335845947, "global_step": 52718, "epoch": 1255} {"train_loss": -5.79982328414917, "global_step": 52719, "epoch": 1255} {"train_loss": -5.830862045288086, "global_step": 52720, "epoch": 1255} {"train_loss": -5.706812381744385, "global_step": 52721, "epoch": 1255} {"train_loss": -5.748645305633545, "global_step": 52722, "epoch": 1255} {"train_loss": -5.616273403167725, "global_step": 52723, "epoch": 1255} {"train_loss": -5.8173112869262695, "global_step": 52724, "epoch": 1255} {"train_loss": -5.564983367919922, "global_step": 52725, "epoch": 1255} {"train_loss": -5.646604537963867, "global_step": 52726, "epoch": 1255} {"train_loss": -5.77691125869751, "global_step": 52727, "epoch": 1255} {"train_loss": -5.583083629608154, "global_step": 52728, "epoch": 1255} {"train_loss": -5.625590801239014, "global_step": 52729, "epoch": 1255} {"train_loss": -5.763731002807617, "global_step": 52730, "epoch": 1255} {"train_loss": -5.800202369689941, "global_step": 52731, "epoch": 1255} {"train_loss": -5.729546546936035, "global_step": 52732, "epoch": 1255} {"train_loss": -5.710354804992676, "global_step": 52733, "epoch": 1255} {"train_loss": -5.7698564529418945, "global_step": 52734, "epoch": 1255} {"train_loss": -5.868937969207764, "global_step": 52735, "epoch": 1255} {"train_loss": -5.736810684204102, "global_step": 52736, "epoch": 1255} {"train_loss": -5.819464683532715, "global_step": 52737, "epoch": 1255} {"train_loss": -5.730024337768555, "global_step": 52738, "epoch": 1255} {"train_loss": -5.839535713195801, "global_step": 52739, "epoch": 1255} {"train_loss": -5.903005599975586, "global_step": 52740, "epoch": 1255} {"train_loss": -5.80555534362793, "global_step": 52741, "epoch": 1255} {"train_loss": -5.793270111083984, "global_step": 52742, "epoch": 1255} {"train_loss": -5.702073097229004, "global_step": 52743, "epoch": 1255} {"train_loss": -5.768655300140381, "global_step": 52744, "epoch": 1255} {"train_loss": -5.822697639465332, "global_step": 52745, "epoch": 1255} {"train_loss": -5.682277679443359, "global_step": 52746, "epoch": 1255} {"train_loss": -5.845104217529297, "global_step": 52747, "epoch": 1255} {"train_loss": -5.853510856628418, "global_step": 52748, "epoch": 1255} {"train_loss": -5.7620720863342285, "global_step": 52749, "epoch": 1255} {"train_loss": -5.811468124389648, "global_step": 52750, "epoch": 1255} {"train_loss": -5.757341782251994, "global_step": 52751, "epoch": 1255, "val_loss": 66346.578125} {"train_loss": -5.80260705947876, "global_step": 52752, "epoch": 1256} {"train_loss": -5.804980278015137, "global_step": 52753, "epoch": 1256} {"train_loss": -5.792220115661621, "global_step": 52754, "epoch": 1256} {"train_loss": -5.926953315734863, "global_step": 52755, "epoch": 1256} {"train_loss": -5.856530666351318, "global_step": 52756, "epoch": 1256} {"train_loss": -5.815552711486816, "global_step": 52757, "epoch": 1256} {"train_loss": -5.7907867431640625, "global_step": 52758, "epoch": 1256} {"train_loss": -5.81221866607666, "global_step": 52759, "epoch": 1256} {"train_loss": -5.788227081298828, "global_step": 52760, "epoch": 1256} {"train_loss": -5.77988862991333, "global_step": 52761, "epoch": 1256} {"train_loss": -5.826883316040039, "global_step": 52762, "epoch": 1256} {"train_loss": -5.753970146179199, "global_step": 52763, "epoch": 1256} {"train_loss": -5.664253234863281, "global_step": 52764, "epoch": 1256} {"train_loss": -5.786269187927246, "global_step": 52765, "epoch": 1256} {"train_loss": -5.710935592651367, "global_step": 52766, "epoch": 1256} {"train_loss": -5.847102165222168, "global_step": 52767, "epoch": 1256} {"train_loss": -5.763956546783447, "global_step": 52768, "epoch": 1256} {"train_loss": -5.751762866973877, "global_step": 52769, "epoch": 1256} {"train_loss": -5.751826286315918, "global_step": 52770, "epoch": 1256} {"train_loss": -5.700991153717041, "global_step": 52771, "epoch": 1256} {"train_loss": -5.661877155303955, "global_step": 52772, "epoch": 1256} {"train_loss": -5.760210037231445, "global_step": 52773, "epoch": 1256} {"train_loss": -5.910580635070801, "global_step": 52774, "epoch": 1256} {"train_loss": -5.768978595733643, "global_step": 52775, "epoch": 1256} {"train_loss": -5.857858657836914, "global_step": 52776, "epoch": 1256} {"train_loss": -5.884252548217773, "global_step": 52777, "epoch": 1256} {"train_loss": -5.751752853393555, "global_step": 52778, "epoch": 1256} {"train_loss": -5.596453666687012, "global_step": 52779, "epoch": 1256} {"train_loss": -5.888363838195801, "global_step": 52780, "epoch": 1256} {"train_loss": -5.76422643661499, "global_step": 52781, "epoch": 1256} {"train_loss": -5.823224067687988, "global_step": 52782, "epoch": 1256} {"train_loss": -5.742727756500244, "global_step": 52783, "epoch": 1256} {"train_loss": -5.750855445861816, "global_step": 52784, "epoch": 1256} {"train_loss": -5.866839408874512, "global_step": 52785, "epoch": 1256} {"train_loss": -5.859505653381348, "global_step": 52786, "epoch": 1256} {"train_loss": -5.6716413497924805, "global_step": 52787, "epoch": 1256} {"train_loss": -5.7065629959106445, "global_step": 52788, "epoch": 1256} {"train_loss": -5.727776050567627, "global_step": 52789, "epoch": 1256} {"train_loss": -5.740664482116699, "global_step": 52790, "epoch": 1256} {"train_loss": -5.770926475524902, "global_step": 52791, "epoch": 1256} {"train_loss": -5.896074295043945, "global_step": 52792, "epoch": 1256} {"train_loss": -5.783094894318354, "global_step": 52793, "epoch": 1256, "val_loss": 66236.3203125} {"train_loss": -5.832551956176758, "global_step": 52794, "epoch": 1257} {"train_loss": -5.781155586242676, "global_step": 52795, "epoch": 1257} {"train_loss": -5.663322448730469, "global_step": 52796, "epoch": 1257} {"train_loss": -5.837948322296143, "global_step": 52797, "epoch": 1257} {"train_loss": -5.79247522354126, "global_step": 52798, "epoch": 1257} {"train_loss": -5.737773895263672, "global_step": 52799, "epoch": 1257} {"train_loss": -5.766513824462891, "global_step": 52800, "epoch": 1257} {"train_loss": -5.617937088012695, "global_step": 52801, "epoch": 1257} {"train_loss": -5.7456464767456055, "global_step": 52802, "epoch": 1257} {"train_loss": -5.804080009460449, "global_step": 52803, "epoch": 1257} {"train_loss": -5.84418249130249, "global_step": 52804, "epoch": 1257} {"train_loss": -5.704183101654053, "global_step": 52805, "epoch": 1257} {"train_loss": -5.761778831481934, "global_step": 52806, "epoch": 1257} {"train_loss": -5.874363899230957, "global_step": 52807, "epoch": 1257} {"train_loss": -5.836634635925293, "global_step": 52808, "epoch": 1257} {"train_loss": -5.6120734214782715, "global_step": 52809, "epoch": 1257} {"train_loss": -5.807353973388672, "global_step": 52810, "epoch": 1257} {"train_loss": -5.905425548553467, "global_step": 52811, "epoch": 1257} {"train_loss": -5.799630165100098, "global_step": 52812, "epoch": 1257} {"train_loss": -5.80129861831665, "global_step": 52813, "epoch": 1257} {"train_loss": -5.851137638092041, "global_step": 52814, "epoch": 1257} {"train_loss": -5.755519866943359, "global_step": 52815, "epoch": 1257} {"train_loss": -5.8181257247924805, "global_step": 52816, "epoch": 1257} {"train_loss": -5.831252098083496, "global_step": 52817, "epoch": 1257} {"train_loss": -5.885097026824951, "global_step": 52818, "epoch": 1257} {"train_loss": -5.759653091430664, "global_step": 52819, "epoch": 1257} {"train_loss": -5.756254196166992, "global_step": 52820, "epoch": 1257} {"train_loss": -5.77842903137207, "global_step": 52821, "epoch": 1257} {"train_loss": -5.795851707458496, "global_step": 52822, "epoch": 1257} {"train_loss": -5.783539295196533, "global_step": 52823, "epoch": 1257} {"train_loss": -5.8504438400268555, "global_step": 52824, "epoch": 1257} {"train_loss": -5.731387138366699, "global_step": 52825, "epoch": 1257} {"train_loss": -5.892546653747559, "global_step": 52826, "epoch": 1257} {"train_loss": -5.930366516113281, "global_step": 52827, "epoch": 1257} {"train_loss": -5.774705410003662, "global_step": 52828, "epoch": 1257} {"train_loss": -5.809477806091309, "global_step": 52829, "epoch": 1257} {"train_loss": -5.7901740074157715, "global_step": 52830, "epoch": 1257} {"train_loss": -5.780849456787109, "global_step": 52831, "epoch": 1257} {"train_loss": -5.610565185546875, "global_step": 52832, "epoch": 1257} {"train_loss": -5.682340621948242, "global_step": 52833, "epoch": 1257} {"train_loss": -5.885244369506836, "global_step": 52834, "epoch": 1257} {"train_loss": -5.789598078954787, "global_step": 52835, "epoch": 1257, "val_loss": 66255.984375} {"train_loss": -5.846451282501221, "global_step": 52836, "epoch": 1258} {"train_loss": -5.74933385848999, "global_step": 52837, "epoch": 1258} {"train_loss": -5.811423301696777, "global_step": 52838, "epoch": 1258} {"train_loss": -5.846812725067139, "global_step": 52839, "epoch": 1258} {"train_loss": -5.861903190612793, "global_step": 52840, "epoch": 1258} {"train_loss": -5.920330047607422, "global_step": 52841, "epoch": 1258} {"train_loss": -5.801736831665039, "global_step": 52842, "epoch": 1258} {"train_loss": -5.864611625671387, "global_step": 52843, "epoch": 1258} {"train_loss": -5.787453651428223, "global_step": 52844, "epoch": 1258} {"train_loss": -5.837015151977539, "global_step": 52845, "epoch": 1258} {"train_loss": -5.780519962310791, "global_step": 52846, "epoch": 1258} {"train_loss": -5.7053070068359375, "global_step": 52847, "epoch": 1258} {"train_loss": -5.757476329803467, "global_step": 52848, "epoch": 1258} {"train_loss": -5.795536994934082, "global_step": 52849, "epoch": 1258} {"train_loss": -5.762589454650879, "global_step": 52850, "epoch": 1258} {"train_loss": -5.752233505249023, "global_step": 52851, "epoch": 1258} {"train_loss": -5.64251708984375, "global_step": 52852, "epoch": 1258} {"train_loss": -5.904513835906982, "global_step": 52853, "epoch": 1258} {"train_loss": -5.7164201736450195, "global_step": 52854, "epoch": 1258} {"train_loss": -5.732689380645752, "global_step": 52855, "epoch": 1258} {"train_loss": -5.814915657043457, "global_step": 52856, "epoch": 1258} {"train_loss": -5.6951003074646, "global_step": 52857, "epoch": 1258} {"train_loss": -5.7208733558654785, "global_step": 52858, "epoch": 1258} {"train_loss": -5.744211196899414, "global_step": 52859, "epoch": 1258} {"train_loss": -5.814393997192383, "global_step": 52860, "epoch": 1258} {"train_loss": -5.763657093048096, "global_step": 52861, "epoch": 1258} {"train_loss": -5.7329840660095215, "global_step": 52862, "epoch": 1258} {"train_loss": -5.713370323181152, "global_step": 52863, "epoch": 1258} {"train_loss": -5.77699089050293, "global_step": 52864, "epoch": 1258} {"train_loss": -5.7607011795043945, "global_step": 52865, "epoch": 1258} {"train_loss": -5.695253372192383, "global_step": 52866, "epoch": 1258} {"train_loss": -5.667019367218018, "global_step": 52867, "epoch": 1258} {"train_loss": -5.7341532707214355, "global_step": 52868, "epoch": 1258} {"train_loss": -5.951226711273193, "global_step": 52869, "epoch": 1258} {"train_loss": -5.660799026489258, "global_step": 52870, "epoch": 1258} {"train_loss": -5.756949424743652, "global_step": 52871, "epoch": 1258} {"train_loss": -5.781003952026367, "global_step": 52872, "epoch": 1258} {"train_loss": -5.725728988647461, "global_step": 52873, "epoch": 1258} {"train_loss": -5.860295295715332, "global_step": 52874, "epoch": 1258} {"train_loss": -5.744343280792236, "global_step": 52875, "epoch": 1258} {"train_loss": -5.726635932922363, "global_step": 52876, "epoch": 1258} {"train_loss": -5.771116631371634, "global_step": 52877, "epoch": 1258, "val_loss": 66290.875} {"train_loss": -5.701364040374756, "global_step": 52878, "epoch": 1259} {"train_loss": -5.729519844055176, "global_step": 52879, "epoch": 1259} {"train_loss": -5.746502876281738, "global_step": 52880, "epoch": 1259} {"train_loss": -5.832178592681885, "global_step": 52881, "epoch": 1259} {"train_loss": -5.767665863037109, "global_step": 52882, "epoch": 1259} {"train_loss": -5.7729644775390625, "global_step": 52883, "epoch": 1259} {"train_loss": -5.84963321685791, "global_step": 52884, "epoch": 1259} {"train_loss": -5.8496994972229, "global_step": 52885, "epoch": 1259} {"train_loss": -5.832977294921875, "global_step": 52886, "epoch": 1259} {"train_loss": -5.807323455810547, "global_step": 52887, "epoch": 1259} {"train_loss": -5.7533769607543945, "global_step": 52888, "epoch": 1259} {"train_loss": -5.8124189376831055, "global_step": 52889, "epoch": 1259} {"train_loss": -5.732698440551758, "global_step": 52890, "epoch": 1259} {"train_loss": -5.850525856018066, "global_step": 52891, "epoch": 1259} {"train_loss": -5.953923225402832, "global_step": 52892, "epoch": 1259} {"train_loss": -5.762147903442383, "global_step": 52893, "epoch": 1259} {"train_loss": -5.714358329772949, "global_step": 52894, "epoch": 1259} {"train_loss": -5.80792760848999, "global_step": 52895, "epoch": 1259} {"train_loss": -5.820650100708008, "global_step": 52896, "epoch": 1259} {"train_loss": -5.764281272888184, "global_step": 52897, "epoch": 1259} {"train_loss": -5.628992080688477, "global_step": 52898, "epoch": 1259} {"train_loss": -5.803403854370117, "global_step": 52899, "epoch": 1259} {"train_loss": -5.732334136962891, "global_step": 52900, "epoch": 1259} {"train_loss": -5.7365312576293945, "global_step": 52901, "epoch": 1259} {"train_loss": -5.8138275146484375, "global_step": 52902, "epoch": 1259} {"train_loss": -5.747420310974121, "global_step": 52903, "epoch": 1259} {"train_loss": -5.888835906982422, "global_step": 52904, "epoch": 1259} {"train_loss": -5.8196001052856445, "global_step": 52905, "epoch": 1259} {"train_loss": -5.870511054992676, "global_step": 52906, "epoch": 1259} {"train_loss": -5.908783435821533, "global_step": 52907, "epoch": 1259} {"train_loss": -5.733574390411377, "global_step": 52908, "epoch": 1259} {"train_loss": -5.856869220733643, "global_step": 52909, "epoch": 1259} {"train_loss": -5.685449600219727, "global_step": 52910, "epoch": 1259} {"train_loss": -5.708211421966553, "global_step": 52911, "epoch": 1259} {"train_loss": -5.734004020690918, "global_step": 52912, "epoch": 1259} {"train_loss": -5.878949165344238, "global_step": 52913, "epoch": 1259} {"train_loss": -5.790721893310547, "global_step": 52914, "epoch": 1259} {"train_loss": -5.884103775024414, "global_step": 52915, "epoch": 1259} {"train_loss": -5.788796424865723, "global_step": 52916, "epoch": 1259} {"train_loss": -5.882774353027344, "global_step": 52917, "epoch": 1259} {"train_loss": -5.6821675300598145, "global_step": 52918, "epoch": 1259} {"train_loss": -5.791096165066674, "global_step": 52919, "epoch": 1259, "val_loss": 66592.453125} {"train_loss": -5.646479606628418, "global_step": 52920, "epoch": 1260} {"train_loss": -5.642498016357422, "global_step": 52921, "epoch": 1260} {"train_loss": -5.863046169281006, "global_step": 52922, "epoch": 1260} {"train_loss": -5.826536655426025, "global_step": 52923, "epoch": 1260} {"train_loss": -5.780568599700928, "global_step": 52924, "epoch": 1260} {"train_loss": -5.799828052520752, "global_step": 52925, "epoch": 1260} {"train_loss": -5.762966156005859, "global_step": 52926, "epoch": 1260} {"train_loss": -5.753705024719238, "global_step": 52927, "epoch": 1260} {"train_loss": -5.684390068054199, "global_step": 52928, "epoch": 1260} {"train_loss": -5.877579689025879, "global_step": 52929, "epoch": 1260} {"train_loss": -5.832527160644531, "global_step": 52930, "epoch": 1260} {"train_loss": -5.791877746582031, "global_step": 52931, "epoch": 1260} {"train_loss": -5.843775272369385, "global_step": 52932, "epoch": 1260} {"train_loss": -5.762447834014893, "global_step": 52933, "epoch": 1260} {"train_loss": -5.7626729011535645, "global_step": 52934, "epoch": 1260} {"train_loss": -5.784322738647461, "global_step": 52935, "epoch": 1260} {"train_loss": -5.862644195556641, "global_step": 52936, "epoch": 1260} {"train_loss": -5.870680809020996, "global_step": 52937, "epoch": 1260} {"train_loss": -5.824897766113281, "global_step": 52938, "epoch": 1260} {"train_loss": -5.766944408416748, "global_step": 52939, "epoch": 1260} {"train_loss": -5.802415370941162, "global_step": 52940, "epoch": 1260} {"train_loss": -5.798460960388184, "global_step": 52941, "epoch": 1260} {"train_loss": -5.777034282684326, "global_step": 52942, "epoch": 1260} {"train_loss": -5.751922607421875, "global_step": 52943, "epoch": 1260} {"train_loss": -5.817747116088867, "global_step": 52944, "epoch": 1260} {"train_loss": -5.740250587463379, "global_step": 52945, "epoch": 1260} {"train_loss": -5.781795501708984, "global_step": 52946, "epoch": 1260} {"train_loss": -5.844202518463135, "global_step": 52947, "epoch": 1260} {"train_loss": -5.82976770401001, "global_step": 52948, "epoch": 1260} {"train_loss": -5.891556262969971, "global_step": 52949, "epoch": 1260} {"train_loss": -5.944283485412598, "global_step": 52950, "epoch": 1260} {"train_loss": -5.806125164031982, "global_step": 52951, "epoch": 1260} {"train_loss": -5.728243827819824, "global_step": 52952, "epoch": 1260} {"train_loss": -5.8280158042907715, "global_step": 52953, "epoch": 1260} {"train_loss": -5.878026008605957, "global_step": 52954, "epoch": 1260} {"train_loss": -5.8810272216796875, "global_step": 52955, "epoch": 1260} {"train_loss": -5.917907238006592, "global_step": 52956, "epoch": 1260} {"train_loss": -5.793368339538574, "global_step": 52957, "epoch": 1260} {"train_loss": -5.903005599975586, "global_step": 52958, "epoch": 1260} {"train_loss": -5.639321327209473, "global_step": 52959, "epoch": 1260} {"train_loss": -5.821229934692383, "global_step": 52960, "epoch": 1260} {"train_loss": -5.800178414299374, "global_step": 52961, "epoch": 1260, "val_loss": 66346.1640625} {"train_loss": -5.788399696350098, "global_step": 52962, "epoch": 1261} {"train_loss": -5.865183353424072, "global_step": 52963, "epoch": 1261} {"train_loss": -5.7209014892578125, "global_step": 52964, "epoch": 1261} {"train_loss": -5.691493511199951, "global_step": 52965, "epoch": 1261} {"train_loss": -5.8595781326293945, "global_step": 52966, "epoch": 1261} {"train_loss": -5.770023822784424, "global_step": 52967, "epoch": 1261} {"train_loss": -5.593303680419922, "global_step": 52968, "epoch": 1261} {"train_loss": -5.778207778930664, "global_step": 52969, "epoch": 1261} {"train_loss": -5.775974273681641, "global_step": 52970, "epoch": 1261} {"train_loss": -5.7293701171875, "global_step": 52971, "epoch": 1261} {"train_loss": -5.777084827423096, "global_step": 52972, "epoch": 1261} {"train_loss": -5.838171005249023, "global_step": 52973, "epoch": 1261} {"train_loss": -5.621140480041504, "global_step": 52974, "epoch": 1261} {"train_loss": -5.686306953430176, "global_step": 52975, "epoch": 1261} {"train_loss": -5.700929641723633, "global_step": 52976, "epoch": 1261} {"train_loss": -5.760071277618408, "global_step": 52977, "epoch": 1261} {"train_loss": -5.844037055969238, "global_step": 52978, "epoch": 1261} {"train_loss": -5.787778854370117, "global_step": 52979, "epoch": 1261} {"train_loss": -5.76649284362793, "global_step": 52980, "epoch": 1261} {"train_loss": -5.777313232421875, "global_step": 52981, "epoch": 1261} {"train_loss": -5.8284406661987305, "global_step": 52982, "epoch": 1261} {"train_loss": -5.817658424377441, "global_step": 52983, "epoch": 1261} {"train_loss": -5.702653884887695, "global_step": 52984, "epoch": 1261} {"train_loss": -5.855964660644531, "global_step": 52985, "epoch": 1261} {"train_loss": -5.8507399559021, "global_step": 52986, "epoch": 1261} {"train_loss": -5.764677047729492, "global_step": 52987, "epoch": 1261} {"train_loss": -5.84344482421875, "global_step": 52988, "epoch": 1261} {"train_loss": -5.767020225524902, "global_step": 52989, "epoch": 1261} {"train_loss": -5.712338447570801, "global_step": 52990, "epoch": 1261} {"train_loss": -5.848017692565918, "global_step": 52991, "epoch": 1261} {"train_loss": -5.708618640899658, "global_step": 52992, "epoch": 1261} {"train_loss": -5.743318557739258, "global_step": 52993, "epoch": 1261} {"train_loss": -5.8495941162109375, "global_step": 52994, "epoch": 1261} {"train_loss": -5.7187089920043945, "global_step": 52995, "epoch": 1261} {"train_loss": -5.842153549194336, "global_step": 52996, "epoch": 1261} {"train_loss": -5.7358245849609375, "global_step": 52997, "epoch": 1261} {"train_loss": -5.951645851135254, "global_step": 52998, "epoch": 1261} {"train_loss": -5.818170547485352, "global_step": 52999, "epoch": 1261} {"train_loss": -5.859501838684082, "global_step": 53000, "epoch": 1261} {"train_loss": -5.754260063171387, "global_step": 53001, "epoch": 1261} {"train_loss": -5.742369651794434, "global_step": 53002, "epoch": 1261} {"train_loss": -5.775985876719157, "global_step": 53003, "epoch": 1261, "val_loss": 66424.9375} {"train_loss": -5.8501057624816895, "global_step": 53004, "epoch": 1262} {"train_loss": -5.621462345123291, "global_step": 53005, "epoch": 1262} {"train_loss": -5.756799221038818, "global_step": 53006, "epoch": 1262} {"train_loss": -5.753018379211426, "global_step": 53007, "epoch": 1262} {"train_loss": -5.834571838378906, "global_step": 53008, "epoch": 1262} {"train_loss": -5.830044746398926, "global_step": 53009, "epoch": 1262} {"train_loss": -5.726490020751953, "global_step": 53010, "epoch": 1262} {"train_loss": -5.831886291503906, "global_step": 53011, "epoch": 1262} {"train_loss": -5.677792549133301, "global_step": 53012, "epoch": 1262} {"train_loss": -5.823304176330566, "global_step": 53013, "epoch": 1262} {"train_loss": -5.91592264175415, "global_step": 53014, "epoch": 1262} {"train_loss": -5.875892639160156, "global_step": 53015, "epoch": 1262} {"train_loss": -5.752492427825928, "global_step": 53016, "epoch": 1262} {"train_loss": -5.937951564788818, "global_step": 53017, "epoch": 1262} {"train_loss": -5.899847984313965, "global_step": 53018, "epoch": 1262} {"train_loss": -5.803684234619141, "global_step": 53019, "epoch": 1262} {"train_loss": -5.740672588348389, "global_step": 53020, "epoch": 1262} {"train_loss": -5.8445634841918945, "global_step": 53021, "epoch": 1262} {"train_loss": -5.886419296264648, "global_step": 53022, "epoch": 1262} {"train_loss": -5.755613327026367, "global_step": 53023, "epoch": 1262} {"train_loss": -5.801759243011475, "global_step": 53024, "epoch": 1262} {"train_loss": -5.917552947998047, "global_step": 53025, "epoch": 1262} {"train_loss": -5.880476951599121, "global_step": 53026, "epoch": 1262} {"train_loss": -5.688475608825684, "global_step": 53027, "epoch": 1262} {"train_loss": -5.860237121582031, "global_step": 53028, "epoch": 1262} {"train_loss": -5.860426425933838, "global_step": 53029, "epoch": 1262} {"train_loss": -5.82529354095459, "global_step": 53030, "epoch": 1262} {"train_loss": -5.908475399017334, "global_step": 53031, "epoch": 1262} {"train_loss": -5.720821380615234, "global_step": 53032, "epoch": 1262} {"train_loss": -5.790367603302002, "global_step": 53033, "epoch": 1262} {"train_loss": -5.883148193359375, "global_step": 53034, "epoch": 1262} {"train_loss": -5.791842460632324, "global_step": 53035, "epoch": 1262} {"train_loss": -5.846043586730957, "global_step": 53036, "epoch": 1262} {"train_loss": -5.676441669464111, "global_step": 53037, "epoch": 1262} {"train_loss": -5.711529731750488, "global_step": 53038, "epoch": 1262} {"train_loss": -5.851502418518066, "global_step": 53039, "epoch": 1262} {"train_loss": -5.805810928344727, "global_step": 53040, "epoch": 1262} {"train_loss": -5.8311309814453125, "global_step": 53041, "epoch": 1262} {"train_loss": -5.771154880523682, "global_step": 53042, "epoch": 1262} {"train_loss": -5.705419063568115, "global_step": 53043, "epoch": 1262} {"train_loss": -5.948508262634277, "global_step": 53044, "epoch": 1262} {"train_loss": -5.808343160720098, "global_step": 53045, "epoch": 1262, "val_loss": 66305.859375} {"train_loss": -5.852975845336914, "global_step": 53046, "epoch": 1263} {"train_loss": -5.754056930541992, "global_step": 53047, "epoch": 1263} {"train_loss": -5.724595069885254, "global_step": 53048, "epoch": 1263} {"train_loss": -5.840512275695801, "global_step": 53049, "epoch": 1263} {"train_loss": -5.65726375579834, "global_step": 53050, "epoch": 1263} {"train_loss": -5.823426723480225, "global_step": 53051, "epoch": 1263} {"train_loss": -5.779224872589111, "global_step": 53052, "epoch": 1263} {"train_loss": -5.7943902015686035, "global_step": 53053, "epoch": 1263} {"train_loss": -5.916651725769043, "global_step": 53054, "epoch": 1263} {"train_loss": -5.7448272705078125, "global_step": 53055, "epoch": 1263} {"train_loss": -5.858882904052734, "global_step": 53056, "epoch": 1263} {"train_loss": -5.743439674377441, "global_step": 53057, "epoch": 1263} {"train_loss": -5.698966979980469, "global_step": 53058, "epoch": 1263} {"train_loss": -5.671512603759766, "global_step": 53059, "epoch": 1263} {"train_loss": -5.754110336303711, "global_step": 53060, "epoch": 1263} {"train_loss": -5.682567119598389, "global_step": 53061, "epoch": 1263} {"train_loss": -5.7273736000061035, "global_step": 53062, "epoch": 1263} {"train_loss": -5.87578010559082, "global_step": 53063, "epoch": 1263} {"train_loss": -5.697391510009766, "global_step": 53064, "epoch": 1263} {"train_loss": -5.7262983322143555, "global_step": 53065, "epoch": 1263} {"train_loss": -5.829591274261475, "global_step": 53066, "epoch": 1263} {"train_loss": -5.705808162689209, "global_step": 53067, "epoch": 1263} {"train_loss": -5.795833587646484, "global_step": 53068, "epoch": 1263} {"train_loss": -5.759994029998779, "global_step": 53069, "epoch": 1263} {"train_loss": -5.773390769958496, "global_step": 53070, "epoch": 1263} {"train_loss": -5.8713507652282715, "global_step": 53071, "epoch": 1263} {"train_loss": -5.8122382164001465, "global_step": 53072, "epoch": 1263} {"train_loss": -5.853183269500732, "global_step": 53073, "epoch": 1263} {"train_loss": -5.839727401733398, "global_step": 53074, "epoch": 1263} {"train_loss": -5.665851593017578, "global_step": 53075, "epoch": 1263} {"train_loss": -5.880787372589111, "global_step": 53076, "epoch": 1263} {"train_loss": -5.854975700378418, "global_step": 53077, "epoch": 1263} {"train_loss": -5.800087928771973, "global_step": 53078, "epoch": 1263} {"train_loss": -5.7493720054626465, "global_step": 53079, "epoch": 1263} {"train_loss": -5.846186637878418, "global_step": 53080, "epoch": 1263} {"train_loss": -5.691925048828125, "global_step": 53081, "epoch": 1263} {"train_loss": -5.828256607055664, "global_step": 53082, "epoch": 1263} {"train_loss": -5.879068851470947, "global_step": 53083, "epoch": 1263} {"train_loss": -5.736315727233887, "global_step": 53084, "epoch": 1263} {"train_loss": -5.69020938873291, "global_step": 53085, "epoch": 1263} {"train_loss": -5.805846691131592, "global_step": 53086, "epoch": 1263} {"train_loss": -5.779552607309251, "global_step": 53087, "epoch": 1263, "val_loss": 66575.8125} {"train_loss": -5.803770542144775, "global_step": 53088, "epoch": 1264} {"train_loss": -5.820394039154053, "global_step": 53089, "epoch": 1264} {"train_loss": -5.744329452514648, "global_step": 53090, "epoch": 1264} {"train_loss": -5.86422061920166, "global_step": 53091, "epoch": 1264} {"train_loss": -5.716928482055664, "global_step": 53092, "epoch": 1264} {"train_loss": -5.775312900543213, "global_step": 53093, "epoch": 1264} {"train_loss": -5.729710102081299, "global_step": 53094, "epoch": 1264} {"train_loss": -5.6092352867126465, "global_step": 53095, "epoch": 1264} {"train_loss": -5.852198123931885, "global_step": 53096, "epoch": 1264} {"train_loss": -5.6899027824401855, "global_step": 53097, "epoch": 1264} {"train_loss": -5.839991569519043, "global_step": 53098, "epoch": 1264} {"train_loss": -5.7710981369018555, "global_step": 53099, "epoch": 1264} {"train_loss": -5.876531600952148, "global_step": 53100, "epoch": 1264} {"train_loss": -5.857171535491943, "global_step": 53101, "epoch": 1264} {"train_loss": -5.7046356201171875, "global_step": 53102, "epoch": 1264} {"train_loss": -5.845815181732178, "global_step": 53103, "epoch": 1264} {"train_loss": -5.7707295417785645, "global_step": 53104, "epoch": 1264} {"train_loss": -5.908176422119141, "global_step": 53105, "epoch": 1264} {"train_loss": -5.829401016235352, "global_step": 53106, "epoch": 1264} {"train_loss": -5.89991569519043, "global_step": 53107, "epoch": 1264} {"train_loss": -5.721826553344727, "global_step": 53108, "epoch": 1264} {"train_loss": -5.720052719116211, "global_step": 53109, "epoch": 1264} {"train_loss": -5.847432613372803, "global_step": 53110, "epoch": 1264} {"train_loss": -5.859772682189941, "global_step": 53111, "epoch": 1264} {"train_loss": -5.910897254943848, "global_step": 53112, "epoch": 1264} {"train_loss": -5.858002662658691, "global_step": 53113, "epoch": 1264} {"train_loss": -5.828154563903809, "global_step": 53114, "epoch": 1264} {"train_loss": -5.841008186340332, "global_step": 53115, "epoch": 1264} {"train_loss": -5.737644195556641, "global_step": 53116, "epoch": 1264} {"train_loss": -5.734406471252441, "global_step": 53117, "epoch": 1264} {"train_loss": -5.668935775756836, "global_step": 53118, "epoch": 1264} {"train_loss": -5.758038520812988, "global_step": 53119, "epoch": 1264} {"train_loss": -5.8440141677856445, "global_step": 53120, "epoch": 1264} {"train_loss": -5.922184944152832, "global_step": 53121, "epoch": 1264} {"train_loss": -5.790447235107422, "global_step": 53122, "epoch": 1264} {"train_loss": -5.758091449737549, "global_step": 53123, "epoch": 1264} {"train_loss": -5.852391242980957, "global_step": 53124, "epoch": 1264} {"train_loss": -5.778396129608154, "global_step": 53125, "epoch": 1264} {"train_loss": -5.78316593170166, "global_step": 53126, "epoch": 1264} {"train_loss": -5.835611343383789, "global_step": 53127, "epoch": 1264} {"train_loss": -5.756772994995117, "global_step": 53128, "epoch": 1264} {"train_loss": -5.798860470453898, "global_step": 53129, "epoch": 1264, "val_loss": 66424.7265625} {"train_loss": -5.761589527130127, "global_step": 53130, "epoch": 1265} {"train_loss": -5.917337417602539, "global_step": 53131, "epoch": 1265} {"train_loss": -5.749859809875488, "global_step": 53132, "epoch": 1265} {"train_loss": -5.793283462524414, "global_step": 53133, "epoch": 1265} {"train_loss": -5.677530288696289, "global_step": 53134, "epoch": 1265} {"train_loss": -5.7467193603515625, "global_step": 53135, "epoch": 1265} {"train_loss": -5.87812614440918, "global_step": 53136, "epoch": 1265} {"train_loss": -5.635297775268555, "global_step": 53137, "epoch": 1265} {"train_loss": -5.766729354858398, "global_step": 53138, "epoch": 1265} {"train_loss": -5.82985258102417, "global_step": 53139, "epoch": 1265} {"train_loss": -5.865488529205322, "global_step": 53140, "epoch": 1265} {"train_loss": -5.817253112792969, "global_step": 53141, "epoch": 1265} {"train_loss": -5.844729423522949, "global_step": 53142, "epoch": 1265} {"train_loss": -5.887484550476074, "global_step": 53143, "epoch": 1265} {"train_loss": -5.760012626647949, "global_step": 53144, "epoch": 1265} {"train_loss": -5.823504447937012, "global_step": 53145, "epoch": 1265} {"train_loss": -5.892197608947754, "global_step": 53146, "epoch": 1265} {"train_loss": -5.89096212387085, "global_step": 53147, "epoch": 1265} {"train_loss": -5.838096618652344, "global_step": 53148, "epoch": 1265} {"train_loss": -5.847425937652588, "global_step": 53149, "epoch": 1265} {"train_loss": -5.869753837585449, "global_step": 53150, "epoch": 1265} {"train_loss": -5.865743637084961, "global_step": 53151, "epoch": 1265} {"train_loss": -5.894791603088379, "global_step": 53152, "epoch": 1265} {"train_loss": -5.800968170166016, "global_step": 53153, "epoch": 1265} {"train_loss": -5.78948974609375, "global_step": 53154, "epoch": 1265} {"train_loss": -5.749012470245361, "global_step": 53155, "epoch": 1265} {"train_loss": -5.788702964782715, "global_step": 53156, "epoch": 1265} {"train_loss": -5.848252296447754, "global_step": 53157, "epoch": 1265} {"train_loss": -5.928631782531738, "global_step": 53158, "epoch": 1265} {"train_loss": -5.832858085632324, "global_step": 53159, "epoch": 1265} {"train_loss": -5.728537082672119, "global_step": 53160, "epoch": 1265} {"train_loss": -5.755797863006592, "global_step": 53161, "epoch": 1265} {"train_loss": -5.86358118057251, "global_step": 53162, "epoch": 1265} {"train_loss": -5.891397476196289, "global_step": 53163, "epoch": 1265} {"train_loss": -5.77260684967041, "global_step": 53164, "epoch": 1265} {"train_loss": -5.71748161315918, "global_step": 53165, "epoch": 1265} {"train_loss": -5.674044609069824, "global_step": 53166, "epoch": 1265} {"train_loss": -5.6843767166137695, "global_step": 53167, "epoch": 1265} {"train_loss": -5.7824788093566895, "global_step": 53168, "epoch": 1265} {"train_loss": -5.799039840698242, "global_step": 53169, "epoch": 1265} {"train_loss": -5.715789794921875, "global_step": 53170, "epoch": 1265} {"train_loss": -5.805077575501942, "global_step": 53171, "epoch": 1265, "val_loss": 66327.4453125} {"train_loss": -5.668333053588867, "global_step": 53172, "epoch": 1266} {"train_loss": -5.783992290496826, "global_step": 53173, "epoch": 1266} {"train_loss": -5.778508186340332, "global_step": 53174, "epoch": 1266} {"train_loss": -5.748286247253418, "global_step": 53175, "epoch": 1266} {"train_loss": -5.799745559692383, "global_step": 53176, "epoch": 1266} {"train_loss": -5.7611775398254395, "global_step": 53177, "epoch": 1266} {"train_loss": -5.810591697692871, "global_step": 53178, "epoch": 1266} {"train_loss": -5.753151893615723, "global_step": 53179, "epoch": 1266} {"train_loss": -5.6651458740234375, "global_step": 53180, "epoch": 1266} {"train_loss": -5.778149604797363, "global_step": 53181, "epoch": 1266} {"train_loss": -5.7743377685546875, "global_step": 53182, "epoch": 1266} {"train_loss": -5.747199535369873, "global_step": 53183, "epoch": 1266} {"train_loss": -5.726274490356445, "global_step": 53184, "epoch": 1266} {"train_loss": -5.7390594482421875, "global_step": 53185, "epoch": 1266} {"train_loss": -5.795607566833496, "global_step": 53186, "epoch": 1266} {"train_loss": -5.7444281578063965, "global_step": 53187, "epoch": 1266} {"train_loss": -5.693736553192139, "global_step": 53188, "epoch": 1266} {"train_loss": -5.763686180114746, "global_step": 53189, "epoch": 1266} {"train_loss": -5.758139610290527, "global_step": 53190, "epoch": 1266} {"train_loss": -5.787016868591309, "global_step": 53191, "epoch": 1266} {"train_loss": -5.78778076171875, "global_step": 53192, "epoch": 1266} {"train_loss": -5.83034610748291, "global_step": 53193, "epoch": 1266} {"train_loss": -5.707076072692871, "global_step": 53194, "epoch": 1266} {"train_loss": -5.808123588562012, "global_step": 53195, "epoch": 1266} {"train_loss": -5.836780071258545, "global_step": 53196, "epoch": 1266} {"train_loss": -5.770953178405762, "global_step": 53197, "epoch": 1266} {"train_loss": -5.752327919006348, "global_step": 53198, "epoch": 1266} {"train_loss": -5.7354230880737305, "global_step": 53199, "epoch": 1266} {"train_loss": -5.877462387084961, "global_step": 53200, "epoch": 1266} {"train_loss": -5.79676628112793, "global_step": 53201, "epoch": 1266} {"train_loss": -5.753674507141113, "global_step": 53202, "epoch": 1266} {"train_loss": -5.686312675476074, "global_step": 53203, "epoch": 1266} {"train_loss": -5.688019275665283, "global_step": 53204, "epoch": 1266} {"train_loss": -5.7282209396362305, "global_step": 53205, "epoch": 1266} {"train_loss": -5.80360221862793, "global_step": 53206, "epoch": 1266} {"train_loss": -5.755029201507568, "global_step": 53207, "epoch": 1266} {"train_loss": -5.77822208404541, "global_step": 53208, "epoch": 1266} {"train_loss": -5.768455505371094, "global_step": 53209, "epoch": 1266} {"train_loss": -5.783106803894043, "global_step": 53210, "epoch": 1266} {"train_loss": -5.627613067626953, "global_step": 53211, "epoch": 1266} {"train_loss": -5.708398818969727, "global_step": 53212, "epoch": 1266} {"train_loss": -5.7576323463803245, "global_step": 53213, "epoch": 1266, "val_loss": 67095.65625} {"train_loss": -5.555814743041992, "global_step": 53214, "epoch": 1267} {"train_loss": -5.905020713806152, "global_step": 53215, "epoch": 1267} {"train_loss": -5.691147327423096, "global_step": 53216, "epoch": 1267} {"train_loss": -5.810022830963135, "global_step": 53217, "epoch": 1267} {"train_loss": -5.682641983032227, "global_step": 53218, "epoch": 1267} {"train_loss": -5.777152061462402, "global_step": 53219, "epoch": 1267} {"train_loss": -5.653214454650879, "global_step": 53220, "epoch": 1267} {"train_loss": -5.732821941375732, "global_step": 53221, "epoch": 1267} {"train_loss": -5.776008605957031, "global_step": 53222, "epoch": 1267} {"train_loss": -5.826659679412842, "global_step": 53223, "epoch": 1267} {"train_loss": -5.855724334716797, "global_step": 53224, "epoch": 1267} {"train_loss": -5.8627142906188965, "global_step": 53225, "epoch": 1267} {"train_loss": -5.772709369659424, "global_step": 53226, "epoch": 1267} {"train_loss": -5.762726783752441, "global_step": 53227, "epoch": 1267} {"train_loss": -5.657917499542236, "global_step": 53228, "epoch": 1267} {"train_loss": -5.838822841644287, "global_step": 53229, "epoch": 1267} {"train_loss": -5.812989234924316, "global_step": 53230, "epoch": 1267} {"train_loss": -5.904144287109375, "global_step": 53231, "epoch": 1267} {"train_loss": -5.832762718200684, "global_step": 53232, "epoch": 1267} {"train_loss": -5.673741817474365, "global_step": 53233, "epoch": 1267} {"train_loss": -5.9025468826293945, "global_step": 53234, "epoch": 1267} {"train_loss": -5.737046718597412, "global_step": 53235, "epoch": 1267} {"train_loss": -5.803771018981934, "global_step": 53236, "epoch": 1267} {"train_loss": -5.643949508666992, "global_step": 53237, "epoch": 1267} {"train_loss": -5.828471660614014, "global_step": 53238, "epoch": 1267} {"train_loss": -5.9055023193359375, "global_step": 53239, "epoch": 1267} {"train_loss": -5.870195388793945, "global_step": 53240, "epoch": 1267} {"train_loss": -5.871335029602051, "global_step": 53241, "epoch": 1267} {"train_loss": -5.7340545654296875, "global_step": 53242, "epoch": 1267} {"train_loss": -5.821127891540527, "global_step": 53243, "epoch": 1267} {"train_loss": -5.785912036895752, "global_step": 53244, "epoch": 1267} {"train_loss": -5.785961627960205, "global_step": 53245, "epoch": 1267} {"train_loss": -5.863710403442383, "global_step": 53246, "epoch": 1267} {"train_loss": -5.774523735046387, "global_step": 53247, "epoch": 1267} {"train_loss": -5.893087387084961, "global_step": 53248, "epoch": 1267} {"train_loss": -5.862608909606934, "global_step": 53249, "epoch": 1267} {"train_loss": -5.774068355560303, "global_step": 53250, "epoch": 1267} {"train_loss": -5.9091691970825195, "global_step": 53251, "epoch": 1267} {"train_loss": -5.731410026550293, "global_step": 53252, "epoch": 1267} {"train_loss": -5.794586658477783, "global_step": 53253, "epoch": 1267} {"train_loss": -5.754244804382324, "global_step": 53254, "epoch": 1267} {"train_loss": -5.7884995710282094, "global_step": 53255, "epoch": 1267, "val_loss": 66604.8359375} {"train_loss": -5.854153633117676, "global_step": 53256, "epoch": 1268} {"train_loss": -5.819031238555908, "global_step": 53257, "epoch": 1268} {"train_loss": -5.845549583435059, "global_step": 53258, "epoch": 1268} {"train_loss": -5.755449295043945, "global_step": 53259, "epoch": 1268} {"train_loss": -5.830511093139648, "global_step": 53260, "epoch": 1268} {"train_loss": -5.925231456756592, "global_step": 53261, "epoch": 1268} {"train_loss": -5.604557991027832, "global_step": 53262, "epoch": 1268} {"train_loss": -5.758923053741455, "global_step": 53263, "epoch": 1268} {"train_loss": -5.752273082733154, "global_step": 53264, "epoch": 1268} {"train_loss": -5.706567764282227, "global_step": 53265, "epoch": 1268} {"train_loss": -5.834567070007324, "global_step": 53266, "epoch": 1268} {"train_loss": -5.812616348266602, "global_step": 53267, "epoch": 1268} {"train_loss": -5.756872177124023, "global_step": 53268, "epoch": 1268} {"train_loss": -5.73768424987793, "global_step": 53269, "epoch": 1268} {"train_loss": -5.703629493713379, "global_step": 53270, "epoch": 1268} {"train_loss": -5.807968616485596, "global_step": 53271, "epoch": 1268} {"train_loss": -5.794622898101807, "global_step": 53272, "epoch": 1268} {"train_loss": -5.833491802215576, "global_step": 53273, "epoch": 1268} {"train_loss": -5.906529426574707, "global_step": 53274, "epoch": 1268} {"train_loss": -5.739750862121582, "global_step": 53275, "epoch": 1268} {"train_loss": -5.806365013122559, "global_step": 53276, "epoch": 1268} {"train_loss": -5.816899299621582, "global_step": 53277, "epoch": 1268} {"train_loss": -5.761055946350098, "global_step": 53278, "epoch": 1268} {"train_loss": -5.812987327575684, "global_step": 53279, "epoch": 1268} {"train_loss": -5.758912086486816, "global_step": 53280, "epoch": 1268} {"train_loss": -5.74422550201416, "global_step": 53281, "epoch": 1268} {"train_loss": -5.761436462402344, "global_step": 53282, "epoch": 1268} {"train_loss": -5.800954341888428, "global_step": 53283, "epoch": 1268} {"train_loss": -5.774537563323975, "global_step": 53284, "epoch": 1268} {"train_loss": -5.8400163650512695, "global_step": 53285, "epoch": 1268} {"train_loss": -5.86483097076416, "global_step": 53286, "epoch": 1268} {"train_loss": -5.773772239685059, "global_step": 53287, "epoch": 1268} {"train_loss": -5.732409477233887, "global_step": 53288, "epoch": 1268} {"train_loss": -5.823681831359863, "global_step": 53289, "epoch": 1268} {"train_loss": -5.826028347015381, "global_step": 53290, "epoch": 1268} {"train_loss": -5.714393138885498, "global_step": 53291, "epoch": 1268} {"train_loss": -5.767968654632568, "global_step": 53292, "epoch": 1268} {"train_loss": -5.82725715637207, "global_step": 53293, "epoch": 1268} {"train_loss": -5.709898948669434, "global_step": 53294, "epoch": 1268} {"train_loss": -5.803097724914551, "global_step": 53295, "epoch": 1268} {"train_loss": -5.797206878662109, "global_step": 53296, "epoch": 1268} {"train_loss": -5.789385897772653, "global_step": 53297, "epoch": 1268, "val_loss": 66860.671875} {"train_loss": -5.817325115203857, "global_step": 53298, "epoch": 1269} {"train_loss": -5.731822967529297, "global_step": 53299, "epoch": 1269} {"train_loss": -5.860605239868164, "global_step": 53300, "epoch": 1269} {"train_loss": -5.8079118728637695, "global_step": 53301, "epoch": 1269} {"train_loss": -5.717398166656494, "global_step": 53302, "epoch": 1269} {"train_loss": -5.705285549163818, "global_step": 53303, "epoch": 1269} {"train_loss": -5.85172700881958, "global_step": 53304, "epoch": 1269} {"train_loss": -5.743691444396973, "global_step": 53305, "epoch": 1269} {"train_loss": -5.797442436218262, "global_step": 53306, "epoch": 1269} {"train_loss": -5.694605827331543, "global_step": 53307, "epoch": 1269} {"train_loss": -5.852504253387451, "global_step": 53308, "epoch": 1269} {"train_loss": -5.73419189453125, "global_step": 53309, "epoch": 1269} {"train_loss": -5.829095840454102, "global_step": 53310, "epoch": 1269} {"train_loss": -5.754767417907715, "global_step": 53311, "epoch": 1269} {"train_loss": -5.92254114151001, "global_step": 53312, "epoch": 1269} {"train_loss": -5.892023086547852, "global_step": 53313, "epoch": 1269} {"train_loss": -5.893327236175537, "global_step": 53314, "epoch": 1269} {"train_loss": -5.8513383865356445, "global_step": 53315, "epoch": 1269} {"train_loss": -5.843057155609131, "global_step": 53316, "epoch": 1269} {"train_loss": -5.6610307693481445, "global_step": 53317, "epoch": 1269} {"train_loss": -5.844441890716553, "global_step": 53318, "epoch": 1269} {"train_loss": -5.967503547668457, "global_step": 53319, "epoch": 1269} {"train_loss": -5.806460857391357, "global_step": 53320, "epoch": 1269} {"train_loss": -5.873913764953613, "global_step": 53321, "epoch": 1269} {"train_loss": -5.804443359375, "global_step": 53322, "epoch": 1269} {"train_loss": -5.916255950927734, "global_step": 53323, "epoch": 1269} {"train_loss": -5.755555152893066, "global_step": 53324, "epoch": 1269} {"train_loss": -5.7613301277160645, "global_step": 53325, "epoch": 1269} {"train_loss": -5.620421886444092, "global_step": 53326, "epoch": 1269} {"train_loss": -5.815507888793945, "global_step": 53327, "epoch": 1269} {"train_loss": -5.685647964477539, "global_step": 53328, "epoch": 1269} {"train_loss": -5.869388580322266, "global_step": 53329, "epoch": 1269} {"train_loss": -5.908939361572266, "global_step": 53330, "epoch": 1269} {"train_loss": -5.701948642730713, "global_step": 53331, "epoch": 1269} {"train_loss": -5.768723964691162, "global_step": 53332, "epoch": 1269} {"train_loss": -5.818880081176758, "global_step": 53333, "epoch": 1269} {"train_loss": -5.777414798736572, "global_step": 53334, "epoch": 1269} {"train_loss": -5.935053825378418, "global_step": 53335, "epoch": 1269} {"train_loss": -5.817901611328125, "global_step": 53336, "epoch": 1269} {"train_loss": -5.778470993041992, "global_step": 53337, "epoch": 1269} {"train_loss": -5.851160049438477, "global_step": 53338, "epoch": 1269} {"train_loss": -5.805221614383516, "global_step": 53339, "epoch": 1269, "val_loss": 66346.9375} {"train_loss": -5.786003112792969, "global_step": 53340, "epoch": 1270} {"train_loss": -5.678970813751221, "global_step": 53341, "epoch": 1270} {"train_loss": -5.749311447143555, "global_step": 53342, "epoch": 1270} {"train_loss": -5.850127220153809, "global_step": 53343, "epoch": 1270} {"train_loss": -5.8010101318359375, "global_step": 53344, "epoch": 1270} {"train_loss": -5.759514808654785, "global_step": 53345, "epoch": 1270} {"train_loss": -5.839638710021973, "global_step": 53346, "epoch": 1270} {"train_loss": -5.82930850982666, "global_step": 53347, "epoch": 1270} {"train_loss": -5.785523414611816, "global_step": 53348, "epoch": 1270} {"train_loss": -5.750174522399902, "global_step": 53349, "epoch": 1270} {"train_loss": -5.762681007385254, "global_step": 53350, "epoch": 1270} {"train_loss": -5.7696099281311035, "global_step": 53351, "epoch": 1270} {"train_loss": -5.83438777923584, "global_step": 53352, "epoch": 1270} {"train_loss": -5.80465030670166, "global_step": 53353, "epoch": 1270} {"train_loss": -5.872289657592773, "global_step": 53354, "epoch": 1270} {"train_loss": -5.825987339019775, "global_step": 53355, "epoch": 1270} {"train_loss": -5.72022819519043, "global_step": 53356, "epoch": 1270} {"train_loss": -5.74777889251709, "global_step": 53357, "epoch": 1270} {"train_loss": -5.868336200714111, "global_step": 53358, "epoch": 1270} {"train_loss": -5.775442123413086, "global_step": 53359, "epoch": 1270} {"train_loss": -5.888788223266602, "global_step": 53360, "epoch": 1270} {"train_loss": -5.734140396118164, "global_step": 53361, "epoch": 1270} {"train_loss": -5.755484580993652, "global_step": 53362, "epoch": 1270} {"train_loss": -5.791409492492676, "global_step": 53363, "epoch": 1270} {"train_loss": -5.771042823791504, "global_step": 53364, "epoch": 1270} {"train_loss": -5.929917335510254, "global_step": 53365, "epoch": 1270} {"train_loss": -5.692134857177734, "global_step": 53366, "epoch": 1270} {"train_loss": -5.805516242980957, "global_step": 53367, "epoch": 1270} {"train_loss": -5.792052268981934, "global_step": 53368, "epoch": 1270} {"train_loss": -5.600545883178711, "global_step": 53369, "epoch": 1270} {"train_loss": -5.9094319343566895, "global_step": 53370, "epoch": 1270} {"train_loss": -5.772281169891357, "global_step": 53371, "epoch": 1270} {"train_loss": -5.719520568847656, "global_step": 53372, "epoch": 1270} {"train_loss": -5.827661514282227, "global_step": 53373, "epoch": 1270} {"train_loss": -5.854703903198242, "global_step": 53374, "epoch": 1270} {"train_loss": -5.71452522277832, "global_step": 53375, "epoch": 1270} {"train_loss": -5.844185829162598, "global_step": 53376, "epoch": 1270} {"train_loss": -5.848723411560059, "global_step": 53377, "epoch": 1270} {"train_loss": -5.633296012878418, "global_step": 53378, "epoch": 1270} {"train_loss": -5.752898216247559, "global_step": 53379, "epoch": 1270} {"train_loss": -5.632876396179199, "global_step": 53380, "epoch": 1270} {"train_loss": -5.783094758079166, "global_step": 53381, "epoch": 1270, "val_loss": 66559.03125} {"train_loss": -5.719521999359131, "global_step": 53382, "epoch": 1271} {"train_loss": -5.714290618896484, "global_step": 53383, "epoch": 1271} {"train_loss": -5.767582893371582, "global_step": 53384, "epoch": 1271} {"train_loss": -5.77283239364624, "global_step": 53385, "epoch": 1271} {"train_loss": -5.808351993560791, "global_step": 53386, "epoch": 1271} {"train_loss": -5.803061008453369, "global_step": 53387, "epoch": 1271} {"train_loss": -5.9007415771484375, "global_step": 53388, "epoch": 1271} {"train_loss": -5.8045525550842285, "global_step": 53389, "epoch": 1271} {"train_loss": -5.846123695373535, "global_step": 53390, "epoch": 1271} {"train_loss": -5.819836616516113, "global_step": 53391, "epoch": 1271} {"train_loss": -5.751789093017578, "global_step": 53392, "epoch": 1271} {"train_loss": -5.804096221923828, "global_step": 53393, "epoch": 1271} {"train_loss": -5.693511962890625, "global_step": 53394, "epoch": 1271} {"train_loss": -5.830770492553711, "global_step": 53395, "epoch": 1271} {"train_loss": -5.674807548522949, "global_step": 53396, "epoch": 1271} {"train_loss": -5.807425022125244, "global_step": 53397, "epoch": 1271} {"train_loss": -5.810988426208496, "global_step": 53398, "epoch": 1271} {"train_loss": -5.931547164916992, "global_step": 53399, "epoch": 1271} {"train_loss": -5.913260459899902, "global_step": 53400, "epoch": 1271} {"train_loss": -5.706811904907227, "global_step": 53401, "epoch": 1271} {"train_loss": -5.937047958374023, "global_step": 53402, "epoch": 1271} {"train_loss": -5.752621650695801, "global_step": 53403, "epoch": 1271} {"train_loss": -5.857324123382568, "global_step": 53404, "epoch": 1271} {"train_loss": -5.773873329162598, "global_step": 53405, "epoch": 1271} {"train_loss": -5.748264312744141, "global_step": 53406, "epoch": 1271} {"train_loss": -5.70550012588501, "global_step": 53407, "epoch": 1271} {"train_loss": -5.810527324676514, "global_step": 53408, "epoch": 1271} {"train_loss": -5.66274356842041, "global_step": 53409, "epoch": 1271} {"train_loss": -5.830073833465576, "global_step": 53410, "epoch": 1271} {"train_loss": -5.81380558013916, "global_step": 53411, "epoch": 1271} {"train_loss": -5.833493232727051, "global_step": 53412, "epoch": 1271} {"train_loss": -5.825533866882324, "global_step": 53413, "epoch": 1271} {"train_loss": -5.864088535308838, "global_step": 53414, "epoch": 1271} {"train_loss": -5.722078323364258, "global_step": 53415, "epoch": 1271} {"train_loss": -5.861430644989014, "global_step": 53416, "epoch": 1271} {"train_loss": -5.8943891525268555, "global_step": 53417, "epoch": 1271} {"train_loss": -5.631124496459961, "global_step": 53418, "epoch": 1271} {"train_loss": -5.801934719085693, "global_step": 53419, "epoch": 1271} {"train_loss": -5.819791793823242, "global_step": 53420, "epoch": 1271} {"train_loss": -5.758266925811768, "global_step": 53421, "epoch": 1271} {"train_loss": -5.966626167297363, "global_step": 53422, "epoch": 1271} {"train_loss": -5.798198325293405, "global_step": 53423, "epoch": 1271, "val_loss": 66886.015625} {"train_loss": -5.704122066497803, "global_step": 53424, "epoch": 1272} {"train_loss": -5.856329441070557, "global_step": 53425, "epoch": 1272} {"train_loss": -5.833559036254883, "global_step": 53426, "epoch": 1272} {"train_loss": -5.766690731048584, "global_step": 53427, "epoch": 1272} {"train_loss": -5.725390911102295, "global_step": 53428, "epoch": 1272} {"train_loss": -5.791003227233887, "global_step": 53429, "epoch": 1272} {"train_loss": -5.840947151184082, "global_step": 53430, "epoch": 1272} {"train_loss": -5.710664749145508, "global_step": 53431, "epoch": 1272} {"train_loss": -5.865015029907227, "global_step": 53432, "epoch": 1272} {"train_loss": -5.808629035949707, "global_step": 53433, "epoch": 1272} {"train_loss": -5.85880184173584, "global_step": 53434, "epoch": 1272} {"train_loss": -5.789422035217285, "global_step": 53435, "epoch": 1272} {"train_loss": -5.825964450836182, "global_step": 53436, "epoch": 1272} {"train_loss": -5.7521071434021, "global_step": 53437, "epoch": 1272} {"train_loss": -5.770374774932861, "global_step": 53438, "epoch": 1272} {"train_loss": -5.800025939941406, "global_step": 53439, "epoch": 1272} {"train_loss": -5.708807945251465, "global_step": 53440, "epoch": 1272} {"train_loss": -5.8365583419799805, "global_step": 53441, "epoch": 1272} {"train_loss": -5.809859275817871, "global_step": 53442, "epoch": 1272} {"train_loss": -5.736763954162598, "global_step": 53443, "epoch": 1272} {"train_loss": -5.861212253570557, "global_step": 53444, "epoch": 1272} {"train_loss": -5.694729804992676, "global_step": 53445, "epoch": 1272} {"train_loss": -5.768885612487793, "global_step": 53446, "epoch": 1272} {"train_loss": -5.792498588562012, "global_step": 53447, "epoch": 1272} {"train_loss": -5.651763439178467, "global_step": 53448, "epoch": 1272} {"train_loss": -5.781058311462402, "global_step": 53449, "epoch": 1272} {"train_loss": -5.8633503913879395, "global_step": 53450, "epoch": 1272} {"train_loss": -5.743315696716309, "global_step": 53451, "epoch": 1272} {"train_loss": -5.737529754638672, "global_step": 53452, "epoch": 1272} {"train_loss": -5.761482238769531, "global_step": 53453, "epoch": 1272} {"train_loss": -5.806825160980225, "global_step": 53454, "epoch": 1272} {"train_loss": -5.819210529327393, "global_step": 53455, "epoch": 1272} {"train_loss": -5.761910438537598, "global_step": 53456, "epoch": 1272} {"train_loss": -5.836462020874023, "global_step": 53457, "epoch": 1272} {"train_loss": -5.773889541625977, "global_step": 53458, "epoch": 1272} {"train_loss": -5.730990409851074, "global_step": 53459, "epoch": 1272} {"train_loss": -5.828159809112549, "global_step": 53460, "epoch": 1272} {"train_loss": -5.785201549530029, "global_step": 53461, "epoch": 1272} {"train_loss": -5.482967376708984, "global_step": 53462, "epoch": 1272} {"train_loss": -5.979087829589844, "global_step": 53463, "epoch": 1272} {"train_loss": -5.724793434143066, "global_step": 53464, "epoch": 1272} {"train_loss": -5.7760243983495805, "global_step": 53465, "epoch": 1272, "val_loss": 66511.609375} {"train_loss": -5.740389823913574, "global_step": 53466, "epoch": 1273} {"train_loss": -5.619052886962891, "global_step": 53467, "epoch": 1273} {"train_loss": -5.80496883392334, "global_step": 53468, "epoch": 1273} {"train_loss": -5.617162704467773, "global_step": 53469, "epoch": 1273} {"train_loss": -5.808780670166016, "global_step": 53470, "epoch": 1273} {"train_loss": -5.761138916015625, "global_step": 53471, "epoch": 1273} {"train_loss": -5.611811637878418, "global_step": 53472, "epoch": 1273} {"train_loss": -5.67570686340332, "global_step": 53473, "epoch": 1273} {"train_loss": -5.823065757751465, "global_step": 53474, "epoch": 1273} {"train_loss": -5.8188629150390625, "global_step": 53475, "epoch": 1273} {"train_loss": -5.739500999450684, "global_step": 53476, "epoch": 1273} {"train_loss": -5.811887741088867, "global_step": 53477, "epoch": 1273} {"train_loss": -5.8452959060668945, "global_step": 53478, "epoch": 1273} {"train_loss": -5.839611530303955, "global_step": 53479, "epoch": 1273} {"train_loss": -5.753906726837158, "global_step": 53480, "epoch": 1273} {"train_loss": -5.871823310852051, "global_step": 53481, "epoch": 1273} {"train_loss": -5.797198295593262, "global_step": 53482, "epoch": 1273} {"train_loss": -5.915997505187988, "global_step": 53483, "epoch": 1273} {"train_loss": -5.702789306640625, "global_step": 53484, "epoch": 1273} {"train_loss": -5.771172523498535, "global_step": 53485, "epoch": 1273} {"train_loss": -5.821195125579834, "global_step": 53486, "epoch": 1273} {"train_loss": -5.789544105529785, "global_step": 53487, "epoch": 1273} {"train_loss": -5.824590682983398, "global_step": 53488, "epoch": 1273} {"train_loss": -5.72259521484375, "global_step": 53489, "epoch": 1273} {"train_loss": -5.8421430587768555, "global_step": 53490, "epoch": 1273} {"train_loss": -5.629693031311035, "global_step": 53491, "epoch": 1273} {"train_loss": -5.772271156311035, "global_step": 53492, "epoch": 1273} {"train_loss": -5.770137786865234, "global_step": 53493, "epoch": 1273} {"train_loss": -5.797669410705566, "global_step": 53494, "epoch": 1273} {"train_loss": -5.7220611572265625, "global_step": 53495, "epoch": 1273} {"train_loss": -5.759997367858887, "global_step": 53496, "epoch": 1273} {"train_loss": -5.84470272064209, "global_step": 53497, "epoch": 1273} {"train_loss": -5.87324333190918, "global_step": 53498, "epoch": 1273} {"train_loss": -5.766289710998535, "global_step": 53499, "epoch": 1273} {"train_loss": -5.7707109451293945, "global_step": 53500, "epoch": 1273} {"train_loss": -5.739680290222168, "global_step": 53501, "epoch": 1273} {"train_loss": -5.906136512756348, "global_step": 53502, "epoch": 1273} {"train_loss": -5.836716651916504, "global_step": 53503, "epoch": 1273} {"train_loss": -5.800617218017578, "global_step": 53504, "epoch": 1273} {"train_loss": -5.845567226409912, "global_step": 53505, "epoch": 1273} {"train_loss": -5.795403480529785, "global_step": 53506, "epoch": 1273} {"train_loss": -5.776477552595592, "global_step": 53507, "epoch": 1273, "val_loss": 66281.6484375} {"train_loss": -5.717401504516602, "global_step": 53508, "epoch": 1274} {"train_loss": -5.852998733520508, "global_step": 53509, "epoch": 1274} {"train_loss": -5.7621564865112305, "global_step": 53510, "epoch": 1274} {"train_loss": -5.780139923095703, "global_step": 53511, "epoch": 1274} {"train_loss": -5.813555717468262, "global_step": 53512, "epoch": 1274} {"train_loss": -5.893335342407227, "global_step": 53513, "epoch": 1274} {"train_loss": -5.9152398109436035, "global_step": 53514, "epoch": 1274} {"train_loss": -5.791784286499023, "global_step": 53515, "epoch": 1274} {"train_loss": -5.82503604888916, "global_step": 53516, "epoch": 1274} {"train_loss": -5.864479064941406, "global_step": 53517, "epoch": 1274} {"train_loss": -5.685215473175049, "global_step": 53518, "epoch": 1274} {"train_loss": -5.951041221618652, "global_step": 53519, "epoch": 1274} {"train_loss": -5.592320442199707, "global_step": 53520, "epoch": 1274} {"train_loss": -5.845910549163818, "global_step": 53521, "epoch": 1274} {"train_loss": -5.8004984855651855, "global_step": 53522, "epoch": 1274} {"train_loss": -5.6892828941345215, "global_step": 53523, "epoch": 1274} {"train_loss": -5.923444747924805, "global_step": 53524, "epoch": 1274} {"train_loss": -5.825159072875977, "global_step": 53525, "epoch": 1274} {"train_loss": -5.658243179321289, "global_step": 53526, "epoch": 1274} {"train_loss": -5.7664055824279785, "global_step": 53527, "epoch": 1274} {"train_loss": -5.7499237060546875, "global_step": 53528, "epoch": 1274} {"train_loss": -5.784497261047363, "global_step": 53529, "epoch": 1274} {"train_loss": -5.691518783569336, "global_step": 53530, "epoch": 1274} {"train_loss": -5.798914432525635, "global_step": 53531, "epoch": 1274} {"train_loss": -5.945422649383545, "global_step": 53532, "epoch": 1274} {"train_loss": -5.68084192276001, "global_step": 53533, "epoch": 1274} {"train_loss": -5.874482154846191, "global_step": 53534, "epoch": 1274} {"train_loss": -5.740781784057617, "global_step": 53535, "epoch": 1274} {"train_loss": -5.883437156677246, "global_step": 53536, "epoch": 1274} {"train_loss": -5.816291332244873, "global_step": 53537, "epoch": 1274} {"train_loss": -5.6820502281188965, "global_step": 53538, "epoch": 1274} {"train_loss": -5.850108623504639, "global_step": 53539, "epoch": 1274} {"train_loss": -5.766777038574219, "global_step": 53540, "epoch": 1274} {"train_loss": -5.7914228439331055, "global_step": 53541, "epoch": 1274} {"train_loss": -5.746660232543945, "global_step": 53542, "epoch": 1274} {"train_loss": -5.764624118804932, "global_step": 53543, "epoch": 1274} {"train_loss": -5.908300876617432, "global_step": 53544, "epoch": 1274} {"train_loss": -5.784196376800537, "global_step": 53545, "epoch": 1274} {"train_loss": -5.762669563293457, "global_step": 53546, "epoch": 1274} {"train_loss": -5.836908340454102, "global_step": 53547, "epoch": 1274} {"train_loss": -5.761335372924805, "global_step": 53548, "epoch": 1274} {"train_loss": -5.793470473516555, "global_step": 53549, "epoch": 1274, "val_loss": 66682.8671875} {"train_loss": -5.754157066345215, "global_step": 53550, "epoch": 1275} {"train_loss": -5.872004508972168, "global_step": 53551, "epoch": 1275} {"train_loss": -5.681937217712402, "global_step": 53552, "epoch": 1275} {"train_loss": -5.855939865112305, "global_step": 53553, "epoch": 1275} {"train_loss": -5.803351402282715, "global_step": 53554, "epoch": 1275} {"train_loss": -5.89634895324707, "global_step": 53555, "epoch": 1275} {"train_loss": -5.765752792358398, "global_step": 53556, "epoch": 1275} {"train_loss": -5.847369194030762, "global_step": 53557, "epoch": 1275} {"train_loss": -5.910986423492432, "global_step": 53558, "epoch": 1275} {"train_loss": -5.784808158874512, "global_step": 53559, "epoch": 1275} {"train_loss": -5.950323104858398, "global_step": 53560, "epoch": 1275} {"train_loss": -5.821978569030762, "global_step": 53561, "epoch": 1275} {"train_loss": -5.648201942443848, "global_step": 53562, "epoch": 1275} {"train_loss": -5.817065238952637, "global_step": 53563, "epoch": 1275} {"train_loss": -5.813125133514404, "global_step": 53564, "epoch": 1275} {"train_loss": -5.820753574371338, "global_step": 53565, "epoch": 1275} {"train_loss": -5.838561058044434, "global_step": 53566, "epoch": 1275} {"train_loss": -5.895163536071777, "global_step": 53567, "epoch": 1275} {"train_loss": -5.890979766845703, "global_step": 53568, "epoch": 1275} {"train_loss": -5.864989280700684, "global_step": 53569, "epoch": 1275} {"train_loss": -5.880355358123779, "global_step": 53570, "epoch": 1275} {"train_loss": -5.8187150955200195, "global_step": 53571, "epoch": 1275} {"train_loss": -5.952817916870117, "global_step": 53572, "epoch": 1275} {"train_loss": -5.709765434265137, "global_step": 53573, "epoch": 1275} {"train_loss": -5.913759231567383, "global_step": 53574, "epoch": 1275} {"train_loss": -5.694518089294434, "global_step": 53575, "epoch": 1275} {"train_loss": -5.836788654327393, "global_step": 53576, "epoch": 1275} {"train_loss": -5.749821186065674, "global_step": 53577, "epoch": 1275} {"train_loss": -5.8252081871032715, "global_step": 53578, "epoch": 1275} {"train_loss": -5.8154802322387695, "global_step": 53579, "epoch": 1275} {"train_loss": -5.718714714050293, "global_step": 53580, "epoch": 1275} {"train_loss": -5.721776008605957, "global_step": 53581, "epoch": 1275} {"train_loss": -5.833080291748047, "global_step": 53582, "epoch": 1275} {"train_loss": -5.8801469802856445, "global_step": 53583, "epoch": 1275} {"train_loss": -5.964095115661621, "global_step": 53584, "epoch": 1275} {"train_loss": -5.808193683624268, "global_step": 53585, "epoch": 1275} {"train_loss": -5.7895708084106445, "global_step": 53586, "epoch": 1275} {"train_loss": -5.756262302398682, "global_step": 53587, "epoch": 1275} {"train_loss": -5.818594932556152, "global_step": 53588, "epoch": 1275} {"train_loss": -5.882144927978516, "global_step": 53589, "epoch": 1275} {"train_loss": -5.7155866622924805, "global_step": 53590, "epoch": 1275} {"train_loss": -5.817643438066755, "global_step": 53591, "epoch": 1275, "val_loss": 66396.8046875} {"train_loss": -5.884055137634277, "global_step": 53592, "epoch": 1276} {"train_loss": -5.878824710845947, "global_step": 53593, "epoch": 1276} {"train_loss": -5.963186264038086, "global_step": 53594, "epoch": 1276} {"train_loss": -5.726254940032959, "global_step": 53595, "epoch": 1276} {"train_loss": -5.784421920776367, "global_step": 53596, "epoch": 1276} {"train_loss": -5.671370506286621, "global_step": 53597, "epoch": 1276} {"train_loss": -5.85389518737793, "global_step": 53598, "epoch": 1276} {"train_loss": -5.780645370483398, "global_step": 53599, "epoch": 1276} {"train_loss": -5.811361789703369, "global_step": 53600, "epoch": 1276} {"train_loss": -5.823822021484375, "global_step": 53601, "epoch": 1276} {"train_loss": -5.892806053161621, "global_step": 53602, "epoch": 1276} {"train_loss": -5.883048057556152, "global_step": 53603, "epoch": 1276} {"train_loss": -5.835270404815674, "global_step": 53604, "epoch": 1276} {"train_loss": -5.907323837280273, "global_step": 53605, "epoch": 1276} {"train_loss": -5.7441630363464355, "global_step": 53606, "epoch": 1276} {"train_loss": -5.911334037780762, "global_step": 53607, "epoch": 1276} {"train_loss": -5.814450263977051, "global_step": 53608, "epoch": 1276} {"train_loss": -5.830324172973633, "global_step": 53609, "epoch": 1276} {"train_loss": -5.7477850914001465, "global_step": 53610, "epoch": 1276} {"train_loss": -5.7535600662231445, "global_step": 53611, "epoch": 1276} {"train_loss": -5.897989273071289, "global_step": 53612, "epoch": 1276} {"train_loss": -5.717280387878418, "global_step": 53613, "epoch": 1276} {"train_loss": -5.759918212890625, "global_step": 53614, "epoch": 1276} {"train_loss": -5.881704330444336, "global_step": 53615, "epoch": 1276} {"train_loss": -5.647027492523193, "global_step": 53616, "epoch": 1276} {"train_loss": -5.8175554275512695, "global_step": 53617, "epoch": 1276} {"train_loss": -5.785332679748535, "global_step": 53618, "epoch": 1276} {"train_loss": -5.804624080657959, "global_step": 53619, "epoch": 1276} {"train_loss": -5.805275917053223, "global_step": 53620, "epoch": 1276} {"train_loss": -5.821620464324951, "global_step": 53621, "epoch": 1276} {"train_loss": -5.684626579284668, "global_step": 53622, "epoch": 1276} {"train_loss": -5.643044471740723, "global_step": 53623, "epoch": 1276} {"train_loss": -5.6649580001831055, "global_step": 53624, "epoch": 1276} {"train_loss": -5.632305145263672, "global_step": 53625, "epoch": 1276} {"train_loss": -5.676243305206299, "global_step": 53626, "epoch": 1276} {"train_loss": -5.759274482727051, "global_step": 53627, "epoch": 1276} {"train_loss": -5.66500997543335, "global_step": 53628, "epoch": 1276} {"train_loss": -5.648493766784668, "global_step": 53629, "epoch": 1276} {"train_loss": -5.726273536682129, "global_step": 53630, "epoch": 1276} {"train_loss": -5.837252616882324, "global_step": 53631, "epoch": 1276} {"train_loss": -5.756624221801758, "global_step": 53632, "epoch": 1276} {"train_loss": -5.783868437721615, "global_step": 53633, "epoch": 1276, "val_loss": 66404.7734375} {"train_loss": -5.837282180786133, "global_step": 53634, "epoch": 1277} {"train_loss": -5.813899517059326, "global_step": 53635, "epoch": 1277} {"train_loss": -5.906650543212891, "global_step": 53636, "epoch": 1277} {"train_loss": -5.782351493835449, "global_step": 53637, "epoch": 1277} {"train_loss": -5.782645225524902, "global_step": 53638, "epoch": 1277} {"train_loss": -5.749648094177246, "global_step": 53639, "epoch": 1277} {"train_loss": -5.759363174438477, "global_step": 53640, "epoch": 1277} {"train_loss": -5.905872344970703, "global_step": 53641, "epoch": 1277} {"train_loss": -5.81913423538208, "global_step": 53642, "epoch": 1277} {"train_loss": -5.814917087554932, "global_step": 53643, "epoch": 1277} {"train_loss": -5.741250514984131, "global_step": 53644, "epoch": 1277} {"train_loss": -5.812603950500488, "global_step": 53645, "epoch": 1277} {"train_loss": -5.940043926239014, "global_step": 53646, "epoch": 1277} {"train_loss": -5.796623229980469, "global_step": 53647, "epoch": 1277} {"train_loss": -5.869362831115723, "global_step": 53648, "epoch": 1277} {"train_loss": -5.823914051055908, "global_step": 53649, "epoch": 1277} {"train_loss": -5.797231674194336, "global_step": 53650, "epoch": 1277} {"train_loss": -5.7329511642456055, "global_step": 53651, "epoch": 1277} {"train_loss": -5.733797073364258, "global_step": 53652, "epoch": 1277} {"train_loss": -5.930375099182129, "global_step": 53653, "epoch": 1277} {"train_loss": -5.922021865844727, "global_step": 53654, "epoch": 1277} {"train_loss": -5.747622966766357, "global_step": 53655, "epoch": 1277} {"train_loss": -5.844577789306641, "global_step": 53656, "epoch": 1277} {"train_loss": -5.815435409545898, "global_step": 53657, "epoch": 1277} {"train_loss": -5.740373611450195, "global_step": 53658, "epoch": 1277} {"train_loss": -5.83099889755249, "global_step": 53659, "epoch": 1277} {"train_loss": -5.882681369781494, "global_step": 53660, "epoch": 1277} {"train_loss": -5.773681640625, "global_step": 53661, "epoch": 1277} {"train_loss": -5.754915237426758, "global_step": 53662, "epoch": 1277} {"train_loss": -5.802850723266602, "global_step": 53663, "epoch": 1277} {"train_loss": -5.757163047790527, "global_step": 53664, "epoch": 1277} {"train_loss": -5.760804176330566, "global_step": 53665, "epoch": 1277} {"train_loss": -5.729124546051025, "global_step": 53666, "epoch": 1277} {"train_loss": -5.890974044799805, "global_step": 53667, "epoch": 1277} {"train_loss": -5.9780988693237305, "global_step": 53668, "epoch": 1277} {"train_loss": -5.940278053283691, "global_step": 53669, "epoch": 1277} {"train_loss": -5.786186218261719, "global_step": 53670, "epoch": 1277} {"train_loss": -5.6616363525390625, "global_step": 53671, "epoch": 1277} {"train_loss": -5.958493232727051, "global_step": 53672, "epoch": 1277} {"train_loss": -5.836828231811523, "global_step": 53673, "epoch": 1277} {"train_loss": -5.777318000793457, "global_step": 53674, "epoch": 1277} {"train_loss": -5.819958959306989, "global_step": 53675, "epoch": 1277, "val_loss": 66278.203125} {"train_loss": -5.833782196044922, "global_step": 53676, "epoch": 1278} {"train_loss": -5.7669267654418945, "global_step": 53677, "epoch": 1278} {"train_loss": -5.80885124206543, "global_step": 53678, "epoch": 1278} {"train_loss": -5.83390998840332, "global_step": 53679, "epoch": 1278} {"train_loss": -5.8000922203063965, "global_step": 53680, "epoch": 1278} {"train_loss": -5.879843711853027, "global_step": 53681, "epoch": 1278} {"train_loss": -5.835722923278809, "global_step": 53682, "epoch": 1278} {"train_loss": -5.794491767883301, "global_step": 53683, "epoch": 1278} {"train_loss": -5.763236999511719, "global_step": 53684, "epoch": 1278} {"train_loss": -5.881984233856201, "global_step": 53685, "epoch": 1278} {"train_loss": -5.907401084899902, "global_step": 53686, "epoch": 1278} {"train_loss": -5.799980640411377, "global_step": 53687, "epoch": 1278} {"train_loss": -5.751225471496582, "global_step": 53688, "epoch": 1278} {"train_loss": -5.778424263000488, "global_step": 53689, "epoch": 1278} {"train_loss": -5.79097843170166, "global_step": 53690, "epoch": 1278} {"train_loss": -5.8901801109313965, "global_step": 53691, "epoch": 1278} {"train_loss": -5.7138872146606445, "global_step": 53692, "epoch": 1278} {"train_loss": -5.87842321395874, "global_step": 53693, "epoch": 1278} {"train_loss": -5.70197868347168, "global_step": 53694, "epoch": 1278} {"train_loss": -5.779122829437256, "global_step": 53695, "epoch": 1278} {"train_loss": -5.718931198120117, "global_step": 53696, "epoch": 1278} {"train_loss": -5.744132041931152, "global_step": 53697, "epoch": 1278} {"train_loss": -5.864907264709473, "global_step": 53698, "epoch": 1278} {"train_loss": -5.8644609451293945, "global_step": 53699, "epoch": 1278} {"train_loss": -5.780828475952148, "global_step": 53700, "epoch": 1278} {"train_loss": -5.733709335327148, "global_step": 53701, "epoch": 1278} {"train_loss": -5.823408126831055, "global_step": 53702, "epoch": 1278} {"train_loss": -5.837800979614258, "global_step": 53703, "epoch": 1278} {"train_loss": -5.897273063659668, "global_step": 53704, "epoch": 1278} {"train_loss": -5.76892614364624, "global_step": 53705, "epoch": 1278} {"train_loss": -5.899432182312012, "global_step": 53706, "epoch": 1278} {"train_loss": -5.93994140625, "global_step": 53707, "epoch": 1278} {"train_loss": -5.899136066436768, "global_step": 53708, "epoch": 1278} {"train_loss": -5.753334999084473, "global_step": 53709, "epoch": 1278} {"train_loss": -5.903285503387451, "global_step": 53710, "epoch": 1278} {"train_loss": -5.849323272705078, "global_step": 53711, "epoch": 1278} {"train_loss": -5.755692958831787, "global_step": 53712, "epoch": 1278} {"train_loss": -5.771923065185547, "global_step": 53713, "epoch": 1278} {"train_loss": -5.795819282531738, "global_step": 53714, "epoch": 1278} {"train_loss": -5.824228286743164, "global_step": 53715, "epoch": 1278} {"train_loss": -5.884362697601318, "global_step": 53716, "epoch": 1278} {"train_loss": -5.81137356303987, "global_step": 53717, "epoch": 1278, "val_loss": 66550.96875} {"train_loss": -5.705259323120117, "global_step": 53718, "epoch": 1279} {"train_loss": -5.822373390197754, "global_step": 53719, "epoch": 1279} {"train_loss": -5.7866997718811035, "global_step": 53720, "epoch": 1279} {"train_loss": -5.729983329772949, "global_step": 53721, "epoch": 1279} {"train_loss": -5.745041847229004, "global_step": 53722, "epoch": 1279} {"train_loss": -5.827722549438477, "global_step": 53723, "epoch": 1279} {"train_loss": -5.824239253997803, "global_step": 53724, "epoch": 1279} {"train_loss": -5.755181312561035, "global_step": 53725, "epoch": 1279} {"train_loss": -5.706418991088867, "global_step": 53726, "epoch": 1279} {"train_loss": -5.737326622009277, "global_step": 53727, "epoch": 1279} {"train_loss": -5.703309059143066, "global_step": 53728, "epoch": 1279} {"train_loss": -5.797136306762695, "global_step": 53729, "epoch": 1279} {"train_loss": -5.778425693511963, "global_step": 53730, "epoch": 1279} {"train_loss": -5.655959129333496, "global_step": 53731, "epoch": 1279} {"train_loss": -5.7020721435546875, "global_step": 53732, "epoch": 1279} {"train_loss": -5.667840957641602, "global_step": 53733, "epoch": 1279} {"train_loss": -5.889200210571289, "global_step": 53734, "epoch": 1279} {"train_loss": -5.843268394470215, "global_step": 53735, "epoch": 1279} {"train_loss": -5.867403507232666, "global_step": 53736, "epoch": 1279} {"train_loss": -5.7544097900390625, "global_step": 53737, "epoch": 1279} {"train_loss": -5.729536056518555, "global_step": 53738, "epoch": 1279} {"train_loss": -5.723228454589844, "global_step": 53739, "epoch": 1279} {"train_loss": -5.802097320556641, "global_step": 53740, "epoch": 1279} {"train_loss": -5.824856758117676, "global_step": 53741, "epoch": 1279} {"train_loss": -5.917325973510742, "global_step": 53742, "epoch": 1279} {"train_loss": -5.95298433303833, "global_step": 53743, "epoch": 1279} {"train_loss": -5.700675010681152, "global_step": 53744, "epoch": 1279} {"train_loss": -5.880805015563965, "global_step": 53745, "epoch": 1279} {"train_loss": -5.761442184448242, "global_step": 53746, "epoch": 1279} {"train_loss": -5.721820831298828, "global_step": 53747, "epoch": 1279} {"train_loss": -5.692612648010254, "global_step": 53748, "epoch": 1279} {"train_loss": -5.748753070831299, "global_step": 53749, "epoch": 1279} {"train_loss": -5.792399883270264, "global_step": 53750, "epoch": 1279} {"train_loss": -5.824293613433838, "global_step": 53751, "epoch": 1279} {"train_loss": -5.750816345214844, "global_step": 53752, "epoch": 1279} {"train_loss": -5.8092474937438965, "global_step": 53753, "epoch": 1279} {"train_loss": -5.800164699554443, "global_step": 53754, "epoch": 1279} {"train_loss": -5.840190410614014, "global_step": 53755, "epoch": 1279} {"train_loss": -5.729050636291504, "global_step": 53756, "epoch": 1279} {"train_loss": -5.838611602783203, "global_step": 53757, "epoch": 1279} {"train_loss": -5.7750043869018555, "global_step": 53758, "epoch": 1279} {"train_loss": -5.779378720692226, "global_step": 53759, "epoch": 1279, "val_loss": 66326.765625} {"train_loss": -5.87308931350708, "global_step": 53760, "epoch": 1280} {"train_loss": -5.794497966766357, "global_step": 53761, "epoch": 1280} {"train_loss": -5.815749168395996, "global_step": 53762, "epoch": 1280} {"train_loss": -5.822908878326416, "global_step": 53763, "epoch": 1280} {"train_loss": -5.826668739318848, "global_step": 53764, "epoch": 1280} {"train_loss": -5.863476753234863, "global_step": 53765, "epoch": 1280} {"train_loss": -5.824915885925293, "global_step": 53766, "epoch": 1280} {"train_loss": -5.797536373138428, "global_step": 53767, "epoch": 1280} {"train_loss": -5.718769073486328, "global_step": 53768, "epoch": 1280} {"train_loss": -5.638945579528809, "global_step": 53769, "epoch": 1280} {"train_loss": -5.80784797668457, "global_step": 53770, "epoch": 1280} {"train_loss": -5.799222469329834, "global_step": 53771, "epoch": 1280} {"train_loss": -5.973213195800781, "global_step": 53772, "epoch": 1280} {"train_loss": -5.728399276733398, "global_step": 53773, "epoch": 1280} {"train_loss": -5.776145935058594, "global_step": 53774, "epoch": 1280} {"train_loss": -5.821959018707275, "global_step": 53775, "epoch": 1280} {"train_loss": -5.864675521850586, "global_step": 53776, "epoch": 1280} {"train_loss": -5.8290205001831055, "global_step": 53777, "epoch": 1280} {"train_loss": -5.8803181648254395, "global_step": 53778, "epoch": 1280} {"train_loss": -5.750044345855713, "global_step": 53779, "epoch": 1280} {"train_loss": -5.789519309997559, "global_step": 53780, "epoch": 1280} {"train_loss": -5.788512229919434, "global_step": 53781, "epoch": 1280} {"train_loss": -5.841123580932617, "global_step": 53782, "epoch": 1280} {"train_loss": -5.713442802429199, "global_step": 53783, "epoch": 1280} {"train_loss": -5.720498085021973, "global_step": 53784, "epoch": 1280} {"train_loss": -5.759357452392578, "global_step": 53785, "epoch": 1280} {"train_loss": -5.776434421539307, "global_step": 53786, "epoch": 1280} {"train_loss": -5.666613578796387, "global_step": 53787, "epoch": 1280} {"train_loss": -5.867159843444824, "global_step": 53788, "epoch": 1280} {"train_loss": -5.74433708190918, "global_step": 53789, "epoch": 1280} {"train_loss": -5.902438163757324, "global_step": 53790, "epoch": 1280} {"train_loss": -5.6351799964904785, "global_step": 53791, "epoch": 1280} {"train_loss": -5.8100786209106445, "global_step": 53792, "epoch": 1280} {"train_loss": -5.830920219421387, "global_step": 53793, "epoch": 1280} {"train_loss": -5.660155296325684, "global_step": 53794, "epoch": 1280} {"train_loss": -5.96435022354126, "global_step": 53795, "epoch": 1280} {"train_loss": -5.782636642456055, "global_step": 53796, "epoch": 1280} {"train_loss": -5.80616569519043, "global_step": 53797, "epoch": 1280} {"train_loss": -5.849055290222168, "global_step": 53798, "epoch": 1280} {"train_loss": -5.630612850189209, "global_step": 53799, "epoch": 1280} {"train_loss": -5.936202049255371, "global_step": 53800, "epoch": 1280} {"train_loss": -5.795106149855114, "global_step": 53801, "epoch": 1280, "val_loss": 66341.1171875} {"train_loss": -5.851381778717041, "global_step": 53802, "epoch": 1281} {"train_loss": -5.666095733642578, "global_step": 53803, "epoch": 1281} {"train_loss": -5.775607585906982, "global_step": 53804, "epoch": 1281} {"train_loss": -5.822648048400879, "global_step": 53805, "epoch": 1281} {"train_loss": -5.899808883666992, "global_step": 53806, "epoch": 1281} {"train_loss": -5.766913890838623, "global_step": 53807, "epoch": 1281} {"train_loss": -5.817893981933594, "global_step": 53808, "epoch": 1281} {"train_loss": -5.806545734405518, "global_step": 53809, "epoch": 1281} {"train_loss": -5.755772590637207, "global_step": 53810, "epoch": 1281} {"train_loss": -5.810963153839111, "global_step": 53811, "epoch": 1281} {"train_loss": -5.700836181640625, "global_step": 53812, "epoch": 1281} {"train_loss": -5.622988224029541, "global_step": 53813, "epoch": 1281} {"train_loss": -5.7792582511901855, "global_step": 53814, "epoch": 1281} {"train_loss": -5.762757778167725, "global_step": 53815, "epoch": 1281} {"train_loss": -5.604145050048828, "global_step": 53816, "epoch": 1281} {"train_loss": -5.871859550476074, "global_step": 53817, "epoch": 1281} {"train_loss": -5.6633100509643555, "global_step": 53818, "epoch": 1281} {"train_loss": -5.832071781158447, "global_step": 53819, "epoch": 1281} {"train_loss": -5.803022384643555, "global_step": 53820, "epoch": 1281} {"train_loss": -5.723689079284668, "global_step": 53821, "epoch": 1281} {"train_loss": -5.834994316101074, "global_step": 53822, "epoch": 1281} {"train_loss": -5.742373943328857, "global_step": 53823, "epoch": 1281} {"train_loss": -5.813442230224609, "global_step": 53824, "epoch": 1281} {"train_loss": -5.734036922454834, "global_step": 53825, "epoch": 1281} {"train_loss": -5.66170072555542, "global_step": 53826, "epoch": 1281} {"train_loss": -5.626874923706055, "global_step": 53827, "epoch": 1281} {"train_loss": -5.734173774719238, "global_step": 53828, "epoch": 1281} {"train_loss": -5.8727946281433105, "global_step": 53829, "epoch": 1281} {"train_loss": -5.8227152824401855, "global_step": 53830, "epoch": 1281} {"train_loss": -5.754059791564941, "global_step": 53831, "epoch": 1281} {"train_loss": -5.918422222137451, "global_step": 53832, "epoch": 1281} {"train_loss": -5.766173362731934, "global_step": 53833, "epoch": 1281} {"train_loss": -5.791320323944092, "global_step": 53834, "epoch": 1281} {"train_loss": -5.946874141693115, "global_step": 53835, "epoch": 1281} {"train_loss": -5.815057754516602, "global_step": 53836, "epoch": 1281} {"train_loss": -5.745687484741211, "global_step": 53837, "epoch": 1281} {"train_loss": -5.788143157958984, "global_step": 53838, "epoch": 1281} {"train_loss": -5.67617130279541, "global_step": 53839, "epoch": 1281} {"train_loss": -5.742210388183594, "global_step": 53840, "epoch": 1281} {"train_loss": -5.818150997161865, "global_step": 53841, "epoch": 1281} {"train_loss": -5.8695831298828125, "global_step": 53842, "epoch": 1281} {"train_loss": -5.7779615720113116, "global_step": 53843, "epoch": 1281, "val_loss": 66335.8984375} {"train_loss": -5.680780410766602, "global_step": 53844, "epoch": 1282} {"train_loss": -5.818874359130859, "global_step": 53845, "epoch": 1282} {"train_loss": -5.722817420959473, "global_step": 53846, "epoch": 1282} {"train_loss": -5.862115383148193, "global_step": 53847, "epoch": 1282} {"train_loss": -5.812761306762695, "global_step": 53848, "epoch": 1282} {"train_loss": -5.8704023361206055, "global_step": 53849, "epoch": 1282} {"train_loss": -5.834545612335205, "global_step": 53850, "epoch": 1282} {"train_loss": -5.808037281036377, "global_step": 53851, "epoch": 1282} {"train_loss": -5.823350429534912, "global_step": 53852, "epoch": 1282} {"train_loss": -5.828031063079834, "global_step": 53853, "epoch": 1282} {"train_loss": -5.800887107849121, "global_step": 53854, "epoch": 1282} {"train_loss": -5.84962272644043, "global_step": 53855, "epoch": 1282} {"train_loss": -5.69505500793457, "global_step": 53856, "epoch": 1282} {"train_loss": -5.99799919128418, "global_step": 53857, "epoch": 1282} {"train_loss": -5.8440985679626465, "global_step": 53858, "epoch": 1282} {"train_loss": -5.743825912475586, "global_step": 53859, "epoch": 1282} {"train_loss": -5.703192710876465, "global_step": 53860, "epoch": 1282} {"train_loss": -5.792837619781494, "global_step": 53861, "epoch": 1282} {"train_loss": -5.903508186340332, "global_step": 53862, "epoch": 1282} {"train_loss": -5.869397163391113, "global_step": 53863, "epoch": 1282} {"train_loss": -5.8071088790893555, "global_step": 53864, "epoch": 1282} {"train_loss": -5.759513854980469, "global_step": 53865, "epoch": 1282} {"train_loss": -5.799102306365967, "global_step": 53866, "epoch": 1282} {"train_loss": -5.82943868637085, "global_step": 53867, "epoch": 1282} {"train_loss": -5.857698440551758, "global_step": 53868, "epoch": 1282} {"train_loss": -5.879089832305908, "global_step": 53869, "epoch": 1282} {"train_loss": -5.861703872680664, "global_step": 53870, "epoch": 1282} {"train_loss": -5.8282151222229, "global_step": 53871, "epoch": 1282} {"train_loss": -5.946070671081543, "global_step": 53872, "epoch": 1282} {"train_loss": -5.790520668029785, "global_step": 53873, "epoch": 1282} {"train_loss": -5.646879196166992, "global_step": 53874, "epoch": 1282} {"train_loss": -5.785490036010742, "global_step": 53875, "epoch": 1282} {"train_loss": -5.793371200561523, "global_step": 53876, "epoch": 1282} {"train_loss": -5.75851583480835, "global_step": 53877, "epoch": 1282} {"train_loss": -5.871747016906738, "global_step": 53878, "epoch": 1282} {"train_loss": -5.839880466461182, "global_step": 53879, "epoch": 1282} {"train_loss": -5.8472676277160645, "global_step": 53880, "epoch": 1282} {"train_loss": -5.765268802642822, "global_step": 53881, "epoch": 1282} {"train_loss": -5.773377418518066, "global_step": 53882, "epoch": 1282} {"train_loss": -5.790569305419922, "global_step": 53883, "epoch": 1282} {"train_loss": -5.839898109436035, "global_step": 53884, "epoch": 1282} {"train_loss": -5.81162378901527, "global_step": 53885, "epoch": 1282, "val_loss": 66342.625} {"train_loss": -5.877326965332031, "global_step": 53886, "epoch": 1283} {"train_loss": -5.920879364013672, "global_step": 53887, "epoch": 1283} {"train_loss": -5.795229911804199, "global_step": 53888, "epoch": 1283} {"train_loss": -5.824653625488281, "global_step": 53889, "epoch": 1283} {"train_loss": -5.948179244995117, "global_step": 53890, "epoch": 1283} {"train_loss": -5.816605567932129, "global_step": 53891, "epoch": 1283} {"train_loss": -5.878354072570801, "global_step": 53892, "epoch": 1283} {"train_loss": -5.823966979980469, "global_step": 53893, "epoch": 1283} {"train_loss": -5.840200424194336, "global_step": 53894, "epoch": 1283} {"train_loss": -5.864327430725098, "global_step": 53895, "epoch": 1283} {"train_loss": -5.874396324157715, "global_step": 53896, "epoch": 1283} {"train_loss": -5.8056535720825195, "global_step": 53897, "epoch": 1283} {"train_loss": -5.859633922576904, "global_step": 53898, "epoch": 1283} {"train_loss": -5.855768203735352, "global_step": 53899, "epoch": 1283} {"train_loss": -5.870723724365234, "global_step": 53900, "epoch": 1283} {"train_loss": -5.869245529174805, "global_step": 53901, "epoch": 1283} {"train_loss": -5.841952323913574, "global_step": 53902, "epoch": 1283} {"train_loss": -5.824556350708008, "global_step": 53903, "epoch": 1283} {"train_loss": -5.925060272216797, "global_step": 53904, "epoch": 1283} {"train_loss": -5.939521789550781, "global_step": 53905, "epoch": 1283} {"train_loss": -5.7566633224487305, "global_step": 53906, "epoch": 1283} {"train_loss": -5.7983903884887695, "global_step": 53907, "epoch": 1283} {"train_loss": -5.740197658538818, "global_step": 53908, "epoch": 1283} {"train_loss": -5.816092491149902, "global_step": 53909, "epoch": 1283} {"train_loss": -5.869250297546387, "global_step": 53910, "epoch": 1283} {"train_loss": -5.76849365234375, "global_step": 53911, "epoch": 1283} {"train_loss": -5.9274091720581055, "global_step": 53912, "epoch": 1283} {"train_loss": -5.8049516677856445, "global_step": 53913, "epoch": 1283} {"train_loss": -5.716329574584961, "global_step": 53914, "epoch": 1283} {"train_loss": -5.859426975250244, "global_step": 53915, "epoch": 1283} {"train_loss": -5.731446743011475, "global_step": 53916, "epoch": 1283} {"train_loss": -5.692955017089844, "global_step": 53917, "epoch": 1283} {"train_loss": -5.798255920410156, "global_step": 53918, "epoch": 1283} {"train_loss": -5.7178497314453125, "global_step": 53919, "epoch": 1283} {"train_loss": -5.802423477172852, "global_step": 53920, "epoch": 1283} {"train_loss": -5.826053142547607, "global_step": 53921, "epoch": 1283} {"train_loss": -5.853997230529785, "global_step": 53922, "epoch": 1283} {"train_loss": -5.822508811950684, "global_step": 53923, "epoch": 1283} {"train_loss": -5.734095573425293, "global_step": 53924, "epoch": 1283} {"train_loss": -5.586503028869629, "global_step": 53925, "epoch": 1283} {"train_loss": -5.722060203552246, "global_step": 53926, "epoch": 1283} {"train_loss": -5.817083858308338, "global_step": 53927, "epoch": 1283, "val_loss": 66108.109375} {"train_loss": -5.8303117752075195, "global_step": 53928, "epoch": 1284} {"train_loss": -5.832150936126709, "global_step": 53929, "epoch": 1284} {"train_loss": -5.901752471923828, "global_step": 53930, "epoch": 1284} {"train_loss": -5.894162654876709, "global_step": 53931, "epoch": 1284} {"train_loss": -5.918816089630127, "global_step": 53932, "epoch": 1284} {"train_loss": -5.775993347167969, "global_step": 53933, "epoch": 1284} {"train_loss": -5.813291549682617, "global_step": 53934, "epoch": 1284} {"train_loss": -5.846059799194336, "global_step": 53935, "epoch": 1284} {"train_loss": -5.831682205200195, "global_step": 53936, "epoch": 1284} {"train_loss": -5.747574329376221, "global_step": 53937, "epoch": 1284} {"train_loss": -5.763875484466553, "global_step": 53938, "epoch": 1284} {"train_loss": -5.905939102172852, "global_step": 53939, "epoch": 1284} {"train_loss": -5.794388771057129, "global_step": 53940, "epoch": 1284} {"train_loss": -5.777655601501465, "global_step": 53941, "epoch": 1284} {"train_loss": -5.797791481018066, "global_step": 53942, "epoch": 1284} {"train_loss": -5.680962085723877, "global_step": 53943, "epoch": 1284} {"train_loss": -5.755184173583984, "global_step": 53944, "epoch": 1284} {"train_loss": -5.778430938720703, "global_step": 53945, "epoch": 1284} {"train_loss": -5.653693199157715, "global_step": 53946, "epoch": 1284} {"train_loss": -5.820710182189941, "global_step": 53947, "epoch": 1284} {"train_loss": -5.735437393188477, "global_step": 53948, "epoch": 1284} {"train_loss": -5.87722110748291, "global_step": 53949, "epoch": 1284} {"train_loss": -5.8423027992248535, "global_step": 53950, "epoch": 1284} {"train_loss": -5.725594520568848, "global_step": 53951, "epoch": 1284} {"train_loss": -5.73209810256958, "global_step": 53952, "epoch": 1284} {"train_loss": -5.714689254760742, "global_step": 53953, "epoch": 1284} {"train_loss": -5.873913288116455, "global_step": 53954, "epoch": 1284} {"train_loss": -5.80015754699707, "global_step": 53955, "epoch": 1284} {"train_loss": -5.597935199737549, "global_step": 53956, "epoch": 1284} {"train_loss": -5.751408576965332, "global_step": 53957, "epoch": 1284} {"train_loss": -5.812583923339844, "global_step": 53958, "epoch": 1284} {"train_loss": -5.823948860168457, "global_step": 53959, "epoch": 1284} {"train_loss": -5.741907596588135, "global_step": 53960, "epoch": 1284} {"train_loss": -5.959880828857422, "global_step": 53961, "epoch": 1284} {"train_loss": -5.725469589233398, "global_step": 53962, "epoch": 1284} {"train_loss": -5.673725128173828, "global_step": 53963, "epoch": 1284} {"train_loss": -5.900026321411133, "global_step": 53964, "epoch": 1284} {"train_loss": -5.747799873352051, "global_step": 53965, "epoch": 1284} {"train_loss": -5.7573561668396, "global_step": 53966, "epoch": 1284} {"train_loss": -5.772665023803711, "global_step": 53967, "epoch": 1284} {"train_loss": -5.862247467041016, "global_step": 53968, "epoch": 1284} {"train_loss": -5.791096153713408, "global_step": 53969, "epoch": 1284, "val_loss": 66185.25} {"train_loss": -5.834789752960205, "global_step": 53970, "epoch": 1285} {"train_loss": -5.805941104888916, "global_step": 53971, "epoch": 1285} {"train_loss": -5.746099472045898, "global_step": 53972, "epoch": 1285} {"train_loss": -5.907590866088867, "global_step": 53973, "epoch": 1285} {"train_loss": -5.750185489654541, "global_step": 53974, "epoch": 1285} {"train_loss": -5.8728251457214355, "global_step": 53975, "epoch": 1285} {"train_loss": -5.8462748527526855, "global_step": 53976, "epoch": 1285} {"train_loss": -5.73708963394165, "global_step": 53977, "epoch": 1285} {"train_loss": -5.841614723205566, "global_step": 53978, "epoch": 1285} {"train_loss": -5.783961296081543, "global_step": 53979, "epoch": 1285} {"train_loss": -5.979384422302246, "global_step": 53980, "epoch": 1285} {"train_loss": -5.8272175788879395, "global_step": 53981, "epoch": 1285} {"train_loss": -5.818388938903809, "global_step": 53982, "epoch": 1285} {"train_loss": -5.924153804779053, "global_step": 53983, "epoch": 1285} {"train_loss": -5.898376941680908, "global_step": 53984, "epoch": 1285} {"train_loss": -5.824348449707031, "global_step": 53985, "epoch": 1285} {"train_loss": -5.794619560241699, "global_step": 53986, "epoch": 1285} {"train_loss": -5.9555840492248535, "global_step": 53987, "epoch": 1285} {"train_loss": -5.816995620727539, "global_step": 53988, "epoch": 1285} {"train_loss": -5.807480812072754, "global_step": 53989, "epoch": 1285} {"train_loss": -5.84702205657959, "global_step": 53990, "epoch": 1285} {"train_loss": -5.922137260437012, "global_step": 53991, "epoch": 1285} {"train_loss": -5.810388565063477, "global_step": 53992, "epoch": 1285} {"train_loss": -5.81644344329834, "global_step": 53993, "epoch": 1285} {"train_loss": -5.810540676116943, "global_step": 53994, "epoch": 1285} {"train_loss": -5.874835014343262, "global_step": 53995, "epoch": 1285} {"train_loss": -5.765627861022949, "global_step": 53996, "epoch": 1285} {"train_loss": -5.814457893371582, "global_step": 53997, "epoch": 1285} {"train_loss": -5.734497547149658, "global_step": 53998, "epoch": 1285} {"train_loss": -5.848075866699219, "global_step": 53999, "epoch": 1285} {"train_loss": -5.843281269073486, "global_step": 54000, "epoch": 1285} {"train_loss": -5.793905258178711, "global_step": 54001, "epoch": 1285} {"train_loss": -5.889834403991699, "global_step": 54002, "epoch": 1285} {"train_loss": -5.838351249694824, "global_step": 54003, "epoch": 1285} {"train_loss": -5.833954811096191, "global_step": 54004, "epoch": 1285} {"train_loss": -5.738613128662109, "global_step": 54005, "epoch": 1285} {"train_loss": -5.916267395019531, "global_step": 54006, "epoch": 1285} {"train_loss": -5.750458717346191, "global_step": 54007, "epoch": 1285} {"train_loss": -5.801408767700195, "global_step": 54008, "epoch": 1285} {"train_loss": -5.800065040588379, "global_step": 54009, "epoch": 1285} {"train_loss": -5.658673286437988, "global_step": 54010, "epoch": 1285} {"train_loss": -5.8256969792502264, "global_step": 54011, "epoch": 1285, "val_loss": 66401.3203125} {"train_loss": -5.800850868225098, "global_step": 54012, "epoch": 1286} {"train_loss": -5.801687717437744, "global_step": 54013, "epoch": 1286} {"train_loss": -5.8345417976379395, "global_step": 54014, "epoch": 1286} {"train_loss": -5.845364570617676, "global_step": 54015, "epoch": 1286} {"train_loss": -5.825113296508789, "global_step": 54016, "epoch": 1286} {"train_loss": -5.857365608215332, "global_step": 54017, "epoch": 1286} {"train_loss": -5.909486293792725, "global_step": 54018, "epoch": 1286} {"train_loss": -5.8669023513793945, "global_step": 54019, "epoch": 1286} {"train_loss": -5.842940330505371, "global_step": 54020, "epoch": 1286} {"train_loss": -5.829938888549805, "global_step": 54021, "epoch": 1286} {"train_loss": -5.730644226074219, "global_step": 54022, "epoch": 1286} {"train_loss": -5.945254802703857, "global_step": 54023, "epoch": 1286} {"train_loss": -5.811496257781982, "global_step": 54024, "epoch": 1286} {"train_loss": -5.82753849029541, "global_step": 54025, "epoch": 1286} {"train_loss": -5.805280685424805, "global_step": 54026, "epoch": 1286} {"train_loss": -5.8377532958984375, "global_step": 54027, "epoch": 1286} {"train_loss": -5.830205917358398, "global_step": 54028, "epoch": 1286} {"train_loss": -5.756862640380859, "global_step": 54029, "epoch": 1286} {"train_loss": -5.795138359069824, "global_step": 54030, "epoch": 1286} {"train_loss": -5.844521522521973, "global_step": 54031, "epoch": 1286} {"train_loss": -5.679131507873535, "global_step": 54032, "epoch": 1286} {"train_loss": -5.748154640197754, "global_step": 54033, "epoch": 1286} {"train_loss": -5.812685966491699, "global_step": 54034, "epoch": 1286} {"train_loss": -5.731359481811523, "global_step": 54035, "epoch": 1286} {"train_loss": -5.81842041015625, "global_step": 54036, "epoch": 1286} {"train_loss": -5.790414333343506, "global_step": 54037, "epoch": 1286} {"train_loss": -5.850738525390625, "global_step": 54038, "epoch": 1286} {"train_loss": -5.833678245544434, "global_step": 54039, "epoch": 1286} {"train_loss": -5.845414161682129, "global_step": 54040, "epoch": 1286} {"train_loss": -5.793012619018555, "global_step": 54041, "epoch": 1286} {"train_loss": -5.8185648918151855, "global_step": 54042, "epoch": 1286} {"train_loss": -5.671809196472168, "global_step": 54043, "epoch": 1286} {"train_loss": -5.841156959533691, "global_step": 54044, "epoch": 1286} {"train_loss": -5.881435871124268, "global_step": 54045, "epoch": 1286} {"train_loss": -5.8793134689331055, "global_step": 54046, "epoch": 1286} {"train_loss": -5.82744026184082, "global_step": 54047, "epoch": 1286} {"train_loss": -5.785061359405518, "global_step": 54048, "epoch": 1286} {"train_loss": -5.81630802154541, "global_step": 54049, "epoch": 1286} {"train_loss": -5.904462814331055, "global_step": 54050, "epoch": 1286} {"train_loss": -5.727020263671875, "global_step": 54051, "epoch": 1286} {"train_loss": -5.828093528747559, "global_step": 54052, "epoch": 1286} {"train_loss": -5.820641108921596, "global_step": 54053, "epoch": 1286, "val_loss": 66359.7265625} {"train_loss": -5.862534999847412, "global_step": 54054, "epoch": 1287} {"train_loss": -5.8167524337768555, "global_step": 54055, "epoch": 1287} {"train_loss": -5.957015037536621, "global_step": 54056, "epoch": 1287} {"train_loss": -5.728716850280762, "global_step": 54057, "epoch": 1287} {"train_loss": -5.834676742553711, "global_step": 54058, "epoch": 1287} {"train_loss": -5.747909069061279, "global_step": 54059, "epoch": 1287} {"train_loss": -5.703973770141602, "global_step": 54060, "epoch": 1287} {"train_loss": -5.89127779006958, "global_step": 54061, "epoch": 1287} {"train_loss": -5.857638835906982, "global_step": 54062, "epoch": 1287} {"train_loss": -5.600992202758789, "global_step": 54063, "epoch": 1287} {"train_loss": -5.801787853240967, "global_step": 54064, "epoch": 1287} {"train_loss": -5.943808555603027, "global_step": 54065, "epoch": 1287} {"train_loss": -5.923114776611328, "global_step": 54066, "epoch": 1287} {"train_loss": -5.727649211883545, "global_step": 54067, "epoch": 1287} {"train_loss": -5.9303693771362305, "global_step": 54068, "epoch": 1287} {"train_loss": -5.877320289611816, "global_step": 54069, "epoch": 1287} {"train_loss": -5.718681335449219, "global_step": 54070, "epoch": 1287} {"train_loss": -5.796780586242676, "global_step": 54071, "epoch": 1287} {"train_loss": -5.727177143096924, "global_step": 54072, "epoch": 1287} {"train_loss": -5.692334175109863, "global_step": 54073, "epoch": 1287} {"train_loss": -5.7581987380981445, "global_step": 54074, "epoch": 1287} {"train_loss": -5.769067287445068, "global_step": 54075, "epoch": 1287} {"train_loss": -5.880832672119141, "global_step": 54076, "epoch": 1287} {"train_loss": -5.655011177062988, "global_step": 54077, "epoch": 1287} {"train_loss": -5.808169364929199, "global_step": 54078, "epoch": 1287} {"train_loss": -5.792759895324707, "global_step": 54079, "epoch": 1287} {"train_loss": -5.804635524749756, "global_step": 54080, "epoch": 1287} {"train_loss": -5.886750221252441, "global_step": 54081, "epoch": 1287} {"train_loss": -5.685783386230469, "global_step": 54082, "epoch": 1287} {"train_loss": -5.898192405700684, "global_step": 54083, "epoch": 1287} {"train_loss": -5.758488655090332, "global_step": 54084, "epoch": 1287} {"train_loss": -5.862653732299805, "global_step": 54085, "epoch": 1287} {"train_loss": -5.732425689697266, "global_step": 54086, "epoch": 1287} {"train_loss": -5.651457786560059, "global_step": 54087, "epoch": 1287} {"train_loss": -5.818029403686523, "global_step": 54088, "epoch": 1287} {"train_loss": -5.700138568878174, "global_step": 54089, "epoch": 1287} {"train_loss": -5.777070999145508, "global_step": 54090, "epoch": 1287} {"train_loss": -5.644370079040527, "global_step": 54091, "epoch": 1287} {"train_loss": -5.810972690582275, "global_step": 54092, "epoch": 1287} {"train_loss": -5.704412937164307, "global_step": 54093, "epoch": 1287} {"train_loss": -5.933079719543457, "global_step": 54094, "epoch": 1287} {"train_loss": -5.7923111120859785, "global_step": 54095, "epoch": 1287, "val_loss": 66641.7109375} {"train_loss": -5.745501518249512, "global_step": 54096, "epoch": 1288} {"train_loss": -5.82747745513916, "global_step": 54097, "epoch": 1288} {"train_loss": -5.762753486633301, "global_step": 54098, "epoch": 1288} {"train_loss": -5.790853500366211, "global_step": 54099, "epoch": 1288} {"train_loss": -5.812365531921387, "global_step": 54100, "epoch": 1288} {"train_loss": -5.821348190307617, "global_step": 54101, "epoch": 1288} {"train_loss": -5.714812278747559, "global_step": 54102, "epoch": 1288} {"train_loss": -5.807991981506348, "global_step": 54103, "epoch": 1288} {"train_loss": -5.773050308227539, "global_step": 54104, "epoch": 1288} {"train_loss": -5.819118499755859, "global_step": 54105, "epoch": 1288} {"train_loss": -5.775374412536621, "global_step": 54106, "epoch": 1288} {"train_loss": -5.751862525939941, "global_step": 54107, "epoch": 1288} {"train_loss": -5.762361526489258, "global_step": 54108, "epoch": 1288} {"train_loss": -5.654971122741699, "global_step": 54109, "epoch": 1288} {"train_loss": -5.749238014221191, "global_step": 54110, "epoch": 1288} {"train_loss": -5.814707279205322, "global_step": 54111, "epoch": 1288} {"train_loss": -5.733393669128418, "global_step": 54112, "epoch": 1288} {"train_loss": -5.6866326332092285, "global_step": 54113, "epoch": 1288} {"train_loss": -5.813676834106445, "global_step": 54114, "epoch": 1288} {"train_loss": -5.8071208000183105, "global_step": 54115, "epoch": 1288} {"train_loss": -5.692173004150391, "global_step": 54116, "epoch": 1288} {"train_loss": -5.719358921051025, "global_step": 54117, "epoch": 1288} {"train_loss": -5.631354331970215, "global_step": 54118, "epoch": 1288} {"train_loss": -5.919246196746826, "global_step": 54119, "epoch": 1288} {"train_loss": -5.644469261169434, "global_step": 54120, "epoch": 1288} {"train_loss": -5.771429061889648, "global_step": 54121, "epoch": 1288} {"train_loss": -5.791500091552734, "global_step": 54122, "epoch": 1288} {"train_loss": -5.824515342712402, "global_step": 54123, "epoch": 1288} {"train_loss": -5.7904534339904785, "global_step": 54124, "epoch": 1288} {"train_loss": -5.580014705657959, "global_step": 54125, "epoch": 1288} {"train_loss": -5.775323867797852, "global_step": 54126, "epoch": 1288} {"train_loss": -5.710840702056885, "global_step": 54127, "epoch": 1288} {"train_loss": -5.777480602264404, "global_step": 54128, "epoch": 1288} {"train_loss": -5.720094680786133, "global_step": 54129, "epoch": 1288} {"train_loss": -5.856259822845459, "global_step": 54130, "epoch": 1288} {"train_loss": -5.731966018676758, "global_step": 54131, "epoch": 1288} {"train_loss": -5.711535453796387, "global_step": 54132, "epoch": 1288} {"train_loss": -5.778417587280273, "global_step": 54133, "epoch": 1288} {"train_loss": -5.730016708374023, "global_step": 54134, "epoch": 1288} {"train_loss": -5.819063186645508, "global_step": 54135, "epoch": 1288} {"train_loss": -5.748812675476074, "global_step": 54136, "epoch": 1288} {"train_loss": -5.758256367274693, "global_step": 54137, "epoch": 1288, "val_loss": 67029.171875} {"train_loss": -5.886693000793457, "global_step": 54138, "epoch": 1289} {"train_loss": -5.722668647766113, "global_step": 54139, "epoch": 1289} {"train_loss": -5.695265769958496, "global_step": 54140, "epoch": 1289} {"train_loss": -5.723542213439941, "global_step": 54141, "epoch": 1289} {"train_loss": -5.714372634887695, "global_step": 54142, "epoch": 1289} {"train_loss": -5.713647842407227, "global_step": 54143, "epoch": 1289} {"train_loss": -5.598084449768066, "global_step": 54144, "epoch": 1289} {"train_loss": -5.747493743896484, "global_step": 54145, "epoch": 1289} {"train_loss": -5.815877437591553, "global_step": 54146, "epoch": 1289} {"train_loss": -5.814610958099365, "global_step": 54147, "epoch": 1289} {"train_loss": -5.890766143798828, "global_step": 54148, "epoch": 1289} {"train_loss": -5.849856376647949, "global_step": 54149, "epoch": 1289} {"train_loss": -5.814693927764893, "global_step": 54150, "epoch": 1289} {"train_loss": -5.906123161315918, "global_step": 54151, "epoch": 1289} {"train_loss": -5.848488807678223, "global_step": 54152, "epoch": 1289} {"train_loss": -5.78033447265625, "global_step": 54153, "epoch": 1289} {"train_loss": -5.851152420043945, "global_step": 54154, "epoch": 1289} {"train_loss": -5.838178634643555, "global_step": 54155, "epoch": 1289} {"train_loss": -5.866884231567383, "global_step": 54156, "epoch": 1289} {"train_loss": -5.919644832611084, "global_step": 54157, "epoch": 1289} {"train_loss": -5.869010925292969, "global_step": 54158, "epoch": 1289} {"train_loss": -5.741284370422363, "global_step": 54159, "epoch": 1289} {"train_loss": -5.756288528442383, "global_step": 54160, "epoch": 1289} {"train_loss": -5.693863868713379, "global_step": 54161, "epoch": 1289} {"train_loss": -5.6818413734436035, "global_step": 54162, "epoch": 1289} {"train_loss": -5.893943786621094, "global_step": 54163, "epoch": 1289} {"train_loss": -5.718213081359863, "global_step": 54164, "epoch": 1289} {"train_loss": -5.747776031494141, "global_step": 54165, "epoch": 1289} {"train_loss": -5.729759216308594, "global_step": 54166, "epoch": 1289} {"train_loss": -5.7639360427856445, "global_step": 54167, "epoch": 1289} {"train_loss": -5.715266227722168, "global_step": 54168, "epoch": 1289} {"train_loss": -5.826176166534424, "global_step": 54169, "epoch": 1289} {"train_loss": -5.792335033416748, "global_step": 54170, "epoch": 1289} {"train_loss": -5.827585220336914, "global_step": 54171, "epoch": 1289} {"train_loss": -5.774972915649414, "global_step": 54172, "epoch": 1289} {"train_loss": -5.813544273376465, "global_step": 54173, "epoch": 1289} {"train_loss": -5.756999969482422, "global_step": 54174, "epoch": 1289} {"train_loss": -5.7632975578308105, "global_step": 54175, "epoch": 1289} {"train_loss": -5.611954689025879, "global_step": 54176, "epoch": 1289} {"train_loss": -5.839144706726074, "global_step": 54177, "epoch": 1289} {"train_loss": -5.906402587890625, "global_step": 54178, "epoch": 1289} {"train_loss": -5.787204538072858, "global_step": 54179, "epoch": 1289, "val_loss": 66381.296875} {"train_loss": -5.782641410827637, "global_step": 54180, "epoch": 1290} {"train_loss": -5.946247100830078, "global_step": 54181, "epoch": 1290} {"train_loss": -5.831039905548096, "global_step": 54182, "epoch": 1290} {"train_loss": -5.790055274963379, "global_step": 54183, "epoch": 1290} {"train_loss": -5.922088146209717, "global_step": 54184, "epoch": 1290} {"train_loss": -5.776820659637451, "global_step": 54185, "epoch": 1290} {"train_loss": -5.801418781280518, "global_step": 54186, "epoch": 1290} {"train_loss": -5.858842849731445, "global_step": 54187, "epoch": 1290} {"train_loss": -5.962756156921387, "global_step": 54188, "epoch": 1290} {"train_loss": -5.836620330810547, "global_step": 54189, "epoch": 1290} {"train_loss": -5.848603248596191, "global_step": 54190, "epoch": 1290} {"train_loss": -5.672845840454102, "global_step": 54191, "epoch": 1290} {"train_loss": -5.658937454223633, "global_step": 54192, "epoch": 1290} {"train_loss": -5.592794418334961, "global_step": 54193, "epoch": 1290} {"train_loss": -5.8886260986328125, "global_step": 54194, "epoch": 1290} {"train_loss": -5.6350908279418945, "global_step": 54195, "epoch": 1290} {"train_loss": -5.777678489685059, "global_step": 54196, "epoch": 1290} {"train_loss": -5.6793622970581055, "global_step": 54197, "epoch": 1290} {"train_loss": -5.71884822845459, "global_step": 54198, "epoch": 1290} {"train_loss": -5.828641891479492, "global_step": 54199, "epoch": 1290} {"train_loss": -5.654579162597656, "global_step": 54200, "epoch": 1290} {"train_loss": -5.727150917053223, "global_step": 54201, "epoch": 1290} {"train_loss": -5.813991546630859, "global_step": 54202, "epoch": 1290} {"train_loss": -5.583095073699951, "global_step": 54203, "epoch": 1290} {"train_loss": -5.8343071937561035, "global_step": 54204, "epoch": 1290} {"train_loss": -5.628208637237549, "global_step": 54205, "epoch": 1290} {"train_loss": -5.727534770965576, "global_step": 54206, "epoch": 1290} {"train_loss": -5.78885555267334, "global_step": 54207, "epoch": 1290} {"train_loss": -5.621549129486084, "global_step": 54208, "epoch": 1290} {"train_loss": -5.819478988647461, "global_step": 54209, "epoch": 1290} {"train_loss": -5.676801681518555, "global_step": 54210, "epoch": 1290} {"train_loss": -5.7912211418151855, "global_step": 54211, "epoch": 1290} {"train_loss": -5.653700351715088, "global_step": 54212, "epoch": 1290} {"train_loss": -5.766356468200684, "global_step": 54213, "epoch": 1290} {"train_loss": -5.843219757080078, "global_step": 54214, "epoch": 1290} {"train_loss": -5.806529998779297, "global_step": 54215, "epoch": 1290} {"train_loss": -5.853006839752197, "global_step": 54216, "epoch": 1290} {"train_loss": -5.812894344329834, "global_step": 54217, "epoch": 1290} {"train_loss": -5.743605136871338, "global_step": 54218, "epoch": 1290} {"train_loss": -5.764520645141602, "global_step": 54219, "epoch": 1290} {"train_loss": -5.86767578125, "global_step": 54220, "epoch": 1290} {"train_loss": -5.771787541253226, "global_step": 54221, "epoch": 1290, "val_loss": 66556.453125} {"train_loss": -5.837588310241699, "global_step": 54222, "epoch": 1291} {"train_loss": -5.93500280380249, "global_step": 54223, "epoch": 1291} {"train_loss": -5.824251174926758, "global_step": 54224, "epoch": 1291} {"train_loss": -5.915561199188232, "global_step": 54225, "epoch": 1291} {"train_loss": -5.723700523376465, "global_step": 54226, "epoch": 1291} {"train_loss": -5.784882545471191, "global_step": 54227, "epoch": 1291} {"train_loss": -5.869121551513672, "global_step": 54228, "epoch": 1291} {"train_loss": -5.878602027893066, "global_step": 54229, "epoch": 1291} {"train_loss": -5.831573486328125, "global_step": 54230, "epoch": 1291} {"train_loss": -5.905840873718262, "global_step": 54231, "epoch": 1291} {"train_loss": -5.757165908813477, "global_step": 54232, "epoch": 1291} {"train_loss": -5.824056625366211, "global_step": 54233, "epoch": 1291} {"train_loss": -5.908685684204102, "global_step": 54234, "epoch": 1291} {"train_loss": -5.846692085266113, "global_step": 54235, "epoch": 1291} {"train_loss": -5.719241619110107, "global_step": 54236, "epoch": 1291} {"train_loss": -5.738459587097168, "global_step": 54237, "epoch": 1291} {"train_loss": -5.8247270584106445, "global_step": 54238, "epoch": 1291} {"train_loss": -5.781582355499268, "global_step": 54239, "epoch": 1291} {"train_loss": -5.823099136352539, "global_step": 54240, "epoch": 1291} {"train_loss": -5.7769975662231445, "global_step": 54241, "epoch": 1291} {"train_loss": -5.743295192718506, "global_step": 54242, "epoch": 1291} {"train_loss": -5.850315093994141, "global_step": 54243, "epoch": 1291} {"train_loss": -5.797104835510254, "global_step": 54244, "epoch": 1291} {"train_loss": -5.776079177856445, "global_step": 54245, "epoch": 1291} {"train_loss": -5.763113498687744, "global_step": 54246, "epoch": 1291} {"train_loss": -5.900810241699219, "global_step": 54247, "epoch": 1291} {"train_loss": -5.7045488357543945, "global_step": 54248, "epoch": 1291} {"train_loss": -5.852397918701172, "global_step": 54249, "epoch": 1291} {"train_loss": -5.679348945617676, "global_step": 54250, "epoch": 1291} {"train_loss": -5.751649856567383, "global_step": 54251, "epoch": 1291} {"train_loss": -5.679296493530273, "global_step": 54252, "epoch": 1291} {"train_loss": -5.7181549072265625, "global_step": 54253, "epoch": 1291} {"train_loss": -5.885828971862793, "global_step": 54254, "epoch": 1291} {"train_loss": -5.840813636779785, "global_step": 54255, "epoch": 1291} {"train_loss": -5.89439582824707, "global_step": 54256, "epoch": 1291} {"train_loss": -5.840928077697754, "global_step": 54257, "epoch": 1291} {"train_loss": -5.750594139099121, "global_step": 54258, "epoch": 1291} {"train_loss": -5.8517560958862305, "global_step": 54259, "epoch": 1291} {"train_loss": -5.9570112228393555, "global_step": 54260, "epoch": 1291} {"train_loss": -5.751769065856934, "global_step": 54261, "epoch": 1291} {"train_loss": -5.619190692901611, "global_step": 54262, "epoch": 1291} {"train_loss": -5.806926625115531, "global_step": 54263, "epoch": 1291, "val_loss": 66257.0078125} {"train_loss": -5.807059288024902, "global_step": 54264, "epoch": 1292} {"train_loss": -5.872677803039551, "global_step": 54265, "epoch": 1292} {"train_loss": -5.779384613037109, "global_step": 54266, "epoch": 1292} {"train_loss": -5.833749771118164, "global_step": 54267, "epoch": 1292} {"train_loss": -5.819553375244141, "global_step": 54268, "epoch": 1292} {"train_loss": -5.873144149780273, "global_step": 54269, "epoch": 1292} {"train_loss": -5.858770370483398, "global_step": 54270, "epoch": 1292} {"train_loss": -5.754241943359375, "global_step": 54271, "epoch": 1292} {"train_loss": -5.839953422546387, "global_step": 54272, "epoch": 1292} {"train_loss": -5.771458625793457, "global_step": 54273, "epoch": 1292} {"train_loss": -5.958912372589111, "global_step": 54274, "epoch": 1292} {"train_loss": -5.811348915100098, "global_step": 54275, "epoch": 1292} {"train_loss": -5.816038608551025, "global_step": 54276, "epoch": 1292} {"train_loss": -5.84139347076416, "global_step": 54277, "epoch": 1292} {"train_loss": -5.929072856903076, "global_step": 54278, "epoch": 1292} {"train_loss": -5.760437965393066, "global_step": 54279, "epoch": 1292} {"train_loss": -5.825520992279053, "global_step": 54280, "epoch": 1292} {"train_loss": -5.806342124938965, "global_step": 54281, "epoch": 1292} {"train_loss": -5.820580005645752, "global_step": 54282, "epoch": 1292} {"train_loss": -5.954244613647461, "global_step": 54283, "epoch": 1292} {"train_loss": -5.748040199279785, "global_step": 54284, "epoch": 1292} {"train_loss": -5.797570705413818, "global_step": 54285, "epoch": 1292} {"train_loss": -5.751497268676758, "global_step": 54286, "epoch": 1292} {"train_loss": -5.856768608093262, "global_step": 54287, "epoch": 1292} {"train_loss": -5.740543842315674, "global_step": 54288, "epoch": 1292} {"train_loss": -5.762155055999756, "global_step": 54289, "epoch": 1292} {"train_loss": -5.756834030151367, "global_step": 54290, "epoch": 1292} {"train_loss": -5.857318878173828, "global_step": 54291, "epoch": 1292} {"train_loss": -5.880997657775879, "global_step": 54292, "epoch": 1292} {"train_loss": -5.836699485778809, "global_step": 54293, "epoch": 1292} {"train_loss": -5.896546363830566, "global_step": 54294, "epoch": 1292} {"train_loss": -5.933119773864746, "global_step": 54295, "epoch": 1292} {"train_loss": -5.835567474365234, "global_step": 54296, "epoch": 1292} {"train_loss": -5.987987518310547, "global_step": 54297, "epoch": 1292} {"train_loss": -5.950463771820068, "global_step": 54298, "epoch": 1292} {"train_loss": -5.857039451599121, "global_step": 54299, "epoch": 1292} {"train_loss": -5.740042686462402, "global_step": 54300, "epoch": 1292} {"train_loss": -5.855477333068848, "global_step": 54301, "epoch": 1292} {"train_loss": -5.830536842346191, "global_step": 54302, "epoch": 1292} {"train_loss": -5.822648048400879, "global_step": 54303, "epoch": 1292} {"train_loss": -5.742196083068848, "global_step": 54304, "epoch": 1292} {"train_loss": -5.830619244348435, "global_step": 54305, "epoch": 1292, "val_loss": 66405.296875} {"train_loss": -5.683645248413086, "global_step": 54306, "epoch": 1293} {"train_loss": -5.816617965698242, "global_step": 54307, "epoch": 1293} {"train_loss": -5.848607063293457, "global_step": 54308, "epoch": 1293} {"train_loss": -5.9284210205078125, "global_step": 54309, "epoch": 1293} {"train_loss": -5.862338066101074, "global_step": 54310, "epoch": 1293} {"train_loss": -5.911620140075684, "global_step": 54311, "epoch": 1293} {"train_loss": -5.809759616851807, "global_step": 54312, "epoch": 1293} {"train_loss": -5.927000522613525, "global_step": 54313, "epoch": 1293} {"train_loss": -5.9221601486206055, "global_step": 54314, "epoch": 1293} {"train_loss": -5.817899703979492, "global_step": 54315, "epoch": 1293} {"train_loss": -5.892743110656738, "global_step": 54316, "epoch": 1293} {"train_loss": -5.9474287033081055, "global_step": 54317, "epoch": 1293} {"train_loss": -5.889463424682617, "global_step": 54318, "epoch": 1293} {"train_loss": -5.813352584838867, "global_step": 54319, "epoch": 1293} {"train_loss": -5.853279113769531, "global_step": 54320, "epoch": 1293} {"train_loss": -5.698156356811523, "global_step": 54321, "epoch": 1293} {"train_loss": -5.654308319091797, "global_step": 54322, "epoch": 1293} {"train_loss": -5.883654594421387, "global_step": 54323, "epoch": 1293} {"train_loss": -5.787078857421875, "global_step": 54324, "epoch": 1293} {"train_loss": -5.687222480773926, "global_step": 54325, "epoch": 1293} {"train_loss": -5.693516731262207, "global_step": 54326, "epoch": 1293} {"train_loss": -5.781558036804199, "global_step": 54327, "epoch": 1293} {"train_loss": -5.749642372131348, "global_step": 54328, "epoch": 1293} {"train_loss": -5.72142219543457, "global_step": 54329, "epoch": 1293} {"train_loss": -5.701817989349365, "global_step": 54330, "epoch": 1293} {"train_loss": -5.831564426422119, "global_step": 54331, "epoch": 1293} {"train_loss": -5.788652420043945, "global_step": 54332, "epoch": 1293} {"train_loss": -5.749856948852539, "global_step": 54333, "epoch": 1293} {"train_loss": -5.783597946166992, "global_step": 54334, "epoch": 1293} {"train_loss": -5.789539813995361, "global_step": 54335, "epoch": 1293} {"train_loss": -5.833592414855957, "global_step": 54336, "epoch": 1293} {"train_loss": -5.712223529815674, "global_step": 54337, "epoch": 1293} {"train_loss": -5.702045440673828, "global_step": 54338, "epoch": 1293} {"train_loss": -5.962180137634277, "global_step": 54339, "epoch": 1293} {"train_loss": -5.825542449951172, "global_step": 54340, "epoch": 1293} {"train_loss": -5.724735260009766, "global_step": 54341, "epoch": 1293} {"train_loss": -5.890483379364014, "global_step": 54342, "epoch": 1293} {"train_loss": -5.863103866577148, "global_step": 54343, "epoch": 1293} {"train_loss": -5.847553253173828, "global_step": 54344, "epoch": 1293} {"train_loss": -5.900140762329102, "global_step": 54345, "epoch": 1293} {"train_loss": -5.780879020690918, "global_step": 54346, "epoch": 1293} {"train_loss": -5.811784187952678, "global_step": 54347, "epoch": 1293, "val_loss": 66457.703125} {"train_loss": -5.862514019012451, "global_step": 54348, "epoch": 1294} {"train_loss": -5.778059482574463, "global_step": 54349, "epoch": 1294} {"train_loss": -5.965984344482422, "global_step": 54350, "epoch": 1294} {"train_loss": -5.8094000816345215, "global_step": 54351, "epoch": 1294} {"train_loss": -5.904721260070801, "global_step": 54352, "epoch": 1294} {"train_loss": -5.729626178741455, "global_step": 54353, "epoch": 1294} {"train_loss": -5.8452301025390625, "global_step": 54354, "epoch": 1294} {"train_loss": -5.890151023864746, "global_step": 54355, "epoch": 1294} {"train_loss": -5.881589889526367, "global_step": 54356, "epoch": 1294} {"train_loss": -5.83993673324585, "global_step": 54357, "epoch": 1294} {"train_loss": -5.890575408935547, "global_step": 54358, "epoch": 1294} {"train_loss": -5.793446063995361, "global_step": 54359, "epoch": 1294} {"train_loss": -5.835205554962158, "global_step": 54360, "epoch": 1294} {"train_loss": -5.697873592376709, "global_step": 54361, "epoch": 1294} {"train_loss": -5.883852005004883, "global_step": 54362, "epoch": 1294} {"train_loss": -5.837292671203613, "global_step": 54363, "epoch": 1294} {"train_loss": -5.900599479675293, "global_step": 54364, "epoch": 1294} {"train_loss": -5.8361711502075195, "global_step": 54365, "epoch": 1294} {"train_loss": -5.817732810974121, "global_step": 54366, "epoch": 1294} {"train_loss": -5.962215900421143, "global_step": 54367, "epoch": 1294} {"train_loss": -5.888335227966309, "global_step": 54368, "epoch": 1294} {"train_loss": -5.69312858581543, "global_step": 54369, "epoch": 1294} {"train_loss": -5.82004976272583, "global_step": 54370, "epoch": 1294} {"train_loss": -5.790871620178223, "global_step": 54371, "epoch": 1294} {"train_loss": -5.8124213218688965, "global_step": 54372, "epoch": 1294} {"train_loss": -5.916258335113525, "global_step": 54373, "epoch": 1294} {"train_loss": -5.80362606048584, "global_step": 54374, "epoch": 1294} {"train_loss": -5.749408721923828, "global_step": 54375, "epoch": 1294} {"train_loss": -5.742251396179199, "global_step": 54376, "epoch": 1294} {"train_loss": -5.8081793785095215, "global_step": 54377, "epoch": 1294} {"train_loss": -5.513514518737793, "global_step": 54378, "epoch": 1294} {"train_loss": -5.796361923217773, "global_step": 54379, "epoch": 1294} {"train_loss": -5.748532295227051, "global_step": 54380, "epoch": 1294} {"train_loss": -5.629612445831299, "global_step": 54381, "epoch": 1294} {"train_loss": -5.768655776977539, "global_step": 54382, "epoch": 1294} {"train_loss": -5.903318405151367, "global_step": 54383, "epoch": 1294} {"train_loss": -5.836633682250977, "global_step": 54384, "epoch": 1294} {"train_loss": -5.806759834289551, "global_step": 54385, "epoch": 1294} {"train_loss": -5.838770866394043, "global_step": 54386, "epoch": 1294} {"train_loss": -5.846161842346191, "global_step": 54387, "epoch": 1294} {"train_loss": -5.769169807434082, "global_step": 54388, "epoch": 1294} {"train_loss": -5.8166190556117465, "global_step": 54389, "epoch": 1294, "val_loss": 66341.0703125} {"train_loss": -5.8069539070129395, "global_step": 54390, "epoch": 1295} {"train_loss": -5.697844505310059, "global_step": 54391, "epoch": 1295} {"train_loss": -5.887921333312988, "global_step": 54392, "epoch": 1295} {"train_loss": -5.732499122619629, "global_step": 54393, "epoch": 1295} {"train_loss": -5.913131237030029, "global_step": 54394, "epoch": 1295} {"train_loss": -5.828979015350342, "global_step": 54395, "epoch": 1295} {"train_loss": -5.8485307693481445, "global_step": 54396, "epoch": 1295} {"train_loss": -5.734241008758545, "global_step": 54397, "epoch": 1295} {"train_loss": -5.8682074546813965, "global_step": 54398, "epoch": 1295} {"train_loss": -5.819667816162109, "global_step": 54399, "epoch": 1295} {"train_loss": -5.850214958190918, "global_step": 54400, "epoch": 1295} {"train_loss": -5.755366325378418, "global_step": 54401, "epoch": 1295} {"train_loss": -5.866951942443848, "global_step": 54402, "epoch": 1295} {"train_loss": -5.836304187774658, "global_step": 54403, "epoch": 1295} {"train_loss": -5.978155136108398, "global_step": 54404, "epoch": 1295} {"train_loss": -5.834024429321289, "global_step": 54405, "epoch": 1295} {"train_loss": -5.811327934265137, "global_step": 54406, "epoch": 1295} {"train_loss": -5.863670349121094, "global_step": 54407, "epoch": 1295} {"train_loss": -5.732738494873047, "global_step": 54408, "epoch": 1295} {"train_loss": -5.747465133666992, "global_step": 54409, "epoch": 1295} {"train_loss": -5.948929309844971, "global_step": 54410, "epoch": 1295} {"train_loss": -5.854646682739258, "global_step": 54411, "epoch": 1295} {"train_loss": -5.905730247497559, "global_step": 54412, "epoch": 1295} {"train_loss": -5.8564276695251465, "global_step": 54413, "epoch": 1295} {"train_loss": -5.737399101257324, "global_step": 54414, "epoch": 1295} {"train_loss": -5.680570125579834, "global_step": 54415, "epoch": 1295} {"train_loss": -5.739524841308594, "global_step": 54416, "epoch": 1295} {"train_loss": -5.784144878387451, "global_step": 54417, "epoch": 1295} {"train_loss": -5.72808837890625, "global_step": 54418, "epoch": 1295} {"train_loss": -5.757596492767334, "global_step": 54419, "epoch": 1295} {"train_loss": -5.69366979598999, "global_step": 54420, "epoch": 1295} {"train_loss": -5.7489824295043945, "global_step": 54421, "epoch": 1295} {"train_loss": -5.763338565826416, "global_step": 54422, "epoch": 1295} {"train_loss": -5.735492706298828, "global_step": 54423, "epoch": 1295} {"train_loss": -5.682124614715576, "global_step": 54424, "epoch": 1295} {"train_loss": -5.762121200561523, "global_step": 54425, "epoch": 1295} {"train_loss": -5.831915855407715, "global_step": 54426, "epoch": 1295} {"train_loss": -5.764780044555664, "global_step": 54427, "epoch": 1295} {"train_loss": -5.76992130279541, "global_step": 54428, "epoch": 1295} {"train_loss": -5.750044822692871, "global_step": 54429, "epoch": 1295} {"train_loss": -5.773521423339844, "global_step": 54430, "epoch": 1295} {"train_loss": -5.796729053769793, "global_step": 54431, "epoch": 1295, "val_loss": 66594.78125} {"train_loss": -5.765206813812256, "global_step": 54432, "epoch": 1296} {"train_loss": -5.770591735839844, "global_step": 54433, "epoch": 1296} {"train_loss": -5.773843765258789, "global_step": 54434, "epoch": 1296} {"train_loss": -5.846738815307617, "global_step": 54435, "epoch": 1296} {"train_loss": -5.695025444030762, "global_step": 54436, "epoch": 1296} {"train_loss": -5.775093078613281, "global_step": 54437, "epoch": 1296} {"train_loss": -5.748601913452148, "global_step": 54438, "epoch": 1296} {"train_loss": -5.821510314941406, "global_step": 54439, "epoch": 1296} {"train_loss": -5.785667419433594, "global_step": 54440, "epoch": 1296} {"train_loss": -5.729432582855225, "global_step": 54441, "epoch": 1296} {"train_loss": -5.782334327697754, "global_step": 54442, "epoch": 1296} {"train_loss": -5.69381046295166, "global_step": 54443, "epoch": 1296} {"train_loss": -5.804450035095215, "global_step": 54444, "epoch": 1296} {"train_loss": -5.799257278442383, "global_step": 54445, "epoch": 1296} {"train_loss": -5.7228803634643555, "global_step": 54446, "epoch": 1296} {"train_loss": -5.7935285568237305, "global_step": 54447, "epoch": 1296} {"train_loss": -5.845613479614258, "global_step": 54448, "epoch": 1296} {"train_loss": -5.813126564025879, "global_step": 54449, "epoch": 1296} {"train_loss": -5.731452941894531, "global_step": 54450, "epoch": 1296} {"train_loss": -5.858371734619141, "global_step": 54451, "epoch": 1296} {"train_loss": -5.784152984619141, "global_step": 54452, "epoch": 1296} {"train_loss": -5.724035263061523, "global_step": 54453, "epoch": 1296} {"train_loss": -5.647602558135986, "global_step": 54454, "epoch": 1296} {"train_loss": -5.814188003540039, "global_step": 54455, "epoch": 1296} {"train_loss": -5.665799617767334, "global_step": 54456, "epoch": 1296} {"train_loss": -5.878874778747559, "global_step": 54457, "epoch": 1296} {"train_loss": -5.673189163208008, "global_step": 54458, "epoch": 1296} {"train_loss": -5.848970413208008, "global_step": 54459, "epoch": 1296} {"train_loss": -5.801180839538574, "global_step": 54460, "epoch": 1296} {"train_loss": -5.71789026260376, "global_step": 54461, "epoch": 1296} {"train_loss": -5.862730503082275, "global_step": 54462, "epoch": 1296} {"train_loss": -5.772882461547852, "global_step": 54463, "epoch": 1296} {"train_loss": -5.7439470291137695, "global_step": 54464, "epoch": 1296} {"train_loss": -5.863996505737305, "global_step": 54465, "epoch": 1296} {"train_loss": -5.815488815307617, "global_step": 54466, "epoch": 1296} {"train_loss": -5.9014081954956055, "global_step": 54467, "epoch": 1296} {"train_loss": -5.754691123962402, "global_step": 54468, "epoch": 1296} {"train_loss": -5.820191383361816, "global_step": 54469, "epoch": 1296} {"train_loss": -5.764124870300293, "global_step": 54470, "epoch": 1296} {"train_loss": -5.847528457641602, "global_step": 54471, "epoch": 1296} {"train_loss": -5.8914971351623535, "global_step": 54472, "epoch": 1296} {"train_loss": -5.78213045710609, "global_step": 54473, "epoch": 1296, "val_loss": 66655.640625} {"train_loss": -5.845435619354248, "global_step": 54474, "epoch": 1297} {"train_loss": -5.83394718170166, "global_step": 54475, "epoch": 1297} {"train_loss": -5.822713851928711, "global_step": 54476, "epoch": 1297} {"train_loss": -5.833809852600098, "global_step": 54477, "epoch": 1297} {"train_loss": -5.834456443786621, "global_step": 54478, "epoch": 1297} {"train_loss": -5.729422569274902, "global_step": 54479, "epoch": 1297} {"train_loss": -5.801578521728516, "global_step": 54480, "epoch": 1297} {"train_loss": -5.840457439422607, "global_step": 54481, "epoch": 1297} {"train_loss": -5.754693031311035, "global_step": 54482, "epoch": 1297} {"train_loss": -5.797489166259766, "global_step": 54483, "epoch": 1297} {"train_loss": -5.761609077453613, "global_step": 54484, "epoch": 1297} {"train_loss": -5.853945255279541, "global_step": 54485, "epoch": 1297} {"train_loss": -5.871460437774658, "global_step": 54486, "epoch": 1297} {"train_loss": -5.780294418334961, "global_step": 54487, "epoch": 1297} {"train_loss": -5.714393138885498, "global_step": 54488, "epoch": 1297} {"train_loss": -5.861658096313477, "global_step": 54489, "epoch": 1297} {"train_loss": -5.693667411804199, "global_step": 54490, "epoch": 1297} {"train_loss": -5.7329301834106445, "global_step": 54491, "epoch": 1297} {"train_loss": -5.879524230957031, "global_step": 54492, "epoch": 1297} {"train_loss": -5.7526774406433105, "global_step": 54493, "epoch": 1297} {"train_loss": -5.82218599319458, "global_step": 54494, "epoch": 1297} {"train_loss": -5.7734832763671875, "global_step": 54495, "epoch": 1297} {"train_loss": -5.743537902832031, "global_step": 54496, "epoch": 1297} {"train_loss": -5.815690040588379, "global_step": 54497, "epoch": 1297} {"train_loss": -5.765488147735596, "global_step": 54498, "epoch": 1297} {"train_loss": -5.908455848693848, "global_step": 54499, "epoch": 1297} {"train_loss": -6.0117082595825195, "global_step": 54500, "epoch": 1297} {"train_loss": -5.845348358154297, "global_step": 54501, "epoch": 1297} {"train_loss": -5.663463115692139, "global_step": 54502, "epoch": 1297} {"train_loss": -5.809112548828125, "global_step": 54503, "epoch": 1297} {"train_loss": -5.8025922775268555, "global_step": 54504, "epoch": 1297} {"train_loss": -5.899044990539551, "global_step": 54505, "epoch": 1297} {"train_loss": -5.843724727630615, "global_step": 54506, "epoch": 1297} {"train_loss": -5.638314247131348, "global_step": 54507, "epoch": 1297} {"train_loss": -5.734033584594727, "global_step": 54508, "epoch": 1297} {"train_loss": -5.842840194702148, "global_step": 54509, "epoch": 1297} {"train_loss": -5.875870704650879, "global_step": 54510, "epoch": 1297} {"train_loss": -5.886843204498291, "global_step": 54511, "epoch": 1297} {"train_loss": -5.894898891448975, "global_step": 54512, "epoch": 1297} {"train_loss": -5.760651588439941, "global_step": 54513, "epoch": 1297} {"train_loss": -5.729212284088135, "global_step": 54514, "epoch": 1297} {"train_loss": -5.807632979892549, "global_step": 54515, "epoch": 1297, "val_loss": 66473.5546875} {"train_loss": -5.886559009552002, "global_step": 54516, "epoch": 1298} {"train_loss": -5.744104385375977, "global_step": 54517, "epoch": 1298} {"train_loss": -5.845500946044922, "global_step": 54518, "epoch": 1298} {"train_loss": -5.72993803024292, "global_step": 54519, "epoch": 1298} {"train_loss": -5.7939581871032715, "global_step": 54520, "epoch": 1298} {"train_loss": -5.869611740112305, "global_step": 54521, "epoch": 1298} {"train_loss": -5.926344871520996, "global_step": 54522, "epoch": 1298} {"train_loss": -5.755319595336914, "global_step": 54523, "epoch": 1298} {"train_loss": -5.87762451171875, "global_step": 54524, "epoch": 1298} {"train_loss": -5.884278297424316, "global_step": 54525, "epoch": 1298} {"train_loss": -5.87291145324707, "global_step": 54526, "epoch": 1298} {"train_loss": -5.882145881652832, "global_step": 54527, "epoch": 1298} {"train_loss": -5.8433518409729, "global_step": 54528, "epoch": 1298} {"train_loss": -5.84205436706543, "global_step": 54529, "epoch": 1298} {"train_loss": -5.851585388183594, "global_step": 54530, "epoch": 1298} {"train_loss": -5.784660339355469, "global_step": 54531, "epoch": 1298} {"train_loss": -5.784183502197266, "global_step": 54532, "epoch": 1298} {"train_loss": -5.863768100738525, "global_step": 54533, "epoch": 1298} {"train_loss": -5.868590354919434, "global_step": 54534, "epoch": 1298} {"train_loss": -5.939976692199707, "global_step": 54535, "epoch": 1298} {"train_loss": -5.672542572021484, "global_step": 54536, "epoch": 1298} {"train_loss": -5.7314348220825195, "global_step": 54537, "epoch": 1298} {"train_loss": -5.830101013183594, "global_step": 54538, "epoch": 1298} {"train_loss": -5.735614776611328, "global_step": 54539, "epoch": 1298} {"train_loss": -5.84908390045166, "global_step": 54540, "epoch": 1298} {"train_loss": -5.717075347900391, "global_step": 54541, "epoch": 1298} {"train_loss": -5.865829944610596, "global_step": 54542, "epoch": 1298} {"train_loss": -5.887901306152344, "global_step": 54543, "epoch": 1298} {"train_loss": -5.784209251403809, "global_step": 54544, "epoch": 1298} {"train_loss": -5.88814115524292, "global_step": 54545, "epoch": 1298} {"train_loss": -5.911260604858398, "global_step": 54546, "epoch": 1298} {"train_loss": -5.92575740814209, "global_step": 54547, "epoch": 1298} {"train_loss": -5.803914546966553, "global_step": 54548, "epoch": 1298} {"train_loss": -5.713522911071777, "global_step": 54549, "epoch": 1298} {"train_loss": -5.988668441772461, "global_step": 54550, "epoch": 1298} {"train_loss": -5.8972368240356445, "global_step": 54551, "epoch": 1298} {"train_loss": -5.873357772827148, "global_step": 54552, "epoch": 1298} {"train_loss": -5.777399063110352, "global_step": 54553, "epoch": 1298} {"train_loss": -5.870114326477051, "global_step": 54554, "epoch": 1298} {"train_loss": -5.80845308303833, "global_step": 54555, "epoch": 1298} {"train_loss": -5.867961406707764, "global_step": 54556, "epoch": 1298} {"train_loss": -5.835179703576224, "global_step": 54557, "epoch": 1298, "val_loss": 66357.046875} {"train_loss": -5.953367710113525, "global_step": 54558, "epoch": 1299} {"train_loss": -5.91370153427124, "global_step": 54559, "epoch": 1299} {"train_loss": -5.830955505371094, "global_step": 54560, "epoch": 1299} {"train_loss": -5.738359451293945, "global_step": 54561, "epoch": 1299} {"train_loss": -5.857786178588867, "global_step": 54562, "epoch": 1299} {"train_loss": -5.848923683166504, "global_step": 54563, "epoch": 1299} {"train_loss": -5.69212532043457, "global_step": 54564, "epoch": 1299} {"train_loss": -5.867001533508301, "global_step": 54565, "epoch": 1299} {"train_loss": -5.875735759735107, "global_step": 54566, "epoch": 1299} {"train_loss": -5.8607401847839355, "global_step": 54567, "epoch": 1299} {"train_loss": -5.789626121520996, "global_step": 54568, "epoch": 1299} {"train_loss": -5.831443786621094, "global_step": 54569, "epoch": 1299} {"train_loss": -5.881231307983398, "global_step": 54570, "epoch": 1299} {"train_loss": -5.81980037689209, "global_step": 54571, "epoch": 1299} {"train_loss": -5.7778120040893555, "global_step": 54572, "epoch": 1299} {"train_loss": -5.769765853881836, "global_step": 54573, "epoch": 1299} {"train_loss": -5.791179656982422, "global_step": 54574, "epoch": 1299} {"train_loss": -5.687345027923584, "global_step": 54575, "epoch": 1299} {"train_loss": -5.692869186401367, "global_step": 54576, "epoch": 1299} {"train_loss": -5.685774803161621, "global_step": 54577, "epoch": 1299} {"train_loss": -5.70318603515625, "global_step": 54578, "epoch": 1299} {"train_loss": -5.7781219482421875, "global_step": 54579, "epoch": 1299} {"train_loss": -5.818366050720215, "global_step": 54580, "epoch": 1299} {"train_loss": -5.869809150695801, "global_step": 54581, "epoch": 1299} {"train_loss": -5.7497358322143555, "global_step": 54582, "epoch": 1299} {"train_loss": -5.908586502075195, "global_step": 54583, "epoch": 1299} {"train_loss": -5.7216796875, "global_step": 54584, "epoch": 1299} {"train_loss": -5.896762847900391, "global_step": 54585, "epoch": 1299} {"train_loss": -5.856660842895508, "global_step": 54586, "epoch": 1299} {"train_loss": -5.846467018127441, "global_step": 54587, "epoch": 1299} {"train_loss": -5.774360179901123, "global_step": 54588, "epoch": 1299} {"train_loss": -5.706820487976074, "global_step": 54589, "epoch": 1299} {"train_loss": -5.868928909301758, "global_step": 54590, "epoch": 1299} {"train_loss": -5.701776027679443, "global_step": 54591, "epoch": 1299} {"train_loss": -5.850070953369141, "global_step": 54592, "epoch": 1299} {"train_loss": -5.719851016998291, "global_step": 54593, "epoch": 1299} {"train_loss": -5.618398189544678, "global_step": 54594, "epoch": 1299} {"train_loss": -5.683448791503906, "global_step": 54595, "epoch": 1299} {"train_loss": -5.792966842651367, "global_step": 54596, "epoch": 1299} {"train_loss": -5.804757118225098, "global_step": 54597, "epoch": 1299} {"train_loss": -5.775749206542969, "global_step": 54598, "epoch": 1299} {"train_loss": -5.796904053006854, "global_step": 54599, "epoch": 1299, "val_loss": 66293.03125} {"train_loss": -5.900486946105957, "global_step": 54600, "epoch": 1300} {"train_loss": -5.7260847091674805, "global_step": 54601, "epoch": 1300} {"train_loss": -5.706789016723633, "global_step": 54602, "epoch": 1300} {"train_loss": -5.8252363204956055, "global_step": 54603, "epoch": 1300} {"train_loss": -5.819576263427734, "global_step": 54604, "epoch": 1300} {"train_loss": -5.806419372558594, "global_step": 54605, "epoch": 1300} {"train_loss": -5.83985710144043, "global_step": 54606, "epoch": 1300} {"train_loss": -5.718116283416748, "global_step": 54607, "epoch": 1300} {"train_loss": -5.733059406280518, "global_step": 54608, "epoch": 1300} {"train_loss": -5.781263828277588, "global_step": 54609, "epoch": 1300} {"train_loss": -5.8230133056640625, "global_step": 54610, "epoch": 1300} {"train_loss": -5.825984001159668, "global_step": 54611, "epoch": 1300} {"train_loss": -5.839869499206543, "global_step": 54612, "epoch": 1300} {"train_loss": -5.864356517791748, "global_step": 54613, "epoch": 1300} {"train_loss": -5.674023628234863, "global_step": 54614, "epoch": 1300} {"train_loss": -5.715400695800781, "global_step": 54615, "epoch": 1300} {"train_loss": -5.702507019042969, "global_step": 54616, "epoch": 1300} {"train_loss": -5.769199848175049, "global_step": 54617, "epoch": 1300} {"train_loss": -5.708469390869141, "global_step": 54618, "epoch": 1300} {"train_loss": -5.689267158508301, "global_step": 54619, "epoch": 1300} {"train_loss": -5.719143867492676, "global_step": 54620, "epoch": 1300} {"train_loss": -5.79461145401001, "global_step": 54621, "epoch": 1300} {"train_loss": -5.808291435241699, "global_step": 54622, "epoch": 1300} {"train_loss": -5.772343635559082, "global_step": 54623, "epoch": 1300} {"train_loss": -5.790923595428467, "global_step": 54624, "epoch": 1300} {"train_loss": -5.698890686035156, "global_step": 54625, "epoch": 1300} {"train_loss": -5.751287460327148, "global_step": 54626, "epoch": 1300} {"train_loss": -5.751178741455078, "global_step": 54627, "epoch": 1300} {"train_loss": -5.771858215332031, "global_step": 54628, "epoch": 1300} {"train_loss": -5.803340435028076, "global_step": 54629, "epoch": 1300} {"train_loss": -5.734758377075195, "global_step": 54630, "epoch": 1300} {"train_loss": -5.91999626159668, "global_step": 54631, "epoch": 1300} {"train_loss": -5.838451385498047, "global_step": 54632, "epoch": 1300} {"train_loss": -5.772731781005859, "global_step": 54633, "epoch": 1300} {"train_loss": -5.977487564086914, "global_step": 54634, "epoch": 1300} {"train_loss": -5.6366119384765625, "global_step": 54635, "epoch": 1300} {"train_loss": -5.917852878570557, "global_step": 54636, "epoch": 1300} {"train_loss": -5.8249664306640625, "global_step": 54637, "epoch": 1300} {"train_loss": -5.786693572998047, "global_step": 54638, "epoch": 1300} {"train_loss": -5.904277324676514, "global_step": 54639, "epoch": 1300} {"train_loss": -5.86212158203125, "global_step": 54640, "epoch": 1300} {"train_loss": -5.791246925081525, "global_step": 54641, "epoch": 1300, "train/sim_max_reward_0": 0.3819704959517275, "train/sim_max_reward_1": 0.22004906792940132, "train/sim_max_reward_2": 0.6413728842648599, "train/sim_max_reward_3": 0.18950320843564428, "train/sim_max_reward_4": 0.9428080554044472, "train/sim_max_reward_5": 0.7627780450956505, "test/sim_max_reward_4400000": 0.15935501084239245, "test/sim_max_reward_4400001": 0.8874526066046129, "test/sim_max_reward_4400002": 0.057520970251672215, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.8723474721364216, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.538909855200621, "test/sim_max_reward_4400009": 0.6476574659189634, "test/sim_max_reward_4400010": 0.29823635165994944, "test/sim_max_reward_4400011": 0.2063996937764392, "test/sim_max_reward_4400012": 0.3506543141207661, "test/sim_max_reward_4400013": 0.396581093376987, "test/sim_max_reward_4400014": 0.4899211739179225, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.548656551430462, "test/sim_max_reward_4400020": 0.00027499252908961397, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.12214325624096874, "test/sim_max_reward_4400023": 0.7085884279356149, "test/sim_max_reward_4400024": 0.6879155153021493, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.09286633500566098, "test/sim_max_reward_4400027": 0.0882731059380678, "test/sim_max_reward_4400028": 0.5947007558428915, "test/sim_max_reward_4400029": 0.023137656058976722, "test/sim_max_reward_4400030": 0.9069137048219845, "test/sim_max_reward_4400031": 0.6626757881994724, "test/sim_max_reward_4400032": 0.11750513477872492, "test/sim_max_reward_4400033": 0.2128349494234291, "test/sim_max_reward_4400034": 0.7611720274836772, "test/sim_max_reward_4400035": 0.4547392526277077, "test/sim_max_reward_4400036": 0.3873980497090425, "test/sim_max_reward_4400037": 0.5477245278893905, "test/sim_max_reward_4400038": 0.13347334577058806, "test/sim_max_reward_4400039": 0.9883108490372916, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7129112115717905, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.6226273689778798, "test/sim_max_reward_4400044": 0.8206967929888571, "test/sim_max_reward_4400045": 0.8847741445873286, "test/sim_max_reward_4400046": 0.7733173437382007, "test/sim_max_reward_4400047": 0.2665990907261167, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.210782177362961, "train/mean_score": 0.5230802928469552, "test/mean_score": 0.36150263561361645, "val_loss": 66264.46875} {"train_loss": -5.7469892501831055, "global_step": 54642, "epoch": 1301} {"train_loss": -5.814713478088379, "global_step": 54643, "epoch": 1301} {"train_loss": -5.924589157104492, "global_step": 54644, "epoch": 1301} {"train_loss": -5.840348243713379, "global_step": 54645, "epoch": 1301} {"train_loss": -5.799962043762207, "global_step": 54646, "epoch": 1301} {"train_loss": -5.6936750411987305, "global_step": 54647, "epoch": 1301} {"train_loss": -5.813418388366699, "global_step": 54648, "epoch": 1301} {"train_loss": -5.8899149894714355, "global_step": 54649, "epoch": 1301} {"train_loss": -5.871694564819336, "global_step": 54650, "epoch": 1301} {"train_loss": -5.748411178588867, "global_step": 54651, "epoch": 1301} {"train_loss": -5.901582717895508, "global_step": 54652, "epoch": 1301} {"train_loss": -5.985768795013428, "global_step": 54653, "epoch": 1301} {"train_loss": -5.852948188781738, "global_step": 54654, "epoch": 1301} {"train_loss": -5.7066850662231445, "global_step": 54655, "epoch": 1301} {"train_loss": -5.7035441398620605, "global_step": 54656, "epoch": 1301} {"train_loss": -5.884237289428711, "global_step": 54657, "epoch": 1301} {"train_loss": -5.911391258239746, "global_step": 54658, "epoch": 1301} {"train_loss": -5.749739170074463, "global_step": 54659, "epoch": 1301} {"train_loss": -5.838367938995361, "global_step": 54660, "epoch": 1301} {"train_loss": -5.863255500793457, "global_step": 54661, "epoch": 1301} {"train_loss": -5.811156272888184, "global_step": 54662, "epoch": 1301} {"train_loss": -5.738462448120117, "global_step": 54663, "epoch": 1301} {"train_loss": -5.799049377441406, "global_step": 54664, "epoch": 1301} {"train_loss": -5.70997953414917, "global_step": 54665, "epoch": 1301} {"train_loss": -5.796273231506348, "global_step": 54666, "epoch": 1301} {"train_loss": -5.717274188995361, "global_step": 54667, "epoch": 1301} {"train_loss": -5.9712653160095215, "global_step": 54668, "epoch": 1301} {"train_loss": -5.754142761230469, "global_step": 54669, "epoch": 1301} {"train_loss": -5.906525611877441, "global_step": 54670, "epoch": 1301} {"train_loss": -5.756954669952393, "global_step": 54671, "epoch": 1301} {"train_loss": -5.75058650970459, "global_step": 54672, "epoch": 1301} {"train_loss": -5.927517890930176, "global_step": 54673, "epoch": 1301} {"train_loss": -5.749944686889648, "global_step": 54674, "epoch": 1301} {"train_loss": -5.858009338378906, "global_step": 54675, "epoch": 1301} {"train_loss": -5.841680526733398, "global_step": 54676, "epoch": 1301} {"train_loss": -5.851669788360596, "global_step": 54677, "epoch": 1301} {"train_loss": -5.77090311050415, "global_step": 54678, "epoch": 1301} {"train_loss": -5.865243911743164, "global_step": 54679, "epoch": 1301} {"train_loss": -5.780210494995117, "global_step": 54680, "epoch": 1301} {"train_loss": -5.8290605545043945, "global_step": 54681, "epoch": 1301} {"train_loss": -5.8744611740112305, "global_step": 54682, "epoch": 1301} {"train_loss": -5.816024837039766, "global_step": 54683, "epoch": 1301, "val_loss": 66518.78125} {"train_loss": -5.885543346405029, "global_step": 54684, "epoch": 1302} {"train_loss": -5.873176574707031, "global_step": 54685, "epoch": 1302} {"train_loss": -5.7862982749938965, "global_step": 54686, "epoch": 1302} {"train_loss": -5.847705841064453, "global_step": 54687, "epoch": 1302} {"train_loss": -5.882896423339844, "global_step": 54688, "epoch": 1302} {"train_loss": -5.861452579498291, "global_step": 54689, "epoch": 1302} {"train_loss": -5.8041486740112305, "global_step": 54690, "epoch": 1302} {"train_loss": -5.953600883483887, "global_step": 54691, "epoch": 1302} {"train_loss": -5.804071426391602, "global_step": 54692, "epoch": 1302} {"train_loss": -5.695821285247803, "global_step": 54693, "epoch": 1302} {"train_loss": -5.768989086151123, "global_step": 54694, "epoch": 1302} {"train_loss": -5.77544641494751, "global_step": 54695, "epoch": 1302} {"train_loss": -5.676264762878418, "global_step": 54696, "epoch": 1302} {"train_loss": -5.85187292098999, "global_step": 54697, "epoch": 1302} {"train_loss": -5.743625640869141, "global_step": 54698, "epoch": 1302} {"train_loss": -5.800173759460449, "global_step": 54699, "epoch": 1302} {"train_loss": -5.894718170166016, "global_step": 54700, "epoch": 1302} {"train_loss": -5.821444511413574, "global_step": 54701, "epoch": 1302} {"train_loss": -5.801000595092773, "global_step": 54702, "epoch": 1302} {"train_loss": -5.7368950843811035, "global_step": 54703, "epoch": 1302} {"train_loss": -5.860732078552246, "global_step": 54704, "epoch": 1302} {"train_loss": -5.898537635803223, "global_step": 54705, "epoch": 1302} {"train_loss": -5.763749122619629, "global_step": 54706, "epoch": 1302} {"train_loss": -5.839259147644043, "global_step": 54707, "epoch": 1302} {"train_loss": -5.829066276550293, "global_step": 54708, "epoch": 1302} {"train_loss": -5.869684219360352, "global_step": 54709, "epoch": 1302} {"train_loss": -5.955488204956055, "global_step": 54710, "epoch": 1302} {"train_loss": -5.788304328918457, "global_step": 54711, "epoch": 1302} {"train_loss": -5.97519063949585, "global_step": 54712, "epoch": 1302} {"train_loss": -5.81210470199585, "global_step": 54713, "epoch": 1302} {"train_loss": -5.844743728637695, "global_step": 54714, "epoch": 1302} {"train_loss": -5.847840309143066, "global_step": 54715, "epoch": 1302} {"train_loss": -5.788811683654785, "global_step": 54716, "epoch": 1302} {"train_loss": -5.866117477416992, "global_step": 54717, "epoch": 1302} {"train_loss": -5.817046165466309, "global_step": 54718, "epoch": 1302} {"train_loss": -5.727291107177734, "global_step": 54719, "epoch": 1302} {"train_loss": -5.915750026702881, "global_step": 54720, "epoch": 1302} {"train_loss": -5.864833831787109, "global_step": 54721, "epoch": 1302} {"train_loss": -5.755715370178223, "global_step": 54722, "epoch": 1302} {"train_loss": -5.803274154663086, "global_step": 54723, "epoch": 1302} {"train_loss": -5.890470504760742, "global_step": 54724, "epoch": 1302} {"train_loss": -5.830268246786935, "global_step": 54725, "epoch": 1302, "val_loss": 66190.3125} {"train_loss": -5.760299205780029, "global_step": 54726, "epoch": 1303} {"train_loss": -5.7066497802734375, "global_step": 54727, "epoch": 1303} {"train_loss": -5.855859279632568, "global_step": 54728, "epoch": 1303} {"train_loss": -5.745623588562012, "global_step": 54729, "epoch": 1303} {"train_loss": -5.9659013748168945, "global_step": 54730, "epoch": 1303} {"train_loss": -5.895313739776611, "global_step": 54731, "epoch": 1303} {"train_loss": -5.9048027992248535, "global_step": 54732, "epoch": 1303} {"train_loss": -5.9092302322387695, "global_step": 54733, "epoch": 1303} {"train_loss": -5.863560676574707, "global_step": 54734, "epoch": 1303} {"train_loss": -5.8719892501831055, "global_step": 54735, "epoch": 1303} {"train_loss": -5.877984046936035, "global_step": 54736, "epoch": 1303} {"train_loss": -5.835470199584961, "global_step": 54737, "epoch": 1303} {"train_loss": -5.810240745544434, "global_step": 54738, "epoch": 1303} {"train_loss": -5.8009352684021, "global_step": 54739, "epoch": 1303} {"train_loss": -5.8832879066467285, "global_step": 54740, "epoch": 1303} {"train_loss": -5.813671112060547, "global_step": 54741, "epoch": 1303} {"train_loss": -5.884413719177246, "global_step": 54742, "epoch": 1303} {"train_loss": -5.822225570678711, "global_step": 54743, "epoch": 1303} {"train_loss": -5.749238014221191, "global_step": 54744, "epoch": 1303} {"train_loss": -5.9133524894714355, "global_step": 54745, "epoch": 1303} {"train_loss": -5.803431510925293, "global_step": 54746, "epoch": 1303} {"train_loss": -5.718560218811035, "global_step": 54747, "epoch": 1303} {"train_loss": -5.721951484680176, "global_step": 54748, "epoch": 1303} {"train_loss": -5.769246578216553, "global_step": 54749, "epoch": 1303} {"train_loss": -5.840869426727295, "global_step": 54750, "epoch": 1303} {"train_loss": -5.929665565490723, "global_step": 54751, "epoch": 1303} {"train_loss": -5.924499034881592, "global_step": 54752, "epoch": 1303} {"train_loss": -5.796268463134766, "global_step": 54753, "epoch": 1303} {"train_loss": -5.689920902252197, "global_step": 54754, "epoch": 1303} {"train_loss": -5.891008377075195, "global_step": 54755, "epoch": 1303} {"train_loss": -5.697178840637207, "global_step": 54756, "epoch": 1303} {"train_loss": -5.810803413391113, "global_step": 54757, "epoch": 1303} {"train_loss": -5.9531073570251465, "global_step": 54758, "epoch": 1303} {"train_loss": -5.805142402648926, "global_step": 54759, "epoch": 1303} {"train_loss": -5.733573913574219, "global_step": 54760, "epoch": 1303} {"train_loss": -5.8918023109436035, "global_step": 54761, "epoch": 1303} {"train_loss": -5.844278812408447, "global_step": 54762, "epoch": 1303} {"train_loss": -5.878170967102051, "global_step": 54763, "epoch": 1303} {"train_loss": -5.862750053405762, "global_step": 54764, "epoch": 1303} {"train_loss": -5.776098251342773, "global_step": 54765, "epoch": 1303} {"train_loss": -5.800233364105225, "global_step": 54766, "epoch": 1303} {"train_loss": -5.828298773084368, "global_step": 54767, "epoch": 1303, "val_loss": 66449.375} {"train_loss": -5.787291526794434, "global_step": 54768, "epoch": 1304} {"train_loss": -5.77301025390625, "global_step": 54769, "epoch": 1304} {"train_loss": -5.660880088806152, "global_step": 54770, "epoch": 1304} {"train_loss": -5.765994071960449, "global_step": 54771, "epoch": 1304} {"train_loss": -5.732950210571289, "global_step": 54772, "epoch": 1304} {"train_loss": -5.896917343139648, "global_step": 54773, "epoch": 1304} {"train_loss": -5.845149040222168, "global_step": 54774, "epoch": 1304} {"train_loss": -5.710488796234131, "global_step": 54775, "epoch": 1304} {"train_loss": -5.666971206665039, "global_step": 54776, "epoch": 1304} {"train_loss": -5.833486557006836, "global_step": 54777, "epoch": 1304} {"train_loss": -5.841156005859375, "global_step": 54778, "epoch": 1304} {"train_loss": -5.740004062652588, "global_step": 54779, "epoch": 1304} {"train_loss": -5.719449996948242, "global_step": 54780, "epoch": 1304} {"train_loss": -5.748020172119141, "global_step": 54781, "epoch": 1304} {"train_loss": -5.896434783935547, "global_step": 54782, "epoch": 1304} {"train_loss": -5.681550979614258, "global_step": 54783, "epoch": 1304} {"train_loss": -5.871616840362549, "global_step": 54784, "epoch": 1304} {"train_loss": -5.810365676879883, "global_step": 54785, "epoch": 1304} {"train_loss": -5.7880167961120605, "global_step": 54786, "epoch": 1304} {"train_loss": -5.853581428527832, "global_step": 54787, "epoch": 1304} {"train_loss": -5.688558101654053, "global_step": 54788, "epoch": 1304} {"train_loss": -5.598822116851807, "global_step": 54789, "epoch": 1304} {"train_loss": -5.859127044677734, "global_step": 54790, "epoch": 1304} {"train_loss": -5.83486270904541, "global_step": 54791, "epoch": 1304} {"train_loss": -5.742528915405273, "global_step": 54792, "epoch": 1304} {"train_loss": -5.854550361633301, "global_step": 54793, "epoch": 1304} {"train_loss": -5.72786808013916, "global_step": 54794, "epoch": 1304} {"train_loss": -5.822674751281738, "global_step": 54795, "epoch": 1304} {"train_loss": -5.601810455322266, "global_step": 54796, "epoch": 1304} {"train_loss": -5.760668754577637, "global_step": 54797, "epoch": 1304} {"train_loss": -5.742769241333008, "global_step": 54798, "epoch": 1304} {"train_loss": -5.863744735717773, "global_step": 54799, "epoch": 1304} {"train_loss": -5.705897331237793, "global_step": 54800, "epoch": 1304} {"train_loss": -5.751634120941162, "global_step": 54801, "epoch": 1304} {"train_loss": -5.864930152893066, "global_step": 54802, "epoch": 1304} {"train_loss": -5.874545097351074, "global_step": 54803, "epoch": 1304} {"train_loss": -5.765689849853516, "global_step": 54804, "epoch": 1304} {"train_loss": -5.782949447631836, "global_step": 54805, "epoch": 1304} {"train_loss": -5.845326900482178, "global_step": 54806, "epoch": 1304} {"train_loss": -5.885627269744873, "global_step": 54807, "epoch": 1304} {"train_loss": -5.798713684082031, "global_step": 54808, "epoch": 1304} {"train_loss": -5.7801513104211715, "global_step": 54809, "epoch": 1304, "val_loss": 66308.0078125} {"train_loss": -5.90280818939209, "global_step": 54810, "epoch": 1305} {"train_loss": -5.8011155128479, "global_step": 54811, "epoch": 1305} {"train_loss": -5.8416266441345215, "global_step": 54812, "epoch": 1305} {"train_loss": -5.717443466186523, "global_step": 54813, "epoch": 1305} {"train_loss": -5.790676593780518, "global_step": 54814, "epoch": 1305} {"train_loss": -5.7324676513671875, "global_step": 54815, "epoch": 1305} {"train_loss": -5.722123146057129, "global_step": 54816, "epoch": 1305} {"train_loss": -5.711945533752441, "global_step": 54817, "epoch": 1305} {"train_loss": -5.842870712280273, "global_step": 54818, "epoch": 1305} {"train_loss": -5.730259895324707, "global_step": 54819, "epoch": 1305} {"train_loss": -5.853364944458008, "global_step": 54820, "epoch": 1305} {"train_loss": -5.985945224761963, "global_step": 54821, "epoch": 1305} {"train_loss": -5.796239376068115, "global_step": 54822, "epoch": 1305} {"train_loss": -5.8319010734558105, "global_step": 54823, "epoch": 1305} {"train_loss": -5.98185920715332, "global_step": 54824, "epoch": 1305} {"train_loss": -5.857845306396484, "global_step": 54825, "epoch": 1305} {"train_loss": -5.780847072601318, "global_step": 54826, "epoch": 1305} {"train_loss": -5.719958305358887, "global_step": 54827, "epoch": 1305} {"train_loss": -5.896597862243652, "global_step": 54828, "epoch": 1305} {"train_loss": -5.815306663513184, "global_step": 54829, "epoch": 1305} {"train_loss": -5.771825790405273, "global_step": 54830, "epoch": 1305} {"train_loss": -5.84481143951416, "global_step": 54831, "epoch": 1305} {"train_loss": -5.766851902008057, "global_step": 54832, "epoch": 1305} {"train_loss": -5.867857933044434, "global_step": 54833, "epoch": 1305} {"train_loss": -5.81449031829834, "global_step": 54834, "epoch": 1305} {"train_loss": -5.85481071472168, "global_step": 54835, "epoch": 1305} {"train_loss": -5.860874176025391, "global_step": 54836, "epoch": 1305} {"train_loss": -5.87257719039917, "global_step": 54837, "epoch": 1305} {"train_loss": -5.851082801818848, "global_step": 54838, "epoch": 1305} {"train_loss": -5.830659866333008, "global_step": 54839, "epoch": 1305} {"train_loss": -5.7794694900512695, "global_step": 54840, "epoch": 1305} {"train_loss": -5.790475845336914, "global_step": 54841, "epoch": 1305} {"train_loss": -5.701520919799805, "global_step": 54842, "epoch": 1305} {"train_loss": -5.839093208312988, "global_step": 54843, "epoch": 1305} {"train_loss": -5.783535957336426, "global_step": 54844, "epoch": 1305} {"train_loss": -5.926377296447754, "global_step": 54845, "epoch": 1305} {"train_loss": -5.761194705963135, "global_step": 54846, "epoch": 1305} {"train_loss": -5.839234352111816, "global_step": 54847, "epoch": 1305} {"train_loss": -5.702853202819824, "global_step": 54848, "epoch": 1305} {"train_loss": -5.840274810791016, "global_step": 54849, "epoch": 1305} {"train_loss": -5.882623672485352, "global_step": 54850, "epoch": 1305} {"train_loss": -5.819440046946208, "global_step": 54851, "epoch": 1305, "val_loss": 66613.4609375} {"train_loss": -5.806792259216309, "global_step": 54852, "epoch": 1306} {"train_loss": -5.94147253036499, "global_step": 54853, "epoch": 1306} {"train_loss": -5.82476806640625, "global_step": 54854, "epoch": 1306} {"train_loss": -5.836387634277344, "global_step": 54855, "epoch": 1306} {"train_loss": -5.794039726257324, "global_step": 54856, "epoch": 1306} {"train_loss": -5.929350852966309, "global_step": 54857, "epoch": 1306} {"train_loss": -5.780762672424316, "global_step": 54858, "epoch": 1306} {"train_loss": -5.69529914855957, "global_step": 54859, "epoch": 1306} {"train_loss": -5.783507347106934, "global_step": 54860, "epoch": 1306} {"train_loss": -5.76577091217041, "global_step": 54861, "epoch": 1306} {"train_loss": -5.757748126983643, "global_step": 54862, "epoch": 1306} {"train_loss": -5.920027732849121, "global_step": 54863, "epoch": 1306} {"train_loss": -5.8045454025268555, "global_step": 54864, "epoch": 1306} {"train_loss": -5.7743401527404785, "global_step": 54865, "epoch": 1306} {"train_loss": -5.792111873626709, "global_step": 54866, "epoch": 1306} {"train_loss": -5.737331390380859, "global_step": 54867, "epoch": 1306} {"train_loss": -5.778024673461914, "global_step": 54868, "epoch": 1306} {"train_loss": -5.794820785522461, "global_step": 54869, "epoch": 1306} {"train_loss": -5.825967788696289, "global_step": 54870, "epoch": 1306} {"train_loss": -5.796978950500488, "global_step": 54871, "epoch": 1306} {"train_loss": -5.735372543334961, "global_step": 54872, "epoch": 1306} {"train_loss": -5.836609840393066, "global_step": 54873, "epoch": 1306} {"train_loss": -5.79180908203125, "global_step": 54874, "epoch": 1306} {"train_loss": -5.793506622314453, "global_step": 54875, "epoch": 1306} {"train_loss": -5.840600967407227, "global_step": 54876, "epoch": 1306} {"train_loss": -5.865077495574951, "global_step": 54877, "epoch": 1306} {"train_loss": -5.910234451293945, "global_step": 54878, "epoch": 1306} {"train_loss": -5.742630958557129, "global_step": 54879, "epoch": 1306} {"train_loss": -5.882305145263672, "global_step": 54880, "epoch": 1306} {"train_loss": -5.944392204284668, "global_step": 54881, "epoch": 1306} {"train_loss": -5.952446937561035, "global_step": 54882, "epoch": 1306} {"train_loss": -5.804737091064453, "global_step": 54883, "epoch": 1306} {"train_loss": -5.722937107086182, "global_step": 54884, "epoch": 1306} {"train_loss": -5.778903961181641, "global_step": 54885, "epoch": 1306} {"train_loss": -5.7303667068481445, "global_step": 54886, "epoch": 1306} {"train_loss": -5.760361194610596, "global_step": 54887, "epoch": 1306} {"train_loss": -5.762281894683838, "global_step": 54888, "epoch": 1306} {"train_loss": -5.829597473144531, "global_step": 54889, "epoch": 1306} {"train_loss": -5.7497639656066895, "global_step": 54890, "epoch": 1306} {"train_loss": -5.859767913818359, "global_step": 54891, "epoch": 1306} {"train_loss": -5.7821478843688965, "global_step": 54892, "epoch": 1306} {"train_loss": -5.809798887797764, "global_step": 54893, "epoch": 1306, "val_loss": 66235.5} {"train_loss": -5.825839996337891, "global_step": 54894, "epoch": 1307} {"train_loss": -5.84982967376709, "global_step": 54895, "epoch": 1307} {"train_loss": -5.925061225891113, "global_step": 54896, "epoch": 1307} {"train_loss": -5.798479080200195, "global_step": 54897, "epoch": 1307} {"train_loss": -5.666175842285156, "global_step": 54898, "epoch": 1307} {"train_loss": -5.811756134033203, "global_step": 54899, "epoch": 1307} {"train_loss": -5.793450355529785, "global_step": 54900, "epoch": 1307} {"train_loss": -5.742897987365723, "global_step": 54901, "epoch": 1307} {"train_loss": -5.844491958618164, "global_step": 54902, "epoch": 1307} {"train_loss": -5.699997901916504, "global_step": 54903, "epoch": 1307} {"train_loss": -5.9101362228393555, "global_step": 54904, "epoch": 1307} {"train_loss": -5.654626846313477, "global_step": 54905, "epoch": 1307} {"train_loss": -5.794400215148926, "global_step": 54906, "epoch": 1307} {"train_loss": -5.829257488250732, "global_step": 54907, "epoch": 1307} {"train_loss": -5.881387710571289, "global_step": 54908, "epoch": 1307} {"train_loss": -5.891183853149414, "global_step": 54909, "epoch": 1307} {"train_loss": -5.732215881347656, "global_step": 54910, "epoch": 1307} {"train_loss": -5.715795993804932, "global_step": 54911, "epoch": 1307} {"train_loss": -5.773663520812988, "global_step": 54912, "epoch": 1307} {"train_loss": -5.876755237579346, "global_step": 54913, "epoch": 1307} {"train_loss": -5.773378372192383, "global_step": 54914, "epoch": 1307} {"train_loss": -5.8635101318359375, "global_step": 54915, "epoch": 1307} {"train_loss": -5.759517669677734, "global_step": 54916, "epoch": 1307} {"train_loss": -5.768531322479248, "global_step": 54917, "epoch": 1307} {"train_loss": -5.937936782836914, "global_step": 54918, "epoch": 1307} {"train_loss": -5.770486831665039, "global_step": 54919, "epoch": 1307} {"train_loss": -5.798618793487549, "global_step": 54920, "epoch": 1307} {"train_loss": -5.805644989013672, "global_step": 54921, "epoch": 1307} {"train_loss": -5.859196662902832, "global_step": 54922, "epoch": 1307} {"train_loss": -5.877842426300049, "global_step": 54923, "epoch": 1307} {"train_loss": -5.651241302490234, "global_step": 54924, "epoch": 1307} {"train_loss": -5.672628402709961, "global_step": 54925, "epoch": 1307} {"train_loss": -5.753753185272217, "global_step": 54926, "epoch": 1307} {"train_loss": -5.790373802185059, "global_step": 54927, "epoch": 1307} {"train_loss": -5.69972038269043, "global_step": 54928, "epoch": 1307} {"train_loss": -5.781380653381348, "global_step": 54929, "epoch": 1307} {"train_loss": -5.800741195678711, "global_step": 54930, "epoch": 1307} {"train_loss": -5.917409896850586, "global_step": 54931, "epoch": 1307} {"train_loss": -5.674522876739502, "global_step": 54932, "epoch": 1307} {"train_loss": -5.853429794311523, "global_step": 54933, "epoch": 1307} {"train_loss": -5.850223541259766, "global_step": 54934, "epoch": 1307} {"train_loss": -5.797136613300869, "global_step": 54935, "epoch": 1307, "val_loss": 66313.2578125} {"train_loss": -5.8134260177612305, "global_step": 54936, "epoch": 1308} {"train_loss": -5.8605475425720215, "global_step": 54937, "epoch": 1308} {"train_loss": -5.8372721672058105, "global_step": 54938, "epoch": 1308} {"train_loss": -5.8696746826171875, "global_step": 54939, "epoch": 1308} {"train_loss": -5.802396774291992, "global_step": 54940, "epoch": 1308} {"train_loss": -5.8656721115112305, "global_step": 54941, "epoch": 1308} {"train_loss": -5.871635437011719, "global_step": 54942, "epoch": 1308} {"train_loss": -5.840332508087158, "global_step": 54943, "epoch": 1308} {"train_loss": -5.915676593780518, "global_step": 54944, "epoch": 1308} {"train_loss": -5.736166954040527, "global_step": 54945, "epoch": 1308} {"train_loss": -5.927585601806641, "global_step": 54946, "epoch": 1308} {"train_loss": -5.900223731994629, "global_step": 54947, "epoch": 1308} {"train_loss": -5.751959800720215, "global_step": 54948, "epoch": 1308} {"train_loss": -5.840269088745117, "global_step": 54949, "epoch": 1308} {"train_loss": -5.80235481262207, "global_step": 54950, "epoch": 1308} {"train_loss": -5.777327537536621, "global_step": 54951, "epoch": 1308} {"train_loss": -5.783815383911133, "global_step": 54952, "epoch": 1308} {"train_loss": -5.80836296081543, "global_step": 54953, "epoch": 1308} {"train_loss": -5.911287307739258, "global_step": 54954, "epoch": 1308} {"train_loss": -5.885411739349365, "global_step": 54955, "epoch": 1308} {"train_loss": -5.844051837921143, "global_step": 54956, "epoch": 1308} {"train_loss": -5.902392387390137, "global_step": 54957, "epoch": 1308} {"train_loss": -5.741364479064941, "global_step": 54958, "epoch": 1308} {"train_loss": -5.841320037841797, "global_step": 54959, "epoch": 1308} {"train_loss": -5.766008377075195, "global_step": 54960, "epoch": 1308} {"train_loss": -5.791831970214844, "global_step": 54961, "epoch": 1308} {"train_loss": -5.817200183868408, "global_step": 54962, "epoch": 1308} {"train_loss": -5.831991672515869, "global_step": 54963, "epoch": 1308} {"train_loss": -5.8715009689331055, "global_step": 54964, "epoch": 1308} {"train_loss": -5.695041656494141, "global_step": 54965, "epoch": 1308} {"train_loss": -5.61248779296875, "global_step": 54966, "epoch": 1308} {"train_loss": -5.801474571228027, "global_step": 54967, "epoch": 1308} {"train_loss": -5.74990177154541, "global_step": 54968, "epoch": 1308} {"train_loss": -5.711063861846924, "global_step": 54969, "epoch": 1308} {"train_loss": -5.786376953125, "global_step": 54970, "epoch": 1308} {"train_loss": -5.644857406616211, "global_step": 54971, "epoch": 1308} {"train_loss": -5.786526679992676, "global_step": 54972, "epoch": 1308} {"train_loss": -5.8772358894348145, "global_step": 54973, "epoch": 1308} {"train_loss": -5.843205451965332, "global_step": 54974, "epoch": 1308} {"train_loss": -5.811638355255127, "global_step": 54975, "epoch": 1308} {"train_loss": -5.880989074707031, "global_step": 54976, "epoch": 1308} {"train_loss": -5.812883944738479, "global_step": 54977, "epoch": 1308, "val_loss": 66765.9375} {"train_loss": -5.808180332183838, "global_step": 54978, "epoch": 1309} {"train_loss": -5.700878143310547, "global_step": 54979, "epoch": 1309} {"train_loss": -5.746837615966797, "global_step": 54980, "epoch": 1309} {"train_loss": -5.788801193237305, "global_step": 54981, "epoch": 1309} {"train_loss": -5.943083763122559, "global_step": 54982, "epoch": 1309} {"train_loss": -5.88393497467041, "global_step": 54983, "epoch": 1309} {"train_loss": -5.872302532196045, "global_step": 54984, "epoch": 1309} {"train_loss": -5.814387321472168, "global_step": 54985, "epoch": 1309} {"train_loss": -5.831566333770752, "global_step": 54986, "epoch": 1309} {"train_loss": -5.792450904846191, "global_step": 54987, "epoch": 1309} {"train_loss": -5.790701866149902, "global_step": 54988, "epoch": 1309} {"train_loss": -5.77996826171875, "global_step": 54989, "epoch": 1309} {"train_loss": -5.80515193939209, "global_step": 54990, "epoch": 1309} {"train_loss": -5.806456565856934, "global_step": 54991, "epoch": 1309} {"train_loss": -5.780277252197266, "global_step": 54992, "epoch": 1309} {"train_loss": -5.7567057609558105, "global_step": 54993, "epoch": 1309} {"train_loss": -5.84805154800415, "global_step": 54994, "epoch": 1309} {"train_loss": -5.771090984344482, "global_step": 54995, "epoch": 1309} {"train_loss": -5.918174743652344, "global_step": 54996, "epoch": 1309} {"train_loss": -5.753887176513672, "global_step": 54997, "epoch": 1309} {"train_loss": -5.8662543296813965, "global_step": 54998, "epoch": 1309} {"train_loss": -5.701491355895996, "global_step": 54999, "epoch": 1309} {"train_loss": -5.682460784912109, "global_step": 55000, "epoch": 1309} {"train_loss": -5.643792629241943, "global_step": 55001, "epoch": 1309} {"train_loss": -5.714659690856934, "global_step": 55002, "epoch": 1309} {"train_loss": -5.895538330078125, "global_step": 55003, "epoch": 1309} {"train_loss": -5.739443778991699, "global_step": 55004, "epoch": 1309} {"train_loss": -5.791969299316406, "global_step": 55005, "epoch": 1309} {"train_loss": -5.810190200805664, "global_step": 55006, "epoch": 1309} {"train_loss": -5.904333114624023, "global_step": 55007, "epoch": 1309} {"train_loss": -5.780301094055176, "global_step": 55008, "epoch": 1309} {"train_loss": -5.732590675354004, "global_step": 55009, "epoch": 1309} {"train_loss": -5.871870040893555, "global_step": 55010, "epoch": 1309} {"train_loss": -5.798035621643066, "global_step": 55011, "epoch": 1309} {"train_loss": -5.771583557128906, "global_step": 55012, "epoch": 1309} {"train_loss": -5.72251033782959, "global_step": 55013, "epoch": 1309} {"train_loss": -5.783196449279785, "global_step": 55014, "epoch": 1309} {"train_loss": -5.861393451690674, "global_step": 55015, "epoch": 1309} {"train_loss": -5.891434192657471, "global_step": 55016, "epoch": 1309} {"train_loss": -5.880513668060303, "global_step": 55017, "epoch": 1309} {"train_loss": -5.840300559997559, "global_step": 55018, "epoch": 1309} {"train_loss": -5.806606008892968, "global_step": 55019, "epoch": 1309, "val_loss": 66443.0078125} {"train_loss": -5.757220268249512, "global_step": 55020, "epoch": 1310} {"train_loss": -5.762787342071533, "global_step": 55021, "epoch": 1310} {"train_loss": -5.887750625610352, "global_step": 55022, "epoch": 1310} {"train_loss": -5.828624725341797, "global_step": 55023, "epoch": 1310} {"train_loss": -5.930550575256348, "global_step": 55024, "epoch": 1310} {"train_loss": -5.832517623901367, "global_step": 55025, "epoch": 1310} {"train_loss": -5.754825592041016, "global_step": 55026, "epoch": 1310} {"train_loss": -5.865375518798828, "global_step": 55027, "epoch": 1310} {"train_loss": -5.839132785797119, "global_step": 55028, "epoch": 1310} {"train_loss": -5.886566162109375, "global_step": 55029, "epoch": 1310} {"train_loss": -5.811968803405762, "global_step": 55030, "epoch": 1310} {"train_loss": -5.895090579986572, "global_step": 55031, "epoch": 1310} {"train_loss": -5.808130741119385, "global_step": 55032, "epoch": 1310} {"train_loss": -5.896127700805664, "global_step": 55033, "epoch": 1310} {"train_loss": -5.882076263427734, "global_step": 55034, "epoch": 1310} {"train_loss": -5.855813026428223, "global_step": 55035, "epoch": 1310} {"train_loss": -5.89627742767334, "global_step": 55036, "epoch": 1310} {"train_loss": -5.918754577636719, "global_step": 55037, "epoch": 1310} {"train_loss": -5.801753520965576, "global_step": 55038, "epoch": 1310} {"train_loss": -5.946023941040039, "global_step": 55039, "epoch": 1310} {"train_loss": -5.792691707611084, "global_step": 55040, "epoch": 1310} {"train_loss": -5.799369812011719, "global_step": 55041, "epoch": 1310} {"train_loss": -5.818550109863281, "global_step": 55042, "epoch": 1310} {"train_loss": -5.900570392608643, "global_step": 55043, "epoch": 1310} {"train_loss": -5.941209316253662, "global_step": 55044, "epoch": 1310} {"train_loss": -5.77507209777832, "global_step": 55045, "epoch": 1310} {"train_loss": -5.816051959991455, "global_step": 55046, "epoch": 1310} {"train_loss": -5.782332897186279, "global_step": 55047, "epoch": 1310} {"train_loss": -5.7992048263549805, "global_step": 55048, "epoch": 1310} {"train_loss": -5.762546062469482, "global_step": 55049, "epoch": 1310} {"train_loss": -5.794219970703125, "global_step": 55050, "epoch": 1310} {"train_loss": -5.854508876800537, "global_step": 55051, "epoch": 1310} {"train_loss": -5.735720634460449, "global_step": 55052, "epoch": 1310} {"train_loss": -5.839648246765137, "global_step": 55053, "epoch": 1310} {"train_loss": -5.781822681427002, "global_step": 55054, "epoch": 1310} {"train_loss": -5.874680519104004, "global_step": 55055, "epoch": 1310} {"train_loss": -5.881026268005371, "global_step": 55056, "epoch": 1310} {"train_loss": -5.853392601013184, "global_step": 55057, "epoch": 1310} {"train_loss": -5.8630266189575195, "global_step": 55058, "epoch": 1310} {"train_loss": -5.809340000152588, "global_step": 55059, "epoch": 1310} {"train_loss": -5.949835777282715, "global_step": 55060, "epoch": 1310} {"train_loss": -5.840120429084415, "global_step": 55061, "epoch": 1310, "val_loss": 66348.5625} {"train_loss": -5.81377649307251, "global_step": 55062, "epoch": 1311} {"train_loss": -5.961799144744873, "global_step": 55063, "epoch": 1311} {"train_loss": -5.898421287536621, "global_step": 55064, "epoch": 1311} {"train_loss": -5.845714092254639, "global_step": 55065, "epoch": 1311} {"train_loss": -5.723145484924316, "global_step": 55066, "epoch": 1311} {"train_loss": -5.803894519805908, "global_step": 55067, "epoch": 1311} {"train_loss": -5.883406162261963, "global_step": 55068, "epoch": 1311} {"train_loss": -5.866610527038574, "global_step": 55069, "epoch": 1311} {"train_loss": -5.812200546264648, "global_step": 55070, "epoch": 1311} {"train_loss": -5.762706756591797, "global_step": 55071, "epoch": 1311} {"train_loss": -5.768670558929443, "global_step": 55072, "epoch": 1311} {"train_loss": -5.828673362731934, "global_step": 55073, "epoch": 1311} {"train_loss": -5.845153331756592, "global_step": 55074, "epoch": 1311} {"train_loss": -5.85417366027832, "global_step": 55075, "epoch": 1311} {"train_loss": -5.783458232879639, "global_step": 55076, "epoch": 1311} {"train_loss": -5.741960525512695, "global_step": 55077, "epoch": 1311} {"train_loss": -5.798081398010254, "global_step": 55078, "epoch": 1311} {"train_loss": -5.811826229095459, "global_step": 55079, "epoch": 1311} {"train_loss": -5.672993183135986, "global_step": 55080, "epoch": 1311} {"train_loss": -5.889220237731934, "global_step": 55081, "epoch": 1311} {"train_loss": -5.743152618408203, "global_step": 55082, "epoch": 1311} {"train_loss": -5.804975509643555, "global_step": 55083, "epoch": 1311} {"train_loss": -5.735379219055176, "global_step": 55084, "epoch": 1311} {"train_loss": -5.725062847137451, "global_step": 55085, "epoch": 1311} {"train_loss": -5.822504997253418, "global_step": 55086, "epoch": 1311} {"train_loss": -5.654990196228027, "global_step": 55087, "epoch": 1311} {"train_loss": -5.851373672485352, "global_step": 55088, "epoch": 1311} {"train_loss": -5.760056972503662, "global_step": 55089, "epoch": 1311} {"train_loss": -5.902949333190918, "global_step": 55090, "epoch": 1311} {"train_loss": -5.771141052246094, "global_step": 55091, "epoch": 1311} {"train_loss": -5.800130844116211, "global_step": 55092, "epoch": 1311} {"train_loss": -5.871037483215332, "global_step": 55093, "epoch": 1311} {"train_loss": -5.714529991149902, "global_step": 55094, "epoch": 1311} {"train_loss": -5.81654691696167, "global_step": 55095, "epoch": 1311} {"train_loss": -5.891753196716309, "global_step": 55096, "epoch": 1311} {"train_loss": -5.915138244628906, "global_step": 55097, "epoch": 1311} {"train_loss": -5.8860673904418945, "global_step": 55098, "epoch": 1311} {"train_loss": -5.721792221069336, "global_step": 55099, "epoch": 1311} {"train_loss": -5.875054359436035, "global_step": 55100, "epoch": 1311} {"train_loss": -5.848231315612793, "global_step": 55101, "epoch": 1311} {"train_loss": -5.714278221130371, "global_step": 55102, "epoch": 1311} {"train_loss": -5.810078950155349, "global_step": 55103, "epoch": 1311, "val_loss": 66531.3984375} {"train_loss": -5.830670356750488, "global_step": 55104, "epoch": 1312} {"train_loss": -5.9114789962768555, "global_step": 55105, "epoch": 1312} {"train_loss": -5.845401763916016, "global_step": 55106, "epoch": 1312} {"train_loss": -5.8904266357421875, "global_step": 55107, "epoch": 1312} {"train_loss": -5.883254528045654, "global_step": 55108, "epoch": 1312} {"train_loss": -5.867209434509277, "global_step": 55109, "epoch": 1312} {"train_loss": -5.728168487548828, "global_step": 55110, "epoch": 1312} {"train_loss": -5.731678485870361, "global_step": 55111, "epoch": 1312} {"train_loss": -5.79171085357666, "global_step": 55112, "epoch": 1312} {"train_loss": -5.795068264007568, "global_step": 55113, "epoch": 1312} {"train_loss": -5.8138580322265625, "global_step": 55114, "epoch": 1312} {"train_loss": -5.611175537109375, "global_step": 55115, "epoch": 1312} {"train_loss": -5.856417655944824, "global_step": 55116, "epoch": 1312} {"train_loss": -5.804659843444824, "global_step": 55117, "epoch": 1312} {"train_loss": -5.867887020111084, "global_step": 55118, "epoch": 1312} {"train_loss": -5.793196678161621, "global_step": 55119, "epoch": 1312} {"train_loss": -5.850405216217041, "global_step": 55120, "epoch": 1312} {"train_loss": -5.83901309967041, "global_step": 55121, "epoch": 1312} {"train_loss": -5.843778133392334, "global_step": 55122, "epoch": 1312} {"train_loss": -5.800772190093994, "global_step": 55123, "epoch": 1312} {"train_loss": -5.856452941894531, "global_step": 55124, "epoch": 1312} {"train_loss": -5.807402610778809, "global_step": 55125, "epoch": 1312} {"train_loss": -5.884158134460449, "global_step": 55126, "epoch": 1312} {"train_loss": -5.891849040985107, "global_step": 55127, "epoch": 1312} {"train_loss": -5.851507186889648, "global_step": 55128, "epoch": 1312} {"train_loss": -5.842960357666016, "global_step": 55129, "epoch": 1312} {"train_loss": -5.83990478515625, "global_step": 55130, "epoch": 1312} {"train_loss": -5.794775009155273, "global_step": 55131, "epoch": 1312} {"train_loss": -5.825973987579346, "global_step": 55132, "epoch": 1312} {"train_loss": -5.953914642333984, "global_step": 55133, "epoch": 1312} {"train_loss": -5.7446489334106445, "global_step": 55134, "epoch": 1312} {"train_loss": -5.771796226501465, "global_step": 55135, "epoch": 1312} {"train_loss": -5.826454162597656, "global_step": 55136, "epoch": 1312} {"train_loss": -5.873369216918945, "global_step": 55137, "epoch": 1312} {"train_loss": -5.871417999267578, "global_step": 55138, "epoch": 1312} {"train_loss": -5.762874603271484, "global_step": 55139, "epoch": 1312} {"train_loss": -5.818121433258057, "global_step": 55140, "epoch": 1312} {"train_loss": -5.830082416534424, "global_step": 55141, "epoch": 1312} {"train_loss": -5.870588302612305, "global_step": 55142, "epoch": 1312} {"train_loss": -5.795737266540527, "global_step": 55143, "epoch": 1312} {"train_loss": -5.748622894287109, "global_step": 55144, "epoch": 1312} {"train_loss": -5.82624161811102, "global_step": 55145, "epoch": 1312, "val_loss": 66334.8515625} {"train_loss": -5.818733215332031, "global_step": 55146, "epoch": 1313} {"train_loss": -5.862408638000488, "global_step": 55147, "epoch": 1313} {"train_loss": -5.8502397537231445, "global_step": 55148, "epoch": 1313} {"train_loss": -5.875290393829346, "global_step": 55149, "epoch": 1313} {"train_loss": -5.946111679077148, "global_step": 55150, "epoch": 1313} {"train_loss": -5.763289451599121, "global_step": 55151, "epoch": 1313} {"train_loss": -5.888654708862305, "global_step": 55152, "epoch": 1313} {"train_loss": -5.716884613037109, "global_step": 55153, "epoch": 1313} {"train_loss": -5.833286285400391, "global_step": 55154, "epoch": 1313} {"train_loss": -5.802436351776123, "global_step": 55155, "epoch": 1313} {"train_loss": -5.812966346740723, "global_step": 55156, "epoch": 1313} {"train_loss": -5.82585334777832, "global_step": 55157, "epoch": 1313} {"train_loss": -5.811161041259766, "global_step": 55158, "epoch": 1313} {"train_loss": -5.731232643127441, "global_step": 55159, "epoch": 1313} {"train_loss": -5.799271583557129, "global_step": 55160, "epoch": 1313} {"train_loss": -5.740348815917969, "global_step": 55161, "epoch": 1313} {"train_loss": -5.818304538726807, "global_step": 55162, "epoch": 1313} {"train_loss": -5.85817813873291, "global_step": 55163, "epoch": 1313} {"train_loss": -5.7916765213012695, "global_step": 55164, "epoch": 1313} {"train_loss": -5.77836799621582, "global_step": 55165, "epoch": 1313} {"train_loss": -5.840696811676025, "global_step": 55166, "epoch": 1313} {"train_loss": -5.796622276306152, "global_step": 55167, "epoch": 1313} {"train_loss": -5.928221702575684, "global_step": 55168, "epoch": 1313} {"train_loss": -5.899554252624512, "global_step": 55169, "epoch": 1313} {"train_loss": -5.862912178039551, "global_step": 55170, "epoch": 1313} {"train_loss": -5.986678123474121, "global_step": 55171, "epoch": 1313} {"train_loss": -5.8082475662231445, "global_step": 55172, "epoch": 1313} {"train_loss": -5.761831283569336, "global_step": 55173, "epoch": 1313} {"train_loss": -5.890086650848389, "global_step": 55174, "epoch": 1313} {"train_loss": -5.883484363555908, "global_step": 55175, "epoch": 1313} {"train_loss": -5.745119571685791, "global_step": 55176, "epoch": 1313} {"train_loss": -5.701669216156006, "global_step": 55177, "epoch": 1313} {"train_loss": -5.869287014007568, "global_step": 55178, "epoch": 1313} {"train_loss": -5.872624397277832, "global_step": 55179, "epoch": 1313} {"train_loss": -5.914178371429443, "global_step": 55180, "epoch": 1313} {"train_loss": -5.861591339111328, "global_step": 55181, "epoch": 1313} {"train_loss": -5.745780944824219, "global_step": 55182, "epoch": 1313} {"train_loss": -5.895918846130371, "global_step": 55183, "epoch": 1313} {"train_loss": -5.842810153961182, "global_step": 55184, "epoch": 1313} {"train_loss": -5.8539137840271, "global_step": 55185, "epoch": 1313} {"train_loss": -5.908625602722168, "global_step": 55186, "epoch": 1313} {"train_loss": -5.831398464384533, "global_step": 55187, "epoch": 1313, "val_loss": 66420.8359375} {"train_loss": -5.874335289001465, "global_step": 55188, "epoch": 1314} {"train_loss": -5.730798721313477, "global_step": 55189, "epoch": 1314} {"train_loss": -5.927068710327148, "global_step": 55190, "epoch": 1314} {"train_loss": -5.816014289855957, "global_step": 55191, "epoch": 1314} {"train_loss": -5.871304512023926, "global_step": 55192, "epoch": 1314} {"train_loss": -5.773736953735352, "global_step": 55193, "epoch": 1314} {"train_loss": -5.842988967895508, "global_step": 55194, "epoch": 1314} {"train_loss": -5.838922500610352, "global_step": 55195, "epoch": 1314} {"train_loss": -5.9135661125183105, "global_step": 55196, "epoch": 1314} {"train_loss": -5.705072402954102, "global_step": 55197, "epoch": 1314} {"train_loss": -5.706419467926025, "global_step": 55198, "epoch": 1314} {"train_loss": -5.941823959350586, "global_step": 55199, "epoch": 1314} {"train_loss": -5.83449649810791, "global_step": 55200, "epoch": 1314} {"train_loss": -5.822954177856445, "global_step": 55201, "epoch": 1314} {"train_loss": -5.966426849365234, "global_step": 55202, "epoch": 1314} {"train_loss": -5.828873634338379, "global_step": 55203, "epoch": 1314} {"train_loss": -5.826435089111328, "global_step": 55204, "epoch": 1314} {"train_loss": -5.815617084503174, "global_step": 55205, "epoch": 1314} {"train_loss": -5.9237823486328125, "global_step": 55206, "epoch": 1314} {"train_loss": -5.7352728843688965, "global_step": 55207, "epoch": 1314} {"train_loss": -5.859851837158203, "global_step": 55208, "epoch": 1314} {"train_loss": -5.730828285217285, "global_step": 55209, "epoch": 1314} {"train_loss": -5.852733612060547, "global_step": 55210, "epoch": 1314} {"train_loss": -5.7705206871032715, "global_step": 55211, "epoch": 1314} {"train_loss": -5.883918762207031, "global_step": 55212, "epoch": 1314} {"train_loss": -5.864009380340576, "global_step": 55213, "epoch": 1314} {"train_loss": -5.93812370300293, "global_step": 55214, "epoch": 1314} {"train_loss": -5.740156173706055, "global_step": 55215, "epoch": 1314} {"train_loss": -5.899925708770752, "global_step": 55216, "epoch": 1314} {"train_loss": -5.880202293395996, "global_step": 55217, "epoch": 1314} {"train_loss": -5.8034257888793945, "global_step": 55218, "epoch": 1314} {"train_loss": -5.782106876373291, "global_step": 55219, "epoch": 1314} {"train_loss": -5.745029449462891, "global_step": 55220, "epoch": 1314} {"train_loss": -5.9069623947143555, "global_step": 55221, "epoch": 1314} {"train_loss": -5.85898494720459, "global_step": 55222, "epoch": 1314} {"train_loss": -5.934711456298828, "global_step": 55223, "epoch": 1314} {"train_loss": -5.868851661682129, "global_step": 55224, "epoch": 1314} {"train_loss": -5.870367527008057, "global_step": 55225, "epoch": 1314} {"train_loss": -5.804954528808594, "global_step": 55226, "epoch": 1314} {"train_loss": -5.892635345458984, "global_step": 55227, "epoch": 1314} {"train_loss": -5.881762981414795, "global_step": 55228, "epoch": 1314} {"train_loss": -5.8404866854349775, "global_step": 55229, "epoch": 1314, "val_loss": 66681.9453125} {"train_loss": -5.8222455978393555, "global_step": 55230, "epoch": 1315} {"train_loss": -5.966658592224121, "global_step": 55231, "epoch": 1315} {"train_loss": -5.918366432189941, "global_step": 55232, "epoch": 1315} {"train_loss": -5.913936614990234, "global_step": 55233, "epoch": 1315} {"train_loss": -5.962307453155518, "global_step": 55234, "epoch": 1315} {"train_loss": -5.812212944030762, "global_step": 55235, "epoch": 1315} {"train_loss": -5.7718658447265625, "global_step": 55236, "epoch": 1315} {"train_loss": -5.745838165283203, "global_step": 55237, "epoch": 1315} {"train_loss": -5.7698845863342285, "global_step": 55238, "epoch": 1315} {"train_loss": -5.821898937225342, "global_step": 55239, "epoch": 1315} {"train_loss": -5.7586259841918945, "global_step": 55240, "epoch": 1315} {"train_loss": -5.832553863525391, "global_step": 55241, "epoch": 1315} {"train_loss": -5.832021713256836, "global_step": 55242, "epoch": 1315} {"train_loss": -5.854497909545898, "global_step": 55243, "epoch": 1315} {"train_loss": -5.685925006866455, "global_step": 55244, "epoch": 1315} {"train_loss": -5.917879104614258, "global_step": 55245, "epoch": 1315} {"train_loss": -5.809194564819336, "global_step": 55246, "epoch": 1315} {"train_loss": -5.792641639709473, "global_step": 55247, "epoch": 1315} {"train_loss": -5.7507643699646, "global_step": 55248, "epoch": 1315} {"train_loss": -5.806530952453613, "global_step": 55249, "epoch": 1315} {"train_loss": -5.69801139831543, "global_step": 55250, "epoch": 1315} {"train_loss": -5.794586181640625, "global_step": 55251, "epoch": 1315} {"train_loss": -5.615477561950684, "global_step": 55252, "epoch": 1315} {"train_loss": -5.884237289428711, "global_step": 55253, "epoch": 1315} {"train_loss": -5.840385437011719, "global_step": 55254, "epoch": 1315} {"train_loss": -5.744561195373535, "global_step": 55255, "epoch": 1315} {"train_loss": -5.942080497741699, "global_step": 55256, "epoch": 1315} {"train_loss": -5.766910552978516, "global_step": 55257, "epoch": 1315} {"train_loss": -5.774991512298584, "global_step": 55258, "epoch": 1315} {"train_loss": -5.813113212585449, "global_step": 55259, "epoch": 1315} {"train_loss": -5.805718421936035, "global_step": 55260, "epoch": 1315} {"train_loss": -5.720426082611084, "global_step": 55261, "epoch": 1315} {"train_loss": -5.794907569885254, "global_step": 55262, "epoch": 1315} {"train_loss": -5.838419437408447, "global_step": 55263, "epoch": 1315} {"train_loss": -5.735821723937988, "global_step": 55264, "epoch": 1315} {"train_loss": -5.7430033683776855, "global_step": 55265, "epoch": 1315} {"train_loss": -5.8502516746521, "global_step": 55266, "epoch": 1315} {"train_loss": -5.848914623260498, "global_step": 55267, "epoch": 1315} {"train_loss": -5.802642822265625, "global_step": 55268, "epoch": 1315} {"train_loss": -5.681033134460449, "global_step": 55269, "epoch": 1315} {"train_loss": -5.760406970977783, "global_step": 55270, "epoch": 1315} {"train_loss": -5.803413527352469, "global_step": 55271, "epoch": 1315, "val_loss": 66728.328125} {"train_loss": -5.978030681610107, "global_step": 55272, "epoch": 1316} {"train_loss": -5.860656261444092, "global_step": 55273, "epoch": 1316} {"train_loss": -5.768469333648682, "global_step": 55274, "epoch": 1316} {"train_loss": -5.867649078369141, "global_step": 55275, "epoch": 1316} {"train_loss": -5.878237724304199, "global_step": 55276, "epoch": 1316} {"train_loss": -5.97268009185791, "global_step": 55277, "epoch": 1316} {"train_loss": -5.788555145263672, "global_step": 55278, "epoch": 1316} {"train_loss": -5.8373260498046875, "global_step": 55279, "epoch": 1316} {"train_loss": -5.937220573425293, "global_step": 55280, "epoch": 1316} {"train_loss": -5.7548723220825195, "global_step": 55281, "epoch": 1316} {"train_loss": -5.86685037612915, "global_step": 55282, "epoch": 1316} {"train_loss": -5.886940956115723, "global_step": 55283, "epoch": 1316} {"train_loss": -5.770815372467041, "global_step": 55284, "epoch": 1316} {"train_loss": -5.699409484863281, "global_step": 55285, "epoch": 1316} {"train_loss": -5.938039302825928, "global_step": 55286, "epoch": 1316} {"train_loss": -5.792410850524902, "global_step": 55287, "epoch": 1316} {"train_loss": -5.793430805206299, "global_step": 55288, "epoch": 1316} {"train_loss": -5.713728904724121, "global_step": 55289, "epoch": 1316} {"train_loss": -5.750924110412598, "global_step": 55290, "epoch": 1316} {"train_loss": -5.789241313934326, "global_step": 55291, "epoch": 1316} {"train_loss": -5.823719024658203, "global_step": 55292, "epoch": 1316} {"train_loss": -5.796146392822266, "global_step": 55293, "epoch": 1316} {"train_loss": -5.87078857421875, "global_step": 55294, "epoch": 1316} {"train_loss": -5.819737911224365, "global_step": 55295, "epoch": 1316} {"train_loss": -5.744689464569092, "global_step": 55296, "epoch": 1316} {"train_loss": -5.860813140869141, "global_step": 55297, "epoch": 1316} {"train_loss": -5.749942302703857, "global_step": 55298, "epoch": 1316} {"train_loss": -5.826357364654541, "global_step": 55299, "epoch": 1316} {"train_loss": -5.689596652984619, "global_step": 55300, "epoch": 1316} {"train_loss": -5.852023601531982, "global_step": 55301, "epoch": 1316} {"train_loss": -5.777874946594238, "global_step": 55302, "epoch": 1316} {"train_loss": -5.809576988220215, "global_step": 55303, "epoch": 1316} {"train_loss": -5.934972286224365, "global_step": 55304, "epoch": 1316} {"train_loss": -5.764861106872559, "global_step": 55305, "epoch": 1316} {"train_loss": -5.956202507019043, "global_step": 55306, "epoch": 1316} {"train_loss": -5.8412652015686035, "global_step": 55307, "epoch": 1316} {"train_loss": -5.835953235626221, "global_step": 55308, "epoch": 1316} {"train_loss": -5.916007995605469, "global_step": 55309, "epoch": 1316} {"train_loss": -5.782985687255859, "global_step": 55310, "epoch": 1316} {"train_loss": -5.883307456970215, "global_step": 55311, "epoch": 1316} {"train_loss": -5.759949684143066, "global_step": 55312, "epoch": 1316} {"train_loss": -5.825799351646786, "global_step": 55313, "epoch": 1316, "val_loss": 66751.1875} {"train_loss": -5.814876556396484, "global_step": 55314, "epoch": 1317} {"train_loss": -5.715327262878418, "global_step": 55315, "epoch": 1317} {"train_loss": -5.814929962158203, "global_step": 55316, "epoch": 1317} {"train_loss": -5.801107406616211, "global_step": 55317, "epoch": 1317} {"train_loss": -5.795379161834717, "global_step": 55318, "epoch": 1317} {"train_loss": -5.832486629486084, "global_step": 55319, "epoch": 1317} {"train_loss": -5.762833595275879, "global_step": 55320, "epoch": 1317} {"train_loss": -5.771207809448242, "global_step": 55321, "epoch": 1317} {"train_loss": -5.877418041229248, "global_step": 55322, "epoch": 1317} {"train_loss": -5.793210983276367, "global_step": 55323, "epoch": 1317} {"train_loss": -5.808467864990234, "global_step": 55324, "epoch": 1317} {"train_loss": -5.774667739868164, "global_step": 55325, "epoch": 1317} {"train_loss": -5.830687999725342, "global_step": 55326, "epoch": 1317} {"train_loss": -5.690967082977295, "global_step": 55327, "epoch": 1317} {"train_loss": -5.774371147155762, "global_step": 55328, "epoch": 1317} {"train_loss": -5.681093692779541, "global_step": 55329, "epoch": 1317} {"train_loss": -5.941377639770508, "global_step": 55330, "epoch": 1317} {"train_loss": -5.8327178955078125, "global_step": 55331, "epoch": 1317} {"train_loss": -5.935941219329834, "global_step": 55332, "epoch": 1317} {"train_loss": -5.8555145263671875, "global_step": 55333, "epoch": 1317} {"train_loss": -5.847414970397949, "global_step": 55334, "epoch": 1317} {"train_loss": -5.825638294219971, "global_step": 55335, "epoch": 1317} {"train_loss": -5.893956661224365, "global_step": 55336, "epoch": 1317} {"train_loss": -5.823370933532715, "global_step": 55337, "epoch": 1317} {"train_loss": -5.7947587966918945, "global_step": 55338, "epoch": 1317} {"train_loss": -5.760804176330566, "global_step": 55339, "epoch": 1317} {"train_loss": -5.7604570388793945, "global_step": 55340, "epoch": 1317} {"train_loss": -5.863900661468506, "global_step": 55341, "epoch": 1317} {"train_loss": -5.815582275390625, "global_step": 55342, "epoch": 1317} {"train_loss": -5.829751491546631, "global_step": 55343, "epoch": 1317} {"train_loss": -5.733341693878174, "global_step": 55344, "epoch": 1317} {"train_loss": -5.780659198760986, "global_step": 55345, "epoch": 1317} {"train_loss": -5.8553314208984375, "global_step": 55346, "epoch": 1317} {"train_loss": -5.773286819458008, "global_step": 55347, "epoch": 1317} {"train_loss": -5.789783477783203, "global_step": 55348, "epoch": 1317} {"train_loss": -5.830002784729004, "global_step": 55349, "epoch": 1317} {"train_loss": -5.860502243041992, "global_step": 55350, "epoch": 1317} {"train_loss": -5.884895324707031, "global_step": 55351, "epoch": 1317} {"train_loss": -5.906213283538818, "global_step": 55352, "epoch": 1317} {"train_loss": -5.870667457580566, "global_step": 55353, "epoch": 1317} {"train_loss": -5.8727874755859375, "global_step": 55354, "epoch": 1317} {"train_loss": -5.818821180434454, "global_step": 55355, "epoch": 1317, "val_loss": 66568.0078125} {"train_loss": -5.935732841491699, "global_step": 55356, "epoch": 1318} {"train_loss": -5.772578239440918, "global_step": 55357, "epoch": 1318} {"train_loss": -5.739555358886719, "global_step": 55358, "epoch": 1318} {"train_loss": -5.7867608070373535, "global_step": 55359, "epoch": 1318} {"train_loss": -5.875364303588867, "global_step": 55360, "epoch": 1318} {"train_loss": -5.797436714172363, "global_step": 55361, "epoch": 1318} {"train_loss": -5.961271286010742, "global_step": 55362, "epoch": 1318} {"train_loss": -5.839309215545654, "global_step": 55363, "epoch": 1318} {"train_loss": -5.873798370361328, "global_step": 55364, "epoch": 1318} {"train_loss": -5.884422302246094, "global_step": 55365, "epoch": 1318} {"train_loss": -5.88353157043457, "global_step": 55366, "epoch": 1318} {"train_loss": -5.812873840332031, "global_step": 55367, "epoch": 1318} {"train_loss": -5.796667575836182, "global_step": 55368, "epoch": 1318} {"train_loss": -5.843893051147461, "global_step": 55369, "epoch": 1318} {"train_loss": -5.905994415283203, "global_step": 55370, "epoch": 1318} {"train_loss": -5.698973178863525, "global_step": 55371, "epoch": 1318} {"train_loss": -5.865151405334473, "global_step": 55372, "epoch": 1318} {"train_loss": -5.855159759521484, "global_step": 55373, "epoch": 1318} {"train_loss": -5.766902446746826, "global_step": 55374, "epoch": 1318} {"train_loss": -5.92426872253418, "global_step": 55375, "epoch": 1318} {"train_loss": -5.80262565612793, "global_step": 55376, "epoch": 1318} {"train_loss": -5.816780090332031, "global_step": 55377, "epoch": 1318} {"train_loss": -5.7770280838012695, "global_step": 55378, "epoch": 1318} {"train_loss": -5.806907653808594, "global_step": 55379, "epoch": 1318} {"train_loss": -5.926011085510254, "global_step": 55380, "epoch": 1318} {"train_loss": -5.854840278625488, "global_step": 55381, "epoch": 1318} {"train_loss": -5.796280860900879, "global_step": 55382, "epoch": 1318} {"train_loss": -5.797236919403076, "global_step": 55383, "epoch": 1318} {"train_loss": -5.76456356048584, "global_step": 55384, "epoch": 1318} {"train_loss": -5.679306983947754, "global_step": 55385, "epoch": 1318} {"train_loss": -5.772059440612793, "global_step": 55386, "epoch": 1318} {"train_loss": -5.833868980407715, "global_step": 55387, "epoch": 1318} {"train_loss": -5.77376651763916, "global_step": 55388, "epoch": 1318} {"train_loss": -5.793593883514404, "global_step": 55389, "epoch": 1318} {"train_loss": -5.6967315673828125, "global_step": 55390, "epoch": 1318} {"train_loss": -5.71376895904541, "global_step": 55391, "epoch": 1318} {"train_loss": -5.846037864685059, "global_step": 55392, "epoch": 1318} {"train_loss": -5.835714340209961, "global_step": 55393, "epoch": 1318} {"train_loss": -5.817354202270508, "global_step": 55394, "epoch": 1318} {"train_loss": -5.795690536499023, "global_step": 55395, "epoch": 1318} {"train_loss": -5.927667617797852, "global_step": 55396, "epoch": 1318} {"train_loss": -5.8185568537030905, "global_step": 55397, "epoch": 1318, "val_loss": 66482.8515625} {"train_loss": -5.82269811630249, "global_step": 55398, "epoch": 1319} {"train_loss": -5.8031005859375, "global_step": 55399, "epoch": 1319} {"train_loss": -5.751184463500977, "global_step": 55400, "epoch": 1319} {"train_loss": -5.870572566986084, "global_step": 55401, "epoch": 1319} {"train_loss": -5.809619903564453, "global_step": 55402, "epoch": 1319} {"train_loss": -5.93588924407959, "global_step": 55403, "epoch": 1319} {"train_loss": -5.809725761413574, "global_step": 55404, "epoch": 1319} {"train_loss": -5.774407863616943, "global_step": 55405, "epoch": 1319} {"train_loss": -5.881996154785156, "global_step": 55406, "epoch": 1319} {"train_loss": -5.67539119720459, "global_step": 55407, "epoch": 1319} {"train_loss": -5.801692962646484, "global_step": 55408, "epoch": 1319} {"train_loss": -5.7974348068237305, "global_step": 55409, "epoch": 1319} {"train_loss": -5.826883316040039, "global_step": 55410, "epoch": 1319} {"train_loss": -5.836686134338379, "global_step": 55411, "epoch": 1319} {"train_loss": -5.863016605377197, "global_step": 55412, "epoch": 1319} {"train_loss": -5.824505805969238, "global_step": 55413, "epoch": 1319} {"train_loss": -5.790564060211182, "global_step": 55414, "epoch": 1319} {"train_loss": -5.733710289001465, "global_step": 55415, "epoch": 1319} {"train_loss": -5.73503303527832, "global_step": 55416, "epoch": 1319} {"train_loss": -5.795706272125244, "global_step": 55417, "epoch": 1319} {"train_loss": -5.762942314147949, "global_step": 55418, "epoch": 1319} {"train_loss": -5.704536437988281, "global_step": 55419, "epoch": 1319} {"train_loss": -5.749210357666016, "global_step": 55420, "epoch": 1319} {"train_loss": -5.867809295654297, "global_step": 55421, "epoch": 1319} {"train_loss": -5.884217739105225, "global_step": 55422, "epoch": 1319} {"train_loss": -5.773462295532227, "global_step": 55423, "epoch": 1319} {"train_loss": -5.814409255981445, "global_step": 55424, "epoch": 1319} {"train_loss": -5.9190778732299805, "global_step": 55425, "epoch": 1319} {"train_loss": -5.78256893157959, "global_step": 55426, "epoch": 1319} {"train_loss": -5.787966251373291, "global_step": 55427, "epoch": 1319} {"train_loss": -5.790884971618652, "global_step": 55428, "epoch": 1319} {"train_loss": -5.828231334686279, "global_step": 55429, "epoch": 1319} {"train_loss": -5.880394458770752, "global_step": 55430, "epoch": 1319} {"train_loss": -5.902729511260986, "global_step": 55431, "epoch": 1319} {"train_loss": -5.853254318237305, "global_step": 55432, "epoch": 1319} {"train_loss": -5.890955924987793, "global_step": 55433, "epoch": 1319} {"train_loss": -5.75828218460083, "global_step": 55434, "epoch": 1319} {"train_loss": -5.875566482543945, "global_step": 55435, "epoch": 1319} {"train_loss": -5.762393951416016, "global_step": 55436, "epoch": 1319} {"train_loss": -5.772552013397217, "global_step": 55437, "epoch": 1319} {"train_loss": -5.804967403411865, "global_step": 55438, "epoch": 1319} {"train_loss": -5.8149389652978805, "global_step": 55439, "epoch": 1319, "val_loss": 66770.515625} {"train_loss": -5.842429161071777, "global_step": 55440, "epoch": 1320} {"train_loss": -5.910175800323486, "global_step": 55441, "epoch": 1320} {"train_loss": -5.834901809692383, "global_step": 55442, "epoch": 1320} {"train_loss": -5.807310581207275, "global_step": 55443, "epoch": 1320} {"train_loss": -5.80190372467041, "global_step": 55444, "epoch": 1320} {"train_loss": -5.894138336181641, "global_step": 55445, "epoch": 1320} {"train_loss": -5.744682788848877, "global_step": 55446, "epoch": 1320} {"train_loss": -5.865347385406494, "global_step": 55447, "epoch": 1320} {"train_loss": -5.828505992889404, "global_step": 55448, "epoch": 1320} {"train_loss": -5.7940568923950195, "global_step": 55449, "epoch": 1320} {"train_loss": -5.875502586364746, "global_step": 55450, "epoch": 1320} {"train_loss": -5.788665771484375, "global_step": 55451, "epoch": 1320} {"train_loss": -5.95128059387207, "global_step": 55452, "epoch": 1320} {"train_loss": -5.777960777282715, "global_step": 55453, "epoch": 1320} {"train_loss": -5.808374404907227, "global_step": 55454, "epoch": 1320} {"train_loss": -5.738424301147461, "global_step": 55455, "epoch": 1320} {"train_loss": -5.795637130737305, "global_step": 55456, "epoch": 1320} {"train_loss": -5.84134578704834, "global_step": 55457, "epoch": 1320} {"train_loss": -5.8677825927734375, "global_step": 55458, "epoch": 1320} {"train_loss": -5.923498630523682, "global_step": 55459, "epoch": 1320} {"train_loss": -5.705681800842285, "global_step": 55460, "epoch": 1320} {"train_loss": -5.828104496002197, "global_step": 55461, "epoch": 1320} {"train_loss": -5.908971786499023, "global_step": 55462, "epoch": 1320} {"train_loss": -5.791322708129883, "global_step": 55463, "epoch": 1320} {"train_loss": -5.790449142456055, "global_step": 55464, "epoch": 1320} {"train_loss": -5.897904396057129, "global_step": 55465, "epoch": 1320} {"train_loss": -5.748297691345215, "global_step": 55466, "epoch": 1320} {"train_loss": -5.839570999145508, "global_step": 55467, "epoch": 1320} {"train_loss": -5.832209587097168, "global_step": 55468, "epoch": 1320} {"train_loss": -5.8467302322387695, "global_step": 55469, "epoch": 1320} {"train_loss": -5.832453727722168, "global_step": 55470, "epoch": 1320} {"train_loss": -5.768228530883789, "global_step": 55471, "epoch": 1320} {"train_loss": -5.83697509765625, "global_step": 55472, "epoch": 1320} {"train_loss": -5.803678512573242, "global_step": 55473, "epoch": 1320} {"train_loss": -5.951215744018555, "global_step": 55474, "epoch": 1320} {"train_loss": -5.835753440856934, "global_step": 55475, "epoch": 1320} {"train_loss": -5.739900588989258, "global_step": 55476, "epoch": 1320} {"train_loss": -5.70142936706543, "global_step": 55477, "epoch": 1320} {"train_loss": -5.868988990783691, "global_step": 55478, "epoch": 1320} {"train_loss": -5.712674140930176, "global_step": 55479, "epoch": 1320} {"train_loss": -5.922127723693848, "global_step": 55480, "epoch": 1320} {"train_loss": -5.828231062207903, "global_step": 55481, "epoch": 1320, "val_loss": 66494.4296875} {"train_loss": -5.848387718200684, "global_step": 55482, "epoch": 1321} {"train_loss": -5.906315803527832, "global_step": 55483, "epoch": 1321} {"train_loss": -5.845208168029785, "global_step": 55484, "epoch": 1321} {"train_loss": -5.745161056518555, "global_step": 55485, "epoch": 1321} {"train_loss": -5.687252521514893, "global_step": 55486, "epoch": 1321} {"train_loss": -5.96392822265625, "global_step": 55487, "epoch": 1321} {"train_loss": -5.860507488250732, "global_step": 55488, "epoch": 1321} {"train_loss": -5.799832820892334, "global_step": 55489, "epoch": 1321} {"train_loss": -5.893852710723877, "global_step": 55490, "epoch": 1321} {"train_loss": -5.820102214813232, "global_step": 55491, "epoch": 1321} {"train_loss": -5.775354385375977, "global_step": 55492, "epoch": 1321} {"train_loss": -5.818323612213135, "global_step": 55493, "epoch": 1321} {"train_loss": -5.766057014465332, "global_step": 55494, "epoch": 1321} {"train_loss": -5.783042907714844, "global_step": 55495, "epoch": 1321} {"train_loss": -5.746209621429443, "global_step": 55496, "epoch": 1321} {"train_loss": -5.810786247253418, "global_step": 55497, "epoch": 1321} {"train_loss": -5.873842239379883, "global_step": 55498, "epoch": 1321} {"train_loss": -5.909725666046143, "global_step": 55499, "epoch": 1321} {"train_loss": -5.869391441345215, "global_step": 55500, "epoch": 1321} {"train_loss": -5.797621250152588, "global_step": 55501, "epoch": 1321} {"train_loss": -5.922158241271973, "global_step": 55502, "epoch": 1321} {"train_loss": -5.870856285095215, "global_step": 55503, "epoch": 1321} {"train_loss": -5.811494827270508, "global_step": 55504, "epoch": 1321} {"train_loss": -5.76984977722168, "global_step": 55505, "epoch": 1321} {"train_loss": -5.79813289642334, "global_step": 55506, "epoch": 1321} {"train_loss": -5.940362930297852, "global_step": 55507, "epoch": 1321} {"train_loss": -5.827869892120361, "global_step": 55508, "epoch": 1321} {"train_loss": -5.774194240570068, "global_step": 55509, "epoch": 1321} {"train_loss": -5.85651969909668, "global_step": 55510, "epoch": 1321} {"train_loss": -5.825340747833252, "global_step": 55511, "epoch": 1321} {"train_loss": -5.865274429321289, "global_step": 55512, "epoch": 1321} {"train_loss": -5.871999740600586, "global_step": 55513, "epoch": 1321} {"train_loss": -5.872199058532715, "global_step": 55514, "epoch": 1321} {"train_loss": -5.894455909729004, "global_step": 55515, "epoch": 1321} {"train_loss": -5.690560340881348, "global_step": 55516, "epoch": 1321} {"train_loss": -5.713494300842285, "global_step": 55517, "epoch": 1321} {"train_loss": -5.85356330871582, "global_step": 55518, "epoch": 1321} {"train_loss": -5.773305892944336, "global_step": 55519, "epoch": 1321} {"train_loss": -5.888955116271973, "global_step": 55520, "epoch": 1321} {"train_loss": -5.899233341217041, "global_step": 55521, "epoch": 1321} {"train_loss": -5.672066688537598, "global_step": 55522, "epoch": 1321} {"train_loss": -5.82816017241705, "global_step": 55523, "epoch": 1321, "val_loss": 66825.8359375} {"train_loss": -5.733761787414551, "global_step": 55524, "epoch": 1322} {"train_loss": -5.707640647888184, "global_step": 55525, "epoch": 1322} {"train_loss": -5.795018196105957, "global_step": 55526, "epoch": 1322} {"train_loss": -5.880054473876953, "global_step": 55527, "epoch": 1322} {"train_loss": -5.779296875, "global_step": 55528, "epoch": 1322} {"train_loss": -5.796043872833252, "global_step": 55529, "epoch": 1322} {"train_loss": -5.8201189041137695, "global_step": 55530, "epoch": 1322} {"train_loss": -5.788378715515137, "global_step": 55531, "epoch": 1322} {"train_loss": -5.815646171569824, "global_step": 55532, "epoch": 1322} {"train_loss": -5.9204325675964355, "global_step": 55533, "epoch": 1322} {"train_loss": -5.801697731018066, "global_step": 55534, "epoch": 1322} {"train_loss": -5.745141983032227, "global_step": 55535, "epoch": 1322} {"train_loss": -5.798271656036377, "global_step": 55536, "epoch": 1322} {"train_loss": -5.87938117980957, "global_step": 55537, "epoch": 1322} {"train_loss": -5.884007453918457, "global_step": 55538, "epoch": 1322} {"train_loss": -5.797249794006348, "global_step": 55539, "epoch": 1322} {"train_loss": -5.940897464752197, "global_step": 55540, "epoch": 1322} {"train_loss": -5.78111457824707, "global_step": 55541, "epoch": 1322} {"train_loss": -5.900595188140869, "global_step": 55542, "epoch": 1322} {"train_loss": -5.904869079589844, "global_step": 55543, "epoch": 1322} {"train_loss": -5.718493461608887, "global_step": 55544, "epoch": 1322} {"train_loss": -5.831289291381836, "global_step": 55545, "epoch": 1322} {"train_loss": -5.957347393035889, "global_step": 55546, "epoch": 1322} {"train_loss": -5.775143623352051, "global_step": 55547, "epoch": 1322} {"train_loss": -5.843863487243652, "global_step": 55548, "epoch": 1322} {"train_loss": -5.82483434677124, "global_step": 55549, "epoch": 1322} {"train_loss": -5.810894012451172, "global_step": 55550, "epoch": 1322} {"train_loss": -5.832823753356934, "global_step": 55551, "epoch": 1322} {"train_loss": -5.7111053466796875, "global_step": 55552, "epoch": 1322} {"train_loss": -5.874329566955566, "global_step": 55553, "epoch": 1322} {"train_loss": -5.865904808044434, "global_step": 55554, "epoch": 1322} {"train_loss": -5.7158026695251465, "global_step": 55555, "epoch": 1322} {"train_loss": -5.858616828918457, "global_step": 55556, "epoch": 1322} {"train_loss": -5.764904975891113, "global_step": 55557, "epoch": 1322} {"train_loss": -5.7798871994018555, "global_step": 55558, "epoch": 1322} {"train_loss": -5.92120361328125, "global_step": 55559, "epoch": 1322} {"train_loss": -5.847818851470947, "global_step": 55560, "epoch": 1322} {"train_loss": -5.962772369384766, "global_step": 55561, "epoch": 1322} {"train_loss": -5.742254257202148, "global_step": 55562, "epoch": 1322} {"train_loss": -5.857992172241211, "global_step": 55563, "epoch": 1322} {"train_loss": -5.918951511383057, "global_step": 55564, "epoch": 1322} {"train_loss": -5.828853482291812, "global_step": 55565, "epoch": 1322, "val_loss": 66687.21875} {"train_loss": -5.825737476348877, "global_step": 55566, "epoch": 1323} {"train_loss": -5.737908363342285, "global_step": 55567, "epoch": 1323} {"train_loss": -5.953434944152832, "global_step": 55568, "epoch": 1323} {"train_loss": -5.779181957244873, "global_step": 55569, "epoch": 1323} {"train_loss": -5.853089809417725, "global_step": 55570, "epoch": 1323} {"train_loss": -5.822762966156006, "global_step": 55571, "epoch": 1323} {"train_loss": -5.706330299377441, "global_step": 55572, "epoch": 1323} {"train_loss": -5.880514144897461, "global_step": 55573, "epoch": 1323} {"train_loss": -5.850661277770996, "global_step": 55574, "epoch": 1323} {"train_loss": -5.842596054077148, "global_step": 55575, "epoch": 1323} {"train_loss": -5.649627208709717, "global_step": 55576, "epoch": 1323} {"train_loss": -5.783923625946045, "global_step": 55577, "epoch": 1323} {"train_loss": -5.846662998199463, "global_step": 55578, "epoch": 1323} {"train_loss": -5.826142311096191, "global_step": 55579, "epoch": 1323} {"train_loss": -5.84779167175293, "global_step": 55580, "epoch": 1323} {"train_loss": -5.715269565582275, "global_step": 55581, "epoch": 1323} {"train_loss": -5.867019176483154, "global_step": 55582, "epoch": 1323} {"train_loss": -5.830732822418213, "global_step": 55583, "epoch": 1323} {"train_loss": -5.711440086364746, "global_step": 55584, "epoch": 1323} {"train_loss": -5.734023571014404, "global_step": 55585, "epoch": 1323} {"train_loss": -5.788103103637695, "global_step": 55586, "epoch": 1323} {"train_loss": -5.769844055175781, "global_step": 55587, "epoch": 1323} {"train_loss": -5.810171127319336, "global_step": 55588, "epoch": 1323} {"train_loss": -5.82758903503418, "global_step": 55589, "epoch": 1323} {"train_loss": -5.794826507568359, "global_step": 55590, "epoch": 1323} {"train_loss": -5.830223083496094, "global_step": 55591, "epoch": 1323} {"train_loss": -5.828123092651367, "global_step": 55592, "epoch": 1323} {"train_loss": -5.869645595550537, "global_step": 55593, "epoch": 1323} {"train_loss": -5.819101333618164, "global_step": 55594, "epoch": 1323} {"train_loss": -5.82349967956543, "global_step": 55595, "epoch": 1323} {"train_loss": -5.737066268920898, "global_step": 55596, "epoch": 1323} {"train_loss": -5.780448913574219, "global_step": 55597, "epoch": 1323} {"train_loss": -5.862987518310547, "global_step": 55598, "epoch": 1323} {"train_loss": -5.696134567260742, "global_step": 55599, "epoch": 1323} {"train_loss": -5.971580505371094, "global_step": 55600, "epoch": 1323} {"train_loss": -5.773819923400879, "global_step": 55601, "epoch": 1323} {"train_loss": -5.903033256530762, "global_step": 55602, "epoch": 1323} {"train_loss": -5.784188270568848, "global_step": 55603, "epoch": 1323} {"train_loss": -5.84543514251709, "global_step": 55604, "epoch": 1323} {"train_loss": -5.778417110443115, "global_step": 55605, "epoch": 1323} {"train_loss": -5.909659385681152, "global_step": 55606, "epoch": 1323} {"train_loss": -5.808994667870658, "global_step": 55607, "epoch": 1323, "val_loss": 66589.234375} {"train_loss": -5.757150173187256, "global_step": 55608, "epoch": 1324} {"train_loss": -5.749539375305176, "global_step": 55609, "epoch": 1324} {"train_loss": -5.735984802246094, "global_step": 55610, "epoch": 1324} {"train_loss": -5.8377485275268555, "global_step": 55611, "epoch": 1324} {"train_loss": -5.7343597412109375, "global_step": 55612, "epoch": 1324} {"train_loss": -5.798681735992432, "global_step": 55613, "epoch": 1324} {"train_loss": -5.718421936035156, "global_step": 55614, "epoch": 1324} {"train_loss": -5.910115718841553, "global_step": 55615, "epoch": 1324} {"train_loss": -5.811766624450684, "global_step": 55616, "epoch": 1324} {"train_loss": -5.815184116363525, "global_step": 55617, "epoch": 1324} {"train_loss": -5.750456809997559, "global_step": 55618, "epoch": 1324} {"train_loss": -5.679471015930176, "global_step": 55619, "epoch": 1324} {"train_loss": -5.724453926086426, "global_step": 55620, "epoch": 1324} {"train_loss": -5.815866947174072, "global_step": 55621, "epoch": 1324} {"train_loss": -5.73085355758667, "global_step": 55622, "epoch": 1324} {"train_loss": -5.8976593017578125, "global_step": 55623, "epoch": 1324} {"train_loss": -5.717799663543701, "global_step": 55624, "epoch": 1324} {"train_loss": -5.8409743309021, "global_step": 55625, "epoch": 1324} {"train_loss": -5.885578155517578, "global_step": 55626, "epoch": 1324} {"train_loss": -5.724483966827393, "global_step": 55627, "epoch": 1324} {"train_loss": -5.872440338134766, "global_step": 55628, "epoch": 1324} {"train_loss": -5.850578308105469, "global_step": 55629, "epoch": 1324} {"train_loss": -5.762502670288086, "global_step": 55630, "epoch": 1324} {"train_loss": -5.7833251953125, "global_step": 55631, "epoch": 1324} {"train_loss": -5.762346267700195, "global_step": 55632, "epoch": 1324} {"train_loss": -5.845439910888672, "global_step": 55633, "epoch": 1324} {"train_loss": -5.686102390289307, "global_step": 55634, "epoch": 1324} {"train_loss": -5.841242790222168, "global_step": 55635, "epoch": 1324} {"train_loss": -5.741459369659424, "global_step": 55636, "epoch": 1324} {"train_loss": -5.841580390930176, "global_step": 55637, "epoch": 1324} {"train_loss": -5.94403076171875, "global_step": 55638, "epoch": 1324} {"train_loss": -5.734491348266602, "global_step": 55639, "epoch": 1324} {"train_loss": -5.788544178009033, "global_step": 55640, "epoch": 1324} {"train_loss": -5.709086894989014, "global_step": 55641, "epoch": 1324} {"train_loss": -5.641888618469238, "global_step": 55642, "epoch": 1324} {"train_loss": -5.830145835876465, "global_step": 55643, "epoch": 1324} {"train_loss": -5.738081455230713, "global_step": 55644, "epoch": 1324} {"train_loss": -5.867950439453125, "global_step": 55645, "epoch": 1324} {"train_loss": -5.92357063293457, "global_step": 55646, "epoch": 1324} {"train_loss": -5.811214447021484, "global_step": 55647, "epoch": 1324} {"train_loss": -5.763543605804443, "global_step": 55648, "epoch": 1324} {"train_loss": -5.791560786111014, "global_step": 55649, "epoch": 1324, "val_loss": 66684.328125} {"train_loss": -5.761751174926758, "global_step": 55650, "epoch": 1325} {"train_loss": -5.69726037979126, "global_step": 55651, "epoch": 1325} {"train_loss": -5.875903129577637, "global_step": 55652, "epoch": 1325} {"train_loss": -5.694091796875, "global_step": 55653, "epoch": 1325} {"train_loss": -5.763548851013184, "global_step": 55654, "epoch": 1325} {"train_loss": -5.834855556488037, "global_step": 55655, "epoch": 1325} {"train_loss": -5.742127418518066, "global_step": 55656, "epoch": 1325} {"train_loss": -5.813786506652832, "global_step": 55657, "epoch": 1325} {"train_loss": -5.912343978881836, "global_step": 55658, "epoch": 1325} {"train_loss": -5.79337739944458, "global_step": 55659, "epoch": 1325} {"train_loss": -5.814791679382324, "global_step": 55660, "epoch": 1325} {"train_loss": -5.7956953048706055, "global_step": 55661, "epoch": 1325} {"train_loss": -5.690021991729736, "global_step": 55662, "epoch": 1325} {"train_loss": -5.866536617279053, "global_step": 55663, "epoch": 1325} {"train_loss": -5.7021918296813965, "global_step": 55664, "epoch": 1325} {"train_loss": -5.77347993850708, "global_step": 55665, "epoch": 1325} {"train_loss": -5.840437889099121, "global_step": 55666, "epoch": 1325} {"train_loss": -5.875732421875, "global_step": 55667, "epoch": 1325} {"train_loss": -5.85007905960083, "global_step": 55668, "epoch": 1325} {"train_loss": -5.9092912673950195, "global_step": 55669, "epoch": 1325} {"train_loss": -5.845622539520264, "global_step": 55670, "epoch": 1325} {"train_loss": -5.879349708557129, "global_step": 55671, "epoch": 1325} {"train_loss": -5.845634460449219, "global_step": 55672, "epoch": 1325} {"train_loss": -5.948277473449707, "global_step": 55673, "epoch": 1325} {"train_loss": -5.788122177124023, "global_step": 55674, "epoch": 1325} {"train_loss": -5.879731178283691, "global_step": 55675, "epoch": 1325} {"train_loss": -5.734444618225098, "global_step": 55676, "epoch": 1325} {"train_loss": -5.707406044006348, "global_step": 55677, "epoch": 1325} {"train_loss": -5.856749057769775, "global_step": 55678, "epoch": 1325} {"train_loss": -5.933493614196777, "global_step": 55679, "epoch": 1325} {"train_loss": -5.959953784942627, "global_step": 55680, "epoch": 1325} {"train_loss": -5.855628490447998, "global_step": 55681, "epoch": 1325} {"train_loss": -5.83227014541626, "global_step": 55682, "epoch": 1325} {"train_loss": -5.900684356689453, "global_step": 55683, "epoch": 1325} {"train_loss": -5.900888919830322, "global_step": 55684, "epoch": 1325} {"train_loss": -5.810905456542969, "global_step": 55685, "epoch": 1325} {"train_loss": -5.900126934051514, "global_step": 55686, "epoch": 1325} {"train_loss": -5.818309307098389, "global_step": 55687, "epoch": 1325} {"train_loss": -5.849462509155273, "global_step": 55688, "epoch": 1325} {"train_loss": -5.710805892944336, "global_step": 55689, "epoch": 1325} {"train_loss": -5.843646049499512, "global_step": 55690, "epoch": 1325} {"train_loss": -5.8231527124132425, "global_step": 55691, "epoch": 1325, "val_loss": 66323.6171875} {"train_loss": -5.789529323577881, "global_step": 55692, "epoch": 1326} {"train_loss": -5.925812721252441, "global_step": 55693, "epoch": 1326} {"train_loss": -5.780232906341553, "global_step": 55694, "epoch": 1326} {"train_loss": -5.789266586303711, "global_step": 55695, "epoch": 1326} {"train_loss": -5.877556800842285, "global_step": 55696, "epoch": 1326} {"train_loss": -5.719545364379883, "global_step": 55697, "epoch": 1326} {"train_loss": -5.843564033508301, "global_step": 55698, "epoch": 1326} {"train_loss": -5.870028495788574, "global_step": 55699, "epoch": 1326} {"train_loss": -5.7530012130737305, "global_step": 55700, "epoch": 1326} {"train_loss": -5.809725761413574, "global_step": 55701, "epoch": 1326} {"train_loss": -5.8125457763671875, "global_step": 55702, "epoch": 1326} {"train_loss": -5.77941370010376, "global_step": 55703, "epoch": 1326} {"train_loss": -5.841910362243652, "global_step": 55704, "epoch": 1326} {"train_loss": -5.832468032836914, "global_step": 55705, "epoch": 1326} {"train_loss": -5.84183931350708, "global_step": 55706, "epoch": 1326} {"train_loss": -5.726603031158447, "global_step": 55707, "epoch": 1326} {"train_loss": -5.868829727172852, "global_step": 55708, "epoch": 1326} {"train_loss": -5.83002233505249, "global_step": 55709, "epoch": 1326} {"train_loss": -5.846689701080322, "global_step": 55710, "epoch": 1326} {"train_loss": -5.818133354187012, "global_step": 55711, "epoch": 1326} {"train_loss": -5.814349174499512, "global_step": 55712, "epoch": 1326} {"train_loss": -5.719329833984375, "global_step": 55713, "epoch": 1326} {"train_loss": -5.91656494140625, "global_step": 55714, "epoch": 1326} {"train_loss": -5.762991905212402, "global_step": 55715, "epoch": 1326} {"train_loss": -5.882819175720215, "global_step": 55716, "epoch": 1326} {"train_loss": -5.651435375213623, "global_step": 55717, "epoch": 1326} {"train_loss": -5.7918548583984375, "global_step": 55718, "epoch": 1326} {"train_loss": -5.917750835418701, "global_step": 55719, "epoch": 1326} {"train_loss": -5.869292259216309, "global_step": 55720, "epoch": 1326} {"train_loss": -5.804469108581543, "global_step": 55721, "epoch": 1326} {"train_loss": -5.845022678375244, "global_step": 55722, "epoch": 1326} {"train_loss": -5.865442752838135, "global_step": 55723, "epoch": 1326} {"train_loss": -5.81882381439209, "global_step": 55724, "epoch": 1326} {"train_loss": -5.767891883850098, "global_step": 55725, "epoch": 1326} {"train_loss": -5.787579536437988, "global_step": 55726, "epoch": 1326} {"train_loss": -5.786890983581543, "global_step": 55727, "epoch": 1326} {"train_loss": -5.836346626281738, "global_step": 55728, "epoch": 1326} {"train_loss": -5.689446449279785, "global_step": 55729, "epoch": 1326} {"train_loss": -5.766944885253906, "global_step": 55730, "epoch": 1326} {"train_loss": -5.720503807067871, "global_step": 55731, "epoch": 1326} {"train_loss": -5.702816963195801, "global_step": 55732, "epoch": 1326} {"train_loss": -5.80920349983942, "global_step": 55733, "epoch": 1326, "val_loss": 66644.0078125} {"train_loss": -5.933384895324707, "global_step": 55734, "epoch": 1327} {"train_loss": -5.710028648376465, "global_step": 55735, "epoch": 1327} {"train_loss": -5.778959274291992, "global_step": 55736, "epoch": 1327} {"train_loss": -5.826436996459961, "global_step": 55737, "epoch": 1327} {"train_loss": -5.732968807220459, "global_step": 55738, "epoch": 1327} {"train_loss": -5.871241569519043, "global_step": 55739, "epoch": 1327} {"train_loss": -5.841858863830566, "global_step": 55740, "epoch": 1327} {"train_loss": -5.931483268737793, "global_step": 55741, "epoch": 1327} {"train_loss": -5.882367134094238, "global_step": 55742, "epoch": 1327} {"train_loss": -5.916013240814209, "global_step": 55743, "epoch": 1327} {"train_loss": -5.777176856994629, "global_step": 55744, "epoch": 1327} {"train_loss": -5.844046592712402, "global_step": 55745, "epoch": 1327} {"train_loss": -5.8639726638793945, "global_step": 55746, "epoch": 1327} {"train_loss": -5.85570764541626, "global_step": 55747, "epoch": 1327} {"train_loss": -5.822640419006348, "global_step": 55748, "epoch": 1327} {"train_loss": -5.80179500579834, "global_step": 55749, "epoch": 1327} {"train_loss": -5.706207275390625, "global_step": 55750, "epoch": 1327} {"train_loss": -5.799603462219238, "global_step": 55751, "epoch": 1327} {"train_loss": -5.70991849899292, "global_step": 55752, "epoch": 1327} {"train_loss": -5.81562614440918, "global_step": 55753, "epoch": 1327} {"train_loss": -5.929520606994629, "global_step": 55754, "epoch": 1327} {"train_loss": -5.891392707824707, "global_step": 55755, "epoch": 1327} {"train_loss": -5.75767707824707, "global_step": 55756, "epoch": 1327} {"train_loss": -5.916326522827148, "global_step": 55757, "epoch": 1327} {"train_loss": -5.755524158477783, "global_step": 55758, "epoch": 1327} {"train_loss": -5.720909118652344, "global_step": 55759, "epoch": 1327} {"train_loss": -5.902705192565918, "global_step": 55760, "epoch": 1327} {"train_loss": -5.831723690032959, "global_step": 55761, "epoch": 1327} {"train_loss": -5.900453567504883, "global_step": 55762, "epoch": 1327} {"train_loss": -5.837386131286621, "global_step": 55763, "epoch": 1327} {"train_loss": -5.803896903991699, "global_step": 55764, "epoch": 1327} {"train_loss": -5.84775447845459, "global_step": 55765, "epoch": 1327} {"train_loss": -5.796718120574951, "global_step": 55766, "epoch": 1327} {"train_loss": -5.820497512817383, "global_step": 55767, "epoch": 1327} {"train_loss": -5.814544200897217, "global_step": 55768, "epoch": 1327} {"train_loss": -5.84419059753418, "global_step": 55769, "epoch": 1327} {"train_loss": -5.835977554321289, "global_step": 55770, "epoch": 1327} {"train_loss": -5.810140609741211, "global_step": 55771, "epoch": 1327} {"train_loss": -5.728811740875244, "global_step": 55772, "epoch": 1327} {"train_loss": -5.780533790588379, "global_step": 55773, "epoch": 1327} {"train_loss": -5.837264060974121, "global_step": 55774, "epoch": 1327} {"train_loss": -5.823458830515544, "global_step": 55775, "epoch": 1327, "val_loss": 66399.515625} {"train_loss": -5.968652248382568, "global_step": 55776, "epoch": 1328} {"train_loss": -5.895443916320801, "global_step": 55777, "epoch": 1328} {"train_loss": -5.657136917114258, "global_step": 55778, "epoch": 1328} {"train_loss": -5.849887847900391, "global_step": 55779, "epoch": 1328} {"train_loss": -5.855839729309082, "global_step": 55780, "epoch": 1328} {"train_loss": -5.8109941482543945, "global_step": 55781, "epoch": 1328} {"train_loss": -5.780176162719727, "global_step": 55782, "epoch": 1328} {"train_loss": -5.810359954833984, "global_step": 55783, "epoch": 1328} {"train_loss": -5.8098039627075195, "global_step": 55784, "epoch": 1328} {"train_loss": -5.780035972595215, "global_step": 55785, "epoch": 1328} {"train_loss": -5.879582405090332, "global_step": 55786, "epoch": 1328} {"train_loss": -5.915839195251465, "global_step": 55787, "epoch": 1328} {"train_loss": -5.763023376464844, "global_step": 55788, "epoch": 1328} {"train_loss": -5.764410972595215, "global_step": 55789, "epoch": 1328} {"train_loss": -5.846347808837891, "global_step": 55790, "epoch": 1328} {"train_loss": -5.845597267150879, "global_step": 55791, "epoch": 1328} {"train_loss": -5.752930164337158, "global_step": 55792, "epoch": 1328} {"train_loss": -5.697192668914795, "global_step": 55793, "epoch": 1328} {"train_loss": -5.874666690826416, "global_step": 55794, "epoch": 1328} {"train_loss": -5.9212870597839355, "global_step": 55795, "epoch": 1328} {"train_loss": -5.807165145874023, "global_step": 55796, "epoch": 1328} {"train_loss": -5.700589656829834, "global_step": 55797, "epoch": 1328} {"train_loss": -5.865470886230469, "global_step": 55798, "epoch": 1328} {"train_loss": -5.71597957611084, "global_step": 55799, "epoch": 1328} {"train_loss": -5.84903621673584, "global_step": 55800, "epoch": 1328} {"train_loss": -5.835414886474609, "global_step": 55801, "epoch": 1328} {"train_loss": -5.8010125160217285, "global_step": 55802, "epoch": 1328} {"train_loss": -5.743682861328125, "global_step": 55803, "epoch": 1328} {"train_loss": -5.789951324462891, "global_step": 55804, "epoch": 1328} {"train_loss": -5.926115989685059, "global_step": 55805, "epoch": 1328} {"train_loss": -5.9012041091918945, "global_step": 55806, "epoch": 1328} {"train_loss": -5.8602399826049805, "global_step": 55807, "epoch": 1328} {"train_loss": -5.7155070304870605, "global_step": 55808, "epoch": 1328} {"train_loss": -5.888952255249023, "global_step": 55809, "epoch": 1328} {"train_loss": -5.858986854553223, "global_step": 55810, "epoch": 1328} {"train_loss": -5.777608871459961, "global_step": 55811, "epoch": 1328} {"train_loss": -5.893054008483887, "global_step": 55812, "epoch": 1328} {"train_loss": -5.831711769104004, "global_step": 55813, "epoch": 1328} {"train_loss": -5.838846683502197, "global_step": 55814, "epoch": 1328} {"train_loss": -5.7787628173828125, "global_step": 55815, "epoch": 1328} {"train_loss": -5.728143215179443, "global_step": 55816, "epoch": 1328} {"train_loss": -5.821880772000267, "global_step": 55817, "epoch": 1328, "val_loss": 66369.1484375} {"train_loss": -5.925011157989502, "global_step": 55818, "epoch": 1329} {"train_loss": -5.885966777801514, "global_step": 55819, "epoch": 1329} {"train_loss": -5.943437099456787, "global_step": 55820, "epoch": 1329} {"train_loss": -5.788061618804932, "global_step": 55821, "epoch": 1329} {"train_loss": -5.915976524353027, "global_step": 55822, "epoch": 1329} {"train_loss": -5.834972381591797, "global_step": 55823, "epoch": 1329} {"train_loss": -5.783493995666504, "global_step": 55824, "epoch": 1329} {"train_loss": -5.785730361938477, "global_step": 55825, "epoch": 1329} {"train_loss": -5.886109352111816, "global_step": 55826, "epoch": 1329} {"train_loss": -5.835961818695068, "global_step": 55827, "epoch": 1329} {"train_loss": -5.88710355758667, "global_step": 55828, "epoch": 1329} {"train_loss": -5.787993907928467, "global_step": 55829, "epoch": 1329} {"train_loss": -5.812185764312744, "global_step": 55830, "epoch": 1329} {"train_loss": -5.738386631011963, "global_step": 55831, "epoch": 1329} {"train_loss": -5.723380088806152, "global_step": 55832, "epoch": 1329} {"train_loss": -5.757729530334473, "global_step": 55833, "epoch": 1329} {"train_loss": -5.805851459503174, "global_step": 55834, "epoch": 1329} {"train_loss": -5.810230255126953, "global_step": 55835, "epoch": 1329} {"train_loss": -5.792548656463623, "global_step": 55836, "epoch": 1329} {"train_loss": -5.854725360870361, "global_step": 55837, "epoch": 1329} {"train_loss": -5.894779682159424, "global_step": 55838, "epoch": 1329} {"train_loss": -5.835491180419922, "global_step": 55839, "epoch": 1329} {"train_loss": -5.827898979187012, "global_step": 55840, "epoch": 1329} {"train_loss": -5.973413467407227, "global_step": 55841, "epoch": 1329} {"train_loss": -5.851361274719238, "global_step": 55842, "epoch": 1329} {"train_loss": -5.866700172424316, "global_step": 55843, "epoch": 1329} {"train_loss": -5.857145309448242, "global_step": 55844, "epoch": 1329} {"train_loss": -5.806546211242676, "global_step": 55845, "epoch": 1329} {"train_loss": -5.784232139587402, "global_step": 55846, "epoch": 1329} {"train_loss": -5.795707702636719, "global_step": 55847, "epoch": 1329} {"train_loss": -5.885114669799805, "global_step": 55848, "epoch": 1329} {"train_loss": -5.762416839599609, "global_step": 55849, "epoch": 1329} {"train_loss": -5.895873069763184, "global_step": 55850, "epoch": 1329} {"train_loss": -5.866457939147949, "global_step": 55851, "epoch": 1329} {"train_loss": -5.784569263458252, "global_step": 55852, "epoch": 1329} {"train_loss": -5.922728538513184, "global_step": 55853, "epoch": 1329} {"train_loss": -5.826157569885254, "global_step": 55854, "epoch": 1329} {"train_loss": -5.763676166534424, "global_step": 55855, "epoch": 1329} {"train_loss": -5.869410037994385, "global_step": 55856, "epoch": 1329} {"train_loss": -5.816808700561523, "global_step": 55857, "epoch": 1329} {"train_loss": -5.736141204833984, "global_step": 55858, "epoch": 1329} {"train_loss": -5.831350440070743, "global_step": 55859, "epoch": 1329, "val_loss": 66592.09375} {"train_loss": -5.933161735534668, "global_step": 55860, "epoch": 1330} {"train_loss": -5.797994613647461, "global_step": 55861, "epoch": 1330} {"train_loss": -5.914114475250244, "global_step": 55862, "epoch": 1330} {"train_loss": -5.838024139404297, "global_step": 55863, "epoch": 1330} {"train_loss": -5.834863662719727, "global_step": 55864, "epoch": 1330} {"train_loss": -5.82628870010376, "global_step": 55865, "epoch": 1330} {"train_loss": -5.939239025115967, "global_step": 55866, "epoch": 1330} {"train_loss": -5.679300308227539, "global_step": 55867, "epoch": 1330} {"train_loss": -5.718886852264404, "global_step": 55868, "epoch": 1330} {"train_loss": -5.865017890930176, "global_step": 55869, "epoch": 1330} {"train_loss": -5.695159912109375, "global_step": 55870, "epoch": 1330} {"train_loss": -5.8139543533325195, "global_step": 55871, "epoch": 1330} {"train_loss": -5.922635078430176, "global_step": 55872, "epoch": 1330} {"train_loss": -5.726597785949707, "global_step": 55873, "epoch": 1330} {"train_loss": -5.831415176391602, "global_step": 55874, "epoch": 1330} {"train_loss": -5.84173583984375, "global_step": 55875, "epoch": 1330} {"train_loss": -5.802412986755371, "global_step": 55876, "epoch": 1330} {"train_loss": -5.859926223754883, "global_step": 55877, "epoch": 1330} {"train_loss": -5.884410858154297, "global_step": 55878, "epoch": 1330} {"train_loss": -5.821727752685547, "global_step": 55879, "epoch": 1330} {"train_loss": -5.781578540802002, "global_step": 55880, "epoch": 1330} {"train_loss": -5.86055850982666, "global_step": 55881, "epoch": 1330} {"train_loss": -5.877342224121094, "global_step": 55882, "epoch": 1330} {"train_loss": -5.913459300994873, "global_step": 55883, "epoch": 1330} {"train_loss": -5.9184770584106445, "global_step": 55884, "epoch": 1330} {"train_loss": -5.760965347290039, "global_step": 55885, "epoch": 1330} {"train_loss": -5.769106864929199, "global_step": 55886, "epoch": 1330} {"train_loss": -5.738190650939941, "global_step": 55887, "epoch": 1330} {"train_loss": -5.915491104125977, "global_step": 55888, "epoch": 1330} {"train_loss": -5.901902675628662, "global_step": 55889, "epoch": 1330} {"train_loss": -5.827052116394043, "global_step": 55890, "epoch": 1330} {"train_loss": -5.779809951782227, "global_step": 55891, "epoch": 1330} {"train_loss": -5.784939765930176, "global_step": 55892, "epoch": 1330} {"train_loss": -5.883166790008545, "global_step": 55893, "epoch": 1330} {"train_loss": -5.866922378540039, "global_step": 55894, "epoch": 1330} {"train_loss": -5.8012542724609375, "global_step": 55895, "epoch": 1330} {"train_loss": -5.853461742401123, "global_step": 55896, "epoch": 1330} {"train_loss": -5.822531223297119, "global_step": 55897, "epoch": 1330} {"train_loss": -5.895405292510986, "global_step": 55898, "epoch": 1330} {"train_loss": -5.883735656738281, "global_step": 55899, "epoch": 1330} {"train_loss": -5.930787086486816, "global_step": 55900, "epoch": 1330} {"train_loss": -5.83743337222508, "global_step": 55901, "epoch": 1330, "val_loss": 66376.0546875} {"train_loss": -5.799342155456543, "global_step": 55902, "epoch": 1331} {"train_loss": -5.795226097106934, "global_step": 55903, "epoch": 1331} {"train_loss": -6.004818916320801, "global_step": 55904, "epoch": 1331} {"train_loss": -5.875328063964844, "global_step": 55905, "epoch": 1331} {"train_loss": -5.954132080078125, "global_step": 55906, "epoch": 1331} {"train_loss": -5.803518295288086, "global_step": 55907, "epoch": 1331} {"train_loss": -5.782684326171875, "global_step": 55908, "epoch": 1331} {"train_loss": -5.924331188201904, "global_step": 55909, "epoch": 1331} {"train_loss": -5.889508247375488, "global_step": 55910, "epoch": 1331} {"train_loss": -5.847891807556152, "global_step": 55911, "epoch": 1331} {"train_loss": -5.967401027679443, "global_step": 55912, "epoch": 1331} {"train_loss": -5.859640121459961, "global_step": 55913, "epoch": 1331} {"train_loss": -5.72016716003418, "global_step": 55914, "epoch": 1331} {"train_loss": -5.802164077758789, "global_step": 55915, "epoch": 1331} {"train_loss": -5.841562271118164, "global_step": 55916, "epoch": 1331} {"train_loss": -5.900747299194336, "global_step": 55917, "epoch": 1331} {"train_loss": -5.820919036865234, "global_step": 55918, "epoch": 1331} {"train_loss": -5.961277961730957, "global_step": 55919, "epoch": 1331} {"train_loss": -5.760555267333984, "global_step": 55920, "epoch": 1331} {"train_loss": -5.853168964385986, "global_step": 55921, "epoch": 1331} {"train_loss": -5.754254341125488, "global_step": 55922, "epoch": 1331} {"train_loss": -5.857592582702637, "global_step": 55923, "epoch": 1331} {"train_loss": -5.844943046569824, "global_step": 55924, "epoch": 1331} {"train_loss": -5.890371322631836, "global_step": 55925, "epoch": 1331} {"train_loss": -5.860128402709961, "global_step": 55926, "epoch": 1331} {"train_loss": -5.891602516174316, "global_step": 55927, "epoch": 1331} {"train_loss": -5.805724143981934, "global_step": 55928, "epoch": 1331} {"train_loss": -5.831294536590576, "global_step": 55929, "epoch": 1331} {"train_loss": -5.901783466339111, "global_step": 55930, "epoch": 1331} {"train_loss": -5.893494606018066, "global_step": 55931, "epoch": 1331} {"train_loss": -5.901741981506348, "global_step": 55932, "epoch": 1331} {"train_loss": -5.799004554748535, "global_step": 55933, "epoch": 1331} {"train_loss": -5.866443634033203, "global_step": 55934, "epoch": 1331} {"train_loss": -5.715532302856445, "global_step": 55935, "epoch": 1331} {"train_loss": -5.921769142150879, "global_step": 55936, "epoch": 1331} {"train_loss": -5.879094123840332, "global_step": 55937, "epoch": 1331} {"train_loss": -5.820980072021484, "global_step": 55938, "epoch": 1331} {"train_loss": -5.847051620483398, "global_step": 55939, "epoch": 1331} {"train_loss": -5.867573261260986, "global_step": 55940, "epoch": 1331} {"train_loss": -5.900598526000977, "global_step": 55941, "epoch": 1331} {"train_loss": -5.732198238372803, "global_step": 55942, "epoch": 1331} {"train_loss": -5.851841790335519, "global_step": 55943, "epoch": 1331, "val_loss": 66366.0625} {"train_loss": -5.956914901733398, "global_step": 55944, "epoch": 1332} {"train_loss": -5.900984287261963, "global_step": 55945, "epoch": 1332} {"train_loss": -5.798454284667969, "global_step": 55946, "epoch": 1332} {"train_loss": -5.857390403747559, "global_step": 55947, "epoch": 1332} {"train_loss": -5.929447174072266, "global_step": 55948, "epoch": 1332} {"train_loss": -5.967827796936035, "global_step": 55949, "epoch": 1332} {"train_loss": -5.904447555541992, "global_step": 55950, "epoch": 1332} {"train_loss": -5.923464298248291, "global_step": 55951, "epoch": 1332} {"train_loss": -5.844303131103516, "global_step": 55952, "epoch": 1332} {"train_loss": -5.821214199066162, "global_step": 55953, "epoch": 1332} {"train_loss": -5.860757827758789, "global_step": 55954, "epoch": 1332} {"train_loss": -5.846219062805176, "global_step": 55955, "epoch": 1332} {"train_loss": -6.004668235778809, "global_step": 55956, "epoch": 1332} {"train_loss": -5.9373779296875, "global_step": 55957, "epoch": 1332} {"train_loss": -5.9543232917785645, "global_step": 55958, "epoch": 1332} {"train_loss": -5.896282196044922, "global_step": 55959, "epoch": 1332} {"train_loss": -5.806177139282227, "global_step": 55960, "epoch": 1332} {"train_loss": -5.744732856750488, "global_step": 55961, "epoch": 1332} {"train_loss": -5.808964729309082, "global_step": 55962, "epoch": 1332} {"train_loss": -5.881253719329834, "global_step": 55963, "epoch": 1332} {"train_loss": -5.80766487121582, "global_step": 55964, "epoch": 1332} {"train_loss": -5.846648216247559, "global_step": 55965, "epoch": 1332} {"train_loss": -5.811866283416748, "global_step": 55966, "epoch": 1332} {"train_loss": -5.967978477478027, "global_step": 55967, "epoch": 1332} {"train_loss": -5.730974197387695, "global_step": 55968, "epoch": 1332} {"train_loss": -5.863029479980469, "global_step": 55969, "epoch": 1332} {"train_loss": -5.799405097961426, "global_step": 55970, "epoch": 1332} {"train_loss": -5.936201095581055, "global_step": 55971, "epoch": 1332} {"train_loss": -5.7772040367126465, "global_step": 55972, "epoch": 1332} {"train_loss": -5.735698223114014, "global_step": 55973, "epoch": 1332} {"train_loss": -5.742103099822998, "global_step": 55974, "epoch": 1332} {"train_loss": -5.927833557128906, "global_step": 55975, "epoch": 1332} {"train_loss": -5.94170618057251, "global_step": 55976, "epoch": 1332} {"train_loss": -5.793389797210693, "global_step": 55977, "epoch": 1332} {"train_loss": -5.7704267501831055, "global_step": 55978, "epoch": 1332} {"train_loss": -5.787690162658691, "global_step": 55979, "epoch": 1332} {"train_loss": -5.737678527832031, "global_step": 55980, "epoch": 1332} {"train_loss": -5.8766188621521, "global_step": 55981, "epoch": 1332} {"train_loss": -5.668543815612793, "global_step": 55982, "epoch": 1332} {"train_loss": -5.837812423706055, "global_step": 55983, "epoch": 1332} {"train_loss": -5.836064338684082, "global_step": 55984, "epoch": 1332} {"train_loss": -5.849650473821731, "global_step": 55985, "epoch": 1332, "val_loss": 66477.2109375} {"train_loss": -5.8371381759643555, "global_step": 55986, "epoch": 1333} {"train_loss": -5.745479106903076, "global_step": 55987, "epoch": 1333} {"train_loss": -5.905005931854248, "global_step": 55988, "epoch": 1333} {"train_loss": -5.895776271820068, "global_step": 55989, "epoch": 1333} {"train_loss": -5.732415676116943, "global_step": 55990, "epoch": 1333} {"train_loss": -6.004828929901123, "global_step": 55991, "epoch": 1333} {"train_loss": -5.736079216003418, "global_step": 55992, "epoch": 1333} {"train_loss": -5.79572057723999, "global_step": 55993, "epoch": 1333} {"train_loss": -5.892131805419922, "global_step": 55994, "epoch": 1333} {"train_loss": -5.920586109161377, "global_step": 55995, "epoch": 1333} {"train_loss": -5.807755470275879, "global_step": 55996, "epoch": 1333} {"train_loss": -5.846316814422607, "global_step": 55997, "epoch": 1333} {"train_loss": -5.925841808319092, "global_step": 55998, "epoch": 1333} {"train_loss": -5.830517768859863, "global_step": 55999, "epoch": 1333} {"train_loss": -5.8410444259643555, "global_step": 56000, "epoch": 1333} {"train_loss": -5.93306827545166, "global_step": 56001, "epoch": 1333} {"train_loss": -5.820517539978027, "global_step": 56002, "epoch": 1333} {"train_loss": -5.943614959716797, "global_step": 56003, "epoch": 1333} {"train_loss": -5.858532428741455, "global_step": 56004, "epoch": 1333} {"train_loss": -5.787052154541016, "global_step": 56005, "epoch": 1333} {"train_loss": -5.9374237060546875, "global_step": 56006, "epoch": 1333} {"train_loss": -5.8260884284973145, "global_step": 56007, "epoch": 1333} {"train_loss": -5.827073097229004, "global_step": 56008, "epoch": 1333} {"train_loss": -5.759941577911377, "global_step": 56009, "epoch": 1333} {"train_loss": -5.75809383392334, "global_step": 56010, "epoch": 1333} {"train_loss": -5.925609111785889, "global_step": 56011, "epoch": 1333} {"train_loss": -5.707233428955078, "global_step": 56012, "epoch": 1333} {"train_loss": -5.795601844787598, "global_step": 56013, "epoch": 1333} {"train_loss": -5.8975372314453125, "global_step": 56014, "epoch": 1333} {"train_loss": -5.852298736572266, "global_step": 56015, "epoch": 1333} {"train_loss": -5.790038108825684, "global_step": 56016, "epoch": 1333} {"train_loss": -5.843021869659424, "global_step": 56017, "epoch": 1333} {"train_loss": -5.7861762046813965, "global_step": 56018, "epoch": 1333} {"train_loss": -5.929801940917969, "global_step": 56019, "epoch": 1333} {"train_loss": -5.836775302886963, "global_step": 56020, "epoch": 1333} {"train_loss": -5.938246726989746, "global_step": 56021, "epoch": 1333} {"train_loss": -5.850554943084717, "global_step": 56022, "epoch": 1333} {"train_loss": -5.723787307739258, "global_step": 56023, "epoch": 1333} {"train_loss": -5.875009059906006, "global_step": 56024, "epoch": 1333} {"train_loss": -5.8167724609375, "global_step": 56025, "epoch": 1333} {"train_loss": -5.768887042999268, "global_step": 56026, "epoch": 1333} {"train_loss": -5.843618086406162, "global_step": 56027, "epoch": 1333, "val_loss": 66733.0859375} {"train_loss": -5.868925094604492, "global_step": 56028, "epoch": 1334} {"train_loss": -5.798535346984863, "global_step": 56029, "epoch": 1334} {"train_loss": -5.794441223144531, "global_step": 56030, "epoch": 1334} {"train_loss": -5.8914337158203125, "global_step": 56031, "epoch": 1334} {"train_loss": -5.869399070739746, "global_step": 56032, "epoch": 1334} {"train_loss": -5.8788981437683105, "global_step": 56033, "epoch": 1334} {"train_loss": -5.7879862785339355, "global_step": 56034, "epoch": 1334} {"train_loss": -5.855940818786621, "global_step": 56035, "epoch": 1334} {"train_loss": -5.81937837600708, "global_step": 56036, "epoch": 1334} {"train_loss": -5.878255844116211, "global_step": 56037, "epoch": 1334} {"train_loss": -5.942439079284668, "global_step": 56038, "epoch": 1334} {"train_loss": -5.917030334472656, "global_step": 56039, "epoch": 1334} {"train_loss": -5.728323459625244, "global_step": 56040, "epoch": 1334} {"train_loss": -5.8750715255737305, "global_step": 56041, "epoch": 1334} {"train_loss": -5.732499122619629, "global_step": 56042, "epoch": 1334} {"train_loss": -5.851984977722168, "global_step": 56043, "epoch": 1334} {"train_loss": -5.7696428298950195, "global_step": 56044, "epoch": 1334} {"train_loss": -5.825281620025635, "global_step": 56045, "epoch": 1334} {"train_loss": -5.761171340942383, "global_step": 56046, "epoch": 1334} {"train_loss": -5.749016761779785, "global_step": 56047, "epoch": 1334} {"train_loss": -5.666863918304443, "global_step": 56048, "epoch": 1334} {"train_loss": -5.775439262390137, "global_step": 56049, "epoch": 1334} {"train_loss": -5.821466445922852, "global_step": 56050, "epoch": 1334} {"train_loss": -5.737866401672363, "global_step": 56051, "epoch": 1334} {"train_loss": -5.677420616149902, "global_step": 56052, "epoch": 1334} {"train_loss": -5.884247779846191, "global_step": 56053, "epoch": 1334} {"train_loss": -5.866748332977295, "global_step": 56054, "epoch": 1334} {"train_loss": -5.835578918457031, "global_step": 56055, "epoch": 1334} {"train_loss": -5.865551471710205, "global_step": 56056, "epoch": 1334} {"train_loss": -5.97960090637207, "global_step": 56057, "epoch": 1334} {"train_loss": -5.772185325622559, "global_step": 56058, "epoch": 1334} {"train_loss": -5.960306167602539, "global_step": 56059, "epoch": 1334} {"train_loss": -5.779894828796387, "global_step": 56060, "epoch": 1334} {"train_loss": -5.895705223083496, "global_step": 56061, "epoch": 1334} {"train_loss": -5.856384754180908, "global_step": 56062, "epoch": 1334} {"train_loss": -5.861114025115967, "global_step": 56063, "epoch": 1334} {"train_loss": -5.871368408203125, "global_step": 56064, "epoch": 1334} {"train_loss": -5.832744598388672, "global_step": 56065, "epoch": 1334} {"train_loss": -5.769266128540039, "global_step": 56066, "epoch": 1334} {"train_loss": -5.831395149230957, "global_step": 56067, "epoch": 1334} {"train_loss": -5.787764549255371, "global_step": 56068, "epoch": 1334} {"train_loss": -5.8292844749632335, "global_step": 56069, "epoch": 1334, "val_loss": 66413.1015625} {"train_loss": -5.860099792480469, "global_step": 56070, "epoch": 1335} {"train_loss": -5.910675048828125, "global_step": 56071, "epoch": 1335} {"train_loss": -5.871518135070801, "global_step": 56072, "epoch": 1335} {"train_loss": -5.947662353515625, "global_step": 56073, "epoch": 1335} {"train_loss": -5.886191368103027, "global_step": 56074, "epoch": 1335} {"train_loss": -5.759476661682129, "global_step": 56075, "epoch": 1335} {"train_loss": -5.9721198081970215, "global_step": 56076, "epoch": 1335} {"train_loss": -5.787598609924316, "global_step": 56077, "epoch": 1335} {"train_loss": -5.866808891296387, "global_step": 56078, "epoch": 1335} {"train_loss": -5.804732799530029, "global_step": 56079, "epoch": 1335} {"train_loss": -5.844808578491211, "global_step": 56080, "epoch": 1335} {"train_loss": -5.7500410079956055, "global_step": 56081, "epoch": 1335} {"train_loss": -5.888284683227539, "global_step": 56082, "epoch": 1335} {"train_loss": -5.922158241271973, "global_step": 56083, "epoch": 1335} {"train_loss": -5.93641471862793, "global_step": 56084, "epoch": 1335} {"train_loss": -5.952854156494141, "global_step": 56085, "epoch": 1335} {"train_loss": -5.920319557189941, "global_step": 56086, "epoch": 1335} {"train_loss": -5.776944160461426, "global_step": 56087, "epoch": 1335} {"train_loss": -5.8759307861328125, "global_step": 56088, "epoch": 1335} {"train_loss": -5.873016357421875, "global_step": 56089, "epoch": 1335} {"train_loss": -5.8146514892578125, "global_step": 56090, "epoch": 1335} {"train_loss": -5.846136093139648, "global_step": 56091, "epoch": 1335} {"train_loss": -5.877222061157227, "global_step": 56092, "epoch": 1335} {"train_loss": -5.794424057006836, "global_step": 56093, "epoch": 1335} {"train_loss": -5.879443645477295, "global_step": 56094, "epoch": 1335} {"train_loss": -5.844793796539307, "global_step": 56095, "epoch": 1335} {"train_loss": -5.735798358917236, "global_step": 56096, "epoch": 1335} {"train_loss": -5.848669052124023, "global_step": 56097, "epoch": 1335} {"train_loss": -5.922883033752441, "global_step": 56098, "epoch": 1335} {"train_loss": -5.84017276763916, "global_step": 56099, "epoch": 1335} {"train_loss": -5.869462966918945, "global_step": 56100, "epoch": 1335} {"train_loss": -5.872406482696533, "global_step": 56101, "epoch": 1335} {"train_loss": -5.832552909851074, "global_step": 56102, "epoch": 1335} {"train_loss": -5.766473770141602, "global_step": 56103, "epoch": 1335} {"train_loss": -5.9113359451293945, "global_step": 56104, "epoch": 1335} {"train_loss": -5.892139434814453, "global_step": 56105, "epoch": 1335} {"train_loss": -5.743607521057129, "global_step": 56106, "epoch": 1335} {"train_loss": -5.7836198806762695, "global_step": 56107, "epoch": 1335} {"train_loss": -5.943569183349609, "global_step": 56108, "epoch": 1335} {"train_loss": -5.853503227233887, "global_step": 56109, "epoch": 1335} {"train_loss": -5.681217193603516, "global_step": 56110, "epoch": 1335} {"train_loss": -5.8547144049689885, "global_step": 56111, "epoch": 1335, "val_loss": 66359.921875} {"train_loss": -5.84907341003418, "global_step": 56112, "epoch": 1336} {"train_loss": -5.81503963470459, "global_step": 56113, "epoch": 1336} {"train_loss": -5.844170570373535, "global_step": 56114, "epoch": 1336} {"train_loss": -5.769852638244629, "global_step": 56115, "epoch": 1336} {"train_loss": -5.9295549392700195, "global_step": 56116, "epoch": 1336} {"train_loss": -5.911559581756592, "global_step": 56117, "epoch": 1336} {"train_loss": -5.872261047363281, "global_step": 56118, "epoch": 1336} {"train_loss": -5.899349212646484, "global_step": 56119, "epoch": 1336} {"train_loss": -5.78617000579834, "global_step": 56120, "epoch": 1336} {"train_loss": -6.001206398010254, "global_step": 56121, "epoch": 1336} {"train_loss": -5.809502124786377, "global_step": 56122, "epoch": 1336} {"train_loss": -5.764934062957764, "global_step": 56123, "epoch": 1336} {"train_loss": -5.894993782043457, "global_step": 56124, "epoch": 1336} {"train_loss": -5.731565475463867, "global_step": 56125, "epoch": 1336} {"train_loss": -5.957177639007568, "global_step": 56126, "epoch": 1336} {"train_loss": -5.9120049476623535, "global_step": 56127, "epoch": 1336} {"train_loss": -5.954594612121582, "global_step": 56128, "epoch": 1336} {"train_loss": -5.742458343505859, "global_step": 56129, "epoch": 1336} {"train_loss": -5.939903736114502, "global_step": 56130, "epoch": 1336} {"train_loss": -5.833813667297363, "global_step": 56131, "epoch": 1336} {"train_loss": -5.933288097381592, "global_step": 56132, "epoch": 1336} {"train_loss": -5.824560642242432, "global_step": 56133, "epoch": 1336} {"train_loss": -5.922327995300293, "global_step": 56134, "epoch": 1336} {"train_loss": -5.922242164611816, "global_step": 56135, "epoch": 1336} {"train_loss": -5.87019157409668, "global_step": 56136, "epoch": 1336} {"train_loss": -5.736027240753174, "global_step": 56137, "epoch": 1336} {"train_loss": -5.77436637878418, "global_step": 56138, "epoch": 1336} {"train_loss": -5.901247978210449, "global_step": 56139, "epoch": 1336} {"train_loss": -5.7800445556640625, "global_step": 56140, "epoch": 1336} {"train_loss": -5.843311309814453, "global_step": 56141, "epoch": 1336} {"train_loss": -5.957003116607666, "global_step": 56142, "epoch": 1336} {"train_loss": -5.736869812011719, "global_step": 56143, "epoch": 1336} {"train_loss": -5.853569984436035, "global_step": 56144, "epoch": 1336} {"train_loss": -5.871728897094727, "global_step": 56145, "epoch": 1336} {"train_loss": -5.861220359802246, "global_step": 56146, "epoch": 1336} {"train_loss": -5.782254219055176, "global_step": 56147, "epoch": 1336} {"train_loss": -5.830635070800781, "global_step": 56148, "epoch": 1336} {"train_loss": -5.807586193084717, "global_step": 56149, "epoch": 1336} {"train_loss": -5.864870548248291, "global_step": 56150, "epoch": 1336} {"train_loss": -5.863209247589111, "global_step": 56151, "epoch": 1336} {"train_loss": -5.96896505355835, "global_step": 56152, "epoch": 1336} {"train_loss": -5.850535835538592, "global_step": 56153, "epoch": 1336, "val_loss": 66456.6640625} {"train_loss": -5.794301986694336, "global_step": 56154, "epoch": 1337} {"train_loss": -5.849697113037109, "global_step": 56155, "epoch": 1337} {"train_loss": -5.814667224884033, "global_step": 56156, "epoch": 1337} {"train_loss": -5.841401100158691, "global_step": 56157, "epoch": 1337} {"train_loss": -5.626441955566406, "global_step": 56158, "epoch": 1337} {"train_loss": -5.7797651290893555, "global_step": 56159, "epoch": 1337} {"train_loss": -5.92085075378418, "global_step": 56160, "epoch": 1337} {"train_loss": -5.830242156982422, "global_step": 56161, "epoch": 1337} {"train_loss": -5.827654838562012, "global_step": 56162, "epoch": 1337} {"train_loss": -5.664578437805176, "global_step": 56163, "epoch": 1337} {"train_loss": -5.778847694396973, "global_step": 56164, "epoch": 1337} {"train_loss": -5.792116165161133, "global_step": 56165, "epoch": 1337} {"train_loss": -5.774803161621094, "global_step": 56166, "epoch": 1337} {"train_loss": -5.766584396362305, "global_step": 56167, "epoch": 1337} {"train_loss": -5.838070869445801, "global_step": 56168, "epoch": 1337} {"train_loss": -5.860077857971191, "global_step": 56169, "epoch": 1337} {"train_loss": -5.850940704345703, "global_step": 56170, "epoch": 1337} {"train_loss": -5.903656005859375, "global_step": 56171, "epoch": 1337} {"train_loss": -5.780893325805664, "global_step": 56172, "epoch": 1337} {"train_loss": -5.882952690124512, "global_step": 56173, "epoch": 1337} {"train_loss": -5.85575008392334, "global_step": 56174, "epoch": 1337} {"train_loss": -5.756842613220215, "global_step": 56175, "epoch": 1337} {"train_loss": -5.96502685546875, "global_step": 56176, "epoch": 1337} {"train_loss": -5.899662017822266, "global_step": 56177, "epoch": 1337} {"train_loss": -5.787705898284912, "global_step": 56178, "epoch": 1337} {"train_loss": -5.891078948974609, "global_step": 56179, "epoch": 1337} {"train_loss": -5.8227949142456055, "global_step": 56180, "epoch": 1337} {"train_loss": -5.839418411254883, "global_step": 56181, "epoch": 1337} {"train_loss": -5.930928707122803, "global_step": 56182, "epoch": 1337} {"train_loss": -5.72659158706665, "global_step": 56183, "epoch": 1337} {"train_loss": -5.90110445022583, "global_step": 56184, "epoch": 1337} {"train_loss": -5.707856178283691, "global_step": 56185, "epoch": 1337} {"train_loss": -5.7570648193359375, "global_step": 56186, "epoch": 1337} {"train_loss": -5.788382530212402, "global_step": 56187, "epoch": 1337} {"train_loss": -5.806661605834961, "global_step": 56188, "epoch": 1337} {"train_loss": -5.810981750488281, "global_step": 56189, "epoch": 1337} {"train_loss": -5.8697333335876465, "global_step": 56190, "epoch": 1337} {"train_loss": -5.755214691162109, "global_step": 56191, "epoch": 1337} {"train_loss": -5.908131122589111, "global_step": 56192, "epoch": 1337} {"train_loss": -5.785327434539795, "global_step": 56193, "epoch": 1337} {"train_loss": -5.797414779663086, "global_step": 56194, "epoch": 1337} {"train_loss": -5.817950702848888, "global_step": 56195, "epoch": 1337, "val_loss": 66630.4609375} {"train_loss": -5.772745609283447, "global_step": 56196, "epoch": 1338} {"train_loss": -5.840567111968994, "global_step": 56197, "epoch": 1338} {"train_loss": -5.869081974029541, "global_step": 56198, "epoch": 1338} {"train_loss": -5.865166664123535, "global_step": 56199, "epoch": 1338} {"train_loss": -5.937858581542969, "global_step": 56200, "epoch": 1338} {"train_loss": -5.899833679199219, "global_step": 56201, "epoch": 1338} {"train_loss": -5.890326023101807, "global_step": 56202, "epoch": 1338} {"train_loss": -5.8311448097229, "global_step": 56203, "epoch": 1338} {"train_loss": -5.81279182434082, "global_step": 56204, "epoch": 1338} {"train_loss": -5.832378387451172, "global_step": 56205, "epoch": 1338} {"train_loss": -5.800929069519043, "global_step": 56206, "epoch": 1338} {"train_loss": -5.754186630249023, "global_step": 56207, "epoch": 1338} {"train_loss": -5.794486999511719, "global_step": 56208, "epoch": 1338} {"train_loss": -5.831045150756836, "global_step": 56209, "epoch": 1338} {"train_loss": -5.837918758392334, "global_step": 56210, "epoch": 1338} {"train_loss": -5.899588108062744, "global_step": 56211, "epoch": 1338} {"train_loss": -5.784645080566406, "global_step": 56212, "epoch": 1338} {"train_loss": -5.704353332519531, "global_step": 56213, "epoch": 1338} {"train_loss": -5.738043308258057, "global_step": 56214, "epoch": 1338} {"train_loss": -5.786539077758789, "global_step": 56215, "epoch": 1338} {"train_loss": -5.795018672943115, "global_step": 56216, "epoch": 1338} {"train_loss": -5.7573041915893555, "global_step": 56217, "epoch": 1338} {"train_loss": -5.876152038574219, "global_step": 56218, "epoch": 1338} {"train_loss": -5.83843994140625, "global_step": 56219, "epoch": 1338} {"train_loss": -5.813742160797119, "global_step": 56220, "epoch": 1338} {"train_loss": -5.889444351196289, "global_step": 56221, "epoch": 1338} {"train_loss": -5.893491744995117, "global_step": 56222, "epoch": 1338} {"train_loss": -5.799790859222412, "global_step": 56223, "epoch": 1338} {"train_loss": -5.766336441040039, "global_step": 56224, "epoch": 1338} {"train_loss": -5.841492652893066, "global_step": 56225, "epoch": 1338} {"train_loss": -5.780149459838867, "global_step": 56226, "epoch": 1338} {"train_loss": -5.794526100158691, "global_step": 56227, "epoch": 1338} {"train_loss": -5.81229305267334, "global_step": 56228, "epoch": 1338} {"train_loss": -5.921021938323975, "global_step": 56229, "epoch": 1338} {"train_loss": -5.843082904815674, "global_step": 56230, "epoch": 1338} {"train_loss": -5.889179706573486, "global_step": 56231, "epoch": 1338} {"train_loss": -5.834921360015869, "global_step": 56232, "epoch": 1338} {"train_loss": -5.862017631530762, "global_step": 56233, "epoch": 1338} {"train_loss": -5.794920921325684, "global_step": 56234, "epoch": 1338} {"train_loss": -5.9100213050842285, "global_step": 56235, "epoch": 1338} {"train_loss": -5.795440196990967, "global_step": 56236, "epoch": 1338} {"train_loss": -5.829956542877924, "global_step": 56237, "epoch": 1338, "val_loss": 66612.6484375} {"train_loss": -5.931075572967529, "global_step": 56238, "epoch": 1339} {"train_loss": -6.058353424072266, "global_step": 56239, "epoch": 1339} {"train_loss": -5.748264312744141, "global_step": 56240, "epoch": 1339} {"train_loss": -5.904012680053711, "global_step": 56241, "epoch": 1339} {"train_loss": -5.790201187133789, "global_step": 56242, "epoch": 1339} {"train_loss": -5.820023059844971, "global_step": 56243, "epoch": 1339} {"train_loss": -5.8149824142456055, "global_step": 56244, "epoch": 1339} {"train_loss": -5.886651992797852, "global_step": 56245, "epoch": 1339} {"train_loss": -5.7343549728393555, "global_step": 56246, "epoch": 1339} {"train_loss": -5.976487636566162, "global_step": 56247, "epoch": 1339} {"train_loss": -5.834868431091309, "global_step": 56248, "epoch": 1339} {"train_loss": -5.868459224700928, "global_step": 56249, "epoch": 1339} {"train_loss": -5.807483673095703, "global_step": 56250, "epoch": 1339} {"train_loss": -5.867225646972656, "global_step": 56251, "epoch": 1339} {"train_loss": -5.793371200561523, "global_step": 56252, "epoch": 1339} {"train_loss": -5.719386100769043, "global_step": 56253, "epoch": 1339} {"train_loss": -5.782359600067139, "global_step": 56254, "epoch": 1339} {"train_loss": -5.901326656341553, "global_step": 56255, "epoch": 1339} {"train_loss": -5.861681938171387, "global_step": 56256, "epoch": 1339} {"train_loss": -5.800594329833984, "global_step": 56257, "epoch": 1339} {"train_loss": -5.78087854385376, "global_step": 56258, "epoch": 1339} {"train_loss": -5.807602882385254, "global_step": 56259, "epoch": 1339} {"train_loss": -5.579830169677734, "global_step": 56260, "epoch": 1339} {"train_loss": -5.9310102462768555, "global_step": 56261, "epoch": 1339} {"train_loss": -5.78980827331543, "global_step": 56262, "epoch": 1339} {"train_loss": -5.831788063049316, "global_step": 56263, "epoch": 1339} {"train_loss": -5.834969997406006, "global_step": 56264, "epoch": 1339} {"train_loss": -5.737371444702148, "global_step": 56265, "epoch": 1339} {"train_loss": -5.922079086303711, "global_step": 56266, "epoch": 1339} {"train_loss": -5.747215747833252, "global_step": 56267, "epoch": 1339} {"train_loss": -5.780876159667969, "global_step": 56268, "epoch": 1339} {"train_loss": -5.9754133224487305, "global_step": 56269, "epoch": 1339} {"train_loss": -5.835053443908691, "global_step": 56270, "epoch": 1339} {"train_loss": -5.9163103103637695, "global_step": 56271, "epoch": 1339} {"train_loss": -5.75144100189209, "global_step": 56272, "epoch": 1339} {"train_loss": -5.816678047180176, "global_step": 56273, "epoch": 1339} {"train_loss": -5.802619934082031, "global_step": 56274, "epoch": 1339} {"train_loss": -5.637245178222656, "global_step": 56275, "epoch": 1339} {"train_loss": -5.883518218994141, "global_step": 56276, "epoch": 1339} {"train_loss": -5.810136318206787, "global_step": 56277, "epoch": 1339} {"train_loss": -5.774740219116211, "global_step": 56278, "epoch": 1339} {"train_loss": -5.828006483259655, "global_step": 56279, "epoch": 1339, "val_loss": 66442.375} {"train_loss": -5.76564884185791, "global_step": 56280, "epoch": 1340} {"train_loss": -5.83586311340332, "global_step": 56281, "epoch": 1340} {"train_loss": -5.925045013427734, "global_step": 56282, "epoch": 1340} {"train_loss": -5.863995552062988, "global_step": 56283, "epoch": 1340} {"train_loss": -5.7638702392578125, "global_step": 56284, "epoch": 1340} {"train_loss": -5.89719820022583, "global_step": 56285, "epoch": 1340} {"train_loss": -5.901472091674805, "global_step": 56286, "epoch": 1340} {"train_loss": -5.825286865234375, "global_step": 56287, "epoch": 1340} {"train_loss": -5.7762908935546875, "global_step": 56288, "epoch": 1340} {"train_loss": -5.941954612731934, "global_step": 56289, "epoch": 1340} {"train_loss": -5.926087379455566, "global_step": 56290, "epoch": 1340} {"train_loss": -5.88790225982666, "global_step": 56291, "epoch": 1340} {"train_loss": -5.977261066436768, "global_step": 56292, "epoch": 1340} {"train_loss": -5.830971717834473, "global_step": 56293, "epoch": 1340} {"train_loss": -5.8881072998046875, "global_step": 56294, "epoch": 1340} {"train_loss": -5.820244789123535, "global_step": 56295, "epoch": 1340} {"train_loss": -5.897841453552246, "global_step": 56296, "epoch": 1340} {"train_loss": -5.779781341552734, "global_step": 56297, "epoch": 1340} {"train_loss": -5.852329254150391, "global_step": 56298, "epoch": 1340} {"train_loss": -5.81837272644043, "global_step": 56299, "epoch": 1340} {"train_loss": -5.7254815101623535, "global_step": 56300, "epoch": 1340} {"train_loss": -5.814544677734375, "global_step": 56301, "epoch": 1340} {"train_loss": -5.72097110748291, "global_step": 56302, "epoch": 1340} {"train_loss": -5.778179168701172, "global_step": 56303, "epoch": 1340} {"train_loss": -5.7219085693359375, "global_step": 56304, "epoch": 1340} {"train_loss": -5.750533580780029, "global_step": 56305, "epoch": 1340} {"train_loss": -5.86273193359375, "global_step": 56306, "epoch": 1340} {"train_loss": -5.838543891906738, "global_step": 56307, "epoch": 1340} {"train_loss": -5.843487739562988, "global_step": 56308, "epoch": 1340} {"train_loss": -5.808892726898193, "global_step": 56309, "epoch": 1340} {"train_loss": -5.8034586906433105, "global_step": 56310, "epoch": 1340} {"train_loss": -5.89291524887085, "global_step": 56311, "epoch": 1340} {"train_loss": -5.821023941040039, "global_step": 56312, "epoch": 1340} {"train_loss": -5.729058265686035, "global_step": 56313, "epoch": 1340} {"train_loss": -5.911858558654785, "global_step": 56314, "epoch": 1340} {"train_loss": -5.793025016784668, "global_step": 56315, "epoch": 1340} {"train_loss": -5.858096599578857, "global_step": 56316, "epoch": 1340} {"train_loss": -5.711884498596191, "global_step": 56317, "epoch": 1340} {"train_loss": -5.701077461242676, "global_step": 56318, "epoch": 1340} {"train_loss": -5.782716751098633, "global_step": 56319, "epoch": 1340} {"train_loss": -5.7957329750061035, "global_step": 56320, "epoch": 1340} {"train_loss": -5.82192747933524, "global_step": 56321, "epoch": 1340, "val_loss": 66709.5078125} {"train_loss": -5.864455223083496, "global_step": 56322, "epoch": 1341} {"train_loss": -5.760629653930664, "global_step": 56323, "epoch": 1341} {"train_loss": -5.863349914550781, "global_step": 56324, "epoch": 1341} {"train_loss": -5.675398826599121, "global_step": 56325, "epoch": 1341} {"train_loss": -5.802027225494385, "global_step": 56326, "epoch": 1341} {"train_loss": -5.754828929901123, "global_step": 56327, "epoch": 1341} {"train_loss": -5.755555152893066, "global_step": 56328, "epoch": 1341} {"train_loss": -5.91282844543457, "global_step": 56329, "epoch": 1341} {"train_loss": -5.69050407409668, "global_step": 56330, "epoch": 1341} {"train_loss": -5.7024993896484375, "global_step": 56331, "epoch": 1341} {"train_loss": -5.8570404052734375, "global_step": 56332, "epoch": 1341} {"train_loss": -5.689269065856934, "global_step": 56333, "epoch": 1341} {"train_loss": -5.923937797546387, "global_step": 56334, "epoch": 1341} {"train_loss": -5.8168253898620605, "global_step": 56335, "epoch": 1341} {"train_loss": -5.89044189453125, "global_step": 56336, "epoch": 1341} {"train_loss": -5.862374782562256, "global_step": 56337, "epoch": 1341} {"train_loss": -5.678139686584473, "global_step": 56338, "epoch": 1341} {"train_loss": -5.961133003234863, "global_step": 56339, "epoch": 1341} {"train_loss": -5.780893325805664, "global_step": 56340, "epoch": 1341} {"train_loss": -5.741655349731445, "global_step": 56341, "epoch": 1341} {"train_loss": -5.828590393066406, "global_step": 56342, "epoch": 1341} {"train_loss": -5.825438499450684, "global_step": 56343, "epoch": 1341} {"train_loss": -5.821204662322998, "global_step": 56344, "epoch": 1341} {"train_loss": -5.861984729766846, "global_step": 56345, "epoch": 1341} {"train_loss": -5.732667922973633, "global_step": 56346, "epoch": 1341} {"train_loss": -5.811097145080566, "global_step": 56347, "epoch": 1341} {"train_loss": -5.848077774047852, "global_step": 56348, "epoch": 1341} {"train_loss": -5.906294822692871, "global_step": 56349, "epoch": 1341} {"train_loss": -5.9067792892456055, "global_step": 56350, "epoch": 1341} {"train_loss": -5.804451942443848, "global_step": 56351, "epoch": 1341} {"train_loss": -5.710068702697754, "global_step": 56352, "epoch": 1341} {"train_loss": -5.97420597076416, "global_step": 56353, "epoch": 1341} {"train_loss": -5.896897792816162, "global_step": 56354, "epoch": 1341} {"train_loss": -5.823756217956543, "global_step": 56355, "epoch": 1341} {"train_loss": -5.869160175323486, "global_step": 56356, "epoch": 1341} {"train_loss": -5.853005886077881, "global_step": 56357, "epoch": 1341} {"train_loss": -5.885085105895996, "global_step": 56358, "epoch": 1341} {"train_loss": -5.850955009460449, "global_step": 56359, "epoch": 1341} {"train_loss": -5.854996681213379, "global_step": 56360, "epoch": 1341} {"train_loss": -5.948962211608887, "global_step": 56361, "epoch": 1341} {"train_loss": -5.830732822418213, "global_step": 56362, "epoch": 1341} {"train_loss": -5.824390956333706, "global_step": 56363, "epoch": 1341, "val_loss": 66465.6015625} {"train_loss": -5.979104518890381, "global_step": 56364, "epoch": 1342} {"train_loss": -6.007020950317383, "global_step": 56365, "epoch": 1342} {"train_loss": -5.8543291091918945, "global_step": 56366, "epoch": 1342} {"train_loss": -5.837615966796875, "global_step": 56367, "epoch": 1342} {"train_loss": -5.808229446411133, "global_step": 56368, "epoch": 1342} {"train_loss": -5.894418239593506, "global_step": 56369, "epoch": 1342} {"train_loss": -5.856117248535156, "global_step": 56370, "epoch": 1342} {"train_loss": -5.97977352142334, "global_step": 56371, "epoch": 1342} {"train_loss": -5.8665771484375, "global_step": 56372, "epoch": 1342} {"train_loss": -5.834437847137451, "global_step": 56373, "epoch": 1342} {"train_loss": -5.859565258026123, "global_step": 56374, "epoch": 1342} {"train_loss": -5.864229202270508, "global_step": 56375, "epoch": 1342} {"train_loss": -5.820065021514893, "global_step": 56376, "epoch": 1342} {"train_loss": -5.922733306884766, "global_step": 56377, "epoch": 1342} {"train_loss": -5.815552711486816, "global_step": 56378, "epoch": 1342} {"train_loss": -5.777501106262207, "global_step": 56379, "epoch": 1342} {"train_loss": -5.731762886047363, "global_step": 56380, "epoch": 1342} {"train_loss": -5.811115264892578, "global_step": 56381, "epoch": 1342} {"train_loss": -5.518124103546143, "global_step": 56382, "epoch": 1342} {"train_loss": -5.837693214416504, "global_step": 56383, "epoch": 1342} {"train_loss": -5.703102111816406, "global_step": 56384, "epoch": 1342} {"train_loss": -5.786465644836426, "global_step": 56385, "epoch": 1342} {"train_loss": -5.865207672119141, "global_step": 56386, "epoch": 1342} {"train_loss": -5.793959140777588, "global_step": 56387, "epoch": 1342} {"train_loss": -5.816062927246094, "global_step": 56388, "epoch": 1342} {"train_loss": -5.708123207092285, "global_step": 56389, "epoch": 1342} {"train_loss": -5.831319808959961, "global_step": 56390, "epoch": 1342} {"train_loss": -5.828904151916504, "global_step": 56391, "epoch": 1342} {"train_loss": -5.755788326263428, "global_step": 56392, "epoch": 1342} {"train_loss": -5.861398696899414, "global_step": 56393, "epoch": 1342} {"train_loss": -5.8947319984436035, "global_step": 56394, "epoch": 1342} {"train_loss": -5.774923801422119, "global_step": 56395, "epoch": 1342} {"train_loss": -5.718590259552002, "global_step": 56396, "epoch": 1342} {"train_loss": -5.824397563934326, "global_step": 56397, "epoch": 1342} {"train_loss": -5.933341026306152, "global_step": 56398, "epoch": 1342} {"train_loss": -5.913514137268066, "global_step": 56399, "epoch": 1342} {"train_loss": -5.956571578979492, "global_step": 56400, "epoch": 1342} {"train_loss": -5.825822830200195, "global_step": 56401, "epoch": 1342} {"train_loss": -5.84344482421875, "global_step": 56402, "epoch": 1342} {"train_loss": -5.839372158050537, "global_step": 56403, "epoch": 1342} {"train_loss": -5.859932899475098, "global_step": 56404, "epoch": 1342} {"train_loss": -5.8321324189503985, "global_step": 56405, "epoch": 1342, "val_loss": 66504.359375} {"train_loss": -5.81596565246582, "global_step": 56406, "epoch": 1343} {"train_loss": -5.8133039474487305, "global_step": 56407, "epoch": 1343} {"train_loss": -5.983556747436523, "global_step": 56408, "epoch": 1343} {"train_loss": -5.852504730224609, "global_step": 56409, "epoch": 1343} {"train_loss": -5.750456809997559, "global_step": 56410, "epoch": 1343} {"train_loss": -5.948406219482422, "global_step": 56411, "epoch": 1343} {"train_loss": -5.861795425415039, "global_step": 56412, "epoch": 1343} {"train_loss": -5.789266586303711, "global_step": 56413, "epoch": 1343} {"train_loss": -5.770699501037598, "global_step": 56414, "epoch": 1343} {"train_loss": -5.84190559387207, "global_step": 56415, "epoch": 1343} {"train_loss": -5.79414176940918, "global_step": 56416, "epoch": 1343} {"train_loss": -5.876529693603516, "global_step": 56417, "epoch": 1343} {"train_loss": -5.866641521453857, "global_step": 56418, "epoch": 1343} {"train_loss": -5.757286071777344, "global_step": 56419, "epoch": 1343} {"train_loss": -5.877188682556152, "global_step": 56420, "epoch": 1343} {"train_loss": -5.940253257751465, "global_step": 56421, "epoch": 1343} {"train_loss": -5.735485553741455, "global_step": 56422, "epoch": 1343} {"train_loss": -5.794968128204346, "global_step": 56423, "epoch": 1343} {"train_loss": -5.881805419921875, "global_step": 56424, "epoch": 1343} {"train_loss": -5.81082010269165, "global_step": 56425, "epoch": 1343} {"train_loss": -5.917177200317383, "global_step": 56426, "epoch": 1343} {"train_loss": -5.73737096786499, "global_step": 56427, "epoch": 1343} {"train_loss": -5.903162002563477, "global_step": 56428, "epoch": 1343} {"train_loss": -5.953662872314453, "global_step": 56429, "epoch": 1343} {"train_loss": -5.784998893737793, "global_step": 56430, "epoch": 1343} {"train_loss": -5.7981109619140625, "global_step": 56431, "epoch": 1343} {"train_loss": -5.764320373535156, "global_step": 56432, "epoch": 1343} {"train_loss": -5.868274211883545, "global_step": 56433, "epoch": 1343} {"train_loss": -5.697378158569336, "global_step": 56434, "epoch": 1343} {"train_loss": -5.656732082366943, "global_step": 56435, "epoch": 1343} {"train_loss": -5.853541851043701, "global_step": 56436, "epoch": 1343} {"train_loss": -5.743490219116211, "global_step": 56437, "epoch": 1343} {"train_loss": -5.954216957092285, "global_step": 56438, "epoch": 1343} {"train_loss": -5.813182353973389, "global_step": 56439, "epoch": 1343} {"train_loss": -5.843910217285156, "global_step": 56440, "epoch": 1343} {"train_loss": -5.87345027923584, "global_step": 56441, "epoch": 1343} {"train_loss": -5.833911895751953, "global_step": 56442, "epoch": 1343} {"train_loss": -5.893146514892578, "global_step": 56443, "epoch": 1343} {"train_loss": -5.887008190155029, "global_step": 56444, "epoch": 1343} {"train_loss": -5.8211822509765625, "global_step": 56445, "epoch": 1343} {"train_loss": -5.845910549163818, "global_step": 56446, "epoch": 1343} {"train_loss": -5.838089261736188, "global_step": 56447, "epoch": 1343, "val_loss": 66494.7265625} {"train_loss": -5.826078414916992, "global_step": 56448, "epoch": 1344} {"train_loss": -5.846588134765625, "global_step": 56449, "epoch": 1344} {"train_loss": -5.936156272888184, "global_step": 56450, "epoch": 1344} {"train_loss": -5.776179313659668, "global_step": 56451, "epoch": 1344} {"train_loss": -5.775406837463379, "global_step": 56452, "epoch": 1344} {"train_loss": -6.000922203063965, "global_step": 56453, "epoch": 1344} {"train_loss": -5.812020778656006, "global_step": 56454, "epoch": 1344} {"train_loss": -5.91096830368042, "global_step": 56455, "epoch": 1344} {"train_loss": -5.877769470214844, "global_step": 56456, "epoch": 1344} {"train_loss": -5.945935249328613, "global_step": 56457, "epoch": 1344} {"train_loss": -5.887612342834473, "global_step": 56458, "epoch": 1344} {"train_loss": -5.848295211791992, "global_step": 56459, "epoch": 1344} {"train_loss": -5.876559734344482, "global_step": 56460, "epoch": 1344} {"train_loss": -5.828306198120117, "global_step": 56461, "epoch": 1344} {"train_loss": -5.705289840698242, "global_step": 56462, "epoch": 1344} {"train_loss": -5.884037971496582, "global_step": 56463, "epoch": 1344} {"train_loss": -5.975696563720703, "global_step": 56464, "epoch": 1344} {"train_loss": -5.682518482208252, "global_step": 56465, "epoch": 1344} {"train_loss": -5.831701278686523, "global_step": 56466, "epoch": 1344} {"train_loss": -5.795628547668457, "global_step": 56467, "epoch": 1344} {"train_loss": -5.732340335845947, "global_step": 56468, "epoch": 1344} {"train_loss": -5.877025604248047, "global_step": 56469, "epoch": 1344} {"train_loss": -5.819167613983154, "global_step": 56470, "epoch": 1344} {"train_loss": -5.747189521789551, "global_step": 56471, "epoch": 1344} {"train_loss": -5.826858043670654, "global_step": 56472, "epoch": 1344} {"train_loss": -5.784101486206055, "global_step": 56473, "epoch": 1344} {"train_loss": -5.752344131469727, "global_step": 56474, "epoch": 1344} {"train_loss": -5.797172546386719, "global_step": 56475, "epoch": 1344} {"train_loss": -5.855046272277832, "global_step": 56476, "epoch": 1344} {"train_loss": -5.90708065032959, "global_step": 56477, "epoch": 1344} {"train_loss": -5.677265167236328, "global_step": 56478, "epoch": 1344} {"train_loss": -5.818819046020508, "global_step": 56479, "epoch": 1344} {"train_loss": -5.806085586547852, "global_step": 56480, "epoch": 1344} {"train_loss": -5.8332977294921875, "global_step": 56481, "epoch": 1344} {"train_loss": -5.845772743225098, "global_step": 56482, "epoch": 1344} {"train_loss": -5.827994346618652, "global_step": 56483, "epoch": 1344} {"train_loss": -5.843751430511475, "global_step": 56484, "epoch": 1344} {"train_loss": -5.898732662200928, "global_step": 56485, "epoch": 1344} {"train_loss": -5.859861373901367, "global_step": 56486, "epoch": 1344} {"train_loss": -5.92859411239624, "global_step": 56487, "epoch": 1344} {"train_loss": -5.807808876037598, "global_step": 56488, "epoch": 1344} {"train_loss": -5.835779996145339, "global_step": 56489, "epoch": 1344, "val_loss": 66439.3515625} {"train_loss": -5.795751094818115, "global_step": 56490, "epoch": 1345} {"train_loss": -5.904807090759277, "global_step": 56491, "epoch": 1345} {"train_loss": -5.9850664138793945, "global_step": 56492, "epoch": 1345} {"train_loss": -5.8653106689453125, "global_step": 56493, "epoch": 1345} {"train_loss": -5.894680023193359, "global_step": 56494, "epoch": 1345} {"train_loss": -5.866654872894287, "global_step": 56495, "epoch": 1345} {"train_loss": -5.895031929016113, "global_step": 56496, "epoch": 1345} {"train_loss": -5.7601847648620605, "global_step": 56497, "epoch": 1345} {"train_loss": -5.8657379150390625, "global_step": 56498, "epoch": 1345} {"train_loss": -5.796651840209961, "global_step": 56499, "epoch": 1345} {"train_loss": -5.860694885253906, "global_step": 56500, "epoch": 1345} {"train_loss": -5.882367134094238, "global_step": 56501, "epoch": 1345} {"train_loss": -5.86181116104126, "global_step": 56502, "epoch": 1345} {"train_loss": -6.052082061767578, "global_step": 56503, "epoch": 1345} {"train_loss": -5.9820146560668945, "global_step": 56504, "epoch": 1345} {"train_loss": -5.873452663421631, "global_step": 56505, "epoch": 1345} {"train_loss": -5.904792785644531, "global_step": 56506, "epoch": 1345} {"train_loss": -5.889620780944824, "global_step": 56507, "epoch": 1345} {"train_loss": -5.668198585510254, "global_step": 56508, "epoch": 1345} {"train_loss": -5.888247489929199, "global_step": 56509, "epoch": 1345} {"train_loss": -5.86271858215332, "global_step": 56510, "epoch": 1345} {"train_loss": -5.97921085357666, "global_step": 56511, "epoch": 1345} {"train_loss": -5.911567687988281, "global_step": 56512, "epoch": 1345} {"train_loss": -5.782346725463867, "global_step": 56513, "epoch": 1345} {"train_loss": -5.904046058654785, "global_step": 56514, "epoch": 1345} {"train_loss": -5.730843544006348, "global_step": 56515, "epoch": 1345} {"train_loss": -5.784553050994873, "global_step": 56516, "epoch": 1345} {"train_loss": -5.812739372253418, "global_step": 56517, "epoch": 1345} {"train_loss": -5.947688102722168, "global_step": 56518, "epoch": 1345} {"train_loss": -5.821250915527344, "global_step": 56519, "epoch": 1345} {"train_loss": -5.812017440795898, "global_step": 56520, "epoch": 1345} {"train_loss": -5.864075660705566, "global_step": 56521, "epoch": 1345} {"train_loss": -5.8153533935546875, "global_step": 56522, "epoch": 1345} {"train_loss": -5.904020309448242, "global_step": 56523, "epoch": 1345} {"train_loss": -5.789034843444824, "global_step": 56524, "epoch": 1345} {"train_loss": -5.790220737457275, "global_step": 56525, "epoch": 1345} {"train_loss": -5.825037479400635, "global_step": 56526, "epoch": 1345} {"train_loss": -5.8468780517578125, "global_step": 56527, "epoch": 1345} {"train_loss": -5.787235260009766, "global_step": 56528, "epoch": 1345} {"train_loss": -5.797513484954834, "global_step": 56529, "epoch": 1345} {"train_loss": -5.856985092163086, "global_step": 56530, "epoch": 1345} {"train_loss": -5.854996999104817, "global_step": 56531, "epoch": 1345, "val_loss": 66446.7890625} {"train_loss": -5.921370029449463, "global_step": 56532, "epoch": 1346} {"train_loss": -5.871899127960205, "global_step": 56533, "epoch": 1346} {"train_loss": -5.875212669372559, "global_step": 56534, "epoch": 1346} {"train_loss": -5.805988788604736, "global_step": 56535, "epoch": 1346} {"train_loss": -5.929976940155029, "global_step": 56536, "epoch": 1346} {"train_loss": -5.87330436706543, "global_step": 56537, "epoch": 1346} {"train_loss": -5.676882743835449, "global_step": 56538, "epoch": 1346} {"train_loss": -5.889455795288086, "global_step": 56539, "epoch": 1346} {"train_loss": -5.725985527038574, "global_step": 56540, "epoch": 1346} {"train_loss": -5.771486759185791, "global_step": 56541, "epoch": 1346} {"train_loss": -5.840039253234863, "global_step": 56542, "epoch": 1346} {"train_loss": -5.8365583419799805, "global_step": 56543, "epoch": 1346} {"train_loss": -5.8073530197143555, "global_step": 56544, "epoch": 1346} {"train_loss": -5.906251907348633, "global_step": 56545, "epoch": 1346} {"train_loss": -5.8839311599731445, "global_step": 56546, "epoch": 1346} {"train_loss": -5.91106653213501, "global_step": 56547, "epoch": 1346} {"train_loss": -5.772899150848389, "global_step": 56548, "epoch": 1346} {"train_loss": -5.967823028564453, "global_step": 56549, "epoch": 1346} {"train_loss": -5.919793128967285, "global_step": 56550, "epoch": 1346} {"train_loss": -5.8176679611206055, "global_step": 56551, "epoch": 1346} {"train_loss": -5.859284400939941, "global_step": 56552, "epoch": 1346} {"train_loss": -5.77882194519043, "global_step": 56553, "epoch": 1346} {"train_loss": -5.696259021759033, "global_step": 56554, "epoch": 1346} {"train_loss": -5.890820503234863, "global_step": 56555, "epoch": 1346} {"train_loss": -5.837634086608887, "global_step": 56556, "epoch": 1346} {"train_loss": -5.930248260498047, "global_step": 56557, "epoch": 1346} {"train_loss": -5.770464897155762, "global_step": 56558, "epoch": 1346} {"train_loss": -5.742881774902344, "global_step": 56559, "epoch": 1346} {"train_loss": -5.841397285461426, "global_step": 56560, "epoch": 1346} {"train_loss": -5.725638389587402, "global_step": 56561, "epoch": 1346} {"train_loss": -5.96935510635376, "global_step": 56562, "epoch": 1346} {"train_loss": -5.726252555847168, "global_step": 56563, "epoch": 1346} {"train_loss": -5.798773765563965, "global_step": 56564, "epoch": 1346} {"train_loss": -5.750244617462158, "global_step": 56565, "epoch": 1346} {"train_loss": -5.811741828918457, "global_step": 56566, "epoch": 1346} {"train_loss": -5.74843692779541, "global_step": 56567, "epoch": 1346} {"train_loss": -5.779559135437012, "global_step": 56568, "epoch": 1346} {"train_loss": -5.843564510345459, "global_step": 56569, "epoch": 1346} {"train_loss": -5.660741806030273, "global_step": 56570, "epoch": 1346} {"train_loss": -5.842567443847656, "global_step": 56571, "epoch": 1346} {"train_loss": -5.739523410797119, "global_step": 56572, "epoch": 1346} {"train_loss": -5.818450223831904, "global_step": 56573, "epoch": 1346, "val_loss": 66634.0546875} {"train_loss": -5.994483947753906, "global_step": 56574, "epoch": 1347} {"train_loss": -5.625321388244629, "global_step": 56575, "epoch": 1347} {"train_loss": -5.845675468444824, "global_step": 56576, "epoch": 1347} {"train_loss": -5.695326805114746, "global_step": 56577, "epoch": 1347} {"train_loss": -5.873560428619385, "global_step": 56578, "epoch": 1347} {"train_loss": -5.789054870605469, "global_step": 56579, "epoch": 1347} {"train_loss": -5.666423797607422, "global_step": 56580, "epoch": 1347} {"train_loss": -5.837583541870117, "global_step": 56581, "epoch": 1347} {"train_loss": -5.855904579162598, "global_step": 56582, "epoch": 1347} {"train_loss": -5.835513114929199, "global_step": 56583, "epoch": 1347} {"train_loss": -5.827140808105469, "global_step": 56584, "epoch": 1347} {"train_loss": -5.904861927032471, "global_step": 56585, "epoch": 1347} {"train_loss": -5.917093276977539, "global_step": 56586, "epoch": 1347} {"train_loss": -5.785024642944336, "global_step": 56587, "epoch": 1347} {"train_loss": -5.831872940063477, "global_step": 56588, "epoch": 1347} {"train_loss": -6.002384662628174, "global_step": 56589, "epoch": 1347} {"train_loss": -5.805082321166992, "global_step": 56590, "epoch": 1347} {"train_loss": -5.878668785095215, "global_step": 56591, "epoch": 1347} {"train_loss": -5.8633551597595215, "global_step": 56592, "epoch": 1347} {"train_loss": -5.918022155761719, "global_step": 56593, "epoch": 1347} {"train_loss": -5.842443943023682, "global_step": 56594, "epoch": 1347} {"train_loss": -5.808797359466553, "global_step": 56595, "epoch": 1347} {"train_loss": -5.854282855987549, "global_step": 56596, "epoch": 1347} {"train_loss": -5.781198501586914, "global_step": 56597, "epoch": 1347} {"train_loss": -5.904054641723633, "global_step": 56598, "epoch": 1347} {"train_loss": -5.768104553222656, "global_step": 56599, "epoch": 1347} {"train_loss": -5.807855129241943, "global_step": 56600, "epoch": 1347} {"train_loss": -5.699602127075195, "global_step": 56601, "epoch": 1347} {"train_loss": -5.901458263397217, "global_step": 56602, "epoch": 1347} {"train_loss": -5.670511245727539, "global_step": 56603, "epoch": 1347} {"train_loss": -5.722738265991211, "global_step": 56604, "epoch": 1347} {"train_loss": -5.912397384643555, "global_step": 56605, "epoch": 1347} {"train_loss": -5.878217697143555, "global_step": 56606, "epoch": 1347} {"train_loss": -5.708714008331299, "global_step": 56607, "epoch": 1347} {"train_loss": -5.882436752319336, "global_step": 56608, "epoch": 1347} {"train_loss": -5.880621910095215, "global_step": 56609, "epoch": 1347} {"train_loss": -5.894243240356445, "global_step": 56610, "epoch": 1347} {"train_loss": -5.955226421356201, "global_step": 56611, "epoch": 1347} {"train_loss": -5.706666946411133, "global_step": 56612, "epoch": 1347} {"train_loss": -5.752959728240967, "global_step": 56613, "epoch": 1347} {"train_loss": -5.807284355163574, "global_step": 56614, "epoch": 1347} {"train_loss": -5.826398349943615, "global_step": 56615, "epoch": 1347, "val_loss": 66604.90625} {"train_loss": -5.940298080444336, "global_step": 56616, "epoch": 1348} {"train_loss": -5.761390209197998, "global_step": 56617, "epoch": 1348} {"train_loss": -5.82510232925415, "global_step": 56618, "epoch": 1348} {"train_loss": -5.910343170166016, "global_step": 56619, "epoch": 1348} {"train_loss": -5.796332359313965, "global_step": 56620, "epoch": 1348} {"train_loss": -5.896110534667969, "global_step": 56621, "epoch": 1348} {"train_loss": -5.9052653312683105, "global_step": 56622, "epoch": 1348} {"train_loss": -5.84104061126709, "global_step": 56623, "epoch": 1348} {"train_loss": -5.8100996017456055, "global_step": 56624, "epoch": 1348} {"train_loss": -5.8960981369018555, "global_step": 56625, "epoch": 1348} {"train_loss": -5.874809741973877, "global_step": 56626, "epoch": 1348} {"train_loss": -5.855551242828369, "global_step": 56627, "epoch": 1348} {"train_loss": -5.732048034667969, "global_step": 56628, "epoch": 1348} {"train_loss": -5.898575305938721, "global_step": 56629, "epoch": 1348} {"train_loss": -5.84402322769165, "global_step": 56630, "epoch": 1348} {"train_loss": -5.805336952209473, "global_step": 56631, "epoch": 1348} {"train_loss": -6.005556583404541, "global_step": 56632, "epoch": 1348} {"train_loss": -5.708243370056152, "global_step": 56633, "epoch": 1348} {"train_loss": -5.918237686157227, "global_step": 56634, "epoch": 1348} {"train_loss": -5.896097183227539, "global_step": 56635, "epoch": 1348} {"train_loss": -5.812167167663574, "global_step": 56636, "epoch": 1348} {"train_loss": -5.894449234008789, "global_step": 56637, "epoch": 1348} {"train_loss": -5.701538562774658, "global_step": 56638, "epoch": 1348} {"train_loss": -5.936281204223633, "global_step": 56639, "epoch": 1348} {"train_loss": -5.820469856262207, "global_step": 56640, "epoch": 1348} {"train_loss": -5.7896037101745605, "global_step": 56641, "epoch": 1348} {"train_loss": -5.791060447692871, "global_step": 56642, "epoch": 1348} {"train_loss": -5.751972675323486, "global_step": 56643, "epoch": 1348} {"train_loss": -5.796819686889648, "global_step": 56644, "epoch": 1348} {"train_loss": -5.874749660491943, "global_step": 56645, "epoch": 1348} {"train_loss": -5.6453399658203125, "global_step": 56646, "epoch": 1348} {"train_loss": -5.789130210876465, "global_step": 56647, "epoch": 1348} {"train_loss": -5.7085747718811035, "global_step": 56648, "epoch": 1348} {"train_loss": -5.805826187133789, "global_step": 56649, "epoch": 1348} {"train_loss": -5.790097713470459, "global_step": 56650, "epoch": 1348} {"train_loss": -5.776636123657227, "global_step": 56651, "epoch": 1348} {"train_loss": -5.880619525909424, "global_step": 56652, "epoch": 1348} {"train_loss": -5.85778284072876, "global_step": 56653, "epoch": 1348} {"train_loss": -5.876194000244141, "global_step": 56654, "epoch": 1348} {"train_loss": -5.831660747528076, "global_step": 56655, "epoch": 1348} {"train_loss": -5.8393707275390625, "global_step": 56656, "epoch": 1348} {"train_loss": -5.832854486647106, "global_step": 56657, "epoch": 1348, "val_loss": 66630.9375} {"train_loss": -5.823973655700684, "global_step": 56658, "epoch": 1349} {"train_loss": -5.8276262283325195, "global_step": 56659, "epoch": 1349} {"train_loss": -5.768104553222656, "global_step": 56660, "epoch": 1349} {"train_loss": -5.802148818969727, "global_step": 56661, "epoch": 1349} {"train_loss": -6.090475082397461, "global_step": 56662, "epoch": 1349} {"train_loss": -5.904460430145264, "global_step": 56663, "epoch": 1349} {"train_loss": -5.826024055480957, "global_step": 56664, "epoch": 1349} {"train_loss": -5.973810195922852, "global_step": 56665, "epoch": 1349} {"train_loss": -5.904049873352051, "global_step": 56666, "epoch": 1349} {"train_loss": -5.769262790679932, "global_step": 56667, "epoch": 1349} {"train_loss": -5.813152313232422, "global_step": 56668, "epoch": 1349} {"train_loss": -5.741424560546875, "global_step": 56669, "epoch": 1349} {"train_loss": -5.805782318115234, "global_step": 56670, "epoch": 1349} {"train_loss": -5.865196228027344, "global_step": 56671, "epoch": 1349} {"train_loss": -5.827157974243164, "global_step": 56672, "epoch": 1349} {"train_loss": -5.859113693237305, "global_step": 56673, "epoch": 1349} {"train_loss": -5.944417953491211, "global_step": 56674, "epoch": 1349} {"train_loss": -5.903253078460693, "global_step": 56675, "epoch": 1349} {"train_loss": -5.8169708251953125, "global_step": 56676, "epoch": 1349} {"train_loss": -5.87788200378418, "global_step": 56677, "epoch": 1349} {"train_loss": -5.805510520935059, "global_step": 56678, "epoch": 1349} {"train_loss": -5.88180685043335, "global_step": 56679, "epoch": 1349} {"train_loss": -5.931122779846191, "global_step": 56680, "epoch": 1349} {"train_loss": -5.940796852111816, "global_step": 56681, "epoch": 1349} {"train_loss": -5.812568664550781, "global_step": 56682, "epoch": 1349} {"train_loss": -5.817383766174316, "global_step": 56683, "epoch": 1349} {"train_loss": -5.9249420166015625, "global_step": 56684, "epoch": 1349} {"train_loss": -5.808785438537598, "global_step": 56685, "epoch": 1349} {"train_loss": -5.934792518615723, "global_step": 56686, "epoch": 1349} {"train_loss": -5.860865592956543, "global_step": 56687, "epoch": 1349} {"train_loss": -5.779934406280518, "global_step": 56688, "epoch": 1349} {"train_loss": -5.730643272399902, "global_step": 56689, "epoch": 1349} {"train_loss": -5.817727088928223, "global_step": 56690, "epoch": 1349} {"train_loss": -5.940674781799316, "global_step": 56691, "epoch": 1349} {"train_loss": -5.881988525390625, "global_step": 56692, "epoch": 1349} {"train_loss": -5.837896823883057, "global_step": 56693, "epoch": 1349} {"train_loss": -5.9115705490112305, "global_step": 56694, "epoch": 1349} {"train_loss": -5.8486738204956055, "global_step": 56695, "epoch": 1349} {"train_loss": -5.841454982757568, "global_step": 56696, "epoch": 1349} {"train_loss": -5.732431411743164, "global_step": 56697, "epoch": 1349} {"train_loss": -5.753536701202393, "global_step": 56698, "epoch": 1349} {"train_loss": -5.850066673187983, "global_step": 56699, "epoch": 1349, "val_loss": 66267.515625} {"train_loss": -5.674671173095703, "global_step": 56700, "epoch": 1350} {"train_loss": -5.951779365539551, "global_step": 56701, "epoch": 1350} {"train_loss": -5.734130859375, "global_step": 56702, "epoch": 1350} {"train_loss": -5.876070976257324, "global_step": 56703, "epoch": 1350} {"train_loss": -5.955545425415039, "global_step": 56704, "epoch": 1350} {"train_loss": -5.882235527038574, "global_step": 56705, "epoch": 1350} {"train_loss": -5.848818778991699, "global_step": 56706, "epoch": 1350} {"train_loss": -5.887723922729492, "global_step": 56707, "epoch": 1350} {"train_loss": -5.884896755218506, "global_step": 56708, "epoch": 1350} {"train_loss": -5.861095428466797, "global_step": 56709, "epoch": 1350} {"train_loss": -5.818187713623047, "global_step": 56710, "epoch": 1350} {"train_loss": -5.721188545227051, "global_step": 56711, "epoch": 1350} {"train_loss": -5.816749572753906, "global_step": 56712, "epoch": 1350} {"train_loss": -5.815075874328613, "global_step": 56713, "epoch": 1350} {"train_loss": -5.805218696594238, "global_step": 56714, "epoch": 1350} {"train_loss": -5.840680122375488, "global_step": 56715, "epoch": 1350} {"train_loss": -5.73342227935791, "global_step": 56716, "epoch": 1350} {"train_loss": -5.853553295135498, "global_step": 56717, "epoch": 1350} {"train_loss": -5.946712970733643, "global_step": 56718, "epoch": 1350} {"train_loss": -5.849191665649414, "global_step": 56719, "epoch": 1350} {"train_loss": -5.880311965942383, "global_step": 56720, "epoch": 1350} {"train_loss": -5.803550720214844, "global_step": 56721, "epoch": 1350} {"train_loss": -5.844956874847412, "global_step": 56722, "epoch": 1350} {"train_loss": -5.7827043533325195, "global_step": 56723, "epoch": 1350} {"train_loss": -5.967109680175781, "global_step": 56724, "epoch": 1350} {"train_loss": -5.934276103973389, "global_step": 56725, "epoch": 1350} {"train_loss": -5.716490268707275, "global_step": 56726, "epoch": 1350} {"train_loss": -5.709259033203125, "global_step": 56727, "epoch": 1350} {"train_loss": -5.730889320373535, "global_step": 56728, "epoch": 1350} {"train_loss": -5.9116034507751465, "global_step": 56729, "epoch": 1350} {"train_loss": -5.850800514221191, "global_step": 56730, "epoch": 1350} {"train_loss": -5.894882678985596, "global_step": 56731, "epoch": 1350} {"train_loss": -5.887115478515625, "global_step": 56732, "epoch": 1350} {"train_loss": -5.8838419914245605, "global_step": 56733, "epoch": 1350} {"train_loss": -5.724231719970703, "global_step": 56734, "epoch": 1350} {"train_loss": -5.823645114898682, "global_step": 56735, "epoch": 1350} {"train_loss": -5.869704246520996, "global_step": 56736, "epoch": 1350} {"train_loss": -5.835836410522461, "global_step": 56737, "epoch": 1350} {"train_loss": -5.90544319152832, "global_step": 56738, "epoch": 1350} {"train_loss": -5.961258888244629, "global_step": 56739, "epoch": 1350} {"train_loss": -5.788641452789307, "global_step": 56740, "epoch": 1350} {"train_loss": -5.840959367297945, "global_step": 56741, "epoch": 1350, "train/sim_max_reward_0": 0.22104266428416725, "train/sim_max_reward_1": 0.8065233090978463, "train/sim_max_reward_2": 0.5860678109356174, "train/sim_max_reward_3": 0.14408754988885933, "train/sim_max_reward_4": 0.34613088042838264, "train/sim_max_reward_5": 0.841619324666669, "test/sim_max_reward_4400000": 0.32445014333528105, "test/sim_max_reward_4400001": 0.9094600377682527, "test/sim_max_reward_4400002": 0.7378882901567657, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.2943772453607116, "test/sim_max_reward_4400006": 0.8658452603693053, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3701756913193621, "test/sim_max_reward_4400009": 0.9161674339954088, "test/sim_max_reward_4400010": 0.3356961166185902, "test/sim_max_reward_4400011": 0.200772145530776, "test/sim_max_reward_4400012": 0.7153373272220757, "test/sim_max_reward_4400013": 0.36794444157508477, "test/sim_max_reward_4400014": 0.7715140166096136, "test/sim_max_reward_4400015": 0.3444555716513313, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3590296930289268, "test/sim_max_reward_4400019": 0.10402249807822113, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.23112504238009146, "test/sim_max_reward_4400023": 0.5814021657275754, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.18056462892016828, "test/sim_max_reward_4400026": 0.48639869600534924, "test/sim_max_reward_4400027": 0.044754881159478975, "test/sim_max_reward_4400028": 0.5730893748754844, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.8286987241322296, "test/sim_max_reward_4400031": 0.41871567692698003, "test/sim_max_reward_4400032": 0.3659730905954058, "test/sim_max_reward_4400033": 0.9033863315115325, "test/sim_max_reward_4400034": 0.3564740579730529, "test/sim_max_reward_4400035": 0.5083664635027321, "test/sim_max_reward_4400036": 0.3829253221334226, "test/sim_max_reward_4400037": 0.499524340088257, "test/sim_max_reward_4400038": 0.8662552548396647, "test/sim_max_reward_4400039": 0.7386504331651378, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9321051080500683, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0188487376500975, "test/sim_max_reward_4400044": 0.755566232023288, "test/sim_max_reward_4400045": 0.7673608232537119, "test/sim_max_reward_4400046": 0.25720081878166123, "test/sim_max_reward_4400047": 0.703373629984839, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.5782399755554025, "train/mean_score": 0.4909119232169236, "test/mean_score": 0.403357652493144, "val_loss": 66530.8515625} {"train_loss": -5.862103462219238, "global_step": 56742, "epoch": 1351} {"train_loss": -5.894870281219482, "global_step": 56743, "epoch": 1351} {"train_loss": -5.912158012390137, "global_step": 56744, "epoch": 1351} {"train_loss": -5.8315839767456055, "global_step": 56745, "epoch": 1351} {"train_loss": -5.946674823760986, "global_step": 56746, "epoch": 1351} {"train_loss": -5.788816452026367, "global_step": 56747, "epoch": 1351} {"train_loss": -5.819352149963379, "global_step": 56748, "epoch": 1351} {"train_loss": -5.788947582244873, "global_step": 56749, "epoch": 1351} {"train_loss": -5.918327808380127, "global_step": 56750, "epoch": 1351} {"train_loss": -5.743055820465088, "global_step": 56751, "epoch": 1351} {"train_loss": -5.880321025848389, "global_step": 56752, "epoch": 1351} {"train_loss": -5.817340850830078, "global_step": 56753, "epoch": 1351} {"train_loss": -5.7720465660095215, "global_step": 56754, "epoch": 1351} {"train_loss": -5.891021728515625, "global_step": 56755, "epoch": 1351} {"train_loss": -5.921176910400391, "global_step": 56756, "epoch": 1351} {"train_loss": -5.832022190093994, "global_step": 56757, "epoch": 1351} {"train_loss": -5.858129978179932, "global_step": 56758, "epoch": 1351} {"train_loss": -5.832797527313232, "global_step": 56759, "epoch": 1351} {"train_loss": -5.834105968475342, "global_step": 56760, "epoch": 1351} {"train_loss": -5.855033874511719, "global_step": 56761, "epoch": 1351} {"train_loss": -5.957979202270508, "global_step": 56762, "epoch": 1351} {"train_loss": -5.851718902587891, "global_step": 56763, "epoch": 1351} {"train_loss": -5.87510871887207, "global_step": 56764, "epoch": 1351} {"train_loss": -5.801580429077148, "global_step": 56765, "epoch": 1351} {"train_loss": -5.907645225524902, "global_step": 56766, "epoch": 1351} {"train_loss": -5.9474382400512695, "global_step": 56767, "epoch": 1351} {"train_loss": -5.821249008178711, "global_step": 56768, "epoch": 1351} {"train_loss": -5.784252166748047, "global_step": 56769, "epoch": 1351} {"train_loss": -5.791079998016357, "global_step": 56770, "epoch": 1351} {"train_loss": -5.804509162902832, "global_step": 56771, "epoch": 1351} {"train_loss": -5.823657035827637, "global_step": 56772, "epoch": 1351} {"train_loss": -5.763702869415283, "global_step": 56773, "epoch": 1351} {"train_loss": -5.859474182128906, "global_step": 56774, "epoch": 1351} {"train_loss": -5.870680332183838, "global_step": 56775, "epoch": 1351} {"train_loss": -5.835494518280029, "global_step": 56776, "epoch": 1351} {"train_loss": -5.884152412414551, "global_step": 56777, "epoch": 1351} {"train_loss": -5.921614646911621, "global_step": 56778, "epoch": 1351} {"train_loss": -5.769098281860352, "global_step": 56779, "epoch": 1351} {"train_loss": -5.9417524337768555, "global_step": 56780, "epoch": 1351} {"train_loss": -5.921433448791504, "global_step": 56781, "epoch": 1351} {"train_loss": -5.955175399780273, "global_step": 56782, "epoch": 1351} {"train_loss": -5.855166503361294, "global_step": 56783, "epoch": 1351, "val_loss": 66424.578125} {"train_loss": -5.912610054016113, "global_step": 56784, "epoch": 1352} {"train_loss": -5.915470600128174, "global_step": 56785, "epoch": 1352} {"train_loss": -6.0044355392456055, "global_step": 56786, "epoch": 1352} {"train_loss": -5.8787312507629395, "global_step": 56787, "epoch": 1352} {"train_loss": -5.77736759185791, "global_step": 56788, "epoch": 1352} {"train_loss": -5.914613723754883, "global_step": 56789, "epoch": 1352} {"train_loss": -5.823437690734863, "global_step": 56790, "epoch": 1352} {"train_loss": -5.955511569976807, "global_step": 56791, "epoch": 1352} {"train_loss": -5.8455328941345215, "global_step": 56792, "epoch": 1352} {"train_loss": -5.9238481521606445, "global_step": 56793, "epoch": 1352} {"train_loss": -5.93830680847168, "global_step": 56794, "epoch": 1352} {"train_loss": -5.701164245605469, "global_step": 56795, "epoch": 1352} {"train_loss": -5.97477388381958, "global_step": 56796, "epoch": 1352} {"train_loss": -5.861632823944092, "global_step": 56797, "epoch": 1352} {"train_loss": -5.775016784667969, "global_step": 56798, "epoch": 1352} {"train_loss": -5.88327693939209, "global_step": 56799, "epoch": 1352} {"train_loss": -5.8737616539001465, "global_step": 56800, "epoch": 1352} {"train_loss": -5.896812438964844, "global_step": 56801, "epoch": 1352} {"train_loss": -5.714938163757324, "global_step": 56802, "epoch": 1352} {"train_loss": -5.899374961853027, "global_step": 56803, "epoch": 1352} {"train_loss": -5.921566486358643, "global_step": 56804, "epoch": 1352} {"train_loss": -5.822834014892578, "global_step": 56805, "epoch": 1352} {"train_loss": -5.82432746887207, "global_step": 56806, "epoch": 1352} {"train_loss": -5.853944778442383, "global_step": 56807, "epoch": 1352} {"train_loss": -5.89394474029541, "global_step": 56808, "epoch": 1352} {"train_loss": -5.719746112823486, "global_step": 56809, "epoch": 1352} {"train_loss": -5.957551956176758, "global_step": 56810, "epoch": 1352} {"train_loss": -5.800210952758789, "global_step": 56811, "epoch": 1352} {"train_loss": -5.890450477600098, "global_step": 56812, "epoch": 1352} {"train_loss": -5.878337860107422, "global_step": 56813, "epoch": 1352} {"train_loss": -5.870075225830078, "global_step": 56814, "epoch": 1352} {"train_loss": -5.753437042236328, "global_step": 56815, "epoch": 1352} {"train_loss": -5.8653364181518555, "global_step": 56816, "epoch": 1352} {"train_loss": -5.895111083984375, "global_step": 56817, "epoch": 1352} {"train_loss": -5.896392822265625, "global_step": 56818, "epoch": 1352} {"train_loss": -6.03667688369751, "global_step": 56819, "epoch": 1352} {"train_loss": -5.87722635269165, "global_step": 56820, "epoch": 1352} {"train_loss": -5.8226213455200195, "global_step": 56821, "epoch": 1352} {"train_loss": -5.795370101928711, "global_step": 56822, "epoch": 1352} {"train_loss": -5.872814178466797, "global_step": 56823, "epoch": 1352} {"train_loss": -5.8048481941223145, "global_step": 56824, "epoch": 1352} {"train_loss": -5.862844603402274, "global_step": 56825, "epoch": 1352, "val_loss": 66769.8046875} {"train_loss": -5.844830513000488, "global_step": 56826, "epoch": 1353} {"train_loss": -5.9246063232421875, "global_step": 56827, "epoch": 1353} {"train_loss": -5.943510055541992, "global_step": 56828, "epoch": 1353} {"train_loss": -5.8573079109191895, "global_step": 56829, "epoch": 1353} {"train_loss": -5.877223968505859, "global_step": 56830, "epoch": 1353} {"train_loss": -5.9185943603515625, "global_step": 56831, "epoch": 1353} {"train_loss": -5.865383148193359, "global_step": 56832, "epoch": 1353} {"train_loss": -5.949470520019531, "global_step": 56833, "epoch": 1353} {"train_loss": -5.746975898742676, "global_step": 56834, "epoch": 1353} {"train_loss": -5.938449859619141, "global_step": 56835, "epoch": 1353} {"train_loss": -5.842061996459961, "global_step": 56836, "epoch": 1353} {"train_loss": -5.853854656219482, "global_step": 56837, "epoch": 1353} {"train_loss": -5.846553802490234, "global_step": 56838, "epoch": 1353} {"train_loss": -5.8224029541015625, "global_step": 56839, "epoch": 1353} {"train_loss": -5.948467254638672, "global_step": 56840, "epoch": 1353} {"train_loss": -5.861204147338867, "global_step": 56841, "epoch": 1353} {"train_loss": -5.838624954223633, "global_step": 56842, "epoch": 1353} {"train_loss": -5.9551544189453125, "global_step": 56843, "epoch": 1353} {"train_loss": -5.759374618530273, "global_step": 56844, "epoch": 1353} {"train_loss": -5.787814617156982, "global_step": 56845, "epoch": 1353} {"train_loss": -5.844611167907715, "global_step": 56846, "epoch": 1353} {"train_loss": -5.849485397338867, "global_step": 56847, "epoch": 1353} {"train_loss": -5.869065761566162, "global_step": 56848, "epoch": 1353} {"train_loss": -5.93861198425293, "global_step": 56849, "epoch": 1353} {"train_loss": -5.911068439483643, "global_step": 56850, "epoch": 1353} {"train_loss": -5.907198905944824, "global_step": 56851, "epoch": 1353} {"train_loss": -5.697980880737305, "global_step": 56852, "epoch": 1353} {"train_loss": -5.867015838623047, "global_step": 56853, "epoch": 1353} {"train_loss": -5.915274620056152, "global_step": 56854, "epoch": 1353} {"train_loss": -5.968997955322266, "global_step": 56855, "epoch": 1353} {"train_loss": -5.884672164916992, "global_step": 56856, "epoch": 1353} {"train_loss": -5.775125503540039, "global_step": 56857, "epoch": 1353} {"train_loss": -5.87635612487793, "global_step": 56858, "epoch": 1353} {"train_loss": -5.7627716064453125, "global_step": 56859, "epoch": 1353} {"train_loss": -5.861357688903809, "global_step": 56860, "epoch": 1353} {"train_loss": -5.8842453956604, "global_step": 56861, "epoch": 1353} {"train_loss": -5.846417427062988, "global_step": 56862, "epoch": 1353} {"train_loss": -5.816286563873291, "global_step": 56863, "epoch": 1353} {"train_loss": -5.878725528717041, "global_step": 56864, "epoch": 1353} {"train_loss": -5.884966850280762, "global_step": 56865, "epoch": 1353} {"train_loss": -5.816144943237305, "global_step": 56866, "epoch": 1353} {"train_loss": -5.863671859105428, "global_step": 56867, "epoch": 1353, "val_loss": 66444.0859375} {"train_loss": -5.846718788146973, "global_step": 56868, "epoch": 1354} {"train_loss": -5.855772495269775, "global_step": 56869, "epoch": 1354} {"train_loss": -5.904626846313477, "global_step": 56870, "epoch": 1354} {"train_loss": -5.774599552154541, "global_step": 56871, "epoch": 1354} {"train_loss": -5.814281463623047, "global_step": 56872, "epoch": 1354} {"train_loss": -5.90660285949707, "global_step": 56873, "epoch": 1354} {"train_loss": -5.863986492156982, "global_step": 56874, "epoch": 1354} {"train_loss": -5.808281898498535, "global_step": 56875, "epoch": 1354} {"train_loss": -5.730405807495117, "global_step": 56876, "epoch": 1354} {"train_loss": -5.848837852478027, "global_step": 56877, "epoch": 1354} {"train_loss": -5.846050262451172, "global_step": 56878, "epoch": 1354} {"train_loss": -5.891047477722168, "global_step": 56879, "epoch": 1354} {"train_loss": -5.819350719451904, "global_step": 56880, "epoch": 1354} {"train_loss": -5.70944356918335, "global_step": 56881, "epoch": 1354} {"train_loss": -5.862546920776367, "global_step": 56882, "epoch": 1354} {"train_loss": -5.861477851867676, "global_step": 56883, "epoch": 1354} {"train_loss": -5.733386039733887, "global_step": 56884, "epoch": 1354} {"train_loss": -5.825686454772949, "global_step": 56885, "epoch": 1354} {"train_loss": -5.784746170043945, "global_step": 56886, "epoch": 1354} {"train_loss": -5.865727424621582, "global_step": 56887, "epoch": 1354} {"train_loss": -5.718084812164307, "global_step": 56888, "epoch": 1354} {"train_loss": -5.78569221496582, "global_step": 56889, "epoch": 1354} {"train_loss": -5.926507949829102, "global_step": 56890, "epoch": 1354} {"train_loss": -5.8559675216674805, "global_step": 56891, "epoch": 1354} {"train_loss": -5.915245056152344, "global_step": 56892, "epoch": 1354} {"train_loss": -5.932141304016113, "global_step": 56893, "epoch": 1354} {"train_loss": -5.7885284423828125, "global_step": 56894, "epoch": 1354} {"train_loss": -5.996017932891846, "global_step": 56895, "epoch": 1354} {"train_loss": -5.753540992736816, "global_step": 56896, "epoch": 1354} {"train_loss": -5.849522113800049, "global_step": 56897, "epoch": 1354} {"train_loss": -5.883342742919922, "global_step": 56898, "epoch": 1354} {"train_loss": -5.817290782928467, "global_step": 56899, "epoch": 1354} {"train_loss": -5.904272079467773, "global_step": 56900, "epoch": 1354} {"train_loss": -5.810981750488281, "global_step": 56901, "epoch": 1354} {"train_loss": -5.826384544372559, "global_step": 56902, "epoch": 1354} {"train_loss": -5.790444374084473, "global_step": 56903, "epoch": 1354} {"train_loss": -5.861974716186523, "global_step": 56904, "epoch": 1354} {"train_loss": -5.789480686187744, "global_step": 56905, "epoch": 1354} {"train_loss": -5.848653793334961, "global_step": 56906, "epoch": 1354} {"train_loss": -5.795681953430176, "global_step": 56907, "epoch": 1354} {"train_loss": -5.763321399688721, "global_step": 56908, "epoch": 1354} {"train_loss": -5.833734217144194, "global_step": 56909, "epoch": 1354, "val_loss": 67053.59375} {"train_loss": -5.7665863037109375, "global_step": 56910, "epoch": 1355} {"train_loss": -5.7628865242004395, "global_step": 56911, "epoch": 1355} {"train_loss": -5.869050979614258, "global_step": 56912, "epoch": 1355} {"train_loss": -5.884929180145264, "global_step": 56913, "epoch": 1355} {"train_loss": -5.903324604034424, "global_step": 56914, "epoch": 1355} {"train_loss": -5.860061168670654, "global_step": 56915, "epoch": 1355} {"train_loss": -5.845886707305908, "global_step": 56916, "epoch": 1355} {"train_loss": -5.8250732421875, "global_step": 56917, "epoch": 1355} {"train_loss": -5.912532806396484, "global_step": 56918, "epoch": 1355} {"train_loss": -5.951722621917725, "global_step": 56919, "epoch": 1355} {"train_loss": -5.795976161956787, "global_step": 56920, "epoch": 1355} {"train_loss": -5.824473857879639, "global_step": 56921, "epoch": 1355} {"train_loss": -5.757291793823242, "global_step": 56922, "epoch": 1355} {"train_loss": -5.8054656982421875, "global_step": 56923, "epoch": 1355} {"train_loss": -5.852818489074707, "global_step": 56924, "epoch": 1355} {"train_loss": -5.816217422485352, "global_step": 56925, "epoch": 1355} {"train_loss": -5.851675987243652, "global_step": 56926, "epoch": 1355} {"train_loss": -5.784052848815918, "global_step": 56927, "epoch": 1355} {"train_loss": -5.829124450683594, "global_step": 56928, "epoch": 1355} {"train_loss": -5.898007392883301, "global_step": 56929, "epoch": 1355} {"train_loss": -5.849260330200195, "global_step": 56930, "epoch": 1355} {"train_loss": -5.741695404052734, "global_step": 56931, "epoch": 1355} {"train_loss": -5.874085903167725, "global_step": 56932, "epoch": 1355} {"train_loss": -5.736003875732422, "global_step": 56933, "epoch": 1355} {"train_loss": -5.8530497550964355, "global_step": 56934, "epoch": 1355} {"train_loss": -5.81419563293457, "global_step": 56935, "epoch": 1355} {"train_loss": -5.865240573883057, "global_step": 56936, "epoch": 1355} {"train_loss": -5.861074447631836, "global_step": 56937, "epoch": 1355} {"train_loss": -5.83299446105957, "global_step": 56938, "epoch": 1355} {"train_loss": -5.842489242553711, "global_step": 56939, "epoch": 1355} {"train_loss": -5.8673601150512695, "global_step": 56940, "epoch": 1355} {"train_loss": -5.863250255584717, "global_step": 56941, "epoch": 1355} {"train_loss": -5.859038352966309, "global_step": 56942, "epoch": 1355} {"train_loss": -5.9401960372924805, "global_step": 56943, "epoch": 1355} {"train_loss": -5.863940238952637, "global_step": 56944, "epoch": 1355} {"train_loss": -5.89967679977417, "global_step": 56945, "epoch": 1355} {"train_loss": -5.883090496063232, "global_step": 56946, "epoch": 1355} {"train_loss": -5.746612071990967, "global_step": 56947, "epoch": 1355} {"train_loss": -5.836922645568848, "global_step": 56948, "epoch": 1355} {"train_loss": -5.729146957397461, "global_step": 56949, "epoch": 1355} {"train_loss": -5.903948783874512, "global_step": 56950, "epoch": 1355} {"train_loss": -5.841280380884807, "global_step": 56951, "epoch": 1355, "val_loss": 66534.1328125} {"train_loss": -5.848145484924316, "global_step": 56952, "epoch": 1356} {"train_loss": -5.81633186340332, "global_step": 56953, "epoch": 1356} {"train_loss": -5.789103031158447, "global_step": 56954, "epoch": 1356} {"train_loss": -5.861943244934082, "global_step": 56955, "epoch": 1356} {"train_loss": -5.755680084228516, "global_step": 56956, "epoch": 1356} {"train_loss": -5.8498430252075195, "global_step": 56957, "epoch": 1356} {"train_loss": -5.897067070007324, "global_step": 56958, "epoch": 1356} {"train_loss": -5.779270172119141, "global_step": 56959, "epoch": 1356} {"train_loss": -5.887354850769043, "global_step": 56960, "epoch": 1356} {"train_loss": -5.799008846282959, "global_step": 56961, "epoch": 1356} {"train_loss": -5.908764839172363, "global_step": 56962, "epoch": 1356} {"train_loss": -5.843216896057129, "global_step": 56963, "epoch": 1356} {"train_loss": -5.793824195861816, "global_step": 56964, "epoch": 1356} {"train_loss": -5.922197341918945, "global_step": 56965, "epoch": 1356} {"train_loss": -5.7969889640808105, "global_step": 56966, "epoch": 1356} {"train_loss": -5.8872833251953125, "global_step": 56967, "epoch": 1356} {"train_loss": -5.8461079597473145, "global_step": 56968, "epoch": 1356} {"train_loss": -5.855922698974609, "global_step": 56969, "epoch": 1356} {"train_loss": -5.782497406005859, "global_step": 56970, "epoch": 1356} {"train_loss": -5.814265251159668, "global_step": 56971, "epoch": 1356} {"train_loss": -5.679444313049316, "global_step": 56972, "epoch": 1356} {"train_loss": -5.880925178527832, "global_step": 56973, "epoch": 1356} {"train_loss": -5.882500171661377, "global_step": 56974, "epoch": 1356} {"train_loss": -5.8439178466796875, "global_step": 56975, "epoch": 1356} {"train_loss": -5.909001350402832, "global_step": 56976, "epoch": 1356} {"train_loss": -5.766776084899902, "global_step": 56977, "epoch": 1356} {"train_loss": -5.79014778137207, "global_step": 56978, "epoch": 1356} {"train_loss": -5.755895614624023, "global_step": 56979, "epoch": 1356} {"train_loss": -5.864774703979492, "global_step": 56980, "epoch": 1356} {"train_loss": -5.989655494689941, "global_step": 56981, "epoch": 1356} {"train_loss": -5.672402858734131, "global_step": 56982, "epoch": 1356} {"train_loss": -5.829060077667236, "global_step": 56983, "epoch": 1356} {"train_loss": -5.814267158508301, "global_step": 56984, "epoch": 1356} {"train_loss": -5.729893684387207, "global_step": 56985, "epoch": 1356} {"train_loss": -5.845293045043945, "global_step": 56986, "epoch": 1356} {"train_loss": -5.823566436767578, "global_step": 56987, "epoch": 1356} {"train_loss": -5.835653781890869, "global_step": 56988, "epoch": 1356} {"train_loss": -5.863445281982422, "global_step": 56989, "epoch": 1356} {"train_loss": -5.901105880737305, "global_step": 56990, "epoch": 1356} {"train_loss": -5.743240833282471, "global_step": 56991, "epoch": 1356} {"train_loss": -5.874920845031738, "global_step": 56992, "epoch": 1356} {"train_loss": -5.829077050799415, "global_step": 56993, "epoch": 1356, "val_loss": 66499.328125} {"train_loss": -5.838273048400879, "global_step": 56994, "epoch": 1357} {"train_loss": -5.929131984710693, "global_step": 56995, "epoch": 1357} {"train_loss": -5.956928730010986, "global_step": 56996, "epoch": 1357} {"train_loss": -5.838932991027832, "global_step": 56997, "epoch": 1357} {"train_loss": -5.934848785400391, "global_step": 56998, "epoch": 1357} {"train_loss": -5.857586860656738, "global_step": 56999, "epoch": 1357} {"train_loss": -5.84355354309082, "global_step": 57000, "epoch": 1357} {"train_loss": -5.887368202209473, "global_step": 57001, "epoch": 1357} {"train_loss": -5.776784896850586, "global_step": 57002, "epoch": 1357} {"train_loss": -5.820089340209961, "global_step": 57003, "epoch": 1357} {"train_loss": -5.783554553985596, "global_step": 57004, "epoch": 1357} {"train_loss": -5.877426624298096, "global_step": 57005, "epoch": 1357} {"train_loss": -5.961082458496094, "global_step": 57006, "epoch": 1357} {"train_loss": -5.873711585998535, "global_step": 57007, "epoch": 1357} {"train_loss": -5.70616340637207, "global_step": 57008, "epoch": 1357} {"train_loss": -6.0222625732421875, "global_step": 57009, "epoch": 1357} {"train_loss": -5.850666046142578, "global_step": 57010, "epoch": 1357} {"train_loss": -5.793773651123047, "global_step": 57011, "epoch": 1357} {"train_loss": -5.84027624130249, "global_step": 57012, "epoch": 1357} {"train_loss": -5.8478803634643555, "global_step": 57013, "epoch": 1357} {"train_loss": -5.889847278594971, "global_step": 57014, "epoch": 1357} {"train_loss": -5.757441520690918, "global_step": 57015, "epoch": 1357} {"train_loss": -5.876747131347656, "global_step": 57016, "epoch": 1357} {"train_loss": -5.748409271240234, "global_step": 57017, "epoch": 1357} {"train_loss": -5.8569769859313965, "global_step": 57018, "epoch": 1357} {"train_loss": -5.824972152709961, "global_step": 57019, "epoch": 1357} {"train_loss": -5.781851291656494, "global_step": 57020, "epoch": 1357} {"train_loss": -5.760532379150391, "global_step": 57021, "epoch": 1357} {"train_loss": -5.817643165588379, "global_step": 57022, "epoch": 1357} {"train_loss": -5.742654800415039, "global_step": 57023, "epoch": 1357} {"train_loss": -5.902416706085205, "global_step": 57024, "epoch": 1357} {"train_loss": -5.901001930236816, "global_step": 57025, "epoch": 1357} {"train_loss": -5.810471057891846, "global_step": 57026, "epoch": 1357} {"train_loss": -5.871747970581055, "global_step": 57027, "epoch": 1357} {"train_loss": -5.835994243621826, "global_step": 57028, "epoch": 1357} {"train_loss": -5.831750869750977, "global_step": 57029, "epoch": 1357} {"train_loss": -5.920231342315674, "global_step": 57030, "epoch": 1357} {"train_loss": -5.834977626800537, "global_step": 57031, "epoch": 1357} {"train_loss": -5.891486167907715, "global_step": 57032, "epoch": 1357} {"train_loss": -5.780816555023193, "global_step": 57033, "epoch": 1357} {"train_loss": -5.877740859985352, "global_step": 57034, "epoch": 1357} {"train_loss": -5.847252471106393, "global_step": 57035, "epoch": 1357, "val_loss": 66521.0234375} {"train_loss": -5.927865028381348, "global_step": 57036, "epoch": 1358} {"train_loss": -5.922980308532715, "global_step": 57037, "epoch": 1358} {"train_loss": -5.781519889831543, "global_step": 57038, "epoch": 1358} {"train_loss": -5.724393844604492, "global_step": 57039, "epoch": 1358} {"train_loss": -5.882795333862305, "global_step": 57040, "epoch": 1358} {"train_loss": -5.809975624084473, "global_step": 57041, "epoch": 1358} {"train_loss": -5.774867534637451, "global_step": 57042, "epoch": 1358} {"train_loss": -5.643428802490234, "global_step": 57043, "epoch": 1358} {"train_loss": -5.849963665008545, "global_step": 57044, "epoch": 1358} {"train_loss": -5.8473286628723145, "global_step": 57045, "epoch": 1358} {"train_loss": -5.885965347290039, "global_step": 57046, "epoch": 1358} {"train_loss": -5.856255531311035, "global_step": 57047, "epoch": 1358} {"train_loss": -5.693336486816406, "global_step": 57048, "epoch": 1358} {"train_loss": -5.819091796875, "global_step": 57049, "epoch": 1358} {"train_loss": -5.7952680587768555, "global_step": 57050, "epoch": 1358} {"train_loss": -5.879364013671875, "global_step": 57051, "epoch": 1358} {"train_loss": -5.889219284057617, "global_step": 57052, "epoch": 1358} {"train_loss": -5.7974138259887695, "global_step": 57053, "epoch": 1358} {"train_loss": -5.85137939453125, "global_step": 57054, "epoch": 1358} {"train_loss": -5.9734296798706055, "global_step": 57055, "epoch": 1358} {"train_loss": -5.841473579406738, "global_step": 57056, "epoch": 1358} {"train_loss": -5.835317134857178, "global_step": 57057, "epoch": 1358} {"train_loss": -5.820704460144043, "global_step": 57058, "epoch": 1358} {"train_loss": -5.895512580871582, "global_step": 57059, "epoch": 1358} {"train_loss": -5.800615310668945, "global_step": 57060, "epoch": 1358} {"train_loss": -5.737200736999512, "global_step": 57061, "epoch": 1358} {"train_loss": -5.840845108032227, "global_step": 57062, "epoch": 1358} {"train_loss": -5.805652618408203, "global_step": 57063, "epoch": 1358} {"train_loss": -5.916723251342773, "global_step": 57064, "epoch": 1358} {"train_loss": -5.919803619384766, "global_step": 57065, "epoch": 1358} {"train_loss": -5.77854061126709, "global_step": 57066, "epoch": 1358} {"train_loss": -5.871098518371582, "global_step": 57067, "epoch": 1358} {"train_loss": -5.747234344482422, "global_step": 57068, "epoch": 1358} {"train_loss": -5.783197402954102, "global_step": 57069, "epoch": 1358} {"train_loss": -5.827560901641846, "global_step": 57070, "epoch": 1358} {"train_loss": -5.937680721282959, "global_step": 57071, "epoch": 1358} {"train_loss": -5.763014793395996, "global_step": 57072, "epoch": 1358} {"train_loss": -5.8212571144104, "global_step": 57073, "epoch": 1358} {"train_loss": -5.827890396118164, "global_step": 57074, "epoch": 1358} {"train_loss": -5.783679485321045, "global_step": 57075, "epoch": 1358} {"train_loss": -5.964343547821045, "global_step": 57076, "epoch": 1358} {"train_loss": -5.8321552730741955, "global_step": 57077, "epoch": 1358, "val_loss": 66642.921875} {"train_loss": -5.823129653930664, "global_step": 57078, "epoch": 1359} {"train_loss": -5.79234504699707, "global_step": 57079, "epoch": 1359} {"train_loss": -5.774685859680176, "global_step": 57080, "epoch": 1359} {"train_loss": -5.909917831420898, "global_step": 57081, "epoch": 1359} {"train_loss": -5.744736671447754, "global_step": 57082, "epoch": 1359} {"train_loss": -5.972668647766113, "global_step": 57083, "epoch": 1359} {"train_loss": -5.843832492828369, "global_step": 57084, "epoch": 1359} {"train_loss": -5.92506217956543, "global_step": 57085, "epoch": 1359} {"train_loss": -5.939449310302734, "global_step": 57086, "epoch": 1359} {"train_loss": -5.880897045135498, "global_step": 57087, "epoch": 1359} {"train_loss": -5.923981666564941, "global_step": 57088, "epoch": 1359} {"train_loss": -5.7233405113220215, "global_step": 57089, "epoch": 1359} {"train_loss": -5.930639743804932, "global_step": 57090, "epoch": 1359} {"train_loss": -5.795320987701416, "global_step": 57091, "epoch": 1359} {"train_loss": -5.836269855499268, "global_step": 57092, "epoch": 1359} {"train_loss": -5.789844036102295, "global_step": 57093, "epoch": 1359} {"train_loss": -5.9104413986206055, "global_step": 57094, "epoch": 1359} {"train_loss": -5.862301349639893, "global_step": 57095, "epoch": 1359} {"train_loss": -5.811212539672852, "global_step": 57096, "epoch": 1359} {"train_loss": -5.932035446166992, "global_step": 57097, "epoch": 1359} {"train_loss": -5.861016273498535, "global_step": 57098, "epoch": 1359} {"train_loss": -5.935580253601074, "global_step": 57099, "epoch": 1359} {"train_loss": -5.863041877746582, "global_step": 57100, "epoch": 1359} {"train_loss": -5.7671732902526855, "global_step": 57101, "epoch": 1359} {"train_loss": -5.883363723754883, "global_step": 57102, "epoch": 1359} {"train_loss": -5.779995918273926, "global_step": 57103, "epoch": 1359} {"train_loss": -5.814308166503906, "global_step": 57104, "epoch": 1359} {"train_loss": -5.804411888122559, "global_step": 57105, "epoch": 1359} {"train_loss": -5.960474014282227, "global_step": 57106, "epoch": 1359} {"train_loss": -5.802934169769287, "global_step": 57107, "epoch": 1359} {"train_loss": -5.998863220214844, "global_step": 57108, "epoch": 1359} {"train_loss": -5.829095363616943, "global_step": 57109, "epoch": 1359} {"train_loss": -5.829184532165527, "global_step": 57110, "epoch": 1359} {"train_loss": -5.746997356414795, "global_step": 57111, "epoch": 1359} {"train_loss": -5.87132453918457, "global_step": 57112, "epoch": 1359} {"train_loss": -5.807358741760254, "global_step": 57113, "epoch": 1359} {"train_loss": -5.711957931518555, "global_step": 57114, "epoch": 1359} {"train_loss": -5.862083911895752, "global_step": 57115, "epoch": 1359} {"train_loss": -5.783489227294922, "global_step": 57116, "epoch": 1359} {"train_loss": -5.766321659088135, "global_step": 57117, "epoch": 1359} {"train_loss": -5.9148149490356445, "global_step": 57118, "epoch": 1359} {"train_loss": -5.845053650083996, "global_step": 57119, "epoch": 1359, "val_loss": 66884.4765625} {"train_loss": -5.789533615112305, "global_step": 57120, "epoch": 1360} {"train_loss": -5.841833114624023, "global_step": 57121, "epoch": 1360} {"train_loss": -5.847765922546387, "global_step": 57122, "epoch": 1360} {"train_loss": -5.847686290740967, "global_step": 57123, "epoch": 1360} {"train_loss": -6.009394645690918, "global_step": 57124, "epoch": 1360} {"train_loss": -5.706528186798096, "global_step": 57125, "epoch": 1360} {"train_loss": -5.808267593383789, "global_step": 57126, "epoch": 1360} {"train_loss": -5.799093246459961, "global_step": 57127, "epoch": 1360} {"train_loss": -5.936546325683594, "global_step": 57128, "epoch": 1360} {"train_loss": -5.841991424560547, "global_step": 57129, "epoch": 1360} {"train_loss": -5.857402801513672, "global_step": 57130, "epoch": 1360} {"train_loss": -5.7481279373168945, "global_step": 57131, "epoch": 1360} {"train_loss": -5.866661071777344, "global_step": 57132, "epoch": 1360} {"train_loss": -5.798937797546387, "global_step": 57133, "epoch": 1360} {"train_loss": -5.771511077880859, "global_step": 57134, "epoch": 1360} {"train_loss": -5.843616962432861, "global_step": 57135, "epoch": 1360} {"train_loss": -5.689955234527588, "global_step": 57136, "epoch": 1360} {"train_loss": -5.9715118408203125, "global_step": 57137, "epoch": 1360} {"train_loss": -5.8889312744140625, "global_step": 57138, "epoch": 1360} {"train_loss": -5.737098693847656, "global_step": 57139, "epoch": 1360} {"train_loss": -5.963813781738281, "global_step": 57140, "epoch": 1360} {"train_loss": -5.81477689743042, "global_step": 57141, "epoch": 1360} {"train_loss": -5.870563507080078, "global_step": 57142, "epoch": 1360} {"train_loss": -5.954482078552246, "global_step": 57143, "epoch": 1360} {"train_loss": -5.743312835693359, "global_step": 57144, "epoch": 1360} {"train_loss": -5.953813552856445, "global_step": 57145, "epoch": 1360} {"train_loss": -5.7584638595581055, "global_step": 57146, "epoch": 1360} {"train_loss": -5.8901777267456055, "global_step": 57147, "epoch": 1360} {"train_loss": -5.789181232452393, "global_step": 57148, "epoch": 1360} {"train_loss": -5.858373641967773, "global_step": 57149, "epoch": 1360} {"train_loss": -5.885765075683594, "global_step": 57150, "epoch": 1360} {"train_loss": -5.8262038230896, "global_step": 57151, "epoch": 1360} {"train_loss": -5.874221324920654, "global_step": 57152, "epoch": 1360} {"train_loss": -5.74652099609375, "global_step": 57153, "epoch": 1360} {"train_loss": -5.843218803405762, "global_step": 57154, "epoch": 1360} {"train_loss": -5.7642951011657715, "global_step": 57155, "epoch": 1360} {"train_loss": -5.713449001312256, "global_step": 57156, "epoch": 1360} {"train_loss": -5.845980167388916, "global_step": 57157, "epoch": 1360} {"train_loss": -5.761837959289551, "global_step": 57158, "epoch": 1360} {"train_loss": -5.847023010253906, "global_step": 57159, "epoch": 1360} {"train_loss": -5.8854451179504395, "global_step": 57160, "epoch": 1360} {"train_loss": -5.8332881813957576, "global_step": 57161, "epoch": 1360, "val_loss": 66298.7578125} {"train_loss": -5.81269645690918, "global_step": 57162, "epoch": 1361} {"train_loss": -5.937741279602051, "global_step": 57163, "epoch": 1361} {"train_loss": -5.909507751464844, "global_step": 57164, "epoch": 1361} {"train_loss": -5.910766124725342, "global_step": 57165, "epoch": 1361} {"train_loss": -5.757070541381836, "global_step": 57166, "epoch": 1361} {"train_loss": -5.898190498352051, "global_step": 57167, "epoch": 1361} {"train_loss": -5.7594499588012695, "global_step": 57168, "epoch": 1361} {"train_loss": -5.8017072677612305, "global_step": 57169, "epoch": 1361} {"train_loss": -5.855875015258789, "global_step": 57170, "epoch": 1361} {"train_loss": -5.925720691680908, "global_step": 57171, "epoch": 1361} {"train_loss": -5.833615779876709, "global_step": 57172, "epoch": 1361} {"train_loss": -5.872093200683594, "global_step": 57173, "epoch": 1361} {"train_loss": -5.650080680847168, "global_step": 57174, "epoch": 1361} {"train_loss": -5.8891282081604, "global_step": 57175, "epoch": 1361} {"train_loss": -5.863317489624023, "global_step": 57176, "epoch": 1361} {"train_loss": -5.959165573120117, "global_step": 57177, "epoch": 1361} {"train_loss": -5.9044084548950195, "global_step": 57178, "epoch": 1361} {"train_loss": -5.884181499481201, "global_step": 57179, "epoch": 1361} {"train_loss": -5.857190132141113, "global_step": 57180, "epoch": 1361} {"train_loss": -5.936798095703125, "global_step": 57181, "epoch": 1361} {"train_loss": -5.877534866333008, "global_step": 57182, "epoch": 1361} {"train_loss": -5.863516807556152, "global_step": 57183, "epoch": 1361} {"train_loss": -5.924020290374756, "global_step": 57184, "epoch": 1361} {"train_loss": -5.873996734619141, "global_step": 57185, "epoch": 1361} {"train_loss": -5.801510334014893, "global_step": 57186, "epoch": 1361} {"train_loss": -5.846661567687988, "global_step": 57187, "epoch": 1361} {"train_loss": -5.8503313064575195, "global_step": 57188, "epoch": 1361} {"train_loss": -5.7537336349487305, "global_step": 57189, "epoch": 1361} {"train_loss": -5.831660747528076, "global_step": 57190, "epoch": 1361} {"train_loss": -5.800214767456055, "global_step": 57191, "epoch": 1361} {"train_loss": -5.872493743896484, "global_step": 57192, "epoch": 1361} {"train_loss": -5.80999755859375, "global_step": 57193, "epoch": 1361} {"train_loss": -5.836328506469727, "global_step": 57194, "epoch": 1361} {"train_loss": -5.913309097290039, "global_step": 57195, "epoch": 1361} {"train_loss": -5.887733459472656, "global_step": 57196, "epoch": 1361} {"train_loss": -5.9278883934021, "global_step": 57197, "epoch": 1361} {"train_loss": -5.9817423820495605, "global_step": 57198, "epoch": 1361} {"train_loss": -5.922171115875244, "global_step": 57199, "epoch": 1361} {"train_loss": -5.723691463470459, "global_step": 57200, "epoch": 1361} {"train_loss": -5.927732467651367, "global_step": 57201, "epoch": 1361} {"train_loss": -5.850601673126221, "global_step": 57202, "epoch": 1361} {"train_loss": -5.859669401532128, "global_step": 57203, "epoch": 1361, "val_loss": 66533.6875} {"train_loss": -5.9064435958862305, "global_step": 57204, "epoch": 1362} {"train_loss": -5.887589931488037, "global_step": 57205, "epoch": 1362} {"train_loss": -5.925229072570801, "global_step": 57206, "epoch": 1362} {"train_loss": -5.8563079833984375, "global_step": 57207, "epoch": 1362} {"train_loss": -5.771313667297363, "global_step": 57208, "epoch": 1362} {"train_loss": -6.004541397094727, "global_step": 57209, "epoch": 1362} {"train_loss": -5.893213272094727, "global_step": 57210, "epoch": 1362} {"train_loss": -5.823720932006836, "global_step": 57211, "epoch": 1362} {"train_loss": -5.84873628616333, "global_step": 57212, "epoch": 1362} {"train_loss": -5.903836250305176, "global_step": 57213, "epoch": 1362} {"train_loss": -5.751248359680176, "global_step": 57214, "epoch": 1362} {"train_loss": -5.8719072341918945, "global_step": 57215, "epoch": 1362} {"train_loss": -5.851207733154297, "global_step": 57216, "epoch": 1362} {"train_loss": -5.868047714233398, "global_step": 57217, "epoch": 1362} {"train_loss": -5.866586208343506, "global_step": 57218, "epoch": 1362} {"train_loss": -5.910799503326416, "global_step": 57219, "epoch": 1362} {"train_loss": -5.922201156616211, "global_step": 57220, "epoch": 1362} {"train_loss": -5.937401294708252, "global_step": 57221, "epoch": 1362} {"train_loss": -5.772617340087891, "global_step": 57222, "epoch": 1362} {"train_loss": -5.785186767578125, "global_step": 57223, "epoch": 1362} {"train_loss": -5.878911972045898, "global_step": 57224, "epoch": 1362} {"train_loss": -5.868938446044922, "global_step": 57225, "epoch": 1362} {"train_loss": -5.832716941833496, "global_step": 57226, "epoch": 1362} {"train_loss": -5.866732597351074, "global_step": 57227, "epoch": 1362} {"train_loss": -5.874494552612305, "global_step": 57228, "epoch": 1362} {"train_loss": -5.8048481941223145, "global_step": 57229, "epoch": 1362} {"train_loss": -5.885515213012695, "global_step": 57230, "epoch": 1362} {"train_loss": -5.733203887939453, "global_step": 57231, "epoch": 1362} {"train_loss": -5.8543548583984375, "global_step": 57232, "epoch": 1362} {"train_loss": -5.99806022644043, "global_step": 57233, "epoch": 1362} {"train_loss": -5.872065544128418, "global_step": 57234, "epoch": 1362} {"train_loss": -5.913121223449707, "global_step": 57235, "epoch": 1362} {"train_loss": -5.820734024047852, "global_step": 57236, "epoch": 1362} {"train_loss": -5.766932487487793, "global_step": 57237, "epoch": 1362} {"train_loss": -5.7500762939453125, "global_step": 57238, "epoch": 1362} {"train_loss": -5.916993618011475, "global_step": 57239, "epoch": 1362} {"train_loss": -5.883419990539551, "global_step": 57240, "epoch": 1362} {"train_loss": -5.883415699005127, "global_step": 57241, "epoch": 1362} {"train_loss": -5.9532856941223145, "global_step": 57242, "epoch": 1362} {"train_loss": -5.792214393615723, "global_step": 57243, "epoch": 1362} {"train_loss": -5.891812324523926, "global_step": 57244, "epoch": 1362} {"train_loss": -5.863103242147536, "global_step": 57245, "epoch": 1362, "val_loss": 66636.4921875} {"train_loss": -5.799351215362549, "global_step": 57246, "epoch": 1363} {"train_loss": -5.875086307525635, "global_step": 57247, "epoch": 1363} {"train_loss": -5.7560930252075195, "global_step": 57248, "epoch": 1363} {"train_loss": -5.8466877937316895, "global_step": 57249, "epoch": 1363} {"train_loss": -5.797918319702148, "global_step": 57250, "epoch": 1363} {"train_loss": -5.979355812072754, "global_step": 57251, "epoch": 1363} {"train_loss": -5.808535575866699, "global_step": 57252, "epoch": 1363} {"train_loss": -5.817674160003662, "global_step": 57253, "epoch": 1363} {"train_loss": -5.691123008728027, "global_step": 57254, "epoch": 1363} {"train_loss": -5.906003952026367, "global_step": 57255, "epoch": 1363} {"train_loss": -5.813504695892334, "global_step": 57256, "epoch": 1363} {"train_loss": -5.740964889526367, "global_step": 57257, "epoch": 1363} {"train_loss": -5.801093578338623, "global_step": 57258, "epoch": 1363} {"train_loss": -5.871417045593262, "global_step": 57259, "epoch": 1363} {"train_loss": -5.76142692565918, "global_step": 57260, "epoch": 1363} {"train_loss": -5.724305152893066, "global_step": 57261, "epoch": 1363} {"train_loss": -5.602051734924316, "global_step": 57262, "epoch": 1363} {"train_loss": -5.805753231048584, "global_step": 57263, "epoch": 1363} {"train_loss": -5.772117614746094, "global_step": 57264, "epoch": 1363} {"train_loss": -5.827747344970703, "global_step": 57265, "epoch": 1363} {"train_loss": -5.862192630767822, "global_step": 57266, "epoch": 1363} {"train_loss": -5.737741470336914, "global_step": 57267, "epoch": 1363} {"train_loss": -5.739741325378418, "global_step": 57268, "epoch": 1363} {"train_loss": -5.854543685913086, "global_step": 57269, "epoch": 1363} {"train_loss": -5.829399108886719, "global_step": 57270, "epoch": 1363} {"train_loss": -5.739482879638672, "global_step": 57271, "epoch": 1363} {"train_loss": -5.891704559326172, "global_step": 57272, "epoch": 1363} {"train_loss": -5.887355804443359, "global_step": 57273, "epoch": 1363} {"train_loss": -5.873958587646484, "global_step": 57274, "epoch": 1363} {"train_loss": -5.815601348876953, "global_step": 57275, "epoch": 1363} {"train_loss": -5.9416069984436035, "global_step": 57276, "epoch": 1363} {"train_loss": -5.898468017578125, "global_step": 57277, "epoch": 1363} {"train_loss": -5.904048442840576, "global_step": 57278, "epoch": 1363} {"train_loss": -5.727776050567627, "global_step": 57279, "epoch": 1363} {"train_loss": -5.8531084060668945, "global_step": 57280, "epoch": 1363} {"train_loss": -5.738712787628174, "global_step": 57281, "epoch": 1363} {"train_loss": -5.761997222900391, "global_step": 57282, "epoch": 1363} {"train_loss": -5.9085798263549805, "global_step": 57283, "epoch": 1363} {"train_loss": -5.858001232147217, "global_step": 57284, "epoch": 1363} {"train_loss": -5.817672252655029, "global_step": 57285, "epoch": 1363} {"train_loss": -5.927101135253906, "global_step": 57286, "epoch": 1363} {"train_loss": -5.819136755807059, "global_step": 57287, "epoch": 1363, "val_loss": 66586.4921875} {"train_loss": -5.911889553070068, "global_step": 57288, "epoch": 1364} {"train_loss": -5.80633544921875, "global_step": 57289, "epoch": 1364} {"train_loss": -5.895708084106445, "global_step": 57290, "epoch": 1364} {"train_loss": -5.876004219055176, "global_step": 57291, "epoch": 1364} {"train_loss": -5.9283976554870605, "global_step": 57292, "epoch": 1364} {"train_loss": -5.852638244628906, "global_step": 57293, "epoch": 1364} {"train_loss": -5.922497272491455, "global_step": 57294, "epoch": 1364} {"train_loss": -5.80472469329834, "global_step": 57295, "epoch": 1364} {"train_loss": -5.981403350830078, "global_step": 57296, "epoch": 1364} {"train_loss": -5.903464317321777, "global_step": 57297, "epoch": 1364} {"train_loss": -5.825052261352539, "global_step": 57298, "epoch": 1364} {"train_loss": -5.769878387451172, "global_step": 57299, "epoch": 1364} {"train_loss": -5.825404644012451, "global_step": 57300, "epoch": 1364} {"train_loss": -5.898879051208496, "global_step": 57301, "epoch": 1364} {"train_loss": -5.928502082824707, "global_step": 57302, "epoch": 1364} {"train_loss": -5.849308013916016, "global_step": 57303, "epoch": 1364} {"train_loss": -5.673853874206543, "global_step": 57304, "epoch": 1364} {"train_loss": -5.813398361206055, "global_step": 57305, "epoch": 1364} {"train_loss": -5.850716590881348, "global_step": 57306, "epoch": 1364} {"train_loss": -5.863813400268555, "global_step": 57307, "epoch": 1364} {"train_loss": -5.799459457397461, "global_step": 57308, "epoch": 1364} {"train_loss": -5.7104597091674805, "global_step": 57309, "epoch": 1364} {"train_loss": -5.764842987060547, "global_step": 57310, "epoch": 1364} {"train_loss": -5.902174949645996, "global_step": 57311, "epoch": 1364} {"train_loss": -5.850090980529785, "global_step": 57312, "epoch": 1364} {"train_loss": -5.847631454467773, "global_step": 57313, "epoch": 1364} {"train_loss": -5.80282735824585, "global_step": 57314, "epoch": 1364} {"train_loss": -5.813419818878174, "global_step": 57315, "epoch": 1364} {"train_loss": -5.880565643310547, "global_step": 57316, "epoch": 1364} {"train_loss": -5.8410539627075195, "global_step": 57317, "epoch": 1364} {"train_loss": -5.850407600402832, "global_step": 57318, "epoch": 1364} {"train_loss": -5.81389856338501, "global_step": 57319, "epoch": 1364} {"train_loss": -5.77708625793457, "global_step": 57320, "epoch": 1364} {"train_loss": -5.799619674682617, "global_step": 57321, "epoch": 1364} {"train_loss": -5.769165992736816, "global_step": 57322, "epoch": 1364} {"train_loss": -5.863215446472168, "global_step": 57323, "epoch": 1364} {"train_loss": -5.834176063537598, "global_step": 57324, "epoch": 1364} {"train_loss": -5.842052936553955, "global_step": 57325, "epoch": 1364} {"train_loss": -5.8698272705078125, "global_step": 57326, "epoch": 1364} {"train_loss": -5.799872398376465, "global_step": 57327, "epoch": 1364} {"train_loss": -5.769781112670898, "global_step": 57328, "epoch": 1364} {"train_loss": -5.841256902331398, "global_step": 57329, "epoch": 1364, "val_loss": 66622.5078125} {"train_loss": -5.772911548614502, "global_step": 57330, "epoch": 1365} {"train_loss": -5.913399696350098, "global_step": 57331, "epoch": 1365} {"train_loss": -5.808516502380371, "global_step": 57332, "epoch": 1365} {"train_loss": -5.7722649574279785, "global_step": 57333, "epoch": 1365} {"train_loss": -5.872241020202637, "global_step": 57334, "epoch": 1365} {"train_loss": -5.782072067260742, "global_step": 57335, "epoch": 1365} {"train_loss": -5.868405818939209, "global_step": 57336, "epoch": 1365} {"train_loss": -5.746302604675293, "global_step": 57337, "epoch": 1365} {"train_loss": -5.632700443267822, "global_step": 57338, "epoch": 1365} {"train_loss": -5.91984748840332, "global_step": 57339, "epoch": 1365} {"train_loss": -5.624667644500732, "global_step": 57340, "epoch": 1365} {"train_loss": -5.80036735534668, "global_step": 57341, "epoch": 1365} {"train_loss": -5.747516632080078, "global_step": 57342, "epoch": 1365} {"train_loss": -5.806921005249023, "global_step": 57343, "epoch": 1365} {"train_loss": -5.844851970672607, "global_step": 57344, "epoch": 1365} {"train_loss": -5.843362808227539, "global_step": 57345, "epoch": 1365} {"train_loss": -5.805584907531738, "global_step": 57346, "epoch": 1365} {"train_loss": -5.737453460693359, "global_step": 57347, "epoch": 1365} {"train_loss": -5.844511985778809, "global_step": 57348, "epoch": 1365} {"train_loss": -5.811088562011719, "global_step": 57349, "epoch": 1365} {"train_loss": -5.804327487945557, "global_step": 57350, "epoch": 1365} {"train_loss": -5.827057838439941, "global_step": 57351, "epoch": 1365} {"train_loss": -5.779820919036865, "global_step": 57352, "epoch": 1365} {"train_loss": -5.754716873168945, "global_step": 57353, "epoch": 1365} {"train_loss": -5.856600761413574, "global_step": 57354, "epoch": 1365} {"train_loss": -5.929563045501709, "global_step": 57355, "epoch": 1365} {"train_loss": -5.783982276916504, "global_step": 57356, "epoch": 1365} {"train_loss": -5.794614315032959, "global_step": 57357, "epoch": 1365} {"train_loss": -5.7483086585998535, "global_step": 57358, "epoch": 1365} {"train_loss": -5.909446716308594, "global_step": 57359, "epoch": 1365} {"train_loss": -5.765978813171387, "global_step": 57360, "epoch": 1365} {"train_loss": -5.785700798034668, "global_step": 57361, "epoch": 1365} {"train_loss": -5.907948970794678, "global_step": 57362, "epoch": 1365} {"train_loss": -5.743481636047363, "global_step": 57363, "epoch": 1365} {"train_loss": -5.956782817840576, "global_step": 57364, "epoch": 1365} {"train_loss": -5.939047813415527, "global_step": 57365, "epoch": 1365} {"train_loss": -5.784204483032227, "global_step": 57366, "epoch": 1365} {"train_loss": -5.850404739379883, "global_step": 57367, "epoch": 1365} {"train_loss": -5.756476402282715, "global_step": 57368, "epoch": 1365} {"train_loss": -5.843153953552246, "global_step": 57369, "epoch": 1365} {"train_loss": -5.85886287689209, "global_step": 57370, "epoch": 1365} {"train_loss": -5.815195685341244, "global_step": 57371, "epoch": 1365, "val_loss": 66597.9296875} {"train_loss": -5.837324619293213, "global_step": 57372, "epoch": 1366} {"train_loss": -5.684365749359131, "global_step": 57373, "epoch": 1366} {"train_loss": -5.764324188232422, "global_step": 57374, "epoch": 1366} {"train_loss": -5.876426696777344, "global_step": 57375, "epoch": 1366} {"train_loss": -5.755117416381836, "global_step": 57376, "epoch": 1366} {"train_loss": -5.837892055511475, "global_step": 57377, "epoch": 1366} {"train_loss": -5.898617744445801, "global_step": 57378, "epoch": 1366} {"train_loss": -5.885417938232422, "global_step": 57379, "epoch": 1366} {"train_loss": -5.771615028381348, "global_step": 57380, "epoch": 1366} {"train_loss": -5.7023820877075195, "global_step": 57381, "epoch": 1366} {"train_loss": -5.784017086029053, "global_step": 57382, "epoch": 1366} {"train_loss": -5.877605438232422, "global_step": 57383, "epoch": 1366} {"train_loss": -5.6839423179626465, "global_step": 57384, "epoch": 1366} {"train_loss": -5.804075717926025, "global_step": 57385, "epoch": 1366} {"train_loss": -5.899731636047363, "global_step": 57386, "epoch": 1366} {"train_loss": -5.777349472045898, "global_step": 57387, "epoch": 1366} {"train_loss": -5.950370788574219, "global_step": 57388, "epoch": 1366} {"train_loss": -5.738315582275391, "global_step": 57389, "epoch": 1366} {"train_loss": -5.907290458679199, "global_step": 57390, "epoch": 1366} {"train_loss": -5.834081649780273, "global_step": 57391, "epoch": 1366} {"train_loss": -5.738826751708984, "global_step": 57392, "epoch": 1366} {"train_loss": -5.823591709136963, "global_step": 57393, "epoch": 1366} {"train_loss": -5.745896339416504, "global_step": 57394, "epoch": 1366} {"train_loss": -5.851558685302734, "global_step": 57395, "epoch": 1366} {"train_loss": -5.835809707641602, "global_step": 57396, "epoch": 1366} {"train_loss": -5.8128275871276855, "global_step": 57397, "epoch": 1366} {"train_loss": -5.951037406921387, "global_step": 57398, "epoch": 1366} {"train_loss": -5.843195915222168, "global_step": 57399, "epoch": 1366} {"train_loss": -5.890783786773682, "global_step": 57400, "epoch": 1366} {"train_loss": -5.637361526489258, "global_step": 57401, "epoch": 1366} {"train_loss": -5.929376602172852, "global_step": 57402, "epoch": 1366} {"train_loss": -5.789513111114502, "global_step": 57403, "epoch": 1366} {"train_loss": -5.916667461395264, "global_step": 57404, "epoch": 1366} {"train_loss": -5.949652671813965, "global_step": 57405, "epoch": 1366} {"train_loss": -5.808567047119141, "global_step": 57406, "epoch": 1366} {"train_loss": -5.714633941650391, "global_step": 57407, "epoch": 1366} {"train_loss": -5.8961944580078125, "global_step": 57408, "epoch": 1366} {"train_loss": -5.776124000549316, "global_step": 57409, "epoch": 1366} {"train_loss": -5.857240676879883, "global_step": 57410, "epoch": 1366} {"train_loss": -5.811264991760254, "global_step": 57411, "epoch": 1366} {"train_loss": -5.791048049926758, "global_step": 57412, "epoch": 1366} {"train_loss": -5.820995274044218, "global_step": 57413, "epoch": 1366, "val_loss": 66442.8984375} {"train_loss": -5.807800769805908, "global_step": 57414, "epoch": 1367} {"train_loss": -5.821418285369873, "global_step": 57415, "epoch": 1367} {"train_loss": -5.822231769561768, "global_step": 57416, "epoch": 1367} {"train_loss": -5.883727073669434, "global_step": 57417, "epoch": 1367} {"train_loss": -5.7228779792785645, "global_step": 57418, "epoch": 1367} {"train_loss": -5.878932952880859, "global_step": 57419, "epoch": 1367} {"train_loss": -5.846077919006348, "global_step": 57420, "epoch": 1367} {"train_loss": -5.790620803833008, "global_step": 57421, "epoch": 1367} {"train_loss": -5.781710624694824, "global_step": 57422, "epoch": 1367} {"train_loss": -5.886774063110352, "global_step": 57423, "epoch": 1367} {"train_loss": -6.000521659851074, "global_step": 57424, "epoch": 1367} {"train_loss": -5.891752243041992, "global_step": 57425, "epoch": 1367} {"train_loss": -5.889486312866211, "global_step": 57426, "epoch": 1367} {"train_loss": -5.90880012512207, "global_step": 57427, "epoch": 1367} {"train_loss": -5.835241317749023, "global_step": 57428, "epoch": 1367} {"train_loss": -5.888360977172852, "global_step": 57429, "epoch": 1367} {"train_loss": -5.943062782287598, "global_step": 57430, "epoch": 1367} {"train_loss": -5.7681498527526855, "global_step": 57431, "epoch": 1367} {"train_loss": -5.9686455726623535, "global_step": 57432, "epoch": 1367} {"train_loss": -5.798038482666016, "global_step": 57433, "epoch": 1367} {"train_loss": -5.885749816894531, "global_step": 57434, "epoch": 1367} {"train_loss": -5.986823558807373, "global_step": 57435, "epoch": 1367} {"train_loss": -5.8131890296936035, "global_step": 57436, "epoch": 1367} {"train_loss": -5.98677921295166, "global_step": 57437, "epoch": 1367} {"train_loss": -5.825541973114014, "global_step": 57438, "epoch": 1367} {"train_loss": -5.742249488830566, "global_step": 57439, "epoch": 1367} {"train_loss": -5.7376909255981445, "global_step": 57440, "epoch": 1367} {"train_loss": -5.73647403717041, "global_step": 57441, "epoch": 1367} {"train_loss": -5.841100692749023, "global_step": 57442, "epoch": 1367} {"train_loss": -5.8531293869018555, "global_step": 57443, "epoch": 1367} {"train_loss": -5.750697135925293, "global_step": 57444, "epoch": 1367} {"train_loss": -5.734566688537598, "global_step": 57445, "epoch": 1367} {"train_loss": -5.674375534057617, "global_step": 57446, "epoch": 1367} {"train_loss": -5.916878700256348, "global_step": 57447, "epoch": 1367} {"train_loss": -5.742248058319092, "global_step": 57448, "epoch": 1367} {"train_loss": -5.80833625793457, "global_step": 57449, "epoch": 1367} {"train_loss": -5.700959205627441, "global_step": 57450, "epoch": 1367} {"train_loss": -5.737421989440918, "global_step": 57451, "epoch": 1367} {"train_loss": -5.755779266357422, "global_step": 57452, "epoch": 1367} {"train_loss": -5.8136186599731445, "global_step": 57453, "epoch": 1367} {"train_loss": -5.713162422180176, "global_step": 57454, "epoch": 1367} {"train_loss": -5.825079951967512, "global_step": 57455, "epoch": 1367, "val_loss": 66913.1796875} {"train_loss": -5.727278232574463, "global_step": 57456, "epoch": 1368} {"train_loss": -5.852795600891113, "global_step": 57457, "epoch": 1368} {"train_loss": -5.793919563293457, "global_step": 57458, "epoch": 1368} {"train_loss": -5.737119674682617, "global_step": 57459, "epoch": 1368} {"train_loss": -5.883739471435547, "global_step": 57460, "epoch": 1368} {"train_loss": -5.85041618347168, "global_step": 57461, "epoch": 1368} {"train_loss": -5.750670909881592, "global_step": 57462, "epoch": 1368} {"train_loss": -5.6262054443359375, "global_step": 57463, "epoch": 1368} {"train_loss": -5.799935340881348, "global_step": 57464, "epoch": 1368} {"train_loss": -5.851088523864746, "global_step": 57465, "epoch": 1368} {"train_loss": -5.7612104415893555, "global_step": 57466, "epoch": 1368} {"train_loss": -5.734574794769287, "global_step": 57467, "epoch": 1368} {"train_loss": -5.931342601776123, "global_step": 57468, "epoch": 1368} {"train_loss": -5.859234809875488, "global_step": 57469, "epoch": 1368} {"train_loss": -5.713594436645508, "global_step": 57470, "epoch": 1368} {"train_loss": -5.852268218994141, "global_step": 57471, "epoch": 1368} {"train_loss": -5.800431251525879, "global_step": 57472, "epoch": 1368} {"train_loss": -5.762876510620117, "global_step": 57473, "epoch": 1368} {"train_loss": -5.7923102378845215, "global_step": 57474, "epoch": 1368} {"train_loss": -5.918627738952637, "global_step": 57475, "epoch": 1368} {"train_loss": -5.786808490753174, "global_step": 57476, "epoch": 1368} {"train_loss": -5.8926191329956055, "global_step": 57477, "epoch": 1368} {"train_loss": -5.8108930587768555, "global_step": 57478, "epoch": 1368} {"train_loss": -5.837882995605469, "global_step": 57479, "epoch": 1368} {"train_loss": -5.843612194061279, "global_step": 57480, "epoch": 1368} {"train_loss": -5.797237396240234, "global_step": 57481, "epoch": 1368} {"train_loss": -5.868328094482422, "global_step": 57482, "epoch": 1368} {"train_loss": -5.718116760253906, "global_step": 57483, "epoch": 1368} {"train_loss": -5.926436424255371, "global_step": 57484, "epoch": 1368} {"train_loss": -5.904936790466309, "global_step": 57485, "epoch": 1368} {"train_loss": -5.695706367492676, "global_step": 57486, "epoch": 1368} {"train_loss": -5.782721519470215, "global_step": 57487, "epoch": 1368} {"train_loss": -5.775554180145264, "global_step": 57488, "epoch": 1368} {"train_loss": -5.83896541595459, "global_step": 57489, "epoch": 1368} {"train_loss": -5.836082458496094, "global_step": 57490, "epoch": 1368} {"train_loss": -5.855871200561523, "global_step": 57491, "epoch": 1368} {"train_loss": -5.878741264343262, "global_step": 57492, "epoch": 1368} {"train_loss": -5.817652225494385, "global_step": 57493, "epoch": 1368} {"train_loss": -5.733168125152588, "global_step": 57494, "epoch": 1368} {"train_loss": -5.934741020202637, "global_step": 57495, "epoch": 1368} {"train_loss": -5.78692626953125, "global_step": 57496, "epoch": 1368} {"train_loss": -5.8163187730880015, "global_step": 57497, "epoch": 1368, "val_loss": 66781.171875} {"train_loss": -5.887165069580078, "global_step": 57498, "epoch": 1369} {"train_loss": -5.720744609832764, "global_step": 57499, "epoch": 1369} {"train_loss": -5.842902660369873, "global_step": 57500, "epoch": 1369} {"train_loss": -5.874294757843018, "global_step": 57501, "epoch": 1369} {"train_loss": -5.769396781921387, "global_step": 57502, "epoch": 1369} {"train_loss": -5.839587211608887, "global_step": 57503, "epoch": 1369} {"train_loss": -5.834755897521973, "global_step": 57504, "epoch": 1369} {"train_loss": -5.8324737548828125, "global_step": 57505, "epoch": 1369} {"train_loss": -5.8152666091918945, "global_step": 57506, "epoch": 1369} {"train_loss": -5.826967716217041, "global_step": 57507, "epoch": 1369} {"train_loss": -5.845366477966309, "global_step": 57508, "epoch": 1369} {"train_loss": -5.859540939331055, "global_step": 57509, "epoch": 1369} {"train_loss": -5.862706184387207, "global_step": 57510, "epoch": 1369} {"train_loss": -5.942374229431152, "global_step": 57511, "epoch": 1369} {"train_loss": -5.764482498168945, "global_step": 57512, "epoch": 1369} {"train_loss": -5.848493576049805, "global_step": 57513, "epoch": 1369} {"train_loss": -5.788073539733887, "global_step": 57514, "epoch": 1369} {"train_loss": -5.792400360107422, "global_step": 57515, "epoch": 1369} {"train_loss": -5.806058406829834, "global_step": 57516, "epoch": 1369} {"train_loss": -5.76844596862793, "global_step": 57517, "epoch": 1369} {"train_loss": -5.92381477355957, "global_step": 57518, "epoch": 1369} {"train_loss": -5.914898872375488, "global_step": 57519, "epoch": 1369} {"train_loss": -5.8053717613220215, "global_step": 57520, "epoch": 1369} {"train_loss": -5.827060699462891, "global_step": 57521, "epoch": 1369} {"train_loss": -5.819974899291992, "global_step": 57522, "epoch": 1369} {"train_loss": -5.891870975494385, "global_step": 57523, "epoch": 1369} {"train_loss": -5.871599197387695, "global_step": 57524, "epoch": 1369} {"train_loss": -5.938156604766846, "global_step": 57525, "epoch": 1369} {"train_loss": -5.864901542663574, "global_step": 57526, "epoch": 1369} {"train_loss": -5.885917663574219, "global_step": 57527, "epoch": 1369} {"train_loss": -5.763063430786133, "global_step": 57528, "epoch": 1369} {"train_loss": -5.812448501586914, "global_step": 57529, "epoch": 1369} {"train_loss": -5.888415813446045, "global_step": 57530, "epoch": 1369} {"train_loss": -5.805558204650879, "global_step": 57531, "epoch": 1369} {"train_loss": -5.907849311828613, "global_step": 57532, "epoch": 1369} {"train_loss": -5.991103172302246, "global_step": 57533, "epoch": 1369} {"train_loss": -5.797333240509033, "global_step": 57534, "epoch": 1369} {"train_loss": -5.7606353759765625, "global_step": 57535, "epoch": 1369} {"train_loss": -5.993839263916016, "global_step": 57536, "epoch": 1369} {"train_loss": -5.8843889236450195, "global_step": 57537, "epoch": 1369} {"train_loss": -5.942026138305664, "global_step": 57538, "epoch": 1369} {"train_loss": -5.84989146959214, "global_step": 57539, "epoch": 1369, "val_loss": 66571.1796875} {"train_loss": -5.767746448516846, "global_step": 57540, "epoch": 1370} {"train_loss": -5.76346492767334, "global_step": 57541, "epoch": 1370} {"train_loss": -5.856046199798584, "global_step": 57542, "epoch": 1370} {"train_loss": -5.93420934677124, "global_step": 57543, "epoch": 1370} {"train_loss": -5.927711486816406, "global_step": 57544, "epoch": 1370} {"train_loss": -5.893965721130371, "global_step": 57545, "epoch": 1370} {"train_loss": -5.83585786819458, "global_step": 57546, "epoch": 1370} {"train_loss": -5.83768892288208, "global_step": 57547, "epoch": 1370} {"train_loss": -5.790928363800049, "global_step": 57548, "epoch": 1370} {"train_loss": -6.026057243347168, "global_step": 57549, "epoch": 1370} {"train_loss": -5.853187561035156, "global_step": 57550, "epoch": 1370} {"train_loss": -5.894309043884277, "global_step": 57551, "epoch": 1370} {"train_loss": -5.795170783996582, "global_step": 57552, "epoch": 1370} {"train_loss": -5.8988494873046875, "global_step": 57553, "epoch": 1370} {"train_loss": -5.778162002563477, "global_step": 57554, "epoch": 1370} {"train_loss": -5.855915069580078, "global_step": 57555, "epoch": 1370} {"train_loss": -5.808281898498535, "global_step": 57556, "epoch": 1370} {"train_loss": -5.797591209411621, "global_step": 57557, "epoch": 1370} {"train_loss": -5.886318683624268, "global_step": 57558, "epoch": 1370} {"train_loss": -5.768187999725342, "global_step": 57559, "epoch": 1370} {"train_loss": -5.951961517333984, "global_step": 57560, "epoch": 1370} {"train_loss": -5.851824760437012, "global_step": 57561, "epoch": 1370} {"train_loss": -5.844744682312012, "global_step": 57562, "epoch": 1370} {"train_loss": -5.958768844604492, "global_step": 57563, "epoch": 1370} {"train_loss": -5.925778388977051, "global_step": 57564, "epoch": 1370} {"train_loss": -5.845677375793457, "global_step": 57565, "epoch": 1370} {"train_loss": -5.924739837646484, "global_step": 57566, "epoch": 1370} {"train_loss": -5.855304718017578, "global_step": 57567, "epoch": 1370} {"train_loss": -5.953032970428467, "global_step": 57568, "epoch": 1370} {"train_loss": -5.782763957977295, "global_step": 57569, "epoch": 1370} {"train_loss": -5.917793273925781, "global_step": 57570, "epoch": 1370} {"train_loss": -5.9541473388671875, "global_step": 57571, "epoch": 1370} {"train_loss": -5.795511722564697, "global_step": 57572, "epoch": 1370} {"train_loss": -5.794647216796875, "global_step": 57573, "epoch": 1370} {"train_loss": -5.742503643035889, "global_step": 57574, "epoch": 1370} {"train_loss": -6.03044319152832, "global_step": 57575, "epoch": 1370} {"train_loss": -5.82340669631958, "global_step": 57576, "epoch": 1370} {"train_loss": -5.864964485168457, "global_step": 57577, "epoch": 1370} {"train_loss": -5.865631103515625, "global_step": 57578, "epoch": 1370} {"train_loss": -5.8927693367004395, "global_step": 57579, "epoch": 1370} {"train_loss": -5.736965179443359, "global_step": 57580, "epoch": 1370} {"train_loss": -5.861052683421543, "global_step": 57581, "epoch": 1370, "val_loss": 66516.5625} {"train_loss": -5.8671722412109375, "global_step": 57582, "epoch": 1371} {"train_loss": -5.941476821899414, "global_step": 57583, "epoch": 1371} {"train_loss": -5.812902450561523, "global_step": 57584, "epoch": 1371} {"train_loss": -5.708470344543457, "global_step": 57585, "epoch": 1371} {"train_loss": -5.943386077880859, "global_step": 57586, "epoch": 1371} {"train_loss": -5.881799697875977, "global_step": 57587, "epoch": 1371} {"train_loss": -5.966351509094238, "global_step": 57588, "epoch": 1371} {"train_loss": -5.824058532714844, "global_step": 57589, "epoch": 1371} {"train_loss": -5.845404148101807, "global_step": 57590, "epoch": 1371} {"train_loss": -5.837492942810059, "global_step": 57591, "epoch": 1371} {"train_loss": -5.932614326477051, "global_step": 57592, "epoch": 1371} {"train_loss": -5.945677757263184, "global_step": 57593, "epoch": 1371} {"train_loss": -5.941648960113525, "global_step": 57594, "epoch": 1371} {"train_loss": -5.839557647705078, "global_step": 57595, "epoch": 1371} {"train_loss": -5.837323188781738, "global_step": 57596, "epoch": 1371} {"train_loss": -5.786516189575195, "global_step": 57597, "epoch": 1371} {"train_loss": -5.874798774719238, "global_step": 57598, "epoch": 1371} {"train_loss": -5.85570764541626, "global_step": 57599, "epoch": 1371} {"train_loss": -5.89228630065918, "global_step": 57600, "epoch": 1371} {"train_loss": -5.777923583984375, "global_step": 57601, "epoch": 1371} {"train_loss": -5.779817581176758, "global_step": 57602, "epoch": 1371} {"train_loss": -5.754970550537109, "global_step": 57603, "epoch": 1371} {"train_loss": -5.79599666595459, "global_step": 57604, "epoch": 1371} {"train_loss": -5.715329170227051, "global_step": 57605, "epoch": 1371} {"train_loss": -5.837379455566406, "global_step": 57606, "epoch": 1371} {"train_loss": -5.877531051635742, "global_step": 57607, "epoch": 1371} {"train_loss": -5.766927719116211, "global_step": 57608, "epoch": 1371} {"train_loss": -5.999190807342529, "global_step": 57609, "epoch": 1371} {"train_loss": -5.946005344390869, "global_step": 57610, "epoch": 1371} {"train_loss": -5.928346157073975, "global_step": 57611, "epoch": 1371} {"train_loss": -5.989585876464844, "global_step": 57612, "epoch": 1371} {"train_loss": -5.826624870300293, "global_step": 57613, "epoch": 1371} {"train_loss": -5.881394386291504, "global_step": 57614, "epoch": 1371} {"train_loss": -5.8940205574035645, "global_step": 57615, "epoch": 1371} {"train_loss": -5.825119972229004, "global_step": 57616, "epoch": 1371} {"train_loss": -5.814441204071045, "global_step": 57617, "epoch": 1371} {"train_loss": -5.908110618591309, "global_step": 57618, "epoch": 1371} {"train_loss": -5.817379951477051, "global_step": 57619, "epoch": 1371} {"train_loss": -5.7703752517700195, "global_step": 57620, "epoch": 1371} {"train_loss": -5.845297813415527, "global_step": 57621, "epoch": 1371} {"train_loss": -5.778519153594971, "global_step": 57622, "epoch": 1371} {"train_loss": -5.854165928704398, "global_step": 57623, "epoch": 1371, "val_loss": 66689.53125} {"train_loss": -5.803400039672852, "global_step": 57624, "epoch": 1372} {"train_loss": -5.903304576873779, "global_step": 57625, "epoch": 1372} {"train_loss": -5.922661304473877, "global_step": 57626, "epoch": 1372} {"train_loss": -5.860826015472412, "global_step": 57627, "epoch": 1372} {"train_loss": -5.824861526489258, "global_step": 57628, "epoch": 1372} {"train_loss": -5.902907371520996, "global_step": 57629, "epoch": 1372} {"train_loss": -5.737845420837402, "global_step": 57630, "epoch": 1372} {"train_loss": -5.876821517944336, "global_step": 57631, "epoch": 1372} {"train_loss": -5.819974899291992, "global_step": 57632, "epoch": 1372} {"train_loss": -5.9480791091918945, "global_step": 57633, "epoch": 1372} {"train_loss": -5.8943610191345215, "global_step": 57634, "epoch": 1372} {"train_loss": -5.797074317932129, "global_step": 57635, "epoch": 1372} {"train_loss": -5.87454891204834, "global_step": 57636, "epoch": 1372} {"train_loss": -5.804744243621826, "global_step": 57637, "epoch": 1372} {"train_loss": -5.826720714569092, "global_step": 57638, "epoch": 1372} {"train_loss": -5.81845760345459, "global_step": 57639, "epoch": 1372} {"train_loss": -5.873027801513672, "global_step": 57640, "epoch": 1372} {"train_loss": -5.773536682128906, "global_step": 57641, "epoch": 1372} {"train_loss": -5.9944562911987305, "global_step": 57642, "epoch": 1372} {"train_loss": -5.740253448486328, "global_step": 57643, "epoch": 1372} {"train_loss": -5.785840034484863, "global_step": 57644, "epoch": 1372} {"train_loss": -5.777897834777832, "global_step": 57645, "epoch": 1372} {"train_loss": -5.750922203063965, "global_step": 57646, "epoch": 1372} {"train_loss": -5.794467926025391, "global_step": 57647, "epoch": 1372} {"train_loss": -5.644861698150635, "global_step": 57648, "epoch": 1372} {"train_loss": -5.915935516357422, "global_step": 57649, "epoch": 1372} {"train_loss": -5.910487651824951, "global_step": 57650, "epoch": 1372} {"train_loss": -5.832307815551758, "global_step": 57651, "epoch": 1372} {"train_loss": -5.895053863525391, "global_step": 57652, "epoch": 1372} {"train_loss": -5.744467258453369, "global_step": 57653, "epoch": 1372} {"train_loss": -5.878215312957764, "global_step": 57654, "epoch": 1372} {"train_loss": -5.7889604568481445, "global_step": 57655, "epoch": 1372} {"train_loss": -5.6800642013549805, "global_step": 57656, "epoch": 1372} {"train_loss": -5.841460227966309, "global_step": 57657, "epoch": 1372} {"train_loss": -5.686140060424805, "global_step": 57658, "epoch": 1372} {"train_loss": -5.6984028816223145, "global_step": 57659, "epoch": 1372} {"train_loss": -5.719864845275879, "global_step": 57660, "epoch": 1372} {"train_loss": -5.87146520614624, "global_step": 57661, "epoch": 1372} {"train_loss": -5.7748122215271, "global_step": 57662, "epoch": 1372} {"train_loss": -5.72335147857666, "global_step": 57663, "epoch": 1372} {"train_loss": -5.7964887619018555, "global_step": 57664, "epoch": 1372} {"train_loss": -5.822281678517659, "global_step": 57665, "epoch": 1372, "val_loss": 66704.578125} {"train_loss": -5.904901027679443, "global_step": 57666, "epoch": 1373} {"train_loss": -5.852901458740234, "global_step": 57667, "epoch": 1373} {"train_loss": -5.853630065917969, "global_step": 57668, "epoch": 1373} {"train_loss": -5.966827392578125, "global_step": 57669, "epoch": 1373} {"train_loss": -5.856369495391846, "global_step": 57670, "epoch": 1373} {"train_loss": -5.825962066650391, "global_step": 57671, "epoch": 1373} {"train_loss": -5.834040641784668, "global_step": 57672, "epoch": 1373} {"train_loss": -5.781373977661133, "global_step": 57673, "epoch": 1373} {"train_loss": -5.75897216796875, "global_step": 57674, "epoch": 1373} {"train_loss": -5.905144691467285, "global_step": 57675, "epoch": 1373} {"train_loss": -5.889907360076904, "global_step": 57676, "epoch": 1373} {"train_loss": -5.905887126922607, "global_step": 57677, "epoch": 1373} {"train_loss": -5.854557037353516, "global_step": 57678, "epoch": 1373} {"train_loss": -5.803223609924316, "global_step": 57679, "epoch": 1373} {"train_loss": -5.942399978637695, "global_step": 57680, "epoch": 1373} {"train_loss": -5.871199607849121, "global_step": 57681, "epoch": 1373} {"train_loss": -5.896512985229492, "global_step": 57682, "epoch": 1373} {"train_loss": -5.907171726226807, "global_step": 57683, "epoch": 1373} {"train_loss": -5.868212699890137, "global_step": 57684, "epoch": 1373} {"train_loss": -5.875267028808594, "global_step": 57685, "epoch": 1373} {"train_loss": -5.9137420654296875, "global_step": 57686, "epoch": 1373} {"train_loss": -5.7605180740356445, "global_step": 57687, "epoch": 1373} {"train_loss": -5.755906105041504, "global_step": 57688, "epoch": 1373} {"train_loss": -5.78283166885376, "global_step": 57689, "epoch": 1373} {"train_loss": -5.910401821136475, "global_step": 57690, "epoch": 1373} {"train_loss": -5.847991943359375, "global_step": 57691, "epoch": 1373} {"train_loss": -5.831830024719238, "global_step": 57692, "epoch": 1373} {"train_loss": -5.914924621582031, "global_step": 57693, "epoch": 1373} {"train_loss": -5.875319480895996, "global_step": 57694, "epoch": 1373} {"train_loss": -5.842975616455078, "global_step": 57695, "epoch": 1373} {"train_loss": -5.850423812866211, "global_step": 57696, "epoch": 1373} {"train_loss": -5.782347679138184, "global_step": 57697, "epoch": 1373} {"train_loss": -5.846558570861816, "global_step": 57698, "epoch": 1373} {"train_loss": -5.759695053100586, "global_step": 57699, "epoch": 1373} {"train_loss": -5.768886566162109, "global_step": 57700, "epoch": 1373} {"train_loss": -5.849149703979492, "global_step": 57701, "epoch": 1373} {"train_loss": -5.871445655822754, "global_step": 57702, "epoch": 1373} {"train_loss": -5.896855354309082, "global_step": 57703, "epoch": 1373} {"train_loss": -5.86568546295166, "global_step": 57704, "epoch": 1373} {"train_loss": -5.743447780609131, "global_step": 57705, "epoch": 1373} {"train_loss": -5.962654113769531, "global_step": 57706, "epoch": 1373} {"train_loss": -5.852490584055583, "global_step": 57707, "epoch": 1373, "val_loss": 66431.8515625} {"train_loss": -5.729823589324951, "global_step": 57708, "epoch": 1374} {"train_loss": -5.730052947998047, "global_step": 57709, "epoch": 1374} {"train_loss": -5.825008869171143, "global_step": 57710, "epoch": 1374} {"train_loss": -5.808565616607666, "global_step": 57711, "epoch": 1374} {"train_loss": -5.769870281219482, "global_step": 57712, "epoch": 1374} {"train_loss": -5.83381462097168, "global_step": 57713, "epoch": 1374} {"train_loss": -5.788809776306152, "global_step": 57714, "epoch": 1374} {"train_loss": -5.794455528259277, "global_step": 57715, "epoch": 1374} {"train_loss": -5.867214202880859, "global_step": 57716, "epoch": 1374} {"train_loss": -5.828202724456787, "global_step": 57717, "epoch": 1374} {"train_loss": -5.875079154968262, "global_step": 57718, "epoch": 1374} {"train_loss": -5.7903666496276855, "global_step": 57719, "epoch": 1374} {"train_loss": -5.8441853523254395, "global_step": 57720, "epoch": 1374} {"train_loss": -5.911228179931641, "global_step": 57721, "epoch": 1374} {"train_loss": -5.857273101806641, "global_step": 57722, "epoch": 1374} {"train_loss": -5.831249237060547, "global_step": 57723, "epoch": 1374} {"train_loss": -5.893575191497803, "global_step": 57724, "epoch": 1374} {"train_loss": -5.874179840087891, "global_step": 57725, "epoch": 1374} {"train_loss": -5.826286792755127, "global_step": 57726, "epoch": 1374} {"train_loss": -5.832172393798828, "global_step": 57727, "epoch": 1374} {"train_loss": -5.898529529571533, "global_step": 57728, "epoch": 1374} {"train_loss": -5.884906768798828, "global_step": 57729, "epoch": 1374} {"train_loss": -5.792250156402588, "global_step": 57730, "epoch": 1374} {"train_loss": -5.810406684875488, "global_step": 57731, "epoch": 1374} {"train_loss": -5.970666885375977, "global_step": 57732, "epoch": 1374} {"train_loss": -5.73486852645874, "global_step": 57733, "epoch": 1374} {"train_loss": -5.724221229553223, "global_step": 57734, "epoch": 1374} {"train_loss": -5.764937400817871, "global_step": 57735, "epoch": 1374} {"train_loss": -5.767971038818359, "global_step": 57736, "epoch": 1374} {"train_loss": -5.888295650482178, "global_step": 57737, "epoch": 1374} {"train_loss": -5.981382369995117, "global_step": 57738, "epoch": 1374} {"train_loss": -5.927407741546631, "global_step": 57739, "epoch": 1374} {"train_loss": -5.776638984680176, "global_step": 57740, "epoch": 1374} {"train_loss": -5.939082145690918, "global_step": 57741, "epoch": 1374} {"train_loss": -5.814960956573486, "global_step": 57742, "epoch": 1374} {"train_loss": -5.924606800079346, "global_step": 57743, "epoch": 1374} {"train_loss": -5.762537002563477, "global_step": 57744, "epoch": 1374} {"train_loss": -5.796184062957764, "global_step": 57745, "epoch": 1374} {"train_loss": -5.811447620391846, "global_step": 57746, "epoch": 1374} {"train_loss": -5.835687637329102, "global_step": 57747, "epoch": 1374} {"train_loss": -5.727605819702148, "global_step": 57748, "epoch": 1374} {"train_loss": -5.829251675378709, "global_step": 57749, "epoch": 1374, "val_loss": 66843.3515625} {"train_loss": -5.777477264404297, "global_step": 57750, "epoch": 1375} {"train_loss": -5.9254631996154785, "global_step": 57751, "epoch": 1375} {"train_loss": -5.750667572021484, "global_step": 57752, "epoch": 1375} {"train_loss": -5.764544486999512, "global_step": 57753, "epoch": 1375} {"train_loss": -5.791797637939453, "global_step": 57754, "epoch": 1375} {"train_loss": -5.854087829589844, "global_step": 57755, "epoch": 1375} {"train_loss": -5.8203125, "global_step": 57756, "epoch": 1375} {"train_loss": -5.781287670135498, "global_step": 57757, "epoch": 1375} {"train_loss": -5.867239952087402, "global_step": 57758, "epoch": 1375} {"train_loss": -5.9284772872924805, "global_step": 57759, "epoch": 1375} {"train_loss": -5.94783878326416, "global_step": 57760, "epoch": 1375} {"train_loss": -5.8628740310668945, "global_step": 57761, "epoch": 1375} {"train_loss": -5.903791904449463, "global_step": 57762, "epoch": 1375} {"train_loss": -5.850264549255371, "global_step": 57763, "epoch": 1375} {"train_loss": -5.825932025909424, "global_step": 57764, "epoch": 1375} {"train_loss": -5.919589042663574, "global_step": 57765, "epoch": 1375} {"train_loss": -5.908148288726807, "global_step": 57766, "epoch": 1375} {"train_loss": -5.899918556213379, "global_step": 57767, "epoch": 1375} {"train_loss": -5.8761773109436035, "global_step": 57768, "epoch": 1375} {"train_loss": -5.857701301574707, "global_step": 57769, "epoch": 1375} {"train_loss": -5.938680648803711, "global_step": 57770, "epoch": 1375} {"train_loss": -5.803037643432617, "global_step": 57771, "epoch": 1375} {"train_loss": -5.862939357757568, "global_step": 57772, "epoch": 1375} {"train_loss": -5.816290855407715, "global_step": 57773, "epoch": 1375} {"train_loss": -5.802778720855713, "global_step": 57774, "epoch": 1375} {"train_loss": -5.8689093589782715, "global_step": 57775, "epoch": 1375} {"train_loss": -5.716015338897705, "global_step": 57776, "epoch": 1375} {"train_loss": -5.999927520751953, "global_step": 57777, "epoch": 1375} {"train_loss": -5.736034870147705, "global_step": 57778, "epoch": 1375} {"train_loss": -5.640697479248047, "global_step": 57779, "epoch": 1375} {"train_loss": -5.784948348999023, "global_step": 57780, "epoch": 1375} {"train_loss": -5.84658145904541, "global_step": 57781, "epoch": 1375} {"train_loss": -5.826827526092529, "global_step": 57782, "epoch": 1375} {"train_loss": -5.879728317260742, "global_step": 57783, "epoch": 1375} {"train_loss": -5.684107780456543, "global_step": 57784, "epoch": 1375} {"train_loss": -5.829492568969727, "global_step": 57785, "epoch": 1375} {"train_loss": -5.764657974243164, "global_step": 57786, "epoch": 1375} {"train_loss": -5.982956886291504, "global_step": 57787, "epoch": 1375} {"train_loss": -5.776334762573242, "global_step": 57788, "epoch": 1375} {"train_loss": -5.876863956451416, "global_step": 57789, "epoch": 1375} {"train_loss": -5.895517349243164, "global_step": 57790, "epoch": 1375} {"train_loss": -5.841433036895025, "global_step": 57791, "epoch": 1375, "val_loss": 66672.6484375} {"train_loss": -5.9472551345825195, "global_step": 57792, "epoch": 1376} {"train_loss": -5.880582332611084, "global_step": 57793, "epoch": 1376} {"train_loss": -6.001392364501953, "global_step": 57794, "epoch": 1376} {"train_loss": -5.808078765869141, "global_step": 57795, "epoch": 1376} {"train_loss": -5.856952667236328, "global_step": 57796, "epoch": 1376} {"train_loss": -5.905482769012451, "global_step": 57797, "epoch": 1376} {"train_loss": -5.886264801025391, "global_step": 57798, "epoch": 1376} {"train_loss": -5.95705509185791, "global_step": 57799, "epoch": 1376} {"train_loss": -5.975407600402832, "global_step": 57800, "epoch": 1376} {"train_loss": -5.925528049468994, "global_step": 57801, "epoch": 1376} {"train_loss": -5.843077659606934, "global_step": 57802, "epoch": 1376} {"train_loss": -5.926105499267578, "global_step": 57803, "epoch": 1376} {"train_loss": -5.896105766296387, "global_step": 57804, "epoch": 1376} {"train_loss": -5.816810607910156, "global_step": 57805, "epoch": 1376} {"train_loss": -5.806483268737793, "global_step": 57806, "epoch": 1376} {"train_loss": -5.851614952087402, "global_step": 57807, "epoch": 1376} {"train_loss": -5.912127494812012, "global_step": 57808, "epoch": 1376} {"train_loss": -5.804708957672119, "global_step": 57809, "epoch": 1376} {"train_loss": -5.832128047943115, "global_step": 57810, "epoch": 1376} {"train_loss": -5.820708274841309, "global_step": 57811, "epoch": 1376} {"train_loss": -5.857593536376953, "global_step": 57812, "epoch": 1376} {"train_loss": -5.8221755027771, "global_step": 57813, "epoch": 1376} {"train_loss": -5.823940277099609, "global_step": 57814, "epoch": 1376} {"train_loss": -5.772212982177734, "global_step": 57815, "epoch": 1376} {"train_loss": -5.857684135437012, "global_step": 57816, "epoch": 1376} {"train_loss": -5.731874942779541, "global_step": 57817, "epoch": 1376} {"train_loss": -5.964468955993652, "global_step": 57818, "epoch": 1376} {"train_loss": -5.835448265075684, "global_step": 57819, "epoch": 1376} {"train_loss": -5.806973934173584, "global_step": 57820, "epoch": 1376} {"train_loss": -5.765152931213379, "global_step": 57821, "epoch": 1376} {"train_loss": -5.896186828613281, "global_step": 57822, "epoch": 1376} {"train_loss": -5.845541000366211, "global_step": 57823, "epoch": 1376} {"train_loss": -5.978402614593506, "global_step": 57824, "epoch": 1376} {"train_loss": -5.907252788543701, "global_step": 57825, "epoch": 1376} {"train_loss": -5.957156658172607, "global_step": 57826, "epoch": 1376} {"train_loss": -5.751006126403809, "global_step": 57827, "epoch": 1376} {"train_loss": -5.906290054321289, "global_step": 57828, "epoch": 1376} {"train_loss": -5.873106956481934, "global_step": 57829, "epoch": 1376} {"train_loss": -5.796538352966309, "global_step": 57830, "epoch": 1376} {"train_loss": -5.767101287841797, "global_step": 57831, "epoch": 1376} {"train_loss": -5.774775981903076, "global_step": 57832, "epoch": 1376} {"train_loss": -5.861986489523025, "global_step": 57833, "epoch": 1376, "val_loss": 66666.1640625} {"train_loss": -5.845002174377441, "global_step": 57834, "epoch": 1377} {"train_loss": -5.992414474487305, "global_step": 57835, "epoch": 1377} {"train_loss": -5.936802387237549, "global_step": 57836, "epoch": 1377} {"train_loss": -5.716917991638184, "global_step": 57837, "epoch": 1377} {"train_loss": -5.904968738555908, "global_step": 57838, "epoch": 1377} {"train_loss": -5.826972961425781, "global_step": 57839, "epoch": 1377} {"train_loss": -5.871085166931152, "global_step": 57840, "epoch": 1377} {"train_loss": -5.928654670715332, "global_step": 57841, "epoch": 1377} {"train_loss": -5.7788190841674805, "global_step": 57842, "epoch": 1377} {"train_loss": -5.945148468017578, "global_step": 57843, "epoch": 1377} {"train_loss": -5.9226789474487305, "global_step": 57844, "epoch": 1377} {"train_loss": -5.790092468261719, "global_step": 57845, "epoch": 1377} {"train_loss": -5.885827541351318, "global_step": 57846, "epoch": 1377} {"train_loss": -5.838068962097168, "global_step": 57847, "epoch": 1377} {"train_loss": -5.9672346115112305, "global_step": 57848, "epoch": 1377} {"train_loss": -5.858395576477051, "global_step": 57849, "epoch": 1377} {"train_loss": -5.911443710327148, "global_step": 57850, "epoch": 1377} {"train_loss": -5.835552215576172, "global_step": 57851, "epoch": 1377} {"train_loss": -5.752289772033691, "global_step": 57852, "epoch": 1377} {"train_loss": -5.818856716156006, "global_step": 57853, "epoch": 1377} {"train_loss": -5.8004608154296875, "global_step": 57854, "epoch": 1377} {"train_loss": -5.928671836853027, "global_step": 57855, "epoch": 1377} {"train_loss": -5.943325519561768, "global_step": 57856, "epoch": 1377} {"train_loss": -5.878731727600098, "global_step": 57857, "epoch": 1377} {"train_loss": -5.867545127868652, "global_step": 57858, "epoch": 1377} {"train_loss": -5.861699104309082, "global_step": 57859, "epoch": 1377} {"train_loss": -5.966966152191162, "global_step": 57860, "epoch": 1377} {"train_loss": -5.798731803894043, "global_step": 57861, "epoch": 1377} {"train_loss": -5.8910417556762695, "global_step": 57862, "epoch": 1377} {"train_loss": -5.882493019104004, "global_step": 57863, "epoch": 1377} {"train_loss": -5.8053483963012695, "global_step": 57864, "epoch": 1377} {"train_loss": -5.753997802734375, "global_step": 57865, "epoch": 1377} {"train_loss": -5.851410388946533, "global_step": 57866, "epoch": 1377} {"train_loss": -5.983038902282715, "global_step": 57867, "epoch": 1377} {"train_loss": -5.776679992675781, "global_step": 57868, "epoch": 1377} {"train_loss": -5.80080509185791, "global_step": 57869, "epoch": 1377} {"train_loss": -5.838833808898926, "global_step": 57870, "epoch": 1377} {"train_loss": -5.878150463104248, "global_step": 57871, "epoch": 1377} {"train_loss": -5.840245246887207, "global_step": 57872, "epoch": 1377} {"train_loss": -5.8538713455200195, "global_step": 57873, "epoch": 1377} {"train_loss": -5.907607555389404, "global_step": 57874, "epoch": 1377} {"train_loss": -5.864547945204235, "global_step": 57875, "epoch": 1377, "val_loss": 66536.3828125} {"train_loss": -5.889771938323975, "global_step": 57876, "epoch": 1378} {"train_loss": -5.873621940612793, "global_step": 57877, "epoch": 1378} {"train_loss": -5.8871660232543945, "global_step": 57878, "epoch": 1378} {"train_loss": -5.908308982849121, "global_step": 57879, "epoch": 1378} {"train_loss": -5.797666072845459, "global_step": 57880, "epoch": 1378} {"train_loss": -5.899145603179932, "global_step": 57881, "epoch": 1378} {"train_loss": -5.855584144592285, "global_step": 57882, "epoch": 1378} {"train_loss": -5.871822357177734, "global_step": 57883, "epoch": 1378} {"train_loss": -5.9412312507629395, "global_step": 57884, "epoch": 1378} {"train_loss": -5.819085121154785, "global_step": 57885, "epoch": 1378} {"train_loss": -5.940638542175293, "global_step": 57886, "epoch": 1378} {"train_loss": -5.877793312072754, "global_step": 57887, "epoch": 1378} {"train_loss": -5.820183753967285, "global_step": 57888, "epoch": 1378} {"train_loss": -5.899039268493652, "global_step": 57889, "epoch": 1378} {"train_loss": -5.8418121337890625, "global_step": 57890, "epoch": 1378} {"train_loss": -5.982781887054443, "global_step": 57891, "epoch": 1378} {"train_loss": -5.8079304695129395, "global_step": 57892, "epoch": 1378} {"train_loss": -6.000675678253174, "global_step": 57893, "epoch": 1378} {"train_loss": -5.968789100646973, "global_step": 57894, "epoch": 1378} {"train_loss": -5.860624313354492, "global_step": 57895, "epoch": 1378} {"train_loss": -5.854087829589844, "global_step": 57896, "epoch": 1378} {"train_loss": -5.9408159255981445, "global_step": 57897, "epoch": 1378} {"train_loss": -5.912962913513184, "global_step": 57898, "epoch": 1378} {"train_loss": -5.848337650299072, "global_step": 57899, "epoch": 1378} {"train_loss": -5.79188346862793, "global_step": 57900, "epoch": 1378} {"train_loss": -5.807694911956787, "global_step": 57901, "epoch": 1378} {"train_loss": -5.896125793457031, "global_step": 57902, "epoch": 1378} {"train_loss": -5.849011421203613, "global_step": 57903, "epoch": 1378} {"train_loss": -5.908146858215332, "global_step": 57904, "epoch": 1378} {"train_loss": -5.901376724243164, "global_step": 57905, "epoch": 1378} {"train_loss": -5.885743141174316, "global_step": 57906, "epoch": 1378} {"train_loss": -5.901177406311035, "global_step": 57907, "epoch": 1378} {"train_loss": -5.915921211242676, "global_step": 57908, "epoch": 1378} {"train_loss": -5.779845237731934, "global_step": 57909, "epoch": 1378} {"train_loss": -5.713115692138672, "global_step": 57910, "epoch": 1378} {"train_loss": -5.829192161560059, "global_step": 57911, "epoch": 1378} {"train_loss": -5.724118232727051, "global_step": 57912, "epoch": 1378} {"train_loss": -5.845249176025391, "global_step": 57913, "epoch": 1378} {"train_loss": -5.8053483963012695, "global_step": 57914, "epoch": 1378} {"train_loss": -5.821498870849609, "global_step": 57915, "epoch": 1378} {"train_loss": -5.864436149597168, "global_step": 57916, "epoch": 1378} {"train_loss": -5.865682215917678, "global_step": 57917, "epoch": 1378, "val_loss": 66633.640625} {"train_loss": -5.795218467712402, "global_step": 57918, "epoch": 1379} {"train_loss": -5.8728837966918945, "global_step": 57919, "epoch": 1379} {"train_loss": -5.905489921569824, "global_step": 57920, "epoch": 1379} {"train_loss": -5.738523006439209, "global_step": 57921, "epoch": 1379} {"train_loss": -5.772185325622559, "global_step": 57922, "epoch": 1379} {"train_loss": -5.931174278259277, "global_step": 57923, "epoch": 1379} {"train_loss": -5.780442714691162, "global_step": 57924, "epoch": 1379} {"train_loss": -5.835344314575195, "global_step": 57925, "epoch": 1379} {"train_loss": -5.823477268218994, "global_step": 57926, "epoch": 1379} {"train_loss": -5.725567817687988, "global_step": 57927, "epoch": 1379} {"train_loss": -5.797636032104492, "global_step": 57928, "epoch": 1379} {"train_loss": -5.927160263061523, "global_step": 57929, "epoch": 1379} {"train_loss": -5.769742965698242, "global_step": 57930, "epoch": 1379} {"train_loss": -5.835267066955566, "global_step": 57931, "epoch": 1379} {"train_loss": -5.925902366638184, "global_step": 57932, "epoch": 1379} {"train_loss": -5.796812057495117, "global_step": 57933, "epoch": 1379} {"train_loss": -5.825860023498535, "global_step": 57934, "epoch": 1379} {"train_loss": -5.83358097076416, "global_step": 57935, "epoch": 1379} {"train_loss": -5.938608169555664, "global_step": 57936, "epoch": 1379} {"train_loss": -5.6847944259643555, "global_step": 57937, "epoch": 1379} {"train_loss": -5.92363166809082, "global_step": 57938, "epoch": 1379} {"train_loss": -5.762112617492676, "global_step": 57939, "epoch": 1379} {"train_loss": -5.906597137451172, "global_step": 57940, "epoch": 1379} {"train_loss": -5.785633087158203, "global_step": 57941, "epoch": 1379} {"train_loss": -5.776362419128418, "global_step": 57942, "epoch": 1379} {"train_loss": -5.924532890319824, "global_step": 57943, "epoch": 1379} {"train_loss": -5.836638450622559, "global_step": 57944, "epoch": 1379} {"train_loss": -5.969003200531006, "global_step": 57945, "epoch": 1379} {"train_loss": -5.938530921936035, "global_step": 57946, "epoch": 1379} {"train_loss": -5.79132080078125, "global_step": 57947, "epoch": 1379} {"train_loss": -5.81585693359375, "global_step": 57948, "epoch": 1379} {"train_loss": -5.834200382232666, "global_step": 57949, "epoch": 1379} {"train_loss": -5.902318000793457, "global_step": 57950, "epoch": 1379} {"train_loss": -5.945976734161377, "global_step": 57951, "epoch": 1379} {"train_loss": -5.926394462585449, "global_step": 57952, "epoch": 1379} {"train_loss": -5.939822673797607, "global_step": 57953, "epoch": 1379} {"train_loss": -5.839022159576416, "global_step": 57954, "epoch": 1379} {"train_loss": -5.944097518920898, "global_step": 57955, "epoch": 1379} {"train_loss": -5.931097984313965, "global_step": 57956, "epoch": 1379} {"train_loss": -5.882326602935791, "global_step": 57957, "epoch": 1379} {"train_loss": -5.875801086425781, "global_step": 57958, "epoch": 1379} {"train_loss": -5.85290401322501, "global_step": 57959, "epoch": 1379, "val_loss": 66638.7265625} {"train_loss": -5.8923563957214355, "global_step": 57960, "epoch": 1380} {"train_loss": -5.888612270355225, "global_step": 57961, "epoch": 1380} {"train_loss": -5.851956367492676, "global_step": 57962, "epoch": 1380} {"train_loss": -5.813404560089111, "global_step": 57963, "epoch": 1380} {"train_loss": -5.7846574783325195, "global_step": 57964, "epoch": 1380} {"train_loss": -5.865839958190918, "global_step": 57965, "epoch": 1380} {"train_loss": -5.900474548339844, "global_step": 57966, "epoch": 1380} {"train_loss": -5.882960319519043, "global_step": 57967, "epoch": 1380} {"train_loss": -5.902811050415039, "global_step": 57968, "epoch": 1380} {"train_loss": -5.903323173522949, "global_step": 57969, "epoch": 1380} {"train_loss": -5.770930767059326, "global_step": 57970, "epoch": 1380} {"train_loss": -5.732583999633789, "global_step": 57971, "epoch": 1380} {"train_loss": -5.864974021911621, "global_step": 57972, "epoch": 1380} {"train_loss": -5.892926216125488, "global_step": 57973, "epoch": 1380} {"train_loss": -5.9233551025390625, "global_step": 57974, "epoch": 1380} {"train_loss": -5.817009449005127, "global_step": 57975, "epoch": 1380} {"train_loss": -5.690891742706299, "global_step": 57976, "epoch": 1380} {"train_loss": -5.780343055725098, "global_step": 57977, "epoch": 1380} {"train_loss": -5.8242878913879395, "global_step": 57978, "epoch": 1380} {"train_loss": -5.723438262939453, "global_step": 57979, "epoch": 1380} {"train_loss": -5.847678184509277, "global_step": 57980, "epoch": 1380} {"train_loss": -5.8400115966796875, "global_step": 57981, "epoch": 1380} {"train_loss": -5.96150016784668, "global_step": 57982, "epoch": 1380} {"train_loss": -5.849904537200928, "global_step": 57983, "epoch": 1380} {"train_loss": -5.982022762298584, "global_step": 57984, "epoch": 1380} {"train_loss": -5.8091888427734375, "global_step": 57985, "epoch": 1380} {"train_loss": -5.8017168045043945, "global_step": 57986, "epoch": 1380} {"train_loss": -5.904998779296875, "global_step": 57987, "epoch": 1380} {"train_loss": -5.821320533752441, "global_step": 57988, "epoch": 1380} {"train_loss": -5.779376983642578, "global_step": 57989, "epoch": 1380} {"train_loss": -5.79810094833374, "global_step": 57990, "epoch": 1380} {"train_loss": -5.905340194702148, "global_step": 57991, "epoch": 1380} {"train_loss": -5.869901657104492, "global_step": 57992, "epoch": 1380} {"train_loss": -5.859356880187988, "global_step": 57993, "epoch": 1380} {"train_loss": -5.9862542152404785, "global_step": 57994, "epoch": 1380} {"train_loss": -5.841119766235352, "global_step": 57995, "epoch": 1380} {"train_loss": -5.998448371887207, "global_step": 57996, "epoch": 1380} {"train_loss": -5.915854454040527, "global_step": 57997, "epoch": 1380} {"train_loss": -5.881445407867432, "global_step": 57998, "epoch": 1380} {"train_loss": -5.944607734680176, "global_step": 57999, "epoch": 1380} {"train_loss": -5.88587760925293, "global_step": 58000, "epoch": 1380} {"train_loss": -5.859252997807094, "global_step": 58001, "epoch": 1380, "val_loss": 66535.546875} {"train_loss": -5.718412399291992, "global_step": 58002, "epoch": 1381} {"train_loss": -5.863279819488525, "global_step": 58003, "epoch": 1381} {"train_loss": -5.933957099914551, "global_step": 58004, "epoch": 1381} {"train_loss": -5.826470375061035, "global_step": 58005, "epoch": 1381} {"train_loss": -5.95351505279541, "global_step": 58006, "epoch": 1381} {"train_loss": -5.954288482666016, "global_step": 58007, "epoch": 1381} {"train_loss": -5.902294158935547, "global_step": 58008, "epoch": 1381} {"train_loss": -5.839582443237305, "global_step": 58009, "epoch": 1381} {"train_loss": -5.924875736236572, "global_step": 58010, "epoch": 1381} {"train_loss": -5.866994380950928, "global_step": 58011, "epoch": 1381} {"train_loss": -5.805294990539551, "global_step": 58012, "epoch": 1381} {"train_loss": -5.843056678771973, "global_step": 58013, "epoch": 1381} {"train_loss": -5.872471332550049, "global_step": 58014, "epoch": 1381} {"train_loss": -6.021848678588867, "global_step": 58015, "epoch": 1381} {"train_loss": -5.819635391235352, "global_step": 58016, "epoch": 1381} {"train_loss": -5.896836280822754, "global_step": 58017, "epoch": 1381} {"train_loss": -5.8124237060546875, "global_step": 58018, "epoch": 1381} {"train_loss": -5.869933128356934, "global_step": 58019, "epoch": 1381} {"train_loss": -5.804935455322266, "global_step": 58020, "epoch": 1381} {"train_loss": -5.878302097320557, "global_step": 58021, "epoch": 1381} {"train_loss": -5.6970624923706055, "global_step": 58022, "epoch": 1381} {"train_loss": -5.9017486572265625, "global_step": 58023, "epoch": 1381} {"train_loss": -5.777068138122559, "global_step": 58024, "epoch": 1381} {"train_loss": -5.789782524108887, "global_step": 58025, "epoch": 1381} {"train_loss": -5.8010406494140625, "global_step": 58026, "epoch": 1381} {"train_loss": -5.894855499267578, "global_step": 58027, "epoch": 1381} {"train_loss": -5.9516777992248535, "global_step": 58028, "epoch": 1381} {"train_loss": -5.849092483520508, "global_step": 58029, "epoch": 1381} {"train_loss": -5.806529521942139, "global_step": 58030, "epoch": 1381} {"train_loss": -5.881636619567871, "global_step": 58031, "epoch": 1381} {"train_loss": -5.875097274780273, "global_step": 58032, "epoch": 1381} {"train_loss": -5.849928855895996, "global_step": 58033, "epoch": 1381} {"train_loss": -5.7876996994018555, "global_step": 58034, "epoch": 1381} {"train_loss": -5.744757652282715, "global_step": 58035, "epoch": 1381} {"train_loss": -5.927424430847168, "global_step": 58036, "epoch": 1381} {"train_loss": -5.726039886474609, "global_step": 58037, "epoch": 1381} {"train_loss": -5.826510906219482, "global_step": 58038, "epoch": 1381} {"train_loss": -5.874565124511719, "global_step": 58039, "epoch": 1381} {"train_loss": -5.843617916107178, "global_step": 58040, "epoch": 1381} {"train_loss": -5.85556697845459, "global_step": 58041, "epoch": 1381} {"train_loss": -5.928859710693359, "global_step": 58042, "epoch": 1381} {"train_loss": -5.8523666972205755, "global_step": 58043, "epoch": 1381, "val_loss": 66659.1953125} {"train_loss": -5.820941925048828, "global_step": 58044, "epoch": 1382} {"train_loss": -5.852863788604736, "global_step": 58045, "epoch": 1382} {"train_loss": -5.897043228149414, "global_step": 58046, "epoch": 1382} {"train_loss": -5.869475841522217, "global_step": 58047, "epoch": 1382} {"train_loss": -5.944089889526367, "global_step": 58048, "epoch": 1382} {"train_loss": -5.743017196655273, "global_step": 58049, "epoch": 1382} {"train_loss": -5.89286470413208, "global_step": 58050, "epoch": 1382} {"train_loss": -5.755486488342285, "global_step": 58051, "epoch": 1382} {"train_loss": -5.857479095458984, "global_step": 58052, "epoch": 1382} {"train_loss": -5.724621772766113, "global_step": 58053, "epoch": 1382} {"train_loss": -5.753198623657227, "global_step": 58054, "epoch": 1382} {"train_loss": -5.9165849685668945, "global_step": 58055, "epoch": 1382} {"train_loss": -5.736254692077637, "global_step": 58056, "epoch": 1382} {"train_loss": -5.89484167098999, "global_step": 58057, "epoch": 1382} {"train_loss": -5.865566253662109, "global_step": 58058, "epoch": 1382} {"train_loss": -5.931674003601074, "global_step": 58059, "epoch": 1382} {"train_loss": -5.8415117263793945, "global_step": 58060, "epoch": 1382} {"train_loss": -5.855865478515625, "global_step": 58061, "epoch": 1382} {"train_loss": -5.828589916229248, "global_step": 58062, "epoch": 1382} {"train_loss": -5.894092559814453, "global_step": 58063, "epoch": 1382} {"train_loss": -5.765941619873047, "global_step": 58064, "epoch": 1382} {"train_loss": -5.948741912841797, "global_step": 58065, "epoch": 1382} {"train_loss": -5.813780307769775, "global_step": 58066, "epoch": 1382} {"train_loss": -5.845605373382568, "global_step": 58067, "epoch": 1382} {"train_loss": -5.691349506378174, "global_step": 58068, "epoch": 1382} {"train_loss": -5.870963096618652, "global_step": 58069, "epoch": 1382} {"train_loss": -5.893606662750244, "global_step": 58070, "epoch": 1382} {"train_loss": -5.720518589019775, "global_step": 58071, "epoch": 1382} {"train_loss": -5.786752700805664, "global_step": 58072, "epoch": 1382} {"train_loss": -5.88630485534668, "global_step": 58073, "epoch": 1382} {"train_loss": -5.738138198852539, "global_step": 58074, "epoch": 1382} {"train_loss": -5.8248395919799805, "global_step": 58075, "epoch": 1382} {"train_loss": -5.962851047515869, "global_step": 58076, "epoch": 1382} {"train_loss": -5.963083744049072, "global_step": 58077, "epoch": 1382} {"train_loss": -5.8975019454956055, "global_step": 58078, "epoch": 1382} {"train_loss": -5.654794216156006, "global_step": 58079, "epoch": 1382} {"train_loss": -5.936987400054932, "global_step": 58080, "epoch": 1382} {"train_loss": -5.813431739807129, "global_step": 58081, "epoch": 1382} {"train_loss": -5.782444953918457, "global_step": 58082, "epoch": 1382} {"train_loss": -5.800597667694092, "global_step": 58083, "epoch": 1382} {"train_loss": -5.822898864746094, "global_step": 58084, "epoch": 1382} {"train_loss": -5.836256583531697, "global_step": 58085, "epoch": 1382, "val_loss": 66802.3046875} {"train_loss": -5.778285980224609, "global_step": 58086, "epoch": 1383} {"train_loss": -5.804548263549805, "global_step": 58087, "epoch": 1383} {"train_loss": -5.94260311126709, "global_step": 58088, "epoch": 1383} {"train_loss": -5.839980602264404, "global_step": 58089, "epoch": 1383} {"train_loss": -5.798713207244873, "global_step": 58090, "epoch": 1383} {"train_loss": -5.804514408111572, "global_step": 58091, "epoch": 1383} {"train_loss": -5.821671962738037, "global_step": 58092, "epoch": 1383} {"train_loss": -5.838120460510254, "global_step": 58093, "epoch": 1383} {"train_loss": -5.865769386291504, "global_step": 58094, "epoch": 1383} {"train_loss": -5.931468486785889, "global_step": 58095, "epoch": 1383} {"train_loss": -5.912787437438965, "global_step": 58096, "epoch": 1383} {"train_loss": -5.779659271240234, "global_step": 58097, "epoch": 1383} {"train_loss": -5.739464282989502, "global_step": 58098, "epoch": 1383} {"train_loss": -5.832202911376953, "global_step": 58099, "epoch": 1383} {"train_loss": -5.875495910644531, "global_step": 58100, "epoch": 1383} {"train_loss": -5.884408473968506, "global_step": 58101, "epoch": 1383} {"train_loss": -5.983675479888916, "global_step": 58102, "epoch": 1383} {"train_loss": -5.83454704284668, "global_step": 58103, "epoch": 1383} {"train_loss": -5.893344402313232, "global_step": 58104, "epoch": 1383} {"train_loss": -5.997469425201416, "global_step": 58105, "epoch": 1383} {"train_loss": -5.9018707275390625, "global_step": 58106, "epoch": 1383} {"train_loss": -5.850279808044434, "global_step": 58107, "epoch": 1383} {"train_loss": -5.92031192779541, "global_step": 58108, "epoch": 1383} {"train_loss": -5.923474311828613, "global_step": 58109, "epoch": 1383} {"train_loss": -5.91366720199585, "global_step": 58110, "epoch": 1383} {"train_loss": -5.865767478942871, "global_step": 58111, "epoch": 1383} {"train_loss": -5.846446990966797, "global_step": 58112, "epoch": 1383} {"train_loss": -5.889499664306641, "global_step": 58113, "epoch": 1383} {"train_loss": -5.790851593017578, "global_step": 58114, "epoch": 1383} {"train_loss": -5.914230823516846, "global_step": 58115, "epoch": 1383} {"train_loss": -5.890652656555176, "global_step": 58116, "epoch": 1383} {"train_loss": -5.7906975746154785, "global_step": 58117, "epoch": 1383} {"train_loss": -5.871896743774414, "global_step": 58118, "epoch": 1383} {"train_loss": -5.8231892585754395, "global_step": 58119, "epoch": 1383} {"train_loss": -5.924136638641357, "global_step": 58120, "epoch": 1383} {"train_loss": -5.8685173988342285, "global_step": 58121, "epoch": 1383} {"train_loss": -5.857677459716797, "global_step": 58122, "epoch": 1383} {"train_loss": -5.759184837341309, "global_step": 58123, "epoch": 1383} {"train_loss": -5.778683662414551, "global_step": 58124, "epoch": 1383} {"train_loss": -5.915740966796875, "global_step": 58125, "epoch": 1383} {"train_loss": -5.824782371520996, "global_step": 58126, "epoch": 1383} {"train_loss": -5.860727673485165, "global_step": 58127, "epoch": 1383, "val_loss": 66915.2890625} {"train_loss": -5.914122104644775, "global_step": 58128, "epoch": 1384} {"train_loss": -5.736026763916016, "global_step": 58129, "epoch": 1384} {"train_loss": -5.884985446929932, "global_step": 58130, "epoch": 1384} {"train_loss": -5.8209004402160645, "global_step": 58131, "epoch": 1384} {"train_loss": -5.920467376708984, "global_step": 58132, "epoch": 1384} {"train_loss": -5.64222526550293, "global_step": 58133, "epoch": 1384} {"train_loss": -5.820256233215332, "global_step": 58134, "epoch": 1384} {"train_loss": -5.861111640930176, "global_step": 58135, "epoch": 1384} {"train_loss": -5.732424259185791, "global_step": 58136, "epoch": 1384} {"train_loss": -5.968530654907227, "global_step": 58137, "epoch": 1384} {"train_loss": -5.8636064529418945, "global_step": 58138, "epoch": 1384} {"train_loss": -5.84819221496582, "global_step": 58139, "epoch": 1384} {"train_loss": -5.718887805938721, "global_step": 58140, "epoch": 1384} {"train_loss": -5.8961029052734375, "global_step": 58141, "epoch": 1384} {"train_loss": -5.920915603637695, "global_step": 58142, "epoch": 1384} {"train_loss": -5.886166095733643, "global_step": 58143, "epoch": 1384} {"train_loss": -5.940070152282715, "global_step": 58144, "epoch": 1384} {"train_loss": -5.85746955871582, "global_step": 58145, "epoch": 1384} {"train_loss": -5.84083366394043, "global_step": 58146, "epoch": 1384} {"train_loss": -5.86908483505249, "global_step": 58147, "epoch": 1384} {"train_loss": -5.728814125061035, "global_step": 58148, "epoch": 1384} {"train_loss": -5.889449119567871, "global_step": 58149, "epoch": 1384} {"train_loss": -5.828378677368164, "global_step": 58150, "epoch": 1384} {"train_loss": -5.86741828918457, "global_step": 58151, "epoch": 1384} {"train_loss": -5.917623043060303, "global_step": 58152, "epoch": 1384} {"train_loss": -5.838107585906982, "global_step": 58153, "epoch": 1384} {"train_loss": -5.777829647064209, "global_step": 58154, "epoch": 1384} {"train_loss": -5.782386302947998, "global_step": 58155, "epoch": 1384} {"train_loss": -5.834402561187744, "global_step": 58156, "epoch": 1384} {"train_loss": -5.8337202072143555, "global_step": 58157, "epoch": 1384} {"train_loss": -5.902963161468506, "global_step": 58158, "epoch": 1384} {"train_loss": -5.859731674194336, "global_step": 58159, "epoch": 1384} {"train_loss": -5.7523298263549805, "global_step": 58160, "epoch": 1384} {"train_loss": -5.8189544677734375, "global_step": 58161, "epoch": 1384} {"train_loss": -5.793954849243164, "global_step": 58162, "epoch": 1384} {"train_loss": -5.9020915031433105, "global_step": 58163, "epoch": 1384} {"train_loss": -5.808377265930176, "global_step": 58164, "epoch": 1384} {"train_loss": -5.863992691040039, "global_step": 58165, "epoch": 1384} {"train_loss": -5.843602180480957, "global_step": 58166, "epoch": 1384} {"train_loss": -5.818173408508301, "global_step": 58167, "epoch": 1384} {"train_loss": -5.936519145965576, "global_step": 58168, "epoch": 1384} {"train_loss": -5.842246328081403, "global_step": 58169, "epoch": 1384, "val_loss": 66510.2421875} {"train_loss": -5.872385025024414, "global_step": 58170, "epoch": 1385} {"train_loss": -5.824118137359619, "global_step": 58171, "epoch": 1385} {"train_loss": -5.835247039794922, "global_step": 58172, "epoch": 1385} {"train_loss": -5.858561992645264, "global_step": 58173, "epoch": 1385} {"train_loss": -5.925697326660156, "global_step": 58174, "epoch": 1385} {"train_loss": -5.853841781616211, "global_step": 58175, "epoch": 1385} {"train_loss": -5.924800872802734, "global_step": 58176, "epoch": 1385} {"train_loss": -5.887600898742676, "global_step": 58177, "epoch": 1385} {"train_loss": -5.785855293273926, "global_step": 58178, "epoch": 1385} {"train_loss": -5.861468315124512, "global_step": 58179, "epoch": 1385} {"train_loss": -5.884827613830566, "global_step": 58180, "epoch": 1385} {"train_loss": -5.907336235046387, "global_step": 58181, "epoch": 1385} {"train_loss": -5.933014869689941, "global_step": 58182, "epoch": 1385} {"train_loss": -5.841736793518066, "global_step": 58183, "epoch": 1385} {"train_loss": -5.833374977111816, "global_step": 58184, "epoch": 1385} {"train_loss": -5.90501594543457, "global_step": 58185, "epoch": 1385} {"train_loss": -5.848812103271484, "global_step": 58186, "epoch": 1385} {"train_loss": -5.78754186630249, "global_step": 58187, "epoch": 1385} {"train_loss": -5.846970558166504, "global_step": 58188, "epoch": 1385} {"train_loss": -5.816721439361572, "global_step": 58189, "epoch": 1385} {"train_loss": -5.998847961425781, "global_step": 58190, "epoch": 1385} {"train_loss": -5.78306770324707, "global_step": 58191, "epoch": 1385} {"train_loss": -5.937082290649414, "global_step": 58192, "epoch": 1385} {"train_loss": -5.816481590270996, "global_step": 58193, "epoch": 1385} {"train_loss": -5.901182174682617, "global_step": 58194, "epoch": 1385} {"train_loss": -5.851408004760742, "global_step": 58195, "epoch": 1385} {"train_loss": -5.756863594055176, "global_step": 58196, "epoch": 1385} {"train_loss": -5.87149715423584, "global_step": 58197, "epoch": 1385} {"train_loss": -5.730538368225098, "global_step": 58198, "epoch": 1385} {"train_loss": -5.837908744812012, "global_step": 58199, "epoch": 1385} {"train_loss": -5.838393688201904, "global_step": 58200, "epoch": 1385} {"train_loss": -5.858536720275879, "global_step": 58201, "epoch": 1385} {"train_loss": -5.871262550354004, "global_step": 58202, "epoch": 1385} {"train_loss": -5.884522914886475, "global_step": 58203, "epoch": 1385} {"train_loss": -5.950082778930664, "global_step": 58204, "epoch": 1385} {"train_loss": -5.831148147583008, "global_step": 58205, "epoch": 1385} {"train_loss": -5.956286430358887, "global_step": 58206, "epoch": 1385} {"train_loss": -5.932507514953613, "global_step": 58207, "epoch": 1385} {"train_loss": -5.888737678527832, "global_step": 58208, "epoch": 1385} {"train_loss": -5.861856937408447, "global_step": 58209, "epoch": 1385} {"train_loss": -5.990311145782471, "global_step": 58210, "epoch": 1385} {"train_loss": -5.8713163648332864, "global_step": 58211, "epoch": 1385, "val_loss": 66480.3359375} {"train_loss": -5.875068187713623, "global_step": 58212, "epoch": 1386} {"train_loss": -5.919390678405762, "global_step": 58213, "epoch": 1386} {"train_loss": -5.939661026000977, "global_step": 58214, "epoch": 1386} {"train_loss": -6.037537574768066, "global_step": 58215, "epoch": 1386} {"train_loss": -5.779699802398682, "global_step": 58216, "epoch": 1386} {"train_loss": -5.910342216491699, "global_step": 58217, "epoch": 1386} {"train_loss": -5.874333381652832, "global_step": 58218, "epoch": 1386} {"train_loss": -5.936188220977783, "global_step": 58219, "epoch": 1386} {"train_loss": -5.892265796661377, "global_step": 58220, "epoch": 1386} {"train_loss": -5.902370452880859, "global_step": 58221, "epoch": 1386} {"train_loss": -5.954037666320801, "global_step": 58222, "epoch": 1386} {"train_loss": -5.8501081466674805, "global_step": 58223, "epoch": 1386} {"train_loss": -5.979004859924316, "global_step": 58224, "epoch": 1386} {"train_loss": -5.8528666496276855, "global_step": 58225, "epoch": 1386} {"train_loss": -5.823807716369629, "global_step": 58226, "epoch": 1386} {"train_loss": -5.871947288513184, "global_step": 58227, "epoch": 1386} {"train_loss": -5.864908695220947, "global_step": 58228, "epoch": 1386} {"train_loss": -5.917719841003418, "global_step": 58229, "epoch": 1386} {"train_loss": -5.776971817016602, "global_step": 58230, "epoch": 1386} {"train_loss": -5.91422700881958, "global_step": 58231, "epoch": 1386} {"train_loss": -5.935581207275391, "global_step": 58232, "epoch": 1386} {"train_loss": -5.957159996032715, "global_step": 58233, "epoch": 1386} {"train_loss": -5.881598472595215, "global_step": 58234, "epoch": 1386} {"train_loss": -5.788021087646484, "global_step": 58235, "epoch": 1386} {"train_loss": -6.02856969833374, "global_step": 58236, "epoch": 1386} {"train_loss": -5.788819313049316, "global_step": 58237, "epoch": 1386} {"train_loss": -5.884111404418945, "global_step": 58238, "epoch": 1386} {"train_loss": -5.833122730255127, "global_step": 58239, "epoch": 1386} {"train_loss": -5.938779830932617, "global_step": 58240, "epoch": 1386} {"train_loss": -5.859542369842529, "global_step": 58241, "epoch": 1386} {"train_loss": -5.822124004364014, "global_step": 58242, "epoch": 1386} {"train_loss": -5.913524627685547, "global_step": 58243, "epoch": 1386} {"train_loss": -5.745798587799072, "global_step": 58244, "epoch": 1386} {"train_loss": -5.850028038024902, "global_step": 58245, "epoch": 1386} {"train_loss": -5.879061698913574, "global_step": 58246, "epoch": 1386} {"train_loss": -5.825416564941406, "global_step": 58247, "epoch": 1386} {"train_loss": -5.846527099609375, "global_step": 58248, "epoch": 1386} {"train_loss": -5.840315818786621, "global_step": 58249, "epoch": 1386} {"train_loss": -5.748555660247803, "global_step": 58250, "epoch": 1386} {"train_loss": -5.852746963500977, "global_step": 58251, "epoch": 1386} {"train_loss": -5.631857872009277, "global_step": 58252, "epoch": 1386} {"train_loss": -5.8676212174551825, "global_step": 58253, "epoch": 1386, "val_loss": 66892.0859375} {"train_loss": -5.760255813598633, "global_step": 58254, "epoch": 1387} {"train_loss": -5.853780746459961, "global_step": 58255, "epoch": 1387} {"train_loss": -5.815944671630859, "global_step": 58256, "epoch": 1387} {"train_loss": -5.753872871398926, "global_step": 58257, "epoch": 1387} {"train_loss": -5.873683929443359, "global_step": 58258, "epoch": 1387} {"train_loss": -5.823137283325195, "global_step": 58259, "epoch": 1387} {"train_loss": -5.886269569396973, "global_step": 58260, "epoch": 1387} {"train_loss": -5.841792106628418, "global_step": 58261, "epoch": 1387} {"train_loss": -5.869021892547607, "global_step": 58262, "epoch": 1387} {"train_loss": -5.844636917114258, "global_step": 58263, "epoch": 1387} {"train_loss": -5.624762535095215, "global_step": 58264, "epoch": 1387} {"train_loss": -5.742281913757324, "global_step": 58265, "epoch": 1387} {"train_loss": -5.80306339263916, "global_step": 58266, "epoch": 1387} {"train_loss": -5.819547176361084, "global_step": 58267, "epoch": 1387} {"train_loss": -5.794463634490967, "global_step": 58268, "epoch": 1387} {"train_loss": -5.834744930267334, "global_step": 58269, "epoch": 1387} {"train_loss": -5.717626571655273, "global_step": 58270, "epoch": 1387} {"train_loss": -5.80002498626709, "global_step": 58271, "epoch": 1387} {"train_loss": -5.880751609802246, "global_step": 58272, "epoch": 1387} {"train_loss": -5.796822547912598, "global_step": 58273, "epoch": 1387} {"train_loss": -5.800369739532471, "global_step": 58274, "epoch": 1387} {"train_loss": -5.794365406036377, "global_step": 58275, "epoch": 1387} {"train_loss": -5.700118064880371, "global_step": 58276, "epoch": 1387} {"train_loss": -5.9001970291137695, "global_step": 58277, "epoch": 1387} {"train_loss": -5.9281086921691895, "global_step": 58278, "epoch": 1387} {"train_loss": -5.816498756408691, "global_step": 58279, "epoch": 1387} {"train_loss": -5.829309463500977, "global_step": 58280, "epoch": 1387} {"train_loss": -5.907045364379883, "global_step": 58281, "epoch": 1387} {"train_loss": -5.720047950744629, "global_step": 58282, "epoch": 1387} {"train_loss": -5.769046783447266, "global_step": 58283, "epoch": 1387} {"train_loss": -5.914177894592285, "global_step": 58284, "epoch": 1387} {"train_loss": -5.893817901611328, "global_step": 58285, "epoch": 1387} {"train_loss": -5.934412002563477, "global_step": 58286, "epoch": 1387} {"train_loss": -5.920787334442139, "global_step": 58287, "epoch": 1387} {"train_loss": -5.938310623168945, "global_step": 58288, "epoch": 1387} {"train_loss": -5.936226844787598, "global_step": 58289, "epoch": 1387} {"train_loss": -5.787117958068848, "global_step": 58290, "epoch": 1387} {"train_loss": -5.6559247970581055, "global_step": 58291, "epoch": 1387} {"train_loss": -5.893571376800537, "global_step": 58292, "epoch": 1387} {"train_loss": -5.823606491088867, "global_step": 58293, "epoch": 1387} {"train_loss": -5.840731620788574, "global_step": 58294, "epoch": 1387} {"train_loss": -5.827274617694673, "global_step": 58295, "epoch": 1387, "val_loss": 66584.125} {"train_loss": -5.747271537780762, "global_step": 58296, "epoch": 1388} {"train_loss": -5.862776756286621, "global_step": 58297, "epoch": 1388} {"train_loss": -5.8813042640686035, "global_step": 58298, "epoch": 1388} {"train_loss": -5.753445625305176, "global_step": 58299, "epoch": 1388} {"train_loss": -5.656769752502441, "global_step": 58300, "epoch": 1388} {"train_loss": -5.818442344665527, "global_step": 58301, "epoch": 1388} {"train_loss": -5.867130279541016, "global_step": 58302, "epoch": 1388} {"train_loss": -5.770089149475098, "global_step": 58303, "epoch": 1388} {"train_loss": -5.803332328796387, "global_step": 58304, "epoch": 1388} {"train_loss": -6.000554084777832, "global_step": 58305, "epoch": 1388} {"train_loss": -5.855649471282959, "global_step": 58306, "epoch": 1388} {"train_loss": -5.791518211364746, "global_step": 58307, "epoch": 1388} {"train_loss": -5.815377235412598, "global_step": 58308, "epoch": 1388} {"train_loss": -5.91847038269043, "global_step": 58309, "epoch": 1388} {"train_loss": -5.923360347747803, "global_step": 58310, "epoch": 1388} {"train_loss": -5.832669734954834, "global_step": 58311, "epoch": 1388} {"train_loss": -5.900388240814209, "global_step": 58312, "epoch": 1388} {"train_loss": -5.817015647888184, "global_step": 58313, "epoch": 1388} {"train_loss": -5.802587509155273, "global_step": 58314, "epoch": 1388} {"train_loss": -6.007903099060059, "global_step": 58315, "epoch": 1388} {"train_loss": -5.885443210601807, "global_step": 58316, "epoch": 1388} {"train_loss": -5.880760669708252, "global_step": 58317, "epoch": 1388} {"train_loss": -5.777307033538818, "global_step": 58318, "epoch": 1388} {"train_loss": -5.822248458862305, "global_step": 58319, "epoch": 1388} {"train_loss": -5.914176940917969, "global_step": 58320, "epoch": 1388} {"train_loss": -5.954334259033203, "global_step": 58321, "epoch": 1388} {"train_loss": -5.695664405822754, "global_step": 58322, "epoch": 1388} {"train_loss": -5.8478803634643555, "global_step": 58323, "epoch": 1388} {"train_loss": -5.728517532348633, "global_step": 58324, "epoch": 1388} {"train_loss": -5.739768028259277, "global_step": 58325, "epoch": 1388} {"train_loss": -5.765273571014404, "global_step": 58326, "epoch": 1388} {"train_loss": -5.841699600219727, "global_step": 58327, "epoch": 1388} {"train_loss": -5.873624801635742, "global_step": 58328, "epoch": 1388} {"train_loss": -5.81060791015625, "global_step": 58329, "epoch": 1388} {"train_loss": -5.8670759201049805, "global_step": 58330, "epoch": 1388} {"train_loss": -5.733386993408203, "global_step": 58331, "epoch": 1388} {"train_loss": -5.941305160522461, "global_step": 58332, "epoch": 1388} {"train_loss": -5.8675055503845215, "global_step": 58333, "epoch": 1388} {"train_loss": -5.931523323059082, "global_step": 58334, "epoch": 1388} {"train_loss": -5.88729190826416, "global_step": 58335, "epoch": 1388} {"train_loss": -5.760647296905518, "global_step": 58336, "epoch": 1388} {"train_loss": -5.837553330830166, "global_step": 58337, "epoch": 1388, "val_loss": 66823.5625} {"train_loss": -5.888312816619873, "global_step": 58338, "epoch": 1389} {"train_loss": -5.848982810974121, "global_step": 58339, "epoch": 1389} {"train_loss": -5.772025108337402, "global_step": 58340, "epoch": 1389} {"train_loss": -5.810190200805664, "global_step": 58341, "epoch": 1389} {"train_loss": -5.752134323120117, "global_step": 58342, "epoch": 1389} {"train_loss": -5.828533172607422, "global_step": 58343, "epoch": 1389} {"train_loss": -5.950942039489746, "global_step": 58344, "epoch": 1389} {"train_loss": -5.83709716796875, "global_step": 58345, "epoch": 1389} {"train_loss": -5.823554039001465, "global_step": 58346, "epoch": 1389} {"train_loss": -5.699317932128906, "global_step": 58347, "epoch": 1389} {"train_loss": -5.937830924987793, "global_step": 58348, "epoch": 1389} {"train_loss": -5.904255390167236, "global_step": 58349, "epoch": 1389} {"train_loss": -5.878882884979248, "global_step": 58350, "epoch": 1389} {"train_loss": -5.828866958618164, "global_step": 58351, "epoch": 1389} {"train_loss": -5.912133693695068, "global_step": 58352, "epoch": 1389} {"train_loss": -6.022119045257568, "global_step": 58353, "epoch": 1389} {"train_loss": -5.869596004486084, "global_step": 58354, "epoch": 1389} {"train_loss": -5.766251087188721, "global_step": 58355, "epoch": 1389} {"train_loss": -5.879806995391846, "global_step": 58356, "epoch": 1389} {"train_loss": -5.829277515411377, "global_step": 58357, "epoch": 1389} {"train_loss": -5.781719207763672, "global_step": 58358, "epoch": 1389} {"train_loss": -5.88588809967041, "global_step": 58359, "epoch": 1389} {"train_loss": -5.997707843780518, "global_step": 58360, "epoch": 1389} {"train_loss": -5.8289995193481445, "global_step": 58361, "epoch": 1389} {"train_loss": -5.84250545501709, "global_step": 58362, "epoch": 1389} {"train_loss": -5.945158004760742, "global_step": 58363, "epoch": 1389} {"train_loss": -5.70947265625, "global_step": 58364, "epoch": 1389} {"train_loss": -5.889863967895508, "global_step": 58365, "epoch": 1389} {"train_loss": -5.931408882141113, "global_step": 58366, "epoch": 1389} {"train_loss": -5.783924102783203, "global_step": 58367, "epoch": 1389} {"train_loss": -5.821328163146973, "global_step": 58368, "epoch": 1389} {"train_loss": -5.978504657745361, "global_step": 58369, "epoch": 1389} {"train_loss": -5.86496639251709, "global_step": 58370, "epoch": 1389} {"train_loss": -5.690941333770752, "global_step": 58371, "epoch": 1389} {"train_loss": -5.9642744064331055, "global_step": 58372, "epoch": 1389} {"train_loss": -5.719247817993164, "global_step": 58373, "epoch": 1389} {"train_loss": -5.855381488800049, "global_step": 58374, "epoch": 1389} {"train_loss": -5.847063064575195, "global_step": 58375, "epoch": 1389} {"train_loss": -5.652774810791016, "global_step": 58376, "epoch": 1389} {"train_loss": -5.872323036193848, "global_step": 58377, "epoch": 1389} {"train_loss": -5.8493876457214355, "global_step": 58378, "epoch": 1389} {"train_loss": -5.845382077353341, "global_step": 58379, "epoch": 1389, "val_loss": 66688.359375} {"train_loss": -5.873351573944092, "global_step": 58380, "epoch": 1390} {"train_loss": -5.928251266479492, "global_step": 58381, "epoch": 1390} {"train_loss": -5.7482404708862305, "global_step": 58382, "epoch": 1390} {"train_loss": -5.986034393310547, "global_step": 58383, "epoch": 1390} {"train_loss": -5.780995845794678, "global_step": 58384, "epoch": 1390} {"train_loss": -5.9113945960998535, "global_step": 58385, "epoch": 1390} {"train_loss": -5.776177883148193, "global_step": 58386, "epoch": 1390} {"train_loss": -5.819293022155762, "global_step": 58387, "epoch": 1390} {"train_loss": -5.795782089233398, "global_step": 58388, "epoch": 1390} {"train_loss": -5.740435600280762, "global_step": 58389, "epoch": 1390} {"train_loss": -5.895271301269531, "global_step": 58390, "epoch": 1390} {"train_loss": -5.879554748535156, "global_step": 58391, "epoch": 1390} {"train_loss": -5.871577739715576, "global_step": 58392, "epoch": 1390} {"train_loss": -5.949735164642334, "global_step": 58393, "epoch": 1390} {"train_loss": -5.8748579025268555, "global_step": 58394, "epoch": 1390} {"train_loss": -5.870967864990234, "global_step": 58395, "epoch": 1390} {"train_loss": -5.895232677459717, "global_step": 58396, "epoch": 1390} {"train_loss": -5.871916770935059, "global_step": 58397, "epoch": 1390} {"train_loss": -5.863122940063477, "global_step": 58398, "epoch": 1390} {"train_loss": -5.816133499145508, "global_step": 58399, "epoch": 1390} {"train_loss": -5.910403728485107, "global_step": 58400, "epoch": 1390} {"train_loss": -5.936150550842285, "global_step": 58401, "epoch": 1390} {"train_loss": -5.91370153427124, "global_step": 58402, "epoch": 1390} {"train_loss": -5.911820888519287, "global_step": 58403, "epoch": 1390} {"train_loss": -5.852123260498047, "global_step": 58404, "epoch": 1390} {"train_loss": -5.770849704742432, "global_step": 58405, "epoch": 1390} {"train_loss": -5.837292194366455, "global_step": 58406, "epoch": 1390} {"train_loss": -5.937861442565918, "global_step": 58407, "epoch": 1390} {"train_loss": -5.888406753540039, "global_step": 58408, "epoch": 1390} {"train_loss": -5.855915069580078, "global_step": 58409, "epoch": 1390} {"train_loss": -5.9160308837890625, "global_step": 58410, "epoch": 1390} {"train_loss": -5.929421901702881, "global_step": 58411, "epoch": 1390} {"train_loss": -5.959959983825684, "global_step": 58412, "epoch": 1390} {"train_loss": -5.818849563598633, "global_step": 58413, "epoch": 1390} {"train_loss": -6.036518096923828, "global_step": 58414, "epoch": 1390} {"train_loss": -5.781352996826172, "global_step": 58415, "epoch": 1390} {"train_loss": -5.90464973449707, "global_step": 58416, "epoch": 1390} {"train_loss": -5.929574966430664, "global_step": 58417, "epoch": 1390} {"train_loss": -5.9136271476745605, "global_step": 58418, "epoch": 1390} {"train_loss": -5.8469109535217285, "global_step": 58419, "epoch": 1390} {"train_loss": -5.895036697387695, "global_step": 58420, "epoch": 1390} {"train_loss": -5.875819649015154, "global_step": 58421, "epoch": 1390, "val_loss": 66720.2421875} {"train_loss": -5.87506103515625, "global_step": 58422, "epoch": 1391} {"train_loss": -5.9420599937438965, "global_step": 58423, "epoch": 1391} {"train_loss": -5.898109436035156, "global_step": 58424, "epoch": 1391} {"train_loss": -5.807750701904297, "global_step": 58425, "epoch": 1391} {"train_loss": -5.804117679595947, "global_step": 58426, "epoch": 1391} {"train_loss": -6.012748718261719, "global_step": 58427, "epoch": 1391} {"train_loss": -5.955857276916504, "global_step": 58428, "epoch": 1391} {"train_loss": -5.8074631690979, "global_step": 58429, "epoch": 1391} {"train_loss": -5.940423965454102, "global_step": 58430, "epoch": 1391} {"train_loss": -5.867820739746094, "global_step": 58431, "epoch": 1391} {"train_loss": -5.864342212677002, "global_step": 58432, "epoch": 1391} {"train_loss": -5.969460487365723, "global_step": 58433, "epoch": 1391} {"train_loss": -5.868196964263916, "global_step": 58434, "epoch": 1391} {"train_loss": -5.898819923400879, "global_step": 58435, "epoch": 1391} {"train_loss": -5.874551773071289, "global_step": 58436, "epoch": 1391} {"train_loss": -5.896013259887695, "global_step": 58437, "epoch": 1391} {"train_loss": -5.875263214111328, "global_step": 58438, "epoch": 1391} {"train_loss": -5.955312252044678, "global_step": 58439, "epoch": 1391} {"train_loss": -5.861791133880615, "global_step": 58440, "epoch": 1391} {"train_loss": -6.019845008850098, "global_step": 58441, "epoch": 1391} {"train_loss": -5.93760871887207, "global_step": 58442, "epoch": 1391} {"train_loss": -5.887638092041016, "global_step": 58443, "epoch": 1391} {"train_loss": -5.960291862487793, "global_step": 58444, "epoch": 1391} {"train_loss": -5.96806001663208, "global_step": 58445, "epoch": 1391} {"train_loss": -5.887879371643066, "global_step": 58446, "epoch": 1391} {"train_loss": -5.956035614013672, "global_step": 58447, "epoch": 1391} {"train_loss": -5.81229829788208, "global_step": 58448, "epoch": 1391} {"train_loss": -5.877442359924316, "global_step": 58449, "epoch": 1391} {"train_loss": -5.77936315536499, "global_step": 58450, "epoch": 1391} {"train_loss": -5.855783462524414, "global_step": 58451, "epoch": 1391} {"train_loss": -5.868240833282471, "global_step": 58452, "epoch": 1391} {"train_loss": -5.8482465744018555, "global_step": 58453, "epoch": 1391} {"train_loss": -5.923763275146484, "global_step": 58454, "epoch": 1391} {"train_loss": -5.862854957580566, "global_step": 58455, "epoch": 1391} {"train_loss": -5.868225574493408, "global_step": 58456, "epoch": 1391} {"train_loss": -5.71634578704834, "global_step": 58457, "epoch": 1391} {"train_loss": -5.806245803833008, "global_step": 58458, "epoch": 1391} {"train_loss": -5.919221878051758, "global_step": 58459, "epoch": 1391} {"train_loss": -5.88194465637207, "global_step": 58460, "epoch": 1391} {"train_loss": -5.889472961425781, "global_step": 58461, "epoch": 1391} {"train_loss": -5.861909866333008, "global_step": 58462, "epoch": 1391} {"train_loss": -5.887636320931571, "global_step": 58463, "epoch": 1391, "val_loss": 66545.609375} {"train_loss": -5.869870185852051, "global_step": 58464, "epoch": 1392} {"train_loss": -5.7892746925354, "global_step": 58465, "epoch": 1392} {"train_loss": -5.835826396942139, "global_step": 58466, "epoch": 1392} {"train_loss": -5.934870719909668, "global_step": 58467, "epoch": 1392} {"train_loss": -5.781344413757324, "global_step": 58468, "epoch": 1392} {"train_loss": -5.916106224060059, "global_step": 58469, "epoch": 1392} {"train_loss": -5.9215521812438965, "global_step": 58470, "epoch": 1392} {"train_loss": -5.682177543640137, "global_step": 58471, "epoch": 1392} {"train_loss": -5.997234344482422, "global_step": 58472, "epoch": 1392} {"train_loss": -5.784878730773926, "global_step": 58473, "epoch": 1392} {"train_loss": -5.8139519691467285, "global_step": 58474, "epoch": 1392} {"train_loss": -5.90955114364624, "global_step": 58475, "epoch": 1392} {"train_loss": -5.807024002075195, "global_step": 58476, "epoch": 1392} {"train_loss": -5.857478618621826, "global_step": 58477, "epoch": 1392} {"train_loss": -5.870903015136719, "global_step": 58478, "epoch": 1392} {"train_loss": -5.859697341918945, "global_step": 58479, "epoch": 1392} {"train_loss": -5.93096923828125, "global_step": 58480, "epoch": 1392} {"train_loss": -5.928869247436523, "global_step": 58481, "epoch": 1392} {"train_loss": -5.865218639373779, "global_step": 58482, "epoch": 1392} {"train_loss": -5.669132232666016, "global_step": 58483, "epoch": 1392} {"train_loss": -5.809013366699219, "global_step": 58484, "epoch": 1392} {"train_loss": -5.725004196166992, "global_step": 58485, "epoch": 1392} {"train_loss": -5.879673957824707, "global_step": 58486, "epoch": 1392} {"train_loss": -5.784201622009277, "global_step": 58487, "epoch": 1392} {"train_loss": -5.880562782287598, "global_step": 58488, "epoch": 1392} {"train_loss": -5.780637741088867, "global_step": 58489, "epoch": 1392} {"train_loss": -5.872806549072266, "global_step": 58490, "epoch": 1392} {"train_loss": -5.909913063049316, "global_step": 58491, "epoch": 1392} {"train_loss": -5.817258834838867, "global_step": 58492, "epoch": 1392} {"train_loss": -5.732551097869873, "global_step": 58493, "epoch": 1392} {"train_loss": -5.893548965454102, "global_step": 58494, "epoch": 1392} {"train_loss": -5.681785583496094, "global_step": 58495, "epoch": 1392} {"train_loss": -5.755483627319336, "global_step": 58496, "epoch": 1392} {"train_loss": -5.880620956420898, "global_step": 58497, "epoch": 1392} {"train_loss": -5.834568977355957, "global_step": 58498, "epoch": 1392} {"train_loss": -5.812712669372559, "global_step": 58499, "epoch": 1392} {"train_loss": -5.719059944152832, "global_step": 58500, "epoch": 1392} {"train_loss": -5.754847049713135, "global_step": 58501, "epoch": 1392} {"train_loss": -5.863921165466309, "global_step": 58502, "epoch": 1392} {"train_loss": -5.862606048583984, "global_step": 58503, "epoch": 1392} {"train_loss": -5.768395900726318, "global_step": 58504, "epoch": 1392} {"train_loss": -5.83191796711513, "global_step": 58505, "epoch": 1392, "val_loss": 66782.6640625} {"train_loss": -5.788435935974121, "global_step": 58506, "epoch": 1393} {"train_loss": -5.8596086502075195, "global_step": 58507, "epoch": 1393} {"train_loss": -5.91717004776001, "global_step": 58508, "epoch": 1393} {"train_loss": -5.959867000579834, "global_step": 58509, "epoch": 1393} {"train_loss": -5.847736835479736, "global_step": 58510, "epoch": 1393} {"train_loss": -5.820616722106934, "global_step": 58511, "epoch": 1393} {"train_loss": -5.902580738067627, "global_step": 58512, "epoch": 1393} {"train_loss": -5.881687164306641, "global_step": 58513, "epoch": 1393} {"train_loss": -5.801417350769043, "global_step": 58514, "epoch": 1393} {"train_loss": -5.784626483917236, "global_step": 58515, "epoch": 1393} {"train_loss": -5.949226379394531, "global_step": 58516, "epoch": 1393} {"train_loss": -5.895771026611328, "global_step": 58517, "epoch": 1393} {"train_loss": -5.828440189361572, "global_step": 58518, "epoch": 1393} {"train_loss": -5.888364315032959, "global_step": 58519, "epoch": 1393} {"train_loss": -5.8219804763793945, "global_step": 58520, "epoch": 1393} {"train_loss": -5.89265251159668, "global_step": 58521, "epoch": 1393} {"train_loss": -5.914282321929932, "global_step": 58522, "epoch": 1393} {"train_loss": -5.9528608322143555, "global_step": 58523, "epoch": 1393} {"train_loss": -5.844432830810547, "global_step": 58524, "epoch": 1393} {"train_loss": -5.887888431549072, "global_step": 58525, "epoch": 1393} {"train_loss": -5.916369438171387, "global_step": 58526, "epoch": 1393} {"train_loss": -5.831976413726807, "global_step": 58527, "epoch": 1393} {"train_loss": -5.928833961486816, "global_step": 58528, "epoch": 1393} {"train_loss": -5.772804260253906, "global_step": 58529, "epoch": 1393} {"train_loss": -5.808941841125488, "global_step": 58530, "epoch": 1393} {"train_loss": -5.853348731994629, "global_step": 58531, "epoch": 1393} {"train_loss": -5.8361616134643555, "global_step": 58532, "epoch": 1393} {"train_loss": -5.976067543029785, "global_step": 58533, "epoch": 1393} {"train_loss": -5.862974166870117, "global_step": 58534, "epoch": 1393} {"train_loss": -5.948119163513184, "global_step": 58535, "epoch": 1393} {"train_loss": -5.816469669342041, "global_step": 58536, "epoch": 1393} {"train_loss": -5.871045112609863, "global_step": 58537, "epoch": 1393} {"train_loss": -5.924191474914551, "global_step": 58538, "epoch": 1393} {"train_loss": -5.785062313079834, "global_step": 58539, "epoch": 1393} {"train_loss": -5.809796333312988, "global_step": 58540, "epoch": 1393} {"train_loss": -5.782491683959961, "global_step": 58541, "epoch": 1393} {"train_loss": -5.833950996398926, "global_step": 58542, "epoch": 1393} {"train_loss": -5.963099002838135, "global_step": 58543, "epoch": 1393} {"train_loss": -6.040262222290039, "global_step": 58544, "epoch": 1393} {"train_loss": -5.858726978302002, "global_step": 58545, "epoch": 1393} {"train_loss": -5.828947067260742, "global_step": 58546, "epoch": 1393} {"train_loss": -5.871730600084577, "global_step": 58547, "epoch": 1393, "val_loss": 66505.265625} {"train_loss": -5.881565093994141, "global_step": 58548, "epoch": 1394} {"train_loss": -5.883864402770996, "global_step": 58549, "epoch": 1394} {"train_loss": -5.818275451660156, "global_step": 58550, "epoch": 1394} {"train_loss": -5.885285377502441, "global_step": 58551, "epoch": 1394} {"train_loss": -5.857321739196777, "global_step": 58552, "epoch": 1394} {"train_loss": -5.865412712097168, "global_step": 58553, "epoch": 1394} {"train_loss": -5.931183815002441, "global_step": 58554, "epoch": 1394} {"train_loss": -5.839693069458008, "global_step": 58555, "epoch": 1394} {"train_loss": -5.917964935302734, "global_step": 58556, "epoch": 1394} {"train_loss": -5.8074951171875, "global_step": 58557, "epoch": 1394} {"train_loss": -5.999641418457031, "global_step": 58558, "epoch": 1394} {"train_loss": -5.824678421020508, "global_step": 58559, "epoch": 1394} {"train_loss": -5.9006757736206055, "global_step": 58560, "epoch": 1394} {"train_loss": -5.933549880981445, "global_step": 58561, "epoch": 1394} {"train_loss": -5.883357048034668, "global_step": 58562, "epoch": 1394} {"train_loss": -5.879306793212891, "global_step": 58563, "epoch": 1394} {"train_loss": -5.90352725982666, "global_step": 58564, "epoch": 1394} {"train_loss": -5.807254791259766, "global_step": 58565, "epoch": 1394} {"train_loss": -5.876914978027344, "global_step": 58566, "epoch": 1394} {"train_loss": -5.9612603187561035, "global_step": 58567, "epoch": 1394} {"train_loss": -5.914000988006592, "global_step": 58568, "epoch": 1394} {"train_loss": -5.902394771575928, "global_step": 58569, "epoch": 1394} {"train_loss": -5.864658355712891, "global_step": 58570, "epoch": 1394} {"train_loss": -5.883212089538574, "global_step": 58571, "epoch": 1394} {"train_loss": -6.016462802886963, "global_step": 58572, "epoch": 1394} {"train_loss": -5.876189231872559, "global_step": 58573, "epoch": 1394} {"train_loss": -5.99309778213501, "global_step": 58574, "epoch": 1394} {"train_loss": -5.810802459716797, "global_step": 58575, "epoch": 1394} {"train_loss": -5.904439449310303, "global_step": 58576, "epoch": 1394} {"train_loss": -5.841373443603516, "global_step": 58577, "epoch": 1394} {"train_loss": -6.0096540451049805, "global_step": 58578, "epoch": 1394} {"train_loss": -5.910407066345215, "global_step": 58579, "epoch": 1394} {"train_loss": -5.812130928039551, "global_step": 58580, "epoch": 1394} {"train_loss": -5.852329254150391, "global_step": 58581, "epoch": 1394} {"train_loss": -5.985285758972168, "global_step": 58582, "epoch": 1394} {"train_loss": -5.832781791687012, "global_step": 58583, "epoch": 1394} {"train_loss": -5.892257213592529, "global_step": 58584, "epoch": 1394} {"train_loss": -5.9153571128845215, "global_step": 58585, "epoch": 1394} {"train_loss": -5.989171981811523, "global_step": 58586, "epoch": 1394} {"train_loss": -5.911103248596191, "global_step": 58587, "epoch": 1394} {"train_loss": -5.847464561462402, "global_step": 58588, "epoch": 1394} {"train_loss": -5.893494696844192, "global_step": 58589, "epoch": 1394, "val_loss": 66571.609375} {"train_loss": -5.806746959686279, "global_step": 58590, "epoch": 1395} {"train_loss": -5.862403392791748, "global_step": 58591, "epoch": 1395} {"train_loss": -5.934483528137207, "global_step": 58592, "epoch": 1395} {"train_loss": -5.856531143188477, "global_step": 58593, "epoch": 1395} {"train_loss": -5.9032883644104, "global_step": 58594, "epoch": 1395} {"train_loss": -5.947503089904785, "global_step": 58595, "epoch": 1395} {"train_loss": -5.828797340393066, "global_step": 58596, "epoch": 1395} {"train_loss": -5.937315464019775, "global_step": 58597, "epoch": 1395} {"train_loss": -5.842741012573242, "global_step": 58598, "epoch": 1395} {"train_loss": -5.939701557159424, "global_step": 58599, "epoch": 1395} {"train_loss": -5.892307281494141, "global_step": 58600, "epoch": 1395} {"train_loss": -5.824195384979248, "global_step": 58601, "epoch": 1395} {"train_loss": -5.797153949737549, "global_step": 58602, "epoch": 1395} {"train_loss": -5.8791117668151855, "global_step": 58603, "epoch": 1395} {"train_loss": -5.890579700469971, "global_step": 58604, "epoch": 1395} {"train_loss": -5.903415679931641, "global_step": 58605, "epoch": 1395} {"train_loss": -5.927860260009766, "global_step": 58606, "epoch": 1395} {"train_loss": -5.827289581298828, "global_step": 58607, "epoch": 1395} {"train_loss": -5.89171028137207, "global_step": 58608, "epoch": 1395} {"train_loss": -5.861162185668945, "global_step": 58609, "epoch": 1395} {"train_loss": -5.8301801681518555, "global_step": 58610, "epoch": 1395} {"train_loss": -5.743932723999023, "global_step": 58611, "epoch": 1395} {"train_loss": -5.8416032791137695, "global_step": 58612, "epoch": 1395} {"train_loss": -5.717251777648926, "global_step": 58613, "epoch": 1395} {"train_loss": -5.904741287231445, "global_step": 58614, "epoch": 1395} {"train_loss": -5.946231365203857, "global_step": 58615, "epoch": 1395} {"train_loss": -5.800187110900879, "global_step": 58616, "epoch": 1395} {"train_loss": -5.771998882293701, "global_step": 58617, "epoch": 1395} {"train_loss": -5.818842887878418, "global_step": 58618, "epoch": 1395} {"train_loss": -5.764077186584473, "global_step": 58619, "epoch": 1395} {"train_loss": -5.798791885375977, "global_step": 58620, "epoch": 1395} {"train_loss": -5.901875972747803, "global_step": 58621, "epoch": 1395} {"train_loss": -5.7113142013549805, "global_step": 58622, "epoch": 1395} {"train_loss": -5.803596496582031, "global_step": 58623, "epoch": 1395} {"train_loss": -5.919316291809082, "global_step": 58624, "epoch": 1395} {"train_loss": -5.932815074920654, "global_step": 58625, "epoch": 1395} {"train_loss": -5.985840797424316, "global_step": 58626, "epoch": 1395} {"train_loss": -5.8279008865356445, "global_step": 58627, "epoch": 1395} {"train_loss": -5.8903398513793945, "global_step": 58628, "epoch": 1395} {"train_loss": -5.977352142333984, "global_step": 58629, "epoch": 1395} {"train_loss": -5.76119327545166, "global_step": 58630, "epoch": 1395} {"train_loss": -5.859587124415806, "global_step": 58631, "epoch": 1395, "val_loss": 66796.9296875} {"train_loss": -5.933588981628418, "global_step": 58632, "epoch": 1396} {"train_loss": -5.831515789031982, "global_step": 58633, "epoch": 1396} {"train_loss": -5.92828893661499, "global_step": 58634, "epoch": 1396} {"train_loss": -5.801090240478516, "global_step": 58635, "epoch": 1396} {"train_loss": -5.841479301452637, "global_step": 58636, "epoch": 1396} {"train_loss": -5.821189880371094, "global_step": 58637, "epoch": 1396} {"train_loss": -5.7852373123168945, "global_step": 58638, "epoch": 1396} {"train_loss": -5.882785320281982, "global_step": 58639, "epoch": 1396} {"train_loss": -5.81511116027832, "global_step": 58640, "epoch": 1396} {"train_loss": -5.950858116149902, "global_step": 58641, "epoch": 1396} {"train_loss": -5.840995788574219, "global_step": 58642, "epoch": 1396} {"train_loss": -5.880182266235352, "global_step": 58643, "epoch": 1396} {"train_loss": -5.8510003089904785, "global_step": 58644, "epoch": 1396} {"train_loss": -5.936387062072754, "global_step": 58645, "epoch": 1396} {"train_loss": -5.713397026062012, "global_step": 58646, "epoch": 1396} {"train_loss": -5.788926124572754, "global_step": 58647, "epoch": 1396} {"train_loss": -5.90704345703125, "global_step": 58648, "epoch": 1396} {"train_loss": -5.855891227722168, "global_step": 58649, "epoch": 1396} {"train_loss": -5.9306511878967285, "global_step": 58650, "epoch": 1396} {"train_loss": -5.823070526123047, "global_step": 58651, "epoch": 1396} {"train_loss": -5.770485877990723, "global_step": 58652, "epoch": 1396} {"train_loss": -5.84274959564209, "global_step": 58653, "epoch": 1396} {"train_loss": -5.840264320373535, "global_step": 58654, "epoch": 1396} {"train_loss": -5.847256660461426, "global_step": 58655, "epoch": 1396} {"train_loss": -5.691530227661133, "global_step": 58656, "epoch": 1396} {"train_loss": -5.8258233070373535, "global_step": 58657, "epoch": 1396} {"train_loss": -5.817717552185059, "global_step": 58658, "epoch": 1396} {"train_loss": -5.750144958496094, "global_step": 58659, "epoch": 1396} {"train_loss": -5.922825813293457, "global_step": 58660, "epoch": 1396} {"train_loss": -5.790465831756592, "global_step": 58661, "epoch": 1396} {"train_loss": -5.726493835449219, "global_step": 58662, "epoch": 1396} {"train_loss": -5.813615798950195, "global_step": 58663, "epoch": 1396} {"train_loss": -5.839765548706055, "global_step": 58664, "epoch": 1396} {"train_loss": -5.799030303955078, "global_step": 58665, "epoch": 1396} {"train_loss": -5.8208112716674805, "global_step": 58666, "epoch": 1396} {"train_loss": -5.901379108428955, "global_step": 58667, "epoch": 1396} {"train_loss": -5.804856777191162, "global_step": 58668, "epoch": 1396} {"train_loss": -5.90523099899292, "global_step": 58669, "epoch": 1396} {"train_loss": -5.766326904296875, "global_step": 58670, "epoch": 1396} {"train_loss": -5.890263557434082, "global_step": 58671, "epoch": 1396} {"train_loss": -5.787021636962891, "global_step": 58672, "epoch": 1396} {"train_loss": -5.836553357896351, "global_step": 58673, "epoch": 1396, "val_loss": 66708.421875} {"train_loss": -5.895160675048828, "global_step": 58674, "epoch": 1397} {"train_loss": -5.862973213195801, "global_step": 58675, "epoch": 1397} {"train_loss": -5.969289779663086, "global_step": 58676, "epoch": 1397} {"train_loss": -5.7526984214782715, "global_step": 58677, "epoch": 1397} {"train_loss": -5.7659759521484375, "global_step": 58678, "epoch": 1397} {"train_loss": -5.8172712326049805, "global_step": 58679, "epoch": 1397} {"train_loss": -5.773866653442383, "global_step": 58680, "epoch": 1397} {"train_loss": -5.823192596435547, "global_step": 58681, "epoch": 1397} {"train_loss": -5.807724475860596, "global_step": 58682, "epoch": 1397} {"train_loss": -5.718103885650635, "global_step": 58683, "epoch": 1397} {"train_loss": -5.889145851135254, "global_step": 58684, "epoch": 1397} {"train_loss": -5.887399673461914, "global_step": 58685, "epoch": 1397} {"train_loss": -5.860202312469482, "global_step": 58686, "epoch": 1397} {"train_loss": -5.862452507019043, "global_step": 58687, "epoch": 1397} {"train_loss": -5.896906852722168, "global_step": 58688, "epoch": 1397} {"train_loss": -5.887423515319824, "global_step": 58689, "epoch": 1397} {"train_loss": -5.817441940307617, "global_step": 58690, "epoch": 1397} {"train_loss": -5.980472564697266, "global_step": 58691, "epoch": 1397} {"train_loss": -5.976106643676758, "global_step": 58692, "epoch": 1397} {"train_loss": -5.950556755065918, "global_step": 58693, "epoch": 1397} {"train_loss": -5.94451379776001, "global_step": 58694, "epoch": 1397} {"train_loss": -5.708103179931641, "global_step": 58695, "epoch": 1397} {"train_loss": -5.9266486167907715, "global_step": 58696, "epoch": 1397} {"train_loss": -5.785519599914551, "global_step": 58697, "epoch": 1397} {"train_loss": -5.837252616882324, "global_step": 58698, "epoch": 1397} {"train_loss": -5.870025634765625, "global_step": 58699, "epoch": 1397} {"train_loss": -5.7142415046691895, "global_step": 58700, "epoch": 1397} {"train_loss": -5.927964210510254, "global_step": 58701, "epoch": 1397} {"train_loss": -5.7936601638793945, "global_step": 58702, "epoch": 1397} {"train_loss": -5.984552383422852, "global_step": 58703, "epoch": 1397} {"train_loss": -5.90744686126709, "global_step": 58704, "epoch": 1397} {"train_loss": -5.954664707183838, "global_step": 58705, "epoch": 1397} {"train_loss": -5.827524185180664, "global_step": 58706, "epoch": 1397} {"train_loss": -5.79261589050293, "global_step": 58707, "epoch": 1397} {"train_loss": -5.868992328643799, "global_step": 58708, "epoch": 1397} {"train_loss": -5.9926347732543945, "global_step": 58709, "epoch": 1397} {"train_loss": -5.829291343688965, "global_step": 58710, "epoch": 1397} {"train_loss": -5.89021635055542, "global_step": 58711, "epoch": 1397} {"train_loss": -5.821805953979492, "global_step": 58712, "epoch": 1397} {"train_loss": -5.869250297546387, "global_step": 58713, "epoch": 1397} {"train_loss": -5.828210830688477, "global_step": 58714, "epoch": 1397} {"train_loss": -5.859622115180606, "global_step": 58715, "epoch": 1397, "val_loss": 66850.6875} {"train_loss": -5.824195861816406, "global_step": 58716, "epoch": 1398} {"train_loss": -5.945204257965088, "global_step": 58717, "epoch": 1398} {"train_loss": -5.9169087409973145, "global_step": 58718, "epoch": 1398} {"train_loss": -5.823144435882568, "global_step": 58719, "epoch": 1398} {"train_loss": -5.994824409484863, "global_step": 58720, "epoch": 1398} {"train_loss": -5.916720390319824, "global_step": 58721, "epoch": 1398} {"train_loss": -5.890430927276611, "global_step": 58722, "epoch": 1398} {"train_loss": -5.907096862792969, "global_step": 58723, "epoch": 1398} {"train_loss": -6.0011701583862305, "global_step": 58724, "epoch": 1398} {"train_loss": -5.865604877471924, "global_step": 58725, "epoch": 1398} {"train_loss": -5.897771835327148, "global_step": 58726, "epoch": 1398} {"train_loss": -5.850017070770264, "global_step": 58727, "epoch": 1398} {"train_loss": -6.012589931488037, "global_step": 58728, "epoch": 1398} {"train_loss": -5.895107269287109, "global_step": 58729, "epoch": 1398} {"train_loss": -5.94446325302124, "global_step": 58730, "epoch": 1398} {"train_loss": -5.840802192687988, "global_step": 58731, "epoch": 1398} {"train_loss": -5.948232650756836, "global_step": 58732, "epoch": 1398} {"train_loss": -5.893538475036621, "global_step": 58733, "epoch": 1398} {"train_loss": -5.895376682281494, "global_step": 58734, "epoch": 1398} {"train_loss": -5.9816670417785645, "global_step": 58735, "epoch": 1398} {"train_loss": -5.954272747039795, "global_step": 58736, "epoch": 1398} {"train_loss": -5.832503318786621, "global_step": 58737, "epoch": 1398} {"train_loss": -5.844311237335205, "global_step": 58738, "epoch": 1398} {"train_loss": -5.849064826965332, "global_step": 58739, "epoch": 1398} {"train_loss": -5.927591323852539, "global_step": 58740, "epoch": 1398} {"train_loss": -5.925103187561035, "global_step": 58741, "epoch": 1398} {"train_loss": -5.934474945068359, "global_step": 58742, "epoch": 1398} {"train_loss": -5.70889139175415, "global_step": 58743, "epoch": 1398} {"train_loss": -5.782261371612549, "global_step": 58744, "epoch": 1398} {"train_loss": -5.82070255279541, "global_step": 58745, "epoch": 1398} {"train_loss": -5.8974609375, "global_step": 58746, "epoch": 1398} {"train_loss": -5.807910919189453, "global_step": 58747, "epoch": 1398} {"train_loss": -5.701355934143066, "global_step": 58748, "epoch": 1398} {"train_loss": -5.713891983032227, "global_step": 58749, "epoch": 1398} {"train_loss": -5.822246551513672, "global_step": 58750, "epoch": 1398} {"train_loss": -5.75087833404541, "global_step": 58751, "epoch": 1398} {"train_loss": -5.770509719848633, "global_step": 58752, "epoch": 1398} {"train_loss": -5.780030727386475, "global_step": 58753, "epoch": 1398} {"train_loss": -5.752937316894531, "global_step": 58754, "epoch": 1398} {"train_loss": -5.865049362182617, "global_step": 58755, "epoch": 1398} {"train_loss": -5.759413719177246, "global_step": 58756, "epoch": 1398} {"train_loss": -5.863266002564203, "global_step": 58757, "epoch": 1398, "val_loss": 66973.7265625} {"train_loss": -5.909874439239502, "global_step": 58758, "epoch": 1399} {"train_loss": -5.878091335296631, "global_step": 58759, "epoch": 1399} {"train_loss": -5.755735397338867, "global_step": 58760, "epoch": 1399} {"train_loss": -5.879903793334961, "global_step": 58761, "epoch": 1399} {"train_loss": -5.889622688293457, "global_step": 58762, "epoch": 1399} {"train_loss": -5.961995601654053, "global_step": 58763, "epoch": 1399} {"train_loss": -5.85384464263916, "global_step": 58764, "epoch": 1399} {"train_loss": -5.9335222244262695, "global_step": 58765, "epoch": 1399} {"train_loss": -5.785250663757324, "global_step": 58766, "epoch": 1399} {"train_loss": -5.866113662719727, "global_step": 58767, "epoch": 1399} {"train_loss": -5.82369327545166, "global_step": 58768, "epoch": 1399} {"train_loss": -5.964159965515137, "global_step": 58769, "epoch": 1399} {"train_loss": -5.968273162841797, "global_step": 58770, "epoch": 1399} {"train_loss": -5.846524238586426, "global_step": 58771, "epoch": 1399} {"train_loss": -5.79448127746582, "global_step": 58772, "epoch": 1399} {"train_loss": -5.845709800720215, "global_step": 58773, "epoch": 1399} {"train_loss": -5.816874027252197, "global_step": 58774, "epoch": 1399} {"train_loss": -5.897724151611328, "global_step": 58775, "epoch": 1399} {"train_loss": -5.917754173278809, "global_step": 58776, "epoch": 1399} {"train_loss": -5.853891849517822, "global_step": 58777, "epoch": 1399} {"train_loss": -5.828388214111328, "global_step": 58778, "epoch": 1399} {"train_loss": -5.831229209899902, "global_step": 58779, "epoch": 1399} {"train_loss": -5.888180255889893, "global_step": 58780, "epoch": 1399} {"train_loss": -5.9186224937438965, "global_step": 58781, "epoch": 1399} {"train_loss": -5.851052761077881, "global_step": 58782, "epoch": 1399} {"train_loss": -5.973043441772461, "global_step": 58783, "epoch": 1399} {"train_loss": -5.7771406173706055, "global_step": 58784, "epoch": 1399} {"train_loss": -5.853605270385742, "global_step": 58785, "epoch": 1399} {"train_loss": -5.809914588928223, "global_step": 58786, "epoch": 1399} {"train_loss": -5.966583251953125, "global_step": 58787, "epoch": 1399} {"train_loss": -5.785826683044434, "global_step": 58788, "epoch": 1399} {"train_loss": -5.86492395401001, "global_step": 58789, "epoch": 1399} {"train_loss": -5.816211700439453, "global_step": 58790, "epoch": 1399} {"train_loss": -5.890017509460449, "global_step": 58791, "epoch": 1399} {"train_loss": -5.852404594421387, "global_step": 58792, "epoch": 1399} {"train_loss": -5.935064315795898, "global_step": 58793, "epoch": 1399} {"train_loss": -5.993323802947998, "global_step": 58794, "epoch": 1399} {"train_loss": -5.787359237670898, "global_step": 58795, "epoch": 1399} {"train_loss": -5.773138046264648, "global_step": 58796, "epoch": 1399} {"train_loss": -5.721434593200684, "global_step": 58797, "epoch": 1399} {"train_loss": -5.738520622253418, "global_step": 58798, "epoch": 1399} {"train_loss": -5.861321369806926, "global_step": 58799, "epoch": 1399, "val_loss": 66491.8203125} {"train_loss": -5.726922988891602, "global_step": 58800, "epoch": 1400} {"train_loss": -5.7281494140625, "global_step": 58801, "epoch": 1400} {"train_loss": -5.889657020568848, "global_step": 58802, "epoch": 1400} {"train_loss": -5.859256267547607, "global_step": 58803, "epoch": 1400} {"train_loss": -5.74750280380249, "global_step": 58804, "epoch": 1400} {"train_loss": -5.921329498291016, "global_step": 58805, "epoch": 1400} {"train_loss": -5.686762809753418, "global_step": 58806, "epoch": 1400} {"train_loss": -5.872310638427734, "global_step": 58807, "epoch": 1400} {"train_loss": -5.865199089050293, "global_step": 58808, "epoch": 1400} {"train_loss": -5.751494407653809, "global_step": 58809, "epoch": 1400} {"train_loss": -5.836034774780273, "global_step": 58810, "epoch": 1400} {"train_loss": -5.951169013977051, "global_step": 58811, "epoch": 1400} {"train_loss": -5.865674018859863, "global_step": 58812, "epoch": 1400} {"train_loss": -5.97126579284668, "global_step": 58813, "epoch": 1400} {"train_loss": -5.868095874786377, "global_step": 58814, "epoch": 1400} {"train_loss": -5.830317497253418, "global_step": 58815, "epoch": 1400} {"train_loss": -5.881096839904785, "global_step": 58816, "epoch": 1400} {"train_loss": -5.844178676605225, "global_step": 58817, "epoch": 1400} {"train_loss": -5.953763008117676, "global_step": 58818, "epoch": 1400} {"train_loss": -5.787691116333008, "global_step": 58819, "epoch": 1400} {"train_loss": -5.891404151916504, "global_step": 58820, "epoch": 1400} {"train_loss": -5.8687615394592285, "global_step": 58821, "epoch": 1400} {"train_loss": -5.750514030456543, "global_step": 58822, "epoch": 1400} {"train_loss": -5.967861175537109, "global_step": 58823, "epoch": 1400} {"train_loss": -5.653810501098633, "global_step": 58824, "epoch": 1400} {"train_loss": -5.8827433586120605, "global_step": 58825, "epoch": 1400} {"train_loss": -5.942327499389648, "global_step": 58826, "epoch": 1400} {"train_loss": -5.837120056152344, "global_step": 58827, "epoch": 1400} {"train_loss": -5.911226749420166, "global_step": 58828, "epoch": 1400} {"train_loss": -5.860673904418945, "global_step": 58829, "epoch": 1400} {"train_loss": -5.8516669273376465, "global_step": 58830, "epoch": 1400} {"train_loss": -6.014531135559082, "global_step": 58831, "epoch": 1400} {"train_loss": -5.814205646514893, "global_step": 58832, "epoch": 1400} {"train_loss": -5.763108730316162, "global_step": 58833, "epoch": 1400} {"train_loss": -5.888445854187012, "global_step": 58834, "epoch": 1400} {"train_loss": -5.796863555908203, "global_step": 58835, "epoch": 1400} {"train_loss": -5.788657188415527, "global_step": 58836, "epoch": 1400} {"train_loss": -5.935036659240723, "global_step": 58837, "epoch": 1400} {"train_loss": -5.888310432434082, "global_step": 58838, "epoch": 1400} {"train_loss": -5.887063026428223, "global_step": 58839, "epoch": 1400} {"train_loss": -5.814203262329102, "global_step": 58840, "epoch": 1400} {"train_loss": -5.852957384926932, "global_step": 58841, "epoch": 1400, "train/sim_max_reward_0": 0.1944902140401905, "train/sim_max_reward_1": 0.9712275637868252, "train/sim_max_reward_2": 0.5653373412441045, "train/sim_max_reward_3": 0.15392485963689378, "train/sim_max_reward_4": 0.38196962945874985, "train/sim_max_reward_5": 0.8833312532234182, "test/sim_max_reward_4400000": 0.8099705596240308, "test/sim_max_reward_4400001": 0.35892638264602594, "test/sim_max_reward_4400002": 0.05782317010312777, "test/sim_max_reward_4400003": 0.8587265575794566, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9001760796453333, "test/sim_max_reward_4400006": 0.2431486424292671, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.45010067349366667, "test/sim_max_reward_4400009": 0.8920627805821263, "test/sim_max_reward_4400010": 0.9361622465950552, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.8753455329738494, "test/sim_max_reward_4400013": 0.805417237245858, "test/sim_max_reward_4400014": 0.360197733117196, "test/sim_max_reward_4400015": 0.2955818280252582, "test/sim_max_reward_4400016": 0.07760919936428257, "test/sim_max_reward_4400017": 0.3781533768894399, "test/sim_max_reward_4400018": 0.4092168468339749, "test/sim_max_reward_4400019": 0.03657382488294429, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5700774721872933, "test/sim_max_reward_4400022": 0.29738020189084624, "test/sim_max_reward_4400023": 0.07026361190119756, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.5091355857581487, "test/sim_max_reward_4400027": 6.952715357933608e-05, "test/sim_max_reward_4400028": 0.8780888381309636, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.6431493564322025, "test/sim_max_reward_4400031": 0.952937303014232, "test/sim_max_reward_4400032": 0.3982716225161214, "test/sim_max_reward_4400033": 0.7949332442080409, "test/sim_max_reward_4400034": 0.6764262411638269, "test/sim_max_reward_4400035": 0.6544593892046777, "test/sim_max_reward_4400036": 0.3918775849219778, "test/sim_max_reward_4400037": 0.8477925080546163, "test/sim_max_reward_4400038": 0.5627166731647616, "test/sim_max_reward_4400039": 0.8212487717069098, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5830235669279752, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.017073971276667432, "test/sim_max_reward_4400044": 0.9568629380707648, "test/sim_max_reward_4400045": 0.856478848055042, "test/sim_max_reward_4400046": 0.39677851430262046, "test/sim_max_reward_4400047": 0.9882197554931154, "test/sim_max_reward_4400048": 0.3678439104093785, "test/sim_max_reward_4400049": 0.15319504217282406, "train/mean_score": 0.5250468102316971, "test/mean_score": 0.4530053455273355, "val_loss": 66831.671875} {"train_loss": -5.824321746826172, "global_step": 58842, "epoch": 1401} {"train_loss": -5.943052768707275, "global_step": 58843, "epoch": 1401} {"train_loss": -5.844973564147949, "global_step": 58844, "epoch": 1401} {"train_loss": -5.808449745178223, "global_step": 58845, "epoch": 1401} {"train_loss": -5.843055725097656, "global_step": 58846, "epoch": 1401} {"train_loss": -5.840794563293457, "global_step": 58847, "epoch": 1401} {"train_loss": -5.933058261871338, "global_step": 58848, "epoch": 1401} {"train_loss": -5.916712760925293, "global_step": 58849, "epoch": 1401} {"train_loss": -5.830265045166016, "global_step": 58850, "epoch": 1401} {"train_loss": -5.711278915405273, "global_step": 58851, "epoch": 1401} {"train_loss": -5.947121620178223, "global_step": 58852, "epoch": 1401} {"train_loss": -5.783992767333984, "global_step": 58853, "epoch": 1401} {"train_loss": -5.800642967224121, "global_step": 58854, "epoch": 1401} {"train_loss": -5.794729232788086, "global_step": 58855, "epoch": 1401} {"train_loss": -5.743641376495361, "global_step": 58856, "epoch": 1401} {"train_loss": -5.820438385009766, "global_step": 58857, "epoch": 1401} {"train_loss": -5.904964447021484, "global_step": 58858, "epoch": 1401} {"train_loss": -5.815038681030273, "global_step": 58859, "epoch": 1401} {"train_loss": -5.8697099685668945, "global_step": 58860, "epoch": 1401} {"train_loss": -5.903621673583984, "global_step": 58861, "epoch": 1401} {"train_loss": -5.776932239532471, "global_step": 58862, "epoch": 1401} {"train_loss": -5.850059509277344, "global_step": 58863, "epoch": 1401} {"train_loss": -5.960055351257324, "global_step": 58864, "epoch": 1401} {"train_loss": -5.8319501876831055, "global_step": 58865, "epoch": 1401} {"train_loss": -5.839183807373047, "global_step": 58866, "epoch": 1401} {"train_loss": -5.95522928237915, "global_step": 58867, "epoch": 1401} {"train_loss": -5.870120048522949, "global_step": 58868, "epoch": 1401} {"train_loss": -5.783865928649902, "global_step": 58869, "epoch": 1401} {"train_loss": -5.926342010498047, "global_step": 58870, "epoch": 1401} {"train_loss": -5.856644153594971, "global_step": 58871, "epoch": 1401} {"train_loss": -5.8936662673950195, "global_step": 58872, "epoch": 1401} {"train_loss": -5.90360689163208, "global_step": 58873, "epoch": 1401} {"train_loss": -5.852370738983154, "global_step": 58874, "epoch": 1401} {"train_loss": -5.997196197509766, "global_step": 58875, "epoch": 1401} {"train_loss": -5.781688690185547, "global_step": 58876, "epoch": 1401} {"train_loss": -5.896096229553223, "global_step": 58877, "epoch": 1401} {"train_loss": -5.8443779945373535, "global_step": 58878, "epoch": 1401} {"train_loss": -5.806972503662109, "global_step": 58879, "epoch": 1401} {"train_loss": -5.876504898071289, "global_step": 58880, "epoch": 1401} {"train_loss": -5.900708198547363, "global_step": 58881, "epoch": 1401} {"train_loss": -5.756880760192871, "global_step": 58882, "epoch": 1401} {"train_loss": -5.858498016993205, "global_step": 58883, "epoch": 1401, "val_loss": 66422.484375} {"train_loss": -5.879775047302246, "global_step": 58884, "epoch": 1402} {"train_loss": -5.907060623168945, "global_step": 58885, "epoch": 1402} {"train_loss": -5.99752950668335, "global_step": 58886, "epoch": 1402} {"train_loss": -5.991279125213623, "global_step": 58887, "epoch": 1402} {"train_loss": -5.829998970031738, "global_step": 58888, "epoch": 1402} {"train_loss": -5.891173362731934, "global_step": 58889, "epoch": 1402} {"train_loss": -5.8753461837768555, "global_step": 58890, "epoch": 1402} {"train_loss": -5.839203834533691, "global_step": 58891, "epoch": 1402} {"train_loss": -5.743852138519287, "global_step": 58892, "epoch": 1402} {"train_loss": -5.866064071655273, "global_step": 58893, "epoch": 1402} {"train_loss": -5.758115291595459, "global_step": 58894, "epoch": 1402} {"train_loss": -5.7986650466918945, "global_step": 58895, "epoch": 1402} {"train_loss": -5.857621192932129, "global_step": 58896, "epoch": 1402} {"train_loss": -5.854029655456543, "global_step": 58897, "epoch": 1402} {"train_loss": -5.929926872253418, "global_step": 58898, "epoch": 1402} {"train_loss": -5.966001510620117, "global_step": 58899, "epoch": 1402} {"train_loss": -5.891439437866211, "global_step": 58900, "epoch": 1402} {"train_loss": -5.938303470611572, "global_step": 58901, "epoch": 1402} {"train_loss": -5.888968467712402, "global_step": 58902, "epoch": 1402} {"train_loss": -5.923802375793457, "global_step": 58903, "epoch": 1402} {"train_loss": -5.890084266662598, "global_step": 58904, "epoch": 1402} {"train_loss": -5.806884288787842, "global_step": 58905, "epoch": 1402} {"train_loss": -5.868622303009033, "global_step": 58906, "epoch": 1402} {"train_loss": -5.845663070678711, "global_step": 58907, "epoch": 1402} {"train_loss": -5.973536491394043, "global_step": 58908, "epoch": 1402} {"train_loss": -5.996411323547363, "global_step": 58909, "epoch": 1402} {"train_loss": -5.899657726287842, "global_step": 58910, "epoch": 1402} {"train_loss": -5.983993053436279, "global_step": 58911, "epoch": 1402} {"train_loss": -5.827692985534668, "global_step": 58912, "epoch": 1402} {"train_loss": -5.844479560852051, "global_step": 58913, "epoch": 1402} {"train_loss": -5.925419807434082, "global_step": 58914, "epoch": 1402} {"train_loss": -5.709978103637695, "global_step": 58915, "epoch": 1402} {"train_loss": -5.892341613769531, "global_step": 58916, "epoch": 1402} {"train_loss": -5.807141304016113, "global_step": 58917, "epoch": 1402} {"train_loss": -5.685842990875244, "global_step": 58918, "epoch": 1402} {"train_loss": -5.853816509246826, "global_step": 58919, "epoch": 1402} {"train_loss": -5.768417835235596, "global_step": 58920, "epoch": 1402} {"train_loss": -5.897086143493652, "global_step": 58921, "epoch": 1402} {"train_loss": -5.744338035583496, "global_step": 58922, "epoch": 1402} {"train_loss": -5.887953758239746, "global_step": 58923, "epoch": 1402} {"train_loss": -5.690045356750488, "global_step": 58924, "epoch": 1402} {"train_loss": -5.865098067692348, "global_step": 58925, "epoch": 1402, "val_loss": 66984.3125} {"train_loss": -5.826183319091797, "global_step": 58926, "epoch": 1403} {"train_loss": -5.798638343811035, "global_step": 58927, "epoch": 1403} {"train_loss": -6.001296520233154, "global_step": 58928, "epoch": 1403} {"train_loss": -5.695673942565918, "global_step": 58929, "epoch": 1403} {"train_loss": -5.702962875366211, "global_step": 58930, "epoch": 1403} {"train_loss": -5.831266403198242, "global_step": 58931, "epoch": 1403} {"train_loss": -5.77503776550293, "global_step": 58932, "epoch": 1403} {"train_loss": -5.723699569702148, "global_step": 58933, "epoch": 1403} {"train_loss": -5.935158729553223, "global_step": 58934, "epoch": 1403} {"train_loss": -5.759432792663574, "global_step": 58935, "epoch": 1403} {"train_loss": -5.816648960113525, "global_step": 58936, "epoch": 1403} {"train_loss": -5.884589195251465, "global_step": 58937, "epoch": 1403} {"train_loss": -5.841894626617432, "global_step": 58938, "epoch": 1403} {"train_loss": -5.802555084228516, "global_step": 58939, "epoch": 1403} {"train_loss": -5.880804061889648, "global_step": 58940, "epoch": 1403} {"train_loss": -5.941658020019531, "global_step": 58941, "epoch": 1403} {"train_loss": -5.83863639831543, "global_step": 58942, "epoch": 1403} {"train_loss": -5.897197723388672, "global_step": 58943, "epoch": 1403} {"train_loss": -5.895170211791992, "global_step": 58944, "epoch": 1403} {"train_loss": -5.826511383056641, "global_step": 58945, "epoch": 1403} {"train_loss": -5.789706707000732, "global_step": 58946, "epoch": 1403} {"train_loss": -6.010953903198242, "global_step": 58947, "epoch": 1403} {"train_loss": -5.914073944091797, "global_step": 58948, "epoch": 1403} {"train_loss": -5.953793525695801, "global_step": 58949, "epoch": 1403} {"train_loss": -5.835895538330078, "global_step": 58950, "epoch": 1403} {"train_loss": -5.823032855987549, "global_step": 58951, "epoch": 1403} {"train_loss": -5.811818599700928, "global_step": 58952, "epoch": 1403} {"train_loss": -5.738095283508301, "global_step": 58953, "epoch": 1403} {"train_loss": -5.922307014465332, "global_step": 58954, "epoch": 1403} {"train_loss": -5.995766639709473, "global_step": 58955, "epoch": 1403} {"train_loss": -5.841841220855713, "global_step": 58956, "epoch": 1403} {"train_loss": -5.7465901374816895, "global_step": 58957, "epoch": 1403} {"train_loss": -5.9116010665893555, "global_step": 58958, "epoch": 1403} {"train_loss": -5.8484954833984375, "global_step": 58959, "epoch": 1403} {"train_loss": -5.689420700073242, "global_step": 58960, "epoch": 1403} {"train_loss": -5.801723957061768, "global_step": 58961, "epoch": 1403} {"train_loss": -5.9502787590026855, "global_step": 58962, "epoch": 1403} {"train_loss": -5.832988739013672, "global_step": 58963, "epoch": 1403} {"train_loss": -5.827450752258301, "global_step": 58964, "epoch": 1403} {"train_loss": -5.933014392852783, "global_step": 58965, "epoch": 1403} {"train_loss": -5.8097639083862305, "global_step": 58966, "epoch": 1403} {"train_loss": -5.84253944669451, "global_step": 58967, "epoch": 1403, "val_loss": 66477.8515625} {"train_loss": -5.843224048614502, "global_step": 58968, "epoch": 1404} {"train_loss": -5.834785461425781, "global_step": 58969, "epoch": 1404} {"train_loss": -5.8342390060424805, "global_step": 58970, "epoch": 1404} {"train_loss": -5.806227684020996, "global_step": 58971, "epoch": 1404} {"train_loss": -5.92897891998291, "global_step": 58972, "epoch": 1404} {"train_loss": -5.846585273742676, "global_step": 58973, "epoch": 1404} {"train_loss": -5.904603004455566, "global_step": 58974, "epoch": 1404} {"train_loss": -5.9031453132629395, "global_step": 58975, "epoch": 1404} {"train_loss": -5.757541179656982, "global_step": 58976, "epoch": 1404} {"train_loss": -5.874118328094482, "global_step": 58977, "epoch": 1404} {"train_loss": -5.892817974090576, "global_step": 58978, "epoch": 1404} {"train_loss": -5.824580669403076, "global_step": 58979, "epoch": 1404} {"train_loss": -5.723200798034668, "global_step": 58980, "epoch": 1404} {"train_loss": -5.854975700378418, "global_step": 58981, "epoch": 1404} {"train_loss": -5.909852981567383, "global_step": 58982, "epoch": 1404} {"train_loss": -5.793997764587402, "global_step": 58983, "epoch": 1404} {"train_loss": -5.848392486572266, "global_step": 58984, "epoch": 1404} {"train_loss": -5.952054500579834, "global_step": 58985, "epoch": 1404} {"train_loss": -5.951018333435059, "global_step": 58986, "epoch": 1404} {"train_loss": -5.8283491134643555, "global_step": 58987, "epoch": 1404} {"train_loss": -5.830300331115723, "global_step": 58988, "epoch": 1404} {"train_loss": -5.849658966064453, "global_step": 58989, "epoch": 1404} {"train_loss": -5.856081962585449, "global_step": 58990, "epoch": 1404} {"train_loss": -5.9226908683776855, "global_step": 58991, "epoch": 1404} {"train_loss": -5.928770065307617, "global_step": 58992, "epoch": 1404} {"train_loss": -5.940058708190918, "global_step": 58993, "epoch": 1404} {"train_loss": -6.00039005279541, "global_step": 58994, "epoch": 1404} {"train_loss": -5.809689998626709, "global_step": 58995, "epoch": 1404} {"train_loss": -5.857302665710449, "global_step": 58996, "epoch": 1404} {"train_loss": -5.9226531982421875, "global_step": 58997, "epoch": 1404} {"train_loss": -5.921535491943359, "global_step": 58998, "epoch": 1404} {"train_loss": -5.898714065551758, "global_step": 58999, "epoch": 1404} {"train_loss": -5.993679046630859, "global_step": 59000, "epoch": 1404} {"train_loss": -5.902806282043457, "global_step": 59001, "epoch": 1404} {"train_loss": -5.831502914428711, "global_step": 59002, "epoch": 1404} {"train_loss": -5.980700492858887, "global_step": 59003, "epoch": 1404} {"train_loss": -5.980032444000244, "global_step": 59004, "epoch": 1404} {"train_loss": -5.823863506317139, "global_step": 59005, "epoch": 1404} {"train_loss": -5.8766632080078125, "global_step": 59006, "epoch": 1404} {"train_loss": -5.900659561157227, "global_step": 59007, "epoch": 1404} {"train_loss": -5.866904258728027, "global_step": 59008, "epoch": 1404} {"train_loss": -5.877613555817377, "global_step": 59009, "epoch": 1404, "val_loss": 66446.03125} {"train_loss": -5.978188514709473, "global_step": 59010, "epoch": 1405} {"train_loss": -5.8008527755737305, "global_step": 59011, "epoch": 1405} {"train_loss": -6.021716117858887, "global_step": 59012, "epoch": 1405} {"train_loss": -6.03164529800415, "global_step": 59013, "epoch": 1405} {"train_loss": -5.939385414123535, "global_step": 59014, "epoch": 1405} {"train_loss": -5.907973289489746, "global_step": 59015, "epoch": 1405} {"train_loss": -5.972692489624023, "global_step": 59016, "epoch": 1405} {"train_loss": -5.877283573150635, "global_step": 59017, "epoch": 1405} {"train_loss": -5.939829349517822, "global_step": 59018, "epoch": 1405} {"train_loss": -5.978715896606445, "global_step": 59019, "epoch": 1405} {"train_loss": -5.765416622161865, "global_step": 59020, "epoch": 1405} {"train_loss": -5.901443958282471, "global_step": 59021, "epoch": 1405} {"train_loss": -5.911259651184082, "global_step": 59022, "epoch": 1405} {"train_loss": -5.853022575378418, "global_step": 59023, "epoch": 1405} {"train_loss": -5.874181747436523, "global_step": 59024, "epoch": 1405} {"train_loss": -5.918280601501465, "global_step": 59025, "epoch": 1405} {"train_loss": -5.875585556030273, "global_step": 59026, "epoch": 1405} {"train_loss": -5.7326483726501465, "global_step": 59027, "epoch": 1405} {"train_loss": -5.865922927856445, "global_step": 59028, "epoch": 1405} {"train_loss": -5.933165550231934, "global_step": 59029, "epoch": 1405} {"train_loss": -5.891587734222412, "global_step": 59030, "epoch": 1405} {"train_loss": -5.786379814147949, "global_step": 59031, "epoch": 1405} {"train_loss": -5.850402355194092, "global_step": 59032, "epoch": 1405} {"train_loss": -5.8752617835998535, "global_step": 59033, "epoch": 1405} {"train_loss": -5.72943115234375, "global_step": 59034, "epoch": 1405} {"train_loss": -5.947898864746094, "global_step": 59035, "epoch": 1405} {"train_loss": -5.859848499298096, "global_step": 59036, "epoch": 1405} {"train_loss": -5.769973278045654, "global_step": 59037, "epoch": 1405} {"train_loss": -5.7523193359375, "global_step": 59038, "epoch": 1405} {"train_loss": -5.880254745483398, "global_step": 59039, "epoch": 1405} {"train_loss": -5.8896164894104, "global_step": 59040, "epoch": 1405} {"train_loss": -5.704282283782959, "global_step": 59041, "epoch": 1405} {"train_loss": -5.971563339233398, "global_step": 59042, "epoch": 1405} {"train_loss": -5.748884201049805, "global_step": 59043, "epoch": 1405} {"train_loss": -5.8064165115356445, "global_step": 59044, "epoch": 1405} {"train_loss": -5.772942066192627, "global_step": 59045, "epoch": 1405} {"train_loss": -5.719656467437744, "global_step": 59046, "epoch": 1405} {"train_loss": -5.724532127380371, "global_step": 59047, "epoch": 1405} {"train_loss": -5.84437370300293, "global_step": 59048, "epoch": 1405} {"train_loss": -5.842591285705566, "global_step": 59049, "epoch": 1405} {"train_loss": -5.713359832763672, "global_step": 59050, "epoch": 1405} {"train_loss": -5.859801360539028, "global_step": 59051, "epoch": 1405, "val_loss": 66777.6875} {"train_loss": -5.80721378326416, "global_step": 59052, "epoch": 1406} {"train_loss": -5.879256248474121, "global_step": 59053, "epoch": 1406} {"train_loss": -5.799359321594238, "global_step": 59054, "epoch": 1406} {"train_loss": -5.973167896270752, "global_step": 59055, "epoch": 1406} {"train_loss": -6.007663726806641, "global_step": 59056, "epoch": 1406} {"train_loss": -5.825916290283203, "global_step": 59057, "epoch": 1406} {"train_loss": -5.974857330322266, "global_step": 59058, "epoch": 1406} {"train_loss": -5.828588485717773, "global_step": 59059, "epoch": 1406} {"train_loss": -5.961394309997559, "global_step": 59060, "epoch": 1406} {"train_loss": -5.905054092407227, "global_step": 59061, "epoch": 1406} {"train_loss": -5.926483154296875, "global_step": 59062, "epoch": 1406} {"train_loss": -5.911167621612549, "global_step": 59063, "epoch": 1406} {"train_loss": -5.927507400512695, "global_step": 59064, "epoch": 1406} {"train_loss": -5.99600887298584, "global_step": 59065, "epoch": 1406} {"train_loss": -5.915215015411377, "global_step": 59066, "epoch": 1406} {"train_loss": -5.876494407653809, "global_step": 59067, "epoch": 1406} {"train_loss": -5.912548065185547, "global_step": 59068, "epoch": 1406} {"train_loss": -5.821236610412598, "global_step": 59069, "epoch": 1406} {"train_loss": -5.725897789001465, "global_step": 59070, "epoch": 1406} {"train_loss": -5.904686450958252, "global_step": 59071, "epoch": 1406} {"train_loss": -5.865494251251221, "global_step": 59072, "epoch": 1406} {"train_loss": -5.892802715301514, "global_step": 59073, "epoch": 1406} {"train_loss": -5.985727310180664, "global_step": 59074, "epoch": 1406} {"train_loss": -5.865479469299316, "global_step": 59075, "epoch": 1406} {"train_loss": -5.855701446533203, "global_step": 59076, "epoch": 1406} {"train_loss": -5.811636924743652, "global_step": 59077, "epoch": 1406} {"train_loss": -5.9087724685668945, "global_step": 59078, "epoch": 1406} {"train_loss": -5.829739570617676, "global_step": 59079, "epoch": 1406} {"train_loss": -5.979952335357666, "global_step": 59080, "epoch": 1406} {"train_loss": -5.9005303382873535, "global_step": 59081, "epoch": 1406} {"train_loss": -5.923242568969727, "global_step": 59082, "epoch": 1406} {"train_loss": -5.759311199188232, "global_step": 59083, "epoch": 1406} {"train_loss": -5.814250469207764, "global_step": 59084, "epoch": 1406} {"train_loss": -5.870096206665039, "global_step": 59085, "epoch": 1406} {"train_loss": -5.958139419555664, "global_step": 59086, "epoch": 1406} {"train_loss": -5.871177673339844, "global_step": 59087, "epoch": 1406} {"train_loss": -5.9139275550842285, "global_step": 59088, "epoch": 1406} {"train_loss": -5.939478874206543, "global_step": 59089, "epoch": 1406} {"train_loss": -5.902470588684082, "global_step": 59090, "epoch": 1406} {"train_loss": -5.7780632972717285, "global_step": 59091, "epoch": 1406} {"train_loss": -5.8349103927612305, "global_step": 59092, "epoch": 1406} {"train_loss": -5.885082494644892, "global_step": 59093, "epoch": 1406, "val_loss": 66638.28125} {"train_loss": -5.809767723083496, "global_step": 59094, "epoch": 1407} {"train_loss": -5.980056285858154, "global_step": 59095, "epoch": 1407} {"train_loss": -5.947676658630371, "global_step": 59096, "epoch": 1407} {"train_loss": -5.935743808746338, "global_step": 59097, "epoch": 1407} {"train_loss": -5.846002578735352, "global_step": 59098, "epoch": 1407} {"train_loss": -5.896819591522217, "global_step": 59099, "epoch": 1407} {"train_loss": -5.916367530822754, "global_step": 59100, "epoch": 1407} {"train_loss": -5.951058387756348, "global_step": 59101, "epoch": 1407} {"train_loss": -5.958133697509766, "global_step": 59102, "epoch": 1407} {"train_loss": -5.951272964477539, "global_step": 59103, "epoch": 1407} {"train_loss": -5.977663040161133, "global_step": 59104, "epoch": 1407} {"train_loss": -5.878430366516113, "global_step": 59105, "epoch": 1407} {"train_loss": -5.788202285766602, "global_step": 59106, "epoch": 1407} {"train_loss": -5.913261413574219, "global_step": 59107, "epoch": 1407} {"train_loss": -5.846230506896973, "global_step": 59108, "epoch": 1407} {"train_loss": -5.727375030517578, "global_step": 59109, "epoch": 1407} {"train_loss": -5.909600257873535, "global_step": 59110, "epoch": 1407} {"train_loss": -5.791767120361328, "global_step": 59111, "epoch": 1407} {"train_loss": -5.6654157638549805, "global_step": 59112, "epoch": 1407} {"train_loss": -5.932320594787598, "global_step": 59113, "epoch": 1407} {"train_loss": -5.700812339782715, "global_step": 59114, "epoch": 1407} {"train_loss": -5.9796319007873535, "global_step": 59115, "epoch": 1407} {"train_loss": -5.881964206695557, "global_step": 59116, "epoch": 1407} {"train_loss": -6.014790058135986, "global_step": 59117, "epoch": 1407} {"train_loss": -5.8938164710998535, "global_step": 59118, "epoch": 1407} {"train_loss": -5.913163661956787, "global_step": 59119, "epoch": 1407} {"train_loss": -5.976200103759766, "global_step": 59120, "epoch": 1407} {"train_loss": -5.8379621505737305, "global_step": 59121, "epoch": 1407} {"train_loss": -5.737906455993652, "global_step": 59122, "epoch": 1407} {"train_loss": -5.8378190994262695, "global_step": 59123, "epoch": 1407} {"train_loss": -5.848849296569824, "global_step": 59124, "epoch": 1407} {"train_loss": -5.88729190826416, "global_step": 59125, "epoch": 1407} {"train_loss": -5.895255088806152, "global_step": 59126, "epoch": 1407} {"train_loss": -5.8497514724731445, "global_step": 59127, "epoch": 1407} {"train_loss": -5.874878883361816, "global_step": 59128, "epoch": 1407} {"train_loss": -5.806642532348633, "global_step": 59129, "epoch": 1407} {"train_loss": -5.900549411773682, "global_step": 59130, "epoch": 1407} {"train_loss": -5.849318504333496, "global_step": 59131, "epoch": 1407} {"train_loss": -5.849687099456787, "global_step": 59132, "epoch": 1407} {"train_loss": -5.856145858764648, "global_step": 59133, "epoch": 1407} {"train_loss": -5.917298316955566, "global_step": 59134, "epoch": 1407} {"train_loss": -5.8758416175842285, "global_step": 59135, "epoch": 1407, "val_loss": 66528.265625} {"train_loss": -5.9655303955078125, "global_step": 59136, "epoch": 1408} {"train_loss": -5.928750514984131, "global_step": 59137, "epoch": 1408} {"train_loss": -5.909034729003906, "global_step": 59138, "epoch": 1408} {"train_loss": -5.739820957183838, "global_step": 59139, "epoch": 1408} {"train_loss": -5.893064498901367, "global_step": 59140, "epoch": 1408} {"train_loss": -5.825989723205566, "global_step": 59141, "epoch": 1408} {"train_loss": -5.771544933319092, "global_step": 59142, "epoch": 1408} {"train_loss": -5.765267372131348, "global_step": 59143, "epoch": 1408} {"train_loss": -5.8559465408325195, "global_step": 59144, "epoch": 1408} {"train_loss": -5.824289321899414, "global_step": 59145, "epoch": 1408} {"train_loss": -5.855576515197754, "global_step": 59146, "epoch": 1408} {"train_loss": -5.892722129821777, "global_step": 59147, "epoch": 1408} {"train_loss": -5.789568901062012, "global_step": 59148, "epoch": 1408} {"train_loss": -5.85390567779541, "global_step": 59149, "epoch": 1408} {"train_loss": -5.826480865478516, "global_step": 59150, "epoch": 1408} {"train_loss": -5.872405052185059, "global_step": 59151, "epoch": 1408} {"train_loss": -5.871457099914551, "global_step": 59152, "epoch": 1408} {"train_loss": -5.675531387329102, "global_step": 59153, "epoch": 1408} {"train_loss": -5.946342945098877, "global_step": 59154, "epoch": 1408} {"train_loss": -5.794350624084473, "global_step": 59155, "epoch": 1408} {"train_loss": -5.856583595275879, "global_step": 59156, "epoch": 1408} {"train_loss": -5.7566351890563965, "global_step": 59157, "epoch": 1408} {"train_loss": -5.884533405303955, "global_step": 59158, "epoch": 1408} {"train_loss": -5.889333724975586, "global_step": 59159, "epoch": 1408} {"train_loss": -5.857562065124512, "global_step": 59160, "epoch": 1408} {"train_loss": -5.814878463745117, "global_step": 59161, "epoch": 1408} {"train_loss": -5.812679767608643, "global_step": 59162, "epoch": 1408} {"train_loss": -5.710536956787109, "global_step": 59163, "epoch": 1408} {"train_loss": -5.872707366943359, "global_step": 59164, "epoch": 1408} {"train_loss": -5.895221710205078, "global_step": 59165, "epoch": 1408} {"train_loss": -5.93659782409668, "global_step": 59166, "epoch": 1408} {"train_loss": -5.862438678741455, "global_step": 59167, "epoch": 1408} {"train_loss": -5.8997626304626465, "global_step": 59168, "epoch": 1408} {"train_loss": -5.861431121826172, "global_step": 59169, "epoch": 1408} {"train_loss": -5.978148460388184, "global_step": 59170, "epoch": 1408} {"train_loss": -5.826311111450195, "global_step": 59171, "epoch": 1408} {"train_loss": -5.782965660095215, "global_step": 59172, "epoch": 1408} {"train_loss": -5.823127746582031, "global_step": 59173, "epoch": 1408} {"train_loss": -5.87154483795166, "global_step": 59174, "epoch": 1408} {"train_loss": -5.953568458557129, "global_step": 59175, "epoch": 1408} {"train_loss": -5.914342880249023, "global_step": 59176, "epoch": 1408} {"train_loss": -5.856757050468808, "global_step": 59177, "epoch": 1408, "val_loss": 66650.5078125} {"train_loss": -5.905068397521973, "global_step": 59178, "epoch": 1409} {"train_loss": -5.960303783416748, "global_step": 59179, "epoch": 1409} {"train_loss": -5.900899410247803, "global_step": 59180, "epoch": 1409} {"train_loss": -6.000976085662842, "global_step": 59181, "epoch": 1409} {"train_loss": -5.909876823425293, "global_step": 59182, "epoch": 1409} {"train_loss": -5.797450542449951, "global_step": 59183, "epoch": 1409} {"train_loss": -5.927987098693848, "global_step": 59184, "epoch": 1409} {"train_loss": -5.949667453765869, "global_step": 59185, "epoch": 1409} {"train_loss": -5.962522506713867, "global_step": 59186, "epoch": 1409} {"train_loss": -5.9447021484375, "global_step": 59187, "epoch": 1409} {"train_loss": -5.835623741149902, "global_step": 59188, "epoch": 1409} {"train_loss": -5.844287872314453, "global_step": 59189, "epoch": 1409} {"train_loss": -5.944901466369629, "global_step": 59190, "epoch": 1409} {"train_loss": -5.919737815856934, "global_step": 59191, "epoch": 1409} {"train_loss": -5.942604064941406, "global_step": 59192, "epoch": 1409} {"train_loss": -5.8757781982421875, "global_step": 59193, "epoch": 1409} {"train_loss": -5.930249214172363, "global_step": 59194, "epoch": 1409} {"train_loss": -5.8597846031188965, "global_step": 59195, "epoch": 1409} {"train_loss": -5.934022426605225, "global_step": 59196, "epoch": 1409} {"train_loss": -5.896068572998047, "global_step": 59197, "epoch": 1409} {"train_loss": -5.851576805114746, "global_step": 59198, "epoch": 1409} {"train_loss": -5.881239891052246, "global_step": 59199, "epoch": 1409} {"train_loss": -5.915433406829834, "global_step": 59200, "epoch": 1409} {"train_loss": -5.773428916931152, "global_step": 59201, "epoch": 1409} {"train_loss": -5.923604965209961, "global_step": 59202, "epoch": 1409} {"train_loss": -5.915806770324707, "global_step": 59203, "epoch": 1409} {"train_loss": -5.892787933349609, "global_step": 59204, "epoch": 1409} {"train_loss": -5.868865013122559, "global_step": 59205, "epoch": 1409} {"train_loss": -5.996659755706787, "global_step": 59206, "epoch": 1409} {"train_loss": -5.818140506744385, "global_step": 59207, "epoch": 1409} {"train_loss": -5.823247909545898, "global_step": 59208, "epoch": 1409} {"train_loss": -5.935291290283203, "global_step": 59209, "epoch": 1409} {"train_loss": -5.98472261428833, "global_step": 59210, "epoch": 1409} {"train_loss": -5.857931137084961, "global_step": 59211, "epoch": 1409} {"train_loss": -5.824077606201172, "global_step": 59212, "epoch": 1409} {"train_loss": -5.920062065124512, "global_step": 59213, "epoch": 1409} {"train_loss": -5.885008811950684, "global_step": 59214, "epoch": 1409} {"train_loss": -5.71376371383667, "global_step": 59215, "epoch": 1409} {"train_loss": -5.940502166748047, "global_step": 59216, "epoch": 1409} {"train_loss": -5.889530181884766, "global_step": 59217, "epoch": 1409} {"train_loss": -5.86958646774292, "global_step": 59218, "epoch": 1409} {"train_loss": -5.894284974961054, "global_step": 59219, "epoch": 1409, "val_loss": 66976.2890625} {"train_loss": -5.935368537902832, "global_step": 59220, "epoch": 1410} {"train_loss": -5.728543281555176, "global_step": 59221, "epoch": 1410} {"train_loss": -5.917653560638428, "global_step": 59222, "epoch": 1410} {"train_loss": -5.942259311676025, "global_step": 59223, "epoch": 1410} {"train_loss": -5.713723182678223, "global_step": 59224, "epoch": 1410} {"train_loss": -5.762908935546875, "global_step": 59225, "epoch": 1410} {"train_loss": -5.969187259674072, "global_step": 59226, "epoch": 1410} {"train_loss": -5.829659938812256, "global_step": 59227, "epoch": 1410} {"train_loss": -5.809289932250977, "global_step": 59228, "epoch": 1410} {"train_loss": -5.704413890838623, "global_step": 59229, "epoch": 1410} {"train_loss": -5.8625874519348145, "global_step": 59230, "epoch": 1410} {"train_loss": -5.924030780792236, "global_step": 59231, "epoch": 1410} {"train_loss": -5.82607364654541, "global_step": 59232, "epoch": 1410} {"train_loss": -5.8345794677734375, "global_step": 59233, "epoch": 1410} {"train_loss": -5.770329475402832, "global_step": 59234, "epoch": 1410} {"train_loss": -5.742306709289551, "global_step": 59235, "epoch": 1410} {"train_loss": -5.891724586486816, "global_step": 59236, "epoch": 1410} {"train_loss": -5.812520980834961, "global_step": 59237, "epoch": 1410} {"train_loss": -5.682265758514404, "global_step": 59238, "epoch": 1410} {"train_loss": -5.925411224365234, "global_step": 59239, "epoch": 1410} {"train_loss": -5.823320388793945, "global_step": 59240, "epoch": 1410} {"train_loss": -5.721299171447754, "global_step": 59241, "epoch": 1410} {"train_loss": -5.8632493019104, "global_step": 59242, "epoch": 1410} {"train_loss": -5.7393975257873535, "global_step": 59243, "epoch": 1410} {"train_loss": -5.823372840881348, "global_step": 59244, "epoch": 1410} {"train_loss": -5.8931884765625, "global_step": 59245, "epoch": 1410} {"train_loss": -5.738664627075195, "global_step": 59246, "epoch": 1410} {"train_loss": -6.0061845779418945, "global_step": 59247, "epoch": 1410} {"train_loss": -5.8938751220703125, "global_step": 59248, "epoch": 1410} {"train_loss": -5.750732421875, "global_step": 59249, "epoch": 1410} {"train_loss": -5.930079460144043, "global_step": 59250, "epoch": 1410} {"train_loss": -5.849361419677734, "global_step": 59251, "epoch": 1410} {"train_loss": -5.804007530212402, "global_step": 59252, "epoch": 1410} {"train_loss": -5.8666582107543945, "global_step": 59253, "epoch": 1410} {"train_loss": -5.877728462219238, "global_step": 59254, "epoch": 1410} {"train_loss": -5.8316850662231445, "global_step": 59255, "epoch": 1410} {"train_loss": -5.92735481262207, "global_step": 59256, "epoch": 1410} {"train_loss": -5.935324192047119, "global_step": 59257, "epoch": 1410} {"train_loss": -5.885304927825928, "global_step": 59258, "epoch": 1410} {"train_loss": -5.806804656982422, "global_step": 59259, "epoch": 1410} {"train_loss": -5.955981254577637, "global_step": 59260, "epoch": 1410} {"train_loss": -5.841003940218971, "global_step": 59261, "epoch": 1410, "val_loss": 66858.78125} {"train_loss": -5.822443008422852, "global_step": 59262, "epoch": 1411} {"train_loss": -5.8719801902771, "global_step": 59263, "epoch": 1411} {"train_loss": -5.754848480224609, "global_step": 59264, "epoch": 1411} {"train_loss": -5.785051345825195, "global_step": 59265, "epoch": 1411} {"train_loss": -5.923440456390381, "global_step": 59266, "epoch": 1411} {"train_loss": -5.887591361999512, "global_step": 59267, "epoch": 1411} {"train_loss": -5.805344581604004, "global_step": 59268, "epoch": 1411} {"train_loss": -5.887849807739258, "global_step": 59269, "epoch": 1411} {"train_loss": -5.911444664001465, "global_step": 59270, "epoch": 1411} {"train_loss": -5.972442626953125, "global_step": 59271, "epoch": 1411} {"train_loss": -5.743439674377441, "global_step": 59272, "epoch": 1411} {"train_loss": -5.943438529968262, "global_step": 59273, "epoch": 1411} {"train_loss": -5.742321014404297, "global_step": 59274, "epoch": 1411} {"train_loss": -5.8901519775390625, "global_step": 59275, "epoch": 1411} {"train_loss": -5.8164496421813965, "global_step": 59276, "epoch": 1411} {"train_loss": -5.983521938323975, "global_step": 59277, "epoch": 1411} {"train_loss": -5.863678455352783, "global_step": 59278, "epoch": 1411} {"train_loss": -5.906306266784668, "global_step": 59279, "epoch": 1411} {"train_loss": -5.865660667419434, "global_step": 59280, "epoch": 1411} {"train_loss": -5.918645858764648, "global_step": 59281, "epoch": 1411} {"train_loss": -5.9035797119140625, "global_step": 59282, "epoch": 1411} {"train_loss": -5.862732887268066, "global_step": 59283, "epoch": 1411} {"train_loss": -5.928256034851074, "global_step": 59284, "epoch": 1411} {"train_loss": -5.835024833679199, "global_step": 59285, "epoch": 1411} {"train_loss": -5.844908237457275, "global_step": 59286, "epoch": 1411} {"train_loss": -5.796258449554443, "global_step": 59287, "epoch": 1411} {"train_loss": -5.8428192138671875, "global_step": 59288, "epoch": 1411} {"train_loss": -5.743367671966553, "global_step": 59289, "epoch": 1411} {"train_loss": -5.825034141540527, "global_step": 59290, "epoch": 1411} {"train_loss": -5.785052299499512, "global_step": 59291, "epoch": 1411} {"train_loss": -5.6864824295043945, "global_step": 59292, "epoch": 1411} {"train_loss": -5.827994346618652, "global_step": 59293, "epoch": 1411} {"train_loss": -5.843265533447266, "global_step": 59294, "epoch": 1411} {"train_loss": -5.839040756225586, "global_step": 59295, "epoch": 1411} {"train_loss": -5.771732330322266, "global_step": 59296, "epoch": 1411} {"train_loss": -5.7981791496276855, "global_step": 59297, "epoch": 1411} {"train_loss": -5.8953962326049805, "global_step": 59298, "epoch": 1411} {"train_loss": -5.774718284606934, "global_step": 59299, "epoch": 1411} {"train_loss": -5.801280975341797, "global_step": 59300, "epoch": 1411} {"train_loss": -5.7721757888793945, "global_step": 59301, "epoch": 1411} {"train_loss": -5.743075370788574, "global_step": 59302, "epoch": 1411} {"train_loss": -5.838078022003174, "global_step": 59303, "epoch": 1411, "val_loss": 66864.7578125} {"train_loss": -5.8402910232543945, "global_step": 59304, "epoch": 1412} {"train_loss": -5.8271050453186035, "global_step": 59305, "epoch": 1412} {"train_loss": -5.819564342498779, "global_step": 59306, "epoch": 1412} {"train_loss": -5.722658157348633, "global_step": 59307, "epoch": 1412} {"train_loss": -5.881901741027832, "global_step": 59308, "epoch": 1412} {"train_loss": -5.900934219360352, "global_step": 59309, "epoch": 1412} {"train_loss": -5.742642402648926, "global_step": 59310, "epoch": 1412} {"train_loss": -5.876626014709473, "global_step": 59311, "epoch": 1412} {"train_loss": -5.89791202545166, "global_step": 59312, "epoch": 1412} {"train_loss": -5.994959354400635, "global_step": 59313, "epoch": 1412} {"train_loss": -5.817193984985352, "global_step": 59314, "epoch": 1412} {"train_loss": -5.814515113830566, "global_step": 59315, "epoch": 1412} {"train_loss": -5.718445777893066, "global_step": 59316, "epoch": 1412} {"train_loss": -5.700775146484375, "global_step": 59317, "epoch": 1412} {"train_loss": -5.914217948913574, "global_step": 59318, "epoch": 1412} {"train_loss": -5.787555694580078, "global_step": 59319, "epoch": 1412} {"train_loss": -5.9339141845703125, "global_step": 59320, "epoch": 1412} {"train_loss": -5.879389762878418, "global_step": 59321, "epoch": 1412} {"train_loss": -5.872137069702148, "global_step": 59322, "epoch": 1412} {"train_loss": -5.922850608825684, "global_step": 59323, "epoch": 1412} {"train_loss": -5.872735023498535, "global_step": 59324, "epoch": 1412} {"train_loss": -5.724183082580566, "global_step": 59325, "epoch": 1412} {"train_loss": -5.953356742858887, "global_step": 59326, "epoch": 1412} {"train_loss": -5.788571357727051, "global_step": 59327, "epoch": 1412} {"train_loss": -5.922286510467529, "global_step": 59328, "epoch": 1412} {"train_loss": -5.8733978271484375, "global_step": 59329, "epoch": 1412} {"train_loss": -5.664081573486328, "global_step": 59330, "epoch": 1412} {"train_loss": -5.817127704620361, "global_step": 59331, "epoch": 1412} {"train_loss": -5.911660671234131, "global_step": 59332, "epoch": 1412} {"train_loss": -5.859368801116943, "global_step": 59333, "epoch": 1412} {"train_loss": -5.9914164543151855, "global_step": 59334, "epoch": 1412} {"train_loss": -5.8460845947265625, "global_step": 59335, "epoch": 1412} {"train_loss": -5.87111759185791, "global_step": 59336, "epoch": 1412} {"train_loss": -5.791352272033691, "global_step": 59337, "epoch": 1412} {"train_loss": -5.959317684173584, "global_step": 59338, "epoch": 1412} {"train_loss": -5.9226789474487305, "global_step": 59339, "epoch": 1412} {"train_loss": -5.839733123779297, "global_step": 59340, "epoch": 1412} {"train_loss": -5.944470405578613, "global_step": 59341, "epoch": 1412} {"train_loss": -6.001259803771973, "global_step": 59342, "epoch": 1412} {"train_loss": -5.883301734924316, "global_step": 59343, "epoch": 1412} {"train_loss": -5.963851451873779, "global_step": 59344, "epoch": 1412} {"train_loss": -5.863197110948109, "global_step": 59345, "epoch": 1412, "val_loss": 66777.75} {"train_loss": -5.885308742523193, "global_step": 59346, "epoch": 1413} {"train_loss": -5.791108131408691, "global_step": 59347, "epoch": 1413} {"train_loss": -6.081504821777344, "global_step": 59348, "epoch": 1413} {"train_loss": -5.869552135467529, "global_step": 59349, "epoch": 1413} {"train_loss": -5.87967586517334, "global_step": 59350, "epoch": 1413} {"train_loss": -5.833778381347656, "global_step": 59351, "epoch": 1413} {"train_loss": -5.955532550811768, "global_step": 59352, "epoch": 1413} {"train_loss": -5.888757705688477, "global_step": 59353, "epoch": 1413} {"train_loss": -5.850390911102295, "global_step": 59354, "epoch": 1413} {"train_loss": -5.894627094268799, "global_step": 59355, "epoch": 1413} {"train_loss": -5.787264823913574, "global_step": 59356, "epoch": 1413} {"train_loss": -5.895331382751465, "global_step": 59357, "epoch": 1413} {"train_loss": -5.88947868347168, "global_step": 59358, "epoch": 1413} {"train_loss": -5.825889587402344, "global_step": 59359, "epoch": 1413} {"train_loss": -5.8801374435424805, "global_step": 59360, "epoch": 1413} {"train_loss": -5.876926898956299, "global_step": 59361, "epoch": 1413} {"train_loss": -5.85951042175293, "global_step": 59362, "epoch": 1413} {"train_loss": -6.005488395690918, "global_step": 59363, "epoch": 1413} {"train_loss": -5.862494468688965, "global_step": 59364, "epoch": 1413} {"train_loss": -5.844149589538574, "global_step": 59365, "epoch": 1413} {"train_loss": -5.736074924468994, "global_step": 59366, "epoch": 1413} {"train_loss": -5.773128032684326, "global_step": 59367, "epoch": 1413} {"train_loss": -5.866983890533447, "global_step": 59368, "epoch": 1413} {"train_loss": -5.867316722869873, "global_step": 59369, "epoch": 1413} {"train_loss": -5.963726997375488, "global_step": 59370, "epoch": 1413} {"train_loss": -5.862483024597168, "global_step": 59371, "epoch": 1413} {"train_loss": -5.880814552307129, "global_step": 59372, "epoch": 1413} {"train_loss": -5.882767200469971, "global_step": 59373, "epoch": 1413} {"train_loss": -5.97010612487793, "global_step": 59374, "epoch": 1413} {"train_loss": -5.984482288360596, "global_step": 59375, "epoch": 1413} {"train_loss": -5.8387770652771, "global_step": 59376, "epoch": 1413} {"train_loss": -5.901895523071289, "global_step": 59377, "epoch": 1413} {"train_loss": -5.912386894226074, "global_step": 59378, "epoch": 1413} {"train_loss": -5.733550548553467, "global_step": 59379, "epoch": 1413} {"train_loss": -5.785162925720215, "global_step": 59380, "epoch": 1413} {"train_loss": -6.003204345703125, "global_step": 59381, "epoch": 1413} {"train_loss": -5.988723278045654, "global_step": 59382, "epoch": 1413} {"train_loss": -5.916110992431641, "global_step": 59383, "epoch": 1413} {"train_loss": -5.807723045349121, "global_step": 59384, "epoch": 1413} {"train_loss": -5.992464065551758, "global_step": 59385, "epoch": 1413} {"train_loss": -5.845674514770508, "global_step": 59386, "epoch": 1413} {"train_loss": -5.8813033785138815, "global_step": 59387, "epoch": 1413, "val_loss": 66703.0859375} {"train_loss": -5.9122419357299805, "global_step": 59388, "epoch": 1414} {"train_loss": -5.900336742401123, "global_step": 59389, "epoch": 1414} {"train_loss": -5.866255283355713, "global_step": 59390, "epoch": 1414} {"train_loss": -5.909917831420898, "global_step": 59391, "epoch": 1414} {"train_loss": -5.882424831390381, "global_step": 59392, "epoch": 1414} {"train_loss": -5.877559661865234, "global_step": 59393, "epoch": 1414} {"train_loss": -5.866561412811279, "global_step": 59394, "epoch": 1414} {"train_loss": -5.962865829467773, "global_step": 59395, "epoch": 1414} {"train_loss": -5.804927825927734, "global_step": 59396, "epoch": 1414} {"train_loss": -5.838382244110107, "global_step": 59397, "epoch": 1414} {"train_loss": -6.037137031555176, "global_step": 59398, "epoch": 1414} {"train_loss": -5.660396575927734, "global_step": 59399, "epoch": 1414} {"train_loss": -5.902848243713379, "global_step": 59400, "epoch": 1414} {"train_loss": -5.850531101226807, "global_step": 59401, "epoch": 1414} {"train_loss": -5.9072723388671875, "global_step": 59402, "epoch": 1414} {"train_loss": -5.959638595581055, "global_step": 59403, "epoch": 1414} {"train_loss": -5.91414737701416, "global_step": 59404, "epoch": 1414} {"train_loss": -5.994441032409668, "global_step": 59405, "epoch": 1414} {"train_loss": -5.846357345581055, "global_step": 59406, "epoch": 1414} {"train_loss": -5.854905128479004, "global_step": 59407, "epoch": 1414} {"train_loss": -5.900225639343262, "global_step": 59408, "epoch": 1414} {"train_loss": -5.890674114227295, "global_step": 59409, "epoch": 1414} {"train_loss": -5.8262619972229, "global_step": 59410, "epoch": 1414} {"train_loss": -5.854129791259766, "global_step": 59411, "epoch": 1414} {"train_loss": -5.676547050476074, "global_step": 59412, "epoch": 1414} {"train_loss": -5.767886161804199, "global_step": 59413, "epoch": 1414} {"train_loss": -5.859598636627197, "global_step": 59414, "epoch": 1414} {"train_loss": -5.797896385192871, "global_step": 59415, "epoch": 1414} {"train_loss": -5.986283302307129, "global_step": 59416, "epoch": 1414} {"train_loss": -5.877922058105469, "global_step": 59417, "epoch": 1414} {"train_loss": -5.91853141784668, "global_step": 59418, "epoch": 1414} {"train_loss": -5.768759727478027, "global_step": 59419, "epoch": 1414} {"train_loss": -5.953972816467285, "global_step": 59420, "epoch": 1414} {"train_loss": -5.984532356262207, "global_step": 59421, "epoch": 1414} {"train_loss": -5.855682373046875, "global_step": 59422, "epoch": 1414} {"train_loss": -5.873103618621826, "global_step": 59423, "epoch": 1414} {"train_loss": -5.881689071655273, "global_step": 59424, "epoch": 1414} {"train_loss": -5.810184478759766, "global_step": 59425, "epoch": 1414} {"train_loss": -5.848272323608398, "global_step": 59426, "epoch": 1414} {"train_loss": -5.856594562530518, "global_step": 59427, "epoch": 1414} {"train_loss": -5.712503433227539, "global_step": 59428, "epoch": 1414} {"train_loss": -5.869028920219058, "global_step": 59429, "epoch": 1414, "val_loss": 66481.671875} {"train_loss": -5.999056816101074, "global_step": 59430, "epoch": 1415} {"train_loss": -5.893266677856445, "global_step": 59431, "epoch": 1415} {"train_loss": -5.9000043869018555, "global_step": 59432, "epoch": 1415} {"train_loss": -5.861180305480957, "global_step": 59433, "epoch": 1415} {"train_loss": -5.828587532043457, "global_step": 59434, "epoch": 1415} {"train_loss": -5.796670436859131, "global_step": 59435, "epoch": 1415} {"train_loss": -5.916257858276367, "global_step": 59436, "epoch": 1415} {"train_loss": -5.843358039855957, "global_step": 59437, "epoch": 1415} {"train_loss": -5.887845039367676, "global_step": 59438, "epoch": 1415} {"train_loss": -5.9372639656066895, "global_step": 59439, "epoch": 1415} {"train_loss": -5.9307684898376465, "global_step": 59440, "epoch": 1415} {"train_loss": -5.946593284606934, "global_step": 59441, "epoch": 1415} {"train_loss": -5.847836017608643, "global_step": 59442, "epoch": 1415} {"train_loss": -5.990424156188965, "global_step": 59443, "epoch": 1415} {"train_loss": -5.969677448272705, "global_step": 59444, "epoch": 1415} {"train_loss": -5.899296283721924, "global_step": 59445, "epoch": 1415} {"train_loss": -5.924548149108887, "global_step": 59446, "epoch": 1415} {"train_loss": -5.924596786499023, "global_step": 59447, "epoch": 1415} {"train_loss": -5.894765853881836, "global_step": 59448, "epoch": 1415} {"train_loss": -5.855603218078613, "global_step": 59449, "epoch": 1415} {"train_loss": -5.856172561645508, "global_step": 59450, "epoch": 1415} {"train_loss": -5.823968410491943, "global_step": 59451, "epoch": 1415} {"train_loss": -5.813564777374268, "global_step": 59452, "epoch": 1415} {"train_loss": -5.878864765167236, "global_step": 59453, "epoch": 1415} {"train_loss": -5.660861015319824, "global_step": 59454, "epoch": 1415} {"train_loss": -5.863897323608398, "global_step": 59455, "epoch": 1415} {"train_loss": -5.915019989013672, "global_step": 59456, "epoch": 1415} {"train_loss": -5.890788555145264, "global_step": 59457, "epoch": 1415} {"train_loss": -5.89376163482666, "global_step": 59458, "epoch": 1415} {"train_loss": -5.849772930145264, "global_step": 59459, "epoch": 1415} {"train_loss": -5.854265213012695, "global_step": 59460, "epoch": 1415} {"train_loss": -5.885676383972168, "global_step": 59461, "epoch": 1415} {"train_loss": -5.9066901206970215, "global_step": 59462, "epoch": 1415} {"train_loss": -5.881255626678467, "global_step": 59463, "epoch": 1415} {"train_loss": -5.823886871337891, "global_step": 59464, "epoch": 1415} {"train_loss": -5.9600934982299805, "global_step": 59465, "epoch": 1415} {"train_loss": -5.86836576461792, "global_step": 59466, "epoch": 1415} {"train_loss": -5.751916408538818, "global_step": 59467, "epoch": 1415} {"train_loss": -5.862886905670166, "global_step": 59468, "epoch": 1415} {"train_loss": -5.860967636108398, "global_step": 59469, "epoch": 1415} {"train_loss": -5.881528854370117, "global_step": 59470, "epoch": 1415} {"train_loss": -5.881625743139358, "global_step": 59471, "epoch": 1415, "val_loss": 66751.6953125} {"train_loss": -5.7824602127075195, "global_step": 59472, "epoch": 1416} {"train_loss": -5.880680084228516, "global_step": 59473, "epoch": 1416} {"train_loss": -5.813026428222656, "global_step": 59474, "epoch": 1416} {"train_loss": -5.801335334777832, "global_step": 59475, "epoch": 1416} {"train_loss": -5.966818332672119, "global_step": 59476, "epoch": 1416} {"train_loss": -5.904314041137695, "global_step": 59477, "epoch": 1416} {"train_loss": -5.897487163543701, "global_step": 59478, "epoch": 1416} {"train_loss": -5.933188438415527, "global_step": 59479, "epoch": 1416} {"train_loss": -5.742682456970215, "global_step": 59480, "epoch": 1416} {"train_loss": -5.9672698974609375, "global_step": 59481, "epoch": 1416} {"train_loss": -5.718521595001221, "global_step": 59482, "epoch": 1416} {"train_loss": -5.8450775146484375, "global_step": 59483, "epoch": 1416} {"train_loss": -5.8972907066345215, "global_step": 59484, "epoch": 1416} {"train_loss": -5.774956703186035, "global_step": 59485, "epoch": 1416} {"train_loss": -5.940704345703125, "global_step": 59486, "epoch": 1416} {"train_loss": -5.853233337402344, "global_step": 59487, "epoch": 1416} {"train_loss": -5.817225456237793, "global_step": 59488, "epoch": 1416} {"train_loss": -5.883541107177734, "global_step": 59489, "epoch": 1416} {"train_loss": -5.7555341720581055, "global_step": 59490, "epoch": 1416} {"train_loss": -5.70709228515625, "global_step": 59491, "epoch": 1416} {"train_loss": -5.775897026062012, "global_step": 59492, "epoch": 1416} {"train_loss": -5.758206367492676, "global_step": 59493, "epoch": 1416} {"train_loss": -5.8538289070129395, "global_step": 59494, "epoch": 1416} {"train_loss": -5.831171035766602, "global_step": 59495, "epoch": 1416} {"train_loss": -5.673428535461426, "global_step": 59496, "epoch": 1416} {"train_loss": -5.832815170288086, "global_step": 59497, "epoch": 1416} {"train_loss": -5.817727565765381, "global_step": 59498, "epoch": 1416} {"train_loss": -5.878108024597168, "global_step": 59499, "epoch": 1416} {"train_loss": -5.858039379119873, "global_step": 59500, "epoch": 1416} {"train_loss": -5.719436168670654, "global_step": 59501, "epoch": 1416} {"train_loss": -5.70339298248291, "global_step": 59502, "epoch": 1416} {"train_loss": -5.972790718078613, "global_step": 59503, "epoch": 1416} {"train_loss": -5.71951961517334, "global_step": 59504, "epoch": 1416} {"train_loss": -5.803994178771973, "global_step": 59505, "epoch": 1416} {"train_loss": -5.7558488845825195, "global_step": 59506, "epoch": 1416} {"train_loss": -5.964809417724609, "global_step": 59507, "epoch": 1416} {"train_loss": -5.812229156494141, "global_step": 59508, "epoch": 1416} {"train_loss": -5.806204319000244, "global_step": 59509, "epoch": 1416} {"train_loss": -5.761277198791504, "global_step": 59510, "epoch": 1416} {"train_loss": -5.786121368408203, "global_step": 59511, "epoch": 1416} {"train_loss": -5.897915840148926, "global_step": 59512, "epoch": 1416} {"train_loss": -5.8268025034949895, "global_step": 59513, "epoch": 1416, "val_loss": 66636.96875} {"train_loss": -5.903656005859375, "global_step": 59514, "epoch": 1417} {"train_loss": -5.79820442199707, "global_step": 59515, "epoch": 1417} {"train_loss": -5.8714470863342285, "global_step": 59516, "epoch": 1417} {"train_loss": -5.892441749572754, "global_step": 59517, "epoch": 1417} {"train_loss": -6.012011528015137, "global_step": 59518, "epoch": 1417} {"train_loss": -5.8358235359191895, "global_step": 59519, "epoch": 1417} {"train_loss": -5.690703392028809, "global_step": 59520, "epoch": 1417} {"train_loss": -5.868525505065918, "global_step": 59521, "epoch": 1417} {"train_loss": -5.871604919433594, "global_step": 59522, "epoch": 1417} {"train_loss": -5.702592849731445, "global_step": 59523, "epoch": 1417} {"train_loss": -5.854500770568848, "global_step": 59524, "epoch": 1417} {"train_loss": -5.8567047119140625, "global_step": 59525, "epoch": 1417} {"train_loss": -5.920928955078125, "global_step": 59526, "epoch": 1417} {"train_loss": -5.893338680267334, "global_step": 59527, "epoch": 1417} {"train_loss": -5.944942951202393, "global_step": 59528, "epoch": 1417} {"train_loss": -5.893129348754883, "global_step": 59529, "epoch": 1417} {"train_loss": -5.876188278198242, "global_step": 59530, "epoch": 1417} {"train_loss": -5.852192401885986, "global_step": 59531, "epoch": 1417} {"train_loss": -5.8663225173950195, "global_step": 59532, "epoch": 1417} {"train_loss": -5.987387657165527, "global_step": 59533, "epoch": 1417} {"train_loss": -5.915441989898682, "global_step": 59534, "epoch": 1417} {"train_loss": -5.778078079223633, "global_step": 59535, "epoch": 1417} {"train_loss": -5.866079330444336, "global_step": 59536, "epoch": 1417} {"train_loss": -5.781391620635986, "global_step": 59537, "epoch": 1417} {"train_loss": -5.872572898864746, "global_step": 59538, "epoch": 1417} {"train_loss": -5.787306785583496, "global_step": 59539, "epoch": 1417} {"train_loss": -5.797751426696777, "global_step": 59540, "epoch": 1417} {"train_loss": -5.901519775390625, "global_step": 59541, "epoch": 1417} {"train_loss": -5.906676292419434, "global_step": 59542, "epoch": 1417} {"train_loss": -5.8840532302856445, "global_step": 59543, "epoch": 1417} {"train_loss": -5.777033805847168, "global_step": 59544, "epoch": 1417} {"train_loss": -5.9650044441223145, "global_step": 59545, "epoch": 1417} {"train_loss": -5.837080001831055, "global_step": 59546, "epoch": 1417} {"train_loss": -5.821260452270508, "global_step": 59547, "epoch": 1417} {"train_loss": -5.798020362854004, "global_step": 59548, "epoch": 1417} {"train_loss": -5.809889793395996, "global_step": 59549, "epoch": 1417} {"train_loss": -6.007351875305176, "global_step": 59550, "epoch": 1417} {"train_loss": -5.933455944061279, "global_step": 59551, "epoch": 1417} {"train_loss": -5.8900837898254395, "global_step": 59552, "epoch": 1417} {"train_loss": -5.891457557678223, "global_step": 59553, "epoch": 1417} {"train_loss": -5.884675979614258, "global_step": 59554, "epoch": 1417} {"train_loss": -5.867449408485776, "global_step": 59555, "epoch": 1417, "val_loss": 66737.40625} {"train_loss": -5.908668518066406, "global_step": 59556, "epoch": 1418} {"train_loss": -5.735324382781982, "global_step": 59557, "epoch": 1418} {"train_loss": -5.847342014312744, "global_step": 59558, "epoch": 1418} {"train_loss": -5.981777191162109, "global_step": 59559, "epoch": 1418} {"train_loss": -5.955286502838135, "global_step": 59560, "epoch": 1418} {"train_loss": -5.892671585083008, "global_step": 59561, "epoch": 1418} {"train_loss": -6.000561714172363, "global_step": 59562, "epoch": 1418} {"train_loss": -5.843533515930176, "global_step": 59563, "epoch": 1418} {"train_loss": -5.894772052764893, "global_step": 59564, "epoch": 1418} {"train_loss": -5.873912811279297, "global_step": 59565, "epoch": 1418} {"train_loss": -5.771562576293945, "global_step": 59566, "epoch": 1418} {"train_loss": -5.912613868713379, "global_step": 59567, "epoch": 1418} {"train_loss": -5.850791931152344, "global_step": 59568, "epoch": 1418} {"train_loss": -5.898497581481934, "global_step": 59569, "epoch": 1418} {"train_loss": -5.983723163604736, "global_step": 59570, "epoch": 1418} {"train_loss": -5.799448013305664, "global_step": 59571, "epoch": 1418} {"train_loss": -5.777586936950684, "global_step": 59572, "epoch": 1418} {"train_loss": -5.861861228942871, "global_step": 59573, "epoch": 1418} {"train_loss": -5.8846588134765625, "global_step": 59574, "epoch": 1418} {"train_loss": -5.866064071655273, "global_step": 59575, "epoch": 1418} {"train_loss": -5.899663925170898, "global_step": 59576, "epoch": 1418} {"train_loss": -5.891036033630371, "global_step": 59577, "epoch": 1418} {"train_loss": -6.052731513977051, "global_step": 59578, "epoch": 1418} {"train_loss": -5.944701194763184, "global_step": 59579, "epoch": 1418} {"train_loss": -5.832133769989014, "global_step": 59580, "epoch": 1418} {"train_loss": -5.994122505187988, "global_step": 59581, "epoch": 1418} {"train_loss": -5.714406967163086, "global_step": 59582, "epoch": 1418} {"train_loss": -5.894964218139648, "global_step": 59583, "epoch": 1418} {"train_loss": -5.855537414550781, "global_step": 59584, "epoch": 1418} {"train_loss": -5.93662166595459, "global_step": 59585, "epoch": 1418} {"train_loss": -5.949684143066406, "global_step": 59586, "epoch": 1418} {"train_loss": -5.824702262878418, "global_step": 59587, "epoch": 1418} {"train_loss": -5.890082359313965, "global_step": 59588, "epoch": 1418} {"train_loss": -5.804718971252441, "global_step": 59589, "epoch": 1418} {"train_loss": -6.015840530395508, "global_step": 59590, "epoch": 1418} {"train_loss": -5.789883136749268, "global_step": 59591, "epoch": 1418} {"train_loss": -5.941642761230469, "global_step": 59592, "epoch": 1418} {"train_loss": -5.967123985290527, "global_step": 59593, "epoch": 1418} {"train_loss": -5.840190410614014, "global_step": 59594, "epoch": 1418} {"train_loss": -5.79825496673584, "global_step": 59595, "epoch": 1418} {"train_loss": -5.788512229919434, "global_step": 59596, "epoch": 1418} {"train_loss": -5.8816196237291605, "global_step": 59597, "epoch": 1418, "val_loss": 66545.53125} {"train_loss": -5.926912784576416, "global_step": 59598, "epoch": 1419} {"train_loss": -5.888594627380371, "global_step": 59599, "epoch": 1419} {"train_loss": -5.8925371170043945, "global_step": 59600, "epoch": 1419} {"train_loss": -5.954893589019775, "global_step": 59601, "epoch": 1419} {"train_loss": -5.9435529708862305, "global_step": 59602, "epoch": 1419} {"train_loss": -5.956099510192871, "global_step": 59603, "epoch": 1419} {"train_loss": -5.825540065765381, "global_step": 59604, "epoch": 1419} {"train_loss": -5.930681228637695, "global_step": 59605, "epoch": 1419} {"train_loss": -5.888070106506348, "global_step": 59606, "epoch": 1419} {"train_loss": -5.83655309677124, "global_step": 59607, "epoch": 1419} {"train_loss": -5.934732437133789, "global_step": 59608, "epoch": 1419} {"train_loss": -5.863821506500244, "global_step": 59609, "epoch": 1419} {"train_loss": -5.841185092926025, "global_step": 59610, "epoch": 1419} {"train_loss": -5.887685775756836, "global_step": 59611, "epoch": 1419} {"train_loss": -5.718581199645996, "global_step": 59612, "epoch": 1419} {"train_loss": -6.035288333892822, "global_step": 59613, "epoch": 1419} {"train_loss": -5.748619556427002, "global_step": 59614, "epoch": 1419} {"train_loss": -5.867955207824707, "global_step": 59615, "epoch": 1419} {"train_loss": -5.872830390930176, "global_step": 59616, "epoch": 1419} {"train_loss": -5.777887344360352, "global_step": 59617, "epoch": 1419} {"train_loss": -5.916925430297852, "global_step": 59618, "epoch": 1419} {"train_loss": -5.864980697631836, "global_step": 59619, "epoch": 1419} {"train_loss": -5.889336585998535, "global_step": 59620, "epoch": 1419} {"train_loss": -5.912043571472168, "global_step": 59621, "epoch": 1419} {"train_loss": -5.7951836585998535, "global_step": 59622, "epoch": 1419} {"train_loss": -5.876540660858154, "global_step": 59623, "epoch": 1419} {"train_loss": -5.896025657653809, "global_step": 59624, "epoch": 1419} {"train_loss": -5.949178695678711, "global_step": 59625, "epoch": 1419} {"train_loss": -5.771811485290527, "global_step": 59626, "epoch": 1419} {"train_loss": -5.933469772338867, "global_step": 59627, "epoch": 1419} {"train_loss": -5.958395957946777, "global_step": 59628, "epoch": 1419} {"train_loss": -5.981184005737305, "global_step": 59629, "epoch": 1419} {"train_loss": -5.906826972961426, "global_step": 59630, "epoch": 1419} {"train_loss": -5.7995100021362305, "global_step": 59631, "epoch": 1419} {"train_loss": -5.877264976501465, "global_step": 59632, "epoch": 1419} {"train_loss": -5.830860137939453, "global_step": 59633, "epoch": 1419} {"train_loss": -5.973386764526367, "global_step": 59634, "epoch": 1419} {"train_loss": -5.895566940307617, "global_step": 59635, "epoch": 1419} {"train_loss": -6.105466842651367, "global_step": 59636, "epoch": 1419} {"train_loss": -5.953802108764648, "global_step": 59637, "epoch": 1419} {"train_loss": -5.967837333679199, "global_step": 59638, "epoch": 1419} {"train_loss": -5.893024319694156, "global_step": 59639, "epoch": 1419, "val_loss": 66605.3984375} {"train_loss": -5.868021488189697, "global_step": 59640, "epoch": 1420} {"train_loss": -5.896881103515625, "global_step": 59641, "epoch": 1420} {"train_loss": -5.96660852432251, "global_step": 59642, "epoch": 1420} {"train_loss": -5.9626617431640625, "global_step": 59643, "epoch": 1420} {"train_loss": -5.902007102966309, "global_step": 59644, "epoch": 1420} {"train_loss": -5.767749309539795, "global_step": 59645, "epoch": 1420} {"train_loss": -5.9222259521484375, "global_step": 59646, "epoch": 1420} {"train_loss": -5.905661582946777, "global_step": 59647, "epoch": 1420} {"train_loss": -5.869383811950684, "global_step": 59648, "epoch": 1420} {"train_loss": -5.923613548278809, "global_step": 59649, "epoch": 1420} {"train_loss": -5.836256504058838, "global_step": 59650, "epoch": 1420} {"train_loss": -5.958850860595703, "global_step": 59651, "epoch": 1420} {"train_loss": -6.025226593017578, "global_step": 59652, "epoch": 1420} {"train_loss": -5.865867614746094, "global_step": 59653, "epoch": 1420} {"train_loss": -6.014488220214844, "global_step": 59654, "epoch": 1420} {"train_loss": -5.809109210968018, "global_step": 59655, "epoch": 1420} {"train_loss": -5.9588727951049805, "global_step": 59656, "epoch": 1420} {"train_loss": -5.8867034912109375, "global_step": 59657, "epoch": 1420} {"train_loss": -5.962729454040527, "global_step": 59658, "epoch": 1420} {"train_loss": -5.921976566314697, "global_step": 59659, "epoch": 1420} {"train_loss": -5.854302406311035, "global_step": 59660, "epoch": 1420} {"train_loss": -5.8489179611206055, "global_step": 59661, "epoch": 1420} {"train_loss": -5.775186538696289, "global_step": 59662, "epoch": 1420} {"train_loss": -5.892236709594727, "global_step": 59663, "epoch": 1420} {"train_loss": -5.940530300140381, "global_step": 59664, "epoch": 1420} {"train_loss": -5.819850921630859, "global_step": 59665, "epoch": 1420} {"train_loss": -5.997697353363037, "global_step": 59666, "epoch": 1420} {"train_loss": -5.869057655334473, "global_step": 59667, "epoch": 1420} {"train_loss": -6.042446613311768, "global_step": 59668, "epoch": 1420} {"train_loss": -5.866483688354492, "global_step": 59669, "epoch": 1420} {"train_loss": -5.905933856964111, "global_step": 59670, "epoch": 1420} {"train_loss": -5.864377021789551, "global_step": 59671, "epoch": 1420} {"train_loss": -6.017579078674316, "global_step": 59672, "epoch": 1420} {"train_loss": -5.837856292724609, "global_step": 59673, "epoch": 1420} {"train_loss": -5.796935081481934, "global_step": 59674, "epoch": 1420} {"train_loss": -5.847222328186035, "global_step": 59675, "epoch": 1420} {"train_loss": -5.943014144897461, "global_step": 59676, "epoch": 1420} {"train_loss": -5.870680809020996, "global_step": 59677, "epoch": 1420} {"train_loss": -5.805342197418213, "global_step": 59678, "epoch": 1420} {"train_loss": -5.831860542297363, "global_step": 59679, "epoch": 1420} {"train_loss": -5.855068206787109, "global_step": 59680, "epoch": 1420} {"train_loss": -5.8923765818278, "global_step": 59681, "epoch": 1420, "val_loss": 66510.765625} {"train_loss": -5.89276123046875, "global_step": 59682, "epoch": 1421} {"train_loss": -5.7515153884887695, "global_step": 59683, "epoch": 1421} {"train_loss": -5.930037975311279, "global_step": 59684, "epoch": 1421} {"train_loss": -5.791329383850098, "global_step": 59685, "epoch": 1421} {"train_loss": -5.991079330444336, "global_step": 59686, "epoch": 1421} {"train_loss": -5.840707778930664, "global_step": 59687, "epoch": 1421} {"train_loss": -5.912108421325684, "global_step": 59688, "epoch": 1421} {"train_loss": -5.899706840515137, "global_step": 59689, "epoch": 1421} {"train_loss": -5.788453102111816, "global_step": 59690, "epoch": 1421} {"train_loss": -5.910589218139648, "global_step": 59691, "epoch": 1421} {"train_loss": -6.024785995483398, "global_step": 59692, "epoch": 1421} {"train_loss": -5.962064743041992, "global_step": 59693, "epoch": 1421} {"train_loss": -5.874756813049316, "global_step": 59694, "epoch": 1421} {"train_loss": -5.826814651489258, "global_step": 59695, "epoch": 1421} {"train_loss": -6.032810211181641, "global_step": 59696, "epoch": 1421} {"train_loss": -5.905579566955566, "global_step": 59697, "epoch": 1421} {"train_loss": -5.810276985168457, "global_step": 59698, "epoch": 1421} {"train_loss": -5.869168758392334, "global_step": 59699, "epoch": 1421} {"train_loss": -5.834987640380859, "global_step": 59700, "epoch": 1421} {"train_loss": -5.8480706214904785, "global_step": 59701, "epoch": 1421} {"train_loss": -5.837475776672363, "global_step": 59702, "epoch": 1421} {"train_loss": -5.849508285522461, "global_step": 59703, "epoch": 1421} {"train_loss": -5.77009916305542, "global_step": 59704, "epoch": 1421} {"train_loss": -5.871006965637207, "global_step": 59705, "epoch": 1421} {"train_loss": -5.880385398864746, "global_step": 59706, "epoch": 1421} {"train_loss": -5.86024284362793, "global_step": 59707, "epoch": 1421} {"train_loss": -5.815424919128418, "global_step": 59708, "epoch": 1421} {"train_loss": -5.6960296630859375, "global_step": 59709, "epoch": 1421} {"train_loss": -5.781131744384766, "global_step": 59710, "epoch": 1421} {"train_loss": -5.872057914733887, "global_step": 59711, "epoch": 1421} {"train_loss": -5.7326459884643555, "global_step": 59712, "epoch": 1421} {"train_loss": -5.832669258117676, "global_step": 59713, "epoch": 1421} {"train_loss": -5.696771144866943, "global_step": 59714, "epoch": 1421} {"train_loss": -5.883266925811768, "global_step": 59715, "epoch": 1421} {"train_loss": -5.773016929626465, "global_step": 59716, "epoch": 1421} {"train_loss": -5.930480480194092, "global_step": 59717, "epoch": 1421} {"train_loss": -5.9057135581970215, "global_step": 59718, "epoch": 1421} {"train_loss": -5.8063554763793945, "global_step": 59719, "epoch": 1421} {"train_loss": -5.860488414764404, "global_step": 59720, "epoch": 1421} {"train_loss": -5.919798374176025, "global_step": 59721, "epoch": 1421} {"train_loss": -5.921504974365234, "global_step": 59722, "epoch": 1421} {"train_loss": -5.86014875911531, "global_step": 59723, "epoch": 1421, "val_loss": 66403.6796875} {"train_loss": -5.852583885192871, "global_step": 59724, "epoch": 1422} {"train_loss": -5.934104919433594, "global_step": 59725, "epoch": 1422} {"train_loss": -5.96911096572876, "global_step": 59726, "epoch": 1422} {"train_loss": -5.900299072265625, "global_step": 59727, "epoch": 1422} {"train_loss": -5.969815254211426, "global_step": 59728, "epoch": 1422} {"train_loss": -5.9758453369140625, "global_step": 59729, "epoch": 1422} {"train_loss": -5.765601634979248, "global_step": 59730, "epoch": 1422} {"train_loss": -5.943995475769043, "global_step": 59731, "epoch": 1422} {"train_loss": -5.889532089233398, "global_step": 59732, "epoch": 1422} {"train_loss": -5.653782367706299, "global_step": 59733, "epoch": 1422} {"train_loss": -5.846372127532959, "global_step": 59734, "epoch": 1422} {"train_loss": -5.822300910949707, "global_step": 59735, "epoch": 1422} {"train_loss": -5.957223415374756, "global_step": 59736, "epoch": 1422} {"train_loss": -5.831982612609863, "global_step": 59737, "epoch": 1422} {"train_loss": -5.984369277954102, "global_step": 59738, "epoch": 1422} {"train_loss": -5.824692249298096, "global_step": 59739, "epoch": 1422} {"train_loss": -5.839595317840576, "global_step": 59740, "epoch": 1422} {"train_loss": -5.8386945724487305, "global_step": 59741, "epoch": 1422} {"train_loss": -5.943218231201172, "global_step": 59742, "epoch": 1422} {"train_loss": -5.910909652709961, "global_step": 59743, "epoch": 1422} {"train_loss": -5.91040563583374, "global_step": 59744, "epoch": 1422} {"train_loss": -5.768866062164307, "global_step": 59745, "epoch": 1422} {"train_loss": -5.954593658447266, "global_step": 59746, "epoch": 1422} {"train_loss": -5.814359664916992, "global_step": 59747, "epoch": 1422} {"train_loss": -5.767106533050537, "global_step": 59748, "epoch": 1422} {"train_loss": -5.786231994628906, "global_step": 59749, "epoch": 1422} {"train_loss": -5.835562705993652, "global_step": 59750, "epoch": 1422} {"train_loss": -5.8066558837890625, "global_step": 59751, "epoch": 1422} {"train_loss": -5.829836368560791, "global_step": 59752, "epoch": 1422} {"train_loss": -5.774239540100098, "global_step": 59753, "epoch": 1422} {"train_loss": -5.805020809173584, "global_step": 59754, "epoch": 1422} {"train_loss": -5.953776836395264, "global_step": 59755, "epoch": 1422} {"train_loss": -5.784763336181641, "global_step": 59756, "epoch": 1422} {"train_loss": -5.826551914215088, "global_step": 59757, "epoch": 1422} {"train_loss": -5.890895843505859, "global_step": 59758, "epoch": 1422} {"train_loss": -5.819854259490967, "global_step": 59759, "epoch": 1422} {"train_loss": -5.936539173126221, "global_step": 59760, "epoch": 1422} {"train_loss": -5.88071346282959, "global_step": 59761, "epoch": 1422} {"train_loss": -5.815351486206055, "global_step": 59762, "epoch": 1422} {"train_loss": -5.906632423400879, "global_step": 59763, "epoch": 1422} {"train_loss": -5.869128227233887, "global_step": 59764, "epoch": 1422} {"train_loss": -5.863970359166463, "global_step": 59765, "epoch": 1422, "val_loss": 67394.03125} {"train_loss": -5.963235855102539, "global_step": 59766, "epoch": 1423} {"train_loss": -5.809835910797119, "global_step": 59767, "epoch": 1423} {"train_loss": -6.005353927612305, "global_step": 59768, "epoch": 1423} {"train_loss": -5.822798728942871, "global_step": 59769, "epoch": 1423} {"train_loss": -5.827651023864746, "global_step": 59770, "epoch": 1423} {"train_loss": -6.012831211090088, "global_step": 59771, "epoch": 1423} {"train_loss": -5.892492294311523, "global_step": 59772, "epoch": 1423} {"train_loss": -5.900852203369141, "global_step": 59773, "epoch": 1423} {"train_loss": -5.842432022094727, "global_step": 59774, "epoch": 1423} {"train_loss": -5.87462043762207, "global_step": 59775, "epoch": 1423} {"train_loss": -5.853814125061035, "global_step": 59776, "epoch": 1423} {"train_loss": -5.9471435546875, "global_step": 59777, "epoch": 1423} {"train_loss": -5.784376621246338, "global_step": 59778, "epoch": 1423} {"train_loss": -5.8600969314575195, "global_step": 59779, "epoch": 1423} {"train_loss": -5.87971305847168, "global_step": 59780, "epoch": 1423} {"train_loss": -5.938094139099121, "global_step": 59781, "epoch": 1423} {"train_loss": -5.878237724304199, "global_step": 59782, "epoch": 1423} {"train_loss": -5.866507053375244, "global_step": 59783, "epoch": 1423} {"train_loss": -5.888710021972656, "global_step": 59784, "epoch": 1423} {"train_loss": -5.861553192138672, "global_step": 59785, "epoch": 1423} {"train_loss": -5.847252368927002, "global_step": 59786, "epoch": 1423} {"train_loss": -5.884747505187988, "global_step": 59787, "epoch": 1423} {"train_loss": -5.855295181274414, "global_step": 59788, "epoch": 1423} {"train_loss": -5.781660079956055, "global_step": 59789, "epoch": 1423} {"train_loss": -5.78230094909668, "global_step": 59790, "epoch": 1423} {"train_loss": -5.906832695007324, "global_step": 59791, "epoch": 1423} {"train_loss": -5.73322868347168, "global_step": 59792, "epoch": 1423} {"train_loss": -5.972810745239258, "global_step": 59793, "epoch": 1423} {"train_loss": -5.894338607788086, "global_step": 59794, "epoch": 1423} {"train_loss": -5.879040718078613, "global_step": 59795, "epoch": 1423} {"train_loss": -5.850677013397217, "global_step": 59796, "epoch": 1423} {"train_loss": -5.830943584442139, "global_step": 59797, "epoch": 1423} {"train_loss": -5.877913475036621, "global_step": 59798, "epoch": 1423} {"train_loss": -5.759217262268066, "global_step": 59799, "epoch": 1423} {"train_loss": -5.847890853881836, "global_step": 59800, "epoch": 1423} {"train_loss": -5.89409065246582, "global_step": 59801, "epoch": 1423} {"train_loss": -5.907862663269043, "global_step": 59802, "epoch": 1423} {"train_loss": -5.873847007751465, "global_step": 59803, "epoch": 1423} {"train_loss": -5.875472068786621, "global_step": 59804, "epoch": 1423} {"train_loss": -5.898898124694824, "global_step": 59805, "epoch": 1423} {"train_loss": -5.846766948699951, "global_step": 59806, "epoch": 1423} {"train_loss": -5.870097841535296, "global_step": 59807, "epoch": 1423, "val_loss": 66933.96875} {"train_loss": -5.954695224761963, "global_step": 59808, "epoch": 1424} {"train_loss": -6.0001726150512695, "global_step": 59809, "epoch": 1424} {"train_loss": -5.8628315925598145, "global_step": 59810, "epoch": 1424} {"train_loss": -5.881863594055176, "global_step": 59811, "epoch": 1424} {"train_loss": -5.901673316955566, "global_step": 59812, "epoch": 1424} {"train_loss": -5.983935356140137, "global_step": 59813, "epoch": 1424} {"train_loss": -5.9053544998168945, "global_step": 59814, "epoch": 1424} {"train_loss": -5.889337062835693, "global_step": 59815, "epoch": 1424} {"train_loss": -5.825932502746582, "global_step": 59816, "epoch": 1424} {"train_loss": -5.703957557678223, "global_step": 59817, "epoch": 1424} {"train_loss": -5.777667999267578, "global_step": 59818, "epoch": 1424} {"train_loss": -5.961058616638184, "global_step": 59819, "epoch": 1424} {"train_loss": -5.844403266906738, "global_step": 59820, "epoch": 1424} {"train_loss": -5.836829662322998, "global_step": 59821, "epoch": 1424} {"train_loss": -5.854229927062988, "global_step": 59822, "epoch": 1424} {"train_loss": -5.706305503845215, "global_step": 59823, "epoch": 1424} {"train_loss": -5.899684429168701, "global_step": 59824, "epoch": 1424} {"train_loss": -5.781774997711182, "global_step": 59825, "epoch": 1424} {"train_loss": -5.845660209655762, "global_step": 59826, "epoch": 1424} {"train_loss": -5.935807228088379, "global_step": 59827, "epoch": 1424} {"train_loss": -5.880959510803223, "global_step": 59828, "epoch": 1424} {"train_loss": -5.877967357635498, "global_step": 59829, "epoch": 1424} {"train_loss": -5.881397247314453, "global_step": 59830, "epoch": 1424} {"train_loss": -5.878827095031738, "global_step": 59831, "epoch": 1424} {"train_loss": -5.954618453979492, "global_step": 59832, "epoch": 1424} {"train_loss": -5.891739845275879, "global_step": 59833, "epoch": 1424} {"train_loss": -5.961520195007324, "global_step": 59834, "epoch": 1424} {"train_loss": -5.903260707855225, "global_step": 59835, "epoch": 1424} {"train_loss": -5.839206695556641, "global_step": 59836, "epoch": 1424} {"train_loss": -5.896731376647949, "global_step": 59837, "epoch": 1424} {"train_loss": -5.997366428375244, "global_step": 59838, "epoch": 1424} {"train_loss": -6.074901580810547, "global_step": 59839, "epoch": 1424} {"train_loss": -5.950077533721924, "global_step": 59840, "epoch": 1424} {"train_loss": -5.91876220703125, "global_step": 59841, "epoch": 1424} {"train_loss": -5.885795593261719, "global_step": 59842, "epoch": 1424} {"train_loss": -5.94598388671875, "global_step": 59843, "epoch": 1424} {"train_loss": -5.808117866516113, "global_step": 59844, "epoch": 1424} {"train_loss": -5.958505630493164, "global_step": 59845, "epoch": 1424} {"train_loss": -5.828003406524658, "global_step": 59846, "epoch": 1424} {"train_loss": -5.965462684631348, "global_step": 59847, "epoch": 1424} {"train_loss": -5.820989608764648, "global_step": 59848, "epoch": 1424} {"train_loss": -5.892769700004941, "global_step": 59849, "epoch": 1424, "val_loss": 66540.921875} {"train_loss": -5.887257099151611, "global_step": 59850, "epoch": 1425} {"train_loss": -6.010353088378906, "global_step": 59851, "epoch": 1425} {"train_loss": -5.907052040100098, "global_step": 59852, "epoch": 1425} {"train_loss": -5.906947135925293, "global_step": 59853, "epoch": 1425} {"train_loss": -5.833911895751953, "global_step": 59854, "epoch": 1425} {"train_loss": -5.933460712432861, "global_step": 59855, "epoch": 1425} {"train_loss": -5.854334831237793, "global_step": 59856, "epoch": 1425} {"train_loss": -5.78291130065918, "global_step": 59857, "epoch": 1425} {"train_loss": -5.767039775848389, "global_step": 59858, "epoch": 1425} {"train_loss": -5.924653053283691, "global_step": 59859, "epoch": 1425} {"train_loss": -5.780515670776367, "global_step": 59860, "epoch": 1425} {"train_loss": -5.920316696166992, "global_step": 59861, "epoch": 1425} {"train_loss": -5.971543788909912, "global_step": 59862, "epoch": 1425} {"train_loss": -5.913213729858398, "global_step": 59863, "epoch": 1425} {"train_loss": -5.959589004516602, "global_step": 59864, "epoch": 1425} {"train_loss": -5.80800199508667, "global_step": 59865, "epoch": 1425} {"train_loss": -5.802000999450684, "global_step": 59866, "epoch": 1425} {"train_loss": -5.93393087387085, "global_step": 59867, "epoch": 1425} {"train_loss": -5.922079086303711, "global_step": 59868, "epoch": 1425} {"train_loss": -5.991951942443848, "global_step": 59869, "epoch": 1425} {"train_loss": -6.042276382446289, "global_step": 59870, "epoch": 1425} {"train_loss": -5.847110271453857, "global_step": 59871, "epoch": 1425} {"train_loss": -5.897138595581055, "global_step": 59872, "epoch": 1425} {"train_loss": -5.97227144241333, "global_step": 59873, "epoch": 1425} {"train_loss": -5.99592924118042, "global_step": 59874, "epoch": 1425} {"train_loss": -5.897964000701904, "global_step": 59875, "epoch": 1425} {"train_loss": -5.949932098388672, "global_step": 59876, "epoch": 1425} {"train_loss": -5.83527946472168, "global_step": 59877, "epoch": 1425} {"train_loss": -5.899758338928223, "global_step": 59878, "epoch": 1425} {"train_loss": -5.824306011199951, "global_step": 59879, "epoch": 1425} {"train_loss": -5.825695037841797, "global_step": 59880, "epoch": 1425} {"train_loss": -5.951713562011719, "global_step": 59881, "epoch": 1425} {"train_loss": -5.92057991027832, "global_step": 59882, "epoch": 1425} {"train_loss": -5.82989501953125, "global_step": 59883, "epoch": 1425} {"train_loss": -5.9849114418029785, "global_step": 59884, "epoch": 1425} {"train_loss": -5.849030494689941, "global_step": 59885, "epoch": 1425} {"train_loss": -5.874667167663574, "global_step": 59886, "epoch": 1425} {"train_loss": -5.888776779174805, "global_step": 59887, "epoch": 1425} {"train_loss": -5.909285545349121, "global_step": 59888, "epoch": 1425} {"train_loss": -5.8791093826293945, "global_step": 59889, "epoch": 1425} {"train_loss": -5.9266252517700195, "global_step": 59890, "epoch": 1425} {"train_loss": -5.895565577915737, "global_step": 59891, "epoch": 1425, "val_loss": 66707.375} {"train_loss": -5.963303089141846, "global_step": 59892, "epoch": 1426} {"train_loss": -5.898016929626465, "global_step": 59893, "epoch": 1426} {"train_loss": -6.02592658996582, "global_step": 59894, "epoch": 1426} {"train_loss": -5.885196685791016, "global_step": 59895, "epoch": 1426} {"train_loss": -6.012664794921875, "global_step": 59896, "epoch": 1426} {"train_loss": -5.9647932052612305, "global_step": 59897, "epoch": 1426} {"train_loss": -5.900254726409912, "global_step": 59898, "epoch": 1426} {"train_loss": -5.861939430236816, "global_step": 59899, "epoch": 1426} {"train_loss": -5.937475204467773, "global_step": 59900, "epoch": 1426} {"train_loss": -5.860166072845459, "global_step": 59901, "epoch": 1426} {"train_loss": -5.8548054695129395, "global_step": 59902, "epoch": 1426} {"train_loss": -5.890209197998047, "global_step": 59903, "epoch": 1426} {"train_loss": -5.9787421226501465, "global_step": 59904, "epoch": 1426} {"train_loss": -5.900611877441406, "global_step": 59905, "epoch": 1426} {"train_loss": -5.798227310180664, "global_step": 59906, "epoch": 1426} {"train_loss": -5.861049652099609, "global_step": 59907, "epoch": 1426} {"train_loss": -5.941295623779297, "global_step": 59908, "epoch": 1426} {"train_loss": -5.833034038543701, "global_step": 59909, "epoch": 1426} {"train_loss": -5.864612579345703, "global_step": 59910, "epoch": 1426} {"train_loss": -5.867700099945068, "global_step": 59911, "epoch": 1426} {"train_loss": -5.920502662658691, "global_step": 59912, "epoch": 1426} {"train_loss": -5.841403007507324, "global_step": 59913, "epoch": 1426} {"train_loss": -5.972583293914795, "global_step": 59914, "epoch": 1426} {"train_loss": -5.752218246459961, "global_step": 59915, "epoch": 1426} {"train_loss": -5.87573766708374, "global_step": 59916, "epoch": 1426} {"train_loss": -5.785979270935059, "global_step": 59917, "epoch": 1426} {"train_loss": -5.841491222381592, "global_step": 59918, "epoch": 1426} {"train_loss": -5.913222312927246, "global_step": 59919, "epoch": 1426} {"train_loss": -5.8671417236328125, "global_step": 59920, "epoch": 1426} {"train_loss": -5.875144004821777, "global_step": 59921, "epoch": 1426} {"train_loss": -5.871725082397461, "global_step": 59922, "epoch": 1426} {"train_loss": -5.828505516052246, "global_step": 59923, "epoch": 1426} {"train_loss": -5.897587776184082, "global_step": 59924, "epoch": 1426} {"train_loss": -5.783121109008789, "global_step": 59925, "epoch": 1426} {"train_loss": -5.7190046310424805, "global_step": 59926, "epoch": 1426} {"train_loss": -5.877727031707764, "global_step": 59927, "epoch": 1426} {"train_loss": -5.861440658569336, "global_step": 59928, "epoch": 1426} {"train_loss": -5.9203572273254395, "global_step": 59929, "epoch": 1426} {"train_loss": -5.901238441467285, "global_step": 59930, "epoch": 1426} {"train_loss": -5.828044891357422, "global_step": 59931, "epoch": 1426} {"train_loss": -6.002799034118652, "global_step": 59932, "epoch": 1426} {"train_loss": -5.882579156330654, "global_step": 59933, "epoch": 1426, "val_loss": 66980.5546875} {"train_loss": -5.970104217529297, "global_step": 59934, "epoch": 1427} {"train_loss": -5.833261489868164, "global_step": 59935, "epoch": 1427} {"train_loss": -5.7304792404174805, "global_step": 59936, "epoch": 1427} {"train_loss": -6.024811744689941, "global_step": 59937, "epoch": 1427} {"train_loss": -5.787303924560547, "global_step": 59938, "epoch": 1427} {"train_loss": -5.796407699584961, "global_step": 59939, "epoch": 1427} {"train_loss": -5.876248836517334, "global_step": 59940, "epoch": 1427} {"train_loss": -5.963028907775879, "global_step": 59941, "epoch": 1427} {"train_loss": -5.8638224601745605, "global_step": 59942, "epoch": 1427} {"train_loss": -5.786708354949951, "global_step": 59943, "epoch": 1427} {"train_loss": -5.884769439697266, "global_step": 59944, "epoch": 1427} {"train_loss": -5.77407169342041, "global_step": 59945, "epoch": 1427} {"train_loss": -5.853105545043945, "global_step": 59946, "epoch": 1427} {"train_loss": -5.850901126861572, "global_step": 59947, "epoch": 1427} {"train_loss": -6.01619815826416, "global_step": 59948, "epoch": 1427} {"train_loss": -5.771746635437012, "global_step": 59949, "epoch": 1427} {"train_loss": -5.82313346862793, "global_step": 59950, "epoch": 1427} {"train_loss": -5.843623638153076, "global_step": 59951, "epoch": 1427} {"train_loss": -5.852435111999512, "global_step": 59952, "epoch": 1427} {"train_loss": -5.942447662353516, "global_step": 59953, "epoch": 1427} {"train_loss": -5.846592903137207, "global_step": 59954, "epoch": 1427} {"train_loss": -5.773265838623047, "global_step": 59955, "epoch": 1427} {"train_loss": -5.767989635467529, "global_step": 59956, "epoch": 1427} {"train_loss": -5.845836639404297, "global_step": 59957, "epoch": 1427} {"train_loss": -5.960456848144531, "global_step": 59958, "epoch": 1427} {"train_loss": -5.835626602172852, "global_step": 59959, "epoch": 1427} {"train_loss": -5.874817371368408, "global_step": 59960, "epoch": 1427} {"train_loss": -5.951919078826904, "global_step": 59961, "epoch": 1427} {"train_loss": -5.836209774017334, "global_step": 59962, "epoch": 1427} {"train_loss": -5.900244235992432, "global_step": 59963, "epoch": 1427} {"train_loss": -5.802111625671387, "global_step": 59964, "epoch": 1427} {"train_loss": -5.756176948547363, "global_step": 59965, "epoch": 1427} {"train_loss": -5.814426422119141, "global_step": 59966, "epoch": 1427} {"train_loss": -5.75750732421875, "global_step": 59967, "epoch": 1427} {"train_loss": -5.864389419555664, "global_step": 59968, "epoch": 1427} {"train_loss": -5.735450744628906, "global_step": 59969, "epoch": 1427} {"train_loss": -5.91549015045166, "global_step": 59970, "epoch": 1427} {"train_loss": -5.911843299865723, "global_step": 59971, "epoch": 1427} {"train_loss": -5.885948657989502, "global_step": 59972, "epoch": 1427} {"train_loss": -5.823102951049805, "global_step": 59973, "epoch": 1427} {"train_loss": -5.91038703918457, "global_step": 59974, "epoch": 1427} {"train_loss": -5.8530411039079935, "global_step": 59975, "epoch": 1427, "val_loss": 66943.8671875} {"train_loss": -5.884161472320557, "global_step": 59976, "epoch": 1428} {"train_loss": -5.9568939208984375, "global_step": 59977, "epoch": 1428} {"train_loss": -5.819231033325195, "global_step": 59978, "epoch": 1428} {"train_loss": -5.8992414474487305, "global_step": 59979, "epoch": 1428} {"train_loss": -5.804767608642578, "global_step": 59980, "epoch": 1428} {"train_loss": -5.872705459594727, "global_step": 59981, "epoch": 1428} {"train_loss": -5.9320783615112305, "global_step": 59982, "epoch": 1428} {"train_loss": -5.89614200592041, "global_step": 59983, "epoch": 1428} {"train_loss": -5.804616451263428, "global_step": 59984, "epoch": 1428} {"train_loss": -5.942465782165527, "global_step": 59985, "epoch": 1428} {"train_loss": -5.873175621032715, "global_step": 59986, "epoch": 1428} {"train_loss": -5.837826251983643, "global_step": 59987, "epoch": 1428} {"train_loss": -5.946907043457031, "global_step": 59988, "epoch": 1428} {"train_loss": -5.943593502044678, "global_step": 59989, "epoch": 1428} {"train_loss": -5.904061317443848, "global_step": 59990, "epoch": 1428} {"train_loss": -5.860300064086914, "global_step": 59991, "epoch": 1428} {"train_loss": -5.875425338745117, "global_step": 59992, "epoch": 1428} {"train_loss": -5.969486236572266, "global_step": 59993, "epoch": 1428} {"train_loss": -5.920171737670898, "global_step": 59994, "epoch": 1428} {"train_loss": -5.986584186553955, "global_step": 59995, "epoch": 1428} {"train_loss": -5.929538249969482, "global_step": 59996, "epoch": 1428} {"train_loss": -5.788816928863525, "global_step": 59997, "epoch": 1428} {"train_loss": -5.923406600952148, "global_step": 59998, "epoch": 1428} {"train_loss": -5.909618377685547, "global_step": 59999, "epoch": 1428} {"train_loss": -5.9243693351745605, "global_step": 60000, "epoch": 1428} {"train_loss": -5.903420925140381, "global_step": 60001, "epoch": 1428} {"train_loss": -5.834152698516846, "global_step": 60002, "epoch": 1428} {"train_loss": -5.914923667907715, "global_step": 60003, "epoch": 1428} {"train_loss": -5.89995002746582, "global_step": 60004, "epoch": 1428} {"train_loss": -5.938392639160156, "global_step": 60005, "epoch": 1428} {"train_loss": -5.9239654541015625, "global_step": 60006, "epoch": 1428} {"train_loss": -5.926657676696777, "global_step": 60007, "epoch": 1428} {"train_loss": -5.811640739440918, "global_step": 60008, "epoch": 1428} {"train_loss": -5.755279541015625, "global_step": 60009, "epoch": 1428} {"train_loss": -5.899769306182861, "global_step": 60010, "epoch": 1428} {"train_loss": -5.931379318237305, "global_step": 60011, "epoch": 1428} {"train_loss": -5.836942672729492, "global_step": 60012, "epoch": 1428} {"train_loss": -5.918601036071777, "global_step": 60013, "epoch": 1428} {"train_loss": -5.943164825439453, "global_step": 60014, "epoch": 1428} {"train_loss": -5.89499044418335, "global_step": 60015, "epoch": 1428} {"train_loss": -5.903601169586182, "global_step": 60016, "epoch": 1428} {"train_loss": -5.8940061046963645, "global_step": 60017, "epoch": 1428, "val_loss": 66501.6796875} {"train_loss": -5.856706619262695, "global_step": 60018, "epoch": 1429} {"train_loss": -5.905592441558838, "global_step": 60019, "epoch": 1429} {"train_loss": -5.915324687957764, "global_step": 60020, "epoch": 1429} {"train_loss": -5.942587852478027, "global_step": 60021, "epoch": 1429} {"train_loss": -5.878414154052734, "global_step": 60022, "epoch": 1429} {"train_loss": -5.910877227783203, "global_step": 60023, "epoch": 1429} {"train_loss": -5.792909145355225, "global_step": 60024, "epoch": 1429} {"train_loss": -6.035001277923584, "global_step": 60025, "epoch": 1429} {"train_loss": -5.926085472106934, "global_step": 60026, "epoch": 1429} {"train_loss": -5.883005142211914, "global_step": 60027, "epoch": 1429} {"train_loss": -5.974204063415527, "global_step": 60028, "epoch": 1429} {"train_loss": -5.920112609863281, "global_step": 60029, "epoch": 1429} {"train_loss": -5.951813697814941, "global_step": 60030, "epoch": 1429} {"train_loss": -5.945830345153809, "global_step": 60031, "epoch": 1429} {"train_loss": -5.9685211181640625, "global_step": 60032, "epoch": 1429} {"train_loss": -5.985579490661621, "global_step": 60033, "epoch": 1429} {"train_loss": -5.941320419311523, "global_step": 60034, "epoch": 1429} {"train_loss": -5.865399360656738, "global_step": 60035, "epoch": 1429} {"train_loss": -5.908866882324219, "global_step": 60036, "epoch": 1429} {"train_loss": -6.015764236450195, "global_step": 60037, "epoch": 1429} {"train_loss": -5.886210918426514, "global_step": 60038, "epoch": 1429} {"train_loss": -5.976019859313965, "global_step": 60039, "epoch": 1429} {"train_loss": -5.940300464630127, "global_step": 60040, "epoch": 1429} {"train_loss": -5.9865641593933105, "global_step": 60041, "epoch": 1429} {"train_loss": -5.783267021179199, "global_step": 60042, "epoch": 1429} {"train_loss": -5.723960876464844, "global_step": 60043, "epoch": 1429} {"train_loss": -5.892453193664551, "global_step": 60044, "epoch": 1429} {"train_loss": -5.9461750984191895, "global_step": 60045, "epoch": 1429} {"train_loss": -5.862586975097656, "global_step": 60046, "epoch": 1429} {"train_loss": -5.938924789428711, "global_step": 60047, "epoch": 1429} {"train_loss": -5.860498428344727, "global_step": 60048, "epoch": 1429} {"train_loss": -5.842918395996094, "global_step": 60049, "epoch": 1429} {"train_loss": -6.005417823791504, "global_step": 60050, "epoch": 1429} {"train_loss": -5.979174613952637, "global_step": 60051, "epoch": 1429} {"train_loss": -5.853612899780273, "global_step": 60052, "epoch": 1429} {"train_loss": -5.974348068237305, "global_step": 60053, "epoch": 1429} {"train_loss": -5.856695175170898, "global_step": 60054, "epoch": 1429} {"train_loss": -5.840282440185547, "global_step": 60055, "epoch": 1429} {"train_loss": -5.789370536804199, "global_step": 60056, "epoch": 1429} {"train_loss": -5.978946685791016, "global_step": 60057, "epoch": 1429} {"train_loss": -5.90531587600708, "global_step": 60058, "epoch": 1429} {"train_loss": -5.91088080406189, "global_step": 60059, "epoch": 1429, "val_loss": 66644.6953125} {"train_loss": -5.8962507247924805, "global_step": 60060, "epoch": 1430} {"train_loss": -5.969461917877197, "global_step": 60061, "epoch": 1430} {"train_loss": -5.975961685180664, "global_step": 60062, "epoch": 1430} {"train_loss": -5.866863250732422, "global_step": 60063, "epoch": 1430} {"train_loss": -5.969649314880371, "global_step": 60064, "epoch": 1430} {"train_loss": -5.830897331237793, "global_step": 60065, "epoch": 1430} {"train_loss": -5.919730186462402, "global_step": 60066, "epoch": 1430} {"train_loss": -5.862246036529541, "global_step": 60067, "epoch": 1430} {"train_loss": -5.836425304412842, "global_step": 60068, "epoch": 1430} {"train_loss": -5.982702255249023, "global_step": 60069, "epoch": 1430} {"train_loss": -5.927914619445801, "global_step": 60070, "epoch": 1430} {"train_loss": -5.840089797973633, "global_step": 60071, "epoch": 1430} {"train_loss": -5.8715500831604, "global_step": 60072, "epoch": 1430} {"train_loss": -5.948328971862793, "global_step": 60073, "epoch": 1430} {"train_loss": -5.834937572479248, "global_step": 60074, "epoch": 1430} {"train_loss": -5.842862129211426, "global_step": 60075, "epoch": 1430} {"train_loss": -5.9424238204956055, "global_step": 60076, "epoch": 1430} {"train_loss": -5.823282718658447, "global_step": 60077, "epoch": 1430} {"train_loss": -5.822162628173828, "global_step": 60078, "epoch": 1430} {"train_loss": -5.778522491455078, "global_step": 60079, "epoch": 1430} {"train_loss": -5.960089683532715, "global_step": 60080, "epoch": 1430} {"train_loss": -5.781622886657715, "global_step": 60081, "epoch": 1430} {"train_loss": -5.971414566040039, "global_step": 60082, "epoch": 1430} {"train_loss": -5.8168792724609375, "global_step": 60083, "epoch": 1430} {"train_loss": -6.008190155029297, "global_step": 60084, "epoch": 1430} {"train_loss": -5.937502384185791, "global_step": 60085, "epoch": 1430} {"train_loss": -5.920129776000977, "global_step": 60086, "epoch": 1430} {"train_loss": -5.838243007659912, "global_step": 60087, "epoch": 1430} {"train_loss": -5.9853715896606445, "global_step": 60088, "epoch": 1430} {"train_loss": -5.869816780090332, "global_step": 60089, "epoch": 1430} {"train_loss": -5.943953514099121, "global_step": 60090, "epoch": 1430} {"train_loss": -5.892580032348633, "global_step": 60091, "epoch": 1430} {"train_loss": -5.894724369049072, "global_step": 60092, "epoch": 1430} {"train_loss": -5.914429664611816, "global_step": 60093, "epoch": 1430} {"train_loss": -5.809700012207031, "global_step": 60094, "epoch": 1430} {"train_loss": -5.9360198974609375, "global_step": 60095, "epoch": 1430} {"train_loss": -5.765628814697266, "global_step": 60096, "epoch": 1430} {"train_loss": -5.912406921386719, "global_step": 60097, "epoch": 1430} {"train_loss": -5.920945644378662, "global_step": 60098, "epoch": 1430} {"train_loss": -5.94024133682251, "global_step": 60099, "epoch": 1430} {"train_loss": -5.759958744049072, "global_step": 60100, "epoch": 1430} {"train_loss": -5.894405069805327, "global_step": 60101, "epoch": 1430, "val_loss": 66658.578125} {"train_loss": -5.944093704223633, "global_step": 60102, "epoch": 1431} {"train_loss": -5.920876502990723, "global_step": 60103, "epoch": 1431} {"train_loss": -5.753778457641602, "global_step": 60104, "epoch": 1431} {"train_loss": -5.88304328918457, "global_step": 60105, "epoch": 1431} {"train_loss": -5.858009338378906, "global_step": 60106, "epoch": 1431} {"train_loss": -5.858515739440918, "global_step": 60107, "epoch": 1431} {"train_loss": -5.721266746520996, "global_step": 60108, "epoch": 1431} {"train_loss": -5.850735187530518, "global_step": 60109, "epoch": 1431} {"train_loss": -6.026491165161133, "global_step": 60110, "epoch": 1431} {"train_loss": -5.8789873123168945, "global_step": 60111, "epoch": 1431} {"train_loss": -5.857992649078369, "global_step": 60112, "epoch": 1431} {"train_loss": -5.77977180480957, "global_step": 60113, "epoch": 1431} {"train_loss": -5.925350189208984, "global_step": 60114, "epoch": 1431} {"train_loss": -5.918135643005371, "global_step": 60115, "epoch": 1431} {"train_loss": -5.824044227600098, "global_step": 60116, "epoch": 1431} {"train_loss": -5.9807844161987305, "global_step": 60117, "epoch": 1431} {"train_loss": -5.966002464294434, "global_step": 60118, "epoch": 1431} {"train_loss": -5.937605381011963, "global_step": 60119, "epoch": 1431} {"train_loss": -5.875247955322266, "global_step": 60120, "epoch": 1431} {"train_loss": -5.955018997192383, "global_step": 60121, "epoch": 1431} {"train_loss": -5.926214218139648, "global_step": 60122, "epoch": 1431} {"train_loss": -5.8588948249816895, "global_step": 60123, "epoch": 1431} {"train_loss": -5.988384246826172, "global_step": 60124, "epoch": 1431} {"train_loss": -5.837145805358887, "global_step": 60125, "epoch": 1431} {"train_loss": -5.790114402770996, "global_step": 60126, "epoch": 1431} {"train_loss": -5.932229042053223, "global_step": 60127, "epoch": 1431} {"train_loss": -5.931660175323486, "global_step": 60128, "epoch": 1431} {"train_loss": -5.752361297607422, "global_step": 60129, "epoch": 1431} {"train_loss": -5.880192756652832, "global_step": 60130, "epoch": 1431} {"train_loss": -5.951668739318848, "global_step": 60131, "epoch": 1431} {"train_loss": -5.770753860473633, "global_step": 60132, "epoch": 1431} {"train_loss": -5.848079681396484, "global_step": 60133, "epoch": 1431} {"train_loss": -5.645390033721924, "global_step": 60134, "epoch": 1431} {"train_loss": -5.847363471984863, "global_step": 60135, "epoch": 1431} {"train_loss": -5.932474136352539, "global_step": 60136, "epoch": 1431} {"train_loss": -5.958105087280273, "global_step": 60137, "epoch": 1431} {"train_loss": -5.852624893188477, "global_step": 60138, "epoch": 1431} {"train_loss": -5.720411777496338, "global_step": 60139, "epoch": 1431} {"train_loss": -5.711380481719971, "global_step": 60140, "epoch": 1431} {"train_loss": -5.933506965637207, "global_step": 60141, "epoch": 1431} {"train_loss": -5.927510738372803, "global_step": 60142, "epoch": 1431} {"train_loss": -5.872171174912226, "global_step": 60143, "epoch": 1431, "val_loss": 66680.0859375} {"train_loss": -5.892176628112793, "global_step": 60144, "epoch": 1432} {"train_loss": -5.984936714172363, "global_step": 60145, "epoch": 1432} {"train_loss": -5.880873203277588, "global_step": 60146, "epoch": 1432} {"train_loss": -5.876106262207031, "global_step": 60147, "epoch": 1432} {"train_loss": -5.922342300415039, "global_step": 60148, "epoch": 1432} {"train_loss": -5.751118183135986, "global_step": 60149, "epoch": 1432} {"train_loss": -5.892472267150879, "global_step": 60150, "epoch": 1432} {"train_loss": -5.855160236358643, "global_step": 60151, "epoch": 1432} {"train_loss": -5.818723201751709, "global_step": 60152, "epoch": 1432} {"train_loss": -5.7994914054870605, "global_step": 60153, "epoch": 1432} {"train_loss": -5.963832855224609, "global_step": 60154, "epoch": 1432} {"train_loss": -5.863722324371338, "global_step": 60155, "epoch": 1432} {"train_loss": -5.963614463806152, "global_step": 60156, "epoch": 1432} {"train_loss": -5.858299255371094, "global_step": 60157, "epoch": 1432} {"train_loss": -5.927238464355469, "global_step": 60158, "epoch": 1432} {"train_loss": -5.872927665710449, "global_step": 60159, "epoch": 1432} {"train_loss": -5.993388652801514, "global_step": 60160, "epoch": 1432} {"train_loss": -5.9108099937438965, "global_step": 60161, "epoch": 1432} {"train_loss": -5.825735092163086, "global_step": 60162, "epoch": 1432} {"train_loss": -5.90346622467041, "global_step": 60163, "epoch": 1432} {"train_loss": -5.785924911499023, "global_step": 60164, "epoch": 1432} {"train_loss": -5.879039287567139, "global_step": 60165, "epoch": 1432} {"train_loss": -5.8187150955200195, "global_step": 60166, "epoch": 1432} {"train_loss": -5.832832336425781, "global_step": 60167, "epoch": 1432} {"train_loss": -5.847756385803223, "global_step": 60168, "epoch": 1432} {"train_loss": -5.9173479080200195, "global_step": 60169, "epoch": 1432} {"train_loss": -5.921538352966309, "global_step": 60170, "epoch": 1432} {"train_loss": -5.853959083557129, "global_step": 60171, "epoch": 1432} {"train_loss": -5.869159698486328, "global_step": 60172, "epoch": 1432} {"train_loss": -5.854060173034668, "global_step": 60173, "epoch": 1432} {"train_loss": -5.842106819152832, "global_step": 60174, "epoch": 1432} {"train_loss": -5.915953159332275, "global_step": 60175, "epoch": 1432} {"train_loss": -6.034643173217773, "global_step": 60176, "epoch": 1432} {"train_loss": -5.75316047668457, "global_step": 60177, "epoch": 1432} {"train_loss": -5.874684810638428, "global_step": 60178, "epoch": 1432} {"train_loss": -5.909148216247559, "global_step": 60179, "epoch": 1432} {"train_loss": -5.9371209144592285, "global_step": 60180, "epoch": 1432} {"train_loss": -5.768200397491455, "global_step": 60181, "epoch": 1432} {"train_loss": -5.923530578613281, "global_step": 60182, "epoch": 1432} {"train_loss": -5.9300336837768555, "global_step": 60183, "epoch": 1432} {"train_loss": -5.8787336349487305, "global_step": 60184, "epoch": 1432} {"train_loss": -5.881623915263584, "global_step": 60185, "epoch": 1432, "val_loss": 66859.984375} {"train_loss": -5.859367847442627, "global_step": 60186, "epoch": 1433} {"train_loss": -5.893584251403809, "global_step": 60187, "epoch": 1433} {"train_loss": -5.960083484649658, "global_step": 60188, "epoch": 1433} {"train_loss": -5.906048774719238, "global_step": 60189, "epoch": 1433} {"train_loss": -5.880306243896484, "global_step": 60190, "epoch": 1433} {"train_loss": -6.094777584075928, "global_step": 60191, "epoch": 1433} {"train_loss": -5.880923271179199, "global_step": 60192, "epoch": 1433} {"train_loss": -5.967280387878418, "global_step": 60193, "epoch": 1433} {"train_loss": -5.90158748626709, "global_step": 60194, "epoch": 1433} {"train_loss": -5.940228462219238, "global_step": 60195, "epoch": 1433} {"train_loss": -5.974560737609863, "global_step": 60196, "epoch": 1433} {"train_loss": -5.9891862869262695, "global_step": 60197, "epoch": 1433} {"train_loss": -5.909319877624512, "global_step": 60198, "epoch": 1433} {"train_loss": -5.879085540771484, "global_step": 60199, "epoch": 1433} {"train_loss": -5.829338073730469, "global_step": 60200, "epoch": 1433} {"train_loss": -5.998222827911377, "global_step": 60201, "epoch": 1433} {"train_loss": -5.811648368835449, "global_step": 60202, "epoch": 1433} {"train_loss": -5.823831558227539, "global_step": 60203, "epoch": 1433} {"train_loss": -5.9280500411987305, "global_step": 60204, "epoch": 1433} {"train_loss": -6.012024879455566, "global_step": 60205, "epoch": 1433} {"train_loss": -5.888278961181641, "global_step": 60206, "epoch": 1433} {"train_loss": -5.9907660484313965, "global_step": 60207, "epoch": 1433} {"train_loss": -5.815176010131836, "global_step": 60208, "epoch": 1433} {"train_loss": -5.903690814971924, "global_step": 60209, "epoch": 1433} {"train_loss": -6.062038421630859, "global_step": 60210, "epoch": 1433} {"train_loss": -5.924460411071777, "global_step": 60211, "epoch": 1433} {"train_loss": -6.018105506896973, "global_step": 60212, "epoch": 1433} {"train_loss": -5.8186140060424805, "global_step": 60213, "epoch": 1433} {"train_loss": -5.876830101013184, "global_step": 60214, "epoch": 1433} {"train_loss": -5.905622482299805, "global_step": 60215, "epoch": 1433} {"train_loss": -5.8469672203063965, "global_step": 60216, "epoch": 1433} {"train_loss": -5.899202346801758, "global_step": 60217, "epoch": 1433} {"train_loss": -5.992840766906738, "global_step": 60218, "epoch": 1433} {"train_loss": -5.744815349578857, "global_step": 60219, "epoch": 1433} {"train_loss": -5.842400550842285, "global_step": 60220, "epoch": 1433} {"train_loss": -5.919106483459473, "global_step": 60221, "epoch": 1433} {"train_loss": -5.881015300750732, "global_step": 60222, "epoch": 1433} {"train_loss": -5.885288238525391, "global_step": 60223, "epoch": 1433} {"train_loss": -5.8998870849609375, "global_step": 60224, "epoch": 1433} {"train_loss": -5.801135540008545, "global_step": 60225, "epoch": 1433} {"train_loss": -5.862492561340332, "global_step": 60226, "epoch": 1433} {"train_loss": -5.905650479452951, "global_step": 60227, "epoch": 1433, "val_loss": 66647.9453125} {"train_loss": -5.890577793121338, "global_step": 60228, "epoch": 1434} {"train_loss": -5.85661506652832, "global_step": 60229, "epoch": 1434} {"train_loss": -5.97529411315918, "global_step": 60230, "epoch": 1434} {"train_loss": -5.773504257202148, "global_step": 60231, "epoch": 1434} {"train_loss": -5.912567138671875, "global_step": 60232, "epoch": 1434} {"train_loss": -5.934314250946045, "global_step": 60233, "epoch": 1434} {"train_loss": -5.899288177490234, "global_step": 60234, "epoch": 1434} {"train_loss": -5.939709663391113, "global_step": 60235, "epoch": 1434} {"train_loss": -5.973293304443359, "global_step": 60236, "epoch": 1434} {"train_loss": -5.8492841720581055, "global_step": 60237, "epoch": 1434} {"train_loss": -5.923625946044922, "global_step": 60238, "epoch": 1434} {"train_loss": -5.87726354598999, "global_step": 60239, "epoch": 1434} {"train_loss": -5.764902114868164, "global_step": 60240, "epoch": 1434} {"train_loss": -5.795079231262207, "global_step": 60241, "epoch": 1434} {"train_loss": -5.744329929351807, "global_step": 60242, "epoch": 1434} {"train_loss": -5.647463321685791, "global_step": 60243, "epoch": 1434} {"train_loss": -5.951265811920166, "global_step": 60244, "epoch": 1434} {"train_loss": -5.87531852722168, "global_step": 60245, "epoch": 1434} {"train_loss": -5.923879146575928, "global_step": 60246, "epoch": 1434} {"train_loss": -5.873493194580078, "global_step": 60247, "epoch": 1434} {"train_loss": -5.877423286437988, "global_step": 60248, "epoch": 1434} {"train_loss": -5.91335916519165, "global_step": 60249, "epoch": 1434} {"train_loss": -5.961053848266602, "global_step": 60250, "epoch": 1434} {"train_loss": -5.954490661621094, "global_step": 60251, "epoch": 1434} {"train_loss": -5.774449348449707, "global_step": 60252, "epoch": 1434} {"train_loss": -5.894110679626465, "global_step": 60253, "epoch": 1434} {"train_loss": -5.924012184143066, "global_step": 60254, "epoch": 1434} {"train_loss": -5.837430000305176, "global_step": 60255, "epoch": 1434} {"train_loss": -5.9494757652282715, "global_step": 60256, "epoch": 1434} {"train_loss": -5.758779525756836, "global_step": 60257, "epoch": 1434} {"train_loss": -5.839399337768555, "global_step": 60258, "epoch": 1434} {"train_loss": -5.900540351867676, "global_step": 60259, "epoch": 1434} {"train_loss": -5.801731109619141, "global_step": 60260, "epoch": 1434} {"train_loss": -5.9300432205200195, "global_step": 60261, "epoch": 1434} {"train_loss": -5.756751537322998, "global_step": 60262, "epoch": 1434} {"train_loss": -5.971291542053223, "global_step": 60263, "epoch": 1434} {"train_loss": -5.936861991882324, "global_step": 60264, "epoch": 1434} {"train_loss": -5.862501621246338, "global_step": 60265, "epoch": 1434} {"train_loss": -5.781558990478516, "global_step": 60266, "epoch": 1434} {"train_loss": -5.907575607299805, "global_step": 60267, "epoch": 1434} {"train_loss": -5.802002906799316, "global_step": 60268, "epoch": 1434} {"train_loss": -5.870434329623268, "global_step": 60269, "epoch": 1434, "val_loss": 66635.390625} {"train_loss": -5.934210777282715, "global_step": 60270, "epoch": 1435} {"train_loss": -5.878549575805664, "global_step": 60271, "epoch": 1435} {"train_loss": -5.922840118408203, "global_step": 60272, "epoch": 1435} {"train_loss": -5.804704666137695, "global_step": 60273, "epoch": 1435} {"train_loss": -5.869025230407715, "global_step": 60274, "epoch": 1435} {"train_loss": -5.856965065002441, "global_step": 60275, "epoch": 1435} {"train_loss": -5.918429851531982, "global_step": 60276, "epoch": 1435} {"train_loss": -5.825517177581787, "global_step": 60277, "epoch": 1435} {"train_loss": -5.750136852264404, "global_step": 60278, "epoch": 1435} {"train_loss": -5.82958459854126, "global_step": 60279, "epoch": 1435} {"train_loss": -6.001028060913086, "global_step": 60280, "epoch": 1435} {"train_loss": -5.802801132202148, "global_step": 60281, "epoch": 1435} {"train_loss": -5.813754081726074, "global_step": 60282, "epoch": 1435} {"train_loss": -5.842595100402832, "global_step": 60283, "epoch": 1435} {"train_loss": -5.863214015960693, "global_step": 60284, "epoch": 1435} {"train_loss": -5.8396830558776855, "global_step": 60285, "epoch": 1435} {"train_loss": -5.7781877517700195, "global_step": 60286, "epoch": 1435} {"train_loss": -5.89697790145874, "global_step": 60287, "epoch": 1435} {"train_loss": -5.902109146118164, "global_step": 60288, "epoch": 1435} {"train_loss": -5.792325019836426, "global_step": 60289, "epoch": 1435} {"train_loss": -5.9932074546813965, "global_step": 60290, "epoch": 1435} {"train_loss": -5.861252784729004, "global_step": 60291, "epoch": 1435} {"train_loss": -5.855259895324707, "global_step": 60292, "epoch": 1435} {"train_loss": -5.847683906555176, "global_step": 60293, "epoch": 1435} {"train_loss": -5.897765159606934, "global_step": 60294, "epoch": 1435} {"train_loss": -5.871408462524414, "global_step": 60295, "epoch": 1435} {"train_loss": -5.7480669021606445, "global_step": 60296, "epoch": 1435} {"train_loss": -5.903510093688965, "global_step": 60297, "epoch": 1435} {"train_loss": -5.83474063873291, "global_step": 60298, "epoch": 1435} {"train_loss": -5.781575679779053, "global_step": 60299, "epoch": 1435} {"train_loss": -5.848331928253174, "global_step": 60300, "epoch": 1435} {"train_loss": -5.79286003112793, "global_step": 60301, "epoch": 1435} {"train_loss": -5.908430099487305, "global_step": 60302, "epoch": 1435} {"train_loss": -5.671124458312988, "global_step": 60303, "epoch": 1435} {"train_loss": -5.68634033203125, "global_step": 60304, "epoch": 1435} {"train_loss": -5.905688285827637, "global_step": 60305, "epoch": 1435} {"train_loss": -5.710622787475586, "global_step": 60306, "epoch": 1435} {"train_loss": -5.763709545135498, "global_step": 60307, "epoch": 1435} {"train_loss": -5.824437141418457, "global_step": 60308, "epoch": 1435} {"train_loss": -5.80958366394043, "global_step": 60309, "epoch": 1435} {"train_loss": -5.960172176361084, "global_step": 60310, "epoch": 1435} {"train_loss": -5.843263512565976, "global_step": 60311, "epoch": 1435, "val_loss": 67011.2421875} {"train_loss": -5.844388961791992, "global_step": 60312, "epoch": 1436} {"train_loss": -5.813981056213379, "global_step": 60313, "epoch": 1436} {"train_loss": -5.939011096954346, "global_step": 60314, "epoch": 1436} {"train_loss": -5.808963775634766, "global_step": 60315, "epoch": 1436} {"train_loss": -5.876513957977295, "global_step": 60316, "epoch": 1436} {"train_loss": -5.860952854156494, "global_step": 60317, "epoch": 1436} {"train_loss": -5.845038890838623, "global_step": 60318, "epoch": 1436} {"train_loss": -5.855157852172852, "global_step": 60319, "epoch": 1436} {"train_loss": -5.871492385864258, "global_step": 60320, "epoch": 1436} {"train_loss": -5.784243583679199, "global_step": 60321, "epoch": 1436} {"train_loss": -5.841948509216309, "global_step": 60322, "epoch": 1436} {"train_loss": -5.824054718017578, "global_step": 60323, "epoch": 1436} {"train_loss": -5.813758850097656, "global_step": 60324, "epoch": 1436} {"train_loss": -5.889247417449951, "global_step": 60325, "epoch": 1436} {"train_loss": -6.016791343688965, "global_step": 60326, "epoch": 1436} {"train_loss": -5.957528114318848, "global_step": 60327, "epoch": 1436} {"train_loss": -5.926019191741943, "global_step": 60328, "epoch": 1436} {"train_loss": -5.916342258453369, "global_step": 60329, "epoch": 1436} {"train_loss": -5.820958137512207, "global_step": 60330, "epoch": 1436} {"train_loss": -5.977534770965576, "global_step": 60331, "epoch": 1436} {"train_loss": -5.9686479568481445, "global_step": 60332, "epoch": 1436} {"train_loss": -5.920156478881836, "global_step": 60333, "epoch": 1436} {"train_loss": -5.885721206665039, "global_step": 60334, "epoch": 1436} {"train_loss": -5.833857536315918, "global_step": 60335, "epoch": 1436} {"train_loss": -5.877742767333984, "global_step": 60336, "epoch": 1436} {"train_loss": -5.923327445983887, "global_step": 60337, "epoch": 1436} {"train_loss": -5.959900856018066, "global_step": 60338, "epoch": 1436} {"train_loss": -5.921849727630615, "global_step": 60339, "epoch": 1436} {"train_loss": -5.898270130157471, "global_step": 60340, "epoch": 1436} {"train_loss": -5.966909885406494, "global_step": 60341, "epoch": 1436} {"train_loss": -5.909909248352051, "global_step": 60342, "epoch": 1436} {"train_loss": -5.823190689086914, "global_step": 60343, "epoch": 1436} {"train_loss": -5.898575305938721, "global_step": 60344, "epoch": 1436} {"train_loss": -5.96963357925415, "global_step": 60345, "epoch": 1436} {"train_loss": -5.916315078735352, "global_step": 60346, "epoch": 1436} {"train_loss": -5.758453369140625, "global_step": 60347, "epoch": 1436} {"train_loss": -5.97997522354126, "global_step": 60348, "epoch": 1436} {"train_loss": -5.912539482116699, "global_step": 60349, "epoch": 1436} {"train_loss": -5.9318132400512695, "global_step": 60350, "epoch": 1436} {"train_loss": -5.8096771240234375, "global_step": 60351, "epoch": 1436} {"train_loss": -5.852214813232422, "global_step": 60352, "epoch": 1436} {"train_loss": -5.888060399464199, "global_step": 60353, "epoch": 1436, "val_loss": 66730.359375} {"train_loss": -5.998016357421875, "global_step": 60354, "epoch": 1437} {"train_loss": -5.9150896072387695, "global_step": 60355, "epoch": 1437} {"train_loss": -5.7666826248168945, "global_step": 60356, "epoch": 1437} {"train_loss": -5.936445713043213, "global_step": 60357, "epoch": 1437} {"train_loss": -5.902844429016113, "global_step": 60358, "epoch": 1437} {"train_loss": -5.923890113830566, "global_step": 60359, "epoch": 1437} {"train_loss": -5.942558765411377, "global_step": 60360, "epoch": 1437} {"train_loss": -5.899060249328613, "global_step": 60361, "epoch": 1437} {"train_loss": -5.886468887329102, "global_step": 60362, "epoch": 1437} {"train_loss": -5.89138126373291, "global_step": 60363, "epoch": 1437} {"train_loss": -5.930668830871582, "global_step": 60364, "epoch": 1437} {"train_loss": -6.006924629211426, "global_step": 60365, "epoch": 1437} {"train_loss": -5.825112819671631, "global_step": 60366, "epoch": 1437} {"train_loss": -5.877321243286133, "global_step": 60367, "epoch": 1437} {"train_loss": -5.938176155090332, "global_step": 60368, "epoch": 1437} {"train_loss": -5.905702590942383, "global_step": 60369, "epoch": 1437} {"train_loss": -5.943519592285156, "global_step": 60370, "epoch": 1437} {"train_loss": -5.918585300445557, "global_step": 60371, "epoch": 1437} {"train_loss": -5.970836639404297, "global_step": 60372, "epoch": 1437} {"train_loss": -5.922695159912109, "global_step": 60373, "epoch": 1437} {"train_loss": -6.003687858581543, "global_step": 60374, "epoch": 1437} {"train_loss": -5.838750839233398, "global_step": 60375, "epoch": 1437} {"train_loss": -5.97601318359375, "global_step": 60376, "epoch": 1437} {"train_loss": -5.952049255371094, "global_step": 60377, "epoch": 1437} {"train_loss": -5.865172386169434, "global_step": 60378, "epoch": 1437} {"train_loss": -5.9288787841796875, "global_step": 60379, "epoch": 1437} {"train_loss": -6.024592399597168, "global_step": 60380, "epoch": 1437} {"train_loss": -5.8327317237854, "global_step": 60381, "epoch": 1437} {"train_loss": -5.789741516113281, "global_step": 60382, "epoch": 1437} {"train_loss": -5.9055681228637695, "global_step": 60383, "epoch": 1437} {"train_loss": -6.008002281188965, "global_step": 60384, "epoch": 1437} {"train_loss": -5.900071144104004, "global_step": 60385, "epoch": 1437} {"train_loss": -5.839678764343262, "global_step": 60386, "epoch": 1437} {"train_loss": -5.825894832611084, "global_step": 60387, "epoch": 1437} {"train_loss": -5.8665452003479, "global_step": 60388, "epoch": 1437} {"train_loss": -5.939385414123535, "global_step": 60389, "epoch": 1437} {"train_loss": -5.973511695861816, "global_step": 60390, "epoch": 1437} {"train_loss": -5.908436298370361, "global_step": 60391, "epoch": 1437} {"train_loss": -5.910031318664551, "global_step": 60392, "epoch": 1437} {"train_loss": -5.8122968673706055, "global_step": 60393, "epoch": 1437} {"train_loss": -5.835495948791504, "global_step": 60394, "epoch": 1437} {"train_loss": -5.905691373915899, "global_step": 60395, "epoch": 1437, "val_loss": 66723.3046875} {"train_loss": -5.877215385437012, "global_step": 60396, "epoch": 1438} {"train_loss": -5.951193809509277, "global_step": 60397, "epoch": 1438} {"train_loss": -5.857944011688232, "global_step": 60398, "epoch": 1438} {"train_loss": -5.798428535461426, "global_step": 60399, "epoch": 1438} {"train_loss": -5.9185943603515625, "global_step": 60400, "epoch": 1438} {"train_loss": -5.80153751373291, "global_step": 60401, "epoch": 1438} {"train_loss": -5.865751266479492, "global_step": 60402, "epoch": 1438} {"train_loss": -5.912708282470703, "global_step": 60403, "epoch": 1438} {"train_loss": -5.857292652130127, "global_step": 60404, "epoch": 1438} {"train_loss": -6.014752388000488, "global_step": 60405, "epoch": 1438} {"train_loss": -6.060121536254883, "global_step": 60406, "epoch": 1438} {"train_loss": -5.856803894042969, "global_step": 60407, "epoch": 1438} {"train_loss": -5.922873497009277, "global_step": 60408, "epoch": 1438} {"train_loss": -5.904823303222656, "global_step": 60409, "epoch": 1438} {"train_loss": -5.910083770751953, "global_step": 60410, "epoch": 1438} {"train_loss": -5.905570983886719, "global_step": 60411, "epoch": 1438} {"train_loss": -5.7878265380859375, "global_step": 60412, "epoch": 1438} {"train_loss": -5.905463695526123, "global_step": 60413, "epoch": 1438} {"train_loss": -5.911701202392578, "global_step": 60414, "epoch": 1438} {"train_loss": -5.950629711151123, "global_step": 60415, "epoch": 1438} {"train_loss": -6.010954856872559, "global_step": 60416, "epoch": 1438} {"train_loss": -5.7589006423950195, "global_step": 60417, "epoch": 1438} {"train_loss": -5.930606842041016, "global_step": 60418, "epoch": 1438} {"train_loss": -5.759257793426514, "global_step": 60419, "epoch": 1438} {"train_loss": -5.845767974853516, "global_step": 60420, "epoch": 1438} {"train_loss": -5.869177341461182, "global_step": 60421, "epoch": 1438} {"train_loss": -5.825456619262695, "global_step": 60422, "epoch": 1438} {"train_loss": -5.859437942504883, "global_step": 60423, "epoch": 1438} {"train_loss": -5.8541646003723145, "global_step": 60424, "epoch": 1438} {"train_loss": -5.892358779907227, "global_step": 60425, "epoch": 1438} {"train_loss": -5.837582588195801, "global_step": 60426, "epoch": 1438} {"train_loss": -5.918001174926758, "global_step": 60427, "epoch": 1438} {"train_loss": -5.817831039428711, "global_step": 60428, "epoch": 1438} {"train_loss": -5.727838516235352, "global_step": 60429, "epoch": 1438} {"train_loss": -5.8729166984558105, "global_step": 60430, "epoch": 1438} {"train_loss": -5.921723365783691, "global_step": 60431, "epoch": 1438} {"train_loss": -5.827946662902832, "global_step": 60432, "epoch": 1438} {"train_loss": -5.934786796569824, "global_step": 60433, "epoch": 1438} {"train_loss": -5.962442398071289, "global_step": 60434, "epoch": 1438} {"train_loss": -5.887563705444336, "global_step": 60435, "epoch": 1438} {"train_loss": -5.896121501922607, "global_step": 60436, "epoch": 1438} {"train_loss": -5.885017894563221, "global_step": 60437, "epoch": 1438, "val_loss": 66653.1640625} {"train_loss": -5.971253395080566, "global_step": 60438, "epoch": 1439} {"train_loss": -5.898687362670898, "global_step": 60439, "epoch": 1439} {"train_loss": -5.764255523681641, "global_step": 60440, "epoch": 1439} {"train_loss": -5.887155055999756, "global_step": 60441, "epoch": 1439} {"train_loss": -5.797670364379883, "global_step": 60442, "epoch": 1439} {"train_loss": -5.902749061584473, "global_step": 60443, "epoch": 1439} {"train_loss": -5.8785200119018555, "global_step": 60444, "epoch": 1439} {"train_loss": -5.941215991973877, "global_step": 60445, "epoch": 1439} {"train_loss": -5.93161153793335, "global_step": 60446, "epoch": 1439} {"train_loss": -5.903000831604004, "global_step": 60447, "epoch": 1439} {"train_loss": -5.834346771240234, "global_step": 60448, "epoch": 1439} {"train_loss": -5.898561477661133, "global_step": 60449, "epoch": 1439} {"train_loss": -5.8823652267456055, "global_step": 60450, "epoch": 1439} {"train_loss": -5.984206199645996, "global_step": 60451, "epoch": 1439} {"train_loss": -5.9777445793151855, "global_step": 60452, "epoch": 1439} {"train_loss": -5.721638202667236, "global_step": 60453, "epoch": 1439} {"train_loss": -5.930525779724121, "global_step": 60454, "epoch": 1439} {"train_loss": -5.903599262237549, "global_step": 60455, "epoch": 1439} {"train_loss": -5.89974308013916, "global_step": 60456, "epoch": 1439} {"train_loss": -5.874032020568848, "global_step": 60457, "epoch": 1439} {"train_loss": -5.873553276062012, "global_step": 60458, "epoch": 1439} {"train_loss": -5.907770156860352, "global_step": 60459, "epoch": 1439} {"train_loss": -5.881630897521973, "global_step": 60460, "epoch": 1439} {"train_loss": -5.8923492431640625, "global_step": 60461, "epoch": 1439} {"train_loss": -5.8162522315979, "global_step": 60462, "epoch": 1439} {"train_loss": -5.834373474121094, "global_step": 60463, "epoch": 1439} {"train_loss": -5.971526145935059, "global_step": 60464, "epoch": 1439} {"train_loss": -5.932877063751221, "global_step": 60465, "epoch": 1439} {"train_loss": -5.902771949768066, "global_step": 60466, "epoch": 1439} {"train_loss": -5.875359535217285, "global_step": 60467, "epoch": 1439} {"train_loss": -5.88462495803833, "global_step": 60468, "epoch": 1439} {"train_loss": -5.92432975769043, "global_step": 60469, "epoch": 1439} {"train_loss": -5.9720458984375, "global_step": 60470, "epoch": 1439} {"train_loss": -5.90647029876709, "global_step": 60471, "epoch": 1439} {"train_loss": -5.888995170593262, "global_step": 60472, "epoch": 1439} {"train_loss": -5.864853858947754, "global_step": 60473, "epoch": 1439} {"train_loss": -5.98239803314209, "global_step": 60474, "epoch": 1439} {"train_loss": -5.935502529144287, "global_step": 60475, "epoch": 1439} {"train_loss": -5.857499599456787, "global_step": 60476, "epoch": 1439} {"train_loss": -5.904975891113281, "global_step": 60477, "epoch": 1439} {"train_loss": -5.983808517456055, "global_step": 60478, "epoch": 1439} {"train_loss": -5.892186505453927, "global_step": 60479, "epoch": 1439, "val_loss": 66709.4375} {"train_loss": -5.940705299377441, "global_step": 60480, "epoch": 1440} {"train_loss": -5.885807991027832, "global_step": 60481, "epoch": 1440} {"train_loss": -5.890049934387207, "global_step": 60482, "epoch": 1440} {"train_loss": -5.878155708312988, "global_step": 60483, "epoch": 1440} {"train_loss": -5.897818565368652, "global_step": 60484, "epoch": 1440} {"train_loss": -5.827374458312988, "global_step": 60485, "epoch": 1440} {"train_loss": -5.967432498931885, "global_step": 60486, "epoch": 1440} {"train_loss": -5.900778293609619, "global_step": 60487, "epoch": 1440} {"train_loss": -5.865510940551758, "global_step": 60488, "epoch": 1440} {"train_loss": -5.9320526123046875, "global_step": 60489, "epoch": 1440} {"train_loss": -5.905378818511963, "global_step": 60490, "epoch": 1440} {"train_loss": -6.064833164215088, "global_step": 60491, "epoch": 1440} {"train_loss": -5.864626407623291, "global_step": 60492, "epoch": 1440} {"train_loss": -5.937014579772949, "global_step": 60493, "epoch": 1440} {"train_loss": -5.905387878417969, "global_step": 60494, "epoch": 1440} {"train_loss": -5.870454788208008, "global_step": 60495, "epoch": 1440} {"train_loss": -5.975622177124023, "global_step": 60496, "epoch": 1440} {"train_loss": -5.976946830749512, "global_step": 60497, "epoch": 1440} {"train_loss": -5.901133060455322, "global_step": 60498, "epoch": 1440} {"train_loss": -5.808233261108398, "global_step": 60499, "epoch": 1440} {"train_loss": -5.918722629547119, "global_step": 60500, "epoch": 1440} {"train_loss": -5.880801200866699, "global_step": 60501, "epoch": 1440} {"train_loss": -5.915014266967773, "global_step": 60502, "epoch": 1440} {"train_loss": -5.792419910430908, "global_step": 60503, "epoch": 1440} {"train_loss": -5.722252368927002, "global_step": 60504, "epoch": 1440} {"train_loss": -5.942657470703125, "global_step": 60505, "epoch": 1440} {"train_loss": -5.888904571533203, "global_step": 60506, "epoch": 1440} {"train_loss": -5.871241569519043, "global_step": 60507, "epoch": 1440} {"train_loss": -5.929215431213379, "global_step": 60508, "epoch": 1440} {"train_loss": -5.883195877075195, "global_step": 60509, "epoch": 1440} {"train_loss": -5.786563396453857, "global_step": 60510, "epoch": 1440} {"train_loss": -5.862063884735107, "global_step": 60511, "epoch": 1440} {"train_loss": -5.90804386138916, "global_step": 60512, "epoch": 1440} {"train_loss": -5.82733678817749, "global_step": 60513, "epoch": 1440} {"train_loss": -5.863000869750977, "global_step": 60514, "epoch": 1440} {"train_loss": -5.900389671325684, "global_step": 60515, "epoch": 1440} {"train_loss": -5.918820858001709, "global_step": 60516, "epoch": 1440} {"train_loss": -5.931851387023926, "global_step": 60517, "epoch": 1440} {"train_loss": -5.795592308044434, "global_step": 60518, "epoch": 1440} {"train_loss": -5.8022613525390625, "global_step": 60519, "epoch": 1440} {"train_loss": -5.773068904876709, "global_step": 60520, "epoch": 1440} {"train_loss": -5.885380517868769, "global_step": 60521, "epoch": 1440, "val_loss": 67084.375} {"train_loss": -5.985246658325195, "global_step": 60522, "epoch": 1441} {"train_loss": -5.855468273162842, "global_step": 60523, "epoch": 1441} {"train_loss": -5.893725395202637, "global_step": 60524, "epoch": 1441} {"train_loss": -5.9039626121521, "global_step": 60525, "epoch": 1441} {"train_loss": -5.819789886474609, "global_step": 60526, "epoch": 1441} {"train_loss": -5.995838642120361, "global_step": 60527, "epoch": 1441} {"train_loss": -5.828919410705566, "global_step": 60528, "epoch": 1441} {"train_loss": -5.715671539306641, "global_step": 60529, "epoch": 1441} {"train_loss": -5.93162727355957, "global_step": 60530, "epoch": 1441} {"train_loss": -5.9464111328125, "global_step": 60531, "epoch": 1441} {"train_loss": -5.867832183837891, "global_step": 60532, "epoch": 1441} {"train_loss": -5.786884307861328, "global_step": 60533, "epoch": 1441} {"train_loss": -5.821258068084717, "global_step": 60534, "epoch": 1441} {"train_loss": -5.807119846343994, "global_step": 60535, "epoch": 1441} {"train_loss": -5.619088172912598, "global_step": 60536, "epoch": 1441} {"train_loss": -5.7915425300598145, "global_step": 60537, "epoch": 1441} {"train_loss": -5.927557945251465, "global_step": 60538, "epoch": 1441} {"train_loss": -5.8117265701293945, "global_step": 60539, "epoch": 1441} {"train_loss": -5.883114337921143, "global_step": 60540, "epoch": 1441} {"train_loss": -5.882359504699707, "global_step": 60541, "epoch": 1441} {"train_loss": -5.854757785797119, "global_step": 60542, "epoch": 1441} {"train_loss": -5.975771903991699, "global_step": 60543, "epoch": 1441} {"train_loss": -5.746757984161377, "global_step": 60544, "epoch": 1441} {"train_loss": -5.858392238616943, "global_step": 60545, "epoch": 1441} {"train_loss": -5.876440048217773, "global_step": 60546, "epoch": 1441} {"train_loss": -5.751834869384766, "global_step": 60547, "epoch": 1441} {"train_loss": -5.938076019287109, "global_step": 60548, "epoch": 1441} {"train_loss": -5.7554168701171875, "global_step": 60549, "epoch": 1441} {"train_loss": -5.875271797180176, "global_step": 60550, "epoch": 1441} {"train_loss": -5.940169334411621, "global_step": 60551, "epoch": 1441} {"train_loss": -5.945225715637207, "global_step": 60552, "epoch": 1441} {"train_loss": -5.8444013595581055, "global_step": 60553, "epoch": 1441} {"train_loss": -5.696256637573242, "global_step": 60554, "epoch": 1441} {"train_loss": -5.8305768966674805, "global_step": 60555, "epoch": 1441} {"train_loss": -5.690765380859375, "global_step": 60556, "epoch": 1441} {"train_loss": -5.89219856262207, "global_step": 60557, "epoch": 1441} {"train_loss": -5.909185409545898, "global_step": 60558, "epoch": 1441} {"train_loss": -5.835356712341309, "global_step": 60559, "epoch": 1441} {"train_loss": -5.866293907165527, "global_step": 60560, "epoch": 1441} {"train_loss": -5.959588527679443, "global_step": 60561, "epoch": 1441} {"train_loss": -5.799783706665039, "global_step": 60562, "epoch": 1441} {"train_loss": -5.850575889859881, "global_step": 60563, "epoch": 1441, "val_loss": 67105.359375} {"train_loss": -5.980110168457031, "global_step": 60564, "epoch": 1442} {"train_loss": -5.906389236450195, "global_step": 60565, "epoch": 1442} {"train_loss": -5.866168022155762, "global_step": 60566, "epoch": 1442} {"train_loss": -5.8507537841796875, "global_step": 60567, "epoch": 1442} {"train_loss": -5.816317558288574, "global_step": 60568, "epoch": 1442} {"train_loss": -5.928594589233398, "global_step": 60569, "epoch": 1442} {"train_loss": -5.707115173339844, "global_step": 60570, "epoch": 1442} {"train_loss": -5.964677810668945, "global_step": 60571, "epoch": 1442} {"train_loss": -5.941493034362793, "global_step": 60572, "epoch": 1442} {"train_loss": -5.804607391357422, "global_step": 60573, "epoch": 1442} {"train_loss": -5.913347244262695, "global_step": 60574, "epoch": 1442} {"train_loss": -5.893726348876953, "global_step": 60575, "epoch": 1442} {"train_loss": -5.801647663116455, "global_step": 60576, "epoch": 1442} {"train_loss": -5.977794647216797, "global_step": 60577, "epoch": 1442} {"train_loss": -5.988823890686035, "global_step": 60578, "epoch": 1442} {"train_loss": -5.897759914398193, "global_step": 60579, "epoch": 1442} {"train_loss": -5.924568176269531, "global_step": 60580, "epoch": 1442} {"train_loss": -6.088308811187744, "global_step": 60581, "epoch": 1442} {"train_loss": -6.00657844543457, "global_step": 60582, "epoch": 1442} {"train_loss": -5.891790390014648, "global_step": 60583, "epoch": 1442} {"train_loss": -5.820001125335693, "global_step": 60584, "epoch": 1442} {"train_loss": -5.815509796142578, "global_step": 60585, "epoch": 1442} {"train_loss": -5.961543560028076, "global_step": 60586, "epoch": 1442} {"train_loss": -5.841619968414307, "global_step": 60587, "epoch": 1442} {"train_loss": -5.866258144378662, "global_step": 60588, "epoch": 1442} {"train_loss": -5.951592445373535, "global_step": 60589, "epoch": 1442} {"train_loss": -5.905046463012695, "global_step": 60590, "epoch": 1442} {"train_loss": -5.8336920738220215, "global_step": 60591, "epoch": 1442} {"train_loss": -5.949496269226074, "global_step": 60592, "epoch": 1442} {"train_loss": -5.804941177368164, "global_step": 60593, "epoch": 1442} {"train_loss": -5.8124871253967285, "global_step": 60594, "epoch": 1442} {"train_loss": -5.891570091247559, "global_step": 60595, "epoch": 1442} {"train_loss": -5.927709102630615, "global_step": 60596, "epoch": 1442} {"train_loss": -5.891077995300293, "global_step": 60597, "epoch": 1442} {"train_loss": -6.05933141708374, "global_step": 60598, "epoch": 1442} {"train_loss": -5.925189971923828, "global_step": 60599, "epoch": 1442} {"train_loss": -5.823278427124023, "global_step": 60600, "epoch": 1442} {"train_loss": -5.838735580444336, "global_step": 60601, "epoch": 1442} {"train_loss": -5.907582759857178, "global_step": 60602, "epoch": 1442} {"train_loss": -5.888982772827148, "global_step": 60603, "epoch": 1442} {"train_loss": -5.8469438552856445, "global_step": 60604, "epoch": 1442} {"train_loss": -5.897828181584676, "global_step": 60605, "epoch": 1442, "val_loss": 66902.9453125} {"train_loss": -5.792991638183594, "global_step": 60606, "epoch": 1443} {"train_loss": -5.951498985290527, "global_step": 60607, "epoch": 1443} {"train_loss": -5.914412975311279, "global_step": 60608, "epoch": 1443} {"train_loss": -5.817474365234375, "global_step": 60609, "epoch": 1443} {"train_loss": -5.8428192138671875, "global_step": 60610, "epoch": 1443} {"train_loss": -5.9485368728637695, "global_step": 60611, "epoch": 1443} {"train_loss": -5.840104103088379, "global_step": 60612, "epoch": 1443} {"train_loss": -5.887113571166992, "global_step": 60613, "epoch": 1443} {"train_loss": -5.841710090637207, "global_step": 60614, "epoch": 1443} {"train_loss": -5.90219259262085, "global_step": 60615, "epoch": 1443} {"train_loss": -5.860558032989502, "global_step": 60616, "epoch": 1443} {"train_loss": -5.963365077972412, "global_step": 60617, "epoch": 1443} {"train_loss": -5.856444358825684, "global_step": 60618, "epoch": 1443} {"train_loss": -5.938364028930664, "global_step": 60619, "epoch": 1443} {"train_loss": -6.01878023147583, "global_step": 60620, "epoch": 1443} {"train_loss": -5.864023685455322, "global_step": 60621, "epoch": 1443} {"train_loss": -5.873264789581299, "global_step": 60622, "epoch": 1443} {"train_loss": -5.847320556640625, "global_step": 60623, "epoch": 1443} {"train_loss": -5.90310001373291, "global_step": 60624, "epoch": 1443} {"train_loss": -5.9049296379089355, "global_step": 60625, "epoch": 1443} {"train_loss": -5.918612480163574, "global_step": 60626, "epoch": 1443} {"train_loss": -5.896470069885254, "global_step": 60627, "epoch": 1443} {"train_loss": -5.921663284301758, "global_step": 60628, "epoch": 1443} {"train_loss": -5.9482645988464355, "global_step": 60629, "epoch": 1443} {"train_loss": -6.063371658325195, "global_step": 60630, "epoch": 1443} {"train_loss": -5.919530868530273, "global_step": 60631, "epoch": 1443} {"train_loss": -6.000498294830322, "global_step": 60632, "epoch": 1443} {"train_loss": -5.899813652038574, "global_step": 60633, "epoch": 1443} {"train_loss": -5.872344017028809, "global_step": 60634, "epoch": 1443} {"train_loss": -5.91628360748291, "global_step": 60635, "epoch": 1443} {"train_loss": -5.832211017608643, "global_step": 60636, "epoch": 1443} {"train_loss": -5.882491111755371, "global_step": 60637, "epoch": 1443} {"train_loss": -5.8326568603515625, "global_step": 60638, "epoch": 1443} {"train_loss": -5.841518878936768, "global_step": 60639, "epoch": 1443} {"train_loss": -5.916854381561279, "global_step": 60640, "epoch": 1443} {"train_loss": -5.830949306488037, "global_step": 60641, "epoch": 1443} {"train_loss": -5.816946029663086, "global_step": 60642, "epoch": 1443} {"train_loss": -5.848517417907715, "global_step": 60643, "epoch": 1443} {"train_loss": -5.917600631713867, "global_step": 60644, "epoch": 1443} {"train_loss": -5.863680839538574, "global_step": 60645, "epoch": 1443} {"train_loss": -5.913336753845215, "global_step": 60646, "epoch": 1443} {"train_loss": -5.8937570708138605, "global_step": 60647, "epoch": 1443, "val_loss": 66701.6328125} {"train_loss": -5.927120685577393, "global_step": 60648, "epoch": 1444} {"train_loss": -5.949368953704834, "global_step": 60649, "epoch": 1444} {"train_loss": -5.808698654174805, "global_step": 60650, "epoch": 1444} {"train_loss": -5.895834922790527, "global_step": 60651, "epoch": 1444} {"train_loss": -5.836845874786377, "global_step": 60652, "epoch": 1444} {"train_loss": -5.875055313110352, "global_step": 60653, "epoch": 1444} {"train_loss": -5.853250503540039, "global_step": 60654, "epoch": 1444} {"train_loss": -5.917841911315918, "global_step": 60655, "epoch": 1444} {"train_loss": -5.779343605041504, "global_step": 60656, "epoch": 1444} {"train_loss": -5.803709983825684, "global_step": 60657, "epoch": 1444} {"train_loss": -5.8421244621276855, "global_step": 60658, "epoch": 1444} {"train_loss": -5.935384273529053, "global_step": 60659, "epoch": 1444} {"train_loss": -5.874539852142334, "global_step": 60660, "epoch": 1444} {"train_loss": -5.9327497482299805, "global_step": 60661, "epoch": 1444} {"train_loss": -5.850217342376709, "global_step": 60662, "epoch": 1444} {"train_loss": -5.886756896972656, "global_step": 60663, "epoch": 1444} {"train_loss": -5.920640468597412, "global_step": 60664, "epoch": 1444} {"train_loss": -5.767749786376953, "global_step": 60665, "epoch": 1444} {"train_loss": -5.884063720703125, "global_step": 60666, "epoch": 1444} {"train_loss": -5.84013557434082, "global_step": 60667, "epoch": 1444} {"train_loss": -5.958222389221191, "global_step": 60668, "epoch": 1444} {"train_loss": -5.95919132232666, "global_step": 60669, "epoch": 1444} {"train_loss": -5.930077075958252, "global_step": 60670, "epoch": 1444} {"train_loss": -6.020324230194092, "global_step": 60671, "epoch": 1444} {"train_loss": -5.918763637542725, "global_step": 60672, "epoch": 1444} {"train_loss": -5.929875373840332, "global_step": 60673, "epoch": 1444} {"train_loss": -5.818115234375, "global_step": 60674, "epoch": 1444} {"train_loss": -5.781181335449219, "global_step": 60675, "epoch": 1444} {"train_loss": -5.891922950744629, "global_step": 60676, "epoch": 1444} {"train_loss": -5.760364532470703, "global_step": 60677, "epoch": 1444} {"train_loss": -5.812566757202148, "global_step": 60678, "epoch": 1444} {"train_loss": -5.775150299072266, "global_step": 60679, "epoch": 1444} {"train_loss": -5.858895778656006, "global_step": 60680, "epoch": 1444} {"train_loss": -5.828892707824707, "global_step": 60681, "epoch": 1444} {"train_loss": -5.816248893737793, "global_step": 60682, "epoch": 1444} {"train_loss": -5.821051597595215, "global_step": 60683, "epoch": 1444} {"train_loss": -5.8971099853515625, "global_step": 60684, "epoch": 1444} {"train_loss": -5.791257858276367, "global_step": 60685, "epoch": 1444} {"train_loss": -6.015012741088867, "global_step": 60686, "epoch": 1444} {"train_loss": -5.956345558166504, "global_step": 60687, "epoch": 1444} {"train_loss": -5.862491130828857, "global_step": 60688, "epoch": 1444} {"train_loss": -5.874256236212594, "global_step": 60689, "epoch": 1444, "val_loss": 66807.453125} {"train_loss": -5.867025375366211, "global_step": 60690, "epoch": 1445} {"train_loss": -5.8913469314575195, "global_step": 60691, "epoch": 1445} {"train_loss": -5.915128231048584, "global_step": 60692, "epoch": 1445} {"train_loss": -5.987158298492432, "global_step": 60693, "epoch": 1445} {"train_loss": -5.859753608703613, "global_step": 60694, "epoch": 1445} {"train_loss": -5.770717620849609, "global_step": 60695, "epoch": 1445} {"train_loss": -6.016982555389404, "global_step": 60696, "epoch": 1445} {"train_loss": -5.914769172668457, "global_step": 60697, "epoch": 1445} {"train_loss": -5.832120895385742, "global_step": 60698, "epoch": 1445} {"train_loss": -5.959885597229004, "global_step": 60699, "epoch": 1445} {"train_loss": -5.872056007385254, "global_step": 60700, "epoch": 1445} {"train_loss": -5.863747596740723, "global_step": 60701, "epoch": 1445} {"train_loss": -5.96197509765625, "global_step": 60702, "epoch": 1445} {"train_loss": -6.007769584655762, "global_step": 60703, "epoch": 1445} {"train_loss": -6.02174186706543, "global_step": 60704, "epoch": 1445} {"train_loss": -5.897993087768555, "global_step": 60705, "epoch": 1445} {"train_loss": -6.061387062072754, "global_step": 60706, "epoch": 1445} {"train_loss": -5.927130699157715, "global_step": 60707, "epoch": 1445} {"train_loss": -5.879329204559326, "global_step": 60708, "epoch": 1445} {"train_loss": -5.985405445098877, "global_step": 60709, "epoch": 1445} {"train_loss": -5.876255035400391, "global_step": 60710, "epoch": 1445} {"train_loss": -5.903096675872803, "global_step": 60711, "epoch": 1445} {"train_loss": -5.816209316253662, "global_step": 60712, "epoch": 1445} {"train_loss": -5.903209686279297, "global_step": 60713, "epoch": 1445} {"train_loss": -5.748686790466309, "global_step": 60714, "epoch": 1445} {"train_loss": -5.824695587158203, "global_step": 60715, "epoch": 1445} {"train_loss": -5.713808536529541, "global_step": 60716, "epoch": 1445} {"train_loss": -5.766965866088867, "global_step": 60717, "epoch": 1445} {"train_loss": -5.860018730163574, "global_step": 60718, "epoch": 1445} {"train_loss": -5.656528472900391, "global_step": 60719, "epoch": 1445} {"train_loss": -5.919606685638428, "global_step": 60720, "epoch": 1445} {"train_loss": -5.872163772583008, "global_step": 60721, "epoch": 1445} {"train_loss": -5.809490203857422, "global_step": 60722, "epoch": 1445} {"train_loss": -5.809745788574219, "global_step": 60723, "epoch": 1445} {"train_loss": -5.781863212585449, "global_step": 60724, "epoch": 1445} {"train_loss": -5.959012031555176, "global_step": 60725, "epoch": 1445} {"train_loss": -5.882384777069092, "global_step": 60726, "epoch": 1445} {"train_loss": -5.9422149658203125, "global_step": 60727, "epoch": 1445} {"train_loss": -5.924012184143066, "global_step": 60728, "epoch": 1445} {"train_loss": -5.887365341186523, "global_step": 60729, "epoch": 1445} {"train_loss": -5.924802780151367, "global_step": 60730, "epoch": 1445} {"train_loss": -5.883251939501081, "global_step": 60731, "epoch": 1445, "val_loss": 66792.71875} {"train_loss": -6.050989627838135, "global_step": 60732, "epoch": 1446} {"train_loss": -5.850472450256348, "global_step": 60733, "epoch": 1446} {"train_loss": -6.079562187194824, "global_step": 60734, "epoch": 1446} {"train_loss": -5.906377792358398, "global_step": 60735, "epoch": 1446} {"train_loss": -5.958487033843994, "global_step": 60736, "epoch": 1446} {"train_loss": -5.894046783447266, "global_step": 60737, "epoch": 1446} {"train_loss": -5.870351314544678, "global_step": 60738, "epoch": 1446} {"train_loss": -5.777536392211914, "global_step": 60739, "epoch": 1446} {"train_loss": -5.916402816772461, "global_step": 60740, "epoch": 1446} {"train_loss": -5.950728416442871, "global_step": 60741, "epoch": 1446} {"train_loss": -6.009650230407715, "global_step": 60742, "epoch": 1446} {"train_loss": -5.859928131103516, "global_step": 60743, "epoch": 1446} {"train_loss": -5.914679527282715, "global_step": 60744, "epoch": 1446} {"train_loss": -5.865790367126465, "global_step": 60745, "epoch": 1446} {"train_loss": -5.877773284912109, "global_step": 60746, "epoch": 1446} {"train_loss": -5.807384490966797, "global_step": 60747, "epoch": 1446} {"train_loss": -5.7230424880981445, "global_step": 60748, "epoch": 1446} {"train_loss": -5.91131591796875, "global_step": 60749, "epoch": 1446} {"train_loss": -6.0322699546813965, "global_step": 60750, "epoch": 1446} {"train_loss": -5.838303565979004, "global_step": 60751, "epoch": 1446} {"train_loss": -5.929296493530273, "global_step": 60752, "epoch": 1446} {"train_loss": -5.729440212249756, "global_step": 60753, "epoch": 1446} {"train_loss": -5.900966644287109, "global_step": 60754, "epoch": 1446} {"train_loss": -5.730771064758301, "global_step": 60755, "epoch": 1446} {"train_loss": -5.9596662521362305, "global_step": 60756, "epoch": 1446} {"train_loss": -5.874206066131592, "global_step": 60757, "epoch": 1446} {"train_loss": -5.93064546585083, "global_step": 60758, "epoch": 1446} {"train_loss": -5.856198787689209, "global_step": 60759, "epoch": 1446} {"train_loss": -5.807649612426758, "global_step": 60760, "epoch": 1446} {"train_loss": -5.855755805969238, "global_step": 60761, "epoch": 1446} {"train_loss": -5.924201011657715, "global_step": 60762, "epoch": 1446} {"train_loss": -5.822998046875, "global_step": 60763, "epoch": 1446} {"train_loss": -5.935317039489746, "global_step": 60764, "epoch": 1446} {"train_loss": -5.977817535400391, "global_step": 60765, "epoch": 1446} {"train_loss": -5.848585605621338, "global_step": 60766, "epoch": 1446} {"train_loss": -5.813176155090332, "global_step": 60767, "epoch": 1446} {"train_loss": -5.773822784423828, "global_step": 60768, "epoch": 1446} {"train_loss": -5.914250373840332, "global_step": 60769, "epoch": 1446} {"train_loss": -5.768545150756836, "global_step": 60770, "epoch": 1446} {"train_loss": -5.777352333068848, "global_step": 60771, "epoch": 1446} {"train_loss": -5.784572124481201, "global_step": 60772, "epoch": 1446} {"train_loss": -5.875959214710054, "global_step": 60773, "epoch": 1446, "val_loss": 67057.28125} {"train_loss": -5.753846168518066, "global_step": 60774, "epoch": 1447} {"train_loss": -5.838319301605225, "global_step": 60775, "epoch": 1447} {"train_loss": -5.757456302642822, "global_step": 60776, "epoch": 1447} {"train_loss": -5.7702436447143555, "global_step": 60777, "epoch": 1447} {"train_loss": -5.917357444763184, "global_step": 60778, "epoch": 1447} {"train_loss": -5.876791000366211, "global_step": 60779, "epoch": 1447} {"train_loss": -5.941141128540039, "global_step": 60780, "epoch": 1447} {"train_loss": -5.85566520690918, "global_step": 60781, "epoch": 1447} {"train_loss": -5.87177038192749, "global_step": 60782, "epoch": 1447} {"train_loss": -5.953263282775879, "global_step": 60783, "epoch": 1447} {"train_loss": -5.981348037719727, "global_step": 60784, "epoch": 1447} {"train_loss": -5.75856876373291, "global_step": 60785, "epoch": 1447} {"train_loss": -5.946164608001709, "global_step": 60786, "epoch": 1447} {"train_loss": -5.859673500061035, "global_step": 60787, "epoch": 1447} {"train_loss": -5.879120826721191, "global_step": 60788, "epoch": 1447} {"train_loss": -5.840771675109863, "global_step": 60789, "epoch": 1447} {"train_loss": -5.827635288238525, "global_step": 60790, "epoch": 1447} {"train_loss": -5.91456413269043, "global_step": 60791, "epoch": 1447} {"train_loss": -5.793648719787598, "global_step": 60792, "epoch": 1447} {"train_loss": -5.868258953094482, "global_step": 60793, "epoch": 1447} {"train_loss": -5.9444804191589355, "global_step": 60794, "epoch": 1447} {"train_loss": -5.881523132324219, "global_step": 60795, "epoch": 1447} {"train_loss": -5.888072967529297, "global_step": 60796, "epoch": 1447} {"train_loss": -5.915162086486816, "global_step": 60797, "epoch": 1447} {"train_loss": -5.995487213134766, "global_step": 60798, "epoch": 1447} {"train_loss": -5.8803863525390625, "global_step": 60799, "epoch": 1447} {"train_loss": -5.7178521156311035, "global_step": 60800, "epoch": 1447} {"train_loss": -5.818752288818359, "global_step": 60801, "epoch": 1447} {"train_loss": -5.743984222412109, "global_step": 60802, "epoch": 1447} {"train_loss": -5.968050003051758, "global_step": 60803, "epoch": 1447} {"train_loss": -5.798251628875732, "global_step": 60804, "epoch": 1447} {"train_loss": -5.7878098487854, "global_step": 60805, "epoch": 1447} {"train_loss": -5.791595458984375, "global_step": 60806, "epoch": 1447} {"train_loss": -5.816751480102539, "global_step": 60807, "epoch": 1447} {"train_loss": -5.790270805358887, "global_step": 60808, "epoch": 1447} {"train_loss": -5.829538345336914, "global_step": 60809, "epoch": 1447} {"train_loss": -5.821340084075928, "global_step": 60810, "epoch": 1447} {"train_loss": -5.840878963470459, "global_step": 60811, "epoch": 1447} {"train_loss": -5.919726371765137, "global_step": 60812, "epoch": 1447} {"train_loss": -5.85362434387207, "global_step": 60813, "epoch": 1447} {"train_loss": -5.8224029541015625, "global_step": 60814, "epoch": 1447} {"train_loss": -5.855953602563767, "global_step": 60815, "epoch": 1447, "val_loss": 66728.53125} {"train_loss": -5.806024551391602, "global_step": 60816, "epoch": 1448} {"train_loss": -5.76521110534668, "global_step": 60817, "epoch": 1448} {"train_loss": -5.909996032714844, "global_step": 60818, "epoch": 1448} {"train_loss": -5.980853080749512, "global_step": 60819, "epoch": 1448} {"train_loss": -5.927135944366455, "global_step": 60820, "epoch": 1448} {"train_loss": -5.878015041351318, "global_step": 60821, "epoch": 1448} {"train_loss": -5.906293869018555, "global_step": 60822, "epoch": 1448} {"train_loss": -5.894163608551025, "global_step": 60823, "epoch": 1448} {"train_loss": -5.793262481689453, "global_step": 60824, "epoch": 1448} {"train_loss": -5.784431457519531, "global_step": 60825, "epoch": 1448} {"train_loss": -6.056928634643555, "global_step": 60826, "epoch": 1448} {"train_loss": -5.921143531799316, "global_step": 60827, "epoch": 1448} {"train_loss": -6.010725975036621, "global_step": 60828, "epoch": 1448} {"train_loss": -5.898465156555176, "global_step": 60829, "epoch": 1448} {"train_loss": -5.828307151794434, "global_step": 60830, "epoch": 1448} {"train_loss": -5.823952674865723, "global_step": 60831, "epoch": 1448} {"train_loss": -5.803479194641113, "global_step": 60832, "epoch": 1448} {"train_loss": -5.800911903381348, "global_step": 60833, "epoch": 1448} {"train_loss": -5.8435139656066895, "global_step": 60834, "epoch": 1448} {"train_loss": -6.015289783477783, "global_step": 60835, "epoch": 1448} {"train_loss": -5.966649055480957, "global_step": 60836, "epoch": 1448} {"train_loss": -5.964303970336914, "global_step": 60837, "epoch": 1448} {"train_loss": -5.896193504333496, "global_step": 60838, "epoch": 1448} {"train_loss": -5.940854072570801, "global_step": 60839, "epoch": 1448} {"train_loss": -5.922219276428223, "global_step": 60840, "epoch": 1448} {"train_loss": -5.846459865570068, "global_step": 60841, "epoch": 1448} {"train_loss": -6.023133277893066, "global_step": 60842, "epoch": 1448} {"train_loss": -6.015851020812988, "global_step": 60843, "epoch": 1448} {"train_loss": -5.875763893127441, "global_step": 60844, "epoch": 1448} {"train_loss": -5.894099235534668, "global_step": 60845, "epoch": 1448} {"train_loss": -5.968138694763184, "global_step": 60846, "epoch": 1448} {"train_loss": -5.867917537689209, "global_step": 60847, "epoch": 1448} {"train_loss": -5.937541484832764, "global_step": 60848, "epoch": 1448} {"train_loss": -5.917235374450684, "global_step": 60849, "epoch": 1448} {"train_loss": -5.894125938415527, "global_step": 60850, "epoch": 1448} {"train_loss": -5.963293075561523, "global_step": 60851, "epoch": 1448} {"train_loss": -5.820284843444824, "global_step": 60852, "epoch": 1448} {"train_loss": -5.974843978881836, "global_step": 60853, "epoch": 1448} {"train_loss": -5.9796833992004395, "global_step": 60854, "epoch": 1448} {"train_loss": -5.90460205078125, "global_step": 60855, "epoch": 1448} {"train_loss": -5.894344806671143, "global_step": 60856, "epoch": 1448} {"train_loss": -5.902686153139387, "global_step": 60857, "epoch": 1448, "val_loss": 66705.8046875} {"train_loss": -5.857088088989258, "global_step": 60858, "epoch": 1449} {"train_loss": -5.872903347015381, "global_step": 60859, "epoch": 1449} {"train_loss": -5.990564346313477, "global_step": 60860, "epoch": 1449} {"train_loss": -5.920536994934082, "global_step": 60861, "epoch": 1449} {"train_loss": -6.006746292114258, "global_step": 60862, "epoch": 1449} {"train_loss": -5.933661460876465, "global_step": 60863, "epoch": 1449} {"train_loss": -5.92354679107666, "global_step": 60864, "epoch": 1449} {"train_loss": -5.94807243347168, "global_step": 60865, "epoch": 1449} {"train_loss": -5.923098087310791, "global_step": 60866, "epoch": 1449} {"train_loss": -5.924561500549316, "global_step": 60867, "epoch": 1449} {"train_loss": -5.931491851806641, "global_step": 60868, "epoch": 1449} {"train_loss": -6.01319694519043, "global_step": 60869, "epoch": 1449} {"train_loss": -5.934805393218994, "global_step": 60870, "epoch": 1449} {"train_loss": -5.9254865646362305, "global_step": 60871, "epoch": 1449} {"train_loss": -5.934854030609131, "global_step": 60872, "epoch": 1449} {"train_loss": -5.952411651611328, "global_step": 60873, "epoch": 1449} {"train_loss": -5.888222694396973, "global_step": 60874, "epoch": 1449} {"train_loss": -5.929323196411133, "global_step": 60875, "epoch": 1449} {"train_loss": -6.002382278442383, "global_step": 60876, "epoch": 1449} {"train_loss": -5.77573823928833, "global_step": 60877, "epoch": 1449} {"train_loss": -5.831058025360107, "global_step": 60878, "epoch": 1449} {"train_loss": -5.861474990844727, "global_step": 60879, "epoch": 1449} {"train_loss": -5.803239822387695, "global_step": 60880, "epoch": 1449} {"train_loss": -5.761484146118164, "global_step": 60881, "epoch": 1449} {"train_loss": -5.888604164123535, "global_step": 60882, "epoch": 1449} {"train_loss": -5.911511421203613, "global_step": 60883, "epoch": 1449} {"train_loss": -5.938323974609375, "global_step": 60884, "epoch": 1449} {"train_loss": -5.943868637084961, "global_step": 60885, "epoch": 1449} {"train_loss": -5.930003643035889, "global_step": 60886, "epoch": 1449} {"train_loss": -5.871929168701172, "global_step": 60887, "epoch": 1449} {"train_loss": -5.827129364013672, "global_step": 60888, "epoch": 1449} {"train_loss": -5.782524108886719, "global_step": 60889, "epoch": 1449} {"train_loss": -5.833495140075684, "global_step": 60890, "epoch": 1449} {"train_loss": -5.902939796447754, "global_step": 60891, "epoch": 1449} {"train_loss": -5.91645622253418, "global_step": 60892, "epoch": 1449} {"train_loss": -5.8963623046875, "global_step": 60893, "epoch": 1449} {"train_loss": -6.014289379119873, "global_step": 60894, "epoch": 1449} {"train_loss": -5.8013811111450195, "global_step": 60895, "epoch": 1449} {"train_loss": -5.863055229187012, "global_step": 60896, "epoch": 1449} {"train_loss": -5.987679958343506, "global_step": 60897, "epoch": 1449} {"train_loss": -5.790085792541504, "global_step": 60898, "epoch": 1449} {"train_loss": -5.900495154517038, "global_step": 60899, "epoch": 1449, "val_loss": 67299.90625} {"train_loss": -5.83302116394043, "global_step": 60900, "epoch": 1450} {"train_loss": -5.877297401428223, "global_step": 60901, "epoch": 1450} {"train_loss": -5.854667663574219, "global_step": 60902, "epoch": 1450} {"train_loss": -5.83497428894043, "global_step": 60903, "epoch": 1450} {"train_loss": -5.9073872566223145, "global_step": 60904, "epoch": 1450} {"train_loss": -5.875433921813965, "global_step": 60905, "epoch": 1450} {"train_loss": -5.818833351135254, "global_step": 60906, "epoch": 1450} {"train_loss": -5.8863935470581055, "global_step": 60907, "epoch": 1450} {"train_loss": -5.921534538269043, "global_step": 60908, "epoch": 1450} {"train_loss": -5.852320671081543, "global_step": 60909, "epoch": 1450} {"train_loss": -5.90885591506958, "global_step": 60910, "epoch": 1450} {"train_loss": -5.928532123565674, "global_step": 60911, "epoch": 1450} {"train_loss": -6.045856475830078, "global_step": 60912, "epoch": 1450} {"train_loss": -5.81917667388916, "global_step": 60913, "epoch": 1450} {"train_loss": -5.799095153808594, "global_step": 60914, "epoch": 1450} {"train_loss": -6.005212783813477, "global_step": 60915, "epoch": 1450} {"train_loss": -5.905910491943359, "global_step": 60916, "epoch": 1450} {"train_loss": -6.063006401062012, "global_step": 60917, "epoch": 1450} {"train_loss": -5.9582319259643555, "global_step": 60918, "epoch": 1450} {"train_loss": -5.859129428863525, "global_step": 60919, "epoch": 1450} {"train_loss": -5.975567817687988, "global_step": 60920, "epoch": 1450} {"train_loss": -5.934418201446533, "global_step": 60921, "epoch": 1450} {"train_loss": -5.8971405029296875, "global_step": 60922, "epoch": 1450} {"train_loss": -5.848323822021484, "global_step": 60923, "epoch": 1450} {"train_loss": -5.868642807006836, "global_step": 60924, "epoch": 1450} {"train_loss": -5.939664840698242, "global_step": 60925, "epoch": 1450} {"train_loss": -5.924618244171143, "global_step": 60926, "epoch": 1450} {"train_loss": -5.887984752655029, "global_step": 60927, "epoch": 1450} {"train_loss": -6.004452705383301, "global_step": 60928, "epoch": 1450} {"train_loss": -5.783668518066406, "global_step": 60929, "epoch": 1450} {"train_loss": -5.866540431976318, "global_step": 60930, "epoch": 1450} {"train_loss": -5.890527725219727, "global_step": 60931, "epoch": 1450} {"train_loss": -5.819707870483398, "global_step": 60932, "epoch": 1450} {"train_loss": -5.911126136779785, "global_step": 60933, "epoch": 1450} {"train_loss": -5.914532661437988, "global_step": 60934, "epoch": 1450} {"train_loss": -5.85180139541626, "global_step": 60935, "epoch": 1450} {"train_loss": -5.840457439422607, "global_step": 60936, "epoch": 1450} {"train_loss": -5.9861040115356445, "global_step": 60937, "epoch": 1450} {"train_loss": -5.845864772796631, "global_step": 60938, "epoch": 1450} {"train_loss": -5.872869491577148, "global_step": 60939, "epoch": 1450} {"train_loss": -5.98982048034668, "global_step": 60940, "epoch": 1450} {"train_loss": -5.89884725071135, "global_step": 60941, "epoch": 1450, "train/sim_max_reward_0": 0.24530832310938, "train/sim_max_reward_1": 0.8349653148827656, "train/sim_max_reward_2": 0.5726258851995594, "train/sim_max_reward_3": 0.15957145610721363, "train/sim_max_reward_4": 0.8788198741019625, "train/sim_max_reward_5": 0.9051947813008695, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.8988908840583265, "test/sim_max_reward_4400002": 0.5234534364967731, "test/sim_max_reward_4400003": 0.8130371321910395, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.7804625790622756, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3720711857369714, "test/sim_max_reward_4400009": 0.582113918612691, "test/sim_max_reward_4400010": 0.546621080276534, "test/sim_max_reward_4400011": 0.37456565688695614, "test/sim_max_reward_4400012": 0.7894797180916209, "test/sim_max_reward_4400013": 0.8596007137702734, "test/sim_max_reward_4400014": 0.3727890438867391, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.08784285978491531, "test/sim_max_reward_4400018": 0.19778047362749293, "test/sim_max_reward_4400019": 0.1027644708954781, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5766442836686932, "test/sim_max_reward_4400022": 0.2640474373651409, "test/sim_max_reward_4400023": 0.17508914378214915, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.920864682091766, "test/sim_max_reward_4400027": 0.00044026654033164984, "test/sim_max_reward_4400028": 0.40689875511418144, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.8521045638568313, "test/sim_max_reward_4400031": 0.9398982897762176, "test/sim_max_reward_4400032": 0.4487839312533089, "test/sim_max_reward_4400033": 0.6079443914049504, "test/sim_max_reward_4400034": 0.8707061660464028, "test/sim_max_reward_4400035": 0.4736662446960933, "test/sim_max_reward_4400036": 0.3142152596740683, "test/sim_max_reward_4400037": 0.8402326869789059, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.9285326591578841, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9323533877604675, "test/sim_max_reward_4400042": 0.021499455237403153, "test/sim_max_reward_4400043": 0.9816972572244352, "test/sim_max_reward_4400044": 0.8092538992105898, "test/sim_max_reward_4400045": 0.7920020012272835, "test/sim_max_reward_4400046": 0.8598775182680752, "test/sim_max_reward_4400047": 0.9101923304492463, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.03023315997352722, "train/mean_score": 0.5994142724502918, "test/mean_score": 0.45404911800394265, "val_loss": 66692.5078125} {"train_loss": -6.010736465454102, "global_step": 60942, "epoch": 1451} {"train_loss": -5.935762882232666, "global_step": 60943, "epoch": 1451} {"train_loss": -5.899201393127441, "global_step": 60944, "epoch": 1451} {"train_loss": -5.858838081359863, "global_step": 60945, "epoch": 1451} {"train_loss": -5.949494361877441, "global_step": 60946, "epoch": 1451} {"train_loss": -5.8907060623168945, "global_step": 60947, "epoch": 1451} {"train_loss": -5.912424564361572, "global_step": 60948, "epoch": 1451} {"train_loss": -5.93826961517334, "global_step": 60949, "epoch": 1451} {"train_loss": -5.910656929016113, "global_step": 60950, "epoch": 1451} {"train_loss": -5.784510135650635, "global_step": 60951, "epoch": 1451} {"train_loss": -5.73983097076416, "global_step": 60952, "epoch": 1451} {"train_loss": -5.8515729904174805, "global_step": 60953, "epoch": 1451} {"train_loss": -5.69616174697876, "global_step": 60954, "epoch": 1451} {"train_loss": -6.000739097595215, "global_step": 60955, "epoch": 1451} {"train_loss": -5.784153461456299, "global_step": 60956, "epoch": 1451} {"train_loss": -5.91857385635376, "global_step": 60957, "epoch": 1451} {"train_loss": -5.90760612487793, "global_step": 60958, "epoch": 1451} {"train_loss": -5.902360916137695, "global_step": 60959, "epoch": 1451} {"train_loss": -6.001776218414307, "global_step": 60960, "epoch": 1451} {"train_loss": -5.889334678649902, "global_step": 60961, "epoch": 1451} {"train_loss": -5.998256206512451, "global_step": 60962, "epoch": 1451} {"train_loss": -5.988952159881592, "global_step": 60963, "epoch": 1451} {"train_loss": -5.909753799438477, "global_step": 60964, "epoch": 1451} {"train_loss": -5.93345832824707, "global_step": 60965, "epoch": 1451} {"train_loss": -5.890755653381348, "global_step": 60966, "epoch": 1451} {"train_loss": -5.9350385665893555, "global_step": 60967, "epoch": 1451} {"train_loss": -5.835405349731445, "global_step": 60968, "epoch": 1451} {"train_loss": -5.781253337860107, "global_step": 60969, "epoch": 1451} {"train_loss": -5.865612030029297, "global_step": 60970, "epoch": 1451} {"train_loss": -5.9252119064331055, "global_step": 60971, "epoch": 1451} {"train_loss": -5.8435773849487305, "global_step": 60972, "epoch": 1451} {"train_loss": -5.962302207946777, "global_step": 60973, "epoch": 1451} {"train_loss": -5.743075370788574, "global_step": 60974, "epoch": 1451} {"train_loss": -5.864849090576172, "global_step": 60975, "epoch": 1451} {"train_loss": -5.875762939453125, "global_step": 60976, "epoch": 1451} {"train_loss": -5.826286315917969, "global_step": 60977, "epoch": 1451} {"train_loss": -5.999908447265625, "global_step": 60978, "epoch": 1451} {"train_loss": -5.9087066650390625, "global_step": 60979, "epoch": 1451} {"train_loss": -5.828896522521973, "global_step": 60980, "epoch": 1451} {"train_loss": -5.823952674865723, "global_step": 60981, "epoch": 1451} {"train_loss": -5.835078716278076, "global_step": 60982, "epoch": 1451} {"train_loss": -5.885261978421893, "global_step": 60983, "epoch": 1451, "val_loss": 66665.4921875} {"train_loss": -5.908904075622559, "global_step": 60984, "epoch": 1452} {"train_loss": -5.8814616203308105, "global_step": 60985, "epoch": 1452} {"train_loss": -5.912154197692871, "global_step": 60986, "epoch": 1452} {"train_loss": -5.871491432189941, "global_step": 60987, "epoch": 1452} {"train_loss": -6.009927272796631, "global_step": 60988, "epoch": 1452} {"train_loss": -5.878003120422363, "global_step": 60989, "epoch": 1452} {"train_loss": -5.875545501708984, "global_step": 60990, "epoch": 1452} {"train_loss": -5.840006351470947, "global_step": 60991, "epoch": 1452} {"train_loss": -5.7682647705078125, "global_step": 60992, "epoch": 1452} {"train_loss": -5.917365550994873, "global_step": 60993, "epoch": 1452} {"train_loss": -5.781245708465576, "global_step": 60994, "epoch": 1452} {"train_loss": -5.886410713195801, "global_step": 60995, "epoch": 1452} {"train_loss": -5.88970422744751, "global_step": 60996, "epoch": 1452} {"train_loss": -5.769169807434082, "global_step": 60997, "epoch": 1452} {"train_loss": -5.937567710876465, "global_step": 60998, "epoch": 1452} {"train_loss": -5.873612403869629, "global_step": 60999, "epoch": 1452} {"train_loss": -5.825850486755371, "global_step": 61000, "epoch": 1452} {"train_loss": -5.905213356018066, "global_step": 61001, "epoch": 1452} {"train_loss": -5.8287763595581055, "global_step": 61002, "epoch": 1452} {"train_loss": -5.875799179077148, "global_step": 61003, "epoch": 1452} {"train_loss": -5.877302169799805, "global_step": 61004, "epoch": 1452} {"train_loss": -5.773125648498535, "global_step": 61005, "epoch": 1452} {"train_loss": -5.86112117767334, "global_step": 61006, "epoch": 1452} {"train_loss": -5.933651924133301, "global_step": 61007, "epoch": 1452} {"train_loss": -5.841691017150879, "global_step": 61008, "epoch": 1452} {"train_loss": -5.927588939666748, "global_step": 61009, "epoch": 1452} {"train_loss": -5.87083101272583, "global_step": 61010, "epoch": 1452} {"train_loss": -5.95713472366333, "global_step": 61011, "epoch": 1452} {"train_loss": -5.9807209968566895, "global_step": 61012, "epoch": 1452} {"train_loss": -5.8986053466796875, "global_step": 61013, "epoch": 1452} {"train_loss": -5.9306793212890625, "global_step": 61014, "epoch": 1452} {"train_loss": -5.847988128662109, "global_step": 61015, "epoch": 1452} {"train_loss": -5.972211837768555, "global_step": 61016, "epoch": 1452} {"train_loss": -5.929739952087402, "global_step": 61017, "epoch": 1452} {"train_loss": -5.882246017456055, "global_step": 61018, "epoch": 1452} {"train_loss": -5.874578475952148, "global_step": 61019, "epoch": 1452} {"train_loss": -5.936041355133057, "global_step": 61020, "epoch": 1452} {"train_loss": -5.90857458114624, "global_step": 61021, "epoch": 1452} {"train_loss": -5.843524932861328, "global_step": 61022, "epoch": 1452} {"train_loss": -5.806342601776123, "global_step": 61023, "epoch": 1452} {"train_loss": -5.769298553466797, "global_step": 61024, "epoch": 1452} {"train_loss": -5.882382063638596, "global_step": 61025, "epoch": 1452, "val_loss": 66847.375} {"train_loss": -5.761213779449463, "global_step": 61026, "epoch": 1453} {"train_loss": -5.857504367828369, "global_step": 61027, "epoch": 1453} {"train_loss": -5.839643955230713, "global_step": 61028, "epoch": 1453} {"train_loss": -5.779296875, "global_step": 61029, "epoch": 1453} {"train_loss": -5.8398919105529785, "global_step": 61030, "epoch": 1453} {"train_loss": -5.952342987060547, "global_step": 61031, "epoch": 1453} {"train_loss": -5.936483383178711, "global_step": 61032, "epoch": 1453} {"train_loss": -5.82896614074707, "global_step": 61033, "epoch": 1453} {"train_loss": -5.874682903289795, "global_step": 61034, "epoch": 1453} {"train_loss": -5.892188549041748, "global_step": 61035, "epoch": 1453} {"train_loss": -5.904864311218262, "global_step": 61036, "epoch": 1453} {"train_loss": -5.880152225494385, "global_step": 61037, "epoch": 1453} {"train_loss": -5.899916648864746, "global_step": 61038, "epoch": 1453} {"train_loss": -5.853239059448242, "global_step": 61039, "epoch": 1453} {"train_loss": -5.876047611236572, "global_step": 61040, "epoch": 1453} {"train_loss": -5.934727668762207, "global_step": 61041, "epoch": 1453} {"train_loss": -5.931854724884033, "global_step": 61042, "epoch": 1453} {"train_loss": -5.965264320373535, "global_step": 61043, "epoch": 1453} {"train_loss": -5.986997604370117, "global_step": 61044, "epoch": 1453} {"train_loss": -5.776024341583252, "global_step": 61045, "epoch": 1453} {"train_loss": -5.956307411193848, "global_step": 61046, "epoch": 1453} {"train_loss": -5.788801193237305, "global_step": 61047, "epoch": 1453} {"train_loss": -5.889903545379639, "global_step": 61048, "epoch": 1453} {"train_loss": -5.770755767822266, "global_step": 61049, "epoch": 1453} {"train_loss": -5.878347396850586, "global_step": 61050, "epoch": 1453} {"train_loss": -5.98698616027832, "global_step": 61051, "epoch": 1453} {"train_loss": -5.796338081359863, "global_step": 61052, "epoch": 1453} {"train_loss": -5.803900718688965, "global_step": 61053, "epoch": 1453} {"train_loss": -5.964109420776367, "global_step": 61054, "epoch": 1453} {"train_loss": -5.976773262023926, "global_step": 61055, "epoch": 1453} {"train_loss": -5.953171730041504, "global_step": 61056, "epoch": 1453} {"train_loss": -6.129208087921143, "global_step": 61057, "epoch": 1453} {"train_loss": -5.876893997192383, "global_step": 61058, "epoch": 1453} {"train_loss": -5.990809917449951, "global_step": 61059, "epoch": 1453} {"train_loss": -5.968654632568359, "global_step": 61060, "epoch": 1453} {"train_loss": -5.982346534729004, "global_step": 61061, "epoch": 1453} {"train_loss": -5.9289350509643555, "global_step": 61062, "epoch": 1453} {"train_loss": -5.784625053405762, "global_step": 61063, "epoch": 1453} {"train_loss": -5.883922576904297, "global_step": 61064, "epoch": 1453} {"train_loss": -5.791032791137695, "global_step": 61065, "epoch": 1453} {"train_loss": -5.82636022567749, "global_step": 61066, "epoch": 1453} {"train_loss": -5.894280047643752, "global_step": 61067, "epoch": 1453, "val_loss": 66743.2265625} {"train_loss": -5.830593585968018, "global_step": 61068, "epoch": 1454} {"train_loss": -6.0839338302612305, "global_step": 61069, "epoch": 1454} {"train_loss": -5.887449264526367, "global_step": 61070, "epoch": 1454} {"train_loss": -5.876833915710449, "global_step": 61071, "epoch": 1454} {"train_loss": -5.907011032104492, "global_step": 61072, "epoch": 1454} {"train_loss": -5.9524688720703125, "global_step": 61073, "epoch": 1454} {"train_loss": -5.923300743103027, "global_step": 61074, "epoch": 1454} {"train_loss": -5.998651027679443, "global_step": 61075, "epoch": 1454} {"train_loss": -5.860291481018066, "global_step": 61076, "epoch": 1454} {"train_loss": -5.850993633270264, "global_step": 61077, "epoch": 1454} {"train_loss": -5.85991096496582, "global_step": 61078, "epoch": 1454} {"train_loss": -5.858944892883301, "global_step": 61079, "epoch": 1454} {"train_loss": -5.854696273803711, "global_step": 61080, "epoch": 1454} {"train_loss": -5.972588539123535, "global_step": 61081, "epoch": 1454} {"train_loss": -5.882828712463379, "global_step": 61082, "epoch": 1454} {"train_loss": -5.87656307220459, "global_step": 61083, "epoch": 1454} {"train_loss": -5.877506732940674, "global_step": 61084, "epoch": 1454} {"train_loss": -5.876391410827637, "global_step": 61085, "epoch": 1454} {"train_loss": -5.941183090209961, "global_step": 61086, "epoch": 1454} {"train_loss": -5.909602165222168, "global_step": 61087, "epoch": 1454} {"train_loss": -6.0280046463012695, "global_step": 61088, "epoch": 1454} {"train_loss": -5.939290523529053, "global_step": 61089, "epoch": 1454} {"train_loss": -5.975866794586182, "global_step": 61090, "epoch": 1454} {"train_loss": -5.966809272766113, "global_step": 61091, "epoch": 1454} {"train_loss": -5.916893482208252, "global_step": 61092, "epoch": 1454} {"train_loss": -5.835178375244141, "global_step": 61093, "epoch": 1454} {"train_loss": -5.956275939941406, "global_step": 61094, "epoch": 1454} {"train_loss": -5.87126350402832, "global_step": 61095, "epoch": 1454} {"train_loss": -5.904814720153809, "global_step": 61096, "epoch": 1454} {"train_loss": -5.906891822814941, "global_step": 61097, "epoch": 1454} {"train_loss": -5.924675941467285, "global_step": 61098, "epoch": 1454} {"train_loss": -5.914839744567871, "global_step": 61099, "epoch": 1454} {"train_loss": -5.932888031005859, "global_step": 61100, "epoch": 1454} {"train_loss": -5.943782806396484, "global_step": 61101, "epoch": 1454} {"train_loss": -5.937671661376953, "global_step": 61102, "epoch": 1454} {"train_loss": -5.895147323608398, "global_step": 61103, "epoch": 1454} {"train_loss": -5.967953681945801, "global_step": 61104, "epoch": 1454} {"train_loss": -5.870510101318359, "global_step": 61105, "epoch": 1454} {"train_loss": -5.906682014465332, "global_step": 61106, "epoch": 1454} {"train_loss": -5.788985252380371, "global_step": 61107, "epoch": 1454} {"train_loss": -5.845801830291748, "global_step": 61108, "epoch": 1454} {"train_loss": -5.90713754154387, "global_step": 61109, "epoch": 1454, "val_loss": 66858.0703125} {"train_loss": -5.905642509460449, "global_step": 61110, "epoch": 1455} {"train_loss": -6.012418746948242, "global_step": 61111, "epoch": 1455} {"train_loss": -5.9793829917907715, "global_step": 61112, "epoch": 1455} {"train_loss": -5.993389129638672, "global_step": 61113, "epoch": 1455} {"train_loss": -6.002245903015137, "global_step": 61114, "epoch": 1455} {"train_loss": -5.897655487060547, "global_step": 61115, "epoch": 1455} {"train_loss": -5.858259201049805, "global_step": 61116, "epoch": 1455} {"train_loss": -5.8513503074646, "global_step": 61117, "epoch": 1455} {"train_loss": -5.829317569732666, "global_step": 61118, "epoch": 1455} {"train_loss": -5.981312274932861, "global_step": 61119, "epoch": 1455} {"train_loss": -5.975517272949219, "global_step": 61120, "epoch": 1455} {"train_loss": -5.895470142364502, "global_step": 61121, "epoch": 1455} {"train_loss": -6.025491714477539, "global_step": 61122, "epoch": 1455} {"train_loss": -5.86506462097168, "global_step": 61123, "epoch": 1455} {"train_loss": -5.977172374725342, "global_step": 61124, "epoch": 1455} {"train_loss": -5.965667724609375, "global_step": 61125, "epoch": 1455} {"train_loss": -5.916465759277344, "global_step": 61126, "epoch": 1455} {"train_loss": -5.963255882263184, "global_step": 61127, "epoch": 1455} {"train_loss": -5.831958770751953, "global_step": 61128, "epoch": 1455} {"train_loss": -5.818546295166016, "global_step": 61129, "epoch": 1455} {"train_loss": -5.879822731018066, "global_step": 61130, "epoch": 1455} {"train_loss": -5.932775497436523, "global_step": 61131, "epoch": 1455} {"train_loss": -5.912519454956055, "global_step": 61132, "epoch": 1455} {"train_loss": -5.757146835327148, "global_step": 61133, "epoch": 1455} {"train_loss": -5.844270706176758, "global_step": 61134, "epoch": 1455} {"train_loss": -5.848583221435547, "global_step": 61135, "epoch": 1455} {"train_loss": -5.951366424560547, "global_step": 61136, "epoch": 1455} {"train_loss": -5.702923774719238, "global_step": 61137, "epoch": 1455} {"train_loss": -5.81224250793457, "global_step": 61138, "epoch": 1455} {"train_loss": -5.87860107421875, "global_step": 61139, "epoch": 1455} {"train_loss": -5.84296178817749, "global_step": 61140, "epoch": 1455} {"train_loss": -5.806731224060059, "global_step": 61141, "epoch": 1455} {"train_loss": -5.878757476806641, "global_step": 61142, "epoch": 1455} {"train_loss": -5.815247058868408, "global_step": 61143, "epoch": 1455} {"train_loss": -5.8447370529174805, "global_step": 61144, "epoch": 1455} {"train_loss": -5.945672988891602, "global_step": 61145, "epoch": 1455} {"train_loss": -5.886157989501953, "global_step": 61146, "epoch": 1455} {"train_loss": -5.94709587097168, "global_step": 61147, "epoch": 1455} {"train_loss": -5.8744683265686035, "global_step": 61148, "epoch": 1455} {"train_loss": -5.9928975105285645, "global_step": 61149, "epoch": 1455} {"train_loss": -5.876542091369629, "global_step": 61150, "epoch": 1455} {"train_loss": -5.89773348399571, "global_step": 61151, "epoch": 1455, "val_loss": 67008.6640625} {"train_loss": -5.90498685836792, "global_step": 61152, "epoch": 1456} {"train_loss": -5.921192169189453, "global_step": 61153, "epoch": 1456} {"train_loss": -5.950884819030762, "global_step": 61154, "epoch": 1456} {"train_loss": -5.924073696136475, "global_step": 61155, "epoch": 1456} {"train_loss": -5.843771457672119, "global_step": 61156, "epoch": 1456} {"train_loss": -6.02957820892334, "global_step": 61157, "epoch": 1456} {"train_loss": -5.889406681060791, "global_step": 61158, "epoch": 1456} {"train_loss": -5.764219284057617, "global_step": 61159, "epoch": 1456} {"train_loss": -5.908110618591309, "global_step": 61160, "epoch": 1456} {"train_loss": -5.941217422485352, "global_step": 61161, "epoch": 1456} {"train_loss": -5.936341285705566, "global_step": 61162, "epoch": 1456} {"train_loss": -5.947820663452148, "global_step": 61163, "epoch": 1456} {"train_loss": -5.944788932800293, "global_step": 61164, "epoch": 1456} {"train_loss": -5.93422794342041, "global_step": 61165, "epoch": 1456} {"train_loss": -5.968491077423096, "global_step": 61166, "epoch": 1456} {"train_loss": -5.990676403045654, "global_step": 61167, "epoch": 1456} {"train_loss": -5.84558629989624, "global_step": 61168, "epoch": 1456} {"train_loss": -5.801450729370117, "global_step": 61169, "epoch": 1456} {"train_loss": -5.919279098510742, "global_step": 61170, "epoch": 1456} {"train_loss": -5.8224992752075195, "global_step": 61171, "epoch": 1456} {"train_loss": -5.758316516876221, "global_step": 61172, "epoch": 1456} {"train_loss": -5.9742937088012695, "global_step": 61173, "epoch": 1456} {"train_loss": -5.925124168395996, "global_step": 61174, "epoch": 1456} {"train_loss": -5.897946357727051, "global_step": 61175, "epoch": 1456} {"train_loss": -5.947192192077637, "global_step": 61176, "epoch": 1456} {"train_loss": -5.891530990600586, "global_step": 61177, "epoch": 1456} {"train_loss": -5.877451419830322, "global_step": 61178, "epoch": 1456} {"train_loss": -5.847243309020996, "global_step": 61179, "epoch": 1456} {"train_loss": -6.046145439147949, "global_step": 61180, "epoch": 1456} {"train_loss": -5.913776874542236, "global_step": 61181, "epoch": 1456} {"train_loss": -6.006063461303711, "global_step": 61182, "epoch": 1456} {"train_loss": -5.8869428634643555, "global_step": 61183, "epoch": 1456} {"train_loss": -5.902811050415039, "global_step": 61184, "epoch": 1456} {"train_loss": -5.88638973236084, "global_step": 61185, "epoch": 1456} {"train_loss": -5.947772979736328, "global_step": 61186, "epoch": 1456} {"train_loss": -5.9180450439453125, "global_step": 61187, "epoch": 1456} {"train_loss": -5.866497039794922, "global_step": 61188, "epoch": 1456} {"train_loss": -5.948916435241699, "global_step": 61189, "epoch": 1456} {"train_loss": -5.980417251586914, "global_step": 61190, "epoch": 1456} {"train_loss": -6.027639389038086, "global_step": 61191, "epoch": 1456} {"train_loss": -5.869010925292969, "global_step": 61192, "epoch": 1456} {"train_loss": -5.914273386909848, "global_step": 61193, "epoch": 1456, "val_loss": 66618.984375} {"train_loss": -5.943962097167969, "global_step": 61194, "epoch": 1457} {"train_loss": -5.9518961906433105, "global_step": 61195, "epoch": 1457} {"train_loss": -5.89534330368042, "global_step": 61196, "epoch": 1457} {"train_loss": -5.8381876945495605, "global_step": 61197, "epoch": 1457} {"train_loss": -5.751999855041504, "global_step": 61198, "epoch": 1457} {"train_loss": -5.963307857513428, "global_step": 61199, "epoch": 1457} {"train_loss": -5.923211097717285, "global_step": 61200, "epoch": 1457} {"train_loss": -5.874914169311523, "global_step": 61201, "epoch": 1457} {"train_loss": -5.905463218688965, "global_step": 61202, "epoch": 1457} {"train_loss": -5.942320346832275, "global_step": 61203, "epoch": 1457} {"train_loss": -5.96330451965332, "global_step": 61204, "epoch": 1457} {"train_loss": -5.894457817077637, "global_step": 61205, "epoch": 1457} {"train_loss": -5.990519046783447, "global_step": 61206, "epoch": 1457} {"train_loss": -5.931163787841797, "global_step": 61207, "epoch": 1457} {"train_loss": -5.875275611877441, "global_step": 61208, "epoch": 1457} {"train_loss": -5.84675407409668, "global_step": 61209, "epoch": 1457} {"train_loss": -5.820575714111328, "global_step": 61210, "epoch": 1457} {"train_loss": -5.9165802001953125, "global_step": 61211, "epoch": 1457} {"train_loss": -5.8750152587890625, "global_step": 61212, "epoch": 1457} {"train_loss": -5.954371452331543, "global_step": 61213, "epoch": 1457} {"train_loss": -5.914341926574707, "global_step": 61214, "epoch": 1457} {"train_loss": -5.883484840393066, "global_step": 61215, "epoch": 1457} {"train_loss": -5.964644432067871, "global_step": 61216, "epoch": 1457} {"train_loss": -5.941213607788086, "global_step": 61217, "epoch": 1457} {"train_loss": -5.979844093322754, "global_step": 61218, "epoch": 1457} {"train_loss": -5.899265766143799, "global_step": 61219, "epoch": 1457} {"train_loss": -5.823795318603516, "global_step": 61220, "epoch": 1457} {"train_loss": -5.895718574523926, "global_step": 61221, "epoch": 1457} {"train_loss": -5.8044114112854, "global_step": 61222, "epoch": 1457} {"train_loss": -5.834530830383301, "global_step": 61223, "epoch": 1457} {"train_loss": -5.990025520324707, "global_step": 61224, "epoch": 1457} {"train_loss": -6.067750930786133, "global_step": 61225, "epoch": 1457} {"train_loss": -5.931800842285156, "global_step": 61226, "epoch": 1457} {"train_loss": -5.922863483428955, "global_step": 61227, "epoch": 1457} {"train_loss": -5.919728755950928, "global_step": 61228, "epoch": 1457} {"train_loss": -5.8707709312438965, "global_step": 61229, "epoch": 1457} {"train_loss": -5.9748921394348145, "global_step": 61230, "epoch": 1457} {"train_loss": -5.917316436767578, "global_step": 61231, "epoch": 1457} {"train_loss": -5.880916595458984, "global_step": 61232, "epoch": 1457} {"train_loss": -5.868195533752441, "global_step": 61233, "epoch": 1457} {"train_loss": -5.819162368774414, "global_step": 61234, "epoch": 1457} {"train_loss": -5.904973699933007, "global_step": 61235, "epoch": 1457, "val_loss": 66987.5} {"train_loss": -5.86564826965332, "global_step": 61236, "epoch": 1458} {"train_loss": -5.981405258178711, "global_step": 61237, "epoch": 1458} {"train_loss": -5.964784622192383, "global_step": 61238, "epoch": 1458} {"train_loss": -5.936161518096924, "global_step": 61239, "epoch": 1458} {"train_loss": -5.941483020782471, "global_step": 61240, "epoch": 1458} {"train_loss": -5.804304122924805, "global_step": 61241, "epoch": 1458} {"train_loss": -5.901615142822266, "global_step": 61242, "epoch": 1458} {"train_loss": -5.852906703948975, "global_step": 61243, "epoch": 1458} {"train_loss": -5.7738118171691895, "global_step": 61244, "epoch": 1458} {"train_loss": -5.909882545471191, "global_step": 61245, "epoch": 1458} {"train_loss": -6.015925407409668, "global_step": 61246, "epoch": 1458} {"train_loss": -5.829375267028809, "global_step": 61247, "epoch": 1458} {"train_loss": -5.955512523651123, "global_step": 61248, "epoch": 1458} {"train_loss": -5.90132999420166, "global_step": 61249, "epoch": 1458} {"train_loss": -5.8864850997924805, "global_step": 61250, "epoch": 1458} {"train_loss": -5.830380916595459, "global_step": 61251, "epoch": 1458} {"train_loss": -5.962411403656006, "global_step": 61252, "epoch": 1458} {"train_loss": -5.79584264755249, "global_step": 61253, "epoch": 1458} {"train_loss": -5.8262858390808105, "global_step": 61254, "epoch": 1458} {"train_loss": -5.858107566833496, "global_step": 61255, "epoch": 1458} {"train_loss": -6.017792224884033, "global_step": 61256, "epoch": 1458} {"train_loss": -5.879145622253418, "global_step": 61257, "epoch": 1458} {"train_loss": -5.874480247497559, "global_step": 61258, "epoch": 1458} {"train_loss": -5.872529983520508, "global_step": 61259, "epoch": 1458} {"train_loss": -5.883982181549072, "global_step": 61260, "epoch": 1458} {"train_loss": -5.823126792907715, "global_step": 61261, "epoch": 1458} {"train_loss": -5.949660301208496, "global_step": 61262, "epoch": 1458} {"train_loss": -5.8755645751953125, "global_step": 61263, "epoch": 1458} {"train_loss": -5.8174943923950195, "global_step": 61264, "epoch": 1458} {"train_loss": -5.987580299377441, "global_step": 61265, "epoch": 1458} {"train_loss": -5.851609706878662, "global_step": 61266, "epoch": 1458} {"train_loss": -5.8970947265625, "global_step": 61267, "epoch": 1458} {"train_loss": -5.974644660949707, "global_step": 61268, "epoch": 1458} {"train_loss": -5.946345329284668, "global_step": 61269, "epoch": 1458} {"train_loss": -5.912801265716553, "global_step": 61270, "epoch": 1458} {"train_loss": -5.819334983825684, "global_step": 61271, "epoch": 1458} {"train_loss": -5.88571834564209, "global_step": 61272, "epoch": 1458} {"train_loss": -5.915951728820801, "global_step": 61273, "epoch": 1458} {"train_loss": -5.851371765136719, "global_step": 61274, "epoch": 1458} {"train_loss": -5.826180934906006, "global_step": 61275, "epoch": 1458} {"train_loss": -5.876574516296387, "global_step": 61276, "epoch": 1458} {"train_loss": -5.891828423454648, "global_step": 61277, "epoch": 1458, "val_loss": 66981.796875} {"train_loss": -5.721914291381836, "global_step": 61278, "epoch": 1459} {"train_loss": -5.930245399475098, "global_step": 61279, "epoch": 1459} {"train_loss": -5.983014106750488, "global_step": 61280, "epoch": 1459} {"train_loss": -5.929725646972656, "global_step": 61281, "epoch": 1459} {"train_loss": -5.819038391113281, "global_step": 61282, "epoch": 1459} {"train_loss": -5.933051109313965, "global_step": 61283, "epoch": 1459} {"train_loss": -5.927392482757568, "global_step": 61284, "epoch": 1459} {"train_loss": -5.926760673522949, "global_step": 61285, "epoch": 1459} {"train_loss": -5.9020891189575195, "global_step": 61286, "epoch": 1459} {"train_loss": -5.923310279846191, "global_step": 61287, "epoch": 1459} {"train_loss": -6.034523010253906, "global_step": 61288, "epoch": 1459} {"train_loss": -5.80291748046875, "global_step": 61289, "epoch": 1459} {"train_loss": -5.979008674621582, "global_step": 61290, "epoch": 1459} {"train_loss": -5.941430568695068, "global_step": 61291, "epoch": 1459} {"train_loss": -5.969980239868164, "global_step": 61292, "epoch": 1459} {"train_loss": -5.952585220336914, "global_step": 61293, "epoch": 1459} {"train_loss": -5.998234748840332, "global_step": 61294, "epoch": 1459} {"train_loss": -5.930930137634277, "global_step": 61295, "epoch": 1459} {"train_loss": -5.874059677124023, "global_step": 61296, "epoch": 1459} {"train_loss": -5.939209938049316, "global_step": 61297, "epoch": 1459} {"train_loss": -5.9217023849487305, "global_step": 61298, "epoch": 1459} {"train_loss": -5.90726375579834, "global_step": 61299, "epoch": 1459} {"train_loss": -5.9048309326171875, "global_step": 61300, "epoch": 1459} {"train_loss": -5.935811996459961, "global_step": 61301, "epoch": 1459} {"train_loss": -5.924666404724121, "global_step": 61302, "epoch": 1459} {"train_loss": -5.82110071182251, "global_step": 61303, "epoch": 1459} {"train_loss": -5.9751691818237305, "global_step": 61304, "epoch": 1459} {"train_loss": -5.918886184692383, "global_step": 61305, "epoch": 1459} {"train_loss": -5.865115165710449, "global_step": 61306, "epoch": 1459} {"train_loss": -5.909587383270264, "global_step": 61307, "epoch": 1459} {"train_loss": -5.8648881912231445, "global_step": 61308, "epoch": 1459} {"train_loss": -5.706818580627441, "global_step": 61309, "epoch": 1459} {"train_loss": -5.802523612976074, "global_step": 61310, "epoch": 1459} {"train_loss": -5.80401611328125, "global_step": 61311, "epoch": 1459} {"train_loss": -5.92508602142334, "global_step": 61312, "epoch": 1459} {"train_loss": -5.839500904083252, "global_step": 61313, "epoch": 1459} {"train_loss": -5.983524799346924, "global_step": 61314, "epoch": 1459} {"train_loss": -5.816340446472168, "global_step": 61315, "epoch": 1459} {"train_loss": -5.829190254211426, "global_step": 61316, "epoch": 1459} {"train_loss": -5.906890392303467, "global_step": 61317, "epoch": 1459} {"train_loss": -5.8651604652404785, "global_step": 61318, "epoch": 1459} {"train_loss": -5.896972906021845, "global_step": 61319, "epoch": 1459, "val_loss": 66946.984375} {"train_loss": -5.660562515258789, "global_step": 61320, "epoch": 1460} {"train_loss": -5.890161991119385, "global_step": 61321, "epoch": 1460} {"train_loss": -5.818028450012207, "global_step": 61322, "epoch": 1460} {"train_loss": -5.733564376831055, "global_step": 61323, "epoch": 1460} {"train_loss": -5.887068748474121, "global_step": 61324, "epoch": 1460} {"train_loss": -5.895761489868164, "global_step": 61325, "epoch": 1460} {"train_loss": -5.958872318267822, "global_step": 61326, "epoch": 1460} {"train_loss": -5.924741744995117, "global_step": 61327, "epoch": 1460} {"train_loss": -5.853145122528076, "global_step": 61328, "epoch": 1460} {"train_loss": -6.0206475257873535, "global_step": 61329, "epoch": 1460} {"train_loss": -5.839992523193359, "global_step": 61330, "epoch": 1460} {"train_loss": -5.976881980895996, "global_step": 61331, "epoch": 1460} {"train_loss": -5.950765609741211, "global_step": 61332, "epoch": 1460} {"train_loss": -5.9236345291137695, "global_step": 61333, "epoch": 1460} {"train_loss": -5.863394737243652, "global_step": 61334, "epoch": 1460} {"train_loss": -5.8840460777282715, "global_step": 61335, "epoch": 1460} {"train_loss": -5.872640609741211, "global_step": 61336, "epoch": 1460} {"train_loss": -5.952653408050537, "global_step": 61337, "epoch": 1460} {"train_loss": -5.914788246154785, "global_step": 61338, "epoch": 1460} {"train_loss": -5.709867477416992, "global_step": 61339, "epoch": 1460} {"train_loss": -5.9076337814331055, "global_step": 61340, "epoch": 1460} {"train_loss": -5.880189895629883, "global_step": 61341, "epoch": 1460} {"train_loss": -5.9623122215271, "global_step": 61342, "epoch": 1460} {"train_loss": -5.895516395568848, "global_step": 61343, "epoch": 1460} {"train_loss": -5.838455677032471, "global_step": 61344, "epoch": 1460} {"train_loss": -5.93356466293335, "global_step": 61345, "epoch": 1460} {"train_loss": -5.916095733642578, "global_step": 61346, "epoch": 1460} {"train_loss": -5.911644458770752, "global_step": 61347, "epoch": 1460} {"train_loss": -5.889425277709961, "global_step": 61348, "epoch": 1460} {"train_loss": -5.973769187927246, "global_step": 61349, "epoch": 1460} {"train_loss": -5.885426044464111, "global_step": 61350, "epoch": 1460} {"train_loss": -5.916402339935303, "global_step": 61351, "epoch": 1460} {"train_loss": -5.879117488861084, "global_step": 61352, "epoch": 1460} {"train_loss": -5.991017818450928, "global_step": 61353, "epoch": 1460} {"train_loss": -5.840388298034668, "global_step": 61354, "epoch": 1460} {"train_loss": -6.003921985626221, "global_step": 61355, "epoch": 1460} {"train_loss": -5.886223793029785, "global_step": 61356, "epoch": 1460} {"train_loss": -5.994253635406494, "global_step": 61357, "epoch": 1460} {"train_loss": -5.756468296051025, "global_step": 61358, "epoch": 1460} {"train_loss": -5.97123384475708, "global_step": 61359, "epoch": 1460} {"train_loss": -5.872171401977539, "global_step": 61360, "epoch": 1460} {"train_loss": -5.896579912730625, "global_step": 61361, "epoch": 1460, "val_loss": 66739.6015625} {"train_loss": -5.903475284576416, "global_step": 61362, "epoch": 1461} {"train_loss": -5.9448747634887695, "global_step": 61363, "epoch": 1461} {"train_loss": -6.028781414031982, "global_step": 61364, "epoch": 1461} {"train_loss": -5.859869003295898, "global_step": 61365, "epoch": 1461} {"train_loss": -5.745711326599121, "global_step": 61366, "epoch": 1461} {"train_loss": -5.922656536102295, "global_step": 61367, "epoch": 1461} {"train_loss": -5.912238121032715, "global_step": 61368, "epoch": 1461} {"train_loss": -5.898560523986816, "global_step": 61369, "epoch": 1461} {"train_loss": -5.906309604644775, "global_step": 61370, "epoch": 1461} {"train_loss": -5.846950054168701, "global_step": 61371, "epoch": 1461} {"train_loss": -5.962482929229736, "global_step": 61372, "epoch": 1461} {"train_loss": -5.831453800201416, "global_step": 61373, "epoch": 1461} {"train_loss": -5.987065315246582, "global_step": 61374, "epoch": 1461} {"train_loss": -5.806081771850586, "global_step": 61375, "epoch": 1461} {"train_loss": -5.891708850860596, "global_step": 61376, "epoch": 1461} {"train_loss": -5.918644905090332, "global_step": 61377, "epoch": 1461} {"train_loss": -5.965147018432617, "global_step": 61378, "epoch": 1461} {"train_loss": -5.898530960083008, "global_step": 61379, "epoch": 1461} {"train_loss": -5.979891777038574, "global_step": 61380, "epoch": 1461} {"train_loss": -5.849255084991455, "global_step": 61381, "epoch": 1461} {"train_loss": -5.793868064880371, "global_step": 61382, "epoch": 1461} {"train_loss": -5.803350448608398, "global_step": 61383, "epoch": 1461} {"train_loss": -5.904543876647949, "global_step": 61384, "epoch": 1461} {"train_loss": -5.881662368774414, "global_step": 61385, "epoch": 1461} {"train_loss": -5.925961017608643, "global_step": 61386, "epoch": 1461} {"train_loss": -5.898815155029297, "global_step": 61387, "epoch": 1461} {"train_loss": -5.876328468322754, "global_step": 61388, "epoch": 1461} {"train_loss": -5.860891819000244, "global_step": 61389, "epoch": 1461} {"train_loss": -5.840147495269775, "global_step": 61390, "epoch": 1461} {"train_loss": -5.877635478973389, "global_step": 61391, "epoch": 1461} {"train_loss": -5.913807392120361, "global_step": 61392, "epoch": 1461} {"train_loss": -5.945054054260254, "global_step": 61393, "epoch": 1461} {"train_loss": -5.8836188316345215, "global_step": 61394, "epoch": 1461} {"train_loss": -5.983288764953613, "global_step": 61395, "epoch": 1461} {"train_loss": -5.906824111938477, "global_step": 61396, "epoch": 1461} {"train_loss": -5.92460823059082, "global_step": 61397, "epoch": 1461} {"train_loss": -5.9109978675842285, "global_step": 61398, "epoch": 1461} {"train_loss": -5.832916259765625, "global_step": 61399, "epoch": 1461} {"train_loss": -5.851563453674316, "global_step": 61400, "epoch": 1461} {"train_loss": -5.813775062561035, "global_step": 61401, "epoch": 1461} {"train_loss": -5.850405693054199, "global_step": 61402, "epoch": 1461} {"train_loss": -5.892609823317755, "global_step": 61403, "epoch": 1461, "val_loss": 67161.171875} {"train_loss": -5.884108543395996, "global_step": 61404, "epoch": 1462} {"train_loss": -5.932546615600586, "global_step": 61405, "epoch": 1462} {"train_loss": -5.865996837615967, "global_step": 61406, "epoch": 1462} {"train_loss": -5.863669395446777, "global_step": 61407, "epoch": 1462} {"train_loss": -5.858182907104492, "global_step": 61408, "epoch": 1462} {"train_loss": -5.78044319152832, "global_step": 61409, "epoch": 1462} {"train_loss": -5.777413845062256, "global_step": 61410, "epoch": 1462} {"train_loss": -5.977010726928711, "global_step": 61411, "epoch": 1462} {"train_loss": -5.796350002288818, "global_step": 61412, "epoch": 1462} {"train_loss": -5.791172027587891, "global_step": 61413, "epoch": 1462} {"train_loss": -5.973919868469238, "global_step": 61414, "epoch": 1462} {"train_loss": -5.92451810836792, "global_step": 61415, "epoch": 1462} {"train_loss": -5.871199607849121, "global_step": 61416, "epoch": 1462} {"train_loss": -6.025285720825195, "global_step": 61417, "epoch": 1462} {"train_loss": -6.045319557189941, "global_step": 61418, "epoch": 1462} {"train_loss": -5.887661933898926, "global_step": 61419, "epoch": 1462} {"train_loss": -5.957225799560547, "global_step": 61420, "epoch": 1462} {"train_loss": -5.914104461669922, "global_step": 61421, "epoch": 1462} {"train_loss": -5.905299186706543, "global_step": 61422, "epoch": 1462} {"train_loss": -5.943819046020508, "global_step": 61423, "epoch": 1462} {"train_loss": -5.895664691925049, "global_step": 61424, "epoch": 1462} {"train_loss": -5.877594947814941, "global_step": 61425, "epoch": 1462} {"train_loss": -5.908426284790039, "global_step": 61426, "epoch": 1462} {"train_loss": -5.779378414154053, "global_step": 61427, "epoch": 1462} {"train_loss": -5.8983964920043945, "global_step": 61428, "epoch": 1462} {"train_loss": -5.875378608703613, "global_step": 61429, "epoch": 1462} {"train_loss": -5.800657272338867, "global_step": 61430, "epoch": 1462} {"train_loss": -6.074209213256836, "global_step": 61431, "epoch": 1462} {"train_loss": -5.901866436004639, "global_step": 61432, "epoch": 1462} {"train_loss": -5.890561103820801, "global_step": 61433, "epoch": 1462} {"train_loss": -5.883904457092285, "global_step": 61434, "epoch": 1462} {"train_loss": -5.962657928466797, "global_step": 61435, "epoch": 1462} {"train_loss": -5.839920997619629, "global_step": 61436, "epoch": 1462} {"train_loss": -5.97026252746582, "global_step": 61437, "epoch": 1462} {"train_loss": -5.983489990234375, "global_step": 61438, "epoch": 1462} {"train_loss": -5.980214595794678, "global_step": 61439, "epoch": 1462} {"train_loss": -5.993128776550293, "global_step": 61440, "epoch": 1462} {"train_loss": -5.891141891479492, "global_step": 61441, "epoch": 1462} {"train_loss": -5.905983924865723, "global_step": 61442, "epoch": 1462} {"train_loss": -5.949617385864258, "global_step": 61443, "epoch": 1462} {"train_loss": -5.8252034187316895, "global_step": 61444, "epoch": 1462} {"train_loss": -5.904129107793172, "global_step": 61445, "epoch": 1462, "val_loss": 66731.1953125} {"train_loss": -5.994374752044678, "global_step": 61446, "epoch": 1463} {"train_loss": -5.901518821716309, "global_step": 61447, "epoch": 1463} {"train_loss": -6.061971664428711, "global_step": 61448, "epoch": 1463} {"train_loss": -5.9172844886779785, "global_step": 61449, "epoch": 1463} {"train_loss": -5.891288757324219, "global_step": 61450, "epoch": 1463} {"train_loss": -5.920651912689209, "global_step": 61451, "epoch": 1463} {"train_loss": -5.994777679443359, "global_step": 61452, "epoch": 1463} {"train_loss": -5.928245544433594, "global_step": 61453, "epoch": 1463} {"train_loss": -5.910346031188965, "global_step": 61454, "epoch": 1463} {"train_loss": -5.9447832107543945, "global_step": 61455, "epoch": 1463} {"train_loss": -5.79382848739624, "global_step": 61456, "epoch": 1463} {"train_loss": -5.851797580718994, "global_step": 61457, "epoch": 1463} {"train_loss": -5.95162296295166, "global_step": 61458, "epoch": 1463} {"train_loss": -5.827210426330566, "global_step": 61459, "epoch": 1463} {"train_loss": -5.972413063049316, "global_step": 61460, "epoch": 1463} {"train_loss": -5.863567352294922, "global_step": 61461, "epoch": 1463} {"train_loss": -5.9055914878845215, "global_step": 61462, "epoch": 1463} {"train_loss": -5.875741004943848, "global_step": 61463, "epoch": 1463} {"train_loss": -5.90419340133667, "global_step": 61464, "epoch": 1463} {"train_loss": -5.96040678024292, "global_step": 61465, "epoch": 1463} {"train_loss": -5.897390365600586, "global_step": 61466, "epoch": 1463} {"train_loss": -5.800729274749756, "global_step": 61467, "epoch": 1463} {"train_loss": -5.833556175231934, "global_step": 61468, "epoch": 1463} {"train_loss": -6.001926422119141, "global_step": 61469, "epoch": 1463} {"train_loss": -5.837973117828369, "global_step": 61470, "epoch": 1463} {"train_loss": -5.926830291748047, "global_step": 61471, "epoch": 1463} {"train_loss": -5.9416632652282715, "global_step": 61472, "epoch": 1463} {"train_loss": -5.924772262573242, "global_step": 61473, "epoch": 1463} {"train_loss": -5.923793792724609, "global_step": 61474, "epoch": 1463} {"train_loss": -5.923157691955566, "global_step": 61475, "epoch": 1463} {"train_loss": -5.8568291664123535, "global_step": 61476, "epoch": 1463} {"train_loss": -5.889847755432129, "global_step": 61477, "epoch": 1463} {"train_loss": -5.8703999519348145, "global_step": 61478, "epoch": 1463} {"train_loss": -5.914214134216309, "global_step": 61479, "epoch": 1463} {"train_loss": -5.900835037231445, "global_step": 61480, "epoch": 1463} {"train_loss": -5.93474817276001, "global_step": 61481, "epoch": 1463} {"train_loss": -5.896753311157227, "global_step": 61482, "epoch": 1463} {"train_loss": -5.92856502532959, "global_step": 61483, "epoch": 1463} {"train_loss": -5.813112258911133, "global_step": 61484, "epoch": 1463} {"train_loss": -5.871702194213867, "global_step": 61485, "epoch": 1463} {"train_loss": -5.975553512573242, "global_step": 61486, "epoch": 1463} {"train_loss": -5.90731406211853, "global_step": 61487, "epoch": 1463, "val_loss": 66874.390625} {"train_loss": -5.999092102050781, "global_step": 61488, "epoch": 1464} {"train_loss": -5.954634666442871, "global_step": 61489, "epoch": 1464} {"train_loss": -5.981159210205078, "global_step": 61490, "epoch": 1464} {"train_loss": -5.930773735046387, "global_step": 61491, "epoch": 1464} {"train_loss": -5.924198627471924, "global_step": 61492, "epoch": 1464} {"train_loss": -5.840540409088135, "global_step": 61493, "epoch": 1464} {"train_loss": -5.950771331787109, "global_step": 61494, "epoch": 1464} {"train_loss": -5.964885711669922, "global_step": 61495, "epoch": 1464} {"train_loss": -5.868808269500732, "global_step": 61496, "epoch": 1464} {"train_loss": -5.940783500671387, "global_step": 61497, "epoch": 1464} {"train_loss": -6.056035041809082, "global_step": 61498, "epoch": 1464} {"train_loss": -5.927435874938965, "global_step": 61499, "epoch": 1464} {"train_loss": -5.987702369689941, "global_step": 61500, "epoch": 1464} {"train_loss": -5.956295967102051, "global_step": 61501, "epoch": 1464} {"train_loss": -5.933388710021973, "global_step": 61502, "epoch": 1464} {"train_loss": -5.892678260803223, "global_step": 61503, "epoch": 1464} {"train_loss": -5.977709770202637, "global_step": 61504, "epoch": 1464} {"train_loss": -5.824483871459961, "global_step": 61505, "epoch": 1464} {"train_loss": -5.937962055206299, "global_step": 61506, "epoch": 1464} {"train_loss": -5.853702545166016, "global_step": 61507, "epoch": 1464} {"train_loss": -5.888820171356201, "global_step": 61508, "epoch": 1464} {"train_loss": -5.865472316741943, "global_step": 61509, "epoch": 1464} {"train_loss": -5.875975608825684, "global_step": 61510, "epoch": 1464} {"train_loss": -5.865531921386719, "global_step": 61511, "epoch": 1464} {"train_loss": -5.878695964813232, "global_step": 61512, "epoch": 1464} {"train_loss": -5.917716026306152, "global_step": 61513, "epoch": 1464} {"train_loss": -5.875212669372559, "global_step": 61514, "epoch": 1464} {"train_loss": -5.882482051849365, "global_step": 61515, "epoch": 1464} {"train_loss": -5.775439262390137, "global_step": 61516, "epoch": 1464} {"train_loss": -5.956518650054932, "global_step": 61517, "epoch": 1464} {"train_loss": -5.933520793914795, "global_step": 61518, "epoch": 1464} {"train_loss": -5.9138336181640625, "global_step": 61519, "epoch": 1464} {"train_loss": -5.9443559646606445, "global_step": 61520, "epoch": 1464} {"train_loss": -5.857972621917725, "global_step": 61521, "epoch": 1464} {"train_loss": -5.8608078956604, "global_step": 61522, "epoch": 1464} {"train_loss": -5.970729827880859, "global_step": 61523, "epoch": 1464} {"train_loss": -5.80224084854126, "global_step": 61524, "epoch": 1464} {"train_loss": -5.828380584716797, "global_step": 61525, "epoch": 1464} {"train_loss": -5.7096848487854, "global_step": 61526, "epoch": 1464} {"train_loss": -5.907934665679932, "global_step": 61527, "epoch": 1464} {"train_loss": -5.795861721038818, "global_step": 61528, "epoch": 1464} {"train_loss": -5.901305130549839, "global_step": 61529, "epoch": 1464, "val_loss": 67151.9453125} {"train_loss": -5.8707780838012695, "global_step": 61530, "epoch": 1465} {"train_loss": -5.929886817932129, "global_step": 61531, "epoch": 1465} {"train_loss": -5.980042457580566, "global_step": 61532, "epoch": 1465} {"train_loss": -5.947131156921387, "global_step": 61533, "epoch": 1465} {"train_loss": -5.88323974609375, "global_step": 61534, "epoch": 1465} {"train_loss": -5.849599361419678, "global_step": 61535, "epoch": 1465} {"train_loss": -5.929512023925781, "global_step": 61536, "epoch": 1465} {"train_loss": -5.788989067077637, "global_step": 61537, "epoch": 1465} {"train_loss": -5.9951324462890625, "global_step": 61538, "epoch": 1465} {"train_loss": -5.891807556152344, "global_step": 61539, "epoch": 1465} {"train_loss": -5.881102561950684, "global_step": 61540, "epoch": 1465} {"train_loss": -6.006814002990723, "global_step": 61541, "epoch": 1465} {"train_loss": -5.9344072341918945, "global_step": 61542, "epoch": 1465} {"train_loss": -5.992968559265137, "global_step": 61543, "epoch": 1465} {"train_loss": -5.910587310791016, "global_step": 61544, "epoch": 1465} {"train_loss": -5.812930107116699, "global_step": 61545, "epoch": 1465} {"train_loss": -5.990179061889648, "global_step": 61546, "epoch": 1465} {"train_loss": -5.912698268890381, "global_step": 61547, "epoch": 1465} {"train_loss": -5.874284744262695, "global_step": 61548, "epoch": 1465} {"train_loss": -5.845654487609863, "global_step": 61549, "epoch": 1465} {"train_loss": -5.870917320251465, "global_step": 61550, "epoch": 1465} {"train_loss": -5.838189125061035, "global_step": 61551, "epoch": 1465} {"train_loss": -5.819215774536133, "global_step": 61552, "epoch": 1465} {"train_loss": -5.812382698059082, "global_step": 61553, "epoch": 1465} {"train_loss": -5.970937728881836, "global_step": 61554, "epoch": 1465} {"train_loss": -6.015320777893066, "global_step": 61555, "epoch": 1465} {"train_loss": -5.901212215423584, "global_step": 61556, "epoch": 1465} {"train_loss": -5.791384220123291, "global_step": 61557, "epoch": 1465} {"train_loss": -5.737332344055176, "global_step": 61558, "epoch": 1465} {"train_loss": -5.771890163421631, "global_step": 61559, "epoch": 1465} {"train_loss": -5.818836688995361, "global_step": 61560, "epoch": 1465} {"train_loss": -5.786528587341309, "global_step": 61561, "epoch": 1465} {"train_loss": -5.8851094245910645, "global_step": 61562, "epoch": 1465} {"train_loss": -5.857639312744141, "global_step": 61563, "epoch": 1465} {"train_loss": -5.901181221008301, "global_step": 61564, "epoch": 1465} {"train_loss": -5.969819068908691, "global_step": 61565, "epoch": 1465} {"train_loss": -5.904388427734375, "global_step": 61566, "epoch": 1465} {"train_loss": -5.928807735443115, "global_step": 61567, "epoch": 1465} {"train_loss": -5.9730963706970215, "global_step": 61568, "epoch": 1465} {"train_loss": -5.871060848236084, "global_step": 61569, "epoch": 1465} {"train_loss": -5.922163009643555, "global_step": 61570, "epoch": 1465} {"train_loss": -5.893452553522019, "global_step": 61571, "epoch": 1465, "val_loss": 67071.71875} {"train_loss": -5.80108642578125, "global_step": 61572, "epoch": 1466} {"train_loss": -5.832090377807617, "global_step": 61573, "epoch": 1466} {"train_loss": -5.685611724853516, "global_step": 61574, "epoch": 1466} {"train_loss": -5.976044654846191, "global_step": 61575, "epoch": 1466} {"train_loss": -5.936110019683838, "global_step": 61576, "epoch": 1466} {"train_loss": -5.884062767028809, "global_step": 61577, "epoch": 1466} {"train_loss": -5.97309684753418, "global_step": 61578, "epoch": 1466} {"train_loss": -5.75383186340332, "global_step": 61579, "epoch": 1466} {"train_loss": -5.751611709594727, "global_step": 61580, "epoch": 1466} {"train_loss": -5.936272621154785, "global_step": 61581, "epoch": 1466} {"train_loss": -5.821621417999268, "global_step": 61582, "epoch": 1466} {"train_loss": -5.922310829162598, "global_step": 61583, "epoch": 1466} {"train_loss": -5.755337715148926, "global_step": 61584, "epoch": 1466} {"train_loss": -5.84372615814209, "global_step": 61585, "epoch": 1466} {"train_loss": -6.027249336242676, "global_step": 61586, "epoch": 1466} {"train_loss": -5.879734992980957, "global_step": 61587, "epoch": 1466} {"train_loss": -5.941287040710449, "global_step": 61588, "epoch": 1466} {"train_loss": -6.063157081604004, "global_step": 61589, "epoch": 1466} {"train_loss": -5.8438568115234375, "global_step": 61590, "epoch": 1466} {"train_loss": -5.914406776428223, "global_step": 61591, "epoch": 1466} {"train_loss": -5.868165969848633, "global_step": 61592, "epoch": 1466} {"train_loss": -5.884951591491699, "global_step": 61593, "epoch": 1466} {"train_loss": -5.874030113220215, "global_step": 61594, "epoch": 1466} {"train_loss": -5.939345359802246, "global_step": 61595, "epoch": 1466} {"train_loss": -5.909529685974121, "global_step": 61596, "epoch": 1466} {"train_loss": -5.767355442047119, "global_step": 61597, "epoch": 1466} {"train_loss": -5.908648490905762, "global_step": 61598, "epoch": 1466} {"train_loss": -5.9184160232543945, "global_step": 61599, "epoch": 1466} {"train_loss": -5.919171333312988, "global_step": 61600, "epoch": 1466} {"train_loss": -5.827907085418701, "global_step": 61601, "epoch": 1466} {"train_loss": -5.933542251586914, "global_step": 61602, "epoch": 1466} {"train_loss": -5.90369987487793, "global_step": 61603, "epoch": 1466} {"train_loss": -5.944084167480469, "global_step": 61604, "epoch": 1466} {"train_loss": -5.96035099029541, "global_step": 61605, "epoch": 1466} {"train_loss": -5.87055778503418, "global_step": 61606, "epoch": 1466} {"train_loss": -5.922067165374756, "global_step": 61607, "epoch": 1466} {"train_loss": -5.861037731170654, "global_step": 61608, "epoch": 1466} {"train_loss": -5.964316368103027, "global_step": 61609, "epoch": 1466} {"train_loss": -5.767007827758789, "global_step": 61610, "epoch": 1466} {"train_loss": -5.942767143249512, "global_step": 61611, "epoch": 1466} {"train_loss": -5.959173679351807, "global_step": 61612, "epoch": 1466} {"train_loss": -5.885233515784854, "global_step": 61613, "epoch": 1466, "val_loss": 67380.8515625} {"train_loss": -5.981177806854248, "global_step": 61614, "epoch": 1467} {"train_loss": -5.898476600646973, "global_step": 61615, "epoch": 1467} {"train_loss": -5.929787635803223, "global_step": 61616, "epoch": 1467} {"train_loss": -5.8874006271362305, "global_step": 61617, "epoch": 1467} {"train_loss": -5.879307746887207, "global_step": 61618, "epoch": 1467} {"train_loss": -5.817385673522949, "global_step": 61619, "epoch": 1467} {"train_loss": -5.778895378112793, "global_step": 61620, "epoch": 1467} {"train_loss": -5.975080490112305, "global_step": 61621, "epoch": 1467} {"train_loss": -5.947585105895996, "global_step": 61622, "epoch": 1467} {"train_loss": -5.930161952972412, "global_step": 61623, "epoch": 1467} {"train_loss": -5.883559226989746, "global_step": 61624, "epoch": 1467} {"train_loss": -5.998782634735107, "global_step": 61625, "epoch": 1467} {"train_loss": -5.901913166046143, "global_step": 61626, "epoch": 1467} {"train_loss": -5.916787147521973, "global_step": 61627, "epoch": 1467} {"train_loss": -5.951962471008301, "global_step": 61628, "epoch": 1467} {"train_loss": -5.897193908691406, "global_step": 61629, "epoch": 1467} {"train_loss": -5.864315986633301, "global_step": 61630, "epoch": 1467} {"train_loss": -5.857756614685059, "global_step": 61631, "epoch": 1467} {"train_loss": -5.836413383483887, "global_step": 61632, "epoch": 1467} {"train_loss": -6.033009052276611, "global_step": 61633, "epoch": 1467} {"train_loss": -5.895702838897705, "global_step": 61634, "epoch": 1467} {"train_loss": -5.934002876281738, "global_step": 61635, "epoch": 1467} {"train_loss": -5.744162559509277, "global_step": 61636, "epoch": 1467} {"train_loss": -6.015239715576172, "global_step": 61637, "epoch": 1467} {"train_loss": -5.928805351257324, "global_step": 61638, "epoch": 1467} {"train_loss": -6.029849052429199, "global_step": 61639, "epoch": 1467} {"train_loss": -5.857257843017578, "global_step": 61640, "epoch": 1467} {"train_loss": -5.848559379577637, "global_step": 61641, "epoch": 1467} {"train_loss": -5.8895487785339355, "global_step": 61642, "epoch": 1467} {"train_loss": -5.980926513671875, "global_step": 61643, "epoch": 1467} {"train_loss": -5.829944133758545, "global_step": 61644, "epoch": 1467} {"train_loss": -5.872004508972168, "global_step": 61645, "epoch": 1467} {"train_loss": -5.898563385009766, "global_step": 61646, "epoch": 1467} {"train_loss": -5.879655838012695, "global_step": 61647, "epoch": 1467} {"train_loss": -5.911708354949951, "global_step": 61648, "epoch": 1467} {"train_loss": -5.859336853027344, "global_step": 61649, "epoch": 1467} {"train_loss": -5.903999328613281, "global_step": 61650, "epoch": 1467} {"train_loss": -5.900774002075195, "global_step": 61651, "epoch": 1467} {"train_loss": -5.913623809814453, "global_step": 61652, "epoch": 1467} {"train_loss": -5.9649882316589355, "global_step": 61653, "epoch": 1467} {"train_loss": -5.8333258628845215, "global_step": 61654, "epoch": 1467} {"train_loss": -5.903597388948713, "global_step": 61655, "epoch": 1467, "val_loss": 66645.34375} {"train_loss": -5.892800331115723, "global_step": 61656, "epoch": 1468} {"train_loss": -5.875328540802002, "global_step": 61657, "epoch": 1468} {"train_loss": -5.894577980041504, "global_step": 61658, "epoch": 1468} {"train_loss": -5.894955635070801, "global_step": 61659, "epoch": 1468} {"train_loss": -5.855491638183594, "global_step": 61660, "epoch": 1468} {"train_loss": -5.928195953369141, "global_step": 61661, "epoch": 1468} {"train_loss": -5.94805908203125, "global_step": 61662, "epoch": 1468} {"train_loss": -5.79630708694458, "global_step": 61663, "epoch": 1468} {"train_loss": -5.974839210510254, "global_step": 61664, "epoch": 1468} {"train_loss": -6.10577392578125, "global_step": 61665, "epoch": 1468} {"train_loss": -5.887567520141602, "global_step": 61666, "epoch": 1468} {"train_loss": -5.886011123657227, "global_step": 61667, "epoch": 1468} {"train_loss": -5.857484340667725, "global_step": 61668, "epoch": 1468} {"train_loss": -5.998220443725586, "global_step": 61669, "epoch": 1468} {"train_loss": -5.95029354095459, "global_step": 61670, "epoch": 1468} {"train_loss": -5.884704113006592, "global_step": 61671, "epoch": 1468} {"train_loss": -5.842085361480713, "global_step": 61672, "epoch": 1468} {"train_loss": -5.924537658691406, "global_step": 61673, "epoch": 1468} {"train_loss": -5.808920383453369, "global_step": 61674, "epoch": 1468} {"train_loss": -5.858651161193848, "global_step": 61675, "epoch": 1468} {"train_loss": -5.9866156578063965, "global_step": 61676, "epoch": 1468} {"train_loss": -5.844910621643066, "global_step": 61677, "epoch": 1468} {"train_loss": -5.854339599609375, "global_step": 61678, "epoch": 1468} {"train_loss": -5.88651704788208, "global_step": 61679, "epoch": 1468} {"train_loss": -5.861455917358398, "global_step": 61680, "epoch": 1468} {"train_loss": -5.909946918487549, "global_step": 61681, "epoch": 1468} {"train_loss": -5.973972320556641, "global_step": 61682, "epoch": 1468} {"train_loss": -5.893254280090332, "global_step": 61683, "epoch": 1468} {"train_loss": -5.982223987579346, "global_step": 61684, "epoch": 1468} {"train_loss": -5.9690752029418945, "global_step": 61685, "epoch": 1468} {"train_loss": -5.891183853149414, "global_step": 61686, "epoch": 1468} {"train_loss": -5.9859747886657715, "global_step": 61687, "epoch": 1468} {"train_loss": -5.942770004272461, "global_step": 61688, "epoch": 1468} {"train_loss": -5.876370429992676, "global_step": 61689, "epoch": 1468} {"train_loss": -5.741884231567383, "global_step": 61690, "epoch": 1468} {"train_loss": -5.879640102386475, "global_step": 61691, "epoch": 1468} {"train_loss": -5.886862277984619, "global_step": 61692, "epoch": 1468} {"train_loss": -5.9054856300354, "global_step": 61693, "epoch": 1468} {"train_loss": -5.915251731872559, "global_step": 61694, "epoch": 1468} {"train_loss": -5.7981648445129395, "global_step": 61695, "epoch": 1468} {"train_loss": -6.035222053527832, "global_step": 61696, "epoch": 1468} {"train_loss": -5.905296121324811, "global_step": 61697, "epoch": 1468, "val_loss": 66867.5546875} {"train_loss": -5.902764320373535, "global_step": 61698, "epoch": 1469} {"train_loss": -5.946148872375488, "global_step": 61699, "epoch": 1469} {"train_loss": -5.925504207611084, "global_step": 61700, "epoch": 1469} {"train_loss": -5.85971736907959, "global_step": 61701, "epoch": 1469} {"train_loss": -5.805514335632324, "global_step": 61702, "epoch": 1469} {"train_loss": -5.853509902954102, "global_step": 61703, "epoch": 1469} {"train_loss": -5.791144847869873, "global_step": 61704, "epoch": 1469} {"train_loss": -5.846482276916504, "global_step": 61705, "epoch": 1469} {"train_loss": -5.904538154602051, "global_step": 61706, "epoch": 1469} {"train_loss": -5.798221588134766, "global_step": 61707, "epoch": 1469} {"train_loss": -5.848759651184082, "global_step": 61708, "epoch": 1469} {"train_loss": -5.864530563354492, "global_step": 61709, "epoch": 1469} {"train_loss": -5.903154373168945, "global_step": 61710, "epoch": 1469} {"train_loss": -5.903790473937988, "global_step": 61711, "epoch": 1469} {"train_loss": -5.796661376953125, "global_step": 61712, "epoch": 1469} {"train_loss": -5.878439903259277, "global_step": 61713, "epoch": 1469} {"train_loss": -5.755234718322754, "global_step": 61714, "epoch": 1469} {"train_loss": -5.906032562255859, "global_step": 61715, "epoch": 1469} {"train_loss": -5.919992446899414, "global_step": 61716, "epoch": 1469} {"train_loss": -5.7984724044799805, "global_step": 61717, "epoch": 1469} {"train_loss": -5.694328308105469, "global_step": 61718, "epoch": 1469} {"train_loss": -5.929308891296387, "global_step": 61719, "epoch": 1469} {"train_loss": -5.760973930358887, "global_step": 61720, "epoch": 1469} {"train_loss": -5.765667915344238, "global_step": 61721, "epoch": 1469} {"train_loss": -5.867546081542969, "global_step": 61722, "epoch": 1469} {"train_loss": -5.806962966918945, "global_step": 61723, "epoch": 1469} {"train_loss": -5.942127227783203, "global_step": 61724, "epoch": 1469} {"train_loss": -5.9249267578125, "global_step": 61725, "epoch": 1469} {"train_loss": -5.942849159240723, "global_step": 61726, "epoch": 1469} {"train_loss": -5.924775123596191, "global_step": 61727, "epoch": 1469} {"train_loss": -5.97565221786499, "global_step": 61728, "epoch": 1469} {"train_loss": -5.887175559997559, "global_step": 61729, "epoch": 1469} {"train_loss": -5.893835067749023, "global_step": 61730, "epoch": 1469} {"train_loss": -5.828883647918701, "global_step": 61731, "epoch": 1469} {"train_loss": -5.983115196228027, "global_step": 61732, "epoch": 1469} {"train_loss": -5.948742866516113, "global_step": 61733, "epoch": 1469} {"train_loss": -5.9146223068237305, "global_step": 61734, "epoch": 1469} {"train_loss": -6.0311384201049805, "global_step": 61735, "epoch": 1469} {"train_loss": -5.855679035186768, "global_step": 61736, "epoch": 1469} {"train_loss": -5.882246017456055, "global_step": 61737, "epoch": 1469} {"train_loss": -5.9476799964904785, "global_step": 61738, "epoch": 1469} {"train_loss": -5.876969621295021, "global_step": 61739, "epoch": 1469, "val_loss": 66656.6953125} {"train_loss": -5.7755889892578125, "global_step": 61740, "epoch": 1470} {"train_loss": -5.998589515686035, "global_step": 61741, "epoch": 1470} {"train_loss": -5.763436317443848, "global_step": 61742, "epoch": 1470} {"train_loss": -5.8646240234375, "global_step": 61743, "epoch": 1470} {"train_loss": -6.042658805847168, "global_step": 61744, "epoch": 1470} {"train_loss": -5.896304130554199, "global_step": 61745, "epoch": 1470} {"train_loss": -5.838608741760254, "global_step": 61746, "epoch": 1470} {"train_loss": -5.926302909851074, "global_step": 61747, "epoch": 1470} {"train_loss": -6.021049499511719, "global_step": 61748, "epoch": 1470} {"train_loss": -5.969042778015137, "global_step": 61749, "epoch": 1470} {"train_loss": -5.899422645568848, "global_step": 61750, "epoch": 1470} {"train_loss": -5.813785552978516, "global_step": 61751, "epoch": 1470} {"train_loss": -5.931097507476807, "global_step": 61752, "epoch": 1470} {"train_loss": -5.844243049621582, "global_step": 61753, "epoch": 1470} {"train_loss": -5.780405044555664, "global_step": 61754, "epoch": 1470} {"train_loss": -5.907179832458496, "global_step": 61755, "epoch": 1470} {"train_loss": -5.912337779998779, "global_step": 61756, "epoch": 1470} {"train_loss": -5.909898281097412, "global_step": 61757, "epoch": 1470} {"train_loss": -5.915872573852539, "global_step": 61758, "epoch": 1470} {"train_loss": -5.857764720916748, "global_step": 61759, "epoch": 1470} {"train_loss": -6.015606880187988, "global_step": 61760, "epoch": 1470} {"train_loss": -5.900123596191406, "global_step": 61761, "epoch": 1470} {"train_loss": -5.835278511047363, "global_step": 61762, "epoch": 1470} {"train_loss": -5.935271263122559, "global_step": 61763, "epoch": 1470} {"train_loss": -6.037091255187988, "global_step": 61764, "epoch": 1470} {"train_loss": -5.801296710968018, "global_step": 61765, "epoch": 1470} {"train_loss": -5.8812174797058105, "global_step": 61766, "epoch": 1470} {"train_loss": -5.84684944152832, "global_step": 61767, "epoch": 1470} {"train_loss": -5.948387145996094, "global_step": 61768, "epoch": 1470} {"train_loss": -5.915781497955322, "global_step": 61769, "epoch": 1470} {"train_loss": -6.026645660400391, "global_step": 61770, "epoch": 1470} {"train_loss": -5.961102485656738, "global_step": 61771, "epoch": 1470} {"train_loss": -5.901576995849609, "global_step": 61772, "epoch": 1470} {"train_loss": -6.023320198059082, "global_step": 61773, "epoch": 1470} {"train_loss": -5.900371551513672, "global_step": 61774, "epoch": 1470} {"train_loss": -5.9105682373046875, "global_step": 61775, "epoch": 1470} {"train_loss": -5.934327125549316, "global_step": 61776, "epoch": 1470} {"train_loss": -6.012097358703613, "global_step": 61777, "epoch": 1470} {"train_loss": -5.798067092895508, "global_step": 61778, "epoch": 1470} {"train_loss": -5.890100002288818, "global_step": 61779, "epoch": 1470} {"train_loss": -5.921604633331299, "global_step": 61780, "epoch": 1470} {"train_loss": -5.908271403539748, "global_step": 61781, "epoch": 1470, "val_loss": 66933.484375} {"train_loss": -5.941136360168457, "global_step": 61782, "epoch": 1471} {"train_loss": -5.899537086486816, "global_step": 61783, "epoch": 1471} {"train_loss": -5.760039329528809, "global_step": 61784, "epoch": 1471} {"train_loss": -5.898587226867676, "global_step": 61785, "epoch": 1471} {"train_loss": -5.939396381378174, "global_step": 61786, "epoch": 1471} {"train_loss": -5.897378444671631, "global_step": 61787, "epoch": 1471} {"train_loss": -5.968477725982666, "global_step": 61788, "epoch": 1471} {"train_loss": -5.794970989227295, "global_step": 61789, "epoch": 1471} {"train_loss": -5.913450241088867, "global_step": 61790, "epoch": 1471} {"train_loss": -5.890868186950684, "global_step": 61791, "epoch": 1471} {"train_loss": -5.94533634185791, "global_step": 61792, "epoch": 1471} {"train_loss": -5.88049840927124, "global_step": 61793, "epoch": 1471} {"train_loss": -6.0371928215026855, "global_step": 61794, "epoch": 1471} {"train_loss": -5.891644477844238, "global_step": 61795, "epoch": 1471} {"train_loss": -5.8875274658203125, "global_step": 61796, "epoch": 1471} {"train_loss": -5.954504013061523, "global_step": 61797, "epoch": 1471} {"train_loss": -5.831437110900879, "global_step": 61798, "epoch": 1471} {"train_loss": -5.890980243682861, "global_step": 61799, "epoch": 1471} {"train_loss": -5.865520477294922, "global_step": 61800, "epoch": 1471} {"train_loss": -6.0058112144470215, "global_step": 61801, "epoch": 1471} {"train_loss": -5.862332820892334, "global_step": 61802, "epoch": 1471} {"train_loss": -5.890411376953125, "global_step": 61803, "epoch": 1471} {"train_loss": -5.904433250427246, "global_step": 61804, "epoch": 1471} {"train_loss": -5.846301078796387, "global_step": 61805, "epoch": 1471} {"train_loss": -5.763636112213135, "global_step": 61806, "epoch": 1471} {"train_loss": -5.883879661560059, "global_step": 61807, "epoch": 1471} {"train_loss": -5.83616828918457, "global_step": 61808, "epoch": 1471} {"train_loss": -5.92219352722168, "global_step": 61809, "epoch": 1471} {"train_loss": -5.831425666809082, "global_step": 61810, "epoch": 1471} {"train_loss": -5.862147331237793, "global_step": 61811, "epoch": 1471} {"train_loss": -5.899299621582031, "global_step": 61812, "epoch": 1471} {"train_loss": -5.887341499328613, "global_step": 61813, "epoch": 1471} {"train_loss": -5.76497745513916, "global_step": 61814, "epoch": 1471} {"train_loss": -5.912014961242676, "global_step": 61815, "epoch": 1471} {"train_loss": -5.834406852722168, "global_step": 61816, "epoch": 1471} {"train_loss": -5.857022762298584, "global_step": 61817, "epoch": 1471} {"train_loss": -5.7742719650268555, "global_step": 61818, "epoch": 1471} {"train_loss": -5.820208549499512, "global_step": 61819, "epoch": 1471} {"train_loss": -5.791750907897949, "global_step": 61820, "epoch": 1471} {"train_loss": -5.837249755859375, "global_step": 61821, "epoch": 1471} {"train_loss": -5.850606441497803, "global_step": 61822, "epoch": 1471} {"train_loss": -5.8755947181156705, "global_step": 61823, "epoch": 1471, "val_loss": 67016.21875} {"train_loss": -5.930771827697754, "global_step": 61824, "epoch": 1472} {"train_loss": -5.917536735534668, "global_step": 61825, "epoch": 1472} {"train_loss": -5.811168193817139, "global_step": 61826, "epoch": 1472} {"train_loss": -5.960227966308594, "global_step": 61827, "epoch": 1472} {"train_loss": -5.8885040283203125, "global_step": 61828, "epoch": 1472} {"train_loss": -5.91893196105957, "global_step": 61829, "epoch": 1472} {"train_loss": -5.877056121826172, "global_step": 61830, "epoch": 1472} {"train_loss": -6.020994186401367, "global_step": 61831, "epoch": 1472} {"train_loss": -6.070361614227295, "global_step": 61832, "epoch": 1472} {"train_loss": -6.042009353637695, "global_step": 61833, "epoch": 1472} {"train_loss": -5.891537666320801, "global_step": 61834, "epoch": 1472} {"train_loss": -5.995889186859131, "global_step": 61835, "epoch": 1472} {"train_loss": -6.0331268310546875, "global_step": 61836, "epoch": 1472} {"train_loss": -5.836872577667236, "global_step": 61837, "epoch": 1472} {"train_loss": -5.955477714538574, "global_step": 61838, "epoch": 1472} {"train_loss": -5.9362711906433105, "global_step": 61839, "epoch": 1472} {"train_loss": -5.9154558181762695, "global_step": 61840, "epoch": 1472} {"train_loss": -5.932065963745117, "global_step": 61841, "epoch": 1472} {"train_loss": -5.907853603363037, "global_step": 61842, "epoch": 1472} {"train_loss": -5.948278903961182, "global_step": 61843, "epoch": 1472} {"train_loss": -5.735039710998535, "global_step": 61844, "epoch": 1472} {"train_loss": -5.9455976486206055, "global_step": 61845, "epoch": 1472} {"train_loss": -5.986291885375977, "global_step": 61846, "epoch": 1472} {"train_loss": -5.984076499938965, "global_step": 61847, "epoch": 1472} {"train_loss": -5.938756942749023, "global_step": 61848, "epoch": 1472} {"train_loss": -5.972348213195801, "global_step": 61849, "epoch": 1472} {"train_loss": -5.877943992614746, "global_step": 61850, "epoch": 1472} {"train_loss": -5.9221720695495605, "global_step": 61851, "epoch": 1472} {"train_loss": -5.948013782501221, "global_step": 61852, "epoch": 1472} {"train_loss": -5.7443695068359375, "global_step": 61853, "epoch": 1472} {"train_loss": -5.9317731857299805, "global_step": 61854, "epoch": 1472} {"train_loss": -5.974846839904785, "global_step": 61855, "epoch": 1472} {"train_loss": -5.724803924560547, "global_step": 61856, "epoch": 1472} {"train_loss": -5.883687973022461, "global_step": 61857, "epoch": 1472} {"train_loss": -5.965384483337402, "global_step": 61858, "epoch": 1472} {"train_loss": -5.848148345947266, "global_step": 61859, "epoch": 1472} {"train_loss": -5.862860202789307, "global_step": 61860, "epoch": 1472} {"train_loss": -5.799725532531738, "global_step": 61861, "epoch": 1472} {"train_loss": -5.875741958618164, "global_step": 61862, "epoch": 1472} {"train_loss": -5.943442344665527, "global_step": 61863, "epoch": 1472} {"train_loss": -5.721924781799316, "global_step": 61864, "epoch": 1472} {"train_loss": -5.911421957470122, "global_step": 61865, "epoch": 1472, "val_loss": 67225.21875} {"train_loss": -5.748712539672852, "global_step": 61866, "epoch": 1473} {"train_loss": -5.914194107055664, "global_step": 61867, "epoch": 1473} {"train_loss": -5.869503021240234, "global_step": 61868, "epoch": 1473} {"train_loss": -5.987986087799072, "global_step": 61869, "epoch": 1473} {"train_loss": -5.850261688232422, "global_step": 61870, "epoch": 1473} {"train_loss": -5.9581451416015625, "global_step": 61871, "epoch": 1473} {"train_loss": -5.846543312072754, "global_step": 61872, "epoch": 1473} {"train_loss": -5.917115211486816, "global_step": 61873, "epoch": 1473} {"train_loss": -5.814228057861328, "global_step": 61874, "epoch": 1473} {"train_loss": -5.920280456542969, "global_step": 61875, "epoch": 1473} {"train_loss": -5.910894393920898, "global_step": 61876, "epoch": 1473} {"train_loss": -5.932007789611816, "global_step": 61877, "epoch": 1473} {"train_loss": -5.935277938842773, "global_step": 61878, "epoch": 1473} {"train_loss": -5.912724494934082, "global_step": 61879, "epoch": 1473} {"train_loss": -5.968527317047119, "global_step": 61880, "epoch": 1473} {"train_loss": -5.920064926147461, "global_step": 61881, "epoch": 1473} {"train_loss": -5.923773765563965, "global_step": 61882, "epoch": 1473} {"train_loss": -5.927379608154297, "global_step": 61883, "epoch": 1473} {"train_loss": -5.864532470703125, "global_step": 61884, "epoch": 1473} {"train_loss": -5.982783317565918, "global_step": 61885, "epoch": 1473} {"train_loss": -5.7928547859191895, "global_step": 61886, "epoch": 1473} {"train_loss": -5.800625801086426, "global_step": 61887, "epoch": 1473} {"train_loss": -5.831874847412109, "global_step": 61888, "epoch": 1473} {"train_loss": -5.908774375915527, "global_step": 61889, "epoch": 1473} {"train_loss": -5.791722297668457, "global_step": 61890, "epoch": 1473} {"train_loss": -5.758601188659668, "global_step": 61891, "epoch": 1473} {"train_loss": -5.848148822784424, "global_step": 61892, "epoch": 1473} {"train_loss": -5.937577247619629, "global_step": 61893, "epoch": 1473} {"train_loss": -5.929853916168213, "global_step": 61894, "epoch": 1473} {"train_loss": -5.868592262268066, "global_step": 61895, "epoch": 1473} {"train_loss": -5.858497619628906, "global_step": 61896, "epoch": 1473} {"train_loss": -5.9038262367248535, "global_step": 61897, "epoch": 1473} {"train_loss": -5.905411720275879, "global_step": 61898, "epoch": 1473} {"train_loss": -5.992644786834717, "global_step": 61899, "epoch": 1473} {"train_loss": -5.846768379211426, "global_step": 61900, "epoch": 1473} {"train_loss": -6.053325653076172, "global_step": 61901, "epoch": 1473} {"train_loss": -5.911757946014404, "global_step": 61902, "epoch": 1473} {"train_loss": -5.839725017547607, "global_step": 61903, "epoch": 1473} {"train_loss": -5.950409889221191, "global_step": 61904, "epoch": 1473} {"train_loss": -5.8427958488464355, "global_step": 61905, "epoch": 1473} {"train_loss": -5.865595817565918, "global_step": 61906, "epoch": 1473} {"train_loss": -5.889401390438988, "global_step": 61907, "epoch": 1473, "val_loss": 66990.9921875} {"train_loss": -5.86419677734375, "global_step": 61908, "epoch": 1474} {"train_loss": -5.907665252685547, "global_step": 61909, "epoch": 1474} {"train_loss": -5.760679244995117, "global_step": 61910, "epoch": 1474} {"train_loss": -5.912213325500488, "global_step": 61911, "epoch": 1474} {"train_loss": -5.960591793060303, "global_step": 61912, "epoch": 1474} {"train_loss": -5.870721817016602, "global_step": 61913, "epoch": 1474} {"train_loss": -5.90987491607666, "global_step": 61914, "epoch": 1474} {"train_loss": -5.939449310302734, "global_step": 61915, "epoch": 1474} {"train_loss": -5.895930290222168, "global_step": 61916, "epoch": 1474} {"train_loss": -5.869144439697266, "global_step": 61917, "epoch": 1474} {"train_loss": -5.973955154418945, "global_step": 61918, "epoch": 1474} {"train_loss": -5.9912333488464355, "global_step": 61919, "epoch": 1474} {"train_loss": -5.901337623596191, "global_step": 61920, "epoch": 1474} {"train_loss": -5.800196170806885, "global_step": 61921, "epoch": 1474} {"train_loss": -5.8539323806762695, "global_step": 61922, "epoch": 1474} {"train_loss": -5.896696090698242, "global_step": 61923, "epoch": 1474} {"train_loss": -5.98658561706543, "global_step": 61924, "epoch": 1474} {"train_loss": -5.94472074508667, "global_step": 61925, "epoch": 1474} {"train_loss": -6.0234880447387695, "global_step": 61926, "epoch": 1474} {"train_loss": -5.956445693969727, "global_step": 61927, "epoch": 1474} {"train_loss": -6.083042621612549, "global_step": 61928, "epoch": 1474} {"train_loss": -5.958803653717041, "global_step": 61929, "epoch": 1474} {"train_loss": -5.965180397033691, "global_step": 61930, "epoch": 1474} {"train_loss": -5.952308654785156, "global_step": 61931, "epoch": 1474} {"train_loss": -5.82431173324585, "global_step": 61932, "epoch": 1474} {"train_loss": -5.956563472747803, "global_step": 61933, "epoch": 1474} {"train_loss": -5.865647315979004, "global_step": 61934, "epoch": 1474} {"train_loss": -5.865620136260986, "global_step": 61935, "epoch": 1474} {"train_loss": -5.98681640625, "global_step": 61936, "epoch": 1474} {"train_loss": -5.954760551452637, "global_step": 61937, "epoch": 1474} {"train_loss": -6.005885124206543, "global_step": 61938, "epoch": 1474} {"train_loss": -5.866119384765625, "global_step": 61939, "epoch": 1474} {"train_loss": -5.9381184577941895, "global_step": 61940, "epoch": 1474} {"train_loss": -5.770586967468262, "global_step": 61941, "epoch": 1474} {"train_loss": -5.807126045227051, "global_step": 61942, "epoch": 1474} {"train_loss": -5.787846565246582, "global_step": 61943, "epoch": 1474} {"train_loss": -5.883298873901367, "global_step": 61944, "epoch": 1474} {"train_loss": -5.912176609039307, "global_step": 61945, "epoch": 1474} {"train_loss": -5.804074287414551, "global_step": 61946, "epoch": 1474} {"train_loss": -5.849617958068848, "global_step": 61947, "epoch": 1474} {"train_loss": -5.932710647583008, "global_step": 61948, "epoch": 1474} {"train_loss": -5.906867049989247, "global_step": 61949, "epoch": 1474, "val_loss": 66856.3125} {"train_loss": -5.80841064453125, "global_step": 61950, "epoch": 1475} {"train_loss": -5.907026767730713, "global_step": 61951, "epoch": 1475} {"train_loss": -5.908612251281738, "global_step": 61952, "epoch": 1475} {"train_loss": -5.8062262535095215, "global_step": 61953, "epoch": 1475} {"train_loss": -5.918603897094727, "global_step": 61954, "epoch": 1475} {"train_loss": -5.8734450340271, "global_step": 61955, "epoch": 1475} {"train_loss": -5.813979148864746, "global_step": 61956, "epoch": 1475} {"train_loss": -6.027802467346191, "global_step": 61957, "epoch": 1475} {"train_loss": -5.824899196624756, "global_step": 61958, "epoch": 1475} {"train_loss": -5.960075378417969, "global_step": 61959, "epoch": 1475} {"train_loss": -5.889735221862793, "global_step": 61960, "epoch": 1475} {"train_loss": -5.896930694580078, "global_step": 61961, "epoch": 1475} {"train_loss": -5.846302032470703, "global_step": 61962, "epoch": 1475} {"train_loss": -5.8704681396484375, "global_step": 61963, "epoch": 1475} {"train_loss": -5.875251293182373, "global_step": 61964, "epoch": 1475} {"train_loss": -5.949416160583496, "global_step": 61965, "epoch": 1475} {"train_loss": -5.967006206512451, "global_step": 61966, "epoch": 1475} {"train_loss": -5.941544532775879, "global_step": 61967, "epoch": 1475} {"train_loss": -5.867766857147217, "global_step": 61968, "epoch": 1475} {"train_loss": -5.943633079528809, "global_step": 61969, "epoch": 1475} {"train_loss": -5.845700263977051, "global_step": 61970, "epoch": 1475} {"train_loss": -5.9242424964904785, "global_step": 61971, "epoch": 1475} {"train_loss": -5.8514814376831055, "global_step": 61972, "epoch": 1475} {"train_loss": -5.906991958618164, "global_step": 61973, "epoch": 1475} {"train_loss": -5.971736431121826, "global_step": 61974, "epoch": 1475} {"train_loss": -5.8665690422058105, "global_step": 61975, "epoch": 1475} {"train_loss": -6.073324203491211, "global_step": 61976, "epoch": 1475} {"train_loss": -5.970584869384766, "global_step": 61977, "epoch": 1475} {"train_loss": -5.996744155883789, "global_step": 61978, "epoch": 1475} {"train_loss": -6.011738300323486, "global_step": 61979, "epoch": 1475} {"train_loss": -6.0235419273376465, "global_step": 61980, "epoch": 1475} {"train_loss": -5.779601097106934, "global_step": 61981, "epoch": 1475} {"train_loss": -5.9973883628845215, "global_step": 61982, "epoch": 1475} {"train_loss": -5.914674758911133, "global_step": 61983, "epoch": 1475} {"train_loss": -5.968265533447266, "global_step": 61984, "epoch": 1475} {"train_loss": -5.905031681060791, "global_step": 61985, "epoch": 1475} {"train_loss": -6.03223180770874, "global_step": 61986, "epoch": 1475} {"train_loss": -6.032659530639648, "global_step": 61987, "epoch": 1475} {"train_loss": -5.966475009918213, "global_step": 61988, "epoch": 1475} {"train_loss": -6.0651092529296875, "global_step": 61989, "epoch": 1475} {"train_loss": -6.006839752197266, "global_step": 61990, "epoch": 1475} {"train_loss": -5.925970406759353, "global_step": 61991, "epoch": 1475, "val_loss": 66963.3515625} {"train_loss": -5.955491542816162, "global_step": 61992, "epoch": 1476} {"train_loss": -5.8360395431518555, "global_step": 61993, "epoch": 1476} {"train_loss": -5.871608734130859, "global_step": 61994, "epoch": 1476} {"train_loss": -5.834766864776611, "global_step": 61995, "epoch": 1476} {"train_loss": -6.024409294128418, "global_step": 61996, "epoch": 1476} {"train_loss": -6.022526741027832, "global_step": 61997, "epoch": 1476} {"train_loss": -5.97779655456543, "global_step": 61998, "epoch": 1476} {"train_loss": -5.886356353759766, "global_step": 61999, "epoch": 1476} {"train_loss": -5.956973075866699, "global_step": 62000, "epoch": 1476} {"train_loss": -5.910883903503418, "global_step": 62001, "epoch": 1476} {"train_loss": -6.0020904541015625, "global_step": 62002, "epoch": 1476} {"train_loss": -5.9503173828125, "global_step": 62003, "epoch": 1476} {"train_loss": -5.863551139831543, "global_step": 62004, "epoch": 1476} {"train_loss": -5.854256629943848, "global_step": 62005, "epoch": 1476} {"train_loss": -5.839971542358398, "global_step": 62006, "epoch": 1476} {"train_loss": -6.001447677612305, "global_step": 62007, "epoch": 1476} {"train_loss": -5.910740852355957, "global_step": 62008, "epoch": 1476} {"train_loss": -5.808952331542969, "global_step": 62009, "epoch": 1476} {"train_loss": -5.938354969024658, "global_step": 62010, "epoch": 1476} {"train_loss": -5.9007954597473145, "global_step": 62011, "epoch": 1476} {"train_loss": -5.938969612121582, "global_step": 62012, "epoch": 1476} {"train_loss": -5.924845218658447, "global_step": 62013, "epoch": 1476} {"train_loss": -5.978831768035889, "global_step": 62014, "epoch": 1476} {"train_loss": -5.931942939758301, "global_step": 62015, "epoch": 1476} {"train_loss": -5.832983016967773, "global_step": 62016, "epoch": 1476} {"train_loss": -5.843644142150879, "global_step": 62017, "epoch": 1476} {"train_loss": -5.914044380187988, "global_step": 62018, "epoch": 1476} {"train_loss": -5.739511489868164, "global_step": 62019, "epoch": 1476} {"train_loss": -5.985834121704102, "global_step": 62020, "epoch": 1476} {"train_loss": -5.814312934875488, "global_step": 62021, "epoch": 1476} {"train_loss": -5.898836135864258, "global_step": 62022, "epoch": 1476} {"train_loss": -5.818075180053711, "global_step": 62023, "epoch": 1476} {"train_loss": -5.932828426361084, "global_step": 62024, "epoch": 1476} {"train_loss": -5.883631706237793, "global_step": 62025, "epoch": 1476} {"train_loss": -5.868732929229736, "global_step": 62026, "epoch": 1476} {"train_loss": -5.948436737060547, "global_step": 62027, "epoch": 1476} {"train_loss": -5.907435417175293, "global_step": 62028, "epoch": 1476} {"train_loss": -5.84527587890625, "global_step": 62029, "epoch": 1476} {"train_loss": -5.857525825500488, "global_step": 62030, "epoch": 1476} {"train_loss": -5.95203971862793, "global_step": 62031, "epoch": 1476} {"train_loss": -5.750988483428955, "global_step": 62032, "epoch": 1476} {"train_loss": -5.900536798295521, "global_step": 62033, "epoch": 1476, "val_loss": 66953.859375} {"train_loss": -5.8444366455078125, "global_step": 62034, "epoch": 1477} {"train_loss": -5.86383581161499, "global_step": 62035, "epoch": 1477} {"train_loss": -5.90621280670166, "global_step": 62036, "epoch": 1477} {"train_loss": -5.9727091789245605, "global_step": 62037, "epoch": 1477} {"train_loss": -5.949213027954102, "global_step": 62038, "epoch": 1477} {"train_loss": -5.95965051651001, "global_step": 62039, "epoch": 1477} {"train_loss": -5.839844703674316, "global_step": 62040, "epoch": 1477} {"train_loss": -6.0044474601745605, "global_step": 62041, "epoch": 1477} {"train_loss": -5.950811386108398, "global_step": 62042, "epoch": 1477} {"train_loss": -6.025119781494141, "global_step": 62043, "epoch": 1477} {"train_loss": -5.906582355499268, "global_step": 62044, "epoch": 1477} {"train_loss": -5.857578754425049, "global_step": 62045, "epoch": 1477} {"train_loss": -5.813385963439941, "global_step": 62046, "epoch": 1477} {"train_loss": -5.874035358428955, "global_step": 62047, "epoch": 1477} {"train_loss": -5.93704891204834, "global_step": 62048, "epoch": 1477} {"train_loss": -5.882379531860352, "global_step": 62049, "epoch": 1477} {"train_loss": -5.9086432456970215, "global_step": 62050, "epoch": 1477} {"train_loss": -6.027015686035156, "global_step": 62051, "epoch": 1477} {"train_loss": -5.871243000030518, "global_step": 62052, "epoch": 1477} {"train_loss": -5.781438827514648, "global_step": 62053, "epoch": 1477} {"train_loss": -5.887529373168945, "global_step": 62054, "epoch": 1477} {"train_loss": -5.854548454284668, "global_step": 62055, "epoch": 1477} {"train_loss": -5.951891899108887, "global_step": 62056, "epoch": 1477} {"train_loss": -6.057369232177734, "global_step": 62057, "epoch": 1477} {"train_loss": -5.87504243850708, "global_step": 62058, "epoch": 1477} {"train_loss": -5.90769624710083, "global_step": 62059, "epoch": 1477} {"train_loss": -5.990910530090332, "global_step": 62060, "epoch": 1477} {"train_loss": -5.894885063171387, "global_step": 62061, "epoch": 1477} {"train_loss": -5.81801700592041, "global_step": 62062, "epoch": 1477} {"train_loss": -5.966968536376953, "global_step": 62063, "epoch": 1477} {"train_loss": -5.879570484161377, "global_step": 62064, "epoch": 1477} {"train_loss": -5.983070373535156, "global_step": 62065, "epoch": 1477} {"train_loss": -5.904860019683838, "global_step": 62066, "epoch": 1477} {"train_loss": -5.944741249084473, "global_step": 62067, "epoch": 1477} {"train_loss": -5.871933937072754, "global_step": 62068, "epoch": 1477} {"train_loss": -5.786652088165283, "global_step": 62069, "epoch": 1477} {"train_loss": -5.803953647613525, "global_step": 62070, "epoch": 1477} {"train_loss": -5.985538482666016, "global_step": 62071, "epoch": 1477} {"train_loss": -5.751281261444092, "global_step": 62072, "epoch": 1477} {"train_loss": -5.833645343780518, "global_step": 62073, "epoch": 1477} {"train_loss": -5.896438121795654, "global_step": 62074, "epoch": 1477} {"train_loss": -5.900186061859131, "global_step": 62075, "epoch": 1477, "val_loss": 67057.4375} {"train_loss": -5.870325088500977, "global_step": 62076, "epoch": 1478} {"train_loss": -5.988697528839111, "global_step": 62077, "epoch": 1478} {"train_loss": -5.961277008056641, "global_step": 62078, "epoch": 1478} {"train_loss": -5.958176612854004, "global_step": 62079, "epoch": 1478} {"train_loss": -5.967558860778809, "global_step": 62080, "epoch": 1478} {"train_loss": -5.89016056060791, "global_step": 62081, "epoch": 1478} {"train_loss": -5.988515853881836, "global_step": 62082, "epoch": 1478} {"train_loss": -5.965044975280762, "global_step": 62083, "epoch": 1478} {"train_loss": -5.888542175292969, "global_step": 62084, "epoch": 1478} {"train_loss": -5.870938777923584, "global_step": 62085, "epoch": 1478} {"train_loss": -5.826350212097168, "global_step": 62086, "epoch": 1478} {"train_loss": -5.844207286834717, "global_step": 62087, "epoch": 1478} {"train_loss": -5.872394561767578, "global_step": 62088, "epoch": 1478} {"train_loss": -5.801718711853027, "global_step": 62089, "epoch": 1478} {"train_loss": -5.851429462432861, "global_step": 62090, "epoch": 1478} {"train_loss": -5.902222633361816, "global_step": 62091, "epoch": 1478} {"train_loss": -5.971989631652832, "global_step": 62092, "epoch": 1478} {"train_loss": -5.934456825256348, "global_step": 62093, "epoch": 1478} {"train_loss": -5.916840553283691, "global_step": 62094, "epoch": 1478} {"train_loss": -5.92909049987793, "global_step": 62095, "epoch": 1478} {"train_loss": -5.8346662521362305, "global_step": 62096, "epoch": 1478} {"train_loss": -5.97305965423584, "global_step": 62097, "epoch": 1478} {"train_loss": -5.960583686828613, "global_step": 62098, "epoch": 1478} {"train_loss": -5.909755706787109, "global_step": 62099, "epoch": 1478} {"train_loss": -5.943484306335449, "global_step": 62100, "epoch": 1478} {"train_loss": -5.888341903686523, "global_step": 62101, "epoch": 1478} {"train_loss": -5.903595447540283, "global_step": 62102, "epoch": 1478} {"train_loss": -5.774443626403809, "global_step": 62103, "epoch": 1478} {"train_loss": -5.921802043914795, "global_step": 62104, "epoch": 1478} {"train_loss": -5.859101295471191, "global_step": 62105, "epoch": 1478} {"train_loss": -5.99045991897583, "global_step": 62106, "epoch": 1478} {"train_loss": -6.01576042175293, "global_step": 62107, "epoch": 1478} {"train_loss": -5.829179286956787, "global_step": 62108, "epoch": 1478} {"train_loss": -5.995656967163086, "global_step": 62109, "epoch": 1478} {"train_loss": -6.006279945373535, "global_step": 62110, "epoch": 1478} {"train_loss": -6.036310195922852, "global_step": 62111, "epoch": 1478} {"train_loss": -5.922801971435547, "global_step": 62112, "epoch": 1478} {"train_loss": -6.020317554473877, "global_step": 62113, "epoch": 1478} {"train_loss": -5.966533660888672, "global_step": 62114, "epoch": 1478} {"train_loss": -5.964434623718262, "global_step": 62115, "epoch": 1478} {"train_loss": -5.864746570587158, "global_step": 62116, "epoch": 1478} {"train_loss": -5.9225043682825, "global_step": 62117, "epoch": 1478, "val_loss": 66810.421875} {"train_loss": -5.946699142456055, "global_step": 62118, "epoch": 1479} {"train_loss": -5.964075565338135, "global_step": 62119, "epoch": 1479} {"train_loss": -6.017043590545654, "global_step": 62120, "epoch": 1479} {"train_loss": -5.879289150238037, "global_step": 62121, "epoch": 1479} {"train_loss": -5.975457191467285, "global_step": 62122, "epoch": 1479} {"train_loss": -5.9093828201293945, "global_step": 62123, "epoch": 1479} {"train_loss": -5.948771953582764, "global_step": 62124, "epoch": 1479} {"train_loss": -6.045478820800781, "global_step": 62125, "epoch": 1479} {"train_loss": -6.033655643463135, "global_step": 62126, "epoch": 1479} {"train_loss": -5.8814544677734375, "global_step": 62127, "epoch": 1479} {"train_loss": -5.876991271972656, "global_step": 62128, "epoch": 1479} {"train_loss": -5.852840423583984, "global_step": 62129, "epoch": 1479} {"train_loss": -5.86976957321167, "global_step": 62130, "epoch": 1479} {"train_loss": -5.852965831756592, "global_step": 62131, "epoch": 1479} {"train_loss": -5.925537109375, "global_step": 62132, "epoch": 1479} {"train_loss": -6.0298943519592285, "global_step": 62133, "epoch": 1479} {"train_loss": -5.91098690032959, "global_step": 62134, "epoch": 1479} {"train_loss": -5.712749004364014, "global_step": 62135, "epoch": 1479} {"train_loss": -5.9077534675598145, "global_step": 62136, "epoch": 1479} {"train_loss": -6.024389266967773, "global_step": 62137, "epoch": 1479} {"train_loss": -6.021687030792236, "global_step": 62138, "epoch": 1479} {"train_loss": -5.793993949890137, "global_step": 62139, "epoch": 1479} {"train_loss": -5.863363265991211, "global_step": 62140, "epoch": 1479} {"train_loss": -5.947423934936523, "global_step": 62141, "epoch": 1479} {"train_loss": -5.820734977722168, "global_step": 62142, "epoch": 1479} {"train_loss": -5.936276912689209, "global_step": 62143, "epoch": 1479} {"train_loss": -5.816442489624023, "global_step": 62144, "epoch": 1479} {"train_loss": -5.830015182495117, "global_step": 62145, "epoch": 1479} {"train_loss": -5.970293998718262, "global_step": 62146, "epoch": 1479} {"train_loss": -5.897047996520996, "global_step": 62147, "epoch": 1479} {"train_loss": -5.9540910720825195, "global_step": 62148, "epoch": 1479} {"train_loss": -5.823299884796143, "global_step": 62149, "epoch": 1479} {"train_loss": -5.903983116149902, "global_step": 62150, "epoch": 1479} {"train_loss": -5.966255187988281, "global_step": 62151, "epoch": 1479} {"train_loss": -5.963840484619141, "global_step": 62152, "epoch": 1479} {"train_loss": -5.853034496307373, "global_step": 62153, "epoch": 1479} {"train_loss": -5.937610626220703, "global_step": 62154, "epoch": 1479} {"train_loss": -5.881318092346191, "global_step": 62155, "epoch": 1479} {"train_loss": -5.95348596572876, "global_step": 62156, "epoch": 1479} {"train_loss": -5.963678359985352, "global_step": 62157, "epoch": 1479} {"train_loss": -5.915771961212158, "global_step": 62158, "epoch": 1479} {"train_loss": -5.9198975676581975, "global_step": 62159, "epoch": 1479, "val_loss": 66866.890625} {"train_loss": -5.896734714508057, "global_step": 62160, "epoch": 1480} {"train_loss": -5.81214714050293, "global_step": 62161, "epoch": 1480} {"train_loss": -5.838306903839111, "global_step": 62162, "epoch": 1480} {"train_loss": -5.9980268478393555, "global_step": 62163, "epoch": 1480} {"train_loss": -5.856723785400391, "global_step": 62164, "epoch": 1480} {"train_loss": -5.9106645584106445, "global_step": 62165, "epoch": 1480} {"train_loss": -5.945060729980469, "global_step": 62166, "epoch": 1480} {"train_loss": -5.899496078491211, "global_step": 62167, "epoch": 1480} {"train_loss": -5.8463544845581055, "global_step": 62168, "epoch": 1480} {"train_loss": -6.039223670959473, "global_step": 62169, "epoch": 1480} {"train_loss": -5.906400680541992, "global_step": 62170, "epoch": 1480} {"train_loss": -6.092173099517822, "global_step": 62171, "epoch": 1480} {"train_loss": -5.966118812561035, "global_step": 62172, "epoch": 1480} {"train_loss": -5.904166221618652, "global_step": 62173, "epoch": 1480} {"train_loss": -5.817934989929199, "global_step": 62174, "epoch": 1480} {"train_loss": -6.077644348144531, "global_step": 62175, "epoch": 1480} {"train_loss": -5.9044294357299805, "global_step": 62176, "epoch": 1480} {"train_loss": -5.776244163513184, "global_step": 62177, "epoch": 1480} {"train_loss": -5.946087837219238, "global_step": 62178, "epoch": 1480} {"train_loss": -5.990848541259766, "global_step": 62179, "epoch": 1480} {"train_loss": -5.885390281677246, "global_step": 62180, "epoch": 1480} {"train_loss": -5.915152549743652, "global_step": 62181, "epoch": 1480} {"train_loss": -5.8193182945251465, "global_step": 62182, "epoch": 1480} {"train_loss": -5.996609687805176, "global_step": 62183, "epoch": 1480} {"train_loss": -5.915788173675537, "global_step": 62184, "epoch": 1480} {"train_loss": -5.898406982421875, "global_step": 62185, "epoch": 1480} {"train_loss": -5.929424285888672, "global_step": 62186, "epoch": 1480} {"train_loss": -5.754324436187744, "global_step": 62187, "epoch": 1480} {"train_loss": -5.833245277404785, "global_step": 62188, "epoch": 1480} {"train_loss": -5.951719284057617, "global_step": 62189, "epoch": 1480} {"train_loss": -5.857194900512695, "global_step": 62190, "epoch": 1480} {"train_loss": -5.995987892150879, "global_step": 62191, "epoch": 1480} {"train_loss": -5.946252822875977, "global_step": 62192, "epoch": 1480} {"train_loss": -5.8487982749938965, "global_step": 62193, "epoch": 1480} {"train_loss": -5.975089073181152, "global_step": 62194, "epoch": 1480} {"train_loss": -5.898379802703857, "global_step": 62195, "epoch": 1480} {"train_loss": -5.863418102264404, "global_step": 62196, "epoch": 1480} {"train_loss": -5.86716365814209, "global_step": 62197, "epoch": 1480} {"train_loss": -5.928233623504639, "global_step": 62198, "epoch": 1480} {"train_loss": -5.970527648925781, "global_step": 62199, "epoch": 1480} {"train_loss": -5.864394187927246, "global_step": 62200, "epoch": 1480} {"train_loss": -5.908444608960833, "global_step": 62201, "epoch": 1480, "val_loss": 66866.53125} {"train_loss": -5.838888168334961, "global_step": 62202, "epoch": 1481} {"train_loss": -5.872393608093262, "global_step": 62203, "epoch": 1481} {"train_loss": -6.007779121398926, "global_step": 62204, "epoch": 1481} {"train_loss": -5.868208885192871, "global_step": 62205, "epoch": 1481} {"train_loss": -5.871335029602051, "global_step": 62206, "epoch": 1481} {"train_loss": -5.91193962097168, "global_step": 62207, "epoch": 1481} {"train_loss": -5.975527763366699, "global_step": 62208, "epoch": 1481} {"train_loss": -5.874752998352051, "global_step": 62209, "epoch": 1481} {"train_loss": -5.941303253173828, "global_step": 62210, "epoch": 1481} {"train_loss": -5.85450553894043, "global_step": 62211, "epoch": 1481} {"train_loss": -5.881402969360352, "global_step": 62212, "epoch": 1481} {"train_loss": -5.885318756103516, "global_step": 62213, "epoch": 1481} {"train_loss": -5.940188407897949, "global_step": 62214, "epoch": 1481} {"train_loss": -5.915165901184082, "global_step": 62215, "epoch": 1481} {"train_loss": -5.860045909881592, "global_step": 62216, "epoch": 1481} {"train_loss": -5.982708930969238, "global_step": 62217, "epoch": 1481} {"train_loss": -5.9913177490234375, "global_step": 62218, "epoch": 1481} {"train_loss": -5.858185768127441, "global_step": 62219, "epoch": 1481} {"train_loss": -6.085369110107422, "global_step": 62220, "epoch": 1481} {"train_loss": -5.922013282775879, "global_step": 62221, "epoch": 1481} {"train_loss": -5.952579498291016, "global_step": 62222, "epoch": 1481} {"train_loss": -5.927201271057129, "global_step": 62223, "epoch": 1481} {"train_loss": -5.982934474945068, "global_step": 62224, "epoch": 1481} {"train_loss": -5.974919319152832, "global_step": 62225, "epoch": 1481} {"train_loss": -5.889430999755859, "global_step": 62226, "epoch": 1481} {"train_loss": -5.794512748718262, "global_step": 62227, "epoch": 1481} {"train_loss": -6.046291828155518, "global_step": 62228, "epoch": 1481} {"train_loss": -5.915257453918457, "global_step": 62229, "epoch": 1481} {"train_loss": -5.728838920593262, "global_step": 62230, "epoch": 1481} {"train_loss": -5.875171184539795, "global_step": 62231, "epoch": 1481} {"train_loss": -5.804331302642822, "global_step": 62232, "epoch": 1481} {"train_loss": -5.8958635330200195, "global_step": 62233, "epoch": 1481} {"train_loss": -5.8458638191223145, "global_step": 62234, "epoch": 1481} {"train_loss": -5.841155529022217, "global_step": 62235, "epoch": 1481} {"train_loss": -5.998973846435547, "global_step": 62236, "epoch": 1481} {"train_loss": -5.863568305969238, "global_step": 62237, "epoch": 1481} {"train_loss": -5.869179725646973, "global_step": 62238, "epoch": 1481} {"train_loss": -5.886183261871338, "global_step": 62239, "epoch": 1481} {"train_loss": -5.9283952713012695, "global_step": 62240, "epoch": 1481} {"train_loss": -5.824880599975586, "global_step": 62241, "epoch": 1481} {"train_loss": -5.980206489562988, "global_step": 62242, "epoch": 1481} {"train_loss": -5.906472739719209, "global_step": 62243, "epoch": 1481, "val_loss": 67088.28125} {"train_loss": -5.755019187927246, "global_step": 62244, "epoch": 1482} {"train_loss": -5.964513778686523, "global_step": 62245, "epoch": 1482} {"train_loss": -5.820715427398682, "global_step": 62246, "epoch": 1482} {"train_loss": -5.847179889678955, "global_step": 62247, "epoch": 1482} {"train_loss": -5.92030668258667, "global_step": 62248, "epoch": 1482} {"train_loss": -6.004522323608398, "global_step": 62249, "epoch": 1482} {"train_loss": -5.988895416259766, "global_step": 62250, "epoch": 1482} {"train_loss": -6.01333475112915, "global_step": 62251, "epoch": 1482} {"train_loss": -5.9054975509643555, "global_step": 62252, "epoch": 1482} {"train_loss": -5.886712551116943, "global_step": 62253, "epoch": 1482} {"train_loss": -5.905967712402344, "global_step": 62254, "epoch": 1482} {"train_loss": -5.834194183349609, "global_step": 62255, "epoch": 1482} {"train_loss": -5.847879409790039, "global_step": 62256, "epoch": 1482} {"train_loss": -5.854900360107422, "global_step": 62257, "epoch": 1482} {"train_loss": -5.860176086425781, "global_step": 62258, "epoch": 1482} {"train_loss": -5.813599586486816, "global_step": 62259, "epoch": 1482} {"train_loss": -5.952819347381592, "global_step": 62260, "epoch": 1482} {"train_loss": -5.911678791046143, "global_step": 62261, "epoch": 1482} {"train_loss": -5.798728942871094, "global_step": 62262, "epoch": 1482} {"train_loss": -5.84438419342041, "global_step": 62263, "epoch": 1482} {"train_loss": -5.932520866394043, "global_step": 62264, "epoch": 1482} {"train_loss": -5.8229875564575195, "global_step": 62265, "epoch": 1482} {"train_loss": -5.972575664520264, "global_step": 62266, "epoch": 1482} {"train_loss": -5.969712257385254, "global_step": 62267, "epoch": 1482} {"train_loss": -5.857661724090576, "global_step": 62268, "epoch": 1482} {"train_loss": -5.957703113555908, "global_step": 62269, "epoch": 1482} {"train_loss": -5.795675277709961, "global_step": 62270, "epoch": 1482} {"train_loss": -5.82414436340332, "global_step": 62271, "epoch": 1482} {"train_loss": -5.868744373321533, "global_step": 62272, "epoch": 1482} {"train_loss": -5.912657737731934, "global_step": 62273, "epoch": 1482} {"train_loss": -5.986912250518799, "global_step": 62274, "epoch": 1482} {"train_loss": -5.943207740783691, "global_step": 62275, "epoch": 1482} {"train_loss": -5.884859085083008, "global_step": 62276, "epoch": 1482} {"train_loss": -5.936020851135254, "global_step": 62277, "epoch": 1482} {"train_loss": -5.893689155578613, "global_step": 62278, "epoch": 1482} {"train_loss": -5.801210403442383, "global_step": 62279, "epoch": 1482} {"train_loss": -6.004225730895996, "global_step": 62280, "epoch": 1482} {"train_loss": -5.874389171600342, "global_step": 62281, "epoch": 1482} {"train_loss": -5.917981147766113, "global_step": 62282, "epoch": 1482} {"train_loss": -5.986931800842285, "global_step": 62283, "epoch": 1482} {"train_loss": -5.910176753997803, "global_step": 62284, "epoch": 1482} {"train_loss": -5.897827171144032, "global_step": 62285, "epoch": 1482, "val_loss": 66923.8984375} {"train_loss": -5.813389301300049, "global_step": 62286, "epoch": 1483} {"train_loss": -6.023477554321289, "global_step": 62287, "epoch": 1483} {"train_loss": -5.812671661376953, "global_step": 62288, "epoch": 1483} {"train_loss": -5.854024887084961, "global_step": 62289, "epoch": 1483} {"train_loss": -5.971869468688965, "global_step": 62290, "epoch": 1483} {"train_loss": -5.86824893951416, "global_step": 62291, "epoch": 1483} {"train_loss": -5.748322486877441, "global_step": 62292, "epoch": 1483} {"train_loss": -5.829255104064941, "global_step": 62293, "epoch": 1483} {"train_loss": -5.8118205070495605, "global_step": 62294, "epoch": 1483} {"train_loss": -5.79722785949707, "global_step": 62295, "epoch": 1483} {"train_loss": -5.79628849029541, "global_step": 62296, "epoch": 1483} {"train_loss": -5.8066911697387695, "global_step": 62297, "epoch": 1483} {"train_loss": -5.832634925842285, "global_step": 62298, "epoch": 1483} {"train_loss": -5.832185745239258, "global_step": 62299, "epoch": 1483} {"train_loss": -5.81035041809082, "global_step": 62300, "epoch": 1483} {"train_loss": -5.842422962188721, "global_step": 62301, "epoch": 1483} {"train_loss": -5.866389274597168, "global_step": 62302, "epoch": 1483} {"train_loss": -5.861805438995361, "global_step": 62303, "epoch": 1483} {"train_loss": -6.0140380859375, "global_step": 62304, "epoch": 1483} {"train_loss": -5.753653526306152, "global_step": 62305, "epoch": 1483} {"train_loss": -5.918909072875977, "global_step": 62306, "epoch": 1483} {"train_loss": -5.90328311920166, "global_step": 62307, "epoch": 1483} {"train_loss": -5.919406414031982, "global_step": 62308, "epoch": 1483} {"train_loss": -5.9681315422058105, "global_step": 62309, "epoch": 1483} {"train_loss": -5.860881328582764, "global_step": 62310, "epoch": 1483} {"train_loss": -5.745050430297852, "global_step": 62311, "epoch": 1483} {"train_loss": -5.862785339355469, "global_step": 62312, "epoch": 1483} {"train_loss": -5.852230072021484, "global_step": 62313, "epoch": 1483} {"train_loss": -5.948514938354492, "global_step": 62314, "epoch": 1483} {"train_loss": -5.973705768585205, "global_step": 62315, "epoch": 1483} {"train_loss": -5.864360809326172, "global_step": 62316, "epoch": 1483} {"train_loss": -5.926689147949219, "global_step": 62317, "epoch": 1483} {"train_loss": -5.9244232177734375, "global_step": 62318, "epoch": 1483} {"train_loss": -5.868142604827881, "global_step": 62319, "epoch": 1483} {"train_loss": -6.072623252868652, "global_step": 62320, "epoch": 1483} {"train_loss": -5.89954137802124, "global_step": 62321, "epoch": 1483} {"train_loss": -5.895777225494385, "global_step": 62322, "epoch": 1483} {"train_loss": -5.934118270874023, "global_step": 62323, "epoch": 1483} {"train_loss": -5.923128128051758, "global_step": 62324, "epoch": 1483} {"train_loss": -5.847264766693115, "global_step": 62325, "epoch": 1483} {"train_loss": -5.909401893615723, "global_step": 62326, "epoch": 1483} {"train_loss": -5.876751445588612, "global_step": 62327, "epoch": 1483, "val_loss": 66937.4140625} {"train_loss": -5.921521186828613, "global_step": 62328, "epoch": 1484} {"train_loss": -5.889639377593994, "global_step": 62329, "epoch": 1484} {"train_loss": -6.006166934967041, "global_step": 62330, "epoch": 1484} {"train_loss": -5.934963226318359, "global_step": 62331, "epoch": 1484} {"train_loss": -6.002494812011719, "global_step": 62332, "epoch": 1484} {"train_loss": -5.991007328033447, "global_step": 62333, "epoch": 1484} {"train_loss": -5.94445276260376, "global_step": 62334, "epoch": 1484} {"train_loss": -5.888673305511475, "global_step": 62335, "epoch": 1484} {"train_loss": -5.903792858123779, "global_step": 62336, "epoch": 1484} {"train_loss": -5.860888481140137, "global_step": 62337, "epoch": 1484} {"train_loss": -5.892500877380371, "global_step": 62338, "epoch": 1484} {"train_loss": -6.0594401359558105, "global_step": 62339, "epoch": 1484} {"train_loss": -5.806416988372803, "global_step": 62340, "epoch": 1484} {"train_loss": -5.937196731567383, "global_step": 62341, "epoch": 1484} {"train_loss": -5.86298942565918, "global_step": 62342, "epoch": 1484} {"train_loss": -5.790483474731445, "global_step": 62343, "epoch": 1484} {"train_loss": -5.801894664764404, "global_step": 62344, "epoch": 1484} {"train_loss": -5.8328704833984375, "global_step": 62345, "epoch": 1484} {"train_loss": -5.961855888366699, "global_step": 62346, "epoch": 1484} {"train_loss": -5.850257873535156, "global_step": 62347, "epoch": 1484} {"train_loss": -6.04414701461792, "global_step": 62348, "epoch": 1484} {"train_loss": -5.919013023376465, "global_step": 62349, "epoch": 1484} {"train_loss": -5.928337097167969, "global_step": 62350, "epoch": 1484} {"train_loss": -5.887799263000488, "global_step": 62351, "epoch": 1484} {"train_loss": -5.910613059997559, "global_step": 62352, "epoch": 1484} {"train_loss": -5.914436340332031, "global_step": 62353, "epoch": 1484} {"train_loss": -5.9483489990234375, "global_step": 62354, "epoch": 1484} {"train_loss": -5.944931507110596, "global_step": 62355, "epoch": 1484} {"train_loss": -5.888828277587891, "global_step": 62356, "epoch": 1484} {"train_loss": -5.868143081665039, "global_step": 62357, "epoch": 1484} {"train_loss": -5.847315311431885, "global_step": 62358, "epoch": 1484} {"train_loss": -6.013272285461426, "global_step": 62359, "epoch": 1484} {"train_loss": -5.927703380584717, "global_step": 62360, "epoch": 1484} {"train_loss": -5.794748306274414, "global_step": 62361, "epoch": 1484} {"train_loss": -5.932218551635742, "global_step": 62362, "epoch": 1484} {"train_loss": -5.888152122497559, "global_step": 62363, "epoch": 1484} {"train_loss": -5.813760757446289, "global_step": 62364, "epoch": 1484} {"train_loss": -5.889878273010254, "global_step": 62365, "epoch": 1484} {"train_loss": -5.973920822143555, "global_step": 62366, "epoch": 1484} {"train_loss": -6.023900508880615, "global_step": 62367, "epoch": 1484} {"train_loss": -5.865954399108887, "global_step": 62368, "epoch": 1484} {"train_loss": -5.9127176602681475, "global_step": 62369, "epoch": 1484, "val_loss": 66724.3984375} {"train_loss": -5.747996807098389, "global_step": 62370, "epoch": 1485} {"train_loss": -5.901792526245117, "global_step": 62371, "epoch": 1485} {"train_loss": -5.852392196655273, "global_step": 62372, "epoch": 1485} {"train_loss": -5.954793930053711, "global_step": 62373, "epoch": 1485} {"train_loss": -6.029290199279785, "global_step": 62374, "epoch": 1485} {"train_loss": -5.894219398498535, "global_step": 62375, "epoch": 1485} {"train_loss": -5.956153869628906, "global_step": 62376, "epoch": 1485} {"train_loss": -5.872409343719482, "global_step": 62377, "epoch": 1485} {"train_loss": -5.963300704956055, "global_step": 62378, "epoch": 1485} {"train_loss": -6.00027322769165, "global_step": 62379, "epoch": 1485} {"train_loss": -5.931889533996582, "global_step": 62380, "epoch": 1485} {"train_loss": -5.8487749099731445, "global_step": 62381, "epoch": 1485} {"train_loss": -5.898167610168457, "global_step": 62382, "epoch": 1485} {"train_loss": -5.871826648712158, "global_step": 62383, "epoch": 1485} {"train_loss": -5.941985607147217, "global_step": 62384, "epoch": 1485} {"train_loss": -5.972723484039307, "global_step": 62385, "epoch": 1485} {"train_loss": -6.0084733963012695, "global_step": 62386, "epoch": 1485} {"train_loss": -5.893743515014648, "global_step": 62387, "epoch": 1485} {"train_loss": -5.985767364501953, "global_step": 62388, "epoch": 1485} {"train_loss": -5.920195579528809, "global_step": 62389, "epoch": 1485} {"train_loss": -5.981418132781982, "global_step": 62390, "epoch": 1485} {"train_loss": -5.970035076141357, "global_step": 62391, "epoch": 1485} {"train_loss": -5.943051338195801, "global_step": 62392, "epoch": 1485} {"train_loss": -5.908936023712158, "global_step": 62393, "epoch": 1485} {"train_loss": -6.009392261505127, "global_step": 62394, "epoch": 1485} {"train_loss": -5.887048721313477, "global_step": 62395, "epoch": 1485} {"train_loss": -5.873337745666504, "global_step": 62396, "epoch": 1485} {"train_loss": -5.8705620765686035, "global_step": 62397, "epoch": 1485} {"train_loss": -5.882198333740234, "global_step": 62398, "epoch": 1485} {"train_loss": -5.7691216468811035, "global_step": 62399, "epoch": 1485} {"train_loss": -5.935260772705078, "global_step": 62400, "epoch": 1485} {"train_loss": -5.981828212738037, "global_step": 62401, "epoch": 1485} {"train_loss": -5.939164161682129, "global_step": 62402, "epoch": 1485} {"train_loss": -5.864933490753174, "global_step": 62403, "epoch": 1485} {"train_loss": -5.888516426086426, "global_step": 62404, "epoch": 1485} {"train_loss": -6.005634784698486, "global_step": 62405, "epoch": 1485} {"train_loss": -5.856680870056152, "global_step": 62406, "epoch": 1485} {"train_loss": -5.952919960021973, "global_step": 62407, "epoch": 1485} {"train_loss": -5.958062648773193, "global_step": 62408, "epoch": 1485} {"train_loss": -5.823040962219238, "global_step": 62409, "epoch": 1485} {"train_loss": -5.869410037994385, "global_step": 62410, "epoch": 1485} {"train_loss": -5.918495552880423, "global_step": 62411, "epoch": 1485, "val_loss": 66880.25} {"train_loss": -5.880533218383789, "global_step": 62412, "epoch": 1486} {"train_loss": -5.872576713562012, "global_step": 62413, "epoch": 1486} {"train_loss": -5.941453456878662, "global_step": 62414, "epoch": 1486} {"train_loss": -6.027064323425293, "global_step": 62415, "epoch": 1486} {"train_loss": -6.01849365234375, "global_step": 62416, "epoch": 1486} {"train_loss": -5.916651725769043, "global_step": 62417, "epoch": 1486} {"train_loss": -5.9291181564331055, "global_step": 62418, "epoch": 1486} {"train_loss": -5.944997787475586, "global_step": 62419, "epoch": 1486} {"train_loss": -5.797031402587891, "global_step": 62420, "epoch": 1486} {"train_loss": -5.960579872131348, "global_step": 62421, "epoch": 1486} {"train_loss": -5.799391269683838, "global_step": 62422, "epoch": 1486} {"train_loss": -6.012975692749023, "global_step": 62423, "epoch": 1486} {"train_loss": -5.816361427307129, "global_step": 62424, "epoch": 1486} {"train_loss": -5.867227554321289, "global_step": 62425, "epoch": 1486} {"train_loss": -5.872838973999023, "global_step": 62426, "epoch": 1486} {"train_loss": -5.708883285522461, "global_step": 62427, "epoch": 1486} {"train_loss": -5.89357852935791, "global_step": 62428, "epoch": 1486} {"train_loss": -5.860072135925293, "global_step": 62429, "epoch": 1486} {"train_loss": -5.8522844314575195, "global_step": 62430, "epoch": 1486} {"train_loss": -5.939358234405518, "global_step": 62431, "epoch": 1486} {"train_loss": -5.8594584465026855, "global_step": 62432, "epoch": 1486} {"train_loss": -5.817918300628662, "global_step": 62433, "epoch": 1486} {"train_loss": -5.86226749420166, "global_step": 62434, "epoch": 1486} {"train_loss": -5.838639259338379, "global_step": 62435, "epoch": 1486} {"train_loss": -5.917814254760742, "global_step": 62436, "epoch": 1486} {"train_loss": -5.941644668579102, "global_step": 62437, "epoch": 1486} {"train_loss": -5.748325824737549, "global_step": 62438, "epoch": 1486} {"train_loss": -5.9503889083862305, "global_step": 62439, "epoch": 1486} {"train_loss": -5.71395206451416, "global_step": 62440, "epoch": 1486} {"train_loss": -5.764517307281494, "global_step": 62441, "epoch": 1486} {"train_loss": -5.894626140594482, "global_step": 62442, "epoch": 1486} {"train_loss": -5.944830894470215, "global_step": 62443, "epoch": 1486} {"train_loss": -5.901736259460449, "global_step": 62444, "epoch": 1486} {"train_loss": -5.93789005279541, "global_step": 62445, "epoch": 1486} {"train_loss": -5.834290504455566, "global_step": 62446, "epoch": 1486} {"train_loss": -5.914870738983154, "global_step": 62447, "epoch": 1486} {"train_loss": -5.8745341300964355, "global_step": 62448, "epoch": 1486} {"train_loss": -5.913011074066162, "global_step": 62449, "epoch": 1486} {"train_loss": -5.9022369384765625, "global_step": 62450, "epoch": 1486} {"train_loss": -5.859424591064453, "global_step": 62451, "epoch": 1486} {"train_loss": -5.918127059936523, "global_step": 62452, "epoch": 1486} {"train_loss": -5.885542880921137, "global_step": 62453, "epoch": 1486, "val_loss": 66730.9453125} {"train_loss": -5.983702659606934, "global_step": 62454, "epoch": 1487} {"train_loss": -5.8814849853515625, "global_step": 62455, "epoch": 1487} {"train_loss": -5.995199203491211, "global_step": 62456, "epoch": 1487} {"train_loss": -5.933438301086426, "global_step": 62457, "epoch": 1487} {"train_loss": -5.858860969543457, "global_step": 62458, "epoch": 1487} {"train_loss": -6.009056091308594, "global_step": 62459, "epoch": 1487} {"train_loss": -5.746124267578125, "global_step": 62460, "epoch": 1487} {"train_loss": -5.8386125564575195, "global_step": 62461, "epoch": 1487} {"train_loss": -6.0060038566589355, "global_step": 62462, "epoch": 1487} {"train_loss": -5.872658729553223, "global_step": 62463, "epoch": 1487} {"train_loss": -5.820913314819336, "global_step": 62464, "epoch": 1487} {"train_loss": -5.923484802246094, "global_step": 62465, "epoch": 1487} {"train_loss": -5.941018104553223, "global_step": 62466, "epoch": 1487} {"train_loss": -5.936484336853027, "global_step": 62467, "epoch": 1487} {"train_loss": -5.9487385749816895, "global_step": 62468, "epoch": 1487} {"train_loss": -5.879444122314453, "global_step": 62469, "epoch": 1487} {"train_loss": -5.916500091552734, "global_step": 62470, "epoch": 1487} {"train_loss": -5.917352676391602, "global_step": 62471, "epoch": 1487} {"train_loss": -5.87666654586792, "global_step": 62472, "epoch": 1487} {"train_loss": -5.933271408081055, "global_step": 62473, "epoch": 1487} {"train_loss": -5.940005302429199, "global_step": 62474, "epoch": 1487} {"train_loss": -5.876120090484619, "global_step": 62475, "epoch": 1487} {"train_loss": -5.95842170715332, "global_step": 62476, "epoch": 1487} {"train_loss": -5.941659450531006, "global_step": 62477, "epoch": 1487} {"train_loss": -5.830780506134033, "global_step": 62478, "epoch": 1487} {"train_loss": -5.9984893798828125, "global_step": 62479, "epoch": 1487} {"train_loss": -5.980177879333496, "global_step": 62480, "epoch": 1487} {"train_loss": -5.996269226074219, "global_step": 62481, "epoch": 1487} {"train_loss": -6.027673721313477, "global_step": 62482, "epoch": 1487} {"train_loss": -5.976556777954102, "global_step": 62483, "epoch": 1487} {"train_loss": -5.962426662445068, "global_step": 62484, "epoch": 1487} {"train_loss": -6.01252555847168, "global_step": 62485, "epoch": 1487} {"train_loss": -5.9313507080078125, "global_step": 62486, "epoch": 1487} {"train_loss": -5.869993209838867, "global_step": 62487, "epoch": 1487} {"train_loss": -5.88883113861084, "global_step": 62488, "epoch": 1487} {"train_loss": -5.922396659851074, "global_step": 62489, "epoch": 1487} {"train_loss": -5.731138229370117, "global_step": 62490, "epoch": 1487} {"train_loss": -5.8759660720825195, "global_step": 62491, "epoch": 1487} {"train_loss": -5.924663543701172, "global_step": 62492, "epoch": 1487} {"train_loss": -5.891504287719727, "global_step": 62493, "epoch": 1487} {"train_loss": -5.9848785400390625, "global_step": 62494, "epoch": 1487} {"train_loss": -5.918941145851498, "global_step": 62495, "epoch": 1487, "val_loss": 66849.9921875} {"train_loss": -5.936007022857666, "global_step": 62496, "epoch": 1488} {"train_loss": -5.8950347900390625, "global_step": 62497, "epoch": 1488} {"train_loss": -5.907890319824219, "global_step": 62498, "epoch": 1488} {"train_loss": -5.966126918792725, "global_step": 62499, "epoch": 1488} {"train_loss": -5.948801517486572, "global_step": 62500, "epoch": 1488} {"train_loss": -5.8574748039245605, "global_step": 62501, "epoch": 1488} {"train_loss": -5.90592098236084, "global_step": 62502, "epoch": 1488} {"train_loss": -5.8394269943237305, "global_step": 62503, "epoch": 1488} {"train_loss": -6.035578727722168, "global_step": 62504, "epoch": 1488} {"train_loss": -5.914916038513184, "global_step": 62505, "epoch": 1488} {"train_loss": -5.904546737670898, "global_step": 62506, "epoch": 1488} {"train_loss": -5.853305816650391, "global_step": 62507, "epoch": 1488} {"train_loss": -5.849937915802002, "global_step": 62508, "epoch": 1488} {"train_loss": -5.897883892059326, "global_step": 62509, "epoch": 1488} {"train_loss": -5.810737609863281, "global_step": 62510, "epoch": 1488} {"train_loss": -6.014153480529785, "global_step": 62511, "epoch": 1488} {"train_loss": -5.871425628662109, "global_step": 62512, "epoch": 1488} {"train_loss": -5.864663124084473, "global_step": 62513, "epoch": 1488} {"train_loss": -5.897788047790527, "global_step": 62514, "epoch": 1488} {"train_loss": -5.931265354156494, "global_step": 62515, "epoch": 1488} {"train_loss": -5.984256744384766, "global_step": 62516, "epoch": 1488} {"train_loss": -5.672886848449707, "global_step": 62517, "epoch": 1488} {"train_loss": -5.7738847732543945, "global_step": 62518, "epoch": 1488} {"train_loss": -6.0253190994262695, "global_step": 62519, "epoch": 1488} {"train_loss": -5.804518699645996, "global_step": 62520, "epoch": 1488} {"train_loss": -5.88173770904541, "global_step": 62521, "epoch": 1488} {"train_loss": -5.939141273498535, "global_step": 62522, "epoch": 1488} {"train_loss": -5.86337947845459, "global_step": 62523, "epoch": 1488} {"train_loss": -5.893780708312988, "global_step": 62524, "epoch": 1488} {"train_loss": -5.649070739746094, "global_step": 62525, "epoch": 1488} {"train_loss": -5.980537414550781, "global_step": 62526, "epoch": 1488} {"train_loss": -5.873401641845703, "global_step": 62527, "epoch": 1488} {"train_loss": -5.871100425720215, "global_step": 62528, "epoch": 1488} {"train_loss": -5.846444129943848, "global_step": 62529, "epoch": 1488} {"train_loss": -5.716652870178223, "global_step": 62530, "epoch": 1488} {"train_loss": -6.010514259338379, "global_step": 62531, "epoch": 1488} {"train_loss": -5.837368965148926, "global_step": 62532, "epoch": 1488} {"train_loss": -5.871538162231445, "global_step": 62533, "epoch": 1488} {"train_loss": -5.886574745178223, "global_step": 62534, "epoch": 1488} {"train_loss": -5.920748710632324, "global_step": 62535, "epoch": 1488} {"train_loss": -5.933808326721191, "global_step": 62536, "epoch": 1488} {"train_loss": -5.886715071541922, "global_step": 62537, "epoch": 1488, "val_loss": 66841.09375} {"train_loss": -5.994253635406494, "global_step": 62538, "epoch": 1489} {"train_loss": -5.817037582397461, "global_step": 62539, "epoch": 1489} {"train_loss": -5.9319868087768555, "global_step": 62540, "epoch": 1489} {"train_loss": -6.016589641571045, "global_step": 62541, "epoch": 1489} {"train_loss": -5.89626407623291, "global_step": 62542, "epoch": 1489} {"train_loss": -5.7820281982421875, "global_step": 62543, "epoch": 1489} {"train_loss": -5.940679550170898, "global_step": 62544, "epoch": 1489} {"train_loss": -5.91878604888916, "global_step": 62545, "epoch": 1489} {"train_loss": -5.9581298828125, "global_step": 62546, "epoch": 1489} {"train_loss": -5.926515102386475, "global_step": 62547, "epoch": 1489} {"train_loss": -6.072457313537598, "global_step": 62548, "epoch": 1489} {"train_loss": -5.813469886779785, "global_step": 62549, "epoch": 1489} {"train_loss": -5.976202964782715, "global_step": 62550, "epoch": 1489} {"train_loss": -5.887905597686768, "global_step": 62551, "epoch": 1489} {"train_loss": -5.974170207977295, "global_step": 62552, "epoch": 1489} {"train_loss": -5.892256259918213, "global_step": 62553, "epoch": 1489} {"train_loss": -5.973775386810303, "global_step": 62554, "epoch": 1489} {"train_loss": -5.956250190734863, "global_step": 62555, "epoch": 1489} {"train_loss": -5.887638092041016, "global_step": 62556, "epoch": 1489} {"train_loss": -5.903195381164551, "global_step": 62557, "epoch": 1489} {"train_loss": -6.130720615386963, "global_step": 62558, "epoch": 1489} {"train_loss": -5.876486301422119, "global_step": 62559, "epoch": 1489} {"train_loss": -5.876977920532227, "global_step": 62560, "epoch": 1489} {"train_loss": -6.097270488739014, "global_step": 62561, "epoch": 1489} {"train_loss": -5.884922981262207, "global_step": 62562, "epoch": 1489} {"train_loss": -5.9150071144104, "global_step": 62563, "epoch": 1489} {"train_loss": -5.959009647369385, "global_step": 62564, "epoch": 1489} {"train_loss": -5.907398700714111, "global_step": 62565, "epoch": 1489} {"train_loss": -6.107898712158203, "global_step": 62566, "epoch": 1489} {"train_loss": -5.90056848526001, "global_step": 62567, "epoch": 1489} {"train_loss": -5.889106750488281, "global_step": 62568, "epoch": 1489} {"train_loss": -5.859959602355957, "global_step": 62569, "epoch": 1489} {"train_loss": -5.857205390930176, "global_step": 62570, "epoch": 1489} {"train_loss": -5.894972801208496, "global_step": 62571, "epoch": 1489} {"train_loss": -5.934189319610596, "global_step": 62572, "epoch": 1489} {"train_loss": -5.901544570922852, "global_step": 62573, "epoch": 1489} {"train_loss": -5.999542236328125, "global_step": 62574, "epoch": 1489} {"train_loss": -5.955483436584473, "global_step": 62575, "epoch": 1489} {"train_loss": -5.784144878387451, "global_step": 62576, "epoch": 1489} {"train_loss": -5.969773769378662, "global_step": 62577, "epoch": 1489} {"train_loss": -5.898693084716797, "global_step": 62578, "epoch": 1489} {"train_loss": -5.929410060246785, "global_step": 62579, "epoch": 1489, "val_loss": 66908.3359375} {"train_loss": -6.068918228149414, "global_step": 62580, "epoch": 1490} {"train_loss": -5.902644634246826, "global_step": 62581, "epoch": 1490} {"train_loss": -5.870527267456055, "global_step": 62582, "epoch": 1490} {"train_loss": -5.931939601898193, "global_step": 62583, "epoch": 1490} {"train_loss": -5.80936336517334, "global_step": 62584, "epoch": 1490} {"train_loss": -5.845544815063477, "global_step": 62585, "epoch": 1490} {"train_loss": -5.975062370300293, "global_step": 62586, "epoch": 1490} {"train_loss": -5.9233012199401855, "global_step": 62587, "epoch": 1490} {"train_loss": -5.926966667175293, "global_step": 62588, "epoch": 1490} {"train_loss": -5.819053649902344, "global_step": 62589, "epoch": 1490} {"train_loss": -5.832513809204102, "global_step": 62590, "epoch": 1490} {"train_loss": -6.054309844970703, "global_step": 62591, "epoch": 1490} {"train_loss": -5.831917762756348, "global_step": 62592, "epoch": 1490} {"train_loss": -5.90485954284668, "global_step": 62593, "epoch": 1490} {"train_loss": -5.699918746948242, "global_step": 62594, "epoch": 1490} {"train_loss": -5.903783798217773, "global_step": 62595, "epoch": 1490} {"train_loss": -5.888243675231934, "global_step": 62596, "epoch": 1490} {"train_loss": -5.872713088989258, "global_step": 62597, "epoch": 1490} {"train_loss": -5.861401557922363, "global_step": 62598, "epoch": 1490} {"train_loss": -5.814196586608887, "global_step": 62599, "epoch": 1490} {"train_loss": -5.917330265045166, "global_step": 62600, "epoch": 1490} {"train_loss": -5.6579790115356445, "global_step": 62601, "epoch": 1490} {"train_loss": -5.837787628173828, "global_step": 62602, "epoch": 1490} {"train_loss": -5.839610576629639, "global_step": 62603, "epoch": 1490} {"train_loss": -5.806766510009766, "global_step": 62604, "epoch": 1490} {"train_loss": -5.8898234367370605, "global_step": 62605, "epoch": 1490} {"train_loss": -5.88847541809082, "global_step": 62606, "epoch": 1490} {"train_loss": -5.857321739196777, "global_step": 62607, "epoch": 1490} {"train_loss": -5.874220371246338, "global_step": 62608, "epoch": 1490} {"train_loss": -5.889245510101318, "global_step": 62609, "epoch": 1490} {"train_loss": -5.953254222869873, "global_step": 62610, "epoch": 1490} {"train_loss": -6.0855584144592285, "global_step": 62611, "epoch": 1490} {"train_loss": -5.924896240234375, "global_step": 62612, "epoch": 1490} {"train_loss": -5.801129341125488, "global_step": 62613, "epoch": 1490} {"train_loss": -5.887128829956055, "global_step": 62614, "epoch": 1490} {"train_loss": -5.926551818847656, "global_step": 62615, "epoch": 1490} {"train_loss": -5.961334228515625, "global_step": 62616, "epoch": 1490} {"train_loss": -5.913223743438721, "global_step": 62617, "epoch": 1490} {"train_loss": -5.8679118156433105, "global_step": 62618, "epoch": 1490} {"train_loss": -5.832235336303711, "global_step": 62619, "epoch": 1490} {"train_loss": -5.840062141418457, "global_step": 62620, "epoch": 1490} {"train_loss": -5.884011961164928, "global_step": 62621, "epoch": 1490, "val_loss": 66912.9140625} {"train_loss": -5.844854354858398, "global_step": 62622, "epoch": 1491} {"train_loss": -5.878520965576172, "global_step": 62623, "epoch": 1491} {"train_loss": -5.880964279174805, "global_step": 62624, "epoch": 1491} {"train_loss": -5.886839389801025, "global_step": 62625, "epoch": 1491} {"train_loss": -5.911044120788574, "global_step": 62626, "epoch": 1491} {"train_loss": -5.95734977722168, "global_step": 62627, "epoch": 1491} {"train_loss": -6.017155170440674, "global_step": 62628, "epoch": 1491} {"train_loss": -5.863966941833496, "global_step": 62629, "epoch": 1491} {"train_loss": -5.946990489959717, "global_step": 62630, "epoch": 1491} {"train_loss": -6.048551559448242, "global_step": 62631, "epoch": 1491} {"train_loss": -6.007359504699707, "global_step": 62632, "epoch": 1491} {"train_loss": -5.921623229980469, "global_step": 62633, "epoch": 1491} {"train_loss": -5.877341270446777, "global_step": 62634, "epoch": 1491} {"train_loss": -5.98463249206543, "global_step": 62635, "epoch": 1491} {"train_loss": -5.87640380859375, "global_step": 62636, "epoch": 1491} {"train_loss": -6.035898208618164, "global_step": 62637, "epoch": 1491} {"train_loss": -5.858497619628906, "global_step": 62638, "epoch": 1491} {"train_loss": -5.996946334838867, "global_step": 62639, "epoch": 1491} {"train_loss": -5.922164440155029, "global_step": 62640, "epoch": 1491} {"train_loss": -5.928582191467285, "global_step": 62641, "epoch": 1491} {"train_loss": -5.922457695007324, "global_step": 62642, "epoch": 1491} {"train_loss": -5.935193061828613, "global_step": 62643, "epoch": 1491} {"train_loss": -5.935068130493164, "global_step": 62644, "epoch": 1491} {"train_loss": -5.82716178894043, "global_step": 62645, "epoch": 1491} {"train_loss": -5.92354154586792, "global_step": 62646, "epoch": 1491} {"train_loss": -5.934366226196289, "global_step": 62647, "epoch": 1491} {"train_loss": -5.922182083129883, "global_step": 62648, "epoch": 1491} {"train_loss": -5.877982139587402, "global_step": 62649, "epoch": 1491} {"train_loss": -5.798064231872559, "global_step": 62650, "epoch": 1491} {"train_loss": -5.869999408721924, "global_step": 62651, "epoch": 1491} {"train_loss": -6.010005950927734, "global_step": 62652, "epoch": 1491} {"train_loss": -5.976431846618652, "global_step": 62653, "epoch": 1491} {"train_loss": -5.849029541015625, "global_step": 62654, "epoch": 1491} {"train_loss": -5.908319473266602, "global_step": 62655, "epoch": 1491} {"train_loss": -5.890048503875732, "global_step": 62656, "epoch": 1491} {"train_loss": -5.896659851074219, "global_step": 62657, "epoch": 1491} {"train_loss": -5.8944196701049805, "global_step": 62658, "epoch": 1491} {"train_loss": -5.901071548461914, "global_step": 62659, "epoch": 1491} {"train_loss": -5.842855930328369, "global_step": 62660, "epoch": 1491} {"train_loss": -5.839211940765381, "global_step": 62661, "epoch": 1491} {"train_loss": -5.904296875, "global_step": 62662, "epoch": 1491} {"train_loss": -5.913946866989136, "global_step": 62663, "epoch": 1491, "val_loss": 67018.6328125} {"train_loss": -5.8304290771484375, "global_step": 62664, "epoch": 1492} {"train_loss": -6.033827781677246, "global_step": 62665, "epoch": 1492} {"train_loss": -5.847378730773926, "global_step": 62666, "epoch": 1492} {"train_loss": -5.982658863067627, "global_step": 62667, "epoch": 1492} {"train_loss": -5.987595558166504, "global_step": 62668, "epoch": 1492} {"train_loss": -5.884566307067871, "global_step": 62669, "epoch": 1492} {"train_loss": -5.840428352355957, "global_step": 62670, "epoch": 1492} {"train_loss": -5.93857479095459, "global_step": 62671, "epoch": 1492} {"train_loss": -5.870726585388184, "global_step": 62672, "epoch": 1492} {"train_loss": -5.781173229217529, "global_step": 62673, "epoch": 1492} {"train_loss": -5.790916919708252, "global_step": 62674, "epoch": 1492} {"train_loss": -6.021256923675537, "global_step": 62675, "epoch": 1492} {"train_loss": -5.898750305175781, "global_step": 62676, "epoch": 1492} {"train_loss": -5.82234001159668, "global_step": 62677, "epoch": 1492} {"train_loss": -5.774094104766846, "global_step": 62678, "epoch": 1492} {"train_loss": -5.808938980102539, "global_step": 62679, "epoch": 1492} {"train_loss": -5.873629570007324, "global_step": 62680, "epoch": 1492} {"train_loss": -5.928780555725098, "global_step": 62681, "epoch": 1492} {"train_loss": -5.931074142456055, "global_step": 62682, "epoch": 1492} {"train_loss": -5.801538944244385, "global_step": 62683, "epoch": 1492} {"train_loss": -5.824008941650391, "global_step": 62684, "epoch": 1492} {"train_loss": -5.838930130004883, "global_step": 62685, "epoch": 1492} {"train_loss": -5.912983417510986, "global_step": 62686, "epoch": 1492} {"train_loss": -5.797933578491211, "global_step": 62687, "epoch": 1492} {"train_loss": -5.805995464324951, "global_step": 62688, "epoch": 1492} {"train_loss": -5.925742149353027, "global_step": 62689, "epoch": 1492} {"train_loss": -5.948302745819092, "global_step": 62690, "epoch": 1492} {"train_loss": -5.831392288208008, "global_step": 62691, "epoch": 1492} {"train_loss": -5.908079147338867, "global_step": 62692, "epoch": 1492} {"train_loss": -5.908605575561523, "global_step": 62693, "epoch": 1492} {"train_loss": -5.849377155303955, "global_step": 62694, "epoch": 1492} {"train_loss": -5.919988632202148, "global_step": 62695, "epoch": 1492} {"train_loss": -5.913738250732422, "global_step": 62696, "epoch": 1492} {"train_loss": -5.865642547607422, "global_step": 62697, "epoch": 1492} {"train_loss": -5.909104347229004, "global_step": 62698, "epoch": 1492} {"train_loss": -5.845815658569336, "global_step": 62699, "epoch": 1492} {"train_loss": -5.840873718261719, "global_step": 62700, "epoch": 1492} {"train_loss": -5.944889068603516, "global_step": 62701, "epoch": 1492} {"train_loss": -5.882770538330078, "global_step": 62702, "epoch": 1492} {"train_loss": -5.921538352966309, "global_step": 62703, "epoch": 1492} {"train_loss": -5.929455757141113, "global_step": 62704, "epoch": 1492} {"train_loss": -5.88007995060512, "global_step": 62705, "epoch": 1492, "val_loss": 66857.09375} {"train_loss": -5.920600891113281, "global_step": 62706, "epoch": 1493} {"train_loss": -5.985844612121582, "global_step": 62707, "epoch": 1493} {"train_loss": -5.950980186462402, "global_step": 62708, "epoch": 1493} {"train_loss": -5.880614280700684, "global_step": 62709, "epoch": 1493} {"train_loss": -5.892665386199951, "global_step": 62710, "epoch": 1493} {"train_loss": -5.797497272491455, "global_step": 62711, "epoch": 1493} {"train_loss": -5.896965503692627, "global_step": 62712, "epoch": 1493} {"train_loss": -5.876258850097656, "global_step": 62713, "epoch": 1493} {"train_loss": -5.850091934204102, "global_step": 62714, "epoch": 1493} {"train_loss": -5.906070232391357, "global_step": 62715, "epoch": 1493} {"train_loss": -5.939284324645996, "global_step": 62716, "epoch": 1493} {"train_loss": -5.897002220153809, "global_step": 62717, "epoch": 1493} {"train_loss": -5.866240501403809, "global_step": 62718, "epoch": 1493} {"train_loss": -5.831419944763184, "global_step": 62719, "epoch": 1493} {"train_loss": -6.021595478057861, "global_step": 62720, "epoch": 1493} {"train_loss": -5.901924133300781, "global_step": 62721, "epoch": 1493} {"train_loss": -5.868907928466797, "global_step": 62722, "epoch": 1493} {"train_loss": -5.846803188323975, "global_step": 62723, "epoch": 1493} {"train_loss": -5.89959716796875, "global_step": 62724, "epoch": 1493} {"train_loss": -5.810127258300781, "global_step": 62725, "epoch": 1493} {"train_loss": -5.935649871826172, "global_step": 62726, "epoch": 1493} {"train_loss": -6.0420026779174805, "global_step": 62727, "epoch": 1493} {"train_loss": -5.974635124206543, "global_step": 62728, "epoch": 1493} {"train_loss": -5.907314300537109, "global_step": 62729, "epoch": 1493} {"train_loss": -5.831229209899902, "global_step": 62730, "epoch": 1493} {"train_loss": -5.8391571044921875, "global_step": 62731, "epoch": 1493} {"train_loss": -5.93673849105835, "global_step": 62732, "epoch": 1493} {"train_loss": -5.911422252655029, "global_step": 62733, "epoch": 1493} {"train_loss": -5.860752105712891, "global_step": 62734, "epoch": 1493} {"train_loss": -5.974390983581543, "global_step": 62735, "epoch": 1493} {"train_loss": -5.9006500244140625, "global_step": 62736, "epoch": 1493} {"train_loss": -5.830111980438232, "global_step": 62737, "epoch": 1493} {"train_loss": -5.8451128005981445, "global_step": 62738, "epoch": 1493} {"train_loss": -5.955966949462891, "global_step": 62739, "epoch": 1493} {"train_loss": -5.974114418029785, "global_step": 62740, "epoch": 1493} {"train_loss": -5.9745893478393555, "global_step": 62741, "epoch": 1493} {"train_loss": -6.049083709716797, "global_step": 62742, "epoch": 1493} {"train_loss": -5.801461696624756, "global_step": 62743, "epoch": 1493} {"train_loss": -6.009971618652344, "global_step": 62744, "epoch": 1493} {"train_loss": -5.856308937072754, "global_step": 62745, "epoch": 1493} {"train_loss": -5.8690690994262695, "global_step": 62746, "epoch": 1493} {"train_loss": -5.906072866348993, "global_step": 62747, "epoch": 1493, "val_loss": 66812.640625} {"train_loss": -5.920654296875, "global_step": 62748, "epoch": 1494} {"train_loss": -5.897842884063721, "global_step": 62749, "epoch": 1494} {"train_loss": -5.940024375915527, "global_step": 62750, "epoch": 1494} {"train_loss": -5.8979411125183105, "global_step": 62751, "epoch": 1494} {"train_loss": -5.921747207641602, "global_step": 62752, "epoch": 1494} {"train_loss": -5.873908042907715, "global_step": 62753, "epoch": 1494} {"train_loss": -6.056500434875488, "global_step": 62754, "epoch": 1494} {"train_loss": -6.138772964477539, "global_step": 62755, "epoch": 1494} {"train_loss": -5.885207176208496, "global_step": 62756, "epoch": 1494} {"train_loss": -5.734335899353027, "global_step": 62757, "epoch": 1494} {"train_loss": -5.942737102508545, "global_step": 62758, "epoch": 1494} {"train_loss": -5.91800594329834, "global_step": 62759, "epoch": 1494} {"train_loss": -5.939770698547363, "global_step": 62760, "epoch": 1494} {"train_loss": -5.776935577392578, "global_step": 62761, "epoch": 1494} {"train_loss": -5.932567596435547, "global_step": 62762, "epoch": 1494} {"train_loss": -5.970879554748535, "global_step": 62763, "epoch": 1494} {"train_loss": -5.9974365234375, "global_step": 62764, "epoch": 1494} {"train_loss": -5.937576770782471, "global_step": 62765, "epoch": 1494} {"train_loss": -5.897878646850586, "global_step": 62766, "epoch": 1494} {"train_loss": -5.930901050567627, "global_step": 62767, "epoch": 1494} {"train_loss": -5.944164752960205, "global_step": 62768, "epoch": 1494} {"train_loss": -6.138614654541016, "global_step": 62769, "epoch": 1494} {"train_loss": -5.83920955657959, "global_step": 62770, "epoch": 1494} {"train_loss": -5.8874616622924805, "global_step": 62771, "epoch": 1494} {"train_loss": -5.855739593505859, "global_step": 62772, "epoch": 1494} {"train_loss": -5.835387706756592, "global_step": 62773, "epoch": 1494} {"train_loss": -5.960797309875488, "global_step": 62774, "epoch": 1494} {"train_loss": -5.894614219665527, "global_step": 62775, "epoch": 1494} {"train_loss": -6.0978899002075195, "global_step": 62776, "epoch": 1494} {"train_loss": -5.901251792907715, "global_step": 62777, "epoch": 1494} {"train_loss": -5.953222274780273, "global_step": 62778, "epoch": 1494} {"train_loss": -5.896406173706055, "global_step": 62779, "epoch": 1494} {"train_loss": -6.005467414855957, "global_step": 62780, "epoch": 1494} {"train_loss": -5.832353591918945, "global_step": 62781, "epoch": 1494} {"train_loss": -5.881385803222656, "global_step": 62782, "epoch": 1494} {"train_loss": -5.970632076263428, "global_step": 62783, "epoch": 1494} {"train_loss": -5.799683570861816, "global_step": 62784, "epoch": 1494} {"train_loss": -5.929374694824219, "global_step": 62785, "epoch": 1494} {"train_loss": -5.930883884429932, "global_step": 62786, "epoch": 1494} {"train_loss": -5.907623291015625, "global_step": 62787, "epoch": 1494} {"train_loss": -5.955286979675293, "global_step": 62788, "epoch": 1494} {"train_loss": -5.925157864888509, "global_step": 62789, "epoch": 1494, "val_loss": 67147.6484375} {"train_loss": -5.881457805633545, "global_step": 62790, "epoch": 1495} {"train_loss": -5.9082489013671875, "global_step": 62791, "epoch": 1495} {"train_loss": -5.867498397827148, "global_step": 62792, "epoch": 1495} {"train_loss": -5.7007975578308105, "global_step": 62793, "epoch": 1495} {"train_loss": -5.808008670806885, "global_step": 62794, "epoch": 1495} {"train_loss": -5.772577285766602, "global_step": 62795, "epoch": 1495} {"train_loss": -5.720134258270264, "global_step": 62796, "epoch": 1495} {"train_loss": -5.953975677490234, "global_step": 62797, "epoch": 1495} {"train_loss": -5.758387565612793, "global_step": 62798, "epoch": 1495} {"train_loss": -5.779952049255371, "global_step": 62799, "epoch": 1495} {"train_loss": -5.823876857757568, "global_step": 62800, "epoch": 1495} {"train_loss": -5.987276077270508, "global_step": 62801, "epoch": 1495} {"train_loss": -5.6215925216674805, "global_step": 62802, "epoch": 1495} {"train_loss": -5.898830413818359, "global_step": 62803, "epoch": 1495} {"train_loss": -5.849887847900391, "global_step": 62804, "epoch": 1495} {"train_loss": -5.916645050048828, "global_step": 62805, "epoch": 1495} {"train_loss": -5.943648338317871, "global_step": 62806, "epoch": 1495} {"train_loss": -5.906207084655762, "global_step": 62807, "epoch": 1495} {"train_loss": -5.836142539978027, "global_step": 62808, "epoch": 1495} {"train_loss": -5.930549621582031, "global_step": 62809, "epoch": 1495} {"train_loss": -5.991175174713135, "global_step": 62810, "epoch": 1495} {"train_loss": -5.9323015213012695, "global_step": 62811, "epoch": 1495} {"train_loss": -5.963018417358398, "global_step": 62812, "epoch": 1495} {"train_loss": -5.792685508728027, "global_step": 62813, "epoch": 1495} {"train_loss": -5.8776092529296875, "global_step": 62814, "epoch": 1495} {"train_loss": -5.925928592681885, "global_step": 62815, "epoch": 1495} {"train_loss": -5.9405131340026855, "global_step": 62816, "epoch": 1495} {"train_loss": -5.863428115844727, "global_step": 62817, "epoch": 1495} {"train_loss": -5.896876335144043, "global_step": 62818, "epoch": 1495} {"train_loss": -5.870561599731445, "global_step": 62819, "epoch": 1495} {"train_loss": -5.988333225250244, "global_step": 62820, "epoch": 1495} {"train_loss": -5.751119136810303, "global_step": 62821, "epoch": 1495} {"train_loss": -5.802096843719482, "global_step": 62822, "epoch": 1495} {"train_loss": -5.746018409729004, "global_step": 62823, "epoch": 1495} {"train_loss": -5.871809959411621, "global_step": 62824, "epoch": 1495} {"train_loss": -5.782737731933594, "global_step": 62825, "epoch": 1495} {"train_loss": -5.919675827026367, "global_step": 62826, "epoch": 1495} {"train_loss": -5.880400657653809, "global_step": 62827, "epoch": 1495} {"train_loss": -5.723803520202637, "global_step": 62828, "epoch": 1495} {"train_loss": -5.92236328125, "global_step": 62829, "epoch": 1495} {"train_loss": -5.9355573654174805, "global_step": 62830, "epoch": 1495} {"train_loss": -5.8585980506170365, "global_step": 62831, "epoch": 1495, "val_loss": 67089.2265625} {"train_loss": -5.8816328048706055, "global_step": 62832, "epoch": 1496} {"train_loss": -5.8714165687561035, "global_step": 62833, "epoch": 1496} {"train_loss": -5.849174499511719, "global_step": 62834, "epoch": 1496} {"train_loss": -6.02455472946167, "global_step": 62835, "epoch": 1496} {"train_loss": -5.894072532653809, "global_step": 62836, "epoch": 1496} {"train_loss": -5.820126533508301, "global_step": 62837, "epoch": 1496} {"train_loss": -6.020648002624512, "global_step": 62838, "epoch": 1496} {"train_loss": -5.892269134521484, "global_step": 62839, "epoch": 1496} {"train_loss": -5.921217918395996, "global_step": 62840, "epoch": 1496} {"train_loss": -5.989614486694336, "global_step": 62841, "epoch": 1496} {"train_loss": -5.859147071838379, "global_step": 62842, "epoch": 1496} {"train_loss": -5.850193977355957, "global_step": 62843, "epoch": 1496} {"train_loss": -5.9397358894348145, "global_step": 62844, "epoch": 1496} {"train_loss": -5.885624885559082, "global_step": 62845, "epoch": 1496} {"train_loss": -5.809042930603027, "global_step": 62846, "epoch": 1496} {"train_loss": -6.032410621643066, "global_step": 62847, "epoch": 1496} {"train_loss": -5.971341133117676, "global_step": 62848, "epoch": 1496} {"train_loss": -5.9475202560424805, "global_step": 62849, "epoch": 1496} {"train_loss": -5.9513115882873535, "global_step": 62850, "epoch": 1496} {"train_loss": -5.888278007507324, "global_step": 62851, "epoch": 1496} {"train_loss": -5.974300384521484, "global_step": 62852, "epoch": 1496} {"train_loss": -5.765691757202148, "global_step": 62853, "epoch": 1496} {"train_loss": -5.905120372772217, "global_step": 62854, "epoch": 1496} {"train_loss": -5.903680801391602, "global_step": 62855, "epoch": 1496} {"train_loss": -5.864173889160156, "global_step": 62856, "epoch": 1496} {"train_loss": -5.971614360809326, "global_step": 62857, "epoch": 1496} {"train_loss": -5.995233535766602, "global_step": 62858, "epoch": 1496} {"train_loss": -6.028508186340332, "global_step": 62859, "epoch": 1496} {"train_loss": -5.97374153137207, "global_step": 62860, "epoch": 1496} {"train_loss": -5.889194011688232, "global_step": 62861, "epoch": 1496} {"train_loss": -5.9542460441589355, "global_step": 62862, "epoch": 1496} {"train_loss": -5.956367492675781, "global_step": 62863, "epoch": 1496} {"train_loss": -5.869319915771484, "global_step": 62864, "epoch": 1496} {"train_loss": -5.764707565307617, "global_step": 62865, "epoch": 1496} {"train_loss": -5.967416763305664, "global_step": 62866, "epoch": 1496} {"train_loss": -5.995095252990723, "global_step": 62867, "epoch": 1496} {"train_loss": -5.83451509475708, "global_step": 62868, "epoch": 1496} {"train_loss": -5.950791835784912, "global_step": 62869, "epoch": 1496} {"train_loss": -5.859836578369141, "global_step": 62870, "epoch": 1496} {"train_loss": -5.724342346191406, "global_step": 62871, "epoch": 1496} {"train_loss": -5.93497371673584, "global_step": 62872, "epoch": 1496} {"train_loss": -5.907274166742961, "global_step": 62873, "epoch": 1496, "val_loss": 66884.109375} {"train_loss": -5.882131099700928, "global_step": 62874, "epoch": 1497} {"train_loss": -5.959975719451904, "global_step": 62875, "epoch": 1497} {"train_loss": -5.955533981323242, "global_step": 62876, "epoch": 1497} {"train_loss": -5.7740583419799805, "global_step": 62877, "epoch": 1497} {"train_loss": -5.965590476989746, "global_step": 62878, "epoch": 1497} {"train_loss": -5.930489540100098, "global_step": 62879, "epoch": 1497} {"train_loss": -5.887697219848633, "global_step": 62880, "epoch": 1497} {"train_loss": -5.962790012359619, "global_step": 62881, "epoch": 1497} {"train_loss": -5.9192023277282715, "global_step": 62882, "epoch": 1497} {"train_loss": -5.933984756469727, "global_step": 62883, "epoch": 1497} {"train_loss": -5.925638198852539, "global_step": 62884, "epoch": 1497} {"train_loss": -5.910661697387695, "global_step": 62885, "epoch": 1497} {"train_loss": -5.917316436767578, "global_step": 62886, "epoch": 1497} {"train_loss": -6.002732753753662, "global_step": 62887, "epoch": 1497} {"train_loss": -5.938977241516113, "global_step": 62888, "epoch": 1497} {"train_loss": -5.894031047821045, "global_step": 62889, "epoch": 1497} {"train_loss": -5.9062819480896, "global_step": 62890, "epoch": 1497} {"train_loss": -5.91231632232666, "global_step": 62891, "epoch": 1497} {"train_loss": -5.906749725341797, "global_step": 62892, "epoch": 1497} {"train_loss": -5.79262638092041, "global_step": 62893, "epoch": 1497} {"train_loss": -5.927748680114746, "global_step": 62894, "epoch": 1497} {"train_loss": -5.93104362487793, "global_step": 62895, "epoch": 1497} {"train_loss": -5.924315452575684, "global_step": 62896, "epoch": 1497} {"train_loss": -5.941765785217285, "global_step": 62897, "epoch": 1497} {"train_loss": -5.866569519042969, "global_step": 62898, "epoch": 1497} {"train_loss": -5.87514066696167, "global_step": 62899, "epoch": 1497} {"train_loss": -5.781768798828125, "global_step": 62900, "epoch": 1497} {"train_loss": -5.901587963104248, "global_step": 62901, "epoch": 1497} {"train_loss": -5.820122718811035, "global_step": 62902, "epoch": 1497} {"train_loss": -5.818085670471191, "global_step": 62903, "epoch": 1497} {"train_loss": -5.873188018798828, "global_step": 62904, "epoch": 1497} {"train_loss": -5.7177581787109375, "global_step": 62905, "epoch": 1497} {"train_loss": -5.849468231201172, "global_step": 62906, "epoch": 1497} {"train_loss": -5.9900288581848145, "global_step": 62907, "epoch": 1497} {"train_loss": -5.952170372009277, "global_step": 62908, "epoch": 1497} {"train_loss": -5.967328071594238, "global_step": 62909, "epoch": 1497} {"train_loss": -5.871727466583252, "global_step": 62910, "epoch": 1497} {"train_loss": -5.8449320793151855, "global_step": 62911, "epoch": 1497} {"train_loss": -5.915416717529297, "global_step": 62912, "epoch": 1497} {"train_loss": -5.926179885864258, "global_step": 62913, "epoch": 1497} {"train_loss": -5.960812568664551, "global_step": 62914, "epoch": 1497} {"train_loss": -5.902747120176043, "global_step": 62915, "epoch": 1497, "val_loss": 66986.3359375} {"train_loss": -5.91989803314209, "global_step": 62916, "epoch": 1498} {"train_loss": -5.883915901184082, "global_step": 62917, "epoch": 1498} {"train_loss": -5.961456298828125, "global_step": 62918, "epoch": 1498} {"train_loss": -5.9568095207214355, "global_step": 62919, "epoch": 1498} {"train_loss": -5.96076774597168, "global_step": 62920, "epoch": 1498} {"train_loss": -5.966922760009766, "global_step": 62921, "epoch": 1498} {"train_loss": -5.979623794555664, "global_step": 62922, "epoch": 1498} {"train_loss": -5.928290843963623, "global_step": 62923, "epoch": 1498} {"train_loss": -5.9100260734558105, "global_step": 62924, "epoch": 1498} {"train_loss": -6.021169662475586, "global_step": 62925, "epoch": 1498} {"train_loss": -5.918338775634766, "global_step": 62926, "epoch": 1498} {"train_loss": -5.838417053222656, "global_step": 62927, "epoch": 1498} {"train_loss": -5.964475631713867, "global_step": 62928, "epoch": 1498} {"train_loss": -5.869454860687256, "global_step": 62929, "epoch": 1498} {"train_loss": -5.963443756103516, "global_step": 62930, "epoch": 1498} {"train_loss": -6.0089311599731445, "global_step": 62931, "epoch": 1498} {"train_loss": -5.958583354949951, "global_step": 62932, "epoch": 1498} {"train_loss": -6.072308540344238, "global_step": 62933, "epoch": 1498} {"train_loss": -5.817722320556641, "global_step": 62934, "epoch": 1498} {"train_loss": -5.848361968994141, "global_step": 62935, "epoch": 1498} {"train_loss": -5.918735504150391, "global_step": 62936, "epoch": 1498} {"train_loss": -5.918104648590088, "global_step": 62937, "epoch": 1498} {"train_loss": -5.948851585388184, "global_step": 62938, "epoch": 1498} {"train_loss": -5.925590991973877, "global_step": 62939, "epoch": 1498} {"train_loss": -5.853538513183594, "global_step": 62940, "epoch": 1498} {"train_loss": -5.867344856262207, "global_step": 62941, "epoch": 1498} {"train_loss": -5.8323540687561035, "global_step": 62942, "epoch": 1498} {"train_loss": -5.912564277648926, "global_step": 62943, "epoch": 1498} {"train_loss": -5.899624347686768, "global_step": 62944, "epoch": 1498} {"train_loss": -5.922786235809326, "global_step": 62945, "epoch": 1498} {"train_loss": -5.99722957611084, "global_step": 62946, "epoch": 1498} {"train_loss": -5.844757080078125, "global_step": 62947, "epoch": 1498} {"train_loss": -5.897563934326172, "global_step": 62948, "epoch": 1498} {"train_loss": -6.0216965675354, "global_step": 62949, "epoch": 1498} {"train_loss": -5.98436975479126, "global_step": 62950, "epoch": 1498} {"train_loss": -5.905246257781982, "global_step": 62951, "epoch": 1498} {"train_loss": -5.98264217376709, "global_step": 62952, "epoch": 1498} {"train_loss": -5.8308186531066895, "global_step": 62953, "epoch": 1498} {"train_loss": -6.028043746948242, "global_step": 62954, "epoch": 1498} {"train_loss": -6.077557563781738, "global_step": 62955, "epoch": 1498} {"train_loss": -6.062556743621826, "global_step": 62956, "epoch": 1498} {"train_loss": -5.937001648403349, "global_step": 62957, "epoch": 1498, "val_loss": 66879.828125} {"train_loss": -5.782096862792969, "global_step": 62958, "epoch": 1499} {"train_loss": -5.901937961578369, "global_step": 62959, "epoch": 1499} {"train_loss": -5.8651556968688965, "global_step": 62960, "epoch": 1499} {"train_loss": -5.816200256347656, "global_step": 62961, "epoch": 1499} {"train_loss": -6.018594264984131, "global_step": 62962, "epoch": 1499} {"train_loss": -5.935333251953125, "global_step": 62963, "epoch": 1499} {"train_loss": -5.857619762420654, "global_step": 62964, "epoch": 1499} {"train_loss": -5.913217067718506, "global_step": 62965, "epoch": 1499} {"train_loss": -5.910200595855713, "global_step": 62966, "epoch": 1499} {"train_loss": -6.029696464538574, "global_step": 62967, "epoch": 1499} {"train_loss": -5.975215435028076, "global_step": 62968, "epoch": 1499} {"train_loss": -6.027675151824951, "global_step": 62969, "epoch": 1499} {"train_loss": -5.831297874450684, "global_step": 62970, "epoch": 1499} {"train_loss": -6.002262115478516, "global_step": 62971, "epoch": 1499} {"train_loss": -5.891120910644531, "global_step": 62972, "epoch": 1499} {"train_loss": -6.039300918579102, "global_step": 62973, "epoch": 1499} {"train_loss": -5.820560455322266, "global_step": 62974, "epoch": 1499} {"train_loss": -5.989126205444336, "global_step": 62975, "epoch": 1499} {"train_loss": -5.898260116577148, "global_step": 62976, "epoch": 1499} {"train_loss": -6.034963130950928, "global_step": 62977, "epoch": 1499} {"train_loss": -5.93861198425293, "global_step": 62978, "epoch": 1499} {"train_loss": -5.8780837059021, "global_step": 62979, "epoch": 1499} {"train_loss": -5.916754245758057, "global_step": 62980, "epoch": 1499} {"train_loss": -5.8680949211120605, "global_step": 62981, "epoch": 1499} {"train_loss": -5.911552429199219, "global_step": 62982, "epoch": 1499} {"train_loss": -5.930663108825684, "global_step": 62983, "epoch": 1499} {"train_loss": -5.980416297912598, "global_step": 62984, "epoch": 1499} {"train_loss": -5.864221572875977, "global_step": 62985, "epoch": 1499} {"train_loss": -6.047581672668457, "global_step": 62986, "epoch": 1499} {"train_loss": -5.986017227172852, "global_step": 62987, "epoch": 1499} {"train_loss": -6.098940849304199, "global_step": 62988, "epoch": 1499} {"train_loss": -5.966911792755127, "global_step": 62989, "epoch": 1499} {"train_loss": -5.864171981811523, "global_step": 62990, "epoch": 1499} {"train_loss": -5.983790397644043, "global_step": 62991, "epoch": 1499} {"train_loss": -6.0118865966796875, "global_step": 62992, "epoch": 1499} {"train_loss": -5.862152099609375, "global_step": 62993, "epoch": 1499} {"train_loss": -6.005542755126953, "global_step": 62994, "epoch": 1499} {"train_loss": -5.957475662231445, "global_step": 62995, "epoch": 1499} {"train_loss": -5.912642955780029, "global_step": 62996, "epoch": 1499} {"train_loss": -6.034665584564209, "global_step": 62997, "epoch": 1499} {"train_loss": -5.9882941246032715, "global_step": 62998, "epoch": 1499} {"train_loss": -5.938846508661906, "global_step": 62999, "epoch": 1499, "val_loss": 66992.4375} {"train_loss": -5.9965386390686035, "global_step": 63000, "epoch": 1500} {"train_loss": -5.946206569671631, "global_step": 63001, "epoch": 1500} {"train_loss": -5.939785957336426, "global_step": 63002, "epoch": 1500} {"train_loss": -5.998443126678467, "global_step": 63003, "epoch": 1500} {"train_loss": -5.794809818267822, "global_step": 63004, "epoch": 1500} {"train_loss": -5.861987113952637, "global_step": 63005, "epoch": 1500} {"train_loss": -5.926650524139404, "global_step": 63006, "epoch": 1500} {"train_loss": -5.866110801696777, "global_step": 63007, "epoch": 1500} {"train_loss": -5.921670913696289, "global_step": 63008, "epoch": 1500} {"train_loss": -5.803045749664307, "global_step": 63009, "epoch": 1500} {"train_loss": -5.973082542419434, "global_step": 63010, "epoch": 1500} {"train_loss": -5.957508087158203, "global_step": 63011, "epoch": 1500} {"train_loss": -5.936181545257568, "global_step": 63012, "epoch": 1500} {"train_loss": -5.918355464935303, "global_step": 63013, "epoch": 1500} {"train_loss": -5.959635257720947, "global_step": 63014, "epoch": 1500} {"train_loss": -5.929254531860352, "global_step": 63015, "epoch": 1500} {"train_loss": -5.900856018066406, "global_step": 63016, "epoch": 1500} {"train_loss": -5.914322853088379, "global_step": 63017, "epoch": 1500} {"train_loss": -6.080480575561523, "global_step": 63018, "epoch": 1500} {"train_loss": -5.850629806518555, "global_step": 63019, "epoch": 1500} {"train_loss": -5.85050630569458, "global_step": 63020, "epoch": 1500} {"train_loss": -5.919074535369873, "global_step": 63021, "epoch": 1500} {"train_loss": -5.901636600494385, "global_step": 63022, "epoch": 1500} {"train_loss": -5.899096488952637, "global_step": 63023, "epoch": 1500} {"train_loss": -5.875475883483887, "global_step": 63024, "epoch": 1500} {"train_loss": -5.942938327789307, "global_step": 63025, "epoch": 1500} {"train_loss": -5.956449508666992, "global_step": 63026, "epoch": 1500} {"train_loss": -5.98823356628418, "global_step": 63027, "epoch": 1500} {"train_loss": -5.9231414794921875, "global_step": 63028, "epoch": 1500} {"train_loss": -5.814836502075195, "global_step": 63029, "epoch": 1500} {"train_loss": -6.0076446533203125, "global_step": 63030, "epoch": 1500} {"train_loss": -5.913147926330566, "global_step": 63031, "epoch": 1500} {"train_loss": -5.91794490814209, "global_step": 63032, "epoch": 1500} {"train_loss": -5.904940605163574, "global_step": 63033, "epoch": 1500} {"train_loss": -5.863639831542969, "global_step": 63034, "epoch": 1500} {"train_loss": -5.936177730560303, "global_step": 63035, "epoch": 1500} {"train_loss": -5.842467308044434, "global_step": 63036, "epoch": 1500} {"train_loss": -5.869604587554932, "global_step": 63037, "epoch": 1500} {"train_loss": -5.856950759887695, "global_step": 63038, "epoch": 1500} {"train_loss": -6.001443862915039, "global_step": 63039, "epoch": 1500} {"train_loss": -5.886930465698242, "global_step": 63040, "epoch": 1500} {"train_loss": -5.914645115534465, "global_step": 63041, "epoch": 1500, "train/sim_max_reward_0": 0.21222487545471533, "train/sim_max_reward_1": 0.8438098511616123, "train/sim_max_reward_2": 0.6665985608790294, "train/sim_max_reward_3": 0.15582037845318325, "train/sim_max_reward_4": 0.985639308364196, "train/sim_max_reward_5": 0.925249978242188, "test/sim_max_reward_4400000": 0.9010207330693725, "test/sim_max_reward_4400001": 0.15111260193356432, "test/sim_max_reward_4400002": 0.2729675298975044, "test/sim_max_reward_4400003": 0.5461046125044615, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.7001072464804647, "test/sim_max_reward_4400007": 0.5184035240543757, "test/sim_max_reward_4400008": 0.3336575571591155, "test/sim_max_reward_4400009": 0.9735859268455035, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.26082045373118806, "test/sim_max_reward_4400012": 0.6478568851830415, "test/sim_max_reward_4400013": 0.8521874988187346, "test/sim_max_reward_4400014": 0.8090483032436032, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3890444593676337, "test/sim_max_reward_4400019": 0.061238702208032576, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.8730103457866197, "test/sim_max_reward_4400022": 0.9337609343739829, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.19927915216174527, "test/sim_max_reward_4400026": 0.6460075178011252, "test/sim_max_reward_4400027": 0.014605882743363547, "test/sim_max_reward_4400028": 0.9851890892076433, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9640760638669826, "test/sim_max_reward_4400031": 0.8806749897116989, "test/sim_max_reward_4400032": 0.2681812397281287, "test/sim_max_reward_4400033": 0.9430018080042746, "test/sim_max_reward_4400034": 0.9165298402330202, "test/sim_max_reward_4400035": 0.47183120129975464, "test/sim_max_reward_4400036": 0.8805023726196854, "test/sim_max_reward_4400037": 0.9172997452434064, "test/sim_max_reward_4400038": 0.6519102866506173, "test/sim_max_reward_4400039": 0.7735297972478875, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5366987359606834, "test/sim_max_reward_4400042": 0.006880231386662915, "test/sim_max_reward_4400043": 0.8646285734512178, "test/sim_max_reward_4400044": 0.8417292620284712, "test/sim_max_reward_4400045": 0.37384870971164935, "test/sim_max_reward_4400046": 0.9135316673713011, "test/sim_max_reward_4400047": 0.8524821086183137, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3165651292720723, "train/mean_score": 0.6315571587591541, "test/mean_score": 0.47643999516090985, "val_loss": 66748.015625} {"train_loss": -6.016685485839844, "global_step": 63042, "epoch": 1501} {"train_loss": -6.025493144989014, "global_step": 63043, "epoch": 1501} {"train_loss": -5.985663890838623, "global_step": 63044, "epoch": 1501} {"train_loss": -5.960583686828613, "global_step": 63045, "epoch": 1501} {"train_loss": -5.886044502258301, "global_step": 63046, "epoch": 1501} {"train_loss": -5.984354496002197, "global_step": 63047, "epoch": 1501} {"train_loss": -5.938734531402588, "global_step": 63048, "epoch": 1501} {"train_loss": -5.768980979919434, "global_step": 63049, "epoch": 1501} {"train_loss": -5.967130661010742, "global_step": 63050, "epoch": 1501} {"train_loss": -5.862640380859375, "global_step": 63051, "epoch": 1501} {"train_loss": -5.898771286010742, "global_step": 63052, "epoch": 1501} {"train_loss": -5.9285125732421875, "global_step": 63053, "epoch": 1501} {"train_loss": -5.859934329986572, "global_step": 63054, "epoch": 1501} {"train_loss": -6.025698661804199, "global_step": 63055, "epoch": 1501} {"train_loss": -5.890570640563965, "global_step": 63056, "epoch": 1501} {"train_loss": -5.860430717468262, "global_step": 63057, "epoch": 1501} {"train_loss": -5.894074440002441, "global_step": 63058, "epoch": 1501} {"train_loss": -5.9151763916015625, "global_step": 63059, "epoch": 1501} {"train_loss": -5.87187385559082, "global_step": 63060, "epoch": 1501} {"train_loss": -5.97204065322876, "global_step": 63061, "epoch": 1501} {"train_loss": -5.738039970397949, "global_step": 63062, "epoch": 1501} {"train_loss": -5.953475475311279, "global_step": 63063, "epoch": 1501} {"train_loss": -5.958463668823242, "global_step": 63064, "epoch": 1501} {"train_loss": -5.835869789123535, "global_step": 63065, "epoch": 1501} {"train_loss": -5.863129138946533, "global_step": 63066, "epoch": 1501} {"train_loss": -5.690903663635254, "global_step": 63067, "epoch": 1501} {"train_loss": -5.993326187133789, "global_step": 63068, "epoch": 1501} {"train_loss": -5.694540977478027, "global_step": 63069, "epoch": 1501} {"train_loss": -5.97198486328125, "global_step": 63070, "epoch": 1501} {"train_loss": -5.932409286499023, "global_step": 63071, "epoch": 1501} {"train_loss": -5.778568267822266, "global_step": 63072, "epoch": 1501} {"train_loss": -5.819209098815918, "global_step": 63073, "epoch": 1501} {"train_loss": -5.943179130554199, "global_step": 63074, "epoch": 1501} {"train_loss": -5.973101615905762, "global_step": 63075, "epoch": 1501} {"train_loss": -5.781662464141846, "global_step": 63076, "epoch": 1501} {"train_loss": -5.897122383117676, "global_step": 63077, "epoch": 1501} {"train_loss": -5.838653564453125, "global_step": 63078, "epoch": 1501} {"train_loss": -5.834158897399902, "global_step": 63079, "epoch": 1501} {"train_loss": -5.991461277008057, "global_step": 63080, "epoch": 1501} {"train_loss": -5.79378080368042, "global_step": 63081, "epoch": 1501} {"train_loss": -5.8518385887146, "global_step": 63082, "epoch": 1501} {"train_loss": -5.8943508352552145, "global_step": 63083, "epoch": 1501, "val_loss": 66923.3515625} {"train_loss": -5.909448146820068, "global_step": 63084, "epoch": 1502} {"train_loss": -5.954028129577637, "global_step": 63085, "epoch": 1502} {"train_loss": -5.954045295715332, "global_step": 63086, "epoch": 1502} {"train_loss": -5.918931007385254, "global_step": 63087, "epoch": 1502} {"train_loss": -5.905303955078125, "global_step": 63088, "epoch": 1502} {"train_loss": -5.965821266174316, "global_step": 63089, "epoch": 1502} {"train_loss": -5.998993873596191, "global_step": 63090, "epoch": 1502} {"train_loss": -5.902630805969238, "global_step": 63091, "epoch": 1502} {"train_loss": -5.831043720245361, "global_step": 63092, "epoch": 1502} {"train_loss": -5.893131256103516, "global_step": 63093, "epoch": 1502} {"train_loss": -5.866185188293457, "global_step": 63094, "epoch": 1502} {"train_loss": -5.947850704193115, "global_step": 63095, "epoch": 1502} {"train_loss": -6.040519714355469, "global_step": 63096, "epoch": 1502} {"train_loss": -6.021647930145264, "global_step": 63097, "epoch": 1502} {"train_loss": -5.805798530578613, "global_step": 63098, "epoch": 1502} {"train_loss": -5.938146591186523, "global_step": 63099, "epoch": 1502} {"train_loss": -5.963644027709961, "global_step": 63100, "epoch": 1502} {"train_loss": -6.014716148376465, "global_step": 63101, "epoch": 1502} {"train_loss": -5.884092330932617, "global_step": 63102, "epoch": 1502} {"train_loss": -5.90725040435791, "global_step": 63103, "epoch": 1502} {"train_loss": -6.033530235290527, "global_step": 63104, "epoch": 1502} {"train_loss": -5.932586669921875, "global_step": 63105, "epoch": 1502} {"train_loss": -5.974936008453369, "global_step": 63106, "epoch": 1502} {"train_loss": -5.857973098754883, "global_step": 63107, "epoch": 1502} {"train_loss": -5.851629257202148, "global_step": 63108, "epoch": 1502} {"train_loss": -5.883893966674805, "global_step": 63109, "epoch": 1502} {"train_loss": -5.878841876983643, "global_step": 63110, "epoch": 1502} {"train_loss": -5.7873640060424805, "global_step": 63111, "epoch": 1502} {"train_loss": -5.76625919342041, "global_step": 63112, "epoch": 1502} {"train_loss": -5.928239822387695, "global_step": 63113, "epoch": 1502} {"train_loss": -6.093194007873535, "global_step": 63114, "epoch": 1502} {"train_loss": -5.9468183517456055, "global_step": 63115, "epoch": 1502} {"train_loss": -5.828070640563965, "global_step": 63116, "epoch": 1502} {"train_loss": -5.840859413146973, "global_step": 63117, "epoch": 1502} {"train_loss": -5.907965183258057, "global_step": 63118, "epoch": 1502} {"train_loss": -5.917481899261475, "global_step": 63119, "epoch": 1502} {"train_loss": -5.775944709777832, "global_step": 63120, "epoch": 1502} {"train_loss": -5.860828399658203, "global_step": 63121, "epoch": 1502} {"train_loss": -5.969583511352539, "global_step": 63122, "epoch": 1502} {"train_loss": -5.819545269012451, "global_step": 63123, "epoch": 1502} {"train_loss": -5.84318733215332, "global_step": 63124, "epoch": 1502} {"train_loss": -5.909539756320772, "global_step": 63125, "epoch": 1502, "val_loss": 67134.328125} {"train_loss": -5.880875587463379, "global_step": 63126, "epoch": 1503} {"train_loss": -6.068549156188965, "global_step": 63127, "epoch": 1503} {"train_loss": -5.786982536315918, "global_step": 63128, "epoch": 1503} {"train_loss": -5.9249677658081055, "global_step": 63129, "epoch": 1503} {"train_loss": -5.91666316986084, "global_step": 63130, "epoch": 1503} {"train_loss": -5.842950820922852, "global_step": 63131, "epoch": 1503} {"train_loss": -6.0013275146484375, "global_step": 63132, "epoch": 1503} {"train_loss": -5.8188629150390625, "global_step": 63133, "epoch": 1503} {"train_loss": -5.912956237792969, "global_step": 63134, "epoch": 1503} {"train_loss": -5.977910995483398, "global_step": 63135, "epoch": 1503} {"train_loss": -5.871081352233887, "global_step": 63136, "epoch": 1503} {"train_loss": -6.006412029266357, "global_step": 63137, "epoch": 1503} {"train_loss": -5.965269088745117, "global_step": 63138, "epoch": 1503} {"train_loss": -5.848321437835693, "global_step": 63139, "epoch": 1503} {"train_loss": -5.892589569091797, "global_step": 63140, "epoch": 1503} {"train_loss": -5.888281345367432, "global_step": 63141, "epoch": 1503} {"train_loss": -5.904509544372559, "global_step": 63142, "epoch": 1503} {"train_loss": -5.845571994781494, "global_step": 63143, "epoch": 1503} {"train_loss": -5.805744171142578, "global_step": 63144, "epoch": 1503} {"train_loss": -5.92177152633667, "global_step": 63145, "epoch": 1503} {"train_loss": -5.905872344970703, "global_step": 63146, "epoch": 1503} {"train_loss": -5.887428283691406, "global_step": 63147, "epoch": 1503} {"train_loss": -5.810919761657715, "global_step": 63148, "epoch": 1503} {"train_loss": -5.892855167388916, "global_step": 63149, "epoch": 1503} {"train_loss": -5.999484062194824, "global_step": 63150, "epoch": 1503} {"train_loss": -5.717126846313477, "global_step": 63151, "epoch": 1503} {"train_loss": -5.918589115142822, "global_step": 63152, "epoch": 1503} {"train_loss": -5.853646278381348, "global_step": 63153, "epoch": 1503} {"train_loss": -5.847410202026367, "global_step": 63154, "epoch": 1503} {"train_loss": -5.866617679595947, "global_step": 63155, "epoch": 1503} {"train_loss": -5.839895248413086, "global_step": 63156, "epoch": 1503} {"train_loss": -5.9533281326293945, "global_step": 63157, "epoch": 1503} {"train_loss": -5.902630805969238, "global_step": 63158, "epoch": 1503} {"train_loss": -6.029322624206543, "global_step": 63159, "epoch": 1503} {"train_loss": -5.893537998199463, "global_step": 63160, "epoch": 1503} {"train_loss": -5.86602783203125, "global_step": 63161, "epoch": 1503} {"train_loss": -5.923784255981445, "global_step": 63162, "epoch": 1503} {"train_loss": -5.860145568847656, "global_step": 63163, "epoch": 1503} {"train_loss": -5.893102645874023, "global_step": 63164, "epoch": 1503} {"train_loss": -5.889237403869629, "global_step": 63165, "epoch": 1503} {"train_loss": -5.812842845916748, "global_step": 63166, "epoch": 1503} {"train_loss": -5.892792474655878, "global_step": 63167, "epoch": 1503, "val_loss": 66993.3984375} {"train_loss": -6.038999557495117, "global_step": 63168, "epoch": 1504} {"train_loss": -6.041449546813965, "global_step": 63169, "epoch": 1504} {"train_loss": -5.871657371520996, "global_step": 63170, "epoch": 1504} {"train_loss": -5.884230136871338, "global_step": 63171, "epoch": 1504} {"train_loss": -5.914741516113281, "global_step": 63172, "epoch": 1504} {"train_loss": -5.849074840545654, "global_step": 63173, "epoch": 1504} {"train_loss": -5.839572429656982, "global_step": 63174, "epoch": 1504} {"train_loss": -6.008129119873047, "global_step": 63175, "epoch": 1504} {"train_loss": -5.82274866104126, "global_step": 63176, "epoch": 1504} {"train_loss": -5.925302505493164, "global_step": 63177, "epoch": 1504} {"train_loss": -5.954187393188477, "global_step": 63178, "epoch": 1504} {"train_loss": -5.8771209716796875, "global_step": 63179, "epoch": 1504} {"train_loss": -5.907347679138184, "global_step": 63180, "epoch": 1504} {"train_loss": -5.881908893585205, "global_step": 63181, "epoch": 1504} {"train_loss": -5.907926559448242, "global_step": 63182, "epoch": 1504} {"train_loss": -5.878542900085449, "global_step": 63183, "epoch": 1504} {"train_loss": -5.9557037353515625, "global_step": 63184, "epoch": 1504} {"train_loss": -5.923912525177002, "global_step": 63185, "epoch": 1504} {"train_loss": -5.899075031280518, "global_step": 63186, "epoch": 1504} {"train_loss": -5.79581880569458, "global_step": 63187, "epoch": 1504} {"train_loss": -5.982425689697266, "global_step": 63188, "epoch": 1504} {"train_loss": -6.084981918334961, "global_step": 63189, "epoch": 1504} {"train_loss": -6.008876323699951, "global_step": 63190, "epoch": 1504} {"train_loss": -5.93233060836792, "global_step": 63191, "epoch": 1504} {"train_loss": -6.042644500732422, "global_step": 63192, "epoch": 1504} {"train_loss": -5.9449238777160645, "global_step": 63193, "epoch": 1504} {"train_loss": -6.0725507736206055, "global_step": 63194, "epoch": 1504} {"train_loss": -5.862248420715332, "global_step": 63195, "epoch": 1504} {"train_loss": -5.898398399353027, "global_step": 63196, "epoch": 1504} {"train_loss": -6.013185977935791, "global_step": 63197, "epoch": 1504} {"train_loss": -6.014215469360352, "global_step": 63198, "epoch": 1504} {"train_loss": -5.982666492462158, "global_step": 63199, "epoch": 1504} {"train_loss": -5.920422077178955, "global_step": 63200, "epoch": 1504} {"train_loss": -5.906835556030273, "global_step": 63201, "epoch": 1504} {"train_loss": -5.887419700622559, "global_step": 63202, "epoch": 1504} {"train_loss": -5.894792556762695, "global_step": 63203, "epoch": 1504} {"train_loss": -6.021726608276367, "global_step": 63204, "epoch": 1504} {"train_loss": -5.877959728240967, "global_step": 63205, "epoch": 1504} {"train_loss": -5.973801612854004, "global_step": 63206, "epoch": 1504} {"train_loss": -5.9591965675354, "global_step": 63207, "epoch": 1504} {"train_loss": -5.926598072052002, "global_step": 63208, "epoch": 1504} {"train_loss": -5.938545749301002, "global_step": 63209, "epoch": 1504, "val_loss": 66948.8828125} {"train_loss": -6.017949104309082, "global_step": 63210, "epoch": 1505} {"train_loss": -6.019037246704102, "global_step": 63211, "epoch": 1505} {"train_loss": -5.890393257141113, "global_step": 63212, "epoch": 1505} {"train_loss": -5.948915481567383, "global_step": 63213, "epoch": 1505} {"train_loss": -6.016989707946777, "global_step": 63214, "epoch": 1505} {"train_loss": -5.986172676086426, "global_step": 63215, "epoch": 1505} {"train_loss": -5.916163444519043, "global_step": 63216, "epoch": 1505} {"train_loss": -6.03406286239624, "global_step": 63217, "epoch": 1505} {"train_loss": -5.890938758850098, "global_step": 63218, "epoch": 1505} {"train_loss": -5.913800239562988, "global_step": 63219, "epoch": 1505} {"train_loss": -5.944149017333984, "global_step": 63220, "epoch": 1505} {"train_loss": -5.915563583374023, "global_step": 63221, "epoch": 1505} {"train_loss": -5.9135847091674805, "global_step": 63222, "epoch": 1505} {"train_loss": -5.914491653442383, "global_step": 63223, "epoch": 1505} {"train_loss": -6.08042049407959, "global_step": 63224, "epoch": 1505} {"train_loss": -5.965936660766602, "global_step": 63225, "epoch": 1505} {"train_loss": -5.954960823059082, "global_step": 63226, "epoch": 1505} {"train_loss": -6.011465072631836, "global_step": 63227, "epoch": 1505} {"train_loss": -5.90310001373291, "global_step": 63228, "epoch": 1505} {"train_loss": -5.881834983825684, "global_step": 63229, "epoch": 1505} {"train_loss": -5.920226097106934, "global_step": 63230, "epoch": 1505} {"train_loss": -5.9939093589782715, "global_step": 63231, "epoch": 1505} {"train_loss": -5.970427989959717, "global_step": 63232, "epoch": 1505} {"train_loss": -5.94650936126709, "global_step": 63233, "epoch": 1505} {"train_loss": -5.930024147033691, "global_step": 63234, "epoch": 1505} {"train_loss": -5.879402160644531, "global_step": 63235, "epoch": 1505} {"train_loss": -5.963461875915527, "global_step": 63236, "epoch": 1505} {"train_loss": -6.0366621017456055, "global_step": 63237, "epoch": 1505} {"train_loss": -5.9052934646606445, "global_step": 63238, "epoch": 1505} {"train_loss": -5.984659194946289, "global_step": 63239, "epoch": 1505} {"train_loss": -5.904843807220459, "global_step": 63240, "epoch": 1505} {"train_loss": -5.93862247467041, "global_step": 63241, "epoch": 1505} {"train_loss": -6.002163887023926, "global_step": 63242, "epoch": 1505} {"train_loss": -5.736084938049316, "global_step": 63243, "epoch": 1505} {"train_loss": -5.7652130126953125, "global_step": 63244, "epoch": 1505} {"train_loss": -5.8309431076049805, "global_step": 63245, "epoch": 1505} {"train_loss": -5.8776397705078125, "global_step": 63246, "epoch": 1505} {"train_loss": -5.842370510101318, "global_step": 63247, "epoch": 1505} {"train_loss": -5.728737831115723, "global_step": 63248, "epoch": 1505} {"train_loss": -6.041373252868652, "global_step": 63249, "epoch": 1505} {"train_loss": -5.928191184997559, "global_step": 63250, "epoch": 1505} {"train_loss": -5.928784608840942, "global_step": 63251, "epoch": 1505, "val_loss": 67156.6953125} {"train_loss": -5.933250427246094, "global_step": 63252, "epoch": 1506} {"train_loss": -5.883457183837891, "global_step": 63253, "epoch": 1506} {"train_loss": -5.87058162689209, "global_step": 63254, "epoch": 1506} {"train_loss": -5.9947590827941895, "global_step": 63255, "epoch": 1506} {"train_loss": -5.972618103027344, "global_step": 63256, "epoch": 1506} {"train_loss": -5.952456474304199, "global_step": 63257, "epoch": 1506} {"train_loss": -5.8067097663879395, "global_step": 63258, "epoch": 1506} {"train_loss": -5.718592643737793, "global_step": 63259, "epoch": 1506} {"train_loss": -5.891927719116211, "global_step": 63260, "epoch": 1506} {"train_loss": -5.862918376922607, "global_step": 63261, "epoch": 1506} {"train_loss": -5.933037757873535, "global_step": 63262, "epoch": 1506} {"train_loss": -5.746502876281738, "global_step": 63263, "epoch": 1506} {"train_loss": -5.787169933319092, "global_step": 63264, "epoch": 1506} {"train_loss": -5.700884819030762, "global_step": 63265, "epoch": 1506} {"train_loss": -5.872880935668945, "global_step": 63266, "epoch": 1506} {"train_loss": -5.948759078979492, "global_step": 63267, "epoch": 1506} {"train_loss": -5.769516944885254, "global_step": 63268, "epoch": 1506} {"train_loss": -5.843018531799316, "global_step": 63269, "epoch": 1506} {"train_loss": -5.845056533813477, "global_step": 63270, "epoch": 1506} {"train_loss": -5.855853080749512, "global_step": 63271, "epoch": 1506} {"train_loss": -5.991056442260742, "global_step": 63272, "epoch": 1506} {"train_loss": -5.802699089050293, "global_step": 63273, "epoch": 1506} {"train_loss": -5.974693775177002, "global_step": 63274, "epoch": 1506} {"train_loss": -5.867999076843262, "global_step": 63275, "epoch": 1506} {"train_loss": -5.8845720291137695, "global_step": 63276, "epoch": 1506} {"train_loss": -5.868260860443115, "global_step": 63277, "epoch": 1506} {"train_loss": -6.023608207702637, "global_step": 63278, "epoch": 1506} {"train_loss": -5.754007339477539, "global_step": 63279, "epoch": 1506} {"train_loss": -5.887352466583252, "global_step": 63280, "epoch": 1506} {"train_loss": -5.970114707946777, "global_step": 63281, "epoch": 1506} {"train_loss": -5.809027194976807, "global_step": 63282, "epoch": 1506} {"train_loss": -5.937525272369385, "global_step": 63283, "epoch": 1506} {"train_loss": -5.91047477722168, "global_step": 63284, "epoch": 1506} {"train_loss": -5.902338981628418, "global_step": 63285, "epoch": 1506} {"train_loss": -5.860891342163086, "global_step": 63286, "epoch": 1506} {"train_loss": -6.050000190734863, "global_step": 63287, "epoch": 1506} {"train_loss": -5.720127105712891, "global_step": 63288, "epoch": 1506} {"train_loss": -5.80802059173584, "global_step": 63289, "epoch": 1506} {"train_loss": -5.9421067237854, "global_step": 63290, "epoch": 1506} {"train_loss": -5.904691696166992, "global_step": 63291, "epoch": 1506} {"train_loss": -5.90058708190918, "global_step": 63292, "epoch": 1506} {"train_loss": -5.8774657476516, "global_step": 63293, "epoch": 1506, "val_loss": 67074.328125} {"train_loss": -5.860339641571045, "global_step": 63294, "epoch": 1507} {"train_loss": -5.911048412322998, "global_step": 63295, "epoch": 1507} {"train_loss": -6.0452470779418945, "global_step": 63296, "epoch": 1507} {"train_loss": -6.0461812019348145, "global_step": 63297, "epoch": 1507} {"train_loss": -5.970719814300537, "global_step": 63298, "epoch": 1507} {"train_loss": -5.929895401000977, "global_step": 63299, "epoch": 1507} {"train_loss": -5.816664218902588, "global_step": 63300, "epoch": 1507} {"train_loss": -5.9258599281311035, "global_step": 63301, "epoch": 1507} {"train_loss": -5.978288650512695, "global_step": 63302, "epoch": 1507} {"train_loss": -5.968029022216797, "global_step": 63303, "epoch": 1507} {"train_loss": -5.853580474853516, "global_step": 63304, "epoch": 1507} {"train_loss": -6.079159259796143, "global_step": 63305, "epoch": 1507} {"train_loss": -5.870763301849365, "global_step": 63306, "epoch": 1507} {"train_loss": -5.91926383972168, "global_step": 63307, "epoch": 1507} {"train_loss": -5.964201927185059, "global_step": 63308, "epoch": 1507} {"train_loss": -5.910645484924316, "global_step": 63309, "epoch": 1507} {"train_loss": -5.873126029968262, "global_step": 63310, "epoch": 1507} {"train_loss": -5.916858673095703, "global_step": 63311, "epoch": 1507} {"train_loss": -5.930298328399658, "global_step": 63312, "epoch": 1507} {"train_loss": -5.939784526824951, "global_step": 63313, "epoch": 1507} {"train_loss": -5.899472236633301, "global_step": 63314, "epoch": 1507} {"train_loss": -5.892088890075684, "global_step": 63315, "epoch": 1507} {"train_loss": -5.872626304626465, "global_step": 63316, "epoch": 1507} {"train_loss": -5.917358875274658, "global_step": 63317, "epoch": 1507} {"train_loss": -5.948065757751465, "global_step": 63318, "epoch": 1507} {"train_loss": -5.820739269256592, "global_step": 63319, "epoch": 1507} {"train_loss": -5.891729354858398, "global_step": 63320, "epoch": 1507} {"train_loss": -6.051051139831543, "global_step": 63321, "epoch": 1507} {"train_loss": -5.908844947814941, "global_step": 63322, "epoch": 1507} {"train_loss": -5.936164855957031, "global_step": 63323, "epoch": 1507} {"train_loss": -5.953592300415039, "global_step": 63324, "epoch": 1507} {"train_loss": -5.9925079345703125, "global_step": 63325, "epoch": 1507} {"train_loss": -5.940600872039795, "global_step": 63326, "epoch": 1507} {"train_loss": -5.906824111938477, "global_step": 63327, "epoch": 1507} {"train_loss": -5.996872901916504, "global_step": 63328, "epoch": 1507} {"train_loss": -6.046477317810059, "global_step": 63329, "epoch": 1507} {"train_loss": -6.057741641998291, "global_step": 63330, "epoch": 1507} {"train_loss": -5.963006496429443, "global_step": 63331, "epoch": 1507} {"train_loss": -5.894421100616455, "global_step": 63332, "epoch": 1507} {"train_loss": -6.093902587890625, "global_step": 63333, "epoch": 1507} {"train_loss": -5.921453475952148, "global_step": 63334, "epoch": 1507} {"train_loss": -5.9448720046452115, "global_step": 63335, "epoch": 1507, "val_loss": 66918.53125} {"train_loss": -5.897592544555664, "global_step": 63336, "epoch": 1508} {"train_loss": -5.948799133300781, "global_step": 63337, "epoch": 1508} {"train_loss": -5.864320755004883, "global_step": 63338, "epoch": 1508} {"train_loss": -5.9898881912231445, "global_step": 63339, "epoch": 1508} {"train_loss": -5.942090034484863, "global_step": 63340, "epoch": 1508} {"train_loss": -5.8436737060546875, "global_step": 63341, "epoch": 1508} {"train_loss": -5.989466190338135, "global_step": 63342, "epoch": 1508} {"train_loss": -5.902832508087158, "global_step": 63343, "epoch": 1508} {"train_loss": -5.9655351638793945, "global_step": 63344, "epoch": 1508} {"train_loss": -5.986509799957275, "global_step": 63345, "epoch": 1508} {"train_loss": -6.158268928527832, "global_step": 63346, "epoch": 1508} {"train_loss": -5.853856086730957, "global_step": 63347, "epoch": 1508} {"train_loss": -6.01238489151001, "global_step": 63348, "epoch": 1508} {"train_loss": -6.165122985839844, "global_step": 63349, "epoch": 1508} {"train_loss": -5.970076560974121, "global_step": 63350, "epoch": 1508} {"train_loss": -5.941498756408691, "global_step": 63351, "epoch": 1508} {"train_loss": -5.942658424377441, "global_step": 63352, "epoch": 1508} {"train_loss": -5.993988990783691, "global_step": 63353, "epoch": 1508} {"train_loss": -5.858318328857422, "global_step": 63354, "epoch": 1508} {"train_loss": -6.015631198883057, "global_step": 63355, "epoch": 1508} {"train_loss": -5.936466217041016, "global_step": 63356, "epoch": 1508} {"train_loss": -5.967232704162598, "global_step": 63357, "epoch": 1508} {"train_loss": -5.944163799285889, "global_step": 63358, "epoch": 1508} {"train_loss": -6.014296531677246, "global_step": 63359, "epoch": 1508} {"train_loss": -5.951159477233887, "global_step": 63360, "epoch": 1508} {"train_loss": -5.960786819458008, "global_step": 63361, "epoch": 1508} {"train_loss": -5.9715576171875, "global_step": 63362, "epoch": 1508} {"train_loss": -5.870596885681152, "global_step": 63363, "epoch": 1508} {"train_loss": -5.883439064025879, "global_step": 63364, "epoch": 1508} {"train_loss": -5.885465621948242, "global_step": 63365, "epoch": 1508} {"train_loss": -6.012179374694824, "global_step": 63366, "epoch": 1508} {"train_loss": -5.9274067878723145, "global_step": 63367, "epoch": 1508} {"train_loss": -5.8474626541137695, "global_step": 63368, "epoch": 1508} {"train_loss": -5.928161144256592, "global_step": 63369, "epoch": 1508} {"train_loss": -5.933391571044922, "global_step": 63370, "epoch": 1508} {"train_loss": -6.060050964355469, "global_step": 63371, "epoch": 1508} {"train_loss": -5.764001846313477, "global_step": 63372, "epoch": 1508} {"train_loss": -5.926876068115234, "global_step": 63373, "epoch": 1508} {"train_loss": -6.078145503997803, "global_step": 63374, "epoch": 1508} {"train_loss": -6.045572757720947, "global_step": 63375, "epoch": 1508} {"train_loss": -5.93358039855957, "global_step": 63376, "epoch": 1508} {"train_loss": -5.954158601306734, "global_step": 63377, "epoch": 1508, "val_loss": 67012.5859375} {"train_loss": -5.982749938964844, "global_step": 63378, "epoch": 1509} {"train_loss": -5.996145725250244, "global_step": 63379, "epoch": 1509} {"train_loss": -5.8807806968688965, "global_step": 63380, "epoch": 1509} {"train_loss": -5.969524383544922, "global_step": 63381, "epoch": 1509} {"train_loss": -6.0531463623046875, "global_step": 63382, "epoch": 1509} {"train_loss": -5.988343715667725, "global_step": 63383, "epoch": 1509} {"train_loss": -5.930912971496582, "global_step": 63384, "epoch": 1509} {"train_loss": -6.033434867858887, "global_step": 63385, "epoch": 1509} {"train_loss": -5.820888996124268, "global_step": 63386, "epoch": 1509} {"train_loss": -5.956636428833008, "global_step": 63387, "epoch": 1509} {"train_loss": -5.781461715698242, "global_step": 63388, "epoch": 1509} {"train_loss": -5.865936279296875, "global_step": 63389, "epoch": 1509} {"train_loss": -5.985152244567871, "global_step": 63390, "epoch": 1509} {"train_loss": -5.789020538330078, "global_step": 63391, "epoch": 1509} {"train_loss": -5.859444618225098, "global_step": 63392, "epoch": 1509} {"train_loss": -5.986064910888672, "global_step": 63393, "epoch": 1509} {"train_loss": -5.845101356506348, "global_step": 63394, "epoch": 1509} {"train_loss": -5.855391979217529, "global_step": 63395, "epoch": 1509} {"train_loss": -6.095753192901611, "global_step": 63396, "epoch": 1509} {"train_loss": -5.849164009094238, "global_step": 63397, "epoch": 1509} {"train_loss": -5.919418811798096, "global_step": 63398, "epoch": 1509} {"train_loss": -5.882038116455078, "global_step": 63399, "epoch": 1509} {"train_loss": -5.945002555847168, "global_step": 63400, "epoch": 1509} {"train_loss": -5.934401512145996, "global_step": 63401, "epoch": 1509} {"train_loss": -5.898210048675537, "global_step": 63402, "epoch": 1509} {"train_loss": -6.022270202636719, "global_step": 63403, "epoch": 1509} {"train_loss": -5.927912712097168, "global_step": 63404, "epoch": 1509} {"train_loss": -5.957000255584717, "global_step": 63405, "epoch": 1509} {"train_loss": -5.974409103393555, "global_step": 63406, "epoch": 1509} {"train_loss": -5.840892791748047, "global_step": 63407, "epoch": 1509} {"train_loss": -5.867203235626221, "global_step": 63408, "epoch": 1509} {"train_loss": -5.891994476318359, "global_step": 63409, "epoch": 1509} {"train_loss": -5.969409942626953, "global_step": 63410, "epoch": 1509} {"train_loss": -5.901028156280518, "global_step": 63411, "epoch": 1509} {"train_loss": -5.954522609710693, "global_step": 63412, "epoch": 1509} {"train_loss": -5.9349822998046875, "global_step": 63413, "epoch": 1509} {"train_loss": -5.894301891326904, "global_step": 63414, "epoch": 1509} {"train_loss": -5.9499430656433105, "global_step": 63415, "epoch": 1509} {"train_loss": -5.900658130645752, "global_step": 63416, "epoch": 1509} {"train_loss": -5.7937092781066895, "global_step": 63417, "epoch": 1509} {"train_loss": -5.9098052978515625, "global_step": 63418, "epoch": 1509} {"train_loss": -5.924445958364577, "global_step": 63419, "epoch": 1509, "val_loss": 66962.96875} {"train_loss": -6.0059003829956055, "global_step": 63420, "epoch": 1510} {"train_loss": -5.933423042297363, "global_step": 63421, "epoch": 1510} {"train_loss": -5.963622093200684, "global_step": 63422, "epoch": 1510} {"train_loss": -5.953439712524414, "global_step": 63423, "epoch": 1510} {"train_loss": -5.919139385223389, "global_step": 63424, "epoch": 1510} {"train_loss": -5.935544967651367, "global_step": 63425, "epoch": 1510} {"train_loss": -5.9235687255859375, "global_step": 63426, "epoch": 1510} {"train_loss": -5.934233665466309, "global_step": 63427, "epoch": 1510} {"train_loss": -6.011100769042969, "global_step": 63428, "epoch": 1510} {"train_loss": -5.7745890617370605, "global_step": 63429, "epoch": 1510} {"train_loss": -6.028922080993652, "global_step": 63430, "epoch": 1510} {"train_loss": -5.897061347961426, "global_step": 63431, "epoch": 1510} {"train_loss": -5.946216583251953, "global_step": 63432, "epoch": 1510} {"train_loss": -5.942666530609131, "global_step": 63433, "epoch": 1510} {"train_loss": -5.794323921203613, "global_step": 63434, "epoch": 1510} {"train_loss": -5.947504043579102, "global_step": 63435, "epoch": 1510} {"train_loss": -5.801424980163574, "global_step": 63436, "epoch": 1510} {"train_loss": -5.915082931518555, "global_step": 63437, "epoch": 1510} {"train_loss": -5.7715163230896, "global_step": 63438, "epoch": 1510} {"train_loss": -5.926365852355957, "global_step": 63439, "epoch": 1510} {"train_loss": -5.991948127746582, "global_step": 63440, "epoch": 1510} {"train_loss": -6.003516674041748, "global_step": 63441, "epoch": 1510} {"train_loss": -5.88385534286499, "global_step": 63442, "epoch": 1510} {"train_loss": -5.912475109100342, "global_step": 63443, "epoch": 1510} {"train_loss": -5.920413017272949, "global_step": 63444, "epoch": 1510} {"train_loss": -6.007397651672363, "global_step": 63445, "epoch": 1510} {"train_loss": -5.935098171234131, "global_step": 63446, "epoch": 1510} {"train_loss": -5.938853740692139, "global_step": 63447, "epoch": 1510} {"train_loss": -5.899951934814453, "global_step": 63448, "epoch": 1510} {"train_loss": -5.935482025146484, "global_step": 63449, "epoch": 1510} {"train_loss": -5.906809329986572, "global_step": 63450, "epoch": 1510} {"train_loss": -5.8810553550720215, "global_step": 63451, "epoch": 1510} {"train_loss": -5.972411155700684, "global_step": 63452, "epoch": 1510} {"train_loss": -5.852099418640137, "global_step": 63453, "epoch": 1510} {"train_loss": -5.852041244506836, "global_step": 63454, "epoch": 1510} {"train_loss": -5.922629356384277, "global_step": 63455, "epoch": 1510} {"train_loss": -5.9243879318237305, "global_step": 63456, "epoch": 1510} {"train_loss": -5.805870532989502, "global_step": 63457, "epoch": 1510} {"train_loss": -5.959771156311035, "global_step": 63458, "epoch": 1510} {"train_loss": -5.916975498199463, "global_step": 63459, "epoch": 1510} {"train_loss": -5.928773880004883, "global_step": 63460, "epoch": 1510} {"train_loss": -5.919610046205067, "global_step": 63461, "epoch": 1510, "val_loss": 66815.8359375} {"train_loss": -5.9841814041137695, "global_step": 63462, "epoch": 1511} {"train_loss": -6.003005027770996, "global_step": 63463, "epoch": 1511} {"train_loss": -5.836308002471924, "global_step": 63464, "epoch": 1511} {"train_loss": -6.0139241218566895, "global_step": 63465, "epoch": 1511} {"train_loss": -5.899747371673584, "global_step": 63466, "epoch": 1511} {"train_loss": -5.947781562805176, "global_step": 63467, "epoch": 1511} {"train_loss": -5.955901145935059, "global_step": 63468, "epoch": 1511} {"train_loss": -6.025883674621582, "global_step": 63469, "epoch": 1511} {"train_loss": -5.9493513107299805, "global_step": 63470, "epoch": 1511} {"train_loss": -5.8601484298706055, "global_step": 63471, "epoch": 1511} {"train_loss": -5.890785217285156, "global_step": 63472, "epoch": 1511} {"train_loss": -5.875688076019287, "global_step": 63473, "epoch": 1511} {"train_loss": -5.876499652862549, "global_step": 63474, "epoch": 1511} {"train_loss": -5.908896446228027, "global_step": 63475, "epoch": 1511} {"train_loss": -5.858346462249756, "global_step": 63476, "epoch": 1511} {"train_loss": -5.944343566894531, "global_step": 63477, "epoch": 1511} {"train_loss": -5.897645950317383, "global_step": 63478, "epoch": 1511} {"train_loss": -5.961391448974609, "global_step": 63479, "epoch": 1511} {"train_loss": -5.84822940826416, "global_step": 63480, "epoch": 1511} {"train_loss": -5.886570453643799, "global_step": 63481, "epoch": 1511} {"train_loss": -5.89129638671875, "global_step": 63482, "epoch": 1511} {"train_loss": -5.904997825622559, "global_step": 63483, "epoch": 1511} {"train_loss": -5.915626049041748, "global_step": 63484, "epoch": 1511} {"train_loss": -5.8966064453125, "global_step": 63485, "epoch": 1511} {"train_loss": -6.0129499435424805, "global_step": 63486, "epoch": 1511} {"train_loss": -5.891317367553711, "global_step": 63487, "epoch": 1511} {"train_loss": -5.9491963386535645, "global_step": 63488, "epoch": 1511} {"train_loss": -5.9395751953125, "global_step": 63489, "epoch": 1511} {"train_loss": -5.968833923339844, "global_step": 63490, "epoch": 1511} {"train_loss": -5.8818359375, "global_step": 63491, "epoch": 1511} {"train_loss": -5.967836380004883, "global_step": 63492, "epoch": 1511} {"train_loss": -5.984670639038086, "global_step": 63493, "epoch": 1511} {"train_loss": -5.964174270629883, "global_step": 63494, "epoch": 1511} {"train_loss": -5.861128807067871, "global_step": 63495, "epoch": 1511} {"train_loss": -5.990246772766113, "global_step": 63496, "epoch": 1511} {"train_loss": -6.13754415512085, "global_step": 63497, "epoch": 1511} {"train_loss": -5.9781365394592285, "global_step": 63498, "epoch": 1511} {"train_loss": -5.96685791015625, "global_step": 63499, "epoch": 1511} {"train_loss": -5.9069671630859375, "global_step": 63500, "epoch": 1511} {"train_loss": -6.011178016662598, "global_step": 63501, "epoch": 1511} {"train_loss": -6.006283283233643, "global_step": 63502, "epoch": 1511} {"train_loss": -5.934912965411232, "global_step": 63503, "epoch": 1511, "val_loss": 66750.53125} {"train_loss": -5.960764408111572, "global_step": 63504, "epoch": 1512} {"train_loss": -5.939453125, "global_step": 63505, "epoch": 1512} {"train_loss": -5.9053754806518555, "global_step": 63506, "epoch": 1512} {"train_loss": -5.896778106689453, "global_step": 63507, "epoch": 1512} {"train_loss": -5.84463357925415, "global_step": 63508, "epoch": 1512} {"train_loss": -5.907320976257324, "global_step": 63509, "epoch": 1512} {"train_loss": -5.936864376068115, "global_step": 63510, "epoch": 1512} {"train_loss": -5.95247745513916, "global_step": 63511, "epoch": 1512} {"train_loss": -5.881840705871582, "global_step": 63512, "epoch": 1512} {"train_loss": -5.9018988609313965, "global_step": 63513, "epoch": 1512} {"train_loss": -5.8955159187316895, "global_step": 63514, "epoch": 1512} {"train_loss": -5.924225807189941, "global_step": 63515, "epoch": 1512} {"train_loss": -5.821955680847168, "global_step": 63516, "epoch": 1512} {"train_loss": -5.772710800170898, "global_step": 63517, "epoch": 1512} {"train_loss": -5.948105812072754, "global_step": 63518, "epoch": 1512} {"train_loss": -5.923502445220947, "global_step": 63519, "epoch": 1512} {"train_loss": -5.87102746963501, "global_step": 63520, "epoch": 1512} {"train_loss": -5.974919319152832, "global_step": 63521, "epoch": 1512} {"train_loss": -5.946524620056152, "global_step": 63522, "epoch": 1512} {"train_loss": -5.945895195007324, "global_step": 63523, "epoch": 1512} {"train_loss": -5.928138256072998, "global_step": 63524, "epoch": 1512} {"train_loss": -5.906100749969482, "global_step": 63525, "epoch": 1512} {"train_loss": -5.97789192199707, "global_step": 63526, "epoch": 1512} {"train_loss": -5.969869613647461, "global_step": 63527, "epoch": 1512} {"train_loss": -5.950506687164307, "global_step": 63528, "epoch": 1512} {"train_loss": -5.965256214141846, "global_step": 63529, "epoch": 1512} {"train_loss": -5.945228099822998, "global_step": 63530, "epoch": 1512} {"train_loss": -5.919755935668945, "global_step": 63531, "epoch": 1512} {"train_loss": -5.968249320983887, "global_step": 63532, "epoch": 1512} {"train_loss": -5.852965354919434, "global_step": 63533, "epoch": 1512} {"train_loss": -5.899130821228027, "global_step": 63534, "epoch": 1512} {"train_loss": -5.879979133605957, "global_step": 63535, "epoch": 1512} {"train_loss": -5.9520087242126465, "global_step": 63536, "epoch": 1512} {"train_loss": -5.822962760925293, "global_step": 63537, "epoch": 1512} {"train_loss": -5.810392379760742, "global_step": 63538, "epoch": 1512} {"train_loss": -5.839344024658203, "global_step": 63539, "epoch": 1512} {"train_loss": -5.924502849578857, "global_step": 63540, "epoch": 1512} {"train_loss": -5.961541175842285, "global_step": 63541, "epoch": 1512} {"train_loss": -5.866187572479248, "global_step": 63542, "epoch": 1512} {"train_loss": -5.93319034576416, "global_step": 63543, "epoch": 1512} {"train_loss": -5.895688056945801, "global_step": 63544, "epoch": 1512} {"train_loss": -5.911859217144194, "global_step": 63545, "epoch": 1512, "val_loss": 66863.140625} {"train_loss": -6.005484104156494, "global_step": 63546, "epoch": 1513} {"train_loss": -5.858119010925293, "global_step": 63547, "epoch": 1513} {"train_loss": -5.831666946411133, "global_step": 63548, "epoch": 1513} {"train_loss": -5.875497817993164, "global_step": 63549, "epoch": 1513} {"train_loss": -5.903824806213379, "global_step": 63550, "epoch": 1513} {"train_loss": -5.896512508392334, "global_step": 63551, "epoch": 1513} {"train_loss": -6.037101745605469, "global_step": 63552, "epoch": 1513} {"train_loss": -5.904199123382568, "global_step": 63553, "epoch": 1513} {"train_loss": -6.012869358062744, "global_step": 63554, "epoch": 1513} {"train_loss": -5.936395645141602, "global_step": 63555, "epoch": 1513} {"train_loss": -5.899576663970947, "global_step": 63556, "epoch": 1513} {"train_loss": -6.0468525886535645, "global_step": 63557, "epoch": 1513} {"train_loss": -5.921331405639648, "global_step": 63558, "epoch": 1513} {"train_loss": -5.918224334716797, "global_step": 63559, "epoch": 1513} {"train_loss": -5.953803062438965, "global_step": 63560, "epoch": 1513} {"train_loss": -5.855864524841309, "global_step": 63561, "epoch": 1513} {"train_loss": -5.967137813568115, "global_step": 63562, "epoch": 1513} {"train_loss": -5.9295573234558105, "global_step": 63563, "epoch": 1513} {"train_loss": -5.896124362945557, "global_step": 63564, "epoch": 1513} {"train_loss": -5.934394836425781, "global_step": 63565, "epoch": 1513} {"train_loss": -5.991972923278809, "global_step": 63566, "epoch": 1513} {"train_loss": -5.944494724273682, "global_step": 63567, "epoch": 1513} {"train_loss": -5.941067695617676, "global_step": 63568, "epoch": 1513} {"train_loss": -5.769933223724365, "global_step": 63569, "epoch": 1513} {"train_loss": -6.0399370193481445, "global_step": 63570, "epoch": 1513} {"train_loss": -5.872531890869141, "global_step": 63571, "epoch": 1513} {"train_loss": -5.92965030670166, "global_step": 63572, "epoch": 1513} {"train_loss": -5.997430324554443, "global_step": 63573, "epoch": 1513} {"train_loss": -5.932570457458496, "global_step": 63574, "epoch": 1513} {"train_loss": -5.855937957763672, "global_step": 63575, "epoch": 1513} {"train_loss": -5.892921447753906, "global_step": 63576, "epoch": 1513} {"train_loss": -5.993144989013672, "global_step": 63577, "epoch": 1513} {"train_loss": -5.935554504394531, "global_step": 63578, "epoch": 1513} {"train_loss": -5.992214679718018, "global_step": 63579, "epoch": 1513} {"train_loss": -5.942739963531494, "global_step": 63580, "epoch": 1513} {"train_loss": -5.96304988861084, "global_step": 63581, "epoch": 1513} {"train_loss": -6.030289173126221, "global_step": 63582, "epoch": 1513} {"train_loss": -5.941556930541992, "global_step": 63583, "epoch": 1513} {"train_loss": -5.785404205322266, "global_step": 63584, "epoch": 1513} {"train_loss": -6.041597843170166, "global_step": 63585, "epoch": 1513} {"train_loss": -5.975913047790527, "global_step": 63586, "epoch": 1513} {"train_loss": -5.936691885902768, "global_step": 63587, "epoch": 1513, "val_loss": 66972.671875} {"train_loss": -5.894255638122559, "global_step": 63588, "epoch": 1514} {"train_loss": -5.939547538757324, "global_step": 63589, "epoch": 1514} {"train_loss": -5.889444351196289, "global_step": 63590, "epoch": 1514} {"train_loss": -5.8834028244018555, "global_step": 63591, "epoch": 1514} {"train_loss": -5.751740455627441, "global_step": 63592, "epoch": 1514} {"train_loss": -6.022565841674805, "global_step": 63593, "epoch": 1514} {"train_loss": -6.012409210205078, "global_step": 63594, "epoch": 1514} {"train_loss": -5.740438461303711, "global_step": 63595, "epoch": 1514} {"train_loss": -5.947842597961426, "global_step": 63596, "epoch": 1514} {"train_loss": -5.9375410079956055, "global_step": 63597, "epoch": 1514} {"train_loss": -5.851372241973877, "global_step": 63598, "epoch": 1514} {"train_loss": -5.937234878540039, "global_step": 63599, "epoch": 1514} {"train_loss": -5.925708293914795, "global_step": 63600, "epoch": 1514} {"train_loss": -5.955320358276367, "global_step": 63601, "epoch": 1514} {"train_loss": -5.877444267272949, "global_step": 63602, "epoch": 1514} {"train_loss": -5.7411980628967285, "global_step": 63603, "epoch": 1514} {"train_loss": -5.9265336990356445, "global_step": 63604, "epoch": 1514} {"train_loss": -5.812578201293945, "global_step": 63605, "epoch": 1514} {"train_loss": -5.905314922332764, "global_step": 63606, "epoch": 1514} {"train_loss": -5.8644561767578125, "global_step": 63607, "epoch": 1514} {"train_loss": -5.939069747924805, "global_step": 63608, "epoch": 1514} {"train_loss": -5.944932460784912, "global_step": 63609, "epoch": 1514} {"train_loss": -5.863766670227051, "global_step": 63610, "epoch": 1514} {"train_loss": -5.894219398498535, "global_step": 63611, "epoch": 1514} {"train_loss": -6.055119514465332, "global_step": 63612, "epoch": 1514} {"train_loss": -5.949894905090332, "global_step": 63613, "epoch": 1514} {"train_loss": -5.980428695678711, "global_step": 63614, "epoch": 1514} {"train_loss": -5.891429424285889, "global_step": 63615, "epoch": 1514} {"train_loss": -5.820891380310059, "global_step": 63616, "epoch": 1514} {"train_loss": -5.877864360809326, "global_step": 63617, "epoch": 1514} {"train_loss": -5.865048408508301, "global_step": 63618, "epoch": 1514} {"train_loss": -5.969107151031494, "global_step": 63619, "epoch": 1514} {"train_loss": -5.992807388305664, "global_step": 63620, "epoch": 1514} {"train_loss": -6.0090436935424805, "global_step": 63621, "epoch": 1514} {"train_loss": -5.895008087158203, "global_step": 63622, "epoch": 1514} {"train_loss": -5.802562713623047, "global_step": 63623, "epoch": 1514} {"train_loss": -5.828451156616211, "global_step": 63624, "epoch": 1514} {"train_loss": -5.786930084228516, "global_step": 63625, "epoch": 1514} {"train_loss": -5.9628729820251465, "global_step": 63626, "epoch": 1514} {"train_loss": -5.868346214294434, "global_step": 63627, "epoch": 1514} {"train_loss": -5.949676036834717, "global_step": 63628, "epoch": 1514} {"train_loss": -5.9008087657746815, "global_step": 63629, "epoch": 1514, "val_loss": 66911.46875} {"train_loss": -5.835399150848389, "global_step": 63630, "epoch": 1515} {"train_loss": -5.860825538635254, "global_step": 63631, "epoch": 1515} {"train_loss": -5.946331024169922, "global_step": 63632, "epoch": 1515} {"train_loss": -5.985401630401611, "global_step": 63633, "epoch": 1515} {"train_loss": -5.836225509643555, "global_step": 63634, "epoch": 1515} {"train_loss": -5.764129638671875, "global_step": 63635, "epoch": 1515} {"train_loss": -5.850399971008301, "global_step": 63636, "epoch": 1515} {"train_loss": -5.719393730163574, "global_step": 63637, "epoch": 1515} {"train_loss": -5.855179786682129, "global_step": 63638, "epoch": 1515} {"train_loss": -5.802159309387207, "global_step": 63639, "epoch": 1515} {"train_loss": -5.9475884437561035, "global_step": 63640, "epoch": 1515} {"train_loss": -5.86650276184082, "global_step": 63641, "epoch": 1515} {"train_loss": -5.847316741943359, "global_step": 63642, "epoch": 1515} {"train_loss": -5.7027997970581055, "global_step": 63643, "epoch": 1515} {"train_loss": -5.838073253631592, "global_step": 63644, "epoch": 1515} {"train_loss": -6.0456223487854, "global_step": 63645, "epoch": 1515} {"train_loss": -5.895064353942871, "global_step": 63646, "epoch": 1515} {"train_loss": -5.9999589920043945, "global_step": 63647, "epoch": 1515} {"train_loss": -5.842839241027832, "global_step": 63648, "epoch": 1515} {"train_loss": -5.928028583526611, "global_step": 63649, "epoch": 1515} {"train_loss": -5.857388496398926, "global_step": 63650, "epoch": 1515} {"train_loss": -6.019113540649414, "global_step": 63651, "epoch": 1515} {"train_loss": -6.002284049987793, "global_step": 63652, "epoch": 1515} {"train_loss": -5.982655048370361, "global_step": 63653, "epoch": 1515} {"train_loss": -5.96228551864624, "global_step": 63654, "epoch": 1515} {"train_loss": -5.9130024909973145, "global_step": 63655, "epoch": 1515} {"train_loss": -5.938686370849609, "global_step": 63656, "epoch": 1515} {"train_loss": -5.887737274169922, "global_step": 63657, "epoch": 1515} {"train_loss": -5.883183002471924, "global_step": 63658, "epoch": 1515} {"train_loss": -5.8818793296813965, "global_step": 63659, "epoch": 1515} {"train_loss": -5.964501857757568, "global_step": 63660, "epoch": 1515} {"train_loss": -5.976863861083984, "global_step": 63661, "epoch": 1515} {"train_loss": -5.956612586975098, "global_step": 63662, "epoch": 1515} {"train_loss": -5.8695878982543945, "global_step": 63663, "epoch": 1515} {"train_loss": -5.8642377853393555, "global_step": 63664, "epoch": 1515} {"train_loss": -5.802491664886475, "global_step": 63665, "epoch": 1515} {"train_loss": -6.070077419281006, "global_step": 63666, "epoch": 1515} {"train_loss": -5.882060527801514, "global_step": 63667, "epoch": 1515} {"train_loss": -5.837575912475586, "global_step": 63668, "epoch": 1515} {"train_loss": -5.8400373458862305, "global_step": 63669, "epoch": 1515} {"train_loss": -5.801767349243164, "global_step": 63670, "epoch": 1515} {"train_loss": -5.890527475447882, "global_step": 63671, "epoch": 1515, "val_loss": 66802.125} {"train_loss": -6.10964298248291, "global_step": 63672, "epoch": 1516} {"train_loss": -5.962059020996094, "global_step": 63673, "epoch": 1516} {"train_loss": -6.085755348205566, "global_step": 63674, "epoch": 1516} {"train_loss": -5.932457447052002, "global_step": 63675, "epoch": 1516} {"train_loss": -5.933420181274414, "global_step": 63676, "epoch": 1516} {"train_loss": -6.045622825622559, "global_step": 63677, "epoch": 1516} {"train_loss": -6.017505645751953, "global_step": 63678, "epoch": 1516} {"train_loss": -6.081229209899902, "global_step": 63679, "epoch": 1516} {"train_loss": -5.918271064758301, "global_step": 63680, "epoch": 1516} {"train_loss": -5.973492622375488, "global_step": 63681, "epoch": 1516} {"train_loss": -6.028231620788574, "global_step": 63682, "epoch": 1516} {"train_loss": -5.98068904876709, "global_step": 63683, "epoch": 1516} {"train_loss": -5.965361595153809, "global_step": 63684, "epoch": 1516} {"train_loss": -5.887333393096924, "global_step": 63685, "epoch": 1516} {"train_loss": -5.887687683105469, "global_step": 63686, "epoch": 1516} {"train_loss": -5.909797668457031, "global_step": 63687, "epoch": 1516} {"train_loss": -5.854291915893555, "global_step": 63688, "epoch": 1516} {"train_loss": -5.794272422790527, "global_step": 63689, "epoch": 1516} {"train_loss": -5.732814788818359, "global_step": 63690, "epoch": 1516} {"train_loss": -5.920517921447754, "global_step": 63691, "epoch": 1516} {"train_loss": -5.938716411590576, "global_step": 63692, "epoch": 1516} {"train_loss": -5.776898384094238, "global_step": 63693, "epoch": 1516} {"train_loss": -5.874875068664551, "global_step": 63694, "epoch": 1516} {"train_loss": -5.799763202667236, "global_step": 63695, "epoch": 1516} {"train_loss": -5.931846618652344, "global_step": 63696, "epoch": 1516} {"train_loss": -5.850468635559082, "global_step": 63697, "epoch": 1516} {"train_loss": -5.908143997192383, "global_step": 63698, "epoch": 1516} {"train_loss": -5.870760917663574, "global_step": 63699, "epoch": 1516} {"train_loss": -6.027961254119873, "global_step": 63700, "epoch": 1516} {"train_loss": -5.904129981994629, "global_step": 63701, "epoch": 1516} {"train_loss": -5.815367698669434, "global_step": 63702, "epoch": 1516} {"train_loss": -5.952944278717041, "global_step": 63703, "epoch": 1516} {"train_loss": -5.817852020263672, "global_step": 63704, "epoch": 1516} {"train_loss": -5.843374252319336, "global_step": 63705, "epoch": 1516} {"train_loss": -5.868840217590332, "global_step": 63706, "epoch": 1516} {"train_loss": -5.742131233215332, "global_step": 63707, "epoch": 1516} {"train_loss": -5.863014221191406, "global_step": 63708, "epoch": 1516} {"train_loss": -5.886438369750977, "global_step": 63709, "epoch": 1516} {"train_loss": -5.938778877258301, "global_step": 63710, "epoch": 1516} {"train_loss": -5.861969470977783, "global_step": 63711, "epoch": 1516} {"train_loss": -5.8816237449646, "global_step": 63712, "epoch": 1516} {"train_loss": -5.908174821308681, "global_step": 63713, "epoch": 1516, "val_loss": 67230.1875} {"train_loss": -6.021635055541992, "global_step": 63714, "epoch": 1517} {"train_loss": -5.864777565002441, "global_step": 63715, "epoch": 1517} {"train_loss": -5.998843193054199, "global_step": 63716, "epoch": 1517} {"train_loss": -5.951566696166992, "global_step": 63717, "epoch": 1517} {"train_loss": -6.006765365600586, "global_step": 63718, "epoch": 1517} {"train_loss": -5.960122108459473, "global_step": 63719, "epoch": 1517} {"train_loss": -5.981967449188232, "global_step": 63720, "epoch": 1517} {"train_loss": -5.804096221923828, "global_step": 63721, "epoch": 1517} {"train_loss": -5.966081142425537, "global_step": 63722, "epoch": 1517} {"train_loss": -6.116374492645264, "global_step": 63723, "epoch": 1517} {"train_loss": -5.97119665145874, "global_step": 63724, "epoch": 1517} {"train_loss": -5.889902114868164, "global_step": 63725, "epoch": 1517} {"train_loss": -5.929776191711426, "global_step": 63726, "epoch": 1517} {"train_loss": -5.819030284881592, "global_step": 63727, "epoch": 1517} {"train_loss": -5.888247489929199, "global_step": 63728, "epoch": 1517} {"train_loss": -5.888860702514648, "global_step": 63729, "epoch": 1517} {"train_loss": -5.974081039428711, "global_step": 63730, "epoch": 1517} {"train_loss": -5.838343143463135, "global_step": 63731, "epoch": 1517} {"train_loss": -5.922354698181152, "global_step": 63732, "epoch": 1517} {"train_loss": -5.905488014221191, "global_step": 63733, "epoch": 1517} {"train_loss": -5.892770767211914, "global_step": 63734, "epoch": 1517} {"train_loss": -5.946024417877197, "global_step": 63735, "epoch": 1517} {"train_loss": -5.874295234680176, "global_step": 63736, "epoch": 1517} {"train_loss": -5.800047874450684, "global_step": 63737, "epoch": 1517} {"train_loss": -5.893096923828125, "global_step": 63738, "epoch": 1517} {"train_loss": -5.773842811584473, "global_step": 63739, "epoch": 1517} {"train_loss": -5.890855312347412, "global_step": 63740, "epoch": 1517} {"train_loss": -5.845565319061279, "global_step": 63741, "epoch": 1517} {"train_loss": -5.865788459777832, "global_step": 63742, "epoch": 1517} {"train_loss": -5.911989212036133, "global_step": 63743, "epoch": 1517} {"train_loss": -5.786355972290039, "global_step": 63744, "epoch": 1517} {"train_loss": -5.93255615234375, "global_step": 63745, "epoch": 1517} {"train_loss": -5.902628421783447, "global_step": 63746, "epoch": 1517} {"train_loss": -5.8952860832214355, "global_step": 63747, "epoch": 1517} {"train_loss": -5.963405132293701, "global_step": 63748, "epoch": 1517} {"train_loss": -5.973634719848633, "global_step": 63749, "epoch": 1517} {"train_loss": -6.012691497802734, "global_step": 63750, "epoch": 1517} {"train_loss": -5.718622207641602, "global_step": 63751, "epoch": 1517} {"train_loss": -5.99826717376709, "global_step": 63752, "epoch": 1517} {"train_loss": -5.893047332763672, "global_step": 63753, "epoch": 1517} {"train_loss": -6.028413772583008, "global_step": 63754, "epoch": 1517} {"train_loss": -5.914491176605225, "global_step": 63755, "epoch": 1517, "val_loss": 67071.28125} {"train_loss": -5.8002519607543945, "global_step": 63756, "epoch": 1518} {"train_loss": -5.880919456481934, "global_step": 63757, "epoch": 1518} {"train_loss": -5.9492902755737305, "global_step": 63758, "epoch": 1518} {"train_loss": -5.924129962921143, "global_step": 63759, "epoch": 1518} {"train_loss": -5.997634410858154, "global_step": 63760, "epoch": 1518} {"train_loss": -5.955796241760254, "global_step": 63761, "epoch": 1518} {"train_loss": -5.8711419105529785, "global_step": 63762, "epoch": 1518} {"train_loss": -5.861340045928955, "global_step": 63763, "epoch": 1518} {"train_loss": -5.885727405548096, "global_step": 63764, "epoch": 1518} {"train_loss": -5.872525691986084, "global_step": 63765, "epoch": 1518} {"train_loss": -5.802307605743408, "global_step": 63766, "epoch": 1518} {"train_loss": -5.9345855712890625, "global_step": 63767, "epoch": 1518} {"train_loss": -5.861189842224121, "global_step": 63768, "epoch": 1518} {"train_loss": -5.986762523651123, "global_step": 63769, "epoch": 1518} {"train_loss": -5.9191389083862305, "global_step": 63770, "epoch": 1518} {"train_loss": -5.909065246582031, "global_step": 63771, "epoch": 1518} {"train_loss": -5.968447208404541, "global_step": 63772, "epoch": 1518} {"train_loss": -5.934847354888916, "global_step": 63773, "epoch": 1518} {"train_loss": -5.999807834625244, "global_step": 63774, "epoch": 1518} {"train_loss": -6.01027250289917, "global_step": 63775, "epoch": 1518} {"train_loss": -5.808976173400879, "global_step": 63776, "epoch": 1518} {"train_loss": -6.051824569702148, "global_step": 63777, "epoch": 1518} {"train_loss": -5.921169281005859, "global_step": 63778, "epoch": 1518} {"train_loss": -5.901726722717285, "global_step": 63779, "epoch": 1518} {"train_loss": -6.1024017333984375, "global_step": 63780, "epoch": 1518} {"train_loss": -5.882708549499512, "global_step": 63781, "epoch": 1518} {"train_loss": -5.956326484680176, "global_step": 63782, "epoch": 1518} {"train_loss": -5.966604709625244, "global_step": 63783, "epoch": 1518} {"train_loss": -5.9671173095703125, "global_step": 63784, "epoch": 1518} {"train_loss": -5.903897285461426, "global_step": 63785, "epoch": 1518} {"train_loss": -5.951643466949463, "global_step": 63786, "epoch": 1518} {"train_loss": -5.859543800354004, "global_step": 63787, "epoch": 1518} {"train_loss": -5.923844337463379, "global_step": 63788, "epoch": 1518} {"train_loss": -5.976133346557617, "global_step": 63789, "epoch": 1518} {"train_loss": -5.957486152648926, "global_step": 63790, "epoch": 1518} {"train_loss": -5.984048843383789, "global_step": 63791, "epoch": 1518} {"train_loss": -5.913830757141113, "global_step": 63792, "epoch": 1518} {"train_loss": -5.9266815185546875, "global_step": 63793, "epoch": 1518} {"train_loss": -5.938488006591797, "global_step": 63794, "epoch": 1518} {"train_loss": -5.892439365386963, "global_step": 63795, "epoch": 1518} {"train_loss": -5.937466621398926, "global_step": 63796, "epoch": 1518} {"train_loss": -5.928974321910313, "global_step": 63797, "epoch": 1518, "val_loss": 66850.3671875} {"train_loss": -6.010347366333008, "global_step": 63798, "epoch": 1519} {"train_loss": -5.856497287750244, "global_step": 63799, "epoch": 1519} {"train_loss": -6.026931285858154, "global_step": 63800, "epoch": 1519} {"train_loss": -5.803835868835449, "global_step": 63801, "epoch": 1519} {"train_loss": -5.980466365814209, "global_step": 63802, "epoch": 1519} {"train_loss": -5.916129112243652, "global_step": 63803, "epoch": 1519} {"train_loss": -5.828986167907715, "global_step": 63804, "epoch": 1519} {"train_loss": -5.865612983703613, "global_step": 63805, "epoch": 1519} {"train_loss": -5.987194061279297, "global_step": 63806, "epoch": 1519} {"train_loss": -5.984536170959473, "global_step": 63807, "epoch": 1519} {"train_loss": -5.681360721588135, "global_step": 63808, "epoch": 1519} {"train_loss": -5.957596778869629, "global_step": 63809, "epoch": 1519} {"train_loss": -5.803225994110107, "global_step": 63810, "epoch": 1519} {"train_loss": -5.897942066192627, "global_step": 63811, "epoch": 1519} {"train_loss": -6.017043113708496, "global_step": 63812, "epoch": 1519} {"train_loss": -5.809523582458496, "global_step": 63813, "epoch": 1519} {"train_loss": -5.8719563484191895, "global_step": 63814, "epoch": 1519} {"train_loss": -5.827856540679932, "global_step": 63815, "epoch": 1519} {"train_loss": -5.9770708084106445, "global_step": 63816, "epoch": 1519} {"train_loss": -5.828131675720215, "global_step": 63817, "epoch": 1519} {"train_loss": -5.762816905975342, "global_step": 63818, "epoch": 1519} {"train_loss": -5.868140697479248, "global_step": 63819, "epoch": 1519} {"train_loss": -5.928411483764648, "global_step": 63820, "epoch": 1519} {"train_loss": -5.869462013244629, "global_step": 63821, "epoch": 1519} {"train_loss": -5.9009857177734375, "global_step": 63822, "epoch": 1519} {"train_loss": -5.946376800537109, "global_step": 63823, "epoch": 1519} {"train_loss": -5.831294059753418, "global_step": 63824, "epoch": 1519} {"train_loss": -5.8350911140441895, "global_step": 63825, "epoch": 1519} {"train_loss": -5.827812671661377, "global_step": 63826, "epoch": 1519} {"train_loss": -5.838714599609375, "global_step": 63827, "epoch": 1519} {"train_loss": -5.959746837615967, "global_step": 63828, "epoch": 1519} {"train_loss": -5.885328769683838, "global_step": 63829, "epoch": 1519} {"train_loss": -5.891162872314453, "global_step": 63830, "epoch": 1519} {"train_loss": -5.792710304260254, "global_step": 63831, "epoch": 1519} {"train_loss": -5.754980564117432, "global_step": 63832, "epoch": 1519} {"train_loss": -5.807388782501221, "global_step": 63833, "epoch": 1519} {"train_loss": -5.823761940002441, "global_step": 63834, "epoch": 1519} {"train_loss": -5.834190368652344, "global_step": 63835, "epoch": 1519} {"train_loss": -5.799434185028076, "global_step": 63836, "epoch": 1519} {"train_loss": -5.89178466796875, "global_step": 63837, "epoch": 1519} {"train_loss": -5.896921634674072, "global_step": 63838, "epoch": 1519} {"train_loss": -5.875445070720854, "global_step": 63839, "epoch": 1519, "val_loss": 67292.578125} {"train_loss": -5.864802360534668, "global_step": 63840, "epoch": 1520} {"train_loss": -5.925891399383545, "global_step": 63841, "epoch": 1520} {"train_loss": -5.866735458374023, "global_step": 63842, "epoch": 1520} {"train_loss": -5.864331245422363, "global_step": 63843, "epoch": 1520} {"train_loss": -5.796464443206787, "global_step": 63844, "epoch": 1520} {"train_loss": -5.838924407958984, "global_step": 63845, "epoch": 1520} {"train_loss": -5.939324378967285, "global_step": 63846, "epoch": 1520} {"train_loss": -5.850231647491455, "global_step": 63847, "epoch": 1520} {"train_loss": -5.92366886138916, "global_step": 63848, "epoch": 1520} {"train_loss": -5.803175926208496, "global_step": 63849, "epoch": 1520} {"train_loss": -5.935665130615234, "global_step": 63850, "epoch": 1520} {"train_loss": -5.981740951538086, "global_step": 63851, "epoch": 1520} {"train_loss": -5.878530502319336, "global_step": 63852, "epoch": 1520} {"train_loss": -5.975397109985352, "global_step": 63853, "epoch": 1520} {"train_loss": -5.926287651062012, "global_step": 63854, "epoch": 1520} {"train_loss": -5.888267993927002, "global_step": 63855, "epoch": 1520} {"train_loss": -5.859361171722412, "global_step": 63856, "epoch": 1520} {"train_loss": -5.846857070922852, "global_step": 63857, "epoch": 1520} {"train_loss": -5.889535903930664, "global_step": 63858, "epoch": 1520} {"train_loss": -5.979058742523193, "global_step": 63859, "epoch": 1520} {"train_loss": -5.808112144470215, "global_step": 63860, "epoch": 1520} {"train_loss": -5.913585662841797, "global_step": 63861, "epoch": 1520} {"train_loss": -5.948576927185059, "global_step": 63862, "epoch": 1520} {"train_loss": -5.959647178649902, "global_step": 63863, "epoch": 1520} {"train_loss": -5.8226728439331055, "global_step": 63864, "epoch": 1520} {"train_loss": -6.036304473876953, "global_step": 63865, "epoch": 1520} {"train_loss": -5.977177619934082, "global_step": 63866, "epoch": 1520} {"train_loss": -5.936410903930664, "global_step": 63867, "epoch": 1520} {"train_loss": -5.939911365509033, "global_step": 63868, "epoch": 1520} {"train_loss": -5.781483173370361, "global_step": 63869, "epoch": 1520} {"train_loss": -5.9121599197387695, "global_step": 63870, "epoch": 1520} {"train_loss": -5.794040679931641, "global_step": 63871, "epoch": 1520} {"train_loss": -5.972298622131348, "global_step": 63872, "epoch": 1520} {"train_loss": -5.935204029083252, "global_step": 63873, "epoch": 1520} {"train_loss": -5.851461410522461, "global_step": 63874, "epoch": 1520} {"train_loss": -5.96083927154541, "global_step": 63875, "epoch": 1520} {"train_loss": -5.9250898361206055, "global_step": 63876, "epoch": 1520} {"train_loss": -5.854737281799316, "global_step": 63877, "epoch": 1520} {"train_loss": -5.868229389190674, "global_step": 63878, "epoch": 1520} {"train_loss": -5.8718953132629395, "global_step": 63879, "epoch": 1520} {"train_loss": -5.83358097076416, "global_step": 63880, "epoch": 1520} {"train_loss": -5.895052217301869, "global_step": 63881, "epoch": 1520, "val_loss": 66970.8359375} {"train_loss": -5.964175224304199, "global_step": 63882, "epoch": 1521} {"train_loss": -5.924230098724365, "global_step": 63883, "epoch": 1521} {"train_loss": -6.012910842895508, "global_step": 63884, "epoch": 1521} {"train_loss": -5.968839645385742, "global_step": 63885, "epoch": 1521} {"train_loss": -5.903313636779785, "global_step": 63886, "epoch": 1521} {"train_loss": -5.86472225189209, "global_step": 63887, "epoch": 1521} {"train_loss": -5.742532730102539, "global_step": 63888, "epoch": 1521} {"train_loss": -5.712460517883301, "global_step": 63889, "epoch": 1521} {"train_loss": -6.0418381690979, "global_step": 63890, "epoch": 1521} {"train_loss": -5.719412803649902, "global_step": 63891, "epoch": 1521} {"train_loss": -5.963962554931641, "global_step": 63892, "epoch": 1521} {"train_loss": -5.973907470703125, "global_step": 63893, "epoch": 1521} {"train_loss": -5.854957580566406, "global_step": 63894, "epoch": 1521} {"train_loss": -5.945286750793457, "global_step": 63895, "epoch": 1521} {"train_loss": -5.875942230224609, "global_step": 63896, "epoch": 1521} {"train_loss": -5.986759185791016, "global_step": 63897, "epoch": 1521} {"train_loss": -5.862186431884766, "global_step": 63898, "epoch": 1521} {"train_loss": -6.054222106933594, "global_step": 63899, "epoch": 1521} {"train_loss": -5.959684371948242, "global_step": 63900, "epoch": 1521} {"train_loss": -5.969311714172363, "global_step": 63901, "epoch": 1521} {"train_loss": -5.927104949951172, "global_step": 63902, "epoch": 1521} {"train_loss": -5.8346428871154785, "global_step": 63903, "epoch": 1521} {"train_loss": -5.990015983581543, "global_step": 63904, "epoch": 1521} {"train_loss": -5.938103199005127, "global_step": 63905, "epoch": 1521} {"train_loss": -5.885126113891602, "global_step": 63906, "epoch": 1521} {"train_loss": -5.894445896148682, "global_step": 63907, "epoch": 1521} {"train_loss": -5.8419647216796875, "global_step": 63908, "epoch": 1521} {"train_loss": -5.987961769104004, "global_step": 63909, "epoch": 1521} {"train_loss": -5.896685600280762, "global_step": 63910, "epoch": 1521} {"train_loss": -5.964322090148926, "global_step": 63911, "epoch": 1521} {"train_loss": -6.1090593338012695, "global_step": 63912, "epoch": 1521} {"train_loss": -5.90349006652832, "global_step": 63913, "epoch": 1521} {"train_loss": -5.926321506500244, "global_step": 63914, "epoch": 1521} {"train_loss": -5.965523719787598, "global_step": 63915, "epoch": 1521} {"train_loss": -5.827077865600586, "global_step": 63916, "epoch": 1521} {"train_loss": -5.981201171875, "global_step": 63917, "epoch": 1521} {"train_loss": -5.816901206970215, "global_step": 63918, "epoch": 1521} {"train_loss": -5.911213397979736, "global_step": 63919, "epoch": 1521} {"train_loss": -5.851558685302734, "global_step": 63920, "epoch": 1521} {"train_loss": -5.934791088104248, "global_step": 63921, "epoch": 1521} {"train_loss": -5.944360733032227, "global_step": 63922, "epoch": 1521} {"train_loss": -5.918442510423207, "global_step": 63923, "epoch": 1521, "val_loss": 67059.125} {"train_loss": -5.956903457641602, "global_step": 63924, "epoch": 1522} {"train_loss": -5.986370086669922, "global_step": 63925, "epoch": 1522} {"train_loss": -5.818385124206543, "global_step": 63926, "epoch": 1522} {"train_loss": -5.979764461517334, "global_step": 63927, "epoch": 1522} {"train_loss": -6.016057968139648, "global_step": 63928, "epoch": 1522} {"train_loss": -5.92559289932251, "global_step": 63929, "epoch": 1522} {"train_loss": -5.947287559509277, "global_step": 63930, "epoch": 1522} {"train_loss": -5.900110244750977, "global_step": 63931, "epoch": 1522} {"train_loss": -5.833560943603516, "global_step": 63932, "epoch": 1522} {"train_loss": -5.893212795257568, "global_step": 63933, "epoch": 1522} {"train_loss": -5.999719619750977, "global_step": 63934, "epoch": 1522} {"train_loss": -5.816043853759766, "global_step": 63935, "epoch": 1522} {"train_loss": -5.966004371643066, "global_step": 63936, "epoch": 1522} {"train_loss": -5.901005268096924, "global_step": 63937, "epoch": 1522} {"train_loss": -5.689867973327637, "global_step": 63938, "epoch": 1522} {"train_loss": -5.883174896240234, "global_step": 63939, "epoch": 1522} {"train_loss": -5.803806781768799, "global_step": 63940, "epoch": 1522} {"train_loss": -5.8653411865234375, "global_step": 63941, "epoch": 1522} {"train_loss": -5.847249984741211, "global_step": 63942, "epoch": 1522} {"train_loss": -5.895654678344727, "global_step": 63943, "epoch": 1522} {"train_loss": -5.751334190368652, "global_step": 63944, "epoch": 1522} {"train_loss": -5.858947277069092, "global_step": 63945, "epoch": 1522} {"train_loss": -5.834413051605225, "global_step": 63946, "epoch": 1522} {"train_loss": -6.0042524337768555, "global_step": 63947, "epoch": 1522} {"train_loss": -5.974430084228516, "global_step": 63948, "epoch": 1522} {"train_loss": -6.039402484893799, "global_step": 63949, "epoch": 1522} {"train_loss": -5.8741559982299805, "global_step": 63950, "epoch": 1522} {"train_loss": -5.884615898132324, "global_step": 63951, "epoch": 1522} {"train_loss": -5.728453159332275, "global_step": 63952, "epoch": 1522} {"train_loss": -5.853124618530273, "global_step": 63953, "epoch": 1522} {"train_loss": -5.899134635925293, "global_step": 63954, "epoch": 1522} {"train_loss": -5.935671329498291, "global_step": 63955, "epoch": 1522} {"train_loss": -5.988873481750488, "global_step": 63956, "epoch": 1522} {"train_loss": -5.846457004547119, "global_step": 63957, "epoch": 1522} {"train_loss": -5.951361656188965, "global_step": 63958, "epoch": 1522} {"train_loss": -5.825695037841797, "global_step": 63959, "epoch": 1522} {"train_loss": -5.973186016082764, "global_step": 63960, "epoch": 1522} {"train_loss": -5.9992194175720215, "global_step": 63961, "epoch": 1522} {"train_loss": -5.857508182525635, "global_step": 63962, "epoch": 1522} {"train_loss": -5.90416955947876, "global_step": 63963, "epoch": 1522} {"train_loss": -5.836547374725342, "global_step": 63964, "epoch": 1522} {"train_loss": -5.896141018186297, "global_step": 63965, "epoch": 1522, "val_loss": 66767.484375} {"train_loss": -6.010418891906738, "global_step": 63966, "epoch": 1523} {"train_loss": -5.868058204650879, "global_step": 63967, "epoch": 1523} {"train_loss": -5.888294696807861, "global_step": 63968, "epoch": 1523} {"train_loss": -5.917824745178223, "global_step": 63969, "epoch": 1523} {"train_loss": -6.011709213256836, "global_step": 63970, "epoch": 1523} {"train_loss": -5.926441192626953, "global_step": 63971, "epoch": 1523} {"train_loss": -6.016520023345947, "global_step": 63972, "epoch": 1523} {"train_loss": -6.012907028198242, "global_step": 63973, "epoch": 1523} {"train_loss": -5.9923601150512695, "global_step": 63974, "epoch": 1523} {"train_loss": -6.001361846923828, "global_step": 63975, "epoch": 1523} {"train_loss": -6.016024589538574, "global_step": 63976, "epoch": 1523} {"train_loss": -5.843023777008057, "global_step": 63977, "epoch": 1523} {"train_loss": -5.939790725708008, "global_step": 63978, "epoch": 1523} {"train_loss": -6.008126258850098, "global_step": 63979, "epoch": 1523} {"train_loss": -5.856595993041992, "global_step": 63980, "epoch": 1523} {"train_loss": -5.950893402099609, "global_step": 63981, "epoch": 1523} {"train_loss": -5.761499881744385, "global_step": 63982, "epoch": 1523} {"train_loss": -6.006496429443359, "global_step": 63983, "epoch": 1523} {"train_loss": -6.057249069213867, "global_step": 63984, "epoch": 1523} {"train_loss": -5.888016700744629, "global_step": 63985, "epoch": 1523} {"train_loss": -5.849783420562744, "global_step": 63986, "epoch": 1523} {"train_loss": -5.773008346557617, "global_step": 63987, "epoch": 1523} {"train_loss": -6.022767066955566, "global_step": 63988, "epoch": 1523} {"train_loss": -5.924859046936035, "global_step": 63989, "epoch": 1523} {"train_loss": -5.830709457397461, "global_step": 63990, "epoch": 1523} {"train_loss": -6.008854866027832, "global_step": 63991, "epoch": 1523} {"train_loss": -5.915384292602539, "global_step": 63992, "epoch": 1523} {"train_loss": -5.891345977783203, "global_step": 63993, "epoch": 1523} {"train_loss": -6.004539489746094, "global_step": 63994, "epoch": 1523} {"train_loss": -5.782289505004883, "global_step": 63995, "epoch": 1523} {"train_loss": -5.979531764984131, "global_step": 63996, "epoch": 1523} {"train_loss": -5.960328578948975, "global_step": 63997, "epoch": 1523} {"train_loss": -5.735058784484863, "global_step": 63998, "epoch": 1523} {"train_loss": -5.955283164978027, "global_step": 63999, "epoch": 1523} {"train_loss": -5.924872398376465, "global_step": 64000, "epoch": 1523} {"train_loss": -5.9254231452941895, "global_step": 64001, "epoch": 1523} {"train_loss": -5.995813369750977, "global_step": 64002, "epoch": 1523} {"train_loss": -5.945520877838135, "global_step": 64003, "epoch": 1523} {"train_loss": -5.852022647857666, "global_step": 64004, "epoch": 1523} {"train_loss": -6.037026405334473, "global_step": 64005, "epoch": 1523} {"train_loss": -5.906728267669678, "global_step": 64006, "epoch": 1523} {"train_loss": -5.929428679602487, "global_step": 64007, "epoch": 1523, "val_loss": 67118.8671875} {"train_loss": -5.900923252105713, "global_step": 64008, "epoch": 1524} {"train_loss": -5.911133289337158, "global_step": 64009, "epoch": 1524} {"train_loss": -5.978763580322266, "global_step": 64010, "epoch": 1524} {"train_loss": -5.878150463104248, "global_step": 64011, "epoch": 1524} {"train_loss": -5.868278503417969, "global_step": 64012, "epoch": 1524} {"train_loss": -5.939056873321533, "global_step": 64013, "epoch": 1524} {"train_loss": -6.038954734802246, "global_step": 64014, "epoch": 1524} {"train_loss": -5.974486351013184, "global_step": 64015, "epoch": 1524} {"train_loss": -6.0120344161987305, "global_step": 64016, "epoch": 1524} {"train_loss": -5.959226608276367, "global_step": 64017, "epoch": 1524} {"train_loss": -5.891684055328369, "global_step": 64018, "epoch": 1524} {"train_loss": -6.092623233795166, "global_step": 64019, "epoch": 1524} {"train_loss": -5.947758674621582, "global_step": 64020, "epoch": 1524} {"train_loss": -5.964199066162109, "global_step": 64021, "epoch": 1524} {"train_loss": -5.887495517730713, "global_step": 64022, "epoch": 1524} {"train_loss": -5.955429553985596, "global_step": 64023, "epoch": 1524} {"train_loss": -5.945265769958496, "global_step": 64024, "epoch": 1524} {"train_loss": -5.9149298667907715, "global_step": 64025, "epoch": 1524} {"train_loss": -5.999065399169922, "global_step": 64026, "epoch": 1524} {"train_loss": -5.829718589782715, "global_step": 64027, "epoch": 1524} {"train_loss": -5.850881099700928, "global_step": 64028, "epoch": 1524} {"train_loss": -6.01888370513916, "global_step": 64029, "epoch": 1524} {"train_loss": -5.9456377029418945, "global_step": 64030, "epoch": 1524} {"train_loss": -5.901250839233398, "global_step": 64031, "epoch": 1524} {"train_loss": -5.963444709777832, "global_step": 64032, "epoch": 1524} {"train_loss": -5.97109317779541, "global_step": 64033, "epoch": 1524} {"train_loss": -5.782077312469482, "global_step": 64034, "epoch": 1524} {"train_loss": -6.0684919357299805, "global_step": 64035, "epoch": 1524} {"train_loss": -5.934513568878174, "global_step": 64036, "epoch": 1524} {"train_loss": -6.028120517730713, "global_step": 64037, "epoch": 1524} {"train_loss": -5.9810380935668945, "global_step": 64038, "epoch": 1524} {"train_loss": -5.908662796020508, "global_step": 64039, "epoch": 1524} {"train_loss": -5.796216011047363, "global_step": 64040, "epoch": 1524} {"train_loss": -6.000426292419434, "global_step": 64041, "epoch": 1524} {"train_loss": -5.935839653015137, "global_step": 64042, "epoch": 1524} {"train_loss": -5.908214569091797, "global_step": 64043, "epoch": 1524} {"train_loss": -5.945985317230225, "global_step": 64044, "epoch": 1524} {"train_loss": -6.01181697845459, "global_step": 64045, "epoch": 1524} {"train_loss": -5.974216461181641, "global_step": 64046, "epoch": 1524} {"train_loss": -6.021487236022949, "global_step": 64047, "epoch": 1524} {"train_loss": -6.052334785461426, "global_step": 64048, "epoch": 1524} {"train_loss": -5.947861512502034, "global_step": 64049, "epoch": 1524, "val_loss": 66873.578125} {"train_loss": -5.910702705383301, "global_step": 64050, "epoch": 1525} {"train_loss": -6.050666809082031, "global_step": 64051, "epoch": 1525} {"train_loss": -5.9748029708862305, "global_step": 64052, "epoch": 1525} {"train_loss": -6.016724586486816, "global_step": 64053, "epoch": 1525} {"train_loss": -5.893763065338135, "global_step": 64054, "epoch": 1525} {"train_loss": -6.048028945922852, "global_step": 64055, "epoch": 1525} {"train_loss": -5.976909637451172, "global_step": 64056, "epoch": 1525} {"train_loss": -5.988933086395264, "global_step": 64057, "epoch": 1525} {"train_loss": -5.879864692687988, "global_step": 64058, "epoch": 1525} {"train_loss": -5.906556606292725, "global_step": 64059, "epoch": 1525} {"train_loss": -5.958001136779785, "global_step": 64060, "epoch": 1525} {"train_loss": -5.851896286010742, "global_step": 64061, "epoch": 1525} {"train_loss": -5.918702125549316, "global_step": 64062, "epoch": 1525} {"train_loss": -6.01969051361084, "global_step": 64063, "epoch": 1525} {"train_loss": -5.936212539672852, "global_step": 64064, "epoch": 1525} {"train_loss": -5.968342304229736, "global_step": 64065, "epoch": 1525} {"train_loss": -5.967164993286133, "global_step": 64066, "epoch": 1525} {"train_loss": -5.925942897796631, "global_step": 64067, "epoch": 1525} {"train_loss": -5.967500686645508, "global_step": 64068, "epoch": 1525} {"train_loss": -6.109858512878418, "global_step": 64069, "epoch": 1525} {"train_loss": -6.01364803314209, "global_step": 64070, "epoch": 1525} {"train_loss": -5.921446323394775, "global_step": 64071, "epoch": 1525} {"train_loss": -5.948631286621094, "global_step": 64072, "epoch": 1525} {"train_loss": -5.870744705200195, "global_step": 64073, "epoch": 1525} {"train_loss": -6.004591941833496, "global_step": 64074, "epoch": 1525} {"train_loss": -5.880666255950928, "global_step": 64075, "epoch": 1525} {"train_loss": -5.895550727844238, "global_step": 64076, "epoch": 1525} {"train_loss": -5.9501953125, "global_step": 64077, "epoch": 1525} {"train_loss": -5.796311378479004, "global_step": 64078, "epoch": 1525} {"train_loss": -6.013360023498535, "global_step": 64079, "epoch": 1525} {"train_loss": -6.0208611488342285, "global_step": 64080, "epoch": 1525} {"train_loss": -5.899200439453125, "global_step": 64081, "epoch": 1525} {"train_loss": -5.988386154174805, "global_step": 64082, "epoch": 1525} {"train_loss": -5.817420482635498, "global_step": 64083, "epoch": 1525} {"train_loss": -5.946359634399414, "global_step": 64084, "epoch": 1525} {"train_loss": -5.881175994873047, "global_step": 64085, "epoch": 1525} {"train_loss": -5.906599998474121, "global_step": 64086, "epoch": 1525} {"train_loss": -5.87810754776001, "global_step": 64087, "epoch": 1525} {"train_loss": -5.850517272949219, "global_step": 64088, "epoch": 1525} {"train_loss": -5.888392448425293, "global_step": 64089, "epoch": 1525} {"train_loss": -5.820453643798828, "global_step": 64090, "epoch": 1525} {"train_loss": -5.938290403002784, "global_step": 64091, "epoch": 1525, "val_loss": 66976.21875} {"train_loss": -5.941035270690918, "global_step": 64092, "epoch": 1526} {"train_loss": -5.9776716232299805, "global_step": 64093, "epoch": 1526} {"train_loss": -6.01767635345459, "global_step": 64094, "epoch": 1526} {"train_loss": -5.976325035095215, "global_step": 64095, "epoch": 1526} {"train_loss": -5.97481107711792, "global_step": 64096, "epoch": 1526} {"train_loss": -5.911062240600586, "global_step": 64097, "epoch": 1526} {"train_loss": -5.894302845001221, "global_step": 64098, "epoch": 1526} {"train_loss": -5.951131343841553, "global_step": 64099, "epoch": 1526} {"train_loss": -5.926190376281738, "global_step": 64100, "epoch": 1526} {"train_loss": -5.954970359802246, "global_step": 64101, "epoch": 1526} {"train_loss": -5.971342086791992, "global_step": 64102, "epoch": 1526} {"train_loss": -5.979964256286621, "global_step": 64103, "epoch": 1526} {"train_loss": -5.974822044372559, "global_step": 64104, "epoch": 1526} {"train_loss": -5.979218006134033, "global_step": 64105, "epoch": 1526} {"train_loss": -5.934867858886719, "global_step": 64106, "epoch": 1526} {"train_loss": -5.802793502807617, "global_step": 64107, "epoch": 1526} {"train_loss": -5.798436164855957, "global_step": 64108, "epoch": 1526} {"train_loss": -5.98737907409668, "global_step": 64109, "epoch": 1526} {"train_loss": -5.817352294921875, "global_step": 64110, "epoch": 1526} {"train_loss": -5.919747829437256, "global_step": 64111, "epoch": 1526} {"train_loss": -5.837831974029541, "global_step": 64112, "epoch": 1526} {"train_loss": -5.7542877197265625, "global_step": 64113, "epoch": 1526} {"train_loss": -5.948765277862549, "global_step": 64114, "epoch": 1526} {"train_loss": -5.779171943664551, "global_step": 64115, "epoch": 1526} {"train_loss": -5.927742004394531, "global_step": 64116, "epoch": 1526} {"train_loss": -6.107546806335449, "global_step": 64117, "epoch": 1526} {"train_loss": -5.95728874206543, "global_step": 64118, "epoch": 1526} {"train_loss": -5.930538177490234, "global_step": 64119, "epoch": 1526} {"train_loss": -5.935914993286133, "global_step": 64120, "epoch": 1526} {"train_loss": -5.844953536987305, "global_step": 64121, "epoch": 1526} {"train_loss": -6.033815383911133, "global_step": 64122, "epoch": 1526} {"train_loss": -5.900351524353027, "global_step": 64123, "epoch": 1526} {"train_loss": -5.922106742858887, "global_step": 64124, "epoch": 1526} {"train_loss": -5.94189977645874, "global_step": 64125, "epoch": 1526} {"train_loss": -5.892794132232666, "global_step": 64126, "epoch": 1526} {"train_loss": -5.952821731567383, "global_step": 64127, "epoch": 1526} {"train_loss": -5.8656415939331055, "global_step": 64128, "epoch": 1526} {"train_loss": -5.8637847900390625, "global_step": 64129, "epoch": 1526} {"train_loss": -5.8578081130981445, "global_step": 64130, "epoch": 1526} {"train_loss": -5.915916442871094, "global_step": 64131, "epoch": 1526} {"train_loss": -5.930562973022461, "global_step": 64132, "epoch": 1526} {"train_loss": -5.918012834730602, "global_step": 64133, "epoch": 1526, "val_loss": 66878.265625} {"train_loss": -5.921761512756348, "global_step": 64134, "epoch": 1527} {"train_loss": -5.937881946563721, "global_step": 64135, "epoch": 1527} {"train_loss": -6.003684997558594, "global_step": 64136, "epoch": 1527} {"train_loss": -5.80341911315918, "global_step": 64137, "epoch": 1527} {"train_loss": -5.978017807006836, "global_step": 64138, "epoch": 1527} {"train_loss": -5.846953392028809, "global_step": 64139, "epoch": 1527} {"train_loss": -5.934637069702148, "global_step": 64140, "epoch": 1527} {"train_loss": -5.893063545227051, "global_step": 64141, "epoch": 1527} {"train_loss": -5.865842819213867, "global_step": 64142, "epoch": 1527} {"train_loss": -5.854113578796387, "global_step": 64143, "epoch": 1527} {"train_loss": -5.958208084106445, "global_step": 64144, "epoch": 1527} {"train_loss": -6.119437217712402, "global_step": 64145, "epoch": 1527} {"train_loss": -5.950265884399414, "global_step": 64146, "epoch": 1527} {"train_loss": -5.857865333557129, "global_step": 64147, "epoch": 1527} {"train_loss": -5.895324230194092, "global_step": 64148, "epoch": 1527} {"train_loss": -5.988348007202148, "global_step": 64149, "epoch": 1527} {"train_loss": -5.93497371673584, "global_step": 64150, "epoch": 1527} {"train_loss": -5.928729057312012, "global_step": 64151, "epoch": 1527} {"train_loss": -5.986181735992432, "global_step": 64152, "epoch": 1527} {"train_loss": -5.977145195007324, "global_step": 64153, "epoch": 1527} {"train_loss": -6.046679496765137, "global_step": 64154, "epoch": 1527} {"train_loss": -5.946979999542236, "global_step": 64155, "epoch": 1527} {"train_loss": -5.941435813903809, "global_step": 64156, "epoch": 1527} {"train_loss": -6.025956153869629, "global_step": 64157, "epoch": 1527} {"train_loss": -6.060353755950928, "global_step": 64158, "epoch": 1527} {"train_loss": -5.827513217926025, "global_step": 64159, "epoch": 1527} {"train_loss": -5.850081920623779, "global_step": 64160, "epoch": 1527} {"train_loss": -5.955164909362793, "global_step": 64161, "epoch": 1527} {"train_loss": -5.950891971588135, "global_step": 64162, "epoch": 1527} {"train_loss": -5.825897216796875, "global_step": 64163, "epoch": 1527} {"train_loss": -5.886448860168457, "global_step": 64164, "epoch": 1527} {"train_loss": -5.891027450561523, "global_step": 64165, "epoch": 1527} {"train_loss": -5.897636413574219, "global_step": 64166, "epoch": 1527} {"train_loss": -5.922423839569092, "global_step": 64167, "epoch": 1527} {"train_loss": -5.8999786376953125, "global_step": 64168, "epoch": 1527} {"train_loss": -5.893209457397461, "global_step": 64169, "epoch": 1527} {"train_loss": -5.864833831787109, "global_step": 64170, "epoch": 1527} {"train_loss": -6.051331043243408, "global_step": 64171, "epoch": 1527} {"train_loss": -5.847951889038086, "global_step": 64172, "epoch": 1527} {"train_loss": -5.953808784484863, "global_step": 64173, "epoch": 1527} {"train_loss": -5.8927154541015625, "global_step": 64174, "epoch": 1527} {"train_loss": -5.932184957322621, "global_step": 64175, "epoch": 1527, "val_loss": 67056.9609375} {"train_loss": -5.978287696838379, "global_step": 64176, "epoch": 1528} {"train_loss": -5.947567939758301, "global_step": 64177, "epoch": 1528} {"train_loss": -5.972626686096191, "global_step": 64178, "epoch": 1528} {"train_loss": -5.784542083740234, "global_step": 64179, "epoch": 1528} {"train_loss": -6.005938529968262, "global_step": 64180, "epoch": 1528} {"train_loss": -5.881369590759277, "global_step": 64181, "epoch": 1528} {"train_loss": -5.845752716064453, "global_step": 64182, "epoch": 1528} {"train_loss": -5.997258186340332, "global_step": 64183, "epoch": 1528} {"train_loss": -5.917576789855957, "global_step": 64184, "epoch": 1528} {"train_loss": -5.97264289855957, "global_step": 64185, "epoch": 1528} {"train_loss": -5.917075157165527, "global_step": 64186, "epoch": 1528} {"train_loss": -6.020124912261963, "global_step": 64187, "epoch": 1528} {"train_loss": -6.0323381423950195, "global_step": 64188, "epoch": 1528} {"train_loss": -5.99334716796875, "global_step": 64189, "epoch": 1528} {"train_loss": -5.945340156555176, "global_step": 64190, "epoch": 1528} {"train_loss": -6.009027481079102, "global_step": 64191, "epoch": 1528} {"train_loss": -6.022650718688965, "global_step": 64192, "epoch": 1528} {"train_loss": -5.877234935760498, "global_step": 64193, "epoch": 1528} {"train_loss": -6.043781757354736, "global_step": 64194, "epoch": 1528} {"train_loss": -5.810449600219727, "global_step": 64195, "epoch": 1528} {"train_loss": -6.116605281829834, "global_step": 64196, "epoch": 1528} {"train_loss": -5.921868801116943, "global_step": 64197, "epoch": 1528} {"train_loss": -5.866766452789307, "global_step": 64198, "epoch": 1528} {"train_loss": -5.904885292053223, "global_step": 64199, "epoch": 1528} {"train_loss": -5.9167680740356445, "global_step": 64200, "epoch": 1528} {"train_loss": -5.875316619873047, "global_step": 64201, "epoch": 1528} {"train_loss": -5.939610481262207, "global_step": 64202, "epoch": 1528} {"train_loss": -5.902030944824219, "global_step": 64203, "epoch": 1528} {"train_loss": -5.866479873657227, "global_step": 64204, "epoch": 1528} {"train_loss": -5.897356033325195, "global_step": 64205, "epoch": 1528} {"train_loss": -6.0054545402526855, "global_step": 64206, "epoch": 1528} {"train_loss": -5.9274678230285645, "global_step": 64207, "epoch": 1528} {"train_loss": -5.914278030395508, "global_step": 64208, "epoch": 1528} {"train_loss": -5.930826663970947, "global_step": 64209, "epoch": 1528} {"train_loss": -5.944520950317383, "global_step": 64210, "epoch": 1528} {"train_loss": -5.8923187255859375, "global_step": 64211, "epoch": 1528} {"train_loss": -5.957765579223633, "global_step": 64212, "epoch": 1528} {"train_loss": -5.788377285003662, "global_step": 64213, "epoch": 1528} {"train_loss": -6.0352702140808105, "global_step": 64214, "epoch": 1528} {"train_loss": -5.976258277893066, "global_step": 64215, "epoch": 1528} {"train_loss": -5.935020446777344, "global_step": 64216, "epoch": 1528} {"train_loss": -5.937829267411005, "global_step": 64217, "epoch": 1528, "val_loss": 67011.453125} {"train_loss": -5.893035888671875, "global_step": 64218, "epoch": 1529} {"train_loss": -5.983185768127441, "global_step": 64219, "epoch": 1529} {"train_loss": -5.8986496925354, "global_step": 64220, "epoch": 1529} {"train_loss": -5.943544387817383, "global_step": 64221, "epoch": 1529} {"train_loss": -5.957229137420654, "global_step": 64222, "epoch": 1529} {"train_loss": -5.955625534057617, "global_step": 64223, "epoch": 1529} {"train_loss": -5.988633155822754, "global_step": 64224, "epoch": 1529} {"train_loss": -5.962688446044922, "global_step": 64225, "epoch": 1529} {"train_loss": -5.959886074066162, "global_step": 64226, "epoch": 1529} {"train_loss": -5.9559526443481445, "global_step": 64227, "epoch": 1529} {"train_loss": -5.888925075531006, "global_step": 64228, "epoch": 1529} {"train_loss": -5.904197692871094, "global_step": 64229, "epoch": 1529} {"train_loss": -5.980971336364746, "global_step": 64230, "epoch": 1529} {"train_loss": -6.037639617919922, "global_step": 64231, "epoch": 1529} {"train_loss": -5.963247776031494, "global_step": 64232, "epoch": 1529} {"train_loss": -5.933887004852295, "global_step": 64233, "epoch": 1529} {"train_loss": -5.920069694519043, "global_step": 64234, "epoch": 1529} {"train_loss": -5.862579345703125, "global_step": 64235, "epoch": 1529} {"train_loss": -6.073295593261719, "global_step": 64236, "epoch": 1529} {"train_loss": -5.993540287017822, "global_step": 64237, "epoch": 1529} {"train_loss": -5.877042770385742, "global_step": 64238, "epoch": 1529} {"train_loss": -5.9774675369262695, "global_step": 64239, "epoch": 1529} {"train_loss": -5.944098472595215, "global_step": 64240, "epoch": 1529} {"train_loss": -5.998115539550781, "global_step": 64241, "epoch": 1529} {"train_loss": -6.02961540222168, "global_step": 64242, "epoch": 1529} {"train_loss": -5.998518943786621, "global_step": 64243, "epoch": 1529} {"train_loss": -5.919466972351074, "global_step": 64244, "epoch": 1529} {"train_loss": -5.985104560852051, "global_step": 64245, "epoch": 1529} {"train_loss": -5.867316246032715, "global_step": 64246, "epoch": 1529} {"train_loss": -5.936031341552734, "global_step": 64247, "epoch": 1529} {"train_loss": -5.885262489318848, "global_step": 64248, "epoch": 1529} {"train_loss": -5.841133117675781, "global_step": 64249, "epoch": 1529} {"train_loss": -6.0410943031311035, "global_step": 64250, "epoch": 1529} {"train_loss": -5.9930100440979, "global_step": 64251, "epoch": 1529} {"train_loss": -5.992594242095947, "global_step": 64252, "epoch": 1529} {"train_loss": -5.845446586608887, "global_step": 64253, "epoch": 1529} {"train_loss": -5.949123382568359, "global_step": 64254, "epoch": 1529} {"train_loss": -6.087071418762207, "global_step": 64255, "epoch": 1529} {"train_loss": -5.935912132263184, "global_step": 64256, "epoch": 1529} {"train_loss": -5.953242778778076, "global_step": 64257, "epoch": 1529} {"train_loss": -5.9825239181518555, "global_step": 64258, "epoch": 1529} {"train_loss": -5.953789336340768, "global_step": 64259, "epoch": 1529, "val_loss": 67006.6796875} {"train_loss": -5.908946990966797, "global_step": 64260, "epoch": 1530} {"train_loss": -6.071292877197266, "global_step": 64261, "epoch": 1530} {"train_loss": -5.94481086730957, "global_step": 64262, "epoch": 1530} {"train_loss": -6.002954959869385, "global_step": 64263, "epoch": 1530} {"train_loss": -5.956972122192383, "global_step": 64264, "epoch": 1530} {"train_loss": -6.063366413116455, "global_step": 64265, "epoch": 1530} {"train_loss": -5.949402809143066, "global_step": 64266, "epoch": 1530} {"train_loss": -5.993930816650391, "global_step": 64267, "epoch": 1530} {"train_loss": -5.987137317657471, "global_step": 64268, "epoch": 1530} {"train_loss": -6.013521194458008, "global_step": 64269, "epoch": 1530} {"train_loss": -5.987005233764648, "global_step": 64270, "epoch": 1530} {"train_loss": -6.081099987030029, "global_step": 64271, "epoch": 1530} {"train_loss": -5.922713756561279, "global_step": 64272, "epoch": 1530} {"train_loss": -5.973041534423828, "global_step": 64273, "epoch": 1530} {"train_loss": -5.936160087585449, "global_step": 64274, "epoch": 1530} {"train_loss": -5.911088466644287, "global_step": 64275, "epoch": 1530} {"train_loss": -5.985337734222412, "global_step": 64276, "epoch": 1530} {"train_loss": -5.959794998168945, "global_step": 64277, "epoch": 1530} {"train_loss": -5.748030662536621, "global_step": 64278, "epoch": 1530} {"train_loss": -5.98984432220459, "global_step": 64279, "epoch": 1530} {"train_loss": -5.913161277770996, "global_step": 64280, "epoch": 1530} {"train_loss": -5.921084403991699, "global_step": 64281, "epoch": 1530} {"train_loss": -5.9629950523376465, "global_step": 64282, "epoch": 1530} {"train_loss": -5.9521484375, "global_step": 64283, "epoch": 1530} {"train_loss": -5.9736833572387695, "global_step": 64284, "epoch": 1530} {"train_loss": -5.787853240966797, "global_step": 64285, "epoch": 1530} {"train_loss": -5.907464027404785, "global_step": 64286, "epoch": 1530} {"train_loss": -5.918627738952637, "global_step": 64287, "epoch": 1530} {"train_loss": -5.94325065612793, "global_step": 64288, "epoch": 1530} {"train_loss": -5.904046058654785, "global_step": 64289, "epoch": 1530} {"train_loss": -5.857021808624268, "global_step": 64290, "epoch": 1530} {"train_loss": -5.925466537475586, "global_step": 64291, "epoch": 1530} {"train_loss": -6.002047538757324, "global_step": 64292, "epoch": 1530} {"train_loss": -5.913263320922852, "global_step": 64293, "epoch": 1530} {"train_loss": -5.97575569152832, "global_step": 64294, "epoch": 1530} {"train_loss": -6.00903844833374, "global_step": 64295, "epoch": 1530} {"train_loss": -5.938312530517578, "global_step": 64296, "epoch": 1530} {"train_loss": -5.948267936706543, "global_step": 64297, "epoch": 1530} {"train_loss": -5.967426776885986, "global_step": 64298, "epoch": 1530} {"train_loss": -6.0219197273254395, "global_step": 64299, "epoch": 1530} {"train_loss": -5.942380905151367, "global_step": 64300, "epoch": 1530} {"train_loss": -5.948150146575201, "global_step": 64301, "epoch": 1530, "val_loss": 66851.171875} {"train_loss": -5.906524658203125, "global_step": 64302, "epoch": 1531} {"train_loss": -5.953370571136475, "global_step": 64303, "epoch": 1531} {"train_loss": -5.821102619171143, "global_step": 64304, "epoch": 1531} {"train_loss": -6.040041923522949, "global_step": 64305, "epoch": 1531} {"train_loss": -5.901171684265137, "global_step": 64306, "epoch": 1531} {"train_loss": -5.912962913513184, "global_step": 64307, "epoch": 1531} {"train_loss": -5.931003570556641, "global_step": 64308, "epoch": 1531} {"train_loss": -5.9401726722717285, "global_step": 64309, "epoch": 1531} {"train_loss": -5.886325836181641, "global_step": 64310, "epoch": 1531} {"train_loss": -5.973844051361084, "global_step": 64311, "epoch": 1531} {"train_loss": -5.9345550537109375, "global_step": 64312, "epoch": 1531} {"train_loss": -5.989518165588379, "global_step": 64313, "epoch": 1531} {"train_loss": -5.922515869140625, "global_step": 64314, "epoch": 1531} {"train_loss": -5.911085605621338, "global_step": 64315, "epoch": 1531} {"train_loss": -5.92650032043457, "global_step": 64316, "epoch": 1531} {"train_loss": -6.049334526062012, "global_step": 64317, "epoch": 1531} {"train_loss": -5.831313133239746, "global_step": 64318, "epoch": 1531} {"train_loss": -5.894659042358398, "global_step": 64319, "epoch": 1531} {"train_loss": -6.029900550842285, "global_step": 64320, "epoch": 1531} {"train_loss": -5.917474746704102, "global_step": 64321, "epoch": 1531} {"train_loss": -5.937991142272949, "global_step": 64322, "epoch": 1531} {"train_loss": -5.801067352294922, "global_step": 64323, "epoch": 1531} {"train_loss": -5.898041248321533, "global_step": 64324, "epoch": 1531} {"train_loss": -5.9031524658203125, "global_step": 64325, "epoch": 1531} {"train_loss": -5.988506317138672, "global_step": 64326, "epoch": 1531} {"train_loss": -5.9193830490112305, "global_step": 64327, "epoch": 1531} {"train_loss": -5.859230995178223, "global_step": 64328, "epoch": 1531} {"train_loss": -5.820433616638184, "global_step": 64329, "epoch": 1531} {"train_loss": -5.874319076538086, "global_step": 64330, "epoch": 1531} {"train_loss": -5.829833030700684, "global_step": 64331, "epoch": 1531} {"train_loss": -6.039011001586914, "global_step": 64332, "epoch": 1531} {"train_loss": -5.813252925872803, "global_step": 64333, "epoch": 1531} {"train_loss": -5.8927001953125, "global_step": 64334, "epoch": 1531} {"train_loss": -5.900324821472168, "global_step": 64335, "epoch": 1531} {"train_loss": -5.882080078125, "global_step": 64336, "epoch": 1531} {"train_loss": -6.017124652862549, "global_step": 64337, "epoch": 1531} {"train_loss": -6.015166759490967, "global_step": 64338, "epoch": 1531} {"train_loss": -5.94835090637207, "global_step": 64339, "epoch": 1531} {"train_loss": -5.90090799331665, "global_step": 64340, "epoch": 1531} {"train_loss": -6.016152381896973, "global_step": 64341, "epoch": 1531} {"train_loss": -6.009862899780273, "global_step": 64342, "epoch": 1531} {"train_loss": -5.923899843579247, "global_step": 64343, "epoch": 1531, "val_loss": 67220.5546875} {"train_loss": -5.8637518882751465, "global_step": 64344, "epoch": 1532} {"train_loss": -6.033415794372559, "global_step": 64345, "epoch": 1532} {"train_loss": -5.963535785675049, "global_step": 64346, "epoch": 1532} {"train_loss": -5.862545490264893, "global_step": 64347, "epoch": 1532} {"train_loss": -5.930825710296631, "global_step": 64348, "epoch": 1532} {"train_loss": -5.878645896911621, "global_step": 64349, "epoch": 1532} {"train_loss": -6.103883743286133, "global_step": 64350, "epoch": 1532} {"train_loss": -5.9998979568481445, "global_step": 64351, "epoch": 1532} {"train_loss": -5.9196977615356445, "global_step": 64352, "epoch": 1532} {"train_loss": -5.964427947998047, "global_step": 64353, "epoch": 1532} {"train_loss": -6.0339460372924805, "global_step": 64354, "epoch": 1532} {"train_loss": -5.879228591918945, "global_step": 64355, "epoch": 1532} {"train_loss": -5.946558475494385, "global_step": 64356, "epoch": 1532} {"train_loss": -5.96903657913208, "global_step": 64357, "epoch": 1532} {"train_loss": -6.0379180908203125, "global_step": 64358, "epoch": 1532} {"train_loss": -5.944622993469238, "global_step": 64359, "epoch": 1532} {"train_loss": -5.939053058624268, "global_step": 64360, "epoch": 1532} {"train_loss": -6.056139945983887, "global_step": 64361, "epoch": 1532} {"train_loss": -6.00883674621582, "global_step": 64362, "epoch": 1532} {"train_loss": -6.058016777038574, "global_step": 64363, "epoch": 1532} {"train_loss": -6.053432464599609, "global_step": 64364, "epoch": 1532} {"train_loss": -6.098937034606934, "global_step": 64365, "epoch": 1532} {"train_loss": -6.004242897033691, "global_step": 64366, "epoch": 1532} {"train_loss": -6.131155967712402, "global_step": 64367, "epoch": 1532} {"train_loss": -5.892060279846191, "global_step": 64368, "epoch": 1532} {"train_loss": -6.056553840637207, "global_step": 64369, "epoch": 1532} {"train_loss": -5.979868412017822, "global_step": 64370, "epoch": 1532} {"train_loss": -5.866888046264648, "global_step": 64371, "epoch": 1532} {"train_loss": -5.935372352600098, "global_step": 64372, "epoch": 1532} {"train_loss": -5.8888349533081055, "global_step": 64373, "epoch": 1532} {"train_loss": -5.855765342712402, "global_step": 64374, "epoch": 1532} {"train_loss": -5.9936323165893555, "global_step": 64375, "epoch": 1532} {"train_loss": -6.014641761779785, "global_step": 64376, "epoch": 1532} {"train_loss": -5.8980841636657715, "global_step": 64377, "epoch": 1532} {"train_loss": -5.8942108154296875, "global_step": 64378, "epoch": 1532} {"train_loss": -5.912292957305908, "global_step": 64379, "epoch": 1532} {"train_loss": -5.8774261474609375, "global_step": 64380, "epoch": 1532} {"train_loss": -5.86671257019043, "global_step": 64381, "epoch": 1532} {"train_loss": -5.93034553527832, "global_step": 64382, "epoch": 1532} {"train_loss": -5.863797664642334, "global_step": 64383, "epoch": 1532} {"train_loss": -5.971118927001953, "global_step": 64384, "epoch": 1532} {"train_loss": -5.956168992178781, "global_step": 64385, "epoch": 1532, "val_loss": 67317.09375} {"train_loss": -5.8704986572265625, "global_step": 64386, "epoch": 1533} {"train_loss": -5.865570068359375, "global_step": 64387, "epoch": 1533} {"train_loss": -5.971587181091309, "global_step": 64388, "epoch": 1533} {"train_loss": -5.946148872375488, "global_step": 64389, "epoch": 1533} {"train_loss": -5.991930961608887, "global_step": 64390, "epoch": 1533} {"train_loss": -5.958284854888916, "global_step": 64391, "epoch": 1533} {"train_loss": -5.857578277587891, "global_step": 64392, "epoch": 1533} {"train_loss": -5.926353454589844, "global_step": 64393, "epoch": 1533} {"train_loss": -6.022413730621338, "global_step": 64394, "epoch": 1533} {"train_loss": -5.908331871032715, "global_step": 64395, "epoch": 1533} {"train_loss": -5.848113059997559, "global_step": 64396, "epoch": 1533} {"train_loss": -5.951008319854736, "global_step": 64397, "epoch": 1533} {"train_loss": -5.983275413513184, "global_step": 64398, "epoch": 1533} {"train_loss": -5.948215961456299, "global_step": 64399, "epoch": 1533} {"train_loss": -6.031940937042236, "global_step": 64400, "epoch": 1533} {"train_loss": -6.014878749847412, "global_step": 64401, "epoch": 1533} {"train_loss": -6.062839508056641, "global_step": 64402, "epoch": 1533} {"train_loss": -5.927557945251465, "global_step": 64403, "epoch": 1533} {"train_loss": -5.961912155151367, "global_step": 64404, "epoch": 1533} {"train_loss": -5.829677581787109, "global_step": 64405, "epoch": 1533} {"train_loss": -5.97506046295166, "global_step": 64406, "epoch": 1533} {"train_loss": -5.906931400299072, "global_step": 64407, "epoch": 1533} {"train_loss": -5.955869674682617, "global_step": 64408, "epoch": 1533} {"train_loss": -5.989142417907715, "global_step": 64409, "epoch": 1533} {"train_loss": -6.036379814147949, "global_step": 64410, "epoch": 1533} {"train_loss": -5.783180236816406, "global_step": 64411, "epoch": 1533} {"train_loss": -5.782505989074707, "global_step": 64412, "epoch": 1533} {"train_loss": -5.881213188171387, "global_step": 64413, "epoch": 1533} {"train_loss": -5.883641242980957, "global_step": 64414, "epoch": 1533} {"train_loss": -5.958863735198975, "global_step": 64415, "epoch": 1533} {"train_loss": -5.8209614753723145, "global_step": 64416, "epoch": 1533} {"train_loss": -6.003894329071045, "global_step": 64417, "epoch": 1533} {"train_loss": -6.003658294677734, "global_step": 64418, "epoch": 1533} {"train_loss": -6.0054097175598145, "global_step": 64419, "epoch": 1533} {"train_loss": -5.923922538757324, "global_step": 64420, "epoch": 1533} {"train_loss": -5.829181671142578, "global_step": 64421, "epoch": 1533} {"train_loss": -5.989557266235352, "global_step": 64422, "epoch": 1533} {"train_loss": -5.980746269226074, "global_step": 64423, "epoch": 1533} {"train_loss": -5.803847312927246, "global_step": 64424, "epoch": 1533} {"train_loss": -5.940217018127441, "global_step": 64425, "epoch": 1533} {"train_loss": -5.907010078430176, "global_step": 64426, "epoch": 1533} {"train_loss": -5.9312379360198975, "global_step": 64427, "epoch": 1533, "val_loss": 67125.9375} {"train_loss": -6.000555992126465, "global_step": 64428, "epoch": 1534} {"train_loss": -5.838397026062012, "global_step": 64429, "epoch": 1534} {"train_loss": -6.011308670043945, "global_step": 64430, "epoch": 1534} {"train_loss": -5.739920616149902, "global_step": 64431, "epoch": 1534} {"train_loss": -6.072471618652344, "global_step": 64432, "epoch": 1534} {"train_loss": -5.922207355499268, "global_step": 64433, "epoch": 1534} {"train_loss": -5.8582305908203125, "global_step": 64434, "epoch": 1534} {"train_loss": -5.908089637756348, "global_step": 64435, "epoch": 1534} {"train_loss": -5.861377716064453, "global_step": 64436, "epoch": 1534} {"train_loss": -5.946052551269531, "global_step": 64437, "epoch": 1534} {"train_loss": -5.849799633026123, "global_step": 64438, "epoch": 1534} {"train_loss": -6.009298324584961, "global_step": 64439, "epoch": 1534} {"train_loss": -5.893496036529541, "global_step": 64440, "epoch": 1534} {"train_loss": -5.921394348144531, "global_step": 64441, "epoch": 1534} {"train_loss": -5.939730167388916, "global_step": 64442, "epoch": 1534} {"train_loss": -5.942750453948975, "global_step": 64443, "epoch": 1534} {"train_loss": -5.858290672302246, "global_step": 64444, "epoch": 1534} {"train_loss": -5.926374435424805, "global_step": 64445, "epoch": 1534} {"train_loss": -5.923399925231934, "global_step": 64446, "epoch": 1534} {"train_loss": -5.925299644470215, "global_step": 64447, "epoch": 1534} {"train_loss": -6.121438503265381, "global_step": 64448, "epoch": 1534} {"train_loss": -6.074477195739746, "global_step": 64449, "epoch": 1534} {"train_loss": -5.956452369689941, "global_step": 64450, "epoch": 1534} {"train_loss": -5.981086730957031, "global_step": 64451, "epoch": 1534} {"train_loss": -5.9365386962890625, "global_step": 64452, "epoch": 1534} {"train_loss": -5.865540504455566, "global_step": 64453, "epoch": 1534} {"train_loss": -6.021097183227539, "global_step": 64454, "epoch": 1534} {"train_loss": -5.945973873138428, "global_step": 64455, "epoch": 1534} {"train_loss": -5.968640327453613, "global_step": 64456, "epoch": 1534} {"train_loss": -6.074843883514404, "global_step": 64457, "epoch": 1534} {"train_loss": -5.975464820861816, "global_step": 64458, "epoch": 1534} {"train_loss": -5.8389177322387695, "global_step": 64459, "epoch": 1534} {"train_loss": -5.92934513092041, "global_step": 64460, "epoch": 1534} {"train_loss": -5.982185363769531, "global_step": 64461, "epoch": 1534} {"train_loss": -5.99696159362793, "global_step": 64462, "epoch": 1534} {"train_loss": -5.777839660644531, "global_step": 64463, "epoch": 1534} {"train_loss": -5.949841499328613, "global_step": 64464, "epoch": 1534} {"train_loss": -5.908763885498047, "global_step": 64465, "epoch": 1534} {"train_loss": -5.915876388549805, "global_step": 64466, "epoch": 1534} {"train_loss": -5.941722869873047, "global_step": 64467, "epoch": 1534} {"train_loss": -5.899111747741699, "global_step": 64468, "epoch": 1534} {"train_loss": -5.936122076851981, "global_step": 64469, "epoch": 1534, "val_loss": 66983.546875} {"train_loss": -6.013889789581299, "global_step": 64470, "epoch": 1535} {"train_loss": -5.928015232086182, "global_step": 64471, "epoch": 1535} {"train_loss": -5.920432090759277, "global_step": 64472, "epoch": 1535} {"train_loss": -5.843214988708496, "global_step": 64473, "epoch": 1535} {"train_loss": -5.915319442749023, "global_step": 64474, "epoch": 1535} {"train_loss": -5.971149921417236, "global_step": 64475, "epoch": 1535} {"train_loss": -5.920368194580078, "global_step": 64476, "epoch": 1535} {"train_loss": -5.784351348876953, "global_step": 64477, "epoch": 1535} {"train_loss": -5.910149097442627, "global_step": 64478, "epoch": 1535} {"train_loss": -5.822175025939941, "global_step": 64479, "epoch": 1535} {"train_loss": -5.782258987426758, "global_step": 64480, "epoch": 1535} {"train_loss": -5.950750350952148, "global_step": 64481, "epoch": 1535} {"train_loss": -5.855696678161621, "global_step": 64482, "epoch": 1535} {"train_loss": -5.988039493560791, "global_step": 64483, "epoch": 1535} {"train_loss": -5.824516296386719, "global_step": 64484, "epoch": 1535} {"train_loss": -5.910776615142822, "global_step": 64485, "epoch": 1535} {"train_loss": -5.97817325592041, "global_step": 64486, "epoch": 1535} {"train_loss": -5.857865333557129, "global_step": 64487, "epoch": 1535} {"train_loss": -5.9502272605896, "global_step": 64488, "epoch": 1535} {"train_loss": -5.97749662399292, "global_step": 64489, "epoch": 1535} {"train_loss": -5.911198616027832, "global_step": 64490, "epoch": 1535} {"train_loss": -5.821450233459473, "global_step": 64491, "epoch": 1535} {"train_loss": -5.875019073486328, "global_step": 64492, "epoch": 1535} {"train_loss": -5.854791164398193, "global_step": 64493, "epoch": 1535} {"train_loss": -6.028149604797363, "global_step": 64494, "epoch": 1535} {"train_loss": -5.987845420837402, "global_step": 64495, "epoch": 1535} {"train_loss": -5.8674635887146, "global_step": 64496, "epoch": 1535} {"train_loss": -5.901397228240967, "global_step": 64497, "epoch": 1535} {"train_loss": -5.969301700592041, "global_step": 64498, "epoch": 1535} {"train_loss": -5.894309997558594, "global_step": 64499, "epoch": 1535} {"train_loss": -5.942856788635254, "global_step": 64500, "epoch": 1535} {"train_loss": -5.9652323722839355, "global_step": 64501, "epoch": 1535} {"train_loss": -5.77262544631958, "global_step": 64502, "epoch": 1535} {"train_loss": -5.88914155960083, "global_step": 64503, "epoch": 1535} {"train_loss": -5.972464561462402, "global_step": 64504, "epoch": 1535} {"train_loss": -5.948337554931641, "global_step": 64505, "epoch": 1535} {"train_loss": -5.968296051025391, "global_step": 64506, "epoch": 1535} {"train_loss": -5.906479358673096, "global_step": 64507, "epoch": 1535} {"train_loss": -5.754235744476318, "global_step": 64508, "epoch": 1535} {"train_loss": -5.850644588470459, "global_step": 64509, "epoch": 1535} {"train_loss": -5.925190448760986, "global_step": 64510, "epoch": 1535} {"train_loss": -5.907241843995594, "global_step": 64511, "epoch": 1535, "val_loss": 67211.5546875} {"train_loss": -5.916871547698975, "global_step": 64512, "epoch": 1536} {"train_loss": -6.066346168518066, "global_step": 64513, "epoch": 1536} {"train_loss": -5.962350845336914, "global_step": 64514, "epoch": 1536} {"train_loss": -5.8538312911987305, "global_step": 64515, "epoch": 1536} {"train_loss": -5.971961498260498, "global_step": 64516, "epoch": 1536} {"train_loss": -5.727748394012451, "global_step": 64517, "epoch": 1536} {"train_loss": -5.886091232299805, "global_step": 64518, "epoch": 1536} {"train_loss": -5.979706764221191, "global_step": 64519, "epoch": 1536} {"train_loss": -5.891165733337402, "global_step": 64520, "epoch": 1536} {"train_loss": -5.883210182189941, "global_step": 64521, "epoch": 1536} {"train_loss": -5.855257034301758, "global_step": 64522, "epoch": 1536} {"train_loss": -5.8816819190979, "global_step": 64523, "epoch": 1536} {"train_loss": -5.994654655456543, "global_step": 64524, "epoch": 1536} {"train_loss": -5.910944938659668, "global_step": 64525, "epoch": 1536} {"train_loss": -5.927727699279785, "global_step": 64526, "epoch": 1536} {"train_loss": -5.956079483032227, "global_step": 64527, "epoch": 1536} {"train_loss": -5.886699199676514, "global_step": 64528, "epoch": 1536} {"train_loss": -6.008883476257324, "global_step": 64529, "epoch": 1536} {"train_loss": -5.992180824279785, "global_step": 64530, "epoch": 1536} {"train_loss": -5.989964962005615, "global_step": 64531, "epoch": 1536} {"train_loss": -6.012201309204102, "global_step": 64532, "epoch": 1536} {"train_loss": -6.000432968139648, "global_step": 64533, "epoch": 1536} {"train_loss": -6.0569562911987305, "global_step": 64534, "epoch": 1536} {"train_loss": -5.9370622634887695, "global_step": 64535, "epoch": 1536} {"train_loss": -5.845488548278809, "global_step": 64536, "epoch": 1536} {"train_loss": -5.822109222412109, "global_step": 64537, "epoch": 1536} {"train_loss": -5.875030517578125, "global_step": 64538, "epoch": 1536} {"train_loss": -5.904784202575684, "global_step": 64539, "epoch": 1536} {"train_loss": -6.132285118103027, "global_step": 64540, "epoch": 1536} {"train_loss": -5.956515789031982, "global_step": 64541, "epoch": 1536} {"train_loss": -5.847842216491699, "global_step": 64542, "epoch": 1536} {"train_loss": -5.899588584899902, "global_step": 64543, "epoch": 1536} {"train_loss": -5.987710952758789, "global_step": 64544, "epoch": 1536} {"train_loss": -5.9398512840271, "global_step": 64545, "epoch": 1536} {"train_loss": -5.793603897094727, "global_step": 64546, "epoch": 1536} {"train_loss": -5.976497650146484, "global_step": 64547, "epoch": 1536} {"train_loss": -5.904567241668701, "global_step": 64548, "epoch": 1536} {"train_loss": -5.985894203186035, "global_step": 64549, "epoch": 1536} {"train_loss": -5.906698226928711, "global_step": 64550, "epoch": 1536} {"train_loss": -6.016731262207031, "global_step": 64551, "epoch": 1536} {"train_loss": -5.8563971519470215, "global_step": 64552, "epoch": 1536} {"train_loss": -5.931197314035325, "global_step": 64553, "epoch": 1536, "val_loss": 66969.78125} {"train_loss": -5.865638732910156, "global_step": 64554, "epoch": 1537} {"train_loss": -5.908796310424805, "global_step": 64555, "epoch": 1537} {"train_loss": -5.927412986755371, "global_step": 64556, "epoch": 1537} {"train_loss": -6.0324859619140625, "global_step": 64557, "epoch": 1537} {"train_loss": -5.9496331214904785, "global_step": 64558, "epoch": 1537} {"train_loss": -5.9571990966796875, "global_step": 64559, "epoch": 1537} {"train_loss": -5.966403007507324, "global_step": 64560, "epoch": 1537} {"train_loss": -5.905205726623535, "global_step": 64561, "epoch": 1537} {"train_loss": -6.003016471862793, "global_step": 64562, "epoch": 1537} {"train_loss": -5.886533737182617, "global_step": 64563, "epoch": 1537} {"train_loss": -6.036555767059326, "global_step": 64564, "epoch": 1537} {"train_loss": -5.933581352233887, "global_step": 64565, "epoch": 1537} {"train_loss": -5.903545379638672, "global_step": 64566, "epoch": 1537} {"train_loss": -6.005341053009033, "global_step": 64567, "epoch": 1537} {"train_loss": -5.874342918395996, "global_step": 64568, "epoch": 1537} {"train_loss": -5.93161678314209, "global_step": 64569, "epoch": 1537} {"train_loss": -5.952188014984131, "global_step": 64570, "epoch": 1537} {"train_loss": -5.923179626464844, "global_step": 64571, "epoch": 1537} {"train_loss": -5.960376739501953, "global_step": 64572, "epoch": 1537} {"train_loss": -6.009529113769531, "global_step": 64573, "epoch": 1537} {"train_loss": -5.910971641540527, "global_step": 64574, "epoch": 1537} {"train_loss": -5.912487030029297, "global_step": 64575, "epoch": 1537} {"train_loss": -5.973018646240234, "global_step": 64576, "epoch": 1537} {"train_loss": -5.852365493774414, "global_step": 64577, "epoch": 1537} {"train_loss": -5.904057025909424, "global_step": 64578, "epoch": 1537} {"train_loss": -6.009749412536621, "global_step": 64579, "epoch": 1537} {"train_loss": -5.962082386016846, "global_step": 64580, "epoch": 1537} {"train_loss": -5.948460578918457, "global_step": 64581, "epoch": 1537} {"train_loss": -5.872267723083496, "global_step": 64582, "epoch": 1537} {"train_loss": -5.96108341217041, "global_step": 64583, "epoch": 1537} {"train_loss": -6.006369590759277, "global_step": 64584, "epoch": 1537} {"train_loss": -5.942751884460449, "global_step": 64585, "epoch": 1537} {"train_loss": -5.9045209884643555, "global_step": 64586, "epoch": 1537} {"train_loss": -6.0191569328308105, "global_step": 64587, "epoch": 1537} {"train_loss": -6.123469352722168, "global_step": 64588, "epoch": 1537} {"train_loss": -5.856078147888184, "global_step": 64589, "epoch": 1537} {"train_loss": -5.916919708251953, "global_step": 64590, "epoch": 1537} {"train_loss": -6.000807762145996, "global_step": 64591, "epoch": 1537} {"train_loss": -5.842852592468262, "global_step": 64592, "epoch": 1537} {"train_loss": -5.99498987197876, "global_step": 64593, "epoch": 1537} {"train_loss": -5.964700698852539, "global_step": 64594, "epoch": 1537} {"train_loss": -5.946366185233707, "global_step": 64595, "epoch": 1537, "val_loss": 67322.1953125} {"train_loss": -5.999059677124023, "global_step": 64596, "epoch": 1538} {"train_loss": -6.017819404602051, "global_step": 64597, "epoch": 1538} {"train_loss": -5.877195358276367, "global_step": 64598, "epoch": 1538} {"train_loss": -5.950811386108398, "global_step": 64599, "epoch": 1538} {"train_loss": -5.919487953186035, "global_step": 64600, "epoch": 1538} {"train_loss": -5.9557342529296875, "global_step": 64601, "epoch": 1538} {"train_loss": -6.001129150390625, "global_step": 64602, "epoch": 1538} {"train_loss": -5.7913641929626465, "global_step": 64603, "epoch": 1538} {"train_loss": -5.988525867462158, "global_step": 64604, "epoch": 1538} {"train_loss": -5.971122741699219, "global_step": 64605, "epoch": 1538} {"train_loss": -5.913669109344482, "global_step": 64606, "epoch": 1538} {"train_loss": -5.8489484786987305, "global_step": 64607, "epoch": 1538} {"train_loss": -5.973808765411377, "global_step": 64608, "epoch": 1538} {"train_loss": -5.852416038513184, "global_step": 64609, "epoch": 1538} {"train_loss": -6.098515033721924, "global_step": 64610, "epoch": 1538} {"train_loss": -5.941240310668945, "global_step": 64611, "epoch": 1538} {"train_loss": -6.027932167053223, "global_step": 64612, "epoch": 1538} {"train_loss": -5.928957939147949, "global_step": 64613, "epoch": 1538} {"train_loss": -5.898431777954102, "global_step": 64614, "epoch": 1538} {"train_loss": -5.924774169921875, "global_step": 64615, "epoch": 1538} {"train_loss": -5.941766738891602, "global_step": 64616, "epoch": 1538} {"train_loss": -5.885312080383301, "global_step": 64617, "epoch": 1538} {"train_loss": -5.851015090942383, "global_step": 64618, "epoch": 1538} {"train_loss": -5.952737808227539, "global_step": 64619, "epoch": 1538} {"train_loss": -5.8304853439331055, "global_step": 64620, "epoch": 1538} {"train_loss": -6.044413089752197, "global_step": 64621, "epoch": 1538} {"train_loss": -5.90097188949585, "global_step": 64622, "epoch": 1538} {"train_loss": -5.900815010070801, "global_step": 64623, "epoch": 1538} {"train_loss": -5.891150951385498, "global_step": 64624, "epoch": 1538} {"train_loss": -6.029474258422852, "global_step": 64625, "epoch": 1538} {"train_loss": -5.8518171310424805, "global_step": 64626, "epoch": 1538} {"train_loss": -6.036494255065918, "global_step": 64627, "epoch": 1538} {"train_loss": -5.940586090087891, "global_step": 64628, "epoch": 1538} {"train_loss": -5.984150409698486, "global_step": 64629, "epoch": 1538} {"train_loss": -6.007233619689941, "global_step": 64630, "epoch": 1538} {"train_loss": -5.97315788269043, "global_step": 64631, "epoch": 1538} {"train_loss": -6.007346153259277, "global_step": 64632, "epoch": 1538} {"train_loss": -5.936659336090088, "global_step": 64633, "epoch": 1538} {"train_loss": -5.809732437133789, "global_step": 64634, "epoch": 1538} {"train_loss": -6.032039642333984, "global_step": 64635, "epoch": 1538} {"train_loss": -5.909467697143555, "global_step": 64636, "epoch": 1538} {"train_loss": -5.939469723474412, "global_step": 64637, "epoch": 1538, "val_loss": 67148.8515625} {"train_loss": -5.878318786621094, "global_step": 64638, "epoch": 1539} {"train_loss": -5.879323959350586, "global_step": 64639, "epoch": 1539} {"train_loss": -5.845088005065918, "global_step": 64640, "epoch": 1539} {"train_loss": -5.905491828918457, "global_step": 64641, "epoch": 1539} {"train_loss": -5.9958648681640625, "global_step": 64642, "epoch": 1539} {"train_loss": -5.9085798263549805, "global_step": 64643, "epoch": 1539} {"train_loss": -5.74694299697876, "global_step": 64644, "epoch": 1539} {"train_loss": -5.868304252624512, "global_step": 64645, "epoch": 1539} {"train_loss": -5.984013557434082, "global_step": 64646, "epoch": 1539} {"train_loss": -5.880131244659424, "global_step": 64647, "epoch": 1539} {"train_loss": -5.90989875793457, "global_step": 64648, "epoch": 1539} {"train_loss": -6.157050609588623, "global_step": 64649, "epoch": 1539} {"train_loss": -5.977164268493652, "global_step": 64650, "epoch": 1539} {"train_loss": -5.82450532913208, "global_step": 64651, "epoch": 1539} {"train_loss": -5.911525249481201, "global_step": 64652, "epoch": 1539} {"train_loss": -5.731371879577637, "global_step": 64653, "epoch": 1539} {"train_loss": -5.911795616149902, "global_step": 64654, "epoch": 1539} {"train_loss": -5.961291313171387, "global_step": 64655, "epoch": 1539} {"train_loss": -6.033045768737793, "global_step": 64656, "epoch": 1539} {"train_loss": -5.9697136878967285, "global_step": 64657, "epoch": 1539} {"train_loss": -5.925100803375244, "global_step": 64658, "epoch": 1539} {"train_loss": -5.963068008422852, "global_step": 64659, "epoch": 1539} {"train_loss": -5.847507476806641, "global_step": 64660, "epoch": 1539} {"train_loss": -5.903804779052734, "global_step": 64661, "epoch": 1539} {"train_loss": -5.9707207679748535, "global_step": 64662, "epoch": 1539} {"train_loss": -6.011102676391602, "global_step": 64663, "epoch": 1539} {"train_loss": -5.925487518310547, "global_step": 64664, "epoch": 1539} {"train_loss": -5.987943649291992, "global_step": 64665, "epoch": 1539} {"train_loss": -5.967371940612793, "global_step": 64666, "epoch": 1539} {"train_loss": -5.981906890869141, "global_step": 64667, "epoch": 1539} {"train_loss": -6.031236171722412, "global_step": 64668, "epoch": 1539} {"train_loss": -5.784799098968506, "global_step": 64669, "epoch": 1539} {"train_loss": -5.765463352203369, "global_step": 64670, "epoch": 1539} {"train_loss": -6.014996528625488, "global_step": 64671, "epoch": 1539} {"train_loss": -5.9160566329956055, "global_step": 64672, "epoch": 1539} {"train_loss": -6.030333042144775, "global_step": 64673, "epoch": 1539} {"train_loss": -5.9975810050964355, "global_step": 64674, "epoch": 1539} {"train_loss": -5.832504749298096, "global_step": 64675, "epoch": 1539} {"train_loss": -5.935815334320068, "global_step": 64676, "epoch": 1539} {"train_loss": -6.010455131530762, "global_step": 64677, "epoch": 1539} {"train_loss": -5.86506462097168, "global_step": 64678, "epoch": 1539} {"train_loss": -5.924680584952945, "global_step": 64679, "epoch": 1539, "val_loss": 67297.3984375} {"train_loss": -5.919982433319092, "global_step": 64680, "epoch": 1540} {"train_loss": -5.85219669342041, "global_step": 64681, "epoch": 1540} {"train_loss": -5.9511613845825195, "global_step": 64682, "epoch": 1540} {"train_loss": -5.804319381713867, "global_step": 64683, "epoch": 1540} {"train_loss": -5.902273178100586, "global_step": 64684, "epoch": 1540} {"train_loss": -5.995371341705322, "global_step": 64685, "epoch": 1540} {"train_loss": -5.839061737060547, "global_step": 64686, "epoch": 1540} {"train_loss": -6.035979270935059, "global_step": 64687, "epoch": 1540} {"train_loss": -6.010633945465088, "global_step": 64688, "epoch": 1540} {"train_loss": -5.865861892700195, "global_step": 64689, "epoch": 1540} {"train_loss": -6.014571189880371, "global_step": 64690, "epoch": 1540} {"train_loss": -5.786619186401367, "global_step": 64691, "epoch": 1540} {"train_loss": -5.997523784637451, "global_step": 64692, "epoch": 1540} {"train_loss": -5.7747802734375, "global_step": 64693, "epoch": 1540} {"train_loss": -5.947218894958496, "global_step": 64694, "epoch": 1540} {"train_loss": -5.906485557556152, "global_step": 64695, "epoch": 1540} {"train_loss": -6.016448020935059, "global_step": 64696, "epoch": 1540} {"train_loss": -5.906195640563965, "global_step": 64697, "epoch": 1540} {"train_loss": -5.949642181396484, "global_step": 64698, "epoch": 1540} {"train_loss": -5.898257255554199, "global_step": 64699, "epoch": 1540} {"train_loss": -6.018167495727539, "global_step": 64700, "epoch": 1540} {"train_loss": -5.9229631423950195, "global_step": 64701, "epoch": 1540} {"train_loss": -6.109140396118164, "global_step": 64702, "epoch": 1540} {"train_loss": -5.961922645568848, "global_step": 64703, "epoch": 1540} {"train_loss": -5.933161735534668, "global_step": 64704, "epoch": 1540} {"train_loss": -6.0218000411987305, "global_step": 64705, "epoch": 1540} {"train_loss": -5.887110710144043, "global_step": 64706, "epoch": 1540} {"train_loss": -5.8275604248046875, "global_step": 64707, "epoch": 1540} {"train_loss": -5.891566276550293, "global_step": 64708, "epoch": 1540} {"train_loss": -5.765806198120117, "global_step": 64709, "epoch": 1540} {"train_loss": -5.89450740814209, "global_step": 64710, "epoch": 1540} {"train_loss": -5.978501319885254, "global_step": 64711, "epoch": 1540} {"train_loss": -5.8726911544799805, "global_step": 64712, "epoch": 1540} {"train_loss": -5.964313507080078, "global_step": 64713, "epoch": 1540} {"train_loss": -5.894803047180176, "global_step": 64714, "epoch": 1540} {"train_loss": -5.9845805168151855, "global_step": 64715, "epoch": 1540} {"train_loss": -5.8729658126831055, "global_step": 64716, "epoch": 1540} {"train_loss": -5.944608688354492, "global_step": 64717, "epoch": 1540} {"train_loss": -5.938947677612305, "global_step": 64718, "epoch": 1540} {"train_loss": -5.952957630157471, "global_step": 64719, "epoch": 1540} {"train_loss": -5.953668594360352, "global_step": 64720, "epoch": 1540} {"train_loss": -5.926504260017758, "global_step": 64721, "epoch": 1540, "val_loss": 67026.9453125} {"train_loss": -5.980068683624268, "global_step": 64722, "epoch": 1541} {"train_loss": -5.941441535949707, "global_step": 64723, "epoch": 1541} {"train_loss": -6.024569511413574, "global_step": 64724, "epoch": 1541} {"train_loss": -5.95299768447876, "global_step": 64725, "epoch": 1541} {"train_loss": -5.917543888092041, "global_step": 64726, "epoch": 1541} {"train_loss": -5.952441692352295, "global_step": 64727, "epoch": 1541} {"train_loss": -5.941648960113525, "global_step": 64728, "epoch": 1541} {"train_loss": -6.073155403137207, "global_step": 64729, "epoch": 1541} {"train_loss": -6.074649810791016, "global_step": 64730, "epoch": 1541} {"train_loss": -5.939445495605469, "global_step": 64731, "epoch": 1541} {"train_loss": -5.8793253898620605, "global_step": 64732, "epoch": 1541} {"train_loss": -6.054898738861084, "global_step": 64733, "epoch": 1541} {"train_loss": -6.023250579833984, "global_step": 64734, "epoch": 1541} {"train_loss": -6.009786605834961, "global_step": 64735, "epoch": 1541} {"train_loss": -5.807193279266357, "global_step": 64736, "epoch": 1541} {"train_loss": -5.977266311645508, "global_step": 64737, "epoch": 1541} {"train_loss": -6.009523391723633, "global_step": 64738, "epoch": 1541} {"train_loss": -5.918818473815918, "global_step": 64739, "epoch": 1541} {"train_loss": -5.865053176879883, "global_step": 64740, "epoch": 1541} {"train_loss": -5.77068567276001, "global_step": 64741, "epoch": 1541} {"train_loss": -5.919012069702148, "global_step": 64742, "epoch": 1541} {"train_loss": -5.937834739685059, "global_step": 64743, "epoch": 1541} {"train_loss": -5.907917499542236, "global_step": 64744, "epoch": 1541} {"train_loss": -5.972745418548584, "global_step": 64745, "epoch": 1541} {"train_loss": -5.869921684265137, "global_step": 64746, "epoch": 1541} {"train_loss": -5.976846694946289, "global_step": 64747, "epoch": 1541} {"train_loss": -6.008774757385254, "global_step": 64748, "epoch": 1541} {"train_loss": -5.900943756103516, "global_step": 64749, "epoch": 1541} {"train_loss": -5.964737892150879, "global_step": 64750, "epoch": 1541} {"train_loss": -5.912891387939453, "global_step": 64751, "epoch": 1541} {"train_loss": -5.913719177246094, "global_step": 64752, "epoch": 1541} {"train_loss": -5.897049903869629, "global_step": 64753, "epoch": 1541} {"train_loss": -5.895050048828125, "global_step": 64754, "epoch": 1541} {"train_loss": -5.897036552429199, "global_step": 64755, "epoch": 1541} {"train_loss": -5.889573097229004, "global_step": 64756, "epoch": 1541} {"train_loss": -5.782114028930664, "global_step": 64757, "epoch": 1541} {"train_loss": -6.010163307189941, "global_step": 64758, "epoch": 1541} {"train_loss": -6.010324478149414, "global_step": 64759, "epoch": 1541} {"train_loss": -6.014296531677246, "global_step": 64760, "epoch": 1541} {"train_loss": -5.890324592590332, "global_step": 64761, "epoch": 1541} {"train_loss": -5.893545150756836, "global_step": 64762, "epoch": 1541} {"train_loss": -5.939687967300415, "global_step": 64763, "epoch": 1541, "val_loss": 67003.0546875} {"train_loss": -5.882545471191406, "global_step": 64764, "epoch": 1542} {"train_loss": -5.9658050537109375, "global_step": 64765, "epoch": 1542} {"train_loss": -5.957490921020508, "global_step": 64766, "epoch": 1542} {"train_loss": -5.963440418243408, "global_step": 64767, "epoch": 1542} {"train_loss": -5.8936662673950195, "global_step": 64768, "epoch": 1542} {"train_loss": -5.987738609313965, "global_step": 64769, "epoch": 1542} {"train_loss": -5.977109909057617, "global_step": 64770, "epoch": 1542} {"train_loss": -5.90286111831665, "global_step": 64771, "epoch": 1542} {"train_loss": -5.920535087585449, "global_step": 64772, "epoch": 1542} {"train_loss": -5.8757758140563965, "global_step": 64773, "epoch": 1542} {"train_loss": -5.96985387802124, "global_step": 64774, "epoch": 1542} {"train_loss": -5.9210309982299805, "global_step": 64775, "epoch": 1542} {"train_loss": -5.803283214569092, "global_step": 64776, "epoch": 1542} {"train_loss": -6.042441368103027, "global_step": 64777, "epoch": 1542} {"train_loss": -5.909127712249756, "global_step": 64778, "epoch": 1542} {"train_loss": -5.918080806732178, "global_step": 64779, "epoch": 1542} {"train_loss": -6.021749973297119, "global_step": 64780, "epoch": 1542} {"train_loss": -5.875086307525635, "global_step": 64781, "epoch": 1542} {"train_loss": -5.889224529266357, "global_step": 64782, "epoch": 1542} {"train_loss": -5.9338459968566895, "global_step": 64783, "epoch": 1542} {"train_loss": -5.851527214050293, "global_step": 64784, "epoch": 1542} {"train_loss": -5.912167072296143, "global_step": 64785, "epoch": 1542} {"train_loss": -5.833644866943359, "global_step": 64786, "epoch": 1542} {"train_loss": -5.933488368988037, "global_step": 64787, "epoch": 1542} {"train_loss": -5.944101810455322, "global_step": 64788, "epoch": 1542} {"train_loss": -6.00314998626709, "global_step": 64789, "epoch": 1542} {"train_loss": -5.912491798400879, "global_step": 64790, "epoch": 1542} {"train_loss": -5.789828300476074, "global_step": 64791, "epoch": 1542} {"train_loss": -6.005980491638184, "global_step": 64792, "epoch": 1542} {"train_loss": -6.003180980682373, "global_step": 64793, "epoch": 1542} {"train_loss": -5.904238224029541, "global_step": 64794, "epoch": 1542} {"train_loss": -6.0036234855651855, "global_step": 64795, "epoch": 1542} {"train_loss": -5.9013824462890625, "global_step": 64796, "epoch": 1542} {"train_loss": -5.874189376831055, "global_step": 64797, "epoch": 1542} {"train_loss": -5.731359481811523, "global_step": 64798, "epoch": 1542} {"train_loss": -6.039480209350586, "global_step": 64799, "epoch": 1542} {"train_loss": -5.852476596832275, "global_step": 64800, "epoch": 1542} {"train_loss": -5.975215435028076, "global_step": 64801, "epoch": 1542} {"train_loss": -5.91026496887207, "global_step": 64802, "epoch": 1542} {"train_loss": -5.864677906036377, "global_step": 64803, "epoch": 1542} {"train_loss": -5.925005912780762, "global_step": 64804, "epoch": 1542} {"train_loss": -5.9206872554052445, "global_step": 64805, "epoch": 1542, "val_loss": 67000.7890625} {"train_loss": -5.8816938400268555, "global_step": 64806, "epoch": 1543} {"train_loss": -5.993157386779785, "global_step": 64807, "epoch": 1543} {"train_loss": -5.991039276123047, "global_step": 64808, "epoch": 1543} {"train_loss": -5.949775695800781, "global_step": 64809, "epoch": 1543} {"train_loss": -5.863552570343018, "global_step": 64810, "epoch": 1543} {"train_loss": -5.901613712310791, "global_step": 64811, "epoch": 1543} {"train_loss": -5.878659725189209, "global_step": 64812, "epoch": 1543} {"train_loss": -5.859508514404297, "global_step": 64813, "epoch": 1543} {"train_loss": -6.0072021484375, "global_step": 64814, "epoch": 1543} {"train_loss": -5.980017185211182, "global_step": 64815, "epoch": 1543} {"train_loss": -6.013095855712891, "global_step": 64816, "epoch": 1543} {"train_loss": -5.920348644256592, "global_step": 64817, "epoch": 1543} {"train_loss": -5.889187812805176, "global_step": 64818, "epoch": 1543} {"train_loss": -5.88802433013916, "global_step": 64819, "epoch": 1543} {"train_loss": -5.84473991394043, "global_step": 64820, "epoch": 1543} {"train_loss": -5.967669486999512, "global_step": 64821, "epoch": 1543} {"train_loss": -5.937042236328125, "global_step": 64822, "epoch": 1543} {"train_loss": -6.027904510498047, "global_step": 64823, "epoch": 1543} {"train_loss": -5.870509147644043, "global_step": 64824, "epoch": 1543} {"train_loss": -5.923318862915039, "global_step": 64825, "epoch": 1543} {"train_loss": -5.968074798583984, "global_step": 64826, "epoch": 1543} {"train_loss": -5.914987564086914, "global_step": 64827, "epoch": 1543} {"train_loss": -5.96524715423584, "global_step": 64828, "epoch": 1543} {"train_loss": -5.889379501342773, "global_step": 64829, "epoch": 1543} {"train_loss": -5.900104999542236, "global_step": 64830, "epoch": 1543} {"train_loss": -5.9200334548950195, "global_step": 64831, "epoch": 1543} {"train_loss": -5.964560508728027, "global_step": 64832, "epoch": 1543} {"train_loss": -5.984100341796875, "global_step": 64833, "epoch": 1543} {"train_loss": -5.986506462097168, "global_step": 64834, "epoch": 1543} {"train_loss": -5.911832809448242, "global_step": 64835, "epoch": 1543} {"train_loss": -5.91461181640625, "global_step": 64836, "epoch": 1543} {"train_loss": -5.984841823577881, "global_step": 64837, "epoch": 1543} {"train_loss": -5.957806587219238, "global_step": 64838, "epoch": 1543} {"train_loss": -6.011178016662598, "global_step": 64839, "epoch": 1543} {"train_loss": -5.998115539550781, "global_step": 64840, "epoch": 1543} {"train_loss": -5.992642402648926, "global_step": 64841, "epoch": 1543} {"train_loss": -5.989292144775391, "global_step": 64842, "epoch": 1543} {"train_loss": -5.983145236968994, "global_step": 64843, "epoch": 1543} {"train_loss": -5.976255416870117, "global_step": 64844, "epoch": 1543} {"train_loss": -6.057708740234375, "global_step": 64845, "epoch": 1543} {"train_loss": -5.975651264190674, "global_step": 64846, "epoch": 1543} {"train_loss": -5.947115273702712, "global_step": 64847, "epoch": 1543, "val_loss": 67137.2421875} {"train_loss": -5.859259605407715, "global_step": 64848, "epoch": 1544} {"train_loss": -6.004063606262207, "global_step": 64849, "epoch": 1544} {"train_loss": -5.938876628875732, "global_step": 64850, "epoch": 1544} {"train_loss": -5.938250541687012, "global_step": 64851, "epoch": 1544} {"train_loss": -5.998631000518799, "global_step": 64852, "epoch": 1544} {"train_loss": -5.957557201385498, "global_step": 64853, "epoch": 1544} {"train_loss": -6.033935070037842, "global_step": 64854, "epoch": 1544} {"train_loss": -5.936122894287109, "global_step": 64855, "epoch": 1544} {"train_loss": -5.967610836029053, "global_step": 64856, "epoch": 1544} {"train_loss": -5.931100368499756, "global_step": 64857, "epoch": 1544} {"train_loss": -5.9669294357299805, "global_step": 64858, "epoch": 1544} {"train_loss": -5.851225852966309, "global_step": 64859, "epoch": 1544} {"train_loss": -5.98759651184082, "global_step": 64860, "epoch": 1544} {"train_loss": -5.929266929626465, "global_step": 64861, "epoch": 1544} {"train_loss": -5.854107856750488, "global_step": 64862, "epoch": 1544} {"train_loss": -5.963013648986816, "global_step": 64863, "epoch": 1544} {"train_loss": -5.821693420410156, "global_step": 64864, "epoch": 1544} {"train_loss": -5.969757080078125, "global_step": 64865, "epoch": 1544} {"train_loss": -5.894564628601074, "global_step": 64866, "epoch": 1544} {"train_loss": -5.921313285827637, "global_step": 64867, "epoch": 1544} {"train_loss": -6.05653190612793, "global_step": 64868, "epoch": 1544} {"train_loss": -6.003777027130127, "global_step": 64869, "epoch": 1544} {"train_loss": -5.993185520172119, "global_step": 64870, "epoch": 1544} {"train_loss": -5.924544811248779, "global_step": 64871, "epoch": 1544} {"train_loss": -5.920103073120117, "global_step": 64872, "epoch": 1544} {"train_loss": -5.801390647888184, "global_step": 64873, "epoch": 1544} {"train_loss": -5.8830108642578125, "global_step": 64874, "epoch": 1544} {"train_loss": -5.878294467926025, "global_step": 64875, "epoch": 1544} {"train_loss": -5.907732963562012, "global_step": 64876, "epoch": 1544} {"train_loss": -5.900274276733398, "global_step": 64877, "epoch": 1544} {"train_loss": -5.937505722045898, "global_step": 64878, "epoch": 1544} {"train_loss": -5.884367942810059, "global_step": 64879, "epoch": 1544} {"train_loss": -5.934687614440918, "global_step": 64880, "epoch": 1544} {"train_loss": -5.991792678833008, "global_step": 64881, "epoch": 1544} {"train_loss": -6.073155403137207, "global_step": 64882, "epoch": 1544} {"train_loss": -6.008648872375488, "global_step": 64883, "epoch": 1544} {"train_loss": -6.0091753005981445, "global_step": 64884, "epoch": 1544} {"train_loss": -5.881474018096924, "global_step": 64885, "epoch": 1544} {"train_loss": -5.955833435058594, "global_step": 64886, "epoch": 1544} {"train_loss": -5.934081077575684, "global_step": 64887, "epoch": 1544} {"train_loss": -6.000481128692627, "global_step": 64888, "epoch": 1544} {"train_loss": -5.942985739026751, "global_step": 64889, "epoch": 1544, "val_loss": 67115.375} {"train_loss": -6.028622150421143, "global_step": 64890, "epoch": 1545} {"train_loss": -5.769105911254883, "global_step": 64891, "epoch": 1545} {"train_loss": -5.932596206665039, "global_step": 64892, "epoch": 1545} {"train_loss": -5.871188163757324, "global_step": 64893, "epoch": 1545} {"train_loss": -5.881466865539551, "global_step": 64894, "epoch": 1545} {"train_loss": -5.898266792297363, "global_step": 64895, "epoch": 1545} {"train_loss": -5.96306037902832, "global_step": 64896, "epoch": 1545} {"train_loss": -5.870462894439697, "global_step": 64897, "epoch": 1545} {"train_loss": -5.957313060760498, "global_step": 64898, "epoch": 1545} {"train_loss": -6.0964508056640625, "global_step": 64899, "epoch": 1545} {"train_loss": -5.9355926513671875, "global_step": 64900, "epoch": 1545} {"train_loss": -5.946041107177734, "global_step": 64901, "epoch": 1545} {"train_loss": -5.98392391204834, "global_step": 64902, "epoch": 1545} {"train_loss": -6.035284996032715, "global_step": 64903, "epoch": 1545} {"train_loss": -5.938076019287109, "global_step": 64904, "epoch": 1545} {"train_loss": -5.916228771209717, "global_step": 64905, "epoch": 1545} {"train_loss": -5.928442001342773, "global_step": 64906, "epoch": 1545} {"train_loss": -5.996854782104492, "global_step": 64907, "epoch": 1545} {"train_loss": -5.845528602600098, "global_step": 64908, "epoch": 1545} {"train_loss": -5.94029426574707, "global_step": 64909, "epoch": 1545} {"train_loss": -5.795232772827148, "global_step": 64910, "epoch": 1545} {"train_loss": -5.902495384216309, "global_step": 64911, "epoch": 1545} {"train_loss": -5.987880706787109, "global_step": 64912, "epoch": 1545} {"train_loss": -5.922525405883789, "global_step": 64913, "epoch": 1545} {"train_loss": -5.92563009262085, "global_step": 64914, "epoch": 1545} {"train_loss": -5.995450973510742, "global_step": 64915, "epoch": 1545} {"train_loss": -5.968384742736816, "global_step": 64916, "epoch": 1545} {"train_loss": -5.910351753234863, "global_step": 64917, "epoch": 1545} {"train_loss": -5.909210205078125, "global_step": 64918, "epoch": 1545} {"train_loss": -5.976798057556152, "global_step": 64919, "epoch": 1545} {"train_loss": -6.0065178871154785, "global_step": 64920, "epoch": 1545} {"train_loss": -5.986771106719971, "global_step": 64921, "epoch": 1545} {"train_loss": -5.8809967041015625, "global_step": 64922, "epoch": 1545} {"train_loss": -5.934654235839844, "global_step": 64923, "epoch": 1545} {"train_loss": -5.995849132537842, "global_step": 64924, "epoch": 1545} {"train_loss": -5.883010387420654, "global_step": 64925, "epoch": 1545} {"train_loss": -5.956065654754639, "global_step": 64926, "epoch": 1545} {"train_loss": -5.954476356506348, "global_step": 64927, "epoch": 1545} {"train_loss": -5.858394622802734, "global_step": 64928, "epoch": 1545} {"train_loss": -6.002888202667236, "global_step": 64929, "epoch": 1545} {"train_loss": -5.863041400909424, "global_step": 64930, "epoch": 1545} {"train_loss": -5.937329780487787, "global_step": 64931, "epoch": 1545, "val_loss": 67037.6328125} {"train_loss": -5.993738651275635, "global_step": 64932, "epoch": 1546} {"train_loss": -6.049116134643555, "global_step": 64933, "epoch": 1546} {"train_loss": -5.93170166015625, "global_step": 64934, "epoch": 1546} {"train_loss": -6.056184768676758, "global_step": 64935, "epoch": 1546} {"train_loss": -5.882495403289795, "global_step": 64936, "epoch": 1546} {"train_loss": -5.988656997680664, "global_step": 64937, "epoch": 1546} {"train_loss": -5.980407238006592, "global_step": 64938, "epoch": 1546} {"train_loss": -5.960766792297363, "global_step": 64939, "epoch": 1546} {"train_loss": -5.935564994812012, "global_step": 64940, "epoch": 1546} {"train_loss": -5.988049507141113, "global_step": 64941, "epoch": 1546} {"train_loss": -5.849236965179443, "global_step": 64942, "epoch": 1546} {"train_loss": -5.818083763122559, "global_step": 64943, "epoch": 1546} {"train_loss": -6.019607067108154, "global_step": 64944, "epoch": 1546} {"train_loss": -5.933791160583496, "global_step": 64945, "epoch": 1546} {"train_loss": -5.928959846496582, "global_step": 64946, "epoch": 1546} {"train_loss": -5.90767765045166, "global_step": 64947, "epoch": 1546} {"train_loss": -5.914424896240234, "global_step": 64948, "epoch": 1546} {"train_loss": -5.960453987121582, "global_step": 64949, "epoch": 1546} {"train_loss": -5.892279624938965, "global_step": 64950, "epoch": 1546} {"train_loss": -5.974483489990234, "global_step": 64951, "epoch": 1546} {"train_loss": -6.0017170906066895, "global_step": 64952, "epoch": 1546} {"train_loss": -6.018087387084961, "global_step": 64953, "epoch": 1546} {"train_loss": -6.0544114112854, "global_step": 64954, "epoch": 1546} {"train_loss": -5.975790023803711, "global_step": 64955, "epoch": 1546} {"train_loss": -5.829748153686523, "global_step": 64956, "epoch": 1546} {"train_loss": -5.959735870361328, "global_step": 64957, "epoch": 1546} {"train_loss": -5.938665390014648, "global_step": 64958, "epoch": 1546} {"train_loss": -5.814342975616455, "global_step": 64959, "epoch": 1546} {"train_loss": -5.976037979125977, "global_step": 64960, "epoch": 1546} {"train_loss": -5.979977607727051, "global_step": 64961, "epoch": 1546} {"train_loss": -5.988508701324463, "global_step": 64962, "epoch": 1546} {"train_loss": -5.7988128662109375, "global_step": 64963, "epoch": 1546} {"train_loss": -5.967004776000977, "global_step": 64964, "epoch": 1546} {"train_loss": -5.928730010986328, "global_step": 64965, "epoch": 1546} {"train_loss": -5.838950157165527, "global_step": 64966, "epoch": 1546} {"train_loss": -5.899847984313965, "global_step": 64967, "epoch": 1546} {"train_loss": -5.959719657897949, "global_step": 64968, "epoch": 1546} {"train_loss": -6.040829181671143, "global_step": 64969, "epoch": 1546} {"train_loss": -6.036956310272217, "global_step": 64970, "epoch": 1546} {"train_loss": -5.973029136657715, "global_step": 64971, "epoch": 1546} {"train_loss": -5.922322750091553, "global_step": 64972, "epoch": 1546} {"train_loss": -5.947610832396007, "global_step": 64973, "epoch": 1546, "val_loss": 67065.7265625} {"train_loss": -5.970127105712891, "global_step": 64974, "epoch": 1547} {"train_loss": -5.921992301940918, "global_step": 64975, "epoch": 1547} {"train_loss": -6.100454330444336, "global_step": 64976, "epoch": 1547} {"train_loss": -5.9282684326171875, "global_step": 64977, "epoch": 1547} {"train_loss": -5.93949556350708, "global_step": 64978, "epoch": 1547} {"train_loss": -6.04449462890625, "global_step": 64979, "epoch": 1547} {"train_loss": -5.902813911437988, "global_step": 64980, "epoch": 1547} {"train_loss": -6.011916160583496, "global_step": 64981, "epoch": 1547} {"train_loss": -5.860569000244141, "global_step": 64982, "epoch": 1547} {"train_loss": -5.804381370544434, "global_step": 64983, "epoch": 1547} {"train_loss": -5.938233852386475, "global_step": 64984, "epoch": 1547} {"train_loss": -5.921914100646973, "global_step": 64985, "epoch": 1547} {"train_loss": -5.782349109649658, "global_step": 64986, "epoch": 1547} {"train_loss": -5.998856544494629, "global_step": 64987, "epoch": 1547} {"train_loss": -5.958685874938965, "global_step": 64988, "epoch": 1547} {"train_loss": -5.951272964477539, "global_step": 64989, "epoch": 1547} {"train_loss": -5.878566741943359, "global_step": 64990, "epoch": 1547} {"train_loss": -5.965388774871826, "global_step": 64991, "epoch": 1547} {"train_loss": -5.999558448791504, "global_step": 64992, "epoch": 1547} {"train_loss": -5.968505859375, "global_step": 64993, "epoch": 1547} {"train_loss": -6.013416290283203, "global_step": 64994, "epoch": 1547} {"train_loss": -5.9115891456604, "global_step": 64995, "epoch": 1547} {"train_loss": -5.83975076675415, "global_step": 64996, "epoch": 1547} {"train_loss": -5.9631667137146, "global_step": 64997, "epoch": 1547} {"train_loss": -5.988032341003418, "global_step": 64998, "epoch": 1547} {"train_loss": -5.89047908782959, "global_step": 64999, "epoch": 1547} {"train_loss": -5.884169578552246, "global_step": 65000, "epoch": 1547} {"train_loss": -6.003636360168457, "global_step": 65001, "epoch": 1547} {"train_loss": -5.802640914916992, "global_step": 65002, "epoch": 1547} {"train_loss": -5.827507019042969, "global_step": 65003, "epoch": 1547} {"train_loss": -5.875831604003906, "global_step": 65004, "epoch": 1547} {"train_loss": -6.043952941894531, "global_step": 65005, "epoch": 1547} {"train_loss": -5.909574508666992, "global_step": 65006, "epoch": 1547} {"train_loss": -5.831368446350098, "global_step": 65007, "epoch": 1547} {"train_loss": -5.9056396484375, "global_step": 65008, "epoch": 1547} {"train_loss": -6.039854049682617, "global_step": 65009, "epoch": 1547} {"train_loss": -5.999238014221191, "global_step": 65010, "epoch": 1547} {"train_loss": -5.803402900695801, "global_step": 65011, "epoch": 1547} {"train_loss": -5.99111795425415, "global_step": 65012, "epoch": 1547} {"train_loss": -5.949258804321289, "global_step": 65013, "epoch": 1547} {"train_loss": -5.886667251586914, "global_step": 65014, "epoch": 1547} {"train_loss": -5.931583256948562, "global_step": 65015, "epoch": 1547, "val_loss": 67235.3984375} {"train_loss": -5.904526710510254, "global_step": 65016, "epoch": 1548} {"train_loss": -6.027772903442383, "global_step": 65017, "epoch": 1548} {"train_loss": -5.915194511413574, "global_step": 65018, "epoch": 1548} {"train_loss": -5.930343151092529, "global_step": 65019, "epoch": 1548} {"train_loss": -6.049778938293457, "global_step": 65020, "epoch": 1548} {"train_loss": -5.866168975830078, "global_step": 65021, "epoch": 1548} {"train_loss": -5.96130895614624, "global_step": 65022, "epoch": 1548} {"train_loss": -5.841609954833984, "global_step": 65023, "epoch": 1548} {"train_loss": -6.001858234405518, "global_step": 65024, "epoch": 1548} {"train_loss": -5.976996421813965, "global_step": 65025, "epoch": 1548} {"train_loss": -5.905881881713867, "global_step": 65026, "epoch": 1548} {"train_loss": -5.939210414886475, "global_step": 65027, "epoch": 1548} {"train_loss": -5.941441059112549, "global_step": 65028, "epoch": 1548} {"train_loss": -5.9077372550964355, "global_step": 65029, "epoch": 1548} {"train_loss": -6.002185821533203, "global_step": 65030, "epoch": 1548} {"train_loss": -5.86671781539917, "global_step": 65031, "epoch": 1548} {"train_loss": -6.0912275314331055, "global_step": 65032, "epoch": 1548} {"train_loss": -5.857790470123291, "global_step": 65033, "epoch": 1548} {"train_loss": -5.891139984130859, "global_step": 65034, "epoch": 1548} {"train_loss": -5.859989166259766, "global_step": 65035, "epoch": 1548} {"train_loss": -5.785303115844727, "global_step": 65036, "epoch": 1548} {"train_loss": -6.04170560836792, "global_step": 65037, "epoch": 1548} {"train_loss": -5.901180267333984, "global_step": 65038, "epoch": 1548} {"train_loss": -5.92500114440918, "global_step": 65039, "epoch": 1548} {"train_loss": -5.891337871551514, "global_step": 65040, "epoch": 1548} {"train_loss": -5.818211555480957, "global_step": 65041, "epoch": 1548} {"train_loss": -5.877934455871582, "global_step": 65042, "epoch": 1548} {"train_loss": -5.775092124938965, "global_step": 65043, "epoch": 1548} {"train_loss": -5.973973274230957, "global_step": 65044, "epoch": 1548} {"train_loss": -5.837413787841797, "global_step": 65045, "epoch": 1548} {"train_loss": -5.874090194702148, "global_step": 65046, "epoch": 1548} {"train_loss": -5.969161033630371, "global_step": 65047, "epoch": 1548} {"train_loss": -5.89309549331665, "global_step": 65048, "epoch": 1548} {"train_loss": -5.913266181945801, "global_step": 65049, "epoch": 1548} {"train_loss": -5.993431091308594, "global_step": 65050, "epoch": 1548} {"train_loss": -5.804235458374023, "global_step": 65051, "epoch": 1548} {"train_loss": -6.009003162384033, "global_step": 65052, "epoch": 1548} {"train_loss": -5.904899597167969, "global_step": 65053, "epoch": 1548} {"train_loss": -6.034709930419922, "global_step": 65054, "epoch": 1548} {"train_loss": -5.969250679016113, "global_step": 65055, "epoch": 1548} {"train_loss": -6.032721996307373, "global_step": 65056, "epoch": 1548} {"train_loss": -5.9266597884041925, "global_step": 65057, "epoch": 1548, "val_loss": 66785.2265625} {"train_loss": -5.887316703796387, "global_step": 65058, "epoch": 1549} {"train_loss": -5.860962867736816, "global_step": 65059, "epoch": 1549} {"train_loss": -5.849458694458008, "global_step": 65060, "epoch": 1549} {"train_loss": -5.923526763916016, "global_step": 65061, "epoch": 1549} {"train_loss": -6.067019462585449, "global_step": 65062, "epoch": 1549} {"train_loss": -5.925516128540039, "global_step": 65063, "epoch": 1549} {"train_loss": -5.889189720153809, "global_step": 65064, "epoch": 1549} {"train_loss": -5.979006767272949, "global_step": 65065, "epoch": 1549} {"train_loss": -5.828464984893799, "global_step": 65066, "epoch": 1549} {"train_loss": -6.022083282470703, "global_step": 65067, "epoch": 1549} {"train_loss": -5.900937557220459, "global_step": 65068, "epoch": 1549} {"train_loss": -5.968780994415283, "global_step": 65069, "epoch": 1549} {"train_loss": -6.011362075805664, "global_step": 65070, "epoch": 1549} {"train_loss": -5.963802337646484, "global_step": 65071, "epoch": 1549} {"train_loss": -5.935009002685547, "global_step": 65072, "epoch": 1549} {"train_loss": -5.849368095397949, "global_step": 65073, "epoch": 1549} {"train_loss": -5.983370780944824, "global_step": 65074, "epoch": 1549} {"train_loss": -5.860828399658203, "global_step": 65075, "epoch": 1549} {"train_loss": -6.057240962982178, "global_step": 65076, "epoch": 1549} {"train_loss": -5.747101783752441, "global_step": 65077, "epoch": 1549} {"train_loss": -6.108156681060791, "global_step": 65078, "epoch": 1549} {"train_loss": -5.975748538970947, "global_step": 65079, "epoch": 1549} {"train_loss": -5.840066909790039, "global_step": 65080, "epoch": 1549} {"train_loss": -5.954301834106445, "global_step": 65081, "epoch": 1549} {"train_loss": -5.933065414428711, "global_step": 65082, "epoch": 1549} {"train_loss": -5.914471626281738, "global_step": 65083, "epoch": 1549} {"train_loss": -6.009517669677734, "global_step": 65084, "epoch": 1549} {"train_loss": -5.935793876647949, "global_step": 65085, "epoch": 1549} {"train_loss": -5.946799278259277, "global_step": 65086, "epoch": 1549} {"train_loss": -5.981814861297607, "global_step": 65087, "epoch": 1549} {"train_loss": -5.895116329193115, "global_step": 65088, "epoch": 1549} {"train_loss": -5.971540451049805, "global_step": 65089, "epoch": 1549} {"train_loss": -5.9354047775268555, "global_step": 65090, "epoch": 1549} {"train_loss": -6.038104057312012, "global_step": 65091, "epoch": 1549} {"train_loss": -5.911345958709717, "global_step": 65092, "epoch": 1549} {"train_loss": -5.953912734985352, "global_step": 65093, "epoch": 1549} {"train_loss": -5.932732105255127, "global_step": 65094, "epoch": 1549} {"train_loss": -6.002155303955078, "global_step": 65095, "epoch": 1549} {"train_loss": -5.994022369384766, "global_step": 65096, "epoch": 1549} {"train_loss": -5.958760738372803, "global_step": 65097, "epoch": 1549} {"train_loss": -5.881622791290283, "global_step": 65098, "epoch": 1549} {"train_loss": -5.941361733845302, "global_step": 65099, "epoch": 1549, "val_loss": 67188.71875} {"train_loss": -5.987967491149902, "global_step": 65100, "epoch": 1550} {"train_loss": -5.896927356719971, "global_step": 65101, "epoch": 1550} {"train_loss": -5.89881706237793, "global_step": 65102, "epoch": 1550} {"train_loss": -5.89644718170166, "global_step": 65103, "epoch": 1550} {"train_loss": -5.893036365509033, "global_step": 65104, "epoch": 1550} {"train_loss": -6.042553901672363, "global_step": 65105, "epoch": 1550} {"train_loss": -6.046561241149902, "global_step": 65106, "epoch": 1550} {"train_loss": -5.985208511352539, "global_step": 65107, "epoch": 1550} {"train_loss": -5.878696441650391, "global_step": 65108, "epoch": 1550} {"train_loss": -5.99497127532959, "global_step": 65109, "epoch": 1550} {"train_loss": -5.930967807769775, "global_step": 65110, "epoch": 1550} {"train_loss": -5.823027610778809, "global_step": 65111, "epoch": 1550} {"train_loss": -5.840239524841309, "global_step": 65112, "epoch": 1550} {"train_loss": -6.075198173522949, "global_step": 65113, "epoch": 1550} {"train_loss": -5.868294715881348, "global_step": 65114, "epoch": 1550} {"train_loss": -6.008502006530762, "global_step": 65115, "epoch": 1550} {"train_loss": -5.907410621643066, "global_step": 65116, "epoch": 1550} {"train_loss": -5.873987197875977, "global_step": 65117, "epoch": 1550} {"train_loss": -5.943764686584473, "global_step": 65118, "epoch": 1550} {"train_loss": -5.919789791107178, "global_step": 65119, "epoch": 1550} {"train_loss": -5.8685150146484375, "global_step": 65120, "epoch": 1550} {"train_loss": -5.916207313537598, "global_step": 65121, "epoch": 1550} {"train_loss": -6.033514022827148, "global_step": 65122, "epoch": 1550} {"train_loss": -5.8124895095825195, "global_step": 65123, "epoch": 1550} {"train_loss": -5.937856674194336, "global_step": 65124, "epoch": 1550} {"train_loss": -5.916177749633789, "global_step": 65125, "epoch": 1550} {"train_loss": -5.883129596710205, "global_step": 65126, "epoch": 1550} {"train_loss": -5.825477600097656, "global_step": 65127, "epoch": 1550} {"train_loss": -6.035885810852051, "global_step": 65128, "epoch": 1550} {"train_loss": -5.887368202209473, "global_step": 65129, "epoch": 1550} {"train_loss": -6.0461530685424805, "global_step": 65130, "epoch": 1550} {"train_loss": -6.0270771980285645, "global_step": 65131, "epoch": 1550} {"train_loss": -5.897012710571289, "global_step": 65132, "epoch": 1550} {"train_loss": -5.960246562957764, "global_step": 65133, "epoch": 1550} {"train_loss": -6.087970733642578, "global_step": 65134, "epoch": 1550} {"train_loss": -5.926374435424805, "global_step": 65135, "epoch": 1550} {"train_loss": -6.0528340339660645, "global_step": 65136, "epoch": 1550} {"train_loss": -6.013116359710693, "global_step": 65137, "epoch": 1550} {"train_loss": -5.972014427185059, "global_step": 65138, "epoch": 1550} {"train_loss": -6.111687660217285, "global_step": 65139, "epoch": 1550} {"train_loss": -5.88137674331665, "global_step": 65140, "epoch": 1550} {"train_loss": -5.948334659848895, "global_step": 65141, "epoch": 1550, "train/sim_max_reward_0": 0.23744851131641234, "train/sim_max_reward_1": 0.8911367302846601, "train/sim_max_reward_2": 0.7969567366281621, "train/sim_max_reward_3": 0.1618647802096346, "train/sim_max_reward_4": 0.7777793226698547, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.14534706747975512, "test/sim_max_reward_4400001": 0.7505426917024017, "test/sim_max_reward_4400002": 0.055687140942149466, "test/sim_max_reward_4400003": 0.7120411023476304, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.48153021136747026, "test/sim_max_reward_4400006": 0.6248831995335654, "test/sim_max_reward_4400007": 0.023562590220815787, "test/sim_max_reward_4400008": 0.2995603376159385, "test/sim_max_reward_4400009": 0.8184027932295851, "test/sim_max_reward_4400010": 0.2433959191684075, "test/sim_max_reward_4400011": 0.18520502200370814, "test/sim_max_reward_4400012": 0.8324140960192726, "test/sim_max_reward_4400013": 0.8357832160710674, "test/sim_max_reward_4400014": 0.5940792248574245, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2936562426140448, "test/sim_max_reward_4400019": 0.049276384997068816, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.16529015765625485, "test/sim_max_reward_4400023": 0.554905842113348, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.21286220899410505, "test/sim_max_reward_4400026": 0.765734351322861, "test/sim_max_reward_4400027": 2.1279810611219842e-05, "test/sim_max_reward_4400028": 0.3719326676419366, "test/sim_max_reward_4400029": 2.38042056957157e-05, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.8528961136012522, "test/sim_max_reward_4400032": 0.13538245428936088, "test/sim_max_reward_4400033": 0.3656726215727734, "test/sim_max_reward_4400034": 0.7422233680547319, "test/sim_max_reward_4400035": 0.8027635221087622, "test/sim_max_reward_4400036": 0.7550897487921373, "test/sim_max_reward_4400037": 0.9065581243197798, "test/sim_max_reward_4400038": 0.11274553550446303, "test/sim_max_reward_4400039": 0.580536737159448, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7685746816863394, "test/sim_max_reward_4400042": 0.5749123974267586, "test/sim_max_reward_4400043": 0.7112662159516379, "test/sim_max_reward_4400044": 0.9070451525350492, "test/sim_max_reward_4400045": 0.799982032948417, "test/sim_max_reward_4400046": 0.4821462069486741, "test/sim_max_reward_4400047": 0.8536355652883816, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.9910626910177728, "train/mean_score": 0.5096951400784852, "test/mean_score": 0.4386075524784544, "val_loss": 66972.9765625} {"train_loss": -5.972878456115723, "global_step": 65142, "epoch": 1551} {"train_loss": -5.925389289855957, "global_step": 65143, "epoch": 1551} {"train_loss": -6.000860214233398, "global_step": 65144, "epoch": 1551} {"train_loss": -6.043880939483643, "global_step": 65145, "epoch": 1551} {"train_loss": -5.82680606842041, "global_step": 65146, "epoch": 1551} {"train_loss": -6.069103240966797, "global_step": 65147, "epoch": 1551} {"train_loss": -5.955984115600586, "global_step": 65148, "epoch": 1551} {"train_loss": -5.989579677581787, "global_step": 65149, "epoch": 1551} {"train_loss": -6.047549247741699, "global_step": 65150, "epoch": 1551} {"train_loss": -5.892526626586914, "global_step": 65151, "epoch": 1551} {"train_loss": -5.8135786056518555, "global_step": 65152, "epoch": 1551} {"train_loss": -6.028547286987305, "global_step": 65153, "epoch": 1551} {"train_loss": -5.969754219055176, "global_step": 65154, "epoch": 1551} {"train_loss": -5.964875221252441, "global_step": 65155, "epoch": 1551} {"train_loss": -5.999977111816406, "global_step": 65156, "epoch": 1551} {"train_loss": -5.8559675216674805, "global_step": 65157, "epoch": 1551} {"train_loss": -5.909884929656982, "global_step": 65158, "epoch": 1551} {"train_loss": -6.049243927001953, "global_step": 65159, "epoch": 1551} {"train_loss": -6.016570568084717, "global_step": 65160, "epoch": 1551} {"train_loss": -5.956276893615723, "global_step": 65161, "epoch": 1551} {"train_loss": -5.998129844665527, "global_step": 65162, "epoch": 1551} {"train_loss": -5.919232368469238, "global_step": 65163, "epoch": 1551} {"train_loss": -5.977840423583984, "global_step": 65164, "epoch": 1551} {"train_loss": -5.773618698120117, "global_step": 65165, "epoch": 1551} {"train_loss": -5.863590717315674, "global_step": 65166, "epoch": 1551} {"train_loss": -6.02932071685791, "global_step": 65167, "epoch": 1551} {"train_loss": -5.9114227294921875, "global_step": 65168, "epoch": 1551} {"train_loss": -5.8042120933532715, "global_step": 65169, "epoch": 1551} {"train_loss": -5.945385932922363, "global_step": 65170, "epoch": 1551} {"train_loss": -5.847803115844727, "global_step": 65171, "epoch": 1551} {"train_loss": -5.8913726806640625, "global_step": 65172, "epoch": 1551} {"train_loss": -6.02146053314209, "global_step": 65173, "epoch": 1551} {"train_loss": -5.868694305419922, "global_step": 65174, "epoch": 1551} {"train_loss": -5.853222846984863, "global_step": 65175, "epoch": 1551} {"train_loss": -5.972540378570557, "global_step": 65176, "epoch": 1551} {"train_loss": -5.945483207702637, "global_step": 65177, "epoch": 1551} {"train_loss": -6.016837120056152, "global_step": 65178, "epoch": 1551} {"train_loss": -6.036116123199463, "global_step": 65179, "epoch": 1551} {"train_loss": -5.974761962890625, "global_step": 65180, "epoch": 1551} {"train_loss": -5.954306602478027, "global_step": 65181, "epoch": 1551} {"train_loss": -5.931488990783691, "global_step": 65182, "epoch": 1551} {"train_loss": -5.94820609546843, "global_step": 65183, "epoch": 1551, "val_loss": 67029.578125} {"train_loss": -5.902994632720947, "global_step": 65184, "epoch": 1552} {"train_loss": -6.002544403076172, "global_step": 65185, "epoch": 1552} {"train_loss": -6.06913948059082, "global_step": 65186, "epoch": 1552} {"train_loss": -5.95556116104126, "global_step": 65187, "epoch": 1552} {"train_loss": -5.957669258117676, "global_step": 65188, "epoch": 1552} {"train_loss": -6.052257061004639, "global_step": 65189, "epoch": 1552} {"train_loss": -5.971634864807129, "global_step": 65190, "epoch": 1552} {"train_loss": -5.88832950592041, "global_step": 65191, "epoch": 1552} {"train_loss": -6.046601295471191, "global_step": 65192, "epoch": 1552} {"train_loss": -6.008195877075195, "global_step": 65193, "epoch": 1552} {"train_loss": -5.9979119300842285, "global_step": 65194, "epoch": 1552} {"train_loss": -6.0142083168029785, "global_step": 65195, "epoch": 1552} {"train_loss": -5.8895063400268555, "global_step": 65196, "epoch": 1552} {"train_loss": -5.983292102813721, "global_step": 65197, "epoch": 1552} {"train_loss": -6.0257744789123535, "global_step": 65198, "epoch": 1552} {"train_loss": -5.96403694152832, "global_step": 65199, "epoch": 1552} {"train_loss": -5.910778045654297, "global_step": 65200, "epoch": 1552} {"train_loss": -5.902134895324707, "global_step": 65201, "epoch": 1552} {"train_loss": -5.978293418884277, "global_step": 65202, "epoch": 1552} {"train_loss": -5.9608564376831055, "global_step": 65203, "epoch": 1552} {"train_loss": -5.905460357666016, "global_step": 65204, "epoch": 1552} {"train_loss": -5.924344062805176, "global_step": 65205, "epoch": 1552} {"train_loss": -5.8916778564453125, "global_step": 65206, "epoch": 1552} {"train_loss": -5.98942756652832, "global_step": 65207, "epoch": 1552} {"train_loss": -6.077610015869141, "global_step": 65208, "epoch": 1552} {"train_loss": -5.862967491149902, "global_step": 65209, "epoch": 1552} {"train_loss": -6.05226993560791, "global_step": 65210, "epoch": 1552} {"train_loss": -6.048022270202637, "global_step": 65211, "epoch": 1552} {"train_loss": -6.012609958648682, "global_step": 65212, "epoch": 1552} {"train_loss": -5.975261211395264, "global_step": 65213, "epoch": 1552} {"train_loss": -6.025174140930176, "global_step": 65214, "epoch": 1552} {"train_loss": -5.955350875854492, "global_step": 65215, "epoch": 1552} {"train_loss": -5.835893154144287, "global_step": 65216, "epoch": 1552} {"train_loss": -6.025096416473389, "global_step": 65217, "epoch": 1552} {"train_loss": -5.99547815322876, "global_step": 65218, "epoch": 1552} {"train_loss": -5.943627834320068, "global_step": 65219, "epoch": 1552} {"train_loss": -5.962400913238525, "global_step": 65220, "epoch": 1552} {"train_loss": -5.890419960021973, "global_step": 65221, "epoch": 1552} {"train_loss": -5.963379383087158, "global_step": 65222, "epoch": 1552} {"train_loss": -5.954659938812256, "global_step": 65223, "epoch": 1552} {"train_loss": -5.920309066772461, "global_step": 65224, "epoch": 1552} {"train_loss": -5.968021370115734, "global_step": 65225, "epoch": 1552, "val_loss": 67103.8046875} {"train_loss": -5.862529754638672, "global_step": 65226, "epoch": 1553} {"train_loss": -5.90984582901001, "global_step": 65227, "epoch": 1553} {"train_loss": -6.069289207458496, "global_step": 65228, "epoch": 1553} {"train_loss": -5.974474906921387, "global_step": 65229, "epoch": 1553} {"train_loss": -5.9134840965271, "global_step": 65230, "epoch": 1553} {"train_loss": -5.9514265060424805, "global_step": 65231, "epoch": 1553} {"train_loss": -6.036861896514893, "global_step": 65232, "epoch": 1553} {"train_loss": -6.078259468078613, "global_step": 65233, "epoch": 1553} {"train_loss": -5.968213081359863, "global_step": 65234, "epoch": 1553} {"train_loss": -6.028267860412598, "global_step": 65235, "epoch": 1553} {"train_loss": -6.03138542175293, "global_step": 65236, "epoch": 1553} {"train_loss": -5.907926559448242, "global_step": 65237, "epoch": 1553} {"train_loss": -5.965551853179932, "global_step": 65238, "epoch": 1553} {"train_loss": -6.006860733032227, "global_step": 65239, "epoch": 1553} {"train_loss": -5.793205261230469, "global_step": 65240, "epoch": 1553} {"train_loss": -5.851614952087402, "global_step": 65241, "epoch": 1553} {"train_loss": -5.908404350280762, "global_step": 65242, "epoch": 1553} {"train_loss": -5.805052757263184, "global_step": 65243, "epoch": 1553} {"train_loss": -6.057461261749268, "global_step": 65244, "epoch": 1553} {"train_loss": -5.792954444885254, "global_step": 65245, "epoch": 1553} {"train_loss": -5.954704284667969, "global_step": 65246, "epoch": 1553} {"train_loss": -6.035294055938721, "global_step": 65247, "epoch": 1553} {"train_loss": -5.88613748550415, "global_step": 65248, "epoch": 1553} {"train_loss": -5.945865631103516, "global_step": 65249, "epoch": 1553} {"train_loss": -5.964629173278809, "global_step": 65250, "epoch": 1553} {"train_loss": -6.0095415115356445, "global_step": 65251, "epoch": 1553} {"train_loss": -5.99070405960083, "global_step": 65252, "epoch": 1553} {"train_loss": -5.920069694519043, "global_step": 65253, "epoch": 1553} {"train_loss": -5.986623764038086, "global_step": 65254, "epoch": 1553} {"train_loss": -5.942420959472656, "global_step": 65255, "epoch": 1553} {"train_loss": -5.89955472946167, "global_step": 65256, "epoch": 1553} {"train_loss": -5.965289115905762, "global_step": 65257, "epoch": 1553} {"train_loss": -5.999534606933594, "global_step": 65258, "epoch": 1553} {"train_loss": -5.944031715393066, "global_step": 65259, "epoch": 1553} {"train_loss": -5.974186897277832, "global_step": 65260, "epoch": 1553} {"train_loss": -5.974454402923584, "global_step": 65261, "epoch": 1553} {"train_loss": -6.032930374145508, "global_step": 65262, "epoch": 1553} {"train_loss": -5.853947639465332, "global_step": 65263, "epoch": 1553} {"train_loss": -6.002861976623535, "global_step": 65264, "epoch": 1553} {"train_loss": -5.912962913513184, "global_step": 65265, "epoch": 1553} {"train_loss": -5.934299945831299, "global_step": 65266, "epoch": 1553} {"train_loss": -5.951583805538359, "global_step": 65267, "epoch": 1553, "val_loss": 67086.96875} {"train_loss": -6.002695560455322, "global_step": 65268, "epoch": 1554} {"train_loss": -5.972728252410889, "global_step": 65269, "epoch": 1554} {"train_loss": -5.989776611328125, "global_step": 65270, "epoch": 1554} {"train_loss": -5.851305961608887, "global_step": 65271, "epoch": 1554} {"train_loss": -6.032472610473633, "global_step": 65272, "epoch": 1554} {"train_loss": -5.810965061187744, "global_step": 65273, "epoch": 1554} {"train_loss": -5.889333724975586, "global_step": 65274, "epoch": 1554} {"train_loss": -6.048213005065918, "global_step": 65275, "epoch": 1554} {"train_loss": -5.926386833190918, "global_step": 65276, "epoch": 1554} {"train_loss": -5.854168891906738, "global_step": 65277, "epoch": 1554} {"train_loss": -5.919951438903809, "global_step": 65278, "epoch": 1554} {"train_loss": -6.043605327606201, "global_step": 65279, "epoch": 1554} {"train_loss": -5.79487943649292, "global_step": 65280, "epoch": 1554} {"train_loss": -5.922634124755859, "global_step": 65281, "epoch": 1554} {"train_loss": -5.85159969329834, "global_step": 65282, "epoch": 1554} {"train_loss": -5.95755672454834, "global_step": 65283, "epoch": 1554} {"train_loss": -5.937060356140137, "global_step": 65284, "epoch": 1554} {"train_loss": -5.900134086608887, "global_step": 65285, "epoch": 1554} {"train_loss": -5.934327125549316, "global_step": 65286, "epoch": 1554} {"train_loss": -6.037418365478516, "global_step": 65287, "epoch": 1554} {"train_loss": -5.8290557861328125, "global_step": 65288, "epoch": 1554} {"train_loss": -5.94639778137207, "global_step": 65289, "epoch": 1554} {"train_loss": -5.878870487213135, "global_step": 65290, "epoch": 1554} {"train_loss": -5.950495719909668, "global_step": 65291, "epoch": 1554} {"train_loss": -5.929041862487793, "global_step": 65292, "epoch": 1554} {"train_loss": -5.954470157623291, "global_step": 65293, "epoch": 1554} {"train_loss": -5.870951175689697, "global_step": 65294, "epoch": 1554} {"train_loss": -5.957637786865234, "global_step": 65295, "epoch": 1554} {"train_loss": -5.951748847961426, "global_step": 65296, "epoch": 1554} {"train_loss": -6.038800239562988, "global_step": 65297, "epoch": 1554} {"train_loss": -5.844714164733887, "global_step": 65298, "epoch": 1554} {"train_loss": -5.97959566116333, "global_step": 65299, "epoch": 1554} {"train_loss": -5.962771415710449, "global_step": 65300, "epoch": 1554} {"train_loss": -6.010988235473633, "global_step": 65301, "epoch": 1554} {"train_loss": -6.034759998321533, "global_step": 65302, "epoch": 1554} {"train_loss": -5.992868900299072, "global_step": 65303, "epoch": 1554} {"train_loss": -6.066989898681641, "global_step": 65304, "epoch": 1554} {"train_loss": -5.9037065505981445, "global_step": 65305, "epoch": 1554} {"train_loss": -6.02073860168457, "global_step": 65306, "epoch": 1554} {"train_loss": -5.937475204467773, "global_step": 65307, "epoch": 1554} {"train_loss": -5.884190559387207, "global_step": 65308, "epoch": 1554} {"train_loss": -5.941094296319144, "global_step": 65309, "epoch": 1554, "val_loss": 67122.6484375} {"train_loss": -5.877988338470459, "global_step": 65310, "epoch": 1555} {"train_loss": -5.822030067443848, "global_step": 65311, "epoch": 1555} {"train_loss": -5.854883193969727, "global_step": 65312, "epoch": 1555} {"train_loss": -5.8984904289245605, "global_step": 65313, "epoch": 1555} {"train_loss": -5.897390365600586, "global_step": 65314, "epoch": 1555} {"train_loss": -5.97776985168457, "global_step": 65315, "epoch": 1555} {"train_loss": -5.904021263122559, "global_step": 65316, "epoch": 1555} {"train_loss": -6.0003981590271, "global_step": 65317, "epoch": 1555} {"train_loss": -5.913807392120361, "global_step": 65318, "epoch": 1555} {"train_loss": -6.014776229858398, "global_step": 65319, "epoch": 1555} {"train_loss": -5.987877368927002, "global_step": 65320, "epoch": 1555} {"train_loss": -5.952461242675781, "global_step": 65321, "epoch": 1555} {"train_loss": -5.954553604125977, "global_step": 65322, "epoch": 1555} {"train_loss": -5.888006210327148, "global_step": 65323, "epoch": 1555} {"train_loss": -6.105525970458984, "global_step": 65324, "epoch": 1555} {"train_loss": -5.9826202392578125, "global_step": 65325, "epoch": 1555} {"train_loss": -6.030603408813477, "global_step": 65326, "epoch": 1555} {"train_loss": -6.06370735168457, "global_step": 65327, "epoch": 1555} {"train_loss": -6.08497953414917, "global_step": 65328, "epoch": 1555} {"train_loss": -5.979762554168701, "global_step": 65329, "epoch": 1555} {"train_loss": -5.904825687408447, "global_step": 65330, "epoch": 1555} {"train_loss": -6.108055114746094, "global_step": 65331, "epoch": 1555} {"train_loss": -6.113917350769043, "global_step": 65332, "epoch": 1555} {"train_loss": -5.99698543548584, "global_step": 65333, "epoch": 1555} {"train_loss": -5.960707664489746, "global_step": 65334, "epoch": 1555} {"train_loss": -6.084076881408691, "global_step": 65335, "epoch": 1555} {"train_loss": -5.888401031494141, "global_step": 65336, "epoch": 1555} {"train_loss": -6.112037658691406, "global_step": 65337, "epoch": 1555} {"train_loss": -5.865920066833496, "global_step": 65338, "epoch": 1555} {"train_loss": -5.9770355224609375, "global_step": 65339, "epoch": 1555} {"train_loss": -5.979915618896484, "global_step": 65340, "epoch": 1555} {"train_loss": -5.916177749633789, "global_step": 65341, "epoch": 1555} {"train_loss": -5.901864051818848, "global_step": 65342, "epoch": 1555} {"train_loss": -6.000489234924316, "global_step": 65343, "epoch": 1555} {"train_loss": -5.92714786529541, "global_step": 65344, "epoch": 1555} {"train_loss": -6.001083850860596, "global_step": 65345, "epoch": 1555} {"train_loss": -5.9326934814453125, "global_step": 65346, "epoch": 1555} {"train_loss": -5.742398262023926, "global_step": 65347, "epoch": 1555} {"train_loss": -5.9916157722473145, "global_step": 65348, "epoch": 1555} {"train_loss": -5.9175705909729, "global_step": 65349, "epoch": 1555} {"train_loss": -6.030673980712891, "global_step": 65350, "epoch": 1555} {"train_loss": -5.965609834307716, "global_step": 65351, "epoch": 1555, "val_loss": 67165.7421875} {"train_loss": -5.827663421630859, "global_step": 65352, "epoch": 1556} {"train_loss": -6.13007926940918, "global_step": 65353, "epoch": 1556} {"train_loss": -5.700335502624512, "global_step": 65354, "epoch": 1556} {"train_loss": -5.954564094543457, "global_step": 65355, "epoch": 1556} {"train_loss": -5.943262100219727, "global_step": 65356, "epoch": 1556} {"train_loss": -5.894952774047852, "global_step": 65357, "epoch": 1556} {"train_loss": -5.846822261810303, "global_step": 65358, "epoch": 1556} {"train_loss": -5.938137054443359, "global_step": 65359, "epoch": 1556} {"train_loss": -6.025246620178223, "global_step": 65360, "epoch": 1556} {"train_loss": -5.777205467224121, "global_step": 65361, "epoch": 1556} {"train_loss": -5.803114891052246, "global_step": 65362, "epoch": 1556} {"train_loss": -5.807900428771973, "global_step": 65363, "epoch": 1556} {"train_loss": -6.029439926147461, "global_step": 65364, "epoch": 1556} {"train_loss": -6.031532287597656, "global_step": 65365, "epoch": 1556} {"train_loss": -5.942964553833008, "global_step": 65366, "epoch": 1556} {"train_loss": -5.809391021728516, "global_step": 65367, "epoch": 1556} {"train_loss": -5.911957740783691, "global_step": 65368, "epoch": 1556} {"train_loss": -5.98177433013916, "global_step": 65369, "epoch": 1556} {"train_loss": -5.941769599914551, "global_step": 65370, "epoch": 1556} {"train_loss": -5.878776550292969, "global_step": 65371, "epoch": 1556} {"train_loss": -5.958276271820068, "global_step": 65372, "epoch": 1556} {"train_loss": -5.828542709350586, "global_step": 65373, "epoch": 1556} {"train_loss": -5.824171543121338, "global_step": 65374, "epoch": 1556} {"train_loss": -5.9216108322143555, "global_step": 65375, "epoch": 1556} {"train_loss": -5.9865007400512695, "global_step": 65376, "epoch": 1556} {"train_loss": -6.04459285736084, "global_step": 65377, "epoch": 1556} {"train_loss": -6.0660529136657715, "global_step": 65378, "epoch": 1556} {"train_loss": -6.012009620666504, "global_step": 65379, "epoch": 1556} {"train_loss": -6.000356674194336, "global_step": 65380, "epoch": 1556} {"train_loss": -6.049508094787598, "global_step": 65381, "epoch": 1556} {"train_loss": -5.970754146575928, "global_step": 65382, "epoch": 1556} {"train_loss": -5.8634209632873535, "global_step": 65383, "epoch": 1556} {"train_loss": -6.1013994216918945, "global_step": 65384, "epoch": 1556} {"train_loss": -5.9022698402404785, "global_step": 65385, "epoch": 1556} {"train_loss": -5.986818313598633, "global_step": 65386, "epoch": 1556} {"train_loss": -6.069328784942627, "global_step": 65387, "epoch": 1556} {"train_loss": -5.9972944259643555, "global_step": 65388, "epoch": 1556} {"train_loss": -5.936358451843262, "global_step": 65389, "epoch": 1556} {"train_loss": -5.970270156860352, "global_step": 65390, "epoch": 1556} {"train_loss": -6.037376403808594, "global_step": 65391, "epoch": 1556} {"train_loss": -5.974428176879883, "global_step": 65392, "epoch": 1556} {"train_loss": -5.943910655521211, "global_step": 65393, "epoch": 1556, "val_loss": 67251.15625} {"train_loss": -5.893063545227051, "global_step": 65394, "epoch": 1557} {"train_loss": -5.890435218811035, "global_step": 65395, "epoch": 1557} {"train_loss": -5.974143981933594, "global_step": 65396, "epoch": 1557} {"train_loss": -6.026736259460449, "global_step": 65397, "epoch": 1557} {"train_loss": -5.890627861022949, "global_step": 65398, "epoch": 1557} {"train_loss": -6.131568431854248, "global_step": 65399, "epoch": 1557} {"train_loss": -6.033483982086182, "global_step": 65400, "epoch": 1557} {"train_loss": -5.888792991638184, "global_step": 65401, "epoch": 1557} {"train_loss": -5.884888648986816, "global_step": 65402, "epoch": 1557} {"train_loss": -5.983370304107666, "global_step": 65403, "epoch": 1557} {"train_loss": -5.900568008422852, "global_step": 65404, "epoch": 1557} {"train_loss": -5.809844970703125, "global_step": 65405, "epoch": 1557} {"train_loss": -5.945778846740723, "global_step": 65406, "epoch": 1557} {"train_loss": -5.928433418273926, "global_step": 65407, "epoch": 1557} {"train_loss": -5.850135803222656, "global_step": 65408, "epoch": 1557} {"train_loss": -5.921348571777344, "global_step": 65409, "epoch": 1557} {"train_loss": -5.8909173011779785, "global_step": 65410, "epoch": 1557} {"train_loss": -5.829581260681152, "global_step": 65411, "epoch": 1557} {"train_loss": -5.9400787353515625, "global_step": 65412, "epoch": 1557} {"train_loss": -5.861081123352051, "global_step": 65413, "epoch": 1557} {"train_loss": -5.8896708488464355, "global_step": 65414, "epoch": 1557} {"train_loss": -5.930741786956787, "global_step": 65415, "epoch": 1557} {"train_loss": -5.845713138580322, "global_step": 65416, "epoch": 1557} {"train_loss": -5.948155403137207, "global_step": 65417, "epoch": 1557} {"train_loss": -5.9414496421813965, "global_step": 65418, "epoch": 1557} {"train_loss": -5.966856002807617, "global_step": 65419, "epoch": 1557} {"train_loss": -5.9913201332092285, "global_step": 65420, "epoch": 1557} {"train_loss": -5.880702018737793, "global_step": 65421, "epoch": 1557} {"train_loss": -5.9649810791015625, "global_step": 65422, "epoch": 1557} {"train_loss": -5.846375942230225, "global_step": 65423, "epoch": 1557} {"train_loss": -5.868097305297852, "global_step": 65424, "epoch": 1557} {"train_loss": -5.945525646209717, "global_step": 65425, "epoch": 1557} {"train_loss": -5.841670036315918, "global_step": 65426, "epoch": 1557} {"train_loss": -5.909680366516113, "global_step": 65427, "epoch": 1557} {"train_loss": -5.820003986358643, "global_step": 65428, "epoch": 1557} {"train_loss": -5.749583721160889, "global_step": 65429, "epoch": 1557} {"train_loss": -6.052193641662598, "global_step": 65430, "epoch": 1557} {"train_loss": -5.8047637939453125, "global_step": 65431, "epoch": 1557} {"train_loss": -5.9748711585998535, "global_step": 65432, "epoch": 1557} {"train_loss": -5.812586307525635, "global_step": 65433, "epoch": 1557} {"train_loss": -5.916792869567871, "global_step": 65434, "epoch": 1557} {"train_loss": -5.914910509472802, "global_step": 65435, "epoch": 1557, "val_loss": 67224.6171875} {"train_loss": -5.931729316711426, "global_step": 65436, "epoch": 1558} {"train_loss": -5.941570281982422, "global_step": 65437, "epoch": 1558} {"train_loss": -5.860405921936035, "global_step": 65438, "epoch": 1558} {"train_loss": -6.005132675170898, "global_step": 65439, "epoch": 1558} {"train_loss": -5.85737419128418, "global_step": 65440, "epoch": 1558} {"train_loss": -5.80082368850708, "global_step": 65441, "epoch": 1558} {"train_loss": -5.982266902923584, "global_step": 65442, "epoch": 1558} {"train_loss": -6.001474380493164, "global_step": 65443, "epoch": 1558} {"train_loss": -5.945408344268799, "global_step": 65444, "epoch": 1558} {"train_loss": -6.009427070617676, "global_step": 65445, "epoch": 1558} {"train_loss": -5.887815475463867, "global_step": 65446, "epoch": 1558} {"train_loss": -5.918391227722168, "global_step": 65447, "epoch": 1558} {"train_loss": -5.896640777587891, "global_step": 65448, "epoch": 1558} {"train_loss": -5.905981063842773, "global_step": 65449, "epoch": 1558} {"train_loss": -5.963983535766602, "global_step": 65450, "epoch": 1558} {"train_loss": -5.881673812866211, "global_step": 65451, "epoch": 1558} {"train_loss": -5.976747512817383, "global_step": 65452, "epoch": 1558} {"train_loss": -5.900813579559326, "global_step": 65453, "epoch": 1558} {"train_loss": -5.923943996429443, "global_step": 65454, "epoch": 1558} {"train_loss": -5.865083694458008, "global_step": 65455, "epoch": 1558} {"train_loss": -5.916921138763428, "global_step": 65456, "epoch": 1558} {"train_loss": -6.053138732910156, "global_step": 65457, "epoch": 1558} {"train_loss": -5.817237854003906, "global_step": 65458, "epoch": 1558} {"train_loss": -6.0075459480285645, "global_step": 65459, "epoch": 1558} {"train_loss": -6.024534225463867, "global_step": 65460, "epoch": 1558} {"train_loss": -5.940438747406006, "global_step": 65461, "epoch": 1558} {"train_loss": -6.001430511474609, "global_step": 65462, "epoch": 1558} {"train_loss": -5.9781904220581055, "global_step": 65463, "epoch": 1558} {"train_loss": -6.079165935516357, "global_step": 65464, "epoch": 1558} {"train_loss": -5.982413291931152, "global_step": 65465, "epoch": 1558} {"train_loss": -5.937399864196777, "global_step": 65466, "epoch": 1558} {"train_loss": -6.001755237579346, "global_step": 65467, "epoch": 1558} {"train_loss": -6.182587146759033, "global_step": 65468, "epoch": 1558} {"train_loss": -5.901867866516113, "global_step": 65469, "epoch": 1558} {"train_loss": -5.947721481323242, "global_step": 65470, "epoch": 1558} {"train_loss": -5.967144966125488, "global_step": 65471, "epoch": 1558} {"train_loss": -5.836423873901367, "global_step": 65472, "epoch": 1558} {"train_loss": -5.949251174926758, "global_step": 65473, "epoch": 1558} {"train_loss": -6.00050163269043, "global_step": 65474, "epoch": 1558} {"train_loss": -5.810451507568359, "global_step": 65475, "epoch": 1558} {"train_loss": -6.018279075622559, "global_step": 65476, "epoch": 1558} {"train_loss": -5.9469032174065, "global_step": 65477, "epoch": 1558, "val_loss": 67239.2734375} {"train_loss": -5.859872817993164, "global_step": 65478, "epoch": 1559} {"train_loss": -5.931061744689941, "global_step": 65479, "epoch": 1559} {"train_loss": -6.104334831237793, "global_step": 65480, "epoch": 1559} {"train_loss": -5.92668342590332, "global_step": 65481, "epoch": 1559} {"train_loss": -6.021059989929199, "global_step": 65482, "epoch": 1559} {"train_loss": -6.008578300476074, "global_step": 65483, "epoch": 1559} {"train_loss": -6.071715831756592, "global_step": 65484, "epoch": 1559} {"train_loss": -6.000344753265381, "global_step": 65485, "epoch": 1559} {"train_loss": -5.889571666717529, "global_step": 65486, "epoch": 1559} {"train_loss": -5.932173728942871, "global_step": 65487, "epoch": 1559} {"train_loss": -5.9261064529418945, "global_step": 65488, "epoch": 1559} {"train_loss": -5.969648361206055, "global_step": 65489, "epoch": 1559} {"train_loss": -5.923176288604736, "global_step": 65490, "epoch": 1559} {"train_loss": -5.899074077606201, "global_step": 65491, "epoch": 1559} {"train_loss": -5.941266059875488, "global_step": 65492, "epoch": 1559} {"train_loss": -6.020939826965332, "global_step": 65493, "epoch": 1559} {"train_loss": -6.090380668640137, "global_step": 65494, "epoch": 1559} {"train_loss": -5.959376811981201, "global_step": 65495, "epoch": 1559} {"train_loss": -5.9345808029174805, "global_step": 65496, "epoch": 1559} {"train_loss": -5.964005470275879, "global_step": 65497, "epoch": 1559} {"train_loss": -5.932796478271484, "global_step": 65498, "epoch": 1559} {"train_loss": -5.8612141609191895, "global_step": 65499, "epoch": 1559} {"train_loss": -5.863990306854248, "global_step": 65500, "epoch": 1559} {"train_loss": -5.8439741134643555, "global_step": 65501, "epoch": 1559} {"train_loss": -6.082573413848877, "global_step": 65502, "epoch": 1559} {"train_loss": -5.997924327850342, "global_step": 65503, "epoch": 1559} {"train_loss": -5.8631086349487305, "global_step": 65504, "epoch": 1559} {"train_loss": -5.860753536224365, "global_step": 65505, "epoch": 1559} {"train_loss": -5.975737571716309, "global_step": 65506, "epoch": 1559} {"train_loss": -5.927841663360596, "global_step": 65507, "epoch": 1559} {"train_loss": -5.9164814949035645, "global_step": 65508, "epoch": 1559} {"train_loss": -5.807374477386475, "global_step": 65509, "epoch": 1559} {"train_loss": -5.874668598175049, "global_step": 65510, "epoch": 1559} {"train_loss": -5.971033573150635, "global_step": 65511, "epoch": 1559} {"train_loss": -5.958446502685547, "global_step": 65512, "epoch": 1559} {"train_loss": -5.9007248878479, "global_step": 65513, "epoch": 1559} {"train_loss": -5.955265045166016, "global_step": 65514, "epoch": 1559} {"train_loss": -6.043549537658691, "global_step": 65515, "epoch": 1559} {"train_loss": -5.9171247482299805, "global_step": 65516, "epoch": 1559} {"train_loss": -5.878542900085449, "global_step": 65517, "epoch": 1559} {"train_loss": -6.123332977294922, "global_step": 65518, "epoch": 1559} {"train_loss": -5.948421330679031, "global_step": 65519, "epoch": 1559, "val_loss": 67371.953125} {"train_loss": -6.016478538513184, "global_step": 65520, "epoch": 1560} {"train_loss": -5.829104900360107, "global_step": 65521, "epoch": 1560} {"train_loss": -5.905206680297852, "global_step": 65522, "epoch": 1560} {"train_loss": -5.976827621459961, "global_step": 65523, "epoch": 1560} {"train_loss": -5.897319793701172, "global_step": 65524, "epoch": 1560} {"train_loss": -5.936321258544922, "global_step": 65525, "epoch": 1560} {"train_loss": -5.970186233520508, "global_step": 65526, "epoch": 1560} {"train_loss": -6.032075881958008, "global_step": 65527, "epoch": 1560} {"train_loss": -6.007403373718262, "global_step": 65528, "epoch": 1560} {"train_loss": -5.849782466888428, "global_step": 65529, "epoch": 1560} {"train_loss": -5.966394901275635, "global_step": 65530, "epoch": 1560} {"train_loss": -5.887618064880371, "global_step": 65531, "epoch": 1560} {"train_loss": -5.984015464782715, "global_step": 65532, "epoch": 1560} {"train_loss": -5.892544269561768, "global_step": 65533, "epoch": 1560} {"train_loss": -5.995489597320557, "global_step": 65534, "epoch": 1560} {"train_loss": -5.967485427856445, "global_step": 65535, "epoch": 1560} {"train_loss": -5.956345558166504, "global_step": 65536, "epoch": 1560} {"train_loss": -5.98166561126709, "global_step": 65537, "epoch": 1560} {"train_loss": -5.985801696777344, "global_step": 65538, "epoch": 1560} {"train_loss": -6.037022590637207, "global_step": 65539, "epoch": 1560} {"train_loss": -5.930938720703125, "global_step": 65540, "epoch": 1560} {"train_loss": -5.974910736083984, "global_step": 65541, "epoch": 1560} {"train_loss": -6.0419769287109375, "global_step": 65542, "epoch": 1560} {"train_loss": -5.941167831420898, "global_step": 65543, "epoch": 1560} {"train_loss": -6.04768705368042, "global_step": 65544, "epoch": 1560} {"train_loss": -5.915408611297607, "global_step": 65545, "epoch": 1560} {"train_loss": -5.973535537719727, "global_step": 65546, "epoch": 1560} {"train_loss": -5.9211554527282715, "global_step": 65547, "epoch": 1560} {"train_loss": -5.848228931427002, "global_step": 65548, "epoch": 1560} {"train_loss": -5.849423408508301, "global_step": 65549, "epoch": 1560} {"train_loss": -5.833639144897461, "global_step": 65550, "epoch": 1560} {"train_loss": -5.922843933105469, "global_step": 65551, "epoch": 1560} {"train_loss": -5.947963714599609, "global_step": 65552, "epoch": 1560} {"train_loss": -5.985653400421143, "global_step": 65553, "epoch": 1560} {"train_loss": -5.892693996429443, "global_step": 65554, "epoch": 1560} {"train_loss": -6.038801670074463, "global_step": 65555, "epoch": 1560} {"train_loss": -5.975909233093262, "global_step": 65556, "epoch": 1560} {"train_loss": -5.8706512451171875, "global_step": 65557, "epoch": 1560} {"train_loss": -5.816705703735352, "global_step": 65558, "epoch": 1560} {"train_loss": -5.98429012298584, "global_step": 65559, "epoch": 1560} {"train_loss": -5.97080659866333, "global_step": 65560, "epoch": 1560} {"train_loss": -5.945269096465338, "global_step": 65561, "epoch": 1560, "val_loss": 67164.203125} {"train_loss": -6.13316011428833, "global_step": 65562, "epoch": 1561} {"train_loss": -6.025677680969238, "global_step": 65563, "epoch": 1561} {"train_loss": -5.8339080810546875, "global_step": 65564, "epoch": 1561} {"train_loss": -6.143946647644043, "global_step": 65565, "epoch": 1561} {"train_loss": -5.934944152832031, "global_step": 65566, "epoch": 1561} {"train_loss": -6.028730869293213, "global_step": 65567, "epoch": 1561} {"train_loss": -5.941356182098389, "global_step": 65568, "epoch": 1561} {"train_loss": -6.012087821960449, "global_step": 65569, "epoch": 1561} {"train_loss": -5.9676432609558105, "global_step": 65570, "epoch": 1561} {"train_loss": -5.9115495681762695, "global_step": 65571, "epoch": 1561} {"train_loss": -6.001187324523926, "global_step": 65572, "epoch": 1561} {"train_loss": -5.948012828826904, "global_step": 65573, "epoch": 1561} {"train_loss": -5.937233924865723, "global_step": 65574, "epoch": 1561} {"train_loss": -5.782347679138184, "global_step": 65575, "epoch": 1561} {"train_loss": -5.9234209060668945, "global_step": 65576, "epoch": 1561} {"train_loss": -6.0829620361328125, "global_step": 65577, "epoch": 1561} {"train_loss": -5.993707180023193, "global_step": 65578, "epoch": 1561} {"train_loss": -5.922150611877441, "global_step": 65579, "epoch": 1561} {"train_loss": -5.971235275268555, "global_step": 65580, "epoch": 1561} {"train_loss": -5.995512962341309, "global_step": 65581, "epoch": 1561} {"train_loss": -5.962210178375244, "global_step": 65582, "epoch": 1561} {"train_loss": -5.935159683227539, "global_step": 65583, "epoch": 1561} {"train_loss": -6.090771675109863, "global_step": 65584, "epoch": 1561} {"train_loss": -5.941505432128906, "global_step": 65585, "epoch": 1561} {"train_loss": -6.034784317016602, "global_step": 65586, "epoch": 1561} {"train_loss": -5.799830436706543, "global_step": 65587, "epoch": 1561} {"train_loss": -5.962235450744629, "global_step": 65588, "epoch": 1561} {"train_loss": -5.906959533691406, "global_step": 65589, "epoch": 1561} {"train_loss": -5.8508477210998535, "global_step": 65590, "epoch": 1561} {"train_loss": -5.962314605712891, "global_step": 65591, "epoch": 1561} {"train_loss": -5.976790904998779, "global_step": 65592, "epoch": 1561} {"train_loss": -5.97834587097168, "global_step": 65593, "epoch": 1561} {"train_loss": -5.847755432128906, "global_step": 65594, "epoch": 1561} {"train_loss": -5.893118858337402, "global_step": 65595, "epoch": 1561} {"train_loss": -5.941701889038086, "global_step": 65596, "epoch": 1561} {"train_loss": -5.855632781982422, "global_step": 65597, "epoch": 1561} {"train_loss": -5.868767738342285, "global_step": 65598, "epoch": 1561} {"train_loss": -5.926050186157227, "global_step": 65599, "epoch": 1561} {"train_loss": -5.819027423858643, "global_step": 65600, "epoch": 1561} {"train_loss": -5.888669967651367, "global_step": 65601, "epoch": 1561} {"train_loss": -5.882590293884277, "global_step": 65602, "epoch": 1561} {"train_loss": -5.9439863704499745, "global_step": 65603, "epoch": 1561, "val_loss": 67194.421875} {"train_loss": -5.867092609405518, "global_step": 65604, "epoch": 1562} {"train_loss": -5.877758979797363, "global_step": 65605, "epoch": 1562} {"train_loss": -5.951620578765869, "global_step": 65606, "epoch": 1562} {"train_loss": -5.797804832458496, "global_step": 65607, "epoch": 1562} {"train_loss": -5.974183082580566, "global_step": 65608, "epoch": 1562} {"train_loss": -5.927810192108154, "global_step": 65609, "epoch": 1562} {"train_loss": -5.947334289550781, "global_step": 65610, "epoch": 1562} {"train_loss": -6.072465896606445, "global_step": 65611, "epoch": 1562} {"train_loss": -6.04247522354126, "global_step": 65612, "epoch": 1562} {"train_loss": -5.9818878173828125, "global_step": 65613, "epoch": 1562} {"train_loss": -5.881957530975342, "global_step": 65614, "epoch": 1562} {"train_loss": -5.913230895996094, "global_step": 65615, "epoch": 1562} {"train_loss": -5.840043544769287, "global_step": 65616, "epoch": 1562} {"train_loss": -5.901988983154297, "global_step": 65617, "epoch": 1562} {"train_loss": -5.994744777679443, "global_step": 65618, "epoch": 1562} {"train_loss": -6.041691303253174, "global_step": 65619, "epoch": 1562} {"train_loss": -6.06957483291626, "global_step": 65620, "epoch": 1562} {"train_loss": -5.849918842315674, "global_step": 65621, "epoch": 1562} {"train_loss": -6.0446672439575195, "global_step": 65622, "epoch": 1562} {"train_loss": -5.985461235046387, "global_step": 65623, "epoch": 1562} {"train_loss": -5.933422088623047, "global_step": 65624, "epoch": 1562} {"train_loss": -5.913783073425293, "global_step": 65625, "epoch": 1562} {"train_loss": -5.924046039581299, "global_step": 65626, "epoch": 1562} {"train_loss": -5.933860778808594, "global_step": 65627, "epoch": 1562} {"train_loss": -6.069212913513184, "global_step": 65628, "epoch": 1562} {"train_loss": -5.945533752441406, "global_step": 65629, "epoch": 1562} {"train_loss": -5.924046516418457, "global_step": 65630, "epoch": 1562} {"train_loss": -6.05802059173584, "global_step": 65631, "epoch": 1562} {"train_loss": -5.9294586181640625, "global_step": 65632, "epoch": 1562} {"train_loss": -5.878720760345459, "global_step": 65633, "epoch": 1562} {"train_loss": -5.848516464233398, "global_step": 65634, "epoch": 1562} {"train_loss": -5.968985557556152, "global_step": 65635, "epoch": 1562} {"train_loss": -5.9202775955200195, "global_step": 65636, "epoch": 1562} {"train_loss": -5.930677890777588, "global_step": 65637, "epoch": 1562} {"train_loss": -5.939122200012207, "global_step": 65638, "epoch": 1562} {"train_loss": -5.9317755699157715, "global_step": 65639, "epoch": 1562} {"train_loss": -6.102745532989502, "global_step": 65640, "epoch": 1562} {"train_loss": -6.00100040435791, "global_step": 65641, "epoch": 1562} {"train_loss": -5.833246231079102, "global_step": 65642, "epoch": 1562} {"train_loss": -6.04517936706543, "global_step": 65643, "epoch": 1562} {"train_loss": -5.99162483215332, "global_step": 65644, "epoch": 1562} {"train_loss": -5.949901353745234, "global_step": 65645, "epoch": 1562, "val_loss": 67209.71875} {"train_loss": -6.150371551513672, "global_step": 65646, "epoch": 1563} {"train_loss": -5.902158260345459, "global_step": 65647, "epoch": 1563} {"train_loss": -5.883686065673828, "global_step": 65648, "epoch": 1563} {"train_loss": -5.939168453216553, "global_step": 65649, "epoch": 1563} {"train_loss": -6.012273788452148, "global_step": 65650, "epoch": 1563} {"train_loss": -5.963720321655273, "global_step": 65651, "epoch": 1563} {"train_loss": -5.952672958374023, "global_step": 65652, "epoch": 1563} {"train_loss": -5.914804458618164, "global_step": 65653, "epoch": 1563} {"train_loss": -5.9172821044921875, "global_step": 65654, "epoch": 1563} {"train_loss": -5.800921440124512, "global_step": 65655, "epoch": 1563} {"train_loss": -5.883217811584473, "global_step": 65656, "epoch": 1563} {"train_loss": -5.889347076416016, "global_step": 65657, "epoch": 1563} {"train_loss": -5.983094215393066, "global_step": 65658, "epoch": 1563} {"train_loss": -5.957900047302246, "global_step": 65659, "epoch": 1563} {"train_loss": -6.027036666870117, "global_step": 65660, "epoch": 1563} {"train_loss": -5.881174087524414, "global_step": 65661, "epoch": 1563} {"train_loss": -5.919877052307129, "global_step": 65662, "epoch": 1563} {"train_loss": -5.977144718170166, "global_step": 65663, "epoch": 1563} {"train_loss": -5.9444804191589355, "global_step": 65664, "epoch": 1563} {"train_loss": -5.923670768737793, "global_step": 65665, "epoch": 1563} {"train_loss": -5.921391010284424, "global_step": 65666, "epoch": 1563} {"train_loss": -5.986414909362793, "global_step": 65667, "epoch": 1563} {"train_loss": -5.873589038848877, "global_step": 65668, "epoch": 1563} {"train_loss": -6.062438011169434, "global_step": 65669, "epoch": 1563} {"train_loss": -5.917520523071289, "global_step": 65670, "epoch": 1563} {"train_loss": -5.9989800453186035, "global_step": 65671, "epoch": 1563} {"train_loss": -6.041611671447754, "global_step": 65672, "epoch": 1563} {"train_loss": -5.899367332458496, "global_step": 65673, "epoch": 1563} {"train_loss": -5.8456830978393555, "global_step": 65674, "epoch": 1563} {"train_loss": -6.040998458862305, "global_step": 65675, "epoch": 1563} {"train_loss": -6.0275068283081055, "global_step": 65676, "epoch": 1563} {"train_loss": -5.952987194061279, "global_step": 65677, "epoch": 1563} {"train_loss": -5.9197587966918945, "global_step": 65678, "epoch": 1563} {"train_loss": -5.956338405609131, "global_step": 65679, "epoch": 1563} {"train_loss": -5.955228805541992, "global_step": 65680, "epoch": 1563} {"train_loss": -6.090324878692627, "global_step": 65681, "epoch": 1563} {"train_loss": -5.958507061004639, "global_step": 65682, "epoch": 1563} {"train_loss": -5.935361862182617, "global_step": 65683, "epoch": 1563} {"train_loss": -5.774713516235352, "global_step": 65684, "epoch": 1563} {"train_loss": -5.895629405975342, "global_step": 65685, "epoch": 1563} {"train_loss": -5.905663967132568, "global_step": 65686, "epoch": 1563} {"train_loss": -5.945567199162075, "global_step": 65687, "epoch": 1563, "val_loss": 67007.390625} {"train_loss": -5.931304931640625, "global_step": 65688, "epoch": 1564} {"train_loss": -5.972790241241455, "global_step": 65689, "epoch": 1564} {"train_loss": -6.0053510665893555, "global_step": 65690, "epoch": 1564} {"train_loss": -5.977287292480469, "global_step": 65691, "epoch": 1564} {"train_loss": -5.879085540771484, "global_step": 65692, "epoch": 1564} {"train_loss": -6.022870063781738, "global_step": 65693, "epoch": 1564} {"train_loss": -5.930230140686035, "global_step": 65694, "epoch": 1564} {"train_loss": -6.061506271362305, "global_step": 65695, "epoch": 1564} {"train_loss": -5.9282989501953125, "global_step": 65696, "epoch": 1564} {"train_loss": -5.974738121032715, "global_step": 65697, "epoch": 1564} {"train_loss": -5.988513946533203, "global_step": 65698, "epoch": 1564} {"train_loss": -5.9112935066223145, "global_step": 65699, "epoch": 1564} {"train_loss": -5.997799873352051, "global_step": 65700, "epoch": 1564} {"train_loss": -6.035343647003174, "global_step": 65701, "epoch": 1564} {"train_loss": -5.933500289916992, "global_step": 65702, "epoch": 1564} {"train_loss": -5.9156389236450195, "global_step": 65703, "epoch": 1564} {"train_loss": -6.137871742248535, "global_step": 65704, "epoch": 1564} {"train_loss": -5.990696907043457, "global_step": 65705, "epoch": 1564} {"train_loss": -5.947003364562988, "global_step": 65706, "epoch": 1564} {"train_loss": -6.047238349914551, "global_step": 65707, "epoch": 1564} {"train_loss": -5.8903961181640625, "global_step": 65708, "epoch": 1564} {"train_loss": -5.927988052368164, "global_step": 65709, "epoch": 1564} {"train_loss": -5.9498491287231445, "global_step": 65710, "epoch": 1564} {"train_loss": -5.904534816741943, "global_step": 65711, "epoch": 1564} {"train_loss": -5.866307735443115, "global_step": 65712, "epoch": 1564} {"train_loss": -5.894576072692871, "global_step": 65713, "epoch": 1564} {"train_loss": -5.981233596801758, "global_step": 65714, "epoch": 1564} {"train_loss": -5.950592041015625, "global_step": 65715, "epoch": 1564} {"train_loss": -6.018091201782227, "global_step": 65716, "epoch": 1564} {"train_loss": -5.915824890136719, "global_step": 65717, "epoch": 1564} {"train_loss": -5.976566314697266, "global_step": 65718, "epoch": 1564} {"train_loss": -6.0543646812438965, "global_step": 65719, "epoch": 1564} {"train_loss": -5.900612831115723, "global_step": 65720, "epoch": 1564} {"train_loss": -5.931278228759766, "global_step": 65721, "epoch": 1564} {"train_loss": -5.972165107727051, "global_step": 65722, "epoch": 1564} {"train_loss": -5.900754451751709, "global_step": 65723, "epoch": 1564} {"train_loss": -6.0325164794921875, "global_step": 65724, "epoch": 1564} {"train_loss": -6.004690170288086, "global_step": 65725, "epoch": 1564} {"train_loss": -6.043384075164795, "global_step": 65726, "epoch": 1564} {"train_loss": -5.937644004821777, "global_step": 65727, "epoch": 1564} {"train_loss": -5.919513702392578, "global_step": 65728, "epoch": 1564} {"train_loss": -5.962090094884236, "global_step": 65729, "epoch": 1564, "val_loss": 67110.359375} {"train_loss": -5.964433193206787, "global_step": 65730, "epoch": 1565} {"train_loss": -5.974928855895996, "global_step": 65731, "epoch": 1565} {"train_loss": -5.8213887214660645, "global_step": 65732, "epoch": 1565} {"train_loss": -5.864514350891113, "global_step": 65733, "epoch": 1565} {"train_loss": -5.915472507476807, "global_step": 65734, "epoch": 1565} {"train_loss": -5.962362289428711, "global_step": 65735, "epoch": 1565} {"train_loss": -5.969738006591797, "global_step": 65736, "epoch": 1565} {"train_loss": -5.946439743041992, "global_step": 65737, "epoch": 1565} {"train_loss": -5.869765758514404, "global_step": 65738, "epoch": 1565} {"train_loss": -5.997190475463867, "global_step": 65739, "epoch": 1565} {"train_loss": -5.878728866577148, "global_step": 65740, "epoch": 1565} {"train_loss": -6.067965507507324, "global_step": 65741, "epoch": 1565} {"train_loss": -5.879528999328613, "global_step": 65742, "epoch": 1565} {"train_loss": -5.905930042266846, "global_step": 65743, "epoch": 1565} {"train_loss": -5.8896894454956055, "global_step": 65744, "epoch": 1565} {"train_loss": -6.042001724243164, "global_step": 65745, "epoch": 1565} {"train_loss": -5.893361568450928, "global_step": 65746, "epoch": 1565} {"train_loss": -6.05169153213501, "global_step": 65747, "epoch": 1565} {"train_loss": -6.094645977020264, "global_step": 65748, "epoch": 1565} {"train_loss": -5.898124694824219, "global_step": 65749, "epoch": 1565} {"train_loss": -5.974724292755127, "global_step": 65750, "epoch": 1565} {"train_loss": -5.89052677154541, "global_step": 65751, "epoch": 1565} {"train_loss": -5.9917497634887695, "global_step": 65752, "epoch": 1565} {"train_loss": -5.964754104614258, "global_step": 65753, "epoch": 1565} {"train_loss": -5.927820682525635, "global_step": 65754, "epoch": 1565} {"train_loss": -5.9722442626953125, "global_step": 65755, "epoch": 1565} {"train_loss": -5.876607418060303, "global_step": 65756, "epoch": 1565} {"train_loss": -6.02886438369751, "global_step": 65757, "epoch": 1565} {"train_loss": -5.984555244445801, "global_step": 65758, "epoch": 1565} {"train_loss": -6.07831335067749, "global_step": 65759, "epoch": 1565} {"train_loss": -6.019546985626221, "global_step": 65760, "epoch": 1565} {"train_loss": -5.955662727355957, "global_step": 65761, "epoch": 1565} {"train_loss": -5.958853244781494, "global_step": 65762, "epoch": 1565} {"train_loss": -5.855408191680908, "global_step": 65763, "epoch": 1565} {"train_loss": -6.115816116333008, "global_step": 65764, "epoch": 1565} {"train_loss": -5.955683708190918, "global_step": 65765, "epoch": 1565} {"train_loss": -5.954873561859131, "global_step": 65766, "epoch": 1565} {"train_loss": -6.099671840667725, "global_step": 65767, "epoch": 1565} {"train_loss": -5.96920919418335, "global_step": 65768, "epoch": 1565} {"train_loss": -5.998161792755127, "global_step": 65769, "epoch": 1565} {"train_loss": -5.944723129272461, "global_step": 65770, "epoch": 1565} {"train_loss": -5.956701108387539, "global_step": 65771, "epoch": 1565, "val_loss": 66968.6875} {"train_loss": -5.991938591003418, "global_step": 65772, "epoch": 1566} {"train_loss": -6.008955001831055, "global_step": 65773, "epoch": 1566} {"train_loss": -5.995887756347656, "global_step": 65774, "epoch": 1566} {"train_loss": -5.901946544647217, "global_step": 65775, "epoch": 1566} {"train_loss": -5.911667823791504, "global_step": 65776, "epoch": 1566} {"train_loss": -5.947264671325684, "global_step": 65777, "epoch": 1566} {"train_loss": -5.951816558837891, "global_step": 65778, "epoch": 1566} {"train_loss": -5.94400691986084, "global_step": 65779, "epoch": 1566} {"train_loss": -5.920124053955078, "global_step": 65780, "epoch": 1566} {"train_loss": -5.851849555969238, "global_step": 65781, "epoch": 1566} {"train_loss": -6.037260055541992, "global_step": 65782, "epoch": 1566} {"train_loss": -5.975917816162109, "global_step": 65783, "epoch": 1566} {"train_loss": -5.973110675811768, "global_step": 65784, "epoch": 1566} {"train_loss": -5.89317512512207, "global_step": 65785, "epoch": 1566} {"train_loss": -6.006891250610352, "global_step": 65786, "epoch": 1566} {"train_loss": -5.889459609985352, "global_step": 65787, "epoch": 1566} {"train_loss": -6.002743721008301, "global_step": 65788, "epoch": 1566} {"train_loss": -6.009203910827637, "global_step": 65789, "epoch": 1566} {"train_loss": -5.889184951782227, "global_step": 65790, "epoch": 1566} {"train_loss": -5.845905303955078, "global_step": 65791, "epoch": 1566} {"train_loss": -5.935098648071289, "global_step": 65792, "epoch": 1566} {"train_loss": -5.865556716918945, "global_step": 65793, "epoch": 1566} {"train_loss": -6.0891265869140625, "global_step": 65794, "epoch": 1566} {"train_loss": -5.954153060913086, "global_step": 65795, "epoch": 1566} {"train_loss": -6.032222270965576, "global_step": 65796, "epoch": 1566} {"train_loss": -5.990121841430664, "global_step": 65797, "epoch": 1566} {"train_loss": -5.894728660583496, "global_step": 65798, "epoch": 1566} {"train_loss": -5.91990852355957, "global_step": 65799, "epoch": 1566} {"train_loss": -5.895173072814941, "global_step": 65800, "epoch": 1566} {"train_loss": -6.020560264587402, "global_step": 65801, "epoch": 1566} {"train_loss": -5.955694198608398, "global_step": 65802, "epoch": 1566} {"train_loss": -5.909562110900879, "global_step": 65803, "epoch": 1566} {"train_loss": -5.995595932006836, "global_step": 65804, "epoch": 1566} {"train_loss": -5.898347854614258, "global_step": 65805, "epoch": 1566} {"train_loss": -5.961102485656738, "global_step": 65806, "epoch": 1566} {"train_loss": -5.8275251388549805, "global_step": 65807, "epoch": 1566} {"train_loss": -5.900251388549805, "global_step": 65808, "epoch": 1566} {"train_loss": -5.958128929138184, "global_step": 65809, "epoch": 1566} {"train_loss": -5.855781555175781, "global_step": 65810, "epoch": 1566} {"train_loss": -6.048056602478027, "global_step": 65811, "epoch": 1566} {"train_loss": -5.841102123260498, "global_step": 65812, "epoch": 1566} {"train_loss": -5.943163996651059, "global_step": 65813, "epoch": 1566, "val_loss": 67146.7109375} {"train_loss": -5.933896541595459, "global_step": 65814, "epoch": 1567} {"train_loss": -5.995960712432861, "global_step": 65815, "epoch": 1567} {"train_loss": -6.07608699798584, "global_step": 65816, "epoch": 1567} {"train_loss": -5.987949371337891, "global_step": 65817, "epoch": 1567} {"train_loss": -5.928831577301025, "global_step": 65818, "epoch": 1567} {"train_loss": -5.936006546020508, "global_step": 65819, "epoch": 1567} {"train_loss": -5.9151082038879395, "global_step": 65820, "epoch": 1567} {"train_loss": -5.905893325805664, "global_step": 65821, "epoch": 1567} {"train_loss": -5.934475898742676, "global_step": 65822, "epoch": 1567} {"train_loss": -6.1475138664245605, "global_step": 65823, "epoch": 1567} {"train_loss": -5.879176139831543, "global_step": 65824, "epoch": 1567} {"train_loss": -5.926553726196289, "global_step": 65825, "epoch": 1567} {"train_loss": -6.040964603424072, "global_step": 65826, "epoch": 1567} {"train_loss": -5.978592872619629, "global_step": 65827, "epoch": 1567} {"train_loss": -6.000161170959473, "global_step": 65828, "epoch": 1567} {"train_loss": -5.913103103637695, "global_step": 65829, "epoch": 1567} {"train_loss": -5.768850326538086, "global_step": 65830, "epoch": 1567} {"train_loss": -5.923211574554443, "global_step": 65831, "epoch": 1567} {"train_loss": -5.788647651672363, "global_step": 65832, "epoch": 1567} {"train_loss": -5.784393310546875, "global_step": 65833, "epoch": 1567} {"train_loss": -5.9249420166015625, "global_step": 65834, "epoch": 1567} {"train_loss": -5.84305477142334, "global_step": 65835, "epoch": 1567} {"train_loss": -5.999268531799316, "global_step": 65836, "epoch": 1567} {"train_loss": -5.906508922576904, "global_step": 65837, "epoch": 1567} {"train_loss": -5.887979507446289, "global_step": 65838, "epoch": 1567} {"train_loss": -5.892586708068848, "global_step": 65839, "epoch": 1567} {"train_loss": -5.922139644622803, "global_step": 65840, "epoch": 1567} {"train_loss": -5.90926456451416, "global_step": 65841, "epoch": 1567} {"train_loss": -5.924520015716553, "global_step": 65842, "epoch": 1567} {"train_loss": -5.961618423461914, "global_step": 65843, "epoch": 1567} {"train_loss": -5.743241310119629, "global_step": 65844, "epoch": 1567} {"train_loss": -5.955167770385742, "global_step": 65845, "epoch": 1567} {"train_loss": -5.812607765197754, "global_step": 65846, "epoch": 1567} {"train_loss": -5.897552490234375, "global_step": 65847, "epoch": 1567} {"train_loss": -5.995824337005615, "global_step": 65848, "epoch": 1567} {"train_loss": -5.981827259063721, "global_step": 65849, "epoch": 1567} {"train_loss": -5.935070037841797, "global_step": 65850, "epoch": 1567} {"train_loss": -5.999027252197266, "global_step": 65851, "epoch": 1567} {"train_loss": -5.929841041564941, "global_step": 65852, "epoch": 1567} {"train_loss": -5.960357666015625, "global_step": 65853, "epoch": 1567} {"train_loss": -5.944405555725098, "global_step": 65854, "epoch": 1567} {"train_loss": -5.928186938876197, "global_step": 65855, "epoch": 1567, "val_loss": 67117.421875} {"train_loss": -6.01917839050293, "global_step": 65856, "epoch": 1568} {"train_loss": -6.008805274963379, "global_step": 65857, "epoch": 1568} {"train_loss": -5.974565505981445, "global_step": 65858, "epoch": 1568} {"train_loss": -5.977158546447754, "global_step": 65859, "epoch": 1568} {"train_loss": -5.9396867752075195, "global_step": 65860, "epoch": 1568} {"train_loss": -5.941229820251465, "global_step": 65861, "epoch": 1568} {"train_loss": -5.877072334289551, "global_step": 65862, "epoch": 1568} {"train_loss": -6.048252105712891, "global_step": 65863, "epoch": 1568} {"train_loss": -5.88021183013916, "global_step": 65864, "epoch": 1568} {"train_loss": -5.975562572479248, "global_step": 65865, "epoch": 1568} {"train_loss": -6.081012725830078, "global_step": 65866, "epoch": 1568} {"train_loss": -5.936589241027832, "global_step": 65867, "epoch": 1568} {"train_loss": -5.997708320617676, "global_step": 65868, "epoch": 1568} {"train_loss": -5.889998435974121, "global_step": 65869, "epoch": 1568} {"train_loss": -5.847440719604492, "global_step": 65870, "epoch": 1568} {"train_loss": -5.830178260803223, "global_step": 65871, "epoch": 1568} {"train_loss": -6.013400554656982, "global_step": 65872, "epoch": 1568} {"train_loss": -5.7821044921875, "global_step": 65873, "epoch": 1568} {"train_loss": -6.035319805145264, "global_step": 65874, "epoch": 1568} {"train_loss": -5.852890968322754, "global_step": 65875, "epoch": 1568} {"train_loss": -5.868607997894287, "global_step": 65876, "epoch": 1568} {"train_loss": -5.94112491607666, "global_step": 65877, "epoch": 1568} {"train_loss": -5.904264450073242, "global_step": 65878, "epoch": 1568} {"train_loss": -5.926692962646484, "global_step": 65879, "epoch": 1568} {"train_loss": -5.872627258300781, "global_step": 65880, "epoch": 1568} {"train_loss": -5.926911354064941, "global_step": 65881, "epoch": 1568} {"train_loss": -5.88848876953125, "global_step": 65882, "epoch": 1568} {"train_loss": -5.824419975280762, "global_step": 65883, "epoch": 1568} {"train_loss": -5.989234447479248, "global_step": 65884, "epoch": 1568} {"train_loss": -6.016457557678223, "global_step": 65885, "epoch": 1568} {"train_loss": -5.889438629150391, "global_step": 65886, "epoch": 1568} {"train_loss": -5.894801139831543, "global_step": 65887, "epoch": 1568} {"train_loss": -5.915827751159668, "global_step": 65888, "epoch": 1568} {"train_loss": -5.964029312133789, "global_step": 65889, "epoch": 1568} {"train_loss": -5.90385627746582, "global_step": 65890, "epoch": 1568} {"train_loss": -5.834167957305908, "global_step": 65891, "epoch": 1568} {"train_loss": -5.8985090255737305, "global_step": 65892, "epoch": 1568} {"train_loss": -5.97251033782959, "global_step": 65893, "epoch": 1568} {"train_loss": -6.12363862991333, "global_step": 65894, "epoch": 1568} {"train_loss": -5.979467868804932, "global_step": 65895, "epoch": 1568} {"train_loss": -5.96506404876709, "global_step": 65896, "epoch": 1568} {"train_loss": -5.937634536198208, "global_step": 65897, "epoch": 1568, "val_loss": 67146.6875} {"train_loss": -5.987964630126953, "global_step": 65898, "epoch": 1569} {"train_loss": -5.961946964263916, "global_step": 65899, "epoch": 1569} {"train_loss": -5.95508337020874, "global_step": 65900, "epoch": 1569} {"train_loss": -6.022618293762207, "global_step": 65901, "epoch": 1569} {"train_loss": -6.002077102661133, "global_step": 65902, "epoch": 1569} {"train_loss": -5.868407726287842, "global_step": 65903, "epoch": 1569} {"train_loss": -5.965253829956055, "global_step": 65904, "epoch": 1569} {"train_loss": -6.047340393066406, "global_step": 65905, "epoch": 1569} {"train_loss": -6.006263732910156, "global_step": 65906, "epoch": 1569} {"train_loss": -5.965935707092285, "global_step": 65907, "epoch": 1569} {"train_loss": -5.957347869873047, "global_step": 65908, "epoch": 1569} {"train_loss": -5.9842000007629395, "global_step": 65909, "epoch": 1569} {"train_loss": -5.939972400665283, "global_step": 65910, "epoch": 1569} {"train_loss": -5.901656150817871, "global_step": 65911, "epoch": 1569} {"train_loss": -6.061426162719727, "global_step": 65912, "epoch": 1569} {"train_loss": -5.987461090087891, "global_step": 65913, "epoch": 1569} {"train_loss": -5.9032673835754395, "global_step": 65914, "epoch": 1569} {"train_loss": -6.0285749435424805, "global_step": 65915, "epoch": 1569} {"train_loss": -5.966646671295166, "global_step": 65916, "epoch": 1569} {"train_loss": -5.867549419403076, "global_step": 65917, "epoch": 1569} {"train_loss": -5.975984573364258, "global_step": 65918, "epoch": 1569} {"train_loss": -5.9521260261535645, "global_step": 65919, "epoch": 1569} {"train_loss": -5.935543537139893, "global_step": 65920, "epoch": 1569} {"train_loss": -5.985917091369629, "global_step": 65921, "epoch": 1569} {"train_loss": -5.884825706481934, "global_step": 65922, "epoch": 1569} {"train_loss": -5.92660665512085, "global_step": 65923, "epoch": 1569} {"train_loss": -6.022769927978516, "global_step": 65924, "epoch": 1569} {"train_loss": -5.9543609619140625, "global_step": 65925, "epoch": 1569} {"train_loss": -5.762722969055176, "global_step": 65926, "epoch": 1569} {"train_loss": -5.995567321777344, "global_step": 65927, "epoch": 1569} {"train_loss": -5.804089546203613, "global_step": 65928, "epoch": 1569} {"train_loss": -6.070899963378906, "global_step": 65929, "epoch": 1569} {"train_loss": -6.0243964195251465, "global_step": 65930, "epoch": 1569} {"train_loss": -6.022206783294678, "global_step": 65931, "epoch": 1569} {"train_loss": -5.929961204528809, "global_step": 65932, "epoch": 1569} {"train_loss": -5.865262985229492, "global_step": 65933, "epoch": 1569} {"train_loss": -5.910422325134277, "global_step": 65934, "epoch": 1569} {"train_loss": -5.999715805053711, "global_step": 65935, "epoch": 1569} {"train_loss": -5.882495880126953, "global_step": 65936, "epoch": 1569} {"train_loss": -5.821445465087891, "global_step": 65937, "epoch": 1569} {"train_loss": -5.828845500946045, "global_step": 65938, "epoch": 1569} {"train_loss": -5.950921421959286, "global_step": 65939, "epoch": 1569, "val_loss": 66988.8203125} {"train_loss": -5.961540222167969, "global_step": 65940, "epoch": 1570} {"train_loss": -5.955280303955078, "global_step": 65941, "epoch": 1570} {"train_loss": -5.984204292297363, "global_step": 65942, "epoch": 1570} {"train_loss": -6.084345817565918, "global_step": 65943, "epoch": 1570} {"train_loss": -5.862893581390381, "global_step": 65944, "epoch": 1570} {"train_loss": -6.028989791870117, "global_step": 65945, "epoch": 1570} {"train_loss": -6.033517837524414, "global_step": 65946, "epoch": 1570} {"train_loss": -5.884356498718262, "global_step": 65947, "epoch": 1570} {"train_loss": -6.036940574645996, "global_step": 65948, "epoch": 1570} {"train_loss": -5.8808064460754395, "global_step": 65949, "epoch": 1570} {"train_loss": -5.872868061065674, "global_step": 65950, "epoch": 1570} {"train_loss": -5.953704833984375, "global_step": 65951, "epoch": 1570} {"train_loss": -5.972209453582764, "global_step": 65952, "epoch": 1570} {"train_loss": -6.049533843994141, "global_step": 65953, "epoch": 1570} {"train_loss": -5.891567707061768, "global_step": 65954, "epoch": 1570} {"train_loss": -5.954690933227539, "global_step": 65955, "epoch": 1570} {"train_loss": -5.97053861618042, "global_step": 65956, "epoch": 1570} {"train_loss": -5.836669921875, "global_step": 65957, "epoch": 1570} {"train_loss": -5.980397701263428, "global_step": 65958, "epoch": 1570} {"train_loss": -5.861204147338867, "global_step": 65959, "epoch": 1570} {"train_loss": -5.907073497772217, "global_step": 65960, "epoch": 1570} {"train_loss": -6.015793323516846, "global_step": 65961, "epoch": 1570} {"train_loss": -5.863886833190918, "global_step": 65962, "epoch": 1570} {"train_loss": -5.919404029846191, "global_step": 65963, "epoch": 1570} {"train_loss": -5.928459167480469, "global_step": 65964, "epoch": 1570} {"train_loss": -5.843301773071289, "global_step": 65965, "epoch": 1570} {"train_loss": -5.989275932312012, "global_step": 65966, "epoch": 1570} {"train_loss": -5.987491130828857, "global_step": 65967, "epoch": 1570} {"train_loss": -5.91658878326416, "global_step": 65968, "epoch": 1570} {"train_loss": -5.941381454467773, "global_step": 65969, "epoch": 1570} {"train_loss": -6.05422306060791, "global_step": 65970, "epoch": 1570} {"train_loss": -5.928600311279297, "global_step": 65971, "epoch": 1570} {"train_loss": -5.972038745880127, "global_step": 65972, "epoch": 1570} {"train_loss": -5.888920307159424, "global_step": 65973, "epoch": 1570} {"train_loss": -5.816489219665527, "global_step": 65974, "epoch": 1570} {"train_loss": -6.1568169593811035, "global_step": 65975, "epoch": 1570} {"train_loss": -6.073666572570801, "global_step": 65976, "epoch": 1570} {"train_loss": -5.90120267868042, "global_step": 65977, "epoch": 1570} {"train_loss": -5.941674709320068, "global_step": 65978, "epoch": 1570} {"train_loss": -6.12080192565918, "global_step": 65979, "epoch": 1570} {"train_loss": -6.000199317932129, "global_step": 65980, "epoch": 1570} {"train_loss": -5.957357690447853, "global_step": 65981, "epoch": 1570, "val_loss": 66980.5546875} {"train_loss": -6.014348983764648, "global_step": 65982, "epoch": 1571} {"train_loss": -5.992835998535156, "global_step": 65983, "epoch": 1571} {"train_loss": -5.987706184387207, "global_step": 65984, "epoch": 1571} {"train_loss": -5.883807182312012, "global_step": 65985, "epoch": 1571} {"train_loss": -5.961266040802002, "global_step": 65986, "epoch": 1571} {"train_loss": -6.04762077331543, "global_step": 65987, "epoch": 1571} {"train_loss": -6.059508323669434, "global_step": 65988, "epoch": 1571} {"train_loss": -6.01162052154541, "global_step": 65989, "epoch": 1571} {"train_loss": -5.998550891876221, "global_step": 65990, "epoch": 1571} {"train_loss": -6.0334882736206055, "global_step": 65991, "epoch": 1571} {"train_loss": -6.051667213439941, "global_step": 65992, "epoch": 1571} {"train_loss": -6.0860443115234375, "global_step": 65993, "epoch": 1571} {"train_loss": -6.059610366821289, "global_step": 65994, "epoch": 1571} {"train_loss": -6.010551452636719, "global_step": 65995, "epoch": 1571} {"train_loss": -5.989483833312988, "global_step": 65996, "epoch": 1571} {"train_loss": -5.901546478271484, "global_step": 65997, "epoch": 1571} {"train_loss": -5.835311412811279, "global_step": 65998, "epoch": 1571} {"train_loss": -5.971652984619141, "global_step": 65999, "epoch": 1571} {"train_loss": -5.980621337890625, "global_step": 66000, "epoch": 1571} {"train_loss": -5.967777252197266, "global_step": 66001, "epoch": 1571} {"train_loss": -5.924661636352539, "global_step": 66002, "epoch": 1571} {"train_loss": -5.992305755615234, "global_step": 66003, "epoch": 1571} {"train_loss": -5.997282028198242, "global_step": 66004, "epoch": 1571} {"train_loss": -5.917726039886475, "global_step": 66005, "epoch": 1571} {"train_loss": -5.969395160675049, "global_step": 66006, "epoch": 1571} {"train_loss": -5.922735214233398, "global_step": 66007, "epoch": 1571} {"train_loss": -5.905306816101074, "global_step": 66008, "epoch": 1571} {"train_loss": -6.009171485900879, "global_step": 66009, "epoch": 1571} {"train_loss": -5.901574611663818, "global_step": 66010, "epoch": 1571} {"train_loss": -6.055028438568115, "global_step": 66011, "epoch": 1571} {"train_loss": -5.929736137390137, "global_step": 66012, "epoch": 1571} {"train_loss": -5.82778263092041, "global_step": 66013, "epoch": 1571} {"train_loss": -5.84375, "global_step": 66014, "epoch": 1571} {"train_loss": -5.966283798217773, "global_step": 66015, "epoch": 1571} {"train_loss": -5.886806488037109, "global_step": 66016, "epoch": 1571} {"train_loss": -5.856720924377441, "global_step": 66017, "epoch": 1571} {"train_loss": -5.85646915435791, "global_step": 66018, "epoch": 1571} {"train_loss": -5.877476215362549, "global_step": 66019, "epoch": 1571} {"train_loss": -6.001465320587158, "global_step": 66020, "epoch": 1571} {"train_loss": -5.897186279296875, "global_step": 66021, "epoch": 1571} {"train_loss": -5.936761856079102, "global_step": 66022, "epoch": 1571} {"train_loss": -5.958496161869594, "global_step": 66023, "epoch": 1571, "val_loss": 67223.703125} {"train_loss": -5.839413642883301, "global_step": 66024, "epoch": 1572} {"train_loss": -5.935530662536621, "global_step": 66025, "epoch": 1572} {"train_loss": -5.889304161071777, "global_step": 66026, "epoch": 1572} {"train_loss": -6.000863075256348, "global_step": 66027, "epoch": 1572} {"train_loss": -5.993570804595947, "global_step": 66028, "epoch": 1572} {"train_loss": -6.005835056304932, "global_step": 66029, "epoch": 1572} {"train_loss": -5.922064781188965, "global_step": 66030, "epoch": 1572} {"train_loss": -5.863738059997559, "global_step": 66031, "epoch": 1572} {"train_loss": -6.006499767303467, "global_step": 66032, "epoch": 1572} {"train_loss": -5.8115997314453125, "global_step": 66033, "epoch": 1572} {"train_loss": -5.926511764526367, "global_step": 66034, "epoch": 1572} {"train_loss": -5.961295127868652, "global_step": 66035, "epoch": 1572} {"train_loss": -5.991994857788086, "global_step": 66036, "epoch": 1572} {"train_loss": -6.0159807205200195, "global_step": 66037, "epoch": 1572} {"train_loss": -5.953949928283691, "global_step": 66038, "epoch": 1572} {"train_loss": -5.974732875823975, "global_step": 66039, "epoch": 1572} {"train_loss": -5.822201728820801, "global_step": 66040, "epoch": 1572} {"train_loss": -5.969124794006348, "global_step": 66041, "epoch": 1572} {"train_loss": -5.9310455322265625, "global_step": 66042, "epoch": 1572} {"train_loss": -5.92454719543457, "global_step": 66043, "epoch": 1572} {"train_loss": -6.019075870513916, "global_step": 66044, "epoch": 1572} {"train_loss": -6.016230583190918, "global_step": 66045, "epoch": 1572} {"train_loss": -5.895890235900879, "global_step": 66046, "epoch": 1572} {"train_loss": -5.934435844421387, "global_step": 66047, "epoch": 1572} {"train_loss": -5.873126029968262, "global_step": 66048, "epoch": 1572} {"train_loss": -5.910979747772217, "global_step": 66049, "epoch": 1572} {"train_loss": -5.990278244018555, "global_step": 66050, "epoch": 1572} {"train_loss": -5.90757942199707, "global_step": 66051, "epoch": 1572} {"train_loss": -6.061674118041992, "global_step": 66052, "epoch": 1572} {"train_loss": -5.922799587249756, "global_step": 66053, "epoch": 1572} {"train_loss": -5.920502662658691, "global_step": 66054, "epoch": 1572} {"train_loss": -5.98902702331543, "global_step": 66055, "epoch": 1572} {"train_loss": -5.858924865722656, "global_step": 66056, "epoch": 1572} {"train_loss": -5.835701942443848, "global_step": 66057, "epoch": 1572} {"train_loss": -5.926175594329834, "global_step": 66058, "epoch": 1572} {"train_loss": -5.816024303436279, "global_step": 66059, "epoch": 1572} {"train_loss": -5.788435935974121, "global_step": 66060, "epoch": 1572} {"train_loss": -5.988311290740967, "global_step": 66061, "epoch": 1572} {"train_loss": -5.733142375946045, "global_step": 66062, "epoch": 1572} {"train_loss": -6.034976959228516, "global_step": 66063, "epoch": 1572} {"train_loss": -5.648552894592285, "global_step": 66064, "epoch": 1572} {"train_loss": -5.923304603213356, "global_step": 66065, "epoch": 1572, "val_loss": 67429.6640625} {"train_loss": -5.811243057250977, "global_step": 66066, "epoch": 1573} {"train_loss": -5.9779181480407715, "global_step": 66067, "epoch": 1573} {"train_loss": -5.85612678527832, "global_step": 66068, "epoch": 1573} {"train_loss": -5.939113140106201, "global_step": 66069, "epoch": 1573} {"train_loss": -5.994076728820801, "global_step": 66070, "epoch": 1573} {"train_loss": -5.945102691650391, "global_step": 66071, "epoch": 1573} {"train_loss": -5.95680046081543, "global_step": 66072, "epoch": 1573} {"train_loss": -5.910529136657715, "global_step": 66073, "epoch": 1573} {"train_loss": -5.900503158569336, "global_step": 66074, "epoch": 1573} {"train_loss": -5.882243633270264, "global_step": 66075, "epoch": 1573} {"train_loss": -5.885989189147949, "global_step": 66076, "epoch": 1573} {"train_loss": -5.87822961807251, "global_step": 66077, "epoch": 1573} {"train_loss": -5.956353664398193, "global_step": 66078, "epoch": 1573} {"train_loss": -5.852384567260742, "global_step": 66079, "epoch": 1573} {"train_loss": -5.914475917816162, "global_step": 66080, "epoch": 1573} {"train_loss": -5.909323215484619, "global_step": 66081, "epoch": 1573} {"train_loss": -5.912380218505859, "global_step": 66082, "epoch": 1573} {"train_loss": -5.983274459838867, "global_step": 66083, "epoch": 1573} {"train_loss": -5.870966911315918, "global_step": 66084, "epoch": 1573} {"train_loss": -5.912208080291748, "global_step": 66085, "epoch": 1573} {"train_loss": -5.886193752288818, "global_step": 66086, "epoch": 1573} {"train_loss": -5.958216667175293, "global_step": 66087, "epoch": 1573} {"train_loss": -5.954554557800293, "global_step": 66088, "epoch": 1573} {"train_loss": -5.939499855041504, "global_step": 66089, "epoch": 1573} {"train_loss": -5.886453151702881, "global_step": 66090, "epoch": 1573} {"train_loss": -5.973620414733887, "global_step": 66091, "epoch": 1573} {"train_loss": -6.055477142333984, "global_step": 66092, "epoch": 1573} {"train_loss": -5.95974588394165, "global_step": 66093, "epoch": 1573} {"train_loss": -5.842011451721191, "global_step": 66094, "epoch": 1573} {"train_loss": -6.076667785644531, "global_step": 66095, "epoch": 1573} {"train_loss": -5.888429164886475, "global_step": 66096, "epoch": 1573} {"train_loss": -5.941601753234863, "global_step": 66097, "epoch": 1573} {"train_loss": -6.01020622253418, "global_step": 66098, "epoch": 1573} {"train_loss": -5.961761951446533, "global_step": 66099, "epoch": 1573} {"train_loss": -6.001553535461426, "global_step": 66100, "epoch": 1573} {"train_loss": -5.954606056213379, "global_step": 66101, "epoch": 1573} {"train_loss": -5.858160018920898, "global_step": 66102, "epoch": 1573} {"train_loss": -6.003396987915039, "global_step": 66103, "epoch": 1573} {"train_loss": -5.988770961761475, "global_step": 66104, "epoch": 1573} {"train_loss": -6.077602386474609, "global_step": 66105, "epoch": 1573} {"train_loss": -5.924497604370117, "global_step": 66106, "epoch": 1573} {"train_loss": -5.934473026366461, "global_step": 66107, "epoch": 1573, "val_loss": 67083.0859375} {"train_loss": -5.99905252456665, "global_step": 66108, "epoch": 1574} {"train_loss": -5.926885604858398, "global_step": 66109, "epoch": 1574} {"train_loss": -6.032503604888916, "global_step": 66110, "epoch": 1574} {"train_loss": -6.03116512298584, "global_step": 66111, "epoch": 1574} {"train_loss": -5.979398250579834, "global_step": 66112, "epoch": 1574} {"train_loss": -6.029956817626953, "global_step": 66113, "epoch": 1574} {"train_loss": -5.898658752441406, "global_step": 66114, "epoch": 1574} {"train_loss": -6.015407085418701, "global_step": 66115, "epoch": 1574} {"train_loss": -6.032548904418945, "global_step": 66116, "epoch": 1574} {"train_loss": -5.998335838317871, "global_step": 66117, "epoch": 1574} {"train_loss": -5.9376068115234375, "global_step": 66118, "epoch": 1574} {"train_loss": -5.764822006225586, "global_step": 66119, "epoch": 1574} {"train_loss": -5.914079666137695, "global_step": 66120, "epoch": 1574} {"train_loss": -5.988523006439209, "global_step": 66121, "epoch": 1574} {"train_loss": -5.9778008460998535, "global_step": 66122, "epoch": 1574} {"train_loss": -5.963592052459717, "global_step": 66123, "epoch": 1574} {"train_loss": -6.056281566619873, "global_step": 66124, "epoch": 1574} {"train_loss": -5.977085113525391, "global_step": 66125, "epoch": 1574} {"train_loss": -5.940938949584961, "global_step": 66126, "epoch": 1574} {"train_loss": -5.885249137878418, "global_step": 66127, "epoch": 1574} {"train_loss": -6.004892349243164, "global_step": 66128, "epoch": 1574} {"train_loss": -5.898371696472168, "global_step": 66129, "epoch": 1574} {"train_loss": -6.0378875732421875, "global_step": 66130, "epoch": 1574} {"train_loss": -6.019159317016602, "global_step": 66131, "epoch": 1574} {"train_loss": -6.050169944763184, "global_step": 66132, "epoch": 1574} {"train_loss": -6.0445356369018555, "global_step": 66133, "epoch": 1574} {"train_loss": -5.948215484619141, "global_step": 66134, "epoch": 1574} {"train_loss": -6.007625579833984, "global_step": 66135, "epoch": 1574} {"train_loss": -6.031023979187012, "global_step": 66136, "epoch": 1574} {"train_loss": -5.849852561950684, "global_step": 66137, "epoch": 1574} {"train_loss": -5.949952125549316, "global_step": 66138, "epoch": 1574} {"train_loss": -5.9890289306640625, "global_step": 66139, "epoch": 1574} {"train_loss": -6.027989387512207, "global_step": 66140, "epoch": 1574} {"train_loss": -5.942144870758057, "global_step": 66141, "epoch": 1574} {"train_loss": -5.952829360961914, "global_step": 66142, "epoch": 1574} {"train_loss": -5.887375831604004, "global_step": 66143, "epoch": 1574} {"train_loss": -5.962192535400391, "global_step": 66144, "epoch": 1574} {"train_loss": -5.930538177490234, "global_step": 66145, "epoch": 1574} {"train_loss": -5.9798583984375, "global_step": 66146, "epoch": 1574} {"train_loss": -5.956305503845215, "global_step": 66147, "epoch": 1574} {"train_loss": -5.998856067657471, "global_step": 66148, "epoch": 1574} {"train_loss": -5.971789484932309, "global_step": 66149, "epoch": 1574, "val_loss": 67154.484375} {"train_loss": -5.881982803344727, "global_step": 66150, "epoch": 1575} {"train_loss": -6.038907527923584, "global_step": 66151, "epoch": 1575} {"train_loss": -5.88222599029541, "global_step": 66152, "epoch": 1575} {"train_loss": -6.119722366333008, "global_step": 66153, "epoch": 1575} {"train_loss": -6.018763065338135, "global_step": 66154, "epoch": 1575} {"train_loss": -6.048224449157715, "global_step": 66155, "epoch": 1575} {"train_loss": -5.9786376953125, "global_step": 66156, "epoch": 1575} {"train_loss": -6.048659801483154, "global_step": 66157, "epoch": 1575} {"train_loss": -5.962933540344238, "global_step": 66158, "epoch": 1575} {"train_loss": -5.943116188049316, "global_step": 66159, "epoch": 1575} {"train_loss": -6.025017738342285, "global_step": 66160, "epoch": 1575} {"train_loss": -6.135256767272949, "global_step": 66161, "epoch": 1575} {"train_loss": -5.954999923706055, "global_step": 66162, "epoch": 1575} {"train_loss": -5.92943000793457, "global_step": 66163, "epoch": 1575} {"train_loss": -5.936056137084961, "global_step": 66164, "epoch": 1575} {"train_loss": -5.973391532897949, "global_step": 66165, "epoch": 1575} {"train_loss": -6.014779090881348, "global_step": 66166, "epoch": 1575} {"train_loss": -5.9040727615356445, "global_step": 66167, "epoch": 1575} {"train_loss": -5.9891533851623535, "global_step": 66168, "epoch": 1575} {"train_loss": -6.023684501647949, "global_step": 66169, "epoch": 1575} {"train_loss": -5.964703559875488, "global_step": 66170, "epoch": 1575} {"train_loss": -6.002850532531738, "global_step": 66171, "epoch": 1575} {"train_loss": -6.048238754272461, "global_step": 66172, "epoch": 1575} {"train_loss": -5.971012115478516, "global_step": 66173, "epoch": 1575} {"train_loss": -5.891142845153809, "global_step": 66174, "epoch": 1575} {"train_loss": -6.0804829597473145, "global_step": 66175, "epoch": 1575} {"train_loss": -5.983750343322754, "global_step": 66176, "epoch": 1575} {"train_loss": -5.987310409545898, "global_step": 66177, "epoch": 1575} {"train_loss": -6.009634017944336, "global_step": 66178, "epoch": 1575} {"train_loss": -5.97619104385376, "global_step": 66179, "epoch": 1575} {"train_loss": -6.014556884765625, "global_step": 66180, "epoch": 1575} {"train_loss": -6.143713474273682, "global_step": 66181, "epoch": 1575} {"train_loss": -5.923086166381836, "global_step": 66182, "epoch": 1575} {"train_loss": -5.862831115722656, "global_step": 66183, "epoch": 1575} {"train_loss": -5.874448776245117, "global_step": 66184, "epoch": 1575} {"train_loss": -5.947948932647705, "global_step": 66185, "epoch": 1575} {"train_loss": -5.98790979385376, "global_step": 66186, "epoch": 1575} {"train_loss": -5.940953254699707, "global_step": 66187, "epoch": 1575} {"train_loss": -5.853384971618652, "global_step": 66188, "epoch": 1575} {"train_loss": -5.888556957244873, "global_step": 66189, "epoch": 1575} {"train_loss": -5.970770359039307, "global_step": 66190, "epoch": 1575} {"train_loss": -5.976826088769095, "global_step": 66191, "epoch": 1575, "val_loss": 66900.78125} {"train_loss": -6.0638227462768555, "global_step": 66192, "epoch": 1576} {"train_loss": -5.99610710144043, "global_step": 66193, "epoch": 1576} {"train_loss": -6.038599014282227, "global_step": 66194, "epoch": 1576} {"train_loss": -5.9431257247924805, "global_step": 66195, "epoch": 1576} {"train_loss": -5.820161819458008, "global_step": 66196, "epoch": 1576} {"train_loss": -6.089564323425293, "global_step": 66197, "epoch": 1576} {"train_loss": -6.015803813934326, "global_step": 66198, "epoch": 1576} {"train_loss": -5.9671311378479, "global_step": 66199, "epoch": 1576} {"train_loss": -5.9808549880981445, "global_step": 66200, "epoch": 1576} {"train_loss": -5.8795342445373535, "global_step": 66201, "epoch": 1576} {"train_loss": -6.022839546203613, "global_step": 66202, "epoch": 1576} {"train_loss": -5.960238933563232, "global_step": 66203, "epoch": 1576} {"train_loss": -5.964744567871094, "global_step": 66204, "epoch": 1576} {"train_loss": -5.9686174392700195, "global_step": 66205, "epoch": 1576} {"train_loss": -5.965764999389648, "global_step": 66206, "epoch": 1576} {"train_loss": -5.876579284667969, "global_step": 66207, "epoch": 1576} {"train_loss": -6.119617462158203, "global_step": 66208, "epoch": 1576} {"train_loss": -6.044548511505127, "global_step": 66209, "epoch": 1576} {"train_loss": -6.064719200134277, "global_step": 66210, "epoch": 1576} {"train_loss": -5.960977554321289, "global_step": 66211, "epoch": 1576} {"train_loss": -6.0053863525390625, "global_step": 66212, "epoch": 1576} {"train_loss": -5.945416450500488, "global_step": 66213, "epoch": 1576} {"train_loss": -5.903818130493164, "global_step": 66214, "epoch": 1576} {"train_loss": -6.001096725463867, "global_step": 66215, "epoch": 1576} {"train_loss": -6.0200371742248535, "global_step": 66216, "epoch": 1576} {"train_loss": -5.934761047363281, "global_step": 66217, "epoch": 1576} {"train_loss": -5.934346675872803, "global_step": 66218, "epoch": 1576} {"train_loss": -6.012925148010254, "global_step": 66219, "epoch": 1576} {"train_loss": -5.876917839050293, "global_step": 66220, "epoch": 1576} {"train_loss": -5.960973262786865, "global_step": 66221, "epoch": 1576} {"train_loss": -6.023104667663574, "global_step": 66222, "epoch": 1576} {"train_loss": -5.959926605224609, "global_step": 66223, "epoch": 1576} {"train_loss": -5.9793596267700195, "global_step": 66224, "epoch": 1576} {"train_loss": -5.929609298706055, "global_step": 66225, "epoch": 1576} {"train_loss": -6.027055740356445, "global_step": 66226, "epoch": 1576} {"train_loss": -6.113656997680664, "global_step": 66227, "epoch": 1576} {"train_loss": -5.97279167175293, "global_step": 66228, "epoch": 1576} {"train_loss": -5.97955322265625, "global_step": 66229, "epoch": 1576} {"train_loss": -6.073589324951172, "global_step": 66230, "epoch": 1576} {"train_loss": -5.939080715179443, "global_step": 66231, "epoch": 1576} {"train_loss": -5.909989356994629, "global_step": 66232, "epoch": 1576} {"train_loss": -5.981539748963856, "global_step": 66233, "epoch": 1576, "val_loss": 67028.046875} {"train_loss": -5.939227104187012, "global_step": 66234, "epoch": 1577} {"train_loss": -5.917827129364014, "global_step": 66235, "epoch": 1577} {"train_loss": -5.996973037719727, "global_step": 66236, "epoch": 1577} {"train_loss": -5.840842247009277, "global_step": 66237, "epoch": 1577} {"train_loss": -5.941158294677734, "global_step": 66238, "epoch": 1577} {"train_loss": -5.940627098083496, "global_step": 66239, "epoch": 1577} {"train_loss": -5.987386703491211, "global_step": 66240, "epoch": 1577} {"train_loss": -6.0090413093566895, "global_step": 66241, "epoch": 1577} {"train_loss": -6.076997756958008, "global_step": 66242, "epoch": 1577} {"train_loss": -6.021107196807861, "global_step": 66243, "epoch": 1577} {"train_loss": -6.026419639587402, "global_step": 66244, "epoch": 1577} {"train_loss": -5.892911434173584, "global_step": 66245, "epoch": 1577} {"train_loss": -6.017985820770264, "global_step": 66246, "epoch": 1577} {"train_loss": -6.01949405670166, "global_step": 66247, "epoch": 1577} {"train_loss": -5.980104923248291, "global_step": 66248, "epoch": 1577} {"train_loss": -5.976287841796875, "global_step": 66249, "epoch": 1577} {"train_loss": -5.9787702560424805, "global_step": 66250, "epoch": 1577} {"train_loss": -5.961518287658691, "global_step": 66251, "epoch": 1577} {"train_loss": -5.867094993591309, "global_step": 66252, "epoch": 1577} {"train_loss": -6.059477806091309, "global_step": 66253, "epoch": 1577} {"train_loss": -5.9780988693237305, "global_step": 66254, "epoch": 1577} {"train_loss": -5.93364953994751, "global_step": 66255, "epoch": 1577} {"train_loss": -5.964012145996094, "global_step": 66256, "epoch": 1577} {"train_loss": -5.997659683227539, "global_step": 66257, "epoch": 1577} {"train_loss": -6.043978214263916, "global_step": 66258, "epoch": 1577} {"train_loss": -6.00723123550415, "global_step": 66259, "epoch": 1577} {"train_loss": -6.037344455718994, "global_step": 66260, "epoch": 1577} {"train_loss": -5.957137107849121, "global_step": 66261, "epoch": 1577} {"train_loss": -6.0620198249816895, "global_step": 66262, "epoch": 1577} {"train_loss": -5.929238319396973, "global_step": 66263, "epoch": 1577} {"train_loss": -5.990951061248779, "global_step": 66264, "epoch": 1577} {"train_loss": -6.030817031860352, "global_step": 66265, "epoch": 1577} {"train_loss": -5.970171928405762, "global_step": 66266, "epoch": 1577} {"train_loss": -5.924969673156738, "global_step": 66267, "epoch": 1577} {"train_loss": -5.866153717041016, "global_step": 66268, "epoch": 1577} {"train_loss": -5.839273452758789, "global_step": 66269, "epoch": 1577} {"train_loss": -5.950927734375, "global_step": 66270, "epoch": 1577} {"train_loss": -5.958832740783691, "global_step": 66271, "epoch": 1577} {"train_loss": -5.953108310699463, "global_step": 66272, "epoch": 1577} {"train_loss": -6.017644882202148, "global_step": 66273, "epoch": 1577} {"train_loss": -5.94520902633667, "global_step": 66274, "epoch": 1577} {"train_loss": -5.972259067353749, "global_step": 66275, "epoch": 1577, "val_loss": 67223.03125} {"train_loss": -6.142911911010742, "global_step": 66276, "epoch": 1578} {"train_loss": -5.916044235229492, "global_step": 66277, "epoch": 1578} {"train_loss": -6.033278942108154, "global_step": 66278, "epoch": 1578} {"train_loss": -5.869556427001953, "global_step": 66279, "epoch": 1578} {"train_loss": -5.867417335510254, "global_step": 66280, "epoch": 1578} {"train_loss": -5.892221927642822, "global_step": 66281, "epoch": 1578} {"train_loss": -5.980463027954102, "global_step": 66282, "epoch": 1578} {"train_loss": -5.923317909240723, "global_step": 66283, "epoch": 1578} {"train_loss": -5.927125453948975, "global_step": 66284, "epoch": 1578} {"train_loss": -5.950553894042969, "global_step": 66285, "epoch": 1578} {"train_loss": -5.97208309173584, "global_step": 66286, "epoch": 1578} {"train_loss": -5.988757133483887, "global_step": 66287, "epoch": 1578} {"train_loss": -5.98247766494751, "global_step": 66288, "epoch": 1578} {"train_loss": -5.923308849334717, "global_step": 66289, "epoch": 1578} {"train_loss": -5.844303131103516, "global_step": 66290, "epoch": 1578} {"train_loss": -5.8968281745910645, "global_step": 66291, "epoch": 1578} {"train_loss": -6.003136157989502, "global_step": 66292, "epoch": 1578} {"train_loss": -5.906393051147461, "global_step": 66293, "epoch": 1578} {"train_loss": -5.867866516113281, "global_step": 66294, "epoch": 1578} {"train_loss": -6.0562849044799805, "global_step": 66295, "epoch": 1578} {"train_loss": -6.075393199920654, "global_step": 66296, "epoch": 1578} {"train_loss": -6.0614237785339355, "global_step": 66297, "epoch": 1578} {"train_loss": -5.962621212005615, "global_step": 66298, "epoch": 1578} {"train_loss": -5.955254554748535, "global_step": 66299, "epoch": 1578} {"train_loss": -5.949031352996826, "global_step": 66300, "epoch": 1578} {"train_loss": -5.901065826416016, "global_step": 66301, "epoch": 1578} {"train_loss": -5.847076892852783, "global_step": 66302, "epoch": 1578} {"train_loss": -5.907916069030762, "global_step": 66303, "epoch": 1578} {"train_loss": -5.9472174644470215, "global_step": 66304, "epoch": 1578} {"train_loss": -5.944404602050781, "global_step": 66305, "epoch": 1578} {"train_loss": -5.940325736999512, "global_step": 66306, "epoch": 1578} {"train_loss": -5.905330657958984, "global_step": 66307, "epoch": 1578} {"train_loss": -5.905628681182861, "global_step": 66308, "epoch": 1578} {"train_loss": -5.9934892654418945, "global_step": 66309, "epoch": 1578} {"train_loss": -5.976226806640625, "global_step": 66310, "epoch": 1578} {"train_loss": -5.989962577819824, "global_step": 66311, "epoch": 1578} {"train_loss": -5.991085529327393, "global_step": 66312, "epoch": 1578} {"train_loss": -5.865148067474365, "global_step": 66313, "epoch": 1578} {"train_loss": -5.914084434509277, "global_step": 66314, "epoch": 1578} {"train_loss": -5.8929595947265625, "global_step": 66315, "epoch": 1578} {"train_loss": -6.00317907333374, "global_step": 66316, "epoch": 1578} {"train_loss": -5.950175103687105, "global_step": 66317, "epoch": 1578, "val_loss": 67396.546875} {"train_loss": -5.874743938446045, "global_step": 66318, "epoch": 1579} {"train_loss": -6.046343803405762, "global_step": 66319, "epoch": 1579} {"train_loss": -5.936608791351318, "global_step": 66320, "epoch": 1579} {"train_loss": -5.882907867431641, "global_step": 66321, "epoch": 1579} {"train_loss": -5.829709053039551, "global_step": 66322, "epoch": 1579} {"train_loss": -5.894660472869873, "global_step": 66323, "epoch": 1579} {"train_loss": -5.998559951782227, "global_step": 66324, "epoch": 1579} {"train_loss": -5.913259029388428, "global_step": 66325, "epoch": 1579} {"train_loss": -5.944280624389648, "global_step": 66326, "epoch": 1579} {"train_loss": -5.901647567749023, "global_step": 66327, "epoch": 1579} {"train_loss": -5.841646194458008, "global_step": 66328, "epoch": 1579} {"train_loss": -5.9116997718811035, "global_step": 66329, "epoch": 1579} {"train_loss": -5.911527633666992, "global_step": 66330, "epoch": 1579} {"train_loss": -5.978135585784912, "global_step": 66331, "epoch": 1579} {"train_loss": -5.935699939727783, "global_step": 66332, "epoch": 1579} {"train_loss": -5.917063236236572, "global_step": 66333, "epoch": 1579} {"train_loss": -5.9097747802734375, "global_step": 66334, "epoch": 1579} {"train_loss": -6.054686546325684, "global_step": 66335, "epoch": 1579} {"train_loss": -5.880335807800293, "global_step": 66336, "epoch": 1579} {"train_loss": -5.943045616149902, "global_step": 66337, "epoch": 1579} {"train_loss": -5.941091537475586, "global_step": 66338, "epoch": 1579} {"train_loss": -5.906896591186523, "global_step": 66339, "epoch": 1579} {"train_loss": -6.111120223999023, "global_step": 66340, "epoch": 1579} {"train_loss": -5.958040237426758, "global_step": 66341, "epoch": 1579} {"train_loss": -5.966769695281982, "global_step": 66342, "epoch": 1579} {"train_loss": -5.882232666015625, "global_step": 66343, "epoch": 1579} {"train_loss": -6.009910583496094, "global_step": 66344, "epoch": 1579} {"train_loss": -5.974961280822754, "global_step": 66345, "epoch": 1579} {"train_loss": -6.029176712036133, "global_step": 66346, "epoch": 1579} {"train_loss": -5.861673355102539, "global_step": 66347, "epoch": 1579} {"train_loss": -5.878541946411133, "global_step": 66348, "epoch": 1579} {"train_loss": -5.882137298583984, "global_step": 66349, "epoch": 1579} {"train_loss": -5.821804046630859, "global_step": 66350, "epoch": 1579} {"train_loss": -5.8384552001953125, "global_step": 66351, "epoch": 1579} {"train_loss": -6.053945064544678, "global_step": 66352, "epoch": 1579} {"train_loss": -6.025911331176758, "global_step": 66353, "epoch": 1579} {"train_loss": -6.03472375869751, "global_step": 66354, "epoch": 1579} {"train_loss": -5.901572227478027, "global_step": 66355, "epoch": 1579} {"train_loss": -5.964452743530273, "global_step": 66356, "epoch": 1579} {"train_loss": -5.87873649597168, "global_step": 66357, "epoch": 1579} {"train_loss": -6.020940780639648, "global_step": 66358, "epoch": 1579} {"train_loss": -5.937008539835612, "global_step": 66359, "epoch": 1579, "val_loss": 67379.8046875} {"train_loss": -5.982574462890625, "global_step": 66360, "epoch": 1580} {"train_loss": -5.98018741607666, "global_step": 66361, "epoch": 1580} {"train_loss": -5.879312515258789, "global_step": 66362, "epoch": 1580} {"train_loss": -5.9285173416137695, "global_step": 66363, "epoch": 1580} {"train_loss": -5.925225257873535, "global_step": 66364, "epoch": 1580} {"train_loss": -6.016246795654297, "global_step": 66365, "epoch": 1580} {"train_loss": -6.039431095123291, "global_step": 66366, "epoch": 1580} {"train_loss": -5.955288887023926, "global_step": 66367, "epoch": 1580} {"train_loss": -5.846226215362549, "global_step": 66368, "epoch": 1580} {"train_loss": -5.928938865661621, "global_step": 66369, "epoch": 1580} {"train_loss": -5.8303728103637695, "global_step": 66370, "epoch": 1580} {"train_loss": -5.99357795715332, "global_step": 66371, "epoch": 1580} {"train_loss": -6.022286415100098, "global_step": 66372, "epoch": 1580} {"train_loss": -5.951103687286377, "global_step": 66373, "epoch": 1580} {"train_loss": -5.967019081115723, "global_step": 66374, "epoch": 1580} {"train_loss": -5.946976661682129, "global_step": 66375, "epoch": 1580} {"train_loss": -5.912771224975586, "global_step": 66376, "epoch": 1580} {"train_loss": -5.9123992919921875, "global_step": 66377, "epoch": 1580} {"train_loss": -5.880131244659424, "global_step": 66378, "epoch": 1580} {"train_loss": -5.921934127807617, "global_step": 66379, "epoch": 1580} {"train_loss": -5.917509078979492, "global_step": 66380, "epoch": 1580} {"train_loss": -5.8715691566467285, "global_step": 66381, "epoch": 1580} {"train_loss": -6.010223388671875, "global_step": 66382, "epoch": 1580} {"train_loss": -5.893216133117676, "global_step": 66383, "epoch": 1580} {"train_loss": -5.968708515167236, "global_step": 66384, "epoch": 1580} {"train_loss": -6.010739326477051, "global_step": 66385, "epoch": 1580} {"train_loss": -6.0954389572143555, "global_step": 66386, "epoch": 1580} {"train_loss": -5.92458438873291, "global_step": 66387, "epoch": 1580} {"train_loss": -5.950702667236328, "global_step": 66388, "epoch": 1580} {"train_loss": -6.096850395202637, "global_step": 66389, "epoch": 1580} {"train_loss": -5.958049774169922, "global_step": 66390, "epoch": 1580} {"train_loss": -5.8997955322265625, "global_step": 66391, "epoch": 1580} {"train_loss": -5.84255313873291, "global_step": 66392, "epoch": 1580} {"train_loss": -5.756546974182129, "global_step": 66393, "epoch": 1580} {"train_loss": -6.0299482345581055, "global_step": 66394, "epoch": 1580} {"train_loss": -5.943169116973877, "global_step": 66395, "epoch": 1580} {"train_loss": -5.863917350769043, "global_step": 66396, "epoch": 1580} {"train_loss": -5.8479413986206055, "global_step": 66397, "epoch": 1580} {"train_loss": -5.912432670593262, "global_step": 66398, "epoch": 1580} {"train_loss": -5.901565074920654, "global_step": 66399, "epoch": 1580} {"train_loss": -6.005661487579346, "global_step": 66400, "epoch": 1580} {"train_loss": -5.940704765773955, "global_step": 66401, "epoch": 1580, "val_loss": 67266.1796875} {"train_loss": -5.942534446716309, "global_step": 66402, "epoch": 1581} {"train_loss": -5.938352108001709, "global_step": 66403, "epoch": 1581} {"train_loss": -5.908632278442383, "global_step": 66404, "epoch": 1581} {"train_loss": -5.974358081817627, "global_step": 66405, "epoch": 1581} {"train_loss": -5.9599609375, "global_step": 66406, "epoch": 1581} {"train_loss": -5.981771469116211, "global_step": 66407, "epoch": 1581} {"train_loss": -5.948206901550293, "global_step": 66408, "epoch": 1581} {"train_loss": -5.843493461608887, "global_step": 66409, "epoch": 1581} {"train_loss": -5.93179178237915, "global_step": 66410, "epoch": 1581} {"train_loss": -5.934028148651123, "global_step": 66411, "epoch": 1581} {"train_loss": -5.984501838684082, "global_step": 66412, "epoch": 1581} {"train_loss": -5.965713024139404, "global_step": 66413, "epoch": 1581} {"train_loss": -6.030826091766357, "global_step": 66414, "epoch": 1581} {"train_loss": -5.914606094360352, "global_step": 66415, "epoch": 1581} {"train_loss": -5.825433254241943, "global_step": 66416, "epoch": 1581} {"train_loss": -5.964275360107422, "global_step": 66417, "epoch": 1581} {"train_loss": -5.836448669433594, "global_step": 66418, "epoch": 1581} {"train_loss": -6.042604446411133, "global_step": 66419, "epoch": 1581} {"train_loss": -5.833408355712891, "global_step": 66420, "epoch": 1581} {"train_loss": -6.010470390319824, "global_step": 66421, "epoch": 1581} {"train_loss": -5.9620819091796875, "global_step": 66422, "epoch": 1581} {"train_loss": -5.936739921569824, "global_step": 66423, "epoch": 1581} {"train_loss": -5.97245979309082, "global_step": 66424, "epoch": 1581} {"train_loss": -5.915536880493164, "global_step": 66425, "epoch": 1581} {"train_loss": -6.0242743492126465, "global_step": 66426, "epoch": 1581} {"train_loss": -5.87540864944458, "global_step": 66427, "epoch": 1581} {"train_loss": -5.827503204345703, "global_step": 66428, "epoch": 1581} {"train_loss": -5.942136764526367, "global_step": 66429, "epoch": 1581} {"train_loss": -5.9787397384643555, "global_step": 66430, "epoch": 1581} {"train_loss": -5.886349201202393, "global_step": 66431, "epoch": 1581} {"train_loss": -6.038575172424316, "global_step": 66432, "epoch": 1581} {"train_loss": -5.923899173736572, "global_step": 66433, "epoch": 1581} {"train_loss": -5.985736846923828, "global_step": 66434, "epoch": 1581} {"train_loss": -5.929196357727051, "global_step": 66435, "epoch": 1581} {"train_loss": -5.998394966125488, "global_step": 66436, "epoch": 1581} {"train_loss": -6.01523494720459, "global_step": 66437, "epoch": 1581} {"train_loss": -5.9647088050842285, "global_step": 66438, "epoch": 1581} {"train_loss": -5.958474159240723, "global_step": 66439, "epoch": 1581} {"train_loss": -5.906769752502441, "global_step": 66440, "epoch": 1581} {"train_loss": -5.898049354553223, "global_step": 66441, "epoch": 1581} {"train_loss": -5.972484111785889, "global_step": 66442, "epoch": 1581} {"train_loss": -5.943815401622227, "global_step": 66443, "epoch": 1581, "val_loss": 67262.171875} {"train_loss": -5.8570556640625, "global_step": 66444, "epoch": 1582} {"train_loss": -5.798802375793457, "global_step": 66445, "epoch": 1582} {"train_loss": -6.040642738342285, "global_step": 66446, "epoch": 1582} {"train_loss": -5.932523727416992, "global_step": 66447, "epoch": 1582} {"train_loss": -5.853816032409668, "global_step": 66448, "epoch": 1582} {"train_loss": -5.919774532318115, "global_step": 66449, "epoch": 1582} {"train_loss": -5.999734401702881, "global_step": 66450, "epoch": 1582} {"train_loss": -5.946879863739014, "global_step": 66451, "epoch": 1582} {"train_loss": -5.894235610961914, "global_step": 66452, "epoch": 1582} {"train_loss": -5.991474628448486, "global_step": 66453, "epoch": 1582} {"train_loss": -5.910897254943848, "global_step": 66454, "epoch": 1582} {"train_loss": -6.012136459350586, "global_step": 66455, "epoch": 1582} {"train_loss": -5.920580863952637, "global_step": 66456, "epoch": 1582} {"train_loss": -6.014044761657715, "global_step": 66457, "epoch": 1582} {"train_loss": -5.91617488861084, "global_step": 66458, "epoch": 1582} {"train_loss": -5.9991278648376465, "global_step": 66459, "epoch": 1582} {"train_loss": -5.937715530395508, "global_step": 66460, "epoch": 1582} {"train_loss": -5.907210350036621, "global_step": 66461, "epoch": 1582} {"train_loss": -5.9566450119018555, "global_step": 66462, "epoch": 1582} {"train_loss": -5.974725246429443, "global_step": 66463, "epoch": 1582} {"train_loss": -5.9126200675964355, "global_step": 66464, "epoch": 1582} {"train_loss": -5.960321426391602, "global_step": 66465, "epoch": 1582} {"train_loss": -5.915295600891113, "global_step": 66466, "epoch": 1582} {"train_loss": -5.947232246398926, "global_step": 66467, "epoch": 1582} {"train_loss": -5.926778793334961, "global_step": 66468, "epoch": 1582} {"train_loss": -5.940018653869629, "global_step": 66469, "epoch": 1582} {"train_loss": -6.061542987823486, "global_step": 66470, "epoch": 1582} {"train_loss": -5.948456764221191, "global_step": 66471, "epoch": 1582} {"train_loss": -5.967041969299316, "global_step": 66472, "epoch": 1582} {"train_loss": -6.05516242980957, "global_step": 66473, "epoch": 1582} {"train_loss": -6.019913673400879, "global_step": 66474, "epoch": 1582} {"train_loss": -6.075516700744629, "global_step": 66475, "epoch": 1582} {"train_loss": -5.9999494552612305, "global_step": 66476, "epoch": 1582} {"train_loss": -6.058145523071289, "global_step": 66477, "epoch": 1582} {"train_loss": -6.086353302001953, "global_step": 66478, "epoch": 1582} {"train_loss": -6.076085090637207, "global_step": 66479, "epoch": 1582} {"train_loss": -5.968996047973633, "global_step": 66480, "epoch": 1582} {"train_loss": -5.927366256713867, "global_step": 66481, "epoch": 1582} {"train_loss": -6.142413139343262, "global_step": 66482, "epoch": 1582} {"train_loss": -6.019783020019531, "global_step": 66483, "epoch": 1582} {"train_loss": -6.0307207107543945, "global_step": 66484, "epoch": 1582} {"train_loss": -5.969293049403599, "global_step": 66485, "epoch": 1582, "val_loss": 67098.875} {"train_loss": -5.933163642883301, "global_step": 66486, "epoch": 1583} {"train_loss": -5.881476402282715, "global_step": 66487, "epoch": 1583} {"train_loss": -6.0075764656066895, "global_step": 66488, "epoch": 1583} {"train_loss": -5.911624431610107, "global_step": 66489, "epoch": 1583} {"train_loss": -6.000293731689453, "global_step": 66490, "epoch": 1583} {"train_loss": -5.984635353088379, "global_step": 66491, "epoch": 1583} {"train_loss": -5.94144344329834, "global_step": 66492, "epoch": 1583} {"train_loss": -5.955867767333984, "global_step": 66493, "epoch": 1583} {"train_loss": -5.973575592041016, "global_step": 66494, "epoch": 1583} {"train_loss": -5.980069160461426, "global_step": 66495, "epoch": 1583} {"train_loss": -5.930760383605957, "global_step": 66496, "epoch": 1583} {"train_loss": -6.014227867126465, "global_step": 66497, "epoch": 1583} {"train_loss": -5.920751571655273, "global_step": 66498, "epoch": 1583} {"train_loss": -5.922295093536377, "global_step": 66499, "epoch": 1583} {"train_loss": -5.999521732330322, "global_step": 66500, "epoch": 1583} {"train_loss": -6.03627347946167, "global_step": 66501, "epoch": 1583} {"train_loss": -5.949190139770508, "global_step": 66502, "epoch": 1583} {"train_loss": -5.943283557891846, "global_step": 66503, "epoch": 1583} {"train_loss": -6.006916522979736, "global_step": 66504, "epoch": 1583} {"train_loss": -5.874791622161865, "global_step": 66505, "epoch": 1583} {"train_loss": -5.971084117889404, "global_step": 66506, "epoch": 1583} {"train_loss": -5.998322486877441, "global_step": 66507, "epoch": 1583} {"train_loss": -6.0315632820129395, "global_step": 66508, "epoch": 1583} {"train_loss": -5.8836798667907715, "global_step": 66509, "epoch": 1583} {"train_loss": -5.94896936416626, "global_step": 66510, "epoch": 1583} {"train_loss": -5.994850158691406, "global_step": 66511, "epoch": 1583} {"train_loss": -5.957262992858887, "global_step": 66512, "epoch": 1583} {"train_loss": -5.925998687744141, "global_step": 66513, "epoch": 1583} {"train_loss": -5.965961456298828, "global_step": 66514, "epoch": 1583} {"train_loss": -5.9651384353637695, "global_step": 66515, "epoch": 1583} {"train_loss": -5.959003448486328, "global_step": 66516, "epoch": 1583} {"train_loss": -5.931174278259277, "global_step": 66517, "epoch": 1583} {"train_loss": -5.927857398986816, "global_step": 66518, "epoch": 1583} {"train_loss": -5.951703071594238, "global_step": 66519, "epoch": 1583} {"train_loss": -5.823546886444092, "global_step": 66520, "epoch": 1583} {"train_loss": -6.074243545532227, "global_step": 66521, "epoch": 1583} {"train_loss": -6.0055999755859375, "global_step": 66522, "epoch": 1583} {"train_loss": -5.806268692016602, "global_step": 66523, "epoch": 1583} {"train_loss": -5.934752464294434, "global_step": 66524, "epoch": 1583} {"train_loss": -5.938162326812744, "global_step": 66525, "epoch": 1583} {"train_loss": -5.941993713378906, "global_step": 66526, "epoch": 1583} {"train_loss": -5.955315237953549, "global_step": 66527, "epoch": 1583, "val_loss": 67022.015625} {"train_loss": -6.03550386428833, "global_step": 66528, "epoch": 1584} {"train_loss": -6.033622741699219, "global_step": 66529, "epoch": 1584} {"train_loss": -5.984793663024902, "global_step": 66530, "epoch": 1584} {"train_loss": -5.921803951263428, "global_step": 66531, "epoch": 1584} {"train_loss": -5.886412143707275, "global_step": 66532, "epoch": 1584} {"train_loss": -5.794513702392578, "global_step": 66533, "epoch": 1584} {"train_loss": -5.9834465980529785, "global_step": 66534, "epoch": 1584} {"train_loss": -5.916324615478516, "global_step": 66535, "epoch": 1584} {"train_loss": -6.074444770812988, "global_step": 66536, "epoch": 1584} {"train_loss": -5.948186874389648, "global_step": 66537, "epoch": 1584} {"train_loss": -6.027285575866699, "global_step": 66538, "epoch": 1584} {"train_loss": -5.9742889404296875, "global_step": 66539, "epoch": 1584} {"train_loss": -5.9784016609191895, "global_step": 66540, "epoch": 1584} {"train_loss": -6.054920196533203, "global_step": 66541, "epoch": 1584} {"train_loss": -5.9036865234375, "global_step": 66542, "epoch": 1584} {"train_loss": -6.175204753875732, "global_step": 66543, "epoch": 1584} {"train_loss": -5.877133369445801, "global_step": 66544, "epoch": 1584} {"train_loss": -5.8381242752075195, "global_step": 66545, "epoch": 1584} {"train_loss": -5.953497886657715, "global_step": 66546, "epoch": 1584} {"train_loss": -5.989407539367676, "global_step": 66547, "epoch": 1584} {"train_loss": -6.0937089920043945, "global_step": 66548, "epoch": 1584} {"train_loss": -5.957706451416016, "global_step": 66549, "epoch": 1584} {"train_loss": -6.000328063964844, "global_step": 66550, "epoch": 1584} {"train_loss": -6.025862693786621, "global_step": 66551, "epoch": 1584} {"train_loss": -6.112727165222168, "global_step": 66552, "epoch": 1584} {"train_loss": -5.954333305358887, "global_step": 66553, "epoch": 1584} {"train_loss": -5.930632591247559, "global_step": 66554, "epoch": 1584} {"train_loss": -5.886396884918213, "global_step": 66555, "epoch": 1584} {"train_loss": -5.892545700073242, "global_step": 66556, "epoch": 1584} {"train_loss": -5.92332649230957, "global_step": 66557, "epoch": 1584} {"train_loss": -5.874270915985107, "global_step": 66558, "epoch": 1584} {"train_loss": -6.033276557922363, "global_step": 66559, "epoch": 1584} {"train_loss": -5.9407453536987305, "global_step": 66560, "epoch": 1584} {"train_loss": -6.0003509521484375, "global_step": 66561, "epoch": 1584} {"train_loss": -6.001951217651367, "global_step": 66562, "epoch": 1584} {"train_loss": -5.833036422729492, "global_step": 66563, "epoch": 1584} {"train_loss": -5.951311111450195, "global_step": 66564, "epoch": 1584} {"train_loss": -5.942771911621094, "global_step": 66565, "epoch": 1584} {"train_loss": -5.986682891845703, "global_step": 66566, "epoch": 1584} {"train_loss": -5.977602958679199, "global_step": 66567, "epoch": 1584} {"train_loss": -5.9205827713012695, "global_step": 66568, "epoch": 1584} {"train_loss": -5.963527191252935, "global_step": 66569, "epoch": 1584, "val_loss": 67300.546875} {"train_loss": -5.995065212249756, "global_step": 66570, "epoch": 1585} {"train_loss": -6.045365810394287, "global_step": 66571, "epoch": 1585} {"train_loss": -6.014817237854004, "global_step": 66572, "epoch": 1585} {"train_loss": -6.03172492980957, "global_step": 66573, "epoch": 1585} {"train_loss": -5.967576026916504, "global_step": 66574, "epoch": 1585} {"train_loss": -5.786108016967773, "global_step": 66575, "epoch": 1585} {"train_loss": -6.048759460449219, "global_step": 66576, "epoch": 1585} {"train_loss": -5.94309139251709, "global_step": 66577, "epoch": 1585} {"train_loss": -5.912345886230469, "global_step": 66578, "epoch": 1585} {"train_loss": -5.883864402770996, "global_step": 66579, "epoch": 1585} {"train_loss": -5.8767900466918945, "global_step": 66580, "epoch": 1585} {"train_loss": -5.887581825256348, "global_step": 66581, "epoch": 1585} {"train_loss": -6.036421775817871, "global_step": 66582, "epoch": 1585} {"train_loss": -5.868695259094238, "global_step": 66583, "epoch": 1585} {"train_loss": -5.953673362731934, "global_step": 66584, "epoch": 1585} {"train_loss": -5.783578872680664, "global_step": 66585, "epoch": 1585} {"train_loss": -6.007453441619873, "global_step": 66586, "epoch": 1585} {"train_loss": -5.904280662536621, "global_step": 66587, "epoch": 1585} {"train_loss": -6.032814979553223, "global_step": 66588, "epoch": 1585} {"train_loss": -6.080314636230469, "global_step": 66589, "epoch": 1585} {"train_loss": -5.921355247497559, "global_step": 66590, "epoch": 1585} {"train_loss": -5.999937057495117, "global_step": 66591, "epoch": 1585} {"train_loss": -6.009774208068848, "global_step": 66592, "epoch": 1585} {"train_loss": -5.924130439758301, "global_step": 66593, "epoch": 1585} {"train_loss": -5.978433609008789, "global_step": 66594, "epoch": 1585} {"train_loss": -5.903351783752441, "global_step": 66595, "epoch": 1585} {"train_loss": -6.021252632141113, "global_step": 66596, "epoch": 1585} {"train_loss": -5.920894622802734, "global_step": 66597, "epoch": 1585} {"train_loss": -5.935004234313965, "global_step": 66598, "epoch": 1585} {"train_loss": -5.917812347412109, "global_step": 66599, "epoch": 1585} {"train_loss": -5.958004951477051, "global_step": 66600, "epoch": 1585} {"train_loss": -5.9260029792785645, "global_step": 66601, "epoch": 1585} {"train_loss": -5.859188079833984, "global_step": 66602, "epoch": 1585} {"train_loss": -5.995438575744629, "global_step": 66603, "epoch": 1585} {"train_loss": -5.963272571563721, "global_step": 66604, "epoch": 1585} {"train_loss": -6.007870674133301, "global_step": 66605, "epoch": 1585} {"train_loss": -5.837245941162109, "global_step": 66606, "epoch": 1585} {"train_loss": -5.9829230308532715, "global_step": 66607, "epoch": 1585} {"train_loss": -5.81951379776001, "global_step": 66608, "epoch": 1585} {"train_loss": -5.947175979614258, "global_step": 66609, "epoch": 1585} {"train_loss": -6.039193153381348, "global_step": 66610, "epoch": 1585} {"train_loss": -5.949099211465745, "global_step": 66611, "epoch": 1585, "val_loss": 67296.734375} {"train_loss": -6.003300666809082, "global_step": 66612, "epoch": 1586} {"train_loss": -5.9607133865356445, "global_step": 66613, "epoch": 1586} {"train_loss": -5.9933624267578125, "global_step": 66614, "epoch": 1586} {"train_loss": -5.99916934967041, "global_step": 66615, "epoch": 1586} {"train_loss": -5.956214904785156, "global_step": 66616, "epoch": 1586} {"train_loss": -6.149666786193848, "global_step": 66617, "epoch": 1586} {"train_loss": -5.981045722961426, "global_step": 66618, "epoch": 1586} {"train_loss": -5.845842361450195, "global_step": 66619, "epoch": 1586} {"train_loss": -6.048316955566406, "global_step": 66620, "epoch": 1586} {"train_loss": -5.946170806884766, "global_step": 66621, "epoch": 1586} {"train_loss": -5.957324981689453, "global_step": 66622, "epoch": 1586} {"train_loss": -5.833977222442627, "global_step": 66623, "epoch": 1586} {"train_loss": -5.992863655090332, "global_step": 66624, "epoch": 1586} {"train_loss": -5.849998474121094, "global_step": 66625, "epoch": 1586} {"train_loss": -6.045790195465088, "global_step": 66626, "epoch": 1586} {"train_loss": -6.00432014465332, "global_step": 66627, "epoch": 1586} {"train_loss": -5.735353469848633, "global_step": 66628, "epoch": 1586} {"train_loss": -6.004838466644287, "global_step": 66629, "epoch": 1586} {"train_loss": -5.881328582763672, "global_step": 66630, "epoch": 1586} {"train_loss": -5.890171527862549, "global_step": 66631, "epoch": 1586} {"train_loss": -5.897500991821289, "global_step": 66632, "epoch": 1586} {"train_loss": -5.819429397583008, "global_step": 66633, "epoch": 1586} {"train_loss": -5.936169624328613, "global_step": 66634, "epoch": 1586} {"train_loss": -5.952633857727051, "global_step": 66635, "epoch": 1586} {"train_loss": -5.79245662689209, "global_step": 66636, "epoch": 1586} {"train_loss": -5.9263224601745605, "global_step": 66637, "epoch": 1586} {"train_loss": -5.726478576660156, "global_step": 66638, "epoch": 1586} {"train_loss": -5.837338447570801, "global_step": 66639, "epoch": 1586} {"train_loss": -5.818875312805176, "global_step": 66640, "epoch": 1586} {"train_loss": -5.905648708343506, "global_step": 66641, "epoch": 1586} {"train_loss": -5.7167158126831055, "global_step": 66642, "epoch": 1586} {"train_loss": -5.88970947265625, "global_step": 66643, "epoch": 1586} {"train_loss": -5.8480753898620605, "global_step": 66644, "epoch": 1586} {"train_loss": -5.913224220275879, "global_step": 66645, "epoch": 1586} {"train_loss": -6.018916606903076, "global_step": 66646, "epoch": 1586} {"train_loss": -5.991649150848389, "global_step": 66647, "epoch": 1586} {"train_loss": -6.089911460876465, "global_step": 66648, "epoch": 1586} {"train_loss": -5.922119140625, "global_step": 66649, "epoch": 1586} {"train_loss": -6.003134727478027, "global_step": 66650, "epoch": 1586} {"train_loss": -5.793497562408447, "global_step": 66651, "epoch": 1586} {"train_loss": -5.983912467956543, "global_step": 66652, "epoch": 1586} {"train_loss": -5.924576327914283, "global_step": 66653, "epoch": 1586, "val_loss": 67506.9609375} {"train_loss": -6.045231819152832, "global_step": 66654, "epoch": 1587} {"train_loss": -5.940199851989746, "global_step": 66655, "epoch": 1587} {"train_loss": -5.980996131896973, "global_step": 66656, "epoch": 1587} {"train_loss": -5.894414901733398, "global_step": 66657, "epoch": 1587} {"train_loss": -5.947075843811035, "global_step": 66658, "epoch": 1587} {"train_loss": -5.856315612792969, "global_step": 66659, "epoch": 1587} {"train_loss": -5.988151550292969, "global_step": 66660, "epoch": 1587} {"train_loss": -5.951407432556152, "global_step": 66661, "epoch": 1587} {"train_loss": -5.979009628295898, "global_step": 66662, "epoch": 1587} {"train_loss": -5.9229583740234375, "global_step": 66663, "epoch": 1587} {"train_loss": -6.078977108001709, "global_step": 66664, "epoch": 1587} {"train_loss": -6.152658462524414, "global_step": 66665, "epoch": 1587} {"train_loss": -5.951860427856445, "global_step": 66666, "epoch": 1587} {"train_loss": -5.965832710266113, "global_step": 66667, "epoch": 1587} {"train_loss": -5.860861778259277, "global_step": 66668, "epoch": 1587} {"train_loss": -5.979514122009277, "global_step": 66669, "epoch": 1587} {"train_loss": -5.952879905700684, "global_step": 66670, "epoch": 1587} {"train_loss": -6.004910945892334, "global_step": 66671, "epoch": 1587} {"train_loss": -5.9362335205078125, "global_step": 66672, "epoch": 1587} {"train_loss": -5.981528282165527, "global_step": 66673, "epoch": 1587} {"train_loss": -5.962888717651367, "global_step": 66674, "epoch": 1587} {"train_loss": -6.007111549377441, "global_step": 66675, "epoch": 1587} {"train_loss": -5.993782043457031, "global_step": 66676, "epoch": 1587} {"train_loss": -6.131368160247803, "global_step": 66677, "epoch": 1587} {"train_loss": -6.002477645874023, "global_step": 66678, "epoch": 1587} {"train_loss": -5.926615238189697, "global_step": 66679, "epoch": 1587} {"train_loss": -5.947936058044434, "global_step": 66680, "epoch": 1587} {"train_loss": -6.006688117980957, "global_step": 66681, "epoch": 1587} {"train_loss": -5.97904109954834, "global_step": 66682, "epoch": 1587} {"train_loss": -5.9453020095825195, "global_step": 66683, "epoch": 1587} {"train_loss": -6.016364097595215, "global_step": 66684, "epoch": 1587} {"train_loss": -5.966590881347656, "global_step": 66685, "epoch": 1587} {"train_loss": -5.919257164001465, "global_step": 66686, "epoch": 1587} {"train_loss": -5.922676086425781, "global_step": 66687, "epoch": 1587} {"train_loss": -5.9292755126953125, "global_step": 66688, "epoch": 1587} {"train_loss": -6.095188617706299, "global_step": 66689, "epoch": 1587} {"train_loss": -5.8215484619140625, "global_step": 66690, "epoch": 1587} {"train_loss": -5.847038269042969, "global_step": 66691, "epoch": 1587} {"train_loss": -6.0278472900390625, "global_step": 66692, "epoch": 1587} {"train_loss": -5.916632652282715, "global_step": 66693, "epoch": 1587} {"train_loss": -6.064480781555176, "global_step": 66694, "epoch": 1587} {"train_loss": -5.973074935731434, "global_step": 66695, "epoch": 1587, "val_loss": 67462.359375} {"train_loss": -5.923408508300781, "global_step": 66696, "epoch": 1588} {"train_loss": -5.964786529541016, "global_step": 66697, "epoch": 1588} {"train_loss": -5.9753193855285645, "global_step": 66698, "epoch": 1588} {"train_loss": -5.91986083984375, "global_step": 66699, "epoch": 1588} {"train_loss": -6.038137912750244, "global_step": 66700, "epoch": 1588} {"train_loss": -6.000147819519043, "global_step": 66701, "epoch": 1588} {"train_loss": -6.002317428588867, "global_step": 66702, "epoch": 1588} {"train_loss": -5.912880897521973, "global_step": 66703, "epoch": 1588} {"train_loss": -5.915471076965332, "global_step": 66704, "epoch": 1588} {"train_loss": -6.078152656555176, "global_step": 66705, "epoch": 1588} {"train_loss": -6.024580001831055, "global_step": 66706, "epoch": 1588} {"train_loss": -5.997930526733398, "global_step": 66707, "epoch": 1588} {"train_loss": -6.080411434173584, "global_step": 66708, "epoch": 1588} {"train_loss": -5.908990859985352, "global_step": 66709, "epoch": 1588} {"train_loss": -5.914373397827148, "global_step": 66710, "epoch": 1588} {"train_loss": -6.0955810546875, "global_step": 66711, "epoch": 1588} {"train_loss": -5.945446014404297, "global_step": 66712, "epoch": 1588} {"train_loss": -5.978862285614014, "global_step": 66713, "epoch": 1588} {"train_loss": -5.924735069274902, "global_step": 66714, "epoch": 1588} {"train_loss": -5.9307861328125, "global_step": 66715, "epoch": 1588} {"train_loss": -6.030091285705566, "global_step": 66716, "epoch": 1588} {"train_loss": -5.951203346252441, "global_step": 66717, "epoch": 1588} {"train_loss": -5.943811416625977, "global_step": 66718, "epoch": 1588} {"train_loss": -5.9611382484436035, "global_step": 66719, "epoch": 1588} {"train_loss": -5.947122573852539, "global_step": 66720, "epoch": 1588} {"train_loss": -6.040666103363037, "global_step": 66721, "epoch": 1588} {"train_loss": -5.904217720031738, "global_step": 66722, "epoch": 1588} {"train_loss": -5.941170692443848, "global_step": 66723, "epoch": 1588} {"train_loss": -5.943216800689697, "global_step": 66724, "epoch": 1588} {"train_loss": -5.85196590423584, "global_step": 66725, "epoch": 1588} {"train_loss": -5.853085041046143, "global_step": 66726, "epoch": 1588} {"train_loss": -6.048233985900879, "global_step": 66727, "epoch": 1588} {"train_loss": -5.776672840118408, "global_step": 66728, "epoch": 1588} {"train_loss": -5.862766265869141, "global_step": 66729, "epoch": 1588} {"train_loss": -5.887721061706543, "global_step": 66730, "epoch": 1588} {"train_loss": -5.962892055511475, "global_step": 66731, "epoch": 1588} {"train_loss": -5.936400413513184, "global_step": 66732, "epoch": 1588} {"train_loss": -5.928947448730469, "global_step": 66733, "epoch": 1588} {"train_loss": -5.987523078918457, "global_step": 66734, "epoch": 1588} {"train_loss": -5.795154571533203, "global_step": 66735, "epoch": 1588} {"train_loss": -6.016368389129639, "global_step": 66736, "epoch": 1588} {"train_loss": -5.951330343882243, "global_step": 66737, "epoch": 1588, "val_loss": 67410.0625} {"train_loss": -5.878820419311523, "global_step": 66738, "epoch": 1589} {"train_loss": -5.913738250732422, "global_step": 66739, "epoch": 1589} {"train_loss": -5.883255481719971, "global_step": 66740, "epoch": 1589} {"train_loss": -5.7846832275390625, "global_step": 66741, "epoch": 1589} {"train_loss": -5.95725154876709, "global_step": 66742, "epoch": 1589} {"train_loss": -6.0171074867248535, "global_step": 66743, "epoch": 1589} {"train_loss": -5.9158782958984375, "global_step": 66744, "epoch": 1589} {"train_loss": -6.136409759521484, "global_step": 66745, "epoch": 1589} {"train_loss": -5.890471935272217, "global_step": 66746, "epoch": 1589} {"train_loss": -5.946974754333496, "global_step": 66747, "epoch": 1589} {"train_loss": -6.039433002471924, "global_step": 66748, "epoch": 1589} {"train_loss": -5.859549045562744, "global_step": 66749, "epoch": 1589} {"train_loss": -6.047182083129883, "global_step": 66750, "epoch": 1589} {"train_loss": -5.944804668426514, "global_step": 66751, "epoch": 1589} {"train_loss": -5.91472053527832, "global_step": 66752, "epoch": 1589} {"train_loss": -5.949230194091797, "global_step": 66753, "epoch": 1589} {"train_loss": -5.796897888183594, "global_step": 66754, "epoch": 1589} {"train_loss": -5.861093997955322, "global_step": 66755, "epoch": 1589} {"train_loss": -6.028469085693359, "global_step": 66756, "epoch": 1589} {"train_loss": -6.009221076965332, "global_step": 66757, "epoch": 1589} {"train_loss": -6.0058393478393555, "global_step": 66758, "epoch": 1589} {"train_loss": -5.972980976104736, "global_step": 66759, "epoch": 1589} {"train_loss": -5.879874229431152, "global_step": 66760, "epoch": 1589} {"train_loss": -5.93475341796875, "global_step": 66761, "epoch": 1589} {"train_loss": -5.746725082397461, "global_step": 66762, "epoch": 1589} {"train_loss": -5.997681617736816, "global_step": 66763, "epoch": 1589} {"train_loss": -5.9296135902404785, "global_step": 66764, "epoch": 1589} {"train_loss": -5.849131107330322, "global_step": 66765, "epoch": 1589} {"train_loss": -5.8582916259765625, "global_step": 66766, "epoch": 1589} {"train_loss": -5.870509624481201, "global_step": 66767, "epoch": 1589} {"train_loss": -5.977961540222168, "global_step": 66768, "epoch": 1589} {"train_loss": -5.937505722045898, "global_step": 66769, "epoch": 1589} {"train_loss": -5.958218574523926, "global_step": 66770, "epoch": 1589} {"train_loss": -5.942137241363525, "global_step": 66771, "epoch": 1589} {"train_loss": -6.04487419128418, "global_step": 66772, "epoch": 1589} {"train_loss": -5.91130256652832, "global_step": 66773, "epoch": 1589} {"train_loss": -5.895291328430176, "global_step": 66774, "epoch": 1589} {"train_loss": -6.016916751861572, "global_step": 66775, "epoch": 1589} {"train_loss": -6.091883659362793, "global_step": 66776, "epoch": 1589} {"train_loss": -5.981679916381836, "global_step": 66777, "epoch": 1589} {"train_loss": -5.945032596588135, "global_step": 66778, "epoch": 1589} {"train_loss": -5.939868665876842, "global_step": 66779, "epoch": 1589, "val_loss": 67067.015625} {"train_loss": -6.078852653503418, "global_step": 66780, "epoch": 1590} {"train_loss": -6.014876842498779, "global_step": 66781, "epoch": 1590} {"train_loss": -6.026788711547852, "global_step": 66782, "epoch": 1590} {"train_loss": -5.929839134216309, "global_step": 66783, "epoch": 1590} {"train_loss": -6.005069255828857, "global_step": 66784, "epoch": 1590} {"train_loss": -5.991515159606934, "global_step": 66785, "epoch": 1590} {"train_loss": -6.120565414428711, "global_step": 66786, "epoch": 1590} {"train_loss": -5.883536338806152, "global_step": 66787, "epoch": 1590} {"train_loss": -6.000333786010742, "global_step": 66788, "epoch": 1590} {"train_loss": -5.961233139038086, "global_step": 66789, "epoch": 1590} {"train_loss": -5.943661689758301, "global_step": 66790, "epoch": 1590} {"train_loss": -6.040447235107422, "global_step": 66791, "epoch": 1590} {"train_loss": -6.083747863769531, "global_step": 66792, "epoch": 1590} {"train_loss": -6.0155487060546875, "global_step": 66793, "epoch": 1590} {"train_loss": -5.905546188354492, "global_step": 66794, "epoch": 1590} {"train_loss": -6.115472793579102, "global_step": 66795, "epoch": 1590} {"train_loss": -5.946746826171875, "global_step": 66796, "epoch": 1590} {"train_loss": -5.959145545959473, "global_step": 66797, "epoch": 1590} {"train_loss": -5.86424446105957, "global_step": 66798, "epoch": 1590} {"train_loss": -5.852707386016846, "global_step": 66799, "epoch": 1590} {"train_loss": -5.908863544464111, "global_step": 66800, "epoch": 1590} {"train_loss": -5.918510913848877, "global_step": 66801, "epoch": 1590} {"train_loss": -5.986282825469971, "global_step": 66802, "epoch": 1590} {"train_loss": -5.962135314941406, "global_step": 66803, "epoch": 1590} {"train_loss": -5.906206130981445, "global_step": 66804, "epoch": 1590} {"train_loss": -5.87760066986084, "global_step": 66805, "epoch": 1590} {"train_loss": -5.880282402038574, "global_step": 66806, "epoch": 1590} {"train_loss": -5.946662902832031, "global_step": 66807, "epoch": 1590} {"train_loss": -5.97819709777832, "global_step": 66808, "epoch": 1590} {"train_loss": -5.897125244140625, "global_step": 66809, "epoch": 1590} {"train_loss": -5.982875823974609, "global_step": 66810, "epoch": 1590} {"train_loss": -6.042386054992676, "global_step": 66811, "epoch": 1590} {"train_loss": -6.057401657104492, "global_step": 66812, "epoch": 1590} {"train_loss": -5.985137462615967, "global_step": 66813, "epoch": 1590} {"train_loss": -5.994678974151611, "global_step": 66814, "epoch": 1590} {"train_loss": -6.094001770019531, "global_step": 66815, "epoch": 1590} {"train_loss": -5.872767448425293, "global_step": 66816, "epoch": 1590} {"train_loss": -5.9599409103393555, "global_step": 66817, "epoch": 1590} {"train_loss": -5.923609733581543, "global_step": 66818, "epoch": 1590} {"train_loss": -5.974225997924805, "global_step": 66819, "epoch": 1590} {"train_loss": -5.896610260009766, "global_step": 66820, "epoch": 1590} {"train_loss": -5.969312145596459, "global_step": 66821, "epoch": 1590, "val_loss": 67224.0546875} {"train_loss": -5.963315486907959, "global_step": 66822, "epoch": 1591} {"train_loss": -5.956846237182617, "global_step": 66823, "epoch": 1591} {"train_loss": -6.031620025634766, "global_step": 66824, "epoch": 1591} {"train_loss": -5.991713523864746, "global_step": 66825, "epoch": 1591} {"train_loss": -6.004690170288086, "global_step": 66826, "epoch": 1591} {"train_loss": -5.884919166564941, "global_step": 66827, "epoch": 1591} {"train_loss": -5.884603500366211, "global_step": 66828, "epoch": 1591} {"train_loss": -5.933633804321289, "global_step": 66829, "epoch": 1591} {"train_loss": -6.047305107116699, "global_step": 66830, "epoch": 1591} {"train_loss": -5.8719353675842285, "global_step": 66831, "epoch": 1591} {"train_loss": -5.921224117279053, "global_step": 66832, "epoch": 1591} {"train_loss": -6.06643533706665, "global_step": 66833, "epoch": 1591} {"train_loss": -5.964235305786133, "global_step": 66834, "epoch": 1591} {"train_loss": -5.920202732086182, "global_step": 66835, "epoch": 1591} {"train_loss": -6.0156660079956055, "global_step": 66836, "epoch": 1591} {"train_loss": -5.964466571807861, "global_step": 66837, "epoch": 1591} {"train_loss": -5.971451282501221, "global_step": 66838, "epoch": 1591} {"train_loss": -5.931826114654541, "global_step": 66839, "epoch": 1591} {"train_loss": -5.998019695281982, "global_step": 66840, "epoch": 1591} {"train_loss": -5.954505920410156, "global_step": 66841, "epoch": 1591} {"train_loss": -5.913693428039551, "global_step": 66842, "epoch": 1591} {"train_loss": -5.921941757202148, "global_step": 66843, "epoch": 1591} {"train_loss": -6.028986930847168, "global_step": 66844, "epoch": 1591} {"train_loss": -6.062819480895996, "global_step": 66845, "epoch": 1591} {"train_loss": -5.944341659545898, "global_step": 66846, "epoch": 1591} {"train_loss": -5.905879020690918, "global_step": 66847, "epoch": 1591} {"train_loss": -6.012334823608398, "global_step": 66848, "epoch": 1591} {"train_loss": -5.954673767089844, "global_step": 66849, "epoch": 1591} {"train_loss": -5.900262355804443, "global_step": 66850, "epoch": 1591} {"train_loss": -5.971887588500977, "global_step": 66851, "epoch": 1591} {"train_loss": -5.90984582901001, "global_step": 66852, "epoch": 1591} {"train_loss": -5.97584342956543, "global_step": 66853, "epoch": 1591} {"train_loss": -6.023563385009766, "global_step": 66854, "epoch": 1591} {"train_loss": -5.886402130126953, "global_step": 66855, "epoch": 1591} {"train_loss": -5.952910423278809, "global_step": 66856, "epoch": 1591} {"train_loss": -5.92240047454834, "global_step": 66857, "epoch": 1591} {"train_loss": -5.955941200256348, "global_step": 66858, "epoch": 1591} {"train_loss": -5.985764980316162, "global_step": 66859, "epoch": 1591} {"train_loss": -5.922182559967041, "global_step": 66860, "epoch": 1591} {"train_loss": -5.916167259216309, "global_step": 66861, "epoch": 1591} {"train_loss": -5.957671165466309, "global_step": 66862, "epoch": 1591} {"train_loss": -5.956809021177746, "global_step": 66863, "epoch": 1591, "val_loss": 67115.296875} {"train_loss": -5.937005996704102, "global_step": 66864, "epoch": 1592} {"train_loss": -5.969053745269775, "global_step": 66865, "epoch": 1592} {"train_loss": -6.014784812927246, "global_step": 66866, "epoch": 1592} {"train_loss": -6.136407852172852, "global_step": 66867, "epoch": 1592} {"train_loss": -6.023349285125732, "global_step": 66868, "epoch": 1592} {"train_loss": -6.007409572601318, "global_step": 66869, "epoch": 1592} {"train_loss": -5.865422248840332, "global_step": 66870, "epoch": 1592} {"train_loss": -5.944972991943359, "global_step": 66871, "epoch": 1592} {"train_loss": -6.066680431365967, "global_step": 66872, "epoch": 1592} {"train_loss": -5.976829528808594, "global_step": 66873, "epoch": 1592} {"train_loss": -5.949598789215088, "global_step": 66874, "epoch": 1592} {"train_loss": -6.011297702789307, "global_step": 66875, "epoch": 1592} {"train_loss": -5.970807075500488, "global_step": 66876, "epoch": 1592} {"train_loss": -6.050809860229492, "global_step": 66877, "epoch": 1592} {"train_loss": -5.939335823059082, "global_step": 66878, "epoch": 1592} {"train_loss": -6.069483757019043, "global_step": 66879, "epoch": 1592} {"train_loss": -6.059494972229004, "global_step": 66880, "epoch": 1592} {"train_loss": -5.89955997467041, "global_step": 66881, "epoch": 1592} {"train_loss": -5.989659786224365, "global_step": 66882, "epoch": 1592} {"train_loss": -5.899267196655273, "global_step": 66883, "epoch": 1592} {"train_loss": -5.917707920074463, "global_step": 66884, "epoch": 1592} {"train_loss": -5.937943458557129, "global_step": 66885, "epoch": 1592} {"train_loss": -5.99440860748291, "global_step": 66886, "epoch": 1592} {"train_loss": -5.962471961975098, "global_step": 66887, "epoch": 1592} {"train_loss": -5.94586706161499, "global_step": 66888, "epoch": 1592} {"train_loss": -5.948064804077148, "global_step": 66889, "epoch": 1592} {"train_loss": -5.821045875549316, "global_step": 66890, "epoch": 1592} {"train_loss": -5.963858127593994, "global_step": 66891, "epoch": 1592} {"train_loss": -6.060401916503906, "global_step": 66892, "epoch": 1592} {"train_loss": -5.922221660614014, "global_step": 66893, "epoch": 1592} {"train_loss": -5.870304107666016, "global_step": 66894, "epoch": 1592} {"train_loss": -5.878384113311768, "global_step": 66895, "epoch": 1592} {"train_loss": -5.849251747131348, "global_step": 66896, "epoch": 1592} {"train_loss": -5.878357410430908, "global_step": 66897, "epoch": 1592} {"train_loss": -5.855007171630859, "global_step": 66898, "epoch": 1592} {"train_loss": -5.908510208129883, "global_step": 66899, "epoch": 1592} {"train_loss": -5.800019264221191, "global_step": 66900, "epoch": 1592} {"train_loss": -5.9855756759643555, "global_step": 66901, "epoch": 1592} {"train_loss": -5.911215305328369, "global_step": 66902, "epoch": 1592} {"train_loss": -5.975067615509033, "global_step": 66903, "epoch": 1592} {"train_loss": -5.935202121734619, "global_step": 66904, "epoch": 1592} {"train_loss": -5.952768303099132, "global_step": 66905, "epoch": 1592, "val_loss": 67588.6328125} {"train_loss": -5.836429119110107, "global_step": 66906, "epoch": 1593} {"train_loss": -5.9024457931518555, "global_step": 66907, "epoch": 1593} {"train_loss": -5.985285758972168, "global_step": 66908, "epoch": 1593} {"train_loss": -5.889013290405273, "global_step": 66909, "epoch": 1593} {"train_loss": -5.916342258453369, "global_step": 66910, "epoch": 1593} {"train_loss": -5.924858093261719, "global_step": 66911, "epoch": 1593} {"train_loss": -5.9183125495910645, "global_step": 66912, "epoch": 1593} {"train_loss": -5.955598831176758, "global_step": 66913, "epoch": 1593} {"train_loss": -6.037014007568359, "global_step": 66914, "epoch": 1593} {"train_loss": -6.030338287353516, "global_step": 66915, "epoch": 1593} {"train_loss": -5.993870735168457, "global_step": 66916, "epoch": 1593} {"train_loss": -6.0379486083984375, "global_step": 66917, "epoch": 1593} {"train_loss": -5.916868209838867, "global_step": 66918, "epoch": 1593} {"train_loss": -5.99692440032959, "global_step": 66919, "epoch": 1593} {"train_loss": -5.973317623138428, "global_step": 66920, "epoch": 1593} {"train_loss": -5.927854537963867, "global_step": 66921, "epoch": 1593} {"train_loss": -5.970109939575195, "global_step": 66922, "epoch": 1593} {"train_loss": -5.942074775695801, "global_step": 66923, "epoch": 1593} {"train_loss": -6.014796257019043, "global_step": 66924, "epoch": 1593} {"train_loss": -6.063876152038574, "global_step": 66925, "epoch": 1593} {"train_loss": -5.981122016906738, "global_step": 66926, "epoch": 1593} {"train_loss": -5.87168025970459, "global_step": 66927, "epoch": 1593} {"train_loss": -5.856877326965332, "global_step": 66928, "epoch": 1593} {"train_loss": -6.066694259643555, "global_step": 66929, "epoch": 1593} {"train_loss": -6.020686626434326, "global_step": 66930, "epoch": 1593} {"train_loss": -5.9087233543396, "global_step": 66931, "epoch": 1593} {"train_loss": -6.006292819976807, "global_step": 66932, "epoch": 1593} {"train_loss": -5.886492729187012, "global_step": 66933, "epoch": 1593} {"train_loss": -5.995685577392578, "global_step": 66934, "epoch": 1593} {"train_loss": -6.05156946182251, "global_step": 66935, "epoch": 1593} {"train_loss": -5.980809688568115, "global_step": 66936, "epoch": 1593} {"train_loss": -5.786667346954346, "global_step": 66937, "epoch": 1593} {"train_loss": -5.764880180358887, "global_step": 66938, "epoch": 1593} {"train_loss": -5.965106964111328, "global_step": 66939, "epoch": 1593} {"train_loss": -5.923549175262451, "global_step": 66940, "epoch": 1593} {"train_loss": -5.911190509796143, "global_step": 66941, "epoch": 1593} {"train_loss": -5.867154598236084, "global_step": 66942, "epoch": 1593} {"train_loss": -5.898977279663086, "global_step": 66943, "epoch": 1593} {"train_loss": -6.016515731811523, "global_step": 66944, "epoch": 1593} {"train_loss": -5.988585472106934, "global_step": 66945, "epoch": 1593} {"train_loss": -5.931866645812988, "global_step": 66946, "epoch": 1593} {"train_loss": -5.9474960168202715, "global_step": 66947, "epoch": 1593, "val_loss": 67174.078125} {"train_loss": -5.910299301147461, "global_step": 66948, "epoch": 1594} {"train_loss": -5.950367450714111, "global_step": 66949, "epoch": 1594} {"train_loss": -6.048985481262207, "global_step": 66950, "epoch": 1594} {"train_loss": -6.083152770996094, "global_step": 66951, "epoch": 1594} {"train_loss": -6.033217430114746, "global_step": 66952, "epoch": 1594} {"train_loss": -5.969368934631348, "global_step": 66953, "epoch": 1594} {"train_loss": -5.891907691955566, "global_step": 66954, "epoch": 1594} {"train_loss": -6.017710208892822, "global_step": 66955, "epoch": 1594} {"train_loss": -6.057934284210205, "global_step": 66956, "epoch": 1594} {"train_loss": -6.078531265258789, "global_step": 66957, "epoch": 1594} {"train_loss": -6.055693626403809, "global_step": 66958, "epoch": 1594} {"train_loss": -5.8528594970703125, "global_step": 66959, "epoch": 1594} {"train_loss": -5.892914295196533, "global_step": 66960, "epoch": 1594} {"train_loss": -5.920924186706543, "global_step": 66961, "epoch": 1594} {"train_loss": -6.0593461990356445, "global_step": 66962, "epoch": 1594} {"train_loss": -5.995774269104004, "global_step": 66963, "epoch": 1594} {"train_loss": -5.962353229522705, "global_step": 66964, "epoch": 1594} {"train_loss": -6.028666019439697, "global_step": 66965, "epoch": 1594} {"train_loss": -6.114480495452881, "global_step": 66966, "epoch": 1594} {"train_loss": -6.0811591148376465, "global_step": 66967, "epoch": 1594} {"train_loss": -5.825710773468018, "global_step": 66968, "epoch": 1594} {"train_loss": -6.022894382476807, "global_step": 66969, "epoch": 1594} {"train_loss": -5.911990165710449, "global_step": 66970, "epoch": 1594} {"train_loss": -5.863913536071777, "global_step": 66971, "epoch": 1594} {"train_loss": -5.969658851623535, "global_step": 66972, "epoch": 1594} {"train_loss": -5.998809814453125, "global_step": 66973, "epoch": 1594} {"train_loss": -5.870373725891113, "global_step": 66974, "epoch": 1594} {"train_loss": -5.967173099517822, "global_step": 66975, "epoch": 1594} {"train_loss": -5.834228992462158, "global_step": 66976, "epoch": 1594} {"train_loss": -5.970190525054932, "global_step": 66977, "epoch": 1594} {"train_loss": -6.083036422729492, "global_step": 66978, "epoch": 1594} {"train_loss": -5.904567241668701, "global_step": 66979, "epoch": 1594} {"train_loss": -5.999040126800537, "global_step": 66980, "epoch": 1594} {"train_loss": -5.996181964874268, "global_step": 66981, "epoch": 1594} {"train_loss": -5.8197712898254395, "global_step": 66982, "epoch": 1594} {"train_loss": -5.948711395263672, "global_step": 66983, "epoch": 1594} {"train_loss": -5.856679916381836, "global_step": 66984, "epoch": 1594} {"train_loss": -5.91765022277832, "global_step": 66985, "epoch": 1594} {"train_loss": -5.799684524536133, "global_step": 66986, "epoch": 1594} {"train_loss": -5.892364978790283, "global_step": 66987, "epoch": 1594} {"train_loss": -5.977218151092529, "global_step": 66988, "epoch": 1594} {"train_loss": -5.9596443970998125, "global_step": 66989, "epoch": 1594, "val_loss": 67450.9765625} {"train_loss": -5.970074653625488, "global_step": 66990, "epoch": 1595} {"train_loss": -6.09330415725708, "global_step": 66991, "epoch": 1595} {"train_loss": -5.943072319030762, "global_step": 66992, "epoch": 1595} {"train_loss": -5.887391090393066, "global_step": 66993, "epoch": 1595} {"train_loss": -5.959057807922363, "global_step": 66994, "epoch": 1595} {"train_loss": -5.9607439041137695, "global_step": 66995, "epoch": 1595} {"train_loss": -5.838346481323242, "global_step": 66996, "epoch": 1595} {"train_loss": -6.056300640106201, "global_step": 66997, "epoch": 1595} {"train_loss": -6.004712104797363, "global_step": 66998, "epoch": 1595} {"train_loss": -5.912712097167969, "global_step": 66999, "epoch": 1595} {"train_loss": -5.991692543029785, "global_step": 67000, "epoch": 1595} {"train_loss": -5.757229804992676, "global_step": 67001, "epoch": 1595} {"train_loss": -5.949113368988037, "global_step": 67002, "epoch": 1595} {"train_loss": -6.092503547668457, "global_step": 67003, "epoch": 1595} {"train_loss": -5.897623062133789, "global_step": 67004, "epoch": 1595} {"train_loss": -5.936367034912109, "global_step": 67005, "epoch": 1595} {"train_loss": -6.0395402908325195, "global_step": 67006, "epoch": 1595} {"train_loss": -6.046444892883301, "global_step": 67007, "epoch": 1595} {"train_loss": -6.06894063949585, "global_step": 67008, "epoch": 1595} {"train_loss": -5.968072414398193, "global_step": 67009, "epoch": 1595} {"train_loss": -5.908265113830566, "global_step": 67010, "epoch": 1595} {"train_loss": -5.931368827819824, "global_step": 67011, "epoch": 1595} {"train_loss": -5.967464923858643, "global_step": 67012, "epoch": 1595} {"train_loss": -6.017475128173828, "global_step": 67013, "epoch": 1595} {"train_loss": -5.982321739196777, "global_step": 67014, "epoch": 1595} {"train_loss": -6.063708305358887, "global_step": 67015, "epoch": 1595} {"train_loss": -5.903819561004639, "global_step": 67016, "epoch": 1595} {"train_loss": -6.089137077331543, "global_step": 67017, "epoch": 1595} {"train_loss": -6.100630760192871, "global_step": 67018, "epoch": 1595} {"train_loss": -6.030638694763184, "global_step": 67019, "epoch": 1595} {"train_loss": -5.969983100891113, "global_step": 67020, "epoch": 1595} {"train_loss": -5.934626579284668, "global_step": 67021, "epoch": 1595} {"train_loss": -6.007063388824463, "global_step": 67022, "epoch": 1595} {"train_loss": -6.086269378662109, "global_step": 67023, "epoch": 1595} {"train_loss": -5.970863342285156, "global_step": 67024, "epoch": 1595} {"train_loss": -5.987926006317139, "global_step": 67025, "epoch": 1595} {"train_loss": -6.072049140930176, "global_step": 67026, "epoch": 1595} {"train_loss": -6.061254501342773, "global_step": 67027, "epoch": 1595} {"train_loss": -5.815328598022461, "global_step": 67028, "epoch": 1595} {"train_loss": -5.941974639892578, "global_step": 67029, "epoch": 1595} {"train_loss": -6.152284622192383, "global_step": 67030, "epoch": 1595} {"train_loss": -5.983416159947713, "global_step": 67031, "epoch": 1595, "val_loss": 67187.0} {"train_loss": -6.004836559295654, "global_step": 67032, "epoch": 1596} {"train_loss": -5.909974098205566, "global_step": 67033, "epoch": 1596} {"train_loss": -6.006463527679443, "global_step": 67034, "epoch": 1596} {"train_loss": -5.845751762390137, "global_step": 67035, "epoch": 1596} {"train_loss": -5.974252223968506, "global_step": 67036, "epoch": 1596} {"train_loss": -6.015652179718018, "global_step": 67037, "epoch": 1596} {"train_loss": -5.9321513175964355, "global_step": 67038, "epoch": 1596} {"train_loss": -5.922183990478516, "global_step": 67039, "epoch": 1596} {"train_loss": -6.061249256134033, "global_step": 67040, "epoch": 1596} {"train_loss": -6.16795539855957, "global_step": 67041, "epoch": 1596} {"train_loss": -5.97416877746582, "global_step": 67042, "epoch": 1596} {"train_loss": -5.929566383361816, "global_step": 67043, "epoch": 1596} {"train_loss": -6.144364356994629, "global_step": 67044, "epoch": 1596} {"train_loss": -5.991428375244141, "global_step": 67045, "epoch": 1596} {"train_loss": -5.861429214477539, "global_step": 67046, "epoch": 1596} {"train_loss": -6.105989456176758, "global_step": 67047, "epoch": 1596} {"train_loss": -5.96702766418457, "global_step": 67048, "epoch": 1596} {"train_loss": -5.959048271179199, "global_step": 67049, "epoch": 1596} {"train_loss": -5.812931060791016, "global_step": 67050, "epoch": 1596} {"train_loss": -5.860061168670654, "global_step": 67051, "epoch": 1596} {"train_loss": -5.954787254333496, "global_step": 67052, "epoch": 1596} {"train_loss": -5.946944236755371, "global_step": 67053, "epoch": 1596} {"train_loss": -5.944679260253906, "global_step": 67054, "epoch": 1596} {"train_loss": -5.913037300109863, "global_step": 67055, "epoch": 1596} {"train_loss": -5.934402942657471, "global_step": 67056, "epoch": 1596} {"train_loss": -5.932912349700928, "global_step": 67057, "epoch": 1596} {"train_loss": -6.070021629333496, "global_step": 67058, "epoch": 1596} {"train_loss": -5.803118705749512, "global_step": 67059, "epoch": 1596} {"train_loss": -5.836207389831543, "global_step": 67060, "epoch": 1596} {"train_loss": -6.010583400726318, "global_step": 67061, "epoch": 1596} {"train_loss": -5.836903095245361, "global_step": 67062, "epoch": 1596} {"train_loss": -5.950859546661377, "global_step": 67063, "epoch": 1596} {"train_loss": -6.058046817779541, "global_step": 67064, "epoch": 1596} {"train_loss": -6.000156402587891, "global_step": 67065, "epoch": 1596} {"train_loss": -5.958060264587402, "global_step": 67066, "epoch": 1596} {"train_loss": -6.108377456665039, "global_step": 67067, "epoch": 1596} {"train_loss": -5.9677653312683105, "global_step": 67068, "epoch": 1596} {"train_loss": -6.028972625732422, "global_step": 67069, "epoch": 1596} {"train_loss": -5.9061079025268555, "global_step": 67070, "epoch": 1596} {"train_loss": -6.017361164093018, "global_step": 67071, "epoch": 1596} {"train_loss": -5.840636253356934, "global_step": 67072, "epoch": 1596} {"train_loss": -5.961313395273118, "global_step": 67073, "epoch": 1596, "val_loss": 67530.859375} {"train_loss": -5.987013816833496, "global_step": 67074, "epoch": 1597} {"train_loss": -5.914089202880859, "global_step": 67075, "epoch": 1597} {"train_loss": -5.812355995178223, "global_step": 67076, "epoch": 1597} {"train_loss": -6.056856155395508, "global_step": 67077, "epoch": 1597} {"train_loss": -5.9288859367370605, "global_step": 67078, "epoch": 1597} {"train_loss": -6.032236576080322, "global_step": 67079, "epoch": 1597} {"train_loss": -5.969633102416992, "global_step": 67080, "epoch": 1597} {"train_loss": -6.065775394439697, "global_step": 67081, "epoch": 1597} {"train_loss": -5.811161518096924, "global_step": 67082, "epoch": 1597} {"train_loss": -5.884346961975098, "global_step": 67083, "epoch": 1597} {"train_loss": -6.040734767913818, "global_step": 67084, "epoch": 1597} {"train_loss": -5.900686264038086, "global_step": 67085, "epoch": 1597} {"train_loss": -5.8655619621276855, "global_step": 67086, "epoch": 1597} {"train_loss": -5.9048614501953125, "global_step": 67087, "epoch": 1597} {"train_loss": -6.096062660217285, "global_step": 67088, "epoch": 1597} {"train_loss": -6.0155181884765625, "global_step": 67089, "epoch": 1597} {"train_loss": -6.051908016204834, "global_step": 67090, "epoch": 1597} {"train_loss": -5.98139762878418, "global_step": 67091, "epoch": 1597} {"train_loss": -6.02372407913208, "global_step": 67092, "epoch": 1597} {"train_loss": -6.039610385894775, "global_step": 67093, "epoch": 1597} {"train_loss": -6.074670314788818, "global_step": 67094, "epoch": 1597} {"train_loss": -6.017269134521484, "global_step": 67095, "epoch": 1597} {"train_loss": -6.0424699783325195, "global_step": 67096, "epoch": 1597} {"train_loss": -6.040251731872559, "global_step": 67097, "epoch": 1597} {"train_loss": -6.003477096557617, "global_step": 67098, "epoch": 1597} {"train_loss": -5.9986572265625, "global_step": 67099, "epoch": 1597} {"train_loss": -6.05342960357666, "global_step": 67100, "epoch": 1597} {"train_loss": -6.036449909210205, "global_step": 67101, "epoch": 1597} {"train_loss": -6.059816360473633, "global_step": 67102, "epoch": 1597} {"train_loss": -5.914303779602051, "global_step": 67103, "epoch": 1597} {"train_loss": -5.923425674438477, "global_step": 67104, "epoch": 1597} {"train_loss": -5.990788459777832, "global_step": 67105, "epoch": 1597} {"train_loss": -5.956645965576172, "global_step": 67106, "epoch": 1597} {"train_loss": -6.029952526092529, "global_step": 67107, "epoch": 1597} {"train_loss": -6.096617698669434, "global_step": 67108, "epoch": 1597} {"train_loss": -5.955105781555176, "global_step": 67109, "epoch": 1597} {"train_loss": -5.937363624572754, "global_step": 67110, "epoch": 1597} {"train_loss": -5.8710103034973145, "global_step": 67111, "epoch": 1597} {"train_loss": -5.901182174682617, "global_step": 67112, "epoch": 1597} {"train_loss": -5.97736930847168, "global_step": 67113, "epoch": 1597} {"train_loss": -5.864195823669434, "global_step": 67114, "epoch": 1597} {"train_loss": -5.978020043600173, "global_step": 67115, "epoch": 1597, "val_loss": 66930.03125} {"train_loss": -6.058932781219482, "global_step": 67116, "epoch": 1598} {"train_loss": -5.98484992980957, "global_step": 67117, "epoch": 1598} {"train_loss": -5.857189178466797, "global_step": 67118, "epoch": 1598} {"train_loss": -6.0938005447387695, "global_step": 67119, "epoch": 1598} {"train_loss": -5.950177192687988, "global_step": 67120, "epoch": 1598} {"train_loss": -5.944958686828613, "global_step": 67121, "epoch": 1598} {"train_loss": -5.947610855102539, "global_step": 67122, "epoch": 1598} {"train_loss": -5.916877746582031, "global_step": 67123, "epoch": 1598} {"train_loss": -5.944800853729248, "global_step": 67124, "epoch": 1598} {"train_loss": -6.041141510009766, "global_step": 67125, "epoch": 1598} {"train_loss": -5.976473808288574, "global_step": 67126, "epoch": 1598} {"train_loss": -5.886397361755371, "global_step": 67127, "epoch": 1598} {"train_loss": -5.954156875610352, "global_step": 67128, "epoch": 1598} {"train_loss": -5.972501754760742, "global_step": 67129, "epoch": 1598} {"train_loss": -5.77768611907959, "global_step": 67130, "epoch": 1598} {"train_loss": -5.983231544494629, "global_step": 67131, "epoch": 1598} {"train_loss": -6.027283668518066, "global_step": 67132, "epoch": 1598} {"train_loss": -6.060319900512695, "global_step": 67133, "epoch": 1598} {"train_loss": -6.1121954917907715, "global_step": 67134, "epoch": 1598} {"train_loss": -5.827107906341553, "global_step": 67135, "epoch": 1598} {"train_loss": -6.022963523864746, "global_step": 67136, "epoch": 1598} {"train_loss": -5.929437637329102, "global_step": 67137, "epoch": 1598} {"train_loss": -5.826709747314453, "global_step": 67138, "epoch": 1598} {"train_loss": -5.9149675369262695, "global_step": 67139, "epoch": 1598} {"train_loss": -6.117499351501465, "global_step": 67140, "epoch": 1598} {"train_loss": -5.98933744430542, "global_step": 67141, "epoch": 1598} {"train_loss": -6.0382890701293945, "global_step": 67142, "epoch": 1598} {"train_loss": -5.9393205642700195, "global_step": 67143, "epoch": 1598} {"train_loss": -5.940682411193848, "global_step": 67144, "epoch": 1598} {"train_loss": -5.908840656280518, "global_step": 67145, "epoch": 1598} {"train_loss": -5.993919849395752, "global_step": 67146, "epoch": 1598} {"train_loss": -5.942170143127441, "global_step": 67147, "epoch": 1598} {"train_loss": -5.878544807434082, "global_step": 67148, "epoch": 1598} {"train_loss": -5.969737529754639, "global_step": 67149, "epoch": 1598} {"train_loss": -6.013949394226074, "global_step": 67150, "epoch": 1598} {"train_loss": -5.894042015075684, "global_step": 67151, "epoch": 1598} {"train_loss": -5.9221954345703125, "global_step": 67152, "epoch": 1598} {"train_loss": -5.979639530181885, "global_step": 67153, "epoch": 1598} {"train_loss": -5.949462890625, "global_step": 67154, "epoch": 1598} {"train_loss": -5.922054290771484, "global_step": 67155, "epoch": 1598} {"train_loss": -5.993083953857422, "global_step": 67156, "epoch": 1598} {"train_loss": -5.958125750223796, "global_step": 67157, "epoch": 1598, "val_loss": 67369.3828125} {"train_loss": -6.0157012939453125, "global_step": 67158, "epoch": 1599} {"train_loss": -5.954458713531494, "global_step": 67159, "epoch": 1599} {"train_loss": -5.914539337158203, "global_step": 67160, "epoch": 1599} {"train_loss": -5.979457378387451, "global_step": 67161, "epoch": 1599} {"train_loss": -5.9659247398376465, "global_step": 67162, "epoch": 1599} {"train_loss": -5.846810340881348, "global_step": 67163, "epoch": 1599} {"train_loss": -5.964691162109375, "global_step": 67164, "epoch": 1599} {"train_loss": -5.8871870040893555, "global_step": 67165, "epoch": 1599} {"train_loss": -5.860751152038574, "global_step": 67166, "epoch": 1599} {"train_loss": -5.924558639526367, "global_step": 67167, "epoch": 1599} {"train_loss": -5.8639936447143555, "global_step": 67168, "epoch": 1599} {"train_loss": -6.022623538970947, "global_step": 67169, "epoch": 1599} {"train_loss": -6.050239086151123, "global_step": 67170, "epoch": 1599} {"train_loss": -5.909961700439453, "global_step": 67171, "epoch": 1599} {"train_loss": -6.027059555053711, "global_step": 67172, "epoch": 1599} {"train_loss": -5.930384635925293, "global_step": 67173, "epoch": 1599} {"train_loss": -6.070745468139648, "global_step": 67174, "epoch": 1599} {"train_loss": -5.988319396972656, "global_step": 67175, "epoch": 1599} {"train_loss": -5.938053131103516, "global_step": 67176, "epoch": 1599} {"train_loss": -5.938711166381836, "global_step": 67177, "epoch": 1599} {"train_loss": -6.057848930358887, "global_step": 67178, "epoch": 1599} {"train_loss": -6.075372695922852, "global_step": 67179, "epoch": 1599} {"train_loss": -5.880995273590088, "global_step": 67180, "epoch": 1599} {"train_loss": -6.063914775848389, "global_step": 67181, "epoch": 1599} {"train_loss": -6.0467634201049805, "global_step": 67182, "epoch": 1599} {"train_loss": -5.9377007484436035, "global_step": 67183, "epoch": 1599} {"train_loss": -5.823334693908691, "global_step": 67184, "epoch": 1599} {"train_loss": -6.049124717712402, "global_step": 67185, "epoch": 1599} {"train_loss": -6.070876121520996, "global_step": 67186, "epoch": 1599} {"train_loss": -5.897850036621094, "global_step": 67187, "epoch": 1599} {"train_loss": -6.0585832595825195, "global_step": 67188, "epoch": 1599} {"train_loss": -5.986967086791992, "global_step": 67189, "epoch": 1599} {"train_loss": -6.130496025085449, "global_step": 67190, "epoch": 1599} {"train_loss": -6.0598955154418945, "global_step": 67191, "epoch": 1599} {"train_loss": -5.8578877449035645, "global_step": 67192, "epoch": 1599} {"train_loss": -6.067846298217773, "global_step": 67193, "epoch": 1599} {"train_loss": -5.994481086730957, "global_step": 67194, "epoch": 1599} {"train_loss": -6.012088298797607, "global_step": 67195, "epoch": 1599} {"train_loss": -5.979302406311035, "global_step": 67196, "epoch": 1599} {"train_loss": -6.125508785247803, "global_step": 67197, "epoch": 1599} {"train_loss": -5.892158508300781, "global_step": 67198, "epoch": 1599} {"train_loss": -5.978558040800548, "global_step": 67199, "epoch": 1599, "val_loss": 67109.0078125} {"train_loss": -6.018902778625488, "global_step": 67200, "epoch": 1600} {"train_loss": -5.892638683319092, "global_step": 67201, "epoch": 1600} {"train_loss": -6.146276950836182, "global_step": 67202, "epoch": 1600} {"train_loss": -6.089787483215332, "global_step": 67203, "epoch": 1600} {"train_loss": -5.903779983520508, "global_step": 67204, "epoch": 1600} {"train_loss": -5.97763204574585, "global_step": 67205, "epoch": 1600} {"train_loss": -6.018477439880371, "global_step": 67206, "epoch": 1600} {"train_loss": -5.856507301330566, "global_step": 67207, "epoch": 1600} {"train_loss": -5.987151145935059, "global_step": 67208, "epoch": 1600} {"train_loss": -5.946590423583984, "global_step": 67209, "epoch": 1600} {"train_loss": -6.006318092346191, "global_step": 67210, "epoch": 1600} {"train_loss": -5.863340854644775, "global_step": 67211, "epoch": 1600} {"train_loss": -5.811962127685547, "global_step": 67212, "epoch": 1600} {"train_loss": -5.9608869552612305, "global_step": 67213, "epoch": 1600} {"train_loss": -5.894635200500488, "global_step": 67214, "epoch": 1600} {"train_loss": -5.89195442199707, "global_step": 67215, "epoch": 1600} {"train_loss": -5.965827941894531, "global_step": 67216, "epoch": 1600} {"train_loss": -5.878127098083496, "global_step": 67217, "epoch": 1600} {"train_loss": -5.939617156982422, "global_step": 67218, "epoch": 1600} {"train_loss": -5.927952766418457, "global_step": 67219, "epoch": 1600} {"train_loss": -5.970544815063477, "global_step": 67220, "epoch": 1600} {"train_loss": -5.949058532714844, "global_step": 67221, "epoch": 1600} {"train_loss": -5.927324295043945, "global_step": 67222, "epoch": 1600} {"train_loss": -5.879570960998535, "global_step": 67223, "epoch": 1600} {"train_loss": -5.981697082519531, "global_step": 67224, "epoch": 1600} {"train_loss": -6.015244483947754, "global_step": 67225, "epoch": 1600} {"train_loss": -5.916682243347168, "global_step": 67226, "epoch": 1600} {"train_loss": -6.080838203430176, "global_step": 67227, "epoch": 1600} {"train_loss": -5.8769211769104, "global_step": 67228, "epoch": 1600} {"train_loss": -5.962230682373047, "global_step": 67229, "epoch": 1600} {"train_loss": -6.060674667358398, "global_step": 67230, "epoch": 1600} {"train_loss": -6.0649309158325195, "global_step": 67231, "epoch": 1600} {"train_loss": -6.103224277496338, "global_step": 67232, "epoch": 1600} {"train_loss": -6.012935638427734, "global_step": 67233, "epoch": 1600} {"train_loss": -6.13330078125, "global_step": 67234, "epoch": 1600} {"train_loss": -5.975032329559326, "global_step": 67235, "epoch": 1600} {"train_loss": -5.923943519592285, "global_step": 67236, "epoch": 1600} {"train_loss": -6.1160888671875, "global_step": 67237, "epoch": 1600} {"train_loss": -5.952498435974121, "global_step": 67238, "epoch": 1600} {"train_loss": -6.029338836669922, "global_step": 67239, "epoch": 1600} {"train_loss": -6.040875434875488, "global_step": 67240, "epoch": 1600} {"train_loss": -5.9739920525323775, "global_step": 67241, "epoch": 1600, "train/sim_max_reward_0": 0.23963927111069644, "train/sim_max_reward_1": 0.4249938155340847, "train/sim_max_reward_2": 0.4296262807415613, "train/sim_max_reward_3": 0.92329730106201, "train/sim_max_reward_4": 0.9368461829958632, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.5324795285372579, "test/sim_max_reward_4400001": 0.8644778839122986, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.8241697521197993, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.37023433410534684, "test/sim_max_reward_4400006": 0.7417215887495321, "test/sim_max_reward_4400007": 0.04883990746862279, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.7734703513438963, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.07364577570463493, "test/sim_max_reward_4400012": 0.49545983789323234, "test/sim_max_reward_4400013": 0.8626837431214726, "test/sim_max_reward_4400014": 0.8804618705470759, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.9321047504290212, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.4671821928752055, "test/sim_max_reward_4400020": 0.5280266689798983, "test/sim_max_reward_4400021": 0.8118385754233121, "test/sim_max_reward_4400022": 0.9514037614510257, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.17928487075587846, "test/sim_max_reward_4400026": 0.9612878469593858, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.37291949661758744, "test/sim_max_reward_4400029": 0.616748002173011, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9401443492754697, "test/sim_max_reward_4400032": 0.5213790820928993, "test/sim_max_reward_4400033": 0.6486658938037965, "test/sim_max_reward_4400034": 0.9136688977720882, "test/sim_max_reward_4400035": 0.8143110867074592, "test/sim_max_reward_4400036": 0.31515192011997145, "test/sim_max_reward_4400037": 0.5812204045961719, "test/sim_max_reward_4400038": 0.1931476430284545, "test/sim_max_reward_4400039": 0.9084829675722779, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6959939239389321, "test/sim_max_reward_4400042": 0.8704783938005771, "test/sim_max_reward_4400043": 0.9967130825026845, "test/sim_max_reward_4400044": 0.18317038570853117, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8523621505381715, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8642821614295648, "train/mean_score": 0.5245646018010671, "test/mean_score": 0.530009823441704, "val_loss": 67154.421875} {"train_loss": -6.033815383911133, "global_step": 67242, "epoch": 1601} {"train_loss": -5.963082790374756, "global_step": 67243, "epoch": 1601} {"train_loss": -6.081979751586914, "global_step": 67244, "epoch": 1601} {"train_loss": -5.89820671081543, "global_step": 67245, "epoch": 1601} {"train_loss": -5.93709659576416, "global_step": 67246, "epoch": 1601} {"train_loss": -5.952808380126953, "global_step": 67247, "epoch": 1601} {"train_loss": -5.981558322906494, "global_step": 67248, "epoch": 1601} {"train_loss": -5.881819248199463, "global_step": 67249, "epoch": 1601} {"train_loss": -5.967139720916748, "global_step": 67250, "epoch": 1601} {"train_loss": -6.029690742492676, "global_step": 67251, "epoch": 1601} {"train_loss": -6.019233703613281, "global_step": 67252, "epoch": 1601} {"train_loss": -6.101591110229492, "global_step": 67253, "epoch": 1601} {"train_loss": -5.991589069366455, "global_step": 67254, "epoch": 1601} {"train_loss": -6.044606685638428, "global_step": 67255, "epoch": 1601} {"train_loss": -5.978104591369629, "global_step": 67256, "epoch": 1601} {"train_loss": -6.0530195236206055, "global_step": 67257, "epoch": 1601} {"train_loss": -5.945775985717773, "global_step": 67258, "epoch": 1601} {"train_loss": -5.973372459411621, "global_step": 67259, "epoch": 1601} {"train_loss": -6.009919166564941, "global_step": 67260, "epoch": 1601} {"train_loss": -5.991529941558838, "global_step": 67261, "epoch": 1601} {"train_loss": -5.9063849449157715, "global_step": 67262, "epoch": 1601} {"train_loss": -6.043015956878662, "global_step": 67263, "epoch": 1601} {"train_loss": -5.891447067260742, "global_step": 67264, "epoch": 1601} {"train_loss": -5.903121471405029, "global_step": 67265, "epoch": 1601} {"train_loss": -6.011223316192627, "global_step": 67266, "epoch": 1601} {"train_loss": -5.914828300476074, "global_step": 67267, "epoch": 1601} {"train_loss": -5.967104911804199, "global_step": 67268, "epoch": 1601} {"train_loss": -6.018549919128418, "global_step": 67269, "epoch": 1601} {"train_loss": -5.8786468505859375, "global_step": 67270, "epoch": 1601} {"train_loss": -5.887175559997559, "global_step": 67271, "epoch": 1601} {"train_loss": -5.981029510498047, "global_step": 67272, "epoch": 1601} {"train_loss": -5.993330478668213, "global_step": 67273, "epoch": 1601} {"train_loss": -6.025519847869873, "global_step": 67274, "epoch": 1601} {"train_loss": -5.846072196960449, "global_step": 67275, "epoch": 1601} {"train_loss": -5.913043975830078, "global_step": 67276, "epoch": 1601} {"train_loss": -6.06674861907959, "global_step": 67277, "epoch": 1601} {"train_loss": -5.78624153137207, "global_step": 67278, "epoch": 1601} {"train_loss": -5.923623085021973, "global_step": 67279, "epoch": 1601} {"train_loss": -5.813541412353516, "global_step": 67280, "epoch": 1601} {"train_loss": -5.782440185546875, "global_step": 67281, "epoch": 1601} {"train_loss": -6.001046180725098, "global_step": 67282, "epoch": 1601} {"train_loss": -5.959365685780843, "global_step": 67283, "epoch": 1601, "val_loss": 67469.46875} {"train_loss": -5.912118434906006, "global_step": 67284, "epoch": 1602} {"train_loss": -5.907237529754639, "global_step": 67285, "epoch": 1602} {"train_loss": -5.9394025802612305, "global_step": 67286, "epoch": 1602} {"train_loss": -6.031988143920898, "global_step": 67287, "epoch": 1602} {"train_loss": -5.862127304077148, "global_step": 67288, "epoch": 1602} {"train_loss": -5.926782608032227, "global_step": 67289, "epoch": 1602} {"train_loss": -5.97113037109375, "global_step": 67290, "epoch": 1602} {"train_loss": -5.882751941680908, "global_step": 67291, "epoch": 1602} {"train_loss": -5.816109657287598, "global_step": 67292, "epoch": 1602} {"train_loss": -5.89634895324707, "global_step": 67293, "epoch": 1602} {"train_loss": -5.941667556762695, "global_step": 67294, "epoch": 1602} {"train_loss": -5.865461349487305, "global_step": 67295, "epoch": 1602} {"train_loss": -5.863936424255371, "global_step": 67296, "epoch": 1602} {"train_loss": -5.905597686767578, "global_step": 67297, "epoch": 1602} {"train_loss": -6.001072406768799, "global_step": 67298, "epoch": 1602} {"train_loss": -5.876275062561035, "global_step": 67299, "epoch": 1602} {"train_loss": -5.943414688110352, "global_step": 67300, "epoch": 1602} {"train_loss": -6.003884315490723, "global_step": 67301, "epoch": 1602} {"train_loss": -6.051007270812988, "global_step": 67302, "epoch": 1602} {"train_loss": -5.980058670043945, "global_step": 67303, "epoch": 1602} {"train_loss": -5.912514686584473, "global_step": 67304, "epoch": 1602} {"train_loss": -5.930845260620117, "global_step": 67305, "epoch": 1602} {"train_loss": -5.925158500671387, "global_step": 67306, "epoch": 1602} {"train_loss": -5.920773506164551, "global_step": 67307, "epoch": 1602} {"train_loss": -5.962353229522705, "global_step": 67308, "epoch": 1602} {"train_loss": -5.931543350219727, "global_step": 67309, "epoch": 1602} {"train_loss": -5.9043073654174805, "global_step": 67310, "epoch": 1602} {"train_loss": -5.963247299194336, "global_step": 67311, "epoch": 1602} {"train_loss": -6.018244743347168, "global_step": 67312, "epoch": 1602} {"train_loss": -6.0459747314453125, "global_step": 67313, "epoch": 1602} {"train_loss": -6.048480987548828, "global_step": 67314, "epoch": 1602} {"train_loss": -6.176490783691406, "global_step": 67315, "epoch": 1602} {"train_loss": -6.096632480621338, "global_step": 67316, "epoch": 1602} {"train_loss": -5.932676792144775, "global_step": 67317, "epoch": 1602} {"train_loss": -6.049059867858887, "global_step": 67318, "epoch": 1602} {"train_loss": -6.04126501083374, "global_step": 67319, "epoch": 1602} {"train_loss": -5.829164505004883, "global_step": 67320, "epoch": 1602} {"train_loss": -6.100435256958008, "global_step": 67321, "epoch": 1602} {"train_loss": -6.039644241333008, "global_step": 67322, "epoch": 1602} {"train_loss": -5.941173553466797, "global_step": 67323, "epoch": 1602} {"train_loss": -6.039098739624023, "global_step": 67324, "epoch": 1602} {"train_loss": -5.962944507598877, "global_step": 67325, "epoch": 1602, "val_loss": 67361.6328125} {"train_loss": -5.904047966003418, "global_step": 67326, "epoch": 1603} {"train_loss": -5.93716287612915, "global_step": 67327, "epoch": 1603} {"train_loss": -5.969782829284668, "global_step": 67328, "epoch": 1603} {"train_loss": -6.123944282531738, "global_step": 67329, "epoch": 1603} {"train_loss": -5.969676494598389, "global_step": 67330, "epoch": 1603} {"train_loss": -5.965993881225586, "global_step": 67331, "epoch": 1603} {"train_loss": -5.886096000671387, "global_step": 67332, "epoch": 1603} {"train_loss": -5.8970866203308105, "global_step": 67333, "epoch": 1603} {"train_loss": -6.0056986808776855, "global_step": 67334, "epoch": 1603} {"train_loss": -6.115638256072998, "global_step": 67335, "epoch": 1603} {"train_loss": -6.045816421508789, "global_step": 67336, "epoch": 1603} {"train_loss": -6.04456901550293, "global_step": 67337, "epoch": 1603} {"train_loss": -5.991793155670166, "global_step": 67338, "epoch": 1603} {"train_loss": -6.026742935180664, "global_step": 67339, "epoch": 1603} {"train_loss": -6.048872947692871, "global_step": 67340, "epoch": 1603} {"train_loss": -5.932681083679199, "global_step": 67341, "epoch": 1603} {"train_loss": -5.829685211181641, "global_step": 67342, "epoch": 1603} {"train_loss": -6.018021583557129, "global_step": 67343, "epoch": 1603} {"train_loss": -6.047114372253418, "global_step": 67344, "epoch": 1603} {"train_loss": -6.122125625610352, "global_step": 67345, "epoch": 1603} {"train_loss": -5.988480091094971, "global_step": 67346, "epoch": 1603} {"train_loss": -6.0147247314453125, "global_step": 67347, "epoch": 1603} {"train_loss": -6.085155010223389, "global_step": 67348, "epoch": 1603} {"train_loss": -5.998902797698975, "global_step": 67349, "epoch": 1603} {"train_loss": -6.075206756591797, "global_step": 67350, "epoch": 1603} {"train_loss": -6.0221638679504395, "global_step": 67351, "epoch": 1603} {"train_loss": -5.976439952850342, "global_step": 67352, "epoch": 1603} {"train_loss": -6.082414150238037, "global_step": 67353, "epoch": 1603} {"train_loss": -5.870563507080078, "global_step": 67354, "epoch": 1603} {"train_loss": -6.030517578125, "global_step": 67355, "epoch": 1603} {"train_loss": -5.929471969604492, "global_step": 67356, "epoch": 1603} {"train_loss": -5.9561567306518555, "global_step": 67357, "epoch": 1603} {"train_loss": -6.01577091217041, "global_step": 67358, "epoch": 1603} {"train_loss": -5.936005592346191, "global_step": 67359, "epoch": 1603} {"train_loss": -6.048561096191406, "global_step": 67360, "epoch": 1603} {"train_loss": -5.934823036193848, "global_step": 67361, "epoch": 1603} {"train_loss": -5.962490081787109, "global_step": 67362, "epoch": 1603} {"train_loss": -5.995242595672607, "global_step": 67363, "epoch": 1603} {"train_loss": -6.022518157958984, "global_step": 67364, "epoch": 1603} {"train_loss": -6.015500068664551, "global_step": 67365, "epoch": 1603} {"train_loss": -5.954768657684326, "global_step": 67366, "epoch": 1603} {"train_loss": -5.9927545956202914, "global_step": 67367, "epoch": 1603, "val_loss": 67223.2890625} {"train_loss": -6.067108154296875, "global_step": 67368, "epoch": 1604} {"train_loss": -6.05123233795166, "global_step": 67369, "epoch": 1604} {"train_loss": -5.894495010375977, "global_step": 67370, "epoch": 1604} {"train_loss": -5.958061218261719, "global_step": 67371, "epoch": 1604} {"train_loss": -5.992468357086182, "global_step": 67372, "epoch": 1604} {"train_loss": -5.870512962341309, "global_step": 67373, "epoch": 1604} {"train_loss": -6.010006904602051, "global_step": 67374, "epoch": 1604} {"train_loss": -5.935979843139648, "global_step": 67375, "epoch": 1604} {"train_loss": -5.986129283905029, "global_step": 67376, "epoch": 1604} {"train_loss": -5.959487438201904, "global_step": 67377, "epoch": 1604} {"train_loss": -6.010158061981201, "global_step": 67378, "epoch": 1604} {"train_loss": -5.931748867034912, "global_step": 67379, "epoch": 1604} {"train_loss": -5.994835376739502, "global_step": 67380, "epoch": 1604} {"train_loss": -5.944950103759766, "global_step": 67381, "epoch": 1604} {"train_loss": -5.944769859313965, "global_step": 67382, "epoch": 1604} {"train_loss": -5.940968036651611, "global_step": 67383, "epoch": 1604} {"train_loss": -5.912508010864258, "global_step": 67384, "epoch": 1604} {"train_loss": -5.9261040687561035, "global_step": 67385, "epoch": 1604} {"train_loss": -5.989023208618164, "global_step": 67386, "epoch": 1604} {"train_loss": -5.936251640319824, "global_step": 67387, "epoch": 1604} {"train_loss": -6.0310468673706055, "global_step": 67388, "epoch": 1604} {"train_loss": -5.942970275878906, "global_step": 67389, "epoch": 1604} {"train_loss": -6.178513526916504, "global_step": 67390, "epoch": 1604} {"train_loss": -6.02996826171875, "global_step": 67391, "epoch": 1604} {"train_loss": -5.93565559387207, "global_step": 67392, "epoch": 1604} {"train_loss": -6.003049850463867, "global_step": 67393, "epoch": 1604} {"train_loss": -6.073758125305176, "global_step": 67394, "epoch": 1604} {"train_loss": -5.914932727813721, "global_step": 67395, "epoch": 1604} {"train_loss": -5.900430202484131, "global_step": 67396, "epoch": 1604} {"train_loss": -5.999967575073242, "global_step": 67397, "epoch": 1604} {"train_loss": -5.917215347290039, "global_step": 67398, "epoch": 1604} {"train_loss": -6.0167694091796875, "global_step": 67399, "epoch": 1604} {"train_loss": -5.990138530731201, "global_step": 67400, "epoch": 1604} {"train_loss": -5.8292083740234375, "global_step": 67401, "epoch": 1604} {"train_loss": -6.102672576904297, "global_step": 67402, "epoch": 1604} {"train_loss": -5.9967827796936035, "global_step": 67403, "epoch": 1604} {"train_loss": -6.013348579406738, "global_step": 67404, "epoch": 1604} {"train_loss": -6.085269927978516, "global_step": 67405, "epoch": 1604} {"train_loss": -5.948335647583008, "global_step": 67406, "epoch": 1604} {"train_loss": -6.072487831115723, "global_step": 67407, "epoch": 1604} {"train_loss": -6.059762477874756, "global_step": 67408, "epoch": 1604} {"train_loss": -5.979974451519194, "global_step": 67409, "epoch": 1604, "val_loss": 67150.6484375} {"train_loss": -5.912773609161377, "global_step": 67410, "epoch": 1605} {"train_loss": -6.061899185180664, "global_step": 67411, "epoch": 1605} {"train_loss": -5.971573352813721, "global_step": 67412, "epoch": 1605} {"train_loss": -5.978420257568359, "global_step": 67413, "epoch": 1605} {"train_loss": -5.945929527282715, "global_step": 67414, "epoch": 1605} {"train_loss": -6.012392997741699, "global_step": 67415, "epoch": 1605} {"train_loss": -5.946447372436523, "global_step": 67416, "epoch": 1605} {"train_loss": -5.9123663902282715, "global_step": 67417, "epoch": 1605} {"train_loss": -5.957146644592285, "global_step": 67418, "epoch": 1605} {"train_loss": -5.984922885894775, "global_step": 67419, "epoch": 1605} {"train_loss": -6.003360271453857, "global_step": 67420, "epoch": 1605} {"train_loss": -6.011392593383789, "global_step": 67421, "epoch": 1605} {"train_loss": -5.891501426696777, "global_step": 67422, "epoch": 1605} {"train_loss": -5.938103199005127, "global_step": 67423, "epoch": 1605} {"train_loss": -5.933023929595947, "global_step": 67424, "epoch": 1605} {"train_loss": -5.725647926330566, "global_step": 67425, "epoch": 1605} {"train_loss": -6.091710090637207, "global_step": 67426, "epoch": 1605} {"train_loss": -5.772434234619141, "global_step": 67427, "epoch": 1605} {"train_loss": -5.996505260467529, "global_step": 67428, "epoch": 1605} {"train_loss": -6.012610912322998, "global_step": 67429, "epoch": 1605} {"train_loss": -5.972867488861084, "global_step": 67430, "epoch": 1605} {"train_loss": -5.927626609802246, "global_step": 67431, "epoch": 1605} {"train_loss": -6.018387317657471, "global_step": 67432, "epoch": 1605} {"train_loss": -6.032697677612305, "global_step": 67433, "epoch": 1605} {"train_loss": -6.09512996673584, "global_step": 67434, "epoch": 1605} {"train_loss": -6.042751312255859, "global_step": 67435, "epoch": 1605} {"train_loss": -6.007353782653809, "global_step": 67436, "epoch": 1605} {"train_loss": -5.788129806518555, "global_step": 67437, "epoch": 1605} {"train_loss": -6.064847946166992, "global_step": 67438, "epoch": 1605} {"train_loss": -5.999077796936035, "global_step": 67439, "epoch": 1605} {"train_loss": -5.814236640930176, "global_step": 67440, "epoch": 1605} {"train_loss": -5.913218975067139, "global_step": 67441, "epoch": 1605} {"train_loss": -5.996377468109131, "global_step": 67442, "epoch": 1605} {"train_loss": -5.993432521820068, "global_step": 67443, "epoch": 1605} {"train_loss": -5.978490829467773, "global_step": 67444, "epoch": 1605} {"train_loss": -5.979964733123779, "global_step": 67445, "epoch": 1605} {"train_loss": -5.959445476531982, "global_step": 67446, "epoch": 1605} {"train_loss": -5.995597839355469, "global_step": 67447, "epoch": 1605} {"train_loss": -5.878851413726807, "global_step": 67448, "epoch": 1605} {"train_loss": -6.041140556335449, "global_step": 67449, "epoch": 1605} {"train_loss": -6.04232120513916, "global_step": 67450, "epoch": 1605} {"train_loss": -5.9668024608067105, "global_step": 67451, "epoch": 1605, "val_loss": 67204.3125} {"train_loss": -5.976657867431641, "global_step": 67452, "epoch": 1606} {"train_loss": -5.821897983551025, "global_step": 67453, "epoch": 1606} {"train_loss": -5.982119560241699, "global_step": 67454, "epoch": 1606} {"train_loss": -6.042165756225586, "global_step": 67455, "epoch": 1606} {"train_loss": -5.948038101196289, "global_step": 67456, "epoch": 1606} {"train_loss": -5.9569597244262695, "global_step": 67457, "epoch": 1606} {"train_loss": -6.029829025268555, "global_step": 67458, "epoch": 1606} {"train_loss": -6.055458068847656, "global_step": 67459, "epoch": 1606} {"train_loss": -5.934464454650879, "global_step": 67460, "epoch": 1606} {"train_loss": -6.010790824890137, "global_step": 67461, "epoch": 1606} {"train_loss": -5.89341926574707, "global_step": 67462, "epoch": 1606} {"train_loss": -6.084455966949463, "global_step": 67463, "epoch": 1606} {"train_loss": -5.892552375793457, "global_step": 67464, "epoch": 1606} {"train_loss": -5.9938859939575195, "global_step": 67465, "epoch": 1606} {"train_loss": -5.81251335144043, "global_step": 67466, "epoch": 1606} {"train_loss": -6.032218933105469, "global_step": 67467, "epoch": 1606} {"train_loss": -5.999691009521484, "global_step": 67468, "epoch": 1606} {"train_loss": -5.982080459594727, "global_step": 67469, "epoch": 1606} {"train_loss": -6.033390998840332, "global_step": 67470, "epoch": 1606} {"train_loss": -6.005221366882324, "global_step": 67471, "epoch": 1606} {"train_loss": -5.917682647705078, "global_step": 67472, "epoch": 1606} {"train_loss": -6.018692970275879, "global_step": 67473, "epoch": 1606} {"train_loss": -5.932904243469238, "global_step": 67474, "epoch": 1606} {"train_loss": -6.028785705566406, "global_step": 67475, "epoch": 1606} {"train_loss": -5.929349899291992, "global_step": 67476, "epoch": 1606} {"train_loss": -5.975043296813965, "global_step": 67477, "epoch": 1606} {"train_loss": -5.986604690551758, "global_step": 67478, "epoch": 1606} {"train_loss": -5.853092670440674, "global_step": 67479, "epoch": 1606} {"train_loss": -5.936470985412598, "global_step": 67480, "epoch": 1606} {"train_loss": -5.981828689575195, "global_step": 67481, "epoch": 1606} {"train_loss": -5.994123458862305, "global_step": 67482, "epoch": 1606} {"train_loss": -5.827809810638428, "global_step": 67483, "epoch": 1606} {"train_loss": -5.951521873474121, "global_step": 67484, "epoch": 1606} {"train_loss": -5.928874969482422, "global_step": 67485, "epoch": 1606} {"train_loss": -5.948033332824707, "global_step": 67486, "epoch": 1606} {"train_loss": -5.949045181274414, "global_step": 67487, "epoch": 1606} {"train_loss": -5.9243645668029785, "global_step": 67488, "epoch": 1606} {"train_loss": -6.000936985015869, "global_step": 67489, "epoch": 1606} {"train_loss": -6.046363353729248, "global_step": 67490, "epoch": 1606} {"train_loss": -5.857456207275391, "global_step": 67491, "epoch": 1606} {"train_loss": -5.8695173263549805, "global_step": 67492, "epoch": 1606} {"train_loss": -5.960131713322231, "global_step": 67493, "epoch": 1606, "val_loss": 67280.578125} {"train_loss": -5.913148880004883, "global_step": 67494, "epoch": 1607} {"train_loss": -5.902615547180176, "global_step": 67495, "epoch": 1607} {"train_loss": -5.9657368659973145, "global_step": 67496, "epoch": 1607} {"train_loss": -5.858678817749023, "global_step": 67497, "epoch": 1607} {"train_loss": -5.995697975158691, "global_step": 67498, "epoch": 1607} {"train_loss": -6.027193069458008, "global_step": 67499, "epoch": 1607} {"train_loss": -6.025364875793457, "global_step": 67500, "epoch": 1607} {"train_loss": -5.913081645965576, "global_step": 67501, "epoch": 1607} {"train_loss": -6.020450592041016, "global_step": 67502, "epoch": 1607} {"train_loss": -5.922610759735107, "global_step": 67503, "epoch": 1607} {"train_loss": -6.040932655334473, "global_step": 67504, "epoch": 1607} {"train_loss": -5.943906307220459, "global_step": 67505, "epoch": 1607} {"train_loss": -5.99345064163208, "global_step": 67506, "epoch": 1607} {"train_loss": -6.070242404937744, "global_step": 67507, "epoch": 1607} {"train_loss": -6.1589035987854, "global_step": 67508, "epoch": 1607} {"train_loss": -6.008678913116455, "global_step": 67509, "epoch": 1607} {"train_loss": -5.943269729614258, "global_step": 67510, "epoch": 1607} {"train_loss": -6.082881927490234, "global_step": 67511, "epoch": 1607} {"train_loss": -6.1179351806640625, "global_step": 67512, "epoch": 1607} {"train_loss": -6.002250671386719, "global_step": 67513, "epoch": 1607} {"train_loss": -5.978188991546631, "global_step": 67514, "epoch": 1607} {"train_loss": -5.975846290588379, "global_step": 67515, "epoch": 1607} {"train_loss": -5.933706283569336, "global_step": 67516, "epoch": 1607} {"train_loss": -5.839995384216309, "global_step": 67517, "epoch": 1607} {"train_loss": -5.980299949645996, "global_step": 67518, "epoch": 1607} {"train_loss": -5.968826770782471, "global_step": 67519, "epoch": 1607} {"train_loss": -6.00706148147583, "global_step": 67520, "epoch": 1607} {"train_loss": -5.943995952606201, "global_step": 67521, "epoch": 1607} {"train_loss": -5.975490570068359, "global_step": 67522, "epoch": 1607} {"train_loss": -5.957096099853516, "global_step": 67523, "epoch": 1607} {"train_loss": -5.970811367034912, "global_step": 67524, "epoch": 1607} {"train_loss": -6.013360977172852, "global_step": 67525, "epoch": 1607} {"train_loss": -5.868652820587158, "global_step": 67526, "epoch": 1607} {"train_loss": -6.0026164054870605, "global_step": 67527, "epoch": 1607} {"train_loss": -5.955563068389893, "global_step": 67528, "epoch": 1607} {"train_loss": -5.94939661026001, "global_step": 67529, "epoch": 1607} {"train_loss": -6.001163005828857, "global_step": 67530, "epoch": 1607} {"train_loss": -5.934250831604004, "global_step": 67531, "epoch": 1607} {"train_loss": -5.884621620178223, "global_step": 67532, "epoch": 1607} {"train_loss": -5.879295349121094, "global_step": 67533, "epoch": 1607} {"train_loss": -6.089264392852783, "global_step": 67534, "epoch": 1607} {"train_loss": -5.978537786574591, "global_step": 67535, "epoch": 1607, "val_loss": 67618.4375} {"train_loss": -5.863132476806641, "global_step": 67536, "epoch": 1608} {"train_loss": -5.830836772918701, "global_step": 67537, "epoch": 1608} {"train_loss": -5.885445594787598, "global_step": 67538, "epoch": 1608} {"train_loss": -6.043266773223877, "global_step": 67539, "epoch": 1608} {"train_loss": -5.922207355499268, "global_step": 67540, "epoch": 1608} {"train_loss": -5.971527099609375, "global_step": 67541, "epoch": 1608} {"train_loss": -5.868715763092041, "global_step": 67542, "epoch": 1608} {"train_loss": -6.148287773132324, "global_step": 67543, "epoch": 1608} {"train_loss": -5.9548187255859375, "global_step": 67544, "epoch": 1608} {"train_loss": -6.083884239196777, "global_step": 67545, "epoch": 1608} {"train_loss": -5.9239959716796875, "global_step": 67546, "epoch": 1608} {"train_loss": -5.873140335083008, "global_step": 67547, "epoch": 1608} {"train_loss": -5.941801071166992, "global_step": 67548, "epoch": 1608} {"train_loss": -6.048791885375977, "global_step": 67549, "epoch": 1608} {"train_loss": -5.813826560974121, "global_step": 67550, "epoch": 1608} {"train_loss": -5.941856384277344, "global_step": 67551, "epoch": 1608} {"train_loss": -6.085766315460205, "global_step": 67552, "epoch": 1608} {"train_loss": -5.96186637878418, "global_step": 67553, "epoch": 1608} {"train_loss": -5.998745918273926, "global_step": 67554, "epoch": 1608} {"train_loss": -6.009279727935791, "global_step": 67555, "epoch": 1608} {"train_loss": -5.968377113342285, "global_step": 67556, "epoch": 1608} {"train_loss": -5.962242603302002, "global_step": 67557, "epoch": 1608} {"train_loss": -6.0927958488464355, "global_step": 67558, "epoch": 1608} {"train_loss": -6.0400190353393555, "global_step": 67559, "epoch": 1608} {"train_loss": -5.982802867889404, "global_step": 67560, "epoch": 1608} {"train_loss": -5.89068078994751, "global_step": 67561, "epoch": 1608} {"train_loss": -6.001682281494141, "global_step": 67562, "epoch": 1608} {"train_loss": -5.887212753295898, "global_step": 67563, "epoch": 1608} {"train_loss": -5.9460906982421875, "global_step": 67564, "epoch": 1608} {"train_loss": -6.196184158325195, "global_step": 67565, "epoch": 1608} {"train_loss": -6.068265914916992, "global_step": 67566, "epoch": 1608} {"train_loss": -6.012264251708984, "global_step": 67567, "epoch": 1608} {"train_loss": -5.945742130279541, "global_step": 67568, "epoch": 1608} {"train_loss": -5.915853500366211, "global_step": 67569, "epoch": 1608} {"train_loss": -5.88817834854126, "global_step": 67570, "epoch": 1608} {"train_loss": -5.9907097816467285, "global_step": 67571, "epoch": 1608} {"train_loss": -5.834494590759277, "global_step": 67572, "epoch": 1608} {"train_loss": -5.930649757385254, "global_step": 67573, "epoch": 1608} {"train_loss": -5.971486568450928, "global_step": 67574, "epoch": 1608} {"train_loss": -5.851300239562988, "global_step": 67575, "epoch": 1608} {"train_loss": -5.960811614990234, "global_step": 67576, "epoch": 1608} {"train_loss": -5.961972951889038, "global_step": 67577, "epoch": 1608, "val_loss": 67370.9609375} {"train_loss": -5.890838623046875, "global_step": 67578, "epoch": 1609} {"train_loss": -5.97859525680542, "global_step": 67579, "epoch": 1609} {"train_loss": -5.935542106628418, "global_step": 67580, "epoch": 1609} {"train_loss": -5.8485941886901855, "global_step": 67581, "epoch": 1609} {"train_loss": -5.946378231048584, "global_step": 67582, "epoch": 1609} {"train_loss": -5.884383678436279, "global_step": 67583, "epoch": 1609} {"train_loss": -6.011124134063721, "global_step": 67584, "epoch": 1609} {"train_loss": -5.887308120727539, "global_step": 67585, "epoch": 1609} {"train_loss": -5.95648193359375, "global_step": 67586, "epoch": 1609} {"train_loss": -5.939255237579346, "global_step": 67587, "epoch": 1609} {"train_loss": -5.9117631912231445, "global_step": 67588, "epoch": 1609} {"train_loss": -6.074262619018555, "global_step": 67589, "epoch": 1609} {"train_loss": -6.009702682495117, "global_step": 67590, "epoch": 1609} {"train_loss": -5.938476085662842, "global_step": 67591, "epoch": 1609} {"train_loss": -6.000368595123291, "global_step": 67592, "epoch": 1609} {"train_loss": -6.01104736328125, "global_step": 67593, "epoch": 1609} {"train_loss": -6.107265472412109, "global_step": 67594, "epoch": 1609} {"train_loss": -5.983975410461426, "global_step": 67595, "epoch": 1609} {"train_loss": -5.828656196594238, "global_step": 67596, "epoch": 1609} {"train_loss": -6.066893577575684, "global_step": 67597, "epoch": 1609} {"train_loss": -5.947419166564941, "global_step": 67598, "epoch": 1609} {"train_loss": -5.903469085693359, "global_step": 67599, "epoch": 1609} {"train_loss": -5.919008255004883, "global_step": 67600, "epoch": 1609} {"train_loss": -5.863940238952637, "global_step": 67601, "epoch": 1609} {"train_loss": -5.921280384063721, "global_step": 67602, "epoch": 1609} {"train_loss": -6.017060279846191, "global_step": 67603, "epoch": 1609} {"train_loss": -5.8997578620910645, "global_step": 67604, "epoch": 1609} {"train_loss": -6.00291633605957, "global_step": 67605, "epoch": 1609} {"train_loss": -5.913732528686523, "global_step": 67606, "epoch": 1609} {"train_loss": -6.067441940307617, "global_step": 67607, "epoch": 1609} {"train_loss": -5.838379859924316, "global_step": 67608, "epoch": 1609} {"train_loss": -5.900001525878906, "global_step": 67609, "epoch": 1609} {"train_loss": -5.900815486907959, "global_step": 67610, "epoch": 1609} {"train_loss": -5.906312942504883, "global_step": 67611, "epoch": 1609} {"train_loss": -5.923250198364258, "global_step": 67612, "epoch": 1609} {"train_loss": -5.974046230316162, "global_step": 67613, "epoch": 1609} {"train_loss": -6.010525226593018, "global_step": 67614, "epoch": 1609} {"train_loss": -6.010610580444336, "global_step": 67615, "epoch": 1609} {"train_loss": -5.792931079864502, "global_step": 67616, "epoch": 1609} {"train_loss": -5.841945171356201, "global_step": 67617, "epoch": 1609} {"train_loss": -5.968197822570801, "global_step": 67618, "epoch": 1609} {"train_loss": -5.9462856111072355, "global_step": 67619, "epoch": 1609, "val_loss": 67141.7578125} {"train_loss": -5.959529876708984, "global_step": 67620, "epoch": 1610} {"train_loss": -5.935565948486328, "global_step": 67621, "epoch": 1610} {"train_loss": -6.0756635665893555, "global_step": 67622, "epoch": 1610} {"train_loss": -5.931520462036133, "global_step": 67623, "epoch": 1610} {"train_loss": -6.020388126373291, "global_step": 67624, "epoch": 1610} {"train_loss": -5.966707229614258, "global_step": 67625, "epoch": 1610} {"train_loss": -6.097968101501465, "global_step": 67626, "epoch": 1610} {"train_loss": -6.098598480224609, "global_step": 67627, "epoch": 1610} {"train_loss": -6.095940589904785, "global_step": 67628, "epoch": 1610} {"train_loss": -6.095783233642578, "global_step": 67629, "epoch": 1610} {"train_loss": -5.960060119628906, "global_step": 67630, "epoch": 1610} {"train_loss": -5.922061920166016, "global_step": 67631, "epoch": 1610} {"train_loss": -6.027957916259766, "global_step": 67632, "epoch": 1610} {"train_loss": -5.899441719055176, "global_step": 67633, "epoch": 1610} {"train_loss": -6.040897369384766, "global_step": 67634, "epoch": 1610} {"train_loss": -6.073092937469482, "global_step": 67635, "epoch": 1610} {"train_loss": -6.006345748901367, "global_step": 67636, "epoch": 1610} {"train_loss": -6.06454610824585, "global_step": 67637, "epoch": 1610} {"train_loss": -6.031640529632568, "global_step": 67638, "epoch": 1610} {"train_loss": -6.030632972717285, "global_step": 67639, "epoch": 1610} {"train_loss": -5.852776050567627, "global_step": 67640, "epoch": 1610} {"train_loss": -5.936015605926514, "global_step": 67641, "epoch": 1610} {"train_loss": -5.8944091796875, "global_step": 67642, "epoch": 1610} {"train_loss": -5.864522933959961, "global_step": 67643, "epoch": 1610} {"train_loss": -5.938534259796143, "global_step": 67644, "epoch": 1610} {"train_loss": -5.87860107421875, "global_step": 67645, "epoch": 1610} {"train_loss": -5.957914352416992, "global_step": 67646, "epoch": 1610} {"train_loss": -6.043244361877441, "global_step": 67647, "epoch": 1610} {"train_loss": -5.924284934997559, "global_step": 67648, "epoch": 1610} {"train_loss": -6.0242085456848145, "global_step": 67649, "epoch": 1610} {"train_loss": -5.914294242858887, "global_step": 67650, "epoch": 1610} {"train_loss": -6.000275135040283, "global_step": 67651, "epoch": 1610} {"train_loss": -5.871192932128906, "global_step": 67652, "epoch": 1610} {"train_loss": -5.943571090698242, "global_step": 67653, "epoch": 1610} {"train_loss": -5.953309059143066, "global_step": 67654, "epoch": 1610} {"train_loss": -5.76478385925293, "global_step": 67655, "epoch": 1610} {"train_loss": -6.029596328735352, "global_step": 67656, "epoch": 1610} {"train_loss": -5.924307823181152, "global_step": 67657, "epoch": 1610} {"train_loss": -5.932668685913086, "global_step": 67658, "epoch": 1610} {"train_loss": -5.939507484436035, "global_step": 67659, "epoch": 1610} {"train_loss": -5.961000919342041, "global_step": 67660, "epoch": 1610} {"train_loss": -5.974449237187703, "global_step": 67661, "epoch": 1610, "val_loss": 67044.984375} {"train_loss": -6.041874885559082, "global_step": 67662, "epoch": 1611} {"train_loss": -5.990272521972656, "global_step": 67663, "epoch": 1611} {"train_loss": -5.916532516479492, "global_step": 67664, "epoch": 1611} {"train_loss": -6.007880210876465, "global_step": 67665, "epoch": 1611} {"train_loss": -5.812767028808594, "global_step": 67666, "epoch": 1611} {"train_loss": -5.953680992126465, "global_step": 67667, "epoch": 1611} {"train_loss": -6.071361064910889, "global_step": 67668, "epoch": 1611} {"train_loss": -5.997591972351074, "global_step": 67669, "epoch": 1611} {"train_loss": -6.020652770996094, "global_step": 67670, "epoch": 1611} {"train_loss": -6.077601432800293, "global_step": 67671, "epoch": 1611} {"train_loss": -6.049825668334961, "global_step": 67672, "epoch": 1611} {"train_loss": -5.982522010803223, "global_step": 67673, "epoch": 1611} {"train_loss": -6.01002836227417, "global_step": 67674, "epoch": 1611} {"train_loss": -5.961010456085205, "global_step": 67675, "epoch": 1611} {"train_loss": -6.057602882385254, "global_step": 67676, "epoch": 1611} {"train_loss": -6.070062637329102, "global_step": 67677, "epoch": 1611} {"train_loss": -5.936095237731934, "global_step": 67678, "epoch": 1611} {"train_loss": -5.96442985534668, "global_step": 67679, "epoch": 1611} {"train_loss": -5.893418312072754, "global_step": 67680, "epoch": 1611} {"train_loss": -5.856623649597168, "global_step": 67681, "epoch": 1611} {"train_loss": -5.920101642608643, "global_step": 67682, "epoch": 1611} {"train_loss": -6.003900527954102, "global_step": 67683, "epoch": 1611} {"train_loss": -5.955907344818115, "global_step": 67684, "epoch": 1611} {"train_loss": -5.828708648681641, "global_step": 67685, "epoch": 1611} {"train_loss": -5.980465888977051, "global_step": 67686, "epoch": 1611} {"train_loss": -5.955258846282959, "global_step": 67687, "epoch": 1611} {"train_loss": -6.026092529296875, "global_step": 67688, "epoch": 1611} {"train_loss": -5.982375144958496, "global_step": 67689, "epoch": 1611} {"train_loss": -6.048728942871094, "global_step": 67690, "epoch": 1611} {"train_loss": -5.962522506713867, "global_step": 67691, "epoch": 1611} {"train_loss": -5.975421905517578, "global_step": 67692, "epoch": 1611} {"train_loss": -5.96268367767334, "global_step": 67693, "epoch": 1611} {"train_loss": -5.940410137176514, "global_step": 67694, "epoch": 1611} {"train_loss": -6.00484561920166, "global_step": 67695, "epoch": 1611} {"train_loss": -5.9153852462768555, "global_step": 67696, "epoch": 1611} {"train_loss": -6.021111965179443, "global_step": 67697, "epoch": 1611} {"train_loss": -6.087709426879883, "global_step": 67698, "epoch": 1611} {"train_loss": -5.993318557739258, "global_step": 67699, "epoch": 1611} {"train_loss": -5.942327499389648, "global_step": 67700, "epoch": 1611} {"train_loss": -6.0315070152282715, "global_step": 67701, "epoch": 1611} {"train_loss": -5.977110385894775, "global_step": 67702, "epoch": 1611} {"train_loss": -5.980723562694731, "global_step": 67703, "epoch": 1611, "val_loss": 67124.765625} {"train_loss": -5.92321252822876, "global_step": 67704, "epoch": 1612} {"train_loss": -5.9604902267456055, "global_step": 67705, "epoch": 1612} {"train_loss": -5.934112548828125, "global_step": 67706, "epoch": 1612} {"train_loss": -6.0285749435424805, "global_step": 67707, "epoch": 1612} {"train_loss": -5.944852828979492, "global_step": 67708, "epoch": 1612} {"train_loss": -5.916957378387451, "global_step": 67709, "epoch": 1612} {"train_loss": -5.970268726348877, "global_step": 67710, "epoch": 1612} {"train_loss": -5.92585563659668, "global_step": 67711, "epoch": 1612} {"train_loss": -6.008370876312256, "global_step": 67712, "epoch": 1612} {"train_loss": -5.923659801483154, "global_step": 67713, "epoch": 1612} {"train_loss": -6.09229040145874, "global_step": 67714, "epoch": 1612} {"train_loss": -5.934410572052002, "global_step": 67715, "epoch": 1612} {"train_loss": -5.968469142913818, "global_step": 67716, "epoch": 1612} {"train_loss": -6.075403213500977, "global_step": 67717, "epoch": 1612} {"train_loss": -5.8977885246276855, "global_step": 67718, "epoch": 1612} {"train_loss": -5.900738716125488, "global_step": 67719, "epoch": 1612} {"train_loss": -5.952743053436279, "global_step": 67720, "epoch": 1612} {"train_loss": -5.874686241149902, "global_step": 67721, "epoch": 1612} {"train_loss": -6.016056060791016, "global_step": 67722, "epoch": 1612} {"train_loss": -6.028285026550293, "global_step": 67723, "epoch": 1612} {"train_loss": -5.857657432556152, "global_step": 67724, "epoch": 1612} {"train_loss": -6.086087226867676, "global_step": 67725, "epoch": 1612} {"train_loss": -6.002191543579102, "global_step": 67726, "epoch": 1612} {"train_loss": -5.881489276885986, "global_step": 67727, "epoch": 1612} {"train_loss": -5.957835674285889, "global_step": 67728, "epoch": 1612} {"train_loss": -5.957657337188721, "global_step": 67729, "epoch": 1612} {"train_loss": -5.9756364822387695, "global_step": 67730, "epoch": 1612} {"train_loss": -6.00264310836792, "global_step": 67731, "epoch": 1612} {"train_loss": -5.9734110832214355, "global_step": 67732, "epoch": 1612} {"train_loss": -6.083090782165527, "global_step": 67733, "epoch": 1612} {"train_loss": -5.9752655029296875, "global_step": 67734, "epoch": 1612} {"train_loss": -5.887088775634766, "global_step": 67735, "epoch": 1612} {"train_loss": -5.966660976409912, "global_step": 67736, "epoch": 1612} {"train_loss": -5.929764747619629, "global_step": 67737, "epoch": 1612} {"train_loss": -5.95214319229126, "global_step": 67738, "epoch": 1612} {"train_loss": -6.0018439292907715, "global_step": 67739, "epoch": 1612} {"train_loss": -5.9778242111206055, "global_step": 67740, "epoch": 1612} {"train_loss": -6.110442161560059, "global_step": 67741, "epoch": 1612} {"train_loss": -5.970712661743164, "global_step": 67742, "epoch": 1612} {"train_loss": -6.028816223144531, "global_step": 67743, "epoch": 1612} {"train_loss": -6.029185771942139, "global_step": 67744, "epoch": 1612} {"train_loss": -5.971976950055077, "global_step": 67745, "epoch": 1612, "val_loss": 67160.3046875} {"train_loss": -6.070839881896973, "global_step": 67746, "epoch": 1613} {"train_loss": -6.032334804534912, "global_step": 67747, "epoch": 1613} {"train_loss": -6.052040100097656, "global_step": 67748, "epoch": 1613} {"train_loss": -5.794605731964111, "global_step": 67749, "epoch": 1613} {"train_loss": -5.99452018737793, "global_step": 67750, "epoch": 1613} {"train_loss": -6.025205612182617, "global_step": 67751, "epoch": 1613} {"train_loss": -6.050464630126953, "global_step": 67752, "epoch": 1613} {"train_loss": -5.959267616271973, "global_step": 67753, "epoch": 1613} {"train_loss": -6.099932670593262, "global_step": 67754, "epoch": 1613} {"train_loss": -5.976475238800049, "global_step": 67755, "epoch": 1613} {"train_loss": -5.953322410583496, "global_step": 67756, "epoch": 1613} {"train_loss": -6.039735794067383, "global_step": 67757, "epoch": 1613} {"train_loss": -6.144358158111572, "global_step": 67758, "epoch": 1613} {"train_loss": -6.0542311668396, "global_step": 67759, "epoch": 1613} {"train_loss": -6.0279693603515625, "global_step": 67760, "epoch": 1613} {"train_loss": -5.8516387939453125, "global_step": 67761, "epoch": 1613} {"train_loss": -6.060581207275391, "global_step": 67762, "epoch": 1613} {"train_loss": -5.954351902008057, "global_step": 67763, "epoch": 1613} {"train_loss": -5.9779486656188965, "global_step": 67764, "epoch": 1613} {"train_loss": -6.033967018127441, "global_step": 67765, "epoch": 1613} {"train_loss": -6.0583906173706055, "global_step": 67766, "epoch": 1613} {"train_loss": -5.958886623382568, "global_step": 67767, "epoch": 1613} {"train_loss": -6.005774021148682, "global_step": 67768, "epoch": 1613} {"train_loss": -6.100438117980957, "global_step": 67769, "epoch": 1613} {"train_loss": -5.973891735076904, "global_step": 67770, "epoch": 1613} {"train_loss": -6.0382232666015625, "global_step": 67771, "epoch": 1613} {"train_loss": -5.976800918579102, "global_step": 67772, "epoch": 1613} {"train_loss": -5.88981819152832, "global_step": 67773, "epoch": 1613} {"train_loss": -5.87579345703125, "global_step": 67774, "epoch": 1613} {"train_loss": -5.984419345855713, "global_step": 67775, "epoch": 1613} {"train_loss": -6.030285835266113, "global_step": 67776, "epoch": 1613} {"train_loss": -5.892181873321533, "global_step": 67777, "epoch": 1613} {"train_loss": -5.9833831787109375, "global_step": 67778, "epoch": 1613} {"train_loss": -5.849460601806641, "global_step": 67779, "epoch": 1613} {"train_loss": -5.865421295166016, "global_step": 67780, "epoch": 1613} {"train_loss": -6.127657890319824, "global_step": 67781, "epoch": 1613} {"train_loss": -5.9555206298828125, "global_step": 67782, "epoch": 1613} {"train_loss": -5.952879905700684, "global_step": 67783, "epoch": 1613} {"train_loss": -5.952047824859619, "global_step": 67784, "epoch": 1613} {"train_loss": -5.917068958282471, "global_step": 67785, "epoch": 1613} {"train_loss": -5.993951797485352, "global_step": 67786, "epoch": 1613} {"train_loss": -5.989440827142625, "global_step": 67787, "epoch": 1613, "val_loss": 67403.6640625} {"train_loss": -5.7889180183410645, "global_step": 67788, "epoch": 1614} {"train_loss": -6.045814037322998, "global_step": 67789, "epoch": 1614} {"train_loss": -5.96833610534668, "global_step": 67790, "epoch": 1614} {"train_loss": -5.950734615325928, "global_step": 67791, "epoch": 1614} {"train_loss": -6.005398750305176, "global_step": 67792, "epoch": 1614} {"train_loss": -5.879004955291748, "global_step": 67793, "epoch": 1614} {"train_loss": -5.988953113555908, "global_step": 67794, "epoch": 1614} {"train_loss": -5.845793724060059, "global_step": 67795, "epoch": 1614} {"train_loss": -5.968198299407959, "global_step": 67796, "epoch": 1614} {"train_loss": -6.130331516265869, "global_step": 67797, "epoch": 1614} {"train_loss": -5.9019775390625, "global_step": 67798, "epoch": 1614} {"train_loss": -6.031551361083984, "global_step": 67799, "epoch": 1614} {"train_loss": -5.997773170471191, "global_step": 67800, "epoch": 1614} {"train_loss": -5.965106964111328, "global_step": 67801, "epoch": 1614} {"train_loss": -5.932903289794922, "global_step": 67802, "epoch": 1614} {"train_loss": -5.887316703796387, "global_step": 67803, "epoch": 1614} {"train_loss": -5.833820343017578, "global_step": 67804, "epoch": 1614} {"train_loss": -5.994870185852051, "global_step": 67805, "epoch": 1614} {"train_loss": -5.96551513671875, "global_step": 67806, "epoch": 1614} {"train_loss": -6.011967658996582, "global_step": 67807, "epoch": 1614} {"train_loss": -6.092580795288086, "global_step": 67808, "epoch": 1614} {"train_loss": -5.965344429016113, "global_step": 67809, "epoch": 1614} {"train_loss": -5.95679235458374, "global_step": 67810, "epoch": 1614} {"train_loss": -5.936849594116211, "global_step": 67811, "epoch": 1614} {"train_loss": -6.007455825805664, "global_step": 67812, "epoch": 1614} {"train_loss": -5.912756443023682, "global_step": 67813, "epoch": 1614} {"train_loss": -5.860857963562012, "global_step": 67814, "epoch": 1614} {"train_loss": -5.953322410583496, "global_step": 67815, "epoch": 1614} {"train_loss": -6.084565162658691, "global_step": 67816, "epoch": 1614} {"train_loss": -6.047216415405273, "global_step": 67817, "epoch": 1614} {"train_loss": -6.011802673339844, "global_step": 67818, "epoch": 1614} {"train_loss": -5.993268013000488, "global_step": 67819, "epoch": 1614} {"train_loss": -5.993017673492432, "global_step": 67820, "epoch": 1614} {"train_loss": -5.914583206176758, "global_step": 67821, "epoch": 1614} {"train_loss": -5.9291276931762695, "global_step": 67822, "epoch": 1614} {"train_loss": -6.052458763122559, "global_step": 67823, "epoch": 1614} {"train_loss": -6.0103607177734375, "global_step": 67824, "epoch": 1614} {"train_loss": -5.89709997177124, "global_step": 67825, "epoch": 1614} {"train_loss": -5.997047424316406, "global_step": 67826, "epoch": 1614} {"train_loss": -6.04512357711792, "global_step": 67827, "epoch": 1614} {"train_loss": -6.007091522216797, "global_step": 67828, "epoch": 1614} {"train_loss": -5.969335204079037, "global_step": 67829, "epoch": 1614, "val_loss": 67495.4921875} {"train_loss": -6.046472072601318, "global_step": 67830, "epoch": 1615} {"train_loss": -5.9593915939331055, "global_step": 67831, "epoch": 1615} {"train_loss": -5.930521011352539, "global_step": 67832, "epoch": 1615} {"train_loss": -5.977129936218262, "global_step": 67833, "epoch": 1615} {"train_loss": -6.00028657913208, "global_step": 67834, "epoch": 1615} {"train_loss": -6.036808490753174, "global_step": 67835, "epoch": 1615} {"train_loss": -6.0159010887146, "global_step": 67836, "epoch": 1615} {"train_loss": -6.0086259841918945, "global_step": 67837, "epoch": 1615} {"train_loss": -5.9785075187683105, "global_step": 67838, "epoch": 1615} {"train_loss": -6.0268330574035645, "global_step": 67839, "epoch": 1615} {"train_loss": -6.043605804443359, "global_step": 67840, "epoch": 1615} {"train_loss": -6.072279453277588, "global_step": 67841, "epoch": 1615} {"train_loss": -5.954167366027832, "global_step": 67842, "epoch": 1615} {"train_loss": -6.0540361404418945, "global_step": 67843, "epoch": 1615} {"train_loss": -5.943366050720215, "global_step": 67844, "epoch": 1615} {"train_loss": -5.873804569244385, "global_step": 67845, "epoch": 1615} {"train_loss": -6.04302978515625, "global_step": 67846, "epoch": 1615} {"train_loss": -5.975327014923096, "global_step": 67847, "epoch": 1615} {"train_loss": -6.073248386383057, "global_step": 67848, "epoch": 1615} {"train_loss": -6.077017784118652, "global_step": 67849, "epoch": 1615} {"train_loss": -5.929882526397705, "global_step": 67850, "epoch": 1615} {"train_loss": -5.933579444885254, "global_step": 67851, "epoch": 1615} {"train_loss": -5.926142692565918, "global_step": 67852, "epoch": 1615} {"train_loss": -5.980633735656738, "global_step": 67853, "epoch": 1615} {"train_loss": -6.054996490478516, "global_step": 67854, "epoch": 1615} {"train_loss": -5.924351692199707, "global_step": 67855, "epoch": 1615} {"train_loss": -6.005928993225098, "global_step": 67856, "epoch": 1615} {"train_loss": -6.071224212646484, "global_step": 67857, "epoch": 1615} {"train_loss": -5.991109848022461, "global_step": 67858, "epoch": 1615} {"train_loss": -5.898371696472168, "global_step": 67859, "epoch": 1615} {"train_loss": -5.9499711990356445, "global_step": 67860, "epoch": 1615} {"train_loss": -5.9928388595581055, "global_step": 67861, "epoch": 1615} {"train_loss": -6.046823024749756, "global_step": 67862, "epoch": 1615} {"train_loss": -6.013480186462402, "global_step": 67863, "epoch": 1615} {"train_loss": -5.979117393493652, "global_step": 67864, "epoch": 1615} {"train_loss": -6.056404113769531, "global_step": 67865, "epoch": 1615} {"train_loss": -5.961282730102539, "global_step": 67866, "epoch": 1615} {"train_loss": -5.944303512573242, "global_step": 67867, "epoch": 1615} {"train_loss": -5.953538417816162, "global_step": 67868, "epoch": 1615} {"train_loss": -5.970856666564941, "global_step": 67869, "epoch": 1615} {"train_loss": -5.907688140869141, "global_step": 67870, "epoch": 1615} {"train_loss": -5.9894778955550425, "global_step": 67871, "epoch": 1615, "val_loss": 67369.109375} {"train_loss": -5.839698791503906, "global_step": 67872, "epoch": 1616} {"train_loss": -5.964224815368652, "global_step": 67873, "epoch": 1616} {"train_loss": -5.912344455718994, "global_step": 67874, "epoch": 1616} {"train_loss": -5.963799476623535, "global_step": 67875, "epoch": 1616} {"train_loss": -5.886987686157227, "global_step": 67876, "epoch": 1616} {"train_loss": -5.942683219909668, "global_step": 67877, "epoch": 1616} {"train_loss": -5.861335754394531, "global_step": 67878, "epoch": 1616} {"train_loss": -5.900439739227295, "global_step": 67879, "epoch": 1616} {"train_loss": -5.9086456298828125, "global_step": 67880, "epoch": 1616} {"train_loss": -5.987364292144775, "global_step": 67881, "epoch": 1616} {"train_loss": -6.023408889770508, "global_step": 67882, "epoch": 1616} {"train_loss": -5.971816062927246, "global_step": 67883, "epoch": 1616} {"train_loss": -5.95742654800415, "global_step": 67884, "epoch": 1616} {"train_loss": -5.9894232749938965, "global_step": 67885, "epoch": 1616} {"train_loss": -5.996106147766113, "global_step": 67886, "epoch": 1616} {"train_loss": -5.960836410522461, "global_step": 67887, "epoch": 1616} {"train_loss": -5.917734146118164, "global_step": 67888, "epoch": 1616} {"train_loss": -5.938129901885986, "global_step": 67889, "epoch": 1616} {"train_loss": -5.88324499130249, "global_step": 67890, "epoch": 1616} {"train_loss": -5.802508354187012, "global_step": 67891, "epoch": 1616} {"train_loss": -6.069847583770752, "global_step": 67892, "epoch": 1616} {"train_loss": -6.071676254272461, "global_step": 67893, "epoch": 1616} {"train_loss": -6.031081199645996, "global_step": 67894, "epoch": 1616} {"train_loss": -5.983217716217041, "global_step": 67895, "epoch": 1616} {"train_loss": -6.012055397033691, "global_step": 67896, "epoch": 1616} {"train_loss": -6.084283351898193, "global_step": 67897, "epoch": 1616} {"train_loss": -5.902437210083008, "global_step": 67898, "epoch": 1616} {"train_loss": -5.920551300048828, "global_step": 67899, "epoch": 1616} {"train_loss": -5.887800216674805, "global_step": 67900, "epoch": 1616} {"train_loss": -6.115616798400879, "global_step": 67901, "epoch": 1616} {"train_loss": -5.886384010314941, "global_step": 67902, "epoch": 1616} {"train_loss": -5.931130409240723, "global_step": 67903, "epoch": 1616} {"train_loss": -6.034415245056152, "global_step": 67904, "epoch": 1616} {"train_loss": -5.927162170410156, "global_step": 67905, "epoch": 1616} {"train_loss": -5.900574684143066, "global_step": 67906, "epoch": 1616} {"train_loss": -5.910046577453613, "global_step": 67907, "epoch": 1616} {"train_loss": -6.058509826660156, "global_step": 67908, "epoch": 1616} {"train_loss": -5.944127082824707, "global_step": 67909, "epoch": 1616} {"train_loss": -5.925948143005371, "global_step": 67910, "epoch": 1616} {"train_loss": -5.974206924438477, "global_step": 67911, "epoch": 1616} {"train_loss": -5.9378252029418945, "global_step": 67912, "epoch": 1616} {"train_loss": -5.952749229612804, "global_step": 67913, "epoch": 1616, "val_loss": 67147.8984375} {"train_loss": -6.0678911209106445, "global_step": 67914, "epoch": 1617} {"train_loss": -5.954286575317383, "global_step": 67915, "epoch": 1617} {"train_loss": -5.951177597045898, "global_step": 67916, "epoch": 1617} {"train_loss": -6.099517822265625, "global_step": 67917, "epoch": 1617} {"train_loss": -6.0752787590026855, "global_step": 67918, "epoch": 1617} {"train_loss": -5.996914863586426, "global_step": 67919, "epoch": 1617} {"train_loss": -6.026165962219238, "global_step": 67920, "epoch": 1617} {"train_loss": -5.9427900314331055, "global_step": 67921, "epoch": 1617} {"train_loss": -5.834139823913574, "global_step": 67922, "epoch": 1617} {"train_loss": -6.078444480895996, "global_step": 67923, "epoch": 1617} {"train_loss": -6.058680534362793, "global_step": 67924, "epoch": 1617} {"train_loss": -5.863255023956299, "global_step": 67925, "epoch": 1617} {"train_loss": -5.882838726043701, "global_step": 67926, "epoch": 1617} {"train_loss": -6.076057434082031, "global_step": 67927, "epoch": 1617} {"train_loss": -5.952216148376465, "global_step": 67928, "epoch": 1617} {"train_loss": -5.939167022705078, "global_step": 67929, "epoch": 1617} {"train_loss": -5.949102878570557, "global_step": 67930, "epoch": 1617} {"train_loss": -6.04789924621582, "global_step": 67931, "epoch": 1617} {"train_loss": -5.800106525421143, "global_step": 67932, "epoch": 1617} {"train_loss": -5.90897798538208, "global_step": 67933, "epoch": 1617} {"train_loss": -5.921424865722656, "global_step": 67934, "epoch": 1617} {"train_loss": -5.89826774597168, "global_step": 67935, "epoch": 1617} {"train_loss": -5.913114070892334, "global_step": 67936, "epoch": 1617} {"train_loss": -5.902565956115723, "global_step": 67937, "epoch": 1617} {"train_loss": -5.992686748504639, "global_step": 67938, "epoch": 1617} {"train_loss": -5.951510906219482, "global_step": 67939, "epoch": 1617} {"train_loss": -5.981361389160156, "global_step": 67940, "epoch": 1617} {"train_loss": -5.97560977935791, "global_step": 67941, "epoch": 1617} {"train_loss": -6.014132499694824, "global_step": 67942, "epoch": 1617} {"train_loss": -5.944014549255371, "global_step": 67943, "epoch": 1617} {"train_loss": -5.97915506362915, "global_step": 67944, "epoch": 1617} {"train_loss": -5.929171562194824, "global_step": 67945, "epoch": 1617} {"train_loss": -5.867555618286133, "global_step": 67946, "epoch": 1617} {"train_loss": -5.9338765144348145, "global_step": 67947, "epoch": 1617} {"train_loss": -5.961944103240967, "global_step": 67948, "epoch": 1617} {"train_loss": -6.008220672607422, "global_step": 67949, "epoch": 1617} {"train_loss": -6.051626205444336, "global_step": 67950, "epoch": 1617} {"train_loss": -5.971620082855225, "global_step": 67951, "epoch": 1617} {"train_loss": -6.085627555847168, "global_step": 67952, "epoch": 1617} {"train_loss": -5.9405975341796875, "global_step": 67953, "epoch": 1617} {"train_loss": -5.9240827560424805, "global_step": 67954, "epoch": 1617} {"train_loss": -5.968806789034889, "global_step": 67955, "epoch": 1617, "val_loss": 67400.9609375} {"train_loss": -5.9658660888671875, "global_step": 67956, "epoch": 1618} {"train_loss": -5.923834800720215, "global_step": 67957, "epoch": 1618} {"train_loss": -6.053389549255371, "global_step": 67958, "epoch": 1618} {"train_loss": -5.906540870666504, "global_step": 67959, "epoch": 1618} {"train_loss": -5.967817783355713, "global_step": 67960, "epoch": 1618} {"train_loss": -5.879152297973633, "global_step": 67961, "epoch": 1618} {"train_loss": -5.993997573852539, "global_step": 67962, "epoch": 1618} {"train_loss": -5.908900260925293, "global_step": 67963, "epoch": 1618} {"train_loss": -6.031377792358398, "global_step": 67964, "epoch": 1618} {"train_loss": -5.898508548736572, "global_step": 67965, "epoch": 1618} {"train_loss": -6.018204212188721, "global_step": 67966, "epoch": 1618} {"train_loss": -5.932727336883545, "global_step": 67967, "epoch": 1618} {"train_loss": -6.035815715789795, "global_step": 67968, "epoch": 1618} {"train_loss": -6.028939723968506, "global_step": 67969, "epoch": 1618} {"train_loss": -6.028650283813477, "global_step": 67970, "epoch": 1618} {"train_loss": -5.948532581329346, "global_step": 67971, "epoch": 1618} {"train_loss": -6.004093170166016, "global_step": 67972, "epoch": 1618} {"train_loss": -6.078824996948242, "global_step": 67973, "epoch": 1618} {"train_loss": -6.0327653884887695, "global_step": 67974, "epoch": 1618} {"train_loss": -6.0365190505981445, "global_step": 67975, "epoch": 1618} {"train_loss": -6.007336139678955, "global_step": 67976, "epoch": 1618} {"train_loss": -5.882643699645996, "global_step": 67977, "epoch": 1618} {"train_loss": -6.130619049072266, "global_step": 67978, "epoch": 1618} {"train_loss": -6.045217037200928, "global_step": 67979, "epoch": 1618} {"train_loss": -6.065374851226807, "global_step": 67980, "epoch": 1618} {"train_loss": -6.00374698638916, "global_step": 67981, "epoch": 1618} {"train_loss": -6.034822463989258, "global_step": 67982, "epoch": 1618} {"train_loss": -5.991687774658203, "global_step": 67983, "epoch": 1618} {"train_loss": -6.0529255867004395, "global_step": 67984, "epoch": 1618} {"train_loss": -6.060392379760742, "global_step": 67985, "epoch": 1618} {"train_loss": -5.973229885101318, "global_step": 67986, "epoch": 1618} {"train_loss": -5.920195579528809, "global_step": 67987, "epoch": 1618} {"train_loss": -6.0055155754089355, "global_step": 67988, "epoch": 1618} {"train_loss": -5.961259365081787, "global_step": 67989, "epoch": 1618} {"train_loss": -6.023155212402344, "global_step": 67990, "epoch": 1618} {"train_loss": -5.909742832183838, "global_step": 67991, "epoch": 1618} {"train_loss": -6.096961498260498, "global_step": 67992, "epoch": 1618} {"train_loss": -5.883220195770264, "global_step": 67993, "epoch": 1618} {"train_loss": -6.0187153816223145, "global_step": 67994, "epoch": 1618} {"train_loss": -5.79351806640625, "global_step": 67995, "epoch": 1618} {"train_loss": -6.015632629394531, "global_step": 67996, "epoch": 1618} {"train_loss": -5.989372344244094, "global_step": 67997, "epoch": 1618, "val_loss": 67180.921875} {"train_loss": -6.032589912414551, "global_step": 67998, "epoch": 1619} {"train_loss": -5.997531890869141, "global_step": 67999, "epoch": 1619} {"train_loss": -6.0029497146606445, "global_step": 68000, "epoch": 1619} {"train_loss": -5.930425643920898, "global_step": 68001, "epoch": 1619} {"train_loss": -6.020082473754883, "global_step": 68002, "epoch": 1619} {"train_loss": -5.851853370666504, "global_step": 68003, "epoch": 1619} {"train_loss": -5.896185398101807, "global_step": 68004, "epoch": 1619} {"train_loss": -6.039384841918945, "global_step": 68005, "epoch": 1619} {"train_loss": -5.923858642578125, "global_step": 68006, "epoch": 1619} {"train_loss": -6.048271179199219, "global_step": 68007, "epoch": 1619} {"train_loss": -6.025143623352051, "global_step": 68008, "epoch": 1619} {"train_loss": -5.933437347412109, "global_step": 68009, "epoch": 1619} {"train_loss": -5.903369903564453, "global_step": 68010, "epoch": 1619} {"train_loss": -5.812188148498535, "global_step": 68011, "epoch": 1619} {"train_loss": -6.168974876403809, "global_step": 68012, "epoch": 1619} {"train_loss": -5.995389461517334, "global_step": 68013, "epoch": 1619} {"train_loss": -6.033408164978027, "global_step": 68014, "epoch": 1619} {"train_loss": -5.927228927612305, "global_step": 68015, "epoch": 1619} {"train_loss": -5.892401218414307, "global_step": 68016, "epoch": 1619} {"train_loss": -5.943519592285156, "global_step": 68017, "epoch": 1619} {"train_loss": -5.965972900390625, "global_step": 68018, "epoch": 1619} {"train_loss": -6.022547721862793, "global_step": 68019, "epoch": 1619} {"train_loss": -6.025326251983643, "global_step": 68020, "epoch": 1619} {"train_loss": -5.980120658874512, "global_step": 68021, "epoch": 1619} {"train_loss": -5.907859802246094, "global_step": 68022, "epoch": 1619} {"train_loss": -5.864867210388184, "global_step": 68023, "epoch": 1619} {"train_loss": -6.1048126220703125, "global_step": 68024, "epoch": 1619} {"train_loss": -5.92894172668457, "global_step": 68025, "epoch": 1619} {"train_loss": -5.946555137634277, "global_step": 68026, "epoch": 1619} {"train_loss": -6.091716766357422, "global_step": 68027, "epoch": 1619} {"train_loss": -5.99570369720459, "global_step": 68028, "epoch": 1619} {"train_loss": -5.975849151611328, "global_step": 68029, "epoch": 1619} {"train_loss": -6.000653266906738, "global_step": 68030, "epoch": 1619} {"train_loss": -5.9816975593566895, "global_step": 68031, "epoch": 1619} {"train_loss": -5.972816467285156, "global_step": 68032, "epoch": 1619} {"train_loss": -5.784769535064697, "global_step": 68033, "epoch": 1619} {"train_loss": -6.0027241706848145, "global_step": 68034, "epoch": 1619} {"train_loss": -6.0107645988464355, "global_step": 68035, "epoch": 1619} {"train_loss": -6.093361854553223, "global_step": 68036, "epoch": 1619} {"train_loss": -5.862969875335693, "global_step": 68037, "epoch": 1619} {"train_loss": -6.022082328796387, "global_step": 68038, "epoch": 1619} {"train_loss": -5.973556688853672, "global_step": 68039, "epoch": 1619, "val_loss": 67292.59375} {"train_loss": -6.053659915924072, "global_step": 68040, "epoch": 1620} {"train_loss": -6.137143135070801, "global_step": 68041, "epoch": 1620} {"train_loss": -5.830102920532227, "global_step": 68042, "epoch": 1620} {"train_loss": -5.972174644470215, "global_step": 68043, "epoch": 1620} {"train_loss": -5.953014373779297, "global_step": 68044, "epoch": 1620} {"train_loss": -5.959928512573242, "global_step": 68045, "epoch": 1620} {"train_loss": -6.108046531677246, "global_step": 68046, "epoch": 1620} {"train_loss": -5.86379337310791, "global_step": 68047, "epoch": 1620} {"train_loss": -6.074663162231445, "global_step": 68048, "epoch": 1620} {"train_loss": -6.081043243408203, "global_step": 68049, "epoch": 1620} {"train_loss": -6.03692626953125, "global_step": 68050, "epoch": 1620} {"train_loss": -6.003868103027344, "global_step": 68051, "epoch": 1620} {"train_loss": -6.011618614196777, "global_step": 68052, "epoch": 1620} {"train_loss": -5.935935020446777, "global_step": 68053, "epoch": 1620} {"train_loss": -6.112610816955566, "global_step": 68054, "epoch": 1620} {"train_loss": -5.86238431930542, "global_step": 68055, "epoch": 1620} {"train_loss": -5.955448627471924, "global_step": 68056, "epoch": 1620} {"train_loss": -5.957455635070801, "global_step": 68057, "epoch": 1620} {"train_loss": -6.0078582763671875, "global_step": 68058, "epoch": 1620} {"train_loss": -5.944620132446289, "global_step": 68059, "epoch": 1620} {"train_loss": -5.953944206237793, "global_step": 68060, "epoch": 1620} {"train_loss": -5.921785831451416, "global_step": 68061, "epoch": 1620} {"train_loss": -5.981822967529297, "global_step": 68062, "epoch": 1620} {"train_loss": -5.9979047775268555, "global_step": 68063, "epoch": 1620} {"train_loss": -5.93949031829834, "global_step": 68064, "epoch": 1620} {"train_loss": -6.113415718078613, "global_step": 68065, "epoch": 1620} {"train_loss": -5.979063987731934, "global_step": 68066, "epoch": 1620} {"train_loss": -5.950057029724121, "global_step": 68067, "epoch": 1620} {"train_loss": -5.903947353363037, "global_step": 68068, "epoch": 1620} {"train_loss": -5.998669624328613, "global_step": 68069, "epoch": 1620} {"train_loss": -6.052840232849121, "global_step": 68070, "epoch": 1620} {"train_loss": -5.880219459533691, "global_step": 68071, "epoch": 1620} {"train_loss": -6.009696960449219, "global_step": 68072, "epoch": 1620} {"train_loss": -5.932282447814941, "global_step": 68073, "epoch": 1620} {"train_loss": -5.956885814666748, "global_step": 68074, "epoch": 1620} {"train_loss": -5.935853481292725, "global_step": 68075, "epoch": 1620} {"train_loss": -5.879027366638184, "global_step": 68076, "epoch": 1620} {"train_loss": -5.9523162841796875, "global_step": 68077, "epoch": 1620} {"train_loss": -5.897653102874756, "global_step": 68078, "epoch": 1620} {"train_loss": -5.943188667297363, "global_step": 68079, "epoch": 1620} {"train_loss": -5.917078971862793, "global_step": 68080, "epoch": 1620} {"train_loss": -5.971896989004953, "global_step": 68081, "epoch": 1620, "val_loss": 67310.265625} {"train_loss": -5.951918601989746, "global_step": 68082, "epoch": 1621} {"train_loss": -5.894632339477539, "global_step": 68083, "epoch": 1621} {"train_loss": -5.896594047546387, "global_step": 68084, "epoch": 1621} {"train_loss": -5.854362487792969, "global_step": 68085, "epoch": 1621} {"train_loss": -5.823983192443848, "global_step": 68086, "epoch": 1621} {"train_loss": -6.0202789306640625, "global_step": 68087, "epoch": 1621} {"train_loss": -5.846157073974609, "global_step": 68088, "epoch": 1621} {"train_loss": -6.074346542358398, "global_step": 68089, "epoch": 1621} {"train_loss": -5.871264457702637, "global_step": 68090, "epoch": 1621} {"train_loss": -5.9675750732421875, "global_step": 68091, "epoch": 1621} {"train_loss": -5.996813774108887, "global_step": 68092, "epoch": 1621} {"train_loss": -5.963962554931641, "global_step": 68093, "epoch": 1621} {"train_loss": -5.9986066818237305, "global_step": 68094, "epoch": 1621} {"train_loss": -6.180497169494629, "global_step": 68095, "epoch": 1621} {"train_loss": -6.069587707519531, "global_step": 68096, "epoch": 1621} {"train_loss": -5.942861557006836, "global_step": 68097, "epoch": 1621} {"train_loss": -6.057431221008301, "global_step": 68098, "epoch": 1621} {"train_loss": -5.894336700439453, "global_step": 68099, "epoch": 1621} {"train_loss": -6.111576080322266, "global_step": 68100, "epoch": 1621} {"train_loss": -6.120933532714844, "global_step": 68101, "epoch": 1621} {"train_loss": -5.970566272735596, "global_step": 68102, "epoch": 1621} {"train_loss": -6.141886234283447, "global_step": 68103, "epoch": 1621} {"train_loss": -5.9275383949279785, "global_step": 68104, "epoch": 1621} {"train_loss": -5.919680595397949, "global_step": 68105, "epoch": 1621} {"train_loss": -5.947226524353027, "global_step": 68106, "epoch": 1621} {"train_loss": -5.893313407897949, "global_step": 68107, "epoch": 1621} {"train_loss": -5.90863037109375, "global_step": 68108, "epoch": 1621} {"train_loss": -5.9513325691223145, "global_step": 68109, "epoch": 1621} {"train_loss": -5.8797197341918945, "global_step": 68110, "epoch": 1621} {"train_loss": -5.943920135498047, "global_step": 68111, "epoch": 1621} {"train_loss": -6.1146697998046875, "global_step": 68112, "epoch": 1621} {"train_loss": -6.05466365814209, "global_step": 68113, "epoch": 1621} {"train_loss": -5.982228755950928, "global_step": 68114, "epoch": 1621} {"train_loss": -6.109273910522461, "global_step": 68115, "epoch": 1621} {"train_loss": -6.029846668243408, "global_step": 68116, "epoch": 1621} {"train_loss": -5.969081878662109, "global_step": 68117, "epoch": 1621} {"train_loss": -5.980825424194336, "global_step": 68118, "epoch": 1621} {"train_loss": -5.941226005554199, "global_step": 68119, "epoch": 1621} {"train_loss": -5.981287002563477, "global_step": 68120, "epoch": 1621} {"train_loss": -5.8961687088012695, "global_step": 68121, "epoch": 1621} {"train_loss": -5.917568683624268, "global_step": 68122, "epoch": 1621} {"train_loss": -5.977273555029006, "global_step": 68123, "epoch": 1621, "val_loss": 67177.109375} {"train_loss": -6.01962947845459, "global_step": 68124, "epoch": 1622} {"train_loss": -6.056710243225098, "global_step": 68125, "epoch": 1622} {"train_loss": -6.120266914367676, "global_step": 68126, "epoch": 1622} {"train_loss": -5.936732292175293, "global_step": 68127, "epoch": 1622} {"train_loss": -6.001978397369385, "global_step": 68128, "epoch": 1622} {"train_loss": -5.999283790588379, "global_step": 68129, "epoch": 1622} {"train_loss": -5.925642490386963, "global_step": 68130, "epoch": 1622} {"train_loss": -6.114568710327148, "global_step": 68131, "epoch": 1622} {"train_loss": -5.986453533172607, "global_step": 68132, "epoch": 1622} {"train_loss": -6.075991630554199, "global_step": 68133, "epoch": 1622} {"train_loss": -6.1314873695373535, "global_step": 68134, "epoch": 1622} {"train_loss": -5.941157817840576, "global_step": 68135, "epoch": 1622} {"train_loss": -5.841689586639404, "global_step": 68136, "epoch": 1622} {"train_loss": -6.102447986602783, "global_step": 68137, "epoch": 1622} {"train_loss": -5.904918670654297, "global_step": 68138, "epoch": 1622} {"train_loss": -5.937853813171387, "global_step": 68139, "epoch": 1622} {"train_loss": -6.069070816040039, "global_step": 68140, "epoch": 1622} {"train_loss": -5.9769392013549805, "global_step": 68141, "epoch": 1622} {"train_loss": -5.921840190887451, "global_step": 68142, "epoch": 1622} {"train_loss": -6.02862024307251, "global_step": 68143, "epoch": 1622} {"train_loss": -6.064205169677734, "global_step": 68144, "epoch": 1622} {"train_loss": -5.903546333312988, "global_step": 68145, "epoch": 1622} {"train_loss": -5.956866264343262, "global_step": 68146, "epoch": 1622} {"train_loss": -6.009666919708252, "global_step": 68147, "epoch": 1622} {"train_loss": -5.913582801818848, "global_step": 68148, "epoch": 1622} {"train_loss": -5.8848772048950195, "global_step": 68149, "epoch": 1622} {"train_loss": -6.0373077392578125, "global_step": 68150, "epoch": 1622} {"train_loss": -6.072094440460205, "global_step": 68151, "epoch": 1622} {"train_loss": -6.019287109375, "global_step": 68152, "epoch": 1622} {"train_loss": -6.041295051574707, "global_step": 68153, "epoch": 1622} {"train_loss": -5.886406898498535, "global_step": 68154, "epoch": 1622} {"train_loss": -5.931846618652344, "global_step": 68155, "epoch": 1622} {"train_loss": -5.983666896820068, "global_step": 68156, "epoch": 1622} {"train_loss": -6.097893714904785, "global_step": 68157, "epoch": 1622} {"train_loss": -6.034585952758789, "global_step": 68158, "epoch": 1622} {"train_loss": -5.965871810913086, "global_step": 68159, "epoch": 1622} {"train_loss": -5.951503276824951, "global_step": 68160, "epoch": 1622} {"train_loss": -6.080422878265381, "global_step": 68161, "epoch": 1622} {"train_loss": -6.050686836242676, "global_step": 68162, "epoch": 1622} {"train_loss": -6.072375297546387, "global_step": 68163, "epoch": 1622} {"train_loss": -5.991059303283691, "global_step": 68164, "epoch": 1622} {"train_loss": -6.002781902040754, "global_step": 68165, "epoch": 1622, "val_loss": 66995.671875} {"train_loss": -6.006594657897949, "global_step": 68166, "epoch": 1623} {"train_loss": -6.03884744644165, "global_step": 68167, "epoch": 1623} {"train_loss": -6.006536483764648, "global_step": 68168, "epoch": 1623} {"train_loss": -5.9496612548828125, "global_step": 68169, "epoch": 1623} {"train_loss": -6.009101390838623, "global_step": 68170, "epoch": 1623} {"train_loss": -5.909634590148926, "global_step": 68171, "epoch": 1623} {"train_loss": -6.07038688659668, "global_step": 68172, "epoch": 1623} {"train_loss": -5.997657775878906, "global_step": 68173, "epoch": 1623} {"train_loss": -5.88322114944458, "global_step": 68174, "epoch": 1623} {"train_loss": -5.926618576049805, "global_step": 68175, "epoch": 1623} {"train_loss": -5.922637939453125, "global_step": 68176, "epoch": 1623} {"train_loss": -5.911832332611084, "global_step": 68177, "epoch": 1623} {"train_loss": -5.986865997314453, "global_step": 68178, "epoch": 1623} {"train_loss": -6.0009284019470215, "global_step": 68179, "epoch": 1623} {"train_loss": -5.93787145614624, "global_step": 68180, "epoch": 1623} {"train_loss": -5.962257385253906, "global_step": 68181, "epoch": 1623} {"train_loss": -6.036118984222412, "global_step": 68182, "epoch": 1623} {"train_loss": -6.025071144104004, "global_step": 68183, "epoch": 1623} {"train_loss": -5.994074821472168, "global_step": 68184, "epoch": 1623} {"train_loss": -6.043507099151611, "global_step": 68185, "epoch": 1623} {"train_loss": -5.867802619934082, "global_step": 68186, "epoch": 1623} {"train_loss": -5.986878395080566, "global_step": 68187, "epoch": 1623} {"train_loss": -6.0157270431518555, "global_step": 68188, "epoch": 1623} {"train_loss": -6.004827976226807, "global_step": 68189, "epoch": 1623} {"train_loss": -5.936424255371094, "global_step": 68190, "epoch": 1623} {"train_loss": -6.017360687255859, "global_step": 68191, "epoch": 1623} {"train_loss": -5.883670806884766, "global_step": 68192, "epoch": 1623} {"train_loss": -6.1049981117248535, "global_step": 68193, "epoch": 1623} {"train_loss": -5.956208229064941, "global_step": 68194, "epoch": 1623} {"train_loss": -5.925398826599121, "global_step": 68195, "epoch": 1623} {"train_loss": -5.931510925292969, "global_step": 68196, "epoch": 1623} {"train_loss": -5.919860363006592, "global_step": 68197, "epoch": 1623} {"train_loss": -5.970979690551758, "global_step": 68198, "epoch": 1623} {"train_loss": -6.000176429748535, "global_step": 68199, "epoch": 1623} {"train_loss": -5.9633684158325195, "global_step": 68200, "epoch": 1623} {"train_loss": -6.1413493156433105, "global_step": 68201, "epoch": 1623} {"train_loss": -5.798653602600098, "global_step": 68202, "epoch": 1623} {"train_loss": -5.887660980224609, "global_step": 68203, "epoch": 1623} {"train_loss": -5.983285903930664, "global_step": 68204, "epoch": 1623} {"train_loss": -5.912765979766846, "global_step": 68205, "epoch": 1623} {"train_loss": -6.041937828063965, "global_step": 68206, "epoch": 1623} {"train_loss": -5.9773119404202415, "global_step": 68207, "epoch": 1623, "val_loss": 67253.0625} {"train_loss": -6.0140275955200195, "global_step": 68208, "epoch": 1624} {"train_loss": -6.042518615722656, "global_step": 68209, "epoch": 1624} {"train_loss": -5.946948051452637, "global_step": 68210, "epoch": 1624} {"train_loss": -5.999029159545898, "global_step": 68211, "epoch": 1624} {"train_loss": -6.041150093078613, "global_step": 68212, "epoch": 1624} {"train_loss": -5.940806865692139, "global_step": 68213, "epoch": 1624} {"train_loss": -5.957254409790039, "global_step": 68214, "epoch": 1624} {"train_loss": -6.01300048828125, "global_step": 68215, "epoch": 1624} {"train_loss": -5.982685089111328, "global_step": 68216, "epoch": 1624} {"train_loss": -6.0759172439575195, "global_step": 68217, "epoch": 1624} {"train_loss": -6.058712005615234, "global_step": 68218, "epoch": 1624} {"train_loss": -6.010862827301025, "global_step": 68219, "epoch": 1624} {"train_loss": -5.997835159301758, "global_step": 68220, "epoch": 1624} {"train_loss": -6.131653785705566, "global_step": 68221, "epoch": 1624} {"train_loss": -5.9923295974731445, "global_step": 68222, "epoch": 1624} {"train_loss": -5.988522529602051, "global_step": 68223, "epoch": 1624} {"train_loss": -6.0361409187316895, "global_step": 68224, "epoch": 1624} {"train_loss": -5.853361129760742, "global_step": 68225, "epoch": 1624} {"train_loss": -5.950343132019043, "global_step": 68226, "epoch": 1624} {"train_loss": -6.027611255645752, "global_step": 68227, "epoch": 1624} {"train_loss": -5.9373650550842285, "global_step": 68228, "epoch": 1624} {"train_loss": -5.957947731018066, "global_step": 68229, "epoch": 1624} {"train_loss": -5.98200798034668, "global_step": 68230, "epoch": 1624} {"train_loss": -6.034383296966553, "global_step": 68231, "epoch": 1624} {"train_loss": -6.028041839599609, "global_step": 68232, "epoch": 1624} {"train_loss": -5.8220109939575195, "global_step": 68233, "epoch": 1624} {"train_loss": -5.951426982879639, "global_step": 68234, "epoch": 1624} {"train_loss": -6.035989761352539, "global_step": 68235, "epoch": 1624} {"train_loss": -6.062511920928955, "global_step": 68236, "epoch": 1624} {"train_loss": -5.967642307281494, "global_step": 68237, "epoch": 1624} {"train_loss": -5.982423305511475, "global_step": 68238, "epoch": 1624} {"train_loss": -5.998657703399658, "global_step": 68239, "epoch": 1624} {"train_loss": -5.921927452087402, "global_step": 68240, "epoch": 1624} {"train_loss": -5.979315757751465, "global_step": 68241, "epoch": 1624} {"train_loss": -5.8059401512146, "global_step": 68242, "epoch": 1624} {"train_loss": -6.064547061920166, "global_step": 68243, "epoch": 1624} {"train_loss": -5.856131553649902, "global_step": 68244, "epoch": 1624} {"train_loss": -6.041823387145996, "global_step": 68245, "epoch": 1624} {"train_loss": -6.015836715698242, "global_step": 68246, "epoch": 1624} {"train_loss": -5.87319278717041, "global_step": 68247, "epoch": 1624} {"train_loss": -5.917938232421875, "global_step": 68248, "epoch": 1624} {"train_loss": -5.981638215837025, "global_step": 68249, "epoch": 1624, "val_loss": 67337.25} {"train_loss": -5.982808589935303, "global_step": 68250, "epoch": 1625} {"train_loss": -5.956064224243164, "global_step": 68251, "epoch": 1625} {"train_loss": -6.002145767211914, "global_step": 68252, "epoch": 1625} {"train_loss": -6.0452117919921875, "global_step": 68253, "epoch": 1625} {"train_loss": -5.953365802764893, "global_step": 68254, "epoch": 1625} {"train_loss": -5.836684226989746, "global_step": 68255, "epoch": 1625} {"train_loss": -5.884613037109375, "global_step": 68256, "epoch": 1625} {"train_loss": -5.886537075042725, "global_step": 68257, "epoch": 1625} {"train_loss": -5.951180458068848, "global_step": 68258, "epoch": 1625} {"train_loss": -5.894092559814453, "global_step": 68259, "epoch": 1625} {"train_loss": -5.962653636932373, "global_step": 68260, "epoch": 1625} {"train_loss": -5.869748592376709, "global_step": 68261, "epoch": 1625} {"train_loss": -5.946931838989258, "global_step": 68262, "epoch": 1625} {"train_loss": -5.773695945739746, "global_step": 68263, "epoch": 1625} {"train_loss": -5.903075695037842, "global_step": 68264, "epoch": 1625} {"train_loss": -5.963581085205078, "global_step": 68265, "epoch": 1625} {"train_loss": -5.923248291015625, "global_step": 68266, "epoch": 1625} {"train_loss": -5.9124040603637695, "global_step": 68267, "epoch": 1625} {"train_loss": -6.026493072509766, "global_step": 68268, "epoch": 1625} {"train_loss": -6.017514228820801, "global_step": 68269, "epoch": 1625} {"train_loss": -5.98658561706543, "global_step": 68270, "epoch": 1625} {"train_loss": -5.8978047370910645, "global_step": 68271, "epoch": 1625} {"train_loss": -5.975022315979004, "global_step": 68272, "epoch": 1625} {"train_loss": -6.001960754394531, "global_step": 68273, "epoch": 1625} {"train_loss": -5.947901725769043, "global_step": 68274, "epoch": 1625} {"train_loss": -5.968307018280029, "global_step": 68275, "epoch": 1625} {"train_loss": -5.994709491729736, "global_step": 68276, "epoch": 1625} {"train_loss": -5.9634857177734375, "global_step": 68277, "epoch": 1625} {"train_loss": -5.926631450653076, "global_step": 68278, "epoch": 1625} {"train_loss": -5.950411796569824, "global_step": 68279, "epoch": 1625} {"train_loss": -5.892245292663574, "global_step": 68280, "epoch": 1625} {"train_loss": -6.00059700012207, "global_step": 68281, "epoch": 1625} {"train_loss": -5.950384616851807, "global_step": 68282, "epoch": 1625} {"train_loss": -6.017610549926758, "global_step": 68283, "epoch": 1625} {"train_loss": -6.023677825927734, "global_step": 68284, "epoch": 1625} {"train_loss": -5.898400783538818, "global_step": 68285, "epoch": 1625} {"train_loss": -5.9872918128967285, "global_step": 68286, "epoch": 1625} {"train_loss": -6.157040596008301, "global_step": 68287, "epoch": 1625} {"train_loss": -5.920937538146973, "global_step": 68288, "epoch": 1625} {"train_loss": -5.908730506896973, "global_step": 68289, "epoch": 1625} {"train_loss": -5.888358116149902, "global_step": 68290, "epoch": 1625} {"train_loss": -5.951721554710751, "global_step": 68291, "epoch": 1625, "val_loss": 67183.8671875} {"train_loss": -6.01161003112793, "global_step": 68292, "epoch": 1626} {"train_loss": -5.831484317779541, "global_step": 68293, "epoch": 1626} {"train_loss": -6.019224166870117, "global_step": 68294, "epoch": 1626} {"train_loss": -5.9407267570495605, "global_step": 68295, "epoch": 1626} {"train_loss": -5.926812648773193, "global_step": 68296, "epoch": 1626} {"train_loss": -5.924957275390625, "global_step": 68297, "epoch": 1626} {"train_loss": -5.825976848602295, "global_step": 68298, "epoch": 1626} {"train_loss": -5.971806526184082, "global_step": 68299, "epoch": 1626} {"train_loss": -5.887331008911133, "global_step": 68300, "epoch": 1626} {"train_loss": -5.943478584289551, "global_step": 68301, "epoch": 1626} {"train_loss": -5.880128383636475, "global_step": 68302, "epoch": 1626} {"train_loss": -5.872065544128418, "global_step": 68303, "epoch": 1626} {"train_loss": -6.030991554260254, "global_step": 68304, "epoch": 1626} {"train_loss": -5.76380729675293, "global_step": 68305, "epoch": 1626} {"train_loss": -6.0724897384643555, "global_step": 68306, "epoch": 1626} {"train_loss": -5.9530534744262695, "global_step": 68307, "epoch": 1626} {"train_loss": -5.87026309967041, "global_step": 68308, "epoch": 1626} {"train_loss": -5.9000678062438965, "global_step": 68309, "epoch": 1626} {"train_loss": -5.840738773345947, "global_step": 68310, "epoch": 1626} {"train_loss": -5.947991371154785, "global_step": 68311, "epoch": 1626} {"train_loss": -5.870506286621094, "global_step": 68312, "epoch": 1626} {"train_loss": -6.079660892486572, "global_step": 68313, "epoch": 1626} {"train_loss": -5.983509063720703, "global_step": 68314, "epoch": 1626} {"train_loss": -6.0580854415893555, "global_step": 68315, "epoch": 1626} {"train_loss": -5.967021942138672, "global_step": 68316, "epoch": 1626} {"train_loss": -6.111887454986572, "global_step": 68317, "epoch": 1626} {"train_loss": -5.961874008178711, "global_step": 68318, "epoch": 1626} {"train_loss": -5.924965858459473, "global_step": 68319, "epoch": 1626} {"train_loss": -5.892253875732422, "global_step": 68320, "epoch": 1626} {"train_loss": -5.879598140716553, "global_step": 68321, "epoch": 1626} {"train_loss": -5.96051549911499, "global_step": 68322, "epoch": 1626} {"train_loss": -6.015789031982422, "global_step": 68323, "epoch": 1626} {"train_loss": -6.03729248046875, "global_step": 68324, "epoch": 1626} {"train_loss": -6.125637054443359, "global_step": 68325, "epoch": 1626} {"train_loss": -5.911190986633301, "global_step": 68326, "epoch": 1626} {"train_loss": -5.960719108581543, "global_step": 68327, "epoch": 1626} {"train_loss": -6.103580951690674, "global_step": 68328, "epoch": 1626} {"train_loss": -5.9524078369140625, "global_step": 68329, "epoch": 1626} {"train_loss": -6.043639183044434, "global_step": 68330, "epoch": 1626} {"train_loss": -5.968295574188232, "global_step": 68331, "epoch": 1626} {"train_loss": -5.980185031890869, "global_step": 68332, "epoch": 1626} {"train_loss": -5.959454014187767, "global_step": 68333, "epoch": 1626, "val_loss": 67249.5625} {"train_loss": -6.043745040893555, "global_step": 68334, "epoch": 1627} {"train_loss": -5.879696846008301, "global_step": 68335, "epoch": 1627} {"train_loss": -6.0975847244262695, "global_step": 68336, "epoch": 1627} {"train_loss": -5.945012092590332, "global_step": 68337, "epoch": 1627} {"train_loss": -5.961746692657471, "global_step": 68338, "epoch": 1627} {"train_loss": -5.910438537597656, "global_step": 68339, "epoch": 1627} {"train_loss": -6.004064559936523, "global_step": 68340, "epoch": 1627} {"train_loss": -6.036486625671387, "global_step": 68341, "epoch": 1627} {"train_loss": -6.052337646484375, "global_step": 68342, "epoch": 1627} {"train_loss": -5.923765182495117, "global_step": 68343, "epoch": 1627} {"train_loss": -5.949301719665527, "global_step": 68344, "epoch": 1627} {"train_loss": -6.108201026916504, "global_step": 68345, "epoch": 1627} {"train_loss": -6.169926643371582, "global_step": 68346, "epoch": 1627} {"train_loss": -6.099441051483154, "global_step": 68347, "epoch": 1627} {"train_loss": -6.0874834060668945, "global_step": 68348, "epoch": 1627} {"train_loss": -5.887692451477051, "global_step": 68349, "epoch": 1627} {"train_loss": -6.083227157592773, "global_step": 68350, "epoch": 1627} {"train_loss": -5.960133075714111, "global_step": 68351, "epoch": 1627} {"train_loss": -6.023995399475098, "global_step": 68352, "epoch": 1627} {"train_loss": -5.963286876678467, "global_step": 68353, "epoch": 1627} {"train_loss": -5.952692985534668, "global_step": 68354, "epoch": 1627} {"train_loss": -5.938060760498047, "global_step": 68355, "epoch": 1627} {"train_loss": -5.944211006164551, "global_step": 68356, "epoch": 1627} {"train_loss": -5.989181041717529, "global_step": 68357, "epoch": 1627} {"train_loss": -5.920175552368164, "global_step": 68358, "epoch": 1627} {"train_loss": -6.009461402893066, "global_step": 68359, "epoch": 1627} {"train_loss": -6.029805660247803, "global_step": 68360, "epoch": 1627} {"train_loss": -5.993315696716309, "global_step": 68361, "epoch": 1627} {"train_loss": -6.007584095001221, "global_step": 68362, "epoch": 1627} {"train_loss": -5.935128211975098, "global_step": 68363, "epoch": 1627} {"train_loss": -5.97635555267334, "global_step": 68364, "epoch": 1627} {"train_loss": -5.983538627624512, "global_step": 68365, "epoch": 1627} {"train_loss": -5.909736156463623, "global_step": 68366, "epoch": 1627} {"train_loss": -5.982068061828613, "global_step": 68367, "epoch": 1627} {"train_loss": -5.980446815490723, "global_step": 68368, "epoch": 1627} {"train_loss": -5.953179359436035, "global_step": 68369, "epoch": 1627} {"train_loss": -5.988486289978027, "global_step": 68370, "epoch": 1627} {"train_loss": -5.966003894805908, "global_step": 68371, "epoch": 1627} {"train_loss": -5.858150482177734, "global_step": 68372, "epoch": 1627} {"train_loss": -6.021421432495117, "global_step": 68373, "epoch": 1627} {"train_loss": -5.948451995849609, "global_step": 68374, "epoch": 1627} {"train_loss": -5.988694724582491, "global_step": 68375, "epoch": 1627, "val_loss": 67374.5} {"train_loss": -5.97236442565918, "global_step": 68376, "epoch": 1628} {"train_loss": -5.955338954925537, "global_step": 68377, "epoch": 1628} {"train_loss": -6.039015769958496, "global_step": 68378, "epoch": 1628} {"train_loss": -6.0039262771606445, "global_step": 68379, "epoch": 1628} {"train_loss": -5.948606491088867, "global_step": 68380, "epoch": 1628} {"train_loss": -5.98060417175293, "global_step": 68381, "epoch": 1628} {"train_loss": -6.107978820800781, "global_step": 68382, "epoch": 1628} {"train_loss": -5.8598313331604, "global_step": 68383, "epoch": 1628} {"train_loss": -5.942540168762207, "global_step": 68384, "epoch": 1628} {"train_loss": -6.0904645919799805, "global_step": 68385, "epoch": 1628} {"train_loss": -5.912631034851074, "global_step": 68386, "epoch": 1628} {"train_loss": -5.987192153930664, "global_step": 68387, "epoch": 1628} {"train_loss": -5.958587646484375, "global_step": 68388, "epoch": 1628} {"train_loss": -5.96395206451416, "global_step": 68389, "epoch": 1628} {"train_loss": -5.8996734619140625, "global_step": 68390, "epoch": 1628} {"train_loss": -6.132442951202393, "global_step": 68391, "epoch": 1628} {"train_loss": -5.796769142150879, "global_step": 68392, "epoch": 1628} {"train_loss": -6.062335968017578, "global_step": 68393, "epoch": 1628} {"train_loss": -5.830907821655273, "global_step": 68394, "epoch": 1628} {"train_loss": -5.85739803314209, "global_step": 68395, "epoch": 1628} {"train_loss": -5.8365983963012695, "global_step": 68396, "epoch": 1628} {"train_loss": -5.962177276611328, "global_step": 68397, "epoch": 1628} {"train_loss": -5.860960006713867, "global_step": 68398, "epoch": 1628} {"train_loss": -5.921337127685547, "global_step": 68399, "epoch": 1628} {"train_loss": -6.009414196014404, "global_step": 68400, "epoch": 1628} {"train_loss": -5.925050735473633, "global_step": 68401, "epoch": 1628} {"train_loss": -5.995102882385254, "global_step": 68402, "epoch": 1628} {"train_loss": -6.030548572540283, "global_step": 68403, "epoch": 1628} {"train_loss": -6.055197715759277, "global_step": 68404, "epoch": 1628} {"train_loss": -6.067853927612305, "global_step": 68405, "epoch": 1628} {"train_loss": -6.027050018310547, "global_step": 68406, "epoch": 1628} {"train_loss": -5.949455261230469, "global_step": 68407, "epoch": 1628} {"train_loss": -6.079655647277832, "global_step": 68408, "epoch": 1628} {"train_loss": -5.821939468383789, "global_step": 68409, "epoch": 1628} {"train_loss": -6.067191123962402, "global_step": 68410, "epoch": 1628} {"train_loss": -5.961610317230225, "global_step": 68411, "epoch": 1628} {"train_loss": -6.094295024871826, "global_step": 68412, "epoch": 1628} {"train_loss": -6.05002498626709, "global_step": 68413, "epoch": 1628} {"train_loss": -6.02488899230957, "global_step": 68414, "epoch": 1628} {"train_loss": -6.028525352478027, "global_step": 68415, "epoch": 1628} {"train_loss": -6.140977382659912, "global_step": 68416, "epoch": 1628} {"train_loss": -5.982430753253755, "global_step": 68417, "epoch": 1628, "val_loss": 67189.71875} {"train_loss": -5.897832870483398, "global_step": 68418, "epoch": 1629} {"train_loss": -6.11536979675293, "global_step": 68419, "epoch": 1629} {"train_loss": -5.925302505493164, "global_step": 68420, "epoch": 1629} {"train_loss": -6.000432968139648, "global_step": 68421, "epoch": 1629} {"train_loss": -6.106980323791504, "global_step": 68422, "epoch": 1629} {"train_loss": -6.041769981384277, "global_step": 68423, "epoch": 1629} {"train_loss": -6.071227073669434, "global_step": 68424, "epoch": 1629} {"train_loss": -6.118289470672607, "global_step": 68425, "epoch": 1629} {"train_loss": -5.982192039489746, "global_step": 68426, "epoch": 1629} {"train_loss": -5.911038398742676, "global_step": 68427, "epoch": 1629} {"train_loss": -5.977273941040039, "global_step": 68428, "epoch": 1629} {"train_loss": -6.105154037475586, "global_step": 68429, "epoch": 1629} {"train_loss": -6.031808853149414, "global_step": 68430, "epoch": 1629} {"train_loss": -5.92983865737915, "global_step": 68431, "epoch": 1629} {"train_loss": -5.98494815826416, "global_step": 68432, "epoch": 1629} {"train_loss": -6.076424598693848, "global_step": 68433, "epoch": 1629} {"train_loss": -6.060558319091797, "global_step": 68434, "epoch": 1629} {"train_loss": -6.078579425811768, "global_step": 68435, "epoch": 1629} {"train_loss": -5.99394416809082, "global_step": 68436, "epoch": 1629} {"train_loss": -6.00178337097168, "global_step": 68437, "epoch": 1629} {"train_loss": -6.0627241134643555, "global_step": 68438, "epoch": 1629} {"train_loss": -5.976714611053467, "global_step": 68439, "epoch": 1629} {"train_loss": -6.00134801864624, "global_step": 68440, "epoch": 1629} {"train_loss": -6.060227394104004, "global_step": 68441, "epoch": 1629} {"train_loss": -5.8916521072387695, "global_step": 68442, "epoch": 1629} {"train_loss": -5.949498653411865, "global_step": 68443, "epoch": 1629} {"train_loss": -6.071758270263672, "global_step": 68444, "epoch": 1629} {"train_loss": -5.942605972290039, "global_step": 68445, "epoch": 1629} {"train_loss": -5.9955058097839355, "global_step": 68446, "epoch": 1629} {"train_loss": -6.069977760314941, "global_step": 68447, "epoch": 1629} {"train_loss": -6.0688676834106445, "global_step": 68448, "epoch": 1629} {"train_loss": -5.854503154754639, "global_step": 68449, "epoch": 1629} {"train_loss": -5.944108486175537, "global_step": 68450, "epoch": 1629} {"train_loss": -6.096575736999512, "global_step": 68451, "epoch": 1629} {"train_loss": -5.928418159484863, "global_step": 68452, "epoch": 1629} {"train_loss": -5.887653350830078, "global_step": 68453, "epoch": 1629} {"train_loss": -5.832533836364746, "global_step": 68454, "epoch": 1629} {"train_loss": -5.9413652420043945, "global_step": 68455, "epoch": 1629} {"train_loss": -5.955119609832764, "global_step": 68456, "epoch": 1629} {"train_loss": -5.894773960113525, "global_step": 68457, "epoch": 1629} {"train_loss": -6.044844627380371, "global_step": 68458, "epoch": 1629} {"train_loss": -5.994422469820295, "global_step": 68459, "epoch": 1629, "val_loss": 67415.625} {"train_loss": -6.085981369018555, "global_step": 68460, "epoch": 1630} {"train_loss": -6.002249717712402, "global_step": 68461, "epoch": 1630} {"train_loss": -5.885508060455322, "global_step": 68462, "epoch": 1630} {"train_loss": -5.914218902587891, "global_step": 68463, "epoch": 1630} {"train_loss": -5.844829559326172, "global_step": 68464, "epoch": 1630} {"train_loss": -5.963637828826904, "global_step": 68465, "epoch": 1630} {"train_loss": -5.868549823760986, "global_step": 68466, "epoch": 1630} {"train_loss": -5.942990779876709, "global_step": 68467, "epoch": 1630} {"train_loss": -6.099249839782715, "global_step": 68468, "epoch": 1630} {"train_loss": -5.911800384521484, "global_step": 68469, "epoch": 1630} {"train_loss": -5.968481063842773, "global_step": 68470, "epoch": 1630} {"train_loss": -6.00054931640625, "global_step": 68471, "epoch": 1630} {"train_loss": -6.131828784942627, "global_step": 68472, "epoch": 1630} {"train_loss": -5.870678901672363, "global_step": 68473, "epoch": 1630} {"train_loss": -6.043487071990967, "global_step": 68474, "epoch": 1630} {"train_loss": -5.9534735679626465, "global_step": 68475, "epoch": 1630} {"train_loss": -5.93898868560791, "global_step": 68476, "epoch": 1630} {"train_loss": -5.9210205078125, "global_step": 68477, "epoch": 1630} {"train_loss": -5.961429595947266, "global_step": 68478, "epoch": 1630} {"train_loss": -5.861584663391113, "global_step": 68479, "epoch": 1630} {"train_loss": -5.9200520515441895, "global_step": 68480, "epoch": 1630} {"train_loss": -5.876143455505371, "global_step": 68481, "epoch": 1630} {"train_loss": -5.9743733406066895, "global_step": 68482, "epoch": 1630} {"train_loss": -5.8169708251953125, "global_step": 68483, "epoch": 1630} {"train_loss": -6.0164289474487305, "global_step": 68484, "epoch": 1630} {"train_loss": -6.001806259155273, "global_step": 68485, "epoch": 1630} {"train_loss": -6.0131988525390625, "global_step": 68486, "epoch": 1630} {"train_loss": -5.9484992027282715, "global_step": 68487, "epoch": 1630} {"train_loss": -5.9629621505737305, "global_step": 68488, "epoch": 1630} {"train_loss": -5.993863582611084, "global_step": 68489, "epoch": 1630} {"train_loss": -5.928432941436768, "global_step": 68490, "epoch": 1630} {"train_loss": -6.070794105529785, "global_step": 68491, "epoch": 1630} {"train_loss": -6.006019592285156, "global_step": 68492, "epoch": 1630} {"train_loss": -5.886279582977295, "global_step": 68493, "epoch": 1630} {"train_loss": -6.02468204498291, "global_step": 68494, "epoch": 1630} {"train_loss": -5.917649745941162, "global_step": 68495, "epoch": 1630} {"train_loss": -6.051671504974365, "global_step": 68496, "epoch": 1630} {"train_loss": -6.12637996673584, "global_step": 68497, "epoch": 1630} {"train_loss": -5.929721832275391, "global_step": 68498, "epoch": 1630} {"train_loss": -5.950839996337891, "global_step": 68499, "epoch": 1630} {"train_loss": -6.038202285766602, "global_step": 68500, "epoch": 1630} {"train_loss": -5.965209836051578, "global_step": 68501, "epoch": 1630, "val_loss": 67278.1953125} {"train_loss": -5.9805121421813965, "global_step": 68502, "epoch": 1631} {"train_loss": -6.0197906494140625, "global_step": 68503, "epoch": 1631} {"train_loss": -5.957887649536133, "global_step": 68504, "epoch": 1631} {"train_loss": -5.956623554229736, "global_step": 68505, "epoch": 1631} {"train_loss": -6.045382499694824, "global_step": 68506, "epoch": 1631} {"train_loss": -6.001453399658203, "global_step": 68507, "epoch": 1631} {"train_loss": -5.9334869384765625, "global_step": 68508, "epoch": 1631} {"train_loss": -6.079243183135986, "global_step": 68509, "epoch": 1631} {"train_loss": -5.905651569366455, "global_step": 68510, "epoch": 1631} {"train_loss": -6.036179542541504, "global_step": 68511, "epoch": 1631} {"train_loss": -5.990189552307129, "global_step": 68512, "epoch": 1631} {"train_loss": -5.962398052215576, "global_step": 68513, "epoch": 1631} {"train_loss": -5.946198463439941, "global_step": 68514, "epoch": 1631} {"train_loss": -6.040513038635254, "global_step": 68515, "epoch": 1631} {"train_loss": -5.928933620452881, "global_step": 68516, "epoch": 1631} {"train_loss": -5.977986812591553, "global_step": 68517, "epoch": 1631} {"train_loss": -6.019296646118164, "global_step": 68518, "epoch": 1631} {"train_loss": -5.887320518493652, "global_step": 68519, "epoch": 1631} {"train_loss": -5.9455180168151855, "global_step": 68520, "epoch": 1631} {"train_loss": -5.8008270263671875, "global_step": 68521, "epoch": 1631} {"train_loss": -5.756303787231445, "global_step": 68522, "epoch": 1631} {"train_loss": -5.960964679718018, "global_step": 68523, "epoch": 1631} {"train_loss": -5.792425632476807, "global_step": 68524, "epoch": 1631} {"train_loss": -5.876399993896484, "global_step": 68525, "epoch": 1631} {"train_loss": -6.00108528137207, "global_step": 68526, "epoch": 1631} {"train_loss": -5.922109127044678, "global_step": 68527, "epoch": 1631} {"train_loss": -5.9022135734558105, "global_step": 68528, "epoch": 1631} {"train_loss": -5.922493934631348, "global_step": 68529, "epoch": 1631} {"train_loss": -5.887112617492676, "global_step": 68530, "epoch": 1631} {"train_loss": -5.838800430297852, "global_step": 68531, "epoch": 1631} {"train_loss": -5.969283103942871, "global_step": 68532, "epoch": 1631} {"train_loss": -5.9354071617126465, "global_step": 68533, "epoch": 1631} {"train_loss": -5.783397197723389, "global_step": 68534, "epoch": 1631} {"train_loss": -6.034908294677734, "global_step": 68535, "epoch": 1631} {"train_loss": -6.012624263763428, "global_step": 68536, "epoch": 1631} {"train_loss": -6.02913761138916, "global_step": 68537, "epoch": 1631} {"train_loss": -6.0759077072143555, "global_step": 68538, "epoch": 1631} {"train_loss": -6.010773658752441, "global_step": 68539, "epoch": 1631} {"train_loss": -6.052389144897461, "global_step": 68540, "epoch": 1631} {"train_loss": -5.938533782958984, "global_step": 68541, "epoch": 1631} {"train_loss": -6.015961647033691, "global_step": 68542, "epoch": 1631} {"train_loss": -5.9560850120726085, "global_step": 68543, "epoch": 1631, "val_loss": 67182.828125} {"train_loss": -6.010507583618164, "global_step": 68544, "epoch": 1632} {"train_loss": -5.929574966430664, "global_step": 68545, "epoch": 1632} {"train_loss": -5.940893650054932, "global_step": 68546, "epoch": 1632} {"train_loss": -5.969303131103516, "global_step": 68547, "epoch": 1632} {"train_loss": -6.073407173156738, "global_step": 68548, "epoch": 1632} {"train_loss": -5.917231559753418, "global_step": 68549, "epoch": 1632} {"train_loss": -6.017611503601074, "global_step": 68550, "epoch": 1632} {"train_loss": -5.883884429931641, "global_step": 68551, "epoch": 1632} {"train_loss": -5.961197376251221, "global_step": 68552, "epoch": 1632} {"train_loss": -5.959942817687988, "global_step": 68553, "epoch": 1632} {"train_loss": -6.049029350280762, "global_step": 68554, "epoch": 1632} {"train_loss": -5.916286945343018, "global_step": 68555, "epoch": 1632} {"train_loss": -5.9483184814453125, "global_step": 68556, "epoch": 1632} {"train_loss": -5.922721862792969, "global_step": 68557, "epoch": 1632} {"train_loss": -6.079509735107422, "global_step": 68558, "epoch": 1632} {"train_loss": -6.0190958976745605, "global_step": 68559, "epoch": 1632} {"train_loss": -5.943225860595703, "global_step": 68560, "epoch": 1632} {"train_loss": -6.149508476257324, "global_step": 68561, "epoch": 1632} {"train_loss": -6.01968240737915, "global_step": 68562, "epoch": 1632} {"train_loss": -5.928606986999512, "global_step": 68563, "epoch": 1632} {"train_loss": -5.991800308227539, "global_step": 68564, "epoch": 1632} {"train_loss": -5.975329875946045, "global_step": 68565, "epoch": 1632} {"train_loss": -6.034082889556885, "global_step": 68566, "epoch": 1632} {"train_loss": -6.079023361206055, "global_step": 68567, "epoch": 1632} {"train_loss": -5.935320854187012, "global_step": 68568, "epoch": 1632} {"train_loss": -6.077452659606934, "global_step": 68569, "epoch": 1632} {"train_loss": -5.911571502685547, "global_step": 68570, "epoch": 1632} {"train_loss": -6.079686164855957, "global_step": 68571, "epoch": 1632} {"train_loss": -5.961860179901123, "global_step": 68572, "epoch": 1632} {"train_loss": -6.017399787902832, "global_step": 68573, "epoch": 1632} {"train_loss": -6.006392478942871, "global_step": 68574, "epoch": 1632} {"train_loss": -6.0304460525512695, "global_step": 68575, "epoch": 1632} {"train_loss": -6.0755438804626465, "global_step": 68576, "epoch": 1632} {"train_loss": -6.011862754821777, "global_step": 68577, "epoch": 1632} {"train_loss": -5.982204914093018, "global_step": 68578, "epoch": 1632} {"train_loss": -5.99418306350708, "global_step": 68579, "epoch": 1632} {"train_loss": -5.938432216644287, "global_step": 68580, "epoch": 1632} {"train_loss": -6.0573320388793945, "global_step": 68581, "epoch": 1632} {"train_loss": -5.969905853271484, "global_step": 68582, "epoch": 1632} {"train_loss": -5.925129413604736, "global_step": 68583, "epoch": 1632} {"train_loss": -5.920290470123291, "global_step": 68584, "epoch": 1632} {"train_loss": -5.988255977630615, "global_step": 68585, "epoch": 1632, "val_loss": 67159.421875} {"train_loss": -5.947864532470703, "global_step": 68586, "epoch": 1633} {"train_loss": -6.050131320953369, "global_step": 68587, "epoch": 1633} {"train_loss": -6.01991081237793, "global_step": 68588, "epoch": 1633} {"train_loss": -5.919500350952148, "global_step": 68589, "epoch": 1633} {"train_loss": -5.948884010314941, "global_step": 68590, "epoch": 1633} {"train_loss": -6.015476703643799, "global_step": 68591, "epoch": 1633} {"train_loss": -6.047515392303467, "global_step": 68592, "epoch": 1633} {"train_loss": -6.003164291381836, "global_step": 68593, "epoch": 1633} {"train_loss": -5.9822540283203125, "global_step": 68594, "epoch": 1633} {"train_loss": -6.0626397132873535, "global_step": 68595, "epoch": 1633} {"train_loss": -6.038421630859375, "global_step": 68596, "epoch": 1633} {"train_loss": -5.950957298278809, "global_step": 68597, "epoch": 1633} {"train_loss": -5.967732906341553, "global_step": 68598, "epoch": 1633} {"train_loss": -6.14544677734375, "global_step": 68599, "epoch": 1633} {"train_loss": -6.105048656463623, "global_step": 68600, "epoch": 1633} {"train_loss": -6.0012898445129395, "global_step": 68601, "epoch": 1633} {"train_loss": -6.075549602508545, "global_step": 68602, "epoch": 1633} {"train_loss": -6.0868449211120605, "global_step": 68603, "epoch": 1633} {"train_loss": -6.037124156951904, "global_step": 68604, "epoch": 1633} {"train_loss": -6.024121284484863, "global_step": 68605, "epoch": 1633} {"train_loss": -5.900315761566162, "global_step": 68606, "epoch": 1633} {"train_loss": -5.930373191833496, "global_step": 68607, "epoch": 1633} {"train_loss": -5.952078342437744, "global_step": 68608, "epoch": 1633} {"train_loss": -5.985593795776367, "global_step": 68609, "epoch": 1633} {"train_loss": -6.059398174285889, "global_step": 68610, "epoch": 1633} {"train_loss": -5.887864112854004, "global_step": 68611, "epoch": 1633} {"train_loss": -5.971286773681641, "global_step": 68612, "epoch": 1633} {"train_loss": -6.082019329071045, "global_step": 68613, "epoch": 1633} {"train_loss": -6.059052467346191, "global_step": 68614, "epoch": 1633} {"train_loss": -6.075170516967773, "global_step": 68615, "epoch": 1633} {"train_loss": -6.057267189025879, "global_step": 68616, "epoch": 1633} {"train_loss": -6.047672271728516, "global_step": 68617, "epoch": 1633} {"train_loss": -6.040199279785156, "global_step": 68618, "epoch": 1633} {"train_loss": -5.902431964874268, "global_step": 68619, "epoch": 1633} {"train_loss": -5.985903263092041, "global_step": 68620, "epoch": 1633} {"train_loss": -6.099147796630859, "global_step": 68621, "epoch": 1633} {"train_loss": -5.94517707824707, "global_step": 68622, "epoch": 1633} {"train_loss": -6.0999836921691895, "global_step": 68623, "epoch": 1633} {"train_loss": -6.014358997344971, "global_step": 68624, "epoch": 1633} {"train_loss": -6.163973808288574, "global_step": 68625, "epoch": 1633} {"train_loss": -6.02706241607666, "global_step": 68626, "epoch": 1633} {"train_loss": -6.015171051025391, "global_step": 68627, "epoch": 1633, "val_loss": 67048.828125} {"train_loss": -6.151822090148926, "global_step": 68628, "epoch": 1634} {"train_loss": -5.957845211029053, "global_step": 68629, "epoch": 1634} {"train_loss": -6.0507073402404785, "global_step": 68630, "epoch": 1634} {"train_loss": -6.00482702255249, "global_step": 68631, "epoch": 1634} {"train_loss": -6.079888820648193, "global_step": 68632, "epoch": 1634} {"train_loss": -6.055347442626953, "global_step": 68633, "epoch": 1634} {"train_loss": -5.939932346343994, "global_step": 68634, "epoch": 1634} {"train_loss": -6.013576030731201, "global_step": 68635, "epoch": 1634} {"train_loss": -6.001446723937988, "global_step": 68636, "epoch": 1634} {"train_loss": -6.021610260009766, "global_step": 68637, "epoch": 1634} {"train_loss": -6.075536727905273, "global_step": 68638, "epoch": 1634} {"train_loss": -5.942366600036621, "global_step": 68639, "epoch": 1634} {"train_loss": -5.932735443115234, "global_step": 68640, "epoch": 1634} {"train_loss": -5.925099849700928, "global_step": 68641, "epoch": 1634} {"train_loss": -6.04804801940918, "global_step": 68642, "epoch": 1634} {"train_loss": -6.052221298217773, "global_step": 68643, "epoch": 1634} {"train_loss": -5.993696212768555, "global_step": 68644, "epoch": 1634} {"train_loss": -6.077223300933838, "global_step": 68645, "epoch": 1634} {"train_loss": -6.084616661071777, "global_step": 68646, "epoch": 1634} {"train_loss": -6.014270782470703, "global_step": 68647, "epoch": 1634} {"train_loss": -5.974041938781738, "global_step": 68648, "epoch": 1634} {"train_loss": -5.991024494171143, "global_step": 68649, "epoch": 1634} {"train_loss": -6.040646553039551, "global_step": 68650, "epoch": 1634} {"train_loss": -6.043305397033691, "global_step": 68651, "epoch": 1634} {"train_loss": -5.89677619934082, "global_step": 68652, "epoch": 1634} {"train_loss": -6.052523612976074, "global_step": 68653, "epoch": 1634} {"train_loss": -5.997441291809082, "global_step": 68654, "epoch": 1634} {"train_loss": -6.009241104125977, "global_step": 68655, "epoch": 1634} {"train_loss": -5.932647705078125, "global_step": 68656, "epoch": 1634} {"train_loss": -6.083776950836182, "global_step": 68657, "epoch": 1634} {"train_loss": -6.076032638549805, "global_step": 68658, "epoch": 1634} {"train_loss": -6.02479362487793, "global_step": 68659, "epoch": 1634} {"train_loss": -5.925462245941162, "global_step": 68660, "epoch": 1634} {"train_loss": -6.087004661560059, "global_step": 68661, "epoch": 1634} {"train_loss": -5.971746444702148, "global_step": 68662, "epoch": 1634} {"train_loss": -5.899379730224609, "global_step": 68663, "epoch": 1634} {"train_loss": -6.074411392211914, "global_step": 68664, "epoch": 1634} {"train_loss": -5.861865997314453, "global_step": 68665, "epoch": 1634} {"train_loss": -5.994772911071777, "global_step": 68666, "epoch": 1634} {"train_loss": -6.045293807983398, "global_step": 68667, "epoch": 1634} {"train_loss": -6.05189847946167, "global_step": 68668, "epoch": 1634} {"train_loss": -6.007937431335449, "global_step": 68669, "epoch": 1634, "val_loss": 67183.875} {"train_loss": -6.002460479736328, "global_step": 68670, "epoch": 1635} {"train_loss": -5.8950419425964355, "global_step": 68671, "epoch": 1635} {"train_loss": -6.028717517852783, "global_step": 68672, "epoch": 1635} {"train_loss": -6.071368217468262, "global_step": 68673, "epoch": 1635} {"train_loss": -5.9894795417785645, "global_step": 68674, "epoch": 1635} {"train_loss": -5.996294975280762, "global_step": 68675, "epoch": 1635} {"train_loss": -5.911620140075684, "global_step": 68676, "epoch": 1635} {"train_loss": -5.976894378662109, "global_step": 68677, "epoch": 1635} {"train_loss": -6.009583473205566, "global_step": 68678, "epoch": 1635} {"train_loss": -6.003080368041992, "global_step": 68679, "epoch": 1635} {"train_loss": -5.984562873840332, "global_step": 68680, "epoch": 1635} {"train_loss": -5.920883655548096, "global_step": 68681, "epoch": 1635} {"train_loss": -5.873249053955078, "global_step": 68682, "epoch": 1635} {"train_loss": -6.025020122528076, "global_step": 68683, "epoch": 1635} {"train_loss": -5.97284460067749, "global_step": 68684, "epoch": 1635} {"train_loss": -5.9155731201171875, "global_step": 68685, "epoch": 1635} {"train_loss": -5.992961883544922, "global_step": 68686, "epoch": 1635} {"train_loss": -5.927605628967285, "global_step": 68687, "epoch": 1635} {"train_loss": -5.94097900390625, "global_step": 68688, "epoch": 1635} {"train_loss": -6.009392261505127, "global_step": 68689, "epoch": 1635} {"train_loss": -5.892195701599121, "global_step": 68690, "epoch": 1635} {"train_loss": -5.953313827514648, "global_step": 68691, "epoch": 1635} {"train_loss": -5.946085453033447, "global_step": 68692, "epoch": 1635} {"train_loss": -6.102077007293701, "global_step": 68693, "epoch": 1635} {"train_loss": -6.014081001281738, "global_step": 68694, "epoch": 1635} {"train_loss": -5.977364540100098, "global_step": 68695, "epoch": 1635} {"train_loss": -5.972972869873047, "global_step": 68696, "epoch": 1635} {"train_loss": -6.008318901062012, "global_step": 68697, "epoch": 1635} {"train_loss": -5.965825080871582, "global_step": 68698, "epoch": 1635} {"train_loss": -5.9078369140625, "global_step": 68699, "epoch": 1635} {"train_loss": -6.037093639373779, "global_step": 68700, "epoch": 1635} {"train_loss": -6.08821964263916, "global_step": 68701, "epoch": 1635} {"train_loss": -5.923238754272461, "global_step": 68702, "epoch": 1635} {"train_loss": -5.98837423324585, "global_step": 68703, "epoch": 1635} {"train_loss": -5.974458694458008, "global_step": 68704, "epoch": 1635} {"train_loss": -5.970475673675537, "global_step": 68705, "epoch": 1635} {"train_loss": -5.963979721069336, "global_step": 68706, "epoch": 1635} {"train_loss": -6.0244975090026855, "global_step": 68707, "epoch": 1635} {"train_loss": -5.910593032836914, "global_step": 68708, "epoch": 1635} {"train_loss": -5.9336256980896, "global_step": 68709, "epoch": 1635} {"train_loss": -5.886775970458984, "global_step": 68710, "epoch": 1635} {"train_loss": -5.976924385343279, "global_step": 68711, "epoch": 1635, "val_loss": 67382.7578125} {"train_loss": -6.127002716064453, "global_step": 68712, "epoch": 1636} {"train_loss": -5.957877159118652, "global_step": 68713, "epoch": 1636} {"train_loss": -5.942215442657471, "global_step": 68714, "epoch": 1636} {"train_loss": -5.9545698165893555, "global_step": 68715, "epoch": 1636} {"train_loss": -6.017092704772949, "global_step": 68716, "epoch": 1636} {"train_loss": -5.906641960144043, "global_step": 68717, "epoch": 1636} {"train_loss": -5.838118076324463, "global_step": 68718, "epoch": 1636} {"train_loss": -5.883358955383301, "global_step": 68719, "epoch": 1636} {"train_loss": -6.044921875, "global_step": 68720, "epoch": 1636} {"train_loss": -6.078727722167969, "global_step": 68721, "epoch": 1636} {"train_loss": -5.984551906585693, "global_step": 68722, "epoch": 1636} {"train_loss": -5.978142738342285, "global_step": 68723, "epoch": 1636} {"train_loss": -6.0203351974487305, "global_step": 68724, "epoch": 1636} {"train_loss": -6.003650665283203, "global_step": 68725, "epoch": 1636} {"train_loss": -6.026772499084473, "global_step": 68726, "epoch": 1636} {"train_loss": -5.88456392288208, "global_step": 68727, "epoch": 1636} {"train_loss": -6.054518222808838, "global_step": 68728, "epoch": 1636} {"train_loss": -6.12581205368042, "global_step": 68729, "epoch": 1636} {"train_loss": -5.954311370849609, "global_step": 68730, "epoch": 1636} {"train_loss": -6.082379341125488, "global_step": 68731, "epoch": 1636} {"train_loss": -6.07573127746582, "global_step": 68732, "epoch": 1636} {"train_loss": -6.0282769203186035, "global_step": 68733, "epoch": 1636} {"train_loss": -6.030180931091309, "global_step": 68734, "epoch": 1636} {"train_loss": -6.071157932281494, "global_step": 68735, "epoch": 1636} {"train_loss": -6.065404891967773, "global_step": 68736, "epoch": 1636} {"train_loss": -5.888575077056885, "global_step": 68737, "epoch": 1636} {"train_loss": -5.846915245056152, "global_step": 68738, "epoch": 1636} {"train_loss": -5.893167495727539, "global_step": 68739, "epoch": 1636} {"train_loss": -5.917131423950195, "global_step": 68740, "epoch": 1636} {"train_loss": -5.78104305267334, "global_step": 68741, "epoch": 1636} {"train_loss": -6.053762435913086, "global_step": 68742, "epoch": 1636} {"train_loss": -6.0794172286987305, "global_step": 68743, "epoch": 1636} {"train_loss": -5.968047618865967, "global_step": 68744, "epoch": 1636} {"train_loss": -6.022368907928467, "global_step": 68745, "epoch": 1636} {"train_loss": -5.904768943786621, "global_step": 68746, "epoch": 1636} {"train_loss": -6.013744831085205, "global_step": 68747, "epoch": 1636} {"train_loss": -5.898006916046143, "global_step": 68748, "epoch": 1636} {"train_loss": -5.7613372802734375, "global_step": 68749, "epoch": 1636} {"train_loss": -5.916643142700195, "global_step": 68750, "epoch": 1636} {"train_loss": -5.977663993835449, "global_step": 68751, "epoch": 1636} {"train_loss": -6.021186828613281, "global_step": 68752, "epoch": 1636} {"train_loss": -5.973379225957961, "global_step": 68753, "epoch": 1636, "val_loss": 67351.171875} {"train_loss": -5.847434997558594, "global_step": 68754, "epoch": 1637} {"train_loss": -6.030179023742676, "global_step": 68755, "epoch": 1637} {"train_loss": -5.7941670417785645, "global_step": 68756, "epoch": 1637} {"train_loss": -6.092132091522217, "global_step": 68757, "epoch": 1637} {"train_loss": -5.932518482208252, "global_step": 68758, "epoch": 1637} {"train_loss": -5.890646457672119, "global_step": 68759, "epoch": 1637} {"train_loss": -5.886981010437012, "global_step": 68760, "epoch": 1637} {"train_loss": -5.969205379486084, "global_step": 68761, "epoch": 1637} {"train_loss": -5.918454170227051, "global_step": 68762, "epoch": 1637} {"train_loss": -6.02998685836792, "global_step": 68763, "epoch": 1637} {"train_loss": -6.079095840454102, "global_step": 68764, "epoch": 1637} {"train_loss": -6.002317428588867, "global_step": 68765, "epoch": 1637} {"train_loss": -6.0453901290893555, "global_step": 68766, "epoch": 1637} {"train_loss": -5.829551696777344, "global_step": 68767, "epoch": 1637} {"train_loss": -5.834003448486328, "global_step": 68768, "epoch": 1637} {"train_loss": -6.016408443450928, "global_step": 68769, "epoch": 1637} {"train_loss": -5.921555995941162, "global_step": 68770, "epoch": 1637} {"train_loss": -5.946455001831055, "global_step": 68771, "epoch": 1637} {"train_loss": -5.984663963317871, "global_step": 68772, "epoch": 1637} {"train_loss": -5.9894514083862305, "global_step": 68773, "epoch": 1637} {"train_loss": -5.94660758972168, "global_step": 68774, "epoch": 1637} {"train_loss": -6.0480241775512695, "global_step": 68775, "epoch": 1637} {"train_loss": -6.047970771789551, "global_step": 68776, "epoch": 1637} {"train_loss": -5.888839244842529, "global_step": 68777, "epoch": 1637} {"train_loss": -5.99994421005249, "global_step": 68778, "epoch": 1637} {"train_loss": -5.854239463806152, "global_step": 68779, "epoch": 1637} {"train_loss": -5.94024133682251, "global_step": 68780, "epoch": 1637} {"train_loss": -5.857851028442383, "global_step": 68781, "epoch": 1637} {"train_loss": -6.01582145690918, "global_step": 68782, "epoch": 1637} {"train_loss": -5.977193832397461, "global_step": 68783, "epoch": 1637} {"train_loss": -5.880020618438721, "global_step": 68784, "epoch": 1637} {"train_loss": -5.985269069671631, "global_step": 68785, "epoch": 1637} {"train_loss": -6.010453224182129, "global_step": 68786, "epoch": 1637} {"train_loss": -6.071694850921631, "global_step": 68787, "epoch": 1637} {"train_loss": -6.09538459777832, "global_step": 68788, "epoch": 1637} {"train_loss": -5.919389724731445, "global_step": 68789, "epoch": 1637} {"train_loss": -6.038703918457031, "global_step": 68790, "epoch": 1637} {"train_loss": -6.089449882507324, "global_step": 68791, "epoch": 1637} {"train_loss": -6.020810604095459, "global_step": 68792, "epoch": 1637} {"train_loss": -5.832383632659912, "global_step": 68793, "epoch": 1637} {"train_loss": -6.09401798248291, "global_step": 68794, "epoch": 1637} {"train_loss": -5.96881415730431, "global_step": 68795, "epoch": 1637, "val_loss": 67482.5078125} {"train_loss": -5.880064010620117, "global_step": 68796, "epoch": 1638} {"train_loss": -5.911457061767578, "global_step": 68797, "epoch": 1638} {"train_loss": -5.950662612915039, "global_step": 68798, "epoch": 1638} {"train_loss": -5.967839241027832, "global_step": 68799, "epoch": 1638} {"train_loss": -5.940786361694336, "global_step": 68800, "epoch": 1638} {"train_loss": -6.014508247375488, "global_step": 68801, "epoch": 1638} {"train_loss": -6.024123668670654, "global_step": 68802, "epoch": 1638} {"train_loss": -5.849852085113525, "global_step": 68803, "epoch": 1638} {"train_loss": -6.029701232910156, "global_step": 68804, "epoch": 1638} {"train_loss": -5.903202533721924, "global_step": 68805, "epoch": 1638} {"train_loss": -5.974730014801025, "global_step": 68806, "epoch": 1638} {"train_loss": -6.014991760253906, "global_step": 68807, "epoch": 1638} {"train_loss": -5.93877649307251, "global_step": 68808, "epoch": 1638} {"train_loss": -6.009385585784912, "global_step": 68809, "epoch": 1638} {"train_loss": -5.99277400970459, "global_step": 68810, "epoch": 1638} {"train_loss": -5.9568986892700195, "global_step": 68811, "epoch": 1638} {"train_loss": -5.941318511962891, "global_step": 68812, "epoch": 1638} {"train_loss": -5.966744422912598, "global_step": 68813, "epoch": 1638} {"train_loss": -6.009070873260498, "global_step": 68814, "epoch": 1638} {"train_loss": -6.033658027648926, "global_step": 68815, "epoch": 1638} {"train_loss": -6.017152309417725, "global_step": 68816, "epoch": 1638} {"train_loss": -6.02482795715332, "global_step": 68817, "epoch": 1638} {"train_loss": -5.874293804168701, "global_step": 68818, "epoch": 1638} {"train_loss": -6.045802116394043, "global_step": 68819, "epoch": 1638} {"train_loss": -5.970733642578125, "global_step": 68820, "epoch": 1638} {"train_loss": -6.032393455505371, "global_step": 68821, "epoch": 1638} {"train_loss": -6.057292938232422, "global_step": 68822, "epoch": 1638} {"train_loss": -5.8722310066223145, "global_step": 68823, "epoch": 1638} {"train_loss": -5.99261999130249, "global_step": 68824, "epoch": 1638} {"train_loss": -6.085391521453857, "global_step": 68825, "epoch": 1638} {"train_loss": -5.91038703918457, "global_step": 68826, "epoch": 1638} {"train_loss": -5.935420036315918, "global_step": 68827, "epoch": 1638} {"train_loss": -6.059394359588623, "global_step": 68828, "epoch": 1638} {"train_loss": -6.057773113250732, "global_step": 68829, "epoch": 1638} {"train_loss": -5.97081995010376, "global_step": 68830, "epoch": 1638} {"train_loss": -5.922956466674805, "global_step": 68831, "epoch": 1638} {"train_loss": -5.947368144989014, "global_step": 68832, "epoch": 1638} {"train_loss": -6.0079345703125, "global_step": 68833, "epoch": 1638} {"train_loss": -6.002897262573242, "global_step": 68834, "epoch": 1638} {"train_loss": -6.04233980178833, "global_step": 68835, "epoch": 1638} {"train_loss": -6.020601272583008, "global_step": 68836, "epoch": 1638} {"train_loss": -5.976384594326928, "global_step": 68837, "epoch": 1638, "val_loss": 67196.9453125} {"train_loss": -6.013875961303711, "global_step": 68838, "epoch": 1639} {"train_loss": -6.040816783905029, "global_step": 68839, "epoch": 1639} {"train_loss": -5.998530387878418, "global_step": 68840, "epoch": 1639} {"train_loss": -5.90040397644043, "global_step": 68841, "epoch": 1639} {"train_loss": -5.993413925170898, "global_step": 68842, "epoch": 1639} {"train_loss": -6.069434642791748, "global_step": 68843, "epoch": 1639} {"train_loss": -5.944420337677002, "global_step": 68844, "epoch": 1639} {"train_loss": -5.980815410614014, "global_step": 68845, "epoch": 1639} {"train_loss": -6.082221031188965, "global_step": 68846, "epoch": 1639} {"train_loss": -5.999589443206787, "global_step": 68847, "epoch": 1639} {"train_loss": -6.002174377441406, "global_step": 68848, "epoch": 1639} {"train_loss": -6.068449020385742, "global_step": 68849, "epoch": 1639} {"train_loss": -5.9677734375, "global_step": 68850, "epoch": 1639} {"train_loss": -6.0081586837768555, "global_step": 68851, "epoch": 1639} {"train_loss": -6.025966167449951, "global_step": 68852, "epoch": 1639} {"train_loss": -5.965078353881836, "global_step": 68853, "epoch": 1639} {"train_loss": -6.034433364868164, "global_step": 68854, "epoch": 1639} {"train_loss": -5.993375778198242, "global_step": 68855, "epoch": 1639} {"train_loss": -5.928223609924316, "global_step": 68856, "epoch": 1639} {"train_loss": -6.092257976531982, "global_step": 68857, "epoch": 1639} {"train_loss": -5.941859722137451, "global_step": 68858, "epoch": 1639} {"train_loss": -6.061635971069336, "global_step": 68859, "epoch": 1639} {"train_loss": -5.928884029388428, "global_step": 68860, "epoch": 1639} {"train_loss": -6.093090057373047, "global_step": 68861, "epoch": 1639} {"train_loss": -6.079018592834473, "global_step": 68862, "epoch": 1639} {"train_loss": -5.975132942199707, "global_step": 68863, "epoch": 1639} {"train_loss": -6.002981185913086, "global_step": 68864, "epoch": 1639} {"train_loss": -5.932924270629883, "global_step": 68865, "epoch": 1639} {"train_loss": -6.002328395843506, "global_step": 68866, "epoch": 1639} {"train_loss": -6.070657253265381, "global_step": 68867, "epoch": 1639} {"train_loss": -5.892578125, "global_step": 68868, "epoch": 1639} {"train_loss": -6.009675979614258, "global_step": 68869, "epoch": 1639} {"train_loss": -6.1193013191223145, "global_step": 68870, "epoch": 1639} {"train_loss": -5.967787742614746, "global_step": 68871, "epoch": 1639} {"train_loss": -6.03621768951416, "global_step": 68872, "epoch": 1639} {"train_loss": -6.047658920288086, "global_step": 68873, "epoch": 1639} {"train_loss": -5.644590377807617, "global_step": 68874, "epoch": 1639} {"train_loss": -5.946840286254883, "global_step": 68875, "epoch": 1639} {"train_loss": -5.812323570251465, "global_step": 68876, "epoch": 1639} {"train_loss": -6.0101213455200195, "global_step": 68877, "epoch": 1639} {"train_loss": -5.982144355773926, "global_step": 68878, "epoch": 1639} {"train_loss": -5.9878997802734375, "global_step": 68879, "epoch": 1639, "val_loss": 67179.8671875} {"train_loss": -5.870340824127197, "global_step": 68880, "epoch": 1640} {"train_loss": -5.826238632202148, "global_step": 68881, "epoch": 1640} {"train_loss": -5.97545862197876, "global_step": 68882, "epoch": 1640} {"train_loss": -5.856888771057129, "global_step": 68883, "epoch": 1640} {"train_loss": -5.959120750427246, "global_step": 68884, "epoch": 1640} {"train_loss": -5.872471809387207, "global_step": 68885, "epoch": 1640} {"train_loss": -5.979244232177734, "global_step": 68886, "epoch": 1640} {"train_loss": -5.903146743774414, "global_step": 68887, "epoch": 1640} {"train_loss": -6.039373397827148, "global_step": 68888, "epoch": 1640} {"train_loss": -5.9694929122924805, "global_step": 68889, "epoch": 1640} {"train_loss": -6.007782459259033, "global_step": 68890, "epoch": 1640} {"train_loss": -5.975831508636475, "global_step": 68891, "epoch": 1640} {"train_loss": -6.053231239318848, "global_step": 68892, "epoch": 1640} {"train_loss": -6.0533447265625, "global_step": 68893, "epoch": 1640} {"train_loss": -6.086582183837891, "global_step": 68894, "epoch": 1640} {"train_loss": -6.066056728363037, "global_step": 68895, "epoch": 1640} {"train_loss": -6.067925453186035, "global_step": 68896, "epoch": 1640} {"train_loss": -6.126008987426758, "global_step": 68897, "epoch": 1640} {"train_loss": -6.016817092895508, "global_step": 68898, "epoch": 1640} {"train_loss": -5.993922233581543, "global_step": 68899, "epoch": 1640} {"train_loss": -5.901320934295654, "global_step": 68900, "epoch": 1640} {"train_loss": -5.949887752532959, "global_step": 68901, "epoch": 1640} {"train_loss": -6.0860137939453125, "global_step": 68902, "epoch": 1640} {"train_loss": -6.013984680175781, "global_step": 68903, "epoch": 1640} {"train_loss": -5.813508987426758, "global_step": 68904, "epoch": 1640} {"train_loss": -5.977975845336914, "global_step": 68905, "epoch": 1640} {"train_loss": -5.906366348266602, "global_step": 68906, "epoch": 1640} {"train_loss": -6.063884258270264, "global_step": 68907, "epoch": 1640} {"train_loss": -6.037662982940674, "global_step": 68908, "epoch": 1640} {"train_loss": -5.937127113342285, "global_step": 68909, "epoch": 1640} {"train_loss": -5.9241437911987305, "global_step": 68910, "epoch": 1640} {"train_loss": -6.012899398803711, "global_step": 68911, "epoch": 1640} {"train_loss": -6.02746057510376, "global_step": 68912, "epoch": 1640} {"train_loss": -6.050177574157715, "global_step": 68913, "epoch": 1640} {"train_loss": -6.081598281860352, "global_step": 68914, "epoch": 1640} {"train_loss": -6.0013427734375, "global_step": 68915, "epoch": 1640} {"train_loss": -5.997697830200195, "global_step": 68916, "epoch": 1640} {"train_loss": -6.027624130249023, "global_step": 68917, "epoch": 1640} {"train_loss": -6.086554527282715, "global_step": 68918, "epoch": 1640} {"train_loss": -5.882719039916992, "global_step": 68919, "epoch": 1640} {"train_loss": -5.940051555633545, "global_step": 68920, "epoch": 1640} {"train_loss": -5.98585599944705, "global_step": 68921, "epoch": 1640, "val_loss": 67429.9921875} {"train_loss": -5.853208541870117, "global_step": 68922, "epoch": 1641} {"train_loss": -6.076284408569336, "global_step": 68923, "epoch": 1641} {"train_loss": -5.896798133850098, "global_step": 68924, "epoch": 1641} {"train_loss": -6.0210723876953125, "global_step": 68925, "epoch": 1641} {"train_loss": -5.877892017364502, "global_step": 68926, "epoch": 1641} {"train_loss": -5.908885478973389, "global_step": 68927, "epoch": 1641} {"train_loss": -6.053767204284668, "global_step": 68928, "epoch": 1641} {"train_loss": -5.886005401611328, "global_step": 68929, "epoch": 1641} {"train_loss": -6.018906593322754, "global_step": 68930, "epoch": 1641} {"train_loss": -5.927107810974121, "global_step": 68931, "epoch": 1641} {"train_loss": -5.917408466339111, "global_step": 68932, "epoch": 1641} {"train_loss": -5.86063289642334, "global_step": 68933, "epoch": 1641} {"train_loss": -5.893766403198242, "global_step": 68934, "epoch": 1641} {"train_loss": -5.876058578491211, "global_step": 68935, "epoch": 1641} {"train_loss": -5.850738525390625, "global_step": 68936, "epoch": 1641} {"train_loss": -5.960742950439453, "global_step": 68937, "epoch": 1641} {"train_loss": -5.94248104095459, "global_step": 68938, "epoch": 1641} {"train_loss": -5.919254302978516, "global_step": 68939, "epoch": 1641} {"train_loss": -5.884965419769287, "global_step": 68940, "epoch": 1641} {"train_loss": -5.949299335479736, "global_step": 68941, "epoch": 1641} {"train_loss": -5.978254318237305, "global_step": 68942, "epoch": 1641} {"train_loss": -6.067026138305664, "global_step": 68943, "epoch": 1641} {"train_loss": -5.94879150390625, "global_step": 68944, "epoch": 1641} {"train_loss": -6.0163068771362305, "global_step": 68945, "epoch": 1641} {"train_loss": -5.90725040435791, "global_step": 68946, "epoch": 1641} {"train_loss": -6.007463455200195, "global_step": 68947, "epoch": 1641} {"train_loss": -5.9549880027771, "global_step": 68948, "epoch": 1641} {"train_loss": -5.951521873474121, "global_step": 68949, "epoch": 1641} {"train_loss": -6.003945350646973, "global_step": 68950, "epoch": 1641} {"train_loss": -6.065275192260742, "global_step": 68951, "epoch": 1641} {"train_loss": -6.0152482986450195, "global_step": 68952, "epoch": 1641} {"train_loss": -5.9887542724609375, "global_step": 68953, "epoch": 1641} {"train_loss": -5.971388816833496, "global_step": 68954, "epoch": 1641} {"train_loss": -5.847662925720215, "global_step": 68955, "epoch": 1641} {"train_loss": -5.949965476989746, "global_step": 68956, "epoch": 1641} {"train_loss": -6.018022060394287, "global_step": 68957, "epoch": 1641} {"train_loss": -5.960113525390625, "global_step": 68958, "epoch": 1641} {"train_loss": -6.0475053787231445, "global_step": 68959, "epoch": 1641} {"train_loss": -6.02984094619751, "global_step": 68960, "epoch": 1641} {"train_loss": -6.072037696838379, "global_step": 68961, "epoch": 1641} {"train_loss": -5.99135684967041, "global_step": 68962, "epoch": 1641} {"train_loss": -5.958490280877976, "global_step": 68963, "epoch": 1641, "val_loss": 67106.609375} {"train_loss": -5.9264984130859375, "global_step": 68964, "epoch": 1642} {"train_loss": -5.886733055114746, "global_step": 68965, "epoch": 1642} {"train_loss": -6.000362396240234, "global_step": 68966, "epoch": 1642} {"train_loss": -6.031865119934082, "global_step": 68967, "epoch": 1642} {"train_loss": -6.060737133026123, "global_step": 68968, "epoch": 1642} {"train_loss": -5.844419479370117, "global_step": 68969, "epoch": 1642} {"train_loss": -6.0593767166137695, "global_step": 68970, "epoch": 1642} {"train_loss": -5.855334758758545, "global_step": 68971, "epoch": 1642} {"train_loss": -5.92897891998291, "global_step": 68972, "epoch": 1642} {"train_loss": -5.954062461853027, "global_step": 68973, "epoch": 1642} {"train_loss": -5.927547454833984, "global_step": 68974, "epoch": 1642} {"train_loss": -5.968680381774902, "global_step": 68975, "epoch": 1642} {"train_loss": -6.00655460357666, "global_step": 68976, "epoch": 1642} {"train_loss": -6.0517120361328125, "global_step": 68977, "epoch": 1642} {"train_loss": -5.98681640625, "global_step": 68978, "epoch": 1642} {"train_loss": -5.99593448638916, "global_step": 68979, "epoch": 1642} {"train_loss": -6.0115461349487305, "global_step": 68980, "epoch": 1642} {"train_loss": -5.93364953994751, "global_step": 68981, "epoch": 1642} {"train_loss": -5.955540657043457, "global_step": 68982, "epoch": 1642} {"train_loss": -5.998368263244629, "global_step": 68983, "epoch": 1642} {"train_loss": -6.015532970428467, "global_step": 68984, "epoch": 1642} {"train_loss": -5.974081516265869, "global_step": 68985, "epoch": 1642} {"train_loss": -6.0185041427612305, "global_step": 68986, "epoch": 1642} {"train_loss": -6.022809028625488, "global_step": 68987, "epoch": 1642} {"train_loss": -6.043510437011719, "global_step": 68988, "epoch": 1642} {"train_loss": -6.004927635192871, "global_step": 68989, "epoch": 1642} {"train_loss": -6.039600372314453, "global_step": 68990, "epoch": 1642} {"train_loss": -5.9791059494018555, "global_step": 68991, "epoch": 1642} {"train_loss": -6.011079788208008, "global_step": 68992, "epoch": 1642} {"train_loss": -5.982356071472168, "global_step": 68993, "epoch": 1642} {"train_loss": -6.02597713470459, "global_step": 68994, "epoch": 1642} {"train_loss": -5.996862411499023, "global_step": 68995, "epoch": 1642} {"train_loss": -6.0164079666137695, "global_step": 68996, "epoch": 1642} {"train_loss": -5.987644195556641, "global_step": 68997, "epoch": 1642} {"train_loss": -5.956744194030762, "global_step": 68998, "epoch": 1642} {"train_loss": -5.982761859893799, "global_step": 68999, "epoch": 1642} {"train_loss": -5.895710468292236, "global_step": 69000, "epoch": 1642} {"train_loss": -5.902278900146484, "global_step": 69001, "epoch": 1642} {"train_loss": -5.993264198303223, "global_step": 69002, "epoch": 1642} {"train_loss": -6.018340110778809, "global_step": 69003, "epoch": 1642} {"train_loss": -6.057211875915527, "global_step": 69004, "epoch": 1642} {"train_loss": -5.98234174365089, "global_step": 69005, "epoch": 1642, "val_loss": 67384.140625} {"train_loss": -6.006869316101074, "global_step": 69006, "epoch": 1643} {"train_loss": -6.092686176300049, "global_step": 69007, "epoch": 1643} {"train_loss": -6.110968112945557, "global_step": 69008, "epoch": 1643} {"train_loss": -6.0203680992126465, "global_step": 69009, "epoch": 1643} {"train_loss": -6.07118034362793, "global_step": 69010, "epoch": 1643} {"train_loss": -6.108242988586426, "global_step": 69011, "epoch": 1643} {"train_loss": -6.008338928222656, "global_step": 69012, "epoch": 1643} {"train_loss": -6.072023391723633, "global_step": 69013, "epoch": 1643} {"train_loss": -6.011989593505859, "global_step": 69014, "epoch": 1643} {"train_loss": -6.061182498931885, "global_step": 69015, "epoch": 1643} {"train_loss": -6.030162811279297, "global_step": 69016, "epoch": 1643} {"train_loss": -5.941664695739746, "global_step": 69017, "epoch": 1643} {"train_loss": -6.099966049194336, "global_step": 69018, "epoch": 1643} {"train_loss": -5.917080879211426, "global_step": 69019, "epoch": 1643} {"train_loss": -5.9386138916015625, "global_step": 69020, "epoch": 1643} {"train_loss": -5.972761154174805, "global_step": 69021, "epoch": 1643} {"train_loss": -5.907511234283447, "global_step": 69022, "epoch": 1643} {"train_loss": -6.035606384277344, "global_step": 69023, "epoch": 1643} {"train_loss": -5.923002243041992, "global_step": 69024, "epoch": 1643} {"train_loss": -5.946377754211426, "global_step": 69025, "epoch": 1643} {"train_loss": -5.927637100219727, "global_step": 69026, "epoch": 1643} {"train_loss": -5.879361152648926, "global_step": 69027, "epoch": 1643} {"train_loss": -5.927186012268066, "global_step": 69028, "epoch": 1643} {"train_loss": -5.940743446350098, "global_step": 69029, "epoch": 1643} {"train_loss": -5.992341041564941, "global_step": 69030, "epoch": 1643} {"train_loss": -5.890629768371582, "global_step": 69031, "epoch": 1643} {"train_loss": -5.919618606567383, "global_step": 69032, "epoch": 1643} {"train_loss": -5.9951934814453125, "global_step": 69033, "epoch": 1643} {"train_loss": -6.021214485168457, "global_step": 69034, "epoch": 1643} {"train_loss": -6.01329231262207, "global_step": 69035, "epoch": 1643} {"train_loss": -5.818666458129883, "global_step": 69036, "epoch": 1643} {"train_loss": -6.049385070800781, "global_step": 69037, "epoch": 1643} {"train_loss": -5.968149662017822, "global_step": 69038, "epoch": 1643} {"train_loss": -6.003385543823242, "global_step": 69039, "epoch": 1643} {"train_loss": -6.067203998565674, "global_step": 69040, "epoch": 1643} {"train_loss": -5.908041477203369, "global_step": 69041, "epoch": 1643} {"train_loss": -6.027671813964844, "global_step": 69042, "epoch": 1643} {"train_loss": -5.917591094970703, "global_step": 69043, "epoch": 1643} {"train_loss": -5.982230186462402, "global_step": 69044, "epoch": 1643} {"train_loss": -6.074844837188721, "global_step": 69045, "epoch": 1643} {"train_loss": -5.981751441955566, "global_step": 69046, "epoch": 1643} {"train_loss": -5.9909701233818415, "global_step": 69047, "epoch": 1643, "val_loss": 67211.78125} {"train_loss": -6.097632884979248, "global_step": 69048, "epoch": 1644} {"train_loss": -5.930954933166504, "global_step": 69049, "epoch": 1644} {"train_loss": -6.016482353210449, "global_step": 69050, "epoch": 1644} {"train_loss": -6.015276908874512, "global_step": 69051, "epoch": 1644} {"train_loss": -6.046532154083252, "global_step": 69052, "epoch": 1644} {"train_loss": -5.9623026847839355, "global_step": 69053, "epoch": 1644} {"train_loss": -5.974941253662109, "global_step": 69054, "epoch": 1644} {"train_loss": -6.054722309112549, "global_step": 69055, "epoch": 1644} {"train_loss": -6.0527849197387695, "global_step": 69056, "epoch": 1644} {"train_loss": -6.094583511352539, "global_step": 69057, "epoch": 1644} {"train_loss": -6.011712074279785, "global_step": 69058, "epoch": 1644} {"train_loss": -5.900984764099121, "global_step": 69059, "epoch": 1644} {"train_loss": -6.038094520568848, "global_step": 69060, "epoch": 1644} {"train_loss": -6.027055740356445, "global_step": 69061, "epoch": 1644} {"train_loss": -5.905683517456055, "global_step": 69062, "epoch": 1644} {"train_loss": -5.950771331787109, "global_step": 69063, "epoch": 1644} {"train_loss": -5.927978038787842, "global_step": 69064, "epoch": 1644} {"train_loss": -5.809708595275879, "global_step": 69065, "epoch": 1644} {"train_loss": -6.000522613525391, "global_step": 69066, "epoch": 1644} {"train_loss": -5.945815086364746, "global_step": 69067, "epoch": 1644} {"train_loss": -6.095039367675781, "global_step": 69068, "epoch": 1644} {"train_loss": -6.035871505737305, "global_step": 69069, "epoch": 1644} {"train_loss": -5.887102127075195, "global_step": 69070, "epoch": 1644} {"train_loss": -6.067220687866211, "global_step": 69071, "epoch": 1644} {"train_loss": -5.9912567138671875, "global_step": 69072, "epoch": 1644} {"train_loss": -6.00356388092041, "global_step": 69073, "epoch": 1644} {"train_loss": -5.959846496582031, "global_step": 69074, "epoch": 1644} {"train_loss": -5.873702526092529, "global_step": 69075, "epoch": 1644} {"train_loss": -6.07751989364624, "global_step": 69076, "epoch": 1644} {"train_loss": -5.980807304382324, "global_step": 69077, "epoch": 1644} {"train_loss": -6.009217262268066, "global_step": 69078, "epoch": 1644} {"train_loss": -5.817290782928467, "global_step": 69079, "epoch": 1644} {"train_loss": -5.940592288970947, "global_step": 69080, "epoch": 1644} {"train_loss": -6.057157516479492, "global_step": 69081, "epoch": 1644} {"train_loss": -5.937413692474365, "global_step": 69082, "epoch": 1644} {"train_loss": -6.065663814544678, "global_step": 69083, "epoch": 1644} {"train_loss": -6.011470794677734, "global_step": 69084, "epoch": 1644} {"train_loss": -6.009924411773682, "global_step": 69085, "epoch": 1644} {"train_loss": -5.97047233581543, "global_step": 69086, "epoch": 1644} {"train_loss": -6.045158863067627, "global_step": 69087, "epoch": 1644} {"train_loss": -6.018435478210449, "global_step": 69088, "epoch": 1644} {"train_loss": -5.991160233815511, "global_step": 69089, "epoch": 1644, "val_loss": 67176.828125} {"train_loss": -6.166492462158203, "global_step": 69090, "epoch": 1645} {"train_loss": -6.053468227386475, "global_step": 69091, "epoch": 1645} {"train_loss": -6.030323028564453, "global_step": 69092, "epoch": 1645} {"train_loss": -6.097136497497559, "global_step": 69093, "epoch": 1645} {"train_loss": -5.984612464904785, "global_step": 69094, "epoch": 1645} {"train_loss": -5.947370529174805, "global_step": 69095, "epoch": 1645} {"train_loss": -5.9339599609375, "global_step": 69096, "epoch": 1645} {"train_loss": -5.903742790222168, "global_step": 69097, "epoch": 1645} {"train_loss": -6.083352088928223, "global_step": 69098, "epoch": 1645} {"train_loss": -6.009740829467773, "global_step": 69099, "epoch": 1645} {"train_loss": -5.993587493896484, "global_step": 69100, "epoch": 1645} {"train_loss": -6.165290832519531, "global_step": 69101, "epoch": 1645} {"train_loss": -6.063451766967773, "global_step": 69102, "epoch": 1645} {"train_loss": -5.920793533325195, "global_step": 69103, "epoch": 1645} {"train_loss": -5.955321311950684, "global_step": 69104, "epoch": 1645} {"train_loss": -6.112151145935059, "global_step": 69105, "epoch": 1645} {"train_loss": -5.8864850997924805, "global_step": 69106, "epoch": 1645} {"train_loss": -5.890143394470215, "global_step": 69107, "epoch": 1645} {"train_loss": -6.017062187194824, "global_step": 69108, "epoch": 1645} {"train_loss": -5.860509395599365, "global_step": 69109, "epoch": 1645} {"train_loss": -6.07365608215332, "global_step": 69110, "epoch": 1645} {"train_loss": -5.969276428222656, "global_step": 69111, "epoch": 1645} {"train_loss": -5.916024684906006, "global_step": 69112, "epoch": 1645} {"train_loss": -6.038349151611328, "global_step": 69113, "epoch": 1645} {"train_loss": -6.0133771896362305, "global_step": 69114, "epoch": 1645} {"train_loss": -5.987398147583008, "global_step": 69115, "epoch": 1645} {"train_loss": -5.953597068786621, "global_step": 69116, "epoch": 1645} {"train_loss": -6.022810935974121, "global_step": 69117, "epoch": 1645} {"train_loss": -5.900392532348633, "global_step": 69118, "epoch": 1645} {"train_loss": -5.938024997711182, "global_step": 69119, "epoch": 1645} {"train_loss": -6.073672771453857, "global_step": 69120, "epoch": 1645} {"train_loss": -5.97661018371582, "global_step": 69121, "epoch": 1645} {"train_loss": -5.929243087768555, "global_step": 69122, "epoch": 1645} {"train_loss": -5.9354023933410645, "global_step": 69123, "epoch": 1645} {"train_loss": -5.9589128494262695, "global_step": 69124, "epoch": 1645} {"train_loss": -5.976717948913574, "global_step": 69125, "epoch": 1645} {"train_loss": -5.994001865386963, "global_step": 69126, "epoch": 1645} {"train_loss": -5.973858833312988, "global_step": 69127, "epoch": 1645} {"train_loss": -6.047586441040039, "global_step": 69128, "epoch": 1645} {"train_loss": -5.970284461975098, "global_step": 69129, "epoch": 1645} {"train_loss": -5.975227355957031, "global_step": 69130, "epoch": 1645} {"train_loss": -5.990506387892223, "global_step": 69131, "epoch": 1645, "val_loss": 67332.3125} {"train_loss": -5.91679573059082, "global_step": 69132, "epoch": 1646} {"train_loss": -6.073525428771973, "global_step": 69133, "epoch": 1646} {"train_loss": -6.0592803955078125, "global_step": 69134, "epoch": 1646} {"train_loss": -5.897560119628906, "global_step": 69135, "epoch": 1646} {"train_loss": -5.96336555480957, "global_step": 69136, "epoch": 1646} {"train_loss": -5.98162841796875, "global_step": 69137, "epoch": 1646} {"train_loss": -6.069825172424316, "global_step": 69138, "epoch": 1646} {"train_loss": -5.973973751068115, "global_step": 69139, "epoch": 1646} {"train_loss": -5.990835189819336, "global_step": 69140, "epoch": 1646} {"train_loss": -6.105556488037109, "global_step": 69141, "epoch": 1646} {"train_loss": -5.953030586242676, "global_step": 69142, "epoch": 1646} {"train_loss": -5.964027404785156, "global_step": 69143, "epoch": 1646} {"train_loss": -6.042135715484619, "global_step": 69144, "epoch": 1646} {"train_loss": -6.055022239685059, "global_step": 69145, "epoch": 1646} {"train_loss": -6.113772869110107, "global_step": 69146, "epoch": 1646} {"train_loss": -6.056365013122559, "global_step": 69147, "epoch": 1646} {"train_loss": -5.964699745178223, "global_step": 69148, "epoch": 1646} {"train_loss": -6.072991371154785, "global_step": 69149, "epoch": 1646} {"train_loss": -5.942584037780762, "global_step": 69150, "epoch": 1646} {"train_loss": -6.028426647186279, "global_step": 69151, "epoch": 1646} {"train_loss": -6.097254753112793, "global_step": 69152, "epoch": 1646} {"train_loss": -6.036954402923584, "global_step": 69153, "epoch": 1646} {"train_loss": -6.026039123535156, "global_step": 69154, "epoch": 1646} {"train_loss": -6.025139808654785, "global_step": 69155, "epoch": 1646} {"train_loss": -5.968517303466797, "global_step": 69156, "epoch": 1646} {"train_loss": -5.947901725769043, "global_step": 69157, "epoch": 1646} {"train_loss": -5.967674732208252, "global_step": 69158, "epoch": 1646} {"train_loss": -6.056037902832031, "global_step": 69159, "epoch": 1646} {"train_loss": -5.929211616516113, "global_step": 69160, "epoch": 1646} {"train_loss": -6.058594703674316, "global_step": 69161, "epoch": 1646} {"train_loss": -5.937069892883301, "global_step": 69162, "epoch": 1646} {"train_loss": -5.874190330505371, "global_step": 69163, "epoch": 1646} {"train_loss": -5.985235214233398, "global_step": 69164, "epoch": 1646} {"train_loss": -5.869540691375732, "global_step": 69165, "epoch": 1646} {"train_loss": -5.990235805511475, "global_step": 69166, "epoch": 1646} {"train_loss": -6.052906036376953, "global_step": 69167, "epoch": 1646} {"train_loss": -5.909028053283691, "global_step": 69168, "epoch": 1646} {"train_loss": -6.088322639465332, "global_step": 69169, "epoch": 1646} {"train_loss": -5.841228485107422, "global_step": 69170, "epoch": 1646} {"train_loss": -5.987340450286865, "global_step": 69171, "epoch": 1646} {"train_loss": -5.946192741394043, "global_step": 69172, "epoch": 1646} {"train_loss": -5.992842072532291, "global_step": 69173, "epoch": 1646, "val_loss": 67555.015625} {"train_loss": -6.015495300292969, "global_step": 69174, "epoch": 1647} {"train_loss": -5.941678524017334, "global_step": 69175, "epoch": 1647} {"train_loss": -5.8756303787231445, "global_step": 69176, "epoch": 1647} {"train_loss": -5.999444961547852, "global_step": 69177, "epoch": 1647} {"train_loss": -6.093589782714844, "global_step": 69178, "epoch": 1647} {"train_loss": -5.853283882141113, "global_step": 69179, "epoch": 1647} {"train_loss": -6.044206619262695, "global_step": 69180, "epoch": 1647} {"train_loss": -5.907538414001465, "global_step": 69181, "epoch": 1647} {"train_loss": -6.013906002044678, "global_step": 69182, "epoch": 1647} {"train_loss": -6.0234198570251465, "global_step": 69183, "epoch": 1647} {"train_loss": -5.879964828491211, "global_step": 69184, "epoch": 1647} {"train_loss": -5.969386100769043, "global_step": 69185, "epoch": 1647} {"train_loss": -5.913763523101807, "global_step": 69186, "epoch": 1647} {"train_loss": -5.985335826873779, "global_step": 69187, "epoch": 1647} {"train_loss": -6.082805156707764, "global_step": 69188, "epoch": 1647} {"train_loss": -5.899038791656494, "global_step": 69189, "epoch": 1647} {"train_loss": -6.047245025634766, "global_step": 69190, "epoch": 1647} {"train_loss": -5.893815040588379, "global_step": 69191, "epoch": 1647} {"train_loss": -5.86403751373291, "global_step": 69192, "epoch": 1647} {"train_loss": -5.949134826660156, "global_step": 69193, "epoch": 1647} {"train_loss": -6.06160831451416, "global_step": 69194, "epoch": 1647} {"train_loss": -5.963058948516846, "global_step": 69195, "epoch": 1647} {"train_loss": -6.017305850982666, "global_step": 69196, "epoch": 1647} {"train_loss": -6.044127464294434, "global_step": 69197, "epoch": 1647} {"train_loss": -5.996459484100342, "global_step": 69198, "epoch": 1647} {"train_loss": -6.0121612548828125, "global_step": 69199, "epoch": 1647} {"train_loss": -5.913859844207764, "global_step": 69200, "epoch": 1647} {"train_loss": -6.019749164581299, "global_step": 69201, "epoch": 1647} {"train_loss": -6.097346305847168, "global_step": 69202, "epoch": 1647} {"train_loss": -6.076631546020508, "global_step": 69203, "epoch": 1647} {"train_loss": -6.051661968231201, "global_step": 69204, "epoch": 1647} {"train_loss": -5.954074859619141, "global_step": 69205, "epoch": 1647} {"train_loss": -5.964967727661133, "global_step": 69206, "epoch": 1647} {"train_loss": -5.937019348144531, "global_step": 69207, "epoch": 1647} {"train_loss": -5.9357805252075195, "global_step": 69208, "epoch": 1647} {"train_loss": -5.909919738769531, "global_step": 69209, "epoch": 1647} {"train_loss": -6.130510330200195, "global_step": 69210, "epoch": 1647} {"train_loss": -5.9075822830200195, "global_step": 69211, "epoch": 1647} {"train_loss": -5.998806476593018, "global_step": 69212, "epoch": 1647} {"train_loss": -6.005282402038574, "global_step": 69213, "epoch": 1647} {"train_loss": -5.921632289886475, "global_step": 69214, "epoch": 1647} {"train_loss": -5.981523536500477, "global_step": 69215, "epoch": 1647, "val_loss": 67288.171875} {"train_loss": -5.866760730743408, "global_step": 69216, "epoch": 1648} {"train_loss": -6.085628986358643, "global_step": 69217, "epoch": 1648} {"train_loss": -5.873641014099121, "global_step": 69218, "epoch": 1648} {"train_loss": -5.967473983764648, "global_step": 69219, "epoch": 1648} {"train_loss": -5.993437767028809, "global_step": 69220, "epoch": 1648} {"train_loss": -5.9372878074646, "global_step": 69221, "epoch": 1648} {"train_loss": -6.01385498046875, "global_step": 69222, "epoch": 1648} {"train_loss": -5.956728935241699, "global_step": 69223, "epoch": 1648} {"train_loss": -5.878774642944336, "global_step": 69224, "epoch": 1648} {"train_loss": -5.992530822753906, "global_step": 69225, "epoch": 1648} {"train_loss": -5.989431381225586, "global_step": 69226, "epoch": 1648} {"train_loss": -6.044747829437256, "global_step": 69227, "epoch": 1648} {"train_loss": -5.860586643218994, "global_step": 69228, "epoch": 1648} {"train_loss": -6.0485920906066895, "global_step": 69229, "epoch": 1648} {"train_loss": -5.99330997467041, "global_step": 69230, "epoch": 1648} {"train_loss": -5.829692840576172, "global_step": 69231, "epoch": 1648} {"train_loss": -5.9766764640808105, "global_step": 69232, "epoch": 1648} {"train_loss": -5.801791667938232, "global_step": 69233, "epoch": 1648} {"train_loss": -5.985037803649902, "global_step": 69234, "epoch": 1648} {"train_loss": -5.938633441925049, "global_step": 69235, "epoch": 1648} {"train_loss": -5.861587047576904, "global_step": 69236, "epoch": 1648} {"train_loss": -5.912073135375977, "global_step": 69237, "epoch": 1648} {"train_loss": -6.08436918258667, "global_step": 69238, "epoch": 1648} {"train_loss": -5.933948040008545, "global_step": 69239, "epoch": 1648} {"train_loss": -6.036345958709717, "global_step": 69240, "epoch": 1648} {"train_loss": -5.957686424255371, "global_step": 69241, "epoch": 1648} {"train_loss": -5.915504455566406, "global_step": 69242, "epoch": 1648} {"train_loss": -6.005015850067139, "global_step": 69243, "epoch": 1648} {"train_loss": -5.9338884353637695, "global_step": 69244, "epoch": 1648} {"train_loss": -5.919026851654053, "global_step": 69245, "epoch": 1648} {"train_loss": -5.9307661056518555, "global_step": 69246, "epoch": 1648} {"train_loss": -5.935630798339844, "global_step": 69247, "epoch": 1648} {"train_loss": -5.934557914733887, "global_step": 69248, "epoch": 1648} {"train_loss": -5.909160614013672, "global_step": 69249, "epoch": 1648} {"train_loss": -5.966423034667969, "global_step": 69250, "epoch": 1648} {"train_loss": -5.946874141693115, "global_step": 69251, "epoch": 1648} {"train_loss": -5.978870391845703, "global_step": 69252, "epoch": 1648} {"train_loss": -6.086381912231445, "global_step": 69253, "epoch": 1648} {"train_loss": -5.933887481689453, "global_step": 69254, "epoch": 1648} {"train_loss": -5.928402423858643, "global_step": 69255, "epoch": 1648} {"train_loss": -5.978709697723389, "global_step": 69256, "epoch": 1648} {"train_loss": -5.953969274248395, "global_step": 69257, "epoch": 1648, "val_loss": 67254.0078125} {"train_loss": -6.082380294799805, "global_step": 69258, "epoch": 1649} {"train_loss": -5.9864325523376465, "global_step": 69259, "epoch": 1649} {"train_loss": -6.033199787139893, "global_step": 69260, "epoch": 1649} {"train_loss": -6.018508434295654, "global_step": 69261, "epoch": 1649} {"train_loss": -5.938641548156738, "global_step": 69262, "epoch": 1649} {"train_loss": -6.005573272705078, "global_step": 69263, "epoch": 1649} {"train_loss": -6.053329944610596, "global_step": 69264, "epoch": 1649} {"train_loss": -6.043344497680664, "global_step": 69265, "epoch": 1649} {"train_loss": -6.022178649902344, "global_step": 69266, "epoch": 1649} {"train_loss": -5.896087646484375, "global_step": 69267, "epoch": 1649} {"train_loss": -5.997616767883301, "global_step": 69268, "epoch": 1649} {"train_loss": -5.947768211364746, "global_step": 69269, "epoch": 1649} {"train_loss": -5.984033584594727, "global_step": 69270, "epoch": 1649} {"train_loss": -6.0631422996521, "global_step": 69271, "epoch": 1649} {"train_loss": -5.949588298797607, "global_step": 69272, "epoch": 1649} {"train_loss": -5.914791584014893, "global_step": 69273, "epoch": 1649} {"train_loss": -6.007656574249268, "global_step": 69274, "epoch": 1649} {"train_loss": -5.949500560760498, "global_step": 69275, "epoch": 1649} {"train_loss": -6.092918395996094, "global_step": 69276, "epoch": 1649} {"train_loss": -5.9748640060424805, "global_step": 69277, "epoch": 1649} {"train_loss": -6.03553581237793, "global_step": 69278, "epoch": 1649} {"train_loss": -6.1688361167907715, "global_step": 69279, "epoch": 1649} {"train_loss": -6.057498455047607, "global_step": 69280, "epoch": 1649} {"train_loss": -6.00508451461792, "global_step": 69281, "epoch": 1649} {"train_loss": -6.062247276306152, "global_step": 69282, "epoch": 1649} {"train_loss": -6.024967193603516, "global_step": 69283, "epoch": 1649} {"train_loss": -5.954604148864746, "global_step": 69284, "epoch": 1649} {"train_loss": -5.942652702331543, "global_step": 69285, "epoch": 1649} {"train_loss": -6.041420936584473, "global_step": 69286, "epoch": 1649} {"train_loss": -5.969956874847412, "global_step": 69287, "epoch": 1649} {"train_loss": -6.023273944854736, "global_step": 69288, "epoch": 1649} {"train_loss": -6.123759746551514, "global_step": 69289, "epoch": 1649} {"train_loss": -5.956473350524902, "global_step": 69290, "epoch": 1649} {"train_loss": -6.0820512771606445, "global_step": 69291, "epoch": 1649} {"train_loss": -6.0869550704956055, "global_step": 69292, "epoch": 1649} {"train_loss": -6.0082292556762695, "global_step": 69293, "epoch": 1649} {"train_loss": -6.073906898498535, "global_step": 69294, "epoch": 1649} {"train_loss": -5.993696212768555, "global_step": 69295, "epoch": 1649} {"train_loss": -6.080194473266602, "global_step": 69296, "epoch": 1649} {"train_loss": -5.893852233886719, "global_step": 69297, "epoch": 1649} {"train_loss": -5.904942512512207, "global_step": 69298, "epoch": 1649} {"train_loss": -6.005519889649891, "global_step": 69299, "epoch": 1649, "val_loss": 67155.7421875} {"train_loss": -5.985261917114258, "global_step": 69300, "epoch": 1650} {"train_loss": -5.983367443084717, "global_step": 69301, "epoch": 1650} {"train_loss": -5.911932945251465, "global_step": 69302, "epoch": 1650} {"train_loss": -5.907168388366699, "global_step": 69303, "epoch": 1650} {"train_loss": -5.893315315246582, "global_step": 69304, "epoch": 1650} {"train_loss": -5.831418514251709, "global_step": 69305, "epoch": 1650} {"train_loss": -6.00321102142334, "global_step": 69306, "epoch": 1650} {"train_loss": -6.007083892822266, "global_step": 69307, "epoch": 1650} {"train_loss": -5.996204376220703, "global_step": 69308, "epoch": 1650} {"train_loss": -6.009154796600342, "global_step": 69309, "epoch": 1650} {"train_loss": -6.049642562866211, "global_step": 69310, "epoch": 1650} {"train_loss": -6.006437301635742, "global_step": 69311, "epoch": 1650} {"train_loss": -5.957319259643555, "global_step": 69312, "epoch": 1650} {"train_loss": -5.873176574707031, "global_step": 69313, "epoch": 1650} {"train_loss": -6.053022384643555, "global_step": 69314, "epoch": 1650} {"train_loss": -6.008569240570068, "global_step": 69315, "epoch": 1650} {"train_loss": -6.097609996795654, "global_step": 69316, "epoch": 1650} {"train_loss": -6.0210161209106445, "global_step": 69317, "epoch": 1650} {"train_loss": -5.9644060134887695, "global_step": 69318, "epoch": 1650} {"train_loss": -5.971401214599609, "global_step": 69319, "epoch": 1650} {"train_loss": -5.9431328773498535, "global_step": 69320, "epoch": 1650} {"train_loss": -5.99567174911499, "global_step": 69321, "epoch": 1650} {"train_loss": -6.0282883644104, "global_step": 69322, "epoch": 1650} {"train_loss": -5.99535608291626, "global_step": 69323, "epoch": 1650} {"train_loss": -6.000151634216309, "global_step": 69324, "epoch": 1650} {"train_loss": -5.877954006195068, "global_step": 69325, "epoch": 1650} {"train_loss": -6.048185348510742, "global_step": 69326, "epoch": 1650} {"train_loss": -5.9852986335754395, "global_step": 69327, "epoch": 1650} {"train_loss": -5.9607391357421875, "global_step": 69328, "epoch": 1650} {"train_loss": -5.9616851806640625, "global_step": 69329, "epoch": 1650} {"train_loss": -5.922832489013672, "global_step": 69330, "epoch": 1650} {"train_loss": -5.94896125793457, "global_step": 69331, "epoch": 1650} {"train_loss": -6.01791524887085, "global_step": 69332, "epoch": 1650} {"train_loss": -6.064820289611816, "global_step": 69333, "epoch": 1650} {"train_loss": -5.869336128234863, "global_step": 69334, "epoch": 1650} {"train_loss": -5.976687431335449, "global_step": 69335, "epoch": 1650} {"train_loss": -6.010852336883545, "global_step": 69336, "epoch": 1650} {"train_loss": -5.952919006347656, "global_step": 69337, "epoch": 1650} {"train_loss": -6.119302749633789, "global_step": 69338, "epoch": 1650} {"train_loss": -6.050898551940918, "global_step": 69339, "epoch": 1650} {"train_loss": -5.9919915199279785, "global_step": 69340, "epoch": 1650} {"train_loss": -5.983486572901408, "global_step": 69341, "epoch": 1650, "train/sim_max_reward_0": 0.19056034852326828, "train/sim_max_reward_1": 0.7729200811422288, "train/sim_max_reward_2": 0.4350493138806123, "train/sim_max_reward_3": 0.1551811626413362, "train/sim_max_reward_4": 0.8932297204742199, "train/sim_max_reward_5": 0.8304210115604875, "test/sim_max_reward_4400000": 0.201891025800859, "test/sim_max_reward_4400001": 0.8157062659272819, "test/sim_max_reward_4400002": 0.35477401126366614, "test/sim_max_reward_4400003": 0.7437154027713807, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.7114637113918515, "test/sim_max_reward_4400007": 0.7291329213723701, "test/sim_max_reward_4400008": 0.3340414146455733, "test/sim_max_reward_4400009": 0.7494094476310249, "test/sim_max_reward_4400010": 0.21105758647640385, "test/sim_max_reward_4400011": 0.073886340361612, "test/sim_max_reward_4400012": 0.9316443260777176, "test/sim_max_reward_4400013": 0.7787860627871452, "test/sim_max_reward_4400014": 0.32968956963461576, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0733711706170949, "test/sim_max_reward_4400017": 0.40816507780595507, "test/sim_max_reward_4400018": 0.21951600063306834, "test/sim_max_reward_4400019": 0.20752789243863312, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5627975369643157, "test/sim_max_reward_4400022": 0.1024898242216648, "test/sim_max_reward_4400023": 0.11950720281349456, "test/sim_max_reward_4400024": 0.490752330475478, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.7868015772597874, "test/sim_max_reward_4400027": 0.09930184080344609, "test/sim_max_reward_4400028": 0.6404846193275524, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.3255455877060452, "test/sim_max_reward_4400031": 0.9123283080434347, "test/sim_max_reward_4400032": 0.9820217286180367, "test/sim_max_reward_4400033": 0.4809104490359764, "test/sim_max_reward_4400034": 0.8371885855973876, "test/sim_max_reward_4400035": 0.8017230063964383, "test/sim_max_reward_4400036": 0.5897679901056699, "test/sim_max_reward_4400037": 0.7782786197353633, "test/sim_max_reward_4400038": 0.11821635195863177, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8239467301047795, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.6524997805686684, "test/sim_max_reward_4400045": 0.7287755676444498, "test/sim_max_reward_4400046": 0.14302671629750538, "test/sim_max_reward_4400047": 0.847839812685783, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.5741403614014451, "train/mean_score": 0.5462269397036922, "test/mean_score": 0.47235242169282116, "val_loss": 67390.1484375} {"train_loss": -6.044539928436279, "global_step": 69342, "epoch": 1651} {"train_loss": -5.960644721984863, "global_step": 69343, "epoch": 1651} {"train_loss": -6.148361682891846, "global_step": 69344, "epoch": 1651} {"train_loss": -6.0262651443481445, "global_step": 69345, "epoch": 1651} {"train_loss": -5.969602108001709, "global_step": 69346, "epoch": 1651} {"train_loss": -6.150123596191406, "global_step": 69347, "epoch": 1651} {"train_loss": -6.071752548217773, "global_step": 69348, "epoch": 1651} {"train_loss": -6.042550086975098, "global_step": 69349, "epoch": 1651} {"train_loss": -5.937101364135742, "global_step": 69350, "epoch": 1651} {"train_loss": -6.044391632080078, "global_step": 69351, "epoch": 1651} {"train_loss": -6.041242599487305, "global_step": 69352, "epoch": 1651} {"train_loss": -5.945476531982422, "global_step": 69353, "epoch": 1651} {"train_loss": -6.0029802322387695, "global_step": 69354, "epoch": 1651} {"train_loss": -6.000802040100098, "global_step": 69355, "epoch": 1651} {"train_loss": -6.009943962097168, "global_step": 69356, "epoch": 1651} {"train_loss": -5.8308563232421875, "global_step": 69357, "epoch": 1651} {"train_loss": -5.927858829498291, "global_step": 69358, "epoch": 1651} {"train_loss": -5.935588359832764, "global_step": 69359, "epoch": 1651} {"train_loss": -5.943317890167236, "global_step": 69360, "epoch": 1651} {"train_loss": -6.050813674926758, "global_step": 69361, "epoch": 1651} {"train_loss": -5.874112129211426, "global_step": 69362, "epoch": 1651} {"train_loss": -6.089303016662598, "global_step": 69363, "epoch": 1651} {"train_loss": -6.031846523284912, "global_step": 69364, "epoch": 1651} {"train_loss": -5.938549041748047, "global_step": 69365, "epoch": 1651} {"train_loss": -6.057454586029053, "global_step": 69366, "epoch": 1651} {"train_loss": -6.013836860656738, "global_step": 69367, "epoch": 1651} {"train_loss": -5.998100280761719, "global_step": 69368, "epoch": 1651} {"train_loss": -5.866860866546631, "global_step": 69369, "epoch": 1651} {"train_loss": -6.0564656257629395, "global_step": 69370, "epoch": 1651} {"train_loss": -5.8819684982299805, "global_step": 69371, "epoch": 1651} {"train_loss": -6.030377388000488, "global_step": 69372, "epoch": 1651} {"train_loss": -5.9159650802612305, "global_step": 69373, "epoch": 1651} {"train_loss": -5.840446949005127, "global_step": 69374, "epoch": 1651} {"train_loss": -5.922168731689453, "global_step": 69375, "epoch": 1651} {"train_loss": -5.990931510925293, "global_step": 69376, "epoch": 1651} {"train_loss": -5.976218223571777, "global_step": 69377, "epoch": 1651} {"train_loss": -5.843400001525879, "global_step": 69378, "epoch": 1651} {"train_loss": -5.974308967590332, "global_step": 69379, "epoch": 1651} {"train_loss": -6.015738010406494, "global_step": 69380, "epoch": 1651} {"train_loss": -6.156880855560303, "global_step": 69381, "epoch": 1651} {"train_loss": -5.960577011108398, "global_step": 69382, "epoch": 1651} {"train_loss": -5.990183671315511, "global_step": 69383, "epoch": 1651, "val_loss": 66945.3515625} {"train_loss": -5.9754133224487305, "global_step": 69384, "epoch": 1652} {"train_loss": -5.947474002838135, "global_step": 69385, "epoch": 1652} {"train_loss": -5.968301773071289, "global_step": 69386, "epoch": 1652} {"train_loss": -6.029972076416016, "global_step": 69387, "epoch": 1652} {"train_loss": -6.010846138000488, "global_step": 69388, "epoch": 1652} {"train_loss": -6.024231910705566, "global_step": 69389, "epoch": 1652} {"train_loss": -6.013219356536865, "global_step": 69390, "epoch": 1652} {"train_loss": -5.996673583984375, "global_step": 69391, "epoch": 1652} {"train_loss": -6.030494689941406, "global_step": 69392, "epoch": 1652} {"train_loss": -5.919511318206787, "global_step": 69393, "epoch": 1652} {"train_loss": -6.032258033752441, "global_step": 69394, "epoch": 1652} {"train_loss": -5.988329887390137, "global_step": 69395, "epoch": 1652} {"train_loss": -5.952453136444092, "global_step": 69396, "epoch": 1652} {"train_loss": -6.008376121520996, "global_step": 69397, "epoch": 1652} {"train_loss": -5.924098968505859, "global_step": 69398, "epoch": 1652} {"train_loss": -6.062437057495117, "global_step": 69399, "epoch": 1652} {"train_loss": -5.912509441375732, "global_step": 69400, "epoch": 1652} {"train_loss": -6.044058322906494, "global_step": 69401, "epoch": 1652} {"train_loss": -6.077453136444092, "global_step": 69402, "epoch": 1652} {"train_loss": -5.949936866760254, "global_step": 69403, "epoch": 1652} {"train_loss": -6.1782965660095215, "global_step": 69404, "epoch": 1652} {"train_loss": -5.99947452545166, "global_step": 69405, "epoch": 1652} {"train_loss": -5.941894054412842, "global_step": 69406, "epoch": 1652} {"train_loss": -5.962728977203369, "global_step": 69407, "epoch": 1652} {"train_loss": -6.08418083190918, "global_step": 69408, "epoch": 1652} {"train_loss": -6.043130874633789, "global_step": 69409, "epoch": 1652} {"train_loss": -5.962026596069336, "global_step": 69410, "epoch": 1652} {"train_loss": -6.0125603675842285, "global_step": 69411, "epoch": 1652} {"train_loss": -6.07884407043457, "global_step": 69412, "epoch": 1652} {"train_loss": -6.049707889556885, "global_step": 69413, "epoch": 1652} {"train_loss": -5.9720869064331055, "global_step": 69414, "epoch": 1652} {"train_loss": -6.2005295753479, "global_step": 69415, "epoch": 1652} {"train_loss": -5.9304375648498535, "global_step": 69416, "epoch": 1652} {"train_loss": -5.985560894012451, "global_step": 69417, "epoch": 1652} {"train_loss": -5.901271820068359, "global_step": 69418, "epoch": 1652} {"train_loss": -5.935840606689453, "global_step": 69419, "epoch": 1652} {"train_loss": -6.067303657531738, "global_step": 69420, "epoch": 1652} {"train_loss": -6.024872779846191, "global_step": 69421, "epoch": 1652} {"train_loss": -5.9498443603515625, "global_step": 69422, "epoch": 1652} {"train_loss": -5.939855575561523, "global_step": 69423, "epoch": 1652} {"train_loss": -5.886361122131348, "global_step": 69424, "epoch": 1652} {"train_loss": -5.994287479491461, "global_step": 69425, "epoch": 1652, "val_loss": 67480.0625} {"train_loss": -5.9593281745910645, "global_step": 69426, "epoch": 1653} {"train_loss": -5.98581600189209, "global_step": 69427, "epoch": 1653} {"train_loss": -5.932005405426025, "global_step": 69428, "epoch": 1653} {"train_loss": -5.880185604095459, "global_step": 69429, "epoch": 1653} {"train_loss": -5.981703758239746, "global_step": 69430, "epoch": 1653} {"train_loss": -6.03483772277832, "global_step": 69431, "epoch": 1653} {"train_loss": -5.974106788635254, "global_step": 69432, "epoch": 1653} {"train_loss": -5.898735046386719, "global_step": 69433, "epoch": 1653} {"train_loss": -5.934286117553711, "global_step": 69434, "epoch": 1653} {"train_loss": -6.016815185546875, "global_step": 69435, "epoch": 1653} {"train_loss": -5.9253997802734375, "global_step": 69436, "epoch": 1653} {"train_loss": -6.067243576049805, "global_step": 69437, "epoch": 1653} {"train_loss": -5.971306800842285, "global_step": 69438, "epoch": 1653} {"train_loss": -5.899757385253906, "global_step": 69439, "epoch": 1653} {"train_loss": -5.991671085357666, "global_step": 69440, "epoch": 1653} {"train_loss": -6.105093955993652, "global_step": 69441, "epoch": 1653} {"train_loss": -5.869345188140869, "global_step": 69442, "epoch": 1653} {"train_loss": -6.002505302429199, "global_step": 69443, "epoch": 1653} {"train_loss": -6.099996566772461, "global_step": 69444, "epoch": 1653} {"train_loss": -5.904635429382324, "global_step": 69445, "epoch": 1653} {"train_loss": -5.900283336639404, "global_step": 69446, "epoch": 1653} {"train_loss": -5.882016181945801, "global_step": 69447, "epoch": 1653} {"train_loss": -5.894650459289551, "global_step": 69448, "epoch": 1653} {"train_loss": -5.880464553833008, "global_step": 69449, "epoch": 1653} {"train_loss": -5.99652624130249, "global_step": 69450, "epoch": 1653} {"train_loss": -5.879037857055664, "global_step": 69451, "epoch": 1653} {"train_loss": -5.95742130279541, "global_step": 69452, "epoch": 1653} {"train_loss": -5.963314056396484, "global_step": 69453, "epoch": 1653} {"train_loss": -5.985448360443115, "global_step": 69454, "epoch": 1653} {"train_loss": -5.978302955627441, "global_step": 69455, "epoch": 1653} {"train_loss": -5.930050849914551, "global_step": 69456, "epoch": 1653} {"train_loss": -6.007119178771973, "global_step": 69457, "epoch": 1653} {"train_loss": -6.076329231262207, "global_step": 69458, "epoch": 1653} {"train_loss": -5.960049152374268, "global_step": 69459, "epoch": 1653} {"train_loss": -6.0328216552734375, "global_step": 69460, "epoch": 1653} {"train_loss": -6.113982200622559, "global_step": 69461, "epoch": 1653} {"train_loss": -5.989301681518555, "global_step": 69462, "epoch": 1653} {"train_loss": -5.932699203491211, "global_step": 69463, "epoch": 1653} {"train_loss": -6.024387359619141, "global_step": 69464, "epoch": 1653} {"train_loss": -5.862361907958984, "global_step": 69465, "epoch": 1653} {"train_loss": -6.030817985534668, "global_step": 69466, "epoch": 1653} {"train_loss": -5.970353943961007, "global_step": 69467, "epoch": 1653, "val_loss": 67166.0625} {"train_loss": -5.966014385223389, "global_step": 69468, "epoch": 1654} {"train_loss": -5.955649375915527, "global_step": 69469, "epoch": 1654} {"train_loss": -5.977750778198242, "global_step": 69470, "epoch": 1654} {"train_loss": -6.052356243133545, "global_step": 69471, "epoch": 1654} {"train_loss": -5.920377731323242, "global_step": 69472, "epoch": 1654} {"train_loss": -6.037957668304443, "global_step": 69473, "epoch": 1654} {"train_loss": -5.8654279708862305, "global_step": 69474, "epoch": 1654} {"train_loss": -5.991547584533691, "global_step": 69475, "epoch": 1654} {"train_loss": -6.043339729309082, "global_step": 69476, "epoch": 1654} {"train_loss": -6.075109481811523, "global_step": 69477, "epoch": 1654} {"train_loss": -5.953629493713379, "global_step": 69478, "epoch": 1654} {"train_loss": -6.145791053771973, "global_step": 69479, "epoch": 1654} {"train_loss": -6.004291534423828, "global_step": 69480, "epoch": 1654} {"train_loss": -6.059500217437744, "global_step": 69481, "epoch": 1654} {"train_loss": -6.034858226776123, "global_step": 69482, "epoch": 1654} {"train_loss": -6.104925155639648, "global_step": 69483, "epoch": 1654} {"train_loss": -5.912662029266357, "global_step": 69484, "epoch": 1654} {"train_loss": -6.014322280883789, "global_step": 69485, "epoch": 1654} {"train_loss": -5.958638668060303, "global_step": 69486, "epoch": 1654} {"train_loss": -6.080201148986816, "global_step": 69487, "epoch": 1654} {"train_loss": -5.957026481628418, "global_step": 69488, "epoch": 1654} {"train_loss": -5.901305675506592, "global_step": 69489, "epoch": 1654} {"train_loss": -6.052346229553223, "global_step": 69490, "epoch": 1654} {"train_loss": -5.920801162719727, "global_step": 69491, "epoch": 1654} {"train_loss": -5.961941242218018, "global_step": 69492, "epoch": 1654} {"train_loss": -5.990412712097168, "global_step": 69493, "epoch": 1654} {"train_loss": -6.064212322235107, "global_step": 69494, "epoch": 1654} {"train_loss": -5.924081802368164, "global_step": 69495, "epoch": 1654} {"train_loss": -6.057762145996094, "global_step": 69496, "epoch": 1654} {"train_loss": -6.018754959106445, "global_step": 69497, "epoch": 1654} {"train_loss": -6.083261013031006, "global_step": 69498, "epoch": 1654} {"train_loss": -5.989465236663818, "global_step": 69499, "epoch": 1654} {"train_loss": -6.036383628845215, "global_step": 69500, "epoch": 1654} {"train_loss": -5.9971723556518555, "global_step": 69501, "epoch": 1654} {"train_loss": -5.9580583572387695, "global_step": 69502, "epoch": 1654} {"train_loss": -5.941385746002197, "global_step": 69503, "epoch": 1654} {"train_loss": -6.1244611740112305, "global_step": 69504, "epoch": 1654} {"train_loss": -6.014259338378906, "global_step": 69505, "epoch": 1654} {"train_loss": -6.1543450355529785, "global_step": 69506, "epoch": 1654} {"train_loss": -6.012520790100098, "global_step": 69507, "epoch": 1654} {"train_loss": -6.090263366699219, "global_step": 69508, "epoch": 1654} {"train_loss": -6.0106836160024, "global_step": 69509, "epoch": 1654, "val_loss": 67272.703125} {"train_loss": -6.05898904800415, "global_step": 69510, "epoch": 1655} {"train_loss": -6.034512996673584, "global_step": 69511, "epoch": 1655} {"train_loss": -6.006805419921875, "global_step": 69512, "epoch": 1655} {"train_loss": -6.034719944000244, "global_step": 69513, "epoch": 1655} {"train_loss": -6.008057594299316, "global_step": 69514, "epoch": 1655} {"train_loss": -5.971005439758301, "global_step": 69515, "epoch": 1655} {"train_loss": -6.022699356079102, "global_step": 69516, "epoch": 1655} {"train_loss": -6.035908222198486, "global_step": 69517, "epoch": 1655} {"train_loss": -5.833765983581543, "global_step": 69518, "epoch": 1655} {"train_loss": -6.085882186889648, "global_step": 69519, "epoch": 1655} {"train_loss": -5.947714805603027, "global_step": 69520, "epoch": 1655} {"train_loss": -5.894681453704834, "global_step": 69521, "epoch": 1655} {"train_loss": -5.993547439575195, "global_step": 69522, "epoch": 1655} {"train_loss": -5.98158073425293, "global_step": 69523, "epoch": 1655} {"train_loss": -5.943056583404541, "global_step": 69524, "epoch": 1655} {"train_loss": -5.9337239265441895, "global_step": 69525, "epoch": 1655} {"train_loss": -5.913712024688721, "global_step": 69526, "epoch": 1655} {"train_loss": -6.005990982055664, "global_step": 69527, "epoch": 1655} {"train_loss": -6.131196975708008, "global_step": 69528, "epoch": 1655} {"train_loss": -5.925795555114746, "global_step": 69529, "epoch": 1655} {"train_loss": -5.977115631103516, "global_step": 69530, "epoch": 1655} {"train_loss": -5.936060905456543, "global_step": 69531, "epoch": 1655} {"train_loss": -5.99046516418457, "global_step": 69532, "epoch": 1655} {"train_loss": -6.075251579284668, "global_step": 69533, "epoch": 1655} {"train_loss": -6.010374546051025, "global_step": 69534, "epoch": 1655} {"train_loss": -6.040641784667969, "global_step": 69535, "epoch": 1655} {"train_loss": -5.852057456970215, "global_step": 69536, "epoch": 1655} {"train_loss": -6.112922191619873, "global_step": 69537, "epoch": 1655} {"train_loss": -5.982972145080566, "global_step": 69538, "epoch": 1655} {"train_loss": -5.93628454208374, "global_step": 69539, "epoch": 1655} {"train_loss": -6.047923564910889, "global_step": 69540, "epoch": 1655} {"train_loss": -6.145965576171875, "global_step": 69541, "epoch": 1655} {"train_loss": -6.026610851287842, "global_step": 69542, "epoch": 1655} {"train_loss": -5.980769157409668, "global_step": 69543, "epoch": 1655} {"train_loss": -5.94907808303833, "global_step": 69544, "epoch": 1655} {"train_loss": -6.069640636444092, "global_step": 69545, "epoch": 1655} {"train_loss": -5.8731184005737305, "global_step": 69546, "epoch": 1655} {"train_loss": -5.995615482330322, "global_step": 69547, "epoch": 1655} {"train_loss": -6.008026599884033, "global_step": 69548, "epoch": 1655} {"train_loss": -6.015830039978027, "global_step": 69549, "epoch": 1655} {"train_loss": -6.046759605407715, "global_step": 69550, "epoch": 1655} {"train_loss": -5.994076229277111, "global_step": 69551, "epoch": 1655, "val_loss": 67485.1015625} {"train_loss": -6.1234283447265625, "global_step": 69552, "epoch": 1656} {"train_loss": -6.0141191482543945, "global_step": 69553, "epoch": 1656} {"train_loss": -6.00380802154541, "global_step": 69554, "epoch": 1656} {"train_loss": -5.957283020019531, "global_step": 69555, "epoch": 1656} {"train_loss": -5.834216117858887, "global_step": 69556, "epoch": 1656} {"train_loss": -5.985403060913086, "global_step": 69557, "epoch": 1656} {"train_loss": -5.911917686462402, "global_step": 69558, "epoch": 1656} {"train_loss": -5.940570831298828, "global_step": 69559, "epoch": 1656} {"train_loss": -6.10434627532959, "global_step": 69560, "epoch": 1656} {"train_loss": -6.067023277282715, "global_step": 69561, "epoch": 1656} {"train_loss": -6.005767345428467, "global_step": 69562, "epoch": 1656} {"train_loss": -6.036716938018799, "global_step": 69563, "epoch": 1656} {"train_loss": -5.990161895751953, "global_step": 69564, "epoch": 1656} {"train_loss": -6.106827735900879, "global_step": 69565, "epoch": 1656} {"train_loss": -6.0457563400268555, "global_step": 69566, "epoch": 1656} {"train_loss": -5.924506187438965, "global_step": 69567, "epoch": 1656} {"train_loss": -5.936634063720703, "global_step": 69568, "epoch": 1656} {"train_loss": -6.011475563049316, "global_step": 69569, "epoch": 1656} {"train_loss": -5.998772621154785, "global_step": 69570, "epoch": 1656} {"train_loss": -6.065237998962402, "global_step": 69571, "epoch": 1656} {"train_loss": -6.027388572692871, "global_step": 69572, "epoch": 1656} {"train_loss": -5.948001861572266, "global_step": 69573, "epoch": 1656} {"train_loss": -6.018415927886963, "global_step": 69574, "epoch": 1656} {"train_loss": -6.020442962646484, "global_step": 69575, "epoch": 1656} {"train_loss": -5.8930158615112305, "global_step": 69576, "epoch": 1656} {"train_loss": -5.888427734375, "global_step": 69577, "epoch": 1656} {"train_loss": -6.00496768951416, "global_step": 69578, "epoch": 1656} {"train_loss": -5.951062202453613, "global_step": 69579, "epoch": 1656} {"train_loss": -6.048150539398193, "global_step": 69580, "epoch": 1656} {"train_loss": -5.989070415496826, "global_step": 69581, "epoch": 1656} {"train_loss": -6.009307861328125, "global_step": 69582, "epoch": 1656} {"train_loss": -6.000767707824707, "global_step": 69583, "epoch": 1656} {"train_loss": -5.966775894165039, "global_step": 69584, "epoch": 1656} {"train_loss": -6.04602575302124, "global_step": 69585, "epoch": 1656} {"train_loss": -5.952225685119629, "global_step": 69586, "epoch": 1656} {"train_loss": -5.929628372192383, "global_step": 69587, "epoch": 1656} {"train_loss": -6.003056526184082, "global_step": 69588, "epoch": 1656} {"train_loss": -6.03837251663208, "global_step": 69589, "epoch": 1656} {"train_loss": -5.942084312438965, "global_step": 69590, "epoch": 1656} {"train_loss": -6.153954029083252, "global_step": 69591, "epoch": 1656} {"train_loss": -6.035333633422852, "global_step": 69592, "epoch": 1656} {"train_loss": -6.000615914662679, "global_step": 69593, "epoch": 1656, "val_loss": 67356.4375} {"train_loss": -6.011665344238281, "global_step": 69594, "epoch": 1657} {"train_loss": -6.048592567443848, "global_step": 69595, "epoch": 1657} {"train_loss": -6.00895881652832, "global_step": 69596, "epoch": 1657} {"train_loss": -5.959210395812988, "global_step": 69597, "epoch": 1657} {"train_loss": -5.8933515548706055, "global_step": 69598, "epoch": 1657} {"train_loss": -6.166356086730957, "global_step": 69599, "epoch": 1657} {"train_loss": -6.018636226654053, "global_step": 69600, "epoch": 1657} {"train_loss": -5.978244781494141, "global_step": 69601, "epoch": 1657} {"train_loss": -6.001884460449219, "global_step": 69602, "epoch": 1657} {"train_loss": -6.027260780334473, "global_step": 69603, "epoch": 1657} {"train_loss": -6.054791450500488, "global_step": 69604, "epoch": 1657} {"train_loss": -5.943582534790039, "global_step": 69605, "epoch": 1657} {"train_loss": -6.083919525146484, "global_step": 69606, "epoch": 1657} {"train_loss": -6.059174537658691, "global_step": 69607, "epoch": 1657} {"train_loss": -5.895482063293457, "global_step": 69608, "epoch": 1657} {"train_loss": -5.982583045959473, "global_step": 69609, "epoch": 1657} {"train_loss": -6.028688430786133, "global_step": 69610, "epoch": 1657} {"train_loss": -5.963146209716797, "global_step": 69611, "epoch": 1657} {"train_loss": -6.036996841430664, "global_step": 69612, "epoch": 1657} {"train_loss": -6.0367350578308105, "global_step": 69613, "epoch": 1657} {"train_loss": -5.908967018127441, "global_step": 69614, "epoch": 1657} {"train_loss": -6.113503456115723, "global_step": 69615, "epoch": 1657} {"train_loss": -5.924879550933838, "global_step": 69616, "epoch": 1657} {"train_loss": -5.983292579650879, "global_step": 69617, "epoch": 1657} {"train_loss": -5.807933807373047, "global_step": 69618, "epoch": 1657} {"train_loss": -5.986865043640137, "global_step": 69619, "epoch": 1657} {"train_loss": -6.056061744689941, "global_step": 69620, "epoch": 1657} {"train_loss": -5.923255443572998, "global_step": 69621, "epoch": 1657} {"train_loss": -6.154797554016113, "global_step": 69622, "epoch": 1657} {"train_loss": -5.969305038452148, "global_step": 69623, "epoch": 1657} {"train_loss": -6.045324325561523, "global_step": 69624, "epoch": 1657} {"train_loss": -6.165440082550049, "global_step": 69625, "epoch": 1657} {"train_loss": -5.94219970703125, "global_step": 69626, "epoch": 1657} {"train_loss": -5.920559883117676, "global_step": 69627, "epoch": 1657} {"train_loss": -5.966789722442627, "global_step": 69628, "epoch": 1657} {"train_loss": -5.925122261047363, "global_step": 69629, "epoch": 1657} {"train_loss": -6.092469215393066, "global_step": 69630, "epoch": 1657} {"train_loss": -5.983888626098633, "global_step": 69631, "epoch": 1657} {"train_loss": -5.97172737121582, "global_step": 69632, "epoch": 1657} {"train_loss": -6.101452350616455, "global_step": 69633, "epoch": 1657} {"train_loss": -5.962418556213379, "global_step": 69634, "epoch": 1657} {"train_loss": -6.002676975159418, "global_step": 69635, "epoch": 1657, "val_loss": 67505.5859375} {"train_loss": -6.021739482879639, "global_step": 69636, "epoch": 1658} {"train_loss": -5.9566569328308105, "global_step": 69637, "epoch": 1658} {"train_loss": -5.941946506500244, "global_step": 69638, "epoch": 1658} {"train_loss": -5.8829145431518555, "global_step": 69639, "epoch": 1658} {"train_loss": -6.000288486480713, "global_step": 69640, "epoch": 1658} {"train_loss": -5.979058265686035, "global_step": 69641, "epoch": 1658} {"train_loss": -6.015695571899414, "global_step": 69642, "epoch": 1658} {"train_loss": -5.998408317565918, "global_step": 69643, "epoch": 1658} {"train_loss": -5.981043815612793, "global_step": 69644, "epoch": 1658} {"train_loss": -6.0717034339904785, "global_step": 69645, "epoch": 1658} {"train_loss": -6.092951774597168, "global_step": 69646, "epoch": 1658} {"train_loss": -5.923717021942139, "global_step": 69647, "epoch": 1658} {"train_loss": -6.135811805725098, "global_step": 69648, "epoch": 1658} {"train_loss": -6.115571975708008, "global_step": 69649, "epoch": 1658} {"train_loss": -6.1236090660095215, "global_step": 69650, "epoch": 1658} {"train_loss": -6.013615131378174, "global_step": 69651, "epoch": 1658} {"train_loss": -6.0440168380737305, "global_step": 69652, "epoch": 1658} {"train_loss": -6.041334629058838, "global_step": 69653, "epoch": 1658} {"train_loss": -6.066479206085205, "global_step": 69654, "epoch": 1658} {"train_loss": -6.135883331298828, "global_step": 69655, "epoch": 1658} {"train_loss": -6.044779300689697, "global_step": 69656, "epoch": 1658} {"train_loss": -5.809240341186523, "global_step": 69657, "epoch": 1658} {"train_loss": -6.004887580871582, "global_step": 69658, "epoch": 1658} {"train_loss": -6.042858123779297, "global_step": 69659, "epoch": 1658} {"train_loss": -6.023124694824219, "global_step": 69660, "epoch": 1658} {"train_loss": -6.000481605529785, "global_step": 69661, "epoch": 1658} {"train_loss": -5.956242084503174, "global_step": 69662, "epoch": 1658} {"train_loss": -6.017701625823975, "global_step": 69663, "epoch": 1658} {"train_loss": -5.936811447143555, "global_step": 69664, "epoch": 1658} {"train_loss": -5.958702087402344, "global_step": 69665, "epoch": 1658} {"train_loss": -5.926324844360352, "global_step": 69666, "epoch": 1658} {"train_loss": -6.14832878112793, "global_step": 69667, "epoch": 1658} {"train_loss": -5.952742576599121, "global_step": 69668, "epoch": 1658} {"train_loss": -5.958200454711914, "global_step": 69669, "epoch": 1658} {"train_loss": -5.93301248550415, "global_step": 69670, "epoch": 1658} {"train_loss": -6.074949741363525, "global_step": 69671, "epoch": 1658} {"train_loss": -5.878653526306152, "global_step": 69672, "epoch": 1658} {"train_loss": -6.016136169433594, "global_step": 69673, "epoch": 1658} {"train_loss": -5.970626354217529, "global_step": 69674, "epoch": 1658} {"train_loss": -6.059106349945068, "global_step": 69675, "epoch": 1658} {"train_loss": -5.917291641235352, "global_step": 69676, "epoch": 1658} {"train_loss": -6.001702967144194, "global_step": 69677, "epoch": 1658, "val_loss": 67438.8828125} {"train_loss": -5.987691879272461, "global_step": 69678, "epoch": 1659} {"train_loss": -5.9975385665893555, "global_step": 69679, "epoch": 1659} {"train_loss": -6.010309219360352, "global_step": 69680, "epoch": 1659} {"train_loss": -5.892342567443848, "global_step": 69681, "epoch": 1659} {"train_loss": -6.058290004730225, "global_step": 69682, "epoch": 1659} {"train_loss": -6.013033866882324, "global_step": 69683, "epoch": 1659} {"train_loss": -5.936326026916504, "global_step": 69684, "epoch": 1659} {"train_loss": -5.948091983795166, "global_step": 69685, "epoch": 1659} {"train_loss": -6.013211727142334, "global_step": 69686, "epoch": 1659} {"train_loss": -6.089898109436035, "global_step": 69687, "epoch": 1659} {"train_loss": -5.996832370758057, "global_step": 69688, "epoch": 1659} {"train_loss": -5.998579978942871, "global_step": 69689, "epoch": 1659} {"train_loss": -5.942224502563477, "global_step": 69690, "epoch": 1659} {"train_loss": -6.029975891113281, "global_step": 69691, "epoch": 1659} {"train_loss": -6.106390476226807, "global_step": 69692, "epoch": 1659} {"train_loss": -6.013688087463379, "global_step": 69693, "epoch": 1659} {"train_loss": -6.105299472808838, "global_step": 69694, "epoch": 1659} {"train_loss": -6.147665977478027, "global_step": 69695, "epoch": 1659} {"train_loss": -5.981712818145752, "global_step": 69696, "epoch": 1659} {"train_loss": -5.977869033813477, "global_step": 69697, "epoch": 1659} {"train_loss": -6.084163188934326, "global_step": 69698, "epoch": 1659} {"train_loss": -6.1768598556518555, "global_step": 69699, "epoch": 1659} {"train_loss": -5.94445276260376, "global_step": 69700, "epoch": 1659} {"train_loss": -5.9162211418151855, "global_step": 69701, "epoch": 1659} {"train_loss": -6.159507751464844, "global_step": 69702, "epoch": 1659} {"train_loss": -6.063782691955566, "global_step": 69703, "epoch": 1659} {"train_loss": -6.010279655456543, "global_step": 69704, "epoch": 1659} {"train_loss": -6.070320129394531, "global_step": 69705, "epoch": 1659} {"train_loss": -6.028937339782715, "global_step": 69706, "epoch": 1659} {"train_loss": -6.130128860473633, "global_step": 69707, "epoch": 1659} {"train_loss": -6.037446975708008, "global_step": 69708, "epoch": 1659} {"train_loss": -6.063205718994141, "global_step": 69709, "epoch": 1659} {"train_loss": -6.108645915985107, "global_step": 69710, "epoch": 1659} {"train_loss": -6.085964202880859, "global_step": 69711, "epoch": 1659} {"train_loss": -6.111164093017578, "global_step": 69712, "epoch": 1659} {"train_loss": -6.052933692932129, "global_step": 69713, "epoch": 1659} {"train_loss": -6.066986083984375, "global_step": 69714, "epoch": 1659} {"train_loss": -6.111663818359375, "global_step": 69715, "epoch": 1659} {"train_loss": -5.9105143547058105, "global_step": 69716, "epoch": 1659} {"train_loss": -6.030192852020264, "global_step": 69717, "epoch": 1659} {"train_loss": -5.8972697257995605, "global_step": 69718, "epoch": 1659} {"train_loss": -6.03492412113008, "global_step": 69719, "epoch": 1659, "val_loss": 67203.3046875} {"train_loss": -6.061200141906738, "global_step": 69720, "epoch": 1660} {"train_loss": -6.027684211730957, "global_step": 69721, "epoch": 1660} {"train_loss": -6.030903339385986, "global_step": 69722, "epoch": 1660} {"train_loss": -5.93672513961792, "global_step": 69723, "epoch": 1660} {"train_loss": -6.003605842590332, "global_step": 69724, "epoch": 1660} {"train_loss": -6.104948997497559, "global_step": 69725, "epoch": 1660} {"train_loss": -5.951202869415283, "global_step": 69726, "epoch": 1660} {"train_loss": -6.032573699951172, "global_step": 69727, "epoch": 1660} {"train_loss": -6.064850330352783, "global_step": 69728, "epoch": 1660} {"train_loss": -5.983058929443359, "global_step": 69729, "epoch": 1660} {"train_loss": -5.95760440826416, "global_step": 69730, "epoch": 1660} {"train_loss": -5.928798198699951, "global_step": 69731, "epoch": 1660} {"train_loss": -5.989867687225342, "global_step": 69732, "epoch": 1660} {"train_loss": -6.026389122009277, "global_step": 69733, "epoch": 1660} {"train_loss": -6.125237464904785, "global_step": 69734, "epoch": 1660} {"train_loss": -6.031868934631348, "global_step": 69735, "epoch": 1660} {"train_loss": -5.96550989151001, "global_step": 69736, "epoch": 1660} {"train_loss": -6.046171188354492, "global_step": 69737, "epoch": 1660} {"train_loss": -5.958008766174316, "global_step": 69738, "epoch": 1660} {"train_loss": -6.0321197509765625, "global_step": 69739, "epoch": 1660} {"train_loss": -6.115049362182617, "global_step": 69740, "epoch": 1660} {"train_loss": -6.024151802062988, "global_step": 69741, "epoch": 1660} {"train_loss": -6.017806053161621, "global_step": 69742, "epoch": 1660} {"train_loss": -6.035708427429199, "global_step": 69743, "epoch": 1660} {"train_loss": -5.999396324157715, "global_step": 69744, "epoch": 1660} {"train_loss": -5.909336090087891, "global_step": 69745, "epoch": 1660} {"train_loss": -6.020910739898682, "global_step": 69746, "epoch": 1660} {"train_loss": -5.816467761993408, "global_step": 69747, "epoch": 1660} {"train_loss": -5.889815330505371, "global_step": 69748, "epoch": 1660} {"train_loss": -6.052586555480957, "global_step": 69749, "epoch": 1660} {"train_loss": -5.917506217956543, "global_step": 69750, "epoch": 1660} {"train_loss": -5.939203262329102, "global_step": 69751, "epoch": 1660} {"train_loss": -6.043248653411865, "global_step": 69752, "epoch": 1660} {"train_loss": -5.984678745269775, "global_step": 69753, "epoch": 1660} {"train_loss": -6.038350582122803, "global_step": 69754, "epoch": 1660} {"train_loss": -5.9572529792785645, "global_step": 69755, "epoch": 1660} {"train_loss": -6.031121253967285, "global_step": 69756, "epoch": 1660} {"train_loss": -5.9661865234375, "global_step": 69757, "epoch": 1660} {"train_loss": -5.977386474609375, "global_step": 69758, "epoch": 1660} {"train_loss": -6.024534225463867, "global_step": 69759, "epoch": 1660} {"train_loss": -5.889004230499268, "global_step": 69760, "epoch": 1660} {"train_loss": -5.996271803265526, "global_step": 69761, "epoch": 1660, "val_loss": 67332.4921875} {"train_loss": -5.99775505065918, "global_step": 69762, "epoch": 1661} {"train_loss": -6.08388614654541, "global_step": 69763, "epoch": 1661} {"train_loss": -5.952067852020264, "global_step": 69764, "epoch": 1661} {"train_loss": -5.99845027923584, "global_step": 69765, "epoch": 1661} {"train_loss": -6.026930809020996, "global_step": 69766, "epoch": 1661} {"train_loss": -6.127092361450195, "global_step": 69767, "epoch": 1661} {"train_loss": -6.013670444488525, "global_step": 69768, "epoch": 1661} {"train_loss": -5.931516170501709, "global_step": 69769, "epoch": 1661} {"train_loss": -6.0061564445495605, "global_step": 69770, "epoch": 1661} {"train_loss": -6.003080368041992, "global_step": 69771, "epoch": 1661} {"train_loss": -5.965206146240234, "global_step": 69772, "epoch": 1661} {"train_loss": -6.040853977203369, "global_step": 69773, "epoch": 1661} {"train_loss": -5.978102207183838, "global_step": 69774, "epoch": 1661} {"train_loss": -6.018505096435547, "global_step": 69775, "epoch": 1661} {"train_loss": -5.910150527954102, "global_step": 69776, "epoch": 1661} {"train_loss": -5.940591335296631, "global_step": 69777, "epoch": 1661} {"train_loss": -6.061939239501953, "global_step": 69778, "epoch": 1661} {"train_loss": -5.954388618469238, "global_step": 69779, "epoch": 1661} {"train_loss": -5.993780136108398, "global_step": 69780, "epoch": 1661} {"train_loss": -6.095217227935791, "global_step": 69781, "epoch": 1661} {"train_loss": -5.967355251312256, "global_step": 69782, "epoch": 1661} {"train_loss": -5.974471092224121, "global_step": 69783, "epoch": 1661} {"train_loss": -5.906000137329102, "global_step": 69784, "epoch": 1661} {"train_loss": -5.937878608703613, "global_step": 69785, "epoch": 1661} {"train_loss": -5.985317707061768, "global_step": 69786, "epoch": 1661} {"train_loss": -6.041767597198486, "global_step": 69787, "epoch": 1661} {"train_loss": -6.066528797149658, "global_step": 69788, "epoch": 1661} {"train_loss": -5.910738945007324, "global_step": 69789, "epoch": 1661} {"train_loss": -5.9259033203125, "global_step": 69790, "epoch": 1661} {"train_loss": -6.011507511138916, "global_step": 69791, "epoch": 1661} {"train_loss": -5.946993350982666, "global_step": 69792, "epoch": 1661} {"train_loss": -5.9624528884887695, "global_step": 69793, "epoch": 1661} {"train_loss": -6.01826810836792, "global_step": 69794, "epoch": 1661} {"train_loss": -5.96127462387085, "global_step": 69795, "epoch": 1661} {"train_loss": -5.8729143142700195, "global_step": 69796, "epoch": 1661} {"train_loss": -6.046726703643799, "global_step": 69797, "epoch": 1661} {"train_loss": -6.0637054443359375, "global_step": 69798, "epoch": 1661} {"train_loss": -6.016120910644531, "global_step": 69799, "epoch": 1661} {"train_loss": -6.125658988952637, "global_step": 69800, "epoch": 1661} {"train_loss": -6.037322044372559, "global_step": 69801, "epoch": 1661} {"train_loss": -5.971166610717773, "global_step": 69802, "epoch": 1661} {"train_loss": -5.994851021539597, "global_step": 69803, "epoch": 1661, "val_loss": 67131.5546875} {"train_loss": -5.923400402069092, "global_step": 69804, "epoch": 1662} {"train_loss": -5.963709831237793, "global_step": 69805, "epoch": 1662} {"train_loss": -6.010464668273926, "global_step": 69806, "epoch": 1662} {"train_loss": -6.058389663696289, "global_step": 69807, "epoch": 1662} {"train_loss": -5.909429550170898, "global_step": 69808, "epoch": 1662} {"train_loss": -5.960000991821289, "global_step": 69809, "epoch": 1662} {"train_loss": -6.08665657043457, "global_step": 69810, "epoch": 1662} {"train_loss": -6.028741836547852, "global_step": 69811, "epoch": 1662} {"train_loss": -5.998268127441406, "global_step": 69812, "epoch": 1662} {"train_loss": -6.069423198699951, "global_step": 69813, "epoch": 1662} {"train_loss": -6.106740951538086, "global_step": 69814, "epoch": 1662} {"train_loss": -5.984613418579102, "global_step": 69815, "epoch": 1662} {"train_loss": -5.934842109680176, "global_step": 69816, "epoch": 1662} {"train_loss": -6.036892414093018, "global_step": 69817, "epoch": 1662} {"train_loss": -5.910655498504639, "global_step": 69818, "epoch": 1662} {"train_loss": -6.057923793792725, "global_step": 69819, "epoch": 1662} {"train_loss": -5.9870285987854, "global_step": 69820, "epoch": 1662} {"train_loss": -5.896758079528809, "global_step": 69821, "epoch": 1662} {"train_loss": -6.041209697723389, "global_step": 69822, "epoch": 1662} {"train_loss": -6.0537214279174805, "global_step": 69823, "epoch": 1662} {"train_loss": -5.990878105163574, "global_step": 69824, "epoch": 1662} {"train_loss": -6.065905570983887, "global_step": 69825, "epoch": 1662} {"train_loss": -6.123029708862305, "global_step": 69826, "epoch": 1662} {"train_loss": -6.009622573852539, "global_step": 69827, "epoch": 1662} {"train_loss": -6.070074558258057, "global_step": 69828, "epoch": 1662} {"train_loss": -5.951199531555176, "global_step": 69829, "epoch": 1662} {"train_loss": -5.945656776428223, "global_step": 69830, "epoch": 1662} {"train_loss": -6.105567932128906, "global_step": 69831, "epoch": 1662} {"train_loss": -6.012510299682617, "global_step": 69832, "epoch": 1662} {"train_loss": -6.089021682739258, "global_step": 69833, "epoch": 1662} {"train_loss": -5.936341285705566, "global_step": 69834, "epoch": 1662} {"train_loss": -6.083095550537109, "global_step": 69835, "epoch": 1662} {"train_loss": -5.942352294921875, "global_step": 69836, "epoch": 1662} {"train_loss": -6.0550642013549805, "global_step": 69837, "epoch": 1662} {"train_loss": -6.134160995483398, "global_step": 69838, "epoch": 1662} {"train_loss": -5.96738338470459, "global_step": 69839, "epoch": 1662} {"train_loss": -6.021146774291992, "global_step": 69840, "epoch": 1662} {"train_loss": -5.933135032653809, "global_step": 69841, "epoch": 1662} {"train_loss": -5.984631538391113, "global_step": 69842, "epoch": 1662} {"train_loss": -6.033411026000977, "global_step": 69843, "epoch": 1662} {"train_loss": -6.069634437561035, "global_step": 69844, "epoch": 1662} {"train_loss": -6.015546333222162, "global_step": 69845, "epoch": 1662, "val_loss": 67336.453125} {"train_loss": -6.013934135437012, "global_step": 69846, "epoch": 1663} {"train_loss": -5.919251918792725, "global_step": 69847, "epoch": 1663} {"train_loss": -5.98499870300293, "global_step": 69848, "epoch": 1663} {"train_loss": -5.940542221069336, "global_step": 69849, "epoch": 1663} {"train_loss": -5.992735385894775, "global_step": 69850, "epoch": 1663} {"train_loss": -5.9489898681640625, "global_step": 69851, "epoch": 1663} {"train_loss": -6.002336025238037, "global_step": 69852, "epoch": 1663} {"train_loss": -5.9349894523620605, "global_step": 69853, "epoch": 1663} {"train_loss": -5.91623067855835, "global_step": 69854, "epoch": 1663} {"train_loss": -5.942903518676758, "global_step": 69855, "epoch": 1663} {"train_loss": -5.882995128631592, "global_step": 69856, "epoch": 1663} {"train_loss": -6.017706871032715, "global_step": 69857, "epoch": 1663} {"train_loss": -6.022882461547852, "global_step": 69858, "epoch": 1663} {"train_loss": -5.9140167236328125, "global_step": 69859, "epoch": 1663} {"train_loss": -5.912265777587891, "global_step": 69860, "epoch": 1663} {"train_loss": -5.981093883514404, "global_step": 69861, "epoch": 1663} {"train_loss": -5.96385383605957, "global_step": 69862, "epoch": 1663} {"train_loss": -5.976245403289795, "global_step": 69863, "epoch": 1663} {"train_loss": -6.0846099853515625, "global_step": 69864, "epoch": 1663} {"train_loss": -5.934438705444336, "global_step": 69865, "epoch": 1663} {"train_loss": -6.0761919021606445, "global_step": 69866, "epoch": 1663} {"train_loss": -6.0393900871276855, "global_step": 69867, "epoch": 1663} {"train_loss": -5.910023212432861, "global_step": 69868, "epoch": 1663} {"train_loss": -6.0583109855651855, "global_step": 69869, "epoch": 1663} {"train_loss": -5.9429779052734375, "global_step": 69870, "epoch": 1663} {"train_loss": -6.026837348937988, "global_step": 69871, "epoch": 1663} {"train_loss": -6.091892719268799, "global_step": 69872, "epoch": 1663} {"train_loss": -5.923965930938721, "global_step": 69873, "epoch": 1663} {"train_loss": -5.978776931762695, "global_step": 69874, "epoch": 1663} {"train_loss": -5.866795539855957, "global_step": 69875, "epoch": 1663} {"train_loss": -6.029562950134277, "global_step": 69876, "epoch": 1663} {"train_loss": -5.972602844238281, "global_step": 69877, "epoch": 1663} {"train_loss": -5.986688613891602, "global_step": 69878, "epoch": 1663} {"train_loss": -5.78724479675293, "global_step": 69879, "epoch": 1663} {"train_loss": -6.154541015625, "global_step": 69880, "epoch": 1663} {"train_loss": -5.934693336486816, "global_step": 69881, "epoch": 1663} {"train_loss": -6.018339157104492, "global_step": 69882, "epoch": 1663} {"train_loss": -6.081609725952148, "global_step": 69883, "epoch": 1663} {"train_loss": -6.046578407287598, "global_step": 69884, "epoch": 1663} {"train_loss": -6.104057312011719, "global_step": 69885, "epoch": 1663} {"train_loss": -6.034452438354492, "global_step": 69886, "epoch": 1663} {"train_loss": -5.984891278403146, "global_step": 69887, "epoch": 1663, "val_loss": 67243.1484375} {"train_loss": -5.891604423522949, "global_step": 69888, "epoch": 1664} {"train_loss": -6.053833484649658, "global_step": 69889, "epoch": 1664} {"train_loss": -6.070524215698242, "global_step": 69890, "epoch": 1664} {"train_loss": -6.008254051208496, "global_step": 69891, "epoch": 1664} {"train_loss": -5.854650020599365, "global_step": 69892, "epoch": 1664} {"train_loss": -6.056329727172852, "global_step": 69893, "epoch": 1664} {"train_loss": -6.10628604888916, "global_step": 69894, "epoch": 1664} {"train_loss": -6.058711051940918, "global_step": 69895, "epoch": 1664} {"train_loss": -6.004012107849121, "global_step": 69896, "epoch": 1664} {"train_loss": -6.04891300201416, "global_step": 69897, "epoch": 1664} {"train_loss": -6.029544830322266, "global_step": 69898, "epoch": 1664} {"train_loss": -5.911026954650879, "global_step": 69899, "epoch": 1664} {"train_loss": -6.061557292938232, "global_step": 69900, "epoch": 1664} {"train_loss": -5.955342769622803, "global_step": 69901, "epoch": 1664} {"train_loss": -5.939674377441406, "global_step": 69902, "epoch": 1664} {"train_loss": -6.0267558097839355, "global_step": 69903, "epoch": 1664} {"train_loss": -5.90183162689209, "global_step": 69904, "epoch": 1664} {"train_loss": -5.9451799392700195, "global_step": 69905, "epoch": 1664} {"train_loss": -5.82509708404541, "global_step": 69906, "epoch": 1664} {"train_loss": -6.1240081787109375, "global_step": 69907, "epoch": 1664} {"train_loss": -6.057649612426758, "global_step": 69908, "epoch": 1664} {"train_loss": -5.954076290130615, "global_step": 69909, "epoch": 1664} {"train_loss": -6.080719470977783, "global_step": 69910, "epoch": 1664} {"train_loss": -5.9425883293151855, "global_step": 69911, "epoch": 1664} {"train_loss": -5.87892484664917, "global_step": 69912, "epoch": 1664} {"train_loss": -5.952340602874756, "global_step": 69913, "epoch": 1664} {"train_loss": -6.175829887390137, "global_step": 69914, "epoch": 1664} {"train_loss": -6.028750419616699, "global_step": 69915, "epoch": 1664} {"train_loss": -6.113451957702637, "global_step": 69916, "epoch": 1664} {"train_loss": -5.904480457305908, "global_step": 69917, "epoch": 1664} {"train_loss": -6.040309906005859, "global_step": 69918, "epoch": 1664} {"train_loss": -5.9281463623046875, "global_step": 69919, "epoch": 1664} {"train_loss": -5.972957134246826, "global_step": 69920, "epoch": 1664} {"train_loss": -6.043850898742676, "global_step": 69921, "epoch": 1664} {"train_loss": -5.972810745239258, "global_step": 69922, "epoch": 1664} {"train_loss": -5.956574440002441, "global_step": 69923, "epoch": 1664} {"train_loss": -5.997148036956787, "global_step": 69924, "epoch": 1664} {"train_loss": -5.934106826782227, "global_step": 69925, "epoch": 1664} {"train_loss": -6.137094497680664, "global_step": 69926, "epoch": 1664} {"train_loss": -5.982421875, "global_step": 69927, "epoch": 1664} {"train_loss": -5.973644256591797, "global_step": 69928, "epoch": 1664} {"train_loss": -5.997051988329206, "global_step": 69929, "epoch": 1664, "val_loss": 67238.5625} {"train_loss": -5.990939140319824, "global_step": 69930, "epoch": 1665} {"train_loss": -5.961568832397461, "global_step": 69931, "epoch": 1665} {"train_loss": -5.902584075927734, "global_step": 69932, "epoch": 1665} {"train_loss": -5.958029270172119, "global_step": 69933, "epoch": 1665} {"train_loss": -6.018134117126465, "global_step": 69934, "epoch": 1665} {"train_loss": -6.079076766967773, "global_step": 69935, "epoch": 1665} {"train_loss": -5.974824905395508, "global_step": 69936, "epoch": 1665} {"train_loss": -5.892099857330322, "global_step": 69937, "epoch": 1665} {"train_loss": -6.01701545715332, "global_step": 69938, "epoch": 1665} {"train_loss": -5.876120090484619, "global_step": 69939, "epoch": 1665} {"train_loss": -6.03562068939209, "global_step": 69940, "epoch": 1665} {"train_loss": -6.024554252624512, "global_step": 69941, "epoch": 1665} {"train_loss": -6.028326988220215, "global_step": 69942, "epoch": 1665} {"train_loss": -6.064099311828613, "global_step": 69943, "epoch": 1665} {"train_loss": -5.98371696472168, "global_step": 69944, "epoch": 1665} {"train_loss": -6.08005428314209, "global_step": 69945, "epoch": 1665} {"train_loss": -6.112650394439697, "global_step": 69946, "epoch": 1665} {"train_loss": -5.917024612426758, "global_step": 69947, "epoch": 1665} {"train_loss": -5.921642303466797, "global_step": 69948, "epoch": 1665} {"train_loss": -6.0937066078186035, "global_step": 69949, "epoch": 1665} {"train_loss": -6.040020942687988, "global_step": 69950, "epoch": 1665} {"train_loss": -5.945974349975586, "global_step": 69951, "epoch": 1665} {"train_loss": -6.094723224639893, "global_step": 69952, "epoch": 1665} {"train_loss": -6.058576583862305, "global_step": 69953, "epoch": 1665} {"train_loss": -6.009136199951172, "global_step": 69954, "epoch": 1665} {"train_loss": -5.982436180114746, "global_step": 69955, "epoch": 1665} {"train_loss": -6.026080131530762, "global_step": 69956, "epoch": 1665} {"train_loss": -6.125303268432617, "global_step": 69957, "epoch": 1665} {"train_loss": -6.0313005447387695, "global_step": 69958, "epoch": 1665} {"train_loss": -6.021773338317871, "global_step": 69959, "epoch": 1665} {"train_loss": -5.953242301940918, "global_step": 69960, "epoch": 1665} {"train_loss": -5.957877159118652, "global_step": 69961, "epoch": 1665} {"train_loss": -5.989670753479004, "global_step": 69962, "epoch": 1665} {"train_loss": -6.019323348999023, "global_step": 69963, "epoch": 1665} {"train_loss": -5.9319987297058105, "global_step": 69964, "epoch": 1665} {"train_loss": -6.030472755432129, "global_step": 69965, "epoch": 1665} {"train_loss": -5.990399360656738, "global_step": 69966, "epoch": 1665} {"train_loss": -6.050682544708252, "global_step": 69967, "epoch": 1665} {"train_loss": -5.990990161895752, "global_step": 69968, "epoch": 1665} {"train_loss": -6.0785698890686035, "global_step": 69969, "epoch": 1665} {"train_loss": -6.044893264770508, "global_step": 69970, "epoch": 1665} {"train_loss": -6.009325402123587, "global_step": 69971, "epoch": 1665, "val_loss": 67177.0859375} {"train_loss": -6.04982852935791, "global_step": 69972, "epoch": 1666} {"train_loss": -6.146843910217285, "global_step": 69973, "epoch": 1666} {"train_loss": -5.87757682800293, "global_step": 69974, "epoch": 1666} {"train_loss": -5.995362281799316, "global_step": 69975, "epoch": 1666} {"train_loss": -5.943883419036865, "global_step": 69976, "epoch": 1666} {"train_loss": -6.070557594299316, "global_step": 69977, "epoch": 1666} {"train_loss": -6.014437675476074, "global_step": 69978, "epoch": 1666} {"train_loss": -5.983982086181641, "global_step": 69979, "epoch": 1666} {"train_loss": -6.063628673553467, "global_step": 69980, "epoch": 1666} {"train_loss": -5.926546096801758, "global_step": 69981, "epoch": 1666} {"train_loss": -5.911623001098633, "global_step": 69982, "epoch": 1666} {"train_loss": -6.14108943939209, "global_step": 69983, "epoch": 1666} {"train_loss": -6.037332534790039, "global_step": 69984, "epoch": 1666} {"train_loss": -5.978260040283203, "global_step": 69985, "epoch": 1666} {"train_loss": -6.051161289215088, "global_step": 69986, "epoch": 1666} {"train_loss": -5.827243804931641, "global_step": 69987, "epoch": 1666} {"train_loss": -5.940589427947998, "global_step": 69988, "epoch": 1666} {"train_loss": -5.8694963455200195, "global_step": 69989, "epoch": 1666} {"train_loss": -5.981806755065918, "global_step": 69990, "epoch": 1666} {"train_loss": -6.0387372970581055, "global_step": 69991, "epoch": 1666} {"train_loss": -6.0079240798950195, "global_step": 69992, "epoch": 1666} {"train_loss": -6.044284820556641, "global_step": 69993, "epoch": 1666} {"train_loss": -6.019766330718994, "global_step": 69994, "epoch": 1666} {"train_loss": -5.857998847961426, "global_step": 69995, "epoch": 1666} {"train_loss": -6.020696640014648, "global_step": 69996, "epoch": 1666} {"train_loss": -6.082182884216309, "global_step": 69997, "epoch": 1666} {"train_loss": -6.0044965744018555, "global_step": 69998, "epoch": 1666} {"train_loss": -5.946861267089844, "global_step": 69999, "epoch": 1666} {"train_loss": -6.073373317718506, "global_step": 70000, "epoch": 1666} {"train_loss": -6.037726402282715, "global_step": 70001, "epoch": 1666} {"train_loss": -5.935677528381348, "global_step": 70002, "epoch": 1666} {"train_loss": -5.935616493225098, "global_step": 70003, "epoch": 1666} {"train_loss": -5.930416107177734, "global_step": 70004, "epoch": 1666} {"train_loss": -5.904394149780273, "global_step": 70005, "epoch": 1666} {"train_loss": -5.921069622039795, "global_step": 70006, "epoch": 1666} {"train_loss": -6.096778869628906, "global_step": 70007, "epoch": 1666} {"train_loss": -6.082688331604004, "global_step": 70008, "epoch": 1666} {"train_loss": -5.9446563720703125, "global_step": 70009, "epoch": 1666} {"train_loss": -5.984274387359619, "global_step": 70010, "epoch": 1666} {"train_loss": -6.053724765777588, "global_step": 70011, "epoch": 1666} {"train_loss": -5.908799171447754, "global_step": 70012, "epoch": 1666} {"train_loss": -5.993943850199382, "global_step": 70013, "epoch": 1666, "val_loss": 67297.4609375} {"train_loss": -6.036730766296387, "global_step": 70014, "epoch": 1667} {"train_loss": -6.006676197052002, "global_step": 70015, "epoch": 1667} {"train_loss": -5.990755081176758, "global_step": 70016, "epoch": 1667} {"train_loss": -6.118306636810303, "global_step": 70017, "epoch": 1667} {"train_loss": -5.971049785614014, "global_step": 70018, "epoch": 1667} {"train_loss": -6.006213188171387, "global_step": 70019, "epoch": 1667} {"train_loss": -6.072560787200928, "global_step": 70020, "epoch": 1667} {"train_loss": -5.9889421463012695, "global_step": 70021, "epoch": 1667} {"train_loss": -5.9040846824646, "global_step": 70022, "epoch": 1667} {"train_loss": -5.977522850036621, "global_step": 70023, "epoch": 1667} {"train_loss": -5.969109535217285, "global_step": 70024, "epoch": 1667} {"train_loss": -5.904819965362549, "global_step": 70025, "epoch": 1667} {"train_loss": -6.159109115600586, "global_step": 70026, "epoch": 1667} {"train_loss": -5.995070934295654, "global_step": 70027, "epoch": 1667} {"train_loss": -6.030477523803711, "global_step": 70028, "epoch": 1667} {"train_loss": -6.00117826461792, "global_step": 70029, "epoch": 1667} {"train_loss": -6.0063323974609375, "global_step": 70030, "epoch": 1667} {"train_loss": -6.022313117980957, "global_step": 70031, "epoch": 1667} {"train_loss": -6.055954456329346, "global_step": 70032, "epoch": 1667} {"train_loss": -6.070755958557129, "global_step": 70033, "epoch": 1667} {"train_loss": -6.017070770263672, "global_step": 70034, "epoch": 1667} {"train_loss": -6.036357879638672, "global_step": 70035, "epoch": 1667} {"train_loss": -5.99008846282959, "global_step": 70036, "epoch": 1667} {"train_loss": -5.969854354858398, "global_step": 70037, "epoch": 1667} {"train_loss": -6.063117980957031, "global_step": 70038, "epoch": 1667} {"train_loss": -6.134868144989014, "global_step": 70039, "epoch": 1667} {"train_loss": -5.928215503692627, "global_step": 70040, "epoch": 1667} {"train_loss": -6.045025825500488, "global_step": 70041, "epoch": 1667} {"train_loss": -5.995291709899902, "global_step": 70042, "epoch": 1667} {"train_loss": -5.9757585525512695, "global_step": 70043, "epoch": 1667} {"train_loss": -6.056859970092773, "global_step": 70044, "epoch": 1667} {"train_loss": -6.016808986663818, "global_step": 70045, "epoch": 1667} {"train_loss": -6.034546852111816, "global_step": 70046, "epoch": 1667} {"train_loss": -5.951793670654297, "global_step": 70047, "epoch": 1667} {"train_loss": -5.999014854431152, "global_step": 70048, "epoch": 1667} {"train_loss": -5.8857903480529785, "global_step": 70049, "epoch": 1667} {"train_loss": -5.976545810699463, "global_step": 70050, "epoch": 1667} {"train_loss": -6.07942008972168, "global_step": 70051, "epoch": 1667} {"train_loss": -6.009215354919434, "global_step": 70052, "epoch": 1667} {"train_loss": -5.974428176879883, "global_step": 70053, "epoch": 1667} {"train_loss": -6.026562690734863, "global_step": 70054, "epoch": 1667} {"train_loss": -6.0093336673009965, "global_step": 70055, "epoch": 1667, "val_loss": 67408.8203125} {"train_loss": -6.078149795532227, "global_step": 70056, "epoch": 1668} {"train_loss": -6.008181095123291, "global_step": 70057, "epoch": 1668} {"train_loss": -5.996025085449219, "global_step": 70058, "epoch": 1668} {"train_loss": -5.937473297119141, "global_step": 70059, "epoch": 1668} {"train_loss": -6.153189659118652, "global_step": 70060, "epoch": 1668} {"train_loss": -5.976265907287598, "global_step": 70061, "epoch": 1668} {"train_loss": -6.056069374084473, "global_step": 70062, "epoch": 1668} {"train_loss": -5.992824554443359, "global_step": 70063, "epoch": 1668} {"train_loss": -5.917102813720703, "global_step": 70064, "epoch": 1668} {"train_loss": -5.9240899085998535, "global_step": 70065, "epoch": 1668} {"train_loss": -6.111976146697998, "global_step": 70066, "epoch": 1668} {"train_loss": -6.065987586975098, "global_step": 70067, "epoch": 1668} {"train_loss": -5.992944717407227, "global_step": 70068, "epoch": 1668} {"train_loss": -6.066808223724365, "global_step": 70069, "epoch": 1668} {"train_loss": -6.025625228881836, "global_step": 70070, "epoch": 1668} {"train_loss": -5.942108631134033, "global_step": 70071, "epoch": 1668} {"train_loss": -5.998371124267578, "global_step": 70072, "epoch": 1668} {"train_loss": -6.07774543762207, "global_step": 70073, "epoch": 1668} {"train_loss": -6.09006404876709, "global_step": 70074, "epoch": 1668} {"train_loss": -5.934704780578613, "global_step": 70075, "epoch": 1668} {"train_loss": -6.040110111236572, "global_step": 70076, "epoch": 1668} {"train_loss": -6.043184757232666, "global_step": 70077, "epoch": 1668} {"train_loss": -6.073290824890137, "global_step": 70078, "epoch": 1668} {"train_loss": -6.015376567840576, "global_step": 70079, "epoch": 1668} {"train_loss": -5.880397319793701, "global_step": 70080, "epoch": 1668} {"train_loss": -6.005733966827393, "global_step": 70081, "epoch": 1668} {"train_loss": -5.9555864334106445, "global_step": 70082, "epoch": 1668} {"train_loss": -6.057078838348389, "global_step": 70083, "epoch": 1668} {"train_loss": -6.051159858703613, "global_step": 70084, "epoch": 1668} {"train_loss": -6.002497673034668, "global_step": 70085, "epoch": 1668} {"train_loss": -5.9202561378479, "global_step": 70086, "epoch": 1668} {"train_loss": -6.054222106933594, "global_step": 70087, "epoch": 1668} {"train_loss": -6.060445785522461, "global_step": 70088, "epoch": 1668} {"train_loss": -5.960010528564453, "global_step": 70089, "epoch": 1668} {"train_loss": -6.082465648651123, "global_step": 70090, "epoch": 1668} {"train_loss": -6.179788589477539, "global_step": 70091, "epoch": 1668} {"train_loss": -5.991575241088867, "global_step": 70092, "epoch": 1668} {"train_loss": -6.04399299621582, "global_step": 70093, "epoch": 1668} {"train_loss": -6.0198564529418945, "global_step": 70094, "epoch": 1668} {"train_loss": -6.135983467102051, "global_step": 70095, "epoch": 1668} {"train_loss": -6.101931571960449, "global_step": 70096, "epoch": 1668} {"train_loss": -6.024109556561425, "global_step": 70097, "epoch": 1668, "val_loss": 67380.7109375} {"train_loss": -6.059093952178955, "global_step": 70098, "epoch": 1669} {"train_loss": -5.985381126403809, "global_step": 70099, "epoch": 1669} {"train_loss": -6.021404266357422, "global_step": 70100, "epoch": 1669} {"train_loss": -6.000974655151367, "global_step": 70101, "epoch": 1669} {"train_loss": -6.03548526763916, "global_step": 70102, "epoch": 1669} {"train_loss": -6.03202486038208, "global_step": 70103, "epoch": 1669} {"train_loss": -5.928153991699219, "global_step": 70104, "epoch": 1669} {"train_loss": -6.014499187469482, "global_step": 70105, "epoch": 1669} {"train_loss": -6.046413421630859, "global_step": 70106, "epoch": 1669} {"train_loss": -6.06942892074585, "global_step": 70107, "epoch": 1669} {"train_loss": -6.062401294708252, "global_step": 70108, "epoch": 1669} {"train_loss": -5.900529384613037, "global_step": 70109, "epoch": 1669} {"train_loss": -6.0103535652160645, "global_step": 70110, "epoch": 1669} {"train_loss": -6.084264755249023, "global_step": 70111, "epoch": 1669} {"train_loss": -5.925779819488525, "global_step": 70112, "epoch": 1669} {"train_loss": -6.095878601074219, "global_step": 70113, "epoch": 1669} {"train_loss": -5.979774475097656, "global_step": 70114, "epoch": 1669} {"train_loss": -5.993563652038574, "global_step": 70115, "epoch": 1669} {"train_loss": -5.895370006561279, "global_step": 70116, "epoch": 1669} {"train_loss": -5.953424453735352, "global_step": 70117, "epoch": 1669} {"train_loss": -5.854913711547852, "global_step": 70118, "epoch": 1669} {"train_loss": -6.01856803894043, "global_step": 70119, "epoch": 1669} {"train_loss": -5.886163711547852, "global_step": 70120, "epoch": 1669} {"train_loss": -5.963731288909912, "global_step": 70121, "epoch": 1669} {"train_loss": -5.922478199005127, "global_step": 70122, "epoch": 1669} {"train_loss": -5.987207889556885, "global_step": 70123, "epoch": 1669} {"train_loss": -5.919216632843018, "global_step": 70124, "epoch": 1669} {"train_loss": -6.030097007751465, "global_step": 70125, "epoch": 1669} {"train_loss": -6.0208892822265625, "global_step": 70126, "epoch": 1669} {"train_loss": -5.80105447769165, "global_step": 70127, "epoch": 1669} {"train_loss": -5.992864608764648, "global_step": 70128, "epoch": 1669} {"train_loss": -6.062154769897461, "global_step": 70129, "epoch": 1669} {"train_loss": -6.023963928222656, "global_step": 70130, "epoch": 1669} {"train_loss": -6.102721214294434, "global_step": 70131, "epoch": 1669} {"train_loss": -5.864285469055176, "global_step": 70132, "epoch": 1669} {"train_loss": -5.9990386962890625, "global_step": 70133, "epoch": 1669} {"train_loss": -6.0457048416137695, "global_step": 70134, "epoch": 1669} {"train_loss": -6.049763202667236, "global_step": 70135, "epoch": 1669} {"train_loss": -6.088376045227051, "global_step": 70136, "epoch": 1669} {"train_loss": -5.961573123931885, "global_step": 70137, "epoch": 1669} {"train_loss": -6.06766414642334, "global_step": 70138, "epoch": 1669} {"train_loss": -5.997940120242891, "global_step": 70139, "epoch": 1669, "val_loss": 67345.109375} {"train_loss": -6.058463096618652, "global_step": 70140, "epoch": 1670} {"train_loss": -5.968397617340088, "global_step": 70141, "epoch": 1670} {"train_loss": -6.0650739669799805, "global_step": 70142, "epoch": 1670} {"train_loss": -5.906778335571289, "global_step": 70143, "epoch": 1670} {"train_loss": -6.069870948791504, "global_step": 70144, "epoch": 1670} {"train_loss": -5.9538679122924805, "global_step": 70145, "epoch": 1670} {"train_loss": -5.991054058074951, "global_step": 70146, "epoch": 1670} {"train_loss": -6.00537109375, "global_step": 70147, "epoch": 1670} {"train_loss": -5.921472549438477, "global_step": 70148, "epoch": 1670} {"train_loss": -5.984975814819336, "global_step": 70149, "epoch": 1670} {"train_loss": -5.964821815490723, "global_step": 70150, "epoch": 1670} {"train_loss": -6.1985273361206055, "global_step": 70151, "epoch": 1670} {"train_loss": -6.070711135864258, "global_step": 70152, "epoch": 1670} {"train_loss": -6.027706623077393, "global_step": 70153, "epoch": 1670} {"train_loss": -6.1747283935546875, "global_step": 70154, "epoch": 1670} {"train_loss": -6.077271461486816, "global_step": 70155, "epoch": 1670} {"train_loss": -6.013825416564941, "global_step": 70156, "epoch": 1670} {"train_loss": -5.889415740966797, "global_step": 70157, "epoch": 1670} {"train_loss": -6.018790245056152, "global_step": 70158, "epoch": 1670} {"train_loss": -6.055276870727539, "global_step": 70159, "epoch": 1670} {"train_loss": -5.876872539520264, "global_step": 70160, "epoch": 1670} {"train_loss": -6.088050842285156, "global_step": 70161, "epoch": 1670} {"train_loss": -6.0671467781066895, "global_step": 70162, "epoch": 1670} {"train_loss": -6.036171913146973, "global_step": 70163, "epoch": 1670} {"train_loss": -6.011569023132324, "global_step": 70164, "epoch": 1670} {"train_loss": -5.952879428863525, "global_step": 70165, "epoch": 1670} {"train_loss": -5.91555118560791, "global_step": 70166, "epoch": 1670} {"train_loss": -5.927555084228516, "global_step": 70167, "epoch": 1670} {"train_loss": -5.864593982696533, "global_step": 70168, "epoch": 1670} {"train_loss": -5.954889297485352, "global_step": 70169, "epoch": 1670} {"train_loss": -6.034548759460449, "global_step": 70170, "epoch": 1670} {"train_loss": -5.9605560302734375, "global_step": 70171, "epoch": 1670} {"train_loss": -5.903311729431152, "global_step": 70172, "epoch": 1670} {"train_loss": -6.028387069702148, "global_step": 70173, "epoch": 1670} {"train_loss": -6.053599834442139, "global_step": 70174, "epoch": 1670} {"train_loss": -5.916329383850098, "global_step": 70175, "epoch": 1670} {"train_loss": -6.086334705352783, "global_step": 70176, "epoch": 1670} {"train_loss": -6.064538478851318, "global_step": 70177, "epoch": 1670} {"train_loss": -6.078019142150879, "global_step": 70178, "epoch": 1670} {"train_loss": -6.044609069824219, "global_step": 70179, "epoch": 1670} {"train_loss": -6.083641529083252, "global_step": 70180, "epoch": 1670} {"train_loss": -6.010195800236294, "global_step": 70181, "epoch": 1670, "val_loss": 67117.921875} {"train_loss": -6.054983139038086, "global_step": 70182, "epoch": 1671} {"train_loss": -6.046937465667725, "global_step": 70183, "epoch": 1671} {"train_loss": -5.988659858703613, "global_step": 70184, "epoch": 1671} {"train_loss": -6.074431419372559, "global_step": 70185, "epoch": 1671} {"train_loss": -6.023126125335693, "global_step": 70186, "epoch": 1671} {"train_loss": -6.1145782470703125, "global_step": 70187, "epoch": 1671} {"train_loss": -5.991238117218018, "global_step": 70188, "epoch": 1671} {"train_loss": -6.020969867706299, "global_step": 70189, "epoch": 1671} {"train_loss": -6.072305679321289, "global_step": 70190, "epoch": 1671} {"train_loss": -6.184493064880371, "global_step": 70191, "epoch": 1671} {"train_loss": -5.9051408767700195, "global_step": 70192, "epoch": 1671} {"train_loss": -5.860328674316406, "global_step": 70193, "epoch": 1671} {"train_loss": -6.050634384155273, "global_step": 70194, "epoch": 1671} {"train_loss": -6.040735244750977, "global_step": 70195, "epoch": 1671} {"train_loss": -5.938377857208252, "global_step": 70196, "epoch": 1671} {"train_loss": -6.063640594482422, "global_step": 70197, "epoch": 1671} {"train_loss": -6.112003326416016, "global_step": 70198, "epoch": 1671} {"train_loss": -5.934001922607422, "global_step": 70199, "epoch": 1671} {"train_loss": -6.044460296630859, "global_step": 70200, "epoch": 1671} {"train_loss": -5.996554374694824, "global_step": 70201, "epoch": 1671} {"train_loss": -6.002321720123291, "global_step": 70202, "epoch": 1671} {"train_loss": -5.999628067016602, "global_step": 70203, "epoch": 1671} {"train_loss": -6.0996317863464355, "global_step": 70204, "epoch": 1671} {"train_loss": -6.052212715148926, "global_step": 70205, "epoch": 1671} {"train_loss": -6.0191473960876465, "global_step": 70206, "epoch": 1671} {"train_loss": -6.01773738861084, "global_step": 70207, "epoch": 1671} {"train_loss": -5.941667556762695, "global_step": 70208, "epoch": 1671} {"train_loss": -6.038669586181641, "global_step": 70209, "epoch": 1671} {"train_loss": -5.914724349975586, "global_step": 70210, "epoch": 1671} {"train_loss": -6.116758346557617, "global_step": 70211, "epoch": 1671} {"train_loss": -5.907221794128418, "global_step": 70212, "epoch": 1671} {"train_loss": -6.0556640625, "global_step": 70213, "epoch": 1671} {"train_loss": -6.049747467041016, "global_step": 70214, "epoch": 1671} {"train_loss": -5.900307655334473, "global_step": 70215, "epoch": 1671} {"train_loss": -5.993486404418945, "global_step": 70216, "epoch": 1671} {"train_loss": -5.895474433898926, "global_step": 70217, "epoch": 1671} {"train_loss": -5.903090476989746, "global_step": 70218, "epoch": 1671} {"train_loss": -6.0099077224731445, "global_step": 70219, "epoch": 1671} {"train_loss": -5.922059535980225, "global_step": 70220, "epoch": 1671} {"train_loss": -5.953008651733398, "global_step": 70221, "epoch": 1671} {"train_loss": -5.960618019104004, "global_step": 70222, "epoch": 1671} {"train_loss": -6.00712463969276, "global_step": 70223, "epoch": 1671, "val_loss": 67424.671875} {"train_loss": -5.901201248168945, "global_step": 70224, "epoch": 1672} {"train_loss": -5.971434116363525, "global_step": 70225, "epoch": 1672} {"train_loss": -5.961714267730713, "global_step": 70226, "epoch": 1672} {"train_loss": -6.057497978210449, "global_step": 70227, "epoch": 1672} {"train_loss": -5.9295196533203125, "global_step": 70228, "epoch": 1672} {"train_loss": -5.822976112365723, "global_step": 70229, "epoch": 1672} {"train_loss": -6.057660102844238, "global_step": 70230, "epoch": 1672} {"train_loss": -6.010333061218262, "global_step": 70231, "epoch": 1672} {"train_loss": -5.984750270843506, "global_step": 70232, "epoch": 1672} {"train_loss": -5.971620559692383, "global_step": 70233, "epoch": 1672} {"train_loss": -6.078317642211914, "global_step": 70234, "epoch": 1672} {"train_loss": -6.027752876281738, "global_step": 70235, "epoch": 1672} {"train_loss": -6.0493550300598145, "global_step": 70236, "epoch": 1672} {"train_loss": -6.045226097106934, "global_step": 70237, "epoch": 1672} {"train_loss": -5.991322040557861, "global_step": 70238, "epoch": 1672} {"train_loss": -6.1046295166015625, "global_step": 70239, "epoch": 1672} {"train_loss": -6.114473819732666, "global_step": 70240, "epoch": 1672} {"train_loss": -5.981585502624512, "global_step": 70241, "epoch": 1672} {"train_loss": -6.034174919128418, "global_step": 70242, "epoch": 1672} {"train_loss": -5.998646259307861, "global_step": 70243, "epoch": 1672} {"train_loss": -6.019031047821045, "global_step": 70244, "epoch": 1672} {"train_loss": -5.975076675415039, "global_step": 70245, "epoch": 1672} {"train_loss": -6.059756278991699, "global_step": 70246, "epoch": 1672} {"train_loss": -5.914407730102539, "global_step": 70247, "epoch": 1672} {"train_loss": -5.969831466674805, "global_step": 70248, "epoch": 1672} {"train_loss": -6.0442047119140625, "global_step": 70249, "epoch": 1672} {"train_loss": -6.055951118469238, "global_step": 70250, "epoch": 1672} {"train_loss": -5.9569597244262695, "global_step": 70251, "epoch": 1672} {"train_loss": -5.995039939880371, "global_step": 70252, "epoch": 1672} {"train_loss": -6.061856269836426, "global_step": 70253, "epoch": 1672} {"train_loss": -6.008537292480469, "global_step": 70254, "epoch": 1672} {"train_loss": -6.117005348205566, "global_step": 70255, "epoch": 1672} {"train_loss": -5.964261054992676, "global_step": 70256, "epoch": 1672} {"train_loss": -6.062023162841797, "global_step": 70257, "epoch": 1672} {"train_loss": -5.953091621398926, "global_step": 70258, "epoch": 1672} {"train_loss": -6.087164878845215, "global_step": 70259, "epoch": 1672} {"train_loss": -5.987205505371094, "global_step": 70260, "epoch": 1672} {"train_loss": -5.9366631507873535, "global_step": 70261, "epoch": 1672} {"train_loss": -5.965397357940674, "global_step": 70262, "epoch": 1672} {"train_loss": -5.986294746398926, "global_step": 70263, "epoch": 1672} {"train_loss": -6.031088829040527, "global_step": 70264, "epoch": 1672} {"train_loss": -6.004795199348813, "global_step": 70265, "epoch": 1672, "val_loss": 67334.8359375} {"train_loss": -5.942063331604004, "global_step": 70266, "epoch": 1673} {"train_loss": -6.125361919403076, "global_step": 70267, "epoch": 1673} {"train_loss": -6.085848808288574, "global_step": 70268, "epoch": 1673} {"train_loss": -5.979989051818848, "global_step": 70269, "epoch": 1673} {"train_loss": -6.005069732666016, "global_step": 70270, "epoch": 1673} {"train_loss": -5.931447982788086, "global_step": 70271, "epoch": 1673} {"train_loss": -6.054157257080078, "global_step": 70272, "epoch": 1673} {"train_loss": -5.9566473960876465, "global_step": 70273, "epoch": 1673} {"train_loss": -5.864715576171875, "global_step": 70274, "epoch": 1673} {"train_loss": -5.976300239562988, "global_step": 70275, "epoch": 1673} {"train_loss": -5.953921794891357, "global_step": 70276, "epoch": 1673} {"train_loss": -6.087097644805908, "global_step": 70277, "epoch": 1673} {"train_loss": -6.009528160095215, "global_step": 70278, "epoch": 1673} {"train_loss": -5.941464900970459, "global_step": 70279, "epoch": 1673} {"train_loss": -6.025028228759766, "global_step": 70280, "epoch": 1673} {"train_loss": -5.829503536224365, "global_step": 70281, "epoch": 1673} {"train_loss": -5.919478416442871, "global_step": 70282, "epoch": 1673} {"train_loss": -5.912696361541748, "global_step": 70283, "epoch": 1673} {"train_loss": -6.056492805480957, "global_step": 70284, "epoch": 1673} {"train_loss": -5.877294063568115, "global_step": 70285, "epoch": 1673} {"train_loss": -5.883382320404053, "global_step": 70286, "epoch": 1673} {"train_loss": -6.045003890991211, "global_step": 70287, "epoch": 1673} {"train_loss": -5.981119632720947, "global_step": 70288, "epoch": 1673} {"train_loss": -6.110150337219238, "global_step": 70289, "epoch": 1673} {"train_loss": -5.8495330810546875, "global_step": 70290, "epoch": 1673} {"train_loss": -5.9449005126953125, "global_step": 70291, "epoch": 1673} {"train_loss": -6.049989700317383, "global_step": 70292, "epoch": 1673} {"train_loss": -5.93716287612915, "global_step": 70293, "epoch": 1673} {"train_loss": -5.927613258361816, "global_step": 70294, "epoch": 1673} {"train_loss": -6.008755207061768, "global_step": 70295, "epoch": 1673} {"train_loss": -5.95169734954834, "global_step": 70296, "epoch": 1673} {"train_loss": -6.018509864807129, "global_step": 70297, "epoch": 1673} {"train_loss": -5.984619140625, "global_step": 70298, "epoch": 1673} {"train_loss": -5.994546413421631, "global_step": 70299, "epoch": 1673} {"train_loss": -5.99539852142334, "global_step": 70300, "epoch": 1673} {"train_loss": -6.099884033203125, "global_step": 70301, "epoch": 1673} {"train_loss": -5.989628791809082, "global_step": 70302, "epoch": 1673} {"train_loss": -6.075295448303223, "global_step": 70303, "epoch": 1673} {"train_loss": -5.897687911987305, "global_step": 70304, "epoch": 1673} {"train_loss": -6.000509262084961, "global_step": 70305, "epoch": 1673} {"train_loss": -6.083782196044922, "global_step": 70306, "epoch": 1673} {"train_loss": -5.987234751383464, "global_step": 70307, "epoch": 1673, "val_loss": 67346.7265625} {"train_loss": -6.112144470214844, "global_step": 70308, "epoch": 1674} {"train_loss": -5.9996185302734375, "global_step": 70309, "epoch": 1674} {"train_loss": -5.981760025024414, "global_step": 70310, "epoch": 1674} {"train_loss": -6.058762073516846, "global_step": 70311, "epoch": 1674} {"train_loss": -5.983959197998047, "global_step": 70312, "epoch": 1674} {"train_loss": -6.055782318115234, "global_step": 70313, "epoch": 1674} {"train_loss": -6.034765243530273, "global_step": 70314, "epoch": 1674} {"train_loss": -6.094666481018066, "global_step": 70315, "epoch": 1674} {"train_loss": -6.05415678024292, "global_step": 70316, "epoch": 1674} {"train_loss": -6.107308864593506, "global_step": 70317, "epoch": 1674} {"train_loss": -5.849438667297363, "global_step": 70318, "epoch": 1674} {"train_loss": -5.974099159240723, "global_step": 70319, "epoch": 1674} {"train_loss": -5.942041397094727, "global_step": 70320, "epoch": 1674} {"train_loss": -6.067753314971924, "global_step": 70321, "epoch": 1674} {"train_loss": -6.122876167297363, "global_step": 70322, "epoch": 1674} {"train_loss": -5.927860260009766, "global_step": 70323, "epoch": 1674} {"train_loss": -5.957420349121094, "global_step": 70324, "epoch": 1674} {"train_loss": -6.127383232116699, "global_step": 70325, "epoch": 1674} {"train_loss": -6.033203125, "global_step": 70326, "epoch": 1674} {"train_loss": -5.902741432189941, "global_step": 70327, "epoch": 1674} {"train_loss": -6.002293109893799, "global_step": 70328, "epoch": 1674} {"train_loss": -6.028291702270508, "global_step": 70329, "epoch": 1674} {"train_loss": -6.1066107749938965, "global_step": 70330, "epoch": 1674} {"train_loss": -6.135024070739746, "global_step": 70331, "epoch": 1674} {"train_loss": -5.952737808227539, "global_step": 70332, "epoch": 1674} {"train_loss": -6.130834579467773, "global_step": 70333, "epoch": 1674} {"train_loss": -5.998646259307861, "global_step": 70334, "epoch": 1674} {"train_loss": -5.889795303344727, "global_step": 70335, "epoch": 1674} {"train_loss": -6.007806301116943, "global_step": 70336, "epoch": 1674} {"train_loss": -5.974863052368164, "global_step": 70337, "epoch": 1674} {"train_loss": -5.914812088012695, "global_step": 70338, "epoch": 1674} {"train_loss": -6.005424499511719, "global_step": 70339, "epoch": 1674} {"train_loss": -6.080705642700195, "global_step": 70340, "epoch": 1674} {"train_loss": -5.963626384735107, "global_step": 70341, "epoch": 1674} {"train_loss": -6.020353317260742, "global_step": 70342, "epoch": 1674} {"train_loss": -5.885132789611816, "global_step": 70343, "epoch": 1674} {"train_loss": -6.005275249481201, "global_step": 70344, "epoch": 1674} {"train_loss": -5.923431873321533, "global_step": 70345, "epoch": 1674} {"train_loss": -5.862416744232178, "global_step": 70346, "epoch": 1674} {"train_loss": -5.985396862030029, "global_step": 70347, "epoch": 1674} {"train_loss": -5.898885250091553, "global_step": 70348, "epoch": 1674} {"train_loss": -6.003663040342785, "global_step": 70349, "epoch": 1674, "val_loss": 67318.1875} {"train_loss": -6.0337371826171875, "global_step": 70350, "epoch": 1675} {"train_loss": -5.915170669555664, "global_step": 70351, "epoch": 1675} {"train_loss": -5.958311080932617, "global_step": 70352, "epoch": 1675} {"train_loss": -5.968615531921387, "global_step": 70353, "epoch": 1675} {"train_loss": -6.005725860595703, "global_step": 70354, "epoch": 1675} {"train_loss": -5.873809814453125, "global_step": 70355, "epoch": 1675} {"train_loss": -5.765996932983398, "global_step": 70356, "epoch": 1675} {"train_loss": -5.951162338256836, "global_step": 70357, "epoch": 1675} {"train_loss": -5.863515377044678, "global_step": 70358, "epoch": 1675} {"train_loss": -5.935065269470215, "global_step": 70359, "epoch": 1675} {"train_loss": -5.826124668121338, "global_step": 70360, "epoch": 1675} {"train_loss": -5.962567329406738, "global_step": 70361, "epoch": 1675} {"train_loss": -5.802526950836182, "global_step": 70362, "epoch": 1675} {"train_loss": -5.949152946472168, "global_step": 70363, "epoch": 1675} {"train_loss": -5.912707328796387, "global_step": 70364, "epoch": 1675} {"train_loss": -5.9364190101623535, "global_step": 70365, "epoch": 1675} {"train_loss": -5.978327751159668, "global_step": 70366, "epoch": 1675} {"train_loss": -6.011516094207764, "global_step": 70367, "epoch": 1675} {"train_loss": -5.967436790466309, "global_step": 70368, "epoch": 1675} {"train_loss": -5.913043022155762, "global_step": 70369, "epoch": 1675} {"train_loss": -5.8339762687683105, "global_step": 70370, "epoch": 1675} {"train_loss": -5.991730690002441, "global_step": 70371, "epoch": 1675} {"train_loss": -5.9021806716918945, "global_step": 70372, "epoch": 1675} {"train_loss": -5.893919944763184, "global_step": 70373, "epoch": 1675} {"train_loss": -5.83753776550293, "global_step": 70374, "epoch": 1675} {"train_loss": -5.985730171203613, "global_step": 70375, "epoch": 1675} {"train_loss": -6.108491897583008, "global_step": 70376, "epoch": 1675} {"train_loss": -5.931464195251465, "global_step": 70377, "epoch": 1675} {"train_loss": -6.189465045928955, "global_step": 70378, "epoch": 1675} {"train_loss": -5.887852668762207, "global_step": 70379, "epoch": 1675} {"train_loss": -5.983819961547852, "global_step": 70380, "epoch": 1675} {"train_loss": -6.102569580078125, "global_step": 70381, "epoch": 1675} {"train_loss": -5.984692573547363, "global_step": 70382, "epoch": 1675} {"train_loss": -6.030158996582031, "global_step": 70383, "epoch": 1675} {"train_loss": -5.989015579223633, "global_step": 70384, "epoch": 1675} {"train_loss": -5.9931640625, "global_step": 70385, "epoch": 1675} {"train_loss": -5.98397159576416, "global_step": 70386, "epoch": 1675} {"train_loss": -6.013872146606445, "global_step": 70387, "epoch": 1675} {"train_loss": -5.910328388214111, "global_step": 70388, "epoch": 1675} {"train_loss": -6.096668243408203, "global_step": 70389, "epoch": 1675} {"train_loss": -6.036964416503906, "global_step": 70390, "epoch": 1675} {"train_loss": -5.957195088976905, "global_step": 70391, "epoch": 1675, "val_loss": 67361.8515625} {"train_loss": -5.988164901733398, "global_step": 70392, "epoch": 1676} {"train_loss": -5.970163345336914, "global_step": 70393, "epoch": 1676} {"train_loss": -6.016884803771973, "global_step": 70394, "epoch": 1676} {"train_loss": -6.066969871520996, "global_step": 70395, "epoch": 1676} {"train_loss": -5.993898391723633, "global_step": 70396, "epoch": 1676} {"train_loss": -5.950676918029785, "global_step": 70397, "epoch": 1676} {"train_loss": -6.051763534545898, "global_step": 70398, "epoch": 1676} {"train_loss": -6.052303314208984, "global_step": 70399, "epoch": 1676} {"train_loss": -6.0431060791015625, "global_step": 70400, "epoch": 1676} {"train_loss": -6.017657279968262, "global_step": 70401, "epoch": 1676} {"train_loss": -6.0975341796875, "global_step": 70402, "epoch": 1676} {"train_loss": -6.076897621154785, "global_step": 70403, "epoch": 1676} {"train_loss": -5.927772521972656, "global_step": 70404, "epoch": 1676} {"train_loss": -6.015911102294922, "global_step": 70405, "epoch": 1676} {"train_loss": -5.889697074890137, "global_step": 70406, "epoch": 1676} {"train_loss": -5.958858489990234, "global_step": 70407, "epoch": 1676} {"train_loss": -6.075179100036621, "global_step": 70408, "epoch": 1676} {"train_loss": -5.897736072540283, "global_step": 70409, "epoch": 1676} {"train_loss": -6.103237152099609, "global_step": 70410, "epoch": 1676} {"train_loss": -5.841925621032715, "global_step": 70411, "epoch": 1676} {"train_loss": -6.005802154541016, "global_step": 70412, "epoch": 1676} {"train_loss": -5.99941873550415, "global_step": 70413, "epoch": 1676} {"train_loss": -5.945651531219482, "global_step": 70414, "epoch": 1676} {"train_loss": -5.874417304992676, "global_step": 70415, "epoch": 1676} {"train_loss": -5.87600564956665, "global_step": 70416, "epoch": 1676} {"train_loss": -5.991797924041748, "global_step": 70417, "epoch": 1676} {"train_loss": -5.854543685913086, "global_step": 70418, "epoch": 1676} {"train_loss": -5.955889701843262, "global_step": 70419, "epoch": 1676} {"train_loss": -5.986316680908203, "global_step": 70420, "epoch": 1676} {"train_loss": -5.9367499351501465, "global_step": 70421, "epoch": 1676} {"train_loss": -6.1082234382629395, "global_step": 70422, "epoch": 1676} {"train_loss": -5.934953689575195, "global_step": 70423, "epoch": 1676} {"train_loss": -5.967874526977539, "global_step": 70424, "epoch": 1676} {"train_loss": -5.878790378570557, "global_step": 70425, "epoch": 1676} {"train_loss": -5.982870101928711, "global_step": 70426, "epoch": 1676} {"train_loss": -5.996553897857666, "global_step": 70427, "epoch": 1676} {"train_loss": -5.957818984985352, "global_step": 70428, "epoch": 1676} {"train_loss": -5.961820125579834, "global_step": 70429, "epoch": 1676} {"train_loss": -6.009385585784912, "global_step": 70430, "epoch": 1676} {"train_loss": -5.879655838012695, "global_step": 70431, "epoch": 1676} {"train_loss": -5.877871513366699, "global_step": 70432, "epoch": 1676} {"train_loss": -5.972749346778507, "global_step": 70433, "epoch": 1676, "val_loss": 67418.53125} {"train_loss": -6.014167308807373, "global_step": 70434, "epoch": 1677} {"train_loss": -5.992252349853516, "global_step": 70435, "epoch": 1677} {"train_loss": -5.9809699058532715, "global_step": 70436, "epoch": 1677} {"train_loss": -6.082552909851074, "global_step": 70437, "epoch": 1677} {"train_loss": -6.052569389343262, "global_step": 70438, "epoch": 1677} {"train_loss": -6.026982307434082, "global_step": 70439, "epoch": 1677} {"train_loss": -5.917280197143555, "global_step": 70440, "epoch": 1677} {"train_loss": -6.029068946838379, "global_step": 70441, "epoch": 1677} {"train_loss": -6.137642860412598, "global_step": 70442, "epoch": 1677} {"train_loss": -5.9492106437683105, "global_step": 70443, "epoch": 1677} {"train_loss": -6.064731597900391, "global_step": 70444, "epoch": 1677} {"train_loss": -5.887587547302246, "global_step": 70445, "epoch": 1677} {"train_loss": -5.979081630706787, "global_step": 70446, "epoch": 1677} {"train_loss": -6.022763729095459, "global_step": 70447, "epoch": 1677} {"train_loss": -6.041505336761475, "global_step": 70448, "epoch": 1677} {"train_loss": -6.04368782043457, "global_step": 70449, "epoch": 1677} {"train_loss": -6.0775651931762695, "global_step": 70450, "epoch": 1677} {"train_loss": -6.116786956787109, "global_step": 70451, "epoch": 1677} {"train_loss": -6.019186973571777, "global_step": 70452, "epoch": 1677} {"train_loss": -5.9514641761779785, "global_step": 70453, "epoch": 1677} {"train_loss": -5.901152610778809, "global_step": 70454, "epoch": 1677} {"train_loss": -6.015262603759766, "global_step": 70455, "epoch": 1677} {"train_loss": -5.931565761566162, "global_step": 70456, "epoch": 1677} {"train_loss": -6.000338554382324, "global_step": 70457, "epoch": 1677} {"train_loss": -6.067780494689941, "global_step": 70458, "epoch": 1677} {"train_loss": -5.866905212402344, "global_step": 70459, "epoch": 1677} {"train_loss": -5.998480319976807, "global_step": 70460, "epoch": 1677} {"train_loss": -6.040177822113037, "global_step": 70461, "epoch": 1677} {"train_loss": -6.001456260681152, "global_step": 70462, "epoch": 1677} {"train_loss": -6.027047157287598, "global_step": 70463, "epoch": 1677} {"train_loss": -5.986028671264648, "global_step": 70464, "epoch": 1677} {"train_loss": -6.007622718811035, "global_step": 70465, "epoch": 1677} {"train_loss": -6.015537261962891, "global_step": 70466, "epoch": 1677} {"train_loss": -5.980459213256836, "global_step": 70467, "epoch": 1677} {"train_loss": -5.993210315704346, "global_step": 70468, "epoch": 1677} {"train_loss": -6.067765235900879, "global_step": 70469, "epoch": 1677} {"train_loss": -6.028410911560059, "global_step": 70470, "epoch": 1677} {"train_loss": -6.045356750488281, "global_step": 70471, "epoch": 1677} {"train_loss": -6.013553142547607, "global_step": 70472, "epoch": 1677} {"train_loss": -5.969196319580078, "global_step": 70473, "epoch": 1677} {"train_loss": -5.920222282409668, "global_step": 70474, "epoch": 1677} {"train_loss": -6.006958598182315, "global_step": 70475, "epoch": 1677, "val_loss": 67596.1953125} {"train_loss": -6.017580986022949, "global_step": 70476, "epoch": 1678} {"train_loss": -5.970166206359863, "global_step": 70477, "epoch": 1678} {"train_loss": -6.07257604598999, "global_step": 70478, "epoch": 1678} {"train_loss": -5.862851142883301, "global_step": 70479, "epoch": 1678} {"train_loss": -5.964691638946533, "global_step": 70480, "epoch": 1678} {"train_loss": -5.954678535461426, "global_step": 70481, "epoch": 1678} {"train_loss": -5.896397590637207, "global_step": 70482, "epoch": 1678} {"train_loss": -5.960352897644043, "global_step": 70483, "epoch": 1678} {"train_loss": -5.850627422332764, "global_step": 70484, "epoch": 1678} {"train_loss": -6.006107330322266, "global_step": 70485, "epoch": 1678} {"train_loss": -5.989627838134766, "global_step": 70486, "epoch": 1678} {"train_loss": -5.923053741455078, "global_step": 70487, "epoch": 1678} {"train_loss": -6.055331230163574, "global_step": 70488, "epoch": 1678} {"train_loss": -6.0329766273498535, "global_step": 70489, "epoch": 1678} {"train_loss": -5.8720808029174805, "global_step": 70490, "epoch": 1678} {"train_loss": -5.862997055053711, "global_step": 70491, "epoch": 1678} {"train_loss": -5.988659858703613, "global_step": 70492, "epoch": 1678} {"train_loss": -5.911688804626465, "global_step": 70493, "epoch": 1678} {"train_loss": -5.980069160461426, "global_step": 70494, "epoch": 1678} {"train_loss": -5.954970359802246, "global_step": 70495, "epoch": 1678} {"train_loss": -6.064523220062256, "global_step": 70496, "epoch": 1678} {"train_loss": -5.9694366455078125, "global_step": 70497, "epoch": 1678} {"train_loss": -6.092092514038086, "global_step": 70498, "epoch": 1678} {"train_loss": -5.935320854187012, "global_step": 70499, "epoch": 1678} {"train_loss": -6.053809642791748, "global_step": 70500, "epoch": 1678} {"train_loss": -6.114912033081055, "global_step": 70501, "epoch": 1678} {"train_loss": -6.092784881591797, "global_step": 70502, "epoch": 1678} {"train_loss": -6.129432201385498, "global_step": 70503, "epoch": 1678} {"train_loss": -6.048263072967529, "global_step": 70504, "epoch": 1678} {"train_loss": -6.017282962799072, "global_step": 70505, "epoch": 1678} {"train_loss": -5.888984680175781, "global_step": 70506, "epoch": 1678} {"train_loss": -6.109890937805176, "global_step": 70507, "epoch": 1678} {"train_loss": -6.037554740905762, "global_step": 70508, "epoch": 1678} {"train_loss": -6.031002044677734, "global_step": 70509, "epoch": 1678} {"train_loss": -6.007899284362793, "global_step": 70510, "epoch": 1678} {"train_loss": -6.004847526550293, "global_step": 70511, "epoch": 1678} {"train_loss": -6.001423358917236, "global_step": 70512, "epoch": 1678} {"train_loss": -6.125396728515625, "global_step": 70513, "epoch": 1678} {"train_loss": -5.883918285369873, "global_step": 70514, "epoch": 1678} {"train_loss": -6.079920768737793, "global_step": 70515, "epoch": 1678} {"train_loss": -5.955817699432373, "global_step": 70516, "epoch": 1678} {"train_loss": -5.996622675941104, "global_step": 70517, "epoch": 1678, "val_loss": 67044.9921875} {"train_loss": -6.031579494476318, "global_step": 70518, "epoch": 1679} {"train_loss": -6.050379276275635, "global_step": 70519, "epoch": 1679} {"train_loss": -5.951069355010986, "global_step": 70520, "epoch": 1679} {"train_loss": -5.943139553070068, "global_step": 70521, "epoch": 1679} {"train_loss": -6.028689384460449, "global_step": 70522, "epoch": 1679} {"train_loss": -6.081910610198975, "global_step": 70523, "epoch": 1679} {"train_loss": -6.047485828399658, "global_step": 70524, "epoch": 1679} {"train_loss": -6.083614349365234, "global_step": 70525, "epoch": 1679} {"train_loss": -5.973031997680664, "global_step": 70526, "epoch": 1679} {"train_loss": -6.095977783203125, "global_step": 70527, "epoch": 1679} {"train_loss": -6.032223701477051, "global_step": 70528, "epoch": 1679} {"train_loss": -5.996137619018555, "global_step": 70529, "epoch": 1679} {"train_loss": -6.004948616027832, "global_step": 70530, "epoch": 1679} {"train_loss": -6.007833480834961, "global_step": 70531, "epoch": 1679} {"train_loss": -5.957343101501465, "global_step": 70532, "epoch": 1679} {"train_loss": -6.0551981925964355, "global_step": 70533, "epoch": 1679} {"train_loss": -6.003109455108643, "global_step": 70534, "epoch": 1679} {"train_loss": -5.942713737487793, "global_step": 70535, "epoch": 1679} {"train_loss": -6.029921054840088, "global_step": 70536, "epoch": 1679} {"train_loss": -6.0313920974731445, "global_step": 70537, "epoch": 1679} {"train_loss": -5.933230400085449, "global_step": 70538, "epoch": 1679} {"train_loss": -5.991325378417969, "global_step": 70539, "epoch": 1679} {"train_loss": -6.067062854766846, "global_step": 70540, "epoch": 1679} {"train_loss": -6.077699661254883, "global_step": 70541, "epoch": 1679} {"train_loss": -6.000347137451172, "global_step": 70542, "epoch": 1679} {"train_loss": -5.955982208251953, "global_step": 70543, "epoch": 1679} {"train_loss": -5.976191997528076, "global_step": 70544, "epoch": 1679} {"train_loss": -6.05253791809082, "global_step": 70545, "epoch": 1679} {"train_loss": -5.984339237213135, "global_step": 70546, "epoch": 1679} {"train_loss": -6.00599479675293, "global_step": 70547, "epoch": 1679} {"train_loss": -6.095137596130371, "global_step": 70548, "epoch": 1679} {"train_loss": -6.007937908172607, "global_step": 70549, "epoch": 1679} {"train_loss": -6.120974063873291, "global_step": 70550, "epoch": 1679} {"train_loss": -5.936640739440918, "global_step": 70551, "epoch": 1679} {"train_loss": -5.998691082000732, "global_step": 70552, "epoch": 1679} {"train_loss": -6.005066394805908, "global_step": 70553, "epoch": 1679} {"train_loss": -5.947622776031494, "global_step": 70554, "epoch": 1679} {"train_loss": -5.916406631469727, "global_step": 70555, "epoch": 1679} {"train_loss": -5.998700141906738, "global_step": 70556, "epoch": 1679} {"train_loss": -6.040277481079102, "global_step": 70557, "epoch": 1679} {"train_loss": -5.980169296264648, "global_step": 70558, "epoch": 1679} {"train_loss": -6.010504926953997, "global_step": 70559, "epoch": 1679, "val_loss": 67496.3046875} {"train_loss": -5.9847002029418945, "global_step": 70560, "epoch": 1680} {"train_loss": -6.030111789703369, "global_step": 70561, "epoch": 1680} {"train_loss": -5.944454193115234, "global_step": 70562, "epoch": 1680} {"train_loss": -6.010993957519531, "global_step": 70563, "epoch": 1680} {"train_loss": -5.992524147033691, "global_step": 70564, "epoch": 1680} {"train_loss": -6.039585113525391, "global_step": 70565, "epoch": 1680} {"train_loss": -6.030755043029785, "global_step": 70566, "epoch": 1680} {"train_loss": -5.948999404907227, "global_step": 70567, "epoch": 1680} {"train_loss": -6.0217061042785645, "global_step": 70568, "epoch": 1680} {"train_loss": -6.103769302368164, "global_step": 70569, "epoch": 1680} {"train_loss": -6.029707908630371, "global_step": 70570, "epoch": 1680} {"train_loss": -5.909040451049805, "global_step": 70571, "epoch": 1680} {"train_loss": -5.900165557861328, "global_step": 70572, "epoch": 1680} {"train_loss": -5.995418071746826, "global_step": 70573, "epoch": 1680} {"train_loss": -6.0190839767456055, "global_step": 70574, "epoch": 1680} {"train_loss": -6.008580207824707, "global_step": 70575, "epoch": 1680} {"train_loss": -6.002446174621582, "global_step": 70576, "epoch": 1680} {"train_loss": -6.085333824157715, "global_step": 70577, "epoch": 1680} {"train_loss": -6.115368843078613, "global_step": 70578, "epoch": 1680} {"train_loss": -6.066343784332275, "global_step": 70579, "epoch": 1680} {"train_loss": -6.052179336547852, "global_step": 70580, "epoch": 1680} {"train_loss": -6.023074626922607, "global_step": 70581, "epoch": 1680} {"train_loss": -6.046470642089844, "global_step": 70582, "epoch": 1680} {"train_loss": -6.103154182434082, "global_step": 70583, "epoch": 1680} {"train_loss": -6.074737548828125, "global_step": 70584, "epoch": 1680} {"train_loss": -5.961050033569336, "global_step": 70585, "epoch": 1680} {"train_loss": -6.084410190582275, "global_step": 70586, "epoch": 1680} {"train_loss": -5.990716934204102, "global_step": 70587, "epoch": 1680} {"train_loss": -6.093557357788086, "global_step": 70588, "epoch": 1680} {"train_loss": -6.005018711090088, "global_step": 70589, "epoch": 1680} {"train_loss": -6.195793151855469, "global_step": 70590, "epoch": 1680} {"train_loss": -6.010226249694824, "global_step": 70591, "epoch": 1680} {"train_loss": -5.8510565757751465, "global_step": 70592, "epoch": 1680} {"train_loss": -6.12062931060791, "global_step": 70593, "epoch": 1680} {"train_loss": -5.99058723449707, "global_step": 70594, "epoch": 1680} {"train_loss": -6.058670997619629, "global_step": 70595, "epoch": 1680} {"train_loss": -6.063748359680176, "global_step": 70596, "epoch": 1680} {"train_loss": -6.0005927085876465, "global_step": 70597, "epoch": 1680} {"train_loss": -6.027640342712402, "global_step": 70598, "epoch": 1680} {"train_loss": -6.037992000579834, "global_step": 70599, "epoch": 1680} {"train_loss": -6.019556999206543, "global_step": 70600, "epoch": 1680} {"train_loss": -6.025581462042672, "global_step": 70601, "epoch": 1680, "val_loss": 67448.1328125} {"train_loss": -6.060013771057129, "global_step": 70602, "epoch": 1681} {"train_loss": -5.9766387939453125, "global_step": 70603, "epoch": 1681} {"train_loss": -6.062349319458008, "global_step": 70604, "epoch": 1681} {"train_loss": -5.848623752593994, "global_step": 70605, "epoch": 1681} {"train_loss": -5.909754753112793, "global_step": 70606, "epoch": 1681} {"train_loss": -5.9809489250183105, "global_step": 70607, "epoch": 1681} {"train_loss": -6.07102108001709, "global_step": 70608, "epoch": 1681} {"train_loss": -6.013886451721191, "global_step": 70609, "epoch": 1681} {"train_loss": -5.9703264236450195, "global_step": 70610, "epoch": 1681} {"train_loss": -6.016055107116699, "global_step": 70611, "epoch": 1681} {"train_loss": -5.9936323165893555, "global_step": 70612, "epoch": 1681} {"train_loss": -5.877799987792969, "global_step": 70613, "epoch": 1681} {"train_loss": -6.036185264587402, "global_step": 70614, "epoch": 1681} {"train_loss": -6.018237113952637, "global_step": 70615, "epoch": 1681} {"train_loss": -5.975797176361084, "global_step": 70616, "epoch": 1681} {"train_loss": -5.967830657958984, "global_step": 70617, "epoch": 1681} {"train_loss": -5.981950283050537, "global_step": 70618, "epoch": 1681} {"train_loss": -6.012545108795166, "global_step": 70619, "epoch": 1681} {"train_loss": -5.918909072875977, "global_step": 70620, "epoch": 1681} {"train_loss": -6.063243865966797, "global_step": 70621, "epoch": 1681} {"train_loss": -5.970557689666748, "global_step": 70622, "epoch": 1681} {"train_loss": -6.002720832824707, "global_step": 70623, "epoch": 1681} {"train_loss": -6.059019565582275, "global_step": 70624, "epoch": 1681} {"train_loss": -5.87190055847168, "global_step": 70625, "epoch": 1681} {"train_loss": -5.998360633850098, "global_step": 70626, "epoch": 1681} {"train_loss": -5.946359157562256, "global_step": 70627, "epoch": 1681} {"train_loss": -5.931760787963867, "global_step": 70628, "epoch": 1681} {"train_loss": -6.0434136390686035, "global_step": 70629, "epoch": 1681} {"train_loss": -5.88704776763916, "global_step": 70630, "epoch": 1681} {"train_loss": -5.905216217041016, "global_step": 70631, "epoch": 1681} {"train_loss": -5.922963619232178, "global_step": 70632, "epoch": 1681} {"train_loss": -5.9608154296875, "global_step": 70633, "epoch": 1681} {"train_loss": -6.05263614654541, "global_step": 70634, "epoch": 1681} {"train_loss": -5.943356037139893, "global_step": 70635, "epoch": 1681} {"train_loss": -6.022412300109863, "global_step": 70636, "epoch": 1681} {"train_loss": -5.915157318115234, "global_step": 70637, "epoch": 1681} {"train_loss": -5.992027759552002, "global_step": 70638, "epoch": 1681} {"train_loss": -6.018460750579834, "global_step": 70639, "epoch": 1681} {"train_loss": -5.900440216064453, "global_step": 70640, "epoch": 1681} {"train_loss": -5.9939985275268555, "global_step": 70641, "epoch": 1681} {"train_loss": -6.016312122344971, "global_step": 70642, "epoch": 1681} {"train_loss": -5.979246014640445, "global_step": 70643, "epoch": 1681, "val_loss": 67294.03125} {"train_loss": -5.927848815917969, "global_step": 70644, "epoch": 1682} {"train_loss": -5.992010116577148, "global_step": 70645, "epoch": 1682} {"train_loss": -6.051095485687256, "global_step": 70646, "epoch": 1682} {"train_loss": -6.148842811584473, "global_step": 70647, "epoch": 1682} {"train_loss": -6.213522911071777, "global_step": 70648, "epoch": 1682} {"train_loss": -6.048379898071289, "global_step": 70649, "epoch": 1682} {"train_loss": -5.9576921463012695, "global_step": 70650, "epoch": 1682} {"train_loss": -6.053277969360352, "global_step": 70651, "epoch": 1682} {"train_loss": -6.046281814575195, "global_step": 70652, "epoch": 1682} {"train_loss": -5.996632099151611, "global_step": 70653, "epoch": 1682} {"train_loss": -5.967812538146973, "global_step": 70654, "epoch": 1682} {"train_loss": -6.066372394561768, "global_step": 70655, "epoch": 1682} {"train_loss": -5.982008934020996, "global_step": 70656, "epoch": 1682} {"train_loss": -5.9383063316345215, "global_step": 70657, "epoch": 1682} {"train_loss": -6.098189353942871, "global_step": 70658, "epoch": 1682} {"train_loss": -5.965694427490234, "global_step": 70659, "epoch": 1682} {"train_loss": -6.036182880401611, "global_step": 70660, "epoch": 1682} {"train_loss": -5.994595527648926, "global_step": 70661, "epoch": 1682} {"train_loss": -5.972225189208984, "global_step": 70662, "epoch": 1682} {"train_loss": -6.04056453704834, "global_step": 70663, "epoch": 1682} {"train_loss": -6.046083927154541, "global_step": 70664, "epoch": 1682} {"train_loss": -5.955417633056641, "global_step": 70665, "epoch": 1682} {"train_loss": -6.001811981201172, "global_step": 70666, "epoch": 1682} {"train_loss": -6.023508071899414, "global_step": 70667, "epoch": 1682} {"train_loss": -6.080533981323242, "global_step": 70668, "epoch": 1682} {"train_loss": -6.1672468185424805, "global_step": 70669, "epoch": 1682} {"train_loss": -6.004112243652344, "global_step": 70670, "epoch": 1682} {"train_loss": -6.077895641326904, "global_step": 70671, "epoch": 1682} {"train_loss": -6.180288314819336, "global_step": 70672, "epoch": 1682} {"train_loss": -6.0119428634643555, "global_step": 70673, "epoch": 1682} {"train_loss": -6.0286688804626465, "global_step": 70674, "epoch": 1682} {"train_loss": -5.961758136749268, "global_step": 70675, "epoch": 1682} {"train_loss": -6.076610565185547, "global_step": 70676, "epoch": 1682} {"train_loss": -5.863652229309082, "global_step": 70677, "epoch": 1682} {"train_loss": -5.924637794494629, "global_step": 70678, "epoch": 1682} {"train_loss": -5.991856098175049, "global_step": 70679, "epoch": 1682} {"train_loss": -5.87347412109375, "global_step": 70680, "epoch": 1682} {"train_loss": -5.965659141540527, "global_step": 70681, "epoch": 1682} {"train_loss": -6.016212463378906, "global_step": 70682, "epoch": 1682} {"train_loss": -6.040444374084473, "global_step": 70683, "epoch": 1682} {"train_loss": -5.995540142059326, "global_step": 70684, "epoch": 1682} {"train_loss": -6.0195222582135886, "global_step": 70685, "epoch": 1682, "val_loss": 67491.6953125} {"train_loss": -6.1318559646606445, "global_step": 70686, "epoch": 1683} {"train_loss": -5.990710258483887, "global_step": 70687, "epoch": 1683} {"train_loss": -5.953945636749268, "global_step": 70688, "epoch": 1683} {"train_loss": -6.037910461425781, "global_step": 70689, "epoch": 1683} {"train_loss": -5.946525573730469, "global_step": 70690, "epoch": 1683} {"train_loss": -5.941978454589844, "global_step": 70691, "epoch": 1683} {"train_loss": -5.974003791809082, "global_step": 70692, "epoch": 1683} {"train_loss": -5.959165573120117, "global_step": 70693, "epoch": 1683} {"train_loss": -6.114715576171875, "global_step": 70694, "epoch": 1683} {"train_loss": -6.017099380493164, "global_step": 70695, "epoch": 1683} {"train_loss": -6.120639324188232, "global_step": 70696, "epoch": 1683} {"train_loss": -6.088350296020508, "global_step": 70697, "epoch": 1683} {"train_loss": -5.93604850769043, "global_step": 70698, "epoch": 1683} {"train_loss": -6.039829254150391, "global_step": 70699, "epoch": 1683} {"train_loss": -6.009713649749756, "global_step": 70700, "epoch": 1683} {"train_loss": -5.935070037841797, "global_step": 70701, "epoch": 1683} {"train_loss": -5.992629051208496, "global_step": 70702, "epoch": 1683} {"train_loss": -6.152889728546143, "global_step": 70703, "epoch": 1683} {"train_loss": -5.993006706237793, "global_step": 70704, "epoch": 1683} {"train_loss": -6.041958808898926, "global_step": 70705, "epoch": 1683} {"train_loss": -6.042613506317139, "global_step": 70706, "epoch": 1683} {"train_loss": -6.020729064941406, "global_step": 70707, "epoch": 1683} {"train_loss": -6.1117706298828125, "global_step": 70708, "epoch": 1683} {"train_loss": -6.055673599243164, "global_step": 70709, "epoch": 1683} {"train_loss": -6.129449367523193, "global_step": 70710, "epoch": 1683} {"train_loss": -5.973611831665039, "global_step": 70711, "epoch": 1683} {"train_loss": -5.9494147300720215, "global_step": 70712, "epoch": 1683} {"train_loss": -5.9703874588012695, "global_step": 70713, "epoch": 1683} {"train_loss": -6.062234878540039, "global_step": 70714, "epoch": 1683} {"train_loss": -5.820114612579346, "global_step": 70715, "epoch": 1683} {"train_loss": -6.027749538421631, "global_step": 70716, "epoch": 1683} {"train_loss": -6.000981330871582, "global_step": 70717, "epoch": 1683} {"train_loss": -6.038723468780518, "global_step": 70718, "epoch": 1683} {"train_loss": -6.032520294189453, "global_step": 70719, "epoch": 1683} {"train_loss": -5.979275703430176, "global_step": 70720, "epoch": 1683} {"train_loss": -6.125532150268555, "global_step": 70721, "epoch": 1683} {"train_loss": -6.023543357849121, "global_step": 70722, "epoch": 1683} {"train_loss": -6.025540351867676, "global_step": 70723, "epoch": 1683} {"train_loss": -5.971323013305664, "global_step": 70724, "epoch": 1683} {"train_loss": -6.028709411621094, "global_step": 70725, "epoch": 1683} {"train_loss": -6.0388641357421875, "global_step": 70726, "epoch": 1683} {"train_loss": -6.0213919707707, "global_step": 70727, "epoch": 1683, "val_loss": 67266.5078125} {"train_loss": -6.010261058807373, "global_step": 70728, "epoch": 1684} {"train_loss": -6.038513660430908, "global_step": 70729, "epoch": 1684} {"train_loss": -6.091770648956299, "global_step": 70730, "epoch": 1684} {"train_loss": -6.027408599853516, "global_step": 70731, "epoch": 1684} {"train_loss": -6.0828776359558105, "global_step": 70732, "epoch": 1684} {"train_loss": -6.083179473876953, "global_step": 70733, "epoch": 1684} {"train_loss": -6.053564071655273, "global_step": 70734, "epoch": 1684} {"train_loss": -5.982851028442383, "global_step": 70735, "epoch": 1684} {"train_loss": -6.089205741882324, "global_step": 70736, "epoch": 1684} {"train_loss": -5.982325553894043, "global_step": 70737, "epoch": 1684} {"train_loss": -6.062836647033691, "global_step": 70738, "epoch": 1684} {"train_loss": -6.017605781555176, "global_step": 70739, "epoch": 1684} {"train_loss": -5.990177154541016, "global_step": 70740, "epoch": 1684} {"train_loss": -5.925917625427246, "global_step": 70741, "epoch": 1684} {"train_loss": -5.9354329109191895, "global_step": 70742, "epoch": 1684} {"train_loss": -6.019538402557373, "global_step": 70743, "epoch": 1684} {"train_loss": -6.007739543914795, "global_step": 70744, "epoch": 1684} {"train_loss": -5.914621829986572, "global_step": 70745, "epoch": 1684} {"train_loss": -5.986649513244629, "global_step": 70746, "epoch": 1684} {"train_loss": -5.92949914932251, "global_step": 70747, "epoch": 1684} {"train_loss": -5.947857856750488, "global_step": 70748, "epoch": 1684} {"train_loss": -6.2000017166137695, "global_step": 70749, "epoch": 1684} {"train_loss": -5.854940891265869, "global_step": 70750, "epoch": 1684} {"train_loss": -5.934001445770264, "global_step": 70751, "epoch": 1684} {"train_loss": -6.037774085998535, "global_step": 70752, "epoch": 1684} {"train_loss": -5.923715591430664, "global_step": 70753, "epoch": 1684} {"train_loss": -5.974938869476318, "global_step": 70754, "epoch": 1684} {"train_loss": -6.058014392852783, "global_step": 70755, "epoch": 1684} {"train_loss": -5.842470169067383, "global_step": 70756, "epoch": 1684} {"train_loss": -5.830528259277344, "global_step": 70757, "epoch": 1684} {"train_loss": -5.968667030334473, "global_step": 70758, "epoch": 1684} {"train_loss": -6.034588813781738, "global_step": 70759, "epoch": 1684} {"train_loss": -5.94188117980957, "global_step": 70760, "epoch": 1684} {"train_loss": -5.96561336517334, "global_step": 70761, "epoch": 1684} {"train_loss": -5.92073917388916, "global_step": 70762, "epoch": 1684} {"train_loss": -6.02285099029541, "global_step": 70763, "epoch": 1684} {"train_loss": -6.035828590393066, "global_step": 70764, "epoch": 1684} {"train_loss": -6.052233695983887, "global_step": 70765, "epoch": 1684} {"train_loss": -6.018433570861816, "global_step": 70766, "epoch": 1684} {"train_loss": -5.978642463684082, "global_step": 70767, "epoch": 1684} {"train_loss": -6.055361747741699, "global_step": 70768, "epoch": 1684} {"train_loss": -5.996666817438035, "global_step": 70769, "epoch": 1684, "val_loss": 67480.7734375} {"train_loss": -6.026046276092529, "global_step": 70770, "epoch": 1685} {"train_loss": -5.998190879821777, "global_step": 70771, "epoch": 1685} {"train_loss": -5.9204607009887695, "global_step": 70772, "epoch": 1685} {"train_loss": -5.957815170288086, "global_step": 70773, "epoch": 1685} {"train_loss": -5.927985668182373, "global_step": 70774, "epoch": 1685} {"train_loss": -5.947282314300537, "global_step": 70775, "epoch": 1685} {"train_loss": -6.052935600280762, "global_step": 70776, "epoch": 1685} {"train_loss": -5.982398509979248, "global_step": 70777, "epoch": 1685} {"train_loss": -6.14047908782959, "global_step": 70778, "epoch": 1685} {"train_loss": -6.091976165771484, "global_step": 70779, "epoch": 1685} {"train_loss": -6.146851539611816, "global_step": 70780, "epoch": 1685} {"train_loss": -5.990583896636963, "global_step": 70781, "epoch": 1685} {"train_loss": -6.083300590515137, "global_step": 70782, "epoch": 1685} {"train_loss": -6.090094089508057, "global_step": 70783, "epoch": 1685} {"train_loss": -5.989368438720703, "global_step": 70784, "epoch": 1685} {"train_loss": -6.0566816329956055, "global_step": 70785, "epoch": 1685} {"train_loss": -5.96229362487793, "global_step": 70786, "epoch": 1685} {"train_loss": -5.98121452331543, "global_step": 70787, "epoch": 1685} {"train_loss": -5.950522422790527, "global_step": 70788, "epoch": 1685} {"train_loss": -6.16568660736084, "global_step": 70789, "epoch": 1685} {"train_loss": -6.007730960845947, "global_step": 70790, "epoch": 1685} {"train_loss": -6.016083240509033, "global_step": 70791, "epoch": 1685} {"train_loss": -5.953062057495117, "global_step": 70792, "epoch": 1685} {"train_loss": -6.094237327575684, "global_step": 70793, "epoch": 1685} {"train_loss": -5.8470306396484375, "global_step": 70794, "epoch": 1685} {"train_loss": -6.117981910705566, "global_step": 70795, "epoch": 1685} {"train_loss": -5.937358856201172, "global_step": 70796, "epoch": 1685} {"train_loss": -5.9760332107543945, "global_step": 70797, "epoch": 1685} {"train_loss": -6.146251201629639, "global_step": 70798, "epoch": 1685} {"train_loss": -6.10533332824707, "global_step": 70799, "epoch": 1685} {"train_loss": -5.99190092086792, "global_step": 70800, "epoch": 1685} {"train_loss": -5.9882402420043945, "global_step": 70801, "epoch": 1685} {"train_loss": -6.039701461791992, "global_step": 70802, "epoch": 1685} {"train_loss": -6.008343696594238, "global_step": 70803, "epoch": 1685} {"train_loss": -6.048680782318115, "global_step": 70804, "epoch": 1685} {"train_loss": -6.0615410804748535, "global_step": 70805, "epoch": 1685} {"train_loss": -6.118459224700928, "global_step": 70806, "epoch": 1685} {"train_loss": -6.065269947052002, "global_step": 70807, "epoch": 1685} {"train_loss": -6.0172882080078125, "global_step": 70808, "epoch": 1685} {"train_loss": -6.125341415405273, "global_step": 70809, "epoch": 1685} {"train_loss": -5.9249796867370605, "global_step": 70810, "epoch": 1685} {"train_loss": -6.0277681691305975, "global_step": 70811, "epoch": 1685, "val_loss": 67202.4609375} {"train_loss": -6.07757568359375, "global_step": 70812, "epoch": 1686} {"train_loss": -5.93023681640625, "global_step": 70813, "epoch": 1686} {"train_loss": -6.022444725036621, "global_step": 70814, "epoch": 1686} {"train_loss": -6.000949859619141, "global_step": 70815, "epoch": 1686} {"train_loss": -5.961391448974609, "global_step": 70816, "epoch": 1686} {"train_loss": -5.931077480316162, "global_step": 70817, "epoch": 1686} {"train_loss": -6.040520191192627, "global_step": 70818, "epoch": 1686} {"train_loss": -5.98492956161499, "global_step": 70819, "epoch": 1686} {"train_loss": -5.99090576171875, "global_step": 70820, "epoch": 1686} {"train_loss": -6.0494384765625, "global_step": 70821, "epoch": 1686} {"train_loss": -6.129628658294678, "global_step": 70822, "epoch": 1686} {"train_loss": -5.9840898513793945, "global_step": 70823, "epoch": 1686} {"train_loss": -6.000452041625977, "global_step": 70824, "epoch": 1686} {"train_loss": -5.979608058929443, "global_step": 70825, "epoch": 1686} {"train_loss": -6.041814804077148, "global_step": 70826, "epoch": 1686} {"train_loss": -6.024300575256348, "global_step": 70827, "epoch": 1686} {"train_loss": -6.023428440093994, "global_step": 70828, "epoch": 1686} {"train_loss": -5.8853759765625, "global_step": 70829, "epoch": 1686} {"train_loss": -5.9217987060546875, "global_step": 70830, "epoch": 1686} {"train_loss": -5.882036209106445, "global_step": 70831, "epoch": 1686} {"train_loss": -5.997051239013672, "global_step": 70832, "epoch": 1686} {"train_loss": -5.958014011383057, "global_step": 70833, "epoch": 1686} {"train_loss": -5.956170558929443, "global_step": 70834, "epoch": 1686} {"train_loss": -6.001497745513916, "global_step": 70835, "epoch": 1686} {"train_loss": -6.015741348266602, "global_step": 70836, "epoch": 1686} {"train_loss": -5.884418964385986, "global_step": 70837, "epoch": 1686} {"train_loss": -5.935611724853516, "global_step": 70838, "epoch": 1686} {"train_loss": -6.056051254272461, "global_step": 70839, "epoch": 1686} {"train_loss": -5.960981369018555, "global_step": 70840, "epoch": 1686} {"train_loss": -5.995024681091309, "global_step": 70841, "epoch": 1686} {"train_loss": -6.049952983856201, "global_step": 70842, "epoch": 1686} {"train_loss": -5.952971458435059, "global_step": 70843, "epoch": 1686} {"train_loss": -5.951087951660156, "global_step": 70844, "epoch": 1686} {"train_loss": -6.004339218139648, "global_step": 70845, "epoch": 1686} {"train_loss": -5.883938789367676, "global_step": 70846, "epoch": 1686} {"train_loss": -5.979465484619141, "global_step": 70847, "epoch": 1686} {"train_loss": -6.010865688323975, "global_step": 70848, "epoch": 1686} {"train_loss": -6.044285774230957, "global_step": 70849, "epoch": 1686} {"train_loss": -5.965916633605957, "global_step": 70850, "epoch": 1686} {"train_loss": -6.07588529586792, "global_step": 70851, "epoch": 1686} {"train_loss": -5.885138511657715, "global_step": 70852, "epoch": 1686} {"train_loss": -5.98701920963469, "global_step": 70853, "epoch": 1686, "val_loss": 67548.0234375} {"train_loss": -5.975050926208496, "global_step": 70854, "epoch": 1687} {"train_loss": -5.9719672203063965, "global_step": 70855, "epoch": 1687} {"train_loss": -5.950955867767334, "global_step": 70856, "epoch": 1687} {"train_loss": -5.993755340576172, "global_step": 70857, "epoch": 1687} {"train_loss": -6.074517250061035, "global_step": 70858, "epoch": 1687} {"train_loss": -6.001145362854004, "global_step": 70859, "epoch": 1687} {"train_loss": -5.91424560546875, "global_step": 70860, "epoch": 1687} {"train_loss": -6.04589319229126, "global_step": 70861, "epoch": 1687} {"train_loss": -6.001236915588379, "global_step": 70862, "epoch": 1687} {"train_loss": -5.925670623779297, "global_step": 70863, "epoch": 1687} {"train_loss": -5.8383402824401855, "global_step": 70864, "epoch": 1687} {"train_loss": -5.871011257171631, "global_step": 70865, "epoch": 1687} {"train_loss": -5.987395763397217, "global_step": 70866, "epoch": 1687} {"train_loss": -5.856042385101318, "global_step": 70867, "epoch": 1687} {"train_loss": -5.981073379516602, "global_step": 70868, "epoch": 1687} {"train_loss": -5.848706245422363, "global_step": 70869, "epoch": 1687} {"train_loss": -5.9424662590026855, "global_step": 70870, "epoch": 1687} {"train_loss": -5.923305511474609, "global_step": 70871, "epoch": 1687} {"train_loss": -5.956495761871338, "global_step": 70872, "epoch": 1687} {"train_loss": -5.903197288513184, "global_step": 70873, "epoch": 1687} {"train_loss": -5.954653739929199, "global_step": 70874, "epoch": 1687} {"train_loss": -5.998565673828125, "global_step": 70875, "epoch": 1687} {"train_loss": -5.987945079803467, "global_step": 70876, "epoch": 1687} {"train_loss": -5.839367389678955, "global_step": 70877, "epoch": 1687} {"train_loss": -6.0365142822265625, "global_step": 70878, "epoch": 1687} {"train_loss": -6.064990997314453, "global_step": 70879, "epoch": 1687} {"train_loss": -6.045284271240234, "global_step": 70880, "epoch": 1687} {"train_loss": -6.039125442504883, "global_step": 70881, "epoch": 1687} {"train_loss": -6.028036594390869, "global_step": 70882, "epoch": 1687} {"train_loss": -6.130718231201172, "global_step": 70883, "epoch": 1687} {"train_loss": -5.991168975830078, "global_step": 70884, "epoch": 1687} {"train_loss": -6.021596908569336, "global_step": 70885, "epoch": 1687} {"train_loss": -5.93510627746582, "global_step": 70886, "epoch": 1687} {"train_loss": -6.109149932861328, "global_step": 70887, "epoch": 1687} {"train_loss": -6.040840148925781, "global_step": 70888, "epoch": 1687} {"train_loss": -5.854076385498047, "global_step": 70889, "epoch": 1687} {"train_loss": -6.040653228759766, "global_step": 70890, "epoch": 1687} {"train_loss": -6.06772518157959, "global_step": 70891, "epoch": 1687} {"train_loss": -6.019070625305176, "global_step": 70892, "epoch": 1687} {"train_loss": -6.004338264465332, "global_step": 70893, "epoch": 1687} {"train_loss": -6.020049095153809, "global_step": 70894, "epoch": 1687} {"train_loss": -5.981580064410255, "global_step": 70895, "epoch": 1687, "val_loss": 67381.1484375} {"train_loss": -5.918846130371094, "global_step": 70896, "epoch": 1688} {"train_loss": -6.066801071166992, "global_step": 70897, "epoch": 1688} {"train_loss": -5.991578102111816, "global_step": 70898, "epoch": 1688} {"train_loss": -6.04560661315918, "global_step": 70899, "epoch": 1688} {"train_loss": -5.99500846862793, "global_step": 70900, "epoch": 1688} {"train_loss": -6.038630485534668, "global_step": 70901, "epoch": 1688} {"train_loss": -5.9942474365234375, "global_step": 70902, "epoch": 1688} {"train_loss": -5.868602752685547, "global_step": 70903, "epoch": 1688} {"train_loss": -5.974457740783691, "global_step": 70904, "epoch": 1688} {"train_loss": -5.9996514320373535, "global_step": 70905, "epoch": 1688} {"train_loss": -5.978014945983887, "global_step": 70906, "epoch": 1688} {"train_loss": -6.063013076782227, "global_step": 70907, "epoch": 1688} {"train_loss": -5.932549476623535, "global_step": 70908, "epoch": 1688} {"train_loss": -5.9220991134643555, "global_step": 70909, "epoch": 1688} {"train_loss": -6.056702613830566, "global_step": 70910, "epoch": 1688} {"train_loss": -5.974094867706299, "global_step": 70911, "epoch": 1688} {"train_loss": -5.905611515045166, "global_step": 70912, "epoch": 1688} {"train_loss": -6.005140781402588, "global_step": 70913, "epoch": 1688} {"train_loss": -5.89882755279541, "global_step": 70914, "epoch": 1688} {"train_loss": -5.8940582275390625, "global_step": 70915, "epoch": 1688} {"train_loss": -6.005613327026367, "global_step": 70916, "epoch": 1688} {"train_loss": -5.839405059814453, "global_step": 70917, "epoch": 1688} {"train_loss": -6.106524467468262, "global_step": 70918, "epoch": 1688} {"train_loss": -5.974076271057129, "global_step": 70919, "epoch": 1688} {"train_loss": -5.966087341308594, "global_step": 70920, "epoch": 1688} {"train_loss": -6.037160396575928, "global_step": 70921, "epoch": 1688} {"train_loss": -5.985751152038574, "global_step": 70922, "epoch": 1688} {"train_loss": -6.001607894897461, "global_step": 70923, "epoch": 1688} {"train_loss": -6.003023147583008, "global_step": 70924, "epoch": 1688} {"train_loss": -5.97453498840332, "global_step": 70925, "epoch": 1688} {"train_loss": -5.977375507354736, "global_step": 70926, "epoch": 1688} {"train_loss": -6.0426530838012695, "global_step": 70927, "epoch": 1688} {"train_loss": -6.043493270874023, "global_step": 70928, "epoch": 1688} {"train_loss": -6.092020034790039, "global_step": 70929, "epoch": 1688} {"train_loss": -6.10703706741333, "global_step": 70930, "epoch": 1688} {"train_loss": -6.068684101104736, "global_step": 70931, "epoch": 1688} {"train_loss": -6.026674270629883, "global_step": 70932, "epoch": 1688} {"train_loss": -5.997733116149902, "global_step": 70933, "epoch": 1688} {"train_loss": -6.090065956115723, "global_step": 70934, "epoch": 1688} {"train_loss": -6.088266372680664, "global_step": 70935, "epoch": 1688} {"train_loss": -6.145327568054199, "global_step": 70936, "epoch": 1688} {"train_loss": -6.003078528812954, "global_step": 70937, "epoch": 1688, "val_loss": 67439.125} {"train_loss": -6.059815883636475, "global_step": 70938, "epoch": 1689} {"train_loss": -6.023534774780273, "global_step": 70939, "epoch": 1689} {"train_loss": -6.1248064041137695, "global_step": 70940, "epoch": 1689} {"train_loss": -6.095486640930176, "global_step": 70941, "epoch": 1689} {"train_loss": -6.10817289352417, "global_step": 70942, "epoch": 1689} {"train_loss": -6.175191402435303, "global_step": 70943, "epoch": 1689} {"train_loss": -6.026854515075684, "global_step": 70944, "epoch": 1689} {"train_loss": -6.061285972595215, "global_step": 70945, "epoch": 1689} {"train_loss": -5.966058254241943, "global_step": 70946, "epoch": 1689} {"train_loss": -6.121008396148682, "global_step": 70947, "epoch": 1689} {"train_loss": -6.122965335845947, "global_step": 70948, "epoch": 1689} {"train_loss": -6.141090393066406, "global_step": 70949, "epoch": 1689} {"train_loss": -5.969499588012695, "global_step": 70950, "epoch": 1689} {"train_loss": -6.004702568054199, "global_step": 70951, "epoch": 1689} {"train_loss": -5.973932266235352, "global_step": 70952, "epoch": 1689} {"train_loss": -6.008131980895996, "global_step": 70953, "epoch": 1689} {"train_loss": -5.995270729064941, "global_step": 70954, "epoch": 1689} {"train_loss": -6.1152544021606445, "global_step": 70955, "epoch": 1689} {"train_loss": -6.003130912780762, "global_step": 70956, "epoch": 1689} {"train_loss": -6.094918251037598, "global_step": 70957, "epoch": 1689} {"train_loss": -6.034679412841797, "global_step": 70958, "epoch": 1689} {"train_loss": -6.044183731079102, "global_step": 70959, "epoch": 1689} {"train_loss": -6.0664262771606445, "global_step": 70960, "epoch": 1689} {"train_loss": -6.025815963745117, "global_step": 70961, "epoch": 1689} {"train_loss": -6.0403594970703125, "global_step": 70962, "epoch": 1689} {"train_loss": -6.0381574630737305, "global_step": 70963, "epoch": 1689} {"train_loss": -5.992656707763672, "global_step": 70964, "epoch": 1689} {"train_loss": -5.929623126983643, "global_step": 70965, "epoch": 1689} {"train_loss": -6.079328536987305, "global_step": 70966, "epoch": 1689} {"train_loss": -6.062792778015137, "global_step": 70967, "epoch": 1689} {"train_loss": -5.97990083694458, "global_step": 70968, "epoch": 1689} {"train_loss": -5.997150897979736, "global_step": 70969, "epoch": 1689} {"train_loss": -6.16666316986084, "global_step": 70970, "epoch": 1689} {"train_loss": -6.012688636779785, "global_step": 70971, "epoch": 1689} {"train_loss": -5.998231887817383, "global_step": 70972, "epoch": 1689} {"train_loss": -6.048701763153076, "global_step": 70973, "epoch": 1689} {"train_loss": -6.062130928039551, "global_step": 70974, "epoch": 1689} {"train_loss": -6.038501739501953, "global_step": 70975, "epoch": 1689} {"train_loss": -6.0150065422058105, "global_step": 70976, "epoch": 1689} {"train_loss": -5.98637580871582, "global_step": 70977, "epoch": 1689} {"train_loss": -6.006173133850098, "global_step": 70978, "epoch": 1689} {"train_loss": -6.040907224019368, "global_step": 70979, "epoch": 1689, "val_loss": 67287.9140625} {"train_loss": -6.076084613800049, "global_step": 70980, "epoch": 1690} {"train_loss": -6.064023017883301, "global_step": 70981, "epoch": 1690} {"train_loss": -6.092682838439941, "global_step": 70982, "epoch": 1690} {"train_loss": -5.958016395568848, "global_step": 70983, "epoch": 1690} {"train_loss": -6.041115760803223, "global_step": 70984, "epoch": 1690} {"train_loss": -5.841482162475586, "global_step": 70985, "epoch": 1690} {"train_loss": -6.016036033630371, "global_step": 70986, "epoch": 1690} {"train_loss": -6.034019947052002, "global_step": 70987, "epoch": 1690} {"train_loss": -6.061420440673828, "global_step": 70988, "epoch": 1690} {"train_loss": -6.019209861755371, "global_step": 70989, "epoch": 1690} {"train_loss": -5.974248886108398, "global_step": 70990, "epoch": 1690} {"train_loss": -5.951332092285156, "global_step": 70991, "epoch": 1690} {"train_loss": -5.963571548461914, "global_step": 70992, "epoch": 1690} {"train_loss": -6.118194103240967, "global_step": 70993, "epoch": 1690} {"train_loss": -5.973246097564697, "global_step": 70994, "epoch": 1690} {"train_loss": -5.998808860778809, "global_step": 70995, "epoch": 1690} {"train_loss": -6.029397487640381, "global_step": 70996, "epoch": 1690} {"train_loss": -5.999266147613525, "global_step": 70997, "epoch": 1690} {"train_loss": -6.090097904205322, "global_step": 70998, "epoch": 1690} {"train_loss": -6.037471294403076, "global_step": 70999, "epoch": 1690} {"train_loss": -5.888566017150879, "global_step": 71000, "epoch": 1690} {"train_loss": -5.999833106994629, "global_step": 71001, "epoch": 1690} {"train_loss": -5.948358058929443, "global_step": 71002, "epoch": 1690} {"train_loss": -6.027331352233887, "global_step": 71003, "epoch": 1690} {"train_loss": -5.9986090660095215, "global_step": 71004, "epoch": 1690} {"train_loss": -5.918074131011963, "global_step": 71005, "epoch": 1690} {"train_loss": -5.995318412780762, "global_step": 71006, "epoch": 1690} {"train_loss": -5.921555042266846, "global_step": 71007, "epoch": 1690} {"train_loss": -5.942080020904541, "global_step": 71008, "epoch": 1690} {"train_loss": -6.031027793884277, "global_step": 71009, "epoch": 1690} {"train_loss": -5.969795227050781, "global_step": 71010, "epoch": 1690} {"train_loss": -6.0603861808776855, "global_step": 71011, "epoch": 1690} {"train_loss": -6.066808700561523, "global_step": 71012, "epoch": 1690} {"train_loss": -5.963321685791016, "global_step": 71013, "epoch": 1690} {"train_loss": -5.9574689865112305, "global_step": 71014, "epoch": 1690} {"train_loss": -6.04285192489624, "global_step": 71015, "epoch": 1690} {"train_loss": -6.0309858322143555, "global_step": 71016, "epoch": 1690} {"train_loss": -6.007767677307129, "global_step": 71017, "epoch": 1690} {"train_loss": -5.962973594665527, "global_step": 71018, "epoch": 1690} {"train_loss": -6.020461082458496, "global_step": 71019, "epoch": 1690} {"train_loss": -5.9721832275390625, "global_step": 71020, "epoch": 1690} {"train_loss": -6.003992761884417, "global_step": 71021, "epoch": 1690, "val_loss": 67149.8984375} {"train_loss": -6.088171005249023, "global_step": 71022, "epoch": 1691} {"train_loss": -5.957470417022705, "global_step": 71023, "epoch": 1691} {"train_loss": -5.979092597961426, "global_step": 71024, "epoch": 1691} {"train_loss": -6.074136734008789, "global_step": 71025, "epoch": 1691} {"train_loss": -6.06227970123291, "global_step": 71026, "epoch": 1691} {"train_loss": -6.133733749389648, "global_step": 71027, "epoch": 1691} {"train_loss": -5.96741247177124, "global_step": 71028, "epoch": 1691} {"train_loss": -6.02046012878418, "global_step": 71029, "epoch": 1691} {"train_loss": -6.05259895324707, "global_step": 71030, "epoch": 1691} {"train_loss": -6.032697677612305, "global_step": 71031, "epoch": 1691} {"train_loss": -6.025952339172363, "global_step": 71032, "epoch": 1691} {"train_loss": -5.966277122497559, "global_step": 71033, "epoch": 1691} {"train_loss": -6.035644054412842, "global_step": 71034, "epoch": 1691} {"train_loss": -6.020001411437988, "global_step": 71035, "epoch": 1691} {"train_loss": -6.05422306060791, "global_step": 71036, "epoch": 1691} {"train_loss": -6.0373077392578125, "global_step": 71037, "epoch": 1691} {"train_loss": -6.030594348907471, "global_step": 71038, "epoch": 1691} {"train_loss": -5.9473395347595215, "global_step": 71039, "epoch": 1691} {"train_loss": -5.972752571105957, "global_step": 71040, "epoch": 1691} {"train_loss": -6.118736743927002, "global_step": 71041, "epoch": 1691} {"train_loss": -5.998904705047607, "global_step": 71042, "epoch": 1691} {"train_loss": -6.106425762176514, "global_step": 71043, "epoch": 1691} {"train_loss": -6.108806610107422, "global_step": 71044, "epoch": 1691} {"train_loss": -6.120737075805664, "global_step": 71045, "epoch": 1691} {"train_loss": -6.075684070587158, "global_step": 71046, "epoch": 1691} {"train_loss": -6.075801849365234, "global_step": 71047, "epoch": 1691} {"train_loss": -6.005882263183594, "global_step": 71048, "epoch": 1691} {"train_loss": -5.942568302154541, "global_step": 71049, "epoch": 1691} {"train_loss": -5.967074394226074, "global_step": 71050, "epoch": 1691} {"train_loss": -6.1446332931518555, "global_step": 71051, "epoch": 1691} {"train_loss": -6.030004501342773, "global_step": 71052, "epoch": 1691} {"train_loss": -6.035710334777832, "global_step": 71053, "epoch": 1691} {"train_loss": -6.140774726867676, "global_step": 71054, "epoch": 1691} {"train_loss": -6.055197715759277, "global_step": 71055, "epoch": 1691} {"train_loss": -6.117619514465332, "global_step": 71056, "epoch": 1691} {"train_loss": -5.994803428649902, "global_step": 71057, "epoch": 1691} {"train_loss": -6.006289482116699, "global_step": 71058, "epoch": 1691} {"train_loss": -5.975458145141602, "global_step": 71059, "epoch": 1691} {"train_loss": -6.112924575805664, "global_step": 71060, "epoch": 1691} {"train_loss": -5.978745460510254, "global_step": 71061, "epoch": 1691} {"train_loss": -6.036479949951172, "global_step": 71062, "epoch": 1691} {"train_loss": -6.038386719567435, "global_step": 71063, "epoch": 1691, "val_loss": 67451.4609375} {"train_loss": -6.008820056915283, "global_step": 71064, "epoch": 1692} {"train_loss": -6.075827598571777, "global_step": 71065, "epoch": 1692} {"train_loss": -6.155421257019043, "global_step": 71066, "epoch": 1692} {"train_loss": -5.864252090454102, "global_step": 71067, "epoch": 1692} {"train_loss": -6.015654563903809, "global_step": 71068, "epoch": 1692} {"train_loss": -5.928773880004883, "global_step": 71069, "epoch": 1692} {"train_loss": -6.057629585266113, "global_step": 71070, "epoch": 1692} {"train_loss": -6.037727355957031, "global_step": 71071, "epoch": 1692} {"train_loss": -5.857914924621582, "global_step": 71072, "epoch": 1692} {"train_loss": -6.016149044036865, "global_step": 71073, "epoch": 1692} {"train_loss": -5.9635396003723145, "global_step": 71074, "epoch": 1692} {"train_loss": -5.894360542297363, "global_step": 71075, "epoch": 1692} {"train_loss": -6.049152851104736, "global_step": 71076, "epoch": 1692} {"train_loss": -5.996277809143066, "global_step": 71077, "epoch": 1692} {"train_loss": -6.011661529541016, "global_step": 71078, "epoch": 1692} {"train_loss": -5.988108158111572, "global_step": 71079, "epoch": 1692} {"train_loss": -5.9794020652771, "global_step": 71080, "epoch": 1692} {"train_loss": -6.0850934982299805, "global_step": 71081, "epoch": 1692} {"train_loss": -6.034531593322754, "global_step": 71082, "epoch": 1692} {"train_loss": -6.008746147155762, "global_step": 71083, "epoch": 1692} {"train_loss": -6.072026252746582, "global_step": 71084, "epoch": 1692} {"train_loss": -6.085906028747559, "global_step": 71085, "epoch": 1692} {"train_loss": -6.054464340209961, "global_step": 71086, "epoch": 1692} {"train_loss": -6.06181001663208, "global_step": 71087, "epoch": 1692} {"train_loss": -6.083792209625244, "global_step": 71088, "epoch": 1692} {"train_loss": -5.9743499755859375, "global_step": 71089, "epoch": 1692} {"train_loss": -6.0581464767456055, "global_step": 71090, "epoch": 1692} {"train_loss": -5.9884934425354, "global_step": 71091, "epoch": 1692} {"train_loss": -6.065283298492432, "global_step": 71092, "epoch": 1692} {"train_loss": -6.036484241485596, "global_step": 71093, "epoch": 1692} {"train_loss": -6.009737968444824, "global_step": 71094, "epoch": 1692} {"train_loss": -6.084123134613037, "global_step": 71095, "epoch": 1692} {"train_loss": -6.077571868896484, "global_step": 71096, "epoch": 1692} {"train_loss": -6.0536699295043945, "global_step": 71097, "epoch": 1692} {"train_loss": -6.057690143585205, "global_step": 71098, "epoch": 1692} {"train_loss": -5.988751411437988, "global_step": 71099, "epoch": 1692} {"train_loss": -6.172930717468262, "global_step": 71100, "epoch": 1692} {"train_loss": -5.993884086608887, "global_step": 71101, "epoch": 1692} {"train_loss": -5.924386978149414, "global_step": 71102, "epoch": 1692} {"train_loss": -6.046820640563965, "global_step": 71103, "epoch": 1692} {"train_loss": -6.035937309265137, "global_step": 71104, "epoch": 1692} {"train_loss": -6.022075142179217, "global_step": 71105, "epoch": 1692, "val_loss": 67140.984375} {"train_loss": -6.169706344604492, "global_step": 71106, "epoch": 1693} {"train_loss": -5.990862846374512, "global_step": 71107, "epoch": 1693} {"train_loss": -6.031484603881836, "global_step": 71108, "epoch": 1693} {"train_loss": -6.066063404083252, "global_step": 71109, "epoch": 1693} {"train_loss": -6.031774044036865, "global_step": 71110, "epoch": 1693} {"train_loss": -6.072186470031738, "global_step": 71111, "epoch": 1693} {"train_loss": -6.071943283081055, "global_step": 71112, "epoch": 1693} {"train_loss": -5.942136764526367, "global_step": 71113, "epoch": 1693} {"train_loss": -5.983340740203857, "global_step": 71114, "epoch": 1693} {"train_loss": -6.094196319580078, "global_step": 71115, "epoch": 1693} {"train_loss": -5.992155075073242, "global_step": 71116, "epoch": 1693} {"train_loss": -5.97733736038208, "global_step": 71117, "epoch": 1693} {"train_loss": -6.038191795349121, "global_step": 71118, "epoch": 1693} {"train_loss": -5.987586975097656, "global_step": 71119, "epoch": 1693} {"train_loss": -6.126591682434082, "global_step": 71120, "epoch": 1693} {"train_loss": -6.01569938659668, "global_step": 71121, "epoch": 1693} {"train_loss": -5.972200393676758, "global_step": 71122, "epoch": 1693} {"train_loss": -5.976509094238281, "global_step": 71123, "epoch": 1693} {"train_loss": -6.067673683166504, "global_step": 71124, "epoch": 1693} {"train_loss": -6.112332344055176, "global_step": 71125, "epoch": 1693} {"train_loss": -5.985859394073486, "global_step": 71126, "epoch": 1693} {"train_loss": -6.130007743835449, "global_step": 71127, "epoch": 1693} {"train_loss": -5.923739433288574, "global_step": 71128, "epoch": 1693} {"train_loss": -6.005744934082031, "global_step": 71129, "epoch": 1693} {"train_loss": -6.010372161865234, "global_step": 71130, "epoch": 1693} {"train_loss": -5.888757228851318, "global_step": 71131, "epoch": 1693} {"train_loss": -6.040799617767334, "global_step": 71132, "epoch": 1693} {"train_loss": -6.039856910705566, "global_step": 71133, "epoch": 1693} {"train_loss": -6.023769378662109, "global_step": 71134, "epoch": 1693} {"train_loss": -6.074103355407715, "global_step": 71135, "epoch": 1693} {"train_loss": -6.026878356933594, "global_step": 71136, "epoch": 1693} {"train_loss": -6.0030317306518555, "global_step": 71137, "epoch": 1693} {"train_loss": -5.933277606964111, "global_step": 71138, "epoch": 1693} {"train_loss": -5.978421211242676, "global_step": 71139, "epoch": 1693} {"train_loss": -6.060880661010742, "global_step": 71140, "epoch": 1693} {"train_loss": -5.975305557250977, "global_step": 71141, "epoch": 1693} {"train_loss": -6.031010627746582, "global_step": 71142, "epoch": 1693} {"train_loss": -5.9983954429626465, "global_step": 71143, "epoch": 1693} {"train_loss": -6.009779930114746, "global_step": 71144, "epoch": 1693} {"train_loss": -5.8742170333862305, "global_step": 71145, "epoch": 1693} {"train_loss": -5.990063667297363, "global_step": 71146, "epoch": 1693} {"train_loss": -6.017106885001773, "global_step": 71147, "epoch": 1693, "val_loss": 67391.40625} {"train_loss": -5.978209495544434, "global_step": 71148, "epoch": 1694} {"train_loss": -5.907280921936035, "global_step": 71149, "epoch": 1694} {"train_loss": -5.976738929748535, "global_step": 71150, "epoch": 1694} {"train_loss": -6.019360065460205, "global_step": 71151, "epoch": 1694} {"train_loss": -5.848796844482422, "global_step": 71152, "epoch": 1694} {"train_loss": -6.053467750549316, "global_step": 71153, "epoch": 1694} {"train_loss": -5.996976852416992, "global_step": 71154, "epoch": 1694} {"train_loss": -5.973523139953613, "global_step": 71155, "epoch": 1694} {"train_loss": -6.101149559020996, "global_step": 71156, "epoch": 1694} {"train_loss": -5.955035209655762, "global_step": 71157, "epoch": 1694} {"train_loss": -6.010284423828125, "global_step": 71158, "epoch": 1694} {"train_loss": -5.995182991027832, "global_step": 71159, "epoch": 1694} {"train_loss": -5.896200656890869, "global_step": 71160, "epoch": 1694} {"train_loss": -5.970519065856934, "global_step": 71161, "epoch": 1694} {"train_loss": -5.93840217590332, "global_step": 71162, "epoch": 1694} {"train_loss": -5.971717357635498, "global_step": 71163, "epoch": 1694} {"train_loss": -5.972415924072266, "global_step": 71164, "epoch": 1694} {"train_loss": -6.092564582824707, "global_step": 71165, "epoch": 1694} {"train_loss": -5.924895763397217, "global_step": 71166, "epoch": 1694} {"train_loss": -5.957833290100098, "global_step": 71167, "epoch": 1694} {"train_loss": -6.0516815185546875, "global_step": 71168, "epoch": 1694} {"train_loss": -6.03462028503418, "global_step": 71169, "epoch": 1694} {"train_loss": -6.060022354125977, "global_step": 71170, "epoch": 1694} {"train_loss": -6.037779808044434, "global_step": 71171, "epoch": 1694} {"train_loss": -5.993280410766602, "global_step": 71172, "epoch": 1694} {"train_loss": -6.05281925201416, "global_step": 71173, "epoch": 1694} {"train_loss": -5.973149299621582, "global_step": 71174, "epoch": 1694} {"train_loss": -5.9266252517700195, "global_step": 71175, "epoch": 1694} {"train_loss": -5.955247402191162, "global_step": 71176, "epoch": 1694} {"train_loss": -6.085097312927246, "global_step": 71177, "epoch": 1694} {"train_loss": -5.936310768127441, "global_step": 71178, "epoch": 1694} {"train_loss": -5.9236555099487305, "global_step": 71179, "epoch": 1694} {"train_loss": -6.095043659210205, "global_step": 71180, "epoch": 1694} {"train_loss": -6.125369548797607, "global_step": 71181, "epoch": 1694} {"train_loss": -6.003661155700684, "global_step": 71182, "epoch": 1694} {"train_loss": -5.978649139404297, "global_step": 71183, "epoch": 1694} {"train_loss": -5.778620719909668, "global_step": 71184, "epoch": 1694} {"train_loss": -6.028841018676758, "global_step": 71185, "epoch": 1694} {"train_loss": -5.968727111816406, "global_step": 71186, "epoch": 1694} {"train_loss": -6.04287052154541, "global_step": 71187, "epoch": 1694} {"train_loss": -6.134842872619629, "global_step": 71188, "epoch": 1694} {"train_loss": -5.991570063999721, "global_step": 71189, "epoch": 1694, "val_loss": 67263.6796875} {"train_loss": -5.93166971206665, "global_step": 71190, "epoch": 1695} {"train_loss": -5.979682445526123, "global_step": 71191, "epoch": 1695} {"train_loss": -5.995977401733398, "global_step": 71192, "epoch": 1695} {"train_loss": -6.040079116821289, "global_step": 71193, "epoch": 1695} {"train_loss": -6.017460823059082, "global_step": 71194, "epoch": 1695} {"train_loss": -5.916508197784424, "global_step": 71195, "epoch": 1695} {"train_loss": -5.995939254760742, "global_step": 71196, "epoch": 1695} {"train_loss": -6.20143985748291, "global_step": 71197, "epoch": 1695} {"train_loss": -5.950860977172852, "global_step": 71198, "epoch": 1695} {"train_loss": -6.028936386108398, "global_step": 71199, "epoch": 1695} {"train_loss": -6.015936374664307, "global_step": 71200, "epoch": 1695} {"train_loss": -6.082215785980225, "global_step": 71201, "epoch": 1695} {"train_loss": -6.103106498718262, "global_step": 71202, "epoch": 1695} {"train_loss": -5.895687103271484, "global_step": 71203, "epoch": 1695} {"train_loss": -6.054610252380371, "global_step": 71204, "epoch": 1695} {"train_loss": -5.9776763916015625, "global_step": 71205, "epoch": 1695} {"train_loss": -5.995661735534668, "global_step": 71206, "epoch": 1695} {"train_loss": -5.870607852935791, "global_step": 71207, "epoch": 1695} {"train_loss": -6.021162033081055, "global_step": 71208, "epoch": 1695} {"train_loss": -5.978036880493164, "global_step": 71209, "epoch": 1695} {"train_loss": -6.096462249755859, "global_step": 71210, "epoch": 1695} {"train_loss": -5.979384422302246, "global_step": 71211, "epoch": 1695} {"train_loss": -5.965686321258545, "global_step": 71212, "epoch": 1695} {"train_loss": -6.001039505004883, "global_step": 71213, "epoch": 1695} {"train_loss": -6.120643615722656, "global_step": 71214, "epoch": 1695} {"train_loss": -5.99112606048584, "global_step": 71215, "epoch": 1695} {"train_loss": -5.909431457519531, "global_step": 71216, "epoch": 1695} {"train_loss": -6.088674545288086, "global_step": 71217, "epoch": 1695} {"train_loss": -5.98915958404541, "global_step": 71218, "epoch": 1695} {"train_loss": -6.030303001403809, "global_step": 71219, "epoch": 1695} {"train_loss": -5.9798054695129395, "global_step": 71220, "epoch": 1695} {"train_loss": -6.125747203826904, "global_step": 71221, "epoch": 1695} {"train_loss": -5.909567832946777, "global_step": 71222, "epoch": 1695} {"train_loss": -6.017178058624268, "global_step": 71223, "epoch": 1695} {"train_loss": -6.017856121063232, "global_step": 71224, "epoch": 1695} {"train_loss": -5.920032501220703, "global_step": 71225, "epoch": 1695} {"train_loss": -6.019811630249023, "global_step": 71226, "epoch": 1695} {"train_loss": -6.030313491821289, "global_step": 71227, "epoch": 1695} {"train_loss": -6.024830341339111, "global_step": 71228, "epoch": 1695} {"train_loss": -6.117021560668945, "global_step": 71229, "epoch": 1695} {"train_loss": -6.073907375335693, "global_step": 71230, "epoch": 1695} {"train_loss": -6.01278493517921, "global_step": 71231, "epoch": 1695, "val_loss": 67582.4375} {"train_loss": -6.000266075134277, "global_step": 71232, "epoch": 1696} {"train_loss": -5.9560227394104, "global_step": 71233, "epoch": 1696} {"train_loss": -5.9545817375183105, "global_step": 71234, "epoch": 1696} {"train_loss": -5.985365867614746, "global_step": 71235, "epoch": 1696} {"train_loss": -5.8089799880981445, "global_step": 71236, "epoch": 1696} {"train_loss": -5.9357500076293945, "global_step": 71237, "epoch": 1696} {"train_loss": -6.055517196655273, "global_step": 71238, "epoch": 1696} {"train_loss": -5.955132007598877, "global_step": 71239, "epoch": 1696} {"train_loss": -6.178947448730469, "global_step": 71240, "epoch": 1696} {"train_loss": -6.064295768737793, "global_step": 71241, "epoch": 1696} {"train_loss": -5.764456272125244, "global_step": 71242, "epoch": 1696} {"train_loss": -6.13425350189209, "global_step": 71243, "epoch": 1696} {"train_loss": -6.011913299560547, "global_step": 71244, "epoch": 1696} {"train_loss": -6.022507667541504, "global_step": 71245, "epoch": 1696} {"train_loss": -5.9488372802734375, "global_step": 71246, "epoch": 1696} {"train_loss": -6.005083084106445, "global_step": 71247, "epoch": 1696} {"train_loss": -6.048095226287842, "global_step": 71248, "epoch": 1696} {"train_loss": -6.014798164367676, "global_step": 71249, "epoch": 1696} {"train_loss": -6.003563404083252, "global_step": 71250, "epoch": 1696} {"train_loss": -6.114941596984863, "global_step": 71251, "epoch": 1696} {"train_loss": -5.9845170974731445, "global_step": 71252, "epoch": 1696} {"train_loss": -6.03503942489624, "global_step": 71253, "epoch": 1696} {"train_loss": -6.076838970184326, "global_step": 71254, "epoch": 1696} {"train_loss": -6.037723541259766, "global_step": 71255, "epoch": 1696} {"train_loss": -6.154101371765137, "global_step": 71256, "epoch": 1696} {"train_loss": -6.015108108520508, "global_step": 71257, "epoch": 1696} {"train_loss": -6.0224480628967285, "global_step": 71258, "epoch": 1696} {"train_loss": -5.973882675170898, "global_step": 71259, "epoch": 1696} {"train_loss": -5.957505702972412, "global_step": 71260, "epoch": 1696} {"train_loss": -6.127105712890625, "global_step": 71261, "epoch": 1696} {"train_loss": -6.005784511566162, "global_step": 71262, "epoch": 1696} {"train_loss": -5.984623908996582, "global_step": 71263, "epoch": 1696} {"train_loss": -5.97791862487793, "global_step": 71264, "epoch": 1696} {"train_loss": -6.020869255065918, "global_step": 71265, "epoch": 1696} {"train_loss": -5.91162109375, "global_step": 71266, "epoch": 1696} {"train_loss": -6.087937355041504, "global_step": 71267, "epoch": 1696} {"train_loss": -6.024393558502197, "global_step": 71268, "epoch": 1696} {"train_loss": -6.107594966888428, "global_step": 71269, "epoch": 1696} {"train_loss": -5.976959228515625, "global_step": 71270, "epoch": 1696} {"train_loss": -6.027794361114502, "global_step": 71271, "epoch": 1696} {"train_loss": -5.981579780578613, "global_step": 71272, "epoch": 1696} {"train_loss": -6.010840279715402, "global_step": 71273, "epoch": 1696, "val_loss": 67414.96875} {"train_loss": -6.049243927001953, "global_step": 71274, "epoch": 1697} {"train_loss": -6.001729965209961, "global_step": 71275, "epoch": 1697} {"train_loss": -6.0172576904296875, "global_step": 71276, "epoch": 1697} {"train_loss": -6.102173805236816, "global_step": 71277, "epoch": 1697} {"train_loss": -6.042511463165283, "global_step": 71278, "epoch": 1697} {"train_loss": -6.151827335357666, "global_step": 71279, "epoch": 1697} {"train_loss": -6.050887107849121, "global_step": 71280, "epoch": 1697} {"train_loss": -6.029139041900635, "global_step": 71281, "epoch": 1697} {"train_loss": -6.10789155960083, "global_step": 71282, "epoch": 1697} {"train_loss": -6.012791633605957, "global_step": 71283, "epoch": 1697} {"train_loss": -5.953408241271973, "global_step": 71284, "epoch": 1697} {"train_loss": -6.148958206176758, "global_step": 71285, "epoch": 1697} {"train_loss": -6.009880065917969, "global_step": 71286, "epoch": 1697} {"train_loss": -6.053591728210449, "global_step": 71287, "epoch": 1697} {"train_loss": -6.010906219482422, "global_step": 71288, "epoch": 1697} {"train_loss": -6.0643110275268555, "global_step": 71289, "epoch": 1697} {"train_loss": -5.96889066696167, "global_step": 71290, "epoch": 1697} {"train_loss": -6.056363105773926, "global_step": 71291, "epoch": 1697} {"train_loss": -6.026590824127197, "global_step": 71292, "epoch": 1697} {"train_loss": -6.008629322052002, "global_step": 71293, "epoch": 1697} {"train_loss": -5.987734794616699, "global_step": 71294, "epoch": 1697} {"train_loss": -6.0215163230896, "global_step": 71295, "epoch": 1697} {"train_loss": -5.9858245849609375, "global_step": 71296, "epoch": 1697} {"train_loss": -6.084794998168945, "global_step": 71297, "epoch": 1697} {"train_loss": -6.013500213623047, "global_step": 71298, "epoch": 1697} {"train_loss": -6.129665374755859, "global_step": 71299, "epoch": 1697} {"train_loss": -5.9531331062316895, "global_step": 71300, "epoch": 1697} {"train_loss": -6.041171073913574, "global_step": 71301, "epoch": 1697} {"train_loss": -6.071829795837402, "global_step": 71302, "epoch": 1697} {"train_loss": -5.868236541748047, "global_step": 71303, "epoch": 1697} {"train_loss": -6.0573320388793945, "global_step": 71304, "epoch": 1697} {"train_loss": -5.972359657287598, "global_step": 71305, "epoch": 1697} {"train_loss": -5.854406356811523, "global_step": 71306, "epoch": 1697} {"train_loss": -6.086347579956055, "global_step": 71307, "epoch": 1697} {"train_loss": -6.038391590118408, "global_step": 71308, "epoch": 1697} {"train_loss": -6.0119309425354, "global_step": 71309, "epoch": 1697} {"train_loss": -5.991730213165283, "global_step": 71310, "epoch": 1697} {"train_loss": -6.021589756011963, "global_step": 71311, "epoch": 1697} {"train_loss": -5.970407009124756, "global_step": 71312, "epoch": 1697} {"train_loss": -5.997946262359619, "global_step": 71313, "epoch": 1697} {"train_loss": -6.000786781311035, "global_step": 71314, "epoch": 1697} {"train_loss": -6.025651772816976, "global_step": 71315, "epoch": 1697, "val_loss": 67377.609375} {"train_loss": -5.943778038024902, "global_step": 71316, "epoch": 1698} {"train_loss": -5.9624481201171875, "global_step": 71317, "epoch": 1698} {"train_loss": -5.972525596618652, "global_step": 71318, "epoch": 1698} {"train_loss": -6.10605525970459, "global_step": 71319, "epoch": 1698} {"train_loss": -6.060856819152832, "global_step": 71320, "epoch": 1698} {"train_loss": -6.125506401062012, "global_step": 71321, "epoch": 1698} {"train_loss": -5.939647674560547, "global_step": 71322, "epoch": 1698} {"train_loss": -6.073038101196289, "global_step": 71323, "epoch": 1698} {"train_loss": -6.072859764099121, "global_step": 71324, "epoch": 1698} {"train_loss": -5.940093517303467, "global_step": 71325, "epoch": 1698} {"train_loss": -6.074434280395508, "global_step": 71326, "epoch": 1698} {"train_loss": -6.167238235473633, "global_step": 71327, "epoch": 1698} {"train_loss": -6.185618877410889, "global_step": 71328, "epoch": 1698} {"train_loss": -6.070738792419434, "global_step": 71329, "epoch": 1698} {"train_loss": -6.038913249969482, "global_step": 71330, "epoch": 1698} {"train_loss": -5.927607536315918, "global_step": 71331, "epoch": 1698} {"train_loss": -6.069466590881348, "global_step": 71332, "epoch": 1698} {"train_loss": -6.072865009307861, "global_step": 71333, "epoch": 1698} {"train_loss": -6.070243835449219, "global_step": 71334, "epoch": 1698} {"train_loss": -6.0837554931640625, "global_step": 71335, "epoch": 1698} {"train_loss": -6.0450520515441895, "global_step": 71336, "epoch": 1698} {"train_loss": -5.95040225982666, "global_step": 71337, "epoch": 1698} {"train_loss": -6.111295700073242, "global_step": 71338, "epoch": 1698} {"train_loss": -5.936639785766602, "global_step": 71339, "epoch": 1698} {"train_loss": -6.080816268920898, "global_step": 71340, "epoch": 1698} {"train_loss": -5.979465484619141, "global_step": 71341, "epoch": 1698} {"train_loss": -5.90834903717041, "global_step": 71342, "epoch": 1698} {"train_loss": -5.9741106033325195, "global_step": 71343, "epoch": 1698} {"train_loss": -6.007877826690674, "global_step": 71344, "epoch": 1698} {"train_loss": -6.041608810424805, "global_step": 71345, "epoch": 1698} {"train_loss": -6.04920768737793, "global_step": 71346, "epoch": 1698} {"train_loss": -5.979733943939209, "global_step": 71347, "epoch": 1698} {"train_loss": -6.090636253356934, "global_step": 71348, "epoch": 1698} {"train_loss": -6.049343109130859, "global_step": 71349, "epoch": 1698} {"train_loss": -5.967240810394287, "global_step": 71350, "epoch": 1698} {"train_loss": -5.832622528076172, "global_step": 71351, "epoch": 1698} {"train_loss": -5.972804546356201, "global_step": 71352, "epoch": 1698} {"train_loss": -6.009634971618652, "global_step": 71353, "epoch": 1698} {"train_loss": -6.1088666915893555, "global_step": 71354, "epoch": 1698} {"train_loss": -6.001453399658203, "global_step": 71355, "epoch": 1698} {"train_loss": -5.939680576324463, "global_step": 71356, "epoch": 1698} {"train_loss": -6.026667265664964, "global_step": 71357, "epoch": 1698, "val_loss": 67337.53125} {"train_loss": -6.044305801391602, "global_step": 71358, "epoch": 1699} {"train_loss": -6.11161994934082, "global_step": 71359, "epoch": 1699} {"train_loss": -6.00583028793335, "global_step": 71360, "epoch": 1699} {"train_loss": -6.019360542297363, "global_step": 71361, "epoch": 1699} {"train_loss": -6.094570159912109, "global_step": 71362, "epoch": 1699} {"train_loss": -6.041182518005371, "global_step": 71363, "epoch": 1699} {"train_loss": -6.037454605102539, "global_step": 71364, "epoch": 1699} {"train_loss": -6.121207237243652, "global_step": 71365, "epoch": 1699} {"train_loss": -6.006505489349365, "global_step": 71366, "epoch": 1699} {"train_loss": -6.094717025756836, "global_step": 71367, "epoch": 1699} {"train_loss": -6.13337516784668, "global_step": 71368, "epoch": 1699} {"train_loss": -6.026500225067139, "global_step": 71369, "epoch": 1699} {"train_loss": -5.992002964019775, "global_step": 71370, "epoch": 1699} {"train_loss": -6.059218406677246, "global_step": 71371, "epoch": 1699} {"train_loss": -6.100198745727539, "global_step": 71372, "epoch": 1699} {"train_loss": -5.999067306518555, "global_step": 71373, "epoch": 1699} {"train_loss": -6.0139970779418945, "global_step": 71374, "epoch": 1699} {"train_loss": -5.901801109313965, "global_step": 71375, "epoch": 1699} {"train_loss": -5.970598220825195, "global_step": 71376, "epoch": 1699} {"train_loss": -5.984073162078857, "global_step": 71377, "epoch": 1699} {"train_loss": -6.054924964904785, "global_step": 71378, "epoch": 1699} {"train_loss": -6.041427135467529, "global_step": 71379, "epoch": 1699} {"train_loss": -5.980389595031738, "global_step": 71380, "epoch": 1699} {"train_loss": -6.125685214996338, "global_step": 71381, "epoch": 1699} {"train_loss": -5.919236183166504, "global_step": 71382, "epoch": 1699} {"train_loss": -5.962717533111572, "global_step": 71383, "epoch": 1699} {"train_loss": -6.01645565032959, "global_step": 71384, "epoch": 1699} {"train_loss": -5.953743934631348, "global_step": 71385, "epoch": 1699} {"train_loss": -5.914474964141846, "global_step": 71386, "epoch": 1699} {"train_loss": -5.933654308319092, "global_step": 71387, "epoch": 1699} {"train_loss": -5.96956729888916, "global_step": 71388, "epoch": 1699} {"train_loss": -6.0307512283325195, "global_step": 71389, "epoch": 1699} {"train_loss": -5.932085990905762, "global_step": 71390, "epoch": 1699} {"train_loss": -5.96314811706543, "global_step": 71391, "epoch": 1699} {"train_loss": -5.989863395690918, "global_step": 71392, "epoch": 1699} {"train_loss": -5.970544338226318, "global_step": 71393, "epoch": 1699} {"train_loss": -6.031069278717041, "global_step": 71394, "epoch": 1699} {"train_loss": -6.0539350509643555, "global_step": 71395, "epoch": 1699} {"train_loss": -6.086183547973633, "global_step": 71396, "epoch": 1699} {"train_loss": -5.973092555999756, "global_step": 71397, "epoch": 1699} {"train_loss": -6.016831398010254, "global_step": 71398, "epoch": 1699} {"train_loss": -6.0144684087662466, "global_step": 71399, "epoch": 1699, "val_loss": 67523.8359375} {"train_loss": -6.092411994934082, "global_step": 71400, "epoch": 1700} {"train_loss": -6.095287322998047, "global_step": 71401, "epoch": 1700} {"train_loss": -6.0118818283081055, "global_step": 71402, "epoch": 1700} {"train_loss": -5.890264987945557, "global_step": 71403, "epoch": 1700} {"train_loss": -5.975198745727539, "global_step": 71404, "epoch": 1700} {"train_loss": -6.195736885070801, "global_step": 71405, "epoch": 1700} {"train_loss": -5.9669928550720215, "global_step": 71406, "epoch": 1700} {"train_loss": -6.080373764038086, "global_step": 71407, "epoch": 1700} {"train_loss": -6.023781776428223, "global_step": 71408, "epoch": 1700} {"train_loss": -5.935384750366211, "global_step": 71409, "epoch": 1700} {"train_loss": -6.019158363342285, "global_step": 71410, "epoch": 1700} {"train_loss": -6.03035306930542, "global_step": 71411, "epoch": 1700} {"train_loss": -6.084717750549316, "global_step": 71412, "epoch": 1700} {"train_loss": -5.967809677124023, "global_step": 71413, "epoch": 1700} {"train_loss": -5.941145896911621, "global_step": 71414, "epoch": 1700} {"train_loss": -6.103311538696289, "global_step": 71415, "epoch": 1700} {"train_loss": -6.022568702697754, "global_step": 71416, "epoch": 1700} {"train_loss": -6.051551818847656, "global_step": 71417, "epoch": 1700} {"train_loss": -5.991072654724121, "global_step": 71418, "epoch": 1700} {"train_loss": -6.019482612609863, "global_step": 71419, "epoch": 1700} {"train_loss": -6.124505043029785, "global_step": 71420, "epoch": 1700} {"train_loss": -6.127809524536133, "global_step": 71421, "epoch": 1700} {"train_loss": -5.964425086975098, "global_step": 71422, "epoch": 1700} {"train_loss": -6.046502113342285, "global_step": 71423, "epoch": 1700} {"train_loss": -6.009501934051514, "global_step": 71424, "epoch": 1700} {"train_loss": -6.007028579711914, "global_step": 71425, "epoch": 1700} {"train_loss": -5.981627464294434, "global_step": 71426, "epoch": 1700} {"train_loss": -5.993809700012207, "global_step": 71427, "epoch": 1700} {"train_loss": -5.961053371429443, "global_step": 71428, "epoch": 1700} {"train_loss": -5.957618713378906, "global_step": 71429, "epoch": 1700} {"train_loss": -5.795388698577881, "global_step": 71430, "epoch": 1700} {"train_loss": -6.070283889770508, "global_step": 71431, "epoch": 1700} {"train_loss": -6.040857315063477, "global_step": 71432, "epoch": 1700} {"train_loss": -5.9337592124938965, "global_step": 71433, "epoch": 1700} {"train_loss": -6.053776741027832, "global_step": 71434, "epoch": 1700} {"train_loss": -6.008330345153809, "global_step": 71435, "epoch": 1700} {"train_loss": -5.977593898773193, "global_step": 71436, "epoch": 1700} {"train_loss": -5.935816764831543, "global_step": 71437, "epoch": 1700} {"train_loss": -6.0594611167907715, "global_step": 71438, "epoch": 1700} {"train_loss": -5.923949241638184, "global_step": 71439, "epoch": 1700} {"train_loss": -5.905031204223633, "global_step": 71440, "epoch": 1700} {"train_loss": -6.012051343917847, "global_step": 71441, "epoch": 1700, "train/sim_max_reward_0": 0.23487989274786839, "train/sim_max_reward_1": 0.8843309564249319, "train/sim_max_reward_2": 0.4116492149532023, "train/sim_max_reward_3": 0.15799507630841442, "train/sim_max_reward_4": 0.8190673432332479, "train/sim_max_reward_5": 0.7842080700022859, "test/sim_max_reward_4400000": 0.978040674822914, "test/sim_max_reward_4400001": 0.7729531910528064, "test/sim_max_reward_4400002": 0.4044445624513553, "test/sim_max_reward_4400003": 0.48331640617340854, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.7530737178970935, "test/sim_max_reward_4400007": 0.5582819878566814, "test/sim_max_reward_4400008": 0.43428458240617723, "test/sim_max_reward_4400009": 0.6664377552039562, "test/sim_max_reward_4400010": 0.22362204549708473, "test/sim_max_reward_4400011": 0.20531439781271257, "test/sim_max_reward_4400012": 0.8795647402788551, "test/sim_max_reward_4400013": 0.3430425879652822, "test/sim_max_reward_4400014": 0.19126038142408006, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.26877101462027175, "test/sim_max_reward_4400019": 0.6274629115637695, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9322635107514436, "test/sim_max_reward_4400022": 0.2636762284757869, "test/sim_max_reward_4400023": 0.7690221149133146, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1960529264537632, "test/sim_max_reward_4400026": 0.8325999813228236, "test/sim_max_reward_4400027": 0.0499015336894592, "test/sim_max_reward_4400028": 0.7518245410847385, "test/sim_max_reward_4400029": 0.07058119163425813, "test/sim_max_reward_4400030": 0.803243211435556, "test/sim_max_reward_4400031": 0.9348640566795702, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.5621886990562547, "test/sim_max_reward_4400034": 0.9074121050647078, "test/sim_max_reward_4400035": 0.4580100716160517, "test/sim_max_reward_4400036": 0.49692499659721945, "test/sim_max_reward_4400037": 0.31961893320263923, "test/sim_max_reward_4400038": 0.8132824135688459, "test/sim_max_reward_4400039": 0.9979342031420313, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6055258840346086, "test/sim_max_reward_4400042": 0.014526382685964779, "test/sim_max_reward_4400043": 0.7437856509041179, "test/sim_max_reward_4400044": 0.761703002138527, "test/sim_max_reward_4400045": 0.34106233572198524, "test/sim_max_reward_4400046": 0.6383331713582093, "test/sim_max_reward_4400047": 0.8238495570113915, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.5266015628425037, "train/mean_score": 0.5486884256116584, "test/mean_score": 0.45348647900120753, "val_loss": 67500.703125} {"train_loss": -6.08497428894043, "global_step": 71442, "epoch": 1701} {"train_loss": -5.9331464767456055, "global_step": 71443, "epoch": 1701} {"train_loss": -6.046269416809082, "global_step": 71444, "epoch": 1701} {"train_loss": -5.920071601867676, "global_step": 71445, "epoch": 1701} {"train_loss": -5.978849411010742, "global_step": 71446, "epoch": 1701} {"train_loss": -6.072996139526367, "global_step": 71447, "epoch": 1701} {"train_loss": -6.157049179077148, "global_step": 71448, "epoch": 1701} {"train_loss": -6.088865280151367, "global_step": 71449, "epoch": 1701} {"train_loss": -5.976687431335449, "global_step": 71450, "epoch": 1701} {"train_loss": -6.027760982513428, "global_step": 71451, "epoch": 1701} {"train_loss": -6.041792869567871, "global_step": 71452, "epoch": 1701} {"train_loss": -5.937543869018555, "global_step": 71453, "epoch": 1701} {"train_loss": -6.027833938598633, "global_step": 71454, "epoch": 1701} {"train_loss": -6.050031661987305, "global_step": 71455, "epoch": 1701} {"train_loss": -5.937872886657715, "global_step": 71456, "epoch": 1701} {"train_loss": -6.07994270324707, "global_step": 71457, "epoch": 1701} {"train_loss": -6.039813995361328, "global_step": 71458, "epoch": 1701} {"train_loss": -6.128477096557617, "global_step": 71459, "epoch": 1701} {"train_loss": -6.09828519821167, "global_step": 71460, "epoch": 1701} {"train_loss": -6.155956745147705, "global_step": 71461, "epoch": 1701} {"train_loss": -6.15176248550415, "global_step": 71462, "epoch": 1701} {"train_loss": -5.976263999938965, "global_step": 71463, "epoch": 1701} {"train_loss": -5.985339164733887, "global_step": 71464, "epoch": 1701} {"train_loss": -5.97538948059082, "global_step": 71465, "epoch": 1701} {"train_loss": -5.975010871887207, "global_step": 71466, "epoch": 1701} {"train_loss": -6.104918956756592, "global_step": 71467, "epoch": 1701} {"train_loss": -6.025727272033691, "global_step": 71468, "epoch": 1701} {"train_loss": -6.186642169952393, "global_step": 71469, "epoch": 1701} {"train_loss": -5.950222492218018, "global_step": 71470, "epoch": 1701} {"train_loss": -5.993544578552246, "global_step": 71471, "epoch": 1701} {"train_loss": -5.9303364753723145, "global_step": 71472, "epoch": 1701} {"train_loss": -6.091434001922607, "global_step": 71473, "epoch": 1701} {"train_loss": -6.044011116027832, "global_step": 71474, "epoch": 1701} {"train_loss": -6.116046905517578, "global_step": 71475, "epoch": 1701} {"train_loss": -6.1145524978637695, "global_step": 71476, "epoch": 1701} {"train_loss": -6.107389450073242, "global_step": 71477, "epoch": 1701} {"train_loss": -6.0960235595703125, "global_step": 71478, "epoch": 1701} {"train_loss": -5.997013092041016, "global_step": 71479, "epoch": 1701} {"train_loss": -6.012835502624512, "global_step": 71480, "epoch": 1701} {"train_loss": -6.060688018798828, "global_step": 71481, "epoch": 1701} {"train_loss": -6.16434383392334, "global_step": 71482, "epoch": 1701} {"train_loss": -6.044108754112607, "global_step": 71483, "epoch": 1701, "val_loss": 67254.8359375} {"train_loss": -6.158389091491699, "global_step": 71484, "epoch": 1702} {"train_loss": -6.040219306945801, "global_step": 71485, "epoch": 1702} {"train_loss": -6.031643867492676, "global_step": 71486, "epoch": 1702} {"train_loss": -6.0480217933654785, "global_step": 71487, "epoch": 1702} {"train_loss": -6.085960865020752, "global_step": 71488, "epoch": 1702} {"train_loss": -5.990740776062012, "global_step": 71489, "epoch": 1702} {"train_loss": -5.994718551635742, "global_step": 71490, "epoch": 1702} {"train_loss": -6.128251075744629, "global_step": 71491, "epoch": 1702} {"train_loss": -6.126674175262451, "global_step": 71492, "epoch": 1702} {"train_loss": -5.945644378662109, "global_step": 71493, "epoch": 1702} {"train_loss": -6.046537399291992, "global_step": 71494, "epoch": 1702} {"train_loss": -6.092054843902588, "global_step": 71495, "epoch": 1702} {"train_loss": -6.007354736328125, "global_step": 71496, "epoch": 1702} {"train_loss": -6.004280090332031, "global_step": 71497, "epoch": 1702} {"train_loss": -6.051206588745117, "global_step": 71498, "epoch": 1702} {"train_loss": -6.021193981170654, "global_step": 71499, "epoch": 1702} {"train_loss": -5.97967529296875, "global_step": 71500, "epoch": 1702} {"train_loss": -6.064291477203369, "global_step": 71501, "epoch": 1702} {"train_loss": -6.136342525482178, "global_step": 71502, "epoch": 1702} {"train_loss": -5.875339984893799, "global_step": 71503, "epoch": 1702} {"train_loss": -5.949069976806641, "global_step": 71504, "epoch": 1702} {"train_loss": -6.062248229980469, "global_step": 71505, "epoch": 1702} {"train_loss": -6.012603282928467, "global_step": 71506, "epoch": 1702} {"train_loss": -6.003208637237549, "global_step": 71507, "epoch": 1702} {"train_loss": -6.08222770690918, "global_step": 71508, "epoch": 1702} {"train_loss": -6.008230209350586, "global_step": 71509, "epoch": 1702} {"train_loss": -6.049862384796143, "global_step": 71510, "epoch": 1702} {"train_loss": -6.049333095550537, "global_step": 71511, "epoch": 1702} {"train_loss": -6.035220146179199, "global_step": 71512, "epoch": 1702} {"train_loss": -5.936792373657227, "global_step": 71513, "epoch": 1702} {"train_loss": -6.153650283813477, "global_step": 71514, "epoch": 1702} {"train_loss": -5.898380279541016, "global_step": 71515, "epoch": 1702} {"train_loss": -6.053006172180176, "global_step": 71516, "epoch": 1702} {"train_loss": -6.046148300170898, "global_step": 71517, "epoch": 1702} {"train_loss": -5.933906555175781, "global_step": 71518, "epoch": 1702} {"train_loss": -6.071313858032227, "global_step": 71519, "epoch": 1702} {"train_loss": -6.073209762573242, "global_step": 71520, "epoch": 1702} {"train_loss": -5.908111572265625, "global_step": 71521, "epoch": 1702} {"train_loss": -6.086361885070801, "global_step": 71522, "epoch": 1702} {"train_loss": -5.965140342712402, "global_step": 71523, "epoch": 1702} {"train_loss": -6.051287651062012, "global_step": 71524, "epoch": 1702} {"train_loss": -6.029444160915556, "global_step": 71525, "epoch": 1702, "val_loss": 67359.7421875} {"train_loss": -6.016079902648926, "global_step": 71526, "epoch": 1703} {"train_loss": -5.982866287231445, "global_step": 71527, "epoch": 1703} {"train_loss": -6.11537504196167, "global_step": 71528, "epoch": 1703} {"train_loss": -6.05675745010376, "global_step": 71529, "epoch": 1703} {"train_loss": -5.961301803588867, "global_step": 71530, "epoch": 1703} {"train_loss": -5.93109655380249, "global_step": 71531, "epoch": 1703} {"train_loss": -5.9721784591674805, "global_step": 71532, "epoch": 1703} {"train_loss": -5.893588542938232, "global_step": 71533, "epoch": 1703} {"train_loss": -5.961690425872803, "global_step": 71534, "epoch": 1703} {"train_loss": -6.042610168457031, "global_step": 71535, "epoch": 1703} {"train_loss": -6.01182222366333, "global_step": 71536, "epoch": 1703} {"train_loss": -6.01544713973999, "global_step": 71537, "epoch": 1703} {"train_loss": -5.895047187805176, "global_step": 71538, "epoch": 1703} {"train_loss": -5.921773910522461, "global_step": 71539, "epoch": 1703} {"train_loss": -5.719474792480469, "global_step": 71540, "epoch": 1703} {"train_loss": -5.881808757781982, "global_step": 71541, "epoch": 1703} {"train_loss": -6.019250869750977, "global_step": 71542, "epoch": 1703} {"train_loss": -6.047062873840332, "global_step": 71543, "epoch": 1703} {"train_loss": -6.054486274719238, "global_step": 71544, "epoch": 1703} {"train_loss": -5.956073760986328, "global_step": 71545, "epoch": 1703} {"train_loss": -5.997676849365234, "global_step": 71546, "epoch": 1703} {"train_loss": -6.07064151763916, "global_step": 71547, "epoch": 1703} {"train_loss": -6.0401835441589355, "global_step": 71548, "epoch": 1703} {"train_loss": -6.0020036697387695, "global_step": 71549, "epoch": 1703} {"train_loss": -5.922857284545898, "global_step": 71550, "epoch": 1703} {"train_loss": -6.006092071533203, "global_step": 71551, "epoch": 1703} {"train_loss": -6.011876106262207, "global_step": 71552, "epoch": 1703} {"train_loss": -6.140598773956299, "global_step": 71553, "epoch": 1703} {"train_loss": -5.996565341949463, "global_step": 71554, "epoch": 1703} {"train_loss": -6.031382083892822, "global_step": 71555, "epoch": 1703} {"train_loss": -5.97800350189209, "global_step": 71556, "epoch": 1703} {"train_loss": -6.011613368988037, "global_step": 71557, "epoch": 1703} {"train_loss": -6.038875579833984, "global_step": 71558, "epoch": 1703} {"train_loss": -6.043998718261719, "global_step": 71559, "epoch": 1703} {"train_loss": -5.963437080383301, "global_step": 71560, "epoch": 1703} {"train_loss": -6.121368408203125, "global_step": 71561, "epoch": 1703} {"train_loss": -6.099645137786865, "global_step": 71562, "epoch": 1703} {"train_loss": -5.926690101623535, "global_step": 71563, "epoch": 1703} {"train_loss": -6.03437614440918, "global_step": 71564, "epoch": 1703} {"train_loss": -5.95847225189209, "global_step": 71565, "epoch": 1703} {"train_loss": -5.868322372436523, "global_step": 71566, "epoch": 1703} {"train_loss": -5.992981990178426, "global_step": 71567, "epoch": 1703, "val_loss": 67645.0546875} {"train_loss": -6.005415916442871, "global_step": 71568, "epoch": 1704} {"train_loss": -5.976095676422119, "global_step": 71569, "epoch": 1704} {"train_loss": -5.934934616088867, "global_step": 71570, "epoch": 1704} {"train_loss": -5.970810890197754, "global_step": 71571, "epoch": 1704} {"train_loss": -5.949403762817383, "global_step": 71572, "epoch": 1704} {"train_loss": -5.984896659851074, "global_step": 71573, "epoch": 1704} {"train_loss": -6.005841255187988, "global_step": 71574, "epoch": 1704} {"train_loss": -5.830927848815918, "global_step": 71575, "epoch": 1704} {"train_loss": -6.016792297363281, "global_step": 71576, "epoch": 1704} {"train_loss": -5.978358745574951, "global_step": 71577, "epoch": 1704} {"train_loss": -6.011465549468994, "global_step": 71578, "epoch": 1704} {"train_loss": -6.0318427085876465, "global_step": 71579, "epoch": 1704} {"train_loss": -5.989367961883545, "global_step": 71580, "epoch": 1704} {"train_loss": -6.029362678527832, "global_step": 71581, "epoch": 1704} {"train_loss": -6.011975288391113, "global_step": 71582, "epoch": 1704} {"train_loss": -5.982819080352783, "global_step": 71583, "epoch": 1704} {"train_loss": -6.064021110534668, "global_step": 71584, "epoch": 1704} {"train_loss": -5.973911285400391, "global_step": 71585, "epoch": 1704} {"train_loss": -5.920612335205078, "global_step": 71586, "epoch": 1704} {"train_loss": -6.082808494567871, "global_step": 71587, "epoch": 1704} {"train_loss": -6.003490447998047, "global_step": 71588, "epoch": 1704} {"train_loss": -6.067780494689941, "global_step": 71589, "epoch": 1704} {"train_loss": -6.054127216339111, "global_step": 71590, "epoch": 1704} {"train_loss": -5.989474773406982, "global_step": 71591, "epoch": 1704} {"train_loss": -6.090009689331055, "global_step": 71592, "epoch": 1704} {"train_loss": -5.923459053039551, "global_step": 71593, "epoch": 1704} {"train_loss": -6.003330230712891, "global_step": 71594, "epoch": 1704} {"train_loss": -5.98442268371582, "global_step": 71595, "epoch": 1704} {"train_loss": -6.13627815246582, "global_step": 71596, "epoch": 1704} {"train_loss": -6.118664741516113, "global_step": 71597, "epoch": 1704} {"train_loss": -5.902764320373535, "global_step": 71598, "epoch": 1704} {"train_loss": -6.051578521728516, "global_step": 71599, "epoch": 1704} {"train_loss": -5.963691711425781, "global_step": 71600, "epoch": 1704} {"train_loss": -6.031449794769287, "global_step": 71601, "epoch": 1704} {"train_loss": -5.931609153747559, "global_step": 71602, "epoch": 1704} {"train_loss": -5.908075332641602, "global_step": 71603, "epoch": 1704} {"train_loss": -6.093715667724609, "global_step": 71604, "epoch": 1704} {"train_loss": -6.000889778137207, "global_step": 71605, "epoch": 1704} {"train_loss": -6.0274434089660645, "global_step": 71606, "epoch": 1704} {"train_loss": -6.035037994384766, "global_step": 71607, "epoch": 1704} {"train_loss": -6.047484397888184, "global_step": 71608, "epoch": 1704} {"train_loss": -6.003138144810994, "global_step": 71609, "epoch": 1704, "val_loss": 67272.328125} {"train_loss": -6.090559005737305, "global_step": 71610, "epoch": 1705} {"train_loss": -6.0501604080200195, "global_step": 71611, "epoch": 1705} {"train_loss": -5.999597549438477, "global_step": 71612, "epoch": 1705} {"train_loss": -6.015454292297363, "global_step": 71613, "epoch": 1705} {"train_loss": -6.119078636169434, "global_step": 71614, "epoch": 1705} {"train_loss": -6.089022636413574, "global_step": 71615, "epoch": 1705} {"train_loss": -5.948191165924072, "global_step": 71616, "epoch": 1705} {"train_loss": -6.0359930992126465, "global_step": 71617, "epoch": 1705} {"train_loss": -6.025212287902832, "global_step": 71618, "epoch": 1705} {"train_loss": -6.082202434539795, "global_step": 71619, "epoch": 1705} {"train_loss": -6.129790306091309, "global_step": 71620, "epoch": 1705} {"train_loss": -5.977390766143799, "global_step": 71621, "epoch": 1705} {"train_loss": -5.904118537902832, "global_step": 71622, "epoch": 1705} {"train_loss": -5.985846519470215, "global_step": 71623, "epoch": 1705} {"train_loss": -5.932526588439941, "global_step": 71624, "epoch": 1705} {"train_loss": -6.01133918762207, "global_step": 71625, "epoch": 1705} {"train_loss": -6.078116416931152, "global_step": 71626, "epoch": 1705} {"train_loss": -6.19336462020874, "global_step": 71627, "epoch": 1705} {"train_loss": -6.004167079925537, "global_step": 71628, "epoch": 1705} {"train_loss": -5.963099479675293, "global_step": 71629, "epoch": 1705} {"train_loss": -6.055230617523193, "global_step": 71630, "epoch": 1705} {"train_loss": -5.9731011390686035, "global_step": 71631, "epoch": 1705} {"train_loss": -6.078136920928955, "global_step": 71632, "epoch": 1705} {"train_loss": -6.101341247558594, "global_step": 71633, "epoch": 1705} {"train_loss": -6.045829772949219, "global_step": 71634, "epoch": 1705} {"train_loss": -5.9580230712890625, "global_step": 71635, "epoch": 1705} {"train_loss": -5.951011657714844, "global_step": 71636, "epoch": 1705} {"train_loss": -5.917270660400391, "global_step": 71637, "epoch": 1705} {"train_loss": -5.994331359863281, "global_step": 71638, "epoch": 1705} {"train_loss": -5.86265754699707, "global_step": 71639, "epoch": 1705} {"train_loss": -5.8382391929626465, "global_step": 71640, "epoch": 1705} {"train_loss": -6.038443088531494, "global_step": 71641, "epoch": 1705} {"train_loss": -6.032891750335693, "global_step": 71642, "epoch": 1705} {"train_loss": -5.892066478729248, "global_step": 71643, "epoch": 1705} {"train_loss": -6.115256309509277, "global_step": 71644, "epoch": 1705} {"train_loss": -6.0714192390441895, "global_step": 71645, "epoch": 1705} {"train_loss": -6.072752952575684, "global_step": 71646, "epoch": 1705} {"train_loss": -6.084184169769287, "global_step": 71647, "epoch": 1705} {"train_loss": -6.065609455108643, "global_step": 71648, "epoch": 1705} {"train_loss": -5.970458984375, "global_step": 71649, "epoch": 1705} {"train_loss": -6.020532608032227, "global_step": 71650, "epoch": 1705} {"train_loss": -6.020214943658738, "global_step": 71651, "epoch": 1705, "val_loss": 67455.796875} {"train_loss": -6.050858497619629, "global_step": 71652, "epoch": 1706} {"train_loss": -6.09122371673584, "global_step": 71653, "epoch": 1706} {"train_loss": -6.058042526245117, "global_step": 71654, "epoch": 1706} {"train_loss": -6.131096839904785, "global_step": 71655, "epoch": 1706} {"train_loss": -6.111232757568359, "global_step": 71656, "epoch": 1706} {"train_loss": -5.998451232910156, "global_step": 71657, "epoch": 1706} {"train_loss": -6.127923011779785, "global_step": 71658, "epoch": 1706} {"train_loss": -6.014205455780029, "global_step": 71659, "epoch": 1706} {"train_loss": -6.05579137802124, "global_step": 71660, "epoch": 1706} {"train_loss": -6.047299385070801, "global_step": 71661, "epoch": 1706} {"train_loss": -6.032260417938232, "global_step": 71662, "epoch": 1706} {"train_loss": -6.105886459350586, "global_step": 71663, "epoch": 1706} {"train_loss": -5.867763996124268, "global_step": 71664, "epoch": 1706} {"train_loss": -6.058006286621094, "global_step": 71665, "epoch": 1706} {"train_loss": -6.026456356048584, "global_step": 71666, "epoch": 1706} {"train_loss": -5.900920867919922, "global_step": 71667, "epoch": 1706} {"train_loss": -6.082059383392334, "global_step": 71668, "epoch": 1706} {"train_loss": -5.876077175140381, "global_step": 71669, "epoch": 1706} {"train_loss": -5.959904670715332, "global_step": 71670, "epoch": 1706} {"train_loss": -5.949542999267578, "global_step": 71671, "epoch": 1706} {"train_loss": -6.012153625488281, "global_step": 71672, "epoch": 1706} {"train_loss": -6.02631950378418, "global_step": 71673, "epoch": 1706} {"train_loss": -6.00656795501709, "global_step": 71674, "epoch": 1706} {"train_loss": -5.9189863204956055, "global_step": 71675, "epoch": 1706} {"train_loss": -5.832405090332031, "global_step": 71676, "epoch": 1706} {"train_loss": -5.912503719329834, "global_step": 71677, "epoch": 1706} {"train_loss": -5.865866661071777, "global_step": 71678, "epoch": 1706} {"train_loss": -6.061309814453125, "global_step": 71679, "epoch": 1706} {"train_loss": -5.9483137130737305, "global_step": 71680, "epoch": 1706} {"train_loss": -6.054231643676758, "global_step": 71681, "epoch": 1706} {"train_loss": -5.888081073760986, "global_step": 71682, "epoch": 1706} {"train_loss": -6.132870674133301, "global_step": 71683, "epoch": 1706} {"train_loss": -5.8706746101379395, "global_step": 71684, "epoch": 1706} {"train_loss": -6.057662487030029, "global_step": 71685, "epoch": 1706} {"train_loss": -5.9663543701171875, "global_step": 71686, "epoch": 1706} {"train_loss": -6.091394901275635, "global_step": 71687, "epoch": 1706} {"train_loss": -5.868179798126221, "global_step": 71688, "epoch": 1706} {"train_loss": -5.899372577667236, "global_step": 71689, "epoch": 1706} {"train_loss": -6.141114234924316, "global_step": 71690, "epoch": 1706} {"train_loss": -5.9389777183532715, "global_step": 71691, "epoch": 1706} {"train_loss": -6.046751022338867, "global_step": 71692, "epoch": 1706} {"train_loss": -6.003999448957897, "global_step": 71693, "epoch": 1706, "val_loss": 67345.0390625} {"train_loss": -6.106681823730469, "global_step": 71694, "epoch": 1707} {"train_loss": -6.174822807312012, "global_step": 71695, "epoch": 1707} {"train_loss": -5.972556114196777, "global_step": 71696, "epoch": 1707} {"train_loss": -5.984206199645996, "global_step": 71697, "epoch": 1707} {"train_loss": -6.080134391784668, "global_step": 71698, "epoch": 1707} {"train_loss": -6.069137096405029, "global_step": 71699, "epoch": 1707} {"train_loss": -6.091373920440674, "global_step": 71700, "epoch": 1707} {"train_loss": -6.010746002197266, "global_step": 71701, "epoch": 1707} {"train_loss": -6.069554328918457, "global_step": 71702, "epoch": 1707} {"train_loss": -6.118736743927002, "global_step": 71703, "epoch": 1707} {"train_loss": -6.000578880310059, "global_step": 71704, "epoch": 1707} {"train_loss": -5.811663627624512, "global_step": 71705, "epoch": 1707} {"train_loss": -5.969926357269287, "global_step": 71706, "epoch": 1707} {"train_loss": -6.069400787353516, "global_step": 71707, "epoch": 1707} {"train_loss": -6.007265090942383, "global_step": 71708, "epoch": 1707} {"train_loss": -6.032558441162109, "global_step": 71709, "epoch": 1707} {"train_loss": -6.0276384353637695, "global_step": 71710, "epoch": 1707} {"train_loss": -6.093899726867676, "global_step": 71711, "epoch": 1707} {"train_loss": -6.050154685974121, "global_step": 71712, "epoch": 1707} {"train_loss": -5.952334403991699, "global_step": 71713, "epoch": 1707} {"train_loss": -5.998089790344238, "global_step": 71714, "epoch": 1707} {"train_loss": -5.998592376708984, "global_step": 71715, "epoch": 1707} {"train_loss": -6.09670877456665, "global_step": 71716, "epoch": 1707} {"train_loss": -5.993468284606934, "global_step": 71717, "epoch": 1707} {"train_loss": -6.090855121612549, "global_step": 71718, "epoch": 1707} {"train_loss": -5.876981735229492, "global_step": 71719, "epoch": 1707} {"train_loss": -6.012977600097656, "global_step": 71720, "epoch": 1707} {"train_loss": -6.06727409362793, "global_step": 71721, "epoch": 1707} {"train_loss": -5.9361572265625, "global_step": 71722, "epoch": 1707} {"train_loss": -6.059688568115234, "global_step": 71723, "epoch": 1707} {"train_loss": -6.026154518127441, "global_step": 71724, "epoch": 1707} {"train_loss": -5.915226936340332, "global_step": 71725, "epoch": 1707} {"train_loss": -6.068228721618652, "global_step": 71726, "epoch": 1707} {"train_loss": -5.95643424987793, "global_step": 71727, "epoch": 1707} {"train_loss": -5.970028400421143, "global_step": 71728, "epoch": 1707} {"train_loss": -5.881520748138428, "global_step": 71729, "epoch": 1707} {"train_loss": -6.0858378410339355, "global_step": 71730, "epoch": 1707} {"train_loss": -5.984861373901367, "global_step": 71731, "epoch": 1707} {"train_loss": -5.977948188781738, "global_step": 71732, "epoch": 1707} {"train_loss": -5.997304916381836, "global_step": 71733, "epoch": 1707} {"train_loss": -6.034146785736084, "global_step": 71734, "epoch": 1707} {"train_loss": -6.016233342034476, "global_step": 71735, "epoch": 1707, "val_loss": 67405.109375} {"train_loss": -6.073940277099609, "global_step": 71736, "epoch": 1708} {"train_loss": -6.102088928222656, "global_step": 71737, "epoch": 1708} {"train_loss": -5.929788589477539, "global_step": 71738, "epoch": 1708} {"train_loss": -6.044233798980713, "global_step": 71739, "epoch": 1708} {"train_loss": -6.099939823150635, "global_step": 71740, "epoch": 1708} {"train_loss": -6.089189529418945, "global_step": 71741, "epoch": 1708} {"train_loss": -6.082529067993164, "global_step": 71742, "epoch": 1708} {"train_loss": -5.900835037231445, "global_step": 71743, "epoch": 1708} {"train_loss": -6.017640113830566, "global_step": 71744, "epoch": 1708} {"train_loss": -6.100347518920898, "global_step": 71745, "epoch": 1708} {"train_loss": -5.963682651519775, "global_step": 71746, "epoch": 1708} {"train_loss": -6.02155876159668, "global_step": 71747, "epoch": 1708} {"train_loss": -6.103742599487305, "global_step": 71748, "epoch": 1708} {"train_loss": -6.080924034118652, "global_step": 71749, "epoch": 1708} {"train_loss": -6.057602882385254, "global_step": 71750, "epoch": 1708} {"train_loss": -6.148545265197754, "global_step": 71751, "epoch": 1708} {"train_loss": -6.019227981567383, "global_step": 71752, "epoch": 1708} {"train_loss": -6.059573173522949, "global_step": 71753, "epoch": 1708} {"train_loss": -6.029238700866699, "global_step": 71754, "epoch": 1708} {"train_loss": -6.078098297119141, "global_step": 71755, "epoch": 1708} {"train_loss": -5.960153102874756, "global_step": 71756, "epoch": 1708} {"train_loss": -5.9463419914245605, "global_step": 71757, "epoch": 1708} {"train_loss": -5.9877142906188965, "global_step": 71758, "epoch": 1708} {"train_loss": -6.0431389808654785, "global_step": 71759, "epoch": 1708} {"train_loss": -5.97581672668457, "global_step": 71760, "epoch": 1708} {"train_loss": -6.04655122756958, "global_step": 71761, "epoch": 1708} {"train_loss": -5.938417434692383, "global_step": 71762, "epoch": 1708} {"train_loss": -5.929266929626465, "global_step": 71763, "epoch": 1708} {"train_loss": -6.007716178894043, "global_step": 71764, "epoch": 1708} {"train_loss": -5.914793014526367, "global_step": 71765, "epoch": 1708} {"train_loss": -6.020987510681152, "global_step": 71766, "epoch": 1708} {"train_loss": -6.171815395355225, "global_step": 71767, "epoch": 1708} {"train_loss": -5.974137783050537, "global_step": 71768, "epoch": 1708} {"train_loss": -6.119338035583496, "global_step": 71769, "epoch": 1708} {"train_loss": -6.085983753204346, "global_step": 71770, "epoch": 1708} {"train_loss": -6.17884635925293, "global_step": 71771, "epoch": 1708} {"train_loss": -5.989138603210449, "global_step": 71772, "epoch": 1708} {"train_loss": -5.973879814147949, "global_step": 71773, "epoch": 1708} {"train_loss": -6.054102897644043, "global_step": 71774, "epoch": 1708} {"train_loss": -5.856939792633057, "global_step": 71775, "epoch": 1708} {"train_loss": -5.884078502655029, "global_step": 71776, "epoch": 1708} {"train_loss": -6.026470275152297, "global_step": 71777, "epoch": 1708, "val_loss": 67223.7109375} {"train_loss": -5.980135917663574, "global_step": 71778, "epoch": 1709} {"train_loss": -6.0630998611450195, "global_step": 71779, "epoch": 1709} {"train_loss": -5.993626117706299, "global_step": 71780, "epoch": 1709} {"train_loss": -5.985465049743652, "global_step": 71781, "epoch": 1709} {"train_loss": -6.020908832550049, "global_step": 71782, "epoch": 1709} {"train_loss": -6.090865135192871, "global_step": 71783, "epoch": 1709} {"train_loss": -6.002135276794434, "global_step": 71784, "epoch": 1709} {"train_loss": -6.029058456420898, "global_step": 71785, "epoch": 1709} {"train_loss": -6.1078314781188965, "global_step": 71786, "epoch": 1709} {"train_loss": -5.913586616516113, "global_step": 71787, "epoch": 1709} {"train_loss": -6.066467761993408, "global_step": 71788, "epoch": 1709} {"train_loss": -5.915767669677734, "global_step": 71789, "epoch": 1709} {"train_loss": -5.9658050537109375, "global_step": 71790, "epoch": 1709} {"train_loss": -6.102877140045166, "global_step": 71791, "epoch": 1709} {"train_loss": -5.819263458251953, "global_step": 71792, "epoch": 1709} {"train_loss": -5.935419082641602, "global_step": 71793, "epoch": 1709} {"train_loss": -5.864285945892334, "global_step": 71794, "epoch": 1709} {"train_loss": -5.917043685913086, "global_step": 71795, "epoch": 1709} {"train_loss": -6.053783416748047, "global_step": 71796, "epoch": 1709} {"train_loss": -5.990659236907959, "global_step": 71797, "epoch": 1709} {"train_loss": -6.118991851806641, "global_step": 71798, "epoch": 1709} {"train_loss": -5.87697172164917, "global_step": 71799, "epoch": 1709} {"train_loss": -5.950592994689941, "global_step": 71800, "epoch": 1709} {"train_loss": -5.858168125152588, "global_step": 71801, "epoch": 1709} {"train_loss": -6.056711673736572, "global_step": 71802, "epoch": 1709} {"train_loss": -5.950199127197266, "global_step": 71803, "epoch": 1709} {"train_loss": -5.928256034851074, "global_step": 71804, "epoch": 1709} {"train_loss": -5.973670959472656, "global_step": 71805, "epoch": 1709} {"train_loss": -5.897700309753418, "global_step": 71806, "epoch": 1709} {"train_loss": -6.065790176391602, "global_step": 71807, "epoch": 1709} {"train_loss": -5.891035079956055, "global_step": 71808, "epoch": 1709} {"train_loss": -6.040680885314941, "global_step": 71809, "epoch": 1709} {"train_loss": -5.980267524719238, "global_step": 71810, "epoch": 1709} {"train_loss": -5.998699188232422, "global_step": 71811, "epoch": 1709} {"train_loss": -6.096724510192871, "global_step": 71812, "epoch": 1709} {"train_loss": -6.02276086807251, "global_step": 71813, "epoch": 1709} {"train_loss": -5.84034538269043, "global_step": 71814, "epoch": 1709} {"train_loss": -6.088513374328613, "global_step": 71815, "epoch": 1709} {"train_loss": -6.103981018066406, "global_step": 71816, "epoch": 1709} {"train_loss": -6.014523983001709, "global_step": 71817, "epoch": 1709} {"train_loss": -6.102878570556641, "global_step": 71818, "epoch": 1709} {"train_loss": -5.991155454090664, "global_step": 71819, "epoch": 1709, "val_loss": 67483.9609375} {"train_loss": -5.945164203643799, "global_step": 71820, "epoch": 1710} {"train_loss": -5.9592390060424805, "global_step": 71821, "epoch": 1710} {"train_loss": -5.968052387237549, "global_step": 71822, "epoch": 1710} {"train_loss": -6.023829460144043, "global_step": 71823, "epoch": 1710} {"train_loss": -5.97042179107666, "global_step": 71824, "epoch": 1710} {"train_loss": -5.934519290924072, "global_step": 71825, "epoch": 1710} {"train_loss": -5.916104316711426, "global_step": 71826, "epoch": 1710} {"train_loss": -6.0384321212768555, "global_step": 71827, "epoch": 1710} {"train_loss": -6.086671829223633, "global_step": 71828, "epoch": 1710} {"train_loss": -6.054110050201416, "global_step": 71829, "epoch": 1710} {"train_loss": -5.915322303771973, "global_step": 71830, "epoch": 1710} {"train_loss": -5.962910175323486, "global_step": 71831, "epoch": 1710} {"train_loss": -5.957965850830078, "global_step": 71832, "epoch": 1710} {"train_loss": -5.979652404785156, "global_step": 71833, "epoch": 1710} {"train_loss": -6.116064548492432, "global_step": 71834, "epoch": 1710} {"train_loss": -6.0272626876831055, "global_step": 71835, "epoch": 1710} {"train_loss": -6.1483612060546875, "global_step": 71836, "epoch": 1710} {"train_loss": -6.018667697906494, "global_step": 71837, "epoch": 1710} {"train_loss": -6.1216230392456055, "global_step": 71838, "epoch": 1710} {"train_loss": -6.075409889221191, "global_step": 71839, "epoch": 1710} {"train_loss": -6.004075527191162, "global_step": 71840, "epoch": 1710} {"train_loss": -6.012696743011475, "global_step": 71841, "epoch": 1710} {"train_loss": -5.944111347198486, "global_step": 71842, "epoch": 1710} {"train_loss": -5.979545593261719, "global_step": 71843, "epoch": 1710} {"train_loss": -5.941519737243652, "global_step": 71844, "epoch": 1710} {"train_loss": -6.100107192993164, "global_step": 71845, "epoch": 1710} {"train_loss": -5.963122367858887, "global_step": 71846, "epoch": 1710} {"train_loss": -6.0774078369140625, "global_step": 71847, "epoch": 1710} {"train_loss": -5.9678544998168945, "global_step": 71848, "epoch": 1710} {"train_loss": -6.0622076988220215, "global_step": 71849, "epoch": 1710} {"train_loss": -6.013713836669922, "global_step": 71850, "epoch": 1710} {"train_loss": -6.086128234863281, "global_step": 71851, "epoch": 1710} {"train_loss": -6.061968803405762, "global_step": 71852, "epoch": 1710} {"train_loss": -5.948598384857178, "global_step": 71853, "epoch": 1710} {"train_loss": -6.077864646911621, "global_step": 71854, "epoch": 1710} {"train_loss": -6.057534217834473, "global_step": 71855, "epoch": 1710} {"train_loss": -6.031492233276367, "global_step": 71856, "epoch": 1710} {"train_loss": -6.055354118347168, "global_step": 71857, "epoch": 1710} {"train_loss": -6.1052141189575195, "global_step": 71858, "epoch": 1710} {"train_loss": -5.996555328369141, "global_step": 71859, "epoch": 1710} {"train_loss": -6.021770477294922, "global_step": 71860, "epoch": 1710} {"train_loss": -6.016377097084408, "global_step": 71861, "epoch": 1710, "val_loss": 67377.9140625} {"train_loss": -5.931887149810791, "global_step": 71862, "epoch": 1711} {"train_loss": -5.955223083496094, "global_step": 71863, "epoch": 1711} {"train_loss": -6.016674518585205, "global_step": 71864, "epoch": 1711} {"train_loss": -6.041921615600586, "global_step": 71865, "epoch": 1711} {"train_loss": -5.94469690322876, "global_step": 71866, "epoch": 1711} {"train_loss": -6.076409339904785, "global_step": 71867, "epoch": 1711} {"train_loss": -6.047061920166016, "global_step": 71868, "epoch": 1711} {"train_loss": -5.959652900695801, "global_step": 71869, "epoch": 1711} {"train_loss": -6.031167030334473, "global_step": 71870, "epoch": 1711} {"train_loss": -5.982606887817383, "global_step": 71871, "epoch": 1711} {"train_loss": -5.981827259063721, "global_step": 71872, "epoch": 1711} {"train_loss": -5.869809627532959, "global_step": 71873, "epoch": 1711} {"train_loss": -6.005868911743164, "global_step": 71874, "epoch": 1711} {"train_loss": -5.920777320861816, "global_step": 71875, "epoch": 1711} {"train_loss": -6.002567291259766, "global_step": 71876, "epoch": 1711} {"train_loss": -6.047420501708984, "global_step": 71877, "epoch": 1711} {"train_loss": -5.948326110839844, "global_step": 71878, "epoch": 1711} {"train_loss": -6.040436744689941, "global_step": 71879, "epoch": 1711} {"train_loss": -6.101264953613281, "global_step": 71880, "epoch": 1711} {"train_loss": -6.009555339813232, "global_step": 71881, "epoch": 1711} {"train_loss": -6.025175094604492, "global_step": 71882, "epoch": 1711} {"train_loss": -6.059135437011719, "global_step": 71883, "epoch": 1711} {"train_loss": -6.1524505615234375, "global_step": 71884, "epoch": 1711} {"train_loss": -6.121188163757324, "global_step": 71885, "epoch": 1711} {"train_loss": -5.952779769897461, "global_step": 71886, "epoch": 1711} {"train_loss": -6.020331859588623, "global_step": 71887, "epoch": 1711} {"train_loss": -6.023916721343994, "global_step": 71888, "epoch": 1711} {"train_loss": -5.943818092346191, "global_step": 71889, "epoch": 1711} {"train_loss": -6.057852745056152, "global_step": 71890, "epoch": 1711} {"train_loss": -6.002274513244629, "global_step": 71891, "epoch": 1711} {"train_loss": -6.119243621826172, "global_step": 71892, "epoch": 1711} {"train_loss": -6.002339839935303, "global_step": 71893, "epoch": 1711} {"train_loss": -6.081849575042725, "global_step": 71894, "epoch": 1711} {"train_loss": -6.084710121154785, "global_step": 71895, "epoch": 1711} {"train_loss": -6.0525288581848145, "global_step": 71896, "epoch": 1711} {"train_loss": -6.139423847198486, "global_step": 71897, "epoch": 1711} {"train_loss": -5.976221084594727, "global_step": 71898, "epoch": 1711} {"train_loss": -6.109683036804199, "global_step": 71899, "epoch": 1711} {"train_loss": -6.020431995391846, "global_step": 71900, "epoch": 1711} {"train_loss": -5.994617938995361, "global_step": 71901, "epoch": 1711} {"train_loss": -6.028295040130615, "global_step": 71902, "epoch": 1711} {"train_loss": -6.019181047167097, "global_step": 71903, "epoch": 1711, "val_loss": 67120.3828125} {"train_loss": -6.134746074676514, "global_step": 71904, "epoch": 1712} {"train_loss": -6.016507148742676, "global_step": 71905, "epoch": 1712} {"train_loss": -6.05377197265625, "global_step": 71906, "epoch": 1712} {"train_loss": -6.109399795532227, "global_step": 71907, "epoch": 1712} {"train_loss": -6.029609680175781, "global_step": 71908, "epoch": 1712} {"train_loss": -5.953153610229492, "global_step": 71909, "epoch": 1712} {"train_loss": -6.032166481018066, "global_step": 71910, "epoch": 1712} {"train_loss": -5.9502058029174805, "global_step": 71911, "epoch": 1712} {"train_loss": -5.9500885009765625, "global_step": 71912, "epoch": 1712} {"train_loss": -6.104771614074707, "global_step": 71913, "epoch": 1712} {"train_loss": -6.059654235839844, "global_step": 71914, "epoch": 1712} {"train_loss": -5.9940948486328125, "global_step": 71915, "epoch": 1712} {"train_loss": -5.945283889770508, "global_step": 71916, "epoch": 1712} {"train_loss": -5.936127185821533, "global_step": 71917, "epoch": 1712} {"train_loss": -5.88922119140625, "global_step": 71918, "epoch": 1712} {"train_loss": -6.073860168457031, "global_step": 71919, "epoch": 1712} {"train_loss": -6.0119948387146, "global_step": 71920, "epoch": 1712} {"train_loss": -6.003722190856934, "global_step": 71921, "epoch": 1712} {"train_loss": -5.913882255554199, "global_step": 71922, "epoch": 1712} {"train_loss": -5.853832244873047, "global_step": 71923, "epoch": 1712} {"train_loss": -5.999609470367432, "global_step": 71924, "epoch": 1712} {"train_loss": -6.025676250457764, "global_step": 71925, "epoch": 1712} {"train_loss": -5.870945930480957, "global_step": 71926, "epoch": 1712} {"train_loss": -6.042781829833984, "global_step": 71927, "epoch": 1712} {"train_loss": -5.999666213989258, "global_step": 71928, "epoch": 1712} {"train_loss": -5.941425323486328, "global_step": 71929, "epoch": 1712} {"train_loss": -5.949129104614258, "global_step": 71930, "epoch": 1712} {"train_loss": -6.004871368408203, "global_step": 71931, "epoch": 1712} {"train_loss": -5.977373123168945, "global_step": 71932, "epoch": 1712} {"train_loss": -5.766985893249512, "global_step": 71933, "epoch": 1712} {"train_loss": -6.063086032867432, "global_step": 71934, "epoch": 1712} {"train_loss": -5.877737045288086, "global_step": 71935, "epoch": 1712} {"train_loss": -6.0090227127075195, "global_step": 71936, "epoch": 1712} {"train_loss": -5.904365539550781, "global_step": 71937, "epoch": 1712} {"train_loss": -6.106257438659668, "global_step": 71938, "epoch": 1712} {"train_loss": -5.910411834716797, "global_step": 71939, "epoch": 1712} {"train_loss": -5.98209810256958, "global_step": 71940, "epoch": 1712} {"train_loss": -6.007650375366211, "global_step": 71941, "epoch": 1712} {"train_loss": -6.087404727935791, "global_step": 71942, "epoch": 1712} {"train_loss": -6.048101425170898, "global_step": 71943, "epoch": 1712} {"train_loss": -5.975674629211426, "global_step": 71944, "epoch": 1712} {"train_loss": -5.991204954328991, "global_step": 71945, "epoch": 1712, "val_loss": 67527.7578125} {"train_loss": -5.897244930267334, "global_step": 71946, "epoch": 1713} {"train_loss": -5.998449325561523, "global_step": 71947, "epoch": 1713} {"train_loss": -6.004579544067383, "global_step": 71948, "epoch": 1713} {"train_loss": -5.948546409606934, "global_step": 71949, "epoch": 1713} {"train_loss": -6.1762919425964355, "global_step": 71950, "epoch": 1713} {"train_loss": -6.061384201049805, "global_step": 71951, "epoch": 1713} {"train_loss": -6.049907207489014, "global_step": 71952, "epoch": 1713} {"train_loss": -5.996220588684082, "global_step": 71953, "epoch": 1713} {"train_loss": -6.091691970825195, "global_step": 71954, "epoch": 1713} {"train_loss": -6.00485897064209, "global_step": 71955, "epoch": 1713} {"train_loss": -6.059940814971924, "global_step": 71956, "epoch": 1713} {"train_loss": -6.054676055908203, "global_step": 71957, "epoch": 1713} {"train_loss": -6.067313194274902, "global_step": 71958, "epoch": 1713} {"train_loss": -6.022068500518799, "global_step": 71959, "epoch": 1713} {"train_loss": -6.011693954467773, "global_step": 71960, "epoch": 1713} {"train_loss": -5.97586727142334, "global_step": 71961, "epoch": 1713} {"train_loss": -6.008971214294434, "global_step": 71962, "epoch": 1713} {"train_loss": -6.072563171386719, "global_step": 71963, "epoch": 1713} {"train_loss": -6.068965911865234, "global_step": 71964, "epoch": 1713} {"train_loss": -6.026411056518555, "global_step": 71965, "epoch": 1713} {"train_loss": -5.983943939208984, "global_step": 71966, "epoch": 1713} {"train_loss": -6.046722888946533, "global_step": 71967, "epoch": 1713} {"train_loss": -6.058965682983398, "global_step": 71968, "epoch": 1713} {"train_loss": -6.179489612579346, "global_step": 71969, "epoch": 1713} {"train_loss": -6.017155170440674, "global_step": 71970, "epoch": 1713} {"train_loss": -6.088571548461914, "global_step": 71971, "epoch": 1713} {"train_loss": -6.031914710998535, "global_step": 71972, "epoch": 1713} {"train_loss": -6.046013832092285, "global_step": 71973, "epoch": 1713} {"train_loss": -6.1346869468688965, "global_step": 71974, "epoch": 1713} {"train_loss": -6.108678817749023, "global_step": 71975, "epoch": 1713} {"train_loss": -6.066533088684082, "global_step": 71976, "epoch": 1713} {"train_loss": -6.031538009643555, "global_step": 71977, "epoch": 1713} {"train_loss": -5.920526504516602, "global_step": 71978, "epoch": 1713} {"train_loss": -5.945745468139648, "global_step": 71979, "epoch": 1713} {"train_loss": -6.046979904174805, "global_step": 71980, "epoch": 1713} {"train_loss": -6.118499755859375, "global_step": 71981, "epoch": 1713} {"train_loss": -6.102583885192871, "global_step": 71982, "epoch": 1713} {"train_loss": -5.976667881011963, "global_step": 71983, "epoch": 1713} {"train_loss": -5.980997085571289, "global_step": 71984, "epoch": 1713} {"train_loss": -6.0044097900390625, "global_step": 71985, "epoch": 1713} {"train_loss": -6.109983921051025, "global_step": 71986, "epoch": 1713} {"train_loss": -6.039774599529448, "global_step": 71987, "epoch": 1713, "val_loss": 67532.46875} {"train_loss": -5.96885871887207, "global_step": 71988, "epoch": 1714} {"train_loss": -6.171402931213379, "global_step": 71989, "epoch": 1714} {"train_loss": -6.06240701675415, "global_step": 71990, "epoch": 1714} {"train_loss": -6.0189313888549805, "global_step": 71991, "epoch": 1714} {"train_loss": -6.12664794921875, "global_step": 71992, "epoch": 1714} {"train_loss": -6.055391311645508, "global_step": 71993, "epoch": 1714} {"train_loss": -6.028280735015869, "global_step": 71994, "epoch": 1714} {"train_loss": -5.97973108291626, "global_step": 71995, "epoch": 1714} {"train_loss": -6.049307346343994, "global_step": 71996, "epoch": 1714} {"train_loss": -6.0907697677612305, "global_step": 71997, "epoch": 1714} {"train_loss": -5.892868995666504, "global_step": 71998, "epoch": 1714} {"train_loss": -6.018889904022217, "global_step": 71999, "epoch": 1714} {"train_loss": -6.038325309753418, "global_step": 72000, "epoch": 1714} {"train_loss": -6.006594657897949, "global_step": 72001, "epoch": 1714} {"train_loss": -5.995001792907715, "global_step": 72002, "epoch": 1714} {"train_loss": -6.018888473510742, "global_step": 72003, "epoch": 1714} {"train_loss": -6.003978729248047, "global_step": 72004, "epoch": 1714} {"train_loss": -5.999970436096191, "global_step": 72005, "epoch": 1714} {"train_loss": -6.12817907333374, "global_step": 72006, "epoch": 1714} {"train_loss": -5.9951887130737305, "global_step": 72007, "epoch": 1714} {"train_loss": -6.030142784118652, "global_step": 72008, "epoch": 1714} {"train_loss": -5.9432525634765625, "global_step": 72009, "epoch": 1714} {"train_loss": -6.022789001464844, "global_step": 72010, "epoch": 1714} {"train_loss": -6.137324333190918, "global_step": 72011, "epoch": 1714} {"train_loss": -6.001526355743408, "global_step": 72012, "epoch": 1714} {"train_loss": -5.983024597167969, "global_step": 72013, "epoch": 1714} {"train_loss": -6.062314033508301, "global_step": 72014, "epoch": 1714} {"train_loss": -6.01632022857666, "global_step": 72015, "epoch": 1714} {"train_loss": -6.016840934753418, "global_step": 72016, "epoch": 1714} {"train_loss": -5.942411422729492, "global_step": 72017, "epoch": 1714} {"train_loss": -6.045493125915527, "global_step": 72018, "epoch": 1714} {"train_loss": -6.109990119934082, "global_step": 72019, "epoch": 1714} {"train_loss": -5.869395732879639, "global_step": 72020, "epoch": 1714} {"train_loss": -5.934808731079102, "global_step": 72021, "epoch": 1714} {"train_loss": -5.8420796394348145, "global_step": 72022, "epoch": 1714} {"train_loss": -6.053377151489258, "global_step": 72023, "epoch": 1714} {"train_loss": -5.9613447189331055, "global_step": 72024, "epoch": 1714} {"train_loss": -5.930519104003906, "global_step": 72025, "epoch": 1714} {"train_loss": -5.9261627197265625, "global_step": 72026, "epoch": 1714} {"train_loss": -6.055586338043213, "global_step": 72027, "epoch": 1714} {"train_loss": -5.931837558746338, "global_step": 72028, "epoch": 1714} {"train_loss": -6.01179035504659, "global_step": 72029, "epoch": 1714, "val_loss": 67393.4375} {"train_loss": -6.065072059631348, "global_step": 72030, "epoch": 1715} {"train_loss": -6.082386493682861, "global_step": 72031, "epoch": 1715} {"train_loss": -5.931982517242432, "global_step": 72032, "epoch": 1715} {"train_loss": -6.108218193054199, "global_step": 72033, "epoch": 1715} {"train_loss": -6.026047706604004, "global_step": 72034, "epoch": 1715} {"train_loss": -5.910516738891602, "global_step": 72035, "epoch": 1715} {"train_loss": -6.040288925170898, "global_step": 72036, "epoch": 1715} {"train_loss": -6.054617881774902, "global_step": 72037, "epoch": 1715} {"train_loss": -6.056150436401367, "global_step": 72038, "epoch": 1715} {"train_loss": -6.008281707763672, "global_step": 72039, "epoch": 1715} {"train_loss": -5.955392837524414, "global_step": 72040, "epoch": 1715} {"train_loss": -6.113834381103516, "global_step": 72041, "epoch": 1715} {"train_loss": -6.054758071899414, "global_step": 72042, "epoch": 1715} {"train_loss": -6.117944717407227, "global_step": 72043, "epoch": 1715} {"train_loss": -5.895890235900879, "global_step": 72044, "epoch": 1715} {"train_loss": -6.167904853820801, "global_step": 72045, "epoch": 1715} {"train_loss": -6.03837776184082, "global_step": 72046, "epoch": 1715} {"train_loss": -6.023378849029541, "global_step": 72047, "epoch": 1715} {"train_loss": -6.042885780334473, "global_step": 72048, "epoch": 1715} {"train_loss": -6.024881362915039, "global_step": 72049, "epoch": 1715} {"train_loss": -6.145995616912842, "global_step": 72050, "epoch": 1715} {"train_loss": -5.969498634338379, "global_step": 72051, "epoch": 1715} {"train_loss": -6.0703511238098145, "global_step": 72052, "epoch": 1715} {"train_loss": -6.0575737953186035, "global_step": 72053, "epoch": 1715} {"train_loss": -6.065934181213379, "global_step": 72054, "epoch": 1715} {"train_loss": -6.04369592666626, "global_step": 72055, "epoch": 1715} {"train_loss": -6.052957534790039, "global_step": 72056, "epoch": 1715} {"train_loss": -5.986790657043457, "global_step": 72057, "epoch": 1715} {"train_loss": -6.146538734436035, "global_step": 72058, "epoch": 1715} {"train_loss": -6.08310604095459, "global_step": 72059, "epoch": 1715} {"train_loss": -6.014327526092529, "global_step": 72060, "epoch": 1715} {"train_loss": -6.086698532104492, "global_step": 72061, "epoch": 1715} {"train_loss": -6.027456283569336, "global_step": 72062, "epoch": 1715} {"train_loss": -5.955750465393066, "global_step": 72063, "epoch": 1715} {"train_loss": -6.056321144104004, "global_step": 72064, "epoch": 1715} {"train_loss": -6.000282287597656, "global_step": 72065, "epoch": 1715} {"train_loss": -5.9294843673706055, "global_step": 72066, "epoch": 1715} {"train_loss": -6.079238414764404, "global_step": 72067, "epoch": 1715} {"train_loss": -6.110589504241943, "global_step": 72068, "epoch": 1715} {"train_loss": -5.978150367736816, "global_step": 72069, "epoch": 1715} {"train_loss": -6.023493766784668, "global_step": 72070, "epoch": 1715} {"train_loss": -6.0400559675125844, "global_step": 72071, "epoch": 1715, "val_loss": 67431.5078125} {"train_loss": -6.1440839767456055, "global_step": 72072, "epoch": 1716} {"train_loss": -6.110773086547852, "global_step": 72073, "epoch": 1716} {"train_loss": -6.064123153686523, "global_step": 72074, "epoch": 1716} {"train_loss": -6.077138900756836, "global_step": 72075, "epoch": 1716} {"train_loss": -6.1208271980285645, "global_step": 72076, "epoch": 1716} {"train_loss": -6.005411148071289, "global_step": 72077, "epoch": 1716} {"train_loss": -6.052906036376953, "global_step": 72078, "epoch": 1716} {"train_loss": -6.160405158996582, "global_step": 72079, "epoch": 1716} {"train_loss": -5.962246894836426, "global_step": 72080, "epoch": 1716} {"train_loss": -6.033294677734375, "global_step": 72081, "epoch": 1716} {"train_loss": -6.0246429443359375, "global_step": 72082, "epoch": 1716} {"train_loss": -6.10914421081543, "global_step": 72083, "epoch": 1716} {"train_loss": -6.096118450164795, "global_step": 72084, "epoch": 1716} {"train_loss": -6.058839797973633, "global_step": 72085, "epoch": 1716} {"train_loss": -6.138625621795654, "global_step": 72086, "epoch": 1716} {"train_loss": -6.044560432434082, "global_step": 72087, "epoch": 1716} {"train_loss": -6.207343578338623, "global_step": 72088, "epoch": 1716} {"train_loss": -6.023283004760742, "global_step": 72089, "epoch": 1716} {"train_loss": -5.995984077453613, "global_step": 72090, "epoch": 1716} {"train_loss": -6.0571064949035645, "global_step": 72091, "epoch": 1716} {"train_loss": -6.126460075378418, "global_step": 72092, "epoch": 1716} {"train_loss": -6.092691421508789, "global_step": 72093, "epoch": 1716} {"train_loss": -6.030299186706543, "global_step": 72094, "epoch": 1716} {"train_loss": -6.055302619934082, "global_step": 72095, "epoch": 1716} {"train_loss": -5.922255992889404, "global_step": 72096, "epoch": 1716} {"train_loss": -6.08787727355957, "global_step": 72097, "epoch": 1716} {"train_loss": -6.052727699279785, "global_step": 72098, "epoch": 1716} {"train_loss": -6.03049373626709, "global_step": 72099, "epoch": 1716} {"train_loss": -5.961701393127441, "global_step": 72100, "epoch": 1716} {"train_loss": -6.116398811340332, "global_step": 72101, "epoch": 1716} {"train_loss": -5.93065881729126, "global_step": 72102, "epoch": 1716} {"train_loss": -6.046913146972656, "global_step": 72103, "epoch": 1716} {"train_loss": -5.959912300109863, "global_step": 72104, "epoch": 1716} {"train_loss": -6.046048164367676, "global_step": 72105, "epoch": 1716} {"train_loss": -6.147937774658203, "global_step": 72106, "epoch": 1716} {"train_loss": -5.949779033660889, "global_step": 72107, "epoch": 1716} {"train_loss": -6.023667812347412, "global_step": 72108, "epoch": 1716} {"train_loss": -6.027358055114746, "global_step": 72109, "epoch": 1716} {"train_loss": -5.9526214599609375, "global_step": 72110, "epoch": 1716} {"train_loss": -6.081185340881348, "global_step": 72111, "epoch": 1716} {"train_loss": -6.1452741622924805, "global_step": 72112, "epoch": 1716} {"train_loss": -6.052314008985247, "global_step": 72113, "epoch": 1716, "val_loss": 67338.359375} {"train_loss": -5.966261863708496, "global_step": 72114, "epoch": 1717} {"train_loss": -5.980877876281738, "global_step": 72115, "epoch": 1717} {"train_loss": -6.019328594207764, "global_step": 72116, "epoch": 1717} {"train_loss": -6.047566890716553, "global_step": 72117, "epoch": 1717} {"train_loss": -6.062375068664551, "global_step": 72118, "epoch": 1717} {"train_loss": -5.976398468017578, "global_step": 72119, "epoch": 1717} {"train_loss": -6.04248046875, "global_step": 72120, "epoch": 1717} {"train_loss": -6.084789276123047, "global_step": 72121, "epoch": 1717} {"train_loss": -6.061030387878418, "global_step": 72122, "epoch": 1717} {"train_loss": -6.098263263702393, "global_step": 72123, "epoch": 1717} {"train_loss": -5.960012912750244, "global_step": 72124, "epoch": 1717} {"train_loss": -6.030534267425537, "global_step": 72125, "epoch": 1717} {"train_loss": -5.849740982055664, "global_step": 72126, "epoch": 1717} {"train_loss": -6.045543670654297, "global_step": 72127, "epoch": 1717} {"train_loss": -5.9704132080078125, "global_step": 72128, "epoch": 1717} {"train_loss": -5.970698356628418, "global_step": 72129, "epoch": 1717} {"train_loss": -5.988205432891846, "global_step": 72130, "epoch": 1717} {"train_loss": -5.954044342041016, "global_step": 72131, "epoch": 1717} {"train_loss": -6.134183883666992, "global_step": 72132, "epoch": 1717} {"train_loss": -6.03123664855957, "global_step": 72133, "epoch": 1717} {"train_loss": -6.099496841430664, "global_step": 72134, "epoch": 1717} {"train_loss": -6.094880104064941, "global_step": 72135, "epoch": 1717} {"train_loss": -6.051947593688965, "global_step": 72136, "epoch": 1717} {"train_loss": -6.013249397277832, "global_step": 72137, "epoch": 1717} {"train_loss": -6.06544303894043, "global_step": 72138, "epoch": 1717} {"train_loss": -5.935629844665527, "global_step": 72139, "epoch": 1717} {"train_loss": -6.006484508514404, "global_step": 72140, "epoch": 1717} {"train_loss": -5.926980018615723, "global_step": 72141, "epoch": 1717} {"train_loss": -6.09260368347168, "global_step": 72142, "epoch": 1717} {"train_loss": -6.08770751953125, "global_step": 72143, "epoch": 1717} {"train_loss": -6.015791893005371, "global_step": 72144, "epoch": 1717} {"train_loss": -6.078741550445557, "global_step": 72145, "epoch": 1717} {"train_loss": -6.074797630310059, "global_step": 72146, "epoch": 1717} {"train_loss": -6.038646697998047, "global_step": 72147, "epoch": 1717} {"train_loss": -6.161803245544434, "global_step": 72148, "epoch": 1717} {"train_loss": -6.151917457580566, "global_step": 72149, "epoch": 1717} {"train_loss": -6.010652542114258, "global_step": 72150, "epoch": 1717} {"train_loss": -6.079712867736816, "global_step": 72151, "epoch": 1717} {"train_loss": -6.183928966522217, "global_step": 72152, "epoch": 1717} {"train_loss": -5.998732089996338, "global_step": 72153, "epoch": 1717} {"train_loss": -6.115361213684082, "global_step": 72154, "epoch": 1717} {"train_loss": -6.036598114740281, "global_step": 72155, "epoch": 1717, "val_loss": 67492.2890625} {"train_loss": -6.087360382080078, "global_step": 72156, "epoch": 1718} {"train_loss": -6.039062023162842, "global_step": 72157, "epoch": 1718} {"train_loss": -6.051804065704346, "global_step": 72158, "epoch": 1718} {"train_loss": -6.1192426681518555, "global_step": 72159, "epoch": 1718} {"train_loss": -5.99505615234375, "global_step": 72160, "epoch": 1718} {"train_loss": -6.039552211761475, "global_step": 72161, "epoch": 1718} {"train_loss": -6.1523003578186035, "global_step": 72162, "epoch": 1718} {"train_loss": -6.137439727783203, "global_step": 72163, "epoch": 1718} {"train_loss": -5.928150177001953, "global_step": 72164, "epoch": 1718} {"train_loss": -5.9473114013671875, "global_step": 72165, "epoch": 1718} {"train_loss": -5.96650505065918, "global_step": 72166, "epoch": 1718} {"train_loss": -6.046398639678955, "global_step": 72167, "epoch": 1718} {"train_loss": -6.060259819030762, "global_step": 72168, "epoch": 1718} {"train_loss": -6.1654767990112305, "global_step": 72169, "epoch": 1718} {"train_loss": -6.060035228729248, "global_step": 72170, "epoch": 1718} {"train_loss": -6.1016716957092285, "global_step": 72171, "epoch": 1718} {"train_loss": -6.006616592407227, "global_step": 72172, "epoch": 1718} {"train_loss": -5.969296455383301, "global_step": 72173, "epoch": 1718} {"train_loss": -6.054606914520264, "global_step": 72174, "epoch": 1718} {"train_loss": -5.981317043304443, "global_step": 72175, "epoch": 1718} {"train_loss": -6.078045845031738, "global_step": 72176, "epoch": 1718} {"train_loss": -6.126594066619873, "global_step": 72177, "epoch": 1718} {"train_loss": -6.177048206329346, "global_step": 72178, "epoch": 1718} {"train_loss": -5.961095809936523, "global_step": 72179, "epoch": 1718} {"train_loss": -6.010914325714111, "global_step": 72180, "epoch": 1718} {"train_loss": -5.8837809562683105, "global_step": 72181, "epoch": 1718} {"train_loss": -5.924043655395508, "global_step": 72182, "epoch": 1718} {"train_loss": -6.052229404449463, "global_step": 72183, "epoch": 1718} {"train_loss": -6.042919158935547, "global_step": 72184, "epoch": 1718} {"train_loss": -6.06282901763916, "global_step": 72185, "epoch": 1718} {"train_loss": -6.130208492279053, "global_step": 72186, "epoch": 1718} {"train_loss": -6.102077007293701, "global_step": 72187, "epoch": 1718} {"train_loss": -5.97406530380249, "global_step": 72188, "epoch": 1718} {"train_loss": -6.065548896789551, "global_step": 72189, "epoch": 1718} {"train_loss": -6.064759254455566, "global_step": 72190, "epoch": 1718} {"train_loss": -6.010656356811523, "global_step": 72191, "epoch": 1718} {"train_loss": -5.947393417358398, "global_step": 72192, "epoch": 1718} {"train_loss": -6.023007869720459, "global_step": 72193, "epoch": 1718} {"train_loss": -5.938620567321777, "global_step": 72194, "epoch": 1718} {"train_loss": -6.048486709594727, "global_step": 72195, "epoch": 1718} {"train_loss": -5.921821117401123, "global_step": 72196, "epoch": 1718} {"train_loss": -6.032984222684588, "global_step": 72197, "epoch": 1718, "val_loss": 67350.1015625} {"train_loss": -5.900315761566162, "global_step": 72198, "epoch": 1719} {"train_loss": -6.025132179260254, "global_step": 72199, "epoch": 1719} {"train_loss": -6.035154342651367, "global_step": 72200, "epoch": 1719} {"train_loss": -5.936946868896484, "global_step": 72201, "epoch": 1719} {"train_loss": -5.919676303863525, "global_step": 72202, "epoch": 1719} {"train_loss": -5.982566833496094, "global_step": 72203, "epoch": 1719} {"train_loss": -6.035099029541016, "global_step": 72204, "epoch": 1719} {"train_loss": -5.723236560821533, "global_step": 72205, "epoch": 1719} {"train_loss": -5.947872638702393, "global_step": 72206, "epoch": 1719} {"train_loss": -5.860785961151123, "global_step": 72207, "epoch": 1719} {"train_loss": -5.812661170959473, "global_step": 72208, "epoch": 1719} {"train_loss": -5.863618850708008, "global_step": 72209, "epoch": 1719} {"train_loss": -5.996664047241211, "global_step": 72210, "epoch": 1719} {"train_loss": -6.115961074829102, "global_step": 72211, "epoch": 1719} {"train_loss": -6.051825523376465, "global_step": 72212, "epoch": 1719} {"train_loss": -5.961596488952637, "global_step": 72213, "epoch": 1719} {"train_loss": -5.892536163330078, "global_step": 72214, "epoch": 1719} {"train_loss": -5.934191703796387, "global_step": 72215, "epoch": 1719} {"train_loss": -5.881867408752441, "global_step": 72216, "epoch": 1719} {"train_loss": -5.988454341888428, "global_step": 72217, "epoch": 1719} {"train_loss": -5.890411376953125, "global_step": 72218, "epoch": 1719} {"train_loss": -5.914142608642578, "global_step": 72219, "epoch": 1719} {"train_loss": -5.99375581741333, "global_step": 72220, "epoch": 1719} {"train_loss": -6.050104141235352, "global_step": 72221, "epoch": 1719} {"train_loss": -5.987819194793701, "global_step": 72222, "epoch": 1719} {"train_loss": -6.059791088104248, "global_step": 72223, "epoch": 1719} {"train_loss": -5.994135856628418, "global_step": 72224, "epoch": 1719} {"train_loss": -6.0693888664245605, "global_step": 72225, "epoch": 1719} {"train_loss": -6.151503086090088, "global_step": 72226, "epoch": 1719} {"train_loss": -6.025565147399902, "global_step": 72227, "epoch": 1719} {"train_loss": -5.964016914367676, "global_step": 72228, "epoch": 1719} {"train_loss": -6.11004638671875, "global_step": 72229, "epoch": 1719} {"train_loss": -6.067440986633301, "global_step": 72230, "epoch": 1719} {"train_loss": -6.040855407714844, "global_step": 72231, "epoch": 1719} {"train_loss": -6.049380779266357, "global_step": 72232, "epoch": 1719} {"train_loss": -5.996433734893799, "global_step": 72233, "epoch": 1719} {"train_loss": -6.118121147155762, "global_step": 72234, "epoch": 1719} {"train_loss": -6.066828727722168, "global_step": 72235, "epoch": 1719} {"train_loss": -6.110579967498779, "global_step": 72236, "epoch": 1719} {"train_loss": -5.977385520935059, "global_step": 72237, "epoch": 1719} {"train_loss": -5.921189308166504, "global_step": 72238, "epoch": 1719} {"train_loss": -5.989304406302316, "global_step": 72239, "epoch": 1719, "val_loss": 67668.515625} {"train_loss": -5.854391098022461, "global_step": 72240, "epoch": 1720} {"train_loss": -6.071433067321777, "global_step": 72241, "epoch": 1720} {"train_loss": -6.0258684158325195, "global_step": 72242, "epoch": 1720} {"train_loss": -6.037773132324219, "global_step": 72243, "epoch": 1720} {"train_loss": -6.063147068023682, "global_step": 72244, "epoch": 1720} {"train_loss": -5.933087348937988, "global_step": 72245, "epoch": 1720} {"train_loss": -6.073724746704102, "global_step": 72246, "epoch": 1720} {"train_loss": -6.057232856750488, "global_step": 72247, "epoch": 1720} {"train_loss": -5.958188056945801, "global_step": 72248, "epoch": 1720} {"train_loss": -6.234320163726807, "global_step": 72249, "epoch": 1720} {"train_loss": -6.036652088165283, "global_step": 72250, "epoch": 1720} {"train_loss": -5.983773708343506, "global_step": 72251, "epoch": 1720} {"train_loss": -6.058192253112793, "global_step": 72252, "epoch": 1720} {"train_loss": -6.0048065185546875, "global_step": 72253, "epoch": 1720} {"train_loss": -6.01263427734375, "global_step": 72254, "epoch": 1720} {"train_loss": -5.99898624420166, "global_step": 72255, "epoch": 1720} {"train_loss": -6.04440975189209, "global_step": 72256, "epoch": 1720} {"train_loss": -6.053327560424805, "global_step": 72257, "epoch": 1720} {"train_loss": -6.011706352233887, "global_step": 72258, "epoch": 1720} {"train_loss": -5.950908660888672, "global_step": 72259, "epoch": 1720} {"train_loss": -6.067163467407227, "global_step": 72260, "epoch": 1720} {"train_loss": -6.093478679656982, "global_step": 72261, "epoch": 1720} {"train_loss": -5.977651119232178, "global_step": 72262, "epoch": 1720} {"train_loss": -6.069490909576416, "global_step": 72263, "epoch": 1720} {"train_loss": -5.964815139770508, "global_step": 72264, "epoch": 1720} {"train_loss": -5.994301795959473, "global_step": 72265, "epoch": 1720} {"train_loss": -6.083050727844238, "global_step": 72266, "epoch": 1720} {"train_loss": -5.997422218322754, "global_step": 72267, "epoch": 1720} {"train_loss": -6.031312942504883, "global_step": 72268, "epoch": 1720} {"train_loss": -6.110801696777344, "global_step": 72269, "epoch": 1720} {"train_loss": -6.065065383911133, "global_step": 72270, "epoch": 1720} {"train_loss": -6.033098220825195, "global_step": 72271, "epoch": 1720} {"train_loss": -6.097506999969482, "global_step": 72272, "epoch": 1720} {"train_loss": -5.985246658325195, "global_step": 72273, "epoch": 1720} {"train_loss": -6.0118021965026855, "global_step": 72274, "epoch": 1720} {"train_loss": -6.052377700805664, "global_step": 72275, "epoch": 1720} {"train_loss": -6.031366348266602, "global_step": 72276, "epoch": 1720} {"train_loss": -6.065420150756836, "global_step": 72277, "epoch": 1720} {"train_loss": -6.065777778625488, "global_step": 72278, "epoch": 1720} {"train_loss": -6.018435001373291, "global_step": 72279, "epoch": 1720} {"train_loss": -5.9733052253723145, "global_step": 72280, "epoch": 1720} {"train_loss": -6.028409549168178, "global_step": 72281, "epoch": 1720, "val_loss": 67628.78125} {"train_loss": -6.008316516876221, "global_step": 72282, "epoch": 1721} {"train_loss": -6.147821426391602, "global_step": 72283, "epoch": 1721} {"train_loss": -6.104621887207031, "global_step": 72284, "epoch": 1721} {"train_loss": -6.027503967285156, "global_step": 72285, "epoch": 1721} {"train_loss": -5.961163520812988, "global_step": 72286, "epoch": 1721} {"train_loss": -6.065674304962158, "global_step": 72287, "epoch": 1721} {"train_loss": -6.015159606933594, "global_step": 72288, "epoch": 1721} {"train_loss": -6.105024337768555, "global_step": 72289, "epoch": 1721} {"train_loss": -5.9917449951171875, "global_step": 72290, "epoch": 1721} {"train_loss": -5.941384315490723, "global_step": 72291, "epoch": 1721} {"train_loss": -5.9595417976379395, "global_step": 72292, "epoch": 1721} {"train_loss": -6.0812602043151855, "global_step": 72293, "epoch": 1721} {"train_loss": -6.047616004943848, "global_step": 72294, "epoch": 1721} {"train_loss": -6.020747184753418, "global_step": 72295, "epoch": 1721} {"train_loss": -5.985659122467041, "global_step": 72296, "epoch": 1721} {"train_loss": -6.088407516479492, "global_step": 72297, "epoch": 1721} {"train_loss": -5.887299060821533, "global_step": 72298, "epoch": 1721} {"train_loss": -6.050682067871094, "global_step": 72299, "epoch": 1721} {"train_loss": -5.87851619720459, "global_step": 72300, "epoch": 1721} {"train_loss": -6.071393966674805, "global_step": 72301, "epoch": 1721} {"train_loss": -5.997308254241943, "global_step": 72302, "epoch": 1721} {"train_loss": -6.024600982666016, "global_step": 72303, "epoch": 1721} {"train_loss": -6.1420488357543945, "global_step": 72304, "epoch": 1721} {"train_loss": -5.870167255401611, "global_step": 72305, "epoch": 1721} {"train_loss": -6.021747589111328, "global_step": 72306, "epoch": 1721} {"train_loss": -6.023521423339844, "global_step": 72307, "epoch": 1721} {"train_loss": -6.04388952255249, "global_step": 72308, "epoch": 1721} {"train_loss": -5.949522018432617, "global_step": 72309, "epoch": 1721} {"train_loss": -5.923990249633789, "global_step": 72310, "epoch": 1721} {"train_loss": -6.06823205947876, "global_step": 72311, "epoch": 1721} {"train_loss": -5.955934524536133, "global_step": 72312, "epoch": 1721} {"train_loss": -6.059958457946777, "global_step": 72313, "epoch": 1721} {"train_loss": -6.087670803070068, "global_step": 72314, "epoch": 1721} {"train_loss": -6.1035566329956055, "global_step": 72315, "epoch": 1721} {"train_loss": -6.045515537261963, "global_step": 72316, "epoch": 1721} {"train_loss": -6.025607109069824, "global_step": 72317, "epoch": 1721} {"train_loss": -6.054658889770508, "global_step": 72318, "epoch": 1721} {"train_loss": -5.912614345550537, "global_step": 72319, "epoch": 1721} {"train_loss": -5.979813575744629, "global_step": 72320, "epoch": 1721} {"train_loss": -5.979939937591553, "global_step": 72321, "epoch": 1721} {"train_loss": -5.9234113693237305, "global_step": 72322, "epoch": 1721} {"train_loss": -6.017307383673532, "global_step": 72323, "epoch": 1721, "val_loss": 67451.5703125} {"train_loss": -6.098793983459473, "global_step": 72324, "epoch": 1722} {"train_loss": -6.092062473297119, "global_step": 72325, "epoch": 1722} {"train_loss": -6.013943672180176, "global_step": 72326, "epoch": 1722} {"train_loss": -6.243826866149902, "global_step": 72327, "epoch": 1722} {"train_loss": -6.076476097106934, "global_step": 72328, "epoch": 1722} {"train_loss": -5.925312042236328, "global_step": 72329, "epoch": 1722} {"train_loss": -6.048402309417725, "global_step": 72330, "epoch": 1722} {"train_loss": -6.100323677062988, "global_step": 72331, "epoch": 1722} {"train_loss": -6.052035331726074, "global_step": 72332, "epoch": 1722} {"train_loss": -6.066364288330078, "global_step": 72333, "epoch": 1722} {"train_loss": -6.120786666870117, "global_step": 72334, "epoch": 1722} {"train_loss": -5.958323955535889, "global_step": 72335, "epoch": 1722} {"train_loss": -6.047877788543701, "global_step": 72336, "epoch": 1722} {"train_loss": -5.913412094116211, "global_step": 72337, "epoch": 1722} {"train_loss": -6.10279655456543, "global_step": 72338, "epoch": 1722} {"train_loss": -6.115365028381348, "global_step": 72339, "epoch": 1722} {"train_loss": -5.958886623382568, "global_step": 72340, "epoch": 1722} {"train_loss": -5.984410285949707, "global_step": 72341, "epoch": 1722} {"train_loss": -6.045248985290527, "global_step": 72342, "epoch": 1722} {"train_loss": -6.099386215209961, "global_step": 72343, "epoch": 1722} {"train_loss": -5.963099479675293, "global_step": 72344, "epoch": 1722} {"train_loss": -6.041177749633789, "global_step": 72345, "epoch": 1722} {"train_loss": -6.02561092376709, "global_step": 72346, "epoch": 1722} {"train_loss": -6.055671691894531, "global_step": 72347, "epoch": 1722} {"train_loss": -5.970833778381348, "global_step": 72348, "epoch": 1722} {"train_loss": -6.106594085693359, "global_step": 72349, "epoch": 1722} {"train_loss": -6.073816299438477, "global_step": 72350, "epoch": 1722} {"train_loss": -5.990981578826904, "global_step": 72351, "epoch": 1722} {"train_loss": -5.970394134521484, "global_step": 72352, "epoch": 1722} {"train_loss": -6.057338714599609, "global_step": 72353, "epoch": 1722} {"train_loss": -6.08999490737915, "global_step": 72354, "epoch": 1722} {"train_loss": -6.027621746063232, "global_step": 72355, "epoch": 1722} {"train_loss": -6.075904369354248, "global_step": 72356, "epoch": 1722} {"train_loss": -6.1410603523254395, "global_step": 72357, "epoch": 1722} {"train_loss": -6.055670738220215, "global_step": 72358, "epoch": 1722} {"train_loss": -5.982633590698242, "global_step": 72359, "epoch": 1722} {"train_loss": -6.085111618041992, "global_step": 72360, "epoch": 1722} {"train_loss": -6.006552696228027, "global_step": 72361, "epoch": 1722} {"train_loss": -6.059460639953613, "global_step": 72362, "epoch": 1722} {"train_loss": -6.0886030197143555, "global_step": 72363, "epoch": 1722} {"train_loss": -6.05772066116333, "global_step": 72364, "epoch": 1722} {"train_loss": -6.0489800203414195, "global_step": 72365, "epoch": 1722, "val_loss": 67265.7890625} {"train_loss": -6.080916881561279, "global_step": 72366, "epoch": 1723} {"train_loss": -5.989071846008301, "global_step": 72367, "epoch": 1723} {"train_loss": -6.037813663482666, "global_step": 72368, "epoch": 1723} {"train_loss": -6.074409484863281, "global_step": 72369, "epoch": 1723} {"train_loss": -5.939545631408691, "global_step": 72370, "epoch": 1723} {"train_loss": -5.994952201843262, "global_step": 72371, "epoch": 1723} {"train_loss": -6.121870994567871, "global_step": 72372, "epoch": 1723} {"train_loss": -6.05810546875, "global_step": 72373, "epoch": 1723} {"train_loss": -6.185239315032959, "global_step": 72374, "epoch": 1723} {"train_loss": -6.064103126525879, "global_step": 72375, "epoch": 1723} {"train_loss": -6.042604923248291, "global_step": 72376, "epoch": 1723} {"train_loss": -6.1370439529418945, "global_step": 72377, "epoch": 1723} {"train_loss": -6.121531009674072, "global_step": 72378, "epoch": 1723} {"train_loss": -6.0398149490356445, "global_step": 72379, "epoch": 1723} {"train_loss": -6.123508453369141, "global_step": 72380, "epoch": 1723} {"train_loss": -5.949619293212891, "global_step": 72381, "epoch": 1723} {"train_loss": -6.220848560333252, "global_step": 72382, "epoch": 1723} {"train_loss": -6.008785247802734, "global_step": 72383, "epoch": 1723} {"train_loss": -6.0403618812561035, "global_step": 72384, "epoch": 1723} {"train_loss": -6.0048828125, "global_step": 72385, "epoch": 1723} {"train_loss": -6.087092399597168, "global_step": 72386, "epoch": 1723} {"train_loss": -5.984837055206299, "global_step": 72387, "epoch": 1723} {"train_loss": -5.997654438018799, "global_step": 72388, "epoch": 1723} {"train_loss": -5.960897445678711, "global_step": 72389, "epoch": 1723} {"train_loss": -5.973154544830322, "global_step": 72390, "epoch": 1723} {"train_loss": -6.04106330871582, "global_step": 72391, "epoch": 1723} {"train_loss": -6.0250349044799805, "global_step": 72392, "epoch": 1723} {"train_loss": -6.034553527832031, "global_step": 72393, "epoch": 1723} {"train_loss": -5.995547771453857, "global_step": 72394, "epoch": 1723} {"train_loss": -6.080587387084961, "global_step": 72395, "epoch": 1723} {"train_loss": -6.044149398803711, "global_step": 72396, "epoch": 1723} {"train_loss": -6.022683143615723, "global_step": 72397, "epoch": 1723} {"train_loss": -6.049976348876953, "global_step": 72398, "epoch": 1723} {"train_loss": -5.926058769226074, "global_step": 72399, "epoch": 1723} {"train_loss": -6.0437541007995605, "global_step": 72400, "epoch": 1723} {"train_loss": -5.84472131729126, "global_step": 72401, "epoch": 1723} {"train_loss": -6.048324108123779, "global_step": 72402, "epoch": 1723} {"train_loss": -6.112905025482178, "global_step": 72403, "epoch": 1723} {"train_loss": -6.016257286071777, "global_step": 72404, "epoch": 1723} {"train_loss": -6.026833534240723, "global_step": 72405, "epoch": 1723} {"train_loss": -6.117949485778809, "global_step": 72406, "epoch": 1723} {"train_loss": -6.040224711100261, "global_step": 72407, "epoch": 1723, "val_loss": 67220.1875} {"train_loss": -6.097225666046143, "global_step": 72408, "epoch": 1724} {"train_loss": -6.045814514160156, "global_step": 72409, "epoch": 1724} {"train_loss": -6.025141716003418, "global_step": 72410, "epoch": 1724} {"train_loss": -6.032558441162109, "global_step": 72411, "epoch": 1724} {"train_loss": -6.04873514175415, "global_step": 72412, "epoch": 1724} {"train_loss": -6.0032782554626465, "global_step": 72413, "epoch": 1724} {"train_loss": -6.123516082763672, "global_step": 72414, "epoch": 1724} {"train_loss": -5.8225626945495605, "global_step": 72415, "epoch": 1724} {"train_loss": -6.032987594604492, "global_step": 72416, "epoch": 1724} {"train_loss": -5.890203475952148, "global_step": 72417, "epoch": 1724} {"train_loss": -6.00680685043335, "global_step": 72418, "epoch": 1724} {"train_loss": -5.977136611938477, "global_step": 72419, "epoch": 1724} {"train_loss": -6.162350654602051, "global_step": 72420, "epoch": 1724} {"train_loss": -6.079954147338867, "global_step": 72421, "epoch": 1724} {"train_loss": -5.967475891113281, "global_step": 72422, "epoch": 1724} {"train_loss": -6.044126510620117, "global_step": 72423, "epoch": 1724} {"train_loss": -5.952228546142578, "global_step": 72424, "epoch": 1724} {"train_loss": -5.886041641235352, "global_step": 72425, "epoch": 1724} {"train_loss": -6.038082122802734, "global_step": 72426, "epoch": 1724} {"train_loss": -6.080577850341797, "global_step": 72427, "epoch": 1724} {"train_loss": -5.9294891357421875, "global_step": 72428, "epoch": 1724} {"train_loss": -6.068454742431641, "global_step": 72429, "epoch": 1724} {"train_loss": -5.938279151916504, "global_step": 72430, "epoch": 1724} {"train_loss": -5.982813358306885, "global_step": 72431, "epoch": 1724} {"train_loss": -6.04102897644043, "global_step": 72432, "epoch": 1724} {"train_loss": -5.949173927307129, "global_step": 72433, "epoch": 1724} {"train_loss": -6.013387680053711, "global_step": 72434, "epoch": 1724} {"train_loss": -5.952816009521484, "global_step": 72435, "epoch": 1724} {"train_loss": -5.886840343475342, "global_step": 72436, "epoch": 1724} {"train_loss": -5.933991432189941, "global_step": 72437, "epoch": 1724} {"train_loss": -5.983522891998291, "global_step": 72438, "epoch": 1724} {"train_loss": -5.8592729568481445, "global_step": 72439, "epoch": 1724} {"train_loss": -6.040624141693115, "global_step": 72440, "epoch": 1724} {"train_loss": -6.057743072509766, "global_step": 72441, "epoch": 1724} {"train_loss": -5.930924892425537, "global_step": 72442, "epoch": 1724} {"train_loss": -6.078536033630371, "global_step": 72443, "epoch": 1724} {"train_loss": -6.072235107421875, "global_step": 72444, "epoch": 1724} {"train_loss": -5.985840797424316, "global_step": 72445, "epoch": 1724} {"train_loss": -5.998098373413086, "global_step": 72446, "epoch": 1724} {"train_loss": -6.117796897888184, "global_step": 72447, "epoch": 1724} {"train_loss": -5.968961715698242, "global_step": 72448, "epoch": 1724} {"train_loss": -6.003571612494333, "global_step": 72449, "epoch": 1724, "val_loss": 67549.421875} {"train_loss": -6.00097131729126, "global_step": 72450, "epoch": 1725} {"train_loss": -5.962678909301758, "global_step": 72451, "epoch": 1725} {"train_loss": -5.985783100128174, "global_step": 72452, "epoch": 1725} {"train_loss": -5.963962078094482, "global_step": 72453, "epoch": 1725} {"train_loss": -5.992896556854248, "global_step": 72454, "epoch": 1725} {"train_loss": -6.022798538208008, "global_step": 72455, "epoch": 1725} {"train_loss": -6.137465953826904, "global_step": 72456, "epoch": 1725} {"train_loss": -6.0526275634765625, "global_step": 72457, "epoch": 1725} {"train_loss": -6.0535664558410645, "global_step": 72458, "epoch": 1725} {"train_loss": -6.162322044372559, "global_step": 72459, "epoch": 1725} {"train_loss": -6.162707328796387, "global_step": 72460, "epoch": 1725} {"train_loss": -5.96787166595459, "global_step": 72461, "epoch": 1725} {"train_loss": -5.991199016571045, "global_step": 72462, "epoch": 1725} {"train_loss": -6.004931449890137, "global_step": 72463, "epoch": 1725} {"train_loss": -5.975829124450684, "global_step": 72464, "epoch": 1725} {"train_loss": -6.047025680541992, "global_step": 72465, "epoch": 1725} {"train_loss": -6.162026882171631, "global_step": 72466, "epoch": 1725} {"train_loss": -6.065953254699707, "global_step": 72467, "epoch": 1725} {"train_loss": -5.954354286193848, "global_step": 72468, "epoch": 1725} {"train_loss": -6.062355995178223, "global_step": 72469, "epoch": 1725} {"train_loss": -5.976740837097168, "global_step": 72470, "epoch": 1725} {"train_loss": -6.013100624084473, "global_step": 72471, "epoch": 1725} {"train_loss": -6.02299690246582, "global_step": 72472, "epoch": 1725} {"train_loss": -5.951329708099365, "global_step": 72473, "epoch": 1725} {"train_loss": -5.994844913482666, "global_step": 72474, "epoch": 1725} {"train_loss": -6.092536926269531, "global_step": 72475, "epoch": 1725} {"train_loss": -6.141022205352783, "global_step": 72476, "epoch": 1725} {"train_loss": -5.9359025955200195, "global_step": 72477, "epoch": 1725} {"train_loss": -6.090880393981934, "global_step": 72478, "epoch": 1725} {"train_loss": -6.067169666290283, "global_step": 72479, "epoch": 1725} {"train_loss": -6.006312370300293, "global_step": 72480, "epoch": 1725} {"train_loss": -6.007157802581787, "global_step": 72481, "epoch": 1725} {"train_loss": -6.105668067932129, "global_step": 72482, "epoch": 1725} {"train_loss": -6.002401351928711, "global_step": 72483, "epoch": 1725} {"train_loss": -5.990799903869629, "global_step": 72484, "epoch": 1725} {"train_loss": -6.04025936126709, "global_step": 72485, "epoch": 1725} {"train_loss": -5.9724650382995605, "global_step": 72486, "epoch": 1725} {"train_loss": -6.04903507232666, "global_step": 72487, "epoch": 1725} {"train_loss": -6.065650939941406, "global_step": 72488, "epoch": 1725} {"train_loss": -6.098034858703613, "global_step": 72489, "epoch": 1725} {"train_loss": -6.105927467346191, "global_step": 72490, "epoch": 1725} {"train_loss": -6.0345640409560435, "global_step": 72491, "epoch": 1725, "val_loss": 67443.1953125} {"train_loss": -5.945100784301758, "global_step": 72492, "epoch": 1726} {"train_loss": -6.053614139556885, "global_step": 72493, "epoch": 1726} {"train_loss": -6.039127349853516, "global_step": 72494, "epoch": 1726} {"train_loss": -6.1132073402404785, "global_step": 72495, "epoch": 1726} {"train_loss": -6.148423194885254, "global_step": 72496, "epoch": 1726} {"train_loss": -5.983281135559082, "global_step": 72497, "epoch": 1726} {"train_loss": -5.9574174880981445, "global_step": 72498, "epoch": 1726} {"train_loss": -6.054283142089844, "global_step": 72499, "epoch": 1726} {"train_loss": -5.965945243835449, "global_step": 72500, "epoch": 1726} {"train_loss": -6.06328010559082, "global_step": 72501, "epoch": 1726} {"train_loss": -6.097963333129883, "global_step": 72502, "epoch": 1726} {"train_loss": -6.008459091186523, "global_step": 72503, "epoch": 1726} {"train_loss": -6.187394142150879, "global_step": 72504, "epoch": 1726} {"train_loss": -5.958998203277588, "global_step": 72505, "epoch": 1726} {"train_loss": -6.018198013305664, "global_step": 72506, "epoch": 1726} {"train_loss": -6.057394027709961, "global_step": 72507, "epoch": 1726} {"train_loss": -5.886786937713623, "global_step": 72508, "epoch": 1726} {"train_loss": -6.020664691925049, "global_step": 72509, "epoch": 1726} {"train_loss": -6.019173622131348, "global_step": 72510, "epoch": 1726} {"train_loss": -6.124950408935547, "global_step": 72511, "epoch": 1726} {"train_loss": -5.983164310455322, "global_step": 72512, "epoch": 1726} {"train_loss": -6.063538551330566, "global_step": 72513, "epoch": 1726} {"train_loss": -6.083662033081055, "global_step": 72514, "epoch": 1726} {"train_loss": -6.017481803894043, "global_step": 72515, "epoch": 1726} {"train_loss": -6.071882247924805, "global_step": 72516, "epoch": 1726} {"train_loss": -5.930881500244141, "global_step": 72517, "epoch": 1726} {"train_loss": -6.068788528442383, "global_step": 72518, "epoch": 1726} {"train_loss": -6.047720909118652, "global_step": 72519, "epoch": 1726} {"train_loss": -6.038996696472168, "global_step": 72520, "epoch": 1726} {"train_loss": -6.0365447998046875, "global_step": 72521, "epoch": 1726} {"train_loss": -5.978403568267822, "global_step": 72522, "epoch": 1726} {"train_loss": -5.946438312530518, "global_step": 72523, "epoch": 1726} {"train_loss": -6.065208435058594, "global_step": 72524, "epoch": 1726} {"train_loss": -6.2104926109313965, "global_step": 72525, "epoch": 1726} {"train_loss": -5.930597305297852, "global_step": 72526, "epoch": 1726} {"train_loss": -6.0897417068481445, "global_step": 72527, "epoch": 1726} {"train_loss": -5.965121269226074, "global_step": 72528, "epoch": 1726} {"train_loss": -6.001567363739014, "global_step": 72529, "epoch": 1726} {"train_loss": -6.034605503082275, "global_step": 72530, "epoch": 1726} {"train_loss": -6.052674293518066, "global_step": 72531, "epoch": 1726} {"train_loss": -6.086293697357178, "global_step": 72532, "epoch": 1726} {"train_loss": -6.034838892164684, "global_step": 72533, "epoch": 1726, "val_loss": 67458.78125} {"train_loss": -6.051587104797363, "global_step": 72534, "epoch": 1727} {"train_loss": -6.016660690307617, "global_step": 72535, "epoch": 1727} {"train_loss": -6.0290679931640625, "global_step": 72536, "epoch": 1727} {"train_loss": -6.038454055786133, "global_step": 72537, "epoch": 1727} {"train_loss": -5.969728946685791, "global_step": 72538, "epoch": 1727} {"train_loss": -6.097565174102783, "global_step": 72539, "epoch": 1727} {"train_loss": -6.1099042892456055, "global_step": 72540, "epoch": 1727} {"train_loss": -6.116182327270508, "global_step": 72541, "epoch": 1727} {"train_loss": -6.107372283935547, "global_step": 72542, "epoch": 1727} {"train_loss": -6.035876274108887, "global_step": 72543, "epoch": 1727} {"train_loss": -6.145360469818115, "global_step": 72544, "epoch": 1727} {"train_loss": -6.119139194488525, "global_step": 72545, "epoch": 1727} {"train_loss": -5.931082248687744, "global_step": 72546, "epoch": 1727} {"train_loss": -6.03837776184082, "global_step": 72547, "epoch": 1727} {"train_loss": -5.9735941886901855, "global_step": 72548, "epoch": 1727} {"train_loss": -5.986746788024902, "global_step": 72549, "epoch": 1727} {"train_loss": -6.072267532348633, "global_step": 72550, "epoch": 1727} {"train_loss": -6.056015968322754, "global_step": 72551, "epoch": 1727} {"train_loss": -5.993309020996094, "global_step": 72552, "epoch": 1727} {"train_loss": -5.936197280883789, "global_step": 72553, "epoch": 1727} {"train_loss": -6.0255327224731445, "global_step": 72554, "epoch": 1727} {"train_loss": -6.014505386352539, "global_step": 72555, "epoch": 1727} {"train_loss": -5.960484504699707, "global_step": 72556, "epoch": 1727} {"train_loss": -5.981022834777832, "global_step": 72557, "epoch": 1727} {"train_loss": -6.028670310974121, "global_step": 72558, "epoch": 1727} {"train_loss": -6.015054702758789, "global_step": 72559, "epoch": 1727} {"train_loss": -5.927633762359619, "global_step": 72560, "epoch": 1727} {"train_loss": -5.938765525817871, "global_step": 72561, "epoch": 1727} {"train_loss": -6.018258571624756, "global_step": 72562, "epoch": 1727} {"train_loss": -6.0072174072265625, "global_step": 72563, "epoch": 1727} {"train_loss": -6.016970634460449, "global_step": 72564, "epoch": 1727} {"train_loss": -5.993398189544678, "global_step": 72565, "epoch": 1727} {"train_loss": -6.036457061767578, "global_step": 72566, "epoch": 1727} {"train_loss": -5.964419364929199, "global_step": 72567, "epoch": 1727} {"train_loss": -6.091631889343262, "global_step": 72568, "epoch": 1727} {"train_loss": -6.032039642333984, "global_step": 72569, "epoch": 1727} {"train_loss": -6.031664848327637, "global_step": 72570, "epoch": 1727} {"train_loss": -6.035065650939941, "global_step": 72571, "epoch": 1727} {"train_loss": -6.013093948364258, "global_step": 72572, "epoch": 1727} {"train_loss": -6.035079002380371, "global_step": 72573, "epoch": 1727} {"train_loss": -6.069433212280273, "global_step": 72574, "epoch": 1727} {"train_loss": -6.0282383646283835, "global_step": 72575, "epoch": 1727, "val_loss": 67453.109375} {"train_loss": -6.01261568069458, "global_step": 72576, "epoch": 1728} {"train_loss": -5.991736888885498, "global_step": 72577, "epoch": 1728} {"train_loss": -6.0733747482299805, "global_step": 72578, "epoch": 1728} {"train_loss": -6.12059211730957, "global_step": 72579, "epoch": 1728} {"train_loss": -6.151914596557617, "global_step": 72580, "epoch": 1728} {"train_loss": -6.12100887298584, "global_step": 72581, "epoch": 1728} {"train_loss": -6.125739097595215, "global_step": 72582, "epoch": 1728} {"train_loss": -6.0979156494140625, "global_step": 72583, "epoch": 1728} {"train_loss": -6.124726295471191, "global_step": 72584, "epoch": 1728} {"train_loss": -6.102785587310791, "global_step": 72585, "epoch": 1728} {"train_loss": -5.996586322784424, "global_step": 72586, "epoch": 1728} {"train_loss": -6.007968425750732, "global_step": 72587, "epoch": 1728} {"train_loss": -6.064887046813965, "global_step": 72588, "epoch": 1728} {"train_loss": -5.940052509307861, "global_step": 72589, "epoch": 1728} {"train_loss": -6.142918109893799, "global_step": 72590, "epoch": 1728} {"train_loss": -5.974441051483154, "global_step": 72591, "epoch": 1728} {"train_loss": -6.0069193840026855, "global_step": 72592, "epoch": 1728} {"train_loss": -5.971871376037598, "global_step": 72593, "epoch": 1728} {"train_loss": -6.0246124267578125, "global_step": 72594, "epoch": 1728} {"train_loss": -6.0670084953308105, "global_step": 72595, "epoch": 1728} {"train_loss": -6.153437614440918, "global_step": 72596, "epoch": 1728} {"train_loss": -6.010068893432617, "global_step": 72597, "epoch": 1728} {"train_loss": -6.0242085456848145, "global_step": 72598, "epoch": 1728} {"train_loss": -6.022099494934082, "global_step": 72599, "epoch": 1728} {"train_loss": -6.048844337463379, "global_step": 72600, "epoch": 1728} {"train_loss": -6.087069511413574, "global_step": 72601, "epoch": 1728} {"train_loss": -6.054180145263672, "global_step": 72602, "epoch": 1728} {"train_loss": -5.997923374176025, "global_step": 72603, "epoch": 1728} {"train_loss": -6.106534004211426, "global_step": 72604, "epoch": 1728} {"train_loss": -5.937153339385986, "global_step": 72605, "epoch": 1728} {"train_loss": -6.037209510803223, "global_step": 72606, "epoch": 1728} {"train_loss": -6.081916332244873, "global_step": 72607, "epoch": 1728} {"train_loss": -5.986807823181152, "global_step": 72608, "epoch": 1728} {"train_loss": -6.105016708374023, "global_step": 72609, "epoch": 1728} {"train_loss": -6.01212215423584, "global_step": 72610, "epoch": 1728} {"train_loss": -6.005127906799316, "global_step": 72611, "epoch": 1728} {"train_loss": -6.02716064453125, "global_step": 72612, "epoch": 1728} {"train_loss": -6.074874401092529, "global_step": 72613, "epoch": 1728} {"train_loss": -6.033998489379883, "global_step": 72614, "epoch": 1728} {"train_loss": -5.892844200134277, "global_step": 72615, "epoch": 1728} {"train_loss": -6.005295753479004, "global_step": 72616, "epoch": 1728} {"train_loss": -6.043799797693889, "global_step": 72617, "epoch": 1728, "val_loss": 67597.1640625} {"train_loss": -6.0181074142456055, "global_step": 72618, "epoch": 1729} {"train_loss": -5.970081329345703, "global_step": 72619, "epoch": 1729} {"train_loss": -5.998827934265137, "global_step": 72620, "epoch": 1729} {"train_loss": -6.103558540344238, "global_step": 72621, "epoch": 1729} {"train_loss": -5.994157314300537, "global_step": 72622, "epoch": 1729} {"train_loss": -6.101444244384766, "global_step": 72623, "epoch": 1729} {"train_loss": -5.91520357131958, "global_step": 72624, "epoch": 1729} {"train_loss": -6.048038482666016, "global_step": 72625, "epoch": 1729} {"train_loss": -6.0573272705078125, "global_step": 72626, "epoch": 1729} {"train_loss": -5.970852375030518, "global_step": 72627, "epoch": 1729} {"train_loss": -6.001591205596924, "global_step": 72628, "epoch": 1729} {"train_loss": -6.107088088989258, "global_step": 72629, "epoch": 1729} {"train_loss": -5.997231483459473, "global_step": 72630, "epoch": 1729} {"train_loss": -6.152130603790283, "global_step": 72631, "epoch": 1729} {"train_loss": -6.077914714813232, "global_step": 72632, "epoch": 1729} {"train_loss": -5.972157001495361, "global_step": 72633, "epoch": 1729} {"train_loss": -5.983739376068115, "global_step": 72634, "epoch": 1729} {"train_loss": -6.042179107666016, "global_step": 72635, "epoch": 1729} {"train_loss": -6.034923553466797, "global_step": 72636, "epoch": 1729} {"train_loss": -6.010217666625977, "global_step": 72637, "epoch": 1729} {"train_loss": -6.045382499694824, "global_step": 72638, "epoch": 1729} {"train_loss": -6.062104225158691, "global_step": 72639, "epoch": 1729} {"train_loss": -5.911577224731445, "global_step": 72640, "epoch": 1729} {"train_loss": -6.149877548217773, "global_step": 72641, "epoch": 1729} {"train_loss": -6.131592273712158, "global_step": 72642, "epoch": 1729} {"train_loss": -5.797194480895996, "global_step": 72643, "epoch": 1729} {"train_loss": -6.035754680633545, "global_step": 72644, "epoch": 1729} {"train_loss": -5.999327659606934, "global_step": 72645, "epoch": 1729} {"train_loss": -5.932650089263916, "global_step": 72646, "epoch": 1729} {"train_loss": -5.973553657531738, "global_step": 72647, "epoch": 1729} {"train_loss": -5.999414443969727, "global_step": 72648, "epoch": 1729} {"train_loss": -6.03748893737793, "global_step": 72649, "epoch": 1729} {"train_loss": -6.083883762359619, "global_step": 72650, "epoch": 1729} {"train_loss": -5.993481159210205, "global_step": 72651, "epoch": 1729} {"train_loss": -6.115738868713379, "global_step": 72652, "epoch": 1729} {"train_loss": -6.019037246704102, "global_step": 72653, "epoch": 1729} {"train_loss": -5.951851844787598, "global_step": 72654, "epoch": 1729} {"train_loss": -6.01056432723999, "global_step": 72655, "epoch": 1729} {"train_loss": -5.981742858886719, "global_step": 72656, "epoch": 1729} {"train_loss": -6.031120300292969, "global_step": 72657, "epoch": 1729} {"train_loss": -5.95833683013916, "global_step": 72658, "epoch": 1729} {"train_loss": -6.018049206052508, "global_step": 72659, "epoch": 1729, "val_loss": 67254.90625} {"train_loss": -6.098911285400391, "global_step": 72660, "epoch": 1730} {"train_loss": -6.16445255279541, "global_step": 72661, "epoch": 1730} {"train_loss": -5.9642438888549805, "global_step": 72662, "epoch": 1730} {"train_loss": -6.024333953857422, "global_step": 72663, "epoch": 1730} {"train_loss": -5.979138374328613, "global_step": 72664, "epoch": 1730} {"train_loss": -6.097780227661133, "global_step": 72665, "epoch": 1730} {"train_loss": -5.999177932739258, "global_step": 72666, "epoch": 1730} {"train_loss": -6.095261573791504, "global_step": 72667, "epoch": 1730} {"train_loss": -6.064497947692871, "global_step": 72668, "epoch": 1730} {"train_loss": -5.988831520080566, "global_step": 72669, "epoch": 1730} {"train_loss": -6.147372722625732, "global_step": 72670, "epoch": 1730} {"train_loss": -6.019413471221924, "global_step": 72671, "epoch": 1730} {"train_loss": -6.080892562866211, "global_step": 72672, "epoch": 1730} {"train_loss": -6.058996200561523, "global_step": 72673, "epoch": 1730} {"train_loss": -6.009368896484375, "global_step": 72674, "epoch": 1730} {"train_loss": -5.99935245513916, "global_step": 72675, "epoch": 1730} {"train_loss": -6.108969688415527, "global_step": 72676, "epoch": 1730} {"train_loss": -6.0343523025512695, "global_step": 72677, "epoch": 1730} {"train_loss": -6.154611110687256, "global_step": 72678, "epoch": 1730} {"train_loss": -5.969637870788574, "global_step": 72679, "epoch": 1730} {"train_loss": -6.025861740112305, "global_step": 72680, "epoch": 1730} {"train_loss": -6.048069477081299, "global_step": 72681, "epoch": 1730} {"train_loss": -5.934967517852783, "global_step": 72682, "epoch": 1730} {"train_loss": -5.971552848815918, "global_step": 72683, "epoch": 1730} {"train_loss": -6.032650947570801, "global_step": 72684, "epoch": 1730} {"train_loss": -5.9220428466796875, "global_step": 72685, "epoch": 1730} {"train_loss": -6.213626861572266, "global_step": 72686, "epoch": 1730} {"train_loss": -6.007474422454834, "global_step": 72687, "epoch": 1730} {"train_loss": -5.996358871459961, "global_step": 72688, "epoch": 1730} {"train_loss": -6.011960029602051, "global_step": 72689, "epoch": 1730} {"train_loss": -6.044742584228516, "global_step": 72690, "epoch": 1730} {"train_loss": -6.137852668762207, "global_step": 72691, "epoch": 1730} {"train_loss": -6.169863700866699, "global_step": 72692, "epoch": 1730} {"train_loss": -5.90948486328125, "global_step": 72693, "epoch": 1730} {"train_loss": -6.1302995681762695, "global_step": 72694, "epoch": 1730} {"train_loss": -6.204864978790283, "global_step": 72695, "epoch": 1730} {"train_loss": -6.066525459289551, "global_step": 72696, "epoch": 1730} {"train_loss": -5.9823994636535645, "global_step": 72697, "epoch": 1730} {"train_loss": -5.978285789489746, "global_step": 72698, "epoch": 1730} {"train_loss": -5.954124927520752, "global_step": 72699, "epoch": 1730} {"train_loss": -6.018680572509766, "global_step": 72700, "epoch": 1730} {"train_loss": -6.044406993048532, "global_step": 72701, "epoch": 1730, "val_loss": 67478.5859375} {"train_loss": -6.117701530456543, "global_step": 72702, "epoch": 1731} {"train_loss": -6.080140113830566, "global_step": 72703, "epoch": 1731} {"train_loss": -6.107278823852539, "global_step": 72704, "epoch": 1731} {"train_loss": -6.0369977951049805, "global_step": 72705, "epoch": 1731} {"train_loss": -6.088592529296875, "global_step": 72706, "epoch": 1731} {"train_loss": -6.102750778198242, "global_step": 72707, "epoch": 1731} {"train_loss": -6.0194830894470215, "global_step": 72708, "epoch": 1731} {"train_loss": -6.174997329711914, "global_step": 72709, "epoch": 1731} {"train_loss": -6.126470565795898, "global_step": 72710, "epoch": 1731} {"train_loss": -6.140469551086426, "global_step": 72711, "epoch": 1731} {"train_loss": -5.982781410217285, "global_step": 72712, "epoch": 1731} {"train_loss": -6.007308006286621, "global_step": 72713, "epoch": 1731} {"train_loss": -6.130947113037109, "global_step": 72714, "epoch": 1731} {"train_loss": -5.9840850830078125, "global_step": 72715, "epoch": 1731} {"train_loss": -6.015984058380127, "global_step": 72716, "epoch": 1731} {"train_loss": -6.0354413986206055, "global_step": 72717, "epoch": 1731} {"train_loss": -6.078721046447754, "global_step": 72718, "epoch": 1731} {"train_loss": -6.116322040557861, "global_step": 72719, "epoch": 1731} {"train_loss": -6.040815353393555, "global_step": 72720, "epoch": 1731} {"train_loss": -6.046034812927246, "global_step": 72721, "epoch": 1731} {"train_loss": -6.096253871917725, "global_step": 72722, "epoch": 1731} {"train_loss": -6.059247970581055, "global_step": 72723, "epoch": 1731} {"train_loss": -6.195709228515625, "global_step": 72724, "epoch": 1731} {"train_loss": -6.026021957397461, "global_step": 72725, "epoch": 1731} {"train_loss": -6.073041915893555, "global_step": 72726, "epoch": 1731} {"train_loss": -6.123380661010742, "global_step": 72727, "epoch": 1731} {"train_loss": -6.008000373840332, "global_step": 72728, "epoch": 1731} {"train_loss": -6.093083381652832, "global_step": 72729, "epoch": 1731} {"train_loss": -6.064117431640625, "global_step": 72730, "epoch": 1731} {"train_loss": -6.010990142822266, "global_step": 72731, "epoch": 1731} {"train_loss": -6.030490875244141, "global_step": 72732, "epoch": 1731} {"train_loss": -6.066216468811035, "global_step": 72733, "epoch": 1731} {"train_loss": -6.073805809020996, "global_step": 72734, "epoch": 1731} {"train_loss": -6.076422691345215, "global_step": 72735, "epoch": 1731} {"train_loss": -6.053440093994141, "global_step": 72736, "epoch": 1731} {"train_loss": -6.107375144958496, "global_step": 72737, "epoch": 1731} {"train_loss": -5.9408860206604, "global_step": 72738, "epoch": 1731} {"train_loss": -6.017215728759766, "global_step": 72739, "epoch": 1731} {"train_loss": -5.9783477783203125, "global_step": 72740, "epoch": 1731} {"train_loss": -5.983529090881348, "global_step": 72741, "epoch": 1731} {"train_loss": -5.816795349121094, "global_step": 72742, "epoch": 1731} {"train_loss": -6.05416396686009, "global_step": 72743, "epoch": 1731, "val_loss": 67487.4609375} {"train_loss": -5.945152282714844, "global_step": 72744, "epoch": 1732} {"train_loss": -6.02785587310791, "global_step": 72745, "epoch": 1732} {"train_loss": -5.945062637329102, "global_step": 72746, "epoch": 1732} {"train_loss": -5.864294052124023, "global_step": 72747, "epoch": 1732} {"train_loss": -5.900118350982666, "global_step": 72748, "epoch": 1732} {"train_loss": -5.881837368011475, "global_step": 72749, "epoch": 1732} {"train_loss": -6.017171859741211, "global_step": 72750, "epoch": 1732} {"train_loss": -5.98150634765625, "global_step": 72751, "epoch": 1732} {"train_loss": -6.007715225219727, "global_step": 72752, "epoch": 1732} {"train_loss": -6.1272711753845215, "global_step": 72753, "epoch": 1732} {"train_loss": -5.927319049835205, "global_step": 72754, "epoch": 1732} {"train_loss": -5.981377601623535, "global_step": 72755, "epoch": 1732} {"train_loss": -6.011151313781738, "global_step": 72756, "epoch": 1732} {"train_loss": -6.046552658081055, "global_step": 72757, "epoch": 1732} {"train_loss": -6.044914245605469, "global_step": 72758, "epoch": 1732} {"train_loss": -6.088531494140625, "global_step": 72759, "epoch": 1732} {"train_loss": -6.0534210205078125, "global_step": 72760, "epoch": 1732} {"train_loss": -5.94287109375, "global_step": 72761, "epoch": 1732} {"train_loss": -6.035593032836914, "global_step": 72762, "epoch": 1732} {"train_loss": -6.000030040740967, "global_step": 72763, "epoch": 1732} {"train_loss": -6.025940895080566, "global_step": 72764, "epoch": 1732} {"train_loss": -6.1052751541137695, "global_step": 72765, "epoch": 1732} {"train_loss": -6.052542686462402, "global_step": 72766, "epoch": 1732} {"train_loss": -6.1331658363342285, "global_step": 72767, "epoch": 1732} {"train_loss": -6.061783313751221, "global_step": 72768, "epoch": 1732} {"train_loss": -6.032037734985352, "global_step": 72769, "epoch": 1732} {"train_loss": -6.1275224685668945, "global_step": 72770, "epoch": 1732} {"train_loss": -6.045547962188721, "global_step": 72771, "epoch": 1732} {"train_loss": -6.020608901977539, "global_step": 72772, "epoch": 1732} {"train_loss": -5.975430488586426, "global_step": 72773, "epoch": 1732} {"train_loss": -6.169138431549072, "global_step": 72774, "epoch": 1732} {"train_loss": -6.159221649169922, "global_step": 72775, "epoch": 1732} {"train_loss": -6.120443344116211, "global_step": 72776, "epoch": 1732} {"train_loss": -6.016462326049805, "global_step": 72777, "epoch": 1732} {"train_loss": -6.11966609954834, "global_step": 72778, "epoch": 1732} {"train_loss": -6.165031433105469, "global_step": 72779, "epoch": 1732} {"train_loss": -6.094208240509033, "global_step": 72780, "epoch": 1732} {"train_loss": -5.866349697113037, "global_step": 72781, "epoch": 1732} {"train_loss": -6.00396203994751, "global_step": 72782, "epoch": 1732} {"train_loss": -6.05544900894165, "global_step": 72783, "epoch": 1732} {"train_loss": -5.9526214599609375, "global_step": 72784, "epoch": 1732} {"train_loss": -6.030726955050514, "global_step": 72785, "epoch": 1732, "val_loss": 67464.6953125} {"train_loss": -5.891988754272461, "global_step": 72786, "epoch": 1733} {"train_loss": -6.035591125488281, "global_step": 72787, "epoch": 1733} {"train_loss": -5.956144332885742, "global_step": 72788, "epoch": 1733} {"train_loss": -6.001985549926758, "global_step": 72789, "epoch": 1733} {"train_loss": -6.027310371398926, "global_step": 72790, "epoch": 1733} {"train_loss": -6.055942535400391, "global_step": 72791, "epoch": 1733} {"train_loss": -6.063551902770996, "global_step": 72792, "epoch": 1733} {"train_loss": -6.236135482788086, "global_step": 72793, "epoch": 1733} {"train_loss": -6.006730079650879, "global_step": 72794, "epoch": 1733} {"train_loss": -6.02479887008667, "global_step": 72795, "epoch": 1733} {"train_loss": -6.0967278480529785, "global_step": 72796, "epoch": 1733} {"train_loss": -6.0111236572265625, "global_step": 72797, "epoch": 1733} {"train_loss": -5.788593769073486, "global_step": 72798, "epoch": 1733} {"train_loss": -5.910141468048096, "global_step": 72799, "epoch": 1733} {"train_loss": -6.035384178161621, "global_step": 72800, "epoch": 1733} {"train_loss": -6.005757808685303, "global_step": 72801, "epoch": 1733} {"train_loss": -5.98185920715332, "global_step": 72802, "epoch": 1733} {"train_loss": -6.053789138793945, "global_step": 72803, "epoch": 1733} {"train_loss": -6.099759101867676, "global_step": 72804, "epoch": 1733} {"train_loss": -6.076470375061035, "global_step": 72805, "epoch": 1733} {"train_loss": -5.994899272918701, "global_step": 72806, "epoch": 1733} {"train_loss": -6.106720447540283, "global_step": 72807, "epoch": 1733} {"train_loss": -6.009632110595703, "global_step": 72808, "epoch": 1733} {"train_loss": -6.141538619995117, "global_step": 72809, "epoch": 1733} {"train_loss": -6.100427627563477, "global_step": 72810, "epoch": 1733} {"train_loss": -6.013333797454834, "global_step": 72811, "epoch": 1733} {"train_loss": -6.097692012786865, "global_step": 72812, "epoch": 1733} {"train_loss": -5.996488571166992, "global_step": 72813, "epoch": 1733} {"train_loss": -6.032739162445068, "global_step": 72814, "epoch": 1733} {"train_loss": -6.203408718109131, "global_step": 72815, "epoch": 1733} {"train_loss": -5.786656379699707, "global_step": 72816, "epoch": 1733} {"train_loss": -5.97739315032959, "global_step": 72817, "epoch": 1733} {"train_loss": -6.090676784515381, "global_step": 72818, "epoch": 1733} {"train_loss": -5.9364013671875, "global_step": 72819, "epoch": 1733} {"train_loss": -6.052330017089844, "global_step": 72820, "epoch": 1733} {"train_loss": -6.022278785705566, "global_step": 72821, "epoch": 1733} {"train_loss": -5.973860740661621, "global_step": 72822, "epoch": 1733} {"train_loss": -6.095849990844727, "global_step": 72823, "epoch": 1733} {"train_loss": -5.968438148498535, "global_step": 72824, "epoch": 1733} {"train_loss": -6.126543998718262, "global_step": 72825, "epoch": 1733} {"train_loss": -6.0644145011901855, "global_step": 72826, "epoch": 1733} {"train_loss": -6.028190306254795, "global_step": 72827, "epoch": 1733, "val_loss": 67518.6484375} {"train_loss": -6.073916912078857, "global_step": 72828, "epoch": 1734} {"train_loss": -5.9784040451049805, "global_step": 72829, "epoch": 1734} {"train_loss": -6.017527103424072, "global_step": 72830, "epoch": 1734} {"train_loss": -6.058531761169434, "global_step": 72831, "epoch": 1734} {"train_loss": -6.092528343200684, "global_step": 72832, "epoch": 1734} {"train_loss": -6.181126594543457, "global_step": 72833, "epoch": 1734} {"train_loss": -6.051118850708008, "global_step": 72834, "epoch": 1734} {"train_loss": -6.144318580627441, "global_step": 72835, "epoch": 1734} {"train_loss": -6.044018268585205, "global_step": 72836, "epoch": 1734} {"train_loss": -6.02710485458374, "global_step": 72837, "epoch": 1734} {"train_loss": -5.983697891235352, "global_step": 72838, "epoch": 1734} {"train_loss": -5.992893695831299, "global_step": 72839, "epoch": 1734} {"train_loss": -6.121701717376709, "global_step": 72840, "epoch": 1734} {"train_loss": -5.886510848999023, "global_step": 72841, "epoch": 1734} {"train_loss": -6.019113540649414, "global_step": 72842, "epoch": 1734} {"train_loss": -6.069592475891113, "global_step": 72843, "epoch": 1734} {"train_loss": -6.077816963195801, "global_step": 72844, "epoch": 1734} {"train_loss": -5.885532379150391, "global_step": 72845, "epoch": 1734} {"train_loss": -6.140214920043945, "global_step": 72846, "epoch": 1734} {"train_loss": -5.942194938659668, "global_step": 72847, "epoch": 1734} {"train_loss": -6.0229034423828125, "global_step": 72848, "epoch": 1734} {"train_loss": -6.008959770202637, "global_step": 72849, "epoch": 1734} {"train_loss": -5.990530490875244, "global_step": 72850, "epoch": 1734} {"train_loss": -6.101715087890625, "global_step": 72851, "epoch": 1734} {"train_loss": -5.813786506652832, "global_step": 72852, "epoch": 1734} {"train_loss": -6.147636890411377, "global_step": 72853, "epoch": 1734} {"train_loss": -6.041433811187744, "global_step": 72854, "epoch": 1734} {"train_loss": -5.911947250366211, "global_step": 72855, "epoch": 1734} {"train_loss": -6.0099358558654785, "global_step": 72856, "epoch": 1734} {"train_loss": -5.925074577331543, "global_step": 72857, "epoch": 1734} {"train_loss": -5.937493324279785, "global_step": 72858, "epoch": 1734} {"train_loss": -5.955780506134033, "global_step": 72859, "epoch": 1734} {"train_loss": -6.041325569152832, "global_step": 72860, "epoch": 1734} {"train_loss": -6.131265163421631, "global_step": 72861, "epoch": 1734} {"train_loss": -5.862113952636719, "global_step": 72862, "epoch": 1734} {"train_loss": -5.988768577575684, "global_step": 72863, "epoch": 1734} {"train_loss": -6.00669002532959, "global_step": 72864, "epoch": 1734} {"train_loss": -6.090080261230469, "global_step": 72865, "epoch": 1734} {"train_loss": -5.921550273895264, "global_step": 72866, "epoch": 1734} {"train_loss": -6.028977394104004, "global_step": 72867, "epoch": 1734} {"train_loss": -6.095534801483154, "global_step": 72868, "epoch": 1734} {"train_loss": -6.020245949427287, "global_step": 72869, "epoch": 1734, "val_loss": 67391.078125} {"train_loss": -5.957204341888428, "global_step": 72870, "epoch": 1735} {"train_loss": -6.131543159484863, "global_step": 72871, "epoch": 1735} {"train_loss": -6.021670341491699, "global_step": 72872, "epoch": 1735} {"train_loss": -5.972771167755127, "global_step": 72873, "epoch": 1735} {"train_loss": -6.1485700607299805, "global_step": 72874, "epoch": 1735} {"train_loss": -6.0625786781311035, "global_step": 72875, "epoch": 1735} {"train_loss": -5.952096939086914, "global_step": 72876, "epoch": 1735} {"train_loss": -5.969075679779053, "global_step": 72877, "epoch": 1735} {"train_loss": -6.015207290649414, "global_step": 72878, "epoch": 1735} {"train_loss": -6.053501129150391, "global_step": 72879, "epoch": 1735} {"train_loss": -5.989595413208008, "global_step": 72880, "epoch": 1735} {"train_loss": -6.095231533050537, "global_step": 72881, "epoch": 1735} {"train_loss": -6.157562255859375, "global_step": 72882, "epoch": 1735} {"train_loss": -6.017482757568359, "global_step": 72883, "epoch": 1735} {"train_loss": -6.088825225830078, "global_step": 72884, "epoch": 1735} {"train_loss": -6.180270671844482, "global_step": 72885, "epoch": 1735} {"train_loss": -5.9978132247924805, "global_step": 72886, "epoch": 1735} {"train_loss": -6.082611083984375, "global_step": 72887, "epoch": 1735} {"train_loss": -6.034001350402832, "global_step": 72888, "epoch": 1735} {"train_loss": -6.112360954284668, "global_step": 72889, "epoch": 1735} {"train_loss": -6.090904712677002, "global_step": 72890, "epoch": 1735} {"train_loss": -5.93841552734375, "global_step": 72891, "epoch": 1735} {"train_loss": -6.072225570678711, "global_step": 72892, "epoch": 1735} {"train_loss": -6.002380847930908, "global_step": 72893, "epoch": 1735} {"train_loss": -6.015056610107422, "global_step": 72894, "epoch": 1735} {"train_loss": -5.99591064453125, "global_step": 72895, "epoch": 1735} {"train_loss": -5.948524475097656, "global_step": 72896, "epoch": 1735} {"train_loss": -5.92321252822876, "global_step": 72897, "epoch": 1735} {"train_loss": -5.890236854553223, "global_step": 72898, "epoch": 1735} {"train_loss": -6.035251617431641, "global_step": 72899, "epoch": 1735} {"train_loss": -5.95304012298584, "global_step": 72900, "epoch": 1735} {"train_loss": -5.964960098266602, "global_step": 72901, "epoch": 1735} {"train_loss": -6.045961380004883, "global_step": 72902, "epoch": 1735} {"train_loss": -6.035178184509277, "global_step": 72903, "epoch": 1735} {"train_loss": -5.953682899475098, "global_step": 72904, "epoch": 1735} {"train_loss": -6.054050445556641, "global_step": 72905, "epoch": 1735} {"train_loss": -6.065278053283691, "global_step": 72906, "epoch": 1735} {"train_loss": -6.070926666259766, "global_step": 72907, "epoch": 1735} {"train_loss": -5.93300724029541, "global_step": 72908, "epoch": 1735} {"train_loss": -6.024026393890381, "global_step": 72909, "epoch": 1735} {"train_loss": -6.098664283752441, "global_step": 72910, "epoch": 1735} {"train_loss": -6.024109091077532, "global_step": 72911, "epoch": 1735, "val_loss": 67286.140625} {"train_loss": -6.04514217376709, "global_step": 72912, "epoch": 1736} {"train_loss": -5.982096195220947, "global_step": 72913, "epoch": 1736} {"train_loss": -6.079559326171875, "global_step": 72914, "epoch": 1736} {"train_loss": -5.990668296813965, "global_step": 72915, "epoch": 1736} {"train_loss": -5.972459316253662, "global_step": 72916, "epoch": 1736} {"train_loss": -6.086693286895752, "global_step": 72917, "epoch": 1736} {"train_loss": -5.985087871551514, "global_step": 72918, "epoch": 1736} {"train_loss": -6.060955047607422, "global_step": 72919, "epoch": 1736} {"train_loss": -6.069450855255127, "global_step": 72920, "epoch": 1736} {"train_loss": -5.962480545043945, "global_step": 72921, "epoch": 1736} {"train_loss": -6.033182144165039, "global_step": 72922, "epoch": 1736} {"train_loss": -6.041264533996582, "global_step": 72923, "epoch": 1736} {"train_loss": -6.084021091461182, "global_step": 72924, "epoch": 1736} {"train_loss": -6.174167156219482, "global_step": 72925, "epoch": 1736} {"train_loss": -6.077487945556641, "global_step": 72926, "epoch": 1736} {"train_loss": -6.053083896636963, "global_step": 72927, "epoch": 1736} {"train_loss": -6.075772762298584, "global_step": 72928, "epoch": 1736} {"train_loss": -6.04816198348999, "global_step": 72929, "epoch": 1736} {"train_loss": -5.999932289123535, "global_step": 72930, "epoch": 1736} {"train_loss": -6.046721458435059, "global_step": 72931, "epoch": 1736} {"train_loss": -5.919384002685547, "global_step": 72932, "epoch": 1736} {"train_loss": -6.033041477203369, "global_step": 72933, "epoch": 1736} {"train_loss": -6.069665908813477, "global_step": 72934, "epoch": 1736} {"train_loss": -6.1150383949279785, "global_step": 72935, "epoch": 1736} {"train_loss": -6.174184799194336, "global_step": 72936, "epoch": 1736} {"train_loss": -6.103476047515869, "global_step": 72937, "epoch": 1736} {"train_loss": -5.982555389404297, "global_step": 72938, "epoch": 1736} {"train_loss": -6.032131195068359, "global_step": 72939, "epoch": 1736} {"train_loss": -6.0525712966918945, "global_step": 72940, "epoch": 1736} {"train_loss": -6.069565773010254, "global_step": 72941, "epoch": 1736} {"train_loss": -6.065112113952637, "global_step": 72942, "epoch": 1736} {"train_loss": -6.128889083862305, "global_step": 72943, "epoch": 1736} {"train_loss": -6.097577095031738, "global_step": 72944, "epoch": 1736} {"train_loss": -6.045684814453125, "global_step": 72945, "epoch": 1736} {"train_loss": -6.039880752563477, "global_step": 72946, "epoch": 1736} {"train_loss": -6.065103530883789, "global_step": 72947, "epoch": 1736} {"train_loss": -6.003423690795898, "global_step": 72948, "epoch": 1736} {"train_loss": -6.077149868011475, "global_step": 72949, "epoch": 1736} {"train_loss": -6.065121650695801, "global_step": 72950, "epoch": 1736} {"train_loss": -6.144994735717773, "global_step": 72951, "epoch": 1736} {"train_loss": -6.006755828857422, "global_step": 72952, "epoch": 1736} {"train_loss": -6.051087141036987, "global_step": 72953, "epoch": 1736, "val_loss": 67511.625} {"train_loss": -6.071183204650879, "global_step": 72954, "epoch": 1737} {"train_loss": -6.103097438812256, "global_step": 72955, "epoch": 1737} {"train_loss": -6.0743327140808105, "global_step": 72956, "epoch": 1737} {"train_loss": -6.0382184982299805, "global_step": 72957, "epoch": 1737} {"train_loss": -6.081780433654785, "global_step": 72958, "epoch": 1737} {"train_loss": -5.974771499633789, "global_step": 72959, "epoch": 1737} {"train_loss": -5.889936447143555, "global_step": 72960, "epoch": 1737} {"train_loss": -6.122159957885742, "global_step": 72961, "epoch": 1737} {"train_loss": -6.127053260803223, "global_step": 72962, "epoch": 1737} {"train_loss": -5.785046577453613, "global_step": 72963, "epoch": 1737} {"train_loss": -6.039561748504639, "global_step": 72964, "epoch": 1737} {"train_loss": -5.9775567054748535, "global_step": 72965, "epoch": 1737} {"train_loss": -5.924118995666504, "global_step": 72966, "epoch": 1737} {"train_loss": -5.984295845031738, "global_step": 72967, "epoch": 1737} {"train_loss": -6.1108574867248535, "global_step": 72968, "epoch": 1737} {"train_loss": -6.056817054748535, "global_step": 72969, "epoch": 1737} {"train_loss": -6.109267234802246, "global_step": 72970, "epoch": 1737} {"train_loss": -5.93052864074707, "global_step": 72971, "epoch": 1737} {"train_loss": -6.00637149810791, "global_step": 72972, "epoch": 1737} {"train_loss": -5.949786186218262, "global_step": 72973, "epoch": 1737} {"train_loss": -5.969078063964844, "global_step": 72974, "epoch": 1737} {"train_loss": -6.082262992858887, "global_step": 72975, "epoch": 1737} {"train_loss": -5.930379390716553, "global_step": 72976, "epoch": 1737} {"train_loss": -6.12642765045166, "global_step": 72977, "epoch": 1737} {"train_loss": -6.011091709136963, "global_step": 72978, "epoch": 1737} {"train_loss": -6.134332656860352, "global_step": 72979, "epoch": 1737} {"train_loss": -6.05760383605957, "global_step": 72980, "epoch": 1737} {"train_loss": -6.040460586547852, "global_step": 72981, "epoch": 1737} {"train_loss": -6.027713298797607, "global_step": 72982, "epoch": 1737} {"train_loss": -6.163562774658203, "global_step": 72983, "epoch": 1737} {"train_loss": -6.100781440734863, "global_step": 72984, "epoch": 1737} {"train_loss": -6.025059700012207, "global_step": 72985, "epoch": 1737} {"train_loss": -6.042542457580566, "global_step": 72986, "epoch": 1737} {"train_loss": -6.002026557922363, "global_step": 72987, "epoch": 1737} {"train_loss": -6.074575901031494, "global_step": 72988, "epoch": 1737} {"train_loss": -5.968093395233154, "global_step": 72989, "epoch": 1737} {"train_loss": -6.123910903930664, "global_step": 72990, "epoch": 1737} {"train_loss": -6.056719779968262, "global_step": 72991, "epoch": 1737} {"train_loss": -6.184903144836426, "global_step": 72992, "epoch": 1737} {"train_loss": -6.089768886566162, "global_step": 72993, "epoch": 1737} {"train_loss": -6.162903785705566, "global_step": 72994, "epoch": 1737} {"train_loss": -6.0392368748074485, "global_step": 72995, "epoch": 1737, "val_loss": 67279.1953125} {"train_loss": -6.093588829040527, "global_step": 72996, "epoch": 1738} {"train_loss": -6.073943138122559, "global_step": 72997, "epoch": 1738} {"train_loss": -6.175168991088867, "global_step": 72998, "epoch": 1738} {"train_loss": -6.014869213104248, "global_step": 72999, "epoch": 1738} {"train_loss": -5.929006576538086, "global_step": 73000, "epoch": 1738} {"train_loss": -6.002313137054443, "global_step": 73001, "epoch": 1738} {"train_loss": -6.056055068969727, "global_step": 73002, "epoch": 1738} {"train_loss": -6.076465606689453, "global_step": 73003, "epoch": 1738} {"train_loss": -6.0414581298828125, "global_step": 73004, "epoch": 1738} {"train_loss": -6.103782653808594, "global_step": 73005, "epoch": 1738} {"train_loss": -5.995823860168457, "global_step": 73006, "epoch": 1738} {"train_loss": -6.078857421875, "global_step": 73007, "epoch": 1738} {"train_loss": -6.103924751281738, "global_step": 73008, "epoch": 1738} {"train_loss": -6.0426130294799805, "global_step": 73009, "epoch": 1738} {"train_loss": -6.09281063079834, "global_step": 73010, "epoch": 1738} {"train_loss": -6.071978569030762, "global_step": 73011, "epoch": 1738} {"train_loss": -6.109943389892578, "global_step": 73012, "epoch": 1738} {"train_loss": -6.095600605010986, "global_step": 73013, "epoch": 1738} {"train_loss": -5.939244270324707, "global_step": 73014, "epoch": 1738} {"train_loss": -5.903944969177246, "global_step": 73015, "epoch": 1738} {"train_loss": -5.938178062438965, "global_step": 73016, "epoch": 1738} {"train_loss": -5.971022605895996, "global_step": 73017, "epoch": 1738} {"train_loss": -6.006313323974609, "global_step": 73018, "epoch": 1738} {"train_loss": -6.036139488220215, "global_step": 73019, "epoch": 1738} {"train_loss": -6.038876533508301, "global_step": 73020, "epoch": 1738} {"train_loss": -6.113406181335449, "global_step": 73021, "epoch": 1738} {"train_loss": -5.918081283569336, "global_step": 73022, "epoch": 1738} {"train_loss": -6.102278709411621, "global_step": 73023, "epoch": 1738} {"train_loss": -5.994132995605469, "global_step": 73024, "epoch": 1738} {"train_loss": -6.008922100067139, "global_step": 73025, "epoch": 1738} {"train_loss": -6.124757289886475, "global_step": 73026, "epoch": 1738} {"train_loss": -6.15990686416626, "global_step": 73027, "epoch": 1738} {"train_loss": -6.131994724273682, "global_step": 73028, "epoch": 1738} {"train_loss": -6.027437686920166, "global_step": 73029, "epoch": 1738} {"train_loss": -6.124035358428955, "global_step": 73030, "epoch": 1738} {"train_loss": -6.024243354797363, "global_step": 73031, "epoch": 1738} {"train_loss": -6.038342475891113, "global_step": 73032, "epoch": 1738} {"train_loss": -5.9810895919799805, "global_step": 73033, "epoch": 1738} {"train_loss": -6.182669639587402, "global_step": 73034, "epoch": 1738} {"train_loss": -5.98321533203125, "global_step": 73035, "epoch": 1738} {"train_loss": -6.138164520263672, "global_step": 73036, "epoch": 1738} {"train_loss": -6.051952884310768, "global_step": 73037, "epoch": 1738, "val_loss": 67436.96875} {"train_loss": -6.0543365478515625, "global_step": 73038, "epoch": 1739} {"train_loss": -6.0538177490234375, "global_step": 73039, "epoch": 1739} {"train_loss": -6.079867362976074, "global_step": 73040, "epoch": 1739} {"train_loss": -6.0419697761535645, "global_step": 73041, "epoch": 1739} {"train_loss": -5.957124710083008, "global_step": 73042, "epoch": 1739} {"train_loss": -6.05078125, "global_step": 73043, "epoch": 1739} {"train_loss": -6.129065036773682, "global_step": 73044, "epoch": 1739} {"train_loss": -6.0884785652160645, "global_step": 73045, "epoch": 1739} {"train_loss": -5.957342624664307, "global_step": 73046, "epoch": 1739} {"train_loss": -6.057554721832275, "global_step": 73047, "epoch": 1739} {"train_loss": -6.0514936447143555, "global_step": 73048, "epoch": 1739} {"train_loss": -6.033148765563965, "global_step": 73049, "epoch": 1739} {"train_loss": -6.068624973297119, "global_step": 73050, "epoch": 1739} {"train_loss": -6.016759395599365, "global_step": 73051, "epoch": 1739} {"train_loss": -5.947569847106934, "global_step": 73052, "epoch": 1739} {"train_loss": -6.04344367980957, "global_step": 73053, "epoch": 1739} {"train_loss": -5.924297332763672, "global_step": 73054, "epoch": 1739} {"train_loss": -6.080063819885254, "global_step": 73055, "epoch": 1739} {"train_loss": -6.094573974609375, "global_step": 73056, "epoch": 1739} {"train_loss": -5.941364288330078, "global_step": 73057, "epoch": 1739} {"train_loss": -6.096508502960205, "global_step": 73058, "epoch": 1739} {"train_loss": -6.0979461669921875, "global_step": 73059, "epoch": 1739} {"train_loss": -6.0675249099731445, "global_step": 73060, "epoch": 1739} {"train_loss": -6.010099411010742, "global_step": 73061, "epoch": 1739} {"train_loss": -6.157303810119629, "global_step": 73062, "epoch": 1739} {"train_loss": -6.161283493041992, "global_step": 73063, "epoch": 1739} {"train_loss": -6.0014753341674805, "global_step": 73064, "epoch": 1739} {"train_loss": -6.138973236083984, "global_step": 73065, "epoch": 1739} {"train_loss": -6.008505821228027, "global_step": 73066, "epoch": 1739} {"train_loss": -6.02375602722168, "global_step": 73067, "epoch": 1739} {"train_loss": -6.121964454650879, "global_step": 73068, "epoch": 1739} {"train_loss": -6.020343780517578, "global_step": 73069, "epoch": 1739} {"train_loss": -6.069835186004639, "global_step": 73070, "epoch": 1739} {"train_loss": -6.15614128112793, "global_step": 73071, "epoch": 1739} {"train_loss": -6.215764999389648, "global_step": 73072, "epoch": 1739} {"train_loss": -6.025515556335449, "global_step": 73073, "epoch": 1739} {"train_loss": -6.041046142578125, "global_step": 73074, "epoch": 1739} {"train_loss": -6.163475513458252, "global_step": 73075, "epoch": 1739} {"train_loss": -6.008478164672852, "global_step": 73076, "epoch": 1739} {"train_loss": -6.088918685913086, "global_step": 73077, "epoch": 1739} {"train_loss": -6.137045383453369, "global_step": 73078, "epoch": 1739} {"train_loss": -6.064532575153169, "global_step": 73079, "epoch": 1739, "val_loss": 67507.8515625} {"train_loss": -6.151340484619141, "global_step": 73080, "epoch": 1740} {"train_loss": -6.027163505554199, "global_step": 73081, "epoch": 1740} {"train_loss": -6.093104362487793, "global_step": 73082, "epoch": 1740} {"train_loss": -6.037578582763672, "global_step": 73083, "epoch": 1740} {"train_loss": -6.102410793304443, "global_step": 73084, "epoch": 1740} {"train_loss": -5.997242450714111, "global_step": 73085, "epoch": 1740} {"train_loss": -6.022402763366699, "global_step": 73086, "epoch": 1740} {"train_loss": -6.102715492248535, "global_step": 73087, "epoch": 1740} {"train_loss": -6.055633544921875, "global_step": 73088, "epoch": 1740} {"train_loss": -6.06825065612793, "global_step": 73089, "epoch": 1740} {"train_loss": -6.1434855461120605, "global_step": 73090, "epoch": 1740} {"train_loss": -6.051517486572266, "global_step": 73091, "epoch": 1740} {"train_loss": -6.055943489074707, "global_step": 73092, "epoch": 1740} {"train_loss": -5.968930244445801, "global_step": 73093, "epoch": 1740} {"train_loss": -6.001245498657227, "global_step": 73094, "epoch": 1740} {"train_loss": -5.976949691772461, "global_step": 73095, "epoch": 1740} {"train_loss": -6.039361000061035, "global_step": 73096, "epoch": 1740} {"train_loss": -5.982282638549805, "global_step": 73097, "epoch": 1740} {"train_loss": -6.161569595336914, "global_step": 73098, "epoch": 1740} {"train_loss": -5.911370277404785, "global_step": 73099, "epoch": 1740} {"train_loss": -5.967845916748047, "global_step": 73100, "epoch": 1740} {"train_loss": -6.09999942779541, "global_step": 73101, "epoch": 1740} {"train_loss": -5.976805686950684, "global_step": 73102, "epoch": 1740} {"train_loss": -6.087104797363281, "global_step": 73103, "epoch": 1740} {"train_loss": -6.032262802124023, "global_step": 73104, "epoch": 1740} {"train_loss": -6.097942352294922, "global_step": 73105, "epoch": 1740} {"train_loss": -5.992574691772461, "global_step": 73106, "epoch": 1740} {"train_loss": -6.042335510253906, "global_step": 73107, "epoch": 1740} {"train_loss": -6.130753040313721, "global_step": 73108, "epoch": 1740} {"train_loss": -6.055110931396484, "global_step": 73109, "epoch": 1740} {"train_loss": -6.038671493530273, "global_step": 73110, "epoch": 1740} {"train_loss": -6.125914096832275, "global_step": 73111, "epoch": 1740} {"train_loss": -5.965777397155762, "global_step": 73112, "epoch": 1740} {"train_loss": -6.064676284790039, "global_step": 73113, "epoch": 1740} {"train_loss": -5.995242118835449, "global_step": 73114, "epoch": 1740} {"train_loss": -5.940519332885742, "global_step": 73115, "epoch": 1740} {"train_loss": -6.07269287109375, "global_step": 73116, "epoch": 1740} {"train_loss": -6.030326843261719, "global_step": 73117, "epoch": 1740} {"train_loss": -5.952329635620117, "global_step": 73118, "epoch": 1740} {"train_loss": -6.055892467498779, "global_step": 73119, "epoch": 1740} {"train_loss": -6.049298286437988, "global_step": 73120, "epoch": 1740} {"train_loss": -6.04398725146339, "global_step": 73121, "epoch": 1740, "val_loss": 67630.1015625} {"train_loss": -6.007133483886719, "global_step": 73122, "epoch": 1741} {"train_loss": -6.086679458618164, "global_step": 73123, "epoch": 1741} {"train_loss": -5.978082656860352, "global_step": 73124, "epoch": 1741} {"train_loss": -5.926817893981934, "global_step": 73125, "epoch": 1741} {"train_loss": -6.0772552490234375, "global_step": 73126, "epoch": 1741} {"train_loss": -5.960906028747559, "global_step": 73127, "epoch": 1741} {"train_loss": -6.070879936218262, "global_step": 73128, "epoch": 1741} {"train_loss": -6.001934051513672, "global_step": 73129, "epoch": 1741} {"train_loss": -5.998417377471924, "global_step": 73130, "epoch": 1741} {"train_loss": -6.030496597290039, "global_step": 73131, "epoch": 1741} {"train_loss": -5.975841522216797, "global_step": 73132, "epoch": 1741} {"train_loss": -6.13179874420166, "global_step": 73133, "epoch": 1741} {"train_loss": -6.083367347717285, "global_step": 73134, "epoch": 1741} {"train_loss": -6.0545549392700195, "global_step": 73135, "epoch": 1741} {"train_loss": -6.056004524230957, "global_step": 73136, "epoch": 1741} {"train_loss": -5.998147964477539, "global_step": 73137, "epoch": 1741} {"train_loss": -6.066810607910156, "global_step": 73138, "epoch": 1741} {"train_loss": -6.184616565704346, "global_step": 73139, "epoch": 1741} {"train_loss": -5.929657936096191, "global_step": 73140, "epoch": 1741} {"train_loss": -6.1330885887146, "global_step": 73141, "epoch": 1741} {"train_loss": -6.053487777709961, "global_step": 73142, "epoch": 1741} {"train_loss": -5.972535133361816, "global_step": 73143, "epoch": 1741} {"train_loss": -6.0509772300720215, "global_step": 73144, "epoch": 1741} {"train_loss": -6.042672634124756, "global_step": 73145, "epoch": 1741} {"train_loss": -6.0222063064575195, "global_step": 73146, "epoch": 1741} {"train_loss": -6.050145149230957, "global_step": 73147, "epoch": 1741} {"train_loss": -6.010713577270508, "global_step": 73148, "epoch": 1741} {"train_loss": -6.078156471252441, "global_step": 73149, "epoch": 1741} {"train_loss": -6.103318214416504, "global_step": 73150, "epoch": 1741} {"train_loss": -6.058172225952148, "global_step": 73151, "epoch": 1741} {"train_loss": -6.085513114929199, "global_step": 73152, "epoch": 1741} {"train_loss": -6.05999231338501, "global_step": 73153, "epoch": 1741} {"train_loss": -6.059390544891357, "global_step": 73154, "epoch": 1741} {"train_loss": -6.060298919677734, "global_step": 73155, "epoch": 1741} {"train_loss": -6.141630172729492, "global_step": 73156, "epoch": 1741} {"train_loss": -6.02877140045166, "global_step": 73157, "epoch": 1741} {"train_loss": -5.9429473876953125, "global_step": 73158, "epoch": 1741} {"train_loss": -6.181324005126953, "global_step": 73159, "epoch": 1741} {"train_loss": -6.049642562866211, "global_step": 73160, "epoch": 1741} {"train_loss": -6.0777692794799805, "global_step": 73161, "epoch": 1741} {"train_loss": -6.072265625, "global_step": 73162, "epoch": 1741} {"train_loss": -6.048975876399449, "global_step": 73163, "epoch": 1741, "val_loss": 67757.984375} {"train_loss": -6.0439605712890625, "global_step": 73164, "epoch": 1742} {"train_loss": -6.046459197998047, "global_step": 73165, "epoch": 1742} {"train_loss": -6.092282295227051, "global_step": 73166, "epoch": 1742} {"train_loss": -6.011653900146484, "global_step": 73167, "epoch": 1742} {"train_loss": -5.98837947845459, "global_step": 73168, "epoch": 1742} {"train_loss": -5.924173831939697, "global_step": 73169, "epoch": 1742} {"train_loss": -5.996610164642334, "global_step": 73170, "epoch": 1742} {"train_loss": -5.986761093139648, "global_step": 73171, "epoch": 1742} {"train_loss": -5.906426429748535, "global_step": 73172, "epoch": 1742} {"train_loss": -6.121456623077393, "global_step": 73173, "epoch": 1742} {"train_loss": -6.014097690582275, "global_step": 73174, "epoch": 1742} {"train_loss": -6.083683967590332, "global_step": 73175, "epoch": 1742} {"train_loss": -6.037957191467285, "global_step": 73176, "epoch": 1742} {"train_loss": -5.94110631942749, "global_step": 73177, "epoch": 1742} {"train_loss": -6.1003217697143555, "global_step": 73178, "epoch": 1742} {"train_loss": -5.8920698165893555, "global_step": 73179, "epoch": 1742} {"train_loss": -5.979414463043213, "global_step": 73180, "epoch": 1742} {"train_loss": -5.949387550354004, "global_step": 73181, "epoch": 1742} {"train_loss": -6.021336078643799, "global_step": 73182, "epoch": 1742} {"train_loss": -5.990452766418457, "global_step": 73183, "epoch": 1742} {"train_loss": -5.985461235046387, "global_step": 73184, "epoch": 1742} {"train_loss": -5.998588562011719, "global_step": 73185, "epoch": 1742} {"train_loss": -5.9752726554870605, "global_step": 73186, "epoch": 1742} {"train_loss": -5.985552787780762, "global_step": 73187, "epoch": 1742} {"train_loss": -6.026947021484375, "global_step": 73188, "epoch": 1742} {"train_loss": -6.0002946853637695, "global_step": 73189, "epoch": 1742} {"train_loss": -5.956311225891113, "global_step": 73190, "epoch": 1742} {"train_loss": -6.014959812164307, "global_step": 73191, "epoch": 1742} {"train_loss": -6.073544502258301, "global_step": 73192, "epoch": 1742} {"train_loss": -6.093505382537842, "global_step": 73193, "epoch": 1742} {"train_loss": -6.0625410079956055, "global_step": 73194, "epoch": 1742} {"train_loss": -6.052689552307129, "global_step": 73195, "epoch": 1742} {"train_loss": -5.9483962059021, "global_step": 73196, "epoch": 1742} {"train_loss": -6.046052932739258, "global_step": 73197, "epoch": 1742} {"train_loss": -5.921866416931152, "global_step": 73198, "epoch": 1742} {"train_loss": -6.009512901306152, "global_step": 73199, "epoch": 1742} {"train_loss": -6.00669527053833, "global_step": 73200, "epoch": 1742} {"train_loss": -6.084411144256592, "global_step": 73201, "epoch": 1742} {"train_loss": -6.097496032714844, "global_step": 73202, "epoch": 1742} {"train_loss": -6.047015190124512, "global_step": 73203, "epoch": 1742} {"train_loss": -6.065268039703369, "global_step": 73204, "epoch": 1742} {"train_loss": -6.0159847509293325, "global_step": 73205, "epoch": 1742, "val_loss": 67652.1484375} {"train_loss": -6.039768218994141, "global_step": 73206, "epoch": 1743} {"train_loss": -6.036898136138916, "global_step": 73207, "epoch": 1743} {"train_loss": -6.063759803771973, "global_step": 73208, "epoch": 1743} {"train_loss": -5.974865913391113, "global_step": 73209, "epoch": 1743} {"train_loss": -5.976317405700684, "global_step": 73210, "epoch": 1743} {"train_loss": -5.9294281005859375, "global_step": 73211, "epoch": 1743} {"train_loss": -6.098848342895508, "global_step": 73212, "epoch": 1743} {"train_loss": -6.0439677238464355, "global_step": 73213, "epoch": 1743} {"train_loss": -6.119544982910156, "global_step": 73214, "epoch": 1743} {"train_loss": -5.997325897216797, "global_step": 73215, "epoch": 1743} {"train_loss": -6.087608814239502, "global_step": 73216, "epoch": 1743} {"train_loss": -5.9955620765686035, "global_step": 73217, "epoch": 1743} {"train_loss": -6.110148906707764, "global_step": 73218, "epoch": 1743} {"train_loss": -6.019461631774902, "global_step": 73219, "epoch": 1743} {"train_loss": -6.017175674438477, "global_step": 73220, "epoch": 1743} {"train_loss": -6.040414810180664, "global_step": 73221, "epoch": 1743} {"train_loss": -6.030941009521484, "global_step": 73222, "epoch": 1743} {"train_loss": -5.974611282348633, "global_step": 73223, "epoch": 1743} {"train_loss": -5.829854965209961, "global_step": 73224, "epoch": 1743} {"train_loss": -6.0696916580200195, "global_step": 73225, "epoch": 1743} {"train_loss": -6.09463357925415, "global_step": 73226, "epoch": 1743} {"train_loss": -6.062875747680664, "global_step": 73227, "epoch": 1743} {"train_loss": -6.162899017333984, "global_step": 73228, "epoch": 1743} {"train_loss": -6.080687046051025, "global_step": 73229, "epoch": 1743} {"train_loss": -6.078542709350586, "global_step": 73230, "epoch": 1743} {"train_loss": -6.090312480926514, "global_step": 73231, "epoch": 1743} {"train_loss": -6.040299415588379, "global_step": 73232, "epoch": 1743} {"train_loss": -6.00698709487915, "global_step": 73233, "epoch": 1743} {"train_loss": -6.033740997314453, "global_step": 73234, "epoch": 1743} {"train_loss": -6.011258125305176, "global_step": 73235, "epoch": 1743} {"train_loss": -5.951035499572754, "global_step": 73236, "epoch": 1743} {"train_loss": -6.010402202606201, "global_step": 73237, "epoch": 1743} {"train_loss": -5.960588455200195, "global_step": 73238, "epoch": 1743} {"train_loss": -6.035525321960449, "global_step": 73239, "epoch": 1743} {"train_loss": -6.022278308868408, "global_step": 73240, "epoch": 1743} {"train_loss": -6.074096202850342, "global_step": 73241, "epoch": 1743} {"train_loss": -5.975591659545898, "global_step": 73242, "epoch": 1743} {"train_loss": -5.972858428955078, "global_step": 73243, "epoch": 1743} {"train_loss": -5.898298263549805, "global_step": 73244, "epoch": 1743} {"train_loss": -6.031365394592285, "global_step": 73245, "epoch": 1743} {"train_loss": -5.989363670349121, "global_step": 73246, "epoch": 1743} {"train_loss": -6.025448413122268, "global_step": 73247, "epoch": 1743, "val_loss": 67356.84375} {"train_loss": -5.958372116088867, "global_step": 73248, "epoch": 1744} {"train_loss": -6.051109313964844, "global_step": 73249, "epoch": 1744} {"train_loss": -6.038649559020996, "global_step": 73250, "epoch": 1744} {"train_loss": -6.0723981857299805, "global_step": 73251, "epoch": 1744} {"train_loss": -6.049036026000977, "global_step": 73252, "epoch": 1744} {"train_loss": -6.060512542724609, "global_step": 73253, "epoch": 1744} {"train_loss": -6.013379096984863, "global_step": 73254, "epoch": 1744} {"train_loss": -6.081589698791504, "global_step": 73255, "epoch": 1744} {"train_loss": -6.0508012771606445, "global_step": 73256, "epoch": 1744} {"train_loss": -6.05064058303833, "global_step": 73257, "epoch": 1744} {"train_loss": -6.108565330505371, "global_step": 73258, "epoch": 1744} {"train_loss": -6.107102394104004, "global_step": 73259, "epoch": 1744} {"train_loss": -6.057946681976318, "global_step": 73260, "epoch": 1744} {"train_loss": -5.9481940269470215, "global_step": 73261, "epoch": 1744} {"train_loss": -6.071617603302002, "global_step": 73262, "epoch": 1744} {"train_loss": -6.070673942565918, "global_step": 73263, "epoch": 1744} {"train_loss": -6.172267436981201, "global_step": 73264, "epoch": 1744} {"train_loss": -6.174114227294922, "global_step": 73265, "epoch": 1744} {"train_loss": -6.039093017578125, "global_step": 73266, "epoch": 1744} {"train_loss": -6.1428656578063965, "global_step": 73267, "epoch": 1744} {"train_loss": -6.0089240074157715, "global_step": 73268, "epoch": 1744} {"train_loss": -6.0781965255737305, "global_step": 73269, "epoch": 1744} {"train_loss": -6.080987453460693, "global_step": 73270, "epoch": 1744} {"train_loss": -6.004907131195068, "global_step": 73271, "epoch": 1744} {"train_loss": -6.068968772888184, "global_step": 73272, "epoch": 1744} {"train_loss": -6.093952655792236, "global_step": 73273, "epoch": 1744} {"train_loss": -5.895142555236816, "global_step": 73274, "epoch": 1744} {"train_loss": -6.004695892333984, "global_step": 73275, "epoch": 1744} {"train_loss": -6.023073196411133, "global_step": 73276, "epoch": 1744} {"train_loss": -6.037093162536621, "global_step": 73277, "epoch": 1744} {"train_loss": -6.091745376586914, "global_step": 73278, "epoch": 1744} {"train_loss": -6.07327127456665, "global_step": 73279, "epoch": 1744} {"train_loss": -6.147374153137207, "global_step": 73280, "epoch": 1744} {"train_loss": -6.157028675079346, "global_step": 73281, "epoch": 1744} {"train_loss": -6.127777576446533, "global_step": 73282, "epoch": 1744} {"train_loss": -5.948184013366699, "global_step": 73283, "epoch": 1744} {"train_loss": -6.084288120269775, "global_step": 73284, "epoch": 1744} {"train_loss": -5.974287986755371, "global_step": 73285, "epoch": 1744} {"train_loss": -5.922850608825684, "global_step": 73286, "epoch": 1744} {"train_loss": -5.947287082672119, "global_step": 73287, "epoch": 1744} {"train_loss": -6.009338855743408, "global_step": 73288, "epoch": 1744} {"train_loss": -6.05160269283113, "global_step": 73289, "epoch": 1744, "val_loss": 67408.7109375} {"train_loss": -5.902205944061279, "global_step": 73290, "epoch": 1745} {"train_loss": -6.004255771636963, "global_step": 73291, "epoch": 1745} {"train_loss": -6.100595474243164, "global_step": 73292, "epoch": 1745} {"train_loss": -6.06113338470459, "global_step": 73293, "epoch": 1745} {"train_loss": -5.963612079620361, "global_step": 73294, "epoch": 1745} {"train_loss": -6.040898323059082, "global_step": 73295, "epoch": 1745} {"train_loss": -5.965858459472656, "global_step": 73296, "epoch": 1745} {"train_loss": -5.901127815246582, "global_step": 73297, "epoch": 1745} {"train_loss": -6.085169792175293, "global_step": 73298, "epoch": 1745} {"train_loss": -6.098017692565918, "global_step": 73299, "epoch": 1745} {"train_loss": -6.027484893798828, "global_step": 73300, "epoch": 1745} {"train_loss": -6.015096187591553, "global_step": 73301, "epoch": 1745} {"train_loss": -5.951876640319824, "global_step": 73302, "epoch": 1745} {"train_loss": -6.034980773925781, "global_step": 73303, "epoch": 1745} {"train_loss": -6.0035481452941895, "global_step": 73304, "epoch": 1745} {"train_loss": -6.175806999206543, "global_step": 73305, "epoch": 1745} {"train_loss": -6.1540327072143555, "global_step": 73306, "epoch": 1745} {"train_loss": -5.997297286987305, "global_step": 73307, "epoch": 1745} {"train_loss": -6.044748306274414, "global_step": 73308, "epoch": 1745} {"train_loss": -6.107745170593262, "global_step": 73309, "epoch": 1745} {"train_loss": -5.963830947875977, "global_step": 73310, "epoch": 1745} {"train_loss": -5.973945617675781, "global_step": 73311, "epoch": 1745} {"train_loss": -6.026338577270508, "global_step": 73312, "epoch": 1745} {"train_loss": -6.026084899902344, "global_step": 73313, "epoch": 1745} {"train_loss": -6.0601348876953125, "global_step": 73314, "epoch": 1745} {"train_loss": -6.140330791473389, "global_step": 73315, "epoch": 1745} {"train_loss": -6.073205947875977, "global_step": 73316, "epoch": 1745} {"train_loss": -6.105849266052246, "global_step": 73317, "epoch": 1745} {"train_loss": -6.013998508453369, "global_step": 73318, "epoch": 1745} {"train_loss": -6.142643451690674, "global_step": 73319, "epoch": 1745} {"train_loss": -6.013143062591553, "global_step": 73320, "epoch": 1745} {"train_loss": -6.083615303039551, "global_step": 73321, "epoch": 1745} {"train_loss": -6.124302864074707, "global_step": 73322, "epoch": 1745} {"train_loss": -6.124467849731445, "global_step": 73323, "epoch": 1745} {"train_loss": -6.133011817932129, "global_step": 73324, "epoch": 1745} {"train_loss": -6.154720306396484, "global_step": 73325, "epoch": 1745} {"train_loss": -6.052567005157471, "global_step": 73326, "epoch": 1745} {"train_loss": -5.985013008117676, "global_step": 73327, "epoch": 1745} {"train_loss": -5.961403846740723, "global_step": 73328, "epoch": 1745} {"train_loss": -6.155810356140137, "global_step": 73329, "epoch": 1745} {"train_loss": -6.080068111419678, "global_step": 73330, "epoch": 1745} {"train_loss": -6.052110388165429, "global_step": 73331, "epoch": 1745, "val_loss": 67533.390625} {"train_loss": -6.106662750244141, "global_step": 73332, "epoch": 1746} {"train_loss": -6.085128307342529, "global_step": 73333, "epoch": 1746} {"train_loss": -6.061036109924316, "global_step": 73334, "epoch": 1746} {"train_loss": -6.014145374298096, "global_step": 73335, "epoch": 1746} {"train_loss": -6.0113139152526855, "global_step": 73336, "epoch": 1746} {"train_loss": -5.959257125854492, "global_step": 73337, "epoch": 1746} {"train_loss": -6.007646560668945, "global_step": 73338, "epoch": 1746} {"train_loss": -5.969675064086914, "global_step": 73339, "epoch": 1746} {"train_loss": -5.948974132537842, "global_step": 73340, "epoch": 1746} {"train_loss": -5.940858364105225, "global_step": 73341, "epoch": 1746} {"train_loss": -6.124126434326172, "global_step": 73342, "epoch": 1746} {"train_loss": -6.046875953674316, "global_step": 73343, "epoch": 1746} {"train_loss": -6.107147693634033, "global_step": 73344, "epoch": 1746} {"train_loss": -6.0167083740234375, "global_step": 73345, "epoch": 1746} {"train_loss": -5.961763858795166, "global_step": 73346, "epoch": 1746} {"train_loss": -5.953115463256836, "global_step": 73347, "epoch": 1746} {"train_loss": -6.019806385040283, "global_step": 73348, "epoch": 1746} {"train_loss": -5.98071813583374, "global_step": 73349, "epoch": 1746} {"train_loss": -5.885017395019531, "global_step": 73350, "epoch": 1746} {"train_loss": -6.029172897338867, "global_step": 73351, "epoch": 1746} {"train_loss": -6.093174457550049, "global_step": 73352, "epoch": 1746} {"train_loss": -5.977053642272949, "global_step": 73353, "epoch": 1746} {"train_loss": -5.975636005401611, "global_step": 73354, "epoch": 1746} {"train_loss": -6.049651622772217, "global_step": 73355, "epoch": 1746} {"train_loss": -6.043170928955078, "global_step": 73356, "epoch": 1746} {"train_loss": -5.951918601989746, "global_step": 73357, "epoch": 1746} {"train_loss": -6.147171497344971, "global_step": 73358, "epoch": 1746} {"train_loss": -5.940861225128174, "global_step": 73359, "epoch": 1746} {"train_loss": -5.9599480628967285, "global_step": 73360, "epoch": 1746} {"train_loss": -6.062658309936523, "global_step": 73361, "epoch": 1746} {"train_loss": -5.879603385925293, "global_step": 73362, "epoch": 1746} {"train_loss": -6.060031414031982, "global_step": 73363, "epoch": 1746} {"train_loss": -5.98213529586792, "global_step": 73364, "epoch": 1746} {"train_loss": -5.974391937255859, "global_step": 73365, "epoch": 1746} {"train_loss": -6.096914291381836, "global_step": 73366, "epoch": 1746} {"train_loss": -6.019501209259033, "global_step": 73367, "epoch": 1746} {"train_loss": -6.1451873779296875, "global_step": 73368, "epoch": 1746} {"train_loss": -5.890299320220947, "global_step": 73369, "epoch": 1746} {"train_loss": -6.083573341369629, "global_step": 73370, "epoch": 1746} {"train_loss": -6.071228981018066, "global_step": 73371, "epoch": 1746} {"train_loss": -5.932589530944824, "global_step": 73372, "epoch": 1746} {"train_loss": -6.015791234515962, "global_step": 73373, "epoch": 1746, "val_loss": 67490.421875} {"train_loss": -5.989739894866943, "global_step": 73374, "epoch": 1747} {"train_loss": -5.97108793258667, "global_step": 73375, "epoch": 1747} {"train_loss": -6.10964298248291, "global_step": 73376, "epoch": 1747} {"train_loss": -6.041858673095703, "global_step": 73377, "epoch": 1747} {"train_loss": -6.098626136779785, "global_step": 73378, "epoch": 1747} {"train_loss": -5.985608100891113, "global_step": 73379, "epoch": 1747} {"train_loss": -6.006270408630371, "global_step": 73380, "epoch": 1747} {"train_loss": -6.0804009437561035, "global_step": 73381, "epoch": 1747} {"train_loss": -6.082906246185303, "global_step": 73382, "epoch": 1747} {"train_loss": -6.069638729095459, "global_step": 73383, "epoch": 1747} {"train_loss": -5.9610748291015625, "global_step": 73384, "epoch": 1747} {"train_loss": -6.069756984710693, "global_step": 73385, "epoch": 1747} {"train_loss": -6.0042266845703125, "global_step": 73386, "epoch": 1747} {"train_loss": -6.058931350708008, "global_step": 73387, "epoch": 1747} {"train_loss": -6.087835311889648, "global_step": 73388, "epoch": 1747} {"train_loss": -6.003385543823242, "global_step": 73389, "epoch": 1747} {"train_loss": -6.147660732269287, "global_step": 73390, "epoch": 1747} {"train_loss": -6.010835647583008, "global_step": 73391, "epoch": 1747} {"train_loss": -6.2341766357421875, "global_step": 73392, "epoch": 1747} {"train_loss": -6.057562828063965, "global_step": 73393, "epoch": 1747} {"train_loss": -6.028923988342285, "global_step": 73394, "epoch": 1747} {"train_loss": -5.998067378997803, "global_step": 73395, "epoch": 1747} {"train_loss": -5.996575355529785, "global_step": 73396, "epoch": 1747} {"train_loss": -6.035469055175781, "global_step": 73397, "epoch": 1747} {"train_loss": -5.88839054107666, "global_step": 73398, "epoch": 1747} {"train_loss": -6.041805267333984, "global_step": 73399, "epoch": 1747} {"train_loss": -5.870988845825195, "global_step": 73400, "epoch": 1747} {"train_loss": -6.056263446807861, "global_step": 73401, "epoch": 1747} {"train_loss": -5.898683547973633, "global_step": 73402, "epoch": 1747} {"train_loss": -6.000458717346191, "global_step": 73403, "epoch": 1747} {"train_loss": -6.017264366149902, "global_step": 73404, "epoch": 1747} {"train_loss": -5.906711101531982, "global_step": 73405, "epoch": 1747} {"train_loss": -6.0537543296813965, "global_step": 73406, "epoch": 1747} {"train_loss": -5.977611064910889, "global_step": 73407, "epoch": 1747} {"train_loss": -5.963497161865234, "global_step": 73408, "epoch": 1747} {"train_loss": -6.037280082702637, "global_step": 73409, "epoch": 1747} {"train_loss": -6.05362606048584, "global_step": 73410, "epoch": 1747} {"train_loss": -5.948553562164307, "global_step": 73411, "epoch": 1747} {"train_loss": -6.113107204437256, "global_step": 73412, "epoch": 1747} {"train_loss": -6.1120686531066895, "global_step": 73413, "epoch": 1747} {"train_loss": -5.90605354309082, "global_step": 73414, "epoch": 1747} {"train_loss": -6.024748575119745, "global_step": 73415, "epoch": 1747, "val_loss": 67376.734375} {"train_loss": -6.031128883361816, "global_step": 73416, "epoch": 1748} {"train_loss": -6.056997776031494, "global_step": 73417, "epoch": 1748} {"train_loss": -5.93613338470459, "global_step": 73418, "epoch": 1748} {"train_loss": -6.024007797241211, "global_step": 73419, "epoch": 1748} {"train_loss": -5.965943336486816, "global_step": 73420, "epoch": 1748} {"train_loss": -6.165116310119629, "global_step": 73421, "epoch": 1748} {"train_loss": -6.001409530639648, "global_step": 73422, "epoch": 1748} {"train_loss": -5.94697380065918, "global_step": 73423, "epoch": 1748} {"train_loss": -6.033449172973633, "global_step": 73424, "epoch": 1748} {"train_loss": -6.0553717613220215, "global_step": 73425, "epoch": 1748} {"train_loss": -6.0870256423950195, "global_step": 73426, "epoch": 1748} {"train_loss": -6.100141525268555, "global_step": 73427, "epoch": 1748} {"train_loss": -6.055568695068359, "global_step": 73428, "epoch": 1748} {"train_loss": -6.094964027404785, "global_step": 73429, "epoch": 1748} {"train_loss": -6.0677337646484375, "global_step": 73430, "epoch": 1748} {"train_loss": -6.07508659362793, "global_step": 73431, "epoch": 1748} {"train_loss": -6.0586066246032715, "global_step": 73432, "epoch": 1748} {"train_loss": -6.023571014404297, "global_step": 73433, "epoch": 1748} {"train_loss": -6.004243850708008, "global_step": 73434, "epoch": 1748} {"train_loss": -6.054753303527832, "global_step": 73435, "epoch": 1748} {"train_loss": -6.011712551116943, "global_step": 73436, "epoch": 1748} {"train_loss": -6.180517196655273, "global_step": 73437, "epoch": 1748} {"train_loss": -6.275816917419434, "global_step": 73438, "epoch": 1748} {"train_loss": -6.036879539489746, "global_step": 73439, "epoch": 1748} {"train_loss": -5.988466262817383, "global_step": 73440, "epoch": 1748} {"train_loss": -6.056969165802002, "global_step": 73441, "epoch": 1748} {"train_loss": -6.032391548156738, "global_step": 73442, "epoch": 1748} {"train_loss": -6.0043864250183105, "global_step": 73443, "epoch": 1748} {"train_loss": -6.093925952911377, "global_step": 73444, "epoch": 1748} {"train_loss": -6.036803722381592, "global_step": 73445, "epoch": 1748} {"train_loss": -6.131953239440918, "global_step": 73446, "epoch": 1748} {"train_loss": -6.0777130126953125, "global_step": 73447, "epoch": 1748} {"train_loss": -5.961135387420654, "global_step": 73448, "epoch": 1748} {"train_loss": -6.1369781494140625, "global_step": 73449, "epoch": 1748} {"train_loss": -6.057202339172363, "global_step": 73450, "epoch": 1748} {"train_loss": -6.1003642082214355, "global_step": 73451, "epoch": 1748} {"train_loss": -6.029477119445801, "global_step": 73452, "epoch": 1748} {"train_loss": -6.067971229553223, "global_step": 73453, "epoch": 1748} {"train_loss": -5.912315368652344, "global_step": 73454, "epoch": 1748} {"train_loss": -6.126725196838379, "global_step": 73455, "epoch": 1748} {"train_loss": -6.058366298675537, "global_step": 73456, "epoch": 1748} {"train_loss": -6.051866849263509, "global_step": 73457, "epoch": 1748, "val_loss": 67396.4765625} {"train_loss": -6.028429985046387, "global_step": 73458, "epoch": 1749} {"train_loss": -6.0604448318481445, "global_step": 73459, "epoch": 1749} {"train_loss": -6.151491641998291, "global_step": 73460, "epoch": 1749} {"train_loss": -6.053435325622559, "global_step": 73461, "epoch": 1749} {"train_loss": -5.903140068054199, "global_step": 73462, "epoch": 1749} {"train_loss": -6.0016984939575195, "global_step": 73463, "epoch": 1749} {"train_loss": -6.033389091491699, "global_step": 73464, "epoch": 1749} {"train_loss": -6.0952372550964355, "global_step": 73465, "epoch": 1749} {"train_loss": -5.945379257202148, "global_step": 73466, "epoch": 1749} {"train_loss": -5.940735816955566, "global_step": 73467, "epoch": 1749} {"train_loss": -6.195897102355957, "global_step": 73468, "epoch": 1749} {"train_loss": -6.03270149230957, "global_step": 73469, "epoch": 1749} {"train_loss": -6.137822151184082, "global_step": 73470, "epoch": 1749} {"train_loss": -5.957066535949707, "global_step": 73471, "epoch": 1749} {"train_loss": -5.994692802429199, "global_step": 73472, "epoch": 1749} {"train_loss": -6.059771537780762, "global_step": 73473, "epoch": 1749} {"train_loss": -5.991884231567383, "global_step": 73474, "epoch": 1749} {"train_loss": -6.021361351013184, "global_step": 73475, "epoch": 1749} {"train_loss": -5.912276744842529, "global_step": 73476, "epoch": 1749} {"train_loss": -5.964146614074707, "global_step": 73477, "epoch": 1749} {"train_loss": -5.93002986907959, "global_step": 73478, "epoch": 1749} {"train_loss": -5.983564376831055, "global_step": 73479, "epoch": 1749} {"train_loss": -5.964046478271484, "global_step": 73480, "epoch": 1749} {"train_loss": -6.021805763244629, "global_step": 73481, "epoch": 1749} {"train_loss": -5.964064598083496, "global_step": 73482, "epoch": 1749} {"train_loss": -6.021969318389893, "global_step": 73483, "epoch": 1749} {"train_loss": -6.142787933349609, "global_step": 73484, "epoch": 1749} {"train_loss": -6.0902252197265625, "global_step": 73485, "epoch": 1749} {"train_loss": -6.015947341918945, "global_step": 73486, "epoch": 1749} {"train_loss": -6.023897647857666, "global_step": 73487, "epoch": 1749} {"train_loss": -6.003083229064941, "global_step": 73488, "epoch": 1749} {"train_loss": -6.12162971496582, "global_step": 73489, "epoch": 1749} {"train_loss": -6.142314434051514, "global_step": 73490, "epoch": 1749} {"train_loss": -6.029116630554199, "global_step": 73491, "epoch": 1749} {"train_loss": -6.016177654266357, "global_step": 73492, "epoch": 1749} {"train_loss": -6.067867279052734, "global_step": 73493, "epoch": 1749} {"train_loss": -6.067174911499023, "global_step": 73494, "epoch": 1749} {"train_loss": -5.954394817352295, "global_step": 73495, "epoch": 1749} {"train_loss": -6.00618839263916, "global_step": 73496, "epoch": 1749} {"train_loss": -6.071855068206787, "global_step": 73497, "epoch": 1749} {"train_loss": -5.9888916015625, "global_step": 73498, "epoch": 1749} {"train_loss": -6.029580241157895, "global_step": 73499, "epoch": 1749, "val_loss": 67461.984375} {"train_loss": -5.9823317527771, "global_step": 73500, "epoch": 1750} {"train_loss": -6.167508125305176, "global_step": 73501, "epoch": 1750} {"train_loss": -6.151129722595215, "global_step": 73502, "epoch": 1750} {"train_loss": -6.194859504699707, "global_step": 73503, "epoch": 1750} {"train_loss": -6.105511665344238, "global_step": 73504, "epoch": 1750} {"train_loss": -5.955626964569092, "global_step": 73505, "epoch": 1750} {"train_loss": -6.015279769897461, "global_step": 73506, "epoch": 1750} {"train_loss": -6.0016326904296875, "global_step": 73507, "epoch": 1750} {"train_loss": -6.087707996368408, "global_step": 73508, "epoch": 1750} {"train_loss": -6.0853424072265625, "global_step": 73509, "epoch": 1750} {"train_loss": -6.017319679260254, "global_step": 73510, "epoch": 1750} {"train_loss": -6.077127456665039, "global_step": 73511, "epoch": 1750} {"train_loss": -6.253375053405762, "global_step": 73512, "epoch": 1750} {"train_loss": -6.0819549560546875, "global_step": 73513, "epoch": 1750} {"train_loss": -6.064729690551758, "global_step": 73514, "epoch": 1750} {"train_loss": -6.117755889892578, "global_step": 73515, "epoch": 1750} {"train_loss": -5.9958176612854, "global_step": 73516, "epoch": 1750} {"train_loss": -5.949713706970215, "global_step": 73517, "epoch": 1750} {"train_loss": -6.047677040100098, "global_step": 73518, "epoch": 1750} {"train_loss": -6.063570976257324, "global_step": 73519, "epoch": 1750} {"train_loss": -6.144233703613281, "global_step": 73520, "epoch": 1750} {"train_loss": -6.077103137969971, "global_step": 73521, "epoch": 1750} {"train_loss": -6.0658440589904785, "global_step": 73522, "epoch": 1750} {"train_loss": -6.048914432525635, "global_step": 73523, "epoch": 1750} {"train_loss": -6.140551567077637, "global_step": 73524, "epoch": 1750} {"train_loss": -5.942505836486816, "global_step": 73525, "epoch": 1750} {"train_loss": -6.013267517089844, "global_step": 73526, "epoch": 1750} {"train_loss": -6.0090651512146, "global_step": 73527, "epoch": 1750} {"train_loss": -5.972328186035156, "global_step": 73528, "epoch": 1750} {"train_loss": -6.075447082519531, "global_step": 73529, "epoch": 1750} {"train_loss": -6.127988815307617, "global_step": 73530, "epoch": 1750} {"train_loss": -6.010750770568848, "global_step": 73531, "epoch": 1750} {"train_loss": -6.0805840492248535, "global_step": 73532, "epoch": 1750} {"train_loss": -5.945309638977051, "global_step": 73533, "epoch": 1750} {"train_loss": -5.992077827453613, "global_step": 73534, "epoch": 1750} {"train_loss": -6.030912399291992, "global_step": 73535, "epoch": 1750} {"train_loss": -5.905729293823242, "global_step": 73536, "epoch": 1750} {"train_loss": -5.931586265563965, "global_step": 73537, "epoch": 1750} {"train_loss": -5.861464500427246, "global_step": 73538, "epoch": 1750} {"train_loss": -5.93653678894043, "global_step": 73539, "epoch": 1750} {"train_loss": -5.950490951538086, "global_step": 73540, "epoch": 1750} {"train_loss": -6.038354147048223, "global_step": 73541, "epoch": 1750, "train/sim_max_reward_0": 0.3877745122649848, "train/sim_max_reward_1": 0.4758093999375733, "train/sim_max_reward_2": 0.4337096687531045, "train/sim_max_reward_3": 0.14862446311336924, "train/sim_max_reward_4": 0.9175465941253854, "train/sim_max_reward_5": 0.8312156489755083, "test/sim_max_reward_4400000": 0.28386375399437375, "test/sim_max_reward_4400001": 0.7921298479070693, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.7321868542605062, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3813970342540156, "test/sim_max_reward_4400006": 0.9625286559880726, "test/sim_max_reward_4400007": 0.7032823876205903, "test/sim_max_reward_4400008": 0.3052299273721145, "test/sim_max_reward_4400009": 0.6631077604467694, "test/sim_max_reward_4400010": 0.23190935485569752, "test/sim_max_reward_4400011": 0.07331328573197171, "test/sim_max_reward_4400012": 0.9425162310465414, "test/sim_max_reward_4400013": 0.656001727344812, "test/sim_max_reward_4400014": 0.7682595651566047, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.7304155809832281, "test/sim_max_reward_4400022": 0.8526531075731509, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9280005811652182, "test/sim_max_reward_4400025": 0.2667177352680846, "test/sim_max_reward_4400026": 0.7620069326624405, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.41027809213778377, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.8526341471316912, "test/sim_max_reward_4400031": 0.8617932040494855, "test/sim_max_reward_4400032": 0.25575612240064305, "test/sim_max_reward_4400033": 0.8510002852748209, "test/sim_max_reward_4400034": 0.8891102068786821, "test/sim_max_reward_4400035": 0.4117975090915161, "test/sim_max_reward_4400036": 0.8929836390653507, "test/sim_max_reward_4400037": 0.9282532260789064, "test/sim_max_reward_4400038": 0.848611442378509, "test/sim_max_reward_4400039": 0.9843027596472188, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.785780289130189, "test/sim_max_reward_4400042": 0.0007302169213768147, "test/sim_max_reward_4400043": 0.8319378799820507, "test/sim_max_reward_4400044": 0.6475940456163134, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8478144250172365, "test/sim_max_reward_4400047": 0.8607695836107867, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8235172461169291, "train/mean_score": 0.5324467145283209, "test/mean_score": 0.5085775656279946, "val_loss": 67640.4453125} {"train_loss": -5.971619606018066, "global_step": 73542, "epoch": 1751} {"train_loss": -5.9494476318359375, "global_step": 73543, "epoch": 1751} {"train_loss": -5.934130668640137, "global_step": 73544, "epoch": 1751} {"train_loss": -6.018457889556885, "global_step": 73545, "epoch": 1751} {"train_loss": -5.943507194519043, "global_step": 73546, "epoch": 1751} {"train_loss": -5.988729476928711, "global_step": 73547, "epoch": 1751} {"train_loss": -5.935530662536621, "global_step": 73548, "epoch": 1751} {"train_loss": -6.100474834442139, "global_step": 73549, "epoch": 1751} {"train_loss": -5.944490909576416, "global_step": 73550, "epoch": 1751} {"train_loss": -6.023136138916016, "global_step": 73551, "epoch": 1751} {"train_loss": -5.885307788848877, "global_step": 73552, "epoch": 1751} {"train_loss": -5.8199052810668945, "global_step": 73553, "epoch": 1751} {"train_loss": -6.000126361846924, "global_step": 73554, "epoch": 1751} {"train_loss": -6.02766227722168, "global_step": 73555, "epoch": 1751} {"train_loss": -5.957771301269531, "global_step": 73556, "epoch": 1751} {"train_loss": -6.017294883728027, "global_step": 73557, "epoch": 1751} {"train_loss": -5.920382499694824, "global_step": 73558, "epoch": 1751} {"train_loss": -5.944253444671631, "global_step": 73559, "epoch": 1751} {"train_loss": -5.902886390686035, "global_step": 73560, "epoch": 1751} {"train_loss": -6.088862419128418, "global_step": 73561, "epoch": 1751} {"train_loss": -6.002933502197266, "global_step": 73562, "epoch": 1751} {"train_loss": -6.037623405456543, "global_step": 73563, "epoch": 1751} {"train_loss": -6.059933662414551, "global_step": 73564, "epoch": 1751} {"train_loss": -6.074155807495117, "global_step": 73565, "epoch": 1751} {"train_loss": -6.044956684112549, "global_step": 73566, "epoch": 1751} {"train_loss": -6.058773994445801, "global_step": 73567, "epoch": 1751} {"train_loss": -5.982461452484131, "global_step": 73568, "epoch": 1751} {"train_loss": -6.0152387619018555, "global_step": 73569, "epoch": 1751} {"train_loss": -6.105584144592285, "global_step": 73570, "epoch": 1751} {"train_loss": -6.008206367492676, "global_step": 73571, "epoch": 1751} {"train_loss": -5.918737888336182, "global_step": 73572, "epoch": 1751} {"train_loss": -6.027317047119141, "global_step": 73573, "epoch": 1751} {"train_loss": -5.96639347076416, "global_step": 73574, "epoch": 1751} {"train_loss": -6.025402069091797, "global_step": 73575, "epoch": 1751} {"train_loss": -5.945615768432617, "global_step": 73576, "epoch": 1751} {"train_loss": -5.992788314819336, "global_step": 73577, "epoch": 1751} {"train_loss": -5.943357944488525, "global_step": 73578, "epoch": 1751} {"train_loss": -6.120149612426758, "global_step": 73579, "epoch": 1751} {"train_loss": -6.088624954223633, "global_step": 73580, "epoch": 1751} {"train_loss": -5.960892200469971, "global_step": 73581, "epoch": 1751} {"train_loss": -6.094008445739746, "global_step": 73582, "epoch": 1751} {"train_loss": -5.996610425767445, "global_step": 73583, "epoch": 1751, "val_loss": 67225.078125} {"train_loss": -5.958829879760742, "global_step": 73584, "epoch": 1752} {"train_loss": -6.028578281402588, "global_step": 73585, "epoch": 1752} {"train_loss": -6.05694055557251, "global_step": 73586, "epoch": 1752} {"train_loss": -5.922736644744873, "global_step": 73587, "epoch": 1752} {"train_loss": -6.095773696899414, "global_step": 73588, "epoch": 1752} {"train_loss": -6.091434478759766, "global_step": 73589, "epoch": 1752} {"train_loss": -6.104525566101074, "global_step": 73590, "epoch": 1752} {"train_loss": -5.85218620300293, "global_step": 73591, "epoch": 1752} {"train_loss": -5.957074165344238, "global_step": 73592, "epoch": 1752} {"train_loss": -6.083623886108398, "global_step": 73593, "epoch": 1752} {"train_loss": -5.904272079467773, "global_step": 73594, "epoch": 1752} {"train_loss": -6.062076091766357, "global_step": 73595, "epoch": 1752} {"train_loss": -6.156249046325684, "global_step": 73596, "epoch": 1752} {"train_loss": -5.906513690948486, "global_step": 73597, "epoch": 1752} {"train_loss": -5.952555179595947, "global_step": 73598, "epoch": 1752} {"train_loss": -6.017656326293945, "global_step": 73599, "epoch": 1752} {"train_loss": -6.0730204582214355, "global_step": 73600, "epoch": 1752} {"train_loss": -5.963447570800781, "global_step": 73601, "epoch": 1752} {"train_loss": -6.059628009796143, "global_step": 73602, "epoch": 1752} {"train_loss": -6.142428874969482, "global_step": 73603, "epoch": 1752} {"train_loss": -6.094315052032471, "global_step": 73604, "epoch": 1752} {"train_loss": -5.981537818908691, "global_step": 73605, "epoch": 1752} {"train_loss": -6.0168538093566895, "global_step": 73606, "epoch": 1752} {"train_loss": -6.170864105224609, "global_step": 73607, "epoch": 1752} {"train_loss": -6.06898307800293, "global_step": 73608, "epoch": 1752} {"train_loss": -5.96857213973999, "global_step": 73609, "epoch": 1752} {"train_loss": -6.081612586975098, "global_step": 73610, "epoch": 1752} {"train_loss": -6.009771347045898, "global_step": 73611, "epoch": 1752} {"train_loss": -6.004301071166992, "global_step": 73612, "epoch": 1752} {"train_loss": -6.123819351196289, "global_step": 73613, "epoch": 1752} {"train_loss": -5.951845169067383, "global_step": 73614, "epoch": 1752} {"train_loss": -5.982490062713623, "global_step": 73615, "epoch": 1752} {"train_loss": -5.975283145904541, "global_step": 73616, "epoch": 1752} {"train_loss": -5.977787017822266, "global_step": 73617, "epoch": 1752} {"train_loss": -6.096250534057617, "global_step": 73618, "epoch": 1752} {"train_loss": -6.1127238273620605, "global_step": 73619, "epoch": 1752} {"train_loss": -6.129180908203125, "global_step": 73620, "epoch": 1752} {"train_loss": -6.082663536071777, "global_step": 73621, "epoch": 1752} {"train_loss": -5.94160270690918, "global_step": 73622, "epoch": 1752} {"train_loss": -6.025434494018555, "global_step": 73623, "epoch": 1752} {"train_loss": -6.002959251403809, "global_step": 73624, "epoch": 1752} {"train_loss": -6.02767310823713, "global_step": 73625, "epoch": 1752, "val_loss": 67537.1015625} {"train_loss": -6.102577209472656, "global_step": 73626, "epoch": 1753} {"train_loss": -6.014118671417236, "global_step": 73627, "epoch": 1753} {"train_loss": -6.041202068328857, "global_step": 73628, "epoch": 1753} {"train_loss": -6.066211223602295, "global_step": 73629, "epoch": 1753} {"train_loss": -5.938434600830078, "global_step": 73630, "epoch": 1753} {"train_loss": -6.163819789886475, "global_step": 73631, "epoch": 1753} {"train_loss": -6.072882175445557, "global_step": 73632, "epoch": 1753} {"train_loss": -6.093081474304199, "global_step": 73633, "epoch": 1753} {"train_loss": -5.990210056304932, "global_step": 73634, "epoch": 1753} {"train_loss": -5.954150199890137, "global_step": 73635, "epoch": 1753} {"train_loss": -5.939728736877441, "global_step": 73636, "epoch": 1753} {"train_loss": -5.947346210479736, "global_step": 73637, "epoch": 1753} {"train_loss": -6.137052059173584, "global_step": 73638, "epoch": 1753} {"train_loss": -6.047326564788818, "global_step": 73639, "epoch": 1753} {"train_loss": -5.969179630279541, "global_step": 73640, "epoch": 1753} {"train_loss": -6.090169906616211, "global_step": 73641, "epoch": 1753} {"train_loss": -6.0108232498168945, "global_step": 73642, "epoch": 1753} {"train_loss": -6.061958312988281, "global_step": 73643, "epoch": 1753} {"train_loss": -5.955249309539795, "global_step": 73644, "epoch": 1753} {"train_loss": -5.974798202514648, "global_step": 73645, "epoch": 1753} {"train_loss": -6.027974605560303, "global_step": 73646, "epoch": 1753} {"train_loss": -6.0379719734191895, "global_step": 73647, "epoch": 1753} {"train_loss": -5.990442276000977, "global_step": 73648, "epoch": 1753} {"train_loss": -5.990014553070068, "global_step": 73649, "epoch": 1753} {"train_loss": -6.033071994781494, "global_step": 73650, "epoch": 1753} {"train_loss": -5.986976623535156, "global_step": 73651, "epoch": 1753} {"train_loss": -6.088749408721924, "global_step": 73652, "epoch": 1753} {"train_loss": -6.004398822784424, "global_step": 73653, "epoch": 1753} {"train_loss": -6.0848822593688965, "global_step": 73654, "epoch": 1753} {"train_loss": -6.100852012634277, "global_step": 73655, "epoch": 1753} {"train_loss": -6.0770978927612305, "global_step": 73656, "epoch": 1753} {"train_loss": -6.084440231323242, "global_step": 73657, "epoch": 1753} {"train_loss": -6.076554298400879, "global_step": 73658, "epoch": 1753} {"train_loss": -6.03596305847168, "global_step": 73659, "epoch": 1753} {"train_loss": -6.035078048706055, "global_step": 73660, "epoch": 1753} {"train_loss": -6.018871784210205, "global_step": 73661, "epoch": 1753} {"train_loss": -5.904581069946289, "global_step": 73662, "epoch": 1753} {"train_loss": -6.144224166870117, "global_step": 73663, "epoch": 1753} {"train_loss": -5.95619010925293, "global_step": 73664, "epoch": 1753} {"train_loss": -6.018120765686035, "global_step": 73665, "epoch": 1753} {"train_loss": -6.0808258056640625, "global_step": 73666, "epoch": 1753} {"train_loss": -6.0327139014289495, "global_step": 73667, "epoch": 1753, "val_loss": 67450.1484375} {"train_loss": -6.076055526733398, "global_step": 73668, "epoch": 1754} {"train_loss": -5.928715705871582, "global_step": 73669, "epoch": 1754} {"train_loss": -6.011837959289551, "global_step": 73670, "epoch": 1754} {"train_loss": -6.17182731628418, "global_step": 73671, "epoch": 1754} {"train_loss": -5.950655937194824, "global_step": 73672, "epoch": 1754} {"train_loss": -6.137203216552734, "global_step": 73673, "epoch": 1754} {"train_loss": -6.050700664520264, "global_step": 73674, "epoch": 1754} {"train_loss": -6.0891313552856445, "global_step": 73675, "epoch": 1754} {"train_loss": -6.126657962799072, "global_step": 73676, "epoch": 1754} {"train_loss": -6.097643852233887, "global_step": 73677, "epoch": 1754} {"train_loss": -6.1792378425598145, "global_step": 73678, "epoch": 1754} {"train_loss": -6.081314563751221, "global_step": 73679, "epoch": 1754} {"train_loss": -6.138461112976074, "global_step": 73680, "epoch": 1754} {"train_loss": -6.097259044647217, "global_step": 73681, "epoch": 1754} {"train_loss": -6.08419942855835, "global_step": 73682, "epoch": 1754} {"train_loss": -6.067543029785156, "global_step": 73683, "epoch": 1754} {"train_loss": -6.158389568328857, "global_step": 73684, "epoch": 1754} {"train_loss": -6.04160213470459, "global_step": 73685, "epoch": 1754} {"train_loss": -6.125494003295898, "global_step": 73686, "epoch": 1754} {"train_loss": -6.06678581237793, "global_step": 73687, "epoch": 1754} {"train_loss": -6.117964744567871, "global_step": 73688, "epoch": 1754} {"train_loss": -5.997642993927002, "global_step": 73689, "epoch": 1754} {"train_loss": -6.096817970275879, "global_step": 73690, "epoch": 1754} {"train_loss": -5.9893598556518555, "global_step": 73691, "epoch": 1754} {"train_loss": -6.1092529296875, "global_step": 73692, "epoch": 1754} {"train_loss": -6.179765701293945, "global_step": 73693, "epoch": 1754} {"train_loss": -6.131687641143799, "global_step": 73694, "epoch": 1754} {"train_loss": -6.060656547546387, "global_step": 73695, "epoch": 1754} {"train_loss": -5.974116325378418, "global_step": 73696, "epoch": 1754} {"train_loss": -6.1338958740234375, "global_step": 73697, "epoch": 1754} {"train_loss": -6.221113204956055, "global_step": 73698, "epoch": 1754} {"train_loss": -6.0207366943359375, "global_step": 73699, "epoch": 1754} {"train_loss": -6.02739143371582, "global_step": 73700, "epoch": 1754} {"train_loss": -6.116244316101074, "global_step": 73701, "epoch": 1754} {"train_loss": -6.0349321365356445, "global_step": 73702, "epoch": 1754} {"train_loss": -6.106235980987549, "global_step": 73703, "epoch": 1754} {"train_loss": -6.050003528594971, "global_step": 73704, "epoch": 1754} {"train_loss": -6.09198522567749, "global_step": 73705, "epoch": 1754} {"train_loss": -5.9799580574035645, "global_step": 73706, "epoch": 1754} {"train_loss": -6.114145278930664, "global_step": 73707, "epoch": 1754} {"train_loss": -6.127822399139404, "global_step": 73708, "epoch": 1754} {"train_loss": -6.080797876630511, "global_step": 73709, "epoch": 1754, "val_loss": 67552.0546875} {"train_loss": -5.997200965881348, "global_step": 73710, "epoch": 1755} {"train_loss": -6.062500476837158, "global_step": 73711, "epoch": 1755} {"train_loss": -6.212553977966309, "global_step": 73712, "epoch": 1755} {"train_loss": -6.078746795654297, "global_step": 73713, "epoch": 1755} {"train_loss": -6.007084846496582, "global_step": 73714, "epoch": 1755} {"train_loss": -5.988323211669922, "global_step": 73715, "epoch": 1755} {"train_loss": -6.171798229217529, "global_step": 73716, "epoch": 1755} {"train_loss": -5.926153182983398, "global_step": 73717, "epoch": 1755} {"train_loss": -5.958019256591797, "global_step": 73718, "epoch": 1755} {"train_loss": -6.163605213165283, "global_step": 73719, "epoch": 1755} {"train_loss": -5.879436492919922, "global_step": 73720, "epoch": 1755} {"train_loss": -6.053414344787598, "global_step": 73721, "epoch": 1755} {"train_loss": -6.01997184753418, "global_step": 73722, "epoch": 1755} {"train_loss": -6.046828746795654, "global_step": 73723, "epoch": 1755} {"train_loss": -6.011192798614502, "global_step": 73724, "epoch": 1755} {"train_loss": -6.044192314147949, "global_step": 73725, "epoch": 1755} {"train_loss": -6.14906644821167, "global_step": 73726, "epoch": 1755} {"train_loss": -6.0618181228637695, "global_step": 73727, "epoch": 1755} {"train_loss": -6.063502311706543, "global_step": 73728, "epoch": 1755} {"train_loss": -6.05305814743042, "global_step": 73729, "epoch": 1755} {"train_loss": -6.0071516036987305, "global_step": 73730, "epoch": 1755} {"train_loss": -6.038698673248291, "global_step": 73731, "epoch": 1755} {"train_loss": -6.033622741699219, "global_step": 73732, "epoch": 1755} {"train_loss": -6.033260345458984, "global_step": 73733, "epoch": 1755} {"train_loss": -6.0753889083862305, "global_step": 73734, "epoch": 1755} {"train_loss": -6.110892295837402, "global_step": 73735, "epoch": 1755} {"train_loss": -5.965483665466309, "global_step": 73736, "epoch": 1755} {"train_loss": -6.097206115722656, "global_step": 73737, "epoch": 1755} {"train_loss": -6.022441864013672, "global_step": 73738, "epoch": 1755} {"train_loss": -5.965937614440918, "global_step": 73739, "epoch": 1755} {"train_loss": -6.027790069580078, "global_step": 73740, "epoch": 1755} {"train_loss": -6.124197959899902, "global_step": 73741, "epoch": 1755} {"train_loss": -6.005056381225586, "global_step": 73742, "epoch": 1755} {"train_loss": -6.148474216461182, "global_step": 73743, "epoch": 1755} {"train_loss": -6.025594711303711, "global_step": 73744, "epoch": 1755} {"train_loss": -6.055487632751465, "global_step": 73745, "epoch": 1755} {"train_loss": -6.026714324951172, "global_step": 73746, "epoch": 1755} {"train_loss": -6.117422103881836, "global_step": 73747, "epoch": 1755} {"train_loss": -6.036138534545898, "global_step": 73748, "epoch": 1755} {"train_loss": -5.996131420135498, "global_step": 73749, "epoch": 1755} {"train_loss": -6.155270099639893, "global_step": 73750, "epoch": 1755} {"train_loss": -6.050180060522897, "global_step": 73751, "epoch": 1755, "val_loss": 67342.875} {"train_loss": -5.9907636642456055, "global_step": 73752, "epoch": 1756} {"train_loss": -6.078387260437012, "global_step": 73753, "epoch": 1756} {"train_loss": -6.15439510345459, "global_step": 73754, "epoch": 1756} {"train_loss": -5.93211555480957, "global_step": 73755, "epoch": 1756} {"train_loss": -6.070119380950928, "global_step": 73756, "epoch": 1756} {"train_loss": -5.992448806762695, "global_step": 73757, "epoch": 1756} {"train_loss": -6.202138900756836, "global_step": 73758, "epoch": 1756} {"train_loss": -6.087813377380371, "global_step": 73759, "epoch": 1756} {"train_loss": -6.116307258605957, "global_step": 73760, "epoch": 1756} {"train_loss": -6.094262599945068, "global_step": 73761, "epoch": 1756} {"train_loss": -6.087905406951904, "global_step": 73762, "epoch": 1756} {"train_loss": -6.103344917297363, "global_step": 73763, "epoch": 1756} {"train_loss": -6.160214424133301, "global_step": 73764, "epoch": 1756} {"train_loss": -6.049753189086914, "global_step": 73765, "epoch": 1756} {"train_loss": -6.087574005126953, "global_step": 73766, "epoch": 1756} {"train_loss": -6.067154884338379, "global_step": 73767, "epoch": 1756} {"train_loss": -6.047997951507568, "global_step": 73768, "epoch": 1756} {"train_loss": -6.010665416717529, "global_step": 73769, "epoch": 1756} {"train_loss": -6.009661674499512, "global_step": 73770, "epoch": 1756} {"train_loss": -6.05810546875, "global_step": 73771, "epoch": 1756} {"train_loss": -6.041302680969238, "global_step": 73772, "epoch": 1756} {"train_loss": -6.014432907104492, "global_step": 73773, "epoch": 1756} {"train_loss": -6.066893577575684, "global_step": 73774, "epoch": 1756} {"train_loss": -6.0568132400512695, "global_step": 73775, "epoch": 1756} {"train_loss": -5.993917465209961, "global_step": 73776, "epoch": 1756} {"train_loss": -6.016573905944824, "global_step": 73777, "epoch": 1756} {"train_loss": -5.884851932525635, "global_step": 73778, "epoch": 1756} {"train_loss": -5.942914962768555, "global_step": 73779, "epoch": 1756} {"train_loss": -5.908855438232422, "global_step": 73780, "epoch": 1756} {"train_loss": -5.97769832611084, "global_step": 73781, "epoch": 1756} {"train_loss": -5.923568248748779, "global_step": 73782, "epoch": 1756} {"train_loss": -5.847063064575195, "global_step": 73783, "epoch": 1756} {"train_loss": -5.914872169494629, "global_step": 73784, "epoch": 1756} {"train_loss": -5.885575294494629, "global_step": 73785, "epoch": 1756} {"train_loss": -5.885395050048828, "global_step": 73786, "epoch": 1756} {"train_loss": -6.051607131958008, "global_step": 73787, "epoch": 1756} {"train_loss": -5.909921646118164, "global_step": 73788, "epoch": 1756} {"train_loss": -6.010405540466309, "global_step": 73789, "epoch": 1756} {"train_loss": -6.026299476623535, "global_step": 73790, "epoch": 1756} {"train_loss": -5.985491752624512, "global_step": 73791, "epoch": 1756} {"train_loss": -5.923041343688965, "global_step": 73792, "epoch": 1756} {"train_loss": -6.018427701223464, "global_step": 73793, "epoch": 1756, "val_loss": 67444.109375} {"train_loss": -5.954655170440674, "global_step": 73794, "epoch": 1757} {"train_loss": -5.994472980499268, "global_step": 73795, "epoch": 1757} {"train_loss": -6.001471519470215, "global_step": 73796, "epoch": 1757} {"train_loss": -6.051772117614746, "global_step": 73797, "epoch": 1757} {"train_loss": -5.894700527191162, "global_step": 73798, "epoch": 1757} {"train_loss": -5.933589935302734, "global_step": 73799, "epoch": 1757} {"train_loss": -6.050447463989258, "global_step": 73800, "epoch": 1757} {"train_loss": -5.974486351013184, "global_step": 73801, "epoch": 1757} {"train_loss": -6.0290045738220215, "global_step": 73802, "epoch": 1757} {"train_loss": -5.979086875915527, "global_step": 73803, "epoch": 1757} {"train_loss": -6.0717267990112305, "global_step": 73804, "epoch": 1757} {"train_loss": -5.986566066741943, "global_step": 73805, "epoch": 1757} {"train_loss": -5.970796585083008, "global_step": 73806, "epoch": 1757} {"train_loss": -6.002906799316406, "global_step": 73807, "epoch": 1757} {"train_loss": -6.012052059173584, "global_step": 73808, "epoch": 1757} {"train_loss": -6.2214860916137695, "global_step": 73809, "epoch": 1757} {"train_loss": -6.0410919189453125, "global_step": 73810, "epoch": 1757} {"train_loss": -6.003499984741211, "global_step": 73811, "epoch": 1757} {"train_loss": -6.122626304626465, "global_step": 73812, "epoch": 1757} {"train_loss": -5.9942474365234375, "global_step": 73813, "epoch": 1757} {"train_loss": -6.109979629516602, "global_step": 73814, "epoch": 1757} {"train_loss": -6.0962982177734375, "global_step": 73815, "epoch": 1757} {"train_loss": -6.043975353240967, "global_step": 73816, "epoch": 1757} {"train_loss": -6.146885871887207, "global_step": 73817, "epoch": 1757} {"train_loss": -6.066908836364746, "global_step": 73818, "epoch": 1757} {"train_loss": -6.09428596496582, "global_step": 73819, "epoch": 1757} {"train_loss": -6.0566511154174805, "global_step": 73820, "epoch": 1757} {"train_loss": -6.1088409423828125, "global_step": 73821, "epoch": 1757} {"train_loss": -5.932337760925293, "global_step": 73822, "epoch": 1757} {"train_loss": -5.963330268859863, "global_step": 73823, "epoch": 1757} {"train_loss": -5.972491264343262, "global_step": 73824, "epoch": 1757} {"train_loss": -5.979921817779541, "global_step": 73825, "epoch": 1757} {"train_loss": -6.133077621459961, "global_step": 73826, "epoch": 1757} {"train_loss": -5.989189147949219, "global_step": 73827, "epoch": 1757} {"train_loss": -6.204702377319336, "global_step": 73828, "epoch": 1757} {"train_loss": -5.960566997528076, "global_step": 73829, "epoch": 1757} {"train_loss": -5.8884429931640625, "global_step": 73830, "epoch": 1757} {"train_loss": -6.081830024719238, "global_step": 73831, "epoch": 1757} {"train_loss": -5.963252067565918, "global_step": 73832, "epoch": 1757} {"train_loss": -6.133650779724121, "global_step": 73833, "epoch": 1757} {"train_loss": -6.0674614906311035, "global_step": 73834, "epoch": 1757} {"train_loss": -6.031257935932705, "global_step": 73835, "epoch": 1757, "val_loss": 67610.421875} {"train_loss": -6.090425968170166, "global_step": 73836, "epoch": 1758} {"train_loss": -6.080265998840332, "global_step": 73837, "epoch": 1758} {"train_loss": -6.111853122711182, "global_step": 73838, "epoch": 1758} {"train_loss": -6.144044876098633, "global_step": 73839, "epoch": 1758} {"train_loss": -6.107680320739746, "global_step": 73840, "epoch": 1758} {"train_loss": -6.063971519470215, "global_step": 73841, "epoch": 1758} {"train_loss": -6.0379509925842285, "global_step": 73842, "epoch": 1758} {"train_loss": -6.171337127685547, "global_step": 73843, "epoch": 1758} {"train_loss": -5.892880439758301, "global_step": 73844, "epoch": 1758} {"train_loss": -6.0723371505737305, "global_step": 73845, "epoch": 1758} {"train_loss": -6.170699119567871, "global_step": 73846, "epoch": 1758} {"train_loss": -6.040247917175293, "global_step": 73847, "epoch": 1758} {"train_loss": -5.944906234741211, "global_step": 73848, "epoch": 1758} {"train_loss": -6.053140163421631, "global_step": 73849, "epoch": 1758} {"train_loss": -6.016532897949219, "global_step": 73850, "epoch": 1758} {"train_loss": -6.011249542236328, "global_step": 73851, "epoch": 1758} {"train_loss": -6.037945747375488, "global_step": 73852, "epoch": 1758} {"train_loss": -6.106815814971924, "global_step": 73853, "epoch": 1758} {"train_loss": -6.043270111083984, "global_step": 73854, "epoch": 1758} {"train_loss": -6.153133392333984, "global_step": 73855, "epoch": 1758} {"train_loss": -6.103010177612305, "global_step": 73856, "epoch": 1758} {"train_loss": -6.224715232849121, "global_step": 73857, "epoch": 1758} {"train_loss": -6.124173641204834, "global_step": 73858, "epoch": 1758} {"train_loss": -6.0218095779418945, "global_step": 73859, "epoch": 1758} {"train_loss": -6.1282854080200195, "global_step": 73860, "epoch": 1758} {"train_loss": -6.080750465393066, "global_step": 73861, "epoch": 1758} {"train_loss": -6.116563320159912, "global_step": 73862, "epoch": 1758} {"train_loss": -6.15050745010376, "global_step": 73863, "epoch": 1758} {"train_loss": -6.06191349029541, "global_step": 73864, "epoch": 1758} {"train_loss": -5.984813213348389, "global_step": 73865, "epoch": 1758} {"train_loss": -6.141043663024902, "global_step": 73866, "epoch": 1758} {"train_loss": -6.124731063842773, "global_step": 73867, "epoch": 1758} {"train_loss": -6.085794448852539, "global_step": 73868, "epoch": 1758} {"train_loss": -6.098412990570068, "global_step": 73869, "epoch": 1758} {"train_loss": -6.021932601928711, "global_step": 73870, "epoch": 1758} {"train_loss": -5.98903751373291, "global_step": 73871, "epoch": 1758} {"train_loss": -6.111902236938477, "global_step": 73872, "epoch": 1758} {"train_loss": -6.118433952331543, "global_step": 73873, "epoch": 1758} {"train_loss": -6.082680702209473, "global_step": 73874, "epoch": 1758} {"train_loss": -6.070308685302734, "global_step": 73875, "epoch": 1758} {"train_loss": -5.919487476348877, "global_step": 73876, "epoch": 1758} {"train_loss": -6.0759962399800616, "global_step": 73877, "epoch": 1758, "val_loss": 67214.390625} {"train_loss": -6.038658618927002, "global_step": 73878, "epoch": 1759} {"train_loss": -6.071529388427734, "global_step": 73879, "epoch": 1759} {"train_loss": -6.053620338439941, "global_step": 73880, "epoch": 1759} {"train_loss": -6.044378280639648, "global_step": 73881, "epoch": 1759} {"train_loss": -5.987135887145996, "global_step": 73882, "epoch": 1759} {"train_loss": -6.093703746795654, "global_step": 73883, "epoch": 1759} {"train_loss": -6.115242958068848, "global_step": 73884, "epoch": 1759} {"train_loss": -6.039018154144287, "global_step": 73885, "epoch": 1759} {"train_loss": -6.0778045654296875, "global_step": 73886, "epoch": 1759} {"train_loss": -6.044802665710449, "global_step": 73887, "epoch": 1759} {"train_loss": -6.078313827514648, "global_step": 73888, "epoch": 1759} {"train_loss": -5.995474338531494, "global_step": 73889, "epoch": 1759} {"train_loss": -6.024849891662598, "global_step": 73890, "epoch": 1759} {"train_loss": -6.005568981170654, "global_step": 73891, "epoch": 1759} {"train_loss": -6.115853309631348, "global_step": 73892, "epoch": 1759} {"train_loss": -5.949949264526367, "global_step": 73893, "epoch": 1759} {"train_loss": -6.026758193969727, "global_step": 73894, "epoch": 1759} {"train_loss": -6.061223030090332, "global_step": 73895, "epoch": 1759} {"train_loss": -5.918778419494629, "global_step": 73896, "epoch": 1759} {"train_loss": -6.067946434020996, "global_step": 73897, "epoch": 1759} {"train_loss": -5.927555084228516, "global_step": 73898, "epoch": 1759} {"train_loss": -6.087174415588379, "global_step": 73899, "epoch": 1759} {"train_loss": -6.036248207092285, "global_step": 73900, "epoch": 1759} {"train_loss": -6.009020805358887, "global_step": 73901, "epoch": 1759} {"train_loss": -6.199225902557373, "global_step": 73902, "epoch": 1759} {"train_loss": -5.940305709838867, "global_step": 73903, "epoch": 1759} {"train_loss": -6.0814208984375, "global_step": 73904, "epoch": 1759} {"train_loss": -6.0194172859191895, "global_step": 73905, "epoch": 1759} {"train_loss": -6.052529335021973, "global_step": 73906, "epoch": 1759} {"train_loss": -5.9061713218688965, "global_step": 73907, "epoch": 1759} {"train_loss": -6.040367126464844, "global_step": 73908, "epoch": 1759} {"train_loss": -6.033891201019287, "global_step": 73909, "epoch": 1759} {"train_loss": -6.170883655548096, "global_step": 73910, "epoch": 1759} {"train_loss": -6.046415328979492, "global_step": 73911, "epoch": 1759} {"train_loss": -5.8809404373168945, "global_step": 73912, "epoch": 1759} {"train_loss": -6.076663494110107, "global_step": 73913, "epoch": 1759} {"train_loss": -6.042227745056152, "global_step": 73914, "epoch": 1759} {"train_loss": -6.130542755126953, "global_step": 73915, "epoch": 1759} {"train_loss": -6.071366786956787, "global_step": 73916, "epoch": 1759} {"train_loss": -5.939764022827148, "global_step": 73917, "epoch": 1759} {"train_loss": -6.000864028930664, "global_step": 73918, "epoch": 1759} {"train_loss": -6.0353352682931085, "global_step": 73919, "epoch": 1759, "val_loss": 67368.0859375} {"train_loss": -5.992705821990967, "global_step": 73920, "epoch": 1760} {"train_loss": -6.000171661376953, "global_step": 73921, "epoch": 1760} {"train_loss": -6.059198379516602, "global_step": 73922, "epoch": 1760} {"train_loss": -6.000089645385742, "global_step": 73923, "epoch": 1760} {"train_loss": -6.072545051574707, "global_step": 73924, "epoch": 1760} {"train_loss": -6.094119071960449, "global_step": 73925, "epoch": 1760} {"train_loss": -6.050023555755615, "global_step": 73926, "epoch": 1760} {"train_loss": -6.016442775726318, "global_step": 73927, "epoch": 1760} {"train_loss": -5.97097635269165, "global_step": 73928, "epoch": 1760} {"train_loss": -5.974052429199219, "global_step": 73929, "epoch": 1760} {"train_loss": -6.0653557777404785, "global_step": 73930, "epoch": 1760} {"train_loss": -6.046131610870361, "global_step": 73931, "epoch": 1760} {"train_loss": -6.063701629638672, "global_step": 73932, "epoch": 1760} {"train_loss": -6.018063545227051, "global_step": 73933, "epoch": 1760} {"train_loss": -6.032365798950195, "global_step": 73934, "epoch": 1760} {"train_loss": -6.152225494384766, "global_step": 73935, "epoch": 1760} {"train_loss": -6.176257133483887, "global_step": 73936, "epoch": 1760} {"train_loss": -6.063556671142578, "global_step": 73937, "epoch": 1760} {"train_loss": -6.147244453430176, "global_step": 73938, "epoch": 1760} {"train_loss": -6.1587114334106445, "global_step": 73939, "epoch": 1760} {"train_loss": -5.933374404907227, "global_step": 73940, "epoch": 1760} {"train_loss": -5.943487167358398, "global_step": 73941, "epoch": 1760} {"train_loss": -6.168283462524414, "global_step": 73942, "epoch": 1760} {"train_loss": -5.9626688957214355, "global_step": 73943, "epoch": 1760} {"train_loss": -6.0434722900390625, "global_step": 73944, "epoch": 1760} {"train_loss": -6.075600624084473, "global_step": 73945, "epoch": 1760} {"train_loss": -5.887516021728516, "global_step": 73946, "epoch": 1760} {"train_loss": -6.065174579620361, "global_step": 73947, "epoch": 1760} {"train_loss": -5.921232223510742, "global_step": 73948, "epoch": 1760} {"train_loss": -5.994073867797852, "global_step": 73949, "epoch": 1760} {"train_loss": -6.068782329559326, "global_step": 73950, "epoch": 1760} {"train_loss": -5.897436618804932, "global_step": 73951, "epoch": 1760} {"train_loss": -5.946687698364258, "global_step": 73952, "epoch": 1760} {"train_loss": -5.948523998260498, "global_step": 73953, "epoch": 1760} {"train_loss": -6.077520370483398, "global_step": 73954, "epoch": 1760} {"train_loss": -6.0232977867126465, "global_step": 73955, "epoch": 1760} {"train_loss": -5.966862678527832, "global_step": 73956, "epoch": 1760} {"train_loss": -5.937573432922363, "global_step": 73957, "epoch": 1760} {"train_loss": -6.167674541473389, "global_step": 73958, "epoch": 1760} {"train_loss": -5.933145046234131, "global_step": 73959, "epoch": 1760} {"train_loss": -6.038658142089844, "global_step": 73960, "epoch": 1760} {"train_loss": -6.027256863457816, "global_step": 73961, "epoch": 1760, "val_loss": 67414.890625} {"train_loss": -5.955428600311279, "global_step": 73962, "epoch": 1761} {"train_loss": -5.933401107788086, "global_step": 73963, "epoch": 1761} {"train_loss": -6.012005805969238, "global_step": 73964, "epoch": 1761} {"train_loss": -6.013733386993408, "global_step": 73965, "epoch": 1761} {"train_loss": -6.033886909484863, "global_step": 73966, "epoch": 1761} {"train_loss": -6.007140159606934, "global_step": 73967, "epoch": 1761} {"train_loss": -6.086213111877441, "global_step": 73968, "epoch": 1761} {"train_loss": -6.091573715209961, "global_step": 73969, "epoch": 1761} {"train_loss": -6.094019889831543, "global_step": 73970, "epoch": 1761} {"train_loss": -6.056504726409912, "global_step": 73971, "epoch": 1761} {"train_loss": -6.05073356628418, "global_step": 73972, "epoch": 1761} {"train_loss": -5.9337053298950195, "global_step": 73973, "epoch": 1761} {"train_loss": -5.991738796234131, "global_step": 73974, "epoch": 1761} {"train_loss": -6.143397331237793, "global_step": 73975, "epoch": 1761} {"train_loss": -5.9435343742370605, "global_step": 73976, "epoch": 1761} {"train_loss": -6.0322113037109375, "global_step": 73977, "epoch": 1761} {"train_loss": -6.073634147644043, "global_step": 73978, "epoch": 1761} {"train_loss": -6.020239353179932, "global_step": 73979, "epoch": 1761} {"train_loss": -6.111505508422852, "global_step": 73980, "epoch": 1761} {"train_loss": -6.159483432769775, "global_step": 73981, "epoch": 1761} {"train_loss": -6.11757755279541, "global_step": 73982, "epoch": 1761} {"train_loss": -6.190891265869141, "global_step": 73983, "epoch": 1761} {"train_loss": -6.008117198944092, "global_step": 73984, "epoch": 1761} {"train_loss": -6.043677806854248, "global_step": 73985, "epoch": 1761} {"train_loss": -6.157327175140381, "global_step": 73986, "epoch": 1761} {"train_loss": -6.087308883666992, "global_step": 73987, "epoch": 1761} {"train_loss": -6.06980037689209, "global_step": 73988, "epoch": 1761} {"train_loss": -6.108041763305664, "global_step": 73989, "epoch": 1761} {"train_loss": -6.15682315826416, "global_step": 73990, "epoch": 1761} {"train_loss": -6.068849086761475, "global_step": 73991, "epoch": 1761} {"train_loss": -6.11605167388916, "global_step": 73992, "epoch": 1761} {"train_loss": -6.05754280090332, "global_step": 73993, "epoch": 1761} {"train_loss": -6.1712493896484375, "global_step": 73994, "epoch": 1761} {"train_loss": -6.106721878051758, "global_step": 73995, "epoch": 1761} {"train_loss": -6.069777965545654, "global_step": 73996, "epoch": 1761} {"train_loss": -6.036134243011475, "global_step": 73997, "epoch": 1761} {"train_loss": -6.127147197723389, "global_step": 73998, "epoch": 1761} {"train_loss": -6.177082061767578, "global_step": 73999, "epoch": 1761} {"train_loss": -5.9947099685668945, "global_step": 74000, "epoch": 1761} {"train_loss": -5.9892168045043945, "global_step": 74001, "epoch": 1761} {"train_loss": -6.009416580200195, "global_step": 74002, "epoch": 1761} {"train_loss": -6.065026544389271, "global_step": 74003, "epoch": 1761, "val_loss": 67708.484375} {"train_loss": -5.994448184967041, "global_step": 74004, "epoch": 1762} {"train_loss": -6.130924701690674, "global_step": 74005, "epoch": 1762} {"train_loss": -6.064489364624023, "global_step": 74006, "epoch": 1762} {"train_loss": -6.152945518493652, "global_step": 74007, "epoch": 1762} {"train_loss": -5.9771409034729, "global_step": 74008, "epoch": 1762} {"train_loss": -6.053433418273926, "global_step": 74009, "epoch": 1762} {"train_loss": -6.095090866088867, "global_step": 74010, "epoch": 1762} {"train_loss": -6.096469402313232, "global_step": 74011, "epoch": 1762} {"train_loss": -6.071252822875977, "global_step": 74012, "epoch": 1762} {"train_loss": -6.123088359832764, "global_step": 74013, "epoch": 1762} {"train_loss": -6.138818740844727, "global_step": 74014, "epoch": 1762} {"train_loss": -6.089046478271484, "global_step": 74015, "epoch": 1762} {"train_loss": -6.012391090393066, "global_step": 74016, "epoch": 1762} {"train_loss": -6.0612897872924805, "global_step": 74017, "epoch": 1762} {"train_loss": -5.982185363769531, "global_step": 74018, "epoch": 1762} {"train_loss": -6.0491838455200195, "global_step": 74019, "epoch": 1762} {"train_loss": -6.175589561462402, "global_step": 74020, "epoch": 1762} {"train_loss": -6.132514476776123, "global_step": 74021, "epoch": 1762} {"train_loss": -6.069289684295654, "global_step": 74022, "epoch": 1762} {"train_loss": -6.026371955871582, "global_step": 74023, "epoch": 1762} {"train_loss": -5.978784561157227, "global_step": 74024, "epoch": 1762} {"train_loss": -6.078597068786621, "global_step": 74025, "epoch": 1762} {"train_loss": -5.991936683654785, "global_step": 74026, "epoch": 1762} {"train_loss": -6.117759704589844, "global_step": 74027, "epoch": 1762} {"train_loss": -6.07602071762085, "global_step": 74028, "epoch": 1762} {"train_loss": -6.0691609382629395, "global_step": 74029, "epoch": 1762} {"train_loss": -5.931784629821777, "global_step": 74030, "epoch": 1762} {"train_loss": -6.007939338684082, "global_step": 74031, "epoch": 1762} {"train_loss": -5.962172985076904, "global_step": 74032, "epoch": 1762} {"train_loss": -5.975476264953613, "global_step": 74033, "epoch": 1762} {"train_loss": -6.180037498474121, "global_step": 74034, "epoch": 1762} {"train_loss": -6.093069076538086, "global_step": 74035, "epoch": 1762} {"train_loss": -5.878269195556641, "global_step": 74036, "epoch": 1762} {"train_loss": -5.980166435241699, "global_step": 74037, "epoch": 1762} {"train_loss": -6.099794864654541, "global_step": 74038, "epoch": 1762} {"train_loss": -6.052863597869873, "global_step": 74039, "epoch": 1762} {"train_loss": -6.003927707672119, "global_step": 74040, "epoch": 1762} {"train_loss": -5.935669422149658, "global_step": 74041, "epoch": 1762} {"train_loss": -5.9482808113098145, "global_step": 74042, "epoch": 1762} {"train_loss": -6.085236549377441, "global_step": 74043, "epoch": 1762} {"train_loss": -6.002267837524414, "global_step": 74044, "epoch": 1762} {"train_loss": -6.048212982359386, "global_step": 74045, "epoch": 1762, "val_loss": 67631.3984375} {"train_loss": -6.060519218444824, "global_step": 74046, "epoch": 1763} {"train_loss": -6.167597770690918, "global_step": 74047, "epoch": 1763} {"train_loss": -6.079024791717529, "global_step": 74048, "epoch": 1763} {"train_loss": -5.942026615142822, "global_step": 74049, "epoch": 1763} {"train_loss": -6.127926826477051, "global_step": 74050, "epoch": 1763} {"train_loss": -6.032892227172852, "global_step": 74051, "epoch": 1763} {"train_loss": -6.034920692443848, "global_step": 74052, "epoch": 1763} {"train_loss": -6.147463798522949, "global_step": 74053, "epoch": 1763} {"train_loss": -6.0281877517700195, "global_step": 74054, "epoch": 1763} {"train_loss": -6.006488800048828, "global_step": 74055, "epoch": 1763} {"train_loss": -6.018791675567627, "global_step": 74056, "epoch": 1763} {"train_loss": -6.015922546386719, "global_step": 74057, "epoch": 1763} {"train_loss": -6.055560111999512, "global_step": 74058, "epoch": 1763} {"train_loss": -6.133521556854248, "global_step": 74059, "epoch": 1763} {"train_loss": -6.054780006408691, "global_step": 74060, "epoch": 1763} {"train_loss": -6.137322902679443, "global_step": 74061, "epoch": 1763} {"train_loss": -6.0629472732543945, "global_step": 74062, "epoch": 1763} {"train_loss": -6.12502384185791, "global_step": 74063, "epoch": 1763} {"train_loss": -6.116388320922852, "global_step": 74064, "epoch": 1763} {"train_loss": -6.018084526062012, "global_step": 74065, "epoch": 1763} {"train_loss": -6.0674238204956055, "global_step": 74066, "epoch": 1763} {"train_loss": -6.120084285736084, "global_step": 74067, "epoch": 1763} {"train_loss": -6.140422821044922, "global_step": 74068, "epoch": 1763} {"train_loss": -6.069670677185059, "global_step": 74069, "epoch": 1763} {"train_loss": -5.996860504150391, "global_step": 74070, "epoch": 1763} {"train_loss": -6.061794281005859, "global_step": 74071, "epoch": 1763} {"train_loss": -6.13276481628418, "global_step": 74072, "epoch": 1763} {"train_loss": -6.087937355041504, "global_step": 74073, "epoch": 1763} {"train_loss": -6.070557594299316, "global_step": 74074, "epoch": 1763} {"train_loss": -6.113018035888672, "global_step": 74075, "epoch": 1763} {"train_loss": -6.082184791564941, "global_step": 74076, "epoch": 1763} {"train_loss": -6.097966194152832, "global_step": 74077, "epoch": 1763} {"train_loss": -6.151134014129639, "global_step": 74078, "epoch": 1763} {"train_loss": -6.000834941864014, "global_step": 74079, "epoch": 1763} {"train_loss": -6.114985466003418, "global_step": 74080, "epoch": 1763} {"train_loss": -6.024706840515137, "global_step": 74081, "epoch": 1763} {"train_loss": -6.087284088134766, "global_step": 74082, "epoch": 1763} {"train_loss": -6.1607208251953125, "global_step": 74083, "epoch": 1763} {"train_loss": -6.097031116485596, "global_step": 74084, "epoch": 1763} {"train_loss": -6.190110206604004, "global_step": 74085, "epoch": 1763} {"train_loss": -6.015841484069824, "global_step": 74086, "epoch": 1763} {"train_loss": -6.0758349895477295, "global_step": 74087, "epoch": 1763, "val_loss": 67528.9140625} {"train_loss": -6.1848859786987305, "global_step": 74088, "epoch": 1764} {"train_loss": -6.118047714233398, "global_step": 74089, "epoch": 1764} {"train_loss": -6.090106964111328, "global_step": 74090, "epoch": 1764} {"train_loss": -6.048447608947754, "global_step": 74091, "epoch": 1764} {"train_loss": -6.088733196258545, "global_step": 74092, "epoch": 1764} {"train_loss": -6.0763726234436035, "global_step": 74093, "epoch": 1764} {"train_loss": -6.05133581161499, "global_step": 74094, "epoch": 1764} {"train_loss": -6.082398414611816, "global_step": 74095, "epoch": 1764} {"train_loss": -6.088929176330566, "global_step": 74096, "epoch": 1764} {"train_loss": -5.9383320808410645, "global_step": 74097, "epoch": 1764} {"train_loss": -6.064915657043457, "global_step": 74098, "epoch": 1764} {"train_loss": -6.212026596069336, "global_step": 74099, "epoch": 1764} {"train_loss": -5.956973075866699, "global_step": 74100, "epoch": 1764} {"train_loss": -6.018553256988525, "global_step": 74101, "epoch": 1764} {"train_loss": -6.025880813598633, "global_step": 74102, "epoch": 1764} {"train_loss": -5.967796325683594, "global_step": 74103, "epoch": 1764} {"train_loss": -6.059362411499023, "global_step": 74104, "epoch": 1764} {"train_loss": -5.996454238891602, "global_step": 74105, "epoch": 1764} {"train_loss": -5.931119918823242, "global_step": 74106, "epoch": 1764} {"train_loss": -6.059808731079102, "global_step": 74107, "epoch": 1764} {"train_loss": -5.893950939178467, "global_step": 74108, "epoch": 1764} {"train_loss": -5.925614356994629, "global_step": 74109, "epoch": 1764} {"train_loss": -5.9530439376831055, "global_step": 74110, "epoch": 1764} {"train_loss": -5.948667526245117, "global_step": 74111, "epoch": 1764} {"train_loss": -6.053457260131836, "global_step": 74112, "epoch": 1764} {"train_loss": -5.9688639640808105, "global_step": 74113, "epoch": 1764} {"train_loss": -6.024280548095703, "global_step": 74114, "epoch": 1764} {"train_loss": -6.0858154296875, "global_step": 74115, "epoch": 1764} {"train_loss": -5.931002140045166, "global_step": 74116, "epoch": 1764} {"train_loss": -6.150290012359619, "global_step": 74117, "epoch": 1764} {"train_loss": -6.057472229003906, "global_step": 74118, "epoch": 1764} {"train_loss": -6.03361177444458, "global_step": 74119, "epoch": 1764} {"train_loss": -6.07492733001709, "global_step": 74120, "epoch": 1764} {"train_loss": -5.966616630554199, "global_step": 74121, "epoch": 1764} {"train_loss": -6.083118438720703, "global_step": 74122, "epoch": 1764} {"train_loss": -6.040579319000244, "global_step": 74123, "epoch": 1764} {"train_loss": -6.114017009735107, "global_step": 74124, "epoch": 1764} {"train_loss": -5.926122665405273, "global_step": 74125, "epoch": 1764} {"train_loss": -6.010140419006348, "global_step": 74126, "epoch": 1764} {"train_loss": -6.003094673156738, "global_step": 74127, "epoch": 1764} {"train_loss": -6.0037102699279785, "global_step": 74128, "epoch": 1764} {"train_loss": -6.031928766341436, "global_step": 74129, "epoch": 1764, "val_loss": 67500.21875} {"train_loss": -6.03046178817749, "global_step": 74130, "epoch": 1765} {"train_loss": -6.145860195159912, "global_step": 74131, "epoch": 1765} {"train_loss": -6.008210182189941, "global_step": 74132, "epoch": 1765} {"train_loss": -6.101437568664551, "global_step": 74133, "epoch": 1765} {"train_loss": -5.983019828796387, "global_step": 74134, "epoch": 1765} {"train_loss": -6.04410457611084, "global_step": 74135, "epoch": 1765} {"train_loss": -6.044880390167236, "global_step": 74136, "epoch": 1765} {"train_loss": -5.958276748657227, "global_step": 74137, "epoch": 1765} {"train_loss": -6.046904563903809, "global_step": 74138, "epoch": 1765} {"train_loss": -5.9288129806518555, "global_step": 74139, "epoch": 1765} {"train_loss": -5.976493835449219, "global_step": 74140, "epoch": 1765} {"train_loss": -5.970417022705078, "global_step": 74141, "epoch": 1765} {"train_loss": -6.046799659729004, "global_step": 74142, "epoch": 1765} {"train_loss": -6.000896453857422, "global_step": 74143, "epoch": 1765} {"train_loss": -5.970075607299805, "global_step": 74144, "epoch": 1765} {"train_loss": -5.963276386260986, "global_step": 74145, "epoch": 1765} {"train_loss": -6.151092529296875, "global_step": 74146, "epoch": 1765} {"train_loss": -6.048048496246338, "global_step": 74147, "epoch": 1765} {"train_loss": -6.0473175048828125, "global_step": 74148, "epoch": 1765} {"train_loss": -6.088016986846924, "global_step": 74149, "epoch": 1765} {"train_loss": -6.0312700271606445, "global_step": 74150, "epoch": 1765} {"train_loss": -6.125277519226074, "global_step": 74151, "epoch": 1765} {"train_loss": -5.9763593673706055, "global_step": 74152, "epoch": 1765} {"train_loss": -6.185876846313477, "global_step": 74153, "epoch": 1765} {"train_loss": -5.90457010269165, "global_step": 74154, "epoch": 1765} {"train_loss": -6.188973426818848, "global_step": 74155, "epoch": 1765} {"train_loss": -6.105988502502441, "global_step": 74156, "epoch": 1765} {"train_loss": -6.009442329406738, "global_step": 74157, "epoch": 1765} {"train_loss": -6.045385360717773, "global_step": 74158, "epoch": 1765} {"train_loss": -6.091649055480957, "global_step": 74159, "epoch": 1765} {"train_loss": -5.933093070983887, "global_step": 74160, "epoch": 1765} {"train_loss": -6.136923789978027, "global_step": 74161, "epoch": 1765} {"train_loss": -6.0486555099487305, "global_step": 74162, "epoch": 1765} {"train_loss": -6.074440002441406, "global_step": 74163, "epoch": 1765} {"train_loss": -5.95847225189209, "global_step": 74164, "epoch": 1765} {"train_loss": -6.152948379516602, "global_step": 74165, "epoch": 1765} {"train_loss": -6.004578590393066, "global_step": 74166, "epoch": 1765} {"train_loss": -6.133967399597168, "global_step": 74167, "epoch": 1765} {"train_loss": -6.118217468261719, "global_step": 74168, "epoch": 1765} {"train_loss": -6.059009075164795, "global_step": 74169, "epoch": 1765} {"train_loss": -6.056632995605469, "global_step": 74170, "epoch": 1765} {"train_loss": -6.046851090022495, "global_step": 74171, "epoch": 1765, "val_loss": 67388.9140625} {"train_loss": -6.022170543670654, "global_step": 74172, "epoch": 1766} {"train_loss": -5.927226543426514, "global_step": 74173, "epoch": 1766} {"train_loss": -5.989240646362305, "global_step": 74174, "epoch": 1766} {"train_loss": -6.145296573638916, "global_step": 74175, "epoch": 1766} {"train_loss": -5.890804290771484, "global_step": 74176, "epoch": 1766} {"train_loss": -5.896030426025391, "global_step": 74177, "epoch": 1766} {"train_loss": -5.949796676635742, "global_step": 74178, "epoch": 1766} {"train_loss": -6.145874500274658, "global_step": 74179, "epoch": 1766} {"train_loss": -6.073556900024414, "global_step": 74180, "epoch": 1766} {"train_loss": -6.049531936645508, "global_step": 74181, "epoch": 1766} {"train_loss": -6.046426296234131, "global_step": 74182, "epoch": 1766} {"train_loss": -6.003412246704102, "global_step": 74183, "epoch": 1766} {"train_loss": -6.047601222991943, "global_step": 74184, "epoch": 1766} {"train_loss": -6.100576400756836, "global_step": 74185, "epoch": 1766} {"train_loss": -6.092044353485107, "global_step": 74186, "epoch": 1766} {"train_loss": -6.013133525848389, "global_step": 74187, "epoch": 1766} {"train_loss": -6.1459527015686035, "global_step": 74188, "epoch": 1766} {"train_loss": -6.157697677612305, "global_step": 74189, "epoch": 1766} {"train_loss": -5.98784065246582, "global_step": 74190, "epoch": 1766} {"train_loss": -6.0637407302856445, "global_step": 74191, "epoch": 1766} {"train_loss": -6.0135111808776855, "global_step": 74192, "epoch": 1766} {"train_loss": -5.992216110229492, "global_step": 74193, "epoch": 1766} {"train_loss": -6.179351806640625, "global_step": 74194, "epoch": 1766} {"train_loss": -5.963192462921143, "global_step": 74195, "epoch": 1766} {"train_loss": -6.013082504272461, "global_step": 74196, "epoch": 1766} {"train_loss": -6.064784526824951, "global_step": 74197, "epoch": 1766} {"train_loss": -5.978667259216309, "global_step": 74198, "epoch": 1766} {"train_loss": -6.052835464477539, "global_step": 74199, "epoch": 1766} {"train_loss": -6.133631706237793, "global_step": 74200, "epoch": 1766} {"train_loss": -6.14369010925293, "global_step": 74201, "epoch": 1766} {"train_loss": -5.977313041687012, "global_step": 74202, "epoch": 1766} {"train_loss": -6.041114807128906, "global_step": 74203, "epoch": 1766} {"train_loss": -6.016449928283691, "global_step": 74204, "epoch": 1766} {"train_loss": -5.969079494476318, "global_step": 74205, "epoch": 1766} {"train_loss": -6.133825302124023, "global_step": 74206, "epoch": 1766} {"train_loss": -6.163900375366211, "global_step": 74207, "epoch": 1766} {"train_loss": -5.99976921081543, "global_step": 74208, "epoch": 1766} {"train_loss": -6.072894096374512, "global_step": 74209, "epoch": 1766} {"train_loss": -5.980305194854736, "global_step": 74210, "epoch": 1766} {"train_loss": -6.090725898742676, "global_step": 74211, "epoch": 1766} {"train_loss": -6.075899124145508, "global_step": 74212, "epoch": 1766} {"train_loss": -6.0455101898738315, "global_step": 74213, "epoch": 1766, "val_loss": 67297.765625} {"train_loss": -6.101463794708252, "global_step": 74214, "epoch": 1767} {"train_loss": -6.044396877288818, "global_step": 74215, "epoch": 1767} {"train_loss": -6.058905601501465, "global_step": 74216, "epoch": 1767} {"train_loss": -6.081472873687744, "global_step": 74217, "epoch": 1767} {"train_loss": -6.040239334106445, "global_step": 74218, "epoch": 1767} {"train_loss": -6.079744815826416, "global_step": 74219, "epoch": 1767} {"train_loss": -6.0319976806640625, "global_step": 74220, "epoch": 1767} {"train_loss": -6.117003917694092, "global_step": 74221, "epoch": 1767} {"train_loss": -6.1512451171875, "global_step": 74222, "epoch": 1767} {"train_loss": -6.087689399719238, "global_step": 74223, "epoch": 1767} {"train_loss": -6.040512561798096, "global_step": 74224, "epoch": 1767} {"train_loss": -6.015641212463379, "global_step": 74225, "epoch": 1767} {"train_loss": -6.101474761962891, "global_step": 74226, "epoch": 1767} {"train_loss": -6.109096527099609, "global_step": 74227, "epoch": 1767} {"train_loss": -6.130609035491943, "global_step": 74228, "epoch": 1767} {"train_loss": -6.0598626136779785, "global_step": 74229, "epoch": 1767} {"train_loss": -6.124597549438477, "global_step": 74230, "epoch": 1767} {"train_loss": -6.152314186096191, "global_step": 74231, "epoch": 1767} {"train_loss": -6.061285495758057, "global_step": 74232, "epoch": 1767} {"train_loss": -5.895899772644043, "global_step": 74233, "epoch": 1767} {"train_loss": -6.055567264556885, "global_step": 74234, "epoch": 1767} {"train_loss": -5.9633893966674805, "global_step": 74235, "epoch": 1767} {"train_loss": -6.073634147644043, "global_step": 74236, "epoch": 1767} {"train_loss": -6.009590148925781, "global_step": 74237, "epoch": 1767} {"train_loss": -6.0239362716674805, "global_step": 74238, "epoch": 1767} {"train_loss": -6.006143093109131, "global_step": 74239, "epoch": 1767} {"train_loss": -6.103619575500488, "global_step": 74240, "epoch": 1767} {"train_loss": -6.005889415740967, "global_step": 74241, "epoch": 1767} {"train_loss": -6.035994529724121, "global_step": 74242, "epoch": 1767} {"train_loss": -6.018296241760254, "global_step": 74243, "epoch": 1767} {"train_loss": -6.02479362487793, "global_step": 74244, "epoch": 1767} {"train_loss": -5.952507972717285, "global_step": 74245, "epoch": 1767} {"train_loss": -6.045679092407227, "global_step": 74246, "epoch": 1767} {"train_loss": -6.145349502563477, "global_step": 74247, "epoch": 1767} {"train_loss": -6.141927719116211, "global_step": 74248, "epoch": 1767} {"train_loss": -6.131947040557861, "global_step": 74249, "epoch": 1767} {"train_loss": -6.048308372497559, "global_step": 74250, "epoch": 1767} {"train_loss": -6.048588752746582, "global_step": 74251, "epoch": 1767} {"train_loss": -6.224695205688477, "global_step": 74252, "epoch": 1767} {"train_loss": -6.088461875915527, "global_step": 74253, "epoch": 1767} {"train_loss": -6.0121941566467285, "global_step": 74254, "epoch": 1767} {"train_loss": -6.061652251652309, "global_step": 74255, "epoch": 1767, "val_loss": 67399.1328125} {"train_loss": -6.145421028137207, "global_step": 74256, "epoch": 1768} {"train_loss": -6.131265640258789, "global_step": 74257, "epoch": 1768} {"train_loss": -6.017237663269043, "global_step": 74258, "epoch": 1768} {"train_loss": -6.059900283813477, "global_step": 74259, "epoch": 1768} {"train_loss": -6.004040718078613, "global_step": 74260, "epoch": 1768} {"train_loss": -6.101058483123779, "global_step": 74261, "epoch": 1768} {"train_loss": -5.996333599090576, "global_step": 74262, "epoch": 1768} {"train_loss": -5.956986427307129, "global_step": 74263, "epoch": 1768} {"train_loss": -5.964820861816406, "global_step": 74264, "epoch": 1768} {"train_loss": -5.929683685302734, "global_step": 74265, "epoch": 1768} {"train_loss": -6.223763465881348, "global_step": 74266, "epoch": 1768} {"train_loss": -6.107388973236084, "global_step": 74267, "epoch": 1768} {"train_loss": -6.106184482574463, "global_step": 74268, "epoch": 1768} {"train_loss": -6.019089698791504, "global_step": 74269, "epoch": 1768} {"train_loss": -6.0430192947387695, "global_step": 74270, "epoch": 1768} {"train_loss": -6.081149101257324, "global_step": 74271, "epoch": 1768} {"train_loss": -6.075175762176514, "global_step": 74272, "epoch": 1768} {"train_loss": -6.053947448730469, "global_step": 74273, "epoch": 1768} {"train_loss": -6.0101704597473145, "global_step": 74274, "epoch": 1768} {"train_loss": -6.114559173583984, "global_step": 74275, "epoch": 1768} {"train_loss": -6.058004379272461, "global_step": 74276, "epoch": 1768} {"train_loss": -6.038471221923828, "global_step": 74277, "epoch": 1768} {"train_loss": -6.138932228088379, "global_step": 74278, "epoch": 1768} {"train_loss": -6.088251113891602, "global_step": 74279, "epoch": 1768} {"train_loss": -5.97734260559082, "global_step": 74280, "epoch": 1768} {"train_loss": -5.978115081787109, "global_step": 74281, "epoch": 1768} {"train_loss": -6.1901092529296875, "global_step": 74282, "epoch": 1768} {"train_loss": -6.016790390014648, "global_step": 74283, "epoch": 1768} {"train_loss": -5.972683906555176, "global_step": 74284, "epoch": 1768} {"train_loss": -5.9987359046936035, "global_step": 74285, "epoch": 1768} {"train_loss": -6.099546432495117, "global_step": 74286, "epoch": 1768} {"train_loss": -6.089705944061279, "global_step": 74287, "epoch": 1768} {"train_loss": -6.14995813369751, "global_step": 74288, "epoch": 1768} {"train_loss": -5.957914352416992, "global_step": 74289, "epoch": 1768} {"train_loss": -6.085810661315918, "global_step": 74290, "epoch": 1768} {"train_loss": -5.996774673461914, "global_step": 74291, "epoch": 1768} {"train_loss": -6.082859516143799, "global_step": 74292, "epoch": 1768} {"train_loss": -6.108032703399658, "global_step": 74293, "epoch": 1768} {"train_loss": -5.976048946380615, "global_step": 74294, "epoch": 1768} {"train_loss": -5.917847633361816, "global_step": 74295, "epoch": 1768} {"train_loss": -6.119699478149414, "global_step": 74296, "epoch": 1768} {"train_loss": -6.055087350663685, "global_step": 74297, "epoch": 1768, "val_loss": 67099.8046875} {"train_loss": -6.160163402557373, "global_step": 74298, "epoch": 1769} {"train_loss": -5.990206241607666, "global_step": 74299, "epoch": 1769} {"train_loss": -6.007089138031006, "global_step": 74300, "epoch": 1769} {"train_loss": -6.124006748199463, "global_step": 74301, "epoch": 1769} {"train_loss": -6.033974647521973, "global_step": 74302, "epoch": 1769} {"train_loss": -5.99869441986084, "global_step": 74303, "epoch": 1769} {"train_loss": -5.998458385467529, "global_step": 74304, "epoch": 1769} {"train_loss": -6.1577677726745605, "global_step": 74305, "epoch": 1769} {"train_loss": -6.139512062072754, "global_step": 74306, "epoch": 1769} {"train_loss": -5.922473430633545, "global_step": 74307, "epoch": 1769} {"train_loss": -6.1637115478515625, "global_step": 74308, "epoch": 1769} {"train_loss": -6.011449813842773, "global_step": 74309, "epoch": 1769} {"train_loss": -6.031323432922363, "global_step": 74310, "epoch": 1769} {"train_loss": -6.08394718170166, "global_step": 74311, "epoch": 1769} {"train_loss": -6.067251205444336, "global_step": 74312, "epoch": 1769} {"train_loss": -6.193635940551758, "global_step": 74313, "epoch": 1769} {"train_loss": -6.093512535095215, "global_step": 74314, "epoch": 1769} {"train_loss": -6.047975540161133, "global_step": 74315, "epoch": 1769} {"train_loss": -5.930611610412598, "global_step": 74316, "epoch": 1769} {"train_loss": -6.0190110206604, "global_step": 74317, "epoch": 1769} {"train_loss": -6.125078201293945, "global_step": 74318, "epoch": 1769} {"train_loss": -5.989174842834473, "global_step": 74319, "epoch": 1769} {"train_loss": -6.121222496032715, "global_step": 74320, "epoch": 1769} {"train_loss": -6.084697723388672, "global_step": 74321, "epoch": 1769} {"train_loss": -6.000942707061768, "global_step": 74322, "epoch": 1769} {"train_loss": -6.162898063659668, "global_step": 74323, "epoch": 1769} {"train_loss": -6.07318639755249, "global_step": 74324, "epoch": 1769} {"train_loss": -5.9330525398254395, "global_step": 74325, "epoch": 1769} {"train_loss": -6.116899013519287, "global_step": 74326, "epoch": 1769} {"train_loss": -6.110964775085449, "global_step": 74327, "epoch": 1769} {"train_loss": -6.012860298156738, "global_step": 74328, "epoch": 1769} {"train_loss": -6.079665184020996, "global_step": 74329, "epoch": 1769} {"train_loss": -6.113563060760498, "global_step": 74330, "epoch": 1769} {"train_loss": -6.055172443389893, "global_step": 74331, "epoch": 1769} {"train_loss": -6.125650405883789, "global_step": 74332, "epoch": 1769} {"train_loss": -6.0449910163879395, "global_step": 74333, "epoch": 1769} {"train_loss": -6.060762405395508, "global_step": 74334, "epoch": 1769} {"train_loss": -6.019909858703613, "global_step": 74335, "epoch": 1769} {"train_loss": -5.963768005371094, "global_step": 74336, "epoch": 1769} {"train_loss": -6.086960792541504, "global_step": 74337, "epoch": 1769} {"train_loss": -6.068941593170166, "global_step": 74338, "epoch": 1769} {"train_loss": -6.057879016512916, "global_step": 74339, "epoch": 1769, "val_loss": 67294.0625} {"train_loss": -6.027788162231445, "global_step": 74340, "epoch": 1770} {"train_loss": -5.967566013336182, "global_step": 74341, "epoch": 1770} {"train_loss": -6.061135292053223, "global_step": 74342, "epoch": 1770} {"train_loss": -6.034519195556641, "global_step": 74343, "epoch": 1770} {"train_loss": -6.015993118286133, "global_step": 74344, "epoch": 1770} {"train_loss": -6.139916896820068, "global_step": 74345, "epoch": 1770} {"train_loss": -6.13965368270874, "global_step": 74346, "epoch": 1770} {"train_loss": -6.134535789489746, "global_step": 74347, "epoch": 1770} {"train_loss": -5.992160797119141, "global_step": 74348, "epoch": 1770} {"train_loss": -6.054976463317871, "global_step": 74349, "epoch": 1770} {"train_loss": -6.0479278564453125, "global_step": 74350, "epoch": 1770} {"train_loss": -6.157179832458496, "global_step": 74351, "epoch": 1770} {"train_loss": -6.036299705505371, "global_step": 74352, "epoch": 1770} {"train_loss": -6.1171875, "global_step": 74353, "epoch": 1770} {"train_loss": -6.018161773681641, "global_step": 74354, "epoch": 1770} {"train_loss": -6.027949810028076, "global_step": 74355, "epoch": 1770} {"train_loss": -5.8978071212768555, "global_step": 74356, "epoch": 1770} {"train_loss": -5.940511703491211, "global_step": 74357, "epoch": 1770} {"train_loss": -5.859606742858887, "global_step": 74358, "epoch": 1770} {"train_loss": -5.945949554443359, "global_step": 74359, "epoch": 1770} {"train_loss": -6.022861957550049, "global_step": 74360, "epoch": 1770} {"train_loss": -5.778654098510742, "global_step": 74361, "epoch": 1770} {"train_loss": -6.0755295753479, "global_step": 74362, "epoch": 1770} {"train_loss": -5.900811195373535, "global_step": 74363, "epoch": 1770} {"train_loss": -6.03105354309082, "global_step": 74364, "epoch": 1770} {"train_loss": -6.055908679962158, "global_step": 74365, "epoch": 1770} {"train_loss": -5.940672874450684, "global_step": 74366, "epoch": 1770} {"train_loss": -5.844999313354492, "global_step": 74367, "epoch": 1770} {"train_loss": -6.177999973297119, "global_step": 74368, "epoch": 1770} {"train_loss": -6.035957336425781, "global_step": 74369, "epoch": 1770} {"train_loss": -5.921300888061523, "global_step": 74370, "epoch": 1770} {"train_loss": -5.853434085845947, "global_step": 74371, "epoch": 1770} {"train_loss": -6.141388893127441, "global_step": 74372, "epoch": 1770} {"train_loss": -6.102324485778809, "global_step": 74373, "epoch": 1770} {"train_loss": -6.127676010131836, "global_step": 74374, "epoch": 1770} {"train_loss": -6.106546401977539, "global_step": 74375, "epoch": 1770} {"train_loss": -6.017083168029785, "global_step": 74376, "epoch": 1770} {"train_loss": -6.0540771484375, "global_step": 74377, "epoch": 1770} {"train_loss": -5.998418807983398, "global_step": 74378, "epoch": 1770} {"train_loss": -6.034066677093506, "global_step": 74379, "epoch": 1770} {"train_loss": -5.999911785125732, "global_step": 74380, "epoch": 1770} {"train_loss": -6.023104735783169, "global_step": 74381, "epoch": 1770, "val_loss": 67135.515625} {"train_loss": -6.070250511169434, "global_step": 74382, "epoch": 1771} {"train_loss": -6.218377590179443, "global_step": 74383, "epoch": 1771} {"train_loss": -6.107827186584473, "global_step": 74384, "epoch": 1771} {"train_loss": -6.122298240661621, "global_step": 74385, "epoch": 1771} {"train_loss": -6.112529754638672, "global_step": 74386, "epoch": 1771} {"train_loss": -6.119045257568359, "global_step": 74387, "epoch": 1771} {"train_loss": -6.122270584106445, "global_step": 74388, "epoch": 1771} {"train_loss": -6.020087242126465, "global_step": 74389, "epoch": 1771} {"train_loss": -5.992396831512451, "global_step": 74390, "epoch": 1771} {"train_loss": -6.071016788482666, "global_step": 74391, "epoch": 1771} {"train_loss": -6.002359390258789, "global_step": 74392, "epoch": 1771} {"train_loss": -6.100628852844238, "global_step": 74393, "epoch": 1771} {"train_loss": -6.123790264129639, "global_step": 74394, "epoch": 1771} {"train_loss": -6.0277814865112305, "global_step": 74395, "epoch": 1771} {"train_loss": -6.065802097320557, "global_step": 74396, "epoch": 1771} {"train_loss": -5.97036075592041, "global_step": 74397, "epoch": 1771} {"train_loss": -6.112912178039551, "global_step": 74398, "epoch": 1771} {"train_loss": -6.195411682128906, "global_step": 74399, "epoch": 1771} {"train_loss": -6.044613361358643, "global_step": 74400, "epoch": 1771} {"train_loss": -6.0073347091674805, "global_step": 74401, "epoch": 1771} {"train_loss": -6.027298450469971, "global_step": 74402, "epoch": 1771} {"train_loss": -6.073465824127197, "global_step": 74403, "epoch": 1771} {"train_loss": -6.102126121520996, "global_step": 74404, "epoch": 1771} {"train_loss": -5.974498271942139, "global_step": 74405, "epoch": 1771} {"train_loss": -6.069553852081299, "global_step": 74406, "epoch": 1771} {"train_loss": -6.0114030838012695, "global_step": 74407, "epoch": 1771} {"train_loss": -6.027113914489746, "global_step": 74408, "epoch": 1771} {"train_loss": -6.010765075683594, "global_step": 74409, "epoch": 1771} {"train_loss": -5.976913928985596, "global_step": 74410, "epoch": 1771} {"train_loss": -6.013896942138672, "global_step": 74411, "epoch": 1771} {"train_loss": -5.984845161437988, "global_step": 74412, "epoch": 1771} {"train_loss": -6.038824081420898, "global_step": 74413, "epoch": 1771} {"train_loss": -5.944450378417969, "global_step": 74414, "epoch": 1771} {"train_loss": -6.0985894203186035, "global_step": 74415, "epoch": 1771} {"train_loss": -6.092634201049805, "global_step": 74416, "epoch": 1771} {"train_loss": -5.967632293701172, "global_step": 74417, "epoch": 1771} {"train_loss": -6.112698554992676, "global_step": 74418, "epoch": 1771} {"train_loss": -5.988076210021973, "global_step": 74419, "epoch": 1771} {"train_loss": -6.054729461669922, "global_step": 74420, "epoch": 1771} {"train_loss": -6.075679779052734, "global_step": 74421, "epoch": 1771} {"train_loss": -6.070719242095947, "global_step": 74422, "epoch": 1771} {"train_loss": -6.056965816588629, "global_step": 74423, "epoch": 1771, "val_loss": 67315.8828125} {"train_loss": -6.200689315795898, "global_step": 74424, "epoch": 1772} {"train_loss": -6.051787376403809, "global_step": 74425, "epoch": 1772} {"train_loss": -6.168423652648926, "global_step": 74426, "epoch": 1772} {"train_loss": -6.112569808959961, "global_step": 74427, "epoch": 1772} {"train_loss": -6.022151470184326, "global_step": 74428, "epoch": 1772} {"train_loss": -6.203600883483887, "global_step": 74429, "epoch": 1772} {"train_loss": -6.018448829650879, "global_step": 74430, "epoch": 1772} {"train_loss": -6.099825382232666, "global_step": 74431, "epoch": 1772} {"train_loss": -6.08670711517334, "global_step": 74432, "epoch": 1772} {"train_loss": -6.208252429962158, "global_step": 74433, "epoch": 1772} {"train_loss": -6.1585164070129395, "global_step": 74434, "epoch": 1772} {"train_loss": -6.106680870056152, "global_step": 74435, "epoch": 1772} {"train_loss": -6.012152671813965, "global_step": 74436, "epoch": 1772} {"train_loss": -6.177708625793457, "global_step": 74437, "epoch": 1772} {"train_loss": -6.062561511993408, "global_step": 74438, "epoch": 1772} {"train_loss": -6.10428524017334, "global_step": 74439, "epoch": 1772} {"train_loss": -6.166278839111328, "global_step": 74440, "epoch": 1772} {"train_loss": -5.9517107009887695, "global_step": 74441, "epoch": 1772} {"train_loss": -5.975040435791016, "global_step": 74442, "epoch": 1772} {"train_loss": -6.103191375732422, "global_step": 74443, "epoch": 1772} {"train_loss": -6.050917625427246, "global_step": 74444, "epoch": 1772} {"train_loss": -6.02036190032959, "global_step": 74445, "epoch": 1772} {"train_loss": -5.924439430236816, "global_step": 74446, "epoch": 1772} {"train_loss": -6.071903705596924, "global_step": 74447, "epoch": 1772} {"train_loss": -6.132296085357666, "global_step": 74448, "epoch": 1772} {"train_loss": -6.117650985717773, "global_step": 74449, "epoch": 1772} {"train_loss": -6.066188335418701, "global_step": 74450, "epoch": 1772} {"train_loss": -6.114382743835449, "global_step": 74451, "epoch": 1772} {"train_loss": -5.912571907043457, "global_step": 74452, "epoch": 1772} {"train_loss": -6.064071178436279, "global_step": 74453, "epoch": 1772} {"train_loss": -5.973742961883545, "global_step": 74454, "epoch": 1772} {"train_loss": -6.100269794464111, "global_step": 74455, "epoch": 1772} {"train_loss": -6.065451145172119, "global_step": 74456, "epoch": 1772} {"train_loss": -6.04417610168457, "global_step": 74457, "epoch": 1772} {"train_loss": -6.001800537109375, "global_step": 74458, "epoch": 1772} {"train_loss": -5.970917701721191, "global_step": 74459, "epoch": 1772} {"train_loss": -6.129791259765625, "global_step": 74460, "epoch": 1772} {"train_loss": -6.010621070861816, "global_step": 74461, "epoch": 1772} {"train_loss": -5.956470966339111, "global_step": 74462, "epoch": 1772} {"train_loss": -6.1138787269592285, "global_step": 74463, "epoch": 1772} {"train_loss": -6.051534175872803, "global_step": 74464, "epoch": 1772} {"train_loss": -6.0691085656483965, "global_step": 74465, "epoch": 1772, "val_loss": 67287.390625} {"train_loss": -5.943201541900635, "global_step": 74466, "epoch": 1773} {"train_loss": -6.03120756149292, "global_step": 74467, "epoch": 1773} {"train_loss": -6.030191421508789, "global_step": 74468, "epoch": 1773} {"train_loss": -6.086409568786621, "global_step": 74469, "epoch": 1773} {"train_loss": -5.987510681152344, "global_step": 74470, "epoch": 1773} {"train_loss": -6.031908988952637, "global_step": 74471, "epoch": 1773} {"train_loss": -6.143799781799316, "global_step": 74472, "epoch": 1773} {"train_loss": -6.075446128845215, "global_step": 74473, "epoch": 1773} {"train_loss": -5.961040496826172, "global_step": 74474, "epoch": 1773} {"train_loss": -6.14442777633667, "global_step": 74475, "epoch": 1773} {"train_loss": -6.114708423614502, "global_step": 74476, "epoch": 1773} {"train_loss": -6.033849716186523, "global_step": 74477, "epoch": 1773} {"train_loss": -5.99949312210083, "global_step": 74478, "epoch": 1773} {"train_loss": -6.072139739990234, "global_step": 74479, "epoch": 1773} {"train_loss": -6.081323623657227, "global_step": 74480, "epoch": 1773} {"train_loss": -6.06276798248291, "global_step": 74481, "epoch": 1773} {"train_loss": -6.076269149780273, "global_step": 74482, "epoch": 1773} {"train_loss": -6.0342183113098145, "global_step": 74483, "epoch": 1773} {"train_loss": -6.0228376388549805, "global_step": 74484, "epoch": 1773} {"train_loss": -6.044108867645264, "global_step": 74485, "epoch": 1773} {"train_loss": -6.111082077026367, "global_step": 74486, "epoch": 1773} {"train_loss": -6.092167854309082, "global_step": 74487, "epoch": 1773} {"train_loss": -6.066716194152832, "global_step": 74488, "epoch": 1773} {"train_loss": -6.065102577209473, "global_step": 74489, "epoch": 1773} {"train_loss": -6.158173561096191, "global_step": 74490, "epoch": 1773} {"train_loss": -5.9455389976501465, "global_step": 74491, "epoch": 1773} {"train_loss": -6.144372463226318, "global_step": 74492, "epoch": 1773} {"train_loss": -6.107143878936768, "global_step": 74493, "epoch": 1773} {"train_loss": -6.038320541381836, "global_step": 74494, "epoch": 1773} {"train_loss": -6.113570213317871, "global_step": 74495, "epoch": 1773} {"train_loss": -6.0087385177612305, "global_step": 74496, "epoch": 1773} {"train_loss": -6.1527605056762695, "global_step": 74497, "epoch": 1773} {"train_loss": -6.143146991729736, "global_step": 74498, "epoch": 1773} {"train_loss": -5.986032485961914, "global_step": 74499, "epoch": 1773} {"train_loss": -6.067786693572998, "global_step": 74500, "epoch": 1773} {"train_loss": -6.081491947174072, "global_step": 74501, "epoch": 1773} {"train_loss": -6.099850654602051, "global_step": 74502, "epoch": 1773} {"train_loss": -6.116949081420898, "global_step": 74503, "epoch": 1773} {"train_loss": -6.1273579597473145, "global_step": 74504, "epoch": 1773} {"train_loss": -6.140458583831787, "global_step": 74505, "epoch": 1773} {"train_loss": -6.114245891571045, "global_step": 74506, "epoch": 1773} {"train_loss": -6.070167938868205, "global_step": 74507, "epoch": 1773, "val_loss": 67375.75} {"train_loss": -6.180903434753418, "global_step": 74508, "epoch": 1774} {"train_loss": -5.99934196472168, "global_step": 74509, "epoch": 1774} {"train_loss": -6.044527053833008, "global_step": 74510, "epoch": 1774} {"train_loss": -6.028168678283691, "global_step": 74511, "epoch": 1774} {"train_loss": -6.001656532287598, "global_step": 74512, "epoch": 1774} {"train_loss": -5.983436584472656, "global_step": 74513, "epoch": 1774} {"train_loss": -6.012942790985107, "global_step": 74514, "epoch": 1774} {"train_loss": -6.0641188621521, "global_step": 74515, "epoch": 1774} {"train_loss": -6.053499698638916, "global_step": 74516, "epoch": 1774} {"train_loss": -5.975553512573242, "global_step": 74517, "epoch": 1774} {"train_loss": -5.945492744445801, "global_step": 74518, "epoch": 1774} {"train_loss": -5.903355598449707, "global_step": 74519, "epoch": 1774} {"train_loss": -6.146005630493164, "global_step": 74520, "epoch": 1774} {"train_loss": -5.884263515472412, "global_step": 74521, "epoch": 1774} {"train_loss": -6.082063674926758, "global_step": 74522, "epoch": 1774} {"train_loss": -6.040711402893066, "global_step": 74523, "epoch": 1774} {"train_loss": -6.085411071777344, "global_step": 74524, "epoch": 1774} {"train_loss": -6.0073723793029785, "global_step": 74525, "epoch": 1774} {"train_loss": -6.022992134094238, "global_step": 74526, "epoch": 1774} {"train_loss": -6.1600799560546875, "global_step": 74527, "epoch": 1774} {"train_loss": -6.138895034790039, "global_step": 74528, "epoch": 1774} {"train_loss": -6.013167381286621, "global_step": 74529, "epoch": 1774} {"train_loss": -6.072385787963867, "global_step": 74530, "epoch": 1774} {"train_loss": -5.991302490234375, "global_step": 74531, "epoch": 1774} {"train_loss": -6.161923885345459, "global_step": 74532, "epoch": 1774} {"train_loss": -6.020927429199219, "global_step": 74533, "epoch": 1774} {"train_loss": -6.0682172775268555, "global_step": 74534, "epoch": 1774} {"train_loss": -6.12009334564209, "global_step": 74535, "epoch": 1774} {"train_loss": -6.097193717956543, "global_step": 74536, "epoch": 1774} {"train_loss": -6.143243312835693, "global_step": 74537, "epoch": 1774} {"train_loss": -6.114511966705322, "global_step": 74538, "epoch": 1774} {"train_loss": -6.023632526397705, "global_step": 74539, "epoch": 1774} {"train_loss": -6.085301399230957, "global_step": 74540, "epoch": 1774} {"train_loss": -6.005618095397949, "global_step": 74541, "epoch": 1774} {"train_loss": -6.054574489593506, "global_step": 74542, "epoch": 1774} {"train_loss": -6.025338649749756, "global_step": 74543, "epoch": 1774} {"train_loss": -6.100974082946777, "global_step": 74544, "epoch": 1774} {"train_loss": -6.044207572937012, "global_step": 74545, "epoch": 1774} {"train_loss": -6.113969802856445, "global_step": 74546, "epoch": 1774} {"train_loss": -6.1119561195373535, "global_step": 74547, "epoch": 1774} {"train_loss": -5.98572301864624, "global_step": 74548, "epoch": 1774} {"train_loss": -6.047769864400228, "global_step": 74549, "epoch": 1774, "val_loss": 67439.8359375} {"train_loss": -5.952691078186035, "global_step": 74550, "epoch": 1775} {"train_loss": -6.103970050811768, "global_step": 74551, "epoch": 1775} {"train_loss": -6.089674472808838, "global_step": 74552, "epoch": 1775} {"train_loss": -6.088939666748047, "global_step": 74553, "epoch": 1775} {"train_loss": -6.0078535079956055, "global_step": 74554, "epoch": 1775} {"train_loss": -6.054590702056885, "global_step": 74555, "epoch": 1775} {"train_loss": -6.024085998535156, "global_step": 74556, "epoch": 1775} {"train_loss": -5.997723579406738, "global_step": 74557, "epoch": 1775} {"train_loss": -6.189365386962891, "global_step": 74558, "epoch": 1775} {"train_loss": -5.9924635887146, "global_step": 74559, "epoch": 1775} {"train_loss": -6.073716163635254, "global_step": 74560, "epoch": 1775} {"train_loss": -6.136710166931152, "global_step": 74561, "epoch": 1775} {"train_loss": -6.135689735412598, "global_step": 74562, "epoch": 1775} {"train_loss": -6.116544246673584, "global_step": 74563, "epoch": 1775} {"train_loss": -6.092294692993164, "global_step": 74564, "epoch": 1775} {"train_loss": -6.110893249511719, "global_step": 74565, "epoch": 1775} {"train_loss": -6.146957874298096, "global_step": 74566, "epoch": 1775} {"train_loss": -6.132116794586182, "global_step": 74567, "epoch": 1775} {"train_loss": -6.079888820648193, "global_step": 74568, "epoch": 1775} {"train_loss": -6.120538711547852, "global_step": 74569, "epoch": 1775} {"train_loss": -6.054932594299316, "global_step": 74570, "epoch": 1775} {"train_loss": -6.13933801651001, "global_step": 74571, "epoch": 1775} {"train_loss": -5.968506813049316, "global_step": 74572, "epoch": 1775} {"train_loss": -6.096970081329346, "global_step": 74573, "epoch": 1775} {"train_loss": -5.978950023651123, "global_step": 74574, "epoch": 1775} {"train_loss": -6.063114166259766, "global_step": 74575, "epoch": 1775} {"train_loss": -6.0819091796875, "global_step": 74576, "epoch": 1775} {"train_loss": -6.205052375793457, "global_step": 74577, "epoch": 1775} {"train_loss": -6.017421245574951, "global_step": 74578, "epoch": 1775} {"train_loss": -6.000317573547363, "global_step": 74579, "epoch": 1775} {"train_loss": -6.107896327972412, "global_step": 74580, "epoch": 1775} {"train_loss": -6.111743927001953, "global_step": 74581, "epoch": 1775} {"train_loss": -6.129086494445801, "global_step": 74582, "epoch": 1775} {"train_loss": -6.201258659362793, "global_step": 74583, "epoch": 1775} {"train_loss": -6.028695106506348, "global_step": 74584, "epoch": 1775} {"train_loss": -6.016408920288086, "global_step": 74585, "epoch": 1775} {"train_loss": -6.075085639953613, "global_step": 74586, "epoch": 1775} {"train_loss": -5.995796203613281, "global_step": 74587, "epoch": 1775} {"train_loss": -6.182940483093262, "global_step": 74588, "epoch": 1775} {"train_loss": -6.101115703582764, "global_step": 74589, "epoch": 1775} {"train_loss": -6.006295204162598, "global_step": 74590, "epoch": 1775} {"train_loss": -6.0771700995309015, "global_step": 74591, "epoch": 1775, "val_loss": 67651.6171875} {"train_loss": -6.0789899826049805, "global_step": 74592, "epoch": 1776} {"train_loss": -6.1136932373046875, "global_step": 74593, "epoch": 1776} {"train_loss": -6.086530685424805, "global_step": 74594, "epoch": 1776} {"train_loss": -6.063149452209473, "global_step": 74595, "epoch": 1776} {"train_loss": -6.126965522766113, "global_step": 74596, "epoch": 1776} {"train_loss": -6.050824165344238, "global_step": 74597, "epoch": 1776} {"train_loss": -6.096881866455078, "global_step": 74598, "epoch": 1776} {"train_loss": -6.051180839538574, "global_step": 74599, "epoch": 1776} {"train_loss": -6.14841365814209, "global_step": 74600, "epoch": 1776} {"train_loss": -6.064140319824219, "global_step": 74601, "epoch": 1776} {"train_loss": -6.109146595001221, "global_step": 74602, "epoch": 1776} {"train_loss": -6.21608829498291, "global_step": 74603, "epoch": 1776} {"train_loss": -5.974000930786133, "global_step": 74604, "epoch": 1776} {"train_loss": -5.856047630310059, "global_step": 74605, "epoch": 1776} {"train_loss": -5.946089744567871, "global_step": 74606, "epoch": 1776} {"train_loss": -6.0833539962768555, "global_step": 74607, "epoch": 1776} {"train_loss": -5.959748268127441, "global_step": 74608, "epoch": 1776} {"train_loss": -6.143669128417969, "global_step": 74609, "epoch": 1776} {"train_loss": -5.971989631652832, "global_step": 74610, "epoch": 1776} {"train_loss": -6.067575931549072, "global_step": 74611, "epoch": 1776} {"train_loss": -6.072972297668457, "global_step": 74612, "epoch": 1776} {"train_loss": -6.155608654022217, "global_step": 74613, "epoch": 1776} {"train_loss": -6.092139720916748, "global_step": 74614, "epoch": 1776} {"train_loss": -6.133366584777832, "global_step": 74615, "epoch": 1776} {"train_loss": -5.945518493652344, "global_step": 74616, "epoch": 1776} {"train_loss": -6.085685729980469, "global_step": 74617, "epoch": 1776} {"train_loss": -6.137393951416016, "global_step": 74618, "epoch": 1776} {"train_loss": -6.014710903167725, "global_step": 74619, "epoch": 1776} {"train_loss": -6.1409149169921875, "global_step": 74620, "epoch": 1776} {"train_loss": -6.006822109222412, "global_step": 74621, "epoch": 1776} {"train_loss": -6.030648708343506, "global_step": 74622, "epoch": 1776} {"train_loss": -6.187620639801025, "global_step": 74623, "epoch": 1776} {"train_loss": -6.0466156005859375, "global_step": 74624, "epoch": 1776} {"train_loss": -6.088764667510986, "global_step": 74625, "epoch": 1776} {"train_loss": -6.0059967041015625, "global_step": 74626, "epoch": 1776} {"train_loss": -6.012284278869629, "global_step": 74627, "epoch": 1776} {"train_loss": -6.141136169433594, "global_step": 74628, "epoch": 1776} {"train_loss": -6.136178970336914, "global_step": 74629, "epoch": 1776} {"train_loss": -5.911130428314209, "global_step": 74630, "epoch": 1776} {"train_loss": -5.959031105041504, "global_step": 74631, "epoch": 1776} {"train_loss": -6.025430679321289, "global_step": 74632, "epoch": 1776} {"train_loss": -6.0610018117087225, "global_step": 74633, "epoch": 1776, "val_loss": 67485.0078125} {"train_loss": -5.920722484588623, "global_step": 74634, "epoch": 1777} {"train_loss": -5.96856689453125, "global_step": 74635, "epoch": 1777} {"train_loss": -6.040378570556641, "global_step": 74636, "epoch": 1777} {"train_loss": -6.006850242614746, "global_step": 74637, "epoch": 1777} {"train_loss": -6.040557384490967, "global_step": 74638, "epoch": 1777} {"train_loss": -6.03022575378418, "global_step": 74639, "epoch": 1777} {"train_loss": -6.078899383544922, "global_step": 74640, "epoch": 1777} {"train_loss": -6.147801399230957, "global_step": 74641, "epoch": 1777} {"train_loss": -6.17192268371582, "global_step": 74642, "epoch": 1777} {"train_loss": -6.08784294128418, "global_step": 74643, "epoch": 1777} {"train_loss": -6.162275791168213, "global_step": 74644, "epoch": 1777} {"train_loss": -6.108294486999512, "global_step": 74645, "epoch": 1777} {"train_loss": -6.050527572631836, "global_step": 74646, "epoch": 1777} {"train_loss": -6.09244441986084, "global_step": 74647, "epoch": 1777} {"train_loss": -6.17416524887085, "global_step": 74648, "epoch": 1777} {"train_loss": -6.010732650756836, "global_step": 74649, "epoch": 1777} {"train_loss": -6.001287460327148, "global_step": 74650, "epoch": 1777} {"train_loss": -6.129090309143066, "global_step": 74651, "epoch": 1777} {"train_loss": -6.021683692932129, "global_step": 74652, "epoch": 1777} {"train_loss": -6.010246276855469, "global_step": 74653, "epoch": 1777} {"train_loss": -5.936370849609375, "global_step": 74654, "epoch": 1777} {"train_loss": -6.111441135406494, "global_step": 74655, "epoch": 1777} {"train_loss": -6.17707633972168, "global_step": 74656, "epoch": 1777} {"train_loss": -6.054798126220703, "global_step": 74657, "epoch": 1777} {"train_loss": -6.037560939788818, "global_step": 74658, "epoch": 1777} {"train_loss": -6.059106349945068, "global_step": 74659, "epoch": 1777} {"train_loss": -6.064868450164795, "global_step": 74660, "epoch": 1777} {"train_loss": -6.0421857833862305, "global_step": 74661, "epoch": 1777} {"train_loss": -6.075264930725098, "global_step": 74662, "epoch": 1777} {"train_loss": -5.958810329437256, "global_step": 74663, "epoch": 1777} {"train_loss": -6.12649393081665, "global_step": 74664, "epoch": 1777} {"train_loss": -6.091496467590332, "global_step": 74665, "epoch": 1777} {"train_loss": -6.04810905456543, "global_step": 74666, "epoch": 1777} {"train_loss": -5.9739089012146, "global_step": 74667, "epoch": 1777} {"train_loss": -6.077897071838379, "global_step": 74668, "epoch": 1777} {"train_loss": -6.028900146484375, "global_step": 74669, "epoch": 1777} {"train_loss": -6.15255069732666, "global_step": 74670, "epoch": 1777} {"train_loss": -6.092968940734863, "global_step": 74671, "epoch": 1777} {"train_loss": -6.115307807922363, "global_step": 74672, "epoch": 1777} {"train_loss": -6.085812091827393, "global_step": 74673, "epoch": 1777} {"train_loss": -6.105001449584961, "global_step": 74674, "epoch": 1777} {"train_loss": -6.0664925802321665, "global_step": 74675, "epoch": 1777, "val_loss": 67450.4375} {"train_loss": -6.096339225769043, "global_step": 74676, "epoch": 1778} {"train_loss": -6.024110794067383, "global_step": 74677, "epoch": 1778} {"train_loss": -6.015841484069824, "global_step": 74678, "epoch": 1778} {"train_loss": -6.007800102233887, "global_step": 74679, "epoch": 1778} {"train_loss": -6.112186431884766, "global_step": 74680, "epoch": 1778} {"train_loss": -6.045358657836914, "global_step": 74681, "epoch": 1778} {"train_loss": -5.96368408203125, "global_step": 74682, "epoch": 1778} {"train_loss": -6.075316905975342, "global_step": 74683, "epoch": 1778} {"train_loss": -5.981095314025879, "global_step": 74684, "epoch": 1778} {"train_loss": -6.057966232299805, "global_step": 74685, "epoch": 1778} {"train_loss": -5.994451522827148, "global_step": 74686, "epoch": 1778} {"train_loss": -6.079945087432861, "global_step": 74687, "epoch": 1778} {"train_loss": -6.06019401550293, "global_step": 74688, "epoch": 1778} {"train_loss": -6.055022239685059, "global_step": 74689, "epoch": 1778} {"train_loss": -6.084427833557129, "global_step": 74690, "epoch": 1778} {"train_loss": -6.019467353820801, "global_step": 74691, "epoch": 1778} {"train_loss": -6.1081647872924805, "global_step": 74692, "epoch": 1778} {"train_loss": -6.04973030090332, "global_step": 74693, "epoch": 1778} {"train_loss": -6.050151348114014, "global_step": 74694, "epoch": 1778} {"train_loss": -5.985661029815674, "global_step": 74695, "epoch": 1778} {"train_loss": -6.061610221862793, "global_step": 74696, "epoch": 1778} {"train_loss": -6.094267845153809, "global_step": 74697, "epoch": 1778} {"train_loss": -6.067613124847412, "global_step": 74698, "epoch": 1778} {"train_loss": -6.0874762535095215, "global_step": 74699, "epoch": 1778} {"train_loss": -6.07977294921875, "global_step": 74700, "epoch": 1778} {"train_loss": -6.170356750488281, "global_step": 74701, "epoch": 1778} {"train_loss": -6.03712272644043, "global_step": 74702, "epoch": 1778} {"train_loss": -5.925655364990234, "global_step": 74703, "epoch": 1778} {"train_loss": -6.17791748046875, "global_step": 74704, "epoch": 1778} {"train_loss": -6.087291717529297, "global_step": 74705, "epoch": 1778} {"train_loss": -6.114046096801758, "global_step": 74706, "epoch": 1778} {"train_loss": -6.030033111572266, "global_step": 74707, "epoch": 1778} {"train_loss": -6.095721244812012, "global_step": 74708, "epoch": 1778} {"train_loss": -6.1297926902771, "global_step": 74709, "epoch": 1778} {"train_loss": -6.114129066467285, "global_step": 74710, "epoch": 1778} {"train_loss": -6.156101226806641, "global_step": 74711, "epoch": 1778} {"train_loss": -5.976638317108154, "global_step": 74712, "epoch": 1778} {"train_loss": -6.096487998962402, "global_step": 74713, "epoch": 1778} {"train_loss": -5.9756340980529785, "global_step": 74714, "epoch": 1778} {"train_loss": -6.082852363586426, "global_step": 74715, "epoch": 1778} {"train_loss": -6.057790279388428, "global_step": 74716, "epoch": 1778} {"train_loss": -6.063350961321876, "global_step": 74717, "epoch": 1778, "val_loss": 67306.34375} {"train_loss": -6.056910514831543, "global_step": 74718, "epoch": 1779} {"train_loss": -6.125927925109863, "global_step": 74719, "epoch": 1779} {"train_loss": -6.029999732971191, "global_step": 74720, "epoch": 1779} {"train_loss": -6.043505668640137, "global_step": 74721, "epoch": 1779} {"train_loss": -6.212637901306152, "global_step": 74722, "epoch": 1779} {"train_loss": -6.036803722381592, "global_step": 74723, "epoch": 1779} {"train_loss": -6.036593914031982, "global_step": 74724, "epoch": 1779} {"train_loss": -5.997641563415527, "global_step": 74725, "epoch": 1779} {"train_loss": -6.119326591491699, "global_step": 74726, "epoch": 1779} {"train_loss": -6.192248344421387, "global_step": 74727, "epoch": 1779} {"train_loss": -5.983465194702148, "global_step": 74728, "epoch": 1779} {"train_loss": -6.013501167297363, "global_step": 74729, "epoch": 1779} {"train_loss": -6.116145133972168, "global_step": 74730, "epoch": 1779} {"train_loss": -6.095076560974121, "global_step": 74731, "epoch": 1779} {"train_loss": -6.169406414031982, "global_step": 74732, "epoch": 1779} {"train_loss": -6.1419901847839355, "global_step": 74733, "epoch": 1779} {"train_loss": -6.188122749328613, "global_step": 74734, "epoch": 1779} {"train_loss": -6.105959892272949, "global_step": 74735, "epoch": 1779} {"train_loss": -6.067508220672607, "global_step": 74736, "epoch": 1779} {"train_loss": -6.166891098022461, "global_step": 74737, "epoch": 1779} {"train_loss": -6.044360160827637, "global_step": 74738, "epoch": 1779} {"train_loss": -6.079112529754639, "global_step": 74739, "epoch": 1779} {"train_loss": -6.125799655914307, "global_step": 74740, "epoch": 1779} {"train_loss": -6.165910720825195, "global_step": 74741, "epoch": 1779} {"train_loss": -6.131506443023682, "global_step": 74742, "epoch": 1779} {"train_loss": -6.0557451248168945, "global_step": 74743, "epoch": 1779} {"train_loss": -6.15349817276001, "global_step": 74744, "epoch": 1779} {"train_loss": -5.924380302429199, "global_step": 74745, "epoch": 1779} {"train_loss": -5.958978652954102, "global_step": 74746, "epoch": 1779} {"train_loss": -6.069117546081543, "global_step": 74747, "epoch": 1779} {"train_loss": -6.122189044952393, "global_step": 74748, "epoch": 1779} {"train_loss": -6.172411918640137, "global_step": 74749, "epoch": 1779} {"train_loss": -6.042239189147949, "global_step": 74750, "epoch": 1779} {"train_loss": -6.09367561340332, "global_step": 74751, "epoch": 1779} {"train_loss": -6.118839263916016, "global_step": 74752, "epoch": 1779} {"train_loss": -6.061253070831299, "global_step": 74753, "epoch": 1779} {"train_loss": -6.0313568115234375, "global_step": 74754, "epoch": 1779} {"train_loss": -6.140695571899414, "global_step": 74755, "epoch": 1779} {"train_loss": -6.042702674865723, "global_step": 74756, "epoch": 1779} {"train_loss": -6.115771293640137, "global_step": 74757, "epoch": 1779} {"train_loss": -6.210693359375, "global_step": 74758, "epoch": 1779} {"train_loss": -6.093656029020037, "global_step": 74759, "epoch": 1779, "val_loss": 67428.7421875} {"train_loss": -5.98758602142334, "global_step": 74760, "epoch": 1780} {"train_loss": -6.12500524520874, "global_step": 74761, "epoch": 1780} {"train_loss": -6.116204261779785, "global_step": 74762, "epoch": 1780} {"train_loss": -6.149741172790527, "global_step": 74763, "epoch": 1780} {"train_loss": -6.087347507476807, "global_step": 74764, "epoch": 1780} {"train_loss": -6.085970878601074, "global_step": 74765, "epoch": 1780} {"train_loss": -6.094300270080566, "global_step": 74766, "epoch": 1780} {"train_loss": -6.1204328536987305, "global_step": 74767, "epoch": 1780} {"train_loss": -6.084417819976807, "global_step": 74768, "epoch": 1780} {"train_loss": -5.9503092765808105, "global_step": 74769, "epoch": 1780} {"train_loss": -6.099522590637207, "global_step": 74770, "epoch": 1780} {"train_loss": -5.9777069091796875, "global_step": 74771, "epoch": 1780} {"train_loss": -6.02434778213501, "global_step": 74772, "epoch": 1780} {"train_loss": -6.024453163146973, "global_step": 74773, "epoch": 1780} {"train_loss": -6.100136756896973, "global_step": 74774, "epoch": 1780} {"train_loss": -6.061322212219238, "global_step": 74775, "epoch": 1780} {"train_loss": -6.157468318939209, "global_step": 74776, "epoch": 1780} {"train_loss": -6.084528923034668, "global_step": 74777, "epoch": 1780} {"train_loss": -6.009209632873535, "global_step": 74778, "epoch": 1780} {"train_loss": -6.125378608703613, "global_step": 74779, "epoch": 1780} {"train_loss": -5.959082126617432, "global_step": 74780, "epoch": 1780} {"train_loss": -6.040548324584961, "global_step": 74781, "epoch": 1780} {"train_loss": -5.878993034362793, "global_step": 74782, "epoch": 1780} {"train_loss": -5.895909309387207, "global_step": 74783, "epoch": 1780} {"train_loss": -6.137929439544678, "global_step": 74784, "epoch": 1780} {"train_loss": -6.151786804199219, "global_step": 74785, "epoch": 1780} {"train_loss": -6.0145111083984375, "global_step": 74786, "epoch": 1780} {"train_loss": -6.054100036621094, "global_step": 74787, "epoch": 1780} {"train_loss": -6.014057159423828, "global_step": 74788, "epoch": 1780} {"train_loss": -6.006518363952637, "global_step": 74789, "epoch": 1780} {"train_loss": -6.165751934051514, "global_step": 74790, "epoch": 1780} {"train_loss": -6.004612922668457, "global_step": 74791, "epoch": 1780} {"train_loss": -6.123337745666504, "global_step": 74792, "epoch": 1780} {"train_loss": -6.092983245849609, "global_step": 74793, "epoch": 1780} {"train_loss": -6.005242347717285, "global_step": 74794, "epoch": 1780} {"train_loss": -5.95224666595459, "global_step": 74795, "epoch": 1780} {"train_loss": -6.078348159790039, "global_step": 74796, "epoch": 1780} {"train_loss": -5.9936981201171875, "global_step": 74797, "epoch": 1780} {"train_loss": -6.079597473144531, "global_step": 74798, "epoch": 1780} {"train_loss": -5.973239898681641, "global_step": 74799, "epoch": 1780} {"train_loss": -5.999030590057373, "global_step": 74800, "epoch": 1780} {"train_loss": -6.050419035412016, "global_step": 74801, "epoch": 1780, "val_loss": 67454.765625} {"train_loss": -6.038543701171875, "global_step": 74802, "epoch": 1781} {"train_loss": -6.105504035949707, "global_step": 74803, "epoch": 1781} {"train_loss": -6.030608177185059, "global_step": 74804, "epoch": 1781} {"train_loss": -5.991034984588623, "global_step": 74805, "epoch": 1781} {"train_loss": -6.072518825531006, "global_step": 74806, "epoch": 1781} {"train_loss": -6.062155723571777, "global_step": 74807, "epoch": 1781} {"train_loss": -5.998711585998535, "global_step": 74808, "epoch": 1781} {"train_loss": -6.101726531982422, "global_step": 74809, "epoch": 1781} {"train_loss": -5.918669700622559, "global_step": 74810, "epoch": 1781} {"train_loss": -6.07251501083374, "global_step": 74811, "epoch": 1781} {"train_loss": -6.067546367645264, "global_step": 74812, "epoch": 1781} {"train_loss": -6.062707901000977, "global_step": 74813, "epoch": 1781} {"train_loss": -6.0991106033325195, "global_step": 74814, "epoch": 1781} {"train_loss": -6.02604341506958, "global_step": 74815, "epoch": 1781} {"train_loss": -5.990424156188965, "global_step": 74816, "epoch": 1781} {"train_loss": -6.072547435760498, "global_step": 74817, "epoch": 1781} {"train_loss": -6.041484832763672, "global_step": 74818, "epoch": 1781} {"train_loss": -6.166874885559082, "global_step": 74819, "epoch": 1781} {"train_loss": -6.088043212890625, "global_step": 74820, "epoch": 1781} {"train_loss": -6.123016357421875, "global_step": 74821, "epoch": 1781} {"train_loss": -6.074385643005371, "global_step": 74822, "epoch": 1781} {"train_loss": -6.261802673339844, "global_step": 74823, "epoch": 1781} {"train_loss": -6.095036506652832, "global_step": 74824, "epoch": 1781} {"train_loss": -5.959777355194092, "global_step": 74825, "epoch": 1781} {"train_loss": -6.144248962402344, "global_step": 74826, "epoch": 1781} {"train_loss": -6.195051193237305, "global_step": 74827, "epoch": 1781} {"train_loss": -6.0789570808410645, "global_step": 74828, "epoch": 1781} {"train_loss": -6.087375640869141, "global_step": 74829, "epoch": 1781} {"train_loss": -6.078151226043701, "global_step": 74830, "epoch": 1781} {"train_loss": -6.1580491065979, "global_step": 74831, "epoch": 1781} {"train_loss": -6.097010135650635, "global_step": 74832, "epoch": 1781} {"train_loss": -5.983910083770752, "global_step": 74833, "epoch": 1781} {"train_loss": -6.008691787719727, "global_step": 74834, "epoch": 1781} {"train_loss": -6.082155704498291, "global_step": 74835, "epoch": 1781} {"train_loss": -5.989381790161133, "global_step": 74836, "epoch": 1781} {"train_loss": -6.0223517417907715, "global_step": 74837, "epoch": 1781} {"train_loss": -6.1606245040893555, "global_step": 74838, "epoch": 1781} {"train_loss": -6.179778099060059, "global_step": 74839, "epoch": 1781} {"train_loss": -5.991393566131592, "global_step": 74840, "epoch": 1781} {"train_loss": -6.045186996459961, "global_step": 74841, "epoch": 1781} {"train_loss": -6.131473064422607, "global_step": 74842, "epoch": 1781} {"train_loss": -6.072661831265404, "global_step": 74843, "epoch": 1781, "val_loss": 67346.8359375} {"train_loss": -6.075568675994873, "global_step": 74844, "epoch": 1782} {"train_loss": -6.074748992919922, "global_step": 74845, "epoch": 1782} {"train_loss": -6.080314636230469, "global_step": 74846, "epoch": 1782} {"train_loss": -6.121878147125244, "global_step": 74847, "epoch": 1782} {"train_loss": -6.215097427368164, "global_step": 74848, "epoch": 1782} {"train_loss": -6.120170593261719, "global_step": 74849, "epoch": 1782} {"train_loss": -6.037934303283691, "global_step": 74850, "epoch": 1782} {"train_loss": -6.1270222663879395, "global_step": 74851, "epoch": 1782} {"train_loss": -6.063638687133789, "global_step": 74852, "epoch": 1782} {"train_loss": -6.098493576049805, "global_step": 74853, "epoch": 1782} {"train_loss": -6.060943126678467, "global_step": 74854, "epoch": 1782} {"train_loss": -5.990719795227051, "global_step": 74855, "epoch": 1782} {"train_loss": -6.1400065422058105, "global_step": 74856, "epoch": 1782} {"train_loss": -6.061405181884766, "global_step": 74857, "epoch": 1782} {"train_loss": -6.077054500579834, "global_step": 74858, "epoch": 1782} {"train_loss": -6.226711273193359, "global_step": 74859, "epoch": 1782} {"train_loss": -6.083855628967285, "global_step": 74860, "epoch": 1782} {"train_loss": -6.095459461212158, "global_step": 74861, "epoch": 1782} {"train_loss": -6.217050552368164, "global_step": 74862, "epoch": 1782} {"train_loss": -6.09524393081665, "global_step": 74863, "epoch": 1782} {"train_loss": -6.083843231201172, "global_step": 74864, "epoch": 1782} {"train_loss": -5.996289253234863, "global_step": 74865, "epoch": 1782} {"train_loss": -6.123661041259766, "global_step": 74866, "epoch": 1782} {"train_loss": -6.0497236251831055, "global_step": 74867, "epoch": 1782} {"train_loss": -5.954556941986084, "global_step": 74868, "epoch": 1782} {"train_loss": -6.04042911529541, "global_step": 74869, "epoch": 1782} {"train_loss": -5.992473602294922, "global_step": 74870, "epoch": 1782} {"train_loss": -6.040627479553223, "global_step": 74871, "epoch": 1782} {"train_loss": -5.847111225128174, "global_step": 74872, "epoch": 1782} {"train_loss": -6.022714138031006, "global_step": 74873, "epoch": 1782} {"train_loss": -6.024178504943848, "global_step": 74874, "epoch": 1782} {"train_loss": -5.832963943481445, "global_step": 74875, "epoch": 1782} {"train_loss": -6.041140556335449, "global_step": 74876, "epoch": 1782} {"train_loss": -5.951545238494873, "global_step": 74877, "epoch": 1782} {"train_loss": -6.082293510437012, "global_step": 74878, "epoch": 1782} {"train_loss": -6.028599739074707, "global_step": 74879, "epoch": 1782} {"train_loss": -5.948446273803711, "global_step": 74880, "epoch": 1782} {"train_loss": -5.980307579040527, "global_step": 74881, "epoch": 1782} {"train_loss": -6.03889274597168, "global_step": 74882, "epoch": 1782} {"train_loss": -6.041592597961426, "global_step": 74883, "epoch": 1782} {"train_loss": -5.797765254974365, "global_step": 74884, "epoch": 1782} {"train_loss": -6.0488307021913075, "global_step": 74885, "epoch": 1782, "val_loss": 67579.90625} {"train_loss": -5.999903678894043, "global_step": 74886, "epoch": 1783} {"train_loss": -5.986306190490723, "global_step": 74887, "epoch": 1783} {"train_loss": -5.854467391967773, "global_step": 74888, "epoch": 1783} {"train_loss": -6.083499431610107, "global_step": 74889, "epoch": 1783} {"train_loss": -6.010762691497803, "global_step": 74890, "epoch": 1783} {"train_loss": -5.991371154785156, "global_step": 74891, "epoch": 1783} {"train_loss": -6.073796272277832, "global_step": 74892, "epoch": 1783} {"train_loss": -5.995594024658203, "global_step": 74893, "epoch": 1783} {"train_loss": -6.075817108154297, "global_step": 74894, "epoch": 1783} {"train_loss": -6.032459259033203, "global_step": 74895, "epoch": 1783} {"train_loss": -5.940058708190918, "global_step": 74896, "epoch": 1783} {"train_loss": -6.174300670623779, "global_step": 74897, "epoch": 1783} {"train_loss": -5.899981498718262, "global_step": 74898, "epoch": 1783} {"train_loss": -6.212676048278809, "global_step": 74899, "epoch": 1783} {"train_loss": -6.059704780578613, "global_step": 74900, "epoch": 1783} {"train_loss": -6.1326518058776855, "global_step": 74901, "epoch": 1783} {"train_loss": -6.160488605499268, "global_step": 74902, "epoch": 1783} {"train_loss": -6.068172931671143, "global_step": 74903, "epoch": 1783} {"train_loss": -6.023751258850098, "global_step": 74904, "epoch": 1783} {"train_loss": -6.13953971862793, "global_step": 74905, "epoch": 1783} {"train_loss": -6.122708797454834, "global_step": 74906, "epoch": 1783} {"train_loss": -6.049005031585693, "global_step": 74907, "epoch": 1783} {"train_loss": -6.091102600097656, "global_step": 74908, "epoch": 1783} {"train_loss": -6.055110931396484, "global_step": 74909, "epoch": 1783} {"train_loss": -6.084099292755127, "global_step": 74910, "epoch": 1783} {"train_loss": -6.071042060852051, "global_step": 74911, "epoch": 1783} {"train_loss": -5.976810455322266, "global_step": 74912, "epoch": 1783} {"train_loss": -5.996641159057617, "global_step": 74913, "epoch": 1783} {"train_loss": -5.972131252288818, "global_step": 74914, "epoch": 1783} {"train_loss": -6.080144882202148, "global_step": 74915, "epoch": 1783} {"train_loss": -6.131442070007324, "global_step": 74916, "epoch": 1783} {"train_loss": -6.084142684936523, "global_step": 74917, "epoch": 1783} {"train_loss": -6.062197685241699, "global_step": 74918, "epoch": 1783} {"train_loss": -6.09972620010376, "global_step": 74919, "epoch": 1783} {"train_loss": -5.8851165771484375, "global_step": 74920, "epoch": 1783} {"train_loss": -5.988354206085205, "global_step": 74921, "epoch": 1783} {"train_loss": -6.077045440673828, "global_step": 74922, "epoch": 1783} {"train_loss": -5.99868631362915, "global_step": 74923, "epoch": 1783} {"train_loss": -6.056377410888672, "global_step": 74924, "epoch": 1783} {"train_loss": -5.971418380737305, "global_step": 74925, "epoch": 1783} {"train_loss": -5.8659749031066895, "global_step": 74926, "epoch": 1783} {"train_loss": -6.037487086795625, "global_step": 74927, "epoch": 1783, "val_loss": 67633.390625} {"train_loss": -6.026773452758789, "global_step": 74928, "epoch": 1784} {"train_loss": -6.047001838684082, "global_step": 74929, "epoch": 1784} {"train_loss": -6.060954570770264, "global_step": 74930, "epoch": 1784} {"train_loss": -6.118095397949219, "global_step": 74931, "epoch": 1784} {"train_loss": -5.9803266525268555, "global_step": 74932, "epoch": 1784} {"train_loss": -6.135165691375732, "global_step": 74933, "epoch": 1784} {"train_loss": -5.907236099243164, "global_step": 74934, "epoch": 1784} {"train_loss": -6.093788146972656, "global_step": 74935, "epoch": 1784} {"train_loss": -6.049251079559326, "global_step": 74936, "epoch": 1784} {"train_loss": -6.054560661315918, "global_step": 74937, "epoch": 1784} {"train_loss": -6.035401821136475, "global_step": 74938, "epoch": 1784} {"train_loss": -6.023898124694824, "global_step": 74939, "epoch": 1784} {"train_loss": -6.166416168212891, "global_step": 74940, "epoch": 1784} {"train_loss": -5.94661808013916, "global_step": 74941, "epoch": 1784} {"train_loss": -6.068448066711426, "global_step": 74942, "epoch": 1784} {"train_loss": -6.052775859832764, "global_step": 74943, "epoch": 1784} {"train_loss": -6.021028518676758, "global_step": 74944, "epoch": 1784} {"train_loss": -6.093263626098633, "global_step": 74945, "epoch": 1784} {"train_loss": -6.027012825012207, "global_step": 74946, "epoch": 1784} {"train_loss": -6.189267158508301, "global_step": 74947, "epoch": 1784} {"train_loss": -6.079649925231934, "global_step": 74948, "epoch": 1784} {"train_loss": -6.193730354309082, "global_step": 74949, "epoch": 1784} {"train_loss": -6.124283313751221, "global_step": 74950, "epoch": 1784} {"train_loss": -6.023800849914551, "global_step": 74951, "epoch": 1784} {"train_loss": -6.202874660491943, "global_step": 74952, "epoch": 1784} {"train_loss": -5.926821231842041, "global_step": 74953, "epoch": 1784} {"train_loss": -6.079597473144531, "global_step": 74954, "epoch": 1784} {"train_loss": -6.124608516693115, "global_step": 74955, "epoch": 1784} {"train_loss": -6.083603858947754, "global_step": 74956, "epoch": 1784} {"train_loss": -6.085223197937012, "global_step": 74957, "epoch": 1784} {"train_loss": -6.049117565155029, "global_step": 74958, "epoch": 1784} {"train_loss": -6.027534484863281, "global_step": 74959, "epoch": 1784} {"train_loss": -6.013820171356201, "global_step": 74960, "epoch": 1784} {"train_loss": -5.925192832946777, "global_step": 74961, "epoch": 1784} {"train_loss": -6.004207134246826, "global_step": 74962, "epoch": 1784} {"train_loss": -5.96510124206543, "global_step": 74963, "epoch": 1784} {"train_loss": -6.025617599487305, "global_step": 74964, "epoch": 1784} {"train_loss": -6.153336524963379, "global_step": 74965, "epoch": 1784} {"train_loss": -5.9925055503845215, "global_step": 74966, "epoch": 1784} {"train_loss": -6.162003040313721, "global_step": 74967, "epoch": 1784} {"train_loss": -6.083310127258301, "global_step": 74968, "epoch": 1784} {"train_loss": -6.060350304558163, "global_step": 74969, "epoch": 1784, "val_loss": 67555.984375} {"train_loss": -6.158034324645996, "global_step": 74970, "epoch": 1785} {"train_loss": -6.120616912841797, "global_step": 74971, "epoch": 1785} {"train_loss": -6.044404029846191, "global_step": 74972, "epoch": 1785} {"train_loss": -6.121640682220459, "global_step": 74973, "epoch": 1785} {"train_loss": -6.066132068634033, "global_step": 74974, "epoch": 1785} {"train_loss": -6.105029106140137, "global_step": 74975, "epoch": 1785} {"train_loss": -5.879273891448975, "global_step": 74976, "epoch": 1785} {"train_loss": -6.20136833190918, "global_step": 74977, "epoch": 1785} {"train_loss": -6.004217147827148, "global_step": 74978, "epoch": 1785} {"train_loss": -6.129312992095947, "global_step": 74979, "epoch": 1785} {"train_loss": -6.0310516357421875, "global_step": 74980, "epoch": 1785} {"train_loss": -6.161529541015625, "global_step": 74981, "epoch": 1785} {"train_loss": -6.271055221557617, "global_step": 74982, "epoch": 1785} {"train_loss": -6.022751808166504, "global_step": 74983, "epoch": 1785} {"train_loss": -6.107057571411133, "global_step": 74984, "epoch": 1785} {"train_loss": -6.038715362548828, "global_step": 74985, "epoch": 1785} {"train_loss": -6.130011558532715, "global_step": 74986, "epoch": 1785} {"train_loss": -6.041094779968262, "global_step": 74987, "epoch": 1785} {"train_loss": -6.059155464172363, "global_step": 74988, "epoch": 1785} {"train_loss": -5.979652404785156, "global_step": 74989, "epoch": 1785} {"train_loss": -6.084329605102539, "global_step": 74990, "epoch": 1785} {"train_loss": -5.991739273071289, "global_step": 74991, "epoch": 1785} {"train_loss": -6.06178092956543, "global_step": 74992, "epoch": 1785} {"train_loss": -6.062489032745361, "global_step": 74993, "epoch": 1785} {"train_loss": -5.977314472198486, "global_step": 74994, "epoch": 1785} {"train_loss": -6.0193281173706055, "global_step": 74995, "epoch": 1785} {"train_loss": -5.993344306945801, "global_step": 74996, "epoch": 1785} {"train_loss": -6.051970958709717, "global_step": 74997, "epoch": 1785} {"train_loss": -5.948709964752197, "global_step": 74998, "epoch": 1785} {"train_loss": -5.9645538330078125, "global_step": 74999, "epoch": 1785} {"train_loss": -6.039466857910156, "global_step": 75000, "epoch": 1785} {"train_loss": -5.912574291229248, "global_step": 75001, "epoch": 1785} {"train_loss": -6.063268661499023, "global_step": 75002, "epoch": 1785} {"train_loss": -6.017812728881836, "global_step": 75003, "epoch": 1785} {"train_loss": -6.070278644561768, "global_step": 75004, "epoch": 1785} {"train_loss": -6.039194107055664, "global_step": 75005, "epoch": 1785} {"train_loss": -6.01397180557251, "global_step": 75006, "epoch": 1785} {"train_loss": -6.043576240539551, "global_step": 75007, "epoch": 1785} {"train_loss": -5.9305853843688965, "global_step": 75008, "epoch": 1785} {"train_loss": -6.157668113708496, "global_step": 75009, "epoch": 1785} {"train_loss": -6.008795738220215, "global_step": 75010, "epoch": 1785} {"train_loss": -6.051409335363479, "global_step": 75011, "epoch": 1785, "val_loss": 67505.2734375} {"train_loss": -5.972413063049316, "global_step": 75012, "epoch": 1786} {"train_loss": -6.052616119384766, "global_step": 75013, "epoch": 1786} {"train_loss": -6.088890075683594, "global_step": 75014, "epoch": 1786} {"train_loss": -6.011143207550049, "global_step": 75015, "epoch": 1786} {"train_loss": -5.945920944213867, "global_step": 75016, "epoch": 1786} {"train_loss": -6.196498870849609, "global_step": 75017, "epoch": 1786} {"train_loss": -6.079676628112793, "global_step": 75018, "epoch": 1786} {"train_loss": -6.080972671508789, "global_step": 75019, "epoch": 1786} {"train_loss": -6.012974739074707, "global_step": 75020, "epoch": 1786} {"train_loss": -5.9945526123046875, "global_step": 75021, "epoch": 1786} {"train_loss": -6.1004319190979, "global_step": 75022, "epoch": 1786} {"train_loss": -6.012502193450928, "global_step": 75023, "epoch": 1786} {"train_loss": -6.1101837158203125, "global_step": 75024, "epoch": 1786} {"train_loss": -6.088360786437988, "global_step": 75025, "epoch": 1786} {"train_loss": -6.1021928787231445, "global_step": 75026, "epoch": 1786} {"train_loss": -6.190492153167725, "global_step": 75027, "epoch": 1786} {"train_loss": -5.940706253051758, "global_step": 75028, "epoch": 1786} {"train_loss": -6.005017280578613, "global_step": 75029, "epoch": 1786} {"train_loss": -6.060632705688477, "global_step": 75030, "epoch": 1786} {"train_loss": -6.094418525695801, "global_step": 75031, "epoch": 1786} {"train_loss": -5.853639602661133, "global_step": 75032, "epoch": 1786} {"train_loss": -5.975404739379883, "global_step": 75033, "epoch": 1786} {"train_loss": -6.096929550170898, "global_step": 75034, "epoch": 1786} {"train_loss": -6.018393516540527, "global_step": 75035, "epoch": 1786} {"train_loss": -6.135495185852051, "global_step": 75036, "epoch": 1786} {"train_loss": -6.075748920440674, "global_step": 75037, "epoch": 1786} {"train_loss": -6.11266565322876, "global_step": 75038, "epoch": 1786} {"train_loss": -6.059317588806152, "global_step": 75039, "epoch": 1786} {"train_loss": -6.104012966156006, "global_step": 75040, "epoch": 1786} {"train_loss": -6.170779228210449, "global_step": 75041, "epoch": 1786} {"train_loss": -6.0288405418396, "global_step": 75042, "epoch": 1786} {"train_loss": -6.157617092132568, "global_step": 75043, "epoch": 1786} {"train_loss": -6.052064895629883, "global_step": 75044, "epoch": 1786} {"train_loss": -6.056441307067871, "global_step": 75045, "epoch": 1786} {"train_loss": -6.020188331604004, "global_step": 75046, "epoch": 1786} {"train_loss": -6.144810199737549, "global_step": 75047, "epoch": 1786} {"train_loss": -5.9571380615234375, "global_step": 75048, "epoch": 1786} {"train_loss": -6.1141462326049805, "global_step": 75049, "epoch": 1786} {"train_loss": -6.140629768371582, "global_step": 75050, "epoch": 1786} {"train_loss": -6.104398727416992, "global_step": 75051, "epoch": 1786} {"train_loss": -6.088551998138428, "global_step": 75052, "epoch": 1786} {"train_loss": -6.061960333869571, "global_step": 75053, "epoch": 1786, "val_loss": 67542.1796875} {"train_loss": -5.947197914123535, "global_step": 75054, "epoch": 1787} {"train_loss": -6.086721420288086, "global_step": 75055, "epoch": 1787} {"train_loss": -6.185941696166992, "global_step": 75056, "epoch": 1787} {"train_loss": -6.0357537269592285, "global_step": 75057, "epoch": 1787} {"train_loss": -6.015209197998047, "global_step": 75058, "epoch": 1787} {"train_loss": -6.197333335876465, "global_step": 75059, "epoch": 1787} {"train_loss": -6.059187889099121, "global_step": 75060, "epoch": 1787} {"train_loss": -6.027444839477539, "global_step": 75061, "epoch": 1787} {"train_loss": -6.100415229797363, "global_step": 75062, "epoch": 1787} {"train_loss": -6.09800910949707, "global_step": 75063, "epoch": 1787} {"train_loss": -6.071010589599609, "global_step": 75064, "epoch": 1787} {"train_loss": -5.969374656677246, "global_step": 75065, "epoch": 1787} {"train_loss": -5.948887825012207, "global_step": 75066, "epoch": 1787} {"train_loss": -6.0264668464660645, "global_step": 75067, "epoch": 1787} {"train_loss": -6.086920738220215, "global_step": 75068, "epoch": 1787} {"train_loss": -5.956231117248535, "global_step": 75069, "epoch": 1787} {"train_loss": -6.08336067199707, "global_step": 75070, "epoch": 1787} {"train_loss": -6.064647674560547, "global_step": 75071, "epoch": 1787} {"train_loss": -6.092145919799805, "global_step": 75072, "epoch": 1787} {"train_loss": -6.007352352142334, "global_step": 75073, "epoch": 1787} {"train_loss": -6.112482070922852, "global_step": 75074, "epoch": 1787} {"train_loss": -6.168496131896973, "global_step": 75075, "epoch": 1787} {"train_loss": -6.0703582763671875, "global_step": 75076, "epoch": 1787} {"train_loss": -6.030016899108887, "global_step": 75077, "epoch": 1787} {"train_loss": -5.933144569396973, "global_step": 75078, "epoch": 1787} {"train_loss": -6.076407432556152, "global_step": 75079, "epoch": 1787} {"train_loss": -6.138815879821777, "global_step": 75080, "epoch": 1787} {"train_loss": -6.226896286010742, "global_step": 75081, "epoch": 1787} {"train_loss": -6.053238391876221, "global_step": 75082, "epoch": 1787} {"train_loss": -6.0574774742126465, "global_step": 75083, "epoch": 1787} {"train_loss": -6.008803367614746, "global_step": 75084, "epoch": 1787} {"train_loss": -6.075796127319336, "global_step": 75085, "epoch": 1787} {"train_loss": -5.95349645614624, "global_step": 75086, "epoch": 1787} {"train_loss": -6.0461530685424805, "global_step": 75087, "epoch": 1787} {"train_loss": -6.145620346069336, "global_step": 75088, "epoch": 1787} {"train_loss": -5.9507646560668945, "global_step": 75089, "epoch": 1787} {"train_loss": -6.031110763549805, "global_step": 75090, "epoch": 1787} {"train_loss": -6.028057098388672, "global_step": 75091, "epoch": 1787} {"train_loss": -6.055666446685791, "global_step": 75092, "epoch": 1787} {"train_loss": -6.06884765625, "global_step": 75093, "epoch": 1787} {"train_loss": -5.999869346618652, "global_step": 75094, "epoch": 1787} {"train_loss": -6.054324524743216, "global_step": 75095, "epoch": 1787, "val_loss": 67698.4140625} {"train_loss": -6.062559127807617, "global_step": 75096, "epoch": 1788} {"train_loss": -5.960789680480957, "global_step": 75097, "epoch": 1788} {"train_loss": -6.037538051605225, "global_step": 75098, "epoch": 1788} {"train_loss": -6.0771684646606445, "global_step": 75099, "epoch": 1788} {"train_loss": -6.025345325469971, "global_step": 75100, "epoch": 1788} {"train_loss": -6.002288818359375, "global_step": 75101, "epoch": 1788} {"train_loss": -5.981293678283691, "global_step": 75102, "epoch": 1788} {"train_loss": -6.1260480880737305, "global_step": 75103, "epoch": 1788} {"train_loss": -5.969827651977539, "global_step": 75104, "epoch": 1788} {"train_loss": -5.983290672302246, "global_step": 75105, "epoch": 1788} {"train_loss": -6.089092254638672, "global_step": 75106, "epoch": 1788} {"train_loss": -5.93231201171875, "global_step": 75107, "epoch": 1788} {"train_loss": -6.0793867111206055, "global_step": 75108, "epoch": 1788} {"train_loss": -6.040485382080078, "global_step": 75109, "epoch": 1788} {"train_loss": -5.9642534255981445, "global_step": 75110, "epoch": 1788} {"train_loss": -6.042344570159912, "global_step": 75111, "epoch": 1788} {"train_loss": -6.02161169052124, "global_step": 75112, "epoch": 1788} {"train_loss": -6.042899131774902, "global_step": 75113, "epoch": 1788} {"train_loss": -6.102321624755859, "global_step": 75114, "epoch": 1788} {"train_loss": -6.051748275756836, "global_step": 75115, "epoch": 1788} {"train_loss": -5.9981184005737305, "global_step": 75116, "epoch": 1788} {"train_loss": -6.023373603820801, "global_step": 75117, "epoch": 1788} {"train_loss": -6.128415107727051, "global_step": 75118, "epoch": 1788} {"train_loss": -6.173529148101807, "global_step": 75119, "epoch": 1788} {"train_loss": -5.9802165031433105, "global_step": 75120, "epoch": 1788} {"train_loss": -6.019275665283203, "global_step": 75121, "epoch": 1788} {"train_loss": -6.087946891784668, "global_step": 75122, "epoch": 1788} {"train_loss": -5.844965934753418, "global_step": 75123, "epoch": 1788} {"train_loss": -6.028769493103027, "global_step": 75124, "epoch": 1788} {"train_loss": -6.095618724822998, "global_step": 75125, "epoch": 1788} {"train_loss": -6.128487586975098, "global_step": 75126, "epoch": 1788} {"train_loss": -6.03861141204834, "global_step": 75127, "epoch": 1788} {"train_loss": -6.113965034484863, "global_step": 75128, "epoch": 1788} {"train_loss": -6.009732246398926, "global_step": 75129, "epoch": 1788} {"train_loss": -6.0825910568237305, "global_step": 75130, "epoch": 1788} {"train_loss": -6.0882391929626465, "global_step": 75131, "epoch": 1788} {"train_loss": -6.049739837646484, "global_step": 75132, "epoch": 1788} {"train_loss": -6.048806667327881, "global_step": 75133, "epoch": 1788} {"train_loss": -6.114097595214844, "global_step": 75134, "epoch": 1788} {"train_loss": -6.118281364440918, "global_step": 75135, "epoch": 1788} {"train_loss": -6.133078575134277, "global_step": 75136, "epoch": 1788} {"train_loss": -6.050199395134335, "global_step": 75137, "epoch": 1788, "val_loss": 67546.078125} {"train_loss": -6.134939670562744, "global_step": 75138, "epoch": 1789} {"train_loss": -6.170375823974609, "global_step": 75139, "epoch": 1789} {"train_loss": -6.148279190063477, "global_step": 75140, "epoch": 1789} {"train_loss": -6.060888290405273, "global_step": 75141, "epoch": 1789} {"train_loss": -6.162348747253418, "global_step": 75142, "epoch": 1789} {"train_loss": -6.116091728210449, "global_step": 75143, "epoch": 1789} {"train_loss": -6.115152359008789, "global_step": 75144, "epoch": 1789} {"train_loss": -5.9845147132873535, "global_step": 75145, "epoch": 1789} {"train_loss": -6.035370349884033, "global_step": 75146, "epoch": 1789} {"train_loss": -6.045917510986328, "global_step": 75147, "epoch": 1789} {"train_loss": -5.962262153625488, "global_step": 75148, "epoch": 1789} {"train_loss": -6.006496429443359, "global_step": 75149, "epoch": 1789} {"train_loss": -6.102802276611328, "global_step": 75150, "epoch": 1789} {"train_loss": -6.136408805847168, "global_step": 75151, "epoch": 1789} {"train_loss": -5.981595039367676, "global_step": 75152, "epoch": 1789} {"train_loss": -6.040204048156738, "global_step": 75153, "epoch": 1789} {"train_loss": -5.981168746948242, "global_step": 75154, "epoch": 1789} {"train_loss": -5.9541168212890625, "global_step": 75155, "epoch": 1789} {"train_loss": -6.01800537109375, "global_step": 75156, "epoch": 1789} {"train_loss": -6.005040168762207, "global_step": 75157, "epoch": 1789} {"train_loss": -6.076702117919922, "global_step": 75158, "epoch": 1789} {"train_loss": -6.1050519943237305, "global_step": 75159, "epoch": 1789} {"train_loss": -5.996384620666504, "global_step": 75160, "epoch": 1789} {"train_loss": -6.039023399353027, "global_step": 75161, "epoch": 1789} {"train_loss": -6.027295112609863, "global_step": 75162, "epoch": 1789} {"train_loss": -5.951193809509277, "global_step": 75163, "epoch": 1789} {"train_loss": -6.0467634201049805, "global_step": 75164, "epoch": 1789} {"train_loss": -6.029807090759277, "global_step": 75165, "epoch": 1789} {"train_loss": -6.049753665924072, "global_step": 75166, "epoch": 1789} {"train_loss": -5.974771499633789, "global_step": 75167, "epoch": 1789} {"train_loss": -6.1848344802856445, "global_step": 75168, "epoch": 1789} {"train_loss": -6.038276195526123, "global_step": 75169, "epoch": 1789} {"train_loss": -5.947184085845947, "global_step": 75170, "epoch": 1789} {"train_loss": -6.115991592407227, "global_step": 75171, "epoch": 1789} {"train_loss": -6.181411266326904, "global_step": 75172, "epoch": 1789} {"train_loss": -6.144752502441406, "global_step": 75173, "epoch": 1789} {"train_loss": -6.05638313293457, "global_step": 75174, "epoch": 1789} {"train_loss": -6.064430236816406, "global_step": 75175, "epoch": 1789} {"train_loss": -5.986315727233887, "global_step": 75176, "epoch": 1789} {"train_loss": -6.091420650482178, "global_step": 75177, "epoch": 1789} {"train_loss": -6.022363662719727, "global_step": 75178, "epoch": 1789} {"train_loss": -6.055781239554996, "global_step": 75179, "epoch": 1789, "val_loss": 67599.578125} {"train_loss": -6.024631500244141, "global_step": 75180, "epoch": 1790} {"train_loss": -6.043744087219238, "global_step": 75181, "epoch": 1790} {"train_loss": -6.208822727203369, "global_step": 75182, "epoch": 1790} {"train_loss": -6.018850326538086, "global_step": 75183, "epoch": 1790} {"train_loss": -6.061821937561035, "global_step": 75184, "epoch": 1790} {"train_loss": -6.175199508666992, "global_step": 75185, "epoch": 1790} {"train_loss": -6.066485404968262, "global_step": 75186, "epoch": 1790} {"train_loss": -6.115486145019531, "global_step": 75187, "epoch": 1790} {"train_loss": -6.015673637390137, "global_step": 75188, "epoch": 1790} {"train_loss": -6.146625995635986, "global_step": 75189, "epoch": 1790} {"train_loss": -6.034143447875977, "global_step": 75190, "epoch": 1790} {"train_loss": -6.05751895904541, "global_step": 75191, "epoch": 1790} {"train_loss": -5.945442199707031, "global_step": 75192, "epoch": 1790} {"train_loss": -6.106034278869629, "global_step": 75193, "epoch": 1790} {"train_loss": -6.197031497955322, "global_step": 75194, "epoch": 1790} {"train_loss": -6.066689491271973, "global_step": 75195, "epoch": 1790} {"train_loss": -6.089052200317383, "global_step": 75196, "epoch": 1790} {"train_loss": -6.142899513244629, "global_step": 75197, "epoch": 1790} {"train_loss": -6.129421234130859, "global_step": 75198, "epoch": 1790} {"train_loss": -6.160235404968262, "global_step": 75199, "epoch": 1790} {"train_loss": -6.074280738830566, "global_step": 75200, "epoch": 1790} {"train_loss": -6.166852951049805, "global_step": 75201, "epoch": 1790} {"train_loss": -6.016912937164307, "global_step": 75202, "epoch": 1790} {"train_loss": -5.959678649902344, "global_step": 75203, "epoch": 1790} {"train_loss": -6.051218032836914, "global_step": 75204, "epoch": 1790} {"train_loss": -6.172297477722168, "global_step": 75205, "epoch": 1790} {"train_loss": -6.0255584716796875, "global_step": 75206, "epoch": 1790} {"train_loss": -5.860362529754639, "global_step": 75207, "epoch": 1790} {"train_loss": -6.033665657043457, "global_step": 75208, "epoch": 1790} {"train_loss": -6.047364234924316, "global_step": 75209, "epoch": 1790} {"train_loss": -6.194831848144531, "global_step": 75210, "epoch": 1790} {"train_loss": -6.09020471572876, "global_step": 75211, "epoch": 1790} {"train_loss": -6.021607875823975, "global_step": 75212, "epoch": 1790} {"train_loss": -6.067407131195068, "global_step": 75213, "epoch": 1790} {"train_loss": -6.019444465637207, "global_step": 75214, "epoch": 1790} {"train_loss": -6.045477867126465, "global_step": 75215, "epoch": 1790} {"train_loss": -6.037042617797852, "global_step": 75216, "epoch": 1790} {"train_loss": -5.925343036651611, "global_step": 75217, "epoch": 1790} {"train_loss": -6.000247478485107, "global_step": 75218, "epoch": 1790} {"train_loss": -5.994942665100098, "global_step": 75219, "epoch": 1790} {"train_loss": -6.145241737365723, "global_step": 75220, "epoch": 1790} {"train_loss": -6.065229291007633, "global_step": 75221, "epoch": 1790, "val_loss": 67268.3203125} {"train_loss": -5.999037742614746, "global_step": 75222, "epoch": 1791} {"train_loss": -6.173905849456787, "global_step": 75223, "epoch": 1791} {"train_loss": -6.02229118347168, "global_step": 75224, "epoch": 1791} {"train_loss": -6.1224365234375, "global_step": 75225, "epoch": 1791} {"train_loss": -6.090751647949219, "global_step": 75226, "epoch": 1791} {"train_loss": -6.10837459564209, "global_step": 75227, "epoch": 1791} {"train_loss": -6.000558853149414, "global_step": 75228, "epoch": 1791} {"train_loss": -5.917130470275879, "global_step": 75229, "epoch": 1791} {"train_loss": -6.098879337310791, "global_step": 75230, "epoch": 1791} {"train_loss": -6.057267189025879, "global_step": 75231, "epoch": 1791} {"train_loss": -6.089585781097412, "global_step": 75232, "epoch": 1791} {"train_loss": -6.2664337158203125, "global_step": 75233, "epoch": 1791} {"train_loss": -6.058784484863281, "global_step": 75234, "epoch": 1791} {"train_loss": -6.060959339141846, "global_step": 75235, "epoch": 1791} {"train_loss": -6.067831993103027, "global_step": 75236, "epoch": 1791} {"train_loss": -5.861104965209961, "global_step": 75237, "epoch": 1791} {"train_loss": -6.020992279052734, "global_step": 75238, "epoch": 1791} {"train_loss": -6.152369499206543, "global_step": 75239, "epoch": 1791} {"train_loss": -6.016339302062988, "global_step": 75240, "epoch": 1791} {"train_loss": -6.116961479187012, "global_step": 75241, "epoch": 1791} {"train_loss": -6.1372480392456055, "global_step": 75242, "epoch": 1791} {"train_loss": -6.024301052093506, "global_step": 75243, "epoch": 1791} {"train_loss": -6.097224235534668, "global_step": 75244, "epoch": 1791} {"train_loss": -6.088351726531982, "global_step": 75245, "epoch": 1791} {"train_loss": -6.042971611022949, "global_step": 75246, "epoch": 1791} {"train_loss": -5.977270126342773, "global_step": 75247, "epoch": 1791} {"train_loss": -6.117136001586914, "global_step": 75248, "epoch": 1791} {"train_loss": -5.928945541381836, "global_step": 75249, "epoch": 1791} {"train_loss": -5.9459943771362305, "global_step": 75250, "epoch": 1791} {"train_loss": -6.067208290100098, "global_step": 75251, "epoch": 1791} {"train_loss": -5.905425548553467, "global_step": 75252, "epoch": 1791} {"train_loss": -6.073015213012695, "global_step": 75253, "epoch": 1791} {"train_loss": -5.922194004058838, "global_step": 75254, "epoch": 1791} {"train_loss": -6.030935287475586, "global_step": 75255, "epoch": 1791} {"train_loss": -5.881221771240234, "global_step": 75256, "epoch": 1791} {"train_loss": -5.955471038818359, "global_step": 75257, "epoch": 1791} {"train_loss": -6.155585289001465, "global_step": 75258, "epoch": 1791} {"train_loss": -6.040252685546875, "global_step": 75259, "epoch": 1791} {"train_loss": -6.0404510498046875, "global_step": 75260, "epoch": 1791} {"train_loss": -5.901003837585449, "global_step": 75261, "epoch": 1791} {"train_loss": -6.107748985290527, "global_step": 75262, "epoch": 1791} {"train_loss": -6.044619072051275, "global_step": 75263, "epoch": 1791, "val_loss": 67502.4921875} {"train_loss": -5.959442615509033, "global_step": 75264, "epoch": 1792} {"train_loss": -6.025149345397949, "global_step": 75265, "epoch": 1792} {"train_loss": -6.137782096862793, "global_step": 75266, "epoch": 1792} {"train_loss": -6.045673847198486, "global_step": 75267, "epoch": 1792} {"train_loss": -6.050201416015625, "global_step": 75268, "epoch": 1792} {"train_loss": -6.155918121337891, "global_step": 75269, "epoch": 1792} {"train_loss": -6.192892551422119, "global_step": 75270, "epoch": 1792} {"train_loss": -5.9261908531188965, "global_step": 75271, "epoch": 1792} {"train_loss": -6.097736835479736, "global_step": 75272, "epoch": 1792} {"train_loss": -6.159970283508301, "global_step": 75273, "epoch": 1792} {"train_loss": -6.175463676452637, "global_step": 75274, "epoch": 1792} {"train_loss": -6.123579025268555, "global_step": 75275, "epoch": 1792} {"train_loss": -6.193833351135254, "global_step": 75276, "epoch": 1792} {"train_loss": -6.147294521331787, "global_step": 75277, "epoch": 1792} {"train_loss": -6.105254173278809, "global_step": 75278, "epoch": 1792} {"train_loss": -6.010603904724121, "global_step": 75279, "epoch": 1792} {"train_loss": -5.996478080749512, "global_step": 75280, "epoch": 1792} {"train_loss": -6.103397369384766, "global_step": 75281, "epoch": 1792} {"train_loss": -6.139518737792969, "global_step": 75282, "epoch": 1792} {"train_loss": -6.2450761795043945, "global_step": 75283, "epoch": 1792} {"train_loss": -6.052633285522461, "global_step": 75284, "epoch": 1792} {"train_loss": -6.099656581878662, "global_step": 75285, "epoch": 1792} {"train_loss": -6.126219749450684, "global_step": 75286, "epoch": 1792} {"train_loss": -6.001310348510742, "global_step": 75287, "epoch": 1792} {"train_loss": -6.125693321228027, "global_step": 75288, "epoch": 1792} {"train_loss": -6.129937648773193, "global_step": 75289, "epoch": 1792} {"train_loss": -6.087347984313965, "global_step": 75290, "epoch": 1792} {"train_loss": -6.151793479919434, "global_step": 75291, "epoch": 1792} {"train_loss": -6.0184526443481445, "global_step": 75292, "epoch": 1792} {"train_loss": -5.978796005249023, "global_step": 75293, "epoch": 1792} {"train_loss": -6.024333477020264, "global_step": 75294, "epoch": 1792} {"train_loss": -6.116154670715332, "global_step": 75295, "epoch": 1792} {"train_loss": -6.103753089904785, "global_step": 75296, "epoch": 1792} {"train_loss": -6.130889415740967, "global_step": 75297, "epoch": 1792} {"train_loss": -5.979381084442139, "global_step": 75298, "epoch": 1792} {"train_loss": -6.131976127624512, "global_step": 75299, "epoch": 1792} {"train_loss": -6.054986476898193, "global_step": 75300, "epoch": 1792} {"train_loss": -6.022863864898682, "global_step": 75301, "epoch": 1792} {"train_loss": -6.082884311676025, "global_step": 75302, "epoch": 1792} {"train_loss": -5.978489875793457, "global_step": 75303, "epoch": 1792} {"train_loss": -6.100896835327148, "global_step": 75304, "epoch": 1792} {"train_loss": -6.085207473664057, "global_step": 75305, "epoch": 1792, "val_loss": 67479.265625} {"train_loss": -6.016294479370117, "global_step": 75306, "epoch": 1793} {"train_loss": -6.095515251159668, "global_step": 75307, "epoch": 1793} {"train_loss": -6.054751873016357, "global_step": 75308, "epoch": 1793} {"train_loss": -5.993303298950195, "global_step": 75309, "epoch": 1793} {"train_loss": -6.129049301147461, "global_step": 75310, "epoch": 1793} {"train_loss": -6.080788612365723, "global_step": 75311, "epoch": 1793} {"train_loss": -6.140406608581543, "global_step": 75312, "epoch": 1793} {"train_loss": -6.031739234924316, "global_step": 75313, "epoch": 1793} {"train_loss": -6.070176124572754, "global_step": 75314, "epoch": 1793} {"train_loss": -6.117344856262207, "global_step": 75315, "epoch": 1793} {"train_loss": -6.021995544433594, "global_step": 75316, "epoch": 1793} {"train_loss": -6.060635566711426, "global_step": 75317, "epoch": 1793} {"train_loss": -6.136830806732178, "global_step": 75318, "epoch": 1793} {"train_loss": -6.02494478225708, "global_step": 75319, "epoch": 1793} {"train_loss": -6.120612621307373, "global_step": 75320, "epoch": 1793} {"train_loss": -6.018488883972168, "global_step": 75321, "epoch": 1793} {"train_loss": -6.229477882385254, "global_step": 75322, "epoch": 1793} {"train_loss": -6.111597537994385, "global_step": 75323, "epoch": 1793} {"train_loss": -6.21299934387207, "global_step": 75324, "epoch": 1793} {"train_loss": -6.028068542480469, "global_step": 75325, "epoch": 1793} {"train_loss": -6.038812160491943, "global_step": 75326, "epoch": 1793} {"train_loss": -6.040615558624268, "global_step": 75327, "epoch": 1793} {"train_loss": -6.094426155090332, "global_step": 75328, "epoch": 1793} {"train_loss": -6.12324857711792, "global_step": 75329, "epoch": 1793} {"train_loss": -6.1432366371154785, "global_step": 75330, "epoch": 1793} {"train_loss": -6.098552703857422, "global_step": 75331, "epoch": 1793} {"train_loss": -5.975294589996338, "global_step": 75332, "epoch": 1793} {"train_loss": -6.107753753662109, "global_step": 75333, "epoch": 1793} {"train_loss": -6.012991428375244, "global_step": 75334, "epoch": 1793} {"train_loss": -6.09178352355957, "global_step": 75335, "epoch": 1793} {"train_loss": -6.059780597686768, "global_step": 75336, "epoch": 1793} {"train_loss": -6.163323879241943, "global_step": 75337, "epoch": 1793} {"train_loss": -6.133113861083984, "global_step": 75338, "epoch": 1793} {"train_loss": -6.02002477645874, "global_step": 75339, "epoch": 1793} {"train_loss": -6.067195415496826, "global_step": 75340, "epoch": 1793} {"train_loss": -6.056431293487549, "global_step": 75341, "epoch": 1793} {"train_loss": -6.011520862579346, "global_step": 75342, "epoch": 1793} {"train_loss": -6.0334153175354, "global_step": 75343, "epoch": 1793} {"train_loss": -6.108883857727051, "global_step": 75344, "epoch": 1793} {"train_loss": -6.079279899597168, "global_step": 75345, "epoch": 1793} {"train_loss": -6.1446685791015625, "global_step": 75346, "epoch": 1793} {"train_loss": -6.078590222767422, "global_step": 75347, "epoch": 1793, "val_loss": 67530.8515625} {"train_loss": -6.192084789276123, "global_step": 75348, "epoch": 1794} {"train_loss": -6.1500749588012695, "global_step": 75349, "epoch": 1794} {"train_loss": -6.130062580108643, "global_step": 75350, "epoch": 1794} {"train_loss": -6.042250156402588, "global_step": 75351, "epoch": 1794} {"train_loss": -6.006473064422607, "global_step": 75352, "epoch": 1794} {"train_loss": -6.045932769775391, "global_step": 75353, "epoch": 1794} {"train_loss": -6.194511413574219, "global_step": 75354, "epoch": 1794} {"train_loss": -6.150948524475098, "global_step": 75355, "epoch": 1794} {"train_loss": -6.141676425933838, "global_step": 75356, "epoch": 1794} {"train_loss": -6.044633388519287, "global_step": 75357, "epoch": 1794} {"train_loss": -6.006851673126221, "global_step": 75358, "epoch": 1794} {"train_loss": -6.081467628479004, "global_step": 75359, "epoch": 1794} {"train_loss": -6.041310787200928, "global_step": 75360, "epoch": 1794} {"train_loss": -5.992770671844482, "global_step": 75361, "epoch": 1794} {"train_loss": -6.1317033767700195, "global_step": 75362, "epoch": 1794} {"train_loss": -5.975470066070557, "global_step": 75363, "epoch": 1794} {"train_loss": -6.0862627029418945, "global_step": 75364, "epoch": 1794} {"train_loss": -6.113441467285156, "global_step": 75365, "epoch": 1794} {"train_loss": -6.11238956451416, "global_step": 75366, "epoch": 1794} {"train_loss": -5.98729133605957, "global_step": 75367, "epoch": 1794} {"train_loss": -6.055618762969971, "global_step": 75368, "epoch": 1794} {"train_loss": -6.156892776489258, "global_step": 75369, "epoch": 1794} {"train_loss": -6.111053466796875, "global_step": 75370, "epoch": 1794} {"train_loss": -5.980606555938721, "global_step": 75371, "epoch": 1794} {"train_loss": -6.014692306518555, "global_step": 75372, "epoch": 1794} {"train_loss": -6.1456146240234375, "global_step": 75373, "epoch": 1794} {"train_loss": -6.106271743774414, "global_step": 75374, "epoch": 1794} {"train_loss": -6.0090789794921875, "global_step": 75375, "epoch": 1794} {"train_loss": -5.947951316833496, "global_step": 75376, "epoch": 1794} {"train_loss": -6.159646987915039, "global_step": 75377, "epoch": 1794} {"train_loss": -6.1238112449646, "global_step": 75378, "epoch": 1794} {"train_loss": -5.954565525054932, "global_step": 75379, "epoch": 1794} {"train_loss": -6.186043739318848, "global_step": 75380, "epoch": 1794} {"train_loss": -6.1646013259887695, "global_step": 75381, "epoch": 1794} {"train_loss": -6.0944294929504395, "global_step": 75382, "epoch": 1794} {"train_loss": -6.036081314086914, "global_step": 75383, "epoch": 1794} {"train_loss": -6.075268745422363, "global_step": 75384, "epoch": 1794} {"train_loss": -5.969664573669434, "global_step": 75385, "epoch": 1794} {"train_loss": -6.068072319030762, "global_step": 75386, "epoch": 1794} {"train_loss": -5.999906539916992, "global_step": 75387, "epoch": 1794} {"train_loss": -6.002266883850098, "global_step": 75388, "epoch": 1794} {"train_loss": -6.071130321139381, "global_step": 75389, "epoch": 1794, "val_loss": 67424.8046875} {"train_loss": -6.086928367614746, "global_step": 75390, "epoch": 1795} {"train_loss": -5.959694862365723, "global_step": 75391, "epoch": 1795} {"train_loss": -6.229031562805176, "global_step": 75392, "epoch": 1795} {"train_loss": -6.107541561126709, "global_step": 75393, "epoch": 1795} {"train_loss": -6.086695671081543, "global_step": 75394, "epoch": 1795} {"train_loss": -6.179470539093018, "global_step": 75395, "epoch": 1795} {"train_loss": -6.110822677612305, "global_step": 75396, "epoch": 1795} {"train_loss": -6.004376411437988, "global_step": 75397, "epoch": 1795} {"train_loss": -6.162040710449219, "global_step": 75398, "epoch": 1795} {"train_loss": -6.043496608734131, "global_step": 75399, "epoch": 1795} {"train_loss": -5.96004581451416, "global_step": 75400, "epoch": 1795} {"train_loss": -6.109139919281006, "global_step": 75401, "epoch": 1795} {"train_loss": -5.996538162231445, "global_step": 75402, "epoch": 1795} {"train_loss": -5.933988571166992, "global_step": 75403, "epoch": 1795} {"train_loss": -6.1185455322265625, "global_step": 75404, "epoch": 1795} {"train_loss": -6.03680419921875, "global_step": 75405, "epoch": 1795} {"train_loss": -5.980906009674072, "global_step": 75406, "epoch": 1795} {"train_loss": -6.0380730628967285, "global_step": 75407, "epoch": 1795} {"train_loss": -6.069929122924805, "global_step": 75408, "epoch": 1795} {"train_loss": -6.081618309020996, "global_step": 75409, "epoch": 1795} {"train_loss": -6.02125358581543, "global_step": 75410, "epoch": 1795} {"train_loss": -6.068406105041504, "global_step": 75411, "epoch": 1795} {"train_loss": -6.0149335861206055, "global_step": 75412, "epoch": 1795} {"train_loss": -6.046964645385742, "global_step": 75413, "epoch": 1795} {"train_loss": -6.01535701751709, "global_step": 75414, "epoch": 1795} {"train_loss": -6.1064453125, "global_step": 75415, "epoch": 1795} {"train_loss": -6.164892196655273, "global_step": 75416, "epoch": 1795} {"train_loss": -5.978368759155273, "global_step": 75417, "epoch": 1795} {"train_loss": -6.233441352844238, "global_step": 75418, "epoch": 1795} {"train_loss": -5.981627941131592, "global_step": 75419, "epoch": 1795} {"train_loss": -6.024716854095459, "global_step": 75420, "epoch": 1795} {"train_loss": -5.979184150695801, "global_step": 75421, "epoch": 1795} {"train_loss": -6.083076477050781, "global_step": 75422, "epoch": 1795} {"train_loss": -6.010342597961426, "global_step": 75423, "epoch": 1795} {"train_loss": -5.960926532745361, "global_step": 75424, "epoch": 1795} {"train_loss": -6.163182258605957, "global_step": 75425, "epoch": 1795} {"train_loss": -6.0561676025390625, "global_step": 75426, "epoch": 1795} {"train_loss": -6.124034404754639, "global_step": 75427, "epoch": 1795} {"train_loss": -6.0820722579956055, "global_step": 75428, "epoch": 1795} {"train_loss": -5.870429039001465, "global_step": 75429, "epoch": 1795} {"train_loss": -6.147304534912109, "global_step": 75430, "epoch": 1795} {"train_loss": -6.057791607720511, "global_step": 75431, "epoch": 1795, "val_loss": 67611.484375} {"train_loss": -6.187469005584717, "global_step": 75432, "epoch": 1796} {"train_loss": -5.9796977043151855, "global_step": 75433, "epoch": 1796} {"train_loss": -5.951088905334473, "global_step": 75434, "epoch": 1796} {"train_loss": -6.161342620849609, "global_step": 75435, "epoch": 1796} {"train_loss": -6.112306118011475, "global_step": 75436, "epoch": 1796} {"train_loss": -6.1185126304626465, "global_step": 75437, "epoch": 1796} {"train_loss": -6.074180603027344, "global_step": 75438, "epoch": 1796} {"train_loss": -6.023771286010742, "global_step": 75439, "epoch": 1796} {"train_loss": -5.950162887573242, "global_step": 75440, "epoch": 1796} {"train_loss": -6.170058250427246, "global_step": 75441, "epoch": 1796} {"train_loss": -6.088464736938477, "global_step": 75442, "epoch": 1796} {"train_loss": -6.133267879486084, "global_step": 75443, "epoch": 1796} {"train_loss": -6.20172119140625, "global_step": 75444, "epoch": 1796} {"train_loss": -6.065250396728516, "global_step": 75445, "epoch": 1796} {"train_loss": -5.983680725097656, "global_step": 75446, "epoch": 1796} {"train_loss": -6.145802021026611, "global_step": 75447, "epoch": 1796} {"train_loss": -6.091012001037598, "global_step": 75448, "epoch": 1796} {"train_loss": -6.07142448425293, "global_step": 75449, "epoch": 1796} {"train_loss": -6.159196853637695, "global_step": 75450, "epoch": 1796} {"train_loss": -6.103043079376221, "global_step": 75451, "epoch": 1796} {"train_loss": -6.176306247711182, "global_step": 75452, "epoch": 1796} {"train_loss": -6.117100715637207, "global_step": 75453, "epoch": 1796} {"train_loss": -6.135727882385254, "global_step": 75454, "epoch": 1796} {"train_loss": -6.136993408203125, "global_step": 75455, "epoch": 1796} {"train_loss": -5.953171730041504, "global_step": 75456, "epoch": 1796} {"train_loss": -6.066333770751953, "global_step": 75457, "epoch": 1796} {"train_loss": -5.986193656921387, "global_step": 75458, "epoch": 1796} {"train_loss": -6.131110191345215, "global_step": 75459, "epoch": 1796} {"train_loss": -5.960810661315918, "global_step": 75460, "epoch": 1796} {"train_loss": -6.213870048522949, "global_step": 75461, "epoch": 1796} {"train_loss": -6.043370246887207, "global_step": 75462, "epoch": 1796} {"train_loss": -6.15248966217041, "global_step": 75463, "epoch": 1796} {"train_loss": -6.200686454772949, "global_step": 75464, "epoch": 1796} {"train_loss": -6.08206033706665, "global_step": 75465, "epoch": 1796} {"train_loss": -6.045083999633789, "global_step": 75466, "epoch": 1796} {"train_loss": -5.99400520324707, "global_step": 75467, "epoch": 1796} {"train_loss": -6.236309051513672, "global_step": 75468, "epoch": 1796} {"train_loss": -6.1305437088012695, "global_step": 75469, "epoch": 1796} {"train_loss": -6.066537857055664, "global_step": 75470, "epoch": 1796} {"train_loss": -6.038273334503174, "global_step": 75471, "epoch": 1796} {"train_loss": -6.090719223022461, "global_step": 75472, "epoch": 1796} {"train_loss": -6.092329513458979, "global_step": 75473, "epoch": 1796, "val_loss": 67518.765625} {"train_loss": -6.017821311950684, "global_step": 75474, "epoch": 1797} {"train_loss": -6.065726280212402, "global_step": 75475, "epoch": 1797} {"train_loss": -6.0833868980407715, "global_step": 75476, "epoch": 1797} {"train_loss": -6.067288875579834, "global_step": 75477, "epoch": 1797} {"train_loss": -6.125168800354004, "global_step": 75478, "epoch": 1797} {"train_loss": -6.106894493103027, "global_step": 75479, "epoch": 1797} {"train_loss": -6.069460391998291, "global_step": 75480, "epoch": 1797} {"train_loss": -5.9993391036987305, "global_step": 75481, "epoch": 1797} {"train_loss": -6.035839080810547, "global_step": 75482, "epoch": 1797} {"train_loss": -6.016732215881348, "global_step": 75483, "epoch": 1797} {"train_loss": -6.173806190490723, "global_step": 75484, "epoch": 1797} {"train_loss": -6.10359001159668, "global_step": 75485, "epoch": 1797} {"train_loss": -6.089892387390137, "global_step": 75486, "epoch": 1797} {"train_loss": -6.095849990844727, "global_step": 75487, "epoch": 1797} {"train_loss": -6.139743804931641, "global_step": 75488, "epoch": 1797} {"train_loss": -6.103041648864746, "global_step": 75489, "epoch": 1797} {"train_loss": -6.033866882324219, "global_step": 75490, "epoch": 1797} {"train_loss": -6.022171974182129, "global_step": 75491, "epoch": 1797} {"train_loss": -6.00652551651001, "global_step": 75492, "epoch": 1797} {"train_loss": -6.062965393066406, "global_step": 75493, "epoch": 1797} {"train_loss": -6.155646324157715, "global_step": 75494, "epoch": 1797} {"train_loss": -6.043139457702637, "global_step": 75495, "epoch": 1797} {"train_loss": -6.076718330383301, "global_step": 75496, "epoch": 1797} {"train_loss": -6.119322299957275, "global_step": 75497, "epoch": 1797} {"train_loss": -6.0330047607421875, "global_step": 75498, "epoch": 1797} {"train_loss": -6.018073081970215, "global_step": 75499, "epoch": 1797} {"train_loss": -6.128662109375, "global_step": 75500, "epoch": 1797} {"train_loss": -6.127410888671875, "global_step": 75501, "epoch": 1797} {"train_loss": -6.0079240798950195, "global_step": 75502, "epoch": 1797} {"train_loss": -5.938138961791992, "global_step": 75503, "epoch": 1797} {"train_loss": -6.0482048988342285, "global_step": 75504, "epoch": 1797} {"train_loss": -6.094662666320801, "global_step": 75505, "epoch": 1797} {"train_loss": -6.139288425445557, "global_step": 75506, "epoch": 1797} {"train_loss": -6.056557655334473, "global_step": 75507, "epoch": 1797} {"train_loss": -5.928021430969238, "global_step": 75508, "epoch": 1797} {"train_loss": -6.0216779708862305, "global_step": 75509, "epoch": 1797} {"train_loss": -6.062588691711426, "global_step": 75510, "epoch": 1797} {"train_loss": -5.913887023925781, "global_step": 75511, "epoch": 1797} {"train_loss": -6.084868907928467, "global_step": 75512, "epoch": 1797} {"train_loss": -5.880145072937012, "global_step": 75513, "epoch": 1797} {"train_loss": -6.047877311706543, "global_step": 75514, "epoch": 1797} {"train_loss": -6.056419679096767, "global_step": 75515, "epoch": 1797, "val_loss": 67519.7265625} {"train_loss": -5.957881927490234, "global_step": 75516, "epoch": 1798} {"train_loss": -6.018597602844238, "global_step": 75517, "epoch": 1798} {"train_loss": -5.950625419616699, "global_step": 75518, "epoch": 1798} {"train_loss": -5.990779876708984, "global_step": 75519, "epoch": 1798} {"train_loss": -6.030152320861816, "global_step": 75520, "epoch": 1798} {"train_loss": -5.983006000518799, "global_step": 75521, "epoch": 1798} {"train_loss": -6.055560111999512, "global_step": 75522, "epoch": 1798} {"train_loss": -5.967323303222656, "global_step": 75523, "epoch": 1798} {"train_loss": -5.955456733703613, "global_step": 75524, "epoch": 1798} {"train_loss": -5.9993133544921875, "global_step": 75525, "epoch": 1798} {"train_loss": -5.935340404510498, "global_step": 75526, "epoch": 1798} {"train_loss": -5.995120048522949, "global_step": 75527, "epoch": 1798} {"train_loss": -6.010703086853027, "global_step": 75528, "epoch": 1798} {"train_loss": -6.026397705078125, "global_step": 75529, "epoch": 1798} {"train_loss": -5.984584808349609, "global_step": 75530, "epoch": 1798} {"train_loss": -6.0366926193237305, "global_step": 75531, "epoch": 1798} {"train_loss": -5.975393295288086, "global_step": 75532, "epoch": 1798} {"train_loss": -6.0007710456848145, "global_step": 75533, "epoch": 1798} {"train_loss": -6.026213645935059, "global_step": 75534, "epoch": 1798} {"train_loss": -6.1041693687438965, "global_step": 75535, "epoch": 1798} {"train_loss": -6.0985612869262695, "global_step": 75536, "epoch": 1798} {"train_loss": -6.16916561126709, "global_step": 75537, "epoch": 1798} {"train_loss": -6.001928329467773, "global_step": 75538, "epoch": 1798} {"train_loss": -6.045627593994141, "global_step": 75539, "epoch": 1798} {"train_loss": -5.969433307647705, "global_step": 75540, "epoch": 1798} {"train_loss": -6.24395227432251, "global_step": 75541, "epoch": 1798} {"train_loss": -6.100530624389648, "global_step": 75542, "epoch": 1798} {"train_loss": -6.210248947143555, "global_step": 75543, "epoch": 1798} {"train_loss": -6.161439418792725, "global_step": 75544, "epoch": 1798} {"train_loss": -6.044585227966309, "global_step": 75545, "epoch": 1798} {"train_loss": -6.015409469604492, "global_step": 75546, "epoch": 1798} {"train_loss": -6.079255104064941, "global_step": 75547, "epoch": 1798} {"train_loss": -6.154263973236084, "global_step": 75548, "epoch": 1798} {"train_loss": -6.090243816375732, "global_step": 75549, "epoch": 1798} {"train_loss": -6.008244037628174, "global_step": 75550, "epoch": 1798} {"train_loss": -6.093921184539795, "global_step": 75551, "epoch": 1798} {"train_loss": -6.009375095367432, "global_step": 75552, "epoch": 1798} {"train_loss": -6.013160705566406, "global_step": 75553, "epoch": 1798} {"train_loss": -6.102463722229004, "global_step": 75554, "epoch": 1798} {"train_loss": -5.997239589691162, "global_step": 75555, "epoch": 1798} {"train_loss": -6.084042549133301, "global_step": 75556, "epoch": 1798} {"train_loss": -6.0436522506532215, "global_step": 75557, "epoch": 1798, "val_loss": 67933.8984375} {"train_loss": -5.903669357299805, "global_step": 75558, "epoch": 1799} {"train_loss": -5.9560465812683105, "global_step": 75559, "epoch": 1799} {"train_loss": -5.979180335998535, "global_step": 75560, "epoch": 1799} {"train_loss": -6.012777328491211, "global_step": 75561, "epoch": 1799} {"train_loss": -6.0416178703308105, "global_step": 75562, "epoch": 1799} {"train_loss": -5.916249752044678, "global_step": 75563, "epoch": 1799} {"train_loss": -6.04271125793457, "global_step": 75564, "epoch": 1799} {"train_loss": -6.185897350311279, "global_step": 75565, "epoch": 1799} {"train_loss": -5.973055362701416, "global_step": 75566, "epoch": 1799} {"train_loss": -6.086058616638184, "global_step": 75567, "epoch": 1799} {"train_loss": -6.022117614746094, "global_step": 75568, "epoch": 1799} {"train_loss": -6.020571708679199, "global_step": 75569, "epoch": 1799} {"train_loss": -5.981316089630127, "global_step": 75570, "epoch": 1799} {"train_loss": -5.933257102966309, "global_step": 75571, "epoch": 1799} {"train_loss": -5.944631099700928, "global_step": 75572, "epoch": 1799} {"train_loss": -6.062678813934326, "global_step": 75573, "epoch": 1799} {"train_loss": -6.071935653686523, "global_step": 75574, "epoch": 1799} {"train_loss": -6.077327728271484, "global_step": 75575, "epoch": 1799} {"train_loss": -5.949763298034668, "global_step": 75576, "epoch": 1799} {"train_loss": -6.052727699279785, "global_step": 75577, "epoch": 1799} {"train_loss": -5.986029624938965, "global_step": 75578, "epoch": 1799} {"train_loss": -5.964680194854736, "global_step": 75579, "epoch": 1799} {"train_loss": -6.123443603515625, "global_step": 75580, "epoch": 1799} {"train_loss": -6.0998125076293945, "global_step": 75581, "epoch": 1799} {"train_loss": -5.912201404571533, "global_step": 75582, "epoch": 1799} {"train_loss": -6.054123878479004, "global_step": 75583, "epoch": 1799} {"train_loss": -6.096759796142578, "global_step": 75584, "epoch": 1799} {"train_loss": -6.0503339767456055, "global_step": 75585, "epoch": 1799} {"train_loss": -6.190990447998047, "global_step": 75586, "epoch": 1799} {"train_loss": -5.886226654052734, "global_step": 75587, "epoch": 1799} {"train_loss": -5.992938995361328, "global_step": 75588, "epoch": 1799} {"train_loss": -6.183803558349609, "global_step": 75589, "epoch": 1799} {"train_loss": -5.962374687194824, "global_step": 75590, "epoch": 1799} {"train_loss": -6.02519416809082, "global_step": 75591, "epoch": 1799} {"train_loss": -6.1827545166015625, "global_step": 75592, "epoch": 1799} {"train_loss": -6.013813018798828, "global_step": 75593, "epoch": 1799} {"train_loss": -6.031084060668945, "global_step": 75594, "epoch": 1799} {"train_loss": -6.057917594909668, "global_step": 75595, "epoch": 1799} {"train_loss": -5.972735404968262, "global_step": 75596, "epoch": 1799} {"train_loss": -5.982602119445801, "global_step": 75597, "epoch": 1799} {"train_loss": -6.029283046722412, "global_step": 75598, "epoch": 1799} {"train_loss": -6.025450706481934, "global_step": 75599, "epoch": 1799, "val_loss": 67659.2734375} {"train_loss": -5.981145858764648, "global_step": 75600, "epoch": 1800} {"train_loss": -6.085249900817871, "global_step": 75601, "epoch": 1800} {"train_loss": -5.9882659912109375, "global_step": 75602, "epoch": 1800} {"train_loss": -6.087627410888672, "global_step": 75603, "epoch": 1800} {"train_loss": -6.244696140289307, "global_step": 75604, "epoch": 1800} {"train_loss": -6.0263872146606445, "global_step": 75605, "epoch": 1800} {"train_loss": -6.109783172607422, "global_step": 75606, "epoch": 1800} {"train_loss": -6.018461227416992, "global_step": 75607, "epoch": 1800} {"train_loss": -5.971963882446289, "global_step": 75608, "epoch": 1800} {"train_loss": -6.023200035095215, "global_step": 75609, "epoch": 1800} {"train_loss": -6.027961254119873, "global_step": 75610, "epoch": 1800} {"train_loss": -6.128084659576416, "global_step": 75611, "epoch": 1800} {"train_loss": -5.947671890258789, "global_step": 75612, "epoch": 1800} {"train_loss": -6.041721820831299, "global_step": 75613, "epoch": 1800} {"train_loss": -5.983950138092041, "global_step": 75614, "epoch": 1800} {"train_loss": -5.887346267700195, "global_step": 75615, "epoch": 1800} {"train_loss": -5.991076469421387, "global_step": 75616, "epoch": 1800} {"train_loss": -5.974708557128906, "global_step": 75617, "epoch": 1800} {"train_loss": -6.008090019226074, "global_step": 75618, "epoch": 1800} {"train_loss": -6.044612407684326, "global_step": 75619, "epoch": 1800} {"train_loss": -6.097782611846924, "global_step": 75620, "epoch": 1800} {"train_loss": -6.006159782409668, "global_step": 75621, "epoch": 1800} {"train_loss": -6.132728576660156, "global_step": 75622, "epoch": 1800} {"train_loss": -6.155318737030029, "global_step": 75623, "epoch": 1800} {"train_loss": -6.096295356750488, "global_step": 75624, "epoch": 1800} {"train_loss": -6.186422348022461, "global_step": 75625, "epoch": 1800} {"train_loss": -6.127871513366699, "global_step": 75626, "epoch": 1800} {"train_loss": -6.191313743591309, "global_step": 75627, "epoch": 1800} {"train_loss": -6.016141891479492, "global_step": 75628, "epoch": 1800} {"train_loss": -6.026974678039551, "global_step": 75629, "epoch": 1800} {"train_loss": -6.079252243041992, "global_step": 75630, "epoch": 1800} {"train_loss": -6.064266204833984, "global_step": 75631, "epoch": 1800} {"train_loss": -6.017197608947754, "global_step": 75632, "epoch": 1800} {"train_loss": -6.036105155944824, "global_step": 75633, "epoch": 1800} {"train_loss": -6.08742618560791, "global_step": 75634, "epoch": 1800} {"train_loss": -6.069204330444336, "global_step": 75635, "epoch": 1800} {"train_loss": -6.045575141906738, "global_step": 75636, "epoch": 1800} {"train_loss": -6.075258255004883, "global_step": 75637, "epoch": 1800} {"train_loss": -5.992430686950684, "global_step": 75638, "epoch": 1800} {"train_loss": -6.229270935058594, "global_step": 75639, "epoch": 1800} {"train_loss": -6.1510443687438965, "global_step": 75640, "epoch": 1800} {"train_loss": -6.061496325901577, "global_step": 75641, "epoch": 1800, "train/sim_max_reward_0": 0.21760432978491462, "train/sim_max_reward_1": 0.5137031196580011, "train/sim_max_reward_2": 0.3790785197408054, "train/sim_max_reward_3": 0.13440839352193937, "train/sim_max_reward_4": 0.979402828599026, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.23028506798423648, "test/sim_max_reward_4400001": 0.14281658866388916, "test/sim_max_reward_4400002": 0.19067023024745317, "test/sim_max_reward_4400003": 0.7626699881013393, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9443278936034084, "test/sim_max_reward_4400007": 0.8184837769802683, "test/sim_max_reward_4400008": 0.297163391140225, "test/sim_max_reward_4400009": 0.8840672159180689, "test/sim_max_reward_4400010": 0.27909202364636204, "test/sim_max_reward_4400011": 0.33581865914979464, "test/sim_max_reward_4400012": 0.8265391516923422, "test/sim_max_reward_4400013": 0.9504265197744608, "test/sim_max_reward_4400014": 0.375959173143978, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.31769629870721827, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.05187890910052829, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9374528908735223, "test/sim_max_reward_4400023": 0.09289910529879107, "test/sim_max_reward_4400024": 0.9489788146626718, "test/sim_max_reward_4400025": 0.2163606745897131, "test/sim_max_reward_4400026": 0.6975279253743054, "test/sim_max_reward_4400027": 0.06541753450764617, "test/sim_max_reward_4400028": 0.40072245996289874, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.878427011742672, "test/sim_max_reward_4400031": 0.3800567412561597, "test/sim_max_reward_4400032": 0.17225762621450336, "test/sim_max_reward_4400033": 0.5259418872025461, "test/sim_max_reward_4400034": 0.8305855191276622, "test/sim_max_reward_4400035": 0.4899224607205993, "test/sim_max_reward_4400036": 0.3291260453721742, "test/sim_max_reward_4400037": 0.9123652467358346, "test/sim_max_reward_4400038": 0.9288238743909898, "test/sim_max_reward_4400039": 0.7308814813346435, "test/sim_max_reward_4400040": 0.15829680476615204, "test/sim_max_reward_4400041": 0.8209615283764048, "test/sim_max_reward_4400042": 0.01613257225670879, "test/sim_max_reward_4400043": 0.8483038644126577, "test/sim_max_reward_4400044": 0.7815253948216797, "test/sim_max_reward_4400045": 0.9617343480697018, "test/sim_max_reward_4400046": 0.84980502706261, "test/sim_max_reward_4400047": 0.7743410029733347, "test/sim_max_reward_4400048": 0.6314748966107232, "test/sim_max_reward_4400049": 0.6611045704977141, "train/mean_score": 0.40286365844447897, "test/mean_score": 0.48228530731102803, "val_loss": 67290.90625} {"train_loss": -6.007018089294434, "global_step": 75642, "epoch": 1801} {"train_loss": -6.1561174392700195, "global_step": 75643, "epoch": 1801} {"train_loss": -6.116385459899902, "global_step": 75644, "epoch": 1801} {"train_loss": -5.989619255065918, "global_step": 75645, "epoch": 1801} {"train_loss": -6.1274943351745605, "global_step": 75646, "epoch": 1801} {"train_loss": -6.168935775756836, "global_step": 75647, "epoch": 1801} {"train_loss": -6.08915901184082, "global_step": 75648, "epoch": 1801} {"train_loss": -6.060906410217285, "global_step": 75649, "epoch": 1801} {"train_loss": -5.994530200958252, "global_step": 75650, "epoch": 1801} {"train_loss": -6.122871398925781, "global_step": 75651, "epoch": 1801} {"train_loss": -6.091336250305176, "global_step": 75652, "epoch": 1801} {"train_loss": -6.093036651611328, "global_step": 75653, "epoch": 1801} {"train_loss": -6.085670471191406, "global_step": 75654, "epoch": 1801} {"train_loss": -6.1799821853637695, "global_step": 75655, "epoch": 1801} {"train_loss": -6.146350860595703, "global_step": 75656, "epoch": 1801} {"train_loss": -6.13907527923584, "global_step": 75657, "epoch": 1801} {"train_loss": -6.0616679191589355, "global_step": 75658, "epoch": 1801} {"train_loss": -6.128261566162109, "global_step": 75659, "epoch": 1801} {"train_loss": -6.1069746017456055, "global_step": 75660, "epoch": 1801} {"train_loss": -6.041192054748535, "global_step": 75661, "epoch": 1801} {"train_loss": -6.068188667297363, "global_step": 75662, "epoch": 1801} {"train_loss": -6.040564060211182, "global_step": 75663, "epoch": 1801} {"train_loss": -6.09783935546875, "global_step": 75664, "epoch": 1801} {"train_loss": -6.139036178588867, "global_step": 75665, "epoch": 1801} {"train_loss": -6.212733268737793, "global_step": 75666, "epoch": 1801} {"train_loss": -6.014416694641113, "global_step": 75667, "epoch": 1801} {"train_loss": -5.9363532066345215, "global_step": 75668, "epoch": 1801} {"train_loss": -6.12447452545166, "global_step": 75669, "epoch": 1801} {"train_loss": -6.150771617889404, "global_step": 75670, "epoch": 1801} {"train_loss": -6.188170433044434, "global_step": 75671, "epoch": 1801} {"train_loss": -6.07283878326416, "global_step": 75672, "epoch": 1801} {"train_loss": -6.094736576080322, "global_step": 75673, "epoch": 1801} {"train_loss": -6.081213474273682, "global_step": 75674, "epoch": 1801} {"train_loss": -6.077859878540039, "global_step": 75675, "epoch": 1801} {"train_loss": -6.162625312805176, "global_step": 75676, "epoch": 1801} {"train_loss": -6.097715377807617, "global_step": 75677, "epoch": 1801} {"train_loss": -6.150657653808594, "global_step": 75678, "epoch": 1801} {"train_loss": -6.010476112365723, "global_step": 75679, "epoch": 1801} {"train_loss": -6.078091621398926, "global_step": 75680, "epoch": 1801} {"train_loss": -6.103295803070068, "global_step": 75681, "epoch": 1801} {"train_loss": -6.08878755569458, "global_step": 75682, "epoch": 1801} {"train_loss": -6.09513429233006, "global_step": 75683, "epoch": 1801, "val_loss": 67397.640625} {"train_loss": -6.066195964813232, "global_step": 75684, "epoch": 1802} {"train_loss": -6.024211406707764, "global_step": 75685, "epoch": 1802} {"train_loss": -6.120784759521484, "global_step": 75686, "epoch": 1802} {"train_loss": -6.141803741455078, "global_step": 75687, "epoch": 1802} {"train_loss": -6.015690326690674, "global_step": 75688, "epoch": 1802} {"train_loss": -6.037761211395264, "global_step": 75689, "epoch": 1802} {"train_loss": -6.147570610046387, "global_step": 75690, "epoch": 1802} {"train_loss": -6.18890380859375, "global_step": 75691, "epoch": 1802} {"train_loss": -6.235970497131348, "global_step": 75692, "epoch": 1802} {"train_loss": -6.115184307098389, "global_step": 75693, "epoch": 1802} {"train_loss": -6.0925822257995605, "global_step": 75694, "epoch": 1802} {"train_loss": -6.178719997406006, "global_step": 75695, "epoch": 1802} {"train_loss": -6.0238142013549805, "global_step": 75696, "epoch": 1802} {"train_loss": -6.131687641143799, "global_step": 75697, "epoch": 1802} {"train_loss": -6.119989395141602, "global_step": 75698, "epoch": 1802} {"train_loss": -6.08319091796875, "global_step": 75699, "epoch": 1802} {"train_loss": -6.166236877441406, "global_step": 75700, "epoch": 1802} {"train_loss": -6.183096885681152, "global_step": 75701, "epoch": 1802} {"train_loss": -6.227635860443115, "global_step": 75702, "epoch": 1802} {"train_loss": -5.961950302124023, "global_step": 75703, "epoch": 1802} {"train_loss": -6.106584548950195, "global_step": 75704, "epoch": 1802} {"train_loss": -6.102275848388672, "global_step": 75705, "epoch": 1802} {"train_loss": -5.958126068115234, "global_step": 75706, "epoch": 1802} {"train_loss": -5.991707801818848, "global_step": 75707, "epoch": 1802} {"train_loss": -6.114637851715088, "global_step": 75708, "epoch": 1802} {"train_loss": -6.052412986755371, "global_step": 75709, "epoch": 1802} {"train_loss": -6.076904296875, "global_step": 75710, "epoch": 1802} {"train_loss": -6.094237804412842, "global_step": 75711, "epoch": 1802} {"train_loss": -6.000736713409424, "global_step": 75712, "epoch": 1802} {"train_loss": -6.037962913513184, "global_step": 75713, "epoch": 1802} {"train_loss": -6.0518646240234375, "global_step": 75714, "epoch": 1802} {"train_loss": -6.116969585418701, "global_step": 75715, "epoch": 1802} {"train_loss": -6.0286760330200195, "global_step": 75716, "epoch": 1802} {"train_loss": -6.08260440826416, "global_step": 75717, "epoch": 1802} {"train_loss": -6.165216445922852, "global_step": 75718, "epoch": 1802} {"train_loss": -6.08730936050415, "global_step": 75719, "epoch": 1802} {"train_loss": -6.2244720458984375, "global_step": 75720, "epoch": 1802} {"train_loss": -5.825492858886719, "global_step": 75721, "epoch": 1802} {"train_loss": -6.062360763549805, "global_step": 75722, "epoch": 1802} {"train_loss": -5.973230361938477, "global_step": 75723, "epoch": 1802} {"train_loss": -6.140780925750732, "global_step": 75724, "epoch": 1802} {"train_loss": -6.086488451276507, "global_step": 75725, "epoch": 1802, "val_loss": 67638.2265625} {"train_loss": -6.209322452545166, "global_step": 75726, "epoch": 1803} {"train_loss": -6.127486705780029, "global_step": 75727, "epoch": 1803} {"train_loss": -6.102769374847412, "global_step": 75728, "epoch": 1803} {"train_loss": -6.111440658569336, "global_step": 75729, "epoch": 1803} {"train_loss": -6.189311981201172, "global_step": 75730, "epoch": 1803} {"train_loss": -5.993858337402344, "global_step": 75731, "epoch": 1803} {"train_loss": -5.978966236114502, "global_step": 75732, "epoch": 1803} {"train_loss": -6.091035842895508, "global_step": 75733, "epoch": 1803} {"train_loss": -6.036311149597168, "global_step": 75734, "epoch": 1803} {"train_loss": -6.072727680206299, "global_step": 75735, "epoch": 1803} {"train_loss": -6.010532855987549, "global_step": 75736, "epoch": 1803} {"train_loss": -6.155736446380615, "global_step": 75737, "epoch": 1803} {"train_loss": -6.054765701293945, "global_step": 75738, "epoch": 1803} {"train_loss": -6.126130104064941, "global_step": 75739, "epoch": 1803} {"train_loss": -6.147739410400391, "global_step": 75740, "epoch": 1803} {"train_loss": -6.051891803741455, "global_step": 75741, "epoch": 1803} {"train_loss": -6.109756946563721, "global_step": 75742, "epoch": 1803} {"train_loss": -6.025556564331055, "global_step": 75743, "epoch": 1803} {"train_loss": -6.1764726638793945, "global_step": 75744, "epoch": 1803} {"train_loss": -6.074252128601074, "global_step": 75745, "epoch": 1803} {"train_loss": -6.083474159240723, "global_step": 75746, "epoch": 1803} {"train_loss": -6.06428861618042, "global_step": 75747, "epoch": 1803} {"train_loss": -6.018594741821289, "global_step": 75748, "epoch": 1803} {"train_loss": -6.122129917144775, "global_step": 75749, "epoch": 1803} {"train_loss": -6.156491279602051, "global_step": 75750, "epoch": 1803} {"train_loss": -5.919984817504883, "global_step": 75751, "epoch": 1803} {"train_loss": -5.967517852783203, "global_step": 75752, "epoch": 1803} {"train_loss": -5.998331546783447, "global_step": 75753, "epoch": 1803} {"train_loss": -5.91972017288208, "global_step": 75754, "epoch": 1803} {"train_loss": -6.162099838256836, "global_step": 75755, "epoch": 1803} {"train_loss": -6.053630828857422, "global_step": 75756, "epoch": 1803} {"train_loss": -5.995365619659424, "global_step": 75757, "epoch": 1803} {"train_loss": -6.040640830993652, "global_step": 75758, "epoch": 1803} {"train_loss": -6.040015697479248, "global_step": 75759, "epoch": 1803} {"train_loss": -6.08712100982666, "global_step": 75760, "epoch": 1803} {"train_loss": -6.1162109375, "global_step": 75761, "epoch": 1803} {"train_loss": -6.061923027038574, "global_step": 75762, "epoch": 1803} {"train_loss": -6.034420490264893, "global_step": 75763, "epoch": 1803} {"train_loss": -6.0626115798950195, "global_step": 75764, "epoch": 1803} {"train_loss": -5.97749137878418, "global_step": 75765, "epoch": 1803} {"train_loss": -5.944687366485596, "global_step": 75766, "epoch": 1803} {"train_loss": -6.0654454458327525, "global_step": 75767, "epoch": 1803, "val_loss": 67712.328125} {"train_loss": -6.188446998596191, "global_step": 75768, "epoch": 1804} {"train_loss": -6.013584136962891, "global_step": 75769, "epoch": 1804} {"train_loss": -6.059416770935059, "global_step": 75770, "epoch": 1804} {"train_loss": -6.062679290771484, "global_step": 75771, "epoch": 1804} {"train_loss": -6.098856449127197, "global_step": 75772, "epoch": 1804} {"train_loss": -6.044611930847168, "global_step": 75773, "epoch": 1804} {"train_loss": -6.22070837020874, "global_step": 75774, "epoch": 1804} {"train_loss": -5.981950283050537, "global_step": 75775, "epoch": 1804} {"train_loss": -6.044344902038574, "global_step": 75776, "epoch": 1804} {"train_loss": -6.151069641113281, "global_step": 75777, "epoch": 1804} {"train_loss": -6.0060224533081055, "global_step": 75778, "epoch": 1804} {"train_loss": -6.033243179321289, "global_step": 75779, "epoch": 1804} {"train_loss": -6.070765018463135, "global_step": 75780, "epoch": 1804} {"train_loss": -6.038303852081299, "global_step": 75781, "epoch": 1804} {"train_loss": -6.1160688400268555, "global_step": 75782, "epoch": 1804} {"train_loss": -6.035630226135254, "global_step": 75783, "epoch": 1804} {"train_loss": -6.113956928253174, "global_step": 75784, "epoch": 1804} {"train_loss": -6.0197672843933105, "global_step": 75785, "epoch": 1804} {"train_loss": -6.127077102661133, "global_step": 75786, "epoch": 1804} {"train_loss": -6.071043014526367, "global_step": 75787, "epoch": 1804} {"train_loss": -5.889200210571289, "global_step": 75788, "epoch": 1804} {"train_loss": -6.1196136474609375, "global_step": 75789, "epoch": 1804} {"train_loss": -6.068746566772461, "global_step": 75790, "epoch": 1804} {"train_loss": -6.109477996826172, "global_step": 75791, "epoch": 1804} {"train_loss": -5.991123199462891, "global_step": 75792, "epoch": 1804} {"train_loss": -5.989933967590332, "global_step": 75793, "epoch": 1804} {"train_loss": -6.043466567993164, "global_step": 75794, "epoch": 1804} {"train_loss": -5.973655700683594, "global_step": 75795, "epoch": 1804} {"train_loss": -6.015488147735596, "global_step": 75796, "epoch": 1804} {"train_loss": -6.014054298400879, "global_step": 75797, "epoch": 1804} {"train_loss": -6.118905544281006, "global_step": 75798, "epoch": 1804} {"train_loss": -6.11839485168457, "global_step": 75799, "epoch": 1804} {"train_loss": -6.1175408363342285, "global_step": 75800, "epoch": 1804} {"train_loss": -6.054906845092773, "global_step": 75801, "epoch": 1804} {"train_loss": -6.042160511016846, "global_step": 75802, "epoch": 1804} {"train_loss": -6.0813775062561035, "global_step": 75803, "epoch": 1804} {"train_loss": -6.133484840393066, "global_step": 75804, "epoch": 1804} {"train_loss": -6.114753723144531, "global_step": 75805, "epoch": 1804} {"train_loss": -6.116401672363281, "global_step": 75806, "epoch": 1804} {"train_loss": -6.074031352996826, "global_step": 75807, "epoch": 1804} {"train_loss": -6.094864845275879, "global_step": 75808, "epoch": 1804} {"train_loss": -6.0683479990277975, "global_step": 75809, "epoch": 1804, "val_loss": 67519.03125} {"train_loss": -6.097530364990234, "global_step": 75810, "epoch": 1805} {"train_loss": -6.016425609588623, "global_step": 75811, "epoch": 1805} {"train_loss": -6.050302505493164, "global_step": 75812, "epoch": 1805} {"train_loss": -5.88344144821167, "global_step": 75813, "epoch": 1805} {"train_loss": -5.967270851135254, "global_step": 75814, "epoch": 1805} {"train_loss": -6.06065034866333, "global_step": 75815, "epoch": 1805} {"train_loss": -6.1183857917785645, "global_step": 75816, "epoch": 1805} {"train_loss": -6.0369720458984375, "global_step": 75817, "epoch": 1805} {"train_loss": -6.008338928222656, "global_step": 75818, "epoch": 1805} {"train_loss": -6.01664400100708, "global_step": 75819, "epoch": 1805} {"train_loss": -6.182085037231445, "global_step": 75820, "epoch": 1805} {"train_loss": -6.166383743286133, "global_step": 75821, "epoch": 1805} {"train_loss": -5.916752338409424, "global_step": 75822, "epoch": 1805} {"train_loss": -6.041407585144043, "global_step": 75823, "epoch": 1805} {"train_loss": -6.0411834716796875, "global_step": 75824, "epoch": 1805} {"train_loss": -6.0736985206604, "global_step": 75825, "epoch": 1805} {"train_loss": -6.012678623199463, "global_step": 75826, "epoch": 1805} {"train_loss": -5.992121696472168, "global_step": 75827, "epoch": 1805} {"train_loss": -6.04050350189209, "global_step": 75828, "epoch": 1805} {"train_loss": -6.077064514160156, "global_step": 75829, "epoch": 1805} {"train_loss": -6.132446765899658, "global_step": 75830, "epoch": 1805} {"train_loss": -6.205259323120117, "global_step": 75831, "epoch": 1805} {"train_loss": -5.998106956481934, "global_step": 75832, "epoch": 1805} {"train_loss": -6.157245635986328, "global_step": 75833, "epoch": 1805} {"train_loss": -5.985511779785156, "global_step": 75834, "epoch": 1805} {"train_loss": -6.118833065032959, "global_step": 75835, "epoch": 1805} {"train_loss": -6.034785270690918, "global_step": 75836, "epoch": 1805} {"train_loss": -6.031060218811035, "global_step": 75837, "epoch": 1805} {"train_loss": -6.020786762237549, "global_step": 75838, "epoch": 1805} {"train_loss": -6.034008979797363, "global_step": 75839, "epoch": 1805} {"train_loss": -5.963266372680664, "global_step": 75840, "epoch": 1805} {"train_loss": -5.9445343017578125, "global_step": 75841, "epoch": 1805} {"train_loss": -6.191582679748535, "global_step": 75842, "epoch": 1805} {"train_loss": -6.061634063720703, "global_step": 75843, "epoch": 1805} {"train_loss": -6.108625411987305, "global_step": 75844, "epoch": 1805} {"train_loss": -6.095634937286377, "global_step": 75845, "epoch": 1805} {"train_loss": -6.132116317749023, "global_step": 75846, "epoch": 1805} {"train_loss": -6.181014060974121, "global_step": 75847, "epoch": 1805} {"train_loss": -5.99085807800293, "global_step": 75848, "epoch": 1805} {"train_loss": -6.219019412994385, "global_step": 75849, "epoch": 1805} {"train_loss": -6.084971904754639, "global_step": 75850, "epoch": 1805} {"train_loss": -6.059539783568609, "global_step": 75851, "epoch": 1805, "val_loss": 67321.2578125} {"train_loss": -6.092836380004883, "global_step": 75852, "epoch": 1806} {"train_loss": -6.106916427612305, "global_step": 75853, "epoch": 1806} {"train_loss": -6.027347087860107, "global_step": 75854, "epoch": 1806} {"train_loss": -6.068479537963867, "global_step": 75855, "epoch": 1806} {"train_loss": -6.082542896270752, "global_step": 75856, "epoch": 1806} {"train_loss": -6.169123649597168, "global_step": 75857, "epoch": 1806} {"train_loss": -6.133720874786377, "global_step": 75858, "epoch": 1806} {"train_loss": -6.1192169189453125, "global_step": 75859, "epoch": 1806} {"train_loss": -5.976202011108398, "global_step": 75860, "epoch": 1806} {"train_loss": -5.974421977996826, "global_step": 75861, "epoch": 1806} {"train_loss": -6.075488567352295, "global_step": 75862, "epoch": 1806} {"train_loss": -6.097231864929199, "global_step": 75863, "epoch": 1806} {"train_loss": -6.126435279846191, "global_step": 75864, "epoch": 1806} {"train_loss": -6.054222583770752, "global_step": 75865, "epoch": 1806} {"train_loss": -6.173235893249512, "global_step": 75866, "epoch": 1806} {"train_loss": -6.123038291931152, "global_step": 75867, "epoch": 1806} {"train_loss": -6.075527191162109, "global_step": 75868, "epoch": 1806} {"train_loss": -6.08463191986084, "global_step": 75869, "epoch": 1806} {"train_loss": -6.054305553436279, "global_step": 75870, "epoch": 1806} {"train_loss": -6.151938438415527, "global_step": 75871, "epoch": 1806} {"train_loss": -6.105337142944336, "global_step": 75872, "epoch": 1806} {"train_loss": -6.082775115966797, "global_step": 75873, "epoch": 1806} {"train_loss": -6.113020896911621, "global_step": 75874, "epoch": 1806} {"train_loss": -6.009360313415527, "global_step": 75875, "epoch": 1806} {"train_loss": -6.0650835037231445, "global_step": 75876, "epoch": 1806} {"train_loss": -6.025393486022949, "global_step": 75877, "epoch": 1806} {"train_loss": -6.175124168395996, "global_step": 75878, "epoch": 1806} {"train_loss": -5.9612908363342285, "global_step": 75879, "epoch": 1806} {"train_loss": -6.162336349487305, "global_step": 75880, "epoch": 1806} {"train_loss": -6.098694324493408, "global_step": 75881, "epoch": 1806} {"train_loss": -5.972397804260254, "global_step": 75882, "epoch": 1806} {"train_loss": -6.026608943939209, "global_step": 75883, "epoch": 1806} {"train_loss": -6.076604843139648, "global_step": 75884, "epoch": 1806} {"train_loss": -5.996481418609619, "global_step": 75885, "epoch": 1806} {"train_loss": -6.217896938323975, "global_step": 75886, "epoch": 1806} {"train_loss": -6.072012901306152, "global_step": 75887, "epoch": 1806} {"train_loss": -6.116799831390381, "global_step": 75888, "epoch": 1806} {"train_loss": -6.065101623535156, "global_step": 75889, "epoch": 1806} {"train_loss": -5.91536283493042, "global_step": 75890, "epoch": 1806} {"train_loss": -6.046375274658203, "global_step": 75891, "epoch": 1806} {"train_loss": -6.013872146606445, "global_step": 75892, "epoch": 1806} {"train_loss": -6.07526547568185, "global_step": 75893, "epoch": 1806, "val_loss": 67751.5390625} {"train_loss": -6.075029373168945, "global_step": 75894, "epoch": 1807} {"train_loss": -6.195553302764893, "global_step": 75895, "epoch": 1807} {"train_loss": -6.025228500366211, "global_step": 75896, "epoch": 1807} {"train_loss": -5.964001655578613, "global_step": 75897, "epoch": 1807} {"train_loss": -6.192690849304199, "global_step": 75898, "epoch": 1807} {"train_loss": -5.871817588806152, "global_step": 75899, "epoch": 1807} {"train_loss": -6.021766662597656, "global_step": 75900, "epoch": 1807} {"train_loss": -6.058900833129883, "global_step": 75901, "epoch": 1807} {"train_loss": -6.083286285400391, "global_step": 75902, "epoch": 1807} {"train_loss": -6.102806568145752, "global_step": 75903, "epoch": 1807} {"train_loss": -5.991186141967773, "global_step": 75904, "epoch": 1807} {"train_loss": -6.126943588256836, "global_step": 75905, "epoch": 1807} {"train_loss": -6.019308090209961, "global_step": 75906, "epoch": 1807} {"train_loss": -6.049196720123291, "global_step": 75907, "epoch": 1807} {"train_loss": -6.018350601196289, "global_step": 75908, "epoch": 1807} {"train_loss": -6.005476474761963, "global_step": 75909, "epoch": 1807} {"train_loss": -6.088409423828125, "global_step": 75910, "epoch": 1807} {"train_loss": -5.928208827972412, "global_step": 75911, "epoch": 1807} {"train_loss": -6.039196968078613, "global_step": 75912, "epoch": 1807} {"train_loss": -5.94234561920166, "global_step": 75913, "epoch": 1807} {"train_loss": -6.050568580627441, "global_step": 75914, "epoch": 1807} {"train_loss": -6.1556549072265625, "global_step": 75915, "epoch": 1807} {"train_loss": -5.936823844909668, "global_step": 75916, "epoch": 1807} {"train_loss": -6.041451454162598, "global_step": 75917, "epoch": 1807} {"train_loss": -5.962795257568359, "global_step": 75918, "epoch": 1807} {"train_loss": -6.052853107452393, "global_step": 75919, "epoch": 1807} {"train_loss": -6.069793701171875, "global_step": 75920, "epoch": 1807} {"train_loss": -5.963481426239014, "global_step": 75921, "epoch": 1807} {"train_loss": -6.061033248901367, "global_step": 75922, "epoch": 1807} {"train_loss": -6.102360248565674, "global_step": 75923, "epoch": 1807} {"train_loss": -6.064207553863525, "global_step": 75924, "epoch": 1807} {"train_loss": -6.129598617553711, "global_step": 75925, "epoch": 1807} {"train_loss": -6.036489963531494, "global_step": 75926, "epoch": 1807} {"train_loss": -5.9655442237854, "global_step": 75927, "epoch": 1807} {"train_loss": -6.013843536376953, "global_step": 75928, "epoch": 1807} {"train_loss": -6.025608062744141, "global_step": 75929, "epoch": 1807} {"train_loss": -6.121180534362793, "global_step": 75930, "epoch": 1807} {"train_loss": -5.970095634460449, "global_step": 75931, "epoch": 1807} {"train_loss": -6.0668792724609375, "global_step": 75932, "epoch": 1807} {"train_loss": -6.17957878112793, "global_step": 75933, "epoch": 1807} {"train_loss": -6.005690574645996, "global_step": 75934, "epoch": 1807} {"train_loss": -6.043149493989491, "global_step": 75935, "epoch": 1807, "val_loss": 67365.1796875} {"train_loss": -5.981196403503418, "global_step": 75936, "epoch": 1808} {"train_loss": -5.964407920837402, "global_step": 75937, "epoch": 1808} {"train_loss": -6.029697418212891, "global_step": 75938, "epoch": 1808} {"train_loss": -6.0718841552734375, "global_step": 75939, "epoch": 1808} {"train_loss": -6.081647872924805, "global_step": 75940, "epoch": 1808} {"train_loss": -6.023162841796875, "global_step": 75941, "epoch": 1808} {"train_loss": -6.032788276672363, "global_step": 75942, "epoch": 1808} {"train_loss": -6.213037490844727, "global_step": 75943, "epoch": 1808} {"train_loss": -6.038120269775391, "global_step": 75944, "epoch": 1808} {"train_loss": -6.235224723815918, "global_step": 75945, "epoch": 1808} {"train_loss": -5.9292144775390625, "global_step": 75946, "epoch": 1808} {"train_loss": -6.1250433921813965, "global_step": 75947, "epoch": 1808} {"train_loss": -6.056131362915039, "global_step": 75948, "epoch": 1808} {"train_loss": -6.208735942840576, "global_step": 75949, "epoch": 1808} {"train_loss": -6.058785438537598, "global_step": 75950, "epoch": 1808} {"train_loss": -6.125674247741699, "global_step": 75951, "epoch": 1808} {"train_loss": -6.037397384643555, "global_step": 75952, "epoch": 1808} {"train_loss": -6.188510894775391, "global_step": 75953, "epoch": 1808} {"train_loss": -6.034235954284668, "global_step": 75954, "epoch": 1808} {"train_loss": -6.208757400512695, "global_step": 75955, "epoch": 1808} {"train_loss": -6.169135093688965, "global_step": 75956, "epoch": 1808} {"train_loss": -6.068682670593262, "global_step": 75957, "epoch": 1808} {"train_loss": -6.082763195037842, "global_step": 75958, "epoch": 1808} {"train_loss": -6.1342010498046875, "global_step": 75959, "epoch": 1808} {"train_loss": -5.986374378204346, "global_step": 75960, "epoch": 1808} {"train_loss": -6.287611961364746, "global_step": 75961, "epoch": 1808} {"train_loss": -6.202131271362305, "global_step": 75962, "epoch": 1808} {"train_loss": -5.951656341552734, "global_step": 75963, "epoch": 1808} {"train_loss": -5.991524696350098, "global_step": 75964, "epoch": 1808} {"train_loss": -6.180758476257324, "global_step": 75965, "epoch": 1808} {"train_loss": -6.061087608337402, "global_step": 75966, "epoch": 1808} {"train_loss": -6.084677696228027, "global_step": 75967, "epoch": 1808} {"train_loss": -6.169398307800293, "global_step": 75968, "epoch": 1808} {"train_loss": -6.048030376434326, "global_step": 75969, "epoch": 1808} {"train_loss": -6.081965446472168, "global_step": 75970, "epoch": 1808} {"train_loss": -6.140681266784668, "global_step": 75971, "epoch": 1808} {"train_loss": -6.132306098937988, "global_step": 75972, "epoch": 1808} {"train_loss": -6.06990385055542, "global_step": 75973, "epoch": 1808} {"train_loss": -6.056295394897461, "global_step": 75974, "epoch": 1808} {"train_loss": -5.9201788902282715, "global_step": 75975, "epoch": 1808} {"train_loss": -6.136758804321289, "global_step": 75976, "epoch": 1808} {"train_loss": -6.089646623248146, "global_step": 75977, "epoch": 1808, "val_loss": 67763.1171875} {"train_loss": -6.070085525512695, "global_step": 75978, "epoch": 1809} {"train_loss": -6.146302223205566, "global_step": 75979, "epoch": 1809} {"train_loss": -6.011465072631836, "global_step": 75980, "epoch": 1809} {"train_loss": -5.982287406921387, "global_step": 75981, "epoch": 1809} {"train_loss": -6.2290449142456055, "global_step": 75982, "epoch": 1809} {"train_loss": -6.139377593994141, "global_step": 75983, "epoch": 1809} {"train_loss": -6.07702112197876, "global_step": 75984, "epoch": 1809} {"train_loss": -6.146246433258057, "global_step": 75985, "epoch": 1809} {"train_loss": -5.987610816955566, "global_step": 75986, "epoch": 1809} {"train_loss": -6.10725212097168, "global_step": 75987, "epoch": 1809} {"train_loss": -6.111972808837891, "global_step": 75988, "epoch": 1809} {"train_loss": -6.15116548538208, "global_step": 75989, "epoch": 1809} {"train_loss": -6.161288261413574, "global_step": 75990, "epoch": 1809} {"train_loss": -6.14771842956543, "global_step": 75991, "epoch": 1809} {"train_loss": -6.087867259979248, "global_step": 75992, "epoch": 1809} {"train_loss": -6.1458282470703125, "global_step": 75993, "epoch": 1809} {"train_loss": -6.056544303894043, "global_step": 75994, "epoch": 1809} {"train_loss": -6.055375099182129, "global_step": 75995, "epoch": 1809} {"train_loss": -6.094054698944092, "global_step": 75996, "epoch": 1809} {"train_loss": -5.978873252868652, "global_step": 75997, "epoch": 1809} {"train_loss": -6.115793228149414, "global_step": 75998, "epoch": 1809} {"train_loss": -6.087779998779297, "global_step": 75999, "epoch": 1809} {"train_loss": -6.06230354309082, "global_step": 76000, "epoch": 1809} {"train_loss": -6.107449054718018, "global_step": 76001, "epoch": 1809} {"train_loss": -6.098489284515381, "global_step": 76002, "epoch": 1809} {"train_loss": -6.072181701660156, "global_step": 76003, "epoch": 1809} {"train_loss": -6.225612163543701, "global_step": 76004, "epoch": 1809} {"train_loss": -6.135784149169922, "global_step": 76005, "epoch": 1809} {"train_loss": -5.959439754486084, "global_step": 76006, "epoch": 1809} {"train_loss": -6.073439598083496, "global_step": 76007, "epoch": 1809} {"train_loss": -6.126852989196777, "global_step": 76008, "epoch": 1809} {"train_loss": -6.135206699371338, "global_step": 76009, "epoch": 1809} {"train_loss": -5.908928871154785, "global_step": 76010, "epoch": 1809} {"train_loss": -5.992626190185547, "global_step": 76011, "epoch": 1809} {"train_loss": -6.142853260040283, "global_step": 76012, "epoch": 1809} {"train_loss": -6.090232849121094, "global_step": 76013, "epoch": 1809} {"train_loss": -6.115203857421875, "global_step": 76014, "epoch": 1809} {"train_loss": -6.084588050842285, "global_step": 76015, "epoch": 1809} {"train_loss": -6.128270149230957, "global_step": 76016, "epoch": 1809} {"train_loss": -5.970796585083008, "global_step": 76017, "epoch": 1809} {"train_loss": -6.08803129196167, "global_step": 76018, "epoch": 1809} {"train_loss": -6.088443415505545, "global_step": 76019, "epoch": 1809, "val_loss": 67340.6640625} {"train_loss": -6.151818752288818, "global_step": 76020, "epoch": 1810} {"train_loss": -6.067651271820068, "global_step": 76021, "epoch": 1810} {"train_loss": -6.1740570068359375, "global_step": 76022, "epoch": 1810} {"train_loss": -6.189931869506836, "global_step": 76023, "epoch": 1810} {"train_loss": -5.998460292816162, "global_step": 76024, "epoch": 1810} {"train_loss": -6.144916534423828, "global_step": 76025, "epoch": 1810} {"train_loss": -6.043303966522217, "global_step": 76026, "epoch": 1810} {"train_loss": -6.098388671875, "global_step": 76027, "epoch": 1810} {"train_loss": -6.057888031005859, "global_step": 76028, "epoch": 1810} {"train_loss": -6.027561664581299, "global_step": 76029, "epoch": 1810} {"train_loss": -6.060121536254883, "global_step": 76030, "epoch": 1810} {"train_loss": -6.180968761444092, "global_step": 76031, "epoch": 1810} {"train_loss": -6.045464992523193, "global_step": 76032, "epoch": 1810} {"train_loss": -6.083828449249268, "global_step": 76033, "epoch": 1810} {"train_loss": -6.121509075164795, "global_step": 76034, "epoch": 1810} {"train_loss": -6.048419952392578, "global_step": 76035, "epoch": 1810} {"train_loss": -6.077742099761963, "global_step": 76036, "epoch": 1810} {"train_loss": -6.091622352600098, "global_step": 76037, "epoch": 1810} {"train_loss": -6.1784210205078125, "global_step": 76038, "epoch": 1810} {"train_loss": -6.026827812194824, "global_step": 76039, "epoch": 1810} {"train_loss": -6.098699569702148, "global_step": 76040, "epoch": 1810} {"train_loss": -6.140635967254639, "global_step": 76041, "epoch": 1810} {"train_loss": -6.075648307800293, "global_step": 76042, "epoch": 1810} {"train_loss": -6.085377216339111, "global_step": 76043, "epoch": 1810} {"train_loss": -6.0328898429870605, "global_step": 76044, "epoch": 1810} {"train_loss": -6.076265811920166, "global_step": 76045, "epoch": 1810} {"train_loss": -6.163681983947754, "global_step": 76046, "epoch": 1810} {"train_loss": -6.041905879974365, "global_step": 76047, "epoch": 1810} {"train_loss": -5.970341682434082, "global_step": 76048, "epoch": 1810} {"train_loss": -6.058495998382568, "global_step": 76049, "epoch": 1810} {"train_loss": -5.999366760253906, "global_step": 76050, "epoch": 1810} {"train_loss": -6.13376522064209, "global_step": 76051, "epoch": 1810} {"train_loss": -6.062859535217285, "global_step": 76052, "epoch": 1810} {"train_loss": -5.990391731262207, "global_step": 76053, "epoch": 1810} {"train_loss": -6.094743728637695, "global_step": 76054, "epoch": 1810} {"train_loss": -5.977054595947266, "global_step": 76055, "epoch": 1810} {"train_loss": -6.151815414428711, "global_step": 76056, "epoch": 1810} {"train_loss": -6.1035051345825195, "global_step": 76057, "epoch": 1810} {"train_loss": -5.98192024230957, "global_step": 76058, "epoch": 1810} {"train_loss": -6.079530715942383, "global_step": 76059, "epoch": 1810} {"train_loss": -5.933991432189941, "global_step": 76060, "epoch": 1810} {"train_loss": -6.074846142814273, "global_step": 76061, "epoch": 1810, "val_loss": 67629.0390625} {"train_loss": -6.010021209716797, "global_step": 76062, "epoch": 1811} {"train_loss": -6.029109477996826, "global_step": 76063, "epoch": 1811} {"train_loss": -6.132451057434082, "global_step": 76064, "epoch": 1811} {"train_loss": -6.12132453918457, "global_step": 76065, "epoch": 1811} {"train_loss": -6.082004547119141, "global_step": 76066, "epoch": 1811} {"train_loss": -6.062222480773926, "global_step": 76067, "epoch": 1811} {"train_loss": -6.0461039543151855, "global_step": 76068, "epoch": 1811} {"train_loss": -6.045814037322998, "global_step": 76069, "epoch": 1811} {"train_loss": -6.080780029296875, "global_step": 76070, "epoch": 1811} {"train_loss": -6.082119941711426, "global_step": 76071, "epoch": 1811} {"train_loss": -6.079007625579834, "global_step": 76072, "epoch": 1811} {"train_loss": -6.219780921936035, "global_step": 76073, "epoch": 1811} {"train_loss": -6.155215263366699, "global_step": 76074, "epoch": 1811} {"train_loss": -6.055802345275879, "global_step": 76075, "epoch": 1811} {"train_loss": -6.254912376403809, "global_step": 76076, "epoch": 1811} {"train_loss": -6.0406670570373535, "global_step": 76077, "epoch": 1811} {"train_loss": -6.144041061401367, "global_step": 76078, "epoch": 1811} {"train_loss": -6.078679084777832, "global_step": 76079, "epoch": 1811} {"train_loss": -5.983753681182861, "global_step": 76080, "epoch": 1811} {"train_loss": -6.086087226867676, "global_step": 76081, "epoch": 1811} {"train_loss": -5.987192153930664, "global_step": 76082, "epoch": 1811} {"train_loss": -6.086302757263184, "global_step": 76083, "epoch": 1811} {"train_loss": -6.096156597137451, "global_step": 76084, "epoch": 1811} {"train_loss": -5.946913719177246, "global_step": 76085, "epoch": 1811} {"train_loss": -6.095058441162109, "global_step": 76086, "epoch": 1811} {"train_loss": -6.039153099060059, "global_step": 76087, "epoch": 1811} {"train_loss": -6.023341178894043, "global_step": 76088, "epoch": 1811} {"train_loss": -6.119786262512207, "global_step": 76089, "epoch": 1811} {"train_loss": -6.131350994110107, "global_step": 76090, "epoch": 1811} {"train_loss": -6.027142524719238, "global_step": 76091, "epoch": 1811} {"train_loss": -6.054028511047363, "global_step": 76092, "epoch": 1811} {"train_loss": -6.096463203430176, "global_step": 76093, "epoch": 1811} {"train_loss": -6.111874580383301, "global_step": 76094, "epoch": 1811} {"train_loss": -6.169585227966309, "global_step": 76095, "epoch": 1811} {"train_loss": -6.151172637939453, "global_step": 76096, "epoch": 1811} {"train_loss": -5.983490943908691, "global_step": 76097, "epoch": 1811} {"train_loss": -5.954018592834473, "global_step": 76098, "epoch": 1811} {"train_loss": -6.034008502960205, "global_step": 76099, "epoch": 1811} {"train_loss": -6.073888778686523, "global_step": 76100, "epoch": 1811} {"train_loss": -6.059111595153809, "global_step": 76101, "epoch": 1811} {"train_loss": -6.04890251159668, "global_step": 76102, "epoch": 1811} {"train_loss": -6.075087013698759, "global_step": 76103, "epoch": 1811, "val_loss": 67891.2109375} {"train_loss": -6.0094146728515625, "global_step": 76104, "epoch": 1812} {"train_loss": -6.017576217651367, "global_step": 76105, "epoch": 1812} {"train_loss": -6.08620023727417, "global_step": 76106, "epoch": 1812} {"train_loss": -6.096395015716553, "global_step": 76107, "epoch": 1812} {"train_loss": -6.064411163330078, "global_step": 76108, "epoch": 1812} {"train_loss": -6.107816696166992, "global_step": 76109, "epoch": 1812} {"train_loss": -6.0272722244262695, "global_step": 76110, "epoch": 1812} {"train_loss": -6.102242946624756, "global_step": 76111, "epoch": 1812} {"train_loss": -6.144001483917236, "global_step": 76112, "epoch": 1812} {"train_loss": -6.130942344665527, "global_step": 76113, "epoch": 1812} {"train_loss": -6.001051902770996, "global_step": 76114, "epoch": 1812} {"train_loss": -6.12003231048584, "global_step": 76115, "epoch": 1812} {"train_loss": -6.013584136962891, "global_step": 76116, "epoch": 1812} {"train_loss": -6.0847625732421875, "global_step": 76117, "epoch": 1812} {"train_loss": -6.069180488586426, "global_step": 76118, "epoch": 1812} {"train_loss": -5.993460655212402, "global_step": 76119, "epoch": 1812} {"train_loss": -6.021598815917969, "global_step": 76120, "epoch": 1812} {"train_loss": -6.108560562133789, "global_step": 76121, "epoch": 1812} {"train_loss": -6.070204734802246, "global_step": 76122, "epoch": 1812} {"train_loss": -5.995100498199463, "global_step": 76123, "epoch": 1812} {"train_loss": -6.208227157592773, "global_step": 76124, "epoch": 1812} {"train_loss": -6.020880222320557, "global_step": 76125, "epoch": 1812} {"train_loss": -5.9834794998168945, "global_step": 76126, "epoch": 1812} {"train_loss": -6.069628715515137, "global_step": 76127, "epoch": 1812} {"train_loss": -6.050985813140869, "global_step": 76128, "epoch": 1812} {"train_loss": -6.023580074310303, "global_step": 76129, "epoch": 1812} {"train_loss": -6.065077781677246, "global_step": 76130, "epoch": 1812} {"train_loss": -6.071602821350098, "global_step": 76131, "epoch": 1812} {"train_loss": -5.948391914367676, "global_step": 76132, "epoch": 1812} {"train_loss": -6.064667224884033, "global_step": 76133, "epoch": 1812} {"train_loss": -6.06494140625, "global_step": 76134, "epoch": 1812} {"train_loss": -6.047537803649902, "global_step": 76135, "epoch": 1812} {"train_loss": -6.11339807510376, "global_step": 76136, "epoch": 1812} {"train_loss": -6.118243217468262, "global_step": 76137, "epoch": 1812} {"train_loss": -6.118689060211182, "global_step": 76138, "epoch": 1812} {"train_loss": -5.958988189697266, "global_step": 76139, "epoch": 1812} {"train_loss": -6.025425910949707, "global_step": 76140, "epoch": 1812} {"train_loss": -6.085574626922607, "global_step": 76141, "epoch": 1812} {"train_loss": -6.032903671264648, "global_step": 76142, "epoch": 1812} {"train_loss": -6.128049850463867, "global_step": 76143, "epoch": 1812} {"train_loss": -6.061694145202637, "global_step": 76144, "epoch": 1812} {"train_loss": -6.0631671860104515, "global_step": 76145, "epoch": 1812, "val_loss": 67485.984375} {"train_loss": -6.12893009185791, "global_step": 76146, "epoch": 1813} {"train_loss": -6.040765762329102, "global_step": 76147, "epoch": 1813} {"train_loss": -6.0464253425598145, "global_step": 76148, "epoch": 1813} {"train_loss": -6.113458156585693, "global_step": 76149, "epoch": 1813} {"train_loss": -5.992442607879639, "global_step": 76150, "epoch": 1813} {"train_loss": -6.13765287399292, "global_step": 76151, "epoch": 1813} {"train_loss": -6.146811485290527, "global_step": 76152, "epoch": 1813} {"train_loss": -6.003654479980469, "global_step": 76153, "epoch": 1813} {"train_loss": -6.070993423461914, "global_step": 76154, "epoch": 1813} {"train_loss": -6.1605424880981445, "global_step": 76155, "epoch": 1813} {"train_loss": -6.056070327758789, "global_step": 76156, "epoch": 1813} {"train_loss": -6.082010269165039, "global_step": 76157, "epoch": 1813} {"train_loss": -6.160419940948486, "global_step": 76158, "epoch": 1813} {"train_loss": -6.158360958099365, "global_step": 76159, "epoch": 1813} {"train_loss": -6.084877967834473, "global_step": 76160, "epoch": 1813} {"train_loss": -6.037282466888428, "global_step": 76161, "epoch": 1813} {"train_loss": -5.975588798522949, "global_step": 76162, "epoch": 1813} {"train_loss": -5.980121612548828, "global_step": 76163, "epoch": 1813} {"train_loss": -6.092464447021484, "global_step": 76164, "epoch": 1813} {"train_loss": -5.961982250213623, "global_step": 76165, "epoch": 1813} {"train_loss": -6.174269676208496, "global_step": 76166, "epoch": 1813} {"train_loss": -6.064333915710449, "global_step": 76167, "epoch": 1813} {"train_loss": -5.990156173706055, "global_step": 76168, "epoch": 1813} {"train_loss": -6.164088726043701, "global_step": 76169, "epoch": 1813} {"train_loss": -6.057564735412598, "global_step": 76170, "epoch": 1813} {"train_loss": -6.010951995849609, "global_step": 76171, "epoch": 1813} {"train_loss": -6.112261772155762, "global_step": 76172, "epoch": 1813} {"train_loss": -5.870070457458496, "global_step": 76173, "epoch": 1813} {"train_loss": -6.105622291564941, "global_step": 76174, "epoch": 1813} {"train_loss": -6.091331481933594, "global_step": 76175, "epoch": 1813} {"train_loss": -6.107583045959473, "global_step": 76176, "epoch": 1813} {"train_loss": -6.039241790771484, "global_step": 76177, "epoch": 1813} {"train_loss": -6.072717666625977, "global_step": 76178, "epoch": 1813} {"train_loss": -6.150475978851318, "global_step": 76179, "epoch": 1813} {"train_loss": -5.989057540893555, "global_step": 76180, "epoch": 1813} {"train_loss": -6.035246849060059, "global_step": 76181, "epoch": 1813} {"train_loss": -6.188411712646484, "global_step": 76182, "epoch": 1813} {"train_loss": -6.090427398681641, "global_step": 76183, "epoch": 1813} {"train_loss": -6.022217273712158, "global_step": 76184, "epoch": 1813} {"train_loss": -6.048849105834961, "global_step": 76185, "epoch": 1813} {"train_loss": -6.103764057159424, "global_step": 76186, "epoch": 1813} {"train_loss": -6.0734333992004395, "global_step": 76187, "epoch": 1813, "val_loss": 67517.265625} {"train_loss": -6.179146766662598, "global_step": 76188, "epoch": 1814} {"train_loss": -6.181951522827148, "global_step": 76189, "epoch": 1814} {"train_loss": -6.025174140930176, "global_step": 76190, "epoch": 1814} {"train_loss": -6.054962635040283, "global_step": 76191, "epoch": 1814} {"train_loss": -6.0336809158325195, "global_step": 76192, "epoch": 1814} {"train_loss": -6.017454147338867, "global_step": 76193, "epoch": 1814} {"train_loss": -6.152709007263184, "global_step": 76194, "epoch": 1814} {"train_loss": -6.110175609588623, "global_step": 76195, "epoch": 1814} {"train_loss": -6.203949928283691, "global_step": 76196, "epoch": 1814} {"train_loss": -6.127403259277344, "global_step": 76197, "epoch": 1814} {"train_loss": -6.13861608505249, "global_step": 76198, "epoch": 1814} {"train_loss": -6.154583930969238, "global_step": 76199, "epoch": 1814} {"train_loss": -6.037127494812012, "global_step": 76200, "epoch": 1814} {"train_loss": -6.118131637573242, "global_step": 76201, "epoch": 1814} {"train_loss": -6.062542915344238, "global_step": 76202, "epoch": 1814} {"train_loss": -6.090993881225586, "global_step": 76203, "epoch": 1814} {"train_loss": -6.117401123046875, "global_step": 76204, "epoch": 1814} {"train_loss": -6.07046365737915, "global_step": 76205, "epoch": 1814} {"train_loss": -6.095400333404541, "global_step": 76206, "epoch": 1814} {"train_loss": -6.084090232849121, "global_step": 76207, "epoch": 1814} {"train_loss": -6.090346813201904, "global_step": 76208, "epoch": 1814} {"train_loss": -6.138942718505859, "global_step": 76209, "epoch": 1814} {"train_loss": -6.122981548309326, "global_step": 76210, "epoch": 1814} {"train_loss": -6.138381004333496, "global_step": 76211, "epoch": 1814} {"train_loss": -6.117825984954834, "global_step": 76212, "epoch": 1814} {"train_loss": -6.032805919647217, "global_step": 76213, "epoch": 1814} {"train_loss": -6.114396095275879, "global_step": 76214, "epoch": 1814} {"train_loss": -6.085293769836426, "global_step": 76215, "epoch": 1814} {"train_loss": -6.038516998291016, "global_step": 76216, "epoch": 1814} {"train_loss": -6.043334484100342, "global_step": 76217, "epoch": 1814} {"train_loss": -5.972896575927734, "global_step": 76218, "epoch": 1814} {"train_loss": -6.161965370178223, "global_step": 76219, "epoch": 1814} {"train_loss": -6.085275650024414, "global_step": 76220, "epoch": 1814} {"train_loss": -6.127516269683838, "global_step": 76221, "epoch": 1814} {"train_loss": -6.06028938293457, "global_step": 76222, "epoch": 1814} {"train_loss": -6.025172233581543, "global_step": 76223, "epoch": 1814} {"train_loss": -6.067082405090332, "global_step": 76224, "epoch": 1814} {"train_loss": -6.128942489624023, "global_step": 76225, "epoch": 1814} {"train_loss": -6.098546028137207, "global_step": 76226, "epoch": 1814} {"train_loss": -5.99489688873291, "global_step": 76227, "epoch": 1814} {"train_loss": -6.0878520011901855, "global_step": 76228, "epoch": 1814} {"train_loss": -6.091039861951556, "global_step": 76229, "epoch": 1814, "val_loss": 67722.1484375} {"train_loss": -6.136290550231934, "global_step": 76230, "epoch": 1815} {"train_loss": -6.193933010101318, "global_step": 76231, "epoch": 1815} {"train_loss": -5.94873571395874, "global_step": 76232, "epoch": 1815} {"train_loss": -6.15344762802124, "global_step": 76233, "epoch": 1815} {"train_loss": -6.039388179779053, "global_step": 76234, "epoch": 1815} {"train_loss": -5.924249649047852, "global_step": 76235, "epoch": 1815} {"train_loss": -6.014106750488281, "global_step": 76236, "epoch": 1815} {"train_loss": -6.060346603393555, "global_step": 76237, "epoch": 1815} {"train_loss": -6.073637008666992, "global_step": 76238, "epoch": 1815} {"train_loss": -6.068943977355957, "global_step": 76239, "epoch": 1815} {"train_loss": -6.150808334350586, "global_step": 76240, "epoch": 1815} {"train_loss": -5.997358322143555, "global_step": 76241, "epoch": 1815} {"train_loss": -5.979114532470703, "global_step": 76242, "epoch": 1815} {"train_loss": -5.9753947257995605, "global_step": 76243, "epoch": 1815} {"train_loss": -6.11370849609375, "global_step": 76244, "epoch": 1815} {"train_loss": -6.023682117462158, "global_step": 76245, "epoch": 1815} {"train_loss": -6.078125953674316, "global_step": 76246, "epoch": 1815} {"train_loss": -6.163022518157959, "global_step": 76247, "epoch": 1815} {"train_loss": -5.916023254394531, "global_step": 76248, "epoch": 1815} {"train_loss": -6.073455810546875, "global_step": 76249, "epoch": 1815} {"train_loss": -6.093211650848389, "global_step": 76250, "epoch": 1815} {"train_loss": -5.938991546630859, "global_step": 76251, "epoch": 1815} {"train_loss": -6.107698917388916, "global_step": 76252, "epoch": 1815} {"train_loss": -5.886168479919434, "global_step": 76253, "epoch": 1815} {"train_loss": -5.895364761352539, "global_step": 76254, "epoch": 1815} {"train_loss": -6.195549011230469, "global_step": 76255, "epoch": 1815} {"train_loss": -6.02103853225708, "global_step": 76256, "epoch": 1815} {"train_loss": -6.095093727111816, "global_step": 76257, "epoch": 1815} {"train_loss": -5.941832065582275, "global_step": 76258, "epoch": 1815} {"train_loss": -6.145232200622559, "global_step": 76259, "epoch": 1815} {"train_loss": -6.12340784072876, "global_step": 76260, "epoch": 1815} {"train_loss": -6.0677690505981445, "global_step": 76261, "epoch": 1815} {"train_loss": -6.003509998321533, "global_step": 76262, "epoch": 1815} {"train_loss": -6.221198081970215, "global_step": 76263, "epoch": 1815} {"train_loss": -5.956938743591309, "global_step": 76264, "epoch": 1815} {"train_loss": -6.029214382171631, "global_step": 76265, "epoch": 1815} {"train_loss": -5.997002124786377, "global_step": 76266, "epoch": 1815} {"train_loss": -6.031856060028076, "global_step": 76267, "epoch": 1815} {"train_loss": -6.063783645629883, "global_step": 76268, "epoch": 1815} {"train_loss": -6.064271450042725, "global_step": 76269, "epoch": 1815} {"train_loss": -6.16058349609375, "global_step": 76270, "epoch": 1815} {"train_loss": -6.04926323890686, "global_step": 76271, "epoch": 1815, "val_loss": 67617.78125} {"train_loss": -6.1336588859558105, "global_step": 76272, "epoch": 1816} {"train_loss": -6.094679355621338, "global_step": 76273, "epoch": 1816} {"train_loss": -6.065826892852783, "global_step": 76274, "epoch": 1816} {"train_loss": -6.089870452880859, "global_step": 76275, "epoch": 1816} {"train_loss": -6.024114608764648, "global_step": 76276, "epoch": 1816} {"train_loss": -5.948433876037598, "global_step": 76277, "epoch": 1816} {"train_loss": -6.113333702087402, "global_step": 76278, "epoch": 1816} {"train_loss": -6.018141746520996, "global_step": 76279, "epoch": 1816} {"train_loss": -6.12309455871582, "global_step": 76280, "epoch": 1816} {"train_loss": -6.08875846862793, "global_step": 76281, "epoch": 1816} {"train_loss": -6.083789348602295, "global_step": 76282, "epoch": 1816} {"train_loss": -6.1818742752075195, "global_step": 76283, "epoch": 1816} {"train_loss": -6.004184246063232, "global_step": 76284, "epoch": 1816} {"train_loss": -5.988970756530762, "global_step": 76285, "epoch": 1816} {"train_loss": -6.03549861907959, "global_step": 76286, "epoch": 1816} {"train_loss": -6.104161739349365, "global_step": 76287, "epoch": 1816} {"train_loss": -6.193332672119141, "global_step": 76288, "epoch": 1816} {"train_loss": -6.079737663269043, "global_step": 76289, "epoch": 1816} {"train_loss": -6.04400110244751, "global_step": 76290, "epoch": 1816} {"train_loss": -6.13308048248291, "global_step": 76291, "epoch": 1816} {"train_loss": -6.092783451080322, "global_step": 76292, "epoch": 1816} {"train_loss": -6.091705799102783, "global_step": 76293, "epoch": 1816} {"train_loss": -6.149460792541504, "global_step": 76294, "epoch": 1816} {"train_loss": -6.136367321014404, "global_step": 76295, "epoch": 1816} {"train_loss": -5.978879928588867, "global_step": 76296, "epoch": 1816} {"train_loss": -6.1508870124816895, "global_step": 76297, "epoch": 1816} {"train_loss": -5.9998016357421875, "global_step": 76298, "epoch": 1816} {"train_loss": -6.091750144958496, "global_step": 76299, "epoch": 1816} {"train_loss": -6.078413963317871, "global_step": 76300, "epoch": 1816} {"train_loss": -6.170334339141846, "global_step": 76301, "epoch": 1816} {"train_loss": -6.001124382019043, "global_step": 76302, "epoch": 1816} {"train_loss": -6.15532922744751, "global_step": 76303, "epoch": 1816} {"train_loss": -6.218039512634277, "global_step": 76304, "epoch": 1816} {"train_loss": -6.123591899871826, "global_step": 76305, "epoch": 1816} {"train_loss": -6.138566493988037, "global_step": 76306, "epoch": 1816} {"train_loss": -6.060695648193359, "global_step": 76307, "epoch": 1816} {"train_loss": -6.2648725509643555, "global_step": 76308, "epoch": 1816} {"train_loss": -6.127419471740723, "global_step": 76309, "epoch": 1816} {"train_loss": -6.226104736328125, "global_step": 76310, "epoch": 1816} {"train_loss": -6.1520466804504395, "global_step": 76311, "epoch": 1816} {"train_loss": -6.0496015548706055, "global_step": 76312, "epoch": 1816} {"train_loss": -6.095305874234154, "global_step": 76313, "epoch": 1816, "val_loss": 67580.3515625} {"train_loss": -6.006710052490234, "global_step": 76314, "epoch": 1817} {"train_loss": -6.18497371673584, "global_step": 76315, "epoch": 1817} {"train_loss": -6.180761814117432, "global_step": 76316, "epoch": 1817} {"train_loss": -6.084420204162598, "global_step": 76317, "epoch": 1817} {"train_loss": -6.1023759841918945, "global_step": 76318, "epoch": 1817} {"train_loss": -6.14039421081543, "global_step": 76319, "epoch": 1817} {"train_loss": -6.117315769195557, "global_step": 76320, "epoch": 1817} {"train_loss": -6.058218955993652, "global_step": 76321, "epoch": 1817} {"train_loss": -6.096138000488281, "global_step": 76322, "epoch": 1817} {"train_loss": -6.148642539978027, "global_step": 76323, "epoch": 1817} {"train_loss": -6.053066253662109, "global_step": 76324, "epoch": 1817} {"train_loss": -6.037716865539551, "global_step": 76325, "epoch": 1817} {"train_loss": -6.221011161804199, "global_step": 76326, "epoch": 1817} {"train_loss": -6.126764297485352, "global_step": 76327, "epoch": 1817} {"train_loss": -6.170259952545166, "global_step": 76328, "epoch": 1817} {"train_loss": -6.173489093780518, "global_step": 76329, "epoch": 1817} {"train_loss": -6.007993698120117, "global_step": 76330, "epoch": 1817} {"train_loss": -6.082246780395508, "global_step": 76331, "epoch": 1817} {"train_loss": -6.181400299072266, "global_step": 76332, "epoch": 1817} {"train_loss": -6.047540664672852, "global_step": 76333, "epoch": 1817} {"train_loss": -6.233492374420166, "global_step": 76334, "epoch": 1817} {"train_loss": -6.100059509277344, "global_step": 76335, "epoch": 1817} {"train_loss": -6.049333572387695, "global_step": 76336, "epoch": 1817} {"train_loss": -6.12324333190918, "global_step": 76337, "epoch": 1817} {"train_loss": -6.1430840492248535, "global_step": 76338, "epoch": 1817} {"train_loss": -6.203481674194336, "global_step": 76339, "epoch": 1817} {"train_loss": -6.1833367347717285, "global_step": 76340, "epoch": 1817} {"train_loss": -6.1301751136779785, "global_step": 76341, "epoch": 1817} {"train_loss": -6.1681227684021, "global_step": 76342, "epoch": 1817} {"train_loss": -6.176639556884766, "global_step": 76343, "epoch": 1817} {"train_loss": -6.0871686935424805, "global_step": 76344, "epoch": 1817} {"train_loss": -6.072269439697266, "global_step": 76345, "epoch": 1817} {"train_loss": -6.002144813537598, "global_step": 76346, "epoch": 1817} {"train_loss": -6.0820441246032715, "global_step": 76347, "epoch": 1817} {"train_loss": -6.09762716293335, "global_step": 76348, "epoch": 1817} {"train_loss": -6.095219135284424, "global_step": 76349, "epoch": 1817} {"train_loss": -6.0740275382995605, "global_step": 76350, "epoch": 1817} {"train_loss": -5.950777053833008, "global_step": 76351, "epoch": 1817} {"train_loss": -6.103848457336426, "global_step": 76352, "epoch": 1817} {"train_loss": -6.050753593444824, "global_step": 76353, "epoch": 1817} {"train_loss": -5.943802356719971, "global_step": 76354, "epoch": 1817} {"train_loss": -6.104251986458188, "global_step": 76355, "epoch": 1817, "val_loss": 67419.1875} {"train_loss": -6.096526622772217, "global_step": 76356, "epoch": 1818} {"train_loss": -6.088359832763672, "global_step": 76357, "epoch": 1818} {"train_loss": -6.133100509643555, "global_step": 76358, "epoch": 1818} {"train_loss": -6.093655586242676, "global_step": 76359, "epoch": 1818} {"train_loss": -6.052262306213379, "global_step": 76360, "epoch": 1818} {"train_loss": -6.085201263427734, "global_step": 76361, "epoch": 1818} {"train_loss": -6.0839457511901855, "global_step": 76362, "epoch": 1818} {"train_loss": -6.077255725860596, "global_step": 76363, "epoch": 1818} {"train_loss": -6.043231964111328, "global_step": 76364, "epoch": 1818} {"train_loss": -6.1142897605896, "global_step": 76365, "epoch": 1818} {"train_loss": -5.995309829711914, "global_step": 76366, "epoch": 1818} {"train_loss": -6.064087867736816, "global_step": 76367, "epoch": 1818} {"train_loss": -5.918118953704834, "global_step": 76368, "epoch": 1818} {"train_loss": -6.0313029289245605, "global_step": 76369, "epoch": 1818} {"train_loss": -5.991590976715088, "global_step": 76370, "epoch": 1818} {"train_loss": -6.093426704406738, "global_step": 76371, "epoch": 1818} {"train_loss": -6.058187007904053, "global_step": 76372, "epoch": 1818} {"train_loss": -6.134406566619873, "global_step": 76373, "epoch": 1818} {"train_loss": -6.0620012283325195, "global_step": 76374, "epoch": 1818} {"train_loss": -6.064767360687256, "global_step": 76375, "epoch": 1818} {"train_loss": -6.067893028259277, "global_step": 76376, "epoch": 1818} {"train_loss": -6.097699165344238, "global_step": 76377, "epoch": 1818} {"train_loss": -6.165520191192627, "global_step": 76378, "epoch": 1818} {"train_loss": -6.051885604858398, "global_step": 76379, "epoch": 1818} {"train_loss": -6.088174819946289, "global_step": 76380, "epoch": 1818} {"train_loss": -6.135521411895752, "global_step": 76381, "epoch": 1818} {"train_loss": -6.176657676696777, "global_step": 76382, "epoch": 1818} {"train_loss": -6.0307159423828125, "global_step": 76383, "epoch": 1818} {"train_loss": -5.930540084838867, "global_step": 76384, "epoch": 1818} {"train_loss": -5.992376327514648, "global_step": 76385, "epoch": 1818} {"train_loss": -6.176059722900391, "global_step": 76386, "epoch": 1818} {"train_loss": -5.951969623565674, "global_step": 76387, "epoch": 1818} {"train_loss": -5.91963005065918, "global_step": 76388, "epoch": 1818} {"train_loss": -6.037247180938721, "global_step": 76389, "epoch": 1818} {"train_loss": -5.992387771606445, "global_step": 76390, "epoch": 1818} {"train_loss": -6.0859222412109375, "global_step": 76391, "epoch": 1818} {"train_loss": -5.97252082824707, "global_step": 76392, "epoch": 1818} {"train_loss": -6.0337724685668945, "global_step": 76393, "epoch": 1818} {"train_loss": -5.993799209594727, "global_step": 76394, "epoch": 1818} {"train_loss": -6.076229572296143, "global_step": 76395, "epoch": 1818} {"train_loss": -5.986329078674316, "global_step": 76396, "epoch": 1818} {"train_loss": -6.052444787252517, "global_step": 76397, "epoch": 1818, "val_loss": 67517.875} {"train_loss": -6.079301834106445, "global_step": 76398, "epoch": 1819} {"train_loss": -6.078456878662109, "global_step": 76399, "epoch": 1819} {"train_loss": -5.9216227531433105, "global_step": 76400, "epoch": 1819} {"train_loss": -6.012248516082764, "global_step": 76401, "epoch": 1819} {"train_loss": -5.842524528503418, "global_step": 76402, "epoch": 1819} {"train_loss": -6.046095848083496, "global_step": 76403, "epoch": 1819} {"train_loss": -6.197957992553711, "global_step": 76404, "epoch": 1819} {"train_loss": -5.898008346557617, "global_step": 76405, "epoch": 1819} {"train_loss": -6.0466694831848145, "global_step": 76406, "epoch": 1819} {"train_loss": -6.068704605102539, "global_step": 76407, "epoch": 1819} {"train_loss": -6.128923416137695, "global_step": 76408, "epoch": 1819} {"train_loss": -6.08735466003418, "global_step": 76409, "epoch": 1819} {"train_loss": -6.098423004150391, "global_step": 76410, "epoch": 1819} {"train_loss": -6.1434326171875, "global_step": 76411, "epoch": 1819} {"train_loss": -6.061519622802734, "global_step": 76412, "epoch": 1819} {"train_loss": -6.097197532653809, "global_step": 76413, "epoch": 1819} {"train_loss": -6.084108352661133, "global_step": 76414, "epoch": 1819} {"train_loss": -5.948759078979492, "global_step": 76415, "epoch": 1819} {"train_loss": -6.139400482177734, "global_step": 76416, "epoch": 1819} {"train_loss": -6.089540004730225, "global_step": 76417, "epoch": 1819} {"train_loss": -6.1409807205200195, "global_step": 76418, "epoch": 1819} {"train_loss": -5.988059997558594, "global_step": 76419, "epoch": 1819} {"train_loss": -6.000100135803223, "global_step": 76420, "epoch": 1819} {"train_loss": -6.0935893058776855, "global_step": 76421, "epoch": 1819} {"train_loss": -6.046657562255859, "global_step": 76422, "epoch": 1819} {"train_loss": -6.205068588256836, "global_step": 76423, "epoch": 1819} {"train_loss": -6.102298736572266, "global_step": 76424, "epoch": 1819} {"train_loss": -5.9910383224487305, "global_step": 76425, "epoch": 1819} {"train_loss": -6.17995548248291, "global_step": 76426, "epoch": 1819} {"train_loss": -5.990827560424805, "global_step": 76427, "epoch": 1819} {"train_loss": -6.005346298217773, "global_step": 76428, "epoch": 1819} {"train_loss": -6.078873634338379, "global_step": 76429, "epoch": 1819} {"train_loss": -6.162816047668457, "global_step": 76430, "epoch": 1819} {"train_loss": -6.094509124755859, "global_step": 76431, "epoch": 1819} {"train_loss": -6.070521831512451, "global_step": 76432, "epoch": 1819} {"train_loss": -5.8946533203125, "global_step": 76433, "epoch": 1819} {"train_loss": -6.124837875366211, "global_step": 76434, "epoch": 1819} {"train_loss": -5.917263507843018, "global_step": 76435, "epoch": 1819} {"train_loss": -6.067866325378418, "global_step": 76436, "epoch": 1819} {"train_loss": -6.066132545471191, "global_step": 76437, "epoch": 1819} {"train_loss": -5.935685157775879, "global_step": 76438, "epoch": 1819} {"train_loss": -6.052791674931844, "global_step": 76439, "epoch": 1819, "val_loss": 67727.109375} {"train_loss": -5.810957431793213, "global_step": 76440, "epoch": 1820} {"train_loss": -6.072617530822754, "global_step": 76441, "epoch": 1820} {"train_loss": -5.98757266998291, "global_step": 76442, "epoch": 1820} {"train_loss": -6.0537519454956055, "global_step": 76443, "epoch": 1820} {"train_loss": -6.008450031280518, "global_step": 76444, "epoch": 1820} {"train_loss": -6.007843971252441, "global_step": 76445, "epoch": 1820} {"train_loss": -6.040414810180664, "global_step": 76446, "epoch": 1820} {"train_loss": -6.162528991699219, "global_step": 76447, "epoch": 1820} {"train_loss": -6.031554222106934, "global_step": 76448, "epoch": 1820} {"train_loss": -6.080506801605225, "global_step": 76449, "epoch": 1820} {"train_loss": -6.171990394592285, "global_step": 76450, "epoch": 1820} {"train_loss": -6.0863189697265625, "global_step": 76451, "epoch": 1820} {"train_loss": -5.988618850708008, "global_step": 76452, "epoch": 1820} {"train_loss": -6.106264114379883, "global_step": 76453, "epoch": 1820} {"train_loss": -6.079881191253662, "global_step": 76454, "epoch": 1820} {"train_loss": -6.172148704528809, "global_step": 76455, "epoch": 1820} {"train_loss": -6.010550022125244, "global_step": 76456, "epoch": 1820} {"train_loss": -6.06849479675293, "global_step": 76457, "epoch": 1820} {"train_loss": -5.979619979858398, "global_step": 76458, "epoch": 1820} {"train_loss": -6.1530985832214355, "global_step": 76459, "epoch": 1820} {"train_loss": -6.0469818115234375, "global_step": 76460, "epoch": 1820} {"train_loss": -6.049124240875244, "global_step": 76461, "epoch": 1820} {"train_loss": -6.191900253295898, "global_step": 76462, "epoch": 1820} {"train_loss": -5.996000289916992, "global_step": 76463, "epoch": 1820} {"train_loss": -6.037907600402832, "global_step": 76464, "epoch": 1820} {"train_loss": -6.150696754455566, "global_step": 76465, "epoch": 1820} {"train_loss": -5.937417984008789, "global_step": 76466, "epoch": 1820} {"train_loss": -6.000813961029053, "global_step": 76467, "epoch": 1820} {"train_loss": -6.232610702514648, "global_step": 76468, "epoch": 1820} {"train_loss": -5.855041980743408, "global_step": 76469, "epoch": 1820} {"train_loss": -6.035429954528809, "global_step": 76470, "epoch": 1820} {"train_loss": -6.0176544189453125, "global_step": 76471, "epoch": 1820} {"train_loss": -6.004094123840332, "global_step": 76472, "epoch": 1820} {"train_loss": -6.076007843017578, "global_step": 76473, "epoch": 1820} {"train_loss": -6.066594123840332, "global_step": 76474, "epoch": 1820} {"train_loss": -6.126466274261475, "global_step": 76475, "epoch": 1820} {"train_loss": -6.132999420166016, "global_step": 76476, "epoch": 1820} {"train_loss": -6.157234191894531, "global_step": 76477, "epoch": 1820} {"train_loss": -6.139645576477051, "global_step": 76478, "epoch": 1820} {"train_loss": -6.096316337585449, "global_step": 76479, "epoch": 1820} {"train_loss": -6.091484069824219, "global_step": 76480, "epoch": 1820} {"train_loss": -6.0627433231898715, "global_step": 76481, "epoch": 1820, "val_loss": 67368.625} {"train_loss": -6.043230056762695, "global_step": 76482, "epoch": 1821} {"train_loss": -6.10006046295166, "global_step": 76483, "epoch": 1821} {"train_loss": -6.008812427520752, "global_step": 76484, "epoch": 1821} {"train_loss": -6.190539360046387, "global_step": 76485, "epoch": 1821} {"train_loss": -6.017387866973877, "global_step": 76486, "epoch": 1821} {"train_loss": -6.108502388000488, "global_step": 76487, "epoch": 1821} {"train_loss": -6.136285781860352, "global_step": 76488, "epoch": 1821} {"train_loss": -6.030036926269531, "global_step": 76489, "epoch": 1821} {"train_loss": -6.004173755645752, "global_step": 76490, "epoch": 1821} {"train_loss": -6.034388542175293, "global_step": 76491, "epoch": 1821} {"train_loss": -6.094677925109863, "global_step": 76492, "epoch": 1821} {"train_loss": -6.223744869232178, "global_step": 76493, "epoch": 1821} {"train_loss": -6.08880615234375, "global_step": 76494, "epoch": 1821} {"train_loss": -5.872398853302002, "global_step": 76495, "epoch": 1821} {"train_loss": -6.001949310302734, "global_step": 76496, "epoch": 1821} {"train_loss": -5.943268775939941, "global_step": 76497, "epoch": 1821} {"train_loss": -5.958145618438721, "global_step": 76498, "epoch": 1821} {"train_loss": -6.057652950286865, "global_step": 76499, "epoch": 1821} {"train_loss": -5.958600044250488, "global_step": 76500, "epoch": 1821} {"train_loss": -6.055487632751465, "global_step": 76501, "epoch": 1821} {"train_loss": -6.116922378540039, "global_step": 76502, "epoch": 1821} {"train_loss": -5.916921138763428, "global_step": 76503, "epoch": 1821} {"train_loss": -6.012215614318848, "global_step": 76504, "epoch": 1821} {"train_loss": -6.057801723480225, "global_step": 76505, "epoch": 1821} {"train_loss": -6.093477249145508, "global_step": 76506, "epoch": 1821} {"train_loss": -5.922214508056641, "global_step": 76507, "epoch": 1821} {"train_loss": -6.090628147125244, "global_step": 76508, "epoch": 1821} {"train_loss": -6.132573127746582, "global_step": 76509, "epoch": 1821} {"train_loss": -6.041364669799805, "global_step": 76510, "epoch": 1821} {"train_loss": -6.1287946701049805, "global_step": 76511, "epoch": 1821} {"train_loss": -6.230544090270996, "global_step": 76512, "epoch": 1821} {"train_loss": -6.096149444580078, "global_step": 76513, "epoch": 1821} {"train_loss": -6.223341941833496, "global_step": 76514, "epoch": 1821} {"train_loss": -6.099824905395508, "global_step": 76515, "epoch": 1821} {"train_loss": -6.083192348480225, "global_step": 76516, "epoch": 1821} {"train_loss": -6.121728420257568, "global_step": 76517, "epoch": 1821} {"train_loss": -6.13642692565918, "global_step": 76518, "epoch": 1821} {"train_loss": -6.130814552307129, "global_step": 76519, "epoch": 1821} {"train_loss": -6.1407694816589355, "global_step": 76520, "epoch": 1821} {"train_loss": -5.90085506439209, "global_step": 76521, "epoch": 1821} {"train_loss": -6.154180526733398, "global_step": 76522, "epoch": 1821} {"train_loss": -6.067315873645601, "global_step": 76523, "epoch": 1821, "val_loss": 67866.0859375} {"train_loss": -6.07697868347168, "global_step": 76524, "epoch": 1822} {"train_loss": -5.904810905456543, "global_step": 76525, "epoch": 1822} {"train_loss": -5.984178066253662, "global_step": 76526, "epoch": 1822} {"train_loss": -6.039968967437744, "global_step": 76527, "epoch": 1822} {"train_loss": -6.0579681396484375, "global_step": 76528, "epoch": 1822} {"train_loss": -6.1401872634887695, "global_step": 76529, "epoch": 1822} {"train_loss": -6.010195732116699, "global_step": 76530, "epoch": 1822} {"train_loss": -6.13968563079834, "global_step": 76531, "epoch": 1822} {"train_loss": -5.956961631774902, "global_step": 76532, "epoch": 1822} {"train_loss": -6.145379066467285, "global_step": 76533, "epoch": 1822} {"train_loss": -6.075773239135742, "global_step": 76534, "epoch": 1822} {"train_loss": -5.9859514236450195, "global_step": 76535, "epoch": 1822} {"train_loss": -6.042754650115967, "global_step": 76536, "epoch": 1822} {"train_loss": -6.087930679321289, "global_step": 76537, "epoch": 1822} {"train_loss": -6.034207820892334, "global_step": 76538, "epoch": 1822} {"train_loss": -6.0702009201049805, "global_step": 76539, "epoch": 1822} {"train_loss": -6.02537202835083, "global_step": 76540, "epoch": 1822} {"train_loss": -6.186419486999512, "global_step": 76541, "epoch": 1822} {"train_loss": -6.093759536743164, "global_step": 76542, "epoch": 1822} {"train_loss": -6.150104999542236, "global_step": 76543, "epoch": 1822} {"train_loss": -6.0536909103393555, "global_step": 76544, "epoch": 1822} {"train_loss": -6.146149635314941, "global_step": 76545, "epoch": 1822} {"train_loss": -6.208843231201172, "global_step": 76546, "epoch": 1822} {"train_loss": -5.992332458496094, "global_step": 76547, "epoch": 1822} {"train_loss": -6.018100738525391, "global_step": 76548, "epoch": 1822} {"train_loss": -6.165337085723877, "global_step": 76549, "epoch": 1822} {"train_loss": -6.1108527183532715, "global_step": 76550, "epoch": 1822} {"train_loss": -6.124014854431152, "global_step": 76551, "epoch": 1822} {"train_loss": -6.121419906616211, "global_step": 76552, "epoch": 1822} {"train_loss": -6.1524810791015625, "global_step": 76553, "epoch": 1822} {"train_loss": -6.14963436126709, "global_step": 76554, "epoch": 1822} {"train_loss": -6.071252822875977, "global_step": 76555, "epoch": 1822} {"train_loss": -6.058372497558594, "global_step": 76556, "epoch": 1822} {"train_loss": -6.074492454528809, "global_step": 76557, "epoch": 1822} {"train_loss": -6.048604965209961, "global_step": 76558, "epoch": 1822} {"train_loss": -5.999917030334473, "global_step": 76559, "epoch": 1822} {"train_loss": -6.050793647766113, "global_step": 76560, "epoch": 1822} {"train_loss": -6.039184093475342, "global_step": 76561, "epoch": 1822} {"train_loss": -6.09446382522583, "global_step": 76562, "epoch": 1822} {"train_loss": -5.925808429718018, "global_step": 76563, "epoch": 1822} {"train_loss": -6.031035900115967, "global_step": 76564, "epoch": 1822} {"train_loss": -6.070469209126064, "global_step": 76565, "epoch": 1822, "val_loss": 67816.8984375} {"train_loss": -5.9590888023376465, "global_step": 76566, "epoch": 1823} {"train_loss": -6.039133548736572, "global_step": 76567, "epoch": 1823} {"train_loss": -6.046754360198975, "global_step": 76568, "epoch": 1823} {"train_loss": -6.044688701629639, "global_step": 76569, "epoch": 1823} {"train_loss": -5.977269649505615, "global_step": 76570, "epoch": 1823} {"train_loss": -6.234009742736816, "global_step": 76571, "epoch": 1823} {"train_loss": -6.039150238037109, "global_step": 76572, "epoch": 1823} {"train_loss": -5.982956886291504, "global_step": 76573, "epoch": 1823} {"train_loss": -6.10383415222168, "global_step": 76574, "epoch": 1823} {"train_loss": -6.152483940124512, "global_step": 76575, "epoch": 1823} {"train_loss": -6.166479110717773, "global_step": 76576, "epoch": 1823} {"train_loss": -6.0351972579956055, "global_step": 76577, "epoch": 1823} {"train_loss": -6.017005920410156, "global_step": 76578, "epoch": 1823} {"train_loss": -6.10166072845459, "global_step": 76579, "epoch": 1823} {"train_loss": -6.071208953857422, "global_step": 76580, "epoch": 1823} {"train_loss": -6.103753089904785, "global_step": 76581, "epoch": 1823} {"train_loss": -5.987689018249512, "global_step": 76582, "epoch": 1823} {"train_loss": -6.155028343200684, "global_step": 76583, "epoch": 1823} {"train_loss": -6.0790019035339355, "global_step": 76584, "epoch": 1823} {"train_loss": -6.121879577636719, "global_step": 76585, "epoch": 1823} {"train_loss": -6.144241809844971, "global_step": 76586, "epoch": 1823} {"train_loss": -5.978909969329834, "global_step": 76587, "epoch": 1823} {"train_loss": -6.097501754760742, "global_step": 76588, "epoch": 1823} {"train_loss": -5.956418991088867, "global_step": 76589, "epoch": 1823} {"train_loss": -5.9818925857543945, "global_step": 76590, "epoch": 1823} {"train_loss": -6.186440467834473, "global_step": 76591, "epoch": 1823} {"train_loss": -6.011135101318359, "global_step": 76592, "epoch": 1823} {"train_loss": -5.986415863037109, "global_step": 76593, "epoch": 1823} {"train_loss": -6.002762794494629, "global_step": 76594, "epoch": 1823} {"train_loss": -6.135097026824951, "global_step": 76595, "epoch": 1823} {"train_loss": -6.108902931213379, "global_step": 76596, "epoch": 1823} {"train_loss": -6.025384902954102, "global_step": 76597, "epoch": 1823} {"train_loss": -6.270739555358887, "global_step": 76598, "epoch": 1823} {"train_loss": -6.113738059997559, "global_step": 76599, "epoch": 1823} {"train_loss": -6.158664226531982, "global_step": 76600, "epoch": 1823} {"train_loss": -6.157672882080078, "global_step": 76601, "epoch": 1823} {"train_loss": -6.1307902336120605, "global_step": 76602, "epoch": 1823} {"train_loss": -6.14556884765625, "global_step": 76603, "epoch": 1823} {"train_loss": -6.025237083435059, "global_step": 76604, "epoch": 1823} {"train_loss": -6.1802754402160645, "global_step": 76605, "epoch": 1823} {"train_loss": -6.089301109313965, "global_step": 76606, "epoch": 1823} {"train_loss": -6.0818230992271785, "global_step": 76607, "epoch": 1823, "val_loss": 67465.609375} {"train_loss": -6.1860551834106445, "global_step": 76608, "epoch": 1824} {"train_loss": -6.041969299316406, "global_step": 76609, "epoch": 1824} {"train_loss": -6.142745494842529, "global_step": 76610, "epoch": 1824} {"train_loss": -6.128301620483398, "global_step": 76611, "epoch": 1824} {"train_loss": -6.101451396942139, "global_step": 76612, "epoch": 1824} {"train_loss": -6.20840311050415, "global_step": 76613, "epoch": 1824} {"train_loss": -6.009396553039551, "global_step": 76614, "epoch": 1824} {"train_loss": -6.054551124572754, "global_step": 76615, "epoch": 1824} {"train_loss": -6.097699165344238, "global_step": 76616, "epoch": 1824} {"train_loss": -6.024548530578613, "global_step": 76617, "epoch": 1824} {"train_loss": -6.138730525970459, "global_step": 76618, "epoch": 1824} {"train_loss": -6.00019645690918, "global_step": 76619, "epoch": 1824} {"train_loss": -6.0693254470825195, "global_step": 76620, "epoch": 1824} {"train_loss": -6.054509162902832, "global_step": 76621, "epoch": 1824} {"train_loss": -5.962032794952393, "global_step": 76622, "epoch": 1824} {"train_loss": -6.052670478820801, "global_step": 76623, "epoch": 1824} {"train_loss": -6.181724548339844, "global_step": 76624, "epoch": 1824} {"train_loss": -6.089743614196777, "global_step": 76625, "epoch": 1824} {"train_loss": -6.086082458496094, "global_step": 76626, "epoch": 1824} {"train_loss": -6.1289448738098145, "global_step": 76627, "epoch": 1824} {"train_loss": -6.120322227478027, "global_step": 76628, "epoch": 1824} {"train_loss": -6.058725357055664, "global_step": 76629, "epoch": 1824} {"train_loss": -6.194767475128174, "global_step": 76630, "epoch": 1824} {"train_loss": -6.108644008636475, "global_step": 76631, "epoch": 1824} {"train_loss": -6.180210590362549, "global_step": 76632, "epoch": 1824} {"train_loss": -6.177844524383545, "global_step": 76633, "epoch": 1824} {"train_loss": -6.161071300506592, "global_step": 76634, "epoch": 1824} {"train_loss": -6.08648681640625, "global_step": 76635, "epoch": 1824} {"train_loss": -6.162843704223633, "global_step": 76636, "epoch": 1824} {"train_loss": -6.06892204284668, "global_step": 76637, "epoch": 1824} {"train_loss": -6.091271877288818, "global_step": 76638, "epoch": 1824} {"train_loss": -6.113607406616211, "global_step": 76639, "epoch": 1824} {"train_loss": -6.112648010253906, "global_step": 76640, "epoch": 1824} {"train_loss": -6.250425815582275, "global_step": 76641, "epoch": 1824} {"train_loss": -6.115647315979004, "global_step": 76642, "epoch": 1824} {"train_loss": -5.977481365203857, "global_step": 76643, "epoch": 1824} {"train_loss": -6.130212306976318, "global_step": 76644, "epoch": 1824} {"train_loss": -6.16460657119751, "global_step": 76645, "epoch": 1824} {"train_loss": -6.083545207977295, "global_step": 76646, "epoch": 1824} {"train_loss": -5.973382949829102, "global_step": 76647, "epoch": 1824} {"train_loss": -6.199052333831787, "global_step": 76648, "epoch": 1824} {"train_loss": -6.105411075410389, "global_step": 76649, "epoch": 1824, "val_loss": 67352.8203125} {"train_loss": -6.075443267822266, "global_step": 76650, "epoch": 1825} {"train_loss": -6.1523942947387695, "global_step": 76651, "epoch": 1825} {"train_loss": -6.163843154907227, "global_step": 76652, "epoch": 1825} {"train_loss": -6.125962257385254, "global_step": 76653, "epoch": 1825} {"train_loss": -6.123716354370117, "global_step": 76654, "epoch": 1825} {"train_loss": -6.068964958190918, "global_step": 76655, "epoch": 1825} {"train_loss": -6.171919822692871, "global_step": 76656, "epoch": 1825} {"train_loss": -6.0516767501831055, "global_step": 76657, "epoch": 1825} {"train_loss": -6.089337348937988, "global_step": 76658, "epoch": 1825} {"train_loss": -6.099688529968262, "global_step": 76659, "epoch": 1825} {"train_loss": -6.1497039794921875, "global_step": 76660, "epoch": 1825} {"train_loss": -6.144657135009766, "global_step": 76661, "epoch": 1825} {"train_loss": -5.953260898590088, "global_step": 76662, "epoch": 1825} {"train_loss": -6.172143936157227, "global_step": 76663, "epoch": 1825} {"train_loss": -6.049892425537109, "global_step": 76664, "epoch": 1825} {"train_loss": -6.083150863647461, "global_step": 76665, "epoch": 1825} {"train_loss": -6.124545574188232, "global_step": 76666, "epoch": 1825} {"train_loss": -5.941040992736816, "global_step": 76667, "epoch": 1825} {"train_loss": -6.098928928375244, "global_step": 76668, "epoch": 1825} {"train_loss": -5.960597038269043, "global_step": 76669, "epoch": 1825} {"train_loss": -6.129578590393066, "global_step": 76670, "epoch": 1825} {"train_loss": -6.033868312835693, "global_step": 76671, "epoch": 1825} {"train_loss": -5.992194652557373, "global_step": 76672, "epoch": 1825} {"train_loss": -6.170864105224609, "global_step": 76673, "epoch": 1825} {"train_loss": -6.103573799133301, "global_step": 76674, "epoch": 1825} {"train_loss": -6.052078723907471, "global_step": 76675, "epoch": 1825} {"train_loss": -5.870566368103027, "global_step": 76676, "epoch": 1825} {"train_loss": -6.024408340454102, "global_step": 76677, "epoch": 1825} {"train_loss": -6.100153923034668, "global_step": 76678, "epoch": 1825} {"train_loss": -6.007349491119385, "global_step": 76679, "epoch": 1825} {"train_loss": -6.074363708496094, "global_step": 76680, "epoch": 1825} {"train_loss": -6.022439956665039, "global_step": 76681, "epoch": 1825} {"train_loss": -6.081401348114014, "global_step": 76682, "epoch": 1825} {"train_loss": -6.094853401184082, "global_step": 76683, "epoch": 1825} {"train_loss": -6.042413711547852, "global_step": 76684, "epoch": 1825} {"train_loss": -6.135374546051025, "global_step": 76685, "epoch": 1825} {"train_loss": -5.858454704284668, "global_step": 76686, "epoch": 1825} {"train_loss": -6.149188995361328, "global_step": 76687, "epoch": 1825} {"train_loss": -6.043371200561523, "global_step": 76688, "epoch": 1825} {"train_loss": -5.935965061187744, "global_step": 76689, "epoch": 1825} {"train_loss": -6.0531816482543945, "global_step": 76690, "epoch": 1825} {"train_loss": -6.065560511180332, "global_step": 76691, "epoch": 1825, "val_loss": 67640.4921875} {"train_loss": -6.01295280456543, "global_step": 76692, "epoch": 1826} {"train_loss": -6.167200565338135, "global_step": 76693, "epoch": 1826} {"train_loss": -5.938443183898926, "global_step": 76694, "epoch": 1826} {"train_loss": -6.077388763427734, "global_step": 76695, "epoch": 1826} {"train_loss": -6.097646713256836, "global_step": 76696, "epoch": 1826} {"train_loss": -6.029929161071777, "global_step": 76697, "epoch": 1826} {"train_loss": -6.046850204467773, "global_step": 76698, "epoch": 1826} {"train_loss": -6.016432762145996, "global_step": 76699, "epoch": 1826} {"train_loss": -6.146273612976074, "global_step": 76700, "epoch": 1826} {"train_loss": -6.009762763977051, "global_step": 76701, "epoch": 1826} {"train_loss": -6.166044235229492, "global_step": 76702, "epoch": 1826} {"train_loss": -6.120576858520508, "global_step": 76703, "epoch": 1826} {"train_loss": -6.07913875579834, "global_step": 76704, "epoch": 1826} {"train_loss": -6.141304969787598, "global_step": 76705, "epoch": 1826} {"train_loss": -6.236072540283203, "global_step": 76706, "epoch": 1826} {"train_loss": -6.085627555847168, "global_step": 76707, "epoch": 1826} {"train_loss": -6.258925437927246, "global_step": 76708, "epoch": 1826} {"train_loss": -6.202688217163086, "global_step": 76709, "epoch": 1826} {"train_loss": -6.101025104522705, "global_step": 76710, "epoch": 1826} {"train_loss": -6.143064498901367, "global_step": 76711, "epoch": 1826} {"train_loss": -6.211301326751709, "global_step": 76712, "epoch": 1826} {"train_loss": -6.012197017669678, "global_step": 76713, "epoch": 1826} {"train_loss": -6.045263290405273, "global_step": 76714, "epoch": 1826} {"train_loss": -6.099625587463379, "global_step": 76715, "epoch": 1826} {"train_loss": -6.023726463317871, "global_step": 76716, "epoch": 1826} {"train_loss": -6.121999740600586, "global_step": 76717, "epoch": 1826} {"train_loss": -6.030487060546875, "global_step": 76718, "epoch": 1826} {"train_loss": -5.912015914916992, "global_step": 76719, "epoch": 1826} {"train_loss": -6.072885036468506, "global_step": 76720, "epoch": 1826} {"train_loss": -6.072904586791992, "global_step": 76721, "epoch": 1826} {"train_loss": -6.0127410888671875, "global_step": 76722, "epoch": 1826} {"train_loss": -6.034303188323975, "global_step": 76723, "epoch": 1826} {"train_loss": -5.999422550201416, "global_step": 76724, "epoch": 1826} {"train_loss": -6.087540149688721, "global_step": 76725, "epoch": 1826} {"train_loss": -6.012767791748047, "global_step": 76726, "epoch": 1826} {"train_loss": -6.068662643432617, "global_step": 76727, "epoch": 1826} {"train_loss": -6.059128284454346, "global_step": 76728, "epoch": 1826} {"train_loss": -6.119710922241211, "global_step": 76729, "epoch": 1826} {"train_loss": -5.964728832244873, "global_step": 76730, "epoch": 1826} {"train_loss": -6.262791633605957, "global_step": 76731, "epoch": 1826} {"train_loss": -5.90886926651001, "global_step": 76732, "epoch": 1826} {"train_loss": -6.078852403731573, "global_step": 76733, "epoch": 1826, "val_loss": 67673.2109375} {"train_loss": -6.121554374694824, "global_step": 76734, "epoch": 1827} {"train_loss": -6.126142978668213, "global_step": 76735, "epoch": 1827} {"train_loss": -6.02994966506958, "global_step": 76736, "epoch": 1827} {"train_loss": -6.0673627853393555, "global_step": 76737, "epoch": 1827} {"train_loss": -6.17866849899292, "global_step": 76738, "epoch": 1827} {"train_loss": -6.009727478027344, "global_step": 76739, "epoch": 1827} {"train_loss": -6.063360214233398, "global_step": 76740, "epoch": 1827} {"train_loss": -6.047574520111084, "global_step": 76741, "epoch": 1827} {"train_loss": -6.087623119354248, "global_step": 76742, "epoch": 1827} {"train_loss": -6.089617729187012, "global_step": 76743, "epoch": 1827} {"train_loss": -5.989284515380859, "global_step": 76744, "epoch": 1827} {"train_loss": -6.062880992889404, "global_step": 76745, "epoch": 1827} {"train_loss": -6.083317756652832, "global_step": 76746, "epoch": 1827} {"train_loss": -6.014402389526367, "global_step": 76747, "epoch": 1827} {"train_loss": -6.099225997924805, "global_step": 76748, "epoch": 1827} {"train_loss": -6.004189491271973, "global_step": 76749, "epoch": 1827} {"train_loss": -6.146483421325684, "global_step": 76750, "epoch": 1827} {"train_loss": -5.995800018310547, "global_step": 76751, "epoch": 1827} {"train_loss": -6.158059120178223, "global_step": 76752, "epoch": 1827} {"train_loss": -6.044596195220947, "global_step": 76753, "epoch": 1827} {"train_loss": -6.1220173835754395, "global_step": 76754, "epoch": 1827} {"train_loss": -6.087366104125977, "global_step": 76755, "epoch": 1827} {"train_loss": -6.13353967666626, "global_step": 76756, "epoch": 1827} {"train_loss": -6.181067943572998, "global_step": 76757, "epoch": 1827} {"train_loss": -6.152481555938721, "global_step": 76758, "epoch": 1827} {"train_loss": -6.093537330627441, "global_step": 76759, "epoch": 1827} {"train_loss": -6.133932590484619, "global_step": 76760, "epoch": 1827} {"train_loss": -6.075223445892334, "global_step": 76761, "epoch": 1827} {"train_loss": -6.143291473388672, "global_step": 76762, "epoch": 1827} {"train_loss": -6.182639122009277, "global_step": 76763, "epoch": 1827} {"train_loss": -6.066390514373779, "global_step": 76764, "epoch": 1827} {"train_loss": -6.112872123718262, "global_step": 76765, "epoch": 1827} {"train_loss": -6.160146713256836, "global_step": 76766, "epoch": 1827} {"train_loss": -6.11266565322876, "global_step": 76767, "epoch": 1827} {"train_loss": -6.132008075714111, "global_step": 76768, "epoch": 1827} {"train_loss": -6.089286804199219, "global_step": 76769, "epoch": 1827} {"train_loss": -6.1743340492248535, "global_step": 76770, "epoch": 1827} {"train_loss": -6.0667619705200195, "global_step": 76771, "epoch": 1827} {"train_loss": -5.999439716339111, "global_step": 76772, "epoch": 1827} {"train_loss": -6.168927192687988, "global_step": 76773, "epoch": 1827} {"train_loss": -6.120790481567383, "global_step": 76774, "epoch": 1827} {"train_loss": -6.096585069383893, "global_step": 76775, "epoch": 1827, "val_loss": 67533.1875} {"train_loss": -6.097633361816406, "global_step": 76776, "epoch": 1828} {"train_loss": -6.1933088302612305, "global_step": 76777, "epoch": 1828} {"train_loss": -6.169086456298828, "global_step": 76778, "epoch": 1828} {"train_loss": -6.144665718078613, "global_step": 76779, "epoch": 1828} {"train_loss": -6.088024616241455, "global_step": 76780, "epoch": 1828} {"train_loss": -6.183497905731201, "global_step": 76781, "epoch": 1828} {"train_loss": -6.11582088470459, "global_step": 76782, "epoch": 1828} {"train_loss": -6.102303504943848, "global_step": 76783, "epoch": 1828} {"train_loss": -6.129214763641357, "global_step": 76784, "epoch": 1828} {"train_loss": -6.0745158195495605, "global_step": 76785, "epoch": 1828} {"train_loss": -5.991628646850586, "global_step": 76786, "epoch": 1828} {"train_loss": -6.020307540893555, "global_step": 76787, "epoch": 1828} {"train_loss": -5.919337749481201, "global_step": 76788, "epoch": 1828} {"train_loss": -6.056687831878662, "global_step": 76789, "epoch": 1828} {"train_loss": -6.096035480499268, "global_step": 76790, "epoch": 1828} {"train_loss": -6.110686302185059, "global_step": 76791, "epoch": 1828} {"train_loss": -5.975401878356934, "global_step": 76792, "epoch": 1828} {"train_loss": -5.9360127449035645, "global_step": 76793, "epoch": 1828} {"train_loss": -6.090264797210693, "global_step": 76794, "epoch": 1828} {"train_loss": -5.976315498352051, "global_step": 76795, "epoch": 1828} {"train_loss": -6.0216522216796875, "global_step": 76796, "epoch": 1828} {"train_loss": -6.1648359298706055, "global_step": 76797, "epoch": 1828} {"train_loss": -6.064427375793457, "global_step": 76798, "epoch": 1828} {"train_loss": -6.153837203979492, "global_step": 76799, "epoch": 1828} {"train_loss": -6.19481897354126, "global_step": 76800, "epoch": 1828} {"train_loss": -6.010954856872559, "global_step": 76801, "epoch": 1828} {"train_loss": -6.035470008850098, "global_step": 76802, "epoch": 1828} {"train_loss": -6.093574047088623, "global_step": 76803, "epoch": 1828} {"train_loss": -6.073399066925049, "global_step": 76804, "epoch": 1828} {"train_loss": -6.132906436920166, "global_step": 76805, "epoch": 1828} {"train_loss": -5.976813793182373, "global_step": 76806, "epoch": 1828} {"train_loss": -6.048283100128174, "global_step": 76807, "epoch": 1828} {"train_loss": -6.065824508666992, "global_step": 76808, "epoch": 1828} {"train_loss": -6.00496244430542, "global_step": 76809, "epoch": 1828} {"train_loss": -6.005321025848389, "global_step": 76810, "epoch": 1828} {"train_loss": -6.0660529136657715, "global_step": 76811, "epoch": 1828} {"train_loss": -5.983184814453125, "global_step": 76812, "epoch": 1828} {"train_loss": -6.0493292808532715, "global_step": 76813, "epoch": 1828} {"train_loss": -6.135677814483643, "global_step": 76814, "epoch": 1828} {"train_loss": -6.083626747131348, "global_step": 76815, "epoch": 1828} {"train_loss": -6.176156997680664, "global_step": 76816, "epoch": 1828} {"train_loss": -6.073151122956049, "global_step": 76817, "epoch": 1828, "val_loss": 67812.3828125} {"train_loss": -6.117315292358398, "global_step": 76818, "epoch": 1829} {"train_loss": -6.002738952636719, "global_step": 76819, "epoch": 1829} {"train_loss": -6.011396884918213, "global_step": 76820, "epoch": 1829} {"train_loss": -6.0142412185668945, "global_step": 76821, "epoch": 1829} {"train_loss": -6.117836952209473, "global_step": 76822, "epoch": 1829} {"train_loss": -6.039742469787598, "global_step": 76823, "epoch": 1829} {"train_loss": -6.106927871704102, "global_step": 76824, "epoch": 1829} {"train_loss": -6.045337677001953, "global_step": 76825, "epoch": 1829} {"train_loss": -6.120652198791504, "global_step": 76826, "epoch": 1829} {"train_loss": -6.118424892425537, "global_step": 76827, "epoch": 1829} {"train_loss": -6.141903877258301, "global_step": 76828, "epoch": 1829} {"train_loss": -6.118813991546631, "global_step": 76829, "epoch": 1829} {"train_loss": -6.066224575042725, "global_step": 76830, "epoch": 1829} {"train_loss": -6.198920249938965, "global_step": 76831, "epoch": 1829} {"train_loss": -6.076157093048096, "global_step": 76832, "epoch": 1829} {"train_loss": -6.117374897003174, "global_step": 76833, "epoch": 1829} {"train_loss": -6.098354816436768, "global_step": 76834, "epoch": 1829} {"train_loss": -5.984110355377197, "global_step": 76835, "epoch": 1829} {"train_loss": -5.983395576477051, "global_step": 76836, "epoch": 1829} {"train_loss": -5.90596866607666, "global_step": 76837, "epoch": 1829} {"train_loss": -6.130561351776123, "global_step": 76838, "epoch": 1829} {"train_loss": -6.084261417388916, "global_step": 76839, "epoch": 1829} {"train_loss": -6.075589656829834, "global_step": 76840, "epoch": 1829} {"train_loss": -6.218494415283203, "global_step": 76841, "epoch": 1829} {"train_loss": -6.014098644256592, "global_step": 76842, "epoch": 1829} {"train_loss": -5.996318817138672, "global_step": 76843, "epoch": 1829} {"train_loss": -6.024899482727051, "global_step": 76844, "epoch": 1829} {"train_loss": -6.094496250152588, "global_step": 76845, "epoch": 1829} {"train_loss": -6.1573944091796875, "global_step": 76846, "epoch": 1829} {"train_loss": -6.1787638664245605, "global_step": 76847, "epoch": 1829} {"train_loss": -6.086538791656494, "global_step": 76848, "epoch": 1829} {"train_loss": -6.035545349121094, "global_step": 76849, "epoch": 1829} {"train_loss": -6.065446853637695, "global_step": 76850, "epoch": 1829} {"train_loss": -6.150448322296143, "global_step": 76851, "epoch": 1829} {"train_loss": -6.119157314300537, "global_step": 76852, "epoch": 1829} {"train_loss": -6.20083475112915, "global_step": 76853, "epoch": 1829} {"train_loss": -6.106319427490234, "global_step": 76854, "epoch": 1829} {"train_loss": -6.123357772827148, "global_step": 76855, "epoch": 1829} {"train_loss": -6.219205856323242, "global_step": 76856, "epoch": 1829} {"train_loss": -6.092937469482422, "global_step": 76857, "epoch": 1829} {"train_loss": -6.093252182006836, "global_step": 76858, "epoch": 1829} {"train_loss": -6.088833263942173, "global_step": 76859, "epoch": 1829, "val_loss": 67788.8125} {"train_loss": -6.149048805236816, "global_step": 76860, "epoch": 1830} {"train_loss": -6.209927082061768, "global_step": 76861, "epoch": 1830} {"train_loss": -6.134919166564941, "global_step": 76862, "epoch": 1830} {"train_loss": -6.0832085609436035, "global_step": 76863, "epoch": 1830} {"train_loss": -6.044317245483398, "global_step": 76864, "epoch": 1830} {"train_loss": -5.953011512756348, "global_step": 76865, "epoch": 1830} {"train_loss": -6.1413798332214355, "global_step": 76866, "epoch": 1830} {"train_loss": -6.004440784454346, "global_step": 76867, "epoch": 1830} {"train_loss": -5.956449508666992, "global_step": 76868, "epoch": 1830} {"train_loss": -6.146336078643799, "global_step": 76869, "epoch": 1830} {"train_loss": -6.004461288452148, "global_step": 76870, "epoch": 1830} {"train_loss": -6.087211608886719, "global_step": 76871, "epoch": 1830} {"train_loss": -6.025531768798828, "global_step": 76872, "epoch": 1830} {"train_loss": -6.061741828918457, "global_step": 76873, "epoch": 1830} {"train_loss": -6.076872825622559, "global_step": 76874, "epoch": 1830} {"train_loss": -6.067243576049805, "global_step": 76875, "epoch": 1830} {"train_loss": -6.026963710784912, "global_step": 76876, "epoch": 1830} {"train_loss": -5.993924617767334, "global_step": 76877, "epoch": 1830} {"train_loss": -6.012358665466309, "global_step": 76878, "epoch": 1830} {"train_loss": -6.077970027923584, "global_step": 76879, "epoch": 1830} {"train_loss": -5.983706474304199, "global_step": 76880, "epoch": 1830} {"train_loss": -6.0526556968688965, "global_step": 76881, "epoch": 1830} {"train_loss": -6.189545631408691, "global_step": 76882, "epoch": 1830} {"train_loss": -6.0522661209106445, "global_step": 76883, "epoch": 1830} {"train_loss": -5.995165824890137, "global_step": 76884, "epoch": 1830} {"train_loss": -6.127868175506592, "global_step": 76885, "epoch": 1830} {"train_loss": -6.091512203216553, "global_step": 76886, "epoch": 1830} {"train_loss": -6.006361961364746, "global_step": 76887, "epoch": 1830} {"train_loss": -6.149052143096924, "global_step": 76888, "epoch": 1830} {"train_loss": -5.986070156097412, "global_step": 76889, "epoch": 1830} {"train_loss": -6.130160808563232, "global_step": 76890, "epoch": 1830} {"train_loss": -6.070052623748779, "global_step": 76891, "epoch": 1830} {"train_loss": -6.1255998611450195, "global_step": 76892, "epoch": 1830} {"train_loss": -6.073686599731445, "global_step": 76893, "epoch": 1830} {"train_loss": -6.117925643920898, "global_step": 76894, "epoch": 1830} {"train_loss": -6.007734298706055, "global_step": 76895, "epoch": 1830} {"train_loss": -5.945333480834961, "global_step": 76896, "epoch": 1830} {"train_loss": -5.9850616455078125, "global_step": 76897, "epoch": 1830} {"train_loss": -6.010643005371094, "global_step": 76898, "epoch": 1830} {"train_loss": -6.049559116363525, "global_step": 76899, "epoch": 1830} {"train_loss": -5.960919380187988, "global_step": 76900, "epoch": 1830} {"train_loss": -6.059054056803386, "global_step": 76901, "epoch": 1830, "val_loss": 67549.28125} {"train_loss": -6.046253204345703, "global_step": 76902, "epoch": 1831} {"train_loss": -6.105746746063232, "global_step": 76903, "epoch": 1831} {"train_loss": -6.125360488891602, "global_step": 76904, "epoch": 1831} {"train_loss": -6.133728504180908, "global_step": 76905, "epoch": 1831} {"train_loss": -6.096168041229248, "global_step": 76906, "epoch": 1831} {"train_loss": -6.1318817138671875, "global_step": 76907, "epoch": 1831} {"train_loss": -6.041197776794434, "global_step": 76908, "epoch": 1831} {"train_loss": -5.885962963104248, "global_step": 76909, "epoch": 1831} {"train_loss": -5.958481788635254, "global_step": 76910, "epoch": 1831} {"train_loss": -6.140198707580566, "global_step": 76911, "epoch": 1831} {"train_loss": -6.068614959716797, "global_step": 76912, "epoch": 1831} {"train_loss": -6.061254978179932, "global_step": 76913, "epoch": 1831} {"train_loss": -6.204054832458496, "global_step": 76914, "epoch": 1831} {"train_loss": -6.1363396644592285, "global_step": 76915, "epoch": 1831} {"train_loss": -6.1574296951293945, "global_step": 76916, "epoch": 1831} {"train_loss": -6.073592662811279, "global_step": 76917, "epoch": 1831} {"train_loss": -6.108630180358887, "global_step": 76918, "epoch": 1831} {"train_loss": -6.011520862579346, "global_step": 76919, "epoch": 1831} {"train_loss": -6.027362823486328, "global_step": 76920, "epoch": 1831} {"train_loss": -6.118791580200195, "global_step": 76921, "epoch": 1831} {"train_loss": -6.147612571716309, "global_step": 76922, "epoch": 1831} {"train_loss": -6.116167068481445, "global_step": 76923, "epoch": 1831} {"train_loss": -6.139328479766846, "global_step": 76924, "epoch": 1831} {"train_loss": -6.239316940307617, "global_step": 76925, "epoch": 1831} {"train_loss": -6.099267959594727, "global_step": 76926, "epoch": 1831} {"train_loss": -6.060529708862305, "global_step": 76927, "epoch": 1831} {"train_loss": -6.055352687835693, "global_step": 76928, "epoch": 1831} {"train_loss": -6.127585411071777, "global_step": 76929, "epoch": 1831} {"train_loss": -6.158075332641602, "global_step": 76930, "epoch": 1831} {"train_loss": -6.1145920753479, "global_step": 76931, "epoch": 1831} {"train_loss": -6.1074018478393555, "global_step": 76932, "epoch": 1831} {"train_loss": -6.081628799438477, "global_step": 76933, "epoch": 1831} {"train_loss": -6.188572406768799, "global_step": 76934, "epoch": 1831} {"train_loss": -6.035067558288574, "global_step": 76935, "epoch": 1831} {"train_loss": -6.084563255310059, "global_step": 76936, "epoch": 1831} {"train_loss": -6.051126003265381, "global_step": 76937, "epoch": 1831} {"train_loss": -6.120815277099609, "global_step": 76938, "epoch": 1831} {"train_loss": -6.108624458312988, "global_step": 76939, "epoch": 1831} {"train_loss": -6.123926639556885, "global_step": 76940, "epoch": 1831} {"train_loss": -6.081433296203613, "global_step": 76941, "epoch": 1831} {"train_loss": -6.178242206573486, "global_step": 76942, "epoch": 1831} {"train_loss": -6.0998617353893465, "global_step": 76943, "epoch": 1831, "val_loss": 67474.40625} {"train_loss": -6.073180675506592, "global_step": 76944, "epoch": 1832} {"train_loss": -6.152830600738525, "global_step": 76945, "epoch": 1832} {"train_loss": -6.196869850158691, "global_step": 76946, "epoch": 1832} {"train_loss": -6.103390216827393, "global_step": 76947, "epoch": 1832} {"train_loss": -5.9240312576293945, "global_step": 76948, "epoch": 1832} {"train_loss": -6.035931587219238, "global_step": 76949, "epoch": 1832} {"train_loss": -6.087447166442871, "global_step": 76950, "epoch": 1832} {"train_loss": -6.006667137145996, "global_step": 76951, "epoch": 1832} {"train_loss": -6.140824317932129, "global_step": 76952, "epoch": 1832} {"train_loss": -6.2003631591796875, "global_step": 76953, "epoch": 1832} {"train_loss": -6.164216995239258, "global_step": 76954, "epoch": 1832} {"train_loss": -6.063125133514404, "global_step": 76955, "epoch": 1832} {"train_loss": -6.249207973480225, "global_step": 76956, "epoch": 1832} {"train_loss": -6.162842750549316, "global_step": 76957, "epoch": 1832} {"train_loss": -6.245182037353516, "global_step": 76958, "epoch": 1832} {"train_loss": -6.1403608322143555, "global_step": 76959, "epoch": 1832} {"train_loss": -5.96968936920166, "global_step": 76960, "epoch": 1832} {"train_loss": -6.1003618240356445, "global_step": 76961, "epoch": 1832} {"train_loss": -6.142656326293945, "global_step": 76962, "epoch": 1832} {"train_loss": -6.064606666564941, "global_step": 76963, "epoch": 1832} {"train_loss": -6.112151622772217, "global_step": 76964, "epoch": 1832} {"train_loss": -6.063083171844482, "global_step": 76965, "epoch": 1832} {"train_loss": -6.046492576599121, "global_step": 76966, "epoch": 1832} {"train_loss": -6.203907012939453, "global_step": 76967, "epoch": 1832} {"train_loss": -5.882317543029785, "global_step": 76968, "epoch": 1832} {"train_loss": -6.142825603485107, "global_step": 76969, "epoch": 1832} {"train_loss": -6.171987533569336, "global_step": 76970, "epoch": 1832} {"train_loss": -6.173547267913818, "global_step": 76971, "epoch": 1832} {"train_loss": -6.046918869018555, "global_step": 76972, "epoch": 1832} {"train_loss": -6.058280944824219, "global_step": 76973, "epoch": 1832} {"train_loss": -6.035423278808594, "global_step": 76974, "epoch": 1832} {"train_loss": -6.006318092346191, "global_step": 76975, "epoch": 1832} {"train_loss": -6.143862724304199, "global_step": 76976, "epoch": 1832} {"train_loss": -6.212212562561035, "global_step": 76977, "epoch": 1832} {"train_loss": -6.29633903503418, "global_step": 76978, "epoch": 1832} {"train_loss": -6.168307781219482, "global_step": 76979, "epoch": 1832} {"train_loss": -6.046336650848389, "global_step": 76980, "epoch": 1832} {"train_loss": -6.169909477233887, "global_step": 76981, "epoch": 1832} {"train_loss": -6.181201934814453, "global_step": 76982, "epoch": 1832} {"train_loss": -6.08832311630249, "global_step": 76983, "epoch": 1832} {"train_loss": -6.059349060058594, "global_step": 76984, "epoch": 1832} {"train_loss": -6.107877969741821, "global_step": 76985, "epoch": 1832, "val_loss": 67707.3359375} {"train_loss": -6.000374794006348, "global_step": 76986, "epoch": 1833} {"train_loss": -6.10289192199707, "global_step": 76987, "epoch": 1833} {"train_loss": -5.990107536315918, "global_step": 76988, "epoch": 1833} {"train_loss": -6.1853179931640625, "global_step": 76989, "epoch": 1833} {"train_loss": -6.007468223571777, "global_step": 76990, "epoch": 1833} {"train_loss": -6.015805721282959, "global_step": 76991, "epoch": 1833} {"train_loss": -6.122596263885498, "global_step": 76992, "epoch": 1833} {"train_loss": -6.070322036743164, "global_step": 76993, "epoch": 1833} {"train_loss": -6.066141128540039, "global_step": 76994, "epoch": 1833} {"train_loss": -6.096673965454102, "global_step": 76995, "epoch": 1833} {"train_loss": -6.094050407409668, "global_step": 76996, "epoch": 1833} {"train_loss": -6.020394802093506, "global_step": 76997, "epoch": 1833} {"train_loss": -6.112545967102051, "global_step": 76998, "epoch": 1833} {"train_loss": -6.100338935852051, "global_step": 76999, "epoch": 1833} {"train_loss": -6.129181385040283, "global_step": 77000, "epoch": 1833} {"train_loss": -6.147185802459717, "global_step": 77001, "epoch": 1833} {"train_loss": -6.007602691650391, "global_step": 77002, "epoch": 1833} {"train_loss": -5.996087074279785, "global_step": 77003, "epoch": 1833} {"train_loss": -6.112199783325195, "global_step": 77004, "epoch": 1833} {"train_loss": -6.110834121704102, "global_step": 77005, "epoch": 1833} {"train_loss": -6.123108863830566, "global_step": 77006, "epoch": 1833} {"train_loss": -6.00548791885376, "global_step": 77007, "epoch": 1833} {"train_loss": -6.040780067443848, "global_step": 77008, "epoch": 1833} {"train_loss": -6.053218841552734, "global_step": 77009, "epoch": 1833} {"train_loss": -6.114882469177246, "global_step": 77010, "epoch": 1833} {"train_loss": -6.0568718910217285, "global_step": 77011, "epoch": 1833} {"train_loss": -6.084626197814941, "global_step": 77012, "epoch": 1833} {"train_loss": -6.078606128692627, "global_step": 77013, "epoch": 1833} {"train_loss": -6.145540237426758, "global_step": 77014, "epoch": 1833} {"train_loss": -6.010001182556152, "global_step": 77015, "epoch": 1833} {"train_loss": -6.076541900634766, "global_step": 77016, "epoch": 1833} {"train_loss": -6.15521240234375, "global_step": 77017, "epoch": 1833} {"train_loss": -6.077404499053955, "global_step": 77018, "epoch": 1833} {"train_loss": -5.978492259979248, "global_step": 77019, "epoch": 1833} {"train_loss": -6.084610939025879, "global_step": 77020, "epoch": 1833} {"train_loss": -6.044747352600098, "global_step": 77021, "epoch": 1833} {"train_loss": -6.146732330322266, "global_step": 77022, "epoch": 1833} {"train_loss": -6.043953895568848, "global_step": 77023, "epoch": 1833} {"train_loss": -6.0195722579956055, "global_step": 77024, "epoch": 1833} {"train_loss": -6.067433834075928, "global_step": 77025, "epoch": 1833} {"train_loss": -6.045024871826172, "global_step": 77026, "epoch": 1833} {"train_loss": -6.0716915017082576, "global_step": 77027, "epoch": 1833, "val_loss": 67859.984375} {"train_loss": -6.050085067749023, "global_step": 77028, "epoch": 1834} {"train_loss": -6.080080509185791, "global_step": 77029, "epoch": 1834} {"train_loss": -6.081356525421143, "global_step": 77030, "epoch": 1834} {"train_loss": -6.162246227264404, "global_step": 77031, "epoch": 1834} {"train_loss": -6.140899658203125, "global_step": 77032, "epoch": 1834} {"train_loss": -6.053267478942871, "global_step": 77033, "epoch": 1834} {"train_loss": -6.137866020202637, "global_step": 77034, "epoch": 1834} {"train_loss": -6.047024726867676, "global_step": 77035, "epoch": 1834} {"train_loss": -6.066133499145508, "global_step": 77036, "epoch": 1834} {"train_loss": -6.142632484436035, "global_step": 77037, "epoch": 1834} {"train_loss": -6.075985908508301, "global_step": 77038, "epoch": 1834} {"train_loss": -6.083992958068848, "global_step": 77039, "epoch": 1834} {"train_loss": -6.161191463470459, "global_step": 77040, "epoch": 1834} {"train_loss": -6.07643985748291, "global_step": 77041, "epoch": 1834} {"train_loss": -5.993559837341309, "global_step": 77042, "epoch": 1834} {"train_loss": -6.076868057250977, "global_step": 77043, "epoch": 1834} {"train_loss": -6.091440200805664, "global_step": 77044, "epoch": 1834} {"train_loss": -6.191921234130859, "global_step": 77045, "epoch": 1834} {"train_loss": -6.163851737976074, "global_step": 77046, "epoch": 1834} {"train_loss": -6.1658935546875, "global_step": 77047, "epoch": 1834} {"train_loss": -6.049945831298828, "global_step": 77048, "epoch": 1834} {"train_loss": -6.199984550476074, "global_step": 77049, "epoch": 1834} {"train_loss": -6.07582950592041, "global_step": 77050, "epoch": 1834} {"train_loss": -6.10064172744751, "global_step": 77051, "epoch": 1834} {"train_loss": -6.122413635253906, "global_step": 77052, "epoch": 1834} {"train_loss": -6.202606201171875, "global_step": 77053, "epoch": 1834} {"train_loss": -6.112504959106445, "global_step": 77054, "epoch": 1834} {"train_loss": -6.048294544219971, "global_step": 77055, "epoch": 1834} {"train_loss": -6.116136074066162, "global_step": 77056, "epoch": 1834} {"train_loss": -6.17720890045166, "global_step": 77057, "epoch": 1834} {"train_loss": -6.275267601013184, "global_step": 77058, "epoch": 1834} {"train_loss": -6.180169105529785, "global_step": 77059, "epoch": 1834} {"train_loss": -6.044075012207031, "global_step": 77060, "epoch": 1834} {"train_loss": -6.074103832244873, "global_step": 77061, "epoch": 1834} {"train_loss": -6.087292671203613, "global_step": 77062, "epoch": 1834} {"train_loss": -5.902222633361816, "global_step": 77063, "epoch": 1834} {"train_loss": -6.067782402038574, "global_step": 77064, "epoch": 1834} {"train_loss": -5.985733985900879, "global_step": 77065, "epoch": 1834} {"train_loss": -6.0852251052856445, "global_step": 77066, "epoch": 1834} {"train_loss": -6.051779747009277, "global_step": 77067, "epoch": 1834} {"train_loss": -6.18304443359375, "global_step": 77068, "epoch": 1834} {"train_loss": -6.0992419719696045, "global_step": 77069, "epoch": 1834, "val_loss": 67358.2734375} {"train_loss": -6.100951194763184, "global_step": 77070, "epoch": 1835} {"train_loss": -6.179001808166504, "global_step": 77071, "epoch": 1835} {"train_loss": -5.96755313873291, "global_step": 77072, "epoch": 1835} {"train_loss": -6.0243754386901855, "global_step": 77073, "epoch": 1835} {"train_loss": -6.024514675140381, "global_step": 77074, "epoch": 1835} {"train_loss": -6.061009407043457, "global_step": 77075, "epoch": 1835} {"train_loss": -6.035762310028076, "global_step": 77076, "epoch": 1835} {"train_loss": -6.006746292114258, "global_step": 77077, "epoch": 1835} {"train_loss": -6.041961669921875, "global_step": 77078, "epoch": 1835} {"train_loss": -6.1923651695251465, "global_step": 77079, "epoch": 1835} {"train_loss": -6.014000415802002, "global_step": 77080, "epoch": 1835} {"train_loss": -6.107243061065674, "global_step": 77081, "epoch": 1835} {"train_loss": -6.131758689880371, "global_step": 77082, "epoch": 1835} {"train_loss": -5.99711799621582, "global_step": 77083, "epoch": 1835} {"train_loss": -6.0878472328186035, "global_step": 77084, "epoch": 1835} {"train_loss": -6.040637969970703, "global_step": 77085, "epoch": 1835} {"train_loss": -6.060796737670898, "global_step": 77086, "epoch": 1835} {"train_loss": -6.0069475173950195, "global_step": 77087, "epoch": 1835} {"train_loss": -6.085198402404785, "global_step": 77088, "epoch": 1835} {"train_loss": -6.093447208404541, "global_step": 77089, "epoch": 1835} {"train_loss": -6.002744197845459, "global_step": 77090, "epoch": 1835} {"train_loss": -6.125739097595215, "global_step": 77091, "epoch": 1835} {"train_loss": -6.217480659484863, "global_step": 77092, "epoch": 1835} {"train_loss": -6.080992698669434, "global_step": 77093, "epoch": 1835} {"train_loss": -6.125154495239258, "global_step": 77094, "epoch": 1835} {"train_loss": -6.189639091491699, "global_step": 77095, "epoch": 1835} {"train_loss": -6.064303398132324, "global_step": 77096, "epoch": 1835} {"train_loss": -6.24321985244751, "global_step": 77097, "epoch": 1835} {"train_loss": -6.024320602416992, "global_step": 77098, "epoch": 1835} {"train_loss": -6.026140213012695, "global_step": 77099, "epoch": 1835} {"train_loss": -6.106081008911133, "global_step": 77100, "epoch": 1835} {"train_loss": -6.159688949584961, "global_step": 77101, "epoch": 1835} {"train_loss": -6.0266571044921875, "global_step": 77102, "epoch": 1835} {"train_loss": -6.069942474365234, "global_step": 77103, "epoch": 1835} {"train_loss": -6.051994323730469, "global_step": 77104, "epoch": 1835} {"train_loss": -6.094069957733154, "global_step": 77105, "epoch": 1835} {"train_loss": -6.095236778259277, "global_step": 77106, "epoch": 1835} {"train_loss": -6.045571327209473, "global_step": 77107, "epoch": 1835} {"train_loss": -6.1163482666015625, "global_step": 77108, "epoch": 1835} {"train_loss": -6.144330024719238, "global_step": 77109, "epoch": 1835} {"train_loss": -6.038805961608887, "global_step": 77110, "epoch": 1835} {"train_loss": -6.08259703999474, "global_step": 77111, "epoch": 1835, "val_loss": 67434.1953125} {"train_loss": -6.072988033294678, "global_step": 77112, "epoch": 1836} {"train_loss": -6.158667087554932, "global_step": 77113, "epoch": 1836} {"train_loss": -6.087460041046143, "global_step": 77114, "epoch": 1836} {"train_loss": -6.123666763305664, "global_step": 77115, "epoch": 1836} {"train_loss": -6.059439659118652, "global_step": 77116, "epoch": 1836} {"train_loss": -5.988213062286377, "global_step": 77117, "epoch": 1836} {"train_loss": -6.023343086242676, "global_step": 77118, "epoch": 1836} {"train_loss": -6.158350944519043, "global_step": 77119, "epoch": 1836} {"train_loss": -6.011407852172852, "global_step": 77120, "epoch": 1836} {"train_loss": -6.1192779541015625, "global_step": 77121, "epoch": 1836} {"train_loss": -6.026913166046143, "global_step": 77122, "epoch": 1836} {"train_loss": -6.078892230987549, "global_step": 77123, "epoch": 1836} {"train_loss": -6.0521039962768555, "global_step": 77124, "epoch": 1836} {"train_loss": -6.187954425811768, "global_step": 77125, "epoch": 1836} {"train_loss": -6.133069038391113, "global_step": 77126, "epoch": 1836} {"train_loss": -5.9951605796813965, "global_step": 77127, "epoch": 1836} {"train_loss": -5.986125946044922, "global_step": 77128, "epoch": 1836} {"train_loss": -5.990200996398926, "global_step": 77129, "epoch": 1836} {"train_loss": -6.113131523132324, "global_step": 77130, "epoch": 1836} {"train_loss": -5.986026287078857, "global_step": 77131, "epoch": 1836} {"train_loss": -6.020801544189453, "global_step": 77132, "epoch": 1836} {"train_loss": -6.012429237365723, "global_step": 77133, "epoch": 1836} {"train_loss": -5.945257186889648, "global_step": 77134, "epoch": 1836} {"train_loss": -6.0842156410217285, "global_step": 77135, "epoch": 1836} {"train_loss": -6.0000457763671875, "global_step": 77136, "epoch": 1836} {"train_loss": -6.112026214599609, "global_step": 77137, "epoch": 1836} {"train_loss": -6.082774639129639, "global_step": 77138, "epoch": 1836} {"train_loss": -6.1606669425964355, "global_step": 77139, "epoch": 1836} {"train_loss": -6.031063079833984, "global_step": 77140, "epoch": 1836} {"train_loss": -6.136107444763184, "global_step": 77141, "epoch": 1836} {"train_loss": -5.979876518249512, "global_step": 77142, "epoch": 1836} {"train_loss": -6.022684097290039, "global_step": 77143, "epoch": 1836} {"train_loss": -5.929547309875488, "global_step": 77144, "epoch": 1836} {"train_loss": -6.091221809387207, "global_step": 77145, "epoch": 1836} {"train_loss": -6.162179946899414, "global_step": 77146, "epoch": 1836} {"train_loss": -6.10577917098999, "global_step": 77147, "epoch": 1836} {"train_loss": -6.167745113372803, "global_step": 77148, "epoch": 1836} {"train_loss": -5.99634313583374, "global_step": 77149, "epoch": 1836} {"train_loss": -6.073126792907715, "global_step": 77150, "epoch": 1836} {"train_loss": -6.153293132781982, "global_step": 77151, "epoch": 1836} {"train_loss": -6.144602298736572, "global_step": 77152, "epoch": 1836} {"train_loss": -6.0677578676314585, "global_step": 77153, "epoch": 1836, "val_loss": 67408.890625} {"train_loss": -6.144887924194336, "global_step": 77154, "epoch": 1837} {"train_loss": -6.137847900390625, "global_step": 77155, "epoch": 1837} {"train_loss": -6.092564582824707, "global_step": 77156, "epoch": 1837} {"train_loss": -6.1234822273254395, "global_step": 77157, "epoch": 1837} {"train_loss": -6.081783294677734, "global_step": 77158, "epoch": 1837} {"train_loss": -6.027365684509277, "global_step": 77159, "epoch": 1837} {"train_loss": -6.062493324279785, "global_step": 77160, "epoch": 1837} {"train_loss": -5.988336086273193, "global_step": 77161, "epoch": 1837} {"train_loss": -6.062817573547363, "global_step": 77162, "epoch": 1837} {"train_loss": -6.095336437225342, "global_step": 77163, "epoch": 1837} {"train_loss": -6.160569667816162, "global_step": 77164, "epoch": 1837} {"train_loss": -6.081064224243164, "global_step": 77165, "epoch": 1837} {"train_loss": -6.05816650390625, "global_step": 77166, "epoch": 1837} {"train_loss": -6.099238395690918, "global_step": 77167, "epoch": 1837} {"train_loss": -6.135662078857422, "global_step": 77168, "epoch": 1837} {"train_loss": -6.238085746765137, "global_step": 77169, "epoch": 1837} {"train_loss": -6.089450359344482, "global_step": 77170, "epoch": 1837} {"train_loss": -6.0998969078063965, "global_step": 77171, "epoch": 1837} {"train_loss": -6.1342692375183105, "global_step": 77172, "epoch": 1837} {"train_loss": -6.092737197875977, "global_step": 77173, "epoch": 1837} {"train_loss": -6.070472717285156, "global_step": 77174, "epoch": 1837} {"train_loss": -6.110292911529541, "global_step": 77175, "epoch": 1837} {"train_loss": -6.218219757080078, "global_step": 77176, "epoch": 1837} {"train_loss": -6.1824140548706055, "global_step": 77177, "epoch": 1837} {"train_loss": -6.061994552612305, "global_step": 77178, "epoch": 1837} {"train_loss": -6.165307998657227, "global_step": 77179, "epoch": 1837} {"train_loss": -6.120922088623047, "global_step": 77180, "epoch": 1837} {"train_loss": -6.220992565155029, "global_step": 77181, "epoch": 1837} {"train_loss": -5.950214385986328, "global_step": 77182, "epoch": 1837} {"train_loss": -6.00208044052124, "global_step": 77183, "epoch": 1837} {"train_loss": -6.208101272583008, "global_step": 77184, "epoch": 1837} {"train_loss": -6.122385025024414, "global_step": 77185, "epoch": 1837} {"train_loss": -6.014493942260742, "global_step": 77186, "epoch": 1837} {"train_loss": -5.986424446105957, "global_step": 77187, "epoch": 1837} {"train_loss": -6.071398735046387, "global_step": 77188, "epoch": 1837} {"train_loss": -6.1922736167907715, "global_step": 77189, "epoch": 1837} {"train_loss": -6.231900691986084, "global_step": 77190, "epoch": 1837} {"train_loss": -6.077371120452881, "global_step": 77191, "epoch": 1837} {"train_loss": -6.000000953674316, "global_step": 77192, "epoch": 1837} {"train_loss": -6.1805877685546875, "global_step": 77193, "epoch": 1837} {"train_loss": -6.075161457061768, "global_step": 77194, "epoch": 1837} {"train_loss": -6.105661982581729, "global_step": 77195, "epoch": 1837, "val_loss": 67462.6640625} {"train_loss": -6.0204315185546875, "global_step": 77196, "epoch": 1838} {"train_loss": -6.22002649307251, "global_step": 77197, "epoch": 1838} {"train_loss": -6.130849361419678, "global_step": 77198, "epoch": 1838} {"train_loss": -6.103818893432617, "global_step": 77199, "epoch": 1838} {"train_loss": -6.161765098571777, "global_step": 77200, "epoch": 1838} {"train_loss": -6.081724166870117, "global_step": 77201, "epoch": 1838} {"train_loss": -6.112895965576172, "global_step": 77202, "epoch": 1838} {"train_loss": -6.246639251708984, "global_step": 77203, "epoch": 1838} {"train_loss": -6.146747589111328, "global_step": 77204, "epoch": 1838} {"train_loss": -6.0578107833862305, "global_step": 77205, "epoch": 1838} {"train_loss": -6.174435615539551, "global_step": 77206, "epoch": 1838} {"train_loss": -6.171441078186035, "global_step": 77207, "epoch": 1838} {"train_loss": -6.176011085510254, "global_step": 77208, "epoch": 1838} {"train_loss": -6.101163864135742, "global_step": 77209, "epoch": 1838} {"train_loss": -6.22502326965332, "global_step": 77210, "epoch": 1838} {"train_loss": -6.157116413116455, "global_step": 77211, "epoch": 1838} {"train_loss": -6.2170820236206055, "global_step": 77212, "epoch": 1838} {"train_loss": -6.136317253112793, "global_step": 77213, "epoch": 1838} {"train_loss": -6.154749870300293, "global_step": 77214, "epoch": 1838} {"train_loss": -6.09231424331665, "global_step": 77215, "epoch": 1838} {"train_loss": -6.12615966796875, "global_step": 77216, "epoch": 1838} {"train_loss": -6.097231388092041, "global_step": 77217, "epoch": 1838} {"train_loss": -6.139501571655273, "global_step": 77218, "epoch": 1838} {"train_loss": -6.010729789733887, "global_step": 77219, "epoch": 1838} {"train_loss": -6.216590404510498, "global_step": 77220, "epoch": 1838} {"train_loss": -6.078588485717773, "global_step": 77221, "epoch": 1838} {"train_loss": -5.943221569061279, "global_step": 77222, "epoch": 1838} {"train_loss": -6.1062750816345215, "global_step": 77223, "epoch": 1838} {"train_loss": -5.958596229553223, "global_step": 77224, "epoch": 1838} {"train_loss": -5.962887763977051, "global_step": 77225, "epoch": 1838} {"train_loss": -6.076850891113281, "global_step": 77226, "epoch": 1838} {"train_loss": -6.055736064910889, "global_step": 77227, "epoch": 1838} {"train_loss": -6.060595512390137, "global_step": 77228, "epoch": 1838} {"train_loss": -5.929943561553955, "global_step": 77229, "epoch": 1838} {"train_loss": -5.95728063583374, "global_step": 77230, "epoch": 1838} {"train_loss": -6.044764041900635, "global_step": 77231, "epoch": 1838} {"train_loss": -6.159645080566406, "global_step": 77232, "epoch": 1838} {"train_loss": -5.987290859222412, "global_step": 77233, "epoch": 1838} {"train_loss": -6.0696258544921875, "global_step": 77234, "epoch": 1838} {"train_loss": -5.935520648956299, "global_step": 77235, "epoch": 1838} {"train_loss": -6.190879821777344, "global_step": 77236, "epoch": 1838} {"train_loss": -6.095723299753098, "global_step": 77237, "epoch": 1838, "val_loss": 67752.6328125} {"train_loss": -6.1708664894104, "global_step": 77238, "epoch": 1839} {"train_loss": -6.04831600189209, "global_step": 77239, "epoch": 1839} {"train_loss": -6.091226577758789, "global_step": 77240, "epoch": 1839} {"train_loss": -6.074339866638184, "global_step": 77241, "epoch": 1839} {"train_loss": -6.0709404945373535, "global_step": 77242, "epoch": 1839} {"train_loss": -6.117101669311523, "global_step": 77243, "epoch": 1839} {"train_loss": -6.060540199279785, "global_step": 77244, "epoch": 1839} {"train_loss": -6.261883735656738, "global_step": 77245, "epoch": 1839} {"train_loss": -6.018061637878418, "global_step": 77246, "epoch": 1839} {"train_loss": -6.025052070617676, "global_step": 77247, "epoch": 1839} {"train_loss": -6.125757694244385, "global_step": 77248, "epoch": 1839} {"train_loss": -6.027614116668701, "global_step": 77249, "epoch": 1839} {"train_loss": -6.118105888366699, "global_step": 77250, "epoch": 1839} {"train_loss": -6.0137810707092285, "global_step": 77251, "epoch": 1839} {"train_loss": -6.035945415496826, "global_step": 77252, "epoch": 1839} {"train_loss": -6.075754165649414, "global_step": 77253, "epoch": 1839} {"train_loss": -6.123965263366699, "global_step": 77254, "epoch": 1839} {"train_loss": -6.061221599578857, "global_step": 77255, "epoch": 1839} {"train_loss": -6.027201175689697, "global_step": 77256, "epoch": 1839} {"train_loss": -5.984862327575684, "global_step": 77257, "epoch": 1839} {"train_loss": -6.184171676635742, "global_step": 77258, "epoch": 1839} {"train_loss": -6.003226280212402, "global_step": 77259, "epoch": 1839} {"train_loss": -6.100730895996094, "global_step": 77260, "epoch": 1839} {"train_loss": -6.096388816833496, "global_step": 77261, "epoch": 1839} {"train_loss": -6.014497756958008, "global_step": 77262, "epoch": 1839} {"train_loss": -5.988642692565918, "global_step": 77263, "epoch": 1839} {"train_loss": -6.056122779846191, "global_step": 77264, "epoch": 1839} {"train_loss": -6.10225772857666, "global_step": 77265, "epoch": 1839} {"train_loss": -6.066271781921387, "global_step": 77266, "epoch": 1839} {"train_loss": -5.965104103088379, "global_step": 77267, "epoch": 1839} {"train_loss": -6.096565246582031, "global_step": 77268, "epoch": 1839} {"train_loss": -6.06223201751709, "global_step": 77269, "epoch": 1839} {"train_loss": -6.082783222198486, "global_step": 77270, "epoch": 1839} {"train_loss": -5.991131782531738, "global_step": 77271, "epoch": 1839} {"train_loss": -6.015185832977295, "global_step": 77272, "epoch": 1839} {"train_loss": -6.154272079467773, "global_step": 77273, "epoch": 1839} {"train_loss": -6.1119704246521, "global_step": 77274, "epoch": 1839} {"train_loss": -6.090412139892578, "global_step": 77275, "epoch": 1839} {"train_loss": -6.131710052490234, "global_step": 77276, "epoch": 1839} {"train_loss": -6.088675498962402, "global_step": 77277, "epoch": 1839} {"train_loss": -6.023700714111328, "global_step": 77278, "epoch": 1839} {"train_loss": -6.07456804457165, "global_step": 77279, "epoch": 1839, "val_loss": 67506.6640625} {"train_loss": -6.09848690032959, "global_step": 77280, "epoch": 1840} {"train_loss": -6.079444885253906, "global_step": 77281, "epoch": 1840} {"train_loss": -6.005510330200195, "global_step": 77282, "epoch": 1840} {"train_loss": -6.179107189178467, "global_step": 77283, "epoch": 1840} {"train_loss": -6.075229644775391, "global_step": 77284, "epoch": 1840} {"train_loss": -6.112872123718262, "global_step": 77285, "epoch": 1840} {"train_loss": -6.073397159576416, "global_step": 77286, "epoch": 1840} {"train_loss": -6.1280412673950195, "global_step": 77287, "epoch": 1840} {"train_loss": -6.106117248535156, "global_step": 77288, "epoch": 1840} {"train_loss": -6.056087017059326, "global_step": 77289, "epoch": 1840} {"train_loss": -6.119091510772705, "global_step": 77290, "epoch": 1840} {"train_loss": -6.073655128479004, "global_step": 77291, "epoch": 1840} {"train_loss": -6.038422584533691, "global_step": 77292, "epoch": 1840} {"train_loss": -6.135933876037598, "global_step": 77293, "epoch": 1840} {"train_loss": -6.1432108879089355, "global_step": 77294, "epoch": 1840} {"train_loss": -5.917971611022949, "global_step": 77295, "epoch": 1840} {"train_loss": -5.971601963043213, "global_step": 77296, "epoch": 1840} {"train_loss": -6.043262481689453, "global_step": 77297, "epoch": 1840} {"train_loss": -6.157261371612549, "global_step": 77298, "epoch": 1840} {"train_loss": -6.128108024597168, "global_step": 77299, "epoch": 1840} {"train_loss": -6.10042667388916, "global_step": 77300, "epoch": 1840} {"train_loss": -6.091533660888672, "global_step": 77301, "epoch": 1840} {"train_loss": -5.97107458114624, "global_step": 77302, "epoch": 1840} {"train_loss": -6.194176197052002, "global_step": 77303, "epoch": 1840} {"train_loss": -6.141869068145752, "global_step": 77304, "epoch": 1840} {"train_loss": -6.042829513549805, "global_step": 77305, "epoch": 1840} {"train_loss": -6.077208042144775, "global_step": 77306, "epoch": 1840} {"train_loss": -6.081707954406738, "global_step": 77307, "epoch": 1840} {"train_loss": -5.951718330383301, "global_step": 77308, "epoch": 1840} {"train_loss": -6.139656066894531, "global_step": 77309, "epoch": 1840} {"train_loss": -6.010719299316406, "global_step": 77310, "epoch": 1840} {"train_loss": -6.11122989654541, "global_step": 77311, "epoch": 1840} {"train_loss": -6.053476810455322, "global_step": 77312, "epoch": 1840} {"train_loss": -6.052532196044922, "global_step": 77313, "epoch": 1840} {"train_loss": -6.0220537185668945, "global_step": 77314, "epoch": 1840} {"train_loss": -6.123929023742676, "global_step": 77315, "epoch": 1840} {"train_loss": -6.004359245300293, "global_step": 77316, "epoch": 1840} {"train_loss": -6.001803874969482, "global_step": 77317, "epoch": 1840} {"train_loss": -6.188057899475098, "global_step": 77318, "epoch": 1840} {"train_loss": -6.086476802825928, "global_step": 77319, "epoch": 1840} {"train_loss": -6.02901554107666, "global_step": 77320, "epoch": 1840} {"train_loss": -6.07691562743414, "global_step": 77321, "epoch": 1840, "val_loss": 67564.375} {"train_loss": -6.030889987945557, "global_step": 77322, "epoch": 1841} {"train_loss": -5.996853828430176, "global_step": 77323, "epoch": 1841} {"train_loss": -6.174939155578613, "global_step": 77324, "epoch": 1841} {"train_loss": -6.018742561340332, "global_step": 77325, "epoch": 1841} {"train_loss": -6.07893180847168, "global_step": 77326, "epoch": 1841} {"train_loss": -6.024784088134766, "global_step": 77327, "epoch": 1841} {"train_loss": -6.159400939941406, "global_step": 77328, "epoch": 1841} {"train_loss": -6.088100433349609, "global_step": 77329, "epoch": 1841} {"train_loss": -6.054811000823975, "global_step": 77330, "epoch": 1841} {"train_loss": -6.088962554931641, "global_step": 77331, "epoch": 1841} {"train_loss": -6.143538951873779, "global_step": 77332, "epoch": 1841} {"train_loss": -6.048128604888916, "global_step": 77333, "epoch": 1841} {"train_loss": -6.185157775878906, "global_step": 77334, "epoch": 1841} {"train_loss": -6.079327583312988, "global_step": 77335, "epoch": 1841} {"train_loss": -6.095647811889648, "global_step": 77336, "epoch": 1841} {"train_loss": -6.023773193359375, "global_step": 77337, "epoch": 1841} {"train_loss": -6.076842308044434, "global_step": 77338, "epoch": 1841} {"train_loss": -6.074156761169434, "global_step": 77339, "epoch": 1841} {"train_loss": -6.062081336975098, "global_step": 77340, "epoch": 1841} {"train_loss": -5.987121105194092, "global_step": 77341, "epoch": 1841} {"train_loss": -6.137909412384033, "global_step": 77342, "epoch": 1841} {"train_loss": -5.955796241760254, "global_step": 77343, "epoch": 1841} {"train_loss": -6.106326580047607, "global_step": 77344, "epoch": 1841} {"train_loss": -5.986845016479492, "global_step": 77345, "epoch": 1841} {"train_loss": -6.018429756164551, "global_step": 77346, "epoch": 1841} {"train_loss": -6.05623722076416, "global_step": 77347, "epoch": 1841} {"train_loss": -5.920168399810791, "global_step": 77348, "epoch": 1841} {"train_loss": -6.10544490814209, "global_step": 77349, "epoch": 1841} {"train_loss": -5.962482452392578, "global_step": 77350, "epoch": 1841} {"train_loss": -6.05914831161499, "global_step": 77351, "epoch": 1841} {"train_loss": -5.911567211151123, "global_step": 77352, "epoch": 1841} {"train_loss": -6.093441009521484, "global_step": 77353, "epoch": 1841} {"train_loss": -6.004759311676025, "global_step": 77354, "epoch": 1841} {"train_loss": -6.04164457321167, "global_step": 77355, "epoch": 1841} {"train_loss": -5.997854232788086, "global_step": 77356, "epoch": 1841} {"train_loss": -6.059701442718506, "global_step": 77357, "epoch": 1841} {"train_loss": -6.02200174331665, "global_step": 77358, "epoch": 1841} {"train_loss": -6.070589065551758, "global_step": 77359, "epoch": 1841} {"train_loss": -5.973606109619141, "global_step": 77360, "epoch": 1841} {"train_loss": -5.999803066253662, "global_step": 77361, "epoch": 1841} {"train_loss": -6.083559989929199, "global_step": 77362, "epoch": 1841} {"train_loss": -6.050136452629452, "global_step": 77363, "epoch": 1841, "val_loss": 67466.84375} {"train_loss": -6.065821170806885, "global_step": 77364, "epoch": 1842} {"train_loss": -6.038626194000244, "global_step": 77365, "epoch": 1842} {"train_loss": -6.159293174743652, "global_step": 77366, "epoch": 1842} {"train_loss": -6.158029556274414, "global_step": 77367, "epoch": 1842} {"train_loss": -6.13489294052124, "global_step": 77368, "epoch": 1842} {"train_loss": -6.144721031188965, "global_step": 77369, "epoch": 1842} {"train_loss": -6.191671371459961, "global_step": 77370, "epoch": 1842} {"train_loss": -6.049078941345215, "global_step": 77371, "epoch": 1842} {"train_loss": -5.977542877197266, "global_step": 77372, "epoch": 1842} {"train_loss": -6.200688362121582, "global_step": 77373, "epoch": 1842} {"train_loss": -6.083071708679199, "global_step": 77374, "epoch": 1842} {"train_loss": -6.137022972106934, "global_step": 77375, "epoch": 1842} {"train_loss": -6.188831806182861, "global_step": 77376, "epoch": 1842} {"train_loss": -6.075047492980957, "global_step": 77377, "epoch": 1842} {"train_loss": -6.022818565368652, "global_step": 77378, "epoch": 1842} {"train_loss": -6.119238376617432, "global_step": 77379, "epoch": 1842} {"train_loss": -6.191476821899414, "global_step": 77380, "epoch": 1842} {"train_loss": -6.098682403564453, "global_step": 77381, "epoch": 1842} {"train_loss": -6.01071310043335, "global_step": 77382, "epoch": 1842} {"train_loss": -6.127191543579102, "global_step": 77383, "epoch": 1842} {"train_loss": -6.09890079498291, "global_step": 77384, "epoch": 1842} {"train_loss": -6.02127742767334, "global_step": 77385, "epoch": 1842} {"train_loss": -6.108208179473877, "global_step": 77386, "epoch": 1842} {"train_loss": -6.233400344848633, "global_step": 77387, "epoch": 1842} {"train_loss": -6.051886558532715, "global_step": 77388, "epoch": 1842} {"train_loss": -6.140594482421875, "global_step": 77389, "epoch": 1842} {"train_loss": -6.060947418212891, "global_step": 77390, "epoch": 1842} {"train_loss": -6.026411056518555, "global_step": 77391, "epoch": 1842} {"train_loss": -6.094667434692383, "global_step": 77392, "epoch": 1842} {"train_loss": -6.139863967895508, "global_step": 77393, "epoch": 1842} {"train_loss": -6.18061637878418, "global_step": 77394, "epoch": 1842} {"train_loss": -6.179190635681152, "global_step": 77395, "epoch": 1842} {"train_loss": -6.2337446212768555, "global_step": 77396, "epoch": 1842} {"train_loss": -6.131521701812744, "global_step": 77397, "epoch": 1842} {"train_loss": -5.98089599609375, "global_step": 77398, "epoch": 1842} {"train_loss": -6.175646781921387, "global_step": 77399, "epoch": 1842} {"train_loss": -6.107666969299316, "global_step": 77400, "epoch": 1842} {"train_loss": -6.216798782348633, "global_step": 77401, "epoch": 1842} {"train_loss": -6.134011745452881, "global_step": 77402, "epoch": 1842} {"train_loss": -6.026595592498779, "global_step": 77403, "epoch": 1842} {"train_loss": -6.132682800292969, "global_step": 77404, "epoch": 1842} {"train_loss": -6.116702533903576, "global_step": 77405, "epoch": 1842, "val_loss": 67623.8125} {"train_loss": -6.1093668937683105, "global_step": 77406, "epoch": 1843} {"train_loss": -6.155850410461426, "global_step": 77407, "epoch": 1843} {"train_loss": -6.055736064910889, "global_step": 77408, "epoch": 1843} {"train_loss": -6.107394218444824, "global_step": 77409, "epoch": 1843} {"train_loss": -6.103557109832764, "global_step": 77410, "epoch": 1843} {"train_loss": -6.070549011230469, "global_step": 77411, "epoch": 1843} {"train_loss": -6.063422679901123, "global_step": 77412, "epoch": 1843} {"train_loss": -6.071115016937256, "global_step": 77413, "epoch": 1843} {"train_loss": -6.050500392913818, "global_step": 77414, "epoch": 1843} {"train_loss": -6.066690444946289, "global_step": 77415, "epoch": 1843} {"train_loss": -6.160381317138672, "global_step": 77416, "epoch": 1843} {"train_loss": -6.129578590393066, "global_step": 77417, "epoch": 1843} {"train_loss": -6.11224889755249, "global_step": 77418, "epoch": 1843} {"train_loss": -6.095306396484375, "global_step": 77419, "epoch": 1843} {"train_loss": -6.10153865814209, "global_step": 77420, "epoch": 1843} {"train_loss": -6.08432674407959, "global_step": 77421, "epoch": 1843} {"train_loss": -6.047165870666504, "global_step": 77422, "epoch": 1843} {"train_loss": -6.063104629516602, "global_step": 77423, "epoch": 1843} {"train_loss": -6.077962875366211, "global_step": 77424, "epoch": 1843} {"train_loss": -6.013611793518066, "global_step": 77425, "epoch": 1843} {"train_loss": -6.053530216217041, "global_step": 77426, "epoch": 1843} {"train_loss": -6.006739139556885, "global_step": 77427, "epoch": 1843} {"train_loss": -5.998146057128906, "global_step": 77428, "epoch": 1843} {"train_loss": -5.937410354614258, "global_step": 77429, "epoch": 1843} {"train_loss": -6.1050615310668945, "global_step": 77430, "epoch": 1843} {"train_loss": -6.071467399597168, "global_step": 77431, "epoch": 1843} {"train_loss": -5.93896484375, "global_step": 77432, "epoch": 1843} {"train_loss": -6.046905517578125, "global_step": 77433, "epoch": 1843} {"train_loss": -5.936000823974609, "global_step": 77434, "epoch": 1843} {"train_loss": -6.103626251220703, "global_step": 77435, "epoch": 1843} {"train_loss": -6.050837993621826, "global_step": 77436, "epoch": 1843} {"train_loss": -5.849369049072266, "global_step": 77437, "epoch": 1843} {"train_loss": -6.151402473449707, "global_step": 77438, "epoch": 1843} {"train_loss": -6.013869285583496, "global_step": 77439, "epoch": 1843} {"train_loss": -6.058173179626465, "global_step": 77440, "epoch": 1843} {"train_loss": -6.092228412628174, "global_step": 77441, "epoch": 1843} {"train_loss": -5.992093563079834, "global_step": 77442, "epoch": 1843} {"train_loss": -6.072290420532227, "global_step": 77443, "epoch": 1843} {"train_loss": -6.049223899841309, "global_step": 77444, "epoch": 1843} {"train_loss": -5.966371059417725, "global_step": 77445, "epoch": 1843} {"train_loss": -5.955150604248047, "global_step": 77446, "epoch": 1843} {"train_loss": -6.05434961546035, "global_step": 77447, "epoch": 1843, "val_loss": 67752.15625} {"train_loss": -5.88444185256958, "global_step": 77448, "epoch": 1844} {"train_loss": -6.177934646606445, "global_step": 77449, "epoch": 1844} {"train_loss": -6.079771041870117, "global_step": 77450, "epoch": 1844} {"train_loss": -6.08793830871582, "global_step": 77451, "epoch": 1844} {"train_loss": -6.090694904327393, "global_step": 77452, "epoch": 1844} {"train_loss": -6.0655670166015625, "global_step": 77453, "epoch": 1844} {"train_loss": -6.102829933166504, "global_step": 77454, "epoch": 1844} {"train_loss": -6.102449893951416, "global_step": 77455, "epoch": 1844} {"train_loss": -6.106008052825928, "global_step": 77456, "epoch": 1844} {"train_loss": -6.091485977172852, "global_step": 77457, "epoch": 1844} {"train_loss": -6.093238830566406, "global_step": 77458, "epoch": 1844} {"train_loss": -6.122557640075684, "global_step": 77459, "epoch": 1844} {"train_loss": -6.025149345397949, "global_step": 77460, "epoch": 1844} {"train_loss": -6.057106971740723, "global_step": 77461, "epoch": 1844} {"train_loss": -5.8689446449279785, "global_step": 77462, "epoch": 1844} {"train_loss": -6.086128234863281, "global_step": 77463, "epoch": 1844} {"train_loss": -6.039438724517822, "global_step": 77464, "epoch": 1844} {"train_loss": -5.930570602416992, "global_step": 77465, "epoch": 1844} {"train_loss": -6.09938383102417, "global_step": 77466, "epoch": 1844} {"train_loss": -6.048358917236328, "global_step": 77467, "epoch": 1844} {"train_loss": -6.003757476806641, "global_step": 77468, "epoch": 1844} {"train_loss": -6.038122653961182, "global_step": 77469, "epoch": 1844} {"train_loss": -5.893959999084473, "global_step": 77470, "epoch": 1844} {"train_loss": -6.119772434234619, "global_step": 77471, "epoch": 1844} {"train_loss": -5.981447219848633, "global_step": 77472, "epoch": 1844} {"train_loss": -6.133903503417969, "global_step": 77473, "epoch": 1844} {"train_loss": -6.077888488769531, "global_step": 77474, "epoch": 1844} {"train_loss": -6.040791034698486, "global_step": 77475, "epoch": 1844} {"train_loss": -6.137536525726318, "global_step": 77476, "epoch": 1844} {"train_loss": -6.1075897216796875, "global_step": 77477, "epoch": 1844} {"train_loss": -6.054567813873291, "global_step": 77478, "epoch": 1844} {"train_loss": -6.110915184020996, "global_step": 77479, "epoch": 1844} {"train_loss": -6.216604232788086, "global_step": 77480, "epoch": 1844} {"train_loss": -5.975074768066406, "global_step": 77481, "epoch": 1844} {"train_loss": -6.14836311340332, "global_step": 77482, "epoch": 1844} {"train_loss": -6.099428653717041, "global_step": 77483, "epoch": 1844} {"train_loss": -6.11285924911499, "global_step": 77484, "epoch": 1844} {"train_loss": -6.088998317718506, "global_step": 77485, "epoch": 1844} {"train_loss": -6.093497276306152, "global_step": 77486, "epoch": 1844} {"train_loss": -6.149913311004639, "global_step": 77487, "epoch": 1844} {"train_loss": -6.032047271728516, "global_step": 77488, "epoch": 1844} {"train_loss": -6.071038393747239, "global_step": 77489, "epoch": 1844, "val_loss": 67644.6015625} {"train_loss": -6.175390243530273, "global_step": 77490, "epoch": 1845} {"train_loss": -6.129657745361328, "global_step": 77491, "epoch": 1845} {"train_loss": -5.971149444580078, "global_step": 77492, "epoch": 1845} {"train_loss": -6.065075397491455, "global_step": 77493, "epoch": 1845} {"train_loss": -5.941751480102539, "global_step": 77494, "epoch": 1845} {"train_loss": -6.116308689117432, "global_step": 77495, "epoch": 1845} {"train_loss": -6.066955089569092, "global_step": 77496, "epoch": 1845} {"train_loss": -6.108682155609131, "global_step": 77497, "epoch": 1845} {"train_loss": -6.078586101531982, "global_step": 77498, "epoch": 1845} {"train_loss": -6.121664524078369, "global_step": 77499, "epoch": 1845} {"train_loss": -6.260677337646484, "global_step": 77500, "epoch": 1845} {"train_loss": -6.01336669921875, "global_step": 77501, "epoch": 1845} {"train_loss": -6.123290061950684, "global_step": 77502, "epoch": 1845} {"train_loss": -6.0702667236328125, "global_step": 77503, "epoch": 1845} {"train_loss": -6.066355228424072, "global_step": 77504, "epoch": 1845} {"train_loss": -6.18008279800415, "global_step": 77505, "epoch": 1845} {"train_loss": -6.174897193908691, "global_step": 77506, "epoch": 1845} {"train_loss": -6.073762893676758, "global_step": 77507, "epoch": 1845} {"train_loss": -6.148469924926758, "global_step": 77508, "epoch": 1845} {"train_loss": -6.08902645111084, "global_step": 77509, "epoch": 1845} {"train_loss": -6.02394437789917, "global_step": 77510, "epoch": 1845} {"train_loss": -6.1420087814331055, "global_step": 77511, "epoch": 1845} {"train_loss": -6.053099155426025, "global_step": 77512, "epoch": 1845} {"train_loss": -6.000731468200684, "global_step": 77513, "epoch": 1845} {"train_loss": -6.069096088409424, "global_step": 77514, "epoch": 1845} {"train_loss": -6.136348724365234, "global_step": 77515, "epoch": 1845} {"train_loss": -6.120781898498535, "global_step": 77516, "epoch": 1845} {"train_loss": -6.218605995178223, "global_step": 77517, "epoch": 1845} {"train_loss": -6.172600269317627, "global_step": 77518, "epoch": 1845} {"train_loss": -6.062191963195801, "global_step": 77519, "epoch": 1845} {"train_loss": -6.312966346740723, "global_step": 77520, "epoch": 1845} {"train_loss": -6.163141250610352, "global_step": 77521, "epoch": 1845} {"train_loss": -6.12360143661499, "global_step": 77522, "epoch": 1845} {"train_loss": -6.242431640625, "global_step": 77523, "epoch": 1845} {"train_loss": -6.041945457458496, "global_step": 77524, "epoch": 1845} {"train_loss": -6.195186138153076, "global_step": 77525, "epoch": 1845} {"train_loss": -6.152339935302734, "global_step": 77526, "epoch": 1845} {"train_loss": -6.000142574310303, "global_step": 77527, "epoch": 1845} {"train_loss": -6.161219596862793, "global_step": 77528, "epoch": 1845} {"train_loss": -6.264618396759033, "global_step": 77529, "epoch": 1845} {"train_loss": -6.11941385269165, "global_step": 77530, "epoch": 1845} {"train_loss": -6.1144543034689764, "global_step": 77531, "epoch": 1845, "val_loss": 67559.8046875} {"train_loss": -6.090128421783447, "global_step": 77532, "epoch": 1846} {"train_loss": -6.059918403625488, "global_step": 77533, "epoch": 1846} {"train_loss": -6.094116687774658, "global_step": 77534, "epoch": 1846} {"train_loss": -6.067618370056152, "global_step": 77535, "epoch": 1846} {"train_loss": -6.063005447387695, "global_step": 77536, "epoch": 1846} {"train_loss": -6.098608016967773, "global_step": 77537, "epoch": 1846} {"train_loss": -6.208174705505371, "global_step": 77538, "epoch": 1846} {"train_loss": -6.14724063873291, "global_step": 77539, "epoch": 1846} {"train_loss": -6.25834846496582, "global_step": 77540, "epoch": 1846} {"train_loss": -6.088617324829102, "global_step": 77541, "epoch": 1846} {"train_loss": -6.164809703826904, "global_step": 77542, "epoch": 1846} {"train_loss": -6.045262813568115, "global_step": 77543, "epoch": 1846} {"train_loss": -6.089734077453613, "global_step": 77544, "epoch": 1846} {"train_loss": -6.10736608505249, "global_step": 77545, "epoch": 1846} {"train_loss": -5.971684455871582, "global_step": 77546, "epoch": 1846} {"train_loss": -6.200469017028809, "global_step": 77547, "epoch": 1846} {"train_loss": -6.085026741027832, "global_step": 77548, "epoch": 1846} {"train_loss": -6.1458539962768555, "global_step": 77549, "epoch": 1846} {"train_loss": -6.127627849578857, "global_step": 77550, "epoch": 1846} {"train_loss": -6.057967185974121, "global_step": 77551, "epoch": 1846} {"train_loss": -6.077001571655273, "global_step": 77552, "epoch": 1846} {"train_loss": -6.0189971923828125, "global_step": 77553, "epoch": 1846} {"train_loss": -6.258819580078125, "global_step": 77554, "epoch": 1846} {"train_loss": -6.138960361480713, "global_step": 77555, "epoch": 1846} {"train_loss": -6.049612998962402, "global_step": 77556, "epoch": 1846} {"train_loss": -6.078006267547607, "global_step": 77557, "epoch": 1846} {"train_loss": -5.997053146362305, "global_step": 77558, "epoch": 1846} {"train_loss": -5.949281692504883, "global_step": 77559, "epoch": 1846} {"train_loss": -6.046731948852539, "global_step": 77560, "epoch": 1846} {"train_loss": -6.149697303771973, "global_step": 77561, "epoch": 1846} {"train_loss": -5.97895622253418, "global_step": 77562, "epoch": 1846} {"train_loss": -6.102202415466309, "global_step": 77563, "epoch": 1846} {"train_loss": -6.066816806793213, "global_step": 77564, "epoch": 1846} {"train_loss": -6.075160980224609, "global_step": 77565, "epoch": 1846} {"train_loss": -6.067440032958984, "global_step": 77566, "epoch": 1846} {"train_loss": -6.025432586669922, "global_step": 77567, "epoch": 1846} {"train_loss": -5.926557540893555, "global_step": 77568, "epoch": 1846} {"train_loss": -6.025575637817383, "global_step": 77569, "epoch": 1846} {"train_loss": -5.984187602996826, "global_step": 77570, "epoch": 1846} {"train_loss": -5.956640243530273, "global_step": 77571, "epoch": 1846} {"train_loss": -6.077445983886719, "global_step": 77572, "epoch": 1846} {"train_loss": -6.0799071334657215, "global_step": 77573, "epoch": 1846, "val_loss": 67653.578125} {"train_loss": -6.1805620193481445, "global_step": 77574, "epoch": 1847} {"train_loss": -5.9469404220581055, "global_step": 77575, "epoch": 1847} {"train_loss": -6.155914306640625, "global_step": 77576, "epoch": 1847} {"train_loss": -6.168691635131836, "global_step": 77577, "epoch": 1847} {"train_loss": -6.136802673339844, "global_step": 77578, "epoch": 1847} {"train_loss": -6.050498962402344, "global_step": 77579, "epoch": 1847} {"train_loss": -6.2038774490356445, "global_step": 77580, "epoch": 1847} {"train_loss": -6.16147518157959, "global_step": 77581, "epoch": 1847} {"train_loss": -5.984000205993652, "global_step": 77582, "epoch": 1847} {"train_loss": -6.159221649169922, "global_step": 77583, "epoch": 1847} {"train_loss": -6.074807167053223, "global_step": 77584, "epoch": 1847} {"train_loss": -6.032757759094238, "global_step": 77585, "epoch": 1847} {"train_loss": -6.128968238830566, "global_step": 77586, "epoch": 1847} {"train_loss": -6.00556755065918, "global_step": 77587, "epoch": 1847} {"train_loss": -6.080577850341797, "global_step": 77588, "epoch": 1847} {"train_loss": -6.026204586029053, "global_step": 77589, "epoch": 1847} {"train_loss": -6.1074137687683105, "global_step": 77590, "epoch": 1847} {"train_loss": -6.040689945220947, "global_step": 77591, "epoch": 1847} {"train_loss": -5.86812162399292, "global_step": 77592, "epoch": 1847} {"train_loss": -6.033240795135498, "global_step": 77593, "epoch": 1847} {"train_loss": -6.108124256134033, "global_step": 77594, "epoch": 1847} {"train_loss": -5.984108924865723, "global_step": 77595, "epoch": 1847} {"train_loss": -5.999271392822266, "global_step": 77596, "epoch": 1847} {"train_loss": -6.117162227630615, "global_step": 77597, "epoch": 1847} {"train_loss": -6.042844772338867, "global_step": 77598, "epoch": 1847} {"train_loss": -6.185077667236328, "global_step": 77599, "epoch": 1847} {"train_loss": -6.11509895324707, "global_step": 77600, "epoch": 1847} {"train_loss": -6.218639373779297, "global_step": 77601, "epoch": 1847} {"train_loss": -6.139139175415039, "global_step": 77602, "epoch": 1847} {"train_loss": -6.137571334838867, "global_step": 77603, "epoch": 1847} {"train_loss": -6.209817886352539, "global_step": 77604, "epoch": 1847} {"train_loss": -6.105093002319336, "global_step": 77605, "epoch": 1847} {"train_loss": -6.096161365509033, "global_step": 77606, "epoch": 1847} {"train_loss": -6.083465576171875, "global_step": 77607, "epoch": 1847} {"train_loss": -6.073197364807129, "global_step": 77608, "epoch": 1847} {"train_loss": -6.109073162078857, "global_step": 77609, "epoch": 1847} {"train_loss": -5.9633684158325195, "global_step": 77610, "epoch": 1847} {"train_loss": -6.0358757972717285, "global_step": 77611, "epoch": 1847} {"train_loss": -6.077656269073486, "global_step": 77612, "epoch": 1847} {"train_loss": -5.905613422393799, "global_step": 77613, "epoch": 1847} {"train_loss": -6.006134033203125, "global_step": 77614, "epoch": 1847} {"train_loss": -6.078400214513143, "global_step": 77615, "epoch": 1847, "val_loss": 67849.09375} {"train_loss": -5.9947357177734375, "global_step": 77616, "epoch": 1848} {"train_loss": -5.979248046875, "global_step": 77617, "epoch": 1848} {"train_loss": -6.014476776123047, "global_step": 77618, "epoch": 1848} {"train_loss": -6.032151222229004, "global_step": 77619, "epoch": 1848} {"train_loss": -6.077448844909668, "global_step": 77620, "epoch": 1848} {"train_loss": -6.087895393371582, "global_step": 77621, "epoch": 1848} {"train_loss": -6.05662202835083, "global_step": 77622, "epoch": 1848} {"train_loss": -6.105137825012207, "global_step": 77623, "epoch": 1848} {"train_loss": -6.034564018249512, "global_step": 77624, "epoch": 1848} {"train_loss": -6.153210639953613, "global_step": 77625, "epoch": 1848} {"train_loss": -6.031594276428223, "global_step": 77626, "epoch": 1848} {"train_loss": -6.117646217346191, "global_step": 77627, "epoch": 1848} {"train_loss": -6.135746002197266, "global_step": 77628, "epoch": 1848} {"train_loss": -6.012160778045654, "global_step": 77629, "epoch": 1848} {"train_loss": -6.138390064239502, "global_step": 77630, "epoch": 1848} {"train_loss": -6.144835948944092, "global_step": 77631, "epoch": 1848} {"train_loss": -6.082681179046631, "global_step": 77632, "epoch": 1848} {"train_loss": -5.9757585525512695, "global_step": 77633, "epoch": 1848} {"train_loss": -6.102237224578857, "global_step": 77634, "epoch": 1848} {"train_loss": -6.08697509765625, "global_step": 77635, "epoch": 1848} {"train_loss": -6.173018455505371, "global_step": 77636, "epoch": 1848} {"train_loss": -6.094472408294678, "global_step": 77637, "epoch": 1848} {"train_loss": -6.099117279052734, "global_step": 77638, "epoch": 1848} {"train_loss": -6.067966938018799, "global_step": 77639, "epoch": 1848} {"train_loss": -6.036864757537842, "global_step": 77640, "epoch": 1848} {"train_loss": -6.091826438903809, "global_step": 77641, "epoch": 1848} {"train_loss": -6.142934322357178, "global_step": 77642, "epoch": 1848} {"train_loss": -6.112793445587158, "global_step": 77643, "epoch": 1848} {"train_loss": -6.1954426765441895, "global_step": 77644, "epoch": 1848} {"train_loss": -6.0920233726501465, "global_step": 77645, "epoch": 1848} {"train_loss": -6.199446678161621, "global_step": 77646, "epoch": 1848} {"train_loss": -6.041925430297852, "global_step": 77647, "epoch": 1848} {"train_loss": -6.167608261108398, "global_step": 77648, "epoch": 1848} {"train_loss": -6.063407897949219, "global_step": 77649, "epoch": 1848} {"train_loss": -6.123355865478516, "global_step": 77650, "epoch": 1848} {"train_loss": -6.259777069091797, "global_step": 77651, "epoch": 1848} {"train_loss": -6.046009063720703, "global_step": 77652, "epoch": 1848} {"train_loss": -6.084889888763428, "global_step": 77653, "epoch": 1848} {"train_loss": -6.074362277984619, "global_step": 77654, "epoch": 1848} {"train_loss": -5.99544620513916, "global_step": 77655, "epoch": 1848} {"train_loss": -6.090880393981934, "global_step": 77656, "epoch": 1848} {"train_loss": -6.0898296265375045, "global_step": 77657, "epoch": 1848, "val_loss": 67597.2890625} {"train_loss": -5.935696601867676, "global_step": 77658, "epoch": 1849} {"train_loss": -6.072565078735352, "global_step": 77659, "epoch": 1849} {"train_loss": -5.963359355926514, "global_step": 77660, "epoch": 1849} {"train_loss": -6.169978141784668, "global_step": 77661, "epoch": 1849} {"train_loss": -6.088495254516602, "global_step": 77662, "epoch": 1849} {"train_loss": -6.048859596252441, "global_step": 77663, "epoch": 1849} {"train_loss": -6.057380676269531, "global_step": 77664, "epoch": 1849} {"train_loss": -6.0156636238098145, "global_step": 77665, "epoch": 1849} {"train_loss": -5.969320297241211, "global_step": 77666, "epoch": 1849} {"train_loss": -5.988893985748291, "global_step": 77667, "epoch": 1849} {"train_loss": -5.981653213500977, "global_step": 77668, "epoch": 1849} {"train_loss": -6.119413375854492, "global_step": 77669, "epoch": 1849} {"train_loss": -6.110536098480225, "global_step": 77670, "epoch": 1849} {"train_loss": -6.108584403991699, "global_step": 77671, "epoch": 1849} {"train_loss": -6.107028007507324, "global_step": 77672, "epoch": 1849} {"train_loss": -6.048859596252441, "global_step": 77673, "epoch": 1849} {"train_loss": -5.984509468078613, "global_step": 77674, "epoch": 1849} {"train_loss": -6.126945972442627, "global_step": 77675, "epoch": 1849} {"train_loss": -6.021240711212158, "global_step": 77676, "epoch": 1849} {"train_loss": -6.203728675842285, "global_step": 77677, "epoch": 1849} {"train_loss": -6.213201522827148, "global_step": 77678, "epoch": 1849} {"train_loss": -6.051652431488037, "global_step": 77679, "epoch": 1849} {"train_loss": -6.135743141174316, "global_step": 77680, "epoch": 1849} {"train_loss": -6.015490531921387, "global_step": 77681, "epoch": 1849} {"train_loss": -6.197931289672852, "global_step": 77682, "epoch": 1849} {"train_loss": -6.1088032722473145, "global_step": 77683, "epoch": 1849} {"train_loss": -6.071887016296387, "global_step": 77684, "epoch": 1849} {"train_loss": -6.12635612487793, "global_step": 77685, "epoch": 1849} {"train_loss": -6.183589935302734, "global_step": 77686, "epoch": 1849} {"train_loss": -6.098115921020508, "global_step": 77687, "epoch": 1849} {"train_loss": -6.174004554748535, "global_step": 77688, "epoch": 1849} {"train_loss": -6.056613922119141, "global_step": 77689, "epoch": 1849} {"train_loss": -6.054942607879639, "global_step": 77690, "epoch": 1849} {"train_loss": -6.188539505004883, "global_step": 77691, "epoch": 1849} {"train_loss": -6.144451141357422, "global_step": 77692, "epoch": 1849} {"train_loss": -6.1272735595703125, "global_step": 77693, "epoch": 1849} {"train_loss": -5.978366851806641, "global_step": 77694, "epoch": 1849} {"train_loss": -6.17423152923584, "global_step": 77695, "epoch": 1849} {"train_loss": -6.1667070388793945, "global_step": 77696, "epoch": 1849} {"train_loss": -6.038527488708496, "global_step": 77697, "epoch": 1849} {"train_loss": -6.120616912841797, "global_step": 77698, "epoch": 1849} {"train_loss": -6.08534794762021, "global_step": 77699, "epoch": 1849, "val_loss": 67572.9609375} {"train_loss": -6.094871997833252, "global_step": 77700, "epoch": 1850} {"train_loss": -6.0348310470581055, "global_step": 77701, "epoch": 1850} {"train_loss": -6.075615882873535, "global_step": 77702, "epoch": 1850} {"train_loss": -6.046540260314941, "global_step": 77703, "epoch": 1850} {"train_loss": -6.124520301818848, "global_step": 77704, "epoch": 1850} {"train_loss": -6.064422607421875, "global_step": 77705, "epoch": 1850} {"train_loss": -6.160891532897949, "global_step": 77706, "epoch": 1850} {"train_loss": -6.053692817687988, "global_step": 77707, "epoch": 1850} {"train_loss": -6.158425331115723, "global_step": 77708, "epoch": 1850} {"train_loss": -6.1409807205200195, "global_step": 77709, "epoch": 1850} {"train_loss": -6.090632438659668, "global_step": 77710, "epoch": 1850} {"train_loss": -6.152801990509033, "global_step": 77711, "epoch": 1850} {"train_loss": -6.050140380859375, "global_step": 77712, "epoch": 1850} {"train_loss": -6.235616683959961, "global_step": 77713, "epoch": 1850} {"train_loss": -6.2252421379089355, "global_step": 77714, "epoch": 1850} {"train_loss": -6.124881267547607, "global_step": 77715, "epoch": 1850} {"train_loss": -5.938356876373291, "global_step": 77716, "epoch": 1850} {"train_loss": -6.138488292694092, "global_step": 77717, "epoch": 1850} {"train_loss": -5.946076393127441, "global_step": 77718, "epoch": 1850} {"train_loss": -6.063507556915283, "global_step": 77719, "epoch": 1850} {"train_loss": -6.04973030090332, "global_step": 77720, "epoch": 1850} {"train_loss": -6.140908718109131, "global_step": 77721, "epoch": 1850} {"train_loss": -6.257607460021973, "global_step": 77722, "epoch": 1850} {"train_loss": -6.072569847106934, "global_step": 77723, "epoch": 1850} {"train_loss": -6.156529426574707, "global_step": 77724, "epoch": 1850} {"train_loss": -6.0455169677734375, "global_step": 77725, "epoch": 1850} {"train_loss": -6.1566009521484375, "global_step": 77726, "epoch": 1850} {"train_loss": -5.955814838409424, "global_step": 77727, "epoch": 1850} {"train_loss": -6.065610885620117, "global_step": 77728, "epoch": 1850} {"train_loss": -6.125029563903809, "global_step": 77729, "epoch": 1850} {"train_loss": -5.816315174102783, "global_step": 77730, "epoch": 1850} {"train_loss": -6.048084259033203, "global_step": 77731, "epoch": 1850} {"train_loss": -6.017135143280029, "global_step": 77732, "epoch": 1850} {"train_loss": -6.026472568511963, "global_step": 77733, "epoch": 1850} {"train_loss": -6.01650333404541, "global_step": 77734, "epoch": 1850} {"train_loss": -6.067169189453125, "global_step": 77735, "epoch": 1850} {"train_loss": -6.067434310913086, "global_step": 77736, "epoch": 1850} {"train_loss": -6.004008769989014, "global_step": 77737, "epoch": 1850} {"train_loss": -6.035164833068848, "global_step": 77738, "epoch": 1850} {"train_loss": -6.0427398681640625, "global_step": 77739, "epoch": 1850} {"train_loss": -6.095479965209961, "global_step": 77740, "epoch": 1850} {"train_loss": -6.083122253417969, "global_step": 77741, "epoch": 1850, "train/sim_max_reward_0": 0.21599447266501262, "train/sim_max_reward_1": 0.7223581546973556, "train/sim_max_reward_2": 0.47585595951967125, "train/sim_max_reward_3": 0.14646411243656965, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9626928079355727, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.20021182993282965, "test/sim_max_reward_4400002": 0.4187466446770761, "test/sim_max_reward_4400003": 0.9895483413745373, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3164506594283215, "test/sim_max_reward_4400006": 0.5109052824894802, "test/sim_max_reward_4400007": 0.007419670135059107, "test/sim_max_reward_4400008": 0.3261306389606873, "test/sim_max_reward_4400009": 0.4646336630442201, "test/sim_max_reward_4400010": 0.22698895596696192, "test/sim_max_reward_4400011": 0.20283430571927738, "test/sim_max_reward_4400012": 0.9751146580372799, "test/sim_max_reward_4400013": 0.9387072772323798, "test/sim_max_reward_4400014": 0.615453584829781, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.22861000837545414, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23558661312112172, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.7181699079435521, "test/sim_max_reward_4400022": 0.8384213218696404, "test/sim_max_reward_4400023": 0.09217511073980779, "test/sim_max_reward_4400024": 0.490666126164888, "test/sim_max_reward_4400025": 0.24287700689259964, "test/sim_max_reward_4400026": 0.9441629700616494, "test/sim_max_reward_4400027": 0.002032499822660275, "test/sim_max_reward_4400028": 0.7354713274465254, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.7682110310357566, "test/sim_max_reward_4400031": 0.8010866354681807, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.4881297269998424, "test/sim_max_reward_4400034": 0.9088724417173698, "test/sim_max_reward_4400035": 0.45221050239199284, "test/sim_max_reward_4400036": 0.3555549535052343, "test/sim_max_reward_4400037": 0.8996911273953523, "test/sim_max_reward_4400038": 0.9315703073026714, "test/sim_max_reward_4400039": 0.9295186961381748, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.635588179906704, "test/sim_max_reward_4400043": 0.7791622631293937, "test/sim_max_reward_4400044": 0.9662084176465378, "test/sim_max_reward_4400045": 0.933378269054419, "test/sim_max_reward_4400046": 0.7714743237852059, "test/sim_max_reward_4400047": 0.896702766923232, "test/sim_max_reward_4400048": 0.9199389868110367, "test/sim_max_reward_4400049": 0.8058747369691479, "train/mean_score": 0.5872275845423637, "test/mean_score": 0.522716997025451, "val_loss": 67710.4609375} {"train_loss": -6.151543140411377, "global_step": 77742, "epoch": 1851} {"train_loss": -6.205147743225098, "global_step": 77743, "epoch": 1851} {"train_loss": -6.228981971740723, "global_step": 77744, "epoch": 1851} {"train_loss": -6.064493179321289, "global_step": 77745, "epoch": 1851} {"train_loss": -6.138206958770752, "global_step": 77746, "epoch": 1851} {"train_loss": -6.084878444671631, "global_step": 77747, "epoch": 1851} {"train_loss": -5.989961624145508, "global_step": 77748, "epoch": 1851} {"train_loss": -6.02971076965332, "global_step": 77749, "epoch": 1851} {"train_loss": -6.067115783691406, "global_step": 77750, "epoch": 1851} {"train_loss": -5.929052352905273, "global_step": 77751, "epoch": 1851} {"train_loss": -6.089105129241943, "global_step": 77752, "epoch": 1851} {"train_loss": -5.978960037231445, "global_step": 77753, "epoch": 1851} {"train_loss": -6.038521766662598, "global_step": 77754, "epoch": 1851} {"train_loss": -6.0991435050964355, "global_step": 77755, "epoch": 1851} {"train_loss": -6.140125274658203, "global_step": 77756, "epoch": 1851} {"train_loss": -6.101693153381348, "global_step": 77757, "epoch": 1851} {"train_loss": -6.104500770568848, "global_step": 77758, "epoch": 1851} {"train_loss": -6.146989822387695, "global_step": 77759, "epoch": 1851} {"train_loss": -6.092113494873047, "global_step": 77760, "epoch": 1851} {"train_loss": -6.158819198608398, "global_step": 77761, "epoch": 1851} {"train_loss": -6.113033294677734, "global_step": 77762, "epoch": 1851} {"train_loss": -6.134240627288818, "global_step": 77763, "epoch": 1851} {"train_loss": -6.210746765136719, "global_step": 77764, "epoch": 1851} {"train_loss": -6.127978801727295, "global_step": 77765, "epoch": 1851} {"train_loss": -6.17057991027832, "global_step": 77766, "epoch": 1851} {"train_loss": -6.143911361694336, "global_step": 77767, "epoch": 1851} {"train_loss": -6.040865898132324, "global_step": 77768, "epoch": 1851} {"train_loss": -6.089507102966309, "global_step": 77769, "epoch": 1851} {"train_loss": -6.144260883331299, "global_step": 77770, "epoch": 1851} {"train_loss": -6.198663711547852, "global_step": 77771, "epoch": 1851} {"train_loss": -5.901978969573975, "global_step": 77772, "epoch": 1851} {"train_loss": -6.08157205581665, "global_step": 77773, "epoch": 1851} {"train_loss": -6.143657684326172, "global_step": 77774, "epoch": 1851} {"train_loss": -5.952343940734863, "global_step": 77775, "epoch": 1851} {"train_loss": -6.111699104309082, "global_step": 77776, "epoch": 1851} {"train_loss": -6.226108074188232, "global_step": 77777, "epoch": 1851} {"train_loss": -6.101829528808594, "global_step": 77778, "epoch": 1851} {"train_loss": -6.1851019859313965, "global_step": 77779, "epoch": 1851} {"train_loss": -6.049065113067627, "global_step": 77780, "epoch": 1851} {"train_loss": -6.0349273681640625, "global_step": 77781, "epoch": 1851} {"train_loss": -6.24477481842041, "global_step": 77782, "epoch": 1851} {"train_loss": -6.10009731565203, "global_step": 77783, "epoch": 1851, "val_loss": 67526.3359375} {"train_loss": -6.085019588470459, "global_step": 77784, "epoch": 1852} {"train_loss": -6.088825702667236, "global_step": 77785, "epoch": 1852} {"train_loss": -6.233057022094727, "global_step": 77786, "epoch": 1852} {"train_loss": -6.004823684692383, "global_step": 77787, "epoch": 1852} {"train_loss": -6.099367141723633, "global_step": 77788, "epoch": 1852} {"train_loss": -6.070797920227051, "global_step": 77789, "epoch": 1852} {"train_loss": -6.15334415435791, "global_step": 77790, "epoch": 1852} {"train_loss": -6.085626602172852, "global_step": 77791, "epoch": 1852} {"train_loss": -6.118844985961914, "global_step": 77792, "epoch": 1852} {"train_loss": -6.0567522048950195, "global_step": 77793, "epoch": 1852} {"train_loss": -6.173961639404297, "global_step": 77794, "epoch": 1852} {"train_loss": -6.107808589935303, "global_step": 77795, "epoch": 1852} {"train_loss": -6.042884826660156, "global_step": 77796, "epoch": 1852} {"train_loss": -6.1375837326049805, "global_step": 77797, "epoch": 1852} {"train_loss": -6.121128082275391, "global_step": 77798, "epoch": 1852} {"train_loss": -6.1232194900512695, "global_step": 77799, "epoch": 1852} {"train_loss": -6.099259376525879, "global_step": 77800, "epoch": 1852} {"train_loss": -6.058067321777344, "global_step": 77801, "epoch": 1852} {"train_loss": -5.985269546508789, "global_step": 77802, "epoch": 1852} {"train_loss": -6.086515426635742, "global_step": 77803, "epoch": 1852} {"train_loss": -6.0705156326293945, "global_step": 77804, "epoch": 1852} {"train_loss": -6.072881698608398, "global_step": 77805, "epoch": 1852} {"train_loss": -6.135282516479492, "global_step": 77806, "epoch": 1852} {"train_loss": -6.188494682312012, "global_step": 77807, "epoch": 1852} {"train_loss": -6.067080974578857, "global_step": 77808, "epoch": 1852} {"train_loss": -6.019663333892822, "global_step": 77809, "epoch": 1852} {"train_loss": -6.064662933349609, "global_step": 77810, "epoch": 1852} {"train_loss": -6.1335601806640625, "global_step": 77811, "epoch": 1852} {"train_loss": -6.200952529907227, "global_step": 77812, "epoch": 1852} {"train_loss": -6.119799613952637, "global_step": 77813, "epoch": 1852} {"train_loss": -6.053746700286865, "global_step": 77814, "epoch": 1852} {"train_loss": -6.171695709228516, "global_step": 77815, "epoch": 1852} {"train_loss": -6.25519323348999, "global_step": 77816, "epoch": 1852} {"train_loss": -6.1281867027282715, "global_step": 77817, "epoch": 1852} {"train_loss": -6.122909069061279, "global_step": 77818, "epoch": 1852} {"train_loss": -6.218219757080078, "global_step": 77819, "epoch": 1852} {"train_loss": -6.006235599517822, "global_step": 77820, "epoch": 1852} {"train_loss": -6.146982192993164, "global_step": 77821, "epoch": 1852} {"train_loss": -6.131796836853027, "global_step": 77822, "epoch": 1852} {"train_loss": -6.109347343444824, "global_step": 77823, "epoch": 1852} {"train_loss": -6.145852565765381, "global_step": 77824, "epoch": 1852} {"train_loss": -6.10917033467974, "global_step": 77825, "epoch": 1852, "val_loss": 67601.6015625} {"train_loss": -6.156137943267822, "global_step": 77826, "epoch": 1853} {"train_loss": -6.148824214935303, "global_step": 77827, "epoch": 1853} {"train_loss": -6.169994831085205, "global_step": 77828, "epoch": 1853} {"train_loss": -6.208352088928223, "global_step": 77829, "epoch": 1853} {"train_loss": -6.216569900512695, "global_step": 77830, "epoch": 1853} {"train_loss": -6.2089948654174805, "global_step": 77831, "epoch": 1853} {"train_loss": -6.097326278686523, "global_step": 77832, "epoch": 1853} {"train_loss": -6.229426383972168, "global_step": 77833, "epoch": 1853} {"train_loss": -6.181230545043945, "global_step": 77834, "epoch": 1853} {"train_loss": -6.1225666999816895, "global_step": 77835, "epoch": 1853} {"train_loss": -6.156572341918945, "global_step": 77836, "epoch": 1853} {"train_loss": -6.04137659072876, "global_step": 77837, "epoch": 1853} {"train_loss": -6.046090602874756, "global_step": 77838, "epoch": 1853} {"train_loss": -6.167367935180664, "global_step": 77839, "epoch": 1853} {"train_loss": -6.143735885620117, "global_step": 77840, "epoch": 1853} {"train_loss": -6.092538356781006, "global_step": 77841, "epoch": 1853} {"train_loss": -6.130331516265869, "global_step": 77842, "epoch": 1853} {"train_loss": -5.904508590698242, "global_step": 77843, "epoch": 1853} {"train_loss": -5.875365734100342, "global_step": 77844, "epoch": 1853} {"train_loss": -6.0169758796691895, "global_step": 77845, "epoch": 1853} {"train_loss": -5.987468242645264, "global_step": 77846, "epoch": 1853} {"train_loss": -6.244558334350586, "global_step": 77847, "epoch": 1853} {"train_loss": -5.95742130279541, "global_step": 77848, "epoch": 1853} {"train_loss": -6.121220111846924, "global_step": 77849, "epoch": 1853} {"train_loss": -6.0562286376953125, "global_step": 77850, "epoch": 1853} {"train_loss": -5.992499351501465, "global_step": 77851, "epoch": 1853} {"train_loss": -5.9536356925964355, "global_step": 77852, "epoch": 1853} {"train_loss": -6.0115461349487305, "global_step": 77853, "epoch": 1853} {"train_loss": -6.086164474487305, "global_step": 77854, "epoch": 1853} {"train_loss": -6.058032989501953, "global_step": 77855, "epoch": 1853} {"train_loss": -6.180958271026611, "global_step": 77856, "epoch": 1853} {"train_loss": -6.102628231048584, "global_step": 77857, "epoch": 1853} {"train_loss": -6.150677680969238, "global_step": 77858, "epoch": 1853} {"train_loss": -6.096472263336182, "global_step": 77859, "epoch": 1853} {"train_loss": -6.120733261108398, "global_step": 77860, "epoch": 1853} {"train_loss": -6.205566883087158, "global_step": 77861, "epoch": 1853} {"train_loss": -6.003974914550781, "global_step": 77862, "epoch": 1853} {"train_loss": -6.06702995300293, "global_step": 77863, "epoch": 1853} {"train_loss": -6.111172676086426, "global_step": 77864, "epoch": 1853} {"train_loss": -6.092551231384277, "global_step": 77865, "epoch": 1853} {"train_loss": -6.173415184020996, "global_step": 77866, "epoch": 1853} {"train_loss": -6.097262609572637, "global_step": 77867, "epoch": 1853, "val_loss": 67578.2421875} {"train_loss": -6.108205795288086, "global_step": 77868, "epoch": 1854} {"train_loss": -6.091061115264893, "global_step": 77869, "epoch": 1854} {"train_loss": -6.143461227416992, "global_step": 77870, "epoch": 1854} {"train_loss": -6.077409267425537, "global_step": 77871, "epoch": 1854} {"train_loss": -6.115999221801758, "global_step": 77872, "epoch": 1854} {"train_loss": -6.1163411140441895, "global_step": 77873, "epoch": 1854} {"train_loss": -6.053244113922119, "global_step": 77874, "epoch": 1854} {"train_loss": -6.07094144821167, "global_step": 77875, "epoch": 1854} {"train_loss": -6.080138206481934, "global_step": 77876, "epoch": 1854} {"train_loss": -6.162822723388672, "global_step": 77877, "epoch": 1854} {"train_loss": -6.017796039581299, "global_step": 77878, "epoch": 1854} {"train_loss": -6.099584579467773, "global_step": 77879, "epoch": 1854} {"train_loss": -6.074100971221924, "global_step": 77880, "epoch": 1854} {"train_loss": -6.218616485595703, "global_step": 77881, "epoch": 1854} {"train_loss": -6.230035305023193, "global_step": 77882, "epoch": 1854} {"train_loss": -6.038603782653809, "global_step": 77883, "epoch": 1854} {"train_loss": -6.116797924041748, "global_step": 77884, "epoch": 1854} {"train_loss": -6.140641212463379, "global_step": 77885, "epoch": 1854} {"train_loss": -6.192605972290039, "global_step": 77886, "epoch": 1854} {"train_loss": -6.080806255340576, "global_step": 77887, "epoch": 1854} {"train_loss": -6.107275009155273, "global_step": 77888, "epoch": 1854} {"train_loss": -6.109472751617432, "global_step": 77889, "epoch": 1854} {"train_loss": -6.118399620056152, "global_step": 77890, "epoch": 1854} {"train_loss": -6.188166618347168, "global_step": 77891, "epoch": 1854} {"train_loss": -6.046337127685547, "global_step": 77892, "epoch": 1854} {"train_loss": -6.042949676513672, "global_step": 77893, "epoch": 1854} {"train_loss": -6.065680980682373, "global_step": 77894, "epoch": 1854} {"train_loss": -6.019417762756348, "global_step": 77895, "epoch": 1854} {"train_loss": -6.059775352478027, "global_step": 77896, "epoch": 1854} {"train_loss": -6.100889205932617, "global_step": 77897, "epoch": 1854} {"train_loss": -6.055262565612793, "global_step": 77898, "epoch": 1854} {"train_loss": -6.149905204772949, "global_step": 77899, "epoch": 1854} {"train_loss": -5.989077568054199, "global_step": 77900, "epoch": 1854} {"train_loss": -6.104352951049805, "global_step": 77901, "epoch": 1854} {"train_loss": -6.1539998054504395, "global_step": 77902, "epoch": 1854} {"train_loss": -6.132846832275391, "global_step": 77903, "epoch": 1854} {"train_loss": -6.118900775909424, "global_step": 77904, "epoch": 1854} {"train_loss": -6.112025260925293, "global_step": 77905, "epoch": 1854} {"train_loss": -6.132022857666016, "global_step": 77906, "epoch": 1854} {"train_loss": -6.192706108093262, "global_step": 77907, "epoch": 1854} {"train_loss": -6.059635162353516, "global_step": 77908, "epoch": 1854} {"train_loss": -6.101660807927449, "global_step": 77909, "epoch": 1854, "val_loss": 67512.1796875} {"train_loss": -6.04026985168457, "global_step": 77910, "epoch": 1855} {"train_loss": -6.073415756225586, "global_step": 77911, "epoch": 1855} {"train_loss": -6.181271553039551, "global_step": 77912, "epoch": 1855} {"train_loss": -5.983264923095703, "global_step": 77913, "epoch": 1855} {"train_loss": -6.171730041503906, "global_step": 77914, "epoch": 1855} {"train_loss": -6.091488838195801, "global_step": 77915, "epoch": 1855} {"train_loss": -6.113035202026367, "global_step": 77916, "epoch": 1855} {"train_loss": -6.217057228088379, "global_step": 77917, "epoch": 1855} {"train_loss": -6.031327247619629, "global_step": 77918, "epoch": 1855} {"train_loss": -6.1570658683776855, "global_step": 77919, "epoch": 1855} {"train_loss": -6.190155506134033, "global_step": 77920, "epoch": 1855} {"train_loss": -6.096070289611816, "global_step": 77921, "epoch": 1855} {"train_loss": -6.228663921356201, "global_step": 77922, "epoch": 1855} {"train_loss": -5.994256973266602, "global_step": 77923, "epoch": 1855} {"train_loss": -6.205765724182129, "global_step": 77924, "epoch": 1855} {"train_loss": -6.134793758392334, "global_step": 77925, "epoch": 1855} {"train_loss": -6.176518440246582, "global_step": 77926, "epoch": 1855} {"train_loss": -6.15555477142334, "global_step": 77927, "epoch": 1855} {"train_loss": -6.162035942077637, "global_step": 77928, "epoch": 1855} {"train_loss": -6.134124279022217, "global_step": 77929, "epoch": 1855} {"train_loss": -6.146994590759277, "global_step": 77930, "epoch": 1855} {"train_loss": -6.126452445983887, "global_step": 77931, "epoch": 1855} {"train_loss": -6.081107139587402, "global_step": 77932, "epoch": 1855} {"train_loss": -6.122082710266113, "global_step": 77933, "epoch": 1855} {"train_loss": -6.140556335449219, "global_step": 77934, "epoch": 1855} {"train_loss": -6.114765167236328, "global_step": 77935, "epoch": 1855} {"train_loss": -6.050997734069824, "global_step": 77936, "epoch": 1855} {"train_loss": -6.008429527282715, "global_step": 77937, "epoch": 1855} {"train_loss": -5.948761463165283, "global_step": 77938, "epoch": 1855} {"train_loss": -6.184674263000488, "global_step": 77939, "epoch": 1855} {"train_loss": -5.960592746734619, "global_step": 77940, "epoch": 1855} {"train_loss": -6.083939075469971, "global_step": 77941, "epoch": 1855} {"train_loss": -6.066823959350586, "global_step": 77942, "epoch": 1855} {"train_loss": -5.924118518829346, "global_step": 77943, "epoch": 1855} {"train_loss": -6.151124000549316, "global_step": 77944, "epoch": 1855} {"train_loss": -6.116485595703125, "global_step": 77945, "epoch": 1855} {"train_loss": -5.996552467346191, "global_step": 77946, "epoch": 1855} {"train_loss": -6.185959815979004, "global_step": 77947, "epoch": 1855} {"train_loss": -6.028644561767578, "global_step": 77948, "epoch": 1855} {"train_loss": -5.9931254386901855, "global_step": 77949, "epoch": 1855} {"train_loss": -6.003777027130127, "global_step": 77950, "epoch": 1855} {"train_loss": -6.094866480146136, "global_step": 77951, "epoch": 1855, "val_loss": 67739.5390625} {"train_loss": -6.172157287597656, "global_step": 77952, "epoch": 1856} {"train_loss": -6.2369513511657715, "global_step": 77953, "epoch": 1856} {"train_loss": -6.043192386627197, "global_step": 77954, "epoch": 1856} {"train_loss": -5.991060256958008, "global_step": 77955, "epoch": 1856} {"train_loss": -6.237269401550293, "global_step": 77956, "epoch": 1856} {"train_loss": -6.068828105926514, "global_step": 77957, "epoch": 1856} {"train_loss": -6.048201560974121, "global_step": 77958, "epoch": 1856} {"train_loss": -6.123103141784668, "global_step": 77959, "epoch": 1856} {"train_loss": -5.891589164733887, "global_step": 77960, "epoch": 1856} {"train_loss": -6.213134288787842, "global_step": 77961, "epoch": 1856} {"train_loss": -6.077547073364258, "global_step": 77962, "epoch": 1856} {"train_loss": -5.907299995422363, "global_step": 77963, "epoch": 1856} {"train_loss": -6.1485419273376465, "global_step": 77964, "epoch": 1856} {"train_loss": -5.993160247802734, "global_step": 77965, "epoch": 1856} {"train_loss": -6.126852035522461, "global_step": 77966, "epoch": 1856} {"train_loss": -6.055188179016113, "global_step": 77967, "epoch": 1856} {"train_loss": -6.09052038192749, "global_step": 77968, "epoch": 1856} {"train_loss": -6.132724285125732, "global_step": 77969, "epoch": 1856} {"train_loss": -6.049055576324463, "global_step": 77970, "epoch": 1856} {"train_loss": -6.066422462463379, "global_step": 77971, "epoch": 1856} {"train_loss": -6.0094780921936035, "global_step": 77972, "epoch": 1856} {"train_loss": -6.016837120056152, "global_step": 77973, "epoch": 1856} {"train_loss": -6.058495998382568, "global_step": 77974, "epoch": 1856} {"train_loss": -6.035416603088379, "global_step": 77975, "epoch": 1856} {"train_loss": -6.093897819519043, "global_step": 77976, "epoch": 1856} {"train_loss": -6.133782386779785, "global_step": 77977, "epoch": 1856} {"train_loss": -6.0032877922058105, "global_step": 77978, "epoch": 1856} {"train_loss": -6.139632225036621, "global_step": 77979, "epoch": 1856} {"train_loss": -6.111973762512207, "global_step": 77980, "epoch": 1856} {"train_loss": -6.077943325042725, "global_step": 77981, "epoch": 1856} {"train_loss": -6.172727584838867, "global_step": 77982, "epoch": 1856} {"train_loss": -6.105526924133301, "global_step": 77983, "epoch": 1856} {"train_loss": -6.211870193481445, "global_step": 77984, "epoch": 1856} {"train_loss": -6.1008381843566895, "global_step": 77985, "epoch": 1856} {"train_loss": -6.177231311798096, "global_step": 77986, "epoch": 1856} {"train_loss": -6.103875637054443, "global_step": 77987, "epoch": 1856} {"train_loss": -6.035797119140625, "global_step": 77988, "epoch": 1856} {"train_loss": -6.039642333984375, "global_step": 77989, "epoch": 1856} {"train_loss": -6.126723289489746, "global_step": 77990, "epoch": 1856} {"train_loss": -6.039275169372559, "global_step": 77991, "epoch": 1856} {"train_loss": -6.1322808265686035, "global_step": 77992, "epoch": 1856} {"train_loss": -6.086840164093744, "global_step": 77993, "epoch": 1856, "val_loss": 67705.4453125} {"train_loss": -6.040285587310791, "global_step": 77994, "epoch": 1857} {"train_loss": -6.123546600341797, "global_step": 77995, "epoch": 1857} {"train_loss": -6.027011871337891, "global_step": 77996, "epoch": 1857} {"train_loss": -6.081357002258301, "global_step": 77997, "epoch": 1857} {"train_loss": -6.072670936584473, "global_step": 77998, "epoch": 1857} {"train_loss": -6.003138065338135, "global_step": 77999, "epoch": 1857} {"train_loss": -6.059819221496582, "global_step": 78000, "epoch": 1857} {"train_loss": -6.054503440856934, "global_step": 78001, "epoch": 1857} {"train_loss": -6.089893341064453, "global_step": 78002, "epoch": 1857} {"train_loss": -6.15402889251709, "global_step": 78003, "epoch": 1857} {"train_loss": -6.100711345672607, "global_step": 78004, "epoch": 1857} {"train_loss": -6.1088151931762695, "global_step": 78005, "epoch": 1857} {"train_loss": -6.1515069007873535, "global_step": 78006, "epoch": 1857} {"train_loss": -5.989090442657471, "global_step": 78007, "epoch": 1857} {"train_loss": -6.161702632904053, "global_step": 78008, "epoch": 1857} {"train_loss": -6.126542568206787, "global_step": 78009, "epoch": 1857} {"train_loss": -6.212380886077881, "global_step": 78010, "epoch": 1857} {"train_loss": -6.06820821762085, "global_step": 78011, "epoch": 1857} {"train_loss": -6.151838302612305, "global_step": 78012, "epoch": 1857} {"train_loss": -6.070213317871094, "global_step": 78013, "epoch": 1857} {"train_loss": -6.0866193771362305, "global_step": 78014, "epoch": 1857} {"train_loss": -6.047489166259766, "global_step": 78015, "epoch": 1857} {"train_loss": -6.211227893829346, "global_step": 78016, "epoch": 1857} {"train_loss": -5.934866905212402, "global_step": 78017, "epoch": 1857} {"train_loss": -6.094409942626953, "global_step": 78018, "epoch": 1857} {"train_loss": -6.030109405517578, "global_step": 78019, "epoch": 1857} {"train_loss": -5.991094589233398, "global_step": 78020, "epoch": 1857} {"train_loss": -6.066699028015137, "global_step": 78021, "epoch": 1857} {"train_loss": -6.045562267303467, "global_step": 78022, "epoch": 1857} {"train_loss": -6.043710708618164, "global_step": 78023, "epoch": 1857} {"train_loss": -6.02280855178833, "global_step": 78024, "epoch": 1857} {"train_loss": -6.1054768562316895, "global_step": 78025, "epoch": 1857} {"train_loss": -6.083206653594971, "global_step": 78026, "epoch": 1857} {"train_loss": -6.004755973815918, "global_step": 78027, "epoch": 1857} {"train_loss": -6.007246971130371, "global_step": 78028, "epoch": 1857} {"train_loss": -6.017277240753174, "global_step": 78029, "epoch": 1857} {"train_loss": -6.160540580749512, "global_step": 78030, "epoch": 1857} {"train_loss": -5.972049713134766, "global_step": 78031, "epoch": 1857} {"train_loss": -6.137424945831299, "global_step": 78032, "epoch": 1857} {"train_loss": -6.099645137786865, "global_step": 78033, "epoch": 1857} {"train_loss": -6.016270637512207, "global_step": 78034, "epoch": 1857} {"train_loss": -6.074124767666771, "global_step": 78035, "epoch": 1857, "val_loss": 67423.7890625} {"train_loss": -6.094682693481445, "global_step": 78036, "epoch": 1858} {"train_loss": -6.142528533935547, "global_step": 78037, "epoch": 1858} {"train_loss": -5.982341289520264, "global_step": 78038, "epoch": 1858} {"train_loss": -6.165379047393799, "global_step": 78039, "epoch": 1858} {"train_loss": -6.086835861206055, "global_step": 78040, "epoch": 1858} {"train_loss": -6.1550445556640625, "global_step": 78041, "epoch": 1858} {"train_loss": -6.085634231567383, "global_step": 78042, "epoch": 1858} {"train_loss": -6.193717002868652, "global_step": 78043, "epoch": 1858} {"train_loss": -6.1356706619262695, "global_step": 78044, "epoch": 1858} {"train_loss": -6.12459659576416, "global_step": 78045, "epoch": 1858} {"train_loss": -6.123697757720947, "global_step": 78046, "epoch": 1858} {"train_loss": -6.002391338348389, "global_step": 78047, "epoch": 1858} {"train_loss": -6.050851345062256, "global_step": 78048, "epoch": 1858} {"train_loss": -6.130064964294434, "global_step": 78049, "epoch": 1858} {"train_loss": -5.904776573181152, "global_step": 78050, "epoch": 1858} {"train_loss": -6.100205421447754, "global_step": 78051, "epoch": 1858} {"train_loss": -6.012823104858398, "global_step": 78052, "epoch": 1858} {"train_loss": -5.926271438598633, "global_step": 78053, "epoch": 1858} {"train_loss": -6.050649642944336, "global_step": 78054, "epoch": 1858} {"train_loss": -6.036523818969727, "global_step": 78055, "epoch": 1858} {"train_loss": -6.057415962219238, "global_step": 78056, "epoch": 1858} {"train_loss": -6.086909770965576, "global_step": 78057, "epoch": 1858} {"train_loss": -6.142364025115967, "global_step": 78058, "epoch": 1858} {"train_loss": -6.099173545837402, "global_step": 78059, "epoch": 1858} {"train_loss": -6.051032066345215, "global_step": 78060, "epoch": 1858} {"train_loss": -6.066069602966309, "global_step": 78061, "epoch": 1858} {"train_loss": -6.049554824829102, "global_step": 78062, "epoch": 1858} {"train_loss": -6.128591537475586, "global_step": 78063, "epoch": 1858} {"train_loss": -6.096068382263184, "global_step": 78064, "epoch": 1858} {"train_loss": -6.044844627380371, "global_step": 78065, "epoch": 1858} {"train_loss": -6.077372074127197, "global_step": 78066, "epoch": 1858} {"train_loss": -6.039255142211914, "global_step": 78067, "epoch": 1858} {"train_loss": -5.9915876388549805, "global_step": 78068, "epoch": 1858} {"train_loss": -5.973578929901123, "global_step": 78069, "epoch": 1858} {"train_loss": -6.138144493103027, "global_step": 78070, "epoch": 1858} {"train_loss": -6.206886291503906, "global_step": 78071, "epoch": 1858} {"train_loss": -6.062246322631836, "global_step": 78072, "epoch": 1858} {"train_loss": -5.988405227661133, "global_step": 78073, "epoch": 1858} {"train_loss": -6.094590187072754, "global_step": 78074, "epoch": 1858} {"train_loss": -6.049556732177734, "global_step": 78075, "epoch": 1858} {"train_loss": -6.094017028808594, "global_step": 78076, "epoch": 1858} {"train_loss": -6.076500007084438, "global_step": 78077, "epoch": 1858, "val_loss": 67467.5703125} {"train_loss": -6.147029876708984, "global_step": 78078, "epoch": 1859} {"train_loss": -6.200277805328369, "global_step": 78079, "epoch": 1859} {"train_loss": -6.063243865966797, "global_step": 78080, "epoch": 1859} {"train_loss": -6.042943954467773, "global_step": 78081, "epoch": 1859} {"train_loss": -6.1502180099487305, "global_step": 78082, "epoch": 1859} {"train_loss": -6.167674541473389, "global_step": 78083, "epoch": 1859} {"train_loss": -6.112638473510742, "global_step": 78084, "epoch": 1859} {"train_loss": -6.08403205871582, "global_step": 78085, "epoch": 1859} {"train_loss": -6.138232231140137, "global_step": 78086, "epoch": 1859} {"train_loss": -6.050753593444824, "global_step": 78087, "epoch": 1859} {"train_loss": -6.062298774719238, "global_step": 78088, "epoch": 1859} {"train_loss": -6.180746078491211, "global_step": 78089, "epoch": 1859} {"train_loss": -6.159281253814697, "global_step": 78090, "epoch": 1859} {"train_loss": -6.019984245300293, "global_step": 78091, "epoch": 1859} {"train_loss": -6.0080060958862305, "global_step": 78092, "epoch": 1859} {"train_loss": -6.066441535949707, "global_step": 78093, "epoch": 1859} {"train_loss": -6.145383834838867, "global_step": 78094, "epoch": 1859} {"train_loss": -6.108397483825684, "global_step": 78095, "epoch": 1859} {"train_loss": -6.102018356323242, "global_step": 78096, "epoch": 1859} {"train_loss": -6.2114763259887695, "global_step": 78097, "epoch": 1859} {"train_loss": -6.17527961730957, "global_step": 78098, "epoch": 1859} {"train_loss": -6.1834917068481445, "global_step": 78099, "epoch": 1859} {"train_loss": -6.038325309753418, "global_step": 78100, "epoch": 1859} {"train_loss": -6.106210231781006, "global_step": 78101, "epoch": 1859} {"train_loss": -6.214932441711426, "global_step": 78102, "epoch": 1859} {"train_loss": -6.05106258392334, "global_step": 78103, "epoch": 1859} {"train_loss": -6.217348098754883, "global_step": 78104, "epoch": 1859} {"train_loss": -6.075023651123047, "global_step": 78105, "epoch": 1859} {"train_loss": -6.167709827423096, "global_step": 78106, "epoch": 1859} {"train_loss": -6.14680814743042, "global_step": 78107, "epoch": 1859} {"train_loss": -6.09507942199707, "global_step": 78108, "epoch": 1859} {"train_loss": -6.203391075134277, "global_step": 78109, "epoch": 1859} {"train_loss": -5.961733341217041, "global_step": 78110, "epoch": 1859} {"train_loss": -6.150362014770508, "global_step": 78111, "epoch": 1859} {"train_loss": -6.135244369506836, "global_step": 78112, "epoch": 1859} {"train_loss": -6.112875938415527, "global_step": 78113, "epoch": 1859} {"train_loss": -6.100788116455078, "global_step": 78114, "epoch": 1859} {"train_loss": -6.1374616622924805, "global_step": 78115, "epoch": 1859} {"train_loss": -6.074150085449219, "global_step": 78116, "epoch": 1859} {"train_loss": -6.17557430267334, "global_step": 78117, "epoch": 1859} {"train_loss": -6.0976338386535645, "global_step": 78118, "epoch": 1859} {"train_loss": -6.119115046092442, "global_step": 78119, "epoch": 1859, "val_loss": 67560.171875} {"train_loss": -6.215558052062988, "global_step": 78120, "epoch": 1860} {"train_loss": -5.979599952697754, "global_step": 78121, "epoch": 1860} {"train_loss": -6.005124092102051, "global_step": 78122, "epoch": 1860} {"train_loss": -6.183266639709473, "global_step": 78123, "epoch": 1860} {"train_loss": -6.042666435241699, "global_step": 78124, "epoch": 1860} {"train_loss": -6.067296981811523, "global_step": 78125, "epoch": 1860} {"train_loss": -6.156107425689697, "global_step": 78126, "epoch": 1860} {"train_loss": -6.148754596710205, "global_step": 78127, "epoch": 1860} {"train_loss": -6.091897964477539, "global_step": 78128, "epoch": 1860} {"train_loss": -6.108216762542725, "global_step": 78129, "epoch": 1860} {"train_loss": -6.122046947479248, "global_step": 78130, "epoch": 1860} {"train_loss": -6.154542922973633, "global_step": 78131, "epoch": 1860} {"train_loss": -6.159029960632324, "global_step": 78132, "epoch": 1860} {"train_loss": -5.970740795135498, "global_step": 78133, "epoch": 1860} {"train_loss": -6.057373046875, "global_step": 78134, "epoch": 1860} {"train_loss": -6.009438991546631, "global_step": 78135, "epoch": 1860} {"train_loss": -6.090234756469727, "global_step": 78136, "epoch": 1860} {"train_loss": -6.2043256759643555, "global_step": 78137, "epoch": 1860} {"train_loss": -6.16265869140625, "global_step": 78138, "epoch": 1860} {"train_loss": -6.181449890136719, "global_step": 78139, "epoch": 1860} {"train_loss": -6.208531856536865, "global_step": 78140, "epoch": 1860} {"train_loss": -6.16690731048584, "global_step": 78141, "epoch": 1860} {"train_loss": -6.220016002655029, "global_step": 78142, "epoch": 1860} {"train_loss": -6.0732221603393555, "global_step": 78143, "epoch": 1860} {"train_loss": -6.160154819488525, "global_step": 78144, "epoch": 1860} {"train_loss": -6.112442970275879, "global_step": 78145, "epoch": 1860} {"train_loss": -6.186853885650635, "global_step": 78146, "epoch": 1860} {"train_loss": -6.143520832061768, "global_step": 78147, "epoch": 1860} {"train_loss": -6.246433258056641, "global_step": 78148, "epoch": 1860} {"train_loss": -6.1783671379089355, "global_step": 78149, "epoch": 1860} {"train_loss": -6.2187581062316895, "global_step": 78150, "epoch": 1860} {"train_loss": -6.128173828125, "global_step": 78151, "epoch": 1860} {"train_loss": -6.178584098815918, "global_step": 78152, "epoch": 1860} {"train_loss": -6.135095119476318, "global_step": 78153, "epoch": 1860} {"train_loss": -6.308836460113525, "global_step": 78154, "epoch": 1860} {"train_loss": -6.081611633300781, "global_step": 78155, "epoch": 1860} {"train_loss": -6.252121925354004, "global_step": 78156, "epoch": 1860} {"train_loss": -6.143367767333984, "global_step": 78157, "epoch": 1860} {"train_loss": -5.936152458190918, "global_step": 78158, "epoch": 1860} {"train_loss": -6.103928565979004, "global_step": 78159, "epoch": 1860} {"train_loss": -6.137226104736328, "global_step": 78160, "epoch": 1860} {"train_loss": -6.128802151907058, "global_step": 78161, "epoch": 1860, "val_loss": 67546.5625} {"train_loss": -6.17356014251709, "global_step": 78162, "epoch": 1861} {"train_loss": -6.083832740783691, "global_step": 78163, "epoch": 1861} {"train_loss": -6.100323677062988, "global_step": 78164, "epoch": 1861} {"train_loss": -6.189023017883301, "global_step": 78165, "epoch": 1861} {"train_loss": -6.24109411239624, "global_step": 78166, "epoch": 1861} {"train_loss": -6.193570137023926, "global_step": 78167, "epoch": 1861} {"train_loss": -6.119503021240234, "global_step": 78168, "epoch": 1861} {"train_loss": -6.112033367156982, "global_step": 78169, "epoch": 1861} {"train_loss": -6.129560470581055, "global_step": 78170, "epoch": 1861} {"train_loss": -6.087460041046143, "global_step": 78171, "epoch": 1861} {"train_loss": -6.1897077560424805, "global_step": 78172, "epoch": 1861} {"train_loss": -6.044672012329102, "global_step": 78173, "epoch": 1861} {"train_loss": -6.17066764831543, "global_step": 78174, "epoch": 1861} {"train_loss": -6.091011047363281, "global_step": 78175, "epoch": 1861} {"train_loss": -6.10146951675415, "global_step": 78176, "epoch": 1861} {"train_loss": -6.106655597686768, "global_step": 78177, "epoch": 1861} {"train_loss": -5.98635196685791, "global_step": 78178, "epoch": 1861} {"train_loss": -6.107522964477539, "global_step": 78179, "epoch": 1861} {"train_loss": -6.037115097045898, "global_step": 78180, "epoch": 1861} {"train_loss": -5.977288722991943, "global_step": 78181, "epoch": 1861} {"train_loss": -6.098992347717285, "global_step": 78182, "epoch": 1861} {"train_loss": -6.07421875, "global_step": 78183, "epoch": 1861} {"train_loss": -6.127225875854492, "global_step": 78184, "epoch": 1861} {"train_loss": -6.112269401550293, "global_step": 78185, "epoch": 1861} {"train_loss": -6.0491838455200195, "global_step": 78186, "epoch": 1861} {"train_loss": -6.104006290435791, "global_step": 78187, "epoch": 1861} {"train_loss": -6.0128173828125, "global_step": 78188, "epoch": 1861} {"train_loss": -6.0936408042907715, "global_step": 78189, "epoch": 1861} {"train_loss": -6.088706016540527, "global_step": 78190, "epoch": 1861} {"train_loss": -6.136973857879639, "global_step": 78191, "epoch": 1861} {"train_loss": -6.073016166687012, "global_step": 78192, "epoch": 1861} {"train_loss": -6.055446147918701, "global_step": 78193, "epoch": 1861} {"train_loss": -6.055602073669434, "global_step": 78194, "epoch": 1861} {"train_loss": -6.021774768829346, "global_step": 78195, "epoch": 1861} {"train_loss": -6.089451789855957, "global_step": 78196, "epoch": 1861} {"train_loss": -6.069015979766846, "global_step": 78197, "epoch": 1861} {"train_loss": -6.1352081298828125, "global_step": 78198, "epoch": 1861} {"train_loss": -5.979251384735107, "global_step": 78199, "epoch": 1861} {"train_loss": -6.178311347961426, "global_step": 78200, "epoch": 1861} {"train_loss": -6.12135124206543, "global_step": 78201, "epoch": 1861} {"train_loss": -6.030108451843262, "global_step": 78202, "epoch": 1861} {"train_loss": -6.096557798839751, "global_step": 78203, "epoch": 1861, "val_loss": 67709.7890625} {"train_loss": -6.1440935134887695, "global_step": 78204, "epoch": 1862} {"train_loss": -6.045069694519043, "global_step": 78205, "epoch": 1862} {"train_loss": -6.249451637268066, "global_step": 78206, "epoch": 1862} {"train_loss": -5.963311195373535, "global_step": 78207, "epoch": 1862} {"train_loss": -6.100728988647461, "global_step": 78208, "epoch": 1862} {"train_loss": -6.19332218170166, "global_step": 78209, "epoch": 1862} {"train_loss": -6.106695175170898, "global_step": 78210, "epoch": 1862} {"train_loss": -5.984414100646973, "global_step": 78211, "epoch": 1862} {"train_loss": -6.1241960525512695, "global_step": 78212, "epoch": 1862} {"train_loss": -6.060423851013184, "global_step": 78213, "epoch": 1862} {"train_loss": -6.073299407958984, "global_step": 78214, "epoch": 1862} {"train_loss": -6.02851676940918, "global_step": 78215, "epoch": 1862} {"train_loss": -6.177689075469971, "global_step": 78216, "epoch": 1862} {"train_loss": -6.171669006347656, "global_step": 78217, "epoch": 1862} {"train_loss": -5.969302177429199, "global_step": 78218, "epoch": 1862} {"train_loss": -6.063786506652832, "global_step": 78219, "epoch": 1862} {"train_loss": -6.010571002960205, "global_step": 78220, "epoch": 1862} {"train_loss": -6.156586647033691, "global_step": 78221, "epoch": 1862} {"train_loss": -5.987606525421143, "global_step": 78222, "epoch": 1862} {"train_loss": -6.085958480834961, "global_step": 78223, "epoch": 1862} {"train_loss": -6.118844032287598, "global_step": 78224, "epoch": 1862} {"train_loss": -6.0797576904296875, "global_step": 78225, "epoch": 1862} {"train_loss": -6.105980396270752, "global_step": 78226, "epoch": 1862} {"train_loss": -6.074654579162598, "global_step": 78227, "epoch": 1862} {"train_loss": -6.010284900665283, "global_step": 78228, "epoch": 1862} {"train_loss": -6.123842239379883, "global_step": 78229, "epoch": 1862} {"train_loss": -6.088162899017334, "global_step": 78230, "epoch": 1862} {"train_loss": -6.0960540771484375, "global_step": 78231, "epoch": 1862} {"train_loss": -6.173222541809082, "global_step": 78232, "epoch": 1862} {"train_loss": -6.0360565185546875, "global_step": 78233, "epoch": 1862} {"train_loss": -6.166118621826172, "global_step": 78234, "epoch": 1862} {"train_loss": -6.116828918457031, "global_step": 78235, "epoch": 1862} {"train_loss": -6.168231964111328, "global_step": 78236, "epoch": 1862} {"train_loss": -6.133942604064941, "global_step": 78237, "epoch": 1862} {"train_loss": -6.021484375, "global_step": 78238, "epoch": 1862} {"train_loss": -6.185352325439453, "global_step": 78239, "epoch": 1862} {"train_loss": -6.130158424377441, "global_step": 78240, "epoch": 1862} {"train_loss": -6.10514497756958, "global_step": 78241, "epoch": 1862} {"train_loss": -6.168737411499023, "global_step": 78242, "epoch": 1862} {"train_loss": -6.005647659301758, "global_step": 78243, "epoch": 1862} {"train_loss": -6.202826499938965, "global_step": 78244, "epoch": 1862} {"train_loss": -6.098275320870536, "global_step": 78245, "epoch": 1862, "val_loss": 67619.3515625} {"train_loss": -6.167448043823242, "global_step": 78246, "epoch": 1863} {"train_loss": -6.20176887512207, "global_step": 78247, "epoch": 1863} {"train_loss": -6.021547317504883, "global_step": 78248, "epoch": 1863} {"train_loss": -6.2825927734375, "global_step": 78249, "epoch": 1863} {"train_loss": -6.08534574508667, "global_step": 78250, "epoch": 1863} {"train_loss": -6.23989200592041, "global_step": 78251, "epoch": 1863} {"train_loss": -6.162540435791016, "global_step": 78252, "epoch": 1863} {"train_loss": -6.0692291259765625, "global_step": 78253, "epoch": 1863} {"train_loss": -6.13068151473999, "global_step": 78254, "epoch": 1863} {"train_loss": -6.139475345611572, "global_step": 78255, "epoch": 1863} {"train_loss": -6.14719295501709, "global_step": 78256, "epoch": 1863} {"train_loss": -6.201652526855469, "global_step": 78257, "epoch": 1863} {"train_loss": -6.089807510375977, "global_step": 78258, "epoch": 1863} {"train_loss": -6.113501071929932, "global_step": 78259, "epoch": 1863} {"train_loss": -6.182104110717773, "global_step": 78260, "epoch": 1863} {"train_loss": -6.086033821105957, "global_step": 78261, "epoch": 1863} {"train_loss": -6.160417556762695, "global_step": 78262, "epoch": 1863} {"train_loss": -6.0819597244262695, "global_step": 78263, "epoch": 1863} {"train_loss": -6.1401801109313965, "global_step": 78264, "epoch": 1863} {"train_loss": -6.082394599914551, "global_step": 78265, "epoch": 1863} {"train_loss": -6.157654762268066, "global_step": 78266, "epoch": 1863} {"train_loss": -6.1066389083862305, "global_step": 78267, "epoch": 1863} {"train_loss": -6.100140571594238, "global_step": 78268, "epoch": 1863} {"train_loss": -6.161004543304443, "global_step": 78269, "epoch": 1863} {"train_loss": -6.121260166168213, "global_step": 78270, "epoch": 1863} {"train_loss": -6.065332412719727, "global_step": 78271, "epoch": 1863} {"train_loss": -5.948988437652588, "global_step": 78272, "epoch": 1863} {"train_loss": -6.082433700561523, "global_step": 78273, "epoch": 1863} {"train_loss": -6.10444450378418, "global_step": 78274, "epoch": 1863} {"train_loss": -6.085029602050781, "global_step": 78275, "epoch": 1863} {"train_loss": -6.0365142822265625, "global_step": 78276, "epoch": 1863} {"train_loss": -6.0770158767700195, "global_step": 78277, "epoch": 1863} {"train_loss": -6.166446685791016, "global_step": 78278, "epoch": 1863} {"train_loss": -6.004985809326172, "global_step": 78279, "epoch": 1863} {"train_loss": -6.084957122802734, "global_step": 78280, "epoch": 1863} {"train_loss": -6.056281089782715, "global_step": 78281, "epoch": 1863} {"train_loss": -6.155026435852051, "global_step": 78282, "epoch": 1863} {"train_loss": -6.058246612548828, "global_step": 78283, "epoch": 1863} {"train_loss": -6.147417068481445, "global_step": 78284, "epoch": 1863} {"train_loss": -6.177335262298584, "global_step": 78285, "epoch": 1863} {"train_loss": -6.092280864715576, "global_step": 78286, "epoch": 1863} {"train_loss": -6.118070295878819, "global_step": 78287, "epoch": 1863, "val_loss": 67543.5078125} {"train_loss": -6.212061405181885, "global_step": 78288, "epoch": 1864} {"train_loss": -6.154416084289551, "global_step": 78289, "epoch": 1864} {"train_loss": -6.114886283874512, "global_step": 78290, "epoch": 1864} {"train_loss": -6.248618125915527, "global_step": 78291, "epoch": 1864} {"train_loss": -6.069808483123779, "global_step": 78292, "epoch": 1864} {"train_loss": -6.089521884918213, "global_step": 78293, "epoch": 1864} {"train_loss": -6.1612749099731445, "global_step": 78294, "epoch": 1864} {"train_loss": -6.027250289916992, "global_step": 78295, "epoch": 1864} {"train_loss": -6.151350975036621, "global_step": 78296, "epoch": 1864} {"train_loss": -6.183635711669922, "global_step": 78297, "epoch": 1864} {"train_loss": -5.9360032081604, "global_step": 78298, "epoch": 1864} {"train_loss": -6.07014799118042, "global_step": 78299, "epoch": 1864} {"train_loss": -5.960742950439453, "global_step": 78300, "epoch": 1864} {"train_loss": -5.986120223999023, "global_step": 78301, "epoch": 1864} {"train_loss": -6.123296737670898, "global_step": 78302, "epoch": 1864} {"train_loss": -6.096498012542725, "global_step": 78303, "epoch": 1864} {"train_loss": -6.249241352081299, "global_step": 78304, "epoch": 1864} {"train_loss": -6.10557746887207, "global_step": 78305, "epoch": 1864} {"train_loss": -6.066863059997559, "global_step": 78306, "epoch": 1864} {"train_loss": -6.0933308601379395, "global_step": 78307, "epoch": 1864} {"train_loss": -6.073668479919434, "global_step": 78308, "epoch": 1864} {"train_loss": -6.0204010009765625, "global_step": 78309, "epoch": 1864} {"train_loss": -5.934233665466309, "global_step": 78310, "epoch": 1864} {"train_loss": -6.117015361785889, "global_step": 78311, "epoch": 1864} {"train_loss": -6.0116987228393555, "global_step": 78312, "epoch": 1864} {"train_loss": -6.143869400024414, "global_step": 78313, "epoch": 1864} {"train_loss": -6.066571235656738, "global_step": 78314, "epoch": 1864} {"train_loss": -5.988219738006592, "global_step": 78315, "epoch": 1864} {"train_loss": -6.203677177429199, "global_step": 78316, "epoch": 1864} {"train_loss": -6.039737224578857, "global_step": 78317, "epoch": 1864} {"train_loss": -5.887423992156982, "global_step": 78318, "epoch": 1864} {"train_loss": -6.0253143310546875, "global_step": 78319, "epoch": 1864} {"train_loss": -6.12783670425415, "global_step": 78320, "epoch": 1864} {"train_loss": -6.016653537750244, "global_step": 78321, "epoch": 1864} {"train_loss": -6.050257205963135, "global_step": 78322, "epoch": 1864} {"train_loss": -6.069309711456299, "global_step": 78323, "epoch": 1864} {"train_loss": -6.1196441650390625, "global_step": 78324, "epoch": 1864} {"train_loss": -6.0779032707214355, "global_step": 78325, "epoch": 1864} {"train_loss": -6.292327404022217, "global_step": 78326, "epoch": 1864} {"train_loss": -6.0999555587768555, "global_step": 78327, "epoch": 1864} {"train_loss": -6.0641326904296875, "global_step": 78328, "epoch": 1864} {"train_loss": -6.0872032188233876, "global_step": 78329, "epoch": 1864, "val_loss": 67413.1875} {"train_loss": -6.206057071685791, "global_step": 78330, "epoch": 1865} {"train_loss": -6.081347465515137, "global_step": 78331, "epoch": 1865} {"train_loss": -6.13657808303833, "global_step": 78332, "epoch": 1865} {"train_loss": -6.048580169677734, "global_step": 78333, "epoch": 1865} {"train_loss": -6.115156173706055, "global_step": 78334, "epoch": 1865} {"train_loss": -6.164006233215332, "global_step": 78335, "epoch": 1865} {"train_loss": -6.115858554840088, "global_step": 78336, "epoch": 1865} {"train_loss": -6.080045700073242, "global_step": 78337, "epoch": 1865} {"train_loss": -6.132534027099609, "global_step": 78338, "epoch": 1865} {"train_loss": -6.104942321777344, "global_step": 78339, "epoch": 1865} {"train_loss": -6.185053825378418, "global_step": 78340, "epoch": 1865} {"train_loss": -6.086390018463135, "global_step": 78341, "epoch": 1865} {"train_loss": -6.10459041595459, "global_step": 78342, "epoch": 1865} {"train_loss": -6.137990474700928, "global_step": 78343, "epoch": 1865} {"train_loss": -6.112493991851807, "global_step": 78344, "epoch": 1865} {"train_loss": -6.10424280166626, "global_step": 78345, "epoch": 1865} {"train_loss": -6.092165946960449, "global_step": 78346, "epoch": 1865} {"train_loss": -6.228802680969238, "global_step": 78347, "epoch": 1865} {"train_loss": -6.196728706359863, "global_step": 78348, "epoch": 1865} {"train_loss": -6.2227067947387695, "global_step": 78349, "epoch": 1865} {"train_loss": -6.164023399353027, "global_step": 78350, "epoch": 1865} {"train_loss": -5.980093002319336, "global_step": 78351, "epoch": 1865} {"train_loss": -6.0625739097595215, "global_step": 78352, "epoch": 1865} {"train_loss": -6.11680793762207, "global_step": 78353, "epoch": 1865} {"train_loss": -6.020106792449951, "global_step": 78354, "epoch": 1865} {"train_loss": -6.073375225067139, "global_step": 78355, "epoch": 1865} {"train_loss": -6.055299282073975, "global_step": 78356, "epoch": 1865} {"train_loss": -6.0359392166137695, "global_step": 78357, "epoch": 1865} {"train_loss": -6.065431594848633, "global_step": 78358, "epoch": 1865} {"train_loss": -6.034733772277832, "global_step": 78359, "epoch": 1865} {"train_loss": -6.080647945404053, "global_step": 78360, "epoch": 1865} {"train_loss": -6.150978088378906, "global_step": 78361, "epoch": 1865} {"train_loss": -6.082054138183594, "global_step": 78362, "epoch": 1865} {"train_loss": -6.168274879455566, "global_step": 78363, "epoch": 1865} {"train_loss": -6.119114875793457, "global_step": 78364, "epoch": 1865} {"train_loss": -6.16564416885376, "global_step": 78365, "epoch": 1865} {"train_loss": -6.123011112213135, "global_step": 78366, "epoch": 1865} {"train_loss": -6.107625961303711, "global_step": 78367, "epoch": 1865} {"train_loss": -6.042074680328369, "global_step": 78368, "epoch": 1865} {"train_loss": -6.041121482849121, "global_step": 78369, "epoch": 1865} {"train_loss": -5.987590789794922, "global_step": 78370, "epoch": 1865} {"train_loss": -6.104115758623395, "global_step": 78371, "epoch": 1865, "val_loss": 67723.21875} {"train_loss": -5.969169616699219, "global_step": 78372, "epoch": 1866} {"train_loss": -6.044254779815674, "global_step": 78373, "epoch": 1866} {"train_loss": -6.122148513793945, "global_step": 78374, "epoch": 1866} {"train_loss": -6.088406562805176, "global_step": 78375, "epoch": 1866} {"train_loss": -6.160721778869629, "global_step": 78376, "epoch": 1866} {"train_loss": -6.062137603759766, "global_step": 78377, "epoch": 1866} {"train_loss": -6.036935806274414, "global_step": 78378, "epoch": 1866} {"train_loss": -6.105900764465332, "global_step": 78379, "epoch": 1866} {"train_loss": -6.070952415466309, "global_step": 78380, "epoch": 1866} {"train_loss": -6.155670642852783, "global_step": 78381, "epoch": 1866} {"train_loss": -6.147985935211182, "global_step": 78382, "epoch": 1866} {"train_loss": -6.144844055175781, "global_step": 78383, "epoch": 1866} {"train_loss": -6.013400077819824, "global_step": 78384, "epoch": 1866} {"train_loss": -5.985574245452881, "global_step": 78385, "epoch": 1866} {"train_loss": -6.007204055786133, "global_step": 78386, "epoch": 1866} {"train_loss": -5.9490814208984375, "global_step": 78387, "epoch": 1866} {"train_loss": -6.081308364868164, "global_step": 78388, "epoch": 1866} {"train_loss": -6.164915084838867, "global_step": 78389, "epoch": 1866} {"train_loss": -6.175795555114746, "global_step": 78390, "epoch": 1866} {"train_loss": -6.107024669647217, "global_step": 78391, "epoch": 1866} {"train_loss": -6.107696056365967, "global_step": 78392, "epoch": 1866} {"train_loss": -6.204300403594971, "global_step": 78393, "epoch": 1866} {"train_loss": -6.137139797210693, "global_step": 78394, "epoch": 1866} {"train_loss": -6.240611553192139, "global_step": 78395, "epoch": 1866} {"train_loss": -6.077925682067871, "global_step": 78396, "epoch": 1866} {"train_loss": -6.1325812339782715, "global_step": 78397, "epoch": 1866} {"train_loss": -6.098816871643066, "global_step": 78398, "epoch": 1866} {"train_loss": -6.013205051422119, "global_step": 78399, "epoch": 1866} {"train_loss": -6.231512069702148, "global_step": 78400, "epoch": 1866} {"train_loss": -5.944473743438721, "global_step": 78401, "epoch": 1866} {"train_loss": -6.0309014320373535, "global_step": 78402, "epoch": 1866} {"train_loss": -6.062933921813965, "global_step": 78403, "epoch": 1866} {"train_loss": -5.96728515625, "global_step": 78404, "epoch": 1866} {"train_loss": -6.091312408447266, "global_step": 78405, "epoch": 1866} {"train_loss": -6.018912315368652, "global_step": 78406, "epoch": 1866} {"train_loss": -6.030289649963379, "global_step": 78407, "epoch": 1866} {"train_loss": -6.1044440269470215, "global_step": 78408, "epoch": 1866} {"train_loss": -6.1232075691223145, "global_step": 78409, "epoch": 1866} {"train_loss": -6.085258960723877, "global_step": 78410, "epoch": 1866} {"train_loss": -6.006619930267334, "global_step": 78411, "epoch": 1866} {"train_loss": -6.025128364562988, "global_step": 78412, "epoch": 1866} {"train_loss": -6.0835519064040415, "global_step": 78413, "epoch": 1866, "val_loss": 67604.296875} {"train_loss": -5.939373970031738, "global_step": 78414, "epoch": 1867} {"train_loss": -6.123392581939697, "global_step": 78415, "epoch": 1867} {"train_loss": -6.031650066375732, "global_step": 78416, "epoch": 1867} {"train_loss": -5.960780143737793, "global_step": 78417, "epoch": 1867} {"train_loss": -6.030965328216553, "global_step": 78418, "epoch": 1867} {"train_loss": -6.1738762855529785, "global_step": 78419, "epoch": 1867} {"train_loss": -6.05851936340332, "global_step": 78420, "epoch": 1867} {"train_loss": -6.1047868728637695, "global_step": 78421, "epoch": 1867} {"train_loss": -6.202804088592529, "global_step": 78422, "epoch": 1867} {"train_loss": -5.985283374786377, "global_step": 78423, "epoch": 1867} {"train_loss": -5.99787712097168, "global_step": 78424, "epoch": 1867} {"train_loss": -6.124771595001221, "global_step": 78425, "epoch": 1867} {"train_loss": -6.085688591003418, "global_step": 78426, "epoch": 1867} {"train_loss": -5.978399276733398, "global_step": 78427, "epoch": 1867} {"train_loss": -6.100709915161133, "global_step": 78428, "epoch": 1867} {"train_loss": -6.05772066116333, "global_step": 78429, "epoch": 1867} {"train_loss": -5.973512649536133, "global_step": 78430, "epoch": 1867} {"train_loss": -6.0750555992126465, "global_step": 78431, "epoch": 1867} {"train_loss": -6.113636016845703, "global_step": 78432, "epoch": 1867} {"train_loss": -6.089798927307129, "global_step": 78433, "epoch": 1867} {"train_loss": -6.10984992980957, "global_step": 78434, "epoch": 1867} {"train_loss": -6.178177833557129, "global_step": 78435, "epoch": 1867} {"train_loss": -6.184744834899902, "global_step": 78436, "epoch": 1867} {"train_loss": -6.092389106750488, "global_step": 78437, "epoch": 1867} {"train_loss": -6.087467670440674, "global_step": 78438, "epoch": 1867} {"train_loss": -6.080878257751465, "global_step": 78439, "epoch": 1867} {"train_loss": -6.063728332519531, "global_step": 78440, "epoch": 1867} {"train_loss": -5.993183135986328, "global_step": 78441, "epoch": 1867} {"train_loss": -6.0409698486328125, "global_step": 78442, "epoch": 1867} {"train_loss": -5.9400129318237305, "global_step": 78443, "epoch": 1867} {"train_loss": -6.08276891708374, "global_step": 78444, "epoch": 1867} {"train_loss": -5.894189834594727, "global_step": 78445, "epoch": 1867} {"train_loss": -6.067170143127441, "global_step": 78446, "epoch": 1867} {"train_loss": -5.960038185119629, "global_step": 78447, "epoch": 1867} {"train_loss": -6.189347743988037, "global_step": 78448, "epoch": 1867} {"train_loss": -6.055272579193115, "global_step": 78449, "epoch": 1867} {"train_loss": -5.994034767150879, "global_step": 78450, "epoch": 1867} {"train_loss": -6.090814590454102, "global_step": 78451, "epoch": 1867} {"train_loss": -6.039851188659668, "global_step": 78452, "epoch": 1867} {"train_loss": -6.031563758850098, "global_step": 78453, "epoch": 1867} {"train_loss": -6.041393280029297, "global_step": 78454, "epoch": 1867} {"train_loss": -6.06196802003043, "global_step": 78455, "epoch": 1867, "val_loss": 67626.484375} {"train_loss": -6.185196876525879, "global_step": 78456, "epoch": 1868} {"train_loss": -6.120201110839844, "global_step": 78457, "epoch": 1868} {"train_loss": -6.166904449462891, "global_step": 78458, "epoch": 1868} {"train_loss": -6.021477699279785, "global_step": 78459, "epoch": 1868} {"train_loss": -6.081119537353516, "global_step": 78460, "epoch": 1868} {"train_loss": -6.175650596618652, "global_step": 78461, "epoch": 1868} {"train_loss": -5.989914417266846, "global_step": 78462, "epoch": 1868} {"train_loss": -6.056939125061035, "global_step": 78463, "epoch": 1868} {"train_loss": -6.010137557983398, "global_step": 78464, "epoch": 1868} {"train_loss": -6.167585372924805, "global_step": 78465, "epoch": 1868} {"train_loss": -5.965312957763672, "global_step": 78466, "epoch": 1868} {"train_loss": -6.020628929138184, "global_step": 78467, "epoch": 1868} {"train_loss": -6.204000473022461, "global_step": 78468, "epoch": 1868} {"train_loss": -5.992390155792236, "global_step": 78469, "epoch": 1868} {"train_loss": -6.069468021392822, "global_step": 78470, "epoch": 1868} {"train_loss": -6.0496296882629395, "global_step": 78471, "epoch": 1868} {"train_loss": -6.158782005310059, "global_step": 78472, "epoch": 1868} {"train_loss": -6.090440273284912, "global_step": 78473, "epoch": 1868} {"train_loss": -6.145139694213867, "global_step": 78474, "epoch": 1868} {"train_loss": -6.046329021453857, "global_step": 78475, "epoch": 1868} {"train_loss": -6.198757648468018, "global_step": 78476, "epoch": 1868} {"train_loss": -6.131539344787598, "global_step": 78477, "epoch": 1868} {"train_loss": -6.114075660705566, "global_step": 78478, "epoch": 1868} {"train_loss": -6.092341423034668, "global_step": 78479, "epoch": 1868} {"train_loss": -6.1571044921875, "global_step": 78480, "epoch": 1868} {"train_loss": -6.193083763122559, "global_step": 78481, "epoch": 1868} {"train_loss": -6.005164623260498, "global_step": 78482, "epoch": 1868} {"train_loss": -6.134186744689941, "global_step": 78483, "epoch": 1868} {"train_loss": -6.124776363372803, "global_step": 78484, "epoch": 1868} {"train_loss": -6.113263130187988, "global_step": 78485, "epoch": 1868} {"train_loss": -6.083592414855957, "global_step": 78486, "epoch": 1868} {"train_loss": -6.121554374694824, "global_step": 78487, "epoch": 1868} {"train_loss": -6.12468147277832, "global_step": 78488, "epoch": 1868} {"train_loss": -6.076882839202881, "global_step": 78489, "epoch": 1868} {"train_loss": -6.183930397033691, "global_step": 78490, "epoch": 1868} {"train_loss": -6.199953556060791, "global_step": 78491, "epoch": 1868} {"train_loss": -6.125690460205078, "global_step": 78492, "epoch": 1868} {"train_loss": -6.12640380859375, "global_step": 78493, "epoch": 1868} {"train_loss": -6.02994966506958, "global_step": 78494, "epoch": 1868} {"train_loss": -5.972629547119141, "global_step": 78495, "epoch": 1868} {"train_loss": -6.177769660949707, "global_step": 78496, "epoch": 1868} {"train_loss": -6.100986185527983, "global_step": 78497, "epoch": 1868, "val_loss": 67596.5859375} {"train_loss": -6.078522682189941, "global_step": 78498, "epoch": 1869} {"train_loss": -6.013578414916992, "global_step": 78499, "epoch": 1869} {"train_loss": -6.189811706542969, "global_step": 78500, "epoch": 1869} {"train_loss": -6.138968467712402, "global_step": 78501, "epoch": 1869} {"train_loss": -6.1737961769104, "global_step": 78502, "epoch": 1869} {"train_loss": -6.160869598388672, "global_step": 78503, "epoch": 1869} {"train_loss": -6.040841579437256, "global_step": 78504, "epoch": 1869} {"train_loss": -6.165966510772705, "global_step": 78505, "epoch": 1869} {"train_loss": -6.089982032775879, "global_step": 78506, "epoch": 1869} {"train_loss": -6.177994728088379, "global_step": 78507, "epoch": 1869} {"train_loss": -6.091485977172852, "global_step": 78508, "epoch": 1869} {"train_loss": -6.108782768249512, "global_step": 78509, "epoch": 1869} {"train_loss": -6.201084136962891, "global_step": 78510, "epoch": 1869} {"train_loss": -6.07744026184082, "global_step": 78511, "epoch": 1869} {"train_loss": -6.183019638061523, "global_step": 78512, "epoch": 1869} {"train_loss": -6.0923967361450195, "global_step": 78513, "epoch": 1869} {"train_loss": -6.207353591918945, "global_step": 78514, "epoch": 1869} {"train_loss": -6.174606800079346, "global_step": 78515, "epoch": 1869} {"train_loss": -6.022672653198242, "global_step": 78516, "epoch": 1869} {"train_loss": -6.1072998046875, "global_step": 78517, "epoch": 1869} {"train_loss": -5.980469703674316, "global_step": 78518, "epoch": 1869} {"train_loss": -6.112185955047607, "global_step": 78519, "epoch": 1869} {"train_loss": -6.175440788269043, "global_step": 78520, "epoch": 1869} {"train_loss": -6.094036102294922, "global_step": 78521, "epoch": 1869} {"train_loss": -6.025723934173584, "global_step": 78522, "epoch": 1869} {"train_loss": -6.166675567626953, "global_step": 78523, "epoch": 1869} {"train_loss": -6.058375358581543, "global_step": 78524, "epoch": 1869} {"train_loss": -6.041701316833496, "global_step": 78525, "epoch": 1869} {"train_loss": -6.173120498657227, "global_step": 78526, "epoch": 1869} {"train_loss": -6.016592979431152, "global_step": 78527, "epoch": 1869} {"train_loss": -6.1432952880859375, "global_step": 78528, "epoch": 1869} {"train_loss": -6.105679988861084, "global_step": 78529, "epoch": 1869} {"train_loss": -5.9509124755859375, "global_step": 78530, "epoch": 1869} {"train_loss": -6.181602478027344, "global_step": 78531, "epoch": 1869} {"train_loss": -5.9982805252075195, "global_step": 78532, "epoch": 1869} {"train_loss": -6.0461530685424805, "global_step": 78533, "epoch": 1869} {"train_loss": -6.104486465454102, "global_step": 78534, "epoch": 1869} {"train_loss": -6.093466758728027, "global_step": 78535, "epoch": 1869} {"train_loss": -6.102978706359863, "global_step": 78536, "epoch": 1869} {"train_loss": -6.046436786651611, "global_step": 78537, "epoch": 1869} {"train_loss": -6.12416410446167, "global_step": 78538, "epoch": 1869} {"train_loss": -6.101355643499465, "global_step": 78539, "epoch": 1869, "val_loss": 67552.5859375} {"train_loss": -6.1903605461120605, "global_step": 78540, "epoch": 1870} {"train_loss": -6.067086219787598, "global_step": 78541, "epoch": 1870} {"train_loss": -6.122139930725098, "global_step": 78542, "epoch": 1870} {"train_loss": -6.183601379394531, "global_step": 78543, "epoch": 1870} {"train_loss": -6.096547603607178, "global_step": 78544, "epoch": 1870} {"train_loss": -6.218803405761719, "global_step": 78545, "epoch": 1870} {"train_loss": -6.1081624031066895, "global_step": 78546, "epoch": 1870} {"train_loss": -6.143561363220215, "global_step": 78547, "epoch": 1870} {"train_loss": -6.0847272872924805, "global_step": 78548, "epoch": 1870} {"train_loss": -6.132778167724609, "global_step": 78549, "epoch": 1870} {"train_loss": -6.183414936065674, "global_step": 78550, "epoch": 1870} {"train_loss": -6.107203483581543, "global_step": 78551, "epoch": 1870} {"train_loss": -6.125303268432617, "global_step": 78552, "epoch": 1870} {"train_loss": -6.070098876953125, "global_step": 78553, "epoch": 1870} {"train_loss": -6.036054611206055, "global_step": 78554, "epoch": 1870} {"train_loss": -6.161805629730225, "global_step": 78555, "epoch": 1870} {"train_loss": -6.123694896697998, "global_step": 78556, "epoch": 1870} {"train_loss": -6.081377983093262, "global_step": 78557, "epoch": 1870} {"train_loss": -6.067795753479004, "global_step": 78558, "epoch": 1870} {"train_loss": -5.990428447723389, "global_step": 78559, "epoch": 1870} {"train_loss": -6.066872596740723, "global_step": 78560, "epoch": 1870} {"train_loss": -6.133047103881836, "global_step": 78561, "epoch": 1870} {"train_loss": -6.09475564956665, "global_step": 78562, "epoch": 1870} {"train_loss": -6.056515216827393, "global_step": 78563, "epoch": 1870} {"train_loss": -6.098973751068115, "global_step": 78564, "epoch": 1870} {"train_loss": -6.129075050354004, "global_step": 78565, "epoch": 1870} {"train_loss": -6.137330055236816, "global_step": 78566, "epoch": 1870} {"train_loss": -6.234150409698486, "global_step": 78567, "epoch": 1870} {"train_loss": -6.1798095703125, "global_step": 78568, "epoch": 1870} {"train_loss": -6.096697807312012, "global_step": 78569, "epoch": 1870} {"train_loss": -6.091917514801025, "global_step": 78570, "epoch": 1870} {"train_loss": -6.183993339538574, "global_step": 78571, "epoch": 1870} {"train_loss": -6.254408359527588, "global_step": 78572, "epoch": 1870} {"train_loss": -6.1201066970825195, "global_step": 78573, "epoch": 1870} {"train_loss": -6.108747482299805, "global_step": 78574, "epoch": 1870} {"train_loss": -6.043840408325195, "global_step": 78575, "epoch": 1870} {"train_loss": -6.209865570068359, "global_step": 78576, "epoch": 1870} {"train_loss": -6.046152114868164, "global_step": 78577, "epoch": 1870} {"train_loss": -6.035849094390869, "global_step": 78578, "epoch": 1870} {"train_loss": -6.079345703125, "global_step": 78579, "epoch": 1870} {"train_loss": -6.051002025604248, "global_step": 78580, "epoch": 1870} {"train_loss": -6.116810026622954, "global_step": 78581, "epoch": 1870, "val_loss": 67787.453125} {"train_loss": -6.180447578430176, "global_step": 78582, "epoch": 1871} {"train_loss": -6.1151814460754395, "global_step": 78583, "epoch": 1871} {"train_loss": -6.207776069641113, "global_step": 78584, "epoch": 1871} {"train_loss": -6.0508317947387695, "global_step": 78585, "epoch": 1871} {"train_loss": -6.158361434936523, "global_step": 78586, "epoch": 1871} {"train_loss": -6.160033226013184, "global_step": 78587, "epoch": 1871} {"train_loss": -6.222468376159668, "global_step": 78588, "epoch": 1871} {"train_loss": -6.10377311706543, "global_step": 78589, "epoch": 1871} {"train_loss": -6.011754035949707, "global_step": 78590, "epoch": 1871} {"train_loss": -5.97520637512207, "global_step": 78591, "epoch": 1871} {"train_loss": -6.138161659240723, "global_step": 78592, "epoch": 1871} {"train_loss": -6.1357598304748535, "global_step": 78593, "epoch": 1871} {"train_loss": -6.031970977783203, "global_step": 78594, "epoch": 1871} {"train_loss": -6.222501754760742, "global_step": 78595, "epoch": 1871} {"train_loss": -6.068201065063477, "global_step": 78596, "epoch": 1871} {"train_loss": -6.11102819442749, "global_step": 78597, "epoch": 1871} {"train_loss": -6.03154182434082, "global_step": 78598, "epoch": 1871} {"train_loss": -5.976308345794678, "global_step": 78599, "epoch": 1871} {"train_loss": -6.159438133239746, "global_step": 78600, "epoch": 1871} {"train_loss": -5.960747718811035, "global_step": 78601, "epoch": 1871} {"train_loss": -6.131951332092285, "global_step": 78602, "epoch": 1871} {"train_loss": -6.081040382385254, "global_step": 78603, "epoch": 1871} {"train_loss": -6.150201320648193, "global_step": 78604, "epoch": 1871} {"train_loss": -6.167072296142578, "global_step": 78605, "epoch": 1871} {"train_loss": -6.071459770202637, "global_step": 78606, "epoch": 1871} {"train_loss": -5.989984512329102, "global_step": 78607, "epoch": 1871} {"train_loss": -6.100612640380859, "global_step": 78608, "epoch": 1871} {"train_loss": -6.154590606689453, "global_step": 78609, "epoch": 1871} {"train_loss": -6.000176429748535, "global_step": 78610, "epoch": 1871} {"train_loss": -6.2390899658203125, "global_step": 78611, "epoch": 1871} {"train_loss": -6.051807880401611, "global_step": 78612, "epoch": 1871} {"train_loss": -6.0262837409973145, "global_step": 78613, "epoch": 1871} {"train_loss": -6.106173038482666, "global_step": 78614, "epoch": 1871} {"train_loss": -6.10138463973999, "global_step": 78615, "epoch": 1871} {"train_loss": -6.0474395751953125, "global_step": 78616, "epoch": 1871} {"train_loss": -6.03195858001709, "global_step": 78617, "epoch": 1871} {"train_loss": -6.056278228759766, "global_step": 78618, "epoch": 1871} {"train_loss": -6.128862380981445, "global_step": 78619, "epoch": 1871} {"train_loss": -6.07785177230835, "global_step": 78620, "epoch": 1871} {"train_loss": -6.1443586349487305, "global_step": 78621, "epoch": 1871} {"train_loss": -6.109444618225098, "global_step": 78622, "epoch": 1871} {"train_loss": -6.096569583529518, "global_step": 78623, "epoch": 1871, "val_loss": 67629.9375} {"train_loss": -6.155663013458252, "global_step": 78624, "epoch": 1872} {"train_loss": -6.190914630889893, "global_step": 78625, "epoch": 1872} {"train_loss": -6.136448383331299, "global_step": 78626, "epoch": 1872} {"train_loss": -6.095783233642578, "global_step": 78627, "epoch": 1872} {"train_loss": -6.154292106628418, "global_step": 78628, "epoch": 1872} {"train_loss": -6.032114505767822, "global_step": 78629, "epoch": 1872} {"train_loss": -6.105783462524414, "global_step": 78630, "epoch": 1872} {"train_loss": -6.105039596557617, "global_step": 78631, "epoch": 1872} {"train_loss": -6.119494438171387, "global_step": 78632, "epoch": 1872} {"train_loss": -5.964135646820068, "global_step": 78633, "epoch": 1872} {"train_loss": -5.983673095703125, "global_step": 78634, "epoch": 1872} {"train_loss": -6.176738739013672, "global_step": 78635, "epoch": 1872} {"train_loss": -6.049308776855469, "global_step": 78636, "epoch": 1872} {"train_loss": -6.246435642242432, "global_step": 78637, "epoch": 1872} {"train_loss": -6.113944053649902, "global_step": 78638, "epoch": 1872} {"train_loss": -6.008988380432129, "global_step": 78639, "epoch": 1872} {"train_loss": -6.088319778442383, "global_step": 78640, "epoch": 1872} {"train_loss": -6.0676398277282715, "global_step": 78641, "epoch": 1872} {"train_loss": -6.140767574310303, "global_step": 78642, "epoch": 1872} {"train_loss": -6.076784133911133, "global_step": 78643, "epoch": 1872} {"train_loss": -6.086285591125488, "global_step": 78644, "epoch": 1872} {"train_loss": -6.119083404541016, "global_step": 78645, "epoch": 1872} {"train_loss": -6.0530548095703125, "global_step": 78646, "epoch": 1872} {"train_loss": -6.1168928146362305, "global_step": 78647, "epoch": 1872} {"train_loss": -6.220086097717285, "global_step": 78648, "epoch": 1872} {"train_loss": -6.112842082977295, "global_step": 78649, "epoch": 1872} {"train_loss": -6.03975248336792, "global_step": 78650, "epoch": 1872} {"train_loss": -6.125262260437012, "global_step": 78651, "epoch": 1872} {"train_loss": -6.076106071472168, "global_step": 78652, "epoch": 1872} {"train_loss": -6.142065048217773, "global_step": 78653, "epoch": 1872} {"train_loss": -6.276912689208984, "global_step": 78654, "epoch": 1872} {"train_loss": -6.224698543548584, "global_step": 78655, "epoch": 1872} {"train_loss": -6.061816215515137, "global_step": 78656, "epoch": 1872} {"train_loss": -6.2204179763793945, "global_step": 78657, "epoch": 1872} {"train_loss": -6.21598482131958, "global_step": 78658, "epoch": 1872} {"train_loss": -6.170278549194336, "global_step": 78659, "epoch": 1872} {"train_loss": -6.223484992980957, "global_step": 78660, "epoch": 1872} {"train_loss": -6.165431976318359, "global_step": 78661, "epoch": 1872} {"train_loss": -6.217707633972168, "global_step": 78662, "epoch": 1872} {"train_loss": -6.094025135040283, "global_step": 78663, "epoch": 1872} {"train_loss": -6.086442470550537, "global_step": 78664, "epoch": 1872} {"train_loss": -6.121073018936884, "global_step": 78665, "epoch": 1872, "val_loss": 67520.578125} {"train_loss": -6.035802364349365, "global_step": 78666, "epoch": 1873} {"train_loss": -6.119353771209717, "global_step": 78667, "epoch": 1873} {"train_loss": -6.247427463531494, "global_step": 78668, "epoch": 1873} {"train_loss": -6.07469367980957, "global_step": 78669, "epoch": 1873} {"train_loss": -6.06581449508667, "global_step": 78670, "epoch": 1873} {"train_loss": -6.186392784118652, "global_step": 78671, "epoch": 1873} {"train_loss": -6.252270698547363, "global_step": 78672, "epoch": 1873} {"train_loss": -6.121589660644531, "global_step": 78673, "epoch": 1873} {"train_loss": -6.089084625244141, "global_step": 78674, "epoch": 1873} {"train_loss": -6.03253173828125, "global_step": 78675, "epoch": 1873} {"train_loss": -6.138410568237305, "global_step": 78676, "epoch": 1873} {"train_loss": -6.178592681884766, "global_step": 78677, "epoch": 1873} {"train_loss": -6.083406448364258, "global_step": 78678, "epoch": 1873} {"train_loss": -6.101898193359375, "global_step": 78679, "epoch": 1873} {"train_loss": -6.184086799621582, "global_step": 78680, "epoch": 1873} {"train_loss": -6.219194412231445, "global_step": 78681, "epoch": 1873} {"train_loss": -6.0745849609375, "global_step": 78682, "epoch": 1873} {"train_loss": -6.195493698120117, "global_step": 78683, "epoch": 1873} {"train_loss": -6.084205627441406, "global_step": 78684, "epoch": 1873} {"train_loss": -6.192795753479004, "global_step": 78685, "epoch": 1873} {"train_loss": -6.095439910888672, "global_step": 78686, "epoch": 1873} {"train_loss": -6.0900421142578125, "global_step": 78687, "epoch": 1873} {"train_loss": -6.1510725021362305, "global_step": 78688, "epoch": 1873} {"train_loss": -6.02226448059082, "global_step": 78689, "epoch": 1873} {"train_loss": -6.196601390838623, "global_step": 78690, "epoch": 1873} {"train_loss": -5.940756320953369, "global_step": 78691, "epoch": 1873} {"train_loss": -6.117733955383301, "global_step": 78692, "epoch": 1873} {"train_loss": -6.02639627456665, "global_step": 78693, "epoch": 1873} {"train_loss": -6.154755592346191, "global_step": 78694, "epoch": 1873} {"train_loss": -6.0795698165893555, "global_step": 78695, "epoch": 1873} {"train_loss": -6.099621772766113, "global_step": 78696, "epoch": 1873} {"train_loss": -6.11782693862915, "global_step": 78697, "epoch": 1873} {"train_loss": -5.949112892150879, "global_step": 78698, "epoch": 1873} {"train_loss": -6.09083366394043, "global_step": 78699, "epoch": 1873} {"train_loss": -6.0015482902526855, "global_step": 78700, "epoch": 1873} {"train_loss": -6.148052215576172, "global_step": 78701, "epoch": 1873} {"train_loss": -6.159344673156738, "global_step": 78702, "epoch": 1873} {"train_loss": -6.072344779968262, "global_step": 78703, "epoch": 1873} {"train_loss": -6.0616774559021, "global_step": 78704, "epoch": 1873} {"train_loss": -6.040573596954346, "global_step": 78705, "epoch": 1873} {"train_loss": -6.112709045410156, "global_step": 78706, "epoch": 1873} {"train_loss": -6.1055451801845, "global_step": 78707, "epoch": 1873, "val_loss": 67676.6640625} {"train_loss": -6.132154941558838, "global_step": 78708, "epoch": 1874} {"train_loss": -6.177999019622803, "global_step": 78709, "epoch": 1874} {"train_loss": -6.199819564819336, "global_step": 78710, "epoch": 1874} {"train_loss": -6.210820198059082, "global_step": 78711, "epoch": 1874} {"train_loss": -6.091520309448242, "global_step": 78712, "epoch": 1874} {"train_loss": -6.1810526847839355, "global_step": 78713, "epoch": 1874} {"train_loss": -6.195828437805176, "global_step": 78714, "epoch": 1874} {"train_loss": -6.211181640625, "global_step": 78715, "epoch": 1874} {"train_loss": -6.153947830200195, "global_step": 78716, "epoch": 1874} {"train_loss": -6.100486755371094, "global_step": 78717, "epoch": 1874} {"train_loss": -6.108245849609375, "global_step": 78718, "epoch": 1874} {"train_loss": -6.03361177444458, "global_step": 78719, "epoch": 1874} {"train_loss": -6.215905666351318, "global_step": 78720, "epoch": 1874} {"train_loss": -6.05559778213501, "global_step": 78721, "epoch": 1874} {"train_loss": -6.148481369018555, "global_step": 78722, "epoch": 1874} {"train_loss": -6.127536773681641, "global_step": 78723, "epoch": 1874} {"train_loss": -6.136263847351074, "global_step": 78724, "epoch": 1874} {"train_loss": -6.066096305847168, "global_step": 78725, "epoch": 1874} {"train_loss": -6.272228240966797, "global_step": 78726, "epoch": 1874} {"train_loss": -6.1361002922058105, "global_step": 78727, "epoch": 1874} {"train_loss": -6.129626750946045, "global_step": 78728, "epoch": 1874} {"train_loss": -6.184846878051758, "global_step": 78729, "epoch": 1874} {"train_loss": -6.018152236938477, "global_step": 78730, "epoch": 1874} {"train_loss": -6.144296646118164, "global_step": 78731, "epoch": 1874} {"train_loss": -6.137755393981934, "global_step": 78732, "epoch": 1874} {"train_loss": -6.157456398010254, "global_step": 78733, "epoch": 1874} {"train_loss": -6.120975494384766, "global_step": 78734, "epoch": 1874} {"train_loss": -6.150944709777832, "global_step": 78735, "epoch": 1874} {"train_loss": -6.203604698181152, "global_step": 78736, "epoch": 1874} {"train_loss": -6.053116321563721, "global_step": 78737, "epoch": 1874} {"train_loss": -6.045512676239014, "global_step": 78738, "epoch": 1874} {"train_loss": -6.148667812347412, "global_step": 78739, "epoch": 1874} {"train_loss": -5.958332061767578, "global_step": 78740, "epoch": 1874} {"train_loss": -6.010101795196533, "global_step": 78741, "epoch": 1874} {"train_loss": -5.983520984649658, "global_step": 78742, "epoch": 1874} {"train_loss": -6.053398132324219, "global_step": 78743, "epoch": 1874} {"train_loss": -6.026979446411133, "global_step": 78744, "epoch": 1874} {"train_loss": -6.039908409118652, "global_step": 78745, "epoch": 1874} {"train_loss": -6.054018020629883, "global_step": 78746, "epoch": 1874} {"train_loss": -6.063476085662842, "global_step": 78747, "epoch": 1874} {"train_loss": -6.030014514923096, "global_step": 78748, "epoch": 1874} {"train_loss": -6.1089907714298795, "global_step": 78749, "epoch": 1874, "val_loss": 67438.7890625} {"train_loss": -6.125068664550781, "global_step": 78750, "epoch": 1875} {"train_loss": -5.980107307434082, "global_step": 78751, "epoch": 1875} {"train_loss": -6.16281795501709, "global_step": 78752, "epoch": 1875} {"train_loss": -5.961270332336426, "global_step": 78753, "epoch": 1875} {"train_loss": -6.007633209228516, "global_step": 78754, "epoch": 1875} {"train_loss": -6.098797798156738, "global_step": 78755, "epoch": 1875} {"train_loss": -5.991546630859375, "global_step": 78756, "epoch": 1875} {"train_loss": -6.007573127746582, "global_step": 78757, "epoch": 1875} {"train_loss": -6.04243278503418, "global_step": 78758, "epoch": 1875} {"train_loss": -6.113712787628174, "global_step": 78759, "epoch": 1875} {"train_loss": -6.145443916320801, "global_step": 78760, "epoch": 1875} {"train_loss": -6.159442901611328, "global_step": 78761, "epoch": 1875} {"train_loss": -6.105169296264648, "global_step": 78762, "epoch": 1875} {"train_loss": -6.0317301750183105, "global_step": 78763, "epoch": 1875} {"train_loss": -5.939729690551758, "global_step": 78764, "epoch": 1875} {"train_loss": -6.145341873168945, "global_step": 78765, "epoch": 1875} {"train_loss": -5.923970699310303, "global_step": 78766, "epoch": 1875} {"train_loss": -5.905503273010254, "global_step": 78767, "epoch": 1875} {"train_loss": -5.93625545501709, "global_step": 78768, "epoch": 1875} {"train_loss": -5.960780620574951, "global_step": 78769, "epoch": 1875} {"train_loss": -6.15560245513916, "global_step": 78770, "epoch": 1875} {"train_loss": -6.065359115600586, "global_step": 78771, "epoch": 1875} {"train_loss": -6.210604667663574, "global_step": 78772, "epoch": 1875} {"train_loss": -6.1889328956604, "global_step": 78773, "epoch": 1875} {"train_loss": -6.201108455657959, "global_step": 78774, "epoch": 1875} {"train_loss": -6.249156951904297, "global_step": 78775, "epoch": 1875} {"train_loss": -6.186765670776367, "global_step": 78776, "epoch": 1875} {"train_loss": -6.14080286026001, "global_step": 78777, "epoch": 1875} {"train_loss": -6.19852352142334, "global_step": 78778, "epoch": 1875} {"train_loss": -6.0934977531433105, "global_step": 78779, "epoch": 1875} {"train_loss": -6.1110734939575195, "global_step": 78780, "epoch": 1875} {"train_loss": -6.152841567993164, "global_step": 78781, "epoch": 1875} {"train_loss": -6.12221622467041, "global_step": 78782, "epoch": 1875} {"train_loss": -6.1206817626953125, "global_step": 78783, "epoch": 1875} {"train_loss": -6.171815872192383, "global_step": 78784, "epoch": 1875} {"train_loss": -6.045155048370361, "global_step": 78785, "epoch": 1875} {"train_loss": -6.054507732391357, "global_step": 78786, "epoch": 1875} {"train_loss": -6.123969554901123, "global_step": 78787, "epoch": 1875} {"train_loss": -6.061190128326416, "global_step": 78788, "epoch": 1875} {"train_loss": -6.069069862365723, "global_step": 78789, "epoch": 1875} {"train_loss": -6.11257266998291, "global_step": 78790, "epoch": 1875} {"train_loss": -6.089695101692563, "global_step": 78791, "epoch": 1875, "val_loss": 67547.9921875} {"train_loss": -6.157576084136963, "global_step": 78792, "epoch": 1876} {"train_loss": -6.110740661621094, "global_step": 78793, "epoch": 1876} {"train_loss": -6.187801837921143, "global_step": 78794, "epoch": 1876} {"train_loss": -6.139074325561523, "global_step": 78795, "epoch": 1876} {"train_loss": -6.141878128051758, "global_step": 78796, "epoch": 1876} {"train_loss": -6.183056354522705, "global_step": 78797, "epoch": 1876} {"train_loss": -6.1906046867370605, "global_step": 78798, "epoch": 1876} {"train_loss": -6.111438751220703, "global_step": 78799, "epoch": 1876} {"train_loss": -6.087887763977051, "global_step": 78800, "epoch": 1876} {"train_loss": -6.125629425048828, "global_step": 78801, "epoch": 1876} {"train_loss": -6.079394340515137, "global_step": 78802, "epoch": 1876} {"train_loss": -6.0867486000061035, "global_step": 78803, "epoch": 1876} {"train_loss": -6.123598098754883, "global_step": 78804, "epoch": 1876} {"train_loss": -6.10243558883667, "global_step": 78805, "epoch": 1876} {"train_loss": -6.151666641235352, "global_step": 78806, "epoch": 1876} {"train_loss": -6.097958564758301, "global_step": 78807, "epoch": 1876} {"train_loss": -6.072673320770264, "global_step": 78808, "epoch": 1876} {"train_loss": -6.200659275054932, "global_step": 78809, "epoch": 1876} {"train_loss": -5.979763984680176, "global_step": 78810, "epoch": 1876} {"train_loss": -6.154197692871094, "global_step": 78811, "epoch": 1876} {"train_loss": -6.159402847290039, "global_step": 78812, "epoch": 1876} {"train_loss": -6.032654762268066, "global_step": 78813, "epoch": 1876} {"train_loss": -6.155420780181885, "global_step": 78814, "epoch": 1876} {"train_loss": -6.028841018676758, "global_step": 78815, "epoch": 1876} {"train_loss": -5.983356475830078, "global_step": 78816, "epoch": 1876} {"train_loss": -6.169747352600098, "global_step": 78817, "epoch": 1876} {"train_loss": -6.115377426147461, "global_step": 78818, "epoch": 1876} {"train_loss": -6.010357856750488, "global_step": 78819, "epoch": 1876} {"train_loss": -6.066856384277344, "global_step": 78820, "epoch": 1876} {"train_loss": -6.034880638122559, "global_step": 78821, "epoch": 1876} {"train_loss": -6.198537826538086, "global_step": 78822, "epoch": 1876} {"train_loss": -6.116888999938965, "global_step": 78823, "epoch": 1876} {"train_loss": -6.119849681854248, "global_step": 78824, "epoch": 1876} {"train_loss": -6.026790142059326, "global_step": 78825, "epoch": 1876} {"train_loss": -6.075596809387207, "global_step": 78826, "epoch": 1876} {"train_loss": -6.046148300170898, "global_step": 78827, "epoch": 1876} {"train_loss": -6.20088529586792, "global_step": 78828, "epoch": 1876} {"train_loss": -6.13468074798584, "global_step": 78829, "epoch": 1876} {"train_loss": -6.117300510406494, "global_step": 78830, "epoch": 1876} {"train_loss": -6.109768867492676, "global_step": 78831, "epoch": 1876} {"train_loss": -6.186932563781738, "global_step": 78832, "epoch": 1876} {"train_loss": -6.1130209763844805, "global_step": 78833, "epoch": 1876, "val_loss": 67553.3203125} {"train_loss": -6.114016532897949, "global_step": 78834, "epoch": 1877} {"train_loss": -6.144457817077637, "global_step": 78835, "epoch": 1877} {"train_loss": -6.091582298278809, "global_step": 78836, "epoch": 1877} {"train_loss": -6.193563461303711, "global_step": 78837, "epoch": 1877} {"train_loss": -6.15329122543335, "global_step": 78838, "epoch": 1877} {"train_loss": -6.061054229736328, "global_step": 78839, "epoch": 1877} {"train_loss": -6.155978679656982, "global_step": 78840, "epoch": 1877} {"train_loss": -6.039589881896973, "global_step": 78841, "epoch": 1877} {"train_loss": -6.180016040802002, "global_step": 78842, "epoch": 1877} {"train_loss": -6.181075096130371, "global_step": 78843, "epoch": 1877} {"train_loss": -6.061675071716309, "global_step": 78844, "epoch": 1877} {"train_loss": -6.108162879943848, "global_step": 78845, "epoch": 1877} {"train_loss": -6.124014377593994, "global_step": 78846, "epoch": 1877} {"train_loss": -6.153993606567383, "global_step": 78847, "epoch": 1877} {"train_loss": -6.2077317237854, "global_step": 78848, "epoch": 1877} {"train_loss": -6.07233190536499, "global_step": 78849, "epoch": 1877} {"train_loss": -6.0111799240112305, "global_step": 78850, "epoch": 1877} {"train_loss": -6.122747898101807, "global_step": 78851, "epoch": 1877} {"train_loss": -6.078814506530762, "global_step": 78852, "epoch": 1877} {"train_loss": -6.122933387756348, "global_step": 78853, "epoch": 1877} {"train_loss": -6.177026271820068, "global_step": 78854, "epoch": 1877} {"train_loss": -6.110843658447266, "global_step": 78855, "epoch": 1877} {"train_loss": -6.04866886138916, "global_step": 78856, "epoch": 1877} {"train_loss": -6.144953727722168, "global_step": 78857, "epoch": 1877} {"train_loss": -6.137659072875977, "global_step": 78858, "epoch": 1877} {"train_loss": -6.127864837646484, "global_step": 78859, "epoch": 1877} {"train_loss": -6.027162551879883, "global_step": 78860, "epoch": 1877} {"train_loss": -6.113065242767334, "global_step": 78861, "epoch": 1877} {"train_loss": -6.15782356262207, "global_step": 78862, "epoch": 1877} {"train_loss": -6.088031768798828, "global_step": 78863, "epoch": 1877} {"train_loss": -6.132763385772705, "global_step": 78864, "epoch": 1877} {"train_loss": -6.0605974197387695, "global_step": 78865, "epoch": 1877} {"train_loss": -6.050786018371582, "global_step": 78866, "epoch": 1877} {"train_loss": -6.144018173217773, "global_step": 78867, "epoch": 1877} {"train_loss": -5.985143661499023, "global_step": 78868, "epoch": 1877} {"train_loss": -6.128215789794922, "global_step": 78869, "epoch": 1877} {"train_loss": -6.101012229919434, "global_step": 78870, "epoch": 1877} {"train_loss": -6.035155773162842, "global_step": 78871, "epoch": 1877} {"train_loss": -6.131221294403076, "global_step": 78872, "epoch": 1877} {"train_loss": -6.071065902709961, "global_step": 78873, "epoch": 1877} {"train_loss": -6.0334086418151855, "global_step": 78874, "epoch": 1877} {"train_loss": -6.106507721401396, "global_step": 78875, "epoch": 1877, "val_loss": 67728.34375} {"train_loss": -5.964313507080078, "global_step": 78876, "epoch": 1878} {"train_loss": -6.048542022705078, "global_step": 78877, "epoch": 1878} {"train_loss": -6.0465803146362305, "global_step": 78878, "epoch": 1878} {"train_loss": -6.067105293273926, "global_step": 78879, "epoch": 1878} {"train_loss": -6.046158790588379, "global_step": 78880, "epoch": 1878} {"train_loss": -6.06896448135376, "global_step": 78881, "epoch": 1878} {"train_loss": -6.03606653213501, "global_step": 78882, "epoch": 1878} {"train_loss": -6.110860824584961, "global_step": 78883, "epoch": 1878} {"train_loss": -6.037027359008789, "global_step": 78884, "epoch": 1878} {"train_loss": -6.192620277404785, "global_step": 78885, "epoch": 1878} {"train_loss": -6.093862056732178, "global_step": 78886, "epoch": 1878} {"train_loss": -6.033238887786865, "global_step": 78887, "epoch": 1878} {"train_loss": -6.109172821044922, "global_step": 78888, "epoch": 1878} {"train_loss": -6.049079895019531, "global_step": 78889, "epoch": 1878} {"train_loss": -6.145718097686768, "global_step": 78890, "epoch": 1878} {"train_loss": -6.091466426849365, "global_step": 78891, "epoch": 1878} {"train_loss": -6.177181720733643, "global_step": 78892, "epoch": 1878} {"train_loss": -6.1101298332214355, "global_step": 78893, "epoch": 1878} {"train_loss": -6.140285015106201, "global_step": 78894, "epoch": 1878} {"train_loss": -6.146743297576904, "global_step": 78895, "epoch": 1878} {"train_loss": -6.1928815841674805, "global_step": 78896, "epoch": 1878} {"train_loss": -6.002188205718994, "global_step": 78897, "epoch": 1878} {"train_loss": -6.015498161315918, "global_step": 78898, "epoch": 1878} {"train_loss": -6.166425704956055, "global_step": 78899, "epoch": 1878} {"train_loss": -6.037837028503418, "global_step": 78900, "epoch": 1878} {"train_loss": -6.006597995758057, "global_step": 78901, "epoch": 1878} {"train_loss": -6.119497299194336, "global_step": 78902, "epoch": 1878} {"train_loss": -6.1235785484313965, "global_step": 78903, "epoch": 1878} {"train_loss": -6.087930679321289, "global_step": 78904, "epoch": 1878} {"train_loss": -6.057950973510742, "global_step": 78905, "epoch": 1878} {"train_loss": -5.998434066772461, "global_step": 78906, "epoch": 1878} {"train_loss": -6.191981315612793, "global_step": 78907, "epoch": 1878} {"train_loss": -6.242142200469971, "global_step": 78908, "epoch": 1878} {"train_loss": -6.195254325866699, "global_step": 78909, "epoch": 1878} {"train_loss": -6.131745338439941, "global_step": 78910, "epoch": 1878} {"train_loss": -6.164320945739746, "global_step": 78911, "epoch": 1878} {"train_loss": -6.1154093742370605, "global_step": 78912, "epoch": 1878} {"train_loss": -6.097329139709473, "global_step": 78913, "epoch": 1878} {"train_loss": -6.067582130432129, "global_step": 78914, "epoch": 1878} {"train_loss": -6.023559093475342, "global_step": 78915, "epoch": 1878} {"train_loss": -6.095128536224365, "global_step": 78916, "epoch": 1878} {"train_loss": -6.093451363699777, "global_step": 78917, "epoch": 1878, "val_loss": 67690.78125} {"train_loss": -6.103333473205566, "global_step": 78918, "epoch": 1879} {"train_loss": -6.13555908203125, "global_step": 78919, "epoch": 1879} {"train_loss": -6.102973937988281, "global_step": 78920, "epoch": 1879} {"train_loss": -6.257859230041504, "global_step": 78921, "epoch": 1879} {"train_loss": -6.114980220794678, "global_step": 78922, "epoch": 1879} {"train_loss": -6.102664947509766, "global_step": 78923, "epoch": 1879} {"train_loss": -6.230173110961914, "global_step": 78924, "epoch": 1879} {"train_loss": -6.090344429016113, "global_step": 78925, "epoch": 1879} {"train_loss": -6.183751106262207, "global_step": 78926, "epoch": 1879} {"train_loss": -6.068021774291992, "global_step": 78927, "epoch": 1879} {"train_loss": -6.075052738189697, "global_step": 78928, "epoch": 1879} {"train_loss": -5.981895446777344, "global_step": 78929, "epoch": 1879} {"train_loss": -5.9664812088012695, "global_step": 78930, "epoch": 1879} {"train_loss": -6.109958648681641, "global_step": 78931, "epoch": 1879} {"train_loss": -6.092536449432373, "global_step": 78932, "epoch": 1879} {"train_loss": -6.145971298217773, "global_step": 78933, "epoch": 1879} {"train_loss": -6.107999324798584, "global_step": 78934, "epoch": 1879} {"train_loss": -6.089773178100586, "global_step": 78935, "epoch": 1879} {"train_loss": -6.079476356506348, "global_step": 78936, "epoch": 1879} {"train_loss": -6.106296062469482, "global_step": 78937, "epoch": 1879} {"train_loss": -6.113468170166016, "global_step": 78938, "epoch": 1879} {"train_loss": -6.221452713012695, "global_step": 78939, "epoch": 1879} {"train_loss": -6.230584144592285, "global_step": 78940, "epoch": 1879} {"train_loss": -6.087155342102051, "global_step": 78941, "epoch": 1879} {"train_loss": -6.196226119995117, "global_step": 78942, "epoch": 1879} {"train_loss": -6.154453277587891, "global_step": 78943, "epoch": 1879} {"train_loss": -6.135499954223633, "global_step": 78944, "epoch": 1879} {"train_loss": -6.159212589263916, "global_step": 78945, "epoch": 1879} {"train_loss": -6.179739952087402, "global_step": 78946, "epoch": 1879} {"train_loss": -6.042986869812012, "global_step": 78947, "epoch": 1879} {"train_loss": -6.196562767028809, "global_step": 78948, "epoch": 1879} {"train_loss": -6.128543853759766, "global_step": 78949, "epoch": 1879} {"train_loss": -5.997308731079102, "global_step": 78950, "epoch": 1879} {"train_loss": -6.183907508850098, "global_step": 78951, "epoch": 1879} {"train_loss": -6.165122985839844, "global_step": 78952, "epoch": 1879} {"train_loss": -6.0311994552612305, "global_step": 78953, "epoch": 1879} {"train_loss": -6.0663933753967285, "global_step": 78954, "epoch": 1879} {"train_loss": -6.1316938400268555, "global_step": 78955, "epoch": 1879} {"train_loss": -6.239238739013672, "global_step": 78956, "epoch": 1879} {"train_loss": -6.094600677490234, "global_step": 78957, "epoch": 1879} {"train_loss": -6.117122650146484, "global_step": 78958, "epoch": 1879} {"train_loss": -6.122237682342529, "global_step": 78959, "epoch": 1879, "val_loss": 67771.265625} {"train_loss": -6.124359130859375, "global_step": 78960, "epoch": 1880} {"train_loss": -6.074358940124512, "global_step": 78961, "epoch": 1880} {"train_loss": -6.212152004241943, "global_step": 78962, "epoch": 1880} {"train_loss": -6.084129333496094, "global_step": 78963, "epoch": 1880} {"train_loss": -6.129784107208252, "global_step": 78964, "epoch": 1880} {"train_loss": -6.1425957679748535, "global_step": 78965, "epoch": 1880} {"train_loss": -6.042117118835449, "global_step": 78966, "epoch": 1880} {"train_loss": -6.098930358886719, "global_step": 78967, "epoch": 1880} {"train_loss": -6.134340763092041, "global_step": 78968, "epoch": 1880} {"train_loss": -6.108219146728516, "global_step": 78969, "epoch": 1880} {"train_loss": -6.116846084594727, "global_step": 78970, "epoch": 1880} {"train_loss": -5.912237167358398, "global_step": 78971, "epoch": 1880} {"train_loss": -6.226630687713623, "global_step": 78972, "epoch": 1880} {"train_loss": -6.074471950531006, "global_step": 78973, "epoch": 1880} {"train_loss": -6.1371026039123535, "global_step": 78974, "epoch": 1880} {"train_loss": -6.13975191116333, "global_step": 78975, "epoch": 1880} {"train_loss": -6.132124423980713, "global_step": 78976, "epoch": 1880} {"train_loss": -6.19862174987793, "global_step": 78977, "epoch": 1880} {"train_loss": -5.960694313049316, "global_step": 78978, "epoch": 1880} {"train_loss": -6.037563800811768, "global_step": 78979, "epoch": 1880} {"train_loss": -6.038995742797852, "global_step": 78980, "epoch": 1880} {"train_loss": -6.114953994750977, "global_step": 78981, "epoch": 1880} {"train_loss": -6.082450866699219, "global_step": 78982, "epoch": 1880} {"train_loss": -6.038636207580566, "global_step": 78983, "epoch": 1880} {"train_loss": -6.041532516479492, "global_step": 78984, "epoch": 1880} {"train_loss": -6.136887550354004, "global_step": 78985, "epoch": 1880} {"train_loss": -6.0196452140808105, "global_step": 78986, "epoch": 1880} {"train_loss": -5.971949577331543, "global_step": 78987, "epoch": 1880} {"train_loss": -6.162750244140625, "global_step": 78988, "epoch": 1880} {"train_loss": -6.066943168640137, "global_step": 78989, "epoch": 1880} {"train_loss": -6.091501235961914, "global_step": 78990, "epoch": 1880} {"train_loss": -6.126319408416748, "global_step": 78991, "epoch": 1880} {"train_loss": -5.902167320251465, "global_step": 78992, "epoch": 1880} {"train_loss": -6.185492515563965, "global_step": 78993, "epoch": 1880} {"train_loss": -5.98662805557251, "global_step": 78994, "epoch": 1880} {"train_loss": -5.978094100952148, "global_step": 78995, "epoch": 1880} {"train_loss": -6.155771255493164, "global_step": 78996, "epoch": 1880} {"train_loss": -6.096692085266113, "global_step": 78997, "epoch": 1880} {"train_loss": -6.114361763000488, "global_step": 78998, "epoch": 1880} {"train_loss": -6.1859283447265625, "global_step": 78999, "epoch": 1880} {"train_loss": -6.250340461730957, "global_step": 79000, "epoch": 1880} {"train_loss": -6.093571220125471, "global_step": 79001, "epoch": 1880, "val_loss": 67644.0703125} {"train_loss": -6.132687568664551, "global_step": 79002, "epoch": 1881} {"train_loss": -6.135746955871582, "global_step": 79003, "epoch": 1881} {"train_loss": -6.040597438812256, "global_step": 79004, "epoch": 1881} {"train_loss": -6.054086685180664, "global_step": 79005, "epoch": 1881} {"train_loss": -6.031379699707031, "global_step": 79006, "epoch": 1881} {"train_loss": -6.127305030822754, "global_step": 79007, "epoch": 1881} {"train_loss": -6.21873140335083, "global_step": 79008, "epoch": 1881} {"train_loss": -6.134291648864746, "global_step": 79009, "epoch": 1881} {"train_loss": -6.151946067810059, "global_step": 79010, "epoch": 1881} {"train_loss": -6.094663143157959, "global_step": 79011, "epoch": 1881} {"train_loss": -6.165127754211426, "global_step": 79012, "epoch": 1881} {"train_loss": -6.048543930053711, "global_step": 79013, "epoch": 1881} {"train_loss": -6.1763482093811035, "global_step": 79014, "epoch": 1881} {"train_loss": -6.1029205322265625, "global_step": 79015, "epoch": 1881} {"train_loss": -6.170633316040039, "global_step": 79016, "epoch": 1881} {"train_loss": -6.100558280944824, "global_step": 79017, "epoch": 1881} {"train_loss": -6.254825115203857, "global_step": 79018, "epoch": 1881} {"train_loss": -6.167014122009277, "global_step": 79019, "epoch": 1881} {"train_loss": -6.114544868469238, "global_step": 79020, "epoch": 1881} {"train_loss": -6.170623779296875, "global_step": 79021, "epoch": 1881} {"train_loss": -6.102154731750488, "global_step": 79022, "epoch": 1881} {"train_loss": -6.040527820587158, "global_step": 79023, "epoch": 1881} {"train_loss": -6.17898416519165, "global_step": 79024, "epoch": 1881} {"train_loss": -6.240688800811768, "global_step": 79025, "epoch": 1881} {"train_loss": -6.112238883972168, "global_step": 79026, "epoch": 1881} {"train_loss": -6.26074743270874, "global_step": 79027, "epoch": 1881} {"train_loss": -6.074781894683838, "global_step": 79028, "epoch": 1881} {"train_loss": -6.200471878051758, "global_step": 79029, "epoch": 1881} {"train_loss": -6.068965435028076, "global_step": 79030, "epoch": 1881} {"train_loss": -6.207686424255371, "global_step": 79031, "epoch": 1881} {"train_loss": -6.161143779754639, "global_step": 79032, "epoch": 1881} {"train_loss": -6.208300590515137, "global_step": 79033, "epoch": 1881} {"train_loss": -6.053433418273926, "global_step": 79034, "epoch": 1881} {"train_loss": -6.165173053741455, "global_step": 79035, "epoch": 1881} {"train_loss": -6.151629447937012, "global_step": 79036, "epoch": 1881} {"train_loss": -6.1586408615112305, "global_step": 79037, "epoch": 1881} {"train_loss": -6.053951740264893, "global_step": 79038, "epoch": 1881} {"train_loss": -6.04256534576416, "global_step": 79039, "epoch": 1881} {"train_loss": -5.952160835266113, "global_step": 79040, "epoch": 1881} {"train_loss": -6.084178924560547, "global_step": 79041, "epoch": 1881} {"train_loss": -6.142736434936523, "global_step": 79042, "epoch": 1881} {"train_loss": -6.127222844532558, "global_step": 79043, "epoch": 1881, "val_loss": 67770.7734375} {"train_loss": -6.162225723266602, "global_step": 79044, "epoch": 1882} {"train_loss": -6.150978088378906, "global_step": 79045, "epoch": 1882} {"train_loss": -6.12933349609375, "global_step": 79046, "epoch": 1882} {"train_loss": -6.155704498291016, "global_step": 79047, "epoch": 1882} {"train_loss": -6.037286758422852, "global_step": 79048, "epoch": 1882} {"train_loss": -6.1049394607543945, "global_step": 79049, "epoch": 1882} {"train_loss": -6.0839996337890625, "global_step": 79050, "epoch": 1882} {"train_loss": -6.12841796875, "global_step": 79051, "epoch": 1882} {"train_loss": -6.174934387207031, "global_step": 79052, "epoch": 1882} {"train_loss": -6.060976982116699, "global_step": 79053, "epoch": 1882} {"train_loss": -6.295054912567139, "global_step": 79054, "epoch": 1882} {"train_loss": -6.028195381164551, "global_step": 79055, "epoch": 1882} {"train_loss": -6.0901594161987305, "global_step": 79056, "epoch": 1882} {"train_loss": -6.006655693054199, "global_step": 79057, "epoch": 1882} {"train_loss": -6.170022487640381, "global_step": 79058, "epoch": 1882} {"train_loss": -6.284899711608887, "global_step": 79059, "epoch": 1882} {"train_loss": -6.112140655517578, "global_step": 79060, "epoch": 1882} {"train_loss": -6.271640777587891, "global_step": 79061, "epoch": 1882} {"train_loss": -6.239816665649414, "global_step": 79062, "epoch": 1882} {"train_loss": -6.097058296203613, "global_step": 79063, "epoch": 1882} {"train_loss": -6.180619239807129, "global_step": 79064, "epoch": 1882} {"train_loss": -6.111546039581299, "global_step": 79065, "epoch": 1882} {"train_loss": -6.124264717102051, "global_step": 79066, "epoch": 1882} {"train_loss": -6.084281921386719, "global_step": 79067, "epoch": 1882} {"train_loss": -6.137749195098877, "global_step": 79068, "epoch": 1882} {"train_loss": -6.070972442626953, "global_step": 79069, "epoch": 1882} {"train_loss": -6.020420074462891, "global_step": 79070, "epoch": 1882} {"train_loss": -6.114438056945801, "global_step": 79071, "epoch": 1882} {"train_loss": -6.232905387878418, "global_step": 79072, "epoch": 1882} {"train_loss": -6.1593475341796875, "global_step": 79073, "epoch": 1882} {"train_loss": -6.067020416259766, "global_step": 79074, "epoch": 1882} {"train_loss": -6.11838436126709, "global_step": 79075, "epoch": 1882} {"train_loss": -6.111846923828125, "global_step": 79076, "epoch": 1882} {"train_loss": -6.127473831176758, "global_step": 79077, "epoch": 1882} {"train_loss": -6.052649974822998, "global_step": 79078, "epoch": 1882} {"train_loss": -6.097187042236328, "global_step": 79079, "epoch": 1882} {"train_loss": -5.994368076324463, "global_step": 79080, "epoch": 1882} {"train_loss": -5.98279333114624, "global_step": 79081, "epoch": 1882} {"train_loss": -6.109363555908203, "global_step": 79082, "epoch": 1882} {"train_loss": -5.9084577560424805, "global_step": 79083, "epoch": 1882} {"train_loss": -6.019224166870117, "global_step": 79084, "epoch": 1882} {"train_loss": -6.111787103471302, "global_step": 79085, "epoch": 1882, "val_loss": 67642.2578125} {"train_loss": -5.968001365661621, "global_step": 79086, "epoch": 1883} {"train_loss": -6.121157646179199, "global_step": 79087, "epoch": 1883} {"train_loss": -5.9581804275512695, "global_step": 79088, "epoch": 1883} {"train_loss": -6.1679253578186035, "global_step": 79089, "epoch": 1883} {"train_loss": -6.065729141235352, "global_step": 79090, "epoch": 1883} {"train_loss": -6.074621200561523, "global_step": 79091, "epoch": 1883} {"train_loss": -5.945919036865234, "global_step": 79092, "epoch": 1883} {"train_loss": -6.0419769287109375, "global_step": 79093, "epoch": 1883} {"train_loss": -6.21068000793457, "global_step": 79094, "epoch": 1883} {"train_loss": -6.08376407623291, "global_step": 79095, "epoch": 1883} {"train_loss": -6.086063385009766, "global_step": 79096, "epoch": 1883} {"train_loss": -6.098048210144043, "global_step": 79097, "epoch": 1883} {"train_loss": -6.158143997192383, "global_step": 79098, "epoch": 1883} {"train_loss": -6.123090744018555, "global_step": 79099, "epoch": 1883} {"train_loss": -6.240067958831787, "global_step": 79100, "epoch": 1883} {"train_loss": -6.0947771072387695, "global_step": 79101, "epoch": 1883} {"train_loss": -6.061549186706543, "global_step": 79102, "epoch": 1883} {"train_loss": -6.052340030670166, "global_step": 79103, "epoch": 1883} {"train_loss": -6.111664295196533, "global_step": 79104, "epoch": 1883} {"train_loss": -6.22417688369751, "global_step": 79105, "epoch": 1883} {"train_loss": -6.1511335372924805, "global_step": 79106, "epoch": 1883} {"train_loss": -6.0962629318237305, "global_step": 79107, "epoch": 1883} {"train_loss": -6.108935356140137, "global_step": 79108, "epoch": 1883} {"train_loss": -5.981710433959961, "global_step": 79109, "epoch": 1883} {"train_loss": -6.1709442138671875, "global_step": 79110, "epoch": 1883} {"train_loss": -6.074499607086182, "global_step": 79111, "epoch": 1883} {"train_loss": -6.103037357330322, "global_step": 79112, "epoch": 1883} {"train_loss": -5.988094329833984, "global_step": 79113, "epoch": 1883} {"train_loss": -5.992280960083008, "global_step": 79114, "epoch": 1883} {"train_loss": -6.108975410461426, "global_step": 79115, "epoch": 1883} {"train_loss": -6.09217643737793, "global_step": 79116, "epoch": 1883} {"train_loss": -6.228209495544434, "global_step": 79117, "epoch": 1883} {"train_loss": -6.0342512130737305, "global_step": 79118, "epoch": 1883} {"train_loss": -6.197487831115723, "global_step": 79119, "epoch": 1883} {"train_loss": -6.178818702697754, "global_step": 79120, "epoch": 1883} {"train_loss": -6.0667948722839355, "global_step": 79121, "epoch": 1883} {"train_loss": -6.249443054199219, "global_step": 79122, "epoch": 1883} {"train_loss": -6.142352104187012, "global_step": 79123, "epoch": 1883} {"train_loss": -6.134463310241699, "global_step": 79124, "epoch": 1883} {"train_loss": -5.939723014831543, "global_step": 79125, "epoch": 1883} {"train_loss": -6.1025848388671875, "global_step": 79126, "epoch": 1883} {"train_loss": -6.100228343691144, "global_step": 79127, "epoch": 1883, "val_loss": 67526.625} {"train_loss": -6.180887699127197, "global_step": 79128, "epoch": 1884} {"train_loss": -6.029314994812012, "global_step": 79129, "epoch": 1884} {"train_loss": -6.012831687927246, "global_step": 79130, "epoch": 1884} {"train_loss": -6.148120880126953, "global_step": 79131, "epoch": 1884} {"train_loss": -6.121425628662109, "global_step": 79132, "epoch": 1884} {"train_loss": -6.160062789916992, "global_step": 79133, "epoch": 1884} {"train_loss": -6.066824913024902, "global_step": 79134, "epoch": 1884} {"train_loss": -6.142313003540039, "global_step": 79135, "epoch": 1884} {"train_loss": -6.117631435394287, "global_step": 79136, "epoch": 1884} {"train_loss": -6.0192670822143555, "global_step": 79137, "epoch": 1884} {"train_loss": -6.182649612426758, "global_step": 79138, "epoch": 1884} {"train_loss": -6.074011325836182, "global_step": 79139, "epoch": 1884} {"train_loss": -6.095898151397705, "global_step": 79140, "epoch": 1884} {"train_loss": -6.16702127456665, "global_step": 79141, "epoch": 1884} {"train_loss": -6.282055377960205, "global_step": 79142, "epoch": 1884} {"train_loss": -6.164670944213867, "global_step": 79143, "epoch": 1884} {"train_loss": -6.232216835021973, "global_step": 79144, "epoch": 1884} {"train_loss": -6.237441062927246, "global_step": 79145, "epoch": 1884} {"train_loss": -6.0908203125, "global_step": 79146, "epoch": 1884} {"train_loss": -6.107217788696289, "global_step": 79147, "epoch": 1884} {"train_loss": -6.222898960113525, "global_step": 79148, "epoch": 1884} {"train_loss": -6.137358665466309, "global_step": 79149, "epoch": 1884} {"train_loss": -6.132997035980225, "global_step": 79150, "epoch": 1884} {"train_loss": -6.131351947784424, "global_step": 79151, "epoch": 1884} {"train_loss": -6.141531944274902, "global_step": 79152, "epoch": 1884} {"train_loss": -6.117710113525391, "global_step": 79153, "epoch": 1884} {"train_loss": -6.161303520202637, "global_step": 79154, "epoch": 1884} {"train_loss": -6.039517402648926, "global_step": 79155, "epoch": 1884} {"train_loss": -6.100008964538574, "global_step": 79156, "epoch": 1884} {"train_loss": -6.219667434692383, "global_step": 79157, "epoch": 1884} {"train_loss": -6.165410041809082, "global_step": 79158, "epoch": 1884} {"train_loss": -6.143477916717529, "global_step": 79159, "epoch": 1884} {"train_loss": -6.052274703979492, "global_step": 79160, "epoch": 1884} {"train_loss": -6.148253440856934, "global_step": 79161, "epoch": 1884} {"train_loss": -6.066459655761719, "global_step": 79162, "epoch": 1884} {"train_loss": -6.0777740478515625, "global_step": 79163, "epoch": 1884} {"train_loss": -6.006324768066406, "global_step": 79164, "epoch": 1884} {"train_loss": -6.039108753204346, "global_step": 79165, "epoch": 1884} {"train_loss": -6.069553852081299, "global_step": 79166, "epoch": 1884} {"train_loss": -6.133330345153809, "global_step": 79167, "epoch": 1884} {"train_loss": -6.013699531555176, "global_step": 79168, "epoch": 1884} {"train_loss": -6.119650874819074, "global_step": 79169, "epoch": 1884, "val_loss": 67387.5859375} {"train_loss": -6.07172966003418, "global_step": 79170, "epoch": 1885} {"train_loss": -6.082972049713135, "global_step": 79171, "epoch": 1885} {"train_loss": -5.980847358703613, "global_step": 79172, "epoch": 1885} {"train_loss": -6.128487586975098, "global_step": 79173, "epoch": 1885} {"train_loss": -6.140000820159912, "global_step": 79174, "epoch": 1885} {"train_loss": -6.133254528045654, "global_step": 79175, "epoch": 1885} {"train_loss": -6.175498962402344, "global_step": 79176, "epoch": 1885} {"train_loss": -6.134062767028809, "global_step": 79177, "epoch": 1885} {"train_loss": -6.154279708862305, "global_step": 79178, "epoch": 1885} {"train_loss": -6.131336688995361, "global_step": 79179, "epoch": 1885} {"train_loss": -6.002091884613037, "global_step": 79180, "epoch": 1885} {"train_loss": -6.130727767944336, "global_step": 79181, "epoch": 1885} {"train_loss": -6.157833099365234, "global_step": 79182, "epoch": 1885} {"train_loss": -6.068572998046875, "global_step": 79183, "epoch": 1885} {"train_loss": -6.1806416511535645, "global_step": 79184, "epoch": 1885} {"train_loss": -6.105312347412109, "global_step": 79185, "epoch": 1885} {"train_loss": -6.071212291717529, "global_step": 79186, "epoch": 1885} {"train_loss": -6.084168910980225, "global_step": 79187, "epoch": 1885} {"train_loss": -6.079710006713867, "global_step": 79188, "epoch": 1885} {"train_loss": -6.23141622543335, "global_step": 79189, "epoch": 1885} {"train_loss": -6.116203784942627, "global_step": 79190, "epoch": 1885} {"train_loss": -5.956528663635254, "global_step": 79191, "epoch": 1885} {"train_loss": -6.140578269958496, "global_step": 79192, "epoch": 1885} {"train_loss": -6.142254829406738, "global_step": 79193, "epoch": 1885} {"train_loss": -5.973029136657715, "global_step": 79194, "epoch": 1885} {"train_loss": -6.1430511474609375, "global_step": 79195, "epoch": 1885} {"train_loss": -6.039080619812012, "global_step": 79196, "epoch": 1885} {"train_loss": -6.023490905761719, "global_step": 79197, "epoch": 1885} {"train_loss": -5.93132209777832, "global_step": 79198, "epoch": 1885} {"train_loss": -6.083089828491211, "global_step": 79199, "epoch": 1885} {"train_loss": -6.086353778839111, "global_step": 79200, "epoch": 1885} {"train_loss": -6.040680885314941, "global_step": 79201, "epoch": 1885} {"train_loss": -6.07414436340332, "global_step": 79202, "epoch": 1885} {"train_loss": -6.016900062561035, "global_step": 79203, "epoch": 1885} {"train_loss": -6.102579116821289, "global_step": 79204, "epoch": 1885} {"train_loss": -6.139927864074707, "global_step": 79205, "epoch": 1885} {"train_loss": -6.111669063568115, "global_step": 79206, "epoch": 1885} {"train_loss": -6.090834617614746, "global_step": 79207, "epoch": 1885} {"train_loss": -5.877694606781006, "global_step": 79208, "epoch": 1885} {"train_loss": -6.140517234802246, "global_step": 79209, "epoch": 1885} {"train_loss": -6.03157901763916, "global_step": 79210, "epoch": 1885} {"train_loss": -6.084532635552542, "global_step": 79211, "epoch": 1885, "val_loss": 67595.6875} {"train_loss": -6.070941925048828, "global_step": 79212, "epoch": 1886} {"train_loss": -6.054887294769287, "global_step": 79213, "epoch": 1886} {"train_loss": -6.039146423339844, "global_step": 79214, "epoch": 1886} {"train_loss": -6.088807582855225, "global_step": 79215, "epoch": 1886} {"train_loss": -6.041434288024902, "global_step": 79216, "epoch": 1886} {"train_loss": -6.230888843536377, "global_step": 79217, "epoch": 1886} {"train_loss": -6.133885860443115, "global_step": 79218, "epoch": 1886} {"train_loss": -6.096411228179932, "global_step": 79219, "epoch": 1886} {"train_loss": -6.153700828552246, "global_step": 79220, "epoch": 1886} {"train_loss": -6.124138832092285, "global_step": 79221, "epoch": 1886} {"train_loss": -6.087637901306152, "global_step": 79222, "epoch": 1886} {"train_loss": -6.118195533752441, "global_step": 79223, "epoch": 1886} {"train_loss": -6.177021026611328, "global_step": 79224, "epoch": 1886} {"train_loss": -6.138589382171631, "global_step": 79225, "epoch": 1886} {"train_loss": -6.176915168762207, "global_step": 79226, "epoch": 1886} {"train_loss": -6.105766296386719, "global_step": 79227, "epoch": 1886} {"train_loss": -6.018496990203857, "global_step": 79228, "epoch": 1886} {"train_loss": -6.090593338012695, "global_step": 79229, "epoch": 1886} {"train_loss": -6.099254608154297, "global_step": 79230, "epoch": 1886} {"train_loss": -6.167631149291992, "global_step": 79231, "epoch": 1886} {"train_loss": -6.091572284698486, "global_step": 79232, "epoch": 1886} {"train_loss": -6.225991249084473, "global_step": 79233, "epoch": 1886} {"train_loss": -6.178030014038086, "global_step": 79234, "epoch": 1886} {"train_loss": -6.095608711242676, "global_step": 79235, "epoch": 1886} {"train_loss": -6.151517868041992, "global_step": 79236, "epoch": 1886} {"train_loss": -6.052484512329102, "global_step": 79237, "epoch": 1886} {"train_loss": -6.113124847412109, "global_step": 79238, "epoch": 1886} {"train_loss": -6.058309555053711, "global_step": 79239, "epoch": 1886} {"train_loss": -6.023000717163086, "global_step": 79240, "epoch": 1886} {"train_loss": -6.062737464904785, "global_step": 79241, "epoch": 1886} {"train_loss": -6.11594820022583, "global_step": 79242, "epoch": 1886} {"train_loss": -6.041575908660889, "global_step": 79243, "epoch": 1886} {"train_loss": -6.140538692474365, "global_step": 79244, "epoch": 1886} {"train_loss": -5.9784440994262695, "global_step": 79245, "epoch": 1886} {"train_loss": -6.125738143920898, "global_step": 79246, "epoch": 1886} {"train_loss": -6.04172420501709, "global_step": 79247, "epoch": 1886} {"train_loss": -6.167736053466797, "global_step": 79248, "epoch": 1886} {"train_loss": -6.159222602844238, "global_step": 79249, "epoch": 1886} {"train_loss": -6.130671501159668, "global_step": 79250, "epoch": 1886} {"train_loss": -6.11152458190918, "global_step": 79251, "epoch": 1886} {"train_loss": -6.168237686157227, "global_step": 79252, "epoch": 1886} {"train_loss": -6.107140893027896, "global_step": 79253, "epoch": 1886, "val_loss": 67689.875} {"train_loss": -6.056191444396973, "global_step": 79254, "epoch": 1887} {"train_loss": -6.174598693847656, "global_step": 79255, "epoch": 1887} {"train_loss": -6.133181095123291, "global_step": 79256, "epoch": 1887} {"train_loss": -6.0943498611450195, "global_step": 79257, "epoch": 1887} {"train_loss": -6.104008674621582, "global_step": 79258, "epoch": 1887} {"train_loss": -6.1374053955078125, "global_step": 79259, "epoch": 1887} {"train_loss": -6.028055191040039, "global_step": 79260, "epoch": 1887} {"train_loss": -6.0741095542907715, "global_step": 79261, "epoch": 1887} {"train_loss": -6.117989540100098, "global_step": 79262, "epoch": 1887} {"train_loss": -6.100152015686035, "global_step": 79263, "epoch": 1887} {"train_loss": -6.121435165405273, "global_step": 79264, "epoch": 1887} {"train_loss": -6.015110969543457, "global_step": 79265, "epoch": 1887} {"train_loss": -6.091010570526123, "global_step": 79266, "epoch": 1887} {"train_loss": -6.196406364440918, "global_step": 79267, "epoch": 1887} {"train_loss": -6.113478660583496, "global_step": 79268, "epoch": 1887} {"train_loss": -6.170599937438965, "global_step": 79269, "epoch": 1887} {"train_loss": -6.1333746910095215, "global_step": 79270, "epoch": 1887} {"train_loss": -6.066740036010742, "global_step": 79271, "epoch": 1887} {"train_loss": -6.1379594802856445, "global_step": 79272, "epoch": 1887} {"train_loss": -6.084343910217285, "global_step": 79273, "epoch": 1887} {"train_loss": -6.032240390777588, "global_step": 79274, "epoch": 1887} {"train_loss": -6.157930374145508, "global_step": 79275, "epoch": 1887} {"train_loss": -6.067150115966797, "global_step": 79276, "epoch": 1887} {"train_loss": -6.1971330642700195, "global_step": 79277, "epoch": 1887} {"train_loss": -6.188357353210449, "global_step": 79278, "epoch": 1887} {"train_loss": -6.214359283447266, "global_step": 79279, "epoch": 1887} {"train_loss": -6.14076042175293, "global_step": 79280, "epoch": 1887} {"train_loss": -6.136523246765137, "global_step": 79281, "epoch": 1887} {"train_loss": -6.127984523773193, "global_step": 79282, "epoch": 1887} {"train_loss": -6.133550643920898, "global_step": 79283, "epoch": 1887} {"train_loss": -6.135021209716797, "global_step": 79284, "epoch": 1887} {"train_loss": -6.2649030685424805, "global_step": 79285, "epoch": 1887} {"train_loss": -6.142732620239258, "global_step": 79286, "epoch": 1887} {"train_loss": -6.119380950927734, "global_step": 79287, "epoch": 1887} {"train_loss": -6.186081886291504, "global_step": 79288, "epoch": 1887} {"train_loss": -6.234219551086426, "global_step": 79289, "epoch": 1887} {"train_loss": -6.17153263092041, "global_step": 79290, "epoch": 1887} {"train_loss": -6.200994968414307, "global_step": 79291, "epoch": 1887} {"train_loss": -6.041248321533203, "global_step": 79292, "epoch": 1887} {"train_loss": -6.121741771697998, "global_step": 79293, "epoch": 1887} {"train_loss": -6.005222320556641, "global_step": 79294, "epoch": 1887} {"train_loss": -6.123473984854562, "global_step": 79295, "epoch": 1887, "val_loss": 67504.7109375} {"train_loss": -6.234650611877441, "global_step": 79296, "epoch": 1888} {"train_loss": -6.076274394989014, "global_step": 79297, "epoch": 1888} {"train_loss": -6.16749906539917, "global_step": 79298, "epoch": 1888} {"train_loss": -6.068323135375977, "global_step": 79299, "epoch": 1888} {"train_loss": -6.068136215209961, "global_step": 79300, "epoch": 1888} {"train_loss": -6.110727310180664, "global_step": 79301, "epoch": 1888} {"train_loss": -6.102671146392822, "global_step": 79302, "epoch": 1888} {"train_loss": -6.12895393371582, "global_step": 79303, "epoch": 1888} {"train_loss": -6.135857582092285, "global_step": 79304, "epoch": 1888} {"train_loss": -6.031256675720215, "global_step": 79305, "epoch": 1888} {"train_loss": -6.16732120513916, "global_step": 79306, "epoch": 1888} {"train_loss": -6.144640922546387, "global_step": 79307, "epoch": 1888} {"train_loss": -6.001737117767334, "global_step": 79308, "epoch": 1888} {"train_loss": -6.004868984222412, "global_step": 79309, "epoch": 1888} {"train_loss": -6.156148910522461, "global_step": 79310, "epoch": 1888} {"train_loss": -6.0111589431762695, "global_step": 79311, "epoch": 1888} {"train_loss": -6.215110778808594, "global_step": 79312, "epoch": 1888} {"train_loss": -6.097533226013184, "global_step": 79313, "epoch": 1888} {"train_loss": -6.201650142669678, "global_step": 79314, "epoch": 1888} {"train_loss": -6.065142631530762, "global_step": 79315, "epoch": 1888} {"train_loss": -6.192728519439697, "global_step": 79316, "epoch": 1888} {"train_loss": -6.165282726287842, "global_step": 79317, "epoch": 1888} {"train_loss": -6.105079174041748, "global_step": 79318, "epoch": 1888} {"train_loss": -6.0008745193481445, "global_step": 79319, "epoch": 1888} {"train_loss": -6.221735000610352, "global_step": 79320, "epoch": 1888} {"train_loss": -6.1208977699279785, "global_step": 79321, "epoch": 1888} {"train_loss": -6.167110443115234, "global_step": 79322, "epoch": 1888} {"train_loss": -6.086794853210449, "global_step": 79323, "epoch": 1888} {"train_loss": -6.158703327178955, "global_step": 79324, "epoch": 1888} {"train_loss": -6.146335124969482, "global_step": 79325, "epoch": 1888} {"train_loss": -6.138498783111572, "global_step": 79326, "epoch": 1888} {"train_loss": -6.14629602432251, "global_step": 79327, "epoch": 1888} {"train_loss": -6.1229472160339355, "global_step": 79328, "epoch": 1888} {"train_loss": -6.024877071380615, "global_step": 79329, "epoch": 1888} {"train_loss": -6.0723652839660645, "global_step": 79330, "epoch": 1888} {"train_loss": -6.242072582244873, "global_step": 79331, "epoch": 1888} {"train_loss": -6.0672407150268555, "global_step": 79332, "epoch": 1888} {"train_loss": -6.1197509765625, "global_step": 79333, "epoch": 1888} {"train_loss": -6.155031681060791, "global_step": 79334, "epoch": 1888} {"train_loss": -6.11137056350708, "global_step": 79335, "epoch": 1888} {"train_loss": -6.214847564697266, "global_step": 79336, "epoch": 1888} {"train_loss": -6.121796017601376, "global_step": 79337, "epoch": 1888, "val_loss": 67780.640625} {"train_loss": -6.137040138244629, "global_step": 79338, "epoch": 1889} {"train_loss": -6.074131011962891, "global_step": 79339, "epoch": 1889} {"train_loss": -6.185471057891846, "global_step": 79340, "epoch": 1889} {"train_loss": -6.143802642822266, "global_step": 79341, "epoch": 1889} {"train_loss": -6.041361331939697, "global_step": 79342, "epoch": 1889} {"train_loss": -6.023582935333252, "global_step": 79343, "epoch": 1889} {"train_loss": -6.099694728851318, "global_step": 79344, "epoch": 1889} {"train_loss": -5.969244956970215, "global_step": 79345, "epoch": 1889} {"train_loss": -6.220320224761963, "global_step": 79346, "epoch": 1889} {"train_loss": -5.951681137084961, "global_step": 79347, "epoch": 1889} {"train_loss": -6.005164623260498, "global_step": 79348, "epoch": 1889} {"train_loss": -6.059877872467041, "global_step": 79349, "epoch": 1889} {"train_loss": -6.00162935256958, "global_step": 79350, "epoch": 1889} {"train_loss": -6.041047096252441, "global_step": 79351, "epoch": 1889} {"train_loss": -6.180519104003906, "global_step": 79352, "epoch": 1889} {"train_loss": -5.865847587585449, "global_step": 79353, "epoch": 1889} {"train_loss": -6.033515930175781, "global_step": 79354, "epoch": 1889} {"train_loss": -5.9071879386901855, "global_step": 79355, "epoch": 1889} {"train_loss": -6.024767875671387, "global_step": 79356, "epoch": 1889} {"train_loss": -5.952969551086426, "global_step": 79357, "epoch": 1889} {"train_loss": -5.952865123748779, "global_step": 79358, "epoch": 1889} {"train_loss": -5.995390892028809, "global_step": 79359, "epoch": 1889} {"train_loss": -6.068845748901367, "global_step": 79360, "epoch": 1889} {"train_loss": -6.182595729827881, "global_step": 79361, "epoch": 1889} {"train_loss": -6.059067249298096, "global_step": 79362, "epoch": 1889} {"train_loss": -6.012293338775635, "global_step": 79363, "epoch": 1889} {"train_loss": -6.102741718292236, "global_step": 79364, "epoch": 1889} {"train_loss": -6.110052108764648, "global_step": 79365, "epoch": 1889} {"train_loss": -6.055397987365723, "global_step": 79366, "epoch": 1889} {"train_loss": -6.252058029174805, "global_step": 79367, "epoch": 1889} {"train_loss": -5.989331245422363, "global_step": 79368, "epoch": 1889} {"train_loss": -6.113281726837158, "global_step": 79369, "epoch": 1889} {"train_loss": -6.035013198852539, "global_step": 79370, "epoch": 1889} {"train_loss": -6.154944896697998, "global_step": 79371, "epoch": 1889} {"train_loss": -6.110965728759766, "global_step": 79372, "epoch": 1889} {"train_loss": -6.057892799377441, "global_step": 79373, "epoch": 1889} {"train_loss": -5.975822448730469, "global_step": 79374, "epoch": 1889} {"train_loss": -6.088701248168945, "global_step": 79375, "epoch": 1889} {"train_loss": -6.196004867553711, "global_step": 79376, "epoch": 1889} {"train_loss": -6.10667610168457, "global_step": 79377, "epoch": 1889} {"train_loss": -6.04583740234375, "global_step": 79378, "epoch": 1889} {"train_loss": -6.063385077885219, "global_step": 79379, "epoch": 1889, "val_loss": 67587.375} {"train_loss": -6.112198829650879, "global_step": 79380, "epoch": 1890} {"train_loss": -6.157770156860352, "global_step": 79381, "epoch": 1890} {"train_loss": -6.175784111022949, "global_step": 79382, "epoch": 1890} {"train_loss": -6.284018039703369, "global_step": 79383, "epoch": 1890} {"train_loss": -6.200507164001465, "global_step": 79384, "epoch": 1890} {"train_loss": -6.175333023071289, "global_step": 79385, "epoch": 1890} {"train_loss": -6.178758144378662, "global_step": 79386, "epoch": 1890} {"train_loss": -6.133245468139648, "global_step": 79387, "epoch": 1890} {"train_loss": -6.114422798156738, "global_step": 79388, "epoch": 1890} {"train_loss": -5.973249912261963, "global_step": 79389, "epoch": 1890} {"train_loss": -6.063288688659668, "global_step": 79390, "epoch": 1890} {"train_loss": -6.0927815437316895, "global_step": 79391, "epoch": 1890} {"train_loss": -6.033609867095947, "global_step": 79392, "epoch": 1890} {"train_loss": -6.0913801193237305, "global_step": 79393, "epoch": 1890} {"train_loss": -6.021152973175049, "global_step": 79394, "epoch": 1890} {"train_loss": -6.004117965698242, "global_step": 79395, "epoch": 1890} {"train_loss": -6.123491287231445, "global_step": 79396, "epoch": 1890} {"train_loss": -6.0296430587768555, "global_step": 79397, "epoch": 1890} {"train_loss": -6.038496971130371, "global_step": 79398, "epoch": 1890} {"train_loss": -6.156081199645996, "global_step": 79399, "epoch": 1890} {"train_loss": -6.147290229797363, "global_step": 79400, "epoch": 1890} {"train_loss": -6.139258861541748, "global_step": 79401, "epoch": 1890} {"train_loss": -6.074148178100586, "global_step": 79402, "epoch": 1890} {"train_loss": -6.1229963302612305, "global_step": 79403, "epoch": 1890} {"train_loss": -6.022130012512207, "global_step": 79404, "epoch": 1890} {"train_loss": -6.199185371398926, "global_step": 79405, "epoch": 1890} {"train_loss": -6.104411602020264, "global_step": 79406, "epoch": 1890} {"train_loss": -6.11000919342041, "global_step": 79407, "epoch": 1890} {"train_loss": -6.136526584625244, "global_step": 79408, "epoch": 1890} {"train_loss": -6.1107940673828125, "global_step": 79409, "epoch": 1890} {"train_loss": -6.176286697387695, "global_step": 79410, "epoch": 1890} {"train_loss": -6.0505852699279785, "global_step": 79411, "epoch": 1890} {"train_loss": -6.145323753356934, "global_step": 79412, "epoch": 1890} {"train_loss": -6.097151756286621, "global_step": 79413, "epoch": 1890} {"train_loss": -6.091109752655029, "global_step": 79414, "epoch": 1890} {"train_loss": -6.1026611328125, "global_step": 79415, "epoch": 1890} {"train_loss": -6.223235607147217, "global_step": 79416, "epoch": 1890} {"train_loss": -6.032886028289795, "global_step": 79417, "epoch": 1890} {"train_loss": -6.132739543914795, "global_step": 79418, "epoch": 1890} {"train_loss": -6.1083879470825195, "global_step": 79419, "epoch": 1890} {"train_loss": -6.189570426940918, "global_step": 79420, "epoch": 1890} {"train_loss": -6.1134897981371195, "global_step": 79421, "epoch": 1890, "val_loss": 67662.8671875} {"train_loss": -6.187934398651123, "global_step": 79422, "epoch": 1891} {"train_loss": -6.136386871337891, "global_step": 79423, "epoch": 1891} {"train_loss": -6.225874900817871, "global_step": 79424, "epoch": 1891} {"train_loss": -6.1376447677612305, "global_step": 79425, "epoch": 1891} {"train_loss": -6.128178596496582, "global_step": 79426, "epoch": 1891} {"train_loss": -6.109698295593262, "global_step": 79427, "epoch": 1891} {"train_loss": -6.070015907287598, "global_step": 79428, "epoch": 1891} {"train_loss": -6.080807685852051, "global_step": 79429, "epoch": 1891} {"train_loss": -6.095949172973633, "global_step": 79430, "epoch": 1891} {"train_loss": -6.090110778808594, "global_step": 79431, "epoch": 1891} {"train_loss": -6.002904891967773, "global_step": 79432, "epoch": 1891} {"train_loss": -6.115635871887207, "global_step": 79433, "epoch": 1891} {"train_loss": -6.227164268493652, "global_step": 79434, "epoch": 1891} {"train_loss": -6.1165971755981445, "global_step": 79435, "epoch": 1891} {"train_loss": -6.180849552154541, "global_step": 79436, "epoch": 1891} {"train_loss": -6.052587032318115, "global_step": 79437, "epoch": 1891} {"train_loss": -6.125909805297852, "global_step": 79438, "epoch": 1891} {"train_loss": -6.119719505310059, "global_step": 79439, "epoch": 1891} {"train_loss": -6.052280426025391, "global_step": 79440, "epoch": 1891} {"train_loss": -6.063355922698975, "global_step": 79441, "epoch": 1891} {"train_loss": -6.230668067932129, "global_step": 79442, "epoch": 1891} {"train_loss": -6.120242118835449, "global_step": 79443, "epoch": 1891} {"train_loss": -5.988752841949463, "global_step": 79444, "epoch": 1891} {"train_loss": -6.105382919311523, "global_step": 79445, "epoch": 1891} {"train_loss": -6.216098785400391, "global_step": 79446, "epoch": 1891} {"train_loss": -6.097168922424316, "global_step": 79447, "epoch": 1891} {"train_loss": -6.192904472351074, "global_step": 79448, "epoch": 1891} {"train_loss": -6.179045677185059, "global_step": 79449, "epoch": 1891} {"train_loss": -6.050562381744385, "global_step": 79450, "epoch": 1891} {"train_loss": -6.130233287811279, "global_step": 79451, "epoch": 1891} {"train_loss": -6.141847133636475, "global_step": 79452, "epoch": 1891} {"train_loss": -6.113663673400879, "global_step": 79453, "epoch": 1891} {"train_loss": -6.104621887207031, "global_step": 79454, "epoch": 1891} {"train_loss": -5.979885101318359, "global_step": 79455, "epoch": 1891} {"train_loss": -6.03523588180542, "global_step": 79456, "epoch": 1891} {"train_loss": -6.134241104125977, "global_step": 79457, "epoch": 1891} {"train_loss": -6.031922817230225, "global_step": 79458, "epoch": 1891} {"train_loss": -6.169054985046387, "global_step": 79459, "epoch": 1891} {"train_loss": -6.103860855102539, "global_step": 79460, "epoch": 1891} {"train_loss": -6.096451282501221, "global_step": 79461, "epoch": 1891} {"train_loss": -6.140352249145508, "global_step": 79462, "epoch": 1891} {"train_loss": -6.115287372044155, "global_step": 79463, "epoch": 1891, "val_loss": 67607.8125} {"train_loss": -6.126608371734619, "global_step": 79464, "epoch": 1892} {"train_loss": -6.071022033691406, "global_step": 79465, "epoch": 1892} {"train_loss": -6.13386869430542, "global_step": 79466, "epoch": 1892} {"train_loss": -6.095737934112549, "global_step": 79467, "epoch": 1892} {"train_loss": -6.111090660095215, "global_step": 79468, "epoch": 1892} {"train_loss": -6.127812385559082, "global_step": 79469, "epoch": 1892} {"train_loss": -6.10983419418335, "global_step": 79470, "epoch": 1892} {"train_loss": -6.08784818649292, "global_step": 79471, "epoch": 1892} {"train_loss": -6.065630912780762, "global_step": 79472, "epoch": 1892} {"train_loss": -6.2352471351623535, "global_step": 79473, "epoch": 1892} {"train_loss": -6.080326080322266, "global_step": 79474, "epoch": 1892} {"train_loss": -6.178481101989746, "global_step": 79475, "epoch": 1892} {"train_loss": -6.1464033126831055, "global_step": 79476, "epoch": 1892} {"train_loss": -6.097867488861084, "global_step": 79477, "epoch": 1892} {"train_loss": -6.1364970207214355, "global_step": 79478, "epoch": 1892} {"train_loss": -6.177197456359863, "global_step": 79479, "epoch": 1892} {"train_loss": -6.057499885559082, "global_step": 79480, "epoch": 1892} {"train_loss": -6.145035743713379, "global_step": 79481, "epoch": 1892} {"train_loss": -6.134098052978516, "global_step": 79482, "epoch": 1892} {"train_loss": -6.022427558898926, "global_step": 79483, "epoch": 1892} {"train_loss": -6.075138568878174, "global_step": 79484, "epoch": 1892} {"train_loss": -6.124054431915283, "global_step": 79485, "epoch": 1892} {"train_loss": -6.166569709777832, "global_step": 79486, "epoch": 1892} {"train_loss": -6.118720054626465, "global_step": 79487, "epoch": 1892} {"train_loss": -6.093125820159912, "global_step": 79488, "epoch": 1892} {"train_loss": -6.1157355308532715, "global_step": 79489, "epoch": 1892} {"train_loss": -6.233428955078125, "global_step": 79490, "epoch": 1892} {"train_loss": -6.192981719970703, "global_step": 79491, "epoch": 1892} {"train_loss": -6.060357093811035, "global_step": 79492, "epoch": 1892} {"train_loss": -6.148796081542969, "global_step": 79493, "epoch": 1892} {"train_loss": -6.009978294372559, "global_step": 79494, "epoch": 1892} {"train_loss": -6.153984546661377, "global_step": 79495, "epoch": 1892} {"train_loss": -6.096706390380859, "global_step": 79496, "epoch": 1892} {"train_loss": -6.197928428649902, "global_step": 79497, "epoch": 1892} {"train_loss": -5.994204044342041, "global_step": 79498, "epoch": 1892} {"train_loss": -6.215211391448975, "global_step": 79499, "epoch": 1892} {"train_loss": -6.139441013336182, "global_step": 79500, "epoch": 1892} {"train_loss": -6.161238670349121, "global_step": 79501, "epoch": 1892} {"train_loss": -6.126981258392334, "global_step": 79502, "epoch": 1892} {"train_loss": -6.147429943084717, "global_step": 79503, "epoch": 1892} {"train_loss": -6.183307647705078, "global_step": 79504, "epoch": 1892} {"train_loss": -6.121285063879831, "global_step": 79505, "epoch": 1892, "val_loss": 67624.9140625} {"train_loss": -6.111228942871094, "global_step": 79506, "epoch": 1893} {"train_loss": -6.096990585327148, "global_step": 79507, "epoch": 1893} {"train_loss": -6.216456413269043, "global_step": 79508, "epoch": 1893} {"train_loss": -6.193829536437988, "global_step": 79509, "epoch": 1893} {"train_loss": -6.244103908538818, "global_step": 79510, "epoch": 1893} {"train_loss": -6.051645278930664, "global_step": 79511, "epoch": 1893} {"train_loss": -6.173368453979492, "global_step": 79512, "epoch": 1893} {"train_loss": -6.155613899230957, "global_step": 79513, "epoch": 1893} {"train_loss": -6.075464725494385, "global_step": 79514, "epoch": 1893} {"train_loss": -6.0688862800598145, "global_step": 79515, "epoch": 1893} {"train_loss": -6.081799507141113, "global_step": 79516, "epoch": 1893} {"train_loss": -6.0944414138793945, "global_step": 79517, "epoch": 1893} {"train_loss": -6.111380577087402, "global_step": 79518, "epoch": 1893} {"train_loss": -6.024217128753662, "global_step": 79519, "epoch": 1893} {"train_loss": -6.091507911682129, "global_step": 79520, "epoch": 1893} {"train_loss": -6.057017803192139, "global_step": 79521, "epoch": 1893} {"train_loss": -6.0587358474731445, "global_step": 79522, "epoch": 1893} {"train_loss": -6.149012565612793, "global_step": 79523, "epoch": 1893} {"train_loss": -6.232860088348389, "global_step": 79524, "epoch": 1893} {"train_loss": -6.175448417663574, "global_step": 79525, "epoch": 1893} {"train_loss": -6.199372291564941, "global_step": 79526, "epoch": 1893} {"train_loss": -6.02294921875, "global_step": 79527, "epoch": 1893} {"train_loss": -6.208379745483398, "global_step": 79528, "epoch": 1893} {"train_loss": -6.004833221435547, "global_step": 79529, "epoch": 1893} {"train_loss": -6.018431186676025, "global_step": 79530, "epoch": 1893} {"train_loss": -6.083566188812256, "global_step": 79531, "epoch": 1893} {"train_loss": -5.94770622253418, "global_step": 79532, "epoch": 1893} {"train_loss": -6.03333854675293, "global_step": 79533, "epoch": 1893} {"train_loss": -6.064306259155273, "global_step": 79534, "epoch": 1893} {"train_loss": -6.1078691482543945, "global_step": 79535, "epoch": 1893} {"train_loss": -6.073994159698486, "global_step": 79536, "epoch": 1893} {"train_loss": -6.155059814453125, "global_step": 79537, "epoch": 1893} {"train_loss": -6.053854942321777, "global_step": 79538, "epoch": 1893} {"train_loss": -6.100376605987549, "global_step": 79539, "epoch": 1893} {"train_loss": -6.136414527893066, "global_step": 79540, "epoch": 1893} {"train_loss": -6.057743072509766, "global_step": 79541, "epoch": 1893} {"train_loss": -6.189647197723389, "global_step": 79542, "epoch": 1893} {"train_loss": -6.201204299926758, "global_step": 79543, "epoch": 1893} {"train_loss": -6.0607171058654785, "global_step": 79544, "epoch": 1893} {"train_loss": -6.129913806915283, "global_step": 79545, "epoch": 1893} {"train_loss": -6.1673264503479, "global_step": 79546, "epoch": 1893} {"train_loss": -6.111047165734427, "global_step": 79547, "epoch": 1893, "val_loss": 67693.40625} {"train_loss": -6.1145548820495605, "global_step": 79548, "epoch": 1894} {"train_loss": -6.153652667999268, "global_step": 79549, "epoch": 1894} {"train_loss": -6.1287031173706055, "global_step": 79550, "epoch": 1894} {"train_loss": -6.248281478881836, "global_step": 79551, "epoch": 1894} {"train_loss": -6.0740509033203125, "global_step": 79552, "epoch": 1894} {"train_loss": -6.160921096801758, "global_step": 79553, "epoch": 1894} {"train_loss": -6.013494491577148, "global_step": 79554, "epoch": 1894} {"train_loss": -6.1043806076049805, "global_step": 79555, "epoch": 1894} {"train_loss": -6.249495506286621, "global_step": 79556, "epoch": 1894} {"train_loss": -6.0655293464660645, "global_step": 79557, "epoch": 1894} {"train_loss": -6.145439147949219, "global_step": 79558, "epoch": 1894} {"train_loss": -6.1663408279418945, "global_step": 79559, "epoch": 1894} {"train_loss": -6.075738430023193, "global_step": 79560, "epoch": 1894} {"train_loss": -6.057367324829102, "global_step": 79561, "epoch": 1894} {"train_loss": -6.239720344543457, "global_step": 79562, "epoch": 1894} {"train_loss": -5.983345031738281, "global_step": 79563, "epoch": 1894} {"train_loss": -6.157277584075928, "global_step": 79564, "epoch": 1894} {"train_loss": -6.072400093078613, "global_step": 79565, "epoch": 1894} {"train_loss": -6.042158603668213, "global_step": 79566, "epoch": 1894} {"train_loss": -6.207006454467773, "global_step": 79567, "epoch": 1894} {"train_loss": -6.077940940856934, "global_step": 79568, "epoch": 1894} {"train_loss": -5.980687141418457, "global_step": 79569, "epoch": 1894} {"train_loss": -6.171133518218994, "global_step": 79570, "epoch": 1894} {"train_loss": -6.100286960601807, "global_step": 79571, "epoch": 1894} {"train_loss": -6.124937057495117, "global_step": 79572, "epoch": 1894} {"train_loss": -6.037859916687012, "global_step": 79573, "epoch": 1894} {"train_loss": -6.23052978515625, "global_step": 79574, "epoch": 1894} {"train_loss": -6.170233726501465, "global_step": 79575, "epoch": 1894} {"train_loss": -6.285768508911133, "global_step": 79576, "epoch": 1894} {"train_loss": -6.182417392730713, "global_step": 79577, "epoch": 1894} {"train_loss": -6.225703239440918, "global_step": 79578, "epoch": 1894} {"train_loss": -6.210259437561035, "global_step": 79579, "epoch": 1894} {"train_loss": -6.187078475952148, "global_step": 79580, "epoch": 1894} {"train_loss": -6.130517959594727, "global_step": 79581, "epoch": 1894} {"train_loss": -6.189952850341797, "global_step": 79582, "epoch": 1894} {"train_loss": -6.225675582885742, "global_step": 79583, "epoch": 1894} {"train_loss": -5.997159004211426, "global_step": 79584, "epoch": 1894} {"train_loss": -6.187307357788086, "global_step": 79585, "epoch": 1894} {"train_loss": -6.016757011413574, "global_step": 79586, "epoch": 1894} {"train_loss": -6.02906608581543, "global_step": 79587, "epoch": 1894} {"train_loss": -6.083306789398193, "global_step": 79588, "epoch": 1894} {"train_loss": -6.1287262212662466, "global_step": 79589, "epoch": 1894, "val_loss": 67691.3984375} {"train_loss": -6.130413055419922, "global_step": 79590, "epoch": 1895} {"train_loss": -6.091480255126953, "global_step": 79591, "epoch": 1895} {"train_loss": -6.075255393981934, "global_step": 79592, "epoch": 1895} {"train_loss": -6.125943183898926, "global_step": 79593, "epoch": 1895} {"train_loss": -6.103728294372559, "global_step": 79594, "epoch": 1895} {"train_loss": -6.218230247497559, "global_step": 79595, "epoch": 1895} {"train_loss": -6.091376304626465, "global_step": 79596, "epoch": 1895} {"train_loss": -6.145848274230957, "global_step": 79597, "epoch": 1895} {"train_loss": -6.161983013153076, "global_step": 79598, "epoch": 1895} {"train_loss": -6.082353591918945, "global_step": 79599, "epoch": 1895} {"train_loss": -6.037445068359375, "global_step": 79600, "epoch": 1895} {"train_loss": -6.160709857940674, "global_step": 79601, "epoch": 1895} {"train_loss": -6.184979438781738, "global_step": 79602, "epoch": 1895} {"train_loss": -6.194533348083496, "global_step": 79603, "epoch": 1895} {"train_loss": -6.265851974487305, "global_step": 79604, "epoch": 1895} {"train_loss": -6.078341484069824, "global_step": 79605, "epoch": 1895} {"train_loss": -6.1542558670043945, "global_step": 79606, "epoch": 1895} {"train_loss": -6.1609344482421875, "global_step": 79607, "epoch": 1895} {"train_loss": -6.140522480010986, "global_step": 79608, "epoch": 1895} {"train_loss": -6.048047065734863, "global_step": 79609, "epoch": 1895} {"train_loss": -6.174932479858398, "global_step": 79610, "epoch": 1895} {"train_loss": -6.176599502563477, "global_step": 79611, "epoch": 1895} {"train_loss": -6.158952713012695, "global_step": 79612, "epoch": 1895} {"train_loss": -6.04674768447876, "global_step": 79613, "epoch": 1895} {"train_loss": -6.097843170166016, "global_step": 79614, "epoch": 1895} {"train_loss": -6.112178802490234, "global_step": 79615, "epoch": 1895} {"train_loss": -6.15872859954834, "global_step": 79616, "epoch": 1895} {"train_loss": -6.100899696350098, "global_step": 79617, "epoch": 1895} {"train_loss": -6.193199157714844, "global_step": 79618, "epoch": 1895} {"train_loss": -6.05947208404541, "global_step": 79619, "epoch": 1895} {"train_loss": -6.143070220947266, "global_step": 79620, "epoch": 1895} {"train_loss": -6.073435306549072, "global_step": 79621, "epoch": 1895} {"train_loss": -6.075360298156738, "global_step": 79622, "epoch": 1895} {"train_loss": -6.20170783996582, "global_step": 79623, "epoch": 1895} {"train_loss": -6.1776580810546875, "global_step": 79624, "epoch": 1895} {"train_loss": -6.14841890335083, "global_step": 79625, "epoch": 1895} {"train_loss": -6.074176788330078, "global_step": 79626, "epoch": 1895} {"train_loss": -6.108974456787109, "global_step": 79627, "epoch": 1895} {"train_loss": -5.981465816497803, "global_step": 79628, "epoch": 1895} {"train_loss": -6.071284770965576, "global_step": 79629, "epoch": 1895} {"train_loss": -6.160680770874023, "global_step": 79630, "epoch": 1895} {"train_loss": -6.124626795450847, "global_step": 79631, "epoch": 1895, "val_loss": 67599.15625} {"train_loss": -6.1402506828308105, "global_step": 79632, "epoch": 1896} {"train_loss": -6.231479644775391, "global_step": 79633, "epoch": 1896} {"train_loss": -6.015888214111328, "global_step": 79634, "epoch": 1896} {"train_loss": -6.075749397277832, "global_step": 79635, "epoch": 1896} {"train_loss": -6.133408546447754, "global_step": 79636, "epoch": 1896} {"train_loss": -6.105615615844727, "global_step": 79637, "epoch": 1896} {"train_loss": -6.1044721603393555, "global_step": 79638, "epoch": 1896} {"train_loss": -6.0541510581970215, "global_step": 79639, "epoch": 1896} {"train_loss": -6.089361190795898, "global_step": 79640, "epoch": 1896} {"train_loss": -6.156440734863281, "global_step": 79641, "epoch": 1896} {"train_loss": -6.128228187561035, "global_step": 79642, "epoch": 1896} {"train_loss": -6.167478084564209, "global_step": 79643, "epoch": 1896} {"train_loss": -6.252010345458984, "global_step": 79644, "epoch": 1896} {"train_loss": -6.153667449951172, "global_step": 79645, "epoch": 1896} {"train_loss": -6.038661003112793, "global_step": 79646, "epoch": 1896} {"train_loss": -6.111894607543945, "global_step": 79647, "epoch": 1896} {"train_loss": -6.17746639251709, "global_step": 79648, "epoch": 1896} {"train_loss": -6.0975446701049805, "global_step": 79649, "epoch": 1896} {"train_loss": -6.062138557434082, "global_step": 79650, "epoch": 1896} {"train_loss": -6.053636074066162, "global_step": 79651, "epoch": 1896} {"train_loss": -6.075335502624512, "global_step": 79652, "epoch": 1896} {"train_loss": -6.100981712341309, "global_step": 79653, "epoch": 1896} {"train_loss": -6.1434326171875, "global_step": 79654, "epoch": 1896} {"train_loss": -6.223351001739502, "global_step": 79655, "epoch": 1896} {"train_loss": -6.238821983337402, "global_step": 79656, "epoch": 1896} {"train_loss": -6.052980422973633, "global_step": 79657, "epoch": 1896} {"train_loss": -6.1801581382751465, "global_step": 79658, "epoch": 1896} {"train_loss": -6.153767108917236, "global_step": 79659, "epoch": 1896} {"train_loss": -5.783694267272949, "global_step": 79660, "epoch": 1896} {"train_loss": -6.2112579345703125, "global_step": 79661, "epoch": 1896} {"train_loss": -6.086264610290527, "global_step": 79662, "epoch": 1896} {"train_loss": -6.144705772399902, "global_step": 79663, "epoch": 1896} {"train_loss": -6.108457565307617, "global_step": 79664, "epoch": 1896} {"train_loss": -6.160799026489258, "global_step": 79665, "epoch": 1896} {"train_loss": -6.144009113311768, "global_step": 79666, "epoch": 1896} {"train_loss": -6.09614372253418, "global_step": 79667, "epoch": 1896} {"train_loss": -6.127760410308838, "global_step": 79668, "epoch": 1896} {"train_loss": -6.051998138427734, "global_step": 79669, "epoch": 1896} {"train_loss": -6.159337043762207, "global_step": 79670, "epoch": 1896} {"train_loss": -6.207777976989746, "global_step": 79671, "epoch": 1896} {"train_loss": -6.063519477844238, "global_step": 79672, "epoch": 1896} {"train_loss": -6.118107057753063, "global_step": 79673, "epoch": 1896, "val_loss": 67632.1484375} {"train_loss": -6.003855228424072, "global_step": 79674, "epoch": 1897} {"train_loss": -6.252821922302246, "global_step": 79675, "epoch": 1897} {"train_loss": -6.146945476531982, "global_step": 79676, "epoch": 1897} {"train_loss": -6.075157642364502, "global_step": 79677, "epoch": 1897} {"train_loss": -6.130470275878906, "global_step": 79678, "epoch": 1897} {"train_loss": -6.039247989654541, "global_step": 79679, "epoch": 1897} {"train_loss": -6.185466766357422, "global_step": 79680, "epoch": 1897} {"train_loss": -6.080517768859863, "global_step": 79681, "epoch": 1897} {"train_loss": -6.1681694984436035, "global_step": 79682, "epoch": 1897} {"train_loss": -6.019414901733398, "global_step": 79683, "epoch": 1897} {"train_loss": -5.948947906494141, "global_step": 79684, "epoch": 1897} {"train_loss": -6.140578269958496, "global_step": 79685, "epoch": 1897} {"train_loss": -6.151419162750244, "global_step": 79686, "epoch": 1897} {"train_loss": -6.165776252746582, "global_step": 79687, "epoch": 1897} {"train_loss": -6.226195335388184, "global_step": 79688, "epoch": 1897} {"train_loss": -6.170341491699219, "global_step": 79689, "epoch": 1897} {"train_loss": -6.172414779663086, "global_step": 79690, "epoch": 1897} {"train_loss": -6.1831159591674805, "global_step": 79691, "epoch": 1897} {"train_loss": -6.126180648803711, "global_step": 79692, "epoch": 1897} {"train_loss": -6.087283134460449, "global_step": 79693, "epoch": 1897} {"train_loss": -6.0864362716674805, "global_step": 79694, "epoch": 1897} {"train_loss": -6.193090915679932, "global_step": 79695, "epoch": 1897} {"train_loss": -6.219602584838867, "global_step": 79696, "epoch": 1897} {"train_loss": -6.079607963562012, "global_step": 79697, "epoch": 1897} {"train_loss": -6.079354286193848, "global_step": 79698, "epoch": 1897} {"train_loss": -6.159462928771973, "global_step": 79699, "epoch": 1897} {"train_loss": -6.169180393218994, "global_step": 79700, "epoch": 1897} {"train_loss": -6.1634979248046875, "global_step": 79701, "epoch": 1897} {"train_loss": -6.089416980743408, "global_step": 79702, "epoch": 1897} {"train_loss": -6.1313934326171875, "global_step": 79703, "epoch": 1897} {"train_loss": -6.1886491775512695, "global_step": 79704, "epoch": 1897} {"train_loss": -6.080279350280762, "global_step": 79705, "epoch": 1897} {"train_loss": -6.160926818847656, "global_step": 79706, "epoch": 1897} {"train_loss": -6.0600152015686035, "global_step": 79707, "epoch": 1897} {"train_loss": -6.151520729064941, "global_step": 79708, "epoch": 1897} {"train_loss": -6.004571914672852, "global_step": 79709, "epoch": 1897} {"train_loss": -6.071288585662842, "global_step": 79710, "epoch": 1897} {"train_loss": -6.037580966949463, "global_step": 79711, "epoch": 1897} {"train_loss": -6.076181888580322, "global_step": 79712, "epoch": 1897} {"train_loss": -6.119119644165039, "global_step": 79713, "epoch": 1897} {"train_loss": -6.201773643493652, "global_step": 79714, "epoch": 1897} {"train_loss": -6.119752895264399, "global_step": 79715, "epoch": 1897, "val_loss": 67638.7265625} {"train_loss": -6.0913472175598145, "global_step": 79716, "epoch": 1898} {"train_loss": -6.176722049713135, "global_step": 79717, "epoch": 1898} {"train_loss": -6.144867897033691, "global_step": 79718, "epoch": 1898} {"train_loss": -6.157273769378662, "global_step": 79719, "epoch": 1898} {"train_loss": -6.153953552246094, "global_step": 79720, "epoch": 1898} {"train_loss": -5.9889421463012695, "global_step": 79721, "epoch": 1898} {"train_loss": -6.187535762786865, "global_step": 79722, "epoch": 1898} {"train_loss": -6.119818687438965, "global_step": 79723, "epoch": 1898} {"train_loss": -6.126486778259277, "global_step": 79724, "epoch": 1898} {"train_loss": -6.154590129852295, "global_step": 79725, "epoch": 1898} {"train_loss": -6.052969932556152, "global_step": 79726, "epoch": 1898} {"train_loss": -6.014718532562256, "global_step": 79727, "epoch": 1898} {"train_loss": -6.115828037261963, "global_step": 79728, "epoch": 1898} {"train_loss": -6.040556907653809, "global_step": 79729, "epoch": 1898} {"train_loss": -6.060760021209717, "global_step": 79730, "epoch": 1898} {"train_loss": -6.11184024810791, "global_step": 79731, "epoch": 1898} {"train_loss": -6.038599491119385, "global_step": 79732, "epoch": 1898} {"train_loss": -6.119660377502441, "global_step": 79733, "epoch": 1898} {"train_loss": -6.008209228515625, "global_step": 79734, "epoch": 1898} {"train_loss": -6.157469749450684, "global_step": 79735, "epoch": 1898} {"train_loss": -6.121477127075195, "global_step": 79736, "epoch": 1898} {"train_loss": -6.1571831703186035, "global_step": 79737, "epoch": 1898} {"train_loss": -6.102227210998535, "global_step": 79738, "epoch": 1898} {"train_loss": -6.104832172393799, "global_step": 79739, "epoch": 1898} {"train_loss": -6.096035957336426, "global_step": 79740, "epoch": 1898} {"train_loss": -6.097837448120117, "global_step": 79741, "epoch": 1898} {"train_loss": -6.118226051330566, "global_step": 79742, "epoch": 1898} {"train_loss": -6.176708221435547, "global_step": 79743, "epoch": 1898} {"train_loss": -6.082115173339844, "global_step": 79744, "epoch": 1898} {"train_loss": -6.119036674499512, "global_step": 79745, "epoch": 1898} {"train_loss": -6.098400115966797, "global_step": 79746, "epoch": 1898} {"train_loss": -6.152082920074463, "global_step": 79747, "epoch": 1898} {"train_loss": -6.163280487060547, "global_step": 79748, "epoch": 1898} {"train_loss": -6.013851165771484, "global_step": 79749, "epoch": 1898} {"train_loss": -6.119907379150391, "global_step": 79750, "epoch": 1898} {"train_loss": -6.127871990203857, "global_step": 79751, "epoch": 1898} {"train_loss": -6.120184421539307, "global_step": 79752, "epoch": 1898} {"train_loss": -6.127852916717529, "global_step": 79753, "epoch": 1898} {"train_loss": -6.1432037353515625, "global_step": 79754, "epoch": 1898} {"train_loss": -5.954333782196045, "global_step": 79755, "epoch": 1898} {"train_loss": -5.980024337768555, "global_step": 79756, "epoch": 1898} {"train_loss": -6.100768463952201, "global_step": 79757, "epoch": 1898, "val_loss": 67741.9375} {"train_loss": -6.215976715087891, "global_step": 79758, "epoch": 1899} {"train_loss": -6.052290916442871, "global_step": 79759, "epoch": 1899} {"train_loss": -6.002903938293457, "global_step": 79760, "epoch": 1899} {"train_loss": -6.220137119293213, "global_step": 79761, "epoch": 1899} {"train_loss": -6.156772613525391, "global_step": 79762, "epoch": 1899} {"train_loss": -6.225560665130615, "global_step": 79763, "epoch": 1899} {"train_loss": -6.038923263549805, "global_step": 79764, "epoch": 1899} {"train_loss": -6.174178123474121, "global_step": 79765, "epoch": 1899} {"train_loss": -6.10624361038208, "global_step": 79766, "epoch": 1899} {"train_loss": -6.148550987243652, "global_step": 79767, "epoch": 1899} {"train_loss": -6.188288688659668, "global_step": 79768, "epoch": 1899} {"train_loss": -6.172430038452148, "global_step": 79769, "epoch": 1899} {"train_loss": -6.037992477416992, "global_step": 79770, "epoch": 1899} {"train_loss": -6.014901638031006, "global_step": 79771, "epoch": 1899} {"train_loss": -6.086212635040283, "global_step": 79772, "epoch": 1899} {"train_loss": -6.121767044067383, "global_step": 79773, "epoch": 1899} {"train_loss": -6.188608646392822, "global_step": 79774, "epoch": 1899} {"train_loss": -6.2368974685668945, "global_step": 79775, "epoch": 1899} {"train_loss": -6.105876922607422, "global_step": 79776, "epoch": 1899} {"train_loss": -6.181994438171387, "global_step": 79777, "epoch": 1899} {"train_loss": -6.200769424438477, "global_step": 79778, "epoch": 1899} {"train_loss": -6.103487968444824, "global_step": 79779, "epoch": 1899} {"train_loss": -6.0948944091796875, "global_step": 79780, "epoch": 1899} {"train_loss": -6.063263893127441, "global_step": 79781, "epoch": 1899} {"train_loss": -6.020916938781738, "global_step": 79782, "epoch": 1899} {"train_loss": -6.07925271987915, "global_step": 79783, "epoch": 1899} {"train_loss": -5.972411155700684, "global_step": 79784, "epoch": 1899} {"train_loss": -6.033326148986816, "global_step": 79785, "epoch": 1899} {"train_loss": -6.193229675292969, "global_step": 79786, "epoch": 1899} {"train_loss": -6.0203938484191895, "global_step": 79787, "epoch": 1899} {"train_loss": -6.152400970458984, "global_step": 79788, "epoch": 1899} {"train_loss": -6.180384159088135, "global_step": 79789, "epoch": 1899} {"train_loss": -6.157034873962402, "global_step": 79790, "epoch": 1899} {"train_loss": -6.108876705169678, "global_step": 79791, "epoch": 1899} {"train_loss": -6.120757102966309, "global_step": 79792, "epoch": 1899} {"train_loss": -6.13899564743042, "global_step": 79793, "epoch": 1899} {"train_loss": -6.141563415527344, "global_step": 79794, "epoch": 1899} {"train_loss": -6.039693832397461, "global_step": 79795, "epoch": 1899} {"train_loss": -6.002025604248047, "global_step": 79796, "epoch": 1899} {"train_loss": -6.131235599517822, "global_step": 79797, "epoch": 1899} {"train_loss": -6.10195779800415, "global_step": 79798, "epoch": 1899} {"train_loss": -6.116511583328247, "global_step": 79799, "epoch": 1899, "val_loss": 67481.625} {"train_loss": -6.212446212768555, "global_step": 79800, "epoch": 1900} {"train_loss": -6.158096790313721, "global_step": 79801, "epoch": 1900} {"train_loss": -6.213018417358398, "global_step": 79802, "epoch": 1900} {"train_loss": -6.077858924865723, "global_step": 79803, "epoch": 1900} {"train_loss": -6.142982482910156, "global_step": 79804, "epoch": 1900} {"train_loss": -6.105317115783691, "global_step": 79805, "epoch": 1900} {"train_loss": -5.999966621398926, "global_step": 79806, "epoch": 1900} {"train_loss": -6.152425765991211, "global_step": 79807, "epoch": 1900} {"train_loss": -6.099993705749512, "global_step": 79808, "epoch": 1900} {"train_loss": -6.095761299133301, "global_step": 79809, "epoch": 1900} {"train_loss": -6.185057640075684, "global_step": 79810, "epoch": 1900} {"train_loss": -6.12774658203125, "global_step": 79811, "epoch": 1900} {"train_loss": -6.042397975921631, "global_step": 79812, "epoch": 1900} {"train_loss": -6.064054489135742, "global_step": 79813, "epoch": 1900} {"train_loss": -6.159283638000488, "global_step": 79814, "epoch": 1900} {"train_loss": -6.238064765930176, "global_step": 79815, "epoch": 1900} {"train_loss": -6.03422737121582, "global_step": 79816, "epoch": 1900} {"train_loss": -6.220022678375244, "global_step": 79817, "epoch": 1900} {"train_loss": -5.996709823608398, "global_step": 79818, "epoch": 1900} {"train_loss": -6.092806816101074, "global_step": 79819, "epoch": 1900} {"train_loss": -6.100964546203613, "global_step": 79820, "epoch": 1900} {"train_loss": -6.027615547180176, "global_step": 79821, "epoch": 1900} {"train_loss": -6.079254150390625, "global_step": 79822, "epoch": 1900} {"train_loss": -6.1166863441467285, "global_step": 79823, "epoch": 1900} {"train_loss": -5.943841934204102, "global_step": 79824, "epoch": 1900} {"train_loss": -6.085891246795654, "global_step": 79825, "epoch": 1900} {"train_loss": -6.153951644897461, "global_step": 79826, "epoch": 1900} {"train_loss": -6.0272111892700195, "global_step": 79827, "epoch": 1900} {"train_loss": -6.087216854095459, "global_step": 79828, "epoch": 1900} {"train_loss": -6.078960418701172, "global_step": 79829, "epoch": 1900} {"train_loss": -6.093573570251465, "global_step": 79830, "epoch": 1900} {"train_loss": -6.08030891418457, "global_step": 79831, "epoch": 1900} {"train_loss": -6.169741630554199, "global_step": 79832, "epoch": 1900} {"train_loss": -6.033478736877441, "global_step": 79833, "epoch": 1900} {"train_loss": -6.127460479736328, "global_step": 79834, "epoch": 1900} {"train_loss": -6.191386699676514, "global_step": 79835, "epoch": 1900} {"train_loss": -6.053497314453125, "global_step": 79836, "epoch": 1900} {"train_loss": -6.174650192260742, "global_step": 79837, "epoch": 1900} {"train_loss": -5.98746395111084, "global_step": 79838, "epoch": 1900} {"train_loss": -6.0853400230407715, "global_step": 79839, "epoch": 1900} {"train_loss": -6.137880325317383, "global_step": 79840, "epoch": 1900} {"train_loss": -6.104535375322614, "global_step": 79841, "epoch": 1900, "train/sim_max_reward_0": 0.2217380310601885, "train/sim_max_reward_1": 0.43026203956757836, "train/sim_max_reward_2": 0.7748393063605059, "train/sim_max_reward_3": 0.15489548816656531, "train/sim_max_reward_4": 0.8924280346035717, "train/sim_max_reward_5": 0.21031164835182323, "test/sim_max_reward_4400000": 0.16168160849126897, "test/sim_max_reward_4400001": 0.9515049993882793, "test/sim_max_reward_4400002": 0.5288730350765359, "test/sim_max_reward_4400003": 0.8162059345783081, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.2292986909389869, "test/sim_max_reward_4400006": 0.4214805464757469, "test/sim_max_reward_4400007": 0.9226033361654817, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9228220552442935, "test/sim_max_reward_4400010": 0.16906944226902107, "test/sim_max_reward_4400011": 0.202376751782926, "test/sim_max_reward_4400012": 0.8449346721438118, "test/sim_max_reward_4400013": 0.24697872086315445, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.7200057627023103, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.5425558622432084, "test/sim_max_reward_4400022": 0.26313870622076335, "test/sim_max_reward_4400023": 0.42361226457339224, "test/sim_max_reward_4400024": 0.7548342718504991, "test/sim_max_reward_4400025": 0.27714383477663596, "test/sim_max_reward_4400026": 0.8888009305386387, "test/sim_max_reward_4400027": 0.0342270036747673, "test/sim_max_reward_4400028": 0.8682359960107053, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9676677017688582, "test/sim_max_reward_4400031": 0.9429629710105337, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9530857340057157, "test/sim_max_reward_4400034": 0.7453642390356977, "test/sim_max_reward_4400035": 0.917480019233317, "test/sim_max_reward_4400036": 0.37140335021613874, "test/sim_max_reward_4400037": 0.9588035477562816, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.863300709072458, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6612802832219322, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.9461973493202759, "test/sim_max_reward_4400044": 0.10059424033828882, "test/sim_max_reward_4400045": 0.8090652907797625, "test/sim_max_reward_4400046": 0.3760735546862703, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.7630464604919607, "train/mean_score": 0.44741242468503883, "test/mean_score": 0.4845289043207516, "val_loss": 67721.578125} {"train_loss": -6.152078628540039, "global_step": 79842, "epoch": 1901} {"train_loss": -6.1829376220703125, "global_step": 79843, "epoch": 1901} {"train_loss": -5.980962753295898, "global_step": 79844, "epoch": 1901} {"train_loss": -6.089694023132324, "global_step": 79845, "epoch": 1901} {"train_loss": -6.032593727111816, "global_step": 79846, "epoch": 1901} {"train_loss": -6.315301895141602, "global_step": 79847, "epoch": 1901} {"train_loss": -6.153191566467285, "global_step": 79848, "epoch": 1901} {"train_loss": -6.040168762207031, "global_step": 79849, "epoch": 1901} {"train_loss": -6.186563491821289, "global_step": 79850, "epoch": 1901} {"train_loss": -6.2267913818359375, "global_step": 79851, "epoch": 1901} {"train_loss": -6.145544528961182, "global_step": 79852, "epoch": 1901} {"train_loss": -6.099028587341309, "global_step": 79853, "epoch": 1901} {"train_loss": -6.094539642333984, "global_step": 79854, "epoch": 1901} {"train_loss": -6.11040735244751, "global_step": 79855, "epoch": 1901} {"train_loss": -6.115014553070068, "global_step": 79856, "epoch": 1901} {"train_loss": -6.067362308502197, "global_step": 79857, "epoch": 1901} {"train_loss": -5.981080055236816, "global_step": 79858, "epoch": 1901} {"train_loss": -6.074678897857666, "global_step": 79859, "epoch": 1901} {"train_loss": -5.976382732391357, "global_step": 79860, "epoch": 1901} {"train_loss": -6.090624809265137, "global_step": 79861, "epoch": 1901} {"train_loss": -6.176787376403809, "global_step": 79862, "epoch": 1901} {"train_loss": -6.198051929473877, "global_step": 79863, "epoch": 1901} {"train_loss": -6.000624179840088, "global_step": 79864, "epoch": 1901} {"train_loss": -6.1385650634765625, "global_step": 79865, "epoch": 1901} {"train_loss": -6.203281879425049, "global_step": 79866, "epoch": 1901} {"train_loss": -6.0836286544799805, "global_step": 79867, "epoch": 1901} {"train_loss": -6.077088356018066, "global_step": 79868, "epoch": 1901} {"train_loss": -6.139512538909912, "global_step": 79869, "epoch": 1901} {"train_loss": -6.205882549285889, "global_step": 79870, "epoch": 1901} {"train_loss": -6.135377883911133, "global_step": 79871, "epoch": 1901} {"train_loss": -6.195168972015381, "global_step": 79872, "epoch": 1901} {"train_loss": -6.158193588256836, "global_step": 79873, "epoch": 1901} {"train_loss": -6.156517028808594, "global_step": 79874, "epoch": 1901} {"train_loss": -6.170896530151367, "global_step": 79875, "epoch": 1901} {"train_loss": -6.071063995361328, "global_step": 79876, "epoch": 1901} {"train_loss": -6.121152877807617, "global_step": 79877, "epoch": 1901} {"train_loss": -6.112765312194824, "global_step": 79878, "epoch": 1901} {"train_loss": -6.085175514221191, "global_step": 79879, "epoch": 1901} {"train_loss": -6.090143203735352, "global_step": 79880, "epoch": 1901} {"train_loss": -6.190128326416016, "global_step": 79881, "epoch": 1901} {"train_loss": -6.07880973815918, "global_step": 79882, "epoch": 1901} {"train_loss": -6.119739963894799, "global_step": 79883, "epoch": 1901, "val_loss": 67306.0546875} {"train_loss": -6.137375831604004, "global_step": 79884, "epoch": 1902} {"train_loss": -6.152963638305664, "global_step": 79885, "epoch": 1902} {"train_loss": -6.252674579620361, "global_step": 79886, "epoch": 1902} {"train_loss": -6.137611389160156, "global_step": 79887, "epoch": 1902} {"train_loss": -6.239030838012695, "global_step": 79888, "epoch": 1902} {"train_loss": -6.260268211364746, "global_step": 79889, "epoch": 1902} {"train_loss": -6.248366832733154, "global_step": 79890, "epoch": 1902} {"train_loss": -6.070021629333496, "global_step": 79891, "epoch": 1902} {"train_loss": -6.198306083679199, "global_step": 79892, "epoch": 1902} {"train_loss": -6.089353561401367, "global_step": 79893, "epoch": 1902} {"train_loss": -6.18922758102417, "global_step": 79894, "epoch": 1902} {"train_loss": -6.06615686416626, "global_step": 79895, "epoch": 1902} {"train_loss": -6.18841552734375, "global_step": 79896, "epoch": 1902} {"train_loss": -6.110786437988281, "global_step": 79897, "epoch": 1902} {"train_loss": -6.106926918029785, "global_step": 79898, "epoch": 1902} {"train_loss": -6.090022563934326, "global_step": 79899, "epoch": 1902} {"train_loss": -6.100935935974121, "global_step": 79900, "epoch": 1902} {"train_loss": -6.066729545593262, "global_step": 79901, "epoch": 1902} {"train_loss": -5.965452671051025, "global_step": 79902, "epoch": 1902} {"train_loss": -6.177342414855957, "global_step": 79903, "epoch": 1902} {"train_loss": -5.995796203613281, "global_step": 79904, "epoch": 1902} {"train_loss": -5.88993501663208, "global_step": 79905, "epoch": 1902} {"train_loss": -5.917508602142334, "global_step": 79906, "epoch": 1902} {"train_loss": -6.0103864669799805, "global_step": 79907, "epoch": 1902} {"train_loss": -6.1674346923828125, "global_step": 79908, "epoch": 1902} {"train_loss": -6.0522685050964355, "global_step": 79909, "epoch": 1902} {"train_loss": -6.1351518630981445, "global_step": 79910, "epoch": 1902} {"train_loss": -6.120510101318359, "global_step": 79911, "epoch": 1902} {"train_loss": -5.991595268249512, "global_step": 79912, "epoch": 1902} {"train_loss": -6.007705211639404, "global_step": 79913, "epoch": 1902} {"train_loss": -6.121775150299072, "global_step": 79914, "epoch": 1902} {"train_loss": -6.132307052612305, "global_step": 79915, "epoch": 1902} {"train_loss": -6.017122268676758, "global_step": 79916, "epoch": 1902} {"train_loss": -6.031590938568115, "global_step": 79917, "epoch": 1902} {"train_loss": -6.139806747436523, "global_step": 79918, "epoch": 1902} {"train_loss": -6.180952548980713, "global_step": 79919, "epoch": 1902} {"train_loss": -6.134853363037109, "global_step": 79920, "epoch": 1902} {"train_loss": -6.026919364929199, "global_step": 79921, "epoch": 1902} {"train_loss": -6.052138328552246, "global_step": 79922, "epoch": 1902} {"train_loss": -5.986938953399658, "global_step": 79923, "epoch": 1902} {"train_loss": -6.21616792678833, "global_step": 79924, "epoch": 1902} {"train_loss": -6.104358264378139, "global_step": 79925, "epoch": 1902, "val_loss": 67632.4140625} {"train_loss": -6.108309745788574, "global_step": 79926, "epoch": 1903} {"train_loss": -6.036730766296387, "global_step": 79927, "epoch": 1903} {"train_loss": -6.002796173095703, "global_step": 79928, "epoch": 1903} {"train_loss": -6.1526994705200195, "global_step": 79929, "epoch": 1903} {"train_loss": -6.129947662353516, "global_step": 79930, "epoch": 1903} {"train_loss": -6.072724342346191, "global_step": 79931, "epoch": 1903} {"train_loss": -6.103499412536621, "global_step": 79932, "epoch": 1903} {"train_loss": -6.054185390472412, "global_step": 79933, "epoch": 1903} {"train_loss": -6.069805145263672, "global_step": 79934, "epoch": 1903} {"train_loss": -6.168133735656738, "global_step": 79935, "epoch": 1903} {"train_loss": -6.157863616943359, "global_step": 79936, "epoch": 1903} {"train_loss": -6.024874687194824, "global_step": 79937, "epoch": 1903} {"train_loss": -6.196917533874512, "global_step": 79938, "epoch": 1903} {"train_loss": -6.199836730957031, "global_step": 79939, "epoch": 1903} {"train_loss": -6.153792381286621, "global_step": 79940, "epoch": 1903} {"train_loss": -6.109153747558594, "global_step": 79941, "epoch": 1903} {"train_loss": -6.245500564575195, "global_step": 79942, "epoch": 1903} {"train_loss": -6.190961837768555, "global_step": 79943, "epoch": 1903} {"train_loss": -6.1662750244140625, "global_step": 79944, "epoch": 1903} {"train_loss": -6.122735977172852, "global_step": 79945, "epoch": 1903} {"train_loss": -6.239507675170898, "global_step": 79946, "epoch": 1903} {"train_loss": -6.211651802062988, "global_step": 79947, "epoch": 1903} {"train_loss": -6.181398391723633, "global_step": 79948, "epoch": 1903} {"train_loss": -6.298465728759766, "global_step": 79949, "epoch": 1903} {"train_loss": -6.158033847808838, "global_step": 79950, "epoch": 1903} {"train_loss": -6.085467338562012, "global_step": 79951, "epoch": 1903} {"train_loss": -6.247467517852783, "global_step": 79952, "epoch": 1903} {"train_loss": -6.167190074920654, "global_step": 79953, "epoch": 1903} {"train_loss": -6.041025638580322, "global_step": 79954, "epoch": 1903} {"train_loss": -6.1546220779418945, "global_step": 79955, "epoch": 1903} {"train_loss": -6.09202766418457, "global_step": 79956, "epoch": 1903} {"train_loss": -6.092307090759277, "global_step": 79957, "epoch": 1903} {"train_loss": -6.106616973876953, "global_step": 79958, "epoch": 1903} {"train_loss": -6.102336406707764, "global_step": 79959, "epoch": 1903} {"train_loss": -6.174019813537598, "global_step": 79960, "epoch": 1903} {"train_loss": -6.086366176605225, "global_step": 79961, "epoch": 1903} {"train_loss": -6.116127967834473, "global_step": 79962, "epoch": 1903} {"train_loss": -6.0573039054870605, "global_step": 79963, "epoch": 1903} {"train_loss": -6.234123229980469, "global_step": 79964, "epoch": 1903} {"train_loss": -5.984021186828613, "global_step": 79965, "epoch": 1903} {"train_loss": -6.019374370574951, "global_step": 79966, "epoch": 1903} {"train_loss": -6.127628689720517, "global_step": 79967, "epoch": 1903, "val_loss": 67689.59375} {"train_loss": -5.983320236206055, "global_step": 79968, "epoch": 1904} {"train_loss": -6.002168655395508, "global_step": 79969, "epoch": 1904} {"train_loss": -6.040887355804443, "global_step": 79970, "epoch": 1904} {"train_loss": -5.958427429199219, "global_step": 79971, "epoch": 1904} {"train_loss": -6.020688056945801, "global_step": 79972, "epoch": 1904} {"train_loss": -6.038841724395752, "global_step": 79973, "epoch": 1904} {"train_loss": -5.929569721221924, "global_step": 79974, "epoch": 1904} {"train_loss": -5.948990345001221, "global_step": 79975, "epoch": 1904} {"train_loss": -6.007615089416504, "global_step": 79976, "epoch": 1904} {"train_loss": -6.107472896575928, "global_step": 79977, "epoch": 1904} {"train_loss": -6.039499282836914, "global_step": 79978, "epoch": 1904} {"train_loss": -6.066230297088623, "global_step": 79979, "epoch": 1904} {"train_loss": -6.0713701248168945, "global_step": 79980, "epoch": 1904} {"train_loss": -6.07572078704834, "global_step": 79981, "epoch": 1904} {"train_loss": -6.045489311218262, "global_step": 79982, "epoch": 1904} {"train_loss": -5.983970642089844, "global_step": 79983, "epoch": 1904} {"train_loss": -6.149070739746094, "global_step": 79984, "epoch": 1904} {"train_loss": -6.11136531829834, "global_step": 79985, "epoch": 1904} {"train_loss": -6.142699241638184, "global_step": 79986, "epoch": 1904} {"train_loss": -6.0736870765686035, "global_step": 79987, "epoch": 1904} {"train_loss": -6.137221813201904, "global_step": 79988, "epoch": 1904} {"train_loss": -6.0260467529296875, "global_step": 79989, "epoch": 1904} {"train_loss": -6.018353462219238, "global_step": 79990, "epoch": 1904} {"train_loss": -6.107202053070068, "global_step": 79991, "epoch": 1904} {"train_loss": -6.1383771896362305, "global_step": 79992, "epoch": 1904} {"train_loss": -6.253366947174072, "global_step": 79993, "epoch": 1904} {"train_loss": -6.0539445877075195, "global_step": 79994, "epoch": 1904} {"train_loss": -6.172898292541504, "global_step": 79995, "epoch": 1904} {"train_loss": -6.218964099884033, "global_step": 79996, "epoch": 1904} {"train_loss": -6.191915512084961, "global_step": 79997, "epoch": 1904} {"train_loss": -6.230413436889648, "global_step": 79998, "epoch": 1904} {"train_loss": -6.198921203613281, "global_step": 79999, "epoch": 1904} {"train_loss": -6.074985504150391, "global_step": 80000, "epoch": 1904} {"train_loss": -6.112064361572266, "global_step": 80001, "epoch": 1904} {"train_loss": -6.117780685424805, "global_step": 80002, "epoch": 1904} {"train_loss": -6.154473304748535, "global_step": 80003, "epoch": 1904} {"train_loss": -6.210573196411133, "global_step": 80004, "epoch": 1904} {"train_loss": -6.21556282043457, "global_step": 80005, "epoch": 1904} {"train_loss": -6.187404155731201, "global_step": 80006, "epoch": 1904} {"train_loss": -6.2520012855529785, "global_step": 80007, "epoch": 1904} {"train_loss": -6.15970516204834, "global_step": 80008, "epoch": 1904} {"train_loss": -6.099261329287574, "global_step": 80009, "epoch": 1904, "val_loss": 67562.796875} {"train_loss": -6.147326469421387, "global_step": 80010, "epoch": 1905} {"train_loss": -6.174562931060791, "global_step": 80011, "epoch": 1905} {"train_loss": -6.070939064025879, "global_step": 80012, "epoch": 1905} {"train_loss": -6.058218955993652, "global_step": 80013, "epoch": 1905} {"train_loss": -6.211231708526611, "global_step": 80014, "epoch": 1905} {"train_loss": -6.262146472930908, "global_step": 80015, "epoch": 1905} {"train_loss": -6.200898170471191, "global_step": 80016, "epoch": 1905} {"train_loss": -6.121818542480469, "global_step": 80017, "epoch": 1905} {"train_loss": -6.0924296379089355, "global_step": 80018, "epoch": 1905} {"train_loss": -6.055234909057617, "global_step": 80019, "epoch": 1905} {"train_loss": -6.210628509521484, "global_step": 80020, "epoch": 1905} {"train_loss": -6.0715861320495605, "global_step": 80021, "epoch": 1905} {"train_loss": -6.183539390563965, "global_step": 80022, "epoch": 1905} {"train_loss": -6.1037116050720215, "global_step": 80023, "epoch": 1905} {"train_loss": -6.204066753387451, "global_step": 80024, "epoch": 1905} {"train_loss": -6.200682640075684, "global_step": 80025, "epoch": 1905} {"train_loss": -6.095787048339844, "global_step": 80026, "epoch": 1905} {"train_loss": -6.17288875579834, "global_step": 80027, "epoch": 1905} {"train_loss": -6.074422836303711, "global_step": 80028, "epoch": 1905} {"train_loss": -6.186915397644043, "global_step": 80029, "epoch": 1905} {"train_loss": -6.154317855834961, "global_step": 80030, "epoch": 1905} {"train_loss": -6.222528457641602, "global_step": 80031, "epoch": 1905} {"train_loss": -6.301970481872559, "global_step": 80032, "epoch": 1905} {"train_loss": -6.115861892700195, "global_step": 80033, "epoch": 1905} {"train_loss": -6.142454147338867, "global_step": 80034, "epoch": 1905} {"train_loss": -6.102190971374512, "global_step": 80035, "epoch": 1905} {"train_loss": -6.233043670654297, "global_step": 80036, "epoch": 1905} {"train_loss": -6.1228413581848145, "global_step": 80037, "epoch": 1905} {"train_loss": -6.093482971191406, "global_step": 80038, "epoch": 1905} {"train_loss": -6.196714878082275, "global_step": 80039, "epoch": 1905} {"train_loss": -6.137487411499023, "global_step": 80040, "epoch": 1905} {"train_loss": -6.125390529632568, "global_step": 80041, "epoch": 1905} {"train_loss": -6.117380142211914, "global_step": 80042, "epoch": 1905} {"train_loss": -6.221591472625732, "global_step": 80043, "epoch": 1905} {"train_loss": -6.091208457946777, "global_step": 80044, "epoch": 1905} {"train_loss": -6.234125137329102, "global_step": 80045, "epoch": 1905} {"train_loss": -6.165064334869385, "global_step": 80046, "epoch": 1905} {"train_loss": -6.1328935623168945, "global_step": 80047, "epoch": 1905} {"train_loss": -6.166943550109863, "global_step": 80048, "epoch": 1905} {"train_loss": -6.174901962280273, "global_step": 80049, "epoch": 1905} {"train_loss": -6.079831123352051, "global_step": 80050, "epoch": 1905} {"train_loss": -6.151081766401019, "global_step": 80051, "epoch": 1905, "val_loss": 67812.8125} {"train_loss": -6.0991387367248535, "global_step": 80052, "epoch": 1906} {"train_loss": -6.249650478363037, "global_step": 80053, "epoch": 1906} {"train_loss": -6.2312469482421875, "global_step": 80054, "epoch": 1906} {"train_loss": -6.015880584716797, "global_step": 80055, "epoch": 1906} {"train_loss": -6.025861740112305, "global_step": 80056, "epoch": 1906} {"train_loss": -6.132477760314941, "global_step": 80057, "epoch": 1906} {"train_loss": -6.109060764312744, "global_step": 80058, "epoch": 1906} {"train_loss": -6.0825347900390625, "global_step": 80059, "epoch": 1906} {"train_loss": -6.112936496734619, "global_step": 80060, "epoch": 1906} {"train_loss": -6.039732933044434, "global_step": 80061, "epoch": 1906} {"train_loss": -6.087998867034912, "global_step": 80062, "epoch": 1906} {"train_loss": -6.135019302368164, "global_step": 80063, "epoch": 1906} {"train_loss": -6.125432968139648, "global_step": 80064, "epoch": 1906} {"train_loss": -6.214080810546875, "global_step": 80065, "epoch": 1906} {"train_loss": -6.145706653594971, "global_step": 80066, "epoch": 1906} {"train_loss": -6.090050220489502, "global_step": 80067, "epoch": 1906} {"train_loss": -6.044552803039551, "global_step": 80068, "epoch": 1906} {"train_loss": -6.184900283813477, "global_step": 80069, "epoch": 1906} {"train_loss": -6.043750286102295, "global_step": 80070, "epoch": 1906} {"train_loss": -6.09575080871582, "global_step": 80071, "epoch": 1906} {"train_loss": -6.05703592300415, "global_step": 80072, "epoch": 1906} {"train_loss": -6.041219711303711, "global_step": 80073, "epoch": 1906} {"train_loss": -6.095006942749023, "global_step": 80074, "epoch": 1906} {"train_loss": -6.164457321166992, "global_step": 80075, "epoch": 1906} {"train_loss": -6.151133060455322, "global_step": 80076, "epoch": 1906} {"train_loss": -6.142589092254639, "global_step": 80077, "epoch": 1906} {"train_loss": -6.174897193908691, "global_step": 80078, "epoch": 1906} {"train_loss": -6.0796403884887695, "global_step": 80079, "epoch": 1906} {"train_loss": -6.067675590515137, "global_step": 80080, "epoch": 1906} {"train_loss": -6.182072639465332, "global_step": 80081, "epoch": 1906} {"train_loss": -6.101162433624268, "global_step": 80082, "epoch": 1906} {"train_loss": -6.151269912719727, "global_step": 80083, "epoch": 1906} {"train_loss": -6.167364120483398, "global_step": 80084, "epoch": 1906} {"train_loss": -6.240144729614258, "global_step": 80085, "epoch": 1906} {"train_loss": -6.155134201049805, "global_step": 80086, "epoch": 1906} {"train_loss": -6.1937031745910645, "global_step": 80087, "epoch": 1906} {"train_loss": -6.212242603302002, "global_step": 80088, "epoch": 1906} {"train_loss": -6.185385704040527, "global_step": 80089, "epoch": 1906} {"train_loss": -6.219642639160156, "global_step": 80090, "epoch": 1906} {"train_loss": -6.11583137512207, "global_step": 80091, "epoch": 1906} {"train_loss": -6.130702018737793, "global_step": 80092, "epoch": 1906} {"train_loss": -6.1275459811801, "global_step": 80093, "epoch": 1906, "val_loss": 67838.8046875} {"train_loss": -6.141878128051758, "global_step": 80094, "epoch": 1907} {"train_loss": -6.199010372161865, "global_step": 80095, "epoch": 1907} {"train_loss": -6.070751667022705, "global_step": 80096, "epoch": 1907} {"train_loss": -6.207178592681885, "global_step": 80097, "epoch": 1907} {"train_loss": -6.164791584014893, "global_step": 80098, "epoch": 1907} {"train_loss": -6.125951290130615, "global_step": 80099, "epoch": 1907} {"train_loss": -6.049016952514648, "global_step": 80100, "epoch": 1907} {"train_loss": -6.103653907775879, "global_step": 80101, "epoch": 1907} {"train_loss": -6.157783031463623, "global_step": 80102, "epoch": 1907} {"train_loss": -6.061570644378662, "global_step": 80103, "epoch": 1907} {"train_loss": -6.160922050476074, "global_step": 80104, "epoch": 1907} {"train_loss": -6.1947197914123535, "global_step": 80105, "epoch": 1907} {"train_loss": -6.130870819091797, "global_step": 80106, "epoch": 1907} {"train_loss": -6.241875171661377, "global_step": 80107, "epoch": 1907} {"train_loss": -6.0847015380859375, "global_step": 80108, "epoch": 1907} {"train_loss": -6.178287506103516, "global_step": 80109, "epoch": 1907} {"train_loss": -6.0808820724487305, "global_step": 80110, "epoch": 1907} {"train_loss": -6.090864181518555, "global_step": 80111, "epoch": 1907} {"train_loss": -6.092035293579102, "global_step": 80112, "epoch": 1907} {"train_loss": -6.129828453063965, "global_step": 80113, "epoch": 1907} {"train_loss": -6.241955757141113, "global_step": 80114, "epoch": 1907} {"train_loss": -6.132025241851807, "global_step": 80115, "epoch": 1907} {"train_loss": -6.179535865783691, "global_step": 80116, "epoch": 1907} {"train_loss": -6.081358909606934, "global_step": 80117, "epoch": 1907} {"train_loss": -6.16754150390625, "global_step": 80118, "epoch": 1907} {"train_loss": -6.16118049621582, "global_step": 80119, "epoch": 1907} {"train_loss": -6.1685261726379395, "global_step": 80120, "epoch": 1907} {"train_loss": -6.200826168060303, "global_step": 80121, "epoch": 1907} {"train_loss": -6.165765762329102, "global_step": 80122, "epoch": 1907} {"train_loss": -6.116642951965332, "global_step": 80123, "epoch": 1907} {"train_loss": -6.0968427658081055, "global_step": 80124, "epoch": 1907} {"train_loss": -6.171863555908203, "global_step": 80125, "epoch": 1907} {"train_loss": -6.081538200378418, "global_step": 80126, "epoch": 1907} {"train_loss": -6.014698028564453, "global_step": 80127, "epoch": 1907} {"train_loss": -6.0798726081848145, "global_step": 80128, "epoch": 1907} {"train_loss": -6.019989013671875, "global_step": 80129, "epoch": 1907} {"train_loss": -6.107056617736816, "global_step": 80130, "epoch": 1907} {"train_loss": -6.1099114418029785, "global_step": 80131, "epoch": 1907} {"train_loss": -6.087827682495117, "global_step": 80132, "epoch": 1907} {"train_loss": -6.128304481506348, "global_step": 80133, "epoch": 1907} {"train_loss": -6.108017921447754, "global_step": 80134, "epoch": 1907} {"train_loss": -6.12699049995059, "global_step": 80135, "epoch": 1907, "val_loss": 67797.9140625} {"train_loss": -6.154829025268555, "global_step": 80136, "epoch": 1908} {"train_loss": -6.145377159118652, "global_step": 80137, "epoch": 1908} {"train_loss": -5.9721879959106445, "global_step": 80138, "epoch": 1908} {"train_loss": -6.225644111633301, "global_step": 80139, "epoch": 1908} {"train_loss": -6.095294952392578, "global_step": 80140, "epoch": 1908} {"train_loss": -6.236462116241455, "global_step": 80141, "epoch": 1908} {"train_loss": -5.965434551239014, "global_step": 80142, "epoch": 1908} {"train_loss": -6.115495681762695, "global_step": 80143, "epoch": 1908} {"train_loss": -6.088443279266357, "global_step": 80144, "epoch": 1908} {"train_loss": -6.224300384521484, "global_step": 80145, "epoch": 1908} {"train_loss": -6.079771518707275, "global_step": 80146, "epoch": 1908} {"train_loss": -6.053389549255371, "global_step": 80147, "epoch": 1908} {"train_loss": -6.121557235717773, "global_step": 80148, "epoch": 1908} {"train_loss": -6.138795852661133, "global_step": 80149, "epoch": 1908} {"train_loss": -6.120242118835449, "global_step": 80150, "epoch": 1908} {"train_loss": -6.110940933227539, "global_step": 80151, "epoch": 1908} {"train_loss": -6.127616882324219, "global_step": 80152, "epoch": 1908} {"train_loss": -6.1438751220703125, "global_step": 80153, "epoch": 1908} {"train_loss": -6.18885612487793, "global_step": 80154, "epoch": 1908} {"train_loss": -6.155749320983887, "global_step": 80155, "epoch": 1908} {"train_loss": -6.12065315246582, "global_step": 80156, "epoch": 1908} {"train_loss": -6.195869445800781, "global_step": 80157, "epoch": 1908} {"train_loss": -5.984376907348633, "global_step": 80158, "epoch": 1908} {"train_loss": -6.066230297088623, "global_step": 80159, "epoch": 1908} {"train_loss": -5.9821600914001465, "global_step": 80160, "epoch": 1908} {"train_loss": -6.084054946899414, "global_step": 80161, "epoch": 1908} {"train_loss": -6.099663734436035, "global_step": 80162, "epoch": 1908} {"train_loss": -6.186676502227783, "global_step": 80163, "epoch": 1908} {"train_loss": -6.1188201904296875, "global_step": 80164, "epoch": 1908} {"train_loss": -6.019304275512695, "global_step": 80165, "epoch": 1908} {"train_loss": -6.090574741363525, "global_step": 80166, "epoch": 1908} {"train_loss": -6.119798183441162, "global_step": 80167, "epoch": 1908} {"train_loss": -6.063003063201904, "global_step": 80168, "epoch": 1908} {"train_loss": -6.165066719055176, "global_step": 80169, "epoch": 1908} {"train_loss": -6.015674114227295, "global_step": 80170, "epoch": 1908} {"train_loss": -6.038264274597168, "global_step": 80171, "epoch": 1908} {"train_loss": -6.164019584655762, "global_step": 80172, "epoch": 1908} {"train_loss": -6.093368053436279, "global_step": 80173, "epoch": 1908} {"train_loss": -6.036792755126953, "global_step": 80174, "epoch": 1908} {"train_loss": -6.217344284057617, "global_step": 80175, "epoch": 1908} {"train_loss": -6.152600288391113, "global_step": 80176, "epoch": 1908} {"train_loss": -6.111076320920672, "global_step": 80177, "epoch": 1908, "val_loss": 67766.015625} {"train_loss": -6.108309745788574, "global_step": 80178, "epoch": 1909} {"train_loss": -6.1037373542785645, "global_step": 80179, "epoch": 1909} {"train_loss": -6.087779998779297, "global_step": 80180, "epoch": 1909} {"train_loss": -6.075338363647461, "global_step": 80181, "epoch": 1909} {"train_loss": -6.152886390686035, "global_step": 80182, "epoch": 1909} {"train_loss": -6.17603874206543, "global_step": 80183, "epoch": 1909} {"train_loss": -6.1441121101379395, "global_step": 80184, "epoch": 1909} {"train_loss": -6.094226837158203, "global_step": 80185, "epoch": 1909} {"train_loss": -6.214734077453613, "global_step": 80186, "epoch": 1909} {"train_loss": -6.116480350494385, "global_step": 80187, "epoch": 1909} {"train_loss": -6.09572696685791, "global_step": 80188, "epoch": 1909} {"train_loss": -6.065786838531494, "global_step": 80189, "epoch": 1909} {"train_loss": -6.074925899505615, "global_step": 80190, "epoch": 1909} {"train_loss": -6.142692565917969, "global_step": 80191, "epoch": 1909} {"train_loss": -6.102573871612549, "global_step": 80192, "epoch": 1909} {"train_loss": -6.195030212402344, "global_step": 80193, "epoch": 1909} {"train_loss": -6.028680801391602, "global_step": 80194, "epoch": 1909} {"train_loss": -6.059413909912109, "global_step": 80195, "epoch": 1909} {"train_loss": -6.145902633666992, "global_step": 80196, "epoch": 1909} {"train_loss": -6.175970554351807, "global_step": 80197, "epoch": 1909} {"train_loss": -6.101681709289551, "global_step": 80198, "epoch": 1909} {"train_loss": -6.157702445983887, "global_step": 80199, "epoch": 1909} {"train_loss": -6.049914360046387, "global_step": 80200, "epoch": 1909} {"train_loss": -6.026515007019043, "global_step": 80201, "epoch": 1909} {"train_loss": -6.106304168701172, "global_step": 80202, "epoch": 1909} {"train_loss": -6.111631393432617, "global_step": 80203, "epoch": 1909} {"train_loss": -6.033689022064209, "global_step": 80204, "epoch": 1909} {"train_loss": -6.203896999359131, "global_step": 80205, "epoch": 1909} {"train_loss": -6.1857147216796875, "global_step": 80206, "epoch": 1909} {"train_loss": -6.076408386230469, "global_step": 80207, "epoch": 1909} {"train_loss": -6.2098212242126465, "global_step": 80208, "epoch": 1909} {"train_loss": -6.223933219909668, "global_step": 80209, "epoch": 1909} {"train_loss": -6.138543605804443, "global_step": 80210, "epoch": 1909} {"train_loss": -6.239076614379883, "global_step": 80211, "epoch": 1909} {"train_loss": -6.200560092926025, "global_step": 80212, "epoch": 1909} {"train_loss": -6.221642017364502, "global_step": 80213, "epoch": 1909} {"train_loss": -6.164919853210449, "global_step": 80214, "epoch": 1909} {"train_loss": -6.185317039489746, "global_step": 80215, "epoch": 1909} {"train_loss": -6.142745018005371, "global_step": 80216, "epoch": 1909} {"train_loss": -5.965113639831543, "global_step": 80217, "epoch": 1909} {"train_loss": -5.963432312011719, "global_step": 80218, "epoch": 1909} {"train_loss": -6.122883558273315, "global_step": 80219, "epoch": 1909, "val_loss": 67687.7890625} {"train_loss": -6.106782913208008, "global_step": 80220, "epoch": 1910} {"train_loss": -6.234478950500488, "global_step": 80221, "epoch": 1910} {"train_loss": -6.224085807800293, "global_step": 80222, "epoch": 1910} {"train_loss": -6.130817413330078, "global_step": 80223, "epoch": 1910} {"train_loss": -6.199672222137451, "global_step": 80224, "epoch": 1910} {"train_loss": -6.074687957763672, "global_step": 80225, "epoch": 1910} {"train_loss": -6.256789207458496, "global_step": 80226, "epoch": 1910} {"train_loss": -6.186555862426758, "global_step": 80227, "epoch": 1910} {"train_loss": -6.057951927185059, "global_step": 80228, "epoch": 1910} {"train_loss": -6.277533054351807, "global_step": 80229, "epoch": 1910} {"train_loss": -6.085893630981445, "global_step": 80230, "epoch": 1910} {"train_loss": -6.228377342224121, "global_step": 80231, "epoch": 1910} {"train_loss": -6.12130880355835, "global_step": 80232, "epoch": 1910} {"train_loss": -6.099200248718262, "global_step": 80233, "epoch": 1910} {"train_loss": -6.135257720947266, "global_step": 80234, "epoch": 1910} {"train_loss": -6.1309099197387695, "global_step": 80235, "epoch": 1910} {"train_loss": -6.18296480178833, "global_step": 80236, "epoch": 1910} {"train_loss": -6.091229438781738, "global_step": 80237, "epoch": 1910} {"train_loss": -6.265820503234863, "global_step": 80238, "epoch": 1910} {"train_loss": -6.134150505065918, "global_step": 80239, "epoch": 1910} {"train_loss": -6.029996395111084, "global_step": 80240, "epoch": 1910} {"train_loss": -6.069401264190674, "global_step": 80241, "epoch": 1910} {"train_loss": -6.039591312408447, "global_step": 80242, "epoch": 1910} {"train_loss": -6.115408897399902, "global_step": 80243, "epoch": 1910} {"train_loss": -6.235284805297852, "global_step": 80244, "epoch": 1910} {"train_loss": -6.033636093139648, "global_step": 80245, "epoch": 1910} {"train_loss": -6.101424694061279, "global_step": 80246, "epoch": 1910} {"train_loss": -6.075273036956787, "global_step": 80247, "epoch": 1910} {"train_loss": -6.164003372192383, "global_step": 80248, "epoch": 1910} {"train_loss": -6.127282619476318, "global_step": 80249, "epoch": 1910} {"train_loss": -5.991006851196289, "global_step": 80250, "epoch": 1910} {"train_loss": -6.166532516479492, "global_step": 80251, "epoch": 1910} {"train_loss": -6.061882972717285, "global_step": 80252, "epoch": 1910} {"train_loss": -6.179556846618652, "global_step": 80253, "epoch": 1910} {"train_loss": -6.147340774536133, "global_step": 80254, "epoch": 1910} {"train_loss": -6.12485933303833, "global_step": 80255, "epoch": 1910} {"train_loss": -6.117464542388916, "global_step": 80256, "epoch": 1910} {"train_loss": -5.991775989532471, "global_step": 80257, "epoch": 1910} {"train_loss": -6.186910629272461, "global_step": 80258, "epoch": 1910} {"train_loss": -6.14303731918335, "global_step": 80259, "epoch": 1910} {"train_loss": -6.042730331420898, "global_step": 80260, "epoch": 1910} {"train_loss": -6.130356255031767, "global_step": 80261, "epoch": 1910, "val_loss": 67712.890625} {"train_loss": -6.126690864562988, "global_step": 80262, "epoch": 1911} {"train_loss": -6.18263053894043, "global_step": 80263, "epoch": 1911} {"train_loss": -6.181313514709473, "global_step": 80264, "epoch": 1911} {"train_loss": -6.040279388427734, "global_step": 80265, "epoch": 1911} {"train_loss": -6.113994598388672, "global_step": 80266, "epoch": 1911} {"train_loss": -6.066910266876221, "global_step": 80267, "epoch": 1911} {"train_loss": -5.9896650314331055, "global_step": 80268, "epoch": 1911} {"train_loss": -6.226975440979004, "global_step": 80269, "epoch": 1911} {"train_loss": -6.142971038818359, "global_step": 80270, "epoch": 1911} {"train_loss": -6.202645778656006, "global_step": 80271, "epoch": 1911} {"train_loss": -6.086988925933838, "global_step": 80272, "epoch": 1911} {"train_loss": -6.125204086303711, "global_step": 80273, "epoch": 1911} {"train_loss": -6.054966449737549, "global_step": 80274, "epoch": 1911} {"train_loss": -6.11053466796875, "global_step": 80275, "epoch": 1911} {"train_loss": -6.170455455780029, "global_step": 80276, "epoch": 1911} {"train_loss": -6.110686779022217, "global_step": 80277, "epoch": 1911} {"train_loss": -6.214348316192627, "global_step": 80278, "epoch": 1911} {"train_loss": -6.2471489906311035, "global_step": 80279, "epoch": 1911} {"train_loss": -6.006455898284912, "global_step": 80280, "epoch": 1911} {"train_loss": -6.0553436279296875, "global_step": 80281, "epoch": 1911} {"train_loss": -6.0991411209106445, "global_step": 80282, "epoch": 1911} {"train_loss": -6.240553379058838, "global_step": 80283, "epoch": 1911} {"train_loss": -6.225218296051025, "global_step": 80284, "epoch": 1911} {"train_loss": -6.045480728149414, "global_step": 80285, "epoch": 1911} {"train_loss": -6.304184913635254, "global_step": 80286, "epoch": 1911} {"train_loss": -6.238948345184326, "global_step": 80287, "epoch": 1911} {"train_loss": -6.161504745483398, "global_step": 80288, "epoch": 1911} {"train_loss": -6.2721147537231445, "global_step": 80289, "epoch": 1911} {"train_loss": -6.183725357055664, "global_step": 80290, "epoch": 1911} {"train_loss": -6.134134292602539, "global_step": 80291, "epoch": 1911} {"train_loss": -6.139664173126221, "global_step": 80292, "epoch": 1911} {"train_loss": -6.048071384429932, "global_step": 80293, "epoch": 1911} {"train_loss": -5.974221229553223, "global_step": 80294, "epoch": 1911} {"train_loss": -6.111678123474121, "global_step": 80295, "epoch": 1911} {"train_loss": -6.200944900512695, "global_step": 80296, "epoch": 1911} {"train_loss": -6.047868728637695, "global_step": 80297, "epoch": 1911} {"train_loss": -6.200138568878174, "global_step": 80298, "epoch": 1911} {"train_loss": -6.181595802307129, "global_step": 80299, "epoch": 1911} {"train_loss": -6.1471099853515625, "global_step": 80300, "epoch": 1911} {"train_loss": -6.087432861328125, "global_step": 80301, "epoch": 1911} {"train_loss": -6.292407035827637, "global_step": 80302, "epoch": 1911} {"train_loss": -6.138760612124488, "global_step": 80303, "epoch": 1911, "val_loss": 67766.265625} {"train_loss": -6.21776819229126, "global_step": 80304, "epoch": 1912} {"train_loss": -6.166959762573242, "global_step": 80305, "epoch": 1912} {"train_loss": -6.142982006072998, "global_step": 80306, "epoch": 1912} {"train_loss": -6.163760185241699, "global_step": 80307, "epoch": 1912} {"train_loss": -6.112525463104248, "global_step": 80308, "epoch": 1912} {"train_loss": -6.123426914215088, "global_step": 80309, "epoch": 1912} {"train_loss": -6.0778045654296875, "global_step": 80310, "epoch": 1912} {"train_loss": -6.039883136749268, "global_step": 80311, "epoch": 1912} {"train_loss": -6.151400566101074, "global_step": 80312, "epoch": 1912} {"train_loss": -6.115535259246826, "global_step": 80313, "epoch": 1912} {"train_loss": -6.169580459594727, "global_step": 80314, "epoch": 1912} {"train_loss": -5.976924896240234, "global_step": 80315, "epoch": 1912} {"train_loss": -6.101315975189209, "global_step": 80316, "epoch": 1912} {"train_loss": -6.072264194488525, "global_step": 80317, "epoch": 1912} {"train_loss": -6.131263732910156, "global_step": 80318, "epoch": 1912} {"train_loss": -6.023175239562988, "global_step": 80319, "epoch": 1912} {"train_loss": -6.078964710235596, "global_step": 80320, "epoch": 1912} {"train_loss": -6.0509138107299805, "global_step": 80321, "epoch": 1912} {"train_loss": -6.23257303237915, "global_step": 80322, "epoch": 1912} {"train_loss": -6.105073928833008, "global_step": 80323, "epoch": 1912} {"train_loss": -6.263990879058838, "global_step": 80324, "epoch": 1912} {"train_loss": -6.015668869018555, "global_step": 80325, "epoch": 1912} {"train_loss": -6.202472686767578, "global_step": 80326, "epoch": 1912} {"train_loss": -6.210550308227539, "global_step": 80327, "epoch": 1912} {"train_loss": -6.174421310424805, "global_step": 80328, "epoch": 1912} {"train_loss": -6.061260223388672, "global_step": 80329, "epoch": 1912} {"train_loss": -6.093718528747559, "global_step": 80330, "epoch": 1912} {"train_loss": -6.058965682983398, "global_step": 80331, "epoch": 1912} {"train_loss": -6.107060432434082, "global_step": 80332, "epoch": 1912} {"train_loss": -6.2564005851745605, "global_step": 80333, "epoch": 1912} {"train_loss": -6.093562602996826, "global_step": 80334, "epoch": 1912} {"train_loss": -6.195010662078857, "global_step": 80335, "epoch": 1912} {"train_loss": -6.137602806091309, "global_step": 80336, "epoch": 1912} {"train_loss": -6.0840301513671875, "global_step": 80337, "epoch": 1912} {"train_loss": -6.1141767501831055, "global_step": 80338, "epoch": 1912} {"train_loss": -6.0739641189575195, "global_step": 80339, "epoch": 1912} {"train_loss": -6.159884452819824, "global_step": 80340, "epoch": 1912} {"train_loss": -6.019924163818359, "global_step": 80341, "epoch": 1912} {"train_loss": -6.109777450561523, "global_step": 80342, "epoch": 1912} {"train_loss": -6.105969429016113, "global_step": 80343, "epoch": 1912} {"train_loss": -6.06063175201416, "global_step": 80344, "epoch": 1912} {"train_loss": -6.11992487453279, "global_step": 80345, "epoch": 1912, "val_loss": 67740.625} {"train_loss": -6.022127151489258, "global_step": 80346, "epoch": 1913} {"train_loss": -6.103884696960449, "global_step": 80347, "epoch": 1913} {"train_loss": -6.045690536499023, "global_step": 80348, "epoch": 1913} {"train_loss": -6.198170185089111, "global_step": 80349, "epoch": 1913} {"train_loss": -6.017428398132324, "global_step": 80350, "epoch": 1913} {"train_loss": -6.102667808532715, "global_step": 80351, "epoch": 1913} {"train_loss": -6.0946550369262695, "global_step": 80352, "epoch": 1913} {"train_loss": -5.95909309387207, "global_step": 80353, "epoch": 1913} {"train_loss": -6.121252059936523, "global_step": 80354, "epoch": 1913} {"train_loss": -6.017579555511475, "global_step": 80355, "epoch": 1913} {"train_loss": -6.057853698730469, "global_step": 80356, "epoch": 1913} {"train_loss": -6.034066200256348, "global_step": 80357, "epoch": 1913} {"train_loss": -6.087001800537109, "global_step": 80358, "epoch": 1913} {"train_loss": -5.920560836791992, "global_step": 80359, "epoch": 1913} {"train_loss": -6.140066623687744, "global_step": 80360, "epoch": 1913} {"train_loss": -6.1029157638549805, "global_step": 80361, "epoch": 1913} {"train_loss": -5.9953413009643555, "global_step": 80362, "epoch": 1913} {"train_loss": -6.097577095031738, "global_step": 80363, "epoch": 1913} {"train_loss": -6.021896839141846, "global_step": 80364, "epoch": 1913} {"train_loss": -6.068461894989014, "global_step": 80365, "epoch": 1913} {"train_loss": -6.151895999908447, "global_step": 80366, "epoch": 1913} {"train_loss": -6.06036376953125, "global_step": 80367, "epoch": 1913} {"train_loss": -6.085031032562256, "global_step": 80368, "epoch": 1913} {"train_loss": -6.118956565856934, "global_step": 80369, "epoch": 1913} {"train_loss": -6.127117156982422, "global_step": 80370, "epoch": 1913} {"train_loss": -6.151617527008057, "global_step": 80371, "epoch": 1913} {"train_loss": -6.077211856842041, "global_step": 80372, "epoch": 1913} {"train_loss": -6.182130813598633, "global_step": 80373, "epoch": 1913} {"train_loss": -6.171257972717285, "global_step": 80374, "epoch": 1913} {"train_loss": -6.010560035705566, "global_step": 80375, "epoch": 1913} {"train_loss": -6.192103385925293, "global_step": 80376, "epoch": 1913} {"train_loss": -6.037197589874268, "global_step": 80377, "epoch": 1913} {"train_loss": -6.1483635902404785, "global_step": 80378, "epoch": 1913} {"train_loss": -5.985738754272461, "global_step": 80379, "epoch": 1913} {"train_loss": -6.0027852058410645, "global_step": 80380, "epoch": 1913} {"train_loss": -6.056530952453613, "global_step": 80381, "epoch": 1913} {"train_loss": -6.049074172973633, "global_step": 80382, "epoch": 1913} {"train_loss": -6.1300787925720215, "global_step": 80383, "epoch": 1913} {"train_loss": -6.153642654418945, "global_step": 80384, "epoch": 1913} {"train_loss": -6.030285835266113, "global_step": 80385, "epoch": 1913} {"train_loss": -6.071127891540527, "global_step": 80386, "epoch": 1913} {"train_loss": -6.077111176082066, "global_step": 80387, "epoch": 1913, "val_loss": 67492.21875} {"train_loss": -6.04603385925293, "global_step": 80388, "epoch": 1914} {"train_loss": -5.957918167114258, "global_step": 80389, "epoch": 1914} {"train_loss": -6.079263210296631, "global_step": 80390, "epoch": 1914} {"train_loss": -6.157492160797119, "global_step": 80391, "epoch": 1914} {"train_loss": -6.079947471618652, "global_step": 80392, "epoch": 1914} {"train_loss": -6.10657262802124, "global_step": 80393, "epoch": 1914} {"train_loss": -6.058016777038574, "global_step": 80394, "epoch": 1914} {"train_loss": -6.210570335388184, "global_step": 80395, "epoch": 1914} {"train_loss": -6.127715110778809, "global_step": 80396, "epoch": 1914} {"train_loss": -6.099176406860352, "global_step": 80397, "epoch": 1914} {"train_loss": -6.0944719314575195, "global_step": 80398, "epoch": 1914} {"train_loss": -6.097045421600342, "global_step": 80399, "epoch": 1914} {"train_loss": -6.014143466949463, "global_step": 80400, "epoch": 1914} {"train_loss": -6.10793399810791, "global_step": 80401, "epoch": 1914} {"train_loss": -6.0109710693359375, "global_step": 80402, "epoch": 1914} {"train_loss": -6.164398193359375, "global_step": 80403, "epoch": 1914} {"train_loss": -6.097461700439453, "global_step": 80404, "epoch": 1914} {"train_loss": -6.146551132202148, "global_step": 80405, "epoch": 1914} {"train_loss": -6.188601493835449, "global_step": 80406, "epoch": 1914} {"train_loss": -6.210367202758789, "global_step": 80407, "epoch": 1914} {"train_loss": -6.034675121307373, "global_step": 80408, "epoch": 1914} {"train_loss": -6.0900092124938965, "global_step": 80409, "epoch": 1914} {"train_loss": -6.10453462600708, "global_step": 80410, "epoch": 1914} {"train_loss": -5.923221588134766, "global_step": 80411, "epoch": 1914} {"train_loss": -6.066727638244629, "global_step": 80412, "epoch": 1914} {"train_loss": -6.1929216384887695, "global_step": 80413, "epoch": 1914} {"train_loss": -6.192131996154785, "global_step": 80414, "epoch": 1914} {"train_loss": -6.0822038650512695, "global_step": 80415, "epoch": 1914} {"train_loss": -6.077795028686523, "global_step": 80416, "epoch": 1914} {"train_loss": -6.190000534057617, "global_step": 80417, "epoch": 1914} {"train_loss": -6.052087783813477, "global_step": 80418, "epoch": 1914} {"train_loss": -6.128706455230713, "global_step": 80419, "epoch": 1914} {"train_loss": -6.211214065551758, "global_step": 80420, "epoch": 1914} {"train_loss": -6.111560821533203, "global_step": 80421, "epoch": 1914} {"train_loss": -6.09157133102417, "global_step": 80422, "epoch": 1914} {"train_loss": -6.169745445251465, "global_step": 80423, "epoch": 1914} {"train_loss": -6.267704963684082, "global_step": 80424, "epoch": 1914} {"train_loss": -6.213895320892334, "global_step": 80425, "epoch": 1914} {"train_loss": -6.112016677856445, "global_step": 80426, "epoch": 1914} {"train_loss": -6.1522603034973145, "global_step": 80427, "epoch": 1914} {"train_loss": -6.144038200378418, "global_step": 80428, "epoch": 1914} {"train_loss": -6.112903844742548, "global_step": 80429, "epoch": 1914, "val_loss": 67613.40625} {"train_loss": -6.139259338378906, "global_step": 80430, "epoch": 1915} {"train_loss": -6.174901008605957, "global_step": 80431, "epoch": 1915} {"train_loss": -6.168668746948242, "global_step": 80432, "epoch": 1915} {"train_loss": -6.137181282043457, "global_step": 80433, "epoch": 1915} {"train_loss": -6.207663059234619, "global_step": 80434, "epoch": 1915} {"train_loss": -6.030819892883301, "global_step": 80435, "epoch": 1915} {"train_loss": -6.169815540313721, "global_step": 80436, "epoch": 1915} {"train_loss": -6.236305236816406, "global_step": 80437, "epoch": 1915} {"train_loss": -6.18064546585083, "global_step": 80438, "epoch": 1915} {"train_loss": -6.1418962478637695, "global_step": 80439, "epoch": 1915} {"train_loss": -6.233634948730469, "global_step": 80440, "epoch": 1915} {"train_loss": -6.0713958740234375, "global_step": 80441, "epoch": 1915} {"train_loss": -6.107630729675293, "global_step": 80442, "epoch": 1915} {"train_loss": -6.105202674865723, "global_step": 80443, "epoch": 1915} {"train_loss": -6.166757106781006, "global_step": 80444, "epoch": 1915} {"train_loss": -6.109569549560547, "global_step": 80445, "epoch": 1915} {"train_loss": -6.141037940979004, "global_step": 80446, "epoch": 1915} {"train_loss": -6.098601341247559, "global_step": 80447, "epoch": 1915} {"train_loss": -6.231667995452881, "global_step": 80448, "epoch": 1915} {"train_loss": -6.222696304321289, "global_step": 80449, "epoch": 1915} {"train_loss": -6.105534076690674, "global_step": 80450, "epoch": 1915} {"train_loss": -6.23676872253418, "global_step": 80451, "epoch": 1915} {"train_loss": -6.146502494812012, "global_step": 80452, "epoch": 1915} {"train_loss": -6.167963981628418, "global_step": 80453, "epoch": 1915} {"train_loss": -6.157452583312988, "global_step": 80454, "epoch": 1915} {"train_loss": -6.264605522155762, "global_step": 80455, "epoch": 1915} {"train_loss": -6.187945365905762, "global_step": 80456, "epoch": 1915} {"train_loss": -6.050077438354492, "global_step": 80457, "epoch": 1915} {"train_loss": -6.080497741699219, "global_step": 80458, "epoch": 1915} {"train_loss": -6.090785980224609, "global_step": 80459, "epoch": 1915} {"train_loss": -6.146533966064453, "global_step": 80460, "epoch": 1915} {"train_loss": -6.060817718505859, "global_step": 80461, "epoch": 1915} {"train_loss": -6.049234390258789, "global_step": 80462, "epoch": 1915} {"train_loss": -5.932954788208008, "global_step": 80463, "epoch": 1915} {"train_loss": -6.01725959777832, "global_step": 80464, "epoch": 1915} {"train_loss": -5.968992233276367, "global_step": 80465, "epoch": 1915} {"train_loss": -6.032072067260742, "global_step": 80466, "epoch": 1915} {"train_loss": -6.117092132568359, "global_step": 80467, "epoch": 1915} {"train_loss": -6.034581184387207, "global_step": 80468, "epoch": 1915} {"train_loss": -6.188307762145996, "global_step": 80469, "epoch": 1915} {"train_loss": -6.085104942321777, "global_step": 80470, "epoch": 1915} {"train_loss": -6.124345858891805, "global_step": 80471, "epoch": 1915, "val_loss": 67539.1640625} {"train_loss": -5.98763370513916, "global_step": 80472, "epoch": 1916} {"train_loss": -6.136771202087402, "global_step": 80473, "epoch": 1916} {"train_loss": -6.1067399978637695, "global_step": 80474, "epoch": 1916} {"train_loss": -6.114521503448486, "global_step": 80475, "epoch": 1916} {"train_loss": -6.117203712463379, "global_step": 80476, "epoch": 1916} {"train_loss": -6.191462993621826, "global_step": 80477, "epoch": 1916} {"train_loss": -6.100657939910889, "global_step": 80478, "epoch": 1916} {"train_loss": -6.120295524597168, "global_step": 80479, "epoch": 1916} {"train_loss": -6.277846336364746, "global_step": 80480, "epoch": 1916} {"train_loss": -6.13518762588501, "global_step": 80481, "epoch": 1916} {"train_loss": -6.210906982421875, "global_step": 80482, "epoch": 1916} {"train_loss": -6.057929992675781, "global_step": 80483, "epoch": 1916} {"train_loss": -6.114045143127441, "global_step": 80484, "epoch": 1916} {"train_loss": -6.07466983795166, "global_step": 80485, "epoch": 1916} {"train_loss": -6.128512382507324, "global_step": 80486, "epoch": 1916} {"train_loss": -6.16151237487793, "global_step": 80487, "epoch": 1916} {"train_loss": -6.051450252532959, "global_step": 80488, "epoch": 1916} {"train_loss": -6.09145450592041, "global_step": 80489, "epoch": 1916} {"train_loss": -6.103555202484131, "global_step": 80490, "epoch": 1916} {"train_loss": -6.1106133460998535, "global_step": 80491, "epoch": 1916} {"train_loss": -6.2493133544921875, "global_step": 80492, "epoch": 1916} {"train_loss": -6.127326965332031, "global_step": 80493, "epoch": 1916} {"train_loss": -6.139112949371338, "global_step": 80494, "epoch": 1916} {"train_loss": -6.132023334503174, "global_step": 80495, "epoch": 1916} {"train_loss": -6.139888763427734, "global_step": 80496, "epoch": 1916} {"train_loss": -6.065550327301025, "global_step": 80497, "epoch": 1916} {"train_loss": -6.167571067810059, "global_step": 80498, "epoch": 1916} {"train_loss": -6.175871849060059, "global_step": 80499, "epoch": 1916} {"train_loss": -6.18743896484375, "global_step": 80500, "epoch": 1916} {"train_loss": -6.166119575500488, "global_step": 80501, "epoch": 1916} {"train_loss": -6.240771293640137, "global_step": 80502, "epoch": 1916} {"train_loss": -6.1324357986450195, "global_step": 80503, "epoch": 1916} {"train_loss": -6.290561676025391, "global_step": 80504, "epoch": 1916} {"train_loss": -6.143733978271484, "global_step": 80505, "epoch": 1916} {"train_loss": -6.152090549468994, "global_step": 80506, "epoch": 1916} {"train_loss": -6.071225166320801, "global_step": 80507, "epoch": 1916} {"train_loss": -6.025033950805664, "global_step": 80508, "epoch": 1916} {"train_loss": -6.194582939147949, "global_step": 80509, "epoch": 1916} {"train_loss": -6.101457595825195, "global_step": 80510, "epoch": 1916} {"train_loss": -6.199861526489258, "global_step": 80511, "epoch": 1916} {"train_loss": -6.025106430053711, "global_step": 80512, "epoch": 1916} {"train_loss": -6.133635327929542, "global_step": 80513, "epoch": 1916, "val_loss": 67549.125} {"train_loss": -6.0918803215026855, "global_step": 80514, "epoch": 1917} {"train_loss": -6.195113182067871, "global_step": 80515, "epoch": 1917} {"train_loss": -6.077276229858398, "global_step": 80516, "epoch": 1917} {"train_loss": -6.102017402648926, "global_step": 80517, "epoch": 1917} {"train_loss": -5.982908248901367, "global_step": 80518, "epoch": 1917} {"train_loss": -6.1745195388793945, "global_step": 80519, "epoch": 1917} {"train_loss": -6.11009407043457, "global_step": 80520, "epoch": 1917} {"train_loss": -6.168161869049072, "global_step": 80521, "epoch": 1917} {"train_loss": -6.120562553405762, "global_step": 80522, "epoch": 1917} {"train_loss": -6.157251358032227, "global_step": 80523, "epoch": 1917} {"train_loss": -6.224129676818848, "global_step": 80524, "epoch": 1917} {"train_loss": -6.021176815032959, "global_step": 80525, "epoch": 1917} {"train_loss": -6.185060977935791, "global_step": 80526, "epoch": 1917} {"train_loss": -6.048662185668945, "global_step": 80527, "epoch": 1917} {"train_loss": -6.122985363006592, "global_step": 80528, "epoch": 1917} {"train_loss": -6.0769267082214355, "global_step": 80529, "epoch": 1917} {"train_loss": -6.161108016967773, "global_step": 80530, "epoch": 1917} {"train_loss": -6.087348461151123, "global_step": 80531, "epoch": 1917} {"train_loss": -6.125882625579834, "global_step": 80532, "epoch": 1917} {"train_loss": -5.961843490600586, "global_step": 80533, "epoch": 1917} {"train_loss": -6.072428226470947, "global_step": 80534, "epoch": 1917} {"train_loss": -6.091118335723877, "global_step": 80535, "epoch": 1917} {"train_loss": -6.094883918762207, "global_step": 80536, "epoch": 1917} {"train_loss": -6.08167028427124, "global_step": 80537, "epoch": 1917} {"train_loss": -5.955776214599609, "global_step": 80538, "epoch": 1917} {"train_loss": -6.060751438140869, "global_step": 80539, "epoch": 1917} {"train_loss": -6.085583686828613, "global_step": 80540, "epoch": 1917} {"train_loss": -6.176774024963379, "global_step": 80541, "epoch": 1917} {"train_loss": -6.090957164764404, "global_step": 80542, "epoch": 1917} {"train_loss": -6.134300231933594, "global_step": 80543, "epoch": 1917} {"train_loss": -6.156848907470703, "global_step": 80544, "epoch": 1917} {"train_loss": -6.050717353820801, "global_step": 80545, "epoch": 1917} {"train_loss": -6.2140607833862305, "global_step": 80546, "epoch": 1917} {"train_loss": -6.146050453186035, "global_step": 80547, "epoch": 1917} {"train_loss": -6.011809825897217, "global_step": 80548, "epoch": 1917} {"train_loss": -6.027119159698486, "global_step": 80549, "epoch": 1917} {"train_loss": -6.199087142944336, "global_step": 80550, "epoch": 1917} {"train_loss": -6.000776767730713, "global_step": 80551, "epoch": 1917} {"train_loss": -6.099247455596924, "global_step": 80552, "epoch": 1917} {"train_loss": -6.019827365875244, "global_step": 80553, "epoch": 1917} {"train_loss": -6.022840976715088, "global_step": 80554, "epoch": 1917} {"train_loss": -6.099272262482416, "global_step": 80555, "epoch": 1917, "val_loss": 67930.1015625} {"train_loss": -6.031774997711182, "global_step": 80556, "epoch": 1918} {"train_loss": -6.143655776977539, "global_step": 80557, "epoch": 1918} {"train_loss": -5.993890762329102, "global_step": 80558, "epoch": 1918} {"train_loss": -6.167428016662598, "global_step": 80559, "epoch": 1918} {"train_loss": -6.048900604248047, "global_step": 80560, "epoch": 1918} {"train_loss": -6.071728706359863, "global_step": 80561, "epoch": 1918} {"train_loss": -5.9984564781188965, "global_step": 80562, "epoch": 1918} {"train_loss": -6.067541122436523, "global_step": 80563, "epoch": 1918} {"train_loss": -6.069462776184082, "global_step": 80564, "epoch": 1918} {"train_loss": -6.040592193603516, "global_step": 80565, "epoch": 1918} {"train_loss": -6.0643157958984375, "global_step": 80566, "epoch": 1918} {"train_loss": -6.102500915527344, "global_step": 80567, "epoch": 1918} {"train_loss": -6.1283183097839355, "global_step": 80568, "epoch": 1918} {"train_loss": -6.07513427734375, "global_step": 80569, "epoch": 1918} {"train_loss": -6.078255653381348, "global_step": 80570, "epoch": 1918} {"train_loss": -6.199706077575684, "global_step": 80571, "epoch": 1918} {"train_loss": -6.169357776641846, "global_step": 80572, "epoch": 1918} {"train_loss": -6.0223798751831055, "global_step": 80573, "epoch": 1918} {"train_loss": -6.06424617767334, "global_step": 80574, "epoch": 1918} {"train_loss": -6.236421585083008, "global_step": 80575, "epoch": 1918} {"train_loss": -6.011366844177246, "global_step": 80576, "epoch": 1918} {"train_loss": -5.9917449951171875, "global_step": 80577, "epoch": 1918} {"train_loss": -6.0710978507995605, "global_step": 80578, "epoch": 1918} {"train_loss": -6.158331871032715, "global_step": 80579, "epoch": 1918} {"train_loss": -6.195276260375977, "global_step": 80580, "epoch": 1918} {"train_loss": -6.232392311096191, "global_step": 80581, "epoch": 1918} {"train_loss": -6.096449851989746, "global_step": 80582, "epoch": 1918} {"train_loss": -6.153818607330322, "global_step": 80583, "epoch": 1918} {"train_loss": -6.125197410583496, "global_step": 80584, "epoch": 1918} {"train_loss": -6.137246131896973, "global_step": 80585, "epoch": 1918} {"train_loss": -6.07396125793457, "global_step": 80586, "epoch": 1918} {"train_loss": -6.229299545288086, "global_step": 80587, "epoch": 1918} {"train_loss": -6.180778980255127, "global_step": 80588, "epoch": 1918} {"train_loss": -6.044000625610352, "global_step": 80589, "epoch": 1918} {"train_loss": -6.122701168060303, "global_step": 80590, "epoch": 1918} {"train_loss": -6.20334529876709, "global_step": 80591, "epoch": 1918} {"train_loss": -6.137027740478516, "global_step": 80592, "epoch": 1918} {"train_loss": -6.069445610046387, "global_step": 80593, "epoch": 1918} {"train_loss": -6.162662506103516, "global_step": 80594, "epoch": 1918} {"train_loss": -6.1337080001831055, "global_step": 80595, "epoch": 1918} {"train_loss": -6.078766822814941, "global_step": 80596, "epoch": 1918} {"train_loss": -6.1065969580695745, "global_step": 80597, "epoch": 1918, "val_loss": 67726.1875} {"train_loss": -6.289518356323242, "global_step": 80598, "epoch": 1919} {"train_loss": -6.143871307373047, "global_step": 80599, "epoch": 1919} {"train_loss": -6.133087158203125, "global_step": 80600, "epoch": 1919} {"train_loss": -6.074361801147461, "global_step": 80601, "epoch": 1919} {"train_loss": -6.111091613769531, "global_step": 80602, "epoch": 1919} {"train_loss": -6.0859761238098145, "global_step": 80603, "epoch": 1919} {"train_loss": -6.125391483306885, "global_step": 80604, "epoch": 1919} {"train_loss": -6.1115617752075195, "global_step": 80605, "epoch": 1919} {"train_loss": -6.00477409362793, "global_step": 80606, "epoch": 1919} {"train_loss": -6.185421943664551, "global_step": 80607, "epoch": 1919} {"train_loss": -6.14521598815918, "global_step": 80608, "epoch": 1919} {"train_loss": -6.096390247344971, "global_step": 80609, "epoch": 1919} {"train_loss": -6.074924468994141, "global_step": 80610, "epoch": 1919} {"train_loss": -6.114139556884766, "global_step": 80611, "epoch": 1919} {"train_loss": -6.142011642456055, "global_step": 80612, "epoch": 1919} {"train_loss": -6.163147926330566, "global_step": 80613, "epoch": 1919} {"train_loss": -6.084412574768066, "global_step": 80614, "epoch": 1919} {"train_loss": -6.209177494049072, "global_step": 80615, "epoch": 1919} {"train_loss": -6.147296905517578, "global_step": 80616, "epoch": 1919} {"train_loss": -6.147058486938477, "global_step": 80617, "epoch": 1919} {"train_loss": -6.156300067901611, "global_step": 80618, "epoch": 1919} {"train_loss": -6.05802583694458, "global_step": 80619, "epoch": 1919} {"train_loss": -6.001131057739258, "global_step": 80620, "epoch": 1919} {"train_loss": -6.222590446472168, "global_step": 80621, "epoch": 1919} {"train_loss": -6.107260704040527, "global_step": 80622, "epoch": 1919} {"train_loss": -6.226954936981201, "global_step": 80623, "epoch": 1919} {"train_loss": -6.108392715454102, "global_step": 80624, "epoch": 1919} {"train_loss": -6.202432155609131, "global_step": 80625, "epoch": 1919} {"train_loss": -6.119390487670898, "global_step": 80626, "epoch": 1919} {"train_loss": -6.076079845428467, "global_step": 80627, "epoch": 1919} {"train_loss": -6.084819793701172, "global_step": 80628, "epoch": 1919} {"train_loss": -6.118142127990723, "global_step": 80629, "epoch": 1919} {"train_loss": -6.099134922027588, "global_step": 80630, "epoch": 1919} {"train_loss": -6.083286762237549, "global_step": 80631, "epoch": 1919} {"train_loss": -5.909275054931641, "global_step": 80632, "epoch": 1919} {"train_loss": -6.115751266479492, "global_step": 80633, "epoch": 1919} {"train_loss": -6.024355888366699, "global_step": 80634, "epoch": 1919} {"train_loss": -6.138354778289795, "global_step": 80635, "epoch": 1919} {"train_loss": -6.055319309234619, "global_step": 80636, "epoch": 1919} {"train_loss": -6.092006683349609, "global_step": 80637, "epoch": 1919} {"train_loss": -6.070608615875244, "global_step": 80638, "epoch": 1919} {"train_loss": -6.1094856943402975, "global_step": 80639, "epoch": 1919, "val_loss": 67697.890625} {"train_loss": -6.173019886016846, "global_step": 80640, "epoch": 1920} {"train_loss": -6.011928558349609, "global_step": 80641, "epoch": 1920} {"train_loss": -6.04570198059082, "global_step": 80642, "epoch": 1920} {"train_loss": -6.177559852600098, "global_step": 80643, "epoch": 1920} {"train_loss": -5.985979080200195, "global_step": 80644, "epoch": 1920} {"train_loss": -6.008814811706543, "global_step": 80645, "epoch": 1920} {"train_loss": -6.025522708892822, "global_step": 80646, "epoch": 1920} {"train_loss": -5.974498748779297, "global_step": 80647, "epoch": 1920} {"train_loss": -6.063202857971191, "global_step": 80648, "epoch": 1920} {"train_loss": -6.045740127563477, "global_step": 80649, "epoch": 1920} {"train_loss": -6.2196550369262695, "global_step": 80650, "epoch": 1920} {"train_loss": -6.087274074554443, "global_step": 80651, "epoch": 1920} {"train_loss": -6.157280445098877, "global_step": 80652, "epoch": 1920} {"train_loss": -5.98554801940918, "global_step": 80653, "epoch": 1920} {"train_loss": -6.14845085144043, "global_step": 80654, "epoch": 1920} {"train_loss": -6.1935272216796875, "global_step": 80655, "epoch": 1920} {"train_loss": -6.127558708190918, "global_step": 80656, "epoch": 1920} {"train_loss": -6.067168712615967, "global_step": 80657, "epoch": 1920} {"train_loss": -6.040103912353516, "global_step": 80658, "epoch": 1920} {"train_loss": -6.147704124450684, "global_step": 80659, "epoch": 1920} {"train_loss": -6.1212544441223145, "global_step": 80660, "epoch": 1920} {"train_loss": -6.1397576332092285, "global_step": 80661, "epoch": 1920} {"train_loss": -6.107645034790039, "global_step": 80662, "epoch": 1920} {"train_loss": -6.146618843078613, "global_step": 80663, "epoch": 1920} {"train_loss": -6.150815486907959, "global_step": 80664, "epoch": 1920} {"train_loss": -6.050018310546875, "global_step": 80665, "epoch": 1920} {"train_loss": -6.1100358963012695, "global_step": 80666, "epoch": 1920} {"train_loss": -6.097970008850098, "global_step": 80667, "epoch": 1920} {"train_loss": -6.19986629486084, "global_step": 80668, "epoch": 1920} {"train_loss": -6.002896785736084, "global_step": 80669, "epoch": 1920} {"train_loss": -6.114633083343506, "global_step": 80670, "epoch": 1920} {"train_loss": -6.168614864349365, "global_step": 80671, "epoch": 1920} {"train_loss": -6.1260223388671875, "global_step": 80672, "epoch": 1920} {"train_loss": -6.083450794219971, "global_step": 80673, "epoch": 1920} {"train_loss": -6.104347229003906, "global_step": 80674, "epoch": 1920} {"train_loss": -6.286013603210449, "global_step": 80675, "epoch": 1920} {"train_loss": -6.240062236785889, "global_step": 80676, "epoch": 1920} {"train_loss": -6.118605613708496, "global_step": 80677, "epoch": 1920} {"train_loss": -6.109717845916748, "global_step": 80678, "epoch": 1920} {"train_loss": -6.154543876647949, "global_step": 80679, "epoch": 1920} {"train_loss": -6.159727096557617, "global_step": 80680, "epoch": 1920} {"train_loss": -6.11059604372297, "global_step": 80681, "epoch": 1920, "val_loss": 67560.890625} {"train_loss": -6.199031829833984, "global_step": 80682, "epoch": 1921} {"train_loss": -6.2432684898376465, "global_step": 80683, "epoch": 1921} {"train_loss": -6.062174320220947, "global_step": 80684, "epoch": 1921} {"train_loss": -6.109294891357422, "global_step": 80685, "epoch": 1921} {"train_loss": -6.022677898406982, "global_step": 80686, "epoch": 1921} {"train_loss": -6.000181198120117, "global_step": 80687, "epoch": 1921} {"train_loss": -6.114651679992676, "global_step": 80688, "epoch": 1921} {"train_loss": -6.157009124755859, "global_step": 80689, "epoch": 1921} {"train_loss": -6.179198265075684, "global_step": 80690, "epoch": 1921} {"train_loss": -6.130130290985107, "global_step": 80691, "epoch": 1921} {"train_loss": -6.163541793823242, "global_step": 80692, "epoch": 1921} {"train_loss": -6.093984603881836, "global_step": 80693, "epoch": 1921} {"train_loss": -6.159521102905273, "global_step": 80694, "epoch": 1921} {"train_loss": -6.141963005065918, "global_step": 80695, "epoch": 1921} {"train_loss": -6.220635890960693, "global_step": 80696, "epoch": 1921} {"train_loss": -6.1041107177734375, "global_step": 80697, "epoch": 1921} {"train_loss": -6.083377361297607, "global_step": 80698, "epoch": 1921} {"train_loss": -6.002216815948486, "global_step": 80699, "epoch": 1921} {"train_loss": -6.102237701416016, "global_step": 80700, "epoch": 1921} {"train_loss": -6.054771423339844, "global_step": 80701, "epoch": 1921} {"train_loss": -6.1378397941589355, "global_step": 80702, "epoch": 1921} {"train_loss": -6.071176052093506, "global_step": 80703, "epoch": 1921} {"train_loss": -6.119929313659668, "global_step": 80704, "epoch": 1921} {"train_loss": -6.114361763000488, "global_step": 80705, "epoch": 1921} {"train_loss": -6.226643085479736, "global_step": 80706, "epoch": 1921} {"train_loss": -6.093918800354004, "global_step": 80707, "epoch": 1921} {"train_loss": -6.141696929931641, "global_step": 80708, "epoch": 1921} {"train_loss": -5.997333526611328, "global_step": 80709, "epoch": 1921} {"train_loss": -6.176196575164795, "global_step": 80710, "epoch": 1921} {"train_loss": -6.133327007293701, "global_step": 80711, "epoch": 1921} {"train_loss": -6.235354423522949, "global_step": 80712, "epoch": 1921} {"train_loss": -6.176362037658691, "global_step": 80713, "epoch": 1921} {"train_loss": -6.061675548553467, "global_step": 80714, "epoch": 1921} {"train_loss": -6.098119735717773, "global_step": 80715, "epoch": 1921} {"train_loss": -6.047933578491211, "global_step": 80716, "epoch": 1921} {"train_loss": -6.297220230102539, "global_step": 80717, "epoch": 1921} {"train_loss": -6.216248512268066, "global_step": 80718, "epoch": 1921} {"train_loss": -6.143874168395996, "global_step": 80719, "epoch": 1921} {"train_loss": -6.162814140319824, "global_step": 80720, "epoch": 1921} {"train_loss": -6.2484130859375, "global_step": 80721, "epoch": 1921} {"train_loss": -6.232665061950684, "global_step": 80722, "epoch": 1921} {"train_loss": -6.132979268119449, "global_step": 80723, "epoch": 1921, "val_loss": 67651.96875} {"train_loss": -6.131412506103516, "global_step": 80724, "epoch": 1922} {"train_loss": -6.1706318855285645, "global_step": 80725, "epoch": 1922} {"train_loss": -6.108146667480469, "global_step": 80726, "epoch": 1922} {"train_loss": -6.108258247375488, "global_step": 80727, "epoch": 1922} {"train_loss": -6.187685489654541, "global_step": 80728, "epoch": 1922} {"train_loss": -6.139233589172363, "global_step": 80729, "epoch": 1922} {"train_loss": -6.1612629890441895, "global_step": 80730, "epoch": 1922} {"train_loss": -6.165215492248535, "global_step": 80731, "epoch": 1922} {"train_loss": -6.056918621063232, "global_step": 80732, "epoch": 1922} {"train_loss": -5.953346252441406, "global_step": 80733, "epoch": 1922} {"train_loss": -6.217118740081787, "global_step": 80734, "epoch": 1922} {"train_loss": -5.939938545227051, "global_step": 80735, "epoch": 1922} {"train_loss": -6.148415565490723, "global_step": 80736, "epoch": 1922} {"train_loss": -6.1009416580200195, "global_step": 80737, "epoch": 1922} {"train_loss": -6.215712547302246, "global_step": 80738, "epoch": 1922} {"train_loss": -6.164721488952637, "global_step": 80739, "epoch": 1922} {"train_loss": -6.121090888977051, "global_step": 80740, "epoch": 1922} {"train_loss": -6.207130432128906, "global_step": 80741, "epoch": 1922} {"train_loss": -6.216611862182617, "global_step": 80742, "epoch": 1922} {"train_loss": -6.140947341918945, "global_step": 80743, "epoch": 1922} {"train_loss": -6.163352966308594, "global_step": 80744, "epoch": 1922} {"train_loss": -6.120081901550293, "global_step": 80745, "epoch": 1922} {"train_loss": -6.246031761169434, "global_step": 80746, "epoch": 1922} {"train_loss": -6.063086032867432, "global_step": 80747, "epoch": 1922} {"train_loss": -6.248743057250977, "global_step": 80748, "epoch": 1922} {"train_loss": -6.119983196258545, "global_step": 80749, "epoch": 1922} {"train_loss": -6.08482551574707, "global_step": 80750, "epoch": 1922} {"train_loss": -6.157094955444336, "global_step": 80751, "epoch": 1922} {"train_loss": -6.126372814178467, "global_step": 80752, "epoch": 1922} {"train_loss": -6.049912452697754, "global_step": 80753, "epoch": 1922} {"train_loss": -6.1037092208862305, "global_step": 80754, "epoch": 1922} {"train_loss": -6.061252117156982, "global_step": 80755, "epoch": 1922} {"train_loss": -6.233421325683594, "global_step": 80756, "epoch": 1922} {"train_loss": -6.0326666831970215, "global_step": 80757, "epoch": 1922} {"train_loss": -6.238176345825195, "global_step": 80758, "epoch": 1922} {"train_loss": -6.012542724609375, "global_step": 80759, "epoch": 1922} {"train_loss": -6.101264476776123, "global_step": 80760, "epoch": 1922} {"train_loss": -6.070775032043457, "global_step": 80761, "epoch": 1922} {"train_loss": -6.143750190734863, "global_step": 80762, "epoch": 1922} {"train_loss": -6.128262519836426, "global_step": 80763, "epoch": 1922} {"train_loss": -6.109005451202393, "global_step": 80764, "epoch": 1922} {"train_loss": -6.1298737071809315, "global_step": 80765, "epoch": 1922, "val_loss": 67781.53125} {"train_loss": -6.197544097900391, "global_step": 80766, "epoch": 1923} {"train_loss": -6.054996967315674, "global_step": 80767, "epoch": 1923} {"train_loss": -6.116024971008301, "global_step": 80768, "epoch": 1923} {"train_loss": -6.1715192794799805, "global_step": 80769, "epoch": 1923} {"train_loss": -6.141207695007324, "global_step": 80770, "epoch": 1923} {"train_loss": -6.027355194091797, "global_step": 80771, "epoch": 1923} {"train_loss": -6.065169334411621, "global_step": 80772, "epoch": 1923} {"train_loss": -6.104921340942383, "global_step": 80773, "epoch": 1923} {"train_loss": -6.144614219665527, "global_step": 80774, "epoch": 1923} {"train_loss": -6.0067057609558105, "global_step": 80775, "epoch": 1923} {"train_loss": -6.168628215789795, "global_step": 80776, "epoch": 1923} {"train_loss": -6.169992923736572, "global_step": 80777, "epoch": 1923} {"train_loss": -6.175692081451416, "global_step": 80778, "epoch": 1923} {"train_loss": -6.129143714904785, "global_step": 80779, "epoch": 1923} {"train_loss": -6.197465896606445, "global_step": 80780, "epoch": 1923} {"train_loss": -6.21881628036499, "global_step": 80781, "epoch": 1923} {"train_loss": -6.224644660949707, "global_step": 80782, "epoch": 1923} {"train_loss": -6.039332389831543, "global_step": 80783, "epoch": 1923} {"train_loss": -6.020567893981934, "global_step": 80784, "epoch": 1923} {"train_loss": -6.118579387664795, "global_step": 80785, "epoch": 1923} {"train_loss": -6.149523735046387, "global_step": 80786, "epoch": 1923} {"train_loss": -6.102768421173096, "global_step": 80787, "epoch": 1923} {"train_loss": -6.125507354736328, "global_step": 80788, "epoch": 1923} {"train_loss": -6.108644962310791, "global_step": 80789, "epoch": 1923} {"train_loss": -6.212375640869141, "global_step": 80790, "epoch": 1923} {"train_loss": -6.109078884124756, "global_step": 80791, "epoch": 1923} {"train_loss": -6.264103889465332, "global_step": 80792, "epoch": 1923} {"train_loss": -6.204553604125977, "global_step": 80793, "epoch": 1923} {"train_loss": -6.1028337478637695, "global_step": 80794, "epoch": 1923} {"train_loss": -6.131575107574463, "global_step": 80795, "epoch": 1923} {"train_loss": -6.220900535583496, "global_step": 80796, "epoch": 1923} {"train_loss": -6.016060829162598, "global_step": 80797, "epoch": 1923} {"train_loss": -6.156438827514648, "global_step": 80798, "epoch": 1923} {"train_loss": -6.140787124633789, "global_step": 80799, "epoch": 1923} {"train_loss": -6.162652015686035, "global_step": 80800, "epoch": 1923} {"train_loss": -6.119637489318848, "global_step": 80801, "epoch": 1923} {"train_loss": -6.141927719116211, "global_step": 80802, "epoch": 1923} {"train_loss": -6.034780025482178, "global_step": 80803, "epoch": 1923} {"train_loss": -6.0734052658081055, "global_step": 80804, "epoch": 1923} {"train_loss": -6.012524127960205, "global_step": 80805, "epoch": 1923} {"train_loss": -6.045657634735107, "global_step": 80806, "epoch": 1923} {"train_loss": -6.125797555560157, "global_step": 80807, "epoch": 1923, "val_loss": 67871.0234375} {"train_loss": -5.98393440246582, "global_step": 80808, "epoch": 1924} {"train_loss": -6.128007888793945, "global_step": 80809, "epoch": 1924} {"train_loss": -6.0713653564453125, "global_step": 80810, "epoch": 1924} {"train_loss": -6.019502639770508, "global_step": 80811, "epoch": 1924} {"train_loss": -6.058382987976074, "global_step": 80812, "epoch": 1924} {"train_loss": -6.108161449432373, "global_step": 80813, "epoch": 1924} {"train_loss": -6.221286773681641, "global_step": 80814, "epoch": 1924} {"train_loss": -6.188113212585449, "global_step": 80815, "epoch": 1924} {"train_loss": -6.095823764801025, "global_step": 80816, "epoch": 1924} {"train_loss": -6.1509199142456055, "global_step": 80817, "epoch": 1924} {"train_loss": -6.07661247253418, "global_step": 80818, "epoch": 1924} {"train_loss": -6.223350524902344, "global_step": 80819, "epoch": 1924} {"train_loss": -6.216562271118164, "global_step": 80820, "epoch": 1924} {"train_loss": -6.154272079467773, "global_step": 80821, "epoch": 1924} {"train_loss": -6.052980422973633, "global_step": 80822, "epoch": 1924} {"train_loss": -6.203258991241455, "global_step": 80823, "epoch": 1924} {"train_loss": -6.176755428314209, "global_step": 80824, "epoch": 1924} {"train_loss": -6.303450584411621, "global_step": 80825, "epoch": 1924} {"train_loss": -6.231925964355469, "global_step": 80826, "epoch": 1924} {"train_loss": -6.148685455322266, "global_step": 80827, "epoch": 1924} {"train_loss": -6.21000862121582, "global_step": 80828, "epoch": 1924} {"train_loss": -6.180800437927246, "global_step": 80829, "epoch": 1924} {"train_loss": -6.097469806671143, "global_step": 80830, "epoch": 1924} {"train_loss": -6.037424564361572, "global_step": 80831, "epoch": 1924} {"train_loss": -5.957856178283691, "global_step": 80832, "epoch": 1924} {"train_loss": -6.14145565032959, "global_step": 80833, "epoch": 1924} {"train_loss": -6.098339557647705, "global_step": 80834, "epoch": 1924} {"train_loss": -6.129452228546143, "global_step": 80835, "epoch": 1924} {"train_loss": -6.276668548583984, "global_step": 80836, "epoch": 1924} {"train_loss": -6.042231559753418, "global_step": 80837, "epoch": 1924} {"train_loss": -6.139263153076172, "global_step": 80838, "epoch": 1924} {"train_loss": -6.010586261749268, "global_step": 80839, "epoch": 1924} {"train_loss": -6.065957069396973, "global_step": 80840, "epoch": 1924} {"train_loss": -6.171142578125, "global_step": 80841, "epoch": 1924} {"train_loss": -6.026366233825684, "global_step": 80842, "epoch": 1924} {"train_loss": -6.183504104614258, "global_step": 80843, "epoch": 1924} {"train_loss": -6.099644660949707, "global_step": 80844, "epoch": 1924} {"train_loss": -6.04985237121582, "global_step": 80845, "epoch": 1924} {"train_loss": -6.071530818939209, "global_step": 80846, "epoch": 1924} {"train_loss": -6.066229820251465, "global_step": 80847, "epoch": 1924} {"train_loss": -6.210601806640625, "global_step": 80848, "epoch": 1924} {"train_loss": -6.124530542464483, "global_step": 80849, "epoch": 1924, "val_loss": 67701.7578125} {"train_loss": -6.080430030822754, "global_step": 80850, "epoch": 1925} {"train_loss": -6.2855634689331055, "global_step": 80851, "epoch": 1925} {"train_loss": -6.125927925109863, "global_step": 80852, "epoch": 1925} {"train_loss": -6.149059295654297, "global_step": 80853, "epoch": 1925} {"train_loss": -6.1373701095581055, "global_step": 80854, "epoch": 1925} {"train_loss": -6.107059478759766, "global_step": 80855, "epoch": 1925} {"train_loss": -6.1541852951049805, "global_step": 80856, "epoch": 1925} {"train_loss": -6.16157341003418, "global_step": 80857, "epoch": 1925} {"train_loss": -6.170928001403809, "global_step": 80858, "epoch": 1925} {"train_loss": -6.213988780975342, "global_step": 80859, "epoch": 1925} {"train_loss": -6.109975814819336, "global_step": 80860, "epoch": 1925} {"train_loss": -6.146880149841309, "global_step": 80861, "epoch": 1925} {"train_loss": -6.1845197677612305, "global_step": 80862, "epoch": 1925} {"train_loss": -6.093225955963135, "global_step": 80863, "epoch": 1925} {"train_loss": -6.203252792358398, "global_step": 80864, "epoch": 1925} {"train_loss": -6.261042594909668, "global_step": 80865, "epoch": 1925} {"train_loss": -6.197530746459961, "global_step": 80866, "epoch": 1925} {"train_loss": -6.145320892333984, "global_step": 80867, "epoch": 1925} {"train_loss": -6.222931861877441, "global_step": 80868, "epoch": 1925} {"train_loss": -6.147119045257568, "global_step": 80869, "epoch": 1925} {"train_loss": -6.0082478523254395, "global_step": 80870, "epoch": 1925} {"train_loss": -6.1356635093688965, "global_step": 80871, "epoch": 1925} {"train_loss": -6.057374954223633, "global_step": 80872, "epoch": 1925} {"train_loss": -6.087390422821045, "global_step": 80873, "epoch": 1925} {"train_loss": -6.185002326965332, "global_step": 80874, "epoch": 1925} {"train_loss": -6.127785682678223, "global_step": 80875, "epoch": 1925} {"train_loss": -6.162845134735107, "global_step": 80876, "epoch": 1925} {"train_loss": -6.131852149963379, "global_step": 80877, "epoch": 1925} {"train_loss": -6.046826362609863, "global_step": 80878, "epoch": 1925} {"train_loss": -6.17883825302124, "global_step": 80879, "epoch": 1925} {"train_loss": -6.069345474243164, "global_step": 80880, "epoch": 1925} {"train_loss": -6.049984931945801, "global_step": 80881, "epoch": 1925} {"train_loss": -6.259220123291016, "global_step": 80882, "epoch": 1925} {"train_loss": -6.190285682678223, "global_step": 80883, "epoch": 1925} {"train_loss": -6.23451042175293, "global_step": 80884, "epoch": 1925} {"train_loss": -6.086762428283691, "global_step": 80885, "epoch": 1925} {"train_loss": -6.169194221496582, "global_step": 80886, "epoch": 1925} {"train_loss": -6.123841285705566, "global_step": 80887, "epoch": 1925} {"train_loss": -5.9929399490356445, "global_step": 80888, "epoch": 1925} {"train_loss": -6.090489864349365, "global_step": 80889, "epoch": 1925} {"train_loss": -6.228682041168213, "global_step": 80890, "epoch": 1925} {"train_loss": -6.1426895913623625, "global_step": 80891, "epoch": 1925, "val_loss": 67837.0703125} {"train_loss": -6.187543869018555, "global_step": 80892, "epoch": 1926} {"train_loss": -6.138971328735352, "global_step": 80893, "epoch": 1926} {"train_loss": -6.230896949768066, "global_step": 80894, "epoch": 1926} {"train_loss": -6.111632347106934, "global_step": 80895, "epoch": 1926} {"train_loss": -6.096080780029297, "global_step": 80896, "epoch": 1926} {"train_loss": -6.186740875244141, "global_step": 80897, "epoch": 1926} {"train_loss": -6.058828353881836, "global_step": 80898, "epoch": 1926} {"train_loss": -6.0860595703125, "global_step": 80899, "epoch": 1926} {"train_loss": -6.182008743286133, "global_step": 80900, "epoch": 1926} {"train_loss": -6.1870574951171875, "global_step": 80901, "epoch": 1926} {"train_loss": -6.115180969238281, "global_step": 80902, "epoch": 1926} {"train_loss": -6.004334449768066, "global_step": 80903, "epoch": 1926} {"train_loss": -6.148989677429199, "global_step": 80904, "epoch": 1926} {"train_loss": -6.072155475616455, "global_step": 80905, "epoch": 1926} {"train_loss": -6.016263961791992, "global_step": 80906, "epoch": 1926} {"train_loss": -6.09769344329834, "global_step": 80907, "epoch": 1926} {"train_loss": -6.077340602874756, "global_step": 80908, "epoch": 1926} {"train_loss": -6.113426208496094, "global_step": 80909, "epoch": 1926} {"train_loss": -6.062737464904785, "global_step": 80910, "epoch": 1926} {"train_loss": -6.054321765899658, "global_step": 80911, "epoch": 1926} {"train_loss": -6.096923351287842, "global_step": 80912, "epoch": 1926} {"train_loss": -6.23671817779541, "global_step": 80913, "epoch": 1926} {"train_loss": -6.008140563964844, "global_step": 80914, "epoch": 1926} {"train_loss": -6.156579971313477, "global_step": 80915, "epoch": 1926} {"train_loss": -6.182028293609619, "global_step": 80916, "epoch": 1926} {"train_loss": -6.132740497589111, "global_step": 80917, "epoch": 1926} {"train_loss": -6.092182636260986, "global_step": 80918, "epoch": 1926} {"train_loss": -6.226760387420654, "global_step": 80919, "epoch": 1926} {"train_loss": -6.151978492736816, "global_step": 80920, "epoch": 1926} {"train_loss": -6.123586654663086, "global_step": 80921, "epoch": 1926} {"train_loss": -6.16750955581665, "global_step": 80922, "epoch": 1926} {"train_loss": -6.277366638183594, "global_step": 80923, "epoch": 1926} {"train_loss": -6.187334060668945, "global_step": 80924, "epoch": 1926} {"train_loss": -6.231420516967773, "global_step": 80925, "epoch": 1926} {"train_loss": -6.070455551147461, "global_step": 80926, "epoch": 1926} {"train_loss": -6.09943962097168, "global_step": 80927, "epoch": 1926} {"train_loss": -6.157758712768555, "global_step": 80928, "epoch": 1926} {"train_loss": -6.17095422744751, "global_step": 80929, "epoch": 1926} {"train_loss": -6.2173919677734375, "global_step": 80930, "epoch": 1926} {"train_loss": -6.153487205505371, "global_step": 80931, "epoch": 1926} {"train_loss": -6.104866027832031, "global_step": 80932, "epoch": 1926} {"train_loss": -6.135815745308285, "global_step": 80933, "epoch": 1926, "val_loss": 67717.375} {"train_loss": -6.062379837036133, "global_step": 80934, "epoch": 1927} {"train_loss": -6.052745819091797, "global_step": 80935, "epoch": 1927} {"train_loss": -6.288485050201416, "global_step": 80936, "epoch": 1927} {"train_loss": -6.09657096862793, "global_step": 80937, "epoch": 1927} {"train_loss": -6.097925662994385, "global_step": 80938, "epoch": 1927} {"train_loss": -6.090941429138184, "global_step": 80939, "epoch": 1927} {"train_loss": -6.183364391326904, "global_step": 80940, "epoch": 1927} {"train_loss": -6.089807987213135, "global_step": 80941, "epoch": 1927} {"train_loss": -6.202149391174316, "global_step": 80942, "epoch": 1927} {"train_loss": -6.070810317993164, "global_step": 80943, "epoch": 1927} {"train_loss": -6.176740646362305, "global_step": 80944, "epoch": 1927} {"train_loss": -6.15034294128418, "global_step": 80945, "epoch": 1927} {"train_loss": -6.1473236083984375, "global_step": 80946, "epoch": 1927} {"train_loss": -5.998495101928711, "global_step": 80947, "epoch": 1927} {"train_loss": -6.182442665100098, "global_step": 80948, "epoch": 1927} {"train_loss": -6.063983917236328, "global_step": 80949, "epoch": 1927} {"train_loss": -6.132368087768555, "global_step": 80950, "epoch": 1927} {"train_loss": -6.1724443435668945, "global_step": 80951, "epoch": 1927} {"train_loss": -6.046700477600098, "global_step": 80952, "epoch": 1927} {"train_loss": -6.252251625061035, "global_step": 80953, "epoch": 1927} {"train_loss": -6.174393653869629, "global_step": 80954, "epoch": 1927} {"train_loss": -6.1512346267700195, "global_step": 80955, "epoch": 1927} {"train_loss": -6.078951358795166, "global_step": 80956, "epoch": 1927} {"train_loss": -6.132265090942383, "global_step": 80957, "epoch": 1927} {"train_loss": -6.112791538238525, "global_step": 80958, "epoch": 1927} {"train_loss": -6.182704448699951, "global_step": 80959, "epoch": 1927} {"train_loss": -6.042213439941406, "global_step": 80960, "epoch": 1927} {"train_loss": -6.106654167175293, "global_step": 80961, "epoch": 1927} {"train_loss": -6.0545196533203125, "global_step": 80962, "epoch": 1927} {"train_loss": -6.113134384155273, "global_step": 80963, "epoch": 1927} {"train_loss": -6.105226516723633, "global_step": 80964, "epoch": 1927} {"train_loss": -6.170041561126709, "global_step": 80965, "epoch": 1927} {"train_loss": -6.109222888946533, "global_step": 80966, "epoch": 1927} {"train_loss": -6.132626533508301, "global_step": 80967, "epoch": 1927} {"train_loss": -6.204543113708496, "global_step": 80968, "epoch": 1927} {"train_loss": -6.067326545715332, "global_step": 80969, "epoch": 1927} {"train_loss": -6.114715576171875, "global_step": 80970, "epoch": 1927} {"train_loss": -6.094868183135986, "global_step": 80971, "epoch": 1927} {"train_loss": -6.167059421539307, "global_step": 80972, "epoch": 1927} {"train_loss": -6.275906562805176, "global_step": 80973, "epoch": 1927} {"train_loss": -6.1837077140808105, "global_step": 80974, "epoch": 1927} {"train_loss": -6.128302835282826, "global_step": 80975, "epoch": 1927, "val_loss": 67733.3828125} {"train_loss": -6.160050392150879, "global_step": 80976, "epoch": 1928} {"train_loss": -6.1256866455078125, "global_step": 80977, "epoch": 1928} {"train_loss": -6.265120029449463, "global_step": 80978, "epoch": 1928} {"train_loss": -6.239550590515137, "global_step": 80979, "epoch": 1928} {"train_loss": -6.065077781677246, "global_step": 80980, "epoch": 1928} {"train_loss": -6.2172770500183105, "global_step": 80981, "epoch": 1928} {"train_loss": -6.132608890533447, "global_step": 80982, "epoch": 1928} {"train_loss": -6.174119472503662, "global_step": 80983, "epoch": 1928} {"train_loss": -6.229369163513184, "global_step": 80984, "epoch": 1928} {"train_loss": -6.1426496505737305, "global_step": 80985, "epoch": 1928} {"train_loss": -6.183922290802002, "global_step": 80986, "epoch": 1928} {"train_loss": -6.144198417663574, "global_step": 80987, "epoch": 1928} {"train_loss": -6.198004722595215, "global_step": 80988, "epoch": 1928} {"train_loss": -6.2500200271606445, "global_step": 80989, "epoch": 1928} {"train_loss": -6.128951072692871, "global_step": 80990, "epoch": 1928} {"train_loss": -6.294436454772949, "global_step": 80991, "epoch": 1928} {"train_loss": -6.310237884521484, "global_step": 80992, "epoch": 1928} {"train_loss": -6.1861653327941895, "global_step": 80993, "epoch": 1928} {"train_loss": -6.154501914978027, "global_step": 80994, "epoch": 1928} {"train_loss": -6.25637149810791, "global_step": 80995, "epoch": 1928} {"train_loss": -6.206330299377441, "global_step": 80996, "epoch": 1928} {"train_loss": -6.130390644073486, "global_step": 80997, "epoch": 1928} {"train_loss": -6.0618696212768555, "global_step": 80998, "epoch": 1928} {"train_loss": -6.0809783935546875, "global_step": 80999, "epoch": 1928} {"train_loss": -6.0472002029418945, "global_step": 81000, "epoch": 1928} {"train_loss": -6.036846160888672, "global_step": 81001, "epoch": 1928} {"train_loss": -6.055022716522217, "global_step": 81002, "epoch": 1928} {"train_loss": -6.056192398071289, "global_step": 81003, "epoch": 1928} {"train_loss": -6.050595283508301, "global_step": 81004, "epoch": 1928} {"train_loss": -6.091734886169434, "global_step": 81005, "epoch": 1928} {"train_loss": -6.075466156005859, "global_step": 81006, "epoch": 1928} {"train_loss": -6.11177396774292, "global_step": 81007, "epoch": 1928} {"train_loss": -6.019481658935547, "global_step": 81008, "epoch": 1928} {"train_loss": -6.1971330642700195, "global_step": 81009, "epoch": 1928} {"train_loss": -6.094209671020508, "global_step": 81010, "epoch": 1928} {"train_loss": -6.169051170349121, "global_step": 81011, "epoch": 1928} {"train_loss": -6.01148796081543, "global_step": 81012, "epoch": 1928} {"train_loss": -6.14729118347168, "global_step": 81013, "epoch": 1928} {"train_loss": -6.086090087890625, "global_step": 81014, "epoch": 1928} {"train_loss": -6.144913673400879, "global_step": 81015, "epoch": 1928} {"train_loss": -6.156248569488525, "global_step": 81016, "epoch": 1928} {"train_loss": -6.143987280981881, "global_step": 81017, "epoch": 1928, "val_loss": 67687.8515625} {"train_loss": -6.061123371124268, "global_step": 81018, "epoch": 1929} {"train_loss": -6.156291484832764, "global_step": 81019, "epoch": 1929} {"train_loss": -6.193907260894775, "global_step": 81020, "epoch": 1929} {"train_loss": -6.139777183532715, "global_step": 81021, "epoch": 1929} {"train_loss": -6.2552337646484375, "global_step": 81022, "epoch": 1929} {"train_loss": -6.120126247406006, "global_step": 81023, "epoch": 1929} {"train_loss": -6.265481948852539, "global_step": 81024, "epoch": 1929} {"train_loss": -6.086062431335449, "global_step": 81025, "epoch": 1929} {"train_loss": -6.187259197235107, "global_step": 81026, "epoch": 1929} {"train_loss": -6.152252197265625, "global_step": 81027, "epoch": 1929} {"train_loss": -6.063702583312988, "global_step": 81028, "epoch": 1929} {"train_loss": -6.206186294555664, "global_step": 81029, "epoch": 1929} {"train_loss": -6.189976692199707, "global_step": 81030, "epoch": 1929} {"train_loss": -5.959779739379883, "global_step": 81031, "epoch": 1929} {"train_loss": -6.245022296905518, "global_step": 81032, "epoch": 1929} {"train_loss": -6.167333126068115, "global_step": 81033, "epoch": 1929} {"train_loss": -6.054364204406738, "global_step": 81034, "epoch": 1929} {"train_loss": -6.0491251945495605, "global_step": 81035, "epoch": 1929} {"train_loss": -6.045400142669678, "global_step": 81036, "epoch": 1929} {"train_loss": -6.096644401550293, "global_step": 81037, "epoch": 1929} {"train_loss": -6.080187797546387, "global_step": 81038, "epoch": 1929} {"train_loss": -5.995659828186035, "global_step": 81039, "epoch": 1929} {"train_loss": -6.021318435668945, "global_step": 81040, "epoch": 1929} {"train_loss": -6.127830505371094, "global_step": 81041, "epoch": 1929} {"train_loss": -6.123866081237793, "global_step": 81042, "epoch": 1929} {"train_loss": -6.171699047088623, "global_step": 81043, "epoch": 1929} {"train_loss": -6.10481071472168, "global_step": 81044, "epoch": 1929} {"train_loss": -6.10432243347168, "global_step": 81045, "epoch": 1929} {"train_loss": -6.145505905151367, "global_step": 81046, "epoch": 1929} {"train_loss": -6.049848556518555, "global_step": 81047, "epoch": 1929} {"train_loss": -6.028190612792969, "global_step": 81048, "epoch": 1929} {"train_loss": -6.0004191398620605, "global_step": 81049, "epoch": 1929} {"train_loss": -6.0889105796813965, "global_step": 81050, "epoch": 1929} {"train_loss": -6.152295112609863, "global_step": 81051, "epoch": 1929} {"train_loss": -6.073767185211182, "global_step": 81052, "epoch": 1929} {"train_loss": -6.047921657562256, "global_step": 81053, "epoch": 1929} {"train_loss": -6.015593528747559, "global_step": 81054, "epoch": 1929} {"train_loss": -6.079270362854004, "global_step": 81055, "epoch": 1929} {"train_loss": -6.0477190017700195, "global_step": 81056, "epoch": 1929} {"train_loss": -5.94547176361084, "global_step": 81057, "epoch": 1929} {"train_loss": -6.053442001342773, "global_step": 81058, "epoch": 1929} {"train_loss": -6.101045154389881, "global_step": 81059, "epoch": 1929, "val_loss": 67618.0} {"train_loss": -6.14460563659668, "global_step": 81060, "epoch": 1930} {"train_loss": -6.0980939865112305, "global_step": 81061, "epoch": 1930} {"train_loss": -5.97251033782959, "global_step": 81062, "epoch": 1930} {"train_loss": -6.166632652282715, "global_step": 81063, "epoch": 1930} {"train_loss": -6.195500373840332, "global_step": 81064, "epoch": 1930} {"train_loss": -6.052213668823242, "global_step": 81065, "epoch": 1930} {"train_loss": -6.1492156982421875, "global_step": 81066, "epoch": 1930} {"train_loss": -6.065140247344971, "global_step": 81067, "epoch": 1930} {"train_loss": -6.140328407287598, "global_step": 81068, "epoch": 1930} {"train_loss": -6.013855457305908, "global_step": 81069, "epoch": 1930} {"train_loss": -6.134523391723633, "global_step": 81070, "epoch": 1930} {"train_loss": -6.240042209625244, "global_step": 81071, "epoch": 1930} {"train_loss": -6.153966903686523, "global_step": 81072, "epoch": 1930} {"train_loss": -6.218453407287598, "global_step": 81073, "epoch": 1930} {"train_loss": -6.058516502380371, "global_step": 81074, "epoch": 1930} {"train_loss": -6.1181488037109375, "global_step": 81075, "epoch": 1930} {"train_loss": -6.13278865814209, "global_step": 81076, "epoch": 1930} {"train_loss": -6.115633964538574, "global_step": 81077, "epoch": 1930} {"train_loss": -6.1350297927856445, "global_step": 81078, "epoch": 1930} {"train_loss": -6.133704662322998, "global_step": 81079, "epoch": 1930} {"train_loss": -6.087728023529053, "global_step": 81080, "epoch": 1930} {"train_loss": -6.042564868927002, "global_step": 81081, "epoch": 1930} {"train_loss": -5.990050792694092, "global_step": 81082, "epoch": 1930} {"train_loss": -6.101353645324707, "global_step": 81083, "epoch": 1930} {"train_loss": -6.092051029205322, "global_step": 81084, "epoch": 1930} {"train_loss": -6.084317684173584, "global_step": 81085, "epoch": 1930} {"train_loss": -6.116755485534668, "global_step": 81086, "epoch": 1930} {"train_loss": -6.126492500305176, "global_step": 81087, "epoch": 1930} {"train_loss": -6.172604560852051, "global_step": 81088, "epoch": 1930} {"train_loss": -6.1779327392578125, "global_step": 81089, "epoch": 1930} {"train_loss": -6.122249603271484, "global_step": 81090, "epoch": 1930} {"train_loss": -6.0352325439453125, "global_step": 81091, "epoch": 1930} {"train_loss": -6.148236274719238, "global_step": 81092, "epoch": 1930} {"train_loss": -6.167505264282227, "global_step": 81093, "epoch": 1930} {"train_loss": -6.114713668823242, "global_step": 81094, "epoch": 1930} {"train_loss": -6.089071273803711, "global_step": 81095, "epoch": 1930} {"train_loss": -6.134943962097168, "global_step": 81096, "epoch": 1930} {"train_loss": -6.147830963134766, "global_step": 81097, "epoch": 1930} {"train_loss": -6.167638301849365, "global_step": 81098, "epoch": 1930} {"train_loss": -6.077157974243164, "global_step": 81099, "epoch": 1930} {"train_loss": -6.284845352172852, "global_step": 81100, "epoch": 1930} {"train_loss": -6.120201042720249, "global_step": 81101, "epoch": 1930, "val_loss": 67572.8046875} {"train_loss": -6.166345119476318, "global_step": 81102, "epoch": 1931} {"train_loss": -6.2538299560546875, "global_step": 81103, "epoch": 1931} {"train_loss": -6.137200355529785, "global_step": 81104, "epoch": 1931} {"train_loss": -6.252724647521973, "global_step": 81105, "epoch": 1931} {"train_loss": -6.149426460266113, "global_step": 81106, "epoch": 1931} {"train_loss": -6.229731559753418, "global_step": 81107, "epoch": 1931} {"train_loss": -6.102633476257324, "global_step": 81108, "epoch": 1931} {"train_loss": -6.065126419067383, "global_step": 81109, "epoch": 1931} {"train_loss": -6.145824909210205, "global_step": 81110, "epoch": 1931} {"train_loss": -6.160999298095703, "global_step": 81111, "epoch": 1931} {"train_loss": -6.158456802368164, "global_step": 81112, "epoch": 1931} {"train_loss": -6.0101847648620605, "global_step": 81113, "epoch": 1931} {"train_loss": -6.0458550453186035, "global_step": 81114, "epoch": 1931} {"train_loss": -6.236690521240234, "global_step": 81115, "epoch": 1931} {"train_loss": -6.116065979003906, "global_step": 81116, "epoch": 1931} {"train_loss": -6.113229751586914, "global_step": 81117, "epoch": 1931} {"train_loss": -6.179986476898193, "global_step": 81118, "epoch": 1931} {"train_loss": -5.972702980041504, "global_step": 81119, "epoch": 1931} {"train_loss": -6.111368179321289, "global_step": 81120, "epoch": 1931} {"train_loss": -6.128983497619629, "global_step": 81121, "epoch": 1931} {"train_loss": -6.0589704513549805, "global_step": 81122, "epoch": 1931} {"train_loss": -6.029743671417236, "global_step": 81123, "epoch": 1931} {"train_loss": -6.092395305633545, "global_step": 81124, "epoch": 1931} {"train_loss": -6.102384567260742, "global_step": 81125, "epoch": 1931} {"train_loss": -6.192817687988281, "global_step": 81126, "epoch": 1931} {"train_loss": -6.121756553649902, "global_step": 81127, "epoch": 1931} {"train_loss": -6.160185813903809, "global_step": 81128, "epoch": 1931} {"train_loss": -6.140014171600342, "global_step": 81129, "epoch": 1931} {"train_loss": -6.0740461349487305, "global_step": 81130, "epoch": 1931} {"train_loss": -6.215100288391113, "global_step": 81131, "epoch": 1931} {"train_loss": -6.204330921173096, "global_step": 81132, "epoch": 1931} {"train_loss": -6.119606971740723, "global_step": 81133, "epoch": 1931} {"train_loss": -6.206744194030762, "global_step": 81134, "epoch": 1931} {"train_loss": -6.038619041442871, "global_step": 81135, "epoch": 1931} {"train_loss": -6.091840744018555, "global_step": 81136, "epoch": 1931} {"train_loss": -6.079244613647461, "global_step": 81137, "epoch": 1931} {"train_loss": -6.044527053833008, "global_step": 81138, "epoch": 1931} {"train_loss": -6.089834213256836, "global_step": 81139, "epoch": 1931} {"train_loss": -6.161015033721924, "global_step": 81140, "epoch": 1931} {"train_loss": -6.061595439910889, "global_step": 81141, "epoch": 1931} {"train_loss": -6.076147079467773, "global_step": 81142, "epoch": 1931} {"train_loss": -6.126472223372686, "global_step": 81143, "epoch": 1931, "val_loss": 67620.71875} {"train_loss": -6.068622589111328, "global_step": 81144, "epoch": 1932} {"train_loss": -6.199247360229492, "global_step": 81145, "epoch": 1932} {"train_loss": -6.144619464874268, "global_step": 81146, "epoch": 1932} {"train_loss": -6.194910526275635, "global_step": 81147, "epoch": 1932} {"train_loss": -6.210521221160889, "global_step": 81148, "epoch": 1932} {"train_loss": -5.969308376312256, "global_step": 81149, "epoch": 1932} {"train_loss": -6.124659538269043, "global_step": 81150, "epoch": 1932} {"train_loss": -6.0505475997924805, "global_step": 81151, "epoch": 1932} {"train_loss": -6.172001361846924, "global_step": 81152, "epoch": 1932} {"train_loss": -6.163425922393799, "global_step": 81153, "epoch": 1932} {"train_loss": -6.188676357269287, "global_step": 81154, "epoch": 1932} {"train_loss": -6.218859672546387, "global_step": 81155, "epoch": 1932} {"train_loss": -6.178002834320068, "global_step": 81156, "epoch": 1932} {"train_loss": -6.230037689208984, "global_step": 81157, "epoch": 1932} {"train_loss": -6.087366104125977, "global_step": 81158, "epoch": 1932} {"train_loss": -6.056831359863281, "global_step": 81159, "epoch": 1932} {"train_loss": -6.205390930175781, "global_step": 81160, "epoch": 1932} {"train_loss": -6.057437419891357, "global_step": 81161, "epoch": 1932} {"train_loss": -6.108386039733887, "global_step": 81162, "epoch": 1932} {"train_loss": -6.038759231567383, "global_step": 81163, "epoch": 1932} {"train_loss": -6.182795524597168, "global_step": 81164, "epoch": 1932} {"train_loss": -6.164575099945068, "global_step": 81165, "epoch": 1932} {"train_loss": -6.239736557006836, "global_step": 81166, "epoch": 1932} {"train_loss": -6.1584858894348145, "global_step": 81167, "epoch": 1932} {"train_loss": -6.2451934814453125, "global_step": 81168, "epoch": 1932} {"train_loss": -5.8256025314331055, "global_step": 81169, "epoch": 1932} {"train_loss": -6.141326904296875, "global_step": 81170, "epoch": 1932} {"train_loss": -6.213921546936035, "global_step": 81171, "epoch": 1932} {"train_loss": -6.172580242156982, "global_step": 81172, "epoch": 1932} {"train_loss": -6.054190635681152, "global_step": 81173, "epoch": 1932} {"train_loss": -6.027157306671143, "global_step": 81174, "epoch": 1932} {"train_loss": -6.107274055480957, "global_step": 81175, "epoch": 1932} {"train_loss": -6.023683071136475, "global_step": 81176, "epoch": 1932} {"train_loss": -6.097232818603516, "global_step": 81177, "epoch": 1932} {"train_loss": -6.141689777374268, "global_step": 81178, "epoch": 1932} {"train_loss": -6.278356075286865, "global_step": 81179, "epoch": 1932} {"train_loss": -6.162919521331787, "global_step": 81180, "epoch": 1932} {"train_loss": -6.1113739013671875, "global_step": 81181, "epoch": 1932} {"train_loss": -6.179078578948975, "global_step": 81182, "epoch": 1932} {"train_loss": -6.1970367431640625, "global_step": 81183, "epoch": 1932} {"train_loss": -6.136762619018555, "global_step": 81184, "epoch": 1932} {"train_loss": -6.135654199691046, "global_step": 81185, "epoch": 1932, "val_loss": 67547.1953125} {"train_loss": -6.065980911254883, "global_step": 81186, "epoch": 1933} {"train_loss": -6.17777156829834, "global_step": 81187, "epoch": 1933} {"train_loss": -6.251357078552246, "global_step": 81188, "epoch": 1933} {"train_loss": -6.143880367279053, "global_step": 81189, "epoch": 1933} {"train_loss": -6.177918910980225, "global_step": 81190, "epoch": 1933} {"train_loss": -6.181719779968262, "global_step": 81191, "epoch": 1933} {"train_loss": -6.218348026275635, "global_step": 81192, "epoch": 1933} {"train_loss": -6.1853790283203125, "global_step": 81193, "epoch": 1933} {"train_loss": -6.091517448425293, "global_step": 81194, "epoch": 1933} {"train_loss": -6.139273643493652, "global_step": 81195, "epoch": 1933} {"train_loss": -6.072107315063477, "global_step": 81196, "epoch": 1933} {"train_loss": -6.223326683044434, "global_step": 81197, "epoch": 1933} {"train_loss": -6.13339900970459, "global_step": 81198, "epoch": 1933} {"train_loss": -6.1961669921875, "global_step": 81199, "epoch": 1933} {"train_loss": -6.155182838439941, "global_step": 81200, "epoch": 1933} {"train_loss": -6.083292484283447, "global_step": 81201, "epoch": 1933} {"train_loss": -6.245814800262451, "global_step": 81202, "epoch": 1933} {"train_loss": -6.141026020050049, "global_step": 81203, "epoch": 1933} {"train_loss": -6.170749664306641, "global_step": 81204, "epoch": 1933} {"train_loss": -6.092772960662842, "global_step": 81205, "epoch": 1933} {"train_loss": -6.237464427947998, "global_step": 81206, "epoch": 1933} {"train_loss": -6.076695919036865, "global_step": 81207, "epoch": 1933} {"train_loss": -6.1664910316467285, "global_step": 81208, "epoch": 1933} {"train_loss": -6.118099212646484, "global_step": 81209, "epoch": 1933} {"train_loss": -6.078117370605469, "global_step": 81210, "epoch": 1933} {"train_loss": -6.194338798522949, "global_step": 81211, "epoch": 1933} {"train_loss": -6.149990558624268, "global_step": 81212, "epoch": 1933} {"train_loss": -6.158301830291748, "global_step": 81213, "epoch": 1933} {"train_loss": -6.234579086303711, "global_step": 81214, "epoch": 1933} {"train_loss": -6.118408203125, "global_step": 81215, "epoch": 1933} {"train_loss": -6.14501428604126, "global_step": 81216, "epoch": 1933} {"train_loss": -6.221012592315674, "global_step": 81217, "epoch": 1933} {"train_loss": -5.966764450073242, "global_step": 81218, "epoch": 1933} {"train_loss": -6.062342643737793, "global_step": 81219, "epoch": 1933} {"train_loss": -6.049177169799805, "global_step": 81220, "epoch": 1933} {"train_loss": -6.052891731262207, "global_step": 81221, "epoch": 1933} {"train_loss": -6.081554412841797, "global_step": 81222, "epoch": 1933} {"train_loss": -5.981655597686768, "global_step": 81223, "epoch": 1933} {"train_loss": -6.21987247467041, "global_step": 81224, "epoch": 1933} {"train_loss": -6.070806503295898, "global_step": 81225, "epoch": 1933} {"train_loss": -6.181554794311523, "global_step": 81226, "epoch": 1933} {"train_loss": -6.137582336153303, "global_step": 81227, "epoch": 1933, "val_loss": 67764.125} {"train_loss": -6.07614803314209, "global_step": 81228, "epoch": 1934} {"train_loss": -6.144944190979004, "global_step": 81229, "epoch": 1934} {"train_loss": -6.035522937774658, "global_step": 81230, "epoch": 1934} {"train_loss": -6.1714067459106445, "global_step": 81231, "epoch": 1934} {"train_loss": -6.215824604034424, "global_step": 81232, "epoch": 1934} {"train_loss": -6.089159965515137, "global_step": 81233, "epoch": 1934} {"train_loss": -6.01753044128418, "global_step": 81234, "epoch": 1934} {"train_loss": -6.033688545227051, "global_step": 81235, "epoch": 1934} {"train_loss": -6.182041168212891, "global_step": 81236, "epoch": 1934} {"train_loss": -6.098354339599609, "global_step": 81237, "epoch": 1934} {"train_loss": -6.170685768127441, "global_step": 81238, "epoch": 1934} {"train_loss": -6.1620659828186035, "global_step": 81239, "epoch": 1934} {"train_loss": -6.148656845092773, "global_step": 81240, "epoch": 1934} {"train_loss": -6.162728309631348, "global_step": 81241, "epoch": 1934} {"train_loss": -6.021379470825195, "global_step": 81242, "epoch": 1934} {"train_loss": -6.132875442504883, "global_step": 81243, "epoch": 1934} {"train_loss": -6.074038505554199, "global_step": 81244, "epoch": 1934} {"train_loss": -6.053614139556885, "global_step": 81245, "epoch": 1934} {"train_loss": -6.178866386413574, "global_step": 81246, "epoch": 1934} {"train_loss": -6.167325973510742, "global_step": 81247, "epoch": 1934} {"train_loss": -6.285696029663086, "global_step": 81248, "epoch": 1934} {"train_loss": -6.154209136962891, "global_step": 81249, "epoch": 1934} {"train_loss": -6.022149562835693, "global_step": 81250, "epoch": 1934} {"train_loss": -6.164424896240234, "global_step": 81251, "epoch": 1934} {"train_loss": -6.0516581535339355, "global_step": 81252, "epoch": 1934} {"train_loss": -6.084510803222656, "global_step": 81253, "epoch": 1934} {"train_loss": -6.111942291259766, "global_step": 81254, "epoch": 1934} {"train_loss": -6.004613399505615, "global_step": 81255, "epoch": 1934} {"train_loss": -6.103053092956543, "global_step": 81256, "epoch": 1934} {"train_loss": -6.0896992683410645, "global_step": 81257, "epoch": 1934} {"train_loss": -6.159437656402588, "global_step": 81258, "epoch": 1934} {"train_loss": -5.992673873901367, "global_step": 81259, "epoch": 1934} {"train_loss": -6.072766304016113, "global_step": 81260, "epoch": 1934} {"train_loss": -6.094208717346191, "global_step": 81261, "epoch": 1934} {"train_loss": -6.146420001983643, "global_step": 81262, "epoch": 1934} {"train_loss": -6.08817720413208, "global_step": 81263, "epoch": 1934} {"train_loss": -6.143091201782227, "global_step": 81264, "epoch": 1934} {"train_loss": -6.131172180175781, "global_step": 81265, "epoch": 1934} {"train_loss": -6.213159561157227, "global_step": 81266, "epoch": 1934} {"train_loss": -6.151703834533691, "global_step": 81267, "epoch": 1934} {"train_loss": -6.1742095947265625, "global_step": 81268, "epoch": 1934} {"train_loss": -6.1168028854188465, "global_step": 81269, "epoch": 1934, "val_loss": 67419.390625} {"train_loss": -6.233151435852051, "global_step": 81270, "epoch": 1935} {"train_loss": -6.191588401794434, "global_step": 81271, "epoch": 1935} {"train_loss": -6.218631744384766, "global_step": 81272, "epoch": 1935} {"train_loss": -6.031126022338867, "global_step": 81273, "epoch": 1935} {"train_loss": -6.1039204597473145, "global_step": 81274, "epoch": 1935} {"train_loss": -6.170411109924316, "global_step": 81275, "epoch": 1935} {"train_loss": -6.129921913146973, "global_step": 81276, "epoch": 1935} {"train_loss": -6.066758155822754, "global_step": 81277, "epoch": 1935} {"train_loss": -5.984156131744385, "global_step": 81278, "epoch": 1935} {"train_loss": -6.069838523864746, "global_step": 81279, "epoch": 1935} {"train_loss": -6.1089558601379395, "global_step": 81280, "epoch": 1935} {"train_loss": -6.066300392150879, "global_step": 81281, "epoch": 1935} {"train_loss": -6.139951229095459, "global_step": 81282, "epoch": 1935} {"train_loss": -6.084117889404297, "global_step": 81283, "epoch": 1935} {"train_loss": -6.090787887573242, "global_step": 81284, "epoch": 1935} {"train_loss": -6.11451530456543, "global_step": 81285, "epoch": 1935} {"train_loss": -6.069367408752441, "global_step": 81286, "epoch": 1935} {"train_loss": -6.108076095581055, "global_step": 81287, "epoch": 1935} {"train_loss": -6.189384460449219, "global_step": 81288, "epoch": 1935} {"train_loss": -6.101686477661133, "global_step": 81289, "epoch": 1935} {"train_loss": -6.2619757652282715, "global_step": 81290, "epoch": 1935} {"train_loss": -6.051069736480713, "global_step": 81291, "epoch": 1935} {"train_loss": -6.155705451965332, "global_step": 81292, "epoch": 1935} {"train_loss": -6.20526647567749, "global_step": 81293, "epoch": 1935} {"train_loss": -6.214128017425537, "global_step": 81294, "epoch": 1935} {"train_loss": -6.260875701904297, "global_step": 81295, "epoch": 1935} {"train_loss": -6.224617958068848, "global_step": 81296, "epoch": 1935} {"train_loss": -6.2329912185668945, "global_step": 81297, "epoch": 1935} {"train_loss": -6.203761100769043, "global_step": 81298, "epoch": 1935} {"train_loss": -6.107973098754883, "global_step": 81299, "epoch": 1935} {"train_loss": -6.127824783325195, "global_step": 81300, "epoch": 1935} {"train_loss": -6.193509101867676, "global_step": 81301, "epoch": 1935} {"train_loss": -6.085997104644775, "global_step": 81302, "epoch": 1935} {"train_loss": -6.209575176239014, "global_step": 81303, "epoch": 1935} {"train_loss": -6.116660118103027, "global_step": 81304, "epoch": 1935} {"train_loss": -6.07352876663208, "global_step": 81305, "epoch": 1935} {"train_loss": -6.1724629402160645, "global_step": 81306, "epoch": 1935} {"train_loss": -6.310641288757324, "global_step": 81307, "epoch": 1935} {"train_loss": -6.200484275817871, "global_step": 81308, "epoch": 1935} {"train_loss": -6.223766326904297, "global_step": 81309, "epoch": 1935} {"train_loss": -6.00834846496582, "global_step": 81310, "epoch": 1935} {"train_loss": -6.144187223343622, "global_step": 81311, "epoch": 1935, "val_loss": 67886.3046875} {"train_loss": -6.155222415924072, "global_step": 81312, "epoch": 1936} {"train_loss": -6.074619293212891, "global_step": 81313, "epoch": 1936} {"train_loss": -6.121288299560547, "global_step": 81314, "epoch": 1936} {"train_loss": -6.104870796203613, "global_step": 81315, "epoch": 1936} {"train_loss": -6.262537002563477, "global_step": 81316, "epoch": 1936} {"train_loss": -6.107019424438477, "global_step": 81317, "epoch": 1936} {"train_loss": -6.170967102050781, "global_step": 81318, "epoch": 1936} {"train_loss": -6.215655326843262, "global_step": 81319, "epoch": 1936} {"train_loss": -6.125514030456543, "global_step": 81320, "epoch": 1936} {"train_loss": -6.157042503356934, "global_step": 81321, "epoch": 1936} {"train_loss": -6.101245880126953, "global_step": 81322, "epoch": 1936} {"train_loss": -6.1953654289245605, "global_step": 81323, "epoch": 1936} {"train_loss": -6.217822551727295, "global_step": 81324, "epoch": 1936} {"train_loss": -6.2615461349487305, "global_step": 81325, "epoch": 1936} {"train_loss": -6.017951488494873, "global_step": 81326, "epoch": 1936} {"train_loss": -6.233204364776611, "global_step": 81327, "epoch": 1936} {"train_loss": -6.18613338470459, "global_step": 81328, "epoch": 1936} {"train_loss": -6.184792518615723, "global_step": 81329, "epoch": 1936} {"train_loss": -6.06257438659668, "global_step": 81330, "epoch": 1936} {"train_loss": -6.191888332366943, "global_step": 81331, "epoch": 1936} {"train_loss": -6.087990760803223, "global_step": 81332, "epoch": 1936} {"train_loss": -6.20683479309082, "global_step": 81333, "epoch": 1936} {"train_loss": -6.120752811431885, "global_step": 81334, "epoch": 1936} {"train_loss": -5.936435222625732, "global_step": 81335, "epoch": 1936} {"train_loss": -6.200621604919434, "global_step": 81336, "epoch": 1936} {"train_loss": -6.001101016998291, "global_step": 81337, "epoch": 1936} {"train_loss": -6.13029146194458, "global_step": 81338, "epoch": 1936} {"train_loss": -5.97215461730957, "global_step": 81339, "epoch": 1936} {"train_loss": -6.1776580810546875, "global_step": 81340, "epoch": 1936} {"train_loss": -6.172046661376953, "global_step": 81341, "epoch": 1936} {"train_loss": -6.104249954223633, "global_step": 81342, "epoch": 1936} {"train_loss": -6.211198806762695, "global_step": 81343, "epoch": 1936} {"train_loss": -6.231550693511963, "global_step": 81344, "epoch": 1936} {"train_loss": -6.24743127822876, "global_step": 81345, "epoch": 1936} {"train_loss": -6.178890705108643, "global_step": 81346, "epoch": 1936} {"train_loss": -6.141678333282471, "global_step": 81347, "epoch": 1936} {"train_loss": -6.218212127685547, "global_step": 81348, "epoch": 1936} {"train_loss": -6.158815383911133, "global_step": 81349, "epoch": 1936} {"train_loss": -6.157783508300781, "global_step": 81350, "epoch": 1936} {"train_loss": -6.231761455535889, "global_step": 81351, "epoch": 1936} {"train_loss": -6.174527168273926, "global_step": 81352, "epoch": 1936} {"train_loss": -6.151493288221813, "global_step": 81353, "epoch": 1936, "val_loss": 67672.6171875} {"train_loss": -6.185143947601318, "global_step": 81354, "epoch": 1937} {"train_loss": -6.082520484924316, "global_step": 81355, "epoch": 1937} {"train_loss": -6.234374046325684, "global_step": 81356, "epoch": 1937} {"train_loss": -6.138459205627441, "global_step": 81357, "epoch": 1937} {"train_loss": -6.100940704345703, "global_step": 81358, "epoch": 1937} {"train_loss": -6.252663612365723, "global_step": 81359, "epoch": 1937} {"train_loss": -6.140435218811035, "global_step": 81360, "epoch": 1937} {"train_loss": -6.170478343963623, "global_step": 81361, "epoch": 1937} {"train_loss": -6.1464996337890625, "global_step": 81362, "epoch": 1937} {"train_loss": -6.180253982543945, "global_step": 81363, "epoch": 1937} {"train_loss": -6.314523696899414, "global_step": 81364, "epoch": 1937} {"train_loss": -6.169772148132324, "global_step": 81365, "epoch": 1937} {"train_loss": -6.113175868988037, "global_step": 81366, "epoch": 1937} {"train_loss": -6.182411193847656, "global_step": 81367, "epoch": 1937} {"train_loss": -6.120047092437744, "global_step": 81368, "epoch": 1937} {"train_loss": -6.258595943450928, "global_step": 81369, "epoch": 1937} {"train_loss": -6.169421195983887, "global_step": 81370, "epoch": 1937} {"train_loss": -6.185016632080078, "global_step": 81371, "epoch": 1937} {"train_loss": -6.181695938110352, "global_step": 81372, "epoch": 1937} {"train_loss": -6.283538818359375, "global_step": 81373, "epoch": 1937} {"train_loss": -6.136905193328857, "global_step": 81374, "epoch": 1937} {"train_loss": -6.076576232910156, "global_step": 81375, "epoch": 1937} {"train_loss": -6.176894187927246, "global_step": 81376, "epoch": 1937} {"train_loss": -6.250949382781982, "global_step": 81377, "epoch": 1937} {"train_loss": -6.028409957885742, "global_step": 81378, "epoch": 1937} {"train_loss": -6.095609664916992, "global_step": 81379, "epoch": 1937} {"train_loss": -6.219738483428955, "global_step": 81380, "epoch": 1937} {"train_loss": -6.114131927490234, "global_step": 81381, "epoch": 1937} {"train_loss": -6.242816925048828, "global_step": 81382, "epoch": 1937} {"train_loss": -6.133438587188721, "global_step": 81383, "epoch": 1937} {"train_loss": -6.074674606323242, "global_step": 81384, "epoch": 1937} {"train_loss": -6.043499946594238, "global_step": 81385, "epoch": 1937} {"train_loss": -6.136201858520508, "global_step": 81386, "epoch": 1937} {"train_loss": -6.056950569152832, "global_step": 81387, "epoch": 1937} {"train_loss": -6.088206768035889, "global_step": 81388, "epoch": 1937} {"train_loss": -6.095092296600342, "global_step": 81389, "epoch": 1937} {"train_loss": -6.157634258270264, "global_step": 81390, "epoch": 1937} {"train_loss": -6.123069763183594, "global_step": 81391, "epoch": 1937} {"train_loss": -6.111598014831543, "global_step": 81392, "epoch": 1937} {"train_loss": -6.194952964782715, "global_step": 81393, "epoch": 1937} {"train_loss": -6.242871284484863, "global_step": 81394, "epoch": 1937} {"train_loss": -6.154811166581654, "global_step": 81395, "epoch": 1937, "val_loss": 67849.265625} {"train_loss": -6.087395668029785, "global_step": 81396, "epoch": 1938} {"train_loss": -6.109091758728027, "global_step": 81397, "epoch": 1938} {"train_loss": -6.271405220031738, "global_step": 81398, "epoch": 1938} {"train_loss": -6.067625999450684, "global_step": 81399, "epoch": 1938} {"train_loss": -6.125946998596191, "global_step": 81400, "epoch": 1938} {"train_loss": -6.186611175537109, "global_step": 81401, "epoch": 1938} {"train_loss": -5.9972686767578125, "global_step": 81402, "epoch": 1938} {"train_loss": -6.220815181732178, "global_step": 81403, "epoch": 1938} {"train_loss": -6.274728775024414, "global_step": 81404, "epoch": 1938} {"train_loss": -6.0297417640686035, "global_step": 81405, "epoch": 1938} {"train_loss": -6.116451740264893, "global_step": 81406, "epoch": 1938} {"train_loss": -6.128073215484619, "global_step": 81407, "epoch": 1938} {"train_loss": -6.062984943389893, "global_step": 81408, "epoch": 1938} {"train_loss": -6.078127384185791, "global_step": 81409, "epoch": 1938} {"train_loss": -6.1190185546875, "global_step": 81410, "epoch": 1938} {"train_loss": -6.045334339141846, "global_step": 81411, "epoch": 1938} {"train_loss": -6.138127326965332, "global_step": 81412, "epoch": 1938} {"train_loss": -6.208113670349121, "global_step": 81413, "epoch": 1938} {"train_loss": -6.092040061950684, "global_step": 81414, "epoch": 1938} {"train_loss": -6.204512596130371, "global_step": 81415, "epoch": 1938} {"train_loss": -6.171322822570801, "global_step": 81416, "epoch": 1938} {"train_loss": -6.033481121063232, "global_step": 81417, "epoch": 1938} {"train_loss": -6.139821529388428, "global_step": 81418, "epoch": 1938} {"train_loss": -6.0750017166137695, "global_step": 81419, "epoch": 1938} {"train_loss": -6.233129501342773, "global_step": 81420, "epoch": 1938} {"train_loss": -6.019683837890625, "global_step": 81421, "epoch": 1938} {"train_loss": -6.2707438468933105, "global_step": 81422, "epoch": 1938} {"train_loss": -6.133208274841309, "global_step": 81423, "epoch": 1938} {"train_loss": -6.281646728515625, "global_step": 81424, "epoch": 1938} {"train_loss": -6.066623687744141, "global_step": 81425, "epoch": 1938} {"train_loss": -6.2274065017700195, "global_step": 81426, "epoch": 1938} {"train_loss": -6.036327362060547, "global_step": 81427, "epoch": 1938} {"train_loss": -6.122209548950195, "global_step": 81428, "epoch": 1938} {"train_loss": -6.10321569442749, "global_step": 81429, "epoch": 1938} {"train_loss": -6.084537506103516, "global_step": 81430, "epoch": 1938} {"train_loss": -6.099695205688477, "global_step": 81431, "epoch": 1938} {"train_loss": -6.215518474578857, "global_step": 81432, "epoch": 1938} {"train_loss": -6.038042068481445, "global_step": 81433, "epoch": 1938} {"train_loss": -6.113561630249023, "global_step": 81434, "epoch": 1938} {"train_loss": -6.14129638671875, "global_step": 81435, "epoch": 1938} {"train_loss": -6.034268379211426, "global_step": 81436, "epoch": 1938} {"train_loss": -6.127030383972895, "global_step": 81437, "epoch": 1938, "val_loss": 67824.9453125} {"train_loss": -6.022119522094727, "global_step": 81438, "epoch": 1939} {"train_loss": -6.071149826049805, "global_step": 81439, "epoch": 1939} {"train_loss": -6.021844863891602, "global_step": 81440, "epoch": 1939} {"train_loss": -6.12954044342041, "global_step": 81441, "epoch": 1939} {"train_loss": -6.030433654785156, "global_step": 81442, "epoch": 1939} {"train_loss": -6.097381591796875, "global_step": 81443, "epoch": 1939} {"train_loss": -6.17362642288208, "global_step": 81444, "epoch": 1939} {"train_loss": -5.99467658996582, "global_step": 81445, "epoch": 1939} {"train_loss": -6.150114059448242, "global_step": 81446, "epoch": 1939} {"train_loss": -6.077541351318359, "global_step": 81447, "epoch": 1939} {"train_loss": -5.976762294769287, "global_step": 81448, "epoch": 1939} {"train_loss": -6.062249660491943, "global_step": 81449, "epoch": 1939} {"train_loss": -6.147285461425781, "global_step": 81450, "epoch": 1939} {"train_loss": -6.211404323577881, "global_step": 81451, "epoch": 1939} {"train_loss": -6.166504859924316, "global_step": 81452, "epoch": 1939} {"train_loss": -6.171733856201172, "global_step": 81453, "epoch": 1939} {"train_loss": -6.090338706970215, "global_step": 81454, "epoch": 1939} {"train_loss": -6.0464043617248535, "global_step": 81455, "epoch": 1939} {"train_loss": -6.039037227630615, "global_step": 81456, "epoch": 1939} {"train_loss": -6.120522975921631, "global_step": 81457, "epoch": 1939} {"train_loss": -6.096508026123047, "global_step": 81458, "epoch": 1939} {"train_loss": -6.22615909576416, "global_step": 81459, "epoch": 1939} {"train_loss": -6.020198822021484, "global_step": 81460, "epoch": 1939} {"train_loss": -6.154514312744141, "global_step": 81461, "epoch": 1939} {"train_loss": -6.200916290283203, "global_step": 81462, "epoch": 1939} {"train_loss": -6.183791160583496, "global_step": 81463, "epoch": 1939} {"train_loss": -6.264060020446777, "global_step": 81464, "epoch": 1939} {"train_loss": -6.153661727905273, "global_step": 81465, "epoch": 1939} {"train_loss": -6.048793315887451, "global_step": 81466, "epoch": 1939} {"train_loss": -6.204287528991699, "global_step": 81467, "epoch": 1939} {"train_loss": -6.209122657775879, "global_step": 81468, "epoch": 1939} {"train_loss": -6.062943458557129, "global_step": 81469, "epoch": 1939} {"train_loss": -6.098154544830322, "global_step": 81470, "epoch": 1939} {"train_loss": -6.093160629272461, "global_step": 81471, "epoch": 1939} {"train_loss": -6.146759510040283, "global_step": 81472, "epoch": 1939} {"train_loss": -6.237021446228027, "global_step": 81473, "epoch": 1939} {"train_loss": -6.139936447143555, "global_step": 81474, "epoch": 1939} {"train_loss": -6.157238483428955, "global_step": 81475, "epoch": 1939} {"train_loss": -6.065625190734863, "global_step": 81476, "epoch": 1939} {"train_loss": -6.103480815887451, "global_step": 81477, "epoch": 1939} {"train_loss": -6.176344871520996, "global_step": 81478, "epoch": 1939} {"train_loss": -6.119237105051677, "global_step": 81479, "epoch": 1939, "val_loss": 67526.3125} {"train_loss": -6.1851911544799805, "global_step": 81480, "epoch": 1940} {"train_loss": -6.124111175537109, "global_step": 81481, "epoch": 1940} {"train_loss": -6.062575817108154, "global_step": 81482, "epoch": 1940} {"train_loss": -6.218274116516113, "global_step": 81483, "epoch": 1940} {"train_loss": -6.131536483764648, "global_step": 81484, "epoch": 1940} {"train_loss": -6.196297645568848, "global_step": 81485, "epoch": 1940} {"train_loss": -6.265843391418457, "global_step": 81486, "epoch": 1940} {"train_loss": -6.118607044219971, "global_step": 81487, "epoch": 1940} {"train_loss": -6.217622756958008, "global_step": 81488, "epoch": 1940} {"train_loss": -6.16546106338501, "global_step": 81489, "epoch": 1940} {"train_loss": -6.0698957443237305, "global_step": 81490, "epoch": 1940} {"train_loss": -6.188043594360352, "global_step": 81491, "epoch": 1940} {"train_loss": -6.242162227630615, "global_step": 81492, "epoch": 1940} {"train_loss": -6.1457905769348145, "global_step": 81493, "epoch": 1940} {"train_loss": -6.057736396789551, "global_step": 81494, "epoch": 1940} {"train_loss": -6.133576393127441, "global_step": 81495, "epoch": 1940} {"train_loss": -6.143302917480469, "global_step": 81496, "epoch": 1940} {"train_loss": -6.001213550567627, "global_step": 81497, "epoch": 1940} {"train_loss": -6.0171051025390625, "global_step": 81498, "epoch": 1940} {"train_loss": -6.048242568969727, "global_step": 81499, "epoch": 1940} {"train_loss": -6.310300350189209, "global_step": 81500, "epoch": 1940} {"train_loss": -6.173214912414551, "global_step": 81501, "epoch": 1940} {"train_loss": -6.122916221618652, "global_step": 81502, "epoch": 1940} {"train_loss": -6.2699480056762695, "global_step": 81503, "epoch": 1940} {"train_loss": -6.13220739364624, "global_step": 81504, "epoch": 1940} {"train_loss": -6.015607833862305, "global_step": 81505, "epoch": 1940} {"train_loss": -5.989556312561035, "global_step": 81506, "epoch": 1940} {"train_loss": -6.146444797515869, "global_step": 81507, "epoch": 1940} {"train_loss": -6.233425617218018, "global_step": 81508, "epoch": 1940} {"train_loss": -6.0424065589904785, "global_step": 81509, "epoch": 1940} {"train_loss": -6.109600067138672, "global_step": 81510, "epoch": 1940} {"train_loss": -6.204730987548828, "global_step": 81511, "epoch": 1940} {"train_loss": -6.240542411804199, "global_step": 81512, "epoch": 1940} {"train_loss": -6.139439582824707, "global_step": 81513, "epoch": 1940} {"train_loss": -6.1962127685546875, "global_step": 81514, "epoch": 1940} {"train_loss": -6.238554000854492, "global_step": 81515, "epoch": 1940} {"train_loss": -6.119476318359375, "global_step": 81516, "epoch": 1940} {"train_loss": -6.166818141937256, "global_step": 81517, "epoch": 1940} {"train_loss": -6.155788898468018, "global_step": 81518, "epoch": 1940} {"train_loss": -6.072636604309082, "global_step": 81519, "epoch": 1940} {"train_loss": -6.170077323913574, "global_step": 81520, "epoch": 1940} {"train_loss": -6.145331746055966, "global_step": 81521, "epoch": 1940, "val_loss": 67556.421875} {"train_loss": -6.128264904022217, "global_step": 81522, "epoch": 1941} {"train_loss": -6.044921875, "global_step": 81523, "epoch": 1941} {"train_loss": -6.126676559448242, "global_step": 81524, "epoch": 1941} {"train_loss": -6.165713310241699, "global_step": 81525, "epoch": 1941} {"train_loss": -6.028727054595947, "global_step": 81526, "epoch": 1941} {"train_loss": -6.111127853393555, "global_step": 81527, "epoch": 1941} {"train_loss": -6.1295952796936035, "global_step": 81528, "epoch": 1941} {"train_loss": -6.213266372680664, "global_step": 81529, "epoch": 1941} {"train_loss": -6.159725189208984, "global_step": 81530, "epoch": 1941} {"train_loss": -6.023133277893066, "global_step": 81531, "epoch": 1941} {"train_loss": -6.170340538024902, "global_step": 81532, "epoch": 1941} {"train_loss": -6.242036819458008, "global_step": 81533, "epoch": 1941} {"train_loss": -6.033570766448975, "global_step": 81534, "epoch": 1941} {"train_loss": -6.163853645324707, "global_step": 81535, "epoch": 1941} {"train_loss": -6.12847375869751, "global_step": 81536, "epoch": 1941} {"train_loss": -5.883711814880371, "global_step": 81537, "epoch": 1941} {"train_loss": -6.074459075927734, "global_step": 81538, "epoch": 1941} {"train_loss": -6.096682548522949, "global_step": 81539, "epoch": 1941} {"train_loss": -6.046032428741455, "global_step": 81540, "epoch": 1941} {"train_loss": -6.070522785186768, "global_step": 81541, "epoch": 1941} {"train_loss": -5.940141677856445, "global_step": 81542, "epoch": 1941} {"train_loss": -6.273385524749756, "global_step": 81543, "epoch": 1941} {"train_loss": -5.992188453674316, "global_step": 81544, "epoch": 1941} {"train_loss": -6.090790748596191, "global_step": 81545, "epoch": 1941} {"train_loss": -5.98575496673584, "global_step": 81546, "epoch": 1941} {"train_loss": -6.179901123046875, "global_step": 81547, "epoch": 1941} {"train_loss": -6.171895980834961, "global_step": 81548, "epoch": 1941} {"train_loss": -6.0876946449279785, "global_step": 81549, "epoch": 1941} {"train_loss": -6.105434417724609, "global_step": 81550, "epoch": 1941} {"train_loss": -6.0664496421813965, "global_step": 81551, "epoch": 1941} {"train_loss": -6.045466423034668, "global_step": 81552, "epoch": 1941} {"train_loss": -6.0365190505981445, "global_step": 81553, "epoch": 1941} {"train_loss": -6.212307929992676, "global_step": 81554, "epoch": 1941} {"train_loss": -6.042737007141113, "global_step": 81555, "epoch": 1941} {"train_loss": -6.152477741241455, "global_step": 81556, "epoch": 1941} {"train_loss": -6.061028003692627, "global_step": 81557, "epoch": 1941} {"train_loss": -6.077931880950928, "global_step": 81558, "epoch": 1941} {"train_loss": -5.976483345031738, "global_step": 81559, "epoch": 1941} {"train_loss": -6.041790008544922, "global_step": 81560, "epoch": 1941} {"train_loss": -6.036714553833008, "global_step": 81561, "epoch": 1941} {"train_loss": -5.975081920623779, "global_step": 81562, "epoch": 1941} {"train_loss": -6.089503901345389, "global_step": 81563, "epoch": 1941, "val_loss": 67892.078125} {"train_loss": -6.110815048217773, "global_step": 81564, "epoch": 1942} {"train_loss": -6.159456729888916, "global_step": 81565, "epoch": 1942} {"train_loss": -6.127692699432373, "global_step": 81566, "epoch": 1942} {"train_loss": -6.173462867736816, "global_step": 81567, "epoch": 1942} {"train_loss": -6.1218461990356445, "global_step": 81568, "epoch": 1942} {"train_loss": -6.049308776855469, "global_step": 81569, "epoch": 1942} {"train_loss": -6.129903793334961, "global_step": 81570, "epoch": 1942} {"train_loss": -6.033427715301514, "global_step": 81571, "epoch": 1942} {"train_loss": -6.080236911773682, "global_step": 81572, "epoch": 1942} {"train_loss": -6.080286979675293, "global_step": 81573, "epoch": 1942} {"train_loss": -6.104121208190918, "global_step": 81574, "epoch": 1942} {"train_loss": -6.137972831726074, "global_step": 81575, "epoch": 1942} {"train_loss": -6.189252853393555, "global_step": 81576, "epoch": 1942} {"train_loss": -6.1607561111450195, "global_step": 81577, "epoch": 1942} {"train_loss": -6.252571105957031, "global_step": 81578, "epoch": 1942} {"train_loss": -6.1768951416015625, "global_step": 81579, "epoch": 1942} {"train_loss": -6.22177791595459, "global_step": 81580, "epoch": 1942} {"train_loss": -6.218597412109375, "global_step": 81581, "epoch": 1942} {"train_loss": -6.195338726043701, "global_step": 81582, "epoch": 1942} {"train_loss": -6.217099666595459, "global_step": 81583, "epoch": 1942} {"train_loss": -6.220660209655762, "global_step": 81584, "epoch": 1942} {"train_loss": -6.097560882568359, "global_step": 81585, "epoch": 1942} {"train_loss": -6.142799377441406, "global_step": 81586, "epoch": 1942} {"train_loss": -6.28245210647583, "global_step": 81587, "epoch": 1942} {"train_loss": -6.105489730834961, "global_step": 81588, "epoch": 1942} {"train_loss": -6.211569786071777, "global_step": 81589, "epoch": 1942} {"train_loss": -6.12460994720459, "global_step": 81590, "epoch": 1942} {"train_loss": -6.122249603271484, "global_step": 81591, "epoch": 1942} {"train_loss": -6.063352108001709, "global_step": 81592, "epoch": 1942} {"train_loss": -6.100475788116455, "global_step": 81593, "epoch": 1942} {"train_loss": -6.182281017303467, "global_step": 81594, "epoch": 1942} {"train_loss": -6.0236663818359375, "global_step": 81595, "epoch": 1942} {"train_loss": -6.126560211181641, "global_step": 81596, "epoch": 1942} {"train_loss": -6.038013935089111, "global_step": 81597, "epoch": 1942} {"train_loss": -5.9322710037231445, "global_step": 81598, "epoch": 1942} {"train_loss": -6.131804466247559, "global_step": 81599, "epoch": 1942} {"train_loss": -6.07084846496582, "global_step": 81600, "epoch": 1942} {"train_loss": -6.031077861785889, "global_step": 81601, "epoch": 1942} {"train_loss": -6.033844470977783, "global_step": 81602, "epoch": 1942} {"train_loss": -6.161556243896484, "global_step": 81603, "epoch": 1942} {"train_loss": -6.071942329406738, "global_step": 81604, "epoch": 1942} {"train_loss": -6.128408295767648, "global_step": 81605, "epoch": 1942, "val_loss": 67640.21875} {"train_loss": -6.111752510070801, "global_step": 81606, "epoch": 1943} {"train_loss": -6.149579048156738, "global_step": 81607, "epoch": 1943} {"train_loss": -6.004249572753906, "global_step": 81608, "epoch": 1943} {"train_loss": -6.091487884521484, "global_step": 81609, "epoch": 1943} {"train_loss": -6.068618297576904, "global_step": 81610, "epoch": 1943} {"train_loss": -6.017734050750732, "global_step": 81611, "epoch": 1943} {"train_loss": -6.187644004821777, "global_step": 81612, "epoch": 1943} {"train_loss": -6.1285247802734375, "global_step": 81613, "epoch": 1943} {"train_loss": -6.028966903686523, "global_step": 81614, "epoch": 1943} {"train_loss": -5.999274253845215, "global_step": 81615, "epoch": 1943} {"train_loss": -6.102169036865234, "global_step": 81616, "epoch": 1943} {"train_loss": -6.1888532638549805, "global_step": 81617, "epoch": 1943} {"train_loss": -6.047338485717773, "global_step": 81618, "epoch": 1943} {"train_loss": -6.068135738372803, "global_step": 81619, "epoch": 1943} {"train_loss": -6.133755207061768, "global_step": 81620, "epoch": 1943} {"train_loss": -6.172112464904785, "global_step": 81621, "epoch": 1943} {"train_loss": -5.944356441497803, "global_step": 81622, "epoch": 1943} {"train_loss": -6.110256195068359, "global_step": 81623, "epoch": 1943} {"train_loss": -6.1187744140625, "global_step": 81624, "epoch": 1943} {"train_loss": -6.102442741394043, "global_step": 81625, "epoch": 1943} {"train_loss": -5.9723100662231445, "global_step": 81626, "epoch": 1943} {"train_loss": -6.096946716308594, "global_step": 81627, "epoch": 1943} {"train_loss": -6.000852584838867, "global_step": 81628, "epoch": 1943} {"train_loss": -6.203990936279297, "global_step": 81629, "epoch": 1943} {"train_loss": -6.1110005378723145, "global_step": 81630, "epoch": 1943} {"train_loss": -5.991355895996094, "global_step": 81631, "epoch": 1943} {"train_loss": -6.0926313400268555, "global_step": 81632, "epoch": 1943} {"train_loss": -6.046225547790527, "global_step": 81633, "epoch": 1943} {"train_loss": -6.203571796417236, "global_step": 81634, "epoch": 1943} {"train_loss": -6.212094306945801, "global_step": 81635, "epoch": 1943} {"train_loss": -6.1022138595581055, "global_step": 81636, "epoch": 1943} {"train_loss": -6.200104236602783, "global_step": 81637, "epoch": 1943} {"train_loss": -6.110156059265137, "global_step": 81638, "epoch": 1943} {"train_loss": -6.111144065856934, "global_step": 81639, "epoch": 1943} {"train_loss": -6.085204124450684, "global_step": 81640, "epoch": 1943} {"train_loss": -6.114161968231201, "global_step": 81641, "epoch": 1943} {"train_loss": -6.240171909332275, "global_step": 81642, "epoch": 1943} {"train_loss": -6.127466201782227, "global_step": 81643, "epoch": 1943} {"train_loss": -6.18887996673584, "global_step": 81644, "epoch": 1943} {"train_loss": -6.056219100952148, "global_step": 81645, "epoch": 1943} {"train_loss": -6.084765434265137, "global_step": 81646, "epoch": 1943} {"train_loss": -6.102320557548886, "global_step": 81647, "epoch": 1943, "val_loss": 67943.9609375} {"train_loss": -6.237337589263916, "global_step": 81648, "epoch": 1944} {"train_loss": -6.190114974975586, "global_step": 81649, "epoch": 1944} {"train_loss": -6.204094886779785, "global_step": 81650, "epoch": 1944} {"train_loss": -6.054816246032715, "global_step": 81651, "epoch": 1944} {"train_loss": -6.173836708068848, "global_step": 81652, "epoch": 1944} {"train_loss": -6.163766860961914, "global_step": 81653, "epoch": 1944} {"train_loss": -6.119480133056641, "global_step": 81654, "epoch": 1944} {"train_loss": -6.127320289611816, "global_step": 81655, "epoch": 1944} {"train_loss": -6.222344398498535, "global_step": 81656, "epoch": 1944} {"train_loss": -6.261402606964111, "global_step": 81657, "epoch": 1944} {"train_loss": -6.166821479797363, "global_step": 81658, "epoch": 1944} {"train_loss": -6.116458892822266, "global_step": 81659, "epoch": 1944} {"train_loss": -6.199092388153076, "global_step": 81660, "epoch": 1944} {"train_loss": -6.179002285003662, "global_step": 81661, "epoch": 1944} {"train_loss": -6.203737258911133, "global_step": 81662, "epoch": 1944} {"train_loss": -6.192684173583984, "global_step": 81663, "epoch": 1944} {"train_loss": -6.111244201660156, "global_step": 81664, "epoch": 1944} {"train_loss": -6.153988361358643, "global_step": 81665, "epoch": 1944} {"train_loss": -6.068275451660156, "global_step": 81666, "epoch": 1944} {"train_loss": -5.943031311035156, "global_step": 81667, "epoch": 1944} {"train_loss": -6.121392250061035, "global_step": 81668, "epoch": 1944} {"train_loss": -5.985905647277832, "global_step": 81669, "epoch": 1944} {"train_loss": -6.257389068603516, "global_step": 81670, "epoch": 1944} {"train_loss": -6.09202766418457, "global_step": 81671, "epoch": 1944} {"train_loss": -5.976858139038086, "global_step": 81672, "epoch": 1944} {"train_loss": -6.1541829109191895, "global_step": 81673, "epoch": 1944} {"train_loss": -6.00197696685791, "global_step": 81674, "epoch": 1944} {"train_loss": -6.20958137512207, "global_step": 81675, "epoch": 1944} {"train_loss": -5.963071823120117, "global_step": 81676, "epoch": 1944} {"train_loss": -6.072243690490723, "global_step": 81677, "epoch": 1944} {"train_loss": -5.998801231384277, "global_step": 81678, "epoch": 1944} {"train_loss": -5.979371070861816, "global_step": 81679, "epoch": 1944} {"train_loss": -6.031966209411621, "global_step": 81680, "epoch": 1944} {"train_loss": -5.96738338470459, "global_step": 81681, "epoch": 1944} {"train_loss": -6.17526388168335, "global_step": 81682, "epoch": 1944} {"train_loss": -6.1002092361450195, "global_step": 81683, "epoch": 1944} {"train_loss": -6.073532581329346, "global_step": 81684, "epoch": 1944} {"train_loss": -6.078977584838867, "global_step": 81685, "epoch": 1944} {"train_loss": -6.174715518951416, "global_step": 81686, "epoch": 1944} {"train_loss": -6.295536041259766, "global_step": 81687, "epoch": 1944} {"train_loss": -6.035910129547119, "global_step": 81688, "epoch": 1944} {"train_loss": -6.119928893588838, "global_step": 81689, "epoch": 1944, "val_loss": 67822.9375} {"train_loss": -6.263938903808594, "global_step": 81690, "epoch": 1945} {"train_loss": -6.225405693054199, "global_step": 81691, "epoch": 1945} {"train_loss": -5.95375919342041, "global_step": 81692, "epoch": 1945} {"train_loss": -6.277266502380371, "global_step": 81693, "epoch": 1945} {"train_loss": -6.12269401550293, "global_step": 81694, "epoch": 1945} {"train_loss": -6.176999568939209, "global_step": 81695, "epoch": 1945} {"train_loss": -5.963035583496094, "global_step": 81696, "epoch": 1945} {"train_loss": -6.168483734130859, "global_step": 81697, "epoch": 1945} {"train_loss": -6.147830009460449, "global_step": 81698, "epoch": 1945} {"train_loss": -6.188782215118408, "global_step": 81699, "epoch": 1945} {"train_loss": -6.159332275390625, "global_step": 81700, "epoch": 1945} {"train_loss": -6.2332234382629395, "global_step": 81701, "epoch": 1945} {"train_loss": -6.18095588684082, "global_step": 81702, "epoch": 1945} {"train_loss": -6.22825813293457, "global_step": 81703, "epoch": 1945} {"train_loss": -6.136599540710449, "global_step": 81704, "epoch": 1945} {"train_loss": -5.958682060241699, "global_step": 81705, "epoch": 1945} {"train_loss": -6.19003963470459, "global_step": 81706, "epoch": 1945} {"train_loss": -6.1235880851745605, "global_step": 81707, "epoch": 1945} {"train_loss": -6.117643356323242, "global_step": 81708, "epoch": 1945} {"train_loss": -6.169186592102051, "global_step": 81709, "epoch": 1945} {"train_loss": -6.23569393157959, "global_step": 81710, "epoch": 1945} {"train_loss": -6.1345319747924805, "global_step": 81711, "epoch": 1945} {"train_loss": -6.221710205078125, "global_step": 81712, "epoch": 1945} {"train_loss": -6.184840202331543, "global_step": 81713, "epoch": 1945} {"train_loss": -6.150452613830566, "global_step": 81714, "epoch": 1945} {"train_loss": -6.206650257110596, "global_step": 81715, "epoch": 1945} {"train_loss": -6.173227310180664, "global_step": 81716, "epoch": 1945} {"train_loss": -6.149689197540283, "global_step": 81717, "epoch": 1945} {"train_loss": -6.173442363739014, "global_step": 81718, "epoch": 1945} {"train_loss": -6.077383518218994, "global_step": 81719, "epoch": 1945} {"train_loss": -6.235343933105469, "global_step": 81720, "epoch": 1945} {"train_loss": -6.224291801452637, "global_step": 81721, "epoch": 1945} {"train_loss": -6.151319980621338, "global_step": 81722, "epoch": 1945} {"train_loss": -6.121519088745117, "global_step": 81723, "epoch": 1945} {"train_loss": -6.218601226806641, "global_step": 81724, "epoch": 1945} {"train_loss": -6.069053649902344, "global_step": 81725, "epoch": 1945} {"train_loss": -6.3135271072387695, "global_step": 81726, "epoch": 1945} {"train_loss": -6.106503009796143, "global_step": 81727, "epoch": 1945} {"train_loss": -6.181262016296387, "global_step": 81728, "epoch": 1945} {"train_loss": -6.103180408477783, "global_step": 81729, "epoch": 1945} {"train_loss": -6.243189811706543, "global_step": 81730, "epoch": 1945} {"train_loss": -6.1590469678243, "global_step": 81731, "epoch": 1945, "val_loss": 67669.7109375} {"train_loss": -6.098149299621582, "global_step": 81732, "epoch": 1946} {"train_loss": -6.163688659667969, "global_step": 81733, "epoch": 1946} {"train_loss": -6.059816360473633, "global_step": 81734, "epoch": 1946} {"train_loss": -6.134270668029785, "global_step": 81735, "epoch": 1946} {"train_loss": -6.1414008140563965, "global_step": 81736, "epoch": 1946} {"train_loss": -6.060694694519043, "global_step": 81737, "epoch": 1946} {"train_loss": -6.197603225708008, "global_step": 81738, "epoch": 1946} {"train_loss": -6.264570713043213, "global_step": 81739, "epoch": 1946} {"train_loss": -6.150031089782715, "global_step": 81740, "epoch": 1946} {"train_loss": -6.0408220291137695, "global_step": 81741, "epoch": 1946} {"train_loss": -6.176867961883545, "global_step": 81742, "epoch": 1946} {"train_loss": -6.207613945007324, "global_step": 81743, "epoch": 1946} {"train_loss": -6.1536359786987305, "global_step": 81744, "epoch": 1946} {"train_loss": -6.15775203704834, "global_step": 81745, "epoch": 1946} {"train_loss": -6.25860595703125, "global_step": 81746, "epoch": 1946} {"train_loss": -6.2044854164123535, "global_step": 81747, "epoch": 1946} {"train_loss": -6.088294982910156, "global_step": 81748, "epoch": 1946} {"train_loss": -6.098916053771973, "global_step": 81749, "epoch": 1946} {"train_loss": -6.198008060455322, "global_step": 81750, "epoch": 1946} {"train_loss": -6.119226932525635, "global_step": 81751, "epoch": 1946} {"train_loss": -6.2542805671691895, "global_step": 81752, "epoch": 1946} {"train_loss": -6.129162311553955, "global_step": 81753, "epoch": 1946} {"train_loss": -6.149951934814453, "global_step": 81754, "epoch": 1946} {"train_loss": -6.232775688171387, "global_step": 81755, "epoch": 1946} {"train_loss": -6.117180824279785, "global_step": 81756, "epoch": 1946} {"train_loss": -6.168585300445557, "global_step": 81757, "epoch": 1946} {"train_loss": -6.147650718688965, "global_step": 81758, "epoch": 1946} {"train_loss": -6.2277703285217285, "global_step": 81759, "epoch": 1946} {"train_loss": -6.26609992980957, "global_step": 81760, "epoch": 1946} {"train_loss": -6.18865966796875, "global_step": 81761, "epoch": 1946} {"train_loss": -6.063135623931885, "global_step": 81762, "epoch": 1946} {"train_loss": -6.107079982757568, "global_step": 81763, "epoch": 1946} {"train_loss": -6.169407844543457, "global_step": 81764, "epoch": 1946} {"train_loss": -6.100009918212891, "global_step": 81765, "epoch": 1946} {"train_loss": -6.106014728546143, "global_step": 81766, "epoch": 1946} {"train_loss": -6.166573524475098, "global_step": 81767, "epoch": 1946} {"train_loss": -6.134496212005615, "global_step": 81768, "epoch": 1946} {"train_loss": -6.100849628448486, "global_step": 81769, "epoch": 1946} {"train_loss": -6.179648399353027, "global_step": 81770, "epoch": 1946} {"train_loss": -6.135334491729736, "global_step": 81771, "epoch": 1946} {"train_loss": -6.219667911529541, "global_step": 81772, "epoch": 1946} {"train_loss": -6.154012101037162, "global_step": 81773, "epoch": 1946, "val_loss": 67819.703125} {"train_loss": -6.2394280433654785, "global_step": 81774, "epoch": 1947} {"train_loss": -6.161582946777344, "global_step": 81775, "epoch": 1947} {"train_loss": -6.0928120613098145, "global_step": 81776, "epoch": 1947} {"train_loss": -6.134749412536621, "global_step": 81777, "epoch": 1947} {"train_loss": -6.297646522521973, "global_step": 81778, "epoch": 1947} {"train_loss": -6.107614040374756, "global_step": 81779, "epoch": 1947} {"train_loss": -6.123771667480469, "global_step": 81780, "epoch": 1947} {"train_loss": -6.128791809082031, "global_step": 81781, "epoch": 1947} {"train_loss": -6.084973335266113, "global_step": 81782, "epoch": 1947} {"train_loss": -6.222447395324707, "global_step": 81783, "epoch": 1947} {"train_loss": -6.241095542907715, "global_step": 81784, "epoch": 1947} {"train_loss": -6.16250467300415, "global_step": 81785, "epoch": 1947} {"train_loss": -6.198554039001465, "global_step": 81786, "epoch": 1947} {"train_loss": -6.279358863830566, "global_step": 81787, "epoch": 1947} {"train_loss": -6.18076229095459, "global_step": 81788, "epoch": 1947} {"train_loss": -6.16030216217041, "global_step": 81789, "epoch": 1947} {"train_loss": -6.206274032592773, "global_step": 81790, "epoch": 1947} {"train_loss": -6.092388153076172, "global_step": 81791, "epoch": 1947} {"train_loss": -6.171726226806641, "global_step": 81792, "epoch": 1947} {"train_loss": -6.1888275146484375, "global_step": 81793, "epoch": 1947} {"train_loss": -6.091524124145508, "global_step": 81794, "epoch": 1947} {"train_loss": -6.132333755493164, "global_step": 81795, "epoch": 1947} {"train_loss": -6.190942764282227, "global_step": 81796, "epoch": 1947} {"train_loss": -6.136757850646973, "global_step": 81797, "epoch": 1947} {"train_loss": -6.2910380363464355, "global_step": 81798, "epoch": 1947} {"train_loss": -6.117263317108154, "global_step": 81799, "epoch": 1947} {"train_loss": -6.049041748046875, "global_step": 81800, "epoch": 1947} {"train_loss": -6.235599517822266, "global_step": 81801, "epoch": 1947} {"train_loss": -6.182487487792969, "global_step": 81802, "epoch": 1947} {"train_loss": -6.101459503173828, "global_step": 81803, "epoch": 1947} {"train_loss": -6.171451091766357, "global_step": 81804, "epoch": 1947} {"train_loss": -6.268280506134033, "global_step": 81805, "epoch": 1947} {"train_loss": -6.168687343597412, "global_step": 81806, "epoch": 1947} {"train_loss": -6.248861312866211, "global_step": 81807, "epoch": 1947} {"train_loss": -6.225438117980957, "global_step": 81808, "epoch": 1947} {"train_loss": -6.073244094848633, "global_step": 81809, "epoch": 1947} {"train_loss": -6.103635787963867, "global_step": 81810, "epoch": 1947} {"train_loss": -6.32958984375, "global_step": 81811, "epoch": 1947} {"train_loss": -6.294654846191406, "global_step": 81812, "epoch": 1947} {"train_loss": -6.1535749435424805, "global_step": 81813, "epoch": 1947} {"train_loss": -6.153313636779785, "global_step": 81814, "epoch": 1947} {"train_loss": -6.1752939110710505, "global_step": 81815, "epoch": 1947, "val_loss": 67597.28125} {"train_loss": -6.293536186218262, "global_step": 81816, "epoch": 1948} {"train_loss": -6.0956711769104, "global_step": 81817, "epoch": 1948} {"train_loss": -6.189934730529785, "global_step": 81818, "epoch": 1948} {"train_loss": -6.200199127197266, "global_step": 81819, "epoch": 1948} {"train_loss": -6.164202690124512, "global_step": 81820, "epoch": 1948} {"train_loss": -6.202068328857422, "global_step": 81821, "epoch": 1948} {"train_loss": -6.209267616271973, "global_step": 81822, "epoch": 1948} {"train_loss": -6.101812362670898, "global_step": 81823, "epoch": 1948} {"train_loss": -6.053487777709961, "global_step": 81824, "epoch": 1948} {"train_loss": -6.139616966247559, "global_step": 81825, "epoch": 1948} {"train_loss": -6.229820251464844, "global_step": 81826, "epoch": 1948} {"train_loss": -6.138511657714844, "global_step": 81827, "epoch": 1948} {"train_loss": -6.172928333282471, "global_step": 81828, "epoch": 1948} {"train_loss": -6.2096099853515625, "global_step": 81829, "epoch": 1948} {"train_loss": -6.228782653808594, "global_step": 81830, "epoch": 1948} {"train_loss": -6.1559553146362305, "global_step": 81831, "epoch": 1948} {"train_loss": -6.174426078796387, "global_step": 81832, "epoch": 1948} {"train_loss": -6.231719970703125, "global_step": 81833, "epoch": 1948} {"train_loss": -6.086147308349609, "global_step": 81834, "epoch": 1948} {"train_loss": -6.047889709472656, "global_step": 81835, "epoch": 1948} {"train_loss": -6.294372081756592, "global_step": 81836, "epoch": 1948} {"train_loss": -6.209614276885986, "global_step": 81837, "epoch": 1948} {"train_loss": -6.06056022644043, "global_step": 81838, "epoch": 1948} {"train_loss": -6.144451141357422, "global_step": 81839, "epoch": 1948} {"train_loss": -6.145723342895508, "global_step": 81840, "epoch": 1948} {"train_loss": -6.083771705627441, "global_step": 81841, "epoch": 1948} {"train_loss": -6.171734809875488, "global_step": 81842, "epoch": 1948} {"train_loss": -6.172142028808594, "global_step": 81843, "epoch": 1948} {"train_loss": -6.176179885864258, "global_step": 81844, "epoch": 1948} {"train_loss": -6.191509246826172, "global_step": 81845, "epoch": 1948} {"train_loss": -5.9861297607421875, "global_step": 81846, "epoch": 1948} {"train_loss": -6.060579299926758, "global_step": 81847, "epoch": 1948} {"train_loss": -5.932913780212402, "global_step": 81848, "epoch": 1948} {"train_loss": -6.175785064697266, "global_step": 81849, "epoch": 1948} {"train_loss": -6.1118950843811035, "global_step": 81850, "epoch": 1948} {"train_loss": -6.071507453918457, "global_step": 81851, "epoch": 1948} {"train_loss": -6.170555114746094, "global_step": 81852, "epoch": 1948} {"train_loss": -6.0383734703063965, "global_step": 81853, "epoch": 1948} {"train_loss": -6.157968997955322, "global_step": 81854, "epoch": 1948} {"train_loss": -6.235880374908447, "global_step": 81855, "epoch": 1948} {"train_loss": -6.100225448608398, "global_step": 81856, "epoch": 1948} {"train_loss": -6.146767604918707, "global_step": 81857, "epoch": 1948, "val_loss": 67610.8125} {"train_loss": -6.087148189544678, "global_step": 81858, "epoch": 1949} {"train_loss": -5.970694541931152, "global_step": 81859, "epoch": 1949} {"train_loss": -6.036442756652832, "global_step": 81860, "epoch": 1949} {"train_loss": -6.0109710693359375, "global_step": 81861, "epoch": 1949} {"train_loss": -6.162814140319824, "global_step": 81862, "epoch": 1949} {"train_loss": -6.0158796310424805, "global_step": 81863, "epoch": 1949} {"train_loss": -6.062016487121582, "global_step": 81864, "epoch": 1949} {"train_loss": -6.127540588378906, "global_step": 81865, "epoch": 1949} {"train_loss": -6.089728355407715, "global_step": 81866, "epoch": 1949} {"train_loss": -6.245535850524902, "global_step": 81867, "epoch": 1949} {"train_loss": -6.041927337646484, "global_step": 81868, "epoch": 1949} {"train_loss": -6.0963029861450195, "global_step": 81869, "epoch": 1949} {"train_loss": -6.201957702636719, "global_step": 81870, "epoch": 1949} {"train_loss": -6.057238578796387, "global_step": 81871, "epoch": 1949} {"train_loss": -6.082221984863281, "global_step": 81872, "epoch": 1949} {"train_loss": -6.048752784729004, "global_step": 81873, "epoch": 1949} {"train_loss": -6.127413749694824, "global_step": 81874, "epoch": 1949} {"train_loss": -6.100618362426758, "global_step": 81875, "epoch": 1949} {"train_loss": -5.966501235961914, "global_step": 81876, "epoch": 1949} {"train_loss": -6.102274417877197, "global_step": 81877, "epoch": 1949} {"train_loss": -6.173170566558838, "global_step": 81878, "epoch": 1949} {"train_loss": -6.08659553527832, "global_step": 81879, "epoch": 1949} {"train_loss": -6.145417213439941, "global_step": 81880, "epoch": 1949} {"train_loss": -6.147429466247559, "global_step": 81881, "epoch": 1949} {"train_loss": -6.099349498748779, "global_step": 81882, "epoch": 1949} {"train_loss": -6.311301231384277, "global_step": 81883, "epoch": 1949} {"train_loss": -6.200101375579834, "global_step": 81884, "epoch": 1949} {"train_loss": -6.102017879486084, "global_step": 81885, "epoch": 1949} {"train_loss": -6.0597944259643555, "global_step": 81886, "epoch": 1949} {"train_loss": -6.228606224060059, "global_step": 81887, "epoch": 1949} {"train_loss": -6.215280532836914, "global_step": 81888, "epoch": 1949} {"train_loss": -6.20289421081543, "global_step": 81889, "epoch": 1949} {"train_loss": -6.229784965515137, "global_step": 81890, "epoch": 1949} {"train_loss": -6.271679878234863, "global_step": 81891, "epoch": 1949} {"train_loss": -6.289112567901611, "global_step": 81892, "epoch": 1949} {"train_loss": -6.186275005340576, "global_step": 81893, "epoch": 1949} {"train_loss": -6.120837688446045, "global_step": 81894, "epoch": 1949} {"train_loss": -6.153129577636719, "global_step": 81895, "epoch": 1949} {"train_loss": -6.200099945068359, "global_step": 81896, "epoch": 1949} {"train_loss": -6.299753189086914, "global_step": 81897, "epoch": 1949} {"train_loss": -6.222362041473389, "global_step": 81898, "epoch": 1949} {"train_loss": -6.136006809416271, "global_step": 81899, "epoch": 1949, "val_loss": 67753.359375} {"train_loss": -6.319841384887695, "global_step": 81900, "epoch": 1950} {"train_loss": -6.078334808349609, "global_step": 81901, "epoch": 1950} {"train_loss": -6.142553329467773, "global_step": 81902, "epoch": 1950} {"train_loss": -6.191739082336426, "global_step": 81903, "epoch": 1950} {"train_loss": -6.108617782592773, "global_step": 81904, "epoch": 1950} {"train_loss": -6.136891841888428, "global_step": 81905, "epoch": 1950} {"train_loss": -6.040249347686768, "global_step": 81906, "epoch": 1950} {"train_loss": -6.109716415405273, "global_step": 81907, "epoch": 1950} {"train_loss": -6.269717216491699, "global_step": 81908, "epoch": 1950} {"train_loss": -6.020556926727295, "global_step": 81909, "epoch": 1950} {"train_loss": -6.054751873016357, "global_step": 81910, "epoch": 1950} {"train_loss": -6.087748050689697, "global_step": 81911, "epoch": 1950} {"train_loss": -6.050474166870117, "global_step": 81912, "epoch": 1950} {"train_loss": -6.098071098327637, "global_step": 81913, "epoch": 1950} {"train_loss": -6.149746894836426, "global_step": 81914, "epoch": 1950} {"train_loss": -6.051740646362305, "global_step": 81915, "epoch": 1950} {"train_loss": -6.111507415771484, "global_step": 81916, "epoch": 1950} {"train_loss": -6.118363857269287, "global_step": 81917, "epoch": 1950} {"train_loss": -6.131581783294678, "global_step": 81918, "epoch": 1950} {"train_loss": -6.104386329650879, "global_step": 81919, "epoch": 1950} {"train_loss": -6.239089012145996, "global_step": 81920, "epoch": 1950} {"train_loss": -6.071906089782715, "global_step": 81921, "epoch": 1950} {"train_loss": -6.207746982574463, "global_step": 81922, "epoch": 1950} {"train_loss": -6.203188896179199, "global_step": 81923, "epoch": 1950} {"train_loss": -6.127788543701172, "global_step": 81924, "epoch": 1950} {"train_loss": -6.0327229499816895, "global_step": 81925, "epoch": 1950} {"train_loss": -6.060947895050049, "global_step": 81926, "epoch": 1950} {"train_loss": -5.981023788452148, "global_step": 81927, "epoch": 1950} {"train_loss": -6.157806396484375, "global_step": 81928, "epoch": 1950} {"train_loss": -6.115047931671143, "global_step": 81929, "epoch": 1950} {"train_loss": -6.098679065704346, "global_step": 81930, "epoch": 1950} {"train_loss": -6.090386867523193, "global_step": 81931, "epoch": 1950} {"train_loss": -6.150856018066406, "global_step": 81932, "epoch": 1950} {"train_loss": -6.171587944030762, "global_step": 81933, "epoch": 1950} {"train_loss": -6.037167549133301, "global_step": 81934, "epoch": 1950} {"train_loss": -6.1755828857421875, "global_step": 81935, "epoch": 1950} {"train_loss": -6.1760640144348145, "global_step": 81936, "epoch": 1950} {"train_loss": -6.077339172363281, "global_step": 81937, "epoch": 1950} {"train_loss": -6.062600612640381, "global_step": 81938, "epoch": 1950} {"train_loss": -6.228708267211914, "global_step": 81939, "epoch": 1950} {"train_loss": -6.169451713562012, "global_step": 81940, "epoch": 1950} {"train_loss": -6.1234642551058815, "global_step": 81941, "epoch": 1950, "train/sim_max_reward_0": 0.2718117721361665, "train/sim_max_reward_1": 0.20889682018154707, "train/sim_max_reward_2": 0.2883707661348452, "train/sim_max_reward_3": 0.1410712985534655, "train/sim_max_reward_4": 0.838847197348271, "train/sim_max_reward_5": 0.9585967521159394, "test/sim_max_reward_4400000": 0.2383596092586402, "test/sim_max_reward_4400001": 0.20683436493339555, "test/sim_max_reward_4400002": 0.8721734518307565, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.8781754063915564, "test/sim_max_reward_4400006": 0.3625585079281217, "test/sim_max_reward_4400007": 0.39689305150837856, "test/sim_max_reward_4400008": 0.3092082585799287, "test/sim_max_reward_4400009": 0.549588349538018, "test/sim_max_reward_4400010": 0.9264597646059182, "test/sim_max_reward_4400011": 0.24842847713809682, "test/sim_max_reward_4400012": 0.9398626209711513, "test/sim_max_reward_4400013": 0.588405126680636, "test/sim_max_reward_4400014": 0.3327131313914296, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.22609125081625106, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.9662986761535534, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.998872942946593, "test/sim_max_reward_4400023": 0.32738568599312895, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.22418647503563668, "test/sim_max_reward_4400026": 0.9931656313366253, "test/sim_max_reward_4400027": 0.0006091345801796644, "test/sim_max_reward_4400028": 0.426744420262411, "test/sim_max_reward_4400029": 0.2299203160444116, "test/sim_max_reward_4400030": 0.4081061716720974, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.22874725509999308, "test/sim_max_reward_4400034": 0.7454231355449883, "test/sim_max_reward_4400035": 0.4446829174693708, "test/sim_max_reward_4400036": 0.5021215975245674, "test/sim_max_reward_4400037": 0.935846425988238, "test/sim_max_reward_4400038": 0.1774602570205386, "test/sim_max_reward_4400039": 0.8628884812588423, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6796362990252692, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.8711172861532674, "test/sim_max_reward_4400044": 0.9216566669514771, "test/sim_max_reward_4400045": 0.13792404511090284, "test/sim_max_reward_4400046": 0.9129099067473535, "test/sim_max_reward_4400047": 0.8772964144518377, "test/sim_max_reward_4400048": 0.6492842832703358, "test/sim_max_reward_4400049": 0.7497151560185287, "train/mean_score": 0.4512657677450391, "test/mean_score": 0.4583857486085593, "val_loss": 67627.53125} {"train_loss": -6.257590293884277, "global_step": 81942, "epoch": 1951} {"train_loss": -6.262328147888184, "global_step": 81943, "epoch": 1951} {"train_loss": -6.21083927154541, "global_step": 81944, "epoch": 1951} {"train_loss": -6.2607526779174805, "global_step": 81945, "epoch": 1951} {"train_loss": -6.222067832946777, "global_step": 81946, "epoch": 1951} {"train_loss": -6.285170078277588, "global_step": 81947, "epoch": 1951} {"train_loss": -6.135619163513184, "global_step": 81948, "epoch": 1951} {"train_loss": -6.076300621032715, "global_step": 81949, "epoch": 1951} {"train_loss": -6.16843318939209, "global_step": 81950, "epoch": 1951} {"train_loss": -6.136316299438477, "global_step": 81951, "epoch": 1951} {"train_loss": -6.168558597564697, "global_step": 81952, "epoch": 1951} {"train_loss": -6.210811614990234, "global_step": 81953, "epoch": 1951} {"train_loss": -6.105167388916016, "global_step": 81954, "epoch": 1951} {"train_loss": -6.17984676361084, "global_step": 81955, "epoch": 1951} {"train_loss": -6.153663158416748, "global_step": 81956, "epoch": 1951} {"train_loss": -6.1981000900268555, "global_step": 81957, "epoch": 1951} {"train_loss": -6.116627216339111, "global_step": 81958, "epoch": 1951} {"train_loss": -6.14508056640625, "global_step": 81959, "epoch": 1951} {"train_loss": -6.099033355712891, "global_step": 81960, "epoch": 1951} {"train_loss": -6.042242050170898, "global_step": 81961, "epoch": 1951} {"train_loss": -6.097684383392334, "global_step": 81962, "epoch": 1951} {"train_loss": -6.237839698791504, "global_step": 81963, "epoch": 1951} {"train_loss": -6.150894641876221, "global_step": 81964, "epoch": 1951} {"train_loss": -6.229351997375488, "global_step": 81965, "epoch": 1951} {"train_loss": -6.1231560707092285, "global_step": 81966, "epoch": 1951} {"train_loss": -6.141974925994873, "global_step": 81967, "epoch": 1951} {"train_loss": -6.116209983825684, "global_step": 81968, "epoch": 1951} {"train_loss": -6.220569610595703, "global_step": 81969, "epoch": 1951} {"train_loss": -6.223109722137451, "global_step": 81970, "epoch": 1951} {"train_loss": -6.248540878295898, "global_step": 81971, "epoch": 1951} {"train_loss": -6.133455276489258, "global_step": 81972, "epoch": 1951} {"train_loss": -6.238884449005127, "global_step": 81973, "epoch": 1951} {"train_loss": -6.034330368041992, "global_step": 81974, "epoch": 1951} {"train_loss": -6.23897647857666, "global_step": 81975, "epoch": 1951} {"train_loss": -6.216024875640869, "global_step": 81976, "epoch": 1951} {"train_loss": -6.147608757019043, "global_step": 81977, "epoch": 1951} {"train_loss": -6.142256736755371, "global_step": 81978, "epoch": 1951} {"train_loss": -6.078788757324219, "global_step": 81979, "epoch": 1951} {"train_loss": -6.158217430114746, "global_step": 81980, "epoch": 1951} {"train_loss": -6.153088569641113, "global_step": 81981, "epoch": 1951} {"train_loss": -6.039363384246826, "global_step": 81982, "epoch": 1951} {"train_loss": -6.166172640664237, "global_step": 81983, "epoch": 1951, "val_loss": 67606.265625} {"train_loss": -6.147455215454102, "global_step": 81984, "epoch": 1952} {"train_loss": -6.0413818359375, "global_step": 81985, "epoch": 1952} {"train_loss": -6.222135543823242, "global_step": 81986, "epoch": 1952} {"train_loss": -6.135409355163574, "global_step": 81987, "epoch": 1952} {"train_loss": -6.175562858581543, "global_step": 81988, "epoch": 1952} {"train_loss": -6.219332695007324, "global_step": 81989, "epoch": 1952} {"train_loss": -6.159528732299805, "global_step": 81990, "epoch": 1952} {"train_loss": -6.170354843139648, "global_step": 81991, "epoch": 1952} {"train_loss": -6.306318283081055, "global_step": 81992, "epoch": 1952} {"train_loss": -6.105710029602051, "global_step": 81993, "epoch": 1952} {"train_loss": -6.152923107147217, "global_step": 81994, "epoch": 1952} {"train_loss": -6.247254371643066, "global_step": 81995, "epoch": 1952} {"train_loss": -6.055666923522949, "global_step": 81996, "epoch": 1952} {"train_loss": -6.157863616943359, "global_step": 81997, "epoch": 1952} {"train_loss": -6.176914215087891, "global_step": 81998, "epoch": 1952} {"train_loss": -6.033891677856445, "global_step": 81999, "epoch": 1952} {"train_loss": -6.013454437255859, "global_step": 82000, "epoch": 1952} {"train_loss": -6.15196418762207, "global_step": 82001, "epoch": 1952} {"train_loss": -6.099023818969727, "global_step": 82002, "epoch": 1952} {"train_loss": -6.087845802307129, "global_step": 82003, "epoch": 1952} {"train_loss": -6.202338218688965, "global_step": 82004, "epoch": 1952} {"train_loss": -6.0459089279174805, "global_step": 82005, "epoch": 1952} {"train_loss": -6.155071258544922, "global_step": 82006, "epoch": 1952} {"train_loss": -6.217561721801758, "global_step": 82007, "epoch": 1952} {"train_loss": -6.056338310241699, "global_step": 82008, "epoch": 1952} {"train_loss": -6.104618549346924, "global_step": 82009, "epoch": 1952} {"train_loss": -6.080107688903809, "global_step": 82010, "epoch": 1952} {"train_loss": -5.9909443855285645, "global_step": 82011, "epoch": 1952} {"train_loss": -6.1611785888671875, "global_step": 82012, "epoch": 1952} {"train_loss": -6.149441719055176, "global_step": 82013, "epoch": 1952} {"train_loss": -5.952579975128174, "global_step": 82014, "epoch": 1952} {"train_loss": -6.154055595397949, "global_step": 82015, "epoch": 1952} {"train_loss": -6.163481712341309, "global_step": 82016, "epoch": 1952} {"train_loss": -6.003843307495117, "global_step": 82017, "epoch": 1952} {"train_loss": -6.00901985168457, "global_step": 82018, "epoch": 1952} {"train_loss": -6.181387901306152, "global_step": 82019, "epoch": 1952} {"train_loss": -6.065816402435303, "global_step": 82020, "epoch": 1952} {"train_loss": -6.109154224395752, "global_step": 82021, "epoch": 1952} {"train_loss": -6.106501579284668, "global_step": 82022, "epoch": 1952} {"train_loss": -6.040285587310791, "global_step": 82023, "epoch": 1952} {"train_loss": -6.068163871765137, "global_step": 82024, "epoch": 1952} {"train_loss": -6.119021358944121, "global_step": 82025, "epoch": 1952, "val_loss": 67816.2578125} {"train_loss": -6.23344612121582, "global_step": 82026, "epoch": 1953} {"train_loss": -5.8802714347839355, "global_step": 82027, "epoch": 1953} {"train_loss": -6.181148529052734, "global_step": 82028, "epoch": 1953} {"train_loss": -5.995257377624512, "global_step": 82029, "epoch": 1953} {"train_loss": -6.111088275909424, "global_step": 82030, "epoch": 1953} {"train_loss": -6.112676620483398, "global_step": 82031, "epoch": 1953} {"train_loss": -6.105378150939941, "global_step": 82032, "epoch": 1953} {"train_loss": -6.1490678787231445, "global_step": 82033, "epoch": 1953} {"train_loss": -6.224198341369629, "global_step": 82034, "epoch": 1953} {"train_loss": -6.147871971130371, "global_step": 82035, "epoch": 1953} {"train_loss": -6.024207592010498, "global_step": 82036, "epoch": 1953} {"train_loss": -6.205624580383301, "global_step": 82037, "epoch": 1953} {"train_loss": -6.064959526062012, "global_step": 82038, "epoch": 1953} {"train_loss": -6.002532958984375, "global_step": 82039, "epoch": 1953} {"train_loss": -6.045715808868408, "global_step": 82040, "epoch": 1953} {"train_loss": -6.150113105773926, "global_step": 82041, "epoch": 1953} {"train_loss": -6.212250709533691, "global_step": 82042, "epoch": 1953} {"train_loss": -6.007787227630615, "global_step": 82043, "epoch": 1953} {"train_loss": -6.2589006423950195, "global_step": 82044, "epoch": 1953} {"train_loss": -5.969845771789551, "global_step": 82045, "epoch": 1953} {"train_loss": -6.077933311462402, "global_step": 82046, "epoch": 1953} {"train_loss": -6.042519569396973, "global_step": 82047, "epoch": 1953} {"train_loss": -6.232423782348633, "global_step": 82048, "epoch": 1953} {"train_loss": -6.119251251220703, "global_step": 82049, "epoch": 1953} {"train_loss": -6.080829620361328, "global_step": 82050, "epoch": 1953} {"train_loss": -6.095844268798828, "global_step": 82051, "epoch": 1953} {"train_loss": -6.197141647338867, "global_step": 82052, "epoch": 1953} {"train_loss": -6.098822116851807, "global_step": 82053, "epoch": 1953} {"train_loss": -6.111555576324463, "global_step": 82054, "epoch": 1953} {"train_loss": -6.1336774826049805, "global_step": 82055, "epoch": 1953} {"train_loss": -6.1486101150512695, "global_step": 82056, "epoch": 1953} {"train_loss": -6.273077487945557, "global_step": 82057, "epoch": 1953} {"train_loss": -6.123607158660889, "global_step": 82058, "epoch": 1953} {"train_loss": -6.207642555236816, "global_step": 82059, "epoch": 1953} {"train_loss": -6.090939521789551, "global_step": 82060, "epoch": 1953} {"train_loss": -6.136201858520508, "global_step": 82061, "epoch": 1953} {"train_loss": -6.033138275146484, "global_step": 82062, "epoch": 1953} {"train_loss": -6.162838935852051, "global_step": 82063, "epoch": 1953} {"train_loss": -6.153267860412598, "global_step": 82064, "epoch": 1953} {"train_loss": -6.184647560119629, "global_step": 82065, "epoch": 1953} {"train_loss": -6.107186317443848, "global_step": 82066, "epoch": 1953} {"train_loss": -6.1192982878003805, "global_step": 82067, "epoch": 1953, "val_loss": 67754.9609375} {"train_loss": -6.153055191040039, "global_step": 82068, "epoch": 1954} {"train_loss": -6.070092678070068, "global_step": 82069, "epoch": 1954} {"train_loss": -6.226120948791504, "global_step": 82070, "epoch": 1954} {"train_loss": -6.171903133392334, "global_step": 82071, "epoch": 1954} {"train_loss": -6.201704502105713, "global_step": 82072, "epoch": 1954} {"train_loss": -6.093501567840576, "global_step": 82073, "epoch": 1954} {"train_loss": -6.213088035583496, "global_step": 82074, "epoch": 1954} {"train_loss": -6.024867057800293, "global_step": 82075, "epoch": 1954} {"train_loss": -6.109625816345215, "global_step": 82076, "epoch": 1954} {"train_loss": -6.115942001342773, "global_step": 82077, "epoch": 1954} {"train_loss": -6.178893089294434, "global_step": 82078, "epoch": 1954} {"train_loss": -6.086427211761475, "global_step": 82079, "epoch": 1954} {"train_loss": -6.15242862701416, "global_step": 82080, "epoch": 1954} {"train_loss": -6.148509979248047, "global_step": 82081, "epoch": 1954} {"train_loss": -6.114267349243164, "global_step": 82082, "epoch": 1954} {"train_loss": -6.179575443267822, "global_step": 82083, "epoch": 1954} {"train_loss": -6.129022121429443, "global_step": 82084, "epoch": 1954} {"train_loss": -6.135531902313232, "global_step": 82085, "epoch": 1954} {"train_loss": -6.111333847045898, "global_step": 82086, "epoch": 1954} {"train_loss": -6.167490005493164, "global_step": 82087, "epoch": 1954} {"train_loss": -6.126697540283203, "global_step": 82088, "epoch": 1954} {"train_loss": -6.099336624145508, "global_step": 82089, "epoch": 1954} {"train_loss": -6.17886209487915, "global_step": 82090, "epoch": 1954} {"train_loss": -6.247201919555664, "global_step": 82091, "epoch": 1954} {"train_loss": -6.179140090942383, "global_step": 82092, "epoch": 1954} {"train_loss": -6.09151554107666, "global_step": 82093, "epoch": 1954} {"train_loss": -6.105881214141846, "global_step": 82094, "epoch": 1954} {"train_loss": -6.177238941192627, "global_step": 82095, "epoch": 1954} {"train_loss": -6.28134298324585, "global_step": 82096, "epoch": 1954} {"train_loss": -6.084676742553711, "global_step": 82097, "epoch": 1954} {"train_loss": -6.146744728088379, "global_step": 82098, "epoch": 1954} {"train_loss": -6.097928047180176, "global_step": 82099, "epoch": 1954} {"train_loss": -6.09122371673584, "global_step": 82100, "epoch": 1954} {"train_loss": -6.195036888122559, "global_step": 82101, "epoch": 1954} {"train_loss": -6.1031718254089355, "global_step": 82102, "epoch": 1954} {"train_loss": -6.028308868408203, "global_step": 82103, "epoch": 1954} {"train_loss": -6.180402755737305, "global_step": 82104, "epoch": 1954} {"train_loss": -6.210293292999268, "global_step": 82105, "epoch": 1954} {"train_loss": -6.195425033569336, "global_step": 82106, "epoch": 1954} {"train_loss": -6.193844795227051, "global_step": 82107, "epoch": 1954} {"train_loss": -6.0962066650390625, "global_step": 82108, "epoch": 1954} {"train_loss": -6.146283944447835, "global_step": 82109, "epoch": 1954, "val_loss": 67724.8359375} {"train_loss": -6.096846103668213, "global_step": 82110, "epoch": 1955} {"train_loss": -6.030372619628906, "global_step": 82111, "epoch": 1955} {"train_loss": -6.2545013427734375, "global_step": 82112, "epoch": 1955} {"train_loss": -6.0992560386657715, "global_step": 82113, "epoch": 1955} {"train_loss": -6.1775126457214355, "global_step": 82114, "epoch": 1955} {"train_loss": -5.9956440925598145, "global_step": 82115, "epoch": 1955} {"train_loss": -6.130645751953125, "global_step": 82116, "epoch": 1955} {"train_loss": -6.155590534210205, "global_step": 82117, "epoch": 1955} {"train_loss": -6.175596237182617, "global_step": 82118, "epoch": 1955} {"train_loss": -6.147681713104248, "global_step": 82119, "epoch": 1955} {"train_loss": -6.122832298278809, "global_step": 82120, "epoch": 1955} {"train_loss": -6.157459259033203, "global_step": 82121, "epoch": 1955} {"train_loss": -6.128968715667725, "global_step": 82122, "epoch": 1955} {"train_loss": -6.044174671173096, "global_step": 82123, "epoch": 1955} {"train_loss": -6.223156929016113, "global_step": 82124, "epoch": 1955} {"train_loss": -6.145862102508545, "global_step": 82125, "epoch": 1955} {"train_loss": -6.120710849761963, "global_step": 82126, "epoch": 1955} {"train_loss": -6.1527910232543945, "global_step": 82127, "epoch": 1955} {"train_loss": -6.312274932861328, "global_step": 82128, "epoch": 1955} {"train_loss": -6.180782318115234, "global_step": 82129, "epoch": 1955} {"train_loss": -6.165737152099609, "global_step": 82130, "epoch": 1955} {"train_loss": -6.141257286071777, "global_step": 82131, "epoch": 1955} {"train_loss": -6.26894474029541, "global_step": 82132, "epoch": 1955} {"train_loss": -6.0569353103637695, "global_step": 82133, "epoch": 1955} {"train_loss": -6.039044380187988, "global_step": 82134, "epoch": 1955} {"train_loss": -6.081058502197266, "global_step": 82135, "epoch": 1955} {"train_loss": -5.992199897766113, "global_step": 82136, "epoch": 1955} {"train_loss": -6.1359429359436035, "global_step": 82137, "epoch": 1955} {"train_loss": -6.105575084686279, "global_step": 82138, "epoch": 1955} {"train_loss": -6.204078674316406, "global_step": 82139, "epoch": 1955} {"train_loss": -6.1349263191223145, "global_step": 82140, "epoch": 1955} {"train_loss": -6.110537052154541, "global_step": 82141, "epoch": 1955} {"train_loss": -6.133060455322266, "global_step": 82142, "epoch": 1955} {"train_loss": -6.168244361877441, "global_step": 82143, "epoch": 1955} {"train_loss": -6.01953125, "global_step": 82144, "epoch": 1955} {"train_loss": -6.3715009689331055, "global_step": 82145, "epoch": 1955} {"train_loss": -6.036515235900879, "global_step": 82146, "epoch": 1955} {"train_loss": -6.189899444580078, "global_step": 82147, "epoch": 1955} {"train_loss": -6.139965057373047, "global_step": 82148, "epoch": 1955} {"train_loss": -6.063229560852051, "global_step": 82149, "epoch": 1955} {"train_loss": -6.1641845703125, "global_step": 82150, "epoch": 1955} {"train_loss": -6.134316433043707, "global_step": 82151, "epoch": 1955, "val_loss": 67710.765625} {"train_loss": -6.200586795806885, "global_step": 82152, "epoch": 1956} {"train_loss": -5.960846424102783, "global_step": 82153, "epoch": 1956} {"train_loss": -6.258212089538574, "global_step": 82154, "epoch": 1956} {"train_loss": -6.205839157104492, "global_step": 82155, "epoch": 1956} {"train_loss": -6.150152206420898, "global_step": 82156, "epoch": 1956} {"train_loss": -6.149261951446533, "global_step": 82157, "epoch": 1956} {"train_loss": -6.028450965881348, "global_step": 82158, "epoch": 1956} {"train_loss": -6.0883331298828125, "global_step": 82159, "epoch": 1956} {"train_loss": -6.09261417388916, "global_step": 82160, "epoch": 1956} {"train_loss": -6.143511772155762, "global_step": 82161, "epoch": 1956} {"train_loss": -6.177950859069824, "global_step": 82162, "epoch": 1956} {"train_loss": -6.269651412963867, "global_step": 82163, "epoch": 1956} {"train_loss": -6.079006195068359, "global_step": 82164, "epoch": 1956} {"train_loss": -6.127815246582031, "global_step": 82165, "epoch": 1956} {"train_loss": -6.084402561187744, "global_step": 82166, "epoch": 1956} {"train_loss": -6.121273994445801, "global_step": 82167, "epoch": 1956} {"train_loss": -6.133626937866211, "global_step": 82168, "epoch": 1956} {"train_loss": -6.090371131896973, "global_step": 82169, "epoch": 1956} {"train_loss": -6.058473110198975, "global_step": 82170, "epoch": 1956} {"train_loss": -6.237344741821289, "global_step": 82171, "epoch": 1956} {"train_loss": -6.03585147857666, "global_step": 82172, "epoch": 1956} {"train_loss": -6.059633255004883, "global_step": 82173, "epoch": 1956} {"train_loss": -6.173557281494141, "global_step": 82174, "epoch": 1956} {"train_loss": -6.00930118560791, "global_step": 82175, "epoch": 1956} {"train_loss": -6.102268218994141, "global_step": 82176, "epoch": 1956} {"train_loss": -6.072181701660156, "global_step": 82177, "epoch": 1956} {"train_loss": -6.093228816986084, "global_step": 82178, "epoch": 1956} {"train_loss": -6.120089054107666, "global_step": 82179, "epoch": 1956} {"train_loss": -6.036212921142578, "global_step": 82180, "epoch": 1956} {"train_loss": -5.930591583251953, "global_step": 82181, "epoch": 1956} {"train_loss": -6.035714626312256, "global_step": 82182, "epoch": 1956} {"train_loss": -6.000002861022949, "global_step": 82183, "epoch": 1956} {"train_loss": -6.201676845550537, "global_step": 82184, "epoch": 1956} {"train_loss": -6.155323028564453, "global_step": 82185, "epoch": 1956} {"train_loss": -6.016327857971191, "global_step": 82186, "epoch": 1956} {"train_loss": -6.1003804206848145, "global_step": 82187, "epoch": 1956} {"train_loss": -6.066778182983398, "global_step": 82188, "epoch": 1956} {"train_loss": -6.123644828796387, "global_step": 82189, "epoch": 1956} {"train_loss": -6.164385795593262, "global_step": 82190, "epoch": 1956} {"train_loss": -6.115143775939941, "global_step": 82191, "epoch": 1956} {"train_loss": -6.191989421844482, "global_step": 82192, "epoch": 1956} {"train_loss": -6.107201632999239, "global_step": 82193, "epoch": 1956, "val_loss": 67809.359375} {"train_loss": -6.179644584655762, "global_step": 82194, "epoch": 1957} {"train_loss": -6.155601978302002, "global_step": 82195, "epoch": 1957} {"train_loss": -6.064267158508301, "global_step": 82196, "epoch": 1957} {"train_loss": -6.058345794677734, "global_step": 82197, "epoch": 1957} {"train_loss": -6.154670715332031, "global_step": 82198, "epoch": 1957} {"train_loss": -6.11196231842041, "global_step": 82199, "epoch": 1957} {"train_loss": -6.113485336303711, "global_step": 82200, "epoch": 1957} {"train_loss": -6.066269397735596, "global_step": 82201, "epoch": 1957} {"train_loss": -6.135235786437988, "global_step": 82202, "epoch": 1957} {"train_loss": -6.135712623596191, "global_step": 82203, "epoch": 1957} {"train_loss": -6.19302225112915, "global_step": 82204, "epoch": 1957} {"train_loss": -6.100141525268555, "global_step": 82205, "epoch": 1957} {"train_loss": -6.046202659606934, "global_step": 82206, "epoch": 1957} {"train_loss": -6.133266925811768, "global_step": 82207, "epoch": 1957} {"train_loss": -6.125289440155029, "global_step": 82208, "epoch": 1957} {"train_loss": -6.125021934509277, "global_step": 82209, "epoch": 1957} {"train_loss": -6.272477149963379, "global_step": 82210, "epoch": 1957} {"train_loss": -6.186344146728516, "global_step": 82211, "epoch": 1957} {"train_loss": -6.148272514343262, "global_step": 82212, "epoch": 1957} {"train_loss": -6.057898998260498, "global_step": 82213, "epoch": 1957} {"train_loss": -6.173854827880859, "global_step": 82214, "epoch": 1957} {"train_loss": -6.18815803527832, "global_step": 82215, "epoch": 1957} {"train_loss": -6.002140045166016, "global_step": 82216, "epoch": 1957} {"train_loss": -6.162320137023926, "global_step": 82217, "epoch": 1957} {"train_loss": -6.150784492492676, "global_step": 82218, "epoch": 1957} {"train_loss": -6.104681015014648, "global_step": 82219, "epoch": 1957} {"train_loss": -6.0565409660339355, "global_step": 82220, "epoch": 1957} {"train_loss": -6.175803184509277, "global_step": 82221, "epoch": 1957} {"train_loss": -6.122928142547607, "global_step": 82222, "epoch": 1957} {"train_loss": -6.089798927307129, "global_step": 82223, "epoch": 1957} {"train_loss": -6.1125617027282715, "global_step": 82224, "epoch": 1957} {"train_loss": -6.08160400390625, "global_step": 82225, "epoch": 1957} {"train_loss": -6.117266654968262, "global_step": 82226, "epoch": 1957} {"train_loss": -6.071849822998047, "global_step": 82227, "epoch": 1957} {"train_loss": -6.149348735809326, "global_step": 82228, "epoch": 1957} {"train_loss": -6.113737106323242, "global_step": 82229, "epoch": 1957} {"train_loss": -6.14141845703125, "global_step": 82230, "epoch": 1957} {"train_loss": -6.14646577835083, "global_step": 82231, "epoch": 1957} {"train_loss": -6.149289131164551, "global_step": 82232, "epoch": 1957} {"train_loss": -6.21235990524292, "global_step": 82233, "epoch": 1957} {"train_loss": -6.210817813873291, "global_step": 82234, "epoch": 1957} {"train_loss": -6.132030691419329, "global_step": 82235, "epoch": 1957, "val_loss": 67681.46875} {"train_loss": -6.2068400382995605, "global_step": 82236, "epoch": 1958} {"train_loss": -6.108340263366699, "global_step": 82237, "epoch": 1958} {"train_loss": -6.233600616455078, "global_step": 82238, "epoch": 1958} {"train_loss": -6.154399871826172, "global_step": 82239, "epoch": 1958} {"train_loss": -6.1530561447143555, "global_step": 82240, "epoch": 1958} {"train_loss": -6.230489253997803, "global_step": 82241, "epoch": 1958} {"train_loss": -6.2588043212890625, "global_step": 82242, "epoch": 1958} {"train_loss": -6.169377326965332, "global_step": 82243, "epoch": 1958} {"train_loss": -6.249708652496338, "global_step": 82244, "epoch": 1958} {"train_loss": -6.135066986083984, "global_step": 82245, "epoch": 1958} {"train_loss": -6.0800886154174805, "global_step": 82246, "epoch": 1958} {"train_loss": -6.214072227478027, "global_step": 82247, "epoch": 1958} {"train_loss": -6.256382942199707, "global_step": 82248, "epoch": 1958} {"train_loss": -6.176192283630371, "global_step": 82249, "epoch": 1958} {"train_loss": -6.153144836425781, "global_step": 82250, "epoch": 1958} {"train_loss": -6.149663925170898, "global_step": 82251, "epoch": 1958} {"train_loss": -6.016016006469727, "global_step": 82252, "epoch": 1958} {"train_loss": -6.180865287780762, "global_step": 82253, "epoch": 1958} {"train_loss": -6.153159141540527, "global_step": 82254, "epoch": 1958} {"train_loss": -6.279430389404297, "global_step": 82255, "epoch": 1958} {"train_loss": -6.043127059936523, "global_step": 82256, "epoch": 1958} {"train_loss": -6.0804123878479, "global_step": 82257, "epoch": 1958} {"train_loss": -6.1232099533081055, "global_step": 82258, "epoch": 1958} {"train_loss": -6.0860748291015625, "global_step": 82259, "epoch": 1958} {"train_loss": -6.268844127655029, "global_step": 82260, "epoch": 1958} {"train_loss": -6.189046859741211, "global_step": 82261, "epoch": 1958} {"train_loss": -6.211691856384277, "global_step": 82262, "epoch": 1958} {"train_loss": -6.099258899688721, "global_step": 82263, "epoch": 1958} {"train_loss": -6.123142719268799, "global_step": 82264, "epoch": 1958} {"train_loss": -6.105231761932373, "global_step": 82265, "epoch": 1958} {"train_loss": -6.030029296875, "global_step": 82266, "epoch": 1958} {"train_loss": -6.155346870422363, "global_step": 82267, "epoch": 1958} {"train_loss": -6.206881523132324, "global_step": 82268, "epoch": 1958} {"train_loss": -6.185328006744385, "global_step": 82269, "epoch": 1958} {"train_loss": -6.180715560913086, "global_step": 82270, "epoch": 1958} {"train_loss": -6.096811771392822, "global_step": 82271, "epoch": 1958} {"train_loss": -6.163474082946777, "global_step": 82272, "epoch": 1958} {"train_loss": -6.247668743133545, "global_step": 82273, "epoch": 1958} {"train_loss": -6.173371315002441, "global_step": 82274, "epoch": 1958} {"train_loss": -6.11279296875, "global_step": 82275, "epoch": 1958} {"train_loss": -6.0129289627075195, "global_step": 82276, "epoch": 1958} {"train_loss": -6.15669356073652, "global_step": 82277, "epoch": 1958, "val_loss": 67805.6015625} {"train_loss": -6.142575263977051, "global_step": 82278, "epoch": 1959} {"train_loss": -6.213382244110107, "global_step": 82279, "epoch": 1959} {"train_loss": -6.043181419372559, "global_step": 82280, "epoch": 1959} {"train_loss": -6.143392562866211, "global_step": 82281, "epoch": 1959} {"train_loss": -6.070472717285156, "global_step": 82282, "epoch": 1959} {"train_loss": -6.254497528076172, "global_step": 82283, "epoch": 1959} {"train_loss": -6.211906433105469, "global_step": 82284, "epoch": 1959} {"train_loss": -6.130070209503174, "global_step": 82285, "epoch": 1959} {"train_loss": -5.951376438140869, "global_step": 82286, "epoch": 1959} {"train_loss": -6.073265075683594, "global_step": 82287, "epoch": 1959} {"train_loss": -6.207389831542969, "global_step": 82288, "epoch": 1959} {"train_loss": -6.203373908996582, "global_step": 82289, "epoch": 1959} {"train_loss": -6.09696102142334, "global_step": 82290, "epoch": 1959} {"train_loss": -6.1427202224731445, "global_step": 82291, "epoch": 1959} {"train_loss": -6.030239582061768, "global_step": 82292, "epoch": 1959} {"train_loss": -6.105381965637207, "global_step": 82293, "epoch": 1959} {"train_loss": -6.10738468170166, "global_step": 82294, "epoch": 1959} {"train_loss": -6.163361549377441, "global_step": 82295, "epoch": 1959} {"train_loss": -6.159014701843262, "global_step": 82296, "epoch": 1959} {"train_loss": -6.1880388259887695, "global_step": 82297, "epoch": 1959} {"train_loss": -6.203360557556152, "global_step": 82298, "epoch": 1959} {"train_loss": -6.15706729888916, "global_step": 82299, "epoch": 1959} {"train_loss": -6.252394676208496, "global_step": 82300, "epoch": 1959} {"train_loss": -6.13007116317749, "global_step": 82301, "epoch": 1959} {"train_loss": -6.201412200927734, "global_step": 82302, "epoch": 1959} {"train_loss": -6.233552932739258, "global_step": 82303, "epoch": 1959} {"train_loss": -6.134026527404785, "global_step": 82304, "epoch": 1959} {"train_loss": -6.192255020141602, "global_step": 82305, "epoch": 1959} {"train_loss": -6.1924920082092285, "global_step": 82306, "epoch": 1959} {"train_loss": -6.234600067138672, "global_step": 82307, "epoch": 1959} {"train_loss": -6.166121482849121, "global_step": 82308, "epoch": 1959} {"train_loss": -6.146223068237305, "global_step": 82309, "epoch": 1959} {"train_loss": -6.227886199951172, "global_step": 82310, "epoch": 1959} {"train_loss": -6.102753162384033, "global_step": 82311, "epoch": 1959} {"train_loss": -6.136873245239258, "global_step": 82312, "epoch": 1959} {"train_loss": -6.242254257202148, "global_step": 82313, "epoch": 1959} {"train_loss": -5.917988300323486, "global_step": 82314, "epoch": 1959} {"train_loss": -6.074286460876465, "global_step": 82315, "epoch": 1959} {"train_loss": -6.111032485961914, "global_step": 82316, "epoch": 1959} {"train_loss": -6.049666881561279, "global_step": 82317, "epoch": 1959} {"train_loss": -6.12223482131958, "global_step": 82318, "epoch": 1959} {"train_loss": -6.145377863021124, "global_step": 82319, "epoch": 1959, "val_loss": 67917.7890625} {"train_loss": -6.07352352142334, "global_step": 82320, "epoch": 1960} {"train_loss": -6.198936462402344, "global_step": 82321, "epoch": 1960} {"train_loss": -6.116606712341309, "global_step": 82322, "epoch": 1960} {"train_loss": -6.1406450271606445, "global_step": 82323, "epoch": 1960} {"train_loss": -6.231888294219971, "global_step": 82324, "epoch": 1960} {"train_loss": -6.0840678215026855, "global_step": 82325, "epoch": 1960} {"train_loss": -6.28812313079834, "global_step": 82326, "epoch": 1960} {"train_loss": -6.137270927429199, "global_step": 82327, "epoch": 1960} {"train_loss": -6.132966995239258, "global_step": 82328, "epoch": 1960} {"train_loss": -6.1516547203063965, "global_step": 82329, "epoch": 1960} {"train_loss": -6.155538082122803, "global_step": 82330, "epoch": 1960} {"train_loss": -6.107578277587891, "global_step": 82331, "epoch": 1960} {"train_loss": -6.047403335571289, "global_step": 82332, "epoch": 1960} {"train_loss": -6.0321784019470215, "global_step": 82333, "epoch": 1960} {"train_loss": -6.287474632263184, "global_step": 82334, "epoch": 1960} {"train_loss": -6.118554592132568, "global_step": 82335, "epoch": 1960} {"train_loss": -6.168364524841309, "global_step": 82336, "epoch": 1960} {"train_loss": -6.110674858093262, "global_step": 82337, "epoch": 1960} {"train_loss": -6.118443489074707, "global_step": 82338, "epoch": 1960} {"train_loss": -6.180200576782227, "global_step": 82339, "epoch": 1960} {"train_loss": -6.126877784729004, "global_step": 82340, "epoch": 1960} {"train_loss": -6.0243988037109375, "global_step": 82341, "epoch": 1960} {"train_loss": -6.112057685852051, "global_step": 82342, "epoch": 1960} {"train_loss": -6.024975776672363, "global_step": 82343, "epoch": 1960} {"train_loss": -6.140408515930176, "global_step": 82344, "epoch": 1960} {"train_loss": -5.995100498199463, "global_step": 82345, "epoch": 1960} {"train_loss": -6.056380271911621, "global_step": 82346, "epoch": 1960} {"train_loss": -6.246917724609375, "global_step": 82347, "epoch": 1960} {"train_loss": -6.075811862945557, "global_step": 82348, "epoch": 1960} {"train_loss": -6.104938507080078, "global_step": 82349, "epoch": 1960} {"train_loss": -6.089441299438477, "global_step": 82350, "epoch": 1960} {"train_loss": -6.133994102478027, "global_step": 82351, "epoch": 1960} {"train_loss": -6.075586318969727, "global_step": 82352, "epoch": 1960} {"train_loss": -6.180332660675049, "global_step": 82353, "epoch": 1960} {"train_loss": -6.0847883224487305, "global_step": 82354, "epoch": 1960} {"train_loss": -6.099098205566406, "global_step": 82355, "epoch": 1960} {"train_loss": -6.091387748718262, "global_step": 82356, "epoch": 1960} {"train_loss": -6.046197891235352, "global_step": 82357, "epoch": 1960} {"train_loss": -6.166272163391113, "global_step": 82358, "epoch": 1960} {"train_loss": -6.117885112762451, "global_step": 82359, "epoch": 1960} {"train_loss": -6.2021942138671875, "global_step": 82360, "epoch": 1960} {"train_loss": -6.126222474234445, "global_step": 82361, "epoch": 1960, "val_loss": 67734.78125} {"train_loss": -6.137414932250977, "global_step": 82362, "epoch": 1961} {"train_loss": -6.159987449645996, "global_step": 82363, "epoch": 1961} {"train_loss": -6.091841697692871, "global_step": 82364, "epoch": 1961} {"train_loss": -6.2089691162109375, "global_step": 82365, "epoch": 1961} {"train_loss": -6.1466450691223145, "global_step": 82366, "epoch": 1961} {"train_loss": -6.227972984313965, "global_step": 82367, "epoch": 1961} {"train_loss": -6.067375659942627, "global_step": 82368, "epoch": 1961} {"train_loss": -6.214859485626221, "global_step": 82369, "epoch": 1961} {"train_loss": -6.169641494750977, "global_step": 82370, "epoch": 1961} {"train_loss": -6.055715560913086, "global_step": 82371, "epoch": 1961} {"train_loss": -6.2523322105407715, "global_step": 82372, "epoch": 1961} {"train_loss": -6.207403659820557, "global_step": 82373, "epoch": 1961} {"train_loss": -6.200911998748779, "global_step": 82374, "epoch": 1961} {"train_loss": -6.30078125, "global_step": 82375, "epoch": 1961} {"train_loss": -6.145597457885742, "global_step": 82376, "epoch": 1961} {"train_loss": -6.2626752853393555, "global_step": 82377, "epoch": 1961} {"train_loss": -6.090425491333008, "global_step": 82378, "epoch": 1961} {"train_loss": -6.062362194061279, "global_step": 82379, "epoch": 1961} {"train_loss": -6.169917106628418, "global_step": 82380, "epoch": 1961} {"train_loss": -6.095932483673096, "global_step": 82381, "epoch": 1961} {"train_loss": -6.20863151550293, "global_step": 82382, "epoch": 1961} {"train_loss": -6.099644660949707, "global_step": 82383, "epoch": 1961} {"train_loss": -6.225785255432129, "global_step": 82384, "epoch": 1961} {"train_loss": -6.226040840148926, "global_step": 82385, "epoch": 1961} {"train_loss": -6.1275763511657715, "global_step": 82386, "epoch": 1961} {"train_loss": -6.25722599029541, "global_step": 82387, "epoch": 1961} {"train_loss": -6.185052871704102, "global_step": 82388, "epoch": 1961} {"train_loss": -6.23319673538208, "global_step": 82389, "epoch": 1961} {"train_loss": -6.1894989013671875, "global_step": 82390, "epoch": 1961} {"train_loss": -6.189239025115967, "global_step": 82391, "epoch": 1961} {"train_loss": -6.172362327575684, "global_step": 82392, "epoch": 1961} {"train_loss": -6.168500900268555, "global_step": 82393, "epoch": 1961} {"train_loss": -6.207418441772461, "global_step": 82394, "epoch": 1961} {"train_loss": -6.119134902954102, "global_step": 82395, "epoch": 1961} {"train_loss": -6.225960731506348, "global_step": 82396, "epoch": 1961} {"train_loss": -6.182376384735107, "global_step": 82397, "epoch": 1961} {"train_loss": -6.148922920227051, "global_step": 82398, "epoch": 1961} {"train_loss": -6.035715103149414, "global_step": 82399, "epoch": 1961} {"train_loss": -6.232880592346191, "global_step": 82400, "epoch": 1961} {"train_loss": -6.1775970458984375, "global_step": 82401, "epoch": 1961} {"train_loss": -6.188438892364502, "global_step": 82402, "epoch": 1961} {"train_loss": -6.172803424653553, "global_step": 82403, "epoch": 1961, "val_loss": 67845.5546875} {"train_loss": -6.263845443725586, "global_step": 82404, "epoch": 1962} {"train_loss": -6.157947540283203, "global_step": 82405, "epoch": 1962} {"train_loss": -6.189443111419678, "global_step": 82406, "epoch": 1962} {"train_loss": -6.261806011199951, "global_step": 82407, "epoch": 1962} {"train_loss": -6.150107383728027, "global_step": 82408, "epoch": 1962} {"train_loss": -6.068718910217285, "global_step": 82409, "epoch": 1962} {"train_loss": -6.146490097045898, "global_step": 82410, "epoch": 1962} {"train_loss": -5.993785858154297, "global_step": 82411, "epoch": 1962} {"train_loss": -6.18702507019043, "global_step": 82412, "epoch": 1962} {"train_loss": -6.094237804412842, "global_step": 82413, "epoch": 1962} {"train_loss": -6.0557966232299805, "global_step": 82414, "epoch": 1962} {"train_loss": -6.096661567687988, "global_step": 82415, "epoch": 1962} {"train_loss": -6.0977373123168945, "global_step": 82416, "epoch": 1962} {"train_loss": -6.1458611488342285, "global_step": 82417, "epoch": 1962} {"train_loss": -6.101797103881836, "global_step": 82418, "epoch": 1962} {"train_loss": -6.05496883392334, "global_step": 82419, "epoch": 1962} {"train_loss": -6.092905521392822, "global_step": 82420, "epoch": 1962} {"train_loss": -6.157227039337158, "global_step": 82421, "epoch": 1962} {"train_loss": -6.050868034362793, "global_step": 82422, "epoch": 1962} {"train_loss": -6.110252380371094, "global_step": 82423, "epoch": 1962} {"train_loss": -6.075538158416748, "global_step": 82424, "epoch": 1962} {"train_loss": -6.042548179626465, "global_step": 82425, "epoch": 1962} {"train_loss": -6.137752532958984, "global_step": 82426, "epoch": 1962} {"train_loss": -6.152277946472168, "global_step": 82427, "epoch": 1962} {"train_loss": -6.165110111236572, "global_step": 82428, "epoch": 1962} {"train_loss": -6.107404708862305, "global_step": 82429, "epoch": 1962} {"train_loss": -6.099090099334717, "global_step": 82430, "epoch": 1962} {"train_loss": -6.19614315032959, "global_step": 82431, "epoch": 1962} {"train_loss": -6.078459739685059, "global_step": 82432, "epoch": 1962} {"train_loss": -6.220176696777344, "global_step": 82433, "epoch": 1962} {"train_loss": -6.120247840881348, "global_step": 82434, "epoch": 1962} {"train_loss": -6.126805305480957, "global_step": 82435, "epoch": 1962} {"train_loss": -6.143731117248535, "global_step": 82436, "epoch": 1962} {"train_loss": -6.151900768280029, "global_step": 82437, "epoch": 1962} {"train_loss": -6.231532573699951, "global_step": 82438, "epoch": 1962} {"train_loss": -6.169535160064697, "global_step": 82439, "epoch": 1962} {"train_loss": -6.192339897155762, "global_step": 82440, "epoch": 1962} {"train_loss": -6.160890102386475, "global_step": 82441, "epoch": 1962} {"train_loss": -6.02260684967041, "global_step": 82442, "epoch": 1962} {"train_loss": -6.192373275756836, "global_step": 82443, "epoch": 1962} {"train_loss": -6.182664394378662, "global_step": 82444, "epoch": 1962} {"train_loss": -6.1335344314575195, "global_step": 82445, "epoch": 1962, "val_loss": 67658.1640625} {"train_loss": -6.165249824523926, "global_step": 82446, "epoch": 1963} {"train_loss": -6.052163124084473, "global_step": 82447, "epoch": 1963} {"train_loss": -6.188055038452148, "global_step": 82448, "epoch": 1963} {"train_loss": -6.22303581237793, "global_step": 82449, "epoch": 1963} {"train_loss": -6.112013816833496, "global_step": 82450, "epoch": 1963} {"train_loss": -6.182918548583984, "global_step": 82451, "epoch": 1963} {"train_loss": -6.123928070068359, "global_step": 82452, "epoch": 1963} {"train_loss": -6.162479400634766, "global_step": 82453, "epoch": 1963} {"train_loss": -6.12199592590332, "global_step": 82454, "epoch": 1963} {"train_loss": -6.207118988037109, "global_step": 82455, "epoch": 1963} {"train_loss": -6.182082176208496, "global_step": 82456, "epoch": 1963} {"train_loss": -6.105713844299316, "global_step": 82457, "epoch": 1963} {"train_loss": -6.133843421936035, "global_step": 82458, "epoch": 1963} {"train_loss": -6.173689842224121, "global_step": 82459, "epoch": 1963} {"train_loss": -6.1960954666137695, "global_step": 82460, "epoch": 1963} {"train_loss": -6.277031898498535, "global_step": 82461, "epoch": 1963} {"train_loss": -6.125277042388916, "global_step": 82462, "epoch": 1963} {"train_loss": -6.239740371704102, "global_step": 82463, "epoch": 1963} {"train_loss": -6.127367973327637, "global_step": 82464, "epoch": 1963} {"train_loss": -6.122894287109375, "global_step": 82465, "epoch": 1963} {"train_loss": -6.053359031677246, "global_step": 82466, "epoch": 1963} {"train_loss": -6.152127742767334, "global_step": 82467, "epoch": 1963} {"train_loss": -6.168950080871582, "global_step": 82468, "epoch": 1963} {"train_loss": -6.132874965667725, "global_step": 82469, "epoch": 1963} {"train_loss": -6.059165000915527, "global_step": 82470, "epoch": 1963} {"train_loss": -6.166036128997803, "global_step": 82471, "epoch": 1963} {"train_loss": -6.188632011413574, "global_step": 82472, "epoch": 1963} {"train_loss": -6.02122163772583, "global_step": 82473, "epoch": 1963} {"train_loss": -6.268266677856445, "global_step": 82474, "epoch": 1963} {"train_loss": -6.159942150115967, "global_step": 82475, "epoch": 1963} {"train_loss": -6.116652011871338, "global_step": 82476, "epoch": 1963} {"train_loss": -6.115355968475342, "global_step": 82477, "epoch": 1963} {"train_loss": -6.210499286651611, "global_step": 82478, "epoch": 1963} {"train_loss": -6.251431941986084, "global_step": 82479, "epoch": 1963} {"train_loss": -6.190055847167969, "global_step": 82480, "epoch": 1963} {"train_loss": -6.124141216278076, "global_step": 82481, "epoch": 1963} {"train_loss": -6.246677875518799, "global_step": 82482, "epoch": 1963} {"train_loss": -6.1674909591674805, "global_step": 82483, "epoch": 1963} {"train_loss": -6.066669940948486, "global_step": 82484, "epoch": 1963} {"train_loss": -6.220278263092041, "global_step": 82485, "epoch": 1963} {"train_loss": -6.156045436859131, "global_step": 82486, "epoch": 1963} {"train_loss": -6.156250794728597, "global_step": 82487, "epoch": 1963, "val_loss": 67816.328125} {"train_loss": -6.043542385101318, "global_step": 82488, "epoch": 1964} {"train_loss": -6.251821994781494, "global_step": 82489, "epoch": 1964} {"train_loss": -6.1288557052612305, "global_step": 82490, "epoch": 1964} {"train_loss": -6.1785383224487305, "global_step": 82491, "epoch": 1964} {"train_loss": -6.241057395935059, "global_step": 82492, "epoch": 1964} {"train_loss": -6.1401262283325195, "global_step": 82493, "epoch": 1964} {"train_loss": -6.1009416580200195, "global_step": 82494, "epoch": 1964} {"train_loss": -6.142199516296387, "global_step": 82495, "epoch": 1964} {"train_loss": -5.980185508728027, "global_step": 82496, "epoch": 1964} {"train_loss": -6.096511363983154, "global_step": 82497, "epoch": 1964} {"train_loss": -6.093377113342285, "global_step": 82498, "epoch": 1964} {"train_loss": -6.11029052734375, "global_step": 82499, "epoch": 1964} {"train_loss": -6.289163589477539, "global_step": 82500, "epoch": 1964} {"train_loss": -6.132607460021973, "global_step": 82501, "epoch": 1964} {"train_loss": -6.2228899002075195, "global_step": 82502, "epoch": 1964} {"train_loss": -6.226430892944336, "global_step": 82503, "epoch": 1964} {"train_loss": -6.08467960357666, "global_step": 82504, "epoch": 1964} {"train_loss": -6.180145740509033, "global_step": 82505, "epoch": 1964} {"train_loss": -6.099352836608887, "global_step": 82506, "epoch": 1964} {"train_loss": -6.180514812469482, "global_step": 82507, "epoch": 1964} {"train_loss": -6.179125785827637, "global_step": 82508, "epoch": 1964} {"train_loss": -6.130774021148682, "global_step": 82509, "epoch": 1964} {"train_loss": -6.103428840637207, "global_step": 82510, "epoch": 1964} {"train_loss": -6.093206405639648, "global_step": 82511, "epoch": 1964} {"train_loss": -6.209444046020508, "global_step": 82512, "epoch": 1964} {"train_loss": -6.234338760375977, "global_step": 82513, "epoch": 1964} {"train_loss": -6.226408958435059, "global_step": 82514, "epoch": 1964} {"train_loss": -6.191331386566162, "global_step": 82515, "epoch": 1964} {"train_loss": -6.125974178314209, "global_step": 82516, "epoch": 1964} {"train_loss": -6.174220085144043, "global_step": 82517, "epoch": 1964} {"train_loss": -6.1955718994140625, "global_step": 82518, "epoch": 1964} {"train_loss": -6.216107368469238, "global_step": 82519, "epoch": 1964} {"train_loss": -6.234858512878418, "global_step": 82520, "epoch": 1964} {"train_loss": -6.249838829040527, "global_step": 82521, "epoch": 1964} {"train_loss": -6.241832256317139, "global_step": 82522, "epoch": 1964} {"train_loss": -6.153257369995117, "global_step": 82523, "epoch": 1964} {"train_loss": -6.139823913574219, "global_step": 82524, "epoch": 1964} {"train_loss": -6.100008964538574, "global_step": 82525, "epoch": 1964} {"train_loss": -6.085212707519531, "global_step": 82526, "epoch": 1964} {"train_loss": -6.085468292236328, "global_step": 82527, "epoch": 1964} {"train_loss": -6.061540126800537, "global_step": 82528, "epoch": 1964} {"train_loss": -6.15498077301752, "global_step": 82529, "epoch": 1964, "val_loss": 67779.359375} {"train_loss": -6.095280647277832, "global_step": 82530, "epoch": 1965} {"train_loss": -6.073615074157715, "global_step": 82531, "epoch": 1965} {"train_loss": -6.154318809509277, "global_step": 82532, "epoch": 1965} {"train_loss": -6.066166877746582, "global_step": 82533, "epoch": 1965} {"train_loss": -6.079957008361816, "global_step": 82534, "epoch": 1965} {"train_loss": -6.226239204406738, "global_step": 82535, "epoch": 1965} {"train_loss": -6.0241780281066895, "global_step": 82536, "epoch": 1965} {"train_loss": -6.183423042297363, "global_step": 82537, "epoch": 1965} {"train_loss": -6.247799873352051, "global_step": 82538, "epoch": 1965} {"train_loss": -6.072780609130859, "global_step": 82539, "epoch": 1965} {"train_loss": -6.2298736572265625, "global_step": 82540, "epoch": 1965} {"train_loss": -6.137948036193848, "global_step": 82541, "epoch": 1965} {"train_loss": -6.131214141845703, "global_step": 82542, "epoch": 1965} {"train_loss": -6.147656440734863, "global_step": 82543, "epoch": 1965} {"train_loss": -6.198325157165527, "global_step": 82544, "epoch": 1965} {"train_loss": -6.058274269104004, "global_step": 82545, "epoch": 1965} {"train_loss": -6.143645763397217, "global_step": 82546, "epoch": 1965} {"train_loss": -6.131664276123047, "global_step": 82547, "epoch": 1965} {"train_loss": -6.257029056549072, "global_step": 82548, "epoch": 1965} {"train_loss": -6.207216262817383, "global_step": 82549, "epoch": 1965} {"train_loss": -6.095067501068115, "global_step": 82550, "epoch": 1965} {"train_loss": -6.167304992675781, "global_step": 82551, "epoch": 1965} {"train_loss": -6.071595191955566, "global_step": 82552, "epoch": 1965} {"train_loss": -6.075153350830078, "global_step": 82553, "epoch": 1965} {"train_loss": -6.099414348602295, "global_step": 82554, "epoch": 1965} {"train_loss": -6.0357794761657715, "global_step": 82555, "epoch": 1965} {"train_loss": -6.139179706573486, "global_step": 82556, "epoch": 1965} {"train_loss": -6.130152225494385, "global_step": 82557, "epoch": 1965} {"train_loss": -6.107330322265625, "global_step": 82558, "epoch": 1965} {"train_loss": -6.143740653991699, "global_step": 82559, "epoch": 1965} {"train_loss": -6.161134719848633, "global_step": 82560, "epoch": 1965} {"train_loss": -6.006956577301025, "global_step": 82561, "epoch": 1965} {"train_loss": -6.080423355102539, "global_step": 82562, "epoch": 1965} {"train_loss": -6.093722343444824, "global_step": 82563, "epoch": 1965} {"train_loss": -6.109713554382324, "global_step": 82564, "epoch": 1965} {"train_loss": -6.160858631134033, "global_step": 82565, "epoch": 1965} {"train_loss": -6.099316120147705, "global_step": 82566, "epoch": 1965} {"train_loss": -6.137229919433594, "global_step": 82567, "epoch": 1965} {"train_loss": -6.114602088928223, "global_step": 82568, "epoch": 1965} {"train_loss": -6.19898796081543, "global_step": 82569, "epoch": 1965} {"train_loss": -6.196326732635498, "global_step": 82570, "epoch": 1965} {"train_loss": -6.130339213779995, "global_step": 82571, "epoch": 1965, "val_loss": 68005.0859375} {"train_loss": -6.1038103103637695, "global_step": 82572, "epoch": 1966} {"train_loss": -6.219738006591797, "global_step": 82573, "epoch": 1966} {"train_loss": -6.086145401000977, "global_step": 82574, "epoch": 1966} {"train_loss": -6.182176113128662, "global_step": 82575, "epoch": 1966} {"train_loss": -6.200887680053711, "global_step": 82576, "epoch": 1966} {"train_loss": -6.207685470581055, "global_step": 82577, "epoch": 1966} {"train_loss": -6.244494438171387, "global_step": 82578, "epoch": 1966} {"train_loss": -6.107744216918945, "global_step": 82579, "epoch": 1966} {"train_loss": -6.271106719970703, "global_step": 82580, "epoch": 1966} {"train_loss": -6.117491245269775, "global_step": 82581, "epoch": 1966} {"train_loss": -6.269323348999023, "global_step": 82582, "epoch": 1966} {"train_loss": -6.1263604164123535, "global_step": 82583, "epoch": 1966} {"train_loss": -6.154387950897217, "global_step": 82584, "epoch": 1966} {"train_loss": -6.060850143432617, "global_step": 82585, "epoch": 1966} {"train_loss": -6.190174102783203, "global_step": 82586, "epoch": 1966} {"train_loss": -6.233555793762207, "global_step": 82587, "epoch": 1966} {"train_loss": -6.182046890258789, "global_step": 82588, "epoch": 1966} {"train_loss": -6.229400634765625, "global_step": 82589, "epoch": 1966} {"train_loss": -6.187887668609619, "global_step": 82590, "epoch": 1966} {"train_loss": -6.160299777984619, "global_step": 82591, "epoch": 1966} {"train_loss": -6.279102802276611, "global_step": 82592, "epoch": 1966} {"train_loss": -6.0937957763671875, "global_step": 82593, "epoch": 1966} {"train_loss": -6.054135322570801, "global_step": 82594, "epoch": 1966} {"train_loss": -6.184854507446289, "global_step": 82595, "epoch": 1966} {"train_loss": -6.196688652038574, "global_step": 82596, "epoch": 1966} {"train_loss": -6.180954456329346, "global_step": 82597, "epoch": 1966} {"train_loss": -6.115470886230469, "global_step": 82598, "epoch": 1966} {"train_loss": -6.073746204376221, "global_step": 82599, "epoch": 1966} {"train_loss": -6.238232612609863, "global_step": 82600, "epoch": 1966} {"train_loss": -6.069005489349365, "global_step": 82601, "epoch": 1966} {"train_loss": -6.216519355773926, "global_step": 82602, "epoch": 1966} {"train_loss": -6.245292663574219, "global_step": 82603, "epoch": 1966} {"train_loss": -6.210742950439453, "global_step": 82604, "epoch": 1966} {"train_loss": -6.342106819152832, "global_step": 82605, "epoch": 1966} {"train_loss": -6.132896423339844, "global_step": 82606, "epoch": 1966} {"train_loss": -6.19603157043457, "global_step": 82607, "epoch": 1966} {"train_loss": -6.178895950317383, "global_step": 82608, "epoch": 1966} {"train_loss": -6.044926643371582, "global_step": 82609, "epoch": 1966} {"train_loss": -6.192079544067383, "global_step": 82610, "epoch": 1966} {"train_loss": -6.216133117675781, "global_step": 82611, "epoch": 1966} {"train_loss": -6.1939239501953125, "global_step": 82612, "epoch": 1966} {"train_loss": -6.176152342841739, "global_step": 82613, "epoch": 1966, "val_loss": 67616.3046875} {"train_loss": -6.105566024780273, "global_step": 82614, "epoch": 1967} {"train_loss": -6.266473770141602, "global_step": 82615, "epoch": 1967} {"train_loss": -6.224625110626221, "global_step": 82616, "epoch": 1967} {"train_loss": -6.227774143218994, "global_step": 82617, "epoch": 1967} {"train_loss": -6.158161640167236, "global_step": 82618, "epoch": 1967} {"train_loss": -6.115718841552734, "global_step": 82619, "epoch": 1967} {"train_loss": -6.148882865905762, "global_step": 82620, "epoch": 1967} {"train_loss": -6.176822662353516, "global_step": 82621, "epoch": 1967} {"train_loss": -6.302464485168457, "global_step": 82622, "epoch": 1967} {"train_loss": -6.232448101043701, "global_step": 82623, "epoch": 1967} {"train_loss": -6.145771503448486, "global_step": 82624, "epoch": 1967} {"train_loss": -6.073293209075928, "global_step": 82625, "epoch": 1967} {"train_loss": -6.249906539916992, "global_step": 82626, "epoch": 1967} {"train_loss": -6.043082237243652, "global_step": 82627, "epoch": 1967} {"train_loss": -6.08854866027832, "global_step": 82628, "epoch": 1967} {"train_loss": -6.174127101898193, "global_step": 82629, "epoch": 1967} {"train_loss": -6.262359619140625, "global_step": 82630, "epoch": 1967} {"train_loss": -6.235651969909668, "global_step": 82631, "epoch": 1967} {"train_loss": -6.114748954772949, "global_step": 82632, "epoch": 1967} {"train_loss": -6.09890079498291, "global_step": 82633, "epoch": 1967} {"train_loss": -6.182003021240234, "global_step": 82634, "epoch": 1967} {"train_loss": -6.161293029785156, "global_step": 82635, "epoch": 1967} {"train_loss": -6.158562183380127, "global_step": 82636, "epoch": 1967} {"train_loss": -6.184782028198242, "global_step": 82637, "epoch": 1967} {"train_loss": -6.151310920715332, "global_step": 82638, "epoch": 1967} {"train_loss": -6.182395935058594, "global_step": 82639, "epoch": 1967} {"train_loss": -6.103198051452637, "global_step": 82640, "epoch": 1967} {"train_loss": -6.188667297363281, "global_step": 82641, "epoch": 1967} {"train_loss": -6.1973876953125, "global_step": 82642, "epoch": 1967} {"train_loss": -6.131008148193359, "global_step": 82643, "epoch": 1967} {"train_loss": -6.2268452644348145, "global_step": 82644, "epoch": 1967} {"train_loss": -6.145232200622559, "global_step": 82645, "epoch": 1967} {"train_loss": -6.263023853302002, "global_step": 82646, "epoch": 1967} {"train_loss": -6.220170497894287, "global_step": 82647, "epoch": 1967} {"train_loss": -6.191732406616211, "global_step": 82648, "epoch": 1967} {"train_loss": -6.100080490112305, "global_step": 82649, "epoch": 1967} {"train_loss": -6.124666213989258, "global_step": 82650, "epoch": 1967} {"train_loss": -6.037877082824707, "global_step": 82651, "epoch": 1967} {"train_loss": -6.092277526855469, "global_step": 82652, "epoch": 1967} {"train_loss": -6.1579203605651855, "global_step": 82653, "epoch": 1967} {"train_loss": -6.317593574523926, "global_step": 82654, "epoch": 1967} {"train_loss": -6.166476828711374, "global_step": 82655, "epoch": 1967, "val_loss": 67785.3046875} {"train_loss": -6.09531831741333, "global_step": 82656, "epoch": 1968} {"train_loss": -6.13262414932251, "global_step": 82657, "epoch": 1968} {"train_loss": -5.986339569091797, "global_step": 82658, "epoch": 1968} {"train_loss": -6.104270935058594, "global_step": 82659, "epoch": 1968} {"train_loss": -6.264487266540527, "global_step": 82660, "epoch": 1968} {"train_loss": -6.182811260223389, "global_step": 82661, "epoch": 1968} {"train_loss": -6.105475902557373, "global_step": 82662, "epoch": 1968} {"train_loss": -6.199707508087158, "global_step": 82663, "epoch": 1968} {"train_loss": -6.132604122161865, "global_step": 82664, "epoch": 1968} {"train_loss": -6.098423480987549, "global_step": 82665, "epoch": 1968} {"train_loss": -6.189255714416504, "global_step": 82666, "epoch": 1968} {"train_loss": -6.056124687194824, "global_step": 82667, "epoch": 1968} {"train_loss": -6.100639343261719, "global_step": 82668, "epoch": 1968} {"train_loss": -6.15259313583374, "global_step": 82669, "epoch": 1968} {"train_loss": -6.116003036499023, "global_step": 82670, "epoch": 1968} {"train_loss": -6.134915351867676, "global_step": 82671, "epoch": 1968} {"train_loss": -6.203172206878662, "global_step": 82672, "epoch": 1968} {"train_loss": -6.107350826263428, "global_step": 82673, "epoch": 1968} {"train_loss": -6.147528171539307, "global_step": 82674, "epoch": 1968} {"train_loss": -6.204360008239746, "global_step": 82675, "epoch": 1968} {"train_loss": -6.117800712585449, "global_step": 82676, "epoch": 1968} {"train_loss": -6.169208526611328, "global_step": 82677, "epoch": 1968} {"train_loss": -6.067930221557617, "global_step": 82678, "epoch": 1968} {"train_loss": -6.061030387878418, "global_step": 82679, "epoch": 1968} {"train_loss": -6.156407356262207, "global_step": 82680, "epoch": 1968} {"train_loss": -6.041736125946045, "global_step": 82681, "epoch": 1968} {"train_loss": -6.02701473236084, "global_step": 82682, "epoch": 1968} {"train_loss": -6.1981964111328125, "global_step": 82683, "epoch": 1968} {"train_loss": -6.144153594970703, "global_step": 82684, "epoch": 1968} {"train_loss": -6.113391876220703, "global_step": 82685, "epoch": 1968} {"train_loss": -6.221671104431152, "global_step": 82686, "epoch": 1968} {"train_loss": -6.140027046203613, "global_step": 82687, "epoch": 1968} {"train_loss": -6.117963790893555, "global_step": 82688, "epoch": 1968} {"train_loss": -6.122880458831787, "global_step": 82689, "epoch": 1968} {"train_loss": -6.189037322998047, "global_step": 82690, "epoch": 1968} {"train_loss": -6.133021354675293, "global_step": 82691, "epoch": 1968} {"train_loss": -6.0710954666137695, "global_step": 82692, "epoch": 1968} {"train_loss": -6.234799385070801, "global_step": 82693, "epoch": 1968} {"train_loss": -6.121578216552734, "global_step": 82694, "epoch": 1968} {"train_loss": -6.209129333496094, "global_step": 82695, "epoch": 1968} {"train_loss": -6.151724338531494, "global_step": 82696, "epoch": 1968} {"train_loss": -6.135124002184186, "global_step": 82697, "epoch": 1968, "val_loss": 67790.671875} {"train_loss": -6.192924976348877, "global_step": 82698, "epoch": 1969} {"train_loss": -6.180181503295898, "global_step": 82699, "epoch": 1969} {"train_loss": -6.133175849914551, "global_step": 82700, "epoch": 1969} {"train_loss": -6.061861991882324, "global_step": 82701, "epoch": 1969} {"train_loss": -6.268692493438721, "global_step": 82702, "epoch": 1969} {"train_loss": -6.257138252258301, "global_step": 82703, "epoch": 1969} {"train_loss": -5.994123458862305, "global_step": 82704, "epoch": 1969} {"train_loss": -6.258705139160156, "global_step": 82705, "epoch": 1969} {"train_loss": -6.142945289611816, "global_step": 82706, "epoch": 1969} {"train_loss": -6.134914398193359, "global_step": 82707, "epoch": 1969} {"train_loss": -6.01013708114624, "global_step": 82708, "epoch": 1969} {"train_loss": -6.247042655944824, "global_step": 82709, "epoch": 1969} {"train_loss": -6.123659610748291, "global_step": 82710, "epoch": 1969} {"train_loss": -6.087018966674805, "global_step": 82711, "epoch": 1969} {"train_loss": -6.155117034912109, "global_step": 82712, "epoch": 1969} {"train_loss": -6.035470485687256, "global_step": 82713, "epoch": 1969} {"train_loss": -6.0887579917907715, "global_step": 82714, "epoch": 1969} {"train_loss": -6.1306915283203125, "global_step": 82715, "epoch": 1969} {"train_loss": -6.1465864181518555, "global_step": 82716, "epoch": 1969} {"train_loss": -6.093303680419922, "global_step": 82717, "epoch": 1969} {"train_loss": -6.108405113220215, "global_step": 82718, "epoch": 1969} {"train_loss": -6.159186363220215, "global_step": 82719, "epoch": 1969} {"train_loss": -6.1784443855285645, "global_step": 82720, "epoch": 1969} {"train_loss": -6.208965301513672, "global_step": 82721, "epoch": 1969} {"train_loss": -6.126508712768555, "global_step": 82722, "epoch": 1969} {"train_loss": -6.252162456512451, "global_step": 82723, "epoch": 1969} {"train_loss": -6.195841312408447, "global_step": 82724, "epoch": 1969} {"train_loss": -6.191859245300293, "global_step": 82725, "epoch": 1969} {"train_loss": -6.156633377075195, "global_step": 82726, "epoch": 1969} {"train_loss": -6.133840084075928, "global_step": 82727, "epoch": 1969} {"train_loss": -6.12540864944458, "global_step": 82728, "epoch": 1969} {"train_loss": -6.274936199188232, "global_step": 82729, "epoch": 1969} {"train_loss": -6.141629219055176, "global_step": 82730, "epoch": 1969} {"train_loss": -6.194607257843018, "global_step": 82731, "epoch": 1969} {"train_loss": -5.986920356750488, "global_step": 82732, "epoch": 1969} {"train_loss": -6.1666259765625, "global_step": 82733, "epoch": 1969} {"train_loss": -6.212212085723877, "global_step": 82734, "epoch": 1969} {"train_loss": -6.05239725112915, "global_step": 82735, "epoch": 1969} {"train_loss": -6.097470760345459, "global_step": 82736, "epoch": 1969} {"train_loss": -6.1338725090026855, "global_step": 82737, "epoch": 1969} {"train_loss": -6.006267547607422, "global_step": 82738, "epoch": 1969} {"train_loss": -6.144257920128958, "global_step": 82739, "epoch": 1969, "val_loss": 67871.46875} {"train_loss": -6.125905513763428, "global_step": 82740, "epoch": 1970} {"train_loss": -6.070101261138916, "global_step": 82741, "epoch": 1970} {"train_loss": -6.094692230224609, "global_step": 82742, "epoch": 1970} {"train_loss": -6.118265151977539, "global_step": 82743, "epoch": 1970} {"train_loss": -6.114151477813721, "global_step": 82744, "epoch": 1970} {"train_loss": -6.02666711807251, "global_step": 82745, "epoch": 1970} {"train_loss": -6.118801116943359, "global_step": 82746, "epoch": 1970} {"train_loss": -5.989882469177246, "global_step": 82747, "epoch": 1970} {"train_loss": -6.251491069793701, "global_step": 82748, "epoch": 1970} {"train_loss": -6.20436954498291, "global_step": 82749, "epoch": 1970} {"train_loss": -6.168525695800781, "global_step": 82750, "epoch": 1970} {"train_loss": -6.055543899536133, "global_step": 82751, "epoch": 1970} {"train_loss": -5.964251518249512, "global_step": 82752, "epoch": 1970} {"train_loss": -6.078121185302734, "global_step": 82753, "epoch": 1970} {"train_loss": -6.158135414123535, "global_step": 82754, "epoch": 1970} {"train_loss": -6.107386589050293, "global_step": 82755, "epoch": 1970} {"train_loss": -6.0840044021606445, "global_step": 82756, "epoch": 1970} {"train_loss": -6.197490692138672, "global_step": 82757, "epoch": 1970} {"train_loss": -6.058575630187988, "global_step": 82758, "epoch": 1970} {"train_loss": -6.0831451416015625, "global_step": 82759, "epoch": 1970} {"train_loss": -5.987379550933838, "global_step": 82760, "epoch": 1970} {"train_loss": -6.072167873382568, "global_step": 82761, "epoch": 1970} {"train_loss": -6.046850681304932, "global_step": 82762, "epoch": 1970} {"train_loss": -6.22810173034668, "global_step": 82763, "epoch": 1970} {"train_loss": -6.099613666534424, "global_step": 82764, "epoch": 1970} {"train_loss": -6.116953372955322, "global_step": 82765, "epoch": 1970} {"train_loss": -6.135324954986572, "global_step": 82766, "epoch": 1970} {"train_loss": -6.0321502685546875, "global_step": 82767, "epoch": 1970} {"train_loss": -6.224072456359863, "global_step": 82768, "epoch": 1970} {"train_loss": -6.088307857513428, "global_step": 82769, "epoch": 1970} {"train_loss": -6.174526214599609, "global_step": 82770, "epoch": 1970} {"train_loss": -6.09099817276001, "global_step": 82771, "epoch": 1970} {"train_loss": -6.031749248504639, "global_step": 82772, "epoch": 1970} {"train_loss": -6.071796894073486, "global_step": 82773, "epoch": 1970} {"train_loss": -6.057895660400391, "global_step": 82774, "epoch": 1970} {"train_loss": -6.07305908203125, "global_step": 82775, "epoch": 1970} {"train_loss": -6.1719794273376465, "global_step": 82776, "epoch": 1970} {"train_loss": -6.102545738220215, "global_step": 82777, "epoch": 1970} {"train_loss": -6.047194480895996, "global_step": 82778, "epoch": 1970} {"train_loss": -5.961297512054443, "global_step": 82779, "epoch": 1970} {"train_loss": -6.130047798156738, "global_step": 82780, "epoch": 1970} {"train_loss": -6.0979750497000555, "global_step": 82781, "epoch": 1970, "val_loss": 67860.078125} {"train_loss": -5.964034557342529, "global_step": 82782, "epoch": 1971} {"train_loss": -6.127234935760498, "global_step": 82783, "epoch": 1971} {"train_loss": -5.962069511413574, "global_step": 82784, "epoch": 1971} {"train_loss": -6.1622633934021, "global_step": 82785, "epoch": 1971} {"train_loss": -5.950106620788574, "global_step": 82786, "epoch": 1971} {"train_loss": -6.108400344848633, "global_step": 82787, "epoch": 1971} {"train_loss": -6.043392181396484, "global_step": 82788, "epoch": 1971} {"train_loss": -6.062705039978027, "global_step": 82789, "epoch": 1971} {"train_loss": -6.100741386413574, "global_step": 82790, "epoch": 1971} {"train_loss": -6.143469333648682, "global_step": 82791, "epoch": 1971} {"train_loss": -6.017539978027344, "global_step": 82792, "epoch": 1971} {"train_loss": -6.144112586975098, "global_step": 82793, "epoch": 1971} {"train_loss": -6.192973613739014, "global_step": 82794, "epoch": 1971} {"train_loss": -6.134987831115723, "global_step": 82795, "epoch": 1971} {"train_loss": -6.230940341949463, "global_step": 82796, "epoch": 1971} {"train_loss": -6.201145172119141, "global_step": 82797, "epoch": 1971} {"train_loss": -6.197671890258789, "global_step": 82798, "epoch": 1971} {"train_loss": -6.091161727905273, "global_step": 82799, "epoch": 1971} {"train_loss": -6.108011245727539, "global_step": 82800, "epoch": 1971} {"train_loss": -6.0240068435668945, "global_step": 82801, "epoch": 1971} {"train_loss": -6.056532382965088, "global_step": 82802, "epoch": 1971} {"train_loss": -6.075092315673828, "global_step": 82803, "epoch": 1971} {"train_loss": -6.182513236999512, "global_step": 82804, "epoch": 1971} {"train_loss": -6.1760969161987305, "global_step": 82805, "epoch": 1971} {"train_loss": -5.980837821960449, "global_step": 82806, "epoch": 1971} {"train_loss": -6.204736709594727, "global_step": 82807, "epoch": 1971} {"train_loss": -6.048314571380615, "global_step": 82808, "epoch": 1971} {"train_loss": -6.170152187347412, "global_step": 82809, "epoch": 1971} {"train_loss": -6.157848834991455, "global_step": 82810, "epoch": 1971} {"train_loss": -6.15065860748291, "global_step": 82811, "epoch": 1971} {"train_loss": -6.060702323913574, "global_step": 82812, "epoch": 1971} {"train_loss": -6.111527442932129, "global_step": 82813, "epoch": 1971} {"train_loss": -6.2168731689453125, "global_step": 82814, "epoch": 1971} {"train_loss": -6.242228984832764, "global_step": 82815, "epoch": 1971} {"train_loss": -6.1492109298706055, "global_step": 82816, "epoch": 1971} {"train_loss": -6.100080966949463, "global_step": 82817, "epoch": 1971} {"train_loss": -6.0988969802856445, "global_step": 82818, "epoch": 1971} {"train_loss": -6.079814434051514, "global_step": 82819, "epoch": 1971} {"train_loss": -6.110381126403809, "global_step": 82820, "epoch": 1971} {"train_loss": -6.152689456939697, "global_step": 82821, "epoch": 1971} {"train_loss": -6.197339057922363, "global_step": 82822, "epoch": 1971} {"train_loss": -6.117898464202881, "global_step": 82823, "epoch": 1971, "val_loss": 67664.2734375} {"train_loss": -6.254425048828125, "global_step": 82824, "epoch": 1972} {"train_loss": -6.04918098449707, "global_step": 82825, "epoch": 1972} {"train_loss": -6.155780792236328, "global_step": 82826, "epoch": 1972} {"train_loss": -6.163248538970947, "global_step": 82827, "epoch": 1972} {"train_loss": -6.136044025421143, "global_step": 82828, "epoch": 1972} {"train_loss": -6.266232490539551, "global_step": 82829, "epoch": 1972} {"train_loss": -6.207223892211914, "global_step": 82830, "epoch": 1972} {"train_loss": -6.110947132110596, "global_step": 82831, "epoch": 1972} {"train_loss": -6.253340721130371, "global_step": 82832, "epoch": 1972} {"train_loss": -6.171517372131348, "global_step": 82833, "epoch": 1972} {"train_loss": -6.122552394866943, "global_step": 82834, "epoch": 1972} {"train_loss": -6.084480285644531, "global_step": 82835, "epoch": 1972} {"train_loss": -6.194293975830078, "global_step": 82836, "epoch": 1972} {"train_loss": -6.18631649017334, "global_step": 82837, "epoch": 1972} {"train_loss": -6.140981674194336, "global_step": 82838, "epoch": 1972} {"train_loss": -6.205773830413818, "global_step": 82839, "epoch": 1972} {"train_loss": -6.175531387329102, "global_step": 82840, "epoch": 1972} {"train_loss": -6.158995151519775, "global_step": 82841, "epoch": 1972} {"train_loss": -6.104815483093262, "global_step": 82842, "epoch": 1972} {"train_loss": -6.169351100921631, "global_step": 82843, "epoch": 1972} {"train_loss": -6.224709510803223, "global_step": 82844, "epoch": 1972} {"train_loss": -6.009583473205566, "global_step": 82845, "epoch": 1972} {"train_loss": -6.1534881591796875, "global_step": 82846, "epoch": 1972} {"train_loss": -6.082704544067383, "global_step": 82847, "epoch": 1972} {"train_loss": -6.268575668334961, "global_step": 82848, "epoch": 1972} {"train_loss": -6.1409196853637695, "global_step": 82849, "epoch": 1972} {"train_loss": -6.216422080993652, "global_step": 82850, "epoch": 1972} {"train_loss": -6.19104528427124, "global_step": 82851, "epoch": 1972} {"train_loss": -6.257613182067871, "global_step": 82852, "epoch": 1972} {"train_loss": -6.182066917419434, "global_step": 82853, "epoch": 1972} {"train_loss": -6.143437385559082, "global_step": 82854, "epoch": 1972} {"train_loss": -6.191310882568359, "global_step": 82855, "epoch": 1972} {"train_loss": -6.237184524536133, "global_step": 82856, "epoch": 1972} {"train_loss": -6.215926170349121, "global_step": 82857, "epoch": 1972} {"train_loss": -6.197480201721191, "global_step": 82858, "epoch": 1972} {"train_loss": -6.242883682250977, "global_step": 82859, "epoch": 1972} {"train_loss": -6.209184646606445, "global_step": 82860, "epoch": 1972} {"train_loss": -6.175137519836426, "global_step": 82861, "epoch": 1972} {"train_loss": -6.156592845916748, "global_step": 82862, "epoch": 1972} {"train_loss": -6.1483001708984375, "global_step": 82863, "epoch": 1972} {"train_loss": -6.077724456787109, "global_step": 82864, "epoch": 1972} {"train_loss": -6.1722003391810825, "global_step": 82865, "epoch": 1972, "val_loss": 67672.71875} {"train_loss": -6.1422576904296875, "global_step": 82866, "epoch": 1973} {"train_loss": -6.255398750305176, "global_step": 82867, "epoch": 1973} {"train_loss": -6.174252510070801, "global_step": 82868, "epoch": 1973} {"train_loss": -6.303152084350586, "global_step": 82869, "epoch": 1973} {"train_loss": -6.233233451843262, "global_step": 82870, "epoch": 1973} {"train_loss": -6.237412452697754, "global_step": 82871, "epoch": 1973} {"train_loss": -6.172992706298828, "global_step": 82872, "epoch": 1973} {"train_loss": -6.05175256729126, "global_step": 82873, "epoch": 1973} {"train_loss": -6.206066608428955, "global_step": 82874, "epoch": 1973} {"train_loss": -6.146610736846924, "global_step": 82875, "epoch": 1973} {"train_loss": -6.155848503112793, "global_step": 82876, "epoch": 1973} {"train_loss": -6.214725494384766, "global_step": 82877, "epoch": 1973} {"train_loss": -6.166959762573242, "global_step": 82878, "epoch": 1973} {"train_loss": -6.179440021514893, "global_step": 82879, "epoch": 1973} {"train_loss": -6.096983909606934, "global_step": 82880, "epoch": 1973} {"train_loss": -6.145553112030029, "global_step": 82881, "epoch": 1973} {"train_loss": -6.201667308807373, "global_step": 82882, "epoch": 1973} {"train_loss": -6.1414794921875, "global_step": 82883, "epoch": 1973} {"train_loss": -6.122532844543457, "global_step": 82884, "epoch": 1973} {"train_loss": -6.170096397399902, "global_step": 82885, "epoch": 1973} {"train_loss": -6.2039384841918945, "global_step": 82886, "epoch": 1973} {"train_loss": -6.1492767333984375, "global_step": 82887, "epoch": 1973} {"train_loss": -6.097326278686523, "global_step": 82888, "epoch": 1973} {"train_loss": -6.122082710266113, "global_step": 82889, "epoch": 1973} {"train_loss": -6.172983169555664, "global_step": 82890, "epoch": 1973} {"train_loss": -6.100758075714111, "global_step": 82891, "epoch": 1973} {"train_loss": -6.024300575256348, "global_step": 82892, "epoch": 1973} {"train_loss": -6.166518688201904, "global_step": 82893, "epoch": 1973} {"train_loss": -6.002662181854248, "global_step": 82894, "epoch": 1973} {"train_loss": -6.183558464050293, "global_step": 82895, "epoch": 1973} {"train_loss": -6.167716979980469, "global_step": 82896, "epoch": 1973} {"train_loss": -6.192521095275879, "global_step": 82897, "epoch": 1973} {"train_loss": -6.111268520355225, "global_step": 82898, "epoch": 1973} {"train_loss": -6.105722427368164, "global_step": 82899, "epoch": 1973} {"train_loss": -6.209521770477295, "global_step": 82900, "epoch": 1973} {"train_loss": -6.102486610412598, "global_step": 82901, "epoch": 1973} {"train_loss": -6.141186714172363, "global_step": 82902, "epoch": 1973} {"train_loss": -6.1219892501831055, "global_step": 82903, "epoch": 1973} {"train_loss": -6.132088661193848, "global_step": 82904, "epoch": 1973} {"train_loss": -6.038237571716309, "global_step": 82905, "epoch": 1973} {"train_loss": -6.247662544250488, "global_step": 82906, "epoch": 1973} {"train_loss": -6.156159344173613, "global_step": 82907, "epoch": 1973, "val_loss": 67568.9140625} {"train_loss": -6.130063533782959, "global_step": 82908, "epoch": 1974} {"train_loss": -6.227633476257324, "global_step": 82909, "epoch": 1974} {"train_loss": -6.054670333862305, "global_step": 82910, "epoch": 1974} {"train_loss": -6.183686256408691, "global_step": 82911, "epoch": 1974} {"train_loss": -6.17623233795166, "global_step": 82912, "epoch": 1974} {"train_loss": -6.182895183563232, "global_step": 82913, "epoch": 1974} {"train_loss": -6.271512031555176, "global_step": 82914, "epoch": 1974} {"train_loss": -6.151869773864746, "global_step": 82915, "epoch": 1974} {"train_loss": -6.131402969360352, "global_step": 82916, "epoch": 1974} {"train_loss": -6.269457817077637, "global_step": 82917, "epoch": 1974} {"train_loss": -6.1912384033203125, "global_step": 82918, "epoch": 1974} {"train_loss": -6.206705093383789, "global_step": 82919, "epoch": 1974} {"train_loss": -6.0245513916015625, "global_step": 82920, "epoch": 1974} {"train_loss": -6.231535911560059, "global_step": 82921, "epoch": 1974} {"train_loss": -6.199067115783691, "global_step": 82922, "epoch": 1974} {"train_loss": -6.190320014953613, "global_step": 82923, "epoch": 1974} {"train_loss": -6.247383117675781, "global_step": 82924, "epoch": 1974} {"train_loss": -6.2003254890441895, "global_step": 82925, "epoch": 1974} {"train_loss": -6.171090126037598, "global_step": 82926, "epoch": 1974} {"train_loss": -6.289737701416016, "global_step": 82927, "epoch": 1974} {"train_loss": -6.257564544677734, "global_step": 82928, "epoch": 1974} {"train_loss": -6.126907825469971, "global_step": 82929, "epoch": 1974} {"train_loss": -6.248996257781982, "global_step": 82930, "epoch": 1974} {"train_loss": -6.291226387023926, "global_step": 82931, "epoch": 1974} {"train_loss": -6.044757843017578, "global_step": 82932, "epoch": 1974} {"train_loss": -6.0424299240112305, "global_step": 82933, "epoch": 1974} {"train_loss": -6.201157569885254, "global_step": 82934, "epoch": 1974} {"train_loss": -6.07725715637207, "global_step": 82935, "epoch": 1974} {"train_loss": -6.312429428100586, "global_step": 82936, "epoch": 1974} {"train_loss": -6.149349212646484, "global_step": 82937, "epoch": 1974} {"train_loss": -6.343921661376953, "global_step": 82938, "epoch": 1974} {"train_loss": -6.084879398345947, "global_step": 82939, "epoch": 1974} {"train_loss": -6.221372604370117, "global_step": 82940, "epoch": 1974} {"train_loss": -6.130223274230957, "global_step": 82941, "epoch": 1974} {"train_loss": -6.117142677307129, "global_step": 82942, "epoch": 1974} {"train_loss": -6.099232196807861, "global_step": 82943, "epoch": 1974} {"train_loss": -6.2274627685546875, "global_step": 82944, "epoch": 1974} {"train_loss": -6.0899858474731445, "global_step": 82945, "epoch": 1974} {"train_loss": -6.245548725128174, "global_step": 82946, "epoch": 1974} {"train_loss": -6.135036468505859, "global_step": 82947, "epoch": 1974} {"train_loss": -6.277690887451172, "global_step": 82948, "epoch": 1974} {"train_loss": -6.183577696482341, "global_step": 82949, "epoch": 1974, "val_loss": 67648.6796875} {"train_loss": -6.173102378845215, "global_step": 82950, "epoch": 1975} {"train_loss": -6.136346340179443, "global_step": 82951, "epoch": 1975} {"train_loss": -6.244935989379883, "global_step": 82952, "epoch": 1975} {"train_loss": -6.138272762298584, "global_step": 82953, "epoch": 1975} {"train_loss": -6.1738080978393555, "global_step": 82954, "epoch": 1975} {"train_loss": -6.158420085906982, "global_step": 82955, "epoch": 1975} {"train_loss": -6.162384986877441, "global_step": 82956, "epoch": 1975} {"train_loss": -6.1381707191467285, "global_step": 82957, "epoch": 1975} {"train_loss": -6.040135383605957, "global_step": 82958, "epoch": 1975} {"train_loss": -6.200194358825684, "global_step": 82959, "epoch": 1975} {"train_loss": -6.081225395202637, "global_step": 82960, "epoch": 1975} {"train_loss": -6.221162796020508, "global_step": 82961, "epoch": 1975} {"train_loss": -6.069133758544922, "global_step": 82962, "epoch": 1975} {"train_loss": -6.192094802856445, "global_step": 82963, "epoch": 1975} {"train_loss": -6.122594833374023, "global_step": 82964, "epoch": 1975} {"train_loss": -6.118770122528076, "global_step": 82965, "epoch": 1975} {"train_loss": -6.1732048988342285, "global_step": 82966, "epoch": 1975} {"train_loss": -5.994443893432617, "global_step": 82967, "epoch": 1975} {"train_loss": -6.034996509552002, "global_step": 82968, "epoch": 1975} {"train_loss": -6.110174179077148, "global_step": 82969, "epoch": 1975} {"train_loss": -6.037092685699463, "global_step": 82970, "epoch": 1975} {"train_loss": -5.976546764373779, "global_step": 82971, "epoch": 1975} {"train_loss": -5.943164825439453, "global_step": 82972, "epoch": 1975} {"train_loss": -5.89566707611084, "global_step": 82973, "epoch": 1975} {"train_loss": -6.15499210357666, "global_step": 82974, "epoch": 1975} {"train_loss": -5.899575233459473, "global_step": 82975, "epoch": 1975} {"train_loss": -6.0743207931518555, "global_step": 82976, "epoch": 1975} {"train_loss": -5.9668731689453125, "global_step": 82977, "epoch": 1975} {"train_loss": -6.113380432128906, "global_step": 82978, "epoch": 1975} {"train_loss": -6.169018268585205, "global_step": 82979, "epoch": 1975} {"train_loss": -5.9398908615112305, "global_step": 82980, "epoch": 1975} {"train_loss": -6.043265342712402, "global_step": 82981, "epoch": 1975} {"train_loss": -5.9683332443237305, "global_step": 82982, "epoch": 1975} {"train_loss": -6.151474952697754, "global_step": 82983, "epoch": 1975} {"train_loss": -6.099465370178223, "global_step": 82984, "epoch": 1975} {"train_loss": -6.196001052856445, "global_step": 82985, "epoch": 1975} {"train_loss": -6.1539201736450195, "global_step": 82986, "epoch": 1975} {"train_loss": -6.268675327301025, "global_step": 82987, "epoch": 1975} {"train_loss": -6.2034101486206055, "global_step": 82988, "epoch": 1975} {"train_loss": -6.0395708084106445, "global_step": 82989, "epoch": 1975} {"train_loss": -6.1262078285217285, "global_step": 82990, "epoch": 1975} {"train_loss": -6.101494834536598, "global_step": 82991, "epoch": 1975, "val_loss": 67678.5390625} {"train_loss": -6.204714298248291, "global_step": 82992, "epoch": 1976} {"train_loss": -6.111157417297363, "global_step": 82993, "epoch": 1976} {"train_loss": -6.152996063232422, "global_step": 82994, "epoch": 1976} {"train_loss": -6.1201066970825195, "global_step": 82995, "epoch": 1976} {"train_loss": -6.068304538726807, "global_step": 82996, "epoch": 1976} {"train_loss": -6.158779144287109, "global_step": 82997, "epoch": 1976} {"train_loss": -6.159088134765625, "global_step": 82998, "epoch": 1976} {"train_loss": -6.0794477462768555, "global_step": 82999, "epoch": 1976} {"train_loss": -6.201879978179932, "global_step": 83000, "epoch": 1976} {"train_loss": -6.122842788696289, "global_step": 83001, "epoch": 1976} {"train_loss": -6.109574317932129, "global_step": 83002, "epoch": 1976} {"train_loss": -6.26909875869751, "global_step": 83003, "epoch": 1976} {"train_loss": -6.268125057220459, "global_step": 83004, "epoch": 1976} {"train_loss": -6.096376419067383, "global_step": 83005, "epoch": 1976} {"train_loss": -6.155584335327148, "global_step": 83006, "epoch": 1976} {"train_loss": -6.111533164978027, "global_step": 83007, "epoch": 1976} {"train_loss": -6.13020133972168, "global_step": 83008, "epoch": 1976} {"train_loss": -6.170019149780273, "global_step": 83009, "epoch": 1976} {"train_loss": -6.123727321624756, "global_step": 83010, "epoch": 1976} {"train_loss": -6.179848670959473, "global_step": 83011, "epoch": 1976} {"train_loss": -6.151336669921875, "global_step": 83012, "epoch": 1976} {"train_loss": -6.191861152648926, "global_step": 83013, "epoch": 1976} {"train_loss": -6.20704460144043, "global_step": 83014, "epoch": 1976} {"train_loss": -6.144962787628174, "global_step": 83015, "epoch": 1976} {"train_loss": -6.171157360076904, "global_step": 83016, "epoch": 1976} {"train_loss": -6.228322505950928, "global_step": 83017, "epoch": 1976} {"train_loss": -6.0469279289245605, "global_step": 83018, "epoch": 1976} {"train_loss": -6.195488929748535, "global_step": 83019, "epoch": 1976} {"train_loss": -6.227002143859863, "global_step": 83020, "epoch": 1976} {"train_loss": -6.210568904876709, "global_step": 83021, "epoch": 1976} {"train_loss": -6.199938774108887, "global_step": 83022, "epoch": 1976} {"train_loss": -6.1539716720581055, "global_step": 83023, "epoch": 1976} {"train_loss": -6.124545097351074, "global_step": 83024, "epoch": 1976} {"train_loss": -6.058350086212158, "global_step": 83025, "epoch": 1976} {"train_loss": -6.239344120025635, "global_step": 83026, "epoch": 1976} {"train_loss": -6.220181941986084, "global_step": 83027, "epoch": 1976} {"train_loss": -6.264713287353516, "global_step": 83028, "epoch": 1976} {"train_loss": -6.210014820098877, "global_step": 83029, "epoch": 1976} {"train_loss": -6.201425552368164, "global_step": 83030, "epoch": 1976} {"train_loss": -6.221873760223389, "global_step": 83031, "epoch": 1976} {"train_loss": -6.096570014953613, "global_step": 83032, "epoch": 1976} {"train_loss": -6.1649260975065685, "global_step": 83033, "epoch": 1976, "val_loss": 67870.2109375} {"train_loss": -6.150865077972412, "global_step": 83034, "epoch": 1977} {"train_loss": -6.066642761230469, "global_step": 83035, "epoch": 1977} {"train_loss": -6.156261444091797, "global_step": 83036, "epoch": 1977} {"train_loss": -6.200338363647461, "global_step": 83037, "epoch": 1977} {"train_loss": -6.267084121704102, "global_step": 83038, "epoch": 1977} {"train_loss": -6.193940162658691, "global_step": 83039, "epoch": 1977} {"train_loss": -6.168766021728516, "global_step": 83040, "epoch": 1977} {"train_loss": -6.193108081817627, "global_step": 83041, "epoch": 1977} {"train_loss": -6.249157905578613, "global_step": 83042, "epoch": 1977} {"train_loss": -6.18726110458374, "global_step": 83043, "epoch": 1977} {"train_loss": -6.2079620361328125, "global_step": 83044, "epoch": 1977} {"train_loss": -6.173558235168457, "global_step": 83045, "epoch": 1977} {"train_loss": -6.220026016235352, "global_step": 83046, "epoch": 1977} {"train_loss": -6.222909450531006, "global_step": 83047, "epoch": 1977} {"train_loss": -6.14600944519043, "global_step": 83048, "epoch": 1977} {"train_loss": -6.357680320739746, "global_step": 83049, "epoch": 1977} {"train_loss": -6.237595081329346, "global_step": 83050, "epoch": 1977} {"train_loss": -6.27677583694458, "global_step": 83051, "epoch": 1977} {"train_loss": -6.179214954376221, "global_step": 83052, "epoch": 1977} {"train_loss": -6.289306640625, "global_step": 83053, "epoch": 1977} {"train_loss": -6.115409851074219, "global_step": 83054, "epoch": 1977} {"train_loss": -6.075151443481445, "global_step": 83055, "epoch": 1977} {"train_loss": -6.189521789550781, "global_step": 83056, "epoch": 1977} {"train_loss": -6.18304967880249, "global_step": 83057, "epoch": 1977} {"train_loss": -6.165310859680176, "global_step": 83058, "epoch": 1977} {"train_loss": -6.195248603820801, "global_step": 83059, "epoch": 1977} {"train_loss": -6.228989124298096, "global_step": 83060, "epoch": 1977} {"train_loss": -6.192344665527344, "global_step": 83061, "epoch": 1977} {"train_loss": -6.125722885131836, "global_step": 83062, "epoch": 1977} {"train_loss": -6.317810535430908, "global_step": 83063, "epoch": 1977} {"train_loss": -6.271818161010742, "global_step": 83064, "epoch": 1977} {"train_loss": -6.273462295532227, "global_step": 83065, "epoch": 1977} {"train_loss": -6.170300483703613, "global_step": 83066, "epoch": 1977} {"train_loss": -6.180627822875977, "global_step": 83067, "epoch": 1977} {"train_loss": -6.1322221755981445, "global_step": 83068, "epoch": 1977} {"train_loss": -6.18705940246582, "global_step": 83069, "epoch": 1977} {"train_loss": -6.093809127807617, "global_step": 83070, "epoch": 1977} {"train_loss": -6.214707374572754, "global_step": 83071, "epoch": 1977} {"train_loss": -6.243903636932373, "global_step": 83072, "epoch": 1977} {"train_loss": -6.117469310760498, "global_step": 83073, "epoch": 1977} {"train_loss": -6.259828567504883, "global_step": 83074, "epoch": 1977} {"train_loss": -6.1944262981414795, "global_step": 83075, "epoch": 1977, "val_loss": 67729.3515625} {"train_loss": -6.199042320251465, "global_step": 83076, "epoch": 1978} {"train_loss": -6.120088577270508, "global_step": 83077, "epoch": 1978} {"train_loss": -6.138978481292725, "global_step": 83078, "epoch": 1978} {"train_loss": -6.1117448806762695, "global_step": 83079, "epoch": 1978} {"train_loss": -6.140923023223877, "global_step": 83080, "epoch": 1978} {"train_loss": -6.109045505523682, "global_step": 83081, "epoch": 1978} {"train_loss": -6.18434476852417, "global_step": 83082, "epoch": 1978} {"train_loss": -6.090759754180908, "global_step": 83083, "epoch": 1978} {"train_loss": -6.135781288146973, "global_step": 83084, "epoch": 1978} {"train_loss": -6.140933990478516, "global_step": 83085, "epoch": 1978} {"train_loss": -6.094075679779053, "global_step": 83086, "epoch": 1978} {"train_loss": -6.051292896270752, "global_step": 83087, "epoch": 1978} {"train_loss": -6.153196334838867, "global_step": 83088, "epoch": 1978} {"train_loss": -6.183540344238281, "global_step": 83089, "epoch": 1978} {"train_loss": -6.141695976257324, "global_step": 83090, "epoch": 1978} {"train_loss": -6.044734001159668, "global_step": 83091, "epoch": 1978} {"train_loss": -6.1369829177856445, "global_step": 83092, "epoch": 1978} {"train_loss": -6.226629257202148, "global_step": 83093, "epoch": 1978} {"train_loss": -6.250528335571289, "global_step": 83094, "epoch": 1978} {"train_loss": -6.121115684509277, "global_step": 83095, "epoch": 1978} {"train_loss": -6.164968490600586, "global_step": 83096, "epoch": 1978} {"train_loss": -6.211847305297852, "global_step": 83097, "epoch": 1978} {"train_loss": -6.188932418823242, "global_step": 83098, "epoch": 1978} {"train_loss": -6.1473588943481445, "global_step": 83099, "epoch": 1978} {"train_loss": -6.253933906555176, "global_step": 83100, "epoch": 1978} {"train_loss": -6.190003395080566, "global_step": 83101, "epoch": 1978} {"train_loss": -6.159359931945801, "global_step": 83102, "epoch": 1978} {"train_loss": -6.255663871765137, "global_step": 83103, "epoch": 1978} {"train_loss": -6.0820722579956055, "global_step": 83104, "epoch": 1978} {"train_loss": -6.098318099975586, "global_step": 83105, "epoch": 1978} {"train_loss": -6.213587760925293, "global_step": 83106, "epoch": 1978} {"train_loss": -6.1961989402771, "global_step": 83107, "epoch": 1978} {"train_loss": -6.0914106369018555, "global_step": 83108, "epoch": 1978} {"train_loss": -6.217051982879639, "global_step": 83109, "epoch": 1978} {"train_loss": -6.096088886260986, "global_step": 83110, "epoch": 1978} {"train_loss": -6.103701591491699, "global_step": 83111, "epoch": 1978} {"train_loss": -6.260225772857666, "global_step": 83112, "epoch": 1978} {"train_loss": -6.0883402824401855, "global_step": 83113, "epoch": 1978} {"train_loss": -6.139588356018066, "global_step": 83114, "epoch": 1978} {"train_loss": -6.1277618408203125, "global_step": 83115, "epoch": 1978} {"train_loss": -6.0928544998168945, "global_step": 83116, "epoch": 1978} {"train_loss": -6.147280193510509, "global_step": 83117, "epoch": 1978, "val_loss": 67792.875} {"train_loss": -6.035165786743164, "global_step": 83118, "epoch": 1979} {"train_loss": -6.16367769241333, "global_step": 83119, "epoch": 1979} {"train_loss": -6.116127967834473, "global_step": 83120, "epoch": 1979} {"train_loss": -6.211162567138672, "global_step": 83121, "epoch": 1979} {"train_loss": -6.065473556518555, "global_step": 83122, "epoch": 1979} {"train_loss": -6.0968017578125, "global_step": 83123, "epoch": 1979} {"train_loss": -6.168656826019287, "global_step": 83124, "epoch": 1979} {"train_loss": -6.078090667724609, "global_step": 83125, "epoch": 1979} {"train_loss": -6.215743064880371, "global_step": 83126, "epoch": 1979} {"train_loss": -6.023821830749512, "global_step": 83127, "epoch": 1979} {"train_loss": -6.086699485778809, "global_step": 83128, "epoch": 1979} {"train_loss": -6.150298118591309, "global_step": 83129, "epoch": 1979} {"train_loss": -6.178239822387695, "global_step": 83130, "epoch": 1979} {"train_loss": -6.2056732177734375, "global_step": 83131, "epoch": 1979} {"train_loss": -6.209512710571289, "global_step": 83132, "epoch": 1979} {"train_loss": -6.175435543060303, "global_step": 83133, "epoch": 1979} {"train_loss": -6.257219314575195, "global_step": 83134, "epoch": 1979} {"train_loss": -6.195642948150635, "global_step": 83135, "epoch": 1979} {"train_loss": -6.281950950622559, "global_step": 83136, "epoch": 1979} {"train_loss": -6.183320999145508, "global_step": 83137, "epoch": 1979} {"train_loss": -6.16367244720459, "global_step": 83138, "epoch": 1979} {"train_loss": -6.133211135864258, "global_step": 83139, "epoch": 1979} {"train_loss": -6.163124084472656, "global_step": 83140, "epoch": 1979} {"train_loss": -6.232259750366211, "global_step": 83141, "epoch": 1979} {"train_loss": -6.142385482788086, "global_step": 83142, "epoch": 1979} {"train_loss": -6.295109748840332, "global_step": 83143, "epoch": 1979} {"train_loss": -6.161649703979492, "global_step": 83144, "epoch": 1979} {"train_loss": -6.134270668029785, "global_step": 83145, "epoch": 1979} {"train_loss": -6.169155597686768, "global_step": 83146, "epoch": 1979} {"train_loss": -6.129065990447998, "global_step": 83147, "epoch": 1979} {"train_loss": -5.9961748123168945, "global_step": 83148, "epoch": 1979} {"train_loss": -6.158809185028076, "global_step": 83149, "epoch": 1979} {"train_loss": -6.084107398986816, "global_step": 83150, "epoch": 1979} {"train_loss": -6.109709739685059, "global_step": 83151, "epoch": 1979} {"train_loss": -6.037268161773682, "global_step": 83152, "epoch": 1979} {"train_loss": -6.099373817443848, "global_step": 83153, "epoch": 1979} {"train_loss": -6.079233646392822, "global_step": 83154, "epoch": 1979} {"train_loss": -5.9609904289245605, "global_step": 83155, "epoch": 1979} {"train_loss": -6.276060104370117, "global_step": 83156, "epoch": 1979} {"train_loss": -6.1171112060546875, "global_step": 83157, "epoch": 1979} {"train_loss": -6.205480575561523, "global_step": 83158, "epoch": 1979} {"train_loss": -6.144958530153547, "global_step": 83159, "epoch": 1979, "val_loss": 68032.9140625} {"train_loss": -6.096569538116455, "global_step": 83160, "epoch": 1980} {"train_loss": -6.021163463592529, "global_step": 83161, "epoch": 1980} {"train_loss": -6.104934215545654, "global_step": 83162, "epoch": 1980} {"train_loss": -6.170539855957031, "global_step": 83163, "epoch": 1980} {"train_loss": -6.165066719055176, "global_step": 83164, "epoch": 1980} {"train_loss": -6.018963813781738, "global_step": 83165, "epoch": 1980} {"train_loss": -6.205368518829346, "global_step": 83166, "epoch": 1980} {"train_loss": -6.185210704803467, "global_step": 83167, "epoch": 1980} {"train_loss": -6.158323287963867, "global_step": 83168, "epoch": 1980} {"train_loss": -6.209098815917969, "global_step": 83169, "epoch": 1980} {"train_loss": -6.166144847869873, "global_step": 83170, "epoch": 1980} {"train_loss": -6.0375261306762695, "global_step": 83171, "epoch": 1980} {"train_loss": -6.134454727172852, "global_step": 83172, "epoch": 1980} {"train_loss": -6.119140625, "global_step": 83173, "epoch": 1980} {"train_loss": -6.252631664276123, "global_step": 83174, "epoch": 1980} {"train_loss": -6.103933334350586, "global_step": 83175, "epoch": 1980} {"train_loss": -6.174267768859863, "global_step": 83176, "epoch": 1980} {"train_loss": -6.1725568771362305, "global_step": 83177, "epoch": 1980} {"train_loss": -6.27769660949707, "global_step": 83178, "epoch": 1980} {"train_loss": -6.105593681335449, "global_step": 83179, "epoch": 1980} {"train_loss": -6.069624900817871, "global_step": 83180, "epoch": 1980} {"train_loss": -6.099702835083008, "global_step": 83181, "epoch": 1980} {"train_loss": -6.007817268371582, "global_step": 83182, "epoch": 1980} {"train_loss": -6.084744453430176, "global_step": 83183, "epoch": 1980} {"train_loss": -6.047730922698975, "global_step": 83184, "epoch": 1980} {"train_loss": -6.173086643218994, "global_step": 83185, "epoch": 1980} {"train_loss": -6.067509651184082, "global_step": 83186, "epoch": 1980} {"train_loss": -6.110476493835449, "global_step": 83187, "epoch": 1980} {"train_loss": -6.072174549102783, "global_step": 83188, "epoch": 1980} {"train_loss": -5.946482181549072, "global_step": 83189, "epoch": 1980} {"train_loss": -5.951706886291504, "global_step": 83190, "epoch": 1980} {"train_loss": -5.986147880554199, "global_step": 83191, "epoch": 1980} {"train_loss": -6.023791313171387, "global_step": 83192, "epoch": 1980} {"train_loss": -6.148911476135254, "global_step": 83193, "epoch": 1980} {"train_loss": -6.169004440307617, "global_step": 83194, "epoch": 1980} {"train_loss": -6.139016151428223, "global_step": 83195, "epoch": 1980} {"train_loss": -6.200615406036377, "global_step": 83196, "epoch": 1980} {"train_loss": -6.201934814453125, "global_step": 83197, "epoch": 1980} {"train_loss": -6.028014183044434, "global_step": 83198, "epoch": 1980} {"train_loss": -6.211404323577881, "global_step": 83199, "epoch": 1980} {"train_loss": -6.171483516693115, "global_step": 83200, "epoch": 1980} {"train_loss": -6.120428596224103, "global_step": 83201, "epoch": 1980, "val_loss": 68006.9296875} {"train_loss": -6.104565143585205, "global_step": 83202, "epoch": 1981} {"train_loss": -6.091012954711914, "global_step": 83203, "epoch": 1981} {"train_loss": -6.1526689529418945, "global_step": 83204, "epoch": 1981} {"train_loss": -6.200780868530273, "global_step": 83205, "epoch": 1981} {"train_loss": -6.13124418258667, "global_step": 83206, "epoch": 1981} {"train_loss": -6.118884086608887, "global_step": 83207, "epoch": 1981} {"train_loss": -6.193553924560547, "global_step": 83208, "epoch": 1981} {"train_loss": -6.205544471740723, "global_step": 83209, "epoch": 1981} {"train_loss": -6.207573413848877, "global_step": 83210, "epoch": 1981} {"train_loss": -6.109129428863525, "global_step": 83211, "epoch": 1981} {"train_loss": -6.104368686676025, "global_step": 83212, "epoch": 1981} {"train_loss": -6.220715522766113, "global_step": 83213, "epoch": 1981} {"train_loss": -6.136839866638184, "global_step": 83214, "epoch": 1981} {"train_loss": -6.124195098876953, "global_step": 83215, "epoch": 1981} {"train_loss": -6.2945966720581055, "global_step": 83216, "epoch": 1981} {"train_loss": -6.183357238769531, "global_step": 83217, "epoch": 1981} {"train_loss": -6.216127395629883, "global_step": 83218, "epoch": 1981} {"train_loss": -6.080751895904541, "global_step": 83219, "epoch": 1981} {"train_loss": -6.141982078552246, "global_step": 83220, "epoch": 1981} {"train_loss": -6.084869861602783, "global_step": 83221, "epoch": 1981} {"train_loss": -6.211552619934082, "global_step": 83222, "epoch": 1981} {"train_loss": -6.102108955383301, "global_step": 83223, "epoch": 1981} {"train_loss": -6.004276275634766, "global_step": 83224, "epoch": 1981} {"train_loss": -6.167228698730469, "global_step": 83225, "epoch": 1981} {"train_loss": -6.085850715637207, "global_step": 83226, "epoch": 1981} {"train_loss": -6.176874160766602, "global_step": 83227, "epoch": 1981} {"train_loss": -6.142722129821777, "global_step": 83228, "epoch": 1981} {"train_loss": -6.100928783416748, "global_step": 83229, "epoch": 1981} {"train_loss": -6.161245346069336, "global_step": 83230, "epoch": 1981} {"train_loss": -6.2171630859375, "global_step": 83231, "epoch": 1981} {"train_loss": -6.163823127746582, "global_step": 83232, "epoch": 1981} {"train_loss": -6.138556480407715, "global_step": 83233, "epoch": 1981} {"train_loss": -6.078784465789795, "global_step": 83234, "epoch": 1981} {"train_loss": -6.010612487792969, "global_step": 83235, "epoch": 1981} {"train_loss": -6.1898417472839355, "global_step": 83236, "epoch": 1981} {"train_loss": -6.263197898864746, "global_step": 83237, "epoch": 1981} {"train_loss": -6.2045063972473145, "global_step": 83238, "epoch": 1981} {"train_loss": -6.2091474533081055, "global_step": 83239, "epoch": 1981} {"train_loss": -6.092424392700195, "global_step": 83240, "epoch": 1981} {"train_loss": -6.104964256286621, "global_step": 83241, "epoch": 1981} {"train_loss": -6.278730869293213, "global_step": 83242, "epoch": 1981} {"train_loss": -6.151914869035993, "global_step": 83243, "epoch": 1981, "val_loss": 67869.5078125} {"train_loss": -6.272079944610596, "global_step": 83244, "epoch": 1982} {"train_loss": -6.1613264083862305, "global_step": 83245, "epoch": 1982} {"train_loss": -6.1356120109558105, "global_step": 83246, "epoch": 1982} {"train_loss": -6.199297904968262, "global_step": 83247, "epoch": 1982} {"train_loss": -6.160956382751465, "global_step": 83248, "epoch": 1982} {"train_loss": -6.203996658325195, "global_step": 83249, "epoch": 1982} {"train_loss": -6.194343566894531, "global_step": 83250, "epoch": 1982} {"train_loss": -6.203807353973389, "global_step": 83251, "epoch": 1982} {"train_loss": -6.091663837432861, "global_step": 83252, "epoch": 1982} {"train_loss": -6.172546863555908, "global_step": 83253, "epoch": 1982} {"train_loss": -6.160284042358398, "global_step": 83254, "epoch": 1982} {"train_loss": -6.078407287597656, "global_step": 83255, "epoch": 1982} {"train_loss": -6.048303127288818, "global_step": 83256, "epoch": 1982} {"train_loss": -6.25346565246582, "global_step": 83257, "epoch": 1982} {"train_loss": -5.975013732910156, "global_step": 83258, "epoch": 1982} {"train_loss": -6.031637191772461, "global_step": 83259, "epoch": 1982} {"train_loss": -6.070472717285156, "global_step": 83260, "epoch": 1982} {"train_loss": -6.094466209411621, "global_step": 83261, "epoch": 1982} {"train_loss": -6.140134811401367, "global_step": 83262, "epoch": 1982} {"train_loss": -6.1021504402160645, "global_step": 83263, "epoch": 1982} {"train_loss": -6.142365455627441, "global_step": 83264, "epoch": 1982} {"train_loss": -6.022815704345703, "global_step": 83265, "epoch": 1982} {"train_loss": -6.193441867828369, "global_step": 83266, "epoch": 1982} {"train_loss": -6.184420108795166, "global_step": 83267, "epoch": 1982} {"train_loss": -6.015119552612305, "global_step": 83268, "epoch": 1982} {"train_loss": -6.111701488494873, "global_step": 83269, "epoch": 1982} {"train_loss": -6.173785209655762, "global_step": 83270, "epoch": 1982} {"train_loss": -6.079702377319336, "global_step": 83271, "epoch": 1982} {"train_loss": -5.984678268432617, "global_step": 83272, "epoch": 1982} {"train_loss": -6.186743259429932, "global_step": 83273, "epoch": 1982} {"train_loss": -6.147686004638672, "global_step": 83274, "epoch": 1982} {"train_loss": -6.158653259277344, "global_step": 83275, "epoch": 1982} {"train_loss": -6.001168251037598, "global_step": 83276, "epoch": 1982} {"train_loss": -6.143314361572266, "global_step": 83277, "epoch": 1982} {"train_loss": -6.145752906799316, "global_step": 83278, "epoch": 1982} {"train_loss": -6.164886474609375, "global_step": 83279, "epoch": 1982} {"train_loss": -6.186828136444092, "global_step": 83280, "epoch": 1982} {"train_loss": -6.087641716003418, "global_step": 83281, "epoch": 1982} {"train_loss": -6.172908306121826, "global_step": 83282, "epoch": 1982} {"train_loss": -6.0489959716796875, "global_step": 83283, "epoch": 1982} {"train_loss": -6.20937442779541, "global_step": 83284, "epoch": 1982} {"train_loss": -6.129885821115403, "global_step": 83285, "epoch": 1982, "val_loss": 67762.8828125} {"train_loss": -6.198784828186035, "global_step": 83286, "epoch": 1983} {"train_loss": -6.239947319030762, "global_step": 83287, "epoch": 1983} {"train_loss": -6.168562889099121, "global_step": 83288, "epoch": 1983} {"train_loss": -6.23613977432251, "global_step": 83289, "epoch": 1983} {"train_loss": -6.196619510650635, "global_step": 83290, "epoch": 1983} {"train_loss": -6.188925743103027, "global_step": 83291, "epoch": 1983} {"train_loss": -6.318063259124756, "global_step": 83292, "epoch": 1983} {"train_loss": -6.173368453979492, "global_step": 83293, "epoch": 1983} {"train_loss": -6.212139129638672, "global_step": 83294, "epoch": 1983} {"train_loss": -6.087973594665527, "global_step": 83295, "epoch": 1983} {"train_loss": -6.082796096801758, "global_step": 83296, "epoch": 1983} {"train_loss": -6.074094772338867, "global_step": 83297, "epoch": 1983} {"train_loss": -6.153833389282227, "global_step": 83298, "epoch": 1983} {"train_loss": -6.198004245758057, "global_step": 83299, "epoch": 1983} {"train_loss": -6.1447553634643555, "global_step": 83300, "epoch": 1983} {"train_loss": -6.235430717468262, "global_step": 83301, "epoch": 1983} {"train_loss": -6.16229772567749, "global_step": 83302, "epoch": 1983} {"train_loss": -6.194852828979492, "global_step": 83303, "epoch": 1983} {"train_loss": -6.140290260314941, "global_step": 83304, "epoch": 1983} {"train_loss": -6.167603015899658, "global_step": 83305, "epoch": 1983} {"train_loss": -6.12769889831543, "global_step": 83306, "epoch": 1983} {"train_loss": -6.208794593811035, "global_step": 83307, "epoch": 1983} {"train_loss": -6.203463554382324, "global_step": 83308, "epoch": 1983} {"train_loss": -6.158426284790039, "global_step": 83309, "epoch": 1983} {"train_loss": -6.282054901123047, "global_step": 83310, "epoch": 1983} {"train_loss": -6.22096586227417, "global_step": 83311, "epoch": 1983} {"train_loss": -6.277406215667725, "global_step": 83312, "epoch": 1983} {"train_loss": -6.181480407714844, "global_step": 83313, "epoch": 1983} {"train_loss": -6.202527046203613, "global_step": 83314, "epoch": 1983} {"train_loss": -6.003384590148926, "global_step": 83315, "epoch": 1983} {"train_loss": -6.248648166656494, "global_step": 83316, "epoch": 1983} {"train_loss": -6.256206512451172, "global_step": 83317, "epoch": 1983} {"train_loss": -6.18890380859375, "global_step": 83318, "epoch": 1983} {"train_loss": -6.306562423706055, "global_step": 83319, "epoch": 1983} {"train_loss": -6.245410919189453, "global_step": 83320, "epoch": 1983} {"train_loss": -6.204007148742676, "global_step": 83321, "epoch": 1983} {"train_loss": -6.273723125457764, "global_step": 83322, "epoch": 1983} {"train_loss": -6.19474458694458, "global_step": 83323, "epoch": 1983} {"train_loss": -6.151377201080322, "global_step": 83324, "epoch": 1983} {"train_loss": -6.223079681396484, "global_step": 83325, "epoch": 1983} {"train_loss": -6.076182842254639, "global_step": 83326, "epoch": 1983} {"train_loss": -6.190373148236956, "global_step": 83327, "epoch": 1983, "val_loss": 67742.203125} {"train_loss": -6.133620738983154, "global_step": 83328, "epoch": 1984} {"train_loss": -6.245365142822266, "global_step": 83329, "epoch": 1984} {"train_loss": -6.105849266052246, "global_step": 83330, "epoch": 1984} {"train_loss": -6.255425453186035, "global_step": 83331, "epoch": 1984} {"train_loss": -6.224006652832031, "global_step": 83332, "epoch": 1984} {"train_loss": -6.142308235168457, "global_step": 83333, "epoch": 1984} {"train_loss": -6.278792381286621, "global_step": 83334, "epoch": 1984} {"train_loss": -6.088614463806152, "global_step": 83335, "epoch": 1984} {"train_loss": -6.237870216369629, "global_step": 83336, "epoch": 1984} {"train_loss": -6.207156181335449, "global_step": 83337, "epoch": 1984} {"train_loss": -6.182997226715088, "global_step": 83338, "epoch": 1984} {"train_loss": -6.184889793395996, "global_step": 83339, "epoch": 1984} {"train_loss": -6.259889602661133, "global_step": 83340, "epoch": 1984} {"train_loss": -6.143448829650879, "global_step": 83341, "epoch": 1984} {"train_loss": -6.028409957885742, "global_step": 83342, "epoch": 1984} {"train_loss": -6.15300178527832, "global_step": 83343, "epoch": 1984} {"train_loss": -6.023246765136719, "global_step": 83344, "epoch": 1984} {"train_loss": -6.182735443115234, "global_step": 83345, "epoch": 1984} {"train_loss": -6.173669338226318, "global_step": 83346, "epoch": 1984} {"train_loss": -6.120244979858398, "global_step": 83347, "epoch": 1984} {"train_loss": -6.005368232727051, "global_step": 83348, "epoch": 1984} {"train_loss": -6.211991310119629, "global_step": 83349, "epoch": 1984} {"train_loss": -6.150739669799805, "global_step": 83350, "epoch": 1984} {"train_loss": -6.138169765472412, "global_step": 83351, "epoch": 1984} {"train_loss": -6.135197639465332, "global_step": 83352, "epoch": 1984} {"train_loss": -6.271361351013184, "global_step": 83353, "epoch": 1984} {"train_loss": -6.205167770385742, "global_step": 83354, "epoch": 1984} {"train_loss": -6.228890895843506, "global_step": 83355, "epoch": 1984} {"train_loss": -6.051177978515625, "global_step": 83356, "epoch": 1984} {"train_loss": -6.154360294342041, "global_step": 83357, "epoch": 1984} {"train_loss": -6.1650614738464355, "global_step": 83358, "epoch": 1984} {"train_loss": -6.176945686340332, "global_step": 83359, "epoch": 1984} {"train_loss": -6.128126621246338, "global_step": 83360, "epoch": 1984} {"train_loss": -5.983689308166504, "global_step": 83361, "epoch": 1984} {"train_loss": -6.066462993621826, "global_step": 83362, "epoch": 1984} {"train_loss": -6.108280658721924, "global_step": 83363, "epoch": 1984} {"train_loss": -6.137172222137451, "global_step": 83364, "epoch": 1984} {"train_loss": -6.2273101806640625, "global_step": 83365, "epoch": 1984} {"train_loss": -6.228274822235107, "global_step": 83366, "epoch": 1984} {"train_loss": -6.249255180358887, "global_step": 83367, "epoch": 1984} {"train_loss": -6.127480983734131, "global_step": 83368, "epoch": 1984} {"train_loss": -6.159029086430867, "global_step": 83369, "epoch": 1984, "val_loss": 68020.6875} {"train_loss": -6.064414024353027, "global_step": 83370, "epoch": 1985} {"train_loss": -6.156158924102783, "global_step": 83371, "epoch": 1985} {"train_loss": -6.221590518951416, "global_step": 83372, "epoch": 1985} {"train_loss": -6.097247123718262, "global_step": 83373, "epoch": 1985} {"train_loss": -6.08052921295166, "global_step": 83374, "epoch": 1985} {"train_loss": -6.213870525360107, "global_step": 83375, "epoch": 1985} {"train_loss": -6.108579635620117, "global_step": 83376, "epoch": 1985} {"train_loss": -6.030804634094238, "global_step": 83377, "epoch": 1985} {"train_loss": -6.211804389953613, "global_step": 83378, "epoch": 1985} {"train_loss": -6.149500370025635, "global_step": 83379, "epoch": 1985} {"train_loss": -6.13623046875, "global_step": 83380, "epoch": 1985} {"train_loss": -6.271585941314697, "global_step": 83381, "epoch": 1985} {"train_loss": -6.1785101890563965, "global_step": 83382, "epoch": 1985} {"train_loss": -6.222073554992676, "global_step": 83383, "epoch": 1985} {"train_loss": -6.1078081130981445, "global_step": 83384, "epoch": 1985} {"train_loss": -6.146193504333496, "global_step": 83385, "epoch": 1985} {"train_loss": -6.190915107727051, "global_step": 83386, "epoch": 1985} {"train_loss": -6.3025054931640625, "global_step": 83387, "epoch": 1985} {"train_loss": -6.232357025146484, "global_step": 83388, "epoch": 1985} {"train_loss": -6.205246925354004, "global_step": 83389, "epoch": 1985} {"train_loss": -6.227583408355713, "global_step": 83390, "epoch": 1985} {"train_loss": -6.136477947235107, "global_step": 83391, "epoch": 1985} {"train_loss": -6.325100898742676, "global_step": 83392, "epoch": 1985} {"train_loss": -6.157331943511963, "global_step": 83393, "epoch": 1985} {"train_loss": -6.075619697570801, "global_step": 83394, "epoch": 1985} {"train_loss": -6.144433975219727, "global_step": 83395, "epoch": 1985} {"train_loss": -6.22850227355957, "global_step": 83396, "epoch": 1985} {"train_loss": -6.213431358337402, "global_step": 83397, "epoch": 1985} {"train_loss": -6.142730236053467, "global_step": 83398, "epoch": 1985} {"train_loss": -6.163895606994629, "global_step": 83399, "epoch": 1985} {"train_loss": -6.315556526184082, "global_step": 83400, "epoch": 1985} {"train_loss": -6.160731792449951, "global_step": 83401, "epoch": 1985} {"train_loss": -6.196384429931641, "global_step": 83402, "epoch": 1985} {"train_loss": -6.177785396575928, "global_step": 83403, "epoch": 1985} {"train_loss": -6.284765720367432, "global_step": 83404, "epoch": 1985} {"train_loss": -6.1171417236328125, "global_step": 83405, "epoch": 1985} {"train_loss": -6.116540431976318, "global_step": 83406, "epoch": 1985} {"train_loss": -6.115683555603027, "global_step": 83407, "epoch": 1985} {"train_loss": -6.071128845214844, "global_step": 83408, "epoch": 1985} {"train_loss": -6.207169532775879, "global_step": 83409, "epoch": 1985} {"train_loss": -6.247609615325928, "global_step": 83410, "epoch": 1985} {"train_loss": -6.171469143458775, "global_step": 83411, "epoch": 1985, "val_loss": 68028.875} {"train_loss": -6.097287654876709, "global_step": 83412, "epoch": 1986} {"train_loss": -6.106534004211426, "global_step": 83413, "epoch": 1986} {"train_loss": -6.0891523361206055, "global_step": 83414, "epoch": 1986} {"train_loss": -6.070014476776123, "global_step": 83415, "epoch": 1986} {"train_loss": -6.115983009338379, "global_step": 83416, "epoch": 1986} {"train_loss": -6.103506088256836, "global_step": 83417, "epoch": 1986} {"train_loss": -6.162731170654297, "global_step": 83418, "epoch": 1986} {"train_loss": -6.226622581481934, "global_step": 83419, "epoch": 1986} {"train_loss": -6.190305709838867, "global_step": 83420, "epoch": 1986} {"train_loss": -6.042499542236328, "global_step": 83421, "epoch": 1986} {"train_loss": -6.159000396728516, "global_step": 83422, "epoch": 1986} {"train_loss": -6.039973735809326, "global_step": 83423, "epoch": 1986} {"train_loss": -6.105313301086426, "global_step": 83424, "epoch": 1986} {"train_loss": -6.135190010070801, "global_step": 83425, "epoch": 1986} {"train_loss": -6.210118293762207, "global_step": 83426, "epoch": 1986} {"train_loss": -6.039990425109863, "global_step": 83427, "epoch": 1986} {"train_loss": -6.041182518005371, "global_step": 83428, "epoch": 1986} {"train_loss": -6.208010673522949, "global_step": 83429, "epoch": 1986} {"train_loss": -6.305671691894531, "global_step": 83430, "epoch": 1986} {"train_loss": -6.105471134185791, "global_step": 83431, "epoch": 1986} {"train_loss": -6.1179914474487305, "global_step": 83432, "epoch": 1986} {"train_loss": -6.081295967102051, "global_step": 83433, "epoch": 1986} {"train_loss": -6.1172776222229, "global_step": 83434, "epoch": 1986} {"train_loss": -6.1458940505981445, "global_step": 83435, "epoch": 1986} {"train_loss": -6.138803482055664, "global_step": 83436, "epoch": 1986} {"train_loss": -6.125499725341797, "global_step": 83437, "epoch": 1986} {"train_loss": -6.103700160980225, "global_step": 83438, "epoch": 1986} {"train_loss": -6.259535789489746, "global_step": 83439, "epoch": 1986} {"train_loss": -6.216071605682373, "global_step": 83440, "epoch": 1986} {"train_loss": -6.2206573486328125, "global_step": 83441, "epoch": 1986} {"train_loss": -6.206233978271484, "global_step": 83442, "epoch": 1986} {"train_loss": -6.339681148529053, "global_step": 83443, "epoch": 1986} {"train_loss": -6.0166730880737305, "global_step": 83444, "epoch": 1986} {"train_loss": -6.185992240905762, "global_step": 83445, "epoch": 1986} {"train_loss": -6.0705790519714355, "global_step": 83446, "epoch": 1986} {"train_loss": -6.086147308349609, "global_step": 83447, "epoch": 1986} {"train_loss": -6.206171989440918, "global_step": 83448, "epoch": 1986} {"train_loss": -6.151827335357666, "global_step": 83449, "epoch": 1986} {"train_loss": -6.2489142417907715, "global_step": 83450, "epoch": 1986} {"train_loss": -6.241025447845459, "global_step": 83451, "epoch": 1986} {"train_loss": -6.120573997497559, "global_step": 83452, "epoch": 1986} {"train_loss": -6.14753600529262, "global_step": 83453, "epoch": 1986, "val_loss": 67749.328125} {"train_loss": -6.188835144042969, "global_step": 83454, "epoch": 1987} {"train_loss": -6.177505970001221, "global_step": 83455, "epoch": 1987} {"train_loss": -6.233068466186523, "global_step": 83456, "epoch": 1987} {"train_loss": -6.0924224853515625, "global_step": 83457, "epoch": 1987} {"train_loss": -6.170856475830078, "global_step": 83458, "epoch": 1987} {"train_loss": -6.244147300720215, "global_step": 83459, "epoch": 1987} {"train_loss": -6.199165344238281, "global_step": 83460, "epoch": 1987} {"train_loss": -6.101531028747559, "global_step": 83461, "epoch": 1987} {"train_loss": -6.008588790893555, "global_step": 83462, "epoch": 1987} {"train_loss": -6.17594051361084, "global_step": 83463, "epoch": 1987} {"train_loss": -6.162642478942871, "global_step": 83464, "epoch": 1987} {"train_loss": -6.215333938598633, "global_step": 83465, "epoch": 1987} {"train_loss": -6.127865791320801, "global_step": 83466, "epoch": 1987} {"train_loss": -6.183307647705078, "global_step": 83467, "epoch": 1987} {"train_loss": -6.133059978485107, "global_step": 83468, "epoch": 1987} {"train_loss": -6.240789890289307, "global_step": 83469, "epoch": 1987} {"train_loss": -6.191005706787109, "global_step": 83470, "epoch": 1987} {"train_loss": -6.074044227600098, "global_step": 83471, "epoch": 1987} {"train_loss": -6.142596244812012, "global_step": 83472, "epoch": 1987} {"train_loss": -6.268191814422607, "global_step": 83473, "epoch": 1987} {"train_loss": -6.078685760498047, "global_step": 83474, "epoch": 1987} {"train_loss": -6.30268669128418, "global_step": 83475, "epoch": 1987} {"train_loss": -6.2661967277526855, "global_step": 83476, "epoch": 1987} {"train_loss": -6.27161979675293, "global_step": 83477, "epoch": 1987} {"train_loss": -6.202308654785156, "global_step": 83478, "epoch": 1987} {"train_loss": -6.21903133392334, "global_step": 83479, "epoch": 1987} {"train_loss": -5.999207496643066, "global_step": 83480, "epoch": 1987} {"train_loss": -6.131787300109863, "global_step": 83481, "epoch": 1987} {"train_loss": -6.0627875328063965, "global_step": 83482, "epoch": 1987} {"train_loss": -6.130239486694336, "global_step": 83483, "epoch": 1987} {"train_loss": -6.100604057312012, "global_step": 83484, "epoch": 1987} {"train_loss": -6.143624305725098, "global_step": 83485, "epoch": 1987} {"train_loss": -6.068511009216309, "global_step": 83486, "epoch": 1987} {"train_loss": -6.159548759460449, "global_step": 83487, "epoch": 1987} {"train_loss": -6.18344783782959, "global_step": 83488, "epoch": 1987} {"train_loss": -6.221283912658691, "global_step": 83489, "epoch": 1987} {"train_loss": -6.164379596710205, "global_step": 83490, "epoch": 1987} {"train_loss": -6.165834426879883, "global_step": 83491, "epoch": 1987} {"train_loss": -6.186007499694824, "global_step": 83492, "epoch": 1987} {"train_loss": -6.035067081451416, "global_step": 83493, "epoch": 1987} {"train_loss": -6.144637107849121, "global_step": 83494, "epoch": 1987} {"train_loss": -6.162699937820435, "global_step": 83495, "epoch": 1987, "val_loss": 67843.8046875} {"train_loss": -6.168652534484863, "global_step": 83496, "epoch": 1988} {"train_loss": -6.080376625061035, "global_step": 83497, "epoch": 1988} {"train_loss": -6.17903995513916, "global_step": 83498, "epoch": 1988} {"train_loss": -6.148467063903809, "global_step": 83499, "epoch": 1988} {"train_loss": -6.154031276702881, "global_step": 83500, "epoch": 1988} {"train_loss": -6.161418437957764, "global_step": 83501, "epoch": 1988} {"train_loss": -6.258891582489014, "global_step": 83502, "epoch": 1988} {"train_loss": -6.265377044677734, "global_step": 83503, "epoch": 1988} {"train_loss": -6.264077186584473, "global_step": 83504, "epoch": 1988} {"train_loss": -6.214966297149658, "global_step": 83505, "epoch": 1988} {"train_loss": -6.242959022521973, "global_step": 83506, "epoch": 1988} {"train_loss": -6.170481204986572, "global_step": 83507, "epoch": 1988} {"train_loss": -6.268023490905762, "global_step": 83508, "epoch": 1988} {"train_loss": -6.123629570007324, "global_step": 83509, "epoch": 1988} {"train_loss": -6.083216667175293, "global_step": 83510, "epoch": 1988} {"train_loss": -6.242636680603027, "global_step": 83511, "epoch": 1988} {"train_loss": -6.05641508102417, "global_step": 83512, "epoch": 1988} {"train_loss": -6.172990798950195, "global_step": 83513, "epoch": 1988} {"train_loss": -6.185186386108398, "global_step": 83514, "epoch": 1988} {"train_loss": -6.176478385925293, "global_step": 83515, "epoch": 1988} {"train_loss": -6.255049705505371, "global_step": 83516, "epoch": 1988} {"train_loss": -6.189610958099365, "global_step": 83517, "epoch": 1988} {"train_loss": -6.120721817016602, "global_step": 83518, "epoch": 1988} {"train_loss": -6.162102222442627, "global_step": 83519, "epoch": 1988} {"train_loss": -6.14234733581543, "global_step": 83520, "epoch": 1988} {"train_loss": -6.1962456703186035, "global_step": 83521, "epoch": 1988} {"train_loss": -6.137175559997559, "global_step": 83522, "epoch": 1988} {"train_loss": -6.1131463050842285, "global_step": 83523, "epoch": 1988} {"train_loss": -6.165295124053955, "global_step": 83524, "epoch": 1988} {"train_loss": -6.146572113037109, "global_step": 83525, "epoch": 1988} {"train_loss": -6.10956335067749, "global_step": 83526, "epoch": 1988} {"train_loss": -6.1773481369018555, "global_step": 83527, "epoch": 1988} {"train_loss": -6.1224493980407715, "global_step": 83528, "epoch": 1988} {"train_loss": -6.261052131652832, "global_step": 83529, "epoch": 1988} {"train_loss": -6.212925910949707, "global_step": 83530, "epoch": 1988} {"train_loss": -6.19889497756958, "global_step": 83531, "epoch": 1988} {"train_loss": -6.217451572418213, "global_step": 83532, "epoch": 1988} {"train_loss": -6.279548168182373, "global_step": 83533, "epoch": 1988} {"train_loss": -6.298775672912598, "global_step": 83534, "epoch": 1988} {"train_loss": -6.2037882804870605, "global_step": 83535, "epoch": 1988} {"train_loss": -6.203049659729004, "global_step": 83536, "epoch": 1988} {"train_loss": -6.183338051750546, "global_step": 83537, "epoch": 1988, "val_loss": 67743.6015625} {"train_loss": -6.223827362060547, "global_step": 83538, "epoch": 1989} {"train_loss": -6.123577117919922, "global_step": 83539, "epoch": 1989} {"train_loss": -6.157075881958008, "global_step": 83540, "epoch": 1989} {"train_loss": -6.212048530578613, "global_step": 83541, "epoch": 1989} {"train_loss": -6.073159694671631, "global_step": 83542, "epoch": 1989} {"train_loss": -6.161421775817871, "global_step": 83543, "epoch": 1989} {"train_loss": -6.2147932052612305, "global_step": 83544, "epoch": 1989} {"train_loss": -6.046115398406982, "global_step": 83545, "epoch": 1989} {"train_loss": -6.251494407653809, "global_step": 83546, "epoch": 1989} {"train_loss": -6.159924507141113, "global_step": 83547, "epoch": 1989} {"train_loss": -6.154542922973633, "global_step": 83548, "epoch": 1989} {"train_loss": -6.2281599044799805, "global_step": 83549, "epoch": 1989} {"train_loss": -6.113208770751953, "global_step": 83550, "epoch": 1989} {"train_loss": -6.302830219268799, "global_step": 83551, "epoch": 1989} {"train_loss": -6.155908584594727, "global_step": 83552, "epoch": 1989} {"train_loss": -6.183661460876465, "global_step": 83553, "epoch": 1989} {"train_loss": -6.184673309326172, "global_step": 83554, "epoch": 1989} {"train_loss": -6.172573089599609, "global_step": 83555, "epoch": 1989} {"train_loss": -6.159067153930664, "global_step": 83556, "epoch": 1989} {"train_loss": -6.022615432739258, "global_step": 83557, "epoch": 1989} {"train_loss": -6.125125408172607, "global_step": 83558, "epoch": 1989} {"train_loss": -6.214461326599121, "global_step": 83559, "epoch": 1989} {"train_loss": -6.157147407531738, "global_step": 83560, "epoch": 1989} {"train_loss": -6.211618900299072, "global_step": 83561, "epoch": 1989} {"train_loss": -6.177531719207764, "global_step": 83562, "epoch": 1989} {"train_loss": -6.2110395431518555, "global_step": 83563, "epoch": 1989} {"train_loss": -6.164290428161621, "global_step": 83564, "epoch": 1989} {"train_loss": -6.219208240509033, "global_step": 83565, "epoch": 1989} {"train_loss": -6.19229793548584, "global_step": 83566, "epoch": 1989} {"train_loss": -6.2436203956604, "global_step": 83567, "epoch": 1989} {"train_loss": -6.183986186981201, "global_step": 83568, "epoch": 1989} {"train_loss": -6.1919779777526855, "global_step": 83569, "epoch": 1989} {"train_loss": -6.208234786987305, "global_step": 83570, "epoch": 1989} {"train_loss": -6.202558517456055, "global_step": 83571, "epoch": 1989} {"train_loss": -6.0576372146606445, "global_step": 83572, "epoch": 1989} {"train_loss": -6.229825973510742, "global_step": 83573, "epoch": 1989} {"train_loss": -6.293540000915527, "global_step": 83574, "epoch": 1989} {"train_loss": -6.102151870727539, "global_step": 83575, "epoch": 1989} {"train_loss": -6.128537654876709, "global_step": 83576, "epoch": 1989} {"train_loss": -6.077847480773926, "global_step": 83577, "epoch": 1989} {"train_loss": -6.197984218597412, "global_step": 83578, "epoch": 1989} {"train_loss": -6.17147539910816, "global_step": 83579, "epoch": 1989, "val_loss": 67981.3203125} {"train_loss": -6.052045822143555, "global_step": 83580, "epoch": 1990} {"train_loss": -6.1546311378479, "global_step": 83581, "epoch": 1990} {"train_loss": -6.131973743438721, "global_step": 83582, "epoch": 1990} {"train_loss": -6.231316089630127, "global_step": 83583, "epoch": 1990} {"train_loss": -6.100116729736328, "global_step": 83584, "epoch": 1990} {"train_loss": -6.079165458679199, "global_step": 83585, "epoch": 1990} {"train_loss": -6.14420223236084, "global_step": 83586, "epoch": 1990} {"train_loss": -6.266526222229004, "global_step": 83587, "epoch": 1990} {"train_loss": -6.277412414550781, "global_step": 83588, "epoch": 1990} {"train_loss": -6.129913330078125, "global_step": 83589, "epoch": 1990} {"train_loss": -6.176579475402832, "global_step": 83590, "epoch": 1990} {"train_loss": -6.082940578460693, "global_step": 83591, "epoch": 1990} {"train_loss": -6.044099807739258, "global_step": 83592, "epoch": 1990} {"train_loss": -6.104006290435791, "global_step": 83593, "epoch": 1990} {"train_loss": -5.83059024810791, "global_step": 83594, "epoch": 1990} {"train_loss": -6.00789737701416, "global_step": 83595, "epoch": 1990} {"train_loss": -6.158605098724365, "global_step": 83596, "epoch": 1990} {"train_loss": -6.027168273925781, "global_step": 83597, "epoch": 1990} {"train_loss": -6.202826499938965, "global_step": 83598, "epoch": 1990} {"train_loss": -5.922493934631348, "global_step": 83599, "epoch": 1990} {"train_loss": -6.256646156311035, "global_step": 83600, "epoch": 1990} {"train_loss": -6.055049419403076, "global_step": 83601, "epoch": 1990} {"train_loss": -6.155947685241699, "global_step": 83602, "epoch": 1990} {"train_loss": -6.080153465270996, "global_step": 83603, "epoch": 1990} {"train_loss": -6.108274459838867, "global_step": 83604, "epoch": 1990} {"train_loss": -6.198020935058594, "global_step": 83605, "epoch": 1990} {"train_loss": -6.0115766525268555, "global_step": 83606, "epoch": 1990} {"train_loss": -5.977133750915527, "global_step": 83607, "epoch": 1990} {"train_loss": -6.083498001098633, "global_step": 83608, "epoch": 1990} {"train_loss": -5.945366859436035, "global_step": 83609, "epoch": 1990} {"train_loss": -6.113972187042236, "global_step": 83610, "epoch": 1990} {"train_loss": -6.156611919403076, "global_step": 83611, "epoch": 1990} {"train_loss": -6.156251907348633, "global_step": 83612, "epoch": 1990} {"train_loss": -6.051091194152832, "global_step": 83613, "epoch": 1990} {"train_loss": -6.011325359344482, "global_step": 83614, "epoch": 1990} {"train_loss": -6.198281288146973, "global_step": 83615, "epoch": 1990} {"train_loss": -6.22138786315918, "global_step": 83616, "epoch": 1990} {"train_loss": -6.1266703605651855, "global_step": 83617, "epoch": 1990} {"train_loss": -6.1330413818359375, "global_step": 83618, "epoch": 1990} {"train_loss": -6.178624153137207, "global_step": 83619, "epoch": 1990} {"train_loss": -6.112750053405762, "global_step": 83620, "epoch": 1990} {"train_loss": -6.110946291968936, "global_step": 83621, "epoch": 1990, "val_loss": 67795.3984375} {"train_loss": -6.2051873207092285, "global_step": 83622, "epoch": 1991} {"train_loss": -6.16267204284668, "global_step": 83623, "epoch": 1991} {"train_loss": -6.23225212097168, "global_step": 83624, "epoch": 1991} {"train_loss": -6.136707782745361, "global_step": 83625, "epoch": 1991} {"train_loss": -6.2005133628845215, "global_step": 83626, "epoch": 1991} {"train_loss": -6.147253036499023, "global_step": 83627, "epoch": 1991} {"train_loss": -6.163763046264648, "global_step": 83628, "epoch": 1991} {"train_loss": -6.215820789337158, "global_step": 83629, "epoch": 1991} {"train_loss": -6.178530693054199, "global_step": 83630, "epoch": 1991} {"train_loss": -6.123429298400879, "global_step": 83631, "epoch": 1991} {"train_loss": -6.1427717208862305, "global_step": 83632, "epoch": 1991} {"train_loss": -6.196719646453857, "global_step": 83633, "epoch": 1991} {"train_loss": -6.159893035888672, "global_step": 83634, "epoch": 1991} {"train_loss": -6.081029415130615, "global_step": 83635, "epoch": 1991} {"train_loss": -6.207307815551758, "global_step": 83636, "epoch": 1991} {"train_loss": -6.140130519866943, "global_step": 83637, "epoch": 1991} {"train_loss": -6.262312889099121, "global_step": 83638, "epoch": 1991} {"train_loss": -6.078401565551758, "global_step": 83639, "epoch": 1991} {"train_loss": -6.3380045890808105, "global_step": 83640, "epoch": 1991} {"train_loss": -6.050543785095215, "global_step": 83641, "epoch": 1991} {"train_loss": -6.182520866394043, "global_step": 83642, "epoch": 1991} {"train_loss": -6.102837085723877, "global_step": 83643, "epoch": 1991} {"train_loss": -6.079916477203369, "global_step": 83644, "epoch": 1991} {"train_loss": -6.19033670425415, "global_step": 83645, "epoch": 1991} {"train_loss": -6.2345757484436035, "global_step": 83646, "epoch": 1991} {"train_loss": -6.102913856506348, "global_step": 83647, "epoch": 1991} {"train_loss": -6.199603080749512, "global_step": 83648, "epoch": 1991} {"train_loss": -6.103874683380127, "global_step": 83649, "epoch": 1991} {"train_loss": -6.183282852172852, "global_step": 83650, "epoch": 1991} {"train_loss": -6.118778228759766, "global_step": 83651, "epoch": 1991} {"train_loss": -6.2109527587890625, "global_step": 83652, "epoch": 1991} {"train_loss": -6.191658020019531, "global_step": 83653, "epoch": 1991} {"train_loss": -6.19904899597168, "global_step": 83654, "epoch": 1991} {"train_loss": -6.15238094329834, "global_step": 83655, "epoch": 1991} {"train_loss": -6.139199256896973, "global_step": 83656, "epoch": 1991} {"train_loss": -6.175546169281006, "global_step": 83657, "epoch": 1991} {"train_loss": -6.271508693695068, "global_step": 83658, "epoch": 1991} {"train_loss": -6.1527323722839355, "global_step": 83659, "epoch": 1991} {"train_loss": -6.186586856842041, "global_step": 83660, "epoch": 1991} {"train_loss": -6.134622573852539, "global_step": 83661, "epoch": 1991} {"train_loss": -6.203803539276123, "global_step": 83662, "epoch": 1991} {"train_loss": -6.16851578439985, "global_step": 83663, "epoch": 1991, "val_loss": 67724.4609375} {"train_loss": -6.240085601806641, "global_step": 83664, "epoch": 1992} {"train_loss": -6.12237548828125, "global_step": 83665, "epoch": 1992} {"train_loss": -6.15501594543457, "global_step": 83666, "epoch": 1992} {"train_loss": -6.229550838470459, "global_step": 83667, "epoch": 1992} {"train_loss": -6.403587341308594, "global_step": 83668, "epoch": 1992} {"train_loss": -6.29705810546875, "global_step": 83669, "epoch": 1992} {"train_loss": -6.239532470703125, "global_step": 83670, "epoch": 1992} {"train_loss": -6.313709735870361, "global_step": 83671, "epoch": 1992} {"train_loss": -6.194790363311768, "global_step": 83672, "epoch": 1992} {"train_loss": -6.2435712814331055, "global_step": 83673, "epoch": 1992} {"train_loss": -6.102787971496582, "global_step": 83674, "epoch": 1992} {"train_loss": -6.19465970993042, "global_step": 83675, "epoch": 1992} {"train_loss": -6.224802494049072, "global_step": 83676, "epoch": 1992} {"train_loss": -6.179038047790527, "global_step": 83677, "epoch": 1992} {"train_loss": -6.282351016998291, "global_step": 83678, "epoch": 1992} {"train_loss": -6.163160800933838, "global_step": 83679, "epoch": 1992} {"train_loss": -6.180659770965576, "global_step": 83680, "epoch": 1992} {"train_loss": -6.207414627075195, "global_step": 83681, "epoch": 1992} {"train_loss": -6.109528541564941, "global_step": 83682, "epoch": 1992} {"train_loss": -6.107507705688477, "global_step": 83683, "epoch": 1992} {"train_loss": -6.189745903015137, "global_step": 83684, "epoch": 1992} {"train_loss": -6.250376224517822, "global_step": 83685, "epoch": 1992} {"train_loss": -6.164965629577637, "global_step": 83686, "epoch": 1992} {"train_loss": -6.104583740234375, "global_step": 83687, "epoch": 1992} {"train_loss": -6.179964065551758, "global_step": 83688, "epoch": 1992} {"train_loss": -6.098504066467285, "global_step": 83689, "epoch": 1992} {"train_loss": -6.060959815979004, "global_step": 83690, "epoch": 1992} {"train_loss": -6.208894729614258, "global_step": 83691, "epoch": 1992} {"train_loss": -6.1000752449035645, "global_step": 83692, "epoch": 1992} {"train_loss": -6.26486873626709, "global_step": 83693, "epoch": 1992} {"train_loss": -6.054141044616699, "global_step": 83694, "epoch": 1992} {"train_loss": -6.115626811981201, "global_step": 83695, "epoch": 1992} {"train_loss": -6.360419750213623, "global_step": 83696, "epoch": 1992} {"train_loss": -6.122696399688721, "global_step": 83697, "epoch": 1992} {"train_loss": -6.096051216125488, "global_step": 83698, "epoch": 1992} {"train_loss": -6.1159467697143555, "global_step": 83699, "epoch": 1992} {"train_loss": -6.053992748260498, "global_step": 83700, "epoch": 1992} {"train_loss": -6.180647850036621, "global_step": 83701, "epoch": 1992} {"train_loss": -6.1483635902404785, "global_step": 83702, "epoch": 1992} {"train_loss": -6.213059425354004, "global_step": 83703, "epoch": 1992} {"train_loss": -6.105997085571289, "global_step": 83704, "epoch": 1992} {"train_loss": -6.179619437172299, "global_step": 83705, "epoch": 1992, "val_loss": 67696.96875} {"train_loss": -6.123668670654297, "global_step": 83706, "epoch": 1993} {"train_loss": -6.183815002441406, "global_step": 83707, "epoch": 1993} {"train_loss": -6.265103816986084, "global_step": 83708, "epoch": 1993} {"train_loss": -6.344742298126221, "global_step": 83709, "epoch": 1993} {"train_loss": -6.245499610900879, "global_step": 83710, "epoch": 1993} {"train_loss": -6.256272315979004, "global_step": 83711, "epoch": 1993} {"train_loss": -6.188684463500977, "global_step": 83712, "epoch": 1993} {"train_loss": -6.19748592376709, "global_step": 83713, "epoch": 1993} {"train_loss": -6.255438804626465, "global_step": 83714, "epoch": 1993} {"train_loss": -6.124030113220215, "global_step": 83715, "epoch": 1993} {"train_loss": -6.191034317016602, "global_step": 83716, "epoch": 1993} {"train_loss": -6.194188117980957, "global_step": 83717, "epoch": 1993} {"train_loss": -6.0137939453125, "global_step": 83718, "epoch": 1993} {"train_loss": -6.160160541534424, "global_step": 83719, "epoch": 1993} {"train_loss": -6.0287933349609375, "global_step": 83720, "epoch": 1993} {"train_loss": -6.194632530212402, "global_step": 83721, "epoch": 1993} {"train_loss": -6.106955528259277, "global_step": 83722, "epoch": 1993} {"train_loss": -6.160676002502441, "global_step": 83723, "epoch": 1993} {"train_loss": -6.187808036804199, "global_step": 83724, "epoch": 1993} {"train_loss": -6.165066719055176, "global_step": 83725, "epoch": 1993} {"train_loss": -6.117506504058838, "global_step": 83726, "epoch": 1993} {"train_loss": -6.174775123596191, "global_step": 83727, "epoch": 1993} {"train_loss": -6.096463680267334, "global_step": 83728, "epoch": 1993} {"train_loss": -6.193909645080566, "global_step": 83729, "epoch": 1993} {"train_loss": -6.074619293212891, "global_step": 83730, "epoch": 1993} {"train_loss": -6.155776023864746, "global_step": 83731, "epoch": 1993} {"train_loss": -6.223244667053223, "global_step": 83732, "epoch": 1993} {"train_loss": -6.188063621520996, "global_step": 83733, "epoch": 1993} {"train_loss": -6.201927185058594, "global_step": 83734, "epoch": 1993} {"train_loss": -6.343501091003418, "global_step": 83735, "epoch": 1993} {"train_loss": -6.18389892578125, "global_step": 83736, "epoch": 1993} {"train_loss": -6.20168399810791, "global_step": 83737, "epoch": 1993} {"train_loss": -6.196388244628906, "global_step": 83738, "epoch": 1993} {"train_loss": -6.134715557098389, "global_step": 83739, "epoch": 1993} {"train_loss": -6.241209983825684, "global_step": 83740, "epoch": 1993} {"train_loss": -6.156549453735352, "global_step": 83741, "epoch": 1993} {"train_loss": -6.224160671234131, "global_step": 83742, "epoch": 1993} {"train_loss": -6.081263542175293, "global_step": 83743, "epoch": 1993} {"train_loss": -6.012721538543701, "global_step": 83744, "epoch": 1993} {"train_loss": -5.997747421264648, "global_step": 83745, "epoch": 1993} {"train_loss": -6.205751419067383, "global_step": 83746, "epoch": 1993} {"train_loss": -6.170794157754807, "global_step": 83747, "epoch": 1993, "val_loss": 68224.1640625} {"train_loss": -6.035466194152832, "global_step": 83748, "epoch": 1994} {"train_loss": -6.128855228424072, "global_step": 83749, "epoch": 1994} {"train_loss": -6.0673370361328125, "global_step": 83750, "epoch": 1994} {"train_loss": -6.010450839996338, "global_step": 83751, "epoch": 1994} {"train_loss": -6.163471221923828, "global_step": 83752, "epoch": 1994} {"train_loss": -6.028996467590332, "global_step": 83753, "epoch": 1994} {"train_loss": -6.1615495681762695, "global_step": 83754, "epoch": 1994} {"train_loss": -6.1778435707092285, "global_step": 83755, "epoch": 1994} {"train_loss": -6.191208362579346, "global_step": 83756, "epoch": 1994} {"train_loss": -6.073145866394043, "global_step": 83757, "epoch": 1994} {"train_loss": -6.115453243255615, "global_step": 83758, "epoch": 1994} {"train_loss": -6.214168548583984, "global_step": 83759, "epoch": 1994} {"train_loss": -6.1858415603637695, "global_step": 83760, "epoch": 1994} {"train_loss": -6.051841735839844, "global_step": 83761, "epoch": 1994} {"train_loss": -6.228997707366943, "global_step": 83762, "epoch": 1994} {"train_loss": -6.178846836090088, "global_step": 83763, "epoch": 1994} {"train_loss": -6.129387378692627, "global_step": 83764, "epoch": 1994} {"train_loss": -6.162984371185303, "global_step": 83765, "epoch": 1994} {"train_loss": -6.125034332275391, "global_step": 83766, "epoch": 1994} {"train_loss": -6.0707197189331055, "global_step": 83767, "epoch": 1994} {"train_loss": -6.108623027801514, "global_step": 83768, "epoch": 1994} {"train_loss": -6.066068649291992, "global_step": 83769, "epoch": 1994} {"train_loss": -6.028372287750244, "global_step": 83770, "epoch": 1994} {"train_loss": -6.070652008056641, "global_step": 83771, "epoch": 1994} {"train_loss": -6.11907958984375, "global_step": 83772, "epoch": 1994} {"train_loss": -6.07518196105957, "global_step": 83773, "epoch": 1994} {"train_loss": -6.060600280761719, "global_step": 83774, "epoch": 1994} {"train_loss": -6.263685703277588, "global_step": 83775, "epoch": 1994} {"train_loss": -6.022068023681641, "global_step": 83776, "epoch": 1994} {"train_loss": -6.105230331420898, "global_step": 83777, "epoch": 1994} {"train_loss": -6.167576789855957, "global_step": 83778, "epoch": 1994} {"train_loss": -6.193792343139648, "global_step": 83779, "epoch": 1994} {"train_loss": -6.139198303222656, "global_step": 83780, "epoch": 1994} {"train_loss": -6.113768577575684, "global_step": 83781, "epoch": 1994} {"train_loss": -6.218957901000977, "global_step": 83782, "epoch": 1994} {"train_loss": -6.136011600494385, "global_step": 83783, "epoch": 1994} {"train_loss": -6.1224470138549805, "global_step": 83784, "epoch": 1994} {"train_loss": -6.220698833465576, "global_step": 83785, "epoch": 1994} {"train_loss": -6.122725486755371, "global_step": 83786, "epoch": 1994} {"train_loss": -6.104828357696533, "global_step": 83787, "epoch": 1994} {"train_loss": -6.122483253479004, "global_step": 83788, "epoch": 1994} {"train_loss": -6.123479843139648, "global_step": 83789, "epoch": 1994, "val_loss": 67951.8203125} {"train_loss": -6.149805068969727, "global_step": 83790, "epoch": 1995} {"train_loss": -6.190820693969727, "global_step": 83791, "epoch": 1995} {"train_loss": -6.1555280685424805, "global_step": 83792, "epoch": 1995} {"train_loss": -6.104126930236816, "global_step": 83793, "epoch": 1995} {"train_loss": -6.163393020629883, "global_step": 83794, "epoch": 1995} {"train_loss": -6.265316009521484, "global_step": 83795, "epoch": 1995} {"train_loss": -6.13596773147583, "global_step": 83796, "epoch": 1995} {"train_loss": -6.250412464141846, "global_step": 83797, "epoch": 1995} {"train_loss": -6.21997594833374, "global_step": 83798, "epoch": 1995} {"train_loss": -6.119422912597656, "global_step": 83799, "epoch": 1995} {"train_loss": -6.202490329742432, "global_step": 83800, "epoch": 1995} {"train_loss": -6.216738700866699, "global_step": 83801, "epoch": 1995} {"train_loss": -6.151968955993652, "global_step": 83802, "epoch": 1995} {"train_loss": -6.123273849487305, "global_step": 83803, "epoch": 1995} {"train_loss": -6.086475372314453, "global_step": 83804, "epoch": 1995} {"train_loss": -6.194894790649414, "global_step": 83805, "epoch": 1995} {"train_loss": -6.148680210113525, "global_step": 83806, "epoch": 1995} {"train_loss": -6.170371055603027, "global_step": 83807, "epoch": 1995} {"train_loss": -6.0892791748046875, "global_step": 83808, "epoch": 1995} {"train_loss": -6.023447036743164, "global_step": 83809, "epoch": 1995} {"train_loss": -6.159741401672363, "global_step": 83810, "epoch": 1995} {"train_loss": -6.202045917510986, "global_step": 83811, "epoch": 1995} {"train_loss": -6.121076583862305, "global_step": 83812, "epoch": 1995} {"train_loss": -6.174951553344727, "global_step": 83813, "epoch": 1995} {"train_loss": -6.096487045288086, "global_step": 83814, "epoch": 1995} {"train_loss": -6.269561767578125, "global_step": 83815, "epoch": 1995} {"train_loss": -6.20378303527832, "global_step": 83816, "epoch": 1995} {"train_loss": -6.18043327331543, "global_step": 83817, "epoch": 1995} {"train_loss": -6.167313575744629, "global_step": 83818, "epoch": 1995} {"train_loss": -6.293720245361328, "global_step": 83819, "epoch": 1995} {"train_loss": -6.002134323120117, "global_step": 83820, "epoch": 1995} {"train_loss": -6.220865726470947, "global_step": 83821, "epoch": 1995} {"train_loss": -6.135879993438721, "global_step": 83822, "epoch": 1995} {"train_loss": -6.066178798675537, "global_step": 83823, "epoch": 1995} {"train_loss": -6.099592208862305, "global_step": 83824, "epoch": 1995} {"train_loss": -6.188056468963623, "global_step": 83825, "epoch": 1995} {"train_loss": -6.150984287261963, "global_step": 83826, "epoch": 1995} {"train_loss": -6.195686340332031, "global_step": 83827, "epoch": 1995} {"train_loss": -6.03936243057251, "global_step": 83828, "epoch": 1995} {"train_loss": -6.1293840408325195, "global_step": 83829, "epoch": 1995} {"train_loss": -6.231771469116211, "global_step": 83830, "epoch": 1995} {"train_loss": -6.155816804795038, "global_step": 83831, "epoch": 1995, "val_loss": 67776.6875} {"train_loss": -6.114801406860352, "global_step": 83832, "epoch": 1996} {"train_loss": -6.222300052642822, "global_step": 83833, "epoch": 1996} {"train_loss": -6.226503372192383, "global_step": 83834, "epoch": 1996} {"train_loss": -6.150093078613281, "global_step": 83835, "epoch": 1996} {"train_loss": -6.14202880859375, "global_step": 83836, "epoch": 1996} {"train_loss": -6.10636043548584, "global_step": 83837, "epoch": 1996} {"train_loss": -6.0176496505737305, "global_step": 83838, "epoch": 1996} {"train_loss": -6.248927593231201, "global_step": 83839, "epoch": 1996} {"train_loss": -6.138715744018555, "global_step": 83840, "epoch": 1996} {"train_loss": -6.263653755187988, "global_step": 83841, "epoch": 1996} {"train_loss": -6.159815311431885, "global_step": 83842, "epoch": 1996} {"train_loss": -6.220770835876465, "global_step": 83843, "epoch": 1996} {"train_loss": -6.191862106323242, "global_step": 83844, "epoch": 1996} {"train_loss": -6.232810020446777, "global_step": 83845, "epoch": 1996} {"train_loss": -6.310940742492676, "global_step": 83846, "epoch": 1996} {"train_loss": -6.215675354003906, "global_step": 83847, "epoch": 1996} {"train_loss": -6.28365421295166, "global_step": 83848, "epoch": 1996} {"train_loss": -6.245851993560791, "global_step": 83849, "epoch": 1996} {"train_loss": -6.137796401977539, "global_step": 83850, "epoch": 1996} {"train_loss": -6.249705791473389, "global_step": 83851, "epoch": 1996} {"train_loss": -6.08323860168457, "global_step": 83852, "epoch": 1996} {"train_loss": -6.2802734375, "global_step": 83853, "epoch": 1996} {"train_loss": -6.118062973022461, "global_step": 83854, "epoch": 1996} {"train_loss": -6.101619243621826, "global_step": 83855, "epoch": 1996} {"train_loss": -6.235654830932617, "global_step": 83856, "epoch": 1996} {"train_loss": -6.227294921875, "global_step": 83857, "epoch": 1996} {"train_loss": -6.139851093292236, "global_step": 83858, "epoch": 1996} {"train_loss": -6.10749626159668, "global_step": 83859, "epoch": 1996} {"train_loss": -6.17134952545166, "global_step": 83860, "epoch": 1996} {"train_loss": -6.170680046081543, "global_step": 83861, "epoch": 1996} {"train_loss": -6.016262531280518, "global_step": 83862, "epoch": 1996} {"train_loss": -6.195706367492676, "global_step": 83863, "epoch": 1996} {"train_loss": -6.265459060668945, "global_step": 83864, "epoch": 1996} {"train_loss": -6.1167097091674805, "global_step": 83865, "epoch": 1996} {"train_loss": -6.135842323303223, "global_step": 83866, "epoch": 1996} {"train_loss": -6.216785907745361, "global_step": 83867, "epoch": 1996} {"train_loss": -6.203673839569092, "global_step": 83868, "epoch": 1996} {"train_loss": -6.183647632598877, "global_step": 83869, "epoch": 1996} {"train_loss": -6.151391983032227, "global_step": 83870, "epoch": 1996} {"train_loss": -6.094956398010254, "global_step": 83871, "epoch": 1996} {"train_loss": -6.247398376464844, "global_step": 83872, "epoch": 1996} {"train_loss": -6.176328670410883, "global_step": 83873, "epoch": 1996, "val_loss": 67709.8203125} {"train_loss": -6.165994167327881, "global_step": 83874, "epoch": 1997} {"train_loss": -6.269969940185547, "global_step": 83875, "epoch": 1997} {"train_loss": -6.144466400146484, "global_step": 83876, "epoch": 1997} {"train_loss": -6.120331764221191, "global_step": 83877, "epoch": 1997} {"train_loss": -6.092809677124023, "global_step": 83878, "epoch": 1997} {"train_loss": -6.19644832611084, "global_step": 83879, "epoch": 1997} {"train_loss": -6.108757019042969, "global_step": 83880, "epoch": 1997} {"train_loss": -6.201442718505859, "global_step": 83881, "epoch": 1997} {"train_loss": -6.154160499572754, "global_step": 83882, "epoch": 1997} {"train_loss": -6.085177898406982, "global_step": 83883, "epoch": 1997} {"train_loss": -6.065729141235352, "global_step": 83884, "epoch": 1997} {"train_loss": -6.135561943054199, "global_step": 83885, "epoch": 1997} {"train_loss": -6.210149765014648, "global_step": 83886, "epoch": 1997} {"train_loss": -6.250718116760254, "global_step": 83887, "epoch": 1997} {"train_loss": -6.153929710388184, "global_step": 83888, "epoch": 1997} {"train_loss": -6.161448001861572, "global_step": 83889, "epoch": 1997} {"train_loss": -6.233551025390625, "global_step": 83890, "epoch": 1997} {"train_loss": -6.114799976348877, "global_step": 83891, "epoch": 1997} {"train_loss": -6.198436737060547, "global_step": 83892, "epoch": 1997} {"train_loss": -6.120621681213379, "global_step": 83893, "epoch": 1997} {"train_loss": -6.092705726623535, "global_step": 83894, "epoch": 1997} {"train_loss": -6.198124885559082, "global_step": 83895, "epoch": 1997} {"train_loss": -6.109440803527832, "global_step": 83896, "epoch": 1997} {"train_loss": -6.168987274169922, "global_step": 83897, "epoch": 1997} {"train_loss": -6.189459800720215, "global_step": 83898, "epoch": 1997} {"train_loss": -6.188292026519775, "global_step": 83899, "epoch": 1997} {"train_loss": -6.221155166625977, "global_step": 83900, "epoch": 1997} {"train_loss": -5.990734100341797, "global_step": 83901, "epoch": 1997} {"train_loss": -6.158385276794434, "global_step": 83902, "epoch": 1997} {"train_loss": -6.161933422088623, "global_step": 83903, "epoch": 1997} {"train_loss": -6.110857963562012, "global_step": 83904, "epoch": 1997} {"train_loss": -6.253660678863525, "global_step": 83905, "epoch": 1997} {"train_loss": -6.160261154174805, "global_step": 83906, "epoch": 1997} {"train_loss": -6.165113925933838, "global_step": 83907, "epoch": 1997} {"train_loss": -6.091977119445801, "global_step": 83908, "epoch": 1997} {"train_loss": -6.132533550262451, "global_step": 83909, "epoch": 1997} {"train_loss": -6.08164119720459, "global_step": 83910, "epoch": 1997} {"train_loss": -6.119153022766113, "global_step": 83911, "epoch": 1997} {"train_loss": -6.14259147644043, "global_step": 83912, "epoch": 1997} {"train_loss": -6.290863990783691, "global_step": 83913, "epoch": 1997} {"train_loss": -6.116178512573242, "global_step": 83914, "epoch": 1997} {"train_loss": -6.154314983458746, "global_step": 83915, "epoch": 1997, "val_loss": 68124.3125} {"train_loss": -6.192778587341309, "global_step": 83916, "epoch": 1998} {"train_loss": -6.138221740722656, "global_step": 83917, "epoch": 1998} {"train_loss": -6.196732521057129, "global_step": 83918, "epoch": 1998} {"train_loss": -6.128573417663574, "global_step": 83919, "epoch": 1998} {"train_loss": -6.285013198852539, "global_step": 83920, "epoch": 1998} {"train_loss": -6.354900360107422, "global_step": 83921, "epoch": 1998} {"train_loss": -6.201075553894043, "global_step": 83922, "epoch": 1998} {"train_loss": -6.160099983215332, "global_step": 83923, "epoch": 1998} {"train_loss": -6.122385025024414, "global_step": 83924, "epoch": 1998} {"train_loss": -6.254132270812988, "global_step": 83925, "epoch": 1998} {"train_loss": -6.130927085876465, "global_step": 83926, "epoch": 1998} {"train_loss": -6.122712135314941, "global_step": 83927, "epoch": 1998} {"train_loss": -6.0714616775512695, "global_step": 83928, "epoch": 1998} {"train_loss": -6.054998397827148, "global_step": 83929, "epoch": 1998} {"train_loss": -6.191070556640625, "global_step": 83930, "epoch": 1998} {"train_loss": -6.093024253845215, "global_step": 83931, "epoch": 1998} {"train_loss": -6.131850719451904, "global_step": 83932, "epoch": 1998} {"train_loss": -6.232857704162598, "global_step": 83933, "epoch": 1998} {"train_loss": -6.220279216766357, "global_step": 83934, "epoch": 1998} {"train_loss": -6.120197296142578, "global_step": 83935, "epoch": 1998} {"train_loss": -6.137753963470459, "global_step": 83936, "epoch": 1998} {"train_loss": -6.116854667663574, "global_step": 83937, "epoch": 1998} {"train_loss": -6.290816307067871, "global_step": 83938, "epoch": 1998} {"train_loss": -6.115564823150635, "global_step": 83939, "epoch": 1998} {"train_loss": -6.20921516418457, "global_step": 83940, "epoch": 1998} {"train_loss": -6.254373550415039, "global_step": 83941, "epoch": 1998} {"train_loss": -6.285111427307129, "global_step": 83942, "epoch": 1998} {"train_loss": -6.288253307342529, "global_step": 83943, "epoch": 1998} {"train_loss": -6.284518241882324, "global_step": 83944, "epoch": 1998} {"train_loss": -6.055944919586182, "global_step": 83945, "epoch": 1998} {"train_loss": -6.175107955932617, "global_step": 83946, "epoch": 1998} {"train_loss": -6.208616256713867, "global_step": 83947, "epoch": 1998} {"train_loss": -6.101485252380371, "global_step": 83948, "epoch": 1998} {"train_loss": -6.25538969039917, "global_step": 83949, "epoch": 1998} {"train_loss": -6.036612510681152, "global_step": 83950, "epoch": 1998} {"train_loss": -6.146888256072998, "global_step": 83951, "epoch": 1998} {"train_loss": -6.262915134429932, "global_step": 83952, "epoch": 1998} {"train_loss": -6.017184257507324, "global_step": 83953, "epoch": 1998} {"train_loss": -6.235502243041992, "global_step": 83954, "epoch": 1998} {"train_loss": -6.034075736999512, "global_step": 83955, "epoch": 1998} {"train_loss": -6.169577121734619, "global_step": 83956, "epoch": 1998} {"train_loss": -6.172914084934053, "global_step": 83957, "epoch": 1998, "val_loss": 68090.8359375} {"train_loss": -6.053362846374512, "global_step": 83958, "epoch": 1999} {"train_loss": -6.242114067077637, "global_step": 83959, "epoch": 1999} {"train_loss": -6.262461185455322, "global_step": 83960, "epoch": 1999} {"train_loss": -6.118366241455078, "global_step": 83961, "epoch": 1999} {"train_loss": -6.147475242614746, "global_step": 83962, "epoch": 1999} {"train_loss": -6.168453216552734, "global_step": 83963, "epoch": 1999} {"train_loss": -6.143135070800781, "global_step": 83964, "epoch": 1999} {"train_loss": -6.200765609741211, "global_step": 83965, "epoch": 1999} {"train_loss": -6.181741714477539, "global_step": 83966, "epoch": 1999} {"train_loss": -6.244623184204102, "global_step": 83967, "epoch": 1999} {"train_loss": -6.239139556884766, "global_step": 83968, "epoch": 1999} {"train_loss": -6.228114128112793, "global_step": 83969, "epoch": 1999} {"train_loss": -6.243568420410156, "global_step": 83970, "epoch": 1999} {"train_loss": -6.141608715057373, "global_step": 83971, "epoch": 1999} {"train_loss": -6.1436967849731445, "global_step": 83972, "epoch": 1999} {"train_loss": -6.192083835601807, "global_step": 83973, "epoch": 1999} {"train_loss": -6.055347919464111, "global_step": 83974, "epoch": 1999} {"train_loss": -6.084847927093506, "global_step": 83975, "epoch": 1999} {"train_loss": -6.067028999328613, "global_step": 83976, "epoch": 1999} {"train_loss": -6.173444747924805, "global_step": 83977, "epoch": 1999} {"train_loss": -6.100311279296875, "global_step": 83978, "epoch": 1999} {"train_loss": -6.247532844543457, "global_step": 83979, "epoch": 1999} {"train_loss": -6.169088363647461, "global_step": 83980, "epoch": 1999} {"train_loss": -6.1946940422058105, "global_step": 83981, "epoch": 1999} {"train_loss": -6.201784133911133, "global_step": 83982, "epoch": 1999} {"train_loss": -6.122166156768799, "global_step": 83983, "epoch": 1999} {"train_loss": -6.167032241821289, "global_step": 83984, "epoch": 1999} {"train_loss": -6.228305816650391, "global_step": 83985, "epoch": 1999} {"train_loss": -6.088593482971191, "global_step": 83986, "epoch": 1999} {"train_loss": -6.143461227416992, "global_step": 83987, "epoch": 1999} {"train_loss": -6.246047019958496, "global_step": 83988, "epoch": 1999} {"train_loss": -6.11666202545166, "global_step": 83989, "epoch": 1999} {"train_loss": -6.198122024536133, "global_step": 83990, "epoch": 1999} {"train_loss": -6.184699535369873, "global_step": 83991, "epoch": 1999} {"train_loss": -6.19315242767334, "global_step": 83992, "epoch": 1999} {"train_loss": -6.266415596008301, "global_step": 83993, "epoch": 1999} {"train_loss": -6.2895283699035645, "global_step": 83994, "epoch": 1999} {"train_loss": -6.290374279022217, "global_step": 83995, "epoch": 1999} {"train_loss": -6.198758125305176, "global_step": 83996, "epoch": 1999} {"train_loss": -6.142294883728027, "global_step": 83997, "epoch": 1999} {"train_loss": -6.164493560791016, "global_step": 83998, "epoch": 1999} {"train_loss": -6.175134590693882, "global_step": 83999, "epoch": 1999, "val_loss": 67799.0546875} {"train_loss": -6.2390031814575195, "global_step": 84000, "epoch": 2000} {"train_loss": -6.186051368713379, "global_step": 84001, "epoch": 2000} {"train_loss": -6.11454963684082, "global_step": 84002, "epoch": 2000} {"train_loss": -6.023096561431885, "global_step": 84003, "epoch": 2000} {"train_loss": -6.183271408081055, "global_step": 84004, "epoch": 2000} {"train_loss": -6.063999176025391, "global_step": 84005, "epoch": 2000} {"train_loss": -6.027669429779053, "global_step": 84006, "epoch": 2000} {"train_loss": -6.127406597137451, "global_step": 84007, "epoch": 2000} {"train_loss": -6.033716201782227, "global_step": 84008, "epoch": 2000} {"train_loss": -6.042482376098633, "global_step": 84009, "epoch": 2000} {"train_loss": -6.138916015625, "global_step": 84010, "epoch": 2000} {"train_loss": -6.007547378540039, "global_step": 84011, "epoch": 2000} {"train_loss": -6.104516506195068, "global_step": 84012, "epoch": 2000} {"train_loss": -6.065262794494629, "global_step": 84013, "epoch": 2000} {"train_loss": -6.1933674812316895, "global_step": 84014, "epoch": 2000} {"train_loss": -6.1412835121154785, "global_step": 84015, "epoch": 2000} {"train_loss": -6.024089813232422, "global_step": 84016, "epoch": 2000} {"train_loss": -6.180631637573242, "global_step": 84017, "epoch": 2000} {"train_loss": -6.0512285232543945, "global_step": 84018, "epoch": 2000} {"train_loss": -6.121047019958496, "global_step": 84019, "epoch": 2000} {"train_loss": -6.204062461853027, "global_step": 84020, "epoch": 2000} {"train_loss": -6.205746173858643, "global_step": 84021, "epoch": 2000} {"train_loss": -6.259390830993652, "global_step": 84022, "epoch": 2000} {"train_loss": -6.170623302459717, "global_step": 84023, "epoch": 2000} {"train_loss": -6.2267537117004395, "global_step": 84024, "epoch": 2000} {"train_loss": -6.101078987121582, "global_step": 84025, "epoch": 2000} {"train_loss": -6.111478328704834, "global_step": 84026, "epoch": 2000} {"train_loss": -6.225869178771973, "global_step": 84027, "epoch": 2000} {"train_loss": -6.286616325378418, "global_step": 84028, "epoch": 2000} {"train_loss": -6.135308265686035, "global_step": 84029, "epoch": 2000} {"train_loss": -6.188636302947998, "global_step": 84030, "epoch": 2000} {"train_loss": -6.211605072021484, "global_step": 84031, "epoch": 2000} {"train_loss": -6.20879602432251, "global_step": 84032, "epoch": 2000} {"train_loss": -6.176233291625977, "global_step": 84033, "epoch": 2000} {"train_loss": -6.216360569000244, "global_step": 84034, "epoch": 2000} {"train_loss": -6.200454235076904, "global_step": 84035, "epoch": 2000} {"train_loss": -6.130061149597168, "global_step": 84036, "epoch": 2000} {"train_loss": -6.2300333976745605, "global_step": 84037, "epoch": 2000} {"train_loss": -6.245061874389648, "global_step": 84038, "epoch": 2000} {"train_loss": -6.182680130004883, "global_step": 84039, "epoch": 2000} {"train_loss": -6.077853202819824, "global_step": 84040, "epoch": 2000} {"train_loss": -6.148233708881197, "global_step": 84041, "epoch": 2000, "train/sim_max_reward_0": 0.22505676432377458, "train/sim_max_reward_1": 0.7978804624622274, "train/sim_max_reward_2": 0.8956521080573575, "train/sim_max_reward_3": 0.13645920163352177, "train/sim_max_reward_4": 0.3096799133383422, "train/sim_max_reward_5": 0.7960660224004263, "test/sim_max_reward_4400000": 0.9054863115329292, "test/sim_max_reward_4400001": 0.17062148744047984, "test/sim_max_reward_4400002": 0.8897848915226955, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.6805463571269119, "test/sim_max_reward_4400007": 0.9162908655563641, "test/sim_max_reward_4400008": 0.3008113663129102, "test/sim_max_reward_4400009": 0.757098306120304, "test/sim_max_reward_4400010": 0.2874182753448173, "test/sim_max_reward_4400011": 0.21553450983269645, "test/sim_max_reward_4400012": 0.8786776881410422, "test/sim_max_reward_4400013": 0.9882098447513146, "test/sim_max_reward_4400014": 0.21112895758885203, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0935380059557606, "test/sim_max_reward_4400017": 0.7263778946849321, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.11889862864605281, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.624203107230682, "test/sim_max_reward_4400022": 0.9851874182627626, "test/sim_max_reward_4400023": 0.5010803870956632, "test/sim_max_reward_4400024": 0.34934758610372363, "test/sim_max_reward_4400025": 0.23621896554808947, "test/sim_max_reward_4400026": 0.23745535790602829, "test/sim_max_reward_4400027": 0.10980682346972523, "test/sim_max_reward_4400028": 0.44717855426219677, "test/sim_max_reward_4400029": 0.2780515423881038, "test/sim_max_reward_4400030": 0.8134450412629498, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.21293251783688008, "test/sim_max_reward_4400034": 0.9695450548484362, "test/sim_max_reward_4400035": 0.45477248931193937, "test/sim_max_reward_4400036": 0.8210411918185944, "test/sim_max_reward_4400037": 0.994896408591973, "test/sim_max_reward_4400038": 0.8178573293231286, "test/sim_max_reward_4400039": 0.5387083553631551, "test/sim_max_reward_4400040": 0.8834762978759803, "test/sim_max_reward_4400041": 0.8119239999933232, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.9498628575643925, "test/sim_max_reward_4400044": 0.46398120569763057, "test/sim_max_reward_4400045": 0.6666939160664058, "test/sim_max_reward_4400046": 0.8492728954267705, "test/sim_max_reward_4400047": 0.6177111019486483, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.5627630765878935, "train/mean_score": 0.5267990787026083, "test/mean_score": 0.49401816582557134, "val_loss": 67901.8359375} {"train_loss": -6.037825107574463, "global_step": 84042, "epoch": 2001} {"train_loss": -6.117347717285156, "global_step": 84043, "epoch": 2001} {"train_loss": -6.058811187744141, "global_step": 84044, "epoch": 2001} {"train_loss": -6.068647384643555, "global_step": 84045, "epoch": 2001} {"train_loss": -6.2081427574157715, "global_step": 84046, "epoch": 2001} {"train_loss": -6.184812068939209, "global_step": 84047, "epoch": 2001} {"train_loss": -6.185642242431641, "global_step": 84048, "epoch": 2001} {"train_loss": -6.231664657592773, "global_step": 84049, "epoch": 2001} {"train_loss": -6.159382343292236, "global_step": 84050, "epoch": 2001} {"train_loss": -6.02332878112793, "global_step": 84051, "epoch": 2001} {"train_loss": -6.008148193359375, "global_step": 84052, "epoch": 2001} {"train_loss": -6.2281494140625, "global_step": 84053, "epoch": 2001} {"train_loss": -6.225137710571289, "global_step": 84054, "epoch": 2001} {"train_loss": -6.165806770324707, "global_step": 84055, "epoch": 2001} {"train_loss": -6.200496196746826, "global_step": 84056, "epoch": 2001} {"train_loss": -6.165184497833252, "global_step": 84057, "epoch": 2001} {"train_loss": -6.096978187561035, "global_step": 84058, "epoch": 2001} {"train_loss": -6.173023223876953, "global_step": 84059, "epoch": 2001} {"train_loss": -6.172863006591797, "global_step": 84060, "epoch": 2001} {"train_loss": -6.169382095336914, "global_step": 84061, "epoch": 2001} {"train_loss": -6.124346733093262, "global_step": 84062, "epoch": 2001} {"train_loss": -6.197626113891602, "global_step": 84063, "epoch": 2001} {"train_loss": -6.1708784103393555, "global_step": 84064, "epoch": 2001} {"train_loss": -6.204587936401367, "global_step": 84065, "epoch": 2001} {"train_loss": -6.338526248931885, "global_step": 84066, "epoch": 2001} {"train_loss": -6.1879191398620605, "global_step": 84067, "epoch": 2001} {"train_loss": -6.226617813110352, "global_step": 84068, "epoch": 2001} {"train_loss": -6.10203742980957, "global_step": 84069, "epoch": 2001} {"train_loss": -6.119485855102539, "global_step": 84070, "epoch": 2001} {"train_loss": -6.1054840087890625, "global_step": 84071, "epoch": 2001} {"train_loss": -6.212862968444824, "global_step": 84072, "epoch": 2001} {"train_loss": -6.177163124084473, "global_step": 84073, "epoch": 2001} {"train_loss": -6.185348033905029, "global_step": 84074, "epoch": 2001} {"train_loss": -6.137373447418213, "global_step": 84075, "epoch": 2001} {"train_loss": -6.154580116271973, "global_step": 84076, "epoch": 2001} {"train_loss": -6.233023643493652, "global_step": 84077, "epoch": 2001} {"train_loss": -6.357585906982422, "global_step": 84078, "epoch": 2001} {"train_loss": -6.220798015594482, "global_step": 84079, "epoch": 2001} {"train_loss": -6.203548431396484, "global_step": 84080, "epoch": 2001} {"train_loss": -6.182559967041016, "global_step": 84081, "epoch": 2001} {"train_loss": -6.215882301330566, "global_step": 84082, "epoch": 2001} {"train_loss": -6.172074295225597, "global_step": 84083, "epoch": 2001, "val_loss": 67936.7578125} {"train_loss": -6.279048919677734, "global_step": 84084, "epoch": 2002} {"train_loss": -6.216532230377197, "global_step": 84085, "epoch": 2002} {"train_loss": -6.242412567138672, "global_step": 84086, "epoch": 2002} {"train_loss": -6.238229274749756, "global_step": 84087, "epoch": 2002} {"train_loss": -6.195524215698242, "global_step": 84088, "epoch": 2002} {"train_loss": -6.191718101501465, "global_step": 84089, "epoch": 2002} {"train_loss": -6.216836929321289, "global_step": 84090, "epoch": 2002} {"train_loss": -6.176002025604248, "global_step": 84091, "epoch": 2002} {"train_loss": -6.2489142417907715, "global_step": 84092, "epoch": 2002} {"train_loss": -6.203305244445801, "global_step": 84093, "epoch": 2002} {"train_loss": -6.113490104675293, "global_step": 84094, "epoch": 2002} {"train_loss": -6.166213035583496, "global_step": 84095, "epoch": 2002} {"train_loss": -6.166354656219482, "global_step": 84096, "epoch": 2002} {"train_loss": -6.143266677856445, "global_step": 84097, "epoch": 2002} {"train_loss": -6.143951892852783, "global_step": 84098, "epoch": 2002} {"train_loss": -6.192256927490234, "global_step": 84099, "epoch": 2002} {"train_loss": -6.137516975402832, "global_step": 84100, "epoch": 2002} {"train_loss": -6.206125259399414, "global_step": 84101, "epoch": 2002} {"train_loss": -6.125066757202148, "global_step": 84102, "epoch": 2002} {"train_loss": -6.067540645599365, "global_step": 84103, "epoch": 2002} {"train_loss": -6.219409942626953, "global_step": 84104, "epoch": 2002} {"train_loss": -6.016059875488281, "global_step": 84105, "epoch": 2002} {"train_loss": -6.158710956573486, "global_step": 84106, "epoch": 2002} {"train_loss": -6.215333461761475, "global_step": 84107, "epoch": 2002} {"train_loss": -6.1240081787109375, "global_step": 84108, "epoch": 2002} {"train_loss": -6.1764302253723145, "global_step": 84109, "epoch": 2002} {"train_loss": -6.227668762207031, "global_step": 84110, "epoch": 2002} {"train_loss": -6.135313510894775, "global_step": 84111, "epoch": 2002} {"train_loss": -6.234989166259766, "global_step": 84112, "epoch": 2002} {"train_loss": -6.263575553894043, "global_step": 84113, "epoch": 2002} {"train_loss": -6.117049217224121, "global_step": 84114, "epoch": 2002} {"train_loss": -6.260162353515625, "global_step": 84115, "epoch": 2002} {"train_loss": -6.109589099884033, "global_step": 84116, "epoch": 2002} {"train_loss": -6.184256553649902, "global_step": 84117, "epoch": 2002} {"train_loss": -6.118062973022461, "global_step": 84118, "epoch": 2002} {"train_loss": -6.081295967102051, "global_step": 84119, "epoch": 2002} {"train_loss": -6.0963897705078125, "global_step": 84120, "epoch": 2002} {"train_loss": -6.11460018157959, "global_step": 84121, "epoch": 2002} {"train_loss": -6.145555019378662, "global_step": 84122, "epoch": 2002} {"train_loss": -6.268738746643066, "global_step": 84123, "epoch": 2002} {"train_loss": -6.21401309967041, "global_step": 84124, "epoch": 2002} {"train_loss": -6.176510935737973, "global_step": 84125, "epoch": 2002, "val_loss": 67714.28125} {"train_loss": -6.164241313934326, "global_step": 84126, "epoch": 2003} {"train_loss": -6.240114212036133, "global_step": 84127, "epoch": 2003} {"train_loss": -6.211671829223633, "global_step": 84128, "epoch": 2003} {"train_loss": -6.197087287902832, "global_step": 84129, "epoch": 2003} {"train_loss": -6.274661064147949, "global_step": 84130, "epoch": 2003} {"train_loss": -6.328528881072998, "global_step": 84131, "epoch": 2003} {"train_loss": -6.241137504577637, "global_step": 84132, "epoch": 2003} {"train_loss": -6.208454132080078, "global_step": 84133, "epoch": 2003} {"train_loss": -6.283935546875, "global_step": 84134, "epoch": 2003} {"train_loss": -6.136471748352051, "global_step": 84135, "epoch": 2003} {"train_loss": -6.307363510131836, "global_step": 84136, "epoch": 2003} {"train_loss": -6.124485015869141, "global_step": 84137, "epoch": 2003} {"train_loss": -6.1980156898498535, "global_step": 84138, "epoch": 2003} {"train_loss": -6.140275001525879, "global_step": 84139, "epoch": 2003} {"train_loss": -5.9811248779296875, "global_step": 84140, "epoch": 2003} {"train_loss": -6.165008544921875, "global_step": 84141, "epoch": 2003} {"train_loss": -6.1945672035217285, "global_step": 84142, "epoch": 2003} {"train_loss": -6.045073986053467, "global_step": 84143, "epoch": 2003} {"train_loss": -6.090484619140625, "global_step": 84144, "epoch": 2003} {"train_loss": -6.295055389404297, "global_step": 84145, "epoch": 2003} {"train_loss": -6.186304092407227, "global_step": 84146, "epoch": 2003} {"train_loss": -6.195438385009766, "global_step": 84147, "epoch": 2003} {"train_loss": -6.142861366271973, "global_step": 84148, "epoch": 2003} {"train_loss": -6.166048049926758, "global_step": 84149, "epoch": 2003} {"train_loss": -6.1013712882995605, "global_step": 84150, "epoch": 2003} {"train_loss": -6.093907356262207, "global_step": 84151, "epoch": 2003} {"train_loss": -6.166895389556885, "global_step": 84152, "epoch": 2003} {"train_loss": -6.1213884353637695, "global_step": 84153, "epoch": 2003} {"train_loss": -6.121517181396484, "global_step": 84154, "epoch": 2003} {"train_loss": -6.04097843170166, "global_step": 84155, "epoch": 2003} {"train_loss": -6.171428680419922, "global_step": 84156, "epoch": 2003} {"train_loss": -6.256682395935059, "global_step": 84157, "epoch": 2003} {"train_loss": -6.103769302368164, "global_step": 84158, "epoch": 2003} {"train_loss": -6.128727912902832, "global_step": 84159, "epoch": 2003} {"train_loss": -6.153846740722656, "global_step": 84160, "epoch": 2003} {"train_loss": -6.179250717163086, "global_step": 84161, "epoch": 2003} {"train_loss": -6.161057472229004, "global_step": 84162, "epoch": 2003} {"train_loss": -6.162220478057861, "global_step": 84163, "epoch": 2003} {"train_loss": -6.202676773071289, "global_step": 84164, "epoch": 2003} {"train_loss": -6.182455062866211, "global_step": 84165, "epoch": 2003} {"train_loss": -6.0781426429748535, "global_step": 84166, "epoch": 2003} {"train_loss": -6.169940040225074, "global_step": 84167, "epoch": 2003, "val_loss": 68081.8046875} {"train_loss": -6.185294151306152, "global_step": 84168, "epoch": 2004} {"train_loss": -6.051168441772461, "global_step": 84169, "epoch": 2004} {"train_loss": -6.203932762145996, "global_step": 84170, "epoch": 2004} {"train_loss": -6.0254411697387695, "global_step": 84171, "epoch": 2004} {"train_loss": -6.290966987609863, "global_step": 84172, "epoch": 2004} {"train_loss": -6.165797233581543, "global_step": 84173, "epoch": 2004} {"train_loss": -6.216676712036133, "global_step": 84174, "epoch": 2004} {"train_loss": -6.22540807723999, "global_step": 84175, "epoch": 2004} {"train_loss": -6.174604415893555, "global_step": 84176, "epoch": 2004} {"train_loss": -6.139588832855225, "global_step": 84177, "epoch": 2004} {"train_loss": -6.214037895202637, "global_step": 84178, "epoch": 2004} {"train_loss": -6.101336479187012, "global_step": 84179, "epoch": 2004} {"train_loss": -6.187437057495117, "global_step": 84180, "epoch": 2004} {"train_loss": -6.084066390991211, "global_step": 84181, "epoch": 2004} {"train_loss": -6.2491254806518555, "global_step": 84182, "epoch": 2004} {"train_loss": -6.153960704803467, "global_step": 84183, "epoch": 2004} {"train_loss": -6.215585708618164, "global_step": 84184, "epoch": 2004} {"train_loss": -6.101293563842773, "global_step": 84185, "epoch": 2004} {"train_loss": -6.081676483154297, "global_step": 84186, "epoch": 2004} {"train_loss": -6.1427412033081055, "global_step": 84187, "epoch": 2004} {"train_loss": -6.182116985321045, "global_step": 84188, "epoch": 2004} {"train_loss": -6.044137001037598, "global_step": 84189, "epoch": 2004} {"train_loss": -6.032878875732422, "global_step": 84190, "epoch": 2004} {"train_loss": -6.1499762535095215, "global_step": 84191, "epoch": 2004} {"train_loss": -6.125452518463135, "global_step": 84192, "epoch": 2004} {"train_loss": -6.107149124145508, "global_step": 84193, "epoch": 2004} {"train_loss": -6.196432590484619, "global_step": 84194, "epoch": 2004} {"train_loss": -6.065411567687988, "global_step": 84195, "epoch": 2004} {"train_loss": -6.077980995178223, "global_step": 84196, "epoch": 2004} {"train_loss": -6.127144813537598, "global_step": 84197, "epoch": 2004} {"train_loss": -5.947772026062012, "global_step": 84198, "epoch": 2004} {"train_loss": -6.068031311035156, "global_step": 84199, "epoch": 2004} {"train_loss": -6.080551624298096, "global_step": 84200, "epoch": 2004} {"train_loss": -5.986856460571289, "global_step": 84201, "epoch": 2004} {"train_loss": -6.0611653327941895, "global_step": 84202, "epoch": 2004} {"train_loss": -6.132106781005859, "global_step": 84203, "epoch": 2004} {"train_loss": -6.08234167098999, "global_step": 84204, "epoch": 2004} {"train_loss": -6.244483947753906, "global_step": 84205, "epoch": 2004} {"train_loss": -6.058712959289551, "global_step": 84206, "epoch": 2004} {"train_loss": -6.129527568817139, "global_step": 84207, "epoch": 2004} {"train_loss": -6.148959159851074, "global_step": 84208, "epoch": 2004} {"train_loss": -6.123689288184757, "global_step": 84209, "epoch": 2004, "val_loss": 67798.2578125} {"train_loss": -6.2024335861206055, "global_step": 84210, "epoch": 2005} {"train_loss": -6.148836135864258, "global_step": 84211, "epoch": 2005} {"train_loss": -6.182089805603027, "global_step": 84212, "epoch": 2005} {"train_loss": -6.090075492858887, "global_step": 84213, "epoch": 2005} {"train_loss": -6.078342437744141, "global_step": 84214, "epoch": 2005} {"train_loss": -5.938179969787598, "global_step": 84215, "epoch": 2005} {"train_loss": -6.125299453735352, "global_step": 84216, "epoch": 2005} {"train_loss": -6.150467872619629, "global_step": 84217, "epoch": 2005} {"train_loss": -6.166592121124268, "global_step": 84218, "epoch": 2005} {"train_loss": -6.2187066078186035, "global_step": 84219, "epoch": 2005} {"train_loss": -6.041996479034424, "global_step": 84220, "epoch": 2005} {"train_loss": -6.179404258728027, "global_step": 84221, "epoch": 2005} {"train_loss": -6.119896411895752, "global_step": 84222, "epoch": 2005} {"train_loss": -6.213088512420654, "global_step": 84223, "epoch": 2005} {"train_loss": -6.237013816833496, "global_step": 84224, "epoch": 2005} {"train_loss": -6.132926940917969, "global_step": 84225, "epoch": 2005} {"train_loss": -6.191873550415039, "global_step": 84226, "epoch": 2005} {"train_loss": -6.178982734680176, "global_step": 84227, "epoch": 2005} {"train_loss": -6.0712690353393555, "global_step": 84228, "epoch": 2005} {"train_loss": -6.221071720123291, "global_step": 84229, "epoch": 2005} {"train_loss": -6.099325180053711, "global_step": 84230, "epoch": 2005} {"train_loss": -6.153924465179443, "global_step": 84231, "epoch": 2005} {"train_loss": -6.236608982086182, "global_step": 84232, "epoch": 2005} {"train_loss": -6.032824516296387, "global_step": 84233, "epoch": 2005} {"train_loss": -6.189625263214111, "global_step": 84234, "epoch": 2005} {"train_loss": -6.132635116577148, "global_step": 84235, "epoch": 2005} {"train_loss": -6.221722602844238, "global_step": 84236, "epoch": 2005} {"train_loss": -6.177042484283447, "global_step": 84237, "epoch": 2005} {"train_loss": -6.1571760177612305, "global_step": 84238, "epoch": 2005} {"train_loss": -6.176946640014648, "global_step": 84239, "epoch": 2005} {"train_loss": -6.306722640991211, "global_step": 84240, "epoch": 2005} {"train_loss": -6.198863983154297, "global_step": 84241, "epoch": 2005} {"train_loss": -6.130613327026367, "global_step": 84242, "epoch": 2005} {"train_loss": -6.0874223709106445, "global_step": 84243, "epoch": 2005} {"train_loss": -6.2817301750183105, "global_step": 84244, "epoch": 2005} {"train_loss": -6.136634826660156, "global_step": 84245, "epoch": 2005} {"train_loss": -6.205676078796387, "global_step": 84246, "epoch": 2005} {"train_loss": -6.121227741241455, "global_step": 84247, "epoch": 2005} {"train_loss": -6.1637420654296875, "global_step": 84248, "epoch": 2005} {"train_loss": -6.240734100341797, "global_step": 84249, "epoch": 2005} {"train_loss": -6.142023086547852, "global_step": 84250, "epoch": 2005} {"train_loss": -6.157680988311768, "global_step": 84251, "epoch": 2005, "val_loss": 67798.0546875} {"train_loss": -6.3033223152160645, "global_step": 84252, "epoch": 2006} {"train_loss": -6.129611968994141, "global_step": 84253, "epoch": 2006} {"train_loss": -6.205376625061035, "global_step": 84254, "epoch": 2006} {"train_loss": -6.195351600646973, "global_step": 84255, "epoch": 2006} {"train_loss": -6.207104682922363, "global_step": 84256, "epoch": 2006} {"train_loss": -6.263666152954102, "global_step": 84257, "epoch": 2006} {"train_loss": -6.116446495056152, "global_step": 84258, "epoch": 2006} {"train_loss": -6.2563157081604, "global_step": 84259, "epoch": 2006} {"train_loss": -6.217046737670898, "global_step": 84260, "epoch": 2006} {"train_loss": -6.17906379699707, "global_step": 84261, "epoch": 2006} {"train_loss": -6.1125030517578125, "global_step": 84262, "epoch": 2006} {"train_loss": -6.133686065673828, "global_step": 84263, "epoch": 2006} {"train_loss": -6.221733093261719, "global_step": 84264, "epoch": 2006} {"train_loss": -6.13301944732666, "global_step": 84265, "epoch": 2006} {"train_loss": -6.172456741333008, "global_step": 84266, "epoch": 2006} {"train_loss": -6.155715465545654, "global_step": 84267, "epoch": 2006} {"train_loss": -6.21359920501709, "global_step": 84268, "epoch": 2006} {"train_loss": -6.1873273849487305, "global_step": 84269, "epoch": 2006} {"train_loss": -6.144822120666504, "global_step": 84270, "epoch": 2006} {"train_loss": -6.138978481292725, "global_step": 84271, "epoch": 2006} {"train_loss": -6.219665050506592, "global_step": 84272, "epoch": 2006} {"train_loss": -6.225067138671875, "global_step": 84273, "epoch": 2006} {"train_loss": -6.096471786499023, "global_step": 84274, "epoch": 2006} {"train_loss": -6.09886360168457, "global_step": 84275, "epoch": 2006} {"train_loss": -6.262656211853027, "global_step": 84276, "epoch": 2006} {"train_loss": -6.241799354553223, "global_step": 84277, "epoch": 2006} {"train_loss": -6.147907257080078, "global_step": 84278, "epoch": 2006} {"train_loss": -6.082216262817383, "global_step": 84279, "epoch": 2006} {"train_loss": -6.1983537673950195, "global_step": 84280, "epoch": 2006} {"train_loss": -6.203704833984375, "global_step": 84281, "epoch": 2006} {"train_loss": -6.207900524139404, "global_step": 84282, "epoch": 2006} {"train_loss": -6.108712196350098, "global_step": 84283, "epoch": 2006} {"train_loss": -6.19553279876709, "global_step": 84284, "epoch": 2006} {"train_loss": -6.113280773162842, "global_step": 84285, "epoch": 2006} {"train_loss": -5.993814468383789, "global_step": 84286, "epoch": 2006} {"train_loss": -6.214822292327881, "global_step": 84287, "epoch": 2006} {"train_loss": -6.22313117980957, "global_step": 84288, "epoch": 2006} {"train_loss": -6.141382217407227, "global_step": 84289, "epoch": 2006} {"train_loss": -6.227855682373047, "global_step": 84290, "epoch": 2006} {"train_loss": -6.166947364807129, "global_step": 84291, "epoch": 2006} {"train_loss": -6.119912147521973, "global_step": 84292, "epoch": 2006} {"train_loss": -6.177111262366886, "global_step": 84293, "epoch": 2006, "val_loss": 67889.625} {"train_loss": -6.057573318481445, "global_step": 84294, "epoch": 2007} {"train_loss": -6.130270004272461, "global_step": 84295, "epoch": 2007} {"train_loss": -6.172133922576904, "global_step": 84296, "epoch": 2007} {"train_loss": -6.146761894226074, "global_step": 84297, "epoch": 2007} {"train_loss": -6.175458908081055, "global_step": 84298, "epoch": 2007} {"train_loss": -5.963184356689453, "global_step": 84299, "epoch": 2007} {"train_loss": -6.178192138671875, "global_step": 84300, "epoch": 2007} {"train_loss": -6.136585235595703, "global_step": 84301, "epoch": 2007} {"train_loss": -6.068081855773926, "global_step": 84302, "epoch": 2007} {"train_loss": -6.1405534744262695, "global_step": 84303, "epoch": 2007} {"train_loss": -6.096127986907959, "global_step": 84304, "epoch": 2007} {"train_loss": -6.167732238769531, "global_step": 84305, "epoch": 2007} {"train_loss": -6.080595970153809, "global_step": 84306, "epoch": 2007} {"train_loss": -6.103924751281738, "global_step": 84307, "epoch": 2007} {"train_loss": -6.252099990844727, "global_step": 84308, "epoch": 2007} {"train_loss": -6.129323482513428, "global_step": 84309, "epoch": 2007} {"train_loss": -6.168487548828125, "global_step": 84310, "epoch": 2007} {"train_loss": -6.239314079284668, "global_step": 84311, "epoch": 2007} {"train_loss": -6.101434707641602, "global_step": 84312, "epoch": 2007} {"train_loss": -6.162902355194092, "global_step": 84313, "epoch": 2007} {"train_loss": -6.095290184020996, "global_step": 84314, "epoch": 2007} {"train_loss": -6.139163970947266, "global_step": 84315, "epoch": 2007} {"train_loss": -6.175891399383545, "global_step": 84316, "epoch": 2007} {"train_loss": -6.181417465209961, "global_step": 84317, "epoch": 2007} {"train_loss": -6.015312194824219, "global_step": 84318, "epoch": 2007} {"train_loss": -6.084890365600586, "global_step": 84319, "epoch": 2007} {"train_loss": -6.227267265319824, "global_step": 84320, "epoch": 2007} {"train_loss": -6.028069496154785, "global_step": 84321, "epoch": 2007} {"train_loss": -6.111865520477295, "global_step": 84322, "epoch": 2007} {"train_loss": -6.059656143188477, "global_step": 84323, "epoch": 2007} {"train_loss": -6.133740425109863, "global_step": 84324, "epoch": 2007} {"train_loss": -6.181437015533447, "global_step": 84325, "epoch": 2007} {"train_loss": -6.120424270629883, "global_step": 84326, "epoch": 2007} {"train_loss": -6.1729302406311035, "global_step": 84327, "epoch": 2007} {"train_loss": -6.062625885009766, "global_step": 84328, "epoch": 2007} {"train_loss": -6.198952674865723, "global_step": 84329, "epoch": 2007} {"train_loss": -5.965444564819336, "global_step": 84330, "epoch": 2007} {"train_loss": -6.1698455810546875, "global_step": 84331, "epoch": 2007} {"train_loss": -6.14631986618042, "global_step": 84332, "epoch": 2007} {"train_loss": -6.095732688903809, "global_step": 84333, "epoch": 2007} {"train_loss": -6.242700576782227, "global_step": 84334, "epoch": 2007} {"train_loss": -6.129365659895397, "global_step": 84335, "epoch": 2007, "val_loss": 67750.75} {"train_loss": -6.227043628692627, "global_step": 84336, "epoch": 2008} {"train_loss": -6.244059085845947, "global_step": 84337, "epoch": 2008} {"train_loss": -6.169647693634033, "global_step": 84338, "epoch": 2008} {"train_loss": -6.211406707763672, "global_step": 84339, "epoch": 2008} {"train_loss": -6.14661979675293, "global_step": 84340, "epoch": 2008} {"train_loss": -6.160886287689209, "global_step": 84341, "epoch": 2008} {"train_loss": -6.141569137573242, "global_step": 84342, "epoch": 2008} {"train_loss": -6.237103462219238, "global_step": 84343, "epoch": 2008} {"train_loss": -6.162635326385498, "global_step": 84344, "epoch": 2008} {"train_loss": -6.088467597961426, "global_step": 84345, "epoch": 2008} {"train_loss": -6.26632022857666, "global_step": 84346, "epoch": 2008} {"train_loss": -6.203639984130859, "global_step": 84347, "epoch": 2008} {"train_loss": -6.1781110763549805, "global_step": 84348, "epoch": 2008} {"train_loss": -6.160100936889648, "global_step": 84349, "epoch": 2008} {"train_loss": -6.20558500289917, "global_step": 84350, "epoch": 2008} {"train_loss": -6.224339485168457, "global_step": 84351, "epoch": 2008} {"train_loss": -6.17249870300293, "global_step": 84352, "epoch": 2008} {"train_loss": -6.2064208984375, "global_step": 84353, "epoch": 2008} {"train_loss": -6.120619297027588, "global_step": 84354, "epoch": 2008} {"train_loss": -6.1248650550842285, "global_step": 84355, "epoch": 2008} {"train_loss": -6.2633514404296875, "global_step": 84356, "epoch": 2008} {"train_loss": -6.201114654541016, "global_step": 84357, "epoch": 2008} {"train_loss": -6.143550872802734, "global_step": 84358, "epoch": 2008} {"train_loss": -6.262032508850098, "global_step": 84359, "epoch": 2008} {"train_loss": -6.199871063232422, "global_step": 84360, "epoch": 2008} {"train_loss": -6.162636756896973, "global_step": 84361, "epoch": 2008} {"train_loss": -6.152353286743164, "global_step": 84362, "epoch": 2008} {"train_loss": -6.198330879211426, "global_step": 84363, "epoch": 2008} {"train_loss": -6.114288806915283, "global_step": 84364, "epoch": 2008} {"train_loss": -6.165979862213135, "global_step": 84365, "epoch": 2008} {"train_loss": -6.155538558959961, "global_step": 84366, "epoch": 2008} {"train_loss": -6.195822238922119, "global_step": 84367, "epoch": 2008} {"train_loss": -6.133307933807373, "global_step": 84368, "epoch": 2008} {"train_loss": -6.141855716705322, "global_step": 84369, "epoch": 2008} {"train_loss": -6.058743476867676, "global_step": 84370, "epoch": 2008} {"train_loss": -6.190857887268066, "global_step": 84371, "epoch": 2008} {"train_loss": -6.254817962646484, "global_step": 84372, "epoch": 2008} {"train_loss": -6.214078903198242, "global_step": 84373, "epoch": 2008} {"train_loss": -6.281002044677734, "global_step": 84374, "epoch": 2008} {"train_loss": -6.21146821975708, "global_step": 84375, "epoch": 2008} {"train_loss": -6.1598920822143555, "global_step": 84376, "epoch": 2008} {"train_loss": -6.183728513263521, "global_step": 84377, "epoch": 2008, "val_loss": 67827.8203125} {"train_loss": -6.188749313354492, "global_step": 84378, "epoch": 2009} {"train_loss": -6.112147808074951, "global_step": 84379, "epoch": 2009} {"train_loss": -6.326808929443359, "global_step": 84380, "epoch": 2009} {"train_loss": -6.101626396179199, "global_step": 84381, "epoch": 2009} {"train_loss": -6.177099704742432, "global_step": 84382, "epoch": 2009} {"train_loss": -6.208124160766602, "global_step": 84383, "epoch": 2009} {"train_loss": -6.196545600891113, "global_step": 84384, "epoch": 2009} {"train_loss": -6.19294548034668, "global_step": 84385, "epoch": 2009} {"train_loss": -6.282271385192871, "global_step": 84386, "epoch": 2009} {"train_loss": -6.1630072593688965, "global_step": 84387, "epoch": 2009} {"train_loss": -6.121713638305664, "global_step": 84388, "epoch": 2009} {"train_loss": -6.278341770172119, "global_step": 84389, "epoch": 2009} {"train_loss": -6.240785598754883, "global_step": 84390, "epoch": 2009} {"train_loss": -6.193140029907227, "global_step": 84391, "epoch": 2009} {"train_loss": -6.212799072265625, "global_step": 84392, "epoch": 2009} {"train_loss": -5.999810218811035, "global_step": 84393, "epoch": 2009} {"train_loss": -6.202935695648193, "global_step": 84394, "epoch": 2009} {"train_loss": -6.007773399353027, "global_step": 84395, "epoch": 2009} {"train_loss": -6.124361038208008, "global_step": 84396, "epoch": 2009} {"train_loss": -6.2250847816467285, "global_step": 84397, "epoch": 2009} {"train_loss": -6.226476669311523, "global_step": 84398, "epoch": 2009} {"train_loss": -5.983409881591797, "global_step": 84399, "epoch": 2009} {"train_loss": -6.1531476974487305, "global_step": 84400, "epoch": 2009} {"train_loss": -6.250885963439941, "global_step": 84401, "epoch": 2009} {"train_loss": -6.101440906524658, "global_step": 84402, "epoch": 2009} {"train_loss": -6.171648025512695, "global_step": 84403, "epoch": 2009} {"train_loss": -6.1053466796875, "global_step": 84404, "epoch": 2009} {"train_loss": -6.245018005371094, "global_step": 84405, "epoch": 2009} {"train_loss": -6.326589107513428, "global_step": 84406, "epoch": 2009} {"train_loss": -6.247500419616699, "global_step": 84407, "epoch": 2009} {"train_loss": -6.186163902282715, "global_step": 84408, "epoch": 2009} {"train_loss": -6.180840492248535, "global_step": 84409, "epoch": 2009} {"train_loss": -6.162138938903809, "global_step": 84410, "epoch": 2009} {"train_loss": -6.121478080749512, "global_step": 84411, "epoch": 2009} {"train_loss": -6.188850402832031, "global_step": 84412, "epoch": 2009} {"train_loss": -6.093828201293945, "global_step": 84413, "epoch": 2009} {"train_loss": -6.1996259689331055, "global_step": 84414, "epoch": 2009} {"train_loss": -6.080982685089111, "global_step": 84415, "epoch": 2009} {"train_loss": -6.06348991394043, "global_step": 84416, "epoch": 2009} {"train_loss": -6.063241958618164, "global_step": 84417, "epoch": 2009} {"train_loss": -6.018364906311035, "global_step": 84418, "epoch": 2009} {"train_loss": -6.1648835227603005, "global_step": 84419, "epoch": 2009, "val_loss": 68109.984375} {"train_loss": -6.038285255432129, "global_step": 84420, "epoch": 2010} {"train_loss": -6.117439270019531, "global_step": 84421, "epoch": 2010} {"train_loss": -6.1628007888793945, "global_step": 84422, "epoch": 2010} {"train_loss": -6.037384986877441, "global_step": 84423, "epoch": 2010} {"train_loss": -6.198830604553223, "global_step": 84424, "epoch": 2010} {"train_loss": -6.104283332824707, "global_step": 84425, "epoch": 2010} {"train_loss": -6.099431991577148, "global_step": 84426, "epoch": 2010} {"train_loss": -6.112977981567383, "global_step": 84427, "epoch": 2010} {"train_loss": -6.04215669631958, "global_step": 84428, "epoch": 2010} {"train_loss": -6.00718879699707, "global_step": 84429, "epoch": 2010} {"train_loss": -6.059854030609131, "global_step": 84430, "epoch": 2010} {"train_loss": -6.128755569458008, "global_step": 84431, "epoch": 2010} {"train_loss": -6.157796859741211, "global_step": 84432, "epoch": 2010} {"train_loss": -6.254565238952637, "global_step": 84433, "epoch": 2010} {"train_loss": -6.196403503417969, "global_step": 84434, "epoch": 2010} {"train_loss": -6.05277156829834, "global_step": 84435, "epoch": 2010} {"train_loss": -6.1147050857543945, "global_step": 84436, "epoch": 2010} {"train_loss": -6.29212760925293, "global_step": 84437, "epoch": 2010} {"train_loss": -6.212817192077637, "global_step": 84438, "epoch": 2010} {"train_loss": -6.215755462646484, "global_step": 84439, "epoch": 2010} {"train_loss": -6.164333820343018, "global_step": 84440, "epoch": 2010} {"train_loss": -6.048305988311768, "global_step": 84441, "epoch": 2010} {"train_loss": -6.101899147033691, "global_step": 84442, "epoch": 2010} {"train_loss": -6.160497188568115, "global_step": 84443, "epoch": 2010} {"train_loss": -6.0860795974731445, "global_step": 84444, "epoch": 2010} {"train_loss": -6.160120010375977, "global_step": 84445, "epoch": 2010} {"train_loss": -6.128975868225098, "global_step": 84446, "epoch": 2010} {"train_loss": -6.105623722076416, "global_step": 84447, "epoch": 2010} {"train_loss": -6.083776473999023, "global_step": 84448, "epoch": 2010} {"train_loss": -6.072833061218262, "global_step": 84449, "epoch": 2010} {"train_loss": -6.112565994262695, "global_step": 84450, "epoch": 2010} {"train_loss": -6.039127826690674, "global_step": 84451, "epoch": 2010} {"train_loss": -6.102972507476807, "global_step": 84452, "epoch": 2010} {"train_loss": -6.153533935546875, "global_step": 84453, "epoch": 2010} {"train_loss": -6.077089309692383, "global_step": 84454, "epoch": 2010} {"train_loss": -6.133033275604248, "global_step": 84455, "epoch": 2010} {"train_loss": -6.171639442443848, "global_step": 84456, "epoch": 2010} {"train_loss": -6.115849494934082, "global_step": 84457, "epoch": 2010} {"train_loss": -6.195547103881836, "global_step": 84458, "epoch": 2010} {"train_loss": -6.101231575012207, "global_step": 84459, "epoch": 2010} {"train_loss": -6.169410705566406, "global_step": 84460, "epoch": 2010} {"train_loss": -6.126001210439773, "global_step": 84461, "epoch": 2010, "val_loss": 67813.171875} {"train_loss": -6.155616283416748, "global_step": 84462, "epoch": 2011} {"train_loss": -6.10214900970459, "global_step": 84463, "epoch": 2011} {"train_loss": -6.154778480529785, "global_step": 84464, "epoch": 2011} {"train_loss": -6.130281925201416, "global_step": 84465, "epoch": 2011} {"train_loss": -6.286757946014404, "global_step": 84466, "epoch": 2011} {"train_loss": -6.193966388702393, "global_step": 84467, "epoch": 2011} {"train_loss": -6.21513557434082, "global_step": 84468, "epoch": 2011} {"train_loss": -6.159696578979492, "global_step": 84469, "epoch": 2011} {"train_loss": -6.082451343536377, "global_step": 84470, "epoch": 2011} {"train_loss": -6.158487319946289, "global_step": 84471, "epoch": 2011} {"train_loss": -6.145082473754883, "global_step": 84472, "epoch": 2011} {"train_loss": -6.219135284423828, "global_step": 84473, "epoch": 2011} {"train_loss": -6.252603530883789, "global_step": 84474, "epoch": 2011} {"train_loss": -6.1239519119262695, "global_step": 84475, "epoch": 2011} {"train_loss": -6.298494338989258, "global_step": 84476, "epoch": 2011} {"train_loss": -6.1002912521362305, "global_step": 84477, "epoch": 2011} {"train_loss": -6.200412750244141, "global_step": 84478, "epoch": 2011} {"train_loss": -6.2426652908325195, "global_step": 84479, "epoch": 2011} {"train_loss": -6.170520782470703, "global_step": 84480, "epoch": 2011} {"train_loss": -6.186751842498779, "global_step": 84481, "epoch": 2011} {"train_loss": -6.1551923751831055, "global_step": 84482, "epoch": 2011} {"train_loss": -6.1043267250061035, "global_step": 84483, "epoch": 2011} {"train_loss": -6.086418151855469, "global_step": 84484, "epoch": 2011} {"train_loss": -6.138609886169434, "global_step": 84485, "epoch": 2011} {"train_loss": -6.151711463928223, "global_step": 84486, "epoch": 2011} {"train_loss": -6.205948352813721, "global_step": 84487, "epoch": 2011} {"train_loss": -6.294568061828613, "global_step": 84488, "epoch": 2011} {"train_loss": -6.160340309143066, "global_step": 84489, "epoch": 2011} {"train_loss": -6.2304182052612305, "global_step": 84490, "epoch": 2011} {"train_loss": -6.2046403884887695, "global_step": 84491, "epoch": 2011} {"train_loss": -6.162083625793457, "global_step": 84492, "epoch": 2011} {"train_loss": -6.1465559005737305, "global_step": 84493, "epoch": 2011} {"train_loss": -6.229989051818848, "global_step": 84494, "epoch": 2011} {"train_loss": -6.078650951385498, "global_step": 84495, "epoch": 2011} {"train_loss": -6.036764144897461, "global_step": 84496, "epoch": 2011} {"train_loss": -6.162477493286133, "global_step": 84497, "epoch": 2011} {"train_loss": -6.009390354156494, "global_step": 84498, "epoch": 2011} {"train_loss": -6.099457740783691, "global_step": 84499, "epoch": 2011} {"train_loss": -6.141592502593994, "global_step": 84500, "epoch": 2011} {"train_loss": -6.147465705871582, "global_step": 84501, "epoch": 2011} {"train_loss": -6.166218280792236, "global_step": 84502, "epoch": 2011} {"train_loss": -6.160985469818115, "global_step": 84503, "epoch": 2011, "val_loss": 67723.703125} {"train_loss": -6.069074630737305, "global_step": 84504, "epoch": 2012} {"train_loss": -6.255338668823242, "global_step": 84505, "epoch": 2012} {"train_loss": -6.137209415435791, "global_step": 84506, "epoch": 2012} {"train_loss": -6.1877899169921875, "global_step": 84507, "epoch": 2012} {"train_loss": -6.040278434753418, "global_step": 84508, "epoch": 2012} {"train_loss": -6.166374206542969, "global_step": 84509, "epoch": 2012} {"train_loss": -6.24208402633667, "global_step": 84510, "epoch": 2012} {"train_loss": -6.086134910583496, "global_step": 84511, "epoch": 2012} {"train_loss": -6.188955307006836, "global_step": 84512, "epoch": 2012} {"train_loss": -6.211218357086182, "global_step": 84513, "epoch": 2012} {"train_loss": -6.254266262054443, "global_step": 84514, "epoch": 2012} {"train_loss": -6.175107479095459, "global_step": 84515, "epoch": 2012} {"train_loss": -6.127152442932129, "global_step": 84516, "epoch": 2012} {"train_loss": -6.161541938781738, "global_step": 84517, "epoch": 2012} {"train_loss": -6.066256046295166, "global_step": 84518, "epoch": 2012} {"train_loss": -6.154356479644775, "global_step": 84519, "epoch": 2012} {"train_loss": -6.255771636962891, "global_step": 84520, "epoch": 2012} {"train_loss": -6.2105560302734375, "global_step": 84521, "epoch": 2012} {"train_loss": -6.095555305480957, "global_step": 84522, "epoch": 2012} {"train_loss": -6.278292179107666, "global_step": 84523, "epoch": 2012} {"train_loss": -6.180696487426758, "global_step": 84524, "epoch": 2012} {"train_loss": -6.159287929534912, "global_step": 84525, "epoch": 2012} {"train_loss": -6.18480110168457, "global_step": 84526, "epoch": 2012} {"train_loss": -6.1444292068481445, "global_step": 84527, "epoch": 2012} {"train_loss": -6.226960182189941, "global_step": 84528, "epoch": 2012} {"train_loss": -6.120221138000488, "global_step": 84529, "epoch": 2012} {"train_loss": -6.118766784667969, "global_step": 84530, "epoch": 2012} {"train_loss": -6.284109115600586, "global_step": 84531, "epoch": 2012} {"train_loss": -6.199186325073242, "global_step": 84532, "epoch": 2012} {"train_loss": -6.1887102127075195, "global_step": 84533, "epoch": 2012} {"train_loss": -6.176407337188721, "global_step": 84534, "epoch": 2012} {"train_loss": -6.243687629699707, "global_step": 84535, "epoch": 2012} {"train_loss": -6.220679759979248, "global_step": 84536, "epoch": 2012} {"train_loss": -6.232204437255859, "global_step": 84537, "epoch": 2012} {"train_loss": -6.3549089431762695, "global_step": 84538, "epoch": 2012} {"train_loss": -6.196348190307617, "global_step": 84539, "epoch": 2012} {"train_loss": -6.154435634613037, "global_step": 84540, "epoch": 2012} {"train_loss": -6.164497375488281, "global_step": 84541, "epoch": 2012} {"train_loss": -6.1552581787109375, "global_step": 84542, "epoch": 2012} {"train_loss": -6.151412010192871, "global_step": 84543, "epoch": 2012} {"train_loss": -6.202199935913086, "global_step": 84544, "epoch": 2012} {"train_loss": -6.183193797156925, "global_step": 84545, "epoch": 2012, "val_loss": 67862.2734375} {"train_loss": -6.064451217651367, "global_step": 84546, "epoch": 2013} {"train_loss": -6.289897441864014, "global_step": 84547, "epoch": 2013} {"train_loss": -6.147830963134766, "global_step": 84548, "epoch": 2013} {"train_loss": -6.295854568481445, "global_step": 84549, "epoch": 2013} {"train_loss": -6.203448295593262, "global_step": 84550, "epoch": 2013} {"train_loss": -6.233729362487793, "global_step": 84551, "epoch": 2013} {"train_loss": -6.252898216247559, "global_step": 84552, "epoch": 2013} {"train_loss": -6.2340474128723145, "global_step": 84553, "epoch": 2013} {"train_loss": -6.2179131507873535, "global_step": 84554, "epoch": 2013} {"train_loss": -6.1004815101623535, "global_step": 84555, "epoch": 2013} {"train_loss": -6.1716532707214355, "global_step": 84556, "epoch": 2013} {"train_loss": -6.208289623260498, "global_step": 84557, "epoch": 2013} {"train_loss": -6.145099639892578, "global_step": 84558, "epoch": 2013} {"train_loss": -6.2236785888671875, "global_step": 84559, "epoch": 2013} {"train_loss": -6.291630744934082, "global_step": 84560, "epoch": 2013} {"train_loss": -6.23731803894043, "global_step": 84561, "epoch": 2013} {"train_loss": -6.246245861053467, "global_step": 84562, "epoch": 2013} {"train_loss": -6.197303771972656, "global_step": 84563, "epoch": 2013} {"train_loss": -6.255335330963135, "global_step": 84564, "epoch": 2013} {"train_loss": -6.1515583992004395, "global_step": 84565, "epoch": 2013} {"train_loss": -6.210341453552246, "global_step": 84566, "epoch": 2013} {"train_loss": -6.227663993835449, "global_step": 84567, "epoch": 2013} {"train_loss": -6.025738716125488, "global_step": 84568, "epoch": 2013} {"train_loss": -6.104930877685547, "global_step": 84569, "epoch": 2013} {"train_loss": -6.079660415649414, "global_step": 84570, "epoch": 2013} {"train_loss": -6.240879058837891, "global_step": 84571, "epoch": 2013} {"train_loss": -6.185487270355225, "global_step": 84572, "epoch": 2013} {"train_loss": -6.143755912780762, "global_step": 84573, "epoch": 2013} {"train_loss": -6.20273494720459, "global_step": 84574, "epoch": 2013} {"train_loss": -6.2059526443481445, "global_step": 84575, "epoch": 2013} {"train_loss": -6.217172622680664, "global_step": 84576, "epoch": 2013} {"train_loss": -6.298314571380615, "global_step": 84577, "epoch": 2013} {"train_loss": -6.196897506713867, "global_step": 84578, "epoch": 2013} {"train_loss": -6.099035263061523, "global_step": 84579, "epoch": 2013} {"train_loss": -6.328329086303711, "global_step": 84580, "epoch": 2013} {"train_loss": -6.235648155212402, "global_step": 84581, "epoch": 2013} {"train_loss": -6.201725959777832, "global_step": 84582, "epoch": 2013} {"train_loss": -6.107952117919922, "global_step": 84583, "epoch": 2013} {"train_loss": -6.260647296905518, "global_step": 84584, "epoch": 2013} {"train_loss": -6.303499221801758, "global_step": 84585, "epoch": 2013} {"train_loss": -6.188366889953613, "global_step": 84586, "epoch": 2013} {"train_loss": -6.202991213117327, "global_step": 84587, "epoch": 2013, "val_loss": 67602.9921875} {"train_loss": -6.189757347106934, "global_step": 84588, "epoch": 2014} {"train_loss": -6.291996955871582, "global_step": 84589, "epoch": 2014} {"train_loss": -6.135522365570068, "global_step": 84590, "epoch": 2014} {"train_loss": -6.221212387084961, "global_step": 84591, "epoch": 2014} {"train_loss": -6.13094425201416, "global_step": 84592, "epoch": 2014} {"train_loss": -6.26127290725708, "global_step": 84593, "epoch": 2014} {"train_loss": -6.257988452911377, "global_step": 84594, "epoch": 2014} {"train_loss": -6.3443450927734375, "global_step": 84595, "epoch": 2014} {"train_loss": -6.037615776062012, "global_step": 84596, "epoch": 2014} {"train_loss": -6.1211934089660645, "global_step": 84597, "epoch": 2014} {"train_loss": -6.1152753829956055, "global_step": 84598, "epoch": 2014} {"train_loss": -6.20994234085083, "global_step": 84599, "epoch": 2014} {"train_loss": -6.175209045410156, "global_step": 84600, "epoch": 2014} {"train_loss": -6.128077507019043, "global_step": 84601, "epoch": 2014} {"train_loss": -6.170535564422607, "global_step": 84602, "epoch": 2014} {"train_loss": -6.180935859680176, "global_step": 84603, "epoch": 2014} {"train_loss": -6.092911720275879, "global_step": 84604, "epoch": 2014} {"train_loss": -6.192719459533691, "global_step": 84605, "epoch": 2014} {"train_loss": -6.193592071533203, "global_step": 84606, "epoch": 2014} {"train_loss": -6.114917755126953, "global_step": 84607, "epoch": 2014} {"train_loss": -6.170122146606445, "global_step": 84608, "epoch": 2014} {"train_loss": -6.279443740844727, "global_step": 84609, "epoch": 2014} {"train_loss": -6.161083698272705, "global_step": 84610, "epoch": 2014} {"train_loss": -6.25074577331543, "global_step": 84611, "epoch": 2014} {"train_loss": -6.1448259353637695, "global_step": 84612, "epoch": 2014} {"train_loss": -6.2687578201293945, "global_step": 84613, "epoch": 2014} {"train_loss": -6.225728988647461, "global_step": 84614, "epoch": 2014} {"train_loss": -6.079830169677734, "global_step": 84615, "epoch": 2014} {"train_loss": -6.131758213043213, "global_step": 84616, "epoch": 2014} {"train_loss": -6.1997809410095215, "global_step": 84617, "epoch": 2014} {"train_loss": -6.231514930725098, "global_step": 84618, "epoch": 2014} {"train_loss": -6.29116153717041, "global_step": 84619, "epoch": 2014} {"train_loss": -6.295198440551758, "global_step": 84620, "epoch": 2014} {"train_loss": -6.162796974182129, "global_step": 84621, "epoch": 2014} {"train_loss": -6.272026062011719, "global_step": 84622, "epoch": 2014} {"train_loss": -6.200770378112793, "global_step": 84623, "epoch": 2014} {"train_loss": -6.312041759490967, "global_step": 84624, "epoch": 2014} {"train_loss": -6.065064430236816, "global_step": 84625, "epoch": 2014} {"train_loss": -6.130147933959961, "global_step": 84626, "epoch": 2014} {"train_loss": -6.103329181671143, "global_step": 84627, "epoch": 2014} {"train_loss": -6.188176155090332, "global_step": 84628, "epoch": 2014} {"train_loss": -6.186347371055966, "global_step": 84629, "epoch": 2014, "val_loss": 67855.84375} {"train_loss": -6.281669616699219, "global_step": 84630, "epoch": 2015} {"train_loss": -6.111123561859131, "global_step": 84631, "epoch": 2015} {"train_loss": -6.134157657623291, "global_step": 84632, "epoch": 2015} {"train_loss": -6.067607879638672, "global_step": 84633, "epoch": 2015} {"train_loss": -6.031877517700195, "global_step": 84634, "epoch": 2015} {"train_loss": -6.064264297485352, "global_step": 84635, "epoch": 2015} {"train_loss": -6.095800876617432, "global_step": 84636, "epoch": 2015} {"train_loss": -6.1917619705200195, "global_step": 84637, "epoch": 2015} {"train_loss": -6.0652666091918945, "global_step": 84638, "epoch": 2015} {"train_loss": -6.177339553833008, "global_step": 84639, "epoch": 2015} {"train_loss": -6.2160563468933105, "global_step": 84640, "epoch": 2015} {"train_loss": -6.160773754119873, "global_step": 84641, "epoch": 2015} {"train_loss": -6.183387756347656, "global_step": 84642, "epoch": 2015} {"train_loss": -6.144136905670166, "global_step": 84643, "epoch": 2015} {"train_loss": -6.195916175842285, "global_step": 84644, "epoch": 2015} {"train_loss": -6.244021892547607, "global_step": 84645, "epoch": 2015} {"train_loss": -6.100812911987305, "global_step": 84646, "epoch": 2015} {"train_loss": -6.187527179718018, "global_step": 84647, "epoch": 2015} {"train_loss": -6.2292022705078125, "global_step": 84648, "epoch": 2015} {"train_loss": -6.201663017272949, "global_step": 84649, "epoch": 2015} {"train_loss": -6.196640968322754, "global_step": 84650, "epoch": 2015} {"train_loss": -6.128326892852783, "global_step": 84651, "epoch": 2015} {"train_loss": -6.210371971130371, "global_step": 84652, "epoch": 2015} {"train_loss": -6.165554046630859, "global_step": 84653, "epoch": 2015} {"train_loss": -6.1005635261535645, "global_step": 84654, "epoch": 2015} {"train_loss": -6.26152229309082, "global_step": 84655, "epoch": 2015} {"train_loss": -6.244475364685059, "global_step": 84656, "epoch": 2015} {"train_loss": -6.171731948852539, "global_step": 84657, "epoch": 2015} {"train_loss": -6.293436527252197, "global_step": 84658, "epoch": 2015} {"train_loss": -6.128576755523682, "global_step": 84659, "epoch": 2015} {"train_loss": -6.254194259643555, "global_step": 84660, "epoch": 2015} {"train_loss": -6.194016456604004, "global_step": 84661, "epoch": 2015} {"train_loss": -6.094208717346191, "global_step": 84662, "epoch": 2015} {"train_loss": -6.243237495422363, "global_step": 84663, "epoch": 2015} {"train_loss": -6.245955467224121, "global_step": 84664, "epoch": 2015} {"train_loss": -6.2884602546691895, "global_step": 84665, "epoch": 2015} {"train_loss": -6.01815128326416, "global_step": 84666, "epoch": 2015} {"train_loss": -6.010896682739258, "global_step": 84667, "epoch": 2015} {"train_loss": -6.170954704284668, "global_step": 84668, "epoch": 2015} {"train_loss": -6.079352855682373, "global_step": 84669, "epoch": 2015} {"train_loss": -6.131017684936523, "global_step": 84670, "epoch": 2015} {"train_loss": -6.165423597608294, "global_step": 84671, "epoch": 2015, "val_loss": 67931.3046875} {"train_loss": -6.147459030151367, "global_step": 84672, "epoch": 2016} {"train_loss": -6.089931488037109, "global_step": 84673, "epoch": 2016} {"train_loss": -6.283253192901611, "global_step": 84674, "epoch": 2016} {"train_loss": -6.098607063293457, "global_step": 84675, "epoch": 2016} {"train_loss": -6.101637363433838, "global_step": 84676, "epoch": 2016} {"train_loss": -6.296692848205566, "global_step": 84677, "epoch": 2016} {"train_loss": -6.219003677368164, "global_step": 84678, "epoch": 2016} {"train_loss": -6.108983993530273, "global_step": 84679, "epoch": 2016} {"train_loss": -6.105981349945068, "global_step": 84680, "epoch": 2016} {"train_loss": -6.308358192443848, "global_step": 84681, "epoch": 2016} {"train_loss": -6.246438026428223, "global_step": 84682, "epoch": 2016} {"train_loss": -6.127133846282959, "global_step": 84683, "epoch": 2016} {"train_loss": -6.310971260070801, "global_step": 84684, "epoch": 2016} {"train_loss": -6.232346534729004, "global_step": 84685, "epoch": 2016} {"train_loss": -6.298521041870117, "global_step": 84686, "epoch": 2016} {"train_loss": -6.236489295959473, "global_step": 84687, "epoch": 2016} {"train_loss": -6.2596330642700195, "global_step": 84688, "epoch": 2016} {"train_loss": -6.202174186706543, "global_step": 84689, "epoch": 2016} {"train_loss": -6.218300819396973, "global_step": 84690, "epoch": 2016} {"train_loss": -6.175558567047119, "global_step": 84691, "epoch": 2016} {"train_loss": -6.243151664733887, "global_step": 84692, "epoch": 2016} {"train_loss": -6.260097503662109, "global_step": 84693, "epoch": 2016} {"train_loss": -6.186310291290283, "global_step": 84694, "epoch": 2016} {"train_loss": -6.169321537017822, "global_step": 84695, "epoch": 2016} {"train_loss": -6.226321220397949, "global_step": 84696, "epoch": 2016} {"train_loss": -6.183163642883301, "global_step": 84697, "epoch": 2016} {"train_loss": -6.130335807800293, "global_step": 84698, "epoch": 2016} {"train_loss": -6.270013332366943, "global_step": 84699, "epoch": 2016} {"train_loss": -6.217572212219238, "global_step": 84700, "epoch": 2016} {"train_loss": -6.162588119506836, "global_step": 84701, "epoch": 2016} {"train_loss": -6.1714959144592285, "global_step": 84702, "epoch": 2016} {"train_loss": -6.170506477355957, "global_step": 84703, "epoch": 2016} {"train_loss": -6.161282539367676, "global_step": 84704, "epoch": 2016} {"train_loss": -6.2331438064575195, "global_step": 84705, "epoch": 2016} {"train_loss": -6.210235595703125, "global_step": 84706, "epoch": 2016} {"train_loss": -6.161801815032959, "global_step": 84707, "epoch": 2016} {"train_loss": -6.207653999328613, "global_step": 84708, "epoch": 2016} {"train_loss": -6.201789379119873, "global_step": 84709, "epoch": 2016} {"train_loss": -6.169498443603516, "global_step": 84710, "epoch": 2016} {"train_loss": -6.107891082763672, "global_step": 84711, "epoch": 2016} {"train_loss": -6.122015953063965, "global_step": 84712, "epoch": 2016} {"train_loss": -6.19336994489034, "global_step": 84713, "epoch": 2016, "val_loss": 67944.359375} {"train_loss": -6.194488048553467, "global_step": 84714, "epoch": 2017} {"train_loss": -6.1822404861450195, "global_step": 84715, "epoch": 2017} {"train_loss": -6.141102313995361, "global_step": 84716, "epoch": 2017} {"train_loss": -6.155574798583984, "global_step": 84717, "epoch": 2017} {"train_loss": -6.207760810852051, "global_step": 84718, "epoch": 2017} {"train_loss": -6.222844123840332, "global_step": 84719, "epoch": 2017} {"train_loss": -6.068300247192383, "global_step": 84720, "epoch": 2017} {"train_loss": -6.142068862915039, "global_step": 84721, "epoch": 2017} {"train_loss": -6.161654949188232, "global_step": 84722, "epoch": 2017} {"train_loss": -6.127702236175537, "global_step": 84723, "epoch": 2017} {"train_loss": -6.0728936195373535, "global_step": 84724, "epoch": 2017} {"train_loss": -6.159472465515137, "global_step": 84725, "epoch": 2017} {"train_loss": -6.07279634475708, "global_step": 84726, "epoch": 2017} {"train_loss": -6.181543350219727, "global_step": 84727, "epoch": 2017} {"train_loss": -6.137670993804932, "global_step": 84728, "epoch": 2017} {"train_loss": -6.139674186706543, "global_step": 84729, "epoch": 2017} {"train_loss": -6.276066780090332, "global_step": 84730, "epoch": 2017} {"train_loss": -6.2557477951049805, "global_step": 84731, "epoch": 2017} {"train_loss": -6.191815376281738, "global_step": 84732, "epoch": 2017} {"train_loss": -6.266045570373535, "global_step": 84733, "epoch": 2017} {"train_loss": -6.157683849334717, "global_step": 84734, "epoch": 2017} {"train_loss": -6.106564998626709, "global_step": 84735, "epoch": 2017} {"train_loss": -6.171164035797119, "global_step": 84736, "epoch": 2017} {"train_loss": -6.166412353515625, "global_step": 84737, "epoch": 2017} {"train_loss": -6.2278547286987305, "global_step": 84738, "epoch": 2017} {"train_loss": -6.1267547607421875, "global_step": 84739, "epoch": 2017} {"train_loss": -6.060976982116699, "global_step": 84740, "epoch": 2017} {"train_loss": -6.138739109039307, "global_step": 84741, "epoch": 2017} {"train_loss": -6.115805625915527, "global_step": 84742, "epoch": 2017} {"train_loss": -6.232029914855957, "global_step": 84743, "epoch": 2017} {"train_loss": -6.080667972564697, "global_step": 84744, "epoch": 2017} {"train_loss": -6.209230899810791, "global_step": 84745, "epoch": 2017} {"train_loss": -6.128864288330078, "global_step": 84746, "epoch": 2017} {"train_loss": -6.110966682434082, "global_step": 84747, "epoch": 2017} {"train_loss": -6.232254505157471, "global_step": 84748, "epoch": 2017} {"train_loss": -6.250735282897949, "global_step": 84749, "epoch": 2017} {"train_loss": -6.203171730041504, "global_step": 84750, "epoch": 2017} {"train_loss": -6.078609943389893, "global_step": 84751, "epoch": 2017} {"train_loss": -6.103610992431641, "global_step": 84752, "epoch": 2017} {"train_loss": -6.155484199523926, "global_step": 84753, "epoch": 2017} {"train_loss": -6.1810078620910645, "global_step": 84754, "epoch": 2017} {"train_loss": -6.159549327123733, "global_step": 84755, "epoch": 2017, "val_loss": 67963.7421875} {"train_loss": -6.207243919372559, "global_step": 84756, "epoch": 2018} {"train_loss": -6.146328926086426, "global_step": 84757, "epoch": 2018} {"train_loss": -6.208040237426758, "global_step": 84758, "epoch": 2018} {"train_loss": -6.212671756744385, "global_step": 84759, "epoch": 2018} {"train_loss": -6.18727970123291, "global_step": 84760, "epoch": 2018} {"train_loss": -6.16995906829834, "global_step": 84761, "epoch": 2018} {"train_loss": -6.173352241516113, "global_step": 84762, "epoch": 2018} {"train_loss": -6.259206771850586, "global_step": 84763, "epoch": 2018} {"train_loss": -6.127267360687256, "global_step": 84764, "epoch": 2018} {"train_loss": -6.229342460632324, "global_step": 84765, "epoch": 2018} {"train_loss": -6.0095319747924805, "global_step": 84766, "epoch": 2018} {"train_loss": -6.293280124664307, "global_step": 84767, "epoch": 2018} {"train_loss": -6.218656539916992, "global_step": 84768, "epoch": 2018} {"train_loss": -6.092301845550537, "global_step": 84769, "epoch": 2018} {"train_loss": -6.257051467895508, "global_step": 84770, "epoch": 2018} {"train_loss": -6.15507698059082, "global_step": 84771, "epoch": 2018} {"train_loss": -6.077328681945801, "global_step": 84772, "epoch": 2018} {"train_loss": -6.163937091827393, "global_step": 84773, "epoch": 2018} {"train_loss": -6.28071403503418, "global_step": 84774, "epoch": 2018} {"train_loss": -6.199094295501709, "global_step": 84775, "epoch": 2018} {"train_loss": -6.2223100662231445, "global_step": 84776, "epoch": 2018} {"train_loss": -6.241004467010498, "global_step": 84777, "epoch": 2018} {"train_loss": -6.216808319091797, "global_step": 84778, "epoch": 2018} {"train_loss": -6.244036674499512, "global_step": 84779, "epoch": 2018} {"train_loss": -6.255475997924805, "global_step": 84780, "epoch": 2018} {"train_loss": -6.160062313079834, "global_step": 84781, "epoch": 2018} {"train_loss": -6.278461933135986, "global_step": 84782, "epoch": 2018} {"train_loss": -6.13661527633667, "global_step": 84783, "epoch": 2018} {"train_loss": -6.058111190795898, "global_step": 84784, "epoch": 2018} {"train_loss": -6.252337455749512, "global_step": 84785, "epoch": 2018} {"train_loss": -6.231508255004883, "global_step": 84786, "epoch": 2018} {"train_loss": -6.20316743850708, "global_step": 84787, "epoch": 2018} {"train_loss": -6.082261085510254, "global_step": 84788, "epoch": 2018} {"train_loss": -6.0626020431518555, "global_step": 84789, "epoch": 2018} {"train_loss": -6.2008466720581055, "global_step": 84790, "epoch": 2018} {"train_loss": -6.150712966918945, "global_step": 84791, "epoch": 2018} {"train_loss": -6.1693572998046875, "global_step": 84792, "epoch": 2018} {"train_loss": -6.02697229385376, "global_step": 84793, "epoch": 2018} {"train_loss": -6.277181625366211, "global_step": 84794, "epoch": 2018} {"train_loss": -6.144689559936523, "global_step": 84795, "epoch": 2018} {"train_loss": -6.190347671508789, "global_step": 84796, "epoch": 2018} {"train_loss": -6.181406747727167, "global_step": 84797, "epoch": 2018, "val_loss": 67684.125} {"train_loss": -6.10658073425293, "global_step": 84798, "epoch": 2019} {"train_loss": -6.221467971801758, "global_step": 84799, "epoch": 2019} {"train_loss": -6.146414756774902, "global_step": 84800, "epoch": 2019} {"train_loss": -6.228355407714844, "global_step": 84801, "epoch": 2019} {"train_loss": -6.247257709503174, "global_step": 84802, "epoch": 2019} {"train_loss": -6.2291059494018555, "global_step": 84803, "epoch": 2019} {"train_loss": -6.136756896972656, "global_step": 84804, "epoch": 2019} {"train_loss": -6.083110809326172, "global_step": 84805, "epoch": 2019} {"train_loss": -6.157607078552246, "global_step": 84806, "epoch": 2019} {"train_loss": -6.202258110046387, "global_step": 84807, "epoch": 2019} {"train_loss": -6.266497611999512, "global_step": 84808, "epoch": 2019} {"train_loss": -6.208045959472656, "global_step": 84809, "epoch": 2019} {"train_loss": -6.139410018920898, "global_step": 84810, "epoch": 2019} {"train_loss": -6.196592330932617, "global_step": 84811, "epoch": 2019} {"train_loss": -6.25396728515625, "global_step": 84812, "epoch": 2019} {"train_loss": -6.15163516998291, "global_step": 84813, "epoch": 2019} {"train_loss": -6.213207244873047, "global_step": 84814, "epoch": 2019} {"train_loss": -6.256206512451172, "global_step": 84815, "epoch": 2019} {"train_loss": -6.20605993270874, "global_step": 84816, "epoch": 2019} {"train_loss": -6.265113830566406, "global_step": 84817, "epoch": 2019} {"train_loss": -6.207060813903809, "global_step": 84818, "epoch": 2019} {"train_loss": -6.260802268981934, "global_step": 84819, "epoch": 2019} {"train_loss": -6.225121021270752, "global_step": 84820, "epoch": 2019} {"train_loss": -6.064279556274414, "global_step": 84821, "epoch": 2019} {"train_loss": -6.218731880187988, "global_step": 84822, "epoch": 2019} {"train_loss": -6.201232433319092, "global_step": 84823, "epoch": 2019} {"train_loss": -6.15131139755249, "global_step": 84824, "epoch": 2019} {"train_loss": -6.109806060791016, "global_step": 84825, "epoch": 2019} {"train_loss": -6.1964521408081055, "global_step": 84826, "epoch": 2019} {"train_loss": -6.088825225830078, "global_step": 84827, "epoch": 2019} {"train_loss": -6.146303176879883, "global_step": 84828, "epoch": 2019} {"train_loss": -6.087763786315918, "global_step": 84829, "epoch": 2019} {"train_loss": -6.2086181640625, "global_step": 84830, "epoch": 2019} {"train_loss": -6.065966606140137, "global_step": 84831, "epoch": 2019} {"train_loss": -6.100393772125244, "global_step": 84832, "epoch": 2019} {"train_loss": -6.120489120483398, "global_step": 84833, "epoch": 2019} {"train_loss": -6.1761698722839355, "global_step": 84834, "epoch": 2019} {"train_loss": -6.2430620193481445, "global_step": 84835, "epoch": 2019} {"train_loss": -6.150494575500488, "global_step": 84836, "epoch": 2019} {"train_loss": -6.201172828674316, "global_step": 84837, "epoch": 2019} {"train_loss": -6.093801498413086, "global_step": 84838, "epoch": 2019} {"train_loss": -6.17689003263201, "global_step": 84839, "epoch": 2019, "val_loss": 67851.3984375} {"train_loss": -6.117519378662109, "global_step": 84840, "epoch": 2020} {"train_loss": -6.2851409912109375, "global_step": 84841, "epoch": 2020} {"train_loss": -6.222774505615234, "global_step": 84842, "epoch": 2020} {"train_loss": -6.2149271965026855, "global_step": 84843, "epoch": 2020} {"train_loss": -6.090697765350342, "global_step": 84844, "epoch": 2020} {"train_loss": -6.173696041107178, "global_step": 84845, "epoch": 2020} {"train_loss": -6.203868865966797, "global_step": 84846, "epoch": 2020} {"train_loss": -6.261151313781738, "global_step": 84847, "epoch": 2020} {"train_loss": -6.072680473327637, "global_step": 84848, "epoch": 2020} {"train_loss": -6.169145584106445, "global_step": 84849, "epoch": 2020} {"train_loss": -6.1625471115112305, "global_step": 84850, "epoch": 2020} {"train_loss": -6.173743724822998, "global_step": 84851, "epoch": 2020} {"train_loss": -6.261446952819824, "global_step": 84852, "epoch": 2020} {"train_loss": -6.087424278259277, "global_step": 84853, "epoch": 2020} {"train_loss": -6.203283309936523, "global_step": 84854, "epoch": 2020} {"train_loss": -6.196243762969971, "global_step": 84855, "epoch": 2020} {"train_loss": -6.1258649826049805, "global_step": 84856, "epoch": 2020} {"train_loss": -6.1250996589660645, "global_step": 84857, "epoch": 2020} {"train_loss": -6.163821697235107, "global_step": 84858, "epoch": 2020} {"train_loss": -6.154687404632568, "global_step": 84859, "epoch": 2020} {"train_loss": -6.1060895919799805, "global_step": 84860, "epoch": 2020} {"train_loss": -6.081146717071533, "global_step": 84861, "epoch": 2020} {"train_loss": -6.22189474105835, "global_step": 84862, "epoch": 2020} {"train_loss": -6.017695426940918, "global_step": 84863, "epoch": 2020} {"train_loss": -6.2450385093688965, "global_step": 84864, "epoch": 2020} {"train_loss": -6.131185054779053, "global_step": 84865, "epoch": 2020} {"train_loss": -6.142606735229492, "global_step": 84866, "epoch": 2020} {"train_loss": -6.165022850036621, "global_step": 84867, "epoch": 2020} {"train_loss": -6.165998458862305, "global_step": 84868, "epoch": 2020} {"train_loss": -6.044709205627441, "global_step": 84869, "epoch": 2020} {"train_loss": -6.164783477783203, "global_step": 84870, "epoch": 2020} {"train_loss": -6.25065803527832, "global_step": 84871, "epoch": 2020} {"train_loss": -6.238922119140625, "global_step": 84872, "epoch": 2020} {"train_loss": -6.147221565246582, "global_step": 84873, "epoch": 2020} {"train_loss": -6.205663681030273, "global_step": 84874, "epoch": 2020} {"train_loss": -5.980616569519043, "global_step": 84875, "epoch": 2020} {"train_loss": -6.2443623542785645, "global_step": 84876, "epoch": 2020} {"train_loss": -6.051082611083984, "global_step": 84877, "epoch": 2020} {"train_loss": -6.243849754333496, "global_step": 84878, "epoch": 2020} {"train_loss": -6.0897626876831055, "global_step": 84879, "epoch": 2020} {"train_loss": -6.220654010772705, "global_step": 84880, "epoch": 2020} {"train_loss": -6.164959033330281, "global_step": 84881, "epoch": 2020, "val_loss": 67740.2109375} {"train_loss": -6.212410926818848, "global_step": 84882, "epoch": 2021} {"train_loss": -6.160621643066406, "global_step": 84883, "epoch": 2021} {"train_loss": -6.197624206542969, "global_step": 84884, "epoch": 2021} {"train_loss": -6.185443878173828, "global_step": 84885, "epoch": 2021} {"train_loss": -6.267740726470947, "global_step": 84886, "epoch": 2021} {"train_loss": -6.128618240356445, "global_step": 84887, "epoch": 2021} {"train_loss": -6.176509857177734, "global_step": 84888, "epoch": 2021} {"train_loss": -6.10978364944458, "global_step": 84889, "epoch": 2021} {"train_loss": -6.2359113693237305, "global_step": 84890, "epoch": 2021} {"train_loss": -6.1997880935668945, "global_step": 84891, "epoch": 2021} {"train_loss": -6.174481391906738, "global_step": 84892, "epoch": 2021} {"train_loss": -6.14198112487793, "global_step": 84893, "epoch": 2021} {"train_loss": -6.183740615844727, "global_step": 84894, "epoch": 2021} {"train_loss": -6.114325046539307, "global_step": 84895, "epoch": 2021} {"train_loss": -6.270742416381836, "global_step": 84896, "epoch": 2021} {"train_loss": -6.290322303771973, "global_step": 84897, "epoch": 2021} {"train_loss": -6.2584123611450195, "global_step": 84898, "epoch": 2021} {"train_loss": -6.094228267669678, "global_step": 84899, "epoch": 2021} {"train_loss": -6.128128528594971, "global_step": 84900, "epoch": 2021} {"train_loss": -6.202167510986328, "global_step": 84901, "epoch": 2021} {"train_loss": -6.31039571762085, "global_step": 84902, "epoch": 2021} {"train_loss": -6.06771183013916, "global_step": 84903, "epoch": 2021} {"train_loss": -6.248720169067383, "global_step": 84904, "epoch": 2021} {"train_loss": -6.067828178405762, "global_step": 84905, "epoch": 2021} {"train_loss": -6.10636043548584, "global_step": 84906, "epoch": 2021} {"train_loss": -6.180303573608398, "global_step": 84907, "epoch": 2021} {"train_loss": -6.142699241638184, "global_step": 84908, "epoch": 2021} {"train_loss": -6.168557167053223, "global_step": 84909, "epoch": 2021} {"train_loss": -6.199216842651367, "global_step": 84910, "epoch": 2021} {"train_loss": -6.062003135681152, "global_step": 84911, "epoch": 2021} {"train_loss": -6.18100643157959, "global_step": 84912, "epoch": 2021} {"train_loss": -6.193531513214111, "global_step": 84913, "epoch": 2021} {"train_loss": -6.0130934715271, "global_step": 84914, "epoch": 2021} {"train_loss": -6.209729194641113, "global_step": 84915, "epoch": 2021} {"train_loss": -5.928596019744873, "global_step": 84916, "epoch": 2021} {"train_loss": -6.148921966552734, "global_step": 84917, "epoch": 2021} {"train_loss": -6.088598251342773, "global_step": 84918, "epoch": 2021} {"train_loss": -6.118744850158691, "global_step": 84919, "epoch": 2021} {"train_loss": -6.221886157989502, "global_step": 84920, "epoch": 2021} {"train_loss": -6.140521049499512, "global_step": 84921, "epoch": 2021} {"train_loss": -6.158138275146484, "global_step": 84922, "epoch": 2021} {"train_loss": -6.163403397514706, "global_step": 84923, "epoch": 2021, "val_loss": 67988.265625} {"train_loss": -6.245621204376221, "global_step": 84924, "epoch": 2022} {"train_loss": -6.151708602905273, "global_step": 84925, "epoch": 2022} {"train_loss": -6.170989990234375, "global_step": 84926, "epoch": 2022} {"train_loss": -6.209954738616943, "global_step": 84927, "epoch": 2022} {"train_loss": -6.185178279876709, "global_step": 84928, "epoch": 2022} {"train_loss": -6.1879167556762695, "global_step": 84929, "epoch": 2022} {"train_loss": -6.138674736022949, "global_step": 84930, "epoch": 2022} {"train_loss": -6.233254432678223, "global_step": 84931, "epoch": 2022} {"train_loss": -6.181624412536621, "global_step": 84932, "epoch": 2022} {"train_loss": -6.1029558181762695, "global_step": 84933, "epoch": 2022} {"train_loss": -6.318017959594727, "global_step": 84934, "epoch": 2022} {"train_loss": -6.224189758300781, "global_step": 84935, "epoch": 2022} {"train_loss": -6.146122932434082, "global_step": 84936, "epoch": 2022} {"train_loss": -6.143132209777832, "global_step": 84937, "epoch": 2022} {"train_loss": -6.177891254425049, "global_step": 84938, "epoch": 2022} {"train_loss": -6.321868896484375, "global_step": 84939, "epoch": 2022} {"train_loss": -6.083556175231934, "global_step": 84940, "epoch": 2022} {"train_loss": -6.009780406951904, "global_step": 84941, "epoch": 2022} {"train_loss": -6.148093223571777, "global_step": 84942, "epoch": 2022} {"train_loss": -6.130988121032715, "global_step": 84943, "epoch": 2022} {"train_loss": -6.178854942321777, "global_step": 84944, "epoch": 2022} {"train_loss": -6.136711597442627, "global_step": 84945, "epoch": 2022} {"train_loss": -6.068365097045898, "global_step": 84946, "epoch": 2022} {"train_loss": -6.183460235595703, "global_step": 84947, "epoch": 2022} {"train_loss": -6.157445430755615, "global_step": 84948, "epoch": 2022} {"train_loss": -6.167834758758545, "global_step": 84949, "epoch": 2022} {"train_loss": -6.35577917098999, "global_step": 84950, "epoch": 2022} {"train_loss": -6.117281436920166, "global_step": 84951, "epoch": 2022} {"train_loss": -6.193509101867676, "global_step": 84952, "epoch": 2022} {"train_loss": -6.130999565124512, "global_step": 84953, "epoch": 2022} {"train_loss": -6.204827308654785, "global_step": 84954, "epoch": 2022} {"train_loss": -6.155396938323975, "global_step": 84955, "epoch": 2022} {"train_loss": -6.195589065551758, "global_step": 84956, "epoch": 2022} {"train_loss": -6.272260665893555, "global_step": 84957, "epoch": 2022} {"train_loss": -6.146064281463623, "global_step": 84958, "epoch": 2022} {"train_loss": -6.100903511047363, "global_step": 84959, "epoch": 2022} {"train_loss": -6.105169296264648, "global_step": 84960, "epoch": 2022} {"train_loss": -6.163382530212402, "global_step": 84961, "epoch": 2022} {"train_loss": -6.14532470703125, "global_step": 84962, "epoch": 2022} {"train_loss": -6.210900783538818, "global_step": 84963, "epoch": 2022} {"train_loss": -6.223557472229004, "global_step": 84964, "epoch": 2022} {"train_loss": -6.172300316038585, "global_step": 84965, "epoch": 2022, "val_loss": 67795.7265625} {"train_loss": -6.181954383850098, "global_step": 84966, "epoch": 2023} {"train_loss": -6.191061496734619, "global_step": 84967, "epoch": 2023} {"train_loss": -6.250885963439941, "global_step": 84968, "epoch": 2023} {"train_loss": -6.295578956604004, "global_step": 84969, "epoch": 2023} {"train_loss": -6.1877241134643555, "global_step": 84970, "epoch": 2023} {"train_loss": -6.2587785720825195, "global_step": 84971, "epoch": 2023} {"train_loss": -6.322107315063477, "global_step": 84972, "epoch": 2023} {"train_loss": -6.254678726196289, "global_step": 84973, "epoch": 2023} {"train_loss": -6.190499305725098, "global_step": 84974, "epoch": 2023} {"train_loss": -6.290183067321777, "global_step": 84975, "epoch": 2023} {"train_loss": -6.167229175567627, "global_step": 84976, "epoch": 2023} {"train_loss": -6.248945236206055, "global_step": 84977, "epoch": 2023} {"train_loss": -6.178632736206055, "global_step": 84978, "epoch": 2023} {"train_loss": -6.1476030349731445, "global_step": 84979, "epoch": 2023} {"train_loss": -6.155360221862793, "global_step": 84980, "epoch": 2023} {"train_loss": -6.157230377197266, "global_step": 84981, "epoch": 2023} {"train_loss": -6.228177070617676, "global_step": 84982, "epoch": 2023} {"train_loss": -6.125489234924316, "global_step": 84983, "epoch": 2023} {"train_loss": -6.204174995422363, "global_step": 84984, "epoch": 2023} {"train_loss": -6.206048965454102, "global_step": 84985, "epoch": 2023} {"train_loss": -6.300495147705078, "global_step": 84986, "epoch": 2023} {"train_loss": -6.178462028503418, "global_step": 84987, "epoch": 2023} {"train_loss": -6.123468399047852, "global_step": 84988, "epoch": 2023} {"train_loss": -6.137718200683594, "global_step": 84989, "epoch": 2023} {"train_loss": -6.1310882568359375, "global_step": 84990, "epoch": 2023} {"train_loss": -6.18593168258667, "global_step": 84991, "epoch": 2023} {"train_loss": -6.081085205078125, "global_step": 84992, "epoch": 2023} {"train_loss": -6.016938209533691, "global_step": 84993, "epoch": 2023} {"train_loss": -6.129602432250977, "global_step": 84994, "epoch": 2023} {"train_loss": -6.090494632720947, "global_step": 84995, "epoch": 2023} {"train_loss": -6.013603210449219, "global_step": 84996, "epoch": 2023} {"train_loss": -6.140160083770752, "global_step": 84997, "epoch": 2023} {"train_loss": -6.083379745483398, "global_step": 84998, "epoch": 2023} {"train_loss": -6.251780986785889, "global_step": 84999, "epoch": 2023} {"train_loss": -6.155222415924072, "global_step": 85000, "epoch": 2023} {"train_loss": -6.089834690093994, "global_step": 85001, "epoch": 2023} {"train_loss": -6.150177001953125, "global_step": 85002, "epoch": 2023} {"train_loss": -6.137500762939453, "global_step": 85003, "epoch": 2023} {"train_loss": -6.241208076477051, "global_step": 85004, "epoch": 2023} {"train_loss": -6.138477802276611, "global_step": 85005, "epoch": 2023} {"train_loss": -6.107346534729004, "global_step": 85006, "epoch": 2023} {"train_loss": -6.17681013970148, "global_step": 85007, "epoch": 2023, "val_loss": 67810.3125} {"train_loss": -6.125005722045898, "global_step": 85008, "epoch": 2024} {"train_loss": -6.0984368324279785, "global_step": 85009, "epoch": 2024} {"train_loss": -6.107769966125488, "global_step": 85010, "epoch": 2024} {"train_loss": -6.31942081451416, "global_step": 85011, "epoch": 2024} {"train_loss": -6.135176658630371, "global_step": 85012, "epoch": 2024} {"train_loss": -6.205597400665283, "global_step": 85013, "epoch": 2024} {"train_loss": -6.23455810546875, "global_step": 85014, "epoch": 2024} {"train_loss": -6.169234275817871, "global_step": 85015, "epoch": 2024} {"train_loss": -6.191994667053223, "global_step": 85016, "epoch": 2024} {"train_loss": -6.240388870239258, "global_step": 85017, "epoch": 2024} {"train_loss": -6.228016376495361, "global_step": 85018, "epoch": 2024} {"train_loss": -6.225865840911865, "global_step": 85019, "epoch": 2024} {"train_loss": -6.394415855407715, "global_step": 85020, "epoch": 2024} {"train_loss": -6.1784348487854, "global_step": 85021, "epoch": 2024} {"train_loss": -6.152800559997559, "global_step": 85022, "epoch": 2024} {"train_loss": -6.133825778961182, "global_step": 85023, "epoch": 2024} {"train_loss": -6.145276069641113, "global_step": 85024, "epoch": 2024} {"train_loss": -6.111780166625977, "global_step": 85025, "epoch": 2024} {"train_loss": -6.1660566329956055, "global_step": 85026, "epoch": 2024} {"train_loss": -6.167335510253906, "global_step": 85027, "epoch": 2024} {"train_loss": -6.212498664855957, "global_step": 85028, "epoch": 2024} {"train_loss": -6.179682731628418, "global_step": 85029, "epoch": 2024} {"train_loss": -6.175590515136719, "global_step": 85030, "epoch": 2024} {"train_loss": -6.048913955688477, "global_step": 85031, "epoch": 2024} {"train_loss": -6.165135860443115, "global_step": 85032, "epoch": 2024} {"train_loss": -6.280152797698975, "global_step": 85033, "epoch": 2024} {"train_loss": -6.183281898498535, "global_step": 85034, "epoch": 2024} {"train_loss": -6.224863052368164, "global_step": 85035, "epoch": 2024} {"train_loss": -6.113236427307129, "global_step": 85036, "epoch": 2024} {"train_loss": -6.207247734069824, "global_step": 85037, "epoch": 2024} {"train_loss": -6.2478251457214355, "global_step": 85038, "epoch": 2024} {"train_loss": -6.068752765655518, "global_step": 85039, "epoch": 2024} {"train_loss": -6.274345874786377, "global_step": 85040, "epoch": 2024} {"train_loss": -6.186492443084717, "global_step": 85041, "epoch": 2024} {"train_loss": -6.128997802734375, "global_step": 85042, "epoch": 2024} {"train_loss": -6.163827896118164, "global_step": 85043, "epoch": 2024} {"train_loss": -6.091941833496094, "global_step": 85044, "epoch": 2024} {"train_loss": -6.024557113647461, "global_step": 85045, "epoch": 2024} {"train_loss": -6.224490165710449, "global_step": 85046, "epoch": 2024} {"train_loss": -5.987600326538086, "global_step": 85047, "epoch": 2024} {"train_loss": -6.229222297668457, "global_step": 85048, "epoch": 2024} {"train_loss": -6.173760550362723, "global_step": 85049, "epoch": 2024, "val_loss": 68164.296875} {"train_loss": -6.142984390258789, "global_step": 85050, "epoch": 2025} {"train_loss": -6.214617729187012, "global_step": 85051, "epoch": 2025} {"train_loss": -6.171445369720459, "global_step": 85052, "epoch": 2025} {"train_loss": -6.145607948303223, "global_step": 85053, "epoch": 2025} {"train_loss": -6.037528038024902, "global_step": 85054, "epoch": 2025} {"train_loss": -6.168139457702637, "global_step": 85055, "epoch": 2025} {"train_loss": -6.256706237792969, "global_step": 85056, "epoch": 2025} {"train_loss": -6.16392707824707, "global_step": 85057, "epoch": 2025} {"train_loss": -6.142376899719238, "global_step": 85058, "epoch": 2025} {"train_loss": -6.1309003829956055, "global_step": 85059, "epoch": 2025} {"train_loss": -6.211860179901123, "global_step": 85060, "epoch": 2025} {"train_loss": -6.167374610900879, "global_step": 85061, "epoch": 2025} {"train_loss": -6.217765808105469, "global_step": 85062, "epoch": 2025} {"train_loss": -6.189669609069824, "global_step": 85063, "epoch": 2025} {"train_loss": -6.162835121154785, "global_step": 85064, "epoch": 2025} {"train_loss": -6.1715593338012695, "global_step": 85065, "epoch": 2025} {"train_loss": -6.215588569641113, "global_step": 85066, "epoch": 2025} {"train_loss": -6.075686454772949, "global_step": 85067, "epoch": 2025} {"train_loss": -6.230007648468018, "global_step": 85068, "epoch": 2025} {"train_loss": -6.051735877990723, "global_step": 85069, "epoch": 2025} {"train_loss": -6.178187370300293, "global_step": 85070, "epoch": 2025} {"train_loss": -6.1279072761535645, "global_step": 85071, "epoch": 2025} {"train_loss": -6.220951080322266, "global_step": 85072, "epoch": 2025} {"train_loss": -6.139426231384277, "global_step": 85073, "epoch": 2025} {"train_loss": -6.155206680297852, "global_step": 85074, "epoch": 2025} {"train_loss": -6.112233638763428, "global_step": 85075, "epoch": 2025} {"train_loss": -6.175029754638672, "global_step": 85076, "epoch": 2025} {"train_loss": -6.108046531677246, "global_step": 85077, "epoch": 2025} {"train_loss": -6.21808385848999, "global_step": 85078, "epoch": 2025} {"train_loss": -5.962939739227295, "global_step": 85079, "epoch": 2025} {"train_loss": -6.164798736572266, "global_step": 85080, "epoch": 2025} {"train_loss": -6.147978782653809, "global_step": 85081, "epoch": 2025} {"train_loss": -6.115151405334473, "global_step": 85082, "epoch": 2025} {"train_loss": -6.116879463195801, "global_step": 85083, "epoch": 2025} {"train_loss": -6.116695404052734, "global_step": 85084, "epoch": 2025} {"train_loss": -6.22121000289917, "global_step": 85085, "epoch": 2025} {"train_loss": -6.058483123779297, "global_step": 85086, "epoch": 2025} {"train_loss": -6.119747638702393, "global_step": 85087, "epoch": 2025} {"train_loss": -6.228938102722168, "global_step": 85088, "epoch": 2025} {"train_loss": -6.159891128540039, "global_step": 85089, "epoch": 2025} {"train_loss": -6.118210792541504, "global_step": 85090, "epoch": 2025} {"train_loss": -6.151363088971093, "global_step": 85091, "epoch": 2025, "val_loss": 67753.8515625} {"train_loss": -6.066844940185547, "global_step": 85092, "epoch": 2026} {"train_loss": -6.236064434051514, "global_step": 85093, "epoch": 2026} {"train_loss": -6.05531120300293, "global_step": 85094, "epoch": 2026} {"train_loss": -6.246013641357422, "global_step": 85095, "epoch": 2026} {"train_loss": -6.278356552124023, "global_step": 85096, "epoch": 2026} {"train_loss": -6.147881031036377, "global_step": 85097, "epoch": 2026} {"train_loss": -5.982302665710449, "global_step": 85098, "epoch": 2026} {"train_loss": -6.202426910400391, "global_step": 85099, "epoch": 2026} {"train_loss": -6.169546127319336, "global_step": 85100, "epoch": 2026} {"train_loss": -6.195435523986816, "global_step": 85101, "epoch": 2026} {"train_loss": -6.262241840362549, "global_step": 85102, "epoch": 2026} {"train_loss": -6.063046455383301, "global_step": 85103, "epoch": 2026} {"train_loss": -6.230337142944336, "global_step": 85104, "epoch": 2026} {"train_loss": -6.287554740905762, "global_step": 85105, "epoch": 2026} {"train_loss": -6.233072280883789, "global_step": 85106, "epoch": 2026} {"train_loss": -6.196008682250977, "global_step": 85107, "epoch": 2026} {"train_loss": -6.041962623596191, "global_step": 85108, "epoch": 2026} {"train_loss": -6.185551166534424, "global_step": 85109, "epoch": 2026} {"train_loss": -6.060474872589111, "global_step": 85110, "epoch": 2026} {"train_loss": -6.204902648925781, "global_step": 85111, "epoch": 2026} {"train_loss": -6.208367347717285, "global_step": 85112, "epoch": 2026} {"train_loss": -6.213225364685059, "global_step": 85113, "epoch": 2026} {"train_loss": -6.2014312744140625, "global_step": 85114, "epoch": 2026} {"train_loss": -6.091413497924805, "global_step": 85115, "epoch": 2026} {"train_loss": -6.1905622482299805, "global_step": 85116, "epoch": 2026} {"train_loss": -6.080316543579102, "global_step": 85117, "epoch": 2026} {"train_loss": -6.139462471008301, "global_step": 85118, "epoch": 2026} {"train_loss": -6.168418884277344, "global_step": 85119, "epoch": 2026} {"train_loss": -6.279306411743164, "global_step": 85120, "epoch": 2026} {"train_loss": -6.08042049407959, "global_step": 85121, "epoch": 2026} {"train_loss": -6.232387542724609, "global_step": 85122, "epoch": 2026} {"train_loss": -6.18023681640625, "global_step": 85123, "epoch": 2026} {"train_loss": -6.161167144775391, "global_step": 85124, "epoch": 2026} {"train_loss": -6.182674884796143, "global_step": 85125, "epoch": 2026} {"train_loss": -6.133285045623779, "global_step": 85126, "epoch": 2026} {"train_loss": -6.016944885253906, "global_step": 85127, "epoch": 2026} {"train_loss": -6.241140365600586, "global_step": 85128, "epoch": 2026} {"train_loss": -6.269676685333252, "global_step": 85129, "epoch": 2026} {"train_loss": -5.989687442779541, "global_step": 85130, "epoch": 2026} {"train_loss": -6.235507965087891, "global_step": 85131, "epoch": 2026} {"train_loss": -6.237283706665039, "global_step": 85132, "epoch": 2026} {"train_loss": -6.16919732093811, "global_step": 85133, "epoch": 2026, "val_loss": 67721.5} {"train_loss": -6.231595993041992, "global_step": 85134, "epoch": 2027} {"train_loss": -6.200617790222168, "global_step": 85135, "epoch": 2027} {"train_loss": -6.081404685974121, "global_step": 85136, "epoch": 2027} {"train_loss": -6.0606689453125, "global_step": 85137, "epoch": 2027} {"train_loss": -6.159722328186035, "global_step": 85138, "epoch": 2027} {"train_loss": -6.2570481300354, "global_step": 85139, "epoch": 2027} {"train_loss": -6.091863632202148, "global_step": 85140, "epoch": 2027} {"train_loss": -6.145707130432129, "global_step": 85141, "epoch": 2027} {"train_loss": -6.259152889251709, "global_step": 85142, "epoch": 2027} {"train_loss": -6.079843044281006, "global_step": 85143, "epoch": 2027} {"train_loss": -6.061009883880615, "global_step": 85144, "epoch": 2027} {"train_loss": -6.259785175323486, "global_step": 85145, "epoch": 2027} {"train_loss": -6.258617401123047, "global_step": 85146, "epoch": 2027} {"train_loss": -6.112626075744629, "global_step": 85147, "epoch": 2027} {"train_loss": -6.078334808349609, "global_step": 85148, "epoch": 2027} {"train_loss": -6.156787395477295, "global_step": 85149, "epoch": 2027} {"train_loss": -6.224001407623291, "global_step": 85150, "epoch": 2027} {"train_loss": -6.243062973022461, "global_step": 85151, "epoch": 2027} {"train_loss": -6.197153091430664, "global_step": 85152, "epoch": 2027} {"train_loss": -6.183560371398926, "global_step": 85153, "epoch": 2027} {"train_loss": -6.269603729248047, "global_step": 85154, "epoch": 2027} {"train_loss": -6.24553108215332, "global_step": 85155, "epoch": 2027} {"train_loss": -6.266639709472656, "global_step": 85156, "epoch": 2027} {"train_loss": -6.237666130065918, "global_step": 85157, "epoch": 2027} {"train_loss": -6.113216400146484, "global_step": 85158, "epoch": 2027} {"train_loss": -6.150849342346191, "global_step": 85159, "epoch": 2027} {"train_loss": -6.259162902832031, "global_step": 85160, "epoch": 2027} {"train_loss": -6.246647357940674, "global_step": 85161, "epoch": 2027} {"train_loss": -6.183200836181641, "global_step": 85162, "epoch": 2027} {"train_loss": -6.266100883483887, "global_step": 85163, "epoch": 2027} {"train_loss": -6.058394432067871, "global_step": 85164, "epoch": 2027} {"train_loss": -6.24415397644043, "global_step": 85165, "epoch": 2027} {"train_loss": -6.214944839477539, "global_step": 85166, "epoch": 2027} {"train_loss": -6.343764305114746, "global_step": 85167, "epoch": 2027} {"train_loss": -6.25417423248291, "global_step": 85168, "epoch": 2027} {"train_loss": -6.2476959228515625, "global_step": 85169, "epoch": 2027} {"train_loss": -6.150772571563721, "global_step": 85170, "epoch": 2027} {"train_loss": -6.253378868103027, "global_step": 85171, "epoch": 2027} {"train_loss": -6.100456237792969, "global_step": 85172, "epoch": 2027} {"train_loss": -6.288952827453613, "global_step": 85173, "epoch": 2027} {"train_loss": -6.133549690246582, "global_step": 85174, "epoch": 2027} {"train_loss": -6.1943106310708185, "global_step": 85175, "epoch": 2027, "val_loss": 67749.84375} {"train_loss": -6.309523582458496, "global_step": 85176, "epoch": 2028} {"train_loss": -6.148900985717773, "global_step": 85177, "epoch": 2028} {"train_loss": -6.317075729370117, "global_step": 85178, "epoch": 2028} {"train_loss": -6.145786285400391, "global_step": 85179, "epoch": 2028} {"train_loss": -6.215691566467285, "global_step": 85180, "epoch": 2028} {"train_loss": -6.326789379119873, "global_step": 85181, "epoch": 2028} {"train_loss": -6.0597944259643555, "global_step": 85182, "epoch": 2028} {"train_loss": -6.220493316650391, "global_step": 85183, "epoch": 2028} {"train_loss": -6.296499729156494, "global_step": 85184, "epoch": 2028} {"train_loss": -6.114902496337891, "global_step": 85185, "epoch": 2028} {"train_loss": -6.146003723144531, "global_step": 85186, "epoch": 2028} {"train_loss": -6.184850215911865, "global_step": 85187, "epoch": 2028} {"train_loss": -6.24821662902832, "global_step": 85188, "epoch": 2028} {"train_loss": -6.171526908874512, "global_step": 85189, "epoch": 2028} {"train_loss": -6.13504695892334, "global_step": 85190, "epoch": 2028} {"train_loss": -6.085878372192383, "global_step": 85191, "epoch": 2028} {"train_loss": -6.1467108726501465, "global_step": 85192, "epoch": 2028} {"train_loss": -6.201868057250977, "global_step": 85193, "epoch": 2028} {"train_loss": -6.014159202575684, "global_step": 85194, "epoch": 2028} {"train_loss": -6.103919982910156, "global_step": 85195, "epoch": 2028} {"train_loss": -6.144189357757568, "global_step": 85196, "epoch": 2028} {"train_loss": -6.0614519119262695, "global_step": 85197, "epoch": 2028} {"train_loss": -6.192227363586426, "global_step": 85198, "epoch": 2028} {"train_loss": -6.189607620239258, "global_step": 85199, "epoch": 2028} {"train_loss": -6.142921447753906, "global_step": 85200, "epoch": 2028} {"train_loss": -6.167906284332275, "global_step": 85201, "epoch": 2028} {"train_loss": -6.082374572753906, "global_step": 85202, "epoch": 2028} {"train_loss": -6.139418601989746, "global_step": 85203, "epoch": 2028} {"train_loss": -6.177146911621094, "global_step": 85204, "epoch": 2028} {"train_loss": -6.0731892585754395, "global_step": 85205, "epoch": 2028} {"train_loss": -6.093088150024414, "global_step": 85206, "epoch": 2028} {"train_loss": -6.279467582702637, "global_step": 85207, "epoch": 2028} {"train_loss": -6.153176307678223, "global_step": 85208, "epoch": 2028} {"train_loss": -6.106576442718506, "global_step": 85209, "epoch": 2028} {"train_loss": -6.231595516204834, "global_step": 85210, "epoch": 2028} {"train_loss": -6.194974422454834, "global_step": 85211, "epoch": 2028} {"train_loss": -6.105401039123535, "global_step": 85212, "epoch": 2028} {"train_loss": -6.094578742980957, "global_step": 85213, "epoch": 2028} {"train_loss": -6.124871253967285, "global_step": 85214, "epoch": 2028} {"train_loss": -6.100811004638672, "global_step": 85215, "epoch": 2028} {"train_loss": -6.146970272064209, "global_step": 85216, "epoch": 2028} {"train_loss": -6.160230012167068, "global_step": 85217, "epoch": 2028, "val_loss": 67749.1875} {"train_loss": -6.1362762451171875, "global_step": 85218, "epoch": 2029} {"train_loss": -6.183183193206787, "global_step": 85219, "epoch": 2029} {"train_loss": -6.183465957641602, "global_step": 85220, "epoch": 2029} {"train_loss": -5.951443195343018, "global_step": 85221, "epoch": 2029} {"train_loss": -6.2148284912109375, "global_step": 85222, "epoch": 2029} {"train_loss": -6.10087251663208, "global_step": 85223, "epoch": 2029} {"train_loss": -6.09650993347168, "global_step": 85224, "epoch": 2029} {"train_loss": -6.096063613891602, "global_step": 85225, "epoch": 2029} {"train_loss": -6.207095623016357, "global_step": 85226, "epoch": 2029} {"train_loss": -6.218794822692871, "global_step": 85227, "epoch": 2029} {"train_loss": -6.141436576843262, "global_step": 85228, "epoch": 2029} {"train_loss": -6.120708465576172, "global_step": 85229, "epoch": 2029} {"train_loss": -6.093268394470215, "global_step": 85230, "epoch": 2029} {"train_loss": -6.246519088745117, "global_step": 85231, "epoch": 2029} {"train_loss": -6.194211006164551, "global_step": 85232, "epoch": 2029} {"train_loss": -6.1798834800720215, "global_step": 85233, "epoch": 2029} {"train_loss": -6.408784866333008, "global_step": 85234, "epoch": 2029} {"train_loss": -6.176790714263916, "global_step": 85235, "epoch": 2029} {"train_loss": -6.1339030265808105, "global_step": 85236, "epoch": 2029} {"train_loss": -6.135931015014648, "global_step": 85237, "epoch": 2029} {"train_loss": -6.164272785186768, "global_step": 85238, "epoch": 2029} {"train_loss": -6.209794998168945, "global_step": 85239, "epoch": 2029} {"train_loss": -6.185766220092773, "global_step": 85240, "epoch": 2029} {"train_loss": -6.220677375793457, "global_step": 85241, "epoch": 2029} {"train_loss": -6.179253578186035, "global_step": 85242, "epoch": 2029} {"train_loss": -6.040142059326172, "global_step": 85243, "epoch": 2029} {"train_loss": -6.068077087402344, "global_step": 85244, "epoch": 2029} {"train_loss": -6.144870281219482, "global_step": 85245, "epoch": 2029} {"train_loss": -6.227353096008301, "global_step": 85246, "epoch": 2029} {"train_loss": -6.044689178466797, "global_step": 85247, "epoch": 2029} {"train_loss": -6.1731367111206055, "global_step": 85248, "epoch": 2029} {"train_loss": -6.182706356048584, "global_step": 85249, "epoch": 2029} {"train_loss": -6.044620037078857, "global_step": 85250, "epoch": 2029} {"train_loss": -6.191431045532227, "global_step": 85251, "epoch": 2029} {"train_loss": -6.089657306671143, "global_step": 85252, "epoch": 2029} {"train_loss": -6.033833026885986, "global_step": 85253, "epoch": 2029} {"train_loss": -6.279621601104736, "global_step": 85254, "epoch": 2029} {"train_loss": -6.214261054992676, "global_step": 85255, "epoch": 2029} {"train_loss": -6.15641450881958, "global_step": 85256, "epoch": 2029} {"train_loss": -6.236438274383545, "global_step": 85257, "epoch": 2029} {"train_loss": -6.175209045410156, "global_step": 85258, "epoch": 2029} {"train_loss": -6.155795585541498, "global_step": 85259, "epoch": 2029, "val_loss": 67601.171875} {"train_loss": -6.181858062744141, "global_step": 85260, "epoch": 2030} {"train_loss": -6.074639320373535, "global_step": 85261, "epoch": 2030} {"train_loss": -6.19425106048584, "global_step": 85262, "epoch": 2030} {"train_loss": -6.019891262054443, "global_step": 85263, "epoch": 2030} {"train_loss": -6.169929504394531, "global_step": 85264, "epoch": 2030} {"train_loss": -6.092376708984375, "global_step": 85265, "epoch": 2030} {"train_loss": -6.233578681945801, "global_step": 85266, "epoch": 2030} {"train_loss": -6.158945083618164, "global_step": 85267, "epoch": 2030} {"train_loss": -5.9708075523376465, "global_step": 85268, "epoch": 2030} {"train_loss": -6.115306854248047, "global_step": 85269, "epoch": 2030} {"train_loss": -5.970139503479004, "global_step": 85270, "epoch": 2030} {"train_loss": -6.139359474182129, "global_step": 85271, "epoch": 2030} {"train_loss": -6.282810688018799, "global_step": 85272, "epoch": 2030} {"train_loss": -6.201869964599609, "global_step": 85273, "epoch": 2030} {"train_loss": -6.111239910125732, "global_step": 85274, "epoch": 2030} {"train_loss": -6.114121913909912, "global_step": 85275, "epoch": 2030} {"train_loss": -6.18646240234375, "global_step": 85276, "epoch": 2030} {"train_loss": -6.267303466796875, "global_step": 85277, "epoch": 2030} {"train_loss": -6.191188812255859, "global_step": 85278, "epoch": 2030} {"train_loss": -6.263465881347656, "global_step": 85279, "epoch": 2030} {"train_loss": -6.009435653686523, "global_step": 85280, "epoch": 2030} {"train_loss": -6.222806930541992, "global_step": 85281, "epoch": 2030} {"train_loss": -6.1483635902404785, "global_step": 85282, "epoch": 2030} {"train_loss": -6.206463813781738, "global_step": 85283, "epoch": 2030} {"train_loss": -6.1581926345825195, "global_step": 85284, "epoch": 2030} {"train_loss": -6.074333190917969, "global_step": 85285, "epoch": 2030} {"train_loss": -6.147199630737305, "global_step": 85286, "epoch": 2030} {"train_loss": -6.255887031555176, "global_step": 85287, "epoch": 2030} {"train_loss": -6.178466796875, "global_step": 85288, "epoch": 2030} {"train_loss": -6.249406814575195, "global_step": 85289, "epoch": 2030} {"train_loss": -6.0886735916137695, "global_step": 85290, "epoch": 2030} {"train_loss": -6.0797224044799805, "global_step": 85291, "epoch": 2030} {"train_loss": -6.223276138305664, "global_step": 85292, "epoch": 2030} {"train_loss": -6.2088470458984375, "global_step": 85293, "epoch": 2030} {"train_loss": -5.995089530944824, "global_step": 85294, "epoch": 2030} {"train_loss": -6.216746807098389, "global_step": 85295, "epoch": 2030} {"train_loss": -6.0229926109313965, "global_step": 85296, "epoch": 2030} {"train_loss": -6.0836591720581055, "global_step": 85297, "epoch": 2030} {"train_loss": -6.1590423583984375, "global_step": 85298, "epoch": 2030} {"train_loss": -6.1833295822143555, "global_step": 85299, "epoch": 2030} {"train_loss": -6.211536407470703, "global_step": 85300, "epoch": 2030} {"train_loss": -6.147845188776652, "global_step": 85301, "epoch": 2030, "val_loss": 67772.6640625} {"train_loss": -6.046716690063477, "global_step": 85302, "epoch": 2031} {"train_loss": -6.0479536056518555, "global_step": 85303, "epoch": 2031} {"train_loss": -6.265995979309082, "global_step": 85304, "epoch": 2031} {"train_loss": -6.125200271606445, "global_step": 85305, "epoch": 2031} {"train_loss": -6.165317535400391, "global_step": 85306, "epoch": 2031} {"train_loss": -6.148988723754883, "global_step": 85307, "epoch": 2031} {"train_loss": -6.255675315856934, "global_step": 85308, "epoch": 2031} {"train_loss": -6.099167823791504, "global_step": 85309, "epoch": 2031} {"train_loss": -6.247852325439453, "global_step": 85310, "epoch": 2031} {"train_loss": -6.249980926513672, "global_step": 85311, "epoch": 2031} {"train_loss": -6.138846397399902, "global_step": 85312, "epoch": 2031} {"train_loss": -6.116427421569824, "global_step": 85313, "epoch": 2031} {"train_loss": -5.987706184387207, "global_step": 85314, "epoch": 2031} {"train_loss": -6.123999118804932, "global_step": 85315, "epoch": 2031} {"train_loss": -6.154716491699219, "global_step": 85316, "epoch": 2031} {"train_loss": -6.14433479309082, "global_step": 85317, "epoch": 2031} {"train_loss": -6.108839988708496, "global_step": 85318, "epoch": 2031} {"train_loss": -6.1200480461120605, "global_step": 85319, "epoch": 2031} {"train_loss": -6.122933864593506, "global_step": 85320, "epoch": 2031} {"train_loss": -6.1599321365356445, "global_step": 85321, "epoch": 2031} {"train_loss": -6.135494232177734, "global_step": 85322, "epoch": 2031} {"train_loss": -6.058335304260254, "global_step": 85323, "epoch": 2031} {"train_loss": -6.151198387145996, "global_step": 85324, "epoch": 2031} {"train_loss": -6.100679874420166, "global_step": 85325, "epoch": 2031} {"train_loss": -6.110459327697754, "global_step": 85326, "epoch": 2031} {"train_loss": -6.231539726257324, "global_step": 85327, "epoch": 2031} {"train_loss": -6.14354133605957, "global_step": 85328, "epoch": 2031} {"train_loss": -6.044766426086426, "global_step": 85329, "epoch": 2031} {"train_loss": -6.223559856414795, "global_step": 85330, "epoch": 2031} {"train_loss": -6.167236328125, "global_step": 85331, "epoch": 2031} {"train_loss": -6.253584384918213, "global_step": 85332, "epoch": 2031} {"train_loss": -6.224849700927734, "global_step": 85333, "epoch": 2031} {"train_loss": -6.134445667266846, "global_step": 85334, "epoch": 2031} {"train_loss": -6.20101261138916, "global_step": 85335, "epoch": 2031} {"train_loss": -6.161651611328125, "global_step": 85336, "epoch": 2031} {"train_loss": -5.996356010437012, "global_step": 85337, "epoch": 2031} {"train_loss": -6.313436508178711, "global_step": 85338, "epoch": 2031} {"train_loss": -6.17357873916626, "global_step": 85339, "epoch": 2031} {"train_loss": -6.200851917266846, "global_step": 85340, "epoch": 2031} {"train_loss": -6.109260559082031, "global_step": 85341, "epoch": 2031} {"train_loss": -6.175347805023193, "global_step": 85342, "epoch": 2031} {"train_loss": -6.150128932226272, "global_step": 85343, "epoch": 2031, "val_loss": 67962.734375} {"train_loss": -6.197904109954834, "global_step": 85344, "epoch": 2032} {"train_loss": -6.107472896575928, "global_step": 85345, "epoch": 2032} {"train_loss": -6.082635402679443, "global_step": 85346, "epoch": 2032} {"train_loss": -6.135217666625977, "global_step": 85347, "epoch": 2032} {"train_loss": -6.3124189376831055, "global_step": 85348, "epoch": 2032} {"train_loss": -6.247551918029785, "global_step": 85349, "epoch": 2032} {"train_loss": -6.209640979766846, "global_step": 85350, "epoch": 2032} {"train_loss": -6.132923603057861, "global_step": 85351, "epoch": 2032} {"train_loss": -6.244138240814209, "global_step": 85352, "epoch": 2032} {"train_loss": -6.186402797698975, "global_step": 85353, "epoch": 2032} {"train_loss": -6.216033935546875, "global_step": 85354, "epoch": 2032} {"train_loss": -6.066495895385742, "global_step": 85355, "epoch": 2032} {"train_loss": -6.183832168579102, "global_step": 85356, "epoch": 2032} {"train_loss": -6.128342628479004, "global_step": 85357, "epoch": 2032} {"train_loss": -6.162633895874023, "global_step": 85358, "epoch": 2032} {"train_loss": -6.1267290115356445, "global_step": 85359, "epoch": 2032} {"train_loss": -6.155584335327148, "global_step": 85360, "epoch": 2032} {"train_loss": -6.026446342468262, "global_step": 85361, "epoch": 2032} {"train_loss": -6.15324592590332, "global_step": 85362, "epoch": 2032} {"train_loss": -5.996133804321289, "global_step": 85363, "epoch": 2032} {"train_loss": -6.238626003265381, "global_step": 85364, "epoch": 2032} {"train_loss": -6.197298049926758, "global_step": 85365, "epoch": 2032} {"train_loss": -6.169721603393555, "global_step": 85366, "epoch": 2032} {"train_loss": -6.136773109436035, "global_step": 85367, "epoch": 2032} {"train_loss": -6.175914764404297, "global_step": 85368, "epoch": 2032} {"train_loss": -5.996273040771484, "global_step": 85369, "epoch": 2032} {"train_loss": -6.133401870727539, "global_step": 85370, "epoch": 2032} {"train_loss": -6.159818172454834, "global_step": 85371, "epoch": 2032} {"train_loss": -6.084585666656494, "global_step": 85372, "epoch": 2032} {"train_loss": -6.131757736206055, "global_step": 85373, "epoch": 2032} {"train_loss": -6.238021373748779, "global_step": 85374, "epoch": 2032} {"train_loss": -6.12122106552124, "global_step": 85375, "epoch": 2032} {"train_loss": -6.138562202453613, "global_step": 85376, "epoch": 2032} {"train_loss": -6.154090881347656, "global_step": 85377, "epoch": 2032} {"train_loss": -6.3847856521606445, "global_step": 85378, "epoch": 2032} {"train_loss": -6.238933563232422, "global_step": 85379, "epoch": 2032} {"train_loss": -6.170649528503418, "global_step": 85380, "epoch": 2032} {"train_loss": -6.191672325134277, "global_step": 85381, "epoch": 2032} {"train_loss": -6.110813617706299, "global_step": 85382, "epoch": 2032} {"train_loss": -6.07536506652832, "global_step": 85383, "epoch": 2032} {"train_loss": -6.160677909851074, "global_step": 85384, "epoch": 2032} {"train_loss": -6.158850227083478, "global_step": 85385, "epoch": 2032, "val_loss": 67785.96875} {"train_loss": -6.1331634521484375, "global_step": 85386, "epoch": 2033} {"train_loss": -6.193243980407715, "global_step": 85387, "epoch": 2033} {"train_loss": -6.224782943725586, "global_step": 85388, "epoch": 2033} {"train_loss": -6.222292423248291, "global_step": 85389, "epoch": 2033} {"train_loss": -6.244637966156006, "global_step": 85390, "epoch": 2033} {"train_loss": -6.274382591247559, "global_step": 85391, "epoch": 2033} {"train_loss": -6.187378883361816, "global_step": 85392, "epoch": 2033} {"train_loss": -6.104135036468506, "global_step": 85393, "epoch": 2033} {"train_loss": -6.277736186981201, "global_step": 85394, "epoch": 2033} {"train_loss": -6.1175127029418945, "global_step": 85395, "epoch": 2033} {"train_loss": -6.093710899353027, "global_step": 85396, "epoch": 2033} {"train_loss": -6.165271759033203, "global_step": 85397, "epoch": 2033} {"train_loss": -6.092975616455078, "global_step": 85398, "epoch": 2033} {"train_loss": -6.154719352722168, "global_step": 85399, "epoch": 2033} {"train_loss": -6.142064094543457, "global_step": 85400, "epoch": 2033} {"train_loss": -6.188213348388672, "global_step": 85401, "epoch": 2033} {"train_loss": -6.0522050857543945, "global_step": 85402, "epoch": 2033} {"train_loss": -6.205321311950684, "global_step": 85403, "epoch": 2033} {"train_loss": -6.239690780639648, "global_step": 85404, "epoch": 2033} {"train_loss": -6.077230453491211, "global_step": 85405, "epoch": 2033} {"train_loss": -6.1805830001831055, "global_step": 85406, "epoch": 2033} {"train_loss": -6.165413856506348, "global_step": 85407, "epoch": 2033} {"train_loss": -6.172144889831543, "global_step": 85408, "epoch": 2033} {"train_loss": -6.043938159942627, "global_step": 85409, "epoch": 2033} {"train_loss": -6.18907356262207, "global_step": 85410, "epoch": 2033} {"train_loss": -6.181679725646973, "global_step": 85411, "epoch": 2033} {"train_loss": -6.123340606689453, "global_step": 85412, "epoch": 2033} {"train_loss": -6.167428016662598, "global_step": 85413, "epoch": 2033} {"train_loss": -6.201948165893555, "global_step": 85414, "epoch": 2033} {"train_loss": -6.090290069580078, "global_step": 85415, "epoch": 2033} {"train_loss": -6.295168876647949, "global_step": 85416, "epoch": 2033} {"train_loss": -6.071659088134766, "global_step": 85417, "epoch": 2033} {"train_loss": -6.25726842880249, "global_step": 85418, "epoch": 2033} {"train_loss": -6.246628761291504, "global_step": 85419, "epoch": 2033} {"train_loss": -6.148468971252441, "global_step": 85420, "epoch": 2033} {"train_loss": -6.229089736938477, "global_step": 85421, "epoch": 2033} {"train_loss": -6.226838111877441, "global_step": 85422, "epoch": 2033} {"train_loss": -6.182244300842285, "global_step": 85423, "epoch": 2033} {"train_loss": -6.178810119628906, "global_step": 85424, "epoch": 2033} {"train_loss": -6.134060859680176, "global_step": 85425, "epoch": 2033} {"train_loss": -6.133907794952393, "global_step": 85426, "epoch": 2033} {"train_loss": -6.168111891973586, "global_step": 85427, "epoch": 2033, "val_loss": 67976.1640625} {"train_loss": -6.206490993499756, "global_step": 85428, "epoch": 2034} {"train_loss": -6.155312538146973, "global_step": 85429, "epoch": 2034} {"train_loss": -6.295772552490234, "global_step": 85430, "epoch": 2034} {"train_loss": -6.121912956237793, "global_step": 85431, "epoch": 2034} {"train_loss": -6.176300048828125, "global_step": 85432, "epoch": 2034} {"train_loss": -6.209733486175537, "global_step": 85433, "epoch": 2034} {"train_loss": -6.276784420013428, "global_step": 85434, "epoch": 2034} {"train_loss": -6.085305213928223, "global_step": 85435, "epoch": 2034} {"train_loss": -6.197055339813232, "global_step": 85436, "epoch": 2034} {"train_loss": -6.188876152038574, "global_step": 85437, "epoch": 2034} {"train_loss": -6.293305397033691, "global_step": 85438, "epoch": 2034} {"train_loss": -6.283379554748535, "global_step": 85439, "epoch": 2034} {"train_loss": -6.115401744842529, "global_step": 85440, "epoch": 2034} {"train_loss": -6.1922149658203125, "global_step": 85441, "epoch": 2034} {"train_loss": -6.02471923828125, "global_step": 85442, "epoch": 2034} {"train_loss": -6.168824672698975, "global_step": 85443, "epoch": 2034} {"train_loss": -6.244730472564697, "global_step": 85444, "epoch": 2034} {"train_loss": -6.227066993713379, "global_step": 85445, "epoch": 2034} {"train_loss": -6.154537200927734, "global_step": 85446, "epoch": 2034} {"train_loss": -6.15631103515625, "global_step": 85447, "epoch": 2034} {"train_loss": -6.150381088256836, "global_step": 85448, "epoch": 2034} {"train_loss": -6.110532760620117, "global_step": 85449, "epoch": 2034} {"train_loss": -6.1988983154296875, "global_step": 85450, "epoch": 2034} {"train_loss": -6.309947967529297, "global_step": 85451, "epoch": 2034} {"train_loss": -6.24885368347168, "global_step": 85452, "epoch": 2034} {"train_loss": -6.245967388153076, "global_step": 85453, "epoch": 2034} {"train_loss": -6.163464546203613, "global_step": 85454, "epoch": 2034} {"train_loss": -6.210893630981445, "global_step": 85455, "epoch": 2034} {"train_loss": -6.168834686279297, "global_step": 85456, "epoch": 2034} {"train_loss": -6.2201642990112305, "global_step": 85457, "epoch": 2034} {"train_loss": -6.164412498474121, "global_step": 85458, "epoch": 2034} {"train_loss": -6.266783714294434, "global_step": 85459, "epoch": 2034} {"train_loss": -6.312199115753174, "global_step": 85460, "epoch": 2034} {"train_loss": -6.1654839515686035, "global_step": 85461, "epoch": 2034} {"train_loss": -6.256721496582031, "global_step": 85462, "epoch": 2034} {"train_loss": -6.1561174392700195, "global_step": 85463, "epoch": 2034} {"train_loss": -6.161114692687988, "global_step": 85464, "epoch": 2034} {"train_loss": -6.159892559051514, "global_step": 85465, "epoch": 2034} {"train_loss": -6.215368747711182, "global_step": 85466, "epoch": 2034} {"train_loss": -6.110146999359131, "global_step": 85467, "epoch": 2034} {"train_loss": -6.097031116485596, "global_step": 85468, "epoch": 2034} {"train_loss": -6.190717163540068, "global_step": 85469, "epoch": 2034, "val_loss": 67805.0078125} {"train_loss": -6.002784729003906, "global_step": 85470, "epoch": 2035} {"train_loss": -6.181238651275635, "global_step": 85471, "epoch": 2035} {"train_loss": -6.254349708557129, "global_step": 85472, "epoch": 2035} {"train_loss": -6.212734222412109, "global_step": 85473, "epoch": 2035} {"train_loss": -6.215353488922119, "global_step": 85474, "epoch": 2035} {"train_loss": -6.385593891143799, "global_step": 85475, "epoch": 2035} {"train_loss": -6.230648994445801, "global_step": 85476, "epoch": 2035} {"train_loss": -6.193033695220947, "global_step": 85477, "epoch": 2035} {"train_loss": -6.141740322113037, "global_step": 85478, "epoch": 2035} {"train_loss": -6.215176582336426, "global_step": 85479, "epoch": 2035} {"train_loss": -6.139191627502441, "global_step": 85480, "epoch": 2035} {"train_loss": -6.35872220993042, "global_step": 85481, "epoch": 2035} {"train_loss": -6.185049533843994, "global_step": 85482, "epoch": 2035} {"train_loss": -6.229045867919922, "global_step": 85483, "epoch": 2035} {"train_loss": -6.298859596252441, "global_step": 85484, "epoch": 2035} {"train_loss": -6.169952392578125, "global_step": 85485, "epoch": 2035} {"train_loss": -6.292140960693359, "global_step": 85486, "epoch": 2035} {"train_loss": -6.277464389801025, "global_step": 85487, "epoch": 2035} {"train_loss": -6.135608673095703, "global_step": 85488, "epoch": 2035} {"train_loss": -6.134254455566406, "global_step": 85489, "epoch": 2035} {"train_loss": -6.168975353240967, "global_step": 85490, "epoch": 2035} {"train_loss": -6.283902168273926, "global_step": 85491, "epoch": 2035} {"train_loss": -6.116327285766602, "global_step": 85492, "epoch": 2035} {"train_loss": -6.176351070404053, "global_step": 85493, "epoch": 2035} {"train_loss": -6.29430627822876, "global_step": 85494, "epoch": 2035} {"train_loss": -6.209179878234863, "global_step": 85495, "epoch": 2035} {"train_loss": -6.2674560546875, "global_step": 85496, "epoch": 2035} {"train_loss": -6.2623610496521, "global_step": 85497, "epoch": 2035} {"train_loss": -6.25749397277832, "global_step": 85498, "epoch": 2035} {"train_loss": -6.267375469207764, "global_step": 85499, "epoch": 2035} {"train_loss": -6.330461025238037, "global_step": 85500, "epoch": 2035} {"train_loss": -6.215907096862793, "global_step": 85501, "epoch": 2035} {"train_loss": -6.147197723388672, "global_step": 85502, "epoch": 2035} {"train_loss": -6.240155220031738, "global_step": 85503, "epoch": 2035} {"train_loss": -6.2288055419921875, "global_step": 85504, "epoch": 2035} {"train_loss": -6.220746994018555, "global_step": 85505, "epoch": 2035} {"train_loss": -6.255720138549805, "global_step": 85506, "epoch": 2035} {"train_loss": -6.224822998046875, "global_step": 85507, "epoch": 2035} {"train_loss": -6.12445592880249, "global_step": 85508, "epoch": 2035} {"train_loss": -6.129697799682617, "global_step": 85509, "epoch": 2035} {"train_loss": -6.247235298156738, "global_step": 85510, "epoch": 2035} {"train_loss": -6.217186189833141, "global_step": 85511, "epoch": 2035, "val_loss": 67727.9140625} {"train_loss": -6.235226631164551, "global_step": 85512, "epoch": 2036} {"train_loss": -6.052210807800293, "global_step": 85513, "epoch": 2036} {"train_loss": -6.179821014404297, "global_step": 85514, "epoch": 2036} {"train_loss": -6.144119739532471, "global_step": 85515, "epoch": 2036} {"train_loss": -6.160022258758545, "global_step": 85516, "epoch": 2036} {"train_loss": -6.093255043029785, "global_step": 85517, "epoch": 2036} {"train_loss": -6.066400527954102, "global_step": 85518, "epoch": 2036} {"train_loss": -6.167976379394531, "global_step": 85519, "epoch": 2036} {"train_loss": -6.142961025238037, "global_step": 85520, "epoch": 2036} {"train_loss": -6.117870330810547, "global_step": 85521, "epoch": 2036} {"train_loss": -6.251164436340332, "global_step": 85522, "epoch": 2036} {"train_loss": -6.132019519805908, "global_step": 85523, "epoch": 2036} {"train_loss": -6.187613487243652, "global_step": 85524, "epoch": 2036} {"train_loss": -6.20566463470459, "global_step": 85525, "epoch": 2036} {"train_loss": -6.22207498550415, "global_step": 85526, "epoch": 2036} {"train_loss": -6.192445278167725, "global_step": 85527, "epoch": 2036} {"train_loss": -6.225140571594238, "global_step": 85528, "epoch": 2036} {"train_loss": -6.299295902252197, "global_step": 85529, "epoch": 2036} {"train_loss": -6.274475574493408, "global_step": 85530, "epoch": 2036} {"train_loss": -6.1520676612854, "global_step": 85531, "epoch": 2036} {"train_loss": -6.21076774597168, "global_step": 85532, "epoch": 2036} {"train_loss": -6.153354167938232, "global_step": 85533, "epoch": 2036} {"train_loss": -6.184288024902344, "global_step": 85534, "epoch": 2036} {"train_loss": -6.2479753494262695, "global_step": 85535, "epoch": 2036} {"train_loss": -6.249485015869141, "global_step": 85536, "epoch": 2036} {"train_loss": -6.196408748626709, "global_step": 85537, "epoch": 2036} {"train_loss": -6.235398769378662, "global_step": 85538, "epoch": 2036} {"train_loss": -6.103018760681152, "global_step": 85539, "epoch": 2036} {"train_loss": -6.256809234619141, "global_step": 85540, "epoch": 2036} {"train_loss": -6.156481742858887, "global_step": 85541, "epoch": 2036} {"train_loss": -6.162212371826172, "global_step": 85542, "epoch": 2036} {"train_loss": -6.194513320922852, "global_step": 85543, "epoch": 2036} {"train_loss": -6.112305641174316, "global_step": 85544, "epoch": 2036} {"train_loss": -6.082401752471924, "global_step": 85545, "epoch": 2036} {"train_loss": -6.23298978805542, "global_step": 85546, "epoch": 2036} {"train_loss": -6.056680202484131, "global_step": 85547, "epoch": 2036} {"train_loss": -6.069553852081299, "global_step": 85548, "epoch": 2036} {"train_loss": -5.938588619232178, "global_step": 85549, "epoch": 2036} {"train_loss": -6.102712631225586, "global_step": 85550, "epoch": 2036} {"train_loss": -6.046358108520508, "global_step": 85551, "epoch": 2036} {"train_loss": -5.989190101623535, "global_step": 85552, "epoch": 2036} {"train_loss": -6.157738696961176, "global_step": 85553, "epoch": 2036, "val_loss": 68046.2421875} {"train_loss": -6.04709005355835, "global_step": 85554, "epoch": 2037} {"train_loss": -5.9922356605529785, "global_step": 85555, "epoch": 2037} {"train_loss": -6.16306734085083, "global_step": 85556, "epoch": 2037} {"train_loss": -6.016044616699219, "global_step": 85557, "epoch": 2037} {"train_loss": -6.12091064453125, "global_step": 85558, "epoch": 2037} {"train_loss": -6.13035249710083, "global_step": 85559, "epoch": 2037} {"train_loss": -6.075371265411377, "global_step": 85560, "epoch": 2037} {"train_loss": -6.0465521812438965, "global_step": 85561, "epoch": 2037} {"train_loss": -6.281099319458008, "global_step": 85562, "epoch": 2037} {"train_loss": -6.022577285766602, "global_step": 85563, "epoch": 2037} {"train_loss": -6.1013054847717285, "global_step": 85564, "epoch": 2037} {"train_loss": -6.0498247146606445, "global_step": 85565, "epoch": 2037} {"train_loss": -6.177114486694336, "global_step": 85566, "epoch": 2037} {"train_loss": -6.121086120605469, "global_step": 85567, "epoch": 2037} {"train_loss": -6.001463890075684, "global_step": 85568, "epoch": 2037} {"train_loss": -6.140878677368164, "global_step": 85569, "epoch": 2037} {"train_loss": -6.183626174926758, "global_step": 85570, "epoch": 2037} {"train_loss": -6.166265964508057, "global_step": 85571, "epoch": 2037} {"train_loss": -6.1439595222473145, "global_step": 85572, "epoch": 2037} {"train_loss": -6.198154926300049, "global_step": 85573, "epoch": 2037} {"train_loss": -6.252974033355713, "global_step": 85574, "epoch": 2037} {"train_loss": -6.107672691345215, "global_step": 85575, "epoch": 2037} {"train_loss": -5.936976432800293, "global_step": 85576, "epoch": 2037} {"train_loss": -6.1759257316589355, "global_step": 85577, "epoch": 2037} {"train_loss": -6.028371810913086, "global_step": 85578, "epoch": 2037} {"train_loss": -6.196566104888916, "global_step": 85579, "epoch": 2037} {"train_loss": -6.100472450256348, "global_step": 85580, "epoch": 2037} {"train_loss": -6.208409309387207, "global_step": 85581, "epoch": 2037} {"train_loss": -6.239239692687988, "global_step": 85582, "epoch": 2037} {"train_loss": -6.186379432678223, "global_step": 85583, "epoch": 2037} {"train_loss": -6.221681594848633, "global_step": 85584, "epoch": 2037} {"train_loss": -6.077436447143555, "global_step": 85585, "epoch": 2037} {"train_loss": -6.16349458694458, "global_step": 85586, "epoch": 2037} {"train_loss": -6.165134906768799, "global_step": 85587, "epoch": 2037} {"train_loss": -6.135477066040039, "global_step": 85588, "epoch": 2037} {"train_loss": -6.055988311767578, "global_step": 85589, "epoch": 2037} {"train_loss": -6.1773786544799805, "global_step": 85590, "epoch": 2037} {"train_loss": -6.143473148345947, "global_step": 85591, "epoch": 2037} {"train_loss": -6.1138739585876465, "global_step": 85592, "epoch": 2037} {"train_loss": -6.241204738616943, "global_step": 85593, "epoch": 2037} {"train_loss": -6.0978851318359375, "global_step": 85594, "epoch": 2037} {"train_loss": -6.125921249389648, "global_step": 85595, "epoch": 2037, "val_loss": 67733.9375} {"train_loss": -6.158396244049072, "global_step": 85596, "epoch": 2038} {"train_loss": -6.203112602233887, "global_step": 85597, "epoch": 2038} {"train_loss": -6.254179954528809, "global_step": 85598, "epoch": 2038} {"train_loss": -6.072633266448975, "global_step": 85599, "epoch": 2038} {"train_loss": -6.041751861572266, "global_step": 85600, "epoch": 2038} {"train_loss": -6.085366725921631, "global_step": 85601, "epoch": 2038} {"train_loss": -6.1187262535095215, "global_step": 85602, "epoch": 2038} {"train_loss": -6.1557841300964355, "global_step": 85603, "epoch": 2038} {"train_loss": -6.0539631843566895, "global_step": 85604, "epoch": 2038} {"train_loss": -6.315334320068359, "global_step": 85605, "epoch": 2038} {"train_loss": -6.1130547523498535, "global_step": 85606, "epoch": 2038} {"train_loss": -6.180727005004883, "global_step": 85607, "epoch": 2038} {"train_loss": -6.165579795837402, "global_step": 85608, "epoch": 2038} {"train_loss": -6.169607162475586, "global_step": 85609, "epoch": 2038} {"train_loss": -6.164193153381348, "global_step": 85610, "epoch": 2038} {"train_loss": -6.140066146850586, "global_step": 85611, "epoch": 2038} {"train_loss": -6.142065048217773, "global_step": 85612, "epoch": 2038} {"train_loss": -6.303038120269775, "global_step": 85613, "epoch": 2038} {"train_loss": -6.139130592346191, "global_step": 85614, "epoch": 2038} {"train_loss": -6.228124618530273, "global_step": 85615, "epoch": 2038} {"train_loss": -6.097456455230713, "global_step": 85616, "epoch": 2038} {"train_loss": -6.2392659187316895, "global_step": 85617, "epoch": 2038} {"train_loss": -6.266417503356934, "global_step": 85618, "epoch": 2038} {"train_loss": -6.232326030731201, "global_step": 85619, "epoch": 2038} {"train_loss": -6.09339714050293, "global_step": 85620, "epoch": 2038} {"train_loss": -6.167631149291992, "global_step": 85621, "epoch": 2038} {"train_loss": -6.071531295776367, "global_step": 85622, "epoch": 2038} {"train_loss": -6.151622772216797, "global_step": 85623, "epoch": 2038} {"train_loss": -6.242718696594238, "global_step": 85624, "epoch": 2038} {"train_loss": -6.231459617614746, "global_step": 85625, "epoch": 2038} {"train_loss": -6.210893630981445, "global_step": 85626, "epoch": 2038} {"train_loss": -6.068610191345215, "global_step": 85627, "epoch": 2038} {"train_loss": -6.255941390991211, "global_step": 85628, "epoch": 2038} {"train_loss": -6.150216102600098, "global_step": 85629, "epoch": 2038} {"train_loss": -6.191789150238037, "global_step": 85630, "epoch": 2038} {"train_loss": -6.141266822814941, "global_step": 85631, "epoch": 2038} {"train_loss": -6.229435920715332, "global_step": 85632, "epoch": 2038} {"train_loss": -6.326231956481934, "global_step": 85633, "epoch": 2038} {"train_loss": -6.262722015380859, "global_step": 85634, "epoch": 2038} {"train_loss": -6.212167263031006, "global_step": 85635, "epoch": 2038} {"train_loss": -6.229083061218262, "global_step": 85636, "epoch": 2038} {"train_loss": -6.175968317758469, "global_step": 85637, "epoch": 2038, "val_loss": 67753.5078125} {"train_loss": -6.20012092590332, "global_step": 85638, "epoch": 2039} {"train_loss": -6.138349533081055, "global_step": 85639, "epoch": 2039} {"train_loss": -6.209063529968262, "global_step": 85640, "epoch": 2039} {"train_loss": -6.282952308654785, "global_step": 85641, "epoch": 2039} {"train_loss": -6.180262565612793, "global_step": 85642, "epoch": 2039} {"train_loss": -6.247133255004883, "global_step": 85643, "epoch": 2039} {"train_loss": -6.213220119476318, "global_step": 85644, "epoch": 2039} {"train_loss": -6.039224624633789, "global_step": 85645, "epoch": 2039} {"train_loss": -6.2135539054870605, "global_step": 85646, "epoch": 2039} {"train_loss": -6.170292854309082, "global_step": 85647, "epoch": 2039} {"train_loss": -6.3040056228637695, "global_step": 85648, "epoch": 2039} {"train_loss": -6.122314453125, "global_step": 85649, "epoch": 2039} {"train_loss": -6.010740280151367, "global_step": 85650, "epoch": 2039} {"train_loss": -6.14463472366333, "global_step": 85651, "epoch": 2039} {"train_loss": -6.1369428634643555, "global_step": 85652, "epoch": 2039} {"train_loss": -6.15939998626709, "global_step": 85653, "epoch": 2039} {"train_loss": -6.211367130279541, "global_step": 85654, "epoch": 2039} {"train_loss": -6.21751594543457, "global_step": 85655, "epoch": 2039} {"train_loss": -6.2041826248168945, "global_step": 85656, "epoch": 2039} {"train_loss": -5.997478485107422, "global_step": 85657, "epoch": 2039} {"train_loss": -6.116102695465088, "global_step": 85658, "epoch": 2039} {"train_loss": -6.2813215255737305, "global_step": 85659, "epoch": 2039} {"train_loss": -6.192143440246582, "global_step": 85660, "epoch": 2039} {"train_loss": -6.2140631675720215, "global_step": 85661, "epoch": 2039} {"train_loss": -6.056468963623047, "global_step": 85662, "epoch": 2039} {"train_loss": -6.119040489196777, "global_step": 85663, "epoch": 2039} {"train_loss": -6.087677955627441, "global_step": 85664, "epoch": 2039} {"train_loss": -6.155877113342285, "global_step": 85665, "epoch": 2039} {"train_loss": -6.208097457885742, "global_step": 85666, "epoch": 2039} {"train_loss": -6.010655403137207, "global_step": 85667, "epoch": 2039} {"train_loss": -5.981509685516357, "global_step": 85668, "epoch": 2039} {"train_loss": -6.124507904052734, "global_step": 85669, "epoch": 2039} {"train_loss": -6.03333854675293, "global_step": 85670, "epoch": 2039} {"train_loss": -6.125962257385254, "global_step": 85671, "epoch": 2039} {"train_loss": -5.929893493652344, "global_step": 85672, "epoch": 2039} {"train_loss": -6.096755027770996, "global_step": 85673, "epoch": 2039} {"train_loss": -6.057844161987305, "global_step": 85674, "epoch": 2039} {"train_loss": -6.138810157775879, "global_step": 85675, "epoch": 2039} {"train_loss": -6.081879615783691, "global_step": 85676, "epoch": 2039} {"train_loss": -6.061822891235352, "global_step": 85677, "epoch": 2039} {"train_loss": -6.233245849609375, "global_step": 85678, "epoch": 2039} {"train_loss": -6.138187510626657, "global_step": 85679, "epoch": 2039, "val_loss": 67717.96875} {"train_loss": -6.251632213592529, "global_step": 85680, "epoch": 2040} {"train_loss": -6.302361488342285, "global_step": 85681, "epoch": 2040} {"train_loss": -6.252333641052246, "global_step": 85682, "epoch": 2040} {"train_loss": -6.055393218994141, "global_step": 85683, "epoch": 2040} {"train_loss": -6.086586952209473, "global_step": 85684, "epoch": 2040} {"train_loss": -6.172590255737305, "global_step": 85685, "epoch": 2040} {"train_loss": -6.21240758895874, "global_step": 85686, "epoch": 2040} {"train_loss": -6.221236228942871, "global_step": 85687, "epoch": 2040} {"train_loss": -6.04176139831543, "global_step": 85688, "epoch": 2040} {"train_loss": -6.1700439453125, "global_step": 85689, "epoch": 2040} {"train_loss": -6.216172218322754, "global_step": 85690, "epoch": 2040} {"train_loss": -6.201613426208496, "global_step": 85691, "epoch": 2040} {"train_loss": -6.106222152709961, "global_step": 85692, "epoch": 2040} {"train_loss": -6.0966057777404785, "global_step": 85693, "epoch": 2040} {"train_loss": -6.1637773513793945, "global_step": 85694, "epoch": 2040} {"train_loss": -6.294679641723633, "global_step": 85695, "epoch": 2040} {"train_loss": -6.240101337432861, "global_step": 85696, "epoch": 2040} {"train_loss": -6.151888847351074, "global_step": 85697, "epoch": 2040} {"train_loss": -6.110431671142578, "global_step": 85698, "epoch": 2040} {"train_loss": -6.125353813171387, "global_step": 85699, "epoch": 2040} {"train_loss": -6.218973159790039, "global_step": 85700, "epoch": 2040} {"train_loss": -6.240157127380371, "global_step": 85701, "epoch": 2040} {"train_loss": -6.233011245727539, "global_step": 85702, "epoch": 2040} {"train_loss": -6.104118824005127, "global_step": 85703, "epoch": 2040} {"train_loss": -6.217113971710205, "global_step": 85704, "epoch": 2040} {"train_loss": -6.27159309387207, "global_step": 85705, "epoch": 2040} {"train_loss": -6.219998359680176, "global_step": 85706, "epoch": 2040} {"train_loss": -6.256165027618408, "global_step": 85707, "epoch": 2040} {"train_loss": -6.3390421867370605, "global_step": 85708, "epoch": 2040} {"train_loss": -6.088693141937256, "global_step": 85709, "epoch": 2040} {"train_loss": -6.201199531555176, "global_step": 85710, "epoch": 2040} {"train_loss": -6.153820037841797, "global_step": 85711, "epoch": 2040} {"train_loss": -6.16805362701416, "global_step": 85712, "epoch": 2040} {"train_loss": -6.380618095397949, "global_step": 85713, "epoch": 2040} {"train_loss": -6.213345527648926, "global_step": 85714, "epoch": 2040} {"train_loss": -6.191329002380371, "global_step": 85715, "epoch": 2040} {"train_loss": -6.220029830932617, "global_step": 85716, "epoch": 2040} {"train_loss": -6.26679801940918, "global_step": 85717, "epoch": 2040} {"train_loss": -6.1942853927612305, "global_step": 85718, "epoch": 2040} {"train_loss": -6.099103927612305, "global_step": 85719, "epoch": 2040} {"train_loss": -6.1634111404418945, "global_step": 85720, "epoch": 2040} {"train_loss": -6.1911673318772085, "global_step": 85721, "epoch": 2040, "val_loss": 67877.53125} {"train_loss": -6.1956892013549805, "global_step": 85722, "epoch": 2041} {"train_loss": -6.2582831382751465, "global_step": 85723, "epoch": 2041} {"train_loss": -6.306666851043701, "global_step": 85724, "epoch": 2041} {"train_loss": -6.209686279296875, "global_step": 85725, "epoch": 2041} {"train_loss": -6.293752670288086, "global_step": 85726, "epoch": 2041} {"train_loss": -6.277993202209473, "global_step": 85727, "epoch": 2041} {"train_loss": -6.146552562713623, "global_step": 85728, "epoch": 2041} {"train_loss": -6.179998397827148, "global_step": 85729, "epoch": 2041} {"train_loss": -6.182699203491211, "global_step": 85730, "epoch": 2041} {"train_loss": -6.192685127258301, "global_step": 85731, "epoch": 2041} {"train_loss": -6.271658897399902, "global_step": 85732, "epoch": 2041} {"train_loss": -6.137701988220215, "global_step": 85733, "epoch": 2041} {"train_loss": -6.325955390930176, "global_step": 85734, "epoch": 2041} {"train_loss": -6.250690460205078, "global_step": 85735, "epoch": 2041} {"train_loss": -6.133503437042236, "global_step": 85736, "epoch": 2041} {"train_loss": -6.28562068939209, "global_step": 85737, "epoch": 2041} {"train_loss": -6.212133407592773, "global_step": 85738, "epoch": 2041} {"train_loss": -6.225425720214844, "global_step": 85739, "epoch": 2041} {"train_loss": -6.132250785827637, "global_step": 85740, "epoch": 2041} {"train_loss": -6.058941841125488, "global_step": 85741, "epoch": 2041} {"train_loss": -6.141720294952393, "global_step": 85742, "epoch": 2041} {"train_loss": -6.087030410766602, "global_step": 85743, "epoch": 2041} {"train_loss": -6.286442756652832, "global_step": 85744, "epoch": 2041} {"train_loss": -6.1410231590271, "global_step": 85745, "epoch": 2041} {"train_loss": -6.238737106323242, "global_step": 85746, "epoch": 2041} {"train_loss": -6.281583786010742, "global_step": 85747, "epoch": 2041} {"train_loss": -6.226625919342041, "global_step": 85748, "epoch": 2041} {"train_loss": -6.250668525695801, "global_step": 85749, "epoch": 2041} {"train_loss": -6.225008010864258, "global_step": 85750, "epoch": 2041} {"train_loss": -6.154986381530762, "global_step": 85751, "epoch": 2041} {"train_loss": -6.30375862121582, "global_step": 85752, "epoch": 2041} {"train_loss": -6.253482341766357, "global_step": 85753, "epoch": 2041} {"train_loss": -6.196836471557617, "global_step": 85754, "epoch": 2041} {"train_loss": -6.1937384605407715, "global_step": 85755, "epoch": 2041} {"train_loss": -6.210112571716309, "global_step": 85756, "epoch": 2041} {"train_loss": -6.077572822570801, "global_step": 85757, "epoch": 2041} {"train_loss": -6.225833892822266, "global_step": 85758, "epoch": 2041} {"train_loss": -6.169497489929199, "global_step": 85759, "epoch": 2041} {"train_loss": -6.13047981262207, "global_step": 85760, "epoch": 2041} {"train_loss": -6.041831016540527, "global_step": 85761, "epoch": 2041} {"train_loss": -6.2153120040893555, "global_step": 85762, "epoch": 2041} {"train_loss": -6.2018696921212335, "global_step": 85763, "epoch": 2041, "val_loss": 67850.5} {"train_loss": -6.068362236022949, "global_step": 85764, "epoch": 2042} {"train_loss": -6.269625663757324, "global_step": 85765, "epoch": 2042} {"train_loss": -5.997237682342529, "global_step": 85766, "epoch": 2042} {"train_loss": -6.273078918457031, "global_step": 85767, "epoch": 2042} {"train_loss": -6.108705043792725, "global_step": 85768, "epoch": 2042} {"train_loss": -6.1188530921936035, "global_step": 85769, "epoch": 2042} {"train_loss": -6.311823844909668, "global_step": 85770, "epoch": 2042} {"train_loss": -6.174442291259766, "global_step": 85771, "epoch": 2042} {"train_loss": -6.2552714347839355, "global_step": 85772, "epoch": 2042} {"train_loss": -6.123910903930664, "global_step": 85773, "epoch": 2042} {"train_loss": -6.2252516746521, "global_step": 85774, "epoch": 2042} {"train_loss": -6.108711242675781, "global_step": 85775, "epoch": 2042} {"train_loss": -6.069469451904297, "global_step": 85776, "epoch": 2042} {"train_loss": -6.102507591247559, "global_step": 85777, "epoch": 2042} {"train_loss": -6.026140213012695, "global_step": 85778, "epoch": 2042} {"train_loss": -6.227725028991699, "global_step": 85779, "epoch": 2042} {"train_loss": -6.040291786193848, "global_step": 85780, "epoch": 2042} {"train_loss": -6.22234582901001, "global_step": 85781, "epoch": 2042} {"train_loss": -6.081960678100586, "global_step": 85782, "epoch": 2042} {"train_loss": -6.170035362243652, "global_step": 85783, "epoch": 2042} {"train_loss": -6.097308158874512, "global_step": 85784, "epoch": 2042} {"train_loss": -6.079521179199219, "global_step": 85785, "epoch": 2042} {"train_loss": -6.146461486816406, "global_step": 85786, "epoch": 2042} {"train_loss": -6.106853485107422, "global_step": 85787, "epoch": 2042} {"train_loss": -6.106040000915527, "global_step": 85788, "epoch": 2042} {"train_loss": -6.099215984344482, "global_step": 85789, "epoch": 2042} {"train_loss": -6.115370750427246, "global_step": 85790, "epoch": 2042} {"train_loss": -6.1299848556518555, "global_step": 85791, "epoch": 2042} {"train_loss": -6.186434745788574, "global_step": 85792, "epoch": 2042} {"train_loss": -6.266450881958008, "global_step": 85793, "epoch": 2042} {"train_loss": -6.0108160972595215, "global_step": 85794, "epoch": 2042} {"train_loss": -6.149425506591797, "global_step": 85795, "epoch": 2042} {"train_loss": -6.115766525268555, "global_step": 85796, "epoch": 2042} {"train_loss": -6.134496688842773, "global_step": 85797, "epoch": 2042} {"train_loss": -6.103893280029297, "global_step": 85798, "epoch": 2042} {"train_loss": -6.008420467376709, "global_step": 85799, "epoch": 2042} {"train_loss": -6.022021770477295, "global_step": 85800, "epoch": 2042} {"train_loss": -6.175876140594482, "global_step": 85801, "epoch": 2042} {"train_loss": -6.118148326873779, "global_step": 85802, "epoch": 2042} {"train_loss": -6.093757629394531, "global_step": 85803, "epoch": 2042} {"train_loss": -6.042551040649414, "global_step": 85804, "epoch": 2042} {"train_loss": -6.128583703722272, "global_step": 85805, "epoch": 2042, "val_loss": 67768.7578125} {"train_loss": -6.217710971832275, "global_step": 85806, "epoch": 2043} {"train_loss": -6.067418098449707, "global_step": 85807, "epoch": 2043} {"train_loss": -6.098250865936279, "global_step": 85808, "epoch": 2043} {"train_loss": -6.083707332611084, "global_step": 85809, "epoch": 2043} {"train_loss": -6.155097007751465, "global_step": 85810, "epoch": 2043} {"train_loss": -6.101753234863281, "global_step": 85811, "epoch": 2043} {"train_loss": -6.0816731452941895, "global_step": 85812, "epoch": 2043} {"train_loss": -6.136704444885254, "global_step": 85813, "epoch": 2043} {"train_loss": -6.01270055770874, "global_step": 85814, "epoch": 2043} {"train_loss": -6.184267997741699, "global_step": 85815, "epoch": 2043} {"train_loss": -6.16877555847168, "global_step": 85816, "epoch": 2043} {"train_loss": -6.218461036682129, "global_step": 85817, "epoch": 2043} {"train_loss": -6.18977165222168, "global_step": 85818, "epoch": 2043} {"train_loss": -6.22316312789917, "global_step": 85819, "epoch": 2043} {"train_loss": -6.1573486328125, "global_step": 85820, "epoch": 2043} {"train_loss": -6.155601501464844, "global_step": 85821, "epoch": 2043} {"train_loss": -6.106291770935059, "global_step": 85822, "epoch": 2043} {"train_loss": -6.2546281814575195, "global_step": 85823, "epoch": 2043} {"train_loss": -6.223842620849609, "global_step": 85824, "epoch": 2043} {"train_loss": -6.257126808166504, "global_step": 85825, "epoch": 2043} {"train_loss": -6.229930877685547, "global_step": 85826, "epoch": 2043} {"train_loss": -6.080005645751953, "global_step": 85827, "epoch": 2043} {"train_loss": -6.3139543533325195, "global_step": 85828, "epoch": 2043} {"train_loss": -6.160316467285156, "global_step": 85829, "epoch": 2043} {"train_loss": -6.188864707946777, "global_step": 85830, "epoch": 2043} {"train_loss": -6.202795028686523, "global_step": 85831, "epoch": 2043} {"train_loss": -6.238126754760742, "global_step": 85832, "epoch": 2043} {"train_loss": -6.237653732299805, "global_step": 85833, "epoch": 2043} {"train_loss": -6.244290828704834, "global_step": 85834, "epoch": 2043} {"train_loss": -6.216274261474609, "global_step": 85835, "epoch": 2043} {"train_loss": -6.1912946701049805, "global_step": 85836, "epoch": 2043} {"train_loss": -6.213095664978027, "global_step": 85837, "epoch": 2043} {"train_loss": -6.22196102142334, "global_step": 85838, "epoch": 2043} {"train_loss": -6.172418594360352, "global_step": 85839, "epoch": 2043} {"train_loss": -6.228212356567383, "global_step": 85840, "epoch": 2043} {"train_loss": -6.196900367736816, "global_step": 85841, "epoch": 2043} {"train_loss": -6.244261741638184, "global_step": 85842, "epoch": 2043} {"train_loss": -6.221859931945801, "global_step": 85843, "epoch": 2043} {"train_loss": -6.192765235900879, "global_step": 85844, "epoch": 2043} {"train_loss": -6.130997657775879, "global_step": 85845, "epoch": 2043} {"train_loss": -6.186915874481201, "global_step": 85846, "epoch": 2043} {"train_loss": -6.181056068057106, "global_step": 85847, "epoch": 2043, "val_loss": 67598.28125} {"train_loss": -6.264957427978516, "global_step": 85848, "epoch": 2044} {"train_loss": -6.207279682159424, "global_step": 85849, "epoch": 2044} {"train_loss": -6.224111557006836, "global_step": 85850, "epoch": 2044} {"train_loss": -6.343712329864502, "global_step": 85851, "epoch": 2044} {"train_loss": -6.226064205169678, "global_step": 85852, "epoch": 2044} {"train_loss": -6.189399719238281, "global_step": 85853, "epoch": 2044} {"train_loss": -6.244762897491455, "global_step": 85854, "epoch": 2044} {"train_loss": -6.153047561645508, "global_step": 85855, "epoch": 2044} {"train_loss": -6.195130348205566, "global_step": 85856, "epoch": 2044} {"train_loss": -6.155129432678223, "global_step": 85857, "epoch": 2044} {"train_loss": -6.182154655456543, "global_step": 85858, "epoch": 2044} {"train_loss": -6.165652275085449, "global_step": 85859, "epoch": 2044} {"train_loss": -6.241800785064697, "global_step": 85860, "epoch": 2044} {"train_loss": -6.201251983642578, "global_step": 85861, "epoch": 2044} {"train_loss": -6.1419358253479, "global_step": 85862, "epoch": 2044} {"train_loss": -6.275940418243408, "global_step": 85863, "epoch": 2044} {"train_loss": -6.207742214202881, "global_step": 85864, "epoch": 2044} {"train_loss": -6.100315570831299, "global_step": 85865, "epoch": 2044} {"train_loss": -6.155986785888672, "global_step": 85866, "epoch": 2044} {"train_loss": -6.062941551208496, "global_step": 85867, "epoch": 2044} {"train_loss": -6.058238506317139, "global_step": 85868, "epoch": 2044} {"train_loss": -6.152423858642578, "global_step": 85869, "epoch": 2044} {"train_loss": -6.1771368980407715, "global_step": 85870, "epoch": 2044} {"train_loss": -6.156231880187988, "global_step": 85871, "epoch": 2044} {"train_loss": -6.149031639099121, "global_step": 85872, "epoch": 2044} {"train_loss": -6.181266784667969, "global_step": 85873, "epoch": 2044} {"train_loss": -6.1275410652160645, "global_step": 85874, "epoch": 2044} {"train_loss": -6.2147932052612305, "global_step": 85875, "epoch": 2044} {"train_loss": -6.197680473327637, "global_step": 85876, "epoch": 2044} {"train_loss": -6.212769508361816, "global_step": 85877, "epoch": 2044} {"train_loss": -6.127901554107666, "global_step": 85878, "epoch": 2044} {"train_loss": -6.221808433532715, "global_step": 85879, "epoch": 2044} {"train_loss": -6.108536720275879, "global_step": 85880, "epoch": 2044} {"train_loss": -6.192988395690918, "global_step": 85881, "epoch": 2044} {"train_loss": -6.192306995391846, "global_step": 85882, "epoch": 2044} {"train_loss": -6.12806510925293, "global_step": 85883, "epoch": 2044} {"train_loss": -6.124117851257324, "global_step": 85884, "epoch": 2044} {"train_loss": -6.187005043029785, "global_step": 85885, "epoch": 2044} {"train_loss": -6.2407379150390625, "global_step": 85886, "epoch": 2044} {"train_loss": -6.140534400939941, "global_step": 85887, "epoch": 2044} {"train_loss": -6.174454689025879, "global_step": 85888, "epoch": 2044} {"train_loss": -6.1822172573634555, "global_step": 85889, "epoch": 2044, "val_loss": 67810.78125} {"train_loss": -6.1432390213012695, "global_step": 85890, "epoch": 2045} {"train_loss": -6.247427940368652, "global_step": 85891, "epoch": 2045} {"train_loss": -6.175405502319336, "global_step": 85892, "epoch": 2045} {"train_loss": -6.148929595947266, "global_step": 85893, "epoch": 2045} {"train_loss": -6.253378868103027, "global_step": 85894, "epoch": 2045} {"train_loss": -6.1030707359313965, "global_step": 85895, "epoch": 2045} {"train_loss": -6.264784812927246, "global_step": 85896, "epoch": 2045} {"train_loss": -6.221325397491455, "global_step": 85897, "epoch": 2045} {"train_loss": -6.244480609893799, "global_step": 85898, "epoch": 2045} {"train_loss": -6.231890678405762, "global_step": 85899, "epoch": 2045} {"train_loss": -6.203673839569092, "global_step": 85900, "epoch": 2045} {"train_loss": -6.2100725173950195, "global_step": 85901, "epoch": 2045} {"train_loss": -6.247196197509766, "global_step": 85902, "epoch": 2045} {"train_loss": -6.0714216232299805, "global_step": 85903, "epoch": 2045} {"train_loss": -6.221047401428223, "global_step": 85904, "epoch": 2045} {"train_loss": -6.236176013946533, "global_step": 85905, "epoch": 2045} {"train_loss": -6.145208358764648, "global_step": 85906, "epoch": 2045} {"train_loss": -6.1200714111328125, "global_step": 85907, "epoch": 2045} {"train_loss": -6.164899826049805, "global_step": 85908, "epoch": 2045} {"train_loss": -6.261312007904053, "global_step": 85909, "epoch": 2045} {"train_loss": -6.1382246017456055, "global_step": 85910, "epoch": 2045} {"train_loss": -6.149776935577393, "global_step": 85911, "epoch": 2045} {"train_loss": -6.09837532043457, "global_step": 85912, "epoch": 2045} {"train_loss": -6.068897247314453, "global_step": 85913, "epoch": 2045} {"train_loss": -6.172028541564941, "global_step": 85914, "epoch": 2045} {"train_loss": -6.146328926086426, "global_step": 85915, "epoch": 2045} {"train_loss": -6.193801403045654, "global_step": 85916, "epoch": 2045} {"train_loss": -6.132534027099609, "global_step": 85917, "epoch": 2045} {"train_loss": -6.143918514251709, "global_step": 85918, "epoch": 2045} {"train_loss": -6.219289302825928, "global_step": 85919, "epoch": 2045} {"train_loss": -6.093890190124512, "global_step": 85920, "epoch": 2045} {"train_loss": -6.166532516479492, "global_step": 85921, "epoch": 2045} {"train_loss": -6.2135138511657715, "global_step": 85922, "epoch": 2045} {"train_loss": -6.118354320526123, "global_step": 85923, "epoch": 2045} {"train_loss": -6.158434867858887, "global_step": 85924, "epoch": 2045} {"train_loss": -6.208359718322754, "global_step": 85925, "epoch": 2045} {"train_loss": -6.205230712890625, "global_step": 85926, "epoch": 2045} {"train_loss": -6.282662391662598, "global_step": 85927, "epoch": 2045} {"train_loss": -6.177921295166016, "global_step": 85928, "epoch": 2045} {"train_loss": -6.173179626464844, "global_step": 85929, "epoch": 2045} {"train_loss": -6.153778076171875, "global_step": 85930, "epoch": 2045} {"train_loss": -6.1783961568559915, "global_step": 85931, "epoch": 2045, "val_loss": 67912.0625} {"train_loss": -6.213125228881836, "global_step": 85932, "epoch": 2046} {"train_loss": -6.170746803283691, "global_step": 85933, "epoch": 2046} {"train_loss": -6.103891372680664, "global_step": 85934, "epoch": 2046} {"train_loss": -6.197391510009766, "global_step": 85935, "epoch": 2046} {"train_loss": -6.10733699798584, "global_step": 85936, "epoch": 2046} {"train_loss": -6.112588405609131, "global_step": 85937, "epoch": 2046} {"train_loss": -6.17494535446167, "global_step": 85938, "epoch": 2046} {"train_loss": -6.2034502029418945, "global_step": 85939, "epoch": 2046} {"train_loss": -6.155526638031006, "global_step": 85940, "epoch": 2046} {"train_loss": -6.257895469665527, "global_step": 85941, "epoch": 2046} {"train_loss": -6.026234149932861, "global_step": 85942, "epoch": 2046} {"train_loss": -6.250890731811523, "global_step": 85943, "epoch": 2046} {"train_loss": -6.325277328491211, "global_step": 85944, "epoch": 2046} {"train_loss": -6.323441505432129, "global_step": 85945, "epoch": 2046} {"train_loss": -6.236688613891602, "global_step": 85946, "epoch": 2046} {"train_loss": -6.26479434967041, "global_step": 85947, "epoch": 2046} {"train_loss": -6.166339874267578, "global_step": 85948, "epoch": 2046} {"train_loss": -6.18027400970459, "global_step": 85949, "epoch": 2046} {"train_loss": -6.2824506759643555, "global_step": 85950, "epoch": 2046} {"train_loss": -6.17863655090332, "global_step": 85951, "epoch": 2046} {"train_loss": -6.150594234466553, "global_step": 85952, "epoch": 2046} {"train_loss": -6.175060749053955, "global_step": 85953, "epoch": 2046} {"train_loss": -6.037158966064453, "global_step": 85954, "epoch": 2046} {"train_loss": -6.071462631225586, "global_step": 85955, "epoch": 2046} {"train_loss": -6.165866851806641, "global_step": 85956, "epoch": 2046} {"train_loss": -6.214944839477539, "global_step": 85957, "epoch": 2046} {"train_loss": -6.199909687042236, "global_step": 85958, "epoch": 2046} {"train_loss": -6.179231643676758, "global_step": 85959, "epoch": 2046} {"train_loss": -6.169216632843018, "global_step": 85960, "epoch": 2046} {"train_loss": -6.084408760070801, "global_step": 85961, "epoch": 2046} {"train_loss": -6.167069435119629, "global_step": 85962, "epoch": 2046} {"train_loss": -6.126903533935547, "global_step": 85963, "epoch": 2046} {"train_loss": -6.157434463500977, "global_step": 85964, "epoch": 2046} {"train_loss": -6.2102484703063965, "global_step": 85965, "epoch": 2046} {"train_loss": -6.285973072052002, "global_step": 85966, "epoch": 2046} {"train_loss": -6.250442981719971, "global_step": 85967, "epoch": 2046} {"train_loss": -6.287211894989014, "global_step": 85968, "epoch": 2046} {"train_loss": -6.223615646362305, "global_step": 85969, "epoch": 2046} {"train_loss": -6.159930229187012, "global_step": 85970, "epoch": 2046} {"train_loss": -6.226157188415527, "global_step": 85971, "epoch": 2046} {"train_loss": -6.157577991485596, "global_step": 85972, "epoch": 2046} {"train_loss": -6.187137910297939, "global_step": 85973, "epoch": 2046, "val_loss": 67902.46875} {"train_loss": -6.22468376159668, "global_step": 85974, "epoch": 2047} {"train_loss": -6.247464656829834, "global_step": 85975, "epoch": 2047} {"train_loss": -6.170255184173584, "global_step": 85976, "epoch": 2047} {"train_loss": -6.270684242248535, "global_step": 85977, "epoch": 2047} {"train_loss": -6.21850061416626, "global_step": 85978, "epoch": 2047} {"train_loss": -6.160400867462158, "global_step": 85979, "epoch": 2047} {"train_loss": -6.24887752532959, "global_step": 85980, "epoch": 2047} {"train_loss": -6.182494163513184, "global_step": 85981, "epoch": 2047} {"train_loss": -6.250068187713623, "global_step": 85982, "epoch": 2047} {"train_loss": -6.15952205657959, "global_step": 85983, "epoch": 2047} {"train_loss": -6.152911186218262, "global_step": 85984, "epoch": 2047} {"train_loss": -6.285091876983643, "global_step": 85985, "epoch": 2047} {"train_loss": -6.166217803955078, "global_step": 85986, "epoch": 2047} {"train_loss": -6.3074517250061035, "global_step": 85987, "epoch": 2047} {"train_loss": -6.168676853179932, "global_step": 85988, "epoch": 2047} {"train_loss": -6.153842926025391, "global_step": 85989, "epoch": 2047} {"train_loss": -6.296989440917969, "global_step": 85990, "epoch": 2047} {"train_loss": -6.241667747497559, "global_step": 85991, "epoch": 2047} {"train_loss": -6.187952995300293, "global_step": 85992, "epoch": 2047} {"train_loss": -6.396880626678467, "global_step": 85993, "epoch": 2047} {"train_loss": -6.124634742736816, "global_step": 85994, "epoch": 2047} {"train_loss": -6.199087142944336, "global_step": 85995, "epoch": 2047} {"train_loss": -6.211106777191162, "global_step": 85996, "epoch": 2047} {"train_loss": -6.199163913726807, "global_step": 85997, "epoch": 2047} {"train_loss": -6.135551452636719, "global_step": 85998, "epoch": 2047} {"train_loss": -6.24106502532959, "global_step": 85999, "epoch": 2047} {"train_loss": -6.210664749145508, "global_step": 86000, "epoch": 2047} {"train_loss": -6.266541004180908, "global_step": 86001, "epoch": 2047} {"train_loss": -6.146439552307129, "global_step": 86002, "epoch": 2047} {"train_loss": -6.15864896774292, "global_step": 86003, "epoch": 2047} {"train_loss": -6.151381492614746, "global_step": 86004, "epoch": 2047} {"train_loss": -6.270018577575684, "global_step": 86005, "epoch": 2047} {"train_loss": -6.279826641082764, "global_step": 86006, "epoch": 2047} {"train_loss": -6.202649116516113, "global_step": 86007, "epoch": 2047} {"train_loss": -6.1721038818359375, "global_step": 86008, "epoch": 2047} {"train_loss": -6.247722625732422, "global_step": 86009, "epoch": 2047} {"train_loss": -6.112135410308838, "global_step": 86010, "epoch": 2047} {"train_loss": -6.205395221710205, "global_step": 86011, "epoch": 2047} {"train_loss": -6.204314708709717, "global_step": 86012, "epoch": 2047} {"train_loss": -6.242232799530029, "global_step": 86013, "epoch": 2047} {"train_loss": -6.216690540313721, "global_step": 86014, "epoch": 2047} {"train_loss": -6.211321217673166, "global_step": 86015, "epoch": 2047, "val_loss": 67657.7109375} {"train_loss": -6.215062618255615, "global_step": 86016, "epoch": 2048} {"train_loss": -6.149102210998535, "global_step": 86017, "epoch": 2048} {"train_loss": -6.196658134460449, "global_step": 86018, "epoch": 2048} {"train_loss": -6.224017143249512, "global_step": 86019, "epoch": 2048} {"train_loss": -6.206851959228516, "global_step": 86020, "epoch": 2048} {"train_loss": -6.249540328979492, "global_step": 86021, "epoch": 2048} {"train_loss": -6.27271842956543, "global_step": 86022, "epoch": 2048} {"train_loss": -6.300379753112793, "global_step": 86023, "epoch": 2048} {"train_loss": -6.096934795379639, "global_step": 86024, "epoch": 2048} {"train_loss": -6.218143939971924, "global_step": 86025, "epoch": 2048} {"train_loss": -6.2877607345581055, "global_step": 86026, "epoch": 2048} {"train_loss": -6.151301860809326, "global_step": 86027, "epoch": 2048} {"train_loss": -6.152305603027344, "global_step": 86028, "epoch": 2048} {"train_loss": -6.305336952209473, "global_step": 86029, "epoch": 2048} {"train_loss": -6.268249034881592, "global_step": 86030, "epoch": 2048} {"train_loss": -6.048873424530029, "global_step": 86031, "epoch": 2048} {"train_loss": -6.223318099975586, "global_step": 86032, "epoch": 2048} {"train_loss": -6.126940727233887, "global_step": 86033, "epoch": 2048} {"train_loss": -6.08046817779541, "global_step": 86034, "epoch": 2048} {"train_loss": -6.228267192840576, "global_step": 86035, "epoch": 2048} {"train_loss": -6.194588661193848, "global_step": 86036, "epoch": 2048} {"train_loss": -6.246675491333008, "global_step": 86037, "epoch": 2048} {"train_loss": -6.149621963500977, "global_step": 86038, "epoch": 2048} {"train_loss": -6.226174831390381, "global_step": 86039, "epoch": 2048} {"train_loss": -6.160088062286377, "global_step": 86040, "epoch": 2048} {"train_loss": -6.174692153930664, "global_step": 86041, "epoch": 2048} {"train_loss": -6.244861602783203, "global_step": 86042, "epoch": 2048} {"train_loss": -6.066298007965088, "global_step": 86043, "epoch": 2048} {"train_loss": -6.241028785705566, "global_step": 86044, "epoch": 2048} {"train_loss": -6.2101640701293945, "global_step": 86045, "epoch": 2048} {"train_loss": -6.105315208435059, "global_step": 86046, "epoch": 2048} {"train_loss": -6.125825881958008, "global_step": 86047, "epoch": 2048} {"train_loss": -6.083276748657227, "global_step": 86048, "epoch": 2048} {"train_loss": -6.180513381958008, "global_step": 86049, "epoch": 2048} {"train_loss": -6.0189313888549805, "global_step": 86050, "epoch": 2048} {"train_loss": -6.009832859039307, "global_step": 86051, "epoch": 2048} {"train_loss": -6.1756181716918945, "global_step": 86052, "epoch": 2048} {"train_loss": -6.186397552490234, "global_step": 86053, "epoch": 2048} {"train_loss": -6.11964750289917, "global_step": 86054, "epoch": 2048} {"train_loss": -6.067882537841797, "global_step": 86055, "epoch": 2048} {"train_loss": -6.123452186584473, "global_step": 86056, "epoch": 2048} {"train_loss": -6.172200736545381, "global_step": 86057, "epoch": 2048, "val_loss": 68003.0625} {"train_loss": -6.137272834777832, "global_step": 86058, "epoch": 2049} {"train_loss": -6.043146133422852, "global_step": 86059, "epoch": 2049} {"train_loss": -6.133538246154785, "global_step": 86060, "epoch": 2049} {"train_loss": -6.129955291748047, "global_step": 86061, "epoch": 2049} {"train_loss": -6.272848129272461, "global_step": 86062, "epoch": 2049} {"train_loss": -6.191033363342285, "global_step": 86063, "epoch": 2049} {"train_loss": -6.036964416503906, "global_step": 86064, "epoch": 2049} {"train_loss": -6.108515739440918, "global_step": 86065, "epoch": 2049} {"train_loss": -6.170500755310059, "global_step": 86066, "epoch": 2049} {"train_loss": -6.250626564025879, "global_step": 86067, "epoch": 2049} {"train_loss": -6.126242637634277, "global_step": 86068, "epoch": 2049} {"train_loss": -6.122150421142578, "global_step": 86069, "epoch": 2049} {"train_loss": -6.080666542053223, "global_step": 86070, "epoch": 2049} {"train_loss": -6.095465660095215, "global_step": 86071, "epoch": 2049} {"train_loss": -6.216665267944336, "global_step": 86072, "epoch": 2049} {"train_loss": -6.113588333129883, "global_step": 86073, "epoch": 2049} {"train_loss": -6.19956636428833, "global_step": 86074, "epoch": 2049} {"train_loss": -6.130588531494141, "global_step": 86075, "epoch": 2049} {"train_loss": -6.166247844696045, "global_step": 86076, "epoch": 2049} {"train_loss": -6.068480491638184, "global_step": 86077, "epoch": 2049} {"train_loss": -6.043397903442383, "global_step": 86078, "epoch": 2049} {"train_loss": -6.095314025878906, "global_step": 86079, "epoch": 2049} {"train_loss": -6.2439422607421875, "global_step": 86080, "epoch": 2049} {"train_loss": -6.205852508544922, "global_step": 86081, "epoch": 2049} {"train_loss": -6.169353485107422, "global_step": 86082, "epoch": 2049} {"train_loss": -6.186895370483398, "global_step": 86083, "epoch": 2049} {"train_loss": -6.26824951171875, "global_step": 86084, "epoch": 2049} {"train_loss": -6.124613285064697, "global_step": 86085, "epoch": 2049} {"train_loss": -6.1779913902282715, "global_step": 86086, "epoch": 2049} {"train_loss": -6.191928863525391, "global_step": 86087, "epoch": 2049} {"train_loss": -6.207327842712402, "global_step": 86088, "epoch": 2049} {"train_loss": -6.210054397583008, "global_step": 86089, "epoch": 2049} {"train_loss": -6.34541130065918, "global_step": 86090, "epoch": 2049} {"train_loss": -6.26654577255249, "global_step": 86091, "epoch": 2049} {"train_loss": -6.171730041503906, "global_step": 86092, "epoch": 2049} {"train_loss": -6.215245246887207, "global_step": 86093, "epoch": 2049} {"train_loss": -6.116837978363037, "global_step": 86094, "epoch": 2049} {"train_loss": -6.16176700592041, "global_step": 86095, "epoch": 2049} {"train_loss": -6.182154655456543, "global_step": 86096, "epoch": 2049} {"train_loss": -6.231879234313965, "global_step": 86097, "epoch": 2049} {"train_loss": -6.185030937194824, "global_step": 86098, "epoch": 2049} {"train_loss": -6.167148998805454, "global_step": 86099, "epoch": 2049, "val_loss": 67980.578125} {"train_loss": -6.284659385681152, "global_step": 86100, "epoch": 2050} {"train_loss": -6.263974666595459, "global_step": 86101, "epoch": 2050} {"train_loss": -6.0850067138671875, "global_step": 86102, "epoch": 2050} {"train_loss": -6.110780715942383, "global_step": 86103, "epoch": 2050} {"train_loss": -6.114401340484619, "global_step": 86104, "epoch": 2050} {"train_loss": -6.246460914611816, "global_step": 86105, "epoch": 2050} {"train_loss": -6.266650199890137, "global_step": 86106, "epoch": 2050} {"train_loss": -6.193503379821777, "global_step": 86107, "epoch": 2050} {"train_loss": -6.1786956787109375, "global_step": 86108, "epoch": 2050} {"train_loss": -6.136094570159912, "global_step": 86109, "epoch": 2050} {"train_loss": -6.208895206451416, "global_step": 86110, "epoch": 2050} {"train_loss": -6.228743076324463, "global_step": 86111, "epoch": 2050} {"train_loss": -6.178292274475098, "global_step": 86112, "epoch": 2050} {"train_loss": -6.1243391036987305, "global_step": 86113, "epoch": 2050} {"train_loss": -6.183202743530273, "global_step": 86114, "epoch": 2050} {"train_loss": -6.208274841308594, "global_step": 86115, "epoch": 2050} {"train_loss": -6.2371721267700195, "global_step": 86116, "epoch": 2050} {"train_loss": -6.1356682777404785, "global_step": 86117, "epoch": 2050} {"train_loss": -6.342927932739258, "global_step": 86118, "epoch": 2050} {"train_loss": -6.218488693237305, "global_step": 86119, "epoch": 2050} {"train_loss": -6.243144989013672, "global_step": 86120, "epoch": 2050} {"train_loss": -6.210328102111816, "global_step": 86121, "epoch": 2050} {"train_loss": -6.290180206298828, "global_step": 86122, "epoch": 2050} {"train_loss": -6.226092338562012, "global_step": 86123, "epoch": 2050} {"train_loss": -6.157576560974121, "global_step": 86124, "epoch": 2050} {"train_loss": -6.173417091369629, "global_step": 86125, "epoch": 2050} {"train_loss": -6.331901550292969, "global_step": 86126, "epoch": 2050} {"train_loss": -6.235190391540527, "global_step": 86127, "epoch": 2050} {"train_loss": -6.243108749389648, "global_step": 86128, "epoch": 2050} {"train_loss": -6.206875324249268, "global_step": 86129, "epoch": 2050} {"train_loss": -6.157696723937988, "global_step": 86130, "epoch": 2050} {"train_loss": -6.381799697875977, "global_step": 86131, "epoch": 2050} {"train_loss": -6.206587791442871, "global_step": 86132, "epoch": 2050} {"train_loss": -6.230595588684082, "global_step": 86133, "epoch": 2050} {"train_loss": -6.232521057128906, "global_step": 86134, "epoch": 2050} {"train_loss": -6.192476272583008, "global_step": 86135, "epoch": 2050} {"train_loss": -6.127965450286865, "global_step": 86136, "epoch": 2050} {"train_loss": -6.153476715087891, "global_step": 86137, "epoch": 2050} {"train_loss": -6.2350263595581055, "global_step": 86138, "epoch": 2050} {"train_loss": -6.140523910522461, "global_step": 86139, "epoch": 2050} {"train_loss": -6.137197494506836, "global_step": 86140, "epoch": 2050} {"train_loss": -6.205993686403547, "global_step": 86141, "epoch": 2050, "train/sim_max_reward_0": 0.22265665247486185, "train/sim_max_reward_1": 0.9154027715529919, "train/sim_max_reward_2": 0.8094121605751856, "train/sim_max_reward_3": 0.1462073028124028, "train/sim_max_reward_4": 0.9204587365037435, "train/sim_max_reward_5": 0.9037711628652297, "test/sim_max_reward_4400000": 0.23756898370781837, "test/sim_max_reward_4400001": 0.951607893718814, "test/sim_max_reward_4400002": 0.8103395828961015, "test/sim_max_reward_4400003": 0.9586082991423905, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9228579380207887, "test/sim_max_reward_4400007": 0.8663062175066485, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.741860187237279, "test/sim_max_reward_4400010": 0.9217706000967231, "test/sim_max_reward_4400011": 0.23163464154598054, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.94482865651358, "test/sim_max_reward_4400014": 0.6971616583572576, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.09563723108858681, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.27830991438887726, "test/sim_max_reward_4400019": 0.12767328875688702, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.567095116578102, "test/sim_max_reward_4400023": 0.994420076939443, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.21080932547914277, "test/sim_max_reward_4400026": 0.04814633413635947, "test/sim_max_reward_4400027": 0.05864013440778389, "test/sim_max_reward_4400028": 0.84267075923949, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.031229597183181357, "test/sim_max_reward_4400031": 0.3749608485429921, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.5780700021536291, "test/sim_max_reward_4400034": 0.8705314514157657, "test/sim_max_reward_4400035": 0.8169633352639286, "test/sim_max_reward_4400036": 0.6294526360441581, "test/sim_max_reward_4400037": 0.9878258216678182, "test/sim_max_reward_4400038": 0.21135237070671833, "test/sim_max_reward_4400039": 0.41255357754718064, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9820496004103698, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.8940657709389627, "test/sim_max_reward_4400044": 0.8831914159800484, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.6726109300580315, "test/sim_max_reward_4400047": 0.9824993472060666, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.979115705954547, "train/mean_score": 0.6529847977974025, "test/mean_score": 0.5136566014757848, "val_loss": 67839.3828125} {"train_loss": -6.191901683807373, "global_step": 86142, "epoch": 2051} {"train_loss": -6.252808570861816, "global_step": 86143, "epoch": 2051} {"train_loss": -6.337854862213135, "global_step": 86144, "epoch": 2051} {"train_loss": -6.353341102600098, "global_step": 86145, "epoch": 2051} {"train_loss": -6.225929260253906, "global_step": 86146, "epoch": 2051} {"train_loss": -6.258868217468262, "global_step": 86147, "epoch": 2051} {"train_loss": -6.248944282531738, "global_step": 86148, "epoch": 2051} {"train_loss": -6.195754528045654, "global_step": 86149, "epoch": 2051} {"train_loss": -6.233185768127441, "global_step": 86150, "epoch": 2051} {"train_loss": -6.262943744659424, "global_step": 86151, "epoch": 2051} {"train_loss": -6.132014751434326, "global_step": 86152, "epoch": 2051} {"train_loss": -6.176980972290039, "global_step": 86153, "epoch": 2051} {"train_loss": -6.201665878295898, "global_step": 86154, "epoch": 2051} {"train_loss": -6.102356433868408, "global_step": 86155, "epoch": 2051} {"train_loss": -6.206317901611328, "global_step": 86156, "epoch": 2051} {"train_loss": -6.10076904296875, "global_step": 86157, "epoch": 2051} {"train_loss": -6.2694902420043945, "global_step": 86158, "epoch": 2051} {"train_loss": -6.124530792236328, "global_step": 86159, "epoch": 2051} {"train_loss": -6.204524993896484, "global_step": 86160, "epoch": 2051} {"train_loss": -6.161837577819824, "global_step": 86161, "epoch": 2051} {"train_loss": -6.155675888061523, "global_step": 86162, "epoch": 2051} {"train_loss": -6.316251277923584, "global_step": 86163, "epoch": 2051} {"train_loss": -6.076577663421631, "global_step": 86164, "epoch": 2051} {"train_loss": -6.151887893676758, "global_step": 86165, "epoch": 2051} {"train_loss": -6.177272319793701, "global_step": 86166, "epoch": 2051} {"train_loss": -6.156044960021973, "global_step": 86167, "epoch": 2051} {"train_loss": -6.228540897369385, "global_step": 86168, "epoch": 2051} {"train_loss": -6.181812286376953, "global_step": 86169, "epoch": 2051} {"train_loss": -6.252221584320068, "global_step": 86170, "epoch": 2051} {"train_loss": -6.239604949951172, "global_step": 86171, "epoch": 2051} {"train_loss": -6.263131141662598, "global_step": 86172, "epoch": 2051} {"train_loss": -6.152064800262451, "global_step": 86173, "epoch": 2051} {"train_loss": -6.18504524230957, "global_step": 86174, "epoch": 2051} {"train_loss": -6.264981269836426, "global_step": 86175, "epoch": 2051} {"train_loss": -6.155804634094238, "global_step": 86176, "epoch": 2051} {"train_loss": -6.144505500793457, "global_step": 86177, "epoch": 2051} {"train_loss": -6.11215877532959, "global_step": 86178, "epoch": 2051} {"train_loss": -6.092353820800781, "global_step": 86179, "epoch": 2051} {"train_loss": -6.276785850524902, "global_step": 86180, "epoch": 2051} {"train_loss": -6.206215858459473, "global_step": 86181, "epoch": 2051} {"train_loss": -6.231246471405029, "global_step": 86182, "epoch": 2051} {"train_loss": -6.202214468093145, "global_step": 86183, "epoch": 2051, "val_loss": 67911.171875} {"train_loss": -6.122511863708496, "global_step": 86184, "epoch": 2052} {"train_loss": -6.147498607635498, "global_step": 86185, "epoch": 2052} {"train_loss": -6.164615154266357, "global_step": 86186, "epoch": 2052} {"train_loss": -6.152129173278809, "global_step": 86187, "epoch": 2052} {"train_loss": -6.246658802032471, "global_step": 86188, "epoch": 2052} {"train_loss": -6.182831287384033, "global_step": 86189, "epoch": 2052} {"train_loss": -6.083318710327148, "global_step": 86190, "epoch": 2052} {"train_loss": -6.183017730712891, "global_step": 86191, "epoch": 2052} {"train_loss": -6.227426528930664, "global_step": 86192, "epoch": 2052} {"train_loss": -6.215206623077393, "global_step": 86193, "epoch": 2052} {"train_loss": -6.173053741455078, "global_step": 86194, "epoch": 2052} {"train_loss": -6.1717529296875, "global_step": 86195, "epoch": 2052} {"train_loss": -6.052640914916992, "global_step": 86196, "epoch": 2052} {"train_loss": -6.167358875274658, "global_step": 86197, "epoch": 2052} {"train_loss": -6.201066493988037, "global_step": 86198, "epoch": 2052} {"train_loss": -6.142894268035889, "global_step": 86199, "epoch": 2052} {"train_loss": -6.115483283996582, "global_step": 86200, "epoch": 2052} {"train_loss": -6.0955586433410645, "global_step": 86201, "epoch": 2052} {"train_loss": -6.208114147186279, "global_step": 86202, "epoch": 2052} {"train_loss": -6.203289985656738, "global_step": 86203, "epoch": 2052} {"train_loss": -6.295599937438965, "global_step": 86204, "epoch": 2052} {"train_loss": -6.242310523986816, "global_step": 86205, "epoch": 2052} {"train_loss": -6.262188911437988, "global_step": 86206, "epoch": 2052} {"train_loss": -6.193209648132324, "global_step": 86207, "epoch": 2052} {"train_loss": -5.997962474822998, "global_step": 86208, "epoch": 2052} {"train_loss": -6.210325717926025, "global_step": 86209, "epoch": 2052} {"train_loss": -6.216635704040527, "global_step": 86210, "epoch": 2052} {"train_loss": -6.108171463012695, "global_step": 86211, "epoch": 2052} {"train_loss": -6.156135559082031, "global_step": 86212, "epoch": 2052} {"train_loss": -6.1271209716796875, "global_step": 86213, "epoch": 2052} {"train_loss": -6.196518898010254, "global_step": 86214, "epoch": 2052} {"train_loss": -6.2162604331970215, "global_step": 86215, "epoch": 2052} {"train_loss": -6.23921537399292, "global_step": 86216, "epoch": 2052} {"train_loss": -6.215778350830078, "global_step": 86217, "epoch": 2052} {"train_loss": -6.176832675933838, "global_step": 86218, "epoch": 2052} {"train_loss": -6.130125045776367, "global_step": 86219, "epoch": 2052} {"train_loss": -6.27828311920166, "global_step": 86220, "epoch": 2052} {"train_loss": -6.371366500854492, "global_step": 86221, "epoch": 2052} {"train_loss": -6.225132942199707, "global_step": 86222, "epoch": 2052} {"train_loss": -6.209102153778076, "global_step": 86223, "epoch": 2052} {"train_loss": -6.300067901611328, "global_step": 86224, "epoch": 2052} {"train_loss": -6.18438872836885, "global_step": 86225, "epoch": 2052, "val_loss": 67755.9921875} {"train_loss": -6.258265495300293, "global_step": 86226, "epoch": 2053} {"train_loss": -6.203441619873047, "global_step": 86227, "epoch": 2053} {"train_loss": -6.258078098297119, "global_step": 86228, "epoch": 2053} {"train_loss": -6.322532653808594, "global_step": 86229, "epoch": 2053} {"train_loss": -6.277303695678711, "global_step": 86230, "epoch": 2053} {"train_loss": -6.244562149047852, "global_step": 86231, "epoch": 2053} {"train_loss": -6.289510726928711, "global_step": 86232, "epoch": 2053} {"train_loss": -6.2755656242370605, "global_step": 86233, "epoch": 2053} {"train_loss": -6.2110700607299805, "global_step": 86234, "epoch": 2053} {"train_loss": -6.12498664855957, "global_step": 86235, "epoch": 2053} {"train_loss": -6.138520240783691, "global_step": 86236, "epoch": 2053} {"train_loss": -6.210318088531494, "global_step": 86237, "epoch": 2053} {"train_loss": -6.179960250854492, "global_step": 86238, "epoch": 2053} {"train_loss": -6.17973518371582, "global_step": 86239, "epoch": 2053} {"train_loss": -6.147721290588379, "global_step": 86240, "epoch": 2053} {"train_loss": -6.256744384765625, "global_step": 86241, "epoch": 2053} {"train_loss": -6.227742671966553, "global_step": 86242, "epoch": 2053} {"train_loss": -5.996356010437012, "global_step": 86243, "epoch": 2053} {"train_loss": -6.078696250915527, "global_step": 86244, "epoch": 2053} {"train_loss": -6.257248401641846, "global_step": 86245, "epoch": 2053} {"train_loss": -6.074490547180176, "global_step": 86246, "epoch": 2053} {"train_loss": -6.192652702331543, "global_step": 86247, "epoch": 2053} {"train_loss": -6.122511863708496, "global_step": 86248, "epoch": 2053} {"train_loss": -6.197957992553711, "global_step": 86249, "epoch": 2053} {"train_loss": -6.077345848083496, "global_step": 86250, "epoch": 2053} {"train_loss": -6.187284469604492, "global_step": 86251, "epoch": 2053} {"train_loss": -6.103079795837402, "global_step": 86252, "epoch": 2053} {"train_loss": -6.0715837478637695, "global_step": 86253, "epoch": 2053} {"train_loss": -6.17539119720459, "global_step": 86254, "epoch": 2053} {"train_loss": -6.191266059875488, "global_step": 86255, "epoch": 2053} {"train_loss": -6.209600448608398, "global_step": 86256, "epoch": 2053} {"train_loss": -6.180715084075928, "global_step": 86257, "epoch": 2053} {"train_loss": -6.106518745422363, "global_step": 86258, "epoch": 2053} {"train_loss": -6.1549272537231445, "global_step": 86259, "epoch": 2053} {"train_loss": -6.30476188659668, "global_step": 86260, "epoch": 2053} {"train_loss": -6.1375885009765625, "global_step": 86261, "epoch": 2053} {"train_loss": -6.300281524658203, "global_step": 86262, "epoch": 2053} {"train_loss": -6.175939559936523, "global_step": 86263, "epoch": 2053} {"train_loss": -6.148239612579346, "global_step": 86264, "epoch": 2053} {"train_loss": -6.219751358032227, "global_step": 86265, "epoch": 2053} {"train_loss": -6.305294990539551, "global_step": 86266, "epoch": 2053} {"train_loss": -6.189948002497355, "global_step": 86267, "epoch": 2053, "val_loss": 67910.1953125} {"train_loss": -6.236907005310059, "global_step": 86268, "epoch": 2054} {"train_loss": -6.166618347167969, "global_step": 86269, "epoch": 2054} {"train_loss": -6.357891082763672, "global_step": 86270, "epoch": 2054} {"train_loss": -6.24895715713501, "global_step": 86271, "epoch": 2054} {"train_loss": -6.1407623291015625, "global_step": 86272, "epoch": 2054} {"train_loss": -6.268461227416992, "global_step": 86273, "epoch": 2054} {"train_loss": -6.125804901123047, "global_step": 86274, "epoch": 2054} {"train_loss": -6.133750915527344, "global_step": 86275, "epoch": 2054} {"train_loss": -6.188323497772217, "global_step": 86276, "epoch": 2054} {"train_loss": -6.0865020751953125, "global_step": 86277, "epoch": 2054} {"train_loss": -6.090004920959473, "global_step": 86278, "epoch": 2054} {"train_loss": -6.212288856506348, "global_step": 86279, "epoch": 2054} {"train_loss": -6.1485700607299805, "global_step": 86280, "epoch": 2054} {"train_loss": -6.159390926361084, "global_step": 86281, "epoch": 2054} {"train_loss": -6.190087795257568, "global_step": 86282, "epoch": 2054} {"train_loss": -6.284600257873535, "global_step": 86283, "epoch": 2054} {"train_loss": -6.199911117553711, "global_step": 86284, "epoch": 2054} {"train_loss": -6.175811767578125, "global_step": 86285, "epoch": 2054} {"train_loss": -6.241205215454102, "global_step": 86286, "epoch": 2054} {"train_loss": -6.249881744384766, "global_step": 86287, "epoch": 2054} {"train_loss": -6.148684501647949, "global_step": 86288, "epoch": 2054} {"train_loss": -6.142734050750732, "global_step": 86289, "epoch": 2054} {"train_loss": -6.203622817993164, "global_step": 86290, "epoch": 2054} {"train_loss": -6.2237162590026855, "global_step": 86291, "epoch": 2054} {"train_loss": -6.24675178527832, "global_step": 86292, "epoch": 2054} {"train_loss": -6.234684944152832, "global_step": 86293, "epoch": 2054} {"train_loss": -6.135972023010254, "global_step": 86294, "epoch": 2054} {"train_loss": -6.1921610832214355, "global_step": 86295, "epoch": 2054} {"train_loss": -6.108431816101074, "global_step": 86296, "epoch": 2054} {"train_loss": -6.147093296051025, "global_step": 86297, "epoch": 2054} {"train_loss": -6.188824653625488, "global_step": 86298, "epoch": 2054} {"train_loss": -6.269837856292725, "global_step": 86299, "epoch": 2054} {"train_loss": -6.179107189178467, "global_step": 86300, "epoch": 2054} {"train_loss": -6.0848822593688965, "global_step": 86301, "epoch": 2054} {"train_loss": -6.234816551208496, "global_step": 86302, "epoch": 2054} {"train_loss": -6.254003047943115, "global_step": 86303, "epoch": 2054} {"train_loss": -6.213255882263184, "global_step": 86304, "epoch": 2054} {"train_loss": -6.169144153594971, "global_step": 86305, "epoch": 2054} {"train_loss": -6.242167949676514, "global_step": 86306, "epoch": 2054} {"train_loss": -6.222904682159424, "global_step": 86307, "epoch": 2054} {"train_loss": -6.198005199432373, "global_step": 86308, "epoch": 2054} {"train_loss": -6.1911449772971014, "global_step": 86309, "epoch": 2054, "val_loss": 67782.1015625} {"train_loss": -6.132351875305176, "global_step": 86310, "epoch": 2055} {"train_loss": -6.230608940124512, "global_step": 86311, "epoch": 2055} {"train_loss": -6.221877098083496, "global_step": 86312, "epoch": 2055} {"train_loss": -6.166131019592285, "global_step": 86313, "epoch": 2055} {"train_loss": -6.268133640289307, "global_step": 86314, "epoch": 2055} {"train_loss": -6.0381011962890625, "global_step": 86315, "epoch": 2055} {"train_loss": -6.208630084991455, "global_step": 86316, "epoch": 2055} {"train_loss": -6.3104143142700195, "global_step": 86317, "epoch": 2055} {"train_loss": -6.296882152557373, "global_step": 86318, "epoch": 2055} {"train_loss": -6.160036087036133, "global_step": 86319, "epoch": 2055} {"train_loss": -6.14670991897583, "global_step": 86320, "epoch": 2055} {"train_loss": -6.243854999542236, "global_step": 86321, "epoch": 2055} {"train_loss": -6.1854047775268555, "global_step": 86322, "epoch": 2055} {"train_loss": -6.275727272033691, "global_step": 86323, "epoch": 2055} {"train_loss": -6.223343849182129, "global_step": 86324, "epoch": 2055} {"train_loss": -6.222926139831543, "global_step": 86325, "epoch": 2055} {"train_loss": -6.253905296325684, "global_step": 86326, "epoch": 2055} {"train_loss": -6.232585430145264, "global_step": 86327, "epoch": 2055} {"train_loss": -6.322293281555176, "global_step": 86328, "epoch": 2055} {"train_loss": -6.033923149108887, "global_step": 86329, "epoch": 2055} {"train_loss": -6.13970422744751, "global_step": 86330, "epoch": 2055} {"train_loss": -6.279768943786621, "global_step": 86331, "epoch": 2055} {"train_loss": -6.351345062255859, "global_step": 86332, "epoch": 2055} {"train_loss": -6.149761199951172, "global_step": 86333, "epoch": 2055} {"train_loss": -6.103331089019775, "global_step": 86334, "epoch": 2055} {"train_loss": -6.360113620758057, "global_step": 86335, "epoch": 2055} {"train_loss": -6.262381553649902, "global_step": 86336, "epoch": 2055} {"train_loss": -6.165940284729004, "global_step": 86337, "epoch": 2055} {"train_loss": -6.2993974685668945, "global_step": 86338, "epoch": 2055} {"train_loss": -6.239581108093262, "global_step": 86339, "epoch": 2055} {"train_loss": -6.231637954711914, "global_step": 86340, "epoch": 2055} {"train_loss": -6.248834609985352, "global_step": 86341, "epoch": 2055} {"train_loss": -6.235119819641113, "global_step": 86342, "epoch": 2055} {"train_loss": -6.047981262207031, "global_step": 86343, "epoch": 2055} {"train_loss": -6.254608154296875, "global_step": 86344, "epoch": 2055} {"train_loss": -6.228934288024902, "global_step": 86345, "epoch": 2055} {"train_loss": -6.301218032836914, "global_step": 86346, "epoch": 2055} {"train_loss": -6.333077430725098, "global_step": 86347, "epoch": 2055} {"train_loss": -6.2219696044921875, "global_step": 86348, "epoch": 2055} {"train_loss": -6.126887321472168, "global_step": 86349, "epoch": 2055} {"train_loss": -6.285032272338867, "global_step": 86350, "epoch": 2055} {"train_loss": -6.2188781556629, "global_step": 86351, "epoch": 2055, "val_loss": 67897.5078125} {"train_loss": -6.331820964813232, "global_step": 86352, "epoch": 2056} {"train_loss": -6.304757595062256, "global_step": 86353, "epoch": 2056} {"train_loss": -6.167867660522461, "global_step": 86354, "epoch": 2056} {"train_loss": -6.245116710662842, "global_step": 86355, "epoch": 2056} {"train_loss": -6.162506580352783, "global_step": 86356, "epoch": 2056} {"train_loss": -6.223384857177734, "global_step": 86357, "epoch": 2056} {"train_loss": -6.220783233642578, "global_step": 86358, "epoch": 2056} {"train_loss": -6.203298568725586, "global_step": 86359, "epoch": 2056} {"train_loss": -6.2688422203063965, "global_step": 86360, "epoch": 2056} {"train_loss": -6.183943271636963, "global_step": 86361, "epoch": 2056} {"train_loss": -6.016110420227051, "global_step": 86362, "epoch": 2056} {"train_loss": -6.149627685546875, "global_step": 86363, "epoch": 2056} {"train_loss": -6.174736976623535, "global_step": 86364, "epoch": 2056} {"train_loss": -6.102542877197266, "global_step": 86365, "epoch": 2056} {"train_loss": -6.16118860244751, "global_step": 86366, "epoch": 2056} {"train_loss": -6.209334373474121, "global_step": 86367, "epoch": 2056} {"train_loss": -6.123995780944824, "global_step": 86368, "epoch": 2056} {"train_loss": -6.173249244689941, "global_step": 86369, "epoch": 2056} {"train_loss": -6.006955623626709, "global_step": 86370, "epoch": 2056} {"train_loss": -6.3080902099609375, "global_step": 86371, "epoch": 2056} {"train_loss": -6.0533576011657715, "global_step": 86372, "epoch": 2056} {"train_loss": -6.169543266296387, "global_step": 86373, "epoch": 2056} {"train_loss": -6.227239608764648, "global_step": 86374, "epoch": 2056} {"train_loss": -6.082228183746338, "global_step": 86375, "epoch": 2056} {"train_loss": -6.231115818023682, "global_step": 86376, "epoch": 2056} {"train_loss": -6.163694381713867, "global_step": 86377, "epoch": 2056} {"train_loss": -6.222753047943115, "global_step": 86378, "epoch": 2056} {"train_loss": -6.171092987060547, "global_step": 86379, "epoch": 2056} {"train_loss": -6.0751214027404785, "global_step": 86380, "epoch": 2056} {"train_loss": -6.120085716247559, "global_step": 86381, "epoch": 2056} {"train_loss": -6.030948162078857, "global_step": 86382, "epoch": 2056} {"train_loss": -6.0214996337890625, "global_step": 86383, "epoch": 2056} {"train_loss": -6.162583351135254, "global_step": 86384, "epoch": 2056} {"train_loss": -6.097526550292969, "global_step": 86385, "epoch": 2056} {"train_loss": -6.209899425506592, "global_step": 86386, "epoch": 2056} {"train_loss": -6.128520965576172, "global_step": 86387, "epoch": 2056} {"train_loss": -6.142765045166016, "global_step": 86388, "epoch": 2056} {"train_loss": -6.20811653137207, "global_step": 86389, "epoch": 2056} {"train_loss": -6.156158447265625, "global_step": 86390, "epoch": 2056} {"train_loss": -6.24005126953125, "global_step": 86391, "epoch": 2056} {"train_loss": -6.24897575378418, "global_step": 86392, "epoch": 2056} {"train_loss": -6.168603806268601, "global_step": 86393, "epoch": 2056, "val_loss": 67852.1875} {"train_loss": -6.20399808883667, "global_step": 86394, "epoch": 2057} {"train_loss": -6.203878879547119, "global_step": 86395, "epoch": 2057} {"train_loss": -6.19709587097168, "global_step": 86396, "epoch": 2057} {"train_loss": -6.147344589233398, "global_step": 86397, "epoch": 2057} {"train_loss": -6.295842170715332, "global_step": 86398, "epoch": 2057} {"train_loss": -6.167720794677734, "global_step": 86399, "epoch": 2057} {"train_loss": -6.283291816711426, "global_step": 86400, "epoch": 2057} {"train_loss": -6.2101335525512695, "global_step": 86401, "epoch": 2057} {"train_loss": -6.229796409606934, "global_step": 86402, "epoch": 2057} {"train_loss": -6.224481582641602, "global_step": 86403, "epoch": 2057} {"train_loss": -6.2698869705200195, "global_step": 86404, "epoch": 2057} {"train_loss": -6.294439792633057, "global_step": 86405, "epoch": 2057} {"train_loss": -6.268665790557861, "global_step": 86406, "epoch": 2057} {"train_loss": -6.234408855438232, "global_step": 86407, "epoch": 2057} {"train_loss": -6.25916862487793, "global_step": 86408, "epoch": 2057} {"train_loss": -6.190256595611572, "global_step": 86409, "epoch": 2057} {"train_loss": -6.210781574249268, "global_step": 86410, "epoch": 2057} {"train_loss": -6.177382469177246, "global_step": 86411, "epoch": 2057} {"train_loss": -6.224860668182373, "global_step": 86412, "epoch": 2057} {"train_loss": -6.330865859985352, "global_step": 86413, "epoch": 2057} {"train_loss": -6.217615127563477, "global_step": 86414, "epoch": 2057} {"train_loss": -6.3362016677856445, "global_step": 86415, "epoch": 2057} {"train_loss": -6.222383499145508, "global_step": 86416, "epoch": 2057} {"train_loss": -6.225652694702148, "global_step": 86417, "epoch": 2057} {"train_loss": -6.155158042907715, "global_step": 86418, "epoch": 2057} {"train_loss": -6.215482234954834, "global_step": 86419, "epoch": 2057} {"train_loss": -6.267437934875488, "global_step": 86420, "epoch": 2057} {"train_loss": -6.125197410583496, "global_step": 86421, "epoch": 2057} {"train_loss": -6.27248477935791, "global_step": 86422, "epoch": 2057} {"train_loss": -6.27497673034668, "global_step": 86423, "epoch": 2057} {"train_loss": -6.14794921875, "global_step": 86424, "epoch": 2057} {"train_loss": -6.215073108673096, "global_step": 86425, "epoch": 2057} {"train_loss": -6.200778961181641, "global_step": 86426, "epoch": 2057} {"train_loss": -6.226742744445801, "global_step": 86427, "epoch": 2057} {"train_loss": -6.3506011962890625, "global_step": 86428, "epoch": 2057} {"train_loss": -6.344481945037842, "global_step": 86429, "epoch": 2057} {"train_loss": -6.312723159790039, "global_step": 86430, "epoch": 2057} {"train_loss": -6.135704040527344, "global_step": 86431, "epoch": 2057} {"train_loss": -6.147850513458252, "global_step": 86432, "epoch": 2057} {"train_loss": -6.142788887023926, "global_step": 86433, "epoch": 2057} {"train_loss": -6.187023162841797, "global_step": 86434, "epoch": 2057} {"train_loss": -6.2259284768785745, "global_step": 86435, "epoch": 2057, "val_loss": 67852.5} {"train_loss": -6.237946510314941, "global_step": 86436, "epoch": 2058} {"train_loss": -6.1863813400268555, "global_step": 86437, "epoch": 2058} {"train_loss": -5.979646682739258, "global_step": 86438, "epoch": 2058} {"train_loss": -6.177403926849365, "global_step": 86439, "epoch": 2058} {"train_loss": -6.227871894836426, "global_step": 86440, "epoch": 2058} {"train_loss": -6.249993324279785, "global_step": 86441, "epoch": 2058} {"train_loss": -6.228448867797852, "global_step": 86442, "epoch": 2058} {"train_loss": -6.263489723205566, "global_step": 86443, "epoch": 2058} {"train_loss": -6.1794233322143555, "global_step": 86444, "epoch": 2058} {"train_loss": -6.279773712158203, "global_step": 86445, "epoch": 2058} {"train_loss": -6.277033805847168, "global_step": 86446, "epoch": 2058} {"train_loss": -6.212611675262451, "global_step": 86447, "epoch": 2058} {"train_loss": -6.172548294067383, "global_step": 86448, "epoch": 2058} {"train_loss": -6.234244346618652, "global_step": 86449, "epoch": 2058} {"train_loss": -6.272849082946777, "global_step": 86450, "epoch": 2058} {"train_loss": -6.2404351234436035, "global_step": 86451, "epoch": 2058} {"train_loss": -6.04396390914917, "global_step": 86452, "epoch": 2058} {"train_loss": -6.192095756530762, "global_step": 86453, "epoch": 2058} {"train_loss": -6.096427917480469, "global_step": 86454, "epoch": 2058} {"train_loss": -6.177213191986084, "global_step": 86455, "epoch": 2058} {"train_loss": -6.133213996887207, "global_step": 86456, "epoch": 2058} {"train_loss": -6.065162658691406, "global_step": 86457, "epoch": 2058} {"train_loss": -6.031452178955078, "global_step": 86458, "epoch": 2058} {"train_loss": -6.171117305755615, "global_step": 86459, "epoch": 2058} {"train_loss": -6.1190972328186035, "global_step": 86460, "epoch": 2058} {"train_loss": -6.192417144775391, "global_step": 86461, "epoch": 2058} {"train_loss": -6.145364284515381, "global_step": 86462, "epoch": 2058} {"train_loss": -6.050039291381836, "global_step": 86463, "epoch": 2058} {"train_loss": -6.310903549194336, "global_step": 86464, "epoch": 2058} {"train_loss": -6.143732070922852, "global_step": 86465, "epoch": 2058} {"train_loss": -6.239595413208008, "global_step": 86466, "epoch": 2058} {"train_loss": -6.185011386871338, "global_step": 86467, "epoch": 2058} {"train_loss": -6.221055030822754, "global_step": 86468, "epoch": 2058} {"train_loss": -6.260810852050781, "global_step": 86469, "epoch": 2058} {"train_loss": -6.170373439788818, "global_step": 86470, "epoch": 2058} {"train_loss": -6.160434246063232, "global_step": 86471, "epoch": 2058} {"train_loss": -6.158803462982178, "global_step": 86472, "epoch": 2058} {"train_loss": -6.296450614929199, "global_step": 86473, "epoch": 2058} {"train_loss": -6.298315525054932, "global_step": 86474, "epoch": 2058} {"train_loss": -6.092024803161621, "global_step": 86475, "epoch": 2058} {"train_loss": -6.296733856201172, "global_step": 86476, "epoch": 2058} {"train_loss": -6.185354323614211, "global_step": 86477, "epoch": 2058, "val_loss": 67835.5078125} {"train_loss": -6.233512878417969, "global_step": 86478, "epoch": 2059} {"train_loss": -6.122028350830078, "global_step": 86479, "epoch": 2059} {"train_loss": -6.223734378814697, "global_step": 86480, "epoch": 2059} {"train_loss": -6.2511091232299805, "global_step": 86481, "epoch": 2059} {"train_loss": -6.130136966705322, "global_step": 86482, "epoch": 2059} {"train_loss": -6.222128868103027, "global_step": 86483, "epoch": 2059} {"train_loss": -6.225623607635498, "global_step": 86484, "epoch": 2059} {"train_loss": -6.175981044769287, "global_step": 86485, "epoch": 2059} {"train_loss": -6.1678900718688965, "global_step": 86486, "epoch": 2059} {"train_loss": -6.130046844482422, "global_step": 86487, "epoch": 2059} {"train_loss": -6.123909950256348, "global_step": 86488, "epoch": 2059} {"train_loss": -6.272860527038574, "global_step": 86489, "epoch": 2059} {"train_loss": -6.10607385635376, "global_step": 86490, "epoch": 2059} {"train_loss": -6.05002498626709, "global_step": 86491, "epoch": 2059} {"train_loss": -6.1760029792785645, "global_step": 86492, "epoch": 2059} {"train_loss": -6.1092329025268555, "global_step": 86493, "epoch": 2059} {"train_loss": -5.986039638519287, "global_step": 86494, "epoch": 2059} {"train_loss": -6.104379653930664, "global_step": 86495, "epoch": 2059} {"train_loss": -6.067561149597168, "global_step": 86496, "epoch": 2059} {"train_loss": -6.04351282119751, "global_step": 86497, "epoch": 2059} {"train_loss": -6.161748886108398, "global_step": 86498, "epoch": 2059} {"train_loss": -6.176774024963379, "global_step": 86499, "epoch": 2059} {"train_loss": -6.115525245666504, "global_step": 86500, "epoch": 2059} {"train_loss": -6.2316813468933105, "global_step": 86501, "epoch": 2059} {"train_loss": -6.102713584899902, "global_step": 86502, "epoch": 2059} {"train_loss": -6.170834064483643, "global_step": 86503, "epoch": 2059} {"train_loss": -6.259273529052734, "global_step": 86504, "epoch": 2059} {"train_loss": -6.223428726196289, "global_step": 86505, "epoch": 2059} {"train_loss": -6.16372537612915, "global_step": 86506, "epoch": 2059} {"train_loss": -6.26494026184082, "global_step": 86507, "epoch": 2059} {"train_loss": -6.167181015014648, "global_step": 86508, "epoch": 2059} {"train_loss": -6.200329780578613, "global_step": 86509, "epoch": 2059} {"train_loss": -6.064548969268799, "global_step": 86510, "epoch": 2059} {"train_loss": -6.124207019805908, "global_step": 86511, "epoch": 2059} {"train_loss": -6.145847797393799, "global_step": 86512, "epoch": 2059} {"train_loss": -6.0744218826293945, "global_step": 86513, "epoch": 2059} {"train_loss": -6.121084213256836, "global_step": 86514, "epoch": 2059} {"train_loss": -6.134537220001221, "global_step": 86515, "epoch": 2059} {"train_loss": -6.017174243927002, "global_step": 86516, "epoch": 2059} {"train_loss": -6.201075077056885, "global_step": 86517, "epoch": 2059} {"train_loss": -6.208931922912598, "global_step": 86518, "epoch": 2059} {"train_loss": -6.155158542451405, "global_step": 86519, "epoch": 2059, "val_loss": 67661.1875} {"train_loss": -6.184187412261963, "global_step": 86520, "epoch": 2060} {"train_loss": -6.121054172515869, "global_step": 86521, "epoch": 2060} {"train_loss": -6.221123218536377, "global_step": 86522, "epoch": 2060} {"train_loss": -6.220667839050293, "global_step": 86523, "epoch": 2060} {"train_loss": -6.201684474945068, "global_step": 86524, "epoch": 2060} {"train_loss": -6.167354583740234, "global_step": 86525, "epoch": 2060} {"train_loss": -6.1269330978393555, "global_step": 86526, "epoch": 2060} {"train_loss": -6.263986587524414, "global_step": 86527, "epoch": 2060} {"train_loss": -6.231602668762207, "global_step": 86528, "epoch": 2060} {"train_loss": -6.1716084480285645, "global_step": 86529, "epoch": 2060} {"train_loss": -6.246142864227295, "global_step": 86530, "epoch": 2060} {"train_loss": -6.199540138244629, "global_step": 86531, "epoch": 2060} {"train_loss": -6.11174201965332, "global_step": 86532, "epoch": 2060} {"train_loss": -6.1432037353515625, "global_step": 86533, "epoch": 2060} {"train_loss": -6.208439350128174, "global_step": 86534, "epoch": 2060} {"train_loss": -6.180633068084717, "global_step": 86535, "epoch": 2060} {"train_loss": -6.166231155395508, "global_step": 86536, "epoch": 2060} {"train_loss": -6.136473655700684, "global_step": 86537, "epoch": 2060} {"train_loss": -6.1812357902526855, "global_step": 86538, "epoch": 2060} {"train_loss": -6.316940784454346, "global_step": 86539, "epoch": 2060} {"train_loss": -6.228157043457031, "global_step": 86540, "epoch": 2060} {"train_loss": -6.260321617126465, "global_step": 86541, "epoch": 2060} {"train_loss": -6.094639778137207, "global_step": 86542, "epoch": 2060} {"train_loss": -6.266534805297852, "global_step": 86543, "epoch": 2060} {"train_loss": -6.151153564453125, "global_step": 86544, "epoch": 2060} {"train_loss": -6.232860565185547, "global_step": 86545, "epoch": 2060} {"train_loss": -6.183746337890625, "global_step": 86546, "epoch": 2060} {"train_loss": -6.161933898925781, "global_step": 86547, "epoch": 2060} {"train_loss": -6.17091703414917, "global_step": 86548, "epoch": 2060} {"train_loss": -6.210187911987305, "global_step": 86549, "epoch": 2060} {"train_loss": -6.143807411193848, "global_step": 86550, "epoch": 2060} {"train_loss": -6.312719345092773, "global_step": 86551, "epoch": 2060} {"train_loss": -6.225470542907715, "global_step": 86552, "epoch": 2060} {"train_loss": -6.198779106140137, "global_step": 86553, "epoch": 2060} {"train_loss": -6.255664825439453, "global_step": 86554, "epoch": 2060} {"train_loss": -6.361454963684082, "global_step": 86555, "epoch": 2060} {"train_loss": -6.143221378326416, "global_step": 86556, "epoch": 2060} {"train_loss": -6.339406490325928, "global_step": 86557, "epoch": 2060} {"train_loss": -6.314115524291992, "global_step": 86558, "epoch": 2060} {"train_loss": -6.351136684417725, "global_step": 86559, "epoch": 2060} {"train_loss": -6.328311920166016, "global_step": 86560, "epoch": 2060} {"train_loss": -6.213192667279925, "global_step": 86561, "epoch": 2060, "val_loss": 68007.765625} {"train_loss": -6.273755073547363, "global_step": 86562, "epoch": 2061} {"train_loss": -6.252690315246582, "global_step": 86563, "epoch": 2061} {"train_loss": -6.141904354095459, "global_step": 86564, "epoch": 2061} {"train_loss": -6.068662166595459, "global_step": 86565, "epoch": 2061} {"train_loss": -6.165709495544434, "global_step": 86566, "epoch": 2061} {"train_loss": -6.335367202758789, "global_step": 86567, "epoch": 2061} {"train_loss": -6.236695289611816, "global_step": 86568, "epoch": 2061} {"train_loss": -6.305643558502197, "global_step": 86569, "epoch": 2061} {"train_loss": -6.30499267578125, "global_step": 86570, "epoch": 2061} {"train_loss": -6.172605514526367, "global_step": 86571, "epoch": 2061} {"train_loss": -6.260125160217285, "global_step": 86572, "epoch": 2061} {"train_loss": -6.280697822570801, "global_step": 86573, "epoch": 2061} {"train_loss": -6.408520698547363, "global_step": 86574, "epoch": 2061} {"train_loss": -6.187494277954102, "global_step": 86575, "epoch": 2061} {"train_loss": -6.225161552429199, "global_step": 86576, "epoch": 2061} {"train_loss": -6.230477333068848, "global_step": 86577, "epoch": 2061} {"train_loss": -6.181130409240723, "global_step": 86578, "epoch": 2061} {"train_loss": -6.273403644561768, "global_step": 86579, "epoch": 2061} {"train_loss": -6.124791145324707, "global_step": 86580, "epoch": 2061} {"train_loss": -6.183719635009766, "global_step": 86581, "epoch": 2061} {"train_loss": -6.237477779388428, "global_step": 86582, "epoch": 2061} {"train_loss": -6.085474014282227, "global_step": 86583, "epoch": 2061} {"train_loss": -6.088858127593994, "global_step": 86584, "epoch": 2061} {"train_loss": -6.202452659606934, "global_step": 86585, "epoch": 2061} {"train_loss": -6.140810012817383, "global_step": 86586, "epoch": 2061} {"train_loss": -6.252009391784668, "global_step": 86587, "epoch": 2061} {"train_loss": -6.13419771194458, "global_step": 86588, "epoch": 2061} {"train_loss": -6.207200050354004, "global_step": 86589, "epoch": 2061} {"train_loss": -6.21741247177124, "global_step": 86590, "epoch": 2061} {"train_loss": -6.141655921936035, "global_step": 86591, "epoch": 2061} {"train_loss": -6.182437419891357, "global_step": 86592, "epoch": 2061} {"train_loss": -6.189040660858154, "global_step": 86593, "epoch": 2061} {"train_loss": -6.260209560394287, "global_step": 86594, "epoch": 2061} {"train_loss": -6.102721214294434, "global_step": 86595, "epoch": 2061} {"train_loss": -6.174276828765869, "global_step": 86596, "epoch": 2061} {"train_loss": -6.143986701965332, "global_step": 86597, "epoch": 2061} {"train_loss": -6.12285041809082, "global_step": 86598, "epoch": 2061} {"train_loss": -6.106787204742432, "global_step": 86599, "epoch": 2061} {"train_loss": -6.036457061767578, "global_step": 86600, "epoch": 2061} {"train_loss": -6.148885726928711, "global_step": 86601, "epoch": 2061} {"train_loss": -6.177350997924805, "global_step": 86602, "epoch": 2061} {"train_loss": -6.196771110807147, "global_step": 86603, "epoch": 2061, "val_loss": 67769.6484375} {"train_loss": -6.224819183349609, "global_step": 86604, "epoch": 2062} {"train_loss": -6.203958511352539, "global_step": 86605, "epoch": 2062} {"train_loss": -6.11926794052124, "global_step": 86606, "epoch": 2062} {"train_loss": -6.245421409606934, "global_step": 86607, "epoch": 2062} {"train_loss": -6.141726970672607, "global_step": 86608, "epoch": 2062} {"train_loss": -6.051627159118652, "global_step": 86609, "epoch": 2062} {"train_loss": -6.261425018310547, "global_step": 86610, "epoch": 2062} {"train_loss": -6.221334457397461, "global_step": 86611, "epoch": 2062} {"train_loss": -6.246692657470703, "global_step": 86612, "epoch": 2062} {"train_loss": -6.208745956420898, "global_step": 86613, "epoch": 2062} {"train_loss": -6.111790180206299, "global_step": 86614, "epoch": 2062} {"train_loss": -6.190625190734863, "global_step": 86615, "epoch": 2062} {"train_loss": -6.323214530944824, "global_step": 86616, "epoch": 2062} {"train_loss": -6.23500394821167, "global_step": 86617, "epoch": 2062} {"train_loss": -6.232685089111328, "global_step": 86618, "epoch": 2062} {"train_loss": -6.156647205352783, "global_step": 86619, "epoch": 2062} {"train_loss": -6.273360252380371, "global_step": 86620, "epoch": 2062} {"train_loss": -6.096745014190674, "global_step": 86621, "epoch": 2062} {"train_loss": -6.083738803863525, "global_step": 86622, "epoch": 2062} {"train_loss": -6.168525695800781, "global_step": 86623, "epoch": 2062} {"train_loss": -6.113554954528809, "global_step": 86624, "epoch": 2062} {"train_loss": -6.227357864379883, "global_step": 86625, "epoch": 2062} {"train_loss": -6.12135124206543, "global_step": 86626, "epoch": 2062} {"train_loss": -6.252931594848633, "global_step": 86627, "epoch": 2062} {"train_loss": -6.165834426879883, "global_step": 86628, "epoch": 2062} {"train_loss": -6.21103572845459, "global_step": 86629, "epoch": 2062} {"train_loss": -6.311119079589844, "global_step": 86630, "epoch": 2062} {"train_loss": -6.107951641082764, "global_step": 86631, "epoch": 2062} {"train_loss": -6.119353771209717, "global_step": 86632, "epoch": 2062} {"train_loss": -6.252810001373291, "global_step": 86633, "epoch": 2062} {"train_loss": -6.121791839599609, "global_step": 86634, "epoch": 2062} {"train_loss": -6.189476013183594, "global_step": 86635, "epoch": 2062} {"train_loss": -6.207868576049805, "global_step": 86636, "epoch": 2062} {"train_loss": -6.133721351623535, "global_step": 86637, "epoch": 2062} {"train_loss": -6.085757255554199, "global_step": 86638, "epoch": 2062} {"train_loss": -6.217616081237793, "global_step": 86639, "epoch": 2062} {"train_loss": -6.128416538238525, "global_step": 86640, "epoch": 2062} {"train_loss": -6.2106828689575195, "global_step": 86641, "epoch": 2062} {"train_loss": -6.203390598297119, "global_step": 86642, "epoch": 2062} {"train_loss": -6.2137298583984375, "global_step": 86643, "epoch": 2062} {"train_loss": -6.251744270324707, "global_step": 86644, "epoch": 2062} {"train_loss": -6.184730824970064, "global_step": 86645, "epoch": 2062, "val_loss": 67772.3984375} {"train_loss": -6.234077453613281, "global_step": 86646, "epoch": 2063} {"train_loss": -6.1615777015686035, "global_step": 86647, "epoch": 2063} {"train_loss": -6.2687668800354, "global_step": 86648, "epoch": 2063} {"train_loss": -6.182544231414795, "global_step": 86649, "epoch": 2063} {"train_loss": -6.055849075317383, "global_step": 86650, "epoch": 2063} {"train_loss": -6.136328220367432, "global_step": 86651, "epoch": 2063} {"train_loss": -6.209465503692627, "global_step": 86652, "epoch": 2063} {"train_loss": -6.04664421081543, "global_step": 86653, "epoch": 2063} {"train_loss": -6.102720260620117, "global_step": 86654, "epoch": 2063} {"train_loss": -6.252343654632568, "global_step": 86655, "epoch": 2063} {"train_loss": -6.083165168762207, "global_step": 86656, "epoch": 2063} {"train_loss": -6.16216516494751, "global_step": 86657, "epoch": 2063} {"train_loss": -6.2688212394714355, "global_step": 86658, "epoch": 2063} {"train_loss": -6.125722885131836, "global_step": 86659, "epoch": 2063} {"train_loss": -6.149138450622559, "global_step": 86660, "epoch": 2063} {"train_loss": -6.191563129425049, "global_step": 86661, "epoch": 2063} {"train_loss": -6.144437789916992, "global_step": 86662, "epoch": 2063} {"train_loss": -6.139918804168701, "global_step": 86663, "epoch": 2063} {"train_loss": -6.147485256195068, "global_step": 86664, "epoch": 2063} {"train_loss": -6.076992034912109, "global_step": 86665, "epoch": 2063} {"train_loss": -6.219839096069336, "global_step": 86666, "epoch": 2063} {"train_loss": -6.226116180419922, "global_step": 86667, "epoch": 2063} {"train_loss": -6.22150993347168, "global_step": 86668, "epoch": 2063} {"train_loss": -6.2087907791137695, "global_step": 86669, "epoch": 2063} {"train_loss": -6.206655502319336, "global_step": 86670, "epoch": 2063} {"train_loss": -6.109037399291992, "global_step": 86671, "epoch": 2063} {"train_loss": -6.197175979614258, "global_step": 86672, "epoch": 2063} {"train_loss": -6.169747352600098, "global_step": 86673, "epoch": 2063} {"train_loss": -6.294764518737793, "global_step": 86674, "epoch": 2063} {"train_loss": -6.293769836425781, "global_step": 86675, "epoch": 2063} {"train_loss": -6.17120885848999, "global_step": 86676, "epoch": 2063} {"train_loss": -6.17570686340332, "global_step": 86677, "epoch": 2063} {"train_loss": -6.303871154785156, "global_step": 86678, "epoch": 2063} {"train_loss": -6.234885215759277, "global_step": 86679, "epoch": 2063} {"train_loss": -6.179317474365234, "global_step": 86680, "epoch": 2063} {"train_loss": -6.189916610717773, "global_step": 86681, "epoch": 2063} {"train_loss": -6.218570232391357, "global_step": 86682, "epoch": 2063} {"train_loss": -6.270610332489014, "global_step": 86683, "epoch": 2063} {"train_loss": -6.169930458068848, "global_step": 86684, "epoch": 2063} {"train_loss": -6.215855598449707, "global_step": 86685, "epoch": 2063} {"train_loss": -6.2131123542785645, "global_step": 86686, "epoch": 2063} {"train_loss": -6.188219728923979, "global_step": 86687, "epoch": 2063, "val_loss": 67755.3984375} {"train_loss": -6.342597484588623, "global_step": 86688, "epoch": 2064} {"train_loss": -6.229726791381836, "global_step": 86689, "epoch": 2064} {"train_loss": -6.241695880889893, "global_step": 86690, "epoch": 2064} {"train_loss": -6.134998321533203, "global_step": 86691, "epoch": 2064} {"train_loss": -6.1647186279296875, "global_step": 86692, "epoch": 2064} {"train_loss": -6.256444454193115, "global_step": 86693, "epoch": 2064} {"train_loss": -6.133308410644531, "global_step": 86694, "epoch": 2064} {"train_loss": -6.134341239929199, "global_step": 86695, "epoch": 2064} {"train_loss": -6.22884464263916, "global_step": 86696, "epoch": 2064} {"train_loss": -6.275768756866455, "global_step": 86697, "epoch": 2064} {"train_loss": -6.270787715911865, "global_step": 86698, "epoch": 2064} {"train_loss": -6.247458457946777, "global_step": 86699, "epoch": 2064} {"train_loss": -6.276416301727295, "global_step": 86700, "epoch": 2064} {"train_loss": -6.135366916656494, "global_step": 86701, "epoch": 2064} {"train_loss": -6.144576072692871, "global_step": 86702, "epoch": 2064} {"train_loss": -6.2171220779418945, "global_step": 86703, "epoch": 2064} {"train_loss": -6.234874725341797, "global_step": 86704, "epoch": 2064} {"train_loss": -6.263192176818848, "global_step": 86705, "epoch": 2064} {"train_loss": -6.177797794342041, "global_step": 86706, "epoch": 2064} {"train_loss": -6.21196985244751, "global_step": 86707, "epoch": 2064} {"train_loss": -6.230682373046875, "global_step": 86708, "epoch": 2064} {"train_loss": -6.1069769859313965, "global_step": 86709, "epoch": 2064} {"train_loss": -6.279951095581055, "global_step": 86710, "epoch": 2064} {"train_loss": -6.143416881561279, "global_step": 86711, "epoch": 2064} {"train_loss": -6.202155590057373, "global_step": 86712, "epoch": 2064} {"train_loss": -6.216763496398926, "global_step": 86713, "epoch": 2064} {"train_loss": -6.183098316192627, "global_step": 86714, "epoch": 2064} {"train_loss": -6.233824729919434, "global_step": 86715, "epoch": 2064} {"train_loss": -6.155579566955566, "global_step": 86716, "epoch": 2064} {"train_loss": -6.210409164428711, "global_step": 86717, "epoch": 2064} {"train_loss": -6.259428024291992, "global_step": 86718, "epoch": 2064} {"train_loss": -6.109189033508301, "global_step": 86719, "epoch": 2064} {"train_loss": -6.1916632652282715, "global_step": 86720, "epoch": 2064} {"train_loss": -6.238083362579346, "global_step": 86721, "epoch": 2064} {"train_loss": -6.1669602394104, "global_step": 86722, "epoch": 2064} {"train_loss": -6.116233825683594, "global_step": 86723, "epoch": 2064} {"train_loss": -6.125675201416016, "global_step": 86724, "epoch": 2064} {"train_loss": -6.282334327697754, "global_step": 86725, "epoch": 2064} {"train_loss": -6.258581161499023, "global_step": 86726, "epoch": 2064} {"train_loss": -6.2406721115112305, "global_step": 86727, "epoch": 2064} {"train_loss": -6.258672714233398, "global_step": 86728, "epoch": 2064} {"train_loss": -6.208208401997884, "global_step": 86729, "epoch": 2064, "val_loss": 67702.1875} {"train_loss": -6.121406078338623, "global_step": 86730, "epoch": 2065} {"train_loss": -6.16678524017334, "global_step": 86731, "epoch": 2065} {"train_loss": -6.250097274780273, "global_step": 86732, "epoch": 2065} {"train_loss": -6.231476783752441, "global_step": 86733, "epoch": 2065} {"train_loss": -6.172593593597412, "global_step": 86734, "epoch": 2065} {"train_loss": -6.317357063293457, "global_step": 86735, "epoch": 2065} {"train_loss": -6.089127063751221, "global_step": 86736, "epoch": 2065} {"train_loss": -6.261462688446045, "global_step": 86737, "epoch": 2065} {"train_loss": -6.258809566497803, "global_step": 86738, "epoch": 2065} {"train_loss": -6.185513496398926, "global_step": 86739, "epoch": 2065} {"train_loss": -6.283656120300293, "global_step": 86740, "epoch": 2065} {"train_loss": -6.213597297668457, "global_step": 86741, "epoch": 2065} {"train_loss": -6.204146862030029, "global_step": 86742, "epoch": 2065} {"train_loss": -6.174898624420166, "global_step": 86743, "epoch": 2065} {"train_loss": -6.145697593688965, "global_step": 86744, "epoch": 2065} {"train_loss": -6.120342254638672, "global_step": 86745, "epoch": 2065} {"train_loss": -6.301469802856445, "global_step": 86746, "epoch": 2065} {"train_loss": -6.118386268615723, "global_step": 86747, "epoch": 2065} {"train_loss": -6.201046943664551, "global_step": 86748, "epoch": 2065} {"train_loss": -6.180699348449707, "global_step": 86749, "epoch": 2065} {"train_loss": -6.217192649841309, "global_step": 86750, "epoch": 2065} {"train_loss": -6.132499694824219, "global_step": 86751, "epoch": 2065} {"train_loss": -6.093107223510742, "global_step": 86752, "epoch": 2065} {"train_loss": -6.294114112854004, "global_step": 86753, "epoch": 2065} {"train_loss": -6.155218124389648, "global_step": 86754, "epoch": 2065} {"train_loss": -6.175360679626465, "global_step": 86755, "epoch": 2065} {"train_loss": -6.1688456535339355, "global_step": 86756, "epoch": 2065} {"train_loss": -6.141976356506348, "global_step": 86757, "epoch": 2065} {"train_loss": -6.165022850036621, "global_step": 86758, "epoch": 2065} {"train_loss": -6.149202346801758, "global_step": 86759, "epoch": 2065} {"train_loss": -6.229236602783203, "global_step": 86760, "epoch": 2065} {"train_loss": -6.272675514221191, "global_step": 86761, "epoch": 2065} {"train_loss": -6.202930450439453, "global_step": 86762, "epoch": 2065} {"train_loss": -6.236968517303467, "global_step": 86763, "epoch": 2065} {"train_loss": -6.208934783935547, "global_step": 86764, "epoch": 2065} {"train_loss": -6.17685604095459, "global_step": 86765, "epoch": 2065} {"train_loss": -6.24316930770874, "global_step": 86766, "epoch": 2065} {"train_loss": -6.249626159667969, "global_step": 86767, "epoch": 2065} {"train_loss": -6.213040828704834, "global_step": 86768, "epoch": 2065} {"train_loss": -6.290254592895508, "global_step": 86769, "epoch": 2065} {"train_loss": -6.233012676239014, "global_step": 86770, "epoch": 2065} {"train_loss": -6.20523662794204, "global_step": 86771, "epoch": 2065, "val_loss": 67833.0625} {"train_loss": -6.263566017150879, "global_step": 86772, "epoch": 2066} {"train_loss": -6.171026229858398, "global_step": 86773, "epoch": 2066} {"train_loss": -6.347761154174805, "global_step": 86774, "epoch": 2066} {"train_loss": -6.294291019439697, "global_step": 86775, "epoch": 2066} {"train_loss": -6.1257500648498535, "global_step": 86776, "epoch": 2066} {"train_loss": -6.20710563659668, "global_step": 86777, "epoch": 2066} {"train_loss": -6.208351135253906, "global_step": 86778, "epoch": 2066} {"train_loss": -6.213665962219238, "global_step": 86779, "epoch": 2066} {"train_loss": -6.020961761474609, "global_step": 86780, "epoch": 2066} {"train_loss": -6.209860801696777, "global_step": 86781, "epoch": 2066} {"train_loss": -6.214860916137695, "global_step": 86782, "epoch": 2066} {"train_loss": -6.247496128082275, "global_step": 86783, "epoch": 2066} {"train_loss": -6.200555801391602, "global_step": 86784, "epoch": 2066} {"train_loss": -6.128129005432129, "global_step": 86785, "epoch": 2066} {"train_loss": -6.1808552742004395, "global_step": 86786, "epoch": 2066} {"train_loss": -6.245741844177246, "global_step": 86787, "epoch": 2066} {"train_loss": -6.114203929901123, "global_step": 86788, "epoch": 2066} {"train_loss": -6.0559282302856445, "global_step": 86789, "epoch": 2066} {"train_loss": -6.196542263031006, "global_step": 86790, "epoch": 2066} {"train_loss": -6.127259731292725, "global_step": 86791, "epoch": 2066} {"train_loss": -6.112250804901123, "global_step": 86792, "epoch": 2066} {"train_loss": -6.229286193847656, "global_step": 86793, "epoch": 2066} {"train_loss": -6.045510292053223, "global_step": 86794, "epoch": 2066} {"train_loss": -6.132570266723633, "global_step": 86795, "epoch": 2066} {"train_loss": -6.16698694229126, "global_step": 86796, "epoch": 2066} {"train_loss": -6.10588264465332, "global_step": 86797, "epoch": 2066} {"train_loss": -6.222067832946777, "global_step": 86798, "epoch": 2066} {"train_loss": -6.037668228149414, "global_step": 86799, "epoch": 2066} {"train_loss": -6.067796230316162, "global_step": 86800, "epoch": 2066} {"train_loss": -6.206977844238281, "global_step": 86801, "epoch": 2066} {"train_loss": -6.2240495681762695, "global_step": 86802, "epoch": 2066} {"train_loss": -6.221611976623535, "global_step": 86803, "epoch": 2066} {"train_loss": -6.168895244598389, "global_step": 86804, "epoch": 2066} {"train_loss": -6.181645393371582, "global_step": 86805, "epoch": 2066} {"train_loss": -6.258832931518555, "global_step": 86806, "epoch": 2066} {"train_loss": -6.095895767211914, "global_step": 86807, "epoch": 2066} {"train_loss": -6.056617736816406, "global_step": 86808, "epoch": 2066} {"train_loss": -6.19671630859375, "global_step": 86809, "epoch": 2066} {"train_loss": -6.104274749755859, "global_step": 86810, "epoch": 2066} {"train_loss": -6.2475457191467285, "global_step": 86811, "epoch": 2066} {"train_loss": -6.0901265144348145, "global_step": 86812, "epoch": 2066} {"train_loss": -6.17068760735648, "global_step": 86813, "epoch": 2066, "val_loss": 67942.9140625} {"train_loss": -6.18967866897583, "global_step": 86814, "epoch": 2067} {"train_loss": -6.239117622375488, "global_step": 86815, "epoch": 2067} {"train_loss": -6.167752265930176, "global_step": 86816, "epoch": 2067} {"train_loss": -6.173104286193848, "global_step": 86817, "epoch": 2067} {"train_loss": -6.23778772354126, "global_step": 86818, "epoch": 2067} {"train_loss": -6.272708892822266, "global_step": 86819, "epoch": 2067} {"train_loss": -6.251899242401123, "global_step": 86820, "epoch": 2067} {"train_loss": -6.269783973693848, "global_step": 86821, "epoch": 2067} {"train_loss": -6.248908519744873, "global_step": 86822, "epoch": 2067} {"train_loss": -6.316747188568115, "global_step": 86823, "epoch": 2067} {"train_loss": -6.156518936157227, "global_step": 86824, "epoch": 2067} {"train_loss": -6.292131423950195, "global_step": 86825, "epoch": 2067} {"train_loss": -6.204659938812256, "global_step": 86826, "epoch": 2067} {"train_loss": -6.17142391204834, "global_step": 86827, "epoch": 2067} {"train_loss": -6.189063549041748, "global_step": 86828, "epoch": 2067} {"train_loss": -6.153259754180908, "global_step": 86829, "epoch": 2067} {"train_loss": -6.289080619812012, "global_step": 86830, "epoch": 2067} {"train_loss": -6.150221824645996, "global_step": 86831, "epoch": 2067} {"train_loss": -6.237213134765625, "global_step": 86832, "epoch": 2067} {"train_loss": -6.218545913696289, "global_step": 86833, "epoch": 2067} {"train_loss": -6.151577949523926, "global_step": 86834, "epoch": 2067} {"train_loss": -6.192339897155762, "global_step": 86835, "epoch": 2067} {"train_loss": -6.13806676864624, "global_step": 86836, "epoch": 2067} {"train_loss": -6.260995864868164, "global_step": 86837, "epoch": 2067} {"train_loss": -6.117549896240234, "global_step": 86838, "epoch": 2067} {"train_loss": -6.07081413269043, "global_step": 86839, "epoch": 2067} {"train_loss": -6.206316947937012, "global_step": 86840, "epoch": 2067} {"train_loss": -6.1727447509765625, "global_step": 86841, "epoch": 2067} {"train_loss": -6.169315338134766, "global_step": 86842, "epoch": 2067} {"train_loss": -6.234823703765869, "global_step": 86843, "epoch": 2067} {"train_loss": -6.222647190093994, "global_step": 86844, "epoch": 2067} {"train_loss": -6.174184799194336, "global_step": 86845, "epoch": 2067} {"train_loss": -6.153682231903076, "global_step": 86846, "epoch": 2067} {"train_loss": -6.20994758605957, "global_step": 86847, "epoch": 2067} {"train_loss": -6.188407897949219, "global_step": 86848, "epoch": 2067} {"train_loss": -6.380220413208008, "global_step": 86849, "epoch": 2067} {"train_loss": -6.183432579040527, "global_step": 86850, "epoch": 2067} {"train_loss": -6.08448600769043, "global_step": 86851, "epoch": 2067} {"train_loss": -6.185678005218506, "global_step": 86852, "epoch": 2067} {"train_loss": -6.183523178100586, "global_step": 86853, "epoch": 2067} {"train_loss": -6.301209449768066, "global_step": 86854, "epoch": 2067} {"train_loss": -6.210219996316092, "global_step": 86855, "epoch": 2067, "val_loss": 67790.6015625} {"train_loss": -6.227752685546875, "global_step": 86856, "epoch": 2068} {"train_loss": -6.2648210525512695, "global_step": 86857, "epoch": 2068} {"train_loss": -6.18521785736084, "global_step": 86858, "epoch": 2068} {"train_loss": -6.124913692474365, "global_step": 86859, "epoch": 2068} {"train_loss": -6.138801574707031, "global_step": 86860, "epoch": 2068} {"train_loss": -6.1454925537109375, "global_step": 86861, "epoch": 2068} {"train_loss": -6.197779655456543, "global_step": 86862, "epoch": 2068} {"train_loss": -6.247315406799316, "global_step": 86863, "epoch": 2068} {"train_loss": -6.157854080200195, "global_step": 86864, "epoch": 2068} {"train_loss": -6.180540084838867, "global_step": 86865, "epoch": 2068} {"train_loss": -6.215524673461914, "global_step": 86866, "epoch": 2068} {"train_loss": -6.173677444458008, "global_step": 86867, "epoch": 2068} {"train_loss": -6.278678894042969, "global_step": 86868, "epoch": 2068} {"train_loss": -6.329505920410156, "global_step": 86869, "epoch": 2068} {"train_loss": -6.133854866027832, "global_step": 86870, "epoch": 2068} {"train_loss": -6.283926010131836, "global_step": 86871, "epoch": 2068} {"train_loss": -6.199008941650391, "global_step": 86872, "epoch": 2068} {"train_loss": -6.137726783752441, "global_step": 86873, "epoch": 2068} {"train_loss": -6.331699371337891, "global_step": 86874, "epoch": 2068} {"train_loss": -6.255692481994629, "global_step": 86875, "epoch": 2068} {"train_loss": -6.078056335449219, "global_step": 86876, "epoch": 2068} {"train_loss": -6.269139766693115, "global_step": 86877, "epoch": 2068} {"train_loss": -6.081485748291016, "global_step": 86878, "epoch": 2068} {"train_loss": -6.213421821594238, "global_step": 86879, "epoch": 2068} {"train_loss": -6.321555137634277, "global_step": 86880, "epoch": 2068} {"train_loss": -6.279738426208496, "global_step": 86881, "epoch": 2068} {"train_loss": -6.2497687339782715, "global_step": 86882, "epoch": 2068} {"train_loss": -6.230405807495117, "global_step": 86883, "epoch": 2068} {"train_loss": -6.3371477127075195, "global_step": 86884, "epoch": 2068} {"train_loss": -6.287228584289551, "global_step": 86885, "epoch": 2068} {"train_loss": -6.181387901306152, "global_step": 86886, "epoch": 2068} {"train_loss": -6.238905906677246, "global_step": 86887, "epoch": 2068} {"train_loss": -6.227776050567627, "global_step": 86888, "epoch": 2068} {"train_loss": -6.198643684387207, "global_step": 86889, "epoch": 2068} {"train_loss": -6.233935356140137, "global_step": 86890, "epoch": 2068} {"train_loss": -6.223161697387695, "global_step": 86891, "epoch": 2068} {"train_loss": -6.2542524337768555, "global_step": 86892, "epoch": 2068} {"train_loss": -6.331404685974121, "global_step": 86893, "epoch": 2068} {"train_loss": -6.187901496887207, "global_step": 86894, "epoch": 2068} {"train_loss": -6.177171230316162, "global_step": 86895, "epoch": 2068} {"train_loss": -6.1552839279174805, "global_step": 86896, "epoch": 2068} {"train_loss": -6.220603261675153, "global_step": 86897, "epoch": 2068, "val_loss": 67794.484375} {"train_loss": -6.10910177230835, "global_step": 86898, "epoch": 2069} {"train_loss": -6.15291690826416, "global_step": 86899, "epoch": 2069} {"train_loss": -6.098121643066406, "global_step": 86900, "epoch": 2069} {"train_loss": -6.225207328796387, "global_step": 86901, "epoch": 2069} {"train_loss": -6.199186325073242, "global_step": 86902, "epoch": 2069} {"train_loss": -6.307320594787598, "global_step": 86903, "epoch": 2069} {"train_loss": -6.196681976318359, "global_step": 86904, "epoch": 2069} {"train_loss": -6.103503704071045, "global_step": 86905, "epoch": 2069} {"train_loss": -6.198264122009277, "global_step": 86906, "epoch": 2069} {"train_loss": -6.248856544494629, "global_step": 86907, "epoch": 2069} {"train_loss": -6.259284019470215, "global_step": 86908, "epoch": 2069} {"train_loss": -6.14141321182251, "global_step": 86909, "epoch": 2069} {"train_loss": -6.299729347229004, "global_step": 86910, "epoch": 2069} {"train_loss": -6.372123718261719, "global_step": 86911, "epoch": 2069} {"train_loss": -6.314436435699463, "global_step": 86912, "epoch": 2069} {"train_loss": -6.151357650756836, "global_step": 86913, "epoch": 2069} {"train_loss": -6.16879415512085, "global_step": 86914, "epoch": 2069} {"train_loss": -6.197569847106934, "global_step": 86915, "epoch": 2069} {"train_loss": -6.228172779083252, "global_step": 86916, "epoch": 2069} {"train_loss": -6.260605812072754, "global_step": 86917, "epoch": 2069} {"train_loss": -6.155107498168945, "global_step": 86918, "epoch": 2069} {"train_loss": -6.228096008300781, "global_step": 86919, "epoch": 2069} {"train_loss": -6.2197980880737305, "global_step": 86920, "epoch": 2069} {"train_loss": -6.239535331726074, "global_step": 86921, "epoch": 2069} {"train_loss": -6.156556129455566, "global_step": 86922, "epoch": 2069} {"train_loss": -6.20414400100708, "global_step": 86923, "epoch": 2069} {"train_loss": -6.133408546447754, "global_step": 86924, "epoch": 2069} {"train_loss": -6.216004371643066, "global_step": 86925, "epoch": 2069} {"train_loss": -6.310476303100586, "global_step": 86926, "epoch": 2069} {"train_loss": -6.176030158996582, "global_step": 86927, "epoch": 2069} {"train_loss": -6.178245544433594, "global_step": 86928, "epoch": 2069} {"train_loss": -6.310216903686523, "global_step": 86929, "epoch": 2069} {"train_loss": -6.157012939453125, "global_step": 86930, "epoch": 2069} {"train_loss": -6.242218971252441, "global_step": 86931, "epoch": 2069} {"train_loss": -6.157463550567627, "global_step": 86932, "epoch": 2069} {"train_loss": -6.128558158874512, "global_step": 86933, "epoch": 2069} {"train_loss": -6.248844146728516, "global_step": 86934, "epoch": 2069} {"train_loss": -6.192827224731445, "global_step": 86935, "epoch": 2069} {"train_loss": -6.1399383544921875, "global_step": 86936, "epoch": 2069} {"train_loss": -6.095659255981445, "global_step": 86937, "epoch": 2069} {"train_loss": -6.126988887786865, "global_step": 86938, "epoch": 2069} {"train_loss": -6.200175364812215, "global_step": 86939, "epoch": 2069, "val_loss": 67881.28125} {"train_loss": -6.214140892028809, "global_step": 86940, "epoch": 2070} {"train_loss": -6.200675964355469, "global_step": 86941, "epoch": 2070} {"train_loss": -6.255524635314941, "global_step": 86942, "epoch": 2070} {"train_loss": -6.135098457336426, "global_step": 86943, "epoch": 2070} {"train_loss": -6.293456554412842, "global_step": 86944, "epoch": 2070} {"train_loss": -6.241086006164551, "global_step": 86945, "epoch": 2070} {"train_loss": -6.1366682052612305, "global_step": 86946, "epoch": 2070} {"train_loss": -6.227359771728516, "global_step": 86947, "epoch": 2070} {"train_loss": -6.225419998168945, "global_step": 86948, "epoch": 2070} {"train_loss": -6.192880630493164, "global_step": 86949, "epoch": 2070} {"train_loss": -6.324581623077393, "global_step": 86950, "epoch": 2070} {"train_loss": -6.13134241104126, "global_step": 86951, "epoch": 2070} {"train_loss": -6.196828842163086, "global_step": 86952, "epoch": 2070} {"train_loss": -6.142891883850098, "global_step": 86953, "epoch": 2070} {"train_loss": -6.19268798828125, "global_step": 86954, "epoch": 2070} {"train_loss": -6.206005573272705, "global_step": 86955, "epoch": 2070} {"train_loss": -6.10080623626709, "global_step": 86956, "epoch": 2070} {"train_loss": -6.20610237121582, "global_step": 86957, "epoch": 2070} {"train_loss": -6.246490001678467, "global_step": 86958, "epoch": 2070} {"train_loss": -6.193324089050293, "global_step": 86959, "epoch": 2070} {"train_loss": -6.175032138824463, "global_step": 86960, "epoch": 2070} {"train_loss": -6.193914890289307, "global_step": 86961, "epoch": 2070} {"train_loss": -6.172277450561523, "global_step": 86962, "epoch": 2070} {"train_loss": -6.229067325592041, "global_step": 86963, "epoch": 2070} {"train_loss": -6.153249740600586, "global_step": 86964, "epoch": 2070} {"train_loss": -6.218411445617676, "global_step": 86965, "epoch": 2070} {"train_loss": -6.1473846435546875, "global_step": 86966, "epoch": 2070} {"train_loss": -6.2396721839904785, "global_step": 86967, "epoch": 2070} {"train_loss": -6.156680107116699, "global_step": 86968, "epoch": 2070} {"train_loss": -6.124391555786133, "global_step": 86969, "epoch": 2070} {"train_loss": -6.224116325378418, "global_step": 86970, "epoch": 2070} {"train_loss": -6.057119369506836, "global_step": 86971, "epoch": 2070} {"train_loss": -6.1378889083862305, "global_step": 86972, "epoch": 2070} {"train_loss": -6.19200325012207, "global_step": 86973, "epoch": 2070} {"train_loss": -6.1389312744140625, "global_step": 86974, "epoch": 2070} {"train_loss": -6.28520393371582, "global_step": 86975, "epoch": 2070} {"train_loss": -6.23597526550293, "global_step": 86976, "epoch": 2070} {"train_loss": -6.321846961975098, "global_step": 86977, "epoch": 2070} {"train_loss": -6.219944000244141, "global_step": 86978, "epoch": 2070} {"train_loss": -6.23417329788208, "global_step": 86979, "epoch": 2070} {"train_loss": -6.227823257446289, "global_step": 86980, "epoch": 2070} {"train_loss": -6.199198915844872, "global_step": 86981, "epoch": 2070, "val_loss": 67735.3046875} {"train_loss": -6.104903697967529, "global_step": 86982, "epoch": 2071} {"train_loss": -6.256672382354736, "global_step": 86983, "epoch": 2071} {"train_loss": -6.231420516967773, "global_step": 86984, "epoch": 2071} {"train_loss": -6.2225542068481445, "global_step": 86985, "epoch": 2071} {"train_loss": -6.285249710083008, "global_step": 86986, "epoch": 2071} {"train_loss": -6.137060165405273, "global_step": 86987, "epoch": 2071} {"train_loss": -6.243097305297852, "global_step": 86988, "epoch": 2071} {"train_loss": -6.311954498291016, "global_step": 86989, "epoch": 2071} {"train_loss": -6.267580986022949, "global_step": 86990, "epoch": 2071} {"train_loss": -6.296503067016602, "global_step": 86991, "epoch": 2071} {"train_loss": -6.23440408706665, "global_step": 86992, "epoch": 2071} {"train_loss": -6.340246677398682, "global_step": 86993, "epoch": 2071} {"train_loss": -6.189083576202393, "global_step": 86994, "epoch": 2071} {"train_loss": -6.282540321350098, "global_step": 86995, "epoch": 2071} {"train_loss": -6.0984954833984375, "global_step": 86996, "epoch": 2071} {"train_loss": -6.188709259033203, "global_step": 86997, "epoch": 2071} {"train_loss": -6.142977237701416, "global_step": 86998, "epoch": 2071} {"train_loss": -6.1569318771362305, "global_step": 86999, "epoch": 2071} {"train_loss": -6.1764984130859375, "global_step": 87000, "epoch": 2071} {"train_loss": -6.046004295349121, "global_step": 87001, "epoch": 2071} {"train_loss": -6.190468788146973, "global_step": 87002, "epoch": 2071} {"train_loss": -6.129506587982178, "global_step": 87003, "epoch": 2071} {"train_loss": -6.106473922729492, "global_step": 87004, "epoch": 2071} {"train_loss": -6.295358657836914, "global_step": 87005, "epoch": 2071} {"train_loss": -6.143196105957031, "global_step": 87006, "epoch": 2071} {"train_loss": -6.136753082275391, "global_step": 87007, "epoch": 2071} {"train_loss": -6.0876007080078125, "global_step": 87008, "epoch": 2071} {"train_loss": -6.345578670501709, "global_step": 87009, "epoch": 2071} {"train_loss": -6.262564659118652, "global_step": 87010, "epoch": 2071} {"train_loss": -6.214688301086426, "global_step": 87011, "epoch": 2071} {"train_loss": -6.109805107116699, "global_step": 87012, "epoch": 2071} {"train_loss": -6.236024856567383, "global_step": 87013, "epoch": 2071} {"train_loss": -6.110971450805664, "global_step": 87014, "epoch": 2071} {"train_loss": -6.215795993804932, "global_step": 87015, "epoch": 2071} {"train_loss": -6.204745292663574, "global_step": 87016, "epoch": 2071} {"train_loss": -6.274121284484863, "global_step": 87017, "epoch": 2071} {"train_loss": -6.216183662414551, "global_step": 87018, "epoch": 2071} {"train_loss": -6.245217323303223, "global_step": 87019, "epoch": 2071} {"train_loss": -6.2069501876831055, "global_step": 87020, "epoch": 2071} {"train_loss": -6.203190803527832, "global_step": 87021, "epoch": 2071} {"train_loss": -6.29688024520874, "global_step": 87022, "epoch": 2071} {"train_loss": -6.207591329302106, "global_step": 87023, "epoch": 2071, "val_loss": 68060.0390625} {"train_loss": -6.236490249633789, "global_step": 87024, "epoch": 2072} {"train_loss": -6.20742130279541, "global_step": 87025, "epoch": 2072} {"train_loss": -6.234086990356445, "global_step": 87026, "epoch": 2072} {"train_loss": -6.146825313568115, "global_step": 87027, "epoch": 2072} {"train_loss": -6.202032089233398, "global_step": 87028, "epoch": 2072} {"train_loss": -6.206000328063965, "global_step": 87029, "epoch": 2072} {"train_loss": -6.081691265106201, "global_step": 87030, "epoch": 2072} {"train_loss": -6.131595611572266, "global_step": 87031, "epoch": 2072} {"train_loss": -6.265697956085205, "global_step": 87032, "epoch": 2072} {"train_loss": -6.079478740692139, "global_step": 87033, "epoch": 2072} {"train_loss": -6.1986918449401855, "global_step": 87034, "epoch": 2072} {"train_loss": -6.173816680908203, "global_step": 87035, "epoch": 2072} {"train_loss": -6.122757434844971, "global_step": 87036, "epoch": 2072} {"train_loss": -6.272246837615967, "global_step": 87037, "epoch": 2072} {"train_loss": -6.094823360443115, "global_step": 87038, "epoch": 2072} {"train_loss": -6.135408401489258, "global_step": 87039, "epoch": 2072} {"train_loss": -6.144118785858154, "global_step": 87040, "epoch": 2072} {"train_loss": -6.135295391082764, "global_step": 87041, "epoch": 2072} {"train_loss": -6.065840244293213, "global_step": 87042, "epoch": 2072} {"train_loss": -6.000071048736572, "global_step": 87043, "epoch": 2072} {"train_loss": -6.235064506530762, "global_step": 87044, "epoch": 2072} {"train_loss": -6.1913909912109375, "global_step": 87045, "epoch": 2072} {"train_loss": -5.9974894523620605, "global_step": 87046, "epoch": 2072} {"train_loss": -6.133794784545898, "global_step": 87047, "epoch": 2072} {"train_loss": -6.218331336975098, "global_step": 87048, "epoch": 2072} {"train_loss": -6.284285545349121, "global_step": 87049, "epoch": 2072} {"train_loss": -6.189053535461426, "global_step": 87050, "epoch": 2072} {"train_loss": -6.132835388183594, "global_step": 87051, "epoch": 2072} {"train_loss": -6.128322601318359, "global_step": 87052, "epoch": 2072} {"train_loss": -6.24635124206543, "global_step": 87053, "epoch": 2072} {"train_loss": -6.14365291595459, "global_step": 87054, "epoch": 2072} {"train_loss": -6.189427375793457, "global_step": 87055, "epoch": 2072} {"train_loss": -6.218006134033203, "global_step": 87056, "epoch": 2072} {"train_loss": -6.256204605102539, "global_step": 87057, "epoch": 2072} {"train_loss": -6.175615310668945, "global_step": 87058, "epoch": 2072} {"train_loss": -6.0832929611206055, "global_step": 87059, "epoch": 2072} {"train_loss": -6.079925537109375, "global_step": 87060, "epoch": 2072} {"train_loss": -6.182190895080566, "global_step": 87061, "epoch": 2072} {"train_loss": -6.167266368865967, "global_step": 87062, "epoch": 2072} {"train_loss": -6.233001708984375, "global_step": 87063, "epoch": 2072} {"train_loss": -6.11898136138916, "global_step": 87064, "epoch": 2072} {"train_loss": -6.164165599005563, "global_step": 87065, "epoch": 2072, "val_loss": 67745.53125} {"train_loss": -6.176928520202637, "global_step": 87066, "epoch": 2073} {"train_loss": -6.099872589111328, "global_step": 87067, "epoch": 2073} {"train_loss": -6.191643714904785, "global_step": 87068, "epoch": 2073} {"train_loss": -6.221068382263184, "global_step": 87069, "epoch": 2073} {"train_loss": -6.165916442871094, "global_step": 87070, "epoch": 2073} {"train_loss": -6.2059736251831055, "global_step": 87071, "epoch": 2073} {"train_loss": -6.344676971435547, "global_step": 87072, "epoch": 2073} {"train_loss": -6.147336959838867, "global_step": 87073, "epoch": 2073} {"train_loss": -6.219708442687988, "global_step": 87074, "epoch": 2073} {"train_loss": -6.245966911315918, "global_step": 87075, "epoch": 2073} {"train_loss": -6.195130348205566, "global_step": 87076, "epoch": 2073} {"train_loss": -6.2233452796936035, "global_step": 87077, "epoch": 2073} {"train_loss": -6.205739974975586, "global_step": 87078, "epoch": 2073} {"train_loss": -6.248810768127441, "global_step": 87079, "epoch": 2073} {"train_loss": -6.153762340545654, "global_step": 87080, "epoch": 2073} {"train_loss": -6.175426483154297, "global_step": 87081, "epoch": 2073} {"train_loss": -6.290487766265869, "global_step": 87082, "epoch": 2073} {"train_loss": -6.05080509185791, "global_step": 87083, "epoch": 2073} {"train_loss": -6.094314098358154, "global_step": 87084, "epoch": 2073} {"train_loss": -6.327207565307617, "global_step": 87085, "epoch": 2073} {"train_loss": -6.273858070373535, "global_step": 87086, "epoch": 2073} {"train_loss": -6.239194393157959, "global_step": 87087, "epoch": 2073} {"train_loss": -6.117649078369141, "global_step": 87088, "epoch": 2073} {"train_loss": -6.040698528289795, "global_step": 87089, "epoch": 2073} {"train_loss": -6.128654479980469, "global_step": 87090, "epoch": 2073} {"train_loss": -6.074509620666504, "global_step": 87091, "epoch": 2073} {"train_loss": -6.071334362030029, "global_step": 87092, "epoch": 2073} {"train_loss": -6.0734453201293945, "global_step": 87093, "epoch": 2073} {"train_loss": -6.049465179443359, "global_step": 87094, "epoch": 2073} {"train_loss": -6.064483642578125, "global_step": 87095, "epoch": 2073} {"train_loss": -5.9940948486328125, "global_step": 87096, "epoch": 2073} {"train_loss": -6.110745429992676, "global_step": 87097, "epoch": 2073} {"train_loss": -6.045784950256348, "global_step": 87098, "epoch": 2073} {"train_loss": -6.219794273376465, "global_step": 87099, "epoch": 2073} {"train_loss": -6.2301716804504395, "global_step": 87100, "epoch": 2073} {"train_loss": -6.133597373962402, "global_step": 87101, "epoch": 2073} {"train_loss": -5.905544757843018, "global_step": 87102, "epoch": 2073} {"train_loss": -6.006373405456543, "global_step": 87103, "epoch": 2073} {"train_loss": -5.992025375366211, "global_step": 87104, "epoch": 2073} {"train_loss": -6.142851829528809, "global_step": 87105, "epoch": 2073} {"train_loss": -6.247907638549805, "global_step": 87106, "epoch": 2073} {"train_loss": -6.150025254204159, "global_step": 87107, "epoch": 2073, "val_loss": 68006.875} {"train_loss": -6.136203765869141, "global_step": 87108, "epoch": 2074} {"train_loss": -6.1117472648620605, "global_step": 87109, "epoch": 2074} {"train_loss": -6.065899848937988, "global_step": 87110, "epoch": 2074} {"train_loss": -6.07275390625, "global_step": 87111, "epoch": 2074} {"train_loss": -6.215963363647461, "global_step": 87112, "epoch": 2074} {"train_loss": -6.135885715484619, "global_step": 87113, "epoch": 2074} {"train_loss": -6.308723449707031, "global_step": 87114, "epoch": 2074} {"train_loss": -6.1800079345703125, "global_step": 87115, "epoch": 2074} {"train_loss": -6.216168403625488, "global_step": 87116, "epoch": 2074} {"train_loss": -6.136617660522461, "global_step": 87117, "epoch": 2074} {"train_loss": -6.243222236633301, "global_step": 87118, "epoch": 2074} {"train_loss": -6.202897548675537, "global_step": 87119, "epoch": 2074} {"train_loss": -6.113330841064453, "global_step": 87120, "epoch": 2074} {"train_loss": -6.132791042327881, "global_step": 87121, "epoch": 2074} {"train_loss": -6.137242317199707, "global_step": 87122, "epoch": 2074} {"train_loss": -6.141182899475098, "global_step": 87123, "epoch": 2074} {"train_loss": -6.013916015625, "global_step": 87124, "epoch": 2074} {"train_loss": -6.250105381011963, "global_step": 87125, "epoch": 2074} {"train_loss": -6.196701526641846, "global_step": 87126, "epoch": 2074} {"train_loss": -5.978033542633057, "global_step": 87127, "epoch": 2074} {"train_loss": -6.2794036865234375, "global_step": 87128, "epoch": 2074} {"train_loss": -6.172056198120117, "global_step": 87129, "epoch": 2074} {"train_loss": -6.097899436950684, "global_step": 87130, "epoch": 2074} {"train_loss": -6.085461139678955, "global_step": 87131, "epoch": 2074} {"train_loss": -6.088984966278076, "global_step": 87132, "epoch": 2074} {"train_loss": -6.235712051391602, "global_step": 87133, "epoch": 2074} {"train_loss": -6.36041259765625, "global_step": 87134, "epoch": 2074} {"train_loss": -6.181192398071289, "global_step": 87135, "epoch": 2074} {"train_loss": -6.13353967666626, "global_step": 87136, "epoch": 2074} {"train_loss": -6.191666603088379, "global_step": 87137, "epoch": 2074} {"train_loss": -6.142077922821045, "global_step": 87138, "epoch": 2074} {"train_loss": -6.18812370300293, "global_step": 87139, "epoch": 2074} {"train_loss": -6.110466003417969, "global_step": 87140, "epoch": 2074} {"train_loss": -6.325706958770752, "global_step": 87141, "epoch": 2074} {"train_loss": -6.206945896148682, "global_step": 87142, "epoch": 2074} {"train_loss": -6.165567398071289, "global_step": 87143, "epoch": 2074} {"train_loss": -6.216538429260254, "global_step": 87144, "epoch": 2074} {"train_loss": -6.188460350036621, "global_step": 87145, "epoch": 2074} {"train_loss": -6.27620267868042, "global_step": 87146, "epoch": 2074} {"train_loss": -6.387750625610352, "global_step": 87147, "epoch": 2074} {"train_loss": -6.181014060974121, "global_step": 87148, "epoch": 2074} {"train_loss": -6.176377875464303, "global_step": 87149, "epoch": 2074, "val_loss": 67887.46875} {"train_loss": -6.328423500061035, "global_step": 87150, "epoch": 2075} {"train_loss": -6.267608642578125, "global_step": 87151, "epoch": 2075} {"train_loss": -6.238511085510254, "global_step": 87152, "epoch": 2075} {"train_loss": -6.330972671508789, "global_step": 87153, "epoch": 2075} {"train_loss": -6.179891586303711, "global_step": 87154, "epoch": 2075} {"train_loss": -6.203113079071045, "global_step": 87155, "epoch": 2075} {"train_loss": -6.150081634521484, "global_step": 87156, "epoch": 2075} {"train_loss": -6.305966854095459, "global_step": 87157, "epoch": 2075} {"train_loss": -6.23291015625, "global_step": 87158, "epoch": 2075} {"train_loss": -6.159494400024414, "global_step": 87159, "epoch": 2075} {"train_loss": -6.228492736816406, "global_step": 87160, "epoch": 2075} {"train_loss": -6.198643684387207, "global_step": 87161, "epoch": 2075} {"train_loss": -6.206930160522461, "global_step": 87162, "epoch": 2075} {"train_loss": -6.2744293212890625, "global_step": 87163, "epoch": 2075} {"train_loss": -6.2179059982299805, "global_step": 87164, "epoch": 2075} {"train_loss": -6.174441814422607, "global_step": 87165, "epoch": 2075} {"train_loss": -6.210582733154297, "global_step": 87166, "epoch": 2075} {"train_loss": -6.232362270355225, "global_step": 87167, "epoch": 2075} {"train_loss": -6.202294826507568, "global_step": 87168, "epoch": 2075} {"train_loss": -6.268193244934082, "global_step": 87169, "epoch": 2075} {"train_loss": -6.169238567352295, "global_step": 87170, "epoch": 2075} {"train_loss": -6.322824478149414, "global_step": 87171, "epoch": 2075} {"train_loss": -6.246238708496094, "global_step": 87172, "epoch": 2075} {"train_loss": -6.293716907501221, "global_step": 87173, "epoch": 2075} {"train_loss": -6.185831069946289, "global_step": 87174, "epoch": 2075} {"train_loss": -6.192867279052734, "global_step": 87175, "epoch": 2075} {"train_loss": -6.22316837310791, "global_step": 87176, "epoch": 2075} {"train_loss": -6.115485191345215, "global_step": 87177, "epoch": 2075} {"train_loss": -6.223353385925293, "global_step": 87178, "epoch": 2075} {"train_loss": -6.083331108093262, "global_step": 87179, "epoch": 2075} {"train_loss": -6.20510196685791, "global_step": 87180, "epoch": 2075} {"train_loss": -6.215087413787842, "global_step": 87181, "epoch": 2075} {"train_loss": -6.244338035583496, "global_step": 87182, "epoch": 2075} {"train_loss": -6.2973737716674805, "global_step": 87183, "epoch": 2075} {"train_loss": -6.107607841491699, "global_step": 87184, "epoch": 2075} {"train_loss": -6.213742733001709, "global_step": 87185, "epoch": 2075} {"train_loss": -6.258737564086914, "global_step": 87186, "epoch": 2075} {"train_loss": -6.217759132385254, "global_step": 87187, "epoch": 2075} {"train_loss": -6.203920364379883, "global_step": 87188, "epoch": 2075} {"train_loss": -6.190101623535156, "global_step": 87189, "epoch": 2075} {"train_loss": -6.179101467132568, "global_step": 87190, "epoch": 2075} {"train_loss": -6.215705905641828, "global_step": 87191, "epoch": 2075, "val_loss": 67881.4375} {"train_loss": -6.288997650146484, "global_step": 87192, "epoch": 2076} {"train_loss": -6.224959850311279, "global_step": 87193, "epoch": 2076} {"train_loss": -6.205719947814941, "global_step": 87194, "epoch": 2076} {"train_loss": -6.199284553527832, "global_step": 87195, "epoch": 2076} {"train_loss": -6.2513346672058105, "global_step": 87196, "epoch": 2076} {"train_loss": -6.11317253112793, "global_step": 87197, "epoch": 2076} {"train_loss": -6.085959434509277, "global_step": 87198, "epoch": 2076} {"train_loss": -6.246860980987549, "global_step": 87199, "epoch": 2076} {"train_loss": -6.259539604187012, "global_step": 87200, "epoch": 2076} {"train_loss": -6.178455829620361, "global_step": 87201, "epoch": 2076} {"train_loss": -6.2052998542785645, "global_step": 87202, "epoch": 2076} {"train_loss": -6.067131996154785, "global_step": 87203, "epoch": 2076} {"train_loss": -6.229256629943848, "global_step": 87204, "epoch": 2076} {"train_loss": -6.163976192474365, "global_step": 87205, "epoch": 2076} {"train_loss": -6.169497966766357, "global_step": 87206, "epoch": 2076} {"train_loss": -6.160697937011719, "global_step": 87207, "epoch": 2076} {"train_loss": -6.228623390197754, "global_step": 87208, "epoch": 2076} {"train_loss": -6.123653411865234, "global_step": 87209, "epoch": 2076} {"train_loss": -6.217148303985596, "global_step": 87210, "epoch": 2076} {"train_loss": -6.272904396057129, "global_step": 87211, "epoch": 2076} {"train_loss": -6.226863861083984, "global_step": 87212, "epoch": 2076} {"train_loss": -6.306876182556152, "global_step": 87213, "epoch": 2076} {"train_loss": -6.1575927734375, "global_step": 87214, "epoch": 2076} {"train_loss": -6.14579963684082, "global_step": 87215, "epoch": 2076} {"train_loss": -6.144959449768066, "global_step": 87216, "epoch": 2076} {"train_loss": -6.22070837020874, "global_step": 87217, "epoch": 2076} {"train_loss": -6.275115966796875, "global_step": 87218, "epoch": 2076} {"train_loss": -6.122602462768555, "global_step": 87219, "epoch": 2076} {"train_loss": -6.217581272125244, "global_step": 87220, "epoch": 2076} {"train_loss": -6.157649040222168, "global_step": 87221, "epoch": 2076} {"train_loss": -6.141386985778809, "global_step": 87222, "epoch": 2076} {"train_loss": -6.083945274353027, "global_step": 87223, "epoch": 2076} {"train_loss": -6.131511688232422, "global_step": 87224, "epoch": 2076} {"train_loss": -6.183309555053711, "global_step": 87225, "epoch": 2076} {"train_loss": -6.297763824462891, "global_step": 87226, "epoch": 2076} {"train_loss": -6.226458549499512, "global_step": 87227, "epoch": 2076} {"train_loss": -6.278482437133789, "global_step": 87228, "epoch": 2076} {"train_loss": -6.188168525695801, "global_step": 87229, "epoch": 2076} {"train_loss": -6.21247673034668, "global_step": 87230, "epoch": 2076} {"train_loss": -6.215733528137207, "global_step": 87231, "epoch": 2076} {"train_loss": -6.170934677124023, "global_step": 87232, "epoch": 2076} {"train_loss": -6.194339343479702, "global_step": 87233, "epoch": 2076, "val_loss": 67775.453125} {"train_loss": -6.198413848876953, "global_step": 87234, "epoch": 2077} {"train_loss": -6.231868267059326, "global_step": 87235, "epoch": 2077} {"train_loss": -6.292119979858398, "global_step": 87236, "epoch": 2077} {"train_loss": -6.135624885559082, "global_step": 87237, "epoch": 2077} {"train_loss": -6.138216018676758, "global_step": 87238, "epoch": 2077} {"train_loss": -6.201109886169434, "global_step": 87239, "epoch": 2077} {"train_loss": -6.13245964050293, "global_step": 87240, "epoch": 2077} {"train_loss": -6.0894012451171875, "global_step": 87241, "epoch": 2077} {"train_loss": -6.2203216552734375, "global_step": 87242, "epoch": 2077} {"train_loss": -6.1944122314453125, "global_step": 87243, "epoch": 2077} {"train_loss": -6.224048614501953, "global_step": 87244, "epoch": 2077} {"train_loss": -6.063663482666016, "global_step": 87245, "epoch": 2077} {"train_loss": -6.296500205993652, "global_step": 87246, "epoch": 2077} {"train_loss": -6.239025115966797, "global_step": 87247, "epoch": 2077} {"train_loss": -6.103353500366211, "global_step": 87248, "epoch": 2077} {"train_loss": -6.195379734039307, "global_step": 87249, "epoch": 2077} {"train_loss": -6.039277076721191, "global_step": 87250, "epoch": 2077} {"train_loss": -6.225893974304199, "global_step": 87251, "epoch": 2077} {"train_loss": -6.230626583099365, "global_step": 87252, "epoch": 2077} {"train_loss": -6.166449546813965, "global_step": 87253, "epoch": 2077} {"train_loss": -6.163402557373047, "global_step": 87254, "epoch": 2077} {"train_loss": -6.079025745391846, "global_step": 87255, "epoch": 2077} {"train_loss": -6.256358623504639, "global_step": 87256, "epoch": 2077} {"train_loss": -6.192582607269287, "global_step": 87257, "epoch": 2077} {"train_loss": -6.210660457611084, "global_step": 87258, "epoch": 2077} {"train_loss": -6.227744102478027, "global_step": 87259, "epoch": 2077} {"train_loss": -6.221929550170898, "global_step": 87260, "epoch": 2077} {"train_loss": -6.206216812133789, "global_step": 87261, "epoch": 2077} {"train_loss": -6.224249839782715, "global_step": 87262, "epoch": 2077} {"train_loss": -6.114336967468262, "global_step": 87263, "epoch": 2077} {"train_loss": -6.246535778045654, "global_step": 87264, "epoch": 2077} {"train_loss": -6.160397052764893, "global_step": 87265, "epoch": 2077} {"train_loss": -6.096248626708984, "global_step": 87266, "epoch": 2077} {"train_loss": -6.2996063232421875, "global_step": 87267, "epoch": 2077} {"train_loss": -6.118298530578613, "global_step": 87268, "epoch": 2077} {"train_loss": -6.173180103302002, "global_step": 87269, "epoch": 2077} {"train_loss": -6.248723983764648, "global_step": 87270, "epoch": 2077} {"train_loss": -6.152387619018555, "global_step": 87271, "epoch": 2077} {"train_loss": -6.026247024536133, "global_step": 87272, "epoch": 2077} {"train_loss": -6.17232084274292, "global_step": 87273, "epoch": 2077} {"train_loss": -6.107804298400879, "global_step": 87274, "epoch": 2077} {"train_loss": -6.180758873621623, "global_step": 87275, "epoch": 2077, "val_loss": 68001.515625} {"train_loss": -6.138861656188965, "global_step": 87276, "epoch": 2078} {"train_loss": -6.177742958068848, "global_step": 87277, "epoch": 2078} {"train_loss": -6.172644138336182, "global_step": 87278, "epoch": 2078} {"train_loss": -6.124279975891113, "global_step": 87279, "epoch": 2078} {"train_loss": -6.227656364440918, "global_step": 87280, "epoch": 2078} {"train_loss": -6.104849815368652, "global_step": 87281, "epoch": 2078} {"train_loss": -6.255582809448242, "global_step": 87282, "epoch": 2078} {"train_loss": -6.148081302642822, "global_step": 87283, "epoch": 2078} {"train_loss": -6.218731880187988, "global_step": 87284, "epoch": 2078} {"train_loss": -6.09534215927124, "global_step": 87285, "epoch": 2078} {"train_loss": -6.2412519454956055, "global_step": 87286, "epoch": 2078} {"train_loss": -6.2358903884887695, "global_step": 87287, "epoch": 2078} {"train_loss": -6.177151679992676, "global_step": 87288, "epoch": 2078} {"train_loss": -6.142971515655518, "global_step": 87289, "epoch": 2078} {"train_loss": -6.230790138244629, "global_step": 87290, "epoch": 2078} {"train_loss": -6.063606262207031, "global_step": 87291, "epoch": 2078} {"train_loss": -6.181498050689697, "global_step": 87292, "epoch": 2078} {"train_loss": -6.09862756729126, "global_step": 87293, "epoch": 2078} {"train_loss": -6.278125286102295, "global_step": 87294, "epoch": 2078} {"train_loss": -6.129391670227051, "global_step": 87295, "epoch": 2078} {"train_loss": -6.301052093505859, "global_step": 87296, "epoch": 2078} {"train_loss": -6.121513366699219, "global_step": 87297, "epoch": 2078} {"train_loss": -6.280577182769775, "global_step": 87298, "epoch": 2078} {"train_loss": -6.255492687225342, "global_step": 87299, "epoch": 2078} {"train_loss": -6.278899192810059, "global_step": 87300, "epoch": 2078} {"train_loss": -6.301290512084961, "global_step": 87301, "epoch": 2078} {"train_loss": -6.223368167877197, "global_step": 87302, "epoch": 2078} {"train_loss": -6.137401580810547, "global_step": 87303, "epoch": 2078} {"train_loss": -6.318153381347656, "global_step": 87304, "epoch": 2078} {"train_loss": -6.229053974151611, "global_step": 87305, "epoch": 2078} {"train_loss": -6.278282642364502, "global_step": 87306, "epoch": 2078} {"train_loss": -6.2627854347229, "global_step": 87307, "epoch": 2078} {"train_loss": -6.22428560256958, "global_step": 87308, "epoch": 2078} {"train_loss": -6.209795951843262, "global_step": 87309, "epoch": 2078} {"train_loss": -6.172804832458496, "global_step": 87310, "epoch": 2078} {"train_loss": -6.256011962890625, "global_step": 87311, "epoch": 2078} {"train_loss": -6.261656761169434, "global_step": 87312, "epoch": 2078} {"train_loss": -6.129124641418457, "global_step": 87313, "epoch": 2078} {"train_loss": -6.223389625549316, "global_step": 87314, "epoch": 2078} {"train_loss": -6.085162162780762, "global_step": 87315, "epoch": 2078} {"train_loss": -6.12085485458374, "global_step": 87316, "epoch": 2078} {"train_loss": -6.198485374450684, "global_step": 87317, "epoch": 2078, "val_loss": 67838.609375} {"train_loss": -6.263638973236084, "global_step": 87318, "epoch": 2079} {"train_loss": -6.193086624145508, "global_step": 87319, "epoch": 2079} {"train_loss": -6.248714447021484, "global_step": 87320, "epoch": 2079} {"train_loss": -6.124691486358643, "global_step": 87321, "epoch": 2079} {"train_loss": -6.259171009063721, "global_step": 87322, "epoch": 2079} {"train_loss": -6.260522842407227, "global_step": 87323, "epoch": 2079} {"train_loss": -6.220721244812012, "global_step": 87324, "epoch": 2079} {"train_loss": -6.213345527648926, "global_step": 87325, "epoch": 2079} {"train_loss": -6.2326555252075195, "global_step": 87326, "epoch": 2079} {"train_loss": -6.252476692199707, "global_step": 87327, "epoch": 2079} {"train_loss": -6.251859188079834, "global_step": 87328, "epoch": 2079} {"train_loss": -6.2581024169921875, "global_step": 87329, "epoch": 2079} {"train_loss": -6.36042594909668, "global_step": 87330, "epoch": 2079} {"train_loss": -6.230838775634766, "global_step": 87331, "epoch": 2079} {"train_loss": -6.299572944641113, "global_step": 87332, "epoch": 2079} {"train_loss": -6.325458526611328, "global_step": 87333, "epoch": 2079} {"train_loss": -6.234306812286377, "global_step": 87334, "epoch": 2079} {"train_loss": -6.169476509094238, "global_step": 87335, "epoch": 2079} {"train_loss": -6.263000965118408, "global_step": 87336, "epoch": 2079} {"train_loss": -6.27655029296875, "global_step": 87337, "epoch": 2079} {"train_loss": -6.328314781188965, "global_step": 87338, "epoch": 2079} {"train_loss": -6.311430931091309, "global_step": 87339, "epoch": 2079} {"train_loss": -6.2193803787231445, "global_step": 87340, "epoch": 2079} {"train_loss": -6.18941593170166, "global_step": 87341, "epoch": 2079} {"train_loss": -6.196727752685547, "global_step": 87342, "epoch": 2079} {"train_loss": -6.1996049880981445, "global_step": 87343, "epoch": 2079} {"train_loss": -6.205373764038086, "global_step": 87344, "epoch": 2079} {"train_loss": -6.187674522399902, "global_step": 87345, "epoch": 2079} {"train_loss": -6.199124336242676, "global_step": 87346, "epoch": 2079} {"train_loss": -6.247450828552246, "global_step": 87347, "epoch": 2079} {"train_loss": -6.144965648651123, "global_step": 87348, "epoch": 2079} {"train_loss": -6.192431449890137, "global_step": 87349, "epoch": 2079} {"train_loss": -6.212916851043701, "global_step": 87350, "epoch": 2079} {"train_loss": -6.148828029632568, "global_step": 87351, "epoch": 2079} {"train_loss": -6.159509181976318, "global_step": 87352, "epoch": 2079} {"train_loss": -6.210573673248291, "global_step": 87353, "epoch": 2079} {"train_loss": -6.364719867706299, "global_step": 87354, "epoch": 2079} {"train_loss": -6.168457984924316, "global_step": 87355, "epoch": 2079} {"train_loss": -6.165435791015625, "global_step": 87356, "epoch": 2079} {"train_loss": -6.2207489013671875, "global_step": 87357, "epoch": 2079} {"train_loss": -6.136425018310547, "global_step": 87358, "epoch": 2079} {"train_loss": -6.228014696212042, "global_step": 87359, "epoch": 2079, "val_loss": 67779.4921875} {"train_loss": -6.243544101715088, "global_step": 87360, "epoch": 2080} {"train_loss": -6.097621917724609, "global_step": 87361, "epoch": 2080} {"train_loss": -6.137739181518555, "global_step": 87362, "epoch": 2080} {"train_loss": -6.2696709632873535, "global_step": 87363, "epoch": 2080} {"train_loss": -6.252995491027832, "global_step": 87364, "epoch": 2080} {"train_loss": -6.3513641357421875, "global_step": 87365, "epoch": 2080} {"train_loss": -6.1237359046936035, "global_step": 87366, "epoch": 2080} {"train_loss": -6.2496185302734375, "global_step": 87367, "epoch": 2080} {"train_loss": -6.265796661376953, "global_step": 87368, "epoch": 2080} {"train_loss": -6.287409782409668, "global_step": 87369, "epoch": 2080} {"train_loss": -6.229926586151123, "global_step": 87370, "epoch": 2080} {"train_loss": -6.309399604797363, "global_step": 87371, "epoch": 2080} {"train_loss": -6.147058486938477, "global_step": 87372, "epoch": 2080} {"train_loss": -6.21369743347168, "global_step": 87373, "epoch": 2080} {"train_loss": -6.292900085449219, "global_step": 87374, "epoch": 2080} {"train_loss": -6.133138656616211, "global_step": 87375, "epoch": 2080} {"train_loss": -6.19223690032959, "global_step": 87376, "epoch": 2080} {"train_loss": -6.226093292236328, "global_step": 87377, "epoch": 2080} {"train_loss": -6.262246608734131, "global_step": 87378, "epoch": 2080} {"train_loss": -6.251001358032227, "global_step": 87379, "epoch": 2080} {"train_loss": -6.215421676635742, "global_step": 87380, "epoch": 2080} {"train_loss": -6.169665336608887, "global_step": 87381, "epoch": 2080} {"train_loss": -6.312961578369141, "global_step": 87382, "epoch": 2080} {"train_loss": -6.1481781005859375, "global_step": 87383, "epoch": 2080} {"train_loss": -6.174952030181885, "global_step": 87384, "epoch": 2080} {"train_loss": -6.075128078460693, "global_step": 87385, "epoch": 2080} {"train_loss": -6.13494873046875, "global_step": 87386, "epoch": 2080} {"train_loss": -6.0073347091674805, "global_step": 87387, "epoch": 2080} {"train_loss": -6.192668914794922, "global_step": 87388, "epoch": 2080} {"train_loss": -6.068278789520264, "global_step": 87389, "epoch": 2080} {"train_loss": -6.056647300720215, "global_step": 87390, "epoch": 2080} {"train_loss": -6.101900577545166, "global_step": 87391, "epoch": 2080} {"train_loss": -6.223018646240234, "global_step": 87392, "epoch": 2080} {"train_loss": -6.221915245056152, "global_step": 87393, "epoch": 2080} {"train_loss": -6.11581563949585, "global_step": 87394, "epoch": 2080} {"train_loss": -6.191220283508301, "global_step": 87395, "epoch": 2080} {"train_loss": -6.159319877624512, "global_step": 87396, "epoch": 2080} {"train_loss": -6.116061687469482, "global_step": 87397, "epoch": 2080} {"train_loss": -6.099560260772705, "global_step": 87398, "epoch": 2080} {"train_loss": -6.212414264678955, "global_step": 87399, "epoch": 2080} {"train_loss": -6.17136287689209, "global_step": 87400, "epoch": 2080} {"train_loss": -6.18842829976763, "global_step": 87401, "epoch": 2080, "val_loss": 67963.6484375} {"train_loss": -6.13198184967041, "global_step": 87402, "epoch": 2081} {"train_loss": -6.1319732666015625, "global_step": 87403, "epoch": 2081} {"train_loss": -6.049599647521973, "global_step": 87404, "epoch": 2081} {"train_loss": -6.230656147003174, "global_step": 87405, "epoch": 2081} {"train_loss": -6.129324913024902, "global_step": 87406, "epoch": 2081} {"train_loss": -6.128352165222168, "global_step": 87407, "epoch": 2081} {"train_loss": -6.052331924438477, "global_step": 87408, "epoch": 2081} {"train_loss": -6.183853626251221, "global_step": 87409, "epoch": 2081} {"train_loss": -6.200957298278809, "global_step": 87410, "epoch": 2081} {"train_loss": -6.213129997253418, "global_step": 87411, "epoch": 2081} {"train_loss": -6.2362871170043945, "global_step": 87412, "epoch": 2081} {"train_loss": -6.282993316650391, "global_step": 87413, "epoch": 2081} {"train_loss": -6.1228179931640625, "global_step": 87414, "epoch": 2081} {"train_loss": -6.2119340896606445, "global_step": 87415, "epoch": 2081} {"train_loss": -6.213876724243164, "global_step": 87416, "epoch": 2081} {"train_loss": -6.226810455322266, "global_step": 87417, "epoch": 2081} {"train_loss": -6.100120544433594, "global_step": 87418, "epoch": 2081} {"train_loss": -6.306748390197754, "global_step": 87419, "epoch": 2081} {"train_loss": -6.1769866943359375, "global_step": 87420, "epoch": 2081} {"train_loss": -6.202062606811523, "global_step": 87421, "epoch": 2081} {"train_loss": -6.1154913902282715, "global_step": 87422, "epoch": 2081} {"train_loss": -6.21672248840332, "global_step": 87423, "epoch": 2081} {"train_loss": -6.14697265625, "global_step": 87424, "epoch": 2081} {"train_loss": -6.3209123611450195, "global_step": 87425, "epoch": 2081} {"train_loss": -6.100286483764648, "global_step": 87426, "epoch": 2081} {"train_loss": -6.282325744628906, "global_step": 87427, "epoch": 2081} {"train_loss": -6.2089619636535645, "global_step": 87428, "epoch": 2081} {"train_loss": -6.275857925415039, "global_step": 87429, "epoch": 2081} {"train_loss": -6.1183319091796875, "global_step": 87430, "epoch": 2081} {"train_loss": -6.248268127441406, "global_step": 87431, "epoch": 2081} {"train_loss": -6.234508037567139, "global_step": 87432, "epoch": 2081} {"train_loss": -6.232030868530273, "global_step": 87433, "epoch": 2081} {"train_loss": -6.1741132736206055, "global_step": 87434, "epoch": 2081} {"train_loss": -6.189087867736816, "global_step": 87435, "epoch": 2081} {"train_loss": -6.256476402282715, "global_step": 87436, "epoch": 2081} {"train_loss": -6.273313999176025, "global_step": 87437, "epoch": 2081} {"train_loss": -6.16475248336792, "global_step": 87438, "epoch": 2081} {"train_loss": -6.2259016036987305, "global_step": 87439, "epoch": 2081} {"train_loss": -6.134979248046875, "global_step": 87440, "epoch": 2081} {"train_loss": -6.180028915405273, "global_step": 87441, "epoch": 2081} {"train_loss": -6.253770351409912, "global_step": 87442, "epoch": 2081} {"train_loss": -6.1936403796786355, "global_step": 87443, "epoch": 2081, "val_loss": 67802.640625} {"train_loss": -6.019599437713623, "global_step": 87444, "epoch": 2082} {"train_loss": -6.248787879943848, "global_step": 87445, "epoch": 2082} {"train_loss": -6.272193431854248, "global_step": 87446, "epoch": 2082} {"train_loss": -6.148116588592529, "global_step": 87447, "epoch": 2082} {"train_loss": -6.282292366027832, "global_step": 87448, "epoch": 2082} {"train_loss": -6.164931774139404, "global_step": 87449, "epoch": 2082} {"train_loss": -6.19102668762207, "global_step": 87450, "epoch": 2082} {"train_loss": -6.3461127281188965, "global_step": 87451, "epoch": 2082} {"train_loss": -6.251224994659424, "global_step": 87452, "epoch": 2082} {"train_loss": -6.181714057922363, "global_step": 87453, "epoch": 2082} {"train_loss": -6.2908935546875, "global_step": 87454, "epoch": 2082} {"train_loss": -6.2688446044921875, "global_step": 87455, "epoch": 2082} {"train_loss": -6.315328598022461, "global_step": 87456, "epoch": 2082} {"train_loss": -6.128594875335693, "global_step": 87457, "epoch": 2082} {"train_loss": -6.118505001068115, "global_step": 87458, "epoch": 2082} {"train_loss": -6.190668106079102, "global_step": 87459, "epoch": 2082} {"train_loss": -6.125978946685791, "global_step": 87460, "epoch": 2082} {"train_loss": -6.285982131958008, "global_step": 87461, "epoch": 2082} {"train_loss": -6.331210136413574, "global_step": 87462, "epoch": 2082} {"train_loss": -6.093413352966309, "global_step": 87463, "epoch": 2082} {"train_loss": -6.202704906463623, "global_step": 87464, "epoch": 2082} {"train_loss": -6.298630237579346, "global_step": 87465, "epoch": 2082} {"train_loss": -6.22792387008667, "global_step": 87466, "epoch": 2082} {"train_loss": -6.249814033508301, "global_step": 87467, "epoch": 2082} {"train_loss": -6.147195816040039, "global_step": 87468, "epoch": 2082} {"train_loss": -6.1749773025512695, "global_step": 87469, "epoch": 2082} {"train_loss": -6.238122940063477, "global_step": 87470, "epoch": 2082} {"train_loss": -6.104639053344727, "global_step": 87471, "epoch": 2082} {"train_loss": -6.319732666015625, "global_step": 87472, "epoch": 2082} {"train_loss": -6.172553539276123, "global_step": 87473, "epoch": 2082} {"train_loss": -6.334061145782471, "global_step": 87474, "epoch": 2082} {"train_loss": -6.0487823486328125, "global_step": 87475, "epoch": 2082} {"train_loss": -6.231326103210449, "global_step": 87476, "epoch": 2082} {"train_loss": -6.224127769470215, "global_step": 87477, "epoch": 2082} {"train_loss": -6.086092472076416, "global_step": 87478, "epoch": 2082} {"train_loss": -6.064723014831543, "global_step": 87479, "epoch": 2082} {"train_loss": -6.200654983520508, "global_step": 87480, "epoch": 2082} {"train_loss": -6.183568477630615, "global_step": 87481, "epoch": 2082} {"train_loss": -6.1758270263671875, "global_step": 87482, "epoch": 2082} {"train_loss": -6.146108627319336, "global_step": 87483, "epoch": 2082} {"train_loss": -6.273994445800781, "global_step": 87484, "epoch": 2082} {"train_loss": -6.20271524928865, "global_step": 87485, "epoch": 2082, "val_loss": 67991.453125} {"train_loss": -6.1812896728515625, "global_step": 87486, "epoch": 2083} {"train_loss": -6.2892560958862305, "global_step": 87487, "epoch": 2083} {"train_loss": -6.159798622131348, "global_step": 87488, "epoch": 2083} {"train_loss": -6.259910583496094, "global_step": 87489, "epoch": 2083} {"train_loss": -6.231766700744629, "global_step": 87490, "epoch": 2083} {"train_loss": -6.225135803222656, "global_step": 87491, "epoch": 2083} {"train_loss": -6.107995510101318, "global_step": 87492, "epoch": 2083} {"train_loss": -6.215648651123047, "global_step": 87493, "epoch": 2083} {"train_loss": -6.129934310913086, "global_step": 87494, "epoch": 2083} {"train_loss": -6.236001968383789, "global_step": 87495, "epoch": 2083} {"train_loss": -6.240449905395508, "global_step": 87496, "epoch": 2083} {"train_loss": -6.283544063568115, "global_step": 87497, "epoch": 2083} {"train_loss": -6.264095306396484, "global_step": 87498, "epoch": 2083} {"train_loss": -6.232763290405273, "global_step": 87499, "epoch": 2083} {"train_loss": -6.056234359741211, "global_step": 87500, "epoch": 2083} {"train_loss": -6.202891826629639, "global_step": 87501, "epoch": 2083} {"train_loss": -6.176527976989746, "global_step": 87502, "epoch": 2083} {"train_loss": -6.146669864654541, "global_step": 87503, "epoch": 2083} {"train_loss": -6.262192249298096, "global_step": 87504, "epoch": 2083} {"train_loss": -6.169487953186035, "global_step": 87505, "epoch": 2083} {"train_loss": -6.118764400482178, "global_step": 87506, "epoch": 2083} {"train_loss": -6.15506649017334, "global_step": 87507, "epoch": 2083} {"train_loss": -6.0755133628845215, "global_step": 87508, "epoch": 2083} {"train_loss": -6.144253730773926, "global_step": 87509, "epoch": 2083} {"train_loss": -6.138673305511475, "global_step": 87510, "epoch": 2083} {"train_loss": -6.239987373352051, "global_step": 87511, "epoch": 2083} {"train_loss": -6.309106826782227, "global_step": 87512, "epoch": 2083} {"train_loss": -6.167908191680908, "global_step": 87513, "epoch": 2083} {"train_loss": -6.145486831665039, "global_step": 87514, "epoch": 2083} {"train_loss": -6.170521259307861, "global_step": 87515, "epoch": 2083} {"train_loss": -6.3153581619262695, "global_step": 87516, "epoch": 2083} {"train_loss": -6.140927791595459, "global_step": 87517, "epoch": 2083} {"train_loss": -6.174882888793945, "global_step": 87518, "epoch": 2083} {"train_loss": -6.226567268371582, "global_step": 87519, "epoch": 2083} {"train_loss": -6.216038703918457, "global_step": 87520, "epoch": 2083} {"train_loss": -6.221758842468262, "global_step": 87521, "epoch": 2083} {"train_loss": -6.185827255249023, "global_step": 87522, "epoch": 2083} {"train_loss": -6.171407699584961, "global_step": 87523, "epoch": 2083} {"train_loss": -6.113458633422852, "global_step": 87524, "epoch": 2083} {"train_loss": -6.091603755950928, "global_step": 87525, "epoch": 2083} {"train_loss": -6.051353931427002, "global_step": 87526, "epoch": 2083} {"train_loss": -6.1853374526614235, "global_step": 87527, "epoch": 2083, "val_loss": 67790.890625} {"train_loss": -6.167783260345459, "global_step": 87528, "epoch": 2084} {"train_loss": -6.243154525756836, "global_step": 87529, "epoch": 2084} {"train_loss": -6.082822799682617, "global_step": 87530, "epoch": 2084} {"train_loss": -6.200228214263916, "global_step": 87531, "epoch": 2084} {"train_loss": -6.1862592697143555, "global_step": 87532, "epoch": 2084} {"train_loss": -6.212556838989258, "global_step": 87533, "epoch": 2084} {"train_loss": -6.2047529220581055, "global_step": 87534, "epoch": 2084} {"train_loss": -6.244499683380127, "global_step": 87535, "epoch": 2084} {"train_loss": -6.090595722198486, "global_step": 87536, "epoch": 2084} {"train_loss": -6.203413009643555, "global_step": 87537, "epoch": 2084} {"train_loss": -6.24622106552124, "global_step": 87538, "epoch": 2084} {"train_loss": -6.092113494873047, "global_step": 87539, "epoch": 2084} {"train_loss": -6.219776153564453, "global_step": 87540, "epoch": 2084} {"train_loss": -6.030433654785156, "global_step": 87541, "epoch": 2084} {"train_loss": -6.303140640258789, "global_step": 87542, "epoch": 2084} {"train_loss": -6.088840484619141, "global_step": 87543, "epoch": 2084} {"train_loss": -6.235816955566406, "global_step": 87544, "epoch": 2084} {"train_loss": -6.316466331481934, "global_step": 87545, "epoch": 2084} {"train_loss": -6.180994510650635, "global_step": 87546, "epoch": 2084} {"train_loss": -6.161252975463867, "global_step": 87547, "epoch": 2084} {"train_loss": -6.187278747558594, "global_step": 87548, "epoch": 2084} {"train_loss": -6.278099536895752, "global_step": 87549, "epoch": 2084} {"train_loss": -6.151597023010254, "global_step": 87550, "epoch": 2084} {"train_loss": -6.281634330749512, "global_step": 87551, "epoch": 2084} {"train_loss": -6.26352596282959, "global_step": 87552, "epoch": 2084} {"train_loss": -6.146232604980469, "global_step": 87553, "epoch": 2084} {"train_loss": -6.177835464477539, "global_step": 87554, "epoch": 2084} {"train_loss": -6.25840425491333, "global_step": 87555, "epoch": 2084} {"train_loss": -6.142764091491699, "global_step": 87556, "epoch": 2084} {"train_loss": -6.237030982971191, "global_step": 87557, "epoch": 2084} {"train_loss": -6.1579179763793945, "global_step": 87558, "epoch": 2084} {"train_loss": -6.1586456298828125, "global_step": 87559, "epoch": 2084} {"train_loss": -6.269105911254883, "global_step": 87560, "epoch": 2084} {"train_loss": -6.065853595733643, "global_step": 87561, "epoch": 2084} {"train_loss": -6.258657455444336, "global_step": 87562, "epoch": 2084} {"train_loss": -6.208547115325928, "global_step": 87563, "epoch": 2084} {"train_loss": -6.117984771728516, "global_step": 87564, "epoch": 2084} {"train_loss": -6.080401420593262, "global_step": 87565, "epoch": 2084} {"train_loss": -6.201659202575684, "global_step": 87566, "epoch": 2084} {"train_loss": -6.237365245819092, "global_step": 87567, "epoch": 2084} {"train_loss": -6.193910121917725, "global_step": 87568, "epoch": 2084} {"train_loss": -6.190492016928537, "global_step": 87569, "epoch": 2084, "val_loss": 67702.71875} {"train_loss": -6.204971790313721, "global_step": 87570, "epoch": 2085} {"train_loss": -6.189144134521484, "global_step": 87571, "epoch": 2085} {"train_loss": -6.243479251861572, "global_step": 87572, "epoch": 2085} {"train_loss": -6.221536636352539, "global_step": 87573, "epoch": 2085} {"train_loss": -6.266278266906738, "global_step": 87574, "epoch": 2085} {"train_loss": -6.211690902709961, "global_step": 87575, "epoch": 2085} {"train_loss": -6.239819526672363, "global_step": 87576, "epoch": 2085} {"train_loss": -6.128891944885254, "global_step": 87577, "epoch": 2085} {"train_loss": -6.304784774780273, "global_step": 87578, "epoch": 2085} {"train_loss": -6.232755184173584, "global_step": 87579, "epoch": 2085} {"train_loss": -6.224688529968262, "global_step": 87580, "epoch": 2085} {"train_loss": -6.171136856079102, "global_step": 87581, "epoch": 2085} {"train_loss": -6.218479156494141, "global_step": 87582, "epoch": 2085} {"train_loss": -6.1422505378723145, "global_step": 87583, "epoch": 2085} {"train_loss": -6.234555244445801, "global_step": 87584, "epoch": 2085} {"train_loss": -6.246251106262207, "global_step": 87585, "epoch": 2085} {"train_loss": -6.199622631072998, "global_step": 87586, "epoch": 2085} {"train_loss": -6.311128616333008, "global_step": 87587, "epoch": 2085} {"train_loss": -6.213554382324219, "global_step": 87588, "epoch": 2085} {"train_loss": -6.114482879638672, "global_step": 87589, "epoch": 2085} {"train_loss": -6.081562042236328, "global_step": 87590, "epoch": 2085} {"train_loss": -5.994828224182129, "global_step": 87591, "epoch": 2085} {"train_loss": -6.3027143478393555, "global_step": 87592, "epoch": 2085} {"train_loss": -6.040018081665039, "global_step": 87593, "epoch": 2085} {"train_loss": -6.079420566558838, "global_step": 87594, "epoch": 2085} {"train_loss": -6.123380661010742, "global_step": 87595, "epoch": 2085} {"train_loss": -6.062089920043945, "global_step": 87596, "epoch": 2085} {"train_loss": -6.228445053100586, "global_step": 87597, "epoch": 2085} {"train_loss": -6.219489097595215, "global_step": 87598, "epoch": 2085} {"train_loss": -6.1542744636535645, "global_step": 87599, "epoch": 2085} {"train_loss": -6.121831893920898, "global_step": 87600, "epoch": 2085} {"train_loss": -6.074389457702637, "global_step": 87601, "epoch": 2085} {"train_loss": -6.307007789611816, "global_step": 87602, "epoch": 2085} {"train_loss": -6.197542667388916, "global_step": 87603, "epoch": 2085} {"train_loss": -6.160184860229492, "global_step": 87604, "epoch": 2085} {"train_loss": -6.123330593109131, "global_step": 87605, "epoch": 2085} {"train_loss": -6.068598747253418, "global_step": 87606, "epoch": 2085} {"train_loss": -6.236499309539795, "global_step": 87607, "epoch": 2085} {"train_loss": -6.103787899017334, "global_step": 87608, "epoch": 2085} {"train_loss": -6.209685325622559, "global_step": 87609, "epoch": 2085} {"train_loss": -6.115035533905029, "global_step": 87610, "epoch": 2085} {"train_loss": -6.179490986324492, "global_step": 87611, "epoch": 2085, "val_loss": 68078.4609375} {"train_loss": -6.154767990112305, "global_step": 87612, "epoch": 2086} {"train_loss": -6.1522603034973145, "global_step": 87613, "epoch": 2086} {"train_loss": -6.220005035400391, "global_step": 87614, "epoch": 2086} {"train_loss": -6.081189155578613, "global_step": 87615, "epoch": 2086} {"train_loss": -6.193478584289551, "global_step": 87616, "epoch": 2086} {"train_loss": -6.079350471496582, "global_step": 87617, "epoch": 2086} {"train_loss": -6.126535892486572, "global_step": 87618, "epoch": 2086} {"train_loss": -6.119789123535156, "global_step": 87619, "epoch": 2086} {"train_loss": -6.19215202331543, "global_step": 87620, "epoch": 2086} {"train_loss": -6.127080917358398, "global_step": 87621, "epoch": 2086} {"train_loss": -6.122411727905273, "global_step": 87622, "epoch": 2086} {"train_loss": -6.226586818695068, "global_step": 87623, "epoch": 2086} {"train_loss": -6.136286735534668, "global_step": 87624, "epoch": 2086} {"train_loss": -6.223184585571289, "global_step": 87625, "epoch": 2086} {"train_loss": -6.13717794418335, "global_step": 87626, "epoch": 2086} {"train_loss": -6.2136993408203125, "global_step": 87627, "epoch": 2086} {"train_loss": -6.184398174285889, "global_step": 87628, "epoch": 2086} {"train_loss": -6.204501152038574, "global_step": 87629, "epoch": 2086} {"train_loss": -6.059147357940674, "global_step": 87630, "epoch": 2086} {"train_loss": -6.023044586181641, "global_step": 87631, "epoch": 2086} {"train_loss": -6.24806022644043, "global_step": 87632, "epoch": 2086} {"train_loss": -6.11976957321167, "global_step": 87633, "epoch": 2086} {"train_loss": -6.106614112854004, "global_step": 87634, "epoch": 2086} {"train_loss": -6.132805347442627, "global_step": 87635, "epoch": 2086} {"train_loss": -6.18749475479126, "global_step": 87636, "epoch": 2086} {"train_loss": -6.17948055267334, "global_step": 87637, "epoch": 2086} {"train_loss": -6.179990768432617, "global_step": 87638, "epoch": 2086} {"train_loss": -6.162008285522461, "global_step": 87639, "epoch": 2086} {"train_loss": -6.283760070800781, "global_step": 87640, "epoch": 2086} {"train_loss": -6.095415115356445, "global_step": 87641, "epoch": 2086} {"train_loss": -6.146315574645996, "global_step": 87642, "epoch": 2086} {"train_loss": -6.294366836547852, "global_step": 87643, "epoch": 2086} {"train_loss": -6.267948150634766, "global_step": 87644, "epoch": 2086} {"train_loss": -6.2026472091674805, "global_step": 87645, "epoch": 2086} {"train_loss": -6.28290319442749, "global_step": 87646, "epoch": 2086} {"train_loss": -6.06103515625, "global_step": 87647, "epoch": 2086} {"train_loss": -6.146454811096191, "global_step": 87648, "epoch": 2086} {"train_loss": -6.2328691482543945, "global_step": 87649, "epoch": 2086} {"train_loss": -6.186816215515137, "global_step": 87650, "epoch": 2086} {"train_loss": -6.116515636444092, "global_step": 87651, "epoch": 2086} {"train_loss": -6.190680027008057, "global_step": 87652, "epoch": 2086} {"train_loss": -6.1662151245843795, "global_step": 87653, "epoch": 2086, "val_loss": 67908.5546875} {"train_loss": -6.257130146026611, "global_step": 87654, "epoch": 2087} {"train_loss": -6.084477424621582, "global_step": 87655, "epoch": 2087} {"train_loss": -6.220841884613037, "global_step": 87656, "epoch": 2087} {"train_loss": -6.2373576164245605, "global_step": 87657, "epoch": 2087} {"train_loss": -6.162528991699219, "global_step": 87658, "epoch": 2087} {"train_loss": -6.138448238372803, "global_step": 87659, "epoch": 2087} {"train_loss": -6.180953502655029, "global_step": 87660, "epoch": 2087} {"train_loss": -6.215938568115234, "global_step": 87661, "epoch": 2087} {"train_loss": -6.179645538330078, "global_step": 87662, "epoch": 2087} {"train_loss": -6.3086371421813965, "global_step": 87663, "epoch": 2087} {"train_loss": -6.1602373123168945, "global_step": 87664, "epoch": 2087} {"train_loss": -6.256988525390625, "global_step": 87665, "epoch": 2087} {"train_loss": -6.2294158935546875, "global_step": 87666, "epoch": 2087} {"train_loss": -6.233158111572266, "global_step": 87667, "epoch": 2087} {"train_loss": -6.25913143157959, "global_step": 87668, "epoch": 2087} {"train_loss": -6.254939079284668, "global_step": 87669, "epoch": 2087} {"train_loss": -6.190009117126465, "global_step": 87670, "epoch": 2087} {"train_loss": -6.250554084777832, "global_step": 87671, "epoch": 2087} {"train_loss": -6.223857402801514, "global_step": 87672, "epoch": 2087} {"train_loss": -6.147056579589844, "global_step": 87673, "epoch": 2087} {"train_loss": -6.142673492431641, "global_step": 87674, "epoch": 2087} {"train_loss": -6.2038421630859375, "global_step": 87675, "epoch": 2087} {"train_loss": -6.2299675941467285, "global_step": 87676, "epoch": 2087} {"train_loss": -6.14866304397583, "global_step": 87677, "epoch": 2087} {"train_loss": -6.1736860275268555, "global_step": 87678, "epoch": 2087} {"train_loss": -6.163016319274902, "global_step": 87679, "epoch": 2087} {"train_loss": -6.182729721069336, "global_step": 87680, "epoch": 2087} {"train_loss": -6.371520042419434, "global_step": 87681, "epoch": 2087} {"train_loss": -6.318824291229248, "global_step": 87682, "epoch": 2087} {"train_loss": -6.195822238922119, "global_step": 87683, "epoch": 2087} {"train_loss": -6.177790641784668, "global_step": 87684, "epoch": 2087} {"train_loss": -6.343421459197998, "global_step": 87685, "epoch": 2087} {"train_loss": -6.15640115737915, "global_step": 87686, "epoch": 2087} {"train_loss": -6.1876139640808105, "global_step": 87687, "epoch": 2087} {"train_loss": -6.23655366897583, "global_step": 87688, "epoch": 2087} {"train_loss": -6.205652236938477, "global_step": 87689, "epoch": 2087} {"train_loss": -6.18226432800293, "global_step": 87690, "epoch": 2087} {"train_loss": -6.18873929977417, "global_step": 87691, "epoch": 2087} {"train_loss": -6.220595836639404, "global_step": 87692, "epoch": 2087} {"train_loss": -6.224989414215088, "global_step": 87693, "epoch": 2087} {"train_loss": -6.214400768280029, "global_step": 87694, "epoch": 2087} {"train_loss": -6.211702153796241, "global_step": 87695, "epoch": 2087, "val_loss": 67718.9453125} {"train_loss": -6.2913360595703125, "global_step": 87696, "epoch": 2088} {"train_loss": -6.216235160827637, "global_step": 87697, "epoch": 2088} {"train_loss": -6.254909992218018, "global_step": 87698, "epoch": 2088} {"train_loss": -6.219844341278076, "global_step": 87699, "epoch": 2088} {"train_loss": -6.252974510192871, "global_step": 87700, "epoch": 2088} {"train_loss": -6.248998641967773, "global_step": 87701, "epoch": 2088} {"train_loss": -6.250394821166992, "global_step": 87702, "epoch": 2088} {"train_loss": -6.176860809326172, "global_step": 87703, "epoch": 2088} {"train_loss": -6.248889923095703, "global_step": 87704, "epoch": 2088} {"train_loss": -6.237979888916016, "global_step": 87705, "epoch": 2088} {"train_loss": -6.255993366241455, "global_step": 87706, "epoch": 2088} {"train_loss": -6.228638648986816, "global_step": 87707, "epoch": 2088} {"train_loss": -6.062743186950684, "global_step": 87708, "epoch": 2088} {"train_loss": -6.209560394287109, "global_step": 87709, "epoch": 2088} {"train_loss": -6.277839660644531, "global_step": 87710, "epoch": 2088} {"train_loss": -6.190114498138428, "global_step": 87711, "epoch": 2088} {"train_loss": -6.301824569702148, "global_step": 87712, "epoch": 2088} {"train_loss": -6.049709320068359, "global_step": 87713, "epoch": 2088} {"train_loss": -6.211309909820557, "global_step": 87714, "epoch": 2088} {"train_loss": -6.197912216186523, "global_step": 87715, "epoch": 2088} {"train_loss": -6.146103382110596, "global_step": 87716, "epoch": 2088} {"train_loss": -6.294866561889648, "global_step": 87717, "epoch": 2088} {"train_loss": -6.28867769241333, "global_step": 87718, "epoch": 2088} {"train_loss": -6.187705993652344, "global_step": 87719, "epoch": 2088} {"train_loss": -6.108744144439697, "global_step": 87720, "epoch": 2088} {"train_loss": -6.171327114105225, "global_step": 87721, "epoch": 2088} {"train_loss": -6.235828399658203, "global_step": 87722, "epoch": 2088} {"train_loss": -6.28049373626709, "global_step": 87723, "epoch": 2088} {"train_loss": -6.241294860839844, "global_step": 87724, "epoch": 2088} {"train_loss": -6.1548357009887695, "global_step": 87725, "epoch": 2088} {"train_loss": -6.232847690582275, "global_step": 87726, "epoch": 2088} {"train_loss": -6.190064430236816, "global_step": 87727, "epoch": 2088} {"train_loss": -6.183147430419922, "global_step": 87728, "epoch": 2088} {"train_loss": -6.214111804962158, "global_step": 87729, "epoch": 2088} {"train_loss": -6.089951515197754, "global_step": 87730, "epoch": 2088} {"train_loss": -6.20440673828125, "global_step": 87731, "epoch": 2088} {"train_loss": -6.184719085693359, "global_step": 87732, "epoch": 2088} {"train_loss": -6.263268947601318, "global_step": 87733, "epoch": 2088} {"train_loss": -6.266382694244385, "global_step": 87734, "epoch": 2088} {"train_loss": -6.204933166503906, "global_step": 87735, "epoch": 2088} {"train_loss": -6.270434379577637, "global_step": 87736, "epoch": 2088} {"train_loss": -6.215460027967181, "global_step": 87737, "epoch": 2088, "val_loss": 68061.578125} {"train_loss": -6.235782623291016, "global_step": 87738, "epoch": 2089} {"train_loss": -6.360628604888916, "global_step": 87739, "epoch": 2089} {"train_loss": -6.196676731109619, "global_step": 87740, "epoch": 2089} {"train_loss": -6.24356746673584, "global_step": 87741, "epoch": 2089} {"train_loss": -6.1746931076049805, "global_step": 87742, "epoch": 2089} {"train_loss": -6.27296257019043, "global_step": 87743, "epoch": 2089} {"train_loss": -6.16830587387085, "global_step": 87744, "epoch": 2089} {"train_loss": -6.2225213050842285, "global_step": 87745, "epoch": 2089} {"train_loss": -6.2655792236328125, "global_step": 87746, "epoch": 2089} {"train_loss": -6.299232482910156, "global_step": 87747, "epoch": 2089} {"train_loss": -6.219508171081543, "global_step": 87748, "epoch": 2089} {"train_loss": -6.225934982299805, "global_step": 87749, "epoch": 2089} {"train_loss": -6.15628719329834, "global_step": 87750, "epoch": 2089} {"train_loss": -6.312821388244629, "global_step": 87751, "epoch": 2089} {"train_loss": -6.143457412719727, "global_step": 87752, "epoch": 2089} {"train_loss": -6.1899590492248535, "global_step": 87753, "epoch": 2089} {"train_loss": -6.2363667488098145, "global_step": 87754, "epoch": 2089} {"train_loss": -6.20551872253418, "global_step": 87755, "epoch": 2089} {"train_loss": -6.2030534744262695, "global_step": 87756, "epoch": 2089} {"train_loss": -6.227947235107422, "global_step": 87757, "epoch": 2089} {"train_loss": -6.1240386962890625, "global_step": 87758, "epoch": 2089} {"train_loss": -6.241661071777344, "global_step": 87759, "epoch": 2089} {"train_loss": -6.251979827880859, "global_step": 87760, "epoch": 2089} {"train_loss": -6.306640625, "global_step": 87761, "epoch": 2089} {"train_loss": -6.174215316772461, "global_step": 87762, "epoch": 2089} {"train_loss": -6.188719749450684, "global_step": 87763, "epoch": 2089} {"train_loss": -6.253478527069092, "global_step": 87764, "epoch": 2089} {"train_loss": -6.327080726623535, "global_step": 87765, "epoch": 2089} {"train_loss": -6.317344665527344, "global_step": 87766, "epoch": 2089} {"train_loss": -6.254165172576904, "global_step": 87767, "epoch": 2089} {"train_loss": -6.280510902404785, "global_step": 87768, "epoch": 2089} {"train_loss": -6.1949310302734375, "global_step": 87769, "epoch": 2089} {"train_loss": -6.297419548034668, "global_step": 87770, "epoch": 2089} {"train_loss": -6.220175266265869, "global_step": 87771, "epoch": 2089} {"train_loss": -6.208975791931152, "global_step": 87772, "epoch": 2089} {"train_loss": -6.1415696144104, "global_step": 87773, "epoch": 2089} {"train_loss": -6.176784515380859, "global_step": 87774, "epoch": 2089} {"train_loss": -6.358915328979492, "global_step": 87775, "epoch": 2089} {"train_loss": -6.154236316680908, "global_step": 87776, "epoch": 2089} {"train_loss": -6.168797492980957, "global_step": 87777, "epoch": 2089} {"train_loss": -6.24542236328125, "global_step": 87778, "epoch": 2089} {"train_loss": -6.230646962211246, "global_step": 87779, "epoch": 2089, "val_loss": 67704.4453125} {"train_loss": -6.186288833618164, "global_step": 87780, "epoch": 2090} {"train_loss": -6.2407989501953125, "global_step": 87781, "epoch": 2090} {"train_loss": -6.205610275268555, "global_step": 87782, "epoch": 2090} {"train_loss": -6.2526750564575195, "global_step": 87783, "epoch": 2090} {"train_loss": -6.220336437225342, "global_step": 87784, "epoch": 2090} {"train_loss": -6.3068647384643555, "global_step": 87785, "epoch": 2090} {"train_loss": -6.276145935058594, "global_step": 87786, "epoch": 2090} {"train_loss": -6.174147605895996, "global_step": 87787, "epoch": 2090} {"train_loss": -6.268159866333008, "global_step": 87788, "epoch": 2090} {"train_loss": -6.249274730682373, "global_step": 87789, "epoch": 2090} {"train_loss": -6.197234153747559, "global_step": 87790, "epoch": 2090} {"train_loss": -6.245491981506348, "global_step": 87791, "epoch": 2090} {"train_loss": -6.268535137176514, "global_step": 87792, "epoch": 2090} {"train_loss": -6.157956600189209, "global_step": 87793, "epoch": 2090} {"train_loss": -6.220096588134766, "global_step": 87794, "epoch": 2090} {"train_loss": -6.207758903503418, "global_step": 87795, "epoch": 2090} {"train_loss": -6.203036308288574, "global_step": 87796, "epoch": 2090} {"train_loss": -6.180267333984375, "global_step": 87797, "epoch": 2090} {"train_loss": -6.309215545654297, "global_step": 87798, "epoch": 2090} {"train_loss": -6.262301445007324, "global_step": 87799, "epoch": 2090} {"train_loss": -6.241883754730225, "global_step": 87800, "epoch": 2090} {"train_loss": -6.246933937072754, "global_step": 87801, "epoch": 2090} {"train_loss": -6.206664562225342, "global_step": 87802, "epoch": 2090} {"train_loss": -6.180424690246582, "global_step": 87803, "epoch": 2090} {"train_loss": -6.149131774902344, "global_step": 87804, "epoch": 2090} {"train_loss": -6.257446765899658, "global_step": 87805, "epoch": 2090} {"train_loss": -6.214935302734375, "global_step": 87806, "epoch": 2090} {"train_loss": -6.2570600509643555, "global_step": 87807, "epoch": 2090} {"train_loss": -6.231454849243164, "global_step": 87808, "epoch": 2090} {"train_loss": -6.182780742645264, "global_step": 87809, "epoch": 2090} {"train_loss": -6.149866104125977, "global_step": 87810, "epoch": 2090} {"train_loss": -6.299205303192139, "global_step": 87811, "epoch": 2090} {"train_loss": -6.05543327331543, "global_step": 87812, "epoch": 2090} {"train_loss": -6.236052989959717, "global_step": 87813, "epoch": 2090} {"train_loss": -6.190360069274902, "global_step": 87814, "epoch": 2090} {"train_loss": -6.173924446105957, "global_step": 87815, "epoch": 2090} {"train_loss": -6.134049892425537, "global_step": 87816, "epoch": 2090} {"train_loss": -6.068360805511475, "global_step": 87817, "epoch": 2090} {"train_loss": -6.2360520362854, "global_step": 87818, "epoch": 2090} {"train_loss": -6.26857852935791, "global_step": 87819, "epoch": 2090} {"train_loss": -6.28727912902832, "global_step": 87820, "epoch": 2090} {"train_loss": -6.216359717505319, "global_step": 87821, "epoch": 2090, "val_loss": 67909.3984375} {"train_loss": -6.1106414794921875, "global_step": 87822, "epoch": 2091} {"train_loss": -6.213724136352539, "global_step": 87823, "epoch": 2091} {"train_loss": -6.0396504402160645, "global_step": 87824, "epoch": 2091} {"train_loss": -6.271556854248047, "global_step": 87825, "epoch": 2091} {"train_loss": -6.2376227378845215, "global_step": 87826, "epoch": 2091} {"train_loss": -6.285487174987793, "global_step": 87827, "epoch": 2091} {"train_loss": -6.2872161865234375, "global_step": 87828, "epoch": 2091} {"train_loss": -6.225790023803711, "global_step": 87829, "epoch": 2091} {"train_loss": -6.097465515136719, "global_step": 87830, "epoch": 2091} {"train_loss": -6.257587909698486, "global_step": 87831, "epoch": 2091} {"train_loss": -6.161681175231934, "global_step": 87832, "epoch": 2091} {"train_loss": -6.19497013092041, "global_step": 87833, "epoch": 2091} {"train_loss": -6.144828796386719, "global_step": 87834, "epoch": 2091} {"train_loss": -6.104985237121582, "global_step": 87835, "epoch": 2091} {"train_loss": -6.222287178039551, "global_step": 87836, "epoch": 2091} {"train_loss": -6.10899543762207, "global_step": 87837, "epoch": 2091} {"train_loss": -6.133497714996338, "global_step": 87838, "epoch": 2091} {"train_loss": -6.220973014831543, "global_step": 87839, "epoch": 2091} {"train_loss": -6.17056941986084, "global_step": 87840, "epoch": 2091} {"train_loss": -6.193325042724609, "global_step": 87841, "epoch": 2091} {"train_loss": -6.2133026123046875, "global_step": 87842, "epoch": 2091} {"train_loss": -6.150359630584717, "global_step": 87843, "epoch": 2091} {"train_loss": -6.175342559814453, "global_step": 87844, "epoch": 2091} {"train_loss": -6.210691452026367, "global_step": 87845, "epoch": 2091} {"train_loss": -6.156380653381348, "global_step": 87846, "epoch": 2091} {"train_loss": -6.3342485427856445, "global_step": 87847, "epoch": 2091} {"train_loss": -6.241056442260742, "global_step": 87848, "epoch": 2091} {"train_loss": -6.293540000915527, "global_step": 87849, "epoch": 2091} {"train_loss": -6.28797721862793, "global_step": 87850, "epoch": 2091} {"train_loss": -6.262564659118652, "global_step": 87851, "epoch": 2091} {"train_loss": -6.231767654418945, "global_step": 87852, "epoch": 2091} {"train_loss": -6.253212928771973, "global_step": 87853, "epoch": 2091} {"train_loss": -6.2210845947265625, "global_step": 87854, "epoch": 2091} {"train_loss": -6.226345062255859, "global_step": 87855, "epoch": 2091} {"train_loss": -6.133764266967773, "global_step": 87856, "epoch": 2091} {"train_loss": -6.286053657531738, "global_step": 87857, "epoch": 2091} {"train_loss": -6.093536376953125, "global_step": 87858, "epoch": 2091} {"train_loss": -6.1915364265441895, "global_step": 87859, "epoch": 2091} {"train_loss": -6.129383563995361, "global_step": 87860, "epoch": 2091} {"train_loss": -6.267675399780273, "global_step": 87861, "epoch": 2091} {"train_loss": -6.214211940765381, "global_step": 87862, "epoch": 2091} {"train_loss": -6.1997413748786565, "global_step": 87863, "epoch": 2091, "val_loss": 67891.1953125} {"train_loss": -6.33266019821167, "global_step": 87864, "epoch": 2092} {"train_loss": -6.1903581619262695, "global_step": 87865, "epoch": 2092} {"train_loss": -6.145910263061523, "global_step": 87866, "epoch": 2092} {"train_loss": -6.225200176239014, "global_step": 87867, "epoch": 2092} {"train_loss": -6.20556116104126, "global_step": 87868, "epoch": 2092} {"train_loss": -6.199400901794434, "global_step": 87869, "epoch": 2092} {"train_loss": -6.141808986663818, "global_step": 87870, "epoch": 2092} {"train_loss": -6.176137924194336, "global_step": 87871, "epoch": 2092} {"train_loss": -6.3048248291015625, "global_step": 87872, "epoch": 2092} {"train_loss": -6.1272172927856445, "global_step": 87873, "epoch": 2092} {"train_loss": -6.19618034362793, "global_step": 87874, "epoch": 2092} {"train_loss": -6.138467311859131, "global_step": 87875, "epoch": 2092} {"train_loss": -6.093883037567139, "global_step": 87876, "epoch": 2092} {"train_loss": -6.179415225982666, "global_step": 87877, "epoch": 2092} {"train_loss": -6.090236663818359, "global_step": 87878, "epoch": 2092} {"train_loss": -6.273138999938965, "global_step": 87879, "epoch": 2092} {"train_loss": -6.218964099884033, "global_step": 87880, "epoch": 2092} {"train_loss": -6.1800665855407715, "global_step": 87881, "epoch": 2092} {"train_loss": -6.043988227844238, "global_step": 87882, "epoch": 2092} {"train_loss": -6.308959484100342, "global_step": 87883, "epoch": 2092} {"train_loss": -6.235274314880371, "global_step": 87884, "epoch": 2092} {"train_loss": -6.114062309265137, "global_step": 87885, "epoch": 2092} {"train_loss": -6.25809383392334, "global_step": 87886, "epoch": 2092} {"train_loss": -6.19745397567749, "global_step": 87887, "epoch": 2092} {"train_loss": -6.206515312194824, "global_step": 87888, "epoch": 2092} {"train_loss": -6.225885391235352, "global_step": 87889, "epoch": 2092} {"train_loss": -6.378849983215332, "global_step": 87890, "epoch": 2092} {"train_loss": -6.28540563583374, "global_step": 87891, "epoch": 2092} {"train_loss": -6.1855082511901855, "global_step": 87892, "epoch": 2092} {"train_loss": -6.246974945068359, "global_step": 87893, "epoch": 2092} {"train_loss": -6.127444267272949, "global_step": 87894, "epoch": 2092} {"train_loss": -6.214536666870117, "global_step": 87895, "epoch": 2092} {"train_loss": -6.151571273803711, "global_step": 87896, "epoch": 2092} {"train_loss": -6.336816310882568, "global_step": 87897, "epoch": 2092} {"train_loss": -6.294732570648193, "global_step": 87898, "epoch": 2092} {"train_loss": -6.12387752532959, "global_step": 87899, "epoch": 2092} {"train_loss": -6.123902320861816, "global_step": 87900, "epoch": 2092} {"train_loss": -6.161803722381592, "global_step": 87901, "epoch": 2092} {"train_loss": -6.262026786804199, "global_step": 87902, "epoch": 2092} {"train_loss": -6.270402908325195, "global_step": 87903, "epoch": 2092} {"train_loss": -6.212610244750977, "global_step": 87904, "epoch": 2092} {"train_loss": -6.201519500641596, "global_step": 87905, "epoch": 2092, "val_loss": 67676.7109375} {"train_loss": -6.341418743133545, "global_step": 87906, "epoch": 2093} {"train_loss": -6.300384521484375, "global_step": 87907, "epoch": 2093} {"train_loss": -6.186922073364258, "global_step": 87908, "epoch": 2093} {"train_loss": -6.29187536239624, "global_step": 87909, "epoch": 2093} {"train_loss": -6.198957443237305, "global_step": 87910, "epoch": 2093} {"train_loss": -6.2684502601623535, "global_step": 87911, "epoch": 2093} {"train_loss": -6.219155311584473, "global_step": 87912, "epoch": 2093} {"train_loss": -6.177975654602051, "global_step": 87913, "epoch": 2093} {"train_loss": -6.182459831237793, "global_step": 87914, "epoch": 2093} {"train_loss": -6.148438930511475, "global_step": 87915, "epoch": 2093} {"train_loss": -6.2831711769104, "global_step": 87916, "epoch": 2093} {"train_loss": -6.223167419433594, "global_step": 87917, "epoch": 2093} {"train_loss": -6.39840030670166, "global_step": 87918, "epoch": 2093} {"train_loss": -6.225358009338379, "global_step": 87919, "epoch": 2093} {"train_loss": -6.272493362426758, "global_step": 87920, "epoch": 2093} {"train_loss": -6.195620059967041, "global_step": 87921, "epoch": 2093} {"train_loss": -6.250631332397461, "global_step": 87922, "epoch": 2093} {"train_loss": -6.291751384735107, "global_step": 87923, "epoch": 2093} {"train_loss": -6.261034965515137, "global_step": 87924, "epoch": 2093} {"train_loss": -6.23878812789917, "global_step": 87925, "epoch": 2093} {"train_loss": -6.2284321784973145, "global_step": 87926, "epoch": 2093} {"train_loss": -6.240694046020508, "global_step": 87927, "epoch": 2093} {"train_loss": -6.3263726234436035, "global_step": 87928, "epoch": 2093} {"train_loss": -6.1881608963012695, "global_step": 87929, "epoch": 2093} {"train_loss": -6.111955165863037, "global_step": 87930, "epoch": 2093} {"train_loss": -6.27189826965332, "global_step": 87931, "epoch": 2093} {"train_loss": -6.19001579284668, "global_step": 87932, "epoch": 2093} {"train_loss": -6.143141746520996, "global_step": 87933, "epoch": 2093} {"train_loss": -6.179872512817383, "global_step": 87934, "epoch": 2093} {"train_loss": -6.234516620635986, "global_step": 87935, "epoch": 2093} {"train_loss": -6.19734001159668, "global_step": 87936, "epoch": 2093} {"train_loss": -6.281174659729004, "global_step": 87937, "epoch": 2093} {"train_loss": -6.295161724090576, "global_step": 87938, "epoch": 2093} {"train_loss": -6.359323501586914, "global_step": 87939, "epoch": 2093} {"train_loss": -6.2043867111206055, "global_step": 87940, "epoch": 2093} {"train_loss": -6.179685592651367, "global_step": 87941, "epoch": 2093} {"train_loss": -6.278896331787109, "global_step": 87942, "epoch": 2093} {"train_loss": -6.231670379638672, "global_step": 87943, "epoch": 2093} {"train_loss": -6.082144737243652, "global_step": 87944, "epoch": 2093} {"train_loss": -6.234624862670898, "global_step": 87945, "epoch": 2093} {"train_loss": -6.22300910949707, "global_step": 87946, "epoch": 2093} {"train_loss": -6.232342901683989, "global_step": 87947, "epoch": 2093, "val_loss": 68017.390625} {"train_loss": -6.243512153625488, "global_step": 87948, "epoch": 2094} {"train_loss": -6.2285966873168945, "global_step": 87949, "epoch": 2094} {"train_loss": -6.181916236877441, "global_step": 87950, "epoch": 2094} {"train_loss": -6.273747444152832, "global_step": 87951, "epoch": 2094} {"train_loss": -6.201923370361328, "global_step": 87952, "epoch": 2094} {"train_loss": -6.122076511383057, "global_step": 87953, "epoch": 2094} {"train_loss": -6.076006889343262, "global_step": 87954, "epoch": 2094} {"train_loss": -6.141784191131592, "global_step": 87955, "epoch": 2094} {"train_loss": -6.2414703369140625, "global_step": 87956, "epoch": 2094} {"train_loss": -6.060417175292969, "global_step": 87957, "epoch": 2094} {"train_loss": -6.156233787536621, "global_step": 87958, "epoch": 2094} {"train_loss": -6.167136192321777, "global_step": 87959, "epoch": 2094} {"train_loss": -6.115208625793457, "global_step": 87960, "epoch": 2094} {"train_loss": -6.323857307434082, "global_step": 87961, "epoch": 2094} {"train_loss": -6.165186405181885, "global_step": 87962, "epoch": 2094} {"train_loss": -6.225994110107422, "global_step": 87963, "epoch": 2094} {"train_loss": -6.136293411254883, "global_step": 87964, "epoch": 2094} {"train_loss": -6.200074195861816, "global_step": 87965, "epoch": 2094} {"train_loss": -6.210750102996826, "global_step": 87966, "epoch": 2094} {"train_loss": -6.166064262390137, "global_step": 87967, "epoch": 2094} {"train_loss": -6.185736656188965, "global_step": 87968, "epoch": 2094} {"train_loss": -6.320954322814941, "global_step": 87969, "epoch": 2094} {"train_loss": -6.224870681762695, "global_step": 87970, "epoch": 2094} {"train_loss": -6.14874792098999, "global_step": 87971, "epoch": 2094} {"train_loss": -6.257184982299805, "global_step": 87972, "epoch": 2094} {"train_loss": -6.282084941864014, "global_step": 87973, "epoch": 2094} {"train_loss": -6.156559944152832, "global_step": 87974, "epoch": 2094} {"train_loss": -6.055733680725098, "global_step": 87975, "epoch": 2094} {"train_loss": -6.1646409034729, "global_step": 87976, "epoch": 2094} {"train_loss": -6.121649742126465, "global_step": 87977, "epoch": 2094} {"train_loss": -6.174192428588867, "global_step": 87978, "epoch": 2094} {"train_loss": -6.110959529876709, "global_step": 87979, "epoch": 2094} {"train_loss": -6.073879718780518, "global_step": 87980, "epoch": 2094} {"train_loss": -6.330846786499023, "global_step": 87981, "epoch": 2094} {"train_loss": -6.139138221740723, "global_step": 87982, "epoch": 2094} {"train_loss": -6.185895919799805, "global_step": 87983, "epoch": 2094} {"train_loss": -6.201747417449951, "global_step": 87984, "epoch": 2094} {"train_loss": -6.195173263549805, "global_step": 87985, "epoch": 2094} {"train_loss": -6.225313186645508, "global_step": 87986, "epoch": 2094} {"train_loss": -6.160906791687012, "global_step": 87987, "epoch": 2094} {"train_loss": -6.235852241516113, "global_step": 87988, "epoch": 2094} {"train_loss": -6.180186055955433, "global_step": 87989, "epoch": 2094, "val_loss": 67828.234375} {"train_loss": -6.097835540771484, "global_step": 87990, "epoch": 2095} {"train_loss": -6.163783550262451, "global_step": 87991, "epoch": 2095} {"train_loss": -6.0455427169799805, "global_step": 87992, "epoch": 2095} {"train_loss": -6.115231037139893, "global_step": 87993, "epoch": 2095} {"train_loss": -6.256274223327637, "global_step": 87994, "epoch": 2095} {"train_loss": -5.932297706604004, "global_step": 87995, "epoch": 2095} {"train_loss": -6.132412910461426, "global_step": 87996, "epoch": 2095} {"train_loss": -5.952911853790283, "global_step": 87997, "epoch": 2095} {"train_loss": -6.020625114440918, "global_step": 87998, "epoch": 2095} {"train_loss": -6.127688884735107, "global_step": 87999, "epoch": 2095} {"train_loss": -6.067055702209473, "global_step": 88000, "epoch": 2095} {"train_loss": -6.028103828430176, "global_step": 88001, "epoch": 2095} {"train_loss": -6.028944969177246, "global_step": 88002, "epoch": 2095} {"train_loss": -6.133604049682617, "global_step": 88003, "epoch": 2095} {"train_loss": -6.0829596519470215, "global_step": 88004, "epoch": 2095} {"train_loss": -6.058060169219971, "global_step": 88005, "epoch": 2095} {"train_loss": -6.22268009185791, "global_step": 88006, "epoch": 2095} {"train_loss": -6.155269145965576, "global_step": 88007, "epoch": 2095} {"train_loss": -5.961308002471924, "global_step": 88008, "epoch": 2095} {"train_loss": -6.141654968261719, "global_step": 88009, "epoch": 2095} {"train_loss": -6.093202590942383, "global_step": 88010, "epoch": 2095} {"train_loss": -6.090275287628174, "global_step": 88011, "epoch": 2095} {"train_loss": -6.102724075317383, "global_step": 88012, "epoch": 2095} {"train_loss": -6.254279136657715, "global_step": 88013, "epoch": 2095} {"train_loss": -6.078907012939453, "global_step": 88014, "epoch": 2095} {"train_loss": -6.0203423500061035, "global_step": 88015, "epoch": 2095} {"train_loss": -6.171280860900879, "global_step": 88016, "epoch": 2095} {"train_loss": -6.057870864868164, "global_step": 88017, "epoch": 2095} {"train_loss": -6.12174129486084, "global_step": 88018, "epoch": 2095} {"train_loss": -6.208614349365234, "global_step": 88019, "epoch": 2095} {"train_loss": -6.132602214813232, "global_step": 88020, "epoch": 2095} {"train_loss": -6.055192470550537, "global_step": 88021, "epoch": 2095} {"train_loss": -6.220767021179199, "global_step": 88022, "epoch": 2095} {"train_loss": -6.240522861480713, "global_step": 88023, "epoch": 2095} {"train_loss": -6.183001518249512, "global_step": 88024, "epoch": 2095} {"train_loss": -6.162619590759277, "global_step": 88025, "epoch": 2095} {"train_loss": -6.098535537719727, "global_step": 88026, "epoch": 2095} {"train_loss": -6.208801746368408, "global_step": 88027, "epoch": 2095} {"train_loss": -6.242544651031494, "global_step": 88028, "epoch": 2095} {"train_loss": -6.176661014556885, "global_step": 88029, "epoch": 2095} {"train_loss": -6.200413703918457, "global_step": 88030, "epoch": 2095} {"train_loss": -6.121667941411336, "global_step": 88031, "epoch": 2095, "val_loss": 67788.53125} {"train_loss": -5.98949670791626, "global_step": 88032, "epoch": 2096} {"train_loss": -6.332993507385254, "global_step": 88033, "epoch": 2096} {"train_loss": -6.175895690917969, "global_step": 88034, "epoch": 2096} {"train_loss": -6.261153697967529, "global_step": 88035, "epoch": 2096} {"train_loss": -6.314486503601074, "global_step": 88036, "epoch": 2096} {"train_loss": -6.117900848388672, "global_step": 88037, "epoch": 2096} {"train_loss": -6.120665073394775, "global_step": 88038, "epoch": 2096} {"train_loss": -6.179231643676758, "global_step": 88039, "epoch": 2096} {"train_loss": -6.165248870849609, "global_step": 88040, "epoch": 2096} {"train_loss": -6.141285419464111, "global_step": 88041, "epoch": 2096} {"train_loss": -6.168557167053223, "global_step": 88042, "epoch": 2096} {"train_loss": -6.240169525146484, "global_step": 88043, "epoch": 2096} {"train_loss": -6.1334733963012695, "global_step": 88044, "epoch": 2096} {"train_loss": -6.201271057128906, "global_step": 88045, "epoch": 2096} {"train_loss": -6.065882682800293, "global_step": 88046, "epoch": 2096} {"train_loss": -6.179194927215576, "global_step": 88047, "epoch": 2096} {"train_loss": -6.238193511962891, "global_step": 88048, "epoch": 2096} {"train_loss": -6.259188652038574, "global_step": 88049, "epoch": 2096} {"train_loss": -6.309601783752441, "global_step": 88050, "epoch": 2096} {"train_loss": -6.079557418823242, "global_step": 88051, "epoch": 2096} {"train_loss": -6.223156929016113, "global_step": 88052, "epoch": 2096} {"train_loss": -6.200770854949951, "global_step": 88053, "epoch": 2096} {"train_loss": -6.2487945556640625, "global_step": 88054, "epoch": 2096} {"train_loss": -6.375127792358398, "global_step": 88055, "epoch": 2096} {"train_loss": -6.192380905151367, "global_step": 88056, "epoch": 2096} {"train_loss": -6.171452522277832, "global_step": 88057, "epoch": 2096} {"train_loss": -6.183760166168213, "global_step": 88058, "epoch": 2096} {"train_loss": -6.10680627822876, "global_step": 88059, "epoch": 2096} {"train_loss": -6.17377233505249, "global_step": 88060, "epoch": 2096} {"train_loss": -6.210259914398193, "global_step": 88061, "epoch": 2096} {"train_loss": -6.19923210144043, "global_step": 88062, "epoch": 2096} {"train_loss": -6.191274642944336, "global_step": 88063, "epoch": 2096} {"train_loss": -6.175601959228516, "global_step": 88064, "epoch": 2096} {"train_loss": -6.194729804992676, "global_step": 88065, "epoch": 2096} {"train_loss": -6.226186752319336, "global_step": 88066, "epoch": 2096} {"train_loss": -6.369334697723389, "global_step": 88067, "epoch": 2096} {"train_loss": -6.329848289489746, "global_step": 88068, "epoch": 2096} {"train_loss": -6.234511375427246, "global_step": 88069, "epoch": 2096} {"train_loss": -6.249675273895264, "global_step": 88070, "epoch": 2096} {"train_loss": -6.26210880279541, "global_step": 88071, "epoch": 2096} {"train_loss": -6.30409049987793, "global_step": 88072, "epoch": 2096} {"train_loss": -6.205971377236502, "global_step": 88073, "epoch": 2096, "val_loss": 67849.625} {"train_loss": -6.186657905578613, "global_step": 88074, "epoch": 2097} {"train_loss": -6.21911096572876, "global_step": 88075, "epoch": 2097} {"train_loss": -6.2376508712768555, "global_step": 88076, "epoch": 2097} {"train_loss": -6.331456184387207, "global_step": 88077, "epoch": 2097} {"train_loss": -6.215498924255371, "global_step": 88078, "epoch": 2097} {"train_loss": -6.316568374633789, "global_step": 88079, "epoch": 2097} {"train_loss": -6.171433448791504, "global_step": 88080, "epoch": 2097} {"train_loss": -6.204753398895264, "global_step": 88081, "epoch": 2097} {"train_loss": -6.096197128295898, "global_step": 88082, "epoch": 2097} {"train_loss": -6.230323791503906, "global_step": 88083, "epoch": 2097} {"train_loss": -6.28278923034668, "global_step": 88084, "epoch": 2097} {"train_loss": -6.203250885009766, "global_step": 88085, "epoch": 2097} {"train_loss": -6.174902439117432, "global_step": 88086, "epoch": 2097} {"train_loss": -6.2187676429748535, "global_step": 88087, "epoch": 2097} {"train_loss": -6.262983322143555, "global_step": 88088, "epoch": 2097} {"train_loss": -6.252839088439941, "global_step": 88089, "epoch": 2097} {"train_loss": -6.330202102661133, "global_step": 88090, "epoch": 2097} {"train_loss": -6.200395107269287, "global_step": 88091, "epoch": 2097} {"train_loss": -6.23607063293457, "global_step": 88092, "epoch": 2097} {"train_loss": -6.287363052368164, "global_step": 88093, "epoch": 2097} {"train_loss": -6.284379005432129, "global_step": 88094, "epoch": 2097} {"train_loss": -6.30101203918457, "global_step": 88095, "epoch": 2097} {"train_loss": -6.267908096313477, "global_step": 88096, "epoch": 2097} {"train_loss": -6.161739349365234, "global_step": 88097, "epoch": 2097} {"train_loss": -6.2117109298706055, "global_step": 88098, "epoch": 2097} {"train_loss": -6.255428791046143, "global_step": 88099, "epoch": 2097} {"train_loss": -6.292122840881348, "global_step": 88100, "epoch": 2097} {"train_loss": -6.2010416984558105, "global_step": 88101, "epoch": 2097} {"train_loss": -6.191352844238281, "global_step": 88102, "epoch": 2097} {"train_loss": -6.253205299377441, "global_step": 88103, "epoch": 2097} {"train_loss": -6.273057460784912, "global_step": 88104, "epoch": 2097} {"train_loss": -6.105645179748535, "global_step": 88105, "epoch": 2097} {"train_loss": -6.187440395355225, "global_step": 88106, "epoch": 2097} {"train_loss": -6.2928385734558105, "global_step": 88107, "epoch": 2097} {"train_loss": -6.19077205657959, "global_step": 88108, "epoch": 2097} {"train_loss": -6.20320987701416, "global_step": 88109, "epoch": 2097} {"train_loss": -6.171655178070068, "global_step": 88110, "epoch": 2097} {"train_loss": -5.999905109405518, "global_step": 88111, "epoch": 2097} {"train_loss": -6.144275665283203, "global_step": 88112, "epoch": 2097} {"train_loss": -6.295737266540527, "global_step": 88113, "epoch": 2097} {"train_loss": -6.060060024261475, "global_step": 88114, "epoch": 2097} {"train_loss": -6.219093867710659, "global_step": 88115, "epoch": 2097, "val_loss": 68004.453125} {"train_loss": -6.129510879516602, "global_step": 88116, "epoch": 2098} {"train_loss": -6.305131912231445, "global_step": 88117, "epoch": 2098} {"train_loss": -6.262957572937012, "global_step": 88118, "epoch": 2098} {"train_loss": -6.19000244140625, "global_step": 88119, "epoch": 2098} {"train_loss": -6.2569169998168945, "global_step": 88120, "epoch": 2098} {"train_loss": -6.1777191162109375, "global_step": 88121, "epoch": 2098} {"train_loss": -6.227969169616699, "global_step": 88122, "epoch": 2098} {"train_loss": -6.088006019592285, "global_step": 88123, "epoch": 2098} {"train_loss": -6.229878902435303, "global_step": 88124, "epoch": 2098} {"train_loss": -6.0961151123046875, "global_step": 88125, "epoch": 2098} {"train_loss": -6.136994361877441, "global_step": 88126, "epoch": 2098} {"train_loss": -6.236612319946289, "global_step": 88127, "epoch": 2098} {"train_loss": -5.990079879760742, "global_step": 88128, "epoch": 2098} {"train_loss": -6.286956787109375, "global_step": 88129, "epoch": 2098} {"train_loss": -6.171998023986816, "global_step": 88130, "epoch": 2098} {"train_loss": -6.228565216064453, "global_step": 88131, "epoch": 2098} {"train_loss": -6.2276611328125, "global_step": 88132, "epoch": 2098} {"train_loss": -6.143310546875, "global_step": 88133, "epoch": 2098} {"train_loss": -6.196430206298828, "global_step": 88134, "epoch": 2098} {"train_loss": -6.216165065765381, "global_step": 88135, "epoch": 2098} {"train_loss": -6.276541709899902, "global_step": 88136, "epoch": 2098} {"train_loss": -6.199550628662109, "global_step": 88137, "epoch": 2098} {"train_loss": -6.159187316894531, "global_step": 88138, "epoch": 2098} {"train_loss": -6.04086971282959, "global_step": 88139, "epoch": 2098} {"train_loss": -6.168200492858887, "global_step": 88140, "epoch": 2098} {"train_loss": -6.185282230377197, "global_step": 88141, "epoch": 2098} {"train_loss": -6.226457595825195, "global_step": 88142, "epoch": 2098} {"train_loss": -6.263296127319336, "global_step": 88143, "epoch": 2098} {"train_loss": -6.139191627502441, "global_step": 88144, "epoch": 2098} {"train_loss": -6.206326484680176, "global_step": 88145, "epoch": 2098} {"train_loss": -6.147164344787598, "global_step": 88146, "epoch": 2098} {"train_loss": -6.157249927520752, "global_step": 88147, "epoch": 2098} {"train_loss": -6.226197242736816, "global_step": 88148, "epoch": 2098} {"train_loss": -6.233855247497559, "global_step": 88149, "epoch": 2098} {"train_loss": -6.0098347663879395, "global_step": 88150, "epoch": 2098} {"train_loss": -6.2657880783081055, "global_step": 88151, "epoch": 2098} {"train_loss": -6.173402786254883, "global_step": 88152, "epoch": 2098} {"train_loss": -6.18731689453125, "global_step": 88153, "epoch": 2098} {"train_loss": -6.180691719055176, "global_step": 88154, "epoch": 2098} {"train_loss": -6.157051086425781, "global_step": 88155, "epoch": 2098} {"train_loss": -6.158623695373535, "global_step": 88156, "epoch": 2098} {"train_loss": -6.181517669132778, "global_step": 88157, "epoch": 2098, "val_loss": 67848.1484375} {"train_loss": -6.125839710235596, "global_step": 88158, "epoch": 2099} {"train_loss": -6.1063127517700195, "global_step": 88159, "epoch": 2099} {"train_loss": -6.164052486419678, "global_step": 88160, "epoch": 2099} {"train_loss": -6.279674530029297, "global_step": 88161, "epoch": 2099} {"train_loss": -6.2179107666015625, "global_step": 88162, "epoch": 2099} {"train_loss": -6.154296398162842, "global_step": 88163, "epoch": 2099} {"train_loss": -6.077798843383789, "global_step": 88164, "epoch": 2099} {"train_loss": -6.143681526184082, "global_step": 88165, "epoch": 2099} {"train_loss": -6.140412330627441, "global_step": 88166, "epoch": 2099} {"train_loss": -6.1749267578125, "global_step": 88167, "epoch": 2099} {"train_loss": -6.133095741271973, "global_step": 88168, "epoch": 2099} {"train_loss": -6.197407245635986, "global_step": 88169, "epoch": 2099} {"train_loss": -6.249486923217773, "global_step": 88170, "epoch": 2099} {"train_loss": -6.130614280700684, "global_step": 88171, "epoch": 2099} {"train_loss": -6.122626304626465, "global_step": 88172, "epoch": 2099} {"train_loss": -6.268301963806152, "global_step": 88173, "epoch": 2099} {"train_loss": -6.260729789733887, "global_step": 88174, "epoch": 2099} {"train_loss": -6.1029205322265625, "global_step": 88175, "epoch": 2099} {"train_loss": -6.184021472930908, "global_step": 88176, "epoch": 2099} {"train_loss": -6.318545818328857, "global_step": 88177, "epoch": 2099} {"train_loss": -6.0789265632629395, "global_step": 88178, "epoch": 2099} {"train_loss": -6.15338659286499, "global_step": 88179, "epoch": 2099} {"train_loss": -6.1897873878479, "global_step": 88180, "epoch": 2099} {"train_loss": -6.218027114868164, "global_step": 88181, "epoch": 2099} {"train_loss": -6.279635906219482, "global_step": 88182, "epoch": 2099} {"train_loss": -6.203399181365967, "global_step": 88183, "epoch": 2099} {"train_loss": -6.269969463348389, "global_step": 88184, "epoch": 2099} {"train_loss": -6.175496578216553, "global_step": 88185, "epoch": 2099} {"train_loss": -6.250710487365723, "global_step": 88186, "epoch": 2099} {"train_loss": -6.153708457946777, "global_step": 88187, "epoch": 2099} {"train_loss": -6.238746166229248, "global_step": 88188, "epoch": 2099} {"train_loss": -6.177548408508301, "global_step": 88189, "epoch": 2099} {"train_loss": -6.157506465911865, "global_step": 88190, "epoch": 2099} {"train_loss": -6.137871742248535, "global_step": 88191, "epoch": 2099} {"train_loss": -6.17332649230957, "global_step": 88192, "epoch": 2099} {"train_loss": -6.294457912445068, "global_step": 88193, "epoch": 2099} {"train_loss": -6.097596168518066, "global_step": 88194, "epoch": 2099} {"train_loss": -6.216127395629883, "global_step": 88195, "epoch": 2099} {"train_loss": -6.1181640625, "global_step": 88196, "epoch": 2099} {"train_loss": -6.2237958908081055, "global_step": 88197, "epoch": 2099} {"train_loss": -6.148988723754883, "global_step": 88198, "epoch": 2099} {"train_loss": -6.182691528683617, "global_step": 88199, "epoch": 2099, "val_loss": 67998.921875} {"train_loss": -6.147207260131836, "global_step": 88200, "epoch": 2100} {"train_loss": -6.05242919921875, "global_step": 88201, "epoch": 2100} {"train_loss": -6.2558274269104, "global_step": 88202, "epoch": 2100} {"train_loss": -6.1262922286987305, "global_step": 88203, "epoch": 2100} {"train_loss": -6.161370277404785, "global_step": 88204, "epoch": 2100} {"train_loss": -6.159128189086914, "global_step": 88205, "epoch": 2100} {"train_loss": -5.955862998962402, "global_step": 88206, "epoch": 2100} {"train_loss": -6.1697564125061035, "global_step": 88207, "epoch": 2100} {"train_loss": -5.994932174682617, "global_step": 88208, "epoch": 2100} {"train_loss": -6.124825954437256, "global_step": 88209, "epoch": 2100} {"train_loss": -6.10264778137207, "global_step": 88210, "epoch": 2100} {"train_loss": -6.23628044128418, "global_step": 88211, "epoch": 2100} {"train_loss": -6.032048225402832, "global_step": 88212, "epoch": 2100} {"train_loss": -6.090930938720703, "global_step": 88213, "epoch": 2100} {"train_loss": -6.068685531616211, "global_step": 88214, "epoch": 2100} {"train_loss": -6.104305744171143, "global_step": 88215, "epoch": 2100} {"train_loss": -6.147817134857178, "global_step": 88216, "epoch": 2100} {"train_loss": -6.284205436706543, "global_step": 88217, "epoch": 2100} {"train_loss": -6.122443199157715, "global_step": 88218, "epoch": 2100} {"train_loss": -6.140677452087402, "global_step": 88219, "epoch": 2100} {"train_loss": -6.0800700187683105, "global_step": 88220, "epoch": 2100} {"train_loss": -6.200051784515381, "global_step": 88221, "epoch": 2100} {"train_loss": -6.188972473144531, "global_step": 88222, "epoch": 2100} {"train_loss": -6.147862911224365, "global_step": 88223, "epoch": 2100} {"train_loss": -6.098494052886963, "global_step": 88224, "epoch": 2100} {"train_loss": -6.158493995666504, "global_step": 88225, "epoch": 2100} {"train_loss": -6.287839412689209, "global_step": 88226, "epoch": 2100} {"train_loss": -6.173043251037598, "global_step": 88227, "epoch": 2100} {"train_loss": -6.274366855621338, "global_step": 88228, "epoch": 2100} {"train_loss": -6.156133651733398, "global_step": 88229, "epoch": 2100} {"train_loss": -6.022101402282715, "global_step": 88230, "epoch": 2100} {"train_loss": -6.115457534790039, "global_step": 88231, "epoch": 2100} {"train_loss": -6.060678005218506, "global_step": 88232, "epoch": 2100} {"train_loss": -6.1382646560668945, "global_step": 88233, "epoch": 2100} {"train_loss": -6.253217697143555, "global_step": 88234, "epoch": 2100} {"train_loss": -6.107507705688477, "global_step": 88235, "epoch": 2100} {"train_loss": -6.130031108856201, "global_step": 88236, "epoch": 2100} {"train_loss": -6.066117763519287, "global_step": 88237, "epoch": 2100} {"train_loss": -6.25340461730957, "global_step": 88238, "epoch": 2100} {"train_loss": -6.190230369567871, "global_step": 88239, "epoch": 2100} {"train_loss": -6.16270637512207, "global_step": 88240, "epoch": 2100} {"train_loss": -6.1423046588897705, "global_step": 88241, "epoch": 2100, "train/sim_max_reward_0": 0.20610298939402247, "train/sim_max_reward_1": 0.9481611715706895, "train/sim_max_reward_2": 0.36805628382575806, "train/sim_max_reward_3": 0.8166126436951071, "train/sim_max_reward_4": 0.7136792777240818, "train/sim_max_reward_5": 0.9504136951653154, "test/sim_max_reward_4400000": 0.2101444099110012, "test/sim_max_reward_4400001": 0.8845134245471008, "test/sim_max_reward_4400002": 0.8234452118881331, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.5192831366065537, "test/sim_max_reward_4400006": 0.8471712131413037, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30735999140016645, "test/sim_max_reward_4400009": 0.9444732464473742, "test/sim_max_reward_4400010": 0.2424387013467612, "test/sim_max_reward_4400011": 0.20760070631947009, "test/sim_max_reward_4400012": 0.8953852380244124, "test/sim_max_reward_4400013": 0.9305857098845176, "test/sim_max_reward_4400014": 0.8349966104556336, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.07516996425106819, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23214686248729355, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.7771648789722062, "test/sim_max_reward_4400022": 0.8665212450239347, "test/sim_max_reward_4400023": 0.15849608346051694, "test/sim_max_reward_4400024": 0.7468312506867185, "test/sim_max_reward_4400025": 0.26045099883478695, "test/sim_max_reward_4400026": 0.9327642645655936, "test/sim_max_reward_4400027": 0.015619124344762949, "test/sim_max_reward_4400028": 0.3994577368765495, "test/sim_max_reward_4400029": 0.40925375479591797, "test/sim_max_reward_4400030": 0.8829830562951063, "test/sim_max_reward_4400031": 0.7952452918924372, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3054097385752237, "test/sim_max_reward_4400034": 0.9710646243900495, "test/sim_max_reward_4400035": 0.39603236710522166, "test/sim_max_reward_4400036": 0.972039540883324, "test/sim_max_reward_4400037": 0.629047897035387, "test/sim_max_reward_4400038": 0.28914691482498134, "test/sim_max_reward_4400039": 0.866284213124013, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6042476756212094, "test/sim_max_reward_4400042": 0.9529030764024343, "test/sim_max_reward_4400043": 0.9120326358147774, "test/sim_max_reward_4400044": 0.6828058829408206, "test/sim_max_reward_4400045": 0.946243604124065, "test/sim_max_reward_4400046": 0.6261977159331922, "test/sim_max_reward_4400047": 0.939184328389732, "test/sim_max_reward_4400048": 0.97566636631315, "test/sim_max_reward_4400049": 0.8066745963090989, "train/mean_score": 0.6671710102291625, "test/mean_score": 0.5249168274214502, "val_loss": 68000.6171875} {"train_loss": -6.305828094482422, "global_step": 88242, "epoch": 2101} {"train_loss": -6.282207012176514, "global_step": 88243, "epoch": 2101} {"train_loss": -6.151494979858398, "global_step": 88244, "epoch": 2101} {"train_loss": -6.243001937866211, "global_step": 88245, "epoch": 2101} {"train_loss": -6.230461597442627, "global_step": 88246, "epoch": 2101} {"train_loss": -6.143773078918457, "global_step": 88247, "epoch": 2101} {"train_loss": -6.3727521896362305, "global_step": 88248, "epoch": 2101} {"train_loss": -6.270594596862793, "global_step": 88249, "epoch": 2101} {"train_loss": -6.399703502655029, "global_step": 88250, "epoch": 2101} {"train_loss": -6.207578182220459, "global_step": 88251, "epoch": 2101} {"train_loss": -6.282963752746582, "global_step": 88252, "epoch": 2101} {"train_loss": -6.201150894165039, "global_step": 88253, "epoch": 2101} {"train_loss": -6.25731086730957, "global_step": 88254, "epoch": 2101} {"train_loss": -6.294397830963135, "global_step": 88255, "epoch": 2101} {"train_loss": -6.279460906982422, "global_step": 88256, "epoch": 2101} {"train_loss": -6.263885974884033, "global_step": 88257, "epoch": 2101} {"train_loss": -6.266458511352539, "global_step": 88258, "epoch": 2101} {"train_loss": -6.005296230316162, "global_step": 88259, "epoch": 2101} {"train_loss": -6.230254173278809, "global_step": 88260, "epoch": 2101} {"train_loss": -6.075222969055176, "global_step": 88261, "epoch": 2101} {"train_loss": -6.152061462402344, "global_step": 88262, "epoch": 2101} {"train_loss": -6.2101311683654785, "global_step": 88263, "epoch": 2101} {"train_loss": -6.150373458862305, "global_step": 88264, "epoch": 2101} {"train_loss": -6.172183990478516, "global_step": 88265, "epoch": 2101} {"train_loss": -6.241792678833008, "global_step": 88266, "epoch": 2101} {"train_loss": -6.258680820465088, "global_step": 88267, "epoch": 2101} {"train_loss": -6.081396102905273, "global_step": 88268, "epoch": 2101} {"train_loss": -6.288839340209961, "global_step": 88269, "epoch": 2101} {"train_loss": -6.189648628234863, "global_step": 88270, "epoch": 2101} {"train_loss": -6.261366367340088, "global_step": 88271, "epoch": 2101} {"train_loss": -6.209544658660889, "global_step": 88272, "epoch": 2101} {"train_loss": -6.193815231323242, "global_step": 88273, "epoch": 2101} {"train_loss": -6.260860919952393, "global_step": 88274, "epoch": 2101} {"train_loss": -6.107780456542969, "global_step": 88275, "epoch": 2101} {"train_loss": -6.207422256469727, "global_step": 88276, "epoch": 2101} {"train_loss": -6.089512348175049, "global_step": 88277, "epoch": 2101} {"train_loss": -6.2252607345581055, "global_step": 88278, "epoch": 2101} {"train_loss": -6.2904863357543945, "global_step": 88279, "epoch": 2101} {"train_loss": -6.141253471374512, "global_step": 88280, "epoch": 2101} {"train_loss": -6.215156555175781, "global_step": 88281, "epoch": 2101} {"train_loss": -6.175192832946777, "global_step": 88282, "epoch": 2101} {"train_loss": -6.2116168567112515, "global_step": 88283, "epoch": 2101, "val_loss": 67872.171875} {"train_loss": -6.198947906494141, "global_step": 88284, "epoch": 2102} {"train_loss": -6.079361915588379, "global_step": 88285, "epoch": 2102} {"train_loss": -6.1981353759765625, "global_step": 88286, "epoch": 2102} {"train_loss": -6.179337501525879, "global_step": 88287, "epoch": 2102} {"train_loss": -6.183855056762695, "global_step": 88288, "epoch": 2102} {"train_loss": -6.131497859954834, "global_step": 88289, "epoch": 2102} {"train_loss": -6.127407073974609, "global_step": 88290, "epoch": 2102} {"train_loss": -6.251883506774902, "global_step": 88291, "epoch": 2102} {"train_loss": -6.2179951667785645, "global_step": 88292, "epoch": 2102} {"train_loss": -6.328301429748535, "global_step": 88293, "epoch": 2102} {"train_loss": -6.285648822784424, "global_step": 88294, "epoch": 2102} {"train_loss": -6.211667537689209, "global_step": 88295, "epoch": 2102} {"train_loss": -6.260074615478516, "global_step": 88296, "epoch": 2102} {"train_loss": -6.311741828918457, "global_step": 88297, "epoch": 2102} {"train_loss": -6.206735610961914, "global_step": 88298, "epoch": 2102} {"train_loss": -6.21159553527832, "global_step": 88299, "epoch": 2102} {"train_loss": -6.27345085144043, "global_step": 88300, "epoch": 2102} {"train_loss": -6.207254409790039, "global_step": 88301, "epoch": 2102} {"train_loss": -6.232641220092773, "global_step": 88302, "epoch": 2102} {"train_loss": -6.261667728424072, "global_step": 88303, "epoch": 2102} {"train_loss": -6.273679733276367, "global_step": 88304, "epoch": 2102} {"train_loss": -6.207080364227295, "global_step": 88305, "epoch": 2102} {"train_loss": -6.2806549072265625, "global_step": 88306, "epoch": 2102} {"train_loss": -6.117924690246582, "global_step": 88307, "epoch": 2102} {"train_loss": -6.084927558898926, "global_step": 88308, "epoch": 2102} {"train_loss": -6.171482086181641, "global_step": 88309, "epoch": 2102} {"train_loss": -6.284976959228516, "global_step": 88310, "epoch": 2102} {"train_loss": -6.173926830291748, "global_step": 88311, "epoch": 2102} {"train_loss": -6.220255374908447, "global_step": 88312, "epoch": 2102} {"train_loss": -6.129434585571289, "global_step": 88313, "epoch": 2102} {"train_loss": -6.2885284423828125, "global_step": 88314, "epoch": 2102} {"train_loss": -6.348503112792969, "global_step": 88315, "epoch": 2102} {"train_loss": -6.291433334350586, "global_step": 88316, "epoch": 2102} {"train_loss": -6.206586837768555, "global_step": 88317, "epoch": 2102} {"train_loss": -6.296782970428467, "global_step": 88318, "epoch": 2102} {"train_loss": -6.161731719970703, "global_step": 88319, "epoch": 2102} {"train_loss": -6.176332950592041, "global_step": 88320, "epoch": 2102} {"train_loss": -6.168265342712402, "global_step": 88321, "epoch": 2102} {"train_loss": -6.24645471572876, "global_step": 88322, "epoch": 2102} {"train_loss": -6.232067108154297, "global_step": 88323, "epoch": 2102} {"train_loss": -6.178049564361572, "global_step": 88324, "epoch": 2102} {"train_loss": -6.216704550243559, "global_step": 88325, "epoch": 2102, "val_loss": 67805.7890625} {"train_loss": -6.164880275726318, "global_step": 88326, "epoch": 2103} {"train_loss": -6.229254722595215, "global_step": 88327, "epoch": 2103} {"train_loss": -6.230337142944336, "global_step": 88328, "epoch": 2103} {"train_loss": -6.2211737632751465, "global_step": 88329, "epoch": 2103} {"train_loss": -6.261935234069824, "global_step": 88330, "epoch": 2103} {"train_loss": -6.353869438171387, "global_step": 88331, "epoch": 2103} {"train_loss": -6.228397369384766, "global_step": 88332, "epoch": 2103} {"train_loss": -6.173222541809082, "global_step": 88333, "epoch": 2103} {"train_loss": -6.289186477661133, "global_step": 88334, "epoch": 2103} {"train_loss": -6.283655166625977, "global_step": 88335, "epoch": 2103} {"train_loss": -6.171290874481201, "global_step": 88336, "epoch": 2103} {"train_loss": -6.250515937805176, "global_step": 88337, "epoch": 2103} {"train_loss": -6.31416130065918, "global_step": 88338, "epoch": 2103} {"train_loss": -6.247690200805664, "global_step": 88339, "epoch": 2103} {"train_loss": -6.1061201095581055, "global_step": 88340, "epoch": 2103} {"train_loss": -6.376979827880859, "global_step": 88341, "epoch": 2103} {"train_loss": -6.342103958129883, "global_step": 88342, "epoch": 2103} {"train_loss": -6.344836235046387, "global_step": 88343, "epoch": 2103} {"train_loss": -6.216374397277832, "global_step": 88344, "epoch": 2103} {"train_loss": -6.246098518371582, "global_step": 88345, "epoch": 2103} {"train_loss": -6.265569686889648, "global_step": 88346, "epoch": 2103} {"train_loss": -6.1827874183654785, "global_step": 88347, "epoch": 2103} {"train_loss": -6.217896461486816, "global_step": 88348, "epoch": 2103} {"train_loss": -6.179104804992676, "global_step": 88349, "epoch": 2103} {"train_loss": -6.204948902130127, "global_step": 88350, "epoch": 2103} {"train_loss": -6.30360746383667, "global_step": 88351, "epoch": 2103} {"train_loss": -6.246766090393066, "global_step": 88352, "epoch": 2103} {"train_loss": -6.047893524169922, "global_step": 88353, "epoch": 2103} {"train_loss": -6.230083465576172, "global_step": 88354, "epoch": 2103} {"train_loss": -6.242576599121094, "global_step": 88355, "epoch": 2103} {"train_loss": -6.26716947555542, "global_step": 88356, "epoch": 2103} {"train_loss": -6.17794132232666, "global_step": 88357, "epoch": 2103} {"train_loss": -6.105642318725586, "global_step": 88358, "epoch": 2103} {"train_loss": -6.261034965515137, "global_step": 88359, "epoch": 2103} {"train_loss": -6.32002067565918, "global_step": 88360, "epoch": 2103} {"train_loss": -6.25835657119751, "global_step": 88361, "epoch": 2103} {"train_loss": -6.149971008300781, "global_step": 88362, "epoch": 2103} {"train_loss": -6.259363174438477, "global_step": 88363, "epoch": 2103} {"train_loss": -6.248574733734131, "global_step": 88364, "epoch": 2103} {"train_loss": -6.298365592956543, "global_step": 88365, "epoch": 2103} {"train_loss": -6.216007232666016, "global_step": 88366, "epoch": 2103} {"train_loss": -6.236672526314145, "global_step": 88367, "epoch": 2103, "val_loss": 67953.765625} {"train_loss": -6.2215189933776855, "global_step": 88368, "epoch": 2104} {"train_loss": -6.382328987121582, "global_step": 88369, "epoch": 2104} {"train_loss": -6.302736282348633, "global_step": 88370, "epoch": 2104} {"train_loss": -6.136258602142334, "global_step": 88371, "epoch": 2104} {"train_loss": -6.177371978759766, "global_step": 88372, "epoch": 2104} {"train_loss": -6.187988758087158, "global_step": 88373, "epoch": 2104} {"train_loss": -6.290008068084717, "global_step": 88374, "epoch": 2104} {"train_loss": -6.402369022369385, "global_step": 88375, "epoch": 2104} {"train_loss": -6.206037521362305, "global_step": 88376, "epoch": 2104} {"train_loss": -6.242792129516602, "global_step": 88377, "epoch": 2104} {"train_loss": -6.142806529998779, "global_step": 88378, "epoch": 2104} {"train_loss": -6.319070816040039, "global_step": 88379, "epoch": 2104} {"train_loss": -6.165370941162109, "global_step": 88380, "epoch": 2104} {"train_loss": -6.360699653625488, "global_step": 88381, "epoch": 2104} {"train_loss": -6.230627059936523, "global_step": 88382, "epoch": 2104} {"train_loss": -6.289936065673828, "global_step": 88383, "epoch": 2104} {"train_loss": -6.3346757888793945, "global_step": 88384, "epoch": 2104} {"train_loss": -6.272162437438965, "global_step": 88385, "epoch": 2104} {"train_loss": -6.237491130828857, "global_step": 88386, "epoch": 2104} {"train_loss": -6.243664741516113, "global_step": 88387, "epoch": 2104} {"train_loss": -6.1681623458862305, "global_step": 88388, "epoch": 2104} {"train_loss": -6.3352203369140625, "global_step": 88389, "epoch": 2104} {"train_loss": -6.227878570556641, "global_step": 88390, "epoch": 2104} {"train_loss": -6.210999965667725, "global_step": 88391, "epoch": 2104} {"train_loss": -6.1825737953186035, "global_step": 88392, "epoch": 2104} {"train_loss": -6.253182411193848, "global_step": 88393, "epoch": 2104} {"train_loss": -6.2804341316223145, "global_step": 88394, "epoch": 2104} {"train_loss": -6.324042320251465, "global_step": 88395, "epoch": 2104} {"train_loss": -6.245131015777588, "global_step": 88396, "epoch": 2104} {"train_loss": -6.311962127685547, "global_step": 88397, "epoch": 2104} {"train_loss": -6.305793762207031, "global_step": 88398, "epoch": 2104} {"train_loss": -6.238208293914795, "global_step": 88399, "epoch": 2104} {"train_loss": -6.2520036697387695, "global_step": 88400, "epoch": 2104} {"train_loss": -6.244867324829102, "global_step": 88401, "epoch": 2104} {"train_loss": -6.177873611450195, "global_step": 88402, "epoch": 2104} {"train_loss": -6.195586204528809, "global_step": 88403, "epoch": 2104} {"train_loss": -6.146928787231445, "global_step": 88404, "epoch": 2104} {"train_loss": -6.150177955627441, "global_step": 88405, "epoch": 2104} {"train_loss": -6.070247173309326, "global_step": 88406, "epoch": 2104} {"train_loss": -6.138975143432617, "global_step": 88407, "epoch": 2104} {"train_loss": -6.305643081665039, "global_step": 88408, "epoch": 2104} {"train_loss": -6.237656252724784, "global_step": 88409, "epoch": 2104, "val_loss": 68241.4609375} {"train_loss": -6.111745834350586, "global_step": 88410, "epoch": 2105} {"train_loss": -6.269599914550781, "global_step": 88411, "epoch": 2105} {"train_loss": -6.272922515869141, "global_step": 88412, "epoch": 2105} {"train_loss": -6.106658935546875, "global_step": 88413, "epoch": 2105} {"train_loss": -6.194761276245117, "global_step": 88414, "epoch": 2105} {"train_loss": -6.095852851867676, "global_step": 88415, "epoch": 2105} {"train_loss": -6.107168197631836, "global_step": 88416, "epoch": 2105} {"train_loss": -6.114106178283691, "global_step": 88417, "epoch": 2105} {"train_loss": -6.208441257476807, "global_step": 88418, "epoch": 2105} {"train_loss": -6.1856689453125, "global_step": 88419, "epoch": 2105} {"train_loss": -6.169189453125, "global_step": 88420, "epoch": 2105} {"train_loss": -6.219221115112305, "global_step": 88421, "epoch": 2105} {"train_loss": -6.239830493927002, "global_step": 88422, "epoch": 2105} {"train_loss": -6.235915184020996, "global_step": 88423, "epoch": 2105} {"train_loss": -6.228558540344238, "global_step": 88424, "epoch": 2105} {"train_loss": -6.226629257202148, "global_step": 88425, "epoch": 2105} {"train_loss": -6.27166748046875, "global_step": 88426, "epoch": 2105} {"train_loss": -6.182987213134766, "global_step": 88427, "epoch": 2105} {"train_loss": -6.2395548820495605, "global_step": 88428, "epoch": 2105} {"train_loss": -6.2076287269592285, "global_step": 88429, "epoch": 2105} {"train_loss": -6.146358013153076, "global_step": 88430, "epoch": 2105} {"train_loss": -6.214962005615234, "global_step": 88431, "epoch": 2105} {"train_loss": -6.266039848327637, "global_step": 88432, "epoch": 2105} {"train_loss": -6.170899391174316, "global_step": 88433, "epoch": 2105} {"train_loss": -6.2928290367126465, "global_step": 88434, "epoch": 2105} {"train_loss": -6.2416887283325195, "global_step": 88435, "epoch": 2105} {"train_loss": -6.2000322341918945, "global_step": 88436, "epoch": 2105} {"train_loss": -6.148242950439453, "global_step": 88437, "epoch": 2105} {"train_loss": -6.234338760375977, "global_step": 88438, "epoch": 2105} {"train_loss": -6.070396900177002, "global_step": 88439, "epoch": 2105} {"train_loss": -6.335041522979736, "global_step": 88440, "epoch": 2105} {"train_loss": -6.22728157043457, "global_step": 88441, "epoch": 2105} {"train_loss": -6.342179775238037, "global_step": 88442, "epoch": 2105} {"train_loss": -6.175155162811279, "global_step": 88443, "epoch": 2105} {"train_loss": -6.240901947021484, "global_step": 88444, "epoch": 2105} {"train_loss": -6.065560340881348, "global_step": 88445, "epoch": 2105} {"train_loss": -6.136979103088379, "global_step": 88446, "epoch": 2105} {"train_loss": -6.082147598266602, "global_step": 88447, "epoch": 2105} {"train_loss": -6.312013626098633, "global_step": 88448, "epoch": 2105} {"train_loss": -6.303989410400391, "global_step": 88449, "epoch": 2105} {"train_loss": -6.218697547912598, "global_step": 88450, "epoch": 2105} {"train_loss": -6.203934283483596, "global_step": 88451, "epoch": 2105, "val_loss": 68134.921875} {"train_loss": -6.1775102615356445, "global_step": 88452, "epoch": 2106} {"train_loss": -6.237878799438477, "global_step": 88453, "epoch": 2106} {"train_loss": -6.2487945556640625, "global_step": 88454, "epoch": 2106} {"train_loss": -6.043207168579102, "global_step": 88455, "epoch": 2106} {"train_loss": -6.186577796936035, "global_step": 88456, "epoch": 2106} {"train_loss": -6.206958293914795, "global_step": 88457, "epoch": 2106} {"train_loss": -6.1637163162231445, "global_step": 88458, "epoch": 2106} {"train_loss": -6.169366359710693, "global_step": 88459, "epoch": 2106} {"train_loss": -6.2454705238342285, "global_step": 88460, "epoch": 2106} {"train_loss": -6.1900248527526855, "global_step": 88461, "epoch": 2106} {"train_loss": -6.221146583557129, "global_step": 88462, "epoch": 2106} {"train_loss": -6.23642110824585, "global_step": 88463, "epoch": 2106} {"train_loss": -6.2148823738098145, "global_step": 88464, "epoch": 2106} {"train_loss": -6.241475582122803, "global_step": 88465, "epoch": 2106} {"train_loss": -6.222893714904785, "global_step": 88466, "epoch": 2106} {"train_loss": -6.264128684997559, "global_step": 88467, "epoch": 2106} {"train_loss": -6.0986104011535645, "global_step": 88468, "epoch": 2106} {"train_loss": -6.196816921234131, "global_step": 88469, "epoch": 2106} {"train_loss": -6.327212333679199, "global_step": 88470, "epoch": 2106} {"train_loss": -6.169122695922852, "global_step": 88471, "epoch": 2106} {"train_loss": -6.126956939697266, "global_step": 88472, "epoch": 2106} {"train_loss": -6.213494300842285, "global_step": 88473, "epoch": 2106} {"train_loss": -6.256263732910156, "global_step": 88474, "epoch": 2106} {"train_loss": -6.26621150970459, "global_step": 88475, "epoch": 2106} {"train_loss": -6.1708526611328125, "global_step": 88476, "epoch": 2106} {"train_loss": -6.160233497619629, "global_step": 88477, "epoch": 2106} {"train_loss": -6.235405921936035, "global_step": 88478, "epoch": 2106} {"train_loss": -6.140381813049316, "global_step": 88479, "epoch": 2106} {"train_loss": -6.37239933013916, "global_step": 88480, "epoch": 2106} {"train_loss": -6.196864128112793, "global_step": 88481, "epoch": 2106} {"train_loss": -6.09459924697876, "global_step": 88482, "epoch": 2106} {"train_loss": -6.2516961097717285, "global_step": 88483, "epoch": 2106} {"train_loss": -6.233562469482422, "global_step": 88484, "epoch": 2106} {"train_loss": -6.3749189376831055, "global_step": 88485, "epoch": 2106} {"train_loss": -6.091886043548584, "global_step": 88486, "epoch": 2106} {"train_loss": -6.335677146911621, "global_step": 88487, "epoch": 2106} {"train_loss": -6.203334808349609, "global_step": 88488, "epoch": 2106} {"train_loss": -6.306266784667969, "global_step": 88489, "epoch": 2106} {"train_loss": -5.962813377380371, "global_step": 88490, "epoch": 2106} {"train_loss": -6.266217231750488, "global_step": 88491, "epoch": 2106} {"train_loss": -6.137857437133789, "global_step": 88492, "epoch": 2106} {"train_loss": -6.207397256578718, "global_step": 88493, "epoch": 2106, "val_loss": 67703.6640625} {"train_loss": -6.243781089782715, "global_step": 88494, "epoch": 2107} {"train_loss": -6.205310344696045, "global_step": 88495, "epoch": 2107} {"train_loss": -6.256315231323242, "global_step": 88496, "epoch": 2107} {"train_loss": -6.171838760375977, "global_step": 88497, "epoch": 2107} {"train_loss": -6.138709545135498, "global_step": 88498, "epoch": 2107} {"train_loss": -6.168548583984375, "global_step": 88499, "epoch": 2107} {"train_loss": -6.1152801513671875, "global_step": 88500, "epoch": 2107} {"train_loss": -6.094864845275879, "global_step": 88501, "epoch": 2107} {"train_loss": -6.225423336029053, "global_step": 88502, "epoch": 2107} {"train_loss": -6.006028175354004, "global_step": 88503, "epoch": 2107} {"train_loss": -6.200040817260742, "global_step": 88504, "epoch": 2107} {"train_loss": -6.16302490234375, "global_step": 88505, "epoch": 2107} {"train_loss": -6.083442211151123, "global_step": 88506, "epoch": 2107} {"train_loss": -6.055178642272949, "global_step": 88507, "epoch": 2107} {"train_loss": -6.200582981109619, "global_step": 88508, "epoch": 2107} {"train_loss": -6.227851390838623, "global_step": 88509, "epoch": 2107} {"train_loss": -6.2490386962890625, "global_step": 88510, "epoch": 2107} {"train_loss": -6.199484348297119, "global_step": 88511, "epoch": 2107} {"train_loss": -6.239715576171875, "global_step": 88512, "epoch": 2107} {"train_loss": -6.132333755493164, "global_step": 88513, "epoch": 2107} {"train_loss": -6.309885501861572, "global_step": 88514, "epoch": 2107} {"train_loss": -6.182966232299805, "global_step": 88515, "epoch": 2107} {"train_loss": -6.3317742347717285, "global_step": 88516, "epoch": 2107} {"train_loss": -6.351204872131348, "global_step": 88517, "epoch": 2107} {"train_loss": -6.17054557800293, "global_step": 88518, "epoch": 2107} {"train_loss": -6.156764507293701, "global_step": 88519, "epoch": 2107} {"train_loss": -6.170170307159424, "global_step": 88520, "epoch": 2107} {"train_loss": -6.256097316741943, "global_step": 88521, "epoch": 2107} {"train_loss": -6.242769241333008, "global_step": 88522, "epoch": 2107} {"train_loss": -6.251623630523682, "global_step": 88523, "epoch": 2107} {"train_loss": -6.283909797668457, "global_step": 88524, "epoch": 2107} {"train_loss": -6.298688888549805, "global_step": 88525, "epoch": 2107} {"train_loss": -6.1812744140625, "global_step": 88526, "epoch": 2107} {"train_loss": -6.296299934387207, "global_step": 88527, "epoch": 2107} {"train_loss": -6.165214538574219, "global_step": 88528, "epoch": 2107} {"train_loss": -6.224496841430664, "global_step": 88529, "epoch": 2107} {"train_loss": -6.1485276222229, "global_step": 88530, "epoch": 2107} {"train_loss": -6.111377239227295, "global_step": 88531, "epoch": 2107} {"train_loss": -6.1136932373046875, "global_step": 88532, "epoch": 2107} {"train_loss": -6.207834243774414, "global_step": 88533, "epoch": 2107} {"train_loss": -6.1352033615112305, "global_step": 88534, "epoch": 2107} {"train_loss": -6.195303496860323, "global_step": 88535, "epoch": 2107, "val_loss": 67863.09375} {"train_loss": -6.176486968994141, "global_step": 88536, "epoch": 2108} {"train_loss": -6.159519672393799, "global_step": 88537, "epoch": 2108} {"train_loss": -6.161789417266846, "global_step": 88538, "epoch": 2108} {"train_loss": -6.101217746734619, "global_step": 88539, "epoch": 2108} {"train_loss": -6.19896936416626, "global_step": 88540, "epoch": 2108} {"train_loss": -6.1743574142456055, "global_step": 88541, "epoch": 2108} {"train_loss": -6.239270210266113, "global_step": 88542, "epoch": 2108} {"train_loss": -6.196874618530273, "global_step": 88543, "epoch": 2108} {"train_loss": -6.155920028686523, "global_step": 88544, "epoch": 2108} {"train_loss": -6.226421356201172, "global_step": 88545, "epoch": 2108} {"train_loss": -6.173704147338867, "global_step": 88546, "epoch": 2108} {"train_loss": -6.259246349334717, "global_step": 88547, "epoch": 2108} {"train_loss": -6.059605121612549, "global_step": 88548, "epoch": 2108} {"train_loss": -6.050813674926758, "global_step": 88549, "epoch": 2108} {"train_loss": -6.174215316772461, "global_step": 88550, "epoch": 2108} {"train_loss": -6.120695114135742, "global_step": 88551, "epoch": 2108} {"train_loss": -6.218599319458008, "global_step": 88552, "epoch": 2108} {"train_loss": -6.219639301300049, "global_step": 88553, "epoch": 2108} {"train_loss": -6.272662162780762, "global_step": 88554, "epoch": 2108} {"train_loss": -6.2716898918151855, "global_step": 88555, "epoch": 2108} {"train_loss": -6.230564117431641, "global_step": 88556, "epoch": 2108} {"train_loss": -6.201530456542969, "global_step": 88557, "epoch": 2108} {"train_loss": -6.225992679595947, "global_step": 88558, "epoch": 2108} {"train_loss": -6.356886863708496, "global_step": 88559, "epoch": 2108} {"train_loss": -6.236720085144043, "global_step": 88560, "epoch": 2108} {"train_loss": -6.2176408767700195, "global_step": 88561, "epoch": 2108} {"train_loss": -6.234503746032715, "global_step": 88562, "epoch": 2108} {"train_loss": -6.322731018066406, "global_step": 88563, "epoch": 2108} {"train_loss": -6.232089042663574, "global_step": 88564, "epoch": 2108} {"train_loss": -6.21498966217041, "global_step": 88565, "epoch": 2108} {"train_loss": -6.164048194885254, "global_step": 88566, "epoch": 2108} {"train_loss": -6.318453311920166, "global_step": 88567, "epoch": 2108} {"train_loss": -6.306833267211914, "global_step": 88568, "epoch": 2108} {"train_loss": -6.208678245544434, "global_step": 88569, "epoch": 2108} {"train_loss": -6.239512920379639, "global_step": 88570, "epoch": 2108} {"train_loss": -6.219420433044434, "global_step": 88571, "epoch": 2108} {"train_loss": -6.261717319488525, "global_step": 88572, "epoch": 2108} {"train_loss": -6.27077579498291, "global_step": 88573, "epoch": 2108} {"train_loss": -6.176149368286133, "global_step": 88574, "epoch": 2108} {"train_loss": -6.1030497550964355, "global_step": 88575, "epoch": 2108} {"train_loss": -6.229349136352539, "global_step": 88576, "epoch": 2108} {"train_loss": -6.2133405322120305, "global_step": 88577, "epoch": 2108, "val_loss": 67725.421875} {"train_loss": -6.276257038116455, "global_step": 88578, "epoch": 2109} {"train_loss": -6.2785210609436035, "global_step": 88579, "epoch": 2109} {"train_loss": -6.274858474731445, "global_step": 88580, "epoch": 2109} {"train_loss": -6.173511505126953, "global_step": 88581, "epoch": 2109} {"train_loss": -6.281388282775879, "global_step": 88582, "epoch": 2109} {"train_loss": -6.24787712097168, "global_step": 88583, "epoch": 2109} {"train_loss": -6.401344299316406, "global_step": 88584, "epoch": 2109} {"train_loss": -6.257780075073242, "global_step": 88585, "epoch": 2109} {"train_loss": -6.203175067901611, "global_step": 88586, "epoch": 2109} {"train_loss": -6.271966934204102, "global_step": 88587, "epoch": 2109} {"train_loss": -6.256680488586426, "global_step": 88588, "epoch": 2109} {"train_loss": -6.250720024108887, "global_step": 88589, "epoch": 2109} {"train_loss": -6.368023872375488, "global_step": 88590, "epoch": 2109} {"train_loss": -6.231451034545898, "global_step": 88591, "epoch": 2109} {"train_loss": -6.2961626052856445, "global_step": 88592, "epoch": 2109} {"train_loss": -6.234627723693848, "global_step": 88593, "epoch": 2109} {"train_loss": -6.33128547668457, "global_step": 88594, "epoch": 2109} {"train_loss": -6.306832313537598, "global_step": 88595, "epoch": 2109} {"train_loss": -6.252834796905518, "global_step": 88596, "epoch": 2109} {"train_loss": -6.225298881530762, "global_step": 88597, "epoch": 2109} {"train_loss": -6.25345516204834, "global_step": 88598, "epoch": 2109} {"train_loss": -6.115182399749756, "global_step": 88599, "epoch": 2109} {"train_loss": -6.258296966552734, "global_step": 88600, "epoch": 2109} {"train_loss": -6.250726699829102, "global_step": 88601, "epoch": 2109} {"train_loss": -6.336336135864258, "global_step": 88602, "epoch": 2109} {"train_loss": -6.203198432922363, "global_step": 88603, "epoch": 2109} {"train_loss": -6.213338851928711, "global_step": 88604, "epoch": 2109} {"train_loss": -6.1706223487854, "global_step": 88605, "epoch": 2109} {"train_loss": -6.113478660583496, "global_step": 88606, "epoch": 2109} {"train_loss": -6.274957656860352, "global_step": 88607, "epoch": 2109} {"train_loss": -6.171491622924805, "global_step": 88608, "epoch": 2109} {"train_loss": -6.148922920227051, "global_step": 88609, "epoch": 2109} {"train_loss": -6.2444024085998535, "global_step": 88610, "epoch": 2109} {"train_loss": -6.139823913574219, "global_step": 88611, "epoch": 2109} {"train_loss": -6.340686798095703, "global_step": 88612, "epoch": 2109} {"train_loss": -6.177690505981445, "global_step": 88613, "epoch": 2109} {"train_loss": -6.167302131652832, "global_step": 88614, "epoch": 2109} {"train_loss": -6.190582275390625, "global_step": 88615, "epoch": 2109} {"train_loss": -6.271554946899414, "global_step": 88616, "epoch": 2109} {"train_loss": -6.345177173614502, "global_step": 88617, "epoch": 2109} {"train_loss": -6.258544921875, "global_step": 88618, "epoch": 2109} {"train_loss": -6.244605189278012, "global_step": 88619, "epoch": 2109, "val_loss": 67828.9140625} {"train_loss": -6.301348686218262, "global_step": 88620, "epoch": 2110} {"train_loss": -6.171402931213379, "global_step": 88621, "epoch": 2110} {"train_loss": -6.138001441955566, "global_step": 88622, "epoch": 2110} {"train_loss": -6.180006980895996, "global_step": 88623, "epoch": 2110} {"train_loss": -6.241928577423096, "global_step": 88624, "epoch": 2110} {"train_loss": -6.2492828369140625, "global_step": 88625, "epoch": 2110} {"train_loss": -6.241768836975098, "global_step": 88626, "epoch": 2110} {"train_loss": -6.212626934051514, "global_step": 88627, "epoch": 2110} {"train_loss": -6.255009174346924, "global_step": 88628, "epoch": 2110} {"train_loss": -6.2089948654174805, "global_step": 88629, "epoch": 2110} {"train_loss": -6.098354339599609, "global_step": 88630, "epoch": 2110} {"train_loss": -6.139779090881348, "global_step": 88631, "epoch": 2110} {"train_loss": -6.243699073791504, "global_step": 88632, "epoch": 2110} {"train_loss": -6.196473121643066, "global_step": 88633, "epoch": 2110} {"train_loss": -6.179536819458008, "global_step": 88634, "epoch": 2110} {"train_loss": -6.072776794433594, "global_step": 88635, "epoch": 2110} {"train_loss": -6.177126884460449, "global_step": 88636, "epoch": 2110} {"train_loss": -6.313900947570801, "global_step": 88637, "epoch": 2110} {"train_loss": -6.13675594329834, "global_step": 88638, "epoch": 2110} {"train_loss": -6.233440399169922, "global_step": 88639, "epoch": 2110} {"train_loss": -6.253133773803711, "global_step": 88640, "epoch": 2110} {"train_loss": -6.242203235626221, "global_step": 88641, "epoch": 2110} {"train_loss": -6.201390266418457, "global_step": 88642, "epoch": 2110} {"train_loss": -6.2109270095825195, "global_step": 88643, "epoch": 2110} {"train_loss": -6.320285797119141, "global_step": 88644, "epoch": 2110} {"train_loss": -6.311684608459473, "global_step": 88645, "epoch": 2110} {"train_loss": -6.237834453582764, "global_step": 88646, "epoch": 2110} {"train_loss": -6.172542572021484, "global_step": 88647, "epoch": 2110} {"train_loss": -6.310776710510254, "global_step": 88648, "epoch": 2110} {"train_loss": -6.331168174743652, "global_step": 88649, "epoch": 2110} {"train_loss": -6.278641223907471, "global_step": 88650, "epoch": 2110} {"train_loss": -6.179204940795898, "global_step": 88651, "epoch": 2110} {"train_loss": -6.288304805755615, "global_step": 88652, "epoch": 2110} {"train_loss": -6.350522994995117, "global_step": 88653, "epoch": 2110} {"train_loss": -6.2081732749938965, "global_step": 88654, "epoch": 2110} {"train_loss": -6.201172351837158, "global_step": 88655, "epoch": 2110} {"train_loss": -6.1953325271606445, "global_step": 88656, "epoch": 2110} {"train_loss": -6.245396137237549, "global_step": 88657, "epoch": 2110} {"train_loss": -6.256165981292725, "global_step": 88658, "epoch": 2110} {"train_loss": -6.267075538635254, "global_step": 88659, "epoch": 2110} {"train_loss": -6.324423789978027, "global_step": 88660, "epoch": 2110} {"train_loss": -6.230107375553676, "global_step": 88661, "epoch": 2110, "val_loss": 67862.234375} {"train_loss": -6.191305160522461, "global_step": 88662, "epoch": 2111} {"train_loss": -6.297987461090088, "global_step": 88663, "epoch": 2111} {"train_loss": -6.263272285461426, "global_step": 88664, "epoch": 2111} {"train_loss": -6.234655380249023, "global_step": 88665, "epoch": 2111} {"train_loss": -6.225703716278076, "global_step": 88666, "epoch": 2111} {"train_loss": -6.13045072555542, "global_step": 88667, "epoch": 2111} {"train_loss": -6.192974090576172, "global_step": 88668, "epoch": 2111} {"train_loss": -6.173201560974121, "global_step": 88669, "epoch": 2111} {"train_loss": -6.299267768859863, "global_step": 88670, "epoch": 2111} {"train_loss": -6.24950647354126, "global_step": 88671, "epoch": 2111} {"train_loss": -6.362570762634277, "global_step": 88672, "epoch": 2111} {"train_loss": -6.365665912628174, "global_step": 88673, "epoch": 2111} {"train_loss": -6.230180263519287, "global_step": 88674, "epoch": 2111} {"train_loss": -6.2671122550964355, "global_step": 88675, "epoch": 2111} {"train_loss": -6.185482501983643, "global_step": 88676, "epoch": 2111} {"train_loss": -6.275250434875488, "global_step": 88677, "epoch": 2111} {"train_loss": -6.299717426300049, "global_step": 88678, "epoch": 2111} {"train_loss": -6.231396198272705, "global_step": 88679, "epoch": 2111} {"train_loss": -6.176474571228027, "global_step": 88680, "epoch": 2111} {"train_loss": -6.202846527099609, "global_step": 88681, "epoch": 2111} {"train_loss": -6.164862155914307, "global_step": 88682, "epoch": 2111} {"train_loss": -6.086069107055664, "global_step": 88683, "epoch": 2111} {"train_loss": -6.328646183013916, "global_step": 88684, "epoch": 2111} {"train_loss": -6.093848705291748, "global_step": 88685, "epoch": 2111} {"train_loss": -6.138063430786133, "global_step": 88686, "epoch": 2111} {"train_loss": -6.180466175079346, "global_step": 88687, "epoch": 2111} {"train_loss": -6.113351345062256, "global_step": 88688, "epoch": 2111} {"train_loss": -6.196475028991699, "global_step": 88689, "epoch": 2111} {"train_loss": -6.184447288513184, "global_step": 88690, "epoch": 2111} {"train_loss": -6.126140594482422, "global_step": 88691, "epoch": 2111} {"train_loss": -6.288226127624512, "global_step": 88692, "epoch": 2111} {"train_loss": -6.167125225067139, "global_step": 88693, "epoch": 2111} {"train_loss": -6.187898635864258, "global_step": 88694, "epoch": 2111} {"train_loss": -6.093958377838135, "global_step": 88695, "epoch": 2111} {"train_loss": -6.1132636070251465, "global_step": 88696, "epoch": 2111} {"train_loss": -6.171767234802246, "global_step": 88697, "epoch": 2111} {"train_loss": -6.052350044250488, "global_step": 88698, "epoch": 2111} {"train_loss": -6.228425979614258, "global_step": 88699, "epoch": 2111} {"train_loss": -6.065252304077148, "global_step": 88700, "epoch": 2111} {"train_loss": -6.2398576736450195, "global_step": 88701, "epoch": 2111} {"train_loss": -6.131743907928467, "global_step": 88702, "epoch": 2111} {"train_loss": -6.197796026865642, "global_step": 88703, "epoch": 2111, "val_loss": 68070.96875} {"train_loss": -6.060044288635254, "global_step": 88704, "epoch": 2112} {"train_loss": -6.020057201385498, "global_step": 88705, "epoch": 2112} {"train_loss": -6.162870407104492, "global_step": 88706, "epoch": 2112} {"train_loss": -6.086528778076172, "global_step": 88707, "epoch": 2112} {"train_loss": -6.209502220153809, "global_step": 88708, "epoch": 2112} {"train_loss": -6.034968852996826, "global_step": 88709, "epoch": 2112} {"train_loss": -6.142726898193359, "global_step": 88710, "epoch": 2112} {"train_loss": -5.970038414001465, "global_step": 88711, "epoch": 2112} {"train_loss": -6.205117702484131, "global_step": 88712, "epoch": 2112} {"train_loss": -6.023777008056641, "global_step": 88713, "epoch": 2112} {"train_loss": -6.083830833435059, "global_step": 88714, "epoch": 2112} {"train_loss": -6.099637031555176, "global_step": 88715, "epoch": 2112} {"train_loss": -6.241076946258545, "global_step": 88716, "epoch": 2112} {"train_loss": -6.127884864807129, "global_step": 88717, "epoch": 2112} {"train_loss": -6.22927188873291, "global_step": 88718, "epoch": 2112} {"train_loss": -6.117435455322266, "global_step": 88719, "epoch": 2112} {"train_loss": -6.173238754272461, "global_step": 88720, "epoch": 2112} {"train_loss": -6.22713041305542, "global_step": 88721, "epoch": 2112} {"train_loss": -6.111444473266602, "global_step": 88722, "epoch": 2112} {"train_loss": -6.201615333557129, "global_step": 88723, "epoch": 2112} {"train_loss": -6.048585891723633, "global_step": 88724, "epoch": 2112} {"train_loss": -6.280750751495361, "global_step": 88725, "epoch": 2112} {"train_loss": -6.263554096221924, "global_step": 88726, "epoch": 2112} {"train_loss": -6.165590763092041, "global_step": 88727, "epoch": 2112} {"train_loss": -6.236351490020752, "global_step": 88728, "epoch": 2112} {"train_loss": -6.144637107849121, "global_step": 88729, "epoch": 2112} {"train_loss": -6.178108215332031, "global_step": 88730, "epoch": 2112} {"train_loss": -6.192331790924072, "global_step": 88731, "epoch": 2112} {"train_loss": -6.284913539886475, "global_step": 88732, "epoch": 2112} {"train_loss": -6.254148006439209, "global_step": 88733, "epoch": 2112} {"train_loss": -6.278746128082275, "global_step": 88734, "epoch": 2112} {"train_loss": -6.149430274963379, "global_step": 88735, "epoch": 2112} {"train_loss": -6.253814220428467, "global_step": 88736, "epoch": 2112} {"train_loss": -6.261629104614258, "global_step": 88737, "epoch": 2112} {"train_loss": -6.294661521911621, "global_step": 88738, "epoch": 2112} {"train_loss": -6.2203826904296875, "global_step": 88739, "epoch": 2112} {"train_loss": -6.278883934020996, "global_step": 88740, "epoch": 2112} {"train_loss": -6.310923099517822, "global_step": 88741, "epoch": 2112} {"train_loss": -6.252687454223633, "global_step": 88742, "epoch": 2112} {"train_loss": -6.2664971351623535, "global_step": 88743, "epoch": 2112} {"train_loss": -6.246808052062988, "global_step": 88744, "epoch": 2112} {"train_loss": -6.181355885096958, "global_step": 88745, "epoch": 2112, "val_loss": 67718.4609375} {"train_loss": -6.213335037231445, "global_step": 88746, "epoch": 2113} {"train_loss": -6.220184803009033, "global_step": 88747, "epoch": 2113} {"train_loss": -6.1670026779174805, "global_step": 88748, "epoch": 2113} {"train_loss": -6.152409076690674, "global_step": 88749, "epoch": 2113} {"train_loss": -6.207700729370117, "global_step": 88750, "epoch": 2113} {"train_loss": -6.2837324142456055, "global_step": 88751, "epoch": 2113} {"train_loss": -6.0581769943237305, "global_step": 88752, "epoch": 2113} {"train_loss": -6.190288543701172, "global_step": 88753, "epoch": 2113} {"train_loss": -6.36336612701416, "global_step": 88754, "epoch": 2113} {"train_loss": -6.160924911499023, "global_step": 88755, "epoch": 2113} {"train_loss": -6.269126892089844, "global_step": 88756, "epoch": 2113} {"train_loss": -6.263904094696045, "global_step": 88757, "epoch": 2113} {"train_loss": -6.206038475036621, "global_step": 88758, "epoch": 2113} {"train_loss": -6.209980010986328, "global_step": 88759, "epoch": 2113} {"train_loss": -6.2765607833862305, "global_step": 88760, "epoch": 2113} {"train_loss": -6.190120697021484, "global_step": 88761, "epoch": 2113} {"train_loss": -6.193301200866699, "global_step": 88762, "epoch": 2113} {"train_loss": -6.149321556091309, "global_step": 88763, "epoch": 2113} {"train_loss": -6.228283882141113, "global_step": 88764, "epoch": 2113} {"train_loss": -6.256502151489258, "global_step": 88765, "epoch": 2113} {"train_loss": -6.216681957244873, "global_step": 88766, "epoch": 2113} {"train_loss": -6.280609130859375, "global_step": 88767, "epoch": 2113} {"train_loss": -6.194246292114258, "global_step": 88768, "epoch": 2113} {"train_loss": -6.287654399871826, "global_step": 88769, "epoch": 2113} {"train_loss": -6.234095573425293, "global_step": 88770, "epoch": 2113} {"train_loss": -6.228212356567383, "global_step": 88771, "epoch": 2113} {"train_loss": -6.2418212890625, "global_step": 88772, "epoch": 2113} {"train_loss": -6.223946571350098, "global_step": 88773, "epoch": 2113} {"train_loss": -6.188041687011719, "global_step": 88774, "epoch": 2113} {"train_loss": -6.261016845703125, "global_step": 88775, "epoch": 2113} {"train_loss": -6.1589765548706055, "global_step": 88776, "epoch": 2113} {"train_loss": -6.188899993896484, "global_step": 88777, "epoch": 2113} {"train_loss": -6.115767478942871, "global_step": 88778, "epoch": 2113} {"train_loss": -6.144262313842773, "global_step": 88779, "epoch": 2113} {"train_loss": -6.065725803375244, "global_step": 88780, "epoch": 2113} {"train_loss": -6.1903581619262695, "global_step": 88781, "epoch": 2113} {"train_loss": -6.181303977966309, "global_step": 88782, "epoch": 2113} {"train_loss": -6.159770965576172, "global_step": 88783, "epoch": 2113} {"train_loss": -6.2016730308532715, "global_step": 88784, "epoch": 2113} {"train_loss": -6.155123233795166, "global_step": 88785, "epoch": 2113} {"train_loss": -6.1672444343566895, "global_step": 88786, "epoch": 2113} {"train_loss": -6.205550568444388, "global_step": 88787, "epoch": 2113, "val_loss": 67825.7109375} {"train_loss": -6.28386926651001, "global_step": 88788, "epoch": 2114} {"train_loss": -6.300500392913818, "global_step": 88789, "epoch": 2114} {"train_loss": -6.279172420501709, "global_step": 88790, "epoch": 2114} {"train_loss": -6.196422576904297, "global_step": 88791, "epoch": 2114} {"train_loss": -6.238513946533203, "global_step": 88792, "epoch": 2114} {"train_loss": -6.3281402587890625, "global_step": 88793, "epoch": 2114} {"train_loss": -6.269490718841553, "global_step": 88794, "epoch": 2114} {"train_loss": -6.302280902862549, "global_step": 88795, "epoch": 2114} {"train_loss": -6.238645553588867, "global_step": 88796, "epoch": 2114} {"train_loss": -6.2989373207092285, "global_step": 88797, "epoch": 2114} {"train_loss": -6.293663501739502, "global_step": 88798, "epoch": 2114} {"train_loss": -6.19075345993042, "global_step": 88799, "epoch": 2114} {"train_loss": -6.395135879516602, "global_step": 88800, "epoch": 2114} {"train_loss": -6.404955863952637, "global_step": 88801, "epoch": 2114} {"train_loss": -6.273937702178955, "global_step": 88802, "epoch": 2114} {"train_loss": -6.292758464813232, "global_step": 88803, "epoch": 2114} {"train_loss": -6.269838809967041, "global_step": 88804, "epoch": 2114} {"train_loss": -6.3119707107543945, "global_step": 88805, "epoch": 2114} {"train_loss": -6.156937122344971, "global_step": 88806, "epoch": 2114} {"train_loss": -6.267453670501709, "global_step": 88807, "epoch": 2114} {"train_loss": -6.223548412322998, "global_step": 88808, "epoch": 2114} {"train_loss": -6.24091911315918, "global_step": 88809, "epoch": 2114} {"train_loss": -6.245236396789551, "global_step": 88810, "epoch": 2114} {"train_loss": -6.211440086364746, "global_step": 88811, "epoch": 2114} {"train_loss": -6.154139518737793, "global_step": 88812, "epoch": 2114} {"train_loss": -6.190062999725342, "global_step": 88813, "epoch": 2114} {"train_loss": -6.386213302612305, "global_step": 88814, "epoch": 2114} {"train_loss": -6.112860679626465, "global_step": 88815, "epoch": 2114} {"train_loss": -6.2773637771606445, "global_step": 88816, "epoch": 2114} {"train_loss": -6.299650192260742, "global_step": 88817, "epoch": 2114} {"train_loss": -6.219926357269287, "global_step": 88818, "epoch": 2114} {"train_loss": -6.318510055541992, "global_step": 88819, "epoch": 2114} {"train_loss": -6.192390441894531, "global_step": 88820, "epoch": 2114} {"train_loss": -6.1549787521362305, "global_step": 88821, "epoch": 2114} {"train_loss": -6.133405685424805, "global_step": 88822, "epoch": 2114} {"train_loss": -6.045110702514648, "global_step": 88823, "epoch": 2114} {"train_loss": -6.2634172439575195, "global_step": 88824, "epoch": 2114} {"train_loss": -6.282516956329346, "global_step": 88825, "epoch": 2114} {"train_loss": -6.0196123123168945, "global_step": 88826, "epoch": 2114} {"train_loss": -6.170493125915527, "global_step": 88827, "epoch": 2114} {"train_loss": -6.119717597961426, "global_step": 88828, "epoch": 2114} {"train_loss": -6.23716800553458, "global_step": 88829, "epoch": 2114, "val_loss": 67956.96875} {"train_loss": -6.130885124206543, "global_step": 88830, "epoch": 2115} {"train_loss": -6.17681884765625, "global_step": 88831, "epoch": 2115} {"train_loss": -6.206212997436523, "global_step": 88832, "epoch": 2115} {"train_loss": -6.24450159072876, "global_step": 88833, "epoch": 2115} {"train_loss": -6.117639541625977, "global_step": 88834, "epoch": 2115} {"train_loss": -6.088854789733887, "global_step": 88835, "epoch": 2115} {"train_loss": -6.1858367919921875, "global_step": 88836, "epoch": 2115} {"train_loss": -6.172949314117432, "global_step": 88837, "epoch": 2115} {"train_loss": -6.23918342590332, "global_step": 88838, "epoch": 2115} {"train_loss": -6.181949615478516, "global_step": 88839, "epoch": 2115} {"train_loss": -6.138270378112793, "global_step": 88840, "epoch": 2115} {"train_loss": -6.250761985778809, "global_step": 88841, "epoch": 2115} {"train_loss": -6.089949607849121, "global_step": 88842, "epoch": 2115} {"train_loss": -6.292018890380859, "global_step": 88843, "epoch": 2115} {"train_loss": -6.256258010864258, "global_step": 88844, "epoch": 2115} {"train_loss": -6.105674743652344, "global_step": 88845, "epoch": 2115} {"train_loss": -6.177459239959717, "global_step": 88846, "epoch": 2115} {"train_loss": -6.2174530029296875, "global_step": 88847, "epoch": 2115} {"train_loss": -6.263790130615234, "global_step": 88848, "epoch": 2115} {"train_loss": -6.288232326507568, "global_step": 88849, "epoch": 2115} {"train_loss": -6.105199337005615, "global_step": 88850, "epoch": 2115} {"train_loss": -6.347231388092041, "global_step": 88851, "epoch": 2115} {"train_loss": -6.288776874542236, "global_step": 88852, "epoch": 2115} {"train_loss": -6.280966758728027, "global_step": 88853, "epoch": 2115} {"train_loss": -6.3681488037109375, "global_step": 88854, "epoch": 2115} {"train_loss": -6.2248945236206055, "global_step": 88855, "epoch": 2115} {"train_loss": -6.121591567993164, "global_step": 88856, "epoch": 2115} {"train_loss": -6.333495140075684, "global_step": 88857, "epoch": 2115} {"train_loss": -6.162936210632324, "global_step": 88858, "epoch": 2115} {"train_loss": -6.222243309020996, "global_step": 88859, "epoch": 2115} {"train_loss": -6.306743144989014, "global_step": 88860, "epoch": 2115} {"train_loss": -6.208395004272461, "global_step": 88861, "epoch": 2115} {"train_loss": -6.121744155883789, "global_step": 88862, "epoch": 2115} {"train_loss": -6.171684265136719, "global_step": 88863, "epoch": 2115} {"train_loss": -6.28117036819458, "global_step": 88864, "epoch": 2115} {"train_loss": -6.163424015045166, "global_step": 88865, "epoch": 2115} {"train_loss": -6.28990364074707, "global_step": 88866, "epoch": 2115} {"train_loss": -6.265959739685059, "global_step": 88867, "epoch": 2115} {"train_loss": -6.248249053955078, "global_step": 88868, "epoch": 2115} {"train_loss": -6.253507614135742, "global_step": 88869, "epoch": 2115} {"train_loss": -6.370992660522461, "global_step": 88870, "epoch": 2115} {"train_loss": -6.218003522782099, "global_step": 88871, "epoch": 2115, "val_loss": 67870.4609375} {"train_loss": -6.269627571105957, "global_step": 88872, "epoch": 2116} {"train_loss": -6.2729597091674805, "global_step": 88873, "epoch": 2116} {"train_loss": -6.125479698181152, "global_step": 88874, "epoch": 2116} {"train_loss": -6.269030570983887, "global_step": 88875, "epoch": 2116} {"train_loss": -6.17797327041626, "global_step": 88876, "epoch": 2116} {"train_loss": -6.277498245239258, "global_step": 88877, "epoch": 2116} {"train_loss": -6.2117414474487305, "global_step": 88878, "epoch": 2116} {"train_loss": -6.230720520019531, "global_step": 88879, "epoch": 2116} {"train_loss": -6.26165771484375, "global_step": 88880, "epoch": 2116} {"train_loss": -6.322062969207764, "global_step": 88881, "epoch": 2116} {"train_loss": -6.211313247680664, "global_step": 88882, "epoch": 2116} {"train_loss": -6.294052600860596, "global_step": 88883, "epoch": 2116} {"train_loss": -6.225894451141357, "global_step": 88884, "epoch": 2116} {"train_loss": -6.283442497253418, "global_step": 88885, "epoch": 2116} {"train_loss": -6.285566329956055, "global_step": 88886, "epoch": 2116} {"train_loss": -6.235141754150391, "global_step": 88887, "epoch": 2116} {"train_loss": -6.210294723510742, "global_step": 88888, "epoch": 2116} {"train_loss": -6.1410675048828125, "global_step": 88889, "epoch": 2116} {"train_loss": -6.184536933898926, "global_step": 88890, "epoch": 2116} {"train_loss": -6.250307083129883, "global_step": 88891, "epoch": 2116} {"train_loss": -6.296781539916992, "global_step": 88892, "epoch": 2116} {"train_loss": -6.067296028137207, "global_step": 88893, "epoch": 2116} {"train_loss": -6.182765960693359, "global_step": 88894, "epoch": 2116} {"train_loss": -6.052761554718018, "global_step": 88895, "epoch": 2116} {"train_loss": -6.118603706359863, "global_step": 88896, "epoch": 2116} {"train_loss": -6.144582271575928, "global_step": 88897, "epoch": 2116} {"train_loss": -6.20943546295166, "global_step": 88898, "epoch": 2116} {"train_loss": -6.217298984527588, "global_step": 88899, "epoch": 2116} {"train_loss": -6.179594039916992, "global_step": 88900, "epoch": 2116} {"train_loss": -6.085755348205566, "global_step": 88901, "epoch": 2116} {"train_loss": -6.18851375579834, "global_step": 88902, "epoch": 2116} {"train_loss": -6.19040584564209, "global_step": 88903, "epoch": 2116} {"train_loss": -6.075096130371094, "global_step": 88904, "epoch": 2116} {"train_loss": -6.248441219329834, "global_step": 88905, "epoch": 2116} {"train_loss": -6.2302117347717285, "global_step": 88906, "epoch": 2116} {"train_loss": -6.266700744628906, "global_step": 88907, "epoch": 2116} {"train_loss": -6.217476844787598, "global_step": 88908, "epoch": 2116} {"train_loss": -6.1998491287231445, "global_step": 88909, "epoch": 2116} {"train_loss": -6.277795314788818, "global_step": 88910, "epoch": 2116} {"train_loss": -6.167605876922607, "global_step": 88911, "epoch": 2116} {"train_loss": -6.139021396636963, "global_step": 88912, "epoch": 2116} {"train_loss": -6.208103679475331, "global_step": 88913, "epoch": 2116, "val_loss": 67823.8515625} {"train_loss": -6.284817218780518, "global_step": 88914, "epoch": 2117} {"train_loss": -6.171824932098389, "global_step": 88915, "epoch": 2117} {"train_loss": -6.266122817993164, "global_step": 88916, "epoch": 2117} {"train_loss": -6.152570724487305, "global_step": 88917, "epoch": 2117} {"train_loss": -6.263647079467773, "global_step": 88918, "epoch": 2117} {"train_loss": -6.38131046295166, "global_step": 88919, "epoch": 2117} {"train_loss": -6.1910247802734375, "global_step": 88920, "epoch": 2117} {"train_loss": -6.244034767150879, "global_step": 88921, "epoch": 2117} {"train_loss": -6.143932342529297, "global_step": 88922, "epoch": 2117} {"train_loss": -6.18350887298584, "global_step": 88923, "epoch": 2117} {"train_loss": -6.271676540374756, "global_step": 88924, "epoch": 2117} {"train_loss": -6.234663009643555, "global_step": 88925, "epoch": 2117} {"train_loss": -6.164778232574463, "global_step": 88926, "epoch": 2117} {"train_loss": -6.0504350662231445, "global_step": 88927, "epoch": 2117} {"train_loss": -6.193835258483887, "global_step": 88928, "epoch": 2117} {"train_loss": -6.178995132446289, "global_step": 88929, "epoch": 2117} {"train_loss": -6.134383678436279, "global_step": 88930, "epoch": 2117} {"train_loss": -6.1592912673950195, "global_step": 88931, "epoch": 2117} {"train_loss": -6.098837852478027, "global_step": 88932, "epoch": 2117} {"train_loss": -6.166921615600586, "global_step": 88933, "epoch": 2117} {"train_loss": -6.171435356140137, "global_step": 88934, "epoch": 2117} {"train_loss": -6.130030632019043, "global_step": 88935, "epoch": 2117} {"train_loss": -6.11863899230957, "global_step": 88936, "epoch": 2117} {"train_loss": -6.123665809631348, "global_step": 88937, "epoch": 2117} {"train_loss": -6.145783424377441, "global_step": 88938, "epoch": 2117} {"train_loss": -6.168560028076172, "global_step": 88939, "epoch": 2117} {"train_loss": -6.156720161437988, "global_step": 88940, "epoch": 2117} {"train_loss": -6.163913249969482, "global_step": 88941, "epoch": 2117} {"train_loss": -6.151340961456299, "global_step": 88942, "epoch": 2117} {"train_loss": -6.09033203125, "global_step": 88943, "epoch": 2117} {"train_loss": -6.219210624694824, "global_step": 88944, "epoch": 2117} {"train_loss": -6.189906120300293, "global_step": 88945, "epoch": 2117} {"train_loss": -6.165778160095215, "global_step": 88946, "epoch": 2117} {"train_loss": -6.2732415199279785, "global_step": 88947, "epoch": 2117} {"train_loss": -6.144476890563965, "global_step": 88948, "epoch": 2117} {"train_loss": -6.153990745544434, "global_step": 88949, "epoch": 2117} {"train_loss": -6.236135482788086, "global_step": 88950, "epoch": 2117} {"train_loss": -6.056439399719238, "global_step": 88951, "epoch": 2117} {"train_loss": -6.2007737159729, "global_step": 88952, "epoch": 2117} {"train_loss": -6.182031154632568, "global_step": 88953, "epoch": 2117} {"train_loss": -6.1025614738464355, "global_step": 88954, "epoch": 2117} {"train_loss": -6.176749978746686, "global_step": 88955, "epoch": 2117, "val_loss": 68047.90625} {"train_loss": -6.218637943267822, "global_step": 88956, "epoch": 2118} {"train_loss": -6.2283034324646, "global_step": 88957, "epoch": 2118} {"train_loss": -6.1928300857543945, "global_step": 88958, "epoch": 2118} {"train_loss": -6.143711090087891, "global_step": 88959, "epoch": 2118} {"train_loss": -6.146652698516846, "global_step": 88960, "epoch": 2118} {"train_loss": -6.176057815551758, "global_step": 88961, "epoch": 2118} {"train_loss": -6.29865026473999, "global_step": 88962, "epoch": 2118} {"train_loss": -6.23985481262207, "global_step": 88963, "epoch": 2118} {"train_loss": -6.128786087036133, "global_step": 88964, "epoch": 2118} {"train_loss": -6.225052833557129, "global_step": 88965, "epoch": 2118} {"train_loss": -6.275947093963623, "global_step": 88966, "epoch": 2118} {"train_loss": -6.2608747482299805, "global_step": 88967, "epoch": 2118} {"train_loss": -6.276135444641113, "global_step": 88968, "epoch": 2118} {"train_loss": -6.228935718536377, "global_step": 88969, "epoch": 2118} {"train_loss": -6.280159950256348, "global_step": 88970, "epoch": 2118} {"train_loss": -6.260826110839844, "global_step": 88971, "epoch": 2118} {"train_loss": -6.280323505401611, "global_step": 88972, "epoch": 2118} {"train_loss": -6.396158218383789, "global_step": 88973, "epoch": 2118} {"train_loss": -6.19483757019043, "global_step": 88974, "epoch": 2118} {"train_loss": -6.215074062347412, "global_step": 88975, "epoch": 2118} {"train_loss": -6.194366455078125, "global_step": 88976, "epoch": 2118} {"train_loss": -6.203189373016357, "global_step": 88977, "epoch": 2118} {"train_loss": -6.364109039306641, "global_step": 88978, "epoch": 2118} {"train_loss": -6.390526294708252, "global_step": 88979, "epoch": 2118} {"train_loss": -6.206992149353027, "global_step": 88980, "epoch": 2118} {"train_loss": -6.172768592834473, "global_step": 88981, "epoch": 2118} {"train_loss": -6.217267990112305, "global_step": 88982, "epoch": 2118} {"train_loss": -6.194476127624512, "global_step": 88983, "epoch": 2118} {"train_loss": -6.221491813659668, "global_step": 88984, "epoch": 2118} {"train_loss": -6.0850372314453125, "global_step": 88985, "epoch": 2118} {"train_loss": -6.200910568237305, "global_step": 88986, "epoch": 2118} {"train_loss": -6.24306583404541, "global_step": 88987, "epoch": 2118} {"train_loss": -6.277118682861328, "global_step": 88988, "epoch": 2118} {"train_loss": -6.2277936935424805, "global_step": 88989, "epoch": 2118} {"train_loss": -6.138608932495117, "global_step": 88990, "epoch": 2118} {"train_loss": -6.247321128845215, "global_step": 88991, "epoch": 2118} {"train_loss": -6.253790855407715, "global_step": 88992, "epoch": 2118} {"train_loss": -6.239745140075684, "global_step": 88993, "epoch": 2118} {"train_loss": -6.354640483856201, "global_step": 88994, "epoch": 2118} {"train_loss": -6.299107074737549, "global_step": 88995, "epoch": 2118} {"train_loss": -6.320857524871826, "global_step": 88996, "epoch": 2118} {"train_loss": -6.241465557189215, "global_step": 88997, "epoch": 2118, "val_loss": 67923.96875} {"train_loss": -6.179096698760986, "global_step": 88998, "epoch": 2119} {"train_loss": -6.203587532043457, "global_step": 88999, "epoch": 2119} {"train_loss": -6.326292991638184, "global_step": 89000, "epoch": 2119} {"train_loss": -6.1831135749816895, "global_step": 89001, "epoch": 2119} {"train_loss": -6.253873825073242, "global_step": 89002, "epoch": 2119} {"train_loss": -6.297300815582275, "global_step": 89003, "epoch": 2119} {"train_loss": -6.264467239379883, "global_step": 89004, "epoch": 2119} {"train_loss": -6.3413190841674805, "global_step": 89005, "epoch": 2119} {"train_loss": -6.260666847229004, "global_step": 89006, "epoch": 2119} {"train_loss": -6.263786792755127, "global_step": 89007, "epoch": 2119} {"train_loss": -6.130594253540039, "global_step": 89008, "epoch": 2119} {"train_loss": -6.248721122741699, "global_step": 89009, "epoch": 2119} {"train_loss": -6.302603721618652, "global_step": 89010, "epoch": 2119} {"train_loss": -6.265214920043945, "global_step": 89011, "epoch": 2119} {"train_loss": -6.251153469085693, "global_step": 89012, "epoch": 2119} {"train_loss": -6.190670967102051, "global_step": 89013, "epoch": 2119} {"train_loss": -6.204814910888672, "global_step": 89014, "epoch": 2119} {"train_loss": -6.25246000289917, "global_step": 89015, "epoch": 2119} {"train_loss": -6.121837615966797, "global_step": 89016, "epoch": 2119} {"train_loss": -6.166821479797363, "global_step": 89017, "epoch": 2119} {"train_loss": -6.302944183349609, "global_step": 89018, "epoch": 2119} {"train_loss": -6.255104064941406, "global_step": 89019, "epoch": 2119} {"train_loss": -6.27447509765625, "global_step": 89020, "epoch": 2119} {"train_loss": -6.166204929351807, "global_step": 89021, "epoch": 2119} {"train_loss": -6.286491394042969, "global_step": 89022, "epoch": 2119} {"train_loss": -6.198148250579834, "global_step": 89023, "epoch": 2119} {"train_loss": -6.117688179016113, "global_step": 89024, "epoch": 2119} {"train_loss": -6.1896209716796875, "global_step": 89025, "epoch": 2119} {"train_loss": -6.191099643707275, "global_step": 89026, "epoch": 2119} {"train_loss": -6.226628303527832, "global_step": 89027, "epoch": 2119} {"train_loss": -6.1449737548828125, "global_step": 89028, "epoch": 2119} {"train_loss": -6.289512634277344, "global_step": 89029, "epoch": 2119} {"train_loss": -6.254131317138672, "global_step": 89030, "epoch": 2119} {"train_loss": -6.063370227813721, "global_step": 89031, "epoch": 2119} {"train_loss": -6.235016822814941, "global_step": 89032, "epoch": 2119} {"train_loss": -6.306439399719238, "global_step": 89033, "epoch": 2119} {"train_loss": -6.174340724945068, "global_step": 89034, "epoch": 2119} {"train_loss": -6.234097003936768, "global_step": 89035, "epoch": 2119} {"train_loss": -6.229079246520996, "global_step": 89036, "epoch": 2119} {"train_loss": -6.050056457519531, "global_step": 89037, "epoch": 2119} {"train_loss": -6.161691665649414, "global_step": 89038, "epoch": 2119} {"train_loss": -6.220250163759504, "global_step": 89039, "epoch": 2119, "val_loss": 68145.09375} {"train_loss": -6.155923843383789, "global_step": 89040, "epoch": 2120} {"train_loss": -6.201890468597412, "global_step": 89041, "epoch": 2120} {"train_loss": -6.275629043579102, "global_step": 89042, "epoch": 2120} {"train_loss": -6.178238391876221, "global_step": 89043, "epoch": 2120} {"train_loss": -6.220343112945557, "global_step": 89044, "epoch": 2120} {"train_loss": -6.197143077850342, "global_step": 89045, "epoch": 2120} {"train_loss": -6.120110511779785, "global_step": 89046, "epoch": 2120} {"train_loss": -6.219330787658691, "global_step": 89047, "epoch": 2120} {"train_loss": -6.12802791595459, "global_step": 89048, "epoch": 2120} {"train_loss": -6.277797698974609, "global_step": 89049, "epoch": 2120} {"train_loss": -6.163390159606934, "global_step": 89050, "epoch": 2120} {"train_loss": -6.0858049392700195, "global_step": 89051, "epoch": 2120} {"train_loss": -6.2443647384643555, "global_step": 89052, "epoch": 2120} {"train_loss": -6.189326286315918, "global_step": 89053, "epoch": 2120} {"train_loss": -6.224297046661377, "global_step": 89054, "epoch": 2120} {"train_loss": -6.197626113891602, "global_step": 89055, "epoch": 2120} {"train_loss": -6.31016731262207, "global_step": 89056, "epoch": 2120} {"train_loss": -6.242590427398682, "global_step": 89057, "epoch": 2120} {"train_loss": -6.224825859069824, "global_step": 89058, "epoch": 2120} {"train_loss": -6.161869049072266, "global_step": 89059, "epoch": 2120} {"train_loss": -6.216952323913574, "global_step": 89060, "epoch": 2120} {"train_loss": -6.253692626953125, "global_step": 89061, "epoch": 2120} {"train_loss": -6.188887119293213, "global_step": 89062, "epoch": 2120} {"train_loss": -6.19809103012085, "global_step": 89063, "epoch": 2120} {"train_loss": -6.191082954406738, "global_step": 89064, "epoch": 2120} {"train_loss": -6.220732688903809, "global_step": 89065, "epoch": 2120} {"train_loss": -6.174187660217285, "global_step": 89066, "epoch": 2120} {"train_loss": -6.290903568267822, "global_step": 89067, "epoch": 2120} {"train_loss": -6.19865083694458, "global_step": 89068, "epoch": 2120} {"train_loss": -6.299776077270508, "global_step": 89069, "epoch": 2120} {"train_loss": -6.10823917388916, "global_step": 89070, "epoch": 2120} {"train_loss": -6.2064714431762695, "global_step": 89071, "epoch": 2120} {"train_loss": -6.152274131774902, "global_step": 89072, "epoch": 2120} {"train_loss": -6.185113906860352, "global_step": 89073, "epoch": 2120} {"train_loss": -6.228091716766357, "global_step": 89074, "epoch": 2120} {"train_loss": -6.126958847045898, "global_step": 89075, "epoch": 2120} {"train_loss": -6.284990310668945, "global_step": 89076, "epoch": 2120} {"train_loss": -6.126605033874512, "global_step": 89077, "epoch": 2120} {"train_loss": -6.2391462326049805, "global_step": 89078, "epoch": 2120} {"train_loss": -6.22953987121582, "global_step": 89079, "epoch": 2120} {"train_loss": -6.10641622543335, "global_step": 89080, "epoch": 2120} {"train_loss": -6.198853685742333, "global_step": 89081, "epoch": 2120, "val_loss": 68019.8125} {"train_loss": -6.121310234069824, "global_step": 89082, "epoch": 2121} {"train_loss": -6.176723480224609, "global_step": 89083, "epoch": 2121} {"train_loss": -6.078204154968262, "global_step": 89084, "epoch": 2121} {"train_loss": -6.262701988220215, "global_step": 89085, "epoch": 2121} {"train_loss": -6.140052795410156, "global_step": 89086, "epoch": 2121} {"train_loss": -6.2609124183654785, "global_step": 89087, "epoch": 2121} {"train_loss": -6.282792568206787, "global_step": 89088, "epoch": 2121} {"train_loss": -6.198184967041016, "global_step": 89089, "epoch": 2121} {"train_loss": -6.19012451171875, "global_step": 89090, "epoch": 2121} {"train_loss": -6.309575080871582, "global_step": 89091, "epoch": 2121} {"train_loss": -6.078805923461914, "global_step": 89092, "epoch": 2121} {"train_loss": -6.272587776184082, "global_step": 89093, "epoch": 2121} {"train_loss": -6.213665008544922, "global_step": 89094, "epoch": 2121} {"train_loss": -6.370796203613281, "global_step": 89095, "epoch": 2121} {"train_loss": -6.3063812255859375, "global_step": 89096, "epoch": 2121} {"train_loss": -6.163387298583984, "global_step": 89097, "epoch": 2121} {"train_loss": -6.1721086502075195, "global_step": 89098, "epoch": 2121} {"train_loss": -6.1527419090271, "global_step": 89099, "epoch": 2121} {"train_loss": -6.241548538208008, "global_step": 89100, "epoch": 2121} {"train_loss": -6.177235126495361, "global_step": 89101, "epoch": 2121} {"train_loss": -6.214262962341309, "global_step": 89102, "epoch": 2121} {"train_loss": -6.2244768142700195, "global_step": 89103, "epoch": 2121} {"train_loss": -6.263119220733643, "global_step": 89104, "epoch": 2121} {"train_loss": -6.199271202087402, "global_step": 89105, "epoch": 2121} {"train_loss": -6.285856246948242, "global_step": 89106, "epoch": 2121} {"train_loss": -6.331507682800293, "global_step": 89107, "epoch": 2121} {"train_loss": -6.130796432495117, "global_step": 89108, "epoch": 2121} {"train_loss": -6.095802307128906, "global_step": 89109, "epoch": 2121} {"train_loss": -6.16103982925415, "global_step": 89110, "epoch": 2121} {"train_loss": -6.304154872894287, "global_step": 89111, "epoch": 2121} {"train_loss": -6.228941917419434, "global_step": 89112, "epoch": 2121} {"train_loss": -6.106955528259277, "global_step": 89113, "epoch": 2121} {"train_loss": -6.2104716300964355, "global_step": 89114, "epoch": 2121} {"train_loss": -6.234281539916992, "global_step": 89115, "epoch": 2121} {"train_loss": -6.300251007080078, "global_step": 89116, "epoch": 2121} {"train_loss": -6.324573516845703, "global_step": 89117, "epoch": 2121} {"train_loss": -6.271340370178223, "global_step": 89118, "epoch": 2121} {"train_loss": -6.279810905456543, "global_step": 89119, "epoch": 2121} {"train_loss": -6.334518909454346, "global_step": 89120, "epoch": 2121} {"train_loss": -6.1596999168396, "global_step": 89121, "epoch": 2121} {"train_loss": -6.2713117599487305, "global_step": 89122, "epoch": 2121} {"train_loss": -6.2186331521897085, "global_step": 89123, "epoch": 2121, "val_loss": 67778.640625} {"train_loss": -6.348719596862793, "global_step": 89124, "epoch": 2122} {"train_loss": -6.259862899780273, "global_step": 89125, "epoch": 2122} {"train_loss": -6.254283428192139, "global_step": 89126, "epoch": 2122} {"train_loss": -6.295621395111084, "global_step": 89127, "epoch": 2122} {"train_loss": -6.247103691101074, "global_step": 89128, "epoch": 2122} {"train_loss": -6.2911882400512695, "global_step": 89129, "epoch": 2122} {"train_loss": -6.263395309448242, "global_step": 89130, "epoch": 2122} {"train_loss": -6.249054908752441, "global_step": 89131, "epoch": 2122} {"train_loss": -6.243587493896484, "global_step": 89132, "epoch": 2122} {"train_loss": -6.34945011138916, "global_step": 89133, "epoch": 2122} {"train_loss": -6.235682487487793, "global_step": 89134, "epoch": 2122} {"train_loss": -6.184393882751465, "global_step": 89135, "epoch": 2122} {"train_loss": -6.294056415557861, "global_step": 89136, "epoch": 2122} {"train_loss": -6.4651408195495605, "global_step": 89137, "epoch": 2122} {"train_loss": -6.270317077636719, "global_step": 89138, "epoch": 2122} {"train_loss": -6.229966163635254, "global_step": 89139, "epoch": 2122} {"train_loss": -6.217837333679199, "global_step": 89140, "epoch": 2122} {"train_loss": -6.302249908447266, "global_step": 89141, "epoch": 2122} {"train_loss": -6.335302352905273, "global_step": 89142, "epoch": 2122} {"train_loss": -6.221891403198242, "global_step": 89143, "epoch": 2122} {"train_loss": -6.245598316192627, "global_step": 89144, "epoch": 2122} {"train_loss": -6.329442024230957, "global_step": 89145, "epoch": 2122} {"train_loss": -6.18144416809082, "global_step": 89146, "epoch": 2122} {"train_loss": -6.1917219161987305, "global_step": 89147, "epoch": 2122} {"train_loss": -6.289936542510986, "global_step": 89148, "epoch": 2122} {"train_loss": -6.222257614135742, "global_step": 89149, "epoch": 2122} {"train_loss": -6.114921569824219, "global_step": 89150, "epoch": 2122} {"train_loss": -6.069783687591553, "global_step": 89151, "epoch": 2122} {"train_loss": -6.330774784088135, "global_step": 89152, "epoch": 2122} {"train_loss": -6.231233596801758, "global_step": 89153, "epoch": 2122} {"train_loss": -6.37642765045166, "global_step": 89154, "epoch": 2122} {"train_loss": -6.410930156707764, "global_step": 89155, "epoch": 2122} {"train_loss": -6.2821149826049805, "global_step": 89156, "epoch": 2122} {"train_loss": -6.3118205070495605, "global_step": 89157, "epoch": 2122} {"train_loss": -6.194269180297852, "global_step": 89158, "epoch": 2122} {"train_loss": -6.245862007141113, "global_step": 89159, "epoch": 2122} {"train_loss": -6.29973030090332, "global_step": 89160, "epoch": 2122} {"train_loss": -6.286380767822266, "global_step": 89161, "epoch": 2122} {"train_loss": -6.229704856872559, "global_step": 89162, "epoch": 2122} {"train_loss": -6.163775444030762, "global_step": 89163, "epoch": 2122} {"train_loss": -6.195697784423828, "global_step": 89164, "epoch": 2122} {"train_loss": -6.261488948549543, "global_step": 89165, "epoch": 2122, "val_loss": 67995.0546875} {"train_loss": -6.29741907119751, "global_step": 89166, "epoch": 2123} {"train_loss": -6.285007476806641, "global_step": 89167, "epoch": 2123} {"train_loss": -6.188424110412598, "global_step": 89168, "epoch": 2123} {"train_loss": -6.122028350830078, "global_step": 89169, "epoch": 2123} {"train_loss": -6.210618019104004, "global_step": 89170, "epoch": 2123} {"train_loss": -6.236686706542969, "global_step": 89171, "epoch": 2123} {"train_loss": -6.224867343902588, "global_step": 89172, "epoch": 2123} {"train_loss": -6.260869026184082, "global_step": 89173, "epoch": 2123} {"train_loss": -6.248829364776611, "global_step": 89174, "epoch": 2123} {"train_loss": -6.273441791534424, "global_step": 89175, "epoch": 2123} {"train_loss": -6.278351783752441, "global_step": 89176, "epoch": 2123} {"train_loss": -6.225906848907471, "global_step": 89177, "epoch": 2123} {"train_loss": -6.191493988037109, "global_step": 89178, "epoch": 2123} {"train_loss": -6.25141716003418, "global_step": 89179, "epoch": 2123} {"train_loss": -6.198590278625488, "global_step": 89180, "epoch": 2123} {"train_loss": -6.225203514099121, "global_step": 89181, "epoch": 2123} {"train_loss": -6.1810102462768555, "global_step": 89182, "epoch": 2123} {"train_loss": -6.204823970794678, "global_step": 89183, "epoch": 2123} {"train_loss": -6.3271942138671875, "global_step": 89184, "epoch": 2123} {"train_loss": -6.254208564758301, "global_step": 89185, "epoch": 2123} {"train_loss": -6.234315872192383, "global_step": 89186, "epoch": 2123} {"train_loss": -6.280594825744629, "global_step": 89187, "epoch": 2123} {"train_loss": -6.2862324714660645, "global_step": 89188, "epoch": 2123} {"train_loss": -6.12704610824585, "global_step": 89189, "epoch": 2123} {"train_loss": -6.2870097160339355, "global_step": 89190, "epoch": 2123} {"train_loss": -6.2059221267700195, "global_step": 89191, "epoch": 2123} {"train_loss": -6.225605010986328, "global_step": 89192, "epoch": 2123} {"train_loss": -6.331042289733887, "global_step": 89193, "epoch": 2123} {"train_loss": -6.145962238311768, "global_step": 89194, "epoch": 2123} {"train_loss": -6.28245210647583, "global_step": 89195, "epoch": 2123} {"train_loss": -6.138336181640625, "global_step": 89196, "epoch": 2123} {"train_loss": -6.2827653884887695, "global_step": 89197, "epoch": 2123} {"train_loss": -6.290976524353027, "global_step": 89198, "epoch": 2123} {"train_loss": -6.226459503173828, "global_step": 89199, "epoch": 2123} {"train_loss": -6.227551460266113, "global_step": 89200, "epoch": 2123} {"train_loss": -6.301911354064941, "global_step": 89201, "epoch": 2123} {"train_loss": -6.321725845336914, "global_step": 89202, "epoch": 2123} {"train_loss": -6.277229309082031, "global_step": 89203, "epoch": 2123} {"train_loss": -6.2239670753479, "global_step": 89204, "epoch": 2123} {"train_loss": -6.154631614685059, "global_step": 89205, "epoch": 2123} {"train_loss": -6.279806137084961, "global_step": 89206, "epoch": 2123} {"train_loss": -6.237758579708281, "global_step": 89207, "epoch": 2123, "val_loss": 67942.5546875} {"train_loss": -6.256689548492432, "global_step": 89208, "epoch": 2124} {"train_loss": -6.189509391784668, "global_step": 89209, "epoch": 2124} {"train_loss": -6.137166976928711, "global_step": 89210, "epoch": 2124} {"train_loss": -6.2612624168396, "global_step": 89211, "epoch": 2124} {"train_loss": -6.295727729797363, "global_step": 89212, "epoch": 2124} {"train_loss": -6.171578407287598, "global_step": 89213, "epoch": 2124} {"train_loss": -6.207108974456787, "global_step": 89214, "epoch": 2124} {"train_loss": -6.323948383331299, "global_step": 89215, "epoch": 2124} {"train_loss": -6.324028015136719, "global_step": 89216, "epoch": 2124} {"train_loss": -6.301604270935059, "global_step": 89217, "epoch": 2124} {"train_loss": -6.2119245529174805, "global_step": 89218, "epoch": 2124} {"train_loss": -6.212149143218994, "global_step": 89219, "epoch": 2124} {"train_loss": -6.215153217315674, "global_step": 89220, "epoch": 2124} {"train_loss": -6.267083168029785, "global_step": 89221, "epoch": 2124} {"train_loss": -6.227004051208496, "global_step": 89222, "epoch": 2124} {"train_loss": -6.217439651489258, "global_step": 89223, "epoch": 2124} {"train_loss": -6.231320858001709, "global_step": 89224, "epoch": 2124} {"train_loss": -6.177870273590088, "global_step": 89225, "epoch": 2124} {"train_loss": -6.282109260559082, "global_step": 89226, "epoch": 2124} {"train_loss": -6.216899394989014, "global_step": 89227, "epoch": 2124} {"train_loss": -6.233426570892334, "global_step": 89228, "epoch": 2124} {"train_loss": -6.173220634460449, "global_step": 89229, "epoch": 2124} {"train_loss": -6.147159099578857, "global_step": 89230, "epoch": 2124} {"train_loss": -6.155564785003662, "global_step": 89231, "epoch": 2124} {"train_loss": -6.210066795349121, "global_step": 89232, "epoch": 2124} {"train_loss": -6.25361967086792, "global_step": 89233, "epoch": 2124} {"train_loss": -6.158596038818359, "global_step": 89234, "epoch": 2124} {"train_loss": -6.259932041168213, "global_step": 89235, "epoch": 2124} {"train_loss": -6.198091506958008, "global_step": 89236, "epoch": 2124} {"train_loss": -6.130721569061279, "global_step": 89237, "epoch": 2124} {"train_loss": -6.237684726715088, "global_step": 89238, "epoch": 2124} {"train_loss": -6.305141448974609, "global_step": 89239, "epoch": 2124} {"train_loss": -6.242521286010742, "global_step": 89240, "epoch": 2124} {"train_loss": -6.38271427154541, "global_step": 89241, "epoch": 2124} {"train_loss": -6.150684356689453, "global_step": 89242, "epoch": 2124} {"train_loss": -6.286523342132568, "global_step": 89243, "epoch": 2124} {"train_loss": -6.2354326248168945, "global_step": 89244, "epoch": 2124} {"train_loss": -6.140480041503906, "global_step": 89245, "epoch": 2124} {"train_loss": -6.136431694030762, "global_step": 89246, "epoch": 2124} {"train_loss": -6.223114490509033, "global_step": 89247, "epoch": 2124} {"train_loss": -6.1751604080200195, "global_step": 89248, "epoch": 2124} {"train_loss": -6.222860018412272, "global_step": 89249, "epoch": 2124, "val_loss": 67963.078125} {"train_loss": -6.112044334411621, "global_step": 89250, "epoch": 2125} {"train_loss": -6.221224308013916, "global_step": 89251, "epoch": 2125} {"train_loss": -6.140509605407715, "global_step": 89252, "epoch": 2125} {"train_loss": -6.1437602043151855, "global_step": 89253, "epoch": 2125} {"train_loss": -6.215690612792969, "global_step": 89254, "epoch": 2125} {"train_loss": -6.1455841064453125, "global_step": 89255, "epoch": 2125} {"train_loss": -6.292795181274414, "global_step": 89256, "epoch": 2125} {"train_loss": -6.202385902404785, "global_step": 89257, "epoch": 2125} {"train_loss": -6.207958221435547, "global_step": 89258, "epoch": 2125} {"train_loss": -6.18459415435791, "global_step": 89259, "epoch": 2125} {"train_loss": -6.295294284820557, "global_step": 89260, "epoch": 2125} {"train_loss": -6.158690452575684, "global_step": 89261, "epoch": 2125} {"train_loss": -6.142762660980225, "global_step": 89262, "epoch": 2125} {"train_loss": -6.2349066734313965, "global_step": 89263, "epoch": 2125} {"train_loss": -6.233676910400391, "global_step": 89264, "epoch": 2125} {"train_loss": -6.258196830749512, "global_step": 89265, "epoch": 2125} {"train_loss": -6.358790397644043, "global_step": 89266, "epoch": 2125} {"train_loss": -6.226103782653809, "global_step": 89267, "epoch": 2125} {"train_loss": -6.2874369621276855, "global_step": 89268, "epoch": 2125} {"train_loss": -6.19100284576416, "global_step": 89269, "epoch": 2125} {"train_loss": -6.181182861328125, "global_step": 89270, "epoch": 2125} {"train_loss": -6.270072937011719, "global_step": 89271, "epoch": 2125} {"train_loss": -6.1942830085754395, "global_step": 89272, "epoch": 2125} {"train_loss": -6.353757381439209, "global_step": 89273, "epoch": 2125} {"train_loss": -6.24093770980835, "global_step": 89274, "epoch": 2125} {"train_loss": -6.283039569854736, "global_step": 89275, "epoch": 2125} {"train_loss": -6.327514171600342, "global_step": 89276, "epoch": 2125} {"train_loss": -6.185949325561523, "global_step": 89277, "epoch": 2125} {"train_loss": -6.268598556518555, "global_step": 89278, "epoch": 2125} {"train_loss": -6.244937419891357, "global_step": 89279, "epoch": 2125} {"train_loss": -6.116926193237305, "global_step": 89280, "epoch": 2125} {"train_loss": -6.1832122802734375, "global_step": 89281, "epoch": 2125} {"train_loss": -6.162586688995361, "global_step": 89282, "epoch": 2125} {"train_loss": -6.304605484008789, "global_step": 89283, "epoch": 2125} {"train_loss": -6.231273651123047, "global_step": 89284, "epoch": 2125} {"train_loss": -6.2498602867126465, "global_step": 89285, "epoch": 2125} {"train_loss": -6.227099418640137, "global_step": 89286, "epoch": 2125} {"train_loss": -6.262552261352539, "global_step": 89287, "epoch": 2125} {"train_loss": -6.242307662963867, "global_step": 89288, "epoch": 2125} {"train_loss": -6.184545516967773, "global_step": 89289, "epoch": 2125} {"train_loss": -6.223174571990967, "global_step": 89290, "epoch": 2125} {"train_loss": -6.225045987537929, "global_step": 89291, "epoch": 2125, "val_loss": 67913.078125} {"train_loss": -6.3792405128479, "global_step": 89292, "epoch": 2126} {"train_loss": -6.269325256347656, "global_step": 89293, "epoch": 2126} {"train_loss": -6.255174160003662, "global_step": 89294, "epoch": 2126} {"train_loss": -6.171984672546387, "global_step": 89295, "epoch": 2126} {"train_loss": -6.262667655944824, "global_step": 89296, "epoch": 2126} {"train_loss": -6.2708024978637695, "global_step": 89297, "epoch": 2126} {"train_loss": -6.267522811889648, "global_step": 89298, "epoch": 2126} {"train_loss": -6.270525932312012, "global_step": 89299, "epoch": 2126} {"train_loss": -6.266811370849609, "global_step": 89300, "epoch": 2126} {"train_loss": -6.219572067260742, "global_step": 89301, "epoch": 2126} {"train_loss": -6.193271160125732, "global_step": 89302, "epoch": 2126} {"train_loss": -6.176577568054199, "global_step": 89303, "epoch": 2126} {"train_loss": -6.184497833251953, "global_step": 89304, "epoch": 2126} {"train_loss": -6.15572452545166, "global_step": 89305, "epoch": 2126} {"train_loss": -6.1789350509643555, "global_step": 89306, "epoch": 2126} {"train_loss": -6.133256435394287, "global_step": 89307, "epoch": 2126} {"train_loss": -6.287501335144043, "global_step": 89308, "epoch": 2126} {"train_loss": -6.273202896118164, "global_step": 89309, "epoch": 2126} {"train_loss": -6.281742572784424, "global_step": 89310, "epoch": 2126} {"train_loss": -6.255341529846191, "global_step": 89311, "epoch": 2126} {"train_loss": -6.230507850646973, "global_step": 89312, "epoch": 2126} {"train_loss": -6.183811187744141, "global_step": 89313, "epoch": 2126} {"train_loss": -6.136898994445801, "global_step": 89314, "epoch": 2126} {"train_loss": -6.1589555740356445, "global_step": 89315, "epoch": 2126} {"train_loss": -6.191529750823975, "global_step": 89316, "epoch": 2126} {"train_loss": -6.208738327026367, "global_step": 89317, "epoch": 2126} {"train_loss": -6.123239517211914, "global_step": 89318, "epoch": 2126} {"train_loss": -6.315482139587402, "global_step": 89319, "epoch": 2126} {"train_loss": -6.1619791984558105, "global_step": 89320, "epoch": 2126} {"train_loss": -6.351347923278809, "global_step": 89321, "epoch": 2126} {"train_loss": -6.168589115142822, "global_step": 89322, "epoch": 2126} {"train_loss": -6.246293067932129, "global_step": 89323, "epoch": 2126} {"train_loss": -6.2964959144592285, "global_step": 89324, "epoch": 2126} {"train_loss": -6.28072452545166, "global_step": 89325, "epoch": 2126} {"train_loss": -6.1613006591796875, "global_step": 89326, "epoch": 2126} {"train_loss": -6.146388053894043, "global_step": 89327, "epoch": 2126} {"train_loss": -6.177445411682129, "global_step": 89328, "epoch": 2126} {"train_loss": -6.315306663513184, "global_step": 89329, "epoch": 2126} {"train_loss": -6.192910671234131, "global_step": 89330, "epoch": 2126} {"train_loss": -6.260953903198242, "global_step": 89331, "epoch": 2126} {"train_loss": -6.237174034118652, "global_step": 89332, "epoch": 2126} {"train_loss": -6.225328365961711, "global_step": 89333, "epoch": 2126, "val_loss": 67901.2109375} {"train_loss": -6.224642276763916, "global_step": 89334, "epoch": 2127} {"train_loss": -6.227188587188721, "global_step": 89335, "epoch": 2127} {"train_loss": -6.150791168212891, "global_step": 89336, "epoch": 2127} {"train_loss": -6.157636642456055, "global_step": 89337, "epoch": 2127} {"train_loss": -6.228762626647949, "global_step": 89338, "epoch": 2127} {"train_loss": -6.225857734680176, "global_step": 89339, "epoch": 2127} {"train_loss": -6.309628486633301, "global_step": 89340, "epoch": 2127} {"train_loss": -6.157115459442139, "global_step": 89341, "epoch": 2127} {"train_loss": -6.255667686462402, "global_step": 89342, "epoch": 2127} {"train_loss": -6.317573547363281, "global_step": 89343, "epoch": 2127} {"train_loss": -6.201462745666504, "global_step": 89344, "epoch": 2127} {"train_loss": -6.178845405578613, "global_step": 89345, "epoch": 2127} {"train_loss": -6.191877365112305, "global_step": 89346, "epoch": 2127} {"train_loss": -6.243297576904297, "global_step": 89347, "epoch": 2127} {"train_loss": -6.198792457580566, "global_step": 89348, "epoch": 2127} {"train_loss": -6.1253743171691895, "global_step": 89349, "epoch": 2127} {"train_loss": -6.199986457824707, "global_step": 89350, "epoch": 2127} {"train_loss": -6.328225135803223, "global_step": 89351, "epoch": 2127} {"train_loss": -6.1917724609375, "global_step": 89352, "epoch": 2127} {"train_loss": -6.208298683166504, "global_step": 89353, "epoch": 2127} {"train_loss": -6.211268901824951, "global_step": 89354, "epoch": 2127} {"train_loss": -6.198119163513184, "global_step": 89355, "epoch": 2127} {"train_loss": -6.101919174194336, "global_step": 89356, "epoch": 2127} {"train_loss": -6.234621524810791, "global_step": 89357, "epoch": 2127} {"train_loss": -6.2053351402282715, "global_step": 89358, "epoch": 2127} {"train_loss": -6.188766956329346, "global_step": 89359, "epoch": 2127} {"train_loss": -6.265594005584717, "global_step": 89360, "epoch": 2127} {"train_loss": -6.263799667358398, "global_step": 89361, "epoch": 2127} {"train_loss": -6.093545913696289, "global_step": 89362, "epoch": 2127} {"train_loss": -6.2721099853515625, "global_step": 89363, "epoch": 2127} {"train_loss": -6.1668572425842285, "global_step": 89364, "epoch": 2127} {"train_loss": -6.0845184326171875, "global_step": 89365, "epoch": 2127} {"train_loss": -6.186707496643066, "global_step": 89366, "epoch": 2127} {"train_loss": -6.180849075317383, "global_step": 89367, "epoch": 2127} {"train_loss": -6.250226020812988, "global_step": 89368, "epoch": 2127} {"train_loss": -6.206976890563965, "global_step": 89369, "epoch": 2127} {"train_loss": -6.046796798706055, "global_step": 89370, "epoch": 2127} {"train_loss": -6.249849319458008, "global_step": 89371, "epoch": 2127} {"train_loss": -6.1559295654296875, "global_step": 89372, "epoch": 2127} {"train_loss": -6.174516677856445, "global_step": 89373, "epoch": 2127} {"train_loss": -6.191122055053711, "global_step": 89374, "epoch": 2127} {"train_loss": -6.201325098673503, "global_step": 89375, "epoch": 2127, "val_loss": 67695.8515625} {"train_loss": -6.365743637084961, "global_step": 89376, "epoch": 2128} {"train_loss": -6.10327672958374, "global_step": 89377, "epoch": 2128} {"train_loss": -6.3130388259887695, "global_step": 89378, "epoch": 2128} {"train_loss": -6.147012233734131, "global_step": 89379, "epoch": 2128} {"train_loss": -6.2824554443359375, "global_step": 89380, "epoch": 2128} {"train_loss": -6.2959771156311035, "global_step": 89381, "epoch": 2128} {"train_loss": -6.245367050170898, "global_step": 89382, "epoch": 2128} {"train_loss": -6.272741317749023, "global_step": 89383, "epoch": 2128} {"train_loss": -6.307162761688232, "global_step": 89384, "epoch": 2128} {"train_loss": -6.173821926116943, "global_step": 89385, "epoch": 2128} {"train_loss": -6.18115758895874, "global_step": 89386, "epoch": 2128} {"train_loss": -6.282863140106201, "global_step": 89387, "epoch": 2128} {"train_loss": -6.350185871124268, "global_step": 89388, "epoch": 2128} {"train_loss": -6.204593658447266, "global_step": 89389, "epoch": 2128} {"train_loss": -6.210657596588135, "global_step": 89390, "epoch": 2128} {"train_loss": -6.287135124206543, "global_step": 89391, "epoch": 2128} {"train_loss": -6.300273418426514, "global_step": 89392, "epoch": 2128} {"train_loss": -6.198726654052734, "global_step": 89393, "epoch": 2128} {"train_loss": -6.254631042480469, "global_step": 89394, "epoch": 2128} {"train_loss": -6.296176910400391, "global_step": 89395, "epoch": 2128} {"train_loss": -6.286742210388184, "global_step": 89396, "epoch": 2128} {"train_loss": -6.3147759437561035, "global_step": 89397, "epoch": 2128} {"train_loss": -6.195289611816406, "global_step": 89398, "epoch": 2128} {"train_loss": -6.324619293212891, "global_step": 89399, "epoch": 2128} {"train_loss": -6.353231906890869, "global_step": 89400, "epoch": 2128} {"train_loss": -6.275943756103516, "global_step": 89401, "epoch": 2128} {"train_loss": -6.264641761779785, "global_step": 89402, "epoch": 2128} {"train_loss": -6.2631964683532715, "global_step": 89403, "epoch": 2128} {"train_loss": -6.204158782958984, "global_step": 89404, "epoch": 2128} {"train_loss": -6.233408451080322, "global_step": 89405, "epoch": 2128} {"train_loss": -6.170276641845703, "global_step": 89406, "epoch": 2128} {"train_loss": -6.216609001159668, "global_step": 89407, "epoch": 2128} {"train_loss": -6.267491340637207, "global_step": 89408, "epoch": 2128} {"train_loss": -6.408082962036133, "global_step": 89409, "epoch": 2128} {"train_loss": -6.157688140869141, "global_step": 89410, "epoch": 2128} {"train_loss": -6.270478248596191, "global_step": 89411, "epoch": 2128} {"train_loss": -6.3005595207214355, "global_step": 89412, "epoch": 2128} {"train_loss": -6.274177551269531, "global_step": 89413, "epoch": 2128} {"train_loss": -6.215751647949219, "global_step": 89414, "epoch": 2128} {"train_loss": -6.240757942199707, "global_step": 89415, "epoch": 2128} {"train_loss": -6.337902545928955, "global_step": 89416, "epoch": 2128} {"train_loss": -6.258608761287871, "global_step": 89417, "epoch": 2128, "val_loss": 67784.7890625} {"train_loss": -6.287901878356934, "global_step": 89418, "epoch": 2129} {"train_loss": -6.239579200744629, "global_step": 89419, "epoch": 2129} {"train_loss": -6.213156223297119, "global_step": 89420, "epoch": 2129} {"train_loss": -6.272744178771973, "global_step": 89421, "epoch": 2129} {"train_loss": -6.267825126647949, "global_step": 89422, "epoch": 2129} {"train_loss": -6.334573745727539, "global_step": 89423, "epoch": 2129} {"train_loss": -6.206691741943359, "global_step": 89424, "epoch": 2129} {"train_loss": -6.140044212341309, "global_step": 89425, "epoch": 2129} {"train_loss": -6.24532413482666, "global_step": 89426, "epoch": 2129} {"train_loss": -6.270453453063965, "global_step": 89427, "epoch": 2129} {"train_loss": -6.116009712219238, "global_step": 89428, "epoch": 2129} {"train_loss": -6.249993324279785, "global_step": 89429, "epoch": 2129} {"train_loss": -6.2721476554870605, "global_step": 89430, "epoch": 2129} {"train_loss": -6.3039703369140625, "global_step": 89431, "epoch": 2129} {"train_loss": -6.182587623596191, "global_step": 89432, "epoch": 2129} {"train_loss": -6.278320789337158, "global_step": 89433, "epoch": 2129} {"train_loss": -6.299731254577637, "global_step": 89434, "epoch": 2129} {"train_loss": -6.264899730682373, "global_step": 89435, "epoch": 2129} {"train_loss": -6.134849548339844, "global_step": 89436, "epoch": 2129} {"train_loss": -6.305858612060547, "global_step": 89437, "epoch": 2129} {"train_loss": -6.250171661376953, "global_step": 89438, "epoch": 2129} {"train_loss": -6.072079658508301, "global_step": 89439, "epoch": 2129} {"train_loss": -6.209977626800537, "global_step": 89440, "epoch": 2129} {"train_loss": -6.212651252746582, "global_step": 89441, "epoch": 2129} {"train_loss": -6.1327409744262695, "global_step": 89442, "epoch": 2129} {"train_loss": -6.318605422973633, "global_step": 89443, "epoch": 2129} {"train_loss": -6.168471336364746, "global_step": 89444, "epoch": 2129} {"train_loss": -6.219280242919922, "global_step": 89445, "epoch": 2129} {"train_loss": -6.219244480133057, "global_step": 89446, "epoch": 2129} {"train_loss": -6.331916809082031, "global_step": 89447, "epoch": 2129} {"train_loss": -6.254398822784424, "global_step": 89448, "epoch": 2129} {"train_loss": -6.162622451782227, "global_step": 89449, "epoch": 2129} {"train_loss": -6.314639568328857, "global_step": 89450, "epoch": 2129} {"train_loss": -6.198150634765625, "global_step": 89451, "epoch": 2129} {"train_loss": -6.364312171936035, "global_step": 89452, "epoch": 2129} {"train_loss": -6.294088363647461, "global_step": 89453, "epoch": 2129} {"train_loss": -6.228056907653809, "global_step": 89454, "epoch": 2129} {"train_loss": -6.197626113891602, "global_step": 89455, "epoch": 2129} {"train_loss": -6.345452785491943, "global_step": 89456, "epoch": 2129} {"train_loss": -6.206633567810059, "global_step": 89457, "epoch": 2129} {"train_loss": -6.223681449890137, "global_step": 89458, "epoch": 2129} {"train_loss": -6.237399123963856, "global_step": 89459, "epoch": 2129, "val_loss": 67892.03125} {"train_loss": -6.227019786834717, "global_step": 89460, "epoch": 2130} {"train_loss": -6.250078201293945, "global_step": 89461, "epoch": 2130} {"train_loss": -6.229808807373047, "global_step": 89462, "epoch": 2130} {"train_loss": -6.208544731140137, "global_step": 89463, "epoch": 2130} {"train_loss": -6.317924499511719, "global_step": 89464, "epoch": 2130} {"train_loss": -6.171900272369385, "global_step": 89465, "epoch": 2130} {"train_loss": -6.144619941711426, "global_step": 89466, "epoch": 2130} {"train_loss": -6.302856922149658, "global_step": 89467, "epoch": 2130} {"train_loss": -6.3646039962768555, "global_step": 89468, "epoch": 2130} {"train_loss": -6.23265266418457, "global_step": 89469, "epoch": 2130} {"train_loss": -6.238525867462158, "global_step": 89470, "epoch": 2130} {"train_loss": -6.269811630249023, "global_step": 89471, "epoch": 2130} {"train_loss": -6.2381744384765625, "global_step": 89472, "epoch": 2130} {"train_loss": -6.139272689819336, "global_step": 89473, "epoch": 2130} {"train_loss": -6.146543025970459, "global_step": 89474, "epoch": 2130} {"train_loss": -6.18794059753418, "global_step": 89475, "epoch": 2130} {"train_loss": -6.209773540496826, "global_step": 89476, "epoch": 2130} {"train_loss": -6.21385383605957, "global_step": 89477, "epoch": 2130} {"train_loss": -6.230981826782227, "global_step": 89478, "epoch": 2130} {"train_loss": -6.222586631774902, "global_step": 89479, "epoch": 2130} {"train_loss": -6.1676201820373535, "global_step": 89480, "epoch": 2130} {"train_loss": -6.133398056030273, "global_step": 89481, "epoch": 2130} {"train_loss": -6.123162746429443, "global_step": 89482, "epoch": 2130} {"train_loss": -6.159948825836182, "global_step": 89483, "epoch": 2130} {"train_loss": -6.127835750579834, "global_step": 89484, "epoch": 2130} {"train_loss": -6.340080261230469, "global_step": 89485, "epoch": 2130} {"train_loss": -6.147428035736084, "global_step": 89486, "epoch": 2130} {"train_loss": -6.153924465179443, "global_step": 89487, "epoch": 2130} {"train_loss": -6.31010103225708, "global_step": 89488, "epoch": 2130} {"train_loss": -6.171364784240723, "global_step": 89489, "epoch": 2130} {"train_loss": -6.195595741271973, "global_step": 89490, "epoch": 2130} {"train_loss": -6.298913955688477, "global_step": 89491, "epoch": 2130} {"train_loss": -6.177870273590088, "global_step": 89492, "epoch": 2130} {"train_loss": -6.285058498382568, "global_step": 89493, "epoch": 2130} {"train_loss": -6.216091156005859, "global_step": 89494, "epoch": 2130} {"train_loss": -6.137347221374512, "global_step": 89495, "epoch": 2130} {"train_loss": -6.237201690673828, "global_step": 89496, "epoch": 2130} {"train_loss": -6.247285842895508, "global_step": 89497, "epoch": 2130} {"train_loss": -6.192258834838867, "global_step": 89498, "epoch": 2130} {"train_loss": -6.287047386169434, "global_step": 89499, "epoch": 2130} {"train_loss": -6.267085552215576, "global_step": 89500, "epoch": 2130} {"train_loss": -6.21745320728847, "global_step": 89501, "epoch": 2130, "val_loss": 67885.90625} {"train_loss": -6.294998645782471, "global_step": 89502, "epoch": 2131} {"train_loss": -6.251657962799072, "global_step": 89503, "epoch": 2131} {"train_loss": -6.1699981689453125, "global_step": 89504, "epoch": 2131} {"train_loss": -6.264904022216797, "global_step": 89505, "epoch": 2131} {"train_loss": -6.18674373626709, "global_step": 89506, "epoch": 2131} {"train_loss": -6.305907726287842, "global_step": 89507, "epoch": 2131} {"train_loss": -6.184120178222656, "global_step": 89508, "epoch": 2131} {"train_loss": -6.20536994934082, "global_step": 89509, "epoch": 2131} {"train_loss": -6.302007675170898, "global_step": 89510, "epoch": 2131} {"train_loss": -6.217205047607422, "global_step": 89511, "epoch": 2131} {"train_loss": -6.316089630126953, "global_step": 89512, "epoch": 2131} {"train_loss": -6.259631633758545, "global_step": 89513, "epoch": 2131} {"train_loss": -6.264313697814941, "global_step": 89514, "epoch": 2131} {"train_loss": -6.233331680297852, "global_step": 89515, "epoch": 2131} {"train_loss": -6.1646318435668945, "global_step": 89516, "epoch": 2131} {"train_loss": -6.201069355010986, "global_step": 89517, "epoch": 2131} {"train_loss": -6.2049713134765625, "global_step": 89518, "epoch": 2131} {"train_loss": -6.198387145996094, "global_step": 89519, "epoch": 2131} {"train_loss": -6.141127109527588, "global_step": 89520, "epoch": 2131} {"train_loss": -6.090042591094971, "global_step": 89521, "epoch": 2131} {"train_loss": -6.343580722808838, "global_step": 89522, "epoch": 2131} {"train_loss": -6.152439117431641, "global_step": 89523, "epoch": 2131} {"train_loss": -6.2343573570251465, "global_step": 89524, "epoch": 2131} {"train_loss": -6.304808616638184, "global_step": 89525, "epoch": 2131} {"train_loss": -6.202484130859375, "global_step": 89526, "epoch": 2131} {"train_loss": -6.218117713928223, "global_step": 89527, "epoch": 2131} {"train_loss": -6.336173057556152, "global_step": 89528, "epoch": 2131} {"train_loss": -6.204054832458496, "global_step": 89529, "epoch": 2131} {"train_loss": -6.198616027832031, "global_step": 89530, "epoch": 2131} {"train_loss": -6.186470985412598, "global_step": 89531, "epoch": 2131} {"train_loss": -6.284322261810303, "global_step": 89532, "epoch": 2131} {"train_loss": -6.3371100425720215, "global_step": 89533, "epoch": 2131} {"train_loss": -6.176991939544678, "global_step": 89534, "epoch": 2131} {"train_loss": -6.308261871337891, "global_step": 89535, "epoch": 2131} {"train_loss": -6.275801181793213, "global_step": 89536, "epoch": 2131} {"train_loss": -6.297425746917725, "global_step": 89537, "epoch": 2131} {"train_loss": -6.370652198791504, "global_step": 89538, "epoch": 2131} {"train_loss": -6.234162330627441, "global_step": 89539, "epoch": 2131} {"train_loss": -6.282230377197266, "global_step": 89540, "epoch": 2131} {"train_loss": -6.276119232177734, "global_step": 89541, "epoch": 2131} {"train_loss": -6.213286876678467, "global_step": 89542, "epoch": 2131} {"train_loss": -6.240961074829102, "global_step": 89543, "epoch": 2131, "val_loss": 68001.3984375} {"train_loss": -6.276163101196289, "global_step": 89544, "epoch": 2132} {"train_loss": -6.204645156860352, "global_step": 89545, "epoch": 2132} {"train_loss": -6.157593727111816, "global_step": 89546, "epoch": 2132} {"train_loss": -6.3179216384887695, "global_step": 89547, "epoch": 2132} {"train_loss": -6.19238805770874, "global_step": 89548, "epoch": 2132} {"train_loss": -6.198170185089111, "global_step": 89549, "epoch": 2132} {"train_loss": -6.266181468963623, "global_step": 89550, "epoch": 2132} {"train_loss": -6.306589603424072, "global_step": 89551, "epoch": 2132} {"train_loss": -6.234002113342285, "global_step": 89552, "epoch": 2132} {"train_loss": -6.266195297241211, "global_step": 89553, "epoch": 2132} {"train_loss": -6.27834415435791, "global_step": 89554, "epoch": 2132} {"train_loss": -6.25422477722168, "global_step": 89555, "epoch": 2132} {"train_loss": -6.231844902038574, "global_step": 89556, "epoch": 2132} {"train_loss": -6.1685333251953125, "global_step": 89557, "epoch": 2132} {"train_loss": -6.135854721069336, "global_step": 89558, "epoch": 2132} {"train_loss": -6.181469917297363, "global_step": 89559, "epoch": 2132} {"train_loss": -6.202747821807861, "global_step": 89560, "epoch": 2132} {"train_loss": -5.994768142700195, "global_step": 89561, "epoch": 2132} {"train_loss": -6.16326904296875, "global_step": 89562, "epoch": 2132} {"train_loss": -6.2181596755981445, "global_step": 89563, "epoch": 2132} {"train_loss": -6.0805463790893555, "global_step": 89564, "epoch": 2132} {"train_loss": -6.205710411071777, "global_step": 89565, "epoch": 2132} {"train_loss": -6.101737022399902, "global_step": 89566, "epoch": 2132} {"train_loss": -6.2606201171875, "global_step": 89567, "epoch": 2132} {"train_loss": -6.158758163452148, "global_step": 89568, "epoch": 2132} {"train_loss": -6.18317985534668, "global_step": 89569, "epoch": 2132} {"train_loss": -6.136087417602539, "global_step": 89570, "epoch": 2132} {"train_loss": -6.202904224395752, "global_step": 89571, "epoch": 2132} {"train_loss": -6.206892967224121, "global_step": 89572, "epoch": 2132} {"train_loss": -6.075687408447266, "global_step": 89573, "epoch": 2132} {"train_loss": -6.216594219207764, "global_step": 89574, "epoch": 2132} {"train_loss": -6.113316059112549, "global_step": 89575, "epoch": 2132} {"train_loss": -6.181805610656738, "global_step": 89576, "epoch": 2132} {"train_loss": -6.222047805786133, "global_step": 89577, "epoch": 2132} {"train_loss": -6.150357723236084, "global_step": 89578, "epoch": 2132} {"train_loss": -6.158975124359131, "global_step": 89579, "epoch": 2132} {"train_loss": -6.191000938415527, "global_step": 89580, "epoch": 2132} {"train_loss": -6.271030426025391, "global_step": 89581, "epoch": 2132} {"train_loss": -6.188910484313965, "global_step": 89582, "epoch": 2132} {"train_loss": -6.167082786560059, "global_step": 89583, "epoch": 2132} {"train_loss": -6.27211856842041, "global_step": 89584, "epoch": 2132} {"train_loss": -6.196353957766578, "global_step": 89585, "epoch": 2132, "val_loss": 67834.1484375} {"train_loss": -6.152860641479492, "global_step": 89586, "epoch": 2133} {"train_loss": -6.279095649719238, "global_step": 89587, "epoch": 2133} {"train_loss": -6.205636978149414, "global_step": 89588, "epoch": 2133} {"train_loss": -6.10212516784668, "global_step": 89589, "epoch": 2133} {"train_loss": -6.1770524978637695, "global_step": 89590, "epoch": 2133} {"train_loss": -6.008903503417969, "global_step": 89591, "epoch": 2133} {"train_loss": -6.094692230224609, "global_step": 89592, "epoch": 2133} {"train_loss": -6.146947383880615, "global_step": 89593, "epoch": 2133} {"train_loss": -6.128639221191406, "global_step": 89594, "epoch": 2133} {"train_loss": -6.176873207092285, "global_step": 89595, "epoch": 2133} {"train_loss": -6.113788604736328, "global_step": 89596, "epoch": 2133} {"train_loss": -6.208515167236328, "global_step": 89597, "epoch": 2133} {"train_loss": -6.097900390625, "global_step": 89598, "epoch": 2133} {"train_loss": -6.260857582092285, "global_step": 89599, "epoch": 2133} {"train_loss": -6.2385735511779785, "global_step": 89600, "epoch": 2133} {"train_loss": -6.246931076049805, "global_step": 89601, "epoch": 2133} {"train_loss": -6.176807403564453, "global_step": 89602, "epoch": 2133} {"train_loss": -6.128819465637207, "global_step": 89603, "epoch": 2133} {"train_loss": -6.208286285400391, "global_step": 89604, "epoch": 2133} {"train_loss": -6.194500923156738, "global_step": 89605, "epoch": 2133} {"train_loss": -6.236241340637207, "global_step": 89606, "epoch": 2133} {"train_loss": -6.367172718048096, "global_step": 89607, "epoch": 2133} {"train_loss": -6.319704532623291, "global_step": 89608, "epoch": 2133} {"train_loss": -6.264638900756836, "global_step": 89609, "epoch": 2133} {"train_loss": -6.270206451416016, "global_step": 89610, "epoch": 2133} {"train_loss": -6.254398345947266, "global_step": 89611, "epoch": 2133} {"train_loss": -6.305642127990723, "global_step": 89612, "epoch": 2133} {"train_loss": -6.184542655944824, "global_step": 89613, "epoch": 2133} {"train_loss": -6.226186752319336, "global_step": 89614, "epoch": 2133} {"train_loss": -6.185564041137695, "global_step": 89615, "epoch": 2133} {"train_loss": -6.247854709625244, "global_step": 89616, "epoch": 2133} {"train_loss": -6.175840854644775, "global_step": 89617, "epoch": 2133} {"train_loss": -6.290987014770508, "global_step": 89618, "epoch": 2133} {"train_loss": -6.078529357910156, "global_step": 89619, "epoch": 2133} {"train_loss": -6.15855598449707, "global_step": 89620, "epoch": 2133} {"train_loss": -6.197608470916748, "global_step": 89621, "epoch": 2133} {"train_loss": -6.200658798217773, "global_step": 89622, "epoch": 2133} {"train_loss": -6.2533440589904785, "global_step": 89623, "epoch": 2133} {"train_loss": -6.117791175842285, "global_step": 89624, "epoch": 2133} {"train_loss": -6.1458001136779785, "global_step": 89625, "epoch": 2133} {"train_loss": -6.1172637939453125, "global_step": 89626, "epoch": 2133} {"train_loss": -6.194914942695981, "global_step": 89627, "epoch": 2133, "val_loss": 67875.828125} {"train_loss": -6.053457736968994, "global_step": 89628, "epoch": 2134} {"train_loss": -6.204505920410156, "global_step": 89629, "epoch": 2134} {"train_loss": -6.16949462890625, "global_step": 89630, "epoch": 2134} {"train_loss": -6.307882308959961, "global_step": 89631, "epoch": 2134} {"train_loss": -6.168169021606445, "global_step": 89632, "epoch": 2134} {"train_loss": -6.163858413696289, "global_step": 89633, "epoch": 2134} {"train_loss": -6.115103244781494, "global_step": 89634, "epoch": 2134} {"train_loss": -6.145834922790527, "global_step": 89635, "epoch": 2134} {"train_loss": -6.168925762176514, "global_step": 89636, "epoch": 2134} {"train_loss": -6.281027793884277, "global_step": 89637, "epoch": 2134} {"train_loss": -6.227150917053223, "global_step": 89638, "epoch": 2134} {"train_loss": -6.2494049072265625, "global_step": 89639, "epoch": 2134} {"train_loss": -6.142728805541992, "global_step": 89640, "epoch": 2134} {"train_loss": -6.248788833618164, "global_step": 89641, "epoch": 2134} {"train_loss": -6.284633159637451, "global_step": 89642, "epoch": 2134} {"train_loss": -6.133997440338135, "global_step": 89643, "epoch": 2134} {"train_loss": -6.083553791046143, "global_step": 89644, "epoch": 2134} {"train_loss": -6.276546478271484, "global_step": 89645, "epoch": 2134} {"train_loss": -6.135332107543945, "global_step": 89646, "epoch": 2134} {"train_loss": -6.1690521240234375, "global_step": 89647, "epoch": 2134} {"train_loss": -6.230830669403076, "global_step": 89648, "epoch": 2134} {"train_loss": -6.3429694175720215, "global_step": 89649, "epoch": 2134} {"train_loss": -6.133259296417236, "global_step": 89650, "epoch": 2134} {"train_loss": -6.314204692840576, "global_step": 89651, "epoch": 2134} {"train_loss": -6.225316047668457, "global_step": 89652, "epoch": 2134} {"train_loss": -6.1997833251953125, "global_step": 89653, "epoch": 2134} {"train_loss": -6.203376293182373, "global_step": 89654, "epoch": 2134} {"train_loss": -6.185318946838379, "global_step": 89655, "epoch": 2134} {"train_loss": -6.174262046813965, "global_step": 89656, "epoch": 2134} {"train_loss": -6.300005912780762, "global_step": 89657, "epoch": 2134} {"train_loss": -6.159644603729248, "global_step": 89658, "epoch": 2134} {"train_loss": -6.1449408531188965, "global_step": 89659, "epoch": 2134} {"train_loss": -6.0735626220703125, "global_step": 89660, "epoch": 2134} {"train_loss": -6.343174457550049, "global_step": 89661, "epoch": 2134} {"train_loss": -6.219111442565918, "global_step": 89662, "epoch": 2134} {"train_loss": -6.287392616271973, "global_step": 89663, "epoch": 2134} {"train_loss": -6.257148742675781, "global_step": 89664, "epoch": 2134} {"train_loss": -6.240102767944336, "global_step": 89665, "epoch": 2134} {"train_loss": -6.237153053283691, "global_step": 89666, "epoch": 2134} {"train_loss": -6.231717586517334, "global_step": 89667, "epoch": 2134} {"train_loss": -6.2858076095581055, "global_step": 89668, "epoch": 2134} {"train_loss": -6.206547748474848, "global_step": 89669, "epoch": 2134, "val_loss": 67931.3046875} {"train_loss": -6.300759315490723, "global_step": 89670, "epoch": 2135} {"train_loss": -6.182741165161133, "global_step": 89671, "epoch": 2135} {"train_loss": -6.243381977081299, "global_step": 89672, "epoch": 2135} {"train_loss": -6.235525131225586, "global_step": 89673, "epoch": 2135} {"train_loss": -6.241715431213379, "global_step": 89674, "epoch": 2135} {"train_loss": -6.196465492248535, "global_step": 89675, "epoch": 2135} {"train_loss": -6.335309982299805, "global_step": 89676, "epoch": 2135} {"train_loss": -6.337071418762207, "global_step": 89677, "epoch": 2135} {"train_loss": -6.346896648406982, "global_step": 89678, "epoch": 2135} {"train_loss": -6.243968486785889, "global_step": 89679, "epoch": 2135} {"train_loss": -6.1959428787231445, "global_step": 89680, "epoch": 2135} {"train_loss": -6.165128707885742, "global_step": 89681, "epoch": 2135} {"train_loss": -6.296012878417969, "global_step": 89682, "epoch": 2135} {"train_loss": -6.252457618713379, "global_step": 89683, "epoch": 2135} {"train_loss": -6.268036365509033, "global_step": 89684, "epoch": 2135} {"train_loss": -6.310447692871094, "global_step": 89685, "epoch": 2135} {"train_loss": -6.231521129608154, "global_step": 89686, "epoch": 2135} {"train_loss": -6.090986251831055, "global_step": 89687, "epoch": 2135} {"train_loss": -6.250403881072998, "global_step": 89688, "epoch": 2135} {"train_loss": -6.175236701965332, "global_step": 89689, "epoch": 2135} {"train_loss": -6.214066505432129, "global_step": 89690, "epoch": 2135} {"train_loss": -6.250551700592041, "global_step": 89691, "epoch": 2135} {"train_loss": -6.326471328735352, "global_step": 89692, "epoch": 2135} {"train_loss": -6.314514636993408, "global_step": 89693, "epoch": 2135} {"train_loss": -6.224423408508301, "global_step": 89694, "epoch": 2135} {"train_loss": -6.209997177124023, "global_step": 89695, "epoch": 2135} {"train_loss": -6.221580982208252, "global_step": 89696, "epoch": 2135} {"train_loss": -6.240072727203369, "global_step": 89697, "epoch": 2135} {"train_loss": -6.130049705505371, "global_step": 89698, "epoch": 2135} {"train_loss": -6.229463577270508, "global_step": 89699, "epoch": 2135} {"train_loss": -6.284274101257324, "global_step": 89700, "epoch": 2135} {"train_loss": -6.256616592407227, "global_step": 89701, "epoch": 2135} {"train_loss": -6.254073143005371, "global_step": 89702, "epoch": 2135} {"train_loss": -6.228423118591309, "global_step": 89703, "epoch": 2135} {"train_loss": -6.105060577392578, "global_step": 89704, "epoch": 2135} {"train_loss": -6.3211565017700195, "global_step": 89705, "epoch": 2135} {"train_loss": -6.162872791290283, "global_step": 89706, "epoch": 2135} {"train_loss": -6.078132629394531, "global_step": 89707, "epoch": 2135} {"train_loss": -6.151071548461914, "global_step": 89708, "epoch": 2135} {"train_loss": -6.2506914138793945, "global_step": 89709, "epoch": 2135} {"train_loss": -6.188714504241943, "global_step": 89710, "epoch": 2135} {"train_loss": -6.233740443275089, "global_step": 89711, "epoch": 2135, "val_loss": 67718.9921875} {"train_loss": -6.2485857009887695, "global_step": 89712, "epoch": 2136} {"train_loss": -6.233993053436279, "global_step": 89713, "epoch": 2136} {"train_loss": -6.311345100402832, "global_step": 89714, "epoch": 2136} {"train_loss": -6.318673133850098, "global_step": 89715, "epoch": 2136} {"train_loss": -6.253719329833984, "global_step": 89716, "epoch": 2136} {"train_loss": -6.196160793304443, "global_step": 89717, "epoch": 2136} {"train_loss": -6.219888687133789, "global_step": 89718, "epoch": 2136} {"train_loss": -6.320394039154053, "global_step": 89719, "epoch": 2136} {"train_loss": -6.253671646118164, "global_step": 89720, "epoch": 2136} {"train_loss": -6.273690700531006, "global_step": 89721, "epoch": 2136} {"train_loss": -6.294133186340332, "global_step": 89722, "epoch": 2136} {"train_loss": -6.361403465270996, "global_step": 89723, "epoch": 2136} {"train_loss": -6.168849945068359, "global_step": 89724, "epoch": 2136} {"train_loss": -6.255908966064453, "global_step": 89725, "epoch": 2136} {"train_loss": -6.18742561340332, "global_step": 89726, "epoch": 2136} {"train_loss": -6.226208686828613, "global_step": 89727, "epoch": 2136} {"train_loss": -6.21434211730957, "global_step": 89728, "epoch": 2136} {"train_loss": -6.284493446350098, "global_step": 89729, "epoch": 2136} {"train_loss": -6.307646751403809, "global_step": 89730, "epoch": 2136} {"train_loss": -6.257723808288574, "global_step": 89731, "epoch": 2136} {"train_loss": -6.247143745422363, "global_step": 89732, "epoch": 2136} {"train_loss": -6.314077377319336, "global_step": 89733, "epoch": 2136} {"train_loss": -6.194710731506348, "global_step": 89734, "epoch": 2136} {"train_loss": -6.238223075866699, "global_step": 89735, "epoch": 2136} {"train_loss": -6.178588390350342, "global_step": 89736, "epoch": 2136} {"train_loss": -6.225102424621582, "global_step": 89737, "epoch": 2136} {"train_loss": -6.257898330688477, "global_step": 89738, "epoch": 2136} {"train_loss": -6.201294422149658, "global_step": 89739, "epoch": 2136} {"train_loss": -6.296762466430664, "global_step": 89740, "epoch": 2136} {"train_loss": -6.203333854675293, "global_step": 89741, "epoch": 2136} {"train_loss": -6.248600006103516, "global_step": 89742, "epoch": 2136} {"train_loss": -6.106266498565674, "global_step": 89743, "epoch": 2136} {"train_loss": -6.356855392456055, "global_step": 89744, "epoch": 2136} {"train_loss": -6.2800750732421875, "global_step": 89745, "epoch": 2136} {"train_loss": -6.321986675262451, "global_step": 89746, "epoch": 2136} {"train_loss": -6.26616096496582, "global_step": 89747, "epoch": 2136} {"train_loss": -6.247865676879883, "global_step": 89748, "epoch": 2136} {"train_loss": -6.335948944091797, "global_step": 89749, "epoch": 2136} {"train_loss": -6.29360818862915, "global_step": 89750, "epoch": 2136} {"train_loss": -6.241604804992676, "global_step": 89751, "epoch": 2136} {"train_loss": -6.323883056640625, "global_step": 89752, "epoch": 2136} {"train_loss": -6.2573074840364, "global_step": 89753, "epoch": 2136, "val_loss": 67913.6796875} {"train_loss": -6.336706161499023, "global_step": 89754, "epoch": 2137} {"train_loss": -6.272046089172363, "global_step": 89755, "epoch": 2137} {"train_loss": -6.179328918457031, "global_step": 89756, "epoch": 2137} {"train_loss": -6.3557891845703125, "global_step": 89757, "epoch": 2137} {"train_loss": -6.262358665466309, "global_step": 89758, "epoch": 2137} {"train_loss": -6.279642105102539, "global_step": 89759, "epoch": 2137} {"train_loss": -6.394505500793457, "global_step": 89760, "epoch": 2137} {"train_loss": -6.151824474334717, "global_step": 89761, "epoch": 2137} {"train_loss": -6.245048522949219, "global_step": 89762, "epoch": 2137} {"train_loss": -6.151230812072754, "global_step": 89763, "epoch": 2137} {"train_loss": -6.311565399169922, "global_step": 89764, "epoch": 2137} {"train_loss": -6.295485973358154, "global_step": 89765, "epoch": 2137} {"train_loss": -6.175014495849609, "global_step": 89766, "epoch": 2137} {"train_loss": -6.239848613739014, "global_step": 89767, "epoch": 2137} {"train_loss": -6.309661865234375, "global_step": 89768, "epoch": 2137} {"train_loss": -6.2154998779296875, "global_step": 89769, "epoch": 2137} {"train_loss": -6.23232364654541, "global_step": 89770, "epoch": 2137} {"train_loss": -6.138167381286621, "global_step": 89771, "epoch": 2137} {"train_loss": -6.218499183654785, "global_step": 89772, "epoch": 2137} {"train_loss": -6.230156898498535, "global_step": 89773, "epoch": 2137} {"train_loss": -6.29069709777832, "global_step": 89774, "epoch": 2137} {"train_loss": -6.2633514404296875, "global_step": 89775, "epoch": 2137} {"train_loss": -6.245509624481201, "global_step": 89776, "epoch": 2137} {"train_loss": -6.266363620758057, "global_step": 89777, "epoch": 2137} {"train_loss": -6.221968650817871, "global_step": 89778, "epoch": 2137} {"train_loss": -6.186092376708984, "global_step": 89779, "epoch": 2137} {"train_loss": -6.178998947143555, "global_step": 89780, "epoch": 2137} {"train_loss": -6.361882209777832, "global_step": 89781, "epoch": 2137} {"train_loss": -6.335206031799316, "global_step": 89782, "epoch": 2137} {"train_loss": -6.171708583831787, "global_step": 89783, "epoch": 2137} {"train_loss": -6.249490737915039, "global_step": 89784, "epoch": 2137} {"train_loss": -6.143986701965332, "global_step": 89785, "epoch": 2137} {"train_loss": -6.088346481323242, "global_step": 89786, "epoch": 2137} {"train_loss": -6.195188522338867, "global_step": 89787, "epoch": 2137} {"train_loss": -6.08374547958374, "global_step": 89788, "epoch": 2137} {"train_loss": -6.159905910491943, "global_step": 89789, "epoch": 2137} {"train_loss": -6.176693439483643, "global_step": 89790, "epoch": 2137} {"train_loss": -6.182087421417236, "global_step": 89791, "epoch": 2137} {"train_loss": -6.053177356719971, "global_step": 89792, "epoch": 2137} {"train_loss": -6.261761665344238, "global_step": 89793, "epoch": 2137} {"train_loss": -6.202939033508301, "global_step": 89794, "epoch": 2137} {"train_loss": -6.227753786813645, "global_step": 89795, "epoch": 2137, "val_loss": 67928.9921875} {"train_loss": -6.194676399230957, "global_step": 89796, "epoch": 2138} {"train_loss": -6.157826900482178, "global_step": 89797, "epoch": 2138} {"train_loss": -6.308350563049316, "global_step": 89798, "epoch": 2138} {"train_loss": -6.292649269104004, "global_step": 89799, "epoch": 2138} {"train_loss": -6.14277982711792, "global_step": 89800, "epoch": 2138} {"train_loss": -6.1663947105407715, "global_step": 89801, "epoch": 2138} {"train_loss": -6.252679824829102, "global_step": 89802, "epoch": 2138} {"train_loss": -6.208423614501953, "global_step": 89803, "epoch": 2138} {"train_loss": -6.11318826675415, "global_step": 89804, "epoch": 2138} {"train_loss": -6.284151077270508, "global_step": 89805, "epoch": 2138} {"train_loss": -6.206944942474365, "global_step": 89806, "epoch": 2138} {"train_loss": -6.115542888641357, "global_step": 89807, "epoch": 2138} {"train_loss": -6.196544647216797, "global_step": 89808, "epoch": 2138} {"train_loss": -6.204427719116211, "global_step": 89809, "epoch": 2138} {"train_loss": -6.232877254486084, "global_step": 89810, "epoch": 2138} {"train_loss": -6.179697036743164, "global_step": 89811, "epoch": 2138} {"train_loss": -6.086350917816162, "global_step": 89812, "epoch": 2138} {"train_loss": -6.131802082061768, "global_step": 89813, "epoch": 2138} {"train_loss": -6.178403854370117, "global_step": 89814, "epoch": 2138} {"train_loss": -6.00771427154541, "global_step": 89815, "epoch": 2138} {"train_loss": -6.087045669555664, "global_step": 89816, "epoch": 2138} {"train_loss": -6.130679607391357, "global_step": 89817, "epoch": 2138} {"train_loss": -6.091368198394775, "global_step": 89818, "epoch": 2138} {"train_loss": -6.111924648284912, "global_step": 89819, "epoch": 2138} {"train_loss": -6.077446460723877, "global_step": 89820, "epoch": 2138} {"train_loss": -6.176161766052246, "global_step": 89821, "epoch": 2138} {"train_loss": -6.28466796875, "global_step": 89822, "epoch": 2138} {"train_loss": -6.150745391845703, "global_step": 89823, "epoch": 2138} {"train_loss": -6.183963775634766, "global_step": 89824, "epoch": 2138} {"train_loss": -6.221734046936035, "global_step": 89825, "epoch": 2138} {"train_loss": -6.228865623474121, "global_step": 89826, "epoch": 2138} {"train_loss": -6.240109920501709, "global_step": 89827, "epoch": 2138} {"train_loss": -6.250698089599609, "global_step": 89828, "epoch": 2138} {"train_loss": -6.223515510559082, "global_step": 89829, "epoch": 2138} {"train_loss": -6.199887275695801, "global_step": 89830, "epoch": 2138} {"train_loss": -6.265913009643555, "global_step": 89831, "epoch": 2138} {"train_loss": -6.349223613739014, "global_step": 89832, "epoch": 2138} {"train_loss": -6.20319128036499, "global_step": 89833, "epoch": 2138} {"train_loss": -6.20676326751709, "global_step": 89834, "epoch": 2138} {"train_loss": -6.268424034118652, "global_step": 89835, "epoch": 2138} {"train_loss": -6.148077964782715, "global_step": 89836, "epoch": 2138} {"train_loss": -6.194440353484381, "global_step": 89837, "epoch": 2138, "val_loss": 67739.0078125} {"train_loss": -6.237388610839844, "global_step": 89838, "epoch": 2139} {"train_loss": -6.197066307067871, "global_step": 89839, "epoch": 2139} {"train_loss": -6.2591471672058105, "global_step": 89840, "epoch": 2139} {"train_loss": -6.290608882904053, "global_step": 89841, "epoch": 2139} {"train_loss": -6.1808271408081055, "global_step": 89842, "epoch": 2139} {"train_loss": -6.224620819091797, "global_step": 89843, "epoch": 2139} {"train_loss": -6.3806562423706055, "global_step": 89844, "epoch": 2139} {"train_loss": -6.3834614753723145, "global_step": 89845, "epoch": 2139} {"train_loss": -6.186149597167969, "global_step": 89846, "epoch": 2139} {"train_loss": -6.302150726318359, "global_step": 89847, "epoch": 2139} {"train_loss": -6.2601423263549805, "global_step": 89848, "epoch": 2139} {"train_loss": -6.210361480712891, "global_step": 89849, "epoch": 2139} {"train_loss": -6.1927690505981445, "global_step": 89850, "epoch": 2139} {"train_loss": -6.1696977615356445, "global_step": 89851, "epoch": 2139} {"train_loss": -6.357601165771484, "global_step": 89852, "epoch": 2139} {"train_loss": -6.281617164611816, "global_step": 89853, "epoch": 2139} {"train_loss": -6.27216911315918, "global_step": 89854, "epoch": 2139} {"train_loss": -6.403109550476074, "global_step": 89855, "epoch": 2139} {"train_loss": -6.206705570220947, "global_step": 89856, "epoch": 2139} {"train_loss": -6.176181316375732, "global_step": 89857, "epoch": 2139} {"train_loss": -6.272058963775635, "global_step": 89858, "epoch": 2139} {"train_loss": -6.2418670654296875, "global_step": 89859, "epoch": 2139} {"train_loss": -6.300455093383789, "global_step": 89860, "epoch": 2139} {"train_loss": -6.2350897789001465, "global_step": 89861, "epoch": 2139} {"train_loss": -6.1839189529418945, "global_step": 89862, "epoch": 2139} {"train_loss": -6.292599678039551, "global_step": 89863, "epoch": 2139} {"train_loss": -6.380765914916992, "global_step": 89864, "epoch": 2139} {"train_loss": -6.236959934234619, "global_step": 89865, "epoch": 2139} {"train_loss": -6.267108917236328, "global_step": 89866, "epoch": 2139} {"train_loss": -6.132760047912598, "global_step": 89867, "epoch": 2139} {"train_loss": -6.291390419006348, "global_step": 89868, "epoch": 2139} {"train_loss": -6.29942512512207, "global_step": 89869, "epoch": 2139} {"train_loss": -6.222964286804199, "global_step": 89870, "epoch": 2139} {"train_loss": -6.167174339294434, "global_step": 89871, "epoch": 2139} {"train_loss": -6.324058532714844, "global_step": 89872, "epoch": 2139} {"train_loss": -6.3082427978515625, "global_step": 89873, "epoch": 2139} {"train_loss": -6.282240867614746, "global_step": 89874, "epoch": 2139} {"train_loss": -6.200722694396973, "global_step": 89875, "epoch": 2139} {"train_loss": -6.27764892578125, "global_step": 89876, "epoch": 2139} {"train_loss": -6.267734527587891, "global_step": 89877, "epoch": 2139} {"train_loss": -6.307448863983154, "global_step": 89878, "epoch": 2139} {"train_loss": -6.262477749869937, "global_step": 89879, "epoch": 2139, "val_loss": 67787.8125} {"train_loss": -6.298362731933594, "global_step": 89880, "epoch": 2140} {"train_loss": -6.293389320373535, "global_step": 89881, "epoch": 2140} {"train_loss": -6.190939903259277, "global_step": 89882, "epoch": 2140} {"train_loss": -6.2982401847839355, "global_step": 89883, "epoch": 2140} {"train_loss": -6.297089576721191, "global_step": 89884, "epoch": 2140} {"train_loss": -6.248315811157227, "global_step": 89885, "epoch": 2140} {"train_loss": -6.358114719390869, "global_step": 89886, "epoch": 2140} {"train_loss": -6.1302995681762695, "global_step": 89887, "epoch": 2140} {"train_loss": -6.160754203796387, "global_step": 89888, "epoch": 2140} {"train_loss": -6.300055027008057, "global_step": 89889, "epoch": 2140} {"train_loss": -6.2378339767456055, "global_step": 89890, "epoch": 2140} {"train_loss": -6.145400047302246, "global_step": 89891, "epoch": 2140} {"train_loss": -6.304643154144287, "global_step": 89892, "epoch": 2140} {"train_loss": -6.146145820617676, "global_step": 89893, "epoch": 2140} {"train_loss": -6.108582496643066, "global_step": 89894, "epoch": 2140} {"train_loss": -6.267920017242432, "global_step": 89895, "epoch": 2140} {"train_loss": -6.245274543762207, "global_step": 89896, "epoch": 2140} {"train_loss": -6.1866350173950195, "global_step": 89897, "epoch": 2140} {"train_loss": -6.206300258636475, "global_step": 89898, "epoch": 2140} {"train_loss": -6.230175971984863, "global_step": 89899, "epoch": 2140} {"train_loss": -6.204408645629883, "global_step": 89900, "epoch": 2140} {"train_loss": -6.124911785125732, "global_step": 89901, "epoch": 2140} {"train_loss": -6.178163528442383, "global_step": 89902, "epoch": 2140} {"train_loss": -6.277711391448975, "global_step": 89903, "epoch": 2140} {"train_loss": -6.330538749694824, "global_step": 89904, "epoch": 2140} {"train_loss": -6.2005720138549805, "global_step": 89905, "epoch": 2140} {"train_loss": -6.229783535003662, "global_step": 89906, "epoch": 2140} {"train_loss": -6.306269645690918, "global_step": 89907, "epoch": 2140} {"train_loss": -6.140824317932129, "global_step": 89908, "epoch": 2140} {"train_loss": -6.159718990325928, "global_step": 89909, "epoch": 2140} {"train_loss": -6.188963890075684, "global_step": 89910, "epoch": 2140} {"train_loss": -6.226137161254883, "global_step": 89911, "epoch": 2140} {"train_loss": -6.180177688598633, "global_step": 89912, "epoch": 2140} {"train_loss": -6.174644470214844, "global_step": 89913, "epoch": 2140} {"train_loss": -6.194580554962158, "global_step": 89914, "epoch": 2140} {"train_loss": -6.268185615539551, "global_step": 89915, "epoch": 2140} {"train_loss": -6.241364479064941, "global_step": 89916, "epoch": 2140} {"train_loss": -6.128745079040527, "global_step": 89917, "epoch": 2140} {"train_loss": -6.212393283843994, "global_step": 89918, "epoch": 2140} {"train_loss": -6.147622108459473, "global_step": 89919, "epoch": 2140} {"train_loss": -6.197315692901611, "global_step": 89920, "epoch": 2140} {"train_loss": -6.221272706985474, "global_step": 89921, "epoch": 2140, "val_loss": 68078.875} {"train_loss": -6.293245315551758, "global_step": 89922, "epoch": 2141} {"train_loss": -6.108570098876953, "global_step": 89923, "epoch": 2141} {"train_loss": -6.168923377990723, "global_step": 89924, "epoch": 2141} {"train_loss": -6.286412715911865, "global_step": 89925, "epoch": 2141} {"train_loss": -6.230248928070068, "global_step": 89926, "epoch": 2141} {"train_loss": -6.145853042602539, "global_step": 89927, "epoch": 2141} {"train_loss": -6.207873344421387, "global_step": 89928, "epoch": 2141} {"train_loss": -6.2887163162231445, "global_step": 89929, "epoch": 2141} {"train_loss": -6.357885360717773, "global_step": 89930, "epoch": 2141} {"train_loss": -6.289191246032715, "global_step": 89931, "epoch": 2141} {"train_loss": -6.282933235168457, "global_step": 89932, "epoch": 2141} {"train_loss": -6.189148902893066, "global_step": 89933, "epoch": 2141} {"train_loss": -6.3040032386779785, "global_step": 89934, "epoch": 2141} {"train_loss": -6.2421674728393555, "global_step": 89935, "epoch": 2141} {"train_loss": -6.308807849884033, "global_step": 89936, "epoch": 2141} {"train_loss": -6.23105525970459, "global_step": 89937, "epoch": 2141} {"train_loss": -6.276634693145752, "global_step": 89938, "epoch": 2141} {"train_loss": -6.074230194091797, "global_step": 89939, "epoch": 2141} {"train_loss": -6.136013031005859, "global_step": 89940, "epoch": 2141} {"train_loss": -5.994633197784424, "global_step": 89941, "epoch": 2141} {"train_loss": -6.155935287475586, "global_step": 89942, "epoch": 2141} {"train_loss": -6.145503044128418, "global_step": 89943, "epoch": 2141} {"train_loss": -6.138657569885254, "global_step": 89944, "epoch": 2141} {"train_loss": -6.083660125732422, "global_step": 89945, "epoch": 2141} {"train_loss": -6.226091384887695, "global_step": 89946, "epoch": 2141} {"train_loss": -6.053469657897949, "global_step": 89947, "epoch": 2141} {"train_loss": -6.241733551025391, "global_step": 89948, "epoch": 2141} {"train_loss": -6.008823394775391, "global_step": 89949, "epoch": 2141} {"train_loss": -6.268710613250732, "global_step": 89950, "epoch": 2141} {"train_loss": -6.175292015075684, "global_step": 89951, "epoch": 2141} {"train_loss": -6.083854675292969, "global_step": 89952, "epoch": 2141} {"train_loss": -6.237424850463867, "global_step": 89953, "epoch": 2141} {"train_loss": -6.239352703094482, "global_step": 89954, "epoch": 2141} {"train_loss": -6.19940185546875, "global_step": 89955, "epoch": 2141} {"train_loss": -6.177114963531494, "global_step": 89956, "epoch": 2141} {"train_loss": -6.251670837402344, "global_step": 89957, "epoch": 2141} {"train_loss": -6.247951984405518, "global_step": 89958, "epoch": 2141} {"train_loss": -6.257660865783691, "global_step": 89959, "epoch": 2141} {"train_loss": -6.177101135253906, "global_step": 89960, "epoch": 2141} {"train_loss": -6.214555740356445, "global_step": 89961, "epoch": 2141} {"train_loss": -6.212961196899414, "global_step": 89962, "epoch": 2141} {"train_loss": -6.200641019003732, "global_step": 89963, "epoch": 2141, "val_loss": 67781.390625} {"train_loss": -6.375953674316406, "global_step": 89964, "epoch": 2142} {"train_loss": -6.242931842803955, "global_step": 89965, "epoch": 2142} {"train_loss": -6.199522018432617, "global_step": 89966, "epoch": 2142} {"train_loss": -6.26777982711792, "global_step": 89967, "epoch": 2142} {"train_loss": -6.229379653930664, "global_step": 89968, "epoch": 2142} {"train_loss": -6.163898468017578, "global_step": 89969, "epoch": 2142} {"train_loss": -6.066112518310547, "global_step": 89970, "epoch": 2142} {"train_loss": -6.22914457321167, "global_step": 89971, "epoch": 2142} {"train_loss": -6.258209705352783, "global_step": 89972, "epoch": 2142} {"train_loss": -6.209577560424805, "global_step": 89973, "epoch": 2142} {"train_loss": -6.276149749755859, "global_step": 89974, "epoch": 2142} {"train_loss": -6.209869384765625, "global_step": 89975, "epoch": 2142} {"train_loss": -6.217859745025635, "global_step": 89976, "epoch": 2142} {"train_loss": -6.301559925079346, "global_step": 89977, "epoch": 2142} {"train_loss": -6.04473876953125, "global_step": 89978, "epoch": 2142} {"train_loss": -6.25871467590332, "global_step": 89979, "epoch": 2142} {"train_loss": -6.128281593322754, "global_step": 89980, "epoch": 2142} {"train_loss": -6.178251266479492, "global_step": 89981, "epoch": 2142} {"train_loss": -6.218181610107422, "global_step": 89982, "epoch": 2142} {"train_loss": -6.1472625732421875, "global_step": 89983, "epoch": 2142} {"train_loss": -6.330741882324219, "global_step": 89984, "epoch": 2142} {"train_loss": -6.18834114074707, "global_step": 89985, "epoch": 2142} {"train_loss": -6.089332580566406, "global_step": 89986, "epoch": 2142} {"train_loss": -6.199624061584473, "global_step": 89987, "epoch": 2142} {"train_loss": -6.236965179443359, "global_step": 89988, "epoch": 2142} {"train_loss": -6.276089191436768, "global_step": 89989, "epoch": 2142} {"train_loss": -6.080733776092529, "global_step": 89990, "epoch": 2142} {"train_loss": -6.105313301086426, "global_step": 89991, "epoch": 2142} {"train_loss": -6.140152454376221, "global_step": 89992, "epoch": 2142} {"train_loss": -6.146390914916992, "global_step": 89993, "epoch": 2142} {"train_loss": -6.273573398590088, "global_step": 89994, "epoch": 2142} {"train_loss": -6.205092430114746, "global_step": 89995, "epoch": 2142} {"train_loss": -6.21575927734375, "global_step": 89996, "epoch": 2142} {"train_loss": -6.140341758728027, "global_step": 89997, "epoch": 2142} {"train_loss": -6.210211753845215, "global_step": 89998, "epoch": 2142} {"train_loss": -6.267124176025391, "global_step": 89999, "epoch": 2142} {"train_loss": -6.116111755371094, "global_step": 90000, "epoch": 2142} {"train_loss": -6.203268051147461, "global_step": 90001, "epoch": 2142} {"train_loss": -6.220368385314941, "global_step": 90002, "epoch": 2142} {"train_loss": -6.147219657897949, "global_step": 90003, "epoch": 2142} {"train_loss": -6.329610824584961, "global_step": 90004, "epoch": 2142} {"train_loss": -6.204899424598331, "global_step": 90005, "epoch": 2142, "val_loss": 68058.515625} {"train_loss": -6.368861198425293, "global_step": 90006, "epoch": 2143} {"train_loss": -6.24008846282959, "global_step": 90007, "epoch": 2143} {"train_loss": -6.106052875518799, "global_step": 90008, "epoch": 2143} {"train_loss": -6.205813407897949, "global_step": 90009, "epoch": 2143} {"train_loss": -6.270624160766602, "global_step": 90010, "epoch": 2143} {"train_loss": -6.193630218505859, "global_step": 90011, "epoch": 2143} {"train_loss": -6.134370803833008, "global_step": 90012, "epoch": 2143} {"train_loss": -6.279077053070068, "global_step": 90013, "epoch": 2143} {"train_loss": -6.207477569580078, "global_step": 90014, "epoch": 2143} {"train_loss": -6.179725170135498, "global_step": 90015, "epoch": 2143} {"train_loss": -6.201897621154785, "global_step": 90016, "epoch": 2143} {"train_loss": -6.15546989440918, "global_step": 90017, "epoch": 2143} {"train_loss": -6.155511856079102, "global_step": 90018, "epoch": 2143} {"train_loss": -6.218873500823975, "global_step": 90019, "epoch": 2143} {"train_loss": -6.194877624511719, "global_step": 90020, "epoch": 2143} {"train_loss": -6.065803527832031, "global_step": 90021, "epoch": 2143} {"train_loss": -6.23538875579834, "global_step": 90022, "epoch": 2143} {"train_loss": -6.2350544929504395, "global_step": 90023, "epoch": 2143} {"train_loss": -6.272844314575195, "global_step": 90024, "epoch": 2143} {"train_loss": -6.294460296630859, "global_step": 90025, "epoch": 2143} {"train_loss": -6.189682483673096, "global_step": 90026, "epoch": 2143} {"train_loss": -6.271044731140137, "global_step": 90027, "epoch": 2143} {"train_loss": -6.237112045288086, "global_step": 90028, "epoch": 2143} {"train_loss": -6.218925952911377, "global_step": 90029, "epoch": 2143} {"train_loss": -6.278939723968506, "global_step": 90030, "epoch": 2143} {"train_loss": -6.329375267028809, "global_step": 90031, "epoch": 2143} {"train_loss": -6.223143577575684, "global_step": 90032, "epoch": 2143} {"train_loss": -6.132765293121338, "global_step": 90033, "epoch": 2143} {"train_loss": -6.1295061111450195, "global_step": 90034, "epoch": 2143} {"train_loss": -6.191527366638184, "global_step": 90035, "epoch": 2143} {"train_loss": -6.296652317047119, "global_step": 90036, "epoch": 2143} {"train_loss": -6.4195356369018555, "global_step": 90037, "epoch": 2143} {"train_loss": -6.22775936126709, "global_step": 90038, "epoch": 2143} {"train_loss": -6.287711143493652, "global_step": 90039, "epoch": 2143} {"train_loss": -6.190794467926025, "global_step": 90040, "epoch": 2143} {"train_loss": -6.254787445068359, "global_step": 90041, "epoch": 2143} {"train_loss": -6.127626895904541, "global_step": 90042, "epoch": 2143} {"train_loss": -6.228751182556152, "global_step": 90043, "epoch": 2143} {"train_loss": -6.148202419281006, "global_step": 90044, "epoch": 2143} {"train_loss": -6.249431610107422, "global_step": 90045, "epoch": 2143} {"train_loss": -6.209231376647949, "global_step": 90046, "epoch": 2143} {"train_loss": -6.220584699085781, "global_step": 90047, "epoch": 2143, "val_loss": 67691.7421875} {"train_loss": -6.252976417541504, "global_step": 90048, "epoch": 2144} {"train_loss": -6.177973747253418, "global_step": 90049, "epoch": 2144} {"train_loss": -6.314226150512695, "global_step": 90050, "epoch": 2144} {"train_loss": -6.263211727142334, "global_step": 90051, "epoch": 2144} {"train_loss": -6.243442535400391, "global_step": 90052, "epoch": 2144} {"train_loss": -6.215845108032227, "global_step": 90053, "epoch": 2144} {"train_loss": -6.31406831741333, "global_step": 90054, "epoch": 2144} {"train_loss": -6.16432523727417, "global_step": 90055, "epoch": 2144} {"train_loss": -6.300902843475342, "global_step": 90056, "epoch": 2144} {"train_loss": -6.354219436645508, "global_step": 90057, "epoch": 2144} {"train_loss": -6.230454921722412, "global_step": 90058, "epoch": 2144} {"train_loss": -6.140628337860107, "global_step": 90059, "epoch": 2144} {"train_loss": -6.175189971923828, "global_step": 90060, "epoch": 2144} {"train_loss": -6.3272552490234375, "global_step": 90061, "epoch": 2144} {"train_loss": -6.244607448577881, "global_step": 90062, "epoch": 2144} {"train_loss": -6.189735412597656, "global_step": 90063, "epoch": 2144} {"train_loss": -6.268638610839844, "global_step": 90064, "epoch": 2144} {"train_loss": -6.280983924865723, "global_step": 90065, "epoch": 2144} {"train_loss": -6.243669509887695, "global_step": 90066, "epoch": 2144} {"train_loss": -6.289111137390137, "global_step": 90067, "epoch": 2144} {"train_loss": -6.2822418212890625, "global_step": 90068, "epoch": 2144} {"train_loss": -6.25872802734375, "global_step": 90069, "epoch": 2144} {"train_loss": -6.134612083435059, "global_step": 90070, "epoch": 2144} {"train_loss": -6.272854328155518, "global_step": 90071, "epoch": 2144} {"train_loss": -6.286226272583008, "global_step": 90072, "epoch": 2144} {"train_loss": -6.172282695770264, "global_step": 90073, "epoch": 2144} {"train_loss": -6.235763072967529, "global_step": 90074, "epoch": 2144} {"train_loss": -6.184501647949219, "global_step": 90075, "epoch": 2144} {"train_loss": -6.241743087768555, "global_step": 90076, "epoch": 2144} {"train_loss": -6.150872230529785, "global_step": 90077, "epoch": 2144} {"train_loss": -6.414228916168213, "global_step": 90078, "epoch": 2144} {"train_loss": -6.244293212890625, "global_step": 90079, "epoch": 2144} {"train_loss": -6.282410621643066, "global_step": 90080, "epoch": 2144} {"train_loss": -6.339882850646973, "global_step": 90081, "epoch": 2144} {"train_loss": -6.16427755355835, "global_step": 90082, "epoch": 2144} {"train_loss": -6.13789176940918, "global_step": 90083, "epoch": 2144} {"train_loss": -6.2424116134643555, "global_step": 90084, "epoch": 2144} {"train_loss": -6.098351001739502, "global_step": 90085, "epoch": 2144} {"train_loss": -6.248628616333008, "global_step": 90086, "epoch": 2144} {"train_loss": -6.315950870513916, "global_step": 90087, "epoch": 2144} {"train_loss": -6.342800617218018, "global_step": 90088, "epoch": 2144} {"train_loss": -6.245517719359625, "global_step": 90089, "epoch": 2144, "val_loss": 68049.28125} {"train_loss": -6.1851806640625, "global_step": 90090, "epoch": 2145} {"train_loss": -6.243934631347656, "global_step": 90091, "epoch": 2145} {"train_loss": -6.176725387573242, "global_step": 90092, "epoch": 2145} {"train_loss": -6.282047271728516, "global_step": 90093, "epoch": 2145} {"train_loss": -6.306601524353027, "global_step": 90094, "epoch": 2145} {"train_loss": -6.231985092163086, "global_step": 90095, "epoch": 2145} {"train_loss": -6.120516777038574, "global_step": 90096, "epoch": 2145} {"train_loss": -6.129277229309082, "global_step": 90097, "epoch": 2145} {"train_loss": -6.132081985473633, "global_step": 90098, "epoch": 2145} {"train_loss": -6.194371700286865, "global_step": 90099, "epoch": 2145} {"train_loss": -6.176382064819336, "global_step": 90100, "epoch": 2145} {"train_loss": -6.137490272521973, "global_step": 90101, "epoch": 2145} {"train_loss": -6.254703521728516, "global_step": 90102, "epoch": 2145} {"train_loss": -6.177035808563232, "global_step": 90103, "epoch": 2145} {"train_loss": -6.217586040496826, "global_step": 90104, "epoch": 2145} {"train_loss": -6.322625637054443, "global_step": 90105, "epoch": 2145} {"train_loss": -6.266290664672852, "global_step": 90106, "epoch": 2145} {"train_loss": -6.234531402587891, "global_step": 90107, "epoch": 2145} {"train_loss": -6.216486930847168, "global_step": 90108, "epoch": 2145} {"train_loss": -6.156221866607666, "global_step": 90109, "epoch": 2145} {"train_loss": -6.2372236251831055, "global_step": 90110, "epoch": 2145} {"train_loss": -6.141627788543701, "global_step": 90111, "epoch": 2145} {"train_loss": -6.150053024291992, "global_step": 90112, "epoch": 2145} {"train_loss": -6.066998481750488, "global_step": 90113, "epoch": 2145} {"train_loss": -6.270252704620361, "global_step": 90114, "epoch": 2145} {"train_loss": -6.232685089111328, "global_step": 90115, "epoch": 2145} {"train_loss": -6.310264587402344, "global_step": 90116, "epoch": 2145} {"train_loss": -6.255805492401123, "global_step": 90117, "epoch": 2145} {"train_loss": -6.153331756591797, "global_step": 90118, "epoch": 2145} {"train_loss": -6.136199951171875, "global_step": 90119, "epoch": 2145} {"train_loss": -6.283989906311035, "global_step": 90120, "epoch": 2145} {"train_loss": -6.141016006469727, "global_step": 90121, "epoch": 2145} {"train_loss": -6.207503318786621, "global_step": 90122, "epoch": 2145} {"train_loss": -6.2104644775390625, "global_step": 90123, "epoch": 2145} {"train_loss": -6.264184951782227, "global_step": 90124, "epoch": 2145} {"train_loss": -6.124277114868164, "global_step": 90125, "epoch": 2145} {"train_loss": -6.289831161499023, "global_step": 90126, "epoch": 2145} {"train_loss": -6.225449085235596, "global_step": 90127, "epoch": 2145} {"train_loss": -6.2501220703125, "global_step": 90128, "epoch": 2145} {"train_loss": -6.19143009185791, "global_step": 90129, "epoch": 2145} {"train_loss": -6.224327564239502, "global_step": 90130, "epoch": 2145} {"train_loss": -6.209171987715221, "global_step": 90131, "epoch": 2145, "val_loss": 67787.8984375} {"train_loss": -6.107970237731934, "global_step": 90132, "epoch": 2146} {"train_loss": -6.281765937805176, "global_step": 90133, "epoch": 2146} {"train_loss": -6.223176002502441, "global_step": 90134, "epoch": 2146} {"train_loss": -6.22524356842041, "global_step": 90135, "epoch": 2146} {"train_loss": -6.231682777404785, "global_step": 90136, "epoch": 2146} {"train_loss": -6.300537109375, "global_step": 90137, "epoch": 2146} {"train_loss": -6.040197849273682, "global_step": 90138, "epoch": 2146} {"train_loss": -6.114537239074707, "global_step": 90139, "epoch": 2146} {"train_loss": -6.2476654052734375, "global_step": 90140, "epoch": 2146} {"train_loss": -6.248539447784424, "global_step": 90141, "epoch": 2146} {"train_loss": -6.213972091674805, "global_step": 90142, "epoch": 2146} {"train_loss": -6.263026237487793, "global_step": 90143, "epoch": 2146} {"train_loss": -6.134439468383789, "global_step": 90144, "epoch": 2146} {"train_loss": -6.233257293701172, "global_step": 90145, "epoch": 2146} {"train_loss": -6.117260932922363, "global_step": 90146, "epoch": 2146} {"train_loss": -6.196467399597168, "global_step": 90147, "epoch": 2146} {"train_loss": -6.304180145263672, "global_step": 90148, "epoch": 2146} {"train_loss": -6.133738994598389, "global_step": 90149, "epoch": 2146} {"train_loss": -6.262252330780029, "global_step": 90150, "epoch": 2146} {"train_loss": -6.375219345092773, "global_step": 90151, "epoch": 2146} {"train_loss": -6.182519912719727, "global_step": 90152, "epoch": 2146} {"train_loss": -6.262842655181885, "global_step": 90153, "epoch": 2146} {"train_loss": -6.100705146789551, "global_step": 90154, "epoch": 2146} {"train_loss": -6.316309452056885, "global_step": 90155, "epoch": 2146} {"train_loss": -6.272455215454102, "global_step": 90156, "epoch": 2146} {"train_loss": -6.124600887298584, "global_step": 90157, "epoch": 2146} {"train_loss": -6.247611045837402, "global_step": 90158, "epoch": 2146} {"train_loss": -6.173914909362793, "global_step": 90159, "epoch": 2146} {"train_loss": -6.35734748840332, "global_step": 90160, "epoch": 2146} {"train_loss": -6.173501968383789, "global_step": 90161, "epoch": 2146} {"train_loss": -6.072627067565918, "global_step": 90162, "epoch": 2146} {"train_loss": -6.233024597167969, "global_step": 90163, "epoch": 2146} {"train_loss": -6.271553039550781, "global_step": 90164, "epoch": 2146} {"train_loss": -6.247866630554199, "global_step": 90165, "epoch": 2146} {"train_loss": -6.180185317993164, "global_step": 90166, "epoch": 2146} {"train_loss": -6.119169235229492, "global_step": 90167, "epoch": 2146} {"train_loss": -6.1867828369140625, "global_step": 90168, "epoch": 2146} {"train_loss": -6.234888076782227, "global_step": 90169, "epoch": 2146} {"train_loss": -6.287364959716797, "global_step": 90170, "epoch": 2146} {"train_loss": -6.2163825035095215, "global_step": 90171, "epoch": 2146} {"train_loss": -6.188614368438721, "global_step": 90172, "epoch": 2146} {"train_loss": -6.211284830456688, "global_step": 90173, "epoch": 2146, "val_loss": 67767.625} {"train_loss": -6.266593933105469, "global_step": 90174, "epoch": 2147} {"train_loss": -6.157649993896484, "global_step": 90175, "epoch": 2147} {"train_loss": -6.235223293304443, "global_step": 90176, "epoch": 2147} {"train_loss": -6.176277160644531, "global_step": 90177, "epoch": 2147} {"train_loss": -6.213472366333008, "global_step": 90178, "epoch": 2147} {"train_loss": -6.311464309692383, "global_step": 90179, "epoch": 2147} {"train_loss": -6.316995620727539, "global_step": 90180, "epoch": 2147} {"train_loss": -6.2812819480896, "global_step": 90181, "epoch": 2147} {"train_loss": -6.342427730560303, "global_step": 90182, "epoch": 2147} {"train_loss": -6.3707685470581055, "global_step": 90183, "epoch": 2147} {"train_loss": -6.2787251472473145, "global_step": 90184, "epoch": 2147} {"train_loss": -6.283359050750732, "global_step": 90185, "epoch": 2147} {"train_loss": -6.250045299530029, "global_step": 90186, "epoch": 2147} {"train_loss": -6.341870307922363, "global_step": 90187, "epoch": 2147} {"train_loss": -6.294031143188477, "global_step": 90188, "epoch": 2147} {"train_loss": -6.254663467407227, "global_step": 90189, "epoch": 2147} {"train_loss": -6.171977996826172, "global_step": 90190, "epoch": 2147} {"train_loss": -6.161615371704102, "global_step": 90191, "epoch": 2147} {"train_loss": -6.302689075469971, "global_step": 90192, "epoch": 2147} {"train_loss": -6.307592868804932, "global_step": 90193, "epoch": 2147} {"train_loss": -6.114204406738281, "global_step": 90194, "epoch": 2147} {"train_loss": -6.271027565002441, "global_step": 90195, "epoch": 2147} {"train_loss": -6.208035469055176, "global_step": 90196, "epoch": 2147} {"train_loss": -6.283285617828369, "global_step": 90197, "epoch": 2147} {"train_loss": -6.169151306152344, "global_step": 90198, "epoch": 2147} {"train_loss": -6.380414962768555, "global_step": 90199, "epoch": 2147} {"train_loss": -6.273425102233887, "global_step": 90200, "epoch": 2147} {"train_loss": -6.298007965087891, "global_step": 90201, "epoch": 2147} {"train_loss": -6.206228256225586, "global_step": 90202, "epoch": 2147} {"train_loss": -6.33858585357666, "global_step": 90203, "epoch": 2147} {"train_loss": -6.27536153793335, "global_step": 90204, "epoch": 2147} {"train_loss": -6.222557067871094, "global_step": 90205, "epoch": 2147} {"train_loss": -6.255859375, "global_step": 90206, "epoch": 2147} {"train_loss": -6.17728853225708, "global_step": 90207, "epoch": 2147} {"train_loss": -6.337533950805664, "global_step": 90208, "epoch": 2147} {"train_loss": -6.212154388427734, "global_step": 90209, "epoch": 2147} {"train_loss": -6.265107154846191, "global_step": 90210, "epoch": 2147} {"train_loss": -6.245813369750977, "global_step": 90211, "epoch": 2147} {"train_loss": -6.324089527130127, "global_step": 90212, "epoch": 2147} {"train_loss": -6.274099349975586, "global_step": 90213, "epoch": 2147} {"train_loss": -6.179450035095215, "global_step": 90214, "epoch": 2147} {"train_loss": -6.259682814280192, "global_step": 90215, "epoch": 2147, "val_loss": 67693.8515625} {"train_loss": -6.2693328857421875, "global_step": 90216, "epoch": 2148} {"train_loss": -6.220680236816406, "global_step": 90217, "epoch": 2148} {"train_loss": -6.221670150756836, "global_step": 90218, "epoch": 2148} {"train_loss": -6.287374496459961, "global_step": 90219, "epoch": 2148} {"train_loss": -6.239402770996094, "global_step": 90220, "epoch": 2148} {"train_loss": -6.266419410705566, "global_step": 90221, "epoch": 2148} {"train_loss": -6.296722888946533, "global_step": 90222, "epoch": 2148} {"train_loss": -6.212813377380371, "global_step": 90223, "epoch": 2148} {"train_loss": -6.196420669555664, "global_step": 90224, "epoch": 2148} {"train_loss": -6.199967384338379, "global_step": 90225, "epoch": 2148} {"train_loss": -6.282322883605957, "global_step": 90226, "epoch": 2148} {"train_loss": -6.175335884094238, "global_step": 90227, "epoch": 2148} {"train_loss": -6.181097507476807, "global_step": 90228, "epoch": 2148} {"train_loss": -6.07420539855957, "global_step": 90229, "epoch": 2148} {"train_loss": -6.272625923156738, "global_step": 90230, "epoch": 2148} {"train_loss": -6.126276969909668, "global_step": 90231, "epoch": 2148} {"train_loss": -6.235628128051758, "global_step": 90232, "epoch": 2148} {"train_loss": -6.2271246910095215, "global_step": 90233, "epoch": 2148} {"train_loss": -6.3274688720703125, "global_step": 90234, "epoch": 2148} {"train_loss": -6.256133079528809, "global_step": 90235, "epoch": 2148} {"train_loss": -6.288631439208984, "global_step": 90236, "epoch": 2148} {"train_loss": -6.142949104309082, "global_step": 90237, "epoch": 2148} {"train_loss": -6.188935279846191, "global_step": 90238, "epoch": 2148} {"train_loss": -6.128921031951904, "global_step": 90239, "epoch": 2148} {"train_loss": -6.166725158691406, "global_step": 90240, "epoch": 2148} {"train_loss": -6.19052267074585, "global_step": 90241, "epoch": 2148} {"train_loss": -6.181514263153076, "global_step": 90242, "epoch": 2148} {"train_loss": -6.210882663726807, "global_step": 90243, "epoch": 2148} {"train_loss": -6.188681602478027, "global_step": 90244, "epoch": 2148} {"train_loss": -6.21138858795166, "global_step": 90245, "epoch": 2148} {"train_loss": -6.3022356033325195, "global_step": 90246, "epoch": 2148} {"train_loss": -6.302737236022949, "global_step": 90247, "epoch": 2148} {"train_loss": -6.237187385559082, "global_step": 90248, "epoch": 2148} {"train_loss": -6.40609073638916, "global_step": 90249, "epoch": 2148} {"train_loss": -6.0607428550720215, "global_step": 90250, "epoch": 2148} {"train_loss": -6.18520975112915, "global_step": 90251, "epoch": 2148} {"train_loss": -6.2394537925720215, "global_step": 90252, "epoch": 2148} {"train_loss": -6.233992576599121, "global_step": 90253, "epoch": 2148} {"train_loss": -6.209595680236816, "global_step": 90254, "epoch": 2148} {"train_loss": -6.212086200714111, "global_step": 90255, "epoch": 2148} {"train_loss": -6.1666154861450195, "global_step": 90256, "epoch": 2148} {"train_loss": -6.219532262711298, "global_step": 90257, "epoch": 2148, "val_loss": 68043.734375} {"train_loss": -6.199821472167969, "global_step": 90258, "epoch": 2149} {"train_loss": -6.292283058166504, "global_step": 90259, "epoch": 2149} {"train_loss": -6.292204856872559, "global_step": 90260, "epoch": 2149} {"train_loss": -6.342461109161377, "global_step": 90261, "epoch": 2149} {"train_loss": -6.262820243835449, "global_step": 90262, "epoch": 2149} {"train_loss": -6.214478492736816, "global_step": 90263, "epoch": 2149} {"train_loss": -6.356833457946777, "global_step": 90264, "epoch": 2149} {"train_loss": -6.276311874389648, "global_step": 90265, "epoch": 2149} {"train_loss": -6.361269950866699, "global_step": 90266, "epoch": 2149} {"train_loss": -6.251889705657959, "global_step": 90267, "epoch": 2149} {"train_loss": -6.327819347381592, "global_step": 90268, "epoch": 2149} {"train_loss": -6.161252021789551, "global_step": 90269, "epoch": 2149} {"train_loss": -6.243467807769775, "global_step": 90270, "epoch": 2149} {"train_loss": -6.276223182678223, "global_step": 90271, "epoch": 2149} {"train_loss": -6.285658836364746, "global_step": 90272, "epoch": 2149} {"train_loss": -6.236815452575684, "global_step": 90273, "epoch": 2149} {"train_loss": -6.316771507263184, "global_step": 90274, "epoch": 2149} {"train_loss": -6.26608419418335, "global_step": 90275, "epoch": 2149} {"train_loss": -6.177474021911621, "global_step": 90276, "epoch": 2149} {"train_loss": -6.260931015014648, "global_step": 90277, "epoch": 2149} {"train_loss": -6.265859127044678, "global_step": 90278, "epoch": 2149} {"train_loss": -6.219658851623535, "global_step": 90279, "epoch": 2149} {"train_loss": -6.087791442871094, "global_step": 90280, "epoch": 2149} {"train_loss": -6.2309722900390625, "global_step": 90281, "epoch": 2149} {"train_loss": -6.374247074127197, "global_step": 90282, "epoch": 2149} {"train_loss": -6.193562984466553, "global_step": 90283, "epoch": 2149} {"train_loss": -6.236350059509277, "global_step": 90284, "epoch": 2149} {"train_loss": -6.241193771362305, "global_step": 90285, "epoch": 2149} {"train_loss": -6.155372619628906, "global_step": 90286, "epoch": 2149} {"train_loss": -6.279833793640137, "global_step": 90287, "epoch": 2149} {"train_loss": -6.202576637268066, "global_step": 90288, "epoch": 2149} {"train_loss": -6.241525650024414, "global_step": 90289, "epoch": 2149} {"train_loss": -6.254034042358398, "global_step": 90290, "epoch": 2149} {"train_loss": -6.216691970825195, "global_step": 90291, "epoch": 2149} {"train_loss": -6.210968494415283, "global_step": 90292, "epoch": 2149} {"train_loss": -6.294346332550049, "global_step": 90293, "epoch": 2149} {"train_loss": -6.19104528427124, "global_step": 90294, "epoch": 2149} {"train_loss": -6.212042808532715, "global_step": 90295, "epoch": 2149} {"train_loss": -6.243013381958008, "global_step": 90296, "epoch": 2149} {"train_loss": -6.162250518798828, "global_step": 90297, "epoch": 2149} {"train_loss": -6.299176216125488, "global_step": 90298, "epoch": 2149} {"train_loss": -6.246986922763643, "global_step": 90299, "epoch": 2149, "val_loss": 67904.9453125} {"train_loss": -6.225788593292236, "global_step": 90300, "epoch": 2150} {"train_loss": -6.47272253036499, "global_step": 90301, "epoch": 2150} {"train_loss": -6.360634803771973, "global_step": 90302, "epoch": 2150} {"train_loss": -6.108263969421387, "global_step": 90303, "epoch": 2150} {"train_loss": -6.175025463104248, "global_step": 90304, "epoch": 2150} {"train_loss": -6.1477789878845215, "global_step": 90305, "epoch": 2150} {"train_loss": -6.259459495544434, "global_step": 90306, "epoch": 2150} {"train_loss": -6.192400932312012, "global_step": 90307, "epoch": 2150} {"train_loss": -6.248438835144043, "global_step": 90308, "epoch": 2150} {"train_loss": -6.233259677886963, "global_step": 90309, "epoch": 2150} {"train_loss": -6.261728763580322, "global_step": 90310, "epoch": 2150} {"train_loss": -6.2366814613342285, "global_step": 90311, "epoch": 2150} {"train_loss": -6.408476829528809, "global_step": 90312, "epoch": 2150} {"train_loss": -6.23663330078125, "global_step": 90313, "epoch": 2150} {"train_loss": -6.237088203430176, "global_step": 90314, "epoch": 2150} {"train_loss": -6.287312030792236, "global_step": 90315, "epoch": 2150} {"train_loss": -6.2204999923706055, "global_step": 90316, "epoch": 2150} {"train_loss": -6.207528114318848, "global_step": 90317, "epoch": 2150} {"train_loss": -6.240265846252441, "global_step": 90318, "epoch": 2150} {"train_loss": -6.173271179199219, "global_step": 90319, "epoch": 2150} {"train_loss": -6.286591529846191, "global_step": 90320, "epoch": 2150} {"train_loss": -6.281822204589844, "global_step": 90321, "epoch": 2150} {"train_loss": -6.264094829559326, "global_step": 90322, "epoch": 2150} {"train_loss": -6.301115036010742, "global_step": 90323, "epoch": 2150} {"train_loss": -6.275606155395508, "global_step": 90324, "epoch": 2150} {"train_loss": -6.294886589050293, "global_step": 90325, "epoch": 2150} {"train_loss": -6.20065975189209, "global_step": 90326, "epoch": 2150} {"train_loss": -6.152521133422852, "global_step": 90327, "epoch": 2150} {"train_loss": -6.1487016677856445, "global_step": 90328, "epoch": 2150} {"train_loss": -6.17640495300293, "global_step": 90329, "epoch": 2150} {"train_loss": -6.053147792816162, "global_step": 90330, "epoch": 2150} {"train_loss": -6.172417640686035, "global_step": 90331, "epoch": 2150} {"train_loss": -6.32737398147583, "global_step": 90332, "epoch": 2150} {"train_loss": -6.302194595336914, "global_step": 90333, "epoch": 2150} {"train_loss": -6.379717826843262, "global_step": 90334, "epoch": 2150} {"train_loss": -6.171481609344482, "global_step": 90335, "epoch": 2150} {"train_loss": -6.202178955078125, "global_step": 90336, "epoch": 2150} {"train_loss": -6.236660003662109, "global_step": 90337, "epoch": 2150} {"train_loss": -6.139871597290039, "global_step": 90338, "epoch": 2150} {"train_loss": -6.170283317565918, "global_step": 90339, "epoch": 2150} {"train_loss": -6.0524373054504395, "global_step": 90340, "epoch": 2150} {"train_loss": -6.228596460251581, "global_step": 90341, "epoch": 2150, "train/sim_max_reward_0": 0.22050295048557025, "train/sim_max_reward_1": 0.9666151706685664, "train/sim_max_reward_2": 0.3967745812227113, "train/sim_max_reward_3": 0.11783378283185623, "train/sim_max_reward_4": 0.8593309842955204, "train/sim_max_reward_5": 0.8365417463615038, "test/sim_max_reward_4400000": 0.19177219201119577, "test/sim_max_reward_4400001": 0.43752437610689504, "test/sim_max_reward_4400002": 0.8101229167325891, "test/sim_max_reward_4400003": 0.04547288973787058, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9653738470023524, "test/sim_max_reward_4400007": 0.8097036989571194, "test/sim_max_reward_4400008": 0.3033748795704623, "test/sim_max_reward_4400009": 0.8512372650145482, "test/sim_max_reward_4400010": 0.9862110480492828, "test/sim_max_reward_4400011": 0.8812165202603032, "test/sim_max_reward_4400012": 0.38633842316197636, "test/sim_max_reward_4400013": 0.7406296842914356, "test/sim_max_reward_4400014": 0.1519378958225628, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.21859903301129285, "test/sim_max_reward_4400019": 0.19464191845902648, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9259297863296084, "test/sim_max_reward_4400022": 0.8646801840753809, "test/sim_max_reward_4400023": 0.16753608611635987, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.26039445976180703, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.019277721893882334, "test/sim_max_reward_4400028": 0.610008577596602, "test/sim_max_reward_4400029": 0.999270745595576, "test/sim_max_reward_4400030": 0.9151530703289806, "test/sim_max_reward_4400031": 0.923366558466945, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.19749637216232943, "test/sim_max_reward_4400034": 0.7413543108992097, "test/sim_max_reward_4400035": 0.4304358520383017, "test/sim_max_reward_4400036": 0.41826325268609593, "test/sim_max_reward_4400037": 0.8404961481404488, "test/sim_max_reward_4400038": 0.9397833275919987, "test/sim_max_reward_4400039": 0.9922080861182385, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6400665428789309, "test/sim_max_reward_4400042": 0.8134447840206268, "test/sim_max_reward_4400043": 0.8695550518874536, "test/sim_max_reward_4400044": 0.8838067183028884, "test/sim_max_reward_4400045": 0.4627419176433877, "test/sim_max_reward_4400046": 0.7344357480921855, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.7751278973371073, "test/sim_max_reward_4400049": 0.8061649859269245, "train/mean_score": 0.5662665359776214, "test/mean_score": 0.5094963900345667, "val_loss": 68009.3203125} {"train_loss": -6.1827073097229, "global_step": 90342, "epoch": 2151} {"train_loss": -6.054754734039307, "global_step": 90343, "epoch": 2151} {"train_loss": -6.270236015319824, "global_step": 90344, "epoch": 2151} {"train_loss": -6.236114501953125, "global_step": 90345, "epoch": 2151} {"train_loss": -6.223729133605957, "global_step": 90346, "epoch": 2151} {"train_loss": -6.243300437927246, "global_step": 90347, "epoch": 2151} {"train_loss": -6.121716499328613, "global_step": 90348, "epoch": 2151} {"train_loss": -6.282019138336182, "global_step": 90349, "epoch": 2151} {"train_loss": -6.178753852844238, "global_step": 90350, "epoch": 2151} {"train_loss": -6.15301513671875, "global_step": 90351, "epoch": 2151} {"train_loss": -6.16282320022583, "global_step": 90352, "epoch": 2151} {"train_loss": -6.279440879821777, "global_step": 90353, "epoch": 2151} {"train_loss": -6.243413925170898, "global_step": 90354, "epoch": 2151} {"train_loss": -6.322076797485352, "global_step": 90355, "epoch": 2151} {"train_loss": -6.285381317138672, "global_step": 90356, "epoch": 2151} {"train_loss": -6.29121208190918, "global_step": 90357, "epoch": 2151} {"train_loss": -6.253476619720459, "global_step": 90358, "epoch": 2151} {"train_loss": -6.285660743713379, "global_step": 90359, "epoch": 2151} {"train_loss": -6.278310298919678, "global_step": 90360, "epoch": 2151} {"train_loss": -6.231630325317383, "global_step": 90361, "epoch": 2151} {"train_loss": -6.186692714691162, "global_step": 90362, "epoch": 2151} {"train_loss": -6.124406814575195, "global_step": 90363, "epoch": 2151} {"train_loss": -6.222334384918213, "global_step": 90364, "epoch": 2151} {"train_loss": -6.2776689529418945, "global_step": 90365, "epoch": 2151} {"train_loss": -6.203384876251221, "global_step": 90366, "epoch": 2151} {"train_loss": -6.243980407714844, "global_step": 90367, "epoch": 2151} {"train_loss": -6.253982067108154, "global_step": 90368, "epoch": 2151} {"train_loss": -6.137803077697754, "global_step": 90369, "epoch": 2151} {"train_loss": -6.31545352935791, "global_step": 90370, "epoch": 2151} {"train_loss": -6.235306739807129, "global_step": 90371, "epoch": 2151} {"train_loss": -6.154330253601074, "global_step": 90372, "epoch": 2151} {"train_loss": -6.225281715393066, "global_step": 90373, "epoch": 2151} {"train_loss": -6.289562225341797, "global_step": 90374, "epoch": 2151} {"train_loss": -6.244581699371338, "global_step": 90375, "epoch": 2151} {"train_loss": -6.115685939788818, "global_step": 90376, "epoch": 2151} {"train_loss": -6.356663703918457, "global_step": 90377, "epoch": 2151} {"train_loss": -6.2217254638671875, "global_step": 90378, "epoch": 2151} {"train_loss": -6.217711448669434, "global_step": 90379, "epoch": 2151} {"train_loss": -6.2130231857299805, "global_step": 90380, "epoch": 2151} {"train_loss": -6.121200084686279, "global_step": 90381, "epoch": 2151} {"train_loss": -6.241281032562256, "global_step": 90382, "epoch": 2151} {"train_loss": -6.223893188294911, "global_step": 90383, "epoch": 2151, "val_loss": 67910.734375} {"train_loss": -6.2191877365112305, "global_step": 90384, "epoch": 2152} {"train_loss": -6.369881629943848, "global_step": 90385, "epoch": 2152} {"train_loss": -6.196530818939209, "global_step": 90386, "epoch": 2152} {"train_loss": -6.201108932495117, "global_step": 90387, "epoch": 2152} {"train_loss": -6.323225021362305, "global_step": 90388, "epoch": 2152} {"train_loss": -6.221219062805176, "global_step": 90389, "epoch": 2152} {"train_loss": -6.294304847717285, "global_step": 90390, "epoch": 2152} {"train_loss": -6.288698196411133, "global_step": 90391, "epoch": 2152} {"train_loss": -6.258428573608398, "global_step": 90392, "epoch": 2152} {"train_loss": -6.301571846008301, "global_step": 90393, "epoch": 2152} {"train_loss": -6.357627868652344, "global_step": 90394, "epoch": 2152} {"train_loss": -6.229282855987549, "global_step": 90395, "epoch": 2152} {"train_loss": -6.210107803344727, "global_step": 90396, "epoch": 2152} {"train_loss": -6.267054557800293, "global_step": 90397, "epoch": 2152} {"train_loss": -6.216318607330322, "global_step": 90398, "epoch": 2152} {"train_loss": -6.306230068206787, "global_step": 90399, "epoch": 2152} {"train_loss": -6.138742446899414, "global_step": 90400, "epoch": 2152} {"train_loss": -6.219564437866211, "global_step": 90401, "epoch": 2152} {"train_loss": -6.301135063171387, "global_step": 90402, "epoch": 2152} {"train_loss": -6.21627140045166, "global_step": 90403, "epoch": 2152} {"train_loss": -6.356444835662842, "global_step": 90404, "epoch": 2152} {"train_loss": -6.221574783325195, "global_step": 90405, "epoch": 2152} {"train_loss": -6.106398105621338, "global_step": 90406, "epoch": 2152} {"train_loss": -6.27552604675293, "global_step": 90407, "epoch": 2152} {"train_loss": -6.217677593231201, "global_step": 90408, "epoch": 2152} {"train_loss": -6.171810626983643, "global_step": 90409, "epoch": 2152} {"train_loss": -6.186100959777832, "global_step": 90410, "epoch": 2152} {"train_loss": -6.1658830642700195, "global_step": 90411, "epoch": 2152} {"train_loss": -6.338227272033691, "global_step": 90412, "epoch": 2152} {"train_loss": -6.099156379699707, "global_step": 90413, "epoch": 2152} {"train_loss": -6.345579624176025, "global_step": 90414, "epoch": 2152} {"train_loss": -6.2336506843566895, "global_step": 90415, "epoch": 2152} {"train_loss": -6.206062316894531, "global_step": 90416, "epoch": 2152} {"train_loss": -6.3148956298828125, "global_step": 90417, "epoch": 2152} {"train_loss": -6.372857093811035, "global_step": 90418, "epoch": 2152} {"train_loss": -6.245126724243164, "global_step": 90419, "epoch": 2152} {"train_loss": -6.23568058013916, "global_step": 90420, "epoch": 2152} {"train_loss": -6.260476112365723, "global_step": 90421, "epoch": 2152} {"train_loss": -6.110213279724121, "global_step": 90422, "epoch": 2152} {"train_loss": -6.277325630187988, "global_step": 90423, "epoch": 2152} {"train_loss": -6.118804931640625, "global_step": 90424, "epoch": 2152} {"train_loss": -6.245276485170637, "global_step": 90425, "epoch": 2152, "val_loss": 67642.8515625} {"train_loss": -6.276484489440918, "global_step": 90426, "epoch": 2153} {"train_loss": -6.189977645874023, "global_step": 90427, "epoch": 2153} {"train_loss": -6.236876487731934, "global_step": 90428, "epoch": 2153} {"train_loss": -6.145412445068359, "global_step": 90429, "epoch": 2153} {"train_loss": -6.1828203201293945, "global_step": 90430, "epoch": 2153} {"train_loss": -6.086730003356934, "global_step": 90431, "epoch": 2153} {"train_loss": -6.226478099822998, "global_step": 90432, "epoch": 2153} {"train_loss": -6.260729789733887, "global_step": 90433, "epoch": 2153} {"train_loss": -6.131259441375732, "global_step": 90434, "epoch": 2153} {"train_loss": -6.138838768005371, "global_step": 90435, "epoch": 2153} {"train_loss": -6.177534580230713, "global_step": 90436, "epoch": 2153} {"train_loss": -6.0985589027404785, "global_step": 90437, "epoch": 2153} {"train_loss": -6.341774940490723, "global_step": 90438, "epoch": 2153} {"train_loss": -6.239785194396973, "global_step": 90439, "epoch": 2153} {"train_loss": -6.022615909576416, "global_step": 90440, "epoch": 2153} {"train_loss": -6.191904544830322, "global_step": 90441, "epoch": 2153} {"train_loss": -6.0684404373168945, "global_step": 90442, "epoch": 2153} {"train_loss": -5.989495754241943, "global_step": 90443, "epoch": 2153} {"train_loss": -6.164436340332031, "global_step": 90444, "epoch": 2153} {"train_loss": -5.956659317016602, "global_step": 90445, "epoch": 2153} {"train_loss": -6.1324849128723145, "global_step": 90446, "epoch": 2153} {"train_loss": -5.91797399520874, "global_step": 90447, "epoch": 2153} {"train_loss": -6.219285011291504, "global_step": 90448, "epoch": 2153} {"train_loss": -5.995487213134766, "global_step": 90449, "epoch": 2153} {"train_loss": -6.139167308807373, "global_step": 90450, "epoch": 2153} {"train_loss": -6.121221542358398, "global_step": 90451, "epoch": 2153} {"train_loss": -6.0592875480651855, "global_step": 90452, "epoch": 2153} {"train_loss": -6.247694969177246, "global_step": 90453, "epoch": 2153} {"train_loss": -6.088449001312256, "global_step": 90454, "epoch": 2153} {"train_loss": -6.286664009094238, "global_step": 90455, "epoch": 2153} {"train_loss": -5.971496105194092, "global_step": 90456, "epoch": 2153} {"train_loss": -6.163443088531494, "global_step": 90457, "epoch": 2153} {"train_loss": -6.167945384979248, "global_step": 90458, "epoch": 2153} {"train_loss": -6.3459062576293945, "global_step": 90459, "epoch": 2153} {"train_loss": -6.173702239990234, "global_step": 90460, "epoch": 2153} {"train_loss": -6.245846748352051, "global_step": 90461, "epoch": 2153} {"train_loss": -6.189102649688721, "global_step": 90462, "epoch": 2153} {"train_loss": -6.307218074798584, "global_step": 90463, "epoch": 2153} {"train_loss": -6.206676959991455, "global_step": 90464, "epoch": 2153} {"train_loss": -6.295395851135254, "global_step": 90465, "epoch": 2153} {"train_loss": -6.276854515075684, "global_step": 90466, "epoch": 2153} {"train_loss": -6.163676647912888, "global_step": 90467, "epoch": 2153, "val_loss": 67799.171875} {"train_loss": -6.255824089050293, "global_step": 90468, "epoch": 2154} {"train_loss": -6.2221832275390625, "global_step": 90469, "epoch": 2154} {"train_loss": -6.181885719299316, "global_step": 90470, "epoch": 2154} {"train_loss": -6.244104385375977, "global_step": 90471, "epoch": 2154} {"train_loss": -6.222867965698242, "global_step": 90472, "epoch": 2154} {"train_loss": -6.194672584533691, "global_step": 90473, "epoch": 2154} {"train_loss": -6.306876182556152, "global_step": 90474, "epoch": 2154} {"train_loss": -6.254306316375732, "global_step": 90475, "epoch": 2154} {"train_loss": -6.199912071228027, "global_step": 90476, "epoch": 2154} {"train_loss": -6.338869094848633, "global_step": 90477, "epoch": 2154} {"train_loss": -6.280829429626465, "global_step": 90478, "epoch": 2154} {"train_loss": -6.280849456787109, "global_step": 90479, "epoch": 2154} {"train_loss": -6.278138160705566, "global_step": 90480, "epoch": 2154} {"train_loss": -6.292947769165039, "global_step": 90481, "epoch": 2154} {"train_loss": -6.309499263763428, "global_step": 90482, "epoch": 2154} {"train_loss": -6.239532470703125, "global_step": 90483, "epoch": 2154} {"train_loss": -6.125967979431152, "global_step": 90484, "epoch": 2154} {"train_loss": -6.256713390350342, "global_step": 90485, "epoch": 2154} {"train_loss": -6.286288261413574, "global_step": 90486, "epoch": 2154} {"train_loss": -6.220596790313721, "global_step": 90487, "epoch": 2154} {"train_loss": -6.288243770599365, "global_step": 90488, "epoch": 2154} {"train_loss": -6.3170576095581055, "global_step": 90489, "epoch": 2154} {"train_loss": -6.211359024047852, "global_step": 90490, "epoch": 2154} {"train_loss": -6.188372611999512, "global_step": 90491, "epoch": 2154} {"train_loss": -6.237710952758789, "global_step": 90492, "epoch": 2154} {"train_loss": -6.24455451965332, "global_step": 90493, "epoch": 2154} {"train_loss": -6.2407121658325195, "global_step": 90494, "epoch": 2154} {"train_loss": -6.2754669189453125, "global_step": 90495, "epoch": 2154} {"train_loss": -6.184910774230957, "global_step": 90496, "epoch": 2154} {"train_loss": -6.251563549041748, "global_step": 90497, "epoch": 2154} {"train_loss": -6.183584213256836, "global_step": 90498, "epoch": 2154} {"train_loss": -6.292272090911865, "global_step": 90499, "epoch": 2154} {"train_loss": -6.209173202514648, "global_step": 90500, "epoch": 2154} {"train_loss": -6.298900127410889, "global_step": 90501, "epoch": 2154} {"train_loss": -6.22944450378418, "global_step": 90502, "epoch": 2154} {"train_loss": -6.2565107345581055, "global_step": 90503, "epoch": 2154} {"train_loss": -6.353385925292969, "global_step": 90504, "epoch": 2154} {"train_loss": -6.2445068359375, "global_step": 90505, "epoch": 2154} {"train_loss": -6.230386257171631, "global_step": 90506, "epoch": 2154} {"train_loss": -6.222105026245117, "global_step": 90507, "epoch": 2154} {"train_loss": -6.217024803161621, "global_step": 90508, "epoch": 2154} {"train_loss": -6.246474822362264, "global_step": 90509, "epoch": 2154, "val_loss": 67729.4609375} {"train_loss": -6.3076958656311035, "global_step": 90510, "epoch": 2155} {"train_loss": -6.305297374725342, "global_step": 90511, "epoch": 2155} {"train_loss": -6.184794902801514, "global_step": 90512, "epoch": 2155} {"train_loss": -6.254365921020508, "global_step": 90513, "epoch": 2155} {"train_loss": -6.240578651428223, "global_step": 90514, "epoch": 2155} {"train_loss": -6.198467254638672, "global_step": 90515, "epoch": 2155} {"train_loss": -6.338944435119629, "global_step": 90516, "epoch": 2155} {"train_loss": -6.199801445007324, "global_step": 90517, "epoch": 2155} {"train_loss": -6.207858085632324, "global_step": 90518, "epoch": 2155} {"train_loss": -6.348132133483887, "global_step": 90519, "epoch": 2155} {"train_loss": -6.134760856628418, "global_step": 90520, "epoch": 2155} {"train_loss": -6.282752990722656, "global_step": 90521, "epoch": 2155} {"train_loss": -6.275032043457031, "global_step": 90522, "epoch": 2155} {"train_loss": -6.335226058959961, "global_step": 90523, "epoch": 2155} {"train_loss": -6.226646423339844, "global_step": 90524, "epoch": 2155} {"train_loss": -6.296896934509277, "global_step": 90525, "epoch": 2155} {"train_loss": -6.226836204528809, "global_step": 90526, "epoch": 2155} {"train_loss": -6.185051441192627, "global_step": 90527, "epoch": 2155} {"train_loss": -6.299498081207275, "global_step": 90528, "epoch": 2155} {"train_loss": -6.157167434692383, "global_step": 90529, "epoch": 2155} {"train_loss": -6.196486949920654, "global_step": 90530, "epoch": 2155} {"train_loss": -6.268096923828125, "global_step": 90531, "epoch": 2155} {"train_loss": -6.256673812866211, "global_step": 90532, "epoch": 2155} {"train_loss": -6.284214019775391, "global_step": 90533, "epoch": 2155} {"train_loss": -6.159570217132568, "global_step": 90534, "epoch": 2155} {"train_loss": -6.211006164550781, "global_step": 90535, "epoch": 2155} {"train_loss": -6.238397121429443, "global_step": 90536, "epoch": 2155} {"train_loss": -6.224049091339111, "global_step": 90537, "epoch": 2155} {"train_loss": -6.354331016540527, "global_step": 90538, "epoch": 2155} {"train_loss": -6.331418991088867, "global_step": 90539, "epoch": 2155} {"train_loss": -6.3200178146362305, "global_step": 90540, "epoch": 2155} {"train_loss": -6.233737468719482, "global_step": 90541, "epoch": 2155} {"train_loss": -6.219456195831299, "global_step": 90542, "epoch": 2155} {"train_loss": -6.306535720825195, "global_step": 90543, "epoch": 2155} {"train_loss": -6.261336326599121, "global_step": 90544, "epoch": 2155} {"train_loss": -6.294525146484375, "global_step": 90545, "epoch": 2155} {"train_loss": -6.22735595703125, "global_step": 90546, "epoch": 2155} {"train_loss": -6.300044059753418, "global_step": 90547, "epoch": 2155} {"train_loss": -6.268192291259766, "global_step": 90548, "epoch": 2155} {"train_loss": -6.309815406799316, "global_step": 90549, "epoch": 2155} {"train_loss": -6.317381858825684, "global_step": 90550, "epoch": 2155} {"train_loss": -6.2589039007822675, "global_step": 90551, "epoch": 2155, "val_loss": 67918.2265625} {"train_loss": -6.269957542419434, "global_step": 90552, "epoch": 2156} {"train_loss": -6.406379222869873, "global_step": 90553, "epoch": 2156} {"train_loss": -6.404869079589844, "global_step": 90554, "epoch": 2156} {"train_loss": -6.230640411376953, "global_step": 90555, "epoch": 2156} {"train_loss": -6.284243106842041, "global_step": 90556, "epoch": 2156} {"train_loss": -6.214058876037598, "global_step": 90557, "epoch": 2156} {"train_loss": -6.181412220001221, "global_step": 90558, "epoch": 2156} {"train_loss": -6.278349876403809, "global_step": 90559, "epoch": 2156} {"train_loss": -6.383179664611816, "global_step": 90560, "epoch": 2156} {"train_loss": -6.229243755340576, "global_step": 90561, "epoch": 2156} {"train_loss": -6.279855728149414, "global_step": 90562, "epoch": 2156} {"train_loss": -6.2672271728515625, "global_step": 90563, "epoch": 2156} {"train_loss": -6.303558826446533, "global_step": 90564, "epoch": 2156} {"train_loss": -6.19803524017334, "global_step": 90565, "epoch": 2156} {"train_loss": -6.31101131439209, "global_step": 90566, "epoch": 2156} {"train_loss": -6.344779014587402, "global_step": 90567, "epoch": 2156} {"train_loss": -6.3327317237854, "global_step": 90568, "epoch": 2156} {"train_loss": -6.240348815917969, "global_step": 90569, "epoch": 2156} {"train_loss": -6.262087345123291, "global_step": 90570, "epoch": 2156} {"train_loss": -6.236264705657959, "global_step": 90571, "epoch": 2156} {"train_loss": -6.290752410888672, "global_step": 90572, "epoch": 2156} {"train_loss": -6.361673831939697, "global_step": 90573, "epoch": 2156} {"train_loss": -6.3090362548828125, "global_step": 90574, "epoch": 2156} {"train_loss": -6.289666175842285, "global_step": 90575, "epoch": 2156} {"train_loss": -6.214275360107422, "global_step": 90576, "epoch": 2156} {"train_loss": -6.296072483062744, "global_step": 90577, "epoch": 2156} {"train_loss": -6.283974647521973, "global_step": 90578, "epoch": 2156} {"train_loss": -6.302121162414551, "global_step": 90579, "epoch": 2156} {"train_loss": -6.300728797912598, "global_step": 90580, "epoch": 2156} {"train_loss": -6.183856010437012, "global_step": 90581, "epoch": 2156} {"train_loss": -6.295620918273926, "global_step": 90582, "epoch": 2156} {"train_loss": -6.285472869873047, "global_step": 90583, "epoch": 2156} {"train_loss": -6.247452735900879, "global_step": 90584, "epoch": 2156} {"train_loss": -6.211747169494629, "global_step": 90585, "epoch": 2156} {"train_loss": -6.28813362121582, "global_step": 90586, "epoch": 2156} {"train_loss": -6.118433952331543, "global_step": 90587, "epoch": 2156} {"train_loss": -6.264066696166992, "global_step": 90588, "epoch": 2156} {"train_loss": -6.222018241882324, "global_step": 90589, "epoch": 2156} {"train_loss": -6.270013809204102, "global_step": 90590, "epoch": 2156} {"train_loss": -6.379024028778076, "global_step": 90591, "epoch": 2156} {"train_loss": -6.33272647857666, "global_step": 90592, "epoch": 2156} {"train_loss": -6.278235583078294, "global_step": 90593, "epoch": 2156, "val_loss": 67712.6640625} {"train_loss": -6.228800296783447, "global_step": 90594, "epoch": 2157} {"train_loss": -6.2983293533325195, "global_step": 90595, "epoch": 2157} {"train_loss": -6.297482967376709, "global_step": 90596, "epoch": 2157} {"train_loss": -6.268086910247803, "global_step": 90597, "epoch": 2157} {"train_loss": -6.319760799407959, "global_step": 90598, "epoch": 2157} {"train_loss": -6.220566749572754, "global_step": 90599, "epoch": 2157} {"train_loss": -6.358548164367676, "global_step": 90600, "epoch": 2157} {"train_loss": -6.212737083435059, "global_step": 90601, "epoch": 2157} {"train_loss": -6.291830062866211, "global_step": 90602, "epoch": 2157} {"train_loss": -6.287463188171387, "global_step": 90603, "epoch": 2157} {"train_loss": -6.249997615814209, "global_step": 90604, "epoch": 2157} {"train_loss": -6.209244728088379, "global_step": 90605, "epoch": 2157} {"train_loss": -6.358689308166504, "global_step": 90606, "epoch": 2157} {"train_loss": -6.218901634216309, "global_step": 90607, "epoch": 2157} {"train_loss": -6.256433963775635, "global_step": 90608, "epoch": 2157} {"train_loss": -6.339364051818848, "global_step": 90609, "epoch": 2157} {"train_loss": -6.2946319580078125, "global_step": 90610, "epoch": 2157} {"train_loss": -6.254899978637695, "global_step": 90611, "epoch": 2157} {"train_loss": -6.307154178619385, "global_step": 90612, "epoch": 2157} {"train_loss": -6.206149578094482, "global_step": 90613, "epoch": 2157} {"train_loss": -6.2808427810668945, "global_step": 90614, "epoch": 2157} {"train_loss": -6.108732223510742, "global_step": 90615, "epoch": 2157} {"train_loss": -6.126049041748047, "global_step": 90616, "epoch": 2157} {"train_loss": -6.18489933013916, "global_step": 90617, "epoch": 2157} {"train_loss": -6.200423717498779, "global_step": 90618, "epoch": 2157} {"train_loss": -6.144488334655762, "global_step": 90619, "epoch": 2157} {"train_loss": -6.179835319519043, "global_step": 90620, "epoch": 2157} {"train_loss": -6.177833557128906, "global_step": 90621, "epoch": 2157} {"train_loss": -6.175493240356445, "global_step": 90622, "epoch": 2157} {"train_loss": -6.298223495483398, "global_step": 90623, "epoch": 2157} {"train_loss": -6.309450626373291, "global_step": 90624, "epoch": 2157} {"train_loss": -6.205727577209473, "global_step": 90625, "epoch": 2157} {"train_loss": -6.098579406738281, "global_step": 90626, "epoch": 2157} {"train_loss": -6.185286521911621, "global_step": 90627, "epoch": 2157} {"train_loss": -6.195135593414307, "global_step": 90628, "epoch": 2157} {"train_loss": -6.303957939147949, "global_step": 90629, "epoch": 2157} {"train_loss": -6.241872787475586, "global_step": 90630, "epoch": 2157} {"train_loss": -6.058164596557617, "global_step": 90631, "epoch": 2157} {"train_loss": -6.189852714538574, "global_step": 90632, "epoch": 2157} {"train_loss": -6.248295783996582, "global_step": 90633, "epoch": 2157} {"train_loss": -6.134636878967285, "global_step": 90634, "epoch": 2157} {"train_loss": -6.23494967960176, "global_step": 90635, "epoch": 2157, "val_loss": 67958.6953125} {"train_loss": -6.161698341369629, "global_step": 90636, "epoch": 2158} {"train_loss": -6.371552467346191, "global_step": 90637, "epoch": 2158} {"train_loss": -6.147058963775635, "global_step": 90638, "epoch": 2158} {"train_loss": -6.244624137878418, "global_step": 90639, "epoch": 2158} {"train_loss": -6.1876220703125, "global_step": 90640, "epoch": 2158} {"train_loss": -6.240802764892578, "global_step": 90641, "epoch": 2158} {"train_loss": -6.311967372894287, "global_step": 90642, "epoch": 2158} {"train_loss": -6.22023344039917, "global_step": 90643, "epoch": 2158} {"train_loss": -6.225604057312012, "global_step": 90644, "epoch": 2158} {"train_loss": -6.225716590881348, "global_step": 90645, "epoch": 2158} {"train_loss": -6.188261985778809, "global_step": 90646, "epoch": 2158} {"train_loss": -6.089707374572754, "global_step": 90647, "epoch": 2158} {"train_loss": -6.134847164154053, "global_step": 90648, "epoch": 2158} {"train_loss": -6.282987594604492, "global_step": 90649, "epoch": 2158} {"train_loss": -6.182606220245361, "global_step": 90650, "epoch": 2158} {"train_loss": -6.148513317108154, "global_step": 90651, "epoch": 2158} {"train_loss": -6.298306465148926, "global_step": 90652, "epoch": 2158} {"train_loss": -6.156494140625, "global_step": 90653, "epoch": 2158} {"train_loss": -6.245963096618652, "global_step": 90654, "epoch": 2158} {"train_loss": -6.316318035125732, "global_step": 90655, "epoch": 2158} {"train_loss": -6.144937515258789, "global_step": 90656, "epoch": 2158} {"train_loss": -6.0795698165893555, "global_step": 90657, "epoch": 2158} {"train_loss": -6.139956474304199, "global_step": 90658, "epoch": 2158} {"train_loss": -6.1413984298706055, "global_step": 90659, "epoch": 2158} {"train_loss": -6.314392566680908, "global_step": 90660, "epoch": 2158} {"train_loss": -6.247366905212402, "global_step": 90661, "epoch": 2158} {"train_loss": -6.314579010009766, "global_step": 90662, "epoch": 2158} {"train_loss": -6.170570373535156, "global_step": 90663, "epoch": 2158} {"train_loss": -6.171321868896484, "global_step": 90664, "epoch": 2158} {"train_loss": -6.264157772064209, "global_step": 90665, "epoch": 2158} {"train_loss": -6.311359405517578, "global_step": 90666, "epoch": 2158} {"train_loss": -6.157067775726318, "global_step": 90667, "epoch": 2158} {"train_loss": -6.21217155456543, "global_step": 90668, "epoch": 2158} {"train_loss": -6.240572929382324, "global_step": 90669, "epoch": 2158} {"train_loss": -6.238258361816406, "global_step": 90670, "epoch": 2158} {"train_loss": -6.315637588500977, "global_step": 90671, "epoch": 2158} {"train_loss": -6.129874229431152, "global_step": 90672, "epoch": 2158} {"train_loss": -6.17799186706543, "global_step": 90673, "epoch": 2158} {"train_loss": -6.266695022583008, "global_step": 90674, "epoch": 2158} {"train_loss": -6.09044075012207, "global_step": 90675, "epoch": 2158} {"train_loss": -6.24748420715332, "global_step": 90676, "epoch": 2158} {"train_loss": -6.213786272775559, "global_step": 90677, "epoch": 2158, "val_loss": 68090.9609375} {"train_loss": -6.245525360107422, "global_step": 90678, "epoch": 2159} {"train_loss": -6.084844589233398, "global_step": 90679, "epoch": 2159} {"train_loss": -6.254314422607422, "global_step": 90680, "epoch": 2159} {"train_loss": -6.15242862701416, "global_step": 90681, "epoch": 2159} {"train_loss": -6.263965606689453, "global_step": 90682, "epoch": 2159} {"train_loss": -6.251845359802246, "global_step": 90683, "epoch": 2159} {"train_loss": -6.289157390594482, "global_step": 90684, "epoch": 2159} {"train_loss": -6.127057075500488, "global_step": 90685, "epoch": 2159} {"train_loss": -6.1605048179626465, "global_step": 90686, "epoch": 2159} {"train_loss": -6.25156831741333, "global_step": 90687, "epoch": 2159} {"train_loss": -6.106064796447754, "global_step": 90688, "epoch": 2159} {"train_loss": -6.273491859436035, "global_step": 90689, "epoch": 2159} {"train_loss": -6.178370475769043, "global_step": 90690, "epoch": 2159} {"train_loss": -6.228188514709473, "global_step": 90691, "epoch": 2159} {"train_loss": -6.327943325042725, "global_step": 90692, "epoch": 2159} {"train_loss": -6.146279811859131, "global_step": 90693, "epoch": 2159} {"train_loss": -6.219212532043457, "global_step": 90694, "epoch": 2159} {"train_loss": -6.050251007080078, "global_step": 90695, "epoch": 2159} {"train_loss": -6.1467742919921875, "global_step": 90696, "epoch": 2159} {"train_loss": -6.2688374519348145, "global_step": 90697, "epoch": 2159} {"train_loss": -6.093267440795898, "global_step": 90698, "epoch": 2159} {"train_loss": -6.155149459838867, "global_step": 90699, "epoch": 2159} {"train_loss": -6.227739334106445, "global_step": 90700, "epoch": 2159} {"train_loss": -6.232321739196777, "global_step": 90701, "epoch": 2159} {"train_loss": -6.179450035095215, "global_step": 90702, "epoch": 2159} {"train_loss": -6.219451904296875, "global_step": 90703, "epoch": 2159} {"train_loss": -6.279937744140625, "global_step": 90704, "epoch": 2159} {"train_loss": -6.34365701675415, "global_step": 90705, "epoch": 2159} {"train_loss": -6.212754249572754, "global_step": 90706, "epoch": 2159} {"train_loss": -6.1569342613220215, "global_step": 90707, "epoch": 2159} {"train_loss": -6.19720458984375, "global_step": 90708, "epoch": 2159} {"train_loss": -6.166701793670654, "global_step": 90709, "epoch": 2159} {"train_loss": -6.2017083168029785, "global_step": 90710, "epoch": 2159} {"train_loss": -6.163875579833984, "global_step": 90711, "epoch": 2159} {"train_loss": -6.258871555328369, "global_step": 90712, "epoch": 2159} {"train_loss": -6.089174747467041, "global_step": 90713, "epoch": 2159} {"train_loss": -6.077658653259277, "global_step": 90714, "epoch": 2159} {"train_loss": -6.310304164886475, "global_step": 90715, "epoch": 2159} {"train_loss": -6.217115879058838, "global_step": 90716, "epoch": 2159} {"train_loss": -6.178544521331787, "global_step": 90717, "epoch": 2159} {"train_loss": -6.259987831115723, "global_step": 90718, "epoch": 2159} {"train_loss": -6.203075647354126, "global_step": 90719, "epoch": 2159, "val_loss": 67896.9921875} {"train_loss": -6.265298843383789, "global_step": 90720, "epoch": 2160} {"train_loss": -6.216505527496338, "global_step": 90721, "epoch": 2160} {"train_loss": -6.296333312988281, "global_step": 90722, "epoch": 2160} {"train_loss": -6.244817733764648, "global_step": 90723, "epoch": 2160} {"train_loss": -6.233067035675049, "global_step": 90724, "epoch": 2160} {"train_loss": -6.245451927185059, "global_step": 90725, "epoch": 2160} {"train_loss": -6.280015468597412, "global_step": 90726, "epoch": 2160} {"train_loss": -6.348654747009277, "global_step": 90727, "epoch": 2160} {"train_loss": -6.279461860656738, "global_step": 90728, "epoch": 2160} {"train_loss": -6.242979049682617, "global_step": 90729, "epoch": 2160} {"train_loss": -6.339329719543457, "global_step": 90730, "epoch": 2160} {"train_loss": -6.160789489746094, "global_step": 90731, "epoch": 2160} {"train_loss": -6.221763610839844, "global_step": 90732, "epoch": 2160} {"train_loss": -6.297224521636963, "global_step": 90733, "epoch": 2160} {"train_loss": -6.27451229095459, "global_step": 90734, "epoch": 2160} {"train_loss": -6.303178787231445, "global_step": 90735, "epoch": 2160} {"train_loss": -6.402526378631592, "global_step": 90736, "epoch": 2160} {"train_loss": -6.2525954246521, "global_step": 90737, "epoch": 2160} {"train_loss": -6.142794132232666, "global_step": 90738, "epoch": 2160} {"train_loss": -6.320779800415039, "global_step": 90739, "epoch": 2160} {"train_loss": -6.333377361297607, "global_step": 90740, "epoch": 2160} {"train_loss": -6.214599609375, "global_step": 90741, "epoch": 2160} {"train_loss": -6.110147476196289, "global_step": 90742, "epoch": 2160} {"train_loss": -6.172375679016113, "global_step": 90743, "epoch": 2160} {"train_loss": -6.2296857833862305, "global_step": 90744, "epoch": 2160} {"train_loss": -6.1920576095581055, "global_step": 90745, "epoch": 2160} {"train_loss": -6.334272384643555, "global_step": 90746, "epoch": 2160} {"train_loss": -6.185518264770508, "global_step": 90747, "epoch": 2160} {"train_loss": -6.202539443969727, "global_step": 90748, "epoch": 2160} {"train_loss": -6.200898170471191, "global_step": 90749, "epoch": 2160} {"train_loss": -6.2602033615112305, "global_step": 90750, "epoch": 2160} {"train_loss": -6.113884925842285, "global_step": 90751, "epoch": 2160} {"train_loss": -6.112166404724121, "global_step": 90752, "epoch": 2160} {"train_loss": -6.209158897399902, "global_step": 90753, "epoch": 2160} {"train_loss": -6.2594451904296875, "global_step": 90754, "epoch": 2160} {"train_loss": -6.184270858764648, "global_step": 90755, "epoch": 2160} {"train_loss": -6.223971843719482, "global_step": 90756, "epoch": 2160} {"train_loss": -6.216177940368652, "global_step": 90757, "epoch": 2160} {"train_loss": -6.272684097290039, "global_step": 90758, "epoch": 2160} {"train_loss": -6.319251537322998, "global_step": 90759, "epoch": 2160} {"train_loss": -6.118181228637695, "global_step": 90760, "epoch": 2160} {"train_loss": -6.239350670859928, "global_step": 90761, "epoch": 2160, "val_loss": 68080.4140625} {"train_loss": -6.041575908660889, "global_step": 90762, "epoch": 2161} {"train_loss": -6.192744731903076, "global_step": 90763, "epoch": 2161} {"train_loss": -6.100772857666016, "global_step": 90764, "epoch": 2161} {"train_loss": -6.063722610473633, "global_step": 90765, "epoch": 2161} {"train_loss": -6.158932209014893, "global_step": 90766, "epoch": 2161} {"train_loss": -6.185534477233887, "global_step": 90767, "epoch": 2161} {"train_loss": -6.103132247924805, "global_step": 90768, "epoch": 2161} {"train_loss": -6.196962356567383, "global_step": 90769, "epoch": 2161} {"train_loss": -6.189600944519043, "global_step": 90770, "epoch": 2161} {"train_loss": -6.363557815551758, "global_step": 90771, "epoch": 2161} {"train_loss": -6.219099044799805, "global_step": 90772, "epoch": 2161} {"train_loss": -6.204007148742676, "global_step": 90773, "epoch": 2161} {"train_loss": -6.225226879119873, "global_step": 90774, "epoch": 2161} {"train_loss": -6.1903228759765625, "global_step": 90775, "epoch": 2161} {"train_loss": -6.208123207092285, "global_step": 90776, "epoch": 2161} {"train_loss": -6.116793155670166, "global_step": 90777, "epoch": 2161} {"train_loss": -6.035588264465332, "global_step": 90778, "epoch": 2161} {"train_loss": -6.221845626831055, "global_step": 90779, "epoch": 2161} {"train_loss": -6.189660549163818, "global_step": 90780, "epoch": 2161} {"train_loss": -6.201770782470703, "global_step": 90781, "epoch": 2161} {"train_loss": -6.124382019042969, "global_step": 90782, "epoch": 2161} {"train_loss": -6.11700439453125, "global_step": 90783, "epoch": 2161} {"train_loss": -6.207179069519043, "global_step": 90784, "epoch": 2161} {"train_loss": -6.257879734039307, "global_step": 90785, "epoch": 2161} {"train_loss": -6.232658386230469, "global_step": 90786, "epoch": 2161} {"train_loss": -6.181502819061279, "global_step": 90787, "epoch": 2161} {"train_loss": -6.289872646331787, "global_step": 90788, "epoch": 2161} {"train_loss": -6.126395225524902, "global_step": 90789, "epoch": 2161} {"train_loss": -6.158061981201172, "global_step": 90790, "epoch": 2161} {"train_loss": -6.284146785736084, "global_step": 90791, "epoch": 2161} {"train_loss": -6.217469692230225, "global_step": 90792, "epoch": 2161} {"train_loss": -6.189417362213135, "global_step": 90793, "epoch": 2161} {"train_loss": -6.148412227630615, "global_step": 90794, "epoch": 2161} {"train_loss": -6.146162033081055, "global_step": 90795, "epoch": 2161} {"train_loss": -6.2579240798950195, "global_step": 90796, "epoch": 2161} {"train_loss": -6.212576866149902, "global_step": 90797, "epoch": 2161} {"train_loss": -6.269896984100342, "global_step": 90798, "epoch": 2161} {"train_loss": -6.301658630371094, "global_step": 90799, "epoch": 2161} {"train_loss": -6.281816005706787, "global_step": 90800, "epoch": 2161} {"train_loss": -6.209760665893555, "global_step": 90801, "epoch": 2161} {"train_loss": -6.313143730163574, "global_step": 90802, "epoch": 2161} {"train_loss": -6.195053883961269, "global_step": 90803, "epoch": 2161, "val_loss": 68033.1171875} {"train_loss": -6.172105312347412, "global_step": 90804, "epoch": 2162} {"train_loss": -6.269648551940918, "global_step": 90805, "epoch": 2162} {"train_loss": -6.2271623611450195, "global_step": 90806, "epoch": 2162} {"train_loss": -6.237119674682617, "global_step": 90807, "epoch": 2162} {"train_loss": -6.212222099304199, "global_step": 90808, "epoch": 2162} {"train_loss": -6.219912528991699, "global_step": 90809, "epoch": 2162} {"train_loss": -6.29273796081543, "global_step": 90810, "epoch": 2162} {"train_loss": -6.109394073486328, "global_step": 90811, "epoch": 2162} {"train_loss": -6.359560966491699, "global_step": 90812, "epoch": 2162} {"train_loss": -6.196315288543701, "global_step": 90813, "epoch": 2162} {"train_loss": -6.328542709350586, "global_step": 90814, "epoch": 2162} {"train_loss": -6.26670503616333, "global_step": 90815, "epoch": 2162} {"train_loss": -6.119890213012695, "global_step": 90816, "epoch": 2162} {"train_loss": -6.34797477722168, "global_step": 90817, "epoch": 2162} {"train_loss": -6.159466743469238, "global_step": 90818, "epoch": 2162} {"train_loss": -6.170243263244629, "global_step": 90819, "epoch": 2162} {"train_loss": -6.254881381988525, "global_step": 90820, "epoch": 2162} {"train_loss": -6.171019077301025, "global_step": 90821, "epoch": 2162} {"train_loss": -6.300417900085449, "global_step": 90822, "epoch": 2162} {"train_loss": -6.239513397216797, "global_step": 90823, "epoch": 2162} {"train_loss": -6.23818826675415, "global_step": 90824, "epoch": 2162} {"train_loss": -6.174300193786621, "global_step": 90825, "epoch": 2162} {"train_loss": -6.197911262512207, "global_step": 90826, "epoch": 2162} {"train_loss": -6.21482515335083, "global_step": 90827, "epoch": 2162} {"train_loss": -6.181159973144531, "global_step": 90828, "epoch": 2162} {"train_loss": -6.125032901763916, "global_step": 90829, "epoch": 2162} {"train_loss": -6.187401294708252, "global_step": 90830, "epoch": 2162} {"train_loss": -6.2395477294921875, "global_step": 90831, "epoch": 2162} {"train_loss": -6.144722938537598, "global_step": 90832, "epoch": 2162} {"train_loss": -6.330495357513428, "global_step": 90833, "epoch": 2162} {"train_loss": -6.103504657745361, "global_step": 90834, "epoch": 2162} {"train_loss": -6.334090709686279, "global_step": 90835, "epoch": 2162} {"train_loss": -6.255107879638672, "global_step": 90836, "epoch": 2162} {"train_loss": -6.268899917602539, "global_step": 90837, "epoch": 2162} {"train_loss": -6.286078453063965, "global_step": 90838, "epoch": 2162} {"train_loss": -6.442392349243164, "global_step": 90839, "epoch": 2162} {"train_loss": -6.23018741607666, "global_step": 90840, "epoch": 2162} {"train_loss": -6.228992462158203, "global_step": 90841, "epoch": 2162} {"train_loss": -6.260541915893555, "global_step": 90842, "epoch": 2162} {"train_loss": -6.228634834289551, "global_step": 90843, "epoch": 2162} {"train_loss": -6.245236396789551, "global_step": 90844, "epoch": 2162} {"train_loss": -6.234141906102498, "global_step": 90845, "epoch": 2162, "val_loss": 68026.984375} {"train_loss": -6.166126251220703, "global_step": 90846, "epoch": 2163} {"train_loss": -6.244970798492432, "global_step": 90847, "epoch": 2163} {"train_loss": -6.2213873863220215, "global_step": 90848, "epoch": 2163} {"train_loss": -6.215228080749512, "global_step": 90849, "epoch": 2163} {"train_loss": -6.137182235717773, "global_step": 90850, "epoch": 2163} {"train_loss": -6.328187465667725, "global_step": 90851, "epoch": 2163} {"train_loss": -6.198224067687988, "global_step": 90852, "epoch": 2163} {"train_loss": -6.352183818817139, "global_step": 90853, "epoch": 2163} {"train_loss": -6.249468803405762, "global_step": 90854, "epoch": 2163} {"train_loss": -6.088770389556885, "global_step": 90855, "epoch": 2163} {"train_loss": -6.178501129150391, "global_step": 90856, "epoch": 2163} {"train_loss": -6.251070022583008, "global_step": 90857, "epoch": 2163} {"train_loss": -6.207894325256348, "global_step": 90858, "epoch": 2163} {"train_loss": -6.258380889892578, "global_step": 90859, "epoch": 2163} {"train_loss": -6.161505699157715, "global_step": 90860, "epoch": 2163} {"train_loss": -6.251245498657227, "global_step": 90861, "epoch": 2163} {"train_loss": -6.272101879119873, "global_step": 90862, "epoch": 2163} {"train_loss": -6.258880615234375, "global_step": 90863, "epoch": 2163} {"train_loss": -6.372855186462402, "global_step": 90864, "epoch": 2163} {"train_loss": -6.344278335571289, "global_step": 90865, "epoch": 2163} {"train_loss": -6.380062103271484, "global_step": 90866, "epoch": 2163} {"train_loss": -6.258705139160156, "global_step": 90867, "epoch": 2163} {"train_loss": -6.219714164733887, "global_step": 90868, "epoch": 2163} {"train_loss": -6.311008453369141, "global_step": 90869, "epoch": 2163} {"train_loss": -6.266274452209473, "global_step": 90870, "epoch": 2163} {"train_loss": -6.313138961791992, "global_step": 90871, "epoch": 2163} {"train_loss": -6.333613395690918, "global_step": 90872, "epoch": 2163} {"train_loss": -6.272997856140137, "global_step": 90873, "epoch": 2163} {"train_loss": -6.217698097229004, "global_step": 90874, "epoch": 2163} {"train_loss": -6.317763328552246, "global_step": 90875, "epoch": 2163} {"train_loss": -6.294528961181641, "global_step": 90876, "epoch": 2163} {"train_loss": -6.349945545196533, "global_step": 90877, "epoch": 2163} {"train_loss": -6.258271217346191, "global_step": 90878, "epoch": 2163} {"train_loss": -6.1353912353515625, "global_step": 90879, "epoch": 2163} {"train_loss": -6.250576019287109, "global_step": 90880, "epoch": 2163} {"train_loss": -6.040289878845215, "global_step": 90881, "epoch": 2163} {"train_loss": -6.169320583343506, "global_step": 90882, "epoch": 2163} {"train_loss": -6.327467918395996, "global_step": 90883, "epoch": 2163} {"train_loss": -6.293290615081787, "global_step": 90884, "epoch": 2163} {"train_loss": -6.261309623718262, "global_step": 90885, "epoch": 2163} {"train_loss": -6.37442684173584, "global_step": 90886, "epoch": 2163} {"train_loss": -6.253642104920887, "global_step": 90887, "epoch": 2163, "val_loss": 67786.4375} {"train_loss": -6.178475379943848, "global_step": 90888, "epoch": 2164} {"train_loss": -6.303895473480225, "global_step": 90889, "epoch": 2164} {"train_loss": -6.186949729919434, "global_step": 90890, "epoch": 2164} {"train_loss": -6.329129219055176, "global_step": 90891, "epoch": 2164} {"train_loss": -6.192960262298584, "global_step": 90892, "epoch": 2164} {"train_loss": -6.306032180786133, "global_step": 90893, "epoch": 2164} {"train_loss": -6.287315368652344, "global_step": 90894, "epoch": 2164} {"train_loss": -6.24130392074585, "global_step": 90895, "epoch": 2164} {"train_loss": -6.327963829040527, "global_step": 90896, "epoch": 2164} {"train_loss": -6.277924537658691, "global_step": 90897, "epoch": 2164} {"train_loss": -6.368757724761963, "global_step": 90898, "epoch": 2164} {"train_loss": -6.258392333984375, "global_step": 90899, "epoch": 2164} {"train_loss": -6.302260398864746, "global_step": 90900, "epoch": 2164} {"train_loss": -6.274951934814453, "global_step": 90901, "epoch": 2164} {"train_loss": -6.223529815673828, "global_step": 90902, "epoch": 2164} {"train_loss": -6.463652610778809, "global_step": 90903, "epoch": 2164} {"train_loss": -6.26533842086792, "global_step": 90904, "epoch": 2164} {"train_loss": -6.292411804199219, "global_step": 90905, "epoch": 2164} {"train_loss": -6.2176408767700195, "global_step": 90906, "epoch": 2164} {"train_loss": -6.3348283767700195, "global_step": 90907, "epoch": 2164} {"train_loss": -6.217130661010742, "global_step": 90908, "epoch": 2164} {"train_loss": -6.352441787719727, "global_step": 90909, "epoch": 2164} {"train_loss": -6.358443260192871, "global_step": 90910, "epoch": 2164} {"train_loss": -6.262716293334961, "global_step": 90911, "epoch": 2164} {"train_loss": -6.237576007843018, "global_step": 90912, "epoch": 2164} {"train_loss": -6.131312370300293, "global_step": 90913, "epoch": 2164} {"train_loss": -6.296542167663574, "global_step": 90914, "epoch": 2164} {"train_loss": -6.204552173614502, "global_step": 90915, "epoch": 2164} {"train_loss": -6.318392753601074, "global_step": 90916, "epoch": 2164} {"train_loss": -6.231957912445068, "global_step": 90917, "epoch": 2164} {"train_loss": -6.2061567306518555, "global_step": 90918, "epoch": 2164} {"train_loss": -6.315062522888184, "global_step": 90919, "epoch": 2164} {"train_loss": -6.015250205993652, "global_step": 90920, "epoch": 2164} {"train_loss": -6.189082622528076, "global_step": 90921, "epoch": 2164} {"train_loss": -6.2745561599731445, "global_step": 90922, "epoch": 2164} {"train_loss": -6.1953444480896, "global_step": 90923, "epoch": 2164} {"train_loss": -6.192277431488037, "global_step": 90924, "epoch": 2164} {"train_loss": -6.258413791656494, "global_step": 90925, "epoch": 2164} {"train_loss": -6.264272689819336, "global_step": 90926, "epoch": 2164} {"train_loss": -6.177090644836426, "global_step": 90927, "epoch": 2164} {"train_loss": -6.187500953674316, "global_step": 90928, "epoch": 2164} {"train_loss": -6.25338888168335, "global_step": 90929, "epoch": 2164, "val_loss": 68240.3515625} {"train_loss": -6.281867504119873, "global_step": 90930, "epoch": 2165} {"train_loss": -6.25736141204834, "global_step": 90931, "epoch": 2165} {"train_loss": -6.169158935546875, "global_step": 90932, "epoch": 2165} {"train_loss": -6.274770736694336, "global_step": 90933, "epoch": 2165} {"train_loss": -6.143601417541504, "global_step": 90934, "epoch": 2165} {"train_loss": -6.271658897399902, "global_step": 90935, "epoch": 2165} {"train_loss": -6.298245906829834, "global_step": 90936, "epoch": 2165} {"train_loss": -6.202582359313965, "global_step": 90937, "epoch": 2165} {"train_loss": -6.306922912597656, "global_step": 90938, "epoch": 2165} {"train_loss": -6.277087211608887, "global_step": 90939, "epoch": 2165} {"train_loss": -6.245105266571045, "global_step": 90940, "epoch": 2165} {"train_loss": -6.300713539123535, "global_step": 90941, "epoch": 2165} {"train_loss": -6.25136661529541, "global_step": 90942, "epoch": 2165} {"train_loss": -6.196030139923096, "global_step": 90943, "epoch": 2165} {"train_loss": -6.254327774047852, "global_step": 90944, "epoch": 2165} {"train_loss": -6.091732501983643, "global_step": 90945, "epoch": 2165} {"train_loss": -6.2715630531311035, "global_step": 90946, "epoch": 2165} {"train_loss": -6.133631706237793, "global_step": 90947, "epoch": 2165} {"train_loss": -6.0822553634643555, "global_step": 90948, "epoch": 2165} {"train_loss": -6.3329267501831055, "global_step": 90949, "epoch": 2165} {"train_loss": -6.311037063598633, "global_step": 90950, "epoch": 2165} {"train_loss": -6.252216339111328, "global_step": 90951, "epoch": 2165} {"train_loss": -6.2845377922058105, "global_step": 90952, "epoch": 2165} {"train_loss": -6.219959735870361, "global_step": 90953, "epoch": 2165} {"train_loss": -6.292632102966309, "global_step": 90954, "epoch": 2165} {"train_loss": -6.372306823730469, "global_step": 90955, "epoch": 2165} {"train_loss": -6.2476487159729, "global_step": 90956, "epoch": 2165} {"train_loss": -6.212944507598877, "global_step": 90957, "epoch": 2165} {"train_loss": -6.2079877853393555, "global_step": 90958, "epoch": 2165} {"train_loss": -6.309122562408447, "global_step": 90959, "epoch": 2165} {"train_loss": -6.325875282287598, "global_step": 90960, "epoch": 2165} {"train_loss": -6.325845241546631, "global_step": 90961, "epoch": 2165} {"train_loss": -6.284478187561035, "global_step": 90962, "epoch": 2165} {"train_loss": -6.165009021759033, "global_step": 90963, "epoch": 2165} {"train_loss": -6.177195072174072, "global_step": 90964, "epoch": 2165} {"train_loss": -6.217333793640137, "global_step": 90965, "epoch": 2165} {"train_loss": -6.250372886657715, "global_step": 90966, "epoch": 2165} {"train_loss": -6.27816915512085, "global_step": 90967, "epoch": 2165} {"train_loss": -6.150666236877441, "global_step": 90968, "epoch": 2165} {"train_loss": -6.206387042999268, "global_step": 90969, "epoch": 2165} {"train_loss": -6.246642589569092, "global_step": 90970, "epoch": 2165} {"train_loss": -6.242995057787214, "global_step": 90971, "epoch": 2165, "val_loss": 68078.6484375} {"train_loss": -6.2139482498168945, "global_step": 90972, "epoch": 2166} {"train_loss": -6.202890396118164, "global_step": 90973, "epoch": 2166} {"train_loss": -6.076845169067383, "global_step": 90974, "epoch": 2166} {"train_loss": -6.208788871765137, "global_step": 90975, "epoch": 2166} {"train_loss": -6.201828956604004, "global_step": 90976, "epoch": 2166} {"train_loss": -6.2035932540893555, "global_step": 90977, "epoch": 2166} {"train_loss": -6.2629714012146, "global_step": 90978, "epoch": 2166} {"train_loss": -6.1618452072143555, "global_step": 90979, "epoch": 2166} {"train_loss": -6.16693115234375, "global_step": 90980, "epoch": 2166} {"train_loss": -6.169098854064941, "global_step": 90981, "epoch": 2166} {"train_loss": -6.253761291503906, "global_step": 90982, "epoch": 2166} {"train_loss": -6.1167826652526855, "global_step": 90983, "epoch": 2166} {"train_loss": -6.148446559906006, "global_step": 90984, "epoch": 2166} {"train_loss": -6.22860050201416, "global_step": 90985, "epoch": 2166} {"train_loss": -6.303436279296875, "global_step": 90986, "epoch": 2166} {"train_loss": -6.231359481811523, "global_step": 90987, "epoch": 2166} {"train_loss": -6.313364505767822, "global_step": 90988, "epoch": 2166} {"train_loss": -6.268488883972168, "global_step": 90989, "epoch": 2166} {"train_loss": -6.232304573059082, "global_step": 90990, "epoch": 2166} {"train_loss": -6.322216033935547, "global_step": 90991, "epoch": 2166} {"train_loss": -6.315625190734863, "global_step": 90992, "epoch": 2166} {"train_loss": -6.252731800079346, "global_step": 90993, "epoch": 2166} {"train_loss": -6.26719331741333, "global_step": 90994, "epoch": 2166} {"train_loss": -6.234431266784668, "global_step": 90995, "epoch": 2166} {"train_loss": -6.3266143798828125, "global_step": 90996, "epoch": 2166} {"train_loss": -6.318943023681641, "global_step": 90997, "epoch": 2166} {"train_loss": -6.346528053283691, "global_step": 90998, "epoch": 2166} {"train_loss": -6.208930015563965, "global_step": 90999, "epoch": 2166} {"train_loss": -6.208784103393555, "global_step": 91000, "epoch": 2166} {"train_loss": -6.274138927459717, "global_step": 91001, "epoch": 2166} {"train_loss": -6.314591407775879, "global_step": 91002, "epoch": 2166} {"train_loss": -6.297593116760254, "global_step": 91003, "epoch": 2166} {"train_loss": -6.267246246337891, "global_step": 91004, "epoch": 2166} {"train_loss": -6.273185729980469, "global_step": 91005, "epoch": 2166} {"train_loss": -6.365482330322266, "global_step": 91006, "epoch": 2166} {"train_loss": -6.225696563720703, "global_step": 91007, "epoch": 2166} {"train_loss": -6.181373596191406, "global_step": 91008, "epoch": 2166} {"train_loss": -6.195821762084961, "global_step": 91009, "epoch": 2166} {"train_loss": -6.274111747741699, "global_step": 91010, "epoch": 2166} {"train_loss": -6.1862874031066895, "global_step": 91011, "epoch": 2166} {"train_loss": -6.263049602508545, "global_step": 91012, "epoch": 2166} {"train_loss": -6.242128474371774, "global_step": 91013, "epoch": 2166, "val_loss": 68253.46875} {"train_loss": -6.31378173828125, "global_step": 91014, "epoch": 2167} {"train_loss": -6.219388961791992, "global_step": 91015, "epoch": 2167} {"train_loss": -6.188310623168945, "global_step": 91016, "epoch": 2167} {"train_loss": -6.268028259277344, "global_step": 91017, "epoch": 2167} {"train_loss": -6.176758766174316, "global_step": 91018, "epoch": 2167} {"train_loss": -6.1943817138671875, "global_step": 91019, "epoch": 2167} {"train_loss": -6.025062084197998, "global_step": 91020, "epoch": 2167} {"train_loss": -6.387795925140381, "global_step": 91021, "epoch": 2167} {"train_loss": -6.065953254699707, "global_step": 91022, "epoch": 2167} {"train_loss": -6.148859024047852, "global_step": 91023, "epoch": 2167} {"train_loss": -6.179218769073486, "global_step": 91024, "epoch": 2167} {"train_loss": -6.091949462890625, "global_step": 91025, "epoch": 2167} {"train_loss": -6.361298084259033, "global_step": 91026, "epoch": 2167} {"train_loss": -6.10888671875, "global_step": 91027, "epoch": 2167} {"train_loss": -6.1538825035095215, "global_step": 91028, "epoch": 2167} {"train_loss": -6.027829170227051, "global_step": 91029, "epoch": 2167} {"train_loss": -6.25941276550293, "global_step": 91030, "epoch": 2167} {"train_loss": -5.987823009490967, "global_step": 91031, "epoch": 2167} {"train_loss": -6.292021751403809, "global_step": 91032, "epoch": 2167} {"train_loss": -6.203104019165039, "global_step": 91033, "epoch": 2167} {"train_loss": -6.152237892150879, "global_step": 91034, "epoch": 2167} {"train_loss": -6.256262302398682, "global_step": 91035, "epoch": 2167} {"train_loss": -6.155097007751465, "global_step": 91036, "epoch": 2167} {"train_loss": -6.208395957946777, "global_step": 91037, "epoch": 2167} {"train_loss": -6.207192420959473, "global_step": 91038, "epoch": 2167} {"train_loss": -6.126534461975098, "global_step": 91039, "epoch": 2167} {"train_loss": -6.250593185424805, "global_step": 91040, "epoch": 2167} {"train_loss": -6.171744346618652, "global_step": 91041, "epoch": 2167} {"train_loss": -6.2981672286987305, "global_step": 91042, "epoch": 2167} {"train_loss": -6.219236373901367, "global_step": 91043, "epoch": 2167} {"train_loss": -6.206578254699707, "global_step": 91044, "epoch": 2167} {"train_loss": -6.383172035217285, "global_step": 91045, "epoch": 2167} {"train_loss": -6.325953483581543, "global_step": 91046, "epoch": 2167} {"train_loss": -6.32342004776001, "global_step": 91047, "epoch": 2167} {"train_loss": -6.2719597816467285, "global_step": 91048, "epoch": 2167} {"train_loss": -6.230663299560547, "global_step": 91049, "epoch": 2167} {"train_loss": -6.242287635803223, "global_step": 91050, "epoch": 2167} {"train_loss": -6.284145355224609, "global_step": 91051, "epoch": 2167} {"train_loss": -6.331998825073242, "global_step": 91052, "epoch": 2167} {"train_loss": -6.256133079528809, "global_step": 91053, "epoch": 2167} {"train_loss": -6.281042098999023, "global_step": 91054, "epoch": 2167} {"train_loss": -6.214428311302548, "global_step": 91055, "epoch": 2167, "val_loss": 68248.3359375} {"train_loss": -6.2357354164123535, "global_step": 91056, "epoch": 2168} {"train_loss": -6.263728141784668, "global_step": 91057, "epoch": 2168} {"train_loss": -6.237251281738281, "global_step": 91058, "epoch": 2168} {"train_loss": -6.300141334533691, "global_step": 91059, "epoch": 2168} {"train_loss": -6.289071559906006, "global_step": 91060, "epoch": 2168} {"train_loss": -6.376073837280273, "global_step": 91061, "epoch": 2168} {"train_loss": -6.261541366577148, "global_step": 91062, "epoch": 2168} {"train_loss": -6.308916091918945, "global_step": 91063, "epoch": 2168} {"train_loss": -6.2145233154296875, "global_step": 91064, "epoch": 2168} {"train_loss": -6.1550140380859375, "global_step": 91065, "epoch": 2168} {"train_loss": -6.268892288208008, "global_step": 91066, "epoch": 2168} {"train_loss": -6.2486467361450195, "global_step": 91067, "epoch": 2168} {"train_loss": -6.201781749725342, "global_step": 91068, "epoch": 2168} {"train_loss": -6.263287544250488, "global_step": 91069, "epoch": 2168} {"train_loss": -6.2143049240112305, "global_step": 91070, "epoch": 2168} {"train_loss": -6.413339614868164, "global_step": 91071, "epoch": 2168} {"train_loss": -6.242490768432617, "global_step": 91072, "epoch": 2168} {"train_loss": -6.242180824279785, "global_step": 91073, "epoch": 2168} {"train_loss": -6.1248602867126465, "global_step": 91074, "epoch": 2168} {"train_loss": -6.337864875793457, "global_step": 91075, "epoch": 2168} {"train_loss": -6.218815326690674, "global_step": 91076, "epoch": 2168} {"train_loss": -6.286413192749023, "global_step": 91077, "epoch": 2168} {"train_loss": -6.238459587097168, "global_step": 91078, "epoch": 2168} {"train_loss": -6.154394149780273, "global_step": 91079, "epoch": 2168} {"train_loss": -6.249786853790283, "global_step": 91080, "epoch": 2168} {"train_loss": -6.249875545501709, "global_step": 91081, "epoch": 2168} {"train_loss": -6.290148735046387, "global_step": 91082, "epoch": 2168} {"train_loss": -6.095390319824219, "global_step": 91083, "epoch": 2168} {"train_loss": -6.28859806060791, "global_step": 91084, "epoch": 2168} {"train_loss": -6.220083236694336, "global_step": 91085, "epoch": 2168} {"train_loss": -6.359550952911377, "global_step": 91086, "epoch": 2168} {"train_loss": -6.245983123779297, "global_step": 91087, "epoch": 2168} {"train_loss": -6.2456889152526855, "global_step": 91088, "epoch": 2168} {"train_loss": -6.293720722198486, "global_step": 91089, "epoch": 2168} {"train_loss": -6.220969200134277, "global_step": 91090, "epoch": 2168} {"train_loss": -6.336157321929932, "global_step": 91091, "epoch": 2168} {"train_loss": -6.226428508758545, "global_step": 91092, "epoch": 2168} {"train_loss": -6.289120197296143, "global_step": 91093, "epoch": 2168} {"train_loss": -6.2155046463012695, "global_step": 91094, "epoch": 2168} {"train_loss": -6.240542411804199, "global_step": 91095, "epoch": 2168} {"train_loss": -6.276527404785156, "global_step": 91096, "epoch": 2168} {"train_loss": -6.254866429737636, "global_step": 91097, "epoch": 2168, "val_loss": 67885.4453125} {"train_loss": -6.3232879638671875, "global_step": 91098, "epoch": 2169} {"train_loss": -6.312046051025391, "global_step": 91099, "epoch": 2169} {"train_loss": -6.223071098327637, "global_step": 91100, "epoch": 2169} {"train_loss": -6.297573089599609, "global_step": 91101, "epoch": 2169} {"train_loss": -6.217243194580078, "global_step": 91102, "epoch": 2169} {"train_loss": -6.2976837158203125, "global_step": 91103, "epoch": 2169} {"train_loss": -6.209449768066406, "global_step": 91104, "epoch": 2169} {"train_loss": -6.203620910644531, "global_step": 91105, "epoch": 2169} {"train_loss": -6.22512149810791, "global_step": 91106, "epoch": 2169} {"train_loss": -6.325359344482422, "global_step": 91107, "epoch": 2169} {"train_loss": -6.355820655822754, "global_step": 91108, "epoch": 2169} {"train_loss": -6.250533580780029, "global_step": 91109, "epoch": 2169} {"train_loss": -6.37900447845459, "global_step": 91110, "epoch": 2169} {"train_loss": -6.174718856811523, "global_step": 91111, "epoch": 2169} {"train_loss": -6.286243438720703, "global_step": 91112, "epoch": 2169} {"train_loss": -6.2513227462768555, "global_step": 91113, "epoch": 2169} {"train_loss": -6.235684394836426, "global_step": 91114, "epoch": 2169} {"train_loss": -6.424568176269531, "global_step": 91115, "epoch": 2169} {"train_loss": -6.142210960388184, "global_step": 91116, "epoch": 2169} {"train_loss": -6.340947151184082, "global_step": 91117, "epoch": 2169} {"train_loss": -6.150576591491699, "global_step": 91118, "epoch": 2169} {"train_loss": -6.2702226638793945, "global_step": 91119, "epoch": 2169} {"train_loss": -6.3398237228393555, "global_step": 91120, "epoch": 2169} {"train_loss": -6.410953521728516, "global_step": 91121, "epoch": 2169} {"train_loss": -6.251682281494141, "global_step": 91122, "epoch": 2169} {"train_loss": -6.1844024658203125, "global_step": 91123, "epoch": 2169} {"train_loss": -6.34549617767334, "global_step": 91124, "epoch": 2169} {"train_loss": -6.274420738220215, "global_step": 91125, "epoch": 2169} {"train_loss": -6.320948600769043, "global_step": 91126, "epoch": 2169} {"train_loss": -6.165014266967773, "global_step": 91127, "epoch": 2169} {"train_loss": -6.2496819496154785, "global_step": 91128, "epoch": 2169} {"train_loss": -6.3073530197143555, "global_step": 91129, "epoch": 2169} {"train_loss": -6.244543075561523, "global_step": 91130, "epoch": 2169} {"train_loss": -6.283310413360596, "global_step": 91131, "epoch": 2169} {"train_loss": -6.345772743225098, "global_step": 91132, "epoch": 2169} {"train_loss": -6.225122451782227, "global_step": 91133, "epoch": 2169} {"train_loss": -6.274319648742676, "global_step": 91134, "epoch": 2169} {"train_loss": -6.370621681213379, "global_step": 91135, "epoch": 2169} {"train_loss": -6.249383926391602, "global_step": 91136, "epoch": 2169} {"train_loss": -6.204092502593994, "global_step": 91137, "epoch": 2169} {"train_loss": -6.314726829528809, "global_step": 91138, "epoch": 2169} {"train_loss": -6.277239890325637, "global_step": 91139, "epoch": 2169, "val_loss": 68105.4296875} {"train_loss": -6.368377685546875, "global_step": 91140, "epoch": 2170} {"train_loss": -6.15922737121582, "global_step": 91141, "epoch": 2170} {"train_loss": -6.359945297241211, "global_step": 91142, "epoch": 2170} {"train_loss": -6.234575271606445, "global_step": 91143, "epoch": 2170} {"train_loss": -6.255866050720215, "global_step": 91144, "epoch": 2170} {"train_loss": -6.278171539306641, "global_step": 91145, "epoch": 2170} {"train_loss": -6.307095527648926, "global_step": 91146, "epoch": 2170} {"train_loss": -6.222164630889893, "global_step": 91147, "epoch": 2170} {"train_loss": -6.226181507110596, "global_step": 91148, "epoch": 2170} {"train_loss": -6.236407279968262, "global_step": 91149, "epoch": 2170} {"train_loss": -6.12710428237915, "global_step": 91150, "epoch": 2170} {"train_loss": -6.142533779144287, "global_step": 91151, "epoch": 2170} {"train_loss": -6.230218410491943, "global_step": 91152, "epoch": 2170} {"train_loss": -6.148588180541992, "global_step": 91153, "epoch": 2170} {"train_loss": -6.208010673522949, "global_step": 91154, "epoch": 2170} {"train_loss": -6.126791954040527, "global_step": 91155, "epoch": 2170} {"train_loss": -5.97768497467041, "global_step": 91156, "epoch": 2170} {"train_loss": -6.0912275314331055, "global_step": 91157, "epoch": 2170} {"train_loss": -6.155738830566406, "global_step": 91158, "epoch": 2170} {"train_loss": -6.140987873077393, "global_step": 91159, "epoch": 2170} {"train_loss": -6.323448181152344, "global_step": 91160, "epoch": 2170} {"train_loss": -6.053427696228027, "global_step": 91161, "epoch": 2170} {"train_loss": -6.217410087585449, "global_step": 91162, "epoch": 2170} {"train_loss": -6.269432067871094, "global_step": 91163, "epoch": 2170} {"train_loss": -6.279995918273926, "global_step": 91164, "epoch": 2170} {"train_loss": -6.235607147216797, "global_step": 91165, "epoch": 2170} {"train_loss": -6.177948951721191, "global_step": 91166, "epoch": 2170} {"train_loss": -6.275361061096191, "global_step": 91167, "epoch": 2170} {"train_loss": -6.1930251121521, "global_step": 91168, "epoch": 2170} {"train_loss": -6.179706573486328, "global_step": 91169, "epoch": 2170} {"train_loss": -6.1931867599487305, "global_step": 91170, "epoch": 2170} {"train_loss": -6.300258636474609, "global_step": 91171, "epoch": 2170} {"train_loss": -6.28299617767334, "global_step": 91172, "epoch": 2170} {"train_loss": -6.188374996185303, "global_step": 91173, "epoch": 2170} {"train_loss": -6.235918998718262, "global_step": 91174, "epoch": 2170} {"train_loss": -6.24500846862793, "global_step": 91175, "epoch": 2170} {"train_loss": -6.156720161437988, "global_step": 91176, "epoch": 2170} {"train_loss": -6.322726249694824, "global_step": 91177, "epoch": 2170} {"train_loss": -6.273074150085449, "global_step": 91178, "epoch": 2170} {"train_loss": -6.229924201965332, "global_step": 91179, "epoch": 2170} {"train_loss": -6.284995079040527, "global_step": 91180, "epoch": 2170} {"train_loss": -6.215102808816092, "global_step": 91181, "epoch": 2170, "val_loss": 67965.546875} {"train_loss": -6.330795764923096, "global_step": 91182, "epoch": 2171} {"train_loss": -6.320193290710449, "global_step": 91183, "epoch": 2171} {"train_loss": -6.210528373718262, "global_step": 91184, "epoch": 2171} {"train_loss": -6.13360071182251, "global_step": 91185, "epoch": 2171} {"train_loss": -6.1622161865234375, "global_step": 91186, "epoch": 2171} {"train_loss": -6.190801620483398, "global_step": 91187, "epoch": 2171} {"train_loss": -6.2448883056640625, "global_step": 91188, "epoch": 2171} {"train_loss": -6.300986289978027, "global_step": 91189, "epoch": 2171} {"train_loss": -6.250459671020508, "global_step": 91190, "epoch": 2171} {"train_loss": -6.145956993103027, "global_step": 91191, "epoch": 2171} {"train_loss": -6.1271491050720215, "global_step": 91192, "epoch": 2171} {"train_loss": -6.261686325073242, "global_step": 91193, "epoch": 2171} {"train_loss": -6.206119537353516, "global_step": 91194, "epoch": 2171} {"train_loss": -6.174018859863281, "global_step": 91195, "epoch": 2171} {"train_loss": -6.1587629318237305, "global_step": 91196, "epoch": 2171} {"train_loss": -6.166207313537598, "global_step": 91197, "epoch": 2171} {"train_loss": -6.29788064956665, "global_step": 91198, "epoch": 2171} {"train_loss": -6.052801132202148, "global_step": 91199, "epoch": 2171} {"train_loss": -6.270276069641113, "global_step": 91200, "epoch": 2171} {"train_loss": -6.0760698318481445, "global_step": 91201, "epoch": 2171} {"train_loss": -6.1931328773498535, "global_step": 91202, "epoch": 2171} {"train_loss": -6.214529037475586, "global_step": 91203, "epoch": 2171} {"train_loss": -6.138199329376221, "global_step": 91204, "epoch": 2171} {"train_loss": -6.304790496826172, "global_step": 91205, "epoch": 2171} {"train_loss": -6.242842674255371, "global_step": 91206, "epoch": 2171} {"train_loss": -6.169056415557861, "global_step": 91207, "epoch": 2171} {"train_loss": -6.156567096710205, "global_step": 91208, "epoch": 2171} {"train_loss": -6.121382713317871, "global_step": 91209, "epoch": 2171} {"train_loss": -6.367733478546143, "global_step": 91210, "epoch": 2171} {"train_loss": -6.09486722946167, "global_step": 91211, "epoch": 2171} {"train_loss": -6.230640411376953, "global_step": 91212, "epoch": 2171} {"train_loss": -6.103855133056641, "global_step": 91213, "epoch": 2171} {"train_loss": -6.136190891265869, "global_step": 91214, "epoch": 2171} {"train_loss": -6.2247209548950195, "global_step": 91215, "epoch": 2171} {"train_loss": -6.273083209991455, "global_step": 91216, "epoch": 2171} {"train_loss": -6.296608924865723, "global_step": 91217, "epoch": 2171} {"train_loss": -6.285561561584473, "global_step": 91218, "epoch": 2171} {"train_loss": -6.217315673828125, "global_step": 91219, "epoch": 2171} {"train_loss": -6.2909626960754395, "global_step": 91220, "epoch": 2171} {"train_loss": -6.241981506347656, "global_step": 91221, "epoch": 2171} {"train_loss": -6.325395107269287, "global_step": 91222, "epoch": 2171} {"train_loss": -6.2143325578598745, "global_step": 91223, "epoch": 2171, "val_loss": 67960.6640625} {"train_loss": -6.3439249992370605, "global_step": 91224, "epoch": 2172} {"train_loss": -6.257089614868164, "global_step": 91225, "epoch": 2172} {"train_loss": -6.370192050933838, "global_step": 91226, "epoch": 2172} {"train_loss": -6.275801658630371, "global_step": 91227, "epoch": 2172} {"train_loss": -6.152805328369141, "global_step": 91228, "epoch": 2172} {"train_loss": -6.243985176086426, "global_step": 91229, "epoch": 2172} {"train_loss": -6.3145036697387695, "global_step": 91230, "epoch": 2172} {"train_loss": -6.306938171386719, "global_step": 91231, "epoch": 2172} {"train_loss": -6.255229949951172, "global_step": 91232, "epoch": 2172} {"train_loss": -6.352599143981934, "global_step": 91233, "epoch": 2172} {"train_loss": -6.344156265258789, "global_step": 91234, "epoch": 2172} {"train_loss": -6.305595874786377, "global_step": 91235, "epoch": 2172} {"train_loss": -6.25589656829834, "global_step": 91236, "epoch": 2172} {"train_loss": -6.169604778289795, "global_step": 91237, "epoch": 2172} {"train_loss": -6.207744598388672, "global_step": 91238, "epoch": 2172} {"train_loss": -6.080190658569336, "global_step": 91239, "epoch": 2172} {"train_loss": -6.19594669342041, "global_step": 91240, "epoch": 2172} {"train_loss": -6.2432661056518555, "global_step": 91241, "epoch": 2172} {"train_loss": -6.285189628601074, "global_step": 91242, "epoch": 2172} {"train_loss": -6.209169864654541, "global_step": 91243, "epoch": 2172} {"train_loss": -6.254581928253174, "global_step": 91244, "epoch": 2172} {"train_loss": -6.258615970611572, "global_step": 91245, "epoch": 2172} {"train_loss": -6.229660511016846, "global_step": 91246, "epoch": 2172} {"train_loss": -6.268838405609131, "global_step": 91247, "epoch": 2172} {"train_loss": -6.31138277053833, "global_step": 91248, "epoch": 2172} {"train_loss": -6.224336624145508, "global_step": 91249, "epoch": 2172} {"train_loss": -6.370857238769531, "global_step": 91250, "epoch": 2172} {"train_loss": -6.195224285125732, "global_step": 91251, "epoch": 2172} {"train_loss": -6.125884056091309, "global_step": 91252, "epoch": 2172} {"train_loss": -6.2119059562683105, "global_step": 91253, "epoch": 2172} {"train_loss": -6.1483869552612305, "global_step": 91254, "epoch": 2172} {"train_loss": -6.22322940826416, "global_step": 91255, "epoch": 2172} {"train_loss": -6.1552252769470215, "global_step": 91256, "epoch": 2172} {"train_loss": -6.256211280822754, "global_step": 91257, "epoch": 2172} {"train_loss": -6.287105560302734, "global_step": 91258, "epoch": 2172} {"train_loss": -6.13561487197876, "global_step": 91259, "epoch": 2172} {"train_loss": -6.182322025299072, "global_step": 91260, "epoch": 2172} {"train_loss": -6.281970977783203, "global_step": 91261, "epoch": 2172} {"train_loss": -6.210626125335693, "global_step": 91262, "epoch": 2172} {"train_loss": -6.168344497680664, "global_step": 91263, "epoch": 2172} {"train_loss": -6.2109785079956055, "global_step": 91264, "epoch": 2172} {"train_loss": -6.238563866842361, "global_step": 91265, "epoch": 2172, "val_loss": 67884.2421875} {"train_loss": -6.153567790985107, "global_step": 91266, "epoch": 2173} {"train_loss": -6.233034133911133, "global_step": 91267, "epoch": 2173} {"train_loss": -6.227944374084473, "global_step": 91268, "epoch": 2173} {"train_loss": -6.22244930267334, "global_step": 91269, "epoch": 2173} {"train_loss": -6.280441761016846, "global_step": 91270, "epoch": 2173} {"train_loss": -6.144854545593262, "global_step": 91271, "epoch": 2173} {"train_loss": -6.152958393096924, "global_step": 91272, "epoch": 2173} {"train_loss": -6.222397327423096, "global_step": 91273, "epoch": 2173} {"train_loss": -6.2267069816589355, "global_step": 91274, "epoch": 2173} {"train_loss": -6.358488082885742, "global_step": 91275, "epoch": 2173} {"train_loss": -6.266373634338379, "global_step": 91276, "epoch": 2173} {"train_loss": -6.235548973083496, "global_step": 91277, "epoch": 2173} {"train_loss": -6.263611793518066, "global_step": 91278, "epoch": 2173} {"train_loss": -6.1709675788879395, "global_step": 91279, "epoch": 2173} {"train_loss": -6.323306560516357, "global_step": 91280, "epoch": 2173} {"train_loss": -6.227619171142578, "global_step": 91281, "epoch": 2173} {"train_loss": -6.285284519195557, "global_step": 91282, "epoch": 2173} {"train_loss": -6.21484375, "global_step": 91283, "epoch": 2173} {"train_loss": -6.2940778732299805, "global_step": 91284, "epoch": 2173} {"train_loss": -6.2657060623168945, "global_step": 91285, "epoch": 2173} {"train_loss": -6.1931023597717285, "global_step": 91286, "epoch": 2173} {"train_loss": -6.189264297485352, "global_step": 91287, "epoch": 2173} {"train_loss": -6.192995548248291, "global_step": 91288, "epoch": 2173} {"train_loss": -6.225594520568848, "global_step": 91289, "epoch": 2173} {"train_loss": -6.335500240325928, "global_step": 91290, "epoch": 2173} {"train_loss": -6.292620658874512, "global_step": 91291, "epoch": 2173} {"train_loss": -6.15780782699585, "global_step": 91292, "epoch": 2173} {"train_loss": -6.247882843017578, "global_step": 91293, "epoch": 2173} {"train_loss": -6.331289768218994, "global_step": 91294, "epoch": 2173} {"train_loss": -6.219242095947266, "global_step": 91295, "epoch": 2173} {"train_loss": -6.203431129455566, "global_step": 91296, "epoch": 2173} {"train_loss": -6.196798801422119, "global_step": 91297, "epoch": 2173} {"train_loss": -6.228415489196777, "global_step": 91298, "epoch": 2173} {"train_loss": -6.2127685546875, "global_step": 91299, "epoch": 2173} {"train_loss": -6.224837303161621, "global_step": 91300, "epoch": 2173} {"train_loss": -6.248594760894775, "global_step": 91301, "epoch": 2173} {"train_loss": -6.1636576652526855, "global_step": 91302, "epoch": 2173} {"train_loss": -6.222587585449219, "global_step": 91303, "epoch": 2173} {"train_loss": -6.241754531860352, "global_step": 91304, "epoch": 2173} {"train_loss": -6.18906831741333, "global_step": 91305, "epoch": 2173} {"train_loss": -6.235452651977539, "global_step": 91306, "epoch": 2173} {"train_loss": -6.232009626570202, "global_step": 91307, "epoch": 2173, "val_loss": 67958.625} {"train_loss": -6.198443412780762, "global_step": 91308, "epoch": 2174} {"train_loss": -6.38687801361084, "global_step": 91309, "epoch": 2174} {"train_loss": -6.303079605102539, "global_step": 91310, "epoch": 2174} {"train_loss": -6.275062561035156, "global_step": 91311, "epoch": 2174} {"train_loss": -6.140139579772949, "global_step": 91312, "epoch": 2174} {"train_loss": -6.306323051452637, "global_step": 91313, "epoch": 2174} {"train_loss": -6.201676368713379, "global_step": 91314, "epoch": 2174} {"train_loss": -6.37623405456543, "global_step": 91315, "epoch": 2174} {"train_loss": -6.257561206817627, "global_step": 91316, "epoch": 2174} {"train_loss": -6.237550735473633, "global_step": 91317, "epoch": 2174} {"train_loss": -6.222324371337891, "global_step": 91318, "epoch": 2174} {"train_loss": -6.295478820800781, "global_step": 91319, "epoch": 2174} {"train_loss": -6.22749662399292, "global_step": 91320, "epoch": 2174} {"train_loss": -6.202927112579346, "global_step": 91321, "epoch": 2174} {"train_loss": -6.1587934494018555, "global_step": 91322, "epoch": 2174} {"train_loss": -6.236255645751953, "global_step": 91323, "epoch": 2174} {"train_loss": -6.097148895263672, "global_step": 91324, "epoch": 2174} {"train_loss": -6.179382801055908, "global_step": 91325, "epoch": 2174} {"train_loss": -6.286149024963379, "global_step": 91326, "epoch": 2174} {"train_loss": -6.171600818634033, "global_step": 91327, "epoch": 2174} {"train_loss": -6.311302185058594, "global_step": 91328, "epoch": 2174} {"train_loss": -6.221325874328613, "global_step": 91329, "epoch": 2174} {"train_loss": -6.174749374389648, "global_step": 91330, "epoch": 2174} {"train_loss": -6.1964616775512695, "global_step": 91331, "epoch": 2174} {"train_loss": -6.221461296081543, "global_step": 91332, "epoch": 2174} {"train_loss": -6.167680740356445, "global_step": 91333, "epoch": 2174} {"train_loss": -6.273228645324707, "global_step": 91334, "epoch": 2174} {"train_loss": -6.345446586608887, "global_step": 91335, "epoch": 2174} {"train_loss": -6.334198474884033, "global_step": 91336, "epoch": 2174} {"train_loss": -6.331745147705078, "global_step": 91337, "epoch": 2174} {"train_loss": -6.264345169067383, "global_step": 91338, "epoch": 2174} {"train_loss": -6.2870049476623535, "global_step": 91339, "epoch": 2174} {"train_loss": -6.2628936767578125, "global_step": 91340, "epoch": 2174} {"train_loss": -6.3052473068237305, "global_step": 91341, "epoch": 2174} {"train_loss": -6.254634380340576, "global_step": 91342, "epoch": 2174} {"train_loss": -6.198026657104492, "global_step": 91343, "epoch": 2174} {"train_loss": -6.31285285949707, "global_step": 91344, "epoch": 2174} {"train_loss": -6.207215785980225, "global_step": 91345, "epoch": 2174} {"train_loss": -6.351365089416504, "global_step": 91346, "epoch": 2174} {"train_loss": -6.239737510681152, "global_step": 91347, "epoch": 2174} {"train_loss": -6.35930061340332, "global_step": 91348, "epoch": 2174} {"train_loss": -6.256495839073544, "global_step": 91349, "epoch": 2174, "val_loss": 67824.328125} {"train_loss": -6.299622535705566, "global_step": 91350, "epoch": 2175} {"train_loss": -6.207064151763916, "global_step": 91351, "epoch": 2175} {"train_loss": -6.16625452041626, "global_step": 91352, "epoch": 2175} {"train_loss": -6.230325222015381, "global_step": 91353, "epoch": 2175} {"train_loss": -6.26838493347168, "global_step": 91354, "epoch": 2175} {"train_loss": -6.373122215270996, "global_step": 91355, "epoch": 2175} {"train_loss": -6.243120193481445, "global_step": 91356, "epoch": 2175} {"train_loss": -6.324736595153809, "global_step": 91357, "epoch": 2175} {"train_loss": -6.3199920654296875, "global_step": 91358, "epoch": 2175} {"train_loss": -6.216026306152344, "global_step": 91359, "epoch": 2175} {"train_loss": -6.265195846557617, "global_step": 91360, "epoch": 2175} {"train_loss": -6.445337295532227, "global_step": 91361, "epoch": 2175} {"train_loss": -6.292237281799316, "global_step": 91362, "epoch": 2175} {"train_loss": -6.226329326629639, "global_step": 91363, "epoch": 2175} {"train_loss": -6.225756645202637, "global_step": 91364, "epoch": 2175} {"train_loss": -6.272607803344727, "global_step": 91365, "epoch": 2175} {"train_loss": -6.249495983123779, "global_step": 91366, "epoch": 2175} {"train_loss": -6.223150253295898, "global_step": 91367, "epoch": 2175} {"train_loss": -6.369354248046875, "global_step": 91368, "epoch": 2175} {"train_loss": -6.26755952835083, "global_step": 91369, "epoch": 2175} {"train_loss": -6.278254508972168, "global_step": 91370, "epoch": 2175} {"train_loss": -6.2967681884765625, "global_step": 91371, "epoch": 2175} {"train_loss": -6.304777145385742, "global_step": 91372, "epoch": 2175} {"train_loss": -6.258871078491211, "global_step": 91373, "epoch": 2175} {"train_loss": -6.247747898101807, "global_step": 91374, "epoch": 2175} {"train_loss": -6.3503313064575195, "global_step": 91375, "epoch": 2175} {"train_loss": -6.270824432373047, "global_step": 91376, "epoch": 2175} {"train_loss": -6.273676872253418, "global_step": 91377, "epoch": 2175} {"train_loss": -6.347039222717285, "global_step": 91378, "epoch": 2175} {"train_loss": -6.305398941040039, "global_step": 91379, "epoch": 2175} {"train_loss": -6.415635108947754, "global_step": 91380, "epoch": 2175} {"train_loss": -6.211027145385742, "global_step": 91381, "epoch": 2175} {"train_loss": -6.180975914001465, "global_step": 91382, "epoch": 2175} {"train_loss": -6.272044658660889, "global_step": 91383, "epoch": 2175} {"train_loss": -6.242937088012695, "global_step": 91384, "epoch": 2175} {"train_loss": -6.17302942276001, "global_step": 91385, "epoch": 2175} {"train_loss": -6.362502574920654, "global_step": 91386, "epoch": 2175} {"train_loss": -6.2939252853393555, "global_step": 91387, "epoch": 2175} {"train_loss": -6.381993293762207, "global_step": 91388, "epoch": 2175} {"train_loss": -6.34368896484375, "global_step": 91389, "epoch": 2175} {"train_loss": -6.2554450035095215, "global_step": 91390, "epoch": 2175} {"train_loss": -6.284614824113392, "global_step": 91391, "epoch": 2175, "val_loss": 67820.8046875} {"train_loss": -6.306514263153076, "global_step": 91392, "epoch": 2176} {"train_loss": -6.2644267082214355, "global_step": 91393, "epoch": 2176} {"train_loss": -6.064576148986816, "global_step": 91394, "epoch": 2176} {"train_loss": -6.2033796310424805, "global_step": 91395, "epoch": 2176} {"train_loss": -6.239075183868408, "global_step": 91396, "epoch": 2176} {"train_loss": -6.2622833251953125, "global_step": 91397, "epoch": 2176} {"train_loss": -6.198554039001465, "global_step": 91398, "epoch": 2176} {"train_loss": -6.273977279663086, "global_step": 91399, "epoch": 2176} {"train_loss": -6.326001167297363, "global_step": 91400, "epoch": 2176} {"train_loss": -6.339159965515137, "global_step": 91401, "epoch": 2176} {"train_loss": -6.202476501464844, "global_step": 91402, "epoch": 2176} {"train_loss": -6.244760036468506, "global_step": 91403, "epoch": 2176} {"train_loss": -6.200953483581543, "global_step": 91404, "epoch": 2176} {"train_loss": -6.221244812011719, "global_step": 91405, "epoch": 2176} {"train_loss": -6.2425947189331055, "global_step": 91406, "epoch": 2176} {"train_loss": -6.185634136199951, "global_step": 91407, "epoch": 2176} {"train_loss": -6.271965980529785, "global_step": 91408, "epoch": 2176} {"train_loss": -6.159524917602539, "global_step": 91409, "epoch": 2176} {"train_loss": -6.187768936157227, "global_step": 91410, "epoch": 2176} {"train_loss": -6.282658100128174, "global_step": 91411, "epoch": 2176} {"train_loss": -6.193077087402344, "global_step": 91412, "epoch": 2176} {"train_loss": -6.225408554077148, "global_step": 91413, "epoch": 2176} {"train_loss": -6.222414970397949, "global_step": 91414, "epoch": 2176} {"train_loss": -6.111024856567383, "global_step": 91415, "epoch": 2176} {"train_loss": -6.282121658325195, "global_step": 91416, "epoch": 2176} {"train_loss": -6.285259246826172, "global_step": 91417, "epoch": 2176} {"train_loss": -6.164618015289307, "global_step": 91418, "epoch": 2176} {"train_loss": -6.263212203979492, "global_step": 91419, "epoch": 2176} {"train_loss": -6.306249141693115, "global_step": 91420, "epoch": 2176} {"train_loss": -6.162535667419434, "global_step": 91421, "epoch": 2176} {"train_loss": -6.310657501220703, "global_step": 91422, "epoch": 2176} {"train_loss": -6.2703447341918945, "global_step": 91423, "epoch": 2176} {"train_loss": -6.2309064865112305, "global_step": 91424, "epoch": 2176} {"train_loss": -6.246261119842529, "global_step": 91425, "epoch": 2176} {"train_loss": -6.057846546173096, "global_step": 91426, "epoch": 2176} {"train_loss": -6.247405052185059, "global_step": 91427, "epoch": 2176} {"train_loss": -6.283594131469727, "global_step": 91428, "epoch": 2176} {"train_loss": -6.127573490142822, "global_step": 91429, "epoch": 2176} {"train_loss": -6.204989433288574, "global_step": 91430, "epoch": 2176} {"train_loss": -6.193498611450195, "global_step": 91431, "epoch": 2176} {"train_loss": -6.158990859985352, "global_step": 91432, "epoch": 2176} {"train_loss": -6.224933794566563, "global_step": 91433, "epoch": 2176, "val_loss": 67808.3671875} {"train_loss": -6.1215925216674805, "global_step": 91434, "epoch": 2177} {"train_loss": -6.215463161468506, "global_step": 91435, "epoch": 2177} {"train_loss": -6.270801544189453, "global_step": 91436, "epoch": 2177} {"train_loss": -6.261476039886475, "global_step": 91437, "epoch": 2177} {"train_loss": -6.328711986541748, "global_step": 91438, "epoch": 2177} {"train_loss": -6.320557117462158, "global_step": 91439, "epoch": 2177} {"train_loss": -6.302583694458008, "global_step": 91440, "epoch": 2177} {"train_loss": -6.178028106689453, "global_step": 91441, "epoch": 2177} {"train_loss": -6.247303009033203, "global_step": 91442, "epoch": 2177} {"train_loss": -6.129112243652344, "global_step": 91443, "epoch": 2177} {"train_loss": -6.277791976928711, "global_step": 91444, "epoch": 2177} {"train_loss": -6.161257266998291, "global_step": 91445, "epoch": 2177} {"train_loss": -6.198611259460449, "global_step": 91446, "epoch": 2177} {"train_loss": -6.321775436401367, "global_step": 91447, "epoch": 2177} {"train_loss": -6.237880706787109, "global_step": 91448, "epoch": 2177} {"train_loss": -6.136879920959473, "global_step": 91449, "epoch": 2177} {"train_loss": -6.297685623168945, "global_step": 91450, "epoch": 2177} {"train_loss": -6.248363494873047, "global_step": 91451, "epoch": 2177} {"train_loss": -6.306669235229492, "global_step": 91452, "epoch": 2177} {"train_loss": -6.21849250793457, "global_step": 91453, "epoch": 2177} {"train_loss": -6.270486831665039, "global_step": 91454, "epoch": 2177} {"train_loss": -6.150575160980225, "global_step": 91455, "epoch": 2177} {"train_loss": -6.191044807434082, "global_step": 91456, "epoch": 2177} {"train_loss": -6.1906256675720215, "global_step": 91457, "epoch": 2177} {"train_loss": -6.008385181427002, "global_step": 91458, "epoch": 2177} {"train_loss": -6.191069602966309, "global_step": 91459, "epoch": 2177} {"train_loss": -6.232522010803223, "global_step": 91460, "epoch": 2177} {"train_loss": -6.283754348754883, "global_step": 91461, "epoch": 2177} {"train_loss": -6.12948751449585, "global_step": 91462, "epoch": 2177} {"train_loss": -6.1295013427734375, "global_step": 91463, "epoch": 2177} {"train_loss": -6.197084426879883, "global_step": 91464, "epoch": 2177} {"train_loss": -5.996502876281738, "global_step": 91465, "epoch": 2177} {"train_loss": -6.198740482330322, "global_step": 91466, "epoch": 2177} {"train_loss": -6.213122844696045, "global_step": 91467, "epoch": 2177} {"train_loss": -6.276797771453857, "global_step": 91468, "epoch": 2177} {"train_loss": -6.277442455291748, "global_step": 91469, "epoch": 2177} {"train_loss": -6.296658039093018, "global_step": 91470, "epoch": 2177} {"train_loss": -6.243967533111572, "global_step": 91471, "epoch": 2177} {"train_loss": -6.220232009887695, "global_step": 91472, "epoch": 2177} {"train_loss": -6.13034725189209, "global_step": 91473, "epoch": 2177} {"train_loss": -6.317379951477051, "global_step": 91474, "epoch": 2177} {"train_loss": -6.2183385235922675, "global_step": 91475, "epoch": 2177, "val_loss": 67793.296875} {"train_loss": -6.324265956878662, "global_step": 91476, "epoch": 2178} {"train_loss": -6.290825843811035, "global_step": 91477, "epoch": 2178} {"train_loss": -6.151910305023193, "global_step": 91478, "epoch": 2178} {"train_loss": -6.283051013946533, "global_step": 91479, "epoch": 2178} {"train_loss": -6.280038356781006, "global_step": 91480, "epoch": 2178} {"train_loss": -6.263210296630859, "global_step": 91481, "epoch": 2178} {"train_loss": -6.326347827911377, "global_step": 91482, "epoch": 2178} {"train_loss": -6.225217819213867, "global_step": 91483, "epoch": 2178} {"train_loss": -6.125675678253174, "global_step": 91484, "epoch": 2178} {"train_loss": -6.341687202453613, "global_step": 91485, "epoch": 2178} {"train_loss": -6.138754844665527, "global_step": 91486, "epoch": 2178} {"train_loss": -6.202816963195801, "global_step": 91487, "epoch": 2178} {"train_loss": -6.200152397155762, "global_step": 91488, "epoch": 2178} {"train_loss": -6.127816677093506, "global_step": 91489, "epoch": 2178} {"train_loss": -6.035944938659668, "global_step": 91490, "epoch": 2178} {"train_loss": -6.125072002410889, "global_step": 91491, "epoch": 2178} {"train_loss": -6.150588035583496, "global_step": 91492, "epoch": 2178} {"train_loss": -6.235570907592773, "global_step": 91493, "epoch": 2178} {"train_loss": -6.1980180740356445, "global_step": 91494, "epoch": 2178} {"train_loss": -6.209978103637695, "global_step": 91495, "epoch": 2178} {"train_loss": -6.265373229980469, "global_step": 91496, "epoch": 2178} {"train_loss": -6.25599479675293, "global_step": 91497, "epoch": 2178} {"train_loss": -6.108375549316406, "global_step": 91498, "epoch": 2178} {"train_loss": -6.243996620178223, "global_step": 91499, "epoch": 2178} {"train_loss": -6.238363265991211, "global_step": 91500, "epoch": 2178} {"train_loss": -6.152751445770264, "global_step": 91501, "epoch": 2178} {"train_loss": -6.189748764038086, "global_step": 91502, "epoch": 2178} {"train_loss": -6.190969944000244, "global_step": 91503, "epoch": 2178} {"train_loss": -6.310196876525879, "global_step": 91504, "epoch": 2178} {"train_loss": -6.208345890045166, "global_step": 91505, "epoch": 2178} {"train_loss": -6.283556938171387, "global_step": 91506, "epoch": 2178} {"train_loss": -6.322297096252441, "global_step": 91507, "epoch": 2178} {"train_loss": -6.246426582336426, "global_step": 91508, "epoch": 2178} {"train_loss": -6.197866439819336, "global_step": 91509, "epoch": 2178} {"train_loss": -6.293449401855469, "global_step": 91510, "epoch": 2178} {"train_loss": -6.215156555175781, "global_step": 91511, "epoch": 2178} {"train_loss": -6.270018577575684, "global_step": 91512, "epoch": 2178} {"train_loss": -6.114773750305176, "global_step": 91513, "epoch": 2178} {"train_loss": -6.166128158569336, "global_step": 91514, "epoch": 2178} {"train_loss": -6.344414710998535, "global_step": 91515, "epoch": 2178} {"train_loss": -6.206336975097656, "global_step": 91516, "epoch": 2178} {"train_loss": -6.222189222063337, "global_step": 91517, "epoch": 2178, "val_loss": 67881.8125} {"train_loss": -6.174524307250977, "global_step": 91518, "epoch": 2179} {"train_loss": -6.191956996917725, "global_step": 91519, "epoch": 2179} {"train_loss": -6.392963886260986, "global_step": 91520, "epoch": 2179} {"train_loss": -6.287928104400635, "global_step": 91521, "epoch": 2179} {"train_loss": -6.325511455535889, "global_step": 91522, "epoch": 2179} {"train_loss": -6.265073776245117, "global_step": 91523, "epoch": 2179} {"train_loss": -6.330930709838867, "global_step": 91524, "epoch": 2179} {"train_loss": -6.173773765563965, "global_step": 91525, "epoch": 2179} {"train_loss": -6.240840911865234, "global_step": 91526, "epoch": 2179} {"train_loss": -6.32740592956543, "global_step": 91527, "epoch": 2179} {"train_loss": -6.142019271850586, "global_step": 91528, "epoch": 2179} {"train_loss": -6.225606918334961, "global_step": 91529, "epoch": 2179} {"train_loss": -6.192967414855957, "global_step": 91530, "epoch": 2179} {"train_loss": -6.279203414916992, "global_step": 91531, "epoch": 2179} {"train_loss": -6.286760330200195, "global_step": 91532, "epoch": 2179} {"train_loss": -6.262336254119873, "global_step": 91533, "epoch": 2179} {"train_loss": -6.099936485290527, "global_step": 91534, "epoch": 2179} {"train_loss": -6.254532814025879, "global_step": 91535, "epoch": 2179} {"train_loss": -6.26485538482666, "global_step": 91536, "epoch": 2179} {"train_loss": -6.212736129760742, "global_step": 91537, "epoch": 2179} {"train_loss": -6.336053848266602, "global_step": 91538, "epoch": 2179} {"train_loss": -6.1663618087768555, "global_step": 91539, "epoch": 2179} {"train_loss": -6.239199638366699, "global_step": 91540, "epoch": 2179} {"train_loss": -6.270003318786621, "global_step": 91541, "epoch": 2179} {"train_loss": -6.38814115524292, "global_step": 91542, "epoch": 2179} {"train_loss": -6.338572025299072, "global_step": 91543, "epoch": 2179} {"train_loss": -6.315268516540527, "global_step": 91544, "epoch": 2179} {"train_loss": -6.159942626953125, "global_step": 91545, "epoch": 2179} {"train_loss": -6.26821231842041, "global_step": 91546, "epoch": 2179} {"train_loss": -6.257709980010986, "global_step": 91547, "epoch": 2179} {"train_loss": -6.2780914306640625, "global_step": 91548, "epoch": 2179} {"train_loss": -6.357212066650391, "global_step": 91549, "epoch": 2179} {"train_loss": -6.274899959564209, "global_step": 91550, "epoch": 2179} {"train_loss": -6.230440616607666, "global_step": 91551, "epoch": 2179} {"train_loss": -6.284060001373291, "global_step": 91552, "epoch": 2179} {"train_loss": -6.278380870819092, "global_step": 91553, "epoch": 2179} {"train_loss": -6.340307235717773, "global_step": 91554, "epoch": 2179} {"train_loss": -6.243579864501953, "global_step": 91555, "epoch": 2179} {"train_loss": -6.277434349060059, "global_step": 91556, "epoch": 2179} {"train_loss": -6.304544448852539, "global_step": 91557, "epoch": 2179} {"train_loss": -6.128199577331543, "global_step": 91558, "epoch": 2179} {"train_loss": -6.262719687961397, "global_step": 91559, "epoch": 2179, "val_loss": 67978.9375} {"train_loss": -6.257729530334473, "global_step": 91560, "epoch": 2180} {"train_loss": -6.260262489318848, "global_step": 91561, "epoch": 2180} {"train_loss": -6.264269828796387, "global_step": 91562, "epoch": 2180} {"train_loss": -6.128320693969727, "global_step": 91563, "epoch": 2180} {"train_loss": -6.145177841186523, "global_step": 91564, "epoch": 2180} {"train_loss": -6.268510818481445, "global_step": 91565, "epoch": 2180} {"train_loss": -6.198977470397949, "global_step": 91566, "epoch": 2180} {"train_loss": -6.152709007263184, "global_step": 91567, "epoch": 2180} {"train_loss": -6.227558135986328, "global_step": 91568, "epoch": 2180} {"train_loss": -6.384614944458008, "global_step": 91569, "epoch": 2180} {"train_loss": -6.247408866882324, "global_step": 91570, "epoch": 2180} {"train_loss": -6.164292335510254, "global_step": 91571, "epoch": 2180} {"train_loss": -6.180330753326416, "global_step": 91572, "epoch": 2180} {"train_loss": -6.330904006958008, "global_step": 91573, "epoch": 2180} {"train_loss": -6.309317588806152, "global_step": 91574, "epoch": 2180} {"train_loss": -6.2254838943481445, "global_step": 91575, "epoch": 2180} {"train_loss": -6.138822555541992, "global_step": 91576, "epoch": 2180} {"train_loss": -6.177332401275635, "global_step": 91577, "epoch": 2180} {"train_loss": -6.261153221130371, "global_step": 91578, "epoch": 2180} {"train_loss": -6.223820686340332, "global_step": 91579, "epoch": 2180} {"train_loss": -6.237216949462891, "global_step": 91580, "epoch": 2180} {"train_loss": -6.317060470581055, "global_step": 91581, "epoch": 2180} {"train_loss": -6.24423885345459, "global_step": 91582, "epoch": 2180} {"train_loss": -6.304218292236328, "global_step": 91583, "epoch": 2180} {"train_loss": -6.232729434967041, "global_step": 91584, "epoch": 2180} {"train_loss": -6.239109992980957, "global_step": 91585, "epoch": 2180} {"train_loss": -6.097825050354004, "global_step": 91586, "epoch": 2180} {"train_loss": -6.314769268035889, "global_step": 91587, "epoch": 2180} {"train_loss": -6.169695854187012, "global_step": 91588, "epoch": 2180} {"train_loss": -6.30873966217041, "global_step": 91589, "epoch": 2180} {"train_loss": -6.316929817199707, "global_step": 91590, "epoch": 2180} {"train_loss": -6.1725053787231445, "global_step": 91591, "epoch": 2180} {"train_loss": -6.3404340744018555, "global_step": 91592, "epoch": 2180} {"train_loss": -6.258998394012451, "global_step": 91593, "epoch": 2180} {"train_loss": -6.3367486000061035, "global_step": 91594, "epoch": 2180} {"train_loss": -6.188189506530762, "global_step": 91595, "epoch": 2180} {"train_loss": -6.115476608276367, "global_step": 91596, "epoch": 2180} {"train_loss": -6.322154998779297, "global_step": 91597, "epoch": 2180} {"train_loss": -6.165067195892334, "global_step": 91598, "epoch": 2180} {"train_loss": -6.289729118347168, "global_step": 91599, "epoch": 2180} {"train_loss": -6.209724426269531, "global_step": 91600, "epoch": 2180} {"train_loss": -6.236791690190633, "global_step": 91601, "epoch": 2180, "val_loss": 68003.3359375} {"train_loss": -6.2816290855407715, "global_step": 91602, "epoch": 2181} {"train_loss": -6.253914833068848, "global_step": 91603, "epoch": 2181} {"train_loss": -6.2248992919921875, "global_step": 91604, "epoch": 2181} {"train_loss": -6.200809478759766, "global_step": 91605, "epoch": 2181} {"train_loss": -6.0610857009887695, "global_step": 91606, "epoch": 2181} {"train_loss": -6.320836067199707, "global_step": 91607, "epoch": 2181} {"train_loss": -6.332577705383301, "global_step": 91608, "epoch": 2181} {"train_loss": -6.263460159301758, "global_step": 91609, "epoch": 2181} {"train_loss": -6.114416122436523, "global_step": 91610, "epoch": 2181} {"train_loss": -6.18901252746582, "global_step": 91611, "epoch": 2181} {"train_loss": -6.2282257080078125, "global_step": 91612, "epoch": 2181} {"train_loss": -6.189382076263428, "global_step": 91613, "epoch": 2181} {"train_loss": -6.180602550506592, "global_step": 91614, "epoch": 2181} {"train_loss": -6.265670299530029, "global_step": 91615, "epoch": 2181} {"train_loss": -6.159846305847168, "global_step": 91616, "epoch": 2181} {"train_loss": -6.349211692810059, "global_step": 91617, "epoch": 2181} {"train_loss": -6.335818767547607, "global_step": 91618, "epoch": 2181} {"train_loss": -6.29034423828125, "global_step": 91619, "epoch": 2181} {"train_loss": -6.209095478057861, "global_step": 91620, "epoch": 2181} {"train_loss": -6.26788854598999, "global_step": 91621, "epoch": 2181} {"train_loss": -6.26338005065918, "global_step": 91622, "epoch": 2181} {"train_loss": -6.290006637573242, "global_step": 91623, "epoch": 2181} {"train_loss": -6.200433731079102, "global_step": 91624, "epoch": 2181} {"train_loss": -6.242763996124268, "global_step": 91625, "epoch": 2181} {"train_loss": -6.30056095123291, "global_step": 91626, "epoch": 2181} {"train_loss": -6.322369575500488, "global_step": 91627, "epoch": 2181} {"train_loss": -6.237250804901123, "global_step": 91628, "epoch": 2181} {"train_loss": -6.282026767730713, "global_step": 91629, "epoch": 2181} {"train_loss": -6.242342948913574, "global_step": 91630, "epoch": 2181} {"train_loss": -6.283154487609863, "global_step": 91631, "epoch": 2181} {"train_loss": -6.288649559020996, "global_step": 91632, "epoch": 2181} {"train_loss": -6.172595024108887, "global_step": 91633, "epoch": 2181} {"train_loss": -6.15053653717041, "global_step": 91634, "epoch": 2181} {"train_loss": -6.298232078552246, "global_step": 91635, "epoch": 2181} {"train_loss": -6.247010231018066, "global_step": 91636, "epoch": 2181} {"train_loss": -6.1851043701171875, "global_step": 91637, "epoch": 2181} {"train_loss": -6.3123650550842285, "global_step": 91638, "epoch": 2181} {"train_loss": -6.170214653015137, "global_step": 91639, "epoch": 2181} {"train_loss": -6.171814918518066, "global_step": 91640, "epoch": 2181} {"train_loss": -6.25482177734375, "global_step": 91641, "epoch": 2181} {"train_loss": -6.203606605529785, "global_step": 91642, "epoch": 2181} {"train_loss": -6.2378811949775335, "global_step": 91643, "epoch": 2181, "val_loss": 67725.734375} {"train_loss": -6.186887264251709, "global_step": 91644, "epoch": 2182} {"train_loss": -6.165083885192871, "global_step": 91645, "epoch": 2182} {"train_loss": -6.217082977294922, "global_step": 91646, "epoch": 2182} {"train_loss": -6.249581813812256, "global_step": 91647, "epoch": 2182} {"train_loss": -6.165404319763184, "global_step": 91648, "epoch": 2182} {"train_loss": -6.190853118896484, "global_step": 91649, "epoch": 2182} {"train_loss": -6.312586307525635, "global_step": 91650, "epoch": 2182} {"train_loss": -6.088297367095947, "global_step": 91651, "epoch": 2182} {"train_loss": -6.053117752075195, "global_step": 91652, "epoch": 2182} {"train_loss": -6.272797107696533, "global_step": 91653, "epoch": 2182} {"train_loss": -6.168355941772461, "global_step": 91654, "epoch": 2182} {"train_loss": -6.269521713256836, "global_step": 91655, "epoch": 2182} {"train_loss": -6.211393356323242, "global_step": 91656, "epoch": 2182} {"train_loss": -6.201448917388916, "global_step": 91657, "epoch": 2182} {"train_loss": -6.385747909545898, "global_step": 91658, "epoch": 2182} {"train_loss": -6.1338653564453125, "global_step": 91659, "epoch": 2182} {"train_loss": -6.166953086853027, "global_step": 91660, "epoch": 2182} {"train_loss": -6.198126792907715, "global_step": 91661, "epoch": 2182} {"train_loss": -6.300101280212402, "global_step": 91662, "epoch": 2182} {"train_loss": -6.220987796783447, "global_step": 91663, "epoch": 2182} {"train_loss": -6.220829010009766, "global_step": 91664, "epoch": 2182} {"train_loss": -6.289349555969238, "global_step": 91665, "epoch": 2182} {"train_loss": -6.233541488647461, "global_step": 91666, "epoch": 2182} {"train_loss": -6.195722579956055, "global_step": 91667, "epoch": 2182} {"train_loss": -6.292764663696289, "global_step": 91668, "epoch": 2182} {"train_loss": -6.156271934509277, "global_step": 91669, "epoch": 2182} {"train_loss": -6.219988822937012, "global_step": 91670, "epoch": 2182} {"train_loss": -6.262923717498779, "global_step": 91671, "epoch": 2182} {"train_loss": -6.249626159667969, "global_step": 91672, "epoch": 2182} {"train_loss": -6.267116069793701, "global_step": 91673, "epoch": 2182} {"train_loss": -6.287990093231201, "global_step": 91674, "epoch": 2182} {"train_loss": -6.177530288696289, "global_step": 91675, "epoch": 2182} {"train_loss": -6.184403419494629, "global_step": 91676, "epoch": 2182} {"train_loss": -6.272512435913086, "global_step": 91677, "epoch": 2182} {"train_loss": -6.3380126953125, "global_step": 91678, "epoch": 2182} {"train_loss": -6.167293548583984, "global_step": 91679, "epoch": 2182} {"train_loss": -6.216638088226318, "global_step": 91680, "epoch": 2182} {"train_loss": -6.200630187988281, "global_step": 91681, "epoch": 2182} {"train_loss": -6.175754070281982, "global_step": 91682, "epoch": 2182} {"train_loss": -6.232396602630615, "global_step": 91683, "epoch": 2182} {"train_loss": -6.362359046936035, "global_step": 91684, "epoch": 2182} {"train_loss": -6.221346355619884, "global_step": 91685, "epoch": 2182, "val_loss": 67989.859375} {"train_loss": -6.077425003051758, "global_step": 91686, "epoch": 2183} {"train_loss": -6.158456802368164, "global_step": 91687, "epoch": 2183} {"train_loss": -6.105886459350586, "global_step": 91688, "epoch": 2183} {"train_loss": -6.3418779373168945, "global_step": 91689, "epoch": 2183} {"train_loss": -6.075495719909668, "global_step": 91690, "epoch": 2183} {"train_loss": -6.253177642822266, "global_step": 91691, "epoch": 2183} {"train_loss": -6.284799098968506, "global_step": 91692, "epoch": 2183} {"train_loss": -6.170428276062012, "global_step": 91693, "epoch": 2183} {"train_loss": -6.2081403732299805, "global_step": 91694, "epoch": 2183} {"train_loss": -6.3034162521362305, "global_step": 91695, "epoch": 2183} {"train_loss": -6.316062927246094, "global_step": 91696, "epoch": 2183} {"train_loss": -6.176384925842285, "global_step": 91697, "epoch": 2183} {"train_loss": -6.237126350402832, "global_step": 91698, "epoch": 2183} {"train_loss": -6.278434753417969, "global_step": 91699, "epoch": 2183} {"train_loss": -6.359930515289307, "global_step": 91700, "epoch": 2183} {"train_loss": -6.153460502624512, "global_step": 91701, "epoch": 2183} {"train_loss": -6.210925102233887, "global_step": 91702, "epoch": 2183} {"train_loss": -6.113279342651367, "global_step": 91703, "epoch": 2183} {"train_loss": -6.254849433898926, "global_step": 91704, "epoch": 2183} {"train_loss": -6.301754951477051, "global_step": 91705, "epoch": 2183} {"train_loss": -6.232419967651367, "global_step": 91706, "epoch": 2183} {"train_loss": -6.353288650512695, "global_step": 91707, "epoch": 2183} {"train_loss": -6.254443168640137, "global_step": 91708, "epoch": 2183} {"train_loss": -6.285137176513672, "global_step": 91709, "epoch": 2183} {"train_loss": -6.279317378997803, "global_step": 91710, "epoch": 2183} {"train_loss": -6.311033725738525, "global_step": 91711, "epoch": 2183} {"train_loss": -6.242369651794434, "global_step": 91712, "epoch": 2183} {"train_loss": -6.277990341186523, "global_step": 91713, "epoch": 2183} {"train_loss": -6.261145114898682, "global_step": 91714, "epoch": 2183} {"train_loss": -6.166138648986816, "global_step": 91715, "epoch": 2183} {"train_loss": -6.265613555908203, "global_step": 91716, "epoch": 2183} {"train_loss": -6.373507022857666, "global_step": 91717, "epoch": 2183} {"train_loss": -6.152818202972412, "global_step": 91718, "epoch": 2183} {"train_loss": -6.323217868804932, "global_step": 91719, "epoch": 2183} {"train_loss": -6.2564697265625, "global_step": 91720, "epoch": 2183} {"train_loss": -6.259913444519043, "global_step": 91721, "epoch": 2183} {"train_loss": -6.137835502624512, "global_step": 91722, "epoch": 2183} {"train_loss": -6.151673316955566, "global_step": 91723, "epoch": 2183} {"train_loss": -6.302531719207764, "global_step": 91724, "epoch": 2183} {"train_loss": -6.245576858520508, "global_step": 91725, "epoch": 2183} {"train_loss": -6.34589147567749, "global_step": 91726, "epoch": 2183} {"train_loss": -6.238813956578572, "global_step": 91727, "epoch": 2183, "val_loss": 67839.2109375} {"train_loss": -6.253485202789307, "global_step": 91728, "epoch": 2184} {"train_loss": -6.331489086151123, "global_step": 91729, "epoch": 2184} {"train_loss": -6.308156967163086, "global_step": 91730, "epoch": 2184} {"train_loss": -6.212846279144287, "global_step": 91731, "epoch": 2184} {"train_loss": -6.128194808959961, "global_step": 91732, "epoch": 2184} {"train_loss": -6.079051971435547, "global_step": 91733, "epoch": 2184} {"train_loss": -6.25887393951416, "global_step": 91734, "epoch": 2184} {"train_loss": -6.243579864501953, "global_step": 91735, "epoch": 2184} {"train_loss": -6.0439934730529785, "global_step": 91736, "epoch": 2184} {"train_loss": -6.294361591339111, "global_step": 91737, "epoch": 2184} {"train_loss": -6.176602840423584, "global_step": 91738, "epoch": 2184} {"train_loss": -6.138016700744629, "global_step": 91739, "epoch": 2184} {"train_loss": -6.152327537536621, "global_step": 91740, "epoch": 2184} {"train_loss": -6.188626289367676, "global_step": 91741, "epoch": 2184} {"train_loss": -6.204466342926025, "global_step": 91742, "epoch": 2184} {"train_loss": -6.008187770843506, "global_step": 91743, "epoch": 2184} {"train_loss": -6.256569862365723, "global_step": 91744, "epoch": 2184} {"train_loss": -6.186216831207275, "global_step": 91745, "epoch": 2184} {"train_loss": -6.338040828704834, "global_step": 91746, "epoch": 2184} {"train_loss": -6.118219375610352, "global_step": 91747, "epoch": 2184} {"train_loss": -6.332056045532227, "global_step": 91748, "epoch": 2184} {"train_loss": -6.193829536437988, "global_step": 91749, "epoch": 2184} {"train_loss": -6.211061477661133, "global_step": 91750, "epoch": 2184} {"train_loss": -6.203388214111328, "global_step": 91751, "epoch": 2184} {"train_loss": -6.137446880340576, "global_step": 91752, "epoch": 2184} {"train_loss": -6.22127628326416, "global_step": 91753, "epoch": 2184} {"train_loss": -6.280591011047363, "global_step": 91754, "epoch": 2184} {"train_loss": -6.291345596313477, "global_step": 91755, "epoch": 2184} {"train_loss": -6.390360355377197, "global_step": 91756, "epoch": 2184} {"train_loss": -6.153685569763184, "global_step": 91757, "epoch": 2184} {"train_loss": -6.284699440002441, "global_step": 91758, "epoch": 2184} {"train_loss": -6.244036674499512, "global_step": 91759, "epoch": 2184} {"train_loss": -6.238417625427246, "global_step": 91760, "epoch": 2184} {"train_loss": -6.268495559692383, "global_step": 91761, "epoch": 2184} {"train_loss": -6.235973358154297, "global_step": 91762, "epoch": 2184} {"train_loss": -6.180553436279297, "global_step": 91763, "epoch": 2184} {"train_loss": -6.356414794921875, "global_step": 91764, "epoch": 2184} {"train_loss": -6.288591384887695, "global_step": 91765, "epoch": 2184} {"train_loss": -6.187033653259277, "global_step": 91766, "epoch": 2184} {"train_loss": -6.194541931152344, "global_step": 91767, "epoch": 2184} {"train_loss": -6.305947303771973, "global_step": 91768, "epoch": 2184} {"train_loss": -6.224837916237967, "global_step": 91769, "epoch": 2184, "val_loss": 67959.328125} {"train_loss": -6.258175849914551, "global_step": 91770, "epoch": 2185} {"train_loss": -6.238533020019531, "global_step": 91771, "epoch": 2185} {"train_loss": -6.236486434936523, "global_step": 91772, "epoch": 2185} {"train_loss": -6.338336944580078, "global_step": 91773, "epoch": 2185} {"train_loss": -6.231837272644043, "global_step": 91774, "epoch": 2185} {"train_loss": -6.221843242645264, "global_step": 91775, "epoch": 2185} {"train_loss": -6.24217414855957, "global_step": 91776, "epoch": 2185} {"train_loss": -6.2928619384765625, "global_step": 91777, "epoch": 2185} {"train_loss": -6.191727638244629, "global_step": 91778, "epoch": 2185} {"train_loss": -6.156301498413086, "global_step": 91779, "epoch": 2185} {"train_loss": -6.199639797210693, "global_step": 91780, "epoch": 2185} {"train_loss": -6.2678542137146, "global_step": 91781, "epoch": 2185} {"train_loss": -6.255756378173828, "global_step": 91782, "epoch": 2185} {"train_loss": -6.158267021179199, "global_step": 91783, "epoch": 2185} {"train_loss": -6.29578971862793, "global_step": 91784, "epoch": 2185} {"train_loss": -6.213003158569336, "global_step": 91785, "epoch": 2185} {"train_loss": -6.233067512512207, "global_step": 91786, "epoch": 2185} {"train_loss": -6.261598587036133, "global_step": 91787, "epoch": 2185} {"train_loss": -6.266859531402588, "global_step": 91788, "epoch": 2185} {"train_loss": -6.342765808105469, "global_step": 91789, "epoch": 2185} {"train_loss": -6.166480541229248, "global_step": 91790, "epoch": 2185} {"train_loss": -6.16411018371582, "global_step": 91791, "epoch": 2185} {"train_loss": -6.213921546936035, "global_step": 91792, "epoch": 2185} {"train_loss": -6.198592185974121, "global_step": 91793, "epoch": 2185} {"train_loss": -6.187906265258789, "global_step": 91794, "epoch": 2185} {"train_loss": -6.182841777801514, "global_step": 91795, "epoch": 2185} {"train_loss": -6.256713390350342, "global_step": 91796, "epoch": 2185} {"train_loss": -6.24042272567749, "global_step": 91797, "epoch": 2185} {"train_loss": -6.1974687576293945, "global_step": 91798, "epoch": 2185} {"train_loss": -6.108430862426758, "global_step": 91799, "epoch": 2185} {"train_loss": -6.198666572570801, "global_step": 91800, "epoch": 2185} {"train_loss": -6.261042594909668, "global_step": 91801, "epoch": 2185} {"train_loss": -6.265472412109375, "global_step": 91802, "epoch": 2185} {"train_loss": -6.241044998168945, "global_step": 91803, "epoch": 2185} {"train_loss": -6.262080192565918, "global_step": 91804, "epoch": 2185} {"train_loss": -6.275997638702393, "global_step": 91805, "epoch": 2185} {"train_loss": -6.243472099304199, "global_step": 91806, "epoch": 2185} {"train_loss": -6.225724220275879, "global_step": 91807, "epoch": 2185} {"train_loss": -6.279906749725342, "global_step": 91808, "epoch": 2185} {"train_loss": -6.225335121154785, "global_step": 91809, "epoch": 2185} {"train_loss": -6.2362141609191895, "global_step": 91810, "epoch": 2185} {"train_loss": -6.230945484978812, "global_step": 91811, "epoch": 2185, "val_loss": 67777.3359375} {"train_loss": -6.2027482986450195, "global_step": 91812, "epoch": 2186} {"train_loss": -6.2006378173828125, "global_step": 91813, "epoch": 2186} {"train_loss": -6.282087326049805, "global_step": 91814, "epoch": 2186} {"train_loss": -6.293610572814941, "global_step": 91815, "epoch": 2186} {"train_loss": -6.318459510803223, "global_step": 91816, "epoch": 2186} {"train_loss": -6.334047317504883, "global_step": 91817, "epoch": 2186} {"train_loss": -6.228117942810059, "global_step": 91818, "epoch": 2186} {"train_loss": -6.188136100769043, "global_step": 91819, "epoch": 2186} {"train_loss": -6.28892707824707, "global_step": 91820, "epoch": 2186} {"train_loss": -6.303695201873779, "global_step": 91821, "epoch": 2186} {"train_loss": -6.308157444000244, "global_step": 91822, "epoch": 2186} {"train_loss": -6.320958614349365, "global_step": 91823, "epoch": 2186} {"train_loss": -6.2378010749816895, "global_step": 91824, "epoch": 2186} {"train_loss": -6.262627601623535, "global_step": 91825, "epoch": 2186} {"train_loss": -6.370034217834473, "global_step": 91826, "epoch": 2186} {"train_loss": -6.31888484954834, "global_step": 91827, "epoch": 2186} {"train_loss": -6.28984260559082, "global_step": 91828, "epoch": 2186} {"train_loss": -6.153958320617676, "global_step": 91829, "epoch": 2186} {"train_loss": -6.202797889709473, "global_step": 91830, "epoch": 2186} {"train_loss": -6.278105735778809, "global_step": 91831, "epoch": 2186} {"train_loss": -6.1303629875183105, "global_step": 91832, "epoch": 2186} {"train_loss": -6.187732696533203, "global_step": 91833, "epoch": 2186} {"train_loss": -6.222578525543213, "global_step": 91834, "epoch": 2186} {"train_loss": -6.274864196777344, "global_step": 91835, "epoch": 2186} {"train_loss": -6.230991363525391, "global_step": 91836, "epoch": 2186} {"train_loss": -6.329918384552002, "global_step": 91837, "epoch": 2186} {"train_loss": -6.237412452697754, "global_step": 91838, "epoch": 2186} {"train_loss": -6.257067680358887, "global_step": 91839, "epoch": 2186} {"train_loss": -6.344200134277344, "global_step": 91840, "epoch": 2186} {"train_loss": -6.330584526062012, "global_step": 91841, "epoch": 2186} {"train_loss": -6.280073165893555, "global_step": 91842, "epoch": 2186} {"train_loss": -6.286682605743408, "global_step": 91843, "epoch": 2186} {"train_loss": -6.297270774841309, "global_step": 91844, "epoch": 2186} {"train_loss": -6.290671348571777, "global_step": 91845, "epoch": 2186} {"train_loss": -6.14401388168335, "global_step": 91846, "epoch": 2186} {"train_loss": -6.3268914222717285, "global_step": 91847, "epoch": 2186} {"train_loss": -6.153505325317383, "global_step": 91848, "epoch": 2186} {"train_loss": -6.264595031738281, "global_step": 91849, "epoch": 2186} {"train_loss": -6.287812232971191, "global_step": 91850, "epoch": 2186} {"train_loss": -6.230569362640381, "global_step": 91851, "epoch": 2186} {"train_loss": -6.189089298248291, "global_step": 91852, "epoch": 2186} {"train_loss": -6.261605240049816, "global_step": 91853, "epoch": 2186, "val_loss": 67683.4921875} {"train_loss": -6.272974491119385, "global_step": 91854, "epoch": 2187} {"train_loss": -6.353909015655518, "global_step": 91855, "epoch": 2187} {"train_loss": -6.398105144500732, "global_step": 91856, "epoch": 2187} {"train_loss": -6.300488471984863, "global_step": 91857, "epoch": 2187} {"train_loss": -6.142431259155273, "global_step": 91858, "epoch": 2187} {"train_loss": -6.33758544921875, "global_step": 91859, "epoch": 2187} {"train_loss": -6.313968658447266, "global_step": 91860, "epoch": 2187} {"train_loss": -6.171486854553223, "global_step": 91861, "epoch": 2187} {"train_loss": -6.281030654907227, "global_step": 91862, "epoch": 2187} {"train_loss": -6.271616458892822, "global_step": 91863, "epoch": 2187} {"train_loss": -6.249779224395752, "global_step": 91864, "epoch": 2187} {"train_loss": -6.068414688110352, "global_step": 91865, "epoch": 2187} {"train_loss": -6.2475128173828125, "global_step": 91866, "epoch": 2187} {"train_loss": -6.328517913818359, "global_step": 91867, "epoch": 2187} {"train_loss": -6.20960807800293, "global_step": 91868, "epoch": 2187} {"train_loss": -6.19391393661499, "global_step": 91869, "epoch": 2187} {"train_loss": -6.279997825622559, "global_step": 91870, "epoch": 2187} {"train_loss": -6.252379894256592, "global_step": 91871, "epoch": 2187} {"train_loss": -6.130110740661621, "global_step": 91872, "epoch": 2187} {"train_loss": -6.189365386962891, "global_step": 91873, "epoch": 2187} {"train_loss": -6.280227184295654, "global_step": 91874, "epoch": 2187} {"train_loss": -6.285341739654541, "global_step": 91875, "epoch": 2187} {"train_loss": -6.296849250793457, "global_step": 91876, "epoch": 2187} {"train_loss": -6.220850467681885, "global_step": 91877, "epoch": 2187} {"train_loss": -6.238491058349609, "global_step": 91878, "epoch": 2187} {"train_loss": -6.170919418334961, "global_step": 91879, "epoch": 2187} {"train_loss": -6.174285888671875, "global_step": 91880, "epoch": 2187} {"train_loss": -6.215297222137451, "global_step": 91881, "epoch": 2187} {"train_loss": -6.3578081130981445, "global_step": 91882, "epoch": 2187} {"train_loss": -6.323038578033447, "global_step": 91883, "epoch": 2187} {"train_loss": -6.233792781829834, "global_step": 91884, "epoch": 2187} {"train_loss": -6.3064422607421875, "global_step": 91885, "epoch": 2187} {"train_loss": -6.272931098937988, "global_step": 91886, "epoch": 2187} {"train_loss": -6.2271552085876465, "global_step": 91887, "epoch": 2187} {"train_loss": -6.388903617858887, "global_step": 91888, "epoch": 2187} {"train_loss": -6.229619979858398, "global_step": 91889, "epoch": 2187} {"train_loss": -6.171085357666016, "global_step": 91890, "epoch": 2187} {"train_loss": -6.18306827545166, "global_step": 91891, "epoch": 2187} {"train_loss": -6.114091873168945, "global_step": 91892, "epoch": 2187} {"train_loss": -6.208898544311523, "global_step": 91893, "epoch": 2187} {"train_loss": -6.162435531616211, "global_step": 91894, "epoch": 2187} {"train_loss": -6.24060861269633, "global_step": 91895, "epoch": 2187, "val_loss": 68114.2578125} {"train_loss": -6.185651779174805, "global_step": 91896, "epoch": 2188} {"train_loss": -6.3304572105407715, "global_step": 91897, "epoch": 2188} {"train_loss": -6.199825286865234, "global_step": 91898, "epoch": 2188} {"train_loss": -6.248718738555908, "global_step": 91899, "epoch": 2188} {"train_loss": -6.289933204650879, "global_step": 91900, "epoch": 2188} {"train_loss": -6.273374557495117, "global_step": 91901, "epoch": 2188} {"train_loss": -6.240930557250977, "global_step": 91902, "epoch": 2188} {"train_loss": -6.313143730163574, "global_step": 91903, "epoch": 2188} {"train_loss": -6.2730231285095215, "global_step": 91904, "epoch": 2188} {"train_loss": -6.235593795776367, "global_step": 91905, "epoch": 2188} {"train_loss": -6.146892547607422, "global_step": 91906, "epoch": 2188} {"train_loss": -6.282927989959717, "global_step": 91907, "epoch": 2188} {"train_loss": -6.202448844909668, "global_step": 91908, "epoch": 2188} {"train_loss": -6.197787761688232, "global_step": 91909, "epoch": 2188} {"train_loss": -6.182046413421631, "global_step": 91910, "epoch": 2188} {"train_loss": -6.184074401855469, "global_step": 91911, "epoch": 2188} {"train_loss": -6.1958723068237305, "global_step": 91912, "epoch": 2188} {"train_loss": -6.209212303161621, "global_step": 91913, "epoch": 2188} {"train_loss": -6.208577632904053, "global_step": 91914, "epoch": 2188} {"train_loss": -6.228143215179443, "global_step": 91915, "epoch": 2188} {"train_loss": -6.187937259674072, "global_step": 91916, "epoch": 2188} {"train_loss": -6.288512229919434, "global_step": 91917, "epoch": 2188} {"train_loss": -6.246753692626953, "global_step": 91918, "epoch": 2188} {"train_loss": -6.1744585037231445, "global_step": 91919, "epoch": 2188} {"train_loss": -6.184388160705566, "global_step": 91920, "epoch": 2188} {"train_loss": -6.141261100769043, "global_step": 91921, "epoch": 2188} {"train_loss": -6.080446720123291, "global_step": 91922, "epoch": 2188} {"train_loss": -6.272472381591797, "global_step": 91923, "epoch": 2188} {"train_loss": -6.235259056091309, "global_step": 91924, "epoch": 2188} {"train_loss": -6.252594947814941, "global_step": 91925, "epoch": 2188} {"train_loss": -6.195504188537598, "global_step": 91926, "epoch": 2188} {"train_loss": -6.253994464874268, "global_step": 91927, "epoch": 2188} {"train_loss": -6.280536651611328, "global_step": 91928, "epoch": 2188} {"train_loss": -6.199274063110352, "global_step": 91929, "epoch": 2188} {"train_loss": -6.240460395812988, "global_step": 91930, "epoch": 2188} {"train_loss": -6.276240348815918, "global_step": 91931, "epoch": 2188} {"train_loss": -6.225998878479004, "global_step": 91932, "epoch": 2188} {"train_loss": -6.275134086608887, "global_step": 91933, "epoch": 2188} {"train_loss": -6.259953498840332, "global_step": 91934, "epoch": 2188} {"train_loss": -6.2087836265563965, "global_step": 91935, "epoch": 2188} {"train_loss": -6.302727699279785, "global_step": 91936, "epoch": 2188} {"train_loss": -6.230270226796468, "global_step": 91937, "epoch": 2188, "val_loss": 67881.484375} {"train_loss": -6.304358959197998, "global_step": 91938, "epoch": 2189} {"train_loss": -6.366496562957764, "global_step": 91939, "epoch": 2189} {"train_loss": -6.239372253417969, "global_step": 91940, "epoch": 2189} {"train_loss": -6.289355278015137, "global_step": 91941, "epoch": 2189} {"train_loss": -6.188657760620117, "global_step": 91942, "epoch": 2189} {"train_loss": -6.256278038024902, "global_step": 91943, "epoch": 2189} {"train_loss": -6.255936622619629, "global_step": 91944, "epoch": 2189} {"train_loss": -6.368775367736816, "global_step": 91945, "epoch": 2189} {"train_loss": -6.215071678161621, "global_step": 91946, "epoch": 2189} {"train_loss": -6.336207866668701, "global_step": 91947, "epoch": 2189} {"train_loss": -6.261929512023926, "global_step": 91948, "epoch": 2189} {"train_loss": -6.220477104187012, "global_step": 91949, "epoch": 2189} {"train_loss": -6.24043083190918, "global_step": 91950, "epoch": 2189} {"train_loss": -6.368776798248291, "global_step": 91951, "epoch": 2189} {"train_loss": -6.2613091468811035, "global_step": 91952, "epoch": 2189} {"train_loss": -6.331391334533691, "global_step": 91953, "epoch": 2189} {"train_loss": -6.379993438720703, "global_step": 91954, "epoch": 2189} {"train_loss": -6.335921287536621, "global_step": 91955, "epoch": 2189} {"train_loss": -6.314275741577148, "global_step": 91956, "epoch": 2189} {"train_loss": -6.362010955810547, "global_step": 91957, "epoch": 2189} {"train_loss": -6.286296844482422, "global_step": 91958, "epoch": 2189} {"train_loss": -6.272636890411377, "global_step": 91959, "epoch": 2189} {"train_loss": -6.313307762145996, "global_step": 91960, "epoch": 2189} {"train_loss": -6.302513599395752, "global_step": 91961, "epoch": 2189} {"train_loss": -6.130655288696289, "global_step": 91962, "epoch": 2189} {"train_loss": -6.19035530090332, "global_step": 91963, "epoch": 2189} {"train_loss": -6.240930557250977, "global_step": 91964, "epoch": 2189} {"train_loss": -6.286478042602539, "global_step": 91965, "epoch": 2189} {"train_loss": -6.303637504577637, "global_step": 91966, "epoch": 2189} {"train_loss": -6.197658538818359, "global_step": 91967, "epoch": 2189} {"train_loss": -6.130319595336914, "global_step": 91968, "epoch": 2189} {"train_loss": -6.307946681976318, "global_step": 91969, "epoch": 2189} {"train_loss": -6.196697235107422, "global_step": 91970, "epoch": 2189} {"train_loss": -6.2007246017456055, "global_step": 91971, "epoch": 2189} {"train_loss": -6.284284591674805, "global_step": 91972, "epoch": 2189} {"train_loss": -6.250686168670654, "global_step": 91973, "epoch": 2189} {"train_loss": -6.275750160217285, "global_step": 91974, "epoch": 2189} {"train_loss": -6.30672025680542, "global_step": 91975, "epoch": 2189} {"train_loss": -6.205852508544922, "global_step": 91976, "epoch": 2189} {"train_loss": -6.235706329345703, "global_step": 91977, "epoch": 2189} {"train_loss": -6.151365756988525, "global_step": 91978, "epoch": 2189} {"train_loss": -6.268956252506801, "global_step": 91979, "epoch": 2189, "val_loss": 68078.6484375} {"train_loss": -6.126286506652832, "global_step": 91980, "epoch": 2190} {"train_loss": -6.338324069976807, "global_step": 91981, "epoch": 2190} {"train_loss": -6.161067485809326, "global_step": 91982, "epoch": 2190} {"train_loss": -6.170216083526611, "global_step": 91983, "epoch": 2190} {"train_loss": -6.145801067352295, "global_step": 91984, "epoch": 2190} {"train_loss": -6.097084999084473, "global_step": 91985, "epoch": 2190} {"train_loss": -6.193376064300537, "global_step": 91986, "epoch": 2190} {"train_loss": -6.10646915435791, "global_step": 91987, "epoch": 2190} {"train_loss": -6.164510250091553, "global_step": 91988, "epoch": 2190} {"train_loss": -6.308192253112793, "global_step": 91989, "epoch": 2190} {"train_loss": -6.131406784057617, "global_step": 91990, "epoch": 2190} {"train_loss": -6.17822265625, "global_step": 91991, "epoch": 2190} {"train_loss": -6.128978729248047, "global_step": 91992, "epoch": 2190} {"train_loss": -6.24055814743042, "global_step": 91993, "epoch": 2190} {"train_loss": -6.125967025756836, "global_step": 91994, "epoch": 2190} {"train_loss": -6.2653350830078125, "global_step": 91995, "epoch": 2190} {"train_loss": -6.230614185333252, "global_step": 91996, "epoch": 2190} {"train_loss": -6.288409233093262, "global_step": 91997, "epoch": 2190} {"train_loss": -6.28153133392334, "global_step": 91998, "epoch": 2190} {"train_loss": -6.190878391265869, "global_step": 91999, "epoch": 2190} {"train_loss": -6.188271999359131, "global_step": 92000, "epoch": 2190} {"train_loss": -6.318490028381348, "global_step": 92001, "epoch": 2190} {"train_loss": -6.380677223205566, "global_step": 92002, "epoch": 2190} {"train_loss": -6.282397747039795, "global_step": 92003, "epoch": 2190} {"train_loss": -6.288127899169922, "global_step": 92004, "epoch": 2190} {"train_loss": -6.1726884841918945, "global_step": 92005, "epoch": 2190} {"train_loss": -6.274489402770996, "global_step": 92006, "epoch": 2190} {"train_loss": -6.23692512512207, "global_step": 92007, "epoch": 2190} {"train_loss": -6.275969982147217, "global_step": 92008, "epoch": 2190} {"train_loss": -6.309024333953857, "global_step": 92009, "epoch": 2190} {"train_loss": -6.309529781341553, "global_step": 92010, "epoch": 2190} {"train_loss": -6.2446064949035645, "global_step": 92011, "epoch": 2190} {"train_loss": -6.306694030761719, "global_step": 92012, "epoch": 2190} {"train_loss": -6.328508377075195, "global_step": 92013, "epoch": 2190} {"train_loss": -6.286839485168457, "global_step": 92014, "epoch": 2190} {"train_loss": -6.17612361907959, "global_step": 92015, "epoch": 2190} {"train_loss": -6.327580451965332, "global_step": 92016, "epoch": 2190} {"train_loss": -6.264357566833496, "global_step": 92017, "epoch": 2190} {"train_loss": -6.142653465270996, "global_step": 92018, "epoch": 2190} {"train_loss": -6.253993988037109, "global_step": 92019, "epoch": 2190} {"train_loss": -6.2971954345703125, "global_step": 92020, "epoch": 2190} {"train_loss": -6.230240708305722, "global_step": 92021, "epoch": 2190, "val_loss": 67792.65625} {"train_loss": -6.381941795349121, "global_step": 92022, "epoch": 2191} {"train_loss": -6.247527122497559, "global_step": 92023, "epoch": 2191} {"train_loss": -6.306262016296387, "global_step": 92024, "epoch": 2191} {"train_loss": -6.1453633308410645, "global_step": 92025, "epoch": 2191} {"train_loss": -6.252423286437988, "global_step": 92026, "epoch": 2191} {"train_loss": -6.258109092712402, "global_step": 92027, "epoch": 2191} {"train_loss": -6.249436378479004, "global_step": 92028, "epoch": 2191} {"train_loss": -6.144519805908203, "global_step": 92029, "epoch": 2191} {"train_loss": -6.302681922912598, "global_step": 92030, "epoch": 2191} {"train_loss": -6.2890424728393555, "global_step": 92031, "epoch": 2191} {"train_loss": -6.284085273742676, "global_step": 92032, "epoch": 2191} {"train_loss": -6.253034591674805, "global_step": 92033, "epoch": 2191} {"train_loss": -6.119228363037109, "global_step": 92034, "epoch": 2191} {"train_loss": -6.168705940246582, "global_step": 92035, "epoch": 2191} {"train_loss": -6.246530532836914, "global_step": 92036, "epoch": 2191} {"train_loss": -6.22591495513916, "global_step": 92037, "epoch": 2191} {"train_loss": -6.182509422302246, "global_step": 92038, "epoch": 2191} {"train_loss": -6.192590713500977, "global_step": 92039, "epoch": 2191} {"train_loss": -6.158519744873047, "global_step": 92040, "epoch": 2191} {"train_loss": -6.213407516479492, "global_step": 92041, "epoch": 2191} {"train_loss": -6.357819557189941, "global_step": 92042, "epoch": 2191} {"train_loss": -6.242715835571289, "global_step": 92043, "epoch": 2191} {"train_loss": -6.238196849822998, "global_step": 92044, "epoch": 2191} {"train_loss": -6.129023551940918, "global_step": 92045, "epoch": 2191} {"train_loss": -6.180606365203857, "global_step": 92046, "epoch": 2191} {"train_loss": -6.207901954650879, "global_step": 92047, "epoch": 2191} {"train_loss": -6.191030025482178, "global_step": 92048, "epoch": 2191} {"train_loss": -6.271541595458984, "global_step": 92049, "epoch": 2191} {"train_loss": -6.198333263397217, "global_step": 92050, "epoch": 2191} {"train_loss": -6.1707658767700195, "global_step": 92051, "epoch": 2191} {"train_loss": -6.316545486450195, "global_step": 92052, "epoch": 2191} {"train_loss": -6.167390823364258, "global_step": 92053, "epoch": 2191} {"train_loss": -6.184542179107666, "global_step": 92054, "epoch": 2191} {"train_loss": -6.238733291625977, "global_step": 92055, "epoch": 2191} {"train_loss": -6.312414169311523, "global_step": 92056, "epoch": 2191} {"train_loss": -6.2081146240234375, "global_step": 92057, "epoch": 2191} {"train_loss": -6.265904903411865, "global_step": 92058, "epoch": 2191} {"train_loss": -6.296224117279053, "global_step": 92059, "epoch": 2191} {"train_loss": -6.2240190505981445, "global_step": 92060, "epoch": 2191} {"train_loss": -6.169747829437256, "global_step": 92061, "epoch": 2191} {"train_loss": -6.188292503356934, "global_step": 92062, "epoch": 2191} {"train_loss": -6.231137775239491, "global_step": 92063, "epoch": 2191, "val_loss": 67888.3359375} {"train_loss": -6.28846549987793, "global_step": 92064, "epoch": 2192} {"train_loss": -6.24751091003418, "global_step": 92065, "epoch": 2192} {"train_loss": -6.321155071258545, "global_step": 92066, "epoch": 2192} {"train_loss": -6.32304573059082, "global_step": 92067, "epoch": 2192} {"train_loss": -6.295971870422363, "global_step": 92068, "epoch": 2192} {"train_loss": -6.278909683227539, "global_step": 92069, "epoch": 2192} {"train_loss": -6.216987609863281, "global_step": 92070, "epoch": 2192} {"train_loss": -6.23628044128418, "global_step": 92071, "epoch": 2192} {"train_loss": -6.345434665679932, "global_step": 92072, "epoch": 2192} {"train_loss": -6.4240403175354, "global_step": 92073, "epoch": 2192} {"train_loss": -6.246085166931152, "global_step": 92074, "epoch": 2192} {"train_loss": -6.358315467834473, "global_step": 92075, "epoch": 2192} {"train_loss": -6.199911594390869, "global_step": 92076, "epoch": 2192} {"train_loss": -6.322637557983398, "global_step": 92077, "epoch": 2192} {"train_loss": -6.39068078994751, "global_step": 92078, "epoch": 2192} {"train_loss": -6.294600486755371, "global_step": 92079, "epoch": 2192} {"train_loss": -6.302906036376953, "global_step": 92080, "epoch": 2192} {"train_loss": -6.400989055633545, "global_step": 92081, "epoch": 2192} {"train_loss": -6.245372295379639, "global_step": 92082, "epoch": 2192} {"train_loss": -6.186513423919678, "global_step": 92083, "epoch": 2192} {"train_loss": -6.24446964263916, "global_step": 92084, "epoch": 2192} {"train_loss": -6.217361927032471, "global_step": 92085, "epoch": 2192} {"train_loss": -6.135949611663818, "global_step": 92086, "epoch": 2192} {"train_loss": -6.32961368560791, "global_step": 92087, "epoch": 2192} {"train_loss": -6.317676544189453, "global_step": 92088, "epoch": 2192} {"train_loss": -6.252471923828125, "global_step": 92089, "epoch": 2192} {"train_loss": -6.2381696701049805, "global_step": 92090, "epoch": 2192} {"train_loss": -6.279751300811768, "global_step": 92091, "epoch": 2192} {"train_loss": -6.234830856323242, "global_step": 92092, "epoch": 2192} {"train_loss": -6.280900001525879, "global_step": 92093, "epoch": 2192} {"train_loss": -6.265636920928955, "global_step": 92094, "epoch": 2192} {"train_loss": -6.299694061279297, "global_step": 92095, "epoch": 2192} {"train_loss": -6.2286601066589355, "global_step": 92096, "epoch": 2192} {"train_loss": -6.214663505554199, "global_step": 92097, "epoch": 2192} {"train_loss": -6.185227394104004, "global_step": 92098, "epoch": 2192} {"train_loss": -6.190789699554443, "global_step": 92099, "epoch": 2192} {"train_loss": -6.168862342834473, "global_step": 92100, "epoch": 2192} {"train_loss": -6.143683910369873, "global_step": 92101, "epoch": 2192} {"train_loss": -6.319182395935059, "global_step": 92102, "epoch": 2192} {"train_loss": -6.301516532897949, "global_step": 92103, "epoch": 2192} {"train_loss": -6.2145609855651855, "global_step": 92104, "epoch": 2192} {"train_loss": -6.268152395884196, "global_step": 92105, "epoch": 2192, "val_loss": 67997.7578125} {"train_loss": -6.2692084312438965, "global_step": 92106, "epoch": 2193} {"train_loss": -6.205764293670654, "global_step": 92107, "epoch": 2193} {"train_loss": -6.372209548950195, "global_step": 92108, "epoch": 2193} {"train_loss": -6.291675567626953, "global_step": 92109, "epoch": 2193} {"train_loss": -6.32823371887207, "global_step": 92110, "epoch": 2193} {"train_loss": -6.129447937011719, "global_step": 92111, "epoch": 2193} {"train_loss": -6.319813251495361, "global_step": 92112, "epoch": 2193} {"train_loss": -6.304473876953125, "global_step": 92113, "epoch": 2193} {"train_loss": -6.323873519897461, "global_step": 92114, "epoch": 2193} {"train_loss": -6.279831886291504, "global_step": 92115, "epoch": 2193} {"train_loss": -6.297092437744141, "global_step": 92116, "epoch": 2193} {"train_loss": -6.259952068328857, "global_step": 92117, "epoch": 2193} {"train_loss": -6.317729473114014, "global_step": 92118, "epoch": 2193} {"train_loss": -6.328181743621826, "global_step": 92119, "epoch": 2193} {"train_loss": -6.298532009124756, "global_step": 92120, "epoch": 2193} {"train_loss": -6.347862243652344, "global_step": 92121, "epoch": 2193} {"train_loss": -6.257141590118408, "global_step": 92122, "epoch": 2193} {"train_loss": -6.233312606811523, "global_step": 92123, "epoch": 2193} {"train_loss": -6.346378326416016, "global_step": 92124, "epoch": 2193} {"train_loss": -6.305163383483887, "global_step": 92125, "epoch": 2193} {"train_loss": -6.3909735679626465, "global_step": 92126, "epoch": 2193} {"train_loss": -6.290256500244141, "global_step": 92127, "epoch": 2193} {"train_loss": -6.418216705322266, "global_step": 92128, "epoch": 2193} {"train_loss": -6.188309669494629, "global_step": 92129, "epoch": 2193} {"train_loss": -6.260906219482422, "global_step": 92130, "epoch": 2193} {"train_loss": -6.384763717651367, "global_step": 92131, "epoch": 2193} {"train_loss": -6.213836193084717, "global_step": 92132, "epoch": 2193} {"train_loss": -6.273069858551025, "global_step": 92133, "epoch": 2193} {"train_loss": -6.2549848556518555, "global_step": 92134, "epoch": 2193} {"train_loss": -6.180039405822754, "global_step": 92135, "epoch": 2193} {"train_loss": -6.290789604187012, "global_step": 92136, "epoch": 2193} {"train_loss": -6.1863298416137695, "global_step": 92137, "epoch": 2193} {"train_loss": -6.197681427001953, "global_step": 92138, "epoch": 2193} {"train_loss": -6.366533279418945, "global_step": 92139, "epoch": 2193} {"train_loss": -6.204179286956787, "global_step": 92140, "epoch": 2193} {"train_loss": -6.392777919769287, "global_step": 92141, "epoch": 2193} {"train_loss": -6.272972106933594, "global_step": 92142, "epoch": 2193} {"train_loss": -6.1701741218566895, "global_step": 92143, "epoch": 2193} {"train_loss": -6.329902648925781, "global_step": 92144, "epoch": 2193} {"train_loss": -6.311623573303223, "global_step": 92145, "epoch": 2193} {"train_loss": -6.328007698059082, "global_step": 92146, "epoch": 2193} {"train_loss": -6.2846915154230025, "global_step": 92147, "epoch": 2193, "val_loss": 67870.40625} {"train_loss": -6.261377334594727, "global_step": 92148, "epoch": 2194} {"train_loss": -6.3232951164245605, "global_step": 92149, "epoch": 2194} {"train_loss": -6.2417097091674805, "global_step": 92150, "epoch": 2194} {"train_loss": -6.26373291015625, "global_step": 92151, "epoch": 2194} {"train_loss": -6.213138580322266, "global_step": 92152, "epoch": 2194} {"train_loss": -6.227892875671387, "global_step": 92153, "epoch": 2194} {"train_loss": -6.15989351272583, "global_step": 92154, "epoch": 2194} {"train_loss": -6.095447540283203, "global_step": 92155, "epoch": 2194} {"train_loss": -6.32294225692749, "global_step": 92156, "epoch": 2194} {"train_loss": -6.202407360076904, "global_step": 92157, "epoch": 2194} {"train_loss": -6.25633430480957, "global_step": 92158, "epoch": 2194} {"train_loss": -6.2770891189575195, "global_step": 92159, "epoch": 2194} {"train_loss": -6.226722717285156, "global_step": 92160, "epoch": 2194} {"train_loss": -6.248115062713623, "global_step": 92161, "epoch": 2194} {"train_loss": -6.236249923706055, "global_step": 92162, "epoch": 2194} {"train_loss": -6.2457275390625, "global_step": 92163, "epoch": 2194} {"train_loss": -6.251879692077637, "global_step": 92164, "epoch": 2194} {"train_loss": -6.245068073272705, "global_step": 92165, "epoch": 2194} {"train_loss": -6.273433208465576, "global_step": 92166, "epoch": 2194} {"train_loss": -6.190443992614746, "global_step": 92167, "epoch": 2194} {"train_loss": -6.2956390380859375, "global_step": 92168, "epoch": 2194} {"train_loss": -6.088882923126221, "global_step": 92169, "epoch": 2194} {"train_loss": -6.135952949523926, "global_step": 92170, "epoch": 2194} {"train_loss": -6.197861671447754, "global_step": 92171, "epoch": 2194} {"train_loss": -6.27830696105957, "global_step": 92172, "epoch": 2194} {"train_loss": -6.331772804260254, "global_step": 92173, "epoch": 2194} {"train_loss": -6.151668548583984, "global_step": 92174, "epoch": 2194} {"train_loss": -6.329257011413574, "global_step": 92175, "epoch": 2194} {"train_loss": -6.3212361335754395, "global_step": 92176, "epoch": 2194} {"train_loss": -6.1851582527160645, "global_step": 92177, "epoch": 2194} {"train_loss": -6.2357072830200195, "global_step": 92178, "epoch": 2194} {"train_loss": -6.2333269119262695, "global_step": 92179, "epoch": 2194} {"train_loss": -6.278352737426758, "global_step": 92180, "epoch": 2194} {"train_loss": -6.238452434539795, "global_step": 92181, "epoch": 2194} {"train_loss": -6.141500949859619, "global_step": 92182, "epoch": 2194} {"train_loss": -6.2233076095581055, "global_step": 92183, "epoch": 2194} {"train_loss": -6.315347671508789, "global_step": 92184, "epoch": 2194} {"train_loss": -6.160928249359131, "global_step": 92185, "epoch": 2194} {"train_loss": -6.239562034606934, "global_step": 92186, "epoch": 2194} {"train_loss": -6.311627388000488, "global_step": 92187, "epoch": 2194} {"train_loss": -6.219353675842285, "global_step": 92188, "epoch": 2194} {"train_loss": -6.237115349088397, "global_step": 92189, "epoch": 2194, "val_loss": 68000.890625} {"train_loss": -6.175802230834961, "global_step": 92190, "epoch": 2195} {"train_loss": -6.353374481201172, "global_step": 92191, "epoch": 2195} {"train_loss": -6.164810657501221, "global_step": 92192, "epoch": 2195} {"train_loss": -6.299115180969238, "global_step": 92193, "epoch": 2195} {"train_loss": -6.130788803100586, "global_step": 92194, "epoch": 2195} {"train_loss": -6.273163795471191, "global_step": 92195, "epoch": 2195} {"train_loss": -6.247333526611328, "global_step": 92196, "epoch": 2195} {"train_loss": -6.341823577880859, "global_step": 92197, "epoch": 2195} {"train_loss": -6.163142681121826, "global_step": 92198, "epoch": 2195} {"train_loss": -6.329822540283203, "global_step": 92199, "epoch": 2195} {"train_loss": -6.250982761383057, "global_step": 92200, "epoch": 2195} {"train_loss": -6.132843017578125, "global_step": 92201, "epoch": 2195} {"train_loss": -6.28538179397583, "global_step": 92202, "epoch": 2195} {"train_loss": -6.319787979125977, "global_step": 92203, "epoch": 2195} {"train_loss": -6.23039436340332, "global_step": 92204, "epoch": 2195} {"train_loss": -6.268159866333008, "global_step": 92205, "epoch": 2195} {"train_loss": -6.145139694213867, "global_step": 92206, "epoch": 2195} {"train_loss": -6.20835018157959, "global_step": 92207, "epoch": 2195} {"train_loss": -6.205072402954102, "global_step": 92208, "epoch": 2195} {"train_loss": -6.245522975921631, "global_step": 92209, "epoch": 2195} {"train_loss": -6.260076999664307, "global_step": 92210, "epoch": 2195} {"train_loss": -6.22482967376709, "global_step": 92211, "epoch": 2195} {"train_loss": -6.353604793548584, "global_step": 92212, "epoch": 2195} {"train_loss": -6.166608810424805, "global_step": 92213, "epoch": 2195} {"train_loss": -6.323073387145996, "global_step": 92214, "epoch": 2195} {"train_loss": -6.173907279968262, "global_step": 92215, "epoch": 2195} {"train_loss": -6.275238037109375, "global_step": 92216, "epoch": 2195} {"train_loss": -6.3754167556762695, "global_step": 92217, "epoch": 2195} {"train_loss": -6.239948272705078, "global_step": 92218, "epoch": 2195} {"train_loss": -6.201438903808594, "global_step": 92219, "epoch": 2195} {"train_loss": -6.306801795959473, "global_step": 92220, "epoch": 2195} {"train_loss": -6.21915340423584, "global_step": 92221, "epoch": 2195} {"train_loss": -6.159843444824219, "global_step": 92222, "epoch": 2195} {"train_loss": -6.335740089416504, "global_step": 92223, "epoch": 2195} {"train_loss": -6.28674840927124, "global_step": 92224, "epoch": 2195} {"train_loss": -6.276582717895508, "global_step": 92225, "epoch": 2195} {"train_loss": -6.271202087402344, "global_step": 92226, "epoch": 2195} {"train_loss": -6.345372200012207, "global_step": 92227, "epoch": 2195} {"train_loss": -6.083124160766602, "global_step": 92228, "epoch": 2195} {"train_loss": -6.249362468719482, "global_step": 92229, "epoch": 2195} {"train_loss": -6.373516082763672, "global_step": 92230, "epoch": 2195} {"train_loss": -6.2540063971564885, "global_step": 92231, "epoch": 2195, "val_loss": 67845.8359375} {"train_loss": -6.343062400817871, "global_step": 92232, "epoch": 2196} {"train_loss": -6.343374252319336, "global_step": 92233, "epoch": 2196} {"train_loss": -6.226922035217285, "global_step": 92234, "epoch": 2196} {"train_loss": -6.244868278503418, "global_step": 92235, "epoch": 2196} {"train_loss": -6.156747341156006, "global_step": 92236, "epoch": 2196} {"train_loss": -6.395407199859619, "global_step": 92237, "epoch": 2196} {"train_loss": -6.038512229919434, "global_step": 92238, "epoch": 2196} {"train_loss": -6.252724647521973, "global_step": 92239, "epoch": 2196} {"train_loss": -6.233214855194092, "global_step": 92240, "epoch": 2196} {"train_loss": -6.228135108947754, "global_step": 92241, "epoch": 2196} {"train_loss": -6.2984232902526855, "global_step": 92242, "epoch": 2196} {"train_loss": -6.137887001037598, "global_step": 92243, "epoch": 2196} {"train_loss": -6.348136901855469, "global_step": 92244, "epoch": 2196} {"train_loss": -6.145549774169922, "global_step": 92245, "epoch": 2196} {"train_loss": -6.318847179412842, "global_step": 92246, "epoch": 2196} {"train_loss": -6.265607833862305, "global_step": 92247, "epoch": 2196} {"train_loss": -6.151135444641113, "global_step": 92248, "epoch": 2196} {"train_loss": -6.187919616699219, "global_step": 92249, "epoch": 2196} {"train_loss": -6.247498512268066, "global_step": 92250, "epoch": 2196} {"train_loss": -6.1429362297058105, "global_step": 92251, "epoch": 2196} {"train_loss": -6.085282325744629, "global_step": 92252, "epoch": 2196} {"train_loss": -6.159235954284668, "global_step": 92253, "epoch": 2196} {"train_loss": -6.181667327880859, "global_step": 92254, "epoch": 2196} {"train_loss": -6.08457088470459, "global_step": 92255, "epoch": 2196} {"train_loss": -6.07260799407959, "global_step": 92256, "epoch": 2196} {"train_loss": -6.197113990783691, "global_step": 92257, "epoch": 2196} {"train_loss": -6.018038749694824, "global_step": 92258, "epoch": 2196} {"train_loss": -6.196538925170898, "global_step": 92259, "epoch": 2196} {"train_loss": -6.157191276550293, "global_step": 92260, "epoch": 2196} {"train_loss": -6.3096022605896, "global_step": 92261, "epoch": 2196} {"train_loss": -6.218095779418945, "global_step": 92262, "epoch": 2196} {"train_loss": -6.172509670257568, "global_step": 92263, "epoch": 2196} {"train_loss": -6.123846054077148, "global_step": 92264, "epoch": 2196} {"train_loss": -6.22576379776001, "global_step": 92265, "epoch": 2196} {"train_loss": -6.169001579284668, "global_step": 92266, "epoch": 2196} {"train_loss": -6.338527679443359, "global_step": 92267, "epoch": 2196} {"train_loss": -6.2078633308410645, "global_step": 92268, "epoch": 2196} {"train_loss": -6.2335309982299805, "global_step": 92269, "epoch": 2196} {"train_loss": -6.205810546875, "global_step": 92270, "epoch": 2196} {"train_loss": -6.152667045593262, "global_step": 92271, "epoch": 2196} {"train_loss": -6.224905490875244, "global_step": 92272, "epoch": 2196} {"train_loss": -6.204462482815697, "global_step": 92273, "epoch": 2196, "val_loss": 67873.015625} {"train_loss": -6.238297462463379, "global_step": 92274, "epoch": 2197} {"train_loss": -6.240920066833496, "global_step": 92275, "epoch": 2197} {"train_loss": -6.0920562744140625, "global_step": 92276, "epoch": 2197} {"train_loss": -6.183266639709473, "global_step": 92277, "epoch": 2197} {"train_loss": -6.22471809387207, "global_step": 92278, "epoch": 2197} {"train_loss": -6.306113243103027, "global_step": 92279, "epoch": 2197} {"train_loss": -6.354914665222168, "global_step": 92280, "epoch": 2197} {"train_loss": -6.2691755294799805, "global_step": 92281, "epoch": 2197} {"train_loss": -6.20255184173584, "global_step": 92282, "epoch": 2197} {"train_loss": -6.2853169441223145, "global_step": 92283, "epoch": 2197} {"train_loss": -6.245285987854004, "global_step": 92284, "epoch": 2197} {"train_loss": -6.325892448425293, "global_step": 92285, "epoch": 2197} {"train_loss": -6.335623741149902, "global_step": 92286, "epoch": 2197} {"train_loss": -6.219046592712402, "global_step": 92287, "epoch": 2197} {"train_loss": -6.250045299530029, "global_step": 92288, "epoch": 2197} {"train_loss": -6.325831413269043, "global_step": 92289, "epoch": 2197} {"train_loss": -6.253100872039795, "global_step": 92290, "epoch": 2197} {"train_loss": -6.279184341430664, "global_step": 92291, "epoch": 2197} {"train_loss": -6.2753586769104, "global_step": 92292, "epoch": 2197} {"train_loss": -6.341883182525635, "global_step": 92293, "epoch": 2197} {"train_loss": -6.206247329711914, "global_step": 92294, "epoch": 2197} {"train_loss": -6.3041486740112305, "global_step": 92295, "epoch": 2197} {"train_loss": -6.317818641662598, "global_step": 92296, "epoch": 2197} {"train_loss": -6.370152473449707, "global_step": 92297, "epoch": 2197} {"train_loss": -6.328553199768066, "global_step": 92298, "epoch": 2197} {"train_loss": -6.268479347229004, "global_step": 92299, "epoch": 2197} {"train_loss": -6.2869415283203125, "global_step": 92300, "epoch": 2197} {"train_loss": -6.2221269607543945, "global_step": 92301, "epoch": 2197} {"train_loss": -6.214644432067871, "global_step": 92302, "epoch": 2197} {"train_loss": -6.21510124206543, "global_step": 92303, "epoch": 2197} {"train_loss": -6.317436695098877, "global_step": 92304, "epoch": 2197} {"train_loss": -6.25074577331543, "global_step": 92305, "epoch": 2197} {"train_loss": -6.383934020996094, "global_step": 92306, "epoch": 2197} {"train_loss": -6.22274923324585, "global_step": 92307, "epoch": 2197} {"train_loss": -6.2784504890441895, "global_step": 92308, "epoch": 2197} {"train_loss": -6.327150821685791, "global_step": 92309, "epoch": 2197} {"train_loss": -6.310210704803467, "global_step": 92310, "epoch": 2197} {"train_loss": -6.21118688583374, "global_step": 92311, "epoch": 2197} {"train_loss": -6.393459796905518, "global_step": 92312, "epoch": 2197} {"train_loss": -6.261127471923828, "global_step": 92313, "epoch": 2197} {"train_loss": -6.142369270324707, "global_step": 92314, "epoch": 2197} {"train_loss": -6.271999994913737, "global_step": 92315, "epoch": 2197, "val_loss": 67959.7265625} {"train_loss": -6.275519371032715, "global_step": 92316, "epoch": 2198} {"train_loss": -6.319827079772949, "global_step": 92317, "epoch": 2198} {"train_loss": -6.379491329193115, "global_step": 92318, "epoch": 2198} {"train_loss": -6.231672286987305, "global_step": 92319, "epoch": 2198} {"train_loss": -6.265471458435059, "global_step": 92320, "epoch": 2198} {"train_loss": -6.268365859985352, "global_step": 92321, "epoch": 2198} {"train_loss": -6.248915672302246, "global_step": 92322, "epoch": 2198} {"train_loss": -6.228826999664307, "global_step": 92323, "epoch": 2198} {"train_loss": -6.309176445007324, "global_step": 92324, "epoch": 2198} {"train_loss": -6.262923240661621, "global_step": 92325, "epoch": 2198} {"train_loss": -6.3027849197387695, "global_step": 92326, "epoch": 2198} {"train_loss": -6.115485191345215, "global_step": 92327, "epoch": 2198} {"train_loss": -6.230538368225098, "global_step": 92328, "epoch": 2198} {"train_loss": -6.1968488693237305, "global_step": 92329, "epoch": 2198} {"train_loss": -6.360323429107666, "global_step": 92330, "epoch": 2198} {"train_loss": -6.154462814331055, "global_step": 92331, "epoch": 2198} {"train_loss": -6.21761417388916, "global_step": 92332, "epoch": 2198} {"train_loss": -6.2371015548706055, "global_step": 92333, "epoch": 2198} {"train_loss": -6.371841907501221, "global_step": 92334, "epoch": 2198} {"train_loss": -6.250311851501465, "global_step": 92335, "epoch": 2198} {"train_loss": -6.127140045166016, "global_step": 92336, "epoch": 2198} {"train_loss": -6.291177272796631, "global_step": 92337, "epoch": 2198} {"train_loss": -6.275815010070801, "global_step": 92338, "epoch": 2198} {"train_loss": -6.144701957702637, "global_step": 92339, "epoch": 2198} {"train_loss": -6.353907108306885, "global_step": 92340, "epoch": 2198} {"train_loss": -6.235210418701172, "global_step": 92341, "epoch": 2198} {"train_loss": -6.275885105133057, "global_step": 92342, "epoch": 2198} {"train_loss": -6.348000526428223, "global_step": 92343, "epoch": 2198} {"train_loss": -6.342455863952637, "global_step": 92344, "epoch": 2198} {"train_loss": -6.343757629394531, "global_step": 92345, "epoch": 2198} {"train_loss": -6.184709072113037, "global_step": 92346, "epoch": 2198} {"train_loss": -6.330001354217529, "global_step": 92347, "epoch": 2198} {"train_loss": -6.2986602783203125, "global_step": 92348, "epoch": 2198} {"train_loss": -6.339913368225098, "global_step": 92349, "epoch": 2198} {"train_loss": -6.289259910583496, "global_step": 92350, "epoch": 2198} {"train_loss": -6.169309616088867, "global_step": 92351, "epoch": 2198} {"train_loss": -6.185018539428711, "global_step": 92352, "epoch": 2198} {"train_loss": -6.293121337890625, "global_step": 92353, "epoch": 2198} {"train_loss": -6.198033332824707, "global_step": 92354, "epoch": 2198} {"train_loss": -6.263843059539795, "global_step": 92355, "epoch": 2198} {"train_loss": -6.1856231689453125, "global_step": 92356, "epoch": 2198} {"train_loss": -6.258092051460629, "global_step": 92357, "epoch": 2198, "val_loss": 67845.328125} {"train_loss": -6.264120101928711, "global_step": 92358, "epoch": 2199} {"train_loss": -6.17091703414917, "global_step": 92359, "epoch": 2199} {"train_loss": -6.254166603088379, "global_step": 92360, "epoch": 2199} {"train_loss": -6.344592571258545, "global_step": 92361, "epoch": 2199} {"train_loss": -6.177268981933594, "global_step": 92362, "epoch": 2199} {"train_loss": -6.122894287109375, "global_step": 92363, "epoch": 2199} {"train_loss": -6.18302059173584, "global_step": 92364, "epoch": 2199} {"train_loss": -6.285842418670654, "global_step": 92365, "epoch": 2199} {"train_loss": -6.195442199707031, "global_step": 92366, "epoch": 2199} {"train_loss": -6.214983940124512, "global_step": 92367, "epoch": 2199} {"train_loss": -6.2490763664245605, "global_step": 92368, "epoch": 2199} {"train_loss": -6.209103584289551, "global_step": 92369, "epoch": 2199} {"train_loss": -6.139704704284668, "global_step": 92370, "epoch": 2199} {"train_loss": -6.2987189292907715, "global_step": 92371, "epoch": 2199} {"train_loss": -6.210078239440918, "global_step": 92372, "epoch": 2199} {"train_loss": -6.286760330200195, "global_step": 92373, "epoch": 2199} {"train_loss": -6.211521148681641, "global_step": 92374, "epoch": 2199} {"train_loss": -6.2969770431518555, "global_step": 92375, "epoch": 2199} {"train_loss": -6.288382053375244, "global_step": 92376, "epoch": 2199} {"train_loss": -6.221468925476074, "global_step": 92377, "epoch": 2199} {"train_loss": -6.26728630065918, "global_step": 92378, "epoch": 2199} {"train_loss": -6.260568141937256, "global_step": 92379, "epoch": 2199} {"train_loss": -6.441348552703857, "global_step": 92380, "epoch": 2199} {"train_loss": -6.329388618469238, "global_step": 92381, "epoch": 2199} {"train_loss": -6.352684497833252, "global_step": 92382, "epoch": 2199} {"train_loss": -6.121824264526367, "global_step": 92383, "epoch": 2199} {"train_loss": -6.232834815979004, "global_step": 92384, "epoch": 2199} {"train_loss": -6.278343200683594, "global_step": 92385, "epoch": 2199} {"train_loss": -6.392521381378174, "global_step": 92386, "epoch": 2199} {"train_loss": -6.2745041847229, "global_step": 92387, "epoch": 2199} {"train_loss": -6.269115447998047, "global_step": 92388, "epoch": 2199} {"train_loss": -6.258245468139648, "global_step": 92389, "epoch": 2199} {"train_loss": -6.2481584548950195, "global_step": 92390, "epoch": 2199} {"train_loss": -6.290307998657227, "global_step": 92391, "epoch": 2199} {"train_loss": -6.234901428222656, "global_step": 92392, "epoch": 2199} {"train_loss": -6.307992935180664, "global_step": 92393, "epoch": 2199} {"train_loss": -6.319269180297852, "global_step": 92394, "epoch": 2199} {"train_loss": -6.283591270446777, "global_step": 92395, "epoch": 2199} {"train_loss": -6.291268825531006, "global_step": 92396, "epoch": 2199} {"train_loss": -6.270684242248535, "global_step": 92397, "epoch": 2199} {"train_loss": -6.133284091949463, "global_step": 92398, "epoch": 2199} {"train_loss": -6.25570273399353, "global_step": 92399, "epoch": 2199, "val_loss": 67891.0859375} {"train_loss": -6.2801713943481445, "global_step": 92400, "epoch": 2200} {"train_loss": -6.196235179901123, "global_step": 92401, "epoch": 2200} {"train_loss": -6.385532379150391, "global_step": 92402, "epoch": 2200} {"train_loss": -6.3045148849487305, "global_step": 92403, "epoch": 2200} {"train_loss": -6.162940502166748, "global_step": 92404, "epoch": 2200} {"train_loss": -6.237526893615723, "global_step": 92405, "epoch": 2200} {"train_loss": -6.19815731048584, "global_step": 92406, "epoch": 2200} {"train_loss": -6.253974914550781, "global_step": 92407, "epoch": 2200} {"train_loss": -6.2836809158325195, "global_step": 92408, "epoch": 2200} {"train_loss": -6.211399078369141, "global_step": 92409, "epoch": 2200} {"train_loss": -6.178718090057373, "global_step": 92410, "epoch": 2200} {"train_loss": -6.229803085327148, "global_step": 92411, "epoch": 2200} {"train_loss": -6.271607398986816, "global_step": 92412, "epoch": 2200} {"train_loss": -6.340734958648682, "global_step": 92413, "epoch": 2200} {"train_loss": -6.24846076965332, "global_step": 92414, "epoch": 2200} {"train_loss": -6.367907524108887, "global_step": 92415, "epoch": 2200} {"train_loss": -6.373325347900391, "global_step": 92416, "epoch": 2200} {"train_loss": -6.389245986938477, "global_step": 92417, "epoch": 2200} {"train_loss": -6.239527702331543, "global_step": 92418, "epoch": 2200} {"train_loss": -6.255653381347656, "global_step": 92419, "epoch": 2200} {"train_loss": -6.233922958374023, "global_step": 92420, "epoch": 2200} {"train_loss": -6.346493721008301, "global_step": 92421, "epoch": 2200} {"train_loss": -6.184225559234619, "global_step": 92422, "epoch": 2200} {"train_loss": -6.246838569641113, "global_step": 92423, "epoch": 2200} {"train_loss": -6.199822902679443, "global_step": 92424, "epoch": 2200} {"train_loss": -6.27204704284668, "global_step": 92425, "epoch": 2200} {"train_loss": -6.220919609069824, "global_step": 92426, "epoch": 2200} {"train_loss": -6.094606876373291, "global_step": 92427, "epoch": 2200} {"train_loss": -6.345088958740234, "global_step": 92428, "epoch": 2200} {"train_loss": -6.295599937438965, "global_step": 92429, "epoch": 2200} {"train_loss": -6.14346981048584, "global_step": 92430, "epoch": 2200} {"train_loss": -6.2074360847473145, "global_step": 92431, "epoch": 2200} {"train_loss": -6.337368488311768, "global_step": 92432, "epoch": 2200} {"train_loss": -6.186455726623535, "global_step": 92433, "epoch": 2200} {"train_loss": -6.147735595703125, "global_step": 92434, "epoch": 2200} {"train_loss": -6.24107551574707, "global_step": 92435, "epoch": 2200} {"train_loss": -6.150432586669922, "global_step": 92436, "epoch": 2200} {"train_loss": -6.148798942565918, "global_step": 92437, "epoch": 2200} {"train_loss": -6.185062408447266, "global_step": 92438, "epoch": 2200} {"train_loss": -6.360935688018799, "global_step": 92439, "epoch": 2200} {"train_loss": -6.240886211395264, "global_step": 92440, "epoch": 2200} {"train_loss": -6.247649499348232, "global_step": 92441, "epoch": 2200, "train/sim_max_reward_0": 0.3892023074902871, "train/sim_max_reward_1": 0.8685662629611434, "train/sim_max_reward_2": 0.8762156640163938, "train/sim_max_reward_3": 0.1290306611040428, "train/sim_max_reward_4": 0.4416057067477801, "train/sim_max_reward_5": 0.9375658937828907, "test/sim_max_reward_4400000": 0.17138459011181803, "test/sim_max_reward_4400001": 0.2096193525898868, "test/sim_max_reward_4400002": 0.7447471642879882, "test/sim_max_reward_4400003": 0.9694660832406953, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9829796932852553, "test/sim_max_reward_4400007": 0.01552032508582053, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9359710374852518, "test/sim_max_reward_4400010": 0.26176941303878853, "test/sim_max_reward_4400011": 0.20795948579230708, "test/sim_max_reward_4400012": 0.9426580767135175, "test/sim_max_reward_4400013": 0.8953614206373345, "test/sim_max_reward_4400014": 0.49671489703359434, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.14200152346625414, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.16099673252633553, "test/sim_max_reward_4400023": 0.6751357009605057, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.18229477531233979, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0619181455663395, "test/sim_max_reward_4400028": 0.8903330515932124, "test/sim_max_reward_4400029": 0.5066312633368091, "test/sim_max_reward_4400030": 0.9529301833011788, "test/sim_max_reward_4400031": 0.8926745360131572, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3690829977568579, "test/sim_max_reward_4400034": 0.8944585144919387, "test/sim_max_reward_4400035": 0.9565719847901857, "test/sim_max_reward_4400036": 0.3979989386337857, "test/sim_max_reward_4400037": 0.6574565640446557, "test/sim_max_reward_4400038": 0.8671909250158902, "test/sim_max_reward_4400039": 0.5823708167186044, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9199442873433076, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9509032936363593, "test/sim_max_reward_4400045": 0.8727773934424804, "test/sim_max_reward_4400046": 0.6981658810999494, "test/sim_max_reward_4400047": 0.958493591805732, "test/sim_max_reward_4400048": 0.9971419640045391, "test/sim_max_reward_4400049": 0.7774688174784138, "train/mean_score": 0.6070310826837564, "test/mean_score": 0.48518435165415574, "val_loss": 67833.125} {"train_loss": -6.186009407043457, "global_step": 92442, "epoch": 2201} {"train_loss": -6.161809921264648, "global_step": 92443, "epoch": 2201} {"train_loss": -6.193615913391113, "global_step": 92444, "epoch": 2201} {"train_loss": -6.255669116973877, "global_step": 92445, "epoch": 2201} {"train_loss": -6.221219062805176, "global_step": 92446, "epoch": 2201} {"train_loss": -6.258286476135254, "global_step": 92447, "epoch": 2201} {"train_loss": -6.2055864334106445, "global_step": 92448, "epoch": 2201} {"train_loss": -6.343049049377441, "global_step": 92449, "epoch": 2201} {"train_loss": -6.365965843200684, "global_step": 92450, "epoch": 2201} {"train_loss": -6.334531307220459, "global_step": 92451, "epoch": 2201} {"train_loss": -6.2555060386657715, "global_step": 92452, "epoch": 2201} {"train_loss": -6.358875274658203, "global_step": 92453, "epoch": 2201} {"train_loss": -6.081028938293457, "global_step": 92454, "epoch": 2201} {"train_loss": -6.34019136428833, "global_step": 92455, "epoch": 2201} {"train_loss": -6.1458234786987305, "global_step": 92456, "epoch": 2201} {"train_loss": -6.161272048950195, "global_step": 92457, "epoch": 2201} {"train_loss": -6.1771769523620605, "global_step": 92458, "epoch": 2201} {"train_loss": -6.2107977867126465, "global_step": 92459, "epoch": 2201} {"train_loss": -6.3929443359375, "global_step": 92460, "epoch": 2201} {"train_loss": -6.242840766906738, "global_step": 92461, "epoch": 2201} {"train_loss": -6.174716949462891, "global_step": 92462, "epoch": 2201} {"train_loss": -6.259848594665527, "global_step": 92463, "epoch": 2201} {"train_loss": -6.247321128845215, "global_step": 92464, "epoch": 2201} {"train_loss": -6.305385589599609, "global_step": 92465, "epoch": 2201} {"train_loss": -6.286773681640625, "global_step": 92466, "epoch": 2201} {"train_loss": -6.230533599853516, "global_step": 92467, "epoch": 2201} {"train_loss": -6.161112308502197, "global_step": 92468, "epoch": 2201} {"train_loss": -6.197480201721191, "global_step": 92469, "epoch": 2201} {"train_loss": -6.232124328613281, "global_step": 92470, "epoch": 2201} {"train_loss": -6.292581081390381, "global_step": 92471, "epoch": 2201} {"train_loss": -6.3411664962768555, "global_step": 92472, "epoch": 2201} {"train_loss": -6.2248854637146, "global_step": 92473, "epoch": 2201} {"train_loss": -6.273674011230469, "global_step": 92474, "epoch": 2201} {"train_loss": -6.194656848907471, "global_step": 92475, "epoch": 2201} {"train_loss": -6.232709884643555, "global_step": 92476, "epoch": 2201} {"train_loss": -6.252492427825928, "global_step": 92477, "epoch": 2201} {"train_loss": -6.3139472007751465, "global_step": 92478, "epoch": 2201} {"train_loss": -6.251136779785156, "global_step": 92479, "epoch": 2201} {"train_loss": -6.176907539367676, "global_step": 92480, "epoch": 2201} {"train_loss": -6.279845237731934, "global_step": 92481, "epoch": 2201} {"train_loss": -6.317359924316406, "global_step": 92482, "epoch": 2201} {"train_loss": -6.243979385920933, "global_step": 92483, "epoch": 2201, "val_loss": 67778.3671875} {"train_loss": -6.298111915588379, "global_step": 92484, "epoch": 2202} {"train_loss": -6.240951061248779, "global_step": 92485, "epoch": 2202} {"train_loss": -6.3379950523376465, "global_step": 92486, "epoch": 2202} {"train_loss": -6.2135419845581055, "global_step": 92487, "epoch": 2202} {"train_loss": -6.2393083572387695, "global_step": 92488, "epoch": 2202} {"train_loss": -6.329042434692383, "global_step": 92489, "epoch": 2202} {"train_loss": -6.353084087371826, "global_step": 92490, "epoch": 2202} {"train_loss": -6.218667030334473, "global_step": 92491, "epoch": 2202} {"train_loss": -6.2369489669799805, "global_step": 92492, "epoch": 2202} {"train_loss": -6.1494526863098145, "global_step": 92493, "epoch": 2202} {"train_loss": -6.303210258483887, "global_step": 92494, "epoch": 2202} {"train_loss": -6.210409164428711, "global_step": 92495, "epoch": 2202} {"train_loss": -6.249371528625488, "global_step": 92496, "epoch": 2202} {"train_loss": -6.267299652099609, "global_step": 92497, "epoch": 2202} {"train_loss": -6.2473835945129395, "global_step": 92498, "epoch": 2202} {"train_loss": -6.276516914367676, "global_step": 92499, "epoch": 2202} {"train_loss": -6.16511869430542, "global_step": 92500, "epoch": 2202} {"train_loss": -6.2086896896362305, "global_step": 92501, "epoch": 2202} {"train_loss": -6.193975925445557, "global_step": 92502, "epoch": 2202} {"train_loss": -6.202607154846191, "global_step": 92503, "epoch": 2202} {"train_loss": -6.163478851318359, "global_step": 92504, "epoch": 2202} {"train_loss": -6.176941871643066, "global_step": 92505, "epoch": 2202} {"train_loss": -6.287342071533203, "global_step": 92506, "epoch": 2202} {"train_loss": -6.148447036743164, "global_step": 92507, "epoch": 2202} {"train_loss": -6.23443078994751, "global_step": 92508, "epoch": 2202} {"train_loss": -6.178727149963379, "global_step": 92509, "epoch": 2202} {"train_loss": -6.179927349090576, "global_step": 92510, "epoch": 2202} {"train_loss": -6.12531042098999, "global_step": 92511, "epoch": 2202} {"train_loss": -6.224251747131348, "global_step": 92512, "epoch": 2202} {"train_loss": -6.211798667907715, "global_step": 92513, "epoch": 2202} {"train_loss": -6.173664569854736, "global_step": 92514, "epoch": 2202} {"train_loss": -6.110221862792969, "global_step": 92515, "epoch": 2202} {"train_loss": -6.222248554229736, "global_step": 92516, "epoch": 2202} {"train_loss": -6.169329643249512, "global_step": 92517, "epoch": 2202} {"train_loss": -6.029621124267578, "global_step": 92518, "epoch": 2202} {"train_loss": -6.281488418579102, "global_step": 92519, "epoch": 2202} {"train_loss": -6.187922477722168, "global_step": 92520, "epoch": 2202} {"train_loss": -6.193041801452637, "global_step": 92521, "epoch": 2202} {"train_loss": -6.1895551681518555, "global_step": 92522, "epoch": 2202} {"train_loss": -6.037312984466553, "global_step": 92523, "epoch": 2202} {"train_loss": -6.227776527404785, "global_step": 92524, "epoch": 2202} {"train_loss": -6.212398301987421, "global_step": 92525, "epoch": 2202, "val_loss": 68375.9375} {"train_loss": -6.121425151824951, "global_step": 92526, "epoch": 2203} {"train_loss": -6.099583625793457, "global_step": 92527, "epoch": 2203} {"train_loss": -6.229007720947266, "global_step": 92528, "epoch": 2203} {"train_loss": -6.200813293457031, "global_step": 92529, "epoch": 2203} {"train_loss": -6.114426612854004, "global_step": 92530, "epoch": 2203} {"train_loss": -6.252820014953613, "global_step": 92531, "epoch": 2203} {"train_loss": -6.171949863433838, "global_step": 92532, "epoch": 2203} {"train_loss": -6.081473350524902, "global_step": 92533, "epoch": 2203} {"train_loss": -6.149415969848633, "global_step": 92534, "epoch": 2203} {"train_loss": -6.114091873168945, "global_step": 92535, "epoch": 2203} {"train_loss": -6.294770240783691, "global_step": 92536, "epoch": 2203} {"train_loss": -6.240123271942139, "global_step": 92537, "epoch": 2203} {"train_loss": -6.201412677764893, "global_step": 92538, "epoch": 2203} {"train_loss": -6.190784931182861, "global_step": 92539, "epoch": 2203} {"train_loss": -6.161811828613281, "global_step": 92540, "epoch": 2203} {"train_loss": -6.301753044128418, "global_step": 92541, "epoch": 2203} {"train_loss": -6.347753047943115, "global_step": 92542, "epoch": 2203} {"train_loss": -6.270642280578613, "global_step": 92543, "epoch": 2203} {"train_loss": -6.254817962646484, "global_step": 92544, "epoch": 2203} {"train_loss": -6.368888854980469, "global_step": 92545, "epoch": 2203} {"train_loss": -6.304582595825195, "global_step": 92546, "epoch": 2203} {"train_loss": -6.246889114379883, "global_step": 92547, "epoch": 2203} {"train_loss": -6.18262243270874, "global_step": 92548, "epoch": 2203} {"train_loss": -6.321689128875732, "global_step": 92549, "epoch": 2203} {"train_loss": -6.198269367218018, "global_step": 92550, "epoch": 2203} {"train_loss": -6.255685806274414, "global_step": 92551, "epoch": 2203} {"train_loss": -6.368568420410156, "global_step": 92552, "epoch": 2203} {"train_loss": -6.392153739929199, "global_step": 92553, "epoch": 2203} {"train_loss": -6.338449478149414, "global_step": 92554, "epoch": 2203} {"train_loss": -6.292840957641602, "global_step": 92555, "epoch": 2203} {"train_loss": -6.297453880310059, "global_step": 92556, "epoch": 2203} {"train_loss": -6.322608947753906, "global_step": 92557, "epoch": 2203} {"train_loss": -6.173670768737793, "global_step": 92558, "epoch": 2203} {"train_loss": -6.370166778564453, "global_step": 92559, "epoch": 2203} {"train_loss": -6.190553665161133, "global_step": 92560, "epoch": 2203} {"train_loss": -6.205499172210693, "global_step": 92561, "epoch": 2203} {"train_loss": -6.227302551269531, "global_step": 92562, "epoch": 2203} {"train_loss": -6.2575531005859375, "global_step": 92563, "epoch": 2203} {"train_loss": -6.26123571395874, "global_step": 92564, "epoch": 2203} {"train_loss": -6.373662948608398, "global_step": 92565, "epoch": 2203} {"train_loss": -6.2676191329956055, "global_step": 92566, "epoch": 2203} {"train_loss": -6.2436937264033725, "global_step": 92567, "epoch": 2203, "val_loss": 68124.625} {"train_loss": -6.290513515472412, "global_step": 92568, "epoch": 2204} {"train_loss": -6.216463565826416, "global_step": 92569, "epoch": 2204} {"train_loss": -6.251082420349121, "global_step": 92570, "epoch": 2204} {"train_loss": -6.393735408782959, "global_step": 92571, "epoch": 2204} {"train_loss": -6.23085355758667, "global_step": 92572, "epoch": 2204} {"train_loss": -6.3896284103393555, "global_step": 92573, "epoch": 2204} {"train_loss": -6.3525567054748535, "global_step": 92574, "epoch": 2204} {"train_loss": -6.227447032928467, "global_step": 92575, "epoch": 2204} {"train_loss": -6.176949977874756, "global_step": 92576, "epoch": 2204} {"train_loss": -6.259627819061279, "global_step": 92577, "epoch": 2204} {"train_loss": -6.251607894897461, "global_step": 92578, "epoch": 2204} {"train_loss": -6.325526714324951, "global_step": 92579, "epoch": 2204} {"train_loss": -6.220417499542236, "global_step": 92580, "epoch": 2204} {"train_loss": -6.3363165855407715, "global_step": 92581, "epoch": 2204} {"train_loss": -6.372455596923828, "global_step": 92582, "epoch": 2204} {"train_loss": -6.248077869415283, "global_step": 92583, "epoch": 2204} {"train_loss": -6.270120620727539, "global_step": 92584, "epoch": 2204} {"train_loss": -6.247734546661377, "global_step": 92585, "epoch": 2204} {"train_loss": -6.291985988616943, "global_step": 92586, "epoch": 2204} {"train_loss": -6.312421798706055, "global_step": 92587, "epoch": 2204} {"train_loss": -6.310500144958496, "global_step": 92588, "epoch": 2204} {"train_loss": -6.202127456665039, "global_step": 92589, "epoch": 2204} {"train_loss": -6.280407905578613, "global_step": 92590, "epoch": 2204} {"train_loss": -6.209765434265137, "global_step": 92591, "epoch": 2204} {"train_loss": -6.2435150146484375, "global_step": 92592, "epoch": 2204} {"train_loss": -6.268158912658691, "global_step": 92593, "epoch": 2204} {"train_loss": -6.275668144226074, "global_step": 92594, "epoch": 2204} {"train_loss": -6.289769172668457, "global_step": 92595, "epoch": 2204} {"train_loss": -6.32551383972168, "global_step": 92596, "epoch": 2204} {"train_loss": -6.335530757904053, "global_step": 92597, "epoch": 2204} {"train_loss": -6.232430458068848, "global_step": 92598, "epoch": 2204} {"train_loss": -6.194517135620117, "global_step": 92599, "epoch": 2204} {"train_loss": -6.338403701782227, "global_step": 92600, "epoch": 2204} {"train_loss": -6.0973334312438965, "global_step": 92601, "epoch": 2204} {"train_loss": -6.1724443435668945, "global_step": 92602, "epoch": 2204} {"train_loss": -6.211627960205078, "global_step": 92603, "epoch": 2204} {"train_loss": -6.247764587402344, "global_step": 92604, "epoch": 2204} {"train_loss": -6.193864822387695, "global_step": 92605, "epoch": 2204} {"train_loss": -6.237977027893066, "global_step": 92606, "epoch": 2204} {"train_loss": -6.187189102172852, "global_step": 92607, "epoch": 2204} {"train_loss": -6.224860191345215, "global_step": 92608, "epoch": 2204} {"train_loss": -6.263011784780593, "global_step": 92609, "epoch": 2204, "val_loss": 67996.1640625} {"train_loss": -6.204164028167725, "global_step": 92610, "epoch": 2205} {"train_loss": -6.291203498840332, "global_step": 92611, "epoch": 2205} {"train_loss": -6.378941059112549, "global_step": 92612, "epoch": 2205} {"train_loss": -6.209773540496826, "global_step": 92613, "epoch": 2205} {"train_loss": -6.341335296630859, "global_step": 92614, "epoch": 2205} {"train_loss": -6.261272430419922, "global_step": 92615, "epoch": 2205} {"train_loss": -6.326979637145996, "global_step": 92616, "epoch": 2205} {"train_loss": -6.244194030761719, "global_step": 92617, "epoch": 2205} {"train_loss": -6.066791534423828, "global_step": 92618, "epoch": 2205} {"train_loss": -6.365198135375977, "global_step": 92619, "epoch": 2205} {"train_loss": -6.279268741607666, "global_step": 92620, "epoch": 2205} {"train_loss": -6.196595668792725, "global_step": 92621, "epoch": 2205} {"train_loss": -6.202109336853027, "global_step": 92622, "epoch": 2205} {"train_loss": -6.215057373046875, "global_step": 92623, "epoch": 2205} {"train_loss": -6.284472942352295, "global_step": 92624, "epoch": 2205} {"train_loss": -6.244662284851074, "global_step": 92625, "epoch": 2205} {"train_loss": -6.387234687805176, "global_step": 92626, "epoch": 2205} {"train_loss": -6.236462593078613, "global_step": 92627, "epoch": 2205} {"train_loss": -6.188817501068115, "global_step": 92628, "epoch": 2205} {"train_loss": -6.277292251586914, "global_step": 92629, "epoch": 2205} {"train_loss": -6.286809921264648, "global_step": 92630, "epoch": 2205} {"train_loss": -6.232306957244873, "global_step": 92631, "epoch": 2205} {"train_loss": -6.164097309112549, "global_step": 92632, "epoch": 2205} {"train_loss": -6.240393161773682, "global_step": 92633, "epoch": 2205} {"train_loss": -6.1284332275390625, "global_step": 92634, "epoch": 2205} {"train_loss": -6.288012981414795, "global_step": 92635, "epoch": 2205} {"train_loss": -6.272154808044434, "global_step": 92636, "epoch": 2205} {"train_loss": -6.214409828186035, "global_step": 92637, "epoch": 2205} {"train_loss": -6.294867992401123, "global_step": 92638, "epoch": 2205} {"train_loss": -6.243583679199219, "global_step": 92639, "epoch": 2205} {"train_loss": -6.306829452514648, "global_step": 92640, "epoch": 2205} {"train_loss": -6.176833152770996, "global_step": 92641, "epoch": 2205} {"train_loss": -6.189537525177002, "global_step": 92642, "epoch": 2205} {"train_loss": -6.23176908493042, "global_step": 92643, "epoch": 2205} {"train_loss": -6.298454284667969, "global_step": 92644, "epoch": 2205} {"train_loss": -6.25478982925415, "global_step": 92645, "epoch": 2205} {"train_loss": -6.287022113800049, "global_step": 92646, "epoch": 2205} {"train_loss": -6.274123668670654, "global_step": 92647, "epoch": 2205} {"train_loss": -6.283578872680664, "global_step": 92648, "epoch": 2205} {"train_loss": -6.238661766052246, "global_step": 92649, "epoch": 2205} {"train_loss": -6.112509250640869, "global_step": 92650, "epoch": 2205} {"train_loss": -6.2484287193843295, "global_step": 92651, "epoch": 2205, "val_loss": 67779.7109375} {"train_loss": -6.286746025085449, "global_step": 92652, "epoch": 2206} {"train_loss": -6.197624206542969, "global_step": 92653, "epoch": 2206} {"train_loss": -6.245723247528076, "global_step": 92654, "epoch": 2206} {"train_loss": -6.296817779541016, "global_step": 92655, "epoch": 2206} {"train_loss": -6.2733259201049805, "global_step": 92656, "epoch": 2206} {"train_loss": -6.269691467285156, "global_step": 92657, "epoch": 2206} {"train_loss": -6.302614212036133, "global_step": 92658, "epoch": 2206} {"train_loss": -6.326706886291504, "global_step": 92659, "epoch": 2206} {"train_loss": -6.239488124847412, "global_step": 92660, "epoch": 2206} {"train_loss": -6.138424873352051, "global_step": 92661, "epoch": 2206} {"train_loss": -6.199704170227051, "global_step": 92662, "epoch": 2206} {"train_loss": -6.17824125289917, "global_step": 92663, "epoch": 2206} {"train_loss": -6.261818885803223, "global_step": 92664, "epoch": 2206} {"train_loss": -6.239113807678223, "global_step": 92665, "epoch": 2206} {"train_loss": -6.248826026916504, "global_step": 92666, "epoch": 2206} {"train_loss": -6.335087776184082, "global_step": 92667, "epoch": 2206} {"train_loss": -6.245213508605957, "global_step": 92668, "epoch": 2206} {"train_loss": -6.260152816772461, "global_step": 92669, "epoch": 2206} {"train_loss": -6.344327926635742, "global_step": 92670, "epoch": 2206} {"train_loss": -6.22916316986084, "global_step": 92671, "epoch": 2206} {"train_loss": -6.318094253540039, "global_step": 92672, "epoch": 2206} {"train_loss": -6.3166279792785645, "global_step": 92673, "epoch": 2206} {"train_loss": -6.306058883666992, "global_step": 92674, "epoch": 2206} {"train_loss": -6.329013824462891, "global_step": 92675, "epoch": 2206} {"train_loss": -6.320218086242676, "global_step": 92676, "epoch": 2206} {"train_loss": -6.3645405769348145, "global_step": 92677, "epoch": 2206} {"train_loss": -6.348416328430176, "global_step": 92678, "epoch": 2206} {"train_loss": -6.40494966506958, "global_step": 92679, "epoch": 2206} {"train_loss": -6.345781326293945, "global_step": 92680, "epoch": 2206} {"train_loss": -6.24884033203125, "global_step": 92681, "epoch": 2206} {"train_loss": -6.295586585998535, "global_step": 92682, "epoch": 2206} {"train_loss": -6.252818584442139, "global_step": 92683, "epoch": 2206} {"train_loss": -6.300912857055664, "global_step": 92684, "epoch": 2206} {"train_loss": -6.315373420715332, "global_step": 92685, "epoch": 2206} {"train_loss": -6.251036643981934, "global_step": 92686, "epoch": 2206} {"train_loss": -6.315896987915039, "global_step": 92687, "epoch": 2206} {"train_loss": -6.215229034423828, "global_step": 92688, "epoch": 2206} {"train_loss": -6.207368850708008, "global_step": 92689, "epoch": 2206} {"train_loss": -6.325950622558594, "global_step": 92690, "epoch": 2206} {"train_loss": -6.345893859863281, "global_step": 92691, "epoch": 2206} {"train_loss": -6.227424621582031, "global_step": 92692, "epoch": 2206} {"train_loss": -6.2783696083795455, "global_step": 92693, "epoch": 2206, "val_loss": 67942.5078125} {"train_loss": -6.2374186515808105, "global_step": 92694, "epoch": 2207} {"train_loss": -6.2968854904174805, "global_step": 92695, "epoch": 2207} {"train_loss": -6.264463424682617, "global_step": 92696, "epoch": 2207} {"train_loss": -6.250807762145996, "global_step": 92697, "epoch": 2207} {"train_loss": -6.356478691101074, "global_step": 92698, "epoch": 2207} {"train_loss": -6.343918323516846, "global_step": 92699, "epoch": 2207} {"train_loss": -6.358068943023682, "global_step": 92700, "epoch": 2207} {"train_loss": -6.279486656188965, "global_step": 92701, "epoch": 2207} {"train_loss": -6.4191975593566895, "global_step": 92702, "epoch": 2207} {"train_loss": -6.163671493530273, "global_step": 92703, "epoch": 2207} {"train_loss": -6.192877292633057, "global_step": 92704, "epoch": 2207} {"train_loss": -6.253320693969727, "global_step": 92705, "epoch": 2207} {"train_loss": -6.28674840927124, "global_step": 92706, "epoch": 2207} {"train_loss": -6.215855121612549, "global_step": 92707, "epoch": 2207} {"train_loss": -6.265811920166016, "global_step": 92708, "epoch": 2207} {"train_loss": -6.132320404052734, "global_step": 92709, "epoch": 2207} {"train_loss": -6.274046897888184, "global_step": 92710, "epoch": 2207} {"train_loss": -6.271940231323242, "global_step": 92711, "epoch": 2207} {"train_loss": -6.218197822570801, "global_step": 92712, "epoch": 2207} {"train_loss": -6.386638641357422, "global_step": 92713, "epoch": 2207} {"train_loss": -6.138530731201172, "global_step": 92714, "epoch": 2207} {"train_loss": -6.307473182678223, "global_step": 92715, "epoch": 2207} {"train_loss": -6.17909574508667, "global_step": 92716, "epoch": 2207} {"train_loss": -6.3319172859191895, "global_step": 92717, "epoch": 2207} {"train_loss": -6.354034423828125, "global_step": 92718, "epoch": 2207} {"train_loss": -6.173867702484131, "global_step": 92719, "epoch": 2207} {"train_loss": -6.260676383972168, "global_step": 92720, "epoch": 2207} {"train_loss": -6.151453018188477, "global_step": 92721, "epoch": 2207} {"train_loss": -6.209315299987793, "global_step": 92722, "epoch": 2207} {"train_loss": -6.161014556884766, "global_step": 92723, "epoch": 2207} {"train_loss": -6.2901506423950195, "global_step": 92724, "epoch": 2207} {"train_loss": -6.218473434448242, "global_step": 92725, "epoch": 2207} {"train_loss": -6.266841888427734, "global_step": 92726, "epoch": 2207} {"train_loss": -6.116107940673828, "global_step": 92727, "epoch": 2207} {"train_loss": -6.187247276306152, "global_step": 92728, "epoch": 2207} {"train_loss": -6.14689302444458, "global_step": 92729, "epoch": 2207} {"train_loss": -6.3155317306518555, "global_step": 92730, "epoch": 2207} {"train_loss": -6.127630710601807, "global_step": 92731, "epoch": 2207} {"train_loss": -6.305305480957031, "global_step": 92732, "epoch": 2207} {"train_loss": -6.341118812561035, "global_step": 92733, "epoch": 2207} {"train_loss": -6.279237747192383, "global_step": 92734, "epoch": 2207} {"train_loss": -6.253037940888178, "global_step": 92735, "epoch": 2207, "val_loss": 67948.421875} {"train_loss": -6.318719387054443, "global_step": 92736, "epoch": 2208} {"train_loss": -6.256084442138672, "global_step": 92737, "epoch": 2208} {"train_loss": -6.248903274536133, "global_step": 92738, "epoch": 2208} {"train_loss": -6.330939292907715, "global_step": 92739, "epoch": 2208} {"train_loss": -6.30366325378418, "global_step": 92740, "epoch": 2208} {"train_loss": -6.330014228820801, "global_step": 92741, "epoch": 2208} {"train_loss": -6.259232997894287, "global_step": 92742, "epoch": 2208} {"train_loss": -6.253483772277832, "global_step": 92743, "epoch": 2208} {"train_loss": -6.383182525634766, "global_step": 92744, "epoch": 2208} {"train_loss": -6.2408766746521, "global_step": 92745, "epoch": 2208} {"train_loss": -6.195796012878418, "global_step": 92746, "epoch": 2208} {"train_loss": -6.1430253982543945, "global_step": 92747, "epoch": 2208} {"train_loss": -6.208527565002441, "global_step": 92748, "epoch": 2208} {"train_loss": -6.184502601623535, "global_step": 92749, "epoch": 2208} {"train_loss": -6.232358455657959, "global_step": 92750, "epoch": 2208} {"train_loss": -6.358813285827637, "global_step": 92751, "epoch": 2208} {"train_loss": -6.2254180908203125, "global_step": 92752, "epoch": 2208} {"train_loss": -6.354556560516357, "global_step": 92753, "epoch": 2208} {"train_loss": -6.2060089111328125, "global_step": 92754, "epoch": 2208} {"train_loss": -6.252345561981201, "global_step": 92755, "epoch": 2208} {"train_loss": -6.296573638916016, "global_step": 92756, "epoch": 2208} {"train_loss": -6.258114814758301, "global_step": 92757, "epoch": 2208} {"train_loss": -6.1939287185668945, "global_step": 92758, "epoch": 2208} {"train_loss": -6.332249641418457, "global_step": 92759, "epoch": 2208} {"train_loss": -6.298005104064941, "global_step": 92760, "epoch": 2208} {"train_loss": -6.301816463470459, "global_step": 92761, "epoch": 2208} {"train_loss": -6.128973960876465, "global_step": 92762, "epoch": 2208} {"train_loss": -6.386126518249512, "global_step": 92763, "epoch": 2208} {"train_loss": -6.353951454162598, "global_step": 92764, "epoch": 2208} {"train_loss": -6.345561981201172, "global_step": 92765, "epoch": 2208} {"train_loss": -6.386731147766113, "global_step": 92766, "epoch": 2208} {"train_loss": -6.279029846191406, "global_step": 92767, "epoch": 2208} {"train_loss": -6.349810600280762, "global_step": 92768, "epoch": 2208} {"train_loss": -6.457995891571045, "global_step": 92769, "epoch": 2208} {"train_loss": -6.272253036499023, "global_step": 92770, "epoch": 2208} {"train_loss": -6.2916460037231445, "global_step": 92771, "epoch": 2208} {"train_loss": -6.261446952819824, "global_step": 92772, "epoch": 2208} {"train_loss": -6.252490997314453, "global_step": 92773, "epoch": 2208} {"train_loss": -6.357695579528809, "global_step": 92774, "epoch": 2208} {"train_loss": -6.339540481567383, "global_step": 92775, "epoch": 2208} {"train_loss": -6.2811455726623535, "global_step": 92776, "epoch": 2208} {"train_loss": -6.282853955314273, "global_step": 92777, "epoch": 2208, "val_loss": 67765.484375} {"train_loss": -6.32294225692749, "global_step": 92778, "epoch": 2209} {"train_loss": -6.291721820831299, "global_step": 92779, "epoch": 2209} {"train_loss": -6.338853359222412, "global_step": 92780, "epoch": 2209} {"train_loss": -6.199924945831299, "global_step": 92781, "epoch": 2209} {"train_loss": -6.285090446472168, "global_step": 92782, "epoch": 2209} {"train_loss": -6.315288543701172, "global_step": 92783, "epoch": 2209} {"train_loss": -6.216226577758789, "global_step": 92784, "epoch": 2209} {"train_loss": -6.271319389343262, "global_step": 92785, "epoch": 2209} {"train_loss": -6.148144721984863, "global_step": 92786, "epoch": 2209} {"train_loss": -6.310090065002441, "global_step": 92787, "epoch": 2209} {"train_loss": -6.157252311706543, "global_step": 92788, "epoch": 2209} {"train_loss": -6.21523380279541, "global_step": 92789, "epoch": 2209} {"train_loss": -6.262002468109131, "global_step": 92790, "epoch": 2209} {"train_loss": -6.248159408569336, "global_step": 92791, "epoch": 2209} {"train_loss": -6.325875282287598, "global_step": 92792, "epoch": 2209} {"train_loss": -6.3151140213012695, "global_step": 92793, "epoch": 2209} {"train_loss": -6.263935089111328, "global_step": 92794, "epoch": 2209} {"train_loss": -6.234519004821777, "global_step": 92795, "epoch": 2209} {"train_loss": -6.265685081481934, "global_step": 92796, "epoch": 2209} {"train_loss": -6.271688461303711, "global_step": 92797, "epoch": 2209} {"train_loss": -6.265891075134277, "global_step": 92798, "epoch": 2209} {"train_loss": -6.278759479522705, "global_step": 92799, "epoch": 2209} {"train_loss": -6.32224702835083, "global_step": 92800, "epoch": 2209} {"train_loss": -6.297303199768066, "global_step": 92801, "epoch": 2209} {"train_loss": -6.340710163116455, "global_step": 92802, "epoch": 2209} {"train_loss": -6.208240509033203, "global_step": 92803, "epoch": 2209} {"train_loss": -6.189028263092041, "global_step": 92804, "epoch": 2209} {"train_loss": -6.248022079467773, "global_step": 92805, "epoch": 2209} {"train_loss": -6.254412651062012, "global_step": 92806, "epoch": 2209} {"train_loss": -6.129781723022461, "global_step": 92807, "epoch": 2209} {"train_loss": -6.215613842010498, "global_step": 92808, "epoch": 2209} {"train_loss": -6.319289207458496, "global_step": 92809, "epoch": 2209} {"train_loss": -6.224517345428467, "global_step": 92810, "epoch": 2209} {"train_loss": -6.219988822937012, "global_step": 92811, "epoch": 2209} {"train_loss": -6.235257148742676, "global_step": 92812, "epoch": 2209} {"train_loss": -6.108131408691406, "global_step": 92813, "epoch": 2209} {"train_loss": -6.1809868812561035, "global_step": 92814, "epoch": 2209} {"train_loss": -6.172562122344971, "global_step": 92815, "epoch": 2209} {"train_loss": -6.133932590484619, "global_step": 92816, "epoch": 2209} {"train_loss": -6.139858245849609, "global_step": 92817, "epoch": 2209} {"train_loss": -6.289313793182373, "global_step": 92818, "epoch": 2209} {"train_loss": -6.242845251446679, "global_step": 92819, "epoch": 2209, "val_loss": 68006.0546875} {"train_loss": -6.266821384429932, "global_step": 92820, "epoch": 2210} {"train_loss": -6.234854221343994, "global_step": 92821, "epoch": 2210} {"train_loss": -6.112297534942627, "global_step": 92822, "epoch": 2210} {"train_loss": -6.210644721984863, "global_step": 92823, "epoch": 2210} {"train_loss": -6.21895170211792, "global_step": 92824, "epoch": 2210} {"train_loss": -6.22472620010376, "global_step": 92825, "epoch": 2210} {"train_loss": -6.2736616134643555, "global_step": 92826, "epoch": 2210} {"train_loss": -6.310491561889648, "global_step": 92827, "epoch": 2210} {"train_loss": -6.19169807434082, "global_step": 92828, "epoch": 2210} {"train_loss": -6.3299760818481445, "global_step": 92829, "epoch": 2210} {"train_loss": -6.117111682891846, "global_step": 92830, "epoch": 2210} {"train_loss": -6.202877044677734, "global_step": 92831, "epoch": 2210} {"train_loss": -6.2440505027771, "global_step": 92832, "epoch": 2210} {"train_loss": -6.135623455047607, "global_step": 92833, "epoch": 2210} {"train_loss": -6.198810577392578, "global_step": 92834, "epoch": 2210} {"train_loss": -6.160897731781006, "global_step": 92835, "epoch": 2210} {"train_loss": -6.2403693199157715, "global_step": 92836, "epoch": 2210} {"train_loss": -6.261835098266602, "global_step": 92837, "epoch": 2210} {"train_loss": -6.239871501922607, "global_step": 92838, "epoch": 2210} {"train_loss": -6.167522430419922, "global_step": 92839, "epoch": 2210} {"train_loss": -6.352270603179932, "global_step": 92840, "epoch": 2210} {"train_loss": -6.297593593597412, "global_step": 92841, "epoch": 2210} {"train_loss": -6.233040809631348, "global_step": 92842, "epoch": 2210} {"train_loss": -6.159510135650635, "global_step": 92843, "epoch": 2210} {"train_loss": -6.11500358581543, "global_step": 92844, "epoch": 2210} {"train_loss": -6.225564956665039, "global_step": 92845, "epoch": 2210} {"train_loss": -6.228067398071289, "global_step": 92846, "epoch": 2210} {"train_loss": -6.189627170562744, "global_step": 92847, "epoch": 2210} {"train_loss": -6.242934703826904, "global_step": 92848, "epoch": 2210} {"train_loss": -6.161031246185303, "global_step": 92849, "epoch": 2210} {"train_loss": -6.264309406280518, "global_step": 92850, "epoch": 2210} {"train_loss": -6.118375778198242, "global_step": 92851, "epoch": 2210} {"train_loss": -6.232093811035156, "global_step": 92852, "epoch": 2210} {"train_loss": -6.1359052658081055, "global_step": 92853, "epoch": 2210} {"train_loss": -6.1512451171875, "global_step": 92854, "epoch": 2210} {"train_loss": -6.168259620666504, "global_step": 92855, "epoch": 2210} {"train_loss": -6.2316484451293945, "global_step": 92856, "epoch": 2210} {"train_loss": -6.1910624504089355, "global_step": 92857, "epoch": 2210} {"train_loss": -6.244926452636719, "global_step": 92858, "epoch": 2210} {"train_loss": -6.165476322174072, "global_step": 92859, "epoch": 2210} {"train_loss": -6.225971221923828, "global_step": 92860, "epoch": 2210} {"train_loss": -6.214600142978487, "global_step": 92861, "epoch": 2210, "val_loss": 68037.09375} {"train_loss": -6.140881061553955, "global_step": 92862, "epoch": 2211} {"train_loss": -6.261244773864746, "global_step": 92863, "epoch": 2211} {"train_loss": -6.133742332458496, "global_step": 92864, "epoch": 2211} {"train_loss": -6.295692443847656, "global_step": 92865, "epoch": 2211} {"train_loss": -6.225313663482666, "global_step": 92866, "epoch": 2211} {"train_loss": -6.139361381530762, "global_step": 92867, "epoch": 2211} {"train_loss": -6.281184196472168, "global_step": 92868, "epoch": 2211} {"train_loss": -6.242923736572266, "global_step": 92869, "epoch": 2211} {"train_loss": -6.262709617614746, "global_step": 92870, "epoch": 2211} {"train_loss": -6.252852439880371, "global_step": 92871, "epoch": 2211} {"train_loss": -6.280703544616699, "global_step": 92872, "epoch": 2211} {"train_loss": -6.317906379699707, "global_step": 92873, "epoch": 2211} {"train_loss": -6.154776573181152, "global_step": 92874, "epoch": 2211} {"train_loss": -6.3310394287109375, "global_step": 92875, "epoch": 2211} {"train_loss": -6.2220611572265625, "global_step": 92876, "epoch": 2211} {"train_loss": -6.375711917877197, "global_step": 92877, "epoch": 2211} {"train_loss": -6.2059712409973145, "global_step": 92878, "epoch": 2211} {"train_loss": -6.293954849243164, "global_step": 92879, "epoch": 2211} {"train_loss": -6.174671173095703, "global_step": 92880, "epoch": 2211} {"train_loss": -6.257467269897461, "global_step": 92881, "epoch": 2211} {"train_loss": -6.11946964263916, "global_step": 92882, "epoch": 2211} {"train_loss": -6.0895538330078125, "global_step": 92883, "epoch": 2211} {"train_loss": -6.076875686645508, "global_step": 92884, "epoch": 2211} {"train_loss": -6.29385232925415, "global_step": 92885, "epoch": 2211} {"train_loss": -6.202960968017578, "global_step": 92886, "epoch": 2211} {"train_loss": -6.213719844818115, "global_step": 92887, "epoch": 2211} {"train_loss": -6.264956474304199, "global_step": 92888, "epoch": 2211} {"train_loss": -6.2355499267578125, "global_step": 92889, "epoch": 2211} {"train_loss": -6.283027648925781, "global_step": 92890, "epoch": 2211} {"train_loss": -6.23856258392334, "global_step": 92891, "epoch": 2211} {"train_loss": -6.292186737060547, "global_step": 92892, "epoch": 2211} {"train_loss": -6.223346710205078, "global_step": 92893, "epoch": 2211} {"train_loss": -6.117023944854736, "global_step": 92894, "epoch": 2211} {"train_loss": -6.2089433670043945, "global_step": 92895, "epoch": 2211} {"train_loss": -6.161672592163086, "global_step": 92896, "epoch": 2211} {"train_loss": -6.2663116455078125, "global_step": 92897, "epoch": 2211} {"train_loss": -6.188534736633301, "global_step": 92898, "epoch": 2211} {"train_loss": -6.22245979309082, "global_step": 92899, "epoch": 2211} {"train_loss": -6.226680755615234, "global_step": 92900, "epoch": 2211} {"train_loss": -6.296104431152344, "global_step": 92901, "epoch": 2211} {"train_loss": -6.239968299865723, "global_step": 92902, "epoch": 2211} {"train_loss": -6.227636621111915, "global_step": 92903, "epoch": 2211, "val_loss": 67694.875} {"train_loss": -6.305233955383301, "global_step": 92904, "epoch": 2212} {"train_loss": -6.247253894805908, "global_step": 92905, "epoch": 2212} {"train_loss": -6.14744758605957, "global_step": 92906, "epoch": 2212} {"train_loss": -6.278340816497803, "global_step": 92907, "epoch": 2212} {"train_loss": -6.2516279220581055, "global_step": 92908, "epoch": 2212} {"train_loss": -6.216548919677734, "global_step": 92909, "epoch": 2212} {"train_loss": -6.304141998291016, "global_step": 92910, "epoch": 2212} {"train_loss": -6.260375022888184, "global_step": 92911, "epoch": 2212} {"train_loss": -6.240512847900391, "global_step": 92912, "epoch": 2212} {"train_loss": -6.340030193328857, "global_step": 92913, "epoch": 2212} {"train_loss": -6.322989463806152, "global_step": 92914, "epoch": 2212} {"train_loss": -6.20728063583374, "global_step": 92915, "epoch": 2212} {"train_loss": -6.2719597816467285, "global_step": 92916, "epoch": 2212} {"train_loss": -6.310290336608887, "global_step": 92917, "epoch": 2212} {"train_loss": -6.156671047210693, "global_step": 92918, "epoch": 2212} {"train_loss": -6.208396911621094, "global_step": 92919, "epoch": 2212} {"train_loss": -6.182770729064941, "global_step": 92920, "epoch": 2212} {"train_loss": -6.300271987915039, "global_step": 92921, "epoch": 2212} {"train_loss": -6.166990280151367, "global_step": 92922, "epoch": 2212} {"train_loss": -6.316935062408447, "global_step": 92923, "epoch": 2212} {"train_loss": -6.26624870300293, "global_step": 92924, "epoch": 2212} {"train_loss": -6.130948543548584, "global_step": 92925, "epoch": 2212} {"train_loss": -6.322397232055664, "global_step": 92926, "epoch": 2212} {"train_loss": -6.178231716156006, "global_step": 92927, "epoch": 2212} {"train_loss": -6.265096664428711, "global_step": 92928, "epoch": 2212} {"train_loss": -6.246941566467285, "global_step": 92929, "epoch": 2212} {"train_loss": -6.283750534057617, "global_step": 92930, "epoch": 2212} {"train_loss": -6.32795524597168, "global_step": 92931, "epoch": 2212} {"train_loss": -6.257059097290039, "global_step": 92932, "epoch": 2212} {"train_loss": -6.2589569091796875, "global_step": 92933, "epoch": 2212} {"train_loss": -6.239992141723633, "global_step": 92934, "epoch": 2212} {"train_loss": -6.3659563064575195, "global_step": 92935, "epoch": 2212} {"train_loss": -6.272353172302246, "global_step": 92936, "epoch": 2212} {"train_loss": -6.362409591674805, "global_step": 92937, "epoch": 2212} {"train_loss": -6.228877544403076, "global_step": 92938, "epoch": 2212} {"train_loss": -6.3101654052734375, "global_step": 92939, "epoch": 2212} {"train_loss": -6.2748541831970215, "global_step": 92940, "epoch": 2212} {"train_loss": -6.161099433898926, "global_step": 92941, "epoch": 2212} {"train_loss": -6.288991928100586, "global_step": 92942, "epoch": 2212} {"train_loss": -6.27435827255249, "global_step": 92943, "epoch": 2212} {"train_loss": -6.3955979347229, "global_step": 92944, "epoch": 2212} {"train_loss": -6.261091868082683, "global_step": 92945, "epoch": 2212, "val_loss": 67949.46875} {"train_loss": -6.243137359619141, "global_step": 92946, "epoch": 2213} {"train_loss": -6.374587059020996, "global_step": 92947, "epoch": 2213} {"train_loss": -6.366259574890137, "global_step": 92948, "epoch": 2213} {"train_loss": -6.243341445922852, "global_step": 92949, "epoch": 2213} {"train_loss": -6.261954307556152, "global_step": 92950, "epoch": 2213} {"train_loss": -6.405825138092041, "global_step": 92951, "epoch": 2213} {"train_loss": -6.131044864654541, "global_step": 92952, "epoch": 2213} {"train_loss": -6.384070873260498, "global_step": 92953, "epoch": 2213} {"train_loss": -6.260297775268555, "global_step": 92954, "epoch": 2213} {"train_loss": -6.191080570220947, "global_step": 92955, "epoch": 2213} {"train_loss": -6.325939655303955, "global_step": 92956, "epoch": 2213} {"train_loss": -6.316943168640137, "global_step": 92957, "epoch": 2213} {"train_loss": -6.248220443725586, "global_step": 92958, "epoch": 2213} {"train_loss": -6.2546515464782715, "global_step": 92959, "epoch": 2213} {"train_loss": -6.298540115356445, "global_step": 92960, "epoch": 2213} {"train_loss": -6.227249622344971, "global_step": 92961, "epoch": 2213} {"train_loss": -6.2957072257995605, "global_step": 92962, "epoch": 2213} {"train_loss": -6.257685661315918, "global_step": 92963, "epoch": 2213} {"train_loss": -6.253572463989258, "global_step": 92964, "epoch": 2213} {"train_loss": -6.254908561706543, "global_step": 92965, "epoch": 2213} {"train_loss": -6.263397216796875, "global_step": 92966, "epoch": 2213} {"train_loss": -6.137368679046631, "global_step": 92967, "epoch": 2213} {"train_loss": -6.269387722015381, "global_step": 92968, "epoch": 2213} {"train_loss": -6.2300825119018555, "global_step": 92969, "epoch": 2213} {"train_loss": -6.220973014831543, "global_step": 92970, "epoch": 2213} {"train_loss": -6.323844909667969, "global_step": 92971, "epoch": 2213} {"train_loss": -6.325850963592529, "global_step": 92972, "epoch": 2213} {"train_loss": -6.301377296447754, "global_step": 92973, "epoch": 2213} {"train_loss": -6.440967559814453, "global_step": 92974, "epoch": 2213} {"train_loss": -6.156951904296875, "global_step": 92975, "epoch": 2213} {"train_loss": -6.273490905761719, "global_step": 92976, "epoch": 2213} {"train_loss": -6.281467914581299, "global_step": 92977, "epoch": 2213} {"train_loss": -6.1278557777404785, "global_step": 92978, "epoch": 2213} {"train_loss": -6.200307369232178, "global_step": 92979, "epoch": 2213} {"train_loss": -6.171233654022217, "global_step": 92980, "epoch": 2213} {"train_loss": -6.23156213760376, "global_step": 92981, "epoch": 2213} {"train_loss": -6.247915267944336, "global_step": 92982, "epoch": 2213} {"train_loss": -6.341639518737793, "global_step": 92983, "epoch": 2213} {"train_loss": -6.308537483215332, "global_step": 92984, "epoch": 2213} {"train_loss": -6.253237724304199, "global_step": 92985, "epoch": 2213} {"train_loss": -6.395489692687988, "global_step": 92986, "epoch": 2213} {"train_loss": -6.2720066365741545, "global_step": 92987, "epoch": 2213, "val_loss": 67833.015625} {"train_loss": -6.136569976806641, "global_step": 92988, "epoch": 2214} {"train_loss": -6.233819007873535, "global_step": 92989, "epoch": 2214} {"train_loss": -6.253264427185059, "global_step": 92990, "epoch": 2214} {"train_loss": -6.298519134521484, "global_step": 92991, "epoch": 2214} {"train_loss": -6.320815086364746, "global_step": 92992, "epoch": 2214} {"train_loss": -6.413330078125, "global_step": 92993, "epoch": 2214} {"train_loss": -6.227279186248779, "global_step": 92994, "epoch": 2214} {"train_loss": -6.376107215881348, "global_step": 92995, "epoch": 2214} {"train_loss": -6.282530784606934, "global_step": 92996, "epoch": 2214} {"train_loss": -6.15870475769043, "global_step": 92997, "epoch": 2214} {"train_loss": -6.3468217849731445, "global_step": 92998, "epoch": 2214} {"train_loss": -6.242881774902344, "global_step": 92999, "epoch": 2214} {"train_loss": -6.185471534729004, "global_step": 93000, "epoch": 2214} {"train_loss": -6.32678747177124, "global_step": 93001, "epoch": 2214} {"train_loss": -6.2185187339782715, "global_step": 93002, "epoch": 2214} {"train_loss": -6.299673080444336, "global_step": 93003, "epoch": 2214} {"train_loss": -6.182122230529785, "global_step": 93004, "epoch": 2214} {"train_loss": -6.258062362670898, "global_step": 93005, "epoch": 2214} {"train_loss": -6.3220014572143555, "global_step": 93006, "epoch": 2214} {"train_loss": -6.219729423522949, "global_step": 93007, "epoch": 2214} {"train_loss": -6.317622184753418, "global_step": 93008, "epoch": 2214} {"train_loss": -6.1578826904296875, "global_step": 93009, "epoch": 2214} {"train_loss": -6.319084167480469, "global_step": 93010, "epoch": 2214} {"train_loss": -6.225480079650879, "global_step": 93011, "epoch": 2214} {"train_loss": -6.283512115478516, "global_step": 93012, "epoch": 2214} {"train_loss": -6.187910079956055, "global_step": 93013, "epoch": 2214} {"train_loss": -6.218015193939209, "global_step": 93014, "epoch": 2214} {"train_loss": -6.269088268280029, "global_step": 93015, "epoch": 2214} {"train_loss": -6.372563362121582, "global_step": 93016, "epoch": 2214} {"train_loss": -6.277024745941162, "global_step": 93017, "epoch": 2214} {"train_loss": -6.26381254196167, "global_step": 93018, "epoch": 2214} {"train_loss": -6.254138469696045, "global_step": 93019, "epoch": 2214} {"train_loss": -6.310233116149902, "global_step": 93020, "epoch": 2214} {"train_loss": -6.288368225097656, "global_step": 93021, "epoch": 2214} {"train_loss": -6.336292743682861, "global_step": 93022, "epoch": 2214} {"train_loss": -6.139404296875, "global_step": 93023, "epoch": 2214} {"train_loss": -6.243232250213623, "global_step": 93024, "epoch": 2214} {"train_loss": -6.21230411529541, "global_step": 93025, "epoch": 2214} {"train_loss": -6.169164657592773, "global_step": 93026, "epoch": 2214} {"train_loss": -6.38386869430542, "global_step": 93027, "epoch": 2214} {"train_loss": -6.298270225524902, "global_step": 93028, "epoch": 2214} {"train_loss": -6.265825328372774, "global_step": 93029, "epoch": 2214, "val_loss": 67968.1484375} {"train_loss": -6.238360404968262, "global_step": 93030, "epoch": 2215} {"train_loss": -6.27144718170166, "global_step": 93031, "epoch": 2215} {"train_loss": -6.3412275314331055, "global_step": 93032, "epoch": 2215} {"train_loss": -6.256036281585693, "global_step": 93033, "epoch": 2215} {"train_loss": -6.28342342376709, "global_step": 93034, "epoch": 2215} {"train_loss": -6.292258262634277, "global_step": 93035, "epoch": 2215} {"train_loss": -6.260043621063232, "global_step": 93036, "epoch": 2215} {"train_loss": -6.286254405975342, "global_step": 93037, "epoch": 2215} {"train_loss": -6.204719066619873, "global_step": 93038, "epoch": 2215} {"train_loss": -6.126959323883057, "global_step": 93039, "epoch": 2215} {"train_loss": -6.2437944412231445, "global_step": 93040, "epoch": 2215} {"train_loss": -6.209367752075195, "global_step": 93041, "epoch": 2215} {"train_loss": -6.301541328430176, "global_step": 93042, "epoch": 2215} {"train_loss": -6.228631019592285, "global_step": 93043, "epoch": 2215} {"train_loss": -6.205292224884033, "global_step": 93044, "epoch": 2215} {"train_loss": -6.308767318725586, "global_step": 93045, "epoch": 2215} {"train_loss": -6.170631408691406, "global_step": 93046, "epoch": 2215} {"train_loss": -6.256637096405029, "global_step": 93047, "epoch": 2215} {"train_loss": -6.233070373535156, "global_step": 93048, "epoch": 2215} {"train_loss": -6.162381172180176, "global_step": 93049, "epoch": 2215} {"train_loss": -6.199880599975586, "global_step": 93050, "epoch": 2215} {"train_loss": -6.24677038192749, "global_step": 93051, "epoch": 2215} {"train_loss": -6.204326629638672, "global_step": 93052, "epoch": 2215} {"train_loss": -6.205375671386719, "global_step": 93053, "epoch": 2215} {"train_loss": -6.181303024291992, "global_step": 93054, "epoch": 2215} {"train_loss": -6.319661617279053, "global_step": 93055, "epoch": 2215} {"train_loss": -6.146804332733154, "global_step": 93056, "epoch": 2215} {"train_loss": -6.190184593200684, "global_step": 93057, "epoch": 2215} {"train_loss": -6.276129722595215, "global_step": 93058, "epoch": 2215} {"train_loss": -6.146414756774902, "global_step": 93059, "epoch": 2215} {"train_loss": -6.252291679382324, "global_step": 93060, "epoch": 2215} {"train_loss": -6.050508499145508, "global_step": 93061, "epoch": 2215} {"train_loss": -6.151436805725098, "global_step": 93062, "epoch": 2215} {"train_loss": -6.307761192321777, "global_step": 93063, "epoch": 2215} {"train_loss": -6.178858757019043, "global_step": 93064, "epoch": 2215} {"train_loss": -6.146608352661133, "global_step": 93065, "epoch": 2215} {"train_loss": -6.148709297180176, "global_step": 93066, "epoch": 2215} {"train_loss": -6.291287422180176, "global_step": 93067, "epoch": 2215} {"train_loss": -6.265074729919434, "global_step": 93068, "epoch": 2215} {"train_loss": -6.288211345672607, "global_step": 93069, "epoch": 2215} {"train_loss": -6.28114128112793, "global_step": 93070, "epoch": 2215} {"train_loss": -6.229078610738118, "global_step": 93071, "epoch": 2215, "val_loss": 67998.5234375} {"train_loss": -6.343387603759766, "global_step": 93072, "epoch": 2216} {"train_loss": -6.247393608093262, "global_step": 93073, "epoch": 2216} {"train_loss": -6.238251209259033, "global_step": 93074, "epoch": 2216} {"train_loss": -6.269903182983398, "global_step": 93075, "epoch": 2216} {"train_loss": -6.364952087402344, "global_step": 93076, "epoch": 2216} {"train_loss": -6.2730302810668945, "global_step": 93077, "epoch": 2216} {"train_loss": -6.292103290557861, "global_step": 93078, "epoch": 2216} {"train_loss": -6.214719772338867, "global_step": 93079, "epoch": 2216} {"train_loss": -6.224043369293213, "global_step": 93080, "epoch": 2216} {"train_loss": -6.252493858337402, "global_step": 93081, "epoch": 2216} {"train_loss": -6.347036361694336, "global_step": 93082, "epoch": 2216} {"train_loss": -6.356734275817871, "global_step": 93083, "epoch": 2216} {"train_loss": -6.33221960067749, "global_step": 93084, "epoch": 2216} {"train_loss": -6.301342964172363, "global_step": 93085, "epoch": 2216} {"train_loss": -6.351240634918213, "global_step": 93086, "epoch": 2216} {"train_loss": -6.167519569396973, "global_step": 93087, "epoch": 2216} {"train_loss": -6.408782958984375, "global_step": 93088, "epoch": 2216} {"train_loss": -6.284004211425781, "global_step": 93089, "epoch": 2216} {"train_loss": -6.419684410095215, "global_step": 93090, "epoch": 2216} {"train_loss": -6.256554126739502, "global_step": 93091, "epoch": 2216} {"train_loss": -6.251751899719238, "global_step": 93092, "epoch": 2216} {"train_loss": -6.2786865234375, "global_step": 93093, "epoch": 2216} {"train_loss": -6.3064703941345215, "global_step": 93094, "epoch": 2216} {"train_loss": -6.274899005889893, "global_step": 93095, "epoch": 2216} {"train_loss": -6.293326377868652, "global_step": 93096, "epoch": 2216} {"train_loss": -6.245244026184082, "global_step": 93097, "epoch": 2216} {"train_loss": -6.29634428024292, "global_step": 93098, "epoch": 2216} {"train_loss": -6.225175857543945, "global_step": 93099, "epoch": 2216} {"train_loss": -6.243711471557617, "global_step": 93100, "epoch": 2216} {"train_loss": -6.201671600341797, "global_step": 93101, "epoch": 2216} {"train_loss": -6.271939277648926, "global_step": 93102, "epoch": 2216} {"train_loss": -6.15329647064209, "global_step": 93103, "epoch": 2216} {"train_loss": -6.3413262367248535, "global_step": 93104, "epoch": 2216} {"train_loss": -6.251770973205566, "global_step": 93105, "epoch": 2216} {"train_loss": -6.173020839691162, "global_step": 93106, "epoch": 2216} {"train_loss": -6.31415319442749, "global_step": 93107, "epoch": 2216} {"train_loss": -6.350256443023682, "global_step": 93108, "epoch": 2216} {"train_loss": -6.322215557098389, "global_step": 93109, "epoch": 2216} {"train_loss": -6.2282867431640625, "global_step": 93110, "epoch": 2216} {"train_loss": -6.234936237335205, "global_step": 93111, "epoch": 2216} {"train_loss": -6.303382873535156, "global_step": 93112, "epoch": 2216} {"train_loss": -6.28018890108381, "global_step": 93113, "epoch": 2216, "val_loss": 67838.1328125} {"train_loss": -6.362997055053711, "global_step": 93114, "epoch": 2217} {"train_loss": -6.353065013885498, "global_step": 93115, "epoch": 2217} {"train_loss": -6.2020087242126465, "global_step": 93116, "epoch": 2217} {"train_loss": -6.234615325927734, "global_step": 93117, "epoch": 2217} {"train_loss": -6.285459995269775, "global_step": 93118, "epoch": 2217} {"train_loss": -6.3039045333862305, "global_step": 93119, "epoch": 2217} {"train_loss": -6.354780197143555, "global_step": 93120, "epoch": 2217} {"train_loss": -6.278838634490967, "global_step": 93121, "epoch": 2217} {"train_loss": -6.227535247802734, "global_step": 93122, "epoch": 2217} {"train_loss": -6.3378400802612305, "global_step": 93123, "epoch": 2217} {"train_loss": -6.2235212326049805, "global_step": 93124, "epoch": 2217} {"train_loss": -6.315857887268066, "global_step": 93125, "epoch": 2217} {"train_loss": -6.275528907775879, "global_step": 93126, "epoch": 2217} {"train_loss": -6.248045921325684, "global_step": 93127, "epoch": 2217} {"train_loss": -6.182711124420166, "global_step": 93128, "epoch": 2217} {"train_loss": -6.275655269622803, "global_step": 93129, "epoch": 2217} {"train_loss": -6.190088272094727, "global_step": 93130, "epoch": 2217} {"train_loss": -6.313291549682617, "global_step": 93131, "epoch": 2217} {"train_loss": -6.266980171203613, "global_step": 93132, "epoch": 2217} {"train_loss": -6.220658302307129, "global_step": 93133, "epoch": 2217} {"train_loss": -6.326044082641602, "global_step": 93134, "epoch": 2217} {"train_loss": -6.2580084800720215, "global_step": 93135, "epoch": 2217} {"train_loss": -6.35950231552124, "global_step": 93136, "epoch": 2217} {"train_loss": -6.288238525390625, "global_step": 93137, "epoch": 2217} {"train_loss": -6.141323089599609, "global_step": 93138, "epoch": 2217} {"train_loss": -6.242979526519775, "global_step": 93139, "epoch": 2217} {"train_loss": -6.287336826324463, "global_step": 93140, "epoch": 2217} {"train_loss": -6.239221572875977, "global_step": 93141, "epoch": 2217} {"train_loss": -6.300936222076416, "global_step": 93142, "epoch": 2217} {"train_loss": -6.204294204711914, "global_step": 93143, "epoch": 2217} {"train_loss": -6.273301601409912, "global_step": 93144, "epoch": 2217} {"train_loss": -6.277605056762695, "global_step": 93145, "epoch": 2217} {"train_loss": -6.059653282165527, "global_step": 93146, "epoch": 2217} {"train_loss": -6.318184852600098, "global_step": 93147, "epoch": 2217} {"train_loss": -6.334877014160156, "global_step": 93148, "epoch": 2217} {"train_loss": -6.32244873046875, "global_step": 93149, "epoch": 2217} {"train_loss": -6.20914363861084, "global_step": 93150, "epoch": 2217} {"train_loss": -6.197142601013184, "global_step": 93151, "epoch": 2217} {"train_loss": -6.156431198120117, "global_step": 93152, "epoch": 2217} {"train_loss": -6.264751434326172, "global_step": 93153, "epoch": 2217} {"train_loss": -6.187832355499268, "global_step": 93154, "epoch": 2217} {"train_loss": -6.2619197482154485, "global_step": 93155, "epoch": 2217, "val_loss": 67812.8125} {"train_loss": -6.389146327972412, "global_step": 93156, "epoch": 2218} {"train_loss": -6.296750068664551, "global_step": 93157, "epoch": 2218} {"train_loss": -6.247557640075684, "global_step": 93158, "epoch": 2218} {"train_loss": -6.342373847961426, "global_step": 93159, "epoch": 2218} {"train_loss": -6.270973205566406, "global_step": 93160, "epoch": 2218} {"train_loss": -6.237997055053711, "global_step": 93161, "epoch": 2218} {"train_loss": -6.313205718994141, "global_step": 93162, "epoch": 2218} {"train_loss": -6.3237714767456055, "global_step": 93163, "epoch": 2218} {"train_loss": -6.316925048828125, "global_step": 93164, "epoch": 2218} {"train_loss": -6.2145256996154785, "global_step": 93165, "epoch": 2218} {"train_loss": -6.390979766845703, "global_step": 93166, "epoch": 2218} {"train_loss": -6.256448745727539, "global_step": 93167, "epoch": 2218} {"train_loss": -6.276769161224365, "global_step": 93168, "epoch": 2218} {"train_loss": -6.313076972961426, "global_step": 93169, "epoch": 2218} {"train_loss": -6.219196796417236, "global_step": 93170, "epoch": 2218} {"train_loss": -6.310844898223877, "global_step": 93171, "epoch": 2218} {"train_loss": -6.229698181152344, "global_step": 93172, "epoch": 2218} {"train_loss": -6.343696594238281, "global_step": 93173, "epoch": 2218} {"train_loss": -6.304626941680908, "global_step": 93174, "epoch": 2218} {"train_loss": -6.411289215087891, "global_step": 93175, "epoch": 2218} {"train_loss": -6.275351524353027, "global_step": 93176, "epoch": 2218} {"train_loss": -6.2599873542785645, "global_step": 93177, "epoch": 2218} {"train_loss": -6.409310340881348, "global_step": 93178, "epoch": 2218} {"train_loss": -6.257899284362793, "global_step": 93179, "epoch": 2218} {"train_loss": -6.178946018218994, "global_step": 93180, "epoch": 2218} {"train_loss": -6.345327377319336, "global_step": 93181, "epoch": 2218} {"train_loss": -6.28403902053833, "global_step": 93182, "epoch": 2218} {"train_loss": -6.29621696472168, "global_step": 93183, "epoch": 2218} {"train_loss": -6.277009010314941, "global_step": 93184, "epoch": 2218} {"train_loss": -6.32413911819458, "global_step": 93185, "epoch": 2218} {"train_loss": -6.360418796539307, "global_step": 93186, "epoch": 2218} {"train_loss": -6.264462471008301, "global_step": 93187, "epoch": 2218} {"train_loss": -6.158852577209473, "global_step": 93188, "epoch": 2218} {"train_loss": -6.233461380004883, "global_step": 93189, "epoch": 2218} {"train_loss": -6.141036033630371, "global_step": 93190, "epoch": 2218} {"train_loss": -6.206929683685303, "global_step": 93191, "epoch": 2218} {"train_loss": -6.289193630218506, "global_step": 93192, "epoch": 2218} {"train_loss": -6.300524711608887, "global_step": 93193, "epoch": 2218} {"train_loss": -6.254697799682617, "global_step": 93194, "epoch": 2218} {"train_loss": -6.363124847412109, "global_step": 93195, "epoch": 2218} {"train_loss": -6.348282814025879, "global_step": 93196, "epoch": 2218} {"train_loss": -6.285940942310152, "global_step": 93197, "epoch": 2218, "val_loss": 67848.734375} {"train_loss": -6.321856498718262, "global_step": 93198, "epoch": 2219} {"train_loss": -6.159123420715332, "global_step": 93199, "epoch": 2219} {"train_loss": -6.155359268188477, "global_step": 93200, "epoch": 2219} {"train_loss": -6.222166061401367, "global_step": 93201, "epoch": 2219} {"train_loss": -6.1586408615112305, "global_step": 93202, "epoch": 2219} {"train_loss": -6.198982238769531, "global_step": 93203, "epoch": 2219} {"train_loss": -6.20269250869751, "global_step": 93204, "epoch": 2219} {"train_loss": -6.198563575744629, "global_step": 93205, "epoch": 2219} {"train_loss": -6.238611698150635, "global_step": 93206, "epoch": 2219} {"train_loss": -6.29741096496582, "global_step": 93207, "epoch": 2219} {"train_loss": -6.230830669403076, "global_step": 93208, "epoch": 2219} {"train_loss": -6.129942893981934, "global_step": 93209, "epoch": 2219} {"train_loss": -6.210333824157715, "global_step": 93210, "epoch": 2219} {"train_loss": -6.243321418762207, "global_step": 93211, "epoch": 2219} {"train_loss": -6.2311177253723145, "global_step": 93212, "epoch": 2219} {"train_loss": -6.236091613769531, "global_step": 93213, "epoch": 2219} {"train_loss": -6.145559310913086, "global_step": 93214, "epoch": 2219} {"train_loss": -6.231989860534668, "global_step": 93215, "epoch": 2219} {"train_loss": -6.2837300300598145, "global_step": 93216, "epoch": 2219} {"train_loss": -6.365629196166992, "global_step": 93217, "epoch": 2219} {"train_loss": -6.142197608947754, "global_step": 93218, "epoch": 2219} {"train_loss": -6.223857402801514, "global_step": 93219, "epoch": 2219} {"train_loss": -6.252575397491455, "global_step": 93220, "epoch": 2219} {"train_loss": -6.245246887207031, "global_step": 93221, "epoch": 2219} {"train_loss": -6.300189018249512, "global_step": 93222, "epoch": 2219} {"train_loss": -6.25547981262207, "global_step": 93223, "epoch": 2219} {"train_loss": -6.310657978057861, "global_step": 93224, "epoch": 2219} {"train_loss": -6.2838287353515625, "global_step": 93225, "epoch": 2219} {"train_loss": -6.28339958190918, "global_step": 93226, "epoch": 2219} {"train_loss": -6.236049652099609, "global_step": 93227, "epoch": 2219} {"train_loss": -6.267980098724365, "global_step": 93228, "epoch": 2219} {"train_loss": -6.15123176574707, "global_step": 93229, "epoch": 2219} {"train_loss": -6.211872100830078, "global_step": 93230, "epoch": 2219} {"train_loss": -6.406193733215332, "global_step": 93231, "epoch": 2219} {"train_loss": -6.2641754150390625, "global_step": 93232, "epoch": 2219} {"train_loss": -6.217641353607178, "global_step": 93233, "epoch": 2219} {"train_loss": -6.237846374511719, "global_step": 93234, "epoch": 2219} {"train_loss": -6.245404243469238, "global_step": 93235, "epoch": 2219} {"train_loss": -6.307288646697998, "global_step": 93236, "epoch": 2219} {"train_loss": -6.206902503967285, "global_step": 93237, "epoch": 2219} {"train_loss": -6.337969779968262, "global_step": 93238, "epoch": 2219} {"train_loss": -6.240535452252343, "global_step": 93239, "epoch": 2219, "val_loss": 67979.0859375} {"train_loss": -6.225707054138184, "global_step": 93240, "epoch": 2220} {"train_loss": -6.303152084350586, "global_step": 93241, "epoch": 2220} {"train_loss": -6.3297014236450195, "global_step": 93242, "epoch": 2220} {"train_loss": -6.309228420257568, "global_step": 93243, "epoch": 2220} {"train_loss": -6.239315986633301, "global_step": 93244, "epoch": 2220} {"train_loss": -6.248569011688232, "global_step": 93245, "epoch": 2220} {"train_loss": -6.238123416900635, "global_step": 93246, "epoch": 2220} {"train_loss": -6.2318243980407715, "global_step": 93247, "epoch": 2220} {"train_loss": -6.316104888916016, "global_step": 93248, "epoch": 2220} {"train_loss": -6.245174884796143, "global_step": 93249, "epoch": 2220} {"train_loss": -6.214217662811279, "global_step": 93250, "epoch": 2220} {"train_loss": -6.308689117431641, "global_step": 93251, "epoch": 2220} {"train_loss": -6.322401523590088, "global_step": 93252, "epoch": 2220} {"train_loss": -6.212729454040527, "global_step": 93253, "epoch": 2220} {"train_loss": -6.2917375564575195, "global_step": 93254, "epoch": 2220} {"train_loss": -6.212066173553467, "global_step": 93255, "epoch": 2220} {"train_loss": -6.2822723388671875, "global_step": 93256, "epoch": 2220} {"train_loss": -6.160000324249268, "global_step": 93257, "epoch": 2220} {"train_loss": -6.2766804695129395, "global_step": 93258, "epoch": 2220} {"train_loss": -6.1735148429870605, "global_step": 93259, "epoch": 2220} {"train_loss": -6.265622138977051, "global_step": 93260, "epoch": 2220} {"train_loss": -6.263839244842529, "global_step": 93261, "epoch": 2220} {"train_loss": -6.261935710906982, "global_step": 93262, "epoch": 2220} {"train_loss": -6.234244346618652, "global_step": 93263, "epoch": 2220} {"train_loss": -6.262660980224609, "global_step": 93264, "epoch": 2220} {"train_loss": -6.147913932800293, "global_step": 93265, "epoch": 2220} {"train_loss": -6.182453155517578, "global_step": 93266, "epoch": 2220} {"train_loss": -6.206075668334961, "global_step": 93267, "epoch": 2220} {"train_loss": -6.306013107299805, "global_step": 93268, "epoch": 2220} {"train_loss": -6.272343635559082, "global_step": 93269, "epoch": 2220} {"train_loss": -6.311247825622559, "global_step": 93270, "epoch": 2220} {"train_loss": -6.32320499420166, "global_step": 93271, "epoch": 2220} {"train_loss": -6.401684761047363, "global_step": 93272, "epoch": 2220} {"train_loss": -6.298015594482422, "global_step": 93273, "epoch": 2220} {"train_loss": -6.265808582305908, "global_step": 93274, "epoch": 2220} {"train_loss": -6.363142967224121, "global_step": 93275, "epoch": 2220} {"train_loss": -6.274528503417969, "global_step": 93276, "epoch": 2220} {"train_loss": -6.252202987670898, "global_step": 93277, "epoch": 2220} {"train_loss": -6.342918872833252, "global_step": 93278, "epoch": 2220} {"train_loss": -6.344160079956055, "global_step": 93279, "epoch": 2220} {"train_loss": -6.255164623260498, "global_step": 93280, "epoch": 2220} {"train_loss": -6.266620817638579, "global_step": 93281, "epoch": 2220, "val_loss": 67956.71875} {"train_loss": -6.346404075622559, "global_step": 93282, "epoch": 2221} {"train_loss": -6.176730632781982, "global_step": 93283, "epoch": 2221} {"train_loss": -6.275633811950684, "global_step": 93284, "epoch": 2221} {"train_loss": -6.283995628356934, "global_step": 93285, "epoch": 2221} {"train_loss": -6.303439617156982, "global_step": 93286, "epoch": 2221} {"train_loss": -6.414391040802002, "global_step": 93287, "epoch": 2221} {"train_loss": -6.314069747924805, "global_step": 93288, "epoch": 2221} {"train_loss": -6.179190635681152, "global_step": 93289, "epoch": 2221} {"train_loss": -6.261853218078613, "global_step": 93290, "epoch": 2221} {"train_loss": -6.347903728485107, "global_step": 93291, "epoch": 2221} {"train_loss": -6.311400413513184, "global_step": 93292, "epoch": 2221} {"train_loss": -6.355989456176758, "global_step": 93293, "epoch": 2221} {"train_loss": -6.163210868835449, "global_step": 93294, "epoch": 2221} {"train_loss": -6.221571922302246, "global_step": 93295, "epoch": 2221} {"train_loss": -6.314295768737793, "global_step": 93296, "epoch": 2221} {"train_loss": -6.346794128417969, "global_step": 93297, "epoch": 2221} {"train_loss": -6.303169250488281, "global_step": 93298, "epoch": 2221} {"train_loss": -6.2749786376953125, "global_step": 93299, "epoch": 2221} {"train_loss": -6.39133882522583, "global_step": 93300, "epoch": 2221} {"train_loss": -6.233409881591797, "global_step": 93301, "epoch": 2221} {"train_loss": -6.324501037597656, "global_step": 93302, "epoch": 2221} {"train_loss": -6.402611255645752, "global_step": 93303, "epoch": 2221} {"train_loss": -6.255855560302734, "global_step": 93304, "epoch": 2221} {"train_loss": -6.264665603637695, "global_step": 93305, "epoch": 2221} {"train_loss": -6.351374626159668, "global_step": 93306, "epoch": 2221} {"train_loss": -6.332045555114746, "global_step": 93307, "epoch": 2221} {"train_loss": -6.246341705322266, "global_step": 93308, "epoch": 2221} {"train_loss": -6.314252853393555, "global_step": 93309, "epoch": 2221} {"train_loss": -6.4006757736206055, "global_step": 93310, "epoch": 2221} {"train_loss": -6.363796710968018, "global_step": 93311, "epoch": 2221} {"train_loss": -6.289907932281494, "global_step": 93312, "epoch": 2221} {"train_loss": -6.427978515625, "global_step": 93313, "epoch": 2221} {"train_loss": -6.221451282501221, "global_step": 93314, "epoch": 2221} {"train_loss": -6.227497100830078, "global_step": 93315, "epoch": 2221} {"train_loss": -6.210099220275879, "global_step": 93316, "epoch": 2221} {"train_loss": -6.326338768005371, "global_step": 93317, "epoch": 2221} {"train_loss": -6.303836822509766, "global_step": 93318, "epoch": 2221} {"train_loss": -6.260322093963623, "global_step": 93319, "epoch": 2221} {"train_loss": -6.24509334564209, "global_step": 93320, "epoch": 2221} {"train_loss": -6.346922397613525, "global_step": 93321, "epoch": 2221} {"train_loss": -6.224813461303711, "global_step": 93322, "epoch": 2221} {"train_loss": -6.293928702672322, "global_step": 93323, "epoch": 2221, "val_loss": 67939.8984375} {"train_loss": -6.3063459396362305, "global_step": 93324, "epoch": 2222} {"train_loss": -6.303572177886963, "global_step": 93325, "epoch": 2222} {"train_loss": -6.304680347442627, "global_step": 93326, "epoch": 2222} {"train_loss": -6.2127790451049805, "global_step": 93327, "epoch": 2222} {"train_loss": -6.242015838623047, "global_step": 93328, "epoch": 2222} {"train_loss": -6.301382064819336, "global_step": 93329, "epoch": 2222} {"train_loss": -6.240377902984619, "global_step": 93330, "epoch": 2222} {"train_loss": -6.278755187988281, "global_step": 93331, "epoch": 2222} {"train_loss": -6.192104339599609, "global_step": 93332, "epoch": 2222} {"train_loss": -6.335068702697754, "global_step": 93333, "epoch": 2222} {"train_loss": -6.166451454162598, "global_step": 93334, "epoch": 2222} {"train_loss": -6.196115970611572, "global_step": 93335, "epoch": 2222} {"train_loss": -6.2915940284729, "global_step": 93336, "epoch": 2222} {"train_loss": -6.193199157714844, "global_step": 93337, "epoch": 2222} {"train_loss": -6.246549606323242, "global_step": 93338, "epoch": 2222} {"train_loss": -6.256236553192139, "global_step": 93339, "epoch": 2222} {"train_loss": -6.185848712921143, "global_step": 93340, "epoch": 2222} {"train_loss": -6.247396469116211, "global_step": 93341, "epoch": 2222} {"train_loss": -6.220180988311768, "global_step": 93342, "epoch": 2222} {"train_loss": -6.235227584838867, "global_step": 93343, "epoch": 2222} {"train_loss": -6.187570571899414, "global_step": 93344, "epoch": 2222} {"train_loss": -6.1552581787109375, "global_step": 93345, "epoch": 2222} {"train_loss": -6.271180152893066, "global_step": 93346, "epoch": 2222} {"train_loss": -6.2049713134765625, "global_step": 93347, "epoch": 2222} {"train_loss": -6.189057350158691, "global_step": 93348, "epoch": 2222} {"train_loss": -6.192386627197266, "global_step": 93349, "epoch": 2222} {"train_loss": -6.229529857635498, "global_step": 93350, "epoch": 2222} {"train_loss": -6.3057475090026855, "global_step": 93351, "epoch": 2222} {"train_loss": -6.231990814208984, "global_step": 93352, "epoch": 2222} {"train_loss": -6.397150039672852, "global_step": 93353, "epoch": 2222} {"train_loss": -6.258988857269287, "global_step": 93354, "epoch": 2222} {"train_loss": -6.179113388061523, "global_step": 93355, "epoch": 2222} {"train_loss": -6.366885662078857, "global_step": 93356, "epoch": 2222} {"train_loss": -6.252809524536133, "global_step": 93357, "epoch": 2222} {"train_loss": -6.275378227233887, "global_step": 93358, "epoch": 2222} {"train_loss": -6.302245616912842, "global_step": 93359, "epoch": 2222} {"train_loss": -6.30515718460083, "global_step": 93360, "epoch": 2222} {"train_loss": -6.300684928894043, "global_step": 93361, "epoch": 2222} {"train_loss": -6.299692153930664, "global_step": 93362, "epoch": 2222} {"train_loss": -6.333273887634277, "global_step": 93363, "epoch": 2222} {"train_loss": -6.315899848937988, "global_step": 93364, "epoch": 2222} {"train_loss": -6.256795497167678, "global_step": 93365, "epoch": 2222, "val_loss": 67847.6015625} {"train_loss": -6.268387794494629, "global_step": 93366, "epoch": 2223} {"train_loss": -6.434115886688232, "global_step": 93367, "epoch": 2223} {"train_loss": -6.233157157897949, "global_step": 93368, "epoch": 2223} {"train_loss": -6.298133373260498, "global_step": 93369, "epoch": 2223} {"train_loss": -6.169100284576416, "global_step": 93370, "epoch": 2223} {"train_loss": -6.225572109222412, "global_step": 93371, "epoch": 2223} {"train_loss": -6.303234100341797, "global_step": 93372, "epoch": 2223} {"train_loss": -6.147174835205078, "global_step": 93373, "epoch": 2223} {"train_loss": -6.321677207946777, "global_step": 93374, "epoch": 2223} {"train_loss": -6.294214248657227, "global_step": 93375, "epoch": 2223} {"train_loss": -6.2323503494262695, "global_step": 93376, "epoch": 2223} {"train_loss": -6.222113609313965, "global_step": 93377, "epoch": 2223} {"train_loss": -6.323382377624512, "global_step": 93378, "epoch": 2223} {"train_loss": -6.294516086578369, "global_step": 93379, "epoch": 2223} {"train_loss": -6.3015666007995605, "global_step": 93380, "epoch": 2223} {"train_loss": -6.335040092468262, "global_step": 93381, "epoch": 2223} {"train_loss": -6.369453430175781, "global_step": 93382, "epoch": 2223} {"train_loss": -6.411595821380615, "global_step": 93383, "epoch": 2223} {"train_loss": -6.156862258911133, "global_step": 93384, "epoch": 2223} {"train_loss": -6.318044662475586, "global_step": 93385, "epoch": 2223} {"train_loss": -6.1871747970581055, "global_step": 93386, "epoch": 2223} {"train_loss": -6.33404541015625, "global_step": 93387, "epoch": 2223} {"train_loss": -6.247034072875977, "global_step": 93388, "epoch": 2223} {"train_loss": -6.329314708709717, "global_step": 93389, "epoch": 2223} {"train_loss": -6.296910762786865, "global_step": 93390, "epoch": 2223} {"train_loss": -6.414770126342773, "global_step": 93391, "epoch": 2223} {"train_loss": -6.377307891845703, "global_step": 93392, "epoch": 2223} {"train_loss": -6.29131555557251, "global_step": 93393, "epoch": 2223} {"train_loss": -6.346273422241211, "global_step": 93394, "epoch": 2223} {"train_loss": -6.299346923828125, "global_step": 93395, "epoch": 2223} {"train_loss": -6.3221354484558105, "global_step": 93396, "epoch": 2223} {"train_loss": -6.339554786682129, "global_step": 93397, "epoch": 2223} {"train_loss": -6.158699035644531, "global_step": 93398, "epoch": 2223} {"train_loss": -6.120216369628906, "global_step": 93399, "epoch": 2223} {"train_loss": -6.27388858795166, "global_step": 93400, "epoch": 2223} {"train_loss": -6.206435203552246, "global_step": 93401, "epoch": 2223} {"train_loss": -6.2072858810424805, "global_step": 93402, "epoch": 2223} {"train_loss": -6.400796890258789, "global_step": 93403, "epoch": 2223} {"train_loss": -6.1659255027771, "global_step": 93404, "epoch": 2223} {"train_loss": -6.302385330200195, "global_step": 93405, "epoch": 2223} {"train_loss": -6.217681884765625, "global_step": 93406, "epoch": 2223} {"train_loss": -6.278301102774484, "global_step": 93407, "epoch": 2223, "val_loss": 67745.9609375} {"train_loss": -6.296965599060059, "global_step": 93408, "epoch": 2224} {"train_loss": -6.425601005554199, "global_step": 93409, "epoch": 2224} {"train_loss": -6.239779472351074, "global_step": 93410, "epoch": 2224} {"train_loss": -6.26027774810791, "global_step": 93411, "epoch": 2224} {"train_loss": -6.319280624389648, "global_step": 93412, "epoch": 2224} {"train_loss": -6.336363315582275, "global_step": 93413, "epoch": 2224} {"train_loss": -6.223638534545898, "global_step": 93414, "epoch": 2224} {"train_loss": -6.243106842041016, "global_step": 93415, "epoch": 2224} {"train_loss": -6.194993495941162, "global_step": 93416, "epoch": 2224} {"train_loss": -6.193109512329102, "global_step": 93417, "epoch": 2224} {"train_loss": -6.107473850250244, "global_step": 93418, "epoch": 2224} {"train_loss": -6.2490129470825195, "global_step": 93419, "epoch": 2224} {"train_loss": -6.258149147033691, "global_step": 93420, "epoch": 2224} {"train_loss": -6.127021312713623, "global_step": 93421, "epoch": 2224} {"train_loss": -6.378252029418945, "global_step": 93422, "epoch": 2224} {"train_loss": -6.157815933227539, "global_step": 93423, "epoch": 2224} {"train_loss": -6.386109352111816, "global_step": 93424, "epoch": 2224} {"train_loss": -6.210517883300781, "global_step": 93425, "epoch": 2224} {"train_loss": -6.199898719787598, "global_step": 93426, "epoch": 2224} {"train_loss": -6.172309875488281, "global_step": 93427, "epoch": 2224} {"train_loss": -6.196255683898926, "global_step": 93428, "epoch": 2224} {"train_loss": -6.193665981292725, "global_step": 93429, "epoch": 2224} {"train_loss": -6.236817836761475, "global_step": 93430, "epoch": 2224} {"train_loss": -6.255143165588379, "global_step": 93431, "epoch": 2224} {"train_loss": -6.222410202026367, "global_step": 93432, "epoch": 2224} {"train_loss": -6.137194633483887, "global_step": 93433, "epoch": 2224} {"train_loss": -6.288362979888916, "global_step": 93434, "epoch": 2224} {"train_loss": -6.268444061279297, "global_step": 93435, "epoch": 2224} {"train_loss": -6.193545341491699, "global_step": 93436, "epoch": 2224} {"train_loss": -6.2293620109558105, "global_step": 93437, "epoch": 2224} {"train_loss": -6.278279781341553, "global_step": 93438, "epoch": 2224} {"train_loss": -6.295648574829102, "global_step": 93439, "epoch": 2224} {"train_loss": -6.1957478523254395, "global_step": 93440, "epoch": 2224} {"train_loss": -6.338557243347168, "global_step": 93441, "epoch": 2224} {"train_loss": -6.316039085388184, "global_step": 93442, "epoch": 2224} {"train_loss": -6.161884307861328, "global_step": 93443, "epoch": 2224} {"train_loss": -6.255281448364258, "global_step": 93444, "epoch": 2224} {"train_loss": -6.297974586486816, "global_step": 93445, "epoch": 2224} {"train_loss": -6.2206573486328125, "global_step": 93446, "epoch": 2224} {"train_loss": -6.153146266937256, "global_step": 93447, "epoch": 2224} {"train_loss": -6.23062801361084, "global_step": 93448, "epoch": 2224} {"train_loss": -6.243368557521275, "global_step": 93449, "epoch": 2224, "val_loss": 67841.8125} {"train_loss": -6.234918117523193, "global_step": 93450, "epoch": 2225} {"train_loss": -6.302877426147461, "global_step": 93451, "epoch": 2225} {"train_loss": -6.218474388122559, "global_step": 93452, "epoch": 2225} {"train_loss": -6.281111240386963, "global_step": 93453, "epoch": 2225} {"train_loss": -6.335737228393555, "global_step": 93454, "epoch": 2225} {"train_loss": -6.315720081329346, "global_step": 93455, "epoch": 2225} {"train_loss": -6.246255874633789, "global_step": 93456, "epoch": 2225} {"train_loss": -6.30844783782959, "global_step": 93457, "epoch": 2225} {"train_loss": -6.3838887214660645, "global_step": 93458, "epoch": 2225} {"train_loss": -6.087958335876465, "global_step": 93459, "epoch": 2225} {"train_loss": -6.282883167266846, "global_step": 93460, "epoch": 2225} {"train_loss": -6.295907974243164, "global_step": 93461, "epoch": 2225} {"train_loss": -6.243624687194824, "global_step": 93462, "epoch": 2225} {"train_loss": -6.1925458908081055, "global_step": 93463, "epoch": 2225} {"train_loss": -6.165352821350098, "global_step": 93464, "epoch": 2225} {"train_loss": -6.251566410064697, "global_step": 93465, "epoch": 2225} {"train_loss": -6.329195976257324, "global_step": 93466, "epoch": 2225} {"train_loss": -6.2376861572265625, "global_step": 93467, "epoch": 2225} {"train_loss": -6.261446952819824, "global_step": 93468, "epoch": 2225} {"train_loss": -6.290359020233154, "global_step": 93469, "epoch": 2225} {"train_loss": -6.303399085998535, "global_step": 93470, "epoch": 2225} {"train_loss": -6.33354377746582, "global_step": 93471, "epoch": 2225} {"train_loss": -6.377285003662109, "global_step": 93472, "epoch": 2225} {"train_loss": -6.225902557373047, "global_step": 93473, "epoch": 2225} {"train_loss": -6.2245330810546875, "global_step": 93474, "epoch": 2225} {"train_loss": -6.298946380615234, "global_step": 93475, "epoch": 2225} {"train_loss": -6.294881820678711, "global_step": 93476, "epoch": 2225} {"train_loss": -6.240162372589111, "global_step": 93477, "epoch": 2225} {"train_loss": -6.305703639984131, "global_step": 93478, "epoch": 2225} {"train_loss": -6.2406005859375, "global_step": 93479, "epoch": 2225} {"train_loss": -6.177268981933594, "global_step": 93480, "epoch": 2225} {"train_loss": -6.2503743171691895, "global_step": 93481, "epoch": 2225} {"train_loss": -6.265439987182617, "global_step": 93482, "epoch": 2225} {"train_loss": -6.304173469543457, "global_step": 93483, "epoch": 2225} {"train_loss": -6.2148637771606445, "global_step": 93484, "epoch": 2225} {"train_loss": -6.271674633026123, "global_step": 93485, "epoch": 2225} {"train_loss": -6.251630783081055, "global_step": 93486, "epoch": 2225} {"train_loss": -6.359477996826172, "global_step": 93487, "epoch": 2225} {"train_loss": -6.219244956970215, "global_step": 93488, "epoch": 2225} {"train_loss": -6.220890998840332, "global_step": 93489, "epoch": 2225} {"train_loss": -6.331377983093262, "global_step": 93490, "epoch": 2225} {"train_loss": -6.267294452303932, "global_step": 93491, "epoch": 2225, "val_loss": 67711.6953125} {"train_loss": -6.19261360168457, "global_step": 93492, "epoch": 2226} {"train_loss": -6.261302947998047, "global_step": 93493, "epoch": 2226} {"train_loss": -6.287491798400879, "global_step": 93494, "epoch": 2226} {"train_loss": -6.396160125732422, "global_step": 93495, "epoch": 2226} {"train_loss": -6.173897743225098, "global_step": 93496, "epoch": 2226} {"train_loss": -6.4430718421936035, "global_step": 93497, "epoch": 2226} {"train_loss": -6.326396465301514, "global_step": 93498, "epoch": 2226} {"train_loss": -6.241910934448242, "global_step": 93499, "epoch": 2226} {"train_loss": -6.407507419586182, "global_step": 93500, "epoch": 2226} {"train_loss": -6.3550028800964355, "global_step": 93501, "epoch": 2226} {"train_loss": -6.209469795227051, "global_step": 93502, "epoch": 2226} {"train_loss": -6.3786444664001465, "global_step": 93503, "epoch": 2226} {"train_loss": -6.337834358215332, "global_step": 93504, "epoch": 2226} {"train_loss": -6.306371212005615, "global_step": 93505, "epoch": 2226} {"train_loss": -6.338499069213867, "global_step": 93506, "epoch": 2226} {"train_loss": -6.28126335144043, "global_step": 93507, "epoch": 2226} {"train_loss": -6.229905605316162, "global_step": 93508, "epoch": 2226} {"train_loss": -6.288492202758789, "global_step": 93509, "epoch": 2226} {"train_loss": -6.334345817565918, "global_step": 93510, "epoch": 2226} {"train_loss": -6.281210422515869, "global_step": 93511, "epoch": 2226} {"train_loss": -6.276639938354492, "global_step": 93512, "epoch": 2226} {"train_loss": -6.248302936553955, "global_step": 93513, "epoch": 2226} {"train_loss": -6.212803363800049, "global_step": 93514, "epoch": 2226} {"train_loss": -6.2552900314331055, "global_step": 93515, "epoch": 2226} {"train_loss": -6.325964450836182, "global_step": 93516, "epoch": 2226} {"train_loss": -6.061992168426514, "global_step": 93517, "epoch": 2226} {"train_loss": -6.240506649017334, "global_step": 93518, "epoch": 2226} {"train_loss": -6.2746357917785645, "global_step": 93519, "epoch": 2226} {"train_loss": -6.237565040588379, "global_step": 93520, "epoch": 2226} {"train_loss": -6.285706520080566, "global_step": 93521, "epoch": 2226} {"train_loss": -6.35299825668335, "global_step": 93522, "epoch": 2226} {"train_loss": -6.247054100036621, "global_step": 93523, "epoch": 2226} {"train_loss": -6.2742719650268555, "global_step": 93524, "epoch": 2226} {"train_loss": -6.159858703613281, "global_step": 93525, "epoch": 2226} {"train_loss": -6.220074653625488, "global_step": 93526, "epoch": 2226} {"train_loss": -6.237445831298828, "global_step": 93527, "epoch": 2226} {"train_loss": -6.228510856628418, "global_step": 93528, "epoch": 2226} {"train_loss": -6.171381950378418, "global_step": 93529, "epoch": 2226} {"train_loss": -6.181230068206787, "global_step": 93530, "epoch": 2226} {"train_loss": -6.359842300415039, "global_step": 93531, "epoch": 2226} {"train_loss": -6.196680068969727, "global_step": 93532, "epoch": 2226} {"train_loss": -6.270402987798055, "global_step": 93533, "epoch": 2226, "val_loss": 67926.1953125} {"train_loss": -6.210411071777344, "global_step": 93534, "epoch": 2227} {"train_loss": -6.255955219268799, "global_step": 93535, "epoch": 2227} {"train_loss": -6.210395336151123, "global_step": 93536, "epoch": 2227} {"train_loss": -6.321227073669434, "global_step": 93537, "epoch": 2227} {"train_loss": -6.28566837310791, "global_step": 93538, "epoch": 2227} {"train_loss": -6.256442070007324, "global_step": 93539, "epoch": 2227} {"train_loss": -6.293283462524414, "global_step": 93540, "epoch": 2227} {"train_loss": -6.262823104858398, "global_step": 93541, "epoch": 2227} {"train_loss": -6.226288318634033, "global_step": 93542, "epoch": 2227} {"train_loss": -6.170727729797363, "global_step": 93543, "epoch": 2227} {"train_loss": -6.235184192657471, "global_step": 93544, "epoch": 2227} {"train_loss": -6.216011047363281, "global_step": 93545, "epoch": 2227} {"train_loss": -6.281076431274414, "global_step": 93546, "epoch": 2227} {"train_loss": -6.3232951164245605, "global_step": 93547, "epoch": 2227} {"train_loss": -6.326164722442627, "global_step": 93548, "epoch": 2227} {"train_loss": -6.285105228424072, "global_step": 93549, "epoch": 2227} {"train_loss": -6.352414131164551, "global_step": 93550, "epoch": 2227} {"train_loss": -6.304633140563965, "global_step": 93551, "epoch": 2227} {"train_loss": -6.2074480056762695, "global_step": 93552, "epoch": 2227} {"train_loss": -6.258795261383057, "global_step": 93553, "epoch": 2227} {"train_loss": -6.210036277770996, "global_step": 93554, "epoch": 2227} {"train_loss": -6.124519348144531, "global_step": 93555, "epoch": 2227} {"train_loss": -6.303786277770996, "global_step": 93556, "epoch": 2227} {"train_loss": -6.275125026702881, "global_step": 93557, "epoch": 2227} {"train_loss": -6.2431840896606445, "global_step": 93558, "epoch": 2227} {"train_loss": -6.288116455078125, "global_step": 93559, "epoch": 2227} {"train_loss": -6.304076194763184, "global_step": 93560, "epoch": 2227} {"train_loss": -6.188312530517578, "global_step": 93561, "epoch": 2227} {"train_loss": -6.289879322052002, "global_step": 93562, "epoch": 2227} {"train_loss": -6.233258247375488, "global_step": 93563, "epoch": 2227} {"train_loss": -6.287773132324219, "global_step": 93564, "epoch": 2227} {"train_loss": -6.34719181060791, "global_step": 93565, "epoch": 2227} {"train_loss": -6.140870094299316, "global_step": 93566, "epoch": 2227} {"train_loss": -6.235915184020996, "global_step": 93567, "epoch": 2227} {"train_loss": -6.143287181854248, "global_step": 93568, "epoch": 2227} {"train_loss": -6.306842803955078, "global_step": 93569, "epoch": 2227} {"train_loss": -6.451193809509277, "global_step": 93570, "epoch": 2227} {"train_loss": -6.208619594573975, "global_step": 93571, "epoch": 2227} {"train_loss": -6.299098014831543, "global_step": 93572, "epoch": 2227} {"train_loss": -6.224634647369385, "global_step": 93573, "epoch": 2227} {"train_loss": -6.109550952911377, "global_step": 93574, "epoch": 2227} {"train_loss": -6.258528868357341, "global_step": 93575, "epoch": 2227, "val_loss": 67869.25} {"train_loss": -6.277887344360352, "global_step": 93576, "epoch": 2228} {"train_loss": -6.336517810821533, "global_step": 93577, "epoch": 2228} {"train_loss": -6.3069329261779785, "global_step": 93578, "epoch": 2228} {"train_loss": -6.389438629150391, "global_step": 93579, "epoch": 2228} {"train_loss": -6.274357795715332, "global_step": 93580, "epoch": 2228} {"train_loss": -6.311161994934082, "global_step": 93581, "epoch": 2228} {"train_loss": -6.3700456619262695, "global_step": 93582, "epoch": 2228} {"train_loss": -6.347158432006836, "global_step": 93583, "epoch": 2228} {"train_loss": -6.331984043121338, "global_step": 93584, "epoch": 2228} {"train_loss": -6.223105430603027, "global_step": 93585, "epoch": 2228} {"train_loss": -6.306354999542236, "global_step": 93586, "epoch": 2228} {"train_loss": -6.389292240142822, "global_step": 93587, "epoch": 2228} {"train_loss": -6.298576831817627, "global_step": 93588, "epoch": 2228} {"train_loss": -6.2816162109375, "global_step": 93589, "epoch": 2228} {"train_loss": -6.271965026855469, "global_step": 93590, "epoch": 2228} {"train_loss": -6.300388336181641, "global_step": 93591, "epoch": 2228} {"train_loss": -6.335511207580566, "global_step": 93592, "epoch": 2228} {"train_loss": -6.290439605712891, "global_step": 93593, "epoch": 2228} {"train_loss": -6.311280250549316, "global_step": 93594, "epoch": 2228} {"train_loss": -6.364119529724121, "global_step": 93595, "epoch": 2228} {"train_loss": -6.252424240112305, "global_step": 93596, "epoch": 2228} {"train_loss": -6.3505144119262695, "global_step": 93597, "epoch": 2228} {"train_loss": -6.350162506103516, "global_step": 93598, "epoch": 2228} {"train_loss": -6.2908172607421875, "global_step": 93599, "epoch": 2228} {"train_loss": -6.252974510192871, "global_step": 93600, "epoch": 2228} {"train_loss": -6.303257465362549, "global_step": 93601, "epoch": 2228} {"train_loss": -6.307967185974121, "global_step": 93602, "epoch": 2228} {"train_loss": -6.16002893447876, "global_step": 93603, "epoch": 2228} {"train_loss": -6.276398658752441, "global_step": 93604, "epoch": 2228} {"train_loss": -6.220553398132324, "global_step": 93605, "epoch": 2228} {"train_loss": -6.166187286376953, "global_step": 93606, "epoch": 2228} {"train_loss": -6.246664047241211, "global_step": 93607, "epoch": 2228} {"train_loss": -6.094050407409668, "global_step": 93608, "epoch": 2228} {"train_loss": -6.121370315551758, "global_step": 93609, "epoch": 2228} {"train_loss": -6.198142051696777, "global_step": 93610, "epoch": 2228} {"train_loss": -6.3067779541015625, "global_step": 93611, "epoch": 2228} {"train_loss": -6.245795726776123, "global_step": 93612, "epoch": 2228} {"train_loss": -6.252865791320801, "global_step": 93613, "epoch": 2228} {"train_loss": -6.23907470703125, "global_step": 93614, "epoch": 2228} {"train_loss": -6.259635925292969, "global_step": 93615, "epoch": 2228} {"train_loss": -6.179884433746338, "global_step": 93616, "epoch": 2228} {"train_loss": -6.278960375558762, "global_step": 93617, "epoch": 2228, "val_loss": 67928.40625} {"train_loss": -6.139834403991699, "global_step": 93618, "epoch": 2229} {"train_loss": -6.228598594665527, "global_step": 93619, "epoch": 2229} {"train_loss": -6.165353775024414, "global_step": 93620, "epoch": 2229} {"train_loss": -6.135217189788818, "global_step": 93621, "epoch": 2229} {"train_loss": -6.296034336090088, "global_step": 93622, "epoch": 2229} {"train_loss": -6.228743076324463, "global_step": 93623, "epoch": 2229} {"train_loss": -6.234267234802246, "global_step": 93624, "epoch": 2229} {"train_loss": -6.271073341369629, "global_step": 93625, "epoch": 2229} {"train_loss": -6.147810935974121, "global_step": 93626, "epoch": 2229} {"train_loss": -6.108839988708496, "global_step": 93627, "epoch": 2229} {"train_loss": -6.129803657531738, "global_step": 93628, "epoch": 2229} {"train_loss": -6.2708539962768555, "global_step": 93629, "epoch": 2229} {"train_loss": -6.2738542556762695, "global_step": 93630, "epoch": 2229} {"train_loss": -6.229254722595215, "global_step": 93631, "epoch": 2229} {"train_loss": -6.255690574645996, "global_step": 93632, "epoch": 2229} {"train_loss": -6.170302391052246, "global_step": 93633, "epoch": 2229} {"train_loss": -6.3338727951049805, "global_step": 93634, "epoch": 2229} {"train_loss": -6.131884574890137, "global_step": 93635, "epoch": 2229} {"train_loss": -6.215694427490234, "global_step": 93636, "epoch": 2229} {"train_loss": -6.232308387756348, "global_step": 93637, "epoch": 2229} {"train_loss": -6.266294002532959, "global_step": 93638, "epoch": 2229} {"train_loss": -6.176924228668213, "global_step": 93639, "epoch": 2229} {"train_loss": -6.077898979187012, "global_step": 93640, "epoch": 2229} {"train_loss": -6.320313453674316, "global_step": 93641, "epoch": 2229} {"train_loss": -6.219206809997559, "global_step": 93642, "epoch": 2229} {"train_loss": -6.2323126792907715, "global_step": 93643, "epoch": 2229} {"train_loss": -6.28450870513916, "global_step": 93644, "epoch": 2229} {"train_loss": -6.330021381378174, "global_step": 93645, "epoch": 2229} {"train_loss": -6.2199859619140625, "global_step": 93646, "epoch": 2229} {"train_loss": -6.236239433288574, "global_step": 93647, "epoch": 2229} {"train_loss": -6.223650932312012, "global_step": 93648, "epoch": 2229} {"train_loss": -6.350322246551514, "global_step": 93649, "epoch": 2229} {"train_loss": -6.16404390335083, "global_step": 93650, "epoch": 2229} {"train_loss": -6.354729652404785, "global_step": 93651, "epoch": 2229} {"train_loss": -6.217016696929932, "global_step": 93652, "epoch": 2229} {"train_loss": -6.352619171142578, "global_step": 93653, "epoch": 2229} {"train_loss": -6.246188163757324, "global_step": 93654, "epoch": 2229} {"train_loss": -6.148503303527832, "global_step": 93655, "epoch": 2229} {"train_loss": -6.1935319900512695, "global_step": 93656, "epoch": 2229} {"train_loss": -6.213038444519043, "global_step": 93657, "epoch": 2229} {"train_loss": -6.208503723144531, "global_step": 93658, "epoch": 2229} {"train_loss": -6.225234463101342, "global_step": 93659, "epoch": 2229, "val_loss": 68049.6015625} {"train_loss": -6.160891056060791, "global_step": 93660, "epoch": 2230} {"train_loss": -6.163556098937988, "global_step": 93661, "epoch": 2230} {"train_loss": -6.271177768707275, "global_step": 93662, "epoch": 2230} {"train_loss": -6.191877365112305, "global_step": 93663, "epoch": 2230} {"train_loss": -6.344576835632324, "global_step": 93664, "epoch": 2230} {"train_loss": -6.299259662628174, "global_step": 93665, "epoch": 2230} {"train_loss": -6.185806751251221, "global_step": 93666, "epoch": 2230} {"train_loss": -6.26310920715332, "global_step": 93667, "epoch": 2230} {"train_loss": -6.279038429260254, "global_step": 93668, "epoch": 2230} {"train_loss": -6.232544422149658, "global_step": 93669, "epoch": 2230} {"train_loss": -6.349556922912598, "global_step": 93670, "epoch": 2230} {"train_loss": -6.324723243713379, "global_step": 93671, "epoch": 2230} {"train_loss": -6.258525371551514, "global_step": 93672, "epoch": 2230} {"train_loss": -6.341805458068848, "global_step": 93673, "epoch": 2230} {"train_loss": -6.183659553527832, "global_step": 93674, "epoch": 2230} {"train_loss": -6.352288722991943, "global_step": 93675, "epoch": 2230} {"train_loss": -6.242170333862305, "global_step": 93676, "epoch": 2230} {"train_loss": -6.316252708435059, "global_step": 93677, "epoch": 2230} {"train_loss": -6.340939998626709, "global_step": 93678, "epoch": 2230} {"train_loss": -6.284463882446289, "global_step": 93679, "epoch": 2230} {"train_loss": -6.235536575317383, "global_step": 93680, "epoch": 2230} {"train_loss": -6.394230842590332, "global_step": 93681, "epoch": 2230} {"train_loss": -6.249937534332275, "global_step": 93682, "epoch": 2230} {"train_loss": -6.189054012298584, "global_step": 93683, "epoch": 2230} {"train_loss": -6.415103435516357, "global_step": 93684, "epoch": 2230} {"train_loss": -6.277369499206543, "global_step": 93685, "epoch": 2230} {"train_loss": -6.33310604095459, "global_step": 93686, "epoch": 2230} {"train_loss": -6.286841869354248, "global_step": 93687, "epoch": 2230} {"train_loss": -6.277703285217285, "global_step": 93688, "epoch": 2230} {"train_loss": -6.21958065032959, "global_step": 93689, "epoch": 2230} {"train_loss": -6.402630805969238, "global_step": 93690, "epoch": 2230} {"train_loss": -6.322011947631836, "global_step": 93691, "epoch": 2230} {"train_loss": -6.377124786376953, "global_step": 93692, "epoch": 2230} {"train_loss": -6.235009670257568, "global_step": 93693, "epoch": 2230} {"train_loss": -6.225075721740723, "global_step": 93694, "epoch": 2230} {"train_loss": -6.281011581420898, "global_step": 93695, "epoch": 2230} {"train_loss": -6.242710113525391, "global_step": 93696, "epoch": 2230} {"train_loss": -6.39902400970459, "global_step": 93697, "epoch": 2230} {"train_loss": -6.378055572509766, "global_step": 93698, "epoch": 2230} {"train_loss": -6.269326210021973, "global_step": 93699, "epoch": 2230} {"train_loss": -6.34633731842041, "global_step": 93700, "epoch": 2230} {"train_loss": -6.2869769505092075, "global_step": 93701, "epoch": 2230, "val_loss": 68006.8828125} {"train_loss": -6.332635402679443, "global_step": 93702, "epoch": 2231} {"train_loss": -6.317485332489014, "global_step": 93703, "epoch": 2231} {"train_loss": -6.342512130737305, "global_step": 93704, "epoch": 2231} {"train_loss": -6.264638900756836, "global_step": 93705, "epoch": 2231} {"train_loss": -6.14740514755249, "global_step": 93706, "epoch": 2231} {"train_loss": -6.350264549255371, "global_step": 93707, "epoch": 2231} {"train_loss": -6.222176551818848, "global_step": 93708, "epoch": 2231} {"train_loss": -6.324495792388916, "global_step": 93709, "epoch": 2231} {"train_loss": -6.188679218292236, "global_step": 93710, "epoch": 2231} {"train_loss": -6.339718341827393, "global_step": 93711, "epoch": 2231} {"train_loss": -6.353702545166016, "global_step": 93712, "epoch": 2231} {"train_loss": -6.277571678161621, "global_step": 93713, "epoch": 2231} {"train_loss": -6.315168857574463, "global_step": 93714, "epoch": 2231} {"train_loss": -6.317266464233398, "global_step": 93715, "epoch": 2231} {"train_loss": -6.409129619598389, "global_step": 93716, "epoch": 2231} {"train_loss": -6.32869291305542, "global_step": 93717, "epoch": 2231} {"train_loss": -6.26155948638916, "global_step": 93718, "epoch": 2231} {"train_loss": -6.228283882141113, "global_step": 93719, "epoch": 2231} {"train_loss": -6.278125286102295, "global_step": 93720, "epoch": 2231} {"train_loss": -6.385043621063232, "global_step": 93721, "epoch": 2231} {"train_loss": -6.2735443115234375, "global_step": 93722, "epoch": 2231} {"train_loss": -6.246906757354736, "global_step": 93723, "epoch": 2231} {"train_loss": -6.197812080383301, "global_step": 93724, "epoch": 2231} {"train_loss": -6.293814659118652, "global_step": 93725, "epoch": 2231} {"train_loss": -6.2566986083984375, "global_step": 93726, "epoch": 2231} {"train_loss": -6.244472503662109, "global_step": 93727, "epoch": 2231} {"train_loss": -6.225668907165527, "global_step": 93728, "epoch": 2231} {"train_loss": -6.2162909507751465, "global_step": 93729, "epoch": 2231} {"train_loss": -6.348689079284668, "global_step": 93730, "epoch": 2231} {"train_loss": -6.176753997802734, "global_step": 93731, "epoch": 2231} {"train_loss": -6.252529144287109, "global_step": 93732, "epoch": 2231} {"train_loss": -6.3352837562561035, "global_step": 93733, "epoch": 2231} {"train_loss": -6.286271095275879, "global_step": 93734, "epoch": 2231} {"train_loss": -6.185375213623047, "global_step": 93735, "epoch": 2231} {"train_loss": -6.097415447235107, "global_step": 93736, "epoch": 2231} {"train_loss": -6.175508975982666, "global_step": 93737, "epoch": 2231} {"train_loss": -6.156004905700684, "global_step": 93738, "epoch": 2231} {"train_loss": -6.182761192321777, "global_step": 93739, "epoch": 2231} {"train_loss": -6.171509265899658, "global_step": 93740, "epoch": 2231} {"train_loss": -6.031227111816406, "global_step": 93741, "epoch": 2231} {"train_loss": -6.32578182220459, "global_step": 93742, "epoch": 2231} {"train_loss": -6.253554094405401, "global_step": 93743, "epoch": 2231, "val_loss": 67986.546875} {"train_loss": -6.262538433074951, "global_step": 93744, "epoch": 2232} {"train_loss": -6.19638204574585, "global_step": 93745, "epoch": 2232} {"train_loss": -6.180952072143555, "global_step": 93746, "epoch": 2232} {"train_loss": -6.168118476867676, "global_step": 93747, "epoch": 2232} {"train_loss": -6.176821708679199, "global_step": 93748, "epoch": 2232} {"train_loss": -6.075671195983887, "global_step": 93749, "epoch": 2232} {"train_loss": -6.191128730773926, "global_step": 93750, "epoch": 2232} {"train_loss": -6.1019511222839355, "global_step": 93751, "epoch": 2232} {"train_loss": -6.291265487670898, "global_step": 93752, "epoch": 2232} {"train_loss": -6.051767349243164, "global_step": 93753, "epoch": 2232} {"train_loss": -6.18641996383667, "global_step": 93754, "epoch": 2232} {"train_loss": -6.271642208099365, "global_step": 93755, "epoch": 2232} {"train_loss": -6.260123252868652, "global_step": 93756, "epoch": 2232} {"train_loss": -6.245419502258301, "global_step": 93757, "epoch": 2232} {"train_loss": -6.273615837097168, "global_step": 93758, "epoch": 2232} {"train_loss": -6.142887115478516, "global_step": 93759, "epoch": 2232} {"train_loss": -6.244344711303711, "global_step": 93760, "epoch": 2232} {"train_loss": -6.2902703285217285, "global_step": 93761, "epoch": 2232} {"train_loss": -6.156386375427246, "global_step": 93762, "epoch": 2232} {"train_loss": -6.213942527770996, "global_step": 93763, "epoch": 2232} {"train_loss": -6.138577938079834, "global_step": 93764, "epoch": 2232} {"train_loss": -6.226229667663574, "global_step": 93765, "epoch": 2232} {"train_loss": -6.223590850830078, "global_step": 93766, "epoch": 2232} {"train_loss": -6.123680114746094, "global_step": 93767, "epoch": 2232} {"train_loss": -6.271886348724365, "global_step": 93768, "epoch": 2232} {"train_loss": -6.284659385681152, "global_step": 93769, "epoch": 2232} {"train_loss": -6.33119010925293, "global_step": 93770, "epoch": 2232} {"train_loss": -6.160464286804199, "global_step": 93771, "epoch": 2232} {"train_loss": -6.196653366088867, "global_step": 93772, "epoch": 2232} {"train_loss": -6.225131511688232, "global_step": 93773, "epoch": 2232} {"train_loss": -6.331253528594971, "global_step": 93774, "epoch": 2232} {"train_loss": -6.378022193908691, "global_step": 93775, "epoch": 2232} {"train_loss": -6.287152290344238, "global_step": 93776, "epoch": 2232} {"train_loss": -6.286664962768555, "global_step": 93777, "epoch": 2232} {"train_loss": -6.360232830047607, "global_step": 93778, "epoch": 2232} {"train_loss": -6.358851432800293, "global_step": 93779, "epoch": 2232} {"train_loss": -6.282864570617676, "global_step": 93780, "epoch": 2232} {"train_loss": -6.340805530548096, "global_step": 93781, "epoch": 2232} {"train_loss": -6.431370735168457, "global_step": 93782, "epoch": 2232} {"train_loss": -6.265962600708008, "global_step": 93783, "epoch": 2232} {"train_loss": -6.275881767272949, "global_step": 93784, "epoch": 2232} {"train_loss": -6.236387763704572, "global_step": 93785, "epoch": 2232, "val_loss": 67824.375} {"train_loss": -6.44641637802124, "global_step": 93786, "epoch": 2233} {"train_loss": -6.29482364654541, "global_step": 93787, "epoch": 2233} {"train_loss": -6.2309465408325195, "global_step": 93788, "epoch": 2233} {"train_loss": -6.278916358947754, "global_step": 93789, "epoch": 2233} {"train_loss": -6.2742204666137695, "global_step": 93790, "epoch": 2233} {"train_loss": -6.311770915985107, "global_step": 93791, "epoch": 2233} {"train_loss": -6.330632209777832, "global_step": 93792, "epoch": 2233} {"train_loss": -6.339105606079102, "global_step": 93793, "epoch": 2233} {"train_loss": -6.3974289894104, "global_step": 93794, "epoch": 2233} {"train_loss": -6.319908142089844, "global_step": 93795, "epoch": 2233} {"train_loss": -6.279880523681641, "global_step": 93796, "epoch": 2233} {"train_loss": -6.276841640472412, "global_step": 93797, "epoch": 2233} {"train_loss": -6.202171325683594, "global_step": 93798, "epoch": 2233} {"train_loss": -6.270768642425537, "global_step": 93799, "epoch": 2233} {"train_loss": -6.458502769470215, "global_step": 93800, "epoch": 2233} {"train_loss": -6.322947025299072, "global_step": 93801, "epoch": 2233} {"train_loss": -6.277157783508301, "global_step": 93802, "epoch": 2233} {"train_loss": -6.311999320983887, "global_step": 93803, "epoch": 2233} {"train_loss": -6.229105472564697, "global_step": 93804, "epoch": 2233} {"train_loss": -6.368046760559082, "global_step": 93805, "epoch": 2233} {"train_loss": -6.259686470031738, "global_step": 93806, "epoch": 2233} {"train_loss": -6.2715301513671875, "global_step": 93807, "epoch": 2233} {"train_loss": -6.326598167419434, "global_step": 93808, "epoch": 2233} {"train_loss": -6.283095359802246, "global_step": 93809, "epoch": 2233} {"train_loss": -6.380781173706055, "global_step": 93810, "epoch": 2233} {"train_loss": -6.337942123413086, "global_step": 93811, "epoch": 2233} {"train_loss": -6.347731113433838, "global_step": 93812, "epoch": 2233} {"train_loss": -6.251365661621094, "global_step": 93813, "epoch": 2233} {"train_loss": -6.380646705627441, "global_step": 93814, "epoch": 2233} {"train_loss": -6.413643836975098, "global_step": 93815, "epoch": 2233} {"train_loss": -6.297762870788574, "global_step": 93816, "epoch": 2233} {"train_loss": -6.287396430969238, "global_step": 93817, "epoch": 2233} {"train_loss": -6.1863298416137695, "global_step": 93818, "epoch": 2233} {"train_loss": -6.223146915435791, "global_step": 93819, "epoch": 2233} {"train_loss": -6.251323699951172, "global_step": 93820, "epoch": 2233} {"train_loss": -6.365337371826172, "global_step": 93821, "epoch": 2233} {"train_loss": -6.37911319732666, "global_step": 93822, "epoch": 2233} {"train_loss": -6.3284406661987305, "global_step": 93823, "epoch": 2233} {"train_loss": -6.295678615570068, "global_step": 93824, "epoch": 2233} {"train_loss": -6.215878963470459, "global_step": 93825, "epoch": 2233} {"train_loss": -6.227693557739258, "global_step": 93826, "epoch": 2233} {"train_loss": -6.304773012797038, "global_step": 93827, "epoch": 2233, "val_loss": 67772.1171875} {"train_loss": -6.475053310394287, "global_step": 93828, "epoch": 2234} {"train_loss": -6.381561279296875, "global_step": 93829, "epoch": 2234} {"train_loss": -6.292819976806641, "global_step": 93830, "epoch": 2234} {"train_loss": -6.3303327560424805, "global_step": 93831, "epoch": 2234} {"train_loss": -6.2375898361206055, "global_step": 93832, "epoch": 2234} {"train_loss": -6.228709697723389, "global_step": 93833, "epoch": 2234} {"train_loss": -6.160121440887451, "global_step": 93834, "epoch": 2234} {"train_loss": -6.124608039855957, "global_step": 93835, "epoch": 2234} {"train_loss": -6.181289196014404, "global_step": 93836, "epoch": 2234} {"train_loss": -6.230546951293945, "global_step": 93837, "epoch": 2234} {"train_loss": -6.231827259063721, "global_step": 93838, "epoch": 2234} {"train_loss": -6.171562194824219, "global_step": 93839, "epoch": 2234} {"train_loss": -6.2534990310668945, "global_step": 93840, "epoch": 2234} {"train_loss": -6.2354631423950195, "global_step": 93841, "epoch": 2234} {"train_loss": -6.265453338623047, "global_step": 93842, "epoch": 2234} {"train_loss": -6.302824974060059, "global_step": 93843, "epoch": 2234} {"train_loss": -6.237585067749023, "global_step": 93844, "epoch": 2234} {"train_loss": -6.351927757263184, "global_step": 93845, "epoch": 2234} {"train_loss": -6.252019882202148, "global_step": 93846, "epoch": 2234} {"train_loss": -6.275486946105957, "global_step": 93847, "epoch": 2234} {"train_loss": -6.263721466064453, "global_step": 93848, "epoch": 2234} {"train_loss": -6.368720054626465, "global_step": 93849, "epoch": 2234} {"train_loss": -6.256490707397461, "global_step": 93850, "epoch": 2234} {"train_loss": -6.291604042053223, "global_step": 93851, "epoch": 2234} {"train_loss": -6.185011863708496, "global_step": 93852, "epoch": 2234} {"train_loss": -6.069392681121826, "global_step": 93853, "epoch": 2234} {"train_loss": -6.135152816772461, "global_step": 93854, "epoch": 2234} {"train_loss": -6.270956039428711, "global_step": 93855, "epoch": 2234} {"train_loss": -6.313610553741455, "global_step": 93856, "epoch": 2234} {"train_loss": -6.281068325042725, "global_step": 93857, "epoch": 2234} {"train_loss": -6.217063903808594, "global_step": 93858, "epoch": 2234} {"train_loss": -6.176944732666016, "global_step": 93859, "epoch": 2234} {"train_loss": -6.305685043334961, "global_step": 93860, "epoch": 2234} {"train_loss": -6.261979579925537, "global_step": 93861, "epoch": 2234} {"train_loss": -6.247984886169434, "global_step": 93862, "epoch": 2234} {"train_loss": -6.369841575622559, "global_step": 93863, "epoch": 2234} {"train_loss": -6.213648796081543, "global_step": 93864, "epoch": 2234} {"train_loss": -6.2869486808776855, "global_step": 93865, "epoch": 2234} {"train_loss": -6.275397777557373, "global_step": 93866, "epoch": 2234} {"train_loss": -6.394037246704102, "global_step": 93867, "epoch": 2234} {"train_loss": -6.286494731903076, "global_step": 93868, "epoch": 2234} {"train_loss": -6.259167092187064, "global_step": 93869, "epoch": 2234, "val_loss": 68027.6015625} {"train_loss": -6.23995304107666, "global_step": 93870, "epoch": 2235} {"train_loss": -6.291255474090576, "global_step": 93871, "epoch": 2235} {"train_loss": -6.291159629821777, "global_step": 93872, "epoch": 2235} {"train_loss": -6.392200469970703, "global_step": 93873, "epoch": 2235} {"train_loss": -6.272055149078369, "global_step": 93874, "epoch": 2235} {"train_loss": -6.2679572105407715, "global_step": 93875, "epoch": 2235} {"train_loss": -6.259368419647217, "global_step": 93876, "epoch": 2235} {"train_loss": -6.281282901763916, "global_step": 93877, "epoch": 2235} {"train_loss": -6.1847381591796875, "global_step": 93878, "epoch": 2235} {"train_loss": -6.349405288696289, "global_step": 93879, "epoch": 2235} {"train_loss": -6.341472148895264, "global_step": 93880, "epoch": 2235} {"train_loss": -6.292856693267822, "global_step": 93881, "epoch": 2235} {"train_loss": -6.292423248291016, "global_step": 93882, "epoch": 2235} {"train_loss": -6.274683952331543, "global_step": 93883, "epoch": 2235} {"train_loss": -6.318872451782227, "global_step": 93884, "epoch": 2235} {"train_loss": -6.290825843811035, "global_step": 93885, "epoch": 2235} {"train_loss": -6.30463981628418, "global_step": 93886, "epoch": 2235} {"train_loss": -6.3817138671875, "global_step": 93887, "epoch": 2235} {"train_loss": -6.255702018737793, "global_step": 93888, "epoch": 2235} {"train_loss": -6.271478176116943, "global_step": 93889, "epoch": 2235} {"train_loss": -6.127738952636719, "global_step": 93890, "epoch": 2235} {"train_loss": -6.289656639099121, "global_step": 93891, "epoch": 2235} {"train_loss": -6.137914657592773, "global_step": 93892, "epoch": 2235} {"train_loss": -6.1034040451049805, "global_step": 93893, "epoch": 2235} {"train_loss": -6.112089157104492, "global_step": 93894, "epoch": 2235} {"train_loss": -6.212838172912598, "global_step": 93895, "epoch": 2235} {"train_loss": -6.1727986335754395, "global_step": 93896, "epoch": 2235} {"train_loss": -6.325825214385986, "global_step": 93897, "epoch": 2235} {"train_loss": -6.285942077636719, "global_step": 93898, "epoch": 2235} {"train_loss": -6.267441749572754, "global_step": 93899, "epoch": 2235} {"train_loss": -6.283069133758545, "global_step": 93900, "epoch": 2235} {"train_loss": -6.293877601623535, "global_step": 93901, "epoch": 2235} {"train_loss": -6.314560890197754, "global_step": 93902, "epoch": 2235} {"train_loss": -6.122103214263916, "global_step": 93903, "epoch": 2235} {"train_loss": -6.182483196258545, "global_step": 93904, "epoch": 2235} {"train_loss": -6.2786784172058105, "global_step": 93905, "epoch": 2235} {"train_loss": -6.177457809448242, "global_step": 93906, "epoch": 2235} {"train_loss": -6.299492835998535, "global_step": 93907, "epoch": 2235} {"train_loss": -6.234048843383789, "global_step": 93908, "epoch": 2235} {"train_loss": -6.242814064025879, "global_step": 93909, "epoch": 2235} {"train_loss": -6.292150497436523, "global_step": 93910, "epoch": 2235} {"train_loss": -6.25764723051162, "global_step": 93911, "epoch": 2235, "val_loss": 67856.1015625} {"train_loss": -6.222540855407715, "global_step": 93912, "epoch": 2236} {"train_loss": -6.324776649475098, "global_step": 93913, "epoch": 2236} {"train_loss": -6.352387428283691, "global_step": 93914, "epoch": 2236} {"train_loss": -6.3099799156188965, "global_step": 93915, "epoch": 2236} {"train_loss": -6.306844711303711, "global_step": 93916, "epoch": 2236} {"train_loss": -6.300271034240723, "global_step": 93917, "epoch": 2236} {"train_loss": -6.372119426727295, "global_step": 93918, "epoch": 2236} {"train_loss": -6.300080299377441, "global_step": 93919, "epoch": 2236} {"train_loss": -6.185795783996582, "global_step": 93920, "epoch": 2236} {"train_loss": -6.276240348815918, "global_step": 93921, "epoch": 2236} {"train_loss": -6.26998233795166, "global_step": 93922, "epoch": 2236} {"train_loss": -6.252318382263184, "global_step": 93923, "epoch": 2236} {"train_loss": -6.403254508972168, "global_step": 93924, "epoch": 2236} {"train_loss": -6.420976161956787, "global_step": 93925, "epoch": 2236} {"train_loss": -6.230733394622803, "global_step": 93926, "epoch": 2236} {"train_loss": -6.247966289520264, "global_step": 93927, "epoch": 2236} {"train_loss": -6.313077449798584, "global_step": 93928, "epoch": 2236} {"train_loss": -6.288893222808838, "global_step": 93929, "epoch": 2236} {"train_loss": -6.122403621673584, "global_step": 93930, "epoch": 2236} {"train_loss": -6.317415237426758, "global_step": 93931, "epoch": 2236} {"train_loss": -6.227224349975586, "global_step": 93932, "epoch": 2236} {"train_loss": -6.31821870803833, "global_step": 93933, "epoch": 2236} {"train_loss": -6.284937858581543, "global_step": 93934, "epoch": 2236} {"train_loss": -6.2937421798706055, "global_step": 93935, "epoch": 2236} {"train_loss": -6.321393966674805, "global_step": 93936, "epoch": 2236} {"train_loss": -6.378250598907471, "global_step": 93937, "epoch": 2236} {"train_loss": -6.160844802856445, "global_step": 93938, "epoch": 2236} {"train_loss": -6.348570346832275, "global_step": 93939, "epoch": 2236} {"train_loss": -6.15119743347168, "global_step": 93940, "epoch": 2236} {"train_loss": -6.175209045410156, "global_step": 93941, "epoch": 2236} {"train_loss": -6.194365501403809, "global_step": 93942, "epoch": 2236} {"train_loss": -6.25080680847168, "global_step": 93943, "epoch": 2236} {"train_loss": -6.341568470001221, "global_step": 93944, "epoch": 2236} {"train_loss": -6.289111614227295, "global_step": 93945, "epoch": 2236} {"train_loss": -6.281569480895996, "global_step": 93946, "epoch": 2236} {"train_loss": -6.4455413818359375, "global_step": 93947, "epoch": 2236} {"train_loss": -6.227246284484863, "global_step": 93948, "epoch": 2236} {"train_loss": -6.280099391937256, "global_step": 93949, "epoch": 2236} {"train_loss": -6.23692512512207, "global_step": 93950, "epoch": 2236} {"train_loss": -6.3233642578125, "global_step": 93951, "epoch": 2236} {"train_loss": -6.190464019775391, "global_step": 93952, "epoch": 2236} {"train_loss": -6.286607027053833, "global_step": 93953, "epoch": 2236, "val_loss": 67761.8671875} {"train_loss": -6.4371232986450195, "global_step": 93954, "epoch": 2237} {"train_loss": -6.253190040588379, "global_step": 93955, "epoch": 2237} {"train_loss": -6.293497085571289, "global_step": 93956, "epoch": 2237} {"train_loss": -6.1928863525390625, "global_step": 93957, "epoch": 2237} {"train_loss": -6.322449684143066, "global_step": 93958, "epoch": 2237} {"train_loss": -6.234556198120117, "global_step": 93959, "epoch": 2237} {"train_loss": -6.30928373336792, "global_step": 93960, "epoch": 2237} {"train_loss": -6.343092441558838, "global_step": 93961, "epoch": 2237} {"train_loss": -6.31040096282959, "global_step": 93962, "epoch": 2237} {"train_loss": -6.30545711517334, "global_step": 93963, "epoch": 2237} {"train_loss": -6.263759613037109, "global_step": 93964, "epoch": 2237} {"train_loss": -6.2988996505737305, "global_step": 93965, "epoch": 2237} {"train_loss": -6.243832588195801, "global_step": 93966, "epoch": 2237} {"train_loss": -6.369913578033447, "global_step": 93967, "epoch": 2237} {"train_loss": -6.187870979309082, "global_step": 93968, "epoch": 2237} {"train_loss": -6.177822589874268, "global_step": 93969, "epoch": 2237} {"train_loss": -6.274847030639648, "global_step": 93970, "epoch": 2237} {"train_loss": -6.175500869750977, "global_step": 93971, "epoch": 2237} {"train_loss": -6.213014125823975, "global_step": 93972, "epoch": 2237} {"train_loss": -6.135372161865234, "global_step": 93973, "epoch": 2237} {"train_loss": -6.01252555847168, "global_step": 93974, "epoch": 2237} {"train_loss": -6.281402111053467, "global_step": 93975, "epoch": 2237} {"train_loss": -6.239285469055176, "global_step": 93976, "epoch": 2237} {"train_loss": -6.26754093170166, "global_step": 93977, "epoch": 2237} {"train_loss": -6.14130973815918, "global_step": 93978, "epoch": 2237} {"train_loss": -6.299646854400635, "global_step": 93979, "epoch": 2237} {"train_loss": -6.171079158782959, "global_step": 93980, "epoch": 2237} {"train_loss": -6.265132904052734, "global_step": 93981, "epoch": 2237} {"train_loss": -6.17202615737915, "global_step": 93982, "epoch": 2237} {"train_loss": -6.406679153442383, "global_step": 93983, "epoch": 2237} {"train_loss": -6.337450981140137, "global_step": 93984, "epoch": 2237} {"train_loss": -6.159423828125, "global_step": 93985, "epoch": 2237} {"train_loss": -6.342318534851074, "global_step": 93986, "epoch": 2237} {"train_loss": -6.203878879547119, "global_step": 93987, "epoch": 2237} {"train_loss": -6.18710994720459, "global_step": 93988, "epoch": 2237} {"train_loss": -6.235562324523926, "global_step": 93989, "epoch": 2237} {"train_loss": -6.254794597625732, "global_step": 93990, "epoch": 2237} {"train_loss": -6.370928764343262, "global_step": 93991, "epoch": 2237} {"train_loss": -6.292682647705078, "global_step": 93992, "epoch": 2237} {"train_loss": -6.205674171447754, "global_step": 93993, "epoch": 2237} {"train_loss": -6.395174026489258, "global_step": 93994, "epoch": 2237} {"train_loss": -6.2589301495325, "global_step": 93995, "epoch": 2237, "val_loss": 67757.5625} {"train_loss": -6.263425350189209, "global_step": 93996, "epoch": 2238} {"train_loss": -6.250284194946289, "global_step": 93997, "epoch": 2238} {"train_loss": -6.282390594482422, "global_step": 93998, "epoch": 2238} {"train_loss": -6.275620937347412, "global_step": 93999, "epoch": 2238} {"train_loss": -6.339509010314941, "global_step": 94000, "epoch": 2238} {"train_loss": -6.323213577270508, "global_step": 94001, "epoch": 2238} {"train_loss": -6.328666687011719, "global_step": 94002, "epoch": 2238} {"train_loss": -6.249025344848633, "global_step": 94003, "epoch": 2238} {"train_loss": -6.254351615905762, "global_step": 94004, "epoch": 2238} {"train_loss": -6.290848255157471, "global_step": 94005, "epoch": 2238} {"train_loss": -6.174727439880371, "global_step": 94006, "epoch": 2238} {"train_loss": -6.332780838012695, "global_step": 94007, "epoch": 2238} {"train_loss": -6.11827278137207, "global_step": 94008, "epoch": 2238} {"train_loss": -6.232356071472168, "global_step": 94009, "epoch": 2238} {"train_loss": -6.2699480056762695, "global_step": 94010, "epoch": 2238} {"train_loss": -6.21794319152832, "global_step": 94011, "epoch": 2238} {"train_loss": -6.185051918029785, "global_step": 94012, "epoch": 2238} {"train_loss": -6.152035713195801, "global_step": 94013, "epoch": 2238} {"train_loss": -6.2378339767456055, "global_step": 94014, "epoch": 2238} {"train_loss": -6.284558296203613, "global_step": 94015, "epoch": 2238} {"train_loss": -6.2272210121154785, "global_step": 94016, "epoch": 2238} {"train_loss": -6.095592498779297, "global_step": 94017, "epoch": 2238} {"train_loss": -6.099254608154297, "global_step": 94018, "epoch": 2238} {"train_loss": -6.218457221984863, "global_step": 94019, "epoch": 2238} {"train_loss": -6.196728706359863, "global_step": 94020, "epoch": 2238} {"train_loss": -6.235084056854248, "global_step": 94021, "epoch": 2238} {"train_loss": -6.275601387023926, "global_step": 94022, "epoch": 2238} {"train_loss": -6.175246238708496, "global_step": 94023, "epoch": 2238} {"train_loss": -6.276333808898926, "global_step": 94024, "epoch": 2238} {"train_loss": -6.237175941467285, "global_step": 94025, "epoch": 2238} {"train_loss": -6.218310356140137, "global_step": 94026, "epoch": 2238} {"train_loss": -6.096928596496582, "global_step": 94027, "epoch": 2238} {"train_loss": -6.241930961608887, "global_step": 94028, "epoch": 2238} {"train_loss": -6.297972679138184, "global_step": 94029, "epoch": 2238} {"train_loss": -6.200958251953125, "global_step": 94030, "epoch": 2238} {"train_loss": -6.38568115234375, "global_step": 94031, "epoch": 2238} {"train_loss": -6.188187122344971, "global_step": 94032, "epoch": 2238} {"train_loss": -6.326937675476074, "global_step": 94033, "epoch": 2238} {"train_loss": -6.2811737060546875, "global_step": 94034, "epoch": 2238} {"train_loss": -6.253929138183594, "global_step": 94035, "epoch": 2238} {"train_loss": -6.276739120483398, "global_step": 94036, "epoch": 2238} {"train_loss": -6.241812274569557, "global_step": 94037, "epoch": 2238, "val_loss": 67983.15625} {"train_loss": -6.309745788574219, "global_step": 94038, "epoch": 2239} {"train_loss": -6.362931728363037, "global_step": 94039, "epoch": 2239} {"train_loss": -6.431839466094971, "global_step": 94040, "epoch": 2239} {"train_loss": -6.325355529785156, "global_step": 94041, "epoch": 2239} {"train_loss": -6.250103950500488, "global_step": 94042, "epoch": 2239} {"train_loss": -6.308720588684082, "global_step": 94043, "epoch": 2239} {"train_loss": -6.415609359741211, "global_step": 94044, "epoch": 2239} {"train_loss": -6.414876937866211, "global_step": 94045, "epoch": 2239} {"train_loss": -6.211389064788818, "global_step": 94046, "epoch": 2239} {"train_loss": -6.312117576599121, "global_step": 94047, "epoch": 2239} {"train_loss": -6.3106489181518555, "global_step": 94048, "epoch": 2239} {"train_loss": -6.225825309753418, "global_step": 94049, "epoch": 2239} {"train_loss": -6.220436096191406, "global_step": 94050, "epoch": 2239} {"train_loss": -6.192253112792969, "global_step": 94051, "epoch": 2239} {"train_loss": -6.059208869934082, "global_step": 94052, "epoch": 2239} {"train_loss": -6.303285598754883, "global_step": 94053, "epoch": 2239} {"train_loss": -6.2736663818359375, "global_step": 94054, "epoch": 2239} {"train_loss": -6.215662479400635, "global_step": 94055, "epoch": 2239} {"train_loss": -6.337754249572754, "global_step": 94056, "epoch": 2239} {"train_loss": -6.245431900024414, "global_step": 94057, "epoch": 2239} {"train_loss": -6.210989952087402, "global_step": 94058, "epoch": 2239} {"train_loss": -6.252307891845703, "global_step": 94059, "epoch": 2239} {"train_loss": -6.4130096435546875, "global_step": 94060, "epoch": 2239} {"train_loss": -6.2416205406188965, "global_step": 94061, "epoch": 2239} {"train_loss": -6.267538070678711, "global_step": 94062, "epoch": 2239} {"train_loss": -6.232397079467773, "global_step": 94063, "epoch": 2239} {"train_loss": -6.308784484863281, "global_step": 94064, "epoch": 2239} {"train_loss": -6.3263421058654785, "global_step": 94065, "epoch": 2239} {"train_loss": -6.25331974029541, "global_step": 94066, "epoch": 2239} {"train_loss": -6.194263458251953, "global_step": 94067, "epoch": 2239} {"train_loss": -6.3315935134887695, "global_step": 94068, "epoch": 2239} {"train_loss": -6.440706729888916, "global_step": 94069, "epoch": 2239} {"train_loss": -6.181300163269043, "global_step": 94070, "epoch": 2239} {"train_loss": -6.230603218078613, "global_step": 94071, "epoch": 2239} {"train_loss": -6.2645263671875, "global_step": 94072, "epoch": 2239} {"train_loss": -6.301064491271973, "global_step": 94073, "epoch": 2239} {"train_loss": -6.250126361846924, "global_step": 94074, "epoch": 2239} {"train_loss": -6.248133659362793, "global_step": 94075, "epoch": 2239} {"train_loss": -6.205536365509033, "global_step": 94076, "epoch": 2239} {"train_loss": -6.19063663482666, "global_step": 94077, "epoch": 2239} {"train_loss": -6.252695083618164, "global_step": 94078, "epoch": 2239} {"train_loss": -6.277684961046491, "global_step": 94079, "epoch": 2239, "val_loss": 67940.3046875} {"train_loss": -6.334587097167969, "global_step": 94080, "epoch": 2240} {"train_loss": -6.2234601974487305, "global_step": 94081, "epoch": 2240} {"train_loss": -6.303980350494385, "global_step": 94082, "epoch": 2240} {"train_loss": -6.30394983291626, "global_step": 94083, "epoch": 2240} {"train_loss": -6.279302597045898, "global_step": 94084, "epoch": 2240} {"train_loss": -6.339719295501709, "global_step": 94085, "epoch": 2240} {"train_loss": -6.25955867767334, "global_step": 94086, "epoch": 2240} {"train_loss": -6.356374740600586, "global_step": 94087, "epoch": 2240} {"train_loss": -6.294524192810059, "global_step": 94088, "epoch": 2240} {"train_loss": -6.2889814376831055, "global_step": 94089, "epoch": 2240} {"train_loss": -6.308371543884277, "global_step": 94090, "epoch": 2240} {"train_loss": -6.2794036865234375, "global_step": 94091, "epoch": 2240} {"train_loss": -6.1993207931518555, "global_step": 94092, "epoch": 2240} {"train_loss": -6.338536262512207, "global_step": 94093, "epoch": 2240} {"train_loss": -6.288691997528076, "global_step": 94094, "epoch": 2240} {"train_loss": -6.293633460998535, "global_step": 94095, "epoch": 2240} {"train_loss": -6.373295307159424, "global_step": 94096, "epoch": 2240} {"train_loss": -6.262693405151367, "global_step": 94097, "epoch": 2240} {"train_loss": -6.2364349365234375, "global_step": 94098, "epoch": 2240} {"train_loss": -6.2751359939575195, "global_step": 94099, "epoch": 2240} {"train_loss": -6.171260833740234, "global_step": 94100, "epoch": 2240} {"train_loss": -6.244699478149414, "global_step": 94101, "epoch": 2240} {"train_loss": -6.190098762512207, "global_step": 94102, "epoch": 2240} {"train_loss": -6.43028450012207, "global_step": 94103, "epoch": 2240} {"train_loss": -6.223366737365723, "global_step": 94104, "epoch": 2240} {"train_loss": -6.360785007476807, "global_step": 94105, "epoch": 2240} {"train_loss": -6.237617492675781, "global_step": 94106, "epoch": 2240} {"train_loss": -6.262923240661621, "global_step": 94107, "epoch": 2240} {"train_loss": -6.295422554016113, "global_step": 94108, "epoch": 2240} {"train_loss": -6.317887306213379, "global_step": 94109, "epoch": 2240} {"train_loss": -6.180751800537109, "global_step": 94110, "epoch": 2240} {"train_loss": -6.25950813293457, "global_step": 94111, "epoch": 2240} {"train_loss": -6.29945182800293, "global_step": 94112, "epoch": 2240} {"train_loss": -6.246984481811523, "global_step": 94113, "epoch": 2240} {"train_loss": -6.2089738845825195, "global_step": 94114, "epoch": 2240} {"train_loss": -6.232856273651123, "global_step": 94115, "epoch": 2240} {"train_loss": -6.303483963012695, "global_step": 94116, "epoch": 2240} {"train_loss": -6.281249046325684, "global_step": 94117, "epoch": 2240} {"train_loss": -6.308701515197754, "global_step": 94118, "epoch": 2240} {"train_loss": -6.13416051864624, "global_step": 94119, "epoch": 2240} {"train_loss": -6.200479507446289, "global_step": 94120, "epoch": 2240} {"train_loss": -6.271463121686663, "global_step": 94121, "epoch": 2240, "val_loss": 67901.96875} {"train_loss": -6.244690895080566, "global_step": 94122, "epoch": 2241} {"train_loss": -6.120858192443848, "global_step": 94123, "epoch": 2241} {"train_loss": -6.166962623596191, "global_step": 94124, "epoch": 2241} {"train_loss": -6.329133987426758, "global_step": 94125, "epoch": 2241} {"train_loss": -6.300885200500488, "global_step": 94126, "epoch": 2241} {"train_loss": -6.085420608520508, "global_step": 94127, "epoch": 2241} {"train_loss": -6.460694313049316, "global_step": 94128, "epoch": 2241} {"train_loss": -6.137912273406982, "global_step": 94129, "epoch": 2241} {"train_loss": -6.264378547668457, "global_step": 94130, "epoch": 2241} {"train_loss": -6.278120994567871, "global_step": 94131, "epoch": 2241} {"train_loss": -6.2060699462890625, "global_step": 94132, "epoch": 2241} {"train_loss": -6.269512176513672, "global_step": 94133, "epoch": 2241} {"train_loss": -6.235474109649658, "global_step": 94134, "epoch": 2241} {"train_loss": -6.415719032287598, "global_step": 94135, "epoch": 2241} {"train_loss": -6.274896144866943, "global_step": 94136, "epoch": 2241} {"train_loss": -6.2177839279174805, "global_step": 94137, "epoch": 2241} {"train_loss": -6.236917495727539, "global_step": 94138, "epoch": 2241} {"train_loss": -6.223343849182129, "global_step": 94139, "epoch": 2241} {"train_loss": -6.223982810974121, "global_step": 94140, "epoch": 2241} {"train_loss": -6.218491554260254, "global_step": 94141, "epoch": 2241} {"train_loss": -6.231444358825684, "global_step": 94142, "epoch": 2241} {"train_loss": -6.294761657714844, "global_step": 94143, "epoch": 2241} {"train_loss": -6.185293674468994, "global_step": 94144, "epoch": 2241} {"train_loss": -6.297615051269531, "global_step": 94145, "epoch": 2241} {"train_loss": -6.390373706817627, "global_step": 94146, "epoch": 2241} {"train_loss": -6.311868190765381, "global_step": 94147, "epoch": 2241} {"train_loss": -6.316947937011719, "global_step": 94148, "epoch": 2241} {"train_loss": -6.341022491455078, "global_step": 94149, "epoch": 2241} {"train_loss": -6.343703269958496, "global_step": 94150, "epoch": 2241} {"train_loss": -6.340762138366699, "global_step": 94151, "epoch": 2241} {"train_loss": -6.2277326583862305, "global_step": 94152, "epoch": 2241} {"train_loss": -6.211521625518799, "global_step": 94153, "epoch": 2241} {"train_loss": -6.291411399841309, "global_step": 94154, "epoch": 2241} {"train_loss": -6.159091949462891, "global_step": 94155, "epoch": 2241} {"train_loss": -6.291581630706787, "global_step": 94156, "epoch": 2241} {"train_loss": -6.301848411560059, "global_step": 94157, "epoch": 2241} {"train_loss": -6.35037899017334, "global_step": 94158, "epoch": 2241} {"train_loss": -6.291166305541992, "global_step": 94159, "epoch": 2241} {"train_loss": -6.14068603515625, "global_step": 94160, "epoch": 2241} {"train_loss": -6.146007537841797, "global_step": 94161, "epoch": 2241} {"train_loss": -6.3763508796691895, "global_step": 94162, "epoch": 2241} {"train_loss": -6.259377138955252, "global_step": 94163, "epoch": 2241, "val_loss": 67850.921875} {"train_loss": -6.2906084060668945, "global_step": 94164, "epoch": 2242} {"train_loss": -6.2433271408081055, "global_step": 94165, "epoch": 2242} {"train_loss": -6.209782600402832, "global_step": 94166, "epoch": 2242} {"train_loss": -6.371689796447754, "global_step": 94167, "epoch": 2242} {"train_loss": -6.373160362243652, "global_step": 94168, "epoch": 2242} {"train_loss": -6.261466979980469, "global_step": 94169, "epoch": 2242} {"train_loss": -6.241823196411133, "global_step": 94170, "epoch": 2242} {"train_loss": -6.263461112976074, "global_step": 94171, "epoch": 2242} {"train_loss": -6.229320526123047, "global_step": 94172, "epoch": 2242} {"train_loss": -6.293996810913086, "global_step": 94173, "epoch": 2242} {"train_loss": -6.229700088500977, "global_step": 94174, "epoch": 2242} {"train_loss": -6.243032455444336, "global_step": 94175, "epoch": 2242} {"train_loss": -6.232905387878418, "global_step": 94176, "epoch": 2242} {"train_loss": -6.354248046875, "global_step": 94177, "epoch": 2242} {"train_loss": -6.273126602172852, "global_step": 94178, "epoch": 2242} {"train_loss": -6.127342224121094, "global_step": 94179, "epoch": 2242} {"train_loss": -6.211526870727539, "global_step": 94180, "epoch": 2242} {"train_loss": -6.271864891052246, "global_step": 94181, "epoch": 2242} {"train_loss": -6.194924354553223, "global_step": 94182, "epoch": 2242} {"train_loss": -6.1382317543029785, "global_step": 94183, "epoch": 2242} {"train_loss": -6.270129680633545, "global_step": 94184, "epoch": 2242} {"train_loss": -6.310805797576904, "global_step": 94185, "epoch": 2242} {"train_loss": -6.1851487159729, "global_step": 94186, "epoch": 2242} {"train_loss": -6.395159721374512, "global_step": 94187, "epoch": 2242} {"train_loss": -6.252702713012695, "global_step": 94188, "epoch": 2242} {"train_loss": -6.283665657043457, "global_step": 94189, "epoch": 2242} {"train_loss": -6.293025970458984, "global_step": 94190, "epoch": 2242} {"train_loss": -6.389374256134033, "global_step": 94191, "epoch": 2242} {"train_loss": -6.274320602416992, "global_step": 94192, "epoch": 2242} {"train_loss": -6.298398971557617, "global_step": 94193, "epoch": 2242} {"train_loss": -6.293875694274902, "global_step": 94194, "epoch": 2242} {"train_loss": -6.329821586608887, "global_step": 94195, "epoch": 2242} {"train_loss": -6.261478424072266, "global_step": 94196, "epoch": 2242} {"train_loss": -6.317000389099121, "global_step": 94197, "epoch": 2242} {"train_loss": -6.239131927490234, "global_step": 94198, "epoch": 2242} {"train_loss": -6.167360305786133, "global_step": 94199, "epoch": 2242} {"train_loss": -6.314258575439453, "global_step": 94200, "epoch": 2242} {"train_loss": -6.249814987182617, "global_step": 94201, "epoch": 2242} {"train_loss": -6.276294231414795, "global_step": 94202, "epoch": 2242} {"train_loss": -6.299920558929443, "global_step": 94203, "epoch": 2242} {"train_loss": -6.379217624664307, "global_step": 94204, "epoch": 2242} {"train_loss": -6.271373340061733, "global_step": 94205, "epoch": 2242, "val_loss": 67667.6953125} {"train_loss": -6.322879791259766, "global_step": 94206, "epoch": 2243} {"train_loss": -6.298433780670166, "global_step": 94207, "epoch": 2243} {"train_loss": -6.275007247924805, "global_step": 94208, "epoch": 2243} {"train_loss": -6.306440830230713, "global_step": 94209, "epoch": 2243} {"train_loss": -6.223816871643066, "global_step": 94210, "epoch": 2243} {"train_loss": -6.239572525024414, "global_step": 94211, "epoch": 2243} {"train_loss": -6.303958892822266, "global_step": 94212, "epoch": 2243} {"train_loss": -6.2174153327941895, "global_step": 94213, "epoch": 2243} {"train_loss": -6.23798131942749, "global_step": 94214, "epoch": 2243} {"train_loss": -6.212780952453613, "global_step": 94215, "epoch": 2243} {"train_loss": -6.365264415740967, "global_step": 94216, "epoch": 2243} {"train_loss": -6.230793476104736, "global_step": 94217, "epoch": 2243} {"train_loss": -6.178330421447754, "global_step": 94218, "epoch": 2243} {"train_loss": -6.308112144470215, "global_step": 94219, "epoch": 2243} {"train_loss": -6.32924747467041, "global_step": 94220, "epoch": 2243} {"train_loss": -6.239847183227539, "global_step": 94221, "epoch": 2243} {"train_loss": -6.313348770141602, "global_step": 94222, "epoch": 2243} {"train_loss": -6.411837100982666, "global_step": 94223, "epoch": 2243} {"train_loss": -6.358935356140137, "global_step": 94224, "epoch": 2243} {"train_loss": -6.134490489959717, "global_step": 94225, "epoch": 2243} {"train_loss": -6.325062274932861, "global_step": 94226, "epoch": 2243} {"train_loss": -6.384575366973877, "global_step": 94227, "epoch": 2243} {"train_loss": -6.391864776611328, "global_step": 94228, "epoch": 2243} {"train_loss": -6.219083309173584, "global_step": 94229, "epoch": 2243} {"train_loss": -6.206618309020996, "global_step": 94230, "epoch": 2243} {"train_loss": -6.239717960357666, "global_step": 94231, "epoch": 2243} {"train_loss": -6.35383939743042, "global_step": 94232, "epoch": 2243} {"train_loss": -6.235255241394043, "global_step": 94233, "epoch": 2243} {"train_loss": -6.19386100769043, "global_step": 94234, "epoch": 2243} {"train_loss": -6.3682169914245605, "global_step": 94235, "epoch": 2243} {"train_loss": -6.319307327270508, "global_step": 94236, "epoch": 2243} {"train_loss": -6.154755115509033, "global_step": 94237, "epoch": 2243} {"train_loss": -6.2463788986206055, "global_step": 94238, "epoch": 2243} {"train_loss": -6.152721405029297, "global_step": 94239, "epoch": 2243} {"train_loss": -6.289920806884766, "global_step": 94240, "epoch": 2243} {"train_loss": -6.283792972564697, "global_step": 94241, "epoch": 2243} {"train_loss": -6.342604637145996, "global_step": 94242, "epoch": 2243} {"train_loss": -6.344295024871826, "global_step": 94243, "epoch": 2243} {"train_loss": -6.0997772216796875, "global_step": 94244, "epoch": 2243} {"train_loss": -6.234464168548584, "global_step": 94245, "epoch": 2243} {"train_loss": -6.341179847717285, "global_step": 94246, "epoch": 2243} {"train_loss": -6.275992541086106, "global_step": 94247, "epoch": 2243, "val_loss": 67911.265625} {"train_loss": -6.359288215637207, "global_step": 94248, "epoch": 2244} {"train_loss": -6.182723045349121, "global_step": 94249, "epoch": 2244} {"train_loss": -6.391757488250732, "global_step": 94250, "epoch": 2244} {"train_loss": -6.377562999725342, "global_step": 94251, "epoch": 2244} {"train_loss": -6.337100982666016, "global_step": 94252, "epoch": 2244} {"train_loss": -6.326383590698242, "global_step": 94253, "epoch": 2244} {"train_loss": -6.339046478271484, "global_step": 94254, "epoch": 2244} {"train_loss": -6.4049530029296875, "global_step": 94255, "epoch": 2244} {"train_loss": -6.371219635009766, "global_step": 94256, "epoch": 2244} {"train_loss": -6.287275314331055, "global_step": 94257, "epoch": 2244} {"train_loss": -6.357220649719238, "global_step": 94258, "epoch": 2244} {"train_loss": -6.24752140045166, "global_step": 94259, "epoch": 2244} {"train_loss": -6.153059482574463, "global_step": 94260, "epoch": 2244} {"train_loss": -6.342879295349121, "global_step": 94261, "epoch": 2244} {"train_loss": -6.333751201629639, "global_step": 94262, "epoch": 2244} {"train_loss": -6.23775577545166, "global_step": 94263, "epoch": 2244} {"train_loss": -6.355208396911621, "global_step": 94264, "epoch": 2244} {"train_loss": -6.3039422035217285, "global_step": 94265, "epoch": 2244} {"train_loss": -6.239777565002441, "global_step": 94266, "epoch": 2244} {"train_loss": -6.23445987701416, "global_step": 94267, "epoch": 2244} {"train_loss": -6.224890232086182, "global_step": 94268, "epoch": 2244} {"train_loss": -6.2201738357543945, "global_step": 94269, "epoch": 2244} {"train_loss": -6.211870193481445, "global_step": 94270, "epoch": 2244} {"train_loss": -6.234255790710449, "global_step": 94271, "epoch": 2244} {"train_loss": -6.201018333435059, "global_step": 94272, "epoch": 2244} {"train_loss": -6.354998588562012, "global_step": 94273, "epoch": 2244} {"train_loss": -6.213963031768799, "global_step": 94274, "epoch": 2244} {"train_loss": -6.187318801879883, "global_step": 94275, "epoch": 2244} {"train_loss": -6.333230018615723, "global_step": 94276, "epoch": 2244} {"train_loss": -6.311303615570068, "global_step": 94277, "epoch": 2244} {"train_loss": -6.071672439575195, "global_step": 94278, "epoch": 2244} {"train_loss": -6.285591125488281, "global_step": 94279, "epoch": 2244} {"train_loss": -6.197178363800049, "global_step": 94280, "epoch": 2244} {"train_loss": -6.127500057220459, "global_step": 94281, "epoch": 2244} {"train_loss": -6.257852077484131, "global_step": 94282, "epoch": 2244} {"train_loss": -6.150187969207764, "global_step": 94283, "epoch": 2244} {"train_loss": -6.17537784576416, "global_step": 94284, "epoch": 2244} {"train_loss": -6.20534610748291, "global_step": 94285, "epoch": 2244} {"train_loss": -6.1938018798828125, "global_step": 94286, "epoch": 2244} {"train_loss": -6.312399387359619, "global_step": 94287, "epoch": 2244} {"train_loss": -6.1385178565979, "global_step": 94288, "epoch": 2244} {"train_loss": -6.264148121788388, "global_step": 94289, "epoch": 2244, "val_loss": 68301.0859375} {"train_loss": -6.31218147277832, "global_step": 94290, "epoch": 2245} {"train_loss": -6.2741923332214355, "global_step": 94291, "epoch": 2245} {"train_loss": -6.226273536682129, "global_step": 94292, "epoch": 2245} {"train_loss": -6.262568950653076, "global_step": 94293, "epoch": 2245} {"train_loss": -6.305192947387695, "global_step": 94294, "epoch": 2245} {"train_loss": -6.362601280212402, "global_step": 94295, "epoch": 2245} {"train_loss": -6.260082244873047, "global_step": 94296, "epoch": 2245} {"train_loss": -6.2836174964904785, "global_step": 94297, "epoch": 2245} {"train_loss": -6.278443336486816, "global_step": 94298, "epoch": 2245} {"train_loss": -6.172335147857666, "global_step": 94299, "epoch": 2245} {"train_loss": -6.360383033752441, "global_step": 94300, "epoch": 2245} {"train_loss": -6.211472511291504, "global_step": 94301, "epoch": 2245} {"train_loss": -6.312681198120117, "global_step": 94302, "epoch": 2245} {"train_loss": -6.163088798522949, "global_step": 94303, "epoch": 2245} {"train_loss": -6.161201477050781, "global_step": 94304, "epoch": 2245} {"train_loss": -6.326840877532959, "global_step": 94305, "epoch": 2245} {"train_loss": -6.291924953460693, "global_step": 94306, "epoch": 2245} {"train_loss": -6.336980819702148, "global_step": 94307, "epoch": 2245} {"train_loss": -6.241359233856201, "global_step": 94308, "epoch": 2245} {"train_loss": -6.110082626342773, "global_step": 94309, "epoch": 2245} {"train_loss": -6.213876724243164, "global_step": 94310, "epoch": 2245} {"train_loss": -6.262026786804199, "global_step": 94311, "epoch": 2245} {"train_loss": -6.318972587585449, "global_step": 94312, "epoch": 2245} {"train_loss": -6.221087455749512, "global_step": 94313, "epoch": 2245} {"train_loss": -6.355195999145508, "global_step": 94314, "epoch": 2245} {"train_loss": -6.341911315917969, "global_step": 94315, "epoch": 2245} {"train_loss": -6.186761856079102, "global_step": 94316, "epoch": 2245} {"train_loss": -6.346103668212891, "global_step": 94317, "epoch": 2245} {"train_loss": -6.200908184051514, "global_step": 94318, "epoch": 2245} {"train_loss": -6.322244644165039, "global_step": 94319, "epoch": 2245} {"train_loss": -6.2562456130981445, "global_step": 94320, "epoch": 2245} {"train_loss": -6.187280654907227, "global_step": 94321, "epoch": 2245} {"train_loss": -6.137572288513184, "global_step": 94322, "epoch": 2245} {"train_loss": -6.225275039672852, "global_step": 94323, "epoch": 2245} {"train_loss": -6.233958721160889, "global_step": 94324, "epoch": 2245} {"train_loss": -6.156160831451416, "global_step": 94325, "epoch": 2245} {"train_loss": -6.208150863647461, "global_step": 94326, "epoch": 2245} {"train_loss": -6.1173095703125, "global_step": 94327, "epoch": 2245} {"train_loss": -6.219212532043457, "global_step": 94328, "epoch": 2245} {"train_loss": -6.112290382385254, "global_step": 94329, "epoch": 2245} {"train_loss": -6.222033500671387, "global_step": 94330, "epoch": 2245} {"train_loss": -6.24519327708653, "global_step": 94331, "epoch": 2245, "val_loss": 68605.3515625} {"train_loss": -6.051492691040039, "global_step": 94332, "epoch": 2246} {"train_loss": -6.2498297691345215, "global_step": 94333, "epoch": 2246} {"train_loss": -6.292762756347656, "global_step": 94334, "epoch": 2246} {"train_loss": -6.309191703796387, "global_step": 94335, "epoch": 2246} {"train_loss": -6.128345489501953, "global_step": 94336, "epoch": 2246} {"train_loss": -6.283750534057617, "global_step": 94337, "epoch": 2246} {"train_loss": -6.215121269226074, "global_step": 94338, "epoch": 2246} {"train_loss": -6.282923698425293, "global_step": 94339, "epoch": 2246} {"train_loss": -6.142536163330078, "global_step": 94340, "epoch": 2246} {"train_loss": -6.173755645751953, "global_step": 94341, "epoch": 2246} {"train_loss": -6.202890872955322, "global_step": 94342, "epoch": 2246} {"train_loss": -6.138815879821777, "global_step": 94343, "epoch": 2246} {"train_loss": -6.2055463790893555, "global_step": 94344, "epoch": 2246} {"train_loss": -6.34578800201416, "global_step": 94345, "epoch": 2246} {"train_loss": -6.280508518218994, "global_step": 94346, "epoch": 2246} {"train_loss": -6.2281084060668945, "global_step": 94347, "epoch": 2246} {"train_loss": -6.313089370727539, "global_step": 94348, "epoch": 2246} {"train_loss": -6.3742523193359375, "global_step": 94349, "epoch": 2246} {"train_loss": -6.113908290863037, "global_step": 94350, "epoch": 2246} {"train_loss": -6.280324459075928, "global_step": 94351, "epoch": 2246} {"train_loss": -6.290112495422363, "global_step": 94352, "epoch": 2246} {"train_loss": -6.222923278808594, "global_step": 94353, "epoch": 2246} {"train_loss": -6.262247085571289, "global_step": 94354, "epoch": 2246} {"train_loss": -6.396707534790039, "global_step": 94355, "epoch": 2246} {"train_loss": -6.3137383460998535, "global_step": 94356, "epoch": 2246} {"train_loss": -6.16206169128418, "global_step": 94357, "epoch": 2246} {"train_loss": -6.329604625701904, "global_step": 94358, "epoch": 2246} {"train_loss": -6.382238388061523, "global_step": 94359, "epoch": 2246} {"train_loss": -6.345846176147461, "global_step": 94360, "epoch": 2246} {"train_loss": -6.425851821899414, "global_step": 94361, "epoch": 2246} {"train_loss": -6.124934673309326, "global_step": 94362, "epoch": 2246} {"train_loss": -6.173785209655762, "global_step": 94363, "epoch": 2246} {"train_loss": -6.352137088775635, "global_step": 94364, "epoch": 2246} {"train_loss": -6.173226356506348, "global_step": 94365, "epoch": 2246} {"train_loss": -6.390983581542969, "global_step": 94366, "epoch": 2246} {"train_loss": -6.321108341217041, "global_step": 94367, "epoch": 2246} {"train_loss": -6.347353458404541, "global_step": 94368, "epoch": 2246} {"train_loss": -6.321078300476074, "global_step": 94369, "epoch": 2246} {"train_loss": -6.248675346374512, "global_step": 94370, "epoch": 2246} {"train_loss": -6.233063220977783, "global_step": 94371, "epoch": 2246} {"train_loss": -6.22086763381958, "global_step": 94372, "epoch": 2246} {"train_loss": -6.262180703026908, "global_step": 94373, "epoch": 2246, "val_loss": 67693.421875} {"train_loss": -6.327668190002441, "global_step": 94374, "epoch": 2247} {"train_loss": -6.254339694976807, "global_step": 94375, "epoch": 2247} {"train_loss": -6.249434471130371, "global_step": 94376, "epoch": 2247} {"train_loss": -6.348826885223389, "global_step": 94377, "epoch": 2247} {"train_loss": -6.218832969665527, "global_step": 94378, "epoch": 2247} {"train_loss": -6.280196666717529, "global_step": 94379, "epoch": 2247} {"train_loss": -6.231448650360107, "global_step": 94380, "epoch": 2247} {"train_loss": -6.296101093292236, "global_step": 94381, "epoch": 2247} {"train_loss": -6.2803826332092285, "global_step": 94382, "epoch": 2247} {"train_loss": -6.130317211151123, "global_step": 94383, "epoch": 2247} {"train_loss": -6.073174476623535, "global_step": 94384, "epoch": 2247} {"train_loss": -6.290992736816406, "global_step": 94385, "epoch": 2247} {"train_loss": -6.252320289611816, "global_step": 94386, "epoch": 2247} {"train_loss": -6.159832954406738, "global_step": 94387, "epoch": 2247} {"train_loss": -6.31021785736084, "global_step": 94388, "epoch": 2247} {"train_loss": -6.224534511566162, "global_step": 94389, "epoch": 2247} {"train_loss": -6.125151634216309, "global_step": 94390, "epoch": 2247} {"train_loss": -6.365019798278809, "global_step": 94391, "epoch": 2247} {"train_loss": -6.2572197914123535, "global_step": 94392, "epoch": 2247} {"train_loss": -6.1613664627075195, "global_step": 94393, "epoch": 2247} {"train_loss": -6.376091003417969, "global_step": 94394, "epoch": 2247} {"train_loss": -6.184000492095947, "global_step": 94395, "epoch": 2247} {"train_loss": -6.158975124359131, "global_step": 94396, "epoch": 2247} {"train_loss": -6.2248454093933105, "global_step": 94397, "epoch": 2247} {"train_loss": -6.276144504547119, "global_step": 94398, "epoch": 2247} {"train_loss": -6.278964996337891, "global_step": 94399, "epoch": 2247} {"train_loss": -6.165435314178467, "global_step": 94400, "epoch": 2247} {"train_loss": -6.19737434387207, "global_step": 94401, "epoch": 2247} {"train_loss": -6.209420680999756, "global_step": 94402, "epoch": 2247} {"train_loss": -6.232750415802002, "global_step": 94403, "epoch": 2247} {"train_loss": -6.4004034996032715, "global_step": 94404, "epoch": 2247} {"train_loss": -6.223649024963379, "global_step": 94405, "epoch": 2247} {"train_loss": -6.177919864654541, "global_step": 94406, "epoch": 2247} {"train_loss": -6.253403663635254, "global_step": 94407, "epoch": 2247} {"train_loss": -6.175759315490723, "global_step": 94408, "epoch": 2247} {"train_loss": -6.31521463394165, "global_step": 94409, "epoch": 2247} {"train_loss": -6.213830947875977, "global_step": 94410, "epoch": 2247} {"train_loss": -6.257753849029541, "global_step": 94411, "epoch": 2247} {"train_loss": -6.2140727043151855, "global_step": 94412, "epoch": 2247} {"train_loss": -6.273395538330078, "global_step": 94413, "epoch": 2247} {"train_loss": -6.191690444946289, "global_step": 94414, "epoch": 2247} {"train_loss": -6.238446610314505, "global_step": 94415, "epoch": 2247, "val_loss": 67678.5625} {"train_loss": -6.2611260414123535, "global_step": 94416, "epoch": 2248} {"train_loss": -6.196142196655273, "global_step": 94417, "epoch": 2248} {"train_loss": -6.092453956604004, "global_step": 94418, "epoch": 2248} {"train_loss": -6.268651485443115, "global_step": 94419, "epoch": 2248} {"train_loss": -6.121064186096191, "global_step": 94420, "epoch": 2248} {"train_loss": -6.150341987609863, "global_step": 94421, "epoch": 2248} {"train_loss": -6.229545593261719, "global_step": 94422, "epoch": 2248} {"train_loss": -6.090397834777832, "global_step": 94423, "epoch": 2248} {"train_loss": -6.332165718078613, "global_step": 94424, "epoch": 2248} {"train_loss": -6.138275146484375, "global_step": 94425, "epoch": 2248} {"train_loss": -6.32902193069458, "global_step": 94426, "epoch": 2248} {"train_loss": -6.200471878051758, "global_step": 94427, "epoch": 2248} {"train_loss": -6.17240047454834, "global_step": 94428, "epoch": 2248} {"train_loss": -6.248672962188721, "global_step": 94429, "epoch": 2248} {"train_loss": -6.273471832275391, "global_step": 94430, "epoch": 2248} {"train_loss": -6.157155990600586, "global_step": 94431, "epoch": 2248} {"train_loss": -6.17827033996582, "global_step": 94432, "epoch": 2248} {"train_loss": -6.322546005249023, "global_step": 94433, "epoch": 2248} {"train_loss": -6.35295295715332, "global_step": 94434, "epoch": 2248} {"train_loss": -6.296871662139893, "global_step": 94435, "epoch": 2248} {"train_loss": -6.290591239929199, "global_step": 94436, "epoch": 2248} {"train_loss": -6.287106037139893, "global_step": 94437, "epoch": 2248} {"train_loss": -6.2686004638671875, "global_step": 94438, "epoch": 2248} {"train_loss": -6.362213134765625, "global_step": 94439, "epoch": 2248} {"train_loss": -6.252544403076172, "global_step": 94440, "epoch": 2248} {"train_loss": -6.390941619873047, "global_step": 94441, "epoch": 2248} {"train_loss": -6.310883522033691, "global_step": 94442, "epoch": 2248} {"train_loss": -6.1784162521362305, "global_step": 94443, "epoch": 2248} {"train_loss": -6.295614242553711, "global_step": 94444, "epoch": 2248} {"train_loss": -6.409242630004883, "global_step": 94445, "epoch": 2248} {"train_loss": -6.293868064880371, "global_step": 94446, "epoch": 2248} {"train_loss": -6.312862396240234, "global_step": 94447, "epoch": 2248} {"train_loss": -6.2352094650268555, "global_step": 94448, "epoch": 2248} {"train_loss": -6.276224613189697, "global_step": 94449, "epoch": 2248} {"train_loss": -6.328075408935547, "global_step": 94450, "epoch": 2248} {"train_loss": -6.422898292541504, "global_step": 94451, "epoch": 2248} {"train_loss": -6.292235374450684, "global_step": 94452, "epoch": 2248} {"train_loss": -6.270864486694336, "global_step": 94453, "epoch": 2248} {"train_loss": -6.325186252593994, "global_step": 94454, "epoch": 2248} {"train_loss": -6.3161211013793945, "global_step": 94455, "epoch": 2248} {"train_loss": -6.285898685455322, "global_step": 94456, "epoch": 2248} {"train_loss": -6.262341908046177, "global_step": 94457, "epoch": 2248, "val_loss": 68011.46875} {"train_loss": -6.275579452514648, "global_step": 94458, "epoch": 2249} {"train_loss": -6.247916221618652, "global_step": 94459, "epoch": 2249} {"train_loss": -6.324641227722168, "global_step": 94460, "epoch": 2249} {"train_loss": -6.305947303771973, "global_step": 94461, "epoch": 2249} {"train_loss": -6.286285400390625, "global_step": 94462, "epoch": 2249} {"train_loss": -6.276223182678223, "global_step": 94463, "epoch": 2249} {"train_loss": -6.253957748413086, "global_step": 94464, "epoch": 2249} {"train_loss": -6.231407165527344, "global_step": 94465, "epoch": 2249} {"train_loss": -6.190490245819092, "global_step": 94466, "epoch": 2249} {"train_loss": -6.242391109466553, "global_step": 94467, "epoch": 2249} {"train_loss": -6.320359706878662, "global_step": 94468, "epoch": 2249} {"train_loss": -6.268259048461914, "global_step": 94469, "epoch": 2249} {"train_loss": -6.289120674133301, "global_step": 94470, "epoch": 2249} {"train_loss": -6.361030578613281, "global_step": 94471, "epoch": 2249} {"train_loss": -6.307660102844238, "global_step": 94472, "epoch": 2249} {"train_loss": -6.409454345703125, "global_step": 94473, "epoch": 2249} {"train_loss": -6.183199405670166, "global_step": 94474, "epoch": 2249} {"train_loss": -6.27193546295166, "global_step": 94475, "epoch": 2249} {"train_loss": -6.340494632720947, "global_step": 94476, "epoch": 2249} {"train_loss": -6.318828582763672, "global_step": 94477, "epoch": 2249} {"train_loss": -6.246213912963867, "global_step": 94478, "epoch": 2249} {"train_loss": -6.26615047454834, "global_step": 94479, "epoch": 2249} {"train_loss": -6.326028823852539, "global_step": 94480, "epoch": 2249} {"train_loss": -6.235848426818848, "global_step": 94481, "epoch": 2249} {"train_loss": -6.288090705871582, "global_step": 94482, "epoch": 2249} {"train_loss": -6.23382568359375, "global_step": 94483, "epoch": 2249} {"train_loss": -6.3259968757629395, "global_step": 94484, "epoch": 2249} {"train_loss": -6.350645542144775, "global_step": 94485, "epoch": 2249} {"train_loss": -6.206153869628906, "global_step": 94486, "epoch": 2249} {"train_loss": -6.310427665710449, "global_step": 94487, "epoch": 2249} {"train_loss": -6.0933308601379395, "global_step": 94488, "epoch": 2249} {"train_loss": -6.23181676864624, "global_step": 94489, "epoch": 2249} {"train_loss": -6.33179235458374, "global_step": 94490, "epoch": 2249} {"train_loss": -6.324665069580078, "global_step": 94491, "epoch": 2249} {"train_loss": -6.168014049530029, "global_step": 94492, "epoch": 2249} {"train_loss": -6.15277099609375, "global_step": 94493, "epoch": 2249} {"train_loss": -6.226872444152832, "global_step": 94494, "epoch": 2249} {"train_loss": -6.32197380065918, "global_step": 94495, "epoch": 2249} {"train_loss": -6.267461776733398, "global_step": 94496, "epoch": 2249} {"train_loss": -6.375430107116699, "global_step": 94497, "epoch": 2249} {"train_loss": -6.289731025695801, "global_step": 94498, "epoch": 2249} {"train_loss": -6.276253927321661, "global_step": 94499, "epoch": 2249, "val_loss": 67808.28125} {"train_loss": -6.374665260314941, "global_step": 94500, "epoch": 2250} {"train_loss": -6.158903121948242, "global_step": 94501, "epoch": 2250} {"train_loss": -6.310971736907959, "global_step": 94502, "epoch": 2250} {"train_loss": -6.350276470184326, "global_step": 94503, "epoch": 2250} {"train_loss": -6.258966445922852, "global_step": 94504, "epoch": 2250} {"train_loss": -6.326939582824707, "global_step": 94505, "epoch": 2250} {"train_loss": -6.181818008422852, "global_step": 94506, "epoch": 2250} {"train_loss": -6.29182767868042, "global_step": 94507, "epoch": 2250} {"train_loss": -6.256825923919678, "global_step": 94508, "epoch": 2250} {"train_loss": -6.36552619934082, "global_step": 94509, "epoch": 2250} {"train_loss": -6.335522651672363, "global_step": 94510, "epoch": 2250} {"train_loss": -6.260089874267578, "global_step": 94511, "epoch": 2250} {"train_loss": -6.347724914550781, "global_step": 94512, "epoch": 2250} {"train_loss": -6.2456865310668945, "global_step": 94513, "epoch": 2250} {"train_loss": -6.306053161621094, "global_step": 94514, "epoch": 2250} {"train_loss": -6.269993782043457, "global_step": 94515, "epoch": 2250} {"train_loss": -6.266517639160156, "global_step": 94516, "epoch": 2250} {"train_loss": -6.287806034088135, "global_step": 94517, "epoch": 2250} {"train_loss": -6.360973358154297, "global_step": 94518, "epoch": 2250} {"train_loss": -6.359893798828125, "global_step": 94519, "epoch": 2250} {"train_loss": -6.2966718673706055, "global_step": 94520, "epoch": 2250} {"train_loss": -6.238786697387695, "global_step": 94521, "epoch": 2250} {"train_loss": -6.360069274902344, "global_step": 94522, "epoch": 2250} {"train_loss": -6.226261615753174, "global_step": 94523, "epoch": 2250} {"train_loss": -6.258883953094482, "global_step": 94524, "epoch": 2250} {"train_loss": -6.198825836181641, "global_step": 94525, "epoch": 2250} {"train_loss": -6.317949295043945, "global_step": 94526, "epoch": 2250} {"train_loss": -6.414412498474121, "global_step": 94527, "epoch": 2250} {"train_loss": -6.328338623046875, "global_step": 94528, "epoch": 2250} {"train_loss": -6.419869422912598, "global_step": 94529, "epoch": 2250} {"train_loss": -6.31503963470459, "global_step": 94530, "epoch": 2250} {"train_loss": -6.346341609954834, "global_step": 94531, "epoch": 2250} {"train_loss": -6.450983047485352, "global_step": 94532, "epoch": 2250} {"train_loss": -6.190585136413574, "global_step": 94533, "epoch": 2250} {"train_loss": -6.468245029449463, "global_step": 94534, "epoch": 2250} {"train_loss": -6.237861633300781, "global_step": 94535, "epoch": 2250} {"train_loss": -6.398763656616211, "global_step": 94536, "epoch": 2250} {"train_loss": -6.294042110443115, "global_step": 94537, "epoch": 2250} {"train_loss": -6.263092994689941, "global_step": 94538, "epoch": 2250} {"train_loss": -6.316971778869629, "global_step": 94539, "epoch": 2250} {"train_loss": -6.126774787902832, "global_step": 94540, "epoch": 2250} {"train_loss": -6.301861342929659, "global_step": 94541, "epoch": 2250, "train/sim_max_reward_0": 0.2537357040523988, "train/sim_max_reward_1": 0.33541322764336523, "train/sim_max_reward_2": 0.15554643316758157, "train/sim_max_reward_3": 0.14261304487956003, "train/sim_max_reward_4": 0.3660507730613328, "train/sim_max_reward_5": 0.9885604199629517, "test/sim_max_reward_4400000": 0.15739611677568902, "test/sim_max_reward_4400001": 0.9663271963953733, "test/sim_max_reward_4400002": 0.7628952134679511, "test/sim_max_reward_4400003": 2.5876426711054814e-05, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.825198001704375, "test/sim_max_reward_4400007": 0.004129723987382917, "test/sim_max_reward_4400008": 0.30610237540006835, "test/sim_max_reward_4400009": 0.9560410768738143, "test/sim_max_reward_4400010": 0.2807470955677931, "test/sim_max_reward_4400011": 0.3093842872468245, "test/sim_max_reward_4400012": 0.9345481661863586, "test/sim_max_reward_4400013": 0.5180293257665107, "test/sim_max_reward_4400014": 0.679590349299248, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.10375500108425173, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2065145350006385, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.92747782284751, "test/sim_max_reward_4400023": 0.24639005685662266, "test/sim_max_reward_4400024": 0.25316875973330916, "test/sim_max_reward_4400025": 0.2524285950965142, "test/sim_max_reward_4400026": 0.9142475175136987, "test/sim_max_reward_4400027": 0.03419582884223628, "test/sim_max_reward_4400028": 0.6012085050780857, "test/sim_max_reward_4400029": 0.4773930407511222, "test/sim_max_reward_4400030": 0.9264203707139762, "test/sim_max_reward_4400031": 0.9986311244139865, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.23314650926850128, "test/sim_max_reward_4400034": 0.8847649764915353, "test/sim_max_reward_4400035": 0.4856177063560718, "test/sim_max_reward_4400036": 0.40413959450389453, "test/sim_max_reward_4400037": 0.9268346590073668, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9346327076885418, "test/sim_max_reward_4400042": 0.9061055089879737, "test/sim_max_reward_4400043": 0.8874580429752403, "test/sim_max_reward_4400044": 0.9076662532981079, "test/sim_max_reward_4400045": 0.950824216660731, "test/sim_max_reward_4400046": 0.3162860875840551, "test/sim_max_reward_4400047": 0.9897275483682961, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.7550508661985086, "train/mean_score": 0.373653267127865, "test/mean_score": 0.4939588179279819, "val_loss": 68263.2421875} {"train_loss": -6.288771629333496, "global_step": 94542, "epoch": 2251} {"train_loss": -6.304630279541016, "global_step": 94543, "epoch": 2251} {"train_loss": -6.328359603881836, "global_step": 94544, "epoch": 2251} {"train_loss": -6.278543472290039, "global_step": 94545, "epoch": 2251} {"train_loss": -6.261991500854492, "global_step": 94546, "epoch": 2251} {"train_loss": -6.272778511047363, "global_step": 94547, "epoch": 2251} {"train_loss": -6.415101051330566, "global_step": 94548, "epoch": 2251} {"train_loss": -6.28772497177124, "global_step": 94549, "epoch": 2251} {"train_loss": -6.1628217697143555, "global_step": 94550, "epoch": 2251} {"train_loss": -6.237450122833252, "global_step": 94551, "epoch": 2251} {"train_loss": -6.3310136795043945, "global_step": 94552, "epoch": 2251} {"train_loss": -6.3658833503723145, "global_step": 94553, "epoch": 2251} {"train_loss": -6.343974590301514, "global_step": 94554, "epoch": 2251} {"train_loss": -6.406369209289551, "global_step": 94555, "epoch": 2251} {"train_loss": -6.237513542175293, "global_step": 94556, "epoch": 2251} {"train_loss": -6.271332740783691, "global_step": 94557, "epoch": 2251} {"train_loss": -6.326456069946289, "global_step": 94558, "epoch": 2251} {"train_loss": -6.268946647644043, "global_step": 94559, "epoch": 2251} {"train_loss": -6.344090461730957, "global_step": 94560, "epoch": 2251} {"train_loss": -6.4020915031433105, "global_step": 94561, "epoch": 2251} {"train_loss": -6.43328857421875, "global_step": 94562, "epoch": 2251} {"train_loss": -6.324233055114746, "global_step": 94563, "epoch": 2251} {"train_loss": -6.298158168792725, "global_step": 94564, "epoch": 2251} {"train_loss": -6.260943412780762, "global_step": 94565, "epoch": 2251} {"train_loss": -6.319446086883545, "global_step": 94566, "epoch": 2251} {"train_loss": -6.309482574462891, "global_step": 94567, "epoch": 2251} {"train_loss": -6.318268775939941, "global_step": 94568, "epoch": 2251} {"train_loss": -6.288801670074463, "global_step": 94569, "epoch": 2251} {"train_loss": -6.270965576171875, "global_step": 94570, "epoch": 2251} {"train_loss": -6.372628211975098, "global_step": 94571, "epoch": 2251} {"train_loss": -6.3104753494262695, "global_step": 94572, "epoch": 2251} {"train_loss": -6.3060221672058105, "global_step": 94573, "epoch": 2251} {"train_loss": -6.402957916259766, "global_step": 94574, "epoch": 2251} {"train_loss": -6.33851432800293, "global_step": 94575, "epoch": 2251} {"train_loss": -6.300529479980469, "global_step": 94576, "epoch": 2251} {"train_loss": -6.148007392883301, "global_step": 94577, "epoch": 2251} {"train_loss": -6.207152366638184, "global_step": 94578, "epoch": 2251} {"train_loss": -6.331282138824463, "global_step": 94579, "epoch": 2251} {"train_loss": -6.15462064743042, "global_step": 94580, "epoch": 2251} {"train_loss": -6.281245231628418, "global_step": 94581, "epoch": 2251} {"train_loss": -6.341888427734375, "global_step": 94582, "epoch": 2251} {"train_loss": -6.303269863128662, "global_step": 94583, "epoch": 2251, "val_loss": 67871.6875} {"train_loss": -6.422130584716797, "global_step": 94584, "epoch": 2252} {"train_loss": -6.285283088684082, "global_step": 94585, "epoch": 2252} {"train_loss": -6.249053001403809, "global_step": 94586, "epoch": 2252} {"train_loss": -6.247363567352295, "global_step": 94587, "epoch": 2252} {"train_loss": -6.315847396850586, "global_step": 94588, "epoch": 2252} {"train_loss": -6.251403331756592, "global_step": 94589, "epoch": 2252} {"train_loss": -6.222996234893799, "global_step": 94590, "epoch": 2252} {"train_loss": -6.342304229736328, "global_step": 94591, "epoch": 2252} {"train_loss": -6.322326183319092, "global_step": 94592, "epoch": 2252} {"train_loss": -6.308546543121338, "global_step": 94593, "epoch": 2252} {"train_loss": -6.330183029174805, "global_step": 94594, "epoch": 2252} {"train_loss": -6.3008832931518555, "global_step": 94595, "epoch": 2252} {"train_loss": -6.347894668579102, "global_step": 94596, "epoch": 2252} {"train_loss": -6.264558792114258, "global_step": 94597, "epoch": 2252} {"train_loss": -6.382834434509277, "global_step": 94598, "epoch": 2252} {"train_loss": -6.213762283325195, "global_step": 94599, "epoch": 2252} {"train_loss": -6.25389289855957, "global_step": 94600, "epoch": 2252} {"train_loss": -6.307238578796387, "global_step": 94601, "epoch": 2252} {"train_loss": -6.229310989379883, "global_step": 94602, "epoch": 2252} {"train_loss": -6.344595909118652, "global_step": 94603, "epoch": 2252} {"train_loss": -6.223528861999512, "global_step": 94604, "epoch": 2252} {"train_loss": -6.297429084777832, "global_step": 94605, "epoch": 2252} {"train_loss": -6.265779495239258, "global_step": 94606, "epoch": 2252} {"train_loss": -6.353043556213379, "global_step": 94607, "epoch": 2252} {"train_loss": -6.40338134765625, "global_step": 94608, "epoch": 2252} {"train_loss": -6.38716983795166, "global_step": 94609, "epoch": 2252} {"train_loss": -6.294695854187012, "global_step": 94610, "epoch": 2252} {"train_loss": -6.285400867462158, "global_step": 94611, "epoch": 2252} {"train_loss": -6.319331169128418, "global_step": 94612, "epoch": 2252} {"train_loss": -6.259078025817871, "global_step": 94613, "epoch": 2252} {"train_loss": -6.247297286987305, "global_step": 94614, "epoch": 2252} {"train_loss": -6.360754013061523, "global_step": 94615, "epoch": 2252} {"train_loss": -6.24046516418457, "global_step": 94616, "epoch": 2252} {"train_loss": -6.226537704467773, "global_step": 94617, "epoch": 2252} {"train_loss": -6.3452348709106445, "global_step": 94618, "epoch": 2252} {"train_loss": -6.351058006286621, "global_step": 94619, "epoch": 2252} {"train_loss": -6.214759826660156, "global_step": 94620, "epoch": 2252} {"train_loss": -6.252541542053223, "global_step": 94621, "epoch": 2252} {"train_loss": -6.267620086669922, "global_step": 94622, "epoch": 2252} {"train_loss": -6.276026725769043, "global_step": 94623, "epoch": 2252} {"train_loss": -6.364007472991943, "global_step": 94624, "epoch": 2252} {"train_loss": -6.297965969358172, "global_step": 94625, "epoch": 2252, "val_loss": 67798.609375} {"train_loss": -6.357419967651367, "global_step": 94626, "epoch": 2253} {"train_loss": -6.330699920654297, "global_step": 94627, "epoch": 2253} {"train_loss": -6.286415100097656, "global_step": 94628, "epoch": 2253} {"train_loss": -6.3446245193481445, "global_step": 94629, "epoch": 2253} {"train_loss": -6.190678119659424, "global_step": 94630, "epoch": 2253} {"train_loss": -6.346477508544922, "global_step": 94631, "epoch": 2253} {"train_loss": -6.313873767852783, "global_step": 94632, "epoch": 2253} {"train_loss": -6.249211311340332, "global_step": 94633, "epoch": 2253} {"train_loss": -6.354975700378418, "global_step": 94634, "epoch": 2253} {"train_loss": -6.349246025085449, "global_step": 94635, "epoch": 2253} {"train_loss": -6.313279151916504, "global_step": 94636, "epoch": 2253} {"train_loss": -6.21811580657959, "global_step": 94637, "epoch": 2253} {"train_loss": -6.338460922241211, "global_step": 94638, "epoch": 2253} {"train_loss": -6.332524299621582, "global_step": 94639, "epoch": 2253} {"train_loss": -6.2621917724609375, "global_step": 94640, "epoch": 2253} {"train_loss": -6.3657684326171875, "global_step": 94641, "epoch": 2253} {"train_loss": -6.273309707641602, "global_step": 94642, "epoch": 2253} {"train_loss": -6.388282299041748, "global_step": 94643, "epoch": 2253} {"train_loss": -6.226811408996582, "global_step": 94644, "epoch": 2253} {"train_loss": -6.303613662719727, "global_step": 94645, "epoch": 2253} {"train_loss": -6.362215042114258, "global_step": 94646, "epoch": 2253} {"train_loss": -6.130080223083496, "global_step": 94647, "epoch": 2253} {"train_loss": -6.365628719329834, "global_step": 94648, "epoch": 2253} {"train_loss": -6.254075050354004, "global_step": 94649, "epoch": 2253} {"train_loss": -6.315253257751465, "global_step": 94650, "epoch": 2253} {"train_loss": -6.408073425292969, "global_step": 94651, "epoch": 2253} {"train_loss": -6.359820365905762, "global_step": 94652, "epoch": 2253} {"train_loss": -6.260761260986328, "global_step": 94653, "epoch": 2253} {"train_loss": -6.128636837005615, "global_step": 94654, "epoch": 2253} {"train_loss": -6.311675548553467, "global_step": 94655, "epoch": 2253} {"train_loss": -6.2818193435668945, "global_step": 94656, "epoch": 2253} {"train_loss": -6.3413543701171875, "global_step": 94657, "epoch": 2253} {"train_loss": -6.25286340713501, "global_step": 94658, "epoch": 2253} {"train_loss": -6.264267921447754, "global_step": 94659, "epoch": 2253} {"train_loss": -6.3337178230285645, "global_step": 94660, "epoch": 2253} {"train_loss": -6.337532043457031, "global_step": 94661, "epoch": 2253} {"train_loss": -6.288865566253662, "global_step": 94662, "epoch": 2253} {"train_loss": -6.162176132202148, "global_step": 94663, "epoch": 2253} {"train_loss": -6.325657367706299, "global_step": 94664, "epoch": 2253} {"train_loss": -6.260891914367676, "global_step": 94665, "epoch": 2253} {"train_loss": -6.309410095214844, "global_step": 94666, "epoch": 2253} {"train_loss": -6.294455460139683, "global_step": 94667, "epoch": 2253, "val_loss": 68186.03125} {"train_loss": -6.234774589538574, "global_step": 94668, "epoch": 2254} {"train_loss": -6.114185333251953, "global_step": 94669, "epoch": 2254} {"train_loss": -6.261233806610107, "global_step": 94670, "epoch": 2254} {"train_loss": -6.310044288635254, "global_step": 94671, "epoch": 2254} {"train_loss": -6.218932628631592, "global_step": 94672, "epoch": 2254} {"train_loss": -6.254839897155762, "global_step": 94673, "epoch": 2254} {"train_loss": -6.1915740966796875, "global_step": 94674, "epoch": 2254} {"train_loss": -6.300788879394531, "global_step": 94675, "epoch": 2254} {"train_loss": -6.287667274475098, "global_step": 94676, "epoch": 2254} {"train_loss": -6.213564395904541, "global_step": 94677, "epoch": 2254} {"train_loss": -6.332554817199707, "global_step": 94678, "epoch": 2254} {"train_loss": -6.269975185394287, "global_step": 94679, "epoch": 2254} {"train_loss": -6.247908592224121, "global_step": 94680, "epoch": 2254} {"train_loss": -6.299546241760254, "global_step": 94681, "epoch": 2254} {"train_loss": -6.209941387176514, "global_step": 94682, "epoch": 2254} {"train_loss": -6.3369598388671875, "global_step": 94683, "epoch": 2254} {"train_loss": -6.430586338043213, "global_step": 94684, "epoch": 2254} {"train_loss": -6.266956806182861, "global_step": 94685, "epoch": 2254} {"train_loss": -6.370165824890137, "global_step": 94686, "epoch": 2254} {"train_loss": -6.212495803833008, "global_step": 94687, "epoch": 2254} {"train_loss": -6.244452476501465, "global_step": 94688, "epoch": 2254} {"train_loss": -6.393532752990723, "global_step": 94689, "epoch": 2254} {"train_loss": -6.293722629547119, "global_step": 94690, "epoch": 2254} {"train_loss": -6.147439956665039, "global_step": 94691, "epoch": 2254} {"train_loss": -6.241933822631836, "global_step": 94692, "epoch": 2254} {"train_loss": -6.318665981292725, "global_step": 94693, "epoch": 2254} {"train_loss": -6.242858409881592, "global_step": 94694, "epoch": 2254} {"train_loss": -6.284032821655273, "global_step": 94695, "epoch": 2254} {"train_loss": -6.234477996826172, "global_step": 94696, "epoch": 2254} {"train_loss": -6.373568534851074, "global_step": 94697, "epoch": 2254} {"train_loss": -6.230083465576172, "global_step": 94698, "epoch": 2254} {"train_loss": -6.244067668914795, "global_step": 94699, "epoch": 2254} {"train_loss": -6.312045097351074, "global_step": 94700, "epoch": 2254} {"train_loss": -6.292242050170898, "global_step": 94701, "epoch": 2254} {"train_loss": -6.169678211212158, "global_step": 94702, "epoch": 2254} {"train_loss": -6.3113908767700195, "global_step": 94703, "epoch": 2254} {"train_loss": -6.202022552490234, "global_step": 94704, "epoch": 2254} {"train_loss": -6.284078598022461, "global_step": 94705, "epoch": 2254} {"train_loss": -6.171509265899658, "global_step": 94706, "epoch": 2254} {"train_loss": -6.199118614196777, "global_step": 94707, "epoch": 2254} {"train_loss": -6.398741245269775, "global_step": 94708, "epoch": 2254} {"train_loss": -6.26753948983692, "global_step": 94709, "epoch": 2254, "val_loss": 67919.671875} {"train_loss": -6.284847736358643, "global_step": 94710, "epoch": 2255} {"train_loss": -6.329471588134766, "global_step": 94711, "epoch": 2255} {"train_loss": -6.315349578857422, "global_step": 94712, "epoch": 2255} {"train_loss": -6.246578693389893, "global_step": 94713, "epoch": 2255} {"train_loss": -6.335677146911621, "global_step": 94714, "epoch": 2255} {"train_loss": -6.362771511077881, "global_step": 94715, "epoch": 2255} {"train_loss": -6.3444719314575195, "global_step": 94716, "epoch": 2255} {"train_loss": -6.22769021987915, "global_step": 94717, "epoch": 2255} {"train_loss": -6.311584949493408, "global_step": 94718, "epoch": 2255} {"train_loss": -6.442609786987305, "global_step": 94719, "epoch": 2255} {"train_loss": -6.384215831756592, "global_step": 94720, "epoch": 2255} {"train_loss": -6.363032341003418, "global_step": 94721, "epoch": 2255} {"train_loss": -6.405741214752197, "global_step": 94722, "epoch": 2255} {"train_loss": -6.303571701049805, "global_step": 94723, "epoch": 2255} {"train_loss": -6.348182678222656, "global_step": 94724, "epoch": 2255} {"train_loss": -6.192233085632324, "global_step": 94725, "epoch": 2255} {"train_loss": -6.282384872436523, "global_step": 94726, "epoch": 2255} {"train_loss": -6.2545623779296875, "global_step": 94727, "epoch": 2255} {"train_loss": -6.1888580322265625, "global_step": 94728, "epoch": 2255} {"train_loss": -6.335196495056152, "global_step": 94729, "epoch": 2255} {"train_loss": -6.378762245178223, "global_step": 94730, "epoch": 2255} {"train_loss": -6.3404669761657715, "global_step": 94731, "epoch": 2255} {"train_loss": -6.304701805114746, "global_step": 94732, "epoch": 2255} {"train_loss": -6.234978675842285, "global_step": 94733, "epoch": 2255} {"train_loss": -6.216599464416504, "global_step": 94734, "epoch": 2255} {"train_loss": -6.200243949890137, "global_step": 94735, "epoch": 2255} {"train_loss": -6.342319965362549, "global_step": 94736, "epoch": 2255} {"train_loss": -6.267237186431885, "global_step": 94737, "epoch": 2255} {"train_loss": -6.2471699714660645, "global_step": 94738, "epoch": 2255} {"train_loss": -6.208255767822266, "global_step": 94739, "epoch": 2255} {"train_loss": -6.279184341430664, "global_step": 94740, "epoch": 2255} {"train_loss": -6.313481330871582, "global_step": 94741, "epoch": 2255} {"train_loss": -6.329342842102051, "global_step": 94742, "epoch": 2255} {"train_loss": -6.25661039352417, "global_step": 94743, "epoch": 2255} {"train_loss": -6.298530578613281, "global_step": 94744, "epoch": 2255} {"train_loss": -6.356526851654053, "global_step": 94745, "epoch": 2255} {"train_loss": -6.390937328338623, "global_step": 94746, "epoch": 2255} {"train_loss": -6.382903575897217, "global_step": 94747, "epoch": 2255} {"train_loss": -6.277133941650391, "global_step": 94748, "epoch": 2255} {"train_loss": -6.372409820556641, "global_step": 94749, "epoch": 2255} {"train_loss": -6.429451942443848, "global_step": 94750, "epoch": 2255} {"train_loss": -6.3111950897035145, "global_step": 94751, "epoch": 2255, "val_loss": 67950.28125} {"train_loss": -6.432598114013672, "global_step": 94752, "epoch": 2256} {"train_loss": -6.299327850341797, "global_step": 94753, "epoch": 2256} {"train_loss": -6.221351146697998, "global_step": 94754, "epoch": 2256} {"train_loss": -6.323952674865723, "global_step": 94755, "epoch": 2256} {"train_loss": -6.344965934753418, "global_step": 94756, "epoch": 2256} {"train_loss": -6.351980209350586, "global_step": 94757, "epoch": 2256} {"train_loss": -6.234978199005127, "global_step": 94758, "epoch": 2256} {"train_loss": -6.333020210266113, "global_step": 94759, "epoch": 2256} {"train_loss": -6.298680305480957, "global_step": 94760, "epoch": 2256} {"train_loss": -6.260576248168945, "global_step": 94761, "epoch": 2256} {"train_loss": -6.258569717407227, "global_step": 94762, "epoch": 2256} {"train_loss": -6.265225887298584, "global_step": 94763, "epoch": 2256} {"train_loss": -6.347977638244629, "global_step": 94764, "epoch": 2256} {"train_loss": -6.289382457733154, "global_step": 94765, "epoch": 2256} {"train_loss": -6.31618595123291, "global_step": 94766, "epoch": 2256} {"train_loss": -6.274375915527344, "global_step": 94767, "epoch": 2256} {"train_loss": -6.2395920753479, "global_step": 94768, "epoch": 2256} {"train_loss": -6.169182777404785, "global_step": 94769, "epoch": 2256} {"train_loss": -6.123093605041504, "global_step": 94770, "epoch": 2256} {"train_loss": -6.295354843139648, "global_step": 94771, "epoch": 2256} {"train_loss": -6.258732795715332, "global_step": 94772, "epoch": 2256} {"train_loss": -6.3915252685546875, "global_step": 94773, "epoch": 2256} {"train_loss": -6.239927768707275, "global_step": 94774, "epoch": 2256} {"train_loss": -6.226758003234863, "global_step": 94775, "epoch": 2256} {"train_loss": -6.199728488922119, "global_step": 94776, "epoch": 2256} {"train_loss": -6.233894348144531, "global_step": 94777, "epoch": 2256} {"train_loss": -6.211153984069824, "global_step": 94778, "epoch": 2256} {"train_loss": -6.295590400695801, "global_step": 94779, "epoch": 2256} {"train_loss": -6.381969451904297, "global_step": 94780, "epoch": 2256} {"train_loss": -6.179725170135498, "global_step": 94781, "epoch": 2256} {"train_loss": -6.272701740264893, "global_step": 94782, "epoch": 2256} {"train_loss": -6.345306873321533, "global_step": 94783, "epoch": 2256} {"train_loss": -6.330127716064453, "global_step": 94784, "epoch": 2256} {"train_loss": -6.371090888977051, "global_step": 94785, "epoch": 2256} {"train_loss": -6.259174346923828, "global_step": 94786, "epoch": 2256} {"train_loss": -6.250997066497803, "global_step": 94787, "epoch": 2256} {"train_loss": -6.2830400466918945, "global_step": 94788, "epoch": 2256} {"train_loss": -6.386406421661377, "global_step": 94789, "epoch": 2256} {"train_loss": -6.266644477844238, "global_step": 94790, "epoch": 2256} {"train_loss": -6.232298851013184, "global_step": 94791, "epoch": 2256} {"train_loss": -6.220064640045166, "global_step": 94792, "epoch": 2256} {"train_loss": -6.279634487061274, "global_step": 94793, "epoch": 2256, "val_loss": 68166.4453125} {"train_loss": -6.258763313293457, "global_step": 94794, "epoch": 2257} {"train_loss": -6.372711658477783, "global_step": 94795, "epoch": 2257} {"train_loss": -6.334896564483643, "global_step": 94796, "epoch": 2257} {"train_loss": -6.268409729003906, "global_step": 94797, "epoch": 2257} {"train_loss": -6.2482709884643555, "global_step": 94798, "epoch": 2257} {"train_loss": -6.423269748687744, "global_step": 94799, "epoch": 2257} {"train_loss": -6.283390998840332, "global_step": 94800, "epoch": 2257} {"train_loss": -6.143609523773193, "global_step": 94801, "epoch": 2257} {"train_loss": -6.260158061981201, "global_step": 94802, "epoch": 2257} {"train_loss": -6.297471046447754, "global_step": 94803, "epoch": 2257} {"train_loss": -6.128927230834961, "global_step": 94804, "epoch": 2257} {"train_loss": -6.321660995483398, "global_step": 94805, "epoch": 2257} {"train_loss": -6.327181816101074, "global_step": 94806, "epoch": 2257} {"train_loss": -6.178524494171143, "global_step": 94807, "epoch": 2257} {"train_loss": -6.256937026977539, "global_step": 94808, "epoch": 2257} {"train_loss": -6.259144306182861, "global_step": 94809, "epoch": 2257} {"train_loss": -6.3970561027526855, "global_step": 94810, "epoch": 2257} {"train_loss": -6.251028060913086, "global_step": 94811, "epoch": 2257} {"train_loss": -6.255953788757324, "global_step": 94812, "epoch": 2257} {"train_loss": -6.292079448699951, "global_step": 94813, "epoch": 2257} {"train_loss": -6.275527477264404, "global_step": 94814, "epoch": 2257} {"train_loss": -6.2841267585754395, "global_step": 94815, "epoch": 2257} {"train_loss": -6.28049373626709, "global_step": 94816, "epoch": 2257} {"train_loss": -6.340218544006348, "global_step": 94817, "epoch": 2257} {"train_loss": -6.269272804260254, "global_step": 94818, "epoch": 2257} {"train_loss": -6.285271644592285, "global_step": 94819, "epoch": 2257} {"train_loss": -6.24056339263916, "global_step": 94820, "epoch": 2257} {"train_loss": -6.279682159423828, "global_step": 94821, "epoch": 2257} {"train_loss": -6.220630168914795, "global_step": 94822, "epoch": 2257} {"train_loss": -6.275888442993164, "global_step": 94823, "epoch": 2257} {"train_loss": -6.288697242736816, "global_step": 94824, "epoch": 2257} {"train_loss": -6.304394721984863, "global_step": 94825, "epoch": 2257} {"train_loss": -6.2378339767456055, "global_step": 94826, "epoch": 2257} {"train_loss": -6.224175453186035, "global_step": 94827, "epoch": 2257} {"train_loss": -6.266519546508789, "global_step": 94828, "epoch": 2257} {"train_loss": -6.2190351486206055, "global_step": 94829, "epoch": 2257} {"train_loss": -6.239529609680176, "global_step": 94830, "epoch": 2257} {"train_loss": -6.213295936584473, "global_step": 94831, "epoch": 2257} {"train_loss": -6.228446006774902, "global_step": 94832, "epoch": 2257} {"train_loss": -6.227827072143555, "global_step": 94833, "epoch": 2257} {"train_loss": -6.252253532409668, "global_step": 94834, "epoch": 2257} {"train_loss": -6.267146065121605, "global_step": 94835, "epoch": 2257, "val_loss": 68057.3515625} {"train_loss": -6.286041736602783, "global_step": 94836, "epoch": 2258} {"train_loss": -6.221403121948242, "global_step": 94837, "epoch": 2258} {"train_loss": -6.113471984863281, "global_step": 94838, "epoch": 2258} {"train_loss": -6.232405662536621, "global_step": 94839, "epoch": 2258} {"train_loss": -6.178864479064941, "global_step": 94840, "epoch": 2258} {"train_loss": -6.17191743850708, "global_step": 94841, "epoch": 2258} {"train_loss": -6.233554840087891, "global_step": 94842, "epoch": 2258} {"train_loss": -6.346364974975586, "global_step": 94843, "epoch": 2258} {"train_loss": -6.333107948303223, "global_step": 94844, "epoch": 2258} {"train_loss": -6.319385528564453, "global_step": 94845, "epoch": 2258} {"train_loss": -6.2378621101379395, "global_step": 94846, "epoch": 2258} {"train_loss": -6.3277692794799805, "global_step": 94847, "epoch": 2258} {"train_loss": -6.271919250488281, "global_step": 94848, "epoch": 2258} {"train_loss": -6.372081279754639, "global_step": 94849, "epoch": 2258} {"train_loss": -6.352662086486816, "global_step": 94850, "epoch": 2258} {"train_loss": -6.315210342407227, "global_step": 94851, "epoch": 2258} {"train_loss": -6.387526988983154, "global_step": 94852, "epoch": 2258} {"train_loss": -6.308073043823242, "global_step": 94853, "epoch": 2258} {"train_loss": -6.233711242675781, "global_step": 94854, "epoch": 2258} {"train_loss": -6.281919956207275, "global_step": 94855, "epoch": 2258} {"train_loss": -6.232760906219482, "global_step": 94856, "epoch": 2258} {"train_loss": -6.265401363372803, "global_step": 94857, "epoch": 2258} {"train_loss": -6.198180198669434, "global_step": 94858, "epoch": 2258} {"train_loss": -6.29911994934082, "global_step": 94859, "epoch": 2258} {"train_loss": -6.372957229614258, "global_step": 94860, "epoch": 2258} {"train_loss": -6.295283317565918, "global_step": 94861, "epoch": 2258} {"train_loss": -6.268310546875, "global_step": 94862, "epoch": 2258} {"train_loss": -6.297645568847656, "global_step": 94863, "epoch": 2258} {"train_loss": -6.220461368560791, "global_step": 94864, "epoch": 2258} {"train_loss": -6.200865745544434, "global_step": 94865, "epoch": 2258} {"train_loss": -6.271641731262207, "global_step": 94866, "epoch": 2258} {"train_loss": -6.267381191253662, "global_step": 94867, "epoch": 2258} {"train_loss": -6.225063323974609, "global_step": 94868, "epoch": 2258} {"train_loss": -6.276351451873779, "global_step": 94869, "epoch": 2258} {"train_loss": -6.467448711395264, "global_step": 94870, "epoch": 2258} {"train_loss": -6.276291370391846, "global_step": 94871, "epoch": 2258} {"train_loss": -6.213294982910156, "global_step": 94872, "epoch": 2258} {"train_loss": -6.361566543579102, "global_step": 94873, "epoch": 2258} {"train_loss": -6.406105995178223, "global_step": 94874, "epoch": 2258} {"train_loss": -6.301991939544678, "global_step": 94875, "epoch": 2258} {"train_loss": -6.278724193572998, "global_step": 94876, "epoch": 2258} {"train_loss": -6.282185259319487, "global_step": 94877, "epoch": 2258, "val_loss": 67909.1484375} {"train_loss": -6.437090873718262, "global_step": 94878, "epoch": 2259} {"train_loss": -6.362762451171875, "global_step": 94879, "epoch": 2259} {"train_loss": -6.406149387359619, "global_step": 94880, "epoch": 2259} {"train_loss": -6.173446178436279, "global_step": 94881, "epoch": 2259} {"train_loss": -6.345376014709473, "global_step": 94882, "epoch": 2259} {"train_loss": -6.241145610809326, "global_step": 94883, "epoch": 2259} {"train_loss": -6.405162334442139, "global_step": 94884, "epoch": 2259} {"train_loss": -6.2922773361206055, "global_step": 94885, "epoch": 2259} {"train_loss": -6.3309102058410645, "global_step": 94886, "epoch": 2259} {"train_loss": -6.376274108886719, "global_step": 94887, "epoch": 2259} {"train_loss": -6.243206024169922, "global_step": 94888, "epoch": 2259} {"train_loss": -6.2515869140625, "global_step": 94889, "epoch": 2259} {"train_loss": -6.247957229614258, "global_step": 94890, "epoch": 2259} {"train_loss": -6.332285404205322, "global_step": 94891, "epoch": 2259} {"train_loss": -6.322269439697266, "global_step": 94892, "epoch": 2259} {"train_loss": -6.293338298797607, "global_step": 94893, "epoch": 2259} {"train_loss": -6.273951530456543, "global_step": 94894, "epoch": 2259} {"train_loss": -6.349091529846191, "global_step": 94895, "epoch": 2259} {"train_loss": -6.268579006195068, "global_step": 94896, "epoch": 2259} {"train_loss": -6.311620235443115, "global_step": 94897, "epoch": 2259} {"train_loss": -6.371735572814941, "global_step": 94898, "epoch": 2259} {"train_loss": -6.12806510925293, "global_step": 94899, "epoch": 2259} {"train_loss": -6.287109375, "global_step": 94900, "epoch": 2259} {"train_loss": -6.18594217300415, "global_step": 94901, "epoch": 2259} {"train_loss": -6.150653839111328, "global_step": 94902, "epoch": 2259} {"train_loss": -6.400472640991211, "global_step": 94903, "epoch": 2259} {"train_loss": -6.2292704582214355, "global_step": 94904, "epoch": 2259} {"train_loss": -6.306492328643799, "global_step": 94905, "epoch": 2259} {"train_loss": -6.269266128540039, "global_step": 94906, "epoch": 2259} {"train_loss": -6.182933807373047, "global_step": 94907, "epoch": 2259} {"train_loss": -6.283572196960449, "global_step": 94908, "epoch": 2259} {"train_loss": -6.3336896896362305, "global_step": 94909, "epoch": 2259} {"train_loss": -6.195823669433594, "global_step": 94910, "epoch": 2259} {"train_loss": -6.127651214599609, "global_step": 94911, "epoch": 2259} {"train_loss": -6.349069595336914, "global_step": 94912, "epoch": 2259} {"train_loss": -6.220864295959473, "global_step": 94913, "epoch": 2259} {"train_loss": -6.134138107299805, "global_step": 94914, "epoch": 2259} {"train_loss": -6.218715667724609, "global_step": 94915, "epoch": 2259} {"train_loss": -6.288429260253906, "global_step": 94916, "epoch": 2259} {"train_loss": -6.099509239196777, "global_step": 94917, "epoch": 2259} {"train_loss": -6.2625532150268555, "global_step": 94918, "epoch": 2259} {"train_loss": -6.277812446866717, "global_step": 94919, "epoch": 2259, "val_loss": 67888.5078125} {"train_loss": -6.186500549316406, "global_step": 94920, "epoch": 2260} {"train_loss": -6.27437686920166, "global_step": 94921, "epoch": 2260} {"train_loss": -6.3022589683532715, "global_step": 94922, "epoch": 2260} {"train_loss": -6.297959804534912, "global_step": 94923, "epoch": 2260} {"train_loss": -6.334617614746094, "global_step": 94924, "epoch": 2260} {"train_loss": -6.3953447341918945, "global_step": 94925, "epoch": 2260} {"train_loss": -6.313076019287109, "global_step": 94926, "epoch": 2260} {"train_loss": -6.286151885986328, "global_step": 94927, "epoch": 2260} {"train_loss": -6.2349443435668945, "global_step": 94928, "epoch": 2260} {"train_loss": -6.310878753662109, "global_step": 94929, "epoch": 2260} {"train_loss": -6.362876892089844, "global_step": 94930, "epoch": 2260} {"train_loss": -6.344963073730469, "global_step": 94931, "epoch": 2260} {"train_loss": -6.400510787963867, "global_step": 94932, "epoch": 2260} {"train_loss": -6.24630880355835, "global_step": 94933, "epoch": 2260} {"train_loss": -6.223107814788818, "global_step": 94934, "epoch": 2260} {"train_loss": -6.2980756759643555, "global_step": 94935, "epoch": 2260} {"train_loss": -6.287579536437988, "global_step": 94936, "epoch": 2260} {"train_loss": -6.323708534240723, "global_step": 94937, "epoch": 2260} {"train_loss": -6.227420806884766, "global_step": 94938, "epoch": 2260} {"train_loss": -6.305240631103516, "global_step": 94939, "epoch": 2260} {"train_loss": -6.339883804321289, "global_step": 94940, "epoch": 2260} {"train_loss": -6.271949768066406, "global_step": 94941, "epoch": 2260} {"train_loss": -6.348441123962402, "global_step": 94942, "epoch": 2260} {"train_loss": -6.302325248718262, "global_step": 94943, "epoch": 2260} {"train_loss": -6.217001914978027, "global_step": 94944, "epoch": 2260} {"train_loss": -6.371753692626953, "global_step": 94945, "epoch": 2260} {"train_loss": -6.278491020202637, "global_step": 94946, "epoch": 2260} {"train_loss": -6.247500896453857, "global_step": 94947, "epoch": 2260} {"train_loss": -6.318382263183594, "global_step": 94948, "epoch": 2260} {"train_loss": -6.29775333404541, "global_step": 94949, "epoch": 2260} {"train_loss": -6.4061503410339355, "global_step": 94950, "epoch": 2260} {"train_loss": -6.102115631103516, "global_step": 94951, "epoch": 2260} {"train_loss": -6.22150993347168, "global_step": 94952, "epoch": 2260} {"train_loss": -6.151302814483643, "global_step": 94953, "epoch": 2260} {"train_loss": -6.21156120300293, "global_step": 94954, "epoch": 2260} {"train_loss": -6.265478134155273, "global_step": 94955, "epoch": 2260} {"train_loss": -6.195937156677246, "global_step": 94956, "epoch": 2260} {"train_loss": -6.186714172363281, "global_step": 94957, "epoch": 2260} {"train_loss": -6.286993026733398, "global_step": 94958, "epoch": 2260} {"train_loss": -6.207562446594238, "global_step": 94959, "epoch": 2260} {"train_loss": -6.171372890472412, "global_step": 94960, "epoch": 2260} {"train_loss": -6.273811987468174, "global_step": 94961, "epoch": 2260, "val_loss": 68075.1484375} {"train_loss": -6.212874412536621, "global_step": 94962, "epoch": 2261} {"train_loss": -6.295424461364746, "global_step": 94963, "epoch": 2261} {"train_loss": -6.347475528717041, "global_step": 94964, "epoch": 2261} {"train_loss": -6.20732307434082, "global_step": 94965, "epoch": 2261} {"train_loss": -6.160562992095947, "global_step": 94966, "epoch": 2261} {"train_loss": -6.185544013977051, "global_step": 94967, "epoch": 2261} {"train_loss": -6.1348724365234375, "global_step": 94968, "epoch": 2261} {"train_loss": -6.2374749183654785, "global_step": 94969, "epoch": 2261} {"train_loss": -6.136144161224365, "global_step": 94970, "epoch": 2261} {"train_loss": -6.25868034362793, "global_step": 94971, "epoch": 2261} {"train_loss": -6.051203727722168, "global_step": 94972, "epoch": 2261} {"train_loss": -6.151355743408203, "global_step": 94973, "epoch": 2261} {"train_loss": -6.142241477966309, "global_step": 94974, "epoch": 2261} {"train_loss": -6.219362258911133, "global_step": 94975, "epoch": 2261} {"train_loss": -6.175374507904053, "global_step": 94976, "epoch": 2261} {"train_loss": -6.1993560791015625, "global_step": 94977, "epoch": 2261} {"train_loss": -6.246048927307129, "global_step": 94978, "epoch": 2261} {"train_loss": -6.036827087402344, "global_step": 94979, "epoch": 2261} {"train_loss": -6.186470985412598, "global_step": 94980, "epoch": 2261} {"train_loss": -6.227326393127441, "global_step": 94981, "epoch": 2261} {"train_loss": -6.2440290451049805, "global_step": 94982, "epoch": 2261} {"train_loss": -6.290378570556641, "global_step": 94983, "epoch": 2261} {"train_loss": -6.29991340637207, "global_step": 94984, "epoch": 2261} {"train_loss": -6.161831855773926, "global_step": 94985, "epoch": 2261} {"train_loss": -6.279292106628418, "global_step": 94986, "epoch": 2261} {"train_loss": -6.2766571044921875, "global_step": 94987, "epoch": 2261} {"train_loss": -6.267389297485352, "global_step": 94988, "epoch": 2261} {"train_loss": -6.252235412597656, "global_step": 94989, "epoch": 2261} {"train_loss": -6.252758979797363, "global_step": 94990, "epoch": 2261} {"train_loss": -6.193113327026367, "global_step": 94991, "epoch": 2261} {"train_loss": -6.211018085479736, "global_step": 94992, "epoch": 2261} {"train_loss": -6.146641731262207, "global_step": 94993, "epoch": 2261} {"train_loss": -6.3211188316345215, "global_step": 94994, "epoch": 2261} {"train_loss": -6.210082054138184, "global_step": 94995, "epoch": 2261} {"train_loss": -6.121735572814941, "global_step": 94996, "epoch": 2261} {"train_loss": -6.307365417480469, "global_step": 94997, "epoch": 2261} {"train_loss": -6.273285865783691, "global_step": 94998, "epoch": 2261} {"train_loss": -6.298285961151123, "global_step": 94999, "epoch": 2261} {"train_loss": -6.240169525146484, "global_step": 95000, "epoch": 2261} {"train_loss": -6.277450084686279, "global_step": 95001, "epoch": 2261} {"train_loss": -6.221278190612793, "global_step": 95002, "epoch": 2261} {"train_loss": -6.2202445098332, "global_step": 95003, "epoch": 2261, "val_loss": 67963.4765625} {"train_loss": -6.297749042510986, "global_step": 95004, "epoch": 2262} {"train_loss": -6.274833679199219, "global_step": 95005, "epoch": 2262} {"train_loss": -6.27064323425293, "global_step": 95006, "epoch": 2262} {"train_loss": -6.258242607116699, "global_step": 95007, "epoch": 2262} {"train_loss": -6.218092918395996, "global_step": 95008, "epoch": 2262} {"train_loss": -6.335391998291016, "global_step": 95009, "epoch": 2262} {"train_loss": -6.305656909942627, "global_step": 95010, "epoch": 2262} {"train_loss": -6.178091526031494, "global_step": 95011, "epoch": 2262} {"train_loss": -6.338926315307617, "global_step": 95012, "epoch": 2262} {"train_loss": -6.155020713806152, "global_step": 95013, "epoch": 2262} {"train_loss": -6.294126987457275, "global_step": 95014, "epoch": 2262} {"train_loss": -6.2852277755737305, "global_step": 95015, "epoch": 2262} {"train_loss": -6.230237007141113, "global_step": 95016, "epoch": 2262} {"train_loss": -6.367134094238281, "global_step": 95017, "epoch": 2262} {"train_loss": -6.4587082862854, "global_step": 95018, "epoch": 2262} {"train_loss": -6.339728355407715, "global_step": 95019, "epoch": 2262} {"train_loss": -6.254545211791992, "global_step": 95020, "epoch": 2262} {"train_loss": -6.371281147003174, "global_step": 95021, "epoch": 2262} {"train_loss": -6.305109977722168, "global_step": 95022, "epoch": 2262} {"train_loss": -6.382011413574219, "global_step": 95023, "epoch": 2262} {"train_loss": -6.380264759063721, "global_step": 95024, "epoch": 2262} {"train_loss": -6.457127571105957, "global_step": 95025, "epoch": 2262} {"train_loss": -6.326010227203369, "global_step": 95026, "epoch": 2262} {"train_loss": -6.328394412994385, "global_step": 95027, "epoch": 2262} {"train_loss": -6.274977684020996, "global_step": 95028, "epoch": 2262} {"train_loss": -6.284998893737793, "global_step": 95029, "epoch": 2262} {"train_loss": -6.2264556884765625, "global_step": 95030, "epoch": 2262} {"train_loss": -6.29688024520874, "global_step": 95031, "epoch": 2262} {"train_loss": -6.348878860473633, "global_step": 95032, "epoch": 2262} {"train_loss": -6.278633117675781, "global_step": 95033, "epoch": 2262} {"train_loss": -6.390499114990234, "global_step": 95034, "epoch": 2262} {"train_loss": -6.354841232299805, "global_step": 95035, "epoch": 2262} {"train_loss": -6.257567405700684, "global_step": 95036, "epoch": 2262} {"train_loss": -6.280756950378418, "global_step": 95037, "epoch": 2262} {"train_loss": -6.233031749725342, "global_step": 95038, "epoch": 2262} {"train_loss": -6.333744049072266, "global_step": 95039, "epoch": 2262} {"train_loss": -6.204680442810059, "global_step": 95040, "epoch": 2262} {"train_loss": -6.222155570983887, "global_step": 95041, "epoch": 2262} {"train_loss": -6.203524589538574, "global_step": 95042, "epoch": 2262} {"train_loss": -6.293279647827148, "global_step": 95043, "epoch": 2262} {"train_loss": -6.357080936431885, "global_step": 95044, "epoch": 2262} {"train_loss": -6.29670854977199, "global_step": 95045, "epoch": 2262, "val_loss": 68040.0859375} {"train_loss": -6.306278705596924, "global_step": 95046, "epoch": 2263} {"train_loss": -6.307476043701172, "global_step": 95047, "epoch": 2263} {"train_loss": -6.294716835021973, "global_step": 95048, "epoch": 2263} {"train_loss": -6.4386491775512695, "global_step": 95049, "epoch": 2263} {"train_loss": -6.306744575500488, "global_step": 95050, "epoch": 2263} {"train_loss": -6.300457000732422, "global_step": 95051, "epoch": 2263} {"train_loss": -6.3307342529296875, "global_step": 95052, "epoch": 2263} {"train_loss": -6.346105575561523, "global_step": 95053, "epoch": 2263} {"train_loss": -6.4697089195251465, "global_step": 95054, "epoch": 2263} {"train_loss": -6.299172401428223, "global_step": 95055, "epoch": 2263} {"train_loss": -6.251341342926025, "global_step": 95056, "epoch": 2263} {"train_loss": -6.330967903137207, "global_step": 95057, "epoch": 2263} {"train_loss": -6.27437686920166, "global_step": 95058, "epoch": 2263} {"train_loss": -6.332923412322998, "global_step": 95059, "epoch": 2263} {"train_loss": -6.190101623535156, "global_step": 95060, "epoch": 2263} {"train_loss": -6.425034046173096, "global_step": 95061, "epoch": 2263} {"train_loss": -6.199583053588867, "global_step": 95062, "epoch": 2263} {"train_loss": -6.281032562255859, "global_step": 95063, "epoch": 2263} {"train_loss": -6.376930236816406, "global_step": 95064, "epoch": 2263} {"train_loss": -6.314786911010742, "global_step": 95065, "epoch": 2263} {"train_loss": -6.303267002105713, "global_step": 95066, "epoch": 2263} {"train_loss": -6.413684844970703, "global_step": 95067, "epoch": 2263} {"train_loss": -6.256962776184082, "global_step": 95068, "epoch": 2263} {"train_loss": -6.254655361175537, "global_step": 95069, "epoch": 2263} {"train_loss": -6.3684844970703125, "global_step": 95070, "epoch": 2263} {"train_loss": -6.272003173828125, "global_step": 95071, "epoch": 2263} {"train_loss": -6.297758102416992, "global_step": 95072, "epoch": 2263} {"train_loss": -6.33056640625, "global_step": 95073, "epoch": 2263} {"train_loss": -6.424844741821289, "global_step": 95074, "epoch": 2263} {"train_loss": -6.347537994384766, "global_step": 95075, "epoch": 2263} {"train_loss": -6.368474006652832, "global_step": 95076, "epoch": 2263} {"train_loss": -6.323984622955322, "global_step": 95077, "epoch": 2263} {"train_loss": -6.2734761238098145, "global_step": 95078, "epoch": 2263} {"train_loss": -6.278992652893066, "global_step": 95079, "epoch": 2263} {"train_loss": -6.114123821258545, "global_step": 95080, "epoch": 2263} {"train_loss": -6.169272422790527, "global_step": 95081, "epoch": 2263} {"train_loss": -6.305335998535156, "global_step": 95082, "epoch": 2263} {"train_loss": -6.344954490661621, "global_step": 95083, "epoch": 2263} {"train_loss": -6.365201950073242, "global_step": 95084, "epoch": 2263} {"train_loss": -6.237448692321777, "global_step": 95085, "epoch": 2263} {"train_loss": -6.267399787902832, "global_step": 95086, "epoch": 2263} {"train_loss": -6.308751991816929, "global_step": 95087, "epoch": 2263, "val_loss": 67839.1484375} {"train_loss": -6.263969421386719, "global_step": 95088, "epoch": 2264} {"train_loss": -6.229273796081543, "global_step": 95089, "epoch": 2264} {"train_loss": -6.4746246337890625, "global_step": 95090, "epoch": 2264} {"train_loss": -6.450693130493164, "global_step": 95091, "epoch": 2264} {"train_loss": -6.286548614501953, "global_step": 95092, "epoch": 2264} {"train_loss": -6.383200645446777, "global_step": 95093, "epoch": 2264} {"train_loss": -6.332304954528809, "global_step": 95094, "epoch": 2264} {"train_loss": -6.3357086181640625, "global_step": 95095, "epoch": 2264} {"train_loss": -6.280410289764404, "global_step": 95096, "epoch": 2264} {"train_loss": -6.22502326965332, "global_step": 95097, "epoch": 2264} {"train_loss": -6.21150016784668, "global_step": 95098, "epoch": 2264} {"train_loss": -6.302254676818848, "global_step": 95099, "epoch": 2264} {"train_loss": -6.248101234436035, "global_step": 95100, "epoch": 2264} {"train_loss": -6.2415547370910645, "global_step": 95101, "epoch": 2264} {"train_loss": -6.3067216873168945, "global_step": 95102, "epoch": 2264} {"train_loss": -6.459409236907959, "global_step": 95103, "epoch": 2264} {"train_loss": -6.28913688659668, "global_step": 95104, "epoch": 2264} {"train_loss": -6.211566925048828, "global_step": 95105, "epoch": 2264} {"train_loss": -6.306638717651367, "global_step": 95106, "epoch": 2264} {"train_loss": -6.220047950744629, "global_step": 95107, "epoch": 2264} {"train_loss": -6.418056488037109, "global_step": 95108, "epoch": 2264} {"train_loss": -6.270310401916504, "global_step": 95109, "epoch": 2264} {"train_loss": -6.343050956726074, "global_step": 95110, "epoch": 2264} {"train_loss": -6.288042068481445, "global_step": 95111, "epoch": 2264} {"train_loss": -6.365293025970459, "global_step": 95112, "epoch": 2264} {"train_loss": -6.350042343139648, "global_step": 95113, "epoch": 2264} {"train_loss": -6.228787899017334, "global_step": 95114, "epoch": 2264} {"train_loss": -6.395817756652832, "global_step": 95115, "epoch": 2264} {"train_loss": -6.324406623840332, "global_step": 95116, "epoch": 2264} {"train_loss": -6.251160621643066, "global_step": 95117, "epoch": 2264} {"train_loss": -6.299312114715576, "global_step": 95118, "epoch": 2264} {"train_loss": -6.336773872375488, "global_step": 95119, "epoch": 2264} {"train_loss": -6.250540256500244, "global_step": 95120, "epoch": 2264} {"train_loss": -6.263250350952148, "global_step": 95121, "epoch": 2264} {"train_loss": -6.215445041656494, "global_step": 95122, "epoch": 2264} {"train_loss": -6.272176742553711, "global_step": 95123, "epoch": 2264} {"train_loss": -6.331402778625488, "global_step": 95124, "epoch": 2264} {"train_loss": -6.274532318115234, "global_step": 95125, "epoch": 2264} {"train_loss": -6.287572860717773, "global_step": 95126, "epoch": 2264} {"train_loss": -6.107387542724609, "global_step": 95127, "epoch": 2264} {"train_loss": -6.146859645843506, "global_step": 95128, "epoch": 2264} {"train_loss": -6.287632612955003, "global_step": 95129, "epoch": 2264, "val_loss": 68362.8359375} {"train_loss": -6.001830101013184, "global_step": 95130, "epoch": 2265} {"train_loss": -6.132986068725586, "global_step": 95131, "epoch": 2265} {"train_loss": -6.065360069274902, "global_step": 95132, "epoch": 2265} {"train_loss": -6.30750846862793, "global_step": 95133, "epoch": 2265} {"train_loss": -6.100905418395996, "global_step": 95134, "epoch": 2265} {"train_loss": -6.190064430236816, "global_step": 95135, "epoch": 2265} {"train_loss": -6.101166725158691, "global_step": 95136, "epoch": 2265} {"train_loss": -6.2010321617126465, "global_step": 95137, "epoch": 2265} {"train_loss": -6.132920742034912, "global_step": 95138, "epoch": 2265} {"train_loss": -6.236949443817139, "global_step": 95139, "epoch": 2265} {"train_loss": -6.227220058441162, "global_step": 95140, "epoch": 2265} {"train_loss": -6.210904598236084, "global_step": 95141, "epoch": 2265} {"train_loss": -6.20880126953125, "global_step": 95142, "epoch": 2265} {"train_loss": -6.261181831359863, "global_step": 95143, "epoch": 2265} {"train_loss": -6.226965427398682, "global_step": 95144, "epoch": 2265} {"train_loss": -6.118189334869385, "global_step": 95145, "epoch": 2265} {"train_loss": -6.318464279174805, "global_step": 95146, "epoch": 2265} {"train_loss": -6.340256690979004, "global_step": 95147, "epoch": 2265} {"train_loss": -6.205286026000977, "global_step": 95148, "epoch": 2265} {"train_loss": -6.246919631958008, "global_step": 95149, "epoch": 2265} {"train_loss": -6.2634124755859375, "global_step": 95150, "epoch": 2265} {"train_loss": -6.273775100708008, "global_step": 95151, "epoch": 2265} {"train_loss": -6.225741386413574, "global_step": 95152, "epoch": 2265} {"train_loss": -6.346248626708984, "global_step": 95153, "epoch": 2265} {"train_loss": -6.388083457946777, "global_step": 95154, "epoch": 2265} {"train_loss": -6.2014851570129395, "global_step": 95155, "epoch": 2265} {"train_loss": -6.291750907897949, "global_step": 95156, "epoch": 2265} {"train_loss": -6.435532569885254, "global_step": 95157, "epoch": 2265} {"train_loss": -6.331606864929199, "global_step": 95158, "epoch": 2265} {"train_loss": -6.276612281799316, "global_step": 95159, "epoch": 2265} {"train_loss": -6.222708225250244, "global_step": 95160, "epoch": 2265} {"train_loss": -6.269635200500488, "global_step": 95161, "epoch": 2265} {"train_loss": -6.3650288581848145, "global_step": 95162, "epoch": 2265} {"train_loss": -6.247058391571045, "global_step": 95163, "epoch": 2265} {"train_loss": -6.296223163604736, "global_step": 95164, "epoch": 2265} {"train_loss": -6.335447788238525, "global_step": 95165, "epoch": 2265} {"train_loss": -6.259376525878906, "global_step": 95166, "epoch": 2265} {"train_loss": -6.268048286437988, "global_step": 95167, "epoch": 2265} {"train_loss": -6.352752208709717, "global_step": 95168, "epoch": 2265} {"train_loss": -6.388350486755371, "global_step": 95169, "epoch": 2265} {"train_loss": -6.210166931152344, "global_step": 95170, "epoch": 2265} {"train_loss": -6.244046824319022, "global_step": 95171, "epoch": 2265, "val_loss": 67806.4921875} {"train_loss": -6.357454299926758, "global_step": 95172, "epoch": 2266} {"train_loss": -6.205432891845703, "global_step": 95173, "epoch": 2266} {"train_loss": -6.228281021118164, "global_step": 95174, "epoch": 2266} {"train_loss": -6.293756008148193, "global_step": 95175, "epoch": 2266} {"train_loss": -6.271770000457764, "global_step": 95176, "epoch": 2266} {"train_loss": -6.318948268890381, "global_step": 95177, "epoch": 2266} {"train_loss": -6.239436626434326, "global_step": 95178, "epoch": 2266} {"train_loss": -6.275639533996582, "global_step": 95179, "epoch": 2266} {"train_loss": -6.264310836791992, "global_step": 95180, "epoch": 2266} {"train_loss": -6.344723701477051, "global_step": 95181, "epoch": 2266} {"train_loss": -6.273759365081787, "global_step": 95182, "epoch": 2266} {"train_loss": -6.331843852996826, "global_step": 95183, "epoch": 2266} {"train_loss": -6.409419536590576, "global_step": 95184, "epoch": 2266} {"train_loss": -6.207868576049805, "global_step": 95185, "epoch": 2266} {"train_loss": -6.239637851715088, "global_step": 95186, "epoch": 2266} {"train_loss": -6.288830280303955, "global_step": 95187, "epoch": 2266} {"train_loss": -6.376967906951904, "global_step": 95188, "epoch": 2266} {"train_loss": -6.333160877227783, "global_step": 95189, "epoch": 2266} {"train_loss": -6.206347942352295, "global_step": 95190, "epoch": 2266} {"train_loss": -6.2701263427734375, "global_step": 95191, "epoch": 2266} {"train_loss": -6.3010993003845215, "global_step": 95192, "epoch": 2266} {"train_loss": -6.365840435028076, "global_step": 95193, "epoch": 2266} {"train_loss": -6.430421829223633, "global_step": 95194, "epoch": 2266} {"train_loss": -6.2846760749816895, "global_step": 95195, "epoch": 2266} {"train_loss": -6.219740867614746, "global_step": 95196, "epoch": 2266} {"train_loss": -6.294015884399414, "global_step": 95197, "epoch": 2266} {"train_loss": -6.438139915466309, "global_step": 95198, "epoch": 2266} {"train_loss": -6.275453567504883, "global_step": 95199, "epoch": 2266} {"train_loss": -6.28228759765625, "global_step": 95200, "epoch": 2266} {"train_loss": -6.274080276489258, "global_step": 95201, "epoch": 2266} {"train_loss": -6.2983245849609375, "global_step": 95202, "epoch": 2266} {"train_loss": -6.2999267578125, "global_step": 95203, "epoch": 2266} {"train_loss": -6.3878374099731445, "global_step": 95204, "epoch": 2266} {"train_loss": -6.32468843460083, "global_step": 95205, "epoch": 2266} {"train_loss": -6.297713756561279, "global_step": 95206, "epoch": 2266} {"train_loss": -6.177931785583496, "global_step": 95207, "epoch": 2266} {"train_loss": -6.2170305252075195, "global_step": 95208, "epoch": 2266} {"train_loss": -6.451972007751465, "global_step": 95209, "epoch": 2266} {"train_loss": -6.288200378417969, "global_step": 95210, "epoch": 2266} {"train_loss": -6.339819431304932, "global_step": 95211, "epoch": 2266} {"train_loss": -6.327524185180664, "global_step": 95212, "epoch": 2266} {"train_loss": -6.300505286171322, "global_step": 95213, "epoch": 2266, "val_loss": 68033.1796875} {"train_loss": -6.405248641967773, "global_step": 95214, "epoch": 2267} {"train_loss": -6.1671552658081055, "global_step": 95215, "epoch": 2267} {"train_loss": -6.278866767883301, "global_step": 95216, "epoch": 2267} {"train_loss": -6.334535598754883, "global_step": 95217, "epoch": 2267} {"train_loss": -6.2168779373168945, "global_step": 95218, "epoch": 2267} {"train_loss": -6.198123931884766, "global_step": 95219, "epoch": 2267} {"train_loss": -6.338488578796387, "global_step": 95220, "epoch": 2267} {"train_loss": -6.255777359008789, "global_step": 95221, "epoch": 2267} {"train_loss": -6.377959251403809, "global_step": 95222, "epoch": 2267} {"train_loss": -6.210502624511719, "global_step": 95223, "epoch": 2267} {"train_loss": -6.300901412963867, "global_step": 95224, "epoch": 2267} {"train_loss": -6.311688423156738, "global_step": 95225, "epoch": 2267} {"train_loss": -6.265355110168457, "global_step": 95226, "epoch": 2267} {"train_loss": -6.420035362243652, "global_step": 95227, "epoch": 2267} {"train_loss": -6.245949745178223, "global_step": 95228, "epoch": 2267} {"train_loss": -6.301008701324463, "global_step": 95229, "epoch": 2267} {"train_loss": -6.315371513366699, "global_step": 95230, "epoch": 2267} {"train_loss": -6.39923095703125, "global_step": 95231, "epoch": 2267} {"train_loss": -6.3302178382873535, "global_step": 95232, "epoch": 2267} {"train_loss": -6.410336494445801, "global_step": 95233, "epoch": 2267} {"train_loss": -6.319272994995117, "global_step": 95234, "epoch": 2267} {"train_loss": -6.312887191772461, "global_step": 95235, "epoch": 2267} {"train_loss": -6.389446258544922, "global_step": 95236, "epoch": 2267} {"train_loss": -6.250603675842285, "global_step": 95237, "epoch": 2267} {"train_loss": -6.303197383880615, "global_step": 95238, "epoch": 2267} {"train_loss": -6.2646331787109375, "global_step": 95239, "epoch": 2267} {"train_loss": -6.310782432556152, "global_step": 95240, "epoch": 2267} {"train_loss": -6.269898891448975, "global_step": 95241, "epoch": 2267} {"train_loss": -6.315151214599609, "global_step": 95242, "epoch": 2267} {"train_loss": -6.224028587341309, "global_step": 95243, "epoch": 2267} {"train_loss": -6.291938304901123, "global_step": 95244, "epoch": 2267} {"train_loss": -6.113879203796387, "global_step": 95245, "epoch": 2267} {"train_loss": -6.2614850997924805, "global_step": 95246, "epoch": 2267} {"train_loss": -6.399077415466309, "global_step": 95247, "epoch": 2267} {"train_loss": -6.290136337280273, "global_step": 95248, "epoch": 2267} {"train_loss": -6.374807357788086, "global_step": 95249, "epoch": 2267} {"train_loss": -6.237627983093262, "global_step": 95250, "epoch": 2267} {"train_loss": -6.465322971343994, "global_step": 95251, "epoch": 2267} {"train_loss": -6.376655578613281, "global_step": 95252, "epoch": 2267} {"train_loss": -6.276123046875, "global_step": 95253, "epoch": 2267} {"train_loss": -6.289287567138672, "global_step": 95254, "epoch": 2267} {"train_loss": -6.304422060648601, "global_step": 95255, "epoch": 2267, "val_loss": 68070.3984375} {"train_loss": -6.26239013671875, "global_step": 95256, "epoch": 2268} {"train_loss": -6.449957847595215, "global_step": 95257, "epoch": 2268} {"train_loss": -6.416540145874023, "global_step": 95258, "epoch": 2268} {"train_loss": -6.281355857849121, "global_step": 95259, "epoch": 2268} {"train_loss": -6.356266498565674, "global_step": 95260, "epoch": 2268} {"train_loss": -6.3844194412231445, "global_step": 95261, "epoch": 2268} {"train_loss": -6.19731330871582, "global_step": 95262, "epoch": 2268} {"train_loss": -6.195209503173828, "global_step": 95263, "epoch": 2268} {"train_loss": -6.268839359283447, "global_step": 95264, "epoch": 2268} {"train_loss": -6.206034183502197, "global_step": 95265, "epoch": 2268} {"train_loss": -6.282684803009033, "global_step": 95266, "epoch": 2268} {"train_loss": -6.3496856689453125, "global_step": 95267, "epoch": 2268} {"train_loss": -6.224271297454834, "global_step": 95268, "epoch": 2268} {"train_loss": -6.249856948852539, "global_step": 95269, "epoch": 2268} {"train_loss": -6.16531229019165, "global_step": 95270, "epoch": 2268} {"train_loss": -6.152929782867432, "global_step": 95271, "epoch": 2268} {"train_loss": -6.357996940612793, "global_step": 95272, "epoch": 2268} {"train_loss": -6.398809909820557, "global_step": 95273, "epoch": 2268} {"train_loss": -6.330785751342773, "global_step": 95274, "epoch": 2268} {"train_loss": -6.207675933837891, "global_step": 95275, "epoch": 2268} {"train_loss": -6.304658889770508, "global_step": 95276, "epoch": 2268} {"train_loss": -6.37673282623291, "global_step": 95277, "epoch": 2268} {"train_loss": -6.186384201049805, "global_step": 95278, "epoch": 2268} {"train_loss": -6.3368635177612305, "global_step": 95279, "epoch": 2268} {"train_loss": -6.3931989669799805, "global_step": 95280, "epoch": 2268} {"train_loss": -6.237890720367432, "global_step": 95281, "epoch": 2268} {"train_loss": -6.1861162185668945, "global_step": 95282, "epoch": 2268} {"train_loss": -6.326967239379883, "global_step": 95283, "epoch": 2268} {"train_loss": -6.321449279785156, "global_step": 95284, "epoch": 2268} {"train_loss": -6.338191986083984, "global_step": 95285, "epoch": 2268} {"train_loss": -6.254632472991943, "global_step": 95286, "epoch": 2268} {"train_loss": -6.410475730895996, "global_step": 95287, "epoch": 2268} {"train_loss": -6.325507164001465, "global_step": 95288, "epoch": 2268} {"train_loss": -6.294910907745361, "global_step": 95289, "epoch": 2268} {"train_loss": -6.232117176055908, "global_step": 95290, "epoch": 2268} {"train_loss": -6.390872955322266, "global_step": 95291, "epoch": 2268} {"train_loss": -6.219874858856201, "global_step": 95292, "epoch": 2268} {"train_loss": -6.337893486022949, "global_step": 95293, "epoch": 2268} {"train_loss": -6.278076648712158, "global_step": 95294, "epoch": 2268} {"train_loss": -6.286861419677734, "global_step": 95295, "epoch": 2268} {"train_loss": -6.324404716491699, "global_step": 95296, "epoch": 2268} {"train_loss": -6.296743960607619, "global_step": 95297, "epoch": 2268, "val_loss": 67927.515625} {"train_loss": -6.210749626159668, "global_step": 95298, "epoch": 2269} {"train_loss": -6.25676965713501, "global_step": 95299, "epoch": 2269} {"train_loss": -6.385379791259766, "global_step": 95300, "epoch": 2269} {"train_loss": -6.290441989898682, "global_step": 95301, "epoch": 2269} {"train_loss": -6.218671798706055, "global_step": 95302, "epoch": 2269} {"train_loss": -6.32951021194458, "global_step": 95303, "epoch": 2269} {"train_loss": -6.286607265472412, "global_step": 95304, "epoch": 2269} {"train_loss": -6.170041084289551, "global_step": 95305, "epoch": 2269} {"train_loss": -6.376559734344482, "global_step": 95306, "epoch": 2269} {"train_loss": -6.313299179077148, "global_step": 95307, "epoch": 2269} {"train_loss": -6.308908462524414, "global_step": 95308, "epoch": 2269} {"train_loss": -6.312733173370361, "global_step": 95309, "epoch": 2269} {"train_loss": -6.243195533752441, "global_step": 95310, "epoch": 2269} {"train_loss": -6.163204193115234, "global_step": 95311, "epoch": 2269} {"train_loss": -6.2572736740112305, "global_step": 95312, "epoch": 2269} {"train_loss": -6.195675849914551, "global_step": 95313, "epoch": 2269} {"train_loss": -6.394844055175781, "global_step": 95314, "epoch": 2269} {"train_loss": -6.200467586517334, "global_step": 95315, "epoch": 2269} {"train_loss": -6.223116397857666, "global_step": 95316, "epoch": 2269} {"train_loss": -6.350085258483887, "global_step": 95317, "epoch": 2269} {"train_loss": -6.310408592224121, "global_step": 95318, "epoch": 2269} {"train_loss": -6.271205902099609, "global_step": 95319, "epoch": 2269} {"train_loss": -6.284162521362305, "global_step": 95320, "epoch": 2269} {"train_loss": -6.307222366333008, "global_step": 95321, "epoch": 2269} {"train_loss": -6.28384256362915, "global_step": 95322, "epoch": 2269} {"train_loss": -6.24843692779541, "global_step": 95323, "epoch": 2269} {"train_loss": -6.291900634765625, "global_step": 95324, "epoch": 2269} {"train_loss": -6.33564567565918, "global_step": 95325, "epoch": 2269} {"train_loss": -6.3482346534729, "global_step": 95326, "epoch": 2269} {"train_loss": -6.293184280395508, "global_step": 95327, "epoch": 2269} {"train_loss": -6.229938983917236, "global_step": 95328, "epoch": 2269} {"train_loss": -6.2501678466796875, "global_step": 95329, "epoch": 2269} {"train_loss": -6.242730140686035, "global_step": 95330, "epoch": 2269} {"train_loss": -6.3554182052612305, "global_step": 95331, "epoch": 2269} {"train_loss": -6.318345546722412, "global_step": 95332, "epoch": 2269} {"train_loss": -6.255417823791504, "global_step": 95333, "epoch": 2269} {"train_loss": -6.356154441833496, "global_step": 95334, "epoch": 2269} {"train_loss": -6.157376289367676, "global_step": 95335, "epoch": 2269} {"train_loss": -6.300660610198975, "global_step": 95336, "epoch": 2269} {"train_loss": -6.381811618804932, "global_step": 95337, "epoch": 2269} {"train_loss": -6.317692279815674, "global_step": 95338, "epoch": 2269} {"train_loss": -6.283637728009905, "global_step": 95339, "epoch": 2269, "val_loss": 67817.0546875} {"train_loss": -6.235072135925293, "global_step": 95340, "epoch": 2270} {"train_loss": -6.300970554351807, "global_step": 95341, "epoch": 2270} {"train_loss": -6.345267295837402, "global_step": 95342, "epoch": 2270} {"train_loss": -6.404274940490723, "global_step": 95343, "epoch": 2270} {"train_loss": -6.2883758544921875, "global_step": 95344, "epoch": 2270} {"train_loss": -6.399628639221191, "global_step": 95345, "epoch": 2270} {"train_loss": -6.346792221069336, "global_step": 95346, "epoch": 2270} {"train_loss": -6.350237846374512, "global_step": 95347, "epoch": 2270} {"train_loss": -6.356419563293457, "global_step": 95348, "epoch": 2270} {"train_loss": -6.412360191345215, "global_step": 95349, "epoch": 2270} {"train_loss": -6.344648361206055, "global_step": 95350, "epoch": 2270} {"train_loss": -6.279061794281006, "global_step": 95351, "epoch": 2270} {"train_loss": -6.238000869750977, "global_step": 95352, "epoch": 2270} {"train_loss": -6.360618591308594, "global_step": 95353, "epoch": 2270} {"train_loss": -6.3116254806518555, "global_step": 95354, "epoch": 2270} {"train_loss": -6.164545059204102, "global_step": 95355, "epoch": 2270} {"train_loss": -6.328630447387695, "global_step": 95356, "epoch": 2270} {"train_loss": -6.385332107543945, "global_step": 95357, "epoch": 2270} {"train_loss": -6.29759407043457, "global_step": 95358, "epoch": 2270} {"train_loss": -6.346988677978516, "global_step": 95359, "epoch": 2270} {"train_loss": -6.220548629760742, "global_step": 95360, "epoch": 2270} {"train_loss": -6.420016765594482, "global_step": 95361, "epoch": 2270} {"train_loss": -6.347269535064697, "global_step": 95362, "epoch": 2270} {"train_loss": -6.308353900909424, "global_step": 95363, "epoch": 2270} {"train_loss": -6.329484939575195, "global_step": 95364, "epoch": 2270} {"train_loss": -6.172673225402832, "global_step": 95365, "epoch": 2270} {"train_loss": -6.237576484680176, "global_step": 95366, "epoch": 2270} {"train_loss": -6.424881935119629, "global_step": 95367, "epoch": 2270} {"train_loss": -6.192039489746094, "global_step": 95368, "epoch": 2270} {"train_loss": -6.205948829650879, "global_step": 95369, "epoch": 2270} {"train_loss": -6.30048942565918, "global_step": 95370, "epoch": 2270} {"train_loss": -6.211540222167969, "global_step": 95371, "epoch": 2270} {"train_loss": -6.278395652770996, "global_step": 95372, "epoch": 2270} {"train_loss": -6.200463771820068, "global_step": 95373, "epoch": 2270} {"train_loss": -6.123960971832275, "global_step": 95374, "epoch": 2270} {"train_loss": -6.2399396896362305, "global_step": 95375, "epoch": 2270} {"train_loss": -6.2509942054748535, "global_step": 95376, "epoch": 2270} {"train_loss": -6.205975532531738, "global_step": 95377, "epoch": 2270} {"train_loss": -6.2248029708862305, "global_step": 95378, "epoch": 2270} {"train_loss": -6.238491058349609, "global_step": 95379, "epoch": 2270} {"train_loss": -6.3197832107543945, "global_step": 95380, "epoch": 2270} {"train_loss": -6.292979808080764, "global_step": 95381, "epoch": 2270, "val_loss": 68074.140625} {"train_loss": -6.365373134613037, "global_step": 95382, "epoch": 2271} {"train_loss": -6.317481517791748, "global_step": 95383, "epoch": 2271} {"train_loss": -6.2472639083862305, "global_step": 95384, "epoch": 2271} {"train_loss": -6.181625843048096, "global_step": 95385, "epoch": 2271} {"train_loss": -6.333929061889648, "global_step": 95386, "epoch": 2271} {"train_loss": -6.303267955780029, "global_step": 95387, "epoch": 2271} {"train_loss": -6.282793045043945, "global_step": 95388, "epoch": 2271} {"train_loss": -6.273391246795654, "global_step": 95389, "epoch": 2271} {"train_loss": -6.320705413818359, "global_step": 95390, "epoch": 2271} {"train_loss": -6.215383529663086, "global_step": 95391, "epoch": 2271} {"train_loss": -6.226888179779053, "global_step": 95392, "epoch": 2271} {"train_loss": -6.267111778259277, "global_step": 95393, "epoch": 2271} {"train_loss": -6.298178672790527, "global_step": 95394, "epoch": 2271} {"train_loss": -6.3020124435424805, "global_step": 95395, "epoch": 2271} {"train_loss": -6.278403282165527, "global_step": 95396, "epoch": 2271} {"train_loss": -6.3279829025268555, "global_step": 95397, "epoch": 2271} {"train_loss": -6.248497009277344, "global_step": 95398, "epoch": 2271} {"train_loss": -6.270652770996094, "global_step": 95399, "epoch": 2271} {"train_loss": -6.296565055847168, "global_step": 95400, "epoch": 2271} {"train_loss": -6.295405864715576, "global_step": 95401, "epoch": 2271} {"train_loss": -6.22092342376709, "global_step": 95402, "epoch": 2271} {"train_loss": -6.286460876464844, "global_step": 95403, "epoch": 2271} {"train_loss": -6.184338569641113, "global_step": 95404, "epoch": 2271} {"train_loss": -6.190918922424316, "global_step": 95405, "epoch": 2271} {"train_loss": -6.2198638916015625, "global_step": 95406, "epoch": 2271} {"train_loss": -6.021547317504883, "global_step": 95407, "epoch": 2271} {"train_loss": -6.18547248840332, "global_step": 95408, "epoch": 2271} {"train_loss": -6.078588008880615, "global_step": 95409, "epoch": 2271} {"train_loss": -6.172513008117676, "global_step": 95410, "epoch": 2271} {"train_loss": -6.067461013793945, "global_step": 95411, "epoch": 2271} {"train_loss": -6.186796188354492, "global_step": 95412, "epoch": 2271} {"train_loss": -6.07459831237793, "global_step": 95413, "epoch": 2271} {"train_loss": -6.163087368011475, "global_step": 95414, "epoch": 2271} {"train_loss": -6.114188194274902, "global_step": 95415, "epoch": 2271} {"train_loss": -6.210622787475586, "global_step": 95416, "epoch": 2271} {"train_loss": -6.224677085876465, "global_step": 95417, "epoch": 2271} {"train_loss": -6.202592372894287, "global_step": 95418, "epoch": 2271} {"train_loss": -6.232871055603027, "global_step": 95419, "epoch": 2271} {"train_loss": -6.2440338134765625, "global_step": 95420, "epoch": 2271} {"train_loss": -6.168396472930908, "global_step": 95421, "epoch": 2271} {"train_loss": -6.197961807250977, "global_step": 95422, "epoch": 2271} {"train_loss": -6.224584681647165, "global_step": 95423, "epoch": 2271, "val_loss": 68151.09375} {"train_loss": -6.30108642578125, "global_step": 95424, "epoch": 2272} {"train_loss": -6.202962875366211, "global_step": 95425, "epoch": 2272} {"train_loss": -6.264923095703125, "global_step": 95426, "epoch": 2272} {"train_loss": -6.236968994140625, "global_step": 95427, "epoch": 2272} {"train_loss": -6.215513229370117, "global_step": 95428, "epoch": 2272} {"train_loss": -6.294037342071533, "global_step": 95429, "epoch": 2272} {"train_loss": -6.356529235839844, "global_step": 95430, "epoch": 2272} {"train_loss": -6.228014945983887, "global_step": 95431, "epoch": 2272} {"train_loss": -6.225103855133057, "global_step": 95432, "epoch": 2272} {"train_loss": -6.242844104766846, "global_step": 95433, "epoch": 2272} {"train_loss": -6.358468055725098, "global_step": 95434, "epoch": 2272} {"train_loss": -6.288388252258301, "global_step": 95435, "epoch": 2272} {"train_loss": -6.352437973022461, "global_step": 95436, "epoch": 2272} {"train_loss": -6.1673784255981445, "global_step": 95437, "epoch": 2272} {"train_loss": -6.316788196563721, "global_step": 95438, "epoch": 2272} {"train_loss": -6.35467529296875, "global_step": 95439, "epoch": 2272} {"train_loss": -6.274707317352295, "global_step": 95440, "epoch": 2272} {"train_loss": -6.169443607330322, "global_step": 95441, "epoch": 2272} {"train_loss": -6.409735679626465, "global_step": 95442, "epoch": 2272} {"train_loss": -6.244167327880859, "global_step": 95443, "epoch": 2272} {"train_loss": -6.331354141235352, "global_step": 95444, "epoch": 2272} {"train_loss": -6.324734687805176, "global_step": 95445, "epoch": 2272} {"train_loss": -6.302570819854736, "global_step": 95446, "epoch": 2272} {"train_loss": -6.330132484436035, "global_step": 95447, "epoch": 2272} {"train_loss": -6.190177917480469, "global_step": 95448, "epoch": 2272} {"train_loss": -6.220945358276367, "global_step": 95449, "epoch": 2272} {"train_loss": -6.269008159637451, "global_step": 95450, "epoch": 2272} {"train_loss": -6.235262870788574, "global_step": 95451, "epoch": 2272} {"train_loss": -6.195009231567383, "global_step": 95452, "epoch": 2272} {"train_loss": -6.313506603240967, "global_step": 95453, "epoch": 2272} {"train_loss": -6.26625919342041, "global_step": 95454, "epoch": 2272} {"train_loss": -6.2984819412231445, "global_step": 95455, "epoch": 2272} {"train_loss": -6.191954612731934, "global_step": 95456, "epoch": 2272} {"train_loss": -6.159446716308594, "global_step": 95457, "epoch": 2272} {"train_loss": -6.370321273803711, "global_step": 95458, "epoch": 2272} {"train_loss": -6.176974296569824, "global_step": 95459, "epoch": 2272} {"train_loss": -6.329947471618652, "global_step": 95460, "epoch": 2272} {"train_loss": -6.2040228843688965, "global_step": 95461, "epoch": 2272} {"train_loss": -6.297272682189941, "global_step": 95462, "epoch": 2272} {"train_loss": -6.203884601593018, "global_step": 95463, "epoch": 2272} {"train_loss": -6.303713798522949, "global_step": 95464, "epoch": 2272} {"train_loss": -6.271138089043753, "global_step": 95465, "epoch": 2272, "val_loss": 67890.3359375} {"train_loss": -6.1792778968811035, "global_step": 95466, "epoch": 2273} {"train_loss": -6.189937114715576, "global_step": 95467, "epoch": 2273} {"train_loss": -6.274940490722656, "global_step": 95468, "epoch": 2273} {"train_loss": -6.282639026641846, "global_step": 95469, "epoch": 2273} {"train_loss": -6.305126190185547, "global_step": 95470, "epoch": 2273} {"train_loss": -6.188607215881348, "global_step": 95471, "epoch": 2273} {"train_loss": -6.346155166625977, "global_step": 95472, "epoch": 2273} {"train_loss": -6.277144432067871, "global_step": 95473, "epoch": 2273} {"train_loss": -6.175824165344238, "global_step": 95474, "epoch": 2273} {"train_loss": -6.2485527992248535, "global_step": 95475, "epoch": 2273} {"train_loss": -6.293694972991943, "global_step": 95476, "epoch": 2273} {"train_loss": -6.23789644241333, "global_step": 95477, "epoch": 2273} {"train_loss": -6.3688154220581055, "global_step": 95478, "epoch": 2273} {"train_loss": -6.4163312911987305, "global_step": 95479, "epoch": 2273} {"train_loss": -6.373384475708008, "global_step": 95480, "epoch": 2273} {"train_loss": -6.225713729858398, "global_step": 95481, "epoch": 2273} {"train_loss": -6.297628402709961, "global_step": 95482, "epoch": 2273} {"train_loss": -6.314964294433594, "global_step": 95483, "epoch": 2273} {"train_loss": -6.260173320770264, "global_step": 95484, "epoch": 2273} {"train_loss": -6.262636184692383, "global_step": 95485, "epoch": 2273} {"train_loss": -6.358367443084717, "global_step": 95486, "epoch": 2273} {"train_loss": -6.224123001098633, "global_step": 95487, "epoch": 2273} {"train_loss": -6.149677276611328, "global_step": 95488, "epoch": 2273} {"train_loss": -6.268546104431152, "global_step": 95489, "epoch": 2273} {"train_loss": -6.3553266525268555, "global_step": 95490, "epoch": 2273} {"train_loss": -6.362621307373047, "global_step": 95491, "epoch": 2273} {"train_loss": -6.297413349151611, "global_step": 95492, "epoch": 2273} {"train_loss": -6.283763885498047, "global_step": 95493, "epoch": 2273} {"train_loss": -6.335521697998047, "global_step": 95494, "epoch": 2273} {"train_loss": -6.34337854385376, "global_step": 95495, "epoch": 2273} {"train_loss": -6.261094570159912, "global_step": 95496, "epoch": 2273} {"train_loss": -6.316978454589844, "global_step": 95497, "epoch": 2273} {"train_loss": -6.363470077514648, "global_step": 95498, "epoch": 2273} {"train_loss": -6.227665424346924, "global_step": 95499, "epoch": 2273} {"train_loss": -6.231258392333984, "global_step": 95500, "epoch": 2273} {"train_loss": -6.295461654663086, "global_step": 95501, "epoch": 2273} {"train_loss": -6.304704189300537, "global_step": 95502, "epoch": 2273} {"train_loss": -6.277451992034912, "global_step": 95503, "epoch": 2273} {"train_loss": -6.304549694061279, "global_step": 95504, "epoch": 2273} {"train_loss": -6.453957557678223, "global_step": 95505, "epoch": 2273} {"train_loss": -6.269509315490723, "global_step": 95506, "epoch": 2273} {"train_loss": -6.288372187387376, "global_step": 95507, "epoch": 2273, "val_loss": 68002.328125} {"train_loss": -6.424788475036621, "global_step": 95508, "epoch": 2274} {"train_loss": -6.167959213256836, "global_step": 95509, "epoch": 2274} {"train_loss": -6.46278190612793, "global_step": 95510, "epoch": 2274} {"train_loss": -6.282400608062744, "global_step": 95511, "epoch": 2274} {"train_loss": -6.389481544494629, "global_step": 95512, "epoch": 2274} {"train_loss": -6.241061687469482, "global_step": 95513, "epoch": 2274} {"train_loss": -6.324016094207764, "global_step": 95514, "epoch": 2274} {"train_loss": -6.439263343811035, "global_step": 95515, "epoch": 2274} {"train_loss": -6.2201385498046875, "global_step": 95516, "epoch": 2274} {"train_loss": -6.379307270050049, "global_step": 95517, "epoch": 2274} {"train_loss": -6.45253849029541, "global_step": 95518, "epoch": 2274} {"train_loss": -6.3022871017456055, "global_step": 95519, "epoch": 2274} {"train_loss": -6.327179908752441, "global_step": 95520, "epoch": 2274} {"train_loss": -6.403887748718262, "global_step": 95521, "epoch": 2274} {"train_loss": -6.492916107177734, "global_step": 95522, "epoch": 2274} {"train_loss": -6.34083890914917, "global_step": 95523, "epoch": 2274} {"train_loss": -6.336308002471924, "global_step": 95524, "epoch": 2274} {"train_loss": -6.328745365142822, "global_step": 95525, "epoch": 2274} {"train_loss": -6.291979789733887, "global_step": 95526, "epoch": 2274} {"train_loss": -6.311667442321777, "global_step": 95527, "epoch": 2274} {"train_loss": -6.3086042404174805, "global_step": 95528, "epoch": 2274} {"train_loss": -6.341296672821045, "global_step": 95529, "epoch": 2274} {"train_loss": -6.3867692947387695, "global_step": 95530, "epoch": 2274} {"train_loss": -6.395047187805176, "global_step": 95531, "epoch": 2274} {"train_loss": -6.296168327331543, "global_step": 95532, "epoch": 2274} {"train_loss": -6.254602432250977, "global_step": 95533, "epoch": 2274} {"train_loss": -6.275130271911621, "global_step": 95534, "epoch": 2274} {"train_loss": -6.249106407165527, "global_step": 95535, "epoch": 2274} {"train_loss": -6.367144584655762, "global_step": 95536, "epoch": 2274} {"train_loss": -6.296680450439453, "global_step": 95537, "epoch": 2274} {"train_loss": -6.2530059814453125, "global_step": 95538, "epoch": 2274} {"train_loss": -6.361695766448975, "global_step": 95539, "epoch": 2274} {"train_loss": -6.40263557434082, "global_step": 95540, "epoch": 2274} {"train_loss": -6.344574928283691, "global_step": 95541, "epoch": 2274} {"train_loss": -6.267433166503906, "global_step": 95542, "epoch": 2274} {"train_loss": -6.3252129554748535, "global_step": 95543, "epoch": 2274} {"train_loss": -6.30216121673584, "global_step": 95544, "epoch": 2274} {"train_loss": -6.3166327476501465, "global_step": 95545, "epoch": 2274} {"train_loss": -6.3587493896484375, "global_step": 95546, "epoch": 2274} {"train_loss": -6.2033610343933105, "global_step": 95547, "epoch": 2274} {"train_loss": -6.450812339782715, "global_step": 95548, "epoch": 2274} {"train_loss": -6.330790394828433, "global_step": 95549, "epoch": 2274, "val_loss": 67798.1953125} {"train_loss": -6.301853179931641, "global_step": 95550, "epoch": 2275} {"train_loss": -6.358360290527344, "global_step": 95551, "epoch": 2275} {"train_loss": -6.317478179931641, "global_step": 95552, "epoch": 2275} {"train_loss": -6.343504905700684, "global_step": 95553, "epoch": 2275} {"train_loss": -6.372028827667236, "global_step": 95554, "epoch": 2275} {"train_loss": -6.336767196655273, "global_step": 95555, "epoch": 2275} {"train_loss": -6.256864547729492, "global_step": 95556, "epoch": 2275} {"train_loss": -6.111584663391113, "global_step": 95557, "epoch": 2275} {"train_loss": -6.251039028167725, "global_step": 95558, "epoch": 2275} {"train_loss": -6.333338737487793, "global_step": 95559, "epoch": 2275} {"train_loss": -6.392678737640381, "global_step": 95560, "epoch": 2275} {"train_loss": -6.316439628601074, "global_step": 95561, "epoch": 2275} {"train_loss": -6.3461198806762695, "global_step": 95562, "epoch": 2275} {"train_loss": -6.259828567504883, "global_step": 95563, "epoch": 2275} {"train_loss": -6.146889686584473, "global_step": 95564, "epoch": 2275} {"train_loss": -6.227987289428711, "global_step": 95565, "epoch": 2275} {"train_loss": -6.254810333251953, "global_step": 95566, "epoch": 2275} {"train_loss": -6.18668794631958, "global_step": 95567, "epoch": 2275} {"train_loss": -6.178187370300293, "global_step": 95568, "epoch": 2275} {"train_loss": -6.261946678161621, "global_step": 95569, "epoch": 2275} {"train_loss": -6.29867696762085, "global_step": 95570, "epoch": 2275} {"train_loss": -6.244904041290283, "global_step": 95571, "epoch": 2275} {"train_loss": -6.308285236358643, "global_step": 95572, "epoch": 2275} {"train_loss": -6.121205806732178, "global_step": 95573, "epoch": 2275} {"train_loss": -6.231495380401611, "global_step": 95574, "epoch": 2275} {"train_loss": -6.208850860595703, "global_step": 95575, "epoch": 2275} {"train_loss": -6.416621208190918, "global_step": 95576, "epoch": 2275} {"train_loss": -6.247588634490967, "global_step": 95577, "epoch": 2275} {"train_loss": -6.3228960037231445, "global_step": 95578, "epoch": 2275} {"train_loss": -6.361163139343262, "global_step": 95579, "epoch": 2275} {"train_loss": -6.136661529541016, "global_step": 95580, "epoch": 2275} {"train_loss": -6.332276344299316, "global_step": 95581, "epoch": 2275} {"train_loss": -6.164994239807129, "global_step": 95582, "epoch": 2275} {"train_loss": -6.286846160888672, "global_step": 95583, "epoch": 2275} {"train_loss": -6.236632347106934, "global_step": 95584, "epoch": 2275} {"train_loss": -6.261915683746338, "global_step": 95585, "epoch": 2275} {"train_loss": -6.268644332885742, "global_step": 95586, "epoch": 2275} {"train_loss": -6.360842704772949, "global_step": 95587, "epoch": 2275} {"train_loss": -6.077671051025391, "global_step": 95588, "epoch": 2275} {"train_loss": -6.247010707855225, "global_step": 95589, "epoch": 2275} {"train_loss": -6.2951579093933105, "global_step": 95590, "epoch": 2275} {"train_loss": -6.268387453896659, "global_step": 95591, "epoch": 2275, "val_loss": 67993.1953125} {"train_loss": -6.222245693206787, "global_step": 95592, "epoch": 2276} {"train_loss": -6.280972957611084, "global_step": 95593, "epoch": 2276} {"train_loss": -6.203735828399658, "global_step": 95594, "epoch": 2276} {"train_loss": -6.271723747253418, "global_step": 95595, "epoch": 2276} {"train_loss": -6.296796798706055, "global_step": 95596, "epoch": 2276} {"train_loss": -6.284965515136719, "global_step": 95597, "epoch": 2276} {"train_loss": -6.188752174377441, "global_step": 95598, "epoch": 2276} {"train_loss": -6.314018249511719, "global_step": 95599, "epoch": 2276} {"train_loss": -6.139305114746094, "global_step": 95600, "epoch": 2276} {"train_loss": -6.318253993988037, "global_step": 95601, "epoch": 2276} {"train_loss": -6.326162338256836, "global_step": 95602, "epoch": 2276} {"train_loss": -6.068141937255859, "global_step": 95603, "epoch": 2276} {"train_loss": -6.287199020385742, "global_step": 95604, "epoch": 2276} {"train_loss": -6.11128044128418, "global_step": 95605, "epoch": 2276} {"train_loss": -6.224297523498535, "global_step": 95606, "epoch": 2276} {"train_loss": -6.251251697540283, "global_step": 95607, "epoch": 2276} {"train_loss": -6.191608905792236, "global_step": 95608, "epoch": 2276} {"train_loss": -6.268702983856201, "global_step": 95609, "epoch": 2276} {"train_loss": -6.360929489135742, "global_step": 95610, "epoch": 2276} {"train_loss": -6.2150559425354, "global_step": 95611, "epoch": 2276} {"train_loss": -6.335061073303223, "global_step": 95612, "epoch": 2276} {"train_loss": -6.212913513183594, "global_step": 95613, "epoch": 2276} {"train_loss": -6.3854570388793945, "global_step": 95614, "epoch": 2276} {"train_loss": -6.245430946350098, "global_step": 95615, "epoch": 2276} {"train_loss": -6.351787090301514, "global_step": 95616, "epoch": 2276} {"train_loss": -6.301463603973389, "global_step": 95617, "epoch": 2276} {"train_loss": -6.244534492492676, "global_step": 95618, "epoch": 2276} {"train_loss": -6.264767169952393, "global_step": 95619, "epoch": 2276} {"train_loss": -6.238230228424072, "global_step": 95620, "epoch": 2276} {"train_loss": -6.344232559204102, "global_step": 95621, "epoch": 2276} {"train_loss": -6.20515775680542, "global_step": 95622, "epoch": 2276} {"train_loss": -6.3310136795043945, "global_step": 95623, "epoch": 2276} {"train_loss": -6.333892822265625, "global_step": 95624, "epoch": 2276} {"train_loss": -6.333049774169922, "global_step": 95625, "epoch": 2276} {"train_loss": -6.192644119262695, "global_step": 95626, "epoch": 2276} {"train_loss": -6.170583724975586, "global_step": 95627, "epoch": 2276} {"train_loss": -6.403655052185059, "global_step": 95628, "epoch": 2276} {"train_loss": -6.315910816192627, "global_step": 95629, "epoch": 2276} {"train_loss": -6.245889663696289, "global_step": 95630, "epoch": 2276} {"train_loss": -6.259252548217773, "global_step": 95631, "epoch": 2276} {"train_loss": -6.24897575378418, "global_step": 95632, "epoch": 2276} {"train_loss": -6.264061950501942, "global_step": 95633, "epoch": 2276, "val_loss": 67828.015625} {"train_loss": -6.31782341003418, "global_step": 95634, "epoch": 2277} {"train_loss": -6.186563491821289, "global_step": 95635, "epoch": 2277} {"train_loss": -6.235784530639648, "global_step": 95636, "epoch": 2277} {"train_loss": -6.275091648101807, "global_step": 95637, "epoch": 2277} {"train_loss": -6.223791122436523, "global_step": 95638, "epoch": 2277} {"train_loss": -6.292097091674805, "global_step": 95639, "epoch": 2277} {"train_loss": -6.2178568840026855, "global_step": 95640, "epoch": 2277} {"train_loss": -6.344704627990723, "global_step": 95641, "epoch": 2277} {"train_loss": -6.2889580726623535, "global_step": 95642, "epoch": 2277} {"train_loss": -6.229082107543945, "global_step": 95643, "epoch": 2277} {"train_loss": -6.3928608894348145, "global_step": 95644, "epoch": 2277} {"train_loss": -6.231226921081543, "global_step": 95645, "epoch": 2277} {"train_loss": -6.265859603881836, "global_step": 95646, "epoch": 2277} {"train_loss": -6.345512390136719, "global_step": 95647, "epoch": 2277} {"train_loss": -6.348505973815918, "global_step": 95648, "epoch": 2277} {"train_loss": -6.305484294891357, "global_step": 95649, "epoch": 2277} {"train_loss": -6.342432498931885, "global_step": 95650, "epoch": 2277} {"train_loss": -6.2691144943237305, "global_step": 95651, "epoch": 2277} {"train_loss": -6.296350479125977, "global_step": 95652, "epoch": 2277} {"train_loss": -6.301907539367676, "global_step": 95653, "epoch": 2277} {"train_loss": -6.376182556152344, "global_step": 95654, "epoch": 2277} {"train_loss": -6.244224548339844, "global_step": 95655, "epoch": 2277} {"train_loss": -6.296540260314941, "global_step": 95656, "epoch": 2277} {"train_loss": -6.187507152557373, "global_step": 95657, "epoch": 2277} {"train_loss": -6.349651336669922, "global_step": 95658, "epoch": 2277} {"train_loss": -6.194584846496582, "global_step": 95659, "epoch": 2277} {"train_loss": -6.324123382568359, "global_step": 95660, "epoch": 2277} {"train_loss": -6.260629177093506, "global_step": 95661, "epoch": 2277} {"train_loss": -6.387114524841309, "global_step": 95662, "epoch": 2277} {"train_loss": -6.311979293823242, "global_step": 95663, "epoch": 2277} {"train_loss": -6.272320747375488, "global_step": 95664, "epoch": 2277} {"train_loss": -6.299729347229004, "global_step": 95665, "epoch": 2277} {"train_loss": -6.356069087982178, "global_step": 95666, "epoch": 2277} {"train_loss": -6.2638468742370605, "global_step": 95667, "epoch": 2277} {"train_loss": -6.240194797515869, "global_step": 95668, "epoch": 2277} {"train_loss": -6.397783279418945, "global_step": 95669, "epoch": 2277} {"train_loss": -6.366611480712891, "global_step": 95670, "epoch": 2277} {"train_loss": -6.355494499206543, "global_step": 95671, "epoch": 2277} {"train_loss": -6.431668758392334, "global_step": 95672, "epoch": 2277} {"train_loss": -6.357834815979004, "global_step": 95673, "epoch": 2277} {"train_loss": -6.323307991027832, "global_step": 95674, "epoch": 2277} {"train_loss": -6.302877687272572, "global_step": 95675, "epoch": 2277, "val_loss": 67787.3984375} {"train_loss": -6.239408493041992, "global_step": 95676, "epoch": 2278} {"train_loss": -6.225709915161133, "global_step": 95677, "epoch": 2278} {"train_loss": -6.386600971221924, "global_step": 95678, "epoch": 2278} {"train_loss": -6.365819454193115, "global_step": 95679, "epoch": 2278} {"train_loss": -6.313436985015869, "global_step": 95680, "epoch": 2278} {"train_loss": -6.3660454750061035, "global_step": 95681, "epoch": 2278} {"train_loss": -6.365690231323242, "global_step": 95682, "epoch": 2278} {"train_loss": -6.36232852935791, "global_step": 95683, "epoch": 2278} {"train_loss": -6.349886894226074, "global_step": 95684, "epoch": 2278} {"train_loss": -6.3225250244140625, "global_step": 95685, "epoch": 2278} {"train_loss": -6.185146331787109, "global_step": 95686, "epoch": 2278} {"train_loss": -6.352564811706543, "global_step": 95687, "epoch": 2278} {"train_loss": -6.340964317321777, "global_step": 95688, "epoch": 2278} {"train_loss": -6.245481491088867, "global_step": 95689, "epoch": 2278} {"train_loss": -6.20345401763916, "global_step": 95690, "epoch": 2278} {"train_loss": -6.233028411865234, "global_step": 95691, "epoch": 2278} {"train_loss": -6.241405963897705, "global_step": 95692, "epoch": 2278} {"train_loss": -6.2332916259765625, "global_step": 95693, "epoch": 2278} {"train_loss": -6.266883373260498, "global_step": 95694, "epoch": 2278} {"train_loss": -6.196739196777344, "global_step": 95695, "epoch": 2278} {"train_loss": -6.184812068939209, "global_step": 95696, "epoch": 2278} {"train_loss": -6.282814979553223, "global_step": 95697, "epoch": 2278} {"train_loss": -6.239001274108887, "global_step": 95698, "epoch": 2278} {"train_loss": -6.305999755859375, "global_step": 95699, "epoch": 2278} {"train_loss": -6.367439270019531, "global_step": 95700, "epoch": 2278} {"train_loss": -6.304862976074219, "global_step": 95701, "epoch": 2278} {"train_loss": -6.328868865966797, "global_step": 95702, "epoch": 2278} {"train_loss": -6.37938117980957, "global_step": 95703, "epoch": 2278} {"train_loss": -6.304081916809082, "global_step": 95704, "epoch": 2278} {"train_loss": -6.228135585784912, "global_step": 95705, "epoch": 2278} {"train_loss": -6.428163051605225, "global_step": 95706, "epoch": 2278} {"train_loss": -6.280289649963379, "global_step": 95707, "epoch": 2278} {"train_loss": -6.232458591461182, "global_step": 95708, "epoch": 2278} {"train_loss": -6.267735004425049, "global_step": 95709, "epoch": 2278} {"train_loss": -6.2338151931762695, "global_step": 95710, "epoch": 2278} {"train_loss": -6.272684574127197, "global_step": 95711, "epoch": 2278} {"train_loss": -6.303194522857666, "global_step": 95712, "epoch": 2278} {"train_loss": -6.190540313720703, "global_step": 95713, "epoch": 2278} {"train_loss": -6.24764347076416, "global_step": 95714, "epoch": 2278} {"train_loss": -6.411539077758789, "global_step": 95715, "epoch": 2278} {"train_loss": -6.377677917480469, "global_step": 95716, "epoch": 2278} {"train_loss": -6.292930580320812, "global_step": 95717, "epoch": 2278, "val_loss": 67983.171875} {"train_loss": -6.402200222015381, "global_step": 95718, "epoch": 2279} {"train_loss": -6.288240909576416, "global_step": 95719, "epoch": 2279} {"train_loss": -6.287076473236084, "global_step": 95720, "epoch": 2279} {"train_loss": -6.277132511138916, "global_step": 95721, "epoch": 2279} {"train_loss": -6.237767219543457, "global_step": 95722, "epoch": 2279} {"train_loss": -6.287259578704834, "global_step": 95723, "epoch": 2279} {"train_loss": -6.304193496704102, "global_step": 95724, "epoch": 2279} {"train_loss": -6.334061622619629, "global_step": 95725, "epoch": 2279} {"train_loss": -6.204408645629883, "global_step": 95726, "epoch": 2279} {"train_loss": -6.323078155517578, "global_step": 95727, "epoch": 2279} {"train_loss": -6.329458236694336, "global_step": 95728, "epoch": 2279} {"train_loss": -6.301638603210449, "global_step": 95729, "epoch": 2279} {"train_loss": -6.3305983543396, "global_step": 95730, "epoch": 2279} {"train_loss": -6.341530799865723, "global_step": 95731, "epoch": 2279} {"train_loss": -6.318472862243652, "global_step": 95732, "epoch": 2279} {"train_loss": -6.212269306182861, "global_step": 95733, "epoch": 2279} {"train_loss": -6.316062927246094, "global_step": 95734, "epoch": 2279} {"train_loss": -6.322016716003418, "global_step": 95735, "epoch": 2279} {"train_loss": -6.2822160720825195, "global_step": 95736, "epoch": 2279} {"train_loss": -6.271065711975098, "global_step": 95737, "epoch": 2279} {"train_loss": -6.296294212341309, "global_step": 95738, "epoch": 2279} {"train_loss": -6.319904327392578, "global_step": 95739, "epoch": 2279} {"train_loss": -6.372439384460449, "global_step": 95740, "epoch": 2279} {"train_loss": -6.269611358642578, "global_step": 95741, "epoch": 2279} {"train_loss": -6.219749450683594, "global_step": 95742, "epoch": 2279} {"train_loss": -6.202558517456055, "global_step": 95743, "epoch": 2279} {"train_loss": -6.168020248413086, "global_step": 95744, "epoch": 2279} {"train_loss": -6.352613925933838, "global_step": 95745, "epoch": 2279} {"train_loss": -6.089052200317383, "global_step": 95746, "epoch": 2279} {"train_loss": -6.300410270690918, "global_step": 95747, "epoch": 2279} {"train_loss": -6.159825801849365, "global_step": 95748, "epoch": 2279} {"train_loss": -6.331153869628906, "global_step": 95749, "epoch": 2279} {"train_loss": -6.26322078704834, "global_step": 95750, "epoch": 2279} {"train_loss": -6.251797199249268, "global_step": 95751, "epoch": 2279} {"train_loss": -6.280981063842773, "global_step": 95752, "epoch": 2279} {"train_loss": -6.227670669555664, "global_step": 95753, "epoch": 2279} {"train_loss": -6.368762969970703, "global_step": 95754, "epoch": 2279} {"train_loss": -6.384593486785889, "global_step": 95755, "epoch": 2279} {"train_loss": -6.269174575805664, "global_step": 95756, "epoch": 2279} {"train_loss": -6.320788383483887, "global_step": 95757, "epoch": 2279} {"train_loss": -6.291247367858887, "global_step": 95758, "epoch": 2279} {"train_loss": -6.284316585177467, "global_step": 95759, "epoch": 2279, "val_loss": 67784.4609375} {"train_loss": -6.383785247802734, "global_step": 95760, "epoch": 2280} {"train_loss": -6.2882890701293945, "global_step": 95761, "epoch": 2280} {"train_loss": -6.29841423034668, "global_step": 95762, "epoch": 2280} {"train_loss": -6.272663593292236, "global_step": 95763, "epoch": 2280} {"train_loss": -6.3871636390686035, "global_step": 95764, "epoch": 2280} {"train_loss": -6.347882270812988, "global_step": 95765, "epoch": 2280} {"train_loss": -6.325339317321777, "global_step": 95766, "epoch": 2280} {"train_loss": -6.336985111236572, "global_step": 95767, "epoch": 2280} {"train_loss": -6.271392822265625, "global_step": 95768, "epoch": 2280} {"train_loss": -6.3612189292907715, "global_step": 95769, "epoch": 2280} {"train_loss": -6.28623104095459, "global_step": 95770, "epoch": 2280} {"train_loss": -6.350166320800781, "global_step": 95771, "epoch": 2280} {"train_loss": -6.351061820983887, "global_step": 95772, "epoch": 2280} {"train_loss": -6.284038543701172, "global_step": 95773, "epoch": 2280} {"train_loss": -6.295754909515381, "global_step": 95774, "epoch": 2280} {"train_loss": -6.255612373352051, "global_step": 95775, "epoch": 2280} {"train_loss": -6.288877010345459, "global_step": 95776, "epoch": 2280} {"train_loss": -6.340788841247559, "global_step": 95777, "epoch": 2280} {"train_loss": -6.332857131958008, "global_step": 95778, "epoch": 2280} {"train_loss": -6.367685794830322, "global_step": 95779, "epoch": 2280} {"train_loss": -6.377532005310059, "global_step": 95780, "epoch": 2280} {"train_loss": -6.260708808898926, "global_step": 95781, "epoch": 2280} {"train_loss": -6.268085956573486, "global_step": 95782, "epoch": 2280} {"train_loss": -6.300039768218994, "global_step": 95783, "epoch": 2280} {"train_loss": -6.326360702514648, "global_step": 95784, "epoch": 2280} {"train_loss": -6.261802673339844, "global_step": 95785, "epoch": 2280} {"train_loss": -6.276758670806885, "global_step": 95786, "epoch": 2280} {"train_loss": -6.369028091430664, "global_step": 95787, "epoch": 2280} {"train_loss": -6.346880912780762, "global_step": 95788, "epoch": 2280} {"train_loss": -6.357436180114746, "global_step": 95789, "epoch": 2280} {"train_loss": -6.300864219665527, "global_step": 95790, "epoch": 2280} {"train_loss": -6.3722310066223145, "global_step": 95791, "epoch": 2280} {"train_loss": -6.425315856933594, "global_step": 95792, "epoch": 2280} {"train_loss": -6.358044147491455, "global_step": 95793, "epoch": 2280} {"train_loss": -6.29794454574585, "global_step": 95794, "epoch": 2280} {"train_loss": -6.393074989318848, "global_step": 95795, "epoch": 2280} {"train_loss": -6.2799248695373535, "global_step": 95796, "epoch": 2280} {"train_loss": -6.281939506530762, "global_step": 95797, "epoch": 2280} {"train_loss": -6.403688430786133, "global_step": 95798, "epoch": 2280} {"train_loss": -6.380916118621826, "global_step": 95799, "epoch": 2280} {"train_loss": -6.230495452880859, "global_step": 95800, "epoch": 2280} {"train_loss": -6.325579086939494, "global_step": 95801, "epoch": 2280, "val_loss": 67774.2578125} {"train_loss": -6.419166088104248, "global_step": 95802, "epoch": 2281} {"train_loss": -6.368134498596191, "global_step": 95803, "epoch": 2281} {"train_loss": -6.327624320983887, "global_step": 95804, "epoch": 2281} {"train_loss": -6.286686897277832, "global_step": 95805, "epoch": 2281} {"train_loss": -6.248055458068848, "global_step": 95806, "epoch": 2281} {"train_loss": -6.371515274047852, "global_step": 95807, "epoch": 2281} {"train_loss": -6.305314064025879, "global_step": 95808, "epoch": 2281} {"train_loss": -6.303886413574219, "global_step": 95809, "epoch": 2281} {"train_loss": -6.298069477081299, "global_step": 95810, "epoch": 2281} {"train_loss": -6.24299430847168, "global_step": 95811, "epoch": 2281} {"train_loss": -6.38822078704834, "global_step": 95812, "epoch": 2281} {"train_loss": -6.2645263671875, "global_step": 95813, "epoch": 2281} {"train_loss": -6.323112487792969, "global_step": 95814, "epoch": 2281} {"train_loss": -6.289938449859619, "global_step": 95815, "epoch": 2281} {"train_loss": -6.249210834503174, "global_step": 95816, "epoch": 2281} {"train_loss": -6.3009185791015625, "global_step": 95817, "epoch": 2281} {"train_loss": -6.369561195373535, "global_step": 95818, "epoch": 2281} {"train_loss": -6.310871124267578, "global_step": 95819, "epoch": 2281} {"train_loss": -6.394455909729004, "global_step": 95820, "epoch": 2281} {"train_loss": -6.28292179107666, "global_step": 95821, "epoch": 2281} {"train_loss": -6.330073356628418, "global_step": 95822, "epoch": 2281} {"train_loss": -6.204734802246094, "global_step": 95823, "epoch": 2281} {"train_loss": -6.209488868713379, "global_step": 95824, "epoch": 2281} {"train_loss": -6.283320426940918, "global_step": 95825, "epoch": 2281} {"train_loss": -6.242696285247803, "global_step": 95826, "epoch": 2281} {"train_loss": -6.298802852630615, "global_step": 95827, "epoch": 2281} {"train_loss": -6.259901523590088, "global_step": 95828, "epoch": 2281} {"train_loss": -6.185122966766357, "global_step": 95829, "epoch": 2281} {"train_loss": -6.406745910644531, "global_step": 95830, "epoch": 2281} {"train_loss": -6.378620147705078, "global_step": 95831, "epoch": 2281} {"train_loss": -6.328396797180176, "global_step": 95832, "epoch": 2281} {"train_loss": -6.301755905151367, "global_step": 95833, "epoch": 2281} {"train_loss": -6.251902103424072, "global_step": 95834, "epoch": 2281} {"train_loss": -6.303132057189941, "global_step": 95835, "epoch": 2281} {"train_loss": -6.391828536987305, "global_step": 95836, "epoch": 2281} {"train_loss": -6.300705909729004, "global_step": 95837, "epoch": 2281} {"train_loss": -6.2343430519104, "global_step": 95838, "epoch": 2281} {"train_loss": -6.332880020141602, "global_step": 95839, "epoch": 2281} {"train_loss": -6.235463619232178, "global_step": 95840, "epoch": 2281} {"train_loss": -6.188796520233154, "global_step": 95841, "epoch": 2281} {"train_loss": -6.267951011657715, "global_step": 95842, "epoch": 2281} {"train_loss": -6.2989726066589355, "global_step": 95843, "epoch": 2281, "val_loss": 67885.3125} {"train_loss": -6.399831771850586, "global_step": 95844, "epoch": 2282} {"train_loss": -6.3341240882873535, "global_step": 95845, "epoch": 2282} {"train_loss": -6.270354747772217, "global_step": 95846, "epoch": 2282} {"train_loss": -6.301233768463135, "global_step": 95847, "epoch": 2282} {"train_loss": -6.276165008544922, "global_step": 95848, "epoch": 2282} {"train_loss": -6.3740034103393555, "global_step": 95849, "epoch": 2282} {"train_loss": -6.4331865310668945, "global_step": 95850, "epoch": 2282} {"train_loss": -6.323054313659668, "global_step": 95851, "epoch": 2282} {"train_loss": -6.24495792388916, "global_step": 95852, "epoch": 2282} {"train_loss": -6.301145076751709, "global_step": 95853, "epoch": 2282} {"train_loss": -6.288975715637207, "global_step": 95854, "epoch": 2282} {"train_loss": -6.307258605957031, "global_step": 95855, "epoch": 2282} {"train_loss": -6.34433650970459, "global_step": 95856, "epoch": 2282} {"train_loss": -6.364802360534668, "global_step": 95857, "epoch": 2282} {"train_loss": -6.36337947845459, "global_step": 95858, "epoch": 2282} {"train_loss": -6.358489513397217, "global_step": 95859, "epoch": 2282} {"train_loss": -6.327825546264648, "global_step": 95860, "epoch": 2282} {"train_loss": -6.280048370361328, "global_step": 95861, "epoch": 2282} {"train_loss": -6.254634857177734, "global_step": 95862, "epoch": 2282} {"train_loss": -6.2486114501953125, "global_step": 95863, "epoch": 2282} {"train_loss": -6.294364929199219, "global_step": 95864, "epoch": 2282} {"train_loss": -6.297500133514404, "global_step": 95865, "epoch": 2282} {"train_loss": -6.274003505706787, "global_step": 95866, "epoch": 2282} {"train_loss": -6.340289115905762, "global_step": 95867, "epoch": 2282} {"train_loss": -6.339282989501953, "global_step": 95868, "epoch": 2282} {"train_loss": -6.224156379699707, "global_step": 95869, "epoch": 2282} {"train_loss": -6.323444843292236, "global_step": 95870, "epoch": 2282} {"train_loss": -6.120937347412109, "global_step": 95871, "epoch": 2282} {"train_loss": -6.243328094482422, "global_step": 95872, "epoch": 2282} {"train_loss": -6.362147808074951, "global_step": 95873, "epoch": 2282} {"train_loss": -6.116528511047363, "global_step": 95874, "epoch": 2282} {"train_loss": -6.179271697998047, "global_step": 95875, "epoch": 2282} {"train_loss": -6.27578067779541, "global_step": 95876, "epoch": 2282} {"train_loss": -6.234482765197754, "global_step": 95877, "epoch": 2282} {"train_loss": -6.274044036865234, "global_step": 95878, "epoch": 2282} {"train_loss": -6.20734167098999, "global_step": 95879, "epoch": 2282} {"train_loss": -6.2718658447265625, "global_step": 95880, "epoch": 2282} {"train_loss": -6.28432559967041, "global_step": 95881, "epoch": 2282} {"train_loss": -6.2734503746032715, "global_step": 95882, "epoch": 2282} {"train_loss": -6.229504585266113, "global_step": 95883, "epoch": 2282} {"train_loss": -6.269887924194336, "global_step": 95884, "epoch": 2282} {"train_loss": -6.287528548921857, "global_step": 95885, "epoch": 2282, "val_loss": 67986.4375} {"train_loss": -6.2904510498046875, "global_step": 95886, "epoch": 2283} {"train_loss": -6.306926250457764, "global_step": 95887, "epoch": 2283} {"train_loss": -6.328795433044434, "global_step": 95888, "epoch": 2283} {"train_loss": -6.250133991241455, "global_step": 95889, "epoch": 2283} {"train_loss": -6.247217178344727, "global_step": 95890, "epoch": 2283} {"train_loss": -6.374303817749023, "global_step": 95891, "epoch": 2283} {"train_loss": -6.14934778213501, "global_step": 95892, "epoch": 2283} {"train_loss": -6.329612731933594, "global_step": 95893, "epoch": 2283} {"train_loss": -6.299701690673828, "global_step": 95894, "epoch": 2283} {"train_loss": -6.233464241027832, "global_step": 95895, "epoch": 2283} {"train_loss": -6.239468574523926, "global_step": 95896, "epoch": 2283} {"train_loss": -6.310571670532227, "global_step": 95897, "epoch": 2283} {"train_loss": -6.2557573318481445, "global_step": 95898, "epoch": 2283} {"train_loss": -6.072596549987793, "global_step": 95899, "epoch": 2283} {"train_loss": -6.354640007019043, "global_step": 95900, "epoch": 2283} {"train_loss": -6.241454124450684, "global_step": 95901, "epoch": 2283} {"train_loss": -6.180814743041992, "global_step": 95902, "epoch": 2283} {"train_loss": -6.300873756408691, "global_step": 95903, "epoch": 2283} {"train_loss": -6.32757568359375, "global_step": 95904, "epoch": 2283} {"train_loss": -6.238970756530762, "global_step": 95905, "epoch": 2283} {"train_loss": -6.2968430519104, "global_step": 95906, "epoch": 2283} {"train_loss": -6.267582893371582, "global_step": 95907, "epoch": 2283} {"train_loss": -6.325807094573975, "global_step": 95908, "epoch": 2283} {"train_loss": -6.271024703979492, "global_step": 95909, "epoch": 2283} {"train_loss": -6.277490615844727, "global_step": 95910, "epoch": 2283} {"train_loss": -6.221332550048828, "global_step": 95911, "epoch": 2283} {"train_loss": -6.302847862243652, "global_step": 95912, "epoch": 2283} {"train_loss": -6.391428470611572, "global_step": 95913, "epoch": 2283} {"train_loss": -6.258201599121094, "global_step": 95914, "epoch": 2283} {"train_loss": -6.262294292449951, "global_step": 95915, "epoch": 2283} {"train_loss": -6.290090560913086, "global_step": 95916, "epoch": 2283} {"train_loss": -6.248559951782227, "global_step": 95917, "epoch": 2283} {"train_loss": -6.206544876098633, "global_step": 95918, "epoch": 2283} {"train_loss": -6.279888153076172, "global_step": 95919, "epoch": 2283} {"train_loss": -6.3682332038879395, "global_step": 95920, "epoch": 2283} {"train_loss": -6.309557914733887, "global_step": 95921, "epoch": 2283} {"train_loss": -6.36875057220459, "global_step": 95922, "epoch": 2283} {"train_loss": -6.286360740661621, "global_step": 95923, "epoch": 2283} {"train_loss": -6.249807834625244, "global_step": 95924, "epoch": 2283} {"train_loss": -6.330679416656494, "global_step": 95925, "epoch": 2283} {"train_loss": -6.252496719360352, "global_step": 95926, "epoch": 2283} {"train_loss": -6.279259045918782, "global_step": 95927, "epoch": 2283, "val_loss": 67968.8046875} {"train_loss": -6.358241081237793, "global_step": 95928, "epoch": 2284} {"train_loss": -6.298666954040527, "global_step": 95929, "epoch": 2284} {"train_loss": -6.25486946105957, "global_step": 95930, "epoch": 2284} {"train_loss": -6.347064971923828, "global_step": 95931, "epoch": 2284} {"train_loss": -6.40934419631958, "global_step": 95932, "epoch": 2284} {"train_loss": -6.238555908203125, "global_step": 95933, "epoch": 2284} {"train_loss": -6.351076126098633, "global_step": 95934, "epoch": 2284} {"train_loss": -6.35974645614624, "global_step": 95935, "epoch": 2284} {"train_loss": -6.351932525634766, "global_step": 95936, "epoch": 2284} {"train_loss": -6.274592399597168, "global_step": 95937, "epoch": 2284} {"train_loss": -6.34274435043335, "global_step": 95938, "epoch": 2284} {"train_loss": -6.27828311920166, "global_step": 95939, "epoch": 2284} {"train_loss": -6.133143424987793, "global_step": 95940, "epoch": 2284} {"train_loss": -6.382176399230957, "global_step": 95941, "epoch": 2284} {"train_loss": -6.330263614654541, "global_step": 95942, "epoch": 2284} {"train_loss": -6.170269966125488, "global_step": 95943, "epoch": 2284} {"train_loss": -6.402778625488281, "global_step": 95944, "epoch": 2284} {"train_loss": -6.307317733764648, "global_step": 95945, "epoch": 2284} {"train_loss": -6.318051338195801, "global_step": 95946, "epoch": 2284} {"train_loss": -6.2790021896362305, "global_step": 95947, "epoch": 2284} {"train_loss": -6.255894184112549, "global_step": 95948, "epoch": 2284} {"train_loss": -6.2336883544921875, "global_step": 95949, "epoch": 2284} {"train_loss": -6.3374433517456055, "global_step": 95950, "epoch": 2284} {"train_loss": -6.215665340423584, "global_step": 95951, "epoch": 2284} {"train_loss": -6.277416706085205, "global_step": 95952, "epoch": 2284} {"train_loss": -6.275355339050293, "global_step": 95953, "epoch": 2284} {"train_loss": -6.21621036529541, "global_step": 95954, "epoch": 2284} {"train_loss": -6.343634605407715, "global_step": 95955, "epoch": 2284} {"train_loss": -6.265256881713867, "global_step": 95956, "epoch": 2284} {"train_loss": -6.242215156555176, "global_step": 95957, "epoch": 2284} {"train_loss": -6.31138801574707, "global_step": 95958, "epoch": 2284} {"train_loss": -6.310018062591553, "global_step": 95959, "epoch": 2284} {"train_loss": -6.342843532562256, "global_step": 95960, "epoch": 2284} {"train_loss": -6.265195846557617, "global_step": 95961, "epoch": 2284} {"train_loss": -6.331106662750244, "global_step": 95962, "epoch": 2284} {"train_loss": -6.312673568725586, "global_step": 95963, "epoch": 2284} {"train_loss": -6.332368850708008, "global_step": 95964, "epoch": 2284} {"train_loss": -6.3483452796936035, "global_step": 95965, "epoch": 2284} {"train_loss": -6.290322303771973, "global_step": 95966, "epoch": 2284} {"train_loss": -6.4005279541015625, "global_step": 95967, "epoch": 2284} {"train_loss": -6.240008354187012, "global_step": 95968, "epoch": 2284} {"train_loss": -6.301206895283291, "global_step": 95969, "epoch": 2284, "val_loss": 67946.0546875} {"train_loss": -6.333383560180664, "global_step": 95970, "epoch": 2285} {"train_loss": -6.441415786743164, "global_step": 95971, "epoch": 2285} {"train_loss": -6.351258754730225, "global_step": 95972, "epoch": 2285} {"train_loss": -6.324885368347168, "global_step": 95973, "epoch": 2285} {"train_loss": -6.289073944091797, "global_step": 95974, "epoch": 2285} {"train_loss": -6.327908039093018, "global_step": 95975, "epoch": 2285} {"train_loss": -6.320894241333008, "global_step": 95976, "epoch": 2285} {"train_loss": -6.306161880493164, "global_step": 95977, "epoch": 2285} {"train_loss": -6.244851589202881, "global_step": 95978, "epoch": 2285} {"train_loss": -6.249808311462402, "global_step": 95979, "epoch": 2285} {"train_loss": -6.311860084533691, "global_step": 95980, "epoch": 2285} {"train_loss": -6.363903999328613, "global_step": 95981, "epoch": 2285} {"train_loss": -6.220973014831543, "global_step": 95982, "epoch": 2285} {"train_loss": -6.377715110778809, "global_step": 95983, "epoch": 2285} {"train_loss": -6.304563522338867, "global_step": 95984, "epoch": 2285} {"train_loss": -6.194295883178711, "global_step": 95985, "epoch": 2285} {"train_loss": -6.244935989379883, "global_step": 95986, "epoch": 2285} {"train_loss": -6.308648109436035, "global_step": 95987, "epoch": 2285} {"train_loss": -6.320830821990967, "global_step": 95988, "epoch": 2285} {"train_loss": -6.36611795425415, "global_step": 95989, "epoch": 2285} {"train_loss": -6.308891296386719, "global_step": 95990, "epoch": 2285} {"train_loss": -6.27893590927124, "global_step": 95991, "epoch": 2285} {"train_loss": -6.218784332275391, "global_step": 95992, "epoch": 2285} {"train_loss": -6.129661560058594, "global_step": 95993, "epoch": 2285} {"train_loss": -6.2110595703125, "global_step": 95994, "epoch": 2285} {"train_loss": -6.315331935882568, "global_step": 95995, "epoch": 2285} {"train_loss": -6.296501159667969, "global_step": 95996, "epoch": 2285} {"train_loss": -6.3444061279296875, "global_step": 95997, "epoch": 2285} {"train_loss": -6.320107460021973, "global_step": 95998, "epoch": 2285} {"train_loss": -6.368659019470215, "global_step": 95999, "epoch": 2285} {"train_loss": -6.32086181640625, "global_step": 96000, "epoch": 2285} {"train_loss": -6.361536026000977, "global_step": 96001, "epoch": 2285} {"train_loss": -6.339713096618652, "global_step": 96002, "epoch": 2285} {"train_loss": -6.232646942138672, "global_step": 96003, "epoch": 2285} {"train_loss": -6.306792259216309, "global_step": 96004, "epoch": 2285} {"train_loss": -6.304946422576904, "global_step": 96005, "epoch": 2285} {"train_loss": -6.158665180206299, "global_step": 96006, "epoch": 2285} {"train_loss": -6.3704047203063965, "global_step": 96007, "epoch": 2285} {"train_loss": -6.2438459396362305, "global_step": 96008, "epoch": 2285} {"train_loss": -6.261023998260498, "global_step": 96009, "epoch": 2285} {"train_loss": -6.29976224899292, "global_step": 96010, "epoch": 2285} {"train_loss": -6.297310749689738, "global_step": 96011, "epoch": 2285, "val_loss": 68265.109375} {"train_loss": -6.219966888427734, "global_step": 96012, "epoch": 2286} {"train_loss": -6.257041931152344, "global_step": 96013, "epoch": 2286} {"train_loss": -6.409521579742432, "global_step": 96014, "epoch": 2286} {"train_loss": -6.20546817779541, "global_step": 96015, "epoch": 2286} {"train_loss": -6.288651466369629, "global_step": 96016, "epoch": 2286} {"train_loss": -6.363229274749756, "global_step": 96017, "epoch": 2286} {"train_loss": -6.368889808654785, "global_step": 96018, "epoch": 2286} {"train_loss": -6.38315486907959, "global_step": 96019, "epoch": 2286} {"train_loss": -6.298573970794678, "global_step": 96020, "epoch": 2286} {"train_loss": -6.329424858093262, "global_step": 96021, "epoch": 2286} {"train_loss": -6.209725379943848, "global_step": 96022, "epoch": 2286} {"train_loss": -6.292154788970947, "global_step": 96023, "epoch": 2286} {"train_loss": -6.321039199829102, "global_step": 96024, "epoch": 2286} {"train_loss": -6.1540093421936035, "global_step": 96025, "epoch": 2286} {"train_loss": -6.336915969848633, "global_step": 96026, "epoch": 2286} {"train_loss": -6.180661201477051, "global_step": 96027, "epoch": 2286} {"train_loss": -6.334515571594238, "global_step": 96028, "epoch": 2286} {"train_loss": -6.23277473449707, "global_step": 96029, "epoch": 2286} {"train_loss": -6.141659736633301, "global_step": 96030, "epoch": 2286} {"train_loss": -6.274211883544922, "global_step": 96031, "epoch": 2286} {"train_loss": -6.205475330352783, "global_step": 96032, "epoch": 2286} {"train_loss": -6.175941467285156, "global_step": 96033, "epoch": 2286} {"train_loss": -6.259593963623047, "global_step": 96034, "epoch": 2286} {"train_loss": -6.4187164306640625, "global_step": 96035, "epoch": 2286} {"train_loss": -6.236601829528809, "global_step": 96036, "epoch": 2286} {"train_loss": -6.34218692779541, "global_step": 96037, "epoch": 2286} {"train_loss": -6.260663032531738, "global_step": 96038, "epoch": 2286} {"train_loss": -6.338866710662842, "global_step": 96039, "epoch": 2286} {"train_loss": -6.304218292236328, "global_step": 96040, "epoch": 2286} {"train_loss": -6.200056076049805, "global_step": 96041, "epoch": 2286} {"train_loss": -6.233279705047607, "global_step": 96042, "epoch": 2286} {"train_loss": -6.268296718597412, "global_step": 96043, "epoch": 2286} {"train_loss": -6.259566783905029, "global_step": 96044, "epoch": 2286} {"train_loss": -6.352066516876221, "global_step": 96045, "epoch": 2286} {"train_loss": -6.218505859375, "global_step": 96046, "epoch": 2286} {"train_loss": -6.306125640869141, "global_step": 96047, "epoch": 2286} {"train_loss": -6.343238830566406, "global_step": 96048, "epoch": 2286} {"train_loss": -6.244266510009766, "global_step": 96049, "epoch": 2286} {"train_loss": -6.304701805114746, "global_step": 96050, "epoch": 2286} {"train_loss": -6.2586212158203125, "global_step": 96051, "epoch": 2286} {"train_loss": -6.179747104644775, "global_step": 96052, "epoch": 2286} {"train_loss": -6.276275532586234, "global_step": 96053, "epoch": 2286, "val_loss": 67966.71875} {"train_loss": -6.273049354553223, "global_step": 96054, "epoch": 2287} {"train_loss": -6.318341255187988, "global_step": 96055, "epoch": 2287} {"train_loss": -6.361041069030762, "global_step": 96056, "epoch": 2287} {"train_loss": -6.305335521697998, "global_step": 96057, "epoch": 2287} {"train_loss": -6.2094011306762695, "global_step": 96058, "epoch": 2287} {"train_loss": -6.319267272949219, "global_step": 96059, "epoch": 2287} {"train_loss": -6.225436210632324, "global_step": 96060, "epoch": 2287} {"train_loss": -6.195464611053467, "global_step": 96061, "epoch": 2287} {"train_loss": -6.254674911499023, "global_step": 96062, "epoch": 2287} {"train_loss": -6.275147438049316, "global_step": 96063, "epoch": 2287} {"train_loss": -6.385334491729736, "global_step": 96064, "epoch": 2287} {"train_loss": -6.295171737670898, "global_step": 96065, "epoch": 2287} {"train_loss": -6.344023704528809, "global_step": 96066, "epoch": 2287} {"train_loss": -6.37678337097168, "global_step": 96067, "epoch": 2287} {"train_loss": -6.260416030883789, "global_step": 96068, "epoch": 2287} {"train_loss": -6.3071699142456055, "global_step": 96069, "epoch": 2287} {"train_loss": -6.319429874420166, "global_step": 96070, "epoch": 2287} {"train_loss": -6.155689239501953, "global_step": 96071, "epoch": 2287} {"train_loss": -6.2043609619140625, "global_step": 96072, "epoch": 2287} {"train_loss": -6.255078315734863, "global_step": 96073, "epoch": 2287} {"train_loss": -6.272695064544678, "global_step": 96074, "epoch": 2287} {"train_loss": -6.284479141235352, "global_step": 96075, "epoch": 2287} {"train_loss": -6.254057884216309, "global_step": 96076, "epoch": 2287} {"train_loss": -6.240715503692627, "global_step": 96077, "epoch": 2287} {"train_loss": -6.274728775024414, "global_step": 96078, "epoch": 2287} {"train_loss": -6.3035888671875, "global_step": 96079, "epoch": 2287} {"train_loss": -6.342221260070801, "global_step": 96080, "epoch": 2287} {"train_loss": -6.224212169647217, "global_step": 96081, "epoch": 2287} {"train_loss": -6.253905296325684, "global_step": 96082, "epoch": 2287} {"train_loss": -6.248685359954834, "global_step": 96083, "epoch": 2287} {"train_loss": -6.295116424560547, "global_step": 96084, "epoch": 2287} {"train_loss": -6.196111679077148, "global_step": 96085, "epoch": 2287} {"train_loss": -6.281026840209961, "global_step": 96086, "epoch": 2287} {"train_loss": -6.375123500823975, "global_step": 96087, "epoch": 2287} {"train_loss": -6.228941917419434, "global_step": 96088, "epoch": 2287} {"train_loss": -6.1708831787109375, "global_step": 96089, "epoch": 2287} {"train_loss": -6.2947492599487305, "global_step": 96090, "epoch": 2287} {"train_loss": -6.307924270629883, "global_step": 96091, "epoch": 2287} {"train_loss": -6.3828630447387695, "global_step": 96092, "epoch": 2287} {"train_loss": -6.305503845214844, "global_step": 96093, "epoch": 2287} {"train_loss": -6.397120952606201, "global_step": 96094, "epoch": 2287} {"train_loss": -6.282980056036086, "global_step": 96095, "epoch": 2287, "val_loss": 67760.484375} {"train_loss": -6.452104568481445, "global_step": 96096, "epoch": 2288} {"train_loss": -6.362119674682617, "global_step": 96097, "epoch": 2288} {"train_loss": -6.202463150024414, "global_step": 96098, "epoch": 2288} {"train_loss": -6.283357620239258, "global_step": 96099, "epoch": 2288} {"train_loss": -6.290222644805908, "global_step": 96100, "epoch": 2288} {"train_loss": -6.175034523010254, "global_step": 96101, "epoch": 2288} {"train_loss": -6.303388595581055, "global_step": 96102, "epoch": 2288} {"train_loss": -6.255589485168457, "global_step": 96103, "epoch": 2288} {"train_loss": -6.300459861755371, "global_step": 96104, "epoch": 2288} {"train_loss": -6.434983730316162, "global_step": 96105, "epoch": 2288} {"train_loss": -6.315546989440918, "global_step": 96106, "epoch": 2288} {"train_loss": -6.2783660888671875, "global_step": 96107, "epoch": 2288} {"train_loss": -6.27047061920166, "global_step": 96108, "epoch": 2288} {"train_loss": -6.2856245040893555, "global_step": 96109, "epoch": 2288} {"train_loss": -6.266782760620117, "global_step": 96110, "epoch": 2288} {"train_loss": -6.286797523498535, "global_step": 96111, "epoch": 2288} {"train_loss": -6.2865190505981445, "global_step": 96112, "epoch": 2288} {"train_loss": -6.191588878631592, "global_step": 96113, "epoch": 2288} {"train_loss": -6.2083611488342285, "global_step": 96114, "epoch": 2288} {"train_loss": -6.286472320556641, "global_step": 96115, "epoch": 2288} {"train_loss": -6.294485092163086, "global_step": 96116, "epoch": 2288} {"train_loss": -6.187069416046143, "global_step": 96117, "epoch": 2288} {"train_loss": -6.403465747833252, "global_step": 96118, "epoch": 2288} {"train_loss": -6.254924774169922, "global_step": 96119, "epoch": 2288} {"train_loss": -6.262031555175781, "global_step": 96120, "epoch": 2288} {"train_loss": -6.209590911865234, "global_step": 96121, "epoch": 2288} {"train_loss": -6.439213752746582, "global_step": 96122, "epoch": 2288} {"train_loss": -6.279915809631348, "global_step": 96123, "epoch": 2288} {"train_loss": -6.319946765899658, "global_step": 96124, "epoch": 2288} {"train_loss": -6.200473785400391, "global_step": 96125, "epoch": 2288} {"train_loss": -6.327909469604492, "global_step": 96126, "epoch": 2288} {"train_loss": -6.188725471496582, "global_step": 96127, "epoch": 2288} {"train_loss": -6.2509870529174805, "global_step": 96128, "epoch": 2288} {"train_loss": -6.168273448944092, "global_step": 96129, "epoch": 2288} {"train_loss": -6.325845241546631, "global_step": 96130, "epoch": 2288} {"train_loss": -6.354729652404785, "global_step": 96131, "epoch": 2288} {"train_loss": -6.362969398498535, "global_step": 96132, "epoch": 2288} {"train_loss": -6.429013252258301, "global_step": 96133, "epoch": 2288} {"train_loss": -6.223328590393066, "global_step": 96134, "epoch": 2288} {"train_loss": -6.311319351196289, "global_step": 96135, "epoch": 2288} {"train_loss": -6.196846008300781, "global_step": 96136, "epoch": 2288} {"train_loss": -6.287186679385957, "global_step": 96137, "epoch": 2288, "val_loss": 67688.21875} {"train_loss": -6.419341087341309, "global_step": 96138, "epoch": 2289} {"train_loss": -6.17430305480957, "global_step": 96139, "epoch": 2289} {"train_loss": -6.35682487487793, "global_step": 96140, "epoch": 2289} {"train_loss": -6.327646255493164, "global_step": 96141, "epoch": 2289} {"train_loss": -6.352312088012695, "global_step": 96142, "epoch": 2289} {"train_loss": -6.366308212280273, "global_step": 96143, "epoch": 2289} {"train_loss": -6.293454170227051, "global_step": 96144, "epoch": 2289} {"train_loss": -6.195216178894043, "global_step": 96145, "epoch": 2289} {"train_loss": -6.298154830932617, "global_step": 96146, "epoch": 2289} {"train_loss": -6.322232246398926, "global_step": 96147, "epoch": 2289} {"train_loss": -6.266213417053223, "global_step": 96148, "epoch": 2289} {"train_loss": -6.382296562194824, "global_step": 96149, "epoch": 2289} {"train_loss": -6.220144271850586, "global_step": 96150, "epoch": 2289} {"train_loss": -6.474063396453857, "global_step": 96151, "epoch": 2289} {"train_loss": -6.336570739746094, "global_step": 96152, "epoch": 2289} {"train_loss": -6.294087886810303, "global_step": 96153, "epoch": 2289} {"train_loss": -6.388483047485352, "global_step": 96154, "epoch": 2289} {"train_loss": -6.361627578735352, "global_step": 96155, "epoch": 2289} {"train_loss": -6.245067119598389, "global_step": 96156, "epoch": 2289} {"train_loss": -6.3863019943237305, "global_step": 96157, "epoch": 2289} {"train_loss": -6.357382297515869, "global_step": 96158, "epoch": 2289} {"train_loss": -6.248569488525391, "global_step": 96159, "epoch": 2289} {"train_loss": -6.223835468292236, "global_step": 96160, "epoch": 2289} {"train_loss": -6.288599967956543, "global_step": 96161, "epoch": 2289} {"train_loss": -6.348849773406982, "global_step": 96162, "epoch": 2289} {"train_loss": -6.381032943725586, "global_step": 96163, "epoch": 2289} {"train_loss": -6.256673336029053, "global_step": 96164, "epoch": 2289} {"train_loss": -6.339923858642578, "global_step": 96165, "epoch": 2289} {"train_loss": -6.305804252624512, "global_step": 96166, "epoch": 2289} {"train_loss": -6.393672943115234, "global_step": 96167, "epoch": 2289} {"train_loss": -6.303633213043213, "global_step": 96168, "epoch": 2289} {"train_loss": -6.314744472503662, "global_step": 96169, "epoch": 2289} {"train_loss": -6.3303751945495605, "global_step": 96170, "epoch": 2289} {"train_loss": -6.409788131713867, "global_step": 96171, "epoch": 2289} {"train_loss": -6.297435760498047, "global_step": 96172, "epoch": 2289} {"train_loss": -6.29586124420166, "global_step": 96173, "epoch": 2289} {"train_loss": -6.381011962890625, "global_step": 96174, "epoch": 2289} {"train_loss": -6.279593467712402, "global_step": 96175, "epoch": 2289} {"train_loss": -6.3825178146362305, "global_step": 96176, "epoch": 2289} {"train_loss": -6.319451808929443, "global_step": 96177, "epoch": 2289} {"train_loss": -6.3634138107299805, "global_step": 96178, "epoch": 2289} {"train_loss": -6.3221437476930165, "global_step": 96179, "epoch": 2289, "val_loss": 68025.4921875} {"train_loss": -6.345522880554199, "global_step": 96180, "epoch": 2290} {"train_loss": -6.350818634033203, "global_step": 96181, "epoch": 2290} {"train_loss": -6.357901573181152, "global_step": 96182, "epoch": 2290} {"train_loss": -6.365518569946289, "global_step": 96183, "epoch": 2290} {"train_loss": -6.350323677062988, "global_step": 96184, "epoch": 2290} {"train_loss": -6.298081398010254, "global_step": 96185, "epoch": 2290} {"train_loss": -6.385956764221191, "global_step": 96186, "epoch": 2290} {"train_loss": -6.42595911026001, "global_step": 96187, "epoch": 2290} {"train_loss": -6.302614212036133, "global_step": 96188, "epoch": 2290} {"train_loss": -6.375545501708984, "global_step": 96189, "epoch": 2290} {"train_loss": -6.292459487915039, "global_step": 96190, "epoch": 2290} {"train_loss": -6.345141410827637, "global_step": 96191, "epoch": 2290} {"train_loss": -6.293953895568848, "global_step": 96192, "epoch": 2290} {"train_loss": -6.291236400604248, "global_step": 96193, "epoch": 2290} {"train_loss": -6.299421310424805, "global_step": 96194, "epoch": 2290} {"train_loss": -6.31246280670166, "global_step": 96195, "epoch": 2290} {"train_loss": -6.269082069396973, "global_step": 96196, "epoch": 2290} {"train_loss": -6.352171897888184, "global_step": 96197, "epoch": 2290} {"train_loss": -6.263680934906006, "global_step": 96198, "epoch": 2290} {"train_loss": -6.369410514831543, "global_step": 96199, "epoch": 2290} {"train_loss": -6.144676685333252, "global_step": 96200, "epoch": 2290} {"train_loss": -6.1851277351379395, "global_step": 96201, "epoch": 2290} {"train_loss": -6.492106914520264, "global_step": 96202, "epoch": 2290} {"train_loss": -6.297269821166992, "global_step": 96203, "epoch": 2290} {"train_loss": -6.312623023986816, "global_step": 96204, "epoch": 2290} {"train_loss": -6.398717403411865, "global_step": 96205, "epoch": 2290} {"train_loss": -6.335592269897461, "global_step": 96206, "epoch": 2290} {"train_loss": -6.41262149810791, "global_step": 96207, "epoch": 2290} {"train_loss": -6.388275623321533, "global_step": 96208, "epoch": 2290} {"train_loss": -6.308475494384766, "global_step": 96209, "epoch": 2290} {"train_loss": -6.302579402923584, "global_step": 96210, "epoch": 2290} {"train_loss": -6.355769157409668, "global_step": 96211, "epoch": 2290} {"train_loss": -6.448028564453125, "global_step": 96212, "epoch": 2290} {"train_loss": -6.224431037902832, "global_step": 96213, "epoch": 2290} {"train_loss": -6.229724884033203, "global_step": 96214, "epoch": 2290} {"train_loss": -6.378718852996826, "global_step": 96215, "epoch": 2290} {"train_loss": -6.204815864562988, "global_step": 96216, "epoch": 2290} {"train_loss": -6.315604209899902, "global_step": 96217, "epoch": 2290} {"train_loss": -6.351853370666504, "global_step": 96218, "epoch": 2290} {"train_loss": -6.161885738372803, "global_step": 96219, "epoch": 2290} {"train_loss": -6.214662551879883, "global_step": 96220, "epoch": 2290} {"train_loss": -6.3189018453870505, "global_step": 96221, "epoch": 2290, "val_loss": 68163.4375} {"train_loss": -6.275332450866699, "global_step": 96222, "epoch": 2291} {"train_loss": -6.207305431365967, "global_step": 96223, "epoch": 2291} {"train_loss": -6.315284729003906, "global_step": 96224, "epoch": 2291} {"train_loss": -6.208962440490723, "global_step": 96225, "epoch": 2291} {"train_loss": -6.2785563468933105, "global_step": 96226, "epoch": 2291} {"train_loss": -6.293242454528809, "global_step": 96227, "epoch": 2291} {"train_loss": -6.351021766662598, "global_step": 96228, "epoch": 2291} {"train_loss": -6.247625350952148, "global_step": 96229, "epoch": 2291} {"train_loss": -6.176181793212891, "global_step": 96230, "epoch": 2291} {"train_loss": -6.282655715942383, "global_step": 96231, "epoch": 2291} {"train_loss": -6.2637481689453125, "global_step": 96232, "epoch": 2291} {"train_loss": -6.301329135894775, "global_step": 96233, "epoch": 2291} {"train_loss": -6.249849319458008, "global_step": 96234, "epoch": 2291} {"train_loss": -6.263189315795898, "global_step": 96235, "epoch": 2291} {"train_loss": -6.173619747161865, "global_step": 96236, "epoch": 2291} {"train_loss": -6.153045654296875, "global_step": 96237, "epoch": 2291} {"train_loss": -6.151659965515137, "global_step": 96238, "epoch": 2291} {"train_loss": -6.273730278015137, "global_step": 96239, "epoch": 2291} {"train_loss": -6.297754287719727, "global_step": 96240, "epoch": 2291} {"train_loss": -6.263473033905029, "global_step": 96241, "epoch": 2291} {"train_loss": -6.2833123207092285, "global_step": 96242, "epoch": 2291} {"train_loss": -6.444375991821289, "global_step": 96243, "epoch": 2291} {"train_loss": -6.233555316925049, "global_step": 96244, "epoch": 2291} {"train_loss": -6.250823974609375, "global_step": 96245, "epoch": 2291} {"train_loss": -6.292360305786133, "global_step": 96246, "epoch": 2291} {"train_loss": -6.389476299285889, "global_step": 96247, "epoch": 2291} {"train_loss": -6.298628807067871, "global_step": 96248, "epoch": 2291} {"train_loss": -6.181948661804199, "global_step": 96249, "epoch": 2291} {"train_loss": -6.396200180053711, "global_step": 96250, "epoch": 2291} {"train_loss": -6.363229751586914, "global_step": 96251, "epoch": 2291} {"train_loss": -6.301290512084961, "global_step": 96252, "epoch": 2291} {"train_loss": -6.316949844360352, "global_step": 96253, "epoch": 2291} {"train_loss": -6.241098403930664, "global_step": 96254, "epoch": 2291} {"train_loss": -6.351940631866455, "global_step": 96255, "epoch": 2291} {"train_loss": -6.243191719055176, "global_step": 96256, "epoch": 2291} {"train_loss": -6.3109307289123535, "global_step": 96257, "epoch": 2291} {"train_loss": -6.250653266906738, "global_step": 96258, "epoch": 2291} {"train_loss": -6.288543701171875, "global_step": 96259, "epoch": 2291} {"train_loss": -6.27794885635376, "global_step": 96260, "epoch": 2291} {"train_loss": -6.296627998352051, "global_step": 96261, "epoch": 2291} {"train_loss": -6.284046173095703, "global_step": 96262, "epoch": 2291} {"train_loss": -6.276876029514131, "global_step": 96263, "epoch": 2291, "val_loss": 68373.0546875} {"train_loss": -6.286386489868164, "global_step": 96264, "epoch": 2292} {"train_loss": -6.247815132141113, "global_step": 96265, "epoch": 2292} {"train_loss": -6.218079090118408, "global_step": 96266, "epoch": 2292} {"train_loss": -6.29605770111084, "global_step": 96267, "epoch": 2292} {"train_loss": -6.1337456703186035, "global_step": 96268, "epoch": 2292} {"train_loss": -6.199692726135254, "global_step": 96269, "epoch": 2292} {"train_loss": -6.25014591217041, "global_step": 96270, "epoch": 2292} {"train_loss": -6.232082366943359, "global_step": 96271, "epoch": 2292} {"train_loss": -6.262348175048828, "global_step": 96272, "epoch": 2292} {"train_loss": -6.344331741333008, "global_step": 96273, "epoch": 2292} {"train_loss": -6.284579753875732, "global_step": 96274, "epoch": 2292} {"train_loss": -6.245278358459473, "global_step": 96275, "epoch": 2292} {"train_loss": -6.2062482833862305, "global_step": 96276, "epoch": 2292} {"train_loss": -6.23129415512085, "global_step": 96277, "epoch": 2292} {"train_loss": -6.321747779846191, "global_step": 96278, "epoch": 2292} {"train_loss": -6.163641929626465, "global_step": 96279, "epoch": 2292} {"train_loss": -6.414210796356201, "global_step": 96280, "epoch": 2292} {"train_loss": -6.375378608703613, "global_step": 96281, "epoch": 2292} {"train_loss": -6.243225574493408, "global_step": 96282, "epoch": 2292} {"train_loss": -6.213260650634766, "global_step": 96283, "epoch": 2292} {"train_loss": -6.313347816467285, "global_step": 96284, "epoch": 2292} {"train_loss": -6.2919745445251465, "global_step": 96285, "epoch": 2292} {"train_loss": -6.245394706726074, "global_step": 96286, "epoch": 2292} {"train_loss": -6.351357936859131, "global_step": 96287, "epoch": 2292} {"train_loss": -6.196283340454102, "global_step": 96288, "epoch": 2292} {"train_loss": -6.319796085357666, "global_step": 96289, "epoch": 2292} {"train_loss": -6.320287704467773, "global_step": 96290, "epoch": 2292} {"train_loss": -6.395857334136963, "global_step": 96291, "epoch": 2292} {"train_loss": -6.304584503173828, "global_step": 96292, "epoch": 2292} {"train_loss": -6.272226333618164, "global_step": 96293, "epoch": 2292} {"train_loss": -6.291995525360107, "global_step": 96294, "epoch": 2292} {"train_loss": -6.40718936920166, "global_step": 96295, "epoch": 2292} {"train_loss": -6.323685646057129, "global_step": 96296, "epoch": 2292} {"train_loss": -6.301403999328613, "global_step": 96297, "epoch": 2292} {"train_loss": -6.257629871368408, "global_step": 96298, "epoch": 2292} {"train_loss": -6.263239860534668, "global_step": 96299, "epoch": 2292} {"train_loss": -6.168841361999512, "global_step": 96300, "epoch": 2292} {"train_loss": -6.330760478973389, "global_step": 96301, "epoch": 2292} {"train_loss": -6.306541442871094, "global_step": 96302, "epoch": 2292} {"train_loss": -6.369065284729004, "global_step": 96303, "epoch": 2292} {"train_loss": -6.286140441894531, "global_step": 96304, "epoch": 2292} {"train_loss": -6.280429533549717, "global_step": 96305, "epoch": 2292, "val_loss": 67870.578125} {"train_loss": -6.352633953094482, "global_step": 96306, "epoch": 2293} {"train_loss": -6.225319862365723, "global_step": 96307, "epoch": 2293} {"train_loss": -6.361204147338867, "global_step": 96308, "epoch": 2293} {"train_loss": -6.324169158935547, "global_step": 96309, "epoch": 2293} {"train_loss": -6.233241558074951, "global_step": 96310, "epoch": 2293} {"train_loss": -6.347965717315674, "global_step": 96311, "epoch": 2293} {"train_loss": -6.2662153244018555, "global_step": 96312, "epoch": 2293} {"train_loss": -6.398857116699219, "global_step": 96313, "epoch": 2293} {"train_loss": -6.290570259094238, "global_step": 96314, "epoch": 2293} {"train_loss": -6.292116165161133, "global_step": 96315, "epoch": 2293} {"train_loss": -6.319833755493164, "global_step": 96316, "epoch": 2293} {"train_loss": -6.3578996658325195, "global_step": 96317, "epoch": 2293} {"train_loss": -6.3836669921875, "global_step": 96318, "epoch": 2293} {"train_loss": -6.312274932861328, "global_step": 96319, "epoch": 2293} {"train_loss": -6.4463701248168945, "global_step": 96320, "epoch": 2293} {"train_loss": -6.271402359008789, "global_step": 96321, "epoch": 2293} {"train_loss": -6.30865478515625, "global_step": 96322, "epoch": 2293} {"train_loss": -6.301139831542969, "global_step": 96323, "epoch": 2293} {"train_loss": -6.32810640335083, "global_step": 96324, "epoch": 2293} {"train_loss": -6.399935245513916, "global_step": 96325, "epoch": 2293} {"train_loss": -6.260586738586426, "global_step": 96326, "epoch": 2293} {"train_loss": -6.271847724914551, "global_step": 96327, "epoch": 2293} {"train_loss": -6.301661014556885, "global_step": 96328, "epoch": 2293} {"train_loss": -6.353635787963867, "global_step": 96329, "epoch": 2293} {"train_loss": -6.25502872467041, "global_step": 96330, "epoch": 2293} {"train_loss": -6.2940592765808105, "global_step": 96331, "epoch": 2293} {"train_loss": -6.336668014526367, "global_step": 96332, "epoch": 2293} {"train_loss": -6.316075325012207, "global_step": 96333, "epoch": 2293} {"train_loss": -6.414399147033691, "global_step": 96334, "epoch": 2293} {"train_loss": -6.3004255294799805, "global_step": 96335, "epoch": 2293} {"train_loss": -6.268350124359131, "global_step": 96336, "epoch": 2293} {"train_loss": -6.345572471618652, "global_step": 96337, "epoch": 2293} {"train_loss": -6.324437141418457, "global_step": 96338, "epoch": 2293} {"train_loss": -6.299283981323242, "global_step": 96339, "epoch": 2293} {"train_loss": -6.249283790588379, "global_step": 96340, "epoch": 2293} {"train_loss": -6.375149726867676, "global_step": 96341, "epoch": 2293} {"train_loss": -6.301382541656494, "global_step": 96342, "epoch": 2293} {"train_loss": -6.353388786315918, "global_step": 96343, "epoch": 2293} {"train_loss": -6.383705139160156, "global_step": 96344, "epoch": 2293} {"train_loss": -6.332061767578125, "global_step": 96345, "epoch": 2293} {"train_loss": -6.33017635345459, "global_step": 96346, "epoch": 2293} {"train_loss": -6.320549317768642, "global_step": 96347, "epoch": 2293, "val_loss": 68005.9140625} {"train_loss": -6.254727363586426, "global_step": 96348, "epoch": 2294} {"train_loss": -6.268039226531982, "global_step": 96349, "epoch": 2294} {"train_loss": -6.268028736114502, "global_step": 96350, "epoch": 2294} {"train_loss": -6.279829502105713, "global_step": 96351, "epoch": 2294} {"train_loss": -6.316515922546387, "global_step": 96352, "epoch": 2294} {"train_loss": -6.424941062927246, "global_step": 96353, "epoch": 2294} {"train_loss": -6.352799415588379, "global_step": 96354, "epoch": 2294} {"train_loss": -6.484016418457031, "global_step": 96355, "epoch": 2294} {"train_loss": -6.386082172393799, "global_step": 96356, "epoch": 2294} {"train_loss": -6.420942783355713, "global_step": 96357, "epoch": 2294} {"train_loss": -6.305129051208496, "global_step": 96358, "epoch": 2294} {"train_loss": -6.346749305725098, "global_step": 96359, "epoch": 2294} {"train_loss": -6.26422643661499, "global_step": 96360, "epoch": 2294} {"train_loss": -6.321909427642822, "global_step": 96361, "epoch": 2294} {"train_loss": -6.359472274780273, "global_step": 96362, "epoch": 2294} {"train_loss": -6.210050582885742, "global_step": 96363, "epoch": 2294} {"train_loss": -6.229058265686035, "global_step": 96364, "epoch": 2294} {"train_loss": -6.1549577713012695, "global_step": 96365, "epoch": 2294} {"train_loss": -6.396432876586914, "global_step": 96366, "epoch": 2294} {"train_loss": -6.33135986328125, "global_step": 96367, "epoch": 2294} {"train_loss": -6.283738136291504, "global_step": 96368, "epoch": 2294} {"train_loss": -6.281497001647949, "global_step": 96369, "epoch": 2294} {"train_loss": -6.281708240509033, "global_step": 96370, "epoch": 2294} {"train_loss": -6.314431190490723, "global_step": 96371, "epoch": 2294} {"train_loss": -6.316342830657959, "global_step": 96372, "epoch": 2294} {"train_loss": -6.358783721923828, "global_step": 96373, "epoch": 2294} {"train_loss": -6.322276592254639, "global_step": 96374, "epoch": 2294} {"train_loss": -6.3623552322387695, "global_step": 96375, "epoch": 2294} {"train_loss": -6.254976272583008, "global_step": 96376, "epoch": 2294} {"train_loss": -6.326667785644531, "global_step": 96377, "epoch": 2294} {"train_loss": -6.295321941375732, "global_step": 96378, "epoch": 2294} {"train_loss": -6.376022815704346, "global_step": 96379, "epoch": 2294} {"train_loss": -6.210649490356445, "global_step": 96380, "epoch": 2294} {"train_loss": -6.313021659851074, "global_step": 96381, "epoch": 2294} {"train_loss": -6.299760818481445, "global_step": 96382, "epoch": 2294} {"train_loss": -6.295136451721191, "global_step": 96383, "epoch": 2294} {"train_loss": -6.332277297973633, "global_step": 96384, "epoch": 2294} {"train_loss": -6.246078968048096, "global_step": 96385, "epoch": 2294} {"train_loss": -6.239072322845459, "global_step": 96386, "epoch": 2294} {"train_loss": -6.368954658508301, "global_step": 96387, "epoch": 2294} {"train_loss": -6.322977542877197, "global_step": 96388, "epoch": 2294} {"train_loss": -6.311368749255226, "global_step": 96389, "epoch": 2294, "val_loss": 67992.40625} {"train_loss": -6.325870037078857, "global_step": 96390, "epoch": 2295} {"train_loss": -6.320381164550781, "global_step": 96391, "epoch": 2295} {"train_loss": -6.213863372802734, "global_step": 96392, "epoch": 2295} {"train_loss": -6.202086448669434, "global_step": 96393, "epoch": 2295} {"train_loss": -6.313050270080566, "global_step": 96394, "epoch": 2295} {"train_loss": -6.351855754852295, "global_step": 96395, "epoch": 2295} {"train_loss": -6.349190711975098, "global_step": 96396, "epoch": 2295} {"train_loss": -6.29396915435791, "global_step": 96397, "epoch": 2295} {"train_loss": -6.40864896774292, "global_step": 96398, "epoch": 2295} {"train_loss": -6.276451110839844, "global_step": 96399, "epoch": 2295} {"train_loss": -6.406915187835693, "global_step": 96400, "epoch": 2295} {"train_loss": -6.382330894470215, "global_step": 96401, "epoch": 2295} {"train_loss": -6.304656982421875, "global_step": 96402, "epoch": 2295} {"train_loss": -6.21162223815918, "global_step": 96403, "epoch": 2295} {"train_loss": -6.415265083312988, "global_step": 96404, "epoch": 2295} {"train_loss": -6.311526298522949, "global_step": 96405, "epoch": 2295} {"train_loss": -6.3283257484436035, "global_step": 96406, "epoch": 2295} {"train_loss": -6.380129814147949, "global_step": 96407, "epoch": 2295} {"train_loss": -6.308692932128906, "global_step": 96408, "epoch": 2295} {"train_loss": -6.34068489074707, "global_step": 96409, "epoch": 2295} {"train_loss": -6.268130779266357, "global_step": 96410, "epoch": 2295} {"train_loss": -6.312000751495361, "global_step": 96411, "epoch": 2295} {"train_loss": -6.444867134094238, "global_step": 96412, "epoch": 2295} {"train_loss": -6.3487701416015625, "global_step": 96413, "epoch": 2295} {"train_loss": -6.231592178344727, "global_step": 96414, "epoch": 2295} {"train_loss": -6.439791679382324, "global_step": 96415, "epoch": 2295} {"train_loss": -6.234647274017334, "global_step": 96416, "epoch": 2295} {"train_loss": -6.352751731872559, "global_step": 96417, "epoch": 2295} {"train_loss": -6.356363296508789, "global_step": 96418, "epoch": 2295} {"train_loss": -6.244524002075195, "global_step": 96419, "epoch": 2295} {"train_loss": -6.21968936920166, "global_step": 96420, "epoch": 2295} {"train_loss": -6.268185615539551, "global_step": 96421, "epoch": 2295} {"train_loss": -6.143207550048828, "global_step": 96422, "epoch": 2295} {"train_loss": -6.272861480712891, "global_step": 96423, "epoch": 2295} {"train_loss": -6.29707670211792, "global_step": 96424, "epoch": 2295} {"train_loss": -6.2699384689331055, "global_step": 96425, "epoch": 2295} {"train_loss": -6.192676544189453, "global_step": 96426, "epoch": 2295} {"train_loss": -6.193370819091797, "global_step": 96427, "epoch": 2295} {"train_loss": -6.112307071685791, "global_step": 96428, "epoch": 2295} {"train_loss": -6.216206073760986, "global_step": 96429, "epoch": 2295} {"train_loss": -6.16267204284668, "global_step": 96430, "epoch": 2295} {"train_loss": -6.292766843523298, "global_step": 96431, "epoch": 2295, "val_loss": 67860.8125} {"train_loss": -6.227044105529785, "global_step": 96432, "epoch": 2296} {"train_loss": -6.3756794929504395, "global_step": 96433, "epoch": 2296} {"train_loss": -6.176055431365967, "global_step": 96434, "epoch": 2296} {"train_loss": -6.292801380157471, "global_step": 96435, "epoch": 2296} {"train_loss": -6.387292861938477, "global_step": 96436, "epoch": 2296} {"train_loss": -6.319607734680176, "global_step": 96437, "epoch": 2296} {"train_loss": -6.222476959228516, "global_step": 96438, "epoch": 2296} {"train_loss": -6.3792595863342285, "global_step": 96439, "epoch": 2296} {"train_loss": -6.290730953216553, "global_step": 96440, "epoch": 2296} {"train_loss": -6.374140739440918, "global_step": 96441, "epoch": 2296} {"train_loss": -6.345062732696533, "global_step": 96442, "epoch": 2296} {"train_loss": -6.306629180908203, "global_step": 96443, "epoch": 2296} {"train_loss": -6.339617729187012, "global_step": 96444, "epoch": 2296} {"train_loss": -6.294142723083496, "global_step": 96445, "epoch": 2296} {"train_loss": -6.383143424987793, "global_step": 96446, "epoch": 2296} {"train_loss": -6.251943588256836, "global_step": 96447, "epoch": 2296} {"train_loss": -6.219388961791992, "global_step": 96448, "epoch": 2296} {"train_loss": -6.2157063484191895, "global_step": 96449, "epoch": 2296} {"train_loss": -6.330709934234619, "global_step": 96450, "epoch": 2296} {"train_loss": -6.308167457580566, "global_step": 96451, "epoch": 2296} {"train_loss": -6.204211711883545, "global_step": 96452, "epoch": 2296} {"train_loss": -6.358834266662598, "global_step": 96453, "epoch": 2296} {"train_loss": -6.213509559631348, "global_step": 96454, "epoch": 2296} {"train_loss": -6.391016960144043, "global_step": 96455, "epoch": 2296} {"train_loss": -6.226245880126953, "global_step": 96456, "epoch": 2296} {"train_loss": -6.25887393951416, "global_step": 96457, "epoch": 2296} {"train_loss": -6.323733806610107, "global_step": 96458, "epoch": 2296} {"train_loss": -6.262300491333008, "global_step": 96459, "epoch": 2296} {"train_loss": -6.388741493225098, "global_step": 96460, "epoch": 2296} {"train_loss": -6.305202484130859, "global_step": 96461, "epoch": 2296} {"train_loss": -6.211705207824707, "global_step": 96462, "epoch": 2296} {"train_loss": -6.316578388214111, "global_step": 96463, "epoch": 2296} {"train_loss": -6.2757978439331055, "global_step": 96464, "epoch": 2296} {"train_loss": -6.234515190124512, "global_step": 96465, "epoch": 2296} {"train_loss": -6.191078186035156, "global_step": 96466, "epoch": 2296} {"train_loss": -6.296083927154541, "global_step": 96467, "epoch": 2296} {"train_loss": -6.165478706359863, "global_step": 96468, "epoch": 2296} {"train_loss": -6.22091007232666, "global_step": 96469, "epoch": 2296} {"train_loss": -6.244803428649902, "global_step": 96470, "epoch": 2296} {"train_loss": -6.302108287811279, "global_step": 96471, "epoch": 2296} {"train_loss": -6.360116958618164, "global_step": 96472, "epoch": 2296} {"train_loss": -6.286809194655645, "global_step": 96473, "epoch": 2296, "val_loss": 68118.859375} {"train_loss": -6.2504425048828125, "global_step": 96474, "epoch": 2297} {"train_loss": -6.226180076599121, "global_step": 96475, "epoch": 2297} {"train_loss": -6.275674343109131, "global_step": 96476, "epoch": 2297} {"train_loss": -6.230802536010742, "global_step": 96477, "epoch": 2297} {"train_loss": -6.243148326873779, "global_step": 96478, "epoch": 2297} {"train_loss": -6.266947269439697, "global_step": 96479, "epoch": 2297} {"train_loss": -6.226914405822754, "global_step": 96480, "epoch": 2297} {"train_loss": -6.292325019836426, "global_step": 96481, "epoch": 2297} {"train_loss": -6.309065341949463, "global_step": 96482, "epoch": 2297} {"train_loss": -6.209660053253174, "global_step": 96483, "epoch": 2297} {"train_loss": -6.353798866271973, "global_step": 96484, "epoch": 2297} {"train_loss": -6.361400604248047, "global_step": 96485, "epoch": 2297} {"train_loss": -6.361602783203125, "global_step": 96486, "epoch": 2297} {"train_loss": -6.320606231689453, "global_step": 96487, "epoch": 2297} {"train_loss": -6.265250205993652, "global_step": 96488, "epoch": 2297} {"train_loss": -6.25833797454834, "global_step": 96489, "epoch": 2297} {"train_loss": -6.27443790435791, "global_step": 96490, "epoch": 2297} {"train_loss": -6.152005195617676, "global_step": 96491, "epoch": 2297} {"train_loss": -6.319394588470459, "global_step": 96492, "epoch": 2297} {"train_loss": -6.211922645568848, "global_step": 96493, "epoch": 2297} {"train_loss": -6.308300971984863, "global_step": 96494, "epoch": 2297} {"train_loss": -6.262006759643555, "global_step": 96495, "epoch": 2297} {"train_loss": -6.287082672119141, "global_step": 96496, "epoch": 2297} {"train_loss": -6.3091139793396, "global_step": 96497, "epoch": 2297} {"train_loss": -6.302334785461426, "global_step": 96498, "epoch": 2297} {"train_loss": -6.260517120361328, "global_step": 96499, "epoch": 2297} {"train_loss": -6.174548625946045, "global_step": 96500, "epoch": 2297} {"train_loss": -6.264766693115234, "global_step": 96501, "epoch": 2297} {"train_loss": -6.14468240737915, "global_step": 96502, "epoch": 2297} {"train_loss": -6.301535606384277, "global_step": 96503, "epoch": 2297} {"train_loss": -6.291886329650879, "global_step": 96504, "epoch": 2297} {"train_loss": -6.27927827835083, "global_step": 96505, "epoch": 2297} {"train_loss": -6.3264079093933105, "global_step": 96506, "epoch": 2297} {"train_loss": -6.294646739959717, "global_step": 96507, "epoch": 2297} {"train_loss": -6.2562255859375, "global_step": 96508, "epoch": 2297} {"train_loss": -6.339283466339111, "global_step": 96509, "epoch": 2297} {"train_loss": -6.1611127853393555, "global_step": 96510, "epoch": 2297} {"train_loss": -6.16249942779541, "global_step": 96511, "epoch": 2297} {"train_loss": -6.321745872497559, "global_step": 96512, "epoch": 2297} {"train_loss": -6.120368957519531, "global_step": 96513, "epoch": 2297} {"train_loss": -6.183903217315674, "global_step": 96514, "epoch": 2297} {"train_loss": -6.260332868212745, "global_step": 96515, "epoch": 2297, "val_loss": 67911.0546875} {"train_loss": -6.3140411376953125, "global_step": 96516, "epoch": 2298} {"train_loss": -6.168187141418457, "global_step": 96517, "epoch": 2298} {"train_loss": -6.200666904449463, "global_step": 96518, "epoch": 2298} {"train_loss": -6.206646919250488, "global_step": 96519, "epoch": 2298} {"train_loss": -6.375367164611816, "global_step": 96520, "epoch": 2298} {"train_loss": -6.218514442443848, "global_step": 96521, "epoch": 2298} {"train_loss": -6.211791515350342, "global_step": 96522, "epoch": 2298} {"train_loss": -6.18155574798584, "global_step": 96523, "epoch": 2298} {"train_loss": -6.196283340454102, "global_step": 96524, "epoch": 2298} {"train_loss": -6.264028072357178, "global_step": 96525, "epoch": 2298} {"train_loss": -6.153154373168945, "global_step": 96526, "epoch": 2298} {"train_loss": -6.315313339233398, "global_step": 96527, "epoch": 2298} {"train_loss": -6.104593276977539, "global_step": 96528, "epoch": 2298} {"train_loss": -6.170563697814941, "global_step": 96529, "epoch": 2298} {"train_loss": -6.207239627838135, "global_step": 96530, "epoch": 2298} {"train_loss": -6.2122416496276855, "global_step": 96531, "epoch": 2298} {"train_loss": -6.304608345031738, "global_step": 96532, "epoch": 2298} {"train_loss": -6.260649681091309, "global_step": 96533, "epoch": 2298} {"train_loss": -6.317206382751465, "global_step": 96534, "epoch": 2298} {"train_loss": -6.32452392578125, "global_step": 96535, "epoch": 2298} {"train_loss": -6.225338935852051, "global_step": 96536, "epoch": 2298} {"train_loss": -6.169497966766357, "global_step": 96537, "epoch": 2298} {"train_loss": -6.304455757141113, "global_step": 96538, "epoch": 2298} {"train_loss": -6.151675701141357, "global_step": 96539, "epoch": 2298} {"train_loss": -6.244626998901367, "global_step": 96540, "epoch": 2298} {"train_loss": -6.174291133880615, "global_step": 96541, "epoch": 2298} {"train_loss": -6.218608856201172, "global_step": 96542, "epoch": 2298} {"train_loss": -6.272469520568848, "global_step": 96543, "epoch": 2298} {"train_loss": -6.248760223388672, "global_step": 96544, "epoch": 2298} {"train_loss": -6.255305290222168, "global_step": 96545, "epoch": 2298} {"train_loss": -6.131793975830078, "global_step": 96546, "epoch": 2298} {"train_loss": -6.250881195068359, "global_step": 96547, "epoch": 2298} {"train_loss": -6.295399188995361, "global_step": 96548, "epoch": 2298} {"train_loss": -6.128320693969727, "global_step": 96549, "epoch": 2298} {"train_loss": -6.302281379699707, "global_step": 96550, "epoch": 2298} {"train_loss": -6.431806564331055, "global_step": 96551, "epoch": 2298} {"train_loss": -6.283710479736328, "global_step": 96552, "epoch": 2298} {"train_loss": -6.324758529663086, "global_step": 96553, "epoch": 2298} {"train_loss": -6.257296562194824, "global_step": 96554, "epoch": 2298} {"train_loss": -6.243177890777588, "global_step": 96555, "epoch": 2298} {"train_loss": -6.27858829498291, "global_step": 96556, "epoch": 2298} {"train_loss": -6.2457976795378185, "global_step": 96557, "epoch": 2298, "val_loss": 67926.984375} {"train_loss": -6.332612037658691, "global_step": 96558, "epoch": 2299} {"train_loss": -6.241724967956543, "global_step": 96559, "epoch": 2299} {"train_loss": -6.324456214904785, "global_step": 96560, "epoch": 2299} {"train_loss": -6.258042335510254, "global_step": 96561, "epoch": 2299} {"train_loss": -6.373591423034668, "global_step": 96562, "epoch": 2299} {"train_loss": -6.367556571960449, "global_step": 96563, "epoch": 2299} {"train_loss": -6.174680709838867, "global_step": 96564, "epoch": 2299} {"train_loss": -6.226221084594727, "global_step": 96565, "epoch": 2299} {"train_loss": -6.321250915527344, "global_step": 96566, "epoch": 2299} {"train_loss": -6.1574249267578125, "global_step": 96567, "epoch": 2299} {"train_loss": -6.280015468597412, "global_step": 96568, "epoch": 2299} {"train_loss": -6.077719211578369, "global_step": 96569, "epoch": 2299} {"train_loss": -6.312131881713867, "global_step": 96570, "epoch": 2299} {"train_loss": -6.248464584350586, "global_step": 96571, "epoch": 2299} {"train_loss": -6.460002899169922, "global_step": 96572, "epoch": 2299} {"train_loss": -6.286099433898926, "global_step": 96573, "epoch": 2299} {"train_loss": -6.165073394775391, "global_step": 96574, "epoch": 2299} {"train_loss": -6.330177307128906, "global_step": 96575, "epoch": 2299} {"train_loss": -6.325356960296631, "global_step": 96576, "epoch": 2299} {"train_loss": -6.299917697906494, "global_step": 96577, "epoch": 2299} {"train_loss": -6.264187335968018, "global_step": 96578, "epoch": 2299} {"train_loss": -6.366735458374023, "global_step": 96579, "epoch": 2299} {"train_loss": -6.3665924072265625, "global_step": 96580, "epoch": 2299} {"train_loss": -6.244452476501465, "global_step": 96581, "epoch": 2299} {"train_loss": -6.210439205169678, "global_step": 96582, "epoch": 2299} {"train_loss": -6.212034702301025, "global_step": 96583, "epoch": 2299} {"train_loss": -6.208526611328125, "global_step": 96584, "epoch": 2299} {"train_loss": -6.243165016174316, "global_step": 96585, "epoch": 2299} {"train_loss": -6.270378589630127, "global_step": 96586, "epoch": 2299} {"train_loss": -6.252944469451904, "global_step": 96587, "epoch": 2299} {"train_loss": -6.285405158996582, "global_step": 96588, "epoch": 2299} {"train_loss": -6.3733320236206055, "global_step": 96589, "epoch": 2299} {"train_loss": -6.340362071990967, "global_step": 96590, "epoch": 2299} {"train_loss": -6.211056232452393, "global_step": 96591, "epoch": 2299} {"train_loss": -6.428035736083984, "global_step": 96592, "epoch": 2299} {"train_loss": -6.17540979385376, "global_step": 96593, "epoch": 2299} {"train_loss": -6.285948753356934, "global_step": 96594, "epoch": 2299} {"train_loss": -6.335930824279785, "global_step": 96595, "epoch": 2299} {"train_loss": -6.262047290802002, "global_step": 96596, "epoch": 2299} {"train_loss": -6.340899467468262, "global_step": 96597, "epoch": 2299} {"train_loss": -6.267365455627441, "global_step": 96598, "epoch": 2299} {"train_loss": -6.279903797876267, "global_step": 96599, "epoch": 2299, "val_loss": 67825.859375} {"train_loss": -6.3523945808410645, "global_step": 96600, "epoch": 2300} {"train_loss": -6.378876686096191, "global_step": 96601, "epoch": 2300} {"train_loss": -6.305179595947266, "global_step": 96602, "epoch": 2300} {"train_loss": -6.277835845947266, "global_step": 96603, "epoch": 2300} {"train_loss": -6.276155471801758, "global_step": 96604, "epoch": 2300} {"train_loss": -6.399578094482422, "global_step": 96605, "epoch": 2300} {"train_loss": -6.29958963394165, "global_step": 96606, "epoch": 2300} {"train_loss": -6.252946853637695, "global_step": 96607, "epoch": 2300} {"train_loss": -6.295995235443115, "global_step": 96608, "epoch": 2300} {"train_loss": -6.230802536010742, "global_step": 96609, "epoch": 2300} {"train_loss": -6.337372779846191, "global_step": 96610, "epoch": 2300} {"train_loss": -6.272111892700195, "global_step": 96611, "epoch": 2300} {"train_loss": -6.2799296379089355, "global_step": 96612, "epoch": 2300} {"train_loss": -6.336979389190674, "global_step": 96613, "epoch": 2300} {"train_loss": -6.298486709594727, "global_step": 96614, "epoch": 2300} {"train_loss": -6.2325639724731445, "global_step": 96615, "epoch": 2300} {"train_loss": -6.3206868171691895, "global_step": 96616, "epoch": 2300} {"train_loss": -6.392230033874512, "global_step": 96617, "epoch": 2300} {"train_loss": -6.2952165603637695, "global_step": 96618, "epoch": 2300} {"train_loss": -6.342535972595215, "global_step": 96619, "epoch": 2300} {"train_loss": -6.392107963562012, "global_step": 96620, "epoch": 2300} {"train_loss": -6.2570390701293945, "global_step": 96621, "epoch": 2300} {"train_loss": -6.5081000328063965, "global_step": 96622, "epoch": 2300} {"train_loss": -6.268027305603027, "global_step": 96623, "epoch": 2300} {"train_loss": -6.33476448059082, "global_step": 96624, "epoch": 2300} {"train_loss": -6.3395538330078125, "global_step": 96625, "epoch": 2300} {"train_loss": -6.3983073234558105, "global_step": 96626, "epoch": 2300} {"train_loss": -6.32605504989624, "global_step": 96627, "epoch": 2300} {"train_loss": -6.188549041748047, "global_step": 96628, "epoch": 2300} {"train_loss": -6.308615684509277, "global_step": 96629, "epoch": 2300} {"train_loss": -6.309844970703125, "global_step": 96630, "epoch": 2300} {"train_loss": -6.362850189208984, "global_step": 96631, "epoch": 2300} {"train_loss": -6.305375099182129, "global_step": 96632, "epoch": 2300} {"train_loss": -6.319091796875, "global_step": 96633, "epoch": 2300} {"train_loss": -6.3266096115112305, "global_step": 96634, "epoch": 2300} {"train_loss": -6.447972774505615, "global_step": 96635, "epoch": 2300} {"train_loss": -6.357350826263428, "global_step": 96636, "epoch": 2300} {"train_loss": -6.432900428771973, "global_step": 96637, "epoch": 2300} {"train_loss": -6.374682903289795, "global_step": 96638, "epoch": 2300} {"train_loss": -6.304633140563965, "global_step": 96639, "epoch": 2300} {"train_loss": -6.38209867477417, "global_step": 96640, "epoch": 2300} {"train_loss": -6.327698332922799, "global_step": 96641, "epoch": 2300, "train/sim_max_reward_0": 0.415979133981636, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.1283257021995788, "train/sim_max_reward_3": 0.13806358806212254, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.8787237892265499, "test/sim_max_reward_4400000": 0.9316847305635062, "test/sim_max_reward_4400001": 0.9292197748313934, "test/sim_max_reward_4400002": 0.521178899733921, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9074947286071621, "test/sim_max_reward_4400006": 0.6771847642906482, "test/sim_max_reward_4400007": 0.8637268502247722, "test/sim_max_reward_4400008": 0.3020535315665783, "test/sim_max_reward_4400009": 0.5086954925278983, "test/sim_max_reward_4400010": 0.2182625015548132, "test/sim_max_reward_4400011": 0.2404302170717656, "test/sim_max_reward_4400012": 0.9850554138049302, "test/sim_max_reward_4400013": 0.969862354682524, "test/sim_max_reward_4400014": 0.8679832122767981, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2032493357823996, "test/sim_max_reward_4400019": 0.3252078703951492, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8813705408362472, "test/sim_max_reward_4400023": 0.4175685147126971, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2706682996859118, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 4.114803761337679e-07, "test/sim_max_reward_4400028": 0.9869107218253915, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9611110955566408, "test/sim_max_reward_4400031": 0.9493945612482149, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.20902804079858614, "test/sim_max_reward_4400034": 0.8754702133114355, "test/sim_max_reward_4400035": 0.5463435716924886, "test/sim_max_reward_4400036": 0.37394266365690776, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.8302344291590267, "test/sim_max_reward_4400039": 0.8708047092352834, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.890156350658686, "test/sim_max_reward_4400042": 0.8864528857349149, "test/sim_max_reward_4400043": 0.6721865665443969, "test/sim_max_reward_4400044": 0.8687320049581934, "test/sim_max_reward_4400045": 0.993798370292283, "test/sim_max_reward_4400046": 0.8850852508931347, "test/sim_max_reward_4400047": 0.9754319811011952, "test/sim_max_reward_4400048": 0.0008498798065148638, "test/sim_max_reward_4400049": 0.8646130299991847, "train/mean_score": 0.5935153689116479, "test/mean_score": 0.5246638134780767, "val_loss": 67901.5546875} {"train_loss": -6.464827060699463, "global_step": 96642, "epoch": 2301} {"train_loss": -6.459038257598877, "global_step": 96643, "epoch": 2301} {"train_loss": -6.394283294677734, "global_step": 96644, "epoch": 2301} {"train_loss": -6.27662992477417, "global_step": 96645, "epoch": 2301} {"train_loss": -6.350006580352783, "global_step": 96646, "epoch": 2301} {"train_loss": -6.156198978424072, "global_step": 96647, "epoch": 2301} {"train_loss": -6.403641700744629, "global_step": 96648, "epoch": 2301} {"train_loss": -6.288473606109619, "global_step": 96649, "epoch": 2301} {"train_loss": -6.299861907958984, "global_step": 96650, "epoch": 2301} {"train_loss": -6.438992977142334, "global_step": 96651, "epoch": 2301} {"train_loss": -6.265705108642578, "global_step": 96652, "epoch": 2301} {"train_loss": -6.365229606628418, "global_step": 96653, "epoch": 2301} {"train_loss": -6.301364898681641, "global_step": 96654, "epoch": 2301} {"train_loss": -6.24232816696167, "global_step": 96655, "epoch": 2301} {"train_loss": -6.3382673263549805, "global_step": 96656, "epoch": 2301} {"train_loss": -6.2417144775390625, "global_step": 96657, "epoch": 2301} {"train_loss": -6.345043659210205, "global_step": 96658, "epoch": 2301} {"train_loss": -6.314327239990234, "global_step": 96659, "epoch": 2301} {"train_loss": -6.354969024658203, "global_step": 96660, "epoch": 2301} {"train_loss": -6.392041206359863, "global_step": 96661, "epoch": 2301} {"train_loss": -6.244268417358398, "global_step": 96662, "epoch": 2301} {"train_loss": -6.288870334625244, "global_step": 96663, "epoch": 2301} {"train_loss": -6.424446105957031, "global_step": 96664, "epoch": 2301} {"train_loss": -6.317933082580566, "global_step": 96665, "epoch": 2301} {"train_loss": -6.3073039054870605, "global_step": 96666, "epoch": 2301} {"train_loss": -6.365495681762695, "global_step": 96667, "epoch": 2301} {"train_loss": -6.289763450622559, "global_step": 96668, "epoch": 2301} {"train_loss": -6.323075294494629, "global_step": 96669, "epoch": 2301} {"train_loss": -6.3214263916015625, "global_step": 96670, "epoch": 2301} {"train_loss": -6.383835792541504, "global_step": 96671, "epoch": 2301} {"train_loss": -6.248151779174805, "global_step": 96672, "epoch": 2301} {"train_loss": -6.473930358886719, "global_step": 96673, "epoch": 2301} {"train_loss": -6.381649971008301, "global_step": 96674, "epoch": 2301} {"train_loss": -6.328009605407715, "global_step": 96675, "epoch": 2301} {"train_loss": -6.296023368835449, "global_step": 96676, "epoch": 2301} {"train_loss": -6.210545063018799, "global_step": 96677, "epoch": 2301} {"train_loss": -6.253701686859131, "global_step": 96678, "epoch": 2301} {"train_loss": -6.319838523864746, "global_step": 96679, "epoch": 2301} {"train_loss": -6.2135162353515625, "global_step": 96680, "epoch": 2301} {"train_loss": -6.244372367858887, "global_step": 96681, "epoch": 2301} {"train_loss": -6.26619815826416, "global_step": 96682, "epoch": 2301} {"train_loss": -6.317832288287935, "global_step": 96683, "epoch": 2301, "val_loss": 67984.7421875} {"train_loss": -6.307244777679443, "global_step": 96684, "epoch": 2302} {"train_loss": -6.2243194580078125, "global_step": 96685, "epoch": 2302} {"train_loss": -6.326399326324463, "global_step": 96686, "epoch": 2302} {"train_loss": -6.262709140777588, "global_step": 96687, "epoch": 2302} {"train_loss": -6.393096923828125, "global_step": 96688, "epoch": 2302} {"train_loss": -6.289982318878174, "global_step": 96689, "epoch": 2302} {"train_loss": -6.279855251312256, "global_step": 96690, "epoch": 2302} {"train_loss": -6.31589412689209, "global_step": 96691, "epoch": 2302} {"train_loss": -6.328039646148682, "global_step": 96692, "epoch": 2302} {"train_loss": -6.427875518798828, "global_step": 96693, "epoch": 2302} {"train_loss": -6.34301233291626, "global_step": 96694, "epoch": 2302} {"train_loss": -6.369245529174805, "global_step": 96695, "epoch": 2302} {"train_loss": -6.331646919250488, "global_step": 96696, "epoch": 2302} {"train_loss": -6.407934188842773, "global_step": 96697, "epoch": 2302} {"train_loss": -6.295042991638184, "global_step": 96698, "epoch": 2302} {"train_loss": -6.391449928283691, "global_step": 96699, "epoch": 2302} {"train_loss": -6.423330307006836, "global_step": 96700, "epoch": 2302} {"train_loss": -6.4085373878479, "global_step": 96701, "epoch": 2302} {"train_loss": -6.296840667724609, "global_step": 96702, "epoch": 2302} {"train_loss": -6.296116828918457, "global_step": 96703, "epoch": 2302} {"train_loss": -6.369664669036865, "global_step": 96704, "epoch": 2302} {"train_loss": -6.235123157501221, "global_step": 96705, "epoch": 2302} {"train_loss": -6.325791358947754, "global_step": 96706, "epoch": 2302} {"train_loss": -6.331109046936035, "global_step": 96707, "epoch": 2302} {"train_loss": -6.287927150726318, "global_step": 96708, "epoch": 2302} {"train_loss": -6.321593284606934, "global_step": 96709, "epoch": 2302} {"train_loss": -6.279529094696045, "global_step": 96710, "epoch": 2302} {"train_loss": -6.389400005340576, "global_step": 96711, "epoch": 2302} {"train_loss": -6.317078590393066, "global_step": 96712, "epoch": 2302} {"train_loss": -6.39146614074707, "global_step": 96713, "epoch": 2302} {"train_loss": -6.240402698516846, "global_step": 96714, "epoch": 2302} {"train_loss": -6.510403156280518, "global_step": 96715, "epoch": 2302} {"train_loss": -6.354983806610107, "global_step": 96716, "epoch": 2302} {"train_loss": -6.289678573608398, "global_step": 96717, "epoch": 2302} {"train_loss": -6.312559127807617, "global_step": 96718, "epoch": 2302} {"train_loss": -6.182387351989746, "global_step": 96719, "epoch": 2302} {"train_loss": -6.144786834716797, "global_step": 96720, "epoch": 2302} {"train_loss": -6.28359842300415, "global_step": 96721, "epoch": 2302} {"train_loss": -6.29653263092041, "global_step": 96722, "epoch": 2302} {"train_loss": -6.224183082580566, "global_step": 96723, "epoch": 2302} {"train_loss": -6.241901397705078, "global_step": 96724, "epoch": 2302} {"train_loss": -6.3197676454271585, "global_step": 96725, "epoch": 2302, "val_loss": 67768.0} {"train_loss": -6.354580879211426, "global_step": 96726, "epoch": 2303} {"train_loss": -6.321295738220215, "global_step": 96727, "epoch": 2303} {"train_loss": -6.423730850219727, "global_step": 96728, "epoch": 2303} {"train_loss": -6.434992790222168, "global_step": 96729, "epoch": 2303} {"train_loss": -6.36734676361084, "global_step": 96730, "epoch": 2303} {"train_loss": -6.385111331939697, "global_step": 96731, "epoch": 2303} {"train_loss": -6.355380535125732, "global_step": 96732, "epoch": 2303} {"train_loss": -6.327381134033203, "global_step": 96733, "epoch": 2303} {"train_loss": -6.311129570007324, "global_step": 96734, "epoch": 2303} {"train_loss": -6.375020980834961, "global_step": 96735, "epoch": 2303} {"train_loss": -6.252655982971191, "global_step": 96736, "epoch": 2303} {"train_loss": -6.261256694793701, "global_step": 96737, "epoch": 2303} {"train_loss": -6.1797075271606445, "global_step": 96738, "epoch": 2303} {"train_loss": -6.239021301269531, "global_step": 96739, "epoch": 2303} {"train_loss": -6.333841323852539, "global_step": 96740, "epoch": 2303} {"train_loss": -6.346312999725342, "global_step": 96741, "epoch": 2303} {"train_loss": -6.336698532104492, "global_step": 96742, "epoch": 2303} {"train_loss": -6.282374382019043, "global_step": 96743, "epoch": 2303} {"train_loss": -6.260534763336182, "global_step": 96744, "epoch": 2303} {"train_loss": -6.39921236038208, "global_step": 96745, "epoch": 2303} {"train_loss": -6.336528778076172, "global_step": 96746, "epoch": 2303} {"train_loss": -6.374844551086426, "global_step": 96747, "epoch": 2303} {"train_loss": -6.244353294372559, "global_step": 96748, "epoch": 2303} {"train_loss": -6.272688865661621, "global_step": 96749, "epoch": 2303} {"train_loss": -6.321913242340088, "global_step": 96750, "epoch": 2303} {"train_loss": -6.193567276000977, "global_step": 96751, "epoch": 2303} {"train_loss": -6.304356098175049, "global_step": 96752, "epoch": 2303} {"train_loss": -6.191462993621826, "global_step": 96753, "epoch": 2303} {"train_loss": -6.289800643920898, "global_step": 96754, "epoch": 2303} {"train_loss": -6.188457489013672, "global_step": 96755, "epoch": 2303} {"train_loss": -6.189609527587891, "global_step": 96756, "epoch": 2303} {"train_loss": -6.138476371765137, "global_step": 96757, "epoch": 2303} {"train_loss": -6.199214935302734, "global_step": 96758, "epoch": 2303} {"train_loss": -6.3534040451049805, "global_step": 96759, "epoch": 2303} {"train_loss": -6.44110631942749, "global_step": 96760, "epoch": 2303} {"train_loss": -6.241881370544434, "global_step": 96761, "epoch": 2303} {"train_loss": -6.268945693969727, "global_step": 96762, "epoch": 2303} {"train_loss": -6.227985382080078, "global_step": 96763, "epoch": 2303} {"train_loss": -6.246354103088379, "global_step": 96764, "epoch": 2303} {"train_loss": -6.237897872924805, "global_step": 96765, "epoch": 2303} {"train_loss": -6.284656047821045, "global_step": 96766, "epoch": 2303} {"train_loss": -6.295462472098214, "global_step": 96767, "epoch": 2303, "val_loss": 67899.765625} {"train_loss": -6.305716037750244, "global_step": 96768, "epoch": 2304} {"train_loss": -6.309212684631348, "global_step": 96769, "epoch": 2304} {"train_loss": -6.406847953796387, "global_step": 96770, "epoch": 2304} {"train_loss": -6.308788299560547, "global_step": 96771, "epoch": 2304} {"train_loss": -6.394979476928711, "global_step": 96772, "epoch": 2304} {"train_loss": -6.176692008972168, "global_step": 96773, "epoch": 2304} {"train_loss": -6.346523284912109, "global_step": 96774, "epoch": 2304} {"train_loss": -6.250692367553711, "global_step": 96775, "epoch": 2304} {"train_loss": -6.395628929138184, "global_step": 96776, "epoch": 2304} {"train_loss": -6.2317705154418945, "global_step": 96777, "epoch": 2304} {"train_loss": -6.289404392242432, "global_step": 96778, "epoch": 2304} {"train_loss": -6.188796043395996, "global_step": 96779, "epoch": 2304} {"train_loss": -6.291301250457764, "global_step": 96780, "epoch": 2304} {"train_loss": -6.257750511169434, "global_step": 96781, "epoch": 2304} {"train_loss": -6.372646331787109, "global_step": 96782, "epoch": 2304} {"train_loss": -6.27774715423584, "global_step": 96783, "epoch": 2304} {"train_loss": -6.229244709014893, "global_step": 96784, "epoch": 2304} {"train_loss": -6.321739196777344, "global_step": 96785, "epoch": 2304} {"train_loss": -6.248959541320801, "global_step": 96786, "epoch": 2304} {"train_loss": -6.22941780090332, "global_step": 96787, "epoch": 2304} {"train_loss": -6.356044769287109, "global_step": 96788, "epoch": 2304} {"train_loss": -6.3151702880859375, "global_step": 96789, "epoch": 2304} {"train_loss": -6.299880504608154, "global_step": 96790, "epoch": 2304} {"train_loss": -6.270051002502441, "global_step": 96791, "epoch": 2304} {"train_loss": -6.309872627258301, "global_step": 96792, "epoch": 2304} {"train_loss": -6.269601821899414, "global_step": 96793, "epoch": 2304} {"train_loss": -6.219647407531738, "global_step": 96794, "epoch": 2304} {"train_loss": -6.318367958068848, "global_step": 96795, "epoch": 2304} {"train_loss": -6.252507209777832, "global_step": 96796, "epoch": 2304} {"train_loss": -6.377740859985352, "global_step": 96797, "epoch": 2304} {"train_loss": -6.345301628112793, "global_step": 96798, "epoch": 2304} {"train_loss": -6.293054103851318, "global_step": 96799, "epoch": 2304} {"train_loss": -6.312483787536621, "global_step": 96800, "epoch": 2304} {"train_loss": -6.405448913574219, "global_step": 96801, "epoch": 2304} {"train_loss": -6.221569061279297, "global_step": 96802, "epoch": 2304} {"train_loss": -6.316620826721191, "global_step": 96803, "epoch": 2304} {"train_loss": -6.374784469604492, "global_step": 96804, "epoch": 2304} {"train_loss": -6.381685256958008, "global_step": 96805, "epoch": 2304} {"train_loss": -6.375185966491699, "global_step": 96806, "epoch": 2304} {"train_loss": -6.315817356109619, "global_step": 96807, "epoch": 2304} {"train_loss": -6.213382720947266, "global_step": 96808, "epoch": 2304} {"train_loss": -6.301550933292934, "global_step": 96809, "epoch": 2304, "val_loss": 68075.7890625} {"train_loss": -6.2014617919921875, "global_step": 96810, "epoch": 2305} {"train_loss": -6.177009582519531, "global_step": 96811, "epoch": 2305} {"train_loss": -6.324306488037109, "global_step": 96812, "epoch": 2305} {"train_loss": -6.288822174072266, "global_step": 96813, "epoch": 2305} {"train_loss": -6.170639991760254, "global_step": 96814, "epoch": 2305} {"train_loss": -6.271598815917969, "global_step": 96815, "epoch": 2305} {"train_loss": -6.241781234741211, "global_step": 96816, "epoch": 2305} {"train_loss": -6.35488224029541, "global_step": 96817, "epoch": 2305} {"train_loss": -6.245505332946777, "global_step": 96818, "epoch": 2305} {"train_loss": -6.305452823638916, "global_step": 96819, "epoch": 2305} {"train_loss": -6.455221652984619, "global_step": 96820, "epoch": 2305} {"train_loss": -6.329833030700684, "global_step": 96821, "epoch": 2305} {"train_loss": -6.2520270347595215, "global_step": 96822, "epoch": 2305} {"train_loss": -6.298463344573975, "global_step": 96823, "epoch": 2305} {"train_loss": -6.251430511474609, "global_step": 96824, "epoch": 2305} {"train_loss": -6.235539436340332, "global_step": 96825, "epoch": 2305} {"train_loss": -6.326847553253174, "global_step": 96826, "epoch": 2305} {"train_loss": -6.293551445007324, "global_step": 96827, "epoch": 2305} {"train_loss": -6.313643932342529, "global_step": 96828, "epoch": 2305} {"train_loss": -6.290557861328125, "global_step": 96829, "epoch": 2305} {"train_loss": -6.33945369720459, "global_step": 96830, "epoch": 2305} {"train_loss": -6.286218643188477, "global_step": 96831, "epoch": 2305} {"train_loss": -6.282022476196289, "global_step": 96832, "epoch": 2305} {"train_loss": -6.279973030090332, "global_step": 96833, "epoch": 2305} {"train_loss": -6.284209251403809, "global_step": 96834, "epoch": 2305} {"train_loss": -6.347175121307373, "global_step": 96835, "epoch": 2305} {"train_loss": -6.395723819732666, "global_step": 96836, "epoch": 2305} {"train_loss": -6.325296401977539, "global_step": 96837, "epoch": 2305} {"train_loss": -6.275542259216309, "global_step": 96838, "epoch": 2305} {"train_loss": -6.338923454284668, "global_step": 96839, "epoch": 2305} {"train_loss": -6.143411636352539, "global_step": 96840, "epoch": 2305} {"train_loss": -6.212268352508545, "global_step": 96841, "epoch": 2305} {"train_loss": -6.418735980987549, "global_step": 96842, "epoch": 2305} {"train_loss": -6.334088325500488, "global_step": 96843, "epoch": 2305} {"train_loss": -6.333376884460449, "global_step": 96844, "epoch": 2305} {"train_loss": -6.417727947235107, "global_step": 96845, "epoch": 2305} {"train_loss": -6.286924362182617, "global_step": 96846, "epoch": 2305} {"train_loss": -6.271366596221924, "global_step": 96847, "epoch": 2305} {"train_loss": -6.3852219581604, "global_step": 96848, "epoch": 2305} {"train_loss": -6.267764091491699, "global_step": 96849, "epoch": 2305} {"train_loss": -6.23775053024292, "global_step": 96850, "epoch": 2305} {"train_loss": -6.293290921619961, "global_step": 96851, "epoch": 2305, "val_loss": 67846.90625} {"train_loss": -6.337133407592773, "global_step": 96852, "epoch": 2306} {"train_loss": -6.22493839263916, "global_step": 96853, "epoch": 2306} {"train_loss": -6.319735050201416, "global_step": 96854, "epoch": 2306} {"train_loss": -6.1669135093688965, "global_step": 96855, "epoch": 2306} {"train_loss": -6.315940856933594, "global_step": 96856, "epoch": 2306} {"train_loss": -6.312707901000977, "global_step": 96857, "epoch": 2306} {"train_loss": -6.455316543579102, "global_step": 96858, "epoch": 2306} {"train_loss": -6.2999372482299805, "global_step": 96859, "epoch": 2306} {"train_loss": -6.311616897583008, "global_step": 96860, "epoch": 2306} {"train_loss": -6.369433403015137, "global_step": 96861, "epoch": 2306} {"train_loss": -6.3019022941589355, "global_step": 96862, "epoch": 2306} {"train_loss": -6.323711395263672, "global_step": 96863, "epoch": 2306} {"train_loss": -6.2857747077941895, "global_step": 96864, "epoch": 2306} {"train_loss": -6.266106605529785, "global_step": 96865, "epoch": 2306} {"train_loss": -6.337653160095215, "global_step": 96866, "epoch": 2306} {"train_loss": -6.280271530151367, "global_step": 96867, "epoch": 2306} {"train_loss": -6.427515983581543, "global_step": 96868, "epoch": 2306} {"train_loss": -6.305252552032471, "global_step": 96869, "epoch": 2306} {"train_loss": -6.26062536239624, "global_step": 96870, "epoch": 2306} {"train_loss": -6.360884189605713, "global_step": 96871, "epoch": 2306} {"train_loss": -6.29848575592041, "global_step": 96872, "epoch": 2306} {"train_loss": -6.414420127868652, "global_step": 96873, "epoch": 2306} {"train_loss": -6.293142795562744, "global_step": 96874, "epoch": 2306} {"train_loss": -6.3804402351379395, "global_step": 96875, "epoch": 2306} {"train_loss": -6.3130998611450195, "global_step": 96876, "epoch": 2306} {"train_loss": -6.32095193862915, "global_step": 96877, "epoch": 2306} {"train_loss": -6.281822204589844, "global_step": 96878, "epoch": 2306} {"train_loss": -6.380760192871094, "global_step": 96879, "epoch": 2306} {"train_loss": -6.212118148803711, "global_step": 96880, "epoch": 2306} {"train_loss": -6.25987434387207, "global_step": 96881, "epoch": 2306} {"train_loss": -6.327889919281006, "global_step": 96882, "epoch": 2306} {"train_loss": -6.355009078979492, "global_step": 96883, "epoch": 2306} {"train_loss": -6.2988600730896, "global_step": 96884, "epoch": 2306} {"train_loss": -6.425924301147461, "global_step": 96885, "epoch": 2306} {"train_loss": -6.353765487670898, "global_step": 96886, "epoch": 2306} {"train_loss": -6.208712100982666, "global_step": 96887, "epoch": 2306} {"train_loss": -6.3036603927612305, "global_step": 96888, "epoch": 2306} {"train_loss": -6.293274402618408, "global_step": 96889, "epoch": 2306} {"train_loss": -6.3597917556762695, "global_step": 96890, "epoch": 2306} {"train_loss": -6.351927757263184, "global_step": 96891, "epoch": 2306} {"train_loss": -6.312695026397705, "global_step": 96892, "epoch": 2306} {"train_loss": -6.315882171903338, "global_step": 96893, "epoch": 2306, "val_loss": 67912.1484375} {"train_loss": -6.1863694190979, "global_step": 96894, "epoch": 2307} {"train_loss": -6.349083423614502, "global_step": 96895, "epoch": 2307} {"train_loss": -6.4008636474609375, "global_step": 96896, "epoch": 2307} {"train_loss": -6.223268985748291, "global_step": 96897, "epoch": 2307} {"train_loss": -6.363988876342773, "global_step": 96898, "epoch": 2307} {"train_loss": -6.288514137268066, "global_step": 96899, "epoch": 2307} {"train_loss": -6.367035865783691, "global_step": 96900, "epoch": 2307} {"train_loss": -6.412267684936523, "global_step": 96901, "epoch": 2307} {"train_loss": -6.257052898406982, "global_step": 96902, "epoch": 2307} {"train_loss": -6.236333847045898, "global_step": 96903, "epoch": 2307} {"train_loss": -6.402805328369141, "global_step": 96904, "epoch": 2307} {"train_loss": -6.414562225341797, "global_step": 96905, "epoch": 2307} {"train_loss": -6.362010955810547, "global_step": 96906, "epoch": 2307} {"train_loss": -6.324852466583252, "global_step": 96907, "epoch": 2307} {"train_loss": -6.258091926574707, "global_step": 96908, "epoch": 2307} {"train_loss": -6.23397159576416, "global_step": 96909, "epoch": 2307} {"train_loss": -6.384735107421875, "global_step": 96910, "epoch": 2307} {"train_loss": -6.278419017791748, "global_step": 96911, "epoch": 2307} {"train_loss": -6.35792350769043, "global_step": 96912, "epoch": 2307} {"train_loss": -6.325506210327148, "global_step": 96913, "epoch": 2307} {"train_loss": -6.315473556518555, "global_step": 96914, "epoch": 2307} {"train_loss": -6.288854598999023, "global_step": 96915, "epoch": 2307} {"train_loss": -6.237379550933838, "global_step": 96916, "epoch": 2307} {"train_loss": -6.367402076721191, "global_step": 96917, "epoch": 2307} {"train_loss": -6.431041240692139, "global_step": 96918, "epoch": 2307} {"train_loss": -6.317197799682617, "global_step": 96919, "epoch": 2307} {"train_loss": -6.267435550689697, "global_step": 96920, "epoch": 2307} {"train_loss": -6.443576812744141, "global_step": 96921, "epoch": 2307} {"train_loss": -6.227084159851074, "global_step": 96922, "epoch": 2307} {"train_loss": -6.193523406982422, "global_step": 96923, "epoch": 2307} {"train_loss": -6.264988899230957, "global_step": 96924, "epoch": 2307} {"train_loss": -6.259370803833008, "global_step": 96925, "epoch": 2307} {"train_loss": -6.295294284820557, "global_step": 96926, "epoch": 2307} {"train_loss": -6.2976837158203125, "global_step": 96927, "epoch": 2307} {"train_loss": -6.307117462158203, "global_step": 96928, "epoch": 2307} {"train_loss": -6.279689311981201, "global_step": 96929, "epoch": 2307} {"train_loss": -6.338573455810547, "global_step": 96930, "epoch": 2307} {"train_loss": -6.267908573150635, "global_step": 96931, "epoch": 2307} {"train_loss": -6.201958656311035, "global_step": 96932, "epoch": 2307} {"train_loss": -6.3888468742370605, "global_step": 96933, "epoch": 2307} {"train_loss": -6.22695255279541, "global_step": 96934, "epoch": 2307} {"train_loss": -6.307519231523786, "global_step": 96935, "epoch": 2307, "val_loss": 68106.046875} {"train_loss": -6.343181610107422, "global_step": 96936, "epoch": 2308} {"train_loss": -6.148186206817627, "global_step": 96937, "epoch": 2308} {"train_loss": -6.310880184173584, "global_step": 96938, "epoch": 2308} {"train_loss": -6.38437557220459, "global_step": 96939, "epoch": 2308} {"train_loss": -6.334526062011719, "global_step": 96940, "epoch": 2308} {"train_loss": -6.390254020690918, "global_step": 96941, "epoch": 2308} {"train_loss": -6.457296371459961, "global_step": 96942, "epoch": 2308} {"train_loss": -6.2044453620910645, "global_step": 96943, "epoch": 2308} {"train_loss": -6.444592475891113, "global_step": 96944, "epoch": 2308} {"train_loss": -6.42115592956543, "global_step": 96945, "epoch": 2308} {"train_loss": -6.341856002807617, "global_step": 96946, "epoch": 2308} {"train_loss": -6.340188503265381, "global_step": 96947, "epoch": 2308} {"train_loss": -6.282764434814453, "global_step": 96948, "epoch": 2308} {"train_loss": -6.247443675994873, "global_step": 96949, "epoch": 2308} {"train_loss": -6.3061604499816895, "global_step": 96950, "epoch": 2308} {"train_loss": -6.319624423980713, "global_step": 96951, "epoch": 2308} {"train_loss": -6.211443901062012, "global_step": 96952, "epoch": 2308} {"train_loss": -6.231895923614502, "global_step": 96953, "epoch": 2308} {"train_loss": -6.3295111656188965, "global_step": 96954, "epoch": 2308} {"train_loss": -6.315637588500977, "global_step": 96955, "epoch": 2308} {"train_loss": -6.331283092498779, "global_step": 96956, "epoch": 2308} {"train_loss": -6.375150680541992, "global_step": 96957, "epoch": 2308} {"train_loss": -6.360374450683594, "global_step": 96958, "epoch": 2308} {"train_loss": -6.376883029937744, "global_step": 96959, "epoch": 2308} {"train_loss": -6.293042182922363, "global_step": 96960, "epoch": 2308} {"train_loss": -6.321951866149902, "global_step": 96961, "epoch": 2308} {"train_loss": -6.381735801696777, "global_step": 96962, "epoch": 2308} {"train_loss": -6.298744201660156, "global_step": 96963, "epoch": 2308} {"train_loss": -6.435061931610107, "global_step": 96964, "epoch": 2308} {"train_loss": -6.371771812438965, "global_step": 96965, "epoch": 2308} {"train_loss": -6.491987228393555, "global_step": 96966, "epoch": 2308} {"train_loss": -6.319484710693359, "global_step": 96967, "epoch": 2308} {"train_loss": -6.389123916625977, "global_step": 96968, "epoch": 2308} {"train_loss": -6.32102108001709, "global_step": 96969, "epoch": 2308} {"train_loss": -6.349352836608887, "global_step": 96970, "epoch": 2308} {"train_loss": -6.334688663482666, "global_step": 96971, "epoch": 2308} {"train_loss": -6.243030071258545, "global_step": 96972, "epoch": 2308} {"train_loss": -6.312261581420898, "global_step": 96973, "epoch": 2308} {"train_loss": -6.259720802307129, "global_step": 96974, "epoch": 2308} {"train_loss": -6.216463088989258, "global_step": 96975, "epoch": 2308} {"train_loss": -6.306563377380371, "global_step": 96976, "epoch": 2308} {"train_loss": -6.326432205381847, "global_step": 96977, "epoch": 2308, "val_loss": 67904.65625} {"train_loss": -6.365164756774902, "global_step": 96978, "epoch": 2309} {"train_loss": -6.302492141723633, "global_step": 96979, "epoch": 2309} {"train_loss": -6.383386611938477, "global_step": 96980, "epoch": 2309} {"train_loss": -6.347343444824219, "global_step": 96981, "epoch": 2309} {"train_loss": -6.382957935333252, "global_step": 96982, "epoch": 2309} {"train_loss": -6.383352279663086, "global_step": 96983, "epoch": 2309} {"train_loss": -6.259336471557617, "global_step": 96984, "epoch": 2309} {"train_loss": -6.313495635986328, "global_step": 96985, "epoch": 2309} {"train_loss": -6.298711776733398, "global_step": 96986, "epoch": 2309} {"train_loss": -6.393230438232422, "global_step": 96987, "epoch": 2309} {"train_loss": -6.246901512145996, "global_step": 96988, "epoch": 2309} {"train_loss": -6.161527633666992, "global_step": 96989, "epoch": 2309} {"train_loss": -6.29550838470459, "global_step": 96990, "epoch": 2309} {"train_loss": -6.291101455688477, "global_step": 96991, "epoch": 2309} {"train_loss": -6.050020217895508, "global_step": 96992, "epoch": 2309} {"train_loss": -6.294511795043945, "global_step": 96993, "epoch": 2309} {"train_loss": -6.195150375366211, "global_step": 96994, "epoch": 2309} {"train_loss": -6.363827228546143, "global_step": 96995, "epoch": 2309} {"train_loss": -6.267361164093018, "global_step": 96996, "epoch": 2309} {"train_loss": -6.353155136108398, "global_step": 96997, "epoch": 2309} {"train_loss": -6.338710308074951, "global_step": 96998, "epoch": 2309} {"train_loss": -6.346478462219238, "global_step": 96999, "epoch": 2309} {"train_loss": -6.3590989112854, "global_step": 97000, "epoch": 2309} {"train_loss": -6.302117347717285, "global_step": 97001, "epoch": 2309} {"train_loss": -6.25042724609375, "global_step": 97002, "epoch": 2309} {"train_loss": -6.251894950866699, "global_step": 97003, "epoch": 2309} {"train_loss": -6.231065273284912, "global_step": 97004, "epoch": 2309} {"train_loss": -6.296688556671143, "global_step": 97005, "epoch": 2309} {"train_loss": -6.278457164764404, "global_step": 97006, "epoch": 2309} {"train_loss": -6.304836750030518, "global_step": 97007, "epoch": 2309} {"train_loss": -6.288732528686523, "global_step": 97008, "epoch": 2309} {"train_loss": -6.121707916259766, "global_step": 97009, "epoch": 2309} {"train_loss": -6.287830829620361, "global_step": 97010, "epoch": 2309} {"train_loss": -6.338593006134033, "global_step": 97011, "epoch": 2309} {"train_loss": -6.316842079162598, "global_step": 97012, "epoch": 2309} {"train_loss": -6.248128890991211, "global_step": 97013, "epoch": 2309} {"train_loss": -6.3396453857421875, "global_step": 97014, "epoch": 2309} {"train_loss": -6.287958145141602, "global_step": 97015, "epoch": 2309} {"train_loss": -6.181937217712402, "global_step": 97016, "epoch": 2309} {"train_loss": -6.387325286865234, "global_step": 97017, "epoch": 2309} {"train_loss": -6.142140865325928, "global_step": 97018, "epoch": 2309} {"train_loss": -6.28680682182312, "global_step": 97019, "epoch": 2309, "val_loss": 68105.59375} {"train_loss": -6.290149688720703, "global_step": 97020, "epoch": 2310} {"train_loss": -6.321078300476074, "global_step": 97021, "epoch": 2310} {"train_loss": -6.226931095123291, "global_step": 97022, "epoch": 2310} {"train_loss": -6.262184143066406, "global_step": 97023, "epoch": 2310} {"train_loss": -6.227588653564453, "global_step": 97024, "epoch": 2310} {"train_loss": -6.268980979919434, "global_step": 97025, "epoch": 2310} {"train_loss": -6.2637200355529785, "global_step": 97026, "epoch": 2310} {"train_loss": -6.325221061706543, "global_step": 97027, "epoch": 2310} {"train_loss": -6.258288860321045, "global_step": 97028, "epoch": 2310} {"train_loss": -6.391470909118652, "global_step": 97029, "epoch": 2310} {"train_loss": -6.296992301940918, "global_step": 97030, "epoch": 2310} {"train_loss": -6.34854793548584, "global_step": 97031, "epoch": 2310} {"train_loss": -6.450503349304199, "global_step": 97032, "epoch": 2310} {"train_loss": -6.347582817077637, "global_step": 97033, "epoch": 2310} {"train_loss": -6.304068565368652, "global_step": 97034, "epoch": 2310} {"train_loss": -6.262957572937012, "global_step": 97035, "epoch": 2310} {"train_loss": -6.179679870605469, "global_step": 97036, "epoch": 2310} {"train_loss": -6.349656105041504, "global_step": 97037, "epoch": 2310} {"train_loss": -6.479665756225586, "global_step": 97038, "epoch": 2310} {"train_loss": -6.317464828491211, "global_step": 97039, "epoch": 2310} {"train_loss": -6.39999532699585, "global_step": 97040, "epoch": 2310} {"train_loss": -6.204829216003418, "global_step": 97041, "epoch": 2310} {"train_loss": -6.242213249206543, "global_step": 97042, "epoch": 2310} {"train_loss": -6.291838645935059, "global_step": 97043, "epoch": 2310} {"train_loss": -6.321889400482178, "global_step": 97044, "epoch": 2310} {"train_loss": -6.351953506469727, "global_step": 97045, "epoch": 2310} {"train_loss": -6.234015464782715, "global_step": 97046, "epoch": 2310} {"train_loss": -6.295600414276123, "global_step": 97047, "epoch": 2310} {"train_loss": -6.399461269378662, "global_step": 97048, "epoch": 2310} {"train_loss": -6.3846964836120605, "global_step": 97049, "epoch": 2310} {"train_loss": -6.321991920471191, "global_step": 97050, "epoch": 2310} {"train_loss": -6.329135894775391, "global_step": 97051, "epoch": 2310} {"train_loss": -6.3402910232543945, "global_step": 97052, "epoch": 2310} {"train_loss": -6.281989574432373, "global_step": 97053, "epoch": 2310} {"train_loss": -6.2486796379089355, "global_step": 97054, "epoch": 2310} {"train_loss": -6.358380317687988, "global_step": 97055, "epoch": 2310} {"train_loss": -6.343411445617676, "global_step": 97056, "epoch": 2310} {"train_loss": -6.321980953216553, "global_step": 97057, "epoch": 2310} {"train_loss": -6.246407985687256, "global_step": 97058, "epoch": 2310} {"train_loss": -6.184652328491211, "global_step": 97059, "epoch": 2310} {"train_loss": -6.192895412445068, "global_step": 97060, "epoch": 2310} {"train_loss": -6.299990824290684, "global_step": 97061, "epoch": 2310, "val_loss": 68023.5703125} {"train_loss": -6.317495346069336, "global_step": 97062, "epoch": 2311} {"train_loss": -6.1645708084106445, "global_step": 97063, "epoch": 2311} {"train_loss": -6.136498928070068, "global_step": 97064, "epoch": 2311} {"train_loss": -6.273397445678711, "global_step": 97065, "epoch": 2311} {"train_loss": -6.086077690124512, "global_step": 97066, "epoch": 2311} {"train_loss": -6.333612442016602, "global_step": 97067, "epoch": 2311} {"train_loss": -6.163179397583008, "global_step": 97068, "epoch": 2311} {"train_loss": -6.195321559906006, "global_step": 97069, "epoch": 2311} {"train_loss": -6.34560489654541, "global_step": 97070, "epoch": 2311} {"train_loss": -6.043573379516602, "global_step": 97071, "epoch": 2311} {"train_loss": -6.26305627822876, "global_step": 97072, "epoch": 2311} {"train_loss": -6.130224227905273, "global_step": 97073, "epoch": 2311} {"train_loss": -6.323075294494629, "global_step": 97074, "epoch": 2311} {"train_loss": -6.193253517150879, "global_step": 97075, "epoch": 2311} {"train_loss": -6.2168989181518555, "global_step": 97076, "epoch": 2311} {"train_loss": -6.1456193923950195, "global_step": 97077, "epoch": 2311} {"train_loss": -6.274491310119629, "global_step": 97078, "epoch": 2311} {"train_loss": -5.992177963256836, "global_step": 97079, "epoch": 2311} {"train_loss": -6.371796607971191, "global_step": 97080, "epoch": 2311} {"train_loss": -6.20915412902832, "global_step": 97081, "epoch": 2311} {"train_loss": -6.116789817810059, "global_step": 97082, "epoch": 2311} {"train_loss": -6.1595659255981445, "global_step": 97083, "epoch": 2311} {"train_loss": -6.218255996704102, "global_step": 97084, "epoch": 2311} {"train_loss": -6.20832633972168, "global_step": 97085, "epoch": 2311} {"train_loss": -6.356627464294434, "global_step": 97086, "epoch": 2311} {"train_loss": -6.301417827606201, "global_step": 97087, "epoch": 2311} {"train_loss": -6.358014106750488, "global_step": 97088, "epoch": 2311} {"train_loss": -6.234674453735352, "global_step": 97089, "epoch": 2311} {"train_loss": -6.223537445068359, "global_step": 97090, "epoch": 2311} {"train_loss": -6.335327625274658, "global_step": 97091, "epoch": 2311} {"train_loss": -6.284027099609375, "global_step": 97092, "epoch": 2311} {"train_loss": -6.273734092712402, "global_step": 97093, "epoch": 2311} {"train_loss": -6.358799934387207, "global_step": 97094, "epoch": 2311} {"train_loss": -6.280774116516113, "global_step": 97095, "epoch": 2311} {"train_loss": -6.407907962799072, "global_step": 97096, "epoch": 2311} {"train_loss": -6.3603515625, "global_step": 97097, "epoch": 2311} {"train_loss": -6.361577987670898, "global_step": 97098, "epoch": 2311} {"train_loss": -6.327169418334961, "global_step": 97099, "epoch": 2311} {"train_loss": -6.243023872375488, "global_step": 97100, "epoch": 2311} {"train_loss": -6.359200477600098, "global_step": 97101, "epoch": 2311} {"train_loss": -6.244868755340576, "global_step": 97102, "epoch": 2311} {"train_loss": -6.247650566555205, "global_step": 97103, "epoch": 2311, "val_loss": 67920.5625} {"train_loss": -6.295505523681641, "global_step": 97104, "epoch": 2312} {"train_loss": -6.305179595947266, "global_step": 97105, "epoch": 2312} {"train_loss": -6.398407936096191, "global_step": 97106, "epoch": 2312} {"train_loss": -6.388636589050293, "global_step": 97107, "epoch": 2312} {"train_loss": -6.352133274078369, "global_step": 97108, "epoch": 2312} {"train_loss": -6.346988677978516, "global_step": 97109, "epoch": 2312} {"train_loss": -6.295393466949463, "global_step": 97110, "epoch": 2312} {"train_loss": -6.396300315856934, "global_step": 97111, "epoch": 2312} {"train_loss": -6.434704780578613, "global_step": 97112, "epoch": 2312} {"train_loss": -6.446423053741455, "global_step": 97113, "epoch": 2312} {"train_loss": -6.315691947937012, "global_step": 97114, "epoch": 2312} {"train_loss": -6.374594688415527, "global_step": 97115, "epoch": 2312} {"train_loss": -6.232555389404297, "global_step": 97116, "epoch": 2312} {"train_loss": -6.344986915588379, "global_step": 97117, "epoch": 2312} {"train_loss": -6.284327507019043, "global_step": 97118, "epoch": 2312} {"train_loss": -6.180187225341797, "global_step": 97119, "epoch": 2312} {"train_loss": -6.331897258758545, "global_step": 97120, "epoch": 2312} {"train_loss": -6.35401725769043, "global_step": 97121, "epoch": 2312} {"train_loss": -6.200362682342529, "global_step": 97122, "epoch": 2312} {"train_loss": -6.319400787353516, "global_step": 97123, "epoch": 2312} {"train_loss": -6.308434009552002, "global_step": 97124, "epoch": 2312} {"train_loss": -6.2136993408203125, "global_step": 97125, "epoch": 2312} {"train_loss": -6.359206676483154, "global_step": 97126, "epoch": 2312} {"train_loss": -6.335970878601074, "global_step": 97127, "epoch": 2312} {"train_loss": -6.290780067443848, "global_step": 97128, "epoch": 2312} {"train_loss": -6.171414375305176, "global_step": 97129, "epoch": 2312} {"train_loss": -6.28752326965332, "global_step": 97130, "epoch": 2312} {"train_loss": -6.326938629150391, "global_step": 97131, "epoch": 2312} {"train_loss": -6.481969356536865, "global_step": 97132, "epoch": 2312} {"train_loss": -6.294395446777344, "global_step": 97133, "epoch": 2312} {"train_loss": -6.247215747833252, "global_step": 97134, "epoch": 2312} {"train_loss": -6.401675224304199, "global_step": 97135, "epoch": 2312} {"train_loss": -6.336730003356934, "global_step": 97136, "epoch": 2312} {"train_loss": -6.264385223388672, "global_step": 97137, "epoch": 2312} {"train_loss": -6.2820634841918945, "global_step": 97138, "epoch": 2312} {"train_loss": -6.382547855377197, "global_step": 97139, "epoch": 2312} {"train_loss": -6.298151016235352, "global_step": 97140, "epoch": 2312} {"train_loss": -6.400534629821777, "global_step": 97141, "epoch": 2312} {"train_loss": -6.308199882507324, "global_step": 97142, "epoch": 2312} {"train_loss": -6.463014602661133, "global_step": 97143, "epoch": 2312} {"train_loss": -6.3167829513549805, "global_step": 97144, "epoch": 2312} {"train_loss": -6.325104463668096, "global_step": 97145, "epoch": 2312, "val_loss": 67963.875} {"train_loss": -6.237729549407959, "global_step": 97146, "epoch": 2313} {"train_loss": -6.404680252075195, "global_step": 97147, "epoch": 2313} {"train_loss": -6.349037170410156, "global_step": 97148, "epoch": 2313} {"train_loss": -6.242384910583496, "global_step": 97149, "epoch": 2313} {"train_loss": -6.349084377288818, "global_step": 97150, "epoch": 2313} {"train_loss": -6.286755084991455, "global_step": 97151, "epoch": 2313} {"train_loss": -6.142171382904053, "global_step": 97152, "epoch": 2313} {"train_loss": -6.241705417633057, "global_step": 97153, "epoch": 2313} {"train_loss": -6.287710189819336, "global_step": 97154, "epoch": 2313} {"train_loss": -6.2793097496032715, "global_step": 97155, "epoch": 2313} {"train_loss": -6.391627788543701, "global_step": 97156, "epoch": 2313} {"train_loss": -6.369731903076172, "global_step": 97157, "epoch": 2313} {"train_loss": -6.387825012207031, "global_step": 97158, "epoch": 2313} {"train_loss": -6.331136703491211, "global_step": 97159, "epoch": 2313} {"train_loss": -6.282948017120361, "global_step": 97160, "epoch": 2313} {"train_loss": -6.319362163543701, "global_step": 97161, "epoch": 2313} {"train_loss": -6.3251543045043945, "global_step": 97162, "epoch": 2313} {"train_loss": -6.3017706871032715, "global_step": 97163, "epoch": 2313} {"train_loss": -6.193462371826172, "global_step": 97164, "epoch": 2313} {"train_loss": -6.288818359375, "global_step": 97165, "epoch": 2313} {"train_loss": -6.299871444702148, "global_step": 97166, "epoch": 2313} {"train_loss": -6.379724502563477, "global_step": 97167, "epoch": 2313} {"train_loss": -6.33444881439209, "global_step": 97168, "epoch": 2313} {"train_loss": -6.344242095947266, "global_step": 97169, "epoch": 2313} {"train_loss": -6.256259918212891, "global_step": 97170, "epoch": 2313} {"train_loss": -6.286021709442139, "global_step": 97171, "epoch": 2313} {"train_loss": -6.391118049621582, "global_step": 97172, "epoch": 2313} {"train_loss": -6.364923477172852, "global_step": 97173, "epoch": 2313} {"train_loss": -6.302733421325684, "global_step": 97174, "epoch": 2313} {"train_loss": -6.301497459411621, "global_step": 97175, "epoch": 2313} {"train_loss": -6.310254096984863, "global_step": 97176, "epoch": 2313} {"train_loss": -6.342120170593262, "global_step": 97177, "epoch": 2313} {"train_loss": -6.339014053344727, "global_step": 97178, "epoch": 2313} {"train_loss": -6.316870212554932, "global_step": 97179, "epoch": 2313} {"train_loss": -6.294283866882324, "global_step": 97180, "epoch": 2313} {"train_loss": -6.331503868103027, "global_step": 97181, "epoch": 2313} {"train_loss": -6.185592174530029, "global_step": 97182, "epoch": 2313} {"train_loss": -6.275234222412109, "global_step": 97183, "epoch": 2313} {"train_loss": -6.286694049835205, "global_step": 97184, "epoch": 2313} {"train_loss": -6.232744216918945, "global_step": 97185, "epoch": 2313} {"train_loss": -6.299722671508789, "global_step": 97186, "epoch": 2313} {"train_loss": -6.305773610160465, "global_step": 97187, "epoch": 2313, "val_loss": 68235.21875} {"train_loss": -6.270681381225586, "global_step": 97188, "epoch": 2314} {"train_loss": -6.421995639801025, "global_step": 97189, "epoch": 2314} {"train_loss": -6.205282211303711, "global_step": 97190, "epoch": 2314} {"train_loss": -6.109683036804199, "global_step": 97191, "epoch": 2314} {"train_loss": -6.319866180419922, "global_step": 97192, "epoch": 2314} {"train_loss": -6.204140663146973, "global_step": 97193, "epoch": 2314} {"train_loss": -6.272805690765381, "global_step": 97194, "epoch": 2314} {"train_loss": -6.241119861602783, "global_step": 97195, "epoch": 2314} {"train_loss": -6.331731796264648, "global_step": 97196, "epoch": 2314} {"train_loss": -6.308050632476807, "global_step": 97197, "epoch": 2314} {"train_loss": -6.292264461517334, "global_step": 97198, "epoch": 2314} {"train_loss": -6.299284934997559, "global_step": 97199, "epoch": 2314} {"train_loss": -6.215961456298828, "global_step": 97200, "epoch": 2314} {"train_loss": -6.1874518394470215, "global_step": 97201, "epoch": 2314} {"train_loss": -6.188037872314453, "global_step": 97202, "epoch": 2314} {"train_loss": -6.304786682128906, "global_step": 97203, "epoch": 2314} {"train_loss": -6.34206485748291, "global_step": 97204, "epoch": 2314} {"train_loss": -6.351800918579102, "global_step": 97205, "epoch": 2314} {"train_loss": -6.324469089508057, "global_step": 97206, "epoch": 2314} {"train_loss": -6.261073112487793, "global_step": 97207, "epoch": 2314} {"train_loss": -6.227330207824707, "global_step": 97208, "epoch": 2314} {"train_loss": -6.3338422775268555, "global_step": 97209, "epoch": 2314} {"train_loss": -6.359062194824219, "global_step": 97210, "epoch": 2314} {"train_loss": -6.208011627197266, "global_step": 97211, "epoch": 2314} {"train_loss": -6.283090591430664, "global_step": 97212, "epoch": 2314} {"train_loss": -6.300655841827393, "global_step": 97213, "epoch": 2314} {"train_loss": -6.2137651443481445, "global_step": 97214, "epoch": 2314} {"train_loss": -6.3312811851501465, "global_step": 97215, "epoch": 2314} {"train_loss": -6.21162223815918, "global_step": 97216, "epoch": 2314} {"train_loss": -6.312816619873047, "global_step": 97217, "epoch": 2314} {"train_loss": -6.4809346199035645, "global_step": 97218, "epoch": 2314} {"train_loss": -6.282282829284668, "global_step": 97219, "epoch": 2314} {"train_loss": -6.297178268432617, "global_step": 97220, "epoch": 2314} {"train_loss": -6.162026405334473, "global_step": 97221, "epoch": 2314} {"train_loss": -6.328310966491699, "global_step": 97222, "epoch": 2314} {"train_loss": -6.2654571533203125, "global_step": 97223, "epoch": 2314} {"train_loss": -6.308647155761719, "global_step": 97224, "epoch": 2314} {"train_loss": -6.178476333618164, "global_step": 97225, "epoch": 2314} {"train_loss": -6.356025695800781, "global_step": 97226, "epoch": 2314} {"train_loss": -6.212128639221191, "global_step": 97227, "epoch": 2314} {"train_loss": -6.269044399261475, "global_step": 97228, "epoch": 2314} {"train_loss": -6.277318579810006, "global_step": 97229, "epoch": 2314, "val_loss": 68334.2890625} {"train_loss": -6.321065902709961, "global_step": 97230, "epoch": 2315} {"train_loss": -6.3043532371521, "global_step": 97231, "epoch": 2315} {"train_loss": -6.2467360496521, "global_step": 97232, "epoch": 2315} {"train_loss": -6.185100555419922, "global_step": 97233, "epoch": 2315} {"train_loss": -6.2940216064453125, "global_step": 97234, "epoch": 2315} {"train_loss": -6.233554840087891, "global_step": 97235, "epoch": 2315} {"train_loss": -6.413520812988281, "global_step": 97236, "epoch": 2315} {"train_loss": -6.420212745666504, "global_step": 97237, "epoch": 2315} {"train_loss": -6.311689853668213, "global_step": 97238, "epoch": 2315} {"train_loss": -6.384927749633789, "global_step": 97239, "epoch": 2315} {"train_loss": -6.384467124938965, "global_step": 97240, "epoch": 2315} {"train_loss": -6.205112934112549, "global_step": 97241, "epoch": 2315} {"train_loss": -6.4233856201171875, "global_step": 97242, "epoch": 2315} {"train_loss": -6.169858932495117, "global_step": 97243, "epoch": 2315} {"train_loss": -6.158735752105713, "global_step": 97244, "epoch": 2315} {"train_loss": -6.227612018585205, "global_step": 97245, "epoch": 2315} {"train_loss": -6.400757789611816, "global_step": 97246, "epoch": 2315} {"train_loss": -6.261407375335693, "global_step": 97247, "epoch": 2315} {"train_loss": -6.214988708496094, "global_step": 97248, "epoch": 2315} {"train_loss": -6.3713483810424805, "global_step": 97249, "epoch": 2315} {"train_loss": -6.211369514465332, "global_step": 97250, "epoch": 2315} {"train_loss": -6.323847770690918, "global_step": 97251, "epoch": 2315} {"train_loss": -6.225943565368652, "global_step": 97252, "epoch": 2315} {"train_loss": -6.324551582336426, "global_step": 97253, "epoch": 2315} {"train_loss": -6.30042028427124, "global_step": 97254, "epoch": 2315} {"train_loss": -6.244829177856445, "global_step": 97255, "epoch": 2315} {"train_loss": -6.374293327331543, "global_step": 97256, "epoch": 2315} {"train_loss": -6.1925506591796875, "global_step": 97257, "epoch": 2315} {"train_loss": -6.2897162437438965, "global_step": 97258, "epoch": 2315} {"train_loss": -6.248998641967773, "global_step": 97259, "epoch": 2315} {"train_loss": -6.298779487609863, "global_step": 97260, "epoch": 2315} {"train_loss": -6.325839042663574, "global_step": 97261, "epoch": 2315} {"train_loss": -6.314672946929932, "global_step": 97262, "epoch": 2315} {"train_loss": -6.318197250366211, "global_step": 97263, "epoch": 2315} {"train_loss": -6.239889144897461, "global_step": 97264, "epoch": 2315} {"train_loss": -6.330588340759277, "global_step": 97265, "epoch": 2315} {"train_loss": -6.390344619750977, "global_step": 97266, "epoch": 2315} {"train_loss": -6.270663261413574, "global_step": 97267, "epoch": 2315} {"train_loss": -6.379177093505859, "global_step": 97268, "epoch": 2315} {"train_loss": -6.400641918182373, "global_step": 97269, "epoch": 2315} {"train_loss": -6.315877914428711, "global_step": 97270, "epoch": 2315} {"train_loss": -6.296660502751668, "global_step": 97271, "epoch": 2315, "val_loss": 67962.125} {"train_loss": -6.365570068359375, "global_step": 97272, "epoch": 2316} {"train_loss": -6.355510711669922, "global_step": 97273, "epoch": 2316} {"train_loss": -6.307559967041016, "global_step": 97274, "epoch": 2316} {"train_loss": -6.327816009521484, "global_step": 97275, "epoch": 2316} {"train_loss": -6.35546875, "global_step": 97276, "epoch": 2316} {"train_loss": -6.254386901855469, "global_step": 97277, "epoch": 2316} {"train_loss": -6.269426345825195, "global_step": 97278, "epoch": 2316} {"train_loss": -6.389161586761475, "global_step": 97279, "epoch": 2316} {"train_loss": -6.3018717765808105, "global_step": 97280, "epoch": 2316} {"train_loss": -6.195849418640137, "global_step": 97281, "epoch": 2316} {"train_loss": -6.293666839599609, "global_step": 97282, "epoch": 2316} {"train_loss": -6.2785210609436035, "global_step": 97283, "epoch": 2316} {"train_loss": -6.400275230407715, "global_step": 97284, "epoch": 2316} {"train_loss": -6.3252081871032715, "global_step": 97285, "epoch": 2316} {"train_loss": -6.369100570678711, "global_step": 97286, "epoch": 2316} {"train_loss": -6.324695587158203, "global_step": 97287, "epoch": 2316} {"train_loss": -6.231794834136963, "global_step": 97288, "epoch": 2316} {"train_loss": -6.318215370178223, "global_step": 97289, "epoch": 2316} {"train_loss": -6.304698944091797, "global_step": 97290, "epoch": 2316} {"train_loss": -6.352794170379639, "global_step": 97291, "epoch": 2316} {"train_loss": -6.340550899505615, "global_step": 97292, "epoch": 2316} {"train_loss": -6.327069282531738, "global_step": 97293, "epoch": 2316} {"train_loss": -6.371903896331787, "global_step": 97294, "epoch": 2316} {"train_loss": -6.316064357757568, "global_step": 97295, "epoch": 2316} {"train_loss": -6.260097980499268, "global_step": 97296, "epoch": 2316} {"train_loss": -6.309013366699219, "global_step": 97297, "epoch": 2316} {"train_loss": -6.3426971435546875, "global_step": 97298, "epoch": 2316} {"train_loss": -6.344208240509033, "global_step": 97299, "epoch": 2316} {"train_loss": -6.222774505615234, "global_step": 97300, "epoch": 2316} {"train_loss": -6.41878604888916, "global_step": 97301, "epoch": 2316} {"train_loss": -6.4028849601745605, "global_step": 97302, "epoch": 2316} {"train_loss": -6.367976665496826, "global_step": 97303, "epoch": 2316} {"train_loss": -6.316079616546631, "global_step": 97304, "epoch": 2316} {"train_loss": -6.4223480224609375, "global_step": 97305, "epoch": 2316} {"train_loss": -6.236961841583252, "global_step": 97306, "epoch": 2316} {"train_loss": -6.339170455932617, "global_step": 97307, "epoch": 2316} {"train_loss": -6.415555000305176, "global_step": 97308, "epoch": 2316} {"train_loss": -6.201423168182373, "global_step": 97309, "epoch": 2316} {"train_loss": -6.455322265625, "global_step": 97310, "epoch": 2316} {"train_loss": -6.305502891540527, "global_step": 97311, "epoch": 2316} {"train_loss": -6.320706844329834, "global_step": 97312, "epoch": 2316} {"train_loss": -6.328953811100551, "global_step": 97313, "epoch": 2316, "val_loss": 67908.984375} {"train_loss": -6.394163131713867, "global_step": 97314, "epoch": 2317} {"train_loss": -6.304793357849121, "global_step": 97315, "epoch": 2317} {"train_loss": -6.26271915435791, "global_step": 97316, "epoch": 2317} {"train_loss": -6.426371097564697, "global_step": 97317, "epoch": 2317} {"train_loss": -6.3147125244140625, "global_step": 97318, "epoch": 2317} {"train_loss": -6.3203816413879395, "global_step": 97319, "epoch": 2317} {"train_loss": -6.369630813598633, "global_step": 97320, "epoch": 2317} {"train_loss": -6.342069149017334, "global_step": 97321, "epoch": 2317} {"train_loss": -6.339136123657227, "global_step": 97322, "epoch": 2317} {"train_loss": -6.278092384338379, "global_step": 97323, "epoch": 2317} {"train_loss": -6.275842666625977, "global_step": 97324, "epoch": 2317} {"train_loss": -6.454980850219727, "global_step": 97325, "epoch": 2317} {"train_loss": -6.392714977264404, "global_step": 97326, "epoch": 2317} {"train_loss": -6.385647773742676, "global_step": 97327, "epoch": 2317} {"train_loss": -6.282122611999512, "global_step": 97328, "epoch": 2317} {"train_loss": -6.351661682128906, "global_step": 97329, "epoch": 2317} {"train_loss": -6.338027477264404, "global_step": 97330, "epoch": 2317} {"train_loss": -6.306236743927002, "global_step": 97331, "epoch": 2317} {"train_loss": -6.285320281982422, "global_step": 97332, "epoch": 2317} {"train_loss": -6.3551926612854, "global_step": 97333, "epoch": 2317} {"train_loss": -6.278322219848633, "global_step": 97334, "epoch": 2317} {"train_loss": -6.468777656555176, "global_step": 97335, "epoch": 2317} {"train_loss": -6.17723274230957, "global_step": 97336, "epoch": 2317} {"train_loss": -6.378881931304932, "global_step": 97337, "epoch": 2317} {"train_loss": -6.310619354248047, "global_step": 97338, "epoch": 2317} {"train_loss": -6.25623893737793, "global_step": 97339, "epoch": 2317} {"train_loss": -6.2034196853637695, "global_step": 97340, "epoch": 2317} {"train_loss": -6.226459503173828, "global_step": 97341, "epoch": 2317} {"train_loss": -6.350236415863037, "global_step": 97342, "epoch": 2317} {"train_loss": -6.276407241821289, "global_step": 97343, "epoch": 2317} {"train_loss": -6.225812911987305, "global_step": 97344, "epoch": 2317} {"train_loss": -6.3061604499816895, "global_step": 97345, "epoch": 2317} {"train_loss": -6.302030563354492, "global_step": 97346, "epoch": 2317} {"train_loss": -6.3431925773620605, "global_step": 97347, "epoch": 2317} {"train_loss": -6.233189582824707, "global_step": 97348, "epoch": 2317} {"train_loss": -6.22274923324585, "global_step": 97349, "epoch": 2317} {"train_loss": -6.436678886413574, "global_step": 97350, "epoch": 2317} {"train_loss": -6.213382720947266, "global_step": 97351, "epoch": 2317} {"train_loss": -6.26572322845459, "global_step": 97352, "epoch": 2317} {"train_loss": -6.229077339172363, "global_step": 97353, "epoch": 2317} {"train_loss": -6.186321258544922, "global_step": 97354, "epoch": 2317} {"train_loss": -6.306078195571899, "global_step": 97355, "epoch": 2317, "val_loss": 67736.3671875} {"train_loss": -6.350900650024414, "global_step": 97356, "epoch": 2318} {"train_loss": -6.269998073577881, "global_step": 97357, "epoch": 2318} {"train_loss": -6.349849700927734, "global_step": 97358, "epoch": 2318} {"train_loss": -6.227145195007324, "global_step": 97359, "epoch": 2318} {"train_loss": -6.309235572814941, "global_step": 97360, "epoch": 2318} {"train_loss": -6.280800819396973, "global_step": 97361, "epoch": 2318} {"train_loss": -6.321746826171875, "global_step": 97362, "epoch": 2318} {"train_loss": -6.424742698669434, "global_step": 97363, "epoch": 2318} {"train_loss": -6.384538650512695, "global_step": 97364, "epoch": 2318} {"train_loss": -6.359112739562988, "global_step": 97365, "epoch": 2318} {"train_loss": -6.332156181335449, "global_step": 97366, "epoch": 2318} {"train_loss": -6.322988986968994, "global_step": 97367, "epoch": 2318} {"train_loss": -6.3696417808532715, "global_step": 97368, "epoch": 2318} {"train_loss": -6.274735450744629, "global_step": 97369, "epoch": 2318} {"train_loss": -6.315199851989746, "global_step": 97370, "epoch": 2318} {"train_loss": -6.29822301864624, "global_step": 97371, "epoch": 2318} {"train_loss": -6.249459266662598, "global_step": 97372, "epoch": 2318} {"train_loss": -6.221798896789551, "global_step": 97373, "epoch": 2318} {"train_loss": -6.348977565765381, "global_step": 97374, "epoch": 2318} {"train_loss": -6.339060306549072, "global_step": 97375, "epoch": 2318} {"train_loss": -6.405245780944824, "global_step": 97376, "epoch": 2318} {"train_loss": -6.308568477630615, "global_step": 97377, "epoch": 2318} {"train_loss": -6.226617813110352, "global_step": 97378, "epoch": 2318} {"train_loss": -6.283936023712158, "global_step": 97379, "epoch": 2318} {"train_loss": -6.3414483070373535, "global_step": 97380, "epoch": 2318} {"train_loss": -6.416512966156006, "global_step": 97381, "epoch": 2318} {"train_loss": -6.230050086975098, "global_step": 97382, "epoch": 2318} {"train_loss": -6.535102844238281, "global_step": 97383, "epoch": 2318} {"train_loss": -6.364914894104004, "global_step": 97384, "epoch": 2318} {"train_loss": -6.311958312988281, "global_step": 97385, "epoch": 2318} {"train_loss": -6.294494152069092, "global_step": 97386, "epoch": 2318} {"train_loss": -6.328125, "global_step": 97387, "epoch": 2318} {"train_loss": -6.316451072692871, "global_step": 97388, "epoch": 2318} {"train_loss": -6.3839311599731445, "global_step": 97389, "epoch": 2318} {"train_loss": -6.348799705505371, "global_step": 97390, "epoch": 2318} {"train_loss": -6.236740589141846, "global_step": 97391, "epoch": 2318} {"train_loss": -6.292229175567627, "global_step": 97392, "epoch": 2318} {"train_loss": -6.250107765197754, "global_step": 97393, "epoch": 2318} {"train_loss": -6.42814826965332, "global_step": 97394, "epoch": 2318} {"train_loss": -6.193589210510254, "global_step": 97395, "epoch": 2318} {"train_loss": -6.231760025024414, "global_step": 97396, "epoch": 2318} {"train_loss": -6.3186947618212015, "global_step": 97397, "epoch": 2318, "val_loss": 68178.9921875} {"train_loss": -6.204672813415527, "global_step": 97398, "epoch": 2319} {"train_loss": -6.353710174560547, "global_step": 97399, "epoch": 2319} {"train_loss": -6.173440456390381, "global_step": 97400, "epoch": 2319} {"train_loss": -6.166186332702637, "global_step": 97401, "epoch": 2319} {"train_loss": -6.348355293273926, "global_step": 97402, "epoch": 2319} {"train_loss": -6.282729148864746, "global_step": 97403, "epoch": 2319} {"train_loss": -6.252039909362793, "global_step": 97404, "epoch": 2319} {"train_loss": -6.381652355194092, "global_step": 97405, "epoch": 2319} {"train_loss": -6.2679853439331055, "global_step": 97406, "epoch": 2319} {"train_loss": -6.457508087158203, "global_step": 97407, "epoch": 2319} {"train_loss": -6.252192497253418, "global_step": 97408, "epoch": 2319} {"train_loss": -6.4375, "global_step": 97409, "epoch": 2319} {"train_loss": -6.393204212188721, "global_step": 97410, "epoch": 2319} {"train_loss": -6.3041090965271, "global_step": 97411, "epoch": 2319} {"train_loss": -6.421489715576172, "global_step": 97412, "epoch": 2319} {"train_loss": -6.41757869720459, "global_step": 97413, "epoch": 2319} {"train_loss": -6.352916240692139, "global_step": 97414, "epoch": 2319} {"train_loss": -6.3495001792907715, "global_step": 97415, "epoch": 2319} {"train_loss": -6.312753200531006, "global_step": 97416, "epoch": 2319} {"train_loss": -6.314947605133057, "global_step": 97417, "epoch": 2319} {"train_loss": -6.25557804107666, "global_step": 97418, "epoch": 2319} {"train_loss": -6.304620742797852, "global_step": 97419, "epoch": 2319} {"train_loss": -6.304810523986816, "global_step": 97420, "epoch": 2319} {"train_loss": -6.265179634094238, "global_step": 97421, "epoch": 2319} {"train_loss": -6.23605489730835, "global_step": 97422, "epoch": 2319} {"train_loss": -6.281479835510254, "global_step": 97423, "epoch": 2319} {"train_loss": -6.091442584991455, "global_step": 97424, "epoch": 2319} {"train_loss": -6.237884521484375, "global_step": 97425, "epoch": 2319} {"train_loss": -6.258796691894531, "global_step": 97426, "epoch": 2319} {"train_loss": -6.197775840759277, "global_step": 97427, "epoch": 2319} {"train_loss": -6.321743488311768, "global_step": 97428, "epoch": 2319} {"train_loss": -6.12813138961792, "global_step": 97429, "epoch": 2319} {"train_loss": -6.22782564163208, "global_step": 97430, "epoch": 2319} {"train_loss": -6.177121162414551, "global_step": 97431, "epoch": 2319} {"train_loss": -6.2432637214660645, "global_step": 97432, "epoch": 2319} {"train_loss": -6.310796737670898, "global_step": 97433, "epoch": 2319} {"train_loss": -6.356400012969971, "global_step": 97434, "epoch": 2319} {"train_loss": -6.226893424987793, "global_step": 97435, "epoch": 2319} {"train_loss": -6.347742080688477, "global_step": 97436, "epoch": 2319} {"train_loss": -6.3671159744262695, "global_step": 97437, "epoch": 2319} {"train_loss": -6.211207866668701, "global_step": 97438, "epoch": 2319} {"train_loss": -6.288797367186773, "global_step": 97439, "epoch": 2319, "val_loss": 68070.4140625} {"train_loss": -6.157599449157715, "global_step": 97440, "epoch": 2320} {"train_loss": -6.2699737548828125, "global_step": 97441, "epoch": 2320} {"train_loss": -6.304145812988281, "global_step": 97442, "epoch": 2320} {"train_loss": -6.321733474731445, "global_step": 97443, "epoch": 2320} {"train_loss": -6.44992733001709, "global_step": 97444, "epoch": 2320} {"train_loss": -6.356858253479004, "global_step": 97445, "epoch": 2320} {"train_loss": -6.281431198120117, "global_step": 97446, "epoch": 2320} {"train_loss": -6.305449485778809, "global_step": 97447, "epoch": 2320} {"train_loss": -6.243579864501953, "global_step": 97448, "epoch": 2320} {"train_loss": -6.251881122589111, "global_step": 97449, "epoch": 2320} {"train_loss": -6.267794132232666, "global_step": 97450, "epoch": 2320} {"train_loss": -6.3038649559021, "global_step": 97451, "epoch": 2320} {"train_loss": -6.310145378112793, "global_step": 97452, "epoch": 2320} {"train_loss": -6.2907843589782715, "global_step": 97453, "epoch": 2320} {"train_loss": -6.3205342292785645, "global_step": 97454, "epoch": 2320} {"train_loss": -6.2810258865356445, "global_step": 97455, "epoch": 2320} {"train_loss": -6.329126358032227, "global_step": 97456, "epoch": 2320} {"train_loss": -6.297913551330566, "global_step": 97457, "epoch": 2320} {"train_loss": -6.336413860321045, "global_step": 97458, "epoch": 2320} {"train_loss": -6.384639739990234, "global_step": 97459, "epoch": 2320} {"train_loss": -6.391349792480469, "global_step": 97460, "epoch": 2320} {"train_loss": -6.321740627288818, "global_step": 97461, "epoch": 2320} {"train_loss": -6.359506130218506, "global_step": 97462, "epoch": 2320} {"train_loss": -6.329463481903076, "global_step": 97463, "epoch": 2320} {"train_loss": -6.281505107879639, "global_step": 97464, "epoch": 2320} {"train_loss": -6.284806728363037, "global_step": 97465, "epoch": 2320} {"train_loss": -6.268667221069336, "global_step": 97466, "epoch": 2320} {"train_loss": -6.350052833557129, "global_step": 97467, "epoch": 2320} {"train_loss": -6.3606367111206055, "global_step": 97468, "epoch": 2320} {"train_loss": -6.434118747711182, "global_step": 97469, "epoch": 2320} {"train_loss": -6.251263618469238, "global_step": 97470, "epoch": 2320} {"train_loss": -6.341569900512695, "global_step": 97471, "epoch": 2320} {"train_loss": -6.381806373596191, "global_step": 97472, "epoch": 2320} {"train_loss": -6.3076982498168945, "global_step": 97473, "epoch": 2320} {"train_loss": -6.446844100952148, "global_step": 97474, "epoch": 2320} {"train_loss": -6.287039756774902, "global_step": 97475, "epoch": 2320} {"train_loss": -6.3054656982421875, "global_step": 97476, "epoch": 2320} {"train_loss": -6.326151371002197, "global_step": 97477, "epoch": 2320} {"train_loss": -6.312882423400879, "global_step": 97478, "epoch": 2320} {"train_loss": -6.400762557983398, "global_step": 97479, "epoch": 2320} {"train_loss": -6.394775867462158, "global_step": 97480, "epoch": 2320} {"train_loss": -6.323502540588379, "global_step": 97481, "epoch": 2320, "val_loss": 68026.6484375} {"train_loss": -6.3138298988342285, "global_step": 97482, "epoch": 2321} {"train_loss": -6.366694927215576, "global_step": 97483, "epoch": 2321} {"train_loss": -6.38836145401001, "global_step": 97484, "epoch": 2321} {"train_loss": -6.291465759277344, "global_step": 97485, "epoch": 2321} {"train_loss": -6.140484809875488, "global_step": 97486, "epoch": 2321} {"train_loss": -6.325414657592773, "global_step": 97487, "epoch": 2321} {"train_loss": -6.328988075256348, "global_step": 97488, "epoch": 2321} {"train_loss": -6.330726146697998, "global_step": 97489, "epoch": 2321} {"train_loss": -6.277979850769043, "global_step": 97490, "epoch": 2321} {"train_loss": -6.432370185852051, "global_step": 97491, "epoch": 2321} {"train_loss": -6.289756774902344, "global_step": 97492, "epoch": 2321} {"train_loss": -6.279512405395508, "global_step": 97493, "epoch": 2321} {"train_loss": -6.348830223083496, "global_step": 97494, "epoch": 2321} {"train_loss": -6.332466125488281, "global_step": 97495, "epoch": 2321} {"train_loss": -6.394899845123291, "global_step": 97496, "epoch": 2321} {"train_loss": -6.299123764038086, "global_step": 97497, "epoch": 2321} {"train_loss": -6.344338417053223, "global_step": 97498, "epoch": 2321} {"train_loss": -6.29582405090332, "global_step": 97499, "epoch": 2321} {"train_loss": -6.325636386871338, "global_step": 97500, "epoch": 2321} {"train_loss": -6.325098037719727, "global_step": 97501, "epoch": 2321} {"train_loss": -6.382348537445068, "global_step": 97502, "epoch": 2321} {"train_loss": -6.3398213386535645, "global_step": 97503, "epoch": 2321} {"train_loss": -6.216447830200195, "global_step": 97504, "epoch": 2321} {"train_loss": -6.328821182250977, "global_step": 97505, "epoch": 2321} {"train_loss": -6.274376392364502, "global_step": 97506, "epoch": 2321} {"train_loss": -6.315442085266113, "global_step": 97507, "epoch": 2321} {"train_loss": -6.219295024871826, "global_step": 97508, "epoch": 2321} {"train_loss": -6.296517372131348, "global_step": 97509, "epoch": 2321} {"train_loss": -6.348169803619385, "global_step": 97510, "epoch": 2321} {"train_loss": -6.314982891082764, "global_step": 97511, "epoch": 2321} {"train_loss": -6.3006978034973145, "global_step": 97512, "epoch": 2321} {"train_loss": -6.245096206665039, "global_step": 97513, "epoch": 2321} {"train_loss": -6.288930416107178, "global_step": 97514, "epoch": 2321} {"train_loss": -6.33403205871582, "global_step": 97515, "epoch": 2321} {"train_loss": -6.348913669586182, "global_step": 97516, "epoch": 2321} {"train_loss": -6.298932075500488, "global_step": 97517, "epoch": 2321} {"train_loss": -6.418164253234863, "global_step": 97518, "epoch": 2321} {"train_loss": -6.263957977294922, "global_step": 97519, "epoch": 2321} {"train_loss": -6.288238525390625, "global_step": 97520, "epoch": 2321} {"train_loss": -6.353782653808594, "global_step": 97521, "epoch": 2321} {"train_loss": -6.455404758453369, "global_step": 97522, "epoch": 2321} {"train_loss": -6.3183098293486095, "global_step": 97523, "epoch": 2321, "val_loss": 68140.515625} {"train_loss": -6.309935569763184, "global_step": 97524, "epoch": 2322} {"train_loss": -6.2873382568359375, "global_step": 97525, "epoch": 2322} {"train_loss": -6.273879051208496, "global_step": 97526, "epoch": 2322} {"train_loss": -6.3470354080200195, "global_step": 97527, "epoch": 2322} {"train_loss": -6.380154609680176, "global_step": 97528, "epoch": 2322} {"train_loss": -6.404180526733398, "global_step": 97529, "epoch": 2322} {"train_loss": -6.341038703918457, "global_step": 97530, "epoch": 2322} {"train_loss": -6.29694938659668, "global_step": 97531, "epoch": 2322} {"train_loss": -6.2865753173828125, "global_step": 97532, "epoch": 2322} {"train_loss": -6.4277496337890625, "global_step": 97533, "epoch": 2322} {"train_loss": -6.227169036865234, "global_step": 97534, "epoch": 2322} {"train_loss": -6.291842937469482, "global_step": 97535, "epoch": 2322} {"train_loss": -6.268978118896484, "global_step": 97536, "epoch": 2322} {"train_loss": -6.3318257331848145, "global_step": 97537, "epoch": 2322} {"train_loss": -6.243612766265869, "global_step": 97538, "epoch": 2322} {"train_loss": -6.349222183227539, "global_step": 97539, "epoch": 2322} {"train_loss": -6.378350257873535, "global_step": 97540, "epoch": 2322} {"train_loss": -6.277975082397461, "global_step": 97541, "epoch": 2322} {"train_loss": -6.285015106201172, "global_step": 97542, "epoch": 2322} {"train_loss": -6.3133955001831055, "global_step": 97543, "epoch": 2322} {"train_loss": -6.237110614776611, "global_step": 97544, "epoch": 2322} {"train_loss": -6.244035243988037, "global_step": 97545, "epoch": 2322} {"train_loss": -6.352302551269531, "global_step": 97546, "epoch": 2322} {"train_loss": -6.313169479370117, "global_step": 97547, "epoch": 2322} {"train_loss": -6.260249614715576, "global_step": 97548, "epoch": 2322} {"train_loss": -6.340121269226074, "global_step": 97549, "epoch": 2322} {"train_loss": -6.235466480255127, "global_step": 97550, "epoch": 2322} {"train_loss": -6.154818534851074, "global_step": 97551, "epoch": 2322} {"train_loss": -6.2865777015686035, "global_step": 97552, "epoch": 2322} {"train_loss": -6.303905963897705, "global_step": 97553, "epoch": 2322} {"train_loss": -6.162868499755859, "global_step": 97554, "epoch": 2322} {"train_loss": -6.194892883300781, "global_step": 97555, "epoch": 2322} {"train_loss": -6.330902576446533, "global_step": 97556, "epoch": 2322} {"train_loss": -6.16402530670166, "global_step": 97557, "epoch": 2322} {"train_loss": -6.350342750549316, "global_step": 97558, "epoch": 2322} {"train_loss": -6.308358192443848, "global_step": 97559, "epoch": 2322} {"train_loss": -6.181465148925781, "global_step": 97560, "epoch": 2322} {"train_loss": -6.222887992858887, "global_step": 97561, "epoch": 2322} {"train_loss": -6.269985198974609, "global_step": 97562, "epoch": 2322} {"train_loss": -6.288180351257324, "global_step": 97563, "epoch": 2322} {"train_loss": -6.394722938537598, "global_step": 97564, "epoch": 2322} {"train_loss": -6.288888034366426, "global_step": 97565, "epoch": 2322, "val_loss": 68077.0625} {"train_loss": -6.283111572265625, "global_step": 97566, "epoch": 2323} {"train_loss": -6.3097243309021, "global_step": 97567, "epoch": 2323} {"train_loss": -6.271960735321045, "global_step": 97568, "epoch": 2323} {"train_loss": -6.214633941650391, "global_step": 97569, "epoch": 2323} {"train_loss": -6.407615661621094, "global_step": 97570, "epoch": 2323} {"train_loss": -6.345128059387207, "global_step": 97571, "epoch": 2323} {"train_loss": -6.337821006774902, "global_step": 97572, "epoch": 2323} {"train_loss": -6.338127136230469, "global_step": 97573, "epoch": 2323} {"train_loss": -6.130418300628662, "global_step": 97574, "epoch": 2323} {"train_loss": -6.345332145690918, "global_step": 97575, "epoch": 2323} {"train_loss": -6.284759521484375, "global_step": 97576, "epoch": 2323} {"train_loss": -6.258816242218018, "global_step": 97577, "epoch": 2323} {"train_loss": -6.338579177856445, "global_step": 97578, "epoch": 2323} {"train_loss": -6.2186279296875, "global_step": 97579, "epoch": 2323} {"train_loss": -6.272953987121582, "global_step": 97580, "epoch": 2323} {"train_loss": -6.168914318084717, "global_step": 97581, "epoch": 2323} {"train_loss": -6.374781608581543, "global_step": 97582, "epoch": 2323} {"train_loss": -6.397773742675781, "global_step": 97583, "epoch": 2323} {"train_loss": -6.265759468078613, "global_step": 97584, "epoch": 2323} {"train_loss": -6.3169403076171875, "global_step": 97585, "epoch": 2323} {"train_loss": -6.3230390548706055, "global_step": 97586, "epoch": 2323} {"train_loss": -6.263681411743164, "global_step": 97587, "epoch": 2323} {"train_loss": -6.3428168296813965, "global_step": 97588, "epoch": 2323} {"train_loss": -6.393221855163574, "global_step": 97589, "epoch": 2323} {"train_loss": -6.229487419128418, "global_step": 97590, "epoch": 2323} {"train_loss": -6.415215015411377, "global_step": 97591, "epoch": 2323} {"train_loss": -6.431380271911621, "global_step": 97592, "epoch": 2323} {"train_loss": -6.363802909851074, "global_step": 97593, "epoch": 2323} {"train_loss": -6.405274391174316, "global_step": 97594, "epoch": 2323} {"train_loss": -6.250039577484131, "global_step": 97595, "epoch": 2323} {"train_loss": -6.325132369995117, "global_step": 97596, "epoch": 2323} {"train_loss": -6.27855110168457, "global_step": 97597, "epoch": 2323} {"train_loss": -6.180136680603027, "global_step": 97598, "epoch": 2323} {"train_loss": -6.380626678466797, "global_step": 97599, "epoch": 2323} {"train_loss": -6.33126163482666, "global_step": 97600, "epoch": 2323} {"train_loss": -6.340489387512207, "global_step": 97601, "epoch": 2323} {"train_loss": -6.306312561035156, "global_step": 97602, "epoch": 2323} {"train_loss": -6.270668029785156, "global_step": 97603, "epoch": 2323} {"train_loss": -6.282341003417969, "global_step": 97604, "epoch": 2323} {"train_loss": -6.3957624435424805, "global_step": 97605, "epoch": 2323} {"train_loss": -6.282470226287842, "global_step": 97606, "epoch": 2323} {"train_loss": -6.309284380504063, "global_step": 97607, "epoch": 2323, "val_loss": 68185.5625} {"train_loss": -6.228798866271973, "global_step": 97608, "epoch": 2324} {"train_loss": -6.371762275695801, "global_step": 97609, "epoch": 2324} {"train_loss": -6.216512680053711, "global_step": 97610, "epoch": 2324} {"train_loss": -6.1168975830078125, "global_step": 97611, "epoch": 2324} {"train_loss": -6.251739025115967, "global_step": 97612, "epoch": 2324} {"train_loss": -6.30839729309082, "global_step": 97613, "epoch": 2324} {"train_loss": -6.298296928405762, "global_step": 97614, "epoch": 2324} {"train_loss": -6.249800682067871, "global_step": 97615, "epoch": 2324} {"train_loss": -6.32725191116333, "global_step": 97616, "epoch": 2324} {"train_loss": -6.333290100097656, "global_step": 97617, "epoch": 2324} {"train_loss": -6.36491060256958, "global_step": 97618, "epoch": 2324} {"train_loss": -6.355188369750977, "global_step": 97619, "epoch": 2324} {"train_loss": -6.300281524658203, "global_step": 97620, "epoch": 2324} {"train_loss": -6.369761943817139, "global_step": 97621, "epoch": 2324} {"train_loss": -6.236002445220947, "global_step": 97622, "epoch": 2324} {"train_loss": -6.435615539550781, "global_step": 97623, "epoch": 2324} {"train_loss": -6.44162654876709, "global_step": 97624, "epoch": 2324} {"train_loss": -6.328449249267578, "global_step": 97625, "epoch": 2324} {"train_loss": -6.329482078552246, "global_step": 97626, "epoch": 2324} {"train_loss": -6.266940116882324, "global_step": 97627, "epoch": 2324} {"train_loss": -6.337541580200195, "global_step": 97628, "epoch": 2324} {"train_loss": -6.330362796783447, "global_step": 97629, "epoch": 2324} {"train_loss": -6.569252967834473, "global_step": 97630, "epoch": 2324} {"train_loss": -6.265588760375977, "global_step": 97631, "epoch": 2324} {"train_loss": -6.360201835632324, "global_step": 97632, "epoch": 2324} {"train_loss": -6.371901035308838, "global_step": 97633, "epoch": 2324} {"train_loss": -6.284913063049316, "global_step": 97634, "epoch": 2324} {"train_loss": -6.1964263916015625, "global_step": 97635, "epoch": 2324} {"train_loss": -6.314016342163086, "global_step": 97636, "epoch": 2324} {"train_loss": -6.246185302734375, "global_step": 97637, "epoch": 2324} {"train_loss": -6.269232749938965, "global_step": 97638, "epoch": 2324} {"train_loss": -6.306200981140137, "global_step": 97639, "epoch": 2324} {"train_loss": -6.284925937652588, "global_step": 97640, "epoch": 2324} {"train_loss": -6.309958457946777, "global_step": 97641, "epoch": 2324} {"train_loss": -6.362676620483398, "global_step": 97642, "epoch": 2324} {"train_loss": -6.287961006164551, "global_step": 97643, "epoch": 2324} {"train_loss": -6.374026298522949, "global_step": 97644, "epoch": 2324} {"train_loss": -6.3786725997924805, "global_step": 97645, "epoch": 2324} {"train_loss": -6.355636119842529, "global_step": 97646, "epoch": 2324} {"train_loss": -6.307010650634766, "global_step": 97647, "epoch": 2324} {"train_loss": -6.37523078918457, "global_step": 97648, "epoch": 2324} {"train_loss": -6.316432294391451, "global_step": 97649, "epoch": 2324, "val_loss": 67857.28125} {"train_loss": -6.218807697296143, "global_step": 97650, "epoch": 2325} {"train_loss": -6.3280930519104, "global_step": 97651, "epoch": 2325} {"train_loss": -6.129487991333008, "global_step": 97652, "epoch": 2325} {"train_loss": -6.343354225158691, "global_step": 97653, "epoch": 2325} {"train_loss": -6.299262046813965, "global_step": 97654, "epoch": 2325} {"train_loss": -6.2786946296691895, "global_step": 97655, "epoch": 2325} {"train_loss": -6.310948371887207, "global_step": 97656, "epoch": 2325} {"train_loss": -6.28450870513916, "global_step": 97657, "epoch": 2325} {"train_loss": -6.308753967285156, "global_step": 97658, "epoch": 2325} {"train_loss": -6.241052627563477, "global_step": 97659, "epoch": 2325} {"train_loss": -6.268885612487793, "global_step": 97660, "epoch": 2325} {"train_loss": -6.304046630859375, "global_step": 97661, "epoch": 2325} {"train_loss": -6.426913738250732, "global_step": 97662, "epoch": 2325} {"train_loss": -6.388128757476807, "global_step": 97663, "epoch": 2325} {"train_loss": -6.36966609954834, "global_step": 97664, "epoch": 2325} {"train_loss": -6.44895601272583, "global_step": 97665, "epoch": 2325} {"train_loss": -6.413442134857178, "global_step": 97666, "epoch": 2325} {"train_loss": -6.374455451965332, "global_step": 97667, "epoch": 2325} {"train_loss": -6.432064056396484, "global_step": 97668, "epoch": 2325} {"train_loss": -6.284162521362305, "global_step": 97669, "epoch": 2325} {"train_loss": -6.417851448059082, "global_step": 97670, "epoch": 2325} {"train_loss": -6.281839370727539, "global_step": 97671, "epoch": 2325} {"train_loss": -6.446122169494629, "global_step": 97672, "epoch": 2325} {"train_loss": -6.336771488189697, "global_step": 97673, "epoch": 2325} {"train_loss": -6.35458517074585, "global_step": 97674, "epoch": 2325} {"train_loss": -6.276886463165283, "global_step": 97675, "epoch": 2325} {"train_loss": -6.377914905548096, "global_step": 97676, "epoch": 2325} {"train_loss": -6.363792896270752, "global_step": 97677, "epoch": 2325} {"train_loss": -6.481359004974365, "global_step": 97678, "epoch": 2325} {"train_loss": -6.267416477203369, "global_step": 97679, "epoch": 2325} {"train_loss": -6.368025302886963, "global_step": 97680, "epoch": 2325} {"train_loss": -6.288670539855957, "global_step": 97681, "epoch": 2325} {"train_loss": -6.277853012084961, "global_step": 97682, "epoch": 2325} {"train_loss": -6.26001501083374, "global_step": 97683, "epoch": 2325} {"train_loss": -6.209503173828125, "global_step": 97684, "epoch": 2325} {"train_loss": -6.187448978424072, "global_step": 97685, "epoch": 2325} {"train_loss": -6.259443759918213, "global_step": 97686, "epoch": 2325} {"train_loss": -6.126591205596924, "global_step": 97687, "epoch": 2325} {"train_loss": -6.3254804611206055, "global_step": 97688, "epoch": 2325} {"train_loss": -6.310792922973633, "global_step": 97689, "epoch": 2325} {"train_loss": -6.176094055175781, "global_step": 97690, "epoch": 2325} {"train_loss": -6.314822072074527, "global_step": 97691, "epoch": 2325, "val_loss": 68055.96875} {"train_loss": -6.2887959480285645, "global_step": 97692, "epoch": 2326} {"train_loss": -6.266170978546143, "global_step": 97693, "epoch": 2326} {"train_loss": -6.235092639923096, "global_step": 97694, "epoch": 2326} {"train_loss": -6.262232303619385, "global_step": 97695, "epoch": 2326} {"train_loss": -6.353243827819824, "global_step": 97696, "epoch": 2326} {"train_loss": -6.308015823364258, "global_step": 97697, "epoch": 2326} {"train_loss": -6.261408805847168, "global_step": 97698, "epoch": 2326} {"train_loss": -6.302001953125, "global_step": 97699, "epoch": 2326} {"train_loss": -6.270544052124023, "global_step": 97700, "epoch": 2326} {"train_loss": -6.153353691101074, "global_step": 97701, "epoch": 2326} {"train_loss": -6.443042278289795, "global_step": 97702, "epoch": 2326} {"train_loss": -6.262580871582031, "global_step": 97703, "epoch": 2326} {"train_loss": -6.317081928253174, "global_step": 97704, "epoch": 2326} {"train_loss": -6.251809120178223, "global_step": 97705, "epoch": 2326} {"train_loss": -6.290286064147949, "global_step": 97706, "epoch": 2326} {"train_loss": -6.361428260803223, "global_step": 97707, "epoch": 2326} {"train_loss": -6.279240608215332, "global_step": 97708, "epoch": 2326} {"train_loss": -6.258676528930664, "global_step": 97709, "epoch": 2326} {"train_loss": -6.355625152587891, "global_step": 97710, "epoch": 2326} {"train_loss": -6.33673620223999, "global_step": 97711, "epoch": 2326} {"train_loss": -6.408184051513672, "global_step": 97712, "epoch": 2326} {"train_loss": -6.287172317504883, "global_step": 97713, "epoch": 2326} {"train_loss": -6.3950653076171875, "global_step": 97714, "epoch": 2326} {"train_loss": -6.311871528625488, "global_step": 97715, "epoch": 2326} {"train_loss": -6.186279296875, "global_step": 97716, "epoch": 2326} {"train_loss": -6.374236106872559, "global_step": 97717, "epoch": 2326} {"train_loss": -6.234190940856934, "global_step": 97718, "epoch": 2326} {"train_loss": -6.322547912597656, "global_step": 97719, "epoch": 2326} {"train_loss": -6.30790901184082, "global_step": 97720, "epoch": 2326} {"train_loss": -6.324182510375977, "global_step": 97721, "epoch": 2326} {"train_loss": -6.255876064300537, "global_step": 97722, "epoch": 2326} {"train_loss": -6.246601104736328, "global_step": 97723, "epoch": 2326} {"train_loss": -6.197807312011719, "global_step": 97724, "epoch": 2326} {"train_loss": -6.33164119720459, "global_step": 97725, "epoch": 2326} {"train_loss": -6.404366970062256, "global_step": 97726, "epoch": 2326} {"train_loss": -6.208768844604492, "global_step": 97727, "epoch": 2326} {"train_loss": -6.218681335449219, "global_step": 97728, "epoch": 2326} {"train_loss": -6.224824905395508, "global_step": 97729, "epoch": 2326} {"train_loss": -6.238372802734375, "global_step": 97730, "epoch": 2326} {"train_loss": -6.2123565673828125, "global_step": 97731, "epoch": 2326} {"train_loss": -6.212516784667969, "global_step": 97732, "epoch": 2326} {"train_loss": -6.285500764846802, "global_step": 97733, "epoch": 2326, "val_loss": 68278.734375} {"train_loss": -6.168056488037109, "global_step": 97734, "epoch": 2327} {"train_loss": -6.231911659240723, "global_step": 97735, "epoch": 2327} {"train_loss": -6.317043304443359, "global_step": 97736, "epoch": 2327} {"train_loss": -6.278662204742432, "global_step": 97737, "epoch": 2327} {"train_loss": -6.400637626647949, "global_step": 97738, "epoch": 2327} {"train_loss": -6.287598609924316, "global_step": 97739, "epoch": 2327} {"train_loss": -6.31463623046875, "global_step": 97740, "epoch": 2327} {"train_loss": -6.253403186798096, "global_step": 97741, "epoch": 2327} {"train_loss": -6.3309831619262695, "global_step": 97742, "epoch": 2327} {"train_loss": -6.346170425415039, "global_step": 97743, "epoch": 2327} {"train_loss": -6.385583400726318, "global_step": 97744, "epoch": 2327} {"train_loss": -6.392910003662109, "global_step": 97745, "epoch": 2327} {"train_loss": -6.438190460205078, "global_step": 97746, "epoch": 2327} {"train_loss": -6.279184341430664, "global_step": 97747, "epoch": 2327} {"train_loss": -6.358209609985352, "global_step": 97748, "epoch": 2327} {"train_loss": -6.314483642578125, "global_step": 97749, "epoch": 2327} {"train_loss": -6.34520959854126, "global_step": 97750, "epoch": 2327} {"train_loss": -6.288974761962891, "global_step": 97751, "epoch": 2327} {"train_loss": -6.481564044952393, "global_step": 97752, "epoch": 2327} {"train_loss": -6.251854419708252, "global_step": 97753, "epoch": 2327} {"train_loss": -6.386285781860352, "global_step": 97754, "epoch": 2327} {"train_loss": -6.339264869689941, "global_step": 97755, "epoch": 2327} {"train_loss": -6.355310440063477, "global_step": 97756, "epoch": 2327} {"train_loss": -6.329277992248535, "global_step": 97757, "epoch": 2327} {"train_loss": -6.2609968185424805, "global_step": 97758, "epoch": 2327} {"train_loss": -6.346922397613525, "global_step": 97759, "epoch": 2327} {"train_loss": -6.307243347167969, "global_step": 97760, "epoch": 2327} {"train_loss": -6.23723030090332, "global_step": 97761, "epoch": 2327} {"train_loss": -6.284756183624268, "global_step": 97762, "epoch": 2327} {"train_loss": -6.297427177429199, "global_step": 97763, "epoch": 2327} {"train_loss": -6.381458759307861, "global_step": 97764, "epoch": 2327} {"train_loss": -6.295632362365723, "global_step": 97765, "epoch": 2327} {"train_loss": -6.264190196990967, "global_step": 97766, "epoch": 2327} {"train_loss": -6.280729293823242, "global_step": 97767, "epoch": 2327} {"train_loss": -6.196381568908691, "global_step": 97768, "epoch": 2327} {"train_loss": -6.440277099609375, "global_step": 97769, "epoch": 2327} {"train_loss": -6.348632335662842, "global_step": 97770, "epoch": 2327} {"train_loss": -6.302772521972656, "global_step": 97771, "epoch": 2327} {"train_loss": -6.331596374511719, "global_step": 97772, "epoch": 2327} {"train_loss": -6.431941986083984, "global_step": 97773, "epoch": 2327} {"train_loss": -6.32893705368042, "global_step": 97774, "epoch": 2327} {"train_loss": -6.323966139838809, "global_step": 97775, "epoch": 2327, "val_loss": 68068.9140625} {"train_loss": -6.381673812866211, "global_step": 97776, "epoch": 2328} {"train_loss": -6.388265609741211, "global_step": 97777, "epoch": 2328} {"train_loss": -6.340429306030273, "global_step": 97778, "epoch": 2328} {"train_loss": -6.435845375061035, "global_step": 97779, "epoch": 2328} {"train_loss": -6.234031677246094, "global_step": 97780, "epoch": 2328} {"train_loss": -6.403676986694336, "global_step": 97781, "epoch": 2328} {"train_loss": -6.315377235412598, "global_step": 97782, "epoch": 2328} {"train_loss": -6.36317253112793, "global_step": 97783, "epoch": 2328} {"train_loss": -6.448395729064941, "global_step": 97784, "epoch": 2328} {"train_loss": -6.456006050109863, "global_step": 97785, "epoch": 2328} {"train_loss": -6.394432544708252, "global_step": 97786, "epoch": 2328} {"train_loss": -6.394659996032715, "global_step": 97787, "epoch": 2328} {"train_loss": -6.224581241607666, "global_step": 97788, "epoch": 2328} {"train_loss": -6.284811973571777, "global_step": 97789, "epoch": 2328} {"train_loss": -6.412675380706787, "global_step": 97790, "epoch": 2328} {"train_loss": -6.391785621643066, "global_step": 97791, "epoch": 2328} {"train_loss": -6.290693759918213, "global_step": 97792, "epoch": 2328} {"train_loss": -6.30225944519043, "global_step": 97793, "epoch": 2328} {"train_loss": -6.466561317443848, "global_step": 97794, "epoch": 2328} {"train_loss": -6.342292785644531, "global_step": 97795, "epoch": 2328} {"train_loss": -6.402438163757324, "global_step": 97796, "epoch": 2328} {"train_loss": -6.259232044219971, "global_step": 97797, "epoch": 2328} {"train_loss": -6.337013244628906, "global_step": 97798, "epoch": 2328} {"train_loss": -6.252248764038086, "global_step": 97799, "epoch": 2328} {"train_loss": -6.290815830230713, "global_step": 97800, "epoch": 2328} {"train_loss": -6.469874382019043, "global_step": 97801, "epoch": 2328} {"train_loss": -6.34968900680542, "global_step": 97802, "epoch": 2328} {"train_loss": -6.255078315734863, "global_step": 97803, "epoch": 2328} {"train_loss": -6.2531890869140625, "global_step": 97804, "epoch": 2328} {"train_loss": -6.245823860168457, "global_step": 97805, "epoch": 2328} {"train_loss": -6.17434024810791, "global_step": 97806, "epoch": 2328} {"train_loss": -6.232203006744385, "global_step": 97807, "epoch": 2328} {"train_loss": -6.20654821395874, "global_step": 97808, "epoch": 2328} {"train_loss": -6.235821723937988, "global_step": 97809, "epoch": 2328} {"train_loss": -6.356822967529297, "global_step": 97810, "epoch": 2328} {"train_loss": -6.181468486785889, "global_step": 97811, "epoch": 2328} {"train_loss": -6.319990158081055, "global_step": 97812, "epoch": 2328} {"train_loss": -6.251239776611328, "global_step": 97813, "epoch": 2328} {"train_loss": -6.18244743347168, "global_step": 97814, "epoch": 2328} {"train_loss": -6.248187065124512, "global_step": 97815, "epoch": 2328} {"train_loss": -6.346806526184082, "global_step": 97816, "epoch": 2328} {"train_loss": -6.321182421275547, "global_step": 97817, "epoch": 2328, "val_loss": 67901.7578125} {"train_loss": -6.3352556228637695, "global_step": 97818, "epoch": 2329} {"train_loss": -6.310488224029541, "global_step": 97819, "epoch": 2329} {"train_loss": -6.186238765716553, "global_step": 97820, "epoch": 2329} {"train_loss": -6.402981281280518, "global_step": 97821, "epoch": 2329} {"train_loss": -6.335007667541504, "global_step": 97822, "epoch": 2329} {"train_loss": -6.270820617675781, "global_step": 97823, "epoch": 2329} {"train_loss": -6.253141403198242, "global_step": 97824, "epoch": 2329} {"train_loss": -6.171974182128906, "global_step": 97825, "epoch": 2329} {"train_loss": -6.348869323730469, "global_step": 97826, "epoch": 2329} {"train_loss": -6.256862640380859, "global_step": 97827, "epoch": 2329} {"train_loss": -6.167658805847168, "global_step": 97828, "epoch": 2329} {"train_loss": -6.356626033782959, "global_step": 97829, "epoch": 2329} {"train_loss": -6.29518985748291, "global_step": 97830, "epoch": 2329} {"train_loss": -6.4223432540893555, "global_step": 97831, "epoch": 2329} {"train_loss": -6.271083831787109, "global_step": 97832, "epoch": 2329} {"train_loss": -6.3177289962768555, "global_step": 97833, "epoch": 2329} {"train_loss": -6.294215202331543, "global_step": 97834, "epoch": 2329} {"train_loss": -6.206930637359619, "global_step": 97835, "epoch": 2329} {"train_loss": -6.2965497970581055, "global_step": 97836, "epoch": 2329} {"train_loss": -6.179898262023926, "global_step": 97837, "epoch": 2329} {"train_loss": -6.330100059509277, "global_step": 97838, "epoch": 2329} {"train_loss": -6.193233489990234, "global_step": 97839, "epoch": 2329} {"train_loss": -6.285065650939941, "global_step": 97840, "epoch": 2329} {"train_loss": -6.275034427642822, "global_step": 97841, "epoch": 2329} {"train_loss": -6.287217140197754, "global_step": 97842, "epoch": 2329} {"train_loss": -6.436347484588623, "global_step": 97843, "epoch": 2329} {"train_loss": -6.28151273727417, "global_step": 97844, "epoch": 2329} {"train_loss": -6.238041400909424, "global_step": 97845, "epoch": 2329} {"train_loss": -6.355529308319092, "global_step": 97846, "epoch": 2329} {"train_loss": -6.194731712341309, "global_step": 97847, "epoch": 2329} {"train_loss": -6.261518478393555, "global_step": 97848, "epoch": 2329} {"train_loss": -6.181708335876465, "global_step": 97849, "epoch": 2329} {"train_loss": -6.24163293838501, "global_step": 97850, "epoch": 2329} {"train_loss": -6.241765975952148, "global_step": 97851, "epoch": 2329} {"train_loss": -6.307083606719971, "global_step": 97852, "epoch": 2329} {"train_loss": -6.332121849060059, "global_step": 97853, "epoch": 2329} {"train_loss": -6.167635917663574, "global_step": 97854, "epoch": 2329} {"train_loss": -6.2089457511901855, "global_step": 97855, "epoch": 2329} {"train_loss": -6.321959972381592, "global_step": 97856, "epoch": 2329} {"train_loss": -6.270225524902344, "global_step": 97857, "epoch": 2329} {"train_loss": -6.512265205383301, "global_step": 97858, "epoch": 2329} {"train_loss": -6.284824462164016, "global_step": 97859, "epoch": 2329, "val_loss": 67788.0859375} {"train_loss": -6.231148719787598, "global_step": 97860, "epoch": 2330} {"train_loss": -6.309171676635742, "global_step": 97861, "epoch": 2330} {"train_loss": -6.363462924957275, "global_step": 97862, "epoch": 2330} {"train_loss": -6.384200572967529, "global_step": 97863, "epoch": 2330} {"train_loss": -6.268470764160156, "global_step": 97864, "epoch": 2330} {"train_loss": -6.298335075378418, "global_step": 97865, "epoch": 2330} {"train_loss": -6.2920451164245605, "global_step": 97866, "epoch": 2330} {"train_loss": -6.31147575378418, "global_step": 97867, "epoch": 2330} {"train_loss": -6.372704982757568, "global_step": 97868, "epoch": 2330} {"train_loss": -6.250844478607178, "global_step": 97869, "epoch": 2330} {"train_loss": -6.21198034286499, "global_step": 97870, "epoch": 2330} {"train_loss": -6.308900833129883, "global_step": 97871, "epoch": 2330} {"train_loss": -6.2826313972473145, "global_step": 97872, "epoch": 2330} {"train_loss": -6.386929512023926, "global_step": 97873, "epoch": 2330} {"train_loss": -6.2217254638671875, "global_step": 97874, "epoch": 2330} {"train_loss": -6.415678977966309, "global_step": 97875, "epoch": 2330} {"train_loss": -6.307534217834473, "global_step": 97876, "epoch": 2330} {"train_loss": -6.431496620178223, "global_step": 97877, "epoch": 2330} {"train_loss": -6.199042320251465, "global_step": 97878, "epoch": 2330} {"train_loss": -6.262399673461914, "global_step": 97879, "epoch": 2330} {"train_loss": -6.437143325805664, "global_step": 97880, "epoch": 2330} {"train_loss": -6.409961223602295, "global_step": 97881, "epoch": 2330} {"train_loss": -6.399700164794922, "global_step": 97882, "epoch": 2330} {"train_loss": -6.262829303741455, "global_step": 97883, "epoch": 2330} {"train_loss": -6.2553558349609375, "global_step": 97884, "epoch": 2330} {"train_loss": -6.318351745605469, "global_step": 97885, "epoch": 2330} {"train_loss": -6.347705364227295, "global_step": 97886, "epoch": 2330} {"train_loss": -6.257907867431641, "global_step": 97887, "epoch": 2330} {"train_loss": -6.3042144775390625, "global_step": 97888, "epoch": 2330} {"train_loss": -6.291821479797363, "global_step": 97889, "epoch": 2330} {"train_loss": -6.366568088531494, "global_step": 97890, "epoch": 2330} {"train_loss": -6.3733110427856445, "global_step": 97891, "epoch": 2330} {"train_loss": -6.357736110687256, "global_step": 97892, "epoch": 2330} {"train_loss": -6.249630451202393, "global_step": 97893, "epoch": 2330} {"train_loss": -6.24443244934082, "global_step": 97894, "epoch": 2330} {"train_loss": -6.243680477142334, "global_step": 97895, "epoch": 2330} {"train_loss": -6.274695873260498, "global_step": 97896, "epoch": 2330} {"train_loss": -6.353653907775879, "global_step": 97897, "epoch": 2330} {"train_loss": -6.229396343231201, "global_step": 97898, "epoch": 2330} {"train_loss": -6.270941734313965, "global_step": 97899, "epoch": 2330} {"train_loss": -6.314560890197754, "global_step": 97900, "epoch": 2330} {"train_loss": -6.310759544372559, "global_step": 97901, "epoch": 2330, "val_loss": 67810.53125} {"train_loss": -6.339163780212402, "global_step": 97902, "epoch": 2331} {"train_loss": -6.316944599151611, "global_step": 97903, "epoch": 2331} {"train_loss": -6.311517715454102, "global_step": 97904, "epoch": 2331} {"train_loss": -6.374647617340088, "global_step": 97905, "epoch": 2331} {"train_loss": -6.416018486022949, "global_step": 97906, "epoch": 2331} {"train_loss": -6.376830101013184, "global_step": 97907, "epoch": 2331} {"train_loss": -6.286534309387207, "global_step": 97908, "epoch": 2331} {"train_loss": -6.307949542999268, "global_step": 97909, "epoch": 2331} {"train_loss": -6.373818397521973, "global_step": 97910, "epoch": 2331} {"train_loss": -6.223799228668213, "global_step": 97911, "epoch": 2331} {"train_loss": -6.425137519836426, "global_step": 97912, "epoch": 2331} {"train_loss": -6.258707046508789, "global_step": 97913, "epoch": 2331} {"train_loss": -6.326957702636719, "global_step": 97914, "epoch": 2331} {"train_loss": -6.335290908813477, "global_step": 97915, "epoch": 2331} {"train_loss": -6.3833842277526855, "global_step": 97916, "epoch": 2331} {"train_loss": -6.311903953552246, "global_step": 97917, "epoch": 2331} {"train_loss": -6.272449493408203, "global_step": 97918, "epoch": 2331} {"train_loss": -6.251315116882324, "global_step": 97919, "epoch": 2331} {"train_loss": -6.266552925109863, "global_step": 97920, "epoch": 2331} {"train_loss": -6.327346324920654, "global_step": 97921, "epoch": 2331} {"train_loss": -6.192726135253906, "global_step": 97922, "epoch": 2331} {"train_loss": -6.2889509201049805, "global_step": 97923, "epoch": 2331} {"train_loss": -6.269277572631836, "global_step": 97924, "epoch": 2331} {"train_loss": -6.245750427246094, "global_step": 97925, "epoch": 2331} {"train_loss": -6.287426948547363, "global_step": 97926, "epoch": 2331} {"train_loss": -6.203725814819336, "global_step": 97927, "epoch": 2331} {"train_loss": -6.3012495040893555, "global_step": 97928, "epoch": 2331} {"train_loss": -6.265420436859131, "global_step": 97929, "epoch": 2331} {"train_loss": -6.298646450042725, "global_step": 97930, "epoch": 2331} {"train_loss": -6.409967422485352, "global_step": 97931, "epoch": 2331} {"train_loss": -6.336812973022461, "global_step": 97932, "epoch": 2331} {"train_loss": -6.296934127807617, "global_step": 97933, "epoch": 2331} {"train_loss": -6.375161170959473, "global_step": 97934, "epoch": 2331} {"train_loss": -6.304543495178223, "global_step": 97935, "epoch": 2331} {"train_loss": -6.325693130493164, "global_step": 97936, "epoch": 2331} {"train_loss": -6.378052711486816, "global_step": 97937, "epoch": 2331} {"train_loss": -6.385282516479492, "global_step": 97938, "epoch": 2331} {"train_loss": -6.326685428619385, "global_step": 97939, "epoch": 2331} {"train_loss": -6.204341888427734, "global_step": 97940, "epoch": 2331} {"train_loss": -6.372066497802734, "global_step": 97941, "epoch": 2331} {"train_loss": -6.4122419357299805, "global_step": 97942, "epoch": 2331} {"train_loss": -6.317043610981533, "global_step": 97943, "epoch": 2331, "val_loss": 67868.078125} {"train_loss": -6.340917587280273, "global_step": 97944, "epoch": 2332} {"train_loss": -6.4268317222595215, "global_step": 97945, "epoch": 2332} {"train_loss": -6.363893985748291, "global_step": 97946, "epoch": 2332} {"train_loss": -6.40557861328125, "global_step": 97947, "epoch": 2332} {"train_loss": -6.243451118469238, "global_step": 97948, "epoch": 2332} {"train_loss": -6.293482780456543, "global_step": 97949, "epoch": 2332} {"train_loss": -6.323405742645264, "global_step": 97950, "epoch": 2332} {"train_loss": -6.307130336761475, "global_step": 97951, "epoch": 2332} {"train_loss": -6.297642707824707, "global_step": 97952, "epoch": 2332} {"train_loss": -6.277888298034668, "global_step": 97953, "epoch": 2332} {"train_loss": -6.37166690826416, "global_step": 97954, "epoch": 2332} {"train_loss": -6.302850723266602, "global_step": 97955, "epoch": 2332} {"train_loss": -6.170469284057617, "global_step": 97956, "epoch": 2332} {"train_loss": -6.370754241943359, "global_step": 97957, "epoch": 2332} {"train_loss": -6.400755882263184, "global_step": 97958, "epoch": 2332} {"train_loss": -6.299688816070557, "global_step": 97959, "epoch": 2332} {"train_loss": -6.307868003845215, "global_step": 97960, "epoch": 2332} {"train_loss": -6.308446884155273, "global_step": 97961, "epoch": 2332} {"train_loss": -6.418429374694824, "global_step": 97962, "epoch": 2332} {"train_loss": -6.431501388549805, "global_step": 97963, "epoch": 2332} {"train_loss": -6.324725151062012, "global_step": 97964, "epoch": 2332} {"train_loss": -6.275304794311523, "global_step": 97965, "epoch": 2332} {"train_loss": -6.154294967651367, "global_step": 97966, "epoch": 2332} {"train_loss": -6.318995475769043, "global_step": 97967, "epoch": 2332} {"train_loss": -6.304367542266846, "global_step": 97968, "epoch": 2332} {"train_loss": -6.326419830322266, "global_step": 97969, "epoch": 2332} {"train_loss": -6.290617942810059, "global_step": 97970, "epoch": 2332} {"train_loss": -6.226282119750977, "global_step": 97971, "epoch": 2332} {"train_loss": -6.380085468292236, "global_step": 97972, "epoch": 2332} {"train_loss": -6.386413097381592, "global_step": 97973, "epoch": 2332} {"train_loss": -6.259643077850342, "global_step": 97974, "epoch": 2332} {"train_loss": -6.421754837036133, "global_step": 97975, "epoch": 2332} {"train_loss": -6.35996150970459, "global_step": 97976, "epoch": 2332} {"train_loss": -6.321173667907715, "global_step": 97977, "epoch": 2332} {"train_loss": -6.2652201652526855, "global_step": 97978, "epoch": 2332} {"train_loss": -6.344971179962158, "global_step": 97979, "epoch": 2332} {"train_loss": -6.295492649078369, "global_step": 97980, "epoch": 2332} {"train_loss": -6.283944129943848, "global_step": 97981, "epoch": 2332} {"train_loss": -6.323064804077148, "global_step": 97982, "epoch": 2332} {"train_loss": -6.3592209815979, "global_step": 97983, "epoch": 2332} {"train_loss": -6.237584590911865, "global_step": 97984, "epoch": 2332} {"train_loss": -6.316267456327166, "global_step": 97985, "epoch": 2332, "val_loss": 68037.8125} {"train_loss": -6.216504096984863, "global_step": 97986, "epoch": 2333} {"train_loss": -6.243269920349121, "global_step": 97987, "epoch": 2333} {"train_loss": -6.407696723937988, "global_step": 97988, "epoch": 2333} {"train_loss": -6.153451919555664, "global_step": 97989, "epoch": 2333} {"train_loss": -6.129532814025879, "global_step": 97990, "epoch": 2333} {"train_loss": -6.348714828491211, "global_step": 97991, "epoch": 2333} {"train_loss": -6.235249042510986, "global_step": 97992, "epoch": 2333} {"train_loss": -6.253976345062256, "global_step": 97993, "epoch": 2333} {"train_loss": -6.085047721862793, "global_step": 97994, "epoch": 2333} {"train_loss": -6.3630757331848145, "global_step": 97995, "epoch": 2333} {"train_loss": -6.127633094787598, "global_step": 97996, "epoch": 2333} {"train_loss": -6.282356262207031, "global_step": 97997, "epoch": 2333} {"train_loss": -6.092744827270508, "global_step": 97998, "epoch": 2333} {"train_loss": -6.31296968460083, "global_step": 97999, "epoch": 2333} {"train_loss": -6.236831188201904, "global_step": 98000, "epoch": 2333} {"train_loss": -6.299201488494873, "global_step": 98001, "epoch": 2333} {"train_loss": -6.246146202087402, "global_step": 98002, "epoch": 2333} {"train_loss": -6.328131675720215, "global_step": 98003, "epoch": 2333} {"train_loss": -6.277678489685059, "global_step": 98004, "epoch": 2333} {"train_loss": -6.204645156860352, "global_step": 98005, "epoch": 2333} {"train_loss": -6.335813522338867, "global_step": 98006, "epoch": 2333} {"train_loss": -6.197656631469727, "global_step": 98007, "epoch": 2333} {"train_loss": -6.308304786682129, "global_step": 98008, "epoch": 2333} {"train_loss": -6.283327579498291, "global_step": 98009, "epoch": 2333} {"train_loss": -6.287881374359131, "global_step": 98010, "epoch": 2333} {"train_loss": -6.303866863250732, "global_step": 98011, "epoch": 2333} {"train_loss": -6.267136096954346, "global_step": 98012, "epoch": 2333} {"train_loss": -6.372008323669434, "global_step": 98013, "epoch": 2333} {"train_loss": -6.204360485076904, "global_step": 98014, "epoch": 2333} {"train_loss": -6.329604148864746, "global_step": 98015, "epoch": 2333} {"train_loss": -6.375328063964844, "global_step": 98016, "epoch": 2333} {"train_loss": -6.368509769439697, "global_step": 98017, "epoch": 2333} {"train_loss": -6.351840019226074, "global_step": 98018, "epoch": 2333} {"train_loss": -6.21297550201416, "global_step": 98019, "epoch": 2333} {"train_loss": -6.287564277648926, "global_step": 98020, "epoch": 2333} {"train_loss": -6.28346586227417, "global_step": 98021, "epoch": 2333} {"train_loss": -6.227335453033447, "global_step": 98022, "epoch": 2333} {"train_loss": -6.337574005126953, "global_step": 98023, "epoch": 2333} {"train_loss": -6.253358364105225, "global_step": 98024, "epoch": 2333} {"train_loss": -6.3246893882751465, "global_step": 98025, "epoch": 2333} {"train_loss": -6.368552207946777, "global_step": 98026, "epoch": 2333} {"train_loss": -6.271838630948748, "global_step": 98027, "epoch": 2333, "val_loss": 67755.6015625} {"train_loss": -6.234668731689453, "global_step": 98028, "epoch": 2334} {"train_loss": -6.375770568847656, "global_step": 98029, "epoch": 2334} {"train_loss": -6.2877302169799805, "global_step": 98030, "epoch": 2334} {"train_loss": -6.256624698638916, "global_step": 98031, "epoch": 2334} {"train_loss": -6.306093215942383, "global_step": 98032, "epoch": 2334} {"train_loss": -6.3600873947143555, "global_step": 98033, "epoch": 2334} {"train_loss": -6.267977714538574, "global_step": 98034, "epoch": 2334} {"train_loss": -6.331015110015869, "global_step": 98035, "epoch": 2334} {"train_loss": -6.084348678588867, "global_step": 98036, "epoch": 2334} {"train_loss": -6.283723831176758, "global_step": 98037, "epoch": 2334} {"train_loss": -6.154864311218262, "global_step": 98038, "epoch": 2334} {"train_loss": -6.206113815307617, "global_step": 98039, "epoch": 2334} {"train_loss": -6.273960113525391, "global_step": 98040, "epoch": 2334} {"train_loss": -6.144699573516846, "global_step": 98041, "epoch": 2334} {"train_loss": -6.221895217895508, "global_step": 98042, "epoch": 2334} {"train_loss": -6.125208854675293, "global_step": 98043, "epoch": 2334} {"train_loss": -6.17608118057251, "global_step": 98044, "epoch": 2334} {"train_loss": -6.198943614959717, "global_step": 98045, "epoch": 2334} {"train_loss": -6.230314254760742, "global_step": 98046, "epoch": 2334} {"train_loss": -6.130702495574951, "global_step": 98047, "epoch": 2334} {"train_loss": -6.137372016906738, "global_step": 98048, "epoch": 2334} {"train_loss": -6.276976585388184, "global_step": 98049, "epoch": 2334} {"train_loss": -6.275362491607666, "global_step": 98050, "epoch": 2334} {"train_loss": -6.15736198425293, "global_step": 98051, "epoch": 2334} {"train_loss": -6.354046821594238, "global_step": 98052, "epoch": 2334} {"train_loss": -6.16745662689209, "global_step": 98053, "epoch": 2334} {"train_loss": -6.246068477630615, "global_step": 98054, "epoch": 2334} {"train_loss": -6.17324161529541, "global_step": 98055, "epoch": 2334} {"train_loss": -6.290870189666748, "global_step": 98056, "epoch": 2334} {"train_loss": -6.260321140289307, "global_step": 98057, "epoch": 2334} {"train_loss": -6.3701300621032715, "global_step": 98058, "epoch": 2334} {"train_loss": -6.2286577224731445, "global_step": 98059, "epoch": 2334} {"train_loss": -6.2902374267578125, "global_step": 98060, "epoch": 2334} {"train_loss": -6.341677665710449, "global_step": 98061, "epoch": 2334} {"train_loss": -6.327504634857178, "global_step": 98062, "epoch": 2334} {"train_loss": -6.383518695831299, "global_step": 98063, "epoch": 2334} {"train_loss": -6.367431640625, "global_step": 98064, "epoch": 2334} {"train_loss": -6.290483474731445, "global_step": 98065, "epoch": 2334} {"train_loss": -6.334846019744873, "global_step": 98066, "epoch": 2334} {"train_loss": -6.37255859375, "global_step": 98067, "epoch": 2334} {"train_loss": -6.332420825958252, "global_step": 98068, "epoch": 2334} {"train_loss": -6.260035514831543, "global_step": 98069, "epoch": 2334, "val_loss": 68190.125} {"train_loss": -6.273284435272217, "global_step": 98070, "epoch": 2335} {"train_loss": -6.256527900695801, "global_step": 98071, "epoch": 2335} {"train_loss": -6.390801906585693, "global_step": 98072, "epoch": 2335} {"train_loss": -6.301755428314209, "global_step": 98073, "epoch": 2335} {"train_loss": -6.497300148010254, "global_step": 98074, "epoch": 2335} {"train_loss": -6.318221092224121, "global_step": 98075, "epoch": 2335} {"train_loss": -6.3109450340271, "global_step": 98076, "epoch": 2335} {"train_loss": -6.380005836486816, "global_step": 98077, "epoch": 2335} {"train_loss": -6.2301154136657715, "global_step": 98078, "epoch": 2335} {"train_loss": -6.210721015930176, "global_step": 98079, "epoch": 2335} {"train_loss": -6.347207069396973, "global_step": 98080, "epoch": 2335} {"train_loss": -6.17128849029541, "global_step": 98081, "epoch": 2335} {"train_loss": -6.382396221160889, "global_step": 98082, "epoch": 2335} {"train_loss": -6.356450080871582, "global_step": 98083, "epoch": 2335} {"train_loss": -6.212283134460449, "global_step": 98084, "epoch": 2335} {"train_loss": -6.199696063995361, "global_step": 98085, "epoch": 2335} {"train_loss": -6.415718078613281, "global_step": 98086, "epoch": 2335} {"train_loss": -6.250922679901123, "global_step": 98087, "epoch": 2335} {"train_loss": -6.264782905578613, "global_step": 98088, "epoch": 2335} {"train_loss": -6.316437721252441, "global_step": 98089, "epoch": 2335} {"train_loss": -6.310123443603516, "global_step": 98090, "epoch": 2335} {"train_loss": -6.26662540435791, "global_step": 98091, "epoch": 2335} {"train_loss": -6.247574806213379, "global_step": 98092, "epoch": 2335} {"train_loss": -6.378931999206543, "global_step": 98093, "epoch": 2335} {"train_loss": -6.266359806060791, "global_step": 98094, "epoch": 2335} {"train_loss": -6.314976692199707, "global_step": 98095, "epoch": 2335} {"train_loss": -6.407789707183838, "global_step": 98096, "epoch": 2335} {"train_loss": -6.195596694946289, "global_step": 98097, "epoch": 2335} {"train_loss": -6.223479270935059, "global_step": 98098, "epoch": 2335} {"train_loss": -6.337637424468994, "global_step": 98099, "epoch": 2335} {"train_loss": -6.323491096496582, "global_step": 98100, "epoch": 2335} {"train_loss": -6.317395210266113, "global_step": 98101, "epoch": 2335} {"train_loss": -6.34736442565918, "global_step": 98102, "epoch": 2335} {"train_loss": -6.326400279998779, "global_step": 98103, "epoch": 2335} {"train_loss": -6.337970733642578, "global_step": 98104, "epoch": 2335} {"train_loss": -6.2736287117004395, "global_step": 98105, "epoch": 2335} {"train_loss": -6.3277692794799805, "global_step": 98106, "epoch": 2335} {"train_loss": -6.3158860206604, "global_step": 98107, "epoch": 2335} {"train_loss": -6.306929111480713, "global_step": 98108, "epoch": 2335} {"train_loss": -6.389799118041992, "global_step": 98109, "epoch": 2335} {"train_loss": -6.393779754638672, "global_step": 98110, "epoch": 2335} {"train_loss": -6.310830297924223, "global_step": 98111, "epoch": 2335, "val_loss": 68183.5546875} {"train_loss": -6.211703300476074, "global_step": 98112, "epoch": 2336} {"train_loss": -6.4107232093811035, "global_step": 98113, "epoch": 2336} {"train_loss": -6.3318586349487305, "global_step": 98114, "epoch": 2336} {"train_loss": -6.331732749938965, "global_step": 98115, "epoch": 2336} {"train_loss": -6.328937530517578, "global_step": 98116, "epoch": 2336} {"train_loss": -6.3450727462768555, "global_step": 98117, "epoch": 2336} {"train_loss": -6.4801530838012695, "global_step": 98118, "epoch": 2336} {"train_loss": -6.309656620025635, "global_step": 98119, "epoch": 2336} {"train_loss": -6.253691673278809, "global_step": 98120, "epoch": 2336} {"train_loss": -6.229855537414551, "global_step": 98121, "epoch": 2336} {"train_loss": -6.315013885498047, "global_step": 98122, "epoch": 2336} {"train_loss": -6.45942497253418, "global_step": 98123, "epoch": 2336} {"train_loss": -6.310707092285156, "global_step": 98124, "epoch": 2336} {"train_loss": -6.279313564300537, "global_step": 98125, "epoch": 2336} {"train_loss": -6.417665004730225, "global_step": 98126, "epoch": 2336} {"train_loss": -6.1992950439453125, "global_step": 98127, "epoch": 2336} {"train_loss": -6.300601005554199, "global_step": 98128, "epoch": 2336} {"train_loss": -6.212829113006592, "global_step": 98129, "epoch": 2336} {"train_loss": -6.350721836090088, "global_step": 98130, "epoch": 2336} {"train_loss": -6.334071636199951, "global_step": 98131, "epoch": 2336} {"train_loss": -6.353596210479736, "global_step": 98132, "epoch": 2336} {"train_loss": -6.279482841491699, "global_step": 98133, "epoch": 2336} {"train_loss": -6.367344856262207, "global_step": 98134, "epoch": 2336} {"train_loss": -6.222164154052734, "global_step": 98135, "epoch": 2336} {"train_loss": -6.417705535888672, "global_step": 98136, "epoch": 2336} {"train_loss": -6.386124610900879, "global_step": 98137, "epoch": 2336} {"train_loss": -6.351626873016357, "global_step": 98138, "epoch": 2336} {"train_loss": -6.390999794006348, "global_step": 98139, "epoch": 2336} {"train_loss": -6.36398458480835, "global_step": 98140, "epoch": 2336} {"train_loss": -6.302976608276367, "global_step": 98141, "epoch": 2336} {"train_loss": -6.33004093170166, "global_step": 98142, "epoch": 2336} {"train_loss": -6.4596381187438965, "global_step": 98143, "epoch": 2336} {"train_loss": -6.252492904663086, "global_step": 98144, "epoch": 2336} {"train_loss": -6.312533378601074, "global_step": 98145, "epoch": 2336} {"train_loss": -6.375638961791992, "global_step": 98146, "epoch": 2336} {"train_loss": -6.347377777099609, "global_step": 98147, "epoch": 2336} {"train_loss": -6.410258769989014, "global_step": 98148, "epoch": 2336} {"train_loss": -6.373223304748535, "global_step": 98149, "epoch": 2336} {"train_loss": -6.372847080230713, "global_step": 98150, "epoch": 2336} {"train_loss": -6.35426139831543, "global_step": 98151, "epoch": 2336} {"train_loss": -6.350156307220459, "global_step": 98152, "epoch": 2336} {"train_loss": -6.336834952944801, "global_step": 98153, "epoch": 2336, "val_loss": 68097.3515625} {"train_loss": -6.30338716506958, "global_step": 98154, "epoch": 2337} {"train_loss": -6.39111328125, "global_step": 98155, "epoch": 2337} {"train_loss": -6.3126301765441895, "global_step": 98156, "epoch": 2337} {"train_loss": -6.303544044494629, "global_step": 98157, "epoch": 2337} {"train_loss": -6.3322343826293945, "global_step": 98158, "epoch": 2337} {"train_loss": -6.276716232299805, "global_step": 98159, "epoch": 2337} {"train_loss": -6.242973327636719, "global_step": 98160, "epoch": 2337} {"train_loss": -6.371212482452393, "global_step": 98161, "epoch": 2337} {"train_loss": -6.292581081390381, "global_step": 98162, "epoch": 2337} {"train_loss": -6.3004937171936035, "global_step": 98163, "epoch": 2337} {"train_loss": -6.370820045471191, "global_step": 98164, "epoch": 2337} {"train_loss": -6.445769309997559, "global_step": 98165, "epoch": 2337} {"train_loss": -6.460053443908691, "global_step": 98166, "epoch": 2337} {"train_loss": -6.321525573730469, "global_step": 98167, "epoch": 2337} {"train_loss": -6.326371669769287, "global_step": 98168, "epoch": 2337} {"train_loss": -6.2944231033325195, "global_step": 98169, "epoch": 2337} {"train_loss": -6.275747776031494, "global_step": 98170, "epoch": 2337} {"train_loss": -6.308865547180176, "global_step": 98171, "epoch": 2337} {"train_loss": -6.323822498321533, "global_step": 98172, "epoch": 2337} {"train_loss": -6.41642951965332, "global_step": 98173, "epoch": 2337} {"train_loss": -6.240233421325684, "global_step": 98174, "epoch": 2337} {"train_loss": -6.352071762084961, "global_step": 98175, "epoch": 2337} {"train_loss": -6.221175193786621, "global_step": 98176, "epoch": 2337} {"train_loss": -6.268730640411377, "global_step": 98177, "epoch": 2337} {"train_loss": -6.338831901550293, "global_step": 98178, "epoch": 2337} {"train_loss": -6.280741214752197, "global_step": 98179, "epoch": 2337} {"train_loss": -6.234750270843506, "global_step": 98180, "epoch": 2337} {"train_loss": -6.370148658752441, "global_step": 98181, "epoch": 2337} {"train_loss": -6.415681838989258, "global_step": 98182, "epoch": 2337} {"train_loss": -6.4306535720825195, "global_step": 98183, "epoch": 2337} {"train_loss": -6.2594218254089355, "global_step": 98184, "epoch": 2337} {"train_loss": -6.3283162117004395, "global_step": 98185, "epoch": 2337} {"train_loss": -6.362730026245117, "global_step": 98186, "epoch": 2337} {"train_loss": -6.3091139793396, "global_step": 98187, "epoch": 2337} {"train_loss": -6.3710784912109375, "global_step": 98188, "epoch": 2337} {"train_loss": -6.345102310180664, "global_step": 98189, "epoch": 2337} {"train_loss": -6.302524566650391, "global_step": 98190, "epoch": 2337} {"train_loss": -6.185013294219971, "global_step": 98191, "epoch": 2337} {"train_loss": -6.306944847106934, "global_step": 98192, "epoch": 2337} {"train_loss": -6.280932426452637, "global_step": 98193, "epoch": 2337} {"train_loss": -6.331057548522949, "global_step": 98194, "epoch": 2337} {"train_loss": -6.321736937477475, "global_step": 98195, "epoch": 2337, "val_loss": 67928.6484375} {"train_loss": -6.351363182067871, "global_step": 98196, "epoch": 2338} {"train_loss": -6.451745986938477, "global_step": 98197, "epoch": 2338} {"train_loss": -6.357064247131348, "global_step": 98198, "epoch": 2338} {"train_loss": -6.212090969085693, "global_step": 98199, "epoch": 2338} {"train_loss": -6.449400901794434, "global_step": 98200, "epoch": 2338} {"train_loss": -6.307187080383301, "global_step": 98201, "epoch": 2338} {"train_loss": -6.4380269050598145, "global_step": 98202, "epoch": 2338} {"train_loss": -6.39921236038208, "global_step": 98203, "epoch": 2338} {"train_loss": -6.450263977050781, "global_step": 98204, "epoch": 2338} {"train_loss": -6.353201866149902, "global_step": 98205, "epoch": 2338} {"train_loss": -6.445671081542969, "global_step": 98206, "epoch": 2338} {"train_loss": -6.236450672149658, "global_step": 98207, "epoch": 2338} {"train_loss": -6.321081638336182, "global_step": 98208, "epoch": 2338} {"train_loss": -6.386548042297363, "global_step": 98209, "epoch": 2338} {"train_loss": -6.245584964752197, "global_step": 98210, "epoch": 2338} {"train_loss": -6.226964473724365, "global_step": 98211, "epoch": 2338} {"train_loss": -6.2626800537109375, "global_step": 98212, "epoch": 2338} {"train_loss": -6.474140167236328, "global_step": 98213, "epoch": 2338} {"train_loss": -6.157463073730469, "global_step": 98214, "epoch": 2338} {"train_loss": -6.2460527420043945, "global_step": 98215, "epoch": 2338} {"train_loss": -6.230019569396973, "global_step": 98216, "epoch": 2338} {"train_loss": -6.258331298828125, "global_step": 98217, "epoch": 2338} {"train_loss": -6.309025764465332, "global_step": 98218, "epoch": 2338} {"train_loss": -6.308816432952881, "global_step": 98219, "epoch": 2338} {"train_loss": -6.274131774902344, "global_step": 98220, "epoch": 2338} {"train_loss": -6.225985527038574, "global_step": 98221, "epoch": 2338} {"train_loss": -6.286219596862793, "global_step": 98222, "epoch": 2338} {"train_loss": -6.352441787719727, "global_step": 98223, "epoch": 2338} {"train_loss": -6.256423473358154, "global_step": 98224, "epoch": 2338} {"train_loss": -6.371844291687012, "global_step": 98225, "epoch": 2338} {"train_loss": -6.2569780349731445, "global_step": 98226, "epoch": 2338} {"train_loss": -6.344123840332031, "global_step": 98227, "epoch": 2338} {"train_loss": -6.371687889099121, "global_step": 98228, "epoch": 2338} {"train_loss": -6.402163028717041, "global_step": 98229, "epoch": 2338} {"train_loss": -6.180220603942871, "global_step": 98230, "epoch": 2338} {"train_loss": -6.309391975402832, "global_step": 98231, "epoch": 2338} {"train_loss": -6.248077869415283, "global_step": 98232, "epoch": 2338} {"train_loss": -6.254278182983398, "global_step": 98233, "epoch": 2338} {"train_loss": -6.235846996307373, "global_step": 98234, "epoch": 2338} {"train_loss": -6.22934627532959, "global_step": 98235, "epoch": 2338} {"train_loss": -6.474477767944336, "global_step": 98236, "epoch": 2338} {"train_loss": -6.318670125234695, "global_step": 98237, "epoch": 2338, "val_loss": 67903.1875} {"train_loss": -6.321904182434082, "global_step": 98238, "epoch": 2339} {"train_loss": -6.349174976348877, "global_step": 98239, "epoch": 2339} {"train_loss": -6.312162399291992, "global_step": 98240, "epoch": 2339} {"train_loss": -6.227536201477051, "global_step": 98241, "epoch": 2339} {"train_loss": -6.3502044677734375, "global_step": 98242, "epoch": 2339} {"train_loss": -6.363943099975586, "global_step": 98243, "epoch": 2339} {"train_loss": -6.349509239196777, "global_step": 98244, "epoch": 2339} {"train_loss": -6.374892234802246, "global_step": 98245, "epoch": 2339} {"train_loss": -6.308286666870117, "global_step": 98246, "epoch": 2339} {"train_loss": -6.26841402053833, "global_step": 98247, "epoch": 2339} {"train_loss": -6.3823747634887695, "global_step": 98248, "epoch": 2339} {"train_loss": -6.269509315490723, "global_step": 98249, "epoch": 2339} {"train_loss": -6.227916717529297, "global_step": 98250, "epoch": 2339} {"train_loss": -6.407975673675537, "global_step": 98251, "epoch": 2339} {"train_loss": -6.269883632659912, "global_step": 98252, "epoch": 2339} {"train_loss": -6.351729393005371, "global_step": 98253, "epoch": 2339} {"train_loss": -6.355391502380371, "global_step": 98254, "epoch": 2339} {"train_loss": -6.263664722442627, "global_step": 98255, "epoch": 2339} {"train_loss": -6.356432914733887, "global_step": 98256, "epoch": 2339} {"train_loss": -6.392767429351807, "global_step": 98257, "epoch": 2339} {"train_loss": -6.303877830505371, "global_step": 98258, "epoch": 2339} {"train_loss": -6.3306498527526855, "global_step": 98259, "epoch": 2339} {"train_loss": -6.407841682434082, "global_step": 98260, "epoch": 2339} {"train_loss": -6.409798622131348, "global_step": 98261, "epoch": 2339} {"train_loss": -6.380536079406738, "global_step": 98262, "epoch": 2339} {"train_loss": -6.30458927154541, "global_step": 98263, "epoch": 2339} {"train_loss": -6.291844367980957, "global_step": 98264, "epoch": 2339} {"train_loss": -6.286243438720703, "global_step": 98265, "epoch": 2339} {"train_loss": -6.362240791320801, "global_step": 98266, "epoch": 2339} {"train_loss": -6.196540832519531, "global_step": 98267, "epoch": 2339} {"train_loss": -6.359341144561768, "global_step": 98268, "epoch": 2339} {"train_loss": -6.200122833251953, "global_step": 98269, "epoch": 2339} {"train_loss": -6.22672176361084, "global_step": 98270, "epoch": 2339} {"train_loss": -6.19651985168457, "global_step": 98271, "epoch": 2339} {"train_loss": -6.316839218139648, "global_step": 98272, "epoch": 2339} {"train_loss": -6.242719650268555, "global_step": 98273, "epoch": 2339} {"train_loss": -6.250123023986816, "global_step": 98274, "epoch": 2339} {"train_loss": -6.094319820404053, "global_step": 98275, "epoch": 2339} {"train_loss": -6.279389381408691, "global_step": 98276, "epoch": 2339} {"train_loss": -6.264454364776611, "global_step": 98277, "epoch": 2339} {"train_loss": -6.318418979644775, "global_step": 98278, "epoch": 2339} {"train_loss": -6.304658038275583, "global_step": 98279, "epoch": 2339, "val_loss": 67851.8515625} {"train_loss": -6.128386974334717, "global_step": 98280, "epoch": 2340} {"train_loss": -6.327043533325195, "global_step": 98281, "epoch": 2340} {"train_loss": -6.227555274963379, "global_step": 98282, "epoch": 2340} {"train_loss": -6.322646141052246, "global_step": 98283, "epoch": 2340} {"train_loss": -6.260279178619385, "global_step": 98284, "epoch": 2340} {"train_loss": -6.350866794586182, "global_step": 98285, "epoch": 2340} {"train_loss": -6.316509246826172, "global_step": 98286, "epoch": 2340} {"train_loss": -6.271980285644531, "global_step": 98287, "epoch": 2340} {"train_loss": -6.367314338684082, "global_step": 98288, "epoch": 2340} {"train_loss": -6.372616767883301, "global_step": 98289, "epoch": 2340} {"train_loss": -6.310407638549805, "global_step": 98290, "epoch": 2340} {"train_loss": -6.41627836227417, "global_step": 98291, "epoch": 2340} {"train_loss": -6.415355682373047, "global_step": 98292, "epoch": 2340} {"train_loss": -6.307391166687012, "global_step": 98293, "epoch": 2340} {"train_loss": -6.351523399353027, "global_step": 98294, "epoch": 2340} {"train_loss": -6.393764972686768, "global_step": 98295, "epoch": 2340} {"train_loss": -6.335376739501953, "global_step": 98296, "epoch": 2340} {"train_loss": -6.376100063323975, "global_step": 98297, "epoch": 2340} {"train_loss": -6.29703950881958, "global_step": 98298, "epoch": 2340} {"train_loss": -6.35305118560791, "global_step": 98299, "epoch": 2340} {"train_loss": -6.362128257751465, "global_step": 98300, "epoch": 2340} {"train_loss": -6.3296098709106445, "global_step": 98301, "epoch": 2340} {"train_loss": -6.239041328430176, "global_step": 98302, "epoch": 2340} {"train_loss": -6.2851338386535645, "global_step": 98303, "epoch": 2340} {"train_loss": -6.392874717712402, "global_step": 98304, "epoch": 2340} {"train_loss": -6.283875465393066, "global_step": 98305, "epoch": 2340} {"train_loss": -6.4042205810546875, "global_step": 98306, "epoch": 2340} {"train_loss": -6.435090065002441, "global_step": 98307, "epoch": 2340} {"train_loss": -6.483604431152344, "global_step": 98308, "epoch": 2340} {"train_loss": -6.321376323699951, "global_step": 98309, "epoch": 2340} {"train_loss": -6.289913177490234, "global_step": 98310, "epoch": 2340} {"train_loss": -6.224795341491699, "global_step": 98311, "epoch": 2340} {"train_loss": -6.395872116088867, "global_step": 98312, "epoch": 2340} {"train_loss": -6.333909511566162, "global_step": 98313, "epoch": 2340} {"train_loss": -6.184654235839844, "global_step": 98314, "epoch": 2340} {"train_loss": -6.410641670227051, "global_step": 98315, "epoch": 2340} {"train_loss": -6.2602739334106445, "global_step": 98316, "epoch": 2340} {"train_loss": -6.28102445602417, "global_step": 98317, "epoch": 2340} {"train_loss": -6.260956764221191, "global_step": 98318, "epoch": 2340} {"train_loss": -6.441958427429199, "global_step": 98319, "epoch": 2340} {"train_loss": -6.217559814453125, "global_step": 98320, "epoch": 2340} {"train_loss": -6.323298249925886, "global_step": 98321, "epoch": 2340, "val_loss": 67911.4140625} {"train_loss": -6.322332382202148, "global_step": 98322, "epoch": 2341} {"train_loss": -6.285144329071045, "global_step": 98323, "epoch": 2341} {"train_loss": -6.359923362731934, "global_step": 98324, "epoch": 2341} {"train_loss": -6.3745527267456055, "global_step": 98325, "epoch": 2341} {"train_loss": -6.36043643951416, "global_step": 98326, "epoch": 2341} {"train_loss": -6.41596794128418, "global_step": 98327, "epoch": 2341} {"train_loss": -6.382898330688477, "global_step": 98328, "epoch": 2341} {"train_loss": -6.3272199630737305, "global_step": 98329, "epoch": 2341} {"train_loss": -6.394333362579346, "global_step": 98330, "epoch": 2341} {"train_loss": -6.35008430480957, "global_step": 98331, "epoch": 2341} {"train_loss": -6.3916096687316895, "global_step": 98332, "epoch": 2341} {"train_loss": -6.421525955200195, "global_step": 98333, "epoch": 2341} {"train_loss": -6.2776994705200195, "global_step": 98334, "epoch": 2341} {"train_loss": -6.415834426879883, "global_step": 98335, "epoch": 2341} {"train_loss": -6.419144630432129, "global_step": 98336, "epoch": 2341} {"train_loss": -6.417017936706543, "global_step": 98337, "epoch": 2341} {"train_loss": -6.321996688842773, "global_step": 98338, "epoch": 2341} {"train_loss": -6.295336723327637, "global_step": 98339, "epoch": 2341} {"train_loss": -6.295868873596191, "global_step": 98340, "epoch": 2341} {"train_loss": -6.294279098510742, "global_step": 98341, "epoch": 2341} {"train_loss": -6.357105255126953, "global_step": 98342, "epoch": 2341} {"train_loss": -6.348106384277344, "global_step": 98343, "epoch": 2341} {"train_loss": -6.178372859954834, "global_step": 98344, "epoch": 2341} {"train_loss": -6.391200065612793, "global_step": 98345, "epoch": 2341} {"train_loss": -6.3513689041137695, "global_step": 98346, "epoch": 2341} {"train_loss": -6.464110374450684, "global_step": 98347, "epoch": 2341} {"train_loss": -6.326396942138672, "global_step": 98348, "epoch": 2341} {"train_loss": -6.204531669616699, "global_step": 98349, "epoch": 2341} {"train_loss": -6.2586212158203125, "global_step": 98350, "epoch": 2341} {"train_loss": -6.312458515167236, "global_step": 98351, "epoch": 2341} {"train_loss": -6.322357177734375, "global_step": 98352, "epoch": 2341} {"train_loss": -6.260099411010742, "global_step": 98353, "epoch": 2341} {"train_loss": -6.323529243469238, "global_step": 98354, "epoch": 2341} {"train_loss": -6.286076545715332, "global_step": 98355, "epoch": 2341} {"train_loss": -6.221889495849609, "global_step": 98356, "epoch": 2341} {"train_loss": -6.3499603271484375, "global_step": 98357, "epoch": 2341} {"train_loss": -6.386109352111816, "global_step": 98358, "epoch": 2341} {"train_loss": -6.307661056518555, "global_step": 98359, "epoch": 2341} {"train_loss": -6.307939052581787, "global_step": 98360, "epoch": 2341} {"train_loss": -6.356270790100098, "global_step": 98361, "epoch": 2341} {"train_loss": -6.373864650726318, "global_step": 98362, "epoch": 2341} {"train_loss": -6.337365774881272, "global_step": 98363, "epoch": 2341, "val_loss": 67965.125} {"train_loss": -6.279693603515625, "global_step": 98364, "epoch": 2342} {"train_loss": -6.438356876373291, "global_step": 98365, "epoch": 2342} {"train_loss": -6.344825267791748, "global_step": 98366, "epoch": 2342} {"train_loss": -6.3670268058776855, "global_step": 98367, "epoch": 2342} {"train_loss": -6.42576265335083, "global_step": 98368, "epoch": 2342} {"train_loss": -6.297379970550537, "global_step": 98369, "epoch": 2342} {"train_loss": -6.246603012084961, "global_step": 98370, "epoch": 2342} {"train_loss": -6.396523475646973, "global_step": 98371, "epoch": 2342} {"train_loss": -6.37061882019043, "global_step": 98372, "epoch": 2342} {"train_loss": -6.343245506286621, "global_step": 98373, "epoch": 2342} {"train_loss": -6.334391117095947, "global_step": 98374, "epoch": 2342} {"train_loss": -6.396447658538818, "global_step": 98375, "epoch": 2342} {"train_loss": -6.268735885620117, "global_step": 98376, "epoch": 2342} {"train_loss": -6.417147636413574, "global_step": 98377, "epoch": 2342} {"train_loss": -6.352194786071777, "global_step": 98378, "epoch": 2342} {"train_loss": -6.306082725524902, "global_step": 98379, "epoch": 2342} {"train_loss": -6.287409782409668, "global_step": 98380, "epoch": 2342} {"train_loss": -6.271296501159668, "global_step": 98381, "epoch": 2342} {"train_loss": -6.354587554931641, "global_step": 98382, "epoch": 2342} {"train_loss": -6.399657249450684, "global_step": 98383, "epoch": 2342} {"train_loss": -6.146088600158691, "global_step": 98384, "epoch": 2342} {"train_loss": -6.401263236999512, "global_step": 98385, "epoch": 2342} {"train_loss": -6.392148017883301, "global_step": 98386, "epoch": 2342} {"train_loss": -6.270421981811523, "global_step": 98387, "epoch": 2342} {"train_loss": -6.259537696838379, "global_step": 98388, "epoch": 2342} {"train_loss": -6.296369552612305, "global_step": 98389, "epoch": 2342} {"train_loss": -6.178135871887207, "global_step": 98390, "epoch": 2342} {"train_loss": -6.394579887390137, "global_step": 98391, "epoch": 2342} {"train_loss": -6.370795249938965, "global_step": 98392, "epoch": 2342} {"train_loss": -6.2968268394470215, "global_step": 98393, "epoch": 2342} {"train_loss": -6.286899089813232, "global_step": 98394, "epoch": 2342} {"train_loss": -6.252652168273926, "global_step": 98395, "epoch": 2342} {"train_loss": -6.392449378967285, "global_step": 98396, "epoch": 2342} {"train_loss": -6.358165740966797, "global_step": 98397, "epoch": 2342} {"train_loss": -6.423405647277832, "global_step": 98398, "epoch": 2342} {"train_loss": -6.393125057220459, "global_step": 98399, "epoch": 2342} {"train_loss": -6.336690902709961, "global_step": 98400, "epoch": 2342} {"train_loss": -6.319788932800293, "global_step": 98401, "epoch": 2342} {"train_loss": -6.289009094238281, "global_step": 98402, "epoch": 2342} {"train_loss": -6.279288291931152, "global_step": 98403, "epoch": 2342} {"train_loss": -6.301625728607178, "global_step": 98404, "epoch": 2342} {"train_loss": -6.3277002175649, "global_step": 98405, "epoch": 2342, "val_loss": 67930.6015625} {"train_loss": -6.320260047912598, "global_step": 98406, "epoch": 2343} {"train_loss": -6.308210849761963, "global_step": 98407, "epoch": 2343} {"train_loss": -6.306671142578125, "global_step": 98408, "epoch": 2343} {"train_loss": -6.352921009063721, "global_step": 98409, "epoch": 2343} {"train_loss": -6.35658597946167, "global_step": 98410, "epoch": 2343} {"train_loss": -6.428096771240234, "global_step": 98411, "epoch": 2343} {"train_loss": -6.300193786621094, "global_step": 98412, "epoch": 2343} {"train_loss": -6.194313049316406, "global_step": 98413, "epoch": 2343} {"train_loss": -6.401580333709717, "global_step": 98414, "epoch": 2343} {"train_loss": -6.314056396484375, "global_step": 98415, "epoch": 2343} {"train_loss": -6.3734049797058105, "global_step": 98416, "epoch": 2343} {"train_loss": -6.287621021270752, "global_step": 98417, "epoch": 2343} {"train_loss": -6.10639762878418, "global_step": 98418, "epoch": 2343} {"train_loss": -6.277035713195801, "global_step": 98419, "epoch": 2343} {"train_loss": -6.355328559875488, "global_step": 98420, "epoch": 2343} {"train_loss": -6.1996259689331055, "global_step": 98421, "epoch": 2343} {"train_loss": -6.161380290985107, "global_step": 98422, "epoch": 2343} {"train_loss": -6.2982635498046875, "global_step": 98423, "epoch": 2343} {"train_loss": -6.12080717086792, "global_step": 98424, "epoch": 2343} {"train_loss": -6.243818283081055, "global_step": 98425, "epoch": 2343} {"train_loss": -6.279614448547363, "global_step": 98426, "epoch": 2343} {"train_loss": -6.1323089599609375, "global_step": 98427, "epoch": 2343} {"train_loss": -6.325242519378662, "global_step": 98428, "epoch": 2343} {"train_loss": -6.206186771392822, "global_step": 98429, "epoch": 2343} {"train_loss": -6.177568435668945, "global_step": 98430, "epoch": 2343} {"train_loss": -6.328095436096191, "global_step": 98431, "epoch": 2343} {"train_loss": -6.2752814292907715, "global_step": 98432, "epoch": 2343} {"train_loss": -6.263389587402344, "global_step": 98433, "epoch": 2343} {"train_loss": -6.282863616943359, "global_step": 98434, "epoch": 2343} {"train_loss": -6.310596466064453, "global_step": 98435, "epoch": 2343} {"train_loss": -6.348350524902344, "global_step": 98436, "epoch": 2343} {"train_loss": -6.308763027191162, "global_step": 98437, "epoch": 2343} {"train_loss": -6.185640811920166, "global_step": 98438, "epoch": 2343} {"train_loss": -6.261289596557617, "global_step": 98439, "epoch": 2343} {"train_loss": -6.258325099945068, "global_step": 98440, "epoch": 2343} {"train_loss": -6.40419340133667, "global_step": 98441, "epoch": 2343} {"train_loss": -6.276612281799316, "global_step": 98442, "epoch": 2343} {"train_loss": -6.244223594665527, "global_step": 98443, "epoch": 2343} {"train_loss": -6.1965436935424805, "global_step": 98444, "epoch": 2343} {"train_loss": -6.230258941650391, "global_step": 98445, "epoch": 2343} {"train_loss": -6.28573751449585, "global_step": 98446, "epoch": 2343} {"train_loss": -6.273738168534779, "global_step": 98447, "epoch": 2343, "val_loss": 67980.625} {"train_loss": -6.422142505645752, "global_step": 98448, "epoch": 2344} {"train_loss": -6.283637046813965, "global_step": 98449, "epoch": 2344} {"train_loss": -6.26132869720459, "global_step": 98450, "epoch": 2344} {"train_loss": -6.22271203994751, "global_step": 98451, "epoch": 2344} {"train_loss": -6.299434661865234, "global_step": 98452, "epoch": 2344} {"train_loss": -6.261876106262207, "global_step": 98453, "epoch": 2344} {"train_loss": -6.302157878875732, "global_step": 98454, "epoch": 2344} {"train_loss": -6.180500030517578, "global_step": 98455, "epoch": 2344} {"train_loss": -6.282576560974121, "global_step": 98456, "epoch": 2344} {"train_loss": -6.396204948425293, "global_step": 98457, "epoch": 2344} {"train_loss": -6.345572471618652, "global_step": 98458, "epoch": 2344} {"train_loss": -6.3058671951293945, "global_step": 98459, "epoch": 2344} {"train_loss": -6.397069931030273, "global_step": 98460, "epoch": 2344} {"train_loss": -6.311507701873779, "global_step": 98461, "epoch": 2344} {"train_loss": -6.31656551361084, "global_step": 98462, "epoch": 2344} {"train_loss": -6.422346115112305, "global_step": 98463, "epoch": 2344} {"train_loss": -6.364343643188477, "global_step": 98464, "epoch": 2344} {"train_loss": -6.364558219909668, "global_step": 98465, "epoch": 2344} {"train_loss": -6.327179908752441, "global_step": 98466, "epoch": 2344} {"train_loss": -6.389433860778809, "global_step": 98467, "epoch": 2344} {"train_loss": -6.401311874389648, "global_step": 98468, "epoch": 2344} {"train_loss": -6.295637130737305, "global_step": 98469, "epoch": 2344} {"train_loss": -6.188089370727539, "global_step": 98470, "epoch": 2344} {"train_loss": -6.3017578125, "global_step": 98471, "epoch": 2344} {"train_loss": -6.326520919799805, "global_step": 98472, "epoch": 2344} {"train_loss": -6.342043876647949, "global_step": 98473, "epoch": 2344} {"train_loss": -6.275172710418701, "global_step": 98474, "epoch": 2344} {"train_loss": -6.240021228790283, "global_step": 98475, "epoch": 2344} {"train_loss": -6.356506824493408, "global_step": 98476, "epoch": 2344} {"train_loss": -6.211404323577881, "global_step": 98477, "epoch": 2344} {"train_loss": -6.258543968200684, "global_step": 98478, "epoch": 2344} {"train_loss": -6.341639518737793, "global_step": 98479, "epoch": 2344} {"train_loss": -6.335912704467773, "global_step": 98480, "epoch": 2344} {"train_loss": -6.284320831298828, "global_step": 98481, "epoch": 2344} {"train_loss": -6.240475654602051, "global_step": 98482, "epoch": 2344} {"train_loss": -6.239289283752441, "global_step": 98483, "epoch": 2344} {"train_loss": -6.362932205200195, "global_step": 98484, "epoch": 2344} {"train_loss": -6.329520225524902, "global_step": 98485, "epoch": 2344} {"train_loss": -6.401732444763184, "global_step": 98486, "epoch": 2344} {"train_loss": -6.220945358276367, "global_step": 98487, "epoch": 2344} {"train_loss": -6.405576229095459, "global_step": 98488, "epoch": 2344} {"train_loss": -6.314986569540841, "global_step": 98489, "epoch": 2344, "val_loss": 67991.7890625} {"train_loss": -6.355165481567383, "global_step": 98490, "epoch": 2345} {"train_loss": -6.39040470123291, "global_step": 98491, "epoch": 2345} {"train_loss": -6.4772491455078125, "global_step": 98492, "epoch": 2345} {"train_loss": -6.462569236755371, "global_step": 98493, "epoch": 2345} {"train_loss": -6.43251895904541, "global_step": 98494, "epoch": 2345} {"train_loss": -6.285438537597656, "global_step": 98495, "epoch": 2345} {"train_loss": -6.327985763549805, "global_step": 98496, "epoch": 2345} {"train_loss": -6.299584865570068, "global_step": 98497, "epoch": 2345} {"train_loss": -6.36985969543457, "global_step": 98498, "epoch": 2345} {"train_loss": -6.3675947189331055, "global_step": 98499, "epoch": 2345} {"train_loss": -6.300972938537598, "global_step": 98500, "epoch": 2345} {"train_loss": -6.355679035186768, "global_step": 98501, "epoch": 2345} {"train_loss": -6.334962844848633, "global_step": 98502, "epoch": 2345} {"train_loss": -6.281623840332031, "global_step": 98503, "epoch": 2345} {"train_loss": -6.316835403442383, "global_step": 98504, "epoch": 2345} {"train_loss": -6.235260009765625, "global_step": 98505, "epoch": 2345} {"train_loss": -6.297972679138184, "global_step": 98506, "epoch": 2345} {"train_loss": -6.160550117492676, "global_step": 98507, "epoch": 2345} {"train_loss": -6.234942436218262, "global_step": 98508, "epoch": 2345} {"train_loss": -6.309152603149414, "global_step": 98509, "epoch": 2345} {"train_loss": -6.355092525482178, "global_step": 98510, "epoch": 2345} {"train_loss": -6.295626640319824, "global_step": 98511, "epoch": 2345} {"train_loss": -6.259117603302002, "global_step": 98512, "epoch": 2345} {"train_loss": -6.429200172424316, "global_step": 98513, "epoch": 2345} {"train_loss": -6.2631707191467285, "global_step": 98514, "epoch": 2345} {"train_loss": -6.290203094482422, "global_step": 98515, "epoch": 2345} {"train_loss": -6.293755531311035, "global_step": 98516, "epoch": 2345} {"train_loss": -6.358438968658447, "global_step": 98517, "epoch": 2345} {"train_loss": -6.366615295410156, "global_step": 98518, "epoch": 2345} {"train_loss": -6.312961578369141, "global_step": 98519, "epoch": 2345} {"train_loss": -6.36284065246582, "global_step": 98520, "epoch": 2345} {"train_loss": -6.437376022338867, "global_step": 98521, "epoch": 2345} {"train_loss": -6.387704849243164, "global_step": 98522, "epoch": 2345} {"train_loss": -6.265349864959717, "global_step": 98523, "epoch": 2345} {"train_loss": -6.295776844024658, "global_step": 98524, "epoch": 2345} {"train_loss": -6.390743255615234, "global_step": 98525, "epoch": 2345} {"train_loss": -6.323111534118652, "global_step": 98526, "epoch": 2345} {"train_loss": -6.208065509796143, "global_step": 98527, "epoch": 2345} {"train_loss": -6.355462074279785, "global_step": 98528, "epoch": 2345} {"train_loss": -6.235876560211182, "global_step": 98529, "epoch": 2345} {"train_loss": -6.412629127502441, "global_step": 98530, "epoch": 2345} {"train_loss": -6.3281661215282625, "global_step": 98531, "epoch": 2345, "val_loss": 67931.5546875} {"train_loss": -6.335962295532227, "global_step": 98532, "epoch": 2346} {"train_loss": -6.447751045227051, "global_step": 98533, "epoch": 2346} {"train_loss": -6.299237251281738, "global_step": 98534, "epoch": 2346} {"train_loss": -6.329375267028809, "global_step": 98535, "epoch": 2346} {"train_loss": -6.255490303039551, "global_step": 98536, "epoch": 2346} {"train_loss": -6.335940361022949, "global_step": 98537, "epoch": 2346} {"train_loss": -6.366573333740234, "global_step": 98538, "epoch": 2346} {"train_loss": -6.360886573791504, "global_step": 98539, "epoch": 2346} {"train_loss": -6.18814754486084, "global_step": 98540, "epoch": 2346} {"train_loss": -6.380178451538086, "global_step": 98541, "epoch": 2346} {"train_loss": -6.2708587646484375, "global_step": 98542, "epoch": 2346} {"train_loss": -6.263025283813477, "global_step": 98543, "epoch": 2346} {"train_loss": -6.467099189758301, "global_step": 98544, "epoch": 2346} {"train_loss": -6.294565677642822, "global_step": 98545, "epoch": 2346} {"train_loss": -6.408020973205566, "global_step": 98546, "epoch": 2346} {"train_loss": -6.392504692077637, "global_step": 98547, "epoch": 2346} {"train_loss": -6.295873641967773, "global_step": 98548, "epoch": 2346} {"train_loss": -6.223946571350098, "global_step": 98549, "epoch": 2346} {"train_loss": -6.272833824157715, "global_step": 98550, "epoch": 2346} {"train_loss": -6.361800193786621, "global_step": 98551, "epoch": 2346} {"train_loss": -6.332233428955078, "global_step": 98552, "epoch": 2346} {"train_loss": -6.263195991516113, "global_step": 98553, "epoch": 2346} {"train_loss": -6.404951095581055, "global_step": 98554, "epoch": 2346} {"train_loss": -6.376983642578125, "global_step": 98555, "epoch": 2346} {"train_loss": -6.338960647583008, "global_step": 98556, "epoch": 2346} {"train_loss": -6.174793720245361, "global_step": 98557, "epoch": 2346} {"train_loss": -6.338334083557129, "global_step": 98558, "epoch": 2346} {"train_loss": -6.426394939422607, "global_step": 98559, "epoch": 2346} {"train_loss": -6.464286804199219, "global_step": 98560, "epoch": 2346} {"train_loss": -6.330157279968262, "global_step": 98561, "epoch": 2346} {"train_loss": -6.386262893676758, "global_step": 98562, "epoch": 2346} {"train_loss": -6.387617111206055, "global_step": 98563, "epoch": 2346} {"train_loss": -6.32486629486084, "global_step": 98564, "epoch": 2346} {"train_loss": -6.195095539093018, "global_step": 98565, "epoch": 2346} {"train_loss": -6.279280662536621, "global_step": 98566, "epoch": 2346} {"train_loss": -6.272420883178711, "global_step": 98567, "epoch": 2346} {"train_loss": -6.22025728225708, "global_step": 98568, "epoch": 2346} {"train_loss": -6.2613115310668945, "global_step": 98569, "epoch": 2346} {"train_loss": -6.350487232208252, "global_step": 98570, "epoch": 2346} {"train_loss": -6.365317344665527, "global_step": 98571, "epoch": 2346} {"train_loss": -6.360372066497803, "global_step": 98572, "epoch": 2346} {"train_loss": -6.3276657944633845, "global_step": 98573, "epoch": 2346, "val_loss": 67810.3046875} {"train_loss": -6.288668632507324, "global_step": 98574, "epoch": 2347} {"train_loss": -6.383283615112305, "global_step": 98575, "epoch": 2347} {"train_loss": -6.361412525177002, "global_step": 98576, "epoch": 2347} {"train_loss": -6.312861442565918, "global_step": 98577, "epoch": 2347} {"train_loss": -6.376138687133789, "global_step": 98578, "epoch": 2347} {"train_loss": -6.311000823974609, "global_step": 98579, "epoch": 2347} {"train_loss": -6.440404891967773, "global_step": 98580, "epoch": 2347} {"train_loss": -6.332475185394287, "global_step": 98581, "epoch": 2347} {"train_loss": -6.332700729370117, "global_step": 98582, "epoch": 2347} {"train_loss": -6.31671142578125, "global_step": 98583, "epoch": 2347} {"train_loss": -6.408121109008789, "global_step": 98584, "epoch": 2347} {"train_loss": -6.317062854766846, "global_step": 98585, "epoch": 2347} {"train_loss": -6.2762837409973145, "global_step": 98586, "epoch": 2347} {"train_loss": -6.321469306945801, "global_step": 98587, "epoch": 2347} {"train_loss": -6.393972873687744, "global_step": 98588, "epoch": 2347} {"train_loss": -6.3855881690979, "global_step": 98589, "epoch": 2347} {"train_loss": -6.35572624206543, "global_step": 98590, "epoch": 2347} {"train_loss": -6.368264198303223, "global_step": 98591, "epoch": 2347} {"train_loss": -6.323510646820068, "global_step": 98592, "epoch": 2347} {"train_loss": -6.422342300415039, "global_step": 98593, "epoch": 2347} {"train_loss": -6.210340976715088, "global_step": 98594, "epoch": 2347} {"train_loss": -6.2736616134643555, "global_step": 98595, "epoch": 2347} {"train_loss": -6.403187274932861, "global_step": 98596, "epoch": 2347} {"train_loss": -6.29423189163208, "global_step": 98597, "epoch": 2347} {"train_loss": -6.423886775970459, "global_step": 98598, "epoch": 2347} {"train_loss": -6.377841949462891, "global_step": 98599, "epoch": 2347} {"train_loss": -6.335077285766602, "global_step": 98600, "epoch": 2347} {"train_loss": -6.349845886230469, "global_step": 98601, "epoch": 2347} {"train_loss": -6.290090560913086, "global_step": 98602, "epoch": 2347} {"train_loss": -6.272873878479004, "global_step": 98603, "epoch": 2347} {"train_loss": -6.325803756713867, "global_step": 98604, "epoch": 2347} {"train_loss": -6.3651533126831055, "global_step": 98605, "epoch": 2347} {"train_loss": -6.434814929962158, "global_step": 98606, "epoch": 2347} {"train_loss": -6.272604942321777, "global_step": 98607, "epoch": 2347} {"train_loss": -6.421429634094238, "global_step": 98608, "epoch": 2347} {"train_loss": -6.413758277893066, "global_step": 98609, "epoch": 2347} {"train_loss": -6.370399475097656, "global_step": 98610, "epoch": 2347} {"train_loss": -6.28224515914917, "global_step": 98611, "epoch": 2347} {"train_loss": -6.16986608505249, "global_step": 98612, "epoch": 2347} {"train_loss": -6.3559722900390625, "global_step": 98613, "epoch": 2347} {"train_loss": -6.29598331451416, "global_step": 98614, "epoch": 2347} {"train_loss": -6.3400007883707685, "global_step": 98615, "epoch": 2347, "val_loss": 68061.2890625} {"train_loss": -6.392043113708496, "global_step": 98616, "epoch": 2348} {"train_loss": -6.442266464233398, "global_step": 98617, "epoch": 2348} {"train_loss": -6.372969627380371, "global_step": 98618, "epoch": 2348} {"train_loss": -6.2961745262146, "global_step": 98619, "epoch": 2348} {"train_loss": -6.306641578674316, "global_step": 98620, "epoch": 2348} {"train_loss": -6.283483505249023, "global_step": 98621, "epoch": 2348} {"train_loss": -6.292040824890137, "global_step": 98622, "epoch": 2348} {"train_loss": -6.338945388793945, "global_step": 98623, "epoch": 2348} {"train_loss": -6.388352394104004, "global_step": 98624, "epoch": 2348} {"train_loss": -6.29693603515625, "global_step": 98625, "epoch": 2348} {"train_loss": -6.272456169128418, "global_step": 98626, "epoch": 2348} {"train_loss": -6.429168224334717, "global_step": 98627, "epoch": 2348} {"train_loss": -6.275311470031738, "global_step": 98628, "epoch": 2348} {"train_loss": -6.329644203186035, "global_step": 98629, "epoch": 2348} {"train_loss": -6.383824825286865, "global_step": 98630, "epoch": 2348} {"train_loss": -6.220333099365234, "global_step": 98631, "epoch": 2348} {"train_loss": -6.4389872550964355, "global_step": 98632, "epoch": 2348} {"train_loss": -6.165205478668213, "global_step": 98633, "epoch": 2348} {"train_loss": -6.302506446838379, "global_step": 98634, "epoch": 2348} {"train_loss": -6.352401256561279, "global_step": 98635, "epoch": 2348} {"train_loss": -6.23762321472168, "global_step": 98636, "epoch": 2348} {"train_loss": -6.367518901824951, "global_step": 98637, "epoch": 2348} {"train_loss": -6.2968363761901855, "global_step": 98638, "epoch": 2348} {"train_loss": -6.355401992797852, "global_step": 98639, "epoch": 2348} {"train_loss": -6.3068084716796875, "global_step": 98640, "epoch": 2348} {"train_loss": -6.151388168334961, "global_step": 98641, "epoch": 2348} {"train_loss": -6.338560581207275, "global_step": 98642, "epoch": 2348} {"train_loss": -6.332840919494629, "global_step": 98643, "epoch": 2348} {"train_loss": -6.370674133300781, "global_step": 98644, "epoch": 2348} {"train_loss": -6.298675537109375, "global_step": 98645, "epoch": 2348} {"train_loss": -6.417044639587402, "global_step": 98646, "epoch": 2348} {"train_loss": -6.333682060241699, "global_step": 98647, "epoch": 2348} {"train_loss": -6.310843467712402, "global_step": 98648, "epoch": 2348} {"train_loss": -6.424800872802734, "global_step": 98649, "epoch": 2348} {"train_loss": -6.426610469818115, "global_step": 98650, "epoch": 2348} {"train_loss": -6.330546855926514, "global_step": 98651, "epoch": 2348} {"train_loss": -6.407199859619141, "global_step": 98652, "epoch": 2348} {"train_loss": -6.401117324829102, "global_step": 98653, "epoch": 2348} {"train_loss": -6.281384468078613, "global_step": 98654, "epoch": 2348} {"train_loss": -6.37797737121582, "global_step": 98655, "epoch": 2348} {"train_loss": -6.460308074951172, "global_step": 98656, "epoch": 2348} {"train_loss": -6.3377688612256735, "global_step": 98657, "epoch": 2348, "val_loss": 67914.109375} {"train_loss": -6.257922172546387, "global_step": 98658, "epoch": 2349} {"train_loss": -6.410587310791016, "global_step": 98659, "epoch": 2349} {"train_loss": -6.369136333465576, "global_step": 98660, "epoch": 2349} {"train_loss": -6.322877883911133, "global_step": 98661, "epoch": 2349} {"train_loss": -6.249539375305176, "global_step": 98662, "epoch": 2349} {"train_loss": -6.271476745605469, "global_step": 98663, "epoch": 2349} {"train_loss": -6.265366077423096, "global_step": 98664, "epoch": 2349} {"train_loss": -6.35582160949707, "global_step": 98665, "epoch": 2349} {"train_loss": -6.367527484893799, "global_step": 98666, "epoch": 2349} {"train_loss": -6.364800453186035, "global_step": 98667, "epoch": 2349} {"train_loss": -6.375618934631348, "global_step": 98668, "epoch": 2349} {"train_loss": -6.353230953216553, "global_step": 98669, "epoch": 2349} {"train_loss": -6.396901607513428, "global_step": 98670, "epoch": 2349} {"train_loss": -6.298103332519531, "global_step": 98671, "epoch": 2349} {"train_loss": -6.365567207336426, "global_step": 98672, "epoch": 2349} {"train_loss": -6.3325700759887695, "global_step": 98673, "epoch": 2349} {"train_loss": -6.3264055252075195, "global_step": 98674, "epoch": 2349} {"train_loss": -6.3478899002075195, "global_step": 98675, "epoch": 2349} {"train_loss": -6.371715545654297, "global_step": 98676, "epoch": 2349} {"train_loss": -6.37998104095459, "global_step": 98677, "epoch": 2349} {"train_loss": -6.2319841384887695, "global_step": 98678, "epoch": 2349} {"train_loss": -6.403888702392578, "global_step": 98679, "epoch": 2349} {"train_loss": -6.416477203369141, "global_step": 98680, "epoch": 2349} {"train_loss": -6.379792213439941, "global_step": 98681, "epoch": 2349} {"train_loss": -6.319291114807129, "global_step": 98682, "epoch": 2349} {"train_loss": -6.26042366027832, "global_step": 98683, "epoch": 2349} {"train_loss": -6.301602363586426, "global_step": 98684, "epoch": 2349} {"train_loss": -6.308466911315918, "global_step": 98685, "epoch": 2349} {"train_loss": -6.371188163757324, "global_step": 98686, "epoch": 2349} {"train_loss": -6.345155715942383, "global_step": 98687, "epoch": 2349} {"train_loss": -6.343815803527832, "global_step": 98688, "epoch": 2349} {"train_loss": -6.31712007522583, "global_step": 98689, "epoch": 2349} {"train_loss": -6.462018013000488, "global_step": 98690, "epoch": 2349} {"train_loss": -6.4440412521362305, "global_step": 98691, "epoch": 2349} {"train_loss": -6.3756632804870605, "global_step": 98692, "epoch": 2349} {"train_loss": -6.338157653808594, "global_step": 98693, "epoch": 2349} {"train_loss": -6.354804992675781, "global_step": 98694, "epoch": 2349} {"train_loss": -6.35911226272583, "global_step": 98695, "epoch": 2349} {"train_loss": -6.275508880615234, "global_step": 98696, "epoch": 2349} {"train_loss": -6.25732946395874, "global_step": 98697, "epoch": 2349} {"train_loss": -6.339447975158691, "global_step": 98698, "epoch": 2349} {"train_loss": -6.338703269050235, "global_step": 98699, "epoch": 2349, "val_loss": 67966.3828125} {"train_loss": -6.308525085449219, "global_step": 98700, "epoch": 2350} {"train_loss": -6.1960601806640625, "global_step": 98701, "epoch": 2350} {"train_loss": -6.025287628173828, "global_step": 98702, "epoch": 2350} {"train_loss": -6.297138690948486, "global_step": 98703, "epoch": 2350} {"train_loss": -6.285277366638184, "global_step": 98704, "epoch": 2350} {"train_loss": -6.357278823852539, "global_step": 98705, "epoch": 2350} {"train_loss": -6.053231239318848, "global_step": 98706, "epoch": 2350} {"train_loss": -6.148237228393555, "global_step": 98707, "epoch": 2350} {"train_loss": -6.143819808959961, "global_step": 98708, "epoch": 2350} {"train_loss": -6.157381057739258, "global_step": 98709, "epoch": 2350} {"train_loss": -6.180302619934082, "global_step": 98710, "epoch": 2350} {"train_loss": -6.1038079261779785, "global_step": 98711, "epoch": 2350} {"train_loss": -6.331735134124756, "global_step": 98712, "epoch": 2350} {"train_loss": -6.303460121154785, "global_step": 98713, "epoch": 2350} {"train_loss": -6.144373893737793, "global_step": 98714, "epoch": 2350} {"train_loss": -6.1916303634643555, "global_step": 98715, "epoch": 2350} {"train_loss": -6.286555767059326, "global_step": 98716, "epoch": 2350} {"train_loss": -6.236598491668701, "global_step": 98717, "epoch": 2350} {"train_loss": -6.22932243347168, "global_step": 98718, "epoch": 2350} {"train_loss": -6.223415374755859, "global_step": 98719, "epoch": 2350} {"train_loss": -6.25335168838501, "global_step": 98720, "epoch": 2350} {"train_loss": -6.332486152648926, "global_step": 98721, "epoch": 2350} {"train_loss": -6.313928604125977, "global_step": 98722, "epoch": 2350} {"train_loss": -6.394500255584717, "global_step": 98723, "epoch": 2350} {"train_loss": -6.295855522155762, "global_step": 98724, "epoch": 2350} {"train_loss": -6.230257987976074, "global_step": 98725, "epoch": 2350} {"train_loss": -6.269357681274414, "global_step": 98726, "epoch": 2350} {"train_loss": -6.188848972320557, "global_step": 98727, "epoch": 2350} {"train_loss": -6.291618347167969, "global_step": 98728, "epoch": 2350} {"train_loss": -6.227838516235352, "global_step": 98729, "epoch": 2350} {"train_loss": -6.364512920379639, "global_step": 98730, "epoch": 2350} {"train_loss": -6.34877872467041, "global_step": 98731, "epoch": 2350} {"train_loss": -6.255433559417725, "global_step": 98732, "epoch": 2350} {"train_loss": -6.317499160766602, "global_step": 98733, "epoch": 2350} {"train_loss": -6.347005844116211, "global_step": 98734, "epoch": 2350} {"train_loss": -6.196220397949219, "global_step": 98735, "epoch": 2350} {"train_loss": -6.353426933288574, "global_step": 98736, "epoch": 2350} {"train_loss": -6.245448112487793, "global_step": 98737, "epoch": 2350} {"train_loss": -6.181475639343262, "global_step": 98738, "epoch": 2350} {"train_loss": -6.393815994262695, "global_step": 98739, "epoch": 2350} {"train_loss": -6.251203536987305, "global_step": 98740, "epoch": 2350} {"train_loss": -6.252710092635382, "global_step": 98741, "epoch": 2350, "train/sim_max_reward_0": 0.1916942951886523, "train/sim_max_reward_1": 0.9230341164647123, "train/sim_max_reward_2": 0.2946937380843425, "train/sim_max_reward_3": 0.14271231141429214, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9326919087188538, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.15611860639562836, "test/sim_max_reward_4400002": 0.8101585389671313, "test/sim_max_reward_4400003": 0.9170780009823339, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.6459032299107154, "test/sim_max_reward_4400007": 0.7876562718181482, "test/sim_max_reward_4400008": 0.2978573175296399, "test/sim_max_reward_4400009": 0.7701528754433499, "test/sim_max_reward_4400010": 0.22687933847481828, "test/sim_max_reward_4400011": 0.9313728683611244, "test/sim_max_reward_4400012": 0.8313506620534566, "test/sim_max_reward_4400013": 0.6690643057120801, "test/sim_max_reward_4400014": 0.8441325650810628, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.19171333810891625, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.07595490475983975, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8324275543664096, "test/sim_max_reward_4400023": 0.4842489282601627, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.22047127630025837, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 0.018582008038432348, "test/sim_max_reward_4400028": 0.8857752139914814, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9009151125301041, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8461863510931675, "test/sim_max_reward_4400034": 0.920209958524684, "test/sim_max_reward_4400035": 0.7130476644917603, "test/sim_max_reward_4400036": 0.5054464751308043, "test/sim_max_reward_4400037": 0.9770342023453146, "test/sim_max_reward_4400038": 0.9592909346187498, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9974582096065943, "test/sim_max_reward_4400042": 0.8531499039661878, "test/sim_max_reward_4400043": 0.9085670118050868, "test/sim_max_reward_4400044": 0.658879222255192, "test/sim_max_reward_4400045": 0.5407249875798891, "test/sim_max_reward_4400046": 0.8037878301106884, "test/sim_max_reward_4400047": 0.9608941462293034, "test/sim_max_reward_4400048": 0.7240427975284977, "test/sim_max_reward_4400049": 0.9253060896847477, "train/mean_score": 0.5808043949784755, "test/mean_score": 0.567267503585026, "val_loss": 67928.484375} {"train_loss": -6.327700614929199, "global_step": 98742, "epoch": 2351} {"train_loss": -6.241320610046387, "global_step": 98743, "epoch": 2351} {"train_loss": -6.254488945007324, "global_step": 98744, "epoch": 2351} {"train_loss": -6.2408037185668945, "global_step": 98745, "epoch": 2351} {"train_loss": -6.134957313537598, "global_step": 98746, "epoch": 2351} {"train_loss": -6.372700214385986, "global_step": 98747, "epoch": 2351} {"train_loss": -6.310675144195557, "global_step": 98748, "epoch": 2351} {"train_loss": -6.21474027633667, "global_step": 98749, "epoch": 2351} {"train_loss": -6.335273742675781, "global_step": 98750, "epoch": 2351} {"train_loss": -6.33233642578125, "global_step": 98751, "epoch": 2351} {"train_loss": -6.344572067260742, "global_step": 98752, "epoch": 2351} {"train_loss": -6.368413925170898, "global_step": 98753, "epoch": 2351} {"train_loss": -6.431083679199219, "global_step": 98754, "epoch": 2351} {"train_loss": -6.376274108886719, "global_step": 98755, "epoch": 2351} {"train_loss": -6.33709716796875, "global_step": 98756, "epoch": 2351} {"train_loss": -6.212378025054932, "global_step": 98757, "epoch": 2351} {"train_loss": -6.192777156829834, "global_step": 98758, "epoch": 2351} {"train_loss": -6.380321502685547, "global_step": 98759, "epoch": 2351} {"train_loss": -6.282111644744873, "global_step": 98760, "epoch": 2351} {"train_loss": -6.307459831237793, "global_step": 98761, "epoch": 2351} {"train_loss": -6.441280364990234, "global_step": 98762, "epoch": 2351} {"train_loss": -6.212640762329102, "global_step": 98763, "epoch": 2351} {"train_loss": -6.469558238983154, "global_step": 98764, "epoch": 2351} {"train_loss": -6.248310089111328, "global_step": 98765, "epoch": 2351} {"train_loss": -6.1480631828308105, "global_step": 98766, "epoch": 2351} {"train_loss": -6.32328462600708, "global_step": 98767, "epoch": 2351} {"train_loss": -6.3761773109436035, "global_step": 98768, "epoch": 2351} {"train_loss": -6.3252177238464355, "global_step": 98769, "epoch": 2351} {"train_loss": -6.392916679382324, "global_step": 98770, "epoch": 2351} {"train_loss": -6.3567609786987305, "global_step": 98771, "epoch": 2351} {"train_loss": -6.30202054977417, "global_step": 98772, "epoch": 2351} {"train_loss": -6.389404773712158, "global_step": 98773, "epoch": 2351} {"train_loss": -6.350549697875977, "global_step": 98774, "epoch": 2351} {"train_loss": -6.387711048126221, "global_step": 98775, "epoch": 2351} {"train_loss": -6.278097152709961, "global_step": 98776, "epoch": 2351} {"train_loss": -6.274672508239746, "global_step": 98777, "epoch": 2351} {"train_loss": -6.326694011688232, "global_step": 98778, "epoch": 2351} {"train_loss": -6.2783284187316895, "global_step": 98779, "epoch": 2351} {"train_loss": -6.257021903991699, "global_step": 98780, "epoch": 2351} {"train_loss": -6.315609931945801, "global_step": 98781, "epoch": 2351} {"train_loss": -6.34238338470459, "global_step": 98782, "epoch": 2351} {"train_loss": -6.307840846833729, "global_step": 98783, "epoch": 2351, "val_loss": 67999.0625} {"train_loss": -6.247173309326172, "global_step": 98784, "epoch": 2352} {"train_loss": -6.372955322265625, "global_step": 98785, "epoch": 2352} {"train_loss": -6.267366409301758, "global_step": 98786, "epoch": 2352} {"train_loss": -6.245096206665039, "global_step": 98787, "epoch": 2352} {"train_loss": -6.240236282348633, "global_step": 98788, "epoch": 2352} {"train_loss": -6.2585039138793945, "global_step": 98789, "epoch": 2352} {"train_loss": -6.153304100036621, "global_step": 98790, "epoch": 2352} {"train_loss": -6.234843730926514, "global_step": 98791, "epoch": 2352} {"train_loss": -6.203052520751953, "global_step": 98792, "epoch": 2352} {"train_loss": -6.248380661010742, "global_step": 98793, "epoch": 2352} {"train_loss": -6.327826023101807, "global_step": 98794, "epoch": 2352} {"train_loss": -6.209843158721924, "global_step": 98795, "epoch": 2352} {"train_loss": -6.158034324645996, "global_step": 98796, "epoch": 2352} {"train_loss": -6.371743202209473, "global_step": 98797, "epoch": 2352} {"train_loss": -6.322222709655762, "global_step": 98798, "epoch": 2352} {"train_loss": -6.152756690979004, "global_step": 98799, "epoch": 2352} {"train_loss": -6.17482852935791, "global_step": 98800, "epoch": 2352} {"train_loss": -6.267189979553223, "global_step": 98801, "epoch": 2352} {"train_loss": -6.24883508682251, "global_step": 98802, "epoch": 2352} {"train_loss": -6.210221290588379, "global_step": 98803, "epoch": 2352} {"train_loss": -6.278419494628906, "global_step": 98804, "epoch": 2352} {"train_loss": -6.191980361938477, "global_step": 98805, "epoch": 2352} {"train_loss": -6.294632911682129, "global_step": 98806, "epoch": 2352} {"train_loss": -6.279916763305664, "global_step": 98807, "epoch": 2352} {"train_loss": -6.222491264343262, "global_step": 98808, "epoch": 2352} {"train_loss": -6.3053812980651855, "global_step": 98809, "epoch": 2352} {"train_loss": -6.402176856994629, "global_step": 98810, "epoch": 2352} {"train_loss": -6.323102951049805, "global_step": 98811, "epoch": 2352} {"train_loss": -6.288938522338867, "global_step": 98812, "epoch": 2352} {"train_loss": -6.25537109375, "global_step": 98813, "epoch": 2352} {"train_loss": -6.340182781219482, "global_step": 98814, "epoch": 2352} {"train_loss": -6.314228057861328, "global_step": 98815, "epoch": 2352} {"train_loss": -6.216327667236328, "global_step": 98816, "epoch": 2352} {"train_loss": -6.274180889129639, "global_step": 98817, "epoch": 2352} {"train_loss": -6.238750457763672, "global_step": 98818, "epoch": 2352} {"train_loss": -6.3707594871521, "global_step": 98819, "epoch": 2352} {"train_loss": -6.42342472076416, "global_step": 98820, "epoch": 2352} {"train_loss": -6.346400260925293, "global_step": 98821, "epoch": 2352} {"train_loss": -6.308423042297363, "global_step": 98822, "epoch": 2352} {"train_loss": -6.316223621368408, "global_step": 98823, "epoch": 2352} {"train_loss": -6.351433753967285, "global_step": 98824, "epoch": 2352} {"train_loss": -6.274579547700428, "global_step": 98825, "epoch": 2352, "val_loss": 67964.734375} {"train_loss": -6.224041938781738, "global_step": 98826, "epoch": 2353} {"train_loss": -6.294172286987305, "global_step": 98827, "epoch": 2353} {"train_loss": -6.171513080596924, "global_step": 98828, "epoch": 2353} {"train_loss": -6.341291904449463, "global_step": 98829, "epoch": 2353} {"train_loss": -6.255919456481934, "global_step": 98830, "epoch": 2353} {"train_loss": -6.37446403503418, "global_step": 98831, "epoch": 2353} {"train_loss": -6.317103385925293, "global_step": 98832, "epoch": 2353} {"train_loss": -6.180039405822754, "global_step": 98833, "epoch": 2353} {"train_loss": -6.3708672523498535, "global_step": 98834, "epoch": 2353} {"train_loss": -6.363473892211914, "global_step": 98835, "epoch": 2353} {"train_loss": -6.359602928161621, "global_step": 98836, "epoch": 2353} {"train_loss": -6.39363431930542, "global_step": 98837, "epoch": 2353} {"train_loss": -6.223665714263916, "global_step": 98838, "epoch": 2353} {"train_loss": -6.368356227874756, "global_step": 98839, "epoch": 2353} {"train_loss": -6.438692569732666, "global_step": 98840, "epoch": 2353} {"train_loss": -6.165896892547607, "global_step": 98841, "epoch": 2353} {"train_loss": -6.3436279296875, "global_step": 98842, "epoch": 2353} {"train_loss": -6.323448181152344, "global_step": 98843, "epoch": 2353} {"train_loss": -6.254295825958252, "global_step": 98844, "epoch": 2353} {"train_loss": -6.311156272888184, "global_step": 98845, "epoch": 2353} {"train_loss": -6.2755022048950195, "global_step": 98846, "epoch": 2353} {"train_loss": -6.2697906494140625, "global_step": 98847, "epoch": 2353} {"train_loss": -6.257152557373047, "global_step": 98848, "epoch": 2353} {"train_loss": -6.254939079284668, "global_step": 98849, "epoch": 2353} {"train_loss": -6.3775858879089355, "global_step": 98850, "epoch": 2353} {"train_loss": -6.319832801818848, "global_step": 98851, "epoch": 2353} {"train_loss": -6.353456020355225, "global_step": 98852, "epoch": 2353} {"train_loss": -6.380084991455078, "global_step": 98853, "epoch": 2353} {"train_loss": -6.193583011627197, "global_step": 98854, "epoch": 2353} {"train_loss": -6.321279525756836, "global_step": 98855, "epoch": 2353} {"train_loss": -6.279685974121094, "global_step": 98856, "epoch": 2353} {"train_loss": -6.163972854614258, "global_step": 98857, "epoch": 2353} {"train_loss": -6.310359954833984, "global_step": 98858, "epoch": 2353} {"train_loss": -6.228697776794434, "global_step": 98859, "epoch": 2353} {"train_loss": -6.366451263427734, "global_step": 98860, "epoch": 2353} {"train_loss": -6.415866851806641, "global_step": 98861, "epoch": 2353} {"train_loss": -6.195131301879883, "global_step": 98862, "epoch": 2353} {"train_loss": -6.307207107543945, "global_step": 98863, "epoch": 2353} {"train_loss": -6.387439250946045, "global_step": 98864, "epoch": 2353} {"train_loss": -6.427700042724609, "global_step": 98865, "epoch": 2353} {"train_loss": -6.3658127784729, "global_step": 98866, "epoch": 2353} {"train_loss": -6.308401823043823, "global_step": 98867, "epoch": 2353, "val_loss": 68007.96875} {"train_loss": -6.150250434875488, "global_step": 98868, "epoch": 2354} {"train_loss": -6.274375915527344, "global_step": 98869, "epoch": 2354} {"train_loss": -6.183895587921143, "global_step": 98870, "epoch": 2354} {"train_loss": -6.416804790496826, "global_step": 98871, "epoch": 2354} {"train_loss": -6.222931385040283, "global_step": 98872, "epoch": 2354} {"train_loss": -6.354501724243164, "global_step": 98873, "epoch": 2354} {"train_loss": -6.270658016204834, "global_step": 98874, "epoch": 2354} {"train_loss": -6.320871353149414, "global_step": 98875, "epoch": 2354} {"train_loss": -6.332364082336426, "global_step": 98876, "epoch": 2354} {"train_loss": -6.347325801849365, "global_step": 98877, "epoch": 2354} {"train_loss": -6.402029514312744, "global_step": 98878, "epoch": 2354} {"train_loss": -6.377693176269531, "global_step": 98879, "epoch": 2354} {"train_loss": -6.280767917633057, "global_step": 98880, "epoch": 2354} {"train_loss": -6.254476070404053, "global_step": 98881, "epoch": 2354} {"train_loss": -6.294605255126953, "global_step": 98882, "epoch": 2354} {"train_loss": -6.380825042724609, "global_step": 98883, "epoch": 2354} {"train_loss": -6.3267340660095215, "global_step": 98884, "epoch": 2354} {"train_loss": -6.400996208190918, "global_step": 98885, "epoch": 2354} {"train_loss": -6.359748840332031, "global_step": 98886, "epoch": 2354} {"train_loss": -6.362915992736816, "global_step": 98887, "epoch": 2354} {"train_loss": -6.317979335784912, "global_step": 98888, "epoch": 2354} {"train_loss": -6.24782657623291, "global_step": 98889, "epoch": 2354} {"train_loss": -6.2719621658325195, "global_step": 98890, "epoch": 2354} {"train_loss": -6.2693562507629395, "global_step": 98891, "epoch": 2354} {"train_loss": -6.25074577331543, "global_step": 98892, "epoch": 2354} {"train_loss": -6.340526103973389, "global_step": 98893, "epoch": 2354} {"train_loss": -6.36030387878418, "global_step": 98894, "epoch": 2354} {"train_loss": -6.41928243637085, "global_step": 98895, "epoch": 2354} {"train_loss": -6.406152248382568, "global_step": 98896, "epoch": 2354} {"train_loss": -6.413674354553223, "global_step": 98897, "epoch": 2354} {"train_loss": -6.30488395690918, "global_step": 98898, "epoch": 2354} {"train_loss": -6.358267784118652, "global_step": 98899, "epoch": 2354} {"train_loss": -6.364063262939453, "global_step": 98900, "epoch": 2354} {"train_loss": -6.23087215423584, "global_step": 98901, "epoch": 2354} {"train_loss": -6.317593097686768, "global_step": 98902, "epoch": 2354} {"train_loss": -6.4510955810546875, "global_step": 98903, "epoch": 2354} {"train_loss": -6.263408660888672, "global_step": 98904, "epoch": 2354} {"train_loss": -6.253433704376221, "global_step": 98905, "epoch": 2354} {"train_loss": -6.272664546966553, "global_step": 98906, "epoch": 2354} {"train_loss": -6.3668060302734375, "global_step": 98907, "epoch": 2354} {"train_loss": -6.452944755554199, "global_step": 98908, "epoch": 2354} {"train_loss": -6.32327877907526, "global_step": 98909, "epoch": 2354, "val_loss": 68017.21875} {"train_loss": -6.451287269592285, "global_step": 98910, "epoch": 2355} {"train_loss": -6.335360527038574, "global_step": 98911, "epoch": 2355} {"train_loss": -6.401369571685791, "global_step": 98912, "epoch": 2355} {"train_loss": -6.368350982666016, "global_step": 98913, "epoch": 2355} {"train_loss": -6.314315319061279, "global_step": 98914, "epoch": 2355} {"train_loss": -6.292119979858398, "global_step": 98915, "epoch": 2355} {"train_loss": -6.294553279876709, "global_step": 98916, "epoch": 2355} {"train_loss": -6.389536380767822, "global_step": 98917, "epoch": 2355} {"train_loss": -6.258022308349609, "global_step": 98918, "epoch": 2355} {"train_loss": -6.47930908203125, "global_step": 98919, "epoch": 2355} {"train_loss": -6.406162261962891, "global_step": 98920, "epoch": 2355} {"train_loss": -6.377312660217285, "global_step": 98921, "epoch": 2355} {"train_loss": -6.413308143615723, "global_step": 98922, "epoch": 2355} {"train_loss": -6.408524513244629, "global_step": 98923, "epoch": 2355} {"train_loss": -6.415729522705078, "global_step": 98924, "epoch": 2355} {"train_loss": -6.300992488861084, "global_step": 98925, "epoch": 2355} {"train_loss": -6.399443626403809, "global_step": 98926, "epoch": 2355} {"train_loss": -6.271417617797852, "global_step": 98927, "epoch": 2355} {"train_loss": -6.3267502784729, "global_step": 98928, "epoch": 2355} {"train_loss": -6.282417297363281, "global_step": 98929, "epoch": 2355} {"train_loss": -6.358920097351074, "global_step": 98930, "epoch": 2355} {"train_loss": -6.321163177490234, "global_step": 98931, "epoch": 2355} {"train_loss": -6.345310688018799, "global_step": 98932, "epoch": 2355} {"train_loss": -6.277840614318848, "global_step": 98933, "epoch": 2355} {"train_loss": -6.486720085144043, "global_step": 98934, "epoch": 2355} {"train_loss": -6.3391008377075195, "global_step": 98935, "epoch": 2355} {"train_loss": -6.394671440124512, "global_step": 98936, "epoch": 2355} {"train_loss": -6.1212921142578125, "global_step": 98937, "epoch": 2355} {"train_loss": -6.4164276123046875, "global_step": 98938, "epoch": 2355} {"train_loss": -6.354067802429199, "global_step": 98939, "epoch": 2355} {"train_loss": -6.268013000488281, "global_step": 98940, "epoch": 2355} {"train_loss": -6.365706443786621, "global_step": 98941, "epoch": 2355} {"train_loss": -6.3129119873046875, "global_step": 98942, "epoch": 2355} {"train_loss": -6.392644882202148, "global_step": 98943, "epoch": 2355} {"train_loss": -6.384746551513672, "global_step": 98944, "epoch": 2355} {"train_loss": -6.393451690673828, "global_step": 98945, "epoch": 2355} {"train_loss": -6.303868293762207, "global_step": 98946, "epoch": 2355} {"train_loss": -6.38702392578125, "global_step": 98947, "epoch": 2355} {"train_loss": -6.29448938369751, "global_step": 98948, "epoch": 2355} {"train_loss": -6.264463424682617, "global_step": 98949, "epoch": 2355} {"train_loss": -6.287300109863281, "global_step": 98950, "epoch": 2355} {"train_loss": -6.346973419189453, "global_step": 98951, "epoch": 2355, "val_loss": 67800.5390625} {"train_loss": -6.308423042297363, "global_step": 98952, "epoch": 2356} {"train_loss": -6.342904567718506, "global_step": 98953, "epoch": 2356} {"train_loss": -6.344052791595459, "global_step": 98954, "epoch": 2356} {"train_loss": -6.201354026794434, "global_step": 98955, "epoch": 2356} {"train_loss": -6.393242835998535, "global_step": 98956, "epoch": 2356} {"train_loss": -6.406365394592285, "global_step": 98957, "epoch": 2356} {"train_loss": -6.334256649017334, "global_step": 98958, "epoch": 2356} {"train_loss": -6.312351226806641, "global_step": 98959, "epoch": 2356} {"train_loss": -6.242889881134033, "global_step": 98960, "epoch": 2356} {"train_loss": -6.394057750701904, "global_step": 98961, "epoch": 2356} {"train_loss": -6.44379997253418, "global_step": 98962, "epoch": 2356} {"train_loss": -6.2808837890625, "global_step": 98963, "epoch": 2356} {"train_loss": -6.293422222137451, "global_step": 98964, "epoch": 2356} {"train_loss": -6.300759792327881, "global_step": 98965, "epoch": 2356} {"train_loss": -6.311589241027832, "global_step": 98966, "epoch": 2356} {"train_loss": -6.3939528465271, "global_step": 98967, "epoch": 2356} {"train_loss": -6.476780891418457, "global_step": 98968, "epoch": 2356} {"train_loss": -6.232095241546631, "global_step": 98969, "epoch": 2356} {"train_loss": -6.342167377471924, "global_step": 98970, "epoch": 2356} {"train_loss": -6.195314884185791, "global_step": 98971, "epoch": 2356} {"train_loss": -6.311331748962402, "global_step": 98972, "epoch": 2356} {"train_loss": -6.433810710906982, "global_step": 98973, "epoch": 2356} {"train_loss": -6.260373592376709, "global_step": 98974, "epoch": 2356} {"train_loss": -6.359752655029297, "global_step": 98975, "epoch": 2356} {"train_loss": -6.285860061645508, "global_step": 98976, "epoch": 2356} {"train_loss": -6.1979522705078125, "global_step": 98977, "epoch": 2356} {"train_loss": -6.3534979820251465, "global_step": 98978, "epoch": 2356} {"train_loss": -6.376626014709473, "global_step": 98979, "epoch": 2356} {"train_loss": -6.375579833984375, "global_step": 98980, "epoch": 2356} {"train_loss": -6.2739410400390625, "global_step": 98981, "epoch": 2356} {"train_loss": -6.2392425537109375, "global_step": 98982, "epoch": 2356} {"train_loss": -6.2774553298950195, "global_step": 98983, "epoch": 2356} {"train_loss": -6.265143394470215, "global_step": 98984, "epoch": 2356} {"train_loss": -6.115480899810791, "global_step": 98985, "epoch": 2356} {"train_loss": -6.1328020095825195, "global_step": 98986, "epoch": 2356} {"train_loss": -6.123790264129639, "global_step": 98987, "epoch": 2356} {"train_loss": -6.157871723175049, "global_step": 98988, "epoch": 2356} {"train_loss": -5.958874702453613, "global_step": 98989, "epoch": 2356} {"train_loss": -6.184346675872803, "global_step": 98990, "epoch": 2356} {"train_loss": -6.089053630828857, "global_step": 98991, "epoch": 2356} {"train_loss": -6.129695892333984, "global_step": 98992, "epoch": 2356} {"train_loss": -6.278930652709234, "global_step": 98993, "epoch": 2356, "val_loss": 67989.46875} {"train_loss": -6.195559501647949, "global_step": 98994, "epoch": 2357} {"train_loss": -6.156850337982178, "global_step": 98995, "epoch": 2357} {"train_loss": -6.12207555770874, "global_step": 98996, "epoch": 2357} {"train_loss": -6.206634521484375, "global_step": 98997, "epoch": 2357} {"train_loss": -6.277170658111572, "global_step": 98998, "epoch": 2357} {"train_loss": -6.20759391784668, "global_step": 98999, "epoch": 2357} {"train_loss": -6.254998683929443, "global_step": 99000, "epoch": 2357} {"train_loss": -6.218906402587891, "global_step": 99001, "epoch": 2357} {"train_loss": -6.251760005950928, "global_step": 99002, "epoch": 2357} {"train_loss": -6.252712726593018, "global_step": 99003, "epoch": 2357} {"train_loss": -6.326866626739502, "global_step": 99004, "epoch": 2357} {"train_loss": -6.304401874542236, "global_step": 99005, "epoch": 2357} {"train_loss": -6.1566057205200195, "global_step": 99006, "epoch": 2357} {"train_loss": -6.230241775512695, "global_step": 99007, "epoch": 2357} {"train_loss": -6.3655500411987305, "global_step": 99008, "epoch": 2357} {"train_loss": -6.270182132720947, "global_step": 99009, "epoch": 2357} {"train_loss": -6.322442054748535, "global_step": 99010, "epoch": 2357} {"train_loss": -6.35885763168335, "global_step": 99011, "epoch": 2357} {"train_loss": -6.360135078430176, "global_step": 99012, "epoch": 2357} {"train_loss": -6.293632507324219, "global_step": 99013, "epoch": 2357} {"train_loss": -6.446629524230957, "global_step": 99014, "epoch": 2357} {"train_loss": -6.2950439453125, "global_step": 99015, "epoch": 2357} {"train_loss": -6.335485458374023, "global_step": 99016, "epoch": 2357} {"train_loss": -6.363600730895996, "global_step": 99017, "epoch": 2357} {"train_loss": -6.336388111114502, "global_step": 99018, "epoch": 2357} {"train_loss": -6.277659893035889, "global_step": 99019, "epoch": 2357} {"train_loss": -6.421023368835449, "global_step": 99020, "epoch": 2357} {"train_loss": -6.396018028259277, "global_step": 99021, "epoch": 2357} {"train_loss": -6.2788190841674805, "global_step": 99022, "epoch": 2357} {"train_loss": -6.357414722442627, "global_step": 99023, "epoch": 2357} {"train_loss": -6.356942176818848, "global_step": 99024, "epoch": 2357} {"train_loss": -6.338659286499023, "global_step": 99025, "epoch": 2357} {"train_loss": -6.325874328613281, "global_step": 99026, "epoch": 2357} {"train_loss": -6.3712158203125, "global_step": 99027, "epoch": 2357} {"train_loss": -6.326192378997803, "global_step": 99028, "epoch": 2357} {"train_loss": -6.348739147186279, "global_step": 99029, "epoch": 2357} {"train_loss": -6.28325080871582, "global_step": 99030, "epoch": 2357} {"train_loss": -6.316370964050293, "global_step": 99031, "epoch": 2357} {"train_loss": -6.333649635314941, "global_step": 99032, "epoch": 2357} {"train_loss": -6.206630706787109, "global_step": 99033, "epoch": 2357} {"train_loss": -6.27530574798584, "global_step": 99034, "epoch": 2357} {"train_loss": -6.295086554118565, "global_step": 99035, "epoch": 2357, "val_loss": 67934.546875} {"train_loss": -6.296540260314941, "global_step": 99036, "epoch": 2358} {"train_loss": -6.176000118255615, "global_step": 99037, "epoch": 2358} {"train_loss": -6.45762825012207, "global_step": 99038, "epoch": 2358} {"train_loss": -6.312355041503906, "global_step": 99039, "epoch": 2358} {"train_loss": -6.325289726257324, "global_step": 99040, "epoch": 2358} {"train_loss": -6.368039131164551, "global_step": 99041, "epoch": 2358} {"train_loss": -6.2312421798706055, "global_step": 99042, "epoch": 2358} {"train_loss": -6.419746398925781, "global_step": 99043, "epoch": 2358} {"train_loss": -6.251221179962158, "global_step": 99044, "epoch": 2358} {"train_loss": -6.365897178649902, "global_step": 99045, "epoch": 2358} {"train_loss": -6.316664218902588, "global_step": 99046, "epoch": 2358} {"train_loss": -6.372325897216797, "global_step": 99047, "epoch": 2358} {"train_loss": -6.242907524108887, "global_step": 99048, "epoch": 2358} {"train_loss": -6.187984943389893, "global_step": 99049, "epoch": 2358} {"train_loss": -6.226862907409668, "global_step": 99050, "epoch": 2358} {"train_loss": -6.235278606414795, "global_step": 99051, "epoch": 2358} {"train_loss": -6.338873386383057, "global_step": 99052, "epoch": 2358} {"train_loss": -6.402001857757568, "global_step": 99053, "epoch": 2358} {"train_loss": -6.322056770324707, "global_step": 99054, "epoch": 2358} {"train_loss": -6.341104507446289, "global_step": 99055, "epoch": 2358} {"train_loss": -6.3420915603637695, "global_step": 99056, "epoch": 2358} {"train_loss": -6.4428205490112305, "global_step": 99057, "epoch": 2358} {"train_loss": -6.270367622375488, "global_step": 99058, "epoch": 2358} {"train_loss": -6.311426639556885, "global_step": 99059, "epoch": 2358} {"train_loss": -6.408671855926514, "global_step": 99060, "epoch": 2358} {"train_loss": -6.328282356262207, "global_step": 99061, "epoch": 2358} {"train_loss": -6.29149866104126, "global_step": 99062, "epoch": 2358} {"train_loss": -6.407127380371094, "global_step": 99063, "epoch": 2358} {"train_loss": -6.424171447753906, "global_step": 99064, "epoch": 2358} {"train_loss": -6.265018463134766, "global_step": 99065, "epoch": 2358} {"train_loss": -6.281219482421875, "global_step": 99066, "epoch": 2358} {"train_loss": -6.285741329193115, "global_step": 99067, "epoch": 2358} {"train_loss": -6.218481540679932, "global_step": 99068, "epoch": 2358} {"train_loss": -6.279059410095215, "global_step": 99069, "epoch": 2358} {"train_loss": -6.369359970092773, "global_step": 99070, "epoch": 2358} {"train_loss": -6.342703819274902, "global_step": 99071, "epoch": 2358} {"train_loss": -6.214168548583984, "global_step": 99072, "epoch": 2358} {"train_loss": -6.23111629486084, "global_step": 99073, "epoch": 2358} {"train_loss": -6.418241500854492, "global_step": 99074, "epoch": 2358} {"train_loss": -6.255279541015625, "global_step": 99075, "epoch": 2358} {"train_loss": -6.373335838317871, "global_step": 99076, "epoch": 2358} {"train_loss": -6.317397412799654, "global_step": 99077, "epoch": 2358, "val_loss": 68146.7578125} {"train_loss": -6.267498970031738, "global_step": 99078, "epoch": 2359} {"train_loss": -6.386544704437256, "global_step": 99079, "epoch": 2359} {"train_loss": -6.347840309143066, "global_step": 99080, "epoch": 2359} {"train_loss": -6.384126663208008, "global_step": 99081, "epoch": 2359} {"train_loss": -6.30328369140625, "global_step": 99082, "epoch": 2359} {"train_loss": -6.344270706176758, "global_step": 99083, "epoch": 2359} {"train_loss": -6.329641819000244, "global_step": 99084, "epoch": 2359} {"train_loss": -6.3392510414123535, "global_step": 99085, "epoch": 2359} {"train_loss": -6.296932697296143, "global_step": 99086, "epoch": 2359} {"train_loss": -6.2311506271362305, "global_step": 99087, "epoch": 2359} {"train_loss": -6.365578651428223, "global_step": 99088, "epoch": 2359} {"train_loss": -6.303783893585205, "global_step": 99089, "epoch": 2359} {"train_loss": -6.366285800933838, "global_step": 99090, "epoch": 2359} {"train_loss": -6.30522346496582, "global_step": 99091, "epoch": 2359} {"train_loss": -6.18070650100708, "global_step": 99092, "epoch": 2359} {"train_loss": -6.402499675750732, "global_step": 99093, "epoch": 2359} {"train_loss": -6.319243431091309, "global_step": 99094, "epoch": 2359} {"train_loss": -6.129374980926514, "global_step": 99095, "epoch": 2359} {"train_loss": -6.401297092437744, "global_step": 99096, "epoch": 2359} {"train_loss": -6.225740432739258, "global_step": 99097, "epoch": 2359} {"train_loss": -6.241529941558838, "global_step": 99098, "epoch": 2359} {"train_loss": -6.312582015991211, "global_step": 99099, "epoch": 2359} {"train_loss": -6.2755279541015625, "global_step": 99100, "epoch": 2359} {"train_loss": -6.259061813354492, "global_step": 99101, "epoch": 2359} {"train_loss": -6.207520484924316, "global_step": 99102, "epoch": 2359} {"train_loss": -6.300198554992676, "global_step": 99103, "epoch": 2359} {"train_loss": -6.247299671173096, "global_step": 99104, "epoch": 2359} {"train_loss": -6.29705810546875, "global_step": 99105, "epoch": 2359} {"train_loss": -6.3895487785339355, "global_step": 99106, "epoch": 2359} {"train_loss": -6.195647239685059, "global_step": 99107, "epoch": 2359} {"train_loss": -6.194243431091309, "global_step": 99108, "epoch": 2359} {"train_loss": -6.289563179016113, "global_step": 99109, "epoch": 2359} {"train_loss": -6.243783950805664, "global_step": 99110, "epoch": 2359} {"train_loss": -6.374920845031738, "global_step": 99111, "epoch": 2359} {"train_loss": -6.288167953491211, "global_step": 99112, "epoch": 2359} {"train_loss": -6.386490821838379, "global_step": 99113, "epoch": 2359} {"train_loss": -6.235105991363525, "global_step": 99114, "epoch": 2359} {"train_loss": -6.200875759124756, "global_step": 99115, "epoch": 2359} {"train_loss": -6.356833457946777, "global_step": 99116, "epoch": 2359} {"train_loss": -6.41880464553833, "global_step": 99117, "epoch": 2359} {"train_loss": -6.306632995605469, "global_step": 99118, "epoch": 2359} {"train_loss": -6.300274758111863, "global_step": 99119, "epoch": 2359, "val_loss": 67897.640625} {"train_loss": -6.339090347290039, "global_step": 99120, "epoch": 2360} {"train_loss": -6.271164417266846, "global_step": 99121, "epoch": 2360} {"train_loss": -6.389801979064941, "global_step": 99122, "epoch": 2360} {"train_loss": -6.319024085998535, "global_step": 99123, "epoch": 2360} {"train_loss": -6.401681900024414, "global_step": 99124, "epoch": 2360} {"train_loss": -6.335691928863525, "global_step": 99125, "epoch": 2360} {"train_loss": -6.298283576965332, "global_step": 99126, "epoch": 2360} {"train_loss": -6.232285499572754, "global_step": 99127, "epoch": 2360} {"train_loss": -6.335024356842041, "global_step": 99128, "epoch": 2360} {"train_loss": -6.3238725662231445, "global_step": 99129, "epoch": 2360} {"train_loss": -6.42401647567749, "global_step": 99130, "epoch": 2360} {"train_loss": -6.4321441650390625, "global_step": 99131, "epoch": 2360} {"train_loss": -6.266993522644043, "global_step": 99132, "epoch": 2360} {"train_loss": -6.339506149291992, "global_step": 99133, "epoch": 2360} {"train_loss": -6.299825668334961, "global_step": 99134, "epoch": 2360} {"train_loss": -6.356230735778809, "global_step": 99135, "epoch": 2360} {"train_loss": -6.335532188415527, "global_step": 99136, "epoch": 2360} {"train_loss": -6.329174041748047, "global_step": 99137, "epoch": 2360} {"train_loss": -6.283268451690674, "global_step": 99138, "epoch": 2360} {"train_loss": -6.252203941345215, "global_step": 99139, "epoch": 2360} {"train_loss": -6.4224395751953125, "global_step": 99140, "epoch": 2360} {"train_loss": -6.264731407165527, "global_step": 99141, "epoch": 2360} {"train_loss": -6.282018661499023, "global_step": 99142, "epoch": 2360} {"train_loss": -6.260323524475098, "global_step": 99143, "epoch": 2360} {"train_loss": -6.306768417358398, "global_step": 99144, "epoch": 2360} {"train_loss": -6.334072113037109, "global_step": 99145, "epoch": 2360} {"train_loss": -6.36496114730835, "global_step": 99146, "epoch": 2360} {"train_loss": -6.386349678039551, "global_step": 99147, "epoch": 2360} {"train_loss": -6.296847343444824, "global_step": 99148, "epoch": 2360} {"train_loss": -6.352631092071533, "global_step": 99149, "epoch": 2360} {"train_loss": -6.30286979675293, "global_step": 99150, "epoch": 2360} {"train_loss": -6.184323787689209, "global_step": 99151, "epoch": 2360} {"train_loss": -6.300798416137695, "global_step": 99152, "epoch": 2360} {"train_loss": -6.3245673179626465, "global_step": 99153, "epoch": 2360} {"train_loss": -6.354447364807129, "global_step": 99154, "epoch": 2360} {"train_loss": -6.3778886795043945, "global_step": 99155, "epoch": 2360} {"train_loss": -6.337817192077637, "global_step": 99156, "epoch": 2360} {"train_loss": -6.251075744628906, "global_step": 99157, "epoch": 2360} {"train_loss": -6.328644275665283, "global_step": 99158, "epoch": 2360} {"train_loss": -6.323781967163086, "global_step": 99159, "epoch": 2360} {"train_loss": -6.267764568328857, "global_step": 99160, "epoch": 2360} {"train_loss": -6.32253707022894, "global_step": 99161, "epoch": 2360, "val_loss": 67778.4921875} {"train_loss": -6.437651634216309, "global_step": 99162, "epoch": 2361} {"train_loss": -6.3666462898254395, "global_step": 99163, "epoch": 2361} {"train_loss": -6.399397850036621, "global_step": 99164, "epoch": 2361} {"train_loss": -6.276072978973389, "global_step": 99165, "epoch": 2361} {"train_loss": -6.389321327209473, "global_step": 99166, "epoch": 2361} {"train_loss": -6.35089635848999, "global_step": 99167, "epoch": 2361} {"train_loss": -6.327143669128418, "global_step": 99168, "epoch": 2361} {"train_loss": -6.353536605834961, "global_step": 99169, "epoch": 2361} {"train_loss": -6.358789443969727, "global_step": 99170, "epoch": 2361} {"train_loss": -6.340288162231445, "global_step": 99171, "epoch": 2361} {"train_loss": -6.325336933135986, "global_step": 99172, "epoch": 2361} {"train_loss": -6.261318683624268, "global_step": 99173, "epoch": 2361} {"train_loss": -6.415946006774902, "global_step": 99174, "epoch": 2361} {"train_loss": -6.370254993438721, "global_step": 99175, "epoch": 2361} {"train_loss": -6.25916051864624, "global_step": 99176, "epoch": 2361} {"train_loss": -6.289389610290527, "global_step": 99177, "epoch": 2361} {"train_loss": -6.414826393127441, "global_step": 99178, "epoch": 2361} {"train_loss": -6.3936872482299805, "global_step": 99179, "epoch": 2361} {"train_loss": -6.51938533782959, "global_step": 99180, "epoch": 2361} {"train_loss": -6.375820159912109, "global_step": 99181, "epoch": 2361} {"train_loss": -6.427136421203613, "global_step": 99182, "epoch": 2361} {"train_loss": -6.324931621551514, "global_step": 99183, "epoch": 2361} {"train_loss": -6.394100189208984, "global_step": 99184, "epoch": 2361} {"train_loss": -6.3090667724609375, "global_step": 99185, "epoch": 2361} {"train_loss": -6.40142297744751, "global_step": 99186, "epoch": 2361} {"train_loss": -6.421219825744629, "global_step": 99187, "epoch": 2361} {"train_loss": -6.415914535522461, "global_step": 99188, "epoch": 2361} {"train_loss": -6.517942428588867, "global_step": 99189, "epoch": 2361} {"train_loss": -6.3522443771362305, "global_step": 99190, "epoch": 2361} {"train_loss": -6.242039680480957, "global_step": 99191, "epoch": 2361} {"train_loss": -6.318173885345459, "global_step": 99192, "epoch": 2361} {"train_loss": -6.35159158706665, "global_step": 99193, "epoch": 2361} {"train_loss": -6.318700313568115, "global_step": 99194, "epoch": 2361} {"train_loss": -6.312626838684082, "global_step": 99195, "epoch": 2361} {"train_loss": -6.330959320068359, "global_step": 99196, "epoch": 2361} {"train_loss": -6.262578964233398, "global_step": 99197, "epoch": 2361} {"train_loss": -6.282515525817871, "global_step": 99198, "epoch": 2361} {"train_loss": -6.329751014709473, "global_step": 99199, "epoch": 2361} {"train_loss": -6.281198501586914, "global_step": 99200, "epoch": 2361} {"train_loss": -6.334729194641113, "global_step": 99201, "epoch": 2361} {"train_loss": -6.391566276550293, "global_step": 99202, "epoch": 2361} {"train_loss": -6.355839854195004, "global_step": 99203, "epoch": 2361, "val_loss": 67815.015625} {"train_loss": -6.2706499099731445, "global_step": 99204, "epoch": 2362} {"train_loss": -6.388017654418945, "global_step": 99205, "epoch": 2362} {"train_loss": -6.359701156616211, "global_step": 99206, "epoch": 2362} {"train_loss": -6.201247215270996, "global_step": 99207, "epoch": 2362} {"train_loss": -6.427328586578369, "global_step": 99208, "epoch": 2362} {"train_loss": -6.407491683959961, "global_step": 99209, "epoch": 2362} {"train_loss": -6.275143146514893, "global_step": 99210, "epoch": 2362} {"train_loss": -6.333495140075684, "global_step": 99211, "epoch": 2362} {"train_loss": -6.394096374511719, "global_step": 99212, "epoch": 2362} {"train_loss": -6.243844985961914, "global_step": 99213, "epoch": 2362} {"train_loss": -6.354931354522705, "global_step": 99214, "epoch": 2362} {"train_loss": -6.351986408233643, "global_step": 99215, "epoch": 2362} {"train_loss": -6.301693916320801, "global_step": 99216, "epoch": 2362} {"train_loss": -6.354459762573242, "global_step": 99217, "epoch": 2362} {"train_loss": -6.444580554962158, "global_step": 99218, "epoch": 2362} {"train_loss": -6.351049900054932, "global_step": 99219, "epoch": 2362} {"train_loss": -6.324244499206543, "global_step": 99220, "epoch": 2362} {"train_loss": -6.366698265075684, "global_step": 99221, "epoch": 2362} {"train_loss": -6.283746242523193, "global_step": 99222, "epoch": 2362} {"train_loss": -6.351283073425293, "global_step": 99223, "epoch": 2362} {"train_loss": -6.3267316818237305, "global_step": 99224, "epoch": 2362} {"train_loss": -6.360786437988281, "global_step": 99225, "epoch": 2362} {"train_loss": -6.305368423461914, "global_step": 99226, "epoch": 2362} {"train_loss": -6.258643627166748, "global_step": 99227, "epoch": 2362} {"train_loss": -6.340696334838867, "global_step": 99228, "epoch": 2362} {"train_loss": -6.287389755249023, "global_step": 99229, "epoch": 2362} {"train_loss": -6.444349765777588, "global_step": 99230, "epoch": 2362} {"train_loss": -6.389394760131836, "global_step": 99231, "epoch": 2362} {"train_loss": -6.328316688537598, "global_step": 99232, "epoch": 2362} {"train_loss": -6.458885669708252, "global_step": 99233, "epoch": 2362} {"train_loss": -6.199073314666748, "global_step": 99234, "epoch": 2362} {"train_loss": -6.361680507659912, "global_step": 99235, "epoch": 2362} {"train_loss": -6.18295431137085, "global_step": 99236, "epoch": 2362} {"train_loss": -6.309943199157715, "global_step": 99237, "epoch": 2362} {"train_loss": -6.393093109130859, "global_step": 99238, "epoch": 2362} {"train_loss": -6.411789417266846, "global_step": 99239, "epoch": 2362} {"train_loss": -6.360129356384277, "global_step": 99240, "epoch": 2362} {"train_loss": -6.316289901733398, "global_step": 99241, "epoch": 2362} {"train_loss": -6.377243995666504, "global_step": 99242, "epoch": 2362} {"train_loss": -6.380550384521484, "global_step": 99243, "epoch": 2362} {"train_loss": -6.294095993041992, "global_step": 99244, "epoch": 2362} {"train_loss": -6.338612454278128, "global_step": 99245, "epoch": 2362, "val_loss": 67911.859375} {"train_loss": -6.339303016662598, "global_step": 99246, "epoch": 2363} {"train_loss": -6.433723449707031, "global_step": 99247, "epoch": 2363} {"train_loss": -6.39859676361084, "global_step": 99248, "epoch": 2363} {"train_loss": -6.453029632568359, "global_step": 99249, "epoch": 2363} {"train_loss": -6.390491962432861, "global_step": 99250, "epoch": 2363} {"train_loss": -6.410353183746338, "global_step": 99251, "epoch": 2363} {"train_loss": -6.277150630950928, "global_step": 99252, "epoch": 2363} {"train_loss": -6.349701881408691, "global_step": 99253, "epoch": 2363} {"train_loss": -6.336157321929932, "global_step": 99254, "epoch": 2363} {"train_loss": -6.419388294219971, "global_step": 99255, "epoch": 2363} {"train_loss": -6.276293754577637, "global_step": 99256, "epoch": 2363} {"train_loss": -6.449820518493652, "global_step": 99257, "epoch": 2363} {"train_loss": -6.333782196044922, "global_step": 99258, "epoch": 2363} {"train_loss": -6.341238975524902, "global_step": 99259, "epoch": 2363} {"train_loss": -6.271425247192383, "global_step": 99260, "epoch": 2363} {"train_loss": -6.336061477661133, "global_step": 99261, "epoch": 2363} {"train_loss": -6.243565559387207, "global_step": 99262, "epoch": 2363} {"train_loss": -6.300932884216309, "global_step": 99263, "epoch": 2363} {"train_loss": -6.259378433227539, "global_step": 99264, "epoch": 2363} {"train_loss": -6.30052375793457, "global_step": 99265, "epoch": 2363} {"train_loss": -6.147957801818848, "global_step": 99266, "epoch": 2363} {"train_loss": -6.3907880783081055, "global_step": 99267, "epoch": 2363} {"train_loss": -6.3445305824279785, "global_step": 99268, "epoch": 2363} {"train_loss": -6.327404022216797, "global_step": 99269, "epoch": 2363} {"train_loss": -6.381817817687988, "global_step": 99270, "epoch": 2363} {"train_loss": -6.254417896270752, "global_step": 99271, "epoch": 2363} {"train_loss": -6.368492126464844, "global_step": 99272, "epoch": 2363} {"train_loss": -6.355246067047119, "global_step": 99273, "epoch": 2363} {"train_loss": -6.348271369934082, "global_step": 99274, "epoch": 2363} {"train_loss": -6.481509208679199, "global_step": 99275, "epoch": 2363} {"train_loss": -6.208756923675537, "global_step": 99276, "epoch": 2363} {"train_loss": -6.256241321563721, "global_step": 99277, "epoch": 2363} {"train_loss": -6.285080909729004, "global_step": 99278, "epoch": 2363} {"train_loss": -6.343206882476807, "global_step": 99279, "epoch": 2363} {"train_loss": -6.3427534103393555, "global_step": 99280, "epoch": 2363} {"train_loss": -6.407846450805664, "global_step": 99281, "epoch": 2363} {"train_loss": -6.342967987060547, "global_step": 99282, "epoch": 2363} {"train_loss": -6.332887649536133, "global_step": 99283, "epoch": 2363} {"train_loss": -6.296810626983643, "global_step": 99284, "epoch": 2363} {"train_loss": -6.378636360168457, "global_step": 99285, "epoch": 2363} {"train_loss": -6.421020984649658, "global_step": 99286, "epoch": 2363} {"train_loss": -6.341409546988351, "global_step": 99287, "epoch": 2363, "val_loss": 67850.5546875} {"train_loss": -6.235936164855957, "global_step": 99288, "epoch": 2364} {"train_loss": -6.346057415008545, "global_step": 99289, "epoch": 2364} {"train_loss": -6.291668891906738, "global_step": 99290, "epoch": 2364} {"train_loss": -6.286847114562988, "global_step": 99291, "epoch": 2364} {"train_loss": -6.388686180114746, "global_step": 99292, "epoch": 2364} {"train_loss": -6.396422386169434, "global_step": 99293, "epoch": 2364} {"train_loss": -6.3554582595825195, "global_step": 99294, "epoch": 2364} {"train_loss": -6.276505470275879, "global_step": 99295, "epoch": 2364} {"train_loss": -6.271917819976807, "global_step": 99296, "epoch": 2364} {"train_loss": -6.3643879890441895, "global_step": 99297, "epoch": 2364} {"train_loss": -6.367959976196289, "global_step": 99298, "epoch": 2364} {"train_loss": -6.300943851470947, "global_step": 99299, "epoch": 2364} {"train_loss": -6.318524360656738, "global_step": 99300, "epoch": 2364} {"train_loss": -6.306344032287598, "global_step": 99301, "epoch": 2364} {"train_loss": -6.302420139312744, "global_step": 99302, "epoch": 2364} {"train_loss": -6.382929801940918, "global_step": 99303, "epoch": 2364} {"train_loss": -6.3230414390563965, "global_step": 99304, "epoch": 2364} {"train_loss": -6.338755130767822, "global_step": 99305, "epoch": 2364} {"train_loss": -6.37741231918335, "global_step": 99306, "epoch": 2364} {"train_loss": -6.38138484954834, "global_step": 99307, "epoch": 2364} {"train_loss": -6.426915168762207, "global_step": 99308, "epoch": 2364} {"train_loss": -6.3012895584106445, "global_step": 99309, "epoch": 2364} {"train_loss": -6.428044319152832, "global_step": 99310, "epoch": 2364} {"train_loss": -6.319086074829102, "global_step": 99311, "epoch": 2364} {"train_loss": -6.294704914093018, "global_step": 99312, "epoch": 2364} {"train_loss": -6.291820526123047, "global_step": 99313, "epoch": 2364} {"train_loss": -6.274093151092529, "global_step": 99314, "epoch": 2364} {"train_loss": -6.337080955505371, "global_step": 99315, "epoch": 2364} {"train_loss": -6.407817363739014, "global_step": 99316, "epoch": 2364} {"train_loss": -6.189550876617432, "global_step": 99317, "epoch": 2364} {"train_loss": -6.273575305938721, "global_step": 99318, "epoch": 2364} {"train_loss": -6.343260765075684, "global_step": 99319, "epoch": 2364} {"train_loss": -6.345858573913574, "global_step": 99320, "epoch": 2364} {"train_loss": -6.273897171020508, "global_step": 99321, "epoch": 2364} {"train_loss": -6.407471656799316, "global_step": 99322, "epoch": 2364} {"train_loss": -6.333004474639893, "global_step": 99323, "epoch": 2364} {"train_loss": -6.255627155303955, "global_step": 99324, "epoch": 2364} {"train_loss": -6.479693412780762, "global_step": 99325, "epoch": 2364} {"train_loss": -6.327535152435303, "global_step": 99326, "epoch": 2364} {"train_loss": -6.356146335601807, "global_step": 99327, "epoch": 2364} {"train_loss": -6.318381309509277, "global_step": 99328, "epoch": 2364} {"train_loss": -6.331421363921392, "global_step": 99329, "epoch": 2364, "val_loss": 67881.234375} {"train_loss": -6.294127941131592, "global_step": 99330, "epoch": 2365} {"train_loss": -6.333004951477051, "global_step": 99331, "epoch": 2365} {"train_loss": -6.297181129455566, "global_step": 99332, "epoch": 2365} {"train_loss": -6.492496967315674, "global_step": 99333, "epoch": 2365} {"train_loss": -6.391838073730469, "global_step": 99334, "epoch": 2365} {"train_loss": -6.345751762390137, "global_step": 99335, "epoch": 2365} {"train_loss": -6.268454551696777, "global_step": 99336, "epoch": 2365} {"train_loss": -6.305352210998535, "global_step": 99337, "epoch": 2365} {"train_loss": -6.372331142425537, "global_step": 99338, "epoch": 2365} {"train_loss": -6.258222579956055, "global_step": 99339, "epoch": 2365} {"train_loss": -6.379456996917725, "global_step": 99340, "epoch": 2365} {"train_loss": -6.311615943908691, "global_step": 99341, "epoch": 2365} {"train_loss": -6.347289085388184, "global_step": 99342, "epoch": 2365} {"train_loss": -6.305569171905518, "global_step": 99343, "epoch": 2365} {"train_loss": -6.349985599517822, "global_step": 99344, "epoch": 2365} {"train_loss": -6.245054721832275, "global_step": 99345, "epoch": 2365} {"train_loss": -6.392414093017578, "global_step": 99346, "epoch": 2365} {"train_loss": -6.393887519836426, "global_step": 99347, "epoch": 2365} {"train_loss": -6.268006801605225, "global_step": 99348, "epoch": 2365} {"train_loss": -6.357337474822998, "global_step": 99349, "epoch": 2365} {"train_loss": -6.412267208099365, "global_step": 99350, "epoch": 2365} {"train_loss": -6.420045375823975, "global_step": 99351, "epoch": 2365} {"train_loss": -6.3592963218688965, "global_step": 99352, "epoch": 2365} {"train_loss": -6.409064769744873, "global_step": 99353, "epoch": 2365} {"train_loss": -6.33997106552124, "global_step": 99354, "epoch": 2365} {"train_loss": -6.3168511390686035, "global_step": 99355, "epoch": 2365} {"train_loss": -6.335061073303223, "global_step": 99356, "epoch": 2365} {"train_loss": -6.335562705993652, "global_step": 99357, "epoch": 2365} {"train_loss": -6.324582099914551, "global_step": 99358, "epoch": 2365} {"train_loss": -6.399605751037598, "global_step": 99359, "epoch": 2365} {"train_loss": -6.312070369720459, "global_step": 99360, "epoch": 2365} {"train_loss": -6.303927421569824, "global_step": 99361, "epoch": 2365} {"train_loss": -6.233392238616943, "global_step": 99362, "epoch": 2365} {"train_loss": -6.354189395904541, "global_step": 99363, "epoch": 2365} {"train_loss": -6.437506675720215, "global_step": 99364, "epoch": 2365} {"train_loss": -6.382872104644775, "global_step": 99365, "epoch": 2365} {"train_loss": -6.465462684631348, "global_step": 99366, "epoch": 2365} {"train_loss": -6.391596794128418, "global_step": 99367, "epoch": 2365} {"train_loss": -6.348555088043213, "global_step": 99368, "epoch": 2365} {"train_loss": -6.318130970001221, "global_step": 99369, "epoch": 2365} {"train_loss": -6.376482963562012, "global_step": 99370, "epoch": 2365} {"train_loss": -6.347999107270014, "global_step": 99371, "epoch": 2365, "val_loss": 67903.6953125} {"train_loss": -6.335317611694336, "global_step": 99372, "epoch": 2366} {"train_loss": -6.41524600982666, "global_step": 99373, "epoch": 2366} {"train_loss": -6.434016227722168, "global_step": 99374, "epoch": 2366} {"train_loss": -6.394449710845947, "global_step": 99375, "epoch": 2366} {"train_loss": -6.248905181884766, "global_step": 99376, "epoch": 2366} {"train_loss": -6.413636207580566, "global_step": 99377, "epoch": 2366} {"train_loss": -6.526881694793701, "global_step": 99378, "epoch": 2366} {"train_loss": -6.466498851776123, "global_step": 99379, "epoch": 2366} {"train_loss": -6.507262229919434, "global_step": 99380, "epoch": 2366} {"train_loss": -6.320810317993164, "global_step": 99381, "epoch": 2366} {"train_loss": -6.33030891418457, "global_step": 99382, "epoch": 2366} {"train_loss": -6.412117004394531, "global_step": 99383, "epoch": 2366} {"train_loss": -6.257678985595703, "global_step": 99384, "epoch": 2366} {"train_loss": -6.484006881713867, "global_step": 99385, "epoch": 2366} {"train_loss": -6.3526787757873535, "global_step": 99386, "epoch": 2366} {"train_loss": -6.330533981323242, "global_step": 99387, "epoch": 2366} {"train_loss": -6.3897809982299805, "global_step": 99388, "epoch": 2366} {"train_loss": -6.350800037384033, "global_step": 99389, "epoch": 2366} {"train_loss": -6.444849967956543, "global_step": 99390, "epoch": 2366} {"train_loss": -6.4087324142456055, "global_step": 99391, "epoch": 2366} {"train_loss": -6.378077983856201, "global_step": 99392, "epoch": 2366} {"train_loss": -6.293409824371338, "global_step": 99393, "epoch": 2366} {"train_loss": -6.340572357177734, "global_step": 99394, "epoch": 2366} {"train_loss": -6.259244918823242, "global_step": 99395, "epoch": 2366} {"train_loss": -6.241750717163086, "global_step": 99396, "epoch": 2366} {"train_loss": -6.304627418518066, "global_step": 99397, "epoch": 2366} {"train_loss": -6.170032501220703, "global_step": 99398, "epoch": 2366} {"train_loss": -6.261307239532471, "global_step": 99399, "epoch": 2366} {"train_loss": -6.35457706451416, "global_step": 99400, "epoch": 2366} {"train_loss": -6.254517555236816, "global_step": 99401, "epoch": 2366} {"train_loss": -6.2238664627075195, "global_step": 99402, "epoch": 2366} {"train_loss": -6.33390998840332, "global_step": 99403, "epoch": 2366} {"train_loss": -6.2802042961120605, "global_step": 99404, "epoch": 2366} {"train_loss": -6.291424751281738, "global_step": 99405, "epoch": 2366} {"train_loss": -6.254421234130859, "global_step": 99406, "epoch": 2366} {"train_loss": -6.39746618270874, "global_step": 99407, "epoch": 2366} {"train_loss": -6.372839450836182, "global_step": 99408, "epoch": 2366} {"train_loss": -6.242582321166992, "global_step": 99409, "epoch": 2366} {"train_loss": -6.220106601715088, "global_step": 99410, "epoch": 2366} {"train_loss": -6.426525115966797, "global_step": 99411, "epoch": 2366} {"train_loss": -6.428495407104492, "global_step": 99412, "epoch": 2366} {"train_loss": -6.343771026248024, "global_step": 99413, "epoch": 2366, "val_loss": 67648.6875} {"train_loss": -6.34000301361084, "global_step": 99414, "epoch": 2367} {"train_loss": -6.4433488845825195, "global_step": 99415, "epoch": 2367} {"train_loss": -6.302743434906006, "global_step": 99416, "epoch": 2367} {"train_loss": -6.386653900146484, "global_step": 99417, "epoch": 2367} {"train_loss": -6.454964637756348, "global_step": 99418, "epoch": 2367} {"train_loss": -6.322683334350586, "global_step": 99419, "epoch": 2367} {"train_loss": -6.3258843421936035, "global_step": 99420, "epoch": 2367} {"train_loss": -6.235389232635498, "global_step": 99421, "epoch": 2367} {"train_loss": -6.279097557067871, "global_step": 99422, "epoch": 2367} {"train_loss": -6.205022811889648, "global_step": 99423, "epoch": 2367} {"train_loss": -6.228687286376953, "global_step": 99424, "epoch": 2367} {"train_loss": -6.244804859161377, "global_step": 99425, "epoch": 2367} {"train_loss": -6.278074741363525, "global_step": 99426, "epoch": 2367} {"train_loss": -6.43330192565918, "global_step": 99427, "epoch": 2367} {"train_loss": -6.17591667175293, "global_step": 99428, "epoch": 2367} {"train_loss": -6.329255104064941, "global_step": 99429, "epoch": 2367} {"train_loss": -6.287197113037109, "global_step": 99430, "epoch": 2367} {"train_loss": -6.198669910430908, "global_step": 99431, "epoch": 2367} {"train_loss": -6.319676876068115, "global_step": 99432, "epoch": 2367} {"train_loss": -6.180304050445557, "global_step": 99433, "epoch": 2367} {"train_loss": -6.3036699295043945, "global_step": 99434, "epoch": 2367} {"train_loss": -6.188362121582031, "global_step": 99435, "epoch": 2367} {"train_loss": -6.343576431274414, "global_step": 99436, "epoch": 2367} {"train_loss": -6.307180404663086, "global_step": 99437, "epoch": 2367} {"train_loss": -6.281525611877441, "global_step": 99438, "epoch": 2367} {"train_loss": -6.326314449310303, "global_step": 99439, "epoch": 2367} {"train_loss": -6.19968843460083, "global_step": 99440, "epoch": 2367} {"train_loss": -6.400538921356201, "global_step": 99441, "epoch": 2367} {"train_loss": -6.39576530456543, "global_step": 99442, "epoch": 2367} {"train_loss": -6.231647491455078, "global_step": 99443, "epoch": 2367} {"train_loss": -6.313565731048584, "global_step": 99444, "epoch": 2367} {"train_loss": -6.35774564743042, "global_step": 99445, "epoch": 2367} {"train_loss": -6.181929588317871, "global_step": 99446, "epoch": 2367} {"train_loss": -6.420123100280762, "global_step": 99447, "epoch": 2367} {"train_loss": -6.2719526290893555, "global_step": 99448, "epoch": 2367} {"train_loss": -6.334907531738281, "global_step": 99449, "epoch": 2367} {"train_loss": -6.294750213623047, "global_step": 99450, "epoch": 2367} {"train_loss": -6.410186767578125, "global_step": 99451, "epoch": 2367} {"train_loss": -6.339014053344727, "global_step": 99452, "epoch": 2367} {"train_loss": -6.23121452331543, "global_step": 99453, "epoch": 2367} {"train_loss": -6.273784637451172, "global_step": 99454, "epoch": 2367} {"train_loss": -6.30294546626863, "global_step": 99455, "epoch": 2367, "val_loss": 67886.734375} {"train_loss": -6.3441057205200195, "global_step": 99456, "epoch": 2368} {"train_loss": -6.282952785491943, "global_step": 99457, "epoch": 2368} {"train_loss": -6.314617156982422, "global_step": 99458, "epoch": 2368} {"train_loss": -6.230409145355225, "global_step": 99459, "epoch": 2368} {"train_loss": -6.232954025268555, "global_step": 99460, "epoch": 2368} {"train_loss": -6.345182418823242, "global_step": 99461, "epoch": 2368} {"train_loss": -6.403144836425781, "global_step": 99462, "epoch": 2368} {"train_loss": -6.288675308227539, "global_step": 99463, "epoch": 2368} {"train_loss": -6.264010429382324, "global_step": 99464, "epoch": 2368} {"train_loss": -6.32853889465332, "global_step": 99465, "epoch": 2368} {"train_loss": -6.364825248718262, "global_step": 99466, "epoch": 2368} {"train_loss": -6.387846946716309, "global_step": 99467, "epoch": 2368} {"train_loss": -6.369246482849121, "global_step": 99468, "epoch": 2368} {"train_loss": -6.394493579864502, "global_step": 99469, "epoch": 2368} {"train_loss": -6.265483856201172, "global_step": 99470, "epoch": 2368} {"train_loss": -6.421902179718018, "global_step": 99471, "epoch": 2368} {"train_loss": -6.096399784088135, "global_step": 99472, "epoch": 2368} {"train_loss": -6.3716139793396, "global_step": 99473, "epoch": 2368} {"train_loss": -6.336997985839844, "global_step": 99474, "epoch": 2368} {"train_loss": -6.336694717407227, "global_step": 99475, "epoch": 2368} {"train_loss": -6.377928733825684, "global_step": 99476, "epoch": 2368} {"train_loss": -6.315173149108887, "global_step": 99477, "epoch": 2368} {"train_loss": -6.3082733154296875, "global_step": 99478, "epoch": 2368} {"train_loss": -6.275198936462402, "global_step": 99479, "epoch": 2368} {"train_loss": -6.327218055725098, "global_step": 99480, "epoch": 2368} {"train_loss": -6.3018951416015625, "global_step": 99481, "epoch": 2368} {"train_loss": -6.270077705383301, "global_step": 99482, "epoch": 2368} {"train_loss": -6.3294854164123535, "global_step": 99483, "epoch": 2368} {"train_loss": -6.3073883056640625, "global_step": 99484, "epoch": 2368} {"train_loss": -6.359989166259766, "global_step": 99485, "epoch": 2368} {"train_loss": -6.227143287658691, "global_step": 99486, "epoch": 2368} {"train_loss": -6.303756237030029, "global_step": 99487, "epoch": 2368} {"train_loss": -6.314213752746582, "global_step": 99488, "epoch": 2368} {"train_loss": -6.256914138793945, "global_step": 99489, "epoch": 2368} {"train_loss": -6.325943470001221, "global_step": 99490, "epoch": 2368} {"train_loss": -6.3641581535339355, "global_step": 99491, "epoch": 2368} {"train_loss": -6.266785621643066, "global_step": 99492, "epoch": 2368} {"train_loss": -6.352805137634277, "global_step": 99493, "epoch": 2368} {"train_loss": -6.308500289916992, "global_step": 99494, "epoch": 2368} {"train_loss": -6.294527053833008, "global_step": 99495, "epoch": 2368} {"train_loss": -6.2657012939453125, "global_step": 99496, "epoch": 2368} {"train_loss": -6.314557427451724, "global_step": 99497, "epoch": 2368, "val_loss": 67999.21875} {"train_loss": -6.425665855407715, "global_step": 99498, "epoch": 2369} {"train_loss": -6.362229347229004, "global_step": 99499, "epoch": 2369} {"train_loss": -6.431859493255615, "global_step": 99500, "epoch": 2369} {"train_loss": -6.2768449783325195, "global_step": 99501, "epoch": 2369} {"train_loss": -6.270209312438965, "global_step": 99502, "epoch": 2369} {"train_loss": -6.312901496887207, "global_step": 99503, "epoch": 2369} {"train_loss": -6.38571834564209, "global_step": 99504, "epoch": 2369} {"train_loss": -6.331577301025391, "global_step": 99505, "epoch": 2369} {"train_loss": -6.222126007080078, "global_step": 99506, "epoch": 2369} {"train_loss": -6.332184314727783, "global_step": 99507, "epoch": 2369} {"train_loss": -6.151673793792725, "global_step": 99508, "epoch": 2369} {"train_loss": -6.216541290283203, "global_step": 99509, "epoch": 2369} {"train_loss": -6.219291687011719, "global_step": 99510, "epoch": 2369} {"train_loss": -6.200211524963379, "global_step": 99511, "epoch": 2369} {"train_loss": -6.228086471557617, "global_step": 99512, "epoch": 2369} {"train_loss": -6.194857597351074, "global_step": 99513, "epoch": 2369} {"train_loss": -6.284980773925781, "global_step": 99514, "epoch": 2369} {"train_loss": -6.120499610900879, "global_step": 99515, "epoch": 2369} {"train_loss": -6.259443283081055, "global_step": 99516, "epoch": 2369} {"train_loss": -6.345406532287598, "global_step": 99517, "epoch": 2369} {"train_loss": -6.202581405639648, "global_step": 99518, "epoch": 2369} {"train_loss": -6.322528839111328, "global_step": 99519, "epoch": 2369} {"train_loss": -6.228083610534668, "global_step": 99520, "epoch": 2369} {"train_loss": -6.369882106781006, "global_step": 99521, "epoch": 2369} {"train_loss": -6.2336249351501465, "global_step": 99522, "epoch": 2369} {"train_loss": -6.409274101257324, "global_step": 99523, "epoch": 2369} {"train_loss": -6.304742336273193, "global_step": 99524, "epoch": 2369} {"train_loss": -6.1977739334106445, "global_step": 99525, "epoch": 2369} {"train_loss": -6.184551239013672, "global_step": 99526, "epoch": 2369} {"train_loss": -6.328968048095703, "global_step": 99527, "epoch": 2369} {"train_loss": -6.323040962219238, "global_step": 99528, "epoch": 2369} {"train_loss": -6.272038459777832, "global_step": 99529, "epoch": 2369} {"train_loss": -6.259953498840332, "global_step": 99530, "epoch": 2369} {"train_loss": -6.276119232177734, "global_step": 99531, "epoch": 2369} {"train_loss": -6.296744346618652, "global_step": 99532, "epoch": 2369} {"train_loss": -6.227543830871582, "global_step": 99533, "epoch": 2369} {"train_loss": -6.300718307495117, "global_step": 99534, "epoch": 2369} {"train_loss": -6.279232978820801, "global_step": 99535, "epoch": 2369} {"train_loss": -6.311534881591797, "global_step": 99536, "epoch": 2369} {"train_loss": -6.1606340408325195, "global_step": 99537, "epoch": 2369} {"train_loss": -6.243829250335693, "global_step": 99538, "epoch": 2369} {"train_loss": -6.277869621912639, "global_step": 99539, "epoch": 2369, "val_loss": 67887.765625} {"train_loss": -6.324089050292969, "global_step": 99540, "epoch": 2370} {"train_loss": -6.304210662841797, "global_step": 99541, "epoch": 2370} {"train_loss": -6.326430320739746, "global_step": 99542, "epoch": 2370} {"train_loss": -6.399430274963379, "global_step": 99543, "epoch": 2370} {"train_loss": -6.3346357345581055, "global_step": 99544, "epoch": 2370} {"train_loss": -6.364956378936768, "global_step": 99545, "epoch": 2370} {"train_loss": -6.395937442779541, "global_step": 99546, "epoch": 2370} {"train_loss": -6.362645149230957, "global_step": 99547, "epoch": 2370} {"train_loss": -6.344468116760254, "global_step": 99548, "epoch": 2370} {"train_loss": -6.239431381225586, "global_step": 99549, "epoch": 2370} {"train_loss": -6.498909950256348, "global_step": 99550, "epoch": 2370} {"train_loss": -6.350277423858643, "global_step": 99551, "epoch": 2370} {"train_loss": -6.41743278503418, "global_step": 99552, "epoch": 2370} {"train_loss": -6.27274751663208, "global_step": 99553, "epoch": 2370} {"train_loss": -6.2797393798828125, "global_step": 99554, "epoch": 2370} {"train_loss": -6.3369855880737305, "global_step": 99555, "epoch": 2370} {"train_loss": -6.3476176261901855, "global_step": 99556, "epoch": 2370} {"train_loss": -6.380946159362793, "global_step": 99557, "epoch": 2370} {"train_loss": -6.252200126647949, "global_step": 99558, "epoch": 2370} {"train_loss": -6.254842758178711, "global_step": 99559, "epoch": 2370} {"train_loss": -6.342485427856445, "global_step": 99560, "epoch": 2370} {"train_loss": -6.269043922424316, "global_step": 99561, "epoch": 2370} {"train_loss": -6.37533712387085, "global_step": 99562, "epoch": 2370} {"train_loss": -6.27323055267334, "global_step": 99563, "epoch": 2370} {"train_loss": -6.362887859344482, "global_step": 99564, "epoch": 2370} {"train_loss": -6.407968521118164, "global_step": 99565, "epoch": 2370} {"train_loss": -6.34104061126709, "global_step": 99566, "epoch": 2370} {"train_loss": -6.369953155517578, "global_step": 99567, "epoch": 2370} {"train_loss": -6.312948703765869, "global_step": 99568, "epoch": 2370} {"train_loss": -6.188359260559082, "global_step": 99569, "epoch": 2370} {"train_loss": -6.3849592208862305, "global_step": 99570, "epoch": 2370} {"train_loss": -6.36586856842041, "global_step": 99571, "epoch": 2370} {"train_loss": -6.328230857849121, "global_step": 99572, "epoch": 2370} {"train_loss": -6.426968574523926, "global_step": 99573, "epoch": 2370} {"train_loss": -6.272093772888184, "global_step": 99574, "epoch": 2370} {"train_loss": -6.264583587646484, "global_step": 99575, "epoch": 2370} {"train_loss": -6.316263198852539, "global_step": 99576, "epoch": 2370} {"train_loss": -6.259524345397949, "global_step": 99577, "epoch": 2370} {"train_loss": -6.301109790802002, "global_step": 99578, "epoch": 2370} {"train_loss": -6.3783063888549805, "global_step": 99579, "epoch": 2370} {"train_loss": -6.1331634521484375, "global_step": 99580, "epoch": 2370} {"train_loss": -6.3297093368711925, "global_step": 99581, "epoch": 2370, "val_loss": 68055.8359375} {"train_loss": -6.187967777252197, "global_step": 99582, "epoch": 2371} {"train_loss": -6.412319660186768, "global_step": 99583, "epoch": 2371} {"train_loss": -6.282934665679932, "global_step": 99584, "epoch": 2371} {"train_loss": -6.298205375671387, "global_step": 99585, "epoch": 2371} {"train_loss": -6.304078102111816, "global_step": 99586, "epoch": 2371} {"train_loss": -6.436069488525391, "global_step": 99587, "epoch": 2371} {"train_loss": -6.395930290222168, "global_step": 99588, "epoch": 2371} {"train_loss": -6.28151798248291, "global_step": 99589, "epoch": 2371} {"train_loss": -6.273920059204102, "global_step": 99590, "epoch": 2371} {"train_loss": -6.425379753112793, "global_step": 99591, "epoch": 2371} {"train_loss": -6.296846389770508, "global_step": 99592, "epoch": 2371} {"train_loss": -6.370304107666016, "global_step": 99593, "epoch": 2371} {"train_loss": -6.394451141357422, "global_step": 99594, "epoch": 2371} {"train_loss": -6.361670970916748, "global_step": 99595, "epoch": 2371} {"train_loss": -6.4413862228393555, "global_step": 99596, "epoch": 2371} {"train_loss": -6.385692596435547, "global_step": 99597, "epoch": 2371} {"train_loss": -6.25051736831665, "global_step": 99598, "epoch": 2371} {"train_loss": -6.3562116622924805, "global_step": 99599, "epoch": 2371} {"train_loss": -6.387485504150391, "global_step": 99600, "epoch": 2371} {"train_loss": -6.266666889190674, "global_step": 99601, "epoch": 2371} {"train_loss": -6.427937030792236, "global_step": 99602, "epoch": 2371} {"train_loss": -6.337369441986084, "global_step": 99603, "epoch": 2371} {"train_loss": -6.336120128631592, "global_step": 99604, "epoch": 2371} {"train_loss": -6.380922794342041, "global_step": 99605, "epoch": 2371} {"train_loss": -6.458730697631836, "global_step": 99606, "epoch": 2371} {"train_loss": -6.345251083374023, "global_step": 99607, "epoch": 2371} {"train_loss": -6.461546421051025, "global_step": 99608, "epoch": 2371} {"train_loss": -6.305215358734131, "global_step": 99609, "epoch": 2371} {"train_loss": -6.479404926300049, "global_step": 99610, "epoch": 2371} {"train_loss": -6.33629035949707, "global_step": 99611, "epoch": 2371} {"train_loss": -6.253968238830566, "global_step": 99612, "epoch": 2371} {"train_loss": -6.349904537200928, "global_step": 99613, "epoch": 2371} {"train_loss": -6.318363189697266, "global_step": 99614, "epoch": 2371} {"train_loss": -6.336519241333008, "global_step": 99615, "epoch": 2371} {"train_loss": -6.341497898101807, "global_step": 99616, "epoch": 2371} {"train_loss": -6.303403854370117, "global_step": 99617, "epoch": 2371} {"train_loss": -6.317538261413574, "global_step": 99618, "epoch": 2371} {"train_loss": -6.271816730499268, "global_step": 99619, "epoch": 2371} {"train_loss": -6.425684928894043, "global_step": 99620, "epoch": 2371} {"train_loss": -6.337451934814453, "global_step": 99621, "epoch": 2371} {"train_loss": -6.279486656188965, "global_step": 99622, "epoch": 2371} {"train_loss": -6.345912172680809, "global_step": 99623, "epoch": 2371, "val_loss": 68011.578125} {"train_loss": -6.385916709899902, "global_step": 99624, "epoch": 2372} {"train_loss": -6.434717178344727, "global_step": 99625, "epoch": 2372} {"train_loss": -6.402325630187988, "global_step": 99626, "epoch": 2372} {"train_loss": -6.299250602722168, "global_step": 99627, "epoch": 2372} {"train_loss": -6.299783706665039, "global_step": 99628, "epoch": 2372} {"train_loss": -6.409592628479004, "global_step": 99629, "epoch": 2372} {"train_loss": -6.206926345825195, "global_step": 99630, "epoch": 2372} {"train_loss": -6.298835277557373, "global_step": 99631, "epoch": 2372} {"train_loss": -6.364455223083496, "global_step": 99632, "epoch": 2372} {"train_loss": -6.21198844909668, "global_step": 99633, "epoch": 2372} {"train_loss": -6.430699348449707, "global_step": 99634, "epoch": 2372} {"train_loss": -6.212433815002441, "global_step": 99635, "epoch": 2372} {"train_loss": -6.351962089538574, "global_step": 99636, "epoch": 2372} {"train_loss": -6.420604705810547, "global_step": 99637, "epoch": 2372} {"train_loss": -6.345320224761963, "global_step": 99638, "epoch": 2372} {"train_loss": -6.303829669952393, "global_step": 99639, "epoch": 2372} {"train_loss": -6.346443176269531, "global_step": 99640, "epoch": 2372} {"train_loss": -6.381967544555664, "global_step": 99641, "epoch": 2372} {"train_loss": -6.409850120544434, "global_step": 99642, "epoch": 2372} {"train_loss": -6.390398979187012, "global_step": 99643, "epoch": 2372} {"train_loss": -6.296609401702881, "global_step": 99644, "epoch": 2372} {"train_loss": -6.500805854797363, "global_step": 99645, "epoch": 2372} {"train_loss": -6.455264091491699, "global_step": 99646, "epoch": 2372} {"train_loss": -6.364611625671387, "global_step": 99647, "epoch": 2372} {"train_loss": -6.501913547515869, "global_step": 99648, "epoch": 2372} {"train_loss": -6.523399353027344, "global_step": 99649, "epoch": 2372} {"train_loss": -6.354390621185303, "global_step": 99650, "epoch": 2372} {"train_loss": -6.292023658752441, "global_step": 99651, "epoch": 2372} {"train_loss": -6.184025764465332, "global_step": 99652, "epoch": 2372} {"train_loss": -6.287158966064453, "global_step": 99653, "epoch": 2372} {"train_loss": -6.321479320526123, "global_step": 99654, "epoch": 2372} {"train_loss": -6.169000148773193, "global_step": 99655, "epoch": 2372} {"train_loss": -6.259731769561768, "global_step": 99656, "epoch": 2372} {"train_loss": -6.2978129386901855, "global_step": 99657, "epoch": 2372} {"train_loss": -6.147412300109863, "global_step": 99658, "epoch": 2372} {"train_loss": -6.383075714111328, "global_step": 99659, "epoch": 2372} {"train_loss": -6.2552289962768555, "global_step": 99660, "epoch": 2372} {"train_loss": -6.172430038452148, "global_step": 99661, "epoch": 2372} {"train_loss": -6.140836238861084, "global_step": 99662, "epoch": 2372} {"train_loss": -6.160848617553711, "global_step": 99663, "epoch": 2372} {"train_loss": -6.1822967529296875, "global_step": 99664, "epoch": 2372} {"train_loss": -6.315286170868647, "global_step": 99665, "epoch": 2372, "val_loss": 68122.7265625} {"train_loss": -6.235994338989258, "global_step": 99666, "epoch": 2373} {"train_loss": -6.241018295288086, "global_step": 99667, "epoch": 2373} {"train_loss": -6.287066459655762, "global_step": 99668, "epoch": 2373} {"train_loss": -6.176165580749512, "global_step": 99669, "epoch": 2373} {"train_loss": -6.257948398590088, "global_step": 99670, "epoch": 2373} {"train_loss": -6.27514123916626, "global_step": 99671, "epoch": 2373} {"train_loss": -6.376179218292236, "global_step": 99672, "epoch": 2373} {"train_loss": -6.2544941902160645, "global_step": 99673, "epoch": 2373} {"train_loss": -6.158872127532959, "global_step": 99674, "epoch": 2373} {"train_loss": -6.297736644744873, "global_step": 99675, "epoch": 2373} {"train_loss": -6.271069526672363, "global_step": 99676, "epoch": 2373} {"train_loss": -6.442013740539551, "global_step": 99677, "epoch": 2373} {"train_loss": -6.313170433044434, "global_step": 99678, "epoch": 2373} {"train_loss": -6.273810386657715, "global_step": 99679, "epoch": 2373} {"train_loss": -6.344266414642334, "global_step": 99680, "epoch": 2373} {"train_loss": -6.4020209312438965, "global_step": 99681, "epoch": 2373} {"train_loss": -6.322212219238281, "global_step": 99682, "epoch": 2373} {"train_loss": -6.278386116027832, "global_step": 99683, "epoch": 2373} {"train_loss": -6.340683460235596, "global_step": 99684, "epoch": 2373} {"train_loss": -6.449272155761719, "global_step": 99685, "epoch": 2373} {"train_loss": -6.205286502838135, "global_step": 99686, "epoch": 2373} {"train_loss": -6.352129936218262, "global_step": 99687, "epoch": 2373} {"train_loss": -6.318039417266846, "global_step": 99688, "epoch": 2373} {"train_loss": -6.3101959228515625, "global_step": 99689, "epoch": 2373} {"train_loss": -6.314501762390137, "global_step": 99690, "epoch": 2373} {"train_loss": -6.305949687957764, "global_step": 99691, "epoch": 2373} {"train_loss": -6.339700698852539, "global_step": 99692, "epoch": 2373} {"train_loss": -6.383835792541504, "global_step": 99693, "epoch": 2373} {"train_loss": -6.447268486022949, "global_step": 99694, "epoch": 2373} {"train_loss": -6.371830940246582, "global_step": 99695, "epoch": 2373} {"train_loss": -6.351726531982422, "global_step": 99696, "epoch": 2373} {"train_loss": -6.384030342102051, "global_step": 99697, "epoch": 2373} {"train_loss": -6.299216270446777, "global_step": 99698, "epoch": 2373} {"train_loss": -6.459511756896973, "global_step": 99699, "epoch": 2373} {"train_loss": -6.200641632080078, "global_step": 99700, "epoch": 2373} {"train_loss": -6.228930473327637, "global_step": 99701, "epoch": 2373} {"train_loss": -6.360208511352539, "global_step": 99702, "epoch": 2373} {"train_loss": -6.467747688293457, "global_step": 99703, "epoch": 2373} {"train_loss": -6.359445095062256, "global_step": 99704, "epoch": 2373} {"train_loss": -6.34544038772583, "global_step": 99705, "epoch": 2373} {"train_loss": -6.363130569458008, "global_step": 99706, "epoch": 2373} {"train_loss": -6.32112869762239, "global_step": 99707, "epoch": 2373, "val_loss": 67861.84375} {"train_loss": -6.197296619415283, "global_step": 99708, "epoch": 2374} {"train_loss": -6.399266242980957, "global_step": 99709, "epoch": 2374} {"train_loss": -6.378142356872559, "global_step": 99710, "epoch": 2374} {"train_loss": -6.255336284637451, "global_step": 99711, "epoch": 2374} {"train_loss": -6.362331867218018, "global_step": 99712, "epoch": 2374} {"train_loss": -6.493446350097656, "global_step": 99713, "epoch": 2374} {"train_loss": -6.447455883026123, "global_step": 99714, "epoch": 2374} {"train_loss": -6.290604591369629, "global_step": 99715, "epoch": 2374} {"train_loss": -6.422606468200684, "global_step": 99716, "epoch": 2374} {"train_loss": -6.300192832946777, "global_step": 99717, "epoch": 2374} {"train_loss": -6.390314102172852, "global_step": 99718, "epoch": 2374} {"train_loss": -6.371365547180176, "global_step": 99719, "epoch": 2374} {"train_loss": -6.368564128875732, "global_step": 99720, "epoch": 2374} {"train_loss": -6.480669975280762, "global_step": 99721, "epoch": 2374} {"train_loss": -6.3956451416015625, "global_step": 99722, "epoch": 2374} {"train_loss": -6.278902053833008, "global_step": 99723, "epoch": 2374} {"train_loss": -6.440717697143555, "global_step": 99724, "epoch": 2374} {"train_loss": -6.401496887207031, "global_step": 99725, "epoch": 2374} {"train_loss": -6.3522844314575195, "global_step": 99726, "epoch": 2374} {"train_loss": -6.363022804260254, "global_step": 99727, "epoch": 2374} {"train_loss": -6.390141487121582, "global_step": 99728, "epoch": 2374} {"train_loss": -6.350473403930664, "global_step": 99729, "epoch": 2374} {"train_loss": -6.420686721801758, "global_step": 99730, "epoch": 2374} {"train_loss": -6.435171127319336, "global_step": 99731, "epoch": 2374} {"train_loss": -6.395554542541504, "global_step": 99732, "epoch": 2374} {"train_loss": -6.298285484313965, "global_step": 99733, "epoch": 2374} {"train_loss": -6.417291641235352, "global_step": 99734, "epoch": 2374} {"train_loss": -6.270008087158203, "global_step": 99735, "epoch": 2374} {"train_loss": -6.299304008483887, "global_step": 99736, "epoch": 2374} {"train_loss": -6.4673051834106445, "global_step": 99737, "epoch": 2374} {"train_loss": -6.316287517547607, "global_step": 99738, "epoch": 2374} {"train_loss": -6.406274795532227, "global_step": 99739, "epoch": 2374} {"train_loss": -6.3166351318359375, "global_step": 99740, "epoch": 2374} {"train_loss": -6.363160133361816, "global_step": 99741, "epoch": 2374} {"train_loss": -6.232545852661133, "global_step": 99742, "epoch": 2374} {"train_loss": -6.288667678833008, "global_step": 99743, "epoch": 2374} {"train_loss": -6.244135856628418, "global_step": 99744, "epoch": 2374} {"train_loss": -6.272393226623535, "global_step": 99745, "epoch": 2374} {"train_loss": -6.371399879455566, "global_step": 99746, "epoch": 2374} {"train_loss": -6.341159820556641, "global_step": 99747, "epoch": 2374} {"train_loss": -6.419827461242676, "global_step": 99748, "epoch": 2374} {"train_loss": -6.358161449432373, "global_step": 99749, "epoch": 2374, "val_loss": 67850.109375} {"train_loss": -6.28923225402832, "global_step": 99750, "epoch": 2375} {"train_loss": -6.347123146057129, "global_step": 99751, "epoch": 2375} {"train_loss": -6.287468910217285, "global_step": 99752, "epoch": 2375} {"train_loss": -6.365984916687012, "global_step": 99753, "epoch": 2375} {"train_loss": -6.434549331665039, "global_step": 99754, "epoch": 2375} {"train_loss": -6.3536272048950195, "global_step": 99755, "epoch": 2375} {"train_loss": -6.378389358520508, "global_step": 99756, "epoch": 2375} {"train_loss": -6.286640644073486, "global_step": 99757, "epoch": 2375} {"train_loss": -6.286670684814453, "global_step": 99758, "epoch": 2375} {"train_loss": -6.291919231414795, "global_step": 99759, "epoch": 2375} {"train_loss": -6.316999435424805, "global_step": 99760, "epoch": 2375} {"train_loss": -6.272671222686768, "global_step": 99761, "epoch": 2375} {"train_loss": -6.367088317871094, "global_step": 99762, "epoch": 2375} {"train_loss": -6.30937385559082, "global_step": 99763, "epoch": 2375} {"train_loss": -6.348761081695557, "global_step": 99764, "epoch": 2375} {"train_loss": -6.334666728973389, "global_step": 99765, "epoch": 2375} {"train_loss": -6.238565444946289, "global_step": 99766, "epoch": 2375} {"train_loss": -6.196082592010498, "global_step": 99767, "epoch": 2375} {"train_loss": -6.381234169006348, "global_step": 99768, "epoch": 2375} {"train_loss": -6.289318084716797, "global_step": 99769, "epoch": 2375} {"train_loss": -6.367709159851074, "global_step": 99770, "epoch": 2375} {"train_loss": -6.429924964904785, "global_step": 99771, "epoch": 2375} {"train_loss": -6.314788818359375, "global_step": 99772, "epoch": 2375} {"train_loss": -6.334831237792969, "global_step": 99773, "epoch": 2375} {"train_loss": -6.451138496398926, "global_step": 99774, "epoch": 2375} {"train_loss": -6.388042449951172, "global_step": 99775, "epoch": 2375} {"train_loss": -6.447443962097168, "global_step": 99776, "epoch": 2375} {"train_loss": -6.365720272064209, "global_step": 99777, "epoch": 2375} {"train_loss": -6.4160871505737305, "global_step": 99778, "epoch": 2375} {"train_loss": -6.330482482910156, "global_step": 99779, "epoch": 2375} {"train_loss": -6.313973426818848, "global_step": 99780, "epoch": 2375} {"train_loss": -6.377251148223877, "global_step": 99781, "epoch": 2375} {"train_loss": -6.504452228546143, "global_step": 99782, "epoch": 2375} {"train_loss": -6.326066493988037, "global_step": 99783, "epoch": 2375} {"train_loss": -6.38646125793457, "global_step": 99784, "epoch": 2375} {"train_loss": -6.40411376953125, "global_step": 99785, "epoch": 2375} {"train_loss": -6.29777717590332, "global_step": 99786, "epoch": 2375} {"train_loss": -6.3666887283325195, "global_step": 99787, "epoch": 2375} {"train_loss": -6.363544464111328, "global_step": 99788, "epoch": 2375} {"train_loss": -6.415078639984131, "global_step": 99789, "epoch": 2375} {"train_loss": -6.423286437988281, "global_step": 99790, "epoch": 2375} {"train_loss": -6.348860014052618, "global_step": 99791, "epoch": 2375, "val_loss": 68078.90625} {"train_loss": -6.345300197601318, "global_step": 99792, "epoch": 2376} {"train_loss": -6.322688102722168, "global_step": 99793, "epoch": 2376} {"train_loss": -6.416306018829346, "global_step": 99794, "epoch": 2376} {"train_loss": -6.361108303070068, "global_step": 99795, "epoch": 2376} {"train_loss": -6.431537628173828, "global_step": 99796, "epoch": 2376} {"train_loss": -6.437247276306152, "global_step": 99797, "epoch": 2376} {"train_loss": -6.381925582885742, "global_step": 99798, "epoch": 2376} {"train_loss": -6.35359001159668, "global_step": 99799, "epoch": 2376} {"train_loss": -6.326740264892578, "global_step": 99800, "epoch": 2376} {"train_loss": -6.344991683959961, "global_step": 99801, "epoch": 2376} {"train_loss": -6.3185906410217285, "global_step": 99802, "epoch": 2376} {"train_loss": -6.3860626220703125, "global_step": 99803, "epoch": 2376} {"train_loss": -6.458033561706543, "global_step": 99804, "epoch": 2376} {"train_loss": -6.305355072021484, "global_step": 99805, "epoch": 2376} {"train_loss": -6.441205978393555, "global_step": 99806, "epoch": 2376} {"train_loss": -6.339568138122559, "global_step": 99807, "epoch": 2376} {"train_loss": -6.365371227264404, "global_step": 99808, "epoch": 2376} {"train_loss": -6.398095607757568, "global_step": 99809, "epoch": 2376} {"train_loss": -6.272334098815918, "global_step": 99810, "epoch": 2376} {"train_loss": -6.23990535736084, "global_step": 99811, "epoch": 2376} {"train_loss": -6.3056111335754395, "global_step": 99812, "epoch": 2376} {"train_loss": -6.234679222106934, "global_step": 99813, "epoch": 2376} {"train_loss": -6.270557403564453, "global_step": 99814, "epoch": 2376} {"train_loss": -6.387974262237549, "global_step": 99815, "epoch": 2376} {"train_loss": -6.251288414001465, "global_step": 99816, "epoch": 2376} {"train_loss": -6.229979991912842, "global_step": 99817, "epoch": 2376} {"train_loss": -6.361126899719238, "global_step": 99818, "epoch": 2376} {"train_loss": -6.203516483306885, "global_step": 99819, "epoch": 2376} {"train_loss": -6.30374813079834, "global_step": 99820, "epoch": 2376} {"train_loss": -6.226324558258057, "global_step": 99821, "epoch": 2376} {"train_loss": -6.289863586425781, "global_step": 99822, "epoch": 2376} {"train_loss": -6.365904331207275, "global_step": 99823, "epoch": 2376} {"train_loss": -6.380421161651611, "global_step": 99824, "epoch": 2376} {"train_loss": -6.322138786315918, "global_step": 99825, "epoch": 2376} {"train_loss": -6.249102592468262, "global_step": 99826, "epoch": 2376} {"train_loss": -6.3982625007629395, "global_step": 99827, "epoch": 2376} {"train_loss": -6.308831214904785, "global_step": 99828, "epoch": 2376} {"train_loss": -6.353382587432861, "global_step": 99829, "epoch": 2376} {"train_loss": -6.431365489959717, "global_step": 99830, "epoch": 2376} {"train_loss": -6.438919544219971, "global_step": 99831, "epoch": 2376} {"train_loss": -6.393459796905518, "global_step": 99832, "epoch": 2376} {"train_loss": -6.339071307863508, "global_step": 99833, "epoch": 2376, "val_loss": 67916.3515625} {"train_loss": -6.464568614959717, "global_step": 99834, "epoch": 2377} {"train_loss": -6.274641990661621, "global_step": 99835, "epoch": 2377} {"train_loss": -6.388328552246094, "global_step": 99836, "epoch": 2377} {"train_loss": -6.34912109375, "global_step": 99837, "epoch": 2377} {"train_loss": -6.41523551940918, "global_step": 99838, "epoch": 2377} {"train_loss": -6.209651947021484, "global_step": 99839, "epoch": 2377} {"train_loss": -6.379547119140625, "global_step": 99840, "epoch": 2377} {"train_loss": -6.378419876098633, "global_step": 99841, "epoch": 2377} {"train_loss": -6.3263750076293945, "global_step": 99842, "epoch": 2377} {"train_loss": -6.29587459564209, "global_step": 99843, "epoch": 2377} {"train_loss": -6.357877731323242, "global_step": 99844, "epoch": 2377} {"train_loss": -6.418193817138672, "global_step": 99845, "epoch": 2377} {"train_loss": -6.356985092163086, "global_step": 99846, "epoch": 2377} {"train_loss": -6.352325916290283, "global_step": 99847, "epoch": 2377} {"train_loss": -6.319620132446289, "global_step": 99848, "epoch": 2377} {"train_loss": -6.260171890258789, "global_step": 99849, "epoch": 2377} {"train_loss": -6.34267520904541, "global_step": 99850, "epoch": 2377} {"train_loss": -6.229805946350098, "global_step": 99851, "epoch": 2377} {"train_loss": -6.419259548187256, "global_step": 99852, "epoch": 2377} {"train_loss": -6.381451606750488, "global_step": 99853, "epoch": 2377} {"train_loss": -6.255348205566406, "global_step": 99854, "epoch": 2377} {"train_loss": -6.330204010009766, "global_step": 99855, "epoch": 2377} {"train_loss": -6.431194305419922, "global_step": 99856, "epoch": 2377} {"train_loss": -6.317788124084473, "global_step": 99857, "epoch": 2377} {"train_loss": -6.219480037689209, "global_step": 99858, "epoch": 2377} {"train_loss": -6.390865325927734, "global_step": 99859, "epoch": 2377} {"train_loss": -6.393531799316406, "global_step": 99860, "epoch": 2377} {"train_loss": -6.328396797180176, "global_step": 99861, "epoch": 2377} {"train_loss": -6.3001017570495605, "global_step": 99862, "epoch": 2377} {"train_loss": -6.366823673248291, "global_step": 99863, "epoch": 2377} {"train_loss": -6.382858753204346, "global_step": 99864, "epoch": 2377} {"train_loss": -6.317498683929443, "global_step": 99865, "epoch": 2377} {"train_loss": -6.470727920532227, "global_step": 99866, "epoch": 2377} {"train_loss": -6.218767166137695, "global_step": 99867, "epoch": 2377} {"train_loss": -6.358253479003906, "global_step": 99868, "epoch": 2377} {"train_loss": -6.3808488845825195, "global_step": 99869, "epoch": 2377} {"train_loss": -6.391185760498047, "global_step": 99870, "epoch": 2377} {"train_loss": -6.38491153717041, "global_step": 99871, "epoch": 2377} {"train_loss": -6.231471061706543, "global_step": 99872, "epoch": 2377} {"train_loss": -6.294613838195801, "global_step": 99873, "epoch": 2377} {"train_loss": -6.350988388061523, "global_step": 99874, "epoch": 2377} {"train_loss": -6.339730626060849, "global_step": 99875, "epoch": 2377, "val_loss": 67860.5859375} {"train_loss": -6.328022480010986, "global_step": 99876, "epoch": 2378} {"train_loss": -6.294318199157715, "global_step": 99877, "epoch": 2378} {"train_loss": -6.362270355224609, "global_step": 99878, "epoch": 2378} {"train_loss": -6.217201232910156, "global_step": 99879, "epoch": 2378} {"train_loss": -6.238701820373535, "global_step": 99880, "epoch": 2378} {"train_loss": -6.406442165374756, "global_step": 99881, "epoch": 2378} {"train_loss": -6.192471027374268, "global_step": 99882, "epoch": 2378} {"train_loss": -6.36635684967041, "global_step": 99883, "epoch": 2378} {"train_loss": -6.245800018310547, "global_step": 99884, "epoch": 2378} {"train_loss": -6.429017066955566, "global_step": 99885, "epoch": 2378} {"train_loss": -6.243610382080078, "global_step": 99886, "epoch": 2378} {"train_loss": -6.398691654205322, "global_step": 99887, "epoch": 2378} {"train_loss": -6.197430610656738, "global_step": 99888, "epoch": 2378} {"train_loss": -6.247795104980469, "global_step": 99889, "epoch": 2378} {"train_loss": -6.3647308349609375, "global_step": 99890, "epoch": 2378} {"train_loss": -6.2580108642578125, "global_step": 99891, "epoch": 2378} {"train_loss": -6.073693752288818, "global_step": 99892, "epoch": 2378} {"train_loss": -6.376375675201416, "global_step": 99893, "epoch": 2378} {"train_loss": -6.137263298034668, "global_step": 99894, "epoch": 2378} {"train_loss": -6.165834426879883, "global_step": 99895, "epoch": 2378} {"train_loss": -6.262999057769775, "global_step": 99896, "epoch": 2378} {"train_loss": -6.259706020355225, "global_step": 99897, "epoch": 2378} {"train_loss": -6.23219633102417, "global_step": 99898, "epoch": 2378} {"train_loss": -6.20059871673584, "global_step": 99899, "epoch": 2378} {"train_loss": -6.284490585327148, "global_step": 99900, "epoch": 2378} {"train_loss": -6.25865364074707, "global_step": 99901, "epoch": 2378} {"train_loss": -6.305315017700195, "global_step": 99902, "epoch": 2378} {"train_loss": -6.1513190269470215, "global_step": 99903, "epoch": 2378} {"train_loss": -6.211274147033691, "global_step": 99904, "epoch": 2378} {"train_loss": -6.318722724914551, "global_step": 99905, "epoch": 2378} {"train_loss": -6.210143089294434, "global_step": 99906, "epoch": 2378} {"train_loss": -6.336493968963623, "global_step": 99907, "epoch": 2378} {"train_loss": -6.344108581542969, "global_step": 99908, "epoch": 2378} {"train_loss": -6.359857559204102, "global_step": 99909, "epoch": 2378} {"train_loss": -6.342310905456543, "global_step": 99910, "epoch": 2378} {"train_loss": -6.429627418518066, "global_step": 99911, "epoch": 2378} {"train_loss": -6.333522796630859, "global_step": 99912, "epoch": 2378} {"train_loss": -6.296436309814453, "global_step": 99913, "epoch": 2378} {"train_loss": -6.308734893798828, "global_step": 99914, "epoch": 2378} {"train_loss": -6.318511962890625, "global_step": 99915, "epoch": 2378} {"train_loss": -6.381979942321777, "global_step": 99916, "epoch": 2378} {"train_loss": -6.286658048629761, "global_step": 99917, "epoch": 2378, "val_loss": 67892.9453125} {"train_loss": -6.385275363922119, "global_step": 99918, "epoch": 2379} {"train_loss": -6.235474586486816, "global_step": 99919, "epoch": 2379} {"train_loss": -6.441659927368164, "global_step": 99920, "epoch": 2379} {"train_loss": -6.320204257965088, "global_step": 99921, "epoch": 2379} {"train_loss": -6.297239780426025, "global_step": 99922, "epoch": 2379} {"train_loss": -6.457985877990723, "global_step": 99923, "epoch": 2379} {"train_loss": -6.329571723937988, "global_step": 99924, "epoch": 2379} {"train_loss": -6.474452018737793, "global_step": 99925, "epoch": 2379} {"train_loss": -6.418318271636963, "global_step": 99926, "epoch": 2379} {"train_loss": -6.426273345947266, "global_step": 99927, "epoch": 2379} {"train_loss": -6.345843315124512, "global_step": 99928, "epoch": 2379} {"train_loss": -6.2338666915893555, "global_step": 99929, "epoch": 2379} {"train_loss": -6.359363555908203, "global_step": 99930, "epoch": 2379} {"train_loss": -6.274190902709961, "global_step": 99931, "epoch": 2379} {"train_loss": -6.457082748413086, "global_step": 99932, "epoch": 2379} {"train_loss": -6.41478157043457, "global_step": 99933, "epoch": 2379} {"train_loss": -6.395912170410156, "global_step": 99934, "epoch": 2379} {"train_loss": -6.347956657409668, "global_step": 99935, "epoch": 2379} {"train_loss": -6.345273971557617, "global_step": 99936, "epoch": 2379} {"train_loss": -6.316631317138672, "global_step": 99937, "epoch": 2379} {"train_loss": -6.331411838531494, "global_step": 99938, "epoch": 2379} {"train_loss": -6.273388862609863, "global_step": 99939, "epoch": 2379} {"train_loss": -6.369329452514648, "global_step": 99940, "epoch": 2379} {"train_loss": -6.221878528594971, "global_step": 99941, "epoch": 2379} {"train_loss": -6.207135200500488, "global_step": 99942, "epoch": 2379} {"train_loss": -6.453289031982422, "global_step": 99943, "epoch": 2379} {"train_loss": -6.277987003326416, "global_step": 99944, "epoch": 2379} {"train_loss": -6.225295066833496, "global_step": 99945, "epoch": 2379} {"train_loss": -6.340231418609619, "global_step": 99946, "epoch": 2379} {"train_loss": -6.305488109588623, "global_step": 99947, "epoch": 2379} {"train_loss": -6.400323390960693, "global_step": 99948, "epoch": 2379} {"train_loss": -6.340890407562256, "global_step": 99949, "epoch": 2379} {"train_loss": -6.3461456298828125, "global_step": 99950, "epoch": 2379} {"train_loss": -6.314342498779297, "global_step": 99951, "epoch": 2379} {"train_loss": -6.236812114715576, "global_step": 99952, "epoch": 2379} {"train_loss": -6.228493690490723, "global_step": 99953, "epoch": 2379} {"train_loss": -6.269708633422852, "global_step": 99954, "epoch": 2379} {"train_loss": -6.410113334655762, "global_step": 99955, "epoch": 2379} {"train_loss": -6.359712600708008, "global_step": 99956, "epoch": 2379} {"train_loss": -6.436637878417969, "global_step": 99957, "epoch": 2379} {"train_loss": -6.427521705627441, "global_step": 99958, "epoch": 2379} {"train_loss": -6.339847144626436, "global_step": 99959, "epoch": 2379, "val_loss": 67850.3984375} {"train_loss": -6.383023738861084, "global_step": 99960, "epoch": 2380} {"train_loss": -6.212523937225342, "global_step": 99961, "epoch": 2380} {"train_loss": -6.316929817199707, "global_step": 99962, "epoch": 2380} {"train_loss": -6.357879638671875, "global_step": 99963, "epoch": 2380} {"train_loss": -6.233067512512207, "global_step": 99964, "epoch": 2380} {"train_loss": -6.3190202713012695, "global_step": 99965, "epoch": 2380} {"train_loss": -6.352036476135254, "global_step": 99966, "epoch": 2380} {"train_loss": -6.214625358581543, "global_step": 99967, "epoch": 2380} {"train_loss": -6.159959316253662, "global_step": 99968, "epoch": 2380} {"train_loss": -6.262848377227783, "global_step": 99969, "epoch": 2380} {"train_loss": -6.188327312469482, "global_step": 99970, "epoch": 2380} {"train_loss": -6.1422624588012695, "global_step": 99971, "epoch": 2380} {"train_loss": -6.245179176330566, "global_step": 99972, "epoch": 2380} {"train_loss": -6.12653923034668, "global_step": 99973, "epoch": 2380} {"train_loss": -6.2659077644348145, "global_step": 99974, "epoch": 2380} {"train_loss": -6.190104007720947, "global_step": 99975, "epoch": 2380} {"train_loss": -6.300627708435059, "global_step": 99976, "epoch": 2380} {"train_loss": -5.980023384094238, "global_step": 99977, "epoch": 2380} {"train_loss": -6.26430606842041, "global_step": 99978, "epoch": 2380} {"train_loss": -6.183244705200195, "global_step": 99979, "epoch": 2380} {"train_loss": -6.061701774597168, "global_step": 99980, "epoch": 2380} {"train_loss": -6.112085819244385, "global_step": 99981, "epoch": 2380} {"train_loss": -6.3043622970581055, "global_step": 99982, "epoch": 2380} {"train_loss": -6.167285442352295, "global_step": 99983, "epoch": 2380} {"train_loss": -6.2006659507751465, "global_step": 99984, "epoch": 2380} {"train_loss": -6.24887228012085, "global_step": 99985, "epoch": 2380} {"train_loss": -6.074673652648926, "global_step": 99986, "epoch": 2380} {"train_loss": -6.2855329513549805, "global_step": 99987, "epoch": 2380} {"train_loss": -6.2804365158081055, "global_step": 99988, "epoch": 2380} {"train_loss": -6.216826915740967, "global_step": 99989, "epoch": 2380} {"train_loss": -6.027408599853516, "global_step": 99990, "epoch": 2380} {"train_loss": -6.1576247215271, "global_step": 99991, "epoch": 2380} {"train_loss": -6.192501068115234, "global_step": 99992, "epoch": 2380} {"train_loss": -6.203982830047607, "global_step": 99993, "epoch": 2380} {"train_loss": -6.2253499031066895, "global_step": 99994, "epoch": 2380} {"train_loss": -6.235785484313965, "global_step": 99995, "epoch": 2380} {"train_loss": -6.292031288146973, "global_step": 99996, "epoch": 2380} {"train_loss": -6.406846046447754, "global_step": 99997, "epoch": 2380} {"train_loss": -6.364628791809082, "global_step": 99998, "epoch": 2380} {"train_loss": -6.4131083488464355, "global_step": 99999, "epoch": 2380} {"train_loss": -6.427634239196777, "global_step": 100000, "epoch": 2380} {"train_loss": -6.234425646918161, "global_step": 100001, "epoch": 2380, "val_loss": 68023.828125} {"train_loss": -6.26313591003418, "global_step": 100002, "epoch": 2381} {"train_loss": -6.321230411529541, "global_step": 100003, "epoch": 2381} {"train_loss": -6.349059104919434, "global_step": 100004, "epoch": 2381} {"train_loss": -6.206822872161865, "global_step": 100005, "epoch": 2381} {"train_loss": -6.309011459350586, "global_step": 100006, "epoch": 2381} {"train_loss": -6.447324752807617, "global_step": 100007, "epoch": 2381} {"train_loss": -6.486783027648926, "global_step": 100008, "epoch": 2381} {"train_loss": -6.460393905639648, "global_step": 100009, "epoch": 2381} {"train_loss": -6.321833610534668, "global_step": 100010, "epoch": 2381} {"train_loss": -6.417318344116211, "global_step": 100011, "epoch": 2381} {"train_loss": -6.3488874435424805, "global_step": 100012, "epoch": 2381} {"train_loss": -6.496438980102539, "global_step": 100013, "epoch": 2381} {"train_loss": -6.326918125152588, "global_step": 100014, "epoch": 2381} {"train_loss": -6.365800857543945, "global_step": 100015, "epoch": 2381} {"train_loss": -6.394680500030518, "global_step": 100016, "epoch": 2381} {"train_loss": -6.432498455047607, "global_step": 100017, "epoch": 2381} {"train_loss": -6.365403652191162, "global_step": 100018, "epoch": 2381} {"train_loss": -6.3769121170043945, "global_step": 100019, "epoch": 2381} {"train_loss": -6.142045497894287, "global_step": 100020, "epoch": 2381} {"train_loss": -6.366986274719238, "global_step": 100021, "epoch": 2381} {"train_loss": -6.314453125, "global_step": 100022, "epoch": 2381} {"train_loss": -6.322131633758545, "global_step": 100023, "epoch": 2381} {"train_loss": -6.269615173339844, "global_step": 100024, "epoch": 2381} {"train_loss": -6.325780391693115, "global_step": 100025, "epoch": 2381} {"train_loss": -6.353933334350586, "global_step": 100026, "epoch": 2381} {"train_loss": -6.370020866394043, "global_step": 100027, "epoch": 2381} {"train_loss": -6.316713809967041, "global_step": 100028, "epoch": 2381} {"train_loss": -6.38463020324707, "global_step": 100029, "epoch": 2381} {"train_loss": -6.343635559082031, "global_step": 100030, "epoch": 2381} {"train_loss": -6.39846134185791, "global_step": 100031, "epoch": 2381} {"train_loss": -6.351176738739014, "global_step": 100032, "epoch": 2381} {"train_loss": -6.228381156921387, "global_step": 100033, "epoch": 2381} {"train_loss": -6.411938667297363, "global_step": 100034, "epoch": 2381} {"train_loss": -6.440850257873535, "global_step": 100035, "epoch": 2381} {"train_loss": -6.4431657791137695, "global_step": 100036, "epoch": 2381} {"train_loss": -6.331240653991699, "global_step": 100037, "epoch": 2381} {"train_loss": -6.298498630523682, "global_step": 100038, "epoch": 2381} {"train_loss": -6.4356279373168945, "global_step": 100039, "epoch": 2381} {"train_loss": -6.315526008605957, "global_step": 100040, "epoch": 2381} {"train_loss": -6.4065327644348145, "global_step": 100041, "epoch": 2381} {"train_loss": -6.441905975341797, "global_step": 100042, "epoch": 2381} {"train_loss": -6.355645452226911, "global_step": 100043, "epoch": 2381, "val_loss": 67818.984375} {"train_loss": -6.34619665145874, "global_step": 100044, "epoch": 2382} {"train_loss": -6.410743713378906, "global_step": 100045, "epoch": 2382} {"train_loss": -6.26865291595459, "global_step": 100046, "epoch": 2382} {"train_loss": -6.347011566162109, "global_step": 100047, "epoch": 2382} {"train_loss": -6.290143966674805, "global_step": 100048, "epoch": 2382} {"train_loss": -6.342428207397461, "global_step": 100049, "epoch": 2382} {"train_loss": -6.294502258300781, "global_step": 100050, "epoch": 2382} {"train_loss": -6.19770622253418, "global_step": 100051, "epoch": 2382} {"train_loss": -6.332036972045898, "global_step": 100052, "epoch": 2382} {"train_loss": -6.328641414642334, "global_step": 100053, "epoch": 2382} {"train_loss": -6.326137542724609, "global_step": 100054, "epoch": 2382} {"train_loss": -6.153266906738281, "global_step": 100055, "epoch": 2382} {"train_loss": -6.255130767822266, "global_step": 100056, "epoch": 2382} {"train_loss": -6.276150703430176, "global_step": 100057, "epoch": 2382} {"train_loss": -6.432605266571045, "global_step": 100058, "epoch": 2382} {"train_loss": -6.387728691101074, "global_step": 100059, "epoch": 2382} {"train_loss": -6.365199089050293, "global_step": 100060, "epoch": 2382} {"train_loss": -6.422931671142578, "global_step": 100061, "epoch": 2382} {"train_loss": -6.362973690032959, "global_step": 100062, "epoch": 2382} {"train_loss": -6.461265563964844, "global_step": 100063, "epoch": 2382} {"train_loss": -6.367020130157471, "global_step": 100064, "epoch": 2382} {"train_loss": -6.367292404174805, "global_step": 100065, "epoch": 2382} {"train_loss": -6.316638946533203, "global_step": 100066, "epoch": 2382} {"train_loss": -6.358746528625488, "global_step": 100067, "epoch": 2382} {"train_loss": -6.334644317626953, "global_step": 100068, "epoch": 2382} {"train_loss": -6.408048629760742, "global_step": 100069, "epoch": 2382} {"train_loss": -6.36560583114624, "global_step": 100070, "epoch": 2382} {"train_loss": -6.339513778686523, "global_step": 100071, "epoch": 2382} {"train_loss": -6.485551834106445, "global_step": 100072, "epoch": 2382} {"train_loss": -6.396584510803223, "global_step": 100073, "epoch": 2382} {"train_loss": -6.341696739196777, "global_step": 100074, "epoch": 2382} {"train_loss": -6.565201759338379, "global_step": 100075, "epoch": 2382} {"train_loss": -6.294343948364258, "global_step": 100076, "epoch": 2382} {"train_loss": -6.3348388671875, "global_step": 100077, "epoch": 2382} {"train_loss": -6.3060479164123535, "global_step": 100078, "epoch": 2382} {"train_loss": -6.31948709487915, "global_step": 100079, "epoch": 2382} {"train_loss": -6.313865661621094, "global_step": 100080, "epoch": 2382} {"train_loss": -6.264326095581055, "global_step": 100081, "epoch": 2382} {"train_loss": -6.336750030517578, "global_step": 100082, "epoch": 2382} {"train_loss": -6.299755573272705, "global_step": 100083, "epoch": 2382} {"train_loss": -6.4643731117248535, "global_step": 100084, "epoch": 2382} {"train_loss": -6.346942935671125, "global_step": 100085, "epoch": 2382, "val_loss": 67847.453125} {"train_loss": -6.308207988739014, "global_step": 100086, "epoch": 2383} {"train_loss": -6.415555953979492, "global_step": 100087, "epoch": 2383} {"train_loss": -6.318695545196533, "global_step": 100088, "epoch": 2383} {"train_loss": -6.392549514770508, "global_step": 100089, "epoch": 2383} {"train_loss": -6.320058822631836, "global_step": 100090, "epoch": 2383} {"train_loss": -6.433599472045898, "global_step": 100091, "epoch": 2383} {"train_loss": -6.336613178253174, "global_step": 100092, "epoch": 2383} {"train_loss": -6.283595085144043, "global_step": 100093, "epoch": 2383} {"train_loss": -6.344627380371094, "global_step": 100094, "epoch": 2383} {"train_loss": -6.489955902099609, "global_step": 100095, "epoch": 2383} {"train_loss": -6.436036109924316, "global_step": 100096, "epoch": 2383} {"train_loss": -6.337096214294434, "global_step": 100097, "epoch": 2383} {"train_loss": -6.2438154220581055, "global_step": 100098, "epoch": 2383} {"train_loss": -6.376785755157471, "global_step": 100099, "epoch": 2383} {"train_loss": -6.302716255187988, "global_step": 100100, "epoch": 2383} {"train_loss": -6.392319679260254, "global_step": 100101, "epoch": 2383} {"train_loss": -6.312131881713867, "global_step": 100102, "epoch": 2383} {"train_loss": -6.4169921875, "global_step": 100103, "epoch": 2383} {"train_loss": -6.331910133361816, "global_step": 100104, "epoch": 2383} {"train_loss": -6.381478309631348, "global_step": 100105, "epoch": 2383} {"train_loss": -6.388189792633057, "global_step": 100106, "epoch": 2383} {"train_loss": -6.406670093536377, "global_step": 100107, "epoch": 2383} {"train_loss": -6.3331475257873535, "global_step": 100108, "epoch": 2383} {"train_loss": -6.331233978271484, "global_step": 100109, "epoch": 2383} {"train_loss": -6.361688137054443, "global_step": 100110, "epoch": 2383} {"train_loss": -6.312289237976074, "global_step": 100111, "epoch": 2383} {"train_loss": -6.335659980773926, "global_step": 100112, "epoch": 2383} {"train_loss": -6.300749778747559, "global_step": 100113, "epoch": 2383} {"train_loss": -6.390130043029785, "global_step": 100114, "epoch": 2383} {"train_loss": -6.323359966278076, "global_step": 100115, "epoch": 2383} {"train_loss": -6.408137321472168, "global_step": 100116, "epoch": 2383} {"train_loss": -6.29205322265625, "global_step": 100117, "epoch": 2383} {"train_loss": -6.369915962219238, "global_step": 100118, "epoch": 2383} {"train_loss": -6.354660987854004, "global_step": 100119, "epoch": 2383} {"train_loss": -6.32213020324707, "global_step": 100120, "epoch": 2383} {"train_loss": -6.322259426116943, "global_step": 100121, "epoch": 2383} {"train_loss": -6.336902618408203, "global_step": 100122, "epoch": 2383} {"train_loss": -6.290289878845215, "global_step": 100123, "epoch": 2383} {"train_loss": -6.382482528686523, "global_step": 100124, "epoch": 2383} {"train_loss": -6.320788383483887, "global_step": 100125, "epoch": 2383} {"train_loss": -6.3679399490356445, "global_step": 100126, "epoch": 2383} {"train_loss": -6.353228148959932, "global_step": 100127, "epoch": 2383, "val_loss": 67943.8125} {"train_loss": -6.303297519683838, "global_step": 100128, "epoch": 2384} {"train_loss": -6.329143524169922, "global_step": 100129, "epoch": 2384} {"train_loss": -6.345328330993652, "global_step": 100130, "epoch": 2384} {"train_loss": -6.433875560760498, "global_step": 100131, "epoch": 2384} {"train_loss": -6.4828877449035645, "global_step": 100132, "epoch": 2384} {"train_loss": -6.342977523803711, "global_step": 100133, "epoch": 2384} {"train_loss": -6.356712341308594, "global_step": 100134, "epoch": 2384} {"train_loss": -6.3890886306762695, "global_step": 100135, "epoch": 2384} {"train_loss": -6.304900169372559, "global_step": 100136, "epoch": 2384} {"train_loss": -6.369969844818115, "global_step": 100137, "epoch": 2384} {"train_loss": -6.3237786293029785, "global_step": 100138, "epoch": 2384} {"train_loss": -6.338564872741699, "global_step": 100139, "epoch": 2384} {"train_loss": -6.4029717445373535, "global_step": 100140, "epoch": 2384} {"train_loss": -6.293644905090332, "global_step": 100141, "epoch": 2384} {"train_loss": -6.415480613708496, "global_step": 100142, "epoch": 2384} {"train_loss": -6.271023750305176, "global_step": 100143, "epoch": 2384} {"train_loss": -6.573603630065918, "global_step": 100144, "epoch": 2384} {"train_loss": -6.367772102355957, "global_step": 100145, "epoch": 2384} {"train_loss": -6.371694564819336, "global_step": 100146, "epoch": 2384} {"train_loss": -6.410245895385742, "global_step": 100147, "epoch": 2384} {"train_loss": -6.382019996643066, "global_step": 100148, "epoch": 2384} {"train_loss": -6.3654022216796875, "global_step": 100149, "epoch": 2384} {"train_loss": -6.258888244628906, "global_step": 100150, "epoch": 2384} {"train_loss": -6.360976219177246, "global_step": 100151, "epoch": 2384} {"train_loss": -6.289897918701172, "global_step": 100152, "epoch": 2384} {"train_loss": -6.366513252258301, "global_step": 100153, "epoch": 2384} {"train_loss": -6.499697685241699, "global_step": 100154, "epoch": 2384} {"train_loss": -6.235469818115234, "global_step": 100155, "epoch": 2384} {"train_loss": -6.292352676391602, "global_step": 100156, "epoch": 2384} {"train_loss": -6.443206787109375, "global_step": 100157, "epoch": 2384} {"train_loss": -6.474453449249268, "global_step": 100158, "epoch": 2384} {"train_loss": -6.342591285705566, "global_step": 100159, "epoch": 2384} {"train_loss": -6.38252067565918, "global_step": 100160, "epoch": 2384} {"train_loss": -6.345758438110352, "global_step": 100161, "epoch": 2384} {"train_loss": -6.396124362945557, "global_step": 100162, "epoch": 2384} {"train_loss": -6.226823806762695, "global_step": 100163, "epoch": 2384} {"train_loss": -6.395918846130371, "global_step": 100164, "epoch": 2384} {"train_loss": -6.329662799835205, "global_step": 100165, "epoch": 2384} {"train_loss": -6.266432285308838, "global_step": 100166, "epoch": 2384} {"train_loss": -6.401768684387207, "global_step": 100167, "epoch": 2384} {"train_loss": -6.370379447937012, "global_step": 100168, "epoch": 2384} {"train_loss": -6.364152703966413, "global_step": 100169, "epoch": 2384, "val_loss": 68042.9140625} {"train_loss": -6.4108991622924805, "global_step": 100170, "epoch": 2385} {"train_loss": -6.203180313110352, "global_step": 100171, "epoch": 2385} {"train_loss": -6.415749549865723, "global_step": 100172, "epoch": 2385} {"train_loss": -6.403700828552246, "global_step": 100173, "epoch": 2385} {"train_loss": -6.324867248535156, "global_step": 100174, "epoch": 2385} {"train_loss": -6.26197624206543, "global_step": 100175, "epoch": 2385} {"train_loss": -6.2827372550964355, "global_step": 100176, "epoch": 2385} {"train_loss": -6.3774333000183105, "global_step": 100177, "epoch": 2385} {"train_loss": -6.329336166381836, "global_step": 100178, "epoch": 2385} {"train_loss": -6.3256001472473145, "global_step": 100179, "epoch": 2385} {"train_loss": -6.361192226409912, "global_step": 100180, "epoch": 2385} {"train_loss": -6.290007591247559, "global_step": 100181, "epoch": 2385} {"train_loss": -6.31265926361084, "global_step": 100182, "epoch": 2385} {"train_loss": -6.371668815612793, "global_step": 100183, "epoch": 2385} {"train_loss": -6.28678035736084, "global_step": 100184, "epoch": 2385} {"train_loss": -6.291441917419434, "global_step": 100185, "epoch": 2385} {"train_loss": -6.350020408630371, "global_step": 100186, "epoch": 2385} {"train_loss": -6.339232444763184, "global_step": 100187, "epoch": 2385} {"train_loss": -6.287624359130859, "global_step": 100188, "epoch": 2385} {"train_loss": -6.294760227203369, "global_step": 100189, "epoch": 2385} {"train_loss": -6.341009140014648, "global_step": 100190, "epoch": 2385} {"train_loss": -6.3995232582092285, "global_step": 100191, "epoch": 2385} {"train_loss": -6.203680038452148, "global_step": 100192, "epoch": 2385} {"train_loss": -6.219738960266113, "global_step": 100193, "epoch": 2385} {"train_loss": -6.233814239501953, "global_step": 100194, "epoch": 2385} {"train_loss": -6.290022850036621, "global_step": 100195, "epoch": 2385} {"train_loss": -6.24976110458374, "global_step": 100196, "epoch": 2385} {"train_loss": -6.321674346923828, "global_step": 100197, "epoch": 2385} {"train_loss": -6.458613395690918, "global_step": 100198, "epoch": 2385} {"train_loss": -6.2756195068359375, "global_step": 100199, "epoch": 2385} {"train_loss": -6.330300331115723, "global_step": 100200, "epoch": 2385} {"train_loss": -6.320825576782227, "global_step": 100201, "epoch": 2385} {"train_loss": -6.249202251434326, "global_step": 100202, "epoch": 2385} {"train_loss": -6.329190254211426, "global_step": 100203, "epoch": 2385} {"train_loss": -6.298847675323486, "global_step": 100204, "epoch": 2385} {"train_loss": -6.26011848449707, "global_step": 100205, "epoch": 2385} {"train_loss": -6.286893367767334, "global_step": 100206, "epoch": 2385} {"train_loss": -6.289400100708008, "global_step": 100207, "epoch": 2385} {"train_loss": -6.403092384338379, "global_step": 100208, "epoch": 2385} {"train_loss": -6.446538925170898, "global_step": 100209, "epoch": 2385} {"train_loss": -6.290789604187012, "global_step": 100210, "epoch": 2385} {"train_loss": -6.318356650216239, "global_step": 100211, "epoch": 2385, "val_loss": 67977.015625} {"train_loss": -6.339127540588379, "global_step": 100212, "epoch": 2386} {"train_loss": -6.478104591369629, "global_step": 100213, "epoch": 2386} {"train_loss": -6.320456504821777, "global_step": 100214, "epoch": 2386} {"train_loss": -6.360042572021484, "global_step": 100215, "epoch": 2386} {"train_loss": -6.354941368103027, "global_step": 100216, "epoch": 2386} {"train_loss": -6.330013751983643, "global_step": 100217, "epoch": 2386} {"train_loss": -6.398073196411133, "global_step": 100218, "epoch": 2386} {"train_loss": -6.410172462463379, "global_step": 100219, "epoch": 2386} {"train_loss": -6.324285507202148, "global_step": 100220, "epoch": 2386} {"train_loss": -6.235548496246338, "global_step": 100221, "epoch": 2386} {"train_loss": -6.343475341796875, "global_step": 100222, "epoch": 2386} {"train_loss": -6.299903392791748, "global_step": 100223, "epoch": 2386} {"train_loss": -6.475496292114258, "global_step": 100224, "epoch": 2386} {"train_loss": -6.292686462402344, "global_step": 100225, "epoch": 2386} {"train_loss": -6.356232166290283, "global_step": 100226, "epoch": 2386} {"train_loss": -6.331382751464844, "global_step": 100227, "epoch": 2386} {"train_loss": -6.3927412033081055, "global_step": 100228, "epoch": 2386} {"train_loss": -6.371842384338379, "global_step": 100229, "epoch": 2386} {"train_loss": -6.34743595123291, "global_step": 100230, "epoch": 2386} {"train_loss": -6.287702560424805, "global_step": 100231, "epoch": 2386} {"train_loss": -6.377931594848633, "global_step": 100232, "epoch": 2386} {"train_loss": -6.38143253326416, "global_step": 100233, "epoch": 2386} {"train_loss": -6.36421012878418, "global_step": 100234, "epoch": 2386} {"train_loss": -6.3003950119018555, "global_step": 100235, "epoch": 2386} {"train_loss": -6.416631698608398, "global_step": 100236, "epoch": 2386} {"train_loss": -6.306032657623291, "global_step": 100237, "epoch": 2386} {"train_loss": -6.343851566314697, "global_step": 100238, "epoch": 2386} {"train_loss": -6.248687267303467, "global_step": 100239, "epoch": 2386} {"train_loss": -6.044764518737793, "global_step": 100240, "epoch": 2386} {"train_loss": -6.299764633178711, "global_step": 100241, "epoch": 2386} {"train_loss": -6.359185218811035, "global_step": 100242, "epoch": 2386} {"train_loss": -6.194003582000732, "global_step": 100243, "epoch": 2386} {"train_loss": -6.494304656982422, "global_step": 100244, "epoch": 2386} {"train_loss": -6.292074203491211, "global_step": 100245, "epoch": 2386} {"train_loss": -6.323631286621094, "global_step": 100246, "epoch": 2386} {"train_loss": -6.258723258972168, "global_step": 100247, "epoch": 2386} {"train_loss": -6.294816970825195, "global_step": 100248, "epoch": 2386} {"train_loss": -6.347309112548828, "global_step": 100249, "epoch": 2386} {"train_loss": -6.357450008392334, "global_step": 100250, "epoch": 2386} {"train_loss": -6.416531562805176, "global_step": 100251, "epoch": 2386} {"train_loss": -6.332234859466553, "global_step": 100252, "epoch": 2386} {"train_loss": -6.3379544871194025, "global_step": 100253, "epoch": 2386, "val_loss": 68005.96875} {"train_loss": -6.423495292663574, "global_step": 100254, "epoch": 2387} {"train_loss": -6.475720405578613, "global_step": 100255, "epoch": 2387} {"train_loss": -6.399934768676758, "global_step": 100256, "epoch": 2387} {"train_loss": -6.29960298538208, "global_step": 100257, "epoch": 2387} {"train_loss": -6.258153438568115, "global_step": 100258, "epoch": 2387} {"train_loss": -6.358556747436523, "global_step": 100259, "epoch": 2387} {"train_loss": -6.3515472412109375, "global_step": 100260, "epoch": 2387} {"train_loss": -6.395041465759277, "global_step": 100261, "epoch": 2387} {"train_loss": -6.281261920928955, "global_step": 100262, "epoch": 2387} {"train_loss": -6.303448677062988, "global_step": 100263, "epoch": 2387} {"train_loss": -6.378970146179199, "global_step": 100264, "epoch": 2387} {"train_loss": -6.3618621826171875, "global_step": 100265, "epoch": 2387} {"train_loss": -6.343094825744629, "global_step": 100266, "epoch": 2387} {"train_loss": -6.351686954498291, "global_step": 100267, "epoch": 2387} {"train_loss": -6.359879493713379, "global_step": 100268, "epoch": 2387} {"train_loss": -6.288356781005859, "global_step": 100269, "epoch": 2387} {"train_loss": -6.26860237121582, "global_step": 100270, "epoch": 2387} {"train_loss": -6.3114013671875, "global_step": 100271, "epoch": 2387} {"train_loss": -6.385377883911133, "global_step": 100272, "epoch": 2387} {"train_loss": -6.380033493041992, "global_step": 100273, "epoch": 2387} {"train_loss": -6.464789867401123, "global_step": 100274, "epoch": 2387} {"train_loss": -6.320879936218262, "global_step": 100275, "epoch": 2387} {"train_loss": -6.269636631011963, "global_step": 100276, "epoch": 2387} {"train_loss": -6.3532938957214355, "global_step": 100277, "epoch": 2387} {"train_loss": -6.448349952697754, "global_step": 100278, "epoch": 2387} {"train_loss": -6.417500019073486, "global_step": 100279, "epoch": 2387} {"train_loss": -6.363391876220703, "global_step": 100280, "epoch": 2387} {"train_loss": -6.34318733215332, "global_step": 100281, "epoch": 2387} {"train_loss": -6.224638938903809, "global_step": 100282, "epoch": 2387} {"train_loss": -6.384861946105957, "global_step": 100283, "epoch": 2387} {"train_loss": -6.255300521850586, "global_step": 100284, "epoch": 2387} {"train_loss": -6.530111312866211, "global_step": 100285, "epoch": 2387} {"train_loss": -6.359277248382568, "global_step": 100286, "epoch": 2387} {"train_loss": -6.367873191833496, "global_step": 100287, "epoch": 2387} {"train_loss": -6.35081672668457, "global_step": 100288, "epoch": 2387} {"train_loss": -6.405858993530273, "global_step": 100289, "epoch": 2387} {"train_loss": -6.308110237121582, "global_step": 100290, "epoch": 2387} {"train_loss": -6.357895851135254, "global_step": 100291, "epoch": 2387} {"train_loss": -6.410602569580078, "global_step": 100292, "epoch": 2387} {"train_loss": -6.2507452964782715, "global_step": 100293, "epoch": 2387} {"train_loss": -6.3952436447143555, "global_step": 100294, "epoch": 2387} {"train_loss": -6.35429767199925, "global_step": 100295, "epoch": 2387, "val_loss": 68063.140625} {"train_loss": -6.378823757171631, "global_step": 100296, "epoch": 2388} {"train_loss": -6.280535697937012, "global_step": 100297, "epoch": 2388} {"train_loss": -6.313630104064941, "global_step": 100298, "epoch": 2388} {"train_loss": -6.352952003479004, "global_step": 100299, "epoch": 2388} {"train_loss": -6.37192440032959, "global_step": 100300, "epoch": 2388} {"train_loss": -6.350467681884766, "global_step": 100301, "epoch": 2388} {"train_loss": -6.363267421722412, "global_step": 100302, "epoch": 2388} {"train_loss": -6.3107500076293945, "global_step": 100303, "epoch": 2388} {"train_loss": -6.210203170776367, "global_step": 100304, "epoch": 2388} {"train_loss": -6.244935035705566, "global_step": 100305, "epoch": 2388} {"train_loss": -6.458695411682129, "global_step": 100306, "epoch": 2388} {"train_loss": -6.276294231414795, "global_step": 100307, "epoch": 2388} {"train_loss": -6.47149658203125, "global_step": 100308, "epoch": 2388} {"train_loss": -6.392402648925781, "global_step": 100309, "epoch": 2388} {"train_loss": -6.179018020629883, "global_step": 100310, "epoch": 2388} {"train_loss": -6.437921524047852, "global_step": 100311, "epoch": 2388} {"train_loss": -6.315408229827881, "global_step": 100312, "epoch": 2388} {"train_loss": -6.353122711181641, "global_step": 100313, "epoch": 2388} {"train_loss": -6.2923359870910645, "global_step": 100314, "epoch": 2388} {"train_loss": -6.334323883056641, "global_step": 100315, "epoch": 2388} {"train_loss": -6.290705680847168, "global_step": 100316, "epoch": 2388} {"train_loss": -6.335260391235352, "global_step": 100317, "epoch": 2388} {"train_loss": -6.37990140914917, "global_step": 100318, "epoch": 2388} {"train_loss": -6.426571369171143, "global_step": 100319, "epoch": 2388} {"train_loss": -6.313767433166504, "global_step": 100320, "epoch": 2388} {"train_loss": -6.397240161895752, "global_step": 100321, "epoch": 2388} {"train_loss": -6.315927505493164, "global_step": 100322, "epoch": 2388} {"train_loss": -6.297719955444336, "global_step": 100323, "epoch": 2388} {"train_loss": -6.510229110717773, "global_step": 100324, "epoch": 2388} {"train_loss": -6.365140914916992, "global_step": 100325, "epoch": 2388} {"train_loss": -6.222166538238525, "global_step": 100326, "epoch": 2388} {"train_loss": -6.306232452392578, "global_step": 100327, "epoch": 2388} {"train_loss": -6.453258991241455, "global_step": 100328, "epoch": 2388} {"train_loss": -6.3385443687438965, "global_step": 100329, "epoch": 2388} {"train_loss": -6.310253143310547, "global_step": 100330, "epoch": 2388} {"train_loss": -6.331644058227539, "global_step": 100331, "epoch": 2388} {"train_loss": -6.472052574157715, "global_step": 100332, "epoch": 2388} {"train_loss": -6.226106643676758, "global_step": 100333, "epoch": 2388} {"train_loss": -6.205469608306885, "global_step": 100334, "epoch": 2388} {"train_loss": -6.410633087158203, "global_step": 100335, "epoch": 2388} {"train_loss": -6.2751264572143555, "global_step": 100336, "epoch": 2388} {"train_loss": -6.335771765027728, "global_step": 100337, "epoch": 2388, "val_loss": 67865.2890625} {"train_loss": -6.277636528015137, "global_step": 100338, "epoch": 2389} {"train_loss": -6.429318428039551, "global_step": 100339, "epoch": 2389} {"train_loss": -6.331052780151367, "global_step": 100340, "epoch": 2389} {"train_loss": -6.308158874511719, "global_step": 100341, "epoch": 2389} {"train_loss": -6.3193864822387695, "global_step": 100342, "epoch": 2389} {"train_loss": -6.341061592102051, "global_step": 100343, "epoch": 2389} {"train_loss": -6.371880531311035, "global_step": 100344, "epoch": 2389} {"train_loss": -6.235313415527344, "global_step": 100345, "epoch": 2389} {"train_loss": -6.27840518951416, "global_step": 100346, "epoch": 2389} {"train_loss": -6.346355438232422, "global_step": 100347, "epoch": 2389} {"train_loss": -6.220925331115723, "global_step": 100348, "epoch": 2389} {"train_loss": -6.2402424812316895, "global_step": 100349, "epoch": 2389} {"train_loss": -6.38832950592041, "global_step": 100350, "epoch": 2389} {"train_loss": -6.316313743591309, "global_step": 100351, "epoch": 2389} {"train_loss": -6.400003910064697, "global_step": 100352, "epoch": 2389} {"train_loss": -6.242940902709961, "global_step": 100353, "epoch": 2389} {"train_loss": -6.258925914764404, "global_step": 100354, "epoch": 2389} {"train_loss": -6.259972095489502, "global_step": 100355, "epoch": 2389} {"train_loss": -6.274002552032471, "global_step": 100356, "epoch": 2389} {"train_loss": -6.311652183532715, "global_step": 100357, "epoch": 2389} {"train_loss": -6.1085968017578125, "global_step": 100358, "epoch": 2389} {"train_loss": -6.319916248321533, "global_step": 100359, "epoch": 2389} {"train_loss": -6.364382266998291, "global_step": 100360, "epoch": 2389} {"train_loss": -6.3285813331604, "global_step": 100361, "epoch": 2389} {"train_loss": -6.271655559539795, "global_step": 100362, "epoch": 2389} {"train_loss": -6.275457382202148, "global_step": 100363, "epoch": 2389} {"train_loss": -6.299660682678223, "global_step": 100364, "epoch": 2389} {"train_loss": -6.337376594543457, "global_step": 100365, "epoch": 2389} {"train_loss": -6.31846809387207, "global_step": 100366, "epoch": 2389} {"train_loss": -6.29749870300293, "global_step": 100367, "epoch": 2389} {"train_loss": -6.315796375274658, "global_step": 100368, "epoch": 2389} {"train_loss": -6.374221324920654, "global_step": 100369, "epoch": 2389} {"train_loss": -6.2175822257995605, "global_step": 100370, "epoch": 2389} {"train_loss": -6.299069404602051, "global_step": 100371, "epoch": 2389} {"train_loss": -6.267627716064453, "global_step": 100372, "epoch": 2389} {"train_loss": -6.276843547821045, "global_step": 100373, "epoch": 2389} {"train_loss": -6.2970781326293945, "global_step": 100374, "epoch": 2389} {"train_loss": -6.341790199279785, "global_step": 100375, "epoch": 2389} {"train_loss": -6.294902324676514, "global_step": 100376, "epoch": 2389} {"train_loss": -6.320829391479492, "global_step": 100377, "epoch": 2389} {"train_loss": -6.311748504638672, "global_step": 100378, "epoch": 2389} {"train_loss": -6.30162254969279, "global_step": 100379, "epoch": 2389, "val_loss": 68159.0859375} {"train_loss": -6.283544540405273, "global_step": 100380, "epoch": 2390} {"train_loss": -6.422846794128418, "global_step": 100381, "epoch": 2390} {"train_loss": -6.225360870361328, "global_step": 100382, "epoch": 2390} {"train_loss": -6.160303115844727, "global_step": 100383, "epoch": 2390} {"train_loss": -6.372068405151367, "global_step": 100384, "epoch": 2390} {"train_loss": -6.4277801513671875, "global_step": 100385, "epoch": 2390} {"train_loss": -6.335547924041748, "global_step": 100386, "epoch": 2390} {"train_loss": -6.348323822021484, "global_step": 100387, "epoch": 2390} {"train_loss": -6.286555290222168, "global_step": 100388, "epoch": 2390} {"train_loss": -6.297118663787842, "global_step": 100389, "epoch": 2390} {"train_loss": -6.273229598999023, "global_step": 100390, "epoch": 2390} {"train_loss": -6.352663040161133, "global_step": 100391, "epoch": 2390} {"train_loss": -6.336075782775879, "global_step": 100392, "epoch": 2390} {"train_loss": -6.35929012298584, "global_step": 100393, "epoch": 2390} {"train_loss": -6.275692462921143, "global_step": 100394, "epoch": 2390} {"train_loss": -6.4794921875, "global_step": 100395, "epoch": 2390} {"train_loss": -6.2553181648254395, "global_step": 100396, "epoch": 2390} {"train_loss": -6.333791732788086, "global_step": 100397, "epoch": 2390} {"train_loss": -6.295529842376709, "global_step": 100398, "epoch": 2390} {"train_loss": -6.245416641235352, "global_step": 100399, "epoch": 2390} {"train_loss": -6.343367576599121, "global_step": 100400, "epoch": 2390} {"train_loss": -6.401300430297852, "global_step": 100401, "epoch": 2390} {"train_loss": -6.282104015350342, "global_step": 100402, "epoch": 2390} {"train_loss": -6.311007499694824, "global_step": 100403, "epoch": 2390} {"train_loss": -6.3770551681518555, "global_step": 100404, "epoch": 2390} {"train_loss": -6.270912170410156, "global_step": 100405, "epoch": 2390} {"train_loss": -6.348594665527344, "global_step": 100406, "epoch": 2390} {"train_loss": -6.404681205749512, "global_step": 100407, "epoch": 2390} {"train_loss": -6.403043746948242, "global_step": 100408, "epoch": 2390} {"train_loss": -6.481476783752441, "global_step": 100409, "epoch": 2390} {"train_loss": -6.4109601974487305, "global_step": 100410, "epoch": 2390} {"train_loss": -6.413609981536865, "global_step": 100411, "epoch": 2390} {"train_loss": -6.260739326477051, "global_step": 100412, "epoch": 2390} {"train_loss": -6.29990816116333, "global_step": 100413, "epoch": 2390} {"train_loss": -6.374427318572998, "global_step": 100414, "epoch": 2390} {"train_loss": -6.2736897468566895, "global_step": 100415, "epoch": 2390} {"train_loss": -6.35152530670166, "global_step": 100416, "epoch": 2390} {"train_loss": -6.481107234954834, "global_step": 100417, "epoch": 2390} {"train_loss": -6.393831729888916, "global_step": 100418, "epoch": 2390} {"train_loss": -6.319118499755859, "global_step": 100419, "epoch": 2390} {"train_loss": -6.43305778503418, "global_step": 100420, "epoch": 2390} {"train_loss": -6.339392571222215, "global_step": 100421, "epoch": 2390, "val_loss": 68020.8125} {"train_loss": -6.4010491371154785, "global_step": 100422, "epoch": 2391} {"train_loss": -6.436995029449463, "global_step": 100423, "epoch": 2391} {"train_loss": -6.3245768547058105, "global_step": 100424, "epoch": 2391} {"train_loss": -6.281358242034912, "global_step": 100425, "epoch": 2391} {"train_loss": -6.376832962036133, "global_step": 100426, "epoch": 2391} {"train_loss": -6.347769737243652, "global_step": 100427, "epoch": 2391} {"train_loss": -6.421240329742432, "global_step": 100428, "epoch": 2391} {"train_loss": -6.324435234069824, "global_step": 100429, "epoch": 2391} {"train_loss": -6.345384120941162, "global_step": 100430, "epoch": 2391} {"train_loss": -6.300473213195801, "global_step": 100431, "epoch": 2391} {"train_loss": -6.4000749588012695, "global_step": 100432, "epoch": 2391} {"train_loss": -6.528103828430176, "global_step": 100433, "epoch": 2391} {"train_loss": -6.394064903259277, "global_step": 100434, "epoch": 2391} {"train_loss": -6.322223663330078, "global_step": 100435, "epoch": 2391} {"train_loss": -6.276812553405762, "global_step": 100436, "epoch": 2391} {"train_loss": -6.219829559326172, "global_step": 100437, "epoch": 2391} {"train_loss": -6.360774517059326, "global_step": 100438, "epoch": 2391} {"train_loss": -6.358043670654297, "global_step": 100439, "epoch": 2391} {"train_loss": -6.228112697601318, "global_step": 100440, "epoch": 2391} {"train_loss": -6.258092403411865, "global_step": 100441, "epoch": 2391} {"train_loss": -6.282443046569824, "global_step": 100442, "epoch": 2391} {"train_loss": -6.294578552246094, "global_step": 100443, "epoch": 2391} {"train_loss": -6.366814613342285, "global_step": 100444, "epoch": 2391} {"train_loss": -6.2118377685546875, "global_step": 100445, "epoch": 2391} {"train_loss": -6.362780570983887, "global_step": 100446, "epoch": 2391} {"train_loss": -6.352628707885742, "global_step": 100447, "epoch": 2391} {"train_loss": -6.35446310043335, "global_step": 100448, "epoch": 2391} {"train_loss": -6.4821624755859375, "global_step": 100449, "epoch": 2391} {"train_loss": -6.246751308441162, "global_step": 100450, "epoch": 2391} {"train_loss": -6.218925476074219, "global_step": 100451, "epoch": 2391} {"train_loss": -6.276144027709961, "global_step": 100452, "epoch": 2391} {"train_loss": -6.29502534866333, "global_step": 100453, "epoch": 2391} {"train_loss": -6.264135360717773, "global_step": 100454, "epoch": 2391} {"train_loss": -6.359811782836914, "global_step": 100455, "epoch": 2391} {"train_loss": -6.342052936553955, "global_step": 100456, "epoch": 2391} {"train_loss": -6.449506759643555, "global_step": 100457, "epoch": 2391} {"train_loss": -6.340404510498047, "global_step": 100458, "epoch": 2391} {"train_loss": -6.2180633544921875, "global_step": 100459, "epoch": 2391} {"train_loss": -6.294183254241943, "global_step": 100460, "epoch": 2391} {"train_loss": -6.332499980926514, "global_step": 100461, "epoch": 2391} {"train_loss": -6.369499683380127, "global_step": 100462, "epoch": 2391} {"train_loss": -6.330807640438988, "global_step": 100463, "epoch": 2391, "val_loss": 67904.0546875} {"train_loss": -6.468717098236084, "global_step": 100464, "epoch": 2392} {"train_loss": -6.337729454040527, "global_step": 100465, "epoch": 2392} {"train_loss": -6.334572792053223, "global_step": 100466, "epoch": 2392} {"train_loss": -6.408506393432617, "global_step": 100467, "epoch": 2392} {"train_loss": -6.38740348815918, "global_step": 100468, "epoch": 2392} {"train_loss": -6.3948798179626465, "global_step": 100469, "epoch": 2392} {"train_loss": -6.412233829498291, "global_step": 100470, "epoch": 2392} {"train_loss": -6.408341407775879, "global_step": 100471, "epoch": 2392} {"train_loss": -6.3604736328125, "global_step": 100472, "epoch": 2392} {"train_loss": -6.38319730758667, "global_step": 100473, "epoch": 2392} {"train_loss": -6.427013397216797, "global_step": 100474, "epoch": 2392} {"train_loss": -6.456574440002441, "global_step": 100475, "epoch": 2392} {"train_loss": -6.396458625793457, "global_step": 100476, "epoch": 2392} {"train_loss": -6.31367826461792, "global_step": 100477, "epoch": 2392} {"train_loss": -6.371437072753906, "global_step": 100478, "epoch": 2392} {"train_loss": -6.460605621337891, "global_step": 100479, "epoch": 2392} {"train_loss": -6.41208028793335, "global_step": 100480, "epoch": 2392} {"train_loss": -6.383315086364746, "global_step": 100481, "epoch": 2392} {"train_loss": -6.353123188018799, "global_step": 100482, "epoch": 2392} {"train_loss": -6.3410844802856445, "global_step": 100483, "epoch": 2392} {"train_loss": -6.324031829833984, "global_step": 100484, "epoch": 2392} {"train_loss": -6.3096842765808105, "global_step": 100485, "epoch": 2392} {"train_loss": -6.310516357421875, "global_step": 100486, "epoch": 2392} {"train_loss": -6.309561729431152, "global_step": 100487, "epoch": 2392} {"train_loss": -6.253576278686523, "global_step": 100488, "epoch": 2392} {"train_loss": -6.420435905456543, "global_step": 100489, "epoch": 2392} {"train_loss": -6.312837600708008, "global_step": 100490, "epoch": 2392} {"train_loss": -6.34244966506958, "global_step": 100491, "epoch": 2392} {"train_loss": -6.370815277099609, "global_step": 100492, "epoch": 2392} {"train_loss": -6.27668571472168, "global_step": 100493, "epoch": 2392} {"train_loss": -6.261016845703125, "global_step": 100494, "epoch": 2392} {"train_loss": -6.444923400878906, "global_step": 100495, "epoch": 2392} {"train_loss": -6.3300323486328125, "global_step": 100496, "epoch": 2392} {"train_loss": -6.324749946594238, "global_step": 100497, "epoch": 2392} {"train_loss": -6.33115291595459, "global_step": 100498, "epoch": 2392} {"train_loss": -6.358193874359131, "global_step": 100499, "epoch": 2392} {"train_loss": -6.332736015319824, "global_step": 100500, "epoch": 2392} {"train_loss": -6.428253650665283, "global_step": 100501, "epoch": 2392} {"train_loss": -6.371992588043213, "global_step": 100502, "epoch": 2392} {"train_loss": -6.357367515563965, "global_step": 100503, "epoch": 2392} {"train_loss": -6.357276439666748, "global_step": 100504, "epoch": 2392} {"train_loss": -6.365614993231637, "global_step": 100505, "epoch": 2392, "val_loss": 68020.4140625} {"train_loss": -6.374052047729492, "global_step": 100506, "epoch": 2393} {"train_loss": -6.44828987121582, "global_step": 100507, "epoch": 2393} {"train_loss": -6.339795112609863, "global_step": 100508, "epoch": 2393} {"train_loss": -6.319733619689941, "global_step": 100509, "epoch": 2393} {"train_loss": -6.396448135375977, "global_step": 100510, "epoch": 2393} {"train_loss": -6.246110916137695, "global_step": 100511, "epoch": 2393} {"train_loss": -6.355948448181152, "global_step": 100512, "epoch": 2393} {"train_loss": -6.368608474731445, "global_step": 100513, "epoch": 2393} {"train_loss": -6.342153549194336, "global_step": 100514, "epoch": 2393} {"train_loss": -6.396571159362793, "global_step": 100515, "epoch": 2393} {"train_loss": -6.298083305358887, "global_step": 100516, "epoch": 2393} {"train_loss": -6.35723352432251, "global_step": 100517, "epoch": 2393} {"train_loss": -6.411087989807129, "global_step": 100518, "epoch": 2393} {"train_loss": -6.347599029541016, "global_step": 100519, "epoch": 2393} {"train_loss": -6.373044013977051, "global_step": 100520, "epoch": 2393} {"train_loss": -6.380764007568359, "global_step": 100521, "epoch": 2393} {"train_loss": -6.211740493774414, "global_step": 100522, "epoch": 2393} {"train_loss": -6.272821426391602, "global_step": 100523, "epoch": 2393} {"train_loss": -6.33017110824585, "global_step": 100524, "epoch": 2393} {"train_loss": -6.27680778503418, "global_step": 100525, "epoch": 2393} {"train_loss": -6.396283149719238, "global_step": 100526, "epoch": 2393} {"train_loss": -6.390686988830566, "global_step": 100527, "epoch": 2393} {"train_loss": -6.343735218048096, "global_step": 100528, "epoch": 2393} {"train_loss": -6.376760482788086, "global_step": 100529, "epoch": 2393} {"train_loss": -6.301843166351318, "global_step": 100530, "epoch": 2393} {"train_loss": -6.3505048751831055, "global_step": 100531, "epoch": 2393} {"train_loss": -6.4077348709106445, "global_step": 100532, "epoch": 2393} {"train_loss": -6.298980712890625, "global_step": 100533, "epoch": 2393} {"train_loss": -6.3241729736328125, "global_step": 100534, "epoch": 2393} {"train_loss": -6.382824420928955, "global_step": 100535, "epoch": 2393} {"train_loss": -6.280124187469482, "global_step": 100536, "epoch": 2393} {"train_loss": -6.3604416847229, "global_step": 100537, "epoch": 2393} {"train_loss": -6.368688106536865, "global_step": 100538, "epoch": 2393} {"train_loss": -6.277329444885254, "global_step": 100539, "epoch": 2393} {"train_loss": -6.243443012237549, "global_step": 100540, "epoch": 2393} {"train_loss": -6.420042514801025, "global_step": 100541, "epoch": 2393} {"train_loss": -6.26439094543457, "global_step": 100542, "epoch": 2393} {"train_loss": -6.376620769500732, "global_step": 100543, "epoch": 2393} {"train_loss": -6.426044940948486, "global_step": 100544, "epoch": 2393} {"train_loss": -6.30867862701416, "global_step": 100545, "epoch": 2393} {"train_loss": -6.389928340911865, "global_step": 100546, "epoch": 2393} {"train_loss": -6.344424327214559, "global_step": 100547, "epoch": 2393, "val_loss": 67968.4140625} {"train_loss": -6.275578498840332, "global_step": 100548, "epoch": 2394} {"train_loss": -6.29318904876709, "global_step": 100549, "epoch": 2394} {"train_loss": -6.396452903747559, "global_step": 100550, "epoch": 2394} {"train_loss": -6.321967124938965, "global_step": 100551, "epoch": 2394} {"train_loss": -6.300695419311523, "global_step": 100552, "epoch": 2394} {"train_loss": -6.344679832458496, "global_step": 100553, "epoch": 2394} {"train_loss": -6.4177961349487305, "global_step": 100554, "epoch": 2394} {"train_loss": -6.312029838562012, "global_step": 100555, "epoch": 2394} {"train_loss": -6.421265602111816, "global_step": 100556, "epoch": 2394} {"train_loss": -6.273252964019775, "global_step": 100557, "epoch": 2394} {"train_loss": -6.276866436004639, "global_step": 100558, "epoch": 2394} {"train_loss": -6.399141311645508, "global_step": 100559, "epoch": 2394} {"train_loss": -6.354620933532715, "global_step": 100560, "epoch": 2394} {"train_loss": -6.442018508911133, "global_step": 100561, "epoch": 2394} {"train_loss": -6.325011730194092, "global_step": 100562, "epoch": 2394} {"train_loss": -6.358745574951172, "global_step": 100563, "epoch": 2394} {"train_loss": -6.35991907119751, "global_step": 100564, "epoch": 2394} {"train_loss": -6.370151042938232, "global_step": 100565, "epoch": 2394} {"train_loss": -6.463326930999756, "global_step": 100566, "epoch": 2394} {"train_loss": -6.393930912017822, "global_step": 100567, "epoch": 2394} {"train_loss": -6.379367351531982, "global_step": 100568, "epoch": 2394} {"train_loss": -6.3514509201049805, "global_step": 100569, "epoch": 2394} {"train_loss": -6.434839248657227, "global_step": 100570, "epoch": 2394} {"train_loss": -6.415078163146973, "global_step": 100571, "epoch": 2394} {"train_loss": -6.374640464782715, "global_step": 100572, "epoch": 2394} {"train_loss": -6.295340538024902, "global_step": 100573, "epoch": 2394} {"train_loss": -6.2949981689453125, "global_step": 100574, "epoch": 2394} {"train_loss": -6.435133934020996, "global_step": 100575, "epoch": 2394} {"train_loss": -6.3118696212768555, "global_step": 100576, "epoch": 2394} {"train_loss": -6.353481292724609, "global_step": 100577, "epoch": 2394} {"train_loss": -6.280118942260742, "global_step": 100578, "epoch": 2394} {"train_loss": -6.394346714019775, "global_step": 100579, "epoch": 2394} {"train_loss": -6.33505916595459, "global_step": 100580, "epoch": 2394} {"train_loss": -6.263694763183594, "global_step": 100581, "epoch": 2394} {"train_loss": -6.275205612182617, "global_step": 100582, "epoch": 2394} {"train_loss": -6.33074951171875, "global_step": 100583, "epoch": 2394} {"train_loss": -6.2802910804748535, "global_step": 100584, "epoch": 2394} {"train_loss": -6.402565002441406, "global_step": 100585, "epoch": 2394} {"train_loss": -6.256269454956055, "global_step": 100586, "epoch": 2394} {"train_loss": -6.366452693939209, "global_step": 100587, "epoch": 2394} {"train_loss": -6.398555755615234, "global_step": 100588, "epoch": 2394} {"train_loss": -6.347478151321411, "global_step": 100589, "epoch": 2394, "val_loss": 68331.7578125} {"train_loss": -6.301361083984375, "global_step": 100590, "epoch": 2395} {"train_loss": -6.323145389556885, "global_step": 100591, "epoch": 2395} {"train_loss": -6.186234951019287, "global_step": 100592, "epoch": 2395} {"train_loss": -6.391835689544678, "global_step": 100593, "epoch": 2395} {"train_loss": -6.279817581176758, "global_step": 100594, "epoch": 2395} {"train_loss": -6.355229377746582, "global_step": 100595, "epoch": 2395} {"train_loss": -6.304767608642578, "global_step": 100596, "epoch": 2395} {"train_loss": -6.37984561920166, "global_step": 100597, "epoch": 2395} {"train_loss": -6.39683723449707, "global_step": 100598, "epoch": 2395} {"train_loss": -6.299220085144043, "global_step": 100599, "epoch": 2395} {"train_loss": -6.340933322906494, "global_step": 100600, "epoch": 2395} {"train_loss": -6.289637565612793, "global_step": 100601, "epoch": 2395} {"train_loss": -6.320032119750977, "global_step": 100602, "epoch": 2395} {"train_loss": -6.436547756195068, "global_step": 100603, "epoch": 2395} {"train_loss": -6.414292335510254, "global_step": 100604, "epoch": 2395} {"train_loss": -6.447943687438965, "global_step": 100605, "epoch": 2395} {"train_loss": -6.398048400878906, "global_step": 100606, "epoch": 2395} {"train_loss": -6.365700721740723, "global_step": 100607, "epoch": 2395} {"train_loss": -6.3572492599487305, "global_step": 100608, "epoch": 2395} {"train_loss": -6.371756553649902, "global_step": 100609, "epoch": 2395} {"train_loss": -6.378182411193848, "global_step": 100610, "epoch": 2395} {"train_loss": -6.233745574951172, "global_step": 100611, "epoch": 2395} {"train_loss": -6.400489807128906, "global_step": 100612, "epoch": 2395} {"train_loss": -6.429091453552246, "global_step": 100613, "epoch": 2395} {"train_loss": -6.369386672973633, "global_step": 100614, "epoch": 2395} {"train_loss": -6.371458530426025, "global_step": 100615, "epoch": 2395} {"train_loss": -6.345677852630615, "global_step": 100616, "epoch": 2395} {"train_loss": -6.34146785736084, "global_step": 100617, "epoch": 2395} {"train_loss": -6.287688732147217, "global_step": 100618, "epoch": 2395} {"train_loss": -6.354084014892578, "global_step": 100619, "epoch": 2395} {"train_loss": -6.3226118087768555, "global_step": 100620, "epoch": 2395} {"train_loss": -6.431268215179443, "global_step": 100621, "epoch": 2395} {"train_loss": -6.451329231262207, "global_step": 100622, "epoch": 2395} {"train_loss": -6.467040538787842, "global_step": 100623, "epoch": 2395} {"train_loss": -6.378836154937744, "global_step": 100624, "epoch": 2395} {"train_loss": -6.335330486297607, "global_step": 100625, "epoch": 2395} {"train_loss": -6.3662919998168945, "global_step": 100626, "epoch": 2395} {"train_loss": -6.388875961303711, "global_step": 100627, "epoch": 2395} {"train_loss": -6.298576354980469, "global_step": 100628, "epoch": 2395} {"train_loss": -6.32032585144043, "global_step": 100629, "epoch": 2395} {"train_loss": -6.376047611236572, "global_step": 100630, "epoch": 2395} {"train_loss": -6.354884193057106, "global_step": 100631, "epoch": 2395, "val_loss": 68035.953125} {"train_loss": -6.2087812423706055, "global_step": 100632, "epoch": 2396} {"train_loss": -6.250180244445801, "global_step": 100633, "epoch": 2396} {"train_loss": -6.470973014831543, "global_step": 100634, "epoch": 2396} {"train_loss": -6.313714981079102, "global_step": 100635, "epoch": 2396} {"train_loss": -6.364828109741211, "global_step": 100636, "epoch": 2396} {"train_loss": -6.376213550567627, "global_step": 100637, "epoch": 2396} {"train_loss": -6.382996559143066, "global_step": 100638, "epoch": 2396} {"train_loss": -6.318559646606445, "global_step": 100639, "epoch": 2396} {"train_loss": -6.34037446975708, "global_step": 100640, "epoch": 2396} {"train_loss": -6.364931106567383, "global_step": 100641, "epoch": 2396} {"train_loss": -6.370326995849609, "global_step": 100642, "epoch": 2396} {"train_loss": -6.276965141296387, "global_step": 100643, "epoch": 2396} {"train_loss": -6.408669471740723, "global_step": 100644, "epoch": 2396} {"train_loss": -6.464564800262451, "global_step": 100645, "epoch": 2396} {"train_loss": -6.339168071746826, "global_step": 100646, "epoch": 2396} {"train_loss": -6.301980018615723, "global_step": 100647, "epoch": 2396} {"train_loss": -6.380022048950195, "global_step": 100648, "epoch": 2396} {"train_loss": -6.349551200866699, "global_step": 100649, "epoch": 2396} {"train_loss": -6.324240684509277, "global_step": 100650, "epoch": 2396} {"train_loss": -6.422708034515381, "global_step": 100651, "epoch": 2396} {"train_loss": -6.421815872192383, "global_step": 100652, "epoch": 2396} {"train_loss": -6.388025283813477, "global_step": 100653, "epoch": 2396} {"train_loss": -6.3519744873046875, "global_step": 100654, "epoch": 2396} {"train_loss": -6.501436233520508, "global_step": 100655, "epoch": 2396} {"train_loss": -6.2339558601379395, "global_step": 100656, "epoch": 2396} {"train_loss": -6.398836612701416, "global_step": 100657, "epoch": 2396} {"train_loss": -6.369915962219238, "global_step": 100658, "epoch": 2396} {"train_loss": -6.490852355957031, "global_step": 100659, "epoch": 2396} {"train_loss": -6.378290176391602, "global_step": 100660, "epoch": 2396} {"train_loss": -6.325344085693359, "global_step": 100661, "epoch": 2396} {"train_loss": -6.330702304840088, "global_step": 100662, "epoch": 2396} {"train_loss": -6.386568069458008, "global_step": 100663, "epoch": 2396} {"train_loss": -6.199763774871826, "global_step": 100664, "epoch": 2396} {"train_loss": -6.4566168785095215, "global_step": 100665, "epoch": 2396} {"train_loss": -6.401087284088135, "global_step": 100666, "epoch": 2396} {"train_loss": -6.249843120574951, "global_step": 100667, "epoch": 2396} {"train_loss": -6.324965476989746, "global_step": 100668, "epoch": 2396} {"train_loss": -6.361286163330078, "global_step": 100669, "epoch": 2396} {"train_loss": -6.3786492347717285, "global_step": 100670, "epoch": 2396} {"train_loss": -6.382465362548828, "global_step": 100671, "epoch": 2396} {"train_loss": -6.471151828765869, "global_step": 100672, "epoch": 2396} {"train_loss": -6.359659580957322, "global_step": 100673, "epoch": 2396, "val_loss": 67835.5078125} {"train_loss": -6.378996849060059, "global_step": 100674, "epoch": 2397} {"train_loss": -6.292580604553223, "global_step": 100675, "epoch": 2397} {"train_loss": -6.484137535095215, "global_step": 100676, "epoch": 2397} {"train_loss": -6.415182113647461, "global_step": 100677, "epoch": 2397} {"train_loss": -6.420228004455566, "global_step": 100678, "epoch": 2397} {"train_loss": -6.406735897064209, "global_step": 100679, "epoch": 2397} {"train_loss": -6.244931221008301, "global_step": 100680, "epoch": 2397} {"train_loss": -6.373906135559082, "global_step": 100681, "epoch": 2397} {"train_loss": -6.386940956115723, "global_step": 100682, "epoch": 2397} {"train_loss": -6.192485332489014, "global_step": 100683, "epoch": 2397} {"train_loss": -6.26400089263916, "global_step": 100684, "epoch": 2397} {"train_loss": -6.3432159423828125, "global_step": 100685, "epoch": 2397} {"train_loss": -6.295162200927734, "global_step": 100686, "epoch": 2397} {"train_loss": -6.384876251220703, "global_step": 100687, "epoch": 2397} {"train_loss": -6.270528316497803, "global_step": 100688, "epoch": 2397} {"train_loss": -6.354860305786133, "global_step": 100689, "epoch": 2397} {"train_loss": -6.332064628601074, "global_step": 100690, "epoch": 2397} {"train_loss": -6.466264724731445, "global_step": 100691, "epoch": 2397} {"train_loss": -6.331883907318115, "global_step": 100692, "epoch": 2397} {"train_loss": -6.368661403656006, "global_step": 100693, "epoch": 2397} {"train_loss": -6.213126182556152, "global_step": 100694, "epoch": 2397} {"train_loss": -6.284173011779785, "global_step": 100695, "epoch": 2397} {"train_loss": -6.327866554260254, "global_step": 100696, "epoch": 2397} {"train_loss": -6.307183265686035, "global_step": 100697, "epoch": 2397} {"train_loss": -6.391966819763184, "global_step": 100698, "epoch": 2397} {"train_loss": -6.220790863037109, "global_step": 100699, "epoch": 2397} {"train_loss": -6.331986427307129, "global_step": 100700, "epoch": 2397} {"train_loss": -6.324911594390869, "global_step": 100701, "epoch": 2397} {"train_loss": -6.295246124267578, "global_step": 100702, "epoch": 2397} {"train_loss": -6.4727783203125, "global_step": 100703, "epoch": 2397} {"train_loss": -6.288066864013672, "global_step": 100704, "epoch": 2397} {"train_loss": -6.318428039550781, "global_step": 100705, "epoch": 2397} {"train_loss": -6.3321685791015625, "global_step": 100706, "epoch": 2397} {"train_loss": -6.279940128326416, "global_step": 100707, "epoch": 2397} {"train_loss": -6.3629655838012695, "global_step": 100708, "epoch": 2397} {"train_loss": -6.338372230529785, "global_step": 100709, "epoch": 2397} {"train_loss": -6.377659797668457, "global_step": 100710, "epoch": 2397} {"train_loss": -6.274996280670166, "global_step": 100711, "epoch": 2397} {"train_loss": -6.40178108215332, "global_step": 100712, "epoch": 2397} {"train_loss": -6.310900688171387, "global_step": 100713, "epoch": 2397} {"train_loss": -6.316616058349609, "global_step": 100714, "epoch": 2397} {"train_loss": -6.335411412375314, "global_step": 100715, "epoch": 2397, "val_loss": 67793.90625} {"train_loss": -6.34830379486084, "global_step": 100716, "epoch": 2398} {"train_loss": -6.416950225830078, "global_step": 100717, "epoch": 2398} {"train_loss": -6.409926414489746, "global_step": 100718, "epoch": 2398} {"train_loss": -6.263392448425293, "global_step": 100719, "epoch": 2398} {"train_loss": -6.423315525054932, "global_step": 100720, "epoch": 2398} {"train_loss": -6.435892581939697, "global_step": 100721, "epoch": 2398} {"train_loss": -6.259697437286377, "global_step": 100722, "epoch": 2398} {"train_loss": -6.32711935043335, "global_step": 100723, "epoch": 2398} {"train_loss": -6.27479887008667, "global_step": 100724, "epoch": 2398} {"train_loss": -6.299211502075195, "global_step": 100725, "epoch": 2398} {"train_loss": -6.497398376464844, "global_step": 100726, "epoch": 2398} {"train_loss": -6.316686630249023, "global_step": 100727, "epoch": 2398} {"train_loss": -6.3579206466674805, "global_step": 100728, "epoch": 2398} {"train_loss": -6.359769821166992, "global_step": 100729, "epoch": 2398} {"train_loss": -6.311070442199707, "global_step": 100730, "epoch": 2398} {"train_loss": -6.416627407073975, "global_step": 100731, "epoch": 2398} {"train_loss": -6.16337251663208, "global_step": 100732, "epoch": 2398} {"train_loss": -6.120204448699951, "global_step": 100733, "epoch": 2398} {"train_loss": -6.493451118469238, "global_step": 100734, "epoch": 2398} {"train_loss": -6.324419021606445, "global_step": 100735, "epoch": 2398} {"train_loss": -6.175966262817383, "global_step": 100736, "epoch": 2398} {"train_loss": -6.360732078552246, "global_step": 100737, "epoch": 2398} {"train_loss": -6.203887462615967, "global_step": 100738, "epoch": 2398} {"train_loss": -6.162558078765869, "global_step": 100739, "epoch": 2398} {"train_loss": -6.258195877075195, "global_step": 100740, "epoch": 2398} {"train_loss": -6.212284564971924, "global_step": 100741, "epoch": 2398} {"train_loss": -6.374241828918457, "global_step": 100742, "epoch": 2398} {"train_loss": -6.343549728393555, "global_step": 100743, "epoch": 2398} {"train_loss": -6.225298881530762, "global_step": 100744, "epoch": 2398} {"train_loss": -6.372779369354248, "global_step": 100745, "epoch": 2398} {"train_loss": -6.326968193054199, "global_step": 100746, "epoch": 2398} {"train_loss": -6.309349060058594, "global_step": 100747, "epoch": 2398} {"train_loss": -6.4849700927734375, "global_step": 100748, "epoch": 2398} {"train_loss": -6.364649772644043, "global_step": 100749, "epoch": 2398} {"train_loss": -6.33381462097168, "global_step": 100750, "epoch": 2398} {"train_loss": -6.4067840576171875, "global_step": 100751, "epoch": 2398} {"train_loss": -6.524582386016846, "global_step": 100752, "epoch": 2398} {"train_loss": -6.309222221374512, "global_step": 100753, "epoch": 2398} {"train_loss": -6.375492095947266, "global_step": 100754, "epoch": 2398} {"train_loss": -6.441043376922607, "global_step": 100755, "epoch": 2398} {"train_loss": -6.309212684631348, "global_step": 100756, "epoch": 2398} {"train_loss": -6.330606948761713, "global_step": 100757, "epoch": 2398, "val_loss": 67758.1484375} {"train_loss": -6.379542827606201, "global_step": 100758, "epoch": 2399} {"train_loss": -6.284371852874756, "global_step": 100759, "epoch": 2399} {"train_loss": -6.275723934173584, "global_step": 100760, "epoch": 2399} {"train_loss": -6.343906402587891, "global_step": 100761, "epoch": 2399} {"train_loss": -6.396523952484131, "global_step": 100762, "epoch": 2399} {"train_loss": -6.245875358581543, "global_step": 100763, "epoch": 2399} {"train_loss": -6.240483283996582, "global_step": 100764, "epoch": 2399} {"train_loss": -6.399003982543945, "global_step": 100765, "epoch": 2399} {"train_loss": -6.237246990203857, "global_step": 100766, "epoch": 2399} {"train_loss": -6.376755237579346, "global_step": 100767, "epoch": 2399} {"train_loss": -6.381136894226074, "global_step": 100768, "epoch": 2399} {"train_loss": -6.478173732757568, "global_step": 100769, "epoch": 2399} {"train_loss": -6.261262893676758, "global_step": 100770, "epoch": 2399} {"train_loss": -6.459725379943848, "global_step": 100771, "epoch": 2399} {"train_loss": -6.516297340393066, "global_step": 100772, "epoch": 2399} {"train_loss": -6.476541519165039, "global_step": 100773, "epoch": 2399} {"train_loss": -6.3202996253967285, "global_step": 100774, "epoch": 2399} {"train_loss": -6.425258636474609, "global_step": 100775, "epoch": 2399} {"train_loss": -6.393694877624512, "global_step": 100776, "epoch": 2399} {"train_loss": -6.250123023986816, "global_step": 100777, "epoch": 2399} {"train_loss": -6.41791296005249, "global_step": 100778, "epoch": 2399} {"train_loss": -6.328446865081787, "global_step": 100779, "epoch": 2399} {"train_loss": -6.3859171867370605, "global_step": 100780, "epoch": 2399} {"train_loss": -6.330462455749512, "global_step": 100781, "epoch": 2399} {"train_loss": -6.245670795440674, "global_step": 100782, "epoch": 2399} {"train_loss": -6.423705101013184, "global_step": 100783, "epoch": 2399} {"train_loss": -6.314376354217529, "global_step": 100784, "epoch": 2399} {"train_loss": -6.288667678833008, "global_step": 100785, "epoch": 2399} {"train_loss": -6.40717887878418, "global_step": 100786, "epoch": 2399} {"train_loss": -6.331902503967285, "global_step": 100787, "epoch": 2399} {"train_loss": -6.142364978790283, "global_step": 100788, "epoch": 2399} {"train_loss": -6.264034271240234, "global_step": 100789, "epoch": 2399} {"train_loss": -6.176311492919922, "global_step": 100790, "epoch": 2399} {"train_loss": -6.082451820373535, "global_step": 100791, "epoch": 2399} {"train_loss": -6.353453636169434, "global_step": 100792, "epoch": 2399} {"train_loss": -6.13803768157959, "global_step": 100793, "epoch": 2399} {"train_loss": -6.335585594177246, "global_step": 100794, "epoch": 2399} {"train_loss": -6.210196495056152, "global_step": 100795, "epoch": 2399} {"train_loss": -6.238926887512207, "global_step": 100796, "epoch": 2399} {"train_loss": -6.2844648361206055, "global_step": 100797, "epoch": 2399} {"train_loss": -6.131974220275879, "global_step": 100798, "epoch": 2399} {"train_loss": -6.313608532860165, "global_step": 100799, "epoch": 2399, "val_loss": 68293.5546875} {"train_loss": -6.101131916046143, "global_step": 100800, "epoch": 2400} {"train_loss": -6.248326301574707, "global_step": 100801, "epoch": 2400} {"train_loss": -6.2535552978515625, "global_step": 100802, "epoch": 2400} {"train_loss": -6.300763130187988, "global_step": 100803, "epoch": 2400} {"train_loss": -6.16064453125, "global_step": 100804, "epoch": 2400} {"train_loss": -6.418425559997559, "global_step": 100805, "epoch": 2400} {"train_loss": -6.2194976806640625, "global_step": 100806, "epoch": 2400} {"train_loss": -6.232070446014404, "global_step": 100807, "epoch": 2400} {"train_loss": -6.221344470977783, "global_step": 100808, "epoch": 2400} {"train_loss": -6.384043216705322, "global_step": 100809, "epoch": 2400} {"train_loss": -6.201087951660156, "global_step": 100810, "epoch": 2400} {"train_loss": -6.366299629211426, "global_step": 100811, "epoch": 2400} {"train_loss": -6.258840560913086, "global_step": 100812, "epoch": 2400} {"train_loss": -6.277149200439453, "global_step": 100813, "epoch": 2400} {"train_loss": -6.340600967407227, "global_step": 100814, "epoch": 2400} {"train_loss": -6.225856781005859, "global_step": 100815, "epoch": 2400} {"train_loss": -6.358580589294434, "global_step": 100816, "epoch": 2400} {"train_loss": -6.286617279052734, "global_step": 100817, "epoch": 2400} {"train_loss": -6.379974365234375, "global_step": 100818, "epoch": 2400} {"train_loss": -6.356389045715332, "global_step": 100819, "epoch": 2400} {"train_loss": -6.461279392242432, "global_step": 100820, "epoch": 2400} {"train_loss": -6.375210285186768, "global_step": 100821, "epoch": 2400} {"train_loss": -6.334682941436768, "global_step": 100822, "epoch": 2400} {"train_loss": -6.281214714050293, "global_step": 100823, "epoch": 2400} {"train_loss": -6.377131462097168, "global_step": 100824, "epoch": 2400} {"train_loss": -6.487290382385254, "global_step": 100825, "epoch": 2400} {"train_loss": -6.43170690536499, "global_step": 100826, "epoch": 2400} {"train_loss": -6.268885135650635, "global_step": 100827, "epoch": 2400} {"train_loss": -6.291019916534424, "global_step": 100828, "epoch": 2400} {"train_loss": -6.355598449707031, "global_step": 100829, "epoch": 2400} {"train_loss": -6.313509464263916, "global_step": 100830, "epoch": 2400} {"train_loss": -6.463397026062012, "global_step": 100831, "epoch": 2400} {"train_loss": -6.4184417724609375, "global_step": 100832, "epoch": 2400} {"train_loss": -6.357548713684082, "global_step": 100833, "epoch": 2400} {"train_loss": -6.315155029296875, "global_step": 100834, "epoch": 2400} {"train_loss": -6.305660724639893, "global_step": 100835, "epoch": 2400} {"train_loss": -6.394870281219482, "global_step": 100836, "epoch": 2400} {"train_loss": -6.386275291442871, "global_step": 100837, "epoch": 2400} {"train_loss": -6.191709518432617, "global_step": 100838, "epoch": 2400} {"train_loss": -6.382175445556641, "global_step": 100839, "epoch": 2400} {"train_loss": -6.434640884399414, "global_step": 100840, "epoch": 2400} {"train_loss": -6.322020087923322, "global_step": 100841, "epoch": 2400, "train/sim_max_reward_0": 0.24027202325588048, "train/sim_max_reward_1": 0.9656252336651622, "train/sim_max_reward_2": 0.47463405308533907, "train/sim_max_reward_3": 0.13531133359328715, "train/sim_max_reward_4": 0.8939062561312633, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.44009104861328874, "test/sim_max_reward_4400001": 0.15425472136567384, "test/sim_max_reward_4400002": 0.9135431571470981, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9498925601085425, "test/sim_max_reward_4400007": 0.8983160122355399, "test/sim_max_reward_4400008": 0.31645049320296414, "test/sim_max_reward_4400009": 0.9814560276437642, "test/sim_max_reward_4400010": 0.27436741469930687, "test/sim_max_reward_4400011": 0.2111499322778157, "test/sim_max_reward_4400012": 0.8687362040531037, "test/sim_max_reward_4400013": 0.9759996303325575, "test/sim_max_reward_4400014": 0.20820638146573336, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.20310365056713256, "test/sim_max_reward_4400019": 0.1879565796478618, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8174700135913754, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2729428381902434, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 0.0014509064160487847, "test/sim_max_reward_4400028": 0.44000075327293797, "test/sim_max_reward_4400029": 0.5519541423014346, "test/sim_max_reward_4400030": 0.9866042309110924, "test/sim_max_reward_4400031": 0.9566267758489462, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7578872544013942, "test/sim_max_reward_4400034": 0.9408078467992197, "test/sim_max_reward_4400035": 0.6879802379971144, "test/sim_max_reward_4400036": 0.9955244302815266, "test/sim_max_reward_4400037": 0.9241170040084788, "test/sim_max_reward_4400038": 0.7967858692399779, "test/sim_max_reward_4400039": 0.9206415978680771, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7495614124945813, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.9737257054723258, "test/sim_max_reward_4400044": 0.9763473131001354, "test/sim_max_reward_4400045": 0.8703948404978086, "test/sim_max_reward_4400046": 0.849841004166262, "test/sim_max_reward_4400047": 0.9744237539027376, "test/sim_max_reward_4400048": 0.12117517904820103, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.4837889431821866, "test/mean_score": 0.5144306765194433, "val_loss": 67889.578125} {"train_loss": -6.401578426361084, "global_step": 100842, "epoch": 2401} {"train_loss": -6.246726989746094, "global_step": 100843, "epoch": 2401} {"train_loss": -6.339254379272461, "global_step": 100844, "epoch": 2401} {"train_loss": -6.361690521240234, "global_step": 100845, "epoch": 2401} {"train_loss": -6.243111610412598, "global_step": 100846, "epoch": 2401} {"train_loss": -6.393887996673584, "global_step": 100847, "epoch": 2401} {"train_loss": -6.303492546081543, "global_step": 100848, "epoch": 2401} {"train_loss": -6.309164047241211, "global_step": 100849, "epoch": 2401} {"train_loss": -6.4285888671875, "global_step": 100850, "epoch": 2401} {"train_loss": -6.456875801086426, "global_step": 100851, "epoch": 2401} {"train_loss": -6.414546012878418, "global_step": 100852, "epoch": 2401} {"train_loss": -6.3310136795043945, "global_step": 100853, "epoch": 2401} {"train_loss": -6.3537116050720215, "global_step": 100854, "epoch": 2401} {"train_loss": -6.394865036010742, "global_step": 100855, "epoch": 2401} {"train_loss": -6.375851631164551, "global_step": 100856, "epoch": 2401} {"train_loss": -6.311180591583252, "global_step": 100857, "epoch": 2401} {"train_loss": -6.36981201171875, "global_step": 100858, "epoch": 2401} {"train_loss": -6.338118553161621, "global_step": 100859, "epoch": 2401} {"train_loss": -6.2622456550598145, "global_step": 100860, "epoch": 2401} {"train_loss": -6.428840637207031, "global_step": 100861, "epoch": 2401} {"train_loss": -6.396584987640381, "global_step": 100862, "epoch": 2401} {"train_loss": -6.464107990264893, "global_step": 100863, "epoch": 2401} {"train_loss": -6.363948345184326, "global_step": 100864, "epoch": 2401} {"train_loss": -6.422067642211914, "global_step": 100865, "epoch": 2401} {"train_loss": -6.28461217880249, "global_step": 100866, "epoch": 2401} {"train_loss": -6.334050178527832, "global_step": 100867, "epoch": 2401} {"train_loss": -6.312252044677734, "global_step": 100868, "epoch": 2401} {"train_loss": -6.444677829742432, "global_step": 100869, "epoch": 2401} {"train_loss": -6.4793314933776855, "global_step": 100870, "epoch": 2401} {"train_loss": -6.357361793518066, "global_step": 100871, "epoch": 2401} {"train_loss": -6.291414260864258, "global_step": 100872, "epoch": 2401} {"train_loss": -6.394900321960449, "global_step": 100873, "epoch": 2401} {"train_loss": -6.356289863586426, "global_step": 100874, "epoch": 2401} {"train_loss": -6.406259536743164, "global_step": 100875, "epoch": 2401} {"train_loss": -6.436336994171143, "global_step": 100876, "epoch": 2401} {"train_loss": -6.35471773147583, "global_step": 100877, "epoch": 2401} {"train_loss": -6.320987224578857, "global_step": 100878, "epoch": 2401} {"train_loss": -6.2885847091674805, "global_step": 100879, "epoch": 2401} {"train_loss": -6.39205265045166, "global_step": 100880, "epoch": 2401} {"train_loss": -6.3632965087890625, "global_step": 100881, "epoch": 2401} {"train_loss": -6.2427778244018555, "global_step": 100882, "epoch": 2401} {"train_loss": -6.357015439442226, "global_step": 100883, "epoch": 2401, "val_loss": 67728.890625} {"train_loss": -6.300706386566162, "global_step": 100884, "epoch": 2402} {"train_loss": -6.3186750411987305, "global_step": 100885, "epoch": 2402} {"train_loss": -6.260673999786377, "global_step": 100886, "epoch": 2402} {"train_loss": -6.303476810455322, "global_step": 100887, "epoch": 2402} {"train_loss": -6.286626815795898, "global_step": 100888, "epoch": 2402} {"train_loss": -6.384870529174805, "global_step": 100889, "epoch": 2402} {"train_loss": -6.402299404144287, "global_step": 100890, "epoch": 2402} {"train_loss": -6.351991176605225, "global_step": 100891, "epoch": 2402} {"train_loss": -6.251319885253906, "global_step": 100892, "epoch": 2402} {"train_loss": -6.385078430175781, "global_step": 100893, "epoch": 2402} {"train_loss": -6.377536773681641, "global_step": 100894, "epoch": 2402} {"train_loss": -6.3740339279174805, "global_step": 100895, "epoch": 2402} {"train_loss": -6.419991970062256, "global_step": 100896, "epoch": 2402} {"train_loss": -6.412591934204102, "global_step": 100897, "epoch": 2402} {"train_loss": -6.393677234649658, "global_step": 100898, "epoch": 2402} {"train_loss": -6.372259140014648, "global_step": 100899, "epoch": 2402} {"train_loss": -6.397523880004883, "global_step": 100900, "epoch": 2402} {"train_loss": -6.344701766967773, "global_step": 100901, "epoch": 2402} {"train_loss": -6.445743560791016, "global_step": 100902, "epoch": 2402} {"train_loss": -6.369887351989746, "global_step": 100903, "epoch": 2402} {"train_loss": -6.381828784942627, "global_step": 100904, "epoch": 2402} {"train_loss": -6.322824478149414, "global_step": 100905, "epoch": 2402} {"train_loss": -6.419393539428711, "global_step": 100906, "epoch": 2402} {"train_loss": -6.391321182250977, "global_step": 100907, "epoch": 2402} {"train_loss": -6.312117576599121, "global_step": 100908, "epoch": 2402} {"train_loss": -6.422013282775879, "global_step": 100909, "epoch": 2402} {"train_loss": -6.270682334899902, "global_step": 100910, "epoch": 2402} {"train_loss": -6.4099555015563965, "global_step": 100911, "epoch": 2402} {"train_loss": -6.290544509887695, "global_step": 100912, "epoch": 2402} {"train_loss": -6.409084320068359, "global_step": 100913, "epoch": 2402} {"train_loss": -6.36034631729126, "global_step": 100914, "epoch": 2402} {"train_loss": -6.369503974914551, "global_step": 100915, "epoch": 2402} {"train_loss": -6.306486129760742, "global_step": 100916, "epoch": 2402} {"train_loss": -6.398739337921143, "global_step": 100917, "epoch": 2402} {"train_loss": -6.260570526123047, "global_step": 100918, "epoch": 2402} {"train_loss": -6.382883071899414, "global_step": 100919, "epoch": 2402} {"train_loss": -6.29448938369751, "global_step": 100920, "epoch": 2402} {"train_loss": -6.3397064208984375, "global_step": 100921, "epoch": 2402} {"train_loss": -6.357142448425293, "global_step": 100922, "epoch": 2402} {"train_loss": -6.390244960784912, "global_step": 100923, "epoch": 2402} {"train_loss": -6.34499454498291, "global_step": 100924, "epoch": 2402} {"train_loss": -6.357246660050892, "global_step": 100925, "epoch": 2402, "val_loss": 68067.6171875} {"train_loss": -6.354416847229004, "global_step": 100926, "epoch": 2403} {"train_loss": -6.3797831535339355, "global_step": 100927, "epoch": 2403} {"train_loss": -6.406680107116699, "global_step": 100928, "epoch": 2403} {"train_loss": -6.375490188598633, "global_step": 100929, "epoch": 2403} {"train_loss": -6.302106857299805, "global_step": 100930, "epoch": 2403} {"train_loss": -6.3866729736328125, "global_step": 100931, "epoch": 2403} {"train_loss": -6.328068256378174, "global_step": 100932, "epoch": 2403} {"train_loss": -6.322387218475342, "global_step": 100933, "epoch": 2403} {"train_loss": -6.369126319885254, "global_step": 100934, "epoch": 2403} {"train_loss": -6.252991676330566, "global_step": 100935, "epoch": 2403} {"train_loss": -6.296858787536621, "global_step": 100936, "epoch": 2403} {"train_loss": -6.306626319885254, "global_step": 100937, "epoch": 2403} {"train_loss": -6.238157272338867, "global_step": 100938, "epoch": 2403} {"train_loss": -6.246584892272949, "global_step": 100939, "epoch": 2403} {"train_loss": -6.234921455383301, "global_step": 100940, "epoch": 2403} {"train_loss": -6.322868824005127, "global_step": 100941, "epoch": 2403} {"train_loss": -6.259871482849121, "global_step": 100942, "epoch": 2403} {"train_loss": -6.329102516174316, "global_step": 100943, "epoch": 2403} {"train_loss": -6.346271991729736, "global_step": 100944, "epoch": 2403} {"train_loss": -6.263287544250488, "global_step": 100945, "epoch": 2403} {"train_loss": -6.312893390655518, "global_step": 100946, "epoch": 2403} {"train_loss": -6.367907524108887, "global_step": 100947, "epoch": 2403} {"train_loss": -6.411211013793945, "global_step": 100948, "epoch": 2403} {"train_loss": -6.4495697021484375, "global_step": 100949, "epoch": 2403} {"train_loss": -6.3503336906433105, "global_step": 100950, "epoch": 2403} {"train_loss": -6.415594577789307, "global_step": 100951, "epoch": 2403} {"train_loss": -6.320960998535156, "global_step": 100952, "epoch": 2403} {"train_loss": -6.3661675453186035, "global_step": 100953, "epoch": 2403} {"train_loss": -6.437845230102539, "global_step": 100954, "epoch": 2403} {"train_loss": -6.335908889770508, "global_step": 100955, "epoch": 2403} {"train_loss": -6.393665313720703, "global_step": 100956, "epoch": 2403} {"train_loss": -6.352546691894531, "global_step": 100957, "epoch": 2403} {"train_loss": -6.325036525726318, "global_step": 100958, "epoch": 2403} {"train_loss": -6.385494232177734, "global_step": 100959, "epoch": 2403} {"train_loss": -6.404000282287598, "global_step": 100960, "epoch": 2403} {"train_loss": -6.3753838539123535, "global_step": 100961, "epoch": 2403} {"train_loss": -6.453225135803223, "global_step": 100962, "epoch": 2403} {"train_loss": -6.461668968200684, "global_step": 100963, "epoch": 2403} {"train_loss": -6.431480884552002, "global_step": 100964, "epoch": 2403} {"train_loss": -6.389110565185547, "global_step": 100965, "epoch": 2403} {"train_loss": -6.512195587158203, "global_step": 100966, "epoch": 2403} {"train_loss": -6.355224881853376, "global_step": 100967, "epoch": 2403, "val_loss": 67883.625} {"train_loss": -6.42030143737793, "global_step": 100968, "epoch": 2404} {"train_loss": -6.265723705291748, "global_step": 100969, "epoch": 2404} {"train_loss": -6.429923057556152, "global_step": 100970, "epoch": 2404} {"train_loss": -6.411531448364258, "global_step": 100971, "epoch": 2404} {"train_loss": -6.325214385986328, "global_step": 100972, "epoch": 2404} {"train_loss": -6.279208183288574, "global_step": 100973, "epoch": 2404} {"train_loss": -6.499658584594727, "global_step": 100974, "epoch": 2404} {"train_loss": -6.2665791511535645, "global_step": 100975, "epoch": 2404} {"train_loss": -6.3579816818237305, "global_step": 100976, "epoch": 2404} {"train_loss": -6.355764389038086, "global_step": 100977, "epoch": 2404} {"train_loss": -6.36292839050293, "global_step": 100978, "epoch": 2404} {"train_loss": -6.319570064544678, "global_step": 100979, "epoch": 2404} {"train_loss": -6.374011993408203, "global_step": 100980, "epoch": 2404} {"train_loss": -6.218003273010254, "global_step": 100981, "epoch": 2404} {"train_loss": -6.436612129211426, "global_step": 100982, "epoch": 2404} {"train_loss": -6.342079162597656, "global_step": 100983, "epoch": 2404} {"train_loss": -6.211585521697998, "global_step": 100984, "epoch": 2404} {"train_loss": -6.41316032409668, "global_step": 100985, "epoch": 2404} {"train_loss": -6.365560531616211, "global_step": 100986, "epoch": 2404} {"train_loss": -6.323592185974121, "global_step": 100987, "epoch": 2404} {"train_loss": -6.42011833190918, "global_step": 100988, "epoch": 2404} {"train_loss": -6.408238410949707, "global_step": 100989, "epoch": 2404} {"train_loss": -6.3360915184021, "global_step": 100990, "epoch": 2404} {"train_loss": -6.3124260902404785, "global_step": 100991, "epoch": 2404} {"train_loss": -6.321531772613525, "global_step": 100992, "epoch": 2404} {"train_loss": -6.346812725067139, "global_step": 100993, "epoch": 2404} {"train_loss": -6.476434230804443, "global_step": 100994, "epoch": 2404} {"train_loss": -6.440731525421143, "global_step": 100995, "epoch": 2404} {"train_loss": -6.453701019287109, "global_step": 100996, "epoch": 2404} {"train_loss": -6.359131813049316, "global_step": 100997, "epoch": 2404} {"train_loss": -6.390601634979248, "global_step": 100998, "epoch": 2404} {"train_loss": -6.300717353820801, "global_step": 100999, "epoch": 2404} {"train_loss": -6.3059916496276855, "global_step": 101000, "epoch": 2404} {"train_loss": -6.222728252410889, "global_step": 101001, "epoch": 2404} {"train_loss": -6.27597188949585, "global_step": 101002, "epoch": 2404} {"train_loss": -6.230160236358643, "global_step": 101003, "epoch": 2404} {"train_loss": -6.229448318481445, "global_step": 101004, "epoch": 2404} {"train_loss": -6.295511245727539, "global_step": 101005, "epoch": 2404} {"train_loss": -6.334115982055664, "global_step": 101006, "epoch": 2404} {"train_loss": -6.282609939575195, "global_step": 101007, "epoch": 2404} {"train_loss": -6.334274768829346, "global_step": 101008, "epoch": 2404} {"train_loss": -6.343562920888265, "global_step": 101009, "epoch": 2404, "val_loss": 68121.515625} {"train_loss": -6.271326065063477, "global_step": 101010, "epoch": 2405} {"train_loss": -6.320070266723633, "global_step": 101011, "epoch": 2405} {"train_loss": -6.322084426879883, "global_step": 101012, "epoch": 2405} {"train_loss": -6.3684515953063965, "global_step": 101013, "epoch": 2405} {"train_loss": -6.426689147949219, "global_step": 101014, "epoch": 2405} {"train_loss": -6.339039325714111, "global_step": 101015, "epoch": 2405} {"train_loss": -6.373250484466553, "global_step": 101016, "epoch": 2405} {"train_loss": -6.365803241729736, "global_step": 101017, "epoch": 2405} {"train_loss": -6.309259414672852, "global_step": 101018, "epoch": 2405} {"train_loss": -6.332428932189941, "global_step": 101019, "epoch": 2405} {"train_loss": -6.390320301055908, "global_step": 101020, "epoch": 2405} {"train_loss": -6.380810260772705, "global_step": 101021, "epoch": 2405} {"train_loss": -6.333189010620117, "global_step": 101022, "epoch": 2405} {"train_loss": -6.357328414916992, "global_step": 101023, "epoch": 2405} {"train_loss": -6.38511848449707, "global_step": 101024, "epoch": 2405} {"train_loss": -6.398437976837158, "global_step": 101025, "epoch": 2405} {"train_loss": -6.152505874633789, "global_step": 101026, "epoch": 2405} {"train_loss": -6.167221546173096, "global_step": 101027, "epoch": 2405} {"train_loss": -6.230769157409668, "global_step": 101028, "epoch": 2405} {"train_loss": -6.154631614685059, "global_step": 101029, "epoch": 2405} {"train_loss": -6.2972283363342285, "global_step": 101030, "epoch": 2405} {"train_loss": -6.146705627441406, "global_step": 101031, "epoch": 2405} {"train_loss": -6.305803298950195, "global_step": 101032, "epoch": 2405} {"train_loss": -6.222115516662598, "global_step": 101033, "epoch": 2405} {"train_loss": -6.2401909828186035, "global_step": 101034, "epoch": 2405} {"train_loss": -6.381037712097168, "global_step": 101035, "epoch": 2405} {"train_loss": -6.130204200744629, "global_step": 101036, "epoch": 2405} {"train_loss": -6.314443588256836, "global_step": 101037, "epoch": 2405} {"train_loss": -6.3254523277282715, "global_step": 101038, "epoch": 2405} {"train_loss": -6.346043586730957, "global_step": 101039, "epoch": 2405} {"train_loss": -6.276647567749023, "global_step": 101040, "epoch": 2405} {"train_loss": -6.184446334838867, "global_step": 101041, "epoch": 2405} {"train_loss": -6.263301849365234, "global_step": 101042, "epoch": 2405} {"train_loss": -6.336525917053223, "global_step": 101043, "epoch": 2405} {"train_loss": -6.273550987243652, "global_step": 101044, "epoch": 2405} {"train_loss": -6.281139850616455, "global_step": 101045, "epoch": 2405} {"train_loss": -6.358920097351074, "global_step": 101046, "epoch": 2405} {"train_loss": -6.288393974304199, "global_step": 101047, "epoch": 2405} {"train_loss": -6.5054426193237305, "global_step": 101048, "epoch": 2405} {"train_loss": -6.246550559997559, "global_step": 101049, "epoch": 2405} {"train_loss": -6.338051795959473, "global_step": 101050, "epoch": 2405} {"train_loss": -6.3067893868400935, "global_step": 101051, "epoch": 2405, "val_loss": 68102.3046875} {"train_loss": -6.2475714683532715, "global_step": 101052, "epoch": 2406} {"train_loss": -6.352264404296875, "global_step": 101053, "epoch": 2406} {"train_loss": -6.355090141296387, "global_step": 101054, "epoch": 2406} {"train_loss": -6.3305182456970215, "global_step": 101055, "epoch": 2406} {"train_loss": -6.346050262451172, "global_step": 101056, "epoch": 2406} {"train_loss": -6.422426223754883, "global_step": 101057, "epoch": 2406} {"train_loss": -6.360586643218994, "global_step": 101058, "epoch": 2406} {"train_loss": -6.315232276916504, "global_step": 101059, "epoch": 2406} {"train_loss": -6.416707515716553, "global_step": 101060, "epoch": 2406} {"train_loss": -6.425390243530273, "global_step": 101061, "epoch": 2406} {"train_loss": -6.423336029052734, "global_step": 101062, "epoch": 2406} {"train_loss": -6.370512962341309, "global_step": 101063, "epoch": 2406} {"train_loss": -6.337464809417725, "global_step": 101064, "epoch": 2406} {"train_loss": -6.420627593994141, "global_step": 101065, "epoch": 2406} {"train_loss": -6.347620010375977, "global_step": 101066, "epoch": 2406} {"train_loss": -6.405339241027832, "global_step": 101067, "epoch": 2406} {"train_loss": -6.407289028167725, "global_step": 101068, "epoch": 2406} {"train_loss": -6.482089996337891, "global_step": 101069, "epoch": 2406} {"train_loss": -6.4026336669921875, "global_step": 101070, "epoch": 2406} {"train_loss": -6.3416242599487305, "global_step": 101071, "epoch": 2406} {"train_loss": -6.473074436187744, "global_step": 101072, "epoch": 2406} {"train_loss": -6.387299537658691, "global_step": 101073, "epoch": 2406} {"train_loss": -6.334103107452393, "global_step": 101074, "epoch": 2406} {"train_loss": -6.437417984008789, "global_step": 101075, "epoch": 2406} {"train_loss": -6.367834091186523, "global_step": 101076, "epoch": 2406} {"train_loss": -6.297977447509766, "global_step": 101077, "epoch": 2406} {"train_loss": -6.358701705932617, "global_step": 101078, "epoch": 2406} {"train_loss": -6.353907108306885, "global_step": 101079, "epoch": 2406} {"train_loss": -6.275938987731934, "global_step": 101080, "epoch": 2406} {"train_loss": -6.41049861907959, "global_step": 101081, "epoch": 2406} {"train_loss": -6.275387763977051, "global_step": 101082, "epoch": 2406} {"train_loss": -6.282522201538086, "global_step": 101083, "epoch": 2406} {"train_loss": -6.299992561340332, "global_step": 101084, "epoch": 2406} {"train_loss": -6.494429588317871, "global_step": 101085, "epoch": 2406} {"train_loss": -6.287593841552734, "global_step": 101086, "epoch": 2406} {"train_loss": -6.272287845611572, "global_step": 101087, "epoch": 2406} {"train_loss": -6.299284934997559, "global_step": 101088, "epoch": 2406} {"train_loss": -6.335413932800293, "global_step": 101089, "epoch": 2406} {"train_loss": -6.351620674133301, "global_step": 101090, "epoch": 2406} {"train_loss": -6.387809753417969, "global_step": 101091, "epoch": 2406} {"train_loss": -6.262474060058594, "global_step": 101092, "epoch": 2406} {"train_loss": -6.3611649785723, "global_step": 101093, "epoch": 2406, "val_loss": 67974.6171875} {"train_loss": -6.31408166885376, "global_step": 101094, "epoch": 2407} {"train_loss": -6.36164665222168, "global_step": 101095, "epoch": 2407} {"train_loss": -6.395165920257568, "global_step": 101096, "epoch": 2407} {"train_loss": -6.2549824714660645, "global_step": 101097, "epoch": 2407} {"train_loss": -6.360630035400391, "global_step": 101098, "epoch": 2407} {"train_loss": -6.269283771514893, "global_step": 101099, "epoch": 2407} {"train_loss": -6.400285720825195, "global_step": 101100, "epoch": 2407} {"train_loss": -6.379059791564941, "global_step": 101101, "epoch": 2407} {"train_loss": -6.324287414550781, "global_step": 101102, "epoch": 2407} {"train_loss": -6.438244342803955, "global_step": 101103, "epoch": 2407} {"train_loss": -6.239421367645264, "global_step": 101104, "epoch": 2407} {"train_loss": -6.343480587005615, "global_step": 101105, "epoch": 2407} {"train_loss": -6.242338180541992, "global_step": 101106, "epoch": 2407} {"train_loss": -6.392043590545654, "global_step": 101107, "epoch": 2407} {"train_loss": -6.284402370452881, "global_step": 101108, "epoch": 2407} {"train_loss": -6.32313346862793, "global_step": 101109, "epoch": 2407} {"train_loss": -6.415825366973877, "global_step": 101110, "epoch": 2407} {"train_loss": -6.189186096191406, "global_step": 101111, "epoch": 2407} {"train_loss": -6.255533218383789, "global_step": 101112, "epoch": 2407} {"train_loss": -6.138005256652832, "global_step": 101113, "epoch": 2407} {"train_loss": -6.287602424621582, "global_step": 101114, "epoch": 2407} {"train_loss": -6.3161540031433105, "global_step": 101115, "epoch": 2407} {"train_loss": -6.312177658081055, "global_step": 101116, "epoch": 2407} {"train_loss": -6.30103063583374, "global_step": 101117, "epoch": 2407} {"train_loss": -6.267398834228516, "global_step": 101118, "epoch": 2407} {"train_loss": -6.3045148849487305, "global_step": 101119, "epoch": 2407} {"train_loss": -6.157289505004883, "global_step": 101120, "epoch": 2407} {"train_loss": -6.294867515563965, "global_step": 101121, "epoch": 2407} {"train_loss": -6.37625789642334, "global_step": 101122, "epoch": 2407} {"train_loss": -6.381799697875977, "global_step": 101123, "epoch": 2407} {"train_loss": -6.2576704025268555, "global_step": 101124, "epoch": 2407} {"train_loss": -6.324775695800781, "global_step": 101125, "epoch": 2407} {"train_loss": -6.449906349182129, "global_step": 101126, "epoch": 2407} {"train_loss": -6.386057376861572, "global_step": 101127, "epoch": 2407} {"train_loss": -6.252449035644531, "global_step": 101128, "epoch": 2407} {"train_loss": -6.308104515075684, "global_step": 101129, "epoch": 2407} {"train_loss": -6.262308120727539, "global_step": 101130, "epoch": 2407} {"train_loss": -6.441227912902832, "global_step": 101131, "epoch": 2407} {"train_loss": -6.479859828948975, "global_step": 101132, "epoch": 2407} {"train_loss": -6.355664253234863, "global_step": 101133, "epoch": 2407} {"train_loss": -6.426548957824707, "global_step": 101134, "epoch": 2407} {"train_loss": -6.326197442554292, "global_step": 101135, "epoch": 2407, "val_loss": 67852.671875} {"train_loss": -6.4091997146606445, "global_step": 101136, "epoch": 2408} {"train_loss": -6.523570537567139, "global_step": 101137, "epoch": 2408} {"train_loss": -6.157686233520508, "global_step": 101138, "epoch": 2408} {"train_loss": -6.329083442687988, "global_step": 101139, "epoch": 2408} {"train_loss": -6.3347320556640625, "global_step": 101140, "epoch": 2408} {"train_loss": -6.217100143432617, "global_step": 101141, "epoch": 2408} {"train_loss": -6.32187032699585, "global_step": 101142, "epoch": 2408} {"train_loss": -6.406458854675293, "global_step": 101143, "epoch": 2408} {"train_loss": -6.330989837646484, "global_step": 101144, "epoch": 2408} {"train_loss": -6.362318992614746, "global_step": 101145, "epoch": 2408} {"train_loss": -6.373849391937256, "global_step": 101146, "epoch": 2408} {"train_loss": -6.225465774536133, "global_step": 101147, "epoch": 2408} {"train_loss": -6.322043418884277, "global_step": 101148, "epoch": 2408} {"train_loss": -6.346158504486084, "global_step": 101149, "epoch": 2408} {"train_loss": -6.298665523529053, "global_step": 101150, "epoch": 2408} {"train_loss": -6.309575080871582, "global_step": 101151, "epoch": 2408} {"train_loss": -6.267258644104004, "global_step": 101152, "epoch": 2408} {"train_loss": -6.348716735839844, "global_step": 101153, "epoch": 2408} {"train_loss": -6.294371604919434, "global_step": 101154, "epoch": 2408} {"train_loss": -6.4420695304870605, "global_step": 101155, "epoch": 2408} {"train_loss": -6.346799850463867, "global_step": 101156, "epoch": 2408} {"train_loss": -6.345037937164307, "global_step": 101157, "epoch": 2408} {"train_loss": -6.373918533325195, "global_step": 101158, "epoch": 2408} {"train_loss": -6.307947635650635, "global_step": 101159, "epoch": 2408} {"train_loss": -6.361658096313477, "global_step": 101160, "epoch": 2408} {"train_loss": -6.413371562957764, "global_step": 101161, "epoch": 2408} {"train_loss": -6.385168075561523, "global_step": 101162, "epoch": 2408} {"train_loss": -6.252384185791016, "global_step": 101163, "epoch": 2408} {"train_loss": -6.329848766326904, "global_step": 101164, "epoch": 2408} {"train_loss": -6.453005790710449, "global_step": 101165, "epoch": 2408} {"train_loss": -6.42302942276001, "global_step": 101166, "epoch": 2408} {"train_loss": -6.40704345703125, "global_step": 101167, "epoch": 2408} {"train_loss": -6.296487808227539, "global_step": 101168, "epoch": 2408} {"train_loss": -6.324508190155029, "global_step": 101169, "epoch": 2408} {"train_loss": -6.473016738891602, "global_step": 101170, "epoch": 2408} {"train_loss": -6.414272308349609, "global_step": 101171, "epoch": 2408} {"train_loss": -6.3766398429870605, "global_step": 101172, "epoch": 2408} {"train_loss": -6.354360103607178, "global_step": 101173, "epoch": 2408} {"train_loss": -6.354309558868408, "global_step": 101174, "epoch": 2408} {"train_loss": -6.319668769836426, "global_step": 101175, "epoch": 2408} {"train_loss": -6.374154090881348, "global_step": 101176, "epoch": 2408} {"train_loss": -6.350923504148211, "global_step": 101177, "epoch": 2408, "val_loss": 67930.015625} {"train_loss": -6.389595031738281, "global_step": 101178, "epoch": 2409} {"train_loss": -6.306303977966309, "global_step": 101179, "epoch": 2409} {"train_loss": -6.266735076904297, "global_step": 101180, "epoch": 2409} {"train_loss": -6.305550575256348, "global_step": 101181, "epoch": 2409} {"train_loss": -6.333827495574951, "global_step": 101182, "epoch": 2409} {"train_loss": -6.377252578735352, "global_step": 101183, "epoch": 2409} {"train_loss": -6.385890483856201, "global_step": 101184, "epoch": 2409} {"train_loss": -6.217085361480713, "global_step": 101185, "epoch": 2409} {"train_loss": -6.318300247192383, "global_step": 101186, "epoch": 2409} {"train_loss": -6.42498779296875, "global_step": 101187, "epoch": 2409} {"train_loss": -6.396103858947754, "global_step": 101188, "epoch": 2409} {"train_loss": -6.372159957885742, "global_step": 101189, "epoch": 2409} {"train_loss": -6.421117782592773, "global_step": 101190, "epoch": 2409} {"train_loss": -6.253873825073242, "global_step": 101191, "epoch": 2409} {"train_loss": -6.354745388031006, "global_step": 101192, "epoch": 2409} {"train_loss": -6.326356887817383, "global_step": 101193, "epoch": 2409} {"train_loss": -6.312959671020508, "global_step": 101194, "epoch": 2409} {"train_loss": -6.387918949127197, "global_step": 101195, "epoch": 2409} {"train_loss": -6.384224891662598, "global_step": 101196, "epoch": 2409} {"train_loss": -6.268640041351318, "global_step": 101197, "epoch": 2409} {"train_loss": -6.277277946472168, "global_step": 101198, "epoch": 2409} {"train_loss": -6.402582168579102, "global_step": 101199, "epoch": 2409} {"train_loss": -6.350005149841309, "global_step": 101200, "epoch": 2409} {"train_loss": -6.440299987792969, "global_step": 101201, "epoch": 2409} {"train_loss": -6.500615119934082, "global_step": 101202, "epoch": 2409} {"train_loss": -6.403261184692383, "global_step": 101203, "epoch": 2409} {"train_loss": -6.2388014793396, "global_step": 101204, "epoch": 2409} {"train_loss": -6.370182991027832, "global_step": 101205, "epoch": 2409} {"train_loss": -6.181229591369629, "global_step": 101206, "epoch": 2409} {"train_loss": -6.432621002197266, "global_step": 101207, "epoch": 2409} {"train_loss": -6.281671524047852, "global_step": 101208, "epoch": 2409} {"train_loss": -6.352215766906738, "global_step": 101209, "epoch": 2409} {"train_loss": -6.402334690093994, "global_step": 101210, "epoch": 2409} {"train_loss": -6.364048004150391, "global_step": 101211, "epoch": 2409} {"train_loss": -6.375443458557129, "global_step": 101212, "epoch": 2409} {"train_loss": -6.224767208099365, "global_step": 101213, "epoch": 2409} {"train_loss": -6.346181869506836, "global_step": 101214, "epoch": 2409} {"train_loss": -6.354027271270752, "global_step": 101215, "epoch": 2409} {"train_loss": -6.254587173461914, "global_step": 101216, "epoch": 2409} {"train_loss": -6.394905090332031, "global_step": 101217, "epoch": 2409} {"train_loss": -6.296097278594971, "global_step": 101218, "epoch": 2409} {"train_loss": -6.341497602916899, "global_step": 101219, "epoch": 2409, "val_loss": 68012.8515625} {"train_loss": -6.371850967407227, "global_step": 101220, "epoch": 2410} {"train_loss": -6.404246807098389, "global_step": 101221, "epoch": 2410} {"train_loss": -6.34569787979126, "global_step": 101222, "epoch": 2410} {"train_loss": -6.35744047164917, "global_step": 101223, "epoch": 2410} {"train_loss": -6.311810493469238, "global_step": 101224, "epoch": 2410} {"train_loss": -6.413163185119629, "global_step": 101225, "epoch": 2410} {"train_loss": -6.300588130950928, "global_step": 101226, "epoch": 2410} {"train_loss": -6.329982280731201, "global_step": 101227, "epoch": 2410} {"train_loss": -6.273928165435791, "global_step": 101228, "epoch": 2410} {"train_loss": -6.402329444885254, "global_step": 101229, "epoch": 2410} {"train_loss": -6.249490737915039, "global_step": 101230, "epoch": 2410} {"train_loss": -6.407978057861328, "global_step": 101231, "epoch": 2410} {"train_loss": -6.331184387207031, "global_step": 101232, "epoch": 2410} {"train_loss": -6.298645973205566, "global_step": 101233, "epoch": 2410} {"train_loss": -6.334518909454346, "global_step": 101234, "epoch": 2410} {"train_loss": -6.135951995849609, "global_step": 101235, "epoch": 2410} {"train_loss": -6.288009166717529, "global_step": 101236, "epoch": 2410} {"train_loss": -6.313745021820068, "global_step": 101237, "epoch": 2410} {"train_loss": -6.195792198181152, "global_step": 101238, "epoch": 2410} {"train_loss": -6.336450576782227, "global_step": 101239, "epoch": 2410} {"train_loss": -6.241525173187256, "global_step": 101240, "epoch": 2410} {"train_loss": -6.336689472198486, "global_step": 101241, "epoch": 2410} {"train_loss": -6.236419677734375, "global_step": 101242, "epoch": 2410} {"train_loss": -6.2648515701293945, "global_step": 101243, "epoch": 2410} {"train_loss": -6.315349578857422, "global_step": 101244, "epoch": 2410} {"train_loss": -6.270127296447754, "global_step": 101245, "epoch": 2410} {"train_loss": -6.303711414337158, "global_step": 101246, "epoch": 2410} {"train_loss": -6.271625995635986, "global_step": 101247, "epoch": 2410} {"train_loss": -6.320688247680664, "global_step": 101248, "epoch": 2410} {"train_loss": -6.328751564025879, "global_step": 101249, "epoch": 2410} {"train_loss": -6.351649284362793, "global_step": 101250, "epoch": 2410} {"train_loss": -6.102809906005859, "global_step": 101251, "epoch": 2410} {"train_loss": -6.420757293701172, "global_step": 101252, "epoch": 2410} {"train_loss": -6.319870471954346, "global_step": 101253, "epoch": 2410} {"train_loss": -6.2782182693481445, "global_step": 101254, "epoch": 2410} {"train_loss": -6.302839756011963, "global_step": 101255, "epoch": 2410} {"train_loss": -6.385984420776367, "global_step": 101256, "epoch": 2410} {"train_loss": -6.310783386230469, "global_step": 101257, "epoch": 2410} {"train_loss": -6.27864933013916, "global_step": 101258, "epoch": 2410} {"train_loss": -6.401447296142578, "global_step": 101259, "epoch": 2410} {"train_loss": -6.1855669021606445, "global_step": 101260, "epoch": 2410} {"train_loss": -6.3082998025984995, "global_step": 101261, "epoch": 2410, "val_loss": 67942.3828125} {"train_loss": -6.376864433288574, "global_step": 101262, "epoch": 2411} {"train_loss": -6.318690299987793, "global_step": 101263, "epoch": 2411} {"train_loss": -6.345269203186035, "global_step": 101264, "epoch": 2411} {"train_loss": -6.26655387878418, "global_step": 101265, "epoch": 2411} {"train_loss": -6.398784637451172, "global_step": 101266, "epoch": 2411} {"train_loss": -6.187522888183594, "global_step": 101267, "epoch": 2411} {"train_loss": -6.442076683044434, "global_step": 101268, "epoch": 2411} {"train_loss": -6.4709882736206055, "global_step": 101269, "epoch": 2411} {"train_loss": -6.36077356338501, "global_step": 101270, "epoch": 2411} {"train_loss": -6.188653945922852, "global_step": 101271, "epoch": 2411} {"train_loss": -6.29672908782959, "global_step": 101272, "epoch": 2411} {"train_loss": -6.339451789855957, "global_step": 101273, "epoch": 2411} {"train_loss": -6.486090660095215, "global_step": 101274, "epoch": 2411} {"train_loss": -6.357435703277588, "global_step": 101275, "epoch": 2411} {"train_loss": -6.341628551483154, "global_step": 101276, "epoch": 2411} {"train_loss": -6.248647212982178, "global_step": 101277, "epoch": 2411} {"train_loss": -6.296213626861572, "global_step": 101278, "epoch": 2411} {"train_loss": -6.302525520324707, "global_step": 101279, "epoch": 2411} {"train_loss": -6.397565841674805, "global_step": 101280, "epoch": 2411} {"train_loss": -6.404659271240234, "global_step": 101281, "epoch": 2411} {"train_loss": -6.196586608886719, "global_step": 101282, "epoch": 2411} {"train_loss": -6.319334030151367, "global_step": 101283, "epoch": 2411} {"train_loss": -6.174116611480713, "global_step": 101284, "epoch": 2411} {"train_loss": -6.363516330718994, "global_step": 101285, "epoch": 2411} {"train_loss": -6.4210968017578125, "global_step": 101286, "epoch": 2411} {"train_loss": -6.216190814971924, "global_step": 101287, "epoch": 2411} {"train_loss": -6.311847686767578, "global_step": 101288, "epoch": 2411} {"train_loss": -6.367275238037109, "global_step": 101289, "epoch": 2411} {"train_loss": -6.26911735534668, "global_step": 101290, "epoch": 2411} {"train_loss": -6.30961275100708, "global_step": 101291, "epoch": 2411} {"train_loss": -6.272322177886963, "global_step": 101292, "epoch": 2411} {"train_loss": -6.309096336364746, "global_step": 101293, "epoch": 2411} {"train_loss": -6.289304733276367, "global_step": 101294, "epoch": 2411} {"train_loss": -6.313161373138428, "global_step": 101295, "epoch": 2411} {"train_loss": -6.539433479309082, "global_step": 101296, "epoch": 2411} {"train_loss": -6.341577529907227, "global_step": 101297, "epoch": 2411} {"train_loss": -6.344150543212891, "global_step": 101298, "epoch": 2411} {"train_loss": -6.406181335449219, "global_step": 101299, "epoch": 2411} {"train_loss": -6.402413845062256, "global_step": 101300, "epoch": 2411} {"train_loss": -6.291716575622559, "global_step": 101301, "epoch": 2411} {"train_loss": -6.347900390625, "global_step": 101302, "epoch": 2411} {"train_loss": -6.331688358670189, "global_step": 101303, "epoch": 2411, "val_loss": 67843.625} {"train_loss": -6.304701328277588, "global_step": 101304, "epoch": 2412} {"train_loss": -6.386052131652832, "global_step": 101305, "epoch": 2412} {"train_loss": -6.267953395843506, "global_step": 101306, "epoch": 2412} {"train_loss": -6.405070781707764, "global_step": 101307, "epoch": 2412} {"train_loss": -6.330175399780273, "global_step": 101308, "epoch": 2412} {"train_loss": -6.395074844360352, "global_step": 101309, "epoch": 2412} {"train_loss": -6.4409685134887695, "global_step": 101310, "epoch": 2412} {"train_loss": -6.344430446624756, "global_step": 101311, "epoch": 2412} {"train_loss": -6.364996910095215, "global_step": 101312, "epoch": 2412} {"train_loss": -6.347349166870117, "global_step": 101313, "epoch": 2412} {"train_loss": -6.37288761138916, "global_step": 101314, "epoch": 2412} {"train_loss": -6.265521049499512, "global_step": 101315, "epoch": 2412} {"train_loss": -6.376789093017578, "global_step": 101316, "epoch": 2412} {"train_loss": -6.300021171569824, "global_step": 101317, "epoch": 2412} {"train_loss": -6.3949995040893555, "global_step": 101318, "epoch": 2412} {"train_loss": -6.444327354431152, "global_step": 101319, "epoch": 2412} {"train_loss": -6.402067184448242, "global_step": 101320, "epoch": 2412} {"train_loss": -6.2815351486206055, "global_step": 101321, "epoch": 2412} {"train_loss": -6.449955940246582, "global_step": 101322, "epoch": 2412} {"train_loss": -6.372358798980713, "global_step": 101323, "epoch": 2412} {"train_loss": -6.2958478927612305, "global_step": 101324, "epoch": 2412} {"train_loss": -6.288076400756836, "global_step": 101325, "epoch": 2412} {"train_loss": -6.375121116638184, "global_step": 101326, "epoch": 2412} {"train_loss": -6.357151985168457, "global_step": 101327, "epoch": 2412} {"train_loss": -6.402772426605225, "global_step": 101328, "epoch": 2412} {"train_loss": -6.224776268005371, "global_step": 101329, "epoch": 2412} {"train_loss": -6.4490966796875, "global_step": 101330, "epoch": 2412} {"train_loss": -6.47753381729126, "global_step": 101331, "epoch": 2412} {"train_loss": -6.4237380027771, "global_step": 101332, "epoch": 2412} {"train_loss": -6.457115650177002, "global_step": 101333, "epoch": 2412} {"train_loss": -6.386872291564941, "global_step": 101334, "epoch": 2412} {"train_loss": -6.280796051025391, "global_step": 101335, "epoch": 2412} {"train_loss": -6.275700092315674, "global_step": 101336, "epoch": 2412} {"train_loss": -6.355961799621582, "global_step": 101337, "epoch": 2412} {"train_loss": -6.319942474365234, "global_step": 101338, "epoch": 2412} {"train_loss": -6.423313140869141, "global_step": 101339, "epoch": 2412} {"train_loss": -6.336363792419434, "global_step": 101340, "epoch": 2412} {"train_loss": -6.282999515533447, "global_step": 101341, "epoch": 2412} {"train_loss": -6.365818977355957, "global_step": 101342, "epoch": 2412} {"train_loss": -6.415477752685547, "global_step": 101343, "epoch": 2412} {"train_loss": -6.35517692565918, "global_step": 101344, "epoch": 2412} {"train_loss": -6.361979416438511, "global_step": 101345, "epoch": 2412, "val_loss": 67814.0859375} {"train_loss": -6.322486400604248, "global_step": 101346, "epoch": 2413} {"train_loss": -6.41032600402832, "global_step": 101347, "epoch": 2413} {"train_loss": -6.305383205413818, "global_step": 101348, "epoch": 2413} {"train_loss": -6.34322452545166, "global_step": 101349, "epoch": 2413} {"train_loss": -6.357510566711426, "global_step": 101350, "epoch": 2413} {"train_loss": -6.374417304992676, "global_step": 101351, "epoch": 2413} {"train_loss": -6.497082710266113, "global_step": 101352, "epoch": 2413} {"train_loss": -6.549127101898193, "global_step": 101353, "epoch": 2413} {"train_loss": -6.292161464691162, "global_step": 101354, "epoch": 2413} {"train_loss": -6.346556663513184, "global_step": 101355, "epoch": 2413} {"train_loss": -6.370007514953613, "global_step": 101356, "epoch": 2413} {"train_loss": -6.366688251495361, "global_step": 101357, "epoch": 2413} {"train_loss": -6.239679336547852, "global_step": 101358, "epoch": 2413} {"train_loss": -6.363691329956055, "global_step": 101359, "epoch": 2413} {"train_loss": -6.3052167892456055, "global_step": 101360, "epoch": 2413} {"train_loss": -6.406956195831299, "global_step": 101361, "epoch": 2413} {"train_loss": -6.359068870544434, "global_step": 101362, "epoch": 2413} {"train_loss": -6.355206489562988, "global_step": 101363, "epoch": 2413} {"train_loss": -6.367112159729004, "global_step": 101364, "epoch": 2413} {"train_loss": -6.3817949295043945, "global_step": 101365, "epoch": 2413} {"train_loss": -6.212515830993652, "global_step": 101366, "epoch": 2413} {"train_loss": -6.299352169036865, "global_step": 101367, "epoch": 2413} {"train_loss": -6.442325592041016, "global_step": 101368, "epoch": 2413} {"train_loss": -6.281702041625977, "global_step": 101369, "epoch": 2413} {"train_loss": -6.344357490539551, "global_step": 101370, "epoch": 2413} {"train_loss": -6.261649131774902, "global_step": 101371, "epoch": 2413} {"train_loss": -6.360857963562012, "global_step": 101372, "epoch": 2413} {"train_loss": -6.3473992347717285, "global_step": 101373, "epoch": 2413} {"train_loss": -6.281814098358154, "global_step": 101374, "epoch": 2413} {"train_loss": -6.455717086791992, "global_step": 101375, "epoch": 2413} {"train_loss": -6.386040210723877, "global_step": 101376, "epoch": 2413} {"train_loss": -6.341326713562012, "global_step": 101377, "epoch": 2413} {"train_loss": -6.467471599578857, "global_step": 101378, "epoch": 2413} {"train_loss": -6.3461480140686035, "global_step": 101379, "epoch": 2413} {"train_loss": -6.419336795806885, "global_step": 101380, "epoch": 2413} {"train_loss": -6.415776252746582, "global_step": 101381, "epoch": 2413} {"train_loss": -6.195004463195801, "global_step": 101382, "epoch": 2413} {"train_loss": -6.280637741088867, "global_step": 101383, "epoch": 2413} {"train_loss": -6.2740936279296875, "global_step": 101384, "epoch": 2413} {"train_loss": -6.250120639801025, "global_step": 101385, "epoch": 2413} {"train_loss": -6.274552822113037, "global_step": 101386, "epoch": 2413} {"train_loss": -6.344961041495914, "global_step": 101387, "epoch": 2413, "val_loss": 68056.4609375} {"train_loss": -6.258995532989502, "global_step": 101388, "epoch": 2414} {"train_loss": -6.306585311889648, "global_step": 101389, "epoch": 2414} {"train_loss": -6.304232597351074, "global_step": 101390, "epoch": 2414} {"train_loss": -6.328620910644531, "global_step": 101391, "epoch": 2414} {"train_loss": -6.337176322937012, "global_step": 101392, "epoch": 2414} {"train_loss": -6.28695011138916, "global_step": 101393, "epoch": 2414} {"train_loss": -6.356161117553711, "global_step": 101394, "epoch": 2414} {"train_loss": -6.187966346740723, "global_step": 101395, "epoch": 2414} {"train_loss": -6.283109188079834, "global_step": 101396, "epoch": 2414} {"train_loss": -6.4185004234313965, "global_step": 101397, "epoch": 2414} {"train_loss": -6.206201553344727, "global_step": 101398, "epoch": 2414} {"train_loss": -6.310693740844727, "global_step": 101399, "epoch": 2414} {"train_loss": -6.256461143493652, "global_step": 101400, "epoch": 2414} {"train_loss": -6.346149444580078, "global_step": 101401, "epoch": 2414} {"train_loss": -6.440615653991699, "global_step": 101402, "epoch": 2414} {"train_loss": -6.379622936248779, "global_step": 101403, "epoch": 2414} {"train_loss": -6.348535537719727, "global_step": 101404, "epoch": 2414} {"train_loss": -6.43581485748291, "global_step": 101405, "epoch": 2414} {"train_loss": -6.355355739593506, "global_step": 101406, "epoch": 2414} {"train_loss": -6.407397270202637, "global_step": 101407, "epoch": 2414} {"train_loss": -6.3579607009887695, "global_step": 101408, "epoch": 2414} {"train_loss": -6.445345878601074, "global_step": 101409, "epoch": 2414} {"train_loss": -6.480199813842773, "global_step": 101410, "epoch": 2414} {"train_loss": -6.403420925140381, "global_step": 101411, "epoch": 2414} {"train_loss": -6.337321758270264, "global_step": 101412, "epoch": 2414} {"train_loss": -6.353568077087402, "global_step": 101413, "epoch": 2414} {"train_loss": -6.34161901473999, "global_step": 101414, "epoch": 2414} {"train_loss": -6.335749626159668, "global_step": 101415, "epoch": 2414} {"train_loss": -6.3238372802734375, "global_step": 101416, "epoch": 2414} {"train_loss": -6.424332141876221, "global_step": 101417, "epoch": 2414} {"train_loss": -6.377768039703369, "global_step": 101418, "epoch": 2414} {"train_loss": -6.2519636154174805, "global_step": 101419, "epoch": 2414} {"train_loss": -6.3020453453063965, "global_step": 101420, "epoch": 2414} {"train_loss": -6.370278835296631, "global_step": 101421, "epoch": 2414} {"train_loss": -6.3973164558410645, "global_step": 101422, "epoch": 2414} {"train_loss": -6.383747100830078, "global_step": 101423, "epoch": 2414} {"train_loss": -6.314400672912598, "global_step": 101424, "epoch": 2414} {"train_loss": -6.392783164978027, "global_step": 101425, "epoch": 2414} {"train_loss": -6.311635494232178, "global_step": 101426, "epoch": 2414} {"train_loss": -6.346243381500244, "global_step": 101427, "epoch": 2414} {"train_loss": -6.35340690612793, "global_step": 101428, "epoch": 2414} {"train_loss": -6.343888282775879, "global_step": 101429, "epoch": 2414, "val_loss": 67921.671875} {"train_loss": -6.464204788208008, "global_step": 101430, "epoch": 2415} {"train_loss": -6.181497573852539, "global_step": 101431, "epoch": 2415} {"train_loss": -6.303404808044434, "global_step": 101432, "epoch": 2415} {"train_loss": -6.336450576782227, "global_step": 101433, "epoch": 2415} {"train_loss": -6.2737836837768555, "global_step": 101434, "epoch": 2415} {"train_loss": -6.314819812774658, "global_step": 101435, "epoch": 2415} {"train_loss": -6.347504615783691, "global_step": 101436, "epoch": 2415} {"train_loss": -6.39564323425293, "global_step": 101437, "epoch": 2415} {"train_loss": -6.320252418518066, "global_step": 101438, "epoch": 2415} {"train_loss": -6.288732051849365, "global_step": 101439, "epoch": 2415} {"train_loss": -6.259515762329102, "global_step": 101440, "epoch": 2415} {"train_loss": -6.367293357849121, "global_step": 101441, "epoch": 2415} {"train_loss": -6.352232933044434, "global_step": 101442, "epoch": 2415} {"train_loss": -6.296120643615723, "global_step": 101443, "epoch": 2415} {"train_loss": -6.3373703956604, "global_step": 101444, "epoch": 2415} {"train_loss": -6.380331039428711, "global_step": 101445, "epoch": 2415} {"train_loss": -6.332435607910156, "global_step": 101446, "epoch": 2415} {"train_loss": -6.401334285736084, "global_step": 101447, "epoch": 2415} {"train_loss": -6.443334579467773, "global_step": 101448, "epoch": 2415} {"train_loss": -6.448661804199219, "global_step": 101449, "epoch": 2415} {"train_loss": -6.394876003265381, "global_step": 101450, "epoch": 2415} {"train_loss": -6.339359760284424, "global_step": 101451, "epoch": 2415} {"train_loss": -6.235068321228027, "global_step": 101452, "epoch": 2415} {"train_loss": -6.289525032043457, "global_step": 101453, "epoch": 2415} {"train_loss": -6.351635932922363, "global_step": 101454, "epoch": 2415} {"train_loss": -6.461190223693848, "global_step": 101455, "epoch": 2415} {"train_loss": -6.4280571937561035, "global_step": 101456, "epoch": 2415} {"train_loss": -6.379342555999756, "global_step": 101457, "epoch": 2415} {"train_loss": -6.356638431549072, "global_step": 101458, "epoch": 2415} {"train_loss": -6.371431350708008, "global_step": 101459, "epoch": 2415} {"train_loss": -6.250786781311035, "global_step": 101460, "epoch": 2415} {"train_loss": -6.393730163574219, "global_step": 101461, "epoch": 2415} {"train_loss": -6.4114580154418945, "global_step": 101462, "epoch": 2415} {"train_loss": -6.410499095916748, "global_step": 101463, "epoch": 2415} {"train_loss": -6.183374404907227, "global_step": 101464, "epoch": 2415} {"train_loss": -6.359781742095947, "global_step": 101465, "epoch": 2415} {"train_loss": -6.457729339599609, "global_step": 101466, "epoch": 2415} {"train_loss": -6.204911231994629, "global_step": 101467, "epoch": 2415} {"train_loss": -6.257864952087402, "global_step": 101468, "epoch": 2415} {"train_loss": -6.330083847045898, "global_step": 101469, "epoch": 2415} {"train_loss": -6.32573127746582, "global_step": 101470, "epoch": 2415} {"train_loss": -6.344835724149432, "global_step": 101471, "epoch": 2415, "val_loss": 68068.5703125} {"train_loss": -6.383908271789551, "global_step": 101472, "epoch": 2416} {"train_loss": -6.446612358093262, "global_step": 101473, "epoch": 2416} {"train_loss": -6.369178295135498, "global_step": 101474, "epoch": 2416} {"train_loss": -6.254561424255371, "global_step": 101475, "epoch": 2416} {"train_loss": -6.392642974853516, "global_step": 101476, "epoch": 2416} {"train_loss": -6.27622127532959, "global_step": 101477, "epoch": 2416} {"train_loss": -6.387697696685791, "global_step": 101478, "epoch": 2416} {"train_loss": -6.382785797119141, "global_step": 101479, "epoch": 2416} {"train_loss": -6.2516679763793945, "global_step": 101480, "epoch": 2416} {"train_loss": -6.329150676727295, "global_step": 101481, "epoch": 2416} {"train_loss": -6.3836445808410645, "global_step": 101482, "epoch": 2416} {"train_loss": -6.37321662902832, "global_step": 101483, "epoch": 2416} {"train_loss": -6.279641628265381, "global_step": 101484, "epoch": 2416} {"train_loss": -6.40789794921875, "global_step": 101485, "epoch": 2416} {"train_loss": -6.219822883605957, "global_step": 101486, "epoch": 2416} {"train_loss": -6.4100341796875, "global_step": 101487, "epoch": 2416} {"train_loss": -6.425745010375977, "global_step": 101488, "epoch": 2416} {"train_loss": -6.355954170227051, "global_step": 101489, "epoch": 2416} {"train_loss": -6.366509914398193, "global_step": 101490, "epoch": 2416} {"train_loss": -6.334292411804199, "global_step": 101491, "epoch": 2416} {"train_loss": -6.301037788391113, "global_step": 101492, "epoch": 2416} {"train_loss": -6.266626358032227, "global_step": 101493, "epoch": 2416} {"train_loss": -6.356738090515137, "global_step": 101494, "epoch": 2416} {"train_loss": -6.336562156677246, "global_step": 101495, "epoch": 2416} {"train_loss": -6.320251941680908, "global_step": 101496, "epoch": 2416} {"train_loss": -6.414411544799805, "global_step": 101497, "epoch": 2416} {"train_loss": -6.324188232421875, "global_step": 101498, "epoch": 2416} {"train_loss": -6.4071760177612305, "global_step": 101499, "epoch": 2416} {"train_loss": -6.45506477355957, "global_step": 101500, "epoch": 2416} {"train_loss": -6.385498046875, "global_step": 101501, "epoch": 2416} {"train_loss": -6.325089454650879, "global_step": 101502, "epoch": 2416} {"train_loss": -6.430880546569824, "global_step": 101503, "epoch": 2416} {"train_loss": -6.342840671539307, "global_step": 101504, "epoch": 2416} {"train_loss": -6.387423038482666, "global_step": 101505, "epoch": 2416} {"train_loss": -6.265469551086426, "global_step": 101506, "epoch": 2416} {"train_loss": -6.393735885620117, "global_step": 101507, "epoch": 2416} {"train_loss": -6.321866035461426, "global_step": 101508, "epoch": 2416} {"train_loss": -6.329695701599121, "global_step": 101509, "epoch": 2416} {"train_loss": -6.253995895385742, "global_step": 101510, "epoch": 2416} {"train_loss": -6.437507629394531, "global_step": 101511, "epoch": 2416} {"train_loss": -6.38469123840332, "global_step": 101512, "epoch": 2416} {"train_loss": -6.349630628313337, "global_step": 101513, "epoch": 2416, "val_loss": 67881.25} {"train_loss": -6.343451023101807, "global_step": 101514, "epoch": 2417} {"train_loss": -6.308296203613281, "global_step": 101515, "epoch": 2417} {"train_loss": -6.390373229980469, "global_step": 101516, "epoch": 2417} {"train_loss": -6.201357364654541, "global_step": 101517, "epoch": 2417} {"train_loss": -6.33233642578125, "global_step": 101518, "epoch": 2417} {"train_loss": -6.3387603759765625, "global_step": 101519, "epoch": 2417} {"train_loss": -6.3248138427734375, "global_step": 101520, "epoch": 2417} {"train_loss": -6.305139541625977, "global_step": 101521, "epoch": 2417} {"train_loss": -6.260892868041992, "global_step": 101522, "epoch": 2417} {"train_loss": -6.277520179748535, "global_step": 101523, "epoch": 2417} {"train_loss": -6.397618293762207, "global_step": 101524, "epoch": 2417} {"train_loss": -6.383289337158203, "global_step": 101525, "epoch": 2417} {"train_loss": -6.277735710144043, "global_step": 101526, "epoch": 2417} {"train_loss": -6.428836822509766, "global_step": 101527, "epoch": 2417} {"train_loss": -6.339935302734375, "global_step": 101528, "epoch": 2417} {"train_loss": -6.189178466796875, "global_step": 101529, "epoch": 2417} {"train_loss": -6.3876824378967285, "global_step": 101530, "epoch": 2417} {"train_loss": -6.172734260559082, "global_step": 101531, "epoch": 2417} {"train_loss": -6.427751541137695, "global_step": 101532, "epoch": 2417} {"train_loss": -6.260796546936035, "global_step": 101533, "epoch": 2417} {"train_loss": -6.400820732116699, "global_step": 101534, "epoch": 2417} {"train_loss": -6.195240020751953, "global_step": 101535, "epoch": 2417} {"train_loss": -6.1957926750183105, "global_step": 101536, "epoch": 2417} {"train_loss": -6.389001846313477, "global_step": 101537, "epoch": 2417} {"train_loss": -6.240518569946289, "global_step": 101538, "epoch": 2417} {"train_loss": -6.3462300300598145, "global_step": 101539, "epoch": 2417} {"train_loss": -6.273110389709473, "global_step": 101540, "epoch": 2417} {"train_loss": -6.299897193908691, "global_step": 101541, "epoch": 2417} {"train_loss": -6.2310590744018555, "global_step": 101542, "epoch": 2417} {"train_loss": -6.244500160217285, "global_step": 101543, "epoch": 2417} {"train_loss": -6.219005584716797, "global_step": 101544, "epoch": 2417} {"train_loss": -6.374265193939209, "global_step": 101545, "epoch": 2417} {"train_loss": -6.252111434936523, "global_step": 101546, "epoch": 2417} {"train_loss": -6.393331527709961, "global_step": 101547, "epoch": 2417} {"train_loss": -6.288180828094482, "global_step": 101548, "epoch": 2417} {"train_loss": -6.33515739440918, "global_step": 101549, "epoch": 2417} {"train_loss": -6.325165748596191, "global_step": 101550, "epoch": 2417} {"train_loss": -6.3356781005859375, "global_step": 101551, "epoch": 2417} {"train_loss": -6.444768905639648, "global_step": 101552, "epoch": 2417} {"train_loss": -6.32930850982666, "global_step": 101553, "epoch": 2417} {"train_loss": -6.302803993225098, "global_step": 101554, "epoch": 2417} {"train_loss": -6.311194442567372, "global_step": 101555, "epoch": 2417, "val_loss": 67984.6875} {"train_loss": -6.412478923797607, "global_step": 101556, "epoch": 2418} {"train_loss": -6.372883319854736, "global_step": 101557, "epoch": 2418} {"train_loss": -6.284719467163086, "global_step": 101558, "epoch": 2418} {"train_loss": -6.361021518707275, "global_step": 101559, "epoch": 2418} {"train_loss": -6.287988662719727, "global_step": 101560, "epoch": 2418} {"train_loss": -6.323995590209961, "global_step": 101561, "epoch": 2418} {"train_loss": -6.351591110229492, "global_step": 101562, "epoch": 2418} {"train_loss": -6.469656944274902, "global_step": 101563, "epoch": 2418} {"train_loss": -6.34884786605835, "global_step": 101564, "epoch": 2418} {"train_loss": -6.373429775238037, "global_step": 101565, "epoch": 2418} {"train_loss": -6.454413890838623, "global_step": 101566, "epoch": 2418} {"train_loss": -6.424027919769287, "global_step": 101567, "epoch": 2418} {"train_loss": -6.315020561218262, "global_step": 101568, "epoch": 2418} {"train_loss": -6.350661277770996, "global_step": 101569, "epoch": 2418} {"train_loss": -6.3080949783325195, "global_step": 101570, "epoch": 2418} {"train_loss": -6.227473735809326, "global_step": 101571, "epoch": 2418} {"train_loss": -6.3196563720703125, "global_step": 101572, "epoch": 2418} {"train_loss": -6.358861923217773, "global_step": 101573, "epoch": 2418} {"train_loss": -6.320065498352051, "global_step": 101574, "epoch": 2418} {"train_loss": -6.238234996795654, "global_step": 101575, "epoch": 2418} {"train_loss": -6.421593189239502, "global_step": 101576, "epoch": 2418} {"train_loss": -6.377108573913574, "global_step": 101577, "epoch": 2418} {"train_loss": -6.377553939819336, "global_step": 101578, "epoch": 2418} {"train_loss": -6.370612144470215, "global_step": 101579, "epoch": 2418} {"train_loss": -6.262208461761475, "global_step": 101580, "epoch": 2418} {"train_loss": -6.240476131439209, "global_step": 101581, "epoch": 2418} {"train_loss": -6.353464603424072, "global_step": 101582, "epoch": 2418} {"train_loss": -6.436135768890381, "global_step": 101583, "epoch": 2418} {"train_loss": -6.379216194152832, "global_step": 101584, "epoch": 2418} {"train_loss": -6.225910186767578, "global_step": 101585, "epoch": 2418} {"train_loss": -6.400408744812012, "global_step": 101586, "epoch": 2418} {"train_loss": -6.299261093139648, "global_step": 101587, "epoch": 2418} {"train_loss": -6.396719932556152, "global_step": 101588, "epoch": 2418} {"train_loss": -6.332848072052002, "global_step": 101589, "epoch": 2418} {"train_loss": -6.22211217880249, "global_step": 101590, "epoch": 2418} {"train_loss": -6.355224609375, "global_step": 101591, "epoch": 2418} {"train_loss": -6.3862433433532715, "global_step": 101592, "epoch": 2418} {"train_loss": -6.3607587814331055, "global_step": 101593, "epoch": 2418} {"train_loss": -6.464312553405762, "global_step": 101594, "epoch": 2418} {"train_loss": -6.359494686126709, "global_step": 101595, "epoch": 2418} {"train_loss": -6.368935585021973, "global_step": 101596, "epoch": 2418} {"train_loss": -6.348317350660052, "global_step": 101597, "epoch": 2418, "val_loss": 67809.5390625} {"train_loss": -6.401135444641113, "global_step": 101598, "epoch": 2419} {"train_loss": -6.416130065917969, "global_step": 101599, "epoch": 2419} {"train_loss": -6.434505939483643, "global_step": 101600, "epoch": 2419} {"train_loss": -6.380722999572754, "global_step": 101601, "epoch": 2419} {"train_loss": -6.408777236938477, "global_step": 101602, "epoch": 2419} {"train_loss": -6.362832069396973, "global_step": 101603, "epoch": 2419} {"train_loss": -6.449342727661133, "global_step": 101604, "epoch": 2419} {"train_loss": -6.428792953491211, "global_step": 101605, "epoch": 2419} {"train_loss": -6.22468376159668, "global_step": 101606, "epoch": 2419} {"train_loss": -6.407041072845459, "global_step": 101607, "epoch": 2419} {"train_loss": -6.374760627746582, "global_step": 101608, "epoch": 2419} {"train_loss": -6.303508758544922, "global_step": 101609, "epoch": 2419} {"train_loss": -6.3406524658203125, "global_step": 101610, "epoch": 2419} {"train_loss": -6.357450485229492, "global_step": 101611, "epoch": 2419} {"train_loss": -6.18447732925415, "global_step": 101612, "epoch": 2419} {"train_loss": -6.287115097045898, "global_step": 101613, "epoch": 2419} {"train_loss": -6.367374420166016, "global_step": 101614, "epoch": 2419} {"train_loss": -6.354776382446289, "global_step": 101615, "epoch": 2419} {"train_loss": -6.3335185050964355, "global_step": 101616, "epoch": 2419} {"train_loss": -6.253023624420166, "global_step": 101617, "epoch": 2419} {"train_loss": -6.167962074279785, "global_step": 101618, "epoch": 2419} {"train_loss": -6.368464469909668, "global_step": 101619, "epoch": 2419} {"train_loss": -6.264840602874756, "global_step": 101620, "epoch": 2419} {"train_loss": -6.307170867919922, "global_step": 101621, "epoch": 2419} {"train_loss": -6.452201843261719, "global_step": 101622, "epoch": 2419} {"train_loss": -6.252674102783203, "global_step": 101623, "epoch": 2419} {"train_loss": -6.264256954193115, "global_step": 101624, "epoch": 2419} {"train_loss": -6.291598796844482, "global_step": 101625, "epoch": 2419} {"train_loss": -6.2428364753723145, "global_step": 101626, "epoch": 2419} {"train_loss": -6.223515510559082, "global_step": 101627, "epoch": 2419} {"train_loss": -6.352424621582031, "global_step": 101628, "epoch": 2419} {"train_loss": -6.362186908721924, "global_step": 101629, "epoch": 2419} {"train_loss": -6.354038715362549, "global_step": 101630, "epoch": 2419} {"train_loss": -6.264921188354492, "global_step": 101631, "epoch": 2419} {"train_loss": -6.272653579711914, "global_step": 101632, "epoch": 2419} {"train_loss": -6.370050430297852, "global_step": 101633, "epoch": 2419} {"train_loss": -6.534066677093506, "global_step": 101634, "epoch": 2419} {"train_loss": -6.299858570098877, "global_step": 101635, "epoch": 2419} {"train_loss": -6.25189733505249, "global_step": 101636, "epoch": 2419} {"train_loss": -6.424263954162598, "global_step": 101637, "epoch": 2419} {"train_loss": -6.328050136566162, "global_step": 101638, "epoch": 2419} {"train_loss": -6.3350284440176825, "global_step": 101639, "epoch": 2419, "val_loss": 67754.6484375} {"train_loss": -6.323406219482422, "global_step": 101640, "epoch": 2420} {"train_loss": -6.398369312286377, "global_step": 101641, "epoch": 2420} {"train_loss": -6.39325475692749, "global_step": 101642, "epoch": 2420} {"train_loss": -6.346874713897705, "global_step": 101643, "epoch": 2420} {"train_loss": -6.469470977783203, "global_step": 101644, "epoch": 2420} {"train_loss": -6.308189392089844, "global_step": 101645, "epoch": 2420} {"train_loss": -6.265621662139893, "global_step": 101646, "epoch": 2420} {"train_loss": -6.255074501037598, "global_step": 101647, "epoch": 2420} {"train_loss": -6.458020210266113, "global_step": 101648, "epoch": 2420} {"train_loss": -6.3660569190979, "global_step": 101649, "epoch": 2420} {"train_loss": -6.181236743927002, "global_step": 101650, "epoch": 2420} {"train_loss": -6.189077854156494, "global_step": 101651, "epoch": 2420} {"train_loss": -6.280879020690918, "global_step": 101652, "epoch": 2420} {"train_loss": -6.316688537597656, "global_step": 101653, "epoch": 2420} {"train_loss": -6.268800735473633, "global_step": 101654, "epoch": 2420} {"train_loss": -6.457435607910156, "global_step": 101655, "epoch": 2420} {"train_loss": -6.3358049392700195, "global_step": 101656, "epoch": 2420} {"train_loss": -6.161001682281494, "global_step": 101657, "epoch": 2420} {"train_loss": -6.165579795837402, "global_step": 101658, "epoch": 2420} {"train_loss": -6.227662086486816, "global_step": 101659, "epoch": 2420} {"train_loss": -6.2156243324279785, "global_step": 101660, "epoch": 2420} {"train_loss": -6.3536224365234375, "global_step": 101661, "epoch": 2420} {"train_loss": -6.330133438110352, "global_step": 101662, "epoch": 2420} {"train_loss": -6.1197710037231445, "global_step": 101663, "epoch": 2420} {"train_loss": -6.372481346130371, "global_step": 101664, "epoch": 2420} {"train_loss": -6.358859062194824, "global_step": 101665, "epoch": 2420} {"train_loss": -6.45003604888916, "global_step": 101666, "epoch": 2420} {"train_loss": -6.285573482513428, "global_step": 101667, "epoch": 2420} {"train_loss": -6.362889766693115, "global_step": 101668, "epoch": 2420} {"train_loss": -6.471068859100342, "global_step": 101669, "epoch": 2420} {"train_loss": -6.338928699493408, "global_step": 101670, "epoch": 2420} {"train_loss": -6.305511951446533, "global_step": 101671, "epoch": 2420} {"train_loss": -6.293600082397461, "global_step": 101672, "epoch": 2420} {"train_loss": -6.395745277404785, "global_step": 101673, "epoch": 2420} {"train_loss": -6.181853294372559, "global_step": 101674, "epoch": 2420} {"train_loss": -6.444824695587158, "global_step": 101675, "epoch": 2420} {"train_loss": -6.369040012359619, "global_step": 101676, "epoch": 2420} {"train_loss": -6.338069438934326, "global_step": 101677, "epoch": 2420} {"train_loss": -6.352725982666016, "global_step": 101678, "epoch": 2420} {"train_loss": -6.330155849456787, "global_step": 101679, "epoch": 2420} {"train_loss": -6.480241775512695, "global_step": 101680, "epoch": 2420} {"train_loss": -6.326521385283697, "global_step": 101681, "epoch": 2420, "val_loss": 67802.515625} {"train_loss": -6.344738483428955, "global_step": 101682, "epoch": 2421} {"train_loss": -6.330619812011719, "global_step": 101683, "epoch": 2421} {"train_loss": -6.434552192687988, "global_step": 101684, "epoch": 2421} {"train_loss": -6.343661308288574, "global_step": 101685, "epoch": 2421} {"train_loss": -6.375258445739746, "global_step": 101686, "epoch": 2421} {"train_loss": -6.317779541015625, "global_step": 101687, "epoch": 2421} {"train_loss": -6.289583206176758, "global_step": 101688, "epoch": 2421} {"train_loss": -6.386228084564209, "global_step": 101689, "epoch": 2421} {"train_loss": -6.361892223358154, "global_step": 101690, "epoch": 2421} {"train_loss": -6.237457275390625, "global_step": 101691, "epoch": 2421} {"train_loss": -6.264801979064941, "global_step": 101692, "epoch": 2421} {"train_loss": -6.390500545501709, "global_step": 101693, "epoch": 2421} {"train_loss": -6.233963489532471, "global_step": 101694, "epoch": 2421} {"train_loss": -6.369245529174805, "global_step": 101695, "epoch": 2421} {"train_loss": -6.24444580078125, "global_step": 101696, "epoch": 2421} {"train_loss": -6.295957565307617, "global_step": 101697, "epoch": 2421} {"train_loss": -6.3618621826171875, "global_step": 101698, "epoch": 2421} {"train_loss": -6.391671180725098, "global_step": 101699, "epoch": 2421} {"train_loss": -6.404289722442627, "global_step": 101700, "epoch": 2421} {"train_loss": -6.354363441467285, "global_step": 101701, "epoch": 2421} {"train_loss": -6.445466995239258, "global_step": 101702, "epoch": 2421} {"train_loss": -6.250316619873047, "global_step": 101703, "epoch": 2421} {"train_loss": -6.266368865966797, "global_step": 101704, "epoch": 2421} {"train_loss": -6.408802509307861, "global_step": 101705, "epoch": 2421} {"train_loss": -6.292191982269287, "global_step": 101706, "epoch": 2421} {"train_loss": -6.346854209899902, "global_step": 101707, "epoch": 2421} {"train_loss": -6.3276848793029785, "global_step": 101708, "epoch": 2421} {"train_loss": -6.222716331481934, "global_step": 101709, "epoch": 2421} {"train_loss": -6.357785224914551, "global_step": 101710, "epoch": 2421} {"train_loss": -6.239707946777344, "global_step": 101711, "epoch": 2421} {"train_loss": -6.285175323486328, "global_step": 101712, "epoch": 2421} {"train_loss": -6.400619029998779, "global_step": 101713, "epoch": 2421} {"train_loss": -6.386727333068848, "global_step": 101714, "epoch": 2421} {"train_loss": -6.281057834625244, "global_step": 101715, "epoch": 2421} {"train_loss": -6.30218505859375, "global_step": 101716, "epoch": 2421} {"train_loss": -6.375651836395264, "global_step": 101717, "epoch": 2421} {"train_loss": -6.39808988571167, "global_step": 101718, "epoch": 2421} {"train_loss": -6.498595237731934, "global_step": 101719, "epoch": 2421} {"train_loss": -6.460205078125, "global_step": 101720, "epoch": 2421} {"train_loss": -6.433506488800049, "global_step": 101721, "epoch": 2421} {"train_loss": -6.2850871086120605, "global_step": 101722, "epoch": 2421} {"train_loss": -6.343444177082607, "global_step": 101723, "epoch": 2421, "val_loss": 68000.421875} {"train_loss": -6.526739120483398, "global_step": 101724, "epoch": 2422} {"train_loss": -6.391432762145996, "global_step": 101725, "epoch": 2422} {"train_loss": -6.296017646789551, "global_step": 101726, "epoch": 2422} {"train_loss": -6.434722423553467, "global_step": 101727, "epoch": 2422} {"train_loss": -6.36751651763916, "global_step": 101728, "epoch": 2422} {"train_loss": -6.3984479904174805, "global_step": 101729, "epoch": 2422} {"train_loss": -6.294031620025635, "global_step": 101730, "epoch": 2422} {"train_loss": -6.360189914703369, "global_step": 101731, "epoch": 2422} {"train_loss": -6.326894760131836, "global_step": 101732, "epoch": 2422} {"train_loss": -6.339027404785156, "global_step": 101733, "epoch": 2422} {"train_loss": -6.257181167602539, "global_step": 101734, "epoch": 2422} {"train_loss": -6.337414264678955, "global_step": 101735, "epoch": 2422} {"train_loss": -6.329659461975098, "global_step": 101736, "epoch": 2422} {"train_loss": -6.364633560180664, "global_step": 101737, "epoch": 2422} {"train_loss": -6.296224594116211, "global_step": 101738, "epoch": 2422} {"train_loss": -6.4233078956604, "global_step": 101739, "epoch": 2422} {"train_loss": -6.387446880340576, "global_step": 101740, "epoch": 2422} {"train_loss": -6.318772315979004, "global_step": 101741, "epoch": 2422} {"train_loss": -6.217106342315674, "global_step": 101742, "epoch": 2422} {"train_loss": -6.380344390869141, "global_step": 101743, "epoch": 2422} {"train_loss": -6.267147064208984, "global_step": 101744, "epoch": 2422} {"train_loss": -6.328091144561768, "global_step": 101745, "epoch": 2422} {"train_loss": -6.339020729064941, "global_step": 101746, "epoch": 2422} {"train_loss": -6.337265491485596, "global_step": 101747, "epoch": 2422} {"train_loss": -6.40043306350708, "global_step": 101748, "epoch": 2422} {"train_loss": -6.369574546813965, "global_step": 101749, "epoch": 2422} {"train_loss": -6.368083477020264, "global_step": 101750, "epoch": 2422} {"train_loss": -6.448742866516113, "global_step": 101751, "epoch": 2422} {"train_loss": -6.356417655944824, "global_step": 101752, "epoch": 2422} {"train_loss": -6.517324924468994, "global_step": 101753, "epoch": 2422} {"train_loss": -6.429464340209961, "global_step": 101754, "epoch": 2422} {"train_loss": -6.285515785217285, "global_step": 101755, "epoch": 2422} {"train_loss": -6.336273193359375, "global_step": 101756, "epoch": 2422} {"train_loss": -6.380158424377441, "global_step": 101757, "epoch": 2422} {"train_loss": -6.313651084899902, "global_step": 101758, "epoch": 2422} {"train_loss": -6.439003944396973, "global_step": 101759, "epoch": 2422} {"train_loss": -6.4136643409729, "global_step": 101760, "epoch": 2422} {"train_loss": -6.3561110496521, "global_step": 101761, "epoch": 2422} {"train_loss": -6.530242443084717, "global_step": 101762, "epoch": 2422} {"train_loss": -6.372472763061523, "global_step": 101763, "epoch": 2422} {"train_loss": -6.378506660461426, "global_step": 101764, "epoch": 2422} {"train_loss": -6.367316007614136, "global_step": 101765, "epoch": 2422, "val_loss": 67779.625} {"train_loss": -6.471305847167969, "global_step": 101766, "epoch": 2423} {"train_loss": -6.406898498535156, "global_step": 101767, "epoch": 2423} {"train_loss": -6.417686462402344, "global_step": 101768, "epoch": 2423} {"train_loss": -6.306758880615234, "global_step": 101769, "epoch": 2423} {"train_loss": -6.273301601409912, "global_step": 101770, "epoch": 2423} {"train_loss": -6.310842037200928, "global_step": 101771, "epoch": 2423} {"train_loss": -6.505722999572754, "global_step": 101772, "epoch": 2423} {"train_loss": -6.298337936401367, "global_step": 101773, "epoch": 2423} {"train_loss": -6.413398742675781, "global_step": 101774, "epoch": 2423} {"train_loss": -6.356203556060791, "global_step": 101775, "epoch": 2423} {"train_loss": -6.299253463745117, "global_step": 101776, "epoch": 2423} {"train_loss": -6.443822383880615, "global_step": 101777, "epoch": 2423} {"train_loss": -6.368553161621094, "global_step": 101778, "epoch": 2423} {"train_loss": -6.3474578857421875, "global_step": 101779, "epoch": 2423} {"train_loss": -6.365788459777832, "global_step": 101780, "epoch": 2423} {"train_loss": -6.2834367752075195, "global_step": 101781, "epoch": 2423} {"train_loss": -6.471797943115234, "global_step": 101782, "epoch": 2423} {"train_loss": -6.4750518798828125, "global_step": 101783, "epoch": 2423} {"train_loss": -6.236153602600098, "global_step": 101784, "epoch": 2423} {"train_loss": -6.440351963043213, "global_step": 101785, "epoch": 2423} {"train_loss": -6.469229221343994, "global_step": 101786, "epoch": 2423} {"train_loss": -6.340904235839844, "global_step": 101787, "epoch": 2423} {"train_loss": -6.391473293304443, "global_step": 101788, "epoch": 2423} {"train_loss": -6.426290512084961, "global_step": 101789, "epoch": 2423} {"train_loss": -6.467796802520752, "global_step": 101790, "epoch": 2423} {"train_loss": -6.362855434417725, "global_step": 101791, "epoch": 2423} {"train_loss": -6.382342338562012, "global_step": 101792, "epoch": 2423} {"train_loss": -6.465414524078369, "global_step": 101793, "epoch": 2423} {"train_loss": -6.441484451293945, "global_step": 101794, "epoch": 2423} {"train_loss": -6.283553123474121, "global_step": 101795, "epoch": 2423} {"train_loss": -6.452070236206055, "global_step": 101796, "epoch": 2423} {"train_loss": -6.366695404052734, "global_step": 101797, "epoch": 2423} {"train_loss": -6.418064117431641, "global_step": 101798, "epoch": 2423} {"train_loss": -6.293972492218018, "global_step": 101799, "epoch": 2423} {"train_loss": -6.303763389587402, "global_step": 101800, "epoch": 2423} {"train_loss": -6.288460731506348, "global_step": 101801, "epoch": 2423} {"train_loss": -6.331906318664551, "global_step": 101802, "epoch": 2423} {"train_loss": -6.4517035484313965, "global_step": 101803, "epoch": 2423} {"train_loss": -6.3803791999816895, "global_step": 101804, "epoch": 2423} {"train_loss": -6.377902030944824, "global_step": 101805, "epoch": 2423} {"train_loss": -6.345740795135498, "global_step": 101806, "epoch": 2423} {"train_loss": -6.380486352103097, "global_step": 101807, "epoch": 2423, "val_loss": 67957.5859375} {"train_loss": -6.433352470397949, "global_step": 101808, "epoch": 2424} {"train_loss": -6.351358413696289, "global_step": 101809, "epoch": 2424} {"train_loss": -6.4361653327941895, "global_step": 101810, "epoch": 2424} {"train_loss": -6.29523229598999, "global_step": 101811, "epoch": 2424} {"train_loss": -6.415377616882324, "global_step": 101812, "epoch": 2424} {"train_loss": -6.328118801116943, "global_step": 101813, "epoch": 2424} {"train_loss": -6.359471797943115, "global_step": 101814, "epoch": 2424} {"train_loss": -6.410571575164795, "global_step": 101815, "epoch": 2424} {"train_loss": -6.494292259216309, "global_step": 101816, "epoch": 2424} {"train_loss": -6.317753791809082, "global_step": 101817, "epoch": 2424} {"train_loss": -6.3256425857543945, "global_step": 101818, "epoch": 2424} {"train_loss": -6.468107223510742, "global_step": 101819, "epoch": 2424} {"train_loss": -6.313799858093262, "global_step": 101820, "epoch": 2424} {"train_loss": -6.312447547912598, "global_step": 101821, "epoch": 2424} {"train_loss": -6.369892120361328, "global_step": 101822, "epoch": 2424} {"train_loss": -6.2644500732421875, "global_step": 101823, "epoch": 2424} {"train_loss": -6.322484016418457, "global_step": 101824, "epoch": 2424} {"train_loss": -6.364031791687012, "global_step": 101825, "epoch": 2424} {"train_loss": -6.17874813079834, "global_step": 101826, "epoch": 2424} {"train_loss": -6.337551593780518, "global_step": 101827, "epoch": 2424} {"train_loss": -6.276918888092041, "global_step": 101828, "epoch": 2424} {"train_loss": -6.275404930114746, "global_step": 101829, "epoch": 2424} {"train_loss": -6.380124568939209, "global_step": 101830, "epoch": 2424} {"train_loss": -6.230960845947266, "global_step": 101831, "epoch": 2424} {"train_loss": -6.378223419189453, "global_step": 101832, "epoch": 2424} {"train_loss": -6.37178897857666, "global_step": 101833, "epoch": 2424} {"train_loss": -6.220086097717285, "global_step": 101834, "epoch": 2424} {"train_loss": -6.307905673980713, "global_step": 101835, "epoch": 2424} {"train_loss": -6.3063812255859375, "global_step": 101836, "epoch": 2424} {"train_loss": -6.301063060760498, "global_step": 101837, "epoch": 2424} {"train_loss": -6.178360939025879, "global_step": 101838, "epoch": 2424} {"train_loss": -6.3361663818359375, "global_step": 101839, "epoch": 2424} {"train_loss": -6.247214317321777, "global_step": 101840, "epoch": 2424} {"train_loss": -6.262009620666504, "global_step": 101841, "epoch": 2424} {"train_loss": -6.422482967376709, "global_step": 101842, "epoch": 2424} {"train_loss": -6.266989707946777, "global_step": 101843, "epoch": 2424} {"train_loss": -6.341471195220947, "global_step": 101844, "epoch": 2424} {"train_loss": -6.238917350769043, "global_step": 101845, "epoch": 2424} {"train_loss": -6.361722946166992, "global_step": 101846, "epoch": 2424} {"train_loss": -6.311023712158203, "global_step": 101847, "epoch": 2424} {"train_loss": -6.39617919921875, "global_step": 101848, "epoch": 2424} {"train_loss": -6.3280710606347945, "global_step": 101849, "epoch": 2424, "val_loss": 67906.0859375} {"train_loss": -6.187483787536621, "global_step": 101850, "epoch": 2425} {"train_loss": -6.336546421051025, "global_step": 101851, "epoch": 2425} {"train_loss": -6.487746238708496, "global_step": 101852, "epoch": 2425} {"train_loss": -6.310973167419434, "global_step": 101853, "epoch": 2425} {"train_loss": -6.314268112182617, "global_step": 101854, "epoch": 2425} {"train_loss": -6.390277862548828, "global_step": 101855, "epoch": 2425} {"train_loss": -6.4397501945495605, "global_step": 101856, "epoch": 2425} {"train_loss": -6.303747177124023, "global_step": 101857, "epoch": 2425} {"train_loss": -6.317073345184326, "global_step": 101858, "epoch": 2425} {"train_loss": -6.471946716308594, "global_step": 101859, "epoch": 2425} {"train_loss": -6.312555313110352, "global_step": 101860, "epoch": 2425} {"train_loss": -6.273841857910156, "global_step": 101861, "epoch": 2425} {"train_loss": -6.432896137237549, "global_step": 101862, "epoch": 2425} {"train_loss": -6.403318881988525, "global_step": 101863, "epoch": 2425} {"train_loss": -6.420011520385742, "global_step": 101864, "epoch": 2425} {"train_loss": -6.360228538513184, "global_step": 101865, "epoch": 2425} {"train_loss": -6.395354747772217, "global_step": 101866, "epoch": 2425} {"train_loss": -6.296443939208984, "global_step": 101867, "epoch": 2425} {"train_loss": -6.322609901428223, "global_step": 101868, "epoch": 2425} {"train_loss": -6.333156585693359, "global_step": 101869, "epoch": 2425} {"train_loss": -6.302000045776367, "global_step": 101870, "epoch": 2425} {"train_loss": -6.322083473205566, "global_step": 101871, "epoch": 2425} {"train_loss": -6.459804534912109, "global_step": 101872, "epoch": 2425} {"train_loss": -6.258725166320801, "global_step": 101873, "epoch": 2425} {"train_loss": -6.446712493896484, "global_step": 101874, "epoch": 2425} {"train_loss": -6.308452606201172, "global_step": 101875, "epoch": 2425} {"train_loss": -6.352100849151611, "global_step": 101876, "epoch": 2425} {"train_loss": -6.346085071563721, "global_step": 101877, "epoch": 2425} {"train_loss": -6.317091941833496, "global_step": 101878, "epoch": 2425} {"train_loss": -6.335696220397949, "global_step": 101879, "epoch": 2425} {"train_loss": -6.3735456466674805, "global_step": 101880, "epoch": 2425} {"train_loss": -6.3582682609558105, "global_step": 101881, "epoch": 2425} {"train_loss": -6.344857215881348, "global_step": 101882, "epoch": 2425} {"train_loss": -6.259088516235352, "global_step": 101883, "epoch": 2425} {"train_loss": -6.263236999511719, "global_step": 101884, "epoch": 2425} {"train_loss": -6.368827819824219, "global_step": 101885, "epoch": 2425} {"train_loss": -6.3694562911987305, "global_step": 101886, "epoch": 2425} {"train_loss": -6.346796989440918, "global_step": 101887, "epoch": 2425} {"train_loss": -6.317691802978516, "global_step": 101888, "epoch": 2425} {"train_loss": -6.495743751525879, "global_step": 101889, "epoch": 2425} {"train_loss": -6.374642848968506, "global_step": 101890, "epoch": 2425} {"train_loss": -6.3518165066128685, "global_step": 101891, "epoch": 2425, "val_loss": 67791.9140625} {"train_loss": -6.307705879211426, "global_step": 101892, "epoch": 2426} {"train_loss": -6.385108947753906, "global_step": 101893, "epoch": 2426} {"train_loss": -6.361694812774658, "global_step": 101894, "epoch": 2426} {"train_loss": -6.489509582519531, "global_step": 101895, "epoch": 2426} {"train_loss": -6.464146614074707, "global_step": 101896, "epoch": 2426} {"train_loss": -6.282872200012207, "global_step": 101897, "epoch": 2426} {"train_loss": -6.325680732727051, "global_step": 101898, "epoch": 2426} {"train_loss": -6.444257736206055, "global_step": 101899, "epoch": 2426} {"train_loss": -6.370579719543457, "global_step": 101900, "epoch": 2426} {"train_loss": -6.306221961975098, "global_step": 101901, "epoch": 2426} {"train_loss": -6.259594917297363, "global_step": 101902, "epoch": 2426} {"train_loss": -6.275617599487305, "global_step": 101903, "epoch": 2426} {"train_loss": -6.385373115539551, "global_step": 101904, "epoch": 2426} {"train_loss": -6.312256813049316, "global_step": 101905, "epoch": 2426} {"train_loss": -6.384054660797119, "global_step": 101906, "epoch": 2426} {"train_loss": -6.343613624572754, "global_step": 101907, "epoch": 2426} {"train_loss": -6.333469390869141, "global_step": 101908, "epoch": 2426} {"train_loss": -6.408528804779053, "global_step": 101909, "epoch": 2426} {"train_loss": -6.362177848815918, "global_step": 101910, "epoch": 2426} {"train_loss": -6.282052040100098, "global_step": 101911, "epoch": 2426} {"train_loss": -6.388829231262207, "global_step": 101912, "epoch": 2426} {"train_loss": -6.418732643127441, "global_step": 101913, "epoch": 2426} {"train_loss": -6.3781538009643555, "global_step": 101914, "epoch": 2426} {"train_loss": -6.376208782196045, "global_step": 101915, "epoch": 2426} {"train_loss": -6.47039794921875, "global_step": 101916, "epoch": 2426} {"train_loss": -6.384786605834961, "global_step": 101917, "epoch": 2426} {"train_loss": -6.322279453277588, "global_step": 101918, "epoch": 2426} {"train_loss": -6.35427188873291, "global_step": 101919, "epoch": 2426} {"train_loss": -6.412384986877441, "global_step": 101920, "epoch": 2426} {"train_loss": -6.411614894866943, "global_step": 101921, "epoch": 2426} {"train_loss": -6.433978080749512, "global_step": 101922, "epoch": 2426} {"train_loss": -6.336361408233643, "global_step": 101923, "epoch": 2426} {"train_loss": -6.294305801391602, "global_step": 101924, "epoch": 2426} {"train_loss": -6.397231578826904, "global_step": 101925, "epoch": 2426} {"train_loss": -6.358542442321777, "global_step": 101926, "epoch": 2426} {"train_loss": -6.380781173706055, "global_step": 101927, "epoch": 2426} {"train_loss": -6.3455119132995605, "global_step": 101928, "epoch": 2426} {"train_loss": -6.4000444412231445, "global_step": 101929, "epoch": 2426} {"train_loss": -6.270652770996094, "global_step": 101930, "epoch": 2426} {"train_loss": -6.310828685760498, "global_step": 101931, "epoch": 2426} {"train_loss": -6.334507942199707, "global_step": 101932, "epoch": 2426} {"train_loss": -6.362731729234968, "global_step": 101933, "epoch": 2426, "val_loss": 67916.171875} {"train_loss": -6.390590667724609, "global_step": 101934, "epoch": 2427} {"train_loss": -6.2846574783325195, "global_step": 101935, "epoch": 2427} {"train_loss": -6.249626159667969, "global_step": 101936, "epoch": 2427} {"train_loss": -6.284257888793945, "global_step": 101937, "epoch": 2427} {"train_loss": -6.38025426864624, "global_step": 101938, "epoch": 2427} {"train_loss": -6.261410713195801, "global_step": 101939, "epoch": 2427} {"train_loss": -6.35529088973999, "global_step": 101940, "epoch": 2427} {"train_loss": -6.469647407531738, "global_step": 101941, "epoch": 2427} {"train_loss": -6.352083683013916, "global_step": 101942, "epoch": 2427} {"train_loss": -6.410600662231445, "global_step": 101943, "epoch": 2427} {"train_loss": -6.485169410705566, "global_step": 101944, "epoch": 2427} {"train_loss": -6.3544111251831055, "global_step": 101945, "epoch": 2427} {"train_loss": -6.402118682861328, "global_step": 101946, "epoch": 2427} {"train_loss": -6.429417610168457, "global_step": 101947, "epoch": 2427} {"train_loss": -6.319781303405762, "global_step": 101948, "epoch": 2427} {"train_loss": -6.429453372955322, "global_step": 101949, "epoch": 2427} {"train_loss": -6.372199058532715, "global_step": 101950, "epoch": 2427} {"train_loss": -6.435744285583496, "global_step": 101951, "epoch": 2427} {"train_loss": -6.469179153442383, "global_step": 101952, "epoch": 2427} {"train_loss": -6.502606391906738, "global_step": 101953, "epoch": 2427} {"train_loss": -6.484797954559326, "global_step": 101954, "epoch": 2427} {"train_loss": -6.3918046951293945, "global_step": 101955, "epoch": 2427} {"train_loss": -6.399250030517578, "global_step": 101956, "epoch": 2427} {"train_loss": -6.388207912445068, "global_step": 101957, "epoch": 2427} {"train_loss": -6.289264678955078, "global_step": 101958, "epoch": 2427} {"train_loss": -6.2665486335754395, "global_step": 101959, "epoch": 2427} {"train_loss": -6.4083123207092285, "global_step": 101960, "epoch": 2427} {"train_loss": -6.367613792419434, "global_step": 101961, "epoch": 2427} {"train_loss": -6.411533355712891, "global_step": 101962, "epoch": 2427} {"train_loss": -6.476762771606445, "global_step": 101963, "epoch": 2427} {"train_loss": -6.39178466796875, "global_step": 101964, "epoch": 2427} {"train_loss": -6.367171287536621, "global_step": 101965, "epoch": 2427} {"train_loss": -6.4879865646362305, "global_step": 101966, "epoch": 2427} {"train_loss": -6.272655487060547, "global_step": 101967, "epoch": 2427} {"train_loss": -6.428450107574463, "global_step": 101968, "epoch": 2427} {"train_loss": -6.2829976081848145, "global_step": 101969, "epoch": 2427} {"train_loss": -6.314344882965088, "global_step": 101970, "epoch": 2427} {"train_loss": -6.243088245391846, "global_step": 101971, "epoch": 2427} {"train_loss": -6.292654037475586, "global_step": 101972, "epoch": 2427} {"train_loss": -6.264383316040039, "global_step": 101973, "epoch": 2427} {"train_loss": -6.341883182525635, "global_step": 101974, "epoch": 2427} {"train_loss": -6.369156564985003, "global_step": 101975, "epoch": 2427, "val_loss": 68023.1640625} {"train_loss": -6.351055145263672, "global_step": 101976, "epoch": 2428} {"train_loss": -6.370637893676758, "global_step": 101977, "epoch": 2428} {"train_loss": -6.3916168212890625, "global_step": 101978, "epoch": 2428} {"train_loss": -6.250374794006348, "global_step": 101979, "epoch": 2428} {"train_loss": -6.341128349304199, "global_step": 101980, "epoch": 2428} {"train_loss": -6.401050090789795, "global_step": 101981, "epoch": 2428} {"train_loss": -6.228577613830566, "global_step": 101982, "epoch": 2428} {"train_loss": -6.417272567749023, "global_step": 101983, "epoch": 2428} {"train_loss": -6.241393566131592, "global_step": 101984, "epoch": 2428} {"train_loss": -6.286606788635254, "global_step": 101985, "epoch": 2428} {"train_loss": -6.4115777015686035, "global_step": 101986, "epoch": 2428} {"train_loss": -6.273886680603027, "global_step": 101987, "epoch": 2428} {"train_loss": -6.36052942276001, "global_step": 101988, "epoch": 2428} {"train_loss": -6.271020889282227, "global_step": 101989, "epoch": 2428} {"train_loss": -6.287928581237793, "global_step": 101990, "epoch": 2428} {"train_loss": -6.34144401550293, "global_step": 101991, "epoch": 2428} {"train_loss": -6.26307487487793, "global_step": 101992, "epoch": 2428} {"train_loss": -6.416804790496826, "global_step": 101993, "epoch": 2428} {"train_loss": -6.2911176681518555, "global_step": 101994, "epoch": 2428} {"train_loss": -6.321347236633301, "global_step": 101995, "epoch": 2428} {"train_loss": -6.363811492919922, "global_step": 101996, "epoch": 2428} {"train_loss": -6.331551551818848, "global_step": 101997, "epoch": 2428} {"train_loss": -6.327909469604492, "global_step": 101998, "epoch": 2428} {"train_loss": -6.179440975189209, "global_step": 101999, "epoch": 2428} {"train_loss": -6.441934585571289, "global_step": 102000, "epoch": 2428} {"train_loss": -6.353297233581543, "global_step": 102001, "epoch": 2428} {"train_loss": -6.3452277183532715, "global_step": 102002, "epoch": 2428} {"train_loss": -6.317660331726074, "global_step": 102003, "epoch": 2428} {"train_loss": -6.232058048248291, "global_step": 102004, "epoch": 2428} {"train_loss": -6.335323333740234, "global_step": 102005, "epoch": 2428} {"train_loss": -6.419188499450684, "global_step": 102006, "epoch": 2428} {"train_loss": -6.263369560241699, "global_step": 102007, "epoch": 2428} {"train_loss": -6.392533779144287, "global_step": 102008, "epoch": 2428} {"train_loss": -6.2279791831970215, "global_step": 102009, "epoch": 2428} {"train_loss": -6.348194122314453, "global_step": 102010, "epoch": 2428} {"train_loss": -6.365490913391113, "global_step": 102011, "epoch": 2428} {"train_loss": -6.339221000671387, "global_step": 102012, "epoch": 2428} {"train_loss": -6.320503234863281, "global_step": 102013, "epoch": 2428} {"train_loss": -6.237831115722656, "global_step": 102014, "epoch": 2428} {"train_loss": -6.212390899658203, "global_step": 102015, "epoch": 2428} {"train_loss": -6.308103561401367, "global_step": 102016, "epoch": 2428} {"train_loss": -6.31889576003665, "global_step": 102017, "epoch": 2428, "val_loss": 67923.5078125} {"train_loss": -6.306056499481201, "global_step": 102018, "epoch": 2429} {"train_loss": -6.281240463256836, "global_step": 102019, "epoch": 2429} {"train_loss": -6.282751560211182, "global_step": 102020, "epoch": 2429} {"train_loss": -6.362165451049805, "global_step": 102021, "epoch": 2429} {"train_loss": -6.289669036865234, "global_step": 102022, "epoch": 2429} {"train_loss": -6.3166913986206055, "global_step": 102023, "epoch": 2429} {"train_loss": -6.36175012588501, "global_step": 102024, "epoch": 2429} {"train_loss": -6.367506980895996, "global_step": 102025, "epoch": 2429} {"train_loss": -6.368890285491943, "global_step": 102026, "epoch": 2429} {"train_loss": -6.316804885864258, "global_step": 102027, "epoch": 2429} {"train_loss": -6.308185577392578, "global_step": 102028, "epoch": 2429} {"train_loss": -6.370723724365234, "global_step": 102029, "epoch": 2429} {"train_loss": -6.3806962966918945, "global_step": 102030, "epoch": 2429} {"train_loss": -6.371217727661133, "global_step": 102031, "epoch": 2429} {"train_loss": -6.518996715545654, "global_step": 102032, "epoch": 2429} {"train_loss": -6.351113796234131, "global_step": 102033, "epoch": 2429} {"train_loss": -6.305217742919922, "global_step": 102034, "epoch": 2429} {"train_loss": -6.419310569763184, "global_step": 102035, "epoch": 2429} {"train_loss": -6.38495397567749, "global_step": 102036, "epoch": 2429} {"train_loss": -6.394670486450195, "global_step": 102037, "epoch": 2429} {"train_loss": -6.295316696166992, "global_step": 102038, "epoch": 2429} {"train_loss": -6.391172885894775, "global_step": 102039, "epoch": 2429} {"train_loss": -6.348447799682617, "global_step": 102040, "epoch": 2429} {"train_loss": -6.307581424713135, "global_step": 102041, "epoch": 2429} {"train_loss": -6.455018520355225, "global_step": 102042, "epoch": 2429} {"train_loss": -6.360894203186035, "global_step": 102043, "epoch": 2429} {"train_loss": -6.447117805480957, "global_step": 102044, "epoch": 2429} {"train_loss": -6.4327392578125, "global_step": 102045, "epoch": 2429} {"train_loss": -6.289919853210449, "global_step": 102046, "epoch": 2429} {"train_loss": -6.414564609527588, "global_step": 102047, "epoch": 2429} {"train_loss": -6.3443732261657715, "global_step": 102048, "epoch": 2429} {"train_loss": -6.375332832336426, "global_step": 102049, "epoch": 2429} {"train_loss": -6.374434947967529, "global_step": 102050, "epoch": 2429} {"train_loss": -6.362825393676758, "global_step": 102051, "epoch": 2429} {"train_loss": -6.4392852783203125, "global_step": 102052, "epoch": 2429} {"train_loss": -6.457249641418457, "global_step": 102053, "epoch": 2429} {"train_loss": -6.254813194274902, "global_step": 102054, "epoch": 2429} {"train_loss": -6.28986930847168, "global_step": 102055, "epoch": 2429} {"train_loss": -6.285757064819336, "global_step": 102056, "epoch": 2429} {"train_loss": -6.361887454986572, "global_step": 102057, "epoch": 2429} {"train_loss": -6.3982086181640625, "global_step": 102058, "epoch": 2429} {"train_loss": -6.3585260936192105, "global_step": 102059, "epoch": 2429, "val_loss": 68215.7734375} {"train_loss": -6.332881927490234, "global_step": 102060, "epoch": 2430} {"train_loss": -6.3973307609558105, "global_step": 102061, "epoch": 2430} {"train_loss": -6.403796195983887, "global_step": 102062, "epoch": 2430} {"train_loss": -6.329218864440918, "global_step": 102063, "epoch": 2430} {"train_loss": -6.470874309539795, "global_step": 102064, "epoch": 2430} {"train_loss": -6.270997047424316, "global_step": 102065, "epoch": 2430} {"train_loss": -6.403370380401611, "global_step": 102066, "epoch": 2430} {"train_loss": -6.528250217437744, "global_step": 102067, "epoch": 2430} {"train_loss": -6.3841118812561035, "global_step": 102068, "epoch": 2430} {"train_loss": -6.387007236480713, "global_step": 102069, "epoch": 2430} {"train_loss": -6.392189025878906, "global_step": 102070, "epoch": 2430} {"train_loss": -6.389447212219238, "global_step": 102071, "epoch": 2430} {"train_loss": -6.370724678039551, "global_step": 102072, "epoch": 2430} {"train_loss": -6.357461929321289, "global_step": 102073, "epoch": 2430} {"train_loss": -6.379646301269531, "global_step": 102074, "epoch": 2430} {"train_loss": -6.374965667724609, "global_step": 102075, "epoch": 2430} {"train_loss": -6.499146938323975, "global_step": 102076, "epoch": 2430} {"train_loss": -6.4584479331970215, "global_step": 102077, "epoch": 2430} {"train_loss": -6.391319751739502, "global_step": 102078, "epoch": 2430} {"train_loss": -6.478311538696289, "global_step": 102079, "epoch": 2430} {"train_loss": -6.296563148498535, "global_step": 102080, "epoch": 2430} {"train_loss": -6.327253341674805, "global_step": 102081, "epoch": 2430} {"train_loss": -6.473365783691406, "global_step": 102082, "epoch": 2430} {"train_loss": -6.443173408508301, "global_step": 102083, "epoch": 2430} {"train_loss": -6.218070030212402, "global_step": 102084, "epoch": 2430} {"train_loss": -6.371513366699219, "global_step": 102085, "epoch": 2430} {"train_loss": -6.345357894897461, "global_step": 102086, "epoch": 2430} {"train_loss": -6.26231050491333, "global_step": 102087, "epoch": 2430} {"train_loss": -6.3330559730529785, "global_step": 102088, "epoch": 2430} {"train_loss": -6.348381519317627, "global_step": 102089, "epoch": 2430} {"train_loss": -6.273711204528809, "global_step": 102090, "epoch": 2430} {"train_loss": -6.245395183563232, "global_step": 102091, "epoch": 2430} {"train_loss": -6.489629745483398, "global_step": 102092, "epoch": 2430} {"train_loss": -6.412206649780273, "global_step": 102093, "epoch": 2430} {"train_loss": -6.429977893829346, "global_step": 102094, "epoch": 2430} {"train_loss": -6.40354585647583, "global_step": 102095, "epoch": 2430} {"train_loss": -6.287121772766113, "global_step": 102096, "epoch": 2430} {"train_loss": -6.309436798095703, "global_step": 102097, "epoch": 2430} {"train_loss": -6.318576812744141, "global_step": 102098, "epoch": 2430} {"train_loss": -6.222601413726807, "global_step": 102099, "epoch": 2430} {"train_loss": -6.373597621917725, "global_step": 102100, "epoch": 2430} {"train_loss": -6.3700938905988425, "global_step": 102101, "epoch": 2430, "val_loss": 68205.8515625} {"train_loss": -6.221882343292236, "global_step": 102102, "epoch": 2431} {"train_loss": -6.39051628112793, "global_step": 102103, "epoch": 2431} {"train_loss": -6.304217338562012, "global_step": 102104, "epoch": 2431} {"train_loss": -6.234527587890625, "global_step": 102105, "epoch": 2431} {"train_loss": -6.446681022644043, "global_step": 102106, "epoch": 2431} {"train_loss": -6.395595073699951, "global_step": 102107, "epoch": 2431} {"train_loss": -6.268913269042969, "global_step": 102108, "epoch": 2431} {"train_loss": -6.333097457885742, "global_step": 102109, "epoch": 2431} {"train_loss": -6.3492255210876465, "global_step": 102110, "epoch": 2431} {"train_loss": -6.263545036315918, "global_step": 102111, "epoch": 2431} {"train_loss": -6.4051618576049805, "global_step": 102112, "epoch": 2431} {"train_loss": -6.171661853790283, "global_step": 102113, "epoch": 2431} {"train_loss": -6.405620574951172, "global_step": 102114, "epoch": 2431} {"train_loss": -6.173084259033203, "global_step": 102115, "epoch": 2431} {"train_loss": -6.447251319885254, "global_step": 102116, "epoch": 2431} {"train_loss": -6.405906677246094, "global_step": 102117, "epoch": 2431} {"train_loss": -6.380897045135498, "global_step": 102118, "epoch": 2431} {"train_loss": -6.325559616088867, "global_step": 102119, "epoch": 2431} {"train_loss": -6.367457389831543, "global_step": 102120, "epoch": 2431} {"train_loss": -6.307671070098877, "global_step": 102121, "epoch": 2431} {"train_loss": -6.344140529632568, "global_step": 102122, "epoch": 2431} {"train_loss": -6.383011817932129, "global_step": 102123, "epoch": 2431} {"train_loss": -6.296661376953125, "global_step": 102124, "epoch": 2431} {"train_loss": -6.273673057556152, "global_step": 102125, "epoch": 2431} {"train_loss": -6.343080520629883, "global_step": 102126, "epoch": 2431} {"train_loss": -6.443566799163818, "global_step": 102127, "epoch": 2431} {"train_loss": -6.282951354980469, "global_step": 102128, "epoch": 2431} {"train_loss": -6.397103309631348, "global_step": 102129, "epoch": 2431} {"train_loss": -6.285654544830322, "global_step": 102130, "epoch": 2431} {"train_loss": -6.321070194244385, "global_step": 102131, "epoch": 2431} {"train_loss": -6.282684326171875, "global_step": 102132, "epoch": 2431} {"train_loss": -6.5038347244262695, "global_step": 102133, "epoch": 2431} {"train_loss": -6.353135108947754, "global_step": 102134, "epoch": 2431} {"train_loss": -6.381797790527344, "global_step": 102135, "epoch": 2431} {"train_loss": -6.40150785446167, "global_step": 102136, "epoch": 2431} {"train_loss": -6.449956893920898, "global_step": 102137, "epoch": 2431} {"train_loss": -6.367219924926758, "global_step": 102138, "epoch": 2431} {"train_loss": -6.353219032287598, "global_step": 102139, "epoch": 2431} {"train_loss": -6.20887565612793, "global_step": 102140, "epoch": 2431} {"train_loss": -6.3662309646606445, "global_step": 102141, "epoch": 2431} {"train_loss": -6.2834882736206055, "global_step": 102142, "epoch": 2431} {"train_loss": -6.337413538069952, "global_step": 102143, "epoch": 2431, "val_loss": 68023.6953125} {"train_loss": -6.362452030181885, "global_step": 102144, "epoch": 2432} {"train_loss": -6.3544535636901855, "global_step": 102145, "epoch": 2432} {"train_loss": -6.379741191864014, "global_step": 102146, "epoch": 2432} {"train_loss": -6.438260555267334, "global_step": 102147, "epoch": 2432} {"train_loss": -6.306232929229736, "global_step": 102148, "epoch": 2432} {"train_loss": -6.3939313888549805, "global_step": 102149, "epoch": 2432} {"train_loss": -6.4135847091674805, "global_step": 102150, "epoch": 2432} {"train_loss": -6.282536506652832, "global_step": 102151, "epoch": 2432} {"train_loss": -6.43321418762207, "global_step": 102152, "epoch": 2432} {"train_loss": -6.2868170738220215, "global_step": 102153, "epoch": 2432} {"train_loss": -6.352621078491211, "global_step": 102154, "epoch": 2432} {"train_loss": -6.346370697021484, "global_step": 102155, "epoch": 2432} {"train_loss": -6.2468109130859375, "global_step": 102156, "epoch": 2432} {"train_loss": -6.334178447723389, "global_step": 102157, "epoch": 2432} {"train_loss": -6.461945533752441, "global_step": 102158, "epoch": 2432} {"train_loss": -6.351062774658203, "global_step": 102159, "epoch": 2432} {"train_loss": -6.442233085632324, "global_step": 102160, "epoch": 2432} {"train_loss": -6.42525577545166, "global_step": 102161, "epoch": 2432} {"train_loss": -6.288283348083496, "global_step": 102162, "epoch": 2432} {"train_loss": -6.271119117736816, "global_step": 102163, "epoch": 2432} {"train_loss": -6.360466957092285, "global_step": 102164, "epoch": 2432} {"train_loss": -6.364454746246338, "global_step": 102165, "epoch": 2432} {"train_loss": -6.343627452850342, "global_step": 102166, "epoch": 2432} {"train_loss": -6.34112024307251, "global_step": 102167, "epoch": 2432} {"train_loss": -6.30858039855957, "global_step": 102168, "epoch": 2432} {"train_loss": -6.358658790588379, "global_step": 102169, "epoch": 2432} {"train_loss": -6.371538162231445, "global_step": 102170, "epoch": 2432} {"train_loss": -6.289806365966797, "global_step": 102171, "epoch": 2432} {"train_loss": -6.220525741577148, "global_step": 102172, "epoch": 2432} {"train_loss": -6.368607521057129, "global_step": 102173, "epoch": 2432} {"train_loss": -6.382164001464844, "global_step": 102174, "epoch": 2432} {"train_loss": -6.3247785568237305, "global_step": 102175, "epoch": 2432} {"train_loss": -6.343198299407959, "global_step": 102176, "epoch": 2432} {"train_loss": -6.399742126464844, "global_step": 102177, "epoch": 2432} {"train_loss": -6.314533710479736, "global_step": 102178, "epoch": 2432} {"train_loss": -6.376854419708252, "global_step": 102179, "epoch": 2432} {"train_loss": -6.318621635437012, "global_step": 102180, "epoch": 2432} {"train_loss": -6.362362861633301, "global_step": 102181, "epoch": 2432} {"train_loss": -6.2631402015686035, "global_step": 102182, "epoch": 2432} {"train_loss": -6.429527759552002, "global_step": 102183, "epoch": 2432} {"train_loss": -6.431641101837158, "global_step": 102184, "epoch": 2432} {"train_loss": -6.352709679376511, "global_step": 102185, "epoch": 2432, "val_loss": 68106.6484375} {"train_loss": -6.462516784667969, "global_step": 102186, "epoch": 2433} {"train_loss": -6.388340473175049, "global_step": 102187, "epoch": 2433} {"train_loss": -6.305735111236572, "global_step": 102188, "epoch": 2433} {"train_loss": -6.426607608795166, "global_step": 102189, "epoch": 2433} {"train_loss": -6.369638442993164, "global_step": 102190, "epoch": 2433} {"train_loss": -6.447540283203125, "global_step": 102191, "epoch": 2433} {"train_loss": -6.331300735473633, "global_step": 102192, "epoch": 2433} {"train_loss": -6.3268890380859375, "global_step": 102193, "epoch": 2433} {"train_loss": -6.484251022338867, "global_step": 102194, "epoch": 2433} {"train_loss": -6.314978122711182, "global_step": 102195, "epoch": 2433} {"train_loss": -6.253392219543457, "global_step": 102196, "epoch": 2433} {"train_loss": -6.33900260925293, "global_step": 102197, "epoch": 2433} {"train_loss": -6.243846416473389, "global_step": 102198, "epoch": 2433} {"train_loss": -6.450660228729248, "global_step": 102199, "epoch": 2433} {"train_loss": -6.248239994049072, "global_step": 102200, "epoch": 2433} {"train_loss": -6.370579719543457, "global_step": 102201, "epoch": 2433} {"train_loss": -6.249528408050537, "global_step": 102202, "epoch": 2433} {"train_loss": -6.243626594543457, "global_step": 102203, "epoch": 2433} {"train_loss": -6.3670454025268555, "global_step": 102204, "epoch": 2433} {"train_loss": -6.297357559204102, "global_step": 102205, "epoch": 2433} {"train_loss": -6.356960296630859, "global_step": 102206, "epoch": 2433} {"train_loss": -6.253348350524902, "global_step": 102207, "epoch": 2433} {"train_loss": -6.315256118774414, "global_step": 102208, "epoch": 2433} {"train_loss": -6.33872652053833, "global_step": 102209, "epoch": 2433} {"train_loss": -6.234651565551758, "global_step": 102210, "epoch": 2433} {"train_loss": -6.336691379547119, "global_step": 102211, "epoch": 2433} {"train_loss": -6.3283538818359375, "global_step": 102212, "epoch": 2433} {"train_loss": -6.365496635437012, "global_step": 102213, "epoch": 2433} {"train_loss": -6.316690444946289, "global_step": 102214, "epoch": 2433} {"train_loss": -6.325352668762207, "global_step": 102215, "epoch": 2433} {"train_loss": -6.178199768066406, "global_step": 102216, "epoch": 2433} {"train_loss": -6.3619842529296875, "global_step": 102217, "epoch": 2433} {"train_loss": -6.40578556060791, "global_step": 102218, "epoch": 2433} {"train_loss": -6.316495418548584, "global_step": 102219, "epoch": 2433} {"train_loss": -6.380146026611328, "global_step": 102220, "epoch": 2433} {"train_loss": -6.3422441482543945, "global_step": 102221, "epoch": 2433} {"train_loss": -6.407766342163086, "global_step": 102222, "epoch": 2433} {"train_loss": -6.352063179016113, "global_step": 102223, "epoch": 2433} {"train_loss": -6.48657751083374, "global_step": 102224, "epoch": 2433} {"train_loss": -6.391510963439941, "global_step": 102225, "epoch": 2433} {"train_loss": -6.44403076171875, "global_step": 102226, "epoch": 2433} {"train_loss": -6.344277745201474, "global_step": 102227, "epoch": 2433, "val_loss": 67807.9609375} {"train_loss": -6.332030296325684, "global_step": 102228, "epoch": 2434} {"train_loss": -6.431374549865723, "global_step": 102229, "epoch": 2434} {"train_loss": -6.343277931213379, "global_step": 102230, "epoch": 2434} {"train_loss": -6.309659481048584, "global_step": 102231, "epoch": 2434} {"train_loss": -6.323687553405762, "global_step": 102232, "epoch": 2434} {"train_loss": -6.438052654266357, "global_step": 102233, "epoch": 2434} {"train_loss": -6.31407356262207, "global_step": 102234, "epoch": 2434} {"train_loss": -6.3122053146362305, "global_step": 102235, "epoch": 2434} {"train_loss": -6.392094135284424, "global_step": 102236, "epoch": 2434} {"train_loss": -6.180123805999756, "global_step": 102237, "epoch": 2434} {"train_loss": -6.387509346008301, "global_step": 102238, "epoch": 2434} {"train_loss": -6.292084693908691, "global_step": 102239, "epoch": 2434} {"train_loss": -6.231427192687988, "global_step": 102240, "epoch": 2434} {"train_loss": -6.561970233917236, "global_step": 102241, "epoch": 2434} {"train_loss": -6.371536731719971, "global_step": 102242, "epoch": 2434} {"train_loss": -6.42964506149292, "global_step": 102243, "epoch": 2434} {"train_loss": -6.353179454803467, "global_step": 102244, "epoch": 2434} {"train_loss": -6.2534894943237305, "global_step": 102245, "epoch": 2434} {"train_loss": -6.19244384765625, "global_step": 102246, "epoch": 2434} {"train_loss": -6.1146159172058105, "global_step": 102247, "epoch": 2434} {"train_loss": -6.127861976623535, "global_step": 102248, "epoch": 2434} {"train_loss": -6.297092437744141, "global_step": 102249, "epoch": 2434} {"train_loss": -6.073752403259277, "global_step": 102250, "epoch": 2434} {"train_loss": -6.268074035644531, "global_step": 102251, "epoch": 2434} {"train_loss": -6.187398433685303, "global_step": 102252, "epoch": 2434} {"train_loss": -6.254708290100098, "global_step": 102253, "epoch": 2434} {"train_loss": -6.181432723999023, "global_step": 102254, "epoch": 2434} {"train_loss": -6.1506781578063965, "global_step": 102255, "epoch": 2434} {"train_loss": -6.2798075675964355, "global_step": 102256, "epoch": 2434} {"train_loss": -6.304080963134766, "global_step": 102257, "epoch": 2434} {"train_loss": -6.282166004180908, "global_step": 102258, "epoch": 2434} {"train_loss": -6.350673198699951, "global_step": 102259, "epoch": 2434} {"train_loss": -6.29048490524292, "global_step": 102260, "epoch": 2434} {"train_loss": -6.2033891677856445, "global_step": 102261, "epoch": 2434} {"train_loss": -6.3506879806518555, "global_step": 102262, "epoch": 2434} {"train_loss": -6.4096174240112305, "global_step": 102263, "epoch": 2434} {"train_loss": -6.344633102416992, "global_step": 102264, "epoch": 2434} {"train_loss": -6.2768073081970215, "global_step": 102265, "epoch": 2434} {"train_loss": -6.354143142700195, "global_step": 102266, "epoch": 2434} {"train_loss": -6.331971645355225, "global_step": 102267, "epoch": 2434} {"train_loss": -6.351091384887695, "global_step": 102268, "epoch": 2434} {"train_loss": -6.302153837113154, "global_step": 102269, "epoch": 2434, "val_loss": 67831.34375} {"train_loss": -6.326554775238037, "global_step": 102270, "epoch": 2435} {"train_loss": -6.342241287231445, "global_step": 102271, "epoch": 2435} {"train_loss": -6.265289783477783, "global_step": 102272, "epoch": 2435} {"train_loss": -6.423032760620117, "global_step": 102273, "epoch": 2435} {"train_loss": -6.2547125816345215, "global_step": 102274, "epoch": 2435} {"train_loss": -6.385324478149414, "global_step": 102275, "epoch": 2435} {"train_loss": -6.453303813934326, "global_step": 102276, "epoch": 2435} {"train_loss": -6.382436752319336, "global_step": 102277, "epoch": 2435} {"train_loss": -6.444143295288086, "global_step": 102278, "epoch": 2435} {"train_loss": -6.410782337188721, "global_step": 102279, "epoch": 2435} {"train_loss": -6.4872589111328125, "global_step": 102280, "epoch": 2435} {"train_loss": -6.389250755310059, "global_step": 102281, "epoch": 2435} {"train_loss": -6.503037452697754, "global_step": 102282, "epoch": 2435} {"train_loss": -6.347277641296387, "global_step": 102283, "epoch": 2435} {"train_loss": -6.376543045043945, "global_step": 102284, "epoch": 2435} {"train_loss": -6.478993892669678, "global_step": 102285, "epoch": 2435} {"train_loss": -6.40950870513916, "global_step": 102286, "epoch": 2435} {"train_loss": -6.287100791931152, "global_step": 102287, "epoch": 2435} {"train_loss": -6.444293975830078, "global_step": 102288, "epoch": 2435} {"train_loss": -6.39088249206543, "global_step": 102289, "epoch": 2435} {"train_loss": -6.318975448608398, "global_step": 102290, "epoch": 2435} {"train_loss": -6.374298095703125, "global_step": 102291, "epoch": 2435} {"train_loss": -6.398776054382324, "global_step": 102292, "epoch": 2435} {"train_loss": -6.400636672973633, "global_step": 102293, "epoch": 2435} {"train_loss": -6.339625835418701, "global_step": 102294, "epoch": 2435} {"train_loss": -6.33266544342041, "global_step": 102295, "epoch": 2435} {"train_loss": -6.414558410644531, "global_step": 102296, "epoch": 2435} {"train_loss": -6.344323635101318, "global_step": 102297, "epoch": 2435} {"train_loss": -6.343664169311523, "global_step": 102298, "epoch": 2435} {"train_loss": -6.366029739379883, "global_step": 102299, "epoch": 2435} {"train_loss": -6.353193759918213, "global_step": 102300, "epoch": 2435} {"train_loss": -6.416093349456787, "global_step": 102301, "epoch": 2435} {"train_loss": -6.327113151550293, "global_step": 102302, "epoch": 2435} {"train_loss": -6.395500659942627, "global_step": 102303, "epoch": 2435} {"train_loss": -6.430946350097656, "global_step": 102304, "epoch": 2435} {"train_loss": -6.360416412353516, "global_step": 102305, "epoch": 2435} {"train_loss": -6.494068622589111, "global_step": 102306, "epoch": 2435} {"train_loss": -6.440454483032227, "global_step": 102307, "epoch": 2435} {"train_loss": -6.4225382804870605, "global_step": 102308, "epoch": 2435} {"train_loss": -6.420950889587402, "global_step": 102309, "epoch": 2435} {"train_loss": -6.352624416351318, "global_step": 102310, "epoch": 2435} {"train_loss": -6.384403739656721, "global_step": 102311, "epoch": 2435, "val_loss": 67842.96875} {"train_loss": -6.437582969665527, "global_step": 102312, "epoch": 2436} {"train_loss": -6.500160217285156, "global_step": 102313, "epoch": 2436} {"train_loss": -6.390353202819824, "global_step": 102314, "epoch": 2436} {"train_loss": -6.447844982147217, "global_step": 102315, "epoch": 2436} {"train_loss": -6.311770439147949, "global_step": 102316, "epoch": 2436} {"train_loss": -6.477594375610352, "global_step": 102317, "epoch": 2436} {"train_loss": -6.406079292297363, "global_step": 102318, "epoch": 2436} {"train_loss": -6.349705696105957, "global_step": 102319, "epoch": 2436} {"train_loss": -6.345976829528809, "global_step": 102320, "epoch": 2436} {"train_loss": -6.303095817565918, "global_step": 102321, "epoch": 2436} {"train_loss": -6.312227249145508, "global_step": 102322, "epoch": 2436} {"train_loss": -6.368563652038574, "global_step": 102323, "epoch": 2436} {"train_loss": -6.436816215515137, "global_step": 102324, "epoch": 2436} {"train_loss": -6.367030620574951, "global_step": 102325, "epoch": 2436} {"train_loss": -6.505589962005615, "global_step": 102326, "epoch": 2436} {"train_loss": -6.294605255126953, "global_step": 102327, "epoch": 2436} {"train_loss": -6.435797691345215, "global_step": 102328, "epoch": 2436} {"train_loss": -6.300292015075684, "global_step": 102329, "epoch": 2436} {"train_loss": -6.253579139709473, "global_step": 102330, "epoch": 2436} {"train_loss": -6.264921188354492, "global_step": 102331, "epoch": 2436} {"train_loss": -6.346031665802002, "global_step": 102332, "epoch": 2436} {"train_loss": -6.343575954437256, "global_step": 102333, "epoch": 2436} {"train_loss": -6.312610626220703, "global_step": 102334, "epoch": 2436} {"train_loss": -6.312966823577881, "global_step": 102335, "epoch": 2436} {"train_loss": -6.294281005859375, "global_step": 102336, "epoch": 2436} {"train_loss": -6.255846977233887, "global_step": 102337, "epoch": 2436} {"train_loss": -6.506179332733154, "global_step": 102338, "epoch": 2436} {"train_loss": -6.300002098083496, "global_step": 102339, "epoch": 2436} {"train_loss": -6.291696548461914, "global_step": 102340, "epoch": 2436} {"train_loss": -6.320147514343262, "global_step": 102341, "epoch": 2436} {"train_loss": -6.509815216064453, "global_step": 102342, "epoch": 2436} {"train_loss": -6.360477447509766, "global_step": 102343, "epoch": 2436} {"train_loss": -6.378951549530029, "global_step": 102344, "epoch": 2436} {"train_loss": -6.372872829437256, "global_step": 102345, "epoch": 2436} {"train_loss": -6.499336242675781, "global_step": 102346, "epoch": 2436} {"train_loss": -6.368322849273682, "global_step": 102347, "epoch": 2436} {"train_loss": -6.364948749542236, "global_step": 102348, "epoch": 2436} {"train_loss": -6.4306159019470215, "global_step": 102349, "epoch": 2436} {"train_loss": -6.442653656005859, "global_step": 102350, "epoch": 2436} {"train_loss": -6.419307708740234, "global_step": 102351, "epoch": 2436} {"train_loss": -6.468711853027344, "global_step": 102352, "epoch": 2436} {"train_loss": -6.375126793271019, "global_step": 102353, "epoch": 2436, "val_loss": 67931.0703125} {"train_loss": -6.392011642456055, "global_step": 102354, "epoch": 2437} {"train_loss": -6.405173301696777, "global_step": 102355, "epoch": 2437} {"train_loss": -6.316558837890625, "global_step": 102356, "epoch": 2437} {"train_loss": -6.3706512451171875, "global_step": 102357, "epoch": 2437} {"train_loss": -6.384711265563965, "global_step": 102358, "epoch": 2437} {"train_loss": -6.383238315582275, "global_step": 102359, "epoch": 2437} {"train_loss": -6.364587783813477, "global_step": 102360, "epoch": 2437} {"train_loss": -6.285020351409912, "global_step": 102361, "epoch": 2437} {"train_loss": -6.429159164428711, "global_step": 102362, "epoch": 2437} {"train_loss": -6.436634063720703, "global_step": 102363, "epoch": 2437} {"train_loss": -6.365628242492676, "global_step": 102364, "epoch": 2437} {"train_loss": -6.426808834075928, "global_step": 102365, "epoch": 2437} {"train_loss": -6.417301177978516, "global_step": 102366, "epoch": 2437} {"train_loss": -6.321318626403809, "global_step": 102367, "epoch": 2437} {"train_loss": -6.445714950561523, "global_step": 102368, "epoch": 2437} {"train_loss": -6.378280162811279, "global_step": 102369, "epoch": 2437} {"train_loss": -6.427239894866943, "global_step": 102370, "epoch": 2437} {"train_loss": -6.412686347961426, "global_step": 102371, "epoch": 2437} {"train_loss": -6.522919654846191, "global_step": 102372, "epoch": 2437} {"train_loss": -6.26821231842041, "global_step": 102373, "epoch": 2437} {"train_loss": -6.345554351806641, "global_step": 102374, "epoch": 2437} {"train_loss": -6.3147172927856445, "global_step": 102375, "epoch": 2437} {"train_loss": -6.375221252441406, "global_step": 102376, "epoch": 2437} {"train_loss": -6.433239936828613, "global_step": 102377, "epoch": 2437} {"train_loss": -6.335427284240723, "global_step": 102378, "epoch": 2437} {"train_loss": -6.415368556976318, "global_step": 102379, "epoch": 2437} {"train_loss": -6.2773332595825195, "global_step": 102380, "epoch": 2437} {"train_loss": -6.487114906311035, "global_step": 102381, "epoch": 2437} {"train_loss": -6.371819019317627, "global_step": 102382, "epoch": 2437} {"train_loss": -6.338399887084961, "global_step": 102383, "epoch": 2437} {"train_loss": -6.317587852478027, "global_step": 102384, "epoch": 2437} {"train_loss": -6.163211822509766, "global_step": 102385, "epoch": 2437} {"train_loss": -6.394221782684326, "global_step": 102386, "epoch": 2437} {"train_loss": -6.332010269165039, "global_step": 102387, "epoch": 2437} {"train_loss": -6.195428848266602, "global_step": 102388, "epoch": 2437} {"train_loss": -6.3495564460754395, "global_step": 102389, "epoch": 2437} {"train_loss": -6.302726745605469, "global_step": 102390, "epoch": 2437} {"train_loss": -6.177298545837402, "global_step": 102391, "epoch": 2437} {"train_loss": -6.229175090789795, "global_step": 102392, "epoch": 2437} {"train_loss": -6.21422004699707, "global_step": 102393, "epoch": 2437} {"train_loss": -6.3455400466918945, "global_step": 102394, "epoch": 2437} {"train_loss": -6.349034808930897, "global_step": 102395, "epoch": 2437, "val_loss": 68397.9453125} {"train_loss": -6.132671356201172, "global_step": 102396, "epoch": 2438} {"train_loss": -6.107141494750977, "global_step": 102397, "epoch": 2438} {"train_loss": -6.324027061462402, "global_step": 102398, "epoch": 2438} {"train_loss": -6.210102081298828, "global_step": 102399, "epoch": 2438} {"train_loss": -6.190081596374512, "global_step": 102400, "epoch": 2438} {"train_loss": -6.184140205383301, "global_step": 102401, "epoch": 2438} {"train_loss": -6.199044227600098, "global_step": 102402, "epoch": 2438} {"train_loss": -6.287878036499023, "global_step": 102403, "epoch": 2438} {"train_loss": -6.183140277862549, "global_step": 102404, "epoch": 2438} {"train_loss": -6.356260299682617, "global_step": 102405, "epoch": 2438} {"train_loss": -6.263411521911621, "global_step": 102406, "epoch": 2438} {"train_loss": -6.222181797027588, "global_step": 102407, "epoch": 2438} {"train_loss": -6.271686553955078, "global_step": 102408, "epoch": 2438} {"train_loss": -6.201673984527588, "global_step": 102409, "epoch": 2438} {"train_loss": -6.34193754196167, "global_step": 102410, "epoch": 2438} {"train_loss": -6.329860210418701, "global_step": 102411, "epoch": 2438} {"train_loss": -6.380589962005615, "global_step": 102412, "epoch": 2438} {"train_loss": -6.319065570831299, "global_step": 102413, "epoch": 2438} {"train_loss": -6.390960693359375, "global_step": 102414, "epoch": 2438} {"train_loss": -6.367157936096191, "global_step": 102415, "epoch": 2438} {"train_loss": -6.32805871963501, "global_step": 102416, "epoch": 2438} {"train_loss": -6.299099922180176, "global_step": 102417, "epoch": 2438} {"train_loss": -6.364460468292236, "global_step": 102418, "epoch": 2438} {"train_loss": -6.440662384033203, "global_step": 102419, "epoch": 2438} {"train_loss": -6.383782386779785, "global_step": 102420, "epoch": 2438} {"train_loss": -6.427947044372559, "global_step": 102421, "epoch": 2438} {"train_loss": -6.42080545425415, "global_step": 102422, "epoch": 2438} {"train_loss": -6.359961986541748, "global_step": 102423, "epoch": 2438} {"train_loss": -6.291478157043457, "global_step": 102424, "epoch": 2438} {"train_loss": -6.288993835449219, "global_step": 102425, "epoch": 2438} {"train_loss": -6.2942214012146, "global_step": 102426, "epoch": 2438} {"train_loss": -6.3556389808654785, "global_step": 102427, "epoch": 2438} {"train_loss": -6.301482200622559, "global_step": 102428, "epoch": 2438} {"train_loss": -6.373770713806152, "global_step": 102429, "epoch": 2438} {"train_loss": -6.282313346862793, "global_step": 102430, "epoch": 2438} {"train_loss": -6.314905166625977, "global_step": 102431, "epoch": 2438} {"train_loss": -6.391783237457275, "global_step": 102432, "epoch": 2438} {"train_loss": -6.221168041229248, "global_step": 102433, "epoch": 2438} {"train_loss": -6.355627536773682, "global_step": 102434, "epoch": 2438} {"train_loss": -6.383059024810791, "global_step": 102435, "epoch": 2438} {"train_loss": -6.287758827209473, "global_step": 102436, "epoch": 2438} {"train_loss": -6.30147089276995, "global_step": 102437, "epoch": 2438, "val_loss": 67906.265625} {"train_loss": -6.248762607574463, "global_step": 102438, "epoch": 2439} {"train_loss": -6.388208866119385, "global_step": 102439, "epoch": 2439} {"train_loss": -6.4371795654296875, "global_step": 102440, "epoch": 2439} {"train_loss": -6.297530651092529, "global_step": 102441, "epoch": 2439} {"train_loss": -6.395052433013916, "global_step": 102442, "epoch": 2439} {"train_loss": -6.354750156402588, "global_step": 102443, "epoch": 2439} {"train_loss": -6.34538459777832, "global_step": 102444, "epoch": 2439} {"train_loss": -6.294572830200195, "global_step": 102445, "epoch": 2439} {"train_loss": -6.380582809448242, "global_step": 102446, "epoch": 2439} {"train_loss": -6.424054145812988, "global_step": 102447, "epoch": 2439} {"train_loss": -6.349565505981445, "global_step": 102448, "epoch": 2439} {"train_loss": -6.3805251121521, "global_step": 102449, "epoch": 2439} {"train_loss": -6.337283611297607, "global_step": 102450, "epoch": 2439} {"train_loss": -6.435585975646973, "global_step": 102451, "epoch": 2439} {"train_loss": -6.434691429138184, "global_step": 102452, "epoch": 2439} {"train_loss": -6.459059715270996, "global_step": 102453, "epoch": 2439} {"train_loss": -6.45335054397583, "global_step": 102454, "epoch": 2439} {"train_loss": -6.280130386352539, "global_step": 102455, "epoch": 2439} {"train_loss": -6.355489730834961, "global_step": 102456, "epoch": 2439} {"train_loss": -6.456334114074707, "global_step": 102457, "epoch": 2439} {"train_loss": -6.33130407333374, "global_step": 102458, "epoch": 2439} {"train_loss": -6.434412956237793, "global_step": 102459, "epoch": 2439} {"train_loss": -6.479948043823242, "global_step": 102460, "epoch": 2439} {"train_loss": -6.299866199493408, "global_step": 102461, "epoch": 2439} {"train_loss": -6.4300127029418945, "global_step": 102462, "epoch": 2439} {"train_loss": -6.494637966156006, "global_step": 102463, "epoch": 2439} {"train_loss": -6.370758056640625, "global_step": 102464, "epoch": 2439} {"train_loss": -6.41265869140625, "global_step": 102465, "epoch": 2439} {"train_loss": -6.441717624664307, "global_step": 102466, "epoch": 2439} {"train_loss": -6.411200046539307, "global_step": 102467, "epoch": 2439} {"train_loss": -6.392599105834961, "global_step": 102468, "epoch": 2439} {"train_loss": -6.2986555099487305, "global_step": 102469, "epoch": 2439} {"train_loss": -6.334957122802734, "global_step": 102470, "epoch": 2439} {"train_loss": -6.33260440826416, "global_step": 102471, "epoch": 2439} {"train_loss": -6.33207893371582, "global_step": 102472, "epoch": 2439} {"train_loss": -6.262180328369141, "global_step": 102473, "epoch": 2439} {"train_loss": -6.386631011962891, "global_step": 102474, "epoch": 2439} {"train_loss": -6.280574798583984, "global_step": 102475, "epoch": 2439} {"train_loss": -6.312442779541016, "global_step": 102476, "epoch": 2439} {"train_loss": -6.244407653808594, "global_step": 102477, "epoch": 2439} {"train_loss": -6.389062404632568, "global_step": 102478, "epoch": 2439} {"train_loss": -6.368831475575765, "global_step": 102479, "epoch": 2439, "val_loss": 68081.5859375} {"train_loss": -6.329949378967285, "global_step": 102480, "epoch": 2440} {"train_loss": -6.410401821136475, "global_step": 102481, "epoch": 2440} {"train_loss": -6.364252090454102, "global_step": 102482, "epoch": 2440} {"train_loss": -6.438480854034424, "global_step": 102483, "epoch": 2440} {"train_loss": -6.235200881958008, "global_step": 102484, "epoch": 2440} {"train_loss": -6.404060363769531, "global_step": 102485, "epoch": 2440} {"train_loss": -6.26837682723999, "global_step": 102486, "epoch": 2440} {"train_loss": -6.469203948974609, "global_step": 102487, "epoch": 2440} {"train_loss": -6.391117572784424, "global_step": 102488, "epoch": 2440} {"train_loss": -6.383474826812744, "global_step": 102489, "epoch": 2440} {"train_loss": -6.282687664031982, "global_step": 102490, "epoch": 2440} {"train_loss": -6.298645973205566, "global_step": 102491, "epoch": 2440} {"train_loss": -6.312952041625977, "global_step": 102492, "epoch": 2440} {"train_loss": -6.438365936279297, "global_step": 102493, "epoch": 2440} {"train_loss": -6.369950771331787, "global_step": 102494, "epoch": 2440} {"train_loss": -6.256698131561279, "global_step": 102495, "epoch": 2440} {"train_loss": -6.254332542419434, "global_step": 102496, "epoch": 2440} {"train_loss": -6.391777038574219, "global_step": 102497, "epoch": 2440} {"train_loss": -6.290854454040527, "global_step": 102498, "epoch": 2440} {"train_loss": -6.382038116455078, "global_step": 102499, "epoch": 2440} {"train_loss": -6.417724609375, "global_step": 102500, "epoch": 2440} {"train_loss": -6.420401573181152, "global_step": 102501, "epoch": 2440} {"train_loss": -6.304518699645996, "global_step": 102502, "epoch": 2440} {"train_loss": -6.379988670349121, "global_step": 102503, "epoch": 2440} {"train_loss": -6.293361663818359, "global_step": 102504, "epoch": 2440} {"train_loss": -6.4329304695129395, "global_step": 102505, "epoch": 2440} {"train_loss": -6.363995552062988, "global_step": 102506, "epoch": 2440} {"train_loss": -6.325760841369629, "global_step": 102507, "epoch": 2440} {"train_loss": -6.427542686462402, "global_step": 102508, "epoch": 2440} {"train_loss": -6.257048606872559, "global_step": 102509, "epoch": 2440} {"train_loss": -6.304454803466797, "global_step": 102510, "epoch": 2440} {"train_loss": -6.425585746765137, "global_step": 102511, "epoch": 2440} {"train_loss": -6.418304443359375, "global_step": 102512, "epoch": 2440} {"train_loss": -6.436950206756592, "global_step": 102513, "epoch": 2440} {"train_loss": -6.2591118812561035, "global_step": 102514, "epoch": 2440} {"train_loss": -6.425361633300781, "global_step": 102515, "epoch": 2440} {"train_loss": -6.321484565734863, "global_step": 102516, "epoch": 2440} {"train_loss": -6.454676628112793, "global_step": 102517, "epoch": 2440} {"train_loss": -6.375845909118652, "global_step": 102518, "epoch": 2440} {"train_loss": -6.343588829040527, "global_step": 102519, "epoch": 2440} {"train_loss": -6.385410785675049, "global_step": 102520, "epoch": 2440} {"train_loss": -6.361405122847784, "global_step": 102521, "epoch": 2440, "val_loss": 68005.2890625} {"train_loss": -6.396541595458984, "global_step": 102522, "epoch": 2441} {"train_loss": -6.447067737579346, "global_step": 102523, "epoch": 2441} {"train_loss": -6.345613956451416, "global_step": 102524, "epoch": 2441} {"train_loss": -6.2877092361450195, "global_step": 102525, "epoch": 2441} {"train_loss": -6.503387928009033, "global_step": 102526, "epoch": 2441} {"train_loss": -6.3749284744262695, "global_step": 102527, "epoch": 2441} {"train_loss": -6.360738754272461, "global_step": 102528, "epoch": 2441} {"train_loss": -6.348423004150391, "global_step": 102529, "epoch": 2441} {"train_loss": -6.3503265380859375, "global_step": 102530, "epoch": 2441} {"train_loss": -6.389701843261719, "global_step": 102531, "epoch": 2441} {"train_loss": -6.410370826721191, "global_step": 102532, "epoch": 2441} {"train_loss": -6.415386199951172, "global_step": 102533, "epoch": 2441} {"train_loss": -6.300025463104248, "global_step": 102534, "epoch": 2441} {"train_loss": -6.409697532653809, "global_step": 102535, "epoch": 2441} {"train_loss": -6.324939727783203, "global_step": 102536, "epoch": 2441} {"train_loss": -6.497949600219727, "global_step": 102537, "epoch": 2441} {"train_loss": -6.494054317474365, "global_step": 102538, "epoch": 2441} {"train_loss": -6.328056335449219, "global_step": 102539, "epoch": 2441} {"train_loss": -6.465235710144043, "global_step": 102540, "epoch": 2441} {"train_loss": -6.501153945922852, "global_step": 102541, "epoch": 2441} {"train_loss": -6.439370155334473, "global_step": 102542, "epoch": 2441} {"train_loss": -6.434031963348389, "global_step": 102543, "epoch": 2441} {"train_loss": -6.34516716003418, "global_step": 102544, "epoch": 2441} {"train_loss": -6.334500789642334, "global_step": 102545, "epoch": 2441} {"train_loss": -6.393182754516602, "global_step": 102546, "epoch": 2441} {"train_loss": -6.339574337005615, "global_step": 102547, "epoch": 2441} {"train_loss": -6.283655166625977, "global_step": 102548, "epoch": 2441} {"train_loss": -6.424840927124023, "global_step": 102549, "epoch": 2441} {"train_loss": -6.326786041259766, "global_step": 102550, "epoch": 2441} {"train_loss": -6.377682209014893, "global_step": 102551, "epoch": 2441} {"train_loss": -6.355771064758301, "global_step": 102552, "epoch": 2441} {"train_loss": -6.2804107666015625, "global_step": 102553, "epoch": 2441} {"train_loss": -6.2913079261779785, "global_step": 102554, "epoch": 2441} {"train_loss": -6.440756797790527, "global_step": 102555, "epoch": 2441} {"train_loss": -6.366809844970703, "global_step": 102556, "epoch": 2441} {"train_loss": -6.4282379150390625, "global_step": 102557, "epoch": 2441} {"train_loss": -6.404470443725586, "global_step": 102558, "epoch": 2441} {"train_loss": -6.35524845123291, "global_step": 102559, "epoch": 2441} {"train_loss": -6.456491470336914, "global_step": 102560, "epoch": 2441} {"train_loss": -6.466797351837158, "global_step": 102561, "epoch": 2441} {"train_loss": -6.442075729370117, "global_step": 102562, "epoch": 2441} {"train_loss": -6.3865112236567905, "global_step": 102563, "epoch": 2441, "val_loss": 67922.390625} {"train_loss": -6.456901550292969, "global_step": 102564, "epoch": 2442} {"train_loss": -6.404337406158447, "global_step": 102565, "epoch": 2442} {"train_loss": -6.370316505432129, "global_step": 102566, "epoch": 2442} {"train_loss": -6.365910530090332, "global_step": 102567, "epoch": 2442} {"train_loss": -6.306581497192383, "global_step": 102568, "epoch": 2442} {"train_loss": -6.337489604949951, "global_step": 102569, "epoch": 2442} {"train_loss": -6.369318962097168, "global_step": 102570, "epoch": 2442} {"train_loss": -6.3402228355407715, "global_step": 102571, "epoch": 2442} {"train_loss": -6.473243713378906, "global_step": 102572, "epoch": 2442} {"train_loss": -6.382926940917969, "global_step": 102573, "epoch": 2442} {"train_loss": -6.484389305114746, "global_step": 102574, "epoch": 2442} {"train_loss": -6.303914546966553, "global_step": 102575, "epoch": 2442} {"train_loss": -6.285561561584473, "global_step": 102576, "epoch": 2442} {"train_loss": -6.416009902954102, "global_step": 102577, "epoch": 2442} {"train_loss": -6.304711818695068, "global_step": 102578, "epoch": 2442} {"train_loss": -6.407303333282471, "global_step": 102579, "epoch": 2442} {"train_loss": -6.330362319946289, "global_step": 102580, "epoch": 2442} {"train_loss": -6.3584442138671875, "global_step": 102581, "epoch": 2442} {"train_loss": -6.409828186035156, "global_step": 102582, "epoch": 2442} {"train_loss": -6.384530544281006, "global_step": 102583, "epoch": 2442} {"train_loss": -6.452182292938232, "global_step": 102584, "epoch": 2442} {"train_loss": -6.361135482788086, "global_step": 102585, "epoch": 2442} {"train_loss": -6.367329120635986, "global_step": 102586, "epoch": 2442} {"train_loss": -6.436143398284912, "global_step": 102587, "epoch": 2442} {"train_loss": -6.397671222686768, "global_step": 102588, "epoch": 2442} {"train_loss": -6.272054672241211, "global_step": 102589, "epoch": 2442} {"train_loss": -6.369686126708984, "global_step": 102590, "epoch": 2442} {"train_loss": -6.2625346183776855, "global_step": 102591, "epoch": 2442} {"train_loss": -6.320869445800781, "global_step": 102592, "epoch": 2442} {"train_loss": -6.322750091552734, "global_step": 102593, "epoch": 2442} {"train_loss": -6.413541793823242, "global_step": 102594, "epoch": 2442} {"train_loss": -6.294076919555664, "global_step": 102595, "epoch": 2442} {"train_loss": -6.422124862670898, "global_step": 102596, "epoch": 2442} {"train_loss": -6.222413063049316, "global_step": 102597, "epoch": 2442} {"train_loss": -6.325005531311035, "global_step": 102598, "epoch": 2442} {"train_loss": -6.142462730407715, "global_step": 102599, "epoch": 2442} {"train_loss": -6.300077438354492, "global_step": 102600, "epoch": 2442} {"train_loss": -6.31566858291626, "global_step": 102601, "epoch": 2442} {"train_loss": -6.242986679077148, "global_step": 102602, "epoch": 2442} {"train_loss": -6.346134185791016, "global_step": 102603, "epoch": 2442} {"train_loss": -6.335065841674805, "global_step": 102604, "epoch": 2442} {"train_loss": -6.349855672745478, "global_step": 102605, "epoch": 2442, "val_loss": 67844.53125} {"train_loss": -6.251485347747803, "global_step": 102606, "epoch": 2443} {"train_loss": -6.318180561065674, "global_step": 102607, "epoch": 2443} {"train_loss": -6.2757978439331055, "global_step": 102608, "epoch": 2443} {"train_loss": -6.434581279754639, "global_step": 102609, "epoch": 2443} {"train_loss": -6.375735282897949, "global_step": 102610, "epoch": 2443} {"train_loss": -6.371946334838867, "global_step": 102611, "epoch": 2443} {"train_loss": -6.323965072631836, "global_step": 102612, "epoch": 2443} {"train_loss": -6.320191383361816, "global_step": 102613, "epoch": 2443} {"train_loss": -6.43715238571167, "global_step": 102614, "epoch": 2443} {"train_loss": -6.3135528564453125, "global_step": 102615, "epoch": 2443} {"train_loss": -6.300361633300781, "global_step": 102616, "epoch": 2443} {"train_loss": -6.27815055847168, "global_step": 102617, "epoch": 2443} {"train_loss": -6.321579933166504, "global_step": 102618, "epoch": 2443} {"train_loss": -6.304871559143066, "global_step": 102619, "epoch": 2443} {"train_loss": -6.253477096557617, "global_step": 102620, "epoch": 2443} {"train_loss": -6.402716159820557, "global_step": 102621, "epoch": 2443} {"train_loss": -6.311287879943848, "global_step": 102622, "epoch": 2443} {"train_loss": -6.261172771453857, "global_step": 102623, "epoch": 2443} {"train_loss": -6.265644073486328, "global_step": 102624, "epoch": 2443} {"train_loss": -6.27473783493042, "global_step": 102625, "epoch": 2443} {"train_loss": -6.40668249130249, "global_step": 102626, "epoch": 2443} {"train_loss": -6.5021867752075195, "global_step": 102627, "epoch": 2443} {"train_loss": -6.4150471687316895, "global_step": 102628, "epoch": 2443} {"train_loss": -6.413965702056885, "global_step": 102629, "epoch": 2443} {"train_loss": -6.265758037567139, "global_step": 102630, "epoch": 2443} {"train_loss": -6.334407806396484, "global_step": 102631, "epoch": 2443} {"train_loss": -6.3735246658325195, "global_step": 102632, "epoch": 2443} {"train_loss": -6.3200201988220215, "global_step": 102633, "epoch": 2443} {"train_loss": -6.280370235443115, "global_step": 102634, "epoch": 2443} {"train_loss": -6.448182106018066, "global_step": 102635, "epoch": 2443} {"train_loss": -6.3636250495910645, "global_step": 102636, "epoch": 2443} {"train_loss": -6.231900215148926, "global_step": 102637, "epoch": 2443} {"train_loss": -6.30000114440918, "global_step": 102638, "epoch": 2443} {"train_loss": -6.351168155670166, "global_step": 102639, "epoch": 2443} {"train_loss": -6.406249046325684, "global_step": 102640, "epoch": 2443} {"train_loss": -6.34775447845459, "global_step": 102641, "epoch": 2443} {"train_loss": -6.3924760818481445, "global_step": 102642, "epoch": 2443} {"train_loss": -6.341031074523926, "global_step": 102643, "epoch": 2443} {"train_loss": -6.3600311279296875, "global_step": 102644, "epoch": 2443} {"train_loss": -6.404345989227295, "global_step": 102645, "epoch": 2443} {"train_loss": -6.391884803771973, "global_step": 102646, "epoch": 2443} {"train_loss": -6.34321539742606, "global_step": 102647, "epoch": 2443, "val_loss": 67786.515625} {"train_loss": -6.349958419799805, "global_step": 102648, "epoch": 2444} {"train_loss": -6.300762176513672, "global_step": 102649, "epoch": 2444} {"train_loss": -6.339516639709473, "global_step": 102650, "epoch": 2444} {"train_loss": -6.421297550201416, "global_step": 102651, "epoch": 2444} {"train_loss": -6.394905090332031, "global_step": 102652, "epoch": 2444} {"train_loss": -6.496687889099121, "global_step": 102653, "epoch": 2444} {"train_loss": -6.254915237426758, "global_step": 102654, "epoch": 2444} {"train_loss": -6.3976287841796875, "global_step": 102655, "epoch": 2444} {"train_loss": -6.348694801330566, "global_step": 102656, "epoch": 2444} {"train_loss": -6.305446624755859, "global_step": 102657, "epoch": 2444} {"train_loss": -6.386897563934326, "global_step": 102658, "epoch": 2444} {"train_loss": -6.255958557128906, "global_step": 102659, "epoch": 2444} {"train_loss": -6.282936096191406, "global_step": 102660, "epoch": 2444} {"train_loss": -6.243410587310791, "global_step": 102661, "epoch": 2444} {"train_loss": -6.359086036682129, "global_step": 102662, "epoch": 2444} {"train_loss": -6.365478992462158, "global_step": 102663, "epoch": 2444} {"train_loss": -6.307250499725342, "global_step": 102664, "epoch": 2444} {"train_loss": -6.386903762817383, "global_step": 102665, "epoch": 2444} {"train_loss": -6.258544445037842, "global_step": 102666, "epoch": 2444} {"train_loss": -6.235291481018066, "global_step": 102667, "epoch": 2444} {"train_loss": -6.322038650512695, "global_step": 102668, "epoch": 2444} {"train_loss": -6.317706108093262, "global_step": 102669, "epoch": 2444} {"train_loss": -6.2235212326049805, "global_step": 102670, "epoch": 2444} {"train_loss": -6.239968299865723, "global_step": 102671, "epoch": 2444} {"train_loss": -6.3462677001953125, "global_step": 102672, "epoch": 2444} {"train_loss": -6.349483489990234, "global_step": 102673, "epoch": 2444} {"train_loss": -6.455908298492432, "global_step": 102674, "epoch": 2444} {"train_loss": -6.28377103805542, "global_step": 102675, "epoch": 2444} {"train_loss": -6.446651935577393, "global_step": 102676, "epoch": 2444} {"train_loss": -6.400385856628418, "global_step": 102677, "epoch": 2444} {"train_loss": -6.2219929695129395, "global_step": 102678, "epoch": 2444} {"train_loss": -6.363308906555176, "global_step": 102679, "epoch": 2444} {"train_loss": -6.360537528991699, "global_step": 102680, "epoch": 2444} {"train_loss": -6.344481468200684, "global_step": 102681, "epoch": 2444} {"train_loss": -6.428534507751465, "global_step": 102682, "epoch": 2444} {"train_loss": -6.283736228942871, "global_step": 102683, "epoch": 2444} {"train_loss": -6.321353435516357, "global_step": 102684, "epoch": 2444} {"train_loss": -6.397161483764648, "global_step": 102685, "epoch": 2444} {"train_loss": -6.453611373901367, "global_step": 102686, "epoch": 2444} {"train_loss": -6.380380630493164, "global_step": 102687, "epoch": 2444} {"train_loss": -6.308013916015625, "global_step": 102688, "epoch": 2444} {"train_loss": -6.3394250983283635, "global_step": 102689, "epoch": 2444, "val_loss": 68106.2265625} {"train_loss": -6.18176794052124, "global_step": 102690, "epoch": 2445} {"train_loss": -6.465386867523193, "global_step": 102691, "epoch": 2445} {"train_loss": -6.3197922706604, "global_step": 102692, "epoch": 2445} {"train_loss": -6.379079818725586, "global_step": 102693, "epoch": 2445} {"train_loss": -6.308037757873535, "global_step": 102694, "epoch": 2445} {"train_loss": -6.378130912780762, "global_step": 102695, "epoch": 2445} {"train_loss": -6.3991241455078125, "global_step": 102696, "epoch": 2445} {"train_loss": -6.41964054107666, "global_step": 102697, "epoch": 2445} {"train_loss": -6.295183181762695, "global_step": 102698, "epoch": 2445} {"train_loss": -6.28594446182251, "global_step": 102699, "epoch": 2445} {"train_loss": -6.502729892730713, "global_step": 102700, "epoch": 2445} {"train_loss": -6.312987804412842, "global_step": 102701, "epoch": 2445} {"train_loss": -6.310528755187988, "global_step": 102702, "epoch": 2445} {"train_loss": -6.386763572692871, "global_step": 102703, "epoch": 2445} {"train_loss": -6.264997482299805, "global_step": 102704, "epoch": 2445} {"train_loss": -6.299216270446777, "global_step": 102705, "epoch": 2445} {"train_loss": -6.2975568771362305, "global_step": 102706, "epoch": 2445} {"train_loss": -6.30522346496582, "global_step": 102707, "epoch": 2445} {"train_loss": -6.4064412117004395, "global_step": 102708, "epoch": 2445} {"train_loss": -6.333041191101074, "global_step": 102709, "epoch": 2445} {"train_loss": -6.350268840789795, "global_step": 102710, "epoch": 2445} {"train_loss": -6.387407302856445, "global_step": 102711, "epoch": 2445} {"train_loss": -6.381163120269775, "global_step": 102712, "epoch": 2445} {"train_loss": -6.522188663482666, "global_step": 102713, "epoch": 2445} {"train_loss": -6.431436538696289, "global_step": 102714, "epoch": 2445} {"train_loss": -6.410336494445801, "global_step": 102715, "epoch": 2445} {"train_loss": -6.421724796295166, "global_step": 102716, "epoch": 2445} {"train_loss": -6.328249931335449, "global_step": 102717, "epoch": 2445} {"train_loss": -6.324911117553711, "global_step": 102718, "epoch": 2445} {"train_loss": -6.345693588256836, "global_step": 102719, "epoch": 2445} {"train_loss": -6.348928928375244, "global_step": 102720, "epoch": 2445} {"train_loss": -6.335466384887695, "global_step": 102721, "epoch": 2445} {"train_loss": -6.363050937652588, "global_step": 102722, "epoch": 2445} {"train_loss": -6.388678550720215, "global_step": 102723, "epoch": 2445} {"train_loss": -6.343690872192383, "global_step": 102724, "epoch": 2445} {"train_loss": -6.319344997406006, "global_step": 102725, "epoch": 2445} {"train_loss": -6.421849250793457, "global_step": 102726, "epoch": 2445} {"train_loss": -6.361520767211914, "global_step": 102727, "epoch": 2445} {"train_loss": -6.541267395019531, "global_step": 102728, "epoch": 2445} {"train_loss": -6.421737194061279, "global_step": 102729, "epoch": 2445} {"train_loss": -6.453235626220703, "global_step": 102730, "epoch": 2445} {"train_loss": -6.366425287155878, "global_step": 102731, "epoch": 2445, "val_loss": 67861.578125} {"train_loss": -6.381869792938232, "global_step": 102732, "epoch": 2446} {"train_loss": -6.417759895324707, "global_step": 102733, "epoch": 2446} {"train_loss": -6.5599517822265625, "global_step": 102734, "epoch": 2446} {"train_loss": -6.491782188415527, "global_step": 102735, "epoch": 2446} {"train_loss": -6.2706298828125, "global_step": 102736, "epoch": 2446} {"train_loss": -6.423409461975098, "global_step": 102737, "epoch": 2446} {"train_loss": -6.39225435256958, "global_step": 102738, "epoch": 2446} {"train_loss": -6.290103912353516, "global_step": 102739, "epoch": 2446} {"train_loss": -6.403757095336914, "global_step": 102740, "epoch": 2446} {"train_loss": -6.427508354187012, "global_step": 102741, "epoch": 2446} {"train_loss": -6.403745651245117, "global_step": 102742, "epoch": 2446} {"train_loss": -6.348276138305664, "global_step": 102743, "epoch": 2446} {"train_loss": -6.333232879638672, "global_step": 102744, "epoch": 2446} {"train_loss": -6.340052127838135, "global_step": 102745, "epoch": 2446} {"train_loss": -6.368093967437744, "global_step": 102746, "epoch": 2446} {"train_loss": -6.46331262588501, "global_step": 102747, "epoch": 2446} {"train_loss": -6.446122646331787, "global_step": 102748, "epoch": 2446} {"train_loss": -6.342808246612549, "global_step": 102749, "epoch": 2446} {"train_loss": -6.439238548278809, "global_step": 102750, "epoch": 2446} {"train_loss": -6.3917388916015625, "global_step": 102751, "epoch": 2446} {"train_loss": -6.504474639892578, "global_step": 102752, "epoch": 2446} {"train_loss": -6.395893096923828, "global_step": 102753, "epoch": 2446} {"train_loss": -6.358320713043213, "global_step": 102754, "epoch": 2446} {"train_loss": -6.349521636962891, "global_step": 102755, "epoch": 2446} {"train_loss": -6.336554527282715, "global_step": 102756, "epoch": 2446} {"train_loss": -6.384091377258301, "global_step": 102757, "epoch": 2446} {"train_loss": -6.356966018676758, "global_step": 102758, "epoch": 2446} {"train_loss": -6.4509172439575195, "global_step": 102759, "epoch": 2446} {"train_loss": -6.3584675788879395, "global_step": 102760, "epoch": 2446} {"train_loss": -6.423735618591309, "global_step": 102761, "epoch": 2446} {"train_loss": -6.304776668548584, "global_step": 102762, "epoch": 2446} {"train_loss": -6.4201788902282715, "global_step": 102763, "epoch": 2446} {"train_loss": -6.419171333312988, "global_step": 102764, "epoch": 2446} {"train_loss": -6.377795219421387, "global_step": 102765, "epoch": 2446} {"train_loss": -6.388071060180664, "global_step": 102766, "epoch": 2446} {"train_loss": -6.293488502502441, "global_step": 102767, "epoch": 2446} {"train_loss": -6.244680404663086, "global_step": 102768, "epoch": 2446} {"train_loss": -6.348694324493408, "global_step": 102769, "epoch": 2446} {"train_loss": -6.322456359863281, "global_step": 102770, "epoch": 2446} {"train_loss": -6.293471336364746, "global_step": 102771, "epoch": 2446} {"train_loss": -6.3032636642456055, "global_step": 102772, "epoch": 2446} {"train_loss": -6.378394785381499, "global_step": 102773, "epoch": 2446, "val_loss": 68268.59375} {"train_loss": -6.229547500610352, "global_step": 102774, "epoch": 2447} {"train_loss": -6.457578659057617, "global_step": 102775, "epoch": 2447} {"train_loss": -6.306014060974121, "global_step": 102776, "epoch": 2447} {"train_loss": -6.320788860321045, "global_step": 102777, "epoch": 2447} {"train_loss": -6.426987648010254, "global_step": 102778, "epoch": 2447} {"train_loss": -6.356597900390625, "global_step": 102779, "epoch": 2447} {"train_loss": -6.3367109298706055, "global_step": 102780, "epoch": 2447} {"train_loss": -6.311614036560059, "global_step": 102781, "epoch": 2447} {"train_loss": -6.436988353729248, "global_step": 102782, "epoch": 2447} {"train_loss": -6.34782600402832, "global_step": 102783, "epoch": 2447} {"train_loss": -6.484244346618652, "global_step": 102784, "epoch": 2447} {"train_loss": -6.281665802001953, "global_step": 102785, "epoch": 2447} {"train_loss": -6.425811767578125, "global_step": 102786, "epoch": 2447} {"train_loss": -6.290979862213135, "global_step": 102787, "epoch": 2447} {"train_loss": -6.429965496063232, "global_step": 102788, "epoch": 2447} {"train_loss": -6.389974594116211, "global_step": 102789, "epoch": 2447} {"train_loss": -6.430863380432129, "global_step": 102790, "epoch": 2447} {"train_loss": -6.335274696350098, "global_step": 102791, "epoch": 2447} {"train_loss": -6.359539985656738, "global_step": 102792, "epoch": 2447} {"train_loss": -6.406905174255371, "global_step": 102793, "epoch": 2447} {"train_loss": -6.451259136199951, "global_step": 102794, "epoch": 2447} {"train_loss": -6.409517765045166, "global_step": 102795, "epoch": 2447} {"train_loss": -6.400006294250488, "global_step": 102796, "epoch": 2447} {"train_loss": -6.448311805725098, "global_step": 102797, "epoch": 2447} {"train_loss": -6.458508491516113, "global_step": 102798, "epoch": 2447} {"train_loss": -6.317318916320801, "global_step": 102799, "epoch": 2447} {"train_loss": -6.403267860412598, "global_step": 102800, "epoch": 2447} {"train_loss": -6.509922504425049, "global_step": 102801, "epoch": 2447} {"train_loss": -6.316705703735352, "global_step": 102802, "epoch": 2447} {"train_loss": -6.315200328826904, "global_step": 102803, "epoch": 2447} {"train_loss": -6.342504501342773, "global_step": 102804, "epoch": 2447} {"train_loss": -6.433001518249512, "global_step": 102805, "epoch": 2447} {"train_loss": -6.373478412628174, "global_step": 102806, "epoch": 2447} {"train_loss": -6.38383674621582, "global_step": 102807, "epoch": 2447} {"train_loss": -6.2603960037231445, "global_step": 102808, "epoch": 2447} {"train_loss": -6.188180923461914, "global_step": 102809, "epoch": 2447} {"train_loss": -6.354046821594238, "global_step": 102810, "epoch": 2447} {"train_loss": -6.433652400970459, "global_step": 102811, "epoch": 2447} {"train_loss": -6.22310209274292, "global_step": 102812, "epoch": 2447} {"train_loss": -6.323709487915039, "global_step": 102813, "epoch": 2447} {"train_loss": -6.330383777618408, "global_step": 102814, "epoch": 2447} {"train_loss": -6.366602012089321, "global_step": 102815, "epoch": 2447, "val_loss": 67913.7890625} {"train_loss": -6.376073837280273, "global_step": 102816, "epoch": 2448} {"train_loss": -6.252730846405029, "global_step": 102817, "epoch": 2448} {"train_loss": -6.3748016357421875, "global_step": 102818, "epoch": 2448} {"train_loss": -6.328045845031738, "global_step": 102819, "epoch": 2448} {"train_loss": -6.313236236572266, "global_step": 102820, "epoch": 2448} {"train_loss": -6.353271484375, "global_step": 102821, "epoch": 2448} {"train_loss": -6.262242317199707, "global_step": 102822, "epoch": 2448} {"train_loss": -6.269367218017578, "global_step": 102823, "epoch": 2448} {"train_loss": -6.435937404632568, "global_step": 102824, "epoch": 2448} {"train_loss": -6.295940399169922, "global_step": 102825, "epoch": 2448} {"train_loss": -6.430299758911133, "global_step": 102826, "epoch": 2448} {"train_loss": -6.2876787185668945, "global_step": 102827, "epoch": 2448} {"train_loss": -6.367791175842285, "global_step": 102828, "epoch": 2448} {"train_loss": -6.399752616882324, "global_step": 102829, "epoch": 2448} {"train_loss": -6.4063005447387695, "global_step": 102830, "epoch": 2448} {"train_loss": -6.376676082611084, "global_step": 102831, "epoch": 2448} {"train_loss": -6.344592094421387, "global_step": 102832, "epoch": 2448} {"train_loss": -6.311538219451904, "global_step": 102833, "epoch": 2448} {"train_loss": -6.392559051513672, "global_step": 102834, "epoch": 2448} {"train_loss": -6.425502300262451, "global_step": 102835, "epoch": 2448} {"train_loss": -6.409989833831787, "global_step": 102836, "epoch": 2448} {"train_loss": -6.253998756408691, "global_step": 102837, "epoch": 2448} {"train_loss": -6.456072807312012, "global_step": 102838, "epoch": 2448} {"train_loss": -6.447348594665527, "global_step": 102839, "epoch": 2448} {"train_loss": -6.349072456359863, "global_step": 102840, "epoch": 2448} {"train_loss": -6.421038627624512, "global_step": 102841, "epoch": 2448} {"train_loss": -6.426957607269287, "global_step": 102842, "epoch": 2448} {"train_loss": -6.367705345153809, "global_step": 102843, "epoch": 2448} {"train_loss": -6.229825973510742, "global_step": 102844, "epoch": 2448} {"train_loss": -6.208322525024414, "global_step": 102845, "epoch": 2448} {"train_loss": -6.464811325073242, "global_step": 102846, "epoch": 2448} {"train_loss": -6.352951526641846, "global_step": 102847, "epoch": 2448} {"train_loss": -6.366479873657227, "global_step": 102848, "epoch": 2448} {"train_loss": -6.288817405700684, "global_step": 102849, "epoch": 2448} {"train_loss": -6.290675163269043, "global_step": 102850, "epoch": 2448} {"train_loss": -6.351621627807617, "global_step": 102851, "epoch": 2448} {"train_loss": -6.342752456665039, "global_step": 102852, "epoch": 2448} {"train_loss": -6.309874057769775, "global_step": 102853, "epoch": 2448} {"train_loss": -6.3947601318359375, "global_step": 102854, "epoch": 2448} {"train_loss": -6.539457321166992, "global_step": 102855, "epoch": 2448} {"train_loss": -6.4464616775512695, "global_step": 102856, "epoch": 2448} {"train_loss": -6.35758147920881, "global_step": 102857, "epoch": 2448, "val_loss": 67802.7890625} {"train_loss": -6.360609531402588, "global_step": 102858, "epoch": 2449} {"train_loss": -6.272153854370117, "global_step": 102859, "epoch": 2449} {"train_loss": -6.535033226013184, "global_step": 102860, "epoch": 2449} {"train_loss": -6.5454816818237305, "global_step": 102861, "epoch": 2449} {"train_loss": -6.33076286315918, "global_step": 102862, "epoch": 2449} {"train_loss": -6.406171798706055, "global_step": 102863, "epoch": 2449} {"train_loss": -6.490477561950684, "global_step": 102864, "epoch": 2449} {"train_loss": -6.336958408355713, "global_step": 102865, "epoch": 2449} {"train_loss": -6.448294639587402, "global_step": 102866, "epoch": 2449} {"train_loss": -6.375226020812988, "global_step": 102867, "epoch": 2449} {"train_loss": -6.348223686218262, "global_step": 102868, "epoch": 2449} {"train_loss": -6.398648738861084, "global_step": 102869, "epoch": 2449} {"train_loss": -6.39454460144043, "global_step": 102870, "epoch": 2449} {"train_loss": -6.42983865737915, "global_step": 102871, "epoch": 2449} {"train_loss": -6.332503318786621, "global_step": 102872, "epoch": 2449} {"train_loss": -6.370514392852783, "global_step": 102873, "epoch": 2449} {"train_loss": -6.362064361572266, "global_step": 102874, "epoch": 2449} {"train_loss": -6.292178153991699, "global_step": 102875, "epoch": 2449} {"train_loss": -6.371060371398926, "global_step": 102876, "epoch": 2449} {"train_loss": -6.448079586029053, "global_step": 102877, "epoch": 2449} {"train_loss": -6.340221405029297, "global_step": 102878, "epoch": 2449} {"train_loss": -6.356814384460449, "global_step": 102879, "epoch": 2449} {"train_loss": -6.381133079528809, "global_step": 102880, "epoch": 2449} {"train_loss": -6.253281116485596, "global_step": 102881, "epoch": 2449} {"train_loss": -6.399894714355469, "global_step": 102882, "epoch": 2449} {"train_loss": -6.377222061157227, "global_step": 102883, "epoch": 2449} {"train_loss": -6.209062099456787, "global_step": 102884, "epoch": 2449} {"train_loss": -6.288114070892334, "global_step": 102885, "epoch": 2449} {"train_loss": -6.3117547035217285, "global_step": 102886, "epoch": 2449} {"train_loss": -6.174884796142578, "global_step": 102887, "epoch": 2449} {"train_loss": -6.262523651123047, "global_step": 102888, "epoch": 2449} {"train_loss": -6.224347114562988, "global_step": 102889, "epoch": 2449} {"train_loss": -6.418206214904785, "global_step": 102890, "epoch": 2449} {"train_loss": -6.3529534339904785, "global_step": 102891, "epoch": 2449} {"train_loss": -6.324956893920898, "global_step": 102892, "epoch": 2449} {"train_loss": -6.272513389587402, "global_step": 102893, "epoch": 2449} {"train_loss": -6.252566337585449, "global_step": 102894, "epoch": 2449} {"train_loss": -6.214942932128906, "global_step": 102895, "epoch": 2449} {"train_loss": -6.253408432006836, "global_step": 102896, "epoch": 2449} {"train_loss": -6.313459396362305, "global_step": 102897, "epoch": 2449} {"train_loss": -6.271972179412842, "global_step": 102898, "epoch": 2449} {"train_loss": -6.342610665730068, "global_step": 102899, "epoch": 2449, "val_loss": 67785.421875} {"train_loss": -6.319648742675781, "global_step": 102900, "epoch": 2450} {"train_loss": -6.246389389038086, "global_step": 102901, "epoch": 2450} {"train_loss": -6.295186519622803, "global_step": 102902, "epoch": 2450} {"train_loss": -6.3683247566223145, "global_step": 102903, "epoch": 2450} {"train_loss": -6.303455352783203, "global_step": 102904, "epoch": 2450} {"train_loss": -6.466240882873535, "global_step": 102905, "epoch": 2450} {"train_loss": -6.377375602722168, "global_step": 102906, "epoch": 2450} {"train_loss": -6.406895160675049, "global_step": 102907, "epoch": 2450} {"train_loss": -6.348424911499023, "global_step": 102908, "epoch": 2450} {"train_loss": -6.390544891357422, "global_step": 102909, "epoch": 2450} {"train_loss": -6.453010082244873, "global_step": 102910, "epoch": 2450} {"train_loss": -6.3432769775390625, "global_step": 102911, "epoch": 2450} {"train_loss": -6.338077068328857, "global_step": 102912, "epoch": 2450} {"train_loss": -6.407159805297852, "global_step": 102913, "epoch": 2450} {"train_loss": -6.3104047775268555, "global_step": 102914, "epoch": 2450} {"train_loss": -6.4420928955078125, "global_step": 102915, "epoch": 2450} {"train_loss": -6.246486663818359, "global_step": 102916, "epoch": 2450} {"train_loss": -6.364409446716309, "global_step": 102917, "epoch": 2450} {"train_loss": -6.36051082611084, "global_step": 102918, "epoch": 2450} {"train_loss": -6.283333778381348, "global_step": 102919, "epoch": 2450} {"train_loss": -6.413032531738281, "global_step": 102920, "epoch": 2450} {"train_loss": -6.351319313049316, "global_step": 102921, "epoch": 2450} {"train_loss": -6.417710304260254, "global_step": 102922, "epoch": 2450} {"train_loss": -6.410266876220703, "global_step": 102923, "epoch": 2450} {"train_loss": -6.453318119049072, "global_step": 102924, "epoch": 2450} {"train_loss": -6.440857410430908, "global_step": 102925, "epoch": 2450} {"train_loss": -6.3672943115234375, "global_step": 102926, "epoch": 2450} {"train_loss": -6.438417911529541, "global_step": 102927, "epoch": 2450} {"train_loss": -6.269750595092773, "global_step": 102928, "epoch": 2450} {"train_loss": -6.39634895324707, "global_step": 102929, "epoch": 2450} {"train_loss": -6.533360004425049, "global_step": 102930, "epoch": 2450} {"train_loss": -6.426905155181885, "global_step": 102931, "epoch": 2450} {"train_loss": -6.530839443206787, "global_step": 102932, "epoch": 2450} {"train_loss": -6.45339298248291, "global_step": 102933, "epoch": 2450} {"train_loss": -6.399528503417969, "global_step": 102934, "epoch": 2450} {"train_loss": -6.277322769165039, "global_step": 102935, "epoch": 2450} {"train_loss": -6.285182952880859, "global_step": 102936, "epoch": 2450} {"train_loss": -6.542557239532471, "global_step": 102937, "epoch": 2450} {"train_loss": -6.337058067321777, "global_step": 102938, "epoch": 2450} {"train_loss": -6.464391708374023, "global_step": 102939, "epoch": 2450} {"train_loss": -6.39072322845459, "global_step": 102940, "epoch": 2450} {"train_loss": -6.381377129327683, "global_step": 102941, "epoch": 2450, "train/sim_max_reward_0": 0.21254725307014555, "train/sim_max_reward_1": 0.9005948894083987, "train/sim_max_reward_2": 0.1869978166734001, "train/sim_max_reward_3": 0.14470616946360507, "train/sim_max_reward_4": 0.8147328338443454, "train/sim_max_reward_5": 0.8635629562456114, "test/sim_max_reward_4400000": 0.9703137876869569, "test/sim_max_reward_4400001": 0.14753945451599904, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.28237376051110225, "test/sim_max_reward_4400006": 0.3491077918225214, "test/sim_max_reward_4400007": 0.9741032076328023, "test/sim_max_reward_4400008": 0.2974127788926182, "test/sim_max_reward_4400009": 0.4636962259415506, "test/sim_max_reward_4400010": 0.3722150828548377, "test/sim_max_reward_4400011": 0.8937799084721376, "test/sim_max_reward_4400012": 0.89809899759675, "test/sim_max_reward_4400013": 0.3281031784808967, "test/sim_max_reward_4400014": 0.8837200814438486, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24055714053123728, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.20538440008137332, "test/sim_max_reward_4400023": 0.9560564305514401, "test/sim_max_reward_4400024": 0.44752807165978625, "test/sim_max_reward_4400025": 0.2508375725843325, "test/sim_max_reward_4400026": 0.956398237641901, "test/sim_max_reward_4400027": 0.06535310400998845, "test/sim_max_reward_4400028": 0.5370267232409529, "test/sim_max_reward_4400029": 0.7012363952047027, "test/sim_max_reward_4400030": 0.9761797096137808, "test/sim_max_reward_4400031": 0.8758487080154652, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.2035753628030097, "test/sim_max_reward_4400034": 0.8557813719031659, "test/sim_max_reward_4400035": 0.464584854284442, "test/sim_max_reward_4400036": 0.7048967271936852, "test/sim_max_reward_4400037": 0.9838898350557927, "test/sim_max_reward_4400038": 0.559526602185115, "test/sim_max_reward_4400039": 0.8407141629098799, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9008076813740158, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.8162889029875143, "test/sim_max_reward_4400044": 0.9379882849932349, "test/sim_max_reward_4400045": 0.8396248443160474, "test/sim_max_reward_4400046": 0.403606770678511, "test/sim_max_reward_4400047": 0.6922937514483286, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8113935159397996, "train/mean_score": 0.5205236531175844, "test/mean_score": 0.5121381178268659, "val_loss": 68053.2734375} {"train_loss": -6.430423259735107, "global_step": 102942, "epoch": 2451} {"train_loss": -6.443246364593506, "global_step": 102943, "epoch": 2451} {"train_loss": -6.212440490722656, "global_step": 102944, "epoch": 2451} {"train_loss": -6.431734085083008, "global_step": 102945, "epoch": 2451} {"train_loss": -6.320289611816406, "global_step": 102946, "epoch": 2451} {"train_loss": -6.262429237365723, "global_step": 102947, "epoch": 2451} {"train_loss": -6.491155624389648, "global_step": 102948, "epoch": 2451} {"train_loss": -6.47724723815918, "global_step": 102949, "epoch": 2451} {"train_loss": -6.312585830688477, "global_step": 102950, "epoch": 2451} {"train_loss": -6.423070430755615, "global_step": 102951, "epoch": 2451} {"train_loss": -6.274048328399658, "global_step": 102952, "epoch": 2451} {"train_loss": -6.3940510749816895, "global_step": 102953, "epoch": 2451} {"train_loss": -6.367022514343262, "global_step": 102954, "epoch": 2451} {"train_loss": -6.24125862121582, "global_step": 102955, "epoch": 2451} {"train_loss": -6.37244987487793, "global_step": 102956, "epoch": 2451} {"train_loss": -6.441076278686523, "global_step": 102957, "epoch": 2451} {"train_loss": -6.289555549621582, "global_step": 102958, "epoch": 2451} {"train_loss": -6.363980770111084, "global_step": 102959, "epoch": 2451} {"train_loss": -6.382915496826172, "global_step": 102960, "epoch": 2451} {"train_loss": -6.343713283538818, "global_step": 102961, "epoch": 2451} {"train_loss": -6.3779296875, "global_step": 102962, "epoch": 2451} {"train_loss": -6.311225891113281, "global_step": 102963, "epoch": 2451} {"train_loss": -6.37044620513916, "global_step": 102964, "epoch": 2451} {"train_loss": -6.365039348602295, "global_step": 102965, "epoch": 2451} {"train_loss": -6.274377822875977, "global_step": 102966, "epoch": 2451} {"train_loss": -6.504103183746338, "global_step": 102967, "epoch": 2451} {"train_loss": -6.317996501922607, "global_step": 102968, "epoch": 2451} {"train_loss": -6.339924335479736, "global_step": 102969, "epoch": 2451} {"train_loss": -6.310887813568115, "global_step": 102970, "epoch": 2451} {"train_loss": -6.396234512329102, "global_step": 102971, "epoch": 2451} {"train_loss": -6.462815761566162, "global_step": 102972, "epoch": 2451} {"train_loss": -6.352149963378906, "global_step": 102973, "epoch": 2451} {"train_loss": -6.3553266525268555, "global_step": 102974, "epoch": 2451} {"train_loss": -6.447896957397461, "global_step": 102975, "epoch": 2451} {"train_loss": -6.433845520019531, "global_step": 102976, "epoch": 2451} {"train_loss": -6.317264080047607, "global_step": 102977, "epoch": 2451} {"train_loss": -6.418980598449707, "global_step": 102978, "epoch": 2451} {"train_loss": -6.215765953063965, "global_step": 102979, "epoch": 2451} {"train_loss": -6.332863807678223, "global_step": 102980, "epoch": 2451} {"train_loss": -6.260166168212891, "global_step": 102981, "epoch": 2451} {"train_loss": -6.226918697357178, "global_step": 102982, "epoch": 2451} {"train_loss": -6.357661724090576, "global_step": 102983, "epoch": 2451, "val_loss": 67890.84375} {"train_loss": -6.4278059005737305, "global_step": 102984, "epoch": 2452} {"train_loss": -6.397182464599609, "global_step": 102985, "epoch": 2452} {"train_loss": -6.257204055786133, "global_step": 102986, "epoch": 2452} {"train_loss": -6.3506574630737305, "global_step": 102987, "epoch": 2452} {"train_loss": -6.3646955490112305, "global_step": 102988, "epoch": 2452} {"train_loss": -6.358061790466309, "global_step": 102989, "epoch": 2452} {"train_loss": -6.336284637451172, "global_step": 102990, "epoch": 2452} {"train_loss": -6.318606853485107, "global_step": 102991, "epoch": 2452} {"train_loss": -6.358473777770996, "global_step": 102992, "epoch": 2452} {"train_loss": -6.381712436676025, "global_step": 102993, "epoch": 2452} {"train_loss": -6.43094539642334, "global_step": 102994, "epoch": 2452} {"train_loss": -6.42864990234375, "global_step": 102995, "epoch": 2452} {"train_loss": -6.415763854980469, "global_step": 102996, "epoch": 2452} {"train_loss": -6.254214286804199, "global_step": 102997, "epoch": 2452} {"train_loss": -6.4303460121154785, "global_step": 102998, "epoch": 2452} {"train_loss": -6.364825248718262, "global_step": 102999, "epoch": 2452} {"train_loss": -6.465682506561279, "global_step": 103000, "epoch": 2452} {"train_loss": -6.43533992767334, "global_step": 103001, "epoch": 2452} {"train_loss": -6.410099029541016, "global_step": 103002, "epoch": 2452} {"train_loss": -6.4110565185546875, "global_step": 103003, "epoch": 2452} {"train_loss": -6.355276107788086, "global_step": 103004, "epoch": 2452} {"train_loss": -6.366690635681152, "global_step": 103005, "epoch": 2452} {"train_loss": -6.39483642578125, "global_step": 103006, "epoch": 2452} {"train_loss": -6.417187213897705, "global_step": 103007, "epoch": 2452} {"train_loss": -6.314215660095215, "global_step": 103008, "epoch": 2452} {"train_loss": -6.437737464904785, "global_step": 103009, "epoch": 2452} {"train_loss": -6.3385515213012695, "global_step": 103010, "epoch": 2452} {"train_loss": -6.251518249511719, "global_step": 103011, "epoch": 2452} {"train_loss": -6.3067193031311035, "global_step": 103012, "epoch": 2452} {"train_loss": -6.2933502197265625, "global_step": 103013, "epoch": 2452} {"train_loss": -6.281455039978027, "global_step": 103014, "epoch": 2452} {"train_loss": -6.366522312164307, "global_step": 103015, "epoch": 2452} {"train_loss": -6.444730758666992, "global_step": 103016, "epoch": 2452} {"train_loss": -6.309612274169922, "global_step": 103017, "epoch": 2452} {"train_loss": -6.351110935211182, "global_step": 103018, "epoch": 2452} {"train_loss": -6.299407005310059, "global_step": 103019, "epoch": 2452} {"train_loss": -6.430391311645508, "global_step": 103020, "epoch": 2452} {"train_loss": -6.344362258911133, "global_step": 103021, "epoch": 2452} {"train_loss": -6.3271989822387695, "global_step": 103022, "epoch": 2452} {"train_loss": -6.408339023590088, "global_step": 103023, "epoch": 2452} {"train_loss": -6.424235820770264, "global_step": 103024, "epoch": 2452} {"train_loss": -6.366932324000767, "global_step": 103025, "epoch": 2452, "val_loss": 67814.359375} {"train_loss": -6.275957107543945, "global_step": 103026, "epoch": 2453} {"train_loss": -6.334610462188721, "global_step": 103027, "epoch": 2453} {"train_loss": -6.488709449768066, "global_step": 103028, "epoch": 2453} {"train_loss": -6.367690086364746, "global_step": 103029, "epoch": 2453} {"train_loss": -6.342123985290527, "global_step": 103030, "epoch": 2453} {"train_loss": -6.463072776794434, "global_step": 103031, "epoch": 2453} {"train_loss": -6.558615684509277, "global_step": 103032, "epoch": 2453} {"train_loss": -6.261264801025391, "global_step": 103033, "epoch": 2453} {"train_loss": -6.4576640129089355, "global_step": 103034, "epoch": 2453} {"train_loss": -6.372565746307373, "global_step": 103035, "epoch": 2453} {"train_loss": -6.341097831726074, "global_step": 103036, "epoch": 2453} {"train_loss": -6.380236625671387, "global_step": 103037, "epoch": 2453} {"train_loss": -6.3733015060424805, "global_step": 103038, "epoch": 2453} {"train_loss": -6.4825897216796875, "global_step": 103039, "epoch": 2453} {"train_loss": -6.453879356384277, "global_step": 103040, "epoch": 2453} {"train_loss": -6.365604400634766, "global_step": 103041, "epoch": 2453} {"train_loss": -6.393324375152588, "global_step": 103042, "epoch": 2453} {"train_loss": -6.357454299926758, "global_step": 103043, "epoch": 2453} {"train_loss": -6.334047794342041, "global_step": 103044, "epoch": 2453} {"train_loss": -6.410587310791016, "global_step": 103045, "epoch": 2453} {"train_loss": -6.380218505859375, "global_step": 103046, "epoch": 2453} {"train_loss": -6.373493194580078, "global_step": 103047, "epoch": 2453} {"train_loss": -6.375744819641113, "global_step": 103048, "epoch": 2453} {"train_loss": -6.3017072677612305, "global_step": 103049, "epoch": 2453} {"train_loss": -6.4388556480407715, "global_step": 103050, "epoch": 2453} {"train_loss": -6.318921089172363, "global_step": 103051, "epoch": 2453} {"train_loss": -6.410342693328857, "global_step": 103052, "epoch": 2453} {"train_loss": -6.359671592712402, "global_step": 103053, "epoch": 2453} {"train_loss": -6.326782703399658, "global_step": 103054, "epoch": 2453} {"train_loss": -6.441854000091553, "global_step": 103055, "epoch": 2453} {"train_loss": -6.489928722381592, "global_step": 103056, "epoch": 2453} {"train_loss": -6.455824851989746, "global_step": 103057, "epoch": 2453} {"train_loss": -6.387893199920654, "global_step": 103058, "epoch": 2453} {"train_loss": -6.390841484069824, "global_step": 103059, "epoch": 2453} {"train_loss": -6.314193248748779, "global_step": 103060, "epoch": 2453} {"train_loss": -6.490391731262207, "global_step": 103061, "epoch": 2453} {"train_loss": -6.353672981262207, "global_step": 103062, "epoch": 2453} {"train_loss": -6.444610595703125, "global_step": 103063, "epoch": 2453} {"train_loss": -6.435389041900635, "global_step": 103064, "epoch": 2453} {"train_loss": -6.303784370422363, "global_step": 103065, "epoch": 2453} {"train_loss": -6.3711161613464355, "global_step": 103066, "epoch": 2453} {"train_loss": -6.390268836702619, "global_step": 103067, "epoch": 2453, "val_loss": 67978.75} {"train_loss": -6.454252243041992, "global_step": 103068, "epoch": 2454} {"train_loss": -6.319338798522949, "global_step": 103069, "epoch": 2454} {"train_loss": -6.380475044250488, "global_step": 103070, "epoch": 2454} {"train_loss": -6.330067157745361, "global_step": 103071, "epoch": 2454} {"train_loss": -6.486678123474121, "global_step": 103072, "epoch": 2454} {"train_loss": -6.543574333190918, "global_step": 103073, "epoch": 2454} {"train_loss": -6.476747035980225, "global_step": 103074, "epoch": 2454} {"train_loss": -6.427035331726074, "global_step": 103075, "epoch": 2454} {"train_loss": -6.407463073730469, "global_step": 103076, "epoch": 2454} {"train_loss": -6.3466596603393555, "global_step": 103077, "epoch": 2454} {"train_loss": -6.412163734436035, "global_step": 103078, "epoch": 2454} {"train_loss": -6.476912021636963, "global_step": 103079, "epoch": 2454} {"train_loss": -6.451934814453125, "global_step": 103080, "epoch": 2454} {"train_loss": -6.423303604125977, "global_step": 103081, "epoch": 2454} {"train_loss": -6.380669593811035, "global_step": 103082, "epoch": 2454} {"train_loss": -6.280661582946777, "global_step": 103083, "epoch": 2454} {"train_loss": -6.305436611175537, "global_step": 103084, "epoch": 2454} {"train_loss": -6.410898208618164, "global_step": 103085, "epoch": 2454} {"train_loss": -6.219995975494385, "global_step": 103086, "epoch": 2454} {"train_loss": -6.333244323730469, "global_step": 103087, "epoch": 2454} {"train_loss": -6.273825168609619, "global_step": 103088, "epoch": 2454} {"train_loss": -6.2059326171875, "global_step": 103089, "epoch": 2454} {"train_loss": -6.32324743270874, "global_step": 103090, "epoch": 2454} {"train_loss": -6.318816661834717, "global_step": 103091, "epoch": 2454} {"train_loss": -6.354139804840088, "global_step": 103092, "epoch": 2454} {"train_loss": -6.352835655212402, "global_step": 103093, "epoch": 2454} {"train_loss": -6.382465362548828, "global_step": 103094, "epoch": 2454} {"train_loss": -6.363493919372559, "global_step": 103095, "epoch": 2454} {"train_loss": -6.402677059173584, "global_step": 103096, "epoch": 2454} {"train_loss": -6.30689001083374, "global_step": 103097, "epoch": 2454} {"train_loss": -6.3736419677734375, "global_step": 103098, "epoch": 2454} {"train_loss": -6.392278671264648, "global_step": 103099, "epoch": 2454} {"train_loss": -6.363097667694092, "global_step": 103100, "epoch": 2454} {"train_loss": -6.406785011291504, "global_step": 103101, "epoch": 2454} {"train_loss": -6.330771446228027, "global_step": 103102, "epoch": 2454} {"train_loss": -6.427173614501953, "global_step": 103103, "epoch": 2454} {"train_loss": -6.426706314086914, "global_step": 103104, "epoch": 2454} {"train_loss": -6.287430763244629, "global_step": 103105, "epoch": 2454} {"train_loss": -6.314184188842773, "global_step": 103106, "epoch": 2454} {"train_loss": -6.399649620056152, "global_step": 103107, "epoch": 2454} {"train_loss": -6.260678768157959, "global_step": 103108, "epoch": 2454} {"train_loss": -6.370601097742717, "global_step": 103109, "epoch": 2454, "val_loss": 67780.7578125} {"train_loss": -6.419544219970703, "global_step": 103110, "epoch": 2455} {"train_loss": -6.482620716094971, "global_step": 103111, "epoch": 2455} {"train_loss": -6.476981163024902, "global_step": 103112, "epoch": 2455} {"train_loss": -6.432374954223633, "global_step": 103113, "epoch": 2455} {"train_loss": -6.3012166023254395, "global_step": 103114, "epoch": 2455} {"train_loss": -6.406859874725342, "global_step": 103115, "epoch": 2455} {"train_loss": -6.509143829345703, "global_step": 103116, "epoch": 2455} {"train_loss": -6.3073201179504395, "global_step": 103117, "epoch": 2455} {"train_loss": -6.372747421264648, "global_step": 103118, "epoch": 2455} {"train_loss": -6.461911201477051, "global_step": 103119, "epoch": 2455} {"train_loss": -6.380825042724609, "global_step": 103120, "epoch": 2455} {"train_loss": -6.380146026611328, "global_step": 103121, "epoch": 2455} {"train_loss": -6.32417106628418, "global_step": 103122, "epoch": 2455} {"train_loss": -6.39547061920166, "global_step": 103123, "epoch": 2455} {"train_loss": -6.282134532928467, "global_step": 103124, "epoch": 2455} {"train_loss": -6.493628025054932, "global_step": 103125, "epoch": 2455} {"train_loss": -6.348836898803711, "global_step": 103126, "epoch": 2455} {"train_loss": -6.2903971672058105, "global_step": 103127, "epoch": 2455} {"train_loss": -6.3717122077941895, "global_step": 103128, "epoch": 2455} {"train_loss": -6.384899616241455, "global_step": 103129, "epoch": 2455} {"train_loss": -6.299365997314453, "global_step": 103130, "epoch": 2455} {"train_loss": -6.454638481140137, "global_step": 103131, "epoch": 2455} {"train_loss": -6.371514320373535, "global_step": 103132, "epoch": 2455} {"train_loss": -6.349931716918945, "global_step": 103133, "epoch": 2455} {"train_loss": -6.370062828063965, "global_step": 103134, "epoch": 2455} {"train_loss": -6.367143630981445, "global_step": 103135, "epoch": 2455} {"train_loss": -6.305464267730713, "global_step": 103136, "epoch": 2455} {"train_loss": -6.366311550140381, "global_step": 103137, "epoch": 2455} {"train_loss": -6.394765853881836, "global_step": 103138, "epoch": 2455} {"train_loss": -6.362891674041748, "global_step": 103139, "epoch": 2455} {"train_loss": -6.257114887237549, "global_step": 103140, "epoch": 2455} {"train_loss": -6.401656150817871, "global_step": 103141, "epoch": 2455} {"train_loss": -6.320376396179199, "global_step": 103142, "epoch": 2455} {"train_loss": -6.295038223266602, "global_step": 103143, "epoch": 2455} {"train_loss": -6.280681610107422, "global_step": 103144, "epoch": 2455} {"train_loss": -6.34526252746582, "global_step": 103145, "epoch": 2455} {"train_loss": -6.282913684844971, "global_step": 103146, "epoch": 2455} {"train_loss": -6.2732086181640625, "global_step": 103147, "epoch": 2455} {"train_loss": -6.382356643676758, "global_step": 103148, "epoch": 2455} {"train_loss": -6.335413932800293, "global_step": 103149, "epoch": 2455} {"train_loss": -6.338013172149658, "global_step": 103150, "epoch": 2455} {"train_loss": -6.366199879419236, "global_step": 103151, "epoch": 2455, "val_loss": 67827.984375} {"train_loss": -6.397054672241211, "global_step": 103152, "epoch": 2456} {"train_loss": -6.36599063873291, "global_step": 103153, "epoch": 2456} {"train_loss": -6.273460865020752, "global_step": 103154, "epoch": 2456} {"train_loss": -6.280454635620117, "global_step": 103155, "epoch": 2456} {"train_loss": -6.395766735076904, "global_step": 103156, "epoch": 2456} {"train_loss": -6.430795669555664, "global_step": 103157, "epoch": 2456} {"train_loss": -6.422289848327637, "global_step": 103158, "epoch": 2456} {"train_loss": -6.3418660163879395, "global_step": 103159, "epoch": 2456} {"train_loss": -6.151861190795898, "global_step": 103160, "epoch": 2456} {"train_loss": -6.283405780792236, "global_step": 103161, "epoch": 2456} {"train_loss": -6.36296272277832, "global_step": 103162, "epoch": 2456} {"train_loss": -6.329949378967285, "global_step": 103163, "epoch": 2456} {"train_loss": -6.30604362487793, "global_step": 103164, "epoch": 2456} {"train_loss": -6.387083053588867, "global_step": 103165, "epoch": 2456} {"train_loss": -6.454850196838379, "global_step": 103166, "epoch": 2456} {"train_loss": -6.3094587326049805, "global_step": 103167, "epoch": 2456} {"train_loss": -6.190998077392578, "global_step": 103168, "epoch": 2456} {"train_loss": -6.335818767547607, "global_step": 103169, "epoch": 2456} {"train_loss": -6.39081335067749, "global_step": 103170, "epoch": 2456} {"train_loss": -6.251287460327148, "global_step": 103171, "epoch": 2456} {"train_loss": -6.333370208740234, "global_step": 103172, "epoch": 2456} {"train_loss": -6.375003814697266, "global_step": 103173, "epoch": 2456} {"train_loss": -6.390900135040283, "global_step": 103174, "epoch": 2456} {"train_loss": -6.230759620666504, "global_step": 103175, "epoch": 2456} {"train_loss": -6.46626615524292, "global_step": 103176, "epoch": 2456} {"train_loss": -6.365322113037109, "global_step": 103177, "epoch": 2456} {"train_loss": -6.391551494598389, "global_step": 103178, "epoch": 2456} {"train_loss": -6.263141632080078, "global_step": 103179, "epoch": 2456} {"train_loss": -6.365268707275391, "global_step": 103180, "epoch": 2456} {"train_loss": -6.413764476776123, "global_step": 103181, "epoch": 2456} {"train_loss": -6.363621711730957, "global_step": 103182, "epoch": 2456} {"train_loss": -6.293300628662109, "global_step": 103183, "epoch": 2456} {"train_loss": -6.358038902282715, "global_step": 103184, "epoch": 2456} {"train_loss": -6.280280590057373, "global_step": 103185, "epoch": 2456} {"train_loss": -6.4439802169799805, "global_step": 103186, "epoch": 2456} {"train_loss": -6.3086700439453125, "global_step": 103187, "epoch": 2456} {"train_loss": -6.463199138641357, "global_step": 103188, "epoch": 2456} {"train_loss": -6.357837200164795, "global_step": 103189, "epoch": 2456} {"train_loss": -6.390727996826172, "global_step": 103190, "epoch": 2456} {"train_loss": -6.443122386932373, "global_step": 103191, "epoch": 2456} {"train_loss": -6.383306980133057, "global_step": 103192, "epoch": 2456} {"train_loss": -6.350498244875953, "global_step": 103193, "epoch": 2456, "val_loss": 67776.671875} {"train_loss": -6.414964199066162, "global_step": 103194, "epoch": 2457} {"train_loss": -6.383533477783203, "global_step": 103195, "epoch": 2457} {"train_loss": -6.316120624542236, "global_step": 103196, "epoch": 2457} {"train_loss": -6.470579147338867, "global_step": 103197, "epoch": 2457} {"train_loss": -6.458075523376465, "global_step": 103198, "epoch": 2457} {"train_loss": -6.435917854309082, "global_step": 103199, "epoch": 2457} {"train_loss": -6.463031768798828, "global_step": 103200, "epoch": 2457} {"train_loss": -6.277181625366211, "global_step": 103201, "epoch": 2457} {"train_loss": -6.3054938316345215, "global_step": 103202, "epoch": 2457} {"train_loss": -6.382763385772705, "global_step": 103203, "epoch": 2457} {"train_loss": -6.354151725769043, "global_step": 103204, "epoch": 2457} {"train_loss": -6.304198265075684, "global_step": 103205, "epoch": 2457} {"train_loss": -6.527984619140625, "global_step": 103206, "epoch": 2457} {"train_loss": -6.302018642425537, "global_step": 103207, "epoch": 2457} {"train_loss": -6.3096418380737305, "global_step": 103208, "epoch": 2457} {"train_loss": -6.426341533660889, "global_step": 103209, "epoch": 2457} {"train_loss": -6.343292713165283, "global_step": 103210, "epoch": 2457} {"train_loss": -6.323028087615967, "global_step": 103211, "epoch": 2457} {"train_loss": -6.439900875091553, "global_step": 103212, "epoch": 2457} {"train_loss": -6.177484512329102, "global_step": 103213, "epoch": 2457} {"train_loss": -6.416443347930908, "global_step": 103214, "epoch": 2457} {"train_loss": -6.2906999588012695, "global_step": 103215, "epoch": 2457} {"train_loss": -6.3276190757751465, "global_step": 103216, "epoch": 2457} {"train_loss": -6.34631872177124, "global_step": 103217, "epoch": 2457} {"train_loss": -6.352657318115234, "global_step": 103218, "epoch": 2457} {"train_loss": -6.401339054107666, "global_step": 103219, "epoch": 2457} {"train_loss": -6.3764190673828125, "global_step": 103220, "epoch": 2457} {"train_loss": -6.3528571128845215, "global_step": 103221, "epoch": 2457} {"train_loss": -6.261048316955566, "global_step": 103222, "epoch": 2457} {"train_loss": -6.507054328918457, "global_step": 103223, "epoch": 2457} {"train_loss": -6.328592300415039, "global_step": 103224, "epoch": 2457} {"train_loss": -6.281320571899414, "global_step": 103225, "epoch": 2457} {"train_loss": -6.276064872741699, "global_step": 103226, "epoch": 2457} {"train_loss": -6.390661239624023, "global_step": 103227, "epoch": 2457} {"train_loss": -6.33775520324707, "global_step": 103228, "epoch": 2457} {"train_loss": -6.444270610809326, "global_step": 103229, "epoch": 2457} {"train_loss": -6.421995162963867, "global_step": 103230, "epoch": 2457} {"train_loss": -6.322247505187988, "global_step": 103231, "epoch": 2457} {"train_loss": -6.322327613830566, "global_step": 103232, "epoch": 2457} {"train_loss": -6.406956672668457, "global_step": 103233, "epoch": 2457} {"train_loss": -6.255704402923584, "global_step": 103234, "epoch": 2457} {"train_loss": -6.361978735242571, "global_step": 103235, "epoch": 2457, "val_loss": 67919.5390625} {"train_loss": -6.415064811706543, "global_step": 103236, "epoch": 2458} {"train_loss": -6.348145961761475, "global_step": 103237, "epoch": 2458} {"train_loss": -6.399069786071777, "global_step": 103238, "epoch": 2458} {"train_loss": -6.411038398742676, "global_step": 103239, "epoch": 2458} {"train_loss": -6.4248528480529785, "global_step": 103240, "epoch": 2458} {"train_loss": -6.411528587341309, "global_step": 103241, "epoch": 2458} {"train_loss": -6.398628234863281, "global_step": 103242, "epoch": 2458} {"train_loss": -6.4444379806518555, "global_step": 103243, "epoch": 2458} {"train_loss": -6.33821439743042, "global_step": 103244, "epoch": 2458} {"train_loss": -6.297077178955078, "global_step": 103245, "epoch": 2458} {"train_loss": -6.481175422668457, "global_step": 103246, "epoch": 2458} {"train_loss": -6.312997817993164, "global_step": 103247, "epoch": 2458} {"train_loss": -6.402594566345215, "global_step": 103248, "epoch": 2458} {"train_loss": -6.416599750518799, "global_step": 103249, "epoch": 2458} {"train_loss": -6.320880889892578, "global_step": 103250, "epoch": 2458} {"train_loss": -6.418190002441406, "global_step": 103251, "epoch": 2458} {"train_loss": -6.402219772338867, "global_step": 103252, "epoch": 2458} {"train_loss": -6.324738025665283, "global_step": 103253, "epoch": 2458} {"train_loss": -6.38629674911499, "global_step": 103254, "epoch": 2458} {"train_loss": -6.410454750061035, "global_step": 103255, "epoch": 2458} {"train_loss": -6.32203483581543, "global_step": 103256, "epoch": 2458} {"train_loss": -6.284286975860596, "global_step": 103257, "epoch": 2458} {"train_loss": -6.380035400390625, "global_step": 103258, "epoch": 2458} {"train_loss": -6.344228744506836, "global_step": 103259, "epoch": 2458} {"train_loss": -6.345803260803223, "global_step": 103260, "epoch": 2458} {"train_loss": -6.404984951019287, "global_step": 103261, "epoch": 2458} {"train_loss": -6.306854724884033, "global_step": 103262, "epoch": 2458} {"train_loss": -6.290517807006836, "global_step": 103263, "epoch": 2458} {"train_loss": -6.40116024017334, "global_step": 103264, "epoch": 2458} {"train_loss": -6.3314032554626465, "global_step": 103265, "epoch": 2458} {"train_loss": -6.397246360778809, "global_step": 103266, "epoch": 2458} {"train_loss": -6.366385459899902, "global_step": 103267, "epoch": 2458} {"train_loss": -6.366174697875977, "global_step": 103268, "epoch": 2458} {"train_loss": -6.3310394287109375, "global_step": 103269, "epoch": 2458} {"train_loss": -6.340415000915527, "global_step": 103270, "epoch": 2458} {"train_loss": -6.396208763122559, "global_step": 103271, "epoch": 2458} {"train_loss": -6.301113605499268, "global_step": 103272, "epoch": 2458} {"train_loss": -6.324899196624756, "global_step": 103273, "epoch": 2458} {"train_loss": -6.383487701416016, "global_step": 103274, "epoch": 2458} {"train_loss": -6.54773473739624, "global_step": 103275, "epoch": 2458} {"train_loss": -6.375266075134277, "global_step": 103276, "epoch": 2458} {"train_loss": -6.373885745093936, "global_step": 103277, "epoch": 2458, "val_loss": 67977.015625} {"train_loss": -6.308286666870117, "global_step": 103278, "epoch": 2459} {"train_loss": -6.440045356750488, "global_step": 103279, "epoch": 2459} {"train_loss": -6.4424262046813965, "global_step": 103280, "epoch": 2459} {"train_loss": -6.378406524658203, "global_step": 103281, "epoch": 2459} {"train_loss": -6.433703422546387, "global_step": 103282, "epoch": 2459} {"train_loss": -6.501975059509277, "global_step": 103283, "epoch": 2459} {"train_loss": -6.298166751861572, "global_step": 103284, "epoch": 2459} {"train_loss": -6.388628005981445, "global_step": 103285, "epoch": 2459} {"train_loss": -6.331567287445068, "global_step": 103286, "epoch": 2459} {"train_loss": -6.274777412414551, "global_step": 103287, "epoch": 2459} {"train_loss": -6.41407585144043, "global_step": 103288, "epoch": 2459} {"train_loss": -6.32236385345459, "global_step": 103289, "epoch": 2459} {"train_loss": -6.4267401695251465, "global_step": 103290, "epoch": 2459} {"train_loss": -6.292977333068848, "global_step": 103291, "epoch": 2459} {"train_loss": -6.284834861755371, "global_step": 103292, "epoch": 2459} {"train_loss": -6.266172409057617, "global_step": 103293, "epoch": 2459} {"train_loss": -6.30911922454834, "global_step": 103294, "epoch": 2459} {"train_loss": -6.4064531326293945, "global_step": 103295, "epoch": 2459} {"train_loss": -6.4115777015686035, "global_step": 103296, "epoch": 2459} {"train_loss": -6.324237823486328, "global_step": 103297, "epoch": 2459} {"train_loss": -6.436090469360352, "global_step": 103298, "epoch": 2459} {"train_loss": -6.431483268737793, "global_step": 103299, "epoch": 2459} {"train_loss": -6.258379936218262, "global_step": 103300, "epoch": 2459} {"train_loss": -6.3636016845703125, "global_step": 103301, "epoch": 2459} {"train_loss": -6.3980255126953125, "global_step": 103302, "epoch": 2459} {"train_loss": -6.291110038757324, "global_step": 103303, "epoch": 2459} {"train_loss": -6.342872619628906, "global_step": 103304, "epoch": 2459} {"train_loss": -6.329640865325928, "global_step": 103305, "epoch": 2459} {"train_loss": -6.332639694213867, "global_step": 103306, "epoch": 2459} {"train_loss": -6.372337341308594, "global_step": 103307, "epoch": 2459} {"train_loss": -6.268107891082764, "global_step": 103308, "epoch": 2459} {"train_loss": -6.477584362030029, "global_step": 103309, "epoch": 2459} {"train_loss": -6.364243507385254, "global_step": 103310, "epoch": 2459} {"train_loss": -6.410273551940918, "global_step": 103311, "epoch": 2459} {"train_loss": -6.374894142150879, "global_step": 103312, "epoch": 2459} {"train_loss": -6.376254081726074, "global_step": 103313, "epoch": 2459} {"train_loss": -6.251135349273682, "global_step": 103314, "epoch": 2459} {"train_loss": -6.390012741088867, "global_step": 103315, "epoch": 2459} {"train_loss": -6.377019882202148, "global_step": 103316, "epoch": 2459} {"train_loss": -6.322218894958496, "global_step": 103317, "epoch": 2459} {"train_loss": -6.324248313903809, "global_step": 103318, "epoch": 2459} {"train_loss": -6.359491836457026, "global_step": 103319, "epoch": 2459, "val_loss": 67962.7421875} {"train_loss": -6.328977584838867, "global_step": 103320, "epoch": 2460} {"train_loss": -6.272182941436768, "global_step": 103321, "epoch": 2460} {"train_loss": -6.387454986572266, "global_step": 103322, "epoch": 2460} {"train_loss": -6.333051681518555, "global_step": 103323, "epoch": 2460} {"train_loss": -6.306704044342041, "global_step": 103324, "epoch": 2460} {"train_loss": -6.425110340118408, "global_step": 103325, "epoch": 2460} {"train_loss": -6.351058006286621, "global_step": 103326, "epoch": 2460} {"train_loss": -6.2781476974487305, "global_step": 103327, "epoch": 2460} {"train_loss": -6.2258453369140625, "global_step": 103328, "epoch": 2460} {"train_loss": -6.33797550201416, "global_step": 103329, "epoch": 2460} {"train_loss": -6.346064567565918, "global_step": 103330, "epoch": 2460} {"train_loss": -6.322259902954102, "global_step": 103331, "epoch": 2460} {"train_loss": -6.428800106048584, "global_step": 103332, "epoch": 2460} {"train_loss": -6.282379150390625, "global_step": 103333, "epoch": 2460} {"train_loss": -6.2628278732299805, "global_step": 103334, "epoch": 2460} {"train_loss": -6.417357444763184, "global_step": 103335, "epoch": 2460} {"train_loss": -6.268207550048828, "global_step": 103336, "epoch": 2460} {"train_loss": -6.486513137817383, "global_step": 103337, "epoch": 2460} {"train_loss": -6.4048943519592285, "global_step": 103338, "epoch": 2460} {"train_loss": -6.270386219024658, "global_step": 103339, "epoch": 2460} {"train_loss": -6.390198230743408, "global_step": 103340, "epoch": 2460} {"train_loss": -6.350926399230957, "global_step": 103341, "epoch": 2460} {"train_loss": -6.313819408416748, "global_step": 103342, "epoch": 2460} {"train_loss": -6.3089752197265625, "global_step": 103343, "epoch": 2460} {"train_loss": -6.380557060241699, "global_step": 103344, "epoch": 2460} {"train_loss": -6.355047225952148, "global_step": 103345, "epoch": 2460} {"train_loss": -6.413046836853027, "global_step": 103346, "epoch": 2460} {"train_loss": -6.348658084869385, "global_step": 103347, "epoch": 2460} {"train_loss": -6.195330619812012, "global_step": 103348, "epoch": 2460} {"train_loss": -6.401422500610352, "global_step": 103349, "epoch": 2460} {"train_loss": -6.258058071136475, "global_step": 103350, "epoch": 2460} {"train_loss": -6.317071914672852, "global_step": 103351, "epoch": 2460} {"train_loss": -6.342358589172363, "global_step": 103352, "epoch": 2460} {"train_loss": -6.251440048217773, "global_step": 103353, "epoch": 2460} {"train_loss": -6.387701988220215, "global_step": 103354, "epoch": 2460} {"train_loss": -6.446294784545898, "global_step": 103355, "epoch": 2460} {"train_loss": -6.331155776977539, "global_step": 103356, "epoch": 2460} {"train_loss": -6.276156425476074, "global_step": 103357, "epoch": 2460} {"train_loss": -6.406108856201172, "global_step": 103358, "epoch": 2460} {"train_loss": -6.495629787445068, "global_step": 103359, "epoch": 2460} {"train_loss": -6.317774772644043, "global_step": 103360, "epoch": 2460} {"train_loss": -6.3431565534500844, "global_step": 103361, "epoch": 2460, "val_loss": 68038.328125} {"train_loss": -6.345208168029785, "global_step": 103362, "epoch": 2461} {"train_loss": -6.319273948669434, "global_step": 103363, "epoch": 2461} {"train_loss": -6.3421244621276855, "global_step": 103364, "epoch": 2461} {"train_loss": -6.398027420043945, "global_step": 103365, "epoch": 2461} {"train_loss": -6.55000638961792, "global_step": 103366, "epoch": 2461} {"train_loss": -6.381557464599609, "global_step": 103367, "epoch": 2461} {"train_loss": -6.270435810089111, "global_step": 103368, "epoch": 2461} {"train_loss": -6.262844085693359, "global_step": 103369, "epoch": 2461} {"train_loss": -6.268773555755615, "global_step": 103370, "epoch": 2461} {"train_loss": -6.397167682647705, "global_step": 103371, "epoch": 2461} {"train_loss": -6.345851898193359, "global_step": 103372, "epoch": 2461} {"train_loss": -6.411322116851807, "global_step": 103373, "epoch": 2461} {"train_loss": -6.426135063171387, "global_step": 103374, "epoch": 2461} {"train_loss": -6.298654556274414, "global_step": 103375, "epoch": 2461} {"train_loss": -6.369994640350342, "global_step": 103376, "epoch": 2461} {"train_loss": -6.34622859954834, "global_step": 103377, "epoch": 2461} {"train_loss": -6.413726329803467, "global_step": 103378, "epoch": 2461} {"train_loss": -6.475862503051758, "global_step": 103379, "epoch": 2461} {"train_loss": -6.308574676513672, "global_step": 103380, "epoch": 2461} {"train_loss": -6.400032043457031, "global_step": 103381, "epoch": 2461} {"train_loss": -6.395926475524902, "global_step": 103382, "epoch": 2461} {"train_loss": -6.33912467956543, "global_step": 103383, "epoch": 2461} {"train_loss": -6.276980400085449, "global_step": 103384, "epoch": 2461} {"train_loss": -6.326938629150391, "global_step": 103385, "epoch": 2461} {"train_loss": -6.423017501831055, "global_step": 103386, "epoch": 2461} {"train_loss": -6.279636383056641, "global_step": 103387, "epoch": 2461} {"train_loss": -6.430542469024658, "global_step": 103388, "epoch": 2461} {"train_loss": -6.254683494567871, "global_step": 103389, "epoch": 2461} {"train_loss": -6.389485836029053, "global_step": 103390, "epoch": 2461} {"train_loss": -6.323488235473633, "global_step": 103391, "epoch": 2461} {"train_loss": -6.258579254150391, "global_step": 103392, "epoch": 2461} {"train_loss": -6.263042449951172, "global_step": 103393, "epoch": 2461} {"train_loss": -6.420931816101074, "global_step": 103394, "epoch": 2461} {"train_loss": -6.35698127746582, "global_step": 103395, "epoch": 2461} {"train_loss": -6.177568435668945, "global_step": 103396, "epoch": 2461} {"train_loss": -6.303572654724121, "global_step": 103397, "epoch": 2461} {"train_loss": -6.282161712646484, "global_step": 103398, "epoch": 2461} {"train_loss": -6.450517654418945, "global_step": 103399, "epoch": 2461} {"train_loss": -6.253540992736816, "global_step": 103400, "epoch": 2461} {"train_loss": -6.360569953918457, "global_step": 103401, "epoch": 2461} {"train_loss": -6.199592590332031, "global_step": 103402, "epoch": 2461} {"train_loss": -6.341123240334647, "global_step": 103403, "epoch": 2461, "val_loss": 67854.765625} {"train_loss": -6.363180160522461, "global_step": 103404, "epoch": 2462} {"train_loss": -6.263916492462158, "global_step": 103405, "epoch": 2462} {"train_loss": -6.362730979919434, "global_step": 103406, "epoch": 2462} {"train_loss": -6.355766296386719, "global_step": 103407, "epoch": 2462} {"train_loss": -6.306446075439453, "global_step": 103408, "epoch": 2462} {"train_loss": -6.384811878204346, "global_step": 103409, "epoch": 2462} {"train_loss": -6.28939151763916, "global_step": 103410, "epoch": 2462} {"train_loss": -6.2855706214904785, "global_step": 103411, "epoch": 2462} {"train_loss": -6.302773952484131, "global_step": 103412, "epoch": 2462} {"train_loss": -6.3404364585876465, "global_step": 103413, "epoch": 2462} {"train_loss": -6.275549411773682, "global_step": 103414, "epoch": 2462} {"train_loss": -6.328719139099121, "global_step": 103415, "epoch": 2462} {"train_loss": -6.362166404724121, "global_step": 103416, "epoch": 2462} {"train_loss": -6.217598915100098, "global_step": 103417, "epoch": 2462} {"train_loss": -6.453646183013916, "global_step": 103418, "epoch": 2462} {"train_loss": -6.359827995300293, "global_step": 103419, "epoch": 2462} {"train_loss": -6.311505317687988, "global_step": 103420, "epoch": 2462} {"train_loss": -6.3649139404296875, "global_step": 103421, "epoch": 2462} {"train_loss": -6.411898612976074, "global_step": 103422, "epoch": 2462} {"train_loss": -6.492449760437012, "global_step": 103423, "epoch": 2462} {"train_loss": -6.3376617431640625, "global_step": 103424, "epoch": 2462} {"train_loss": -6.432652473449707, "global_step": 103425, "epoch": 2462} {"train_loss": -6.46215295791626, "global_step": 103426, "epoch": 2462} {"train_loss": -6.439411640167236, "global_step": 103427, "epoch": 2462} {"train_loss": -6.302491188049316, "global_step": 103428, "epoch": 2462} {"train_loss": -6.5248847007751465, "global_step": 103429, "epoch": 2462} {"train_loss": -6.3693928718566895, "global_step": 103430, "epoch": 2462} {"train_loss": -6.384773254394531, "global_step": 103431, "epoch": 2462} {"train_loss": -6.2996344566345215, "global_step": 103432, "epoch": 2462} {"train_loss": -6.24229621887207, "global_step": 103433, "epoch": 2462} {"train_loss": -6.327122688293457, "global_step": 103434, "epoch": 2462} {"train_loss": -6.343726634979248, "global_step": 103435, "epoch": 2462} {"train_loss": -6.384218215942383, "global_step": 103436, "epoch": 2462} {"train_loss": -6.438418865203857, "global_step": 103437, "epoch": 2462} {"train_loss": -6.358098030090332, "global_step": 103438, "epoch": 2462} {"train_loss": -6.33492374420166, "global_step": 103439, "epoch": 2462} {"train_loss": -6.290797233581543, "global_step": 103440, "epoch": 2462} {"train_loss": -6.342563629150391, "global_step": 103441, "epoch": 2462} {"train_loss": -6.398219108581543, "global_step": 103442, "epoch": 2462} {"train_loss": -6.400479793548584, "global_step": 103443, "epoch": 2462} {"train_loss": -6.471309185028076, "global_step": 103444, "epoch": 2462} {"train_loss": -6.360224644343059, "global_step": 103445, "epoch": 2462, "val_loss": 68025.9140625} {"train_loss": -6.34212589263916, "global_step": 103446, "epoch": 2463} {"train_loss": -6.370621681213379, "global_step": 103447, "epoch": 2463} {"train_loss": -6.411400318145752, "global_step": 103448, "epoch": 2463} {"train_loss": -6.453068733215332, "global_step": 103449, "epoch": 2463} {"train_loss": -6.500977039337158, "global_step": 103450, "epoch": 2463} {"train_loss": -6.37932014465332, "global_step": 103451, "epoch": 2463} {"train_loss": -6.376947402954102, "global_step": 103452, "epoch": 2463} {"train_loss": -6.468533515930176, "global_step": 103453, "epoch": 2463} {"train_loss": -6.2704854011535645, "global_step": 103454, "epoch": 2463} {"train_loss": -6.436245918273926, "global_step": 103455, "epoch": 2463} {"train_loss": -6.456667900085449, "global_step": 103456, "epoch": 2463} {"train_loss": -6.339077949523926, "global_step": 103457, "epoch": 2463} {"train_loss": -6.402254104614258, "global_step": 103458, "epoch": 2463} {"train_loss": -6.447505474090576, "global_step": 103459, "epoch": 2463} {"train_loss": -6.332745552062988, "global_step": 103460, "epoch": 2463} {"train_loss": -6.38918924331665, "global_step": 103461, "epoch": 2463} {"train_loss": -6.386558532714844, "global_step": 103462, "epoch": 2463} {"train_loss": -6.342041015625, "global_step": 103463, "epoch": 2463} {"train_loss": -6.382265090942383, "global_step": 103464, "epoch": 2463} {"train_loss": -6.432336330413818, "global_step": 103465, "epoch": 2463} {"train_loss": -6.519453048706055, "global_step": 103466, "epoch": 2463} {"train_loss": -6.3063130378723145, "global_step": 103467, "epoch": 2463} {"train_loss": -6.238351345062256, "global_step": 103468, "epoch": 2463} {"train_loss": -6.419538497924805, "global_step": 103469, "epoch": 2463} {"train_loss": -6.38743257522583, "global_step": 103470, "epoch": 2463} {"train_loss": -6.405020713806152, "global_step": 103471, "epoch": 2463} {"train_loss": -6.297417640686035, "global_step": 103472, "epoch": 2463} {"train_loss": -6.456212043762207, "global_step": 103473, "epoch": 2463} {"train_loss": -6.388833999633789, "global_step": 103474, "epoch": 2463} {"train_loss": -6.318866729736328, "global_step": 103475, "epoch": 2463} {"train_loss": -6.459602355957031, "global_step": 103476, "epoch": 2463} {"train_loss": -6.363070487976074, "global_step": 103477, "epoch": 2463} {"train_loss": -6.361730575561523, "global_step": 103478, "epoch": 2463} {"train_loss": -6.312829971313477, "global_step": 103479, "epoch": 2463} {"train_loss": -6.301845550537109, "global_step": 103480, "epoch": 2463} {"train_loss": -6.404770851135254, "global_step": 103481, "epoch": 2463} {"train_loss": -6.359738349914551, "global_step": 103482, "epoch": 2463} {"train_loss": -6.469268321990967, "global_step": 103483, "epoch": 2463} {"train_loss": -6.337063789367676, "global_step": 103484, "epoch": 2463} {"train_loss": -6.377558708190918, "global_step": 103485, "epoch": 2463} {"train_loss": -6.329741477966309, "global_step": 103486, "epoch": 2463} {"train_loss": -6.381570850099836, "global_step": 103487, "epoch": 2463, "val_loss": 68121.078125} {"train_loss": -6.31479549407959, "global_step": 103488, "epoch": 2464} {"train_loss": -6.529679298400879, "global_step": 103489, "epoch": 2464} {"train_loss": -6.3798675537109375, "global_step": 103490, "epoch": 2464} {"train_loss": -6.293540954589844, "global_step": 103491, "epoch": 2464} {"train_loss": -6.329639911651611, "global_step": 103492, "epoch": 2464} {"train_loss": -6.238402366638184, "global_step": 103493, "epoch": 2464} {"train_loss": -6.456929683685303, "global_step": 103494, "epoch": 2464} {"train_loss": -6.316974639892578, "global_step": 103495, "epoch": 2464} {"train_loss": -6.1319379806518555, "global_step": 103496, "epoch": 2464} {"train_loss": -6.438863754272461, "global_step": 103497, "epoch": 2464} {"train_loss": -6.1688337326049805, "global_step": 103498, "epoch": 2464} {"train_loss": -6.170570373535156, "global_step": 103499, "epoch": 2464} {"train_loss": -6.252264976501465, "global_step": 103500, "epoch": 2464} {"train_loss": -6.273772239685059, "global_step": 103501, "epoch": 2464} {"train_loss": -6.421758651733398, "global_step": 103502, "epoch": 2464} {"train_loss": -6.237957954406738, "global_step": 103503, "epoch": 2464} {"train_loss": -6.282384872436523, "global_step": 103504, "epoch": 2464} {"train_loss": -6.287213325500488, "global_step": 103505, "epoch": 2464} {"train_loss": -6.3230509757995605, "global_step": 103506, "epoch": 2464} {"train_loss": -6.327247619628906, "global_step": 103507, "epoch": 2464} {"train_loss": -6.307149887084961, "global_step": 103508, "epoch": 2464} {"train_loss": -6.42738151550293, "global_step": 103509, "epoch": 2464} {"train_loss": -6.283329486846924, "global_step": 103510, "epoch": 2464} {"train_loss": -6.440309524536133, "global_step": 103511, "epoch": 2464} {"train_loss": -6.317984104156494, "global_step": 103512, "epoch": 2464} {"train_loss": -6.329617977142334, "global_step": 103513, "epoch": 2464} {"train_loss": -6.428970813751221, "global_step": 103514, "epoch": 2464} {"train_loss": -6.287854194641113, "global_step": 103515, "epoch": 2464} {"train_loss": -6.231572151184082, "global_step": 103516, "epoch": 2464} {"train_loss": -6.417182922363281, "global_step": 103517, "epoch": 2464} {"train_loss": -6.336408615112305, "global_step": 103518, "epoch": 2464} {"train_loss": -6.336766242980957, "global_step": 103519, "epoch": 2464} {"train_loss": -6.394517421722412, "global_step": 103520, "epoch": 2464} {"train_loss": -6.33596134185791, "global_step": 103521, "epoch": 2464} {"train_loss": -6.369077205657959, "global_step": 103522, "epoch": 2464} {"train_loss": -6.395484924316406, "global_step": 103523, "epoch": 2464} {"train_loss": -6.515310764312744, "global_step": 103524, "epoch": 2464} {"train_loss": -6.437869071960449, "global_step": 103525, "epoch": 2464} {"train_loss": -6.326738357543945, "global_step": 103526, "epoch": 2464} {"train_loss": -6.280838489532471, "global_step": 103527, "epoch": 2464} {"train_loss": -6.456529140472412, "global_step": 103528, "epoch": 2464} {"train_loss": -6.33845405351548, "global_step": 103529, "epoch": 2464, "val_loss": 67969.53125} {"train_loss": -6.4238762855529785, "global_step": 103530, "epoch": 2465} {"train_loss": -6.42342472076416, "global_step": 103531, "epoch": 2465} {"train_loss": -6.385028839111328, "global_step": 103532, "epoch": 2465} {"train_loss": -6.568911552429199, "global_step": 103533, "epoch": 2465} {"train_loss": -6.378237724304199, "global_step": 103534, "epoch": 2465} {"train_loss": -6.391155242919922, "global_step": 103535, "epoch": 2465} {"train_loss": -6.427525520324707, "global_step": 103536, "epoch": 2465} {"train_loss": -6.37394905090332, "global_step": 103537, "epoch": 2465} {"train_loss": -6.315759181976318, "global_step": 103538, "epoch": 2465} {"train_loss": -6.284612655639648, "global_step": 103539, "epoch": 2465} {"train_loss": -6.435708522796631, "global_step": 103540, "epoch": 2465} {"train_loss": -6.182147026062012, "global_step": 103541, "epoch": 2465} {"train_loss": -6.433562278747559, "global_step": 103542, "epoch": 2465} {"train_loss": -6.452914714813232, "global_step": 103543, "epoch": 2465} {"train_loss": -6.342766761779785, "global_step": 103544, "epoch": 2465} {"train_loss": -6.278916358947754, "global_step": 103545, "epoch": 2465} {"train_loss": -6.371528148651123, "global_step": 103546, "epoch": 2465} {"train_loss": -6.422342300415039, "global_step": 103547, "epoch": 2465} {"train_loss": -6.396277904510498, "global_step": 103548, "epoch": 2465} {"train_loss": -6.451516151428223, "global_step": 103549, "epoch": 2465} {"train_loss": -6.333069801330566, "global_step": 103550, "epoch": 2465} {"train_loss": -6.313137054443359, "global_step": 103551, "epoch": 2465} {"train_loss": -6.437671184539795, "global_step": 103552, "epoch": 2465} {"train_loss": -6.35870885848999, "global_step": 103553, "epoch": 2465} {"train_loss": -6.378417015075684, "global_step": 103554, "epoch": 2465} {"train_loss": -6.404778957366943, "global_step": 103555, "epoch": 2465} {"train_loss": -6.373826026916504, "global_step": 103556, "epoch": 2465} {"train_loss": -6.440573692321777, "global_step": 103557, "epoch": 2465} {"train_loss": -6.3305864334106445, "global_step": 103558, "epoch": 2465} {"train_loss": -6.209371089935303, "global_step": 103559, "epoch": 2465} {"train_loss": -6.388139247894287, "global_step": 103560, "epoch": 2465} {"train_loss": -6.458339214324951, "global_step": 103561, "epoch": 2465} {"train_loss": -6.423284530639648, "global_step": 103562, "epoch": 2465} {"train_loss": -6.47766637802124, "global_step": 103563, "epoch": 2465} {"train_loss": -6.46104621887207, "global_step": 103564, "epoch": 2465} {"train_loss": -6.380222320556641, "global_step": 103565, "epoch": 2465} {"train_loss": -6.266972541809082, "global_step": 103566, "epoch": 2465} {"train_loss": -6.412838935852051, "global_step": 103567, "epoch": 2465} {"train_loss": -6.309627532958984, "global_step": 103568, "epoch": 2465} {"train_loss": -6.370882987976074, "global_step": 103569, "epoch": 2465} {"train_loss": -6.233579635620117, "global_step": 103570, "epoch": 2465} {"train_loss": -6.377601033165341, "global_step": 103571, "epoch": 2465, "val_loss": 67866.078125} {"train_loss": -6.3613762855529785, "global_step": 103572, "epoch": 2466} {"train_loss": -6.28284215927124, "global_step": 103573, "epoch": 2466} {"train_loss": -6.374161720275879, "global_step": 103574, "epoch": 2466} {"train_loss": -6.264264106750488, "global_step": 103575, "epoch": 2466} {"train_loss": -6.339288234710693, "global_step": 103576, "epoch": 2466} {"train_loss": -6.248866081237793, "global_step": 103577, "epoch": 2466} {"train_loss": -6.312239170074463, "global_step": 103578, "epoch": 2466} {"train_loss": -6.361699104309082, "global_step": 103579, "epoch": 2466} {"train_loss": -6.204999923706055, "global_step": 103580, "epoch": 2466} {"train_loss": -6.356988906860352, "global_step": 103581, "epoch": 2466} {"train_loss": -6.1886887550354, "global_step": 103582, "epoch": 2466} {"train_loss": -6.357030868530273, "global_step": 103583, "epoch": 2466} {"train_loss": -6.238996982574463, "global_step": 103584, "epoch": 2466} {"train_loss": -6.490962982177734, "global_step": 103585, "epoch": 2466} {"train_loss": -6.208981990814209, "global_step": 103586, "epoch": 2466} {"train_loss": -6.325766563415527, "global_step": 103587, "epoch": 2466} {"train_loss": -6.391523361206055, "global_step": 103588, "epoch": 2466} {"train_loss": -6.360357284545898, "global_step": 103589, "epoch": 2466} {"train_loss": -6.370213508605957, "global_step": 103590, "epoch": 2466} {"train_loss": -6.261621475219727, "global_step": 103591, "epoch": 2466} {"train_loss": -6.379850387573242, "global_step": 103592, "epoch": 2466} {"train_loss": -6.3074774742126465, "global_step": 103593, "epoch": 2466} {"train_loss": -6.315924644470215, "global_step": 103594, "epoch": 2466} {"train_loss": -6.3887553215026855, "global_step": 103595, "epoch": 2466} {"train_loss": -6.424091815948486, "global_step": 103596, "epoch": 2466} {"train_loss": -6.389343738555908, "global_step": 103597, "epoch": 2466} {"train_loss": -6.4301557540893555, "global_step": 103598, "epoch": 2466} {"train_loss": -6.297511100769043, "global_step": 103599, "epoch": 2466} {"train_loss": -6.316241264343262, "global_step": 103600, "epoch": 2466} {"train_loss": -6.442778587341309, "global_step": 103601, "epoch": 2466} {"train_loss": -6.245452404022217, "global_step": 103602, "epoch": 2466} {"train_loss": -6.414467811584473, "global_step": 103603, "epoch": 2466} {"train_loss": -6.378426551818848, "global_step": 103604, "epoch": 2466} {"train_loss": -6.379570960998535, "global_step": 103605, "epoch": 2466} {"train_loss": -6.465162754058838, "global_step": 103606, "epoch": 2466} {"train_loss": -6.306205749511719, "global_step": 103607, "epoch": 2466} {"train_loss": -6.436928749084473, "global_step": 103608, "epoch": 2466} {"train_loss": -6.315440654754639, "global_step": 103609, "epoch": 2466} {"train_loss": -6.396535396575928, "global_step": 103610, "epoch": 2466} {"train_loss": -6.400951385498047, "global_step": 103611, "epoch": 2466} {"train_loss": -6.484164714813232, "global_step": 103612, "epoch": 2466} {"train_loss": -6.348090115047636, "global_step": 103613, "epoch": 2466, "val_loss": 67949.8828125} {"train_loss": -6.369631767272949, "global_step": 103614, "epoch": 2467} {"train_loss": -6.405181884765625, "global_step": 103615, "epoch": 2467} {"train_loss": -6.365639686584473, "global_step": 103616, "epoch": 2467} {"train_loss": -6.374377250671387, "global_step": 103617, "epoch": 2467} {"train_loss": -6.471244812011719, "global_step": 103618, "epoch": 2467} {"train_loss": -6.3610944747924805, "global_step": 103619, "epoch": 2467} {"train_loss": -6.320935249328613, "global_step": 103620, "epoch": 2467} {"train_loss": -6.412140846252441, "global_step": 103621, "epoch": 2467} {"train_loss": -6.49629020690918, "global_step": 103622, "epoch": 2467} {"train_loss": -6.39749813079834, "global_step": 103623, "epoch": 2467} {"train_loss": -6.39116907119751, "global_step": 103624, "epoch": 2467} {"train_loss": -6.500059127807617, "global_step": 103625, "epoch": 2467} {"train_loss": -6.223662853240967, "global_step": 103626, "epoch": 2467} {"train_loss": -6.4478440284729, "global_step": 103627, "epoch": 2467} {"train_loss": -6.371302127838135, "global_step": 103628, "epoch": 2467} {"train_loss": -6.278438568115234, "global_step": 103629, "epoch": 2467} {"train_loss": -6.383437156677246, "global_step": 103630, "epoch": 2467} {"train_loss": -6.379111289978027, "global_step": 103631, "epoch": 2467} {"train_loss": -6.3109564781188965, "global_step": 103632, "epoch": 2467} {"train_loss": -6.410200119018555, "global_step": 103633, "epoch": 2467} {"train_loss": -6.341829776763916, "global_step": 103634, "epoch": 2467} {"train_loss": -6.295451641082764, "global_step": 103635, "epoch": 2467} {"train_loss": -6.291414737701416, "global_step": 103636, "epoch": 2467} {"train_loss": -6.414122104644775, "global_step": 103637, "epoch": 2467} {"train_loss": -6.195766448974609, "global_step": 103638, "epoch": 2467} {"train_loss": -6.454424858093262, "global_step": 103639, "epoch": 2467} {"train_loss": -6.297484397888184, "global_step": 103640, "epoch": 2467} {"train_loss": -6.349896430969238, "global_step": 103641, "epoch": 2467} {"train_loss": -6.303134918212891, "global_step": 103642, "epoch": 2467} {"train_loss": -6.316530227661133, "global_step": 103643, "epoch": 2467} {"train_loss": -6.320709228515625, "global_step": 103644, "epoch": 2467} {"train_loss": -6.193023681640625, "global_step": 103645, "epoch": 2467} {"train_loss": -6.384642124176025, "global_step": 103646, "epoch": 2467} {"train_loss": -6.373632431030273, "global_step": 103647, "epoch": 2467} {"train_loss": -6.3194684982299805, "global_step": 103648, "epoch": 2467} {"train_loss": -6.297675132751465, "global_step": 103649, "epoch": 2467} {"train_loss": -6.188488006591797, "global_step": 103650, "epoch": 2467} {"train_loss": -6.30861234664917, "global_step": 103651, "epoch": 2467} {"train_loss": -6.412457466125488, "global_step": 103652, "epoch": 2467} {"train_loss": -6.47303581237793, "global_step": 103653, "epoch": 2467} {"train_loss": -6.405848026275635, "global_step": 103654, "epoch": 2467} {"train_loss": -6.357194480441866, "global_step": 103655, "epoch": 2467, "val_loss": 67972.359375} {"train_loss": -6.248905181884766, "global_step": 103656, "epoch": 2468} {"train_loss": -6.270074367523193, "global_step": 103657, "epoch": 2468} {"train_loss": -6.412550449371338, "global_step": 103658, "epoch": 2468} {"train_loss": -6.414427280426025, "global_step": 103659, "epoch": 2468} {"train_loss": -6.354462146759033, "global_step": 103660, "epoch": 2468} {"train_loss": -6.444286823272705, "global_step": 103661, "epoch": 2468} {"train_loss": -6.384187698364258, "global_step": 103662, "epoch": 2468} {"train_loss": -6.361617565155029, "global_step": 103663, "epoch": 2468} {"train_loss": -6.483330726623535, "global_step": 103664, "epoch": 2468} {"train_loss": -6.387116432189941, "global_step": 103665, "epoch": 2468} {"train_loss": -6.404995918273926, "global_step": 103666, "epoch": 2468} {"train_loss": -6.335883140563965, "global_step": 103667, "epoch": 2468} {"train_loss": -6.335311412811279, "global_step": 103668, "epoch": 2468} {"train_loss": -6.380807876586914, "global_step": 103669, "epoch": 2468} {"train_loss": -6.426103115081787, "global_step": 103670, "epoch": 2468} {"train_loss": -6.471693515777588, "global_step": 103671, "epoch": 2468} {"train_loss": -6.519379615783691, "global_step": 103672, "epoch": 2468} {"train_loss": -6.452047348022461, "global_step": 103673, "epoch": 2468} {"train_loss": -6.399631500244141, "global_step": 103674, "epoch": 2468} {"train_loss": -6.380311965942383, "global_step": 103675, "epoch": 2468} {"train_loss": -6.372682571411133, "global_step": 103676, "epoch": 2468} {"train_loss": -6.296005725860596, "global_step": 103677, "epoch": 2468} {"train_loss": -6.371387481689453, "global_step": 103678, "epoch": 2468} {"train_loss": -6.375310897827148, "global_step": 103679, "epoch": 2468} {"train_loss": -6.286741733551025, "global_step": 103680, "epoch": 2468} {"train_loss": -6.212624549865723, "global_step": 103681, "epoch": 2468} {"train_loss": -6.353213310241699, "global_step": 103682, "epoch": 2468} {"train_loss": -6.395504951477051, "global_step": 103683, "epoch": 2468} {"train_loss": -6.237414360046387, "global_step": 103684, "epoch": 2468} {"train_loss": -6.198385715484619, "global_step": 103685, "epoch": 2468} {"train_loss": -6.321754455566406, "global_step": 103686, "epoch": 2468} {"train_loss": -6.309520721435547, "global_step": 103687, "epoch": 2468} {"train_loss": -6.376425743103027, "global_step": 103688, "epoch": 2468} {"train_loss": -6.343845367431641, "global_step": 103689, "epoch": 2468} {"train_loss": -6.377560615539551, "global_step": 103690, "epoch": 2468} {"train_loss": -6.253817558288574, "global_step": 103691, "epoch": 2468} {"train_loss": -6.33465576171875, "global_step": 103692, "epoch": 2468} {"train_loss": -6.384078025817871, "global_step": 103693, "epoch": 2468} {"train_loss": -6.325965881347656, "global_step": 103694, "epoch": 2468} {"train_loss": -6.321447372436523, "global_step": 103695, "epoch": 2468} {"train_loss": -6.379639625549316, "global_step": 103696, "epoch": 2468} {"train_loss": -6.356874897366478, "global_step": 103697, "epoch": 2468, "val_loss": 67864.203125} {"train_loss": -6.340163230895996, "global_step": 103698, "epoch": 2469} {"train_loss": -6.397988319396973, "global_step": 103699, "epoch": 2469} {"train_loss": -6.398899555206299, "global_step": 103700, "epoch": 2469} {"train_loss": -6.299847602844238, "global_step": 103701, "epoch": 2469} {"train_loss": -6.442285537719727, "global_step": 103702, "epoch": 2469} {"train_loss": -6.312019348144531, "global_step": 103703, "epoch": 2469} {"train_loss": -6.221088409423828, "global_step": 103704, "epoch": 2469} {"train_loss": -6.344099998474121, "global_step": 103705, "epoch": 2469} {"train_loss": -6.400543212890625, "global_step": 103706, "epoch": 2469} {"train_loss": -6.3079447746276855, "global_step": 103707, "epoch": 2469} {"train_loss": -6.290549278259277, "global_step": 103708, "epoch": 2469} {"train_loss": -6.396641254425049, "global_step": 103709, "epoch": 2469} {"train_loss": -6.3299665451049805, "global_step": 103710, "epoch": 2469} {"train_loss": -6.231972694396973, "global_step": 103711, "epoch": 2469} {"train_loss": -6.402353286743164, "global_step": 103712, "epoch": 2469} {"train_loss": -6.273738861083984, "global_step": 103713, "epoch": 2469} {"train_loss": -6.29168701171875, "global_step": 103714, "epoch": 2469} {"train_loss": -6.359801292419434, "global_step": 103715, "epoch": 2469} {"train_loss": -6.1287007331848145, "global_step": 103716, "epoch": 2469} {"train_loss": -6.362884521484375, "global_step": 103717, "epoch": 2469} {"train_loss": -6.19265079498291, "global_step": 103718, "epoch": 2469} {"train_loss": -6.192564010620117, "global_step": 103719, "epoch": 2469} {"train_loss": -6.272139549255371, "global_step": 103720, "epoch": 2469} {"train_loss": -6.059815406799316, "global_step": 103721, "epoch": 2469} {"train_loss": -6.379156112670898, "global_step": 103722, "epoch": 2469} {"train_loss": -6.008058071136475, "global_step": 103723, "epoch": 2469} {"train_loss": -6.359589576721191, "global_step": 103724, "epoch": 2469} {"train_loss": -6.090227127075195, "global_step": 103725, "epoch": 2469} {"train_loss": -6.419100761413574, "global_step": 103726, "epoch": 2469} {"train_loss": -6.0823469161987305, "global_step": 103727, "epoch": 2469} {"train_loss": -6.203706741333008, "global_step": 103728, "epoch": 2469} {"train_loss": -6.305262565612793, "global_step": 103729, "epoch": 2469} {"train_loss": -6.21356201171875, "global_step": 103730, "epoch": 2469} {"train_loss": -6.236793518066406, "global_step": 103731, "epoch": 2469} {"train_loss": -6.319846153259277, "global_step": 103732, "epoch": 2469} {"train_loss": -6.242104530334473, "global_step": 103733, "epoch": 2469} {"train_loss": -6.174406051635742, "global_step": 103734, "epoch": 2469} {"train_loss": -6.176813125610352, "global_step": 103735, "epoch": 2469} {"train_loss": -6.266107559204102, "global_step": 103736, "epoch": 2469} {"train_loss": -6.297011852264404, "global_step": 103737, "epoch": 2469} {"train_loss": -6.240643501281738, "global_step": 103738, "epoch": 2469} {"train_loss": -6.272772244044712, "global_step": 103739, "epoch": 2469, "val_loss": 67890.9296875} {"train_loss": -6.304542064666748, "global_step": 103740, "epoch": 2470} {"train_loss": -6.271356582641602, "global_step": 103741, "epoch": 2470} {"train_loss": -6.352783203125, "global_step": 103742, "epoch": 2470} {"train_loss": -6.266061305999756, "global_step": 103743, "epoch": 2470} {"train_loss": -6.374938011169434, "global_step": 103744, "epoch": 2470} {"train_loss": -6.350701332092285, "global_step": 103745, "epoch": 2470} {"train_loss": -6.309017181396484, "global_step": 103746, "epoch": 2470} {"train_loss": -6.395977973937988, "global_step": 103747, "epoch": 2470} {"train_loss": -6.313560962677002, "global_step": 103748, "epoch": 2470} {"train_loss": -6.353214263916016, "global_step": 103749, "epoch": 2470} {"train_loss": -6.27269172668457, "global_step": 103750, "epoch": 2470} {"train_loss": -6.437919616699219, "global_step": 103751, "epoch": 2470} {"train_loss": -6.236594200134277, "global_step": 103752, "epoch": 2470} {"train_loss": -6.335024356842041, "global_step": 103753, "epoch": 2470} {"train_loss": -6.294623374938965, "global_step": 103754, "epoch": 2470} {"train_loss": -6.444999694824219, "global_step": 103755, "epoch": 2470} {"train_loss": -6.354106903076172, "global_step": 103756, "epoch": 2470} {"train_loss": -6.282320499420166, "global_step": 103757, "epoch": 2470} {"train_loss": -6.325846195220947, "global_step": 103758, "epoch": 2470} {"train_loss": -6.230136394500732, "global_step": 103759, "epoch": 2470} {"train_loss": -6.344409942626953, "global_step": 103760, "epoch": 2470} {"train_loss": -6.333761692047119, "global_step": 103761, "epoch": 2470} {"train_loss": -6.418801784515381, "global_step": 103762, "epoch": 2470} {"train_loss": -6.371318817138672, "global_step": 103763, "epoch": 2470} {"train_loss": -6.330106735229492, "global_step": 103764, "epoch": 2470} {"train_loss": -6.337839603424072, "global_step": 103765, "epoch": 2470} {"train_loss": -6.408517360687256, "global_step": 103766, "epoch": 2470} {"train_loss": -6.297350883483887, "global_step": 103767, "epoch": 2470} {"train_loss": -6.407200813293457, "global_step": 103768, "epoch": 2470} {"train_loss": -6.305200576782227, "global_step": 103769, "epoch": 2470} {"train_loss": -6.35567045211792, "global_step": 103770, "epoch": 2470} {"train_loss": -6.411518573760986, "global_step": 103771, "epoch": 2470} {"train_loss": -6.359073162078857, "global_step": 103772, "epoch": 2470} {"train_loss": -6.3358049392700195, "global_step": 103773, "epoch": 2470} {"train_loss": -6.293352127075195, "global_step": 103774, "epoch": 2470} {"train_loss": -6.479488849639893, "global_step": 103775, "epoch": 2470} {"train_loss": -6.381281852722168, "global_step": 103776, "epoch": 2470} {"train_loss": -6.2630462646484375, "global_step": 103777, "epoch": 2470} {"train_loss": -6.3680219650268555, "global_step": 103778, "epoch": 2470} {"train_loss": -6.372707366943359, "global_step": 103779, "epoch": 2470} {"train_loss": -6.384451866149902, "global_step": 103780, "epoch": 2470} {"train_loss": -6.344255629039946, "global_step": 103781, "epoch": 2470, "val_loss": 67635.7890625} {"train_loss": -6.3867974281311035, "global_step": 103782, "epoch": 2471} {"train_loss": -6.370889186859131, "global_step": 103783, "epoch": 2471} {"train_loss": -6.434792518615723, "global_step": 103784, "epoch": 2471} {"train_loss": -6.460444450378418, "global_step": 103785, "epoch": 2471} {"train_loss": -6.380102634429932, "global_step": 103786, "epoch": 2471} {"train_loss": -6.446224212646484, "global_step": 103787, "epoch": 2471} {"train_loss": -6.304928302764893, "global_step": 103788, "epoch": 2471} {"train_loss": -6.366252422332764, "global_step": 103789, "epoch": 2471} {"train_loss": -6.326009750366211, "global_step": 103790, "epoch": 2471} {"train_loss": -6.444222450256348, "global_step": 103791, "epoch": 2471} {"train_loss": -6.4701409339904785, "global_step": 103792, "epoch": 2471} {"train_loss": -6.379383087158203, "global_step": 103793, "epoch": 2471} {"train_loss": -6.370622158050537, "global_step": 103794, "epoch": 2471} {"train_loss": -6.50649356842041, "global_step": 103795, "epoch": 2471} {"train_loss": -6.34473991394043, "global_step": 103796, "epoch": 2471} {"train_loss": -6.405649662017822, "global_step": 103797, "epoch": 2471} {"train_loss": -6.36530065536499, "global_step": 103798, "epoch": 2471} {"train_loss": -6.328785419464111, "global_step": 103799, "epoch": 2471} {"train_loss": -6.350747108459473, "global_step": 103800, "epoch": 2471} {"train_loss": -6.277834892272949, "global_step": 103801, "epoch": 2471} {"train_loss": -6.317509174346924, "global_step": 103802, "epoch": 2471} {"train_loss": -6.399681091308594, "global_step": 103803, "epoch": 2471} {"train_loss": -6.48262882232666, "global_step": 103804, "epoch": 2471} {"train_loss": -6.43507194519043, "global_step": 103805, "epoch": 2471} {"train_loss": -6.3894548416137695, "global_step": 103806, "epoch": 2471} {"train_loss": -6.464964866638184, "global_step": 103807, "epoch": 2471} {"train_loss": -6.37983512878418, "global_step": 103808, "epoch": 2471} {"train_loss": -6.496152877807617, "global_step": 103809, "epoch": 2471} {"train_loss": -6.382868766784668, "global_step": 103810, "epoch": 2471} {"train_loss": -6.345074653625488, "global_step": 103811, "epoch": 2471} {"train_loss": -6.366470813751221, "global_step": 103812, "epoch": 2471} {"train_loss": -6.453026294708252, "global_step": 103813, "epoch": 2471} {"train_loss": -6.392264366149902, "global_step": 103814, "epoch": 2471} {"train_loss": -6.439412593841553, "global_step": 103815, "epoch": 2471} {"train_loss": -6.488821029663086, "global_step": 103816, "epoch": 2471} {"train_loss": -6.392001152038574, "global_step": 103817, "epoch": 2471} {"train_loss": -6.377681732177734, "global_step": 103818, "epoch": 2471} {"train_loss": -6.490904808044434, "global_step": 103819, "epoch": 2471} {"train_loss": -6.439362525939941, "global_step": 103820, "epoch": 2471} {"train_loss": -6.3776140213012695, "global_step": 103821, "epoch": 2471} {"train_loss": -6.466330528259277, "global_step": 103822, "epoch": 2471} {"train_loss": -6.402298246111188, "global_step": 103823, "epoch": 2471, "val_loss": 67778.859375} {"train_loss": -6.436429977416992, "global_step": 103824, "epoch": 2472} {"train_loss": -6.445374011993408, "global_step": 103825, "epoch": 2472} {"train_loss": -6.465124607086182, "global_step": 103826, "epoch": 2472} {"train_loss": -6.47650146484375, "global_step": 103827, "epoch": 2472} {"train_loss": -6.269986629486084, "global_step": 103828, "epoch": 2472} {"train_loss": -6.4159932136535645, "global_step": 103829, "epoch": 2472} {"train_loss": -6.345897674560547, "global_step": 103830, "epoch": 2472} {"train_loss": -6.440755367279053, "global_step": 103831, "epoch": 2472} {"train_loss": -6.475587844848633, "global_step": 103832, "epoch": 2472} {"train_loss": -6.417194843292236, "global_step": 103833, "epoch": 2472} {"train_loss": -6.460519790649414, "global_step": 103834, "epoch": 2472} {"train_loss": -6.454714298248291, "global_step": 103835, "epoch": 2472} {"train_loss": -6.2600884437561035, "global_step": 103836, "epoch": 2472} {"train_loss": -6.38170051574707, "global_step": 103837, "epoch": 2472} {"train_loss": -6.390992164611816, "global_step": 103838, "epoch": 2472} {"train_loss": -6.417128562927246, "global_step": 103839, "epoch": 2472} {"train_loss": -6.435312271118164, "global_step": 103840, "epoch": 2472} {"train_loss": -6.391373157501221, "global_step": 103841, "epoch": 2472} {"train_loss": -6.498023509979248, "global_step": 103842, "epoch": 2472} {"train_loss": -6.439882278442383, "global_step": 103843, "epoch": 2472} {"train_loss": -6.438793182373047, "global_step": 103844, "epoch": 2472} {"train_loss": -6.387648582458496, "global_step": 103845, "epoch": 2472} {"train_loss": -6.563401222229004, "global_step": 103846, "epoch": 2472} {"train_loss": -6.380610942840576, "global_step": 103847, "epoch": 2472} {"train_loss": -6.411594867706299, "global_step": 103848, "epoch": 2472} {"train_loss": -6.392107963562012, "global_step": 103849, "epoch": 2472} {"train_loss": -6.5733256340026855, "global_step": 103850, "epoch": 2472} {"train_loss": -6.425546646118164, "global_step": 103851, "epoch": 2472} {"train_loss": -6.3000359535217285, "global_step": 103852, "epoch": 2472} {"train_loss": -6.349884033203125, "global_step": 103853, "epoch": 2472} {"train_loss": -6.399682998657227, "global_step": 103854, "epoch": 2472} {"train_loss": -6.399964332580566, "global_step": 103855, "epoch": 2472} {"train_loss": -6.421626091003418, "global_step": 103856, "epoch": 2472} {"train_loss": -6.388823509216309, "global_step": 103857, "epoch": 2472} {"train_loss": -6.300239562988281, "global_step": 103858, "epoch": 2472} {"train_loss": -6.460120677947998, "global_step": 103859, "epoch": 2472} {"train_loss": -6.5026631355285645, "global_step": 103860, "epoch": 2472} {"train_loss": -6.394153118133545, "global_step": 103861, "epoch": 2472} {"train_loss": -6.487152099609375, "global_step": 103862, "epoch": 2472} {"train_loss": -6.291766166687012, "global_step": 103863, "epoch": 2472} {"train_loss": -6.4120073318481445, "global_step": 103864, "epoch": 2472} {"train_loss": -6.416471787861416, "global_step": 103865, "epoch": 2472, "val_loss": 67944.609375} {"train_loss": -6.404226303100586, "global_step": 103866, "epoch": 2473} {"train_loss": -6.404205799102783, "global_step": 103867, "epoch": 2473} {"train_loss": -6.334381103515625, "global_step": 103868, "epoch": 2473} {"train_loss": -6.442865371704102, "global_step": 103869, "epoch": 2473} {"train_loss": -6.319060325622559, "global_step": 103870, "epoch": 2473} {"train_loss": -6.361794948577881, "global_step": 103871, "epoch": 2473} {"train_loss": -6.409269332885742, "global_step": 103872, "epoch": 2473} {"train_loss": -6.424040794372559, "global_step": 103873, "epoch": 2473} {"train_loss": -6.308452606201172, "global_step": 103874, "epoch": 2473} {"train_loss": -6.400511264801025, "global_step": 103875, "epoch": 2473} {"train_loss": -6.347935199737549, "global_step": 103876, "epoch": 2473} {"train_loss": -6.380474090576172, "global_step": 103877, "epoch": 2473} {"train_loss": -6.3235554695129395, "global_step": 103878, "epoch": 2473} {"train_loss": -6.398407459259033, "global_step": 103879, "epoch": 2473} {"train_loss": -6.412001132965088, "global_step": 103880, "epoch": 2473} {"train_loss": -6.36706018447876, "global_step": 103881, "epoch": 2473} {"train_loss": -6.3315582275390625, "global_step": 103882, "epoch": 2473} {"train_loss": -6.243724346160889, "global_step": 103883, "epoch": 2473} {"train_loss": -6.33188533782959, "global_step": 103884, "epoch": 2473} {"train_loss": -6.231289863586426, "global_step": 103885, "epoch": 2473} {"train_loss": -6.31878662109375, "global_step": 103886, "epoch": 2473} {"train_loss": -6.320005416870117, "global_step": 103887, "epoch": 2473} {"train_loss": -6.3574371337890625, "global_step": 103888, "epoch": 2473} {"train_loss": -6.359340667724609, "global_step": 103889, "epoch": 2473} {"train_loss": -6.362609386444092, "global_step": 103890, "epoch": 2473} {"train_loss": -6.365458965301514, "global_step": 103891, "epoch": 2473} {"train_loss": -6.383460521697998, "global_step": 103892, "epoch": 2473} {"train_loss": -6.265466690063477, "global_step": 103893, "epoch": 2473} {"train_loss": -6.348231792449951, "global_step": 103894, "epoch": 2473} {"train_loss": -6.321437835693359, "global_step": 103895, "epoch": 2473} {"train_loss": -6.380958080291748, "global_step": 103896, "epoch": 2473} {"train_loss": -6.2419023513793945, "global_step": 103897, "epoch": 2473} {"train_loss": -6.366170883178711, "global_step": 103898, "epoch": 2473} {"train_loss": -6.32563591003418, "global_step": 103899, "epoch": 2473} {"train_loss": -6.293654441833496, "global_step": 103900, "epoch": 2473} {"train_loss": -6.313984394073486, "global_step": 103901, "epoch": 2473} {"train_loss": -6.3932390213012695, "global_step": 103902, "epoch": 2473} {"train_loss": -6.3129496574401855, "global_step": 103903, "epoch": 2473} {"train_loss": -6.382718086242676, "global_step": 103904, "epoch": 2473} {"train_loss": -6.415281772613525, "global_step": 103905, "epoch": 2473} {"train_loss": -6.383914947509766, "global_step": 103906, "epoch": 2473} {"train_loss": -6.351681391398112, "global_step": 103907, "epoch": 2473, "val_loss": 67977.6328125} {"train_loss": -6.338932037353516, "global_step": 103908, "epoch": 2474} {"train_loss": -6.323946952819824, "global_step": 103909, "epoch": 2474} {"train_loss": -6.511017799377441, "global_step": 103910, "epoch": 2474} {"train_loss": -6.520469665527344, "global_step": 103911, "epoch": 2474} {"train_loss": -6.397644996643066, "global_step": 103912, "epoch": 2474} {"train_loss": -6.340287685394287, "global_step": 103913, "epoch": 2474} {"train_loss": -6.420111179351807, "global_step": 103914, "epoch": 2474} {"train_loss": -6.2850542068481445, "global_step": 103915, "epoch": 2474} {"train_loss": -6.357850074768066, "global_step": 103916, "epoch": 2474} {"train_loss": -6.385525226593018, "global_step": 103917, "epoch": 2474} {"train_loss": -6.285879135131836, "global_step": 103918, "epoch": 2474} {"train_loss": -6.475011348724365, "global_step": 103919, "epoch": 2474} {"train_loss": -6.254761695861816, "global_step": 103920, "epoch": 2474} {"train_loss": -6.440277576446533, "global_step": 103921, "epoch": 2474} {"train_loss": -6.35855770111084, "global_step": 103922, "epoch": 2474} {"train_loss": -6.393169403076172, "global_step": 103923, "epoch": 2474} {"train_loss": -6.315823554992676, "global_step": 103924, "epoch": 2474} {"train_loss": -6.424724578857422, "global_step": 103925, "epoch": 2474} {"train_loss": -6.383245944976807, "global_step": 103926, "epoch": 2474} {"train_loss": -6.344597339630127, "global_step": 103927, "epoch": 2474} {"train_loss": -6.363214492797852, "global_step": 103928, "epoch": 2474} {"train_loss": -6.269378185272217, "global_step": 103929, "epoch": 2474} {"train_loss": -6.402112007141113, "global_step": 103930, "epoch": 2474} {"train_loss": -6.321975231170654, "global_step": 103931, "epoch": 2474} {"train_loss": -6.455456733703613, "global_step": 103932, "epoch": 2474} {"train_loss": -6.345763683319092, "global_step": 103933, "epoch": 2474} {"train_loss": -6.392270565032959, "global_step": 103934, "epoch": 2474} {"train_loss": -6.487288475036621, "global_step": 103935, "epoch": 2474} {"train_loss": -6.412445545196533, "global_step": 103936, "epoch": 2474} {"train_loss": -6.210479736328125, "global_step": 103937, "epoch": 2474} {"train_loss": -6.406317710876465, "global_step": 103938, "epoch": 2474} {"train_loss": -6.379184722900391, "global_step": 103939, "epoch": 2474} {"train_loss": -6.4030609130859375, "global_step": 103940, "epoch": 2474} {"train_loss": -6.2918500900268555, "global_step": 103941, "epoch": 2474} {"train_loss": -6.36688756942749, "global_step": 103942, "epoch": 2474} {"train_loss": -6.326737403869629, "global_step": 103943, "epoch": 2474} {"train_loss": -6.258200645446777, "global_step": 103944, "epoch": 2474} {"train_loss": -6.314329147338867, "global_step": 103945, "epoch": 2474} {"train_loss": -6.4240899085998535, "global_step": 103946, "epoch": 2474} {"train_loss": -6.290853500366211, "global_step": 103947, "epoch": 2474} {"train_loss": -6.508625030517578, "global_step": 103948, "epoch": 2474} {"train_loss": -6.371623538789295, "global_step": 103949, "epoch": 2474, "val_loss": 67737.9921875} {"train_loss": -6.4205169677734375, "global_step": 103950, "epoch": 2475} {"train_loss": -6.458727836608887, "global_step": 103951, "epoch": 2475} {"train_loss": -6.381653308868408, "global_step": 103952, "epoch": 2475} {"train_loss": -6.397335052490234, "global_step": 103953, "epoch": 2475} {"train_loss": -6.325479507446289, "global_step": 103954, "epoch": 2475} {"train_loss": -6.4433746337890625, "global_step": 103955, "epoch": 2475} {"train_loss": -6.460860252380371, "global_step": 103956, "epoch": 2475} {"train_loss": -6.454885005950928, "global_step": 103957, "epoch": 2475} {"train_loss": -6.519549369812012, "global_step": 103958, "epoch": 2475} {"train_loss": -6.356820106506348, "global_step": 103959, "epoch": 2475} {"train_loss": -6.448514938354492, "global_step": 103960, "epoch": 2475} {"train_loss": -6.261495113372803, "global_step": 103961, "epoch": 2475} {"train_loss": -6.408214092254639, "global_step": 103962, "epoch": 2475} {"train_loss": -6.479510307312012, "global_step": 103963, "epoch": 2475} {"train_loss": -6.403647422790527, "global_step": 103964, "epoch": 2475} {"train_loss": -6.361113548278809, "global_step": 103965, "epoch": 2475} {"train_loss": -6.416130542755127, "global_step": 103966, "epoch": 2475} {"train_loss": -6.437824726104736, "global_step": 103967, "epoch": 2475} {"train_loss": -6.450129508972168, "global_step": 103968, "epoch": 2475} {"train_loss": -6.373594284057617, "global_step": 103969, "epoch": 2475} {"train_loss": -6.379763603210449, "global_step": 103970, "epoch": 2475} {"train_loss": -6.323691368103027, "global_step": 103971, "epoch": 2475} {"train_loss": -6.312592029571533, "global_step": 103972, "epoch": 2475} {"train_loss": -6.37904167175293, "global_step": 103973, "epoch": 2475} {"train_loss": -6.398041725158691, "global_step": 103974, "epoch": 2475} {"train_loss": -6.484488010406494, "global_step": 103975, "epoch": 2475} {"train_loss": -6.357993125915527, "global_step": 103976, "epoch": 2475} {"train_loss": -6.306813716888428, "global_step": 103977, "epoch": 2475} {"train_loss": -6.273451805114746, "global_step": 103978, "epoch": 2475} {"train_loss": -6.21876335144043, "global_step": 103979, "epoch": 2475} {"train_loss": -6.302594184875488, "global_step": 103980, "epoch": 2475} {"train_loss": -6.309998512268066, "global_step": 103981, "epoch": 2475} {"train_loss": -6.274446964263916, "global_step": 103982, "epoch": 2475} {"train_loss": -6.40194845199585, "global_step": 103983, "epoch": 2475} {"train_loss": -6.294796943664551, "global_step": 103984, "epoch": 2475} {"train_loss": -6.415284156799316, "global_step": 103985, "epoch": 2475} {"train_loss": -6.311295032501221, "global_step": 103986, "epoch": 2475} {"train_loss": -6.311547756195068, "global_step": 103987, "epoch": 2475} {"train_loss": -6.406166076660156, "global_step": 103988, "epoch": 2475} {"train_loss": -6.391180038452148, "global_step": 103989, "epoch": 2475} {"train_loss": -6.311104774475098, "global_step": 103990, "epoch": 2475} {"train_loss": -6.374921458108084, "global_step": 103991, "epoch": 2475, "val_loss": 67786.96875} {"train_loss": -6.307064056396484, "global_step": 103992, "epoch": 2476} {"train_loss": -6.47956657409668, "global_step": 103993, "epoch": 2476} {"train_loss": -6.459040641784668, "global_step": 103994, "epoch": 2476} {"train_loss": -6.350828170776367, "global_step": 103995, "epoch": 2476} {"train_loss": -6.340188026428223, "global_step": 103996, "epoch": 2476} {"train_loss": -6.415552139282227, "global_step": 103997, "epoch": 2476} {"train_loss": -6.446416854858398, "global_step": 103998, "epoch": 2476} {"train_loss": -6.244971752166748, "global_step": 103999, "epoch": 2476} {"train_loss": -6.398586750030518, "global_step": 104000, "epoch": 2476} {"train_loss": -6.287629127502441, "global_step": 104001, "epoch": 2476} {"train_loss": -6.454341888427734, "global_step": 104002, "epoch": 2476} {"train_loss": -6.368502616882324, "global_step": 104003, "epoch": 2476} {"train_loss": -6.381134033203125, "global_step": 104004, "epoch": 2476} {"train_loss": -6.436209678649902, "global_step": 104005, "epoch": 2476} {"train_loss": -6.415316581726074, "global_step": 104006, "epoch": 2476} {"train_loss": -6.370693206787109, "global_step": 104007, "epoch": 2476} {"train_loss": -6.413628101348877, "global_step": 104008, "epoch": 2476} {"train_loss": -6.455377101898193, "global_step": 104009, "epoch": 2476} {"train_loss": -6.393501281738281, "global_step": 104010, "epoch": 2476} {"train_loss": -6.312282562255859, "global_step": 104011, "epoch": 2476} {"train_loss": -6.403336048126221, "global_step": 104012, "epoch": 2476} {"train_loss": -6.388999938964844, "global_step": 104013, "epoch": 2476} {"train_loss": -6.411569595336914, "global_step": 104014, "epoch": 2476} {"train_loss": -6.499159812927246, "global_step": 104015, "epoch": 2476} {"train_loss": -6.327866554260254, "global_step": 104016, "epoch": 2476} {"train_loss": -6.392971992492676, "global_step": 104017, "epoch": 2476} {"train_loss": -6.3190436363220215, "global_step": 104018, "epoch": 2476} {"train_loss": -6.414735794067383, "global_step": 104019, "epoch": 2476} {"train_loss": -6.401386737823486, "global_step": 104020, "epoch": 2476} {"train_loss": -6.47238826751709, "global_step": 104021, "epoch": 2476} {"train_loss": -6.388643264770508, "global_step": 104022, "epoch": 2476} {"train_loss": -6.318029403686523, "global_step": 104023, "epoch": 2476} {"train_loss": -6.381510257720947, "global_step": 104024, "epoch": 2476} {"train_loss": -6.443417072296143, "global_step": 104025, "epoch": 2476} {"train_loss": -6.519017696380615, "global_step": 104026, "epoch": 2476} {"train_loss": -6.451047897338867, "global_step": 104027, "epoch": 2476} {"train_loss": -6.484929084777832, "global_step": 104028, "epoch": 2476} {"train_loss": -6.240411758422852, "global_step": 104029, "epoch": 2476} {"train_loss": -6.457545757293701, "global_step": 104030, "epoch": 2476} {"train_loss": -6.425319671630859, "global_step": 104031, "epoch": 2476} {"train_loss": -6.407050132751465, "global_step": 104032, "epoch": 2476} {"train_loss": -6.3955133983067105, "global_step": 104033, "epoch": 2476, "val_loss": 67871.140625} {"train_loss": -6.425060272216797, "global_step": 104034, "epoch": 2477} {"train_loss": -6.424698829650879, "global_step": 104035, "epoch": 2477} {"train_loss": -6.461747169494629, "global_step": 104036, "epoch": 2477} {"train_loss": -6.477829456329346, "global_step": 104037, "epoch": 2477} {"train_loss": -6.387073516845703, "global_step": 104038, "epoch": 2477} {"train_loss": -6.3860578536987305, "global_step": 104039, "epoch": 2477} {"train_loss": -6.337071895599365, "global_step": 104040, "epoch": 2477} {"train_loss": -6.344097137451172, "global_step": 104041, "epoch": 2477} {"train_loss": -6.312229633331299, "global_step": 104042, "epoch": 2477} {"train_loss": -6.4169416427612305, "global_step": 104043, "epoch": 2477} {"train_loss": -6.397672653198242, "global_step": 104044, "epoch": 2477} {"train_loss": -6.400773048400879, "global_step": 104045, "epoch": 2477} {"train_loss": -6.327728748321533, "global_step": 104046, "epoch": 2477} {"train_loss": -6.369939804077148, "global_step": 104047, "epoch": 2477} {"train_loss": -6.413761138916016, "global_step": 104048, "epoch": 2477} {"train_loss": -6.423643112182617, "global_step": 104049, "epoch": 2477} {"train_loss": -6.350655555725098, "global_step": 104050, "epoch": 2477} {"train_loss": -6.413414001464844, "global_step": 104051, "epoch": 2477} {"train_loss": -6.306478023529053, "global_step": 104052, "epoch": 2477} {"train_loss": -6.416412353515625, "global_step": 104053, "epoch": 2477} {"train_loss": -6.254899978637695, "global_step": 104054, "epoch": 2477} {"train_loss": -6.46453857421875, "global_step": 104055, "epoch": 2477} {"train_loss": -6.1262125968933105, "global_step": 104056, "epoch": 2477} {"train_loss": -6.440570831298828, "global_step": 104057, "epoch": 2477} {"train_loss": -6.434178352355957, "global_step": 104058, "epoch": 2477} {"train_loss": -6.400652885437012, "global_step": 104059, "epoch": 2477} {"train_loss": -6.351587295532227, "global_step": 104060, "epoch": 2477} {"train_loss": -6.460129737854004, "global_step": 104061, "epoch": 2477} {"train_loss": -6.488058090209961, "global_step": 104062, "epoch": 2477} {"train_loss": -6.555440902709961, "global_step": 104063, "epoch": 2477} {"train_loss": -6.385470867156982, "global_step": 104064, "epoch": 2477} {"train_loss": -6.399293899536133, "global_step": 104065, "epoch": 2477} {"train_loss": -6.432537078857422, "global_step": 104066, "epoch": 2477} {"train_loss": -6.386666297912598, "global_step": 104067, "epoch": 2477} {"train_loss": -6.343172073364258, "global_step": 104068, "epoch": 2477} {"train_loss": -6.430647850036621, "global_step": 104069, "epoch": 2477} {"train_loss": -6.376873970031738, "global_step": 104070, "epoch": 2477} {"train_loss": -6.550396919250488, "global_step": 104071, "epoch": 2477} {"train_loss": -6.515324115753174, "global_step": 104072, "epoch": 2477} {"train_loss": -6.362002849578857, "global_step": 104073, "epoch": 2477} {"train_loss": -6.402021408081055, "global_step": 104074, "epoch": 2477} {"train_loss": -6.399364880153111, "global_step": 104075, "epoch": 2477, "val_loss": 67817.828125} {"train_loss": -6.322890758514404, "global_step": 104076, "epoch": 2478} {"train_loss": -6.3582916259765625, "global_step": 104077, "epoch": 2478} {"train_loss": -6.357316970825195, "global_step": 104078, "epoch": 2478} {"train_loss": -6.514763832092285, "global_step": 104079, "epoch": 2478} {"train_loss": -6.405516624450684, "global_step": 104080, "epoch": 2478} {"train_loss": -6.458107948303223, "global_step": 104081, "epoch": 2478} {"train_loss": -6.46157693862915, "global_step": 104082, "epoch": 2478} {"train_loss": -6.483885288238525, "global_step": 104083, "epoch": 2478} {"train_loss": -6.549351215362549, "global_step": 104084, "epoch": 2478} {"train_loss": -6.515971660614014, "global_step": 104085, "epoch": 2478} {"train_loss": -6.451720714569092, "global_step": 104086, "epoch": 2478} {"train_loss": -6.529711723327637, "global_step": 104087, "epoch": 2478} {"train_loss": -6.333987236022949, "global_step": 104088, "epoch": 2478} {"train_loss": -6.386801242828369, "global_step": 104089, "epoch": 2478} {"train_loss": -6.497159004211426, "global_step": 104090, "epoch": 2478} {"train_loss": -6.351408958435059, "global_step": 104091, "epoch": 2478} {"train_loss": -6.375977993011475, "global_step": 104092, "epoch": 2478} {"train_loss": -6.4202880859375, "global_step": 104093, "epoch": 2478} {"train_loss": -6.449366569519043, "global_step": 104094, "epoch": 2478} {"train_loss": -6.516161918640137, "global_step": 104095, "epoch": 2478} {"train_loss": -6.397459030151367, "global_step": 104096, "epoch": 2478} {"train_loss": -6.400725364685059, "global_step": 104097, "epoch": 2478} {"train_loss": -6.313391208648682, "global_step": 104098, "epoch": 2478} {"train_loss": -6.458591461181641, "global_step": 104099, "epoch": 2478} {"train_loss": -6.31520938873291, "global_step": 104100, "epoch": 2478} {"train_loss": -6.35563850402832, "global_step": 104101, "epoch": 2478} {"train_loss": -6.334025859832764, "global_step": 104102, "epoch": 2478} {"train_loss": -6.4566545486450195, "global_step": 104103, "epoch": 2478} {"train_loss": -6.381110668182373, "global_step": 104104, "epoch": 2478} {"train_loss": -6.3953938484191895, "global_step": 104105, "epoch": 2478} {"train_loss": -6.477661609649658, "global_step": 104106, "epoch": 2478} {"train_loss": -6.436673641204834, "global_step": 104107, "epoch": 2478} {"train_loss": -6.433658599853516, "global_step": 104108, "epoch": 2478} {"train_loss": -6.4429850578308105, "global_step": 104109, "epoch": 2478} {"train_loss": -6.45309591293335, "global_step": 104110, "epoch": 2478} {"train_loss": -6.383398532867432, "global_step": 104111, "epoch": 2478} {"train_loss": -6.320732116699219, "global_step": 104112, "epoch": 2478} {"train_loss": -6.279764175415039, "global_step": 104113, "epoch": 2478} {"train_loss": -6.264570236206055, "global_step": 104114, "epoch": 2478} {"train_loss": -6.441336631774902, "global_step": 104115, "epoch": 2478} {"train_loss": -6.258111000061035, "global_step": 104116, "epoch": 2478} {"train_loss": -6.409733420326596, "global_step": 104117, "epoch": 2478, "val_loss": 68044.640625} {"train_loss": -6.3362040519714355, "global_step": 104118, "epoch": 2479} {"train_loss": -6.384392738342285, "global_step": 104119, "epoch": 2479} {"train_loss": -6.432587623596191, "global_step": 104120, "epoch": 2479} {"train_loss": -6.396434783935547, "global_step": 104121, "epoch": 2479} {"train_loss": -6.318720817565918, "global_step": 104122, "epoch": 2479} {"train_loss": -6.413379669189453, "global_step": 104123, "epoch": 2479} {"train_loss": -6.415716171264648, "global_step": 104124, "epoch": 2479} {"train_loss": -6.322077751159668, "global_step": 104125, "epoch": 2479} {"train_loss": -6.4430670738220215, "global_step": 104126, "epoch": 2479} {"train_loss": -6.366564750671387, "global_step": 104127, "epoch": 2479} {"train_loss": -6.432347297668457, "global_step": 104128, "epoch": 2479} {"train_loss": -6.409887790679932, "global_step": 104129, "epoch": 2479} {"train_loss": -6.413433074951172, "global_step": 104130, "epoch": 2479} {"train_loss": -6.3731255531311035, "global_step": 104131, "epoch": 2479} {"train_loss": -6.342641830444336, "global_step": 104132, "epoch": 2479} {"train_loss": -6.413283348083496, "global_step": 104133, "epoch": 2479} {"train_loss": -6.365345478057861, "global_step": 104134, "epoch": 2479} {"train_loss": -6.30183744430542, "global_step": 104135, "epoch": 2479} {"train_loss": -6.4073052406311035, "global_step": 104136, "epoch": 2479} {"train_loss": -6.417123317718506, "global_step": 104137, "epoch": 2479} {"train_loss": -6.4557576179504395, "global_step": 104138, "epoch": 2479} {"train_loss": -6.3036675453186035, "global_step": 104139, "epoch": 2479} {"train_loss": -6.438462734222412, "global_step": 104140, "epoch": 2479} {"train_loss": -6.305402755737305, "global_step": 104141, "epoch": 2479} {"train_loss": -6.468711853027344, "global_step": 104142, "epoch": 2479} {"train_loss": -6.319736003875732, "global_step": 104143, "epoch": 2479} {"train_loss": -6.4480485916137695, "global_step": 104144, "epoch": 2479} {"train_loss": -6.578146457672119, "global_step": 104145, "epoch": 2479} {"train_loss": -6.2048749923706055, "global_step": 104146, "epoch": 2479} {"train_loss": -6.37398624420166, "global_step": 104147, "epoch": 2479} {"train_loss": -6.354711532592773, "global_step": 104148, "epoch": 2479} {"train_loss": -6.320340156555176, "global_step": 104149, "epoch": 2479} {"train_loss": -6.295515537261963, "global_step": 104150, "epoch": 2479} {"train_loss": -6.2912516593933105, "global_step": 104151, "epoch": 2479} {"train_loss": -6.3533453941345215, "global_step": 104152, "epoch": 2479} {"train_loss": -6.3935322761535645, "global_step": 104153, "epoch": 2479} {"train_loss": -6.346060276031494, "global_step": 104154, "epoch": 2479} {"train_loss": -6.341524124145508, "global_step": 104155, "epoch": 2479} {"train_loss": -6.460111618041992, "global_step": 104156, "epoch": 2479} {"train_loss": -6.357809066772461, "global_step": 104157, "epoch": 2479} {"train_loss": -6.399403095245361, "global_step": 104158, "epoch": 2479} {"train_loss": -6.379246802557082, "global_step": 104159, "epoch": 2479, "val_loss": 68142.6328125} {"train_loss": -6.359626293182373, "global_step": 104160, "epoch": 2480} {"train_loss": -6.4280500411987305, "global_step": 104161, "epoch": 2480} {"train_loss": -6.428468227386475, "global_step": 104162, "epoch": 2480} {"train_loss": -6.435164451599121, "global_step": 104163, "epoch": 2480} {"train_loss": -6.455363750457764, "global_step": 104164, "epoch": 2480} {"train_loss": -6.454327583312988, "global_step": 104165, "epoch": 2480} {"train_loss": -6.521045684814453, "global_step": 104166, "epoch": 2480} {"train_loss": -6.387179374694824, "global_step": 104167, "epoch": 2480} {"train_loss": -6.3486223220825195, "global_step": 104168, "epoch": 2480} {"train_loss": -6.3683319091796875, "global_step": 104169, "epoch": 2480} {"train_loss": -6.332309246063232, "global_step": 104170, "epoch": 2480} {"train_loss": -6.445631980895996, "global_step": 104171, "epoch": 2480} {"train_loss": -6.45128059387207, "global_step": 104172, "epoch": 2480} {"train_loss": -6.414891242980957, "global_step": 104173, "epoch": 2480} {"train_loss": -6.3767852783203125, "global_step": 104174, "epoch": 2480} {"train_loss": -6.420232772827148, "global_step": 104175, "epoch": 2480} {"train_loss": -6.459042549133301, "global_step": 104176, "epoch": 2480} {"train_loss": -6.431606292724609, "global_step": 104177, "epoch": 2480} {"train_loss": -6.592958450317383, "global_step": 104178, "epoch": 2480} {"train_loss": -6.455357551574707, "global_step": 104179, "epoch": 2480} {"train_loss": -6.404171466827393, "global_step": 104180, "epoch": 2480} {"train_loss": -6.47569465637207, "global_step": 104181, "epoch": 2480} {"train_loss": -6.3636040687561035, "global_step": 104182, "epoch": 2480} {"train_loss": -6.418038368225098, "global_step": 104183, "epoch": 2480} {"train_loss": -6.422763824462891, "global_step": 104184, "epoch": 2480} {"train_loss": -6.468070030212402, "global_step": 104185, "epoch": 2480} {"train_loss": -6.422259330749512, "global_step": 104186, "epoch": 2480} {"train_loss": -6.406254768371582, "global_step": 104187, "epoch": 2480} {"train_loss": -6.371891498565674, "global_step": 104188, "epoch": 2480} {"train_loss": -6.315989017486572, "global_step": 104189, "epoch": 2480} {"train_loss": -6.400135040283203, "global_step": 104190, "epoch": 2480} {"train_loss": -6.443027973175049, "global_step": 104191, "epoch": 2480} {"train_loss": -6.375972270965576, "global_step": 104192, "epoch": 2480} {"train_loss": -6.366991996765137, "global_step": 104193, "epoch": 2480} {"train_loss": -6.415935516357422, "global_step": 104194, "epoch": 2480} {"train_loss": -6.400861740112305, "global_step": 104195, "epoch": 2480} {"train_loss": -6.3993425369262695, "global_step": 104196, "epoch": 2480} {"train_loss": -6.401046276092529, "global_step": 104197, "epoch": 2480} {"train_loss": -6.404726505279541, "global_step": 104198, "epoch": 2480} {"train_loss": -6.30485725402832, "global_step": 104199, "epoch": 2480} {"train_loss": -6.300650596618652, "global_step": 104200, "epoch": 2480} {"train_loss": -6.411191849481492, "global_step": 104201, "epoch": 2480, "val_loss": 67871.6796875} {"train_loss": -6.276243209838867, "global_step": 104202, "epoch": 2481} {"train_loss": -6.438087463378906, "global_step": 104203, "epoch": 2481} {"train_loss": -6.44110631942749, "global_step": 104204, "epoch": 2481} {"train_loss": -6.464520454406738, "global_step": 104205, "epoch": 2481} {"train_loss": -6.271212100982666, "global_step": 104206, "epoch": 2481} {"train_loss": -6.386836528778076, "global_step": 104207, "epoch": 2481} {"train_loss": -6.378995895385742, "global_step": 104208, "epoch": 2481} {"train_loss": -6.316217422485352, "global_step": 104209, "epoch": 2481} {"train_loss": -6.357309341430664, "global_step": 104210, "epoch": 2481} {"train_loss": -6.375415802001953, "global_step": 104211, "epoch": 2481} {"train_loss": -6.412888050079346, "global_step": 104212, "epoch": 2481} {"train_loss": -6.378339767456055, "global_step": 104213, "epoch": 2481} {"train_loss": -6.373935222625732, "global_step": 104214, "epoch": 2481} {"train_loss": -6.33303165435791, "global_step": 104215, "epoch": 2481} {"train_loss": -6.431869983673096, "global_step": 104216, "epoch": 2481} {"train_loss": -6.366345405578613, "global_step": 104217, "epoch": 2481} {"train_loss": -6.5286970138549805, "global_step": 104218, "epoch": 2481} {"train_loss": -6.461766719818115, "global_step": 104219, "epoch": 2481} {"train_loss": -6.36433219909668, "global_step": 104220, "epoch": 2481} {"train_loss": -6.456146240234375, "global_step": 104221, "epoch": 2481} {"train_loss": -6.395459175109863, "global_step": 104222, "epoch": 2481} {"train_loss": -6.422951698303223, "global_step": 104223, "epoch": 2481} {"train_loss": -6.443965911865234, "global_step": 104224, "epoch": 2481} {"train_loss": -6.482456684112549, "global_step": 104225, "epoch": 2481} {"train_loss": -6.4716081619262695, "global_step": 104226, "epoch": 2481} {"train_loss": -6.304559230804443, "global_step": 104227, "epoch": 2481} {"train_loss": -6.483264923095703, "global_step": 104228, "epoch": 2481} {"train_loss": -6.5114946365356445, "global_step": 104229, "epoch": 2481} {"train_loss": -6.3648481369018555, "global_step": 104230, "epoch": 2481} {"train_loss": -6.340221405029297, "global_step": 104231, "epoch": 2481} {"train_loss": -6.397973537445068, "global_step": 104232, "epoch": 2481} {"train_loss": -6.544471740722656, "global_step": 104233, "epoch": 2481} {"train_loss": -6.39849328994751, "global_step": 104234, "epoch": 2481} {"train_loss": -6.386301040649414, "global_step": 104235, "epoch": 2481} {"train_loss": -6.360591888427734, "global_step": 104236, "epoch": 2481} {"train_loss": -6.538365364074707, "global_step": 104237, "epoch": 2481} {"train_loss": -6.436654090881348, "global_step": 104238, "epoch": 2481} {"train_loss": -6.381617069244385, "global_step": 104239, "epoch": 2481} {"train_loss": -6.423435211181641, "global_step": 104240, "epoch": 2481} {"train_loss": -6.432281494140625, "global_step": 104241, "epoch": 2481} {"train_loss": -6.292932987213135, "global_step": 104242, "epoch": 2481} {"train_loss": -6.407657180513654, "global_step": 104243, "epoch": 2481, "val_loss": 68073.4140625} {"train_loss": -6.430386543273926, "global_step": 104244, "epoch": 2482} {"train_loss": -6.386261940002441, "global_step": 104245, "epoch": 2482} {"train_loss": -6.499062538146973, "global_step": 104246, "epoch": 2482} {"train_loss": -6.414215087890625, "global_step": 104247, "epoch": 2482} {"train_loss": -6.30767822265625, "global_step": 104248, "epoch": 2482} {"train_loss": -6.380307197570801, "global_step": 104249, "epoch": 2482} {"train_loss": -6.433262825012207, "global_step": 104250, "epoch": 2482} {"train_loss": -6.397809028625488, "global_step": 104251, "epoch": 2482} {"train_loss": -6.435715675354004, "global_step": 104252, "epoch": 2482} {"train_loss": -6.514181613922119, "global_step": 104253, "epoch": 2482} {"train_loss": -6.469875812530518, "global_step": 104254, "epoch": 2482} {"train_loss": -6.46326208114624, "global_step": 104255, "epoch": 2482} {"train_loss": -6.521969795227051, "global_step": 104256, "epoch": 2482} {"train_loss": -6.354519844055176, "global_step": 104257, "epoch": 2482} {"train_loss": -6.400528907775879, "global_step": 104258, "epoch": 2482} {"train_loss": -6.436890602111816, "global_step": 104259, "epoch": 2482} {"train_loss": -6.351693153381348, "global_step": 104260, "epoch": 2482} {"train_loss": -6.431535720825195, "global_step": 104261, "epoch": 2482} {"train_loss": -6.436017990112305, "global_step": 104262, "epoch": 2482} {"train_loss": -6.371898174285889, "global_step": 104263, "epoch": 2482} {"train_loss": -6.399884223937988, "global_step": 104264, "epoch": 2482} {"train_loss": -6.513476371765137, "global_step": 104265, "epoch": 2482} {"train_loss": -6.346617698669434, "global_step": 104266, "epoch": 2482} {"train_loss": -6.375750541687012, "global_step": 104267, "epoch": 2482} {"train_loss": -6.441031455993652, "global_step": 104268, "epoch": 2482} {"train_loss": -6.2834367752075195, "global_step": 104269, "epoch": 2482} {"train_loss": -6.345236778259277, "global_step": 104270, "epoch": 2482} {"train_loss": -6.375753879547119, "global_step": 104271, "epoch": 2482} {"train_loss": -6.196197986602783, "global_step": 104272, "epoch": 2482} {"train_loss": -6.235711097717285, "global_step": 104273, "epoch": 2482} {"train_loss": -6.274219512939453, "global_step": 104274, "epoch": 2482} {"train_loss": -6.309908866882324, "global_step": 104275, "epoch": 2482} {"train_loss": -6.301131248474121, "global_step": 104276, "epoch": 2482} {"train_loss": -6.338225841522217, "global_step": 104277, "epoch": 2482} {"train_loss": -6.423149108886719, "global_step": 104278, "epoch": 2482} {"train_loss": -6.300811290740967, "global_step": 104279, "epoch": 2482} {"train_loss": -6.374910354614258, "global_step": 104280, "epoch": 2482} {"train_loss": -6.339831352233887, "global_step": 104281, "epoch": 2482} {"train_loss": -6.240072250366211, "global_step": 104282, "epoch": 2482} {"train_loss": -6.403324604034424, "global_step": 104283, "epoch": 2482} {"train_loss": -6.333804130554199, "global_step": 104284, "epoch": 2482} {"train_loss": -6.3795808610462, "global_step": 104285, "epoch": 2482, "val_loss": 67912.5} {"train_loss": -6.268324851989746, "global_step": 104286, "epoch": 2483} {"train_loss": -6.532863616943359, "global_step": 104287, "epoch": 2483} {"train_loss": -6.40743350982666, "global_step": 104288, "epoch": 2483} {"train_loss": -6.40553092956543, "global_step": 104289, "epoch": 2483} {"train_loss": -6.310022830963135, "global_step": 104290, "epoch": 2483} {"train_loss": -6.293122291564941, "global_step": 104291, "epoch": 2483} {"train_loss": -6.228514194488525, "global_step": 104292, "epoch": 2483} {"train_loss": -6.295284271240234, "global_step": 104293, "epoch": 2483} {"train_loss": -6.542522430419922, "global_step": 104294, "epoch": 2483} {"train_loss": -6.364261627197266, "global_step": 104295, "epoch": 2483} {"train_loss": -6.294200897216797, "global_step": 104296, "epoch": 2483} {"train_loss": -6.404253005981445, "global_step": 104297, "epoch": 2483} {"train_loss": -6.392894744873047, "global_step": 104298, "epoch": 2483} {"train_loss": -6.37156867980957, "global_step": 104299, "epoch": 2483} {"train_loss": -6.316093444824219, "global_step": 104300, "epoch": 2483} {"train_loss": -6.368194580078125, "global_step": 104301, "epoch": 2483} {"train_loss": -6.299948692321777, "global_step": 104302, "epoch": 2483} {"train_loss": -6.345427513122559, "global_step": 104303, "epoch": 2483} {"train_loss": -6.428913116455078, "global_step": 104304, "epoch": 2483} {"train_loss": -6.368592739105225, "global_step": 104305, "epoch": 2483} {"train_loss": -6.286870956420898, "global_step": 104306, "epoch": 2483} {"train_loss": -6.356383323669434, "global_step": 104307, "epoch": 2483} {"train_loss": -6.462679862976074, "global_step": 104308, "epoch": 2483} {"train_loss": -6.3161540031433105, "global_step": 104309, "epoch": 2483} {"train_loss": -6.374285697937012, "global_step": 104310, "epoch": 2483} {"train_loss": -6.280221939086914, "global_step": 104311, "epoch": 2483} {"train_loss": -6.29721212387085, "global_step": 104312, "epoch": 2483} {"train_loss": -6.288499355316162, "global_step": 104313, "epoch": 2483} {"train_loss": -6.4771013259887695, "global_step": 104314, "epoch": 2483} {"train_loss": -6.421572208404541, "global_step": 104315, "epoch": 2483} {"train_loss": -6.339842319488525, "global_step": 104316, "epoch": 2483} {"train_loss": -6.304808616638184, "global_step": 104317, "epoch": 2483} {"train_loss": -6.411631107330322, "global_step": 104318, "epoch": 2483} {"train_loss": -6.290103912353516, "global_step": 104319, "epoch": 2483} {"train_loss": -6.347827911376953, "global_step": 104320, "epoch": 2483} {"train_loss": -6.357098579406738, "global_step": 104321, "epoch": 2483} {"train_loss": -6.34480619430542, "global_step": 104322, "epoch": 2483} {"train_loss": -6.19912052154541, "global_step": 104323, "epoch": 2483} {"train_loss": -6.381776332855225, "global_step": 104324, "epoch": 2483} {"train_loss": -6.3282246589660645, "global_step": 104325, "epoch": 2483} {"train_loss": -6.354082107543945, "global_step": 104326, "epoch": 2483} {"train_loss": -6.3527914342426115, "global_step": 104327, "epoch": 2483, "val_loss": 67811.15625} {"train_loss": -6.5217180252075195, "global_step": 104328, "epoch": 2484} {"train_loss": -6.280160427093506, "global_step": 104329, "epoch": 2484} {"train_loss": -6.551743030548096, "global_step": 104330, "epoch": 2484} {"train_loss": -6.333845138549805, "global_step": 104331, "epoch": 2484} {"train_loss": -6.481015682220459, "global_step": 104332, "epoch": 2484} {"train_loss": -6.3565592765808105, "global_step": 104333, "epoch": 2484} {"train_loss": -6.2971014976501465, "global_step": 104334, "epoch": 2484} {"train_loss": -6.289924621582031, "global_step": 104335, "epoch": 2484} {"train_loss": -6.4416399002075195, "global_step": 104336, "epoch": 2484} {"train_loss": -6.333878517150879, "global_step": 104337, "epoch": 2484} {"train_loss": -6.352191925048828, "global_step": 104338, "epoch": 2484} {"train_loss": -6.395961284637451, "global_step": 104339, "epoch": 2484} {"train_loss": -6.2936248779296875, "global_step": 104340, "epoch": 2484} {"train_loss": -6.398020267486572, "global_step": 104341, "epoch": 2484} {"train_loss": -6.426618576049805, "global_step": 104342, "epoch": 2484} {"train_loss": -6.469010353088379, "global_step": 104343, "epoch": 2484} {"train_loss": -6.461406230926514, "global_step": 104344, "epoch": 2484} {"train_loss": -6.396327018737793, "global_step": 104345, "epoch": 2484} {"train_loss": -6.5047783851623535, "global_step": 104346, "epoch": 2484} {"train_loss": -6.348555564880371, "global_step": 104347, "epoch": 2484} {"train_loss": -6.460700511932373, "global_step": 104348, "epoch": 2484} {"train_loss": -6.461615085601807, "global_step": 104349, "epoch": 2484} {"train_loss": -6.272430419921875, "global_step": 104350, "epoch": 2484} {"train_loss": -6.339550018310547, "global_step": 104351, "epoch": 2484} {"train_loss": -6.406145095825195, "global_step": 104352, "epoch": 2484} {"train_loss": -6.316262245178223, "global_step": 104353, "epoch": 2484} {"train_loss": -6.238543510437012, "global_step": 104354, "epoch": 2484} {"train_loss": -6.4020490646362305, "global_step": 104355, "epoch": 2484} {"train_loss": -6.266617774963379, "global_step": 104356, "epoch": 2484} {"train_loss": -6.319684982299805, "global_step": 104357, "epoch": 2484} {"train_loss": -6.48654842376709, "global_step": 104358, "epoch": 2484} {"train_loss": -6.283055305480957, "global_step": 104359, "epoch": 2484} {"train_loss": -6.433261871337891, "global_step": 104360, "epoch": 2484} {"train_loss": -6.367293834686279, "global_step": 104361, "epoch": 2484} {"train_loss": -6.263803482055664, "global_step": 104362, "epoch": 2484} {"train_loss": -6.416866779327393, "global_step": 104363, "epoch": 2484} {"train_loss": -6.364623069763184, "global_step": 104364, "epoch": 2484} {"train_loss": -6.529560089111328, "global_step": 104365, "epoch": 2484} {"train_loss": -6.327375411987305, "global_step": 104366, "epoch": 2484} {"train_loss": -6.36212682723999, "global_step": 104367, "epoch": 2484} {"train_loss": -6.461915969848633, "global_step": 104368, "epoch": 2484} {"train_loss": -6.383959497724261, "global_step": 104369, "epoch": 2484, "val_loss": 67972.5625} {"train_loss": -6.2922821044921875, "global_step": 104370, "epoch": 2485} {"train_loss": -6.3542585372924805, "global_step": 104371, "epoch": 2485} {"train_loss": -6.39048957824707, "global_step": 104372, "epoch": 2485} {"train_loss": -6.404675006866455, "global_step": 104373, "epoch": 2485} {"train_loss": -6.353923797607422, "global_step": 104374, "epoch": 2485} {"train_loss": -6.36185884475708, "global_step": 104375, "epoch": 2485} {"train_loss": -6.333860874176025, "global_step": 104376, "epoch": 2485} {"train_loss": -6.236600399017334, "global_step": 104377, "epoch": 2485} {"train_loss": -6.358863353729248, "global_step": 104378, "epoch": 2485} {"train_loss": -6.184194564819336, "global_step": 104379, "epoch": 2485} {"train_loss": -6.291616439819336, "global_step": 104380, "epoch": 2485} {"train_loss": -6.2799882888793945, "global_step": 104381, "epoch": 2485} {"train_loss": -6.401176929473877, "global_step": 104382, "epoch": 2485} {"train_loss": -6.251605987548828, "global_step": 104383, "epoch": 2485} {"train_loss": -6.329425811767578, "global_step": 104384, "epoch": 2485} {"train_loss": -6.259499549865723, "global_step": 104385, "epoch": 2485} {"train_loss": -6.307531833648682, "global_step": 104386, "epoch": 2485} {"train_loss": -6.466666221618652, "global_step": 104387, "epoch": 2485} {"train_loss": -6.329401016235352, "global_step": 104388, "epoch": 2485} {"train_loss": -6.326460838317871, "global_step": 104389, "epoch": 2485} {"train_loss": -6.364067077636719, "global_step": 104390, "epoch": 2485} {"train_loss": -6.358231067657471, "global_step": 104391, "epoch": 2485} {"train_loss": -6.327288627624512, "global_step": 104392, "epoch": 2485} {"train_loss": -6.309451103210449, "global_step": 104393, "epoch": 2485} {"train_loss": -6.321584224700928, "global_step": 104394, "epoch": 2485} {"train_loss": -6.3022260665893555, "global_step": 104395, "epoch": 2485} {"train_loss": -6.305151462554932, "global_step": 104396, "epoch": 2485} {"train_loss": -6.300766944885254, "global_step": 104397, "epoch": 2485} {"train_loss": -6.4514594078063965, "global_step": 104398, "epoch": 2485} {"train_loss": -6.384695053100586, "global_step": 104399, "epoch": 2485} {"train_loss": -6.433376312255859, "global_step": 104400, "epoch": 2485} {"train_loss": -6.313921928405762, "global_step": 104401, "epoch": 2485} {"train_loss": -6.474508762359619, "global_step": 104402, "epoch": 2485} {"train_loss": -6.308836936950684, "global_step": 104403, "epoch": 2485} {"train_loss": -6.373579025268555, "global_step": 104404, "epoch": 2485} {"train_loss": -6.444299697875977, "global_step": 104405, "epoch": 2485} {"train_loss": -6.401294708251953, "global_step": 104406, "epoch": 2485} {"train_loss": -6.349907875061035, "global_step": 104407, "epoch": 2485} {"train_loss": -6.426443099975586, "global_step": 104408, "epoch": 2485} {"train_loss": -6.437165260314941, "global_step": 104409, "epoch": 2485} {"train_loss": -6.275829315185547, "global_step": 104410, "epoch": 2485} {"train_loss": -6.347375994636899, "global_step": 104411, "epoch": 2485, "val_loss": 67924.375} {"train_loss": -6.334212779998779, "global_step": 104412, "epoch": 2486} {"train_loss": -6.300105571746826, "global_step": 104413, "epoch": 2486} {"train_loss": -6.4507904052734375, "global_step": 104414, "epoch": 2486} {"train_loss": -6.346896171569824, "global_step": 104415, "epoch": 2486} {"train_loss": -6.307225227355957, "global_step": 104416, "epoch": 2486} {"train_loss": -6.448777675628662, "global_step": 104417, "epoch": 2486} {"train_loss": -6.397857666015625, "global_step": 104418, "epoch": 2486} {"train_loss": -6.3508100509643555, "global_step": 104419, "epoch": 2486} {"train_loss": -6.3683180809021, "global_step": 104420, "epoch": 2486} {"train_loss": -6.281309127807617, "global_step": 104421, "epoch": 2486} {"train_loss": -6.384608745574951, "global_step": 104422, "epoch": 2486} {"train_loss": -6.468839645385742, "global_step": 104423, "epoch": 2486} {"train_loss": -6.43942928314209, "global_step": 104424, "epoch": 2486} {"train_loss": -6.245375633239746, "global_step": 104425, "epoch": 2486} {"train_loss": -6.391625881195068, "global_step": 104426, "epoch": 2486} {"train_loss": -6.41737699508667, "global_step": 104427, "epoch": 2486} {"train_loss": -6.305218696594238, "global_step": 104428, "epoch": 2486} {"train_loss": -6.399057865142822, "global_step": 104429, "epoch": 2486} {"train_loss": -6.460086822509766, "global_step": 104430, "epoch": 2486} {"train_loss": -6.454127311706543, "global_step": 104431, "epoch": 2486} {"train_loss": -6.448456764221191, "global_step": 104432, "epoch": 2486} {"train_loss": -6.446228504180908, "global_step": 104433, "epoch": 2486} {"train_loss": -6.469809055328369, "global_step": 104434, "epoch": 2486} {"train_loss": -6.462614059448242, "global_step": 104435, "epoch": 2486} {"train_loss": -6.449550628662109, "global_step": 104436, "epoch": 2486} {"train_loss": -6.508829116821289, "global_step": 104437, "epoch": 2486} {"train_loss": -6.324578762054443, "global_step": 104438, "epoch": 2486} {"train_loss": -6.459957122802734, "global_step": 104439, "epoch": 2486} {"train_loss": -6.371323585510254, "global_step": 104440, "epoch": 2486} {"train_loss": -6.424754619598389, "global_step": 104441, "epoch": 2486} {"train_loss": -6.4211955070495605, "global_step": 104442, "epoch": 2486} {"train_loss": -6.393752574920654, "global_step": 104443, "epoch": 2486} {"train_loss": -6.464548110961914, "global_step": 104444, "epoch": 2486} {"train_loss": -6.402979850769043, "global_step": 104445, "epoch": 2486} {"train_loss": -6.490016460418701, "global_step": 104446, "epoch": 2486} {"train_loss": -6.409981727600098, "global_step": 104447, "epoch": 2486} {"train_loss": -6.535116195678711, "global_step": 104448, "epoch": 2486} {"train_loss": -6.334831237792969, "global_step": 104449, "epoch": 2486} {"train_loss": -6.355496406555176, "global_step": 104450, "epoch": 2486} {"train_loss": -6.411590576171875, "global_step": 104451, "epoch": 2486} {"train_loss": -6.347929000854492, "global_step": 104452, "epoch": 2486} {"train_loss": -6.40176949046907, "global_step": 104453, "epoch": 2486, "val_loss": 67856.84375} {"train_loss": -6.468423366546631, "global_step": 104454, "epoch": 2487} {"train_loss": -6.482030391693115, "global_step": 104455, "epoch": 2487} {"train_loss": -6.4133100509643555, "global_step": 104456, "epoch": 2487} {"train_loss": -6.420943260192871, "global_step": 104457, "epoch": 2487} {"train_loss": -6.388858795166016, "global_step": 104458, "epoch": 2487} {"train_loss": -6.444660663604736, "global_step": 104459, "epoch": 2487} {"train_loss": -6.431275367736816, "global_step": 104460, "epoch": 2487} {"train_loss": -6.478050708770752, "global_step": 104461, "epoch": 2487} {"train_loss": -6.288748741149902, "global_step": 104462, "epoch": 2487} {"train_loss": -6.454766750335693, "global_step": 104463, "epoch": 2487} {"train_loss": -6.489601135253906, "global_step": 104464, "epoch": 2487} {"train_loss": -6.2620697021484375, "global_step": 104465, "epoch": 2487} {"train_loss": -6.4896626472473145, "global_step": 104466, "epoch": 2487} {"train_loss": -6.4637298583984375, "global_step": 104467, "epoch": 2487} {"train_loss": -6.397797107696533, "global_step": 104468, "epoch": 2487} {"train_loss": -6.351696968078613, "global_step": 104469, "epoch": 2487} {"train_loss": -6.365885257720947, "global_step": 104470, "epoch": 2487} {"train_loss": -6.343184947967529, "global_step": 104471, "epoch": 2487} {"train_loss": -6.473289489746094, "global_step": 104472, "epoch": 2487} {"train_loss": -6.363697528839111, "global_step": 104473, "epoch": 2487} {"train_loss": -6.261793613433838, "global_step": 104474, "epoch": 2487} {"train_loss": -6.384922027587891, "global_step": 104475, "epoch": 2487} {"train_loss": -6.387874603271484, "global_step": 104476, "epoch": 2487} {"train_loss": -6.269165992736816, "global_step": 104477, "epoch": 2487} {"train_loss": -6.2853546142578125, "global_step": 104478, "epoch": 2487} {"train_loss": -6.342307090759277, "global_step": 104479, "epoch": 2487} {"train_loss": -6.370248317718506, "global_step": 104480, "epoch": 2487} {"train_loss": -6.531207084655762, "global_step": 104481, "epoch": 2487} {"train_loss": -6.431071758270264, "global_step": 104482, "epoch": 2487} {"train_loss": -6.457906723022461, "global_step": 104483, "epoch": 2487} {"train_loss": -6.2482805252075195, "global_step": 104484, "epoch": 2487} {"train_loss": -6.356624603271484, "global_step": 104485, "epoch": 2487} {"train_loss": -6.456584930419922, "global_step": 104486, "epoch": 2487} {"train_loss": -6.460683345794678, "global_step": 104487, "epoch": 2487} {"train_loss": -6.366270065307617, "global_step": 104488, "epoch": 2487} {"train_loss": -6.4394731521606445, "global_step": 104489, "epoch": 2487} {"train_loss": -6.357654571533203, "global_step": 104490, "epoch": 2487} {"train_loss": -6.284085273742676, "global_step": 104491, "epoch": 2487} {"train_loss": -6.370359897613525, "global_step": 104492, "epoch": 2487} {"train_loss": -6.354679107666016, "global_step": 104493, "epoch": 2487} {"train_loss": -6.355712890625, "global_step": 104494, "epoch": 2487} {"train_loss": -6.392254136857533, "global_step": 104495, "epoch": 2487, "val_loss": 68022.328125} {"train_loss": -6.420586109161377, "global_step": 104496, "epoch": 2488} {"train_loss": -6.325469493865967, "global_step": 104497, "epoch": 2488} {"train_loss": -6.41185188293457, "global_step": 104498, "epoch": 2488} {"train_loss": -6.283020973205566, "global_step": 104499, "epoch": 2488} {"train_loss": -6.407338619232178, "global_step": 104500, "epoch": 2488} {"train_loss": -6.399681568145752, "global_step": 104501, "epoch": 2488} {"train_loss": -6.349491119384766, "global_step": 104502, "epoch": 2488} {"train_loss": -6.40770149230957, "global_step": 104503, "epoch": 2488} {"train_loss": -6.450070381164551, "global_step": 104504, "epoch": 2488} {"train_loss": -6.474462509155273, "global_step": 104505, "epoch": 2488} {"train_loss": -6.475729942321777, "global_step": 104506, "epoch": 2488} {"train_loss": -6.488540172576904, "global_step": 104507, "epoch": 2488} {"train_loss": -6.405770301818848, "global_step": 104508, "epoch": 2488} {"train_loss": -6.505317211151123, "global_step": 104509, "epoch": 2488} {"train_loss": -6.330316543579102, "global_step": 104510, "epoch": 2488} {"train_loss": -6.353516578674316, "global_step": 104511, "epoch": 2488} {"train_loss": -6.468147277832031, "global_step": 104512, "epoch": 2488} {"train_loss": -6.338814735412598, "global_step": 104513, "epoch": 2488} {"train_loss": -6.492508888244629, "global_step": 104514, "epoch": 2488} {"train_loss": -6.346914291381836, "global_step": 104515, "epoch": 2488} {"train_loss": -6.312017917633057, "global_step": 104516, "epoch": 2488} {"train_loss": -6.3466291427612305, "global_step": 104517, "epoch": 2488} {"train_loss": -6.299314498901367, "global_step": 104518, "epoch": 2488} {"train_loss": -6.485591888427734, "global_step": 104519, "epoch": 2488} {"train_loss": -6.258018493652344, "global_step": 104520, "epoch": 2488} {"train_loss": -6.336329460144043, "global_step": 104521, "epoch": 2488} {"train_loss": -6.303829193115234, "global_step": 104522, "epoch": 2488} {"train_loss": -6.314199447631836, "global_step": 104523, "epoch": 2488} {"train_loss": -6.347609519958496, "global_step": 104524, "epoch": 2488} {"train_loss": -6.377624988555908, "global_step": 104525, "epoch": 2488} {"train_loss": -6.361491680145264, "global_step": 104526, "epoch": 2488} {"train_loss": -6.288654804229736, "global_step": 104527, "epoch": 2488} {"train_loss": -6.423982620239258, "global_step": 104528, "epoch": 2488} {"train_loss": -6.341504096984863, "global_step": 104529, "epoch": 2488} {"train_loss": -6.409790992736816, "global_step": 104530, "epoch": 2488} {"train_loss": -6.37025260925293, "global_step": 104531, "epoch": 2488} {"train_loss": -6.408507347106934, "global_step": 104532, "epoch": 2488} {"train_loss": -6.321118354797363, "global_step": 104533, "epoch": 2488} {"train_loss": -6.349441051483154, "global_step": 104534, "epoch": 2488} {"train_loss": -6.455164909362793, "global_step": 104535, "epoch": 2488} {"train_loss": -6.412543296813965, "global_step": 104536, "epoch": 2488} {"train_loss": -6.3820660681951615, "global_step": 104537, "epoch": 2488, "val_loss": 67913.484375} {"train_loss": -6.457050323486328, "global_step": 104538, "epoch": 2489} {"train_loss": -6.409071922302246, "global_step": 104539, "epoch": 2489} {"train_loss": -6.290217399597168, "global_step": 104540, "epoch": 2489} {"train_loss": -6.4403557777404785, "global_step": 104541, "epoch": 2489} {"train_loss": -6.382049083709717, "global_step": 104542, "epoch": 2489} {"train_loss": -6.418956756591797, "global_step": 104543, "epoch": 2489} {"train_loss": -6.391446113586426, "global_step": 104544, "epoch": 2489} {"train_loss": -6.327826499938965, "global_step": 104545, "epoch": 2489} {"train_loss": -6.343405723571777, "global_step": 104546, "epoch": 2489} {"train_loss": -6.544466972351074, "global_step": 104547, "epoch": 2489} {"train_loss": -6.430233955383301, "global_step": 104548, "epoch": 2489} {"train_loss": -6.393733978271484, "global_step": 104549, "epoch": 2489} {"train_loss": -6.255126953125, "global_step": 104550, "epoch": 2489} {"train_loss": -6.4145612716674805, "global_step": 104551, "epoch": 2489} {"train_loss": -6.258815765380859, "global_step": 104552, "epoch": 2489} {"train_loss": -6.513550281524658, "global_step": 104553, "epoch": 2489} {"train_loss": -6.310378551483154, "global_step": 104554, "epoch": 2489} {"train_loss": -6.344544410705566, "global_step": 104555, "epoch": 2489} {"train_loss": -6.447749137878418, "global_step": 104556, "epoch": 2489} {"train_loss": -6.341681480407715, "global_step": 104557, "epoch": 2489} {"train_loss": -6.370099067687988, "global_step": 104558, "epoch": 2489} {"train_loss": -6.3178558349609375, "global_step": 104559, "epoch": 2489} {"train_loss": -6.376650333404541, "global_step": 104560, "epoch": 2489} {"train_loss": -6.330204963684082, "global_step": 104561, "epoch": 2489} {"train_loss": -6.390683650970459, "global_step": 104562, "epoch": 2489} {"train_loss": -6.313485145568848, "global_step": 104563, "epoch": 2489} {"train_loss": -6.374172210693359, "global_step": 104564, "epoch": 2489} {"train_loss": -6.310455799102783, "global_step": 104565, "epoch": 2489} {"train_loss": -6.277105331420898, "global_step": 104566, "epoch": 2489} {"train_loss": -6.281867027282715, "global_step": 104567, "epoch": 2489} {"train_loss": -6.324618339538574, "global_step": 104568, "epoch": 2489} {"train_loss": -6.350248336791992, "global_step": 104569, "epoch": 2489} {"train_loss": -6.320672988891602, "global_step": 104570, "epoch": 2489} {"train_loss": -6.2828874588012695, "global_step": 104571, "epoch": 2489} {"train_loss": -6.300424575805664, "global_step": 104572, "epoch": 2489} {"train_loss": -6.300747871398926, "global_step": 104573, "epoch": 2489} {"train_loss": -6.40455436706543, "global_step": 104574, "epoch": 2489} {"train_loss": -6.404963493347168, "global_step": 104575, "epoch": 2489} {"train_loss": -6.433967590332031, "global_step": 104576, "epoch": 2489} {"train_loss": -6.375259876251221, "global_step": 104577, "epoch": 2489} {"train_loss": -6.316001892089844, "global_step": 104578, "epoch": 2489} {"train_loss": -6.363016344252086, "global_step": 104579, "epoch": 2489, "val_loss": 67774.640625} {"train_loss": -6.4514336585998535, "global_step": 104580, "epoch": 2490} {"train_loss": -6.360698699951172, "global_step": 104581, "epoch": 2490} {"train_loss": -6.4304609298706055, "global_step": 104582, "epoch": 2490} {"train_loss": -6.421404838562012, "global_step": 104583, "epoch": 2490} {"train_loss": -6.245464324951172, "global_step": 104584, "epoch": 2490} {"train_loss": -6.265357494354248, "global_step": 104585, "epoch": 2490} {"train_loss": -6.246342182159424, "global_step": 104586, "epoch": 2490} {"train_loss": -6.53267765045166, "global_step": 104587, "epoch": 2490} {"train_loss": -6.420182228088379, "global_step": 104588, "epoch": 2490} {"train_loss": -6.365759372711182, "global_step": 104589, "epoch": 2490} {"train_loss": -6.296723365783691, "global_step": 104590, "epoch": 2490} {"train_loss": -6.297099590301514, "global_step": 104591, "epoch": 2490} {"train_loss": -6.599700450897217, "global_step": 104592, "epoch": 2490} {"train_loss": -6.374286651611328, "global_step": 104593, "epoch": 2490} {"train_loss": -6.331045150756836, "global_step": 104594, "epoch": 2490} {"train_loss": -6.371369361877441, "global_step": 104595, "epoch": 2490} {"train_loss": -6.3602800369262695, "global_step": 104596, "epoch": 2490} {"train_loss": -6.381699562072754, "global_step": 104597, "epoch": 2490} {"train_loss": -6.381840705871582, "global_step": 104598, "epoch": 2490} {"train_loss": -6.414592742919922, "global_step": 104599, "epoch": 2490} {"train_loss": -6.434288024902344, "global_step": 104600, "epoch": 2490} {"train_loss": -6.341182708740234, "global_step": 104601, "epoch": 2490} {"train_loss": -6.429267406463623, "global_step": 104602, "epoch": 2490} {"train_loss": -6.370751857757568, "global_step": 104603, "epoch": 2490} {"train_loss": -6.444787502288818, "global_step": 104604, "epoch": 2490} {"train_loss": -6.46516227722168, "global_step": 104605, "epoch": 2490} {"train_loss": -6.307114124298096, "global_step": 104606, "epoch": 2490} {"train_loss": -6.4749250411987305, "global_step": 104607, "epoch": 2490} {"train_loss": -6.26810884475708, "global_step": 104608, "epoch": 2490} {"train_loss": -6.347891807556152, "global_step": 104609, "epoch": 2490} {"train_loss": -6.459753036499023, "global_step": 104610, "epoch": 2490} {"train_loss": -6.31816291809082, "global_step": 104611, "epoch": 2490} {"train_loss": -6.444828033447266, "global_step": 104612, "epoch": 2490} {"train_loss": -6.514773368835449, "global_step": 104613, "epoch": 2490} {"train_loss": -6.2634382247924805, "global_step": 104614, "epoch": 2490} {"train_loss": -6.513373374938965, "global_step": 104615, "epoch": 2490} {"train_loss": -6.214517593383789, "global_step": 104616, "epoch": 2490} {"train_loss": -6.472306728363037, "global_step": 104617, "epoch": 2490} {"train_loss": -6.42413330078125, "global_step": 104618, "epoch": 2490} {"train_loss": -6.37534236907959, "global_step": 104619, "epoch": 2490} {"train_loss": -6.414798736572266, "global_step": 104620, "epoch": 2490} {"train_loss": -6.385324217024303, "global_step": 104621, "epoch": 2490, "val_loss": 67762.90625} {"train_loss": -6.368293762207031, "global_step": 104622, "epoch": 2491} {"train_loss": -6.258386135101318, "global_step": 104623, "epoch": 2491} {"train_loss": -6.4311418533325195, "global_step": 104624, "epoch": 2491} {"train_loss": -6.367250442504883, "global_step": 104625, "epoch": 2491} {"train_loss": -6.290473937988281, "global_step": 104626, "epoch": 2491} {"train_loss": -6.374743461608887, "global_step": 104627, "epoch": 2491} {"train_loss": -6.493303298950195, "global_step": 104628, "epoch": 2491} {"train_loss": -6.436375617980957, "global_step": 104629, "epoch": 2491} {"train_loss": -6.341851711273193, "global_step": 104630, "epoch": 2491} {"train_loss": -6.426992416381836, "global_step": 104631, "epoch": 2491} {"train_loss": -6.338814735412598, "global_step": 104632, "epoch": 2491} {"train_loss": -6.513175010681152, "global_step": 104633, "epoch": 2491} {"train_loss": -6.4352827072143555, "global_step": 104634, "epoch": 2491} {"train_loss": -6.493214130401611, "global_step": 104635, "epoch": 2491} {"train_loss": -6.458054065704346, "global_step": 104636, "epoch": 2491} {"train_loss": -6.322075366973877, "global_step": 104637, "epoch": 2491} {"train_loss": -6.409677505493164, "global_step": 104638, "epoch": 2491} {"train_loss": -6.369414329528809, "global_step": 104639, "epoch": 2491} {"train_loss": -6.455554008483887, "global_step": 104640, "epoch": 2491} {"train_loss": -6.282386302947998, "global_step": 104641, "epoch": 2491} {"train_loss": -6.3729071617126465, "global_step": 104642, "epoch": 2491} {"train_loss": -6.287678241729736, "global_step": 104643, "epoch": 2491} {"train_loss": -6.490907192230225, "global_step": 104644, "epoch": 2491} {"train_loss": -6.287506103515625, "global_step": 104645, "epoch": 2491} {"train_loss": -6.4408650398254395, "global_step": 104646, "epoch": 2491} {"train_loss": -6.474066734313965, "global_step": 104647, "epoch": 2491} {"train_loss": -6.378145217895508, "global_step": 104648, "epoch": 2491} {"train_loss": -6.451703071594238, "global_step": 104649, "epoch": 2491} {"train_loss": -6.433868408203125, "global_step": 104650, "epoch": 2491} {"train_loss": -6.404941082000732, "global_step": 104651, "epoch": 2491} {"train_loss": -6.40101432800293, "global_step": 104652, "epoch": 2491} {"train_loss": -6.290375709533691, "global_step": 104653, "epoch": 2491} {"train_loss": -6.404661178588867, "global_step": 104654, "epoch": 2491} {"train_loss": -6.396636009216309, "global_step": 104655, "epoch": 2491} {"train_loss": -6.334129333496094, "global_step": 104656, "epoch": 2491} {"train_loss": -6.309892654418945, "global_step": 104657, "epoch": 2491} {"train_loss": -6.291889190673828, "global_step": 104658, "epoch": 2491} {"train_loss": -6.340526580810547, "global_step": 104659, "epoch": 2491} {"train_loss": -6.291901588439941, "global_step": 104660, "epoch": 2491} {"train_loss": -6.219864845275879, "global_step": 104661, "epoch": 2491} {"train_loss": -6.220186233520508, "global_step": 104662, "epoch": 2491} {"train_loss": -6.3774196193331765, "global_step": 104663, "epoch": 2491, "val_loss": 68163.2890625} {"train_loss": -6.363410949707031, "global_step": 104664, "epoch": 2492} {"train_loss": -6.416730880737305, "global_step": 104665, "epoch": 2492} {"train_loss": -6.431065559387207, "global_step": 104666, "epoch": 2492} {"train_loss": -6.3844709396362305, "global_step": 104667, "epoch": 2492} {"train_loss": -6.381076335906982, "global_step": 104668, "epoch": 2492} {"train_loss": -6.456031799316406, "global_step": 104669, "epoch": 2492} {"train_loss": -6.483229637145996, "global_step": 104670, "epoch": 2492} {"train_loss": -6.345066070556641, "global_step": 104671, "epoch": 2492} {"train_loss": -6.348559856414795, "global_step": 104672, "epoch": 2492} {"train_loss": -6.431002140045166, "global_step": 104673, "epoch": 2492} {"train_loss": -6.491090297698975, "global_step": 104674, "epoch": 2492} {"train_loss": -6.415361404418945, "global_step": 104675, "epoch": 2492} {"train_loss": -6.476842880249023, "global_step": 104676, "epoch": 2492} {"train_loss": -6.459953784942627, "global_step": 104677, "epoch": 2492} {"train_loss": -6.407031536102295, "global_step": 104678, "epoch": 2492} {"train_loss": -6.430449962615967, "global_step": 104679, "epoch": 2492} {"train_loss": -6.430202484130859, "global_step": 104680, "epoch": 2492} {"train_loss": -6.441151142120361, "global_step": 104681, "epoch": 2492} {"train_loss": -6.396807670593262, "global_step": 104682, "epoch": 2492} {"train_loss": -6.298774719238281, "global_step": 104683, "epoch": 2492} {"train_loss": -6.343733787536621, "global_step": 104684, "epoch": 2492} {"train_loss": -6.252216339111328, "global_step": 104685, "epoch": 2492} {"train_loss": -6.243036270141602, "global_step": 104686, "epoch": 2492} {"train_loss": -6.36528205871582, "global_step": 104687, "epoch": 2492} {"train_loss": -6.300428867340088, "global_step": 104688, "epoch": 2492} {"train_loss": -6.2552032470703125, "global_step": 104689, "epoch": 2492} {"train_loss": -6.277290344238281, "global_step": 104690, "epoch": 2492} {"train_loss": -6.288280963897705, "global_step": 104691, "epoch": 2492} {"train_loss": -6.375556468963623, "global_step": 104692, "epoch": 2492} {"train_loss": -6.314105033874512, "global_step": 104693, "epoch": 2492} {"train_loss": -6.33365535736084, "global_step": 104694, "epoch": 2492} {"train_loss": -6.31463623046875, "global_step": 104695, "epoch": 2492} {"train_loss": -6.321503639221191, "global_step": 104696, "epoch": 2492} {"train_loss": -6.299533843994141, "global_step": 104697, "epoch": 2492} {"train_loss": -6.234429359436035, "global_step": 104698, "epoch": 2492} {"train_loss": -6.4106292724609375, "global_step": 104699, "epoch": 2492} {"train_loss": -6.311697959899902, "global_step": 104700, "epoch": 2492} {"train_loss": -6.2069807052612305, "global_step": 104701, "epoch": 2492} {"train_loss": -6.330502510070801, "global_step": 104702, "epoch": 2492} {"train_loss": -6.176006317138672, "global_step": 104703, "epoch": 2492} {"train_loss": -6.369939804077148, "global_step": 104704, "epoch": 2492} {"train_loss": -6.353698912121001, "global_step": 104705, "epoch": 2492, "val_loss": 68059.71875} {"train_loss": -6.342029571533203, "global_step": 104706, "epoch": 2493} {"train_loss": -6.445535659790039, "global_step": 104707, "epoch": 2493} {"train_loss": -6.450618743896484, "global_step": 104708, "epoch": 2493} {"train_loss": -6.414378643035889, "global_step": 104709, "epoch": 2493} {"train_loss": -6.416950702667236, "global_step": 104710, "epoch": 2493} {"train_loss": -6.278163433074951, "global_step": 104711, "epoch": 2493} {"train_loss": -6.2689361572265625, "global_step": 104712, "epoch": 2493} {"train_loss": -6.321005821228027, "global_step": 104713, "epoch": 2493} {"train_loss": -6.310967445373535, "global_step": 104714, "epoch": 2493} {"train_loss": -6.325080394744873, "global_step": 104715, "epoch": 2493} {"train_loss": -6.257579326629639, "global_step": 104716, "epoch": 2493} {"train_loss": -6.297069072723389, "global_step": 104717, "epoch": 2493} {"train_loss": -6.408928871154785, "global_step": 104718, "epoch": 2493} {"train_loss": -6.375389099121094, "global_step": 104719, "epoch": 2493} {"train_loss": -6.213529586791992, "global_step": 104720, "epoch": 2493} {"train_loss": -6.389346122741699, "global_step": 104721, "epoch": 2493} {"train_loss": -6.424660682678223, "global_step": 104722, "epoch": 2493} {"train_loss": -6.286038398742676, "global_step": 104723, "epoch": 2493} {"train_loss": -6.420787811279297, "global_step": 104724, "epoch": 2493} {"train_loss": -6.431756973266602, "global_step": 104725, "epoch": 2493} {"train_loss": -6.434347152709961, "global_step": 104726, "epoch": 2493} {"train_loss": -6.4265546798706055, "global_step": 104727, "epoch": 2493} {"train_loss": -6.447190284729004, "global_step": 104728, "epoch": 2493} {"train_loss": -6.414040565490723, "global_step": 104729, "epoch": 2493} {"train_loss": -6.354500770568848, "global_step": 104730, "epoch": 2493} {"train_loss": -6.408074378967285, "global_step": 104731, "epoch": 2493} {"train_loss": -6.41856050491333, "global_step": 104732, "epoch": 2493} {"train_loss": -6.390588760375977, "global_step": 104733, "epoch": 2493} {"train_loss": -6.4607086181640625, "global_step": 104734, "epoch": 2493} {"train_loss": -6.339874267578125, "global_step": 104735, "epoch": 2493} {"train_loss": -6.382559776306152, "global_step": 104736, "epoch": 2493} {"train_loss": -6.489065647125244, "global_step": 104737, "epoch": 2493} {"train_loss": -6.440484523773193, "global_step": 104738, "epoch": 2493} {"train_loss": -6.300814151763916, "global_step": 104739, "epoch": 2493} {"train_loss": -6.410870552062988, "global_step": 104740, "epoch": 2493} {"train_loss": -6.377532005310059, "global_step": 104741, "epoch": 2493} {"train_loss": -6.34597110748291, "global_step": 104742, "epoch": 2493} {"train_loss": -6.325191497802734, "global_step": 104743, "epoch": 2493} {"train_loss": -6.381267547607422, "global_step": 104744, "epoch": 2493} {"train_loss": -6.375112056732178, "global_step": 104745, "epoch": 2493} {"train_loss": -6.4496355056762695, "global_step": 104746, "epoch": 2493} {"train_loss": -6.3757190363747736, "global_step": 104747, "epoch": 2493, "val_loss": 67817.5546875} {"train_loss": -6.346517562866211, "global_step": 104748, "epoch": 2494} {"train_loss": -6.539470672607422, "global_step": 104749, "epoch": 2494} {"train_loss": -6.458131313323975, "global_step": 104750, "epoch": 2494} {"train_loss": -6.356199264526367, "global_step": 104751, "epoch": 2494} {"train_loss": -6.350931167602539, "global_step": 104752, "epoch": 2494} {"train_loss": -6.4110002517700195, "global_step": 104753, "epoch": 2494} {"train_loss": -6.47133731842041, "global_step": 104754, "epoch": 2494} {"train_loss": -6.426435470581055, "global_step": 104755, "epoch": 2494} {"train_loss": -6.321977615356445, "global_step": 104756, "epoch": 2494} {"train_loss": -6.420680999755859, "global_step": 104757, "epoch": 2494} {"train_loss": -6.435824394226074, "global_step": 104758, "epoch": 2494} {"train_loss": -6.296364784240723, "global_step": 104759, "epoch": 2494} {"train_loss": -6.238794803619385, "global_step": 104760, "epoch": 2494} {"train_loss": -6.479983329772949, "global_step": 104761, "epoch": 2494} {"train_loss": -6.354403972625732, "global_step": 104762, "epoch": 2494} {"train_loss": -6.365867614746094, "global_step": 104763, "epoch": 2494} {"train_loss": -6.146886825561523, "global_step": 104764, "epoch": 2494} {"train_loss": -6.339056968688965, "global_step": 104765, "epoch": 2494} {"train_loss": -6.3714141845703125, "global_step": 104766, "epoch": 2494} {"train_loss": -6.317838668823242, "global_step": 104767, "epoch": 2494} {"train_loss": -6.18936014175415, "global_step": 104768, "epoch": 2494} {"train_loss": -6.443652153015137, "global_step": 104769, "epoch": 2494} {"train_loss": -6.40245246887207, "global_step": 104770, "epoch": 2494} {"train_loss": -6.314662456512451, "global_step": 104771, "epoch": 2494} {"train_loss": -6.367804527282715, "global_step": 104772, "epoch": 2494} {"train_loss": -6.359708786010742, "global_step": 104773, "epoch": 2494} {"train_loss": -6.3415374755859375, "global_step": 104774, "epoch": 2494} {"train_loss": -6.407240867614746, "global_step": 104775, "epoch": 2494} {"train_loss": -6.308384418487549, "global_step": 104776, "epoch": 2494} {"train_loss": -6.358992576599121, "global_step": 104777, "epoch": 2494} {"train_loss": -6.211579322814941, "global_step": 104778, "epoch": 2494} {"train_loss": -6.409358024597168, "global_step": 104779, "epoch": 2494} {"train_loss": -6.3361310958862305, "global_step": 104780, "epoch": 2494} {"train_loss": -6.357213973999023, "global_step": 104781, "epoch": 2494} {"train_loss": -6.379185676574707, "global_step": 104782, "epoch": 2494} {"train_loss": -6.529563903808594, "global_step": 104783, "epoch": 2494} {"train_loss": -6.248963356018066, "global_step": 104784, "epoch": 2494} {"train_loss": -6.423976898193359, "global_step": 104785, "epoch": 2494} {"train_loss": -6.302028179168701, "global_step": 104786, "epoch": 2494} {"train_loss": -6.40891170501709, "global_step": 104787, "epoch": 2494} {"train_loss": -6.392014503479004, "global_step": 104788, "epoch": 2494} {"train_loss": -6.359330063774472, "global_step": 104789, "epoch": 2494, "val_loss": 67882.7578125} {"train_loss": -6.376106262207031, "global_step": 104790, "epoch": 2495} {"train_loss": -6.325403213500977, "global_step": 104791, "epoch": 2495} {"train_loss": -6.363750457763672, "global_step": 104792, "epoch": 2495} {"train_loss": -6.378840446472168, "global_step": 104793, "epoch": 2495} {"train_loss": -6.462841033935547, "global_step": 104794, "epoch": 2495} {"train_loss": -6.251118183135986, "global_step": 104795, "epoch": 2495} {"train_loss": -6.1837053298950195, "global_step": 104796, "epoch": 2495} {"train_loss": -6.300527572631836, "global_step": 104797, "epoch": 2495} {"train_loss": -6.2892961502075195, "global_step": 104798, "epoch": 2495} {"train_loss": -6.267793655395508, "global_step": 104799, "epoch": 2495} {"train_loss": -6.216516017913818, "global_step": 104800, "epoch": 2495} {"train_loss": -6.132706165313721, "global_step": 104801, "epoch": 2495} {"train_loss": -6.278424263000488, "global_step": 104802, "epoch": 2495} {"train_loss": -6.087338924407959, "global_step": 104803, "epoch": 2495} {"train_loss": -6.372906684875488, "global_step": 104804, "epoch": 2495} {"train_loss": -5.9954833984375, "global_step": 104805, "epoch": 2495} {"train_loss": -6.182244777679443, "global_step": 104806, "epoch": 2495} {"train_loss": -6.185019493103027, "global_step": 104807, "epoch": 2495} {"train_loss": -6.281859397888184, "global_step": 104808, "epoch": 2495} {"train_loss": -6.2167558670043945, "global_step": 104809, "epoch": 2495} {"train_loss": -6.275570869445801, "global_step": 104810, "epoch": 2495} {"train_loss": -6.147191047668457, "global_step": 104811, "epoch": 2495} {"train_loss": -6.302829265594482, "global_step": 104812, "epoch": 2495} {"train_loss": -6.338142395019531, "global_step": 104813, "epoch": 2495} {"train_loss": -6.252479553222656, "global_step": 104814, "epoch": 2495} {"train_loss": -6.297477722167969, "global_step": 104815, "epoch": 2495} {"train_loss": -6.307713508605957, "global_step": 104816, "epoch": 2495} {"train_loss": -6.2447614669799805, "global_step": 104817, "epoch": 2495} {"train_loss": -6.256181240081787, "global_step": 104818, "epoch": 2495} {"train_loss": -6.2845306396484375, "global_step": 104819, "epoch": 2495} {"train_loss": -6.334645748138428, "global_step": 104820, "epoch": 2495} {"train_loss": -6.329956531524658, "global_step": 104821, "epoch": 2495} {"train_loss": -6.421701431274414, "global_step": 104822, "epoch": 2495} {"train_loss": -6.259421348571777, "global_step": 104823, "epoch": 2495} {"train_loss": -6.270569801330566, "global_step": 104824, "epoch": 2495} {"train_loss": -6.42024040222168, "global_step": 104825, "epoch": 2495} {"train_loss": -6.422184467315674, "global_step": 104826, "epoch": 2495} {"train_loss": -6.384955883026123, "global_step": 104827, "epoch": 2495} {"train_loss": -6.333361625671387, "global_step": 104828, "epoch": 2495} {"train_loss": -6.362055778503418, "global_step": 104829, "epoch": 2495} {"train_loss": -6.279772758483887, "global_step": 104830, "epoch": 2495} {"train_loss": -6.286653007779803, "global_step": 104831, "epoch": 2495, "val_loss": 67908.140625} {"train_loss": -6.423966407775879, "global_step": 104832, "epoch": 2496} {"train_loss": -6.432981967926025, "global_step": 104833, "epoch": 2496} {"train_loss": -6.394733905792236, "global_step": 104834, "epoch": 2496} {"train_loss": -6.344926834106445, "global_step": 104835, "epoch": 2496} {"train_loss": -6.4408488273620605, "global_step": 104836, "epoch": 2496} {"train_loss": -6.306948661804199, "global_step": 104837, "epoch": 2496} {"train_loss": -6.412494659423828, "global_step": 104838, "epoch": 2496} {"train_loss": -6.419770240783691, "global_step": 104839, "epoch": 2496} {"train_loss": -6.463620185852051, "global_step": 104840, "epoch": 2496} {"train_loss": -6.3881378173828125, "global_step": 104841, "epoch": 2496} {"train_loss": -6.473160743713379, "global_step": 104842, "epoch": 2496} {"train_loss": -6.429454803466797, "global_step": 104843, "epoch": 2496} {"train_loss": -6.408146858215332, "global_step": 104844, "epoch": 2496} {"train_loss": -6.333099842071533, "global_step": 104845, "epoch": 2496} {"train_loss": -6.440253257751465, "global_step": 104846, "epoch": 2496} {"train_loss": -6.346323013305664, "global_step": 104847, "epoch": 2496} {"train_loss": -6.434729099273682, "global_step": 104848, "epoch": 2496} {"train_loss": -6.416353225708008, "global_step": 104849, "epoch": 2496} {"train_loss": -6.411700248718262, "global_step": 104850, "epoch": 2496} {"train_loss": -6.271020889282227, "global_step": 104851, "epoch": 2496} {"train_loss": -6.441407680511475, "global_step": 104852, "epoch": 2496} {"train_loss": -6.31251335144043, "global_step": 104853, "epoch": 2496} {"train_loss": -6.482888221740723, "global_step": 104854, "epoch": 2496} {"train_loss": -6.474238395690918, "global_step": 104855, "epoch": 2496} {"train_loss": -6.464877605438232, "global_step": 104856, "epoch": 2496} {"train_loss": -6.322799205780029, "global_step": 104857, "epoch": 2496} {"train_loss": -6.470109939575195, "global_step": 104858, "epoch": 2496} {"train_loss": -6.3753204345703125, "global_step": 104859, "epoch": 2496} {"train_loss": -6.332146167755127, "global_step": 104860, "epoch": 2496} {"train_loss": -6.477839469909668, "global_step": 104861, "epoch": 2496} {"train_loss": -6.473331451416016, "global_step": 104862, "epoch": 2496} {"train_loss": -6.317460536956787, "global_step": 104863, "epoch": 2496} {"train_loss": -6.455104827880859, "global_step": 104864, "epoch": 2496} {"train_loss": -6.395811080932617, "global_step": 104865, "epoch": 2496} {"train_loss": -6.366544723510742, "global_step": 104866, "epoch": 2496} {"train_loss": -6.4478278160095215, "global_step": 104867, "epoch": 2496} {"train_loss": -6.373391151428223, "global_step": 104868, "epoch": 2496} {"train_loss": -6.464493751525879, "global_step": 104869, "epoch": 2496} {"train_loss": -6.340003967285156, "global_step": 104870, "epoch": 2496} {"train_loss": -6.460781574249268, "global_step": 104871, "epoch": 2496} {"train_loss": -6.393111228942871, "global_step": 104872, "epoch": 2496} {"train_loss": -6.403917607806978, "global_step": 104873, "epoch": 2496, "val_loss": 68207.4375} {"train_loss": -6.3725996017456055, "global_step": 104874, "epoch": 2497} {"train_loss": -6.387948036193848, "global_step": 104875, "epoch": 2497} {"train_loss": -6.404977798461914, "global_step": 104876, "epoch": 2497} {"train_loss": -6.46959114074707, "global_step": 104877, "epoch": 2497} {"train_loss": -6.3141584396362305, "global_step": 104878, "epoch": 2497} {"train_loss": -6.415464401245117, "global_step": 104879, "epoch": 2497} {"train_loss": -6.311098098754883, "global_step": 104880, "epoch": 2497} {"train_loss": -6.366844177246094, "global_step": 104881, "epoch": 2497} {"train_loss": -6.443889617919922, "global_step": 104882, "epoch": 2497} {"train_loss": -6.414715766906738, "global_step": 104883, "epoch": 2497} {"train_loss": -6.474157810211182, "global_step": 104884, "epoch": 2497} {"train_loss": -6.4077253341674805, "global_step": 104885, "epoch": 2497} {"train_loss": -6.432792663574219, "global_step": 104886, "epoch": 2497} {"train_loss": -6.451300621032715, "global_step": 104887, "epoch": 2497} {"train_loss": -6.378533363342285, "global_step": 104888, "epoch": 2497} {"train_loss": -6.363546371459961, "global_step": 104889, "epoch": 2497} {"train_loss": -6.355278015136719, "global_step": 104890, "epoch": 2497} {"train_loss": -6.469777584075928, "global_step": 104891, "epoch": 2497} {"train_loss": -6.395421981811523, "global_step": 104892, "epoch": 2497} {"train_loss": -6.399468421936035, "global_step": 104893, "epoch": 2497} {"train_loss": -6.335051536560059, "global_step": 104894, "epoch": 2497} {"train_loss": -6.4376983642578125, "global_step": 104895, "epoch": 2497} {"train_loss": -6.4425153732299805, "global_step": 104896, "epoch": 2497} {"train_loss": -6.427474021911621, "global_step": 104897, "epoch": 2497} {"train_loss": -6.408390998840332, "global_step": 104898, "epoch": 2497} {"train_loss": -6.322925567626953, "global_step": 104899, "epoch": 2497} {"train_loss": -6.408531188964844, "global_step": 104900, "epoch": 2497} {"train_loss": -6.491791248321533, "global_step": 104901, "epoch": 2497} {"train_loss": -6.387231826782227, "global_step": 104902, "epoch": 2497} {"train_loss": -6.319807529449463, "global_step": 104903, "epoch": 2497} {"train_loss": -6.2453107833862305, "global_step": 104904, "epoch": 2497} {"train_loss": -6.4018144607543945, "global_step": 104905, "epoch": 2497} {"train_loss": -6.374289512634277, "global_step": 104906, "epoch": 2497} {"train_loss": -6.451000213623047, "global_step": 104907, "epoch": 2497} {"train_loss": -6.414456367492676, "global_step": 104908, "epoch": 2497} {"train_loss": -6.44907283782959, "global_step": 104909, "epoch": 2497} {"train_loss": -6.364366054534912, "global_step": 104910, "epoch": 2497} {"train_loss": -6.414758682250977, "global_step": 104911, "epoch": 2497} {"train_loss": -6.400923728942871, "global_step": 104912, "epoch": 2497} {"train_loss": -6.313345909118652, "global_step": 104913, "epoch": 2497} {"train_loss": -6.405791282653809, "global_step": 104914, "epoch": 2497} {"train_loss": -6.39861045564924, "global_step": 104915, "epoch": 2497, "val_loss": 67993.2265625} {"train_loss": -6.296505928039551, "global_step": 104916, "epoch": 2498} {"train_loss": -6.525785446166992, "global_step": 104917, "epoch": 2498} {"train_loss": -6.367783546447754, "global_step": 104918, "epoch": 2498} {"train_loss": -6.361611366271973, "global_step": 104919, "epoch": 2498} {"train_loss": -6.479101657867432, "global_step": 104920, "epoch": 2498} {"train_loss": -6.4216766357421875, "global_step": 104921, "epoch": 2498} {"train_loss": -6.424673557281494, "global_step": 104922, "epoch": 2498} {"train_loss": -6.487307548522949, "global_step": 104923, "epoch": 2498} {"train_loss": -6.442874908447266, "global_step": 104924, "epoch": 2498} {"train_loss": -6.348345756530762, "global_step": 104925, "epoch": 2498} {"train_loss": -6.301340579986572, "global_step": 104926, "epoch": 2498} {"train_loss": -6.451277732849121, "global_step": 104927, "epoch": 2498} {"train_loss": -6.3896942138671875, "global_step": 104928, "epoch": 2498} {"train_loss": -6.364803314208984, "global_step": 104929, "epoch": 2498} {"train_loss": -6.436663627624512, "global_step": 104930, "epoch": 2498} {"train_loss": -6.470984935760498, "global_step": 104931, "epoch": 2498} {"train_loss": -6.374735355377197, "global_step": 104932, "epoch": 2498} {"train_loss": -6.356621742248535, "global_step": 104933, "epoch": 2498} {"train_loss": -6.400651454925537, "global_step": 104934, "epoch": 2498} {"train_loss": -6.423389434814453, "global_step": 104935, "epoch": 2498} {"train_loss": -6.396623611450195, "global_step": 104936, "epoch": 2498} {"train_loss": -6.378363132476807, "global_step": 104937, "epoch": 2498} {"train_loss": -6.298377990722656, "global_step": 104938, "epoch": 2498} {"train_loss": -6.425017833709717, "global_step": 104939, "epoch": 2498} {"train_loss": -6.457232475280762, "global_step": 104940, "epoch": 2498} {"train_loss": -6.34014892578125, "global_step": 104941, "epoch": 2498} {"train_loss": -6.342100143432617, "global_step": 104942, "epoch": 2498} {"train_loss": -6.399941444396973, "global_step": 104943, "epoch": 2498} {"train_loss": -6.4389190673828125, "global_step": 104944, "epoch": 2498} {"train_loss": -6.1863603591918945, "global_step": 104945, "epoch": 2498} {"train_loss": -6.284543514251709, "global_step": 104946, "epoch": 2498} {"train_loss": -6.317904472351074, "global_step": 104947, "epoch": 2498} {"train_loss": -6.37050724029541, "global_step": 104948, "epoch": 2498} {"train_loss": -6.318167686462402, "global_step": 104949, "epoch": 2498} {"train_loss": -6.2413458824157715, "global_step": 104950, "epoch": 2498} {"train_loss": -6.350322723388672, "global_step": 104951, "epoch": 2498} {"train_loss": -6.158475875854492, "global_step": 104952, "epoch": 2498} {"train_loss": -6.3400774002075195, "global_step": 104953, "epoch": 2498} {"train_loss": -6.270997524261475, "global_step": 104954, "epoch": 2498} {"train_loss": -6.357701301574707, "global_step": 104955, "epoch": 2498} {"train_loss": -6.244645118713379, "global_step": 104956, "epoch": 2498} {"train_loss": -6.365521317436581, "global_step": 104957, "epoch": 2498, "val_loss": 67968.3125} {"train_loss": -6.3494157791137695, "global_step": 104958, "epoch": 2499} {"train_loss": -6.270959854125977, "global_step": 104959, "epoch": 2499} {"train_loss": -6.397667407989502, "global_step": 104960, "epoch": 2499} {"train_loss": -6.296156883239746, "global_step": 104961, "epoch": 2499} {"train_loss": -6.301328182220459, "global_step": 104962, "epoch": 2499} {"train_loss": -6.317988872528076, "global_step": 104963, "epoch": 2499} {"train_loss": -6.311554908752441, "global_step": 104964, "epoch": 2499} {"train_loss": -6.388129234313965, "global_step": 104965, "epoch": 2499} {"train_loss": -6.352944374084473, "global_step": 104966, "epoch": 2499} {"train_loss": -6.40933084487915, "global_step": 104967, "epoch": 2499} {"train_loss": -6.415785312652588, "global_step": 104968, "epoch": 2499} {"train_loss": -6.384040355682373, "global_step": 104969, "epoch": 2499} {"train_loss": -6.456933498382568, "global_step": 104970, "epoch": 2499} {"train_loss": -6.378268241882324, "global_step": 104971, "epoch": 2499} {"train_loss": -6.391386985778809, "global_step": 104972, "epoch": 2499} {"train_loss": -6.339494228363037, "global_step": 104973, "epoch": 2499} {"train_loss": -6.3504958152771, "global_step": 104974, "epoch": 2499} {"train_loss": -6.341269493103027, "global_step": 104975, "epoch": 2499} {"train_loss": -6.530695915222168, "global_step": 104976, "epoch": 2499} {"train_loss": -6.44876766204834, "global_step": 104977, "epoch": 2499} {"train_loss": -6.350341796875, "global_step": 104978, "epoch": 2499} {"train_loss": -6.365483283996582, "global_step": 104979, "epoch": 2499} {"train_loss": -6.281966209411621, "global_step": 104980, "epoch": 2499} {"train_loss": -6.429080009460449, "global_step": 104981, "epoch": 2499} {"train_loss": -6.397159576416016, "global_step": 104982, "epoch": 2499} {"train_loss": -6.313404560089111, "global_step": 104983, "epoch": 2499} {"train_loss": -6.5474348068237305, "global_step": 104984, "epoch": 2499} {"train_loss": -6.338920593261719, "global_step": 104985, "epoch": 2499} {"train_loss": -6.376964569091797, "global_step": 104986, "epoch": 2499} {"train_loss": -6.406074523925781, "global_step": 104987, "epoch": 2499} {"train_loss": -6.369272232055664, "global_step": 104988, "epoch": 2499} {"train_loss": -6.301639556884766, "global_step": 104989, "epoch": 2499} {"train_loss": -6.396225452423096, "global_step": 104990, "epoch": 2499} {"train_loss": -6.474775791168213, "global_step": 104991, "epoch": 2499} {"train_loss": -6.220792770385742, "global_step": 104992, "epoch": 2499} {"train_loss": -6.473295211791992, "global_step": 104993, "epoch": 2499} {"train_loss": -6.438699245452881, "global_step": 104994, "epoch": 2499} {"train_loss": -6.42238712310791, "global_step": 104995, "epoch": 2499} {"train_loss": -6.437009811401367, "global_step": 104996, "epoch": 2499} {"train_loss": -6.492421627044678, "global_step": 104997, "epoch": 2499} {"train_loss": -6.394686222076416, "global_step": 104998, "epoch": 2499} {"train_loss": -6.384068693433489, "global_step": 104999, "epoch": 2499, "val_loss": 67864.171875} {"train_loss": -6.4911789894104, "global_step": 105000, "epoch": 2500} {"train_loss": -6.480451583862305, "global_step": 105001, "epoch": 2500} {"train_loss": -6.42559814453125, "global_step": 105002, "epoch": 2500} {"train_loss": -6.3599324226379395, "global_step": 105003, "epoch": 2500} {"train_loss": -6.447168350219727, "global_step": 105004, "epoch": 2500} {"train_loss": -6.481472015380859, "global_step": 105005, "epoch": 2500} {"train_loss": -6.432888984680176, "global_step": 105006, "epoch": 2500} {"train_loss": -6.5010199546813965, "global_step": 105007, "epoch": 2500} {"train_loss": -6.403777122497559, "global_step": 105008, "epoch": 2500} {"train_loss": -6.44770622253418, "global_step": 105009, "epoch": 2500} {"train_loss": -6.399018287658691, "global_step": 105010, "epoch": 2500} {"train_loss": -6.459450721740723, "global_step": 105011, "epoch": 2500} {"train_loss": -6.43349027633667, "global_step": 105012, "epoch": 2500} {"train_loss": -6.374360084533691, "global_step": 105013, "epoch": 2500} {"train_loss": -6.402449131011963, "global_step": 105014, "epoch": 2500} {"train_loss": -6.376646995544434, "global_step": 105015, "epoch": 2500} {"train_loss": -6.32639217376709, "global_step": 105016, "epoch": 2500} {"train_loss": -6.3929948806762695, "global_step": 105017, "epoch": 2500} {"train_loss": -6.320291519165039, "global_step": 105018, "epoch": 2500} {"train_loss": -6.522404670715332, "global_step": 105019, "epoch": 2500} {"train_loss": -6.342803955078125, "global_step": 105020, "epoch": 2500} {"train_loss": -6.411301612854004, "global_step": 105021, "epoch": 2500} {"train_loss": -6.54524040222168, "global_step": 105022, "epoch": 2500} {"train_loss": -6.215753078460693, "global_step": 105023, "epoch": 2500} {"train_loss": -6.420722961425781, "global_step": 105024, "epoch": 2500} {"train_loss": -6.4798078536987305, "global_step": 105025, "epoch": 2500} {"train_loss": -6.416134834289551, "global_step": 105026, "epoch": 2500} {"train_loss": -6.4329729080200195, "global_step": 105027, "epoch": 2500} {"train_loss": -6.26077938079834, "global_step": 105028, "epoch": 2500} {"train_loss": -6.488945484161377, "global_step": 105029, "epoch": 2500} {"train_loss": -6.248966693878174, "global_step": 105030, "epoch": 2500} {"train_loss": -6.278504371643066, "global_step": 105031, "epoch": 2500} {"train_loss": -6.4766645431518555, "global_step": 105032, "epoch": 2500} {"train_loss": -6.313826560974121, "global_step": 105033, "epoch": 2500} {"train_loss": -6.300475597381592, "global_step": 105034, "epoch": 2500} {"train_loss": -6.281069755554199, "global_step": 105035, "epoch": 2500} {"train_loss": -6.406792163848877, "global_step": 105036, "epoch": 2500} {"train_loss": -6.453117370605469, "global_step": 105037, "epoch": 2500} {"train_loss": -6.250332832336426, "global_step": 105038, "epoch": 2500} {"train_loss": -6.342706680297852, "global_step": 105039, "epoch": 2500} {"train_loss": -6.357109069824219, "global_step": 105040, "epoch": 2500} {"train_loss": -6.393832433791387, "global_step": 105041, "epoch": 2500, "train/sim_max_reward_0": 0.23244889399856908, "train/sim_max_reward_1": 0.9410164184468418, "train/sim_max_reward_2": 0.15825874247839028, "train/sim_max_reward_3": 0.32532533730387414, "train/sim_max_reward_4": 0.40861639810266664, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.1759393259760009, "test/sim_max_reward_4400001": 0.23711586487888445, "test/sim_max_reward_4400002": 0.8525609943068609, "test/sim_max_reward_4400003": 0.9819777751329176, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.7499043201275283, "test/sim_max_reward_4400006": 0.880420472288932, "test/sim_max_reward_4400007": 0.9376582671595216, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.7069349238697744, "test/sim_max_reward_4400010": 0.28594609516809055, "test/sim_max_reward_4400011": 0.3162412550236583, "test/sim_max_reward_4400012": 0.8074803276445266, "test/sim_max_reward_4400013": 0.4517360254553968, "test/sim_max_reward_4400014": 0.15176655084196175, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0650535428847191, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.22181008623388657, "test/sim_max_reward_4400019": 0.38902254012633025, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9851105308450295, "test/sim_max_reward_4400023": 0.7763936171463613, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.23767779686782461, "test/sim_max_reward_4400026": 0.6683150195363792, "test/sim_max_reward_4400027": 0.02049718502151042, "test/sim_max_reward_4400028": 0.42364005046839903, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9587890704098961, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9072193739354255, "test/sim_max_reward_4400034": 0.8640965392732803, "test/sim_max_reward_4400035": 0.6592199039143845, "test/sim_max_reward_4400036": 0.40814023070028244, "test/sim_max_reward_4400037": 0.9910419657272425, "test/sim_max_reward_4400038": 0.97276032640731, "test/sim_max_reward_4400039": 0.9898973159653129, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9403351221147016, "test/sim_max_reward_4400042": 0.8921858312179464, "test/sim_max_reward_4400043": 0.9622024486910723, "test/sim_max_reward_4400044": 0.8145421968687405, "test/sim_max_reward_4400045": 0.9599580057021839, "test/sim_max_reward_4400046": 0.9791072656163095, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.869454415474674, "train/mean_score": 0.37644175828208826, "test/mean_score": 0.5672112680396209, "val_loss": 68016.8125} {"train_loss": -6.433271408081055, "global_step": 105042, "epoch": 2501} {"train_loss": -6.371564865112305, "global_step": 105043, "epoch": 2501} {"train_loss": -6.442094326019287, "global_step": 105044, "epoch": 2501} {"train_loss": -6.383955478668213, "global_step": 105045, "epoch": 2501} {"train_loss": -6.3642754554748535, "global_step": 105046, "epoch": 2501} {"train_loss": -6.332252025604248, "global_step": 105047, "epoch": 2501} {"train_loss": -6.3346099853515625, "global_step": 105048, "epoch": 2501} {"train_loss": -6.387971878051758, "global_step": 105049, "epoch": 2501} {"train_loss": -6.418824195861816, "global_step": 105050, "epoch": 2501} {"train_loss": -6.506814956665039, "global_step": 105051, "epoch": 2501} {"train_loss": -6.377715110778809, "global_step": 105052, "epoch": 2501} {"train_loss": -6.335146903991699, "global_step": 105053, "epoch": 2501} {"train_loss": -6.400622367858887, "global_step": 105054, "epoch": 2501} {"train_loss": -6.415656089782715, "global_step": 105055, "epoch": 2501} {"train_loss": -6.471824645996094, "global_step": 105056, "epoch": 2501} {"train_loss": -6.411921501159668, "global_step": 105057, "epoch": 2501} {"train_loss": -6.35629940032959, "global_step": 105058, "epoch": 2501} {"train_loss": -6.310215473175049, "global_step": 105059, "epoch": 2501} {"train_loss": -6.42041015625, "global_step": 105060, "epoch": 2501} {"train_loss": -6.401849269866943, "global_step": 105061, "epoch": 2501} {"train_loss": -6.355891227722168, "global_step": 105062, "epoch": 2501} {"train_loss": -6.390561580657959, "global_step": 105063, "epoch": 2501} {"train_loss": -6.269815921783447, "global_step": 105064, "epoch": 2501} {"train_loss": -6.3761186599731445, "global_step": 105065, "epoch": 2501} {"train_loss": -6.520881652832031, "global_step": 105066, "epoch": 2501} {"train_loss": -6.43399715423584, "global_step": 105067, "epoch": 2501} {"train_loss": -6.334402084350586, "global_step": 105068, "epoch": 2501} {"train_loss": -6.402329921722412, "global_step": 105069, "epoch": 2501} {"train_loss": -6.428594589233398, "global_step": 105070, "epoch": 2501} {"train_loss": -6.355358123779297, "global_step": 105071, "epoch": 2501} {"train_loss": -6.251739501953125, "global_step": 105072, "epoch": 2501} {"train_loss": -6.401371955871582, "global_step": 105073, "epoch": 2501} {"train_loss": -6.254100799560547, "global_step": 105074, "epoch": 2501} {"train_loss": -6.439716815948486, "global_step": 105075, "epoch": 2501} {"train_loss": -6.428194999694824, "global_step": 105076, "epoch": 2501} {"train_loss": -6.429402828216553, "global_step": 105077, "epoch": 2501} {"train_loss": -6.364293098449707, "global_step": 105078, "epoch": 2501} {"train_loss": -6.476807594299316, "global_step": 105079, "epoch": 2501} {"train_loss": -6.291213035583496, "global_step": 105080, "epoch": 2501} {"train_loss": -6.317070007324219, "global_step": 105081, "epoch": 2501} {"train_loss": -6.399070739746094, "global_step": 105082, "epoch": 2501} {"train_loss": -6.386186497552054, "global_step": 105083, "epoch": 2501, "val_loss": 67889.828125} {"train_loss": -6.268828392028809, "global_step": 105084, "epoch": 2502} {"train_loss": -6.467555999755859, "global_step": 105085, "epoch": 2502} {"train_loss": -6.334013938903809, "global_step": 105086, "epoch": 2502} {"train_loss": -6.4219231605529785, "global_step": 105087, "epoch": 2502} {"train_loss": -6.379655361175537, "global_step": 105088, "epoch": 2502} {"train_loss": -6.384353160858154, "global_step": 105089, "epoch": 2502} {"train_loss": -6.27598762512207, "global_step": 105090, "epoch": 2502} {"train_loss": -6.346778869628906, "global_step": 105091, "epoch": 2502} {"train_loss": -6.269955635070801, "global_step": 105092, "epoch": 2502} {"train_loss": -6.379887580871582, "global_step": 105093, "epoch": 2502} {"train_loss": -6.417815208435059, "global_step": 105094, "epoch": 2502} {"train_loss": -6.458740234375, "global_step": 105095, "epoch": 2502} {"train_loss": -6.398093223571777, "global_step": 105096, "epoch": 2502} {"train_loss": -6.3101582527160645, "global_step": 105097, "epoch": 2502} {"train_loss": -6.33052396774292, "global_step": 105098, "epoch": 2502} {"train_loss": -6.408138275146484, "global_step": 105099, "epoch": 2502} {"train_loss": -6.396722316741943, "global_step": 105100, "epoch": 2502} {"train_loss": -6.374432563781738, "global_step": 105101, "epoch": 2502} {"train_loss": -6.432497024536133, "global_step": 105102, "epoch": 2502} {"train_loss": -6.434905052185059, "global_step": 105103, "epoch": 2502} {"train_loss": -6.426821708679199, "global_step": 105104, "epoch": 2502} {"train_loss": -6.457292556762695, "global_step": 105105, "epoch": 2502} {"train_loss": -6.31743860244751, "global_step": 105106, "epoch": 2502} {"train_loss": -6.420166015625, "global_step": 105107, "epoch": 2502} {"train_loss": -6.345442771911621, "global_step": 105108, "epoch": 2502} {"train_loss": -6.347281455993652, "global_step": 105109, "epoch": 2502} {"train_loss": -6.475184440612793, "global_step": 105110, "epoch": 2502} {"train_loss": -6.425779819488525, "global_step": 105111, "epoch": 2502} {"train_loss": -6.333245754241943, "global_step": 105112, "epoch": 2502} {"train_loss": -6.48658561706543, "global_step": 105113, "epoch": 2502} {"train_loss": -6.430225849151611, "global_step": 105114, "epoch": 2502} {"train_loss": -6.490352630615234, "global_step": 105115, "epoch": 2502} {"train_loss": -6.418528079986572, "global_step": 105116, "epoch": 2502} {"train_loss": -6.414324760437012, "global_step": 105117, "epoch": 2502} {"train_loss": -6.459763526916504, "global_step": 105118, "epoch": 2502} {"train_loss": -6.417869567871094, "global_step": 105119, "epoch": 2502} {"train_loss": -6.351566314697266, "global_step": 105120, "epoch": 2502} {"train_loss": -6.375617027282715, "global_step": 105121, "epoch": 2502} {"train_loss": -6.425112247467041, "global_step": 105122, "epoch": 2502} {"train_loss": -6.474661827087402, "global_step": 105123, "epoch": 2502} {"train_loss": -6.517027854919434, "global_step": 105124, "epoch": 2502} {"train_loss": -6.399009057453701, "global_step": 105125, "epoch": 2502, "val_loss": 67712.90625} {"train_loss": -6.522548675537109, "global_step": 105126, "epoch": 2503} {"train_loss": -6.478700637817383, "global_step": 105127, "epoch": 2503} {"train_loss": -6.512799263000488, "global_step": 105128, "epoch": 2503} {"train_loss": -6.445725440979004, "global_step": 105129, "epoch": 2503} {"train_loss": -6.480985641479492, "global_step": 105130, "epoch": 2503} {"train_loss": -6.48797082901001, "global_step": 105131, "epoch": 2503} {"train_loss": -6.416608810424805, "global_step": 105132, "epoch": 2503} {"train_loss": -6.5425567626953125, "global_step": 105133, "epoch": 2503} {"train_loss": -6.41231632232666, "global_step": 105134, "epoch": 2503} {"train_loss": -6.556225776672363, "global_step": 105135, "epoch": 2503} {"train_loss": -6.408356666564941, "global_step": 105136, "epoch": 2503} {"train_loss": -6.476605415344238, "global_step": 105137, "epoch": 2503} {"train_loss": -6.463356971740723, "global_step": 105138, "epoch": 2503} {"train_loss": -6.322770118713379, "global_step": 105139, "epoch": 2503} {"train_loss": -6.412891387939453, "global_step": 105140, "epoch": 2503} {"train_loss": -6.438619136810303, "global_step": 105141, "epoch": 2503} {"train_loss": -6.426511764526367, "global_step": 105142, "epoch": 2503} {"train_loss": -6.338346481323242, "global_step": 105143, "epoch": 2503} {"train_loss": -6.376812934875488, "global_step": 105144, "epoch": 2503} {"train_loss": -6.298861503601074, "global_step": 105145, "epoch": 2503} {"train_loss": -6.3825554847717285, "global_step": 105146, "epoch": 2503} {"train_loss": -6.320514678955078, "global_step": 105147, "epoch": 2503} {"train_loss": -6.32662296295166, "global_step": 105148, "epoch": 2503} {"train_loss": -6.356783390045166, "global_step": 105149, "epoch": 2503} {"train_loss": -6.427595615386963, "global_step": 105150, "epoch": 2503} {"train_loss": -6.255824089050293, "global_step": 105151, "epoch": 2503} {"train_loss": -6.437324523925781, "global_step": 105152, "epoch": 2503} {"train_loss": -6.304728031158447, "global_step": 105153, "epoch": 2503} {"train_loss": -6.238407611846924, "global_step": 105154, "epoch": 2503} {"train_loss": -6.388762474060059, "global_step": 105155, "epoch": 2503} {"train_loss": -6.447880744934082, "global_step": 105156, "epoch": 2503} {"train_loss": -6.335235118865967, "global_step": 105157, "epoch": 2503} {"train_loss": -6.469413757324219, "global_step": 105158, "epoch": 2503} {"train_loss": -6.365077018737793, "global_step": 105159, "epoch": 2503} {"train_loss": -6.40056848526001, "global_step": 105160, "epoch": 2503} {"train_loss": -6.386728286743164, "global_step": 105161, "epoch": 2503} {"train_loss": -6.369699478149414, "global_step": 105162, "epoch": 2503} {"train_loss": -6.258536338806152, "global_step": 105163, "epoch": 2503} {"train_loss": -6.4908552169799805, "global_step": 105164, "epoch": 2503} {"train_loss": -6.4019575119018555, "global_step": 105165, "epoch": 2503} {"train_loss": -6.37613582611084, "global_step": 105166, "epoch": 2503} {"train_loss": -6.404759770347958, "global_step": 105167, "epoch": 2503, "val_loss": 67928.265625} {"train_loss": -6.361104965209961, "global_step": 105168, "epoch": 2504} {"train_loss": -6.466710090637207, "global_step": 105169, "epoch": 2504} {"train_loss": -6.252015590667725, "global_step": 105170, "epoch": 2504} {"train_loss": -6.364240646362305, "global_step": 105171, "epoch": 2504} {"train_loss": -6.328940391540527, "global_step": 105172, "epoch": 2504} {"train_loss": -6.257205963134766, "global_step": 105173, "epoch": 2504} {"train_loss": -6.457047939300537, "global_step": 105174, "epoch": 2504} {"train_loss": -6.331188678741455, "global_step": 105175, "epoch": 2504} {"train_loss": -6.282013416290283, "global_step": 105176, "epoch": 2504} {"train_loss": -6.351091384887695, "global_step": 105177, "epoch": 2504} {"train_loss": -6.465811252593994, "global_step": 105178, "epoch": 2504} {"train_loss": -6.471728324890137, "global_step": 105179, "epoch": 2504} {"train_loss": -6.4268388748168945, "global_step": 105180, "epoch": 2504} {"train_loss": -6.425477504730225, "global_step": 105181, "epoch": 2504} {"train_loss": -6.367652416229248, "global_step": 105182, "epoch": 2504} {"train_loss": -6.377572536468506, "global_step": 105183, "epoch": 2504} {"train_loss": -6.396062850952148, "global_step": 105184, "epoch": 2504} {"train_loss": -6.365836143493652, "global_step": 105185, "epoch": 2504} {"train_loss": -6.412023067474365, "global_step": 105186, "epoch": 2504} {"train_loss": -6.377134323120117, "global_step": 105187, "epoch": 2504} {"train_loss": -6.452396392822266, "global_step": 105188, "epoch": 2504} {"train_loss": -6.28553581237793, "global_step": 105189, "epoch": 2504} {"train_loss": -6.2502923011779785, "global_step": 105190, "epoch": 2504} {"train_loss": -6.3133625984191895, "global_step": 105191, "epoch": 2504} {"train_loss": -6.30599308013916, "global_step": 105192, "epoch": 2504} {"train_loss": -6.354671478271484, "global_step": 105193, "epoch": 2504} {"train_loss": -6.276311874389648, "global_step": 105194, "epoch": 2504} {"train_loss": -6.403568267822266, "global_step": 105195, "epoch": 2504} {"train_loss": -6.406462669372559, "global_step": 105196, "epoch": 2504} {"train_loss": -6.215277671813965, "global_step": 105197, "epoch": 2504} {"train_loss": -6.452572345733643, "global_step": 105198, "epoch": 2504} {"train_loss": -6.320428848266602, "global_step": 105199, "epoch": 2504} {"train_loss": -6.387781143188477, "global_step": 105200, "epoch": 2504} {"train_loss": -6.212118148803711, "global_step": 105201, "epoch": 2504} {"train_loss": -6.217828750610352, "global_step": 105202, "epoch": 2504} {"train_loss": -6.332016944885254, "global_step": 105203, "epoch": 2504} {"train_loss": -6.299724578857422, "global_step": 105204, "epoch": 2504} {"train_loss": -6.329014778137207, "global_step": 105205, "epoch": 2504} {"train_loss": -6.338075637817383, "global_step": 105206, "epoch": 2504} {"train_loss": -6.253100872039795, "global_step": 105207, "epoch": 2504} {"train_loss": -6.323976516723633, "global_step": 105208, "epoch": 2504} {"train_loss": -6.349314996174404, "global_step": 105209, "epoch": 2504, "val_loss": 67908.3359375} {"train_loss": -6.437203884124756, "global_step": 105210, "epoch": 2505} {"train_loss": -6.3422017097473145, "global_step": 105211, "epoch": 2505} {"train_loss": -6.34100341796875, "global_step": 105212, "epoch": 2505} {"train_loss": -6.435112953186035, "global_step": 105213, "epoch": 2505} {"train_loss": -6.431069374084473, "global_step": 105214, "epoch": 2505} {"train_loss": -6.316850662231445, "global_step": 105215, "epoch": 2505} {"train_loss": -6.376699447631836, "global_step": 105216, "epoch": 2505} {"train_loss": -6.357306480407715, "global_step": 105217, "epoch": 2505} {"train_loss": -6.402718544006348, "global_step": 105218, "epoch": 2505} {"train_loss": -6.473354339599609, "global_step": 105219, "epoch": 2505} {"train_loss": -6.5855255126953125, "global_step": 105220, "epoch": 2505} {"train_loss": -6.504161834716797, "global_step": 105221, "epoch": 2505} {"train_loss": -6.391783714294434, "global_step": 105222, "epoch": 2505} {"train_loss": -6.423508167266846, "global_step": 105223, "epoch": 2505} {"train_loss": -6.380558490753174, "global_step": 105224, "epoch": 2505} {"train_loss": -6.440615177154541, "global_step": 105225, "epoch": 2505} {"train_loss": -6.363444805145264, "global_step": 105226, "epoch": 2505} {"train_loss": -6.384126663208008, "global_step": 105227, "epoch": 2505} {"train_loss": -6.384153366088867, "global_step": 105228, "epoch": 2505} {"train_loss": -6.495547771453857, "global_step": 105229, "epoch": 2505} {"train_loss": -6.4447221755981445, "global_step": 105230, "epoch": 2505} {"train_loss": -6.45539665222168, "global_step": 105231, "epoch": 2505} {"train_loss": -6.3290910720825195, "global_step": 105232, "epoch": 2505} {"train_loss": -6.343906879425049, "global_step": 105233, "epoch": 2505} {"train_loss": -6.372520446777344, "global_step": 105234, "epoch": 2505} {"train_loss": -6.344217777252197, "global_step": 105235, "epoch": 2505} {"train_loss": -6.433235168457031, "global_step": 105236, "epoch": 2505} {"train_loss": -6.446033477783203, "global_step": 105237, "epoch": 2505} {"train_loss": -6.430273532867432, "global_step": 105238, "epoch": 2505} {"train_loss": -6.4689741134643555, "global_step": 105239, "epoch": 2505} {"train_loss": -6.39855432510376, "global_step": 105240, "epoch": 2505} {"train_loss": -6.410935401916504, "global_step": 105241, "epoch": 2505} {"train_loss": -6.373133182525635, "global_step": 105242, "epoch": 2505} {"train_loss": -6.298818111419678, "global_step": 105243, "epoch": 2505} {"train_loss": -6.425229549407959, "global_step": 105244, "epoch": 2505} {"train_loss": -6.388284206390381, "global_step": 105245, "epoch": 2505} {"train_loss": -6.314181327819824, "global_step": 105246, "epoch": 2505} {"train_loss": -6.454230308532715, "global_step": 105247, "epoch": 2505} {"train_loss": -6.476012229919434, "global_step": 105248, "epoch": 2505} {"train_loss": -6.3472394943237305, "global_step": 105249, "epoch": 2505} {"train_loss": -6.4645304679870605, "global_step": 105250, "epoch": 2505} {"train_loss": -6.408189603260586, "global_step": 105251, "epoch": 2505, "val_loss": 67853.515625} {"train_loss": -6.46675968170166, "global_step": 105252, "epoch": 2506} {"train_loss": -6.477609634399414, "global_step": 105253, "epoch": 2506} {"train_loss": -6.4685869216918945, "global_step": 105254, "epoch": 2506} {"train_loss": -6.508626937866211, "global_step": 105255, "epoch": 2506} {"train_loss": -6.485589504241943, "global_step": 105256, "epoch": 2506} {"train_loss": -6.332850456237793, "global_step": 105257, "epoch": 2506} {"train_loss": -6.384092330932617, "global_step": 105258, "epoch": 2506} {"train_loss": -6.440976142883301, "global_step": 105259, "epoch": 2506} {"train_loss": -6.457907199859619, "global_step": 105260, "epoch": 2506} {"train_loss": -6.397082805633545, "global_step": 105261, "epoch": 2506} {"train_loss": -6.46397590637207, "global_step": 105262, "epoch": 2506} {"train_loss": -6.538435935974121, "global_step": 105263, "epoch": 2506} {"train_loss": -6.4914960861206055, "global_step": 105264, "epoch": 2506} {"train_loss": -6.453533172607422, "global_step": 105265, "epoch": 2506} {"train_loss": -6.392395973205566, "global_step": 105266, "epoch": 2506} {"train_loss": -6.432063102722168, "global_step": 105267, "epoch": 2506} {"train_loss": -6.4460883140563965, "global_step": 105268, "epoch": 2506} {"train_loss": -6.573459625244141, "global_step": 105269, "epoch": 2506} {"train_loss": -6.404731273651123, "global_step": 105270, "epoch": 2506} {"train_loss": -6.37647819519043, "global_step": 105271, "epoch": 2506} {"train_loss": -6.361371040344238, "global_step": 105272, "epoch": 2506} {"train_loss": -6.395280838012695, "global_step": 105273, "epoch": 2506} {"train_loss": -6.443963050842285, "global_step": 105274, "epoch": 2506} {"train_loss": -6.468301773071289, "global_step": 105275, "epoch": 2506} {"train_loss": -6.4351806640625, "global_step": 105276, "epoch": 2506} {"train_loss": -6.45271110534668, "global_step": 105277, "epoch": 2506} {"train_loss": -6.469758033752441, "global_step": 105278, "epoch": 2506} {"train_loss": -6.444498062133789, "global_step": 105279, "epoch": 2506} {"train_loss": -6.451457977294922, "global_step": 105280, "epoch": 2506} {"train_loss": -6.588827133178711, "global_step": 105281, "epoch": 2506} {"train_loss": -6.4073166847229, "global_step": 105282, "epoch": 2506} {"train_loss": -6.493126392364502, "global_step": 105283, "epoch": 2506} {"train_loss": -6.372300148010254, "global_step": 105284, "epoch": 2506} {"train_loss": -6.485937118530273, "global_step": 105285, "epoch": 2506} {"train_loss": -6.389470100402832, "global_step": 105286, "epoch": 2506} {"train_loss": -6.401639461517334, "global_step": 105287, "epoch": 2506} {"train_loss": -6.375892162322998, "global_step": 105288, "epoch": 2506} {"train_loss": -6.545445442199707, "global_step": 105289, "epoch": 2506} {"train_loss": -6.45476770401001, "global_step": 105290, "epoch": 2506} {"train_loss": -6.503108024597168, "global_step": 105291, "epoch": 2506} {"train_loss": -6.349919319152832, "global_step": 105292, "epoch": 2506} {"train_loss": -6.444954452060518, "global_step": 105293, "epoch": 2506, "val_loss": 67906.03125} {"train_loss": -6.435906410217285, "global_step": 105294, "epoch": 2507} {"train_loss": -6.406430721282959, "global_step": 105295, "epoch": 2507} {"train_loss": -6.435142517089844, "global_step": 105296, "epoch": 2507} {"train_loss": -6.2674560546875, "global_step": 105297, "epoch": 2507} {"train_loss": -6.339913368225098, "global_step": 105298, "epoch": 2507} {"train_loss": -6.363471031188965, "global_step": 105299, "epoch": 2507} {"train_loss": -6.476004600524902, "global_step": 105300, "epoch": 2507} {"train_loss": -6.294926643371582, "global_step": 105301, "epoch": 2507} {"train_loss": -6.442016124725342, "global_step": 105302, "epoch": 2507} {"train_loss": -6.341151237487793, "global_step": 105303, "epoch": 2507} {"train_loss": -6.381731033325195, "global_step": 105304, "epoch": 2507} {"train_loss": -6.421931266784668, "global_step": 105305, "epoch": 2507} {"train_loss": -6.27689266204834, "global_step": 105306, "epoch": 2507} {"train_loss": -6.348536491394043, "global_step": 105307, "epoch": 2507} {"train_loss": -6.402437210083008, "global_step": 105308, "epoch": 2507} {"train_loss": -6.321595191955566, "global_step": 105309, "epoch": 2507} {"train_loss": -6.279819488525391, "global_step": 105310, "epoch": 2507} {"train_loss": -6.173937797546387, "global_step": 105311, "epoch": 2507} {"train_loss": -6.406088829040527, "global_step": 105312, "epoch": 2507} {"train_loss": -6.522332191467285, "global_step": 105313, "epoch": 2507} {"train_loss": -6.286036968231201, "global_step": 105314, "epoch": 2507} {"train_loss": -6.3654327392578125, "global_step": 105315, "epoch": 2507} {"train_loss": -6.481443405151367, "global_step": 105316, "epoch": 2507} {"train_loss": -6.26679801940918, "global_step": 105317, "epoch": 2507} {"train_loss": -6.331204891204834, "global_step": 105318, "epoch": 2507} {"train_loss": -6.44498348236084, "global_step": 105319, "epoch": 2507} {"train_loss": -6.391399383544922, "global_step": 105320, "epoch": 2507} {"train_loss": -6.478500843048096, "global_step": 105321, "epoch": 2507} {"train_loss": -6.391836643218994, "global_step": 105322, "epoch": 2507} {"train_loss": -6.279976844787598, "global_step": 105323, "epoch": 2507} {"train_loss": -6.345611572265625, "global_step": 105324, "epoch": 2507} {"train_loss": -6.42190408706665, "global_step": 105325, "epoch": 2507} {"train_loss": -6.2652082443237305, "global_step": 105326, "epoch": 2507} {"train_loss": -6.425124168395996, "global_step": 105327, "epoch": 2507} {"train_loss": -6.346879959106445, "global_step": 105328, "epoch": 2507} {"train_loss": -6.36027717590332, "global_step": 105329, "epoch": 2507} {"train_loss": -6.562437057495117, "global_step": 105330, "epoch": 2507} {"train_loss": -6.494823455810547, "global_step": 105331, "epoch": 2507} {"train_loss": -6.416646957397461, "global_step": 105332, "epoch": 2507} {"train_loss": -6.324567794799805, "global_step": 105333, "epoch": 2507} {"train_loss": -6.498539924621582, "global_step": 105334, "epoch": 2507} {"train_loss": -6.3798001153128485, "global_step": 105335, "epoch": 2507, "val_loss": 67766.03125} {"train_loss": -6.341005325317383, "global_step": 105336, "epoch": 2508} {"train_loss": -6.345999240875244, "global_step": 105337, "epoch": 2508} {"train_loss": -6.32600736618042, "global_step": 105338, "epoch": 2508} {"train_loss": -6.466240882873535, "global_step": 105339, "epoch": 2508} {"train_loss": -6.488337516784668, "global_step": 105340, "epoch": 2508} {"train_loss": -6.37070369720459, "global_step": 105341, "epoch": 2508} {"train_loss": -6.495285987854004, "global_step": 105342, "epoch": 2508} {"train_loss": -6.475033760070801, "global_step": 105343, "epoch": 2508} {"train_loss": -6.406028747558594, "global_step": 105344, "epoch": 2508} {"train_loss": -6.333605766296387, "global_step": 105345, "epoch": 2508} {"train_loss": -6.430109977722168, "global_step": 105346, "epoch": 2508} {"train_loss": -6.462764739990234, "global_step": 105347, "epoch": 2508} {"train_loss": -6.318131446838379, "global_step": 105348, "epoch": 2508} {"train_loss": -6.3878936767578125, "global_step": 105349, "epoch": 2508} {"train_loss": -6.413699150085449, "global_step": 105350, "epoch": 2508} {"train_loss": -6.21819543838501, "global_step": 105351, "epoch": 2508} {"train_loss": -6.353116989135742, "global_step": 105352, "epoch": 2508} {"train_loss": -6.362506866455078, "global_step": 105353, "epoch": 2508} {"train_loss": -6.427912712097168, "global_step": 105354, "epoch": 2508} {"train_loss": -6.436854362487793, "global_step": 105355, "epoch": 2508} {"train_loss": -6.381186485290527, "global_step": 105356, "epoch": 2508} {"train_loss": -6.42487907409668, "global_step": 105357, "epoch": 2508} {"train_loss": -6.442292213439941, "global_step": 105358, "epoch": 2508} {"train_loss": -6.413206577301025, "global_step": 105359, "epoch": 2508} {"train_loss": -6.372159004211426, "global_step": 105360, "epoch": 2508} {"train_loss": -6.485021114349365, "global_step": 105361, "epoch": 2508} {"train_loss": -6.445256233215332, "global_step": 105362, "epoch": 2508} {"train_loss": -6.485597610473633, "global_step": 105363, "epoch": 2508} {"train_loss": -6.475242614746094, "global_step": 105364, "epoch": 2508} {"train_loss": -6.466152191162109, "global_step": 105365, "epoch": 2508} {"train_loss": -6.48094367980957, "global_step": 105366, "epoch": 2508} {"train_loss": -6.357686996459961, "global_step": 105367, "epoch": 2508} {"train_loss": -6.426495552062988, "global_step": 105368, "epoch": 2508} {"train_loss": -6.417148113250732, "global_step": 105369, "epoch": 2508} {"train_loss": -6.4337992668151855, "global_step": 105370, "epoch": 2508} {"train_loss": -6.438398838043213, "global_step": 105371, "epoch": 2508} {"train_loss": -6.224949836730957, "global_step": 105372, "epoch": 2508} {"train_loss": -6.418705463409424, "global_step": 105373, "epoch": 2508} {"train_loss": -6.529157638549805, "global_step": 105374, "epoch": 2508} {"train_loss": -6.3987812995910645, "global_step": 105375, "epoch": 2508} {"train_loss": -6.306064128875732, "global_step": 105376, "epoch": 2508} {"train_loss": -6.406258321943737, "global_step": 105377, "epoch": 2508, "val_loss": 67831.53125} {"train_loss": -6.422850131988525, "global_step": 105378, "epoch": 2509} {"train_loss": -6.4060235023498535, "global_step": 105379, "epoch": 2509} {"train_loss": -6.464602947235107, "global_step": 105380, "epoch": 2509} {"train_loss": -6.444930076599121, "global_step": 105381, "epoch": 2509} {"train_loss": -6.396243095397949, "global_step": 105382, "epoch": 2509} {"train_loss": -6.521745204925537, "global_step": 105383, "epoch": 2509} {"train_loss": -6.283012390136719, "global_step": 105384, "epoch": 2509} {"train_loss": -6.309642314910889, "global_step": 105385, "epoch": 2509} {"train_loss": -6.466680526733398, "global_step": 105386, "epoch": 2509} {"train_loss": -6.448718070983887, "global_step": 105387, "epoch": 2509} {"train_loss": -6.489256858825684, "global_step": 105388, "epoch": 2509} {"train_loss": -6.357442378997803, "global_step": 105389, "epoch": 2509} {"train_loss": -6.300418376922607, "global_step": 105390, "epoch": 2509} {"train_loss": -6.388422966003418, "global_step": 105391, "epoch": 2509} {"train_loss": -6.372450351715088, "global_step": 105392, "epoch": 2509} {"train_loss": -6.3497467041015625, "global_step": 105393, "epoch": 2509} {"train_loss": -6.4296650886535645, "global_step": 105394, "epoch": 2509} {"train_loss": -6.466984748840332, "global_step": 105395, "epoch": 2509} {"train_loss": -6.392092227935791, "global_step": 105396, "epoch": 2509} {"train_loss": -6.35397481918335, "global_step": 105397, "epoch": 2509} {"train_loss": -6.534948825836182, "global_step": 105398, "epoch": 2509} {"train_loss": -6.343783378601074, "global_step": 105399, "epoch": 2509} {"train_loss": -6.2920918464660645, "global_step": 105400, "epoch": 2509} {"train_loss": -6.305039405822754, "global_step": 105401, "epoch": 2509} {"train_loss": -6.367907524108887, "global_step": 105402, "epoch": 2509} {"train_loss": -6.382384777069092, "global_step": 105403, "epoch": 2509} {"train_loss": -6.332826614379883, "global_step": 105404, "epoch": 2509} {"train_loss": -6.333571910858154, "global_step": 105405, "epoch": 2509} {"train_loss": -6.464339256286621, "global_step": 105406, "epoch": 2509} {"train_loss": -6.290795803070068, "global_step": 105407, "epoch": 2509} {"train_loss": -6.271276473999023, "global_step": 105408, "epoch": 2509} {"train_loss": -6.366035461425781, "global_step": 105409, "epoch": 2509} {"train_loss": -6.372323989868164, "global_step": 105410, "epoch": 2509} {"train_loss": -6.310512065887451, "global_step": 105411, "epoch": 2509} {"train_loss": -6.280826568603516, "global_step": 105412, "epoch": 2509} {"train_loss": -6.370120048522949, "global_step": 105413, "epoch": 2509} {"train_loss": -6.329868316650391, "global_step": 105414, "epoch": 2509} {"train_loss": -6.371340751647949, "global_step": 105415, "epoch": 2509} {"train_loss": -6.196086883544922, "global_step": 105416, "epoch": 2509} {"train_loss": -6.242169380187988, "global_step": 105417, "epoch": 2509} {"train_loss": -6.2999114990234375, "global_step": 105418, "epoch": 2509} {"train_loss": -6.363185632796514, "global_step": 105419, "epoch": 2509, "val_loss": 68029.59375} {"train_loss": -6.36909294128418, "global_step": 105420, "epoch": 2510} {"train_loss": -6.2826008796691895, "global_step": 105421, "epoch": 2510} {"train_loss": -6.290943145751953, "global_step": 105422, "epoch": 2510} {"train_loss": -6.24930477142334, "global_step": 105423, "epoch": 2510} {"train_loss": -6.220681190490723, "global_step": 105424, "epoch": 2510} {"train_loss": -6.285527229309082, "global_step": 105425, "epoch": 2510} {"train_loss": -6.308152198791504, "global_step": 105426, "epoch": 2510} {"train_loss": -6.254942893981934, "global_step": 105427, "epoch": 2510} {"train_loss": -6.276220798492432, "global_step": 105428, "epoch": 2510} {"train_loss": -6.377334117889404, "global_step": 105429, "epoch": 2510} {"train_loss": -6.348853588104248, "global_step": 105430, "epoch": 2510} {"train_loss": -6.277134895324707, "global_step": 105431, "epoch": 2510} {"train_loss": -6.293979644775391, "global_step": 105432, "epoch": 2510} {"train_loss": -6.421658992767334, "global_step": 105433, "epoch": 2510} {"train_loss": -6.253175735473633, "global_step": 105434, "epoch": 2510} {"train_loss": -6.323456764221191, "global_step": 105435, "epoch": 2510} {"train_loss": -6.331986427307129, "global_step": 105436, "epoch": 2510} {"train_loss": -6.436675071716309, "global_step": 105437, "epoch": 2510} {"train_loss": -6.487798690795898, "global_step": 105438, "epoch": 2510} {"train_loss": -6.333305835723877, "global_step": 105439, "epoch": 2510} {"train_loss": -6.330295562744141, "global_step": 105440, "epoch": 2510} {"train_loss": -6.211423873901367, "global_step": 105441, "epoch": 2510} {"train_loss": -6.412259101867676, "global_step": 105442, "epoch": 2510} {"train_loss": -6.366746425628662, "global_step": 105443, "epoch": 2510} {"train_loss": -6.2660088539123535, "global_step": 105444, "epoch": 2510} {"train_loss": -6.3176469802856445, "global_step": 105445, "epoch": 2510} {"train_loss": -6.288752555847168, "global_step": 105446, "epoch": 2510} {"train_loss": -6.411216735839844, "global_step": 105447, "epoch": 2510} {"train_loss": -6.308541297912598, "global_step": 105448, "epoch": 2510} {"train_loss": -6.286931991577148, "global_step": 105449, "epoch": 2510} {"train_loss": -6.3771772384643555, "global_step": 105450, "epoch": 2510} {"train_loss": -6.391443252563477, "global_step": 105451, "epoch": 2510} {"train_loss": -6.311943531036377, "global_step": 105452, "epoch": 2510} {"train_loss": -6.373488426208496, "global_step": 105453, "epoch": 2510} {"train_loss": -6.439490795135498, "global_step": 105454, "epoch": 2510} {"train_loss": -6.377202033996582, "global_step": 105455, "epoch": 2510} {"train_loss": -6.456681251525879, "global_step": 105456, "epoch": 2510} {"train_loss": -6.3574113845825195, "global_step": 105457, "epoch": 2510} {"train_loss": -6.384967803955078, "global_step": 105458, "epoch": 2510} {"train_loss": -6.288295269012451, "global_step": 105459, "epoch": 2510} {"train_loss": -6.338409900665283, "global_step": 105460, "epoch": 2510} {"train_loss": -6.33535775684175, "global_step": 105461, "epoch": 2510, "val_loss": 67844.0859375} {"train_loss": -6.310992240905762, "global_step": 105462, "epoch": 2511} {"train_loss": -6.323671340942383, "global_step": 105463, "epoch": 2511} {"train_loss": -6.407764911651611, "global_step": 105464, "epoch": 2511} {"train_loss": -6.468621253967285, "global_step": 105465, "epoch": 2511} {"train_loss": -6.349541187286377, "global_step": 105466, "epoch": 2511} {"train_loss": -6.401577949523926, "global_step": 105467, "epoch": 2511} {"train_loss": -6.2804856300354, "global_step": 105468, "epoch": 2511} {"train_loss": -6.345511436462402, "global_step": 105469, "epoch": 2511} {"train_loss": -6.265641212463379, "global_step": 105470, "epoch": 2511} {"train_loss": -6.378006458282471, "global_step": 105471, "epoch": 2511} {"train_loss": -6.463115215301514, "global_step": 105472, "epoch": 2511} {"train_loss": -6.331184387207031, "global_step": 105473, "epoch": 2511} {"train_loss": -6.320248603820801, "global_step": 105474, "epoch": 2511} {"train_loss": -6.405209064483643, "global_step": 105475, "epoch": 2511} {"train_loss": -6.368224143981934, "global_step": 105476, "epoch": 2511} {"train_loss": -6.456037521362305, "global_step": 105477, "epoch": 2511} {"train_loss": -6.447082042694092, "global_step": 105478, "epoch": 2511} {"train_loss": -6.354367256164551, "global_step": 105479, "epoch": 2511} {"train_loss": -6.436214447021484, "global_step": 105480, "epoch": 2511} {"train_loss": -6.295454978942871, "global_step": 105481, "epoch": 2511} {"train_loss": -6.407449245452881, "global_step": 105482, "epoch": 2511} {"train_loss": -6.294526100158691, "global_step": 105483, "epoch": 2511} {"train_loss": -6.27708625793457, "global_step": 105484, "epoch": 2511} {"train_loss": -6.345366477966309, "global_step": 105485, "epoch": 2511} {"train_loss": -6.367156982421875, "global_step": 105486, "epoch": 2511} {"train_loss": -6.40717887878418, "global_step": 105487, "epoch": 2511} {"train_loss": -6.477164268493652, "global_step": 105488, "epoch": 2511} {"train_loss": -6.425459861755371, "global_step": 105489, "epoch": 2511} {"train_loss": -6.445507049560547, "global_step": 105490, "epoch": 2511} {"train_loss": -6.5855512619018555, "global_step": 105491, "epoch": 2511} {"train_loss": -6.355023384094238, "global_step": 105492, "epoch": 2511} {"train_loss": -6.37939453125, "global_step": 105493, "epoch": 2511} {"train_loss": -6.475433826446533, "global_step": 105494, "epoch": 2511} {"train_loss": -6.375210285186768, "global_step": 105495, "epoch": 2511} {"train_loss": -6.351568222045898, "global_step": 105496, "epoch": 2511} {"train_loss": -6.40500545501709, "global_step": 105497, "epoch": 2511} {"train_loss": -6.431832313537598, "global_step": 105498, "epoch": 2511} {"train_loss": -6.362211227416992, "global_step": 105499, "epoch": 2511} {"train_loss": -6.527097702026367, "global_step": 105500, "epoch": 2511} {"train_loss": -6.4124650955200195, "global_step": 105501, "epoch": 2511} {"train_loss": -6.436919212341309, "global_step": 105502, "epoch": 2511} {"train_loss": -6.390986578805106, "global_step": 105503, "epoch": 2511, "val_loss": 67748.6015625} {"train_loss": -6.383914947509766, "global_step": 105504, "epoch": 2512} {"train_loss": -6.397616386413574, "global_step": 105505, "epoch": 2512} {"train_loss": -6.3975749015808105, "global_step": 105506, "epoch": 2512} {"train_loss": -6.399813175201416, "global_step": 105507, "epoch": 2512} {"train_loss": -6.363551616668701, "global_step": 105508, "epoch": 2512} {"train_loss": -6.365162372589111, "global_step": 105509, "epoch": 2512} {"train_loss": -6.274868488311768, "global_step": 105510, "epoch": 2512} {"train_loss": -6.44329833984375, "global_step": 105511, "epoch": 2512} {"train_loss": -6.405132293701172, "global_step": 105512, "epoch": 2512} {"train_loss": -6.240914344787598, "global_step": 105513, "epoch": 2512} {"train_loss": -6.38460111618042, "global_step": 105514, "epoch": 2512} {"train_loss": -6.387782573699951, "global_step": 105515, "epoch": 2512} {"train_loss": -6.277759552001953, "global_step": 105516, "epoch": 2512} {"train_loss": -6.495792865753174, "global_step": 105517, "epoch": 2512} {"train_loss": -6.344875335693359, "global_step": 105518, "epoch": 2512} {"train_loss": -6.44614315032959, "global_step": 105519, "epoch": 2512} {"train_loss": -6.353386878967285, "global_step": 105520, "epoch": 2512} {"train_loss": -6.314266681671143, "global_step": 105521, "epoch": 2512} {"train_loss": -6.519064903259277, "global_step": 105522, "epoch": 2512} {"train_loss": -6.374457359313965, "global_step": 105523, "epoch": 2512} {"train_loss": -6.449961185455322, "global_step": 105524, "epoch": 2512} {"train_loss": -6.375180244445801, "global_step": 105525, "epoch": 2512} {"train_loss": -6.409025192260742, "global_step": 105526, "epoch": 2512} {"train_loss": -6.460033416748047, "global_step": 105527, "epoch": 2512} {"train_loss": -6.3334808349609375, "global_step": 105528, "epoch": 2512} {"train_loss": -6.492033958435059, "global_step": 105529, "epoch": 2512} {"train_loss": -6.560956001281738, "global_step": 105530, "epoch": 2512} {"train_loss": -6.438593864440918, "global_step": 105531, "epoch": 2512} {"train_loss": -6.323541641235352, "global_step": 105532, "epoch": 2512} {"train_loss": -6.3838887214660645, "global_step": 105533, "epoch": 2512} {"train_loss": -6.445134162902832, "global_step": 105534, "epoch": 2512} {"train_loss": -6.3473968505859375, "global_step": 105535, "epoch": 2512} {"train_loss": -6.386635780334473, "global_step": 105536, "epoch": 2512} {"train_loss": -6.330992221832275, "global_step": 105537, "epoch": 2512} {"train_loss": -6.377599716186523, "global_step": 105538, "epoch": 2512} {"train_loss": -6.342250823974609, "global_step": 105539, "epoch": 2512} {"train_loss": -6.397259712219238, "global_step": 105540, "epoch": 2512} {"train_loss": -6.384574890136719, "global_step": 105541, "epoch": 2512} {"train_loss": -6.323476314544678, "global_step": 105542, "epoch": 2512} {"train_loss": -6.409463882446289, "global_step": 105543, "epoch": 2512} {"train_loss": -6.393290996551514, "global_step": 105544, "epoch": 2512} {"train_loss": -6.389963388442993, "global_step": 105545, "epoch": 2512, "val_loss": 67647.390625} {"train_loss": -6.390692234039307, "global_step": 105546, "epoch": 2513} {"train_loss": -6.414710998535156, "global_step": 105547, "epoch": 2513} {"train_loss": -6.3500871658325195, "global_step": 105548, "epoch": 2513} {"train_loss": -6.481752872467041, "global_step": 105549, "epoch": 2513} {"train_loss": -6.380675315856934, "global_step": 105550, "epoch": 2513} {"train_loss": -6.3913421630859375, "global_step": 105551, "epoch": 2513} {"train_loss": -6.299323081970215, "global_step": 105552, "epoch": 2513} {"train_loss": -6.4906907081604, "global_step": 105553, "epoch": 2513} {"train_loss": -6.477400779724121, "global_step": 105554, "epoch": 2513} {"train_loss": -6.3776679039001465, "global_step": 105555, "epoch": 2513} {"train_loss": -6.429168701171875, "global_step": 105556, "epoch": 2513} {"train_loss": -6.398052215576172, "global_step": 105557, "epoch": 2513} {"train_loss": -6.470358848571777, "global_step": 105558, "epoch": 2513} {"train_loss": -6.544690132141113, "global_step": 105559, "epoch": 2513} {"train_loss": -6.453823089599609, "global_step": 105560, "epoch": 2513} {"train_loss": -6.378817558288574, "global_step": 105561, "epoch": 2513} {"train_loss": -6.468467712402344, "global_step": 105562, "epoch": 2513} {"train_loss": -6.380120754241943, "global_step": 105563, "epoch": 2513} {"train_loss": -6.482037544250488, "global_step": 105564, "epoch": 2513} {"train_loss": -6.418467998504639, "global_step": 105565, "epoch": 2513} {"train_loss": -6.5325446128845215, "global_step": 105566, "epoch": 2513} {"train_loss": -6.320306777954102, "global_step": 105567, "epoch": 2513} {"train_loss": -6.484375, "global_step": 105568, "epoch": 2513} {"train_loss": -6.498737335205078, "global_step": 105569, "epoch": 2513} {"train_loss": -6.3919267654418945, "global_step": 105570, "epoch": 2513} {"train_loss": -6.411441802978516, "global_step": 105571, "epoch": 2513} {"train_loss": -6.483802318572998, "global_step": 105572, "epoch": 2513} {"train_loss": -6.488863468170166, "global_step": 105573, "epoch": 2513} {"train_loss": -6.397445201873779, "global_step": 105574, "epoch": 2513} {"train_loss": -6.306869029998779, "global_step": 105575, "epoch": 2513} {"train_loss": -6.5366315841674805, "global_step": 105576, "epoch": 2513} {"train_loss": -6.52786111831665, "global_step": 105577, "epoch": 2513} {"train_loss": -6.362858772277832, "global_step": 105578, "epoch": 2513} {"train_loss": -6.427168846130371, "global_step": 105579, "epoch": 2513} {"train_loss": -6.3639678955078125, "global_step": 105580, "epoch": 2513} {"train_loss": -6.298000812530518, "global_step": 105581, "epoch": 2513} {"train_loss": -6.355803966522217, "global_step": 105582, "epoch": 2513} {"train_loss": -6.379765510559082, "global_step": 105583, "epoch": 2513} {"train_loss": -6.5300445556640625, "global_step": 105584, "epoch": 2513} {"train_loss": -6.42214298248291, "global_step": 105585, "epoch": 2513} {"train_loss": -6.388426780700684, "global_step": 105586, "epoch": 2513} {"train_loss": -6.423743758882795, "global_step": 105587, "epoch": 2513, "val_loss": 67763.40625} {"train_loss": -6.483015060424805, "global_step": 105588, "epoch": 2514} {"train_loss": -6.406460762023926, "global_step": 105589, "epoch": 2514} {"train_loss": -6.284754753112793, "global_step": 105590, "epoch": 2514} {"train_loss": -6.340551376342773, "global_step": 105591, "epoch": 2514} {"train_loss": -6.424778461456299, "global_step": 105592, "epoch": 2514} {"train_loss": -6.517173767089844, "global_step": 105593, "epoch": 2514} {"train_loss": -6.456416130065918, "global_step": 105594, "epoch": 2514} {"train_loss": -6.320896148681641, "global_step": 105595, "epoch": 2514} {"train_loss": -6.4273176193237305, "global_step": 105596, "epoch": 2514} {"train_loss": -6.476530075073242, "global_step": 105597, "epoch": 2514} {"train_loss": -6.380273818969727, "global_step": 105598, "epoch": 2514} {"train_loss": -6.491877555847168, "global_step": 105599, "epoch": 2514} {"train_loss": -6.5393548011779785, "global_step": 105600, "epoch": 2514} {"train_loss": -6.51479959487915, "global_step": 105601, "epoch": 2514} {"train_loss": -6.345219612121582, "global_step": 105602, "epoch": 2514} {"train_loss": -6.304526329040527, "global_step": 105603, "epoch": 2514} {"train_loss": -6.3455424308776855, "global_step": 105604, "epoch": 2514} {"train_loss": -6.383486747741699, "global_step": 105605, "epoch": 2514} {"train_loss": -6.5416460037231445, "global_step": 105606, "epoch": 2514} {"train_loss": -6.337322235107422, "global_step": 105607, "epoch": 2514} {"train_loss": -6.515793800354004, "global_step": 105608, "epoch": 2514} {"train_loss": -6.443551063537598, "global_step": 105609, "epoch": 2514} {"train_loss": -6.366713523864746, "global_step": 105610, "epoch": 2514} {"train_loss": -6.448532581329346, "global_step": 105611, "epoch": 2514} {"train_loss": -6.376228332519531, "global_step": 105612, "epoch": 2514} {"train_loss": -6.336911678314209, "global_step": 105613, "epoch": 2514} {"train_loss": -6.442779541015625, "global_step": 105614, "epoch": 2514} {"train_loss": -6.352245807647705, "global_step": 105615, "epoch": 2514} {"train_loss": -6.404454708099365, "global_step": 105616, "epoch": 2514} {"train_loss": -6.389191150665283, "global_step": 105617, "epoch": 2514} {"train_loss": -6.361401557922363, "global_step": 105618, "epoch": 2514} {"train_loss": -6.320655345916748, "global_step": 105619, "epoch": 2514} {"train_loss": -6.336635589599609, "global_step": 105620, "epoch": 2514} {"train_loss": -6.580781936645508, "global_step": 105621, "epoch": 2514} {"train_loss": -6.504165172576904, "global_step": 105622, "epoch": 2514} {"train_loss": -6.449638366699219, "global_step": 105623, "epoch": 2514} {"train_loss": -6.502514839172363, "global_step": 105624, "epoch": 2514} {"train_loss": -6.521305084228516, "global_step": 105625, "epoch": 2514} {"train_loss": -6.39609432220459, "global_step": 105626, "epoch": 2514} {"train_loss": -6.404170989990234, "global_step": 105627, "epoch": 2514} {"train_loss": -6.426980495452881, "global_step": 105628, "epoch": 2514} {"train_loss": -6.4212205296471, "global_step": 105629, "epoch": 2514, "val_loss": 67951.1328125} {"train_loss": -6.342558860778809, "global_step": 105630, "epoch": 2515} {"train_loss": -6.4722490310668945, "global_step": 105631, "epoch": 2515} {"train_loss": -6.435755729675293, "global_step": 105632, "epoch": 2515} {"train_loss": -6.382169723510742, "global_step": 105633, "epoch": 2515} {"train_loss": -6.40123176574707, "global_step": 105634, "epoch": 2515} {"train_loss": -6.438797950744629, "global_step": 105635, "epoch": 2515} {"train_loss": -6.347237586975098, "global_step": 105636, "epoch": 2515} {"train_loss": -6.229423522949219, "global_step": 105637, "epoch": 2515} {"train_loss": -6.453407287597656, "global_step": 105638, "epoch": 2515} {"train_loss": -6.4010844230651855, "global_step": 105639, "epoch": 2515} {"train_loss": -6.297182083129883, "global_step": 105640, "epoch": 2515} {"train_loss": -6.429559707641602, "global_step": 105641, "epoch": 2515} {"train_loss": -6.459861755371094, "global_step": 105642, "epoch": 2515} {"train_loss": -6.418292045593262, "global_step": 105643, "epoch": 2515} {"train_loss": -6.3991193771362305, "global_step": 105644, "epoch": 2515} {"train_loss": -6.308438777923584, "global_step": 105645, "epoch": 2515} {"train_loss": -6.178008079528809, "global_step": 105646, "epoch": 2515} {"train_loss": -6.3422393798828125, "global_step": 105647, "epoch": 2515} {"train_loss": -6.352977752685547, "global_step": 105648, "epoch": 2515} {"train_loss": -6.291415691375732, "global_step": 105649, "epoch": 2515} {"train_loss": -6.450445175170898, "global_step": 105650, "epoch": 2515} {"train_loss": -6.3869829177856445, "global_step": 105651, "epoch": 2515} {"train_loss": -6.42746639251709, "global_step": 105652, "epoch": 2515} {"train_loss": -6.452461242675781, "global_step": 105653, "epoch": 2515} {"train_loss": -6.297850608825684, "global_step": 105654, "epoch": 2515} {"train_loss": -6.462885856628418, "global_step": 105655, "epoch": 2515} {"train_loss": -6.384695529937744, "global_step": 105656, "epoch": 2515} {"train_loss": -6.464756965637207, "global_step": 105657, "epoch": 2515} {"train_loss": -6.428757667541504, "global_step": 105658, "epoch": 2515} {"train_loss": -6.384710311889648, "global_step": 105659, "epoch": 2515} {"train_loss": -6.494234085083008, "global_step": 105660, "epoch": 2515} {"train_loss": -6.311141490936279, "global_step": 105661, "epoch": 2515} {"train_loss": -6.333831787109375, "global_step": 105662, "epoch": 2515} {"train_loss": -6.305281639099121, "global_step": 105663, "epoch": 2515} {"train_loss": -6.468556880950928, "global_step": 105664, "epoch": 2515} {"train_loss": -6.425833702087402, "global_step": 105665, "epoch": 2515} {"train_loss": -6.292623043060303, "global_step": 105666, "epoch": 2515} {"train_loss": -6.459164619445801, "global_step": 105667, "epoch": 2515} {"train_loss": -6.387643814086914, "global_step": 105668, "epoch": 2515} {"train_loss": -6.343135833740234, "global_step": 105669, "epoch": 2515} {"train_loss": -6.372913837432861, "global_step": 105670, "epoch": 2515} {"train_loss": -6.382182178043184, "global_step": 105671, "epoch": 2515, "val_loss": 67857.984375} {"train_loss": -6.4045515060424805, "global_step": 105672, "epoch": 2516} {"train_loss": -6.454285621643066, "global_step": 105673, "epoch": 2516} {"train_loss": -6.375785827636719, "global_step": 105674, "epoch": 2516} {"train_loss": -6.435152053833008, "global_step": 105675, "epoch": 2516} {"train_loss": -6.402730941772461, "global_step": 105676, "epoch": 2516} {"train_loss": -6.321752548217773, "global_step": 105677, "epoch": 2516} {"train_loss": -6.262110710144043, "global_step": 105678, "epoch": 2516} {"train_loss": -6.552055835723877, "global_step": 105679, "epoch": 2516} {"train_loss": -6.383237361907959, "global_step": 105680, "epoch": 2516} {"train_loss": -6.429591655731201, "global_step": 105681, "epoch": 2516} {"train_loss": -6.485311508178711, "global_step": 105682, "epoch": 2516} {"train_loss": -6.368027687072754, "global_step": 105683, "epoch": 2516} {"train_loss": -6.377321243286133, "global_step": 105684, "epoch": 2516} {"train_loss": -6.463764667510986, "global_step": 105685, "epoch": 2516} {"train_loss": -6.398894309997559, "global_step": 105686, "epoch": 2516} {"train_loss": -6.470348358154297, "global_step": 105687, "epoch": 2516} {"train_loss": -6.517737865447998, "global_step": 105688, "epoch": 2516} {"train_loss": -6.3551764488220215, "global_step": 105689, "epoch": 2516} {"train_loss": -6.499407768249512, "global_step": 105690, "epoch": 2516} {"train_loss": -6.338006973266602, "global_step": 105691, "epoch": 2516} {"train_loss": -6.414212703704834, "global_step": 105692, "epoch": 2516} {"train_loss": -6.442063331604004, "global_step": 105693, "epoch": 2516} {"train_loss": -6.474881172180176, "global_step": 105694, "epoch": 2516} {"train_loss": -6.507704257965088, "global_step": 105695, "epoch": 2516} {"train_loss": -6.4898529052734375, "global_step": 105696, "epoch": 2516} {"train_loss": -6.346423149108887, "global_step": 105697, "epoch": 2516} {"train_loss": -6.439093589782715, "global_step": 105698, "epoch": 2516} {"train_loss": -6.355284690856934, "global_step": 105699, "epoch": 2516} {"train_loss": -6.416055202484131, "global_step": 105700, "epoch": 2516} {"train_loss": -6.466009140014648, "global_step": 105701, "epoch": 2516} {"train_loss": -6.421849250793457, "global_step": 105702, "epoch": 2516} {"train_loss": -6.4661784172058105, "global_step": 105703, "epoch": 2516} {"train_loss": -6.486443042755127, "global_step": 105704, "epoch": 2516} {"train_loss": -6.35451602935791, "global_step": 105705, "epoch": 2516} {"train_loss": -6.387278079986572, "global_step": 105706, "epoch": 2516} {"train_loss": -6.364467620849609, "global_step": 105707, "epoch": 2516} {"train_loss": -6.317836284637451, "global_step": 105708, "epoch": 2516} {"train_loss": -6.325078964233398, "global_step": 105709, "epoch": 2516} {"train_loss": -6.437458515167236, "global_step": 105710, "epoch": 2516} {"train_loss": -6.37992000579834, "global_step": 105711, "epoch": 2516} {"train_loss": -6.435613632202148, "global_step": 105712, "epoch": 2516} {"train_loss": -6.4144674482799715, "global_step": 105713, "epoch": 2516, "val_loss": 67924.3984375} {"train_loss": -6.440101623535156, "global_step": 105714, "epoch": 2517} {"train_loss": -6.356586933135986, "global_step": 105715, "epoch": 2517} {"train_loss": -6.495751857757568, "global_step": 105716, "epoch": 2517} {"train_loss": -6.4680376052856445, "global_step": 105717, "epoch": 2517} {"train_loss": -6.433028221130371, "global_step": 105718, "epoch": 2517} {"train_loss": -6.410245895385742, "global_step": 105719, "epoch": 2517} {"train_loss": -6.414578914642334, "global_step": 105720, "epoch": 2517} {"train_loss": -6.420256614685059, "global_step": 105721, "epoch": 2517} {"train_loss": -6.412301063537598, "global_step": 105722, "epoch": 2517} {"train_loss": -6.453871250152588, "global_step": 105723, "epoch": 2517} {"train_loss": -6.416196823120117, "global_step": 105724, "epoch": 2517} {"train_loss": -6.296626091003418, "global_step": 105725, "epoch": 2517} {"train_loss": -6.356496334075928, "global_step": 105726, "epoch": 2517} {"train_loss": -6.317117691040039, "global_step": 105727, "epoch": 2517} {"train_loss": -6.388552665710449, "global_step": 105728, "epoch": 2517} {"train_loss": -6.33801794052124, "global_step": 105729, "epoch": 2517} {"train_loss": -6.344133377075195, "global_step": 105730, "epoch": 2517} {"train_loss": -6.306388854980469, "global_step": 105731, "epoch": 2517} {"train_loss": -6.389021873474121, "global_step": 105732, "epoch": 2517} {"train_loss": -6.354737281799316, "global_step": 105733, "epoch": 2517} {"train_loss": -6.4052581787109375, "global_step": 105734, "epoch": 2517} {"train_loss": -6.338315010070801, "global_step": 105735, "epoch": 2517} {"train_loss": -6.347109317779541, "global_step": 105736, "epoch": 2517} {"train_loss": -6.3284196853637695, "global_step": 105737, "epoch": 2517} {"train_loss": -6.271601676940918, "global_step": 105738, "epoch": 2517} {"train_loss": -6.439871788024902, "global_step": 105739, "epoch": 2517} {"train_loss": -6.3346147537231445, "global_step": 105740, "epoch": 2517} {"train_loss": -6.403111457824707, "global_step": 105741, "epoch": 2517} {"train_loss": -6.455657005310059, "global_step": 105742, "epoch": 2517} {"train_loss": -6.375245571136475, "global_step": 105743, "epoch": 2517} {"train_loss": -6.27074670791626, "global_step": 105744, "epoch": 2517} {"train_loss": -6.475228309631348, "global_step": 105745, "epoch": 2517} {"train_loss": -6.427614212036133, "global_step": 105746, "epoch": 2517} {"train_loss": -6.449708938598633, "global_step": 105747, "epoch": 2517} {"train_loss": -6.504430770874023, "global_step": 105748, "epoch": 2517} {"train_loss": -6.435781478881836, "global_step": 105749, "epoch": 2517} {"train_loss": -6.483431816101074, "global_step": 105750, "epoch": 2517} {"train_loss": -6.34633731842041, "global_step": 105751, "epoch": 2517} {"train_loss": -6.3747735023498535, "global_step": 105752, "epoch": 2517} {"train_loss": -6.470905303955078, "global_step": 105753, "epoch": 2517} {"train_loss": -6.437979698181152, "global_step": 105754, "epoch": 2517} {"train_loss": -6.393819195883615, "global_step": 105755, "epoch": 2517, "val_loss": 67932.359375} {"train_loss": -6.442676067352295, "global_step": 105756, "epoch": 2518} {"train_loss": -6.470954418182373, "global_step": 105757, "epoch": 2518} {"train_loss": -6.390268325805664, "global_step": 105758, "epoch": 2518} {"train_loss": -6.382124900817871, "global_step": 105759, "epoch": 2518} {"train_loss": -6.493825912475586, "global_step": 105760, "epoch": 2518} {"train_loss": -6.292447566986084, "global_step": 105761, "epoch": 2518} {"train_loss": -6.332143306732178, "global_step": 105762, "epoch": 2518} {"train_loss": -6.413381099700928, "global_step": 105763, "epoch": 2518} {"train_loss": -6.345582962036133, "global_step": 105764, "epoch": 2518} {"train_loss": -6.370532035827637, "global_step": 105765, "epoch": 2518} {"train_loss": -6.296647071838379, "global_step": 105766, "epoch": 2518} {"train_loss": -6.332247734069824, "global_step": 105767, "epoch": 2518} {"train_loss": -6.481367111206055, "global_step": 105768, "epoch": 2518} {"train_loss": -6.337021827697754, "global_step": 105769, "epoch": 2518} {"train_loss": -6.359977722167969, "global_step": 105770, "epoch": 2518} {"train_loss": -6.366994380950928, "global_step": 105771, "epoch": 2518} {"train_loss": -6.422476768493652, "global_step": 105772, "epoch": 2518} {"train_loss": -6.367326736450195, "global_step": 105773, "epoch": 2518} {"train_loss": -6.2926483154296875, "global_step": 105774, "epoch": 2518} {"train_loss": -6.401302337646484, "global_step": 105775, "epoch": 2518} {"train_loss": -6.311105728149414, "global_step": 105776, "epoch": 2518} {"train_loss": -6.379298210144043, "global_step": 105777, "epoch": 2518} {"train_loss": -6.211896896362305, "global_step": 105778, "epoch": 2518} {"train_loss": -6.344969749450684, "global_step": 105779, "epoch": 2518} {"train_loss": -6.384513854980469, "global_step": 105780, "epoch": 2518} {"train_loss": -6.259803771972656, "global_step": 105781, "epoch": 2518} {"train_loss": -6.2946977615356445, "global_step": 105782, "epoch": 2518} {"train_loss": -6.305047988891602, "global_step": 105783, "epoch": 2518} {"train_loss": -6.2118730545043945, "global_step": 105784, "epoch": 2518} {"train_loss": -6.338088035583496, "global_step": 105785, "epoch": 2518} {"train_loss": -6.311513900756836, "global_step": 105786, "epoch": 2518} {"train_loss": -6.314215660095215, "global_step": 105787, "epoch": 2518} {"train_loss": -6.369495391845703, "global_step": 105788, "epoch": 2518} {"train_loss": -6.373309135437012, "global_step": 105789, "epoch": 2518} {"train_loss": -6.3217339515686035, "global_step": 105790, "epoch": 2518} {"train_loss": -6.32793664932251, "global_step": 105791, "epoch": 2518} {"train_loss": -6.346166610717773, "global_step": 105792, "epoch": 2518} {"train_loss": -6.217583656311035, "global_step": 105793, "epoch": 2518} {"train_loss": -6.476929187774658, "global_step": 105794, "epoch": 2518} {"train_loss": -6.3729248046875, "global_step": 105795, "epoch": 2518} {"train_loss": -6.406095504760742, "global_step": 105796, "epoch": 2518} {"train_loss": -6.352702367873419, "global_step": 105797, "epoch": 2518, "val_loss": 67853.7109375} {"train_loss": -6.450876712799072, "global_step": 105798, "epoch": 2519} {"train_loss": -6.297512054443359, "global_step": 105799, "epoch": 2519} {"train_loss": -6.378487586975098, "global_step": 105800, "epoch": 2519} {"train_loss": -6.401697158813477, "global_step": 105801, "epoch": 2519} {"train_loss": -6.3476667404174805, "global_step": 105802, "epoch": 2519} {"train_loss": -6.4189558029174805, "global_step": 105803, "epoch": 2519} {"train_loss": -6.366504669189453, "global_step": 105804, "epoch": 2519} {"train_loss": -6.484238624572754, "global_step": 105805, "epoch": 2519} {"train_loss": -6.381845474243164, "global_step": 105806, "epoch": 2519} {"train_loss": -6.297968864440918, "global_step": 105807, "epoch": 2519} {"train_loss": -6.407656669616699, "global_step": 105808, "epoch": 2519} {"train_loss": -6.360143184661865, "global_step": 105809, "epoch": 2519} {"train_loss": -6.484161376953125, "global_step": 105810, "epoch": 2519} {"train_loss": -6.3552327156066895, "global_step": 105811, "epoch": 2519} {"train_loss": -6.429239273071289, "global_step": 105812, "epoch": 2519} {"train_loss": -6.474725246429443, "global_step": 105813, "epoch": 2519} {"train_loss": -6.32271671295166, "global_step": 105814, "epoch": 2519} {"train_loss": -6.425678253173828, "global_step": 105815, "epoch": 2519} {"train_loss": -6.390657424926758, "global_step": 105816, "epoch": 2519} {"train_loss": -6.396700859069824, "global_step": 105817, "epoch": 2519} {"train_loss": -6.310826778411865, "global_step": 105818, "epoch": 2519} {"train_loss": -6.402919292449951, "global_step": 105819, "epoch": 2519} {"train_loss": -6.310917854309082, "global_step": 105820, "epoch": 2519} {"train_loss": -6.328547477722168, "global_step": 105821, "epoch": 2519} {"train_loss": -6.458447456359863, "global_step": 105822, "epoch": 2519} {"train_loss": -6.233930587768555, "global_step": 105823, "epoch": 2519} {"train_loss": -6.387415409088135, "global_step": 105824, "epoch": 2519} {"train_loss": -6.433831214904785, "global_step": 105825, "epoch": 2519} {"train_loss": -6.60502815246582, "global_step": 105826, "epoch": 2519} {"train_loss": -6.430777549743652, "global_step": 105827, "epoch": 2519} {"train_loss": -6.4336066246032715, "global_step": 105828, "epoch": 2519} {"train_loss": -6.47143030166626, "global_step": 105829, "epoch": 2519} {"train_loss": -6.308913230895996, "global_step": 105830, "epoch": 2519} {"train_loss": -6.299783229827881, "global_step": 105831, "epoch": 2519} {"train_loss": -6.416993618011475, "global_step": 105832, "epoch": 2519} {"train_loss": -6.480731964111328, "global_step": 105833, "epoch": 2519} {"train_loss": -6.3242645263671875, "global_step": 105834, "epoch": 2519} {"train_loss": -6.4732465744018555, "global_step": 105835, "epoch": 2519} {"train_loss": -6.378274917602539, "global_step": 105836, "epoch": 2519} {"train_loss": -6.316401958465576, "global_step": 105837, "epoch": 2519} {"train_loss": -6.4915618896484375, "global_step": 105838, "epoch": 2519} {"train_loss": -6.395235583895729, "global_step": 105839, "epoch": 2519, "val_loss": 67915.0078125} {"train_loss": -6.431279182434082, "global_step": 105840, "epoch": 2520} {"train_loss": -6.424046993255615, "global_step": 105841, "epoch": 2520} {"train_loss": -6.471310615539551, "global_step": 105842, "epoch": 2520} {"train_loss": -6.375936508178711, "global_step": 105843, "epoch": 2520} {"train_loss": -6.3813652992248535, "global_step": 105844, "epoch": 2520} {"train_loss": -6.512284278869629, "global_step": 105845, "epoch": 2520} {"train_loss": -6.4118547439575195, "global_step": 105846, "epoch": 2520} {"train_loss": -6.352849006652832, "global_step": 105847, "epoch": 2520} {"train_loss": -6.418601036071777, "global_step": 105848, "epoch": 2520} {"train_loss": -6.323352813720703, "global_step": 105849, "epoch": 2520} {"train_loss": -6.358881950378418, "global_step": 105850, "epoch": 2520} {"train_loss": -6.379953384399414, "global_step": 105851, "epoch": 2520} {"train_loss": -6.466431617736816, "global_step": 105852, "epoch": 2520} {"train_loss": -6.4212799072265625, "global_step": 105853, "epoch": 2520} {"train_loss": -6.390170574188232, "global_step": 105854, "epoch": 2520} {"train_loss": -6.423359394073486, "global_step": 105855, "epoch": 2520} {"train_loss": -6.356341361999512, "global_step": 105856, "epoch": 2520} {"train_loss": -6.2095947265625, "global_step": 105857, "epoch": 2520} {"train_loss": -6.453023910522461, "global_step": 105858, "epoch": 2520} {"train_loss": -6.3856916427612305, "global_step": 105859, "epoch": 2520} {"train_loss": -6.517294406890869, "global_step": 105860, "epoch": 2520} {"train_loss": -6.547883033752441, "global_step": 105861, "epoch": 2520} {"train_loss": -6.482646942138672, "global_step": 105862, "epoch": 2520} {"train_loss": -6.422250747680664, "global_step": 105863, "epoch": 2520} {"train_loss": -6.514170169830322, "global_step": 105864, "epoch": 2520} {"train_loss": -6.498587608337402, "global_step": 105865, "epoch": 2520} {"train_loss": -6.5563459396362305, "global_step": 105866, "epoch": 2520} {"train_loss": -6.433518409729004, "global_step": 105867, "epoch": 2520} {"train_loss": -6.388531684875488, "global_step": 105868, "epoch": 2520} {"train_loss": -6.480645656585693, "global_step": 105869, "epoch": 2520} {"train_loss": -6.493557929992676, "global_step": 105870, "epoch": 2520} {"train_loss": -6.417641639709473, "global_step": 105871, "epoch": 2520} {"train_loss": -6.482107162475586, "global_step": 105872, "epoch": 2520} {"train_loss": -6.541381359100342, "global_step": 105873, "epoch": 2520} {"train_loss": -6.439091682434082, "global_step": 105874, "epoch": 2520} {"train_loss": -6.421292781829834, "global_step": 105875, "epoch": 2520} {"train_loss": -6.405635356903076, "global_step": 105876, "epoch": 2520} {"train_loss": -6.303292751312256, "global_step": 105877, "epoch": 2520} {"train_loss": -6.225883483886719, "global_step": 105878, "epoch": 2520} {"train_loss": -6.532780647277832, "global_step": 105879, "epoch": 2520} {"train_loss": -6.421599864959717, "global_step": 105880, "epoch": 2520} {"train_loss": -6.423960038593838, "global_step": 105881, "epoch": 2520, "val_loss": 68104.234375} {"train_loss": -6.301620006561279, "global_step": 105882, "epoch": 2521} {"train_loss": -6.413525581359863, "global_step": 105883, "epoch": 2521} {"train_loss": -6.369908332824707, "global_step": 105884, "epoch": 2521} {"train_loss": -6.5250701904296875, "global_step": 105885, "epoch": 2521} {"train_loss": -6.354440689086914, "global_step": 105886, "epoch": 2521} {"train_loss": -6.339388370513916, "global_step": 105887, "epoch": 2521} {"train_loss": -6.509735107421875, "global_step": 105888, "epoch": 2521} {"train_loss": -6.495363235473633, "global_step": 105889, "epoch": 2521} {"train_loss": -6.4145708084106445, "global_step": 105890, "epoch": 2521} {"train_loss": -6.480325222015381, "global_step": 105891, "epoch": 2521} {"train_loss": -6.411022186279297, "global_step": 105892, "epoch": 2521} {"train_loss": -6.399710655212402, "global_step": 105893, "epoch": 2521} {"train_loss": -6.380435466766357, "global_step": 105894, "epoch": 2521} {"train_loss": -6.465726852416992, "global_step": 105895, "epoch": 2521} {"train_loss": -6.4286956787109375, "global_step": 105896, "epoch": 2521} {"train_loss": -6.398965358734131, "global_step": 105897, "epoch": 2521} {"train_loss": -6.489964485168457, "global_step": 105898, "epoch": 2521} {"train_loss": -6.420163631439209, "global_step": 105899, "epoch": 2521} {"train_loss": -6.43022346496582, "global_step": 105900, "epoch": 2521} {"train_loss": -6.4419660568237305, "global_step": 105901, "epoch": 2521} {"train_loss": -6.398003578186035, "global_step": 105902, "epoch": 2521} {"train_loss": -6.326571464538574, "global_step": 105903, "epoch": 2521} {"train_loss": -6.394729137420654, "global_step": 105904, "epoch": 2521} {"train_loss": -6.325492858886719, "global_step": 105905, "epoch": 2521} {"train_loss": -6.298496723175049, "global_step": 105906, "epoch": 2521} {"train_loss": -6.309194564819336, "global_step": 105907, "epoch": 2521} {"train_loss": -6.347847938537598, "global_step": 105908, "epoch": 2521} {"train_loss": -6.327943325042725, "global_step": 105909, "epoch": 2521} {"train_loss": -6.277830123901367, "global_step": 105910, "epoch": 2521} {"train_loss": -6.309942245483398, "global_step": 105911, "epoch": 2521} {"train_loss": -6.355852127075195, "global_step": 105912, "epoch": 2521} {"train_loss": -6.305544853210449, "global_step": 105913, "epoch": 2521} {"train_loss": -6.253325462341309, "global_step": 105914, "epoch": 2521} {"train_loss": -6.378990173339844, "global_step": 105915, "epoch": 2521} {"train_loss": -6.210633754730225, "global_step": 105916, "epoch": 2521} {"train_loss": -6.293898582458496, "global_step": 105917, "epoch": 2521} {"train_loss": -6.157530784606934, "global_step": 105918, "epoch": 2521} {"train_loss": -6.303844451904297, "global_step": 105919, "epoch": 2521} {"train_loss": -6.409626483917236, "global_step": 105920, "epoch": 2521} {"train_loss": -6.394189357757568, "global_step": 105921, "epoch": 2521} {"train_loss": -6.361508369445801, "global_step": 105922, "epoch": 2521} {"train_loss": -6.369275365556989, "global_step": 105923, "epoch": 2521, "val_loss": 68139.9140625} {"train_loss": -6.385753631591797, "global_step": 105924, "epoch": 2522} {"train_loss": -6.327333450317383, "global_step": 105925, "epoch": 2522} {"train_loss": -6.390381813049316, "global_step": 105926, "epoch": 2522} {"train_loss": -6.2984795570373535, "global_step": 105927, "epoch": 2522} {"train_loss": -6.4102582931518555, "global_step": 105928, "epoch": 2522} {"train_loss": -6.298346519470215, "global_step": 105929, "epoch": 2522} {"train_loss": -6.377004623413086, "global_step": 105930, "epoch": 2522} {"train_loss": -6.3873291015625, "global_step": 105931, "epoch": 2522} {"train_loss": -6.389432907104492, "global_step": 105932, "epoch": 2522} {"train_loss": -6.417551517486572, "global_step": 105933, "epoch": 2522} {"train_loss": -6.36319637298584, "global_step": 105934, "epoch": 2522} {"train_loss": -6.440521240234375, "global_step": 105935, "epoch": 2522} {"train_loss": -6.356117248535156, "global_step": 105936, "epoch": 2522} {"train_loss": -6.40986442565918, "global_step": 105937, "epoch": 2522} {"train_loss": -6.3462724685668945, "global_step": 105938, "epoch": 2522} {"train_loss": -6.570924758911133, "global_step": 105939, "epoch": 2522} {"train_loss": -6.437399864196777, "global_step": 105940, "epoch": 2522} {"train_loss": -6.395898342132568, "global_step": 105941, "epoch": 2522} {"train_loss": -6.326653957366943, "global_step": 105942, "epoch": 2522} {"train_loss": -6.4139204025268555, "global_step": 105943, "epoch": 2522} {"train_loss": -6.445833206176758, "global_step": 105944, "epoch": 2522} {"train_loss": -6.347268104553223, "global_step": 105945, "epoch": 2522} {"train_loss": -6.360618591308594, "global_step": 105946, "epoch": 2522} {"train_loss": -6.332571506500244, "global_step": 105947, "epoch": 2522} {"train_loss": -6.411620140075684, "global_step": 105948, "epoch": 2522} {"train_loss": -6.352451324462891, "global_step": 105949, "epoch": 2522} {"train_loss": -6.353048801422119, "global_step": 105950, "epoch": 2522} {"train_loss": -6.261519432067871, "global_step": 105951, "epoch": 2522} {"train_loss": -6.395272731781006, "global_step": 105952, "epoch": 2522} {"train_loss": -6.376038074493408, "global_step": 105953, "epoch": 2522} {"train_loss": -6.2097978591918945, "global_step": 105954, "epoch": 2522} {"train_loss": -6.494305610656738, "global_step": 105955, "epoch": 2522} {"train_loss": -6.25038480758667, "global_step": 105956, "epoch": 2522} {"train_loss": -6.328428268432617, "global_step": 105957, "epoch": 2522} {"train_loss": -6.336103916168213, "global_step": 105958, "epoch": 2522} {"train_loss": -6.346993446350098, "global_step": 105959, "epoch": 2522} {"train_loss": -6.320384979248047, "global_step": 105960, "epoch": 2522} {"train_loss": -6.241161823272705, "global_step": 105961, "epoch": 2522} {"train_loss": -6.278385162353516, "global_step": 105962, "epoch": 2522} {"train_loss": -6.451578617095947, "global_step": 105963, "epoch": 2522} {"train_loss": -6.39911413192749, "global_step": 105964, "epoch": 2522} {"train_loss": -6.365767740067982, "global_step": 105965, "epoch": 2522, "val_loss": 67857.875} {"train_loss": -6.315577030181885, "global_step": 105966, "epoch": 2523} {"train_loss": -6.3946404457092285, "global_step": 105967, "epoch": 2523} {"train_loss": -6.476415157318115, "global_step": 105968, "epoch": 2523} {"train_loss": -6.395406723022461, "global_step": 105969, "epoch": 2523} {"train_loss": -6.292712211608887, "global_step": 105970, "epoch": 2523} {"train_loss": -6.454878330230713, "global_step": 105971, "epoch": 2523} {"train_loss": -6.454702854156494, "global_step": 105972, "epoch": 2523} {"train_loss": -6.552178382873535, "global_step": 105973, "epoch": 2523} {"train_loss": -6.474327087402344, "global_step": 105974, "epoch": 2523} {"train_loss": -6.444169998168945, "global_step": 105975, "epoch": 2523} {"train_loss": -6.422711372375488, "global_step": 105976, "epoch": 2523} {"train_loss": -6.398571491241455, "global_step": 105977, "epoch": 2523} {"train_loss": -6.419433116912842, "global_step": 105978, "epoch": 2523} {"train_loss": -6.34234619140625, "global_step": 105979, "epoch": 2523} {"train_loss": -6.205223083496094, "global_step": 105980, "epoch": 2523} {"train_loss": -6.354774475097656, "global_step": 105981, "epoch": 2523} {"train_loss": -6.447993755340576, "global_step": 105982, "epoch": 2523} {"train_loss": -6.4280290603637695, "global_step": 105983, "epoch": 2523} {"train_loss": -6.323405742645264, "global_step": 105984, "epoch": 2523} {"train_loss": -6.338296890258789, "global_step": 105985, "epoch": 2523} {"train_loss": -6.320103645324707, "global_step": 105986, "epoch": 2523} {"train_loss": -6.381547451019287, "global_step": 105987, "epoch": 2523} {"train_loss": -6.402032852172852, "global_step": 105988, "epoch": 2523} {"train_loss": -6.455721855163574, "global_step": 105989, "epoch": 2523} {"train_loss": -6.357884883880615, "global_step": 105990, "epoch": 2523} {"train_loss": -6.414054870605469, "global_step": 105991, "epoch": 2523} {"train_loss": -6.274875164031982, "global_step": 105992, "epoch": 2523} {"train_loss": -6.318807601928711, "global_step": 105993, "epoch": 2523} {"train_loss": -6.444486618041992, "global_step": 105994, "epoch": 2523} {"train_loss": -6.32942533493042, "global_step": 105995, "epoch": 2523} {"train_loss": -6.449465751647949, "global_step": 105996, "epoch": 2523} {"train_loss": -6.335255146026611, "global_step": 105997, "epoch": 2523} {"train_loss": -6.414588928222656, "global_step": 105998, "epoch": 2523} {"train_loss": -6.456845760345459, "global_step": 105999, "epoch": 2523} {"train_loss": -6.413535118103027, "global_step": 106000, "epoch": 2523} {"train_loss": -6.399899482727051, "global_step": 106001, "epoch": 2523} {"train_loss": -6.493237495422363, "global_step": 106002, "epoch": 2523} {"train_loss": -6.469660758972168, "global_step": 106003, "epoch": 2523} {"train_loss": -6.351661682128906, "global_step": 106004, "epoch": 2523} {"train_loss": -6.4443559646606445, "global_step": 106005, "epoch": 2523} {"train_loss": -6.335331916809082, "global_step": 106006, "epoch": 2523} {"train_loss": -6.394545350755964, "global_step": 106007, "epoch": 2523, "val_loss": 67978.0546875} {"train_loss": -6.434324264526367, "global_step": 106008, "epoch": 2524} {"train_loss": -6.353353023529053, "global_step": 106009, "epoch": 2524} {"train_loss": -6.405849456787109, "global_step": 106010, "epoch": 2524} {"train_loss": -6.467411041259766, "global_step": 106011, "epoch": 2524} {"train_loss": -6.524767875671387, "global_step": 106012, "epoch": 2524} {"train_loss": -6.474699020385742, "global_step": 106013, "epoch": 2524} {"train_loss": -6.462737083435059, "global_step": 106014, "epoch": 2524} {"train_loss": -6.416765213012695, "global_step": 106015, "epoch": 2524} {"train_loss": -6.350508213043213, "global_step": 106016, "epoch": 2524} {"train_loss": -6.383380889892578, "global_step": 106017, "epoch": 2524} {"train_loss": -6.413702964782715, "global_step": 106018, "epoch": 2524} {"train_loss": -6.360054016113281, "global_step": 106019, "epoch": 2524} {"train_loss": -6.332332134246826, "global_step": 106020, "epoch": 2524} {"train_loss": -6.4997148513793945, "global_step": 106021, "epoch": 2524} {"train_loss": -6.409093856811523, "global_step": 106022, "epoch": 2524} {"train_loss": -6.341213703155518, "global_step": 106023, "epoch": 2524} {"train_loss": -6.437831401824951, "global_step": 106024, "epoch": 2524} {"train_loss": -6.416805267333984, "global_step": 106025, "epoch": 2524} {"train_loss": -6.359189033508301, "global_step": 106026, "epoch": 2524} {"train_loss": -6.45920467376709, "global_step": 106027, "epoch": 2524} {"train_loss": -6.3921380043029785, "global_step": 106028, "epoch": 2524} {"train_loss": -6.414389610290527, "global_step": 106029, "epoch": 2524} {"train_loss": -6.414168357849121, "global_step": 106030, "epoch": 2524} {"train_loss": -6.278809547424316, "global_step": 106031, "epoch": 2524} {"train_loss": -6.406974792480469, "global_step": 106032, "epoch": 2524} {"train_loss": -6.51395320892334, "global_step": 106033, "epoch": 2524} {"train_loss": -6.14610481262207, "global_step": 106034, "epoch": 2524} {"train_loss": -6.295449256896973, "global_step": 106035, "epoch": 2524} {"train_loss": -6.373971462249756, "global_step": 106036, "epoch": 2524} {"train_loss": -6.366976737976074, "global_step": 106037, "epoch": 2524} {"train_loss": -6.157827377319336, "global_step": 106038, "epoch": 2524} {"train_loss": -6.34012508392334, "global_step": 106039, "epoch": 2524} {"train_loss": -6.25543212890625, "global_step": 106040, "epoch": 2524} {"train_loss": -6.33380126953125, "global_step": 106041, "epoch": 2524} {"train_loss": -6.184216499328613, "global_step": 106042, "epoch": 2524} {"train_loss": -6.363468170166016, "global_step": 106043, "epoch": 2524} {"train_loss": -6.378204345703125, "global_step": 106044, "epoch": 2524} {"train_loss": -6.329127311706543, "global_step": 106045, "epoch": 2524} {"train_loss": -6.246975898742676, "global_step": 106046, "epoch": 2524} {"train_loss": -6.398682117462158, "global_step": 106047, "epoch": 2524} {"train_loss": -6.365585803985596, "global_step": 106048, "epoch": 2524} {"train_loss": -6.370889130092802, "global_step": 106049, "epoch": 2524, "val_loss": 67791.90625} {"train_loss": -6.321752548217773, "global_step": 106050, "epoch": 2525} {"train_loss": -6.260682106018066, "global_step": 106051, "epoch": 2525} {"train_loss": -6.308056831359863, "global_step": 106052, "epoch": 2525} {"train_loss": -6.3766350746154785, "global_step": 106053, "epoch": 2525} {"train_loss": -6.176485061645508, "global_step": 106054, "epoch": 2525} {"train_loss": -6.309481620788574, "global_step": 106055, "epoch": 2525} {"train_loss": -6.347381591796875, "global_step": 106056, "epoch": 2525} {"train_loss": -6.414151191711426, "global_step": 106057, "epoch": 2525} {"train_loss": -6.352235794067383, "global_step": 106058, "epoch": 2525} {"train_loss": -6.260018348693848, "global_step": 106059, "epoch": 2525} {"train_loss": -6.466007232666016, "global_step": 106060, "epoch": 2525} {"train_loss": -6.326360702514648, "global_step": 106061, "epoch": 2525} {"train_loss": -6.233650207519531, "global_step": 106062, "epoch": 2525} {"train_loss": -6.412672996520996, "global_step": 106063, "epoch": 2525} {"train_loss": -6.3180036544799805, "global_step": 106064, "epoch": 2525} {"train_loss": -6.450439453125, "global_step": 106065, "epoch": 2525} {"train_loss": -6.424152374267578, "global_step": 106066, "epoch": 2525} {"train_loss": -6.3332624435424805, "global_step": 106067, "epoch": 2525} {"train_loss": -6.329764366149902, "global_step": 106068, "epoch": 2525} {"train_loss": -6.379299640655518, "global_step": 106069, "epoch": 2525} {"train_loss": -6.321687698364258, "global_step": 106070, "epoch": 2525} {"train_loss": -6.352169990539551, "global_step": 106071, "epoch": 2525} {"train_loss": -6.365830421447754, "global_step": 106072, "epoch": 2525} {"train_loss": -6.392999649047852, "global_step": 106073, "epoch": 2525} {"train_loss": -6.433766841888428, "global_step": 106074, "epoch": 2525} {"train_loss": -6.31797981262207, "global_step": 106075, "epoch": 2525} {"train_loss": -6.459071159362793, "global_step": 106076, "epoch": 2525} {"train_loss": -6.410673141479492, "global_step": 106077, "epoch": 2525} {"train_loss": -6.4842848777771, "global_step": 106078, "epoch": 2525} {"train_loss": -6.409710884094238, "global_step": 106079, "epoch": 2525} {"train_loss": -6.4461822509765625, "global_step": 106080, "epoch": 2525} {"train_loss": -6.419661998748779, "global_step": 106081, "epoch": 2525} {"train_loss": -6.23887825012207, "global_step": 106082, "epoch": 2525} {"train_loss": -6.492046356201172, "global_step": 106083, "epoch": 2525} {"train_loss": -6.432524681091309, "global_step": 106084, "epoch": 2525} {"train_loss": -6.3210554122924805, "global_step": 106085, "epoch": 2525} {"train_loss": -6.331140518188477, "global_step": 106086, "epoch": 2525} {"train_loss": -6.322811126708984, "global_step": 106087, "epoch": 2525} {"train_loss": -6.36920690536499, "global_step": 106088, "epoch": 2525} {"train_loss": -6.368636608123779, "global_step": 106089, "epoch": 2525} {"train_loss": -6.312580585479736, "global_step": 106090, "epoch": 2525} {"train_loss": -6.362490177154541, "global_step": 106091, "epoch": 2525, "val_loss": 67844.234375} {"train_loss": -6.39438533782959, "global_step": 106092, "epoch": 2526} {"train_loss": -6.34263801574707, "global_step": 106093, "epoch": 2526} {"train_loss": -6.4698944091796875, "global_step": 106094, "epoch": 2526} {"train_loss": -6.424248218536377, "global_step": 106095, "epoch": 2526} {"train_loss": -6.29729700088501, "global_step": 106096, "epoch": 2526} {"train_loss": -6.387767791748047, "global_step": 106097, "epoch": 2526} {"train_loss": -6.250394821166992, "global_step": 106098, "epoch": 2526} {"train_loss": -6.493363380432129, "global_step": 106099, "epoch": 2526} {"train_loss": -6.4200568199157715, "global_step": 106100, "epoch": 2526} {"train_loss": -6.348060131072998, "global_step": 106101, "epoch": 2526} {"train_loss": -6.363085746765137, "global_step": 106102, "epoch": 2526} {"train_loss": -6.492337703704834, "global_step": 106103, "epoch": 2526} {"train_loss": -6.41554069519043, "global_step": 106104, "epoch": 2526} {"train_loss": -6.43481969833374, "global_step": 106105, "epoch": 2526} {"train_loss": -6.455385208129883, "global_step": 106106, "epoch": 2526} {"train_loss": -6.464925765991211, "global_step": 106107, "epoch": 2526} {"train_loss": -6.422561168670654, "global_step": 106108, "epoch": 2526} {"train_loss": -6.411330699920654, "global_step": 106109, "epoch": 2526} {"train_loss": -6.478676795959473, "global_step": 106110, "epoch": 2526} {"train_loss": -6.300967216491699, "global_step": 106111, "epoch": 2526} {"train_loss": -6.381231784820557, "global_step": 106112, "epoch": 2526} {"train_loss": -6.405597686767578, "global_step": 106113, "epoch": 2526} {"train_loss": -6.497220993041992, "global_step": 106114, "epoch": 2526} {"train_loss": -6.46885347366333, "global_step": 106115, "epoch": 2526} {"train_loss": -6.412409782409668, "global_step": 106116, "epoch": 2526} {"train_loss": -6.328182220458984, "global_step": 106117, "epoch": 2526} {"train_loss": -6.372886657714844, "global_step": 106118, "epoch": 2526} {"train_loss": -6.431528091430664, "global_step": 106119, "epoch": 2526} {"train_loss": -6.338509559631348, "global_step": 106120, "epoch": 2526} {"train_loss": -6.396402835845947, "global_step": 106121, "epoch": 2526} {"train_loss": -6.39957332611084, "global_step": 106122, "epoch": 2526} {"train_loss": -6.428067207336426, "global_step": 106123, "epoch": 2526} {"train_loss": -6.471841812133789, "global_step": 106124, "epoch": 2526} {"train_loss": -6.4544758796691895, "global_step": 106125, "epoch": 2526} {"train_loss": -6.412105083465576, "global_step": 106126, "epoch": 2526} {"train_loss": -6.33862829208374, "global_step": 106127, "epoch": 2526} {"train_loss": -6.384700775146484, "global_step": 106128, "epoch": 2526} {"train_loss": -6.418636798858643, "global_step": 106129, "epoch": 2526} {"train_loss": -6.33559513092041, "global_step": 106130, "epoch": 2526} {"train_loss": -6.429265975952148, "global_step": 106131, "epoch": 2526} {"train_loss": -6.445947647094727, "global_step": 106132, "epoch": 2526} {"train_loss": -6.404261032740275, "global_step": 106133, "epoch": 2526, "val_loss": 68050.859375} {"train_loss": -6.282459259033203, "global_step": 106134, "epoch": 2527} {"train_loss": -6.367332458496094, "global_step": 106135, "epoch": 2527} {"train_loss": -6.52044153213501, "global_step": 106136, "epoch": 2527} {"train_loss": -6.541206359863281, "global_step": 106137, "epoch": 2527} {"train_loss": -6.418826580047607, "global_step": 106138, "epoch": 2527} {"train_loss": -6.337930679321289, "global_step": 106139, "epoch": 2527} {"train_loss": -6.410502910614014, "global_step": 106140, "epoch": 2527} {"train_loss": -6.3776655197143555, "global_step": 106141, "epoch": 2527} {"train_loss": -6.269506454467773, "global_step": 106142, "epoch": 2527} {"train_loss": -6.436222076416016, "global_step": 106143, "epoch": 2527} {"train_loss": -6.43449592590332, "global_step": 106144, "epoch": 2527} {"train_loss": -6.473110675811768, "global_step": 106145, "epoch": 2527} {"train_loss": -6.459291458129883, "global_step": 106146, "epoch": 2527} {"train_loss": -6.321272373199463, "global_step": 106147, "epoch": 2527} {"train_loss": -6.393054962158203, "global_step": 106148, "epoch": 2527} {"train_loss": -6.418375492095947, "global_step": 106149, "epoch": 2527} {"train_loss": -6.380823612213135, "global_step": 106150, "epoch": 2527} {"train_loss": -6.396070957183838, "global_step": 106151, "epoch": 2527} {"train_loss": -6.385989189147949, "global_step": 106152, "epoch": 2527} {"train_loss": -6.46113920211792, "global_step": 106153, "epoch": 2527} {"train_loss": -6.397603511810303, "global_step": 106154, "epoch": 2527} {"train_loss": -6.3863983154296875, "global_step": 106155, "epoch": 2527} {"train_loss": -6.4015350341796875, "global_step": 106156, "epoch": 2527} {"train_loss": -6.352903366088867, "global_step": 106157, "epoch": 2527} {"train_loss": -6.454322814941406, "global_step": 106158, "epoch": 2527} {"train_loss": -6.453162670135498, "global_step": 106159, "epoch": 2527} {"train_loss": -6.433344841003418, "global_step": 106160, "epoch": 2527} {"train_loss": -6.250584602355957, "global_step": 106161, "epoch": 2527} {"train_loss": -6.476275444030762, "global_step": 106162, "epoch": 2527} {"train_loss": -6.287325382232666, "global_step": 106163, "epoch": 2527} {"train_loss": -6.47686243057251, "global_step": 106164, "epoch": 2527} {"train_loss": -6.367612838745117, "global_step": 106165, "epoch": 2527} {"train_loss": -6.338071823120117, "global_step": 106166, "epoch": 2527} {"train_loss": -6.405721187591553, "global_step": 106167, "epoch": 2527} {"train_loss": -6.5016279220581055, "global_step": 106168, "epoch": 2527} {"train_loss": -6.265834331512451, "global_step": 106169, "epoch": 2527} {"train_loss": -6.422530174255371, "global_step": 106170, "epoch": 2527} {"train_loss": -6.390254020690918, "global_step": 106171, "epoch": 2527} {"train_loss": -6.338109970092773, "global_step": 106172, "epoch": 2527} {"train_loss": -6.441798686981201, "global_step": 106173, "epoch": 2527} {"train_loss": -6.329213619232178, "global_step": 106174, "epoch": 2527} {"train_loss": -6.395866848173595, "global_step": 106175, "epoch": 2527, "val_loss": 67906.9609375} {"train_loss": -6.409644603729248, "global_step": 106176, "epoch": 2528} {"train_loss": -6.418425559997559, "global_step": 106177, "epoch": 2528} {"train_loss": -6.511046886444092, "global_step": 106178, "epoch": 2528} {"train_loss": -6.578733444213867, "global_step": 106179, "epoch": 2528} {"train_loss": -6.511578559875488, "global_step": 106180, "epoch": 2528} {"train_loss": -6.400079250335693, "global_step": 106181, "epoch": 2528} {"train_loss": -6.479791641235352, "global_step": 106182, "epoch": 2528} {"train_loss": -6.534712791442871, "global_step": 106183, "epoch": 2528} {"train_loss": -6.350337028503418, "global_step": 106184, "epoch": 2528} {"train_loss": -6.402950763702393, "global_step": 106185, "epoch": 2528} {"train_loss": -6.463720798492432, "global_step": 106186, "epoch": 2528} {"train_loss": -6.350980758666992, "global_step": 106187, "epoch": 2528} {"train_loss": -6.360942840576172, "global_step": 106188, "epoch": 2528} {"train_loss": -6.504528045654297, "global_step": 106189, "epoch": 2528} {"train_loss": -6.423551559448242, "global_step": 106190, "epoch": 2528} {"train_loss": -6.3921732902526855, "global_step": 106191, "epoch": 2528} {"train_loss": -6.5117506980896, "global_step": 106192, "epoch": 2528} {"train_loss": -6.459615707397461, "global_step": 106193, "epoch": 2528} {"train_loss": -6.400956153869629, "global_step": 106194, "epoch": 2528} {"train_loss": -6.392923831939697, "global_step": 106195, "epoch": 2528} {"train_loss": -6.333664894104004, "global_step": 106196, "epoch": 2528} {"train_loss": -6.344975471496582, "global_step": 106197, "epoch": 2528} {"train_loss": -6.547259330749512, "global_step": 106198, "epoch": 2528} {"train_loss": -6.3229475021362305, "global_step": 106199, "epoch": 2528} {"train_loss": -6.4910759925842285, "global_step": 106200, "epoch": 2528} {"train_loss": -6.345506191253662, "global_step": 106201, "epoch": 2528} {"train_loss": -6.399348258972168, "global_step": 106202, "epoch": 2528} {"train_loss": -6.326507568359375, "global_step": 106203, "epoch": 2528} {"train_loss": -6.415095329284668, "global_step": 106204, "epoch": 2528} {"train_loss": -6.363195896148682, "global_step": 106205, "epoch": 2528} {"train_loss": -6.460539817810059, "global_step": 106206, "epoch": 2528} {"train_loss": -6.328352928161621, "global_step": 106207, "epoch": 2528} {"train_loss": -6.350339412689209, "global_step": 106208, "epoch": 2528} {"train_loss": -6.5856475830078125, "global_step": 106209, "epoch": 2528} {"train_loss": -6.343036651611328, "global_step": 106210, "epoch": 2528} {"train_loss": -6.4172043800354, "global_step": 106211, "epoch": 2528} {"train_loss": -6.464385986328125, "global_step": 106212, "epoch": 2528} {"train_loss": -6.347072124481201, "global_step": 106213, "epoch": 2528} {"train_loss": -6.4503173828125, "global_step": 106214, "epoch": 2528} {"train_loss": -6.434122562408447, "global_step": 106215, "epoch": 2528} {"train_loss": -6.4032464027404785, "global_step": 106216, "epoch": 2528} {"train_loss": -6.423557315553937, "global_step": 106217, "epoch": 2528, "val_loss": 67684.015625} {"train_loss": -6.465601444244385, "global_step": 106218, "epoch": 2529} {"train_loss": -6.348321914672852, "global_step": 106219, "epoch": 2529} {"train_loss": -6.440188407897949, "global_step": 106220, "epoch": 2529} {"train_loss": -6.397627830505371, "global_step": 106221, "epoch": 2529} {"train_loss": -6.422152042388916, "global_step": 106222, "epoch": 2529} {"train_loss": -6.310687065124512, "global_step": 106223, "epoch": 2529} {"train_loss": -6.406782150268555, "global_step": 106224, "epoch": 2529} {"train_loss": -6.34975528717041, "global_step": 106225, "epoch": 2529} {"train_loss": -6.29677152633667, "global_step": 106226, "epoch": 2529} {"train_loss": -6.456563472747803, "global_step": 106227, "epoch": 2529} {"train_loss": -6.373734474182129, "global_step": 106228, "epoch": 2529} {"train_loss": -6.322358131408691, "global_step": 106229, "epoch": 2529} {"train_loss": -6.439311981201172, "global_step": 106230, "epoch": 2529} {"train_loss": -6.457310676574707, "global_step": 106231, "epoch": 2529} {"train_loss": -6.400596618652344, "global_step": 106232, "epoch": 2529} {"train_loss": -6.358989715576172, "global_step": 106233, "epoch": 2529} {"train_loss": -6.428778648376465, "global_step": 106234, "epoch": 2529} {"train_loss": -6.5306830406188965, "global_step": 106235, "epoch": 2529} {"train_loss": -6.492940425872803, "global_step": 106236, "epoch": 2529} {"train_loss": -6.418703079223633, "global_step": 106237, "epoch": 2529} {"train_loss": -6.409392833709717, "global_step": 106238, "epoch": 2529} {"train_loss": -6.34792423248291, "global_step": 106239, "epoch": 2529} {"train_loss": -6.395616054534912, "global_step": 106240, "epoch": 2529} {"train_loss": -6.437323093414307, "global_step": 106241, "epoch": 2529} {"train_loss": -6.347315311431885, "global_step": 106242, "epoch": 2529} {"train_loss": -6.4449334144592285, "global_step": 106243, "epoch": 2529} {"train_loss": -6.290771007537842, "global_step": 106244, "epoch": 2529} {"train_loss": -6.3232598304748535, "global_step": 106245, "epoch": 2529} {"train_loss": -6.4141526222229, "global_step": 106246, "epoch": 2529} {"train_loss": -6.391010284423828, "global_step": 106247, "epoch": 2529} {"train_loss": -6.186987400054932, "global_step": 106248, "epoch": 2529} {"train_loss": -6.347024917602539, "global_step": 106249, "epoch": 2529} {"train_loss": -6.293025016784668, "global_step": 106250, "epoch": 2529} {"train_loss": -6.367041110992432, "global_step": 106251, "epoch": 2529} {"train_loss": -6.382920742034912, "global_step": 106252, "epoch": 2529} {"train_loss": -6.52597188949585, "global_step": 106253, "epoch": 2529} {"train_loss": -6.432329177856445, "global_step": 106254, "epoch": 2529} {"train_loss": -6.411533832550049, "global_step": 106255, "epoch": 2529} {"train_loss": -6.436625003814697, "global_step": 106256, "epoch": 2529} {"train_loss": -6.374819755554199, "global_step": 106257, "epoch": 2529} {"train_loss": -6.341078758239746, "global_step": 106258, "epoch": 2529} {"train_loss": -6.390217247463408, "global_step": 106259, "epoch": 2529, "val_loss": 67665.40625} {"train_loss": -6.412914276123047, "global_step": 106260, "epoch": 2530} {"train_loss": -6.410272121429443, "global_step": 106261, "epoch": 2530} {"train_loss": -6.376251220703125, "global_step": 106262, "epoch": 2530} {"train_loss": -6.279085159301758, "global_step": 106263, "epoch": 2530} {"train_loss": -6.2350873947143555, "global_step": 106264, "epoch": 2530} {"train_loss": -6.290548324584961, "global_step": 106265, "epoch": 2530} {"train_loss": -6.185263156890869, "global_step": 106266, "epoch": 2530} {"train_loss": -6.333690166473389, "global_step": 106267, "epoch": 2530} {"train_loss": -6.212550640106201, "global_step": 106268, "epoch": 2530} {"train_loss": -6.3087029457092285, "global_step": 106269, "epoch": 2530} {"train_loss": -6.264822006225586, "global_step": 106270, "epoch": 2530} {"train_loss": -6.381122589111328, "global_step": 106271, "epoch": 2530} {"train_loss": -6.40297794342041, "global_step": 106272, "epoch": 2530} {"train_loss": -6.276390075683594, "global_step": 106273, "epoch": 2530} {"train_loss": -6.357151985168457, "global_step": 106274, "epoch": 2530} {"train_loss": -6.194873809814453, "global_step": 106275, "epoch": 2530} {"train_loss": -6.420118808746338, "global_step": 106276, "epoch": 2530} {"train_loss": -6.301279067993164, "global_step": 106277, "epoch": 2530} {"train_loss": -6.293091297149658, "global_step": 106278, "epoch": 2530} {"train_loss": -6.265167236328125, "global_step": 106279, "epoch": 2530} {"train_loss": -6.388338088989258, "global_step": 106280, "epoch": 2530} {"train_loss": -6.211819648742676, "global_step": 106281, "epoch": 2530} {"train_loss": -6.278138160705566, "global_step": 106282, "epoch": 2530} {"train_loss": -6.328695774078369, "global_step": 106283, "epoch": 2530} {"train_loss": -6.35343074798584, "global_step": 106284, "epoch": 2530} {"train_loss": -6.305171012878418, "global_step": 106285, "epoch": 2530} {"train_loss": -6.415329456329346, "global_step": 106286, "epoch": 2530} {"train_loss": -6.368786334991455, "global_step": 106287, "epoch": 2530} {"train_loss": -6.397464752197266, "global_step": 106288, "epoch": 2530} {"train_loss": -6.193206787109375, "global_step": 106289, "epoch": 2530} {"train_loss": -6.361767768859863, "global_step": 106290, "epoch": 2530} {"train_loss": -6.352271556854248, "global_step": 106291, "epoch": 2530} {"train_loss": -6.427969455718994, "global_step": 106292, "epoch": 2530} {"train_loss": -6.247004985809326, "global_step": 106293, "epoch": 2530} {"train_loss": -6.329105377197266, "global_step": 106294, "epoch": 2530} {"train_loss": -6.425336837768555, "global_step": 106295, "epoch": 2530} {"train_loss": -6.397798538208008, "global_step": 106296, "epoch": 2530} {"train_loss": -6.455928802490234, "global_step": 106297, "epoch": 2530} {"train_loss": -6.368600368499756, "global_step": 106298, "epoch": 2530} {"train_loss": -6.2706522941589355, "global_step": 106299, "epoch": 2530} {"train_loss": -6.534984111785889, "global_step": 106300, "epoch": 2530} {"train_loss": -6.332751103809902, "global_step": 106301, "epoch": 2530, "val_loss": 67936.6796875} {"train_loss": -6.48261022567749, "global_step": 106302, "epoch": 2531} {"train_loss": -6.420969009399414, "global_step": 106303, "epoch": 2531} {"train_loss": -6.442076683044434, "global_step": 106304, "epoch": 2531} {"train_loss": -6.415604591369629, "global_step": 106305, "epoch": 2531} {"train_loss": -6.365825653076172, "global_step": 106306, "epoch": 2531} {"train_loss": -6.357318878173828, "global_step": 106307, "epoch": 2531} {"train_loss": -6.494961261749268, "global_step": 106308, "epoch": 2531} {"train_loss": -6.476784706115723, "global_step": 106309, "epoch": 2531} {"train_loss": -6.356741905212402, "global_step": 106310, "epoch": 2531} {"train_loss": -6.3511128425598145, "global_step": 106311, "epoch": 2531} {"train_loss": -6.300012588500977, "global_step": 106312, "epoch": 2531} {"train_loss": -6.444441795349121, "global_step": 106313, "epoch": 2531} {"train_loss": -6.421922206878662, "global_step": 106314, "epoch": 2531} {"train_loss": -6.470712661743164, "global_step": 106315, "epoch": 2531} {"train_loss": -6.394942283630371, "global_step": 106316, "epoch": 2531} {"train_loss": -6.343857765197754, "global_step": 106317, "epoch": 2531} {"train_loss": -6.402858257293701, "global_step": 106318, "epoch": 2531} {"train_loss": -6.4657745361328125, "global_step": 106319, "epoch": 2531} {"train_loss": -6.246725082397461, "global_step": 106320, "epoch": 2531} {"train_loss": -6.238188743591309, "global_step": 106321, "epoch": 2531} {"train_loss": -6.35544490814209, "global_step": 106322, "epoch": 2531} {"train_loss": -6.3056817054748535, "global_step": 106323, "epoch": 2531} {"train_loss": -6.376125812530518, "global_step": 106324, "epoch": 2531} {"train_loss": -6.455399513244629, "global_step": 106325, "epoch": 2531} {"train_loss": -6.391088008880615, "global_step": 106326, "epoch": 2531} {"train_loss": -6.35109806060791, "global_step": 106327, "epoch": 2531} {"train_loss": -6.376152038574219, "global_step": 106328, "epoch": 2531} {"train_loss": -6.374185562133789, "global_step": 106329, "epoch": 2531} {"train_loss": -6.381399154663086, "global_step": 106330, "epoch": 2531} {"train_loss": -6.360156059265137, "global_step": 106331, "epoch": 2531} {"train_loss": -6.391274452209473, "global_step": 106332, "epoch": 2531} {"train_loss": -6.354082107543945, "global_step": 106333, "epoch": 2531} {"train_loss": -6.223087310791016, "global_step": 106334, "epoch": 2531} {"train_loss": -6.500936508178711, "global_step": 106335, "epoch": 2531} {"train_loss": -6.337704658508301, "global_step": 106336, "epoch": 2531} {"train_loss": -6.290867805480957, "global_step": 106337, "epoch": 2531} {"train_loss": -6.373562335968018, "global_step": 106338, "epoch": 2531} {"train_loss": -6.221102714538574, "global_step": 106339, "epoch": 2531} {"train_loss": -6.293240070343018, "global_step": 106340, "epoch": 2531} {"train_loss": -6.274749755859375, "global_step": 106341, "epoch": 2531} {"train_loss": -6.476604461669922, "global_step": 106342, "epoch": 2531} {"train_loss": -6.370288383393061, "global_step": 106343, "epoch": 2531, "val_loss": 67811.578125} {"train_loss": -6.398568153381348, "global_step": 106344, "epoch": 2532} {"train_loss": -6.27799654006958, "global_step": 106345, "epoch": 2532} {"train_loss": -6.396289825439453, "global_step": 106346, "epoch": 2532} {"train_loss": -6.314750671386719, "global_step": 106347, "epoch": 2532} {"train_loss": -6.394386291503906, "global_step": 106348, "epoch": 2532} {"train_loss": -6.332920074462891, "global_step": 106349, "epoch": 2532} {"train_loss": -6.40318489074707, "global_step": 106350, "epoch": 2532} {"train_loss": -6.239134788513184, "global_step": 106351, "epoch": 2532} {"train_loss": -6.307507514953613, "global_step": 106352, "epoch": 2532} {"train_loss": -6.454282760620117, "global_step": 106353, "epoch": 2532} {"train_loss": -6.315850257873535, "global_step": 106354, "epoch": 2532} {"train_loss": -6.391360282897949, "global_step": 106355, "epoch": 2532} {"train_loss": -6.3539137840271, "global_step": 106356, "epoch": 2532} {"train_loss": -6.477337837219238, "global_step": 106357, "epoch": 2532} {"train_loss": -6.366830825805664, "global_step": 106358, "epoch": 2532} {"train_loss": -6.477740287780762, "global_step": 106359, "epoch": 2532} {"train_loss": -6.373889923095703, "global_step": 106360, "epoch": 2532} {"train_loss": -6.453519344329834, "global_step": 106361, "epoch": 2532} {"train_loss": -6.4688615798950195, "global_step": 106362, "epoch": 2532} {"train_loss": -6.303244590759277, "global_step": 106363, "epoch": 2532} {"train_loss": -6.343581676483154, "global_step": 106364, "epoch": 2532} {"train_loss": -6.432488441467285, "global_step": 106365, "epoch": 2532} {"train_loss": -6.507123947143555, "global_step": 106366, "epoch": 2532} {"train_loss": -6.418028831481934, "global_step": 106367, "epoch": 2532} {"train_loss": -6.436979293823242, "global_step": 106368, "epoch": 2532} {"train_loss": -6.385519981384277, "global_step": 106369, "epoch": 2532} {"train_loss": -6.391888618469238, "global_step": 106370, "epoch": 2532} {"train_loss": -6.314623832702637, "global_step": 106371, "epoch": 2532} {"train_loss": -6.424678802490234, "global_step": 106372, "epoch": 2532} {"train_loss": -6.386811256408691, "global_step": 106373, "epoch": 2532} {"train_loss": -6.38539981842041, "global_step": 106374, "epoch": 2532} {"train_loss": -6.372136116027832, "global_step": 106375, "epoch": 2532} {"train_loss": -6.462671756744385, "global_step": 106376, "epoch": 2532} {"train_loss": -6.264026641845703, "global_step": 106377, "epoch": 2532} {"train_loss": -6.492266654968262, "global_step": 106378, "epoch": 2532} {"train_loss": -6.446092128753662, "global_step": 106379, "epoch": 2532} {"train_loss": -6.338354110717773, "global_step": 106380, "epoch": 2532} {"train_loss": -6.330319404602051, "global_step": 106381, "epoch": 2532} {"train_loss": -6.414505958557129, "global_step": 106382, "epoch": 2532} {"train_loss": -6.415314674377441, "global_step": 106383, "epoch": 2532} {"train_loss": -6.393976211547852, "global_step": 106384, "epoch": 2532} {"train_loss": -6.391089893522716, "global_step": 106385, "epoch": 2532, "val_loss": 67818.0390625} {"train_loss": -6.482414722442627, "global_step": 106386, "epoch": 2533} {"train_loss": -6.485994815826416, "global_step": 106387, "epoch": 2533} {"train_loss": -6.485134124755859, "global_step": 106388, "epoch": 2533} {"train_loss": -6.436535835266113, "global_step": 106389, "epoch": 2533} {"train_loss": -6.527109622955322, "global_step": 106390, "epoch": 2533} {"train_loss": -6.427328109741211, "global_step": 106391, "epoch": 2533} {"train_loss": -6.407068729400635, "global_step": 106392, "epoch": 2533} {"train_loss": -6.474936008453369, "global_step": 106393, "epoch": 2533} {"train_loss": -6.311530113220215, "global_step": 106394, "epoch": 2533} {"train_loss": -6.394281387329102, "global_step": 106395, "epoch": 2533} {"train_loss": -6.531448841094971, "global_step": 106396, "epoch": 2533} {"train_loss": -6.379743576049805, "global_step": 106397, "epoch": 2533} {"train_loss": -6.543698310852051, "global_step": 106398, "epoch": 2533} {"train_loss": -6.507136344909668, "global_step": 106399, "epoch": 2533} {"train_loss": -6.574061393737793, "global_step": 106400, "epoch": 2533} {"train_loss": -6.4881744384765625, "global_step": 106401, "epoch": 2533} {"train_loss": -6.364891052246094, "global_step": 106402, "epoch": 2533} {"train_loss": -6.419761657714844, "global_step": 106403, "epoch": 2533} {"train_loss": -6.392066478729248, "global_step": 106404, "epoch": 2533} {"train_loss": -6.363743782043457, "global_step": 106405, "epoch": 2533} {"train_loss": -6.489893913269043, "global_step": 106406, "epoch": 2533} {"train_loss": -6.418431282043457, "global_step": 106407, "epoch": 2533} {"train_loss": -6.377056121826172, "global_step": 106408, "epoch": 2533} {"train_loss": -6.379298210144043, "global_step": 106409, "epoch": 2533} {"train_loss": -6.463987827301025, "global_step": 106410, "epoch": 2533} {"train_loss": -6.396834373474121, "global_step": 106411, "epoch": 2533} {"train_loss": -6.433366775512695, "global_step": 106412, "epoch": 2533} {"train_loss": -6.459924697875977, "global_step": 106413, "epoch": 2533} {"train_loss": -6.4327192306518555, "global_step": 106414, "epoch": 2533} {"train_loss": -6.429760932922363, "global_step": 106415, "epoch": 2533} {"train_loss": -6.47078800201416, "global_step": 106416, "epoch": 2533} {"train_loss": -6.401821613311768, "global_step": 106417, "epoch": 2533} {"train_loss": -6.351062774658203, "global_step": 106418, "epoch": 2533} {"train_loss": -6.318558692932129, "global_step": 106419, "epoch": 2533} {"train_loss": -6.401195049285889, "global_step": 106420, "epoch": 2533} {"train_loss": -6.438478469848633, "global_step": 106421, "epoch": 2533} {"train_loss": -6.333926200866699, "global_step": 106422, "epoch": 2533} {"train_loss": -6.461962699890137, "global_step": 106423, "epoch": 2533} {"train_loss": -6.502243995666504, "global_step": 106424, "epoch": 2533} {"train_loss": -6.388811111450195, "global_step": 106425, "epoch": 2533} {"train_loss": -6.337739944458008, "global_step": 106426, "epoch": 2533} {"train_loss": -6.4328861350104924, "global_step": 106427, "epoch": 2533, "val_loss": 67777.234375} {"train_loss": -6.408748626708984, "global_step": 106428, "epoch": 2534} {"train_loss": -6.346200942993164, "global_step": 106429, "epoch": 2534} {"train_loss": -6.397272109985352, "global_step": 106430, "epoch": 2534} {"train_loss": -6.403465270996094, "global_step": 106431, "epoch": 2534} {"train_loss": -6.384207248687744, "global_step": 106432, "epoch": 2534} {"train_loss": -6.391049385070801, "global_step": 106433, "epoch": 2534} {"train_loss": -6.466401100158691, "global_step": 106434, "epoch": 2534} {"train_loss": -6.432567596435547, "global_step": 106435, "epoch": 2534} {"train_loss": -6.427668571472168, "global_step": 106436, "epoch": 2534} {"train_loss": -6.312900543212891, "global_step": 106437, "epoch": 2534} {"train_loss": -6.470231056213379, "global_step": 106438, "epoch": 2534} {"train_loss": -6.367780685424805, "global_step": 106439, "epoch": 2534} {"train_loss": -6.372453689575195, "global_step": 106440, "epoch": 2534} {"train_loss": -6.226164817810059, "global_step": 106441, "epoch": 2534} {"train_loss": -6.468203544616699, "global_step": 106442, "epoch": 2534} {"train_loss": -6.3405985832214355, "global_step": 106443, "epoch": 2534} {"train_loss": -6.361114978790283, "global_step": 106444, "epoch": 2534} {"train_loss": -6.396971225738525, "global_step": 106445, "epoch": 2534} {"train_loss": -6.389791488647461, "global_step": 106446, "epoch": 2534} {"train_loss": -6.43897819519043, "global_step": 106447, "epoch": 2534} {"train_loss": -6.405638694763184, "global_step": 106448, "epoch": 2534} {"train_loss": -6.455601215362549, "global_step": 106449, "epoch": 2534} {"train_loss": -6.421736717224121, "global_step": 106450, "epoch": 2534} {"train_loss": -6.496954917907715, "global_step": 106451, "epoch": 2534} {"train_loss": -6.418690204620361, "global_step": 106452, "epoch": 2534} {"train_loss": -6.397268295288086, "global_step": 106453, "epoch": 2534} {"train_loss": -6.448375701904297, "global_step": 106454, "epoch": 2534} {"train_loss": -6.447234630584717, "global_step": 106455, "epoch": 2534} {"train_loss": -6.471837997436523, "global_step": 106456, "epoch": 2534} {"train_loss": -6.372237205505371, "global_step": 106457, "epoch": 2534} {"train_loss": -6.355301380157471, "global_step": 106458, "epoch": 2534} {"train_loss": -6.418191432952881, "global_step": 106459, "epoch": 2534} {"train_loss": -6.398439407348633, "global_step": 106460, "epoch": 2534} {"train_loss": -6.400585174560547, "global_step": 106461, "epoch": 2534} {"train_loss": -6.391913414001465, "global_step": 106462, "epoch": 2534} {"train_loss": -6.328798294067383, "global_step": 106463, "epoch": 2534} {"train_loss": -6.370630264282227, "global_step": 106464, "epoch": 2534} {"train_loss": -6.381745338439941, "global_step": 106465, "epoch": 2534} {"train_loss": -6.31947135925293, "global_step": 106466, "epoch": 2534} {"train_loss": -6.344402313232422, "global_step": 106467, "epoch": 2534} {"train_loss": -6.479058265686035, "global_step": 106468, "epoch": 2534} {"train_loss": -6.396848428817022, "global_step": 106469, "epoch": 2534, "val_loss": 68106.171875} {"train_loss": -6.419007301330566, "global_step": 106470, "epoch": 2535} {"train_loss": -6.447513103485107, "global_step": 106471, "epoch": 2535} {"train_loss": -6.457513332366943, "global_step": 106472, "epoch": 2535} {"train_loss": -6.376351833343506, "global_step": 106473, "epoch": 2535} {"train_loss": -6.366214752197266, "global_step": 106474, "epoch": 2535} {"train_loss": -6.355978012084961, "global_step": 106475, "epoch": 2535} {"train_loss": -6.395686149597168, "global_step": 106476, "epoch": 2535} {"train_loss": -6.285978317260742, "global_step": 106477, "epoch": 2535} {"train_loss": -6.299203872680664, "global_step": 106478, "epoch": 2535} {"train_loss": -6.545017719268799, "global_step": 106479, "epoch": 2535} {"train_loss": -6.35413122177124, "global_step": 106480, "epoch": 2535} {"train_loss": -6.335196495056152, "global_step": 106481, "epoch": 2535} {"train_loss": -6.436445236206055, "global_step": 106482, "epoch": 2535} {"train_loss": -6.307925224304199, "global_step": 106483, "epoch": 2535} {"train_loss": -6.486965179443359, "global_step": 106484, "epoch": 2535} {"train_loss": -6.364426612854004, "global_step": 106485, "epoch": 2535} {"train_loss": -6.421647071838379, "global_step": 106486, "epoch": 2535} {"train_loss": -6.300246238708496, "global_step": 106487, "epoch": 2535} {"train_loss": -6.311159133911133, "global_step": 106488, "epoch": 2535} {"train_loss": -6.406981468200684, "global_step": 106489, "epoch": 2535} {"train_loss": -6.313085079193115, "global_step": 106490, "epoch": 2535} {"train_loss": -6.49281120300293, "global_step": 106491, "epoch": 2535} {"train_loss": -6.4747819900512695, "global_step": 106492, "epoch": 2535} {"train_loss": -6.3631591796875, "global_step": 106493, "epoch": 2535} {"train_loss": -6.425262451171875, "global_step": 106494, "epoch": 2535} {"train_loss": -6.442462921142578, "global_step": 106495, "epoch": 2535} {"train_loss": -6.525781154632568, "global_step": 106496, "epoch": 2535} {"train_loss": -6.508052825927734, "global_step": 106497, "epoch": 2535} {"train_loss": -6.361159324645996, "global_step": 106498, "epoch": 2535} {"train_loss": -6.433455467224121, "global_step": 106499, "epoch": 2535} {"train_loss": -6.427550792694092, "global_step": 106500, "epoch": 2535} {"train_loss": -6.4209699630737305, "global_step": 106501, "epoch": 2535} {"train_loss": -6.464877128601074, "global_step": 106502, "epoch": 2535} {"train_loss": -6.527975559234619, "global_step": 106503, "epoch": 2535} {"train_loss": -6.435971260070801, "global_step": 106504, "epoch": 2535} {"train_loss": -6.435386657714844, "global_step": 106505, "epoch": 2535} {"train_loss": -6.380466461181641, "global_step": 106506, "epoch": 2535} {"train_loss": -6.2859601974487305, "global_step": 106507, "epoch": 2535} {"train_loss": -6.495781421661377, "global_step": 106508, "epoch": 2535} {"train_loss": -6.420149803161621, "global_step": 106509, "epoch": 2535} {"train_loss": -6.4417724609375, "global_step": 106510, "epoch": 2535} {"train_loss": -6.409738903953915, "global_step": 106511, "epoch": 2535, "val_loss": 67994.171875} {"train_loss": -6.534743785858154, "global_step": 106512, "epoch": 2536} {"train_loss": -6.343338489532471, "global_step": 106513, "epoch": 2536} {"train_loss": -6.470391750335693, "global_step": 106514, "epoch": 2536} {"train_loss": -6.489566326141357, "global_step": 106515, "epoch": 2536} {"train_loss": -6.463720321655273, "global_step": 106516, "epoch": 2536} {"train_loss": -6.455815315246582, "global_step": 106517, "epoch": 2536} {"train_loss": -6.443770408630371, "global_step": 106518, "epoch": 2536} {"train_loss": -6.459987640380859, "global_step": 106519, "epoch": 2536} {"train_loss": -6.373465061187744, "global_step": 106520, "epoch": 2536} {"train_loss": -6.398697853088379, "global_step": 106521, "epoch": 2536} {"train_loss": -6.479339122772217, "global_step": 106522, "epoch": 2536} {"train_loss": -6.426766872406006, "global_step": 106523, "epoch": 2536} {"train_loss": -6.626076698303223, "global_step": 106524, "epoch": 2536} {"train_loss": -6.4294753074646, "global_step": 106525, "epoch": 2536} {"train_loss": -6.452653884887695, "global_step": 106526, "epoch": 2536} {"train_loss": -6.5210347175598145, "global_step": 106527, "epoch": 2536} {"train_loss": -6.250326156616211, "global_step": 106528, "epoch": 2536} {"train_loss": -6.348027229309082, "global_step": 106529, "epoch": 2536} {"train_loss": -6.321863174438477, "global_step": 106530, "epoch": 2536} {"train_loss": -6.27016544342041, "global_step": 106531, "epoch": 2536} {"train_loss": -6.400887966156006, "global_step": 106532, "epoch": 2536} {"train_loss": -6.394444465637207, "global_step": 106533, "epoch": 2536} {"train_loss": -6.378511428833008, "global_step": 106534, "epoch": 2536} {"train_loss": -6.346547603607178, "global_step": 106535, "epoch": 2536} {"train_loss": -6.474841117858887, "global_step": 106536, "epoch": 2536} {"train_loss": -6.342080116271973, "global_step": 106537, "epoch": 2536} {"train_loss": -6.323487758636475, "global_step": 106538, "epoch": 2536} {"train_loss": -6.454383850097656, "global_step": 106539, "epoch": 2536} {"train_loss": -6.325766563415527, "global_step": 106540, "epoch": 2536} {"train_loss": -6.5294013023376465, "global_step": 106541, "epoch": 2536} {"train_loss": -6.344144821166992, "global_step": 106542, "epoch": 2536} {"train_loss": -6.218570232391357, "global_step": 106543, "epoch": 2536} {"train_loss": -6.302836894989014, "global_step": 106544, "epoch": 2536} {"train_loss": -6.340425491333008, "global_step": 106545, "epoch": 2536} {"train_loss": -6.400390625, "global_step": 106546, "epoch": 2536} {"train_loss": -6.279413223266602, "global_step": 106547, "epoch": 2536} {"train_loss": -6.316825866699219, "global_step": 106548, "epoch": 2536} {"train_loss": -6.183781623840332, "global_step": 106549, "epoch": 2536} {"train_loss": -6.252124309539795, "global_step": 106550, "epoch": 2536} {"train_loss": -6.377070426940918, "global_step": 106551, "epoch": 2536} {"train_loss": -6.370909690856934, "global_step": 106552, "epoch": 2536} {"train_loss": -6.38702993165879, "global_step": 106553, "epoch": 2536, "val_loss": 67940.109375} {"train_loss": -6.360581398010254, "global_step": 106554, "epoch": 2537} {"train_loss": -6.267867088317871, "global_step": 106555, "epoch": 2537} {"train_loss": -6.410120010375977, "global_step": 106556, "epoch": 2537} {"train_loss": -6.26799201965332, "global_step": 106557, "epoch": 2537} {"train_loss": -6.4510111808776855, "global_step": 106558, "epoch": 2537} {"train_loss": -6.330855846405029, "global_step": 106559, "epoch": 2537} {"train_loss": -6.599993705749512, "global_step": 106560, "epoch": 2537} {"train_loss": -6.419355392456055, "global_step": 106561, "epoch": 2537} {"train_loss": -6.429699897766113, "global_step": 106562, "epoch": 2537} {"train_loss": -6.498337268829346, "global_step": 106563, "epoch": 2537} {"train_loss": -6.333950519561768, "global_step": 106564, "epoch": 2537} {"train_loss": -6.430217266082764, "global_step": 106565, "epoch": 2537} {"train_loss": -6.45661735534668, "global_step": 106566, "epoch": 2537} {"train_loss": -6.333797454833984, "global_step": 106567, "epoch": 2537} {"train_loss": -6.340893745422363, "global_step": 106568, "epoch": 2537} {"train_loss": -6.32574987411499, "global_step": 106569, "epoch": 2537} {"train_loss": -6.391817092895508, "global_step": 106570, "epoch": 2537} {"train_loss": -6.378025531768799, "global_step": 106571, "epoch": 2537} {"train_loss": -6.202574253082275, "global_step": 106572, "epoch": 2537} {"train_loss": -6.42579984664917, "global_step": 106573, "epoch": 2537} {"train_loss": -6.413904190063477, "global_step": 106574, "epoch": 2537} {"train_loss": -6.138444423675537, "global_step": 106575, "epoch": 2537} {"train_loss": -6.3307881355285645, "global_step": 106576, "epoch": 2537} {"train_loss": -6.298717021942139, "global_step": 106577, "epoch": 2537} {"train_loss": -6.321817398071289, "global_step": 106578, "epoch": 2537} {"train_loss": -6.376192092895508, "global_step": 106579, "epoch": 2537} {"train_loss": -6.331876754760742, "global_step": 106580, "epoch": 2537} {"train_loss": -6.415132522583008, "global_step": 106581, "epoch": 2537} {"train_loss": -6.207568168640137, "global_step": 106582, "epoch": 2537} {"train_loss": -6.356043338775635, "global_step": 106583, "epoch": 2537} {"train_loss": -6.3202056884765625, "global_step": 106584, "epoch": 2537} {"train_loss": -6.315404891967773, "global_step": 106585, "epoch": 2537} {"train_loss": -6.398617267608643, "global_step": 106586, "epoch": 2537} {"train_loss": -6.304501533508301, "global_step": 106587, "epoch": 2537} {"train_loss": -6.385227203369141, "global_step": 106588, "epoch": 2537} {"train_loss": -6.299854755401611, "global_step": 106589, "epoch": 2537} {"train_loss": -6.319062232971191, "global_step": 106590, "epoch": 2537} {"train_loss": -6.419472694396973, "global_step": 106591, "epoch": 2537} {"train_loss": -6.397603988647461, "global_step": 106592, "epoch": 2537} {"train_loss": -6.332462310791016, "global_step": 106593, "epoch": 2537} {"train_loss": -6.3558349609375, "global_step": 106594, "epoch": 2537} {"train_loss": -6.359633763631185, "global_step": 106595, "epoch": 2537, "val_loss": 67791.5} {"train_loss": -6.343698501586914, "global_step": 106596, "epoch": 2538} {"train_loss": -6.369999885559082, "global_step": 106597, "epoch": 2538} {"train_loss": -6.393710136413574, "global_step": 106598, "epoch": 2538} {"train_loss": -6.29378604888916, "global_step": 106599, "epoch": 2538} {"train_loss": -6.358148574829102, "global_step": 106600, "epoch": 2538} {"train_loss": -6.439458847045898, "global_step": 106601, "epoch": 2538} {"train_loss": -6.435099124908447, "global_step": 106602, "epoch": 2538} {"train_loss": -6.475460052490234, "global_step": 106603, "epoch": 2538} {"train_loss": -6.290236473083496, "global_step": 106604, "epoch": 2538} {"train_loss": -6.389936447143555, "global_step": 106605, "epoch": 2538} {"train_loss": -6.433381080627441, "global_step": 106606, "epoch": 2538} {"train_loss": -6.398345947265625, "global_step": 106607, "epoch": 2538} {"train_loss": -6.237121105194092, "global_step": 106608, "epoch": 2538} {"train_loss": -6.3910675048828125, "global_step": 106609, "epoch": 2538} {"train_loss": -6.380895137786865, "global_step": 106610, "epoch": 2538} {"train_loss": -6.380975723266602, "global_step": 106611, "epoch": 2538} {"train_loss": -6.473970890045166, "global_step": 106612, "epoch": 2538} {"train_loss": -6.418829917907715, "global_step": 106613, "epoch": 2538} {"train_loss": -6.385766983032227, "global_step": 106614, "epoch": 2538} {"train_loss": -6.363457679748535, "global_step": 106615, "epoch": 2538} {"train_loss": -6.317112445831299, "global_step": 106616, "epoch": 2538} {"train_loss": -6.428920269012451, "global_step": 106617, "epoch": 2538} {"train_loss": -6.363508224487305, "global_step": 106618, "epoch": 2538} {"train_loss": -6.457235813140869, "global_step": 106619, "epoch": 2538} {"train_loss": -6.314401149749756, "global_step": 106620, "epoch": 2538} {"train_loss": -6.3764543533325195, "global_step": 106621, "epoch": 2538} {"train_loss": -6.435526371002197, "global_step": 106622, "epoch": 2538} {"train_loss": -6.452546119689941, "global_step": 106623, "epoch": 2538} {"train_loss": -6.371709823608398, "global_step": 106624, "epoch": 2538} {"train_loss": -6.526027202606201, "global_step": 106625, "epoch": 2538} {"train_loss": -6.3662519454956055, "global_step": 106626, "epoch": 2538} {"train_loss": -6.3310651779174805, "global_step": 106627, "epoch": 2538} {"train_loss": -6.4289751052856445, "global_step": 106628, "epoch": 2538} {"train_loss": -6.416350364685059, "global_step": 106629, "epoch": 2538} {"train_loss": -6.3581085205078125, "global_step": 106630, "epoch": 2538} {"train_loss": -6.402956485748291, "global_step": 106631, "epoch": 2538} {"train_loss": -6.448125839233398, "global_step": 106632, "epoch": 2538} {"train_loss": -6.467996120452881, "global_step": 106633, "epoch": 2538} {"train_loss": -6.402551174163818, "global_step": 106634, "epoch": 2538} {"train_loss": -6.306520462036133, "global_step": 106635, "epoch": 2538} {"train_loss": -6.337162971496582, "global_step": 106636, "epoch": 2538} {"train_loss": -6.388536226181757, "global_step": 106637, "epoch": 2538, "val_loss": 68042.6328125} {"train_loss": -6.439702033996582, "global_step": 106638, "epoch": 2539} {"train_loss": -6.342517852783203, "global_step": 106639, "epoch": 2539} {"train_loss": -6.239973068237305, "global_step": 106640, "epoch": 2539} {"train_loss": -6.333791732788086, "global_step": 106641, "epoch": 2539} {"train_loss": -6.442633628845215, "global_step": 106642, "epoch": 2539} {"train_loss": -6.410912990570068, "global_step": 106643, "epoch": 2539} {"train_loss": -6.286703586578369, "global_step": 106644, "epoch": 2539} {"train_loss": -6.45134162902832, "global_step": 106645, "epoch": 2539} {"train_loss": -6.339870452880859, "global_step": 106646, "epoch": 2539} {"train_loss": -6.308198928833008, "global_step": 106647, "epoch": 2539} {"train_loss": -6.383506774902344, "global_step": 106648, "epoch": 2539} {"train_loss": -6.347484111785889, "global_step": 106649, "epoch": 2539} {"train_loss": -6.445518493652344, "global_step": 106650, "epoch": 2539} {"train_loss": -6.396358489990234, "global_step": 106651, "epoch": 2539} {"train_loss": -6.458662033081055, "global_step": 106652, "epoch": 2539} {"train_loss": -6.359438896179199, "global_step": 106653, "epoch": 2539} {"train_loss": -6.423846244812012, "global_step": 106654, "epoch": 2539} {"train_loss": -6.355570316314697, "global_step": 106655, "epoch": 2539} {"train_loss": -6.350494384765625, "global_step": 106656, "epoch": 2539} {"train_loss": -6.400599479675293, "global_step": 106657, "epoch": 2539} {"train_loss": -6.341470241546631, "global_step": 106658, "epoch": 2539} {"train_loss": -6.348300457000732, "global_step": 106659, "epoch": 2539} {"train_loss": -6.480257987976074, "global_step": 106660, "epoch": 2539} {"train_loss": -6.48014497756958, "global_step": 106661, "epoch": 2539} {"train_loss": -6.4147539138793945, "global_step": 106662, "epoch": 2539} {"train_loss": -6.4045305252075195, "global_step": 106663, "epoch": 2539} {"train_loss": -6.328731536865234, "global_step": 106664, "epoch": 2539} {"train_loss": -6.417766571044922, "global_step": 106665, "epoch": 2539} {"train_loss": -6.295475959777832, "global_step": 106666, "epoch": 2539} {"train_loss": -6.423707962036133, "global_step": 106667, "epoch": 2539} {"train_loss": -6.419522762298584, "global_step": 106668, "epoch": 2539} {"train_loss": -6.34501838684082, "global_step": 106669, "epoch": 2539} {"train_loss": -6.406686305999756, "global_step": 106670, "epoch": 2539} {"train_loss": -6.305816173553467, "global_step": 106671, "epoch": 2539} {"train_loss": -6.387124538421631, "global_step": 106672, "epoch": 2539} {"train_loss": -6.307965278625488, "global_step": 106673, "epoch": 2539} {"train_loss": -6.427394390106201, "global_step": 106674, "epoch": 2539} {"train_loss": -6.389484882354736, "global_step": 106675, "epoch": 2539} {"train_loss": -6.360420227050781, "global_step": 106676, "epoch": 2539} {"train_loss": -6.3497314453125, "global_step": 106677, "epoch": 2539} {"train_loss": -6.311581611633301, "global_step": 106678, "epoch": 2539} {"train_loss": -6.376851717631022, "global_step": 106679, "epoch": 2539, "val_loss": 68064.1015625} {"train_loss": -6.3808817863464355, "global_step": 106680, "epoch": 2540} {"train_loss": -6.291413307189941, "global_step": 106681, "epoch": 2540} {"train_loss": -6.3714094161987305, "global_step": 106682, "epoch": 2540} {"train_loss": -6.232466220855713, "global_step": 106683, "epoch": 2540} {"train_loss": -6.283094882965088, "global_step": 106684, "epoch": 2540} {"train_loss": -6.317421913146973, "global_step": 106685, "epoch": 2540} {"train_loss": -6.27640438079834, "global_step": 106686, "epoch": 2540} {"train_loss": -6.326015472412109, "global_step": 106687, "epoch": 2540} {"train_loss": -6.4598846435546875, "global_step": 106688, "epoch": 2540} {"train_loss": -6.211317539215088, "global_step": 106689, "epoch": 2540} {"train_loss": -6.360134601593018, "global_step": 106690, "epoch": 2540} {"train_loss": -6.188083648681641, "global_step": 106691, "epoch": 2540} {"train_loss": -6.230148792266846, "global_step": 106692, "epoch": 2540} {"train_loss": -6.3667802810668945, "global_step": 106693, "epoch": 2540} {"train_loss": -6.298937797546387, "global_step": 106694, "epoch": 2540} {"train_loss": -6.322723388671875, "global_step": 106695, "epoch": 2540} {"train_loss": -6.295929431915283, "global_step": 106696, "epoch": 2540} {"train_loss": -6.367988586425781, "global_step": 106697, "epoch": 2540} {"train_loss": -6.238273620605469, "global_step": 106698, "epoch": 2540} {"train_loss": -6.298606872558594, "global_step": 106699, "epoch": 2540} {"train_loss": -6.346410751342773, "global_step": 106700, "epoch": 2540} {"train_loss": -6.32222318649292, "global_step": 106701, "epoch": 2540} {"train_loss": -6.3910393714904785, "global_step": 106702, "epoch": 2540} {"train_loss": -6.40489387512207, "global_step": 106703, "epoch": 2540} {"train_loss": -6.372590065002441, "global_step": 106704, "epoch": 2540} {"train_loss": -6.312826156616211, "global_step": 106705, "epoch": 2540} {"train_loss": -6.33643913269043, "global_step": 106706, "epoch": 2540} {"train_loss": -6.272512435913086, "global_step": 106707, "epoch": 2540} {"train_loss": -6.295992851257324, "global_step": 106708, "epoch": 2540} {"train_loss": -6.35152530670166, "global_step": 106709, "epoch": 2540} {"train_loss": -6.288973331451416, "global_step": 106710, "epoch": 2540} {"train_loss": -6.403325080871582, "global_step": 106711, "epoch": 2540} {"train_loss": -6.347672462463379, "global_step": 106712, "epoch": 2540} {"train_loss": -6.311977386474609, "global_step": 106713, "epoch": 2540} {"train_loss": -6.408288955688477, "global_step": 106714, "epoch": 2540} {"train_loss": -6.350237846374512, "global_step": 106715, "epoch": 2540} {"train_loss": -6.453166961669922, "global_step": 106716, "epoch": 2540} {"train_loss": -6.376953601837158, "global_step": 106717, "epoch": 2540} {"train_loss": -6.288661479949951, "global_step": 106718, "epoch": 2540} {"train_loss": -6.4414825439453125, "global_step": 106719, "epoch": 2540} {"train_loss": -6.351506233215332, "global_step": 106720, "epoch": 2540} {"train_loss": -6.332894120897565, "global_step": 106721, "epoch": 2540, "val_loss": 67928.046875} {"train_loss": -6.444214820861816, "global_step": 106722, "epoch": 2541} {"train_loss": -6.386560440063477, "global_step": 106723, "epoch": 2541} {"train_loss": -6.489606857299805, "global_step": 106724, "epoch": 2541} {"train_loss": -6.319762229919434, "global_step": 106725, "epoch": 2541} {"train_loss": -6.480095863342285, "global_step": 106726, "epoch": 2541} {"train_loss": -6.366296768188477, "global_step": 106727, "epoch": 2541} {"train_loss": -6.396123886108398, "global_step": 106728, "epoch": 2541} {"train_loss": -6.4748735427856445, "global_step": 106729, "epoch": 2541} {"train_loss": -6.355895042419434, "global_step": 106730, "epoch": 2541} {"train_loss": -6.283768653869629, "global_step": 106731, "epoch": 2541} {"train_loss": -6.4823503494262695, "global_step": 106732, "epoch": 2541} {"train_loss": -6.487173557281494, "global_step": 106733, "epoch": 2541} {"train_loss": -6.416982650756836, "global_step": 106734, "epoch": 2541} {"train_loss": -6.423731803894043, "global_step": 106735, "epoch": 2541} {"train_loss": -6.330356121063232, "global_step": 106736, "epoch": 2541} {"train_loss": -6.374605178833008, "global_step": 106737, "epoch": 2541} {"train_loss": -6.433073997497559, "global_step": 106738, "epoch": 2541} {"train_loss": -6.402606010437012, "global_step": 106739, "epoch": 2541} {"train_loss": -6.417915344238281, "global_step": 106740, "epoch": 2541} {"train_loss": -6.366464138031006, "global_step": 106741, "epoch": 2541} {"train_loss": -6.47337532043457, "global_step": 106742, "epoch": 2541} {"train_loss": -6.5014967918396, "global_step": 106743, "epoch": 2541} {"train_loss": -6.404635429382324, "global_step": 106744, "epoch": 2541} {"train_loss": -6.399986743927002, "global_step": 106745, "epoch": 2541} {"train_loss": -6.416284084320068, "global_step": 106746, "epoch": 2541} {"train_loss": -6.404097557067871, "global_step": 106747, "epoch": 2541} {"train_loss": -6.445439338684082, "global_step": 106748, "epoch": 2541} {"train_loss": -6.358052730560303, "global_step": 106749, "epoch": 2541} {"train_loss": -6.325242042541504, "global_step": 106750, "epoch": 2541} {"train_loss": -6.411767482757568, "global_step": 106751, "epoch": 2541} {"train_loss": -6.365746974945068, "global_step": 106752, "epoch": 2541} {"train_loss": -6.392273902893066, "global_step": 106753, "epoch": 2541} {"train_loss": -6.380814552307129, "global_step": 106754, "epoch": 2541} {"train_loss": -6.393743515014648, "global_step": 106755, "epoch": 2541} {"train_loss": -6.425483703613281, "global_step": 106756, "epoch": 2541} {"train_loss": -6.426741600036621, "global_step": 106757, "epoch": 2541} {"train_loss": -6.46310567855835, "global_step": 106758, "epoch": 2541} {"train_loss": -6.498370170593262, "global_step": 106759, "epoch": 2541} {"train_loss": -6.378405570983887, "global_step": 106760, "epoch": 2541} {"train_loss": -6.465129852294922, "global_step": 106761, "epoch": 2541} {"train_loss": -6.437039375305176, "global_step": 106762, "epoch": 2541} {"train_loss": -6.411545753479004, "global_step": 106763, "epoch": 2541, "val_loss": 67833.3515625} {"train_loss": -6.46838903427124, "global_step": 106764, "epoch": 2542} {"train_loss": -6.4896979331970215, "global_step": 106765, "epoch": 2542} {"train_loss": -6.486235618591309, "global_step": 106766, "epoch": 2542} {"train_loss": -6.411140441894531, "global_step": 106767, "epoch": 2542} {"train_loss": -6.446900367736816, "global_step": 106768, "epoch": 2542} {"train_loss": -6.408520698547363, "global_step": 106769, "epoch": 2542} {"train_loss": -6.3991923332214355, "global_step": 106770, "epoch": 2542} {"train_loss": -6.550433158874512, "global_step": 106771, "epoch": 2542} {"train_loss": -6.471402645111084, "global_step": 106772, "epoch": 2542} {"train_loss": -6.390605926513672, "global_step": 106773, "epoch": 2542} {"train_loss": -6.326096057891846, "global_step": 106774, "epoch": 2542} {"train_loss": -6.454240798950195, "global_step": 106775, "epoch": 2542} {"train_loss": -6.451333045959473, "global_step": 106776, "epoch": 2542} {"train_loss": -6.465987205505371, "global_step": 106777, "epoch": 2542} {"train_loss": -6.550492763519287, "global_step": 106778, "epoch": 2542} {"train_loss": -6.391254425048828, "global_step": 106779, "epoch": 2542} {"train_loss": -6.4565749168396, "global_step": 106780, "epoch": 2542} {"train_loss": -6.45345401763916, "global_step": 106781, "epoch": 2542} {"train_loss": -6.370306491851807, "global_step": 106782, "epoch": 2542} {"train_loss": -6.391942024230957, "global_step": 106783, "epoch": 2542} {"train_loss": -6.463822841644287, "global_step": 106784, "epoch": 2542} {"train_loss": -6.4027934074401855, "global_step": 106785, "epoch": 2542} {"train_loss": -6.485981464385986, "global_step": 106786, "epoch": 2542} {"train_loss": -6.503324508666992, "global_step": 106787, "epoch": 2542} {"train_loss": -6.368934631347656, "global_step": 106788, "epoch": 2542} {"train_loss": -6.487645149230957, "global_step": 106789, "epoch": 2542} {"train_loss": -6.438889503479004, "global_step": 106790, "epoch": 2542} {"train_loss": -6.4445672035217285, "global_step": 106791, "epoch": 2542} {"train_loss": -6.440476894378662, "global_step": 106792, "epoch": 2542} {"train_loss": -6.524369239807129, "global_step": 106793, "epoch": 2542} {"train_loss": -6.424824237823486, "global_step": 106794, "epoch": 2542} {"train_loss": -6.4714508056640625, "global_step": 106795, "epoch": 2542} {"train_loss": -6.397424697875977, "global_step": 106796, "epoch": 2542} {"train_loss": -6.4092817306518555, "global_step": 106797, "epoch": 2542} {"train_loss": -6.472665786743164, "global_step": 106798, "epoch": 2542} {"train_loss": -6.4244065284729, "global_step": 106799, "epoch": 2542} {"train_loss": -6.380939960479736, "global_step": 106800, "epoch": 2542} {"train_loss": -6.393874168395996, "global_step": 106801, "epoch": 2542} {"train_loss": -6.3474531173706055, "global_step": 106802, "epoch": 2542} {"train_loss": -6.401549816131592, "global_step": 106803, "epoch": 2542} {"train_loss": -6.4459123611450195, "global_step": 106804, "epoch": 2542} {"train_loss": -6.436528796241397, "global_step": 106805, "epoch": 2542, "val_loss": 67922.78125} {"train_loss": -6.413726806640625, "global_step": 106806, "epoch": 2543} {"train_loss": -6.404934406280518, "global_step": 106807, "epoch": 2543} {"train_loss": -6.373382568359375, "global_step": 106808, "epoch": 2543} {"train_loss": -6.47549295425415, "global_step": 106809, "epoch": 2543} {"train_loss": -6.344871997833252, "global_step": 106810, "epoch": 2543} {"train_loss": -6.384825706481934, "global_step": 106811, "epoch": 2543} {"train_loss": -6.476422309875488, "global_step": 106812, "epoch": 2543} {"train_loss": -6.512930870056152, "global_step": 106813, "epoch": 2543} {"train_loss": -6.307209014892578, "global_step": 106814, "epoch": 2543} {"train_loss": -6.531780242919922, "global_step": 106815, "epoch": 2543} {"train_loss": -6.463327407836914, "global_step": 106816, "epoch": 2543} {"train_loss": -6.342442512512207, "global_step": 106817, "epoch": 2543} {"train_loss": -6.456301689147949, "global_step": 106818, "epoch": 2543} {"train_loss": -6.281902313232422, "global_step": 106819, "epoch": 2543} {"train_loss": -6.344110488891602, "global_step": 106820, "epoch": 2543} {"train_loss": -6.3615641593933105, "global_step": 106821, "epoch": 2543} {"train_loss": -6.448156356811523, "global_step": 106822, "epoch": 2543} {"train_loss": -6.489314556121826, "global_step": 106823, "epoch": 2543} {"train_loss": -6.330904006958008, "global_step": 106824, "epoch": 2543} {"train_loss": -6.291362762451172, "global_step": 106825, "epoch": 2543} {"train_loss": -6.396947860717773, "global_step": 106826, "epoch": 2543} {"train_loss": -6.362571716308594, "global_step": 106827, "epoch": 2543} {"train_loss": -6.379798889160156, "global_step": 106828, "epoch": 2543} {"train_loss": -6.237079620361328, "global_step": 106829, "epoch": 2543} {"train_loss": -6.336853504180908, "global_step": 106830, "epoch": 2543} {"train_loss": -6.411377906799316, "global_step": 106831, "epoch": 2543} {"train_loss": -6.455965995788574, "global_step": 106832, "epoch": 2543} {"train_loss": -6.304722785949707, "global_step": 106833, "epoch": 2543} {"train_loss": -6.319913864135742, "global_step": 106834, "epoch": 2543} {"train_loss": -6.439027786254883, "global_step": 106835, "epoch": 2543} {"train_loss": -6.240195274353027, "global_step": 106836, "epoch": 2543} {"train_loss": -6.461662769317627, "global_step": 106837, "epoch": 2543} {"train_loss": -6.290392875671387, "global_step": 106838, "epoch": 2543} {"train_loss": -6.348964691162109, "global_step": 106839, "epoch": 2543} {"train_loss": -6.377317428588867, "global_step": 106840, "epoch": 2543} {"train_loss": -6.305122375488281, "global_step": 106841, "epoch": 2543} {"train_loss": -6.34677267074585, "global_step": 106842, "epoch": 2543} {"train_loss": -6.249537467956543, "global_step": 106843, "epoch": 2543} {"train_loss": -6.321355819702148, "global_step": 106844, "epoch": 2543} {"train_loss": -6.304238319396973, "global_step": 106845, "epoch": 2543} {"train_loss": -6.419435501098633, "global_step": 106846, "epoch": 2543} {"train_loss": -6.37093566712879, "global_step": 106847, "epoch": 2543, "val_loss": 67918.078125} {"train_loss": -6.286023139953613, "global_step": 106848, "epoch": 2544} {"train_loss": -6.386112213134766, "global_step": 106849, "epoch": 2544} {"train_loss": -6.3584184646606445, "global_step": 106850, "epoch": 2544} {"train_loss": -6.357698440551758, "global_step": 106851, "epoch": 2544} {"train_loss": -6.323816299438477, "global_step": 106852, "epoch": 2544} {"train_loss": -6.287362098693848, "global_step": 106853, "epoch": 2544} {"train_loss": -6.382844924926758, "global_step": 106854, "epoch": 2544} {"train_loss": -6.461857795715332, "global_step": 106855, "epoch": 2544} {"train_loss": -6.48915958404541, "global_step": 106856, "epoch": 2544} {"train_loss": -6.431507587432861, "global_step": 106857, "epoch": 2544} {"train_loss": -6.4551544189453125, "global_step": 106858, "epoch": 2544} {"train_loss": -6.443450450897217, "global_step": 106859, "epoch": 2544} {"train_loss": -6.357714653015137, "global_step": 106860, "epoch": 2544} {"train_loss": -6.378775596618652, "global_step": 106861, "epoch": 2544} {"train_loss": -6.424988746643066, "global_step": 106862, "epoch": 2544} {"train_loss": -6.395994186401367, "global_step": 106863, "epoch": 2544} {"train_loss": -6.4503302574157715, "global_step": 106864, "epoch": 2544} {"train_loss": -6.537656784057617, "global_step": 106865, "epoch": 2544} {"train_loss": -6.464399337768555, "global_step": 106866, "epoch": 2544} {"train_loss": -6.452984809875488, "global_step": 106867, "epoch": 2544} {"train_loss": -6.4054670333862305, "global_step": 106868, "epoch": 2544} {"train_loss": -6.433531761169434, "global_step": 106869, "epoch": 2544} {"train_loss": -6.383735656738281, "global_step": 106870, "epoch": 2544} {"train_loss": -6.431934356689453, "global_step": 106871, "epoch": 2544} {"train_loss": -6.313695907592773, "global_step": 106872, "epoch": 2544} {"train_loss": -6.428948402404785, "global_step": 106873, "epoch": 2544} {"train_loss": -6.468964576721191, "global_step": 106874, "epoch": 2544} {"train_loss": -6.427116870880127, "global_step": 106875, "epoch": 2544} {"train_loss": -6.388125896453857, "global_step": 106876, "epoch": 2544} {"train_loss": -6.417737007141113, "global_step": 106877, "epoch": 2544} {"train_loss": -6.4527130126953125, "global_step": 106878, "epoch": 2544} {"train_loss": -6.4078779220581055, "global_step": 106879, "epoch": 2544} {"train_loss": -6.382636547088623, "global_step": 106880, "epoch": 2544} {"train_loss": -6.48297119140625, "global_step": 106881, "epoch": 2544} {"train_loss": -6.35871696472168, "global_step": 106882, "epoch": 2544} {"train_loss": -6.52608060836792, "global_step": 106883, "epoch": 2544} {"train_loss": -6.472413063049316, "global_step": 106884, "epoch": 2544} {"train_loss": -6.4366841316223145, "global_step": 106885, "epoch": 2544} {"train_loss": -6.334420680999756, "global_step": 106886, "epoch": 2544} {"train_loss": -6.433225154876709, "global_step": 106887, "epoch": 2544} {"train_loss": -6.37559700012207, "global_step": 106888, "epoch": 2544} {"train_loss": -6.414402575719924, "global_step": 106889, "epoch": 2544, "val_loss": 67828.7421875} {"train_loss": -6.556757926940918, "global_step": 106890, "epoch": 2545} {"train_loss": -6.3734331130981445, "global_step": 106891, "epoch": 2545} {"train_loss": -6.4282426834106445, "global_step": 106892, "epoch": 2545} {"train_loss": -6.395099639892578, "global_step": 106893, "epoch": 2545} {"train_loss": -6.423349857330322, "global_step": 106894, "epoch": 2545} {"train_loss": -6.451729774475098, "global_step": 106895, "epoch": 2545} {"train_loss": -6.404560089111328, "global_step": 106896, "epoch": 2545} {"train_loss": -6.477328300476074, "global_step": 106897, "epoch": 2545} {"train_loss": -6.422001838684082, "global_step": 106898, "epoch": 2545} {"train_loss": -6.336920738220215, "global_step": 106899, "epoch": 2545} {"train_loss": -6.300918102264404, "global_step": 106900, "epoch": 2545} {"train_loss": -6.411235809326172, "global_step": 106901, "epoch": 2545} {"train_loss": -6.2833404541015625, "global_step": 106902, "epoch": 2545} {"train_loss": -6.372838497161865, "global_step": 106903, "epoch": 2545} {"train_loss": -6.333385467529297, "global_step": 106904, "epoch": 2545} {"train_loss": -6.349639892578125, "global_step": 106905, "epoch": 2545} {"train_loss": -6.361124038696289, "global_step": 106906, "epoch": 2545} {"train_loss": -6.356316566467285, "global_step": 106907, "epoch": 2545} {"train_loss": -6.337261199951172, "global_step": 106908, "epoch": 2545} {"train_loss": -6.2836151123046875, "global_step": 106909, "epoch": 2545} {"train_loss": -6.361477851867676, "global_step": 106910, "epoch": 2545} {"train_loss": -6.50599479675293, "global_step": 106911, "epoch": 2545} {"train_loss": -6.402502059936523, "global_step": 106912, "epoch": 2545} {"train_loss": -6.400328159332275, "global_step": 106913, "epoch": 2545} {"train_loss": -6.549165725708008, "global_step": 106914, "epoch": 2545} {"train_loss": -6.443791389465332, "global_step": 106915, "epoch": 2545} {"train_loss": -6.474573135375977, "global_step": 106916, "epoch": 2545} {"train_loss": -6.404261589050293, "global_step": 106917, "epoch": 2545} {"train_loss": -6.53358268737793, "global_step": 106918, "epoch": 2545} {"train_loss": -6.491159915924072, "global_step": 106919, "epoch": 2545} {"train_loss": -6.399155139923096, "global_step": 106920, "epoch": 2545} {"train_loss": -6.5204362869262695, "global_step": 106921, "epoch": 2545} {"train_loss": -6.428049564361572, "global_step": 106922, "epoch": 2545} {"train_loss": -6.45711612701416, "global_step": 106923, "epoch": 2545} {"train_loss": -6.463996887207031, "global_step": 106924, "epoch": 2545} {"train_loss": -6.4486846923828125, "global_step": 106925, "epoch": 2545} {"train_loss": -6.435577392578125, "global_step": 106926, "epoch": 2545} {"train_loss": -6.49212121963501, "global_step": 106927, "epoch": 2545} {"train_loss": -6.428886413574219, "global_step": 106928, "epoch": 2545} {"train_loss": -6.480071067810059, "global_step": 106929, "epoch": 2545} {"train_loss": -6.417627811431885, "global_step": 106930, "epoch": 2545} {"train_loss": -6.415614139466059, "global_step": 106931, "epoch": 2545, "val_loss": 67918.2265625} {"train_loss": -6.382205486297607, "global_step": 106932, "epoch": 2546} {"train_loss": -6.362940788269043, "global_step": 106933, "epoch": 2546} {"train_loss": -6.381155014038086, "global_step": 106934, "epoch": 2546} {"train_loss": -6.397793769836426, "global_step": 106935, "epoch": 2546} {"train_loss": -6.391788482666016, "global_step": 106936, "epoch": 2546} {"train_loss": -6.464453220367432, "global_step": 106937, "epoch": 2546} {"train_loss": -6.4627580642700195, "global_step": 106938, "epoch": 2546} {"train_loss": -6.35509729385376, "global_step": 106939, "epoch": 2546} {"train_loss": -6.337795257568359, "global_step": 106940, "epoch": 2546} {"train_loss": -6.517153263092041, "global_step": 106941, "epoch": 2546} {"train_loss": -6.344461441040039, "global_step": 106942, "epoch": 2546} {"train_loss": -6.343709945678711, "global_step": 106943, "epoch": 2546} {"train_loss": -6.26948881149292, "global_step": 106944, "epoch": 2546} {"train_loss": -6.227298259735107, "global_step": 106945, "epoch": 2546} {"train_loss": -6.420407295227051, "global_step": 106946, "epoch": 2546} {"train_loss": -6.3801116943359375, "global_step": 106947, "epoch": 2546} {"train_loss": -6.448568820953369, "global_step": 106948, "epoch": 2546} {"train_loss": -6.358980178833008, "global_step": 106949, "epoch": 2546} {"train_loss": -6.415985107421875, "global_step": 106950, "epoch": 2546} {"train_loss": -6.438470840454102, "global_step": 106951, "epoch": 2546} {"train_loss": -6.353796005249023, "global_step": 106952, "epoch": 2546} {"train_loss": -6.381540775299072, "global_step": 106953, "epoch": 2546} {"train_loss": -6.391419410705566, "global_step": 106954, "epoch": 2546} {"train_loss": -6.360651969909668, "global_step": 106955, "epoch": 2546} {"train_loss": -6.466381072998047, "global_step": 106956, "epoch": 2546} {"train_loss": -6.3714470863342285, "global_step": 106957, "epoch": 2546} {"train_loss": -6.485776424407959, "global_step": 106958, "epoch": 2546} {"train_loss": -6.387416362762451, "global_step": 106959, "epoch": 2546} {"train_loss": -6.3930158615112305, "global_step": 106960, "epoch": 2546} {"train_loss": -6.499570846557617, "global_step": 106961, "epoch": 2546} {"train_loss": -6.447273254394531, "global_step": 106962, "epoch": 2546} {"train_loss": -6.46921443939209, "global_step": 106963, "epoch": 2546} {"train_loss": -6.321140289306641, "global_step": 106964, "epoch": 2546} {"train_loss": -6.392059803009033, "global_step": 106965, "epoch": 2546} {"train_loss": -6.3758649826049805, "global_step": 106966, "epoch": 2546} {"train_loss": -6.409719467163086, "global_step": 106967, "epoch": 2546} {"train_loss": -6.433102607727051, "global_step": 106968, "epoch": 2546} {"train_loss": -6.318462371826172, "global_step": 106969, "epoch": 2546} {"train_loss": -6.394712448120117, "global_step": 106970, "epoch": 2546} {"train_loss": -6.378515243530273, "global_step": 106971, "epoch": 2546} {"train_loss": -6.44265079498291, "global_step": 106972, "epoch": 2546} {"train_loss": -6.396136499586559, "global_step": 106973, "epoch": 2546, "val_loss": 68114.015625} {"train_loss": -6.355053901672363, "global_step": 106974, "epoch": 2547} {"train_loss": -6.285661220550537, "global_step": 106975, "epoch": 2547} {"train_loss": -6.375674247741699, "global_step": 106976, "epoch": 2547} {"train_loss": -6.378118991851807, "global_step": 106977, "epoch": 2547} {"train_loss": -6.317466735839844, "global_step": 106978, "epoch": 2547} {"train_loss": -6.401846885681152, "global_step": 106979, "epoch": 2547} {"train_loss": -6.230280876159668, "global_step": 106980, "epoch": 2547} {"train_loss": -6.418846607208252, "global_step": 106981, "epoch": 2547} {"train_loss": -6.347265720367432, "global_step": 106982, "epoch": 2547} {"train_loss": -6.407840251922607, "global_step": 106983, "epoch": 2547} {"train_loss": -6.333661079406738, "global_step": 106984, "epoch": 2547} {"train_loss": -6.357043266296387, "global_step": 106985, "epoch": 2547} {"train_loss": -6.335400581359863, "global_step": 106986, "epoch": 2547} {"train_loss": -6.3166656494140625, "global_step": 106987, "epoch": 2547} {"train_loss": -6.173694610595703, "global_step": 106988, "epoch": 2547} {"train_loss": -6.484762191772461, "global_step": 106989, "epoch": 2547} {"train_loss": -6.346345901489258, "global_step": 106990, "epoch": 2547} {"train_loss": -6.378586292266846, "global_step": 106991, "epoch": 2547} {"train_loss": -6.359841823577881, "global_step": 106992, "epoch": 2547} {"train_loss": -6.382501602172852, "global_step": 106993, "epoch": 2547} {"train_loss": -6.452342987060547, "global_step": 106994, "epoch": 2547} {"train_loss": -6.443264484405518, "global_step": 106995, "epoch": 2547} {"train_loss": -6.446981430053711, "global_step": 106996, "epoch": 2547} {"train_loss": -6.385627269744873, "global_step": 106997, "epoch": 2547} {"train_loss": -6.459585189819336, "global_step": 106998, "epoch": 2547} {"train_loss": -6.467479705810547, "global_step": 106999, "epoch": 2547} {"train_loss": -6.424078941345215, "global_step": 107000, "epoch": 2547} {"train_loss": -6.26954460144043, "global_step": 107001, "epoch": 2547} {"train_loss": -6.478072643280029, "global_step": 107002, "epoch": 2547} {"train_loss": -6.411768436431885, "global_step": 107003, "epoch": 2547} {"train_loss": -6.434370040893555, "global_step": 107004, "epoch": 2547} {"train_loss": -6.474332332611084, "global_step": 107005, "epoch": 2547} {"train_loss": -6.389822006225586, "global_step": 107006, "epoch": 2547} {"train_loss": -6.308572769165039, "global_step": 107007, "epoch": 2547} {"train_loss": -6.315506935119629, "global_step": 107008, "epoch": 2547} {"train_loss": -6.335182189941406, "global_step": 107009, "epoch": 2547} {"train_loss": -6.360595226287842, "global_step": 107010, "epoch": 2547} {"train_loss": -6.363304138183594, "global_step": 107011, "epoch": 2547} {"train_loss": -6.321986198425293, "global_step": 107012, "epoch": 2547} {"train_loss": -6.455972671508789, "global_step": 107013, "epoch": 2547} {"train_loss": -6.36068058013916, "global_step": 107014, "epoch": 2547} {"train_loss": -6.375614245732625, "global_step": 107015, "epoch": 2547, "val_loss": 68028.625} {"train_loss": -6.4756927490234375, "global_step": 107016, "epoch": 2548} {"train_loss": -6.3587846755981445, "global_step": 107017, "epoch": 2548} {"train_loss": -6.411575794219971, "global_step": 107018, "epoch": 2548} {"train_loss": -6.343353271484375, "global_step": 107019, "epoch": 2548} {"train_loss": -6.346602916717529, "global_step": 107020, "epoch": 2548} {"train_loss": -6.331809997558594, "global_step": 107021, "epoch": 2548} {"train_loss": -6.350104331970215, "global_step": 107022, "epoch": 2548} {"train_loss": -6.2846784591674805, "global_step": 107023, "epoch": 2548} {"train_loss": -6.3863019943237305, "global_step": 107024, "epoch": 2548} {"train_loss": -6.386502265930176, "global_step": 107025, "epoch": 2548} {"train_loss": -6.4704484939575195, "global_step": 107026, "epoch": 2548} {"train_loss": -6.459445476531982, "global_step": 107027, "epoch": 2548} {"train_loss": -6.376194477081299, "global_step": 107028, "epoch": 2548} {"train_loss": -6.306490421295166, "global_step": 107029, "epoch": 2548} {"train_loss": -6.417335510253906, "global_step": 107030, "epoch": 2548} {"train_loss": -6.3282060623168945, "global_step": 107031, "epoch": 2548} {"train_loss": -6.469771385192871, "global_step": 107032, "epoch": 2548} {"train_loss": -6.378659248352051, "global_step": 107033, "epoch": 2548} {"train_loss": -6.3246612548828125, "global_step": 107034, "epoch": 2548} {"train_loss": -6.424472332000732, "global_step": 107035, "epoch": 2548} {"train_loss": -6.336945533752441, "global_step": 107036, "epoch": 2548} {"train_loss": -6.45945930480957, "global_step": 107037, "epoch": 2548} {"train_loss": -6.360436916351318, "global_step": 107038, "epoch": 2548} {"train_loss": -6.393914222717285, "global_step": 107039, "epoch": 2548} {"train_loss": -6.471357345581055, "global_step": 107040, "epoch": 2548} {"train_loss": -6.333437442779541, "global_step": 107041, "epoch": 2548} {"train_loss": -6.425930023193359, "global_step": 107042, "epoch": 2548} {"train_loss": -6.381509780883789, "global_step": 107043, "epoch": 2548} {"train_loss": -6.479992389678955, "global_step": 107044, "epoch": 2548} {"train_loss": -6.420901298522949, "global_step": 107045, "epoch": 2548} {"train_loss": -6.470691680908203, "global_step": 107046, "epoch": 2548} {"train_loss": -6.398300647735596, "global_step": 107047, "epoch": 2548} {"train_loss": -6.402068138122559, "global_step": 107048, "epoch": 2548} {"train_loss": -6.377953052520752, "global_step": 107049, "epoch": 2548} {"train_loss": -6.462068557739258, "global_step": 107050, "epoch": 2548} {"train_loss": -6.437618732452393, "global_step": 107051, "epoch": 2548} {"train_loss": -6.443019866943359, "global_step": 107052, "epoch": 2548} {"train_loss": -6.439704895019531, "global_step": 107053, "epoch": 2548} {"train_loss": -6.238976001739502, "global_step": 107054, "epoch": 2548} {"train_loss": -6.223546028137207, "global_step": 107055, "epoch": 2548} {"train_loss": -6.479162216186523, "global_step": 107056, "epoch": 2548} {"train_loss": -6.3917003359113425, "global_step": 107057, "epoch": 2548, "val_loss": 67807.1484375} {"train_loss": -6.328038692474365, "global_step": 107058, "epoch": 2549} {"train_loss": -6.5505218505859375, "global_step": 107059, "epoch": 2549} {"train_loss": -6.277202606201172, "global_step": 107060, "epoch": 2549} {"train_loss": -6.3929924964904785, "global_step": 107061, "epoch": 2549} {"train_loss": -6.440267562866211, "global_step": 107062, "epoch": 2549} {"train_loss": -6.384161949157715, "global_step": 107063, "epoch": 2549} {"train_loss": -6.458835601806641, "global_step": 107064, "epoch": 2549} {"train_loss": -6.355751991271973, "global_step": 107065, "epoch": 2549} {"train_loss": -6.410004615783691, "global_step": 107066, "epoch": 2549} {"train_loss": -6.280621528625488, "global_step": 107067, "epoch": 2549} {"train_loss": -6.343721389770508, "global_step": 107068, "epoch": 2549} {"train_loss": -6.388521194458008, "global_step": 107069, "epoch": 2549} {"train_loss": -6.335951328277588, "global_step": 107070, "epoch": 2549} {"train_loss": -6.419340133666992, "global_step": 107071, "epoch": 2549} {"train_loss": -6.378391265869141, "global_step": 107072, "epoch": 2549} {"train_loss": -6.388078689575195, "global_step": 107073, "epoch": 2549} {"train_loss": -6.517648696899414, "global_step": 107074, "epoch": 2549} {"train_loss": -6.57913064956665, "global_step": 107075, "epoch": 2549} {"train_loss": -6.4223527908325195, "global_step": 107076, "epoch": 2549} {"train_loss": -6.436118125915527, "global_step": 107077, "epoch": 2549} {"train_loss": -6.386028289794922, "global_step": 107078, "epoch": 2549} {"train_loss": -6.418052673339844, "global_step": 107079, "epoch": 2549} {"train_loss": -6.346611976623535, "global_step": 107080, "epoch": 2549} {"train_loss": -6.4363250732421875, "global_step": 107081, "epoch": 2549} {"train_loss": -6.37302303314209, "global_step": 107082, "epoch": 2549} {"train_loss": -6.382296562194824, "global_step": 107083, "epoch": 2549} {"train_loss": -6.34796142578125, "global_step": 107084, "epoch": 2549} {"train_loss": -6.444392681121826, "global_step": 107085, "epoch": 2549} {"train_loss": -6.490388870239258, "global_step": 107086, "epoch": 2549} {"train_loss": -6.432185649871826, "global_step": 107087, "epoch": 2549} {"train_loss": -6.409891605377197, "global_step": 107088, "epoch": 2549} {"train_loss": -6.535643577575684, "global_step": 107089, "epoch": 2549} {"train_loss": -6.412419319152832, "global_step": 107090, "epoch": 2549} {"train_loss": -6.503355979919434, "global_step": 107091, "epoch": 2549} {"train_loss": -6.523818016052246, "global_step": 107092, "epoch": 2549} {"train_loss": -6.499239921569824, "global_step": 107093, "epoch": 2549} {"train_loss": -6.43903923034668, "global_step": 107094, "epoch": 2549} {"train_loss": -6.429247856140137, "global_step": 107095, "epoch": 2549} {"train_loss": -6.59783935546875, "global_step": 107096, "epoch": 2549} {"train_loss": -6.486370086669922, "global_step": 107097, "epoch": 2549} {"train_loss": -6.4437150955200195, "global_step": 107098, "epoch": 2549} {"train_loss": -6.4284086000351675, "global_step": 107099, "epoch": 2549, "val_loss": 67736.2421875} {"train_loss": -6.431339263916016, "global_step": 107100, "epoch": 2550} {"train_loss": -6.408400058746338, "global_step": 107101, "epoch": 2550} {"train_loss": -6.552922248840332, "global_step": 107102, "epoch": 2550} {"train_loss": -6.366705894470215, "global_step": 107103, "epoch": 2550} {"train_loss": -6.6088714599609375, "global_step": 107104, "epoch": 2550} {"train_loss": -6.355046272277832, "global_step": 107105, "epoch": 2550} {"train_loss": -6.51232385635376, "global_step": 107106, "epoch": 2550} {"train_loss": -6.409712314605713, "global_step": 107107, "epoch": 2550} {"train_loss": -6.334121227264404, "global_step": 107108, "epoch": 2550} {"train_loss": -6.400196075439453, "global_step": 107109, "epoch": 2550} {"train_loss": -6.355932712554932, "global_step": 107110, "epoch": 2550} {"train_loss": -6.339169979095459, "global_step": 107111, "epoch": 2550} {"train_loss": -6.383271217346191, "global_step": 107112, "epoch": 2550} {"train_loss": -6.400756359100342, "global_step": 107113, "epoch": 2550} {"train_loss": -6.308034896850586, "global_step": 107114, "epoch": 2550} {"train_loss": -6.365818023681641, "global_step": 107115, "epoch": 2550} {"train_loss": -6.482688903808594, "global_step": 107116, "epoch": 2550} {"train_loss": -6.3395843505859375, "global_step": 107117, "epoch": 2550} {"train_loss": -6.417839050292969, "global_step": 107118, "epoch": 2550} {"train_loss": -6.261725902557373, "global_step": 107119, "epoch": 2550} {"train_loss": -6.372405052185059, "global_step": 107120, "epoch": 2550} {"train_loss": -6.561239719390869, "global_step": 107121, "epoch": 2550} {"train_loss": -6.350523948669434, "global_step": 107122, "epoch": 2550} {"train_loss": -6.420392036437988, "global_step": 107123, "epoch": 2550} {"train_loss": -6.429452419281006, "global_step": 107124, "epoch": 2550} {"train_loss": -6.241886138916016, "global_step": 107125, "epoch": 2550} {"train_loss": -6.469785690307617, "global_step": 107126, "epoch": 2550} {"train_loss": -6.283775329589844, "global_step": 107127, "epoch": 2550} {"train_loss": -6.392488479614258, "global_step": 107128, "epoch": 2550} {"train_loss": -6.412908554077148, "global_step": 107129, "epoch": 2550} {"train_loss": -6.3346662521362305, "global_step": 107130, "epoch": 2550} {"train_loss": -6.319314002990723, "global_step": 107131, "epoch": 2550} {"train_loss": -6.415642738342285, "global_step": 107132, "epoch": 2550} {"train_loss": -6.411374092102051, "global_step": 107133, "epoch": 2550} {"train_loss": -6.368321895599365, "global_step": 107134, "epoch": 2550} {"train_loss": -6.3027472496032715, "global_step": 107135, "epoch": 2550} {"train_loss": -6.302311897277832, "global_step": 107136, "epoch": 2550} {"train_loss": -6.359901428222656, "global_step": 107137, "epoch": 2550} {"train_loss": -6.404607772827148, "global_step": 107138, "epoch": 2550} {"train_loss": -6.50799560546875, "global_step": 107139, "epoch": 2550} {"train_loss": -6.384557723999023, "global_step": 107140, "epoch": 2550} {"train_loss": -6.394440719059536, "global_step": 107141, "epoch": 2550, "train/sim_max_reward_0": 0.22484664911162303, "train/sim_max_reward_1": 0.3943573326686702, "train/sim_max_reward_2": 0.23592772084826427, "train/sim_max_reward_3": 0.8585424264829953, "train/sim_max_reward_4": 0.9940437509006339, "train/sim_max_reward_5": 0.9921104989539453, "test/sim_max_reward_4400000": 0.18437469112810687, "test/sim_max_reward_4400001": 0.18600109224934025, "test/sim_max_reward_4400002": 0.9677575064582596, "test/sim_max_reward_4400003": 0.7739357963701755, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9748462857512515, "test/sim_max_reward_4400007": 0.9240584522337912, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.5181488634672685, "test/sim_max_reward_4400010": 0.8648726551036242, "test/sim_max_reward_4400011": 0.1930988228467204, "test/sim_max_reward_4400012": 0.8728446200429014, "test/sim_max_reward_4400013": 0.9284316229450867, "test/sim_max_reward_4400014": 0.877347236134288, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.16118050266656336, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23083579436440715, "test/sim_max_reward_4400019": 0.034784404929879095, "test/sim_max_reward_4400020": 0.00015448269447084474, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9107415372317895, "test/sim_max_reward_4400023": 0.485795408748368, "test/sim_max_reward_4400024": 0.8092991950040074, "test/sim_max_reward_4400025": 0.23898922578522075, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.032087801356658126, "test/sim_max_reward_4400028": 0.5122521156079584, "test/sim_max_reward_4400029": 0.5908055810942948, "test/sim_max_reward_4400030": 0.8269778891842454, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9469931278691858, "test/sim_max_reward_4400034": 0.8501103968489281, "test/sim_max_reward_4400035": 0.6185403486491802, "test/sim_max_reward_4400036": 0.3664073415033818, "test/sim_max_reward_4400037": 0.9161823554875617, "test/sim_max_reward_4400038": 0.7624438501897226, "test/sim_max_reward_4400039": 0.8836891504473644, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.44271904632444326, "test/sim_max_reward_4400042": 0.8960452490968385, "test/sim_max_reward_4400043": 0.9967577763871882, "test/sim_max_reward_4400044": 0.9355134261792184, "test/sim_max_reward_4400045": 0.47803774841862323, "test/sim_max_reward_4400046": 0.968441626194053, "test/sim_max_reward_4400047": 0.9587262892335808, "test/sim_max_reward_4400048": 0.8918158712974062, "test/sim_max_reward_4400049": 0.8582571425178422, "train/mean_score": 0.6166380631610219, "test/mean_score": 0.5528039216114603, "val_loss": 67936.625} {"train_loss": -6.344995021820068, "global_step": 107142, "epoch": 2551} {"train_loss": -6.441568374633789, "global_step": 107143, "epoch": 2551} {"train_loss": -6.361124038696289, "global_step": 107144, "epoch": 2551} {"train_loss": -6.398397445678711, "global_step": 107145, "epoch": 2551} {"train_loss": -6.42142915725708, "global_step": 107146, "epoch": 2551} {"train_loss": -6.389288425445557, "global_step": 107147, "epoch": 2551} {"train_loss": -6.425082206726074, "global_step": 107148, "epoch": 2551} {"train_loss": -6.306303977966309, "global_step": 107149, "epoch": 2551} {"train_loss": -6.420888900756836, "global_step": 107150, "epoch": 2551} {"train_loss": -6.416499137878418, "global_step": 107151, "epoch": 2551} {"train_loss": -6.40977668762207, "global_step": 107152, "epoch": 2551} {"train_loss": -6.510195732116699, "global_step": 107153, "epoch": 2551} {"train_loss": -6.3247480392456055, "global_step": 107154, "epoch": 2551} {"train_loss": -6.424552917480469, "global_step": 107155, "epoch": 2551} {"train_loss": -6.543018341064453, "global_step": 107156, "epoch": 2551} {"train_loss": -6.4398393630981445, "global_step": 107157, "epoch": 2551} {"train_loss": -6.421395301818848, "global_step": 107158, "epoch": 2551} {"train_loss": -6.480820655822754, "global_step": 107159, "epoch": 2551} {"train_loss": -6.489553451538086, "global_step": 107160, "epoch": 2551} {"train_loss": -6.378559112548828, "global_step": 107161, "epoch": 2551} {"train_loss": -6.463054656982422, "global_step": 107162, "epoch": 2551} {"train_loss": -6.387539386749268, "global_step": 107163, "epoch": 2551} {"train_loss": -6.460139751434326, "global_step": 107164, "epoch": 2551} {"train_loss": -6.439970016479492, "global_step": 107165, "epoch": 2551} {"train_loss": -6.414535999298096, "global_step": 107166, "epoch": 2551} {"train_loss": -6.449682712554932, "global_step": 107167, "epoch": 2551} {"train_loss": -6.288517951965332, "global_step": 107168, "epoch": 2551} {"train_loss": -6.484360694885254, "global_step": 107169, "epoch": 2551} {"train_loss": -6.2816972732543945, "global_step": 107170, "epoch": 2551} {"train_loss": -6.360988616943359, "global_step": 107171, "epoch": 2551} {"train_loss": -6.461103439331055, "global_step": 107172, "epoch": 2551} {"train_loss": -6.394632816314697, "global_step": 107173, "epoch": 2551} {"train_loss": -6.320026874542236, "global_step": 107174, "epoch": 2551} {"train_loss": -6.400531768798828, "global_step": 107175, "epoch": 2551} {"train_loss": -6.359087944030762, "global_step": 107176, "epoch": 2551} {"train_loss": -6.414144515991211, "global_step": 107177, "epoch": 2551} {"train_loss": -6.351595401763916, "global_step": 107178, "epoch": 2551} {"train_loss": -6.414420127868652, "global_step": 107179, "epoch": 2551} {"train_loss": -6.473711967468262, "global_step": 107180, "epoch": 2551} {"train_loss": -6.368466854095459, "global_step": 107181, "epoch": 2551} {"train_loss": -6.429521560668945, "global_step": 107182, "epoch": 2551} {"train_loss": -6.406564803350539, "global_step": 107183, "epoch": 2551, "val_loss": 67914.8125} {"train_loss": -6.342150688171387, "global_step": 107184, "epoch": 2552} {"train_loss": -6.518719673156738, "global_step": 107185, "epoch": 2552} {"train_loss": -6.348601818084717, "global_step": 107186, "epoch": 2552} {"train_loss": -6.374436378479004, "global_step": 107187, "epoch": 2552} {"train_loss": -6.415580749511719, "global_step": 107188, "epoch": 2552} {"train_loss": -6.321955680847168, "global_step": 107189, "epoch": 2552} {"train_loss": -6.367929458618164, "global_step": 107190, "epoch": 2552} {"train_loss": -6.404603481292725, "global_step": 107191, "epoch": 2552} {"train_loss": -6.4165449142456055, "global_step": 107192, "epoch": 2552} {"train_loss": -6.369082450866699, "global_step": 107193, "epoch": 2552} {"train_loss": -6.40938663482666, "global_step": 107194, "epoch": 2552} {"train_loss": -6.4476494789123535, "global_step": 107195, "epoch": 2552} {"train_loss": -6.382512092590332, "global_step": 107196, "epoch": 2552} {"train_loss": -6.34972620010376, "global_step": 107197, "epoch": 2552} {"train_loss": -6.467860221862793, "global_step": 107198, "epoch": 2552} {"train_loss": -6.427213668823242, "global_step": 107199, "epoch": 2552} {"train_loss": -6.4404377937316895, "global_step": 107200, "epoch": 2552} {"train_loss": -6.588115692138672, "global_step": 107201, "epoch": 2552} {"train_loss": -6.36760139465332, "global_step": 107202, "epoch": 2552} {"train_loss": -6.449803352355957, "global_step": 107203, "epoch": 2552} {"train_loss": -6.472175598144531, "global_step": 107204, "epoch": 2552} {"train_loss": -6.419916152954102, "global_step": 107205, "epoch": 2552} {"train_loss": -6.405230522155762, "global_step": 107206, "epoch": 2552} {"train_loss": -6.463761806488037, "global_step": 107207, "epoch": 2552} {"train_loss": -6.332691192626953, "global_step": 107208, "epoch": 2552} {"train_loss": -6.439721584320068, "global_step": 107209, "epoch": 2552} {"train_loss": -6.475166320800781, "global_step": 107210, "epoch": 2552} {"train_loss": -6.443909168243408, "global_step": 107211, "epoch": 2552} {"train_loss": -6.355569362640381, "global_step": 107212, "epoch": 2552} {"train_loss": -6.345563888549805, "global_step": 107213, "epoch": 2552} {"train_loss": -6.400467395782471, "global_step": 107214, "epoch": 2552} {"train_loss": -6.425436496734619, "global_step": 107215, "epoch": 2552} {"train_loss": -6.393087387084961, "global_step": 107216, "epoch": 2552} {"train_loss": -6.373024940490723, "global_step": 107217, "epoch": 2552} {"train_loss": -6.32719612121582, "global_step": 107218, "epoch": 2552} {"train_loss": -6.444475173950195, "global_step": 107219, "epoch": 2552} {"train_loss": -6.534261703491211, "global_step": 107220, "epoch": 2552} {"train_loss": -6.39369010925293, "global_step": 107221, "epoch": 2552} {"train_loss": -6.451296329498291, "global_step": 107222, "epoch": 2552} {"train_loss": -6.350057601928711, "global_step": 107223, "epoch": 2552} {"train_loss": -6.381113529205322, "global_step": 107224, "epoch": 2552} {"train_loss": -6.409654322124663, "global_step": 107225, "epoch": 2552, "val_loss": 67833.5390625} {"train_loss": -6.41373348236084, "global_step": 107226, "epoch": 2553} {"train_loss": -6.369271755218506, "global_step": 107227, "epoch": 2553} {"train_loss": -6.373610496520996, "global_step": 107228, "epoch": 2553} {"train_loss": -6.440971851348877, "global_step": 107229, "epoch": 2553} {"train_loss": -6.3933796882629395, "global_step": 107230, "epoch": 2553} {"train_loss": -6.39711856842041, "global_step": 107231, "epoch": 2553} {"train_loss": -6.476527214050293, "global_step": 107232, "epoch": 2553} {"train_loss": -6.341017246246338, "global_step": 107233, "epoch": 2553} {"train_loss": -6.557618141174316, "global_step": 107234, "epoch": 2553} {"train_loss": -6.445575714111328, "global_step": 107235, "epoch": 2553} {"train_loss": -6.383101463317871, "global_step": 107236, "epoch": 2553} {"train_loss": -6.519199371337891, "global_step": 107237, "epoch": 2553} {"train_loss": -6.332652568817139, "global_step": 107238, "epoch": 2553} {"train_loss": -6.41915225982666, "global_step": 107239, "epoch": 2553} {"train_loss": -6.376131057739258, "global_step": 107240, "epoch": 2553} {"train_loss": -6.386757850646973, "global_step": 107241, "epoch": 2553} {"train_loss": -6.31658411026001, "global_step": 107242, "epoch": 2553} {"train_loss": -6.367324352264404, "global_step": 107243, "epoch": 2553} {"train_loss": -6.354840278625488, "global_step": 107244, "epoch": 2553} {"train_loss": -6.251037120819092, "global_step": 107245, "epoch": 2553} {"train_loss": -6.410906791687012, "global_step": 107246, "epoch": 2553} {"train_loss": -6.320420265197754, "global_step": 107247, "epoch": 2553} {"train_loss": -6.290659427642822, "global_step": 107248, "epoch": 2553} {"train_loss": -6.5128068923950195, "global_step": 107249, "epoch": 2553} {"train_loss": -6.372958183288574, "global_step": 107250, "epoch": 2553} {"train_loss": -6.256706237792969, "global_step": 107251, "epoch": 2553} {"train_loss": -6.374598503112793, "global_step": 107252, "epoch": 2553} {"train_loss": -6.414979934692383, "global_step": 107253, "epoch": 2553} {"train_loss": -6.339939594268799, "global_step": 107254, "epoch": 2553} {"train_loss": -6.417787551879883, "global_step": 107255, "epoch": 2553} {"train_loss": -6.417026519775391, "global_step": 107256, "epoch": 2553} {"train_loss": -6.274683475494385, "global_step": 107257, "epoch": 2553} {"train_loss": -6.333646297454834, "global_step": 107258, "epoch": 2553} {"train_loss": -6.408149242401123, "global_step": 107259, "epoch": 2553} {"train_loss": -6.402644157409668, "global_step": 107260, "epoch": 2553} {"train_loss": -6.416486740112305, "global_step": 107261, "epoch": 2553} {"train_loss": -6.365238189697266, "global_step": 107262, "epoch": 2553} {"train_loss": -6.349855899810791, "global_step": 107263, "epoch": 2553} {"train_loss": -6.275952339172363, "global_step": 107264, "epoch": 2553} {"train_loss": -6.294051170349121, "global_step": 107265, "epoch": 2553} {"train_loss": -6.39840030670166, "global_step": 107266, "epoch": 2553} {"train_loss": -6.378622225352696, "global_step": 107267, "epoch": 2553, "val_loss": 68159.6640625} {"train_loss": -6.366024971008301, "global_step": 107268, "epoch": 2554} {"train_loss": -6.386518478393555, "global_step": 107269, "epoch": 2554} {"train_loss": -6.4321184158325195, "global_step": 107270, "epoch": 2554} {"train_loss": -6.320400238037109, "global_step": 107271, "epoch": 2554} {"train_loss": -6.329451560974121, "global_step": 107272, "epoch": 2554} {"train_loss": -6.525169372558594, "global_step": 107273, "epoch": 2554} {"train_loss": -6.484187126159668, "global_step": 107274, "epoch": 2554} {"train_loss": -6.359135150909424, "global_step": 107275, "epoch": 2554} {"train_loss": -6.492489814758301, "global_step": 107276, "epoch": 2554} {"train_loss": -6.494878768920898, "global_step": 107277, "epoch": 2554} {"train_loss": -6.450986862182617, "global_step": 107278, "epoch": 2554} {"train_loss": -6.420429706573486, "global_step": 107279, "epoch": 2554} {"train_loss": -6.364475250244141, "global_step": 107280, "epoch": 2554} {"train_loss": -6.397278785705566, "global_step": 107281, "epoch": 2554} {"train_loss": -6.497971534729004, "global_step": 107282, "epoch": 2554} {"train_loss": -6.430449485778809, "global_step": 107283, "epoch": 2554} {"train_loss": -6.506763458251953, "global_step": 107284, "epoch": 2554} {"train_loss": -6.4594831466674805, "global_step": 107285, "epoch": 2554} {"train_loss": -6.402032852172852, "global_step": 107286, "epoch": 2554} {"train_loss": -6.452913761138916, "global_step": 107287, "epoch": 2554} {"train_loss": -6.321793079376221, "global_step": 107288, "epoch": 2554} {"train_loss": -6.519660472869873, "global_step": 107289, "epoch": 2554} {"train_loss": -6.499045372009277, "global_step": 107290, "epoch": 2554} {"train_loss": -6.416022777557373, "global_step": 107291, "epoch": 2554} {"train_loss": -6.404473304748535, "global_step": 107292, "epoch": 2554} {"train_loss": -6.515158176422119, "global_step": 107293, "epoch": 2554} {"train_loss": -6.398991107940674, "global_step": 107294, "epoch": 2554} {"train_loss": -6.409273624420166, "global_step": 107295, "epoch": 2554} {"train_loss": -6.398709297180176, "global_step": 107296, "epoch": 2554} {"train_loss": -6.388792514801025, "global_step": 107297, "epoch": 2554} {"train_loss": -6.481016635894775, "global_step": 107298, "epoch": 2554} {"train_loss": -6.3682403564453125, "global_step": 107299, "epoch": 2554} {"train_loss": -6.378275394439697, "global_step": 107300, "epoch": 2554} {"train_loss": -6.368512153625488, "global_step": 107301, "epoch": 2554} {"train_loss": -6.454158782958984, "global_step": 107302, "epoch": 2554} {"train_loss": -6.365904808044434, "global_step": 107303, "epoch": 2554} {"train_loss": -6.359942436218262, "global_step": 107304, "epoch": 2554} {"train_loss": -6.454092025756836, "global_step": 107305, "epoch": 2554} {"train_loss": -6.4187517166137695, "global_step": 107306, "epoch": 2554} {"train_loss": -6.445842266082764, "global_step": 107307, "epoch": 2554} {"train_loss": -6.415475845336914, "global_step": 107308, "epoch": 2554} {"train_loss": -6.420480467024303, "global_step": 107309, "epoch": 2554, "val_loss": 67630.9609375} {"train_loss": -6.365490913391113, "global_step": 107310, "epoch": 2555} {"train_loss": -6.461481094360352, "global_step": 107311, "epoch": 2555} {"train_loss": -6.505491256713867, "global_step": 107312, "epoch": 2555} {"train_loss": -6.342057228088379, "global_step": 107313, "epoch": 2555} {"train_loss": -6.496194839477539, "global_step": 107314, "epoch": 2555} {"train_loss": -6.400920867919922, "global_step": 107315, "epoch": 2555} {"train_loss": -6.505338668823242, "global_step": 107316, "epoch": 2555} {"train_loss": -6.333393573760986, "global_step": 107317, "epoch": 2555} {"train_loss": -6.403192520141602, "global_step": 107318, "epoch": 2555} {"train_loss": -6.403934478759766, "global_step": 107319, "epoch": 2555} {"train_loss": -6.3296709060668945, "global_step": 107320, "epoch": 2555} {"train_loss": -6.431344032287598, "global_step": 107321, "epoch": 2555} {"train_loss": -6.539350986480713, "global_step": 107322, "epoch": 2555} {"train_loss": -6.44498872756958, "global_step": 107323, "epoch": 2555} {"train_loss": -6.462376594543457, "global_step": 107324, "epoch": 2555} {"train_loss": -6.313782691955566, "global_step": 107325, "epoch": 2555} {"train_loss": -6.334813117980957, "global_step": 107326, "epoch": 2555} {"train_loss": -6.287259578704834, "global_step": 107327, "epoch": 2555} {"train_loss": -6.41086483001709, "global_step": 107328, "epoch": 2555} {"train_loss": -6.478609085083008, "global_step": 107329, "epoch": 2555} {"train_loss": -6.348528861999512, "global_step": 107330, "epoch": 2555} {"train_loss": -6.537637710571289, "global_step": 107331, "epoch": 2555} {"train_loss": -6.4695281982421875, "global_step": 107332, "epoch": 2555} {"train_loss": -6.341504096984863, "global_step": 107333, "epoch": 2555} {"train_loss": -6.484521865844727, "global_step": 107334, "epoch": 2555} {"train_loss": -6.402843475341797, "global_step": 107335, "epoch": 2555} {"train_loss": -6.407395362854004, "global_step": 107336, "epoch": 2555} {"train_loss": -6.462745189666748, "global_step": 107337, "epoch": 2555} {"train_loss": -6.49995231628418, "global_step": 107338, "epoch": 2555} {"train_loss": -6.446083068847656, "global_step": 107339, "epoch": 2555} {"train_loss": -6.377651214599609, "global_step": 107340, "epoch": 2555} {"train_loss": -6.539151668548584, "global_step": 107341, "epoch": 2555} {"train_loss": -6.439440727233887, "global_step": 107342, "epoch": 2555} {"train_loss": -6.4873881340026855, "global_step": 107343, "epoch": 2555} {"train_loss": -6.587067604064941, "global_step": 107344, "epoch": 2555} {"train_loss": -6.530336380004883, "global_step": 107345, "epoch": 2555} {"train_loss": -6.3454389572143555, "global_step": 107346, "epoch": 2555} {"train_loss": -6.452906608581543, "global_step": 107347, "epoch": 2555} {"train_loss": -6.3592529296875, "global_step": 107348, "epoch": 2555} {"train_loss": -6.283255577087402, "global_step": 107349, "epoch": 2555} {"train_loss": -6.560462951660156, "global_step": 107350, "epoch": 2555} {"train_loss": -6.429228056044805, "global_step": 107351, "epoch": 2555, "val_loss": 68019.65625} {"train_loss": -6.279911518096924, "global_step": 107352, "epoch": 2556} {"train_loss": -6.444777488708496, "global_step": 107353, "epoch": 2556} {"train_loss": -6.443029403686523, "global_step": 107354, "epoch": 2556} {"train_loss": -6.474165439605713, "global_step": 107355, "epoch": 2556} {"train_loss": -6.460554599761963, "global_step": 107356, "epoch": 2556} {"train_loss": -6.547850608825684, "global_step": 107357, "epoch": 2556} {"train_loss": -6.31390905380249, "global_step": 107358, "epoch": 2556} {"train_loss": -6.413111686706543, "global_step": 107359, "epoch": 2556} {"train_loss": -6.406447410583496, "global_step": 107360, "epoch": 2556} {"train_loss": -6.419731616973877, "global_step": 107361, "epoch": 2556} {"train_loss": -6.397180557250977, "global_step": 107362, "epoch": 2556} {"train_loss": -6.485105037689209, "global_step": 107363, "epoch": 2556} {"train_loss": -6.434117317199707, "global_step": 107364, "epoch": 2556} {"train_loss": -6.361024856567383, "global_step": 107365, "epoch": 2556} {"train_loss": -6.407934188842773, "global_step": 107366, "epoch": 2556} {"train_loss": -6.382935523986816, "global_step": 107367, "epoch": 2556} {"train_loss": -6.333735466003418, "global_step": 107368, "epoch": 2556} {"train_loss": -6.4409661293029785, "global_step": 107369, "epoch": 2556} {"train_loss": -6.404548168182373, "global_step": 107370, "epoch": 2556} {"train_loss": -6.302684783935547, "global_step": 107371, "epoch": 2556} {"train_loss": -6.393592834472656, "global_step": 107372, "epoch": 2556} {"train_loss": -6.38453483581543, "global_step": 107373, "epoch": 2556} {"train_loss": -6.418519020080566, "global_step": 107374, "epoch": 2556} {"train_loss": -6.316091537475586, "global_step": 107375, "epoch": 2556} {"train_loss": -6.443165302276611, "global_step": 107376, "epoch": 2556} {"train_loss": -6.418867588043213, "global_step": 107377, "epoch": 2556} {"train_loss": -6.44619083404541, "global_step": 107378, "epoch": 2556} {"train_loss": -6.417666912078857, "global_step": 107379, "epoch": 2556} {"train_loss": -6.273348808288574, "global_step": 107380, "epoch": 2556} {"train_loss": -6.322513103485107, "global_step": 107381, "epoch": 2556} {"train_loss": -6.396113395690918, "global_step": 107382, "epoch": 2556} {"train_loss": -6.352041244506836, "global_step": 107383, "epoch": 2556} {"train_loss": -6.48707914352417, "global_step": 107384, "epoch": 2556} {"train_loss": -6.342854022979736, "global_step": 107385, "epoch": 2556} {"train_loss": -6.307770252227783, "global_step": 107386, "epoch": 2556} {"train_loss": -6.511754512786865, "global_step": 107387, "epoch": 2556} {"train_loss": -6.383953094482422, "global_step": 107388, "epoch": 2556} {"train_loss": -6.3743486404418945, "global_step": 107389, "epoch": 2556} {"train_loss": -6.438404083251953, "global_step": 107390, "epoch": 2556} {"train_loss": -6.409156799316406, "global_step": 107391, "epoch": 2556} {"train_loss": -6.541627883911133, "global_step": 107392, "epoch": 2556} {"train_loss": -6.405194418770926, "global_step": 107393, "epoch": 2556, "val_loss": 68072.0390625} {"train_loss": -6.324771881103516, "global_step": 107394, "epoch": 2557} {"train_loss": -6.474847793579102, "global_step": 107395, "epoch": 2557} {"train_loss": -6.321716785430908, "global_step": 107396, "epoch": 2557} {"train_loss": -6.366482734680176, "global_step": 107397, "epoch": 2557} {"train_loss": -6.370704650878906, "global_step": 107398, "epoch": 2557} {"train_loss": -6.395659446716309, "global_step": 107399, "epoch": 2557} {"train_loss": -6.308206081390381, "global_step": 107400, "epoch": 2557} {"train_loss": -6.361164569854736, "global_step": 107401, "epoch": 2557} {"train_loss": -6.307718276977539, "global_step": 107402, "epoch": 2557} {"train_loss": -6.416006088256836, "global_step": 107403, "epoch": 2557} {"train_loss": -6.399523735046387, "global_step": 107404, "epoch": 2557} {"train_loss": -6.435550689697266, "global_step": 107405, "epoch": 2557} {"train_loss": -6.385969638824463, "global_step": 107406, "epoch": 2557} {"train_loss": -6.539422988891602, "global_step": 107407, "epoch": 2557} {"train_loss": -6.376563549041748, "global_step": 107408, "epoch": 2557} {"train_loss": -6.450371265411377, "global_step": 107409, "epoch": 2557} {"train_loss": -6.451519966125488, "global_step": 107410, "epoch": 2557} {"train_loss": -6.418140888214111, "global_step": 107411, "epoch": 2557} {"train_loss": -6.38040828704834, "global_step": 107412, "epoch": 2557} {"train_loss": -6.404843330383301, "global_step": 107413, "epoch": 2557} {"train_loss": -6.396608352661133, "global_step": 107414, "epoch": 2557} {"train_loss": -6.423455238342285, "global_step": 107415, "epoch": 2557} {"train_loss": -6.325657367706299, "global_step": 107416, "epoch": 2557} {"train_loss": -6.405422687530518, "global_step": 107417, "epoch": 2557} {"train_loss": -6.385822772979736, "global_step": 107418, "epoch": 2557} {"train_loss": -6.427257537841797, "global_step": 107419, "epoch": 2557} {"train_loss": -6.471288681030273, "global_step": 107420, "epoch": 2557} {"train_loss": -6.407798767089844, "global_step": 107421, "epoch": 2557} {"train_loss": -6.353340148925781, "global_step": 107422, "epoch": 2557} {"train_loss": -6.382900238037109, "global_step": 107423, "epoch": 2557} {"train_loss": -6.426762580871582, "global_step": 107424, "epoch": 2557} {"train_loss": -6.390866756439209, "global_step": 107425, "epoch": 2557} {"train_loss": -6.43699836730957, "global_step": 107426, "epoch": 2557} {"train_loss": -6.2945756912231445, "global_step": 107427, "epoch": 2557} {"train_loss": -6.293653964996338, "global_step": 107428, "epoch": 2557} {"train_loss": -6.368313789367676, "global_step": 107429, "epoch": 2557} {"train_loss": -6.337864875793457, "global_step": 107430, "epoch": 2557} {"train_loss": -6.399403095245361, "global_step": 107431, "epoch": 2557} {"train_loss": -6.371346473693848, "global_step": 107432, "epoch": 2557} {"train_loss": -6.344704627990723, "global_step": 107433, "epoch": 2557} {"train_loss": -6.403890609741211, "global_step": 107434, "epoch": 2557} {"train_loss": -6.390551294599261, "global_step": 107435, "epoch": 2557, "val_loss": 67971.6484375} {"train_loss": -6.315770149230957, "global_step": 107436, "epoch": 2558} {"train_loss": -6.49200439453125, "global_step": 107437, "epoch": 2558} {"train_loss": -6.325613975524902, "global_step": 107438, "epoch": 2558} {"train_loss": -6.401633262634277, "global_step": 107439, "epoch": 2558} {"train_loss": -6.436193466186523, "global_step": 107440, "epoch": 2558} {"train_loss": -6.384519577026367, "global_step": 107441, "epoch": 2558} {"train_loss": -6.494521617889404, "global_step": 107442, "epoch": 2558} {"train_loss": -6.472597122192383, "global_step": 107443, "epoch": 2558} {"train_loss": -6.463534355163574, "global_step": 107444, "epoch": 2558} {"train_loss": -6.466405868530273, "global_step": 107445, "epoch": 2558} {"train_loss": -6.387381553649902, "global_step": 107446, "epoch": 2558} {"train_loss": -6.357751846313477, "global_step": 107447, "epoch": 2558} {"train_loss": -6.521195888519287, "global_step": 107448, "epoch": 2558} {"train_loss": -6.469773292541504, "global_step": 107449, "epoch": 2558} {"train_loss": -6.443746566772461, "global_step": 107450, "epoch": 2558} {"train_loss": -6.377937316894531, "global_step": 107451, "epoch": 2558} {"train_loss": -6.398694038391113, "global_step": 107452, "epoch": 2558} {"train_loss": -6.406253814697266, "global_step": 107453, "epoch": 2558} {"train_loss": -6.60664176940918, "global_step": 107454, "epoch": 2558} {"train_loss": -6.353854179382324, "global_step": 107455, "epoch": 2558} {"train_loss": -6.366140365600586, "global_step": 107456, "epoch": 2558} {"train_loss": -6.372689723968506, "global_step": 107457, "epoch": 2558} {"train_loss": -6.6048583984375, "global_step": 107458, "epoch": 2558} {"train_loss": -6.318955421447754, "global_step": 107459, "epoch": 2558} {"train_loss": -6.479592323303223, "global_step": 107460, "epoch": 2558} {"train_loss": -6.450963497161865, "global_step": 107461, "epoch": 2558} {"train_loss": -6.482314109802246, "global_step": 107462, "epoch": 2558} {"train_loss": -6.485219955444336, "global_step": 107463, "epoch": 2558} {"train_loss": -6.341577529907227, "global_step": 107464, "epoch": 2558} {"train_loss": -6.399653434753418, "global_step": 107465, "epoch": 2558} {"train_loss": -6.479301929473877, "global_step": 107466, "epoch": 2558} {"train_loss": -6.412451267242432, "global_step": 107467, "epoch": 2558} {"train_loss": -6.501236915588379, "global_step": 107468, "epoch": 2558} {"train_loss": -6.457186698913574, "global_step": 107469, "epoch": 2558} {"train_loss": -6.437960624694824, "global_step": 107470, "epoch": 2558} {"train_loss": -6.439133644104004, "global_step": 107471, "epoch": 2558} {"train_loss": -6.4687089920043945, "global_step": 107472, "epoch": 2558} {"train_loss": -6.324568748474121, "global_step": 107473, "epoch": 2558} {"train_loss": -6.296999931335449, "global_step": 107474, "epoch": 2558} {"train_loss": -6.482428550720215, "global_step": 107475, "epoch": 2558} {"train_loss": -6.21861457824707, "global_step": 107476, "epoch": 2558} {"train_loss": -6.424743561517625, "global_step": 107477, "epoch": 2558, "val_loss": 68132.2421875} {"train_loss": -6.335426330566406, "global_step": 107478, "epoch": 2559} {"train_loss": -6.317436695098877, "global_step": 107479, "epoch": 2559} {"train_loss": -6.458835601806641, "global_step": 107480, "epoch": 2559} {"train_loss": -6.248935699462891, "global_step": 107481, "epoch": 2559} {"train_loss": -6.263395309448242, "global_step": 107482, "epoch": 2559} {"train_loss": -6.404657363891602, "global_step": 107483, "epoch": 2559} {"train_loss": -6.381761074066162, "global_step": 107484, "epoch": 2559} {"train_loss": -6.310985565185547, "global_step": 107485, "epoch": 2559} {"train_loss": -6.335820198059082, "global_step": 107486, "epoch": 2559} {"train_loss": -6.378491401672363, "global_step": 107487, "epoch": 2559} {"train_loss": -6.308242321014404, "global_step": 107488, "epoch": 2559} {"train_loss": -6.388782501220703, "global_step": 107489, "epoch": 2559} {"train_loss": -6.462889671325684, "global_step": 107490, "epoch": 2559} {"train_loss": -6.339561462402344, "global_step": 107491, "epoch": 2559} {"train_loss": -6.35272216796875, "global_step": 107492, "epoch": 2559} {"train_loss": -6.3546037673950195, "global_step": 107493, "epoch": 2559} {"train_loss": -6.316333770751953, "global_step": 107494, "epoch": 2559} {"train_loss": -6.515137195587158, "global_step": 107495, "epoch": 2559} {"train_loss": -6.418408393859863, "global_step": 107496, "epoch": 2559} {"train_loss": -6.433444023132324, "global_step": 107497, "epoch": 2559} {"train_loss": -6.535163879394531, "global_step": 107498, "epoch": 2559} {"train_loss": -6.426623344421387, "global_step": 107499, "epoch": 2559} {"train_loss": -6.574291706085205, "global_step": 107500, "epoch": 2559} {"train_loss": -6.539714813232422, "global_step": 107501, "epoch": 2559} {"train_loss": -6.39721155166626, "global_step": 107502, "epoch": 2559} {"train_loss": -6.507978439331055, "global_step": 107503, "epoch": 2559} {"train_loss": -6.479101657867432, "global_step": 107504, "epoch": 2559} {"train_loss": -6.369504928588867, "global_step": 107505, "epoch": 2559} {"train_loss": -6.415275573730469, "global_step": 107506, "epoch": 2559} {"train_loss": -6.33078670501709, "global_step": 107507, "epoch": 2559} {"train_loss": -6.487517356872559, "global_step": 107508, "epoch": 2559} {"train_loss": -6.383203506469727, "global_step": 107509, "epoch": 2559} {"train_loss": -6.455913543701172, "global_step": 107510, "epoch": 2559} {"train_loss": -6.393657207489014, "global_step": 107511, "epoch": 2559} {"train_loss": -6.366929531097412, "global_step": 107512, "epoch": 2559} {"train_loss": -6.294190406799316, "global_step": 107513, "epoch": 2559} {"train_loss": -6.335182189941406, "global_step": 107514, "epoch": 2559} {"train_loss": -6.487454891204834, "global_step": 107515, "epoch": 2559} {"train_loss": -6.474563121795654, "global_step": 107516, "epoch": 2559} {"train_loss": -6.387679576873779, "global_step": 107517, "epoch": 2559} {"train_loss": -6.442686557769775, "global_step": 107518, "epoch": 2559} {"train_loss": -6.400502307074411, "global_step": 107519, "epoch": 2559, "val_loss": 68010.0078125} {"train_loss": -6.482911109924316, "global_step": 107520, "epoch": 2560} {"train_loss": -6.4509429931640625, "global_step": 107521, "epoch": 2560} {"train_loss": -6.414425849914551, "global_step": 107522, "epoch": 2560} {"train_loss": -6.349968910217285, "global_step": 107523, "epoch": 2560} {"train_loss": -6.445117473602295, "global_step": 107524, "epoch": 2560} {"train_loss": -6.485332012176514, "global_step": 107525, "epoch": 2560} {"train_loss": -6.353919982910156, "global_step": 107526, "epoch": 2560} {"train_loss": -6.471757888793945, "global_step": 107527, "epoch": 2560} {"train_loss": -6.409849643707275, "global_step": 107528, "epoch": 2560} {"train_loss": -6.471746444702148, "global_step": 107529, "epoch": 2560} {"train_loss": -6.375490188598633, "global_step": 107530, "epoch": 2560} {"train_loss": -6.376067161560059, "global_step": 107531, "epoch": 2560} {"train_loss": -6.482667922973633, "global_step": 107532, "epoch": 2560} {"train_loss": -6.403331756591797, "global_step": 107533, "epoch": 2560} {"train_loss": -6.442799091339111, "global_step": 107534, "epoch": 2560} {"train_loss": -6.570068836212158, "global_step": 107535, "epoch": 2560} {"train_loss": -6.470703125, "global_step": 107536, "epoch": 2560} {"train_loss": -6.428689002990723, "global_step": 107537, "epoch": 2560} {"train_loss": -6.510409355163574, "global_step": 107538, "epoch": 2560} {"train_loss": -6.3817853927612305, "global_step": 107539, "epoch": 2560} {"train_loss": -6.473161697387695, "global_step": 107540, "epoch": 2560} {"train_loss": -6.453808784484863, "global_step": 107541, "epoch": 2560} {"train_loss": -6.42767333984375, "global_step": 107542, "epoch": 2560} {"train_loss": -6.520606994628906, "global_step": 107543, "epoch": 2560} {"train_loss": -6.495754718780518, "global_step": 107544, "epoch": 2560} {"train_loss": -6.498187065124512, "global_step": 107545, "epoch": 2560} {"train_loss": -6.322970390319824, "global_step": 107546, "epoch": 2560} {"train_loss": -6.427702903747559, "global_step": 107547, "epoch": 2560} {"train_loss": -6.408675670623779, "global_step": 107548, "epoch": 2560} {"train_loss": -6.399506568908691, "global_step": 107549, "epoch": 2560} {"train_loss": -6.408200740814209, "global_step": 107550, "epoch": 2560} {"train_loss": -6.449398994445801, "global_step": 107551, "epoch": 2560} {"train_loss": -6.487578392028809, "global_step": 107552, "epoch": 2560} {"train_loss": -6.459257125854492, "global_step": 107553, "epoch": 2560} {"train_loss": -6.456311225891113, "global_step": 107554, "epoch": 2560} {"train_loss": -6.326385974884033, "global_step": 107555, "epoch": 2560} {"train_loss": -6.373485088348389, "global_step": 107556, "epoch": 2560} {"train_loss": -6.387942790985107, "global_step": 107557, "epoch": 2560} {"train_loss": -6.461289405822754, "global_step": 107558, "epoch": 2560} {"train_loss": -6.426884174346924, "global_step": 107559, "epoch": 2560} {"train_loss": -6.497989654541016, "global_step": 107560, "epoch": 2560} {"train_loss": -6.435161477043515, "global_step": 107561, "epoch": 2560, "val_loss": 67692.8828125} {"train_loss": -6.348023414611816, "global_step": 107562, "epoch": 2561} {"train_loss": -6.508297443389893, "global_step": 107563, "epoch": 2561} {"train_loss": -6.355963230133057, "global_step": 107564, "epoch": 2561} {"train_loss": -6.400873184204102, "global_step": 107565, "epoch": 2561} {"train_loss": -6.318111419677734, "global_step": 107566, "epoch": 2561} {"train_loss": -6.479006290435791, "global_step": 107567, "epoch": 2561} {"train_loss": -6.453207969665527, "global_step": 107568, "epoch": 2561} {"train_loss": -6.335643768310547, "global_step": 107569, "epoch": 2561} {"train_loss": -6.479150295257568, "global_step": 107570, "epoch": 2561} {"train_loss": -6.431312561035156, "global_step": 107571, "epoch": 2561} {"train_loss": -6.421720504760742, "global_step": 107572, "epoch": 2561} {"train_loss": -6.355316638946533, "global_step": 107573, "epoch": 2561} {"train_loss": -6.453174591064453, "global_step": 107574, "epoch": 2561} {"train_loss": -6.466336250305176, "global_step": 107575, "epoch": 2561} {"train_loss": -6.384836196899414, "global_step": 107576, "epoch": 2561} {"train_loss": -6.2691802978515625, "global_step": 107577, "epoch": 2561} {"train_loss": -6.343073844909668, "global_step": 107578, "epoch": 2561} {"train_loss": -6.429962158203125, "global_step": 107579, "epoch": 2561} {"train_loss": -6.353913307189941, "global_step": 107580, "epoch": 2561} {"train_loss": -6.4527668952941895, "global_step": 107581, "epoch": 2561} {"train_loss": -6.347906589508057, "global_step": 107582, "epoch": 2561} {"train_loss": -6.503283500671387, "global_step": 107583, "epoch": 2561} {"train_loss": -6.440561294555664, "global_step": 107584, "epoch": 2561} {"train_loss": -6.336666107177734, "global_step": 107585, "epoch": 2561} {"train_loss": -6.324690818786621, "global_step": 107586, "epoch": 2561} {"train_loss": -6.350854396820068, "global_step": 107587, "epoch": 2561} {"train_loss": -6.243068695068359, "global_step": 107588, "epoch": 2561} {"train_loss": -6.362578868865967, "global_step": 107589, "epoch": 2561} {"train_loss": -6.345501899719238, "global_step": 107590, "epoch": 2561} {"train_loss": -6.273263931274414, "global_step": 107591, "epoch": 2561} {"train_loss": -6.394347190856934, "global_step": 107592, "epoch": 2561} {"train_loss": -6.385683059692383, "global_step": 107593, "epoch": 2561} {"train_loss": -6.3177618980407715, "global_step": 107594, "epoch": 2561} {"train_loss": -6.3045759201049805, "global_step": 107595, "epoch": 2561} {"train_loss": -6.342559337615967, "global_step": 107596, "epoch": 2561} {"train_loss": -6.343839168548584, "global_step": 107597, "epoch": 2561} {"train_loss": -6.272984504699707, "global_step": 107598, "epoch": 2561} {"train_loss": -6.361754417419434, "global_step": 107599, "epoch": 2561} {"train_loss": -6.342482566833496, "global_step": 107600, "epoch": 2561} {"train_loss": -6.29005765914917, "global_step": 107601, "epoch": 2561} {"train_loss": -6.29479455947876, "global_step": 107602, "epoch": 2561} {"train_loss": -6.371666522253127, "global_step": 107603, "epoch": 2561, "val_loss": 68035.6953125} {"train_loss": -6.304654121398926, "global_step": 107604, "epoch": 2562} {"train_loss": -6.297717094421387, "global_step": 107605, "epoch": 2562} {"train_loss": -6.335488319396973, "global_step": 107606, "epoch": 2562} {"train_loss": -6.283597946166992, "global_step": 107607, "epoch": 2562} {"train_loss": -6.327169418334961, "global_step": 107608, "epoch": 2562} {"train_loss": -6.367198944091797, "global_step": 107609, "epoch": 2562} {"train_loss": -6.256580352783203, "global_step": 107610, "epoch": 2562} {"train_loss": -6.504581451416016, "global_step": 107611, "epoch": 2562} {"train_loss": -6.319514274597168, "global_step": 107612, "epoch": 2562} {"train_loss": -6.389167785644531, "global_step": 107613, "epoch": 2562} {"train_loss": -6.276285648345947, "global_step": 107614, "epoch": 2562} {"train_loss": -6.391390323638916, "global_step": 107615, "epoch": 2562} {"train_loss": -6.362354755401611, "global_step": 107616, "epoch": 2562} {"train_loss": -6.474601745605469, "global_step": 107617, "epoch": 2562} {"train_loss": -6.21435546875, "global_step": 107618, "epoch": 2562} {"train_loss": -6.433444976806641, "global_step": 107619, "epoch": 2562} {"train_loss": -6.343437671661377, "global_step": 107620, "epoch": 2562} {"train_loss": -6.425823211669922, "global_step": 107621, "epoch": 2562} {"train_loss": -6.351072311401367, "global_step": 107622, "epoch": 2562} {"train_loss": -6.433911323547363, "global_step": 107623, "epoch": 2562} {"train_loss": -6.4116387367248535, "global_step": 107624, "epoch": 2562} {"train_loss": -6.4555816650390625, "global_step": 107625, "epoch": 2562} {"train_loss": -6.413460731506348, "global_step": 107626, "epoch": 2562} {"train_loss": -6.441338539123535, "global_step": 107627, "epoch": 2562} {"train_loss": -6.418354511260986, "global_step": 107628, "epoch": 2562} {"train_loss": -6.427836894989014, "global_step": 107629, "epoch": 2562} {"train_loss": -6.382513523101807, "global_step": 107630, "epoch": 2562} {"train_loss": -6.443205833435059, "global_step": 107631, "epoch": 2562} {"train_loss": -6.3661208152771, "global_step": 107632, "epoch": 2562} {"train_loss": -6.340228080749512, "global_step": 107633, "epoch": 2562} {"train_loss": -6.369821548461914, "global_step": 107634, "epoch": 2562} {"train_loss": -6.4027419090271, "global_step": 107635, "epoch": 2562} {"train_loss": -6.425505638122559, "global_step": 107636, "epoch": 2562} {"train_loss": -6.416335105895996, "global_step": 107637, "epoch": 2562} {"train_loss": -6.404811859130859, "global_step": 107638, "epoch": 2562} {"train_loss": -6.468136787414551, "global_step": 107639, "epoch": 2562} {"train_loss": -6.469973564147949, "global_step": 107640, "epoch": 2562} {"train_loss": -6.384359359741211, "global_step": 107641, "epoch": 2562} {"train_loss": -6.403378486633301, "global_step": 107642, "epoch": 2562} {"train_loss": -6.208532810211182, "global_step": 107643, "epoch": 2562} {"train_loss": -6.532704830169678, "global_step": 107644, "epoch": 2562} {"train_loss": -6.383693468003046, "global_step": 107645, "epoch": 2562, "val_loss": 67831.875} {"train_loss": -6.45285177230835, "global_step": 107646, "epoch": 2563} {"train_loss": -6.506758213043213, "global_step": 107647, "epoch": 2563} {"train_loss": -6.352578163146973, "global_step": 107648, "epoch": 2563} {"train_loss": -6.500322341918945, "global_step": 107649, "epoch": 2563} {"train_loss": -6.413202285766602, "global_step": 107650, "epoch": 2563} {"train_loss": -6.391333103179932, "global_step": 107651, "epoch": 2563} {"train_loss": -6.380918502807617, "global_step": 107652, "epoch": 2563} {"train_loss": -6.4429473876953125, "global_step": 107653, "epoch": 2563} {"train_loss": -6.444757461547852, "global_step": 107654, "epoch": 2563} {"train_loss": -6.431058883666992, "global_step": 107655, "epoch": 2563} {"train_loss": -6.446059226989746, "global_step": 107656, "epoch": 2563} {"train_loss": -6.490669250488281, "global_step": 107657, "epoch": 2563} {"train_loss": -6.255716800689697, "global_step": 107658, "epoch": 2563} {"train_loss": -6.283041000366211, "global_step": 107659, "epoch": 2563} {"train_loss": -6.445255279541016, "global_step": 107660, "epoch": 2563} {"train_loss": -6.342994689941406, "global_step": 107661, "epoch": 2563} {"train_loss": -6.344030857086182, "global_step": 107662, "epoch": 2563} {"train_loss": -6.367774963378906, "global_step": 107663, "epoch": 2563} {"train_loss": -6.413640022277832, "global_step": 107664, "epoch": 2563} {"train_loss": -6.402220726013184, "global_step": 107665, "epoch": 2563} {"train_loss": -6.466035842895508, "global_step": 107666, "epoch": 2563} {"train_loss": -6.40671443939209, "global_step": 107667, "epoch": 2563} {"train_loss": -6.386516094207764, "global_step": 107668, "epoch": 2563} {"train_loss": -6.3679118156433105, "global_step": 107669, "epoch": 2563} {"train_loss": -6.322657585144043, "global_step": 107670, "epoch": 2563} {"train_loss": -6.352380275726318, "global_step": 107671, "epoch": 2563} {"train_loss": -6.414831638336182, "global_step": 107672, "epoch": 2563} {"train_loss": -6.344006061553955, "global_step": 107673, "epoch": 2563} {"train_loss": -6.50825309753418, "global_step": 107674, "epoch": 2563} {"train_loss": -6.364584445953369, "global_step": 107675, "epoch": 2563} {"train_loss": -6.452979564666748, "global_step": 107676, "epoch": 2563} {"train_loss": -6.52984619140625, "global_step": 107677, "epoch": 2563} {"train_loss": -6.438842296600342, "global_step": 107678, "epoch": 2563} {"train_loss": -6.541662216186523, "global_step": 107679, "epoch": 2563} {"train_loss": -6.414829730987549, "global_step": 107680, "epoch": 2563} {"train_loss": -6.341410160064697, "global_step": 107681, "epoch": 2563} {"train_loss": -6.433305740356445, "global_step": 107682, "epoch": 2563} {"train_loss": -6.331846237182617, "global_step": 107683, "epoch": 2563} {"train_loss": -6.364231109619141, "global_step": 107684, "epoch": 2563} {"train_loss": -6.391443252563477, "global_step": 107685, "epoch": 2563} {"train_loss": -6.521367073059082, "global_step": 107686, "epoch": 2563} {"train_loss": -6.410229172025408, "global_step": 107687, "epoch": 2563, "val_loss": 67743.7265625} {"train_loss": -6.462774276733398, "global_step": 107688, "epoch": 2564} {"train_loss": -6.471234321594238, "global_step": 107689, "epoch": 2564} {"train_loss": -6.361472129821777, "global_step": 107690, "epoch": 2564} {"train_loss": -6.584658622741699, "global_step": 107691, "epoch": 2564} {"train_loss": -6.451786994934082, "global_step": 107692, "epoch": 2564} {"train_loss": -6.53864860534668, "global_step": 107693, "epoch": 2564} {"train_loss": -6.512766361236572, "global_step": 107694, "epoch": 2564} {"train_loss": -6.375702381134033, "global_step": 107695, "epoch": 2564} {"train_loss": -6.395256996154785, "global_step": 107696, "epoch": 2564} {"train_loss": -6.425009727478027, "global_step": 107697, "epoch": 2564} {"train_loss": -6.424378395080566, "global_step": 107698, "epoch": 2564} {"train_loss": -6.33841609954834, "global_step": 107699, "epoch": 2564} {"train_loss": -6.525808334350586, "global_step": 107700, "epoch": 2564} {"train_loss": -6.427611351013184, "global_step": 107701, "epoch": 2564} {"train_loss": -6.433306694030762, "global_step": 107702, "epoch": 2564} {"train_loss": -6.474315643310547, "global_step": 107703, "epoch": 2564} {"train_loss": -6.378045082092285, "global_step": 107704, "epoch": 2564} {"train_loss": -6.43399715423584, "global_step": 107705, "epoch": 2564} {"train_loss": -6.343761444091797, "global_step": 107706, "epoch": 2564} {"train_loss": -6.323917865753174, "global_step": 107707, "epoch": 2564} {"train_loss": -6.348320960998535, "global_step": 107708, "epoch": 2564} {"train_loss": -6.419877052307129, "global_step": 107709, "epoch": 2564} {"train_loss": -6.472179412841797, "global_step": 107710, "epoch": 2564} {"train_loss": -6.586646556854248, "global_step": 107711, "epoch": 2564} {"train_loss": -6.337629318237305, "global_step": 107712, "epoch": 2564} {"train_loss": -6.449357986450195, "global_step": 107713, "epoch": 2564} {"train_loss": -6.302849769592285, "global_step": 107714, "epoch": 2564} {"train_loss": -6.435222625732422, "global_step": 107715, "epoch": 2564} {"train_loss": -6.419565200805664, "global_step": 107716, "epoch": 2564} {"train_loss": -6.418597221374512, "global_step": 107717, "epoch": 2564} {"train_loss": -6.423264026641846, "global_step": 107718, "epoch": 2564} {"train_loss": -6.402281284332275, "global_step": 107719, "epoch": 2564} {"train_loss": -6.361948013305664, "global_step": 107720, "epoch": 2564} {"train_loss": -6.420522689819336, "global_step": 107721, "epoch": 2564} {"train_loss": -6.504896640777588, "global_step": 107722, "epoch": 2564} {"train_loss": -6.304478168487549, "global_step": 107723, "epoch": 2564} {"train_loss": -6.431532382965088, "global_step": 107724, "epoch": 2564} {"train_loss": -6.4795637130737305, "global_step": 107725, "epoch": 2564} {"train_loss": -6.308966159820557, "global_step": 107726, "epoch": 2564} {"train_loss": -6.427570819854736, "global_step": 107727, "epoch": 2564} {"train_loss": -6.466732025146484, "global_step": 107728, "epoch": 2564} {"train_loss": -6.4237985497429255, "global_step": 107729, "epoch": 2564, "val_loss": 67902.7890625} {"train_loss": -6.460413932800293, "global_step": 107730, "epoch": 2565} {"train_loss": -6.380647659301758, "global_step": 107731, "epoch": 2565} {"train_loss": -6.413825988769531, "global_step": 107732, "epoch": 2565} {"train_loss": -6.358242511749268, "global_step": 107733, "epoch": 2565} {"train_loss": -6.394492149353027, "global_step": 107734, "epoch": 2565} {"train_loss": -6.453371047973633, "global_step": 107735, "epoch": 2565} {"train_loss": -6.380245685577393, "global_step": 107736, "epoch": 2565} {"train_loss": -6.321966171264648, "global_step": 107737, "epoch": 2565} {"train_loss": -6.381723403930664, "global_step": 107738, "epoch": 2565} {"train_loss": -6.421586036682129, "global_step": 107739, "epoch": 2565} {"train_loss": -6.264540195465088, "global_step": 107740, "epoch": 2565} {"train_loss": -6.312778949737549, "global_step": 107741, "epoch": 2565} {"train_loss": -6.488965034484863, "global_step": 107742, "epoch": 2565} {"train_loss": -6.2621965408325195, "global_step": 107743, "epoch": 2565} {"train_loss": -6.330114364624023, "global_step": 107744, "epoch": 2565} {"train_loss": -6.33151912689209, "global_step": 107745, "epoch": 2565} {"train_loss": -6.459171772003174, "global_step": 107746, "epoch": 2565} {"train_loss": -6.217922210693359, "global_step": 107747, "epoch": 2565} {"train_loss": -6.427535057067871, "global_step": 107748, "epoch": 2565} {"train_loss": -6.394594669342041, "global_step": 107749, "epoch": 2565} {"train_loss": -6.291706085205078, "global_step": 107750, "epoch": 2565} {"train_loss": -6.31827449798584, "global_step": 107751, "epoch": 2565} {"train_loss": -6.304064750671387, "global_step": 107752, "epoch": 2565} {"train_loss": -6.278581619262695, "global_step": 107753, "epoch": 2565} {"train_loss": -6.355222702026367, "global_step": 107754, "epoch": 2565} {"train_loss": -6.33359432220459, "global_step": 107755, "epoch": 2565} {"train_loss": -6.311729431152344, "global_step": 107756, "epoch": 2565} {"train_loss": -6.329345226287842, "global_step": 107757, "epoch": 2565} {"train_loss": -6.366988658905029, "global_step": 107758, "epoch": 2565} {"train_loss": -6.464674949645996, "global_step": 107759, "epoch": 2565} {"train_loss": -6.473081111907959, "global_step": 107760, "epoch": 2565} {"train_loss": -6.366123676300049, "global_step": 107761, "epoch": 2565} {"train_loss": -6.4308671951293945, "global_step": 107762, "epoch": 2565} {"train_loss": -6.404361724853516, "global_step": 107763, "epoch": 2565} {"train_loss": -6.313982963562012, "global_step": 107764, "epoch": 2565} {"train_loss": -6.340012550354004, "global_step": 107765, "epoch": 2565} {"train_loss": -6.350006580352783, "global_step": 107766, "epoch": 2565} {"train_loss": -6.2891950607299805, "global_step": 107767, "epoch": 2565} {"train_loss": -6.512954235076904, "global_step": 107768, "epoch": 2565} {"train_loss": -6.485672950744629, "global_step": 107769, "epoch": 2565} {"train_loss": -6.37521505355835, "global_step": 107770, "epoch": 2565} {"train_loss": -6.369562012808664, "global_step": 107771, "epoch": 2565, "val_loss": 67801.59375} {"train_loss": -6.393619060516357, "global_step": 107772, "epoch": 2566} {"train_loss": -6.475218296051025, "global_step": 107773, "epoch": 2566} {"train_loss": -6.487784385681152, "global_step": 107774, "epoch": 2566} {"train_loss": -6.399625778198242, "global_step": 107775, "epoch": 2566} {"train_loss": -6.433834075927734, "global_step": 107776, "epoch": 2566} {"train_loss": -6.518575191497803, "global_step": 107777, "epoch": 2566} {"train_loss": -6.291666030883789, "global_step": 107778, "epoch": 2566} {"train_loss": -6.432545185089111, "global_step": 107779, "epoch": 2566} {"train_loss": -6.306872367858887, "global_step": 107780, "epoch": 2566} {"train_loss": -6.307036399841309, "global_step": 107781, "epoch": 2566} {"train_loss": -6.472820281982422, "global_step": 107782, "epoch": 2566} {"train_loss": -6.3855743408203125, "global_step": 107783, "epoch": 2566} {"train_loss": -6.420432090759277, "global_step": 107784, "epoch": 2566} {"train_loss": -6.3437676429748535, "global_step": 107785, "epoch": 2566} {"train_loss": -6.456673622131348, "global_step": 107786, "epoch": 2566} {"train_loss": -6.424252033233643, "global_step": 107787, "epoch": 2566} {"train_loss": -6.301787376403809, "global_step": 107788, "epoch": 2566} {"train_loss": -6.353315830230713, "global_step": 107789, "epoch": 2566} {"train_loss": -6.32802677154541, "global_step": 107790, "epoch": 2566} {"train_loss": -6.351944923400879, "global_step": 107791, "epoch": 2566} {"train_loss": -6.368266582489014, "global_step": 107792, "epoch": 2566} {"train_loss": -6.4412970542907715, "global_step": 107793, "epoch": 2566} {"train_loss": -6.4571380615234375, "global_step": 107794, "epoch": 2566} {"train_loss": -6.410384654998779, "global_step": 107795, "epoch": 2566} {"train_loss": -6.474931240081787, "global_step": 107796, "epoch": 2566} {"train_loss": -6.334639549255371, "global_step": 107797, "epoch": 2566} {"train_loss": -6.543661117553711, "global_step": 107798, "epoch": 2566} {"train_loss": -6.427776336669922, "global_step": 107799, "epoch": 2566} {"train_loss": -6.4289398193359375, "global_step": 107800, "epoch": 2566} {"train_loss": -6.459223747253418, "global_step": 107801, "epoch": 2566} {"train_loss": -6.360971450805664, "global_step": 107802, "epoch": 2566} {"train_loss": -6.403375148773193, "global_step": 107803, "epoch": 2566} {"train_loss": -6.391385078430176, "global_step": 107804, "epoch": 2566} {"train_loss": -6.397709846496582, "global_step": 107805, "epoch": 2566} {"train_loss": -6.410614967346191, "global_step": 107806, "epoch": 2566} {"train_loss": -6.383355140686035, "global_step": 107807, "epoch": 2566} {"train_loss": -6.390685558319092, "global_step": 107808, "epoch": 2566} {"train_loss": -6.514287948608398, "global_step": 107809, "epoch": 2566} {"train_loss": -6.414666652679443, "global_step": 107810, "epoch": 2566} {"train_loss": -6.304499626159668, "global_step": 107811, "epoch": 2566} {"train_loss": -6.338606834411621, "global_step": 107812, "epoch": 2566} {"train_loss": -6.401112794876099, "global_step": 107813, "epoch": 2566, "val_loss": 67894.0} {"train_loss": -6.32700252532959, "global_step": 107814, "epoch": 2567} {"train_loss": -6.288637161254883, "global_step": 107815, "epoch": 2567} {"train_loss": -6.337786674499512, "global_step": 107816, "epoch": 2567} {"train_loss": -6.389352321624756, "global_step": 107817, "epoch": 2567} {"train_loss": -6.336138725280762, "global_step": 107818, "epoch": 2567} {"train_loss": -6.4576005935668945, "global_step": 107819, "epoch": 2567} {"train_loss": -6.361503601074219, "global_step": 107820, "epoch": 2567} {"train_loss": -6.359248638153076, "global_step": 107821, "epoch": 2567} {"train_loss": -6.267311096191406, "global_step": 107822, "epoch": 2567} {"train_loss": -6.483052730560303, "global_step": 107823, "epoch": 2567} {"train_loss": -6.387940406799316, "global_step": 107824, "epoch": 2567} {"train_loss": -6.488884925842285, "global_step": 107825, "epoch": 2567} {"train_loss": -6.394547462463379, "global_step": 107826, "epoch": 2567} {"train_loss": -6.410305976867676, "global_step": 107827, "epoch": 2567} {"train_loss": -6.394187927246094, "global_step": 107828, "epoch": 2567} {"train_loss": -6.5662384033203125, "global_step": 107829, "epoch": 2567} {"train_loss": -6.415036201477051, "global_step": 107830, "epoch": 2567} {"train_loss": -6.530938148498535, "global_step": 107831, "epoch": 2567} {"train_loss": -6.373152732849121, "global_step": 107832, "epoch": 2567} {"train_loss": -6.4587297439575195, "global_step": 107833, "epoch": 2567} {"train_loss": -6.417637348175049, "global_step": 107834, "epoch": 2567} {"train_loss": -6.471393585205078, "global_step": 107835, "epoch": 2567} {"train_loss": -6.367949962615967, "global_step": 107836, "epoch": 2567} {"train_loss": -6.440377235412598, "global_step": 107837, "epoch": 2567} {"train_loss": -6.364952087402344, "global_step": 107838, "epoch": 2567} {"train_loss": -6.460922718048096, "global_step": 107839, "epoch": 2567} {"train_loss": -6.484962463378906, "global_step": 107840, "epoch": 2567} {"train_loss": -6.463470458984375, "global_step": 107841, "epoch": 2567} {"train_loss": -6.409173011779785, "global_step": 107842, "epoch": 2567} {"train_loss": -6.344797611236572, "global_step": 107843, "epoch": 2567} {"train_loss": -6.346550941467285, "global_step": 107844, "epoch": 2567} {"train_loss": -6.306779861450195, "global_step": 107845, "epoch": 2567} {"train_loss": -6.2046217918396, "global_step": 107846, "epoch": 2567} {"train_loss": -6.455680847167969, "global_step": 107847, "epoch": 2567} {"train_loss": -6.351315498352051, "global_step": 107848, "epoch": 2567} {"train_loss": -6.284916877746582, "global_step": 107849, "epoch": 2567} {"train_loss": -6.2943010330200195, "global_step": 107850, "epoch": 2567} {"train_loss": -6.39260196685791, "global_step": 107851, "epoch": 2567} {"train_loss": -6.43101167678833, "global_step": 107852, "epoch": 2567} {"train_loss": -6.284944534301758, "global_step": 107853, "epoch": 2567} {"train_loss": -6.345357894897461, "global_step": 107854, "epoch": 2567} {"train_loss": -6.386976469130743, "global_step": 107855, "epoch": 2567, "val_loss": 67861.109375} {"train_loss": -6.423436164855957, "global_step": 107856, "epoch": 2568} {"train_loss": -6.411488056182861, "global_step": 107857, "epoch": 2568} {"train_loss": -6.359633445739746, "global_step": 107858, "epoch": 2568} {"train_loss": -6.463847637176514, "global_step": 107859, "epoch": 2568} {"train_loss": -6.427915573120117, "global_step": 107860, "epoch": 2568} {"train_loss": -6.2751970291137695, "global_step": 107861, "epoch": 2568} {"train_loss": -6.28955078125, "global_step": 107862, "epoch": 2568} {"train_loss": -6.457109451293945, "global_step": 107863, "epoch": 2568} {"train_loss": -6.421485424041748, "global_step": 107864, "epoch": 2568} {"train_loss": -6.296088218688965, "global_step": 107865, "epoch": 2568} {"train_loss": -6.443265438079834, "global_step": 107866, "epoch": 2568} {"train_loss": -6.335747241973877, "global_step": 107867, "epoch": 2568} {"train_loss": -6.410940647125244, "global_step": 107868, "epoch": 2568} {"train_loss": -6.478198051452637, "global_step": 107869, "epoch": 2568} {"train_loss": -6.444084167480469, "global_step": 107870, "epoch": 2568} {"train_loss": -6.4768218994140625, "global_step": 107871, "epoch": 2568} {"train_loss": -6.426401138305664, "global_step": 107872, "epoch": 2568} {"train_loss": -6.515597820281982, "global_step": 107873, "epoch": 2568} {"train_loss": -6.515180587768555, "global_step": 107874, "epoch": 2568} {"train_loss": -6.385097026824951, "global_step": 107875, "epoch": 2568} {"train_loss": -6.396864891052246, "global_step": 107876, "epoch": 2568} {"train_loss": -6.5073676109313965, "global_step": 107877, "epoch": 2568} {"train_loss": -6.450926780700684, "global_step": 107878, "epoch": 2568} {"train_loss": -6.269473075866699, "global_step": 107879, "epoch": 2568} {"train_loss": -6.33274507522583, "global_step": 107880, "epoch": 2568} {"train_loss": -6.478950500488281, "global_step": 107881, "epoch": 2568} {"train_loss": -6.3302106857299805, "global_step": 107882, "epoch": 2568} {"train_loss": -6.301942825317383, "global_step": 107883, "epoch": 2568} {"train_loss": -6.464730262756348, "global_step": 107884, "epoch": 2568} {"train_loss": -6.451407432556152, "global_step": 107885, "epoch": 2568} {"train_loss": -6.438534736633301, "global_step": 107886, "epoch": 2568} {"train_loss": -6.408184051513672, "global_step": 107887, "epoch": 2568} {"train_loss": -6.518103122711182, "global_step": 107888, "epoch": 2568} {"train_loss": -6.347015857696533, "global_step": 107889, "epoch": 2568} {"train_loss": -6.403838634490967, "global_step": 107890, "epoch": 2568} {"train_loss": -6.368251800537109, "global_step": 107891, "epoch": 2568} {"train_loss": -6.2702131271362305, "global_step": 107892, "epoch": 2568} {"train_loss": -6.426442623138428, "global_step": 107893, "epoch": 2568} {"train_loss": -6.457510948181152, "global_step": 107894, "epoch": 2568} {"train_loss": -6.399674415588379, "global_step": 107895, "epoch": 2568} {"train_loss": -6.443795204162598, "global_step": 107896, "epoch": 2568} {"train_loss": -6.406547387440999, "global_step": 107897, "epoch": 2568, "val_loss": 67743.7578125} {"train_loss": -6.408605098724365, "global_step": 107898, "epoch": 2569} {"train_loss": -6.443686485290527, "global_step": 107899, "epoch": 2569} {"train_loss": -6.538422107696533, "global_step": 107900, "epoch": 2569} {"train_loss": -6.528841018676758, "global_step": 107901, "epoch": 2569} {"train_loss": -6.376442909240723, "global_step": 107902, "epoch": 2569} {"train_loss": -6.4002275466918945, "global_step": 107903, "epoch": 2569} {"train_loss": -6.357532501220703, "global_step": 107904, "epoch": 2569} {"train_loss": -6.411351680755615, "global_step": 107905, "epoch": 2569} {"train_loss": -6.410639762878418, "global_step": 107906, "epoch": 2569} {"train_loss": -6.421131134033203, "global_step": 107907, "epoch": 2569} {"train_loss": -6.433248519897461, "global_step": 107908, "epoch": 2569} {"train_loss": -6.456562042236328, "global_step": 107909, "epoch": 2569} {"train_loss": -6.446104526519775, "global_step": 107910, "epoch": 2569} {"train_loss": -6.382472991943359, "global_step": 107911, "epoch": 2569} {"train_loss": -6.5051188468933105, "global_step": 107912, "epoch": 2569} {"train_loss": -6.423619270324707, "global_step": 107913, "epoch": 2569} {"train_loss": -6.423683166503906, "global_step": 107914, "epoch": 2569} {"train_loss": -6.318563461303711, "global_step": 107915, "epoch": 2569} {"train_loss": -6.358026027679443, "global_step": 107916, "epoch": 2569} {"train_loss": -6.425727367401123, "global_step": 107917, "epoch": 2569} {"train_loss": -6.351052284240723, "global_step": 107918, "epoch": 2569} {"train_loss": -6.399080276489258, "global_step": 107919, "epoch": 2569} {"train_loss": -6.426976203918457, "global_step": 107920, "epoch": 2569} {"train_loss": -6.368670463562012, "global_step": 107921, "epoch": 2569} {"train_loss": -6.48762845993042, "global_step": 107922, "epoch": 2569} {"train_loss": -6.406084060668945, "global_step": 107923, "epoch": 2569} {"train_loss": -6.4317169189453125, "global_step": 107924, "epoch": 2569} {"train_loss": -6.299696922302246, "global_step": 107925, "epoch": 2569} {"train_loss": -6.430648326873779, "global_step": 107926, "epoch": 2569} {"train_loss": -6.261236190795898, "global_step": 107927, "epoch": 2569} {"train_loss": -6.4511942863464355, "global_step": 107928, "epoch": 2569} {"train_loss": -6.441702365875244, "global_step": 107929, "epoch": 2569} {"train_loss": -6.44548225402832, "global_step": 107930, "epoch": 2569} {"train_loss": -6.479100227355957, "global_step": 107931, "epoch": 2569} {"train_loss": -6.45849609375, "global_step": 107932, "epoch": 2569} {"train_loss": -6.4431586265563965, "global_step": 107933, "epoch": 2569} {"train_loss": -6.493253707885742, "global_step": 107934, "epoch": 2569} {"train_loss": -6.424796104431152, "global_step": 107935, "epoch": 2569} {"train_loss": -6.491468906402588, "global_step": 107936, "epoch": 2569} {"train_loss": -6.492049217224121, "global_step": 107937, "epoch": 2569} {"train_loss": -6.411670684814453, "global_step": 107938, "epoch": 2569} {"train_loss": -6.423821789877755, "global_step": 107939, "epoch": 2569, "val_loss": 67699.7421875} {"train_loss": -6.468898773193359, "global_step": 107940, "epoch": 2570} {"train_loss": -6.467493057250977, "global_step": 107941, "epoch": 2570} {"train_loss": -6.446539402008057, "global_step": 107942, "epoch": 2570} {"train_loss": -6.481064796447754, "global_step": 107943, "epoch": 2570} {"train_loss": -6.486510753631592, "global_step": 107944, "epoch": 2570} {"train_loss": -6.420719146728516, "global_step": 107945, "epoch": 2570} {"train_loss": -6.53264856338501, "global_step": 107946, "epoch": 2570} {"train_loss": -6.431875705718994, "global_step": 107947, "epoch": 2570} {"train_loss": -6.322676181793213, "global_step": 107948, "epoch": 2570} {"train_loss": -6.424045085906982, "global_step": 107949, "epoch": 2570} {"train_loss": -6.415677547454834, "global_step": 107950, "epoch": 2570} {"train_loss": -6.454651832580566, "global_step": 107951, "epoch": 2570} {"train_loss": -6.446099758148193, "global_step": 107952, "epoch": 2570} {"train_loss": -6.396913528442383, "global_step": 107953, "epoch": 2570} {"train_loss": -6.295657157897949, "global_step": 107954, "epoch": 2570} {"train_loss": -6.426885604858398, "global_step": 107955, "epoch": 2570} {"train_loss": -6.395709991455078, "global_step": 107956, "epoch": 2570} {"train_loss": -6.490146636962891, "global_step": 107957, "epoch": 2570} {"train_loss": -6.461549758911133, "global_step": 107958, "epoch": 2570} {"train_loss": -6.3323974609375, "global_step": 107959, "epoch": 2570} {"train_loss": -6.430248737335205, "global_step": 107960, "epoch": 2570} {"train_loss": -6.426448822021484, "global_step": 107961, "epoch": 2570} {"train_loss": -6.347087860107422, "global_step": 107962, "epoch": 2570} {"train_loss": -6.3730549812316895, "global_step": 107963, "epoch": 2570} {"train_loss": -6.455744743347168, "global_step": 107964, "epoch": 2570} {"train_loss": -6.389253616333008, "global_step": 107965, "epoch": 2570} {"train_loss": -6.563835144042969, "global_step": 107966, "epoch": 2570} {"train_loss": -6.300779819488525, "global_step": 107967, "epoch": 2570} {"train_loss": -6.439321517944336, "global_step": 107968, "epoch": 2570} {"train_loss": -6.445681571960449, "global_step": 107969, "epoch": 2570} {"train_loss": -6.39459228515625, "global_step": 107970, "epoch": 2570} {"train_loss": -6.366300106048584, "global_step": 107971, "epoch": 2570} {"train_loss": -6.436781883239746, "global_step": 107972, "epoch": 2570} {"train_loss": -6.29623556137085, "global_step": 107973, "epoch": 2570} {"train_loss": -6.353461265563965, "global_step": 107974, "epoch": 2570} {"train_loss": -6.313652515411377, "global_step": 107975, "epoch": 2570} {"train_loss": -6.439228057861328, "global_step": 107976, "epoch": 2570} {"train_loss": -6.293368816375732, "global_step": 107977, "epoch": 2570} {"train_loss": -6.352522850036621, "global_step": 107978, "epoch": 2570} {"train_loss": -6.449387073516846, "global_step": 107979, "epoch": 2570} {"train_loss": -6.381748676300049, "global_step": 107980, "epoch": 2570} {"train_loss": -6.411826962516422, "global_step": 107981, "epoch": 2570, "val_loss": 67912.0625} {"train_loss": -6.483419895172119, "global_step": 107982, "epoch": 2571} {"train_loss": -6.419475078582764, "global_step": 107983, "epoch": 2571} {"train_loss": -6.32280158996582, "global_step": 107984, "epoch": 2571} {"train_loss": -6.354613780975342, "global_step": 107985, "epoch": 2571} {"train_loss": -6.436751842498779, "global_step": 107986, "epoch": 2571} {"train_loss": -6.422700881958008, "global_step": 107987, "epoch": 2571} {"train_loss": -6.548654556274414, "global_step": 107988, "epoch": 2571} {"train_loss": -6.498831748962402, "global_step": 107989, "epoch": 2571} {"train_loss": -6.466913223266602, "global_step": 107990, "epoch": 2571} {"train_loss": -6.360376358032227, "global_step": 107991, "epoch": 2571} {"train_loss": -6.444940567016602, "global_step": 107992, "epoch": 2571} {"train_loss": -6.443514347076416, "global_step": 107993, "epoch": 2571} {"train_loss": -6.540035724639893, "global_step": 107994, "epoch": 2571} {"train_loss": -6.458172798156738, "global_step": 107995, "epoch": 2571} {"train_loss": -6.466924667358398, "global_step": 107996, "epoch": 2571} {"train_loss": -6.417850494384766, "global_step": 107997, "epoch": 2571} {"train_loss": -6.47705602645874, "global_step": 107998, "epoch": 2571} {"train_loss": -6.4860310554504395, "global_step": 107999, "epoch": 2571} {"train_loss": -6.481602668762207, "global_step": 108000, "epoch": 2571} {"train_loss": -6.488410472869873, "global_step": 108001, "epoch": 2571} {"train_loss": -6.5824503898620605, "global_step": 108002, "epoch": 2571} {"train_loss": -6.471399307250977, "global_step": 108003, "epoch": 2571} {"train_loss": -6.506231307983398, "global_step": 108004, "epoch": 2571} {"train_loss": -6.3621931076049805, "global_step": 108005, "epoch": 2571} {"train_loss": -6.509445667266846, "global_step": 108006, "epoch": 2571} {"train_loss": -6.497711181640625, "global_step": 108007, "epoch": 2571} {"train_loss": -6.41927433013916, "global_step": 108008, "epoch": 2571} {"train_loss": -6.484464645385742, "global_step": 108009, "epoch": 2571} {"train_loss": -6.439856052398682, "global_step": 108010, "epoch": 2571} {"train_loss": -6.5183515548706055, "global_step": 108011, "epoch": 2571} {"train_loss": -6.379245758056641, "global_step": 108012, "epoch": 2571} {"train_loss": -6.490041732788086, "global_step": 108013, "epoch": 2571} {"train_loss": -6.46366024017334, "global_step": 108014, "epoch": 2571} {"train_loss": -6.416050434112549, "global_step": 108015, "epoch": 2571} {"train_loss": -6.491762161254883, "global_step": 108016, "epoch": 2571} {"train_loss": -6.417158126831055, "global_step": 108017, "epoch": 2571} {"train_loss": -6.47316837310791, "global_step": 108018, "epoch": 2571} {"train_loss": -6.473777770996094, "global_step": 108019, "epoch": 2571} {"train_loss": -6.453376770019531, "global_step": 108020, "epoch": 2571} {"train_loss": -6.486319541931152, "global_step": 108021, "epoch": 2571} {"train_loss": -6.45742130279541, "global_step": 108022, "epoch": 2571} {"train_loss": -6.458748295193627, "global_step": 108023, "epoch": 2571, "val_loss": 67859.9453125} {"train_loss": -6.33125638961792, "global_step": 108024, "epoch": 2572} {"train_loss": -6.3598713874816895, "global_step": 108025, "epoch": 2572} {"train_loss": -6.395359992980957, "global_step": 108026, "epoch": 2572} {"train_loss": -6.298325061798096, "global_step": 108027, "epoch": 2572} {"train_loss": -6.383747100830078, "global_step": 108028, "epoch": 2572} {"train_loss": -6.375875949859619, "global_step": 108029, "epoch": 2572} {"train_loss": -6.3666534423828125, "global_step": 108030, "epoch": 2572} {"train_loss": -6.481067657470703, "global_step": 108031, "epoch": 2572} {"train_loss": -6.384076118469238, "global_step": 108032, "epoch": 2572} {"train_loss": -6.437961101531982, "global_step": 108033, "epoch": 2572} {"train_loss": -6.575840473175049, "global_step": 108034, "epoch": 2572} {"train_loss": -6.411853790283203, "global_step": 108035, "epoch": 2572} {"train_loss": -6.369791030883789, "global_step": 108036, "epoch": 2572} {"train_loss": -6.236984729766846, "global_step": 108037, "epoch": 2572} {"train_loss": -6.406428337097168, "global_step": 108038, "epoch": 2572} {"train_loss": -6.435248374938965, "global_step": 108039, "epoch": 2572} {"train_loss": -6.4068121910095215, "global_step": 108040, "epoch": 2572} {"train_loss": -6.5081329345703125, "global_step": 108041, "epoch": 2572} {"train_loss": -6.346719741821289, "global_step": 108042, "epoch": 2572} {"train_loss": -6.324831962585449, "global_step": 108043, "epoch": 2572} {"train_loss": -6.4581804275512695, "global_step": 108044, "epoch": 2572} {"train_loss": -6.319504261016846, "global_step": 108045, "epoch": 2572} {"train_loss": -6.442234039306641, "global_step": 108046, "epoch": 2572} {"train_loss": -6.44399881362915, "global_step": 108047, "epoch": 2572} {"train_loss": -6.336030960083008, "global_step": 108048, "epoch": 2572} {"train_loss": -6.450940132141113, "global_step": 108049, "epoch": 2572} {"train_loss": -6.422979831695557, "global_step": 108050, "epoch": 2572} {"train_loss": -6.38987398147583, "global_step": 108051, "epoch": 2572} {"train_loss": -6.4263596534729, "global_step": 108052, "epoch": 2572} {"train_loss": -6.315449237823486, "global_step": 108053, "epoch": 2572} {"train_loss": -6.341316223144531, "global_step": 108054, "epoch": 2572} {"train_loss": -6.304516315460205, "global_step": 108055, "epoch": 2572} {"train_loss": -6.417037010192871, "global_step": 108056, "epoch": 2572} {"train_loss": -6.400947093963623, "global_step": 108057, "epoch": 2572} {"train_loss": -6.427030563354492, "global_step": 108058, "epoch": 2572} {"train_loss": -6.38756799697876, "global_step": 108059, "epoch": 2572} {"train_loss": -6.3678131103515625, "global_step": 108060, "epoch": 2572} {"train_loss": -6.412635803222656, "global_step": 108061, "epoch": 2572} {"train_loss": -6.404989242553711, "global_step": 108062, "epoch": 2572} {"train_loss": -6.300141334533691, "global_step": 108063, "epoch": 2572} {"train_loss": -6.555763244628906, "global_step": 108064, "epoch": 2572} {"train_loss": -6.391574484961374, "global_step": 108065, "epoch": 2572, "val_loss": 67887.9375} {"train_loss": -6.37578010559082, "global_step": 108066, "epoch": 2573} {"train_loss": -6.448760032653809, "global_step": 108067, "epoch": 2573} {"train_loss": -6.270684242248535, "global_step": 108068, "epoch": 2573} {"train_loss": -6.315537929534912, "global_step": 108069, "epoch": 2573} {"train_loss": -6.412837982177734, "global_step": 108070, "epoch": 2573} {"train_loss": -6.382453918457031, "global_step": 108071, "epoch": 2573} {"train_loss": -6.303611755371094, "global_step": 108072, "epoch": 2573} {"train_loss": -6.3706231117248535, "global_step": 108073, "epoch": 2573} {"train_loss": -6.344120025634766, "global_step": 108074, "epoch": 2573} {"train_loss": -6.369199752807617, "global_step": 108075, "epoch": 2573} {"train_loss": -6.318324089050293, "global_step": 108076, "epoch": 2573} {"train_loss": -6.340428352355957, "global_step": 108077, "epoch": 2573} {"train_loss": -6.323911666870117, "global_step": 108078, "epoch": 2573} {"train_loss": -6.286355018615723, "global_step": 108079, "epoch": 2573} {"train_loss": -6.519712924957275, "global_step": 108080, "epoch": 2573} {"train_loss": -6.391674518585205, "global_step": 108081, "epoch": 2573} {"train_loss": -6.456516265869141, "global_step": 108082, "epoch": 2573} {"train_loss": -6.352113723754883, "global_step": 108083, "epoch": 2573} {"train_loss": -6.361813068389893, "global_step": 108084, "epoch": 2573} {"train_loss": -6.3907856941223145, "global_step": 108085, "epoch": 2573} {"train_loss": -6.392408847808838, "global_step": 108086, "epoch": 2573} {"train_loss": -6.4993896484375, "global_step": 108087, "epoch": 2573} {"train_loss": -6.405184745788574, "global_step": 108088, "epoch": 2573} {"train_loss": -6.405799388885498, "global_step": 108089, "epoch": 2573} {"train_loss": -6.358278274536133, "global_step": 108090, "epoch": 2573} {"train_loss": -6.377531051635742, "global_step": 108091, "epoch": 2573} {"train_loss": -6.439633369445801, "global_step": 108092, "epoch": 2573} {"train_loss": -6.4419732093811035, "global_step": 108093, "epoch": 2573} {"train_loss": -6.33335018157959, "global_step": 108094, "epoch": 2573} {"train_loss": -6.394761085510254, "global_step": 108095, "epoch": 2573} {"train_loss": -6.435732841491699, "global_step": 108096, "epoch": 2573} {"train_loss": -6.412727355957031, "global_step": 108097, "epoch": 2573} {"train_loss": -6.431721210479736, "global_step": 108098, "epoch": 2573} {"train_loss": -6.38227653503418, "global_step": 108099, "epoch": 2573} {"train_loss": -6.476133346557617, "global_step": 108100, "epoch": 2573} {"train_loss": -6.502985954284668, "global_step": 108101, "epoch": 2573} {"train_loss": -6.390317916870117, "global_step": 108102, "epoch": 2573} {"train_loss": -6.4492597579956055, "global_step": 108103, "epoch": 2573} {"train_loss": -6.428243637084961, "global_step": 108104, "epoch": 2573} {"train_loss": -6.4477314949035645, "global_step": 108105, "epoch": 2573} {"train_loss": -6.430118560791016, "global_step": 108106, "epoch": 2573} {"train_loss": -6.393872329166958, "global_step": 108107, "epoch": 2573, "val_loss": 68055.0390625} {"train_loss": -6.425442218780518, "global_step": 108108, "epoch": 2574} {"train_loss": -6.417690277099609, "global_step": 108109, "epoch": 2574} {"train_loss": -6.337861061096191, "global_step": 108110, "epoch": 2574} {"train_loss": -6.427203178405762, "global_step": 108111, "epoch": 2574} {"train_loss": -6.398289680480957, "global_step": 108112, "epoch": 2574} {"train_loss": -6.525760650634766, "global_step": 108113, "epoch": 2574} {"train_loss": -6.436724662780762, "global_step": 108114, "epoch": 2574} {"train_loss": -6.498517990112305, "global_step": 108115, "epoch": 2574} {"train_loss": -6.412012100219727, "global_step": 108116, "epoch": 2574} {"train_loss": -6.483876705169678, "global_step": 108117, "epoch": 2574} {"train_loss": -6.4336371421813965, "global_step": 108118, "epoch": 2574} {"train_loss": -6.400600433349609, "global_step": 108119, "epoch": 2574} {"train_loss": -6.454297065734863, "global_step": 108120, "epoch": 2574} {"train_loss": -6.4374542236328125, "global_step": 108121, "epoch": 2574} {"train_loss": -6.37177038192749, "global_step": 108122, "epoch": 2574} {"train_loss": -6.489659309387207, "global_step": 108123, "epoch": 2574} {"train_loss": -6.569698810577393, "global_step": 108124, "epoch": 2574} {"train_loss": -6.4825897216796875, "global_step": 108125, "epoch": 2574} {"train_loss": -6.326334476470947, "global_step": 108126, "epoch": 2574} {"train_loss": -6.498398780822754, "global_step": 108127, "epoch": 2574} {"train_loss": -6.398156642913818, "global_step": 108128, "epoch": 2574} {"train_loss": -6.411600112915039, "global_step": 108129, "epoch": 2574} {"train_loss": -6.383517265319824, "global_step": 108130, "epoch": 2574} {"train_loss": -6.564370155334473, "global_step": 108131, "epoch": 2574} {"train_loss": -6.570330619812012, "global_step": 108132, "epoch": 2574} {"train_loss": -6.405935287475586, "global_step": 108133, "epoch": 2574} {"train_loss": -6.379173755645752, "global_step": 108134, "epoch": 2574} {"train_loss": -6.441170692443848, "global_step": 108135, "epoch": 2574} {"train_loss": -6.526364803314209, "global_step": 108136, "epoch": 2574} {"train_loss": -6.362700462341309, "global_step": 108137, "epoch": 2574} {"train_loss": -6.3659138679504395, "global_step": 108138, "epoch": 2574} {"train_loss": -6.315321922302246, "global_step": 108139, "epoch": 2574} {"train_loss": -6.301260948181152, "global_step": 108140, "epoch": 2574} {"train_loss": -6.4062700271606445, "global_step": 108141, "epoch": 2574} {"train_loss": -6.41520881652832, "global_step": 108142, "epoch": 2574} {"train_loss": -6.382761001586914, "global_step": 108143, "epoch": 2574} {"train_loss": -6.469642162322998, "global_step": 108144, "epoch": 2574} {"train_loss": -6.5030927658081055, "global_step": 108145, "epoch": 2574} {"train_loss": -6.3962721824646, "global_step": 108146, "epoch": 2574} {"train_loss": -6.435115337371826, "global_step": 108147, "epoch": 2574} {"train_loss": -6.315090179443359, "global_step": 108148, "epoch": 2574} {"train_loss": -6.4299951394399, "global_step": 108149, "epoch": 2574, "val_loss": 67944.15625} {"train_loss": -6.378251075744629, "global_step": 108150, "epoch": 2575} {"train_loss": -6.534886360168457, "global_step": 108151, "epoch": 2575} {"train_loss": -6.481592178344727, "global_step": 108152, "epoch": 2575} {"train_loss": -6.407785892486572, "global_step": 108153, "epoch": 2575} {"train_loss": -6.378100395202637, "global_step": 108154, "epoch": 2575} {"train_loss": -6.454733848571777, "global_step": 108155, "epoch": 2575} {"train_loss": -6.422459125518799, "global_step": 108156, "epoch": 2575} {"train_loss": -6.354748725891113, "global_step": 108157, "epoch": 2575} {"train_loss": -6.457959175109863, "global_step": 108158, "epoch": 2575} {"train_loss": -6.4626617431640625, "global_step": 108159, "epoch": 2575} {"train_loss": -6.461423873901367, "global_step": 108160, "epoch": 2575} {"train_loss": -6.449687957763672, "global_step": 108161, "epoch": 2575} {"train_loss": -6.501523017883301, "global_step": 108162, "epoch": 2575} {"train_loss": -6.353835105895996, "global_step": 108163, "epoch": 2575} {"train_loss": -6.518490791320801, "global_step": 108164, "epoch": 2575} {"train_loss": -6.432209014892578, "global_step": 108165, "epoch": 2575} {"train_loss": -6.3535566329956055, "global_step": 108166, "epoch": 2575} {"train_loss": -6.5408477783203125, "global_step": 108167, "epoch": 2575} {"train_loss": -6.461559295654297, "global_step": 108168, "epoch": 2575} {"train_loss": -6.349477291107178, "global_step": 108169, "epoch": 2575} {"train_loss": -6.366011619567871, "global_step": 108170, "epoch": 2575} {"train_loss": -6.413383483886719, "global_step": 108171, "epoch": 2575} {"train_loss": -6.391338348388672, "global_step": 108172, "epoch": 2575} {"train_loss": -6.415834426879883, "global_step": 108173, "epoch": 2575} {"train_loss": -6.230821132659912, "global_step": 108174, "epoch": 2575} {"train_loss": -6.423439979553223, "global_step": 108175, "epoch": 2575} {"train_loss": -6.280971050262451, "global_step": 108176, "epoch": 2575} {"train_loss": -6.336295127868652, "global_step": 108177, "epoch": 2575} {"train_loss": -6.388883113861084, "global_step": 108178, "epoch": 2575} {"train_loss": -6.429593086242676, "global_step": 108179, "epoch": 2575} {"train_loss": -6.4654693603515625, "global_step": 108180, "epoch": 2575} {"train_loss": -6.332883834838867, "global_step": 108181, "epoch": 2575} {"train_loss": -6.445740699768066, "global_step": 108182, "epoch": 2575} {"train_loss": -6.427721977233887, "global_step": 108183, "epoch": 2575} {"train_loss": -6.384594440460205, "global_step": 108184, "epoch": 2575} {"train_loss": -6.492519855499268, "global_step": 108185, "epoch": 2575} {"train_loss": -6.303159713745117, "global_step": 108186, "epoch": 2575} {"train_loss": -6.302366256713867, "global_step": 108187, "epoch": 2575} {"train_loss": -6.423281669616699, "global_step": 108188, "epoch": 2575} {"train_loss": -6.362936019897461, "global_step": 108189, "epoch": 2575} {"train_loss": -6.459083557128906, "global_step": 108190, "epoch": 2575} {"train_loss": -6.407680488768078, "global_step": 108191, "epoch": 2575, "val_loss": 67839.90625} {"train_loss": -6.445279121398926, "global_step": 108192, "epoch": 2576} {"train_loss": -6.3557658195495605, "global_step": 108193, "epoch": 2576} {"train_loss": -6.256276607513428, "global_step": 108194, "epoch": 2576} {"train_loss": -6.384533882141113, "global_step": 108195, "epoch": 2576} {"train_loss": -6.43454647064209, "global_step": 108196, "epoch": 2576} {"train_loss": -6.197007179260254, "global_step": 108197, "epoch": 2576} {"train_loss": -6.535953044891357, "global_step": 108198, "epoch": 2576} {"train_loss": -6.377684593200684, "global_step": 108199, "epoch": 2576} {"train_loss": -6.36635684967041, "global_step": 108200, "epoch": 2576} {"train_loss": -6.421597480773926, "global_step": 108201, "epoch": 2576} {"train_loss": -6.379373550415039, "global_step": 108202, "epoch": 2576} {"train_loss": -6.453517436981201, "global_step": 108203, "epoch": 2576} {"train_loss": -6.292852401733398, "global_step": 108204, "epoch": 2576} {"train_loss": -6.445209980010986, "global_step": 108205, "epoch": 2576} {"train_loss": -6.519495964050293, "global_step": 108206, "epoch": 2576} {"train_loss": -6.503252029418945, "global_step": 108207, "epoch": 2576} {"train_loss": -6.388932228088379, "global_step": 108208, "epoch": 2576} {"train_loss": -6.448665142059326, "global_step": 108209, "epoch": 2576} {"train_loss": -6.422203540802002, "global_step": 108210, "epoch": 2576} {"train_loss": -6.442263603210449, "global_step": 108211, "epoch": 2576} {"train_loss": -6.363980293273926, "global_step": 108212, "epoch": 2576} {"train_loss": -6.425060272216797, "global_step": 108213, "epoch": 2576} {"train_loss": -6.523149490356445, "global_step": 108214, "epoch": 2576} {"train_loss": -6.470561981201172, "global_step": 108215, "epoch": 2576} {"train_loss": -6.369598388671875, "global_step": 108216, "epoch": 2576} {"train_loss": -6.366715908050537, "global_step": 108217, "epoch": 2576} {"train_loss": -6.339533805847168, "global_step": 108218, "epoch": 2576} {"train_loss": -6.477721691131592, "global_step": 108219, "epoch": 2576} {"train_loss": -6.5478196144104, "global_step": 108220, "epoch": 2576} {"train_loss": -6.4274749755859375, "global_step": 108221, "epoch": 2576} {"train_loss": -6.4528117179870605, "global_step": 108222, "epoch": 2576} {"train_loss": -6.493335723876953, "global_step": 108223, "epoch": 2576} {"train_loss": -6.421619415283203, "global_step": 108224, "epoch": 2576} {"train_loss": -6.541534423828125, "global_step": 108225, "epoch": 2576} {"train_loss": -6.395182132720947, "global_step": 108226, "epoch": 2576} {"train_loss": -6.427719593048096, "global_step": 108227, "epoch": 2576} {"train_loss": -6.39872407913208, "global_step": 108228, "epoch": 2576} {"train_loss": -6.49205207824707, "global_step": 108229, "epoch": 2576} {"train_loss": -6.433035373687744, "global_step": 108230, "epoch": 2576} {"train_loss": -6.432198524475098, "global_step": 108231, "epoch": 2576} {"train_loss": -6.44482946395874, "global_step": 108232, "epoch": 2576} {"train_loss": -6.420388709931147, "global_step": 108233, "epoch": 2576, "val_loss": 67829.1328125} {"train_loss": -6.385814666748047, "global_step": 108234, "epoch": 2577} {"train_loss": -6.4142961502075195, "global_step": 108235, "epoch": 2577} {"train_loss": -6.454358100891113, "global_step": 108236, "epoch": 2577} {"train_loss": -6.52630615234375, "global_step": 108237, "epoch": 2577} {"train_loss": -6.336970329284668, "global_step": 108238, "epoch": 2577} {"train_loss": -6.417821407318115, "global_step": 108239, "epoch": 2577} {"train_loss": -6.4383111000061035, "global_step": 108240, "epoch": 2577} {"train_loss": -6.432563781738281, "global_step": 108241, "epoch": 2577} {"train_loss": -6.451179027557373, "global_step": 108242, "epoch": 2577} {"train_loss": -6.459170818328857, "global_step": 108243, "epoch": 2577} {"train_loss": -6.4880266189575195, "global_step": 108244, "epoch": 2577} {"train_loss": -6.4551100730896, "global_step": 108245, "epoch": 2577} {"train_loss": -6.496285438537598, "global_step": 108246, "epoch": 2577} {"train_loss": -6.42342472076416, "global_step": 108247, "epoch": 2577} {"train_loss": -6.424827575683594, "global_step": 108248, "epoch": 2577} {"train_loss": -6.475069522857666, "global_step": 108249, "epoch": 2577} {"train_loss": -6.4440107345581055, "global_step": 108250, "epoch": 2577} {"train_loss": -6.488720417022705, "global_step": 108251, "epoch": 2577} {"train_loss": -6.42786979675293, "global_step": 108252, "epoch": 2577} {"train_loss": -6.512510299682617, "global_step": 108253, "epoch": 2577} {"train_loss": -6.382321357727051, "global_step": 108254, "epoch": 2577} {"train_loss": -6.469205856323242, "global_step": 108255, "epoch": 2577} {"train_loss": -6.425535202026367, "global_step": 108256, "epoch": 2577} {"train_loss": -6.444154739379883, "global_step": 108257, "epoch": 2577} {"train_loss": -6.3730621337890625, "global_step": 108258, "epoch": 2577} {"train_loss": -6.491545677185059, "global_step": 108259, "epoch": 2577} {"train_loss": -6.478477954864502, "global_step": 108260, "epoch": 2577} {"train_loss": -6.4734625816345215, "global_step": 108261, "epoch": 2577} {"train_loss": -6.424015998840332, "global_step": 108262, "epoch": 2577} {"train_loss": -6.41921854019165, "global_step": 108263, "epoch": 2577} {"train_loss": -6.44215202331543, "global_step": 108264, "epoch": 2577} {"train_loss": -6.55659818649292, "global_step": 108265, "epoch": 2577} {"train_loss": -6.439207077026367, "global_step": 108266, "epoch": 2577} {"train_loss": -6.401238441467285, "global_step": 108267, "epoch": 2577} {"train_loss": -6.489200592041016, "global_step": 108268, "epoch": 2577} {"train_loss": -6.436077117919922, "global_step": 108269, "epoch": 2577} {"train_loss": -6.448883056640625, "global_step": 108270, "epoch": 2577} {"train_loss": -6.475732803344727, "global_step": 108271, "epoch": 2577} {"train_loss": -6.358038902282715, "global_step": 108272, "epoch": 2577} {"train_loss": -6.485097885131836, "global_step": 108273, "epoch": 2577} {"train_loss": -6.344971179962158, "global_step": 108274, "epoch": 2577} {"train_loss": -6.441817930766514, "global_step": 108275, "epoch": 2577, "val_loss": 67962.8515625} {"train_loss": -6.493823051452637, "global_step": 108276, "epoch": 2578} {"train_loss": -6.401177406311035, "global_step": 108277, "epoch": 2578} {"train_loss": -6.364113807678223, "global_step": 108278, "epoch": 2578} {"train_loss": -6.305036544799805, "global_step": 108279, "epoch": 2578} {"train_loss": -6.512947082519531, "global_step": 108280, "epoch": 2578} {"train_loss": -6.357869625091553, "global_step": 108281, "epoch": 2578} {"train_loss": -6.327415943145752, "global_step": 108282, "epoch": 2578} {"train_loss": -6.468988418579102, "global_step": 108283, "epoch": 2578} {"train_loss": -6.428415298461914, "global_step": 108284, "epoch": 2578} {"train_loss": -6.470854759216309, "global_step": 108285, "epoch": 2578} {"train_loss": -6.326169490814209, "global_step": 108286, "epoch": 2578} {"train_loss": -6.284025192260742, "global_step": 108287, "epoch": 2578} {"train_loss": -6.3143720626831055, "global_step": 108288, "epoch": 2578} {"train_loss": -6.292000770568848, "global_step": 108289, "epoch": 2578} {"train_loss": -6.234663963317871, "global_step": 108290, "epoch": 2578} {"train_loss": -6.374332427978516, "global_step": 108291, "epoch": 2578} {"train_loss": -6.251464366912842, "global_step": 108292, "epoch": 2578} {"train_loss": -6.427238941192627, "global_step": 108293, "epoch": 2578} {"train_loss": -6.415280342102051, "global_step": 108294, "epoch": 2578} {"train_loss": -6.257315635681152, "global_step": 108295, "epoch": 2578} {"train_loss": -6.510710716247559, "global_step": 108296, "epoch": 2578} {"train_loss": -6.326096534729004, "global_step": 108297, "epoch": 2578} {"train_loss": -6.430208206176758, "global_step": 108298, "epoch": 2578} {"train_loss": -6.431966781616211, "global_step": 108299, "epoch": 2578} {"train_loss": -6.378115653991699, "global_step": 108300, "epoch": 2578} {"train_loss": -6.3673505783081055, "global_step": 108301, "epoch": 2578} {"train_loss": -6.444570541381836, "global_step": 108302, "epoch": 2578} {"train_loss": -6.436003684997559, "global_step": 108303, "epoch": 2578} {"train_loss": -6.409656524658203, "global_step": 108304, "epoch": 2578} {"train_loss": -6.390814304351807, "global_step": 108305, "epoch": 2578} {"train_loss": -6.393080711364746, "global_step": 108306, "epoch": 2578} {"train_loss": -6.381199836730957, "global_step": 108307, "epoch": 2578} {"train_loss": -6.350127696990967, "global_step": 108308, "epoch": 2578} {"train_loss": -6.349516868591309, "global_step": 108309, "epoch": 2578} {"train_loss": -6.495667457580566, "global_step": 108310, "epoch": 2578} {"train_loss": -6.43085241317749, "global_step": 108311, "epoch": 2578} {"train_loss": -6.5187249183654785, "global_step": 108312, "epoch": 2578} {"train_loss": -6.406352996826172, "global_step": 108313, "epoch": 2578} {"train_loss": -6.386321067810059, "global_step": 108314, "epoch": 2578} {"train_loss": -6.436425685882568, "global_step": 108315, "epoch": 2578} {"train_loss": -6.51783561706543, "global_step": 108316, "epoch": 2578} {"train_loss": -6.390439408166068, "global_step": 108317, "epoch": 2578, "val_loss": 67992.2890625} {"train_loss": -6.407837390899658, "global_step": 108318, "epoch": 2579} {"train_loss": -6.402108192443848, "global_step": 108319, "epoch": 2579} {"train_loss": -6.479432582855225, "global_step": 108320, "epoch": 2579} {"train_loss": -6.414560317993164, "global_step": 108321, "epoch": 2579} {"train_loss": -6.4272356033325195, "global_step": 108322, "epoch": 2579} {"train_loss": -6.45777702331543, "global_step": 108323, "epoch": 2579} {"train_loss": -6.390009880065918, "global_step": 108324, "epoch": 2579} {"train_loss": -6.466211318969727, "global_step": 108325, "epoch": 2579} {"train_loss": -6.281296730041504, "global_step": 108326, "epoch": 2579} {"train_loss": -6.464418411254883, "global_step": 108327, "epoch": 2579} {"train_loss": -6.417647361755371, "global_step": 108328, "epoch": 2579} {"train_loss": -6.354119777679443, "global_step": 108329, "epoch": 2579} {"train_loss": -6.5129594802856445, "global_step": 108330, "epoch": 2579} {"train_loss": -6.500391483306885, "global_step": 108331, "epoch": 2579} {"train_loss": -6.389303207397461, "global_step": 108332, "epoch": 2579} {"train_loss": -6.49451208114624, "global_step": 108333, "epoch": 2579} {"train_loss": -6.475255966186523, "global_step": 108334, "epoch": 2579} {"train_loss": -6.359528541564941, "global_step": 108335, "epoch": 2579} {"train_loss": -6.443782806396484, "global_step": 108336, "epoch": 2579} {"train_loss": -6.371893405914307, "global_step": 108337, "epoch": 2579} {"train_loss": -6.4395880699157715, "global_step": 108338, "epoch": 2579} {"train_loss": -6.440431118011475, "global_step": 108339, "epoch": 2579} {"train_loss": -6.420793056488037, "global_step": 108340, "epoch": 2579} {"train_loss": -6.398212432861328, "global_step": 108341, "epoch": 2579} {"train_loss": -6.438077449798584, "global_step": 108342, "epoch": 2579} {"train_loss": -6.436270713806152, "global_step": 108343, "epoch": 2579} {"train_loss": -6.338962554931641, "global_step": 108344, "epoch": 2579} {"train_loss": -6.343979835510254, "global_step": 108345, "epoch": 2579} {"train_loss": -6.491564750671387, "global_step": 108346, "epoch": 2579} {"train_loss": -6.448004245758057, "global_step": 108347, "epoch": 2579} {"train_loss": -6.360482215881348, "global_step": 108348, "epoch": 2579} {"train_loss": -6.352344989776611, "global_step": 108349, "epoch": 2579} {"train_loss": -6.450834274291992, "global_step": 108350, "epoch": 2579} {"train_loss": -6.496126651763916, "global_step": 108351, "epoch": 2579} {"train_loss": -6.4052910804748535, "global_step": 108352, "epoch": 2579} {"train_loss": -6.330327033996582, "global_step": 108353, "epoch": 2579} {"train_loss": -6.518287181854248, "global_step": 108354, "epoch": 2579} {"train_loss": -6.574270248413086, "global_step": 108355, "epoch": 2579} {"train_loss": -6.513090133666992, "global_step": 108356, "epoch": 2579} {"train_loss": -6.3317461013793945, "global_step": 108357, "epoch": 2579} {"train_loss": -6.411191463470459, "global_step": 108358, "epoch": 2579} {"train_loss": -6.429225126902263, "global_step": 108359, "epoch": 2579, "val_loss": 67874.578125} {"train_loss": -6.352296352386475, "global_step": 108360, "epoch": 2580} {"train_loss": -6.352819442749023, "global_step": 108361, "epoch": 2580} {"train_loss": -6.591238975524902, "global_step": 108362, "epoch": 2580} {"train_loss": -6.441741466522217, "global_step": 108363, "epoch": 2580} {"train_loss": -6.508795261383057, "global_step": 108364, "epoch": 2580} {"train_loss": -6.5795512199401855, "global_step": 108365, "epoch": 2580} {"train_loss": -6.390774726867676, "global_step": 108366, "epoch": 2580} {"train_loss": -6.444988250732422, "global_step": 108367, "epoch": 2580} {"train_loss": -6.432182788848877, "global_step": 108368, "epoch": 2580} {"train_loss": -6.480832099914551, "global_step": 108369, "epoch": 2580} {"train_loss": -6.516435623168945, "global_step": 108370, "epoch": 2580} {"train_loss": -6.382932662963867, "global_step": 108371, "epoch": 2580} {"train_loss": -6.428043842315674, "global_step": 108372, "epoch": 2580} {"train_loss": -6.5115861892700195, "global_step": 108373, "epoch": 2580} {"train_loss": -6.470359802246094, "global_step": 108374, "epoch": 2580} {"train_loss": -6.405279159545898, "global_step": 108375, "epoch": 2580} {"train_loss": -6.531501293182373, "global_step": 108376, "epoch": 2580} {"train_loss": -6.397768974304199, "global_step": 108377, "epoch": 2580} {"train_loss": -6.460925102233887, "global_step": 108378, "epoch": 2580} {"train_loss": -6.452800273895264, "global_step": 108379, "epoch": 2580} {"train_loss": -6.481015205383301, "global_step": 108380, "epoch": 2580} {"train_loss": -6.350872993469238, "global_step": 108381, "epoch": 2580} {"train_loss": -6.51028299331665, "global_step": 108382, "epoch": 2580} {"train_loss": -6.542420387268066, "global_step": 108383, "epoch": 2580} {"train_loss": -6.442661285400391, "global_step": 108384, "epoch": 2580} {"train_loss": -6.477110862731934, "global_step": 108385, "epoch": 2580} {"train_loss": -6.43411922454834, "global_step": 108386, "epoch": 2580} {"train_loss": -6.336782455444336, "global_step": 108387, "epoch": 2580} {"train_loss": -6.234649658203125, "global_step": 108388, "epoch": 2580} {"train_loss": -6.238877296447754, "global_step": 108389, "epoch": 2580} {"train_loss": -6.3091020584106445, "global_step": 108390, "epoch": 2580} {"train_loss": -6.373675346374512, "global_step": 108391, "epoch": 2580} {"train_loss": -6.4095072746276855, "global_step": 108392, "epoch": 2580} {"train_loss": -6.267637252807617, "global_step": 108393, "epoch": 2580} {"train_loss": -6.31424617767334, "global_step": 108394, "epoch": 2580} {"train_loss": -6.267159461975098, "global_step": 108395, "epoch": 2580} {"train_loss": -6.277223587036133, "global_step": 108396, "epoch": 2580} {"train_loss": -6.267393112182617, "global_step": 108397, "epoch": 2580} {"train_loss": -6.502959251403809, "global_step": 108398, "epoch": 2580} {"train_loss": -6.403444766998291, "global_step": 108399, "epoch": 2580} {"train_loss": -6.3134613037109375, "global_step": 108400, "epoch": 2580} {"train_loss": -6.409855570111956, "global_step": 108401, "epoch": 2580, "val_loss": 68112.4921875} {"train_loss": -6.518832206726074, "global_step": 108402, "epoch": 2581} {"train_loss": -6.331521987915039, "global_step": 108403, "epoch": 2581} {"train_loss": -6.268568992614746, "global_step": 108404, "epoch": 2581} {"train_loss": -6.384306907653809, "global_step": 108405, "epoch": 2581} {"train_loss": -6.354185581207275, "global_step": 108406, "epoch": 2581} {"train_loss": -6.350246429443359, "global_step": 108407, "epoch": 2581} {"train_loss": -6.389133930206299, "global_step": 108408, "epoch": 2581} {"train_loss": -6.4198150634765625, "global_step": 108409, "epoch": 2581} {"train_loss": -6.339751243591309, "global_step": 108410, "epoch": 2581} {"train_loss": -6.4126081466674805, "global_step": 108411, "epoch": 2581} {"train_loss": -6.329898834228516, "global_step": 108412, "epoch": 2581} {"train_loss": -6.382930755615234, "global_step": 108413, "epoch": 2581} {"train_loss": -6.4144463539123535, "global_step": 108414, "epoch": 2581} {"train_loss": -6.331089973449707, "global_step": 108415, "epoch": 2581} {"train_loss": -6.393312931060791, "global_step": 108416, "epoch": 2581} {"train_loss": -6.383605480194092, "global_step": 108417, "epoch": 2581} {"train_loss": -6.282445907592773, "global_step": 108418, "epoch": 2581} {"train_loss": -6.527775764465332, "global_step": 108419, "epoch": 2581} {"train_loss": -6.226619720458984, "global_step": 108420, "epoch": 2581} {"train_loss": -6.382603168487549, "global_step": 108421, "epoch": 2581} {"train_loss": -6.428525924682617, "global_step": 108422, "epoch": 2581} {"train_loss": -6.412489891052246, "global_step": 108423, "epoch": 2581} {"train_loss": -6.414809226989746, "global_step": 108424, "epoch": 2581} {"train_loss": -6.427918434143066, "global_step": 108425, "epoch": 2581} {"train_loss": -6.431995391845703, "global_step": 108426, "epoch": 2581} {"train_loss": -6.3699727058410645, "global_step": 108427, "epoch": 2581} {"train_loss": -6.444530963897705, "global_step": 108428, "epoch": 2581} {"train_loss": -6.474358558654785, "global_step": 108429, "epoch": 2581} {"train_loss": -6.481359481811523, "global_step": 108430, "epoch": 2581} {"train_loss": -6.382871150970459, "global_step": 108431, "epoch": 2581} {"train_loss": -6.429844379425049, "global_step": 108432, "epoch": 2581} {"train_loss": -6.441618919372559, "global_step": 108433, "epoch": 2581} {"train_loss": -6.462795734405518, "global_step": 108434, "epoch": 2581} {"train_loss": -6.478414058685303, "global_step": 108435, "epoch": 2581} {"train_loss": -6.4088640213012695, "global_step": 108436, "epoch": 2581} {"train_loss": -6.5741729736328125, "global_step": 108437, "epoch": 2581} {"train_loss": -6.485964775085449, "global_step": 108438, "epoch": 2581} {"train_loss": -6.391087055206299, "global_step": 108439, "epoch": 2581} {"train_loss": -6.575876235961914, "global_step": 108440, "epoch": 2581} {"train_loss": -6.40355920791626, "global_step": 108441, "epoch": 2581} {"train_loss": -6.311887264251709, "global_step": 108442, "epoch": 2581} {"train_loss": -6.407602060408819, "global_step": 108443, "epoch": 2581, "val_loss": 67589.5859375} {"train_loss": -6.49569034576416, "global_step": 108444, "epoch": 2582} {"train_loss": -6.457487106323242, "global_step": 108445, "epoch": 2582} {"train_loss": -6.592513084411621, "global_step": 108446, "epoch": 2582} {"train_loss": -6.428915023803711, "global_step": 108447, "epoch": 2582} {"train_loss": -6.538849353790283, "global_step": 108448, "epoch": 2582} {"train_loss": -6.478703022003174, "global_step": 108449, "epoch": 2582} {"train_loss": -6.373320579528809, "global_step": 108450, "epoch": 2582} {"train_loss": -6.571493148803711, "global_step": 108451, "epoch": 2582} {"train_loss": -6.5643205642700195, "global_step": 108452, "epoch": 2582} {"train_loss": -6.367334842681885, "global_step": 108453, "epoch": 2582} {"train_loss": -6.361150741577148, "global_step": 108454, "epoch": 2582} {"train_loss": -6.431137561798096, "global_step": 108455, "epoch": 2582} {"train_loss": -6.40623664855957, "global_step": 108456, "epoch": 2582} {"train_loss": -6.333915710449219, "global_step": 108457, "epoch": 2582} {"train_loss": -6.350739479064941, "global_step": 108458, "epoch": 2582} {"train_loss": -6.182283401489258, "global_step": 108459, "epoch": 2582} {"train_loss": -6.453960418701172, "global_step": 108460, "epoch": 2582} {"train_loss": -6.391715049743652, "global_step": 108461, "epoch": 2582} {"train_loss": -6.271181583404541, "global_step": 108462, "epoch": 2582} {"train_loss": -6.35025691986084, "global_step": 108463, "epoch": 2582} {"train_loss": -6.504359245300293, "global_step": 108464, "epoch": 2582} {"train_loss": -6.437253952026367, "global_step": 108465, "epoch": 2582} {"train_loss": -6.379793167114258, "global_step": 108466, "epoch": 2582} {"train_loss": -6.440062046051025, "global_step": 108467, "epoch": 2582} {"train_loss": -6.374309062957764, "global_step": 108468, "epoch": 2582} {"train_loss": -6.426068305969238, "global_step": 108469, "epoch": 2582} {"train_loss": -6.411968231201172, "global_step": 108470, "epoch": 2582} {"train_loss": -6.455923557281494, "global_step": 108471, "epoch": 2582} {"train_loss": -6.423148155212402, "global_step": 108472, "epoch": 2582} {"train_loss": -6.479720115661621, "global_step": 108473, "epoch": 2582} {"train_loss": -6.364408016204834, "global_step": 108474, "epoch": 2582} {"train_loss": -6.38157320022583, "global_step": 108475, "epoch": 2582} {"train_loss": -6.410353183746338, "global_step": 108476, "epoch": 2582} {"train_loss": -6.454901695251465, "global_step": 108477, "epoch": 2582} {"train_loss": -6.450582504272461, "global_step": 108478, "epoch": 2582} {"train_loss": -6.365233421325684, "global_step": 108479, "epoch": 2582} {"train_loss": -6.420688629150391, "global_step": 108480, "epoch": 2582} {"train_loss": -6.538978576660156, "global_step": 108481, "epoch": 2582} {"train_loss": -6.415099620819092, "global_step": 108482, "epoch": 2582} {"train_loss": -6.423670768737793, "global_step": 108483, "epoch": 2582} {"train_loss": -6.350461959838867, "global_step": 108484, "epoch": 2582} {"train_loss": -6.421969277518136, "global_step": 108485, "epoch": 2582, "val_loss": 67891.6953125} {"train_loss": -6.411728858947754, "global_step": 108486, "epoch": 2583} {"train_loss": -6.503456115722656, "global_step": 108487, "epoch": 2583} {"train_loss": -6.428988933563232, "global_step": 108488, "epoch": 2583} {"train_loss": -6.361265659332275, "global_step": 108489, "epoch": 2583} {"train_loss": -6.401060581207275, "global_step": 108490, "epoch": 2583} {"train_loss": -6.546327590942383, "global_step": 108491, "epoch": 2583} {"train_loss": -6.446741580963135, "global_step": 108492, "epoch": 2583} {"train_loss": -6.481800079345703, "global_step": 108493, "epoch": 2583} {"train_loss": -6.569406509399414, "global_step": 108494, "epoch": 2583} {"train_loss": -6.475275993347168, "global_step": 108495, "epoch": 2583} {"train_loss": -6.407223701477051, "global_step": 108496, "epoch": 2583} {"train_loss": -6.337015628814697, "global_step": 108497, "epoch": 2583} {"train_loss": -6.494592666625977, "global_step": 108498, "epoch": 2583} {"train_loss": -6.440823554992676, "global_step": 108499, "epoch": 2583} {"train_loss": -6.440108776092529, "global_step": 108500, "epoch": 2583} {"train_loss": -6.427488327026367, "global_step": 108501, "epoch": 2583} {"train_loss": -6.453794479370117, "global_step": 108502, "epoch": 2583} {"train_loss": -6.320622444152832, "global_step": 108503, "epoch": 2583} {"train_loss": -6.541677474975586, "global_step": 108504, "epoch": 2583} {"train_loss": -6.409748077392578, "global_step": 108505, "epoch": 2583} {"train_loss": -6.489173889160156, "global_step": 108506, "epoch": 2583} {"train_loss": -6.500553131103516, "global_step": 108507, "epoch": 2583} {"train_loss": -6.392848968505859, "global_step": 108508, "epoch": 2583} {"train_loss": -6.551002502441406, "global_step": 108509, "epoch": 2583} {"train_loss": -6.425164699554443, "global_step": 108510, "epoch": 2583} {"train_loss": -6.473424434661865, "global_step": 108511, "epoch": 2583} {"train_loss": -6.489092826843262, "global_step": 108512, "epoch": 2583} {"train_loss": -6.3995490074157715, "global_step": 108513, "epoch": 2583} {"train_loss": -6.309262275695801, "global_step": 108514, "epoch": 2583} {"train_loss": -6.483656883239746, "global_step": 108515, "epoch": 2583} {"train_loss": -6.4157023429870605, "global_step": 108516, "epoch": 2583} {"train_loss": -6.398386001586914, "global_step": 108517, "epoch": 2583} {"train_loss": -6.527511119842529, "global_step": 108518, "epoch": 2583} {"train_loss": -6.268646717071533, "global_step": 108519, "epoch": 2583} {"train_loss": -6.3118767738342285, "global_step": 108520, "epoch": 2583} {"train_loss": -6.387416839599609, "global_step": 108521, "epoch": 2583} {"train_loss": -6.367885589599609, "global_step": 108522, "epoch": 2583} {"train_loss": -6.459908485412598, "global_step": 108523, "epoch": 2583} {"train_loss": -6.466873645782471, "global_step": 108524, "epoch": 2583} {"train_loss": -6.2649030685424805, "global_step": 108525, "epoch": 2583} {"train_loss": -6.4656081199646, "global_step": 108526, "epoch": 2583} {"train_loss": -6.42901907648359, "global_step": 108527, "epoch": 2583, "val_loss": 68151.671875} {"train_loss": -6.430230140686035, "global_step": 108528, "epoch": 2584} {"train_loss": -6.37062406539917, "global_step": 108529, "epoch": 2584} {"train_loss": -6.234398365020752, "global_step": 108530, "epoch": 2584} {"train_loss": -6.418770790100098, "global_step": 108531, "epoch": 2584} {"train_loss": -6.292872905731201, "global_step": 108532, "epoch": 2584} {"train_loss": -6.592824459075928, "global_step": 108533, "epoch": 2584} {"train_loss": -6.296656608581543, "global_step": 108534, "epoch": 2584} {"train_loss": -6.46349573135376, "global_step": 108535, "epoch": 2584} {"train_loss": -6.173821449279785, "global_step": 108536, "epoch": 2584} {"train_loss": -6.405065536499023, "global_step": 108537, "epoch": 2584} {"train_loss": -6.185011863708496, "global_step": 108538, "epoch": 2584} {"train_loss": -6.399532794952393, "global_step": 108539, "epoch": 2584} {"train_loss": -6.341769218444824, "global_step": 108540, "epoch": 2584} {"train_loss": -6.309986114501953, "global_step": 108541, "epoch": 2584} {"train_loss": -6.33264684677124, "global_step": 108542, "epoch": 2584} {"train_loss": -6.387416362762451, "global_step": 108543, "epoch": 2584} {"train_loss": -6.469302177429199, "global_step": 108544, "epoch": 2584} {"train_loss": -6.18453311920166, "global_step": 108545, "epoch": 2584} {"train_loss": -6.277904987335205, "global_step": 108546, "epoch": 2584} {"train_loss": -6.173941612243652, "global_step": 108547, "epoch": 2584} {"train_loss": -6.3778581619262695, "global_step": 108548, "epoch": 2584} {"train_loss": -6.229667663574219, "global_step": 108549, "epoch": 2584} {"train_loss": -6.432674884796143, "global_step": 108550, "epoch": 2584} {"train_loss": -6.266120433807373, "global_step": 108551, "epoch": 2584} {"train_loss": -6.45167350769043, "global_step": 108552, "epoch": 2584} {"train_loss": -6.245209693908691, "global_step": 108553, "epoch": 2584} {"train_loss": -6.440588474273682, "global_step": 108554, "epoch": 2584} {"train_loss": -6.275419235229492, "global_step": 108555, "epoch": 2584} {"train_loss": -6.353323936462402, "global_step": 108556, "epoch": 2584} {"train_loss": -6.348172187805176, "global_step": 108557, "epoch": 2584} {"train_loss": -6.345298767089844, "global_step": 108558, "epoch": 2584} {"train_loss": -6.4598307609558105, "global_step": 108559, "epoch": 2584} {"train_loss": -6.520076751708984, "global_step": 108560, "epoch": 2584} {"train_loss": -6.374119281768799, "global_step": 108561, "epoch": 2584} {"train_loss": -6.379574775695801, "global_step": 108562, "epoch": 2584} {"train_loss": -6.38887882232666, "global_step": 108563, "epoch": 2584} {"train_loss": -6.435522556304932, "global_step": 108564, "epoch": 2584} {"train_loss": -6.402888298034668, "global_step": 108565, "epoch": 2584} {"train_loss": -6.350748062133789, "global_step": 108566, "epoch": 2584} {"train_loss": -6.420854091644287, "global_step": 108567, "epoch": 2584} {"train_loss": -6.444597244262695, "global_step": 108568, "epoch": 2584} {"train_loss": -6.360183693113781, "global_step": 108569, "epoch": 2584, "val_loss": 67828.46875} {"train_loss": -6.369507789611816, "global_step": 108570, "epoch": 2585} {"train_loss": -6.337798118591309, "global_step": 108571, "epoch": 2585} {"train_loss": -6.336400985717773, "global_step": 108572, "epoch": 2585} {"train_loss": -6.443066596984863, "global_step": 108573, "epoch": 2585} {"train_loss": -6.445769786834717, "global_step": 108574, "epoch": 2585} {"train_loss": -6.372053146362305, "global_step": 108575, "epoch": 2585} {"train_loss": -6.4042205810546875, "global_step": 108576, "epoch": 2585} {"train_loss": -6.332833290100098, "global_step": 108577, "epoch": 2585} {"train_loss": -6.377840995788574, "global_step": 108578, "epoch": 2585} {"train_loss": -6.558283805847168, "global_step": 108579, "epoch": 2585} {"train_loss": -6.349436283111572, "global_step": 108580, "epoch": 2585} {"train_loss": -6.472199440002441, "global_step": 108581, "epoch": 2585} {"train_loss": -6.356790542602539, "global_step": 108582, "epoch": 2585} {"train_loss": -6.449166297912598, "global_step": 108583, "epoch": 2585} {"train_loss": -6.387300968170166, "global_step": 108584, "epoch": 2585} {"train_loss": -6.377071380615234, "global_step": 108585, "epoch": 2585} {"train_loss": -6.492888450622559, "global_step": 108586, "epoch": 2585} {"train_loss": -6.47006893157959, "global_step": 108587, "epoch": 2585} {"train_loss": -6.448371410369873, "global_step": 108588, "epoch": 2585} {"train_loss": -6.551914215087891, "global_step": 108589, "epoch": 2585} {"train_loss": -6.355881690979004, "global_step": 108590, "epoch": 2585} {"train_loss": -6.375330448150635, "global_step": 108591, "epoch": 2585} {"train_loss": -6.518031597137451, "global_step": 108592, "epoch": 2585} {"train_loss": -6.485814571380615, "global_step": 108593, "epoch": 2585} {"train_loss": -6.458343505859375, "global_step": 108594, "epoch": 2585} {"train_loss": -6.4152374267578125, "global_step": 108595, "epoch": 2585} {"train_loss": -6.583686828613281, "global_step": 108596, "epoch": 2585} {"train_loss": -6.275045871734619, "global_step": 108597, "epoch": 2585} {"train_loss": -6.423953533172607, "global_step": 108598, "epoch": 2585} {"train_loss": -6.495388507843018, "global_step": 108599, "epoch": 2585} {"train_loss": -6.3819260597229, "global_step": 108600, "epoch": 2585} {"train_loss": -6.467779636383057, "global_step": 108601, "epoch": 2585} {"train_loss": -6.494226455688477, "global_step": 108602, "epoch": 2585} {"train_loss": -6.520421981811523, "global_step": 108603, "epoch": 2585} {"train_loss": -6.451520919799805, "global_step": 108604, "epoch": 2585} {"train_loss": -6.361500263214111, "global_step": 108605, "epoch": 2585} {"train_loss": -6.386114597320557, "global_step": 108606, "epoch": 2585} {"train_loss": -6.371614933013916, "global_step": 108607, "epoch": 2585} {"train_loss": -6.459684371948242, "global_step": 108608, "epoch": 2585} {"train_loss": -6.477643966674805, "global_step": 108609, "epoch": 2585} {"train_loss": -6.3266801834106445, "global_step": 108610, "epoch": 2585} {"train_loss": -6.425468433470953, "global_step": 108611, "epoch": 2585, "val_loss": 67748.6171875} {"train_loss": -6.517542839050293, "global_step": 108612, "epoch": 2586} {"train_loss": -6.436616897583008, "global_step": 108613, "epoch": 2586} {"train_loss": -6.513813018798828, "global_step": 108614, "epoch": 2586} {"train_loss": -6.514955043792725, "global_step": 108615, "epoch": 2586} {"train_loss": -6.397078990936279, "global_step": 108616, "epoch": 2586} {"train_loss": -6.351423740386963, "global_step": 108617, "epoch": 2586} {"train_loss": -6.598568916320801, "global_step": 108618, "epoch": 2586} {"train_loss": -6.492842674255371, "global_step": 108619, "epoch": 2586} {"train_loss": -6.447631359100342, "global_step": 108620, "epoch": 2586} {"train_loss": -6.460923671722412, "global_step": 108621, "epoch": 2586} {"train_loss": -6.377307891845703, "global_step": 108622, "epoch": 2586} {"train_loss": -6.503759384155273, "global_step": 108623, "epoch": 2586} {"train_loss": -6.318473815917969, "global_step": 108624, "epoch": 2586} {"train_loss": -6.389310359954834, "global_step": 108625, "epoch": 2586} {"train_loss": -6.542516231536865, "global_step": 108626, "epoch": 2586} {"train_loss": -6.361008644104004, "global_step": 108627, "epoch": 2586} {"train_loss": -6.507610321044922, "global_step": 108628, "epoch": 2586} {"train_loss": -6.49442195892334, "global_step": 108629, "epoch": 2586} {"train_loss": -6.4417924880981445, "global_step": 108630, "epoch": 2586} {"train_loss": -6.276912689208984, "global_step": 108631, "epoch": 2586} {"train_loss": -6.427379608154297, "global_step": 108632, "epoch": 2586} {"train_loss": -6.401998996734619, "global_step": 108633, "epoch": 2586} {"train_loss": -6.45327615737915, "global_step": 108634, "epoch": 2586} {"train_loss": -6.336016654968262, "global_step": 108635, "epoch": 2586} {"train_loss": -6.323154449462891, "global_step": 108636, "epoch": 2586} {"train_loss": -6.362411975860596, "global_step": 108637, "epoch": 2586} {"train_loss": -6.3674635887146, "global_step": 108638, "epoch": 2586} {"train_loss": -6.438304901123047, "global_step": 108639, "epoch": 2586} {"train_loss": -6.3989577293396, "global_step": 108640, "epoch": 2586} {"train_loss": -6.41629695892334, "global_step": 108641, "epoch": 2586} {"train_loss": -6.466566562652588, "global_step": 108642, "epoch": 2586} {"train_loss": -6.361005783081055, "global_step": 108643, "epoch": 2586} {"train_loss": -6.499411582946777, "global_step": 108644, "epoch": 2586} {"train_loss": -6.4373602867126465, "global_step": 108645, "epoch": 2586} {"train_loss": -6.445694446563721, "global_step": 108646, "epoch": 2586} {"train_loss": -6.513649940490723, "global_step": 108647, "epoch": 2586} {"train_loss": -6.447719573974609, "global_step": 108648, "epoch": 2586} {"train_loss": -6.46109676361084, "global_step": 108649, "epoch": 2586} {"train_loss": -6.37819766998291, "global_step": 108650, "epoch": 2586} {"train_loss": -6.399338722229004, "global_step": 108651, "epoch": 2586} {"train_loss": -6.455688953399658, "global_step": 108652, "epoch": 2586} {"train_loss": -6.4357836700621105, "global_step": 108653, "epoch": 2586, "val_loss": 67846.53125} {"train_loss": -6.422487258911133, "global_step": 108654, "epoch": 2587} {"train_loss": -6.385709762573242, "global_step": 108655, "epoch": 2587} {"train_loss": -6.573224067687988, "global_step": 108656, "epoch": 2587} {"train_loss": -6.586236476898193, "global_step": 108657, "epoch": 2587} {"train_loss": -6.448683738708496, "global_step": 108658, "epoch": 2587} {"train_loss": -6.420495986938477, "global_step": 108659, "epoch": 2587} {"train_loss": -6.41732120513916, "global_step": 108660, "epoch": 2587} {"train_loss": -6.544534206390381, "global_step": 108661, "epoch": 2587} {"train_loss": -6.522559642791748, "global_step": 108662, "epoch": 2587} {"train_loss": -6.443870544433594, "global_step": 108663, "epoch": 2587} {"train_loss": -6.3751606941223145, "global_step": 108664, "epoch": 2587} {"train_loss": -6.289506912231445, "global_step": 108665, "epoch": 2587} {"train_loss": -6.42243766784668, "global_step": 108666, "epoch": 2587} {"train_loss": -6.501613616943359, "global_step": 108667, "epoch": 2587} {"train_loss": -6.342843532562256, "global_step": 108668, "epoch": 2587} {"train_loss": -6.4528608322143555, "global_step": 108669, "epoch": 2587} {"train_loss": -6.421051502227783, "global_step": 108670, "epoch": 2587} {"train_loss": -6.375794410705566, "global_step": 108671, "epoch": 2587} {"train_loss": -6.320554256439209, "global_step": 108672, "epoch": 2587} {"train_loss": -6.405577659606934, "global_step": 108673, "epoch": 2587} {"train_loss": -6.403103828430176, "global_step": 108674, "epoch": 2587} {"train_loss": -6.423141956329346, "global_step": 108675, "epoch": 2587} {"train_loss": -6.312436103820801, "global_step": 108676, "epoch": 2587} {"train_loss": -6.411970138549805, "global_step": 108677, "epoch": 2587} {"train_loss": -6.324332237243652, "global_step": 108678, "epoch": 2587} {"train_loss": -6.440108299255371, "global_step": 108679, "epoch": 2587} {"train_loss": -6.463600158691406, "global_step": 108680, "epoch": 2587} {"train_loss": -6.432192325592041, "global_step": 108681, "epoch": 2587} {"train_loss": -6.45128059387207, "global_step": 108682, "epoch": 2587} {"train_loss": -6.265680313110352, "global_step": 108683, "epoch": 2587} {"train_loss": -6.375658988952637, "global_step": 108684, "epoch": 2587} {"train_loss": -6.345920562744141, "global_step": 108685, "epoch": 2587} {"train_loss": -6.555818557739258, "global_step": 108686, "epoch": 2587} {"train_loss": -6.3040452003479, "global_step": 108687, "epoch": 2587} {"train_loss": -6.4166412353515625, "global_step": 108688, "epoch": 2587} {"train_loss": -6.437307357788086, "global_step": 108689, "epoch": 2587} {"train_loss": -6.349809646606445, "global_step": 108690, "epoch": 2587} {"train_loss": -6.470321178436279, "global_step": 108691, "epoch": 2587} {"train_loss": -6.399093151092529, "global_step": 108692, "epoch": 2587} {"train_loss": -6.4041852951049805, "global_step": 108693, "epoch": 2587} {"train_loss": -6.454400539398193, "global_step": 108694, "epoch": 2587} {"train_loss": -6.417799824760074, "global_step": 108695, "epoch": 2587, "val_loss": 67833.078125} {"train_loss": -6.484906196594238, "global_step": 108696, "epoch": 2588} {"train_loss": -6.418153762817383, "global_step": 108697, "epoch": 2588} {"train_loss": -6.53452205657959, "global_step": 108698, "epoch": 2588} {"train_loss": -6.3596014976501465, "global_step": 108699, "epoch": 2588} {"train_loss": -6.448678493499756, "global_step": 108700, "epoch": 2588} {"train_loss": -6.521512031555176, "global_step": 108701, "epoch": 2588} {"train_loss": -6.466611862182617, "global_step": 108702, "epoch": 2588} {"train_loss": -6.49119758605957, "global_step": 108703, "epoch": 2588} {"train_loss": -6.351223945617676, "global_step": 108704, "epoch": 2588} {"train_loss": -6.432638168334961, "global_step": 108705, "epoch": 2588} {"train_loss": -6.355549335479736, "global_step": 108706, "epoch": 2588} {"train_loss": -6.5369415283203125, "global_step": 108707, "epoch": 2588} {"train_loss": -6.502955436706543, "global_step": 108708, "epoch": 2588} {"train_loss": -6.596780776977539, "global_step": 108709, "epoch": 2588} {"train_loss": -6.471255302429199, "global_step": 108710, "epoch": 2588} {"train_loss": -6.52481746673584, "global_step": 108711, "epoch": 2588} {"train_loss": -6.425448417663574, "global_step": 108712, "epoch": 2588} {"train_loss": -6.499397277832031, "global_step": 108713, "epoch": 2588} {"train_loss": -6.460610866546631, "global_step": 108714, "epoch": 2588} {"train_loss": -6.470387935638428, "global_step": 108715, "epoch": 2588} {"train_loss": -6.408965110778809, "global_step": 108716, "epoch": 2588} {"train_loss": -6.361833572387695, "global_step": 108717, "epoch": 2588} {"train_loss": -6.539909362792969, "global_step": 108718, "epoch": 2588} {"train_loss": -6.382411479949951, "global_step": 108719, "epoch": 2588} {"train_loss": -6.432817459106445, "global_step": 108720, "epoch": 2588} {"train_loss": -6.350357532501221, "global_step": 108721, "epoch": 2588} {"train_loss": -6.374319076538086, "global_step": 108722, "epoch": 2588} {"train_loss": -6.441354274749756, "global_step": 108723, "epoch": 2588} {"train_loss": -6.321811199188232, "global_step": 108724, "epoch": 2588} {"train_loss": -6.404888153076172, "global_step": 108725, "epoch": 2588} {"train_loss": -6.403299331665039, "global_step": 108726, "epoch": 2588} {"train_loss": -6.38592529296875, "global_step": 108727, "epoch": 2588} {"train_loss": -6.3855695724487305, "global_step": 108728, "epoch": 2588} {"train_loss": -6.405465602874756, "global_step": 108729, "epoch": 2588} {"train_loss": -6.454030990600586, "global_step": 108730, "epoch": 2588} {"train_loss": -6.4613142013549805, "global_step": 108731, "epoch": 2588} {"train_loss": -6.405716896057129, "global_step": 108732, "epoch": 2588} {"train_loss": -6.323563098907471, "global_step": 108733, "epoch": 2588} {"train_loss": -6.444048881530762, "global_step": 108734, "epoch": 2588} {"train_loss": -6.4597368240356445, "global_step": 108735, "epoch": 2588} {"train_loss": -6.342142105102539, "global_step": 108736, "epoch": 2588} {"train_loss": -6.433704353514171, "global_step": 108737, "epoch": 2588, "val_loss": 67897.59375} {"train_loss": -6.315864086151123, "global_step": 108738, "epoch": 2589} {"train_loss": -6.402688026428223, "global_step": 108739, "epoch": 2589} {"train_loss": -6.376552581787109, "global_step": 108740, "epoch": 2589} {"train_loss": -6.414261817932129, "global_step": 108741, "epoch": 2589} {"train_loss": -6.475135803222656, "global_step": 108742, "epoch": 2589} {"train_loss": -6.460533142089844, "global_step": 108743, "epoch": 2589} {"train_loss": -6.2714338302612305, "global_step": 108744, "epoch": 2589} {"train_loss": -6.33272647857666, "global_step": 108745, "epoch": 2589} {"train_loss": -6.47201681137085, "global_step": 108746, "epoch": 2589} {"train_loss": -6.39984130859375, "global_step": 108747, "epoch": 2589} {"train_loss": -6.365716934204102, "global_step": 108748, "epoch": 2589} {"train_loss": -6.3115234375, "global_step": 108749, "epoch": 2589} {"train_loss": -6.404454231262207, "global_step": 108750, "epoch": 2589} {"train_loss": -6.447800636291504, "global_step": 108751, "epoch": 2589} {"train_loss": -6.362381935119629, "global_step": 108752, "epoch": 2589} {"train_loss": -6.3555755615234375, "global_step": 108753, "epoch": 2589} {"train_loss": -6.41202449798584, "global_step": 108754, "epoch": 2589} {"train_loss": -6.423730373382568, "global_step": 108755, "epoch": 2589} {"train_loss": -6.344138145446777, "global_step": 108756, "epoch": 2589} {"train_loss": -6.389394760131836, "global_step": 108757, "epoch": 2589} {"train_loss": -6.3259382247924805, "global_step": 108758, "epoch": 2589} {"train_loss": -6.360861301422119, "global_step": 108759, "epoch": 2589} {"train_loss": -6.267645835876465, "global_step": 108760, "epoch": 2589} {"train_loss": -6.3967084884643555, "global_step": 108761, "epoch": 2589} {"train_loss": -6.441518306732178, "global_step": 108762, "epoch": 2589} {"train_loss": -6.308777332305908, "global_step": 108763, "epoch": 2589} {"train_loss": -6.373455047607422, "global_step": 108764, "epoch": 2589} {"train_loss": -6.360888957977295, "global_step": 108765, "epoch": 2589} {"train_loss": -6.483266830444336, "global_step": 108766, "epoch": 2589} {"train_loss": -6.28150749206543, "global_step": 108767, "epoch": 2589} {"train_loss": -6.342719554901123, "global_step": 108768, "epoch": 2589} {"train_loss": -6.378289699554443, "global_step": 108769, "epoch": 2589} {"train_loss": -6.370533466339111, "global_step": 108770, "epoch": 2589} {"train_loss": -6.3028764724731445, "global_step": 108771, "epoch": 2589} {"train_loss": -6.420280456542969, "global_step": 108772, "epoch": 2589} {"train_loss": -6.405608177185059, "global_step": 108773, "epoch": 2589} {"train_loss": -6.446597099304199, "global_step": 108774, "epoch": 2589} {"train_loss": -6.423369884490967, "global_step": 108775, "epoch": 2589} {"train_loss": -6.396219253540039, "global_step": 108776, "epoch": 2589} {"train_loss": -6.367220401763916, "global_step": 108777, "epoch": 2589} {"train_loss": -6.419772624969482, "global_step": 108778, "epoch": 2589} {"train_loss": -6.382723672049386, "global_step": 108779, "epoch": 2589, "val_loss": 67755.7265625} {"train_loss": -6.359317779541016, "global_step": 108780, "epoch": 2590} {"train_loss": -6.385500907897949, "global_step": 108781, "epoch": 2590} {"train_loss": -6.435639381408691, "global_step": 108782, "epoch": 2590} {"train_loss": -6.321767807006836, "global_step": 108783, "epoch": 2590} {"train_loss": -6.435578346252441, "global_step": 108784, "epoch": 2590} {"train_loss": -6.458108901977539, "global_step": 108785, "epoch": 2590} {"train_loss": -6.389695167541504, "global_step": 108786, "epoch": 2590} {"train_loss": -6.449410438537598, "global_step": 108787, "epoch": 2590} {"train_loss": -6.413806915283203, "global_step": 108788, "epoch": 2590} {"train_loss": -6.395030975341797, "global_step": 108789, "epoch": 2590} {"train_loss": -6.5063018798828125, "global_step": 108790, "epoch": 2590} {"train_loss": -6.405414581298828, "global_step": 108791, "epoch": 2590} {"train_loss": -6.339550971984863, "global_step": 108792, "epoch": 2590} {"train_loss": -6.495491981506348, "global_step": 108793, "epoch": 2590} {"train_loss": -6.442856788635254, "global_step": 108794, "epoch": 2590} {"train_loss": -6.360477447509766, "global_step": 108795, "epoch": 2590} {"train_loss": -6.475207805633545, "global_step": 108796, "epoch": 2590} {"train_loss": -6.443371295928955, "global_step": 108797, "epoch": 2590} {"train_loss": -6.492315292358398, "global_step": 108798, "epoch": 2590} {"train_loss": -6.421482086181641, "global_step": 108799, "epoch": 2590} {"train_loss": -6.4330549240112305, "global_step": 108800, "epoch": 2590} {"train_loss": -6.410708427429199, "global_step": 108801, "epoch": 2590} {"train_loss": -6.479644298553467, "global_step": 108802, "epoch": 2590} {"train_loss": -6.461474418640137, "global_step": 108803, "epoch": 2590} {"train_loss": -6.439488887786865, "global_step": 108804, "epoch": 2590} {"train_loss": -6.426504135131836, "global_step": 108805, "epoch": 2590} {"train_loss": -6.48484992980957, "global_step": 108806, "epoch": 2590} {"train_loss": -6.3509202003479, "global_step": 108807, "epoch": 2590} {"train_loss": -6.377233028411865, "global_step": 108808, "epoch": 2590} {"train_loss": -6.394903182983398, "global_step": 108809, "epoch": 2590} {"train_loss": -6.493566036224365, "global_step": 108810, "epoch": 2590} {"train_loss": -6.405240535736084, "global_step": 108811, "epoch": 2590} {"train_loss": -6.405947685241699, "global_step": 108812, "epoch": 2590} {"train_loss": -6.312142372131348, "global_step": 108813, "epoch": 2590} {"train_loss": -6.320987701416016, "global_step": 108814, "epoch": 2590} {"train_loss": -6.535660266876221, "global_step": 108815, "epoch": 2590} {"train_loss": -6.349888324737549, "global_step": 108816, "epoch": 2590} {"train_loss": -6.359504222869873, "global_step": 108817, "epoch": 2590} {"train_loss": -6.443387985229492, "global_step": 108818, "epoch": 2590} {"train_loss": -6.377756118774414, "global_step": 108819, "epoch": 2590} {"train_loss": -6.344793319702148, "global_step": 108820, "epoch": 2590} {"train_loss": -6.414110933031354, "global_step": 108821, "epoch": 2590, "val_loss": 68089.6640625} {"train_loss": -6.411048889160156, "global_step": 108822, "epoch": 2591} {"train_loss": -6.4209136962890625, "global_step": 108823, "epoch": 2591} {"train_loss": -6.450482368469238, "global_step": 108824, "epoch": 2591} {"train_loss": -6.463896751403809, "global_step": 108825, "epoch": 2591} {"train_loss": -6.44612455368042, "global_step": 108826, "epoch": 2591} {"train_loss": -6.508047103881836, "global_step": 108827, "epoch": 2591} {"train_loss": -6.356270790100098, "global_step": 108828, "epoch": 2591} {"train_loss": -6.363415718078613, "global_step": 108829, "epoch": 2591} {"train_loss": -6.356320381164551, "global_step": 108830, "epoch": 2591} {"train_loss": -6.301479339599609, "global_step": 108831, "epoch": 2591} {"train_loss": -6.325694561004639, "global_step": 108832, "epoch": 2591} {"train_loss": -6.4574809074401855, "global_step": 108833, "epoch": 2591} {"train_loss": -6.501056671142578, "global_step": 108834, "epoch": 2591} {"train_loss": -6.415231227874756, "global_step": 108835, "epoch": 2591} {"train_loss": -6.309066295623779, "global_step": 108836, "epoch": 2591} {"train_loss": -6.238712310791016, "global_step": 108837, "epoch": 2591} {"train_loss": -6.35636043548584, "global_step": 108838, "epoch": 2591} {"train_loss": -6.28535795211792, "global_step": 108839, "epoch": 2591} {"train_loss": -6.238708019256592, "global_step": 108840, "epoch": 2591} {"train_loss": -6.424714088439941, "global_step": 108841, "epoch": 2591} {"train_loss": -6.319248199462891, "global_step": 108842, "epoch": 2591} {"train_loss": -6.318633079528809, "global_step": 108843, "epoch": 2591} {"train_loss": -6.404582500457764, "global_step": 108844, "epoch": 2591} {"train_loss": -6.306411266326904, "global_step": 108845, "epoch": 2591} {"train_loss": -6.306268215179443, "global_step": 108846, "epoch": 2591} {"train_loss": -6.442187309265137, "global_step": 108847, "epoch": 2591} {"train_loss": -6.215816974639893, "global_step": 108848, "epoch": 2591} {"train_loss": -6.35576057434082, "global_step": 108849, "epoch": 2591} {"train_loss": -6.305809020996094, "global_step": 108850, "epoch": 2591} {"train_loss": -6.357921600341797, "global_step": 108851, "epoch": 2591} {"train_loss": -6.220372200012207, "global_step": 108852, "epoch": 2591} {"train_loss": -6.377927780151367, "global_step": 108853, "epoch": 2591} {"train_loss": -6.3068037033081055, "global_step": 108854, "epoch": 2591} {"train_loss": -6.446352481842041, "global_step": 108855, "epoch": 2591} {"train_loss": -6.374573707580566, "global_step": 108856, "epoch": 2591} {"train_loss": -6.371203422546387, "global_step": 108857, "epoch": 2591} {"train_loss": -6.404806137084961, "global_step": 108858, "epoch": 2591} {"train_loss": -6.2581467628479, "global_step": 108859, "epoch": 2591} {"train_loss": -6.298737049102783, "global_step": 108860, "epoch": 2591} {"train_loss": -6.406354904174805, "global_step": 108861, "epoch": 2591} {"train_loss": -6.467796802520752, "global_step": 108862, "epoch": 2591} {"train_loss": -6.366849070503598, "global_step": 108863, "epoch": 2591, "val_loss": 68031.6484375} {"train_loss": -6.485189437866211, "global_step": 108864, "epoch": 2592} {"train_loss": -6.445462226867676, "global_step": 108865, "epoch": 2592} {"train_loss": -6.480180740356445, "global_step": 108866, "epoch": 2592} {"train_loss": -6.385354042053223, "global_step": 108867, "epoch": 2592} {"train_loss": -6.342337131500244, "global_step": 108868, "epoch": 2592} {"train_loss": -6.421728610992432, "global_step": 108869, "epoch": 2592} {"train_loss": -6.367560386657715, "global_step": 108870, "epoch": 2592} {"train_loss": -6.492440223693848, "global_step": 108871, "epoch": 2592} {"train_loss": -6.475522994995117, "global_step": 108872, "epoch": 2592} {"train_loss": -6.31747579574585, "global_step": 108873, "epoch": 2592} {"train_loss": -6.401043891906738, "global_step": 108874, "epoch": 2592} {"train_loss": -6.428815841674805, "global_step": 108875, "epoch": 2592} {"train_loss": -6.356936454772949, "global_step": 108876, "epoch": 2592} {"train_loss": -6.321388244628906, "global_step": 108877, "epoch": 2592} {"train_loss": -6.3243608474731445, "global_step": 108878, "epoch": 2592} {"train_loss": -6.301700115203857, "global_step": 108879, "epoch": 2592} {"train_loss": -6.46159029006958, "global_step": 108880, "epoch": 2592} {"train_loss": -6.433556079864502, "global_step": 108881, "epoch": 2592} {"train_loss": -6.466870307922363, "global_step": 108882, "epoch": 2592} {"train_loss": -6.3715105056762695, "global_step": 108883, "epoch": 2592} {"train_loss": -6.391790390014648, "global_step": 108884, "epoch": 2592} {"train_loss": -6.299499034881592, "global_step": 108885, "epoch": 2592} {"train_loss": -6.396542549133301, "global_step": 108886, "epoch": 2592} {"train_loss": -6.391490936279297, "global_step": 108887, "epoch": 2592} {"train_loss": -6.339741230010986, "global_step": 108888, "epoch": 2592} {"train_loss": -6.401475429534912, "global_step": 108889, "epoch": 2592} {"train_loss": -6.436992168426514, "global_step": 108890, "epoch": 2592} {"train_loss": -6.516946792602539, "global_step": 108891, "epoch": 2592} {"train_loss": -6.4623003005981445, "global_step": 108892, "epoch": 2592} {"train_loss": -6.487252712249756, "global_step": 108893, "epoch": 2592} {"train_loss": -6.421041488647461, "global_step": 108894, "epoch": 2592} {"train_loss": -6.513291835784912, "global_step": 108895, "epoch": 2592} {"train_loss": -6.319480895996094, "global_step": 108896, "epoch": 2592} {"train_loss": -6.410723686218262, "global_step": 108897, "epoch": 2592} {"train_loss": -6.334403991699219, "global_step": 108898, "epoch": 2592} {"train_loss": -6.4011430740356445, "global_step": 108899, "epoch": 2592} {"train_loss": -6.403012752532959, "global_step": 108900, "epoch": 2592} {"train_loss": -6.515368938446045, "global_step": 108901, "epoch": 2592} {"train_loss": -6.462853908538818, "global_step": 108902, "epoch": 2592} {"train_loss": -6.362030982971191, "global_step": 108903, "epoch": 2592} {"train_loss": -6.491708755493164, "global_step": 108904, "epoch": 2592} {"train_loss": -6.411406414849417, "global_step": 108905, "epoch": 2592, "val_loss": 67849.109375} {"train_loss": -6.383811950683594, "global_step": 108906, "epoch": 2593} {"train_loss": -6.404160976409912, "global_step": 108907, "epoch": 2593} {"train_loss": -6.455442905426025, "global_step": 108908, "epoch": 2593} {"train_loss": -6.4747633934021, "global_step": 108909, "epoch": 2593} {"train_loss": -6.38908052444458, "global_step": 108910, "epoch": 2593} {"train_loss": -6.393815994262695, "global_step": 108911, "epoch": 2593} {"train_loss": -6.292326927185059, "global_step": 108912, "epoch": 2593} {"train_loss": -6.429408073425293, "global_step": 108913, "epoch": 2593} {"train_loss": -6.489128112792969, "global_step": 108914, "epoch": 2593} {"train_loss": -6.424318790435791, "global_step": 108915, "epoch": 2593} {"train_loss": -6.34727668762207, "global_step": 108916, "epoch": 2593} {"train_loss": -6.4199347496032715, "global_step": 108917, "epoch": 2593} {"train_loss": -6.47673225402832, "global_step": 108918, "epoch": 2593} {"train_loss": -6.444402694702148, "global_step": 108919, "epoch": 2593} {"train_loss": -6.420809268951416, "global_step": 108920, "epoch": 2593} {"train_loss": -6.530747413635254, "global_step": 108921, "epoch": 2593} {"train_loss": -6.479037284851074, "global_step": 108922, "epoch": 2593} {"train_loss": -6.419960975646973, "global_step": 108923, "epoch": 2593} {"train_loss": -6.551196575164795, "global_step": 108924, "epoch": 2593} {"train_loss": -6.406011581420898, "global_step": 108925, "epoch": 2593} {"train_loss": -6.614653587341309, "global_step": 108926, "epoch": 2593} {"train_loss": -6.496181488037109, "global_step": 108927, "epoch": 2593} {"train_loss": -6.503066062927246, "global_step": 108928, "epoch": 2593} {"train_loss": -6.528486251831055, "global_step": 108929, "epoch": 2593} {"train_loss": -6.522913932800293, "global_step": 108930, "epoch": 2593} {"train_loss": -6.538627624511719, "global_step": 108931, "epoch": 2593} {"train_loss": -6.453922271728516, "global_step": 108932, "epoch": 2593} {"train_loss": -6.486255168914795, "global_step": 108933, "epoch": 2593} {"train_loss": -6.466580390930176, "global_step": 108934, "epoch": 2593} {"train_loss": -6.48541259765625, "global_step": 108935, "epoch": 2593} {"train_loss": -6.5350751876831055, "global_step": 108936, "epoch": 2593} {"train_loss": -6.433098793029785, "global_step": 108937, "epoch": 2593} {"train_loss": -6.58770227432251, "global_step": 108938, "epoch": 2593} {"train_loss": -6.516017913818359, "global_step": 108939, "epoch": 2593} {"train_loss": -6.600063323974609, "global_step": 108940, "epoch": 2593} {"train_loss": -6.39121150970459, "global_step": 108941, "epoch": 2593} {"train_loss": -6.488798141479492, "global_step": 108942, "epoch": 2593} {"train_loss": -6.393714904785156, "global_step": 108943, "epoch": 2593} {"train_loss": -6.426509857177734, "global_step": 108944, "epoch": 2593} {"train_loss": -6.34596061706543, "global_step": 108945, "epoch": 2593} {"train_loss": -6.538084030151367, "global_step": 108946, "epoch": 2593} {"train_loss": -6.463551634833927, "global_step": 108947, "epoch": 2593, "val_loss": 68076.9375} {"train_loss": -6.225561141967773, "global_step": 108948, "epoch": 2594} {"train_loss": -6.473231315612793, "global_step": 108949, "epoch": 2594} {"train_loss": -6.45462703704834, "global_step": 108950, "epoch": 2594} {"train_loss": -6.319239616394043, "global_step": 108951, "epoch": 2594} {"train_loss": -6.446503162384033, "global_step": 108952, "epoch": 2594} {"train_loss": -6.488302707672119, "global_step": 108953, "epoch": 2594} {"train_loss": -6.481027603149414, "global_step": 108954, "epoch": 2594} {"train_loss": -6.4991455078125, "global_step": 108955, "epoch": 2594} {"train_loss": -6.440291404724121, "global_step": 108956, "epoch": 2594} {"train_loss": -6.43869686126709, "global_step": 108957, "epoch": 2594} {"train_loss": -6.417762756347656, "global_step": 108958, "epoch": 2594} {"train_loss": -6.374981880187988, "global_step": 108959, "epoch": 2594} {"train_loss": -6.443636417388916, "global_step": 108960, "epoch": 2594} {"train_loss": -6.473300457000732, "global_step": 108961, "epoch": 2594} {"train_loss": -6.334112167358398, "global_step": 108962, "epoch": 2594} {"train_loss": -6.4338788986206055, "global_step": 108963, "epoch": 2594} {"train_loss": -6.368322849273682, "global_step": 108964, "epoch": 2594} {"train_loss": -6.476534843444824, "global_step": 108965, "epoch": 2594} {"train_loss": -6.430570125579834, "global_step": 108966, "epoch": 2594} {"train_loss": -6.399187088012695, "global_step": 108967, "epoch": 2594} {"train_loss": -6.430654048919678, "global_step": 108968, "epoch": 2594} {"train_loss": -6.2996826171875, "global_step": 108969, "epoch": 2594} {"train_loss": -6.450831413269043, "global_step": 108970, "epoch": 2594} {"train_loss": -6.46592378616333, "global_step": 108971, "epoch": 2594} {"train_loss": -6.511564254760742, "global_step": 108972, "epoch": 2594} {"train_loss": -6.45705509185791, "global_step": 108973, "epoch": 2594} {"train_loss": -6.497988224029541, "global_step": 108974, "epoch": 2594} {"train_loss": -6.33001708984375, "global_step": 108975, "epoch": 2594} {"train_loss": -6.451642990112305, "global_step": 108976, "epoch": 2594} {"train_loss": -6.43757438659668, "global_step": 108977, "epoch": 2594} {"train_loss": -6.356751918792725, "global_step": 108978, "epoch": 2594} {"train_loss": -6.402932167053223, "global_step": 108979, "epoch": 2594} {"train_loss": -6.415559768676758, "global_step": 108980, "epoch": 2594} {"train_loss": -6.358156204223633, "global_step": 108981, "epoch": 2594} {"train_loss": -6.32546329498291, "global_step": 108982, "epoch": 2594} {"train_loss": -6.399649620056152, "global_step": 108983, "epoch": 2594} {"train_loss": -6.433618545532227, "global_step": 108984, "epoch": 2594} {"train_loss": -6.316460609436035, "global_step": 108985, "epoch": 2594} {"train_loss": -6.365156173706055, "global_step": 108986, "epoch": 2594} {"train_loss": -6.482521057128906, "global_step": 108987, "epoch": 2594} {"train_loss": -6.313263416290283, "global_step": 108988, "epoch": 2594} {"train_loss": -6.412493319738479, "global_step": 108989, "epoch": 2594, "val_loss": 67897.5859375} {"train_loss": -6.3895721435546875, "global_step": 108990, "epoch": 2595} {"train_loss": -6.336831092834473, "global_step": 108991, "epoch": 2595} {"train_loss": -6.380661964416504, "global_step": 108992, "epoch": 2595} {"train_loss": -6.469895362854004, "global_step": 108993, "epoch": 2595} {"train_loss": -6.340181827545166, "global_step": 108994, "epoch": 2595} {"train_loss": -6.37050724029541, "global_step": 108995, "epoch": 2595} {"train_loss": -6.557522296905518, "global_step": 108996, "epoch": 2595} {"train_loss": -6.394927978515625, "global_step": 108997, "epoch": 2595} {"train_loss": -6.4813995361328125, "global_step": 108998, "epoch": 2595} {"train_loss": -6.438979148864746, "global_step": 108999, "epoch": 2595} {"train_loss": -6.47471284866333, "global_step": 109000, "epoch": 2595} {"train_loss": -6.40372896194458, "global_step": 109001, "epoch": 2595} {"train_loss": -6.438983917236328, "global_step": 109002, "epoch": 2595} {"train_loss": -6.432394027709961, "global_step": 109003, "epoch": 2595} {"train_loss": -6.4660210609436035, "global_step": 109004, "epoch": 2595} {"train_loss": -6.528444766998291, "global_step": 109005, "epoch": 2595} {"train_loss": -6.342260360717773, "global_step": 109006, "epoch": 2595} {"train_loss": -6.373554229736328, "global_step": 109007, "epoch": 2595} {"train_loss": -6.434181213378906, "global_step": 109008, "epoch": 2595} {"train_loss": -6.356432914733887, "global_step": 109009, "epoch": 2595} {"train_loss": -6.464262008666992, "global_step": 109010, "epoch": 2595} {"train_loss": -6.449660778045654, "global_step": 109011, "epoch": 2595} {"train_loss": -6.448385238647461, "global_step": 109012, "epoch": 2595} {"train_loss": -6.449087619781494, "global_step": 109013, "epoch": 2595} {"train_loss": -6.425583362579346, "global_step": 109014, "epoch": 2595} {"train_loss": -6.3488664627075195, "global_step": 109015, "epoch": 2595} {"train_loss": -6.357976913452148, "global_step": 109016, "epoch": 2595} {"train_loss": -6.4729695320129395, "global_step": 109017, "epoch": 2595} {"train_loss": -6.368057727813721, "global_step": 109018, "epoch": 2595} {"train_loss": -6.418067932128906, "global_step": 109019, "epoch": 2595} {"train_loss": -6.459066390991211, "global_step": 109020, "epoch": 2595} {"train_loss": -6.419635772705078, "global_step": 109021, "epoch": 2595} {"train_loss": -6.407038688659668, "global_step": 109022, "epoch": 2595} {"train_loss": -6.383522033691406, "global_step": 109023, "epoch": 2595} {"train_loss": -6.444470405578613, "global_step": 109024, "epoch": 2595} {"train_loss": -6.368947982788086, "global_step": 109025, "epoch": 2595} {"train_loss": -6.2823710441589355, "global_step": 109026, "epoch": 2595} {"train_loss": -6.482600688934326, "global_step": 109027, "epoch": 2595} {"train_loss": -6.330932140350342, "global_step": 109028, "epoch": 2595} {"train_loss": -6.276926040649414, "global_step": 109029, "epoch": 2595} {"train_loss": -6.335871696472168, "global_step": 109030, "epoch": 2595} {"train_loss": -6.409999052683513, "global_step": 109031, "epoch": 2595, "val_loss": 67663.0546875} {"train_loss": -6.446587085723877, "global_step": 109032, "epoch": 2596} {"train_loss": -6.474892616271973, "global_step": 109033, "epoch": 2596} {"train_loss": -6.4310712814331055, "global_step": 109034, "epoch": 2596} {"train_loss": -6.494115829467773, "global_step": 109035, "epoch": 2596} {"train_loss": -6.404375076293945, "global_step": 109036, "epoch": 2596} {"train_loss": -6.564438819885254, "global_step": 109037, "epoch": 2596} {"train_loss": -6.506987571716309, "global_step": 109038, "epoch": 2596} {"train_loss": -6.3289265632629395, "global_step": 109039, "epoch": 2596} {"train_loss": -6.427042007446289, "global_step": 109040, "epoch": 2596} {"train_loss": -6.362636566162109, "global_step": 109041, "epoch": 2596} {"train_loss": -6.464799880981445, "global_step": 109042, "epoch": 2596} {"train_loss": -6.500612258911133, "global_step": 109043, "epoch": 2596} {"train_loss": -6.481605529785156, "global_step": 109044, "epoch": 2596} {"train_loss": -6.310004234313965, "global_step": 109045, "epoch": 2596} {"train_loss": -6.528265953063965, "global_step": 109046, "epoch": 2596} {"train_loss": -6.439430236816406, "global_step": 109047, "epoch": 2596} {"train_loss": -6.393498420715332, "global_step": 109048, "epoch": 2596} {"train_loss": -6.5488691329956055, "global_step": 109049, "epoch": 2596} {"train_loss": -6.488021373748779, "global_step": 109050, "epoch": 2596} {"train_loss": -6.414762020111084, "global_step": 109051, "epoch": 2596} {"train_loss": -6.510195255279541, "global_step": 109052, "epoch": 2596} {"train_loss": -6.374709129333496, "global_step": 109053, "epoch": 2596} {"train_loss": -6.544560432434082, "global_step": 109054, "epoch": 2596} {"train_loss": -6.487286567687988, "global_step": 109055, "epoch": 2596} {"train_loss": -6.505270957946777, "global_step": 109056, "epoch": 2596} {"train_loss": -6.581742763519287, "global_step": 109057, "epoch": 2596} {"train_loss": -6.407922744750977, "global_step": 109058, "epoch": 2596} {"train_loss": -6.337008953094482, "global_step": 109059, "epoch": 2596} {"train_loss": -6.4395904541015625, "global_step": 109060, "epoch": 2596} {"train_loss": -6.397951126098633, "global_step": 109061, "epoch": 2596} {"train_loss": -6.407993316650391, "global_step": 109062, "epoch": 2596} {"train_loss": -6.406162261962891, "global_step": 109063, "epoch": 2596} {"train_loss": -6.460304260253906, "global_step": 109064, "epoch": 2596} {"train_loss": -6.333664417266846, "global_step": 109065, "epoch": 2596} {"train_loss": -6.369763374328613, "global_step": 109066, "epoch": 2596} {"train_loss": -6.299009323120117, "global_step": 109067, "epoch": 2596} {"train_loss": -6.330194473266602, "global_step": 109068, "epoch": 2596} {"train_loss": -6.389266014099121, "global_step": 109069, "epoch": 2596} {"train_loss": -6.288000583648682, "global_step": 109070, "epoch": 2596} {"train_loss": -6.434257507324219, "global_step": 109071, "epoch": 2596} {"train_loss": -6.255106449127197, "global_step": 109072, "epoch": 2596} {"train_loss": -6.425295341582525, "global_step": 109073, "epoch": 2596, "val_loss": 67975.171875} {"train_loss": -6.454074859619141, "global_step": 109074, "epoch": 2597} {"train_loss": -6.381486892700195, "global_step": 109075, "epoch": 2597} {"train_loss": -6.3724164962768555, "global_step": 109076, "epoch": 2597} {"train_loss": -6.224231243133545, "global_step": 109077, "epoch": 2597} {"train_loss": -6.36497688293457, "global_step": 109078, "epoch": 2597} {"train_loss": -6.397279739379883, "global_step": 109079, "epoch": 2597} {"train_loss": -6.3643598556518555, "global_step": 109080, "epoch": 2597} {"train_loss": -6.403826713562012, "global_step": 109081, "epoch": 2597} {"train_loss": -6.398859024047852, "global_step": 109082, "epoch": 2597} {"train_loss": -6.3824028968811035, "global_step": 109083, "epoch": 2597} {"train_loss": -6.437198162078857, "global_step": 109084, "epoch": 2597} {"train_loss": -6.470491409301758, "global_step": 109085, "epoch": 2597} {"train_loss": -6.383345127105713, "global_step": 109086, "epoch": 2597} {"train_loss": -6.324532985687256, "global_step": 109087, "epoch": 2597} {"train_loss": -6.352977752685547, "global_step": 109088, "epoch": 2597} {"train_loss": -6.3558526039123535, "global_step": 109089, "epoch": 2597} {"train_loss": -6.366086483001709, "global_step": 109090, "epoch": 2597} {"train_loss": -6.265032768249512, "global_step": 109091, "epoch": 2597} {"train_loss": -6.322998046875, "global_step": 109092, "epoch": 2597} {"train_loss": -6.408001899719238, "global_step": 109093, "epoch": 2597} {"train_loss": -6.495100975036621, "global_step": 109094, "epoch": 2597} {"train_loss": -6.515580177307129, "global_step": 109095, "epoch": 2597} {"train_loss": -6.48221492767334, "global_step": 109096, "epoch": 2597} {"train_loss": -6.4592671394348145, "global_step": 109097, "epoch": 2597} {"train_loss": -6.37168025970459, "global_step": 109098, "epoch": 2597} {"train_loss": -6.476130962371826, "global_step": 109099, "epoch": 2597} {"train_loss": -6.440601348876953, "global_step": 109100, "epoch": 2597} {"train_loss": -6.4702911376953125, "global_step": 109101, "epoch": 2597} {"train_loss": -6.571049690246582, "global_step": 109102, "epoch": 2597} {"train_loss": -6.411611557006836, "global_step": 109103, "epoch": 2597} {"train_loss": -6.536820888519287, "global_step": 109104, "epoch": 2597} {"train_loss": -6.457824230194092, "global_step": 109105, "epoch": 2597} {"train_loss": -6.437465667724609, "global_step": 109106, "epoch": 2597} {"train_loss": -6.354025363922119, "global_step": 109107, "epoch": 2597} {"train_loss": -6.506218910217285, "global_step": 109108, "epoch": 2597} {"train_loss": -6.417957305908203, "global_step": 109109, "epoch": 2597} {"train_loss": -6.429337024688721, "global_step": 109110, "epoch": 2597} {"train_loss": -6.305240631103516, "global_step": 109111, "epoch": 2597} {"train_loss": -6.36699104309082, "global_step": 109112, "epoch": 2597} {"train_loss": -6.411559104919434, "global_step": 109113, "epoch": 2597} {"train_loss": -6.3347625732421875, "global_step": 109114, "epoch": 2597} {"train_loss": -6.407883382978893, "global_step": 109115, "epoch": 2597, "val_loss": 67782.859375} {"train_loss": -6.4007744789123535, "global_step": 109116, "epoch": 2598} {"train_loss": -6.367526531219482, "global_step": 109117, "epoch": 2598} {"train_loss": -6.297163009643555, "global_step": 109118, "epoch": 2598} {"train_loss": -6.364850044250488, "global_step": 109119, "epoch": 2598} {"train_loss": -6.3354105949401855, "global_step": 109120, "epoch": 2598} {"train_loss": -6.381295680999756, "global_step": 109121, "epoch": 2598} {"train_loss": -6.385627746582031, "global_step": 109122, "epoch": 2598} {"train_loss": -6.355325698852539, "global_step": 109123, "epoch": 2598} {"train_loss": -6.414931297302246, "global_step": 109124, "epoch": 2598} {"train_loss": -6.328629970550537, "global_step": 109125, "epoch": 2598} {"train_loss": -6.373327732086182, "global_step": 109126, "epoch": 2598} {"train_loss": -6.4265971183776855, "global_step": 109127, "epoch": 2598} {"train_loss": -6.30843448638916, "global_step": 109128, "epoch": 2598} {"train_loss": -6.381999492645264, "global_step": 109129, "epoch": 2598} {"train_loss": -6.503716468811035, "global_step": 109130, "epoch": 2598} {"train_loss": -6.451904296875, "global_step": 109131, "epoch": 2598} {"train_loss": -6.437711715698242, "global_step": 109132, "epoch": 2598} {"train_loss": -6.323701858520508, "global_step": 109133, "epoch": 2598} {"train_loss": -6.433326721191406, "global_step": 109134, "epoch": 2598} {"train_loss": -6.338515281677246, "global_step": 109135, "epoch": 2598} {"train_loss": -6.459761619567871, "global_step": 109136, "epoch": 2598} {"train_loss": -6.506917953491211, "global_step": 109137, "epoch": 2598} {"train_loss": -6.406866073608398, "global_step": 109138, "epoch": 2598} {"train_loss": -6.328402519226074, "global_step": 109139, "epoch": 2598} {"train_loss": -6.458432197570801, "global_step": 109140, "epoch": 2598} {"train_loss": -6.357800483703613, "global_step": 109141, "epoch": 2598} {"train_loss": -6.420441150665283, "global_step": 109142, "epoch": 2598} {"train_loss": -6.3871355056762695, "global_step": 109143, "epoch": 2598} {"train_loss": -6.434511184692383, "global_step": 109144, "epoch": 2598} {"train_loss": -6.442174911499023, "global_step": 109145, "epoch": 2598} {"train_loss": -6.347626209259033, "global_step": 109146, "epoch": 2598} {"train_loss": -6.435033321380615, "global_step": 109147, "epoch": 2598} {"train_loss": -6.329617023468018, "global_step": 109148, "epoch": 2598} {"train_loss": -6.401710033416748, "global_step": 109149, "epoch": 2598} {"train_loss": -6.450430393218994, "global_step": 109150, "epoch": 2598} {"train_loss": -6.326610565185547, "global_step": 109151, "epoch": 2598} {"train_loss": -6.386905670166016, "global_step": 109152, "epoch": 2598} {"train_loss": -6.533872604370117, "global_step": 109153, "epoch": 2598} {"train_loss": -6.319282054901123, "global_step": 109154, "epoch": 2598} {"train_loss": -6.473818302154541, "global_step": 109155, "epoch": 2598} {"train_loss": -6.299837589263916, "global_step": 109156, "epoch": 2598} {"train_loss": -6.393877438136509, "global_step": 109157, "epoch": 2598, "val_loss": 67834.953125} {"train_loss": -6.515448093414307, "global_step": 109158, "epoch": 2599} {"train_loss": -6.2434868812561035, "global_step": 109159, "epoch": 2599} {"train_loss": -6.481980323791504, "global_step": 109160, "epoch": 2599} {"train_loss": -6.3765740394592285, "global_step": 109161, "epoch": 2599} {"train_loss": -6.359797477722168, "global_step": 109162, "epoch": 2599} {"train_loss": -6.518096446990967, "global_step": 109163, "epoch": 2599} {"train_loss": -6.404969215393066, "global_step": 109164, "epoch": 2599} {"train_loss": -6.486179828643799, "global_step": 109165, "epoch": 2599} {"train_loss": -6.532242298126221, "global_step": 109166, "epoch": 2599} {"train_loss": -6.391770839691162, "global_step": 109167, "epoch": 2599} {"train_loss": -6.368049144744873, "global_step": 109168, "epoch": 2599} {"train_loss": -6.45094108581543, "global_step": 109169, "epoch": 2599} {"train_loss": -6.4154462814331055, "global_step": 109170, "epoch": 2599} {"train_loss": -6.528460502624512, "global_step": 109171, "epoch": 2599} {"train_loss": -6.379420280456543, "global_step": 109172, "epoch": 2599} {"train_loss": -6.386105060577393, "global_step": 109173, "epoch": 2599} {"train_loss": -6.4876837730407715, "global_step": 109174, "epoch": 2599} {"train_loss": -6.534317493438721, "global_step": 109175, "epoch": 2599} {"train_loss": -6.374292373657227, "global_step": 109176, "epoch": 2599} {"train_loss": -6.517102241516113, "global_step": 109177, "epoch": 2599} {"train_loss": -6.173340320587158, "global_step": 109178, "epoch": 2599} {"train_loss": -6.463230609893799, "global_step": 109179, "epoch": 2599} {"train_loss": -6.529912948608398, "global_step": 109180, "epoch": 2599} {"train_loss": -6.493383407592773, "global_step": 109181, "epoch": 2599} {"train_loss": -6.552502632141113, "global_step": 109182, "epoch": 2599} {"train_loss": -6.443682670593262, "global_step": 109183, "epoch": 2599} {"train_loss": -6.587678909301758, "global_step": 109184, "epoch": 2599} {"train_loss": -6.421905517578125, "global_step": 109185, "epoch": 2599} {"train_loss": -6.454532146453857, "global_step": 109186, "epoch": 2599} {"train_loss": -6.435706615447998, "global_step": 109187, "epoch": 2599} {"train_loss": -6.312987804412842, "global_step": 109188, "epoch": 2599} {"train_loss": -6.484140872955322, "global_step": 109189, "epoch": 2599} {"train_loss": -6.510447978973389, "global_step": 109190, "epoch": 2599} {"train_loss": -6.364360809326172, "global_step": 109191, "epoch": 2599} {"train_loss": -6.438112258911133, "global_step": 109192, "epoch": 2599} {"train_loss": -6.394352912902832, "global_step": 109193, "epoch": 2599} {"train_loss": -6.388620376586914, "global_step": 109194, "epoch": 2599} {"train_loss": -6.513409614562988, "global_step": 109195, "epoch": 2599} {"train_loss": -6.436732769012451, "global_step": 109196, "epoch": 2599} {"train_loss": -6.484860420227051, "global_step": 109197, "epoch": 2599} {"train_loss": -6.3912858963012695, "global_step": 109198, "epoch": 2599} {"train_loss": -6.438535145350865, "global_step": 109199, "epoch": 2599, "val_loss": 67997.6171875} {"train_loss": -6.3112993240356445, "global_step": 109200, "epoch": 2600} {"train_loss": -6.321997165679932, "global_step": 109201, "epoch": 2600} {"train_loss": -6.455862045288086, "global_step": 109202, "epoch": 2600} {"train_loss": -6.370437145233154, "global_step": 109203, "epoch": 2600} {"train_loss": -6.456007957458496, "global_step": 109204, "epoch": 2600} {"train_loss": -6.411070823669434, "global_step": 109205, "epoch": 2600} {"train_loss": -6.532435417175293, "global_step": 109206, "epoch": 2600} {"train_loss": -6.466699600219727, "global_step": 109207, "epoch": 2600} {"train_loss": -6.479764461517334, "global_step": 109208, "epoch": 2600} {"train_loss": -6.55192756652832, "global_step": 109209, "epoch": 2600} {"train_loss": -6.528573036193848, "global_step": 109210, "epoch": 2600} {"train_loss": -6.352187156677246, "global_step": 109211, "epoch": 2600} {"train_loss": -6.425124645233154, "global_step": 109212, "epoch": 2600} {"train_loss": -6.374877452850342, "global_step": 109213, "epoch": 2600} {"train_loss": -6.369345188140869, "global_step": 109214, "epoch": 2600} {"train_loss": -6.4876251220703125, "global_step": 109215, "epoch": 2600} {"train_loss": -6.429381370544434, "global_step": 109216, "epoch": 2600} {"train_loss": -6.402588844299316, "global_step": 109217, "epoch": 2600} {"train_loss": -6.536170959472656, "global_step": 109218, "epoch": 2600} {"train_loss": -6.48730993270874, "global_step": 109219, "epoch": 2600} {"train_loss": -6.464786529541016, "global_step": 109220, "epoch": 2600} {"train_loss": -6.378512382507324, "global_step": 109221, "epoch": 2600} {"train_loss": -6.543717384338379, "global_step": 109222, "epoch": 2600} {"train_loss": -6.39719820022583, "global_step": 109223, "epoch": 2600} {"train_loss": -6.417284965515137, "global_step": 109224, "epoch": 2600} {"train_loss": -6.47999382019043, "global_step": 109225, "epoch": 2600} {"train_loss": -6.358017921447754, "global_step": 109226, "epoch": 2600} {"train_loss": -6.456110954284668, "global_step": 109227, "epoch": 2600} {"train_loss": -6.40242862701416, "global_step": 109228, "epoch": 2600} {"train_loss": -6.463423252105713, "global_step": 109229, "epoch": 2600} {"train_loss": -6.375984191894531, "global_step": 109230, "epoch": 2600} {"train_loss": -6.468923568725586, "global_step": 109231, "epoch": 2600} {"train_loss": -6.396383762359619, "global_step": 109232, "epoch": 2600} {"train_loss": -6.388819694519043, "global_step": 109233, "epoch": 2600} {"train_loss": -6.378948211669922, "global_step": 109234, "epoch": 2600} {"train_loss": -6.349161624908447, "global_step": 109235, "epoch": 2600} {"train_loss": -6.405717372894287, "global_step": 109236, "epoch": 2600} {"train_loss": -6.408146381378174, "global_step": 109237, "epoch": 2600} {"train_loss": -6.398435592651367, "global_step": 109238, "epoch": 2600} {"train_loss": -6.35317325592041, "global_step": 109239, "epoch": 2600} {"train_loss": -6.436129570007324, "global_step": 109240, "epoch": 2600} {"train_loss": -6.42891214007423, "global_step": 109241, "epoch": 2600, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.9399916896164466, "train/sim_max_reward_2": 0.4449860194627369, "train/sim_max_reward_3": 0.1414524487276667, "train/sim_max_reward_4": 0.8621137789624197, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.9379545225487729, "test/sim_max_reward_4400001": 0.21606196284229473, "test/sim_max_reward_4400002": 0.8149359918525473, "test/sim_max_reward_4400003": 0.5899574859993117, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3840831206000084, "test/sim_max_reward_4400006": 0.9439321171040547, "test/sim_max_reward_4400007": 0.8415161447450785, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.8353103839885444, "test/sim_max_reward_4400010": 0.5442108604034237, "test/sim_max_reward_4400011": 0.4876135872881336, "test/sim_max_reward_4400012": 0.9576328147548777, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.7812145581934062, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.15893163025174137, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.22704069058083765, "test/sim_max_reward_4400019": 0.38822859772132806, "test/sim_max_reward_4400020": 9.053692637229422e-05, "test/sim_max_reward_4400021": 0.31018381833679926, "test/sim_max_reward_4400022": 0.7338291814880239, "test/sim_max_reward_4400023": 0.4074450843844163, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.259869906851199, "test/sim_max_reward_4400026": 0.759897930045327, "test/sim_max_reward_4400027": 0.010542989454110587, "test/sim_max_reward_4400028": 0.4358957397887104, "test/sim_max_reward_4400029": 3.31207173812906e-05, "test/sim_max_reward_4400030": 0.9517126043929457, "test/sim_max_reward_4400031": 0.9559071655788591, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.39969753755211407, "test/sim_max_reward_4400034": 0.8169108139590069, "test/sim_max_reward_4400035": 0.46496911844843114, "test/sim_max_reward_4400036": 0.8167912310731016, "test/sim_max_reward_4400037": 0.967421810582191, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9810219530155593, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.854366423848014, "test/sim_max_reward_4400042": 0.6478148723810403, "test/sim_max_reward_4400043": 0.9945468860794074, "test/sim_max_reward_4400044": 0.8963946718788283, "test/sim_max_reward_4400045": 0.5775414091312889, "test/sim_max_reward_4400046": 0.9388829356441595, "test/sim_max_reward_4400047": 0.9784078974403841, "test/sim_max_reward_4400048": 0.849078533949514, "test/sim_max_reward_4400049": 0.677126957704697, "train/mean_score": 0.46197103212291823, "test/mean_score": 0.5672224764344799, "val_loss": 67912.5703125} {"train_loss": -6.37923526763916, "global_step": 109242, "epoch": 2601} {"train_loss": -6.381601333618164, "global_step": 109243, "epoch": 2601} {"train_loss": -6.490952491760254, "global_step": 109244, "epoch": 2601} {"train_loss": -6.5158281326293945, "global_step": 109245, "epoch": 2601} {"train_loss": -6.39321231842041, "global_step": 109246, "epoch": 2601} {"train_loss": -6.426048755645752, "global_step": 109247, "epoch": 2601} {"train_loss": -6.4185943603515625, "global_step": 109248, "epoch": 2601} {"train_loss": -6.375873565673828, "global_step": 109249, "epoch": 2601} {"train_loss": -6.4599289894104, "global_step": 109250, "epoch": 2601} {"train_loss": -6.470178604125977, "global_step": 109251, "epoch": 2601} {"train_loss": -6.387153625488281, "global_step": 109252, "epoch": 2601} {"train_loss": -6.413320541381836, "global_step": 109253, "epoch": 2601} {"train_loss": -6.304187297821045, "global_step": 109254, "epoch": 2601} {"train_loss": -6.4648213386535645, "global_step": 109255, "epoch": 2601} {"train_loss": -6.493697166442871, "global_step": 109256, "epoch": 2601} {"train_loss": -6.498579502105713, "global_step": 109257, "epoch": 2601} {"train_loss": -6.5218095779418945, "global_step": 109258, "epoch": 2601} {"train_loss": -6.5977935791015625, "global_step": 109259, "epoch": 2601} {"train_loss": -6.423295021057129, "global_step": 109260, "epoch": 2601} {"train_loss": -6.434678077697754, "global_step": 109261, "epoch": 2601} {"train_loss": -6.458016395568848, "global_step": 109262, "epoch": 2601} {"train_loss": -6.430758953094482, "global_step": 109263, "epoch": 2601} {"train_loss": -6.468605995178223, "global_step": 109264, "epoch": 2601} {"train_loss": -6.463479042053223, "global_step": 109265, "epoch": 2601} {"train_loss": -6.458291053771973, "global_step": 109266, "epoch": 2601} {"train_loss": -6.373957633972168, "global_step": 109267, "epoch": 2601} {"train_loss": -6.4104509353637695, "global_step": 109268, "epoch": 2601} {"train_loss": -6.5035481452941895, "global_step": 109269, "epoch": 2601} {"train_loss": -6.47304630279541, "global_step": 109270, "epoch": 2601} {"train_loss": -6.474990367889404, "global_step": 109271, "epoch": 2601} {"train_loss": -6.386989593505859, "global_step": 109272, "epoch": 2601} {"train_loss": -6.393592834472656, "global_step": 109273, "epoch": 2601} {"train_loss": -6.3578782081604, "global_step": 109274, "epoch": 2601} {"train_loss": -6.325416088104248, "global_step": 109275, "epoch": 2601} {"train_loss": -6.483987808227539, "global_step": 109276, "epoch": 2601} {"train_loss": -6.392943859100342, "global_step": 109277, "epoch": 2601} {"train_loss": -6.331233978271484, "global_step": 109278, "epoch": 2601} {"train_loss": -6.4075822830200195, "global_step": 109279, "epoch": 2601} {"train_loss": -6.514441967010498, "global_step": 109280, "epoch": 2601} {"train_loss": -6.553076267242432, "global_step": 109281, "epoch": 2601} {"train_loss": -6.450498580932617, "global_step": 109282, "epoch": 2601} {"train_loss": -6.437647478921073, "global_step": 109283, "epoch": 2601, "val_loss": 67770.078125} {"train_loss": -6.533682823181152, "global_step": 109284, "epoch": 2602} {"train_loss": -6.427650451660156, "global_step": 109285, "epoch": 2602} {"train_loss": -6.463895797729492, "global_step": 109286, "epoch": 2602} {"train_loss": -6.474434852600098, "global_step": 109287, "epoch": 2602} {"train_loss": -6.494108200073242, "global_step": 109288, "epoch": 2602} {"train_loss": -6.338684558868408, "global_step": 109289, "epoch": 2602} {"train_loss": -6.44844913482666, "global_step": 109290, "epoch": 2602} {"train_loss": -6.506397724151611, "global_step": 109291, "epoch": 2602} {"train_loss": -6.454486846923828, "global_step": 109292, "epoch": 2602} {"train_loss": -6.502718925476074, "global_step": 109293, "epoch": 2602} {"train_loss": -6.485928535461426, "global_step": 109294, "epoch": 2602} {"train_loss": -6.524043083190918, "global_step": 109295, "epoch": 2602} {"train_loss": -6.528906345367432, "global_step": 109296, "epoch": 2602} {"train_loss": -6.412937164306641, "global_step": 109297, "epoch": 2602} {"train_loss": -6.471363067626953, "global_step": 109298, "epoch": 2602} {"train_loss": -6.489651679992676, "global_step": 109299, "epoch": 2602} {"train_loss": -6.400524139404297, "global_step": 109300, "epoch": 2602} {"train_loss": -6.4433393478393555, "global_step": 109301, "epoch": 2602} {"train_loss": -6.452441215515137, "global_step": 109302, "epoch": 2602} {"train_loss": -6.441621780395508, "global_step": 109303, "epoch": 2602} {"train_loss": -6.436434745788574, "global_step": 109304, "epoch": 2602} {"train_loss": -6.5075483322143555, "global_step": 109305, "epoch": 2602} {"train_loss": -6.538208961486816, "global_step": 109306, "epoch": 2602} {"train_loss": -6.504344463348389, "global_step": 109307, "epoch": 2602} {"train_loss": -6.486758232116699, "global_step": 109308, "epoch": 2602} {"train_loss": -6.356827735900879, "global_step": 109309, "epoch": 2602} {"train_loss": -6.429097652435303, "global_step": 109310, "epoch": 2602} {"train_loss": -6.417407989501953, "global_step": 109311, "epoch": 2602} {"train_loss": -6.407352447509766, "global_step": 109312, "epoch": 2602} {"train_loss": -6.493803977966309, "global_step": 109313, "epoch": 2602} {"train_loss": -6.3605852127075195, "global_step": 109314, "epoch": 2602} {"train_loss": -6.441433429718018, "global_step": 109315, "epoch": 2602} {"train_loss": -6.415297508239746, "global_step": 109316, "epoch": 2602} {"train_loss": -6.382651329040527, "global_step": 109317, "epoch": 2602} {"train_loss": -6.423988342285156, "global_step": 109318, "epoch": 2602} {"train_loss": -6.558788299560547, "global_step": 109319, "epoch": 2602} {"train_loss": -6.357853889465332, "global_step": 109320, "epoch": 2602} {"train_loss": -6.446394920349121, "global_step": 109321, "epoch": 2602} {"train_loss": -6.375840663909912, "global_step": 109322, "epoch": 2602} {"train_loss": -6.425694465637207, "global_step": 109323, "epoch": 2602} {"train_loss": -6.413270950317383, "global_step": 109324, "epoch": 2602} {"train_loss": -6.450921319779896, "global_step": 109325, "epoch": 2602, "val_loss": 67794.8125} {"train_loss": -6.364463806152344, "global_step": 109326, "epoch": 2603} {"train_loss": -6.34796142578125, "global_step": 109327, "epoch": 2603} {"train_loss": -6.42444372177124, "global_step": 109328, "epoch": 2603} {"train_loss": -6.500883102416992, "global_step": 109329, "epoch": 2603} {"train_loss": -6.443674087524414, "global_step": 109330, "epoch": 2603} {"train_loss": -6.425939083099365, "global_step": 109331, "epoch": 2603} {"train_loss": -6.579537391662598, "global_step": 109332, "epoch": 2603} {"train_loss": -6.369844913482666, "global_step": 109333, "epoch": 2603} {"train_loss": -6.407318592071533, "global_step": 109334, "epoch": 2603} {"train_loss": -6.372926235198975, "global_step": 109335, "epoch": 2603} {"train_loss": -6.272014617919922, "global_step": 109336, "epoch": 2603} {"train_loss": -6.44652795791626, "global_step": 109337, "epoch": 2603} {"train_loss": -6.405771255493164, "global_step": 109338, "epoch": 2603} {"train_loss": -6.3750224113464355, "global_step": 109339, "epoch": 2603} {"train_loss": -6.3972978591918945, "global_step": 109340, "epoch": 2603} {"train_loss": -6.405341625213623, "global_step": 109341, "epoch": 2603} {"train_loss": -6.440643310546875, "global_step": 109342, "epoch": 2603} {"train_loss": -6.459445476531982, "global_step": 109343, "epoch": 2603} {"train_loss": -6.365859031677246, "global_step": 109344, "epoch": 2603} {"train_loss": -6.522245407104492, "global_step": 109345, "epoch": 2603} {"train_loss": -6.5565185546875, "global_step": 109346, "epoch": 2603} {"train_loss": -6.357142448425293, "global_step": 109347, "epoch": 2603} {"train_loss": -6.556902885437012, "global_step": 109348, "epoch": 2603} {"train_loss": -6.394709587097168, "global_step": 109349, "epoch": 2603} {"train_loss": -6.448759078979492, "global_step": 109350, "epoch": 2603} {"train_loss": -6.527642250061035, "global_step": 109351, "epoch": 2603} {"train_loss": -6.446825981140137, "global_step": 109352, "epoch": 2603} {"train_loss": -6.623237609863281, "global_step": 109353, "epoch": 2603} {"train_loss": -6.360257625579834, "global_step": 109354, "epoch": 2603} {"train_loss": -6.506641387939453, "global_step": 109355, "epoch": 2603} {"train_loss": -6.451046943664551, "global_step": 109356, "epoch": 2603} {"train_loss": -6.3184051513671875, "global_step": 109357, "epoch": 2603} {"train_loss": -6.384788990020752, "global_step": 109358, "epoch": 2603} {"train_loss": -6.385465621948242, "global_step": 109359, "epoch": 2603} {"train_loss": -6.515235900878906, "global_step": 109360, "epoch": 2603} {"train_loss": -6.425037384033203, "global_step": 109361, "epoch": 2603} {"train_loss": -6.417285919189453, "global_step": 109362, "epoch": 2603} {"train_loss": -6.480001449584961, "global_step": 109363, "epoch": 2603} {"train_loss": -6.469815731048584, "global_step": 109364, "epoch": 2603} {"train_loss": -6.4136762619018555, "global_step": 109365, "epoch": 2603} {"train_loss": -6.541119575500488, "global_step": 109366, "epoch": 2603} {"train_loss": -6.436764864694505, "global_step": 109367, "epoch": 2603, "val_loss": 67789.1015625} {"train_loss": -6.330897808074951, "global_step": 109368, "epoch": 2604} {"train_loss": -6.35650634765625, "global_step": 109369, "epoch": 2604} {"train_loss": -6.438939094543457, "global_step": 109370, "epoch": 2604} {"train_loss": -6.357247352600098, "global_step": 109371, "epoch": 2604} {"train_loss": -6.451933860778809, "global_step": 109372, "epoch": 2604} {"train_loss": -6.504759788513184, "global_step": 109373, "epoch": 2604} {"train_loss": -6.398344039916992, "global_step": 109374, "epoch": 2604} {"train_loss": -6.364120960235596, "global_step": 109375, "epoch": 2604} {"train_loss": -6.381645679473877, "global_step": 109376, "epoch": 2604} {"train_loss": -6.306187152862549, "global_step": 109377, "epoch": 2604} {"train_loss": -6.409808158874512, "global_step": 109378, "epoch": 2604} {"train_loss": -6.43085241317749, "global_step": 109379, "epoch": 2604} {"train_loss": -6.336764335632324, "global_step": 109380, "epoch": 2604} {"train_loss": -6.497858047485352, "global_step": 109381, "epoch": 2604} {"train_loss": -6.3806257247924805, "global_step": 109382, "epoch": 2604} {"train_loss": -6.406163215637207, "global_step": 109383, "epoch": 2604} {"train_loss": -6.428184509277344, "global_step": 109384, "epoch": 2604} {"train_loss": -6.454707145690918, "global_step": 109385, "epoch": 2604} {"train_loss": -6.4091081619262695, "global_step": 109386, "epoch": 2604} {"train_loss": -6.316275596618652, "global_step": 109387, "epoch": 2604} {"train_loss": -6.410700798034668, "global_step": 109388, "epoch": 2604} {"train_loss": -6.357536315917969, "global_step": 109389, "epoch": 2604} {"train_loss": -6.501828193664551, "global_step": 109390, "epoch": 2604} {"train_loss": -6.341405868530273, "global_step": 109391, "epoch": 2604} {"train_loss": -6.403996467590332, "global_step": 109392, "epoch": 2604} {"train_loss": -6.448546409606934, "global_step": 109393, "epoch": 2604} {"train_loss": -6.370176315307617, "global_step": 109394, "epoch": 2604} {"train_loss": -6.50786018371582, "global_step": 109395, "epoch": 2604} {"train_loss": -6.396207332611084, "global_step": 109396, "epoch": 2604} {"train_loss": -6.364674091339111, "global_step": 109397, "epoch": 2604} {"train_loss": -6.544773578643799, "global_step": 109398, "epoch": 2604} {"train_loss": -6.362872123718262, "global_step": 109399, "epoch": 2604} {"train_loss": -6.379990577697754, "global_step": 109400, "epoch": 2604} {"train_loss": -6.402750492095947, "global_step": 109401, "epoch": 2604} {"train_loss": -6.408189296722412, "global_step": 109402, "epoch": 2604} {"train_loss": -6.434720039367676, "global_step": 109403, "epoch": 2604} {"train_loss": -6.419808864593506, "global_step": 109404, "epoch": 2604} {"train_loss": -6.371232986450195, "global_step": 109405, "epoch": 2604} {"train_loss": -6.41249942779541, "global_step": 109406, "epoch": 2604} {"train_loss": -6.394794464111328, "global_step": 109407, "epoch": 2604} {"train_loss": -6.507444381713867, "global_step": 109408, "epoch": 2604} {"train_loss": -6.406011899312337, "global_step": 109409, "epoch": 2604, "val_loss": 67841.6484375} {"train_loss": -6.375374794006348, "global_step": 109410, "epoch": 2605} {"train_loss": -6.437075614929199, "global_step": 109411, "epoch": 2605} {"train_loss": -6.427402496337891, "global_step": 109412, "epoch": 2605} {"train_loss": -6.327532768249512, "global_step": 109413, "epoch": 2605} {"train_loss": -6.227553367614746, "global_step": 109414, "epoch": 2605} {"train_loss": -6.385305404663086, "global_step": 109415, "epoch": 2605} {"train_loss": -6.42531681060791, "global_step": 109416, "epoch": 2605} {"train_loss": -6.39011287689209, "global_step": 109417, "epoch": 2605} {"train_loss": -6.386157035827637, "global_step": 109418, "epoch": 2605} {"train_loss": -6.405505180358887, "global_step": 109419, "epoch": 2605} {"train_loss": -6.541485786437988, "global_step": 109420, "epoch": 2605} {"train_loss": -6.400870323181152, "global_step": 109421, "epoch": 2605} {"train_loss": -6.327803611755371, "global_step": 109422, "epoch": 2605} {"train_loss": -6.528709411621094, "global_step": 109423, "epoch": 2605} {"train_loss": -6.3391876220703125, "global_step": 109424, "epoch": 2605} {"train_loss": -6.462124824523926, "global_step": 109425, "epoch": 2605} {"train_loss": -6.295820236206055, "global_step": 109426, "epoch": 2605} {"train_loss": -6.572844505310059, "global_step": 109427, "epoch": 2605} {"train_loss": -6.305666923522949, "global_step": 109428, "epoch": 2605} {"train_loss": -6.259653568267822, "global_step": 109429, "epoch": 2605} {"train_loss": -6.410192489624023, "global_step": 109430, "epoch": 2605} {"train_loss": -6.1577324867248535, "global_step": 109431, "epoch": 2605} {"train_loss": -6.378620147705078, "global_step": 109432, "epoch": 2605} {"train_loss": -6.1992902755737305, "global_step": 109433, "epoch": 2605} {"train_loss": -6.384960174560547, "global_step": 109434, "epoch": 2605} {"train_loss": -6.38169002532959, "global_step": 109435, "epoch": 2605} {"train_loss": -6.296795845031738, "global_step": 109436, "epoch": 2605} {"train_loss": -6.368633270263672, "global_step": 109437, "epoch": 2605} {"train_loss": -6.372378826141357, "global_step": 109438, "epoch": 2605} {"train_loss": -6.371238708496094, "global_step": 109439, "epoch": 2605} {"train_loss": -6.322144508361816, "global_step": 109440, "epoch": 2605} {"train_loss": -6.276650428771973, "global_step": 109441, "epoch": 2605} {"train_loss": -6.346770763397217, "global_step": 109442, "epoch": 2605} {"train_loss": -6.475890159606934, "global_step": 109443, "epoch": 2605} {"train_loss": -6.467708110809326, "global_step": 109444, "epoch": 2605} {"train_loss": -6.411160469055176, "global_step": 109445, "epoch": 2605} {"train_loss": -6.335048675537109, "global_step": 109446, "epoch": 2605} {"train_loss": -6.3878374099731445, "global_step": 109447, "epoch": 2605} {"train_loss": -6.40158748626709, "global_step": 109448, "epoch": 2605} {"train_loss": -6.520459175109863, "global_step": 109449, "epoch": 2605} {"train_loss": -6.522693634033203, "global_step": 109450, "epoch": 2605} {"train_loss": -6.3834046976906915, "global_step": 109451, "epoch": 2605, "val_loss": 67494.6640625} {"train_loss": -6.556605339050293, "global_step": 109452, "epoch": 2606} {"train_loss": -6.480672836303711, "global_step": 109453, "epoch": 2606} {"train_loss": -6.411323547363281, "global_step": 109454, "epoch": 2606} {"train_loss": -6.451728820800781, "global_step": 109455, "epoch": 2606} {"train_loss": -6.380289077758789, "global_step": 109456, "epoch": 2606} {"train_loss": -6.41573429107666, "global_step": 109457, "epoch": 2606} {"train_loss": -6.511903285980225, "global_step": 109458, "epoch": 2606} {"train_loss": -6.352425575256348, "global_step": 109459, "epoch": 2606} {"train_loss": -6.465217113494873, "global_step": 109460, "epoch": 2606} {"train_loss": -6.4841766357421875, "global_step": 109461, "epoch": 2606} {"train_loss": -6.3748064041137695, "global_step": 109462, "epoch": 2606} {"train_loss": -6.355617523193359, "global_step": 109463, "epoch": 2606} {"train_loss": -6.321323394775391, "global_step": 109464, "epoch": 2606} {"train_loss": -6.389194965362549, "global_step": 109465, "epoch": 2606} {"train_loss": -6.484501361846924, "global_step": 109466, "epoch": 2606} {"train_loss": -6.23438835144043, "global_step": 109467, "epoch": 2606} {"train_loss": -6.324124336242676, "global_step": 109468, "epoch": 2606} {"train_loss": -6.414311408996582, "global_step": 109469, "epoch": 2606} {"train_loss": -6.342580795288086, "global_step": 109470, "epoch": 2606} {"train_loss": -6.559793949127197, "global_step": 109471, "epoch": 2606} {"train_loss": -6.245922088623047, "global_step": 109472, "epoch": 2606} {"train_loss": -6.323821067810059, "global_step": 109473, "epoch": 2606} {"train_loss": -6.248764991760254, "global_step": 109474, "epoch": 2606} {"train_loss": -6.315423965454102, "global_step": 109475, "epoch": 2606} {"train_loss": -6.344085693359375, "global_step": 109476, "epoch": 2606} {"train_loss": -6.419963836669922, "global_step": 109477, "epoch": 2606} {"train_loss": -6.344853401184082, "global_step": 109478, "epoch": 2606} {"train_loss": -6.268411159515381, "global_step": 109479, "epoch": 2606} {"train_loss": -6.391256332397461, "global_step": 109480, "epoch": 2606} {"train_loss": -6.3663482666015625, "global_step": 109481, "epoch": 2606} {"train_loss": -6.326155662536621, "global_step": 109482, "epoch": 2606} {"train_loss": -6.290791034698486, "global_step": 109483, "epoch": 2606} {"train_loss": -6.385235786437988, "global_step": 109484, "epoch": 2606} {"train_loss": -6.445406436920166, "global_step": 109485, "epoch": 2606} {"train_loss": -6.396294593811035, "global_step": 109486, "epoch": 2606} {"train_loss": -6.402733325958252, "global_step": 109487, "epoch": 2606} {"train_loss": -6.436382293701172, "global_step": 109488, "epoch": 2606} {"train_loss": -6.356123924255371, "global_step": 109489, "epoch": 2606} {"train_loss": -6.5323076248168945, "global_step": 109490, "epoch": 2606} {"train_loss": -6.466925621032715, "global_step": 109491, "epoch": 2606} {"train_loss": -6.459915637969971, "global_step": 109492, "epoch": 2606} {"train_loss": -6.391667524973552, "global_step": 109493, "epoch": 2606, "val_loss": 68009.5234375} {"train_loss": -6.480310440063477, "global_step": 109494, "epoch": 2607} {"train_loss": -6.371920585632324, "global_step": 109495, "epoch": 2607} {"train_loss": -6.38608455657959, "global_step": 109496, "epoch": 2607} {"train_loss": -6.454955101013184, "global_step": 109497, "epoch": 2607} {"train_loss": -6.431751728057861, "global_step": 109498, "epoch": 2607} {"train_loss": -6.399359703063965, "global_step": 109499, "epoch": 2607} {"train_loss": -6.365860939025879, "global_step": 109500, "epoch": 2607} {"train_loss": -6.372325897216797, "global_step": 109501, "epoch": 2607} {"train_loss": -6.4418864250183105, "global_step": 109502, "epoch": 2607} {"train_loss": -6.445892333984375, "global_step": 109503, "epoch": 2607} {"train_loss": -6.502167224884033, "global_step": 109504, "epoch": 2607} {"train_loss": -6.529608726501465, "global_step": 109505, "epoch": 2607} {"train_loss": -6.51475191116333, "global_step": 109506, "epoch": 2607} {"train_loss": -6.522390365600586, "global_step": 109507, "epoch": 2607} {"train_loss": -6.3954057693481445, "global_step": 109508, "epoch": 2607} {"train_loss": -6.31904411315918, "global_step": 109509, "epoch": 2607} {"train_loss": -6.4595537185668945, "global_step": 109510, "epoch": 2607} {"train_loss": -6.4159674644470215, "global_step": 109511, "epoch": 2607} {"train_loss": -6.531399726867676, "global_step": 109512, "epoch": 2607} {"train_loss": -6.48552131652832, "global_step": 109513, "epoch": 2607} {"train_loss": -6.473456382751465, "global_step": 109514, "epoch": 2607} {"train_loss": -6.604338645935059, "global_step": 109515, "epoch": 2607} {"train_loss": -6.327670574188232, "global_step": 109516, "epoch": 2607} {"train_loss": -6.440548419952393, "global_step": 109517, "epoch": 2607} {"train_loss": -6.535007476806641, "global_step": 109518, "epoch": 2607} {"train_loss": -6.541049003601074, "global_step": 109519, "epoch": 2607} {"train_loss": -6.554066181182861, "global_step": 109520, "epoch": 2607} {"train_loss": -6.389686584472656, "global_step": 109521, "epoch": 2607} {"train_loss": -6.521737098693848, "global_step": 109522, "epoch": 2607} {"train_loss": -6.567164421081543, "global_step": 109523, "epoch": 2607} {"train_loss": -6.457119941711426, "global_step": 109524, "epoch": 2607} {"train_loss": -6.471091270446777, "global_step": 109525, "epoch": 2607} {"train_loss": -6.441925048828125, "global_step": 109526, "epoch": 2607} {"train_loss": -6.3885321617126465, "global_step": 109527, "epoch": 2607} {"train_loss": -6.428207874298096, "global_step": 109528, "epoch": 2607} {"train_loss": -6.382129669189453, "global_step": 109529, "epoch": 2607} {"train_loss": -6.468886852264404, "global_step": 109530, "epoch": 2607} {"train_loss": -6.447957992553711, "global_step": 109531, "epoch": 2607} {"train_loss": -6.352721214294434, "global_step": 109532, "epoch": 2607} {"train_loss": -6.469590663909912, "global_step": 109533, "epoch": 2607} {"train_loss": -6.403984069824219, "global_step": 109534, "epoch": 2607} {"train_loss": -6.4507116703760055, "global_step": 109535, "epoch": 2607, "val_loss": 67912.9921875} {"train_loss": -6.468764305114746, "global_step": 109536, "epoch": 2608} {"train_loss": -6.337960720062256, "global_step": 109537, "epoch": 2608} {"train_loss": -6.47885274887085, "global_step": 109538, "epoch": 2608} {"train_loss": -6.473923683166504, "global_step": 109539, "epoch": 2608} {"train_loss": -6.337736129760742, "global_step": 109540, "epoch": 2608} {"train_loss": -6.389218330383301, "global_step": 109541, "epoch": 2608} {"train_loss": -6.425695419311523, "global_step": 109542, "epoch": 2608} {"train_loss": -6.575597763061523, "global_step": 109543, "epoch": 2608} {"train_loss": -6.3444342613220215, "global_step": 109544, "epoch": 2608} {"train_loss": -6.522947311401367, "global_step": 109545, "epoch": 2608} {"train_loss": -6.400224208831787, "global_step": 109546, "epoch": 2608} {"train_loss": -6.318113327026367, "global_step": 109547, "epoch": 2608} {"train_loss": -6.4022417068481445, "global_step": 109548, "epoch": 2608} {"train_loss": -6.232546806335449, "global_step": 109549, "epoch": 2608} {"train_loss": -6.38517427444458, "global_step": 109550, "epoch": 2608} {"train_loss": -6.522324562072754, "global_step": 109551, "epoch": 2608} {"train_loss": -6.424561500549316, "global_step": 109552, "epoch": 2608} {"train_loss": -6.332809925079346, "global_step": 109553, "epoch": 2608} {"train_loss": -6.280612945556641, "global_step": 109554, "epoch": 2608} {"train_loss": -6.420543193817139, "global_step": 109555, "epoch": 2608} {"train_loss": -6.325441360473633, "global_step": 109556, "epoch": 2608} {"train_loss": -6.3553009033203125, "global_step": 109557, "epoch": 2608} {"train_loss": -6.379507541656494, "global_step": 109558, "epoch": 2608} {"train_loss": -6.272492408752441, "global_step": 109559, "epoch": 2608} {"train_loss": -6.384463310241699, "global_step": 109560, "epoch": 2608} {"train_loss": -6.319772720336914, "global_step": 109561, "epoch": 2608} {"train_loss": -6.471931457519531, "global_step": 109562, "epoch": 2608} {"train_loss": -6.252429962158203, "global_step": 109563, "epoch": 2608} {"train_loss": -6.421751976013184, "global_step": 109564, "epoch": 2608} {"train_loss": -6.451648712158203, "global_step": 109565, "epoch": 2608} {"train_loss": -6.429263591766357, "global_step": 109566, "epoch": 2608} {"train_loss": -6.36336612701416, "global_step": 109567, "epoch": 2608} {"train_loss": -6.304433822631836, "global_step": 109568, "epoch": 2608} {"train_loss": -6.403752326965332, "global_step": 109569, "epoch": 2608} {"train_loss": -6.386359214782715, "global_step": 109570, "epoch": 2608} {"train_loss": -6.40762996673584, "global_step": 109571, "epoch": 2608} {"train_loss": -6.407248497009277, "global_step": 109572, "epoch": 2608} {"train_loss": -6.325085639953613, "global_step": 109573, "epoch": 2608} {"train_loss": -6.443680286407471, "global_step": 109574, "epoch": 2608} {"train_loss": -6.386855125427246, "global_step": 109575, "epoch": 2608} {"train_loss": -6.496478080749512, "global_step": 109576, "epoch": 2608} {"train_loss": -6.391801845459711, "global_step": 109577, "epoch": 2608, "val_loss": 68000.984375} {"train_loss": -6.342197418212891, "global_step": 109578, "epoch": 2609} {"train_loss": -6.4492411613464355, "global_step": 109579, "epoch": 2609} {"train_loss": -6.469138145446777, "global_step": 109580, "epoch": 2609} {"train_loss": -6.462282180786133, "global_step": 109581, "epoch": 2609} {"train_loss": -6.407426834106445, "global_step": 109582, "epoch": 2609} {"train_loss": -6.52431058883667, "global_step": 109583, "epoch": 2609} {"train_loss": -6.46042013168335, "global_step": 109584, "epoch": 2609} {"train_loss": -6.359528541564941, "global_step": 109585, "epoch": 2609} {"train_loss": -6.392939567565918, "global_step": 109586, "epoch": 2609} {"train_loss": -6.4753947257995605, "global_step": 109587, "epoch": 2609} {"train_loss": -6.441012859344482, "global_step": 109588, "epoch": 2609} {"train_loss": -6.440366744995117, "global_step": 109589, "epoch": 2609} {"train_loss": -6.506590366363525, "global_step": 109590, "epoch": 2609} {"train_loss": -6.380764007568359, "global_step": 109591, "epoch": 2609} {"train_loss": -6.518373966217041, "global_step": 109592, "epoch": 2609} {"train_loss": -6.445374488830566, "global_step": 109593, "epoch": 2609} {"train_loss": -6.51008415222168, "global_step": 109594, "epoch": 2609} {"train_loss": -6.486999034881592, "global_step": 109595, "epoch": 2609} {"train_loss": -6.500750541687012, "global_step": 109596, "epoch": 2609} {"train_loss": -6.491965293884277, "global_step": 109597, "epoch": 2609} {"train_loss": -6.597301006317139, "global_step": 109598, "epoch": 2609} {"train_loss": -6.461909770965576, "global_step": 109599, "epoch": 2609} {"train_loss": -6.52823543548584, "global_step": 109600, "epoch": 2609} {"train_loss": -6.512287616729736, "global_step": 109601, "epoch": 2609} {"train_loss": -6.527283668518066, "global_step": 109602, "epoch": 2609} {"train_loss": -6.450796604156494, "global_step": 109603, "epoch": 2609} {"train_loss": -6.362818717956543, "global_step": 109604, "epoch": 2609} {"train_loss": -6.421313285827637, "global_step": 109605, "epoch": 2609} {"train_loss": -6.392999649047852, "global_step": 109606, "epoch": 2609} {"train_loss": -6.587561130523682, "global_step": 109607, "epoch": 2609} {"train_loss": -6.527857780456543, "global_step": 109608, "epoch": 2609} {"train_loss": -6.467992782592773, "global_step": 109609, "epoch": 2609} {"train_loss": -6.479907989501953, "global_step": 109610, "epoch": 2609} {"train_loss": -6.478874206542969, "global_step": 109611, "epoch": 2609} {"train_loss": -6.363041877746582, "global_step": 109612, "epoch": 2609} {"train_loss": -6.4547200202941895, "global_step": 109613, "epoch": 2609} {"train_loss": -6.344789028167725, "global_step": 109614, "epoch": 2609} {"train_loss": -6.472721099853516, "global_step": 109615, "epoch": 2609} {"train_loss": -6.309042930603027, "global_step": 109616, "epoch": 2609} {"train_loss": -6.54886531829834, "global_step": 109617, "epoch": 2609} {"train_loss": -6.395605087280273, "global_step": 109618, "epoch": 2609} {"train_loss": -6.459952888034639, "global_step": 109619, "epoch": 2609, "val_loss": 67775.609375} {"train_loss": -6.445786476135254, "global_step": 109620, "epoch": 2610} {"train_loss": -6.388100624084473, "global_step": 109621, "epoch": 2610} {"train_loss": -6.402918815612793, "global_step": 109622, "epoch": 2610} {"train_loss": -6.422882080078125, "global_step": 109623, "epoch": 2610} {"train_loss": -6.450623512268066, "global_step": 109624, "epoch": 2610} {"train_loss": -6.451488494873047, "global_step": 109625, "epoch": 2610} {"train_loss": -6.465930938720703, "global_step": 109626, "epoch": 2610} {"train_loss": -6.372821807861328, "global_step": 109627, "epoch": 2610} {"train_loss": -6.468675136566162, "global_step": 109628, "epoch": 2610} {"train_loss": -6.494675636291504, "global_step": 109629, "epoch": 2610} {"train_loss": -6.331348419189453, "global_step": 109630, "epoch": 2610} {"train_loss": -6.446322441101074, "global_step": 109631, "epoch": 2610} {"train_loss": -6.393074989318848, "global_step": 109632, "epoch": 2610} {"train_loss": -6.3894147872924805, "global_step": 109633, "epoch": 2610} {"train_loss": -6.421630382537842, "global_step": 109634, "epoch": 2610} {"train_loss": -6.431291580200195, "global_step": 109635, "epoch": 2610} {"train_loss": -6.461627960205078, "global_step": 109636, "epoch": 2610} {"train_loss": -6.42832088470459, "global_step": 109637, "epoch": 2610} {"train_loss": -6.491028785705566, "global_step": 109638, "epoch": 2610} {"train_loss": -6.324643135070801, "global_step": 109639, "epoch": 2610} {"train_loss": -6.444742679595947, "global_step": 109640, "epoch": 2610} {"train_loss": -6.357669830322266, "global_step": 109641, "epoch": 2610} {"train_loss": -6.296870708465576, "global_step": 109642, "epoch": 2610} {"train_loss": -6.4449052810668945, "global_step": 109643, "epoch": 2610} {"train_loss": -6.357692241668701, "global_step": 109644, "epoch": 2610} {"train_loss": -6.441591262817383, "global_step": 109645, "epoch": 2610} {"train_loss": -6.524121284484863, "global_step": 109646, "epoch": 2610} {"train_loss": -6.355103492736816, "global_step": 109647, "epoch": 2610} {"train_loss": -6.537742614746094, "global_step": 109648, "epoch": 2610} {"train_loss": -6.479541778564453, "global_step": 109649, "epoch": 2610} {"train_loss": -6.436940670013428, "global_step": 109650, "epoch": 2610} {"train_loss": -6.385235786437988, "global_step": 109651, "epoch": 2610} {"train_loss": -6.489012718200684, "global_step": 109652, "epoch": 2610} {"train_loss": -6.411697864532471, "global_step": 109653, "epoch": 2610} {"train_loss": -6.429521560668945, "global_step": 109654, "epoch": 2610} {"train_loss": -6.4866838455200195, "global_step": 109655, "epoch": 2610} {"train_loss": -6.412497520446777, "global_step": 109656, "epoch": 2610} {"train_loss": -6.438918113708496, "global_step": 109657, "epoch": 2610} {"train_loss": -6.583857536315918, "global_step": 109658, "epoch": 2610} {"train_loss": -6.437646865844727, "global_step": 109659, "epoch": 2610} {"train_loss": -6.409951210021973, "global_step": 109660, "epoch": 2610} {"train_loss": -6.426263888676961, "global_step": 109661, "epoch": 2610, "val_loss": 67874.4921875} {"train_loss": -6.534482955932617, "global_step": 109662, "epoch": 2611} {"train_loss": -6.46921968460083, "global_step": 109663, "epoch": 2611} {"train_loss": -6.491297721862793, "global_step": 109664, "epoch": 2611} {"train_loss": -6.415547847747803, "global_step": 109665, "epoch": 2611} {"train_loss": -6.510266304016113, "global_step": 109666, "epoch": 2611} {"train_loss": -6.397585391998291, "global_step": 109667, "epoch": 2611} {"train_loss": -6.547317028045654, "global_step": 109668, "epoch": 2611} {"train_loss": -6.5446624755859375, "global_step": 109669, "epoch": 2611} {"train_loss": -6.371274471282959, "global_step": 109670, "epoch": 2611} {"train_loss": -6.466635704040527, "global_step": 109671, "epoch": 2611} {"train_loss": -6.43559455871582, "global_step": 109672, "epoch": 2611} {"train_loss": -6.312438011169434, "global_step": 109673, "epoch": 2611} {"train_loss": -6.278258323669434, "global_step": 109674, "epoch": 2611} {"train_loss": -6.417434215545654, "global_step": 109675, "epoch": 2611} {"train_loss": -6.467734336853027, "global_step": 109676, "epoch": 2611} {"train_loss": -6.293464660644531, "global_step": 109677, "epoch": 2611} {"train_loss": -6.34902286529541, "global_step": 109678, "epoch": 2611} {"train_loss": -6.365096092224121, "global_step": 109679, "epoch": 2611} {"train_loss": -6.3539137840271, "global_step": 109680, "epoch": 2611} {"train_loss": -6.2963480949401855, "global_step": 109681, "epoch": 2611} {"train_loss": -6.488368034362793, "global_step": 109682, "epoch": 2611} {"train_loss": -6.398815631866455, "global_step": 109683, "epoch": 2611} {"train_loss": -6.4317216873168945, "global_step": 109684, "epoch": 2611} {"train_loss": -6.536923885345459, "global_step": 109685, "epoch": 2611} {"train_loss": -6.483962059020996, "global_step": 109686, "epoch": 2611} {"train_loss": -6.544323444366455, "global_step": 109687, "epoch": 2611} {"train_loss": -6.454113483428955, "global_step": 109688, "epoch": 2611} {"train_loss": -6.507016181945801, "global_step": 109689, "epoch": 2611} {"train_loss": -6.464211463928223, "global_step": 109690, "epoch": 2611} {"train_loss": -6.449853897094727, "global_step": 109691, "epoch": 2611} {"train_loss": -6.451960563659668, "global_step": 109692, "epoch": 2611} {"train_loss": -6.475584030151367, "global_step": 109693, "epoch": 2611} {"train_loss": -6.462942600250244, "global_step": 109694, "epoch": 2611} {"train_loss": -6.458045959472656, "global_step": 109695, "epoch": 2611} {"train_loss": -6.410419940948486, "global_step": 109696, "epoch": 2611} {"train_loss": -6.395220756530762, "global_step": 109697, "epoch": 2611} {"train_loss": -6.503264904022217, "global_step": 109698, "epoch": 2611} {"train_loss": -6.374235153198242, "global_step": 109699, "epoch": 2611} {"train_loss": -6.439896106719971, "global_step": 109700, "epoch": 2611} {"train_loss": -6.406435012817383, "global_step": 109701, "epoch": 2611} {"train_loss": -6.566577911376953, "global_step": 109702, "epoch": 2611} {"train_loss": -6.441365605308896, "global_step": 109703, "epoch": 2611, "val_loss": 67907.21875} {"train_loss": -6.457799434661865, "global_step": 109704, "epoch": 2612} {"train_loss": -6.415020942687988, "global_step": 109705, "epoch": 2612} {"train_loss": -6.496797561645508, "global_step": 109706, "epoch": 2612} {"train_loss": -6.581861972808838, "global_step": 109707, "epoch": 2612} {"train_loss": -6.426352024078369, "global_step": 109708, "epoch": 2612} {"train_loss": -6.433837413787842, "global_step": 109709, "epoch": 2612} {"train_loss": -6.517767906188965, "global_step": 109710, "epoch": 2612} {"train_loss": -6.4379096031188965, "global_step": 109711, "epoch": 2612} {"train_loss": -6.4720258712768555, "global_step": 109712, "epoch": 2612} {"train_loss": -6.440830230712891, "global_step": 109713, "epoch": 2612} {"train_loss": -6.324314594268799, "global_step": 109714, "epoch": 2612} {"train_loss": -6.497902870178223, "global_step": 109715, "epoch": 2612} {"train_loss": -6.489040851593018, "global_step": 109716, "epoch": 2612} {"train_loss": -6.358786582946777, "global_step": 109717, "epoch": 2612} {"train_loss": -6.441039562225342, "global_step": 109718, "epoch": 2612} {"train_loss": -6.389540672302246, "global_step": 109719, "epoch": 2612} {"train_loss": -6.404845237731934, "global_step": 109720, "epoch": 2612} {"train_loss": -6.354959487915039, "global_step": 109721, "epoch": 2612} {"train_loss": -6.2520575523376465, "global_step": 109722, "epoch": 2612} {"train_loss": -6.435892105102539, "global_step": 109723, "epoch": 2612} {"train_loss": -6.2938385009765625, "global_step": 109724, "epoch": 2612} {"train_loss": -6.460999488830566, "global_step": 109725, "epoch": 2612} {"train_loss": -6.325845718383789, "global_step": 109726, "epoch": 2612} {"train_loss": -6.32918643951416, "global_step": 109727, "epoch": 2612} {"train_loss": -6.444328784942627, "global_step": 109728, "epoch": 2612} {"train_loss": -6.389090061187744, "global_step": 109729, "epoch": 2612} {"train_loss": -6.418458938598633, "global_step": 109730, "epoch": 2612} {"train_loss": -6.485848903656006, "global_step": 109731, "epoch": 2612} {"train_loss": -6.547544956207275, "global_step": 109732, "epoch": 2612} {"train_loss": -6.437926769256592, "global_step": 109733, "epoch": 2612} {"train_loss": -6.425323009490967, "global_step": 109734, "epoch": 2612} {"train_loss": -6.318574905395508, "global_step": 109735, "epoch": 2612} {"train_loss": -6.486307144165039, "global_step": 109736, "epoch": 2612} {"train_loss": -6.437224388122559, "global_step": 109737, "epoch": 2612} {"train_loss": -6.450454235076904, "global_step": 109738, "epoch": 2612} {"train_loss": -6.437887191772461, "global_step": 109739, "epoch": 2612} {"train_loss": -6.429961681365967, "global_step": 109740, "epoch": 2612} {"train_loss": -6.5050811767578125, "global_step": 109741, "epoch": 2612} {"train_loss": -6.324110984802246, "global_step": 109742, "epoch": 2612} {"train_loss": -6.385320663452148, "global_step": 109743, "epoch": 2612} {"train_loss": -6.481893539428711, "global_step": 109744, "epoch": 2612} {"train_loss": -6.426174913133893, "global_step": 109745, "epoch": 2612, "val_loss": 67803.4140625} {"train_loss": -6.612611770629883, "global_step": 109746, "epoch": 2613} {"train_loss": -6.440056800842285, "global_step": 109747, "epoch": 2613} {"train_loss": -6.290036201477051, "global_step": 109748, "epoch": 2613} {"train_loss": -6.452723503112793, "global_step": 109749, "epoch": 2613} {"train_loss": -6.347209930419922, "global_step": 109750, "epoch": 2613} {"train_loss": -6.405179977416992, "global_step": 109751, "epoch": 2613} {"train_loss": -6.414584159851074, "global_step": 109752, "epoch": 2613} {"train_loss": -6.329892635345459, "global_step": 109753, "epoch": 2613} {"train_loss": -6.457281589508057, "global_step": 109754, "epoch": 2613} {"train_loss": -6.461658477783203, "global_step": 109755, "epoch": 2613} {"train_loss": -6.256258010864258, "global_step": 109756, "epoch": 2613} {"train_loss": -6.423241138458252, "global_step": 109757, "epoch": 2613} {"train_loss": -6.385982513427734, "global_step": 109758, "epoch": 2613} {"train_loss": -6.295772075653076, "global_step": 109759, "epoch": 2613} {"train_loss": -6.389493942260742, "global_step": 109760, "epoch": 2613} {"train_loss": -6.418052673339844, "global_step": 109761, "epoch": 2613} {"train_loss": -6.3116044998168945, "global_step": 109762, "epoch": 2613} {"train_loss": -6.457021713256836, "global_step": 109763, "epoch": 2613} {"train_loss": -6.378456115722656, "global_step": 109764, "epoch": 2613} {"train_loss": -6.395485877990723, "global_step": 109765, "epoch": 2613} {"train_loss": -6.510788917541504, "global_step": 109766, "epoch": 2613} {"train_loss": -6.428977012634277, "global_step": 109767, "epoch": 2613} {"train_loss": -6.447114944458008, "global_step": 109768, "epoch": 2613} {"train_loss": -6.455414295196533, "global_step": 109769, "epoch": 2613} {"train_loss": -6.399779319763184, "global_step": 109770, "epoch": 2613} {"train_loss": -6.519700527191162, "global_step": 109771, "epoch": 2613} {"train_loss": -6.494136810302734, "global_step": 109772, "epoch": 2613} {"train_loss": -6.420614719390869, "global_step": 109773, "epoch": 2613} {"train_loss": -6.4743499755859375, "global_step": 109774, "epoch": 2613} {"train_loss": -6.439434051513672, "global_step": 109775, "epoch": 2613} {"train_loss": -6.387567520141602, "global_step": 109776, "epoch": 2613} {"train_loss": -6.494064807891846, "global_step": 109777, "epoch": 2613} {"train_loss": -6.475192546844482, "global_step": 109778, "epoch": 2613} {"train_loss": -6.484283447265625, "global_step": 109779, "epoch": 2613} {"train_loss": -6.439253807067871, "global_step": 109780, "epoch": 2613} {"train_loss": -6.489668846130371, "global_step": 109781, "epoch": 2613} {"train_loss": -6.601487159729004, "global_step": 109782, "epoch": 2613} {"train_loss": -6.434815883636475, "global_step": 109783, "epoch": 2613} {"train_loss": -6.4489030838012695, "global_step": 109784, "epoch": 2613} {"train_loss": -6.441245079040527, "global_step": 109785, "epoch": 2613} {"train_loss": -6.5325188636779785, "global_step": 109786, "epoch": 2613} {"train_loss": -6.433545861925397, "global_step": 109787, "epoch": 2613, "val_loss": 67935.1484375} {"train_loss": -6.460258960723877, "global_step": 109788, "epoch": 2614} {"train_loss": -6.490433692932129, "global_step": 109789, "epoch": 2614} {"train_loss": -6.427061080932617, "global_step": 109790, "epoch": 2614} {"train_loss": -6.305456161499023, "global_step": 109791, "epoch": 2614} {"train_loss": -6.519383907318115, "global_step": 109792, "epoch": 2614} {"train_loss": -6.464250564575195, "global_step": 109793, "epoch": 2614} {"train_loss": -6.458189964294434, "global_step": 109794, "epoch": 2614} {"train_loss": -6.509993553161621, "global_step": 109795, "epoch": 2614} {"train_loss": -6.527978897094727, "global_step": 109796, "epoch": 2614} {"train_loss": -6.383200645446777, "global_step": 109797, "epoch": 2614} {"train_loss": -6.4072442054748535, "global_step": 109798, "epoch": 2614} {"train_loss": -6.424246788024902, "global_step": 109799, "epoch": 2614} {"train_loss": -6.46811056137085, "global_step": 109800, "epoch": 2614} {"train_loss": -6.431375503540039, "global_step": 109801, "epoch": 2614} {"train_loss": -6.546897888183594, "global_step": 109802, "epoch": 2614} {"train_loss": -6.468984127044678, "global_step": 109803, "epoch": 2614} {"train_loss": -6.609339714050293, "global_step": 109804, "epoch": 2614} {"train_loss": -6.396862983703613, "global_step": 109805, "epoch": 2614} {"train_loss": -6.431981086730957, "global_step": 109806, "epoch": 2614} {"train_loss": -6.555288314819336, "global_step": 109807, "epoch": 2614} {"train_loss": -6.4129638671875, "global_step": 109808, "epoch": 2614} {"train_loss": -6.333126544952393, "global_step": 109809, "epoch": 2614} {"train_loss": -6.48432731628418, "global_step": 109810, "epoch": 2614} {"train_loss": -6.391826629638672, "global_step": 109811, "epoch": 2614} {"train_loss": -6.35941219329834, "global_step": 109812, "epoch": 2614} {"train_loss": -6.531205177307129, "global_step": 109813, "epoch": 2614} {"train_loss": -6.396371364593506, "global_step": 109814, "epoch": 2614} {"train_loss": -6.383184432983398, "global_step": 109815, "epoch": 2614} {"train_loss": -6.452940940856934, "global_step": 109816, "epoch": 2614} {"train_loss": -6.403337478637695, "global_step": 109817, "epoch": 2614} {"train_loss": -6.516389846801758, "global_step": 109818, "epoch": 2614} {"train_loss": -6.426008224487305, "global_step": 109819, "epoch": 2614} {"train_loss": -6.494841575622559, "global_step": 109820, "epoch": 2614} {"train_loss": -6.508231163024902, "global_step": 109821, "epoch": 2614} {"train_loss": -6.413339614868164, "global_step": 109822, "epoch": 2614} {"train_loss": -6.419029712677002, "global_step": 109823, "epoch": 2614} {"train_loss": -6.417068004608154, "global_step": 109824, "epoch": 2614} {"train_loss": -6.440838813781738, "global_step": 109825, "epoch": 2614} {"train_loss": -6.429035186767578, "global_step": 109826, "epoch": 2614} {"train_loss": -6.388378143310547, "global_step": 109827, "epoch": 2614} {"train_loss": -6.466641902923584, "global_step": 109828, "epoch": 2614} {"train_loss": -6.450054407119751, "global_step": 109829, "epoch": 2614, "val_loss": 67847.8515625} {"train_loss": -6.435324668884277, "global_step": 109830, "epoch": 2615} {"train_loss": -6.444258689880371, "global_step": 109831, "epoch": 2615} {"train_loss": -6.429365158081055, "global_step": 109832, "epoch": 2615} {"train_loss": -6.4708757400512695, "global_step": 109833, "epoch": 2615} {"train_loss": -6.544168472290039, "global_step": 109834, "epoch": 2615} {"train_loss": -6.426486015319824, "global_step": 109835, "epoch": 2615} {"train_loss": -6.516280174255371, "global_step": 109836, "epoch": 2615} {"train_loss": -6.447965621948242, "global_step": 109837, "epoch": 2615} {"train_loss": -6.485908031463623, "global_step": 109838, "epoch": 2615} {"train_loss": -6.546459197998047, "global_step": 109839, "epoch": 2615} {"train_loss": -6.489875793457031, "global_step": 109840, "epoch": 2615} {"train_loss": -6.368109226226807, "global_step": 109841, "epoch": 2615} {"train_loss": -6.522974014282227, "global_step": 109842, "epoch": 2615} {"train_loss": -6.371502876281738, "global_step": 109843, "epoch": 2615} {"train_loss": -6.506035804748535, "global_step": 109844, "epoch": 2615} {"train_loss": -6.3749189376831055, "global_step": 109845, "epoch": 2615} {"train_loss": -6.374025344848633, "global_step": 109846, "epoch": 2615} {"train_loss": -6.472595691680908, "global_step": 109847, "epoch": 2615} {"train_loss": -6.443964004516602, "global_step": 109848, "epoch": 2615} {"train_loss": -6.347695827484131, "global_step": 109849, "epoch": 2615} {"train_loss": -6.467752933502197, "global_step": 109850, "epoch": 2615} {"train_loss": -6.5125041007995605, "global_step": 109851, "epoch": 2615} {"train_loss": -6.34682559967041, "global_step": 109852, "epoch": 2615} {"train_loss": -6.368533134460449, "global_step": 109853, "epoch": 2615} {"train_loss": -6.539798259735107, "global_step": 109854, "epoch": 2615} {"train_loss": -6.48422384262085, "global_step": 109855, "epoch": 2615} {"train_loss": -6.532232284545898, "global_step": 109856, "epoch": 2615} {"train_loss": -6.443864822387695, "global_step": 109857, "epoch": 2615} {"train_loss": -6.454800605773926, "global_step": 109858, "epoch": 2615} {"train_loss": -6.331891059875488, "global_step": 109859, "epoch": 2615} {"train_loss": -6.344890117645264, "global_step": 109860, "epoch": 2615} {"train_loss": -6.452855587005615, "global_step": 109861, "epoch": 2615} {"train_loss": -6.397547245025635, "global_step": 109862, "epoch": 2615} {"train_loss": -6.393800735473633, "global_step": 109863, "epoch": 2615} {"train_loss": -6.474401473999023, "global_step": 109864, "epoch": 2615} {"train_loss": -6.4657883644104, "global_step": 109865, "epoch": 2615} {"train_loss": -6.504287242889404, "global_step": 109866, "epoch": 2615} {"train_loss": -6.342041015625, "global_step": 109867, "epoch": 2615} {"train_loss": -6.525996208190918, "global_step": 109868, "epoch": 2615} {"train_loss": -6.425616264343262, "global_step": 109869, "epoch": 2615} {"train_loss": -6.426332473754883, "global_step": 109870, "epoch": 2615} {"train_loss": -6.446869611740112, "global_step": 109871, "epoch": 2615, "val_loss": 67931.53125} {"train_loss": -6.358816146850586, "global_step": 109872, "epoch": 2616} {"train_loss": -6.418532848358154, "global_step": 109873, "epoch": 2616} {"train_loss": -6.513509750366211, "global_step": 109874, "epoch": 2616} {"train_loss": -6.443896293640137, "global_step": 109875, "epoch": 2616} {"train_loss": -6.606916904449463, "global_step": 109876, "epoch": 2616} {"train_loss": -6.505798816680908, "global_step": 109877, "epoch": 2616} {"train_loss": -6.588690757751465, "global_step": 109878, "epoch": 2616} {"train_loss": -6.443456649780273, "global_step": 109879, "epoch": 2616} {"train_loss": -6.439310073852539, "global_step": 109880, "epoch": 2616} {"train_loss": -6.409482002258301, "global_step": 109881, "epoch": 2616} {"train_loss": -6.5198493003845215, "global_step": 109882, "epoch": 2616} {"train_loss": -6.209986686706543, "global_step": 109883, "epoch": 2616} {"train_loss": -6.441765785217285, "global_step": 109884, "epoch": 2616} {"train_loss": -6.414894104003906, "global_step": 109885, "epoch": 2616} {"train_loss": -6.391348361968994, "global_step": 109886, "epoch": 2616} {"train_loss": -6.465198993682861, "global_step": 109887, "epoch": 2616} {"train_loss": -6.320347785949707, "global_step": 109888, "epoch": 2616} {"train_loss": -6.467392444610596, "global_step": 109889, "epoch": 2616} {"train_loss": -6.513466835021973, "global_step": 109890, "epoch": 2616} {"train_loss": -6.4506425857543945, "global_step": 109891, "epoch": 2616} {"train_loss": -6.477897644042969, "global_step": 109892, "epoch": 2616} {"train_loss": -6.418598651885986, "global_step": 109893, "epoch": 2616} {"train_loss": -6.33762264251709, "global_step": 109894, "epoch": 2616} {"train_loss": -6.517635345458984, "global_step": 109895, "epoch": 2616} {"train_loss": -6.551836013793945, "global_step": 109896, "epoch": 2616} {"train_loss": -6.42371940612793, "global_step": 109897, "epoch": 2616} {"train_loss": -6.512580871582031, "global_step": 109898, "epoch": 2616} {"train_loss": -6.371283531188965, "global_step": 109899, "epoch": 2616} {"train_loss": -6.403075218200684, "global_step": 109900, "epoch": 2616} {"train_loss": -6.386851787567139, "global_step": 109901, "epoch": 2616} {"train_loss": -6.502408504486084, "global_step": 109902, "epoch": 2616} {"train_loss": -6.4086480140686035, "global_step": 109903, "epoch": 2616} {"train_loss": -6.549891948699951, "global_step": 109904, "epoch": 2616} {"train_loss": -6.476813316345215, "global_step": 109905, "epoch": 2616} {"train_loss": -6.434262275695801, "global_step": 109906, "epoch": 2616} {"train_loss": -6.370871543884277, "global_step": 109907, "epoch": 2616} {"train_loss": -6.408631801605225, "global_step": 109908, "epoch": 2616} {"train_loss": -6.4980998039245605, "global_step": 109909, "epoch": 2616} {"train_loss": -6.407059669494629, "global_step": 109910, "epoch": 2616} {"train_loss": -6.449337959289551, "global_step": 109911, "epoch": 2616} {"train_loss": -6.521009922027588, "global_step": 109912, "epoch": 2616} {"train_loss": -6.448325316111247, "global_step": 109913, "epoch": 2616, "val_loss": 67778.96875} {"train_loss": -6.481444358825684, "global_step": 109914, "epoch": 2617} {"train_loss": -6.590431213378906, "global_step": 109915, "epoch": 2617} {"train_loss": -6.422281265258789, "global_step": 109916, "epoch": 2617} {"train_loss": -6.484338760375977, "global_step": 109917, "epoch": 2617} {"train_loss": -6.475239276885986, "global_step": 109918, "epoch": 2617} {"train_loss": -6.492321491241455, "global_step": 109919, "epoch": 2617} {"train_loss": -6.533400535583496, "global_step": 109920, "epoch": 2617} {"train_loss": -6.500413417816162, "global_step": 109921, "epoch": 2617} {"train_loss": -6.387050151824951, "global_step": 109922, "epoch": 2617} {"train_loss": -6.445219039916992, "global_step": 109923, "epoch": 2617} {"train_loss": -6.560254096984863, "global_step": 109924, "epoch": 2617} {"train_loss": -6.52460241317749, "global_step": 109925, "epoch": 2617} {"train_loss": -6.447117805480957, "global_step": 109926, "epoch": 2617} {"train_loss": -6.416604042053223, "global_step": 109927, "epoch": 2617} {"train_loss": -6.321711540222168, "global_step": 109928, "epoch": 2617} {"train_loss": -6.515144348144531, "global_step": 109929, "epoch": 2617} {"train_loss": -6.2572431564331055, "global_step": 109930, "epoch": 2617} {"train_loss": -6.560306549072266, "global_step": 109931, "epoch": 2617} {"train_loss": -6.4566192626953125, "global_step": 109932, "epoch": 2617} {"train_loss": -6.569404602050781, "global_step": 109933, "epoch": 2617} {"train_loss": -6.5109710693359375, "global_step": 109934, "epoch": 2617} {"train_loss": -6.362212181091309, "global_step": 109935, "epoch": 2617} {"train_loss": -6.356552600860596, "global_step": 109936, "epoch": 2617} {"train_loss": -6.476144313812256, "global_step": 109937, "epoch": 2617} {"train_loss": -6.423111915588379, "global_step": 109938, "epoch": 2617} {"train_loss": -6.474738121032715, "global_step": 109939, "epoch": 2617} {"train_loss": -6.5723490715026855, "global_step": 109940, "epoch": 2617} {"train_loss": -6.475625991821289, "global_step": 109941, "epoch": 2617} {"train_loss": -6.50396728515625, "global_step": 109942, "epoch": 2617} {"train_loss": -6.412881851196289, "global_step": 109943, "epoch": 2617} {"train_loss": -6.550726890563965, "global_step": 109944, "epoch": 2617} {"train_loss": -6.472753047943115, "global_step": 109945, "epoch": 2617} {"train_loss": -6.434540271759033, "global_step": 109946, "epoch": 2617} {"train_loss": -6.599093437194824, "global_step": 109947, "epoch": 2617} {"train_loss": -6.4638824462890625, "global_step": 109948, "epoch": 2617} {"train_loss": -6.450852394104004, "global_step": 109949, "epoch": 2617} {"train_loss": -6.3571624755859375, "global_step": 109950, "epoch": 2617} {"train_loss": -6.461481094360352, "global_step": 109951, "epoch": 2617} {"train_loss": -6.470491886138916, "global_step": 109952, "epoch": 2617} {"train_loss": -6.441251754760742, "global_step": 109953, "epoch": 2617} {"train_loss": -6.36814022064209, "global_step": 109954, "epoch": 2617} {"train_loss": -6.46536127726237, "global_step": 109955, "epoch": 2617, "val_loss": 67887.6875} {"train_loss": -6.570202827453613, "global_step": 109956, "epoch": 2618} {"train_loss": -6.304618835449219, "global_step": 109957, "epoch": 2618} {"train_loss": -6.462740421295166, "global_step": 109958, "epoch": 2618} {"train_loss": -6.464591979980469, "global_step": 109959, "epoch": 2618} {"train_loss": -6.424312591552734, "global_step": 109960, "epoch": 2618} {"train_loss": -6.339777946472168, "global_step": 109961, "epoch": 2618} {"train_loss": -6.3464274406433105, "global_step": 109962, "epoch": 2618} {"train_loss": -6.422033786773682, "global_step": 109963, "epoch": 2618} {"train_loss": -6.40171480178833, "global_step": 109964, "epoch": 2618} {"train_loss": -6.378973960876465, "global_step": 109965, "epoch": 2618} {"train_loss": -6.474222660064697, "global_step": 109966, "epoch": 2618} {"train_loss": -6.284739971160889, "global_step": 109967, "epoch": 2618} {"train_loss": -6.499080181121826, "global_step": 109968, "epoch": 2618} {"train_loss": -6.41080379486084, "global_step": 109969, "epoch": 2618} {"train_loss": -6.4322099685668945, "global_step": 109970, "epoch": 2618} {"train_loss": -6.518167495727539, "global_step": 109971, "epoch": 2618} {"train_loss": -6.53497314453125, "global_step": 109972, "epoch": 2618} {"train_loss": -6.464061737060547, "global_step": 109973, "epoch": 2618} {"train_loss": -6.447653770446777, "global_step": 109974, "epoch": 2618} {"train_loss": -6.441019535064697, "global_step": 109975, "epoch": 2618} {"train_loss": -6.484389781951904, "global_step": 109976, "epoch": 2618} {"train_loss": -6.463829040527344, "global_step": 109977, "epoch": 2618} {"train_loss": -6.355243682861328, "global_step": 109978, "epoch": 2618} {"train_loss": -6.424059867858887, "global_step": 109979, "epoch": 2618} {"train_loss": -6.4773406982421875, "global_step": 109980, "epoch": 2618} {"train_loss": -6.500575065612793, "global_step": 109981, "epoch": 2618} {"train_loss": -6.366135597229004, "global_step": 109982, "epoch": 2618} {"train_loss": -6.403872489929199, "global_step": 109983, "epoch": 2618} {"train_loss": -6.542647361755371, "global_step": 109984, "epoch": 2618} {"train_loss": -6.404352188110352, "global_step": 109985, "epoch": 2618} {"train_loss": -6.398078918457031, "global_step": 109986, "epoch": 2618} {"train_loss": -6.520810604095459, "global_step": 109987, "epoch": 2618} {"train_loss": -6.4326276779174805, "global_step": 109988, "epoch": 2618} {"train_loss": -6.419032096862793, "global_step": 109989, "epoch": 2618} {"train_loss": -6.581748008728027, "global_step": 109990, "epoch": 2618} {"train_loss": -6.4554524421691895, "global_step": 109991, "epoch": 2618} {"train_loss": -6.431604385375977, "global_step": 109992, "epoch": 2618} {"train_loss": -6.442495346069336, "global_step": 109993, "epoch": 2618} {"train_loss": -6.432704448699951, "global_step": 109994, "epoch": 2618} {"train_loss": -6.4206085205078125, "global_step": 109995, "epoch": 2618} {"train_loss": -6.4087934494018555, "global_step": 109996, "epoch": 2618} {"train_loss": -6.436922391255696, "global_step": 109997, "epoch": 2618, "val_loss": 67824.3046875} {"train_loss": -6.345299243927002, "global_step": 109998, "epoch": 2619} {"train_loss": -6.320196628570557, "global_step": 109999, "epoch": 2619} {"train_loss": -6.478987216949463, "global_step": 110000, "epoch": 2619} {"train_loss": -6.399862289428711, "global_step": 110001, "epoch": 2619} {"train_loss": -6.393747329711914, "global_step": 110002, "epoch": 2619} {"train_loss": -6.470223426818848, "global_step": 110003, "epoch": 2619} {"train_loss": -6.463801383972168, "global_step": 110004, "epoch": 2619} {"train_loss": -6.471004486083984, "global_step": 110005, "epoch": 2619} {"train_loss": -6.422621250152588, "global_step": 110006, "epoch": 2619} {"train_loss": -6.458896160125732, "global_step": 110007, "epoch": 2619} {"train_loss": -6.366420745849609, "global_step": 110008, "epoch": 2619} {"train_loss": -6.51078987121582, "global_step": 110009, "epoch": 2619} {"train_loss": -6.441862106323242, "global_step": 110010, "epoch": 2619} {"train_loss": -6.4131011962890625, "global_step": 110011, "epoch": 2619} {"train_loss": -6.409094333648682, "global_step": 110012, "epoch": 2619} {"train_loss": -6.46579647064209, "global_step": 110013, "epoch": 2619} {"train_loss": -6.324254035949707, "global_step": 110014, "epoch": 2619} {"train_loss": -6.458944320678711, "global_step": 110015, "epoch": 2619} {"train_loss": -6.421053886413574, "global_step": 110016, "epoch": 2619} {"train_loss": -6.4994707107543945, "global_step": 110017, "epoch": 2619} {"train_loss": -6.511230945587158, "global_step": 110018, "epoch": 2619} {"train_loss": -6.3119096755981445, "global_step": 110019, "epoch": 2619} {"train_loss": -6.5042009353637695, "global_step": 110020, "epoch": 2619} {"train_loss": -6.378755569458008, "global_step": 110021, "epoch": 2619} {"train_loss": -6.418753147125244, "global_step": 110022, "epoch": 2619} {"train_loss": -6.461363792419434, "global_step": 110023, "epoch": 2619} {"train_loss": -6.517731666564941, "global_step": 110024, "epoch": 2619} {"train_loss": -6.419208526611328, "global_step": 110025, "epoch": 2619} {"train_loss": -6.323034286499023, "global_step": 110026, "epoch": 2619} {"train_loss": -6.431626796722412, "global_step": 110027, "epoch": 2619} {"train_loss": -6.430447578430176, "global_step": 110028, "epoch": 2619} {"train_loss": -6.258371353149414, "global_step": 110029, "epoch": 2619} {"train_loss": -6.501368999481201, "global_step": 110030, "epoch": 2619} {"train_loss": -6.237470626831055, "global_step": 110031, "epoch": 2619} {"train_loss": -6.3404951095581055, "global_step": 110032, "epoch": 2619} {"train_loss": -6.3306427001953125, "global_step": 110033, "epoch": 2619} {"train_loss": -6.35092306137085, "global_step": 110034, "epoch": 2619} {"train_loss": -6.449021339416504, "global_step": 110035, "epoch": 2619} {"train_loss": -6.385579586029053, "global_step": 110036, "epoch": 2619} {"train_loss": -6.309667110443115, "global_step": 110037, "epoch": 2619} {"train_loss": -6.406810283660889, "global_step": 110038, "epoch": 2619} {"train_loss": -6.409012408483596, "global_step": 110039, "epoch": 2619, "val_loss": 68014.2109375} {"train_loss": -6.464088439941406, "global_step": 110040, "epoch": 2620} {"train_loss": -6.448641777038574, "global_step": 110041, "epoch": 2620} {"train_loss": -6.406255722045898, "global_step": 110042, "epoch": 2620} {"train_loss": -6.256023406982422, "global_step": 110043, "epoch": 2620} {"train_loss": -6.459373950958252, "global_step": 110044, "epoch": 2620} {"train_loss": -6.348470687866211, "global_step": 110045, "epoch": 2620} {"train_loss": -6.432940483093262, "global_step": 110046, "epoch": 2620} {"train_loss": -6.403663635253906, "global_step": 110047, "epoch": 2620} {"train_loss": -6.41685676574707, "global_step": 110048, "epoch": 2620} {"train_loss": -6.39253044128418, "global_step": 110049, "epoch": 2620} {"train_loss": -6.454699516296387, "global_step": 110050, "epoch": 2620} {"train_loss": -6.393488883972168, "global_step": 110051, "epoch": 2620} {"train_loss": -6.483072757720947, "global_step": 110052, "epoch": 2620} {"train_loss": -6.477077484130859, "global_step": 110053, "epoch": 2620} {"train_loss": -6.450252532958984, "global_step": 110054, "epoch": 2620} {"train_loss": -6.451403617858887, "global_step": 110055, "epoch": 2620} {"train_loss": -6.549872398376465, "global_step": 110056, "epoch": 2620} {"train_loss": -6.384372234344482, "global_step": 110057, "epoch": 2620} {"train_loss": -6.417479991912842, "global_step": 110058, "epoch": 2620} {"train_loss": -6.395076274871826, "global_step": 110059, "epoch": 2620} {"train_loss": -6.520216941833496, "global_step": 110060, "epoch": 2620} {"train_loss": -6.598752021789551, "global_step": 110061, "epoch": 2620} {"train_loss": -6.487286567687988, "global_step": 110062, "epoch": 2620} {"train_loss": -6.44379186630249, "global_step": 110063, "epoch": 2620} {"train_loss": -6.514045715332031, "global_step": 110064, "epoch": 2620} {"train_loss": -6.477550029754639, "global_step": 110065, "epoch": 2620} {"train_loss": -6.547670364379883, "global_step": 110066, "epoch": 2620} {"train_loss": -6.434148788452148, "global_step": 110067, "epoch": 2620} {"train_loss": -6.581966400146484, "global_step": 110068, "epoch": 2620} {"train_loss": -6.327249526977539, "global_step": 110069, "epoch": 2620} {"train_loss": -6.52082633972168, "global_step": 110070, "epoch": 2620} {"train_loss": -6.431827545166016, "global_step": 110071, "epoch": 2620} {"train_loss": -6.528998851776123, "global_step": 110072, "epoch": 2620} {"train_loss": -6.4043378829956055, "global_step": 110073, "epoch": 2620} {"train_loss": -6.487340927124023, "global_step": 110074, "epoch": 2620} {"train_loss": -6.366209983825684, "global_step": 110075, "epoch": 2620} {"train_loss": -6.485320091247559, "global_step": 110076, "epoch": 2620} {"train_loss": -6.633538246154785, "global_step": 110077, "epoch": 2620} {"train_loss": -6.420922756195068, "global_step": 110078, "epoch": 2620} {"train_loss": -6.4520978927612305, "global_step": 110079, "epoch": 2620} {"train_loss": -6.374286651611328, "global_step": 110080, "epoch": 2620} {"train_loss": -6.451206332161313, "global_step": 110081, "epoch": 2620, "val_loss": 67917.4609375} {"train_loss": -6.557941913604736, "global_step": 110082, "epoch": 2621} {"train_loss": -6.416463375091553, "global_step": 110083, "epoch": 2621} {"train_loss": -6.492159843444824, "global_step": 110084, "epoch": 2621} {"train_loss": -6.418992042541504, "global_step": 110085, "epoch": 2621} {"train_loss": -6.373571395874023, "global_step": 110086, "epoch": 2621} {"train_loss": -6.356444358825684, "global_step": 110087, "epoch": 2621} {"train_loss": -6.623243808746338, "global_step": 110088, "epoch": 2621} {"train_loss": -6.394264221191406, "global_step": 110089, "epoch": 2621} {"train_loss": -6.441981315612793, "global_step": 110090, "epoch": 2621} {"train_loss": -6.4721784591674805, "global_step": 110091, "epoch": 2621} {"train_loss": -6.483424186706543, "global_step": 110092, "epoch": 2621} {"train_loss": -6.576043128967285, "global_step": 110093, "epoch": 2621} {"train_loss": -6.348372459411621, "global_step": 110094, "epoch": 2621} {"train_loss": -6.494479179382324, "global_step": 110095, "epoch": 2621} {"train_loss": -6.514638900756836, "global_step": 110096, "epoch": 2621} {"train_loss": -6.4542365074157715, "global_step": 110097, "epoch": 2621} {"train_loss": -6.4924163818359375, "global_step": 110098, "epoch": 2621} {"train_loss": -6.5272674560546875, "global_step": 110099, "epoch": 2621} {"train_loss": -6.40938663482666, "global_step": 110100, "epoch": 2621} {"train_loss": -6.456569194793701, "global_step": 110101, "epoch": 2621} {"train_loss": -6.368472099304199, "global_step": 110102, "epoch": 2621} {"train_loss": -6.481423854827881, "global_step": 110103, "epoch": 2621} {"train_loss": -6.503872871398926, "global_step": 110104, "epoch": 2621} {"train_loss": -6.370843887329102, "global_step": 110105, "epoch": 2621} {"train_loss": -6.367649078369141, "global_step": 110106, "epoch": 2621} {"train_loss": -6.452565670013428, "global_step": 110107, "epoch": 2621} {"train_loss": -6.483644008636475, "global_step": 110108, "epoch": 2621} {"train_loss": -6.440408706665039, "global_step": 110109, "epoch": 2621} {"train_loss": -6.47606897354126, "global_step": 110110, "epoch": 2621} {"train_loss": -6.389249801635742, "global_step": 110111, "epoch": 2621} {"train_loss": -6.381814002990723, "global_step": 110112, "epoch": 2621} {"train_loss": -6.373959541320801, "global_step": 110113, "epoch": 2621} {"train_loss": -6.3305277824401855, "global_step": 110114, "epoch": 2621} {"train_loss": -6.4170989990234375, "global_step": 110115, "epoch": 2621} {"train_loss": -6.365570068359375, "global_step": 110116, "epoch": 2621} {"train_loss": -6.21037483215332, "global_step": 110117, "epoch": 2621} {"train_loss": -6.396369934082031, "global_step": 110118, "epoch": 2621} {"train_loss": -6.366581916809082, "global_step": 110119, "epoch": 2621} {"train_loss": -6.43146276473999, "global_step": 110120, "epoch": 2621} {"train_loss": -6.397645950317383, "global_step": 110121, "epoch": 2621} {"train_loss": -6.458882808685303, "global_step": 110122, "epoch": 2621} {"train_loss": -6.4324127946581156, "global_step": 110123, "epoch": 2621, "val_loss": 67696.125} {"train_loss": -6.448441028594971, "global_step": 110124, "epoch": 2622} {"train_loss": -6.3988494873046875, "global_step": 110125, "epoch": 2622} {"train_loss": -6.409066200256348, "global_step": 110126, "epoch": 2622} {"train_loss": -6.398297309875488, "global_step": 110127, "epoch": 2622} {"train_loss": -6.376049518585205, "global_step": 110128, "epoch": 2622} {"train_loss": -6.332587242126465, "global_step": 110129, "epoch": 2622} {"train_loss": -6.423969268798828, "global_step": 110130, "epoch": 2622} {"train_loss": -6.390883445739746, "global_step": 110131, "epoch": 2622} {"train_loss": -6.391406536102295, "global_step": 110132, "epoch": 2622} {"train_loss": -6.401795387268066, "global_step": 110133, "epoch": 2622} {"train_loss": -6.465236663818359, "global_step": 110134, "epoch": 2622} {"train_loss": -6.425516128540039, "global_step": 110135, "epoch": 2622} {"train_loss": -6.555377960205078, "global_step": 110136, "epoch": 2622} {"train_loss": -6.4563679695129395, "global_step": 110137, "epoch": 2622} {"train_loss": -6.331327438354492, "global_step": 110138, "epoch": 2622} {"train_loss": -6.367989540100098, "global_step": 110139, "epoch": 2622} {"train_loss": -6.486090660095215, "global_step": 110140, "epoch": 2622} {"train_loss": -6.359892845153809, "global_step": 110141, "epoch": 2622} {"train_loss": -6.391145706176758, "global_step": 110142, "epoch": 2622} {"train_loss": -6.5009355545043945, "global_step": 110143, "epoch": 2622} {"train_loss": -6.318697929382324, "global_step": 110144, "epoch": 2622} {"train_loss": -6.518802642822266, "global_step": 110145, "epoch": 2622} {"train_loss": -6.392085075378418, "global_step": 110146, "epoch": 2622} {"train_loss": -6.517364978790283, "global_step": 110147, "epoch": 2622} {"train_loss": -6.446044445037842, "global_step": 110148, "epoch": 2622} {"train_loss": -6.397034645080566, "global_step": 110149, "epoch": 2622} {"train_loss": -6.4097900390625, "global_step": 110150, "epoch": 2622} {"train_loss": -6.423350811004639, "global_step": 110151, "epoch": 2622} {"train_loss": -6.501040935516357, "global_step": 110152, "epoch": 2622} {"train_loss": -6.528133869171143, "global_step": 110153, "epoch": 2622} {"train_loss": -6.411411762237549, "global_step": 110154, "epoch": 2622} {"train_loss": -6.578983783721924, "global_step": 110155, "epoch": 2622} {"train_loss": -6.52117919921875, "global_step": 110156, "epoch": 2622} {"train_loss": -6.308685779571533, "global_step": 110157, "epoch": 2622} {"train_loss": -6.480714797973633, "global_step": 110158, "epoch": 2622} {"train_loss": -6.34589958190918, "global_step": 110159, "epoch": 2622} {"train_loss": -6.430408000946045, "global_step": 110160, "epoch": 2622} {"train_loss": -6.407924175262451, "global_step": 110161, "epoch": 2622} {"train_loss": -6.418025016784668, "global_step": 110162, "epoch": 2622} {"train_loss": -6.438863754272461, "global_step": 110163, "epoch": 2622} {"train_loss": -6.587821960449219, "global_step": 110164, "epoch": 2622} {"train_loss": -6.434468575886318, "global_step": 110165, "epoch": 2622, "val_loss": 67791.4765625} {"train_loss": -6.590242385864258, "global_step": 110166, "epoch": 2623} {"train_loss": -6.461680889129639, "global_step": 110167, "epoch": 2623} {"train_loss": -6.391219615936279, "global_step": 110168, "epoch": 2623} {"train_loss": -6.406325817108154, "global_step": 110169, "epoch": 2623} {"train_loss": -6.390398979187012, "global_step": 110170, "epoch": 2623} {"train_loss": -6.472512245178223, "global_step": 110171, "epoch": 2623} {"train_loss": -6.347173690795898, "global_step": 110172, "epoch": 2623} {"train_loss": -6.311001777648926, "global_step": 110173, "epoch": 2623} {"train_loss": -6.406707763671875, "global_step": 110174, "epoch": 2623} {"train_loss": -6.446450233459473, "global_step": 110175, "epoch": 2623} {"train_loss": -6.378714561462402, "global_step": 110176, "epoch": 2623} {"train_loss": -6.446014881134033, "global_step": 110177, "epoch": 2623} {"train_loss": -6.474665641784668, "global_step": 110178, "epoch": 2623} {"train_loss": -6.353973388671875, "global_step": 110179, "epoch": 2623} {"train_loss": -6.404630661010742, "global_step": 110180, "epoch": 2623} {"train_loss": -6.43406867980957, "global_step": 110181, "epoch": 2623} {"train_loss": -6.39793586730957, "global_step": 110182, "epoch": 2623} {"train_loss": -6.419776916503906, "global_step": 110183, "epoch": 2623} {"train_loss": -6.49030065536499, "global_step": 110184, "epoch": 2623} {"train_loss": -6.548681735992432, "global_step": 110185, "epoch": 2623} {"train_loss": -6.475497722625732, "global_step": 110186, "epoch": 2623} {"train_loss": -6.357903957366943, "global_step": 110187, "epoch": 2623} {"train_loss": -6.443183898925781, "global_step": 110188, "epoch": 2623} {"train_loss": -6.344452857971191, "global_step": 110189, "epoch": 2623} {"train_loss": -6.536211013793945, "global_step": 110190, "epoch": 2623} {"train_loss": -6.4617743492126465, "global_step": 110191, "epoch": 2623} {"train_loss": -6.480659484863281, "global_step": 110192, "epoch": 2623} {"train_loss": -6.460732936859131, "global_step": 110193, "epoch": 2623} {"train_loss": -6.501893997192383, "global_step": 110194, "epoch": 2623} {"train_loss": -6.528072834014893, "global_step": 110195, "epoch": 2623} {"train_loss": -6.538211822509766, "global_step": 110196, "epoch": 2623} {"train_loss": -6.377228736877441, "global_step": 110197, "epoch": 2623} {"train_loss": -6.437740325927734, "global_step": 110198, "epoch": 2623} {"train_loss": -6.478370666503906, "global_step": 110199, "epoch": 2623} {"train_loss": -6.3762311935424805, "global_step": 110200, "epoch": 2623} {"train_loss": -6.482388496398926, "global_step": 110201, "epoch": 2623} {"train_loss": -6.423932075500488, "global_step": 110202, "epoch": 2623} {"train_loss": -6.419564723968506, "global_step": 110203, "epoch": 2623} {"train_loss": -6.517338752746582, "global_step": 110204, "epoch": 2623} {"train_loss": -6.444056510925293, "global_step": 110205, "epoch": 2623} {"train_loss": -6.316620826721191, "global_step": 110206, "epoch": 2623} {"train_loss": -6.4365169661385675, "global_step": 110207, "epoch": 2623, "val_loss": 68148.609375} {"train_loss": -6.3270263671875, "global_step": 110208, "epoch": 2624} {"train_loss": -6.406652927398682, "global_step": 110209, "epoch": 2624} {"train_loss": -6.423431396484375, "global_step": 110210, "epoch": 2624} {"train_loss": -6.342995643615723, "global_step": 110211, "epoch": 2624} {"train_loss": -6.538144111633301, "global_step": 110212, "epoch": 2624} {"train_loss": -6.337148666381836, "global_step": 110213, "epoch": 2624} {"train_loss": -6.409970283508301, "global_step": 110214, "epoch": 2624} {"train_loss": -6.439637184143066, "global_step": 110215, "epoch": 2624} {"train_loss": -6.500945568084717, "global_step": 110216, "epoch": 2624} {"train_loss": -6.49299430847168, "global_step": 110217, "epoch": 2624} {"train_loss": -6.362250328063965, "global_step": 110218, "epoch": 2624} {"train_loss": -6.426652908325195, "global_step": 110219, "epoch": 2624} {"train_loss": -6.482168674468994, "global_step": 110220, "epoch": 2624} {"train_loss": -6.478883266448975, "global_step": 110221, "epoch": 2624} {"train_loss": -6.39478874206543, "global_step": 110222, "epoch": 2624} {"train_loss": -6.478868007659912, "global_step": 110223, "epoch": 2624} {"train_loss": -6.4175262451171875, "global_step": 110224, "epoch": 2624} {"train_loss": -6.433358192443848, "global_step": 110225, "epoch": 2624} {"train_loss": -6.384581565856934, "global_step": 110226, "epoch": 2624} {"train_loss": -6.554515838623047, "global_step": 110227, "epoch": 2624} {"train_loss": -6.338422775268555, "global_step": 110228, "epoch": 2624} {"train_loss": -6.4081034660339355, "global_step": 110229, "epoch": 2624} {"train_loss": -6.422898292541504, "global_step": 110230, "epoch": 2624} {"train_loss": -6.436561584472656, "global_step": 110231, "epoch": 2624} {"train_loss": -6.275461196899414, "global_step": 110232, "epoch": 2624} {"train_loss": -6.465798854827881, "global_step": 110233, "epoch": 2624} {"train_loss": -6.303222179412842, "global_step": 110234, "epoch": 2624} {"train_loss": -6.4322381019592285, "global_step": 110235, "epoch": 2624} {"train_loss": -6.279160499572754, "global_step": 110236, "epoch": 2624} {"train_loss": -6.381841659545898, "global_step": 110237, "epoch": 2624} {"train_loss": -6.388850212097168, "global_step": 110238, "epoch": 2624} {"train_loss": -6.457347393035889, "global_step": 110239, "epoch": 2624} {"train_loss": -6.381261825561523, "global_step": 110240, "epoch": 2624} {"train_loss": -6.414411544799805, "global_step": 110241, "epoch": 2624} {"train_loss": -6.4033002853393555, "global_step": 110242, "epoch": 2624} {"train_loss": -6.390127658843994, "global_step": 110243, "epoch": 2624} {"train_loss": -6.399089813232422, "global_step": 110244, "epoch": 2624} {"train_loss": -6.387537002563477, "global_step": 110245, "epoch": 2624} {"train_loss": -6.367798328399658, "global_step": 110246, "epoch": 2624} {"train_loss": -6.4361772537231445, "global_step": 110247, "epoch": 2624} {"train_loss": -6.365556716918945, "global_step": 110248, "epoch": 2624} {"train_loss": -6.407606329236712, "global_step": 110249, "epoch": 2624, "val_loss": 67935.625} {"train_loss": -6.441094398498535, "global_step": 110250, "epoch": 2625} {"train_loss": -6.481073379516602, "global_step": 110251, "epoch": 2625} {"train_loss": -6.421682834625244, "global_step": 110252, "epoch": 2625} {"train_loss": -6.477519989013672, "global_step": 110253, "epoch": 2625} {"train_loss": -6.507366180419922, "global_step": 110254, "epoch": 2625} {"train_loss": -6.459150314331055, "global_step": 110255, "epoch": 2625} {"train_loss": -6.404979228973389, "global_step": 110256, "epoch": 2625} {"train_loss": -6.505768775939941, "global_step": 110257, "epoch": 2625} {"train_loss": -6.434420108795166, "global_step": 110258, "epoch": 2625} {"train_loss": -6.461172103881836, "global_step": 110259, "epoch": 2625} {"train_loss": -6.408425331115723, "global_step": 110260, "epoch": 2625} {"train_loss": -6.471430778503418, "global_step": 110261, "epoch": 2625} {"train_loss": -6.40109920501709, "global_step": 110262, "epoch": 2625} {"train_loss": -6.395653247833252, "global_step": 110263, "epoch": 2625} {"train_loss": -6.399532318115234, "global_step": 110264, "epoch": 2625} {"train_loss": -6.491408348083496, "global_step": 110265, "epoch": 2625} {"train_loss": -6.52709436416626, "global_step": 110266, "epoch": 2625} {"train_loss": -6.447556495666504, "global_step": 110267, "epoch": 2625} {"train_loss": -6.501936912536621, "global_step": 110268, "epoch": 2625} {"train_loss": -6.476120948791504, "global_step": 110269, "epoch": 2625} {"train_loss": -6.465841293334961, "global_step": 110270, "epoch": 2625} {"train_loss": -6.437145233154297, "global_step": 110271, "epoch": 2625} {"train_loss": -6.465629577636719, "global_step": 110272, "epoch": 2625} {"train_loss": -6.471982002258301, "global_step": 110273, "epoch": 2625} {"train_loss": -6.279839038848877, "global_step": 110274, "epoch": 2625} {"train_loss": -6.550169944763184, "global_step": 110275, "epoch": 2625} {"train_loss": -6.4265289306640625, "global_step": 110276, "epoch": 2625} {"train_loss": -6.439145088195801, "global_step": 110277, "epoch": 2625} {"train_loss": -6.472230911254883, "global_step": 110278, "epoch": 2625} {"train_loss": -6.466301918029785, "global_step": 110279, "epoch": 2625} {"train_loss": -6.341161251068115, "global_step": 110280, "epoch": 2625} {"train_loss": -6.485711574554443, "global_step": 110281, "epoch": 2625} {"train_loss": -6.327010154724121, "global_step": 110282, "epoch": 2625} {"train_loss": -6.450543403625488, "global_step": 110283, "epoch": 2625} {"train_loss": -6.447660446166992, "global_step": 110284, "epoch": 2625} {"train_loss": -6.471792697906494, "global_step": 110285, "epoch": 2625} {"train_loss": -6.414278507232666, "global_step": 110286, "epoch": 2625} {"train_loss": -6.418201446533203, "global_step": 110287, "epoch": 2625} {"train_loss": -6.436700820922852, "global_step": 110288, "epoch": 2625} {"train_loss": -6.467659950256348, "global_step": 110289, "epoch": 2625} {"train_loss": -6.5579376220703125, "global_step": 110290, "epoch": 2625} {"train_loss": -6.448607660475231, "global_step": 110291, "epoch": 2625, "val_loss": 67814.3359375} {"train_loss": -6.478349685668945, "global_step": 110292, "epoch": 2626} {"train_loss": -6.484910011291504, "global_step": 110293, "epoch": 2626} {"train_loss": -6.337091445922852, "global_step": 110294, "epoch": 2626} {"train_loss": -6.332995414733887, "global_step": 110295, "epoch": 2626} {"train_loss": -6.339706897735596, "global_step": 110296, "epoch": 2626} {"train_loss": -6.566359519958496, "global_step": 110297, "epoch": 2626} {"train_loss": -6.4858856201171875, "global_step": 110298, "epoch": 2626} {"train_loss": -6.523982048034668, "global_step": 110299, "epoch": 2626} {"train_loss": -6.576557636260986, "global_step": 110300, "epoch": 2626} {"train_loss": -6.516181945800781, "global_step": 110301, "epoch": 2626} {"train_loss": -6.540781021118164, "global_step": 110302, "epoch": 2626} {"train_loss": -6.5105719566345215, "global_step": 110303, "epoch": 2626} {"train_loss": -6.510173320770264, "global_step": 110304, "epoch": 2626} {"train_loss": -6.5690507888793945, "global_step": 110305, "epoch": 2626} {"train_loss": -6.424921989440918, "global_step": 110306, "epoch": 2626} {"train_loss": -6.497889995574951, "global_step": 110307, "epoch": 2626} {"train_loss": -6.50048303604126, "global_step": 110308, "epoch": 2626} {"train_loss": -6.525322914123535, "global_step": 110309, "epoch": 2626} {"train_loss": -6.490901947021484, "global_step": 110310, "epoch": 2626} {"train_loss": -6.444710731506348, "global_step": 110311, "epoch": 2626} {"train_loss": -6.510711193084717, "global_step": 110312, "epoch": 2626} {"train_loss": -6.487391471862793, "global_step": 110313, "epoch": 2626} {"train_loss": -6.433321475982666, "global_step": 110314, "epoch": 2626} {"train_loss": -6.453632354736328, "global_step": 110315, "epoch": 2626} {"train_loss": -6.454975128173828, "global_step": 110316, "epoch": 2626} {"train_loss": -6.351903438568115, "global_step": 110317, "epoch": 2626} {"train_loss": -6.39688777923584, "global_step": 110318, "epoch": 2626} {"train_loss": -6.425219535827637, "global_step": 110319, "epoch": 2626} {"train_loss": -6.505809307098389, "global_step": 110320, "epoch": 2626} {"train_loss": -6.418288230895996, "global_step": 110321, "epoch": 2626} {"train_loss": -6.60554313659668, "global_step": 110322, "epoch": 2626} {"train_loss": -6.392383575439453, "global_step": 110323, "epoch": 2626} {"train_loss": -6.42899227142334, "global_step": 110324, "epoch": 2626} {"train_loss": -6.401317119598389, "global_step": 110325, "epoch": 2626} {"train_loss": -6.519412517547607, "global_step": 110326, "epoch": 2626} {"train_loss": -6.372564315795898, "global_step": 110327, "epoch": 2626} {"train_loss": -6.407205104827881, "global_step": 110328, "epoch": 2626} {"train_loss": -6.44223165512085, "global_step": 110329, "epoch": 2626} {"train_loss": -6.483523368835449, "global_step": 110330, "epoch": 2626} {"train_loss": -6.488247871398926, "global_step": 110331, "epoch": 2626} {"train_loss": -6.363141059875488, "global_step": 110332, "epoch": 2626} {"train_loss": -6.463421889713833, "global_step": 110333, "epoch": 2626, "val_loss": 67865.921875} {"train_loss": -6.4716668128967285, "global_step": 110334, "epoch": 2627} {"train_loss": -6.394761085510254, "global_step": 110335, "epoch": 2627} {"train_loss": -6.514119625091553, "global_step": 110336, "epoch": 2627} {"train_loss": -6.431263446807861, "global_step": 110337, "epoch": 2627} {"train_loss": -6.4572343826293945, "global_step": 110338, "epoch": 2627} {"train_loss": -6.525428295135498, "global_step": 110339, "epoch": 2627} {"train_loss": -6.4161176681518555, "global_step": 110340, "epoch": 2627} {"train_loss": -6.4349684715271, "global_step": 110341, "epoch": 2627} {"train_loss": -6.453275680541992, "global_step": 110342, "epoch": 2627} {"train_loss": -6.430642604827881, "global_step": 110343, "epoch": 2627} {"train_loss": -6.481379985809326, "global_step": 110344, "epoch": 2627} {"train_loss": -6.624176025390625, "global_step": 110345, "epoch": 2627} {"train_loss": -6.426723480224609, "global_step": 110346, "epoch": 2627} {"train_loss": -6.375572204589844, "global_step": 110347, "epoch": 2627} {"train_loss": -6.32136869430542, "global_step": 110348, "epoch": 2627} {"train_loss": -6.388641357421875, "global_step": 110349, "epoch": 2627} {"train_loss": -6.53128719329834, "global_step": 110350, "epoch": 2627} {"train_loss": -6.442388534545898, "global_step": 110351, "epoch": 2627} {"train_loss": -6.4537248611450195, "global_step": 110352, "epoch": 2627} {"train_loss": -6.387725353240967, "global_step": 110353, "epoch": 2627} {"train_loss": -6.544645309448242, "global_step": 110354, "epoch": 2627} {"train_loss": -6.327428817749023, "global_step": 110355, "epoch": 2627} {"train_loss": -6.495626449584961, "global_step": 110356, "epoch": 2627} {"train_loss": -6.493278503417969, "global_step": 110357, "epoch": 2627} {"train_loss": -6.432089805603027, "global_step": 110358, "epoch": 2627} {"train_loss": -6.496682167053223, "global_step": 110359, "epoch": 2627} {"train_loss": -6.333362579345703, "global_step": 110360, "epoch": 2627} {"train_loss": -6.538585662841797, "global_step": 110361, "epoch": 2627} {"train_loss": -6.32150411605835, "global_step": 110362, "epoch": 2627} {"train_loss": -6.341591835021973, "global_step": 110363, "epoch": 2627} {"train_loss": -6.418588638305664, "global_step": 110364, "epoch": 2627} {"train_loss": -6.285088539123535, "global_step": 110365, "epoch": 2627} {"train_loss": -6.48321533203125, "global_step": 110366, "epoch": 2627} {"train_loss": -6.3847198486328125, "global_step": 110367, "epoch": 2627} {"train_loss": -6.489789962768555, "global_step": 110368, "epoch": 2627} {"train_loss": -6.3292741775512695, "global_step": 110369, "epoch": 2627} {"train_loss": -6.300840377807617, "global_step": 110370, "epoch": 2627} {"train_loss": -6.417810916900635, "global_step": 110371, "epoch": 2627} {"train_loss": -6.304937362670898, "global_step": 110372, "epoch": 2627} {"train_loss": -6.477170944213867, "global_step": 110373, "epoch": 2627} {"train_loss": -6.340900421142578, "global_step": 110374, "epoch": 2627} {"train_loss": -6.4243922006516225, "global_step": 110375, "epoch": 2627, "val_loss": 67956.1875} {"train_loss": -6.401342868804932, "global_step": 110376, "epoch": 2628} {"train_loss": -6.402323246002197, "global_step": 110377, "epoch": 2628} {"train_loss": -6.38727331161499, "global_step": 110378, "epoch": 2628} {"train_loss": -6.455921173095703, "global_step": 110379, "epoch": 2628} {"train_loss": -6.411130905151367, "global_step": 110380, "epoch": 2628} {"train_loss": -6.317872524261475, "global_step": 110381, "epoch": 2628} {"train_loss": -6.4715256690979, "global_step": 110382, "epoch": 2628} {"train_loss": -6.4162421226501465, "global_step": 110383, "epoch": 2628} {"train_loss": -6.41446590423584, "global_step": 110384, "epoch": 2628} {"train_loss": -6.5429887771606445, "global_step": 110385, "epoch": 2628} {"train_loss": -6.4768242835998535, "global_step": 110386, "epoch": 2628} {"train_loss": -6.4151225090026855, "global_step": 110387, "epoch": 2628} {"train_loss": -6.447326183319092, "global_step": 110388, "epoch": 2628} {"train_loss": -6.45680570602417, "global_step": 110389, "epoch": 2628} {"train_loss": -6.37465238571167, "global_step": 110390, "epoch": 2628} {"train_loss": -6.433571815490723, "global_step": 110391, "epoch": 2628} {"train_loss": -6.54359245300293, "global_step": 110392, "epoch": 2628} {"train_loss": -6.434439182281494, "global_step": 110393, "epoch": 2628} {"train_loss": -6.431347846984863, "global_step": 110394, "epoch": 2628} {"train_loss": -6.501964569091797, "global_step": 110395, "epoch": 2628} {"train_loss": -6.316117286682129, "global_step": 110396, "epoch": 2628} {"train_loss": -6.41886568069458, "global_step": 110397, "epoch": 2628} {"train_loss": -6.4032158851623535, "global_step": 110398, "epoch": 2628} {"train_loss": -6.437665939331055, "global_step": 110399, "epoch": 2628} {"train_loss": -6.462606906890869, "global_step": 110400, "epoch": 2628} {"train_loss": -6.354667663574219, "global_step": 110401, "epoch": 2628} {"train_loss": -6.471177101135254, "global_step": 110402, "epoch": 2628} {"train_loss": -6.412677764892578, "global_step": 110403, "epoch": 2628} {"train_loss": -6.439882755279541, "global_step": 110404, "epoch": 2628} {"train_loss": -6.373816013336182, "global_step": 110405, "epoch": 2628} {"train_loss": -6.388999938964844, "global_step": 110406, "epoch": 2628} {"train_loss": -6.52677059173584, "global_step": 110407, "epoch": 2628} {"train_loss": -6.371070861816406, "global_step": 110408, "epoch": 2628} {"train_loss": -6.375705242156982, "global_step": 110409, "epoch": 2628} {"train_loss": -6.395158767700195, "global_step": 110410, "epoch": 2628} {"train_loss": -6.412229537963867, "global_step": 110411, "epoch": 2628} {"train_loss": -6.41463565826416, "global_step": 110412, "epoch": 2628} {"train_loss": -6.347428321838379, "global_step": 110413, "epoch": 2628} {"train_loss": -6.328183650970459, "global_step": 110414, "epoch": 2628} {"train_loss": -6.494032859802246, "global_step": 110415, "epoch": 2628} {"train_loss": -6.478756904602051, "global_step": 110416, "epoch": 2628} {"train_loss": -6.423551979519072, "global_step": 110417, "epoch": 2628, "val_loss": 67937.2578125} {"train_loss": -6.455642223358154, "global_step": 110418, "epoch": 2629} {"train_loss": -6.593435287475586, "global_step": 110419, "epoch": 2629} {"train_loss": -6.574698448181152, "global_step": 110420, "epoch": 2629} {"train_loss": -6.48581075668335, "global_step": 110421, "epoch": 2629} {"train_loss": -6.512650012969971, "global_step": 110422, "epoch": 2629} {"train_loss": -6.506516456604004, "global_step": 110423, "epoch": 2629} {"train_loss": -6.555122375488281, "global_step": 110424, "epoch": 2629} {"train_loss": -6.412744522094727, "global_step": 110425, "epoch": 2629} {"train_loss": -6.502887725830078, "global_step": 110426, "epoch": 2629} {"train_loss": -6.369024276733398, "global_step": 110427, "epoch": 2629} {"train_loss": -6.453180313110352, "global_step": 110428, "epoch": 2629} {"train_loss": -6.397214889526367, "global_step": 110429, "epoch": 2629} {"train_loss": -6.430706024169922, "global_step": 110430, "epoch": 2629} {"train_loss": -6.33985710144043, "global_step": 110431, "epoch": 2629} {"train_loss": -6.46584939956665, "global_step": 110432, "epoch": 2629} {"train_loss": -6.498610019683838, "global_step": 110433, "epoch": 2629} {"train_loss": -6.542105197906494, "global_step": 110434, "epoch": 2629} {"train_loss": -6.475950717926025, "global_step": 110435, "epoch": 2629} {"train_loss": -6.436861038208008, "global_step": 110436, "epoch": 2629} {"train_loss": -6.277618408203125, "global_step": 110437, "epoch": 2629} {"train_loss": -6.501913070678711, "global_step": 110438, "epoch": 2629} {"train_loss": -6.477278232574463, "global_step": 110439, "epoch": 2629} {"train_loss": -6.421849250793457, "global_step": 110440, "epoch": 2629} {"train_loss": -6.30927848815918, "global_step": 110441, "epoch": 2629} {"train_loss": -6.549775123596191, "global_step": 110442, "epoch": 2629} {"train_loss": -6.460382461547852, "global_step": 110443, "epoch": 2629} {"train_loss": -6.3868408203125, "global_step": 110444, "epoch": 2629} {"train_loss": -6.564858436584473, "global_step": 110445, "epoch": 2629} {"train_loss": -6.32372522354126, "global_step": 110446, "epoch": 2629} {"train_loss": -6.373524188995361, "global_step": 110447, "epoch": 2629} {"train_loss": -6.444206237792969, "global_step": 110448, "epoch": 2629} {"train_loss": -6.496298313140869, "global_step": 110449, "epoch": 2629} {"train_loss": -6.492859840393066, "global_step": 110450, "epoch": 2629} {"train_loss": -6.415599822998047, "global_step": 110451, "epoch": 2629} {"train_loss": -6.399560928344727, "global_step": 110452, "epoch": 2629} {"train_loss": -6.518396854400635, "global_step": 110453, "epoch": 2629} {"train_loss": -6.461362838745117, "global_step": 110454, "epoch": 2629} {"train_loss": -6.467439651489258, "global_step": 110455, "epoch": 2629} {"train_loss": -6.434131622314453, "global_step": 110456, "epoch": 2629} {"train_loss": -6.327645301818848, "global_step": 110457, "epoch": 2629} {"train_loss": -6.390212059020996, "global_step": 110458, "epoch": 2629} {"train_loss": -6.45327565783546, "global_step": 110459, "epoch": 2629, "val_loss": 67896.984375} {"train_loss": -6.398487567901611, "global_step": 110460, "epoch": 2630} {"train_loss": -6.368535041809082, "global_step": 110461, "epoch": 2630} {"train_loss": -6.502204418182373, "global_step": 110462, "epoch": 2630} {"train_loss": -6.4392900466918945, "global_step": 110463, "epoch": 2630} {"train_loss": -6.430934906005859, "global_step": 110464, "epoch": 2630} {"train_loss": -6.406506538391113, "global_step": 110465, "epoch": 2630} {"train_loss": -6.461914539337158, "global_step": 110466, "epoch": 2630} {"train_loss": -6.566061973571777, "global_step": 110467, "epoch": 2630} {"train_loss": -6.413710594177246, "global_step": 110468, "epoch": 2630} {"train_loss": -6.492051124572754, "global_step": 110469, "epoch": 2630} {"train_loss": -6.4777069091796875, "global_step": 110470, "epoch": 2630} {"train_loss": -6.423413276672363, "global_step": 110471, "epoch": 2630} {"train_loss": -6.56869649887085, "global_step": 110472, "epoch": 2630} {"train_loss": -6.381600379943848, "global_step": 110473, "epoch": 2630} {"train_loss": -6.286891937255859, "global_step": 110474, "epoch": 2630} {"train_loss": -6.441860675811768, "global_step": 110475, "epoch": 2630} {"train_loss": -6.584161758422852, "global_step": 110476, "epoch": 2630} {"train_loss": -6.390408039093018, "global_step": 110477, "epoch": 2630} {"train_loss": -6.423791408538818, "global_step": 110478, "epoch": 2630} {"train_loss": -6.3762898445129395, "global_step": 110479, "epoch": 2630} {"train_loss": -6.341034889221191, "global_step": 110480, "epoch": 2630} {"train_loss": -6.390790939331055, "global_step": 110481, "epoch": 2630} {"train_loss": -6.462039947509766, "global_step": 110482, "epoch": 2630} {"train_loss": -6.413108825683594, "global_step": 110483, "epoch": 2630} {"train_loss": -6.482813358306885, "global_step": 110484, "epoch": 2630} {"train_loss": -6.446117401123047, "global_step": 110485, "epoch": 2630} {"train_loss": -6.300803184509277, "global_step": 110486, "epoch": 2630} {"train_loss": -6.501842498779297, "global_step": 110487, "epoch": 2630} {"train_loss": -6.502506732940674, "global_step": 110488, "epoch": 2630} {"train_loss": -6.399691581726074, "global_step": 110489, "epoch": 2630} {"train_loss": -6.447456359863281, "global_step": 110490, "epoch": 2630} {"train_loss": -6.457149028778076, "global_step": 110491, "epoch": 2630} {"train_loss": -6.429783821105957, "global_step": 110492, "epoch": 2630} {"train_loss": -6.376526832580566, "global_step": 110493, "epoch": 2630} {"train_loss": -6.468868732452393, "global_step": 110494, "epoch": 2630} {"train_loss": -6.529901504516602, "global_step": 110495, "epoch": 2630} {"train_loss": -6.481749534606934, "global_step": 110496, "epoch": 2630} {"train_loss": -6.368870735168457, "global_step": 110497, "epoch": 2630} {"train_loss": -6.472232818603516, "global_step": 110498, "epoch": 2630} {"train_loss": -6.460299491882324, "global_step": 110499, "epoch": 2630} {"train_loss": -6.46919059753418, "global_step": 110500, "epoch": 2630} {"train_loss": -6.4403876804170155, "global_step": 110501, "epoch": 2630, "val_loss": 67831.25} {"train_loss": -6.543990135192871, "global_step": 110502, "epoch": 2631} {"train_loss": -6.3836350440979, "global_step": 110503, "epoch": 2631} {"train_loss": -6.484931945800781, "global_step": 110504, "epoch": 2631} {"train_loss": -6.555715560913086, "global_step": 110505, "epoch": 2631} {"train_loss": -6.402604579925537, "global_step": 110506, "epoch": 2631} {"train_loss": -6.360882759094238, "global_step": 110507, "epoch": 2631} {"train_loss": -6.399631500244141, "global_step": 110508, "epoch": 2631} {"train_loss": -6.428299903869629, "global_step": 110509, "epoch": 2631} {"train_loss": -6.286812782287598, "global_step": 110510, "epoch": 2631} {"train_loss": -6.434572219848633, "global_step": 110511, "epoch": 2631} {"train_loss": -6.40993595123291, "global_step": 110512, "epoch": 2631} {"train_loss": -6.389854431152344, "global_step": 110513, "epoch": 2631} {"train_loss": -6.391299247741699, "global_step": 110514, "epoch": 2631} {"train_loss": -6.376066207885742, "global_step": 110515, "epoch": 2631} {"train_loss": -6.37342643737793, "global_step": 110516, "epoch": 2631} {"train_loss": -6.220212459564209, "global_step": 110517, "epoch": 2631} {"train_loss": -6.554997444152832, "global_step": 110518, "epoch": 2631} {"train_loss": -6.475323677062988, "global_step": 110519, "epoch": 2631} {"train_loss": -6.426176071166992, "global_step": 110520, "epoch": 2631} {"train_loss": -6.362544059753418, "global_step": 110521, "epoch": 2631} {"train_loss": -6.404024124145508, "global_step": 110522, "epoch": 2631} {"train_loss": -6.464562892913818, "global_step": 110523, "epoch": 2631} {"train_loss": -6.425823211669922, "global_step": 110524, "epoch": 2631} {"train_loss": -6.492708206176758, "global_step": 110525, "epoch": 2631} {"train_loss": -6.318778991699219, "global_step": 110526, "epoch": 2631} {"train_loss": -6.51307487487793, "global_step": 110527, "epoch": 2631} {"train_loss": -6.313244342803955, "global_step": 110528, "epoch": 2631} {"train_loss": -6.400948524475098, "global_step": 110529, "epoch": 2631} {"train_loss": -6.409843444824219, "global_step": 110530, "epoch": 2631} {"train_loss": -6.435303211212158, "global_step": 110531, "epoch": 2631} {"train_loss": -6.413689613342285, "global_step": 110532, "epoch": 2631} {"train_loss": -6.388435363769531, "global_step": 110533, "epoch": 2631} {"train_loss": -6.499875545501709, "global_step": 110534, "epoch": 2631} {"train_loss": -6.447605133056641, "global_step": 110535, "epoch": 2631} {"train_loss": -6.452297210693359, "global_step": 110536, "epoch": 2631} {"train_loss": -6.622920513153076, "global_step": 110537, "epoch": 2631} {"train_loss": -6.522854804992676, "global_step": 110538, "epoch": 2631} {"train_loss": -6.523689270019531, "global_step": 110539, "epoch": 2631} {"train_loss": -6.306704044342041, "global_step": 110540, "epoch": 2631} {"train_loss": -6.459418296813965, "global_step": 110541, "epoch": 2631} {"train_loss": -6.369131088256836, "global_step": 110542, "epoch": 2631} {"train_loss": -6.427500747499012, "global_step": 110543, "epoch": 2631, "val_loss": 67795.2265625} {"train_loss": -6.469282150268555, "global_step": 110544, "epoch": 2632} {"train_loss": -6.4463396072387695, "global_step": 110545, "epoch": 2632} {"train_loss": -6.36726188659668, "global_step": 110546, "epoch": 2632} {"train_loss": -6.484763145446777, "global_step": 110547, "epoch": 2632} {"train_loss": -6.554182052612305, "global_step": 110548, "epoch": 2632} {"train_loss": -6.407437324523926, "global_step": 110549, "epoch": 2632} {"train_loss": -6.46917200088501, "global_step": 110550, "epoch": 2632} {"train_loss": -6.493575096130371, "global_step": 110551, "epoch": 2632} {"train_loss": -6.376001834869385, "global_step": 110552, "epoch": 2632} {"train_loss": -6.391493797302246, "global_step": 110553, "epoch": 2632} {"train_loss": -6.458854675292969, "global_step": 110554, "epoch": 2632} {"train_loss": -6.315993309020996, "global_step": 110555, "epoch": 2632} {"train_loss": -6.411620140075684, "global_step": 110556, "epoch": 2632} {"train_loss": -6.491628170013428, "global_step": 110557, "epoch": 2632} {"train_loss": -6.399560451507568, "global_step": 110558, "epoch": 2632} {"train_loss": -6.46196985244751, "global_step": 110559, "epoch": 2632} {"train_loss": -6.348832130432129, "global_step": 110560, "epoch": 2632} {"train_loss": -6.477901458740234, "global_step": 110561, "epoch": 2632} {"train_loss": -6.434113502502441, "global_step": 110562, "epoch": 2632} {"train_loss": -6.437034606933594, "global_step": 110563, "epoch": 2632} {"train_loss": -6.591299057006836, "global_step": 110564, "epoch": 2632} {"train_loss": -6.42365837097168, "global_step": 110565, "epoch": 2632} {"train_loss": -6.404531478881836, "global_step": 110566, "epoch": 2632} {"train_loss": -6.4108476638793945, "global_step": 110567, "epoch": 2632} {"train_loss": -6.524881362915039, "global_step": 110568, "epoch": 2632} {"train_loss": -6.414963245391846, "global_step": 110569, "epoch": 2632} {"train_loss": -6.494311809539795, "global_step": 110570, "epoch": 2632} {"train_loss": -6.466794490814209, "global_step": 110571, "epoch": 2632} {"train_loss": -6.414017677307129, "global_step": 110572, "epoch": 2632} {"train_loss": -6.605260848999023, "global_step": 110573, "epoch": 2632} {"train_loss": -6.49403715133667, "global_step": 110574, "epoch": 2632} {"train_loss": -6.531142234802246, "global_step": 110575, "epoch": 2632} {"train_loss": -6.527626991271973, "global_step": 110576, "epoch": 2632} {"train_loss": -6.479621887207031, "global_step": 110577, "epoch": 2632} {"train_loss": -6.405652046203613, "global_step": 110578, "epoch": 2632} {"train_loss": -6.49005126953125, "global_step": 110579, "epoch": 2632} {"train_loss": -6.448647499084473, "global_step": 110580, "epoch": 2632} {"train_loss": -6.43696403503418, "global_step": 110581, "epoch": 2632} {"train_loss": -6.467833995819092, "global_step": 110582, "epoch": 2632} {"train_loss": -6.381045341491699, "global_step": 110583, "epoch": 2632} {"train_loss": -6.310733795166016, "global_step": 110584, "epoch": 2632} {"train_loss": -6.450948749269758, "global_step": 110585, "epoch": 2632, "val_loss": 67930.515625} {"train_loss": -6.5122294425964355, "global_step": 110586, "epoch": 2633} {"train_loss": -6.430666446685791, "global_step": 110587, "epoch": 2633} {"train_loss": -6.542418479919434, "global_step": 110588, "epoch": 2633} {"train_loss": -6.515522003173828, "global_step": 110589, "epoch": 2633} {"train_loss": -6.583028793334961, "global_step": 110590, "epoch": 2633} {"train_loss": -6.5281572341918945, "global_step": 110591, "epoch": 2633} {"train_loss": -6.427079677581787, "global_step": 110592, "epoch": 2633} {"train_loss": -6.563256740570068, "global_step": 110593, "epoch": 2633} {"train_loss": -6.457353591918945, "global_step": 110594, "epoch": 2633} {"train_loss": -6.398929595947266, "global_step": 110595, "epoch": 2633} {"train_loss": -6.456464767456055, "global_step": 110596, "epoch": 2633} {"train_loss": -6.443842887878418, "global_step": 110597, "epoch": 2633} {"train_loss": -6.446068286895752, "global_step": 110598, "epoch": 2633} {"train_loss": -6.378368377685547, "global_step": 110599, "epoch": 2633} {"train_loss": -6.4537811279296875, "global_step": 110600, "epoch": 2633} {"train_loss": -6.497067928314209, "global_step": 110601, "epoch": 2633} {"train_loss": -6.427614212036133, "global_step": 110602, "epoch": 2633} {"train_loss": -6.43442440032959, "global_step": 110603, "epoch": 2633} {"train_loss": -6.476914882659912, "global_step": 110604, "epoch": 2633} {"train_loss": -6.509573936462402, "global_step": 110605, "epoch": 2633} {"train_loss": -6.388221740722656, "global_step": 110606, "epoch": 2633} {"train_loss": -6.448537826538086, "global_step": 110607, "epoch": 2633} {"train_loss": -6.493875503540039, "global_step": 110608, "epoch": 2633} {"train_loss": -6.346942901611328, "global_step": 110609, "epoch": 2633} {"train_loss": -6.441672325134277, "global_step": 110610, "epoch": 2633} {"train_loss": -6.47913932800293, "global_step": 110611, "epoch": 2633} {"train_loss": -6.428879737854004, "global_step": 110612, "epoch": 2633} {"train_loss": -6.407223701477051, "global_step": 110613, "epoch": 2633} {"train_loss": -6.451149940490723, "global_step": 110614, "epoch": 2633} {"train_loss": -6.4954657554626465, "global_step": 110615, "epoch": 2633} {"train_loss": -6.405609130859375, "global_step": 110616, "epoch": 2633} {"train_loss": -6.470686912536621, "global_step": 110617, "epoch": 2633} {"train_loss": -6.515181541442871, "global_step": 110618, "epoch": 2633} {"train_loss": -6.402003288269043, "global_step": 110619, "epoch": 2633} {"train_loss": -6.434968948364258, "global_step": 110620, "epoch": 2633} {"train_loss": -6.417296409606934, "global_step": 110621, "epoch": 2633} {"train_loss": -6.307066440582275, "global_step": 110622, "epoch": 2633} {"train_loss": -6.3201398849487305, "global_step": 110623, "epoch": 2633} {"train_loss": -6.363224029541016, "global_step": 110624, "epoch": 2633} {"train_loss": -6.3980488777160645, "global_step": 110625, "epoch": 2633} {"train_loss": -6.367218494415283, "global_step": 110626, "epoch": 2633} {"train_loss": -6.442743630636306, "global_step": 110627, "epoch": 2633, "val_loss": 67963.2109375} {"train_loss": -6.519432544708252, "global_step": 110628, "epoch": 2634} {"train_loss": -6.482030391693115, "global_step": 110629, "epoch": 2634} {"train_loss": -6.35740852355957, "global_step": 110630, "epoch": 2634} {"train_loss": -6.365939140319824, "global_step": 110631, "epoch": 2634} {"train_loss": -6.519688606262207, "global_step": 110632, "epoch": 2634} {"train_loss": -6.443546295166016, "global_step": 110633, "epoch": 2634} {"train_loss": -6.463532447814941, "global_step": 110634, "epoch": 2634} {"train_loss": -6.496264457702637, "global_step": 110635, "epoch": 2634} {"train_loss": -6.453303337097168, "global_step": 110636, "epoch": 2634} {"train_loss": -6.390375137329102, "global_step": 110637, "epoch": 2634} {"train_loss": -6.454679012298584, "global_step": 110638, "epoch": 2634} {"train_loss": -6.452847480773926, "global_step": 110639, "epoch": 2634} {"train_loss": -6.4518513679504395, "global_step": 110640, "epoch": 2634} {"train_loss": -6.512040615081787, "global_step": 110641, "epoch": 2634} {"train_loss": -6.402020454406738, "global_step": 110642, "epoch": 2634} {"train_loss": -6.459137916564941, "global_step": 110643, "epoch": 2634} {"train_loss": -6.533083915710449, "global_step": 110644, "epoch": 2634} {"train_loss": -6.389894008636475, "global_step": 110645, "epoch": 2634} {"train_loss": -6.441327095031738, "global_step": 110646, "epoch": 2634} {"train_loss": -6.490737438201904, "global_step": 110647, "epoch": 2634} {"train_loss": -6.437414646148682, "global_step": 110648, "epoch": 2634} {"train_loss": -6.581972122192383, "global_step": 110649, "epoch": 2634} {"train_loss": -6.443321228027344, "global_step": 110650, "epoch": 2634} {"train_loss": -6.436924934387207, "global_step": 110651, "epoch": 2634} {"train_loss": -6.38212776184082, "global_step": 110652, "epoch": 2634} {"train_loss": -6.403747081756592, "global_step": 110653, "epoch": 2634} {"train_loss": -6.516031265258789, "global_step": 110654, "epoch": 2634} {"train_loss": -6.446496963500977, "global_step": 110655, "epoch": 2634} {"train_loss": -6.458081245422363, "global_step": 110656, "epoch": 2634} {"train_loss": -6.418506622314453, "global_step": 110657, "epoch": 2634} {"train_loss": -6.443640232086182, "global_step": 110658, "epoch": 2634} {"train_loss": -6.592681407928467, "global_step": 110659, "epoch": 2634} {"train_loss": -6.5286641120910645, "global_step": 110660, "epoch": 2634} {"train_loss": -6.502416133880615, "global_step": 110661, "epoch": 2634} {"train_loss": -6.442413330078125, "global_step": 110662, "epoch": 2634} {"train_loss": -6.4238362312316895, "global_step": 110663, "epoch": 2634} {"train_loss": -6.5741987228393555, "global_step": 110664, "epoch": 2634} {"train_loss": -6.489132881164551, "global_step": 110665, "epoch": 2634} {"train_loss": -6.359382629394531, "global_step": 110666, "epoch": 2634} {"train_loss": -6.535944938659668, "global_step": 110667, "epoch": 2634} {"train_loss": -6.485713005065918, "global_step": 110668, "epoch": 2634} {"train_loss": -6.464311270486741, "global_step": 110669, "epoch": 2634, "val_loss": 67905.75} {"train_loss": -6.445514678955078, "global_step": 110670, "epoch": 2635} {"train_loss": -6.381640911102295, "global_step": 110671, "epoch": 2635} {"train_loss": -6.40766716003418, "global_step": 110672, "epoch": 2635} {"train_loss": -6.371644020080566, "global_step": 110673, "epoch": 2635} {"train_loss": -6.370668411254883, "global_step": 110674, "epoch": 2635} {"train_loss": -6.286185264587402, "global_step": 110675, "epoch": 2635} {"train_loss": -6.412738800048828, "global_step": 110676, "epoch": 2635} {"train_loss": -6.431475639343262, "global_step": 110677, "epoch": 2635} {"train_loss": -6.395902633666992, "global_step": 110678, "epoch": 2635} {"train_loss": -6.515196323394775, "global_step": 110679, "epoch": 2635} {"train_loss": -6.461030960083008, "global_step": 110680, "epoch": 2635} {"train_loss": -6.433253765106201, "global_step": 110681, "epoch": 2635} {"train_loss": -6.436595439910889, "global_step": 110682, "epoch": 2635} {"train_loss": -6.398601531982422, "global_step": 110683, "epoch": 2635} {"train_loss": -6.349246025085449, "global_step": 110684, "epoch": 2635} {"train_loss": -6.446678161621094, "global_step": 110685, "epoch": 2635} {"train_loss": -6.365791320800781, "global_step": 110686, "epoch": 2635} {"train_loss": -6.348183631896973, "global_step": 110687, "epoch": 2635} {"train_loss": -6.385852813720703, "global_step": 110688, "epoch": 2635} {"train_loss": -6.4351115226745605, "global_step": 110689, "epoch": 2635} {"train_loss": -6.612619400024414, "global_step": 110690, "epoch": 2635} {"train_loss": -6.459670066833496, "global_step": 110691, "epoch": 2635} {"train_loss": -6.436302185058594, "global_step": 110692, "epoch": 2635} {"train_loss": -6.410017013549805, "global_step": 110693, "epoch": 2635} {"train_loss": -6.485632419586182, "global_step": 110694, "epoch": 2635} {"train_loss": -6.406380653381348, "global_step": 110695, "epoch": 2635} {"train_loss": -6.424093723297119, "global_step": 110696, "epoch": 2635} {"train_loss": -6.515413284301758, "global_step": 110697, "epoch": 2635} {"train_loss": -6.477686882019043, "global_step": 110698, "epoch": 2635} {"train_loss": -6.490360260009766, "global_step": 110699, "epoch": 2635} {"train_loss": -6.451506614685059, "global_step": 110700, "epoch": 2635} {"train_loss": -6.425456523895264, "global_step": 110701, "epoch": 2635} {"train_loss": -6.420114994049072, "global_step": 110702, "epoch": 2635} {"train_loss": -6.397177696228027, "global_step": 110703, "epoch": 2635} {"train_loss": -6.507987022399902, "global_step": 110704, "epoch": 2635} {"train_loss": -6.487964153289795, "global_step": 110705, "epoch": 2635} {"train_loss": -6.400091171264648, "global_step": 110706, "epoch": 2635} {"train_loss": -6.2915191650390625, "global_step": 110707, "epoch": 2635} {"train_loss": -6.450444221496582, "global_step": 110708, "epoch": 2635} {"train_loss": -6.427087306976318, "global_step": 110709, "epoch": 2635} {"train_loss": -6.276046276092529, "global_step": 110710, "epoch": 2635} {"train_loss": -6.4213831424713135, "global_step": 110711, "epoch": 2635, "val_loss": 67799.7265625} {"train_loss": -6.529401779174805, "global_step": 110712, "epoch": 2636} {"train_loss": -6.322115898132324, "global_step": 110713, "epoch": 2636} {"train_loss": -6.457919597625732, "global_step": 110714, "epoch": 2636} {"train_loss": -6.381813049316406, "global_step": 110715, "epoch": 2636} {"train_loss": -6.306696891784668, "global_step": 110716, "epoch": 2636} {"train_loss": -6.437652587890625, "global_step": 110717, "epoch": 2636} {"train_loss": -6.383634567260742, "global_step": 110718, "epoch": 2636} {"train_loss": -6.480702877044678, "global_step": 110719, "epoch": 2636} {"train_loss": -6.5295491218566895, "global_step": 110720, "epoch": 2636} {"train_loss": -6.357216835021973, "global_step": 110721, "epoch": 2636} {"train_loss": -6.3774614334106445, "global_step": 110722, "epoch": 2636} {"train_loss": -6.454257965087891, "global_step": 110723, "epoch": 2636} {"train_loss": -6.419861316680908, "global_step": 110724, "epoch": 2636} {"train_loss": -6.48020076751709, "global_step": 110725, "epoch": 2636} {"train_loss": -6.536213397979736, "global_step": 110726, "epoch": 2636} {"train_loss": -6.4607625007629395, "global_step": 110727, "epoch": 2636} {"train_loss": -6.464071273803711, "global_step": 110728, "epoch": 2636} {"train_loss": -6.487215995788574, "global_step": 110729, "epoch": 2636} {"train_loss": -6.494809150695801, "global_step": 110730, "epoch": 2636} {"train_loss": -6.558901786804199, "global_step": 110731, "epoch": 2636} {"train_loss": -6.619467735290527, "global_step": 110732, "epoch": 2636} {"train_loss": -6.496654510498047, "global_step": 110733, "epoch": 2636} {"train_loss": -6.56899356842041, "global_step": 110734, "epoch": 2636} {"train_loss": -6.517034530639648, "global_step": 110735, "epoch": 2636} {"train_loss": -6.517871856689453, "global_step": 110736, "epoch": 2636} {"train_loss": -6.521139144897461, "global_step": 110737, "epoch": 2636} {"train_loss": -6.373662948608398, "global_step": 110738, "epoch": 2636} {"train_loss": -6.447060585021973, "global_step": 110739, "epoch": 2636} {"train_loss": -6.396773815155029, "global_step": 110740, "epoch": 2636} {"train_loss": -6.32151460647583, "global_step": 110741, "epoch": 2636} {"train_loss": -6.205012321472168, "global_step": 110742, "epoch": 2636} {"train_loss": -6.446045875549316, "global_step": 110743, "epoch": 2636} {"train_loss": -6.21158504486084, "global_step": 110744, "epoch": 2636} {"train_loss": -6.257246017456055, "global_step": 110745, "epoch": 2636} {"train_loss": -6.359284400939941, "global_step": 110746, "epoch": 2636} {"train_loss": -6.133944511413574, "global_step": 110747, "epoch": 2636} {"train_loss": -6.236631393432617, "global_step": 110748, "epoch": 2636} {"train_loss": -6.225460052490234, "global_step": 110749, "epoch": 2636} {"train_loss": -6.363117694854736, "global_step": 110750, "epoch": 2636} {"train_loss": -6.122125625610352, "global_step": 110751, "epoch": 2636} {"train_loss": -6.332931995391846, "global_step": 110752, "epoch": 2636} {"train_loss": -6.396850551877703, "global_step": 110753, "epoch": 2636, "val_loss": 67926.859375} {"train_loss": -6.377580642700195, "global_step": 110754, "epoch": 2637} {"train_loss": -6.171448707580566, "global_step": 110755, "epoch": 2637} {"train_loss": -6.426140785217285, "global_step": 110756, "epoch": 2637} {"train_loss": -6.327291488647461, "global_step": 110757, "epoch": 2637} {"train_loss": -6.336703777313232, "global_step": 110758, "epoch": 2637} {"train_loss": -6.220771312713623, "global_step": 110759, "epoch": 2637} {"train_loss": -6.24177885055542, "global_step": 110760, "epoch": 2637} {"train_loss": -6.384624004364014, "global_step": 110761, "epoch": 2637} {"train_loss": -6.3015217781066895, "global_step": 110762, "epoch": 2637} {"train_loss": -6.206373691558838, "global_step": 110763, "epoch": 2637} {"train_loss": -6.437504768371582, "global_step": 110764, "epoch": 2637} {"train_loss": -6.3927106857299805, "global_step": 110765, "epoch": 2637} {"train_loss": -6.243836879730225, "global_step": 110766, "epoch": 2637} {"train_loss": -6.411127090454102, "global_step": 110767, "epoch": 2637} {"train_loss": -6.293398857116699, "global_step": 110768, "epoch": 2637} {"train_loss": -6.38496208190918, "global_step": 110769, "epoch": 2637} {"train_loss": -6.39061164855957, "global_step": 110770, "epoch": 2637} {"train_loss": -6.377144813537598, "global_step": 110771, "epoch": 2637} {"train_loss": -6.309139251708984, "global_step": 110772, "epoch": 2637} {"train_loss": -6.417012691497803, "global_step": 110773, "epoch": 2637} {"train_loss": -6.460788726806641, "global_step": 110774, "epoch": 2637} {"train_loss": -6.30305814743042, "global_step": 110775, "epoch": 2637} {"train_loss": -6.391872406005859, "global_step": 110776, "epoch": 2637} {"train_loss": -6.30886697769165, "global_step": 110777, "epoch": 2637} {"train_loss": -6.435113906860352, "global_step": 110778, "epoch": 2637} {"train_loss": -6.283535957336426, "global_step": 110779, "epoch": 2637} {"train_loss": -6.360543727874756, "global_step": 110780, "epoch": 2637} {"train_loss": -6.3625311851501465, "global_step": 110781, "epoch": 2637} {"train_loss": -6.440611839294434, "global_step": 110782, "epoch": 2637} {"train_loss": -6.369925498962402, "global_step": 110783, "epoch": 2637} {"train_loss": -6.331205368041992, "global_step": 110784, "epoch": 2637} {"train_loss": -6.342963695526123, "global_step": 110785, "epoch": 2637} {"train_loss": -6.394815444946289, "global_step": 110786, "epoch": 2637} {"train_loss": -6.43943977355957, "global_step": 110787, "epoch": 2637} {"train_loss": -6.508951187133789, "global_step": 110788, "epoch": 2637} {"train_loss": -6.407211780548096, "global_step": 110789, "epoch": 2637} {"train_loss": -6.350589752197266, "global_step": 110790, "epoch": 2637} {"train_loss": -6.37834358215332, "global_step": 110791, "epoch": 2637} {"train_loss": -6.441905498504639, "global_step": 110792, "epoch": 2637} {"train_loss": -6.364735126495361, "global_step": 110793, "epoch": 2637} {"train_loss": -6.417747497558594, "global_step": 110794, "epoch": 2637} {"train_loss": -6.36145373753139, "global_step": 110795, "epoch": 2637, "val_loss": 67853.390625} {"train_loss": -6.366578102111816, "global_step": 110796, "epoch": 2638} {"train_loss": -6.4133172035217285, "global_step": 110797, "epoch": 2638} {"train_loss": -6.516209125518799, "global_step": 110798, "epoch": 2638} {"train_loss": -6.445214748382568, "global_step": 110799, "epoch": 2638} {"train_loss": -6.418485164642334, "global_step": 110800, "epoch": 2638} {"train_loss": -6.46270227432251, "global_step": 110801, "epoch": 2638} {"train_loss": -6.4654436111450195, "global_step": 110802, "epoch": 2638} {"train_loss": -6.453219413757324, "global_step": 110803, "epoch": 2638} {"train_loss": -6.551270484924316, "global_step": 110804, "epoch": 2638} {"train_loss": -6.316709041595459, "global_step": 110805, "epoch": 2638} {"train_loss": -6.457297325134277, "global_step": 110806, "epoch": 2638} {"train_loss": -6.517634391784668, "global_step": 110807, "epoch": 2638} {"train_loss": -6.433980941772461, "global_step": 110808, "epoch": 2638} {"train_loss": -6.41691780090332, "global_step": 110809, "epoch": 2638} {"train_loss": -6.533644676208496, "global_step": 110810, "epoch": 2638} {"train_loss": -6.414922714233398, "global_step": 110811, "epoch": 2638} {"train_loss": -6.518550872802734, "global_step": 110812, "epoch": 2638} {"train_loss": -6.504587173461914, "global_step": 110813, "epoch": 2638} {"train_loss": -6.53254508972168, "global_step": 110814, "epoch": 2638} {"train_loss": -6.451519012451172, "global_step": 110815, "epoch": 2638} {"train_loss": -6.430065155029297, "global_step": 110816, "epoch": 2638} {"train_loss": -6.329753398895264, "global_step": 110817, "epoch": 2638} {"train_loss": -6.399197578430176, "global_step": 110818, "epoch": 2638} {"train_loss": -6.5743327140808105, "global_step": 110819, "epoch": 2638} {"train_loss": -6.385537147521973, "global_step": 110820, "epoch": 2638} {"train_loss": -6.468235015869141, "global_step": 110821, "epoch": 2638} {"train_loss": -6.469350337982178, "global_step": 110822, "epoch": 2638} {"train_loss": -6.486574172973633, "global_step": 110823, "epoch": 2638} {"train_loss": -6.421311855316162, "global_step": 110824, "epoch": 2638} {"train_loss": -6.567556381225586, "global_step": 110825, "epoch": 2638} {"train_loss": -6.545899391174316, "global_step": 110826, "epoch": 2638} {"train_loss": -6.507780075073242, "global_step": 110827, "epoch": 2638} {"train_loss": -6.422952175140381, "global_step": 110828, "epoch": 2638} {"train_loss": -6.433216571807861, "global_step": 110829, "epoch": 2638} {"train_loss": -6.4800519943237305, "global_step": 110830, "epoch": 2638} {"train_loss": -6.461075782775879, "global_step": 110831, "epoch": 2638} {"train_loss": -6.571372985839844, "global_step": 110832, "epoch": 2638} {"train_loss": -6.347187042236328, "global_step": 110833, "epoch": 2638} {"train_loss": -6.473465919494629, "global_step": 110834, "epoch": 2638} {"train_loss": -6.452829360961914, "global_step": 110835, "epoch": 2638} {"train_loss": -6.2271270751953125, "global_step": 110836, "epoch": 2638} {"train_loss": -6.458895319984073, "global_step": 110837, "epoch": 2638, "val_loss": 68185.109375} {"train_loss": -6.393729209899902, "global_step": 110838, "epoch": 2639} {"train_loss": -6.369648456573486, "global_step": 110839, "epoch": 2639} {"train_loss": -6.417821884155273, "global_step": 110840, "epoch": 2639} {"train_loss": -6.376153469085693, "global_step": 110841, "epoch": 2639} {"train_loss": -6.51387882232666, "global_step": 110842, "epoch": 2639} {"train_loss": -6.413933277130127, "global_step": 110843, "epoch": 2639} {"train_loss": -6.329678535461426, "global_step": 110844, "epoch": 2639} {"train_loss": -6.364495277404785, "global_step": 110845, "epoch": 2639} {"train_loss": -6.375770568847656, "global_step": 110846, "epoch": 2639} {"train_loss": -6.277204990386963, "global_step": 110847, "epoch": 2639} {"train_loss": -6.372317314147949, "global_step": 110848, "epoch": 2639} {"train_loss": -6.427650451660156, "global_step": 110849, "epoch": 2639} {"train_loss": -6.482487201690674, "global_step": 110850, "epoch": 2639} {"train_loss": -6.4649739265441895, "global_step": 110851, "epoch": 2639} {"train_loss": -6.4048004150390625, "global_step": 110852, "epoch": 2639} {"train_loss": -6.416842460632324, "global_step": 110853, "epoch": 2639} {"train_loss": -6.395997047424316, "global_step": 110854, "epoch": 2639} {"train_loss": -6.530474662780762, "global_step": 110855, "epoch": 2639} {"train_loss": -6.452297210693359, "global_step": 110856, "epoch": 2639} {"train_loss": -6.469233512878418, "global_step": 110857, "epoch": 2639} {"train_loss": -6.474788188934326, "global_step": 110858, "epoch": 2639} {"train_loss": -6.4461565017700195, "global_step": 110859, "epoch": 2639} {"train_loss": -6.37937593460083, "global_step": 110860, "epoch": 2639} {"train_loss": -6.415851593017578, "global_step": 110861, "epoch": 2639} {"train_loss": -6.5144758224487305, "global_step": 110862, "epoch": 2639} {"train_loss": -6.462805271148682, "global_step": 110863, "epoch": 2639} {"train_loss": -6.442309379577637, "global_step": 110864, "epoch": 2639} {"train_loss": -6.315371513366699, "global_step": 110865, "epoch": 2639} {"train_loss": -6.347186088562012, "global_step": 110866, "epoch": 2639} {"train_loss": -6.465737819671631, "global_step": 110867, "epoch": 2639} {"train_loss": -6.445734977722168, "global_step": 110868, "epoch": 2639} {"train_loss": -6.401369571685791, "global_step": 110869, "epoch": 2639} {"train_loss": -6.4670634269714355, "global_step": 110870, "epoch": 2639} {"train_loss": -6.360433578491211, "global_step": 110871, "epoch": 2639} {"train_loss": -6.402947902679443, "global_step": 110872, "epoch": 2639} {"train_loss": -6.413902282714844, "global_step": 110873, "epoch": 2639} {"train_loss": -6.383601188659668, "global_step": 110874, "epoch": 2639} {"train_loss": -6.473858833312988, "global_step": 110875, "epoch": 2639} {"train_loss": -6.215633392333984, "global_step": 110876, "epoch": 2639} {"train_loss": -6.461211681365967, "global_step": 110877, "epoch": 2639} {"train_loss": -6.345257759094238, "global_step": 110878, "epoch": 2639} {"train_loss": -6.410846085775466, "global_step": 110879, "epoch": 2639, "val_loss": 68004.078125} {"train_loss": -6.4466962814331055, "global_step": 110880, "epoch": 2640} {"train_loss": -6.481991291046143, "global_step": 110881, "epoch": 2640} {"train_loss": -6.481420993804932, "global_step": 110882, "epoch": 2640} {"train_loss": -6.393283843994141, "global_step": 110883, "epoch": 2640} {"train_loss": -6.437963485717773, "global_step": 110884, "epoch": 2640} {"train_loss": -6.332780838012695, "global_step": 110885, "epoch": 2640} {"train_loss": -6.576413154602051, "global_step": 110886, "epoch": 2640} {"train_loss": -6.4371137619018555, "global_step": 110887, "epoch": 2640} {"train_loss": -6.514153003692627, "global_step": 110888, "epoch": 2640} {"train_loss": -6.400800704956055, "global_step": 110889, "epoch": 2640} {"train_loss": -6.347196578979492, "global_step": 110890, "epoch": 2640} {"train_loss": -6.516712188720703, "global_step": 110891, "epoch": 2640} {"train_loss": -6.489021301269531, "global_step": 110892, "epoch": 2640} {"train_loss": -6.56151008605957, "global_step": 110893, "epoch": 2640} {"train_loss": -6.332251071929932, "global_step": 110894, "epoch": 2640} {"train_loss": -6.524538516998291, "global_step": 110895, "epoch": 2640} {"train_loss": -6.4862565994262695, "global_step": 110896, "epoch": 2640} {"train_loss": -6.4524431228637695, "global_step": 110897, "epoch": 2640} {"train_loss": -6.435336112976074, "global_step": 110898, "epoch": 2640} {"train_loss": -6.339766502380371, "global_step": 110899, "epoch": 2640} {"train_loss": -6.348853588104248, "global_step": 110900, "epoch": 2640} {"train_loss": -6.374795913696289, "global_step": 110901, "epoch": 2640} {"train_loss": -6.559263229370117, "global_step": 110902, "epoch": 2640} {"train_loss": -6.457217216491699, "global_step": 110903, "epoch": 2640} {"train_loss": -6.413575172424316, "global_step": 110904, "epoch": 2640} {"train_loss": -6.428680896759033, "global_step": 110905, "epoch": 2640} {"train_loss": -6.41397762298584, "global_step": 110906, "epoch": 2640} {"train_loss": -6.44023323059082, "global_step": 110907, "epoch": 2640} {"train_loss": -6.480508804321289, "global_step": 110908, "epoch": 2640} {"train_loss": -6.403541564941406, "global_step": 110909, "epoch": 2640} {"train_loss": -6.4379963874816895, "global_step": 110910, "epoch": 2640} {"train_loss": -6.3591814041137695, "global_step": 110911, "epoch": 2640} {"train_loss": -6.433929443359375, "global_step": 110912, "epoch": 2640} {"train_loss": -6.5313262939453125, "global_step": 110913, "epoch": 2640} {"train_loss": -6.5243821144104, "global_step": 110914, "epoch": 2640} {"train_loss": -6.436356544494629, "global_step": 110915, "epoch": 2640} {"train_loss": -6.545194149017334, "global_step": 110916, "epoch": 2640} {"train_loss": -6.586939811706543, "global_step": 110917, "epoch": 2640} {"train_loss": -6.479963302612305, "global_step": 110918, "epoch": 2640} {"train_loss": -6.646089553833008, "global_step": 110919, "epoch": 2640} {"train_loss": -6.456711769104004, "global_step": 110920, "epoch": 2640} {"train_loss": -6.459138552347819, "global_step": 110921, "epoch": 2640, "val_loss": 67717.4375} {"train_loss": -6.534156322479248, "global_step": 110922, "epoch": 2641} {"train_loss": -6.530641078948975, "global_step": 110923, "epoch": 2641} {"train_loss": -6.548486709594727, "global_step": 110924, "epoch": 2641} {"train_loss": -6.406215667724609, "global_step": 110925, "epoch": 2641} {"train_loss": -6.491954803466797, "global_step": 110926, "epoch": 2641} {"train_loss": -6.477560520172119, "global_step": 110927, "epoch": 2641} {"train_loss": -6.555658340454102, "global_step": 110928, "epoch": 2641} {"train_loss": -6.480254173278809, "global_step": 110929, "epoch": 2641} {"train_loss": -6.602888584136963, "global_step": 110930, "epoch": 2641} {"train_loss": -6.475427627563477, "global_step": 110931, "epoch": 2641} {"train_loss": -6.362785339355469, "global_step": 110932, "epoch": 2641} {"train_loss": -6.421750068664551, "global_step": 110933, "epoch": 2641} {"train_loss": -6.473395347595215, "global_step": 110934, "epoch": 2641} {"train_loss": -6.552048683166504, "global_step": 110935, "epoch": 2641} {"train_loss": -6.536600589752197, "global_step": 110936, "epoch": 2641} {"train_loss": -6.409526824951172, "global_step": 110937, "epoch": 2641} {"train_loss": -6.45855188369751, "global_step": 110938, "epoch": 2641} {"train_loss": -6.429755210876465, "global_step": 110939, "epoch": 2641} {"train_loss": -6.416928768157959, "global_step": 110940, "epoch": 2641} {"train_loss": -6.490987777709961, "global_step": 110941, "epoch": 2641} {"train_loss": -6.538722515106201, "global_step": 110942, "epoch": 2641} {"train_loss": -6.449213027954102, "global_step": 110943, "epoch": 2641} {"train_loss": -6.418698310852051, "global_step": 110944, "epoch": 2641} {"train_loss": -6.513632297515869, "global_step": 110945, "epoch": 2641} {"train_loss": -6.5185546875, "global_step": 110946, "epoch": 2641} {"train_loss": -6.507220268249512, "global_step": 110947, "epoch": 2641} {"train_loss": -6.457259178161621, "global_step": 110948, "epoch": 2641} {"train_loss": -6.538923740386963, "global_step": 110949, "epoch": 2641} {"train_loss": -6.379505634307861, "global_step": 110950, "epoch": 2641} {"train_loss": -6.46122932434082, "global_step": 110951, "epoch": 2641} {"train_loss": -6.388346195220947, "global_step": 110952, "epoch": 2641} {"train_loss": -6.288491249084473, "global_step": 110953, "epoch": 2641} {"train_loss": -6.343432903289795, "global_step": 110954, "epoch": 2641} {"train_loss": -6.406523704528809, "global_step": 110955, "epoch": 2641} {"train_loss": -6.269865989685059, "global_step": 110956, "epoch": 2641} {"train_loss": -6.444736003875732, "global_step": 110957, "epoch": 2641} {"train_loss": -6.456752777099609, "global_step": 110958, "epoch": 2641} {"train_loss": -6.42861270904541, "global_step": 110959, "epoch": 2641} {"train_loss": -6.384207725524902, "global_step": 110960, "epoch": 2641} {"train_loss": -6.401118278503418, "global_step": 110961, "epoch": 2641} {"train_loss": -6.475330829620361, "global_step": 110962, "epoch": 2641} {"train_loss": -6.455560979389009, "global_step": 110963, "epoch": 2641, "val_loss": 67828.109375} {"train_loss": -6.47623348236084, "global_step": 110964, "epoch": 2642} {"train_loss": -6.377076148986816, "global_step": 110965, "epoch": 2642} {"train_loss": -6.419536590576172, "global_step": 110966, "epoch": 2642} {"train_loss": -6.371453285217285, "global_step": 110967, "epoch": 2642} {"train_loss": -6.58956241607666, "global_step": 110968, "epoch": 2642} {"train_loss": -6.3076324462890625, "global_step": 110969, "epoch": 2642} {"train_loss": -6.540627479553223, "global_step": 110970, "epoch": 2642} {"train_loss": -6.420126438140869, "global_step": 110971, "epoch": 2642} {"train_loss": -6.419805526733398, "global_step": 110972, "epoch": 2642} {"train_loss": -6.42976188659668, "global_step": 110973, "epoch": 2642} {"train_loss": -6.41485595703125, "global_step": 110974, "epoch": 2642} {"train_loss": -6.529407978057861, "global_step": 110975, "epoch": 2642} {"train_loss": -6.421846389770508, "global_step": 110976, "epoch": 2642} {"train_loss": -6.511481285095215, "global_step": 110977, "epoch": 2642} {"train_loss": -6.407883644104004, "global_step": 110978, "epoch": 2642} {"train_loss": -6.4563727378845215, "global_step": 110979, "epoch": 2642} {"train_loss": -6.455682754516602, "global_step": 110980, "epoch": 2642} {"train_loss": -6.5318756103515625, "global_step": 110981, "epoch": 2642} {"train_loss": -6.500842094421387, "global_step": 110982, "epoch": 2642} {"train_loss": -6.488616943359375, "global_step": 110983, "epoch": 2642} {"train_loss": -6.450216293334961, "global_step": 110984, "epoch": 2642} {"train_loss": -6.478305339813232, "global_step": 110985, "epoch": 2642} {"train_loss": -6.406277656555176, "global_step": 110986, "epoch": 2642} {"train_loss": -6.4217529296875, "global_step": 110987, "epoch": 2642} {"train_loss": -6.486308574676514, "global_step": 110988, "epoch": 2642} {"train_loss": -6.545964241027832, "global_step": 110989, "epoch": 2642} {"train_loss": -6.473815441131592, "global_step": 110990, "epoch": 2642} {"train_loss": -6.369937896728516, "global_step": 110991, "epoch": 2642} {"train_loss": -6.4730143547058105, "global_step": 110992, "epoch": 2642} {"train_loss": -6.57524299621582, "global_step": 110993, "epoch": 2642} {"train_loss": -6.3271589279174805, "global_step": 110994, "epoch": 2642} {"train_loss": -6.315110683441162, "global_step": 110995, "epoch": 2642} {"train_loss": -6.4724440574646, "global_step": 110996, "epoch": 2642} {"train_loss": -6.319519996643066, "global_step": 110997, "epoch": 2642} {"train_loss": -6.477935791015625, "global_step": 110998, "epoch": 2642} {"train_loss": -6.452648162841797, "global_step": 110999, "epoch": 2642} {"train_loss": -6.275338172912598, "global_step": 111000, "epoch": 2642} {"train_loss": -6.309135437011719, "global_step": 111001, "epoch": 2642} {"train_loss": -6.477823257446289, "global_step": 111002, "epoch": 2642} {"train_loss": -6.3161773681640625, "global_step": 111003, "epoch": 2642} {"train_loss": -6.468220233917236, "global_step": 111004, "epoch": 2642} {"train_loss": -6.436458303814843, "global_step": 111005, "epoch": 2642, "val_loss": 67864.9921875} {"train_loss": -6.432287693023682, "global_step": 111006, "epoch": 2643} {"train_loss": -6.3357744216918945, "global_step": 111007, "epoch": 2643} {"train_loss": -6.432244300842285, "global_step": 111008, "epoch": 2643} {"train_loss": -6.4225311279296875, "global_step": 111009, "epoch": 2643} {"train_loss": -6.399041175842285, "global_step": 111010, "epoch": 2643} {"train_loss": -6.424912452697754, "global_step": 111011, "epoch": 2643} {"train_loss": -6.3962907791137695, "global_step": 111012, "epoch": 2643} {"train_loss": -6.462707042694092, "global_step": 111013, "epoch": 2643} {"train_loss": -6.476815223693848, "global_step": 111014, "epoch": 2643} {"train_loss": -6.480623245239258, "global_step": 111015, "epoch": 2643} {"train_loss": -6.463815689086914, "global_step": 111016, "epoch": 2643} {"train_loss": -6.367514133453369, "global_step": 111017, "epoch": 2643} {"train_loss": -6.4670090675354, "global_step": 111018, "epoch": 2643} {"train_loss": -6.451211452484131, "global_step": 111019, "epoch": 2643} {"train_loss": -6.525359630584717, "global_step": 111020, "epoch": 2643} {"train_loss": -6.49273681640625, "global_step": 111021, "epoch": 2643} {"train_loss": -6.446287155151367, "global_step": 111022, "epoch": 2643} {"train_loss": -6.36950159072876, "global_step": 111023, "epoch": 2643} {"train_loss": -6.482370376586914, "global_step": 111024, "epoch": 2643} {"train_loss": -6.343299865722656, "global_step": 111025, "epoch": 2643} {"train_loss": -6.528039932250977, "global_step": 111026, "epoch": 2643} {"train_loss": -6.393957138061523, "global_step": 111027, "epoch": 2643} {"train_loss": -6.498340129852295, "global_step": 111028, "epoch": 2643} {"train_loss": -6.482636451721191, "global_step": 111029, "epoch": 2643} {"train_loss": -6.341925621032715, "global_step": 111030, "epoch": 2643} {"train_loss": -6.343341827392578, "global_step": 111031, "epoch": 2643} {"train_loss": -6.312521934509277, "global_step": 111032, "epoch": 2643} {"train_loss": -6.518616676330566, "global_step": 111033, "epoch": 2643} {"train_loss": -6.187619686126709, "global_step": 111034, "epoch": 2643} {"train_loss": -6.247424125671387, "global_step": 111035, "epoch": 2643} {"train_loss": -6.490762710571289, "global_step": 111036, "epoch": 2643} {"train_loss": -6.372315406799316, "global_step": 111037, "epoch": 2643} {"train_loss": -6.35292911529541, "global_step": 111038, "epoch": 2643} {"train_loss": -6.459369659423828, "global_step": 111039, "epoch": 2643} {"train_loss": -6.3450727462768555, "global_step": 111040, "epoch": 2643} {"train_loss": -6.408536911010742, "global_step": 111041, "epoch": 2643} {"train_loss": -6.377200126647949, "global_step": 111042, "epoch": 2643} {"train_loss": -6.344210624694824, "global_step": 111043, "epoch": 2643} {"train_loss": -6.264598846435547, "global_step": 111044, "epoch": 2643} {"train_loss": -6.428765296936035, "global_step": 111045, "epoch": 2643} {"train_loss": -6.335906505584717, "global_step": 111046, "epoch": 2643} {"train_loss": -6.408515737170265, "global_step": 111047, "epoch": 2643, "val_loss": 68275.0546875} {"train_loss": -6.283148288726807, "global_step": 111048, "epoch": 2644} {"train_loss": -6.4769182205200195, "global_step": 111049, "epoch": 2644} {"train_loss": -6.4335455894470215, "global_step": 111050, "epoch": 2644} {"train_loss": -6.491302490234375, "global_step": 111051, "epoch": 2644} {"train_loss": -6.409621238708496, "global_step": 111052, "epoch": 2644} {"train_loss": -6.382568359375, "global_step": 111053, "epoch": 2644} {"train_loss": -6.433525562286377, "global_step": 111054, "epoch": 2644} {"train_loss": -6.3870038986206055, "global_step": 111055, "epoch": 2644} {"train_loss": -6.462396144866943, "global_step": 111056, "epoch": 2644} {"train_loss": -6.4042840003967285, "global_step": 111057, "epoch": 2644} {"train_loss": -6.359029293060303, "global_step": 111058, "epoch": 2644} {"train_loss": -6.362095832824707, "global_step": 111059, "epoch": 2644} {"train_loss": -6.374622821807861, "global_step": 111060, "epoch": 2644} {"train_loss": -6.498475074768066, "global_step": 111061, "epoch": 2644} {"train_loss": -6.430574417114258, "global_step": 111062, "epoch": 2644} {"train_loss": -6.385682582855225, "global_step": 111063, "epoch": 2644} {"train_loss": -6.3384199142456055, "global_step": 111064, "epoch": 2644} {"train_loss": -6.423823833465576, "global_step": 111065, "epoch": 2644} {"train_loss": -6.498004913330078, "global_step": 111066, "epoch": 2644} {"train_loss": -6.470428466796875, "global_step": 111067, "epoch": 2644} {"train_loss": -6.501456260681152, "global_step": 111068, "epoch": 2644} {"train_loss": -6.428942680358887, "global_step": 111069, "epoch": 2644} {"train_loss": -6.477293014526367, "global_step": 111070, "epoch": 2644} {"train_loss": -6.42803430557251, "global_step": 111071, "epoch": 2644} {"train_loss": -6.465671539306641, "global_step": 111072, "epoch": 2644} {"train_loss": -6.441402435302734, "global_step": 111073, "epoch": 2644} {"train_loss": -6.458869457244873, "global_step": 111074, "epoch": 2644} {"train_loss": -6.435702323913574, "global_step": 111075, "epoch": 2644} {"train_loss": -6.349757194519043, "global_step": 111076, "epoch": 2644} {"train_loss": -6.474912643432617, "global_step": 111077, "epoch": 2644} {"train_loss": -6.316603660583496, "global_step": 111078, "epoch": 2644} {"train_loss": -6.365121841430664, "global_step": 111079, "epoch": 2644} {"train_loss": -6.470020294189453, "global_step": 111080, "epoch": 2644} {"train_loss": -6.289134979248047, "global_step": 111081, "epoch": 2644} {"train_loss": -6.493106842041016, "global_step": 111082, "epoch": 2644} {"train_loss": -6.568308353424072, "global_step": 111083, "epoch": 2644} {"train_loss": -6.3186163902282715, "global_step": 111084, "epoch": 2644} {"train_loss": -6.5066375732421875, "global_step": 111085, "epoch": 2644} {"train_loss": -6.317638397216797, "global_step": 111086, "epoch": 2644} {"train_loss": -6.353431701660156, "global_step": 111087, "epoch": 2644} {"train_loss": -6.458837032318115, "global_step": 111088, "epoch": 2644} {"train_loss": -6.422685929707119, "global_step": 111089, "epoch": 2644, "val_loss": 67819.4453125} {"train_loss": -6.36325740814209, "global_step": 111090, "epoch": 2645} {"train_loss": -6.424485206604004, "global_step": 111091, "epoch": 2645} {"train_loss": -6.522436618804932, "global_step": 111092, "epoch": 2645} {"train_loss": -6.504863739013672, "global_step": 111093, "epoch": 2645} {"train_loss": -6.603830337524414, "global_step": 111094, "epoch": 2645} {"train_loss": -6.389206886291504, "global_step": 111095, "epoch": 2645} {"train_loss": -6.5223388671875, "global_step": 111096, "epoch": 2645} {"train_loss": -6.573889255523682, "global_step": 111097, "epoch": 2645} {"train_loss": -6.543543815612793, "global_step": 111098, "epoch": 2645} {"train_loss": -6.498123645782471, "global_step": 111099, "epoch": 2645} {"train_loss": -6.473954677581787, "global_step": 111100, "epoch": 2645} {"train_loss": -6.5351762771606445, "global_step": 111101, "epoch": 2645} {"train_loss": -6.507022857666016, "global_step": 111102, "epoch": 2645} {"train_loss": -6.464881420135498, "global_step": 111103, "epoch": 2645} {"train_loss": -6.603480339050293, "global_step": 111104, "epoch": 2645} {"train_loss": -6.496623516082764, "global_step": 111105, "epoch": 2645} {"train_loss": -6.612255096435547, "global_step": 111106, "epoch": 2645} {"train_loss": -6.418225288391113, "global_step": 111107, "epoch": 2645} {"train_loss": -6.456735134124756, "global_step": 111108, "epoch": 2645} {"train_loss": -6.551875114440918, "global_step": 111109, "epoch": 2645} {"train_loss": -6.5379319190979, "global_step": 111110, "epoch": 2645} {"train_loss": -6.423976421356201, "global_step": 111111, "epoch": 2645} {"train_loss": -6.4464111328125, "global_step": 111112, "epoch": 2645} {"train_loss": -6.470881462097168, "global_step": 111113, "epoch": 2645} {"train_loss": -6.510855197906494, "global_step": 111114, "epoch": 2645} {"train_loss": -6.503385543823242, "global_step": 111115, "epoch": 2645} {"train_loss": -6.443228244781494, "global_step": 111116, "epoch": 2645} {"train_loss": -6.414866924285889, "global_step": 111117, "epoch": 2645} {"train_loss": -6.438773155212402, "global_step": 111118, "epoch": 2645} {"train_loss": -6.539236068725586, "global_step": 111119, "epoch": 2645} {"train_loss": -6.519766807556152, "global_step": 111120, "epoch": 2645} {"train_loss": -6.460582256317139, "global_step": 111121, "epoch": 2645} {"train_loss": -6.403177261352539, "global_step": 111122, "epoch": 2645} {"train_loss": -6.439116477966309, "global_step": 111123, "epoch": 2645} {"train_loss": -6.450550556182861, "global_step": 111124, "epoch": 2645} {"train_loss": -6.3554205894470215, "global_step": 111125, "epoch": 2645} {"train_loss": -6.478543281555176, "global_step": 111126, "epoch": 2645} {"train_loss": -6.456203460693359, "global_step": 111127, "epoch": 2645} {"train_loss": -6.378299713134766, "global_step": 111128, "epoch": 2645} {"train_loss": -6.470349311828613, "global_step": 111129, "epoch": 2645} {"train_loss": -6.413989543914795, "global_step": 111130, "epoch": 2645} {"train_loss": -6.479233446575346, "global_step": 111131, "epoch": 2645, "val_loss": 68040.8203125} {"train_loss": -6.4933881759643555, "global_step": 111132, "epoch": 2646} {"train_loss": -6.473577499389648, "global_step": 111133, "epoch": 2646} {"train_loss": -6.525424480438232, "global_step": 111134, "epoch": 2646} {"train_loss": -6.481732368469238, "global_step": 111135, "epoch": 2646} {"train_loss": -6.541254043579102, "global_step": 111136, "epoch": 2646} {"train_loss": -6.4686408042907715, "global_step": 111137, "epoch": 2646} {"train_loss": -6.5236663818359375, "global_step": 111138, "epoch": 2646} {"train_loss": -6.529816150665283, "global_step": 111139, "epoch": 2646} {"train_loss": -6.3572235107421875, "global_step": 111140, "epoch": 2646} {"train_loss": -6.583234786987305, "global_step": 111141, "epoch": 2646} {"train_loss": -6.386941432952881, "global_step": 111142, "epoch": 2646} {"train_loss": -6.487883567810059, "global_step": 111143, "epoch": 2646} {"train_loss": -6.533018589019775, "global_step": 111144, "epoch": 2646} {"train_loss": -6.467095375061035, "global_step": 111145, "epoch": 2646} {"train_loss": -6.566390514373779, "global_step": 111146, "epoch": 2646} {"train_loss": -6.411782741546631, "global_step": 111147, "epoch": 2646} {"train_loss": -6.502496242523193, "global_step": 111148, "epoch": 2646} {"train_loss": -6.427918434143066, "global_step": 111149, "epoch": 2646} {"train_loss": -6.720342636108398, "global_step": 111150, "epoch": 2646} {"train_loss": -6.380671977996826, "global_step": 111151, "epoch": 2646} {"train_loss": -6.362701416015625, "global_step": 111152, "epoch": 2646} {"train_loss": -6.458163261413574, "global_step": 111153, "epoch": 2646} {"train_loss": -6.4106831550598145, "global_step": 111154, "epoch": 2646} {"train_loss": -6.488883018493652, "global_step": 111155, "epoch": 2646} {"train_loss": -6.462729454040527, "global_step": 111156, "epoch": 2646} {"train_loss": -6.386613845825195, "global_step": 111157, "epoch": 2646} {"train_loss": -6.390904426574707, "global_step": 111158, "epoch": 2646} {"train_loss": -6.51668643951416, "global_step": 111159, "epoch": 2646} {"train_loss": -6.453088760375977, "global_step": 111160, "epoch": 2646} {"train_loss": -6.367405414581299, "global_step": 111161, "epoch": 2646} {"train_loss": -6.520750045776367, "global_step": 111162, "epoch": 2646} {"train_loss": -6.3633036613464355, "global_step": 111163, "epoch": 2646} {"train_loss": -6.3061676025390625, "global_step": 111164, "epoch": 2646} {"train_loss": -6.404492378234863, "global_step": 111165, "epoch": 2646} {"train_loss": -6.344616889953613, "global_step": 111166, "epoch": 2646} {"train_loss": -6.359066009521484, "global_step": 111167, "epoch": 2646} {"train_loss": -6.449103832244873, "global_step": 111168, "epoch": 2646} {"train_loss": -6.289971351623535, "global_step": 111169, "epoch": 2646} {"train_loss": -6.41970157623291, "global_step": 111170, "epoch": 2646} {"train_loss": -6.290774345397949, "global_step": 111171, "epoch": 2646} {"train_loss": -6.422298431396484, "global_step": 111172, "epoch": 2646} {"train_loss": -6.446552515029907, "global_step": 111173, "epoch": 2646, "val_loss": 68342.4921875} {"train_loss": -6.415617942810059, "global_step": 111174, "epoch": 2647} {"train_loss": -6.361300468444824, "global_step": 111175, "epoch": 2647} {"train_loss": -6.482654094696045, "global_step": 111176, "epoch": 2647} {"train_loss": -6.245698928833008, "global_step": 111177, "epoch": 2647} {"train_loss": -6.325079441070557, "global_step": 111178, "epoch": 2647} {"train_loss": -6.437093734741211, "global_step": 111179, "epoch": 2647} {"train_loss": -6.3984785079956055, "global_step": 111180, "epoch": 2647} {"train_loss": -6.452330112457275, "global_step": 111181, "epoch": 2647} {"train_loss": -6.344263553619385, "global_step": 111182, "epoch": 2647} {"train_loss": -6.595947265625, "global_step": 111183, "epoch": 2647} {"train_loss": -6.332761764526367, "global_step": 111184, "epoch": 2647} {"train_loss": -6.385523796081543, "global_step": 111185, "epoch": 2647} {"train_loss": -6.358482837677002, "global_step": 111186, "epoch": 2647} {"train_loss": -6.466072082519531, "global_step": 111187, "epoch": 2647} {"train_loss": -6.351505279541016, "global_step": 111188, "epoch": 2647} {"train_loss": -6.381330966949463, "global_step": 111189, "epoch": 2647} {"train_loss": -6.397935390472412, "global_step": 111190, "epoch": 2647} {"train_loss": -6.418357849121094, "global_step": 111191, "epoch": 2647} {"train_loss": -6.38883638381958, "global_step": 111192, "epoch": 2647} {"train_loss": -6.358451843261719, "global_step": 111193, "epoch": 2647} {"train_loss": -6.334558963775635, "global_step": 111194, "epoch": 2647} {"train_loss": -6.244069576263428, "global_step": 111195, "epoch": 2647} {"train_loss": -6.456018924713135, "global_step": 111196, "epoch": 2647} {"train_loss": -6.463067054748535, "global_step": 111197, "epoch": 2647} {"train_loss": -6.35653018951416, "global_step": 111198, "epoch": 2647} {"train_loss": -6.471632957458496, "global_step": 111199, "epoch": 2647} {"train_loss": -6.289930820465088, "global_step": 111200, "epoch": 2647} {"train_loss": -6.479875564575195, "global_step": 111201, "epoch": 2647} {"train_loss": -6.33492374420166, "global_step": 111202, "epoch": 2647} {"train_loss": -6.419611930847168, "global_step": 111203, "epoch": 2647} {"train_loss": -6.385982036590576, "global_step": 111204, "epoch": 2647} {"train_loss": -6.4845685958862305, "global_step": 111205, "epoch": 2647} {"train_loss": -6.343367099761963, "global_step": 111206, "epoch": 2647} {"train_loss": -6.240264415740967, "global_step": 111207, "epoch": 2647} {"train_loss": -6.525361061096191, "global_step": 111208, "epoch": 2647} {"train_loss": -6.377429962158203, "global_step": 111209, "epoch": 2647} {"train_loss": -6.365455150604248, "global_step": 111210, "epoch": 2647} {"train_loss": -6.430304527282715, "global_step": 111211, "epoch": 2647} {"train_loss": -6.498621940612793, "global_step": 111212, "epoch": 2647} {"train_loss": -6.421214580535889, "global_step": 111213, "epoch": 2647} {"train_loss": -6.300920486450195, "global_step": 111214, "epoch": 2647} {"train_loss": -6.390892675944737, "global_step": 111215, "epoch": 2647, "val_loss": 67982.6484375} {"train_loss": -6.3304290771484375, "global_step": 111216, "epoch": 2648} {"train_loss": -6.332493782043457, "global_step": 111217, "epoch": 2648} {"train_loss": -6.284912586212158, "global_step": 111218, "epoch": 2648} {"train_loss": -6.439016342163086, "global_step": 111219, "epoch": 2648} {"train_loss": -6.335862636566162, "global_step": 111220, "epoch": 2648} {"train_loss": -6.4416961669921875, "global_step": 111221, "epoch": 2648} {"train_loss": -6.423168659210205, "global_step": 111222, "epoch": 2648} {"train_loss": -6.470042705535889, "global_step": 111223, "epoch": 2648} {"train_loss": -6.450997352600098, "global_step": 111224, "epoch": 2648} {"train_loss": -6.361334800720215, "global_step": 111225, "epoch": 2648} {"train_loss": -6.508544921875, "global_step": 111226, "epoch": 2648} {"train_loss": -6.376697540283203, "global_step": 111227, "epoch": 2648} {"train_loss": -6.4644670486450195, "global_step": 111228, "epoch": 2648} {"train_loss": -6.513761043548584, "global_step": 111229, "epoch": 2648} {"train_loss": -6.381993293762207, "global_step": 111230, "epoch": 2648} {"train_loss": -6.512192726135254, "global_step": 111231, "epoch": 2648} {"train_loss": -6.538280963897705, "global_step": 111232, "epoch": 2648} {"train_loss": -6.487713813781738, "global_step": 111233, "epoch": 2648} {"train_loss": -6.478938102722168, "global_step": 111234, "epoch": 2648} {"train_loss": -6.428580284118652, "global_step": 111235, "epoch": 2648} {"train_loss": -6.454436779022217, "global_step": 111236, "epoch": 2648} {"train_loss": -6.398782730102539, "global_step": 111237, "epoch": 2648} {"train_loss": -6.482185363769531, "global_step": 111238, "epoch": 2648} {"train_loss": -6.403655052185059, "global_step": 111239, "epoch": 2648} {"train_loss": -6.378762245178223, "global_step": 111240, "epoch": 2648} {"train_loss": -6.432539463043213, "global_step": 111241, "epoch": 2648} {"train_loss": -6.476524353027344, "global_step": 111242, "epoch": 2648} {"train_loss": -6.447684288024902, "global_step": 111243, "epoch": 2648} {"train_loss": -6.456303119659424, "global_step": 111244, "epoch": 2648} {"train_loss": -6.439525127410889, "global_step": 111245, "epoch": 2648} {"train_loss": -6.56999397277832, "global_step": 111246, "epoch": 2648} {"train_loss": -6.385459899902344, "global_step": 111247, "epoch": 2648} {"train_loss": -6.439046859741211, "global_step": 111248, "epoch": 2648} {"train_loss": -6.451736927032471, "global_step": 111249, "epoch": 2648} {"train_loss": -6.575483322143555, "global_step": 111250, "epoch": 2648} {"train_loss": -6.421401023864746, "global_step": 111251, "epoch": 2648} {"train_loss": -6.457737922668457, "global_step": 111252, "epoch": 2648} {"train_loss": -6.463564395904541, "global_step": 111253, "epoch": 2648} {"train_loss": -6.323665618896484, "global_step": 111254, "epoch": 2648} {"train_loss": -6.497640609741211, "global_step": 111255, "epoch": 2648} {"train_loss": -6.542600631713867, "global_step": 111256, "epoch": 2648} {"train_loss": -6.4362209524427145, "global_step": 111257, "epoch": 2648, "val_loss": 68076.640625} {"train_loss": -6.400047302246094, "global_step": 111258, "epoch": 2649} {"train_loss": -6.406500816345215, "global_step": 111259, "epoch": 2649} {"train_loss": -6.3522257804870605, "global_step": 111260, "epoch": 2649} {"train_loss": -6.372969627380371, "global_step": 111261, "epoch": 2649} {"train_loss": -6.320614814758301, "global_step": 111262, "epoch": 2649} {"train_loss": -6.237270355224609, "global_step": 111263, "epoch": 2649} {"train_loss": -6.465359687805176, "global_step": 111264, "epoch": 2649} {"train_loss": -6.316624641418457, "global_step": 111265, "epoch": 2649} {"train_loss": -6.369576454162598, "global_step": 111266, "epoch": 2649} {"train_loss": -6.4873857498168945, "global_step": 111267, "epoch": 2649} {"train_loss": -6.338799953460693, "global_step": 111268, "epoch": 2649} {"train_loss": -6.4482269287109375, "global_step": 111269, "epoch": 2649} {"train_loss": -6.520528793334961, "global_step": 111270, "epoch": 2649} {"train_loss": -6.516602039337158, "global_step": 111271, "epoch": 2649} {"train_loss": -6.371390342712402, "global_step": 111272, "epoch": 2649} {"train_loss": -6.522292137145996, "global_step": 111273, "epoch": 2649} {"train_loss": -6.38986873626709, "global_step": 111274, "epoch": 2649} {"train_loss": -6.350281238555908, "global_step": 111275, "epoch": 2649} {"train_loss": -6.361522197723389, "global_step": 111276, "epoch": 2649} {"train_loss": -6.4028167724609375, "global_step": 111277, "epoch": 2649} {"train_loss": -6.399181842803955, "global_step": 111278, "epoch": 2649} {"train_loss": -6.418728351593018, "global_step": 111279, "epoch": 2649} {"train_loss": -6.545826435089111, "global_step": 111280, "epoch": 2649} {"train_loss": -6.482780456542969, "global_step": 111281, "epoch": 2649} {"train_loss": -6.461147785186768, "global_step": 111282, "epoch": 2649} {"train_loss": -6.465227127075195, "global_step": 111283, "epoch": 2649} {"train_loss": -6.5147857666015625, "global_step": 111284, "epoch": 2649} {"train_loss": -6.314565658569336, "global_step": 111285, "epoch": 2649} {"train_loss": -6.427490711212158, "global_step": 111286, "epoch": 2649} {"train_loss": -6.436592102050781, "global_step": 111287, "epoch": 2649} {"train_loss": -6.432831287384033, "global_step": 111288, "epoch": 2649} {"train_loss": -6.580280303955078, "global_step": 111289, "epoch": 2649} {"train_loss": -6.369446754455566, "global_step": 111290, "epoch": 2649} {"train_loss": -6.4207048416137695, "global_step": 111291, "epoch": 2649} {"train_loss": -6.529481410980225, "global_step": 111292, "epoch": 2649} {"train_loss": -6.539096832275391, "global_step": 111293, "epoch": 2649} {"train_loss": -6.4527997970581055, "global_step": 111294, "epoch": 2649} {"train_loss": -6.473762035369873, "global_step": 111295, "epoch": 2649} {"train_loss": -6.584128379821777, "global_step": 111296, "epoch": 2649} {"train_loss": -6.448733329772949, "global_step": 111297, "epoch": 2649} {"train_loss": -6.3947038650512695, "global_step": 111298, "epoch": 2649} {"train_loss": -6.4320509660811656, "global_step": 111299, "epoch": 2649, "val_loss": 67916.7890625} {"train_loss": -6.488123893737793, "global_step": 111300, "epoch": 2650} {"train_loss": -6.4644856452941895, "global_step": 111301, "epoch": 2650} {"train_loss": -6.466257572174072, "global_step": 111302, "epoch": 2650} {"train_loss": -6.527927398681641, "global_step": 111303, "epoch": 2650} {"train_loss": -6.374334812164307, "global_step": 111304, "epoch": 2650} {"train_loss": -6.509372711181641, "global_step": 111305, "epoch": 2650} {"train_loss": -6.444220542907715, "global_step": 111306, "epoch": 2650} {"train_loss": -6.42523193359375, "global_step": 111307, "epoch": 2650} {"train_loss": -6.543832778930664, "global_step": 111308, "epoch": 2650} {"train_loss": -6.458722114562988, "global_step": 111309, "epoch": 2650} {"train_loss": -6.5075225830078125, "global_step": 111310, "epoch": 2650} {"train_loss": -6.451862335205078, "global_step": 111311, "epoch": 2650} {"train_loss": -6.414053916931152, "global_step": 111312, "epoch": 2650} {"train_loss": -6.429298400878906, "global_step": 111313, "epoch": 2650} {"train_loss": -6.441533088684082, "global_step": 111314, "epoch": 2650} {"train_loss": -6.563020706176758, "global_step": 111315, "epoch": 2650} {"train_loss": -6.571010589599609, "global_step": 111316, "epoch": 2650} {"train_loss": -6.556336879730225, "global_step": 111317, "epoch": 2650} {"train_loss": -6.423352241516113, "global_step": 111318, "epoch": 2650} {"train_loss": -6.463825225830078, "global_step": 111319, "epoch": 2650} {"train_loss": -6.530738830566406, "global_step": 111320, "epoch": 2650} {"train_loss": -6.558125972747803, "global_step": 111321, "epoch": 2650} {"train_loss": -6.500800609588623, "global_step": 111322, "epoch": 2650} {"train_loss": -6.484097480773926, "global_step": 111323, "epoch": 2650} {"train_loss": -6.431426525115967, "global_step": 111324, "epoch": 2650} {"train_loss": -6.3099260330200195, "global_step": 111325, "epoch": 2650} {"train_loss": -6.387160301208496, "global_step": 111326, "epoch": 2650} {"train_loss": -6.454580783843994, "global_step": 111327, "epoch": 2650} {"train_loss": -6.4887847900390625, "global_step": 111328, "epoch": 2650} {"train_loss": -6.403915882110596, "global_step": 111329, "epoch": 2650} {"train_loss": -6.457954406738281, "global_step": 111330, "epoch": 2650} {"train_loss": -6.442633628845215, "global_step": 111331, "epoch": 2650} {"train_loss": -6.536993503570557, "global_step": 111332, "epoch": 2650} {"train_loss": -6.468910217285156, "global_step": 111333, "epoch": 2650} {"train_loss": -6.511160373687744, "global_step": 111334, "epoch": 2650} {"train_loss": -6.44320011138916, "global_step": 111335, "epoch": 2650} {"train_loss": -6.423725128173828, "global_step": 111336, "epoch": 2650} {"train_loss": -6.539046287536621, "global_step": 111337, "epoch": 2650} {"train_loss": -6.5044403076171875, "global_step": 111338, "epoch": 2650} {"train_loss": -6.453646183013916, "global_step": 111339, "epoch": 2650} {"train_loss": -6.584720611572266, "global_step": 111340, "epoch": 2650} {"train_loss": -6.4727958384014315, "global_step": 111341, "epoch": 2650, "train/sim_max_reward_0": 0.2282917191847046, "train/sim_max_reward_1": 0.9908834721762206, "train/sim_max_reward_2": 0.2775615246560199, "train/sim_max_reward_3": 0.14048350060457518, "train/sim_max_reward_4": 0.7608531415016714, "train/sim_max_reward_5": 0.961990769833721, "test/sim_max_reward_4400000": 0.9175500799362453, "test/sim_max_reward_4400001": 0.590650888756548, "test/sim_max_reward_4400002": 0.0746669797828149, "test/sim_max_reward_4400003": 0.05040225610882584, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.8460406101231389, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.23256390736614335, "test/sim_max_reward_4400011": 0.9397990634042724, "test/sim_max_reward_4400012": 0.8811376607234951, "test/sim_max_reward_4400013": 0.8951708570041073, "test/sim_max_reward_4400014": 0.7873923057631196, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.1824709891528949, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23816727195727802, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 8.004751997105799e-05, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.7501226724740513, "test/sim_max_reward_4400023": 0.40265899926854837, "test/sim_max_reward_4400024": 0.9789739228327117, "test/sim_max_reward_4400025": 0.25558358668461995, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.016872392419436884, "test/sim_max_reward_4400028": 0.7290063238674048, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.946668443767214, "test/sim_max_reward_4400031": 0.8696678292095441, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3213758696375221, "test/sim_max_reward_4400034": 0.7725234260967502, "test/sim_max_reward_4400035": 0.9309092728663686, "test/sim_max_reward_4400036": 0.362049935388239, "test/sim_max_reward_4400037": 0.9185618090828195, "test/sim_max_reward_4400038": 0.35639069211305546, "test/sim_max_reward_4400039": 0.9394011758000572, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9322690840027816, "test/sim_max_reward_4400042": 0.05615056271204394, "test/sim_max_reward_4400043": 0.974547612473894, "test/sim_max_reward_4400044": 0.9232900360700792, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8637006629482853, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.9632181958039261, "train/mean_score": 0.5600106879928187, "test/mean_score": 0.49339858347296045, "val_loss": 67990.625} {"train_loss": -6.413481712341309, "global_step": 111342, "epoch": 2651} {"train_loss": -6.403914451599121, "global_step": 111343, "epoch": 2651} {"train_loss": -6.4176154136657715, "global_step": 111344, "epoch": 2651} {"train_loss": -6.300419807434082, "global_step": 111345, "epoch": 2651} {"train_loss": -6.347768306732178, "global_step": 111346, "epoch": 2651} {"train_loss": -6.422058582305908, "global_step": 111347, "epoch": 2651} {"train_loss": -6.238865375518799, "global_step": 111348, "epoch": 2651} {"train_loss": -6.434536933898926, "global_step": 111349, "epoch": 2651} {"train_loss": -6.487810134887695, "global_step": 111350, "epoch": 2651} {"train_loss": -6.392971038818359, "global_step": 111351, "epoch": 2651} {"train_loss": -6.4918012619018555, "global_step": 111352, "epoch": 2651} {"train_loss": -6.428007125854492, "global_step": 111353, "epoch": 2651} {"train_loss": -6.465934753417969, "global_step": 111354, "epoch": 2651} {"train_loss": -6.454570770263672, "global_step": 111355, "epoch": 2651} {"train_loss": -6.36555290222168, "global_step": 111356, "epoch": 2651} {"train_loss": -6.57936954498291, "global_step": 111357, "epoch": 2651} {"train_loss": -6.428637981414795, "global_step": 111358, "epoch": 2651} {"train_loss": -6.523901462554932, "global_step": 111359, "epoch": 2651} {"train_loss": -6.444858074188232, "global_step": 111360, "epoch": 2651} {"train_loss": -6.301967620849609, "global_step": 111361, "epoch": 2651} {"train_loss": -6.4832000732421875, "global_step": 111362, "epoch": 2651} {"train_loss": -6.276096343994141, "global_step": 111363, "epoch": 2651} {"train_loss": -6.4833574295043945, "global_step": 111364, "epoch": 2651} {"train_loss": -6.329757213592529, "global_step": 111365, "epoch": 2651} {"train_loss": -6.440759658813477, "global_step": 111366, "epoch": 2651} {"train_loss": -6.452998161315918, "global_step": 111367, "epoch": 2651} {"train_loss": -6.4706878662109375, "global_step": 111368, "epoch": 2651} {"train_loss": -6.4553303718566895, "global_step": 111369, "epoch": 2651} {"train_loss": -6.4783854484558105, "global_step": 111370, "epoch": 2651} {"train_loss": -6.385190963745117, "global_step": 111371, "epoch": 2651} {"train_loss": -6.436296463012695, "global_step": 111372, "epoch": 2651} {"train_loss": -6.440252304077148, "global_step": 111373, "epoch": 2651} {"train_loss": -6.372299671173096, "global_step": 111374, "epoch": 2651} {"train_loss": -6.325901508331299, "global_step": 111375, "epoch": 2651} {"train_loss": -6.396698951721191, "global_step": 111376, "epoch": 2651} {"train_loss": -6.348911285400391, "global_step": 111377, "epoch": 2651} {"train_loss": -6.436263084411621, "global_step": 111378, "epoch": 2651} {"train_loss": -6.379347801208496, "global_step": 111379, "epoch": 2651} {"train_loss": -6.403383255004883, "global_step": 111380, "epoch": 2651} {"train_loss": -6.520194053649902, "global_step": 111381, "epoch": 2651} {"train_loss": -6.410332202911377, "global_step": 111382, "epoch": 2651} {"train_loss": -6.4168804713657925, "global_step": 111383, "epoch": 2651, "val_loss": 67926.453125} {"train_loss": -6.3893632888793945, "global_step": 111384, "epoch": 2652} {"train_loss": -6.342198848724365, "global_step": 111385, "epoch": 2652} {"train_loss": -6.458003520965576, "global_step": 111386, "epoch": 2652} {"train_loss": -6.373723983764648, "global_step": 111387, "epoch": 2652} {"train_loss": -6.4956254959106445, "global_step": 111388, "epoch": 2652} {"train_loss": -6.650585174560547, "global_step": 111389, "epoch": 2652} {"train_loss": -6.4627814292907715, "global_step": 111390, "epoch": 2652} {"train_loss": -6.306929588317871, "global_step": 111391, "epoch": 2652} {"train_loss": -6.440347671508789, "global_step": 111392, "epoch": 2652} {"train_loss": -6.347336769104004, "global_step": 111393, "epoch": 2652} {"train_loss": -6.325973987579346, "global_step": 111394, "epoch": 2652} {"train_loss": -6.396319389343262, "global_step": 111395, "epoch": 2652} {"train_loss": -6.45743989944458, "global_step": 111396, "epoch": 2652} {"train_loss": -6.510975360870361, "global_step": 111397, "epoch": 2652} {"train_loss": -6.513813495635986, "global_step": 111398, "epoch": 2652} {"train_loss": -6.568154335021973, "global_step": 111399, "epoch": 2652} {"train_loss": -6.425731658935547, "global_step": 111400, "epoch": 2652} {"train_loss": -6.434211730957031, "global_step": 111401, "epoch": 2652} {"train_loss": -6.4989118576049805, "global_step": 111402, "epoch": 2652} {"train_loss": -6.399384498596191, "global_step": 111403, "epoch": 2652} {"train_loss": -6.447566509246826, "global_step": 111404, "epoch": 2652} {"train_loss": -6.449716567993164, "global_step": 111405, "epoch": 2652} {"train_loss": -6.372189044952393, "global_step": 111406, "epoch": 2652} {"train_loss": -6.651181221008301, "global_step": 111407, "epoch": 2652} {"train_loss": -6.398571968078613, "global_step": 111408, "epoch": 2652} {"train_loss": -6.436126232147217, "global_step": 111409, "epoch": 2652} {"train_loss": -6.543811798095703, "global_step": 111410, "epoch": 2652} {"train_loss": -6.446830749511719, "global_step": 111411, "epoch": 2652} {"train_loss": -6.508528232574463, "global_step": 111412, "epoch": 2652} {"train_loss": -6.494953632354736, "global_step": 111413, "epoch": 2652} {"train_loss": -6.461932182312012, "global_step": 111414, "epoch": 2652} {"train_loss": -6.501385688781738, "global_step": 111415, "epoch": 2652} {"train_loss": -6.524299144744873, "global_step": 111416, "epoch": 2652} {"train_loss": -6.441644668579102, "global_step": 111417, "epoch": 2652} {"train_loss": -6.517064094543457, "global_step": 111418, "epoch": 2652} {"train_loss": -6.447976589202881, "global_step": 111419, "epoch": 2652} {"train_loss": -6.505964279174805, "global_step": 111420, "epoch": 2652} {"train_loss": -6.631841659545898, "global_step": 111421, "epoch": 2652} {"train_loss": -6.570728302001953, "global_step": 111422, "epoch": 2652} {"train_loss": -6.485451698303223, "global_step": 111423, "epoch": 2652} {"train_loss": -6.545607566833496, "global_step": 111424, "epoch": 2652} {"train_loss": -6.468967914581299, "global_step": 111425, "epoch": 2652, "val_loss": 67877.3359375} {"train_loss": -6.61334228515625, "global_step": 111426, "epoch": 2653} {"train_loss": -6.407973289489746, "global_step": 111427, "epoch": 2653} {"train_loss": -6.437796592712402, "global_step": 111428, "epoch": 2653} {"train_loss": -6.408664226531982, "global_step": 111429, "epoch": 2653} {"train_loss": -6.351502418518066, "global_step": 111430, "epoch": 2653} {"train_loss": -6.603631496429443, "global_step": 111431, "epoch": 2653} {"train_loss": -6.518784046173096, "global_step": 111432, "epoch": 2653} {"train_loss": -6.559591770172119, "global_step": 111433, "epoch": 2653} {"train_loss": -6.554527282714844, "global_step": 111434, "epoch": 2653} {"train_loss": -6.427356243133545, "global_step": 111435, "epoch": 2653} {"train_loss": -6.629712104797363, "global_step": 111436, "epoch": 2653} {"train_loss": -6.435729503631592, "global_step": 111437, "epoch": 2653} {"train_loss": -6.508633613586426, "global_step": 111438, "epoch": 2653} {"train_loss": -6.474506855010986, "global_step": 111439, "epoch": 2653} {"train_loss": -6.412275314331055, "global_step": 111440, "epoch": 2653} {"train_loss": -6.511653423309326, "global_step": 111441, "epoch": 2653} {"train_loss": -6.319863319396973, "global_step": 111442, "epoch": 2653} {"train_loss": -6.48695182800293, "global_step": 111443, "epoch": 2653} {"train_loss": -6.500647068023682, "global_step": 111444, "epoch": 2653} {"train_loss": -6.509152889251709, "global_step": 111445, "epoch": 2653} {"train_loss": -6.4047088623046875, "global_step": 111446, "epoch": 2653} {"train_loss": -6.333285808563232, "global_step": 111447, "epoch": 2653} {"train_loss": -6.476650238037109, "global_step": 111448, "epoch": 2653} {"train_loss": -6.5476603507995605, "global_step": 111449, "epoch": 2653} {"train_loss": -6.461055278778076, "global_step": 111450, "epoch": 2653} {"train_loss": -6.419740676879883, "global_step": 111451, "epoch": 2653} {"train_loss": -6.402222633361816, "global_step": 111452, "epoch": 2653} {"train_loss": -6.443957328796387, "global_step": 111453, "epoch": 2653} {"train_loss": -6.403189659118652, "global_step": 111454, "epoch": 2653} {"train_loss": -6.476367950439453, "global_step": 111455, "epoch": 2653} {"train_loss": -6.488505840301514, "global_step": 111456, "epoch": 2653} {"train_loss": -6.473106384277344, "global_step": 111457, "epoch": 2653} {"train_loss": -6.534757137298584, "global_step": 111458, "epoch": 2653} {"train_loss": -6.438434600830078, "global_step": 111459, "epoch": 2653} {"train_loss": -6.442525386810303, "global_step": 111460, "epoch": 2653} {"train_loss": -6.480306625366211, "global_step": 111461, "epoch": 2653} {"train_loss": -6.528360366821289, "global_step": 111462, "epoch": 2653} {"train_loss": -6.470914840698242, "global_step": 111463, "epoch": 2653} {"train_loss": -6.521860599517822, "global_step": 111464, "epoch": 2653} {"train_loss": -6.310798645019531, "global_step": 111465, "epoch": 2653} {"train_loss": -6.492651462554932, "global_step": 111466, "epoch": 2653} {"train_loss": -6.468450682503836, "global_step": 111467, "epoch": 2653, "val_loss": 68018.6875} {"train_loss": -6.411669731140137, "global_step": 111468, "epoch": 2654} {"train_loss": -6.346242904663086, "global_step": 111469, "epoch": 2654} {"train_loss": -6.457378387451172, "global_step": 111470, "epoch": 2654} {"train_loss": -6.401576042175293, "global_step": 111471, "epoch": 2654} {"train_loss": -6.383111000061035, "global_step": 111472, "epoch": 2654} {"train_loss": -6.469873428344727, "global_step": 111473, "epoch": 2654} {"train_loss": -6.32149076461792, "global_step": 111474, "epoch": 2654} {"train_loss": -6.430615425109863, "global_step": 111475, "epoch": 2654} {"train_loss": -6.425411224365234, "global_step": 111476, "epoch": 2654} {"train_loss": -6.315727710723877, "global_step": 111477, "epoch": 2654} {"train_loss": -6.4243903160095215, "global_step": 111478, "epoch": 2654} {"train_loss": -6.277556419372559, "global_step": 111479, "epoch": 2654} {"train_loss": -6.382180690765381, "global_step": 111480, "epoch": 2654} {"train_loss": -6.403416633605957, "global_step": 111481, "epoch": 2654} {"train_loss": -6.41819953918457, "global_step": 111482, "epoch": 2654} {"train_loss": -6.291384220123291, "global_step": 111483, "epoch": 2654} {"train_loss": -6.283575057983398, "global_step": 111484, "epoch": 2654} {"train_loss": -6.321133136749268, "global_step": 111485, "epoch": 2654} {"train_loss": -6.401891708374023, "global_step": 111486, "epoch": 2654} {"train_loss": -6.338695526123047, "global_step": 111487, "epoch": 2654} {"train_loss": -6.27723503112793, "global_step": 111488, "epoch": 2654} {"train_loss": -6.367241382598877, "global_step": 111489, "epoch": 2654} {"train_loss": -6.524498462677002, "global_step": 111490, "epoch": 2654} {"train_loss": -6.456415176391602, "global_step": 111491, "epoch": 2654} {"train_loss": -6.396319389343262, "global_step": 111492, "epoch": 2654} {"train_loss": -6.358287334442139, "global_step": 111493, "epoch": 2654} {"train_loss": -6.342839241027832, "global_step": 111494, "epoch": 2654} {"train_loss": -6.444744110107422, "global_step": 111495, "epoch": 2654} {"train_loss": -6.486538887023926, "global_step": 111496, "epoch": 2654} {"train_loss": -6.496700286865234, "global_step": 111497, "epoch": 2654} {"train_loss": -6.486431121826172, "global_step": 111498, "epoch": 2654} {"train_loss": -6.384607315063477, "global_step": 111499, "epoch": 2654} {"train_loss": -6.473575592041016, "global_step": 111500, "epoch": 2654} {"train_loss": -6.455743789672852, "global_step": 111501, "epoch": 2654} {"train_loss": -6.43288516998291, "global_step": 111502, "epoch": 2654} {"train_loss": -6.43705940246582, "global_step": 111503, "epoch": 2654} {"train_loss": -6.361968517303467, "global_step": 111504, "epoch": 2654} {"train_loss": -6.346958637237549, "global_step": 111505, "epoch": 2654} {"train_loss": -6.473498821258545, "global_step": 111506, "epoch": 2654} {"train_loss": -6.422408103942871, "global_step": 111507, "epoch": 2654} {"train_loss": -6.473000526428223, "global_step": 111508, "epoch": 2654} {"train_loss": -6.40088289124625, "global_step": 111509, "epoch": 2654, "val_loss": 68088.5546875} {"train_loss": -6.405146598815918, "global_step": 111510, "epoch": 2655} {"train_loss": -6.432175636291504, "global_step": 111511, "epoch": 2655} {"train_loss": -6.466217041015625, "global_step": 111512, "epoch": 2655} {"train_loss": -6.358273029327393, "global_step": 111513, "epoch": 2655} {"train_loss": -6.319736480712891, "global_step": 111514, "epoch": 2655} {"train_loss": -6.375770568847656, "global_step": 111515, "epoch": 2655} {"train_loss": -6.3620758056640625, "global_step": 111516, "epoch": 2655} {"train_loss": -6.3857574462890625, "global_step": 111517, "epoch": 2655} {"train_loss": -6.484159469604492, "global_step": 111518, "epoch": 2655} {"train_loss": -6.598254203796387, "global_step": 111519, "epoch": 2655} {"train_loss": -6.367581844329834, "global_step": 111520, "epoch": 2655} {"train_loss": -6.52278995513916, "global_step": 111521, "epoch": 2655} {"train_loss": -6.460238456726074, "global_step": 111522, "epoch": 2655} {"train_loss": -6.476166725158691, "global_step": 111523, "epoch": 2655} {"train_loss": -6.373968601226807, "global_step": 111524, "epoch": 2655} {"train_loss": -6.52934455871582, "global_step": 111525, "epoch": 2655} {"train_loss": -6.627492904663086, "global_step": 111526, "epoch": 2655} {"train_loss": -6.530014991760254, "global_step": 111527, "epoch": 2655} {"train_loss": -6.551139831542969, "global_step": 111528, "epoch": 2655} {"train_loss": -6.424862861633301, "global_step": 111529, "epoch": 2655} {"train_loss": -6.618161201477051, "global_step": 111530, "epoch": 2655} {"train_loss": -6.468922138214111, "global_step": 111531, "epoch": 2655} {"train_loss": -6.623398303985596, "global_step": 111532, "epoch": 2655} {"train_loss": -6.57029914855957, "global_step": 111533, "epoch": 2655} {"train_loss": -6.4720354080200195, "global_step": 111534, "epoch": 2655} {"train_loss": -6.56902551651001, "global_step": 111535, "epoch": 2655} {"train_loss": -6.48026704788208, "global_step": 111536, "epoch": 2655} {"train_loss": -6.567625045776367, "global_step": 111537, "epoch": 2655} {"train_loss": -6.502300262451172, "global_step": 111538, "epoch": 2655} {"train_loss": -6.474773406982422, "global_step": 111539, "epoch": 2655} {"train_loss": -6.423389911651611, "global_step": 111540, "epoch": 2655} {"train_loss": -6.506870269775391, "global_step": 111541, "epoch": 2655} {"train_loss": -6.391498565673828, "global_step": 111542, "epoch": 2655} {"train_loss": -6.5512518882751465, "global_step": 111543, "epoch": 2655} {"train_loss": -6.477994918823242, "global_step": 111544, "epoch": 2655} {"train_loss": -6.423776626586914, "global_step": 111545, "epoch": 2655} {"train_loss": -6.3854804039001465, "global_step": 111546, "epoch": 2655} {"train_loss": -6.380859851837158, "global_step": 111547, "epoch": 2655} {"train_loss": -6.373980522155762, "global_step": 111548, "epoch": 2655} {"train_loss": -6.555293560028076, "global_step": 111549, "epoch": 2655} {"train_loss": -6.495884418487549, "global_step": 111550, "epoch": 2655} {"train_loss": -6.469187339146932, "global_step": 111551, "epoch": 2655, "val_loss": 68178.21875} {"train_loss": -6.343946933746338, "global_step": 111552, "epoch": 2656} {"train_loss": -6.6101789474487305, "global_step": 111553, "epoch": 2656} {"train_loss": -6.270531177520752, "global_step": 111554, "epoch": 2656} {"train_loss": -6.342028617858887, "global_step": 111555, "epoch": 2656} {"train_loss": -6.491488933563232, "global_step": 111556, "epoch": 2656} {"train_loss": -6.355630874633789, "global_step": 111557, "epoch": 2656} {"train_loss": -6.54906702041626, "global_step": 111558, "epoch": 2656} {"train_loss": -6.4197587966918945, "global_step": 111559, "epoch": 2656} {"train_loss": -6.455544471740723, "global_step": 111560, "epoch": 2656} {"train_loss": -6.351271629333496, "global_step": 111561, "epoch": 2656} {"train_loss": -6.388291358947754, "global_step": 111562, "epoch": 2656} {"train_loss": -6.351452827453613, "global_step": 111563, "epoch": 2656} {"train_loss": -6.478946685791016, "global_step": 111564, "epoch": 2656} {"train_loss": -6.417508125305176, "global_step": 111565, "epoch": 2656} {"train_loss": -6.335055351257324, "global_step": 111566, "epoch": 2656} {"train_loss": -6.437594413757324, "global_step": 111567, "epoch": 2656} {"train_loss": -6.274405479431152, "global_step": 111568, "epoch": 2656} {"train_loss": -6.4093708992004395, "global_step": 111569, "epoch": 2656} {"train_loss": -6.538809776306152, "global_step": 111570, "epoch": 2656} {"train_loss": -6.350554466247559, "global_step": 111571, "epoch": 2656} {"train_loss": -6.495963096618652, "global_step": 111572, "epoch": 2656} {"train_loss": -6.420022010803223, "global_step": 111573, "epoch": 2656} {"train_loss": -6.3640289306640625, "global_step": 111574, "epoch": 2656} {"train_loss": -6.441285610198975, "global_step": 111575, "epoch": 2656} {"train_loss": -6.370718479156494, "global_step": 111576, "epoch": 2656} {"train_loss": -6.463797569274902, "global_step": 111577, "epoch": 2656} {"train_loss": -6.4211530685424805, "global_step": 111578, "epoch": 2656} {"train_loss": -6.411391735076904, "global_step": 111579, "epoch": 2656} {"train_loss": -6.413905143737793, "global_step": 111580, "epoch": 2656} {"train_loss": -6.310834884643555, "global_step": 111581, "epoch": 2656} {"train_loss": -6.39426326751709, "global_step": 111582, "epoch": 2656} {"train_loss": -6.41041374206543, "global_step": 111583, "epoch": 2656} {"train_loss": -6.317890167236328, "global_step": 111584, "epoch": 2656} {"train_loss": -6.295848846435547, "global_step": 111585, "epoch": 2656} {"train_loss": -6.470309257507324, "global_step": 111586, "epoch": 2656} {"train_loss": -6.345522880554199, "global_step": 111587, "epoch": 2656} {"train_loss": -6.347723960876465, "global_step": 111588, "epoch": 2656} {"train_loss": -6.2892537117004395, "global_step": 111589, "epoch": 2656} {"train_loss": -6.395175933837891, "global_step": 111590, "epoch": 2656} {"train_loss": -6.367522239685059, "global_step": 111591, "epoch": 2656} {"train_loss": -6.3722968101501465, "global_step": 111592, "epoch": 2656} {"train_loss": -6.398366394497099, "global_step": 111593, "epoch": 2656, "val_loss": 67982.671875} {"train_loss": -6.378887176513672, "global_step": 111594, "epoch": 2657} {"train_loss": -6.509618759155273, "global_step": 111595, "epoch": 2657} {"train_loss": -6.258639335632324, "global_step": 111596, "epoch": 2657} {"train_loss": -6.459171295166016, "global_step": 111597, "epoch": 2657} {"train_loss": -6.459472179412842, "global_step": 111598, "epoch": 2657} {"train_loss": -6.433548927307129, "global_step": 111599, "epoch": 2657} {"train_loss": -6.244551658630371, "global_step": 111600, "epoch": 2657} {"train_loss": -6.477583885192871, "global_step": 111601, "epoch": 2657} {"train_loss": -6.495936393737793, "global_step": 111602, "epoch": 2657} {"train_loss": -6.361135482788086, "global_step": 111603, "epoch": 2657} {"train_loss": -6.3621978759765625, "global_step": 111604, "epoch": 2657} {"train_loss": -6.371520042419434, "global_step": 111605, "epoch": 2657} {"train_loss": -6.339808940887451, "global_step": 111606, "epoch": 2657} {"train_loss": -6.50706672668457, "global_step": 111607, "epoch": 2657} {"train_loss": -6.408825874328613, "global_step": 111608, "epoch": 2657} {"train_loss": -6.530702114105225, "global_step": 111609, "epoch": 2657} {"train_loss": -6.546393394470215, "global_step": 111610, "epoch": 2657} {"train_loss": -6.375295639038086, "global_step": 111611, "epoch": 2657} {"train_loss": -6.375539779663086, "global_step": 111612, "epoch": 2657} {"train_loss": -6.458756923675537, "global_step": 111613, "epoch": 2657} {"train_loss": -6.522289276123047, "global_step": 111614, "epoch": 2657} {"train_loss": -6.426760196685791, "global_step": 111615, "epoch": 2657} {"train_loss": -6.3914666175842285, "global_step": 111616, "epoch": 2657} {"train_loss": -6.469884872436523, "global_step": 111617, "epoch": 2657} {"train_loss": -6.453895092010498, "global_step": 111618, "epoch": 2657} {"train_loss": -6.394166946411133, "global_step": 111619, "epoch": 2657} {"train_loss": -6.54432487487793, "global_step": 111620, "epoch": 2657} {"train_loss": -6.434325218200684, "global_step": 111621, "epoch": 2657} {"train_loss": -6.555788516998291, "global_step": 111622, "epoch": 2657} {"train_loss": -6.4596147537231445, "global_step": 111623, "epoch": 2657} {"train_loss": -6.560998916625977, "global_step": 111624, "epoch": 2657} {"train_loss": -6.573002815246582, "global_step": 111625, "epoch": 2657} {"train_loss": -6.515947341918945, "global_step": 111626, "epoch": 2657} {"train_loss": -6.442065238952637, "global_step": 111627, "epoch": 2657} {"train_loss": -6.347325325012207, "global_step": 111628, "epoch": 2657} {"train_loss": -6.377901077270508, "global_step": 111629, "epoch": 2657} {"train_loss": -6.458047866821289, "global_step": 111630, "epoch": 2657} {"train_loss": -6.57902717590332, "global_step": 111631, "epoch": 2657} {"train_loss": -6.437674522399902, "global_step": 111632, "epoch": 2657} {"train_loss": -6.427373886108398, "global_step": 111633, "epoch": 2657} {"train_loss": -6.513952732086182, "global_step": 111634, "epoch": 2657} {"train_loss": -6.446755602246239, "global_step": 111635, "epoch": 2657, "val_loss": 67799.6484375} {"train_loss": -6.469036102294922, "global_step": 111636, "epoch": 2658} {"train_loss": -6.489077568054199, "global_step": 111637, "epoch": 2658} {"train_loss": -6.401301860809326, "global_step": 111638, "epoch": 2658} {"train_loss": -6.42556095123291, "global_step": 111639, "epoch": 2658} {"train_loss": -6.346826553344727, "global_step": 111640, "epoch": 2658} {"train_loss": -6.5155439376831055, "global_step": 111641, "epoch": 2658} {"train_loss": -6.59063720703125, "global_step": 111642, "epoch": 2658} {"train_loss": -6.542754173278809, "global_step": 111643, "epoch": 2658} {"train_loss": -6.532620429992676, "global_step": 111644, "epoch": 2658} {"train_loss": -6.4675397872924805, "global_step": 111645, "epoch": 2658} {"train_loss": -6.304442882537842, "global_step": 111646, "epoch": 2658} {"train_loss": -6.477699279785156, "global_step": 111647, "epoch": 2658} {"train_loss": -6.4409942626953125, "global_step": 111648, "epoch": 2658} {"train_loss": -6.440363883972168, "global_step": 111649, "epoch": 2658} {"train_loss": -6.420760631561279, "global_step": 111650, "epoch": 2658} {"train_loss": -6.413599491119385, "global_step": 111651, "epoch": 2658} {"train_loss": -6.396212100982666, "global_step": 111652, "epoch": 2658} {"train_loss": -6.369392395019531, "global_step": 111653, "epoch": 2658} {"train_loss": -6.5018415451049805, "global_step": 111654, "epoch": 2658} {"train_loss": -6.405937671661377, "global_step": 111655, "epoch": 2658} {"train_loss": -6.40665340423584, "global_step": 111656, "epoch": 2658} {"train_loss": -6.507461071014404, "global_step": 111657, "epoch": 2658} {"train_loss": -6.302788257598877, "global_step": 111658, "epoch": 2658} {"train_loss": -6.436369895935059, "global_step": 111659, "epoch": 2658} {"train_loss": -6.583229064941406, "global_step": 111660, "epoch": 2658} {"train_loss": -6.47490119934082, "global_step": 111661, "epoch": 2658} {"train_loss": -6.422231674194336, "global_step": 111662, "epoch": 2658} {"train_loss": -6.441829681396484, "global_step": 111663, "epoch": 2658} {"train_loss": -6.5499372482299805, "global_step": 111664, "epoch": 2658} {"train_loss": -6.477230548858643, "global_step": 111665, "epoch": 2658} {"train_loss": -6.3919677734375, "global_step": 111666, "epoch": 2658} {"train_loss": -6.549739360809326, "global_step": 111667, "epoch": 2658} {"train_loss": -6.548873424530029, "global_step": 111668, "epoch": 2658} {"train_loss": -6.400134086608887, "global_step": 111669, "epoch": 2658} {"train_loss": -6.396746635437012, "global_step": 111670, "epoch": 2658} {"train_loss": -6.458049297332764, "global_step": 111671, "epoch": 2658} {"train_loss": -6.444352149963379, "global_step": 111672, "epoch": 2658} {"train_loss": -6.44584846496582, "global_step": 111673, "epoch": 2658} {"train_loss": -6.443209648132324, "global_step": 111674, "epoch": 2658} {"train_loss": -6.35792875289917, "global_step": 111675, "epoch": 2658} {"train_loss": -6.421239852905273, "global_step": 111676, "epoch": 2658} {"train_loss": -6.448293822152274, "global_step": 111677, "epoch": 2658, "val_loss": 67885.8359375} {"train_loss": -6.494381904602051, "global_step": 111678, "epoch": 2659} {"train_loss": -6.393503189086914, "global_step": 111679, "epoch": 2659} {"train_loss": -6.400264739990234, "global_step": 111680, "epoch": 2659} {"train_loss": -6.40893030166626, "global_step": 111681, "epoch": 2659} {"train_loss": -6.458369255065918, "global_step": 111682, "epoch": 2659} {"train_loss": -6.3892741203308105, "global_step": 111683, "epoch": 2659} {"train_loss": -6.467161178588867, "global_step": 111684, "epoch": 2659} {"train_loss": -6.501461505889893, "global_step": 111685, "epoch": 2659} {"train_loss": -6.4819111824035645, "global_step": 111686, "epoch": 2659} {"train_loss": -6.565339088439941, "global_step": 111687, "epoch": 2659} {"train_loss": -6.4193434715271, "global_step": 111688, "epoch": 2659} {"train_loss": -6.550914764404297, "global_step": 111689, "epoch": 2659} {"train_loss": -6.397406101226807, "global_step": 111690, "epoch": 2659} {"train_loss": -6.535975456237793, "global_step": 111691, "epoch": 2659} {"train_loss": -6.560091018676758, "global_step": 111692, "epoch": 2659} {"train_loss": -6.437203407287598, "global_step": 111693, "epoch": 2659} {"train_loss": -6.501008033752441, "global_step": 111694, "epoch": 2659} {"train_loss": -6.5154619216918945, "global_step": 111695, "epoch": 2659} {"train_loss": -6.47915506362915, "global_step": 111696, "epoch": 2659} {"train_loss": -6.57861852645874, "global_step": 111697, "epoch": 2659} {"train_loss": -6.505204677581787, "global_step": 111698, "epoch": 2659} {"train_loss": -6.4909348487854, "global_step": 111699, "epoch": 2659} {"train_loss": -6.438633918762207, "global_step": 111700, "epoch": 2659} {"train_loss": -6.5523681640625, "global_step": 111701, "epoch": 2659} {"train_loss": -6.445427894592285, "global_step": 111702, "epoch": 2659} {"train_loss": -6.573224067687988, "global_step": 111703, "epoch": 2659} {"train_loss": -6.489990234375, "global_step": 111704, "epoch": 2659} {"train_loss": -6.520254611968994, "global_step": 111705, "epoch": 2659} {"train_loss": -6.561562538146973, "global_step": 111706, "epoch": 2659} {"train_loss": -6.462465286254883, "global_step": 111707, "epoch": 2659} {"train_loss": -6.548936367034912, "global_step": 111708, "epoch": 2659} {"train_loss": -6.559582710266113, "global_step": 111709, "epoch": 2659} {"train_loss": -6.466648578643799, "global_step": 111710, "epoch": 2659} {"train_loss": -6.508726119995117, "global_step": 111711, "epoch": 2659} {"train_loss": -6.447331428527832, "global_step": 111712, "epoch": 2659} {"train_loss": -6.415318489074707, "global_step": 111713, "epoch": 2659} {"train_loss": -6.426557540893555, "global_step": 111714, "epoch": 2659} {"train_loss": -6.472711086273193, "global_step": 111715, "epoch": 2659} {"train_loss": -6.430971145629883, "global_step": 111716, "epoch": 2659} {"train_loss": -6.465259552001953, "global_step": 111717, "epoch": 2659} {"train_loss": -6.449833393096924, "global_step": 111718, "epoch": 2659} {"train_loss": -6.48436214810326, "global_step": 111719, "epoch": 2659, "val_loss": 67761.59375} {"train_loss": -6.455190658569336, "global_step": 111720, "epoch": 2660} {"train_loss": -6.470733165740967, "global_step": 111721, "epoch": 2660} {"train_loss": -6.470954895019531, "global_step": 111722, "epoch": 2660} {"train_loss": -6.48544979095459, "global_step": 111723, "epoch": 2660} {"train_loss": -6.510157585144043, "global_step": 111724, "epoch": 2660} {"train_loss": -6.357852935791016, "global_step": 111725, "epoch": 2660} {"train_loss": -6.422837257385254, "global_step": 111726, "epoch": 2660} {"train_loss": -6.239455223083496, "global_step": 111727, "epoch": 2660} {"train_loss": -6.4377522468566895, "global_step": 111728, "epoch": 2660} {"train_loss": -6.5124359130859375, "global_step": 111729, "epoch": 2660} {"train_loss": -6.418390274047852, "global_step": 111730, "epoch": 2660} {"train_loss": -6.427786827087402, "global_step": 111731, "epoch": 2660} {"train_loss": -6.3293538093566895, "global_step": 111732, "epoch": 2660} {"train_loss": -6.367271423339844, "global_step": 111733, "epoch": 2660} {"train_loss": -6.231971263885498, "global_step": 111734, "epoch": 2660} {"train_loss": -6.493429183959961, "global_step": 111735, "epoch": 2660} {"train_loss": -6.333408832550049, "global_step": 111736, "epoch": 2660} {"train_loss": -6.3526763916015625, "global_step": 111737, "epoch": 2660} {"train_loss": -6.461982250213623, "global_step": 111738, "epoch": 2660} {"train_loss": -6.381049156188965, "global_step": 111739, "epoch": 2660} {"train_loss": -6.464419841766357, "global_step": 111740, "epoch": 2660} {"train_loss": -6.411208152770996, "global_step": 111741, "epoch": 2660} {"train_loss": -6.420938491821289, "global_step": 111742, "epoch": 2660} {"train_loss": -6.306634426116943, "global_step": 111743, "epoch": 2660} {"train_loss": -6.400819301605225, "global_step": 111744, "epoch": 2660} {"train_loss": -6.40281343460083, "global_step": 111745, "epoch": 2660} {"train_loss": -6.4621195793151855, "global_step": 111746, "epoch": 2660} {"train_loss": -6.451335906982422, "global_step": 111747, "epoch": 2660} {"train_loss": -6.509521007537842, "global_step": 111748, "epoch": 2660} {"train_loss": -6.371029853820801, "global_step": 111749, "epoch": 2660} {"train_loss": -6.478522300720215, "global_step": 111750, "epoch": 2660} {"train_loss": -6.381845474243164, "global_step": 111751, "epoch": 2660} {"train_loss": -6.415096282958984, "global_step": 111752, "epoch": 2660} {"train_loss": -6.438455581665039, "global_step": 111753, "epoch": 2660} {"train_loss": -6.326302528381348, "global_step": 111754, "epoch": 2660} {"train_loss": -6.448073387145996, "global_step": 111755, "epoch": 2660} {"train_loss": -6.4035773277282715, "global_step": 111756, "epoch": 2660} {"train_loss": -6.359728813171387, "global_step": 111757, "epoch": 2660} {"train_loss": -6.546724319458008, "global_step": 111758, "epoch": 2660} {"train_loss": -6.389490127563477, "global_step": 111759, "epoch": 2660} {"train_loss": -6.470470428466797, "global_step": 111760, "epoch": 2660} {"train_loss": -6.412714685712542, "global_step": 111761, "epoch": 2660, "val_loss": 67767.6875} {"train_loss": -6.469045639038086, "global_step": 111762, "epoch": 2661} {"train_loss": -6.409412384033203, "global_step": 111763, "epoch": 2661} {"train_loss": -6.382697582244873, "global_step": 111764, "epoch": 2661} {"train_loss": -6.397626876831055, "global_step": 111765, "epoch": 2661} {"train_loss": -6.362781524658203, "global_step": 111766, "epoch": 2661} {"train_loss": -6.372855186462402, "global_step": 111767, "epoch": 2661} {"train_loss": -6.4082350730896, "global_step": 111768, "epoch": 2661} {"train_loss": -6.401070594787598, "global_step": 111769, "epoch": 2661} {"train_loss": -6.324228763580322, "global_step": 111770, "epoch": 2661} {"train_loss": -6.51905632019043, "global_step": 111771, "epoch": 2661} {"train_loss": -6.347003936767578, "global_step": 111772, "epoch": 2661} {"train_loss": -6.459275245666504, "global_step": 111773, "epoch": 2661} {"train_loss": -6.512152671813965, "global_step": 111774, "epoch": 2661} {"train_loss": -6.374312877655029, "global_step": 111775, "epoch": 2661} {"train_loss": -6.463974475860596, "global_step": 111776, "epoch": 2661} {"train_loss": -6.4735918045043945, "global_step": 111777, "epoch": 2661} {"train_loss": -6.44145393371582, "global_step": 111778, "epoch": 2661} {"train_loss": -6.489480972290039, "global_step": 111779, "epoch": 2661} {"train_loss": -6.489629745483398, "global_step": 111780, "epoch": 2661} {"train_loss": -6.515324592590332, "global_step": 111781, "epoch": 2661} {"train_loss": -6.412006378173828, "global_step": 111782, "epoch": 2661} {"train_loss": -6.350569725036621, "global_step": 111783, "epoch": 2661} {"train_loss": -6.399540901184082, "global_step": 111784, "epoch": 2661} {"train_loss": -6.382317543029785, "global_step": 111785, "epoch": 2661} {"train_loss": -6.436860084533691, "global_step": 111786, "epoch": 2661} {"train_loss": -6.494709014892578, "global_step": 111787, "epoch": 2661} {"train_loss": -6.526641845703125, "global_step": 111788, "epoch": 2661} {"train_loss": -6.5070343017578125, "global_step": 111789, "epoch": 2661} {"train_loss": -6.429032325744629, "global_step": 111790, "epoch": 2661} {"train_loss": -6.480044841766357, "global_step": 111791, "epoch": 2661} {"train_loss": -6.451613426208496, "global_step": 111792, "epoch": 2661} {"train_loss": -6.457571029663086, "global_step": 111793, "epoch": 2661} {"train_loss": -6.498653411865234, "global_step": 111794, "epoch": 2661} {"train_loss": -6.622720718383789, "global_step": 111795, "epoch": 2661} {"train_loss": -6.497326850891113, "global_step": 111796, "epoch": 2661} {"train_loss": -6.4951395988464355, "global_step": 111797, "epoch": 2661} {"train_loss": -6.516073226928711, "global_step": 111798, "epoch": 2661} {"train_loss": -6.49385404586792, "global_step": 111799, "epoch": 2661} {"train_loss": -6.500980377197266, "global_step": 111800, "epoch": 2661} {"train_loss": -6.388754844665527, "global_step": 111801, "epoch": 2661} {"train_loss": -6.6484479904174805, "global_step": 111802, "epoch": 2661} {"train_loss": -6.4555758862268355, "global_step": 111803, "epoch": 2661, "val_loss": 67816.171875} {"train_loss": -6.566193103790283, "global_step": 111804, "epoch": 2662} {"train_loss": -6.560822486877441, "global_step": 111805, "epoch": 2662} {"train_loss": -6.494106292724609, "global_step": 111806, "epoch": 2662} {"train_loss": -6.465945243835449, "global_step": 111807, "epoch": 2662} {"train_loss": -6.478419303894043, "global_step": 111808, "epoch": 2662} {"train_loss": -6.4821906089782715, "global_step": 111809, "epoch": 2662} {"train_loss": -6.455214500427246, "global_step": 111810, "epoch": 2662} {"train_loss": -6.563295364379883, "global_step": 111811, "epoch": 2662} {"train_loss": -6.571327209472656, "global_step": 111812, "epoch": 2662} {"train_loss": -6.475623607635498, "global_step": 111813, "epoch": 2662} {"train_loss": -6.389472484588623, "global_step": 111814, "epoch": 2662} {"train_loss": -6.456124305725098, "global_step": 111815, "epoch": 2662} {"train_loss": -6.462420463562012, "global_step": 111816, "epoch": 2662} {"train_loss": -6.508950710296631, "global_step": 111817, "epoch": 2662} {"train_loss": -6.409322738647461, "global_step": 111818, "epoch": 2662} {"train_loss": -6.4757537841796875, "global_step": 111819, "epoch": 2662} {"train_loss": -6.336289405822754, "global_step": 111820, "epoch": 2662} {"train_loss": -6.565741062164307, "global_step": 111821, "epoch": 2662} {"train_loss": -6.430941581726074, "global_step": 111822, "epoch": 2662} {"train_loss": -6.358327865600586, "global_step": 111823, "epoch": 2662} {"train_loss": -6.378401279449463, "global_step": 111824, "epoch": 2662} {"train_loss": -6.346847057342529, "global_step": 111825, "epoch": 2662} {"train_loss": -6.363010883331299, "global_step": 111826, "epoch": 2662} {"train_loss": -6.442212104797363, "global_step": 111827, "epoch": 2662} {"train_loss": -6.3749895095825195, "global_step": 111828, "epoch": 2662} {"train_loss": -6.429330348968506, "global_step": 111829, "epoch": 2662} {"train_loss": -6.431489944458008, "global_step": 111830, "epoch": 2662} {"train_loss": -6.369851112365723, "global_step": 111831, "epoch": 2662} {"train_loss": -6.3927226066589355, "global_step": 111832, "epoch": 2662} {"train_loss": -6.4214959144592285, "global_step": 111833, "epoch": 2662} {"train_loss": -6.392889976501465, "global_step": 111834, "epoch": 2662} {"train_loss": -6.383569717407227, "global_step": 111835, "epoch": 2662} {"train_loss": -6.423218727111816, "global_step": 111836, "epoch": 2662} {"train_loss": -6.537072658538818, "global_step": 111837, "epoch": 2662} {"train_loss": -6.327247619628906, "global_step": 111838, "epoch": 2662} {"train_loss": -6.409376621246338, "global_step": 111839, "epoch": 2662} {"train_loss": -6.33640193939209, "global_step": 111840, "epoch": 2662} {"train_loss": -6.389344215393066, "global_step": 111841, "epoch": 2662} {"train_loss": -6.397942543029785, "global_step": 111842, "epoch": 2662} {"train_loss": -6.431982517242432, "global_step": 111843, "epoch": 2662} {"train_loss": -6.594449996948242, "global_step": 111844, "epoch": 2662} {"train_loss": -6.441547507331485, "global_step": 111845, "epoch": 2662, "val_loss": 67853.7265625} {"train_loss": -6.427704811096191, "global_step": 111846, "epoch": 2663} {"train_loss": -6.44174337387085, "global_step": 111847, "epoch": 2663} {"train_loss": -6.44764518737793, "global_step": 111848, "epoch": 2663} {"train_loss": -6.484471321105957, "global_step": 111849, "epoch": 2663} {"train_loss": -6.471620559692383, "global_step": 111850, "epoch": 2663} {"train_loss": -6.476747989654541, "global_step": 111851, "epoch": 2663} {"train_loss": -6.554952621459961, "global_step": 111852, "epoch": 2663} {"train_loss": -6.414218425750732, "global_step": 111853, "epoch": 2663} {"train_loss": -6.5470356941223145, "global_step": 111854, "epoch": 2663} {"train_loss": -6.597923278808594, "global_step": 111855, "epoch": 2663} {"train_loss": -6.553433895111084, "global_step": 111856, "epoch": 2663} {"train_loss": -6.510382652282715, "global_step": 111857, "epoch": 2663} {"train_loss": -6.6417083740234375, "global_step": 111858, "epoch": 2663} {"train_loss": -6.51063871383667, "global_step": 111859, "epoch": 2663} {"train_loss": -6.543891906738281, "global_step": 111860, "epoch": 2663} {"train_loss": -6.547408103942871, "global_step": 111861, "epoch": 2663} {"train_loss": -6.558908462524414, "global_step": 111862, "epoch": 2663} {"train_loss": -6.515192985534668, "global_step": 111863, "epoch": 2663} {"train_loss": -6.557958126068115, "global_step": 111864, "epoch": 2663} {"train_loss": -6.506968975067139, "global_step": 111865, "epoch": 2663} {"train_loss": -6.372864246368408, "global_step": 111866, "epoch": 2663} {"train_loss": -6.429415702819824, "global_step": 111867, "epoch": 2663} {"train_loss": -6.484689712524414, "global_step": 111868, "epoch": 2663} {"train_loss": -6.519359111785889, "global_step": 111869, "epoch": 2663} {"train_loss": -6.559883117675781, "global_step": 111870, "epoch": 2663} {"train_loss": -6.546023368835449, "global_step": 111871, "epoch": 2663} {"train_loss": -6.477302551269531, "global_step": 111872, "epoch": 2663} {"train_loss": -6.454165935516357, "global_step": 111873, "epoch": 2663} {"train_loss": -6.410697937011719, "global_step": 111874, "epoch": 2663} {"train_loss": -6.443320274353027, "global_step": 111875, "epoch": 2663} {"train_loss": -6.35936164855957, "global_step": 111876, "epoch": 2663} {"train_loss": -6.414658546447754, "global_step": 111877, "epoch": 2663} {"train_loss": -6.398509979248047, "global_step": 111878, "epoch": 2663} {"train_loss": -6.565131187438965, "global_step": 111879, "epoch": 2663} {"train_loss": -6.380713939666748, "global_step": 111880, "epoch": 2663} {"train_loss": -6.388112545013428, "global_step": 111881, "epoch": 2663} {"train_loss": -6.474858283996582, "global_step": 111882, "epoch": 2663} {"train_loss": -6.446072578430176, "global_step": 111883, "epoch": 2663} {"train_loss": -6.404003143310547, "global_step": 111884, "epoch": 2663} {"train_loss": -6.3574299812316895, "global_step": 111885, "epoch": 2663} {"train_loss": -6.332912445068359, "global_step": 111886, "epoch": 2663} {"train_loss": -6.4755610057285855, "global_step": 111887, "epoch": 2663, "val_loss": 68146.0859375} {"train_loss": -6.416591644287109, "global_step": 111888, "epoch": 2664} {"train_loss": -6.417652130126953, "global_step": 111889, "epoch": 2664} {"train_loss": -6.445746898651123, "global_step": 111890, "epoch": 2664} {"train_loss": -6.435952186584473, "global_step": 111891, "epoch": 2664} {"train_loss": -6.413245677947998, "global_step": 111892, "epoch": 2664} {"train_loss": -6.317382335662842, "global_step": 111893, "epoch": 2664} {"train_loss": -6.353382587432861, "global_step": 111894, "epoch": 2664} {"train_loss": -6.426083564758301, "global_step": 111895, "epoch": 2664} {"train_loss": -6.438368797302246, "global_step": 111896, "epoch": 2664} {"train_loss": -6.291532516479492, "global_step": 111897, "epoch": 2664} {"train_loss": -6.449039936065674, "global_step": 111898, "epoch": 2664} {"train_loss": -6.4533610343933105, "global_step": 111899, "epoch": 2664} {"train_loss": -6.4615325927734375, "global_step": 111900, "epoch": 2664} {"train_loss": -6.474391937255859, "global_step": 111901, "epoch": 2664} {"train_loss": -6.408954620361328, "global_step": 111902, "epoch": 2664} {"train_loss": -6.583349704742432, "global_step": 111903, "epoch": 2664} {"train_loss": -6.3652496337890625, "global_step": 111904, "epoch": 2664} {"train_loss": -6.487113952636719, "global_step": 111905, "epoch": 2664} {"train_loss": -6.428546905517578, "global_step": 111906, "epoch": 2664} {"train_loss": -6.472909450531006, "global_step": 111907, "epoch": 2664} {"train_loss": -6.579873561859131, "global_step": 111908, "epoch": 2664} {"train_loss": -6.4302592277526855, "global_step": 111909, "epoch": 2664} {"train_loss": -6.461935997009277, "global_step": 111910, "epoch": 2664} {"train_loss": -6.547102928161621, "global_step": 111911, "epoch": 2664} {"train_loss": -6.4716901779174805, "global_step": 111912, "epoch": 2664} {"train_loss": -6.520352840423584, "global_step": 111913, "epoch": 2664} {"train_loss": -6.454756736755371, "global_step": 111914, "epoch": 2664} {"train_loss": -6.549004554748535, "global_step": 111915, "epoch": 2664} {"train_loss": -6.454501628875732, "global_step": 111916, "epoch": 2664} {"train_loss": -6.4219160079956055, "global_step": 111917, "epoch": 2664} {"train_loss": -6.384815216064453, "global_step": 111918, "epoch": 2664} {"train_loss": -6.342161178588867, "global_step": 111919, "epoch": 2664} {"train_loss": -6.489472389221191, "global_step": 111920, "epoch": 2664} {"train_loss": -6.437350749969482, "global_step": 111921, "epoch": 2664} {"train_loss": -6.457065105438232, "global_step": 111922, "epoch": 2664} {"train_loss": -6.44196891784668, "global_step": 111923, "epoch": 2664} {"train_loss": -6.415117263793945, "global_step": 111924, "epoch": 2664} {"train_loss": -6.424694061279297, "global_step": 111925, "epoch": 2664} {"train_loss": -6.346010208129883, "global_step": 111926, "epoch": 2664} {"train_loss": -6.361760139465332, "global_step": 111927, "epoch": 2664} {"train_loss": -6.45876407623291, "global_step": 111928, "epoch": 2664} {"train_loss": -6.439472550437564, "global_step": 111929, "epoch": 2664, "val_loss": 67986.4140625} {"train_loss": -6.464254379272461, "global_step": 111930, "epoch": 2665} {"train_loss": -6.444997310638428, "global_step": 111931, "epoch": 2665} {"train_loss": -6.263784885406494, "global_step": 111932, "epoch": 2665} {"train_loss": -6.47934627532959, "global_step": 111933, "epoch": 2665} {"train_loss": -6.427887439727783, "global_step": 111934, "epoch": 2665} {"train_loss": -6.387136936187744, "global_step": 111935, "epoch": 2665} {"train_loss": -6.532095432281494, "global_step": 111936, "epoch": 2665} {"train_loss": -6.490904331207275, "global_step": 111937, "epoch": 2665} {"train_loss": -6.380939483642578, "global_step": 111938, "epoch": 2665} {"train_loss": -6.495263576507568, "global_step": 111939, "epoch": 2665} {"train_loss": -6.557258605957031, "global_step": 111940, "epoch": 2665} {"train_loss": -6.4450578689575195, "global_step": 111941, "epoch": 2665} {"train_loss": -6.3357672691345215, "global_step": 111942, "epoch": 2665} {"train_loss": -6.44205379486084, "global_step": 111943, "epoch": 2665} {"train_loss": -6.520323753356934, "global_step": 111944, "epoch": 2665} {"train_loss": -6.372535705566406, "global_step": 111945, "epoch": 2665} {"train_loss": -6.495047569274902, "global_step": 111946, "epoch": 2665} {"train_loss": -6.599908828735352, "global_step": 111947, "epoch": 2665} {"train_loss": -6.461014747619629, "global_step": 111948, "epoch": 2665} {"train_loss": -6.546167373657227, "global_step": 111949, "epoch": 2665} {"train_loss": -6.425890922546387, "global_step": 111950, "epoch": 2665} {"train_loss": -6.4340667724609375, "global_step": 111951, "epoch": 2665} {"train_loss": -6.5724005699157715, "global_step": 111952, "epoch": 2665} {"train_loss": -6.63290548324585, "global_step": 111953, "epoch": 2665} {"train_loss": -6.5637125968933105, "global_step": 111954, "epoch": 2665} {"train_loss": -6.431072235107422, "global_step": 111955, "epoch": 2665} {"train_loss": -6.486262321472168, "global_step": 111956, "epoch": 2665} {"train_loss": -6.489500999450684, "global_step": 111957, "epoch": 2665} {"train_loss": -6.508027076721191, "global_step": 111958, "epoch": 2665} {"train_loss": -6.506263732910156, "global_step": 111959, "epoch": 2665} {"train_loss": -6.411726474761963, "global_step": 111960, "epoch": 2665} {"train_loss": -6.391328811645508, "global_step": 111961, "epoch": 2665} {"train_loss": -6.48320198059082, "global_step": 111962, "epoch": 2665} {"train_loss": -6.356956481933594, "global_step": 111963, "epoch": 2665} {"train_loss": -6.458835601806641, "global_step": 111964, "epoch": 2665} {"train_loss": -6.356170177459717, "global_step": 111965, "epoch": 2665} {"train_loss": -6.4198899269104, "global_step": 111966, "epoch": 2665} {"train_loss": -6.515007019042969, "global_step": 111967, "epoch": 2665} {"train_loss": -6.374808311462402, "global_step": 111968, "epoch": 2665} {"train_loss": -6.225928783416748, "global_step": 111969, "epoch": 2665} {"train_loss": -6.508881568908691, "global_step": 111970, "epoch": 2665} {"train_loss": -6.455298015049526, "global_step": 111971, "epoch": 2665, "val_loss": 67690.4140625} {"train_loss": -6.460283279418945, "global_step": 111972, "epoch": 2666} {"train_loss": -6.453085899353027, "global_step": 111973, "epoch": 2666} {"train_loss": -6.229811668395996, "global_step": 111974, "epoch": 2666} {"train_loss": -6.495543479919434, "global_step": 111975, "epoch": 2666} {"train_loss": -6.3212361335754395, "global_step": 111976, "epoch": 2666} {"train_loss": -6.440009117126465, "global_step": 111977, "epoch": 2666} {"train_loss": -6.41449499130249, "global_step": 111978, "epoch": 2666} {"train_loss": -6.441822052001953, "global_step": 111979, "epoch": 2666} {"train_loss": -6.443920135498047, "global_step": 111980, "epoch": 2666} {"train_loss": -6.32124137878418, "global_step": 111981, "epoch": 2666} {"train_loss": -6.554632663726807, "global_step": 111982, "epoch": 2666} {"train_loss": -6.443746566772461, "global_step": 111983, "epoch": 2666} {"train_loss": -6.413471221923828, "global_step": 111984, "epoch": 2666} {"train_loss": -6.570953369140625, "global_step": 111985, "epoch": 2666} {"train_loss": -6.421808242797852, "global_step": 111986, "epoch": 2666} {"train_loss": -6.343332290649414, "global_step": 111987, "epoch": 2666} {"train_loss": -6.5376482009887695, "global_step": 111988, "epoch": 2666} {"train_loss": -6.3761138916015625, "global_step": 111989, "epoch": 2666} {"train_loss": -6.424330234527588, "global_step": 111990, "epoch": 2666} {"train_loss": -6.539254188537598, "global_step": 111991, "epoch": 2666} {"train_loss": -6.492769241333008, "global_step": 111992, "epoch": 2666} {"train_loss": -6.39510440826416, "global_step": 111993, "epoch": 2666} {"train_loss": -6.484799861907959, "global_step": 111994, "epoch": 2666} {"train_loss": -6.430880546569824, "global_step": 111995, "epoch": 2666} {"train_loss": -6.424213409423828, "global_step": 111996, "epoch": 2666} {"train_loss": -6.335106372833252, "global_step": 111997, "epoch": 2666} {"train_loss": -6.325634002685547, "global_step": 111998, "epoch": 2666} {"train_loss": -6.445472717285156, "global_step": 111999, "epoch": 2666} {"train_loss": -6.42098331451416, "global_step": 112000, "epoch": 2666} {"train_loss": -6.462728500366211, "global_step": 112001, "epoch": 2666} {"train_loss": -6.5064849853515625, "global_step": 112002, "epoch": 2666} {"train_loss": -6.424511909484863, "global_step": 112003, "epoch": 2666} {"train_loss": -6.5036211013793945, "global_step": 112004, "epoch": 2666} {"train_loss": -6.401993751525879, "global_step": 112005, "epoch": 2666} {"train_loss": -6.604559421539307, "global_step": 112006, "epoch": 2666} {"train_loss": -6.533193588256836, "global_step": 112007, "epoch": 2666} {"train_loss": -6.454532146453857, "global_step": 112008, "epoch": 2666} {"train_loss": -6.477964878082275, "global_step": 112009, "epoch": 2666} {"train_loss": -6.448369979858398, "global_step": 112010, "epoch": 2666} {"train_loss": -6.5157151222229, "global_step": 112011, "epoch": 2666} {"train_loss": -6.41201639175415, "global_step": 112012, "epoch": 2666} {"train_loss": -6.440579085122971, "global_step": 112013, "epoch": 2666, "val_loss": 67939.03125} {"train_loss": -6.434929370880127, "global_step": 112014, "epoch": 2667} {"train_loss": -6.412339210510254, "global_step": 112015, "epoch": 2667} {"train_loss": -6.415780067443848, "global_step": 112016, "epoch": 2667} {"train_loss": -6.501787185668945, "global_step": 112017, "epoch": 2667} {"train_loss": -6.412321090698242, "global_step": 112018, "epoch": 2667} {"train_loss": -6.433074951171875, "global_step": 112019, "epoch": 2667} {"train_loss": -6.447565078735352, "global_step": 112020, "epoch": 2667} {"train_loss": -6.499884605407715, "global_step": 112021, "epoch": 2667} {"train_loss": -6.418569564819336, "global_step": 112022, "epoch": 2667} {"train_loss": -6.496103286743164, "global_step": 112023, "epoch": 2667} {"train_loss": -6.550839900970459, "global_step": 112024, "epoch": 2667} {"train_loss": -6.536171913146973, "global_step": 112025, "epoch": 2667} {"train_loss": -6.350168704986572, "global_step": 112026, "epoch": 2667} {"train_loss": -6.435758590698242, "global_step": 112027, "epoch": 2667} {"train_loss": -6.53409481048584, "global_step": 112028, "epoch": 2667} {"train_loss": -6.2325639724731445, "global_step": 112029, "epoch": 2667} {"train_loss": -6.49448299407959, "global_step": 112030, "epoch": 2667} {"train_loss": -6.51576042175293, "global_step": 112031, "epoch": 2667} {"train_loss": -6.4102678298950195, "global_step": 112032, "epoch": 2667} {"train_loss": -6.397947311401367, "global_step": 112033, "epoch": 2667} {"train_loss": -6.462952136993408, "global_step": 112034, "epoch": 2667} {"train_loss": -6.606942653656006, "global_step": 112035, "epoch": 2667} {"train_loss": -6.446091651916504, "global_step": 112036, "epoch": 2667} {"train_loss": -6.475333213806152, "global_step": 112037, "epoch": 2667} {"train_loss": -6.408207893371582, "global_step": 112038, "epoch": 2667} {"train_loss": -6.52381706237793, "global_step": 112039, "epoch": 2667} {"train_loss": -6.476539611816406, "global_step": 112040, "epoch": 2667} {"train_loss": -6.444819927215576, "global_step": 112041, "epoch": 2667} {"train_loss": -6.2931976318359375, "global_step": 112042, "epoch": 2667} {"train_loss": -6.448513507843018, "global_step": 112043, "epoch": 2667} {"train_loss": -6.219143867492676, "global_step": 112044, "epoch": 2667} {"train_loss": -6.285069465637207, "global_step": 112045, "epoch": 2667} {"train_loss": -6.336117267608643, "global_step": 112046, "epoch": 2667} {"train_loss": -6.357054233551025, "global_step": 112047, "epoch": 2667} {"train_loss": -6.30865478515625, "global_step": 112048, "epoch": 2667} {"train_loss": -6.369898796081543, "global_step": 112049, "epoch": 2667} {"train_loss": -6.359585285186768, "global_step": 112050, "epoch": 2667} {"train_loss": -6.3134846687316895, "global_step": 112051, "epoch": 2667} {"train_loss": -6.373574256896973, "global_step": 112052, "epoch": 2667} {"train_loss": -6.389050483703613, "global_step": 112053, "epoch": 2667} {"train_loss": -6.350366592407227, "global_step": 112054, "epoch": 2667} {"train_loss": -6.418171087900798, "global_step": 112055, "epoch": 2667, "val_loss": 67918.140625} {"train_loss": -6.462841987609863, "global_step": 112056, "epoch": 2668} {"train_loss": -6.519496917724609, "global_step": 112057, "epoch": 2668} {"train_loss": -6.399974822998047, "global_step": 112058, "epoch": 2668} {"train_loss": -6.5068159103393555, "global_step": 112059, "epoch": 2668} {"train_loss": -6.4666924476623535, "global_step": 112060, "epoch": 2668} {"train_loss": -6.365574836730957, "global_step": 112061, "epoch": 2668} {"train_loss": -6.480249404907227, "global_step": 112062, "epoch": 2668} {"train_loss": -6.449491500854492, "global_step": 112063, "epoch": 2668} {"train_loss": -6.4617815017700195, "global_step": 112064, "epoch": 2668} {"train_loss": -6.501256942749023, "global_step": 112065, "epoch": 2668} {"train_loss": -6.521448135375977, "global_step": 112066, "epoch": 2668} {"train_loss": -6.507042407989502, "global_step": 112067, "epoch": 2668} {"train_loss": -6.535017013549805, "global_step": 112068, "epoch": 2668} {"train_loss": -6.495965003967285, "global_step": 112069, "epoch": 2668} {"train_loss": -6.500535488128662, "global_step": 112070, "epoch": 2668} {"train_loss": -6.318402290344238, "global_step": 112071, "epoch": 2668} {"train_loss": -6.475788116455078, "global_step": 112072, "epoch": 2668} {"train_loss": -6.437099933624268, "global_step": 112073, "epoch": 2668} {"train_loss": -6.502740859985352, "global_step": 112074, "epoch": 2668} {"train_loss": -6.48879337310791, "global_step": 112075, "epoch": 2668} {"train_loss": -6.566349029541016, "global_step": 112076, "epoch": 2668} {"train_loss": -6.425162315368652, "global_step": 112077, "epoch": 2668} {"train_loss": -6.643816947937012, "global_step": 112078, "epoch": 2668} {"train_loss": -6.5443243980407715, "global_step": 112079, "epoch": 2668} {"train_loss": -6.525569915771484, "global_step": 112080, "epoch": 2668} {"train_loss": -6.450553894042969, "global_step": 112081, "epoch": 2668} {"train_loss": -6.436692714691162, "global_step": 112082, "epoch": 2668} {"train_loss": -6.540622711181641, "global_step": 112083, "epoch": 2668} {"train_loss": -6.503774166107178, "global_step": 112084, "epoch": 2668} {"train_loss": -6.465899467468262, "global_step": 112085, "epoch": 2668} {"train_loss": -6.546679496765137, "global_step": 112086, "epoch": 2668} {"train_loss": -6.515316486358643, "global_step": 112087, "epoch": 2668} {"train_loss": -6.533323764801025, "global_step": 112088, "epoch": 2668} {"train_loss": -6.573095798492432, "global_step": 112089, "epoch": 2668} {"train_loss": -6.45424747467041, "global_step": 112090, "epoch": 2668} {"train_loss": -6.447359561920166, "global_step": 112091, "epoch": 2668} {"train_loss": -6.363138198852539, "global_step": 112092, "epoch": 2668} {"train_loss": -6.580179691314697, "global_step": 112093, "epoch": 2668} {"train_loss": -6.527398109436035, "global_step": 112094, "epoch": 2668} {"train_loss": -6.539699554443359, "global_step": 112095, "epoch": 2668} {"train_loss": -6.477021217346191, "global_step": 112096, "epoch": 2668} {"train_loss": -6.488876081648327, "global_step": 112097, "epoch": 2668, "val_loss": 67804.9375} {"train_loss": -6.541045665740967, "global_step": 112098, "epoch": 2669} {"train_loss": -6.414618492126465, "global_step": 112099, "epoch": 2669} {"train_loss": -6.525238990783691, "global_step": 112100, "epoch": 2669} {"train_loss": -6.477145671844482, "global_step": 112101, "epoch": 2669} {"train_loss": -6.546199798583984, "global_step": 112102, "epoch": 2669} {"train_loss": -6.501229763031006, "global_step": 112103, "epoch": 2669} {"train_loss": -6.584516525268555, "global_step": 112104, "epoch": 2669} {"train_loss": -6.4354424476623535, "global_step": 112105, "epoch": 2669} {"train_loss": -6.408531665802002, "global_step": 112106, "epoch": 2669} {"train_loss": -6.637104511260986, "global_step": 112107, "epoch": 2669} {"train_loss": -6.4396562576293945, "global_step": 112108, "epoch": 2669} {"train_loss": -6.49106502532959, "global_step": 112109, "epoch": 2669} {"train_loss": -6.416173458099365, "global_step": 112110, "epoch": 2669} {"train_loss": -6.421086311340332, "global_step": 112111, "epoch": 2669} {"train_loss": -6.413167953491211, "global_step": 112112, "epoch": 2669} {"train_loss": -6.484250545501709, "global_step": 112113, "epoch": 2669} {"train_loss": -6.428682327270508, "global_step": 112114, "epoch": 2669} {"train_loss": -6.606743812561035, "global_step": 112115, "epoch": 2669} {"train_loss": -6.53116512298584, "global_step": 112116, "epoch": 2669} {"train_loss": -6.440628528594971, "global_step": 112117, "epoch": 2669} {"train_loss": -6.466711044311523, "global_step": 112118, "epoch": 2669} {"train_loss": -6.427922248840332, "global_step": 112119, "epoch": 2669} {"train_loss": -6.369296073913574, "global_step": 112120, "epoch": 2669} {"train_loss": -6.416721820831299, "global_step": 112121, "epoch": 2669} {"train_loss": -6.48614501953125, "global_step": 112122, "epoch": 2669} {"train_loss": -6.427742958068848, "global_step": 112123, "epoch": 2669} {"train_loss": -6.46302604675293, "global_step": 112124, "epoch": 2669} {"train_loss": -6.434439659118652, "global_step": 112125, "epoch": 2669} {"train_loss": -6.408498287200928, "global_step": 112126, "epoch": 2669} {"train_loss": -6.35628604888916, "global_step": 112127, "epoch": 2669} {"train_loss": -6.516404151916504, "global_step": 112128, "epoch": 2669} {"train_loss": -6.417263031005859, "global_step": 112129, "epoch": 2669} {"train_loss": -6.495197296142578, "global_step": 112130, "epoch": 2669} {"train_loss": -6.502079486846924, "global_step": 112131, "epoch": 2669} {"train_loss": -6.414125919342041, "global_step": 112132, "epoch": 2669} {"train_loss": -6.5311479568481445, "global_step": 112133, "epoch": 2669} {"train_loss": -6.384315490722656, "global_step": 112134, "epoch": 2669} {"train_loss": -6.420889854431152, "global_step": 112135, "epoch": 2669} {"train_loss": -6.4894609451293945, "global_step": 112136, "epoch": 2669} {"train_loss": -6.275904655456543, "global_step": 112137, "epoch": 2669} {"train_loss": -6.389688491821289, "global_step": 112138, "epoch": 2669} {"train_loss": -6.458362636112032, "global_step": 112139, "epoch": 2669, "val_loss": 68030.5390625} {"train_loss": -6.390726089477539, "global_step": 112140, "epoch": 2670} {"train_loss": -6.461383819580078, "global_step": 112141, "epoch": 2670} {"train_loss": -6.510350227355957, "global_step": 112142, "epoch": 2670} {"train_loss": -6.6096343994140625, "global_step": 112143, "epoch": 2670} {"train_loss": -6.434571266174316, "global_step": 112144, "epoch": 2670} {"train_loss": -6.43626070022583, "global_step": 112145, "epoch": 2670} {"train_loss": -6.459578990936279, "global_step": 112146, "epoch": 2670} {"train_loss": -6.58601188659668, "global_step": 112147, "epoch": 2670} {"train_loss": -6.474600315093994, "global_step": 112148, "epoch": 2670} {"train_loss": -6.536628246307373, "global_step": 112149, "epoch": 2670} {"train_loss": -6.518853187561035, "global_step": 112150, "epoch": 2670} {"train_loss": -6.466556549072266, "global_step": 112151, "epoch": 2670} {"train_loss": -6.434214115142822, "global_step": 112152, "epoch": 2670} {"train_loss": -6.438236236572266, "global_step": 112153, "epoch": 2670} {"train_loss": -6.5156707763671875, "global_step": 112154, "epoch": 2670} {"train_loss": -6.428495407104492, "global_step": 112155, "epoch": 2670} {"train_loss": -6.344053268432617, "global_step": 112156, "epoch": 2670} {"train_loss": -6.558053970336914, "global_step": 112157, "epoch": 2670} {"train_loss": -6.529772758483887, "global_step": 112158, "epoch": 2670} {"train_loss": -6.517910957336426, "global_step": 112159, "epoch": 2670} {"train_loss": -6.457798957824707, "global_step": 112160, "epoch": 2670} {"train_loss": -6.355809211730957, "global_step": 112161, "epoch": 2670} {"train_loss": -6.404289245605469, "global_step": 112162, "epoch": 2670} {"train_loss": -6.536646842956543, "global_step": 112163, "epoch": 2670} {"train_loss": -6.531527996063232, "global_step": 112164, "epoch": 2670} {"train_loss": -6.4560866355896, "global_step": 112165, "epoch": 2670} {"train_loss": -6.443069934844971, "global_step": 112166, "epoch": 2670} {"train_loss": -6.445244789123535, "global_step": 112167, "epoch": 2670} {"train_loss": -6.471871852874756, "global_step": 112168, "epoch": 2670} {"train_loss": -6.525206565856934, "global_step": 112169, "epoch": 2670} {"train_loss": -6.5438032150268555, "global_step": 112170, "epoch": 2670} {"train_loss": -6.412140846252441, "global_step": 112171, "epoch": 2670} {"train_loss": -6.564751625061035, "global_step": 112172, "epoch": 2670} {"train_loss": -6.4899678230285645, "global_step": 112173, "epoch": 2670} {"train_loss": -6.582381248474121, "global_step": 112174, "epoch": 2670} {"train_loss": -6.62605619430542, "global_step": 112175, "epoch": 2670} {"train_loss": -6.452054500579834, "global_step": 112176, "epoch": 2670} {"train_loss": -6.535357475280762, "global_step": 112177, "epoch": 2670} {"train_loss": -6.520963668823242, "global_step": 112178, "epoch": 2670} {"train_loss": -6.476205825805664, "global_step": 112179, "epoch": 2670} {"train_loss": -6.512722492218018, "global_step": 112180, "epoch": 2670} {"train_loss": -6.488787446703229, "global_step": 112181, "epoch": 2670, "val_loss": 68171.09375} {"train_loss": -6.325183391571045, "global_step": 112182, "epoch": 2671} {"train_loss": -6.547787189483643, "global_step": 112183, "epoch": 2671} {"train_loss": -6.556060314178467, "global_step": 112184, "epoch": 2671} {"train_loss": -6.397015571594238, "global_step": 112185, "epoch": 2671} {"train_loss": -6.500962734222412, "global_step": 112186, "epoch": 2671} {"train_loss": -6.512640476226807, "global_step": 112187, "epoch": 2671} {"train_loss": -6.3975067138671875, "global_step": 112188, "epoch": 2671} {"train_loss": -6.446567535400391, "global_step": 112189, "epoch": 2671} {"train_loss": -6.503783226013184, "global_step": 112190, "epoch": 2671} {"train_loss": -6.471289157867432, "global_step": 112191, "epoch": 2671} {"train_loss": -6.509652137756348, "global_step": 112192, "epoch": 2671} {"train_loss": -6.477558135986328, "global_step": 112193, "epoch": 2671} {"train_loss": -6.509134292602539, "global_step": 112194, "epoch": 2671} {"train_loss": -6.564557075500488, "global_step": 112195, "epoch": 2671} {"train_loss": -6.5986738204956055, "global_step": 112196, "epoch": 2671} {"train_loss": -6.374582290649414, "global_step": 112197, "epoch": 2671} {"train_loss": -6.465524673461914, "global_step": 112198, "epoch": 2671} {"train_loss": -6.51596212387085, "global_step": 112199, "epoch": 2671} {"train_loss": -6.53745174407959, "global_step": 112200, "epoch": 2671} {"train_loss": -6.564536094665527, "global_step": 112201, "epoch": 2671} {"train_loss": -6.475302696228027, "global_step": 112202, "epoch": 2671} {"train_loss": -6.55781364440918, "global_step": 112203, "epoch": 2671} {"train_loss": -6.482246398925781, "global_step": 112204, "epoch": 2671} {"train_loss": -6.519069671630859, "global_step": 112205, "epoch": 2671} {"train_loss": -6.686560153961182, "global_step": 112206, "epoch": 2671} {"train_loss": -6.471521377563477, "global_step": 112207, "epoch": 2671} {"train_loss": -6.500595569610596, "global_step": 112208, "epoch": 2671} {"train_loss": -6.427644729614258, "global_step": 112209, "epoch": 2671} {"train_loss": -6.504203796386719, "global_step": 112210, "epoch": 2671} {"train_loss": -6.547628402709961, "global_step": 112211, "epoch": 2671} {"train_loss": -6.491310119628906, "global_step": 112212, "epoch": 2671} {"train_loss": -6.3855695724487305, "global_step": 112213, "epoch": 2671} {"train_loss": -6.379862308502197, "global_step": 112214, "epoch": 2671} {"train_loss": -6.538041591644287, "global_step": 112215, "epoch": 2671} {"train_loss": -6.438229560852051, "global_step": 112216, "epoch": 2671} {"train_loss": -6.248344421386719, "global_step": 112217, "epoch": 2671} {"train_loss": -6.477949142456055, "global_step": 112218, "epoch": 2671} {"train_loss": -6.4362406730651855, "global_step": 112219, "epoch": 2671} {"train_loss": -6.437032699584961, "global_step": 112220, "epoch": 2671} {"train_loss": -6.295711517333984, "global_step": 112221, "epoch": 2671} {"train_loss": -6.480293273925781, "global_step": 112222, "epoch": 2671} {"train_loss": -6.473561457225254, "global_step": 112223, "epoch": 2671, "val_loss": 67759.625} {"train_loss": -6.373732089996338, "global_step": 112224, "epoch": 2672} {"train_loss": -6.440657615661621, "global_step": 112225, "epoch": 2672} {"train_loss": -6.565666198730469, "global_step": 112226, "epoch": 2672} {"train_loss": -6.521485805511475, "global_step": 112227, "epoch": 2672} {"train_loss": -6.472019195556641, "global_step": 112228, "epoch": 2672} {"train_loss": -6.505307197570801, "global_step": 112229, "epoch": 2672} {"train_loss": -6.462062358856201, "global_step": 112230, "epoch": 2672} {"train_loss": -6.355993270874023, "global_step": 112231, "epoch": 2672} {"train_loss": -6.457070350646973, "global_step": 112232, "epoch": 2672} {"train_loss": -6.509926795959473, "global_step": 112233, "epoch": 2672} {"train_loss": -6.491419792175293, "global_step": 112234, "epoch": 2672} {"train_loss": -6.509562969207764, "global_step": 112235, "epoch": 2672} {"train_loss": -6.476561546325684, "global_step": 112236, "epoch": 2672} {"train_loss": -6.472769260406494, "global_step": 112237, "epoch": 2672} {"train_loss": -6.543257713317871, "global_step": 112238, "epoch": 2672} {"train_loss": -6.447844982147217, "global_step": 112239, "epoch": 2672} {"train_loss": -6.377523422241211, "global_step": 112240, "epoch": 2672} {"train_loss": -6.578329086303711, "global_step": 112241, "epoch": 2672} {"train_loss": -6.455299377441406, "global_step": 112242, "epoch": 2672} {"train_loss": -6.579961776733398, "global_step": 112243, "epoch": 2672} {"train_loss": -6.394976615905762, "global_step": 112244, "epoch": 2672} {"train_loss": -6.398082733154297, "global_step": 112245, "epoch": 2672} {"train_loss": -6.3611226081848145, "global_step": 112246, "epoch": 2672} {"train_loss": -6.447271347045898, "global_step": 112247, "epoch": 2672} {"train_loss": -6.402256011962891, "global_step": 112248, "epoch": 2672} {"train_loss": -6.439655780792236, "global_step": 112249, "epoch": 2672} {"train_loss": -6.401800632476807, "global_step": 112250, "epoch": 2672} {"train_loss": -6.370436668395996, "global_step": 112251, "epoch": 2672} {"train_loss": -6.424504280090332, "global_step": 112252, "epoch": 2672} {"train_loss": -6.389522552490234, "global_step": 112253, "epoch": 2672} {"train_loss": -6.451194763183594, "global_step": 112254, "epoch": 2672} {"train_loss": -6.497457504272461, "global_step": 112255, "epoch": 2672} {"train_loss": -6.390892028808594, "global_step": 112256, "epoch": 2672} {"train_loss": -6.43474006652832, "global_step": 112257, "epoch": 2672} {"train_loss": -6.428664207458496, "global_step": 112258, "epoch": 2672} {"train_loss": -6.489550590515137, "global_step": 112259, "epoch": 2672} {"train_loss": -6.300579071044922, "global_step": 112260, "epoch": 2672} {"train_loss": -6.312182426452637, "global_step": 112261, "epoch": 2672} {"train_loss": -6.372570991516113, "global_step": 112262, "epoch": 2672} {"train_loss": -6.42559814453125, "global_step": 112263, "epoch": 2672} {"train_loss": -6.429019451141357, "global_step": 112264, "epoch": 2672} {"train_loss": -6.444453659511748, "global_step": 112265, "epoch": 2672, "val_loss": 67731.96875} {"train_loss": -6.440102577209473, "global_step": 112266, "epoch": 2673} {"train_loss": -6.3784332275390625, "global_step": 112267, "epoch": 2673} {"train_loss": -6.347198963165283, "global_step": 112268, "epoch": 2673} {"train_loss": -6.368083953857422, "global_step": 112269, "epoch": 2673} {"train_loss": -6.485539436340332, "global_step": 112270, "epoch": 2673} {"train_loss": -6.523040771484375, "global_step": 112271, "epoch": 2673} {"train_loss": -6.467474937438965, "global_step": 112272, "epoch": 2673} {"train_loss": -6.458285808563232, "global_step": 112273, "epoch": 2673} {"train_loss": -6.501962184906006, "global_step": 112274, "epoch": 2673} {"train_loss": -6.473971366882324, "global_step": 112275, "epoch": 2673} {"train_loss": -6.444911003112793, "global_step": 112276, "epoch": 2673} {"train_loss": -6.489285945892334, "global_step": 112277, "epoch": 2673} {"train_loss": -6.488460540771484, "global_step": 112278, "epoch": 2673} {"train_loss": -6.289952278137207, "global_step": 112279, "epoch": 2673} {"train_loss": -6.488821029663086, "global_step": 112280, "epoch": 2673} {"train_loss": -6.419219017028809, "global_step": 112281, "epoch": 2673} {"train_loss": -6.384906768798828, "global_step": 112282, "epoch": 2673} {"train_loss": -6.4947829246521, "global_step": 112283, "epoch": 2673} {"train_loss": -6.467293739318848, "global_step": 112284, "epoch": 2673} {"train_loss": -6.425353050231934, "global_step": 112285, "epoch": 2673} {"train_loss": -6.330820560455322, "global_step": 112286, "epoch": 2673} {"train_loss": -6.468868255615234, "global_step": 112287, "epoch": 2673} {"train_loss": -6.483983993530273, "global_step": 112288, "epoch": 2673} {"train_loss": -6.41985559463501, "global_step": 112289, "epoch": 2673} {"train_loss": -6.549996852874756, "global_step": 112290, "epoch": 2673} {"train_loss": -6.447698593139648, "global_step": 112291, "epoch": 2673} {"train_loss": -6.447188854217529, "global_step": 112292, "epoch": 2673} {"train_loss": -6.484446048736572, "global_step": 112293, "epoch": 2673} {"train_loss": -6.463963031768799, "global_step": 112294, "epoch": 2673} {"train_loss": -6.482447147369385, "global_step": 112295, "epoch": 2673} {"train_loss": -6.586256504058838, "global_step": 112296, "epoch": 2673} {"train_loss": -6.419744491577148, "global_step": 112297, "epoch": 2673} {"train_loss": -6.519320011138916, "global_step": 112298, "epoch": 2673} {"train_loss": -6.537065029144287, "global_step": 112299, "epoch": 2673} {"train_loss": -6.377086639404297, "global_step": 112300, "epoch": 2673} {"train_loss": -6.3609724044799805, "global_step": 112301, "epoch": 2673} {"train_loss": -6.488237380981445, "global_step": 112302, "epoch": 2673} {"train_loss": -6.475586891174316, "global_step": 112303, "epoch": 2673} {"train_loss": -6.411252021789551, "global_step": 112304, "epoch": 2673} {"train_loss": -6.436368942260742, "global_step": 112305, "epoch": 2673} {"train_loss": -6.448119640350342, "global_step": 112306, "epoch": 2673} {"train_loss": -6.451531523749942, "global_step": 112307, "epoch": 2673, "val_loss": 67899.359375} {"train_loss": -6.429845333099365, "global_step": 112308, "epoch": 2674} {"train_loss": -6.516404151916504, "global_step": 112309, "epoch": 2674} {"train_loss": -6.491208553314209, "global_step": 112310, "epoch": 2674} {"train_loss": -6.475606441497803, "global_step": 112311, "epoch": 2674} {"train_loss": -6.462925910949707, "global_step": 112312, "epoch": 2674} {"train_loss": -6.458235740661621, "global_step": 112313, "epoch": 2674} {"train_loss": -6.387099266052246, "global_step": 112314, "epoch": 2674} {"train_loss": -6.410582542419434, "global_step": 112315, "epoch": 2674} {"train_loss": -6.475714206695557, "global_step": 112316, "epoch": 2674} {"train_loss": -6.484874725341797, "global_step": 112317, "epoch": 2674} {"train_loss": -6.421952247619629, "global_step": 112318, "epoch": 2674} {"train_loss": -6.451874732971191, "global_step": 112319, "epoch": 2674} {"train_loss": -6.449974060058594, "global_step": 112320, "epoch": 2674} {"train_loss": -6.518989562988281, "global_step": 112321, "epoch": 2674} {"train_loss": -6.388708114624023, "global_step": 112322, "epoch": 2674} {"train_loss": -6.48408317565918, "global_step": 112323, "epoch": 2674} {"train_loss": -6.579407691955566, "global_step": 112324, "epoch": 2674} {"train_loss": -6.478574752807617, "global_step": 112325, "epoch": 2674} {"train_loss": -6.423995018005371, "global_step": 112326, "epoch": 2674} {"train_loss": -6.454259395599365, "global_step": 112327, "epoch": 2674} {"train_loss": -6.416036128997803, "global_step": 112328, "epoch": 2674} {"train_loss": -6.5046610832214355, "global_step": 112329, "epoch": 2674} {"train_loss": -6.56217622756958, "global_step": 112330, "epoch": 2674} {"train_loss": -6.500827312469482, "global_step": 112331, "epoch": 2674} {"train_loss": -6.434433460235596, "global_step": 112332, "epoch": 2674} {"train_loss": -6.520566463470459, "global_step": 112333, "epoch": 2674} {"train_loss": -6.583128452301025, "global_step": 112334, "epoch": 2674} {"train_loss": -6.4997477531433105, "global_step": 112335, "epoch": 2674} {"train_loss": -6.596673965454102, "global_step": 112336, "epoch": 2674} {"train_loss": -6.586825370788574, "global_step": 112337, "epoch": 2674} {"train_loss": -6.491635322570801, "global_step": 112338, "epoch": 2674} {"train_loss": -6.473852157592773, "global_step": 112339, "epoch": 2674} {"train_loss": -6.400184631347656, "global_step": 112340, "epoch": 2674} {"train_loss": -6.479475975036621, "global_step": 112341, "epoch": 2674} {"train_loss": -6.473114967346191, "global_step": 112342, "epoch": 2674} {"train_loss": -6.368077754974365, "global_step": 112343, "epoch": 2674} {"train_loss": -6.505759239196777, "global_step": 112344, "epoch": 2674} {"train_loss": -6.461543083190918, "global_step": 112345, "epoch": 2674} {"train_loss": -6.393429756164551, "global_step": 112346, "epoch": 2674} {"train_loss": -6.524264812469482, "global_step": 112347, "epoch": 2674} {"train_loss": -6.4042534828186035, "global_step": 112348, "epoch": 2674} {"train_loss": -6.471792414074852, "global_step": 112349, "epoch": 2674, "val_loss": 67967.6796875} {"train_loss": -6.424941062927246, "global_step": 112350, "epoch": 2675} {"train_loss": -6.560638904571533, "global_step": 112351, "epoch": 2675} {"train_loss": -6.508785724639893, "global_step": 112352, "epoch": 2675} {"train_loss": -6.456464767456055, "global_step": 112353, "epoch": 2675} {"train_loss": -6.579113960266113, "global_step": 112354, "epoch": 2675} {"train_loss": -6.57014274597168, "global_step": 112355, "epoch": 2675} {"train_loss": -6.439842224121094, "global_step": 112356, "epoch": 2675} {"train_loss": -6.463859558105469, "global_step": 112357, "epoch": 2675} {"train_loss": -6.541701793670654, "global_step": 112358, "epoch": 2675} {"train_loss": -6.442564964294434, "global_step": 112359, "epoch": 2675} {"train_loss": -6.565223693847656, "global_step": 112360, "epoch": 2675} {"train_loss": -6.452845573425293, "global_step": 112361, "epoch": 2675} {"train_loss": -6.373592376708984, "global_step": 112362, "epoch": 2675} {"train_loss": -6.468529224395752, "global_step": 112363, "epoch": 2675} {"train_loss": -6.513000011444092, "global_step": 112364, "epoch": 2675} {"train_loss": -6.572707176208496, "global_step": 112365, "epoch": 2675} {"train_loss": -6.546614170074463, "global_step": 112366, "epoch": 2675} {"train_loss": -6.513974666595459, "global_step": 112367, "epoch": 2675} {"train_loss": -6.443760871887207, "global_step": 112368, "epoch": 2675} {"train_loss": -6.452660083770752, "global_step": 112369, "epoch": 2675} {"train_loss": -6.385179042816162, "global_step": 112370, "epoch": 2675} {"train_loss": -6.590181827545166, "global_step": 112371, "epoch": 2675} {"train_loss": -6.5201215744018555, "global_step": 112372, "epoch": 2675} {"train_loss": -6.577727317810059, "global_step": 112373, "epoch": 2675} {"train_loss": -6.430498123168945, "global_step": 112374, "epoch": 2675} {"train_loss": -6.529447555541992, "global_step": 112375, "epoch": 2675} {"train_loss": -6.523963928222656, "global_step": 112376, "epoch": 2675} {"train_loss": -6.5172295570373535, "global_step": 112377, "epoch": 2675} {"train_loss": -6.529049873352051, "global_step": 112378, "epoch": 2675} {"train_loss": -6.354170799255371, "global_step": 112379, "epoch": 2675} {"train_loss": -6.390057563781738, "global_step": 112380, "epoch": 2675} {"train_loss": -6.456056594848633, "global_step": 112381, "epoch": 2675} {"train_loss": -6.549054145812988, "global_step": 112382, "epoch": 2675} {"train_loss": -6.582934856414795, "global_step": 112383, "epoch": 2675} {"train_loss": -6.4624104499816895, "global_step": 112384, "epoch": 2675} {"train_loss": -6.358942985534668, "global_step": 112385, "epoch": 2675} {"train_loss": -6.4596052169799805, "global_step": 112386, "epoch": 2675} {"train_loss": -6.47932243347168, "global_step": 112387, "epoch": 2675} {"train_loss": -6.542075157165527, "global_step": 112388, "epoch": 2675} {"train_loss": -6.457024574279785, "global_step": 112389, "epoch": 2675} {"train_loss": -6.411298751831055, "global_step": 112390, "epoch": 2675} {"train_loss": -6.484959704535348, "global_step": 112391, "epoch": 2675, "val_loss": 67768.5625} {"train_loss": -6.472908020019531, "global_step": 112392, "epoch": 2676} {"train_loss": -6.4025959968566895, "global_step": 112393, "epoch": 2676} {"train_loss": -6.383508682250977, "global_step": 112394, "epoch": 2676} {"train_loss": -6.477062702178955, "global_step": 112395, "epoch": 2676} {"train_loss": -6.365206718444824, "global_step": 112396, "epoch": 2676} {"train_loss": -6.423998832702637, "global_step": 112397, "epoch": 2676} {"train_loss": -6.358510494232178, "global_step": 112398, "epoch": 2676} {"train_loss": -6.290952205657959, "global_step": 112399, "epoch": 2676} {"train_loss": -6.513697624206543, "global_step": 112400, "epoch": 2676} {"train_loss": -6.37959098815918, "global_step": 112401, "epoch": 2676} {"train_loss": -6.306323528289795, "global_step": 112402, "epoch": 2676} {"train_loss": -6.298369884490967, "global_step": 112403, "epoch": 2676} {"train_loss": -6.424347877502441, "global_step": 112404, "epoch": 2676} {"train_loss": -6.492685317993164, "global_step": 112405, "epoch": 2676} {"train_loss": -6.367546081542969, "global_step": 112406, "epoch": 2676} {"train_loss": -6.331581115722656, "global_step": 112407, "epoch": 2676} {"train_loss": -6.275737762451172, "global_step": 112408, "epoch": 2676} {"train_loss": -6.363241195678711, "global_step": 112409, "epoch": 2676} {"train_loss": -6.480110168457031, "global_step": 112410, "epoch": 2676} {"train_loss": -6.518128395080566, "global_step": 112411, "epoch": 2676} {"train_loss": -6.49628210067749, "global_step": 112412, "epoch": 2676} {"train_loss": -6.415171146392822, "global_step": 112413, "epoch": 2676} {"train_loss": -6.534019947052002, "global_step": 112414, "epoch": 2676} {"train_loss": -6.542187690734863, "global_step": 112415, "epoch": 2676} {"train_loss": -6.455729007720947, "global_step": 112416, "epoch": 2676} {"train_loss": -6.474214553833008, "global_step": 112417, "epoch": 2676} {"train_loss": -6.510369777679443, "global_step": 112418, "epoch": 2676} {"train_loss": -6.475430488586426, "global_step": 112419, "epoch": 2676} {"train_loss": -6.619150638580322, "global_step": 112420, "epoch": 2676} {"train_loss": -6.452768325805664, "global_step": 112421, "epoch": 2676} {"train_loss": -6.426953315734863, "global_step": 112422, "epoch": 2676} {"train_loss": -6.484405040740967, "global_step": 112423, "epoch": 2676} {"train_loss": -6.420441627502441, "global_step": 112424, "epoch": 2676} {"train_loss": -6.398890495300293, "global_step": 112425, "epoch": 2676} {"train_loss": -6.559841632843018, "global_step": 112426, "epoch": 2676} {"train_loss": -6.477723121643066, "global_step": 112427, "epoch": 2676} {"train_loss": -6.539752006530762, "global_step": 112428, "epoch": 2676} {"train_loss": -6.508011817932129, "global_step": 112429, "epoch": 2676} {"train_loss": -6.371718883514404, "global_step": 112430, "epoch": 2676} {"train_loss": -6.452574253082275, "global_step": 112431, "epoch": 2676} {"train_loss": -6.413915634155273, "global_step": 112432, "epoch": 2676} {"train_loss": -6.437446457999093, "global_step": 112433, "epoch": 2676, "val_loss": 67932.8125} {"train_loss": -6.57219123840332, "global_step": 112434, "epoch": 2677} {"train_loss": -6.450887680053711, "global_step": 112435, "epoch": 2677} {"train_loss": -6.435070037841797, "global_step": 112436, "epoch": 2677} {"train_loss": -6.597962379455566, "global_step": 112437, "epoch": 2677} {"train_loss": -6.529415607452393, "global_step": 112438, "epoch": 2677} {"train_loss": -6.478060245513916, "global_step": 112439, "epoch": 2677} {"train_loss": -6.513144493103027, "global_step": 112440, "epoch": 2677} {"train_loss": -6.422702789306641, "global_step": 112441, "epoch": 2677} {"train_loss": -6.453523635864258, "global_step": 112442, "epoch": 2677} {"train_loss": -6.342223644256592, "global_step": 112443, "epoch": 2677} {"train_loss": -6.487616539001465, "global_step": 112444, "epoch": 2677} {"train_loss": -6.535844802856445, "global_step": 112445, "epoch": 2677} {"train_loss": -6.485133647918701, "global_step": 112446, "epoch": 2677} {"train_loss": -6.4435343742370605, "global_step": 112447, "epoch": 2677} {"train_loss": -6.5670318603515625, "global_step": 112448, "epoch": 2677} {"train_loss": -6.522013187408447, "global_step": 112449, "epoch": 2677} {"train_loss": -6.498331069946289, "global_step": 112450, "epoch": 2677} {"train_loss": -6.386638641357422, "global_step": 112451, "epoch": 2677} {"train_loss": -6.353545188903809, "global_step": 112452, "epoch": 2677} {"train_loss": -6.408536911010742, "global_step": 112453, "epoch": 2677} {"train_loss": -6.522769927978516, "global_step": 112454, "epoch": 2677} {"train_loss": -6.236273288726807, "global_step": 112455, "epoch": 2677} {"train_loss": -6.45415735244751, "global_step": 112456, "epoch": 2677} {"train_loss": -6.424749374389648, "global_step": 112457, "epoch": 2677} {"train_loss": -6.467264175415039, "global_step": 112458, "epoch": 2677} {"train_loss": -6.403031349182129, "global_step": 112459, "epoch": 2677} {"train_loss": -6.429606914520264, "global_step": 112460, "epoch": 2677} {"train_loss": -6.4012322425842285, "global_step": 112461, "epoch": 2677} {"train_loss": -6.283349990844727, "global_step": 112462, "epoch": 2677} {"train_loss": -6.6912055015563965, "global_step": 112463, "epoch": 2677} {"train_loss": -6.368703365325928, "global_step": 112464, "epoch": 2677} {"train_loss": -6.357390880584717, "global_step": 112465, "epoch": 2677} {"train_loss": -6.531744956970215, "global_step": 112466, "epoch": 2677} {"train_loss": -6.3350725173950195, "global_step": 112467, "epoch": 2677} {"train_loss": -6.45571756362915, "global_step": 112468, "epoch": 2677} {"train_loss": -6.504917144775391, "global_step": 112469, "epoch": 2677} {"train_loss": -6.400038242340088, "global_step": 112470, "epoch": 2677} {"train_loss": -6.492382049560547, "global_step": 112471, "epoch": 2677} {"train_loss": -6.493613243103027, "global_step": 112472, "epoch": 2677} {"train_loss": -6.457157135009766, "global_step": 112473, "epoch": 2677} {"train_loss": -6.322590351104736, "global_step": 112474, "epoch": 2677} {"train_loss": -6.449444180443173, "global_step": 112475, "epoch": 2677, "val_loss": 67824.140625} {"train_loss": -6.413044452667236, "global_step": 112476, "epoch": 2678} {"train_loss": -6.532038688659668, "global_step": 112477, "epoch": 2678} {"train_loss": -6.538527011871338, "global_step": 112478, "epoch": 2678} {"train_loss": -6.528636455535889, "global_step": 112479, "epoch": 2678} {"train_loss": -6.508237838745117, "global_step": 112480, "epoch": 2678} {"train_loss": -6.6159868240356445, "global_step": 112481, "epoch": 2678} {"train_loss": -6.491335868835449, "global_step": 112482, "epoch": 2678} {"train_loss": -6.397028923034668, "global_step": 112483, "epoch": 2678} {"train_loss": -6.576918601989746, "global_step": 112484, "epoch": 2678} {"train_loss": -6.540012836456299, "global_step": 112485, "epoch": 2678} {"train_loss": -6.537479400634766, "global_step": 112486, "epoch": 2678} {"train_loss": -6.539309024810791, "global_step": 112487, "epoch": 2678} {"train_loss": -6.507107734680176, "global_step": 112488, "epoch": 2678} {"train_loss": -6.450736999511719, "global_step": 112489, "epoch": 2678} {"train_loss": -6.442452430725098, "global_step": 112490, "epoch": 2678} {"train_loss": -6.512414455413818, "global_step": 112491, "epoch": 2678} {"train_loss": -6.410304069519043, "global_step": 112492, "epoch": 2678} {"train_loss": -6.480556011199951, "global_step": 112493, "epoch": 2678} {"train_loss": -6.499324798583984, "global_step": 112494, "epoch": 2678} {"train_loss": -6.526266574859619, "global_step": 112495, "epoch": 2678} {"train_loss": -6.498836517333984, "global_step": 112496, "epoch": 2678} {"train_loss": -6.541961669921875, "global_step": 112497, "epoch": 2678} {"train_loss": -6.483248710632324, "global_step": 112498, "epoch": 2678} {"train_loss": -6.572464466094971, "global_step": 112499, "epoch": 2678} {"train_loss": -6.541074752807617, "global_step": 112500, "epoch": 2678} {"train_loss": -6.4259514808654785, "global_step": 112501, "epoch": 2678} {"train_loss": -6.456406593322754, "global_step": 112502, "epoch": 2678} {"train_loss": -6.490751266479492, "global_step": 112503, "epoch": 2678} {"train_loss": -6.492522239685059, "global_step": 112504, "epoch": 2678} {"train_loss": -6.581795692443848, "global_step": 112505, "epoch": 2678} {"train_loss": -6.453088760375977, "global_step": 112506, "epoch": 2678} {"train_loss": -6.483755111694336, "global_step": 112507, "epoch": 2678} {"train_loss": -6.50289249420166, "global_step": 112508, "epoch": 2678} {"train_loss": -6.497607707977295, "global_step": 112509, "epoch": 2678} {"train_loss": -6.448128700256348, "global_step": 112510, "epoch": 2678} {"train_loss": -6.566424369812012, "global_step": 112511, "epoch": 2678} {"train_loss": -6.4439592361450195, "global_step": 112512, "epoch": 2678} {"train_loss": -6.453860282897949, "global_step": 112513, "epoch": 2678} {"train_loss": -6.486687660217285, "global_step": 112514, "epoch": 2678} {"train_loss": -6.565916061401367, "global_step": 112515, "epoch": 2678} {"train_loss": -6.592483997344971, "global_step": 112516, "epoch": 2678} {"train_loss": -6.504921663375128, "global_step": 112517, "epoch": 2678, "val_loss": 67681.03125} {"train_loss": -6.48985481262207, "global_step": 112518, "epoch": 2679} {"train_loss": -6.4064459800720215, "global_step": 112519, "epoch": 2679} {"train_loss": -6.638865947723389, "global_step": 112520, "epoch": 2679} {"train_loss": -6.626517295837402, "global_step": 112521, "epoch": 2679} {"train_loss": -6.421677589416504, "global_step": 112522, "epoch": 2679} {"train_loss": -6.423397541046143, "global_step": 112523, "epoch": 2679} {"train_loss": -6.4970173835754395, "global_step": 112524, "epoch": 2679} {"train_loss": -6.4470977783203125, "global_step": 112525, "epoch": 2679} {"train_loss": -6.401941299438477, "global_step": 112526, "epoch": 2679} {"train_loss": -6.4420952796936035, "global_step": 112527, "epoch": 2679} {"train_loss": -6.457221031188965, "global_step": 112528, "epoch": 2679} {"train_loss": -6.297697067260742, "global_step": 112529, "epoch": 2679} {"train_loss": -6.284663200378418, "global_step": 112530, "epoch": 2679} {"train_loss": -6.476708889007568, "global_step": 112531, "epoch": 2679} {"train_loss": -6.483682632446289, "global_step": 112532, "epoch": 2679} {"train_loss": -6.4003753662109375, "global_step": 112533, "epoch": 2679} {"train_loss": -6.416296005249023, "global_step": 112534, "epoch": 2679} {"train_loss": -6.3841705322265625, "global_step": 112535, "epoch": 2679} {"train_loss": -6.450860977172852, "global_step": 112536, "epoch": 2679} {"train_loss": -6.4313178062438965, "global_step": 112537, "epoch": 2679} {"train_loss": -6.457716941833496, "global_step": 112538, "epoch": 2679} {"train_loss": -6.437644958496094, "global_step": 112539, "epoch": 2679} {"train_loss": -6.518594741821289, "global_step": 112540, "epoch": 2679} {"train_loss": -6.525735855102539, "global_step": 112541, "epoch": 2679} {"train_loss": -6.48029899597168, "global_step": 112542, "epoch": 2679} {"train_loss": -6.410951614379883, "global_step": 112543, "epoch": 2679} {"train_loss": -6.4654860496521, "global_step": 112544, "epoch": 2679} {"train_loss": -6.5053205490112305, "global_step": 112545, "epoch": 2679} {"train_loss": -6.44847297668457, "global_step": 112546, "epoch": 2679} {"train_loss": -6.502541542053223, "global_step": 112547, "epoch": 2679} {"train_loss": -6.543279647827148, "global_step": 112548, "epoch": 2679} {"train_loss": -6.489892482757568, "global_step": 112549, "epoch": 2679} {"train_loss": -6.494952201843262, "global_step": 112550, "epoch": 2679} {"train_loss": -6.526782035827637, "global_step": 112551, "epoch": 2679} {"train_loss": -6.5174150466918945, "global_step": 112552, "epoch": 2679} {"train_loss": -6.443272590637207, "global_step": 112553, "epoch": 2679} {"train_loss": -6.463869094848633, "global_step": 112554, "epoch": 2679} {"train_loss": -6.529958248138428, "global_step": 112555, "epoch": 2679} {"train_loss": -6.3886494636535645, "global_step": 112556, "epoch": 2679} {"train_loss": -6.524239540100098, "global_step": 112557, "epoch": 2679} {"train_loss": -6.488031387329102, "global_step": 112558, "epoch": 2679} {"train_loss": -6.463734740302677, "global_step": 112559, "epoch": 2679, "val_loss": 67839.734375} {"train_loss": -6.639801979064941, "global_step": 112560, "epoch": 2680} {"train_loss": -6.460330963134766, "global_step": 112561, "epoch": 2680} {"train_loss": -6.350241184234619, "global_step": 112562, "epoch": 2680} {"train_loss": -6.489351749420166, "global_step": 112563, "epoch": 2680} {"train_loss": -6.497016906738281, "global_step": 112564, "epoch": 2680} {"train_loss": -6.428623676300049, "global_step": 112565, "epoch": 2680} {"train_loss": -6.494516849517822, "global_step": 112566, "epoch": 2680} {"train_loss": -6.498379707336426, "global_step": 112567, "epoch": 2680} {"train_loss": -6.474126815795898, "global_step": 112568, "epoch": 2680} {"train_loss": -6.463968276977539, "global_step": 112569, "epoch": 2680} {"train_loss": -6.57225227355957, "global_step": 112570, "epoch": 2680} {"train_loss": -6.41740083694458, "global_step": 112571, "epoch": 2680} {"train_loss": -6.45181131362915, "global_step": 112572, "epoch": 2680} {"train_loss": -6.353727340698242, "global_step": 112573, "epoch": 2680} {"train_loss": -6.484941482543945, "global_step": 112574, "epoch": 2680} {"train_loss": -6.529478549957275, "global_step": 112575, "epoch": 2680} {"train_loss": -6.395993232727051, "global_step": 112576, "epoch": 2680} {"train_loss": -6.429697036743164, "global_step": 112577, "epoch": 2680} {"train_loss": -6.515411376953125, "global_step": 112578, "epoch": 2680} {"train_loss": -6.46396541595459, "global_step": 112579, "epoch": 2680} {"train_loss": -6.390130996704102, "global_step": 112580, "epoch": 2680} {"train_loss": -6.472839832305908, "global_step": 112581, "epoch": 2680} {"train_loss": -6.378140449523926, "global_step": 112582, "epoch": 2680} {"train_loss": -6.520005702972412, "global_step": 112583, "epoch": 2680} {"train_loss": -6.606840133666992, "global_step": 112584, "epoch": 2680} {"train_loss": -6.49946403503418, "global_step": 112585, "epoch": 2680} {"train_loss": -6.55426025390625, "global_step": 112586, "epoch": 2680} {"train_loss": -6.474815368652344, "global_step": 112587, "epoch": 2680} {"train_loss": -6.468891620635986, "global_step": 112588, "epoch": 2680} {"train_loss": -6.287222862243652, "global_step": 112589, "epoch": 2680} {"train_loss": -6.43868350982666, "global_step": 112590, "epoch": 2680} {"train_loss": -6.424955368041992, "global_step": 112591, "epoch": 2680} {"train_loss": -6.4340410232543945, "global_step": 112592, "epoch": 2680} {"train_loss": -6.531919479370117, "global_step": 112593, "epoch": 2680} {"train_loss": -6.42457914352417, "global_step": 112594, "epoch": 2680} {"train_loss": -6.347064018249512, "global_step": 112595, "epoch": 2680} {"train_loss": -6.448835849761963, "global_step": 112596, "epoch": 2680} {"train_loss": -6.246801376342773, "global_step": 112597, "epoch": 2680} {"train_loss": -6.195494651794434, "global_step": 112598, "epoch": 2680} {"train_loss": -6.470976829528809, "global_step": 112599, "epoch": 2680} {"train_loss": -6.295612335205078, "global_step": 112600, "epoch": 2680} {"train_loss": -6.449004729588826, "global_step": 112601, "epoch": 2680, "val_loss": 68189.0390625} {"train_loss": -6.295015335083008, "global_step": 112602, "epoch": 2681} {"train_loss": -6.389991283416748, "global_step": 112603, "epoch": 2681} {"train_loss": -6.303255081176758, "global_step": 112604, "epoch": 2681} {"train_loss": -6.363262176513672, "global_step": 112605, "epoch": 2681} {"train_loss": -6.357590198516846, "global_step": 112606, "epoch": 2681} {"train_loss": -6.311367034912109, "global_step": 112607, "epoch": 2681} {"train_loss": -6.369964122772217, "global_step": 112608, "epoch": 2681} {"train_loss": -6.408043384552002, "global_step": 112609, "epoch": 2681} {"train_loss": -6.357306480407715, "global_step": 112610, "epoch": 2681} {"train_loss": -6.333330154418945, "global_step": 112611, "epoch": 2681} {"train_loss": -6.240682125091553, "global_step": 112612, "epoch": 2681} {"train_loss": -6.23777437210083, "global_step": 112613, "epoch": 2681} {"train_loss": -6.456157207489014, "global_step": 112614, "epoch": 2681} {"train_loss": -6.274754047393799, "global_step": 112615, "epoch": 2681} {"train_loss": -6.331569671630859, "global_step": 112616, "epoch": 2681} {"train_loss": -6.392720699310303, "global_step": 112617, "epoch": 2681} {"train_loss": -6.41597843170166, "global_step": 112618, "epoch": 2681} {"train_loss": -6.227779388427734, "global_step": 112619, "epoch": 2681} {"train_loss": -6.361866474151611, "global_step": 112620, "epoch": 2681} {"train_loss": -6.433585166931152, "global_step": 112621, "epoch": 2681} {"train_loss": -6.393150329589844, "global_step": 112622, "epoch": 2681} {"train_loss": -6.3990092277526855, "global_step": 112623, "epoch": 2681} {"train_loss": -6.415663242340088, "global_step": 112624, "epoch": 2681} {"train_loss": -6.321285247802734, "global_step": 112625, "epoch": 2681} {"train_loss": -6.564815044403076, "global_step": 112626, "epoch": 2681} {"train_loss": -6.467556953430176, "global_step": 112627, "epoch": 2681} {"train_loss": -6.420415878295898, "global_step": 112628, "epoch": 2681} {"train_loss": -6.484122276306152, "global_step": 112629, "epoch": 2681} {"train_loss": -6.518980026245117, "global_step": 112630, "epoch": 2681} {"train_loss": -6.420597076416016, "global_step": 112631, "epoch": 2681} {"train_loss": -6.5446014404296875, "global_step": 112632, "epoch": 2681} {"train_loss": -6.299184322357178, "global_step": 112633, "epoch": 2681} {"train_loss": -6.507831573486328, "global_step": 112634, "epoch": 2681} {"train_loss": -6.434108734130859, "global_step": 112635, "epoch": 2681} {"train_loss": -6.363157272338867, "global_step": 112636, "epoch": 2681} {"train_loss": -6.45266056060791, "global_step": 112637, "epoch": 2681} {"train_loss": -6.396775722503662, "global_step": 112638, "epoch": 2681} {"train_loss": -6.515887260437012, "global_step": 112639, "epoch": 2681} {"train_loss": -6.517951965332031, "global_step": 112640, "epoch": 2681} {"train_loss": -6.399138450622559, "global_step": 112641, "epoch": 2681} {"train_loss": -6.490420341491699, "global_step": 112642, "epoch": 2681} {"train_loss": -6.395382392974127, "global_step": 112643, "epoch": 2681, "val_loss": 67981.46875} {"train_loss": -6.525918006896973, "global_step": 112644, "epoch": 2682} {"train_loss": -6.4159417152404785, "global_step": 112645, "epoch": 2682} {"train_loss": -6.32093620300293, "global_step": 112646, "epoch": 2682} {"train_loss": -6.408242225646973, "global_step": 112647, "epoch": 2682} {"train_loss": -6.424949645996094, "global_step": 112648, "epoch": 2682} {"train_loss": -6.39337158203125, "global_step": 112649, "epoch": 2682} {"train_loss": -6.438076972961426, "global_step": 112650, "epoch": 2682} {"train_loss": -6.502374649047852, "global_step": 112651, "epoch": 2682} {"train_loss": -6.390639781951904, "global_step": 112652, "epoch": 2682} {"train_loss": -6.407161235809326, "global_step": 112653, "epoch": 2682} {"train_loss": -6.46760368347168, "global_step": 112654, "epoch": 2682} {"train_loss": -6.445263862609863, "global_step": 112655, "epoch": 2682} {"train_loss": -6.482285976409912, "global_step": 112656, "epoch": 2682} {"train_loss": -6.444118976593018, "global_step": 112657, "epoch": 2682} {"train_loss": -6.523582458496094, "global_step": 112658, "epoch": 2682} {"train_loss": -6.420223712921143, "global_step": 112659, "epoch": 2682} {"train_loss": -6.57591438293457, "global_step": 112660, "epoch": 2682} {"train_loss": -6.4631733894348145, "global_step": 112661, "epoch": 2682} {"train_loss": -6.45890998840332, "global_step": 112662, "epoch": 2682} {"train_loss": -6.439992904663086, "global_step": 112663, "epoch": 2682} {"train_loss": -6.4734110832214355, "global_step": 112664, "epoch": 2682} {"train_loss": -6.546679496765137, "global_step": 112665, "epoch": 2682} {"train_loss": -6.557751178741455, "global_step": 112666, "epoch": 2682} {"train_loss": -6.41310977935791, "global_step": 112667, "epoch": 2682} {"train_loss": -6.505853652954102, "global_step": 112668, "epoch": 2682} {"train_loss": -6.48044490814209, "global_step": 112669, "epoch": 2682} {"train_loss": -6.576846599578857, "global_step": 112670, "epoch": 2682} {"train_loss": -6.591531276702881, "global_step": 112671, "epoch": 2682} {"train_loss": -6.63370418548584, "global_step": 112672, "epoch": 2682} {"train_loss": -6.5521745681762695, "global_step": 112673, "epoch": 2682} {"train_loss": -6.491161823272705, "global_step": 112674, "epoch": 2682} {"train_loss": -6.513601303100586, "global_step": 112675, "epoch": 2682} {"train_loss": -6.391724586486816, "global_step": 112676, "epoch": 2682} {"train_loss": -6.388796806335449, "global_step": 112677, "epoch": 2682} {"train_loss": -6.594737529754639, "global_step": 112678, "epoch": 2682} {"train_loss": -6.533595561981201, "global_step": 112679, "epoch": 2682} {"train_loss": -6.490157127380371, "global_step": 112680, "epoch": 2682} {"train_loss": -6.465606689453125, "global_step": 112681, "epoch": 2682} {"train_loss": -6.578463554382324, "global_step": 112682, "epoch": 2682} {"train_loss": -6.526219844818115, "global_step": 112683, "epoch": 2682} {"train_loss": -6.496034145355225, "global_step": 112684, "epoch": 2682} {"train_loss": -6.4820774509793235, "global_step": 112685, "epoch": 2682, "val_loss": 67974.859375} {"train_loss": -6.4646806716918945, "global_step": 112686, "epoch": 2683} {"train_loss": -6.471297740936279, "global_step": 112687, "epoch": 2683} {"train_loss": -6.517187118530273, "global_step": 112688, "epoch": 2683} {"train_loss": -6.5854105949401855, "global_step": 112689, "epoch": 2683} {"train_loss": -6.507806301116943, "global_step": 112690, "epoch": 2683} {"train_loss": -6.597478866577148, "global_step": 112691, "epoch": 2683} {"train_loss": -6.52113151550293, "global_step": 112692, "epoch": 2683} {"train_loss": -6.448604106903076, "global_step": 112693, "epoch": 2683} {"train_loss": -6.414301872253418, "global_step": 112694, "epoch": 2683} {"train_loss": -6.566481590270996, "global_step": 112695, "epoch": 2683} {"train_loss": -6.529892444610596, "global_step": 112696, "epoch": 2683} {"train_loss": -6.407447814941406, "global_step": 112697, "epoch": 2683} {"train_loss": -6.547727108001709, "global_step": 112698, "epoch": 2683} {"train_loss": -6.485886573791504, "global_step": 112699, "epoch": 2683} {"train_loss": -6.504645347595215, "global_step": 112700, "epoch": 2683} {"train_loss": -6.5502424240112305, "global_step": 112701, "epoch": 2683} {"train_loss": -6.43936824798584, "global_step": 112702, "epoch": 2683} {"train_loss": -6.453342437744141, "global_step": 112703, "epoch": 2683} {"train_loss": -6.409405708312988, "global_step": 112704, "epoch": 2683} {"train_loss": -6.436276435852051, "global_step": 112705, "epoch": 2683} {"train_loss": -6.433221340179443, "global_step": 112706, "epoch": 2683} {"train_loss": -6.456437110900879, "global_step": 112707, "epoch": 2683} {"train_loss": -6.355772018432617, "global_step": 112708, "epoch": 2683} {"train_loss": -6.575345039367676, "global_step": 112709, "epoch": 2683} {"train_loss": -6.5156474113464355, "global_step": 112710, "epoch": 2683} {"train_loss": -6.386333465576172, "global_step": 112711, "epoch": 2683} {"train_loss": -6.450839042663574, "global_step": 112712, "epoch": 2683} {"train_loss": -6.48115348815918, "global_step": 112713, "epoch": 2683} {"train_loss": -6.511821746826172, "global_step": 112714, "epoch": 2683} {"train_loss": -6.430724620819092, "global_step": 112715, "epoch": 2683} {"train_loss": -6.539320468902588, "global_step": 112716, "epoch": 2683} {"train_loss": -6.499741554260254, "global_step": 112717, "epoch": 2683} {"train_loss": -6.394567012786865, "global_step": 112718, "epoch": 2683} {"train_loss": -6.520590782165527, "global_step": 112719, "epoch": 2683} {"train_loss": -6.58888053894043, "global_step": 112720, "epoch": 2683} {"train_loss": -6.499082565307617, "global_step": 112721, "epoch": 2683} {"train_loss": -6.498276710510254, "global_step": 112722, "epoch": 2683} {"train_loss": -6.507080554962158, "global_step": 112723, "epoch": 2683} {"train_loss": -6.483807563781738, "global_step": 112724, "epoch": 2683} {"train_loss": -6.493032455444336, "global_step": 112725, "epoch": 2683} {"train_loss": -6.486789703369141, "global_step": 112726, "epoch": 2683} {"train_loss": -6.490618092673166, "global_step": 112727, "epoch": 2683, "val_loss": 68068.9453125} {"train_loss": -6.535943031311035, "global_step": 112728, "epoch": 2684} {"train_loss": -6.56144905090332, "global_step": 112729, "epoch": 2684} {"train_loss": -6.5983991622924805, "global_step": 112730, "epoch": 2684} {"train_loss": -6.4561567306518555, "global_step": 112731, "epoch": 2684} {"train_loss": -6.442256927490234, "global_step": 112732, "epoch": 2684} {"train_loss": -6.498589515686035, "global_step": 112733, "epoch": 2684} {"train_loss": -6.249317169189453, "global_step": 112734, "epoch": 2684} {"train_loss": -6.555429458618164, "global_step": 112735, "epoch": 2684} {"train_loss": -6.461801528930664, "global_step": 112736, "epoch": 2684} {"train_loss": -6.338789463043213, "global_step": 112737, "epoch": 2684} {"train_loss": -6.465428352355957, "global_step": 112738, "epoch": 2684} {"train_loss": -6.474429130554199, "global_step": 112739, "epoch": 2684} {"train_loss": -6.545708656311035, "global_step": 112740, "epoch": 2684} {"train_loss": -6.471372604370117, "global_step": 112741, "epoch": 2684} {"train_loss": -6.4744720458984375, "global_step": 112742, "epoch": 2684} {"train_loss": -6.42371940612793, "global_step": 112743, "epoch": 2684} {"train_loss": -6.423903942108154, "global_step": 112744, "epoch": 2684} {"train_loss": -6.4074811935424805, "global_step": 112745, "epoch": 2684} {"train_loss": -6.374494552612305, "global_step": 112746, "epoch": 2684} {"train_loss": -6.378668785095215, "global_step": 112747, "epoch": 2684} {"train_loss": -6.381448745727539, "global_step": 112748, "epoch": 2684} {"train_loss": -6.5397419929504395, "global_step": 112749, "epoch": 2684} {"train_loss": -6.439707279205322, "global_step": 112750, "epoch": 2684} {"train_loss": -6.474643707275391, "global_step": 112751, "epoch": 2684} {"train_loss": -6.382765769958496, "global_step": 112752, "epoch": 2684} {"train_loss": -6.505353927612305, "global_step": 112753, "epoch": 2684} {"train_loss": -6.348784446716309, "global_step": 112754, "epoch": 2684} {"train_loss": -6.412952423095703, "global_step": 112755, "epoch": 2684} {"train_loss": -6.436927795410156, "global_step": 112756, "epoch": 2684} {"train_loss": -6.385462760925293, "global_step": 112757, "epoch": 2684} {"train_loss": -6.471681594848633, "global_step": 112758, "epoch": 2684} {"train_loss": -6.530728340148926, "global_step": 112759, "epoch": 2684} {"train_loss": -6.3618621826171875, "global_step": 112760, "epoch": 2684} {"train_loss": -6.400634765625, "global_step": 112761, "epoch": 2684} {"train_loss": -6.426313400268555, "global_step": 112762, "epoch": 2684} {"train_loss": -6.50526237487793, "global_step": 112763, "epoch": 2684} {"train_loss": -6.509000778198242, "global_step": 112764, "epoch": 2684} {"train_loss": -6.421004295349121, "global_step": 112765, "epoch": 2684} {"train_loss": -6.385397434234619, "global_step": 112766, "epoch": 2684} {"train_loss": -6.4409565925598145, "global_step": 112767, "epoch": 2684} {"train_loss": -6.414651870727539, "global_step": 112768, "epoch": 2684} {"train_loss": -6.447528328214373, "global_step": 112769, "epoch": 2684, "val_loss": 67745.8984375} {"train_loss": -6.47157096862793, "global_step": 112770, "epoch": 2685} {"train_loss": -6.515666961669922, "global_step": 112771, "epoch": 2685} {"train_loss": -6.4641828536987305, "global_step": 112772, "epoch": 2685} {"train_loss": -6.515120506286621, "global_step": 112773, "epoch": 2685} {"train_loss": -6.531332969665527, "global_step": 112774, "epoch": 2685} {"train_loss": -6.445237636566162, "global_step": 112775, "epoch": 2685} {"train_loss": -6.411201000213623, "global_step": 112776, "epoch": 2685} {"train_loss": -6.520973205566406, "global_step": 112777, "epoch": 2685} {"train_loss": -6.468054294586182, "global_step": 112778, "epoch": 2685} {"train_loss": -6.5039963722229, "global_step": 112779, "epoch": 2685} {"train_loss": -6.391860485076904, "global_step": 112780, "epoch": 2685} {"train_loss": -6.405014991760254, "global_step": 112781, "epoch": 2685} {"train_loss": -6.533050060272217, "global_step": 112782, "epoch": 2685} {"train_loss": -6.46970272064209, "global_step": 112783, "epoch": 2685} {"train_loss": -6.345129489898682, "global_step": 112784, "epoch": 2685} {"train_loss": -6.465015888214111, "global_step": 112785, "epoch": 2685} {"train_loss": -6.385410308837891, "global_step": 112786, "epoch": 2685} {"train_loss": -6.400649070739746, "global_step": 112787, "epoch": 2685} {"train_loss": -6.268397331237793, "global_step": 112788, "epoch": 2685} {"train_loss": -6.441732406616211, "global_step": 112789, "epoch": 2685} {"train_loss": -6.430602550506592, "global_step": 112790, "epoch": 2685} {"train_loss": -6.436999320983887, "global_step": 112791, "epoch": 2685} {"train_loss": -6.542545318603516, "global_step": 112792, "epoch": 2685} {"train_loss": -6.579524517059326, "global_step": 112793, "epoch": 2685} {"train_loss": -6.4207353591918945, "global_step": 112794, "epoch": 2685} {"train_loss": -6.348201751708984, "global_step": 112795, "epoch": 2685} {"train_loss": -6.401847839355469, "global_step": 112796, "epoch": 2685} {"train_loss": -6.539397239685059, "global_step": 112797, "epoch": 2685} {"train_loss": -6.371852874755859, "global_step": 112798, "epoch": 2685} {"train_loss": -6.379465103149414, "global_step": 112799, "epoch": 2685} {"train_loss": -6.446695804595947, "global_step": 112800, "epoch": 2685} {"train_loss": -6.423459053039551, "global_step": 112801, "epoch": 2685} {"train_loss": -6.4680867195129395, "global_step": 112802, "epoch": 2685} {"train_loss": -6.462886810302734, "global_step": 112803, "epoch": 2685} {"train_loss": -6.502582550048828, "global_step": 112804, "epoch": 2685} {"train_loss": -6.47115421295166, "global_step": 112805, "epoch": 2685} {"train_loss": -6.482966423034668, "global_step": 112806, "epoch": 2685} {"train_loss": -6.5031232833862305, "global_step": 112807, "epoch": 2685} {"train_loss": -6.422053813934326, "global_step": 112808, "epoch": 2685} {"train_loss": -6.47639274597168, "global_step": 112809, "epoch": 2685} {"train_loss": -6.4516377449035645, "global_step": 112810, "epoch": 2685} {"train_loss": -6.451224872044155, "global_step": 112811, "epoch": 2685, "val_loss": 67838.0625} {"train_loss": -6.568333625793457, "global_step": 112812, "epoch": 2686} {"train_loss": -6.488017559051514, "global_step": 112813, "epoch": 2686} {"train_loss": -6.591379642486572, "global_step": 112814, "epoch": 2686} {"train_loss": -6.503116607666016, "global_step": 112815, "epoch": 2686} {"train_loss": -6.437941551208496, "global_step": 112816, "epoch": 2686} {"train_loss": -6.493313312530518, "global_step": 112817, "epoch": 2686} {"train_loss": -6.332444190979004, "global_step": 112818, "epoch": 2686} {"train_loss": -6.465273857116699, "global_step": 112819, "epoch": 2686} {"train_loss": -6.466878414154053, "global_step": 112820, "epoch": 2686} {"train_loss": -6.463925838470459, "global_step": 112821, "epoch": 2686} {"train_loss": -6.454136848449707, "global_step": 112822, "epoch": 2686} {"train_loss": -6.442791938781738, "global_step": 112823, "epoch": 2686} {"train_loss": -6.454227447509766, "global_step": 112824, "epoch": 2686} {"train_loss": -6.434598922729492, "global_step": 112825, "epoch": 2686} {"train_loss": -6.31613826751709, "global_step": 112826, "epoch": 2686} {"train_loss": -6.5139007568359375, "global_step": 112827, "epoch": 2686} {"train_loss": -6.440406799316406, "global_step": 112828, "epoch": 2686} {"train_loss": -6.529205322265625, "global_step": 112829, "epoch": 2686} {"train_loss": -6.4703240394592285, "global_step": 112830, "epoch": 2686} {"train_loss": -6.429925918579102, "global_step": 112831, "epoch": 2686} {"train_loss": -6.463868141174316, "global_step": 112832, "epoch": 2686} {"train_loss": -6.3559041023254395, "global_step": 112833, "epoch": 2686} {"train_loss": -6.491178512573242, "global_step": 112834, "epoch": 2686} {"train_loss": -6.343780517578125, "global_step": 112835, "epoch": 2686} {"train_loss": -6.505684852600098, "global_step": 112836, "epoch": 2686} {"train_loss": -6.492023468017578, "global_step": 112837, "epoch": 2686} {"train_loss": -6.315677165985107, "global_step": 112838, "epoch": 2686} {"train_loss": -6.383133888244629, "global_step": 112839, "epoch": 2686} {"train_loss": -6.38585090637207, "global_step": 112840, "epoch": 2686} {"train_loss": -6.354202747344971, "global_step": 112841, "epoch": 2686} {"train_loss": -6.436274528503418, "global_step": 112842, "epoch": 2686} {"train_loss": -6.558603286743164, "global_step": 112843, "epoch": 2686} {"train_loss": -6.395479202270508, "global_step": 112844, "epoch": 2686} {"train_loss": -6.502254962921143, "global_step": 112845, "epoch": 2686} {"train_loss": -6.3556928634643555, "global_step": 112846, "epoch": 2686} {"train_loss": -6.395200729370117, "global_step": 112847, "epoch": 2686} {"train_loss": -6.401756286621094, "global_step": 112848, "epoch": 2686} {"train_loss": -6.345625400543213, "global_step": 112849, "epoch": 2686} {"train_loss": -6.4681806564331055, "global_step": 112850, "epoch": 2686} {"train_loss": -6.314975738525391, "global_step": 112851, "epoch": 2686} {"train_loss": -6.512885093688965, "global_step": 112852, "epoch": 2686} {"train_loss": -6.438107615425473, "global_step": 112853, "epoch": 2686, "val_loss": 67880.7578125} {"train_loss": -6.492856979370117, "global_step": 112854, "epoch": 2687} {"train_loss": -6.5032806396484375, "global_step": 112855, "epoch": 2687} {"train_loss": -6.473546028137207, "global_step": 112856, "epoch": 2687} {"train_loss": -6.429643630981445, "global_step": 112857, "epoch": 2687} {"train_loss": -6.378289222717285, "global_step": 112858, "epoch": 2687} {"train_loss": -6.460911750793457, "global_step": 112859, "epoch": 2687} {"train_loss": -6.319711685180664, "global_step": 112860, "epoch": 2687} {"train_loss": -6.468837738037109, "global_step": 112861, "epoch": 2687} {"train_loss": -6.535392761230469, "global_step": 112862, "epoch": 2687} {"train_loss": -6.385974884033203, "global_step": 112863, "epoch": 2687} {"train_loss": -6.435150146484375, "global_step": 112864, "epoch": 2687} {"train_loss": -6.3582868576049805, "global_step": 112865, "epoch": 2687} {"train_loss": -6.602769374847412, "global_step": 112866, "epoch": 2687} {"train_loss": -6.532163619995117, "global_step": 112867, "epoch": 2687} {"train_loss": -6.490203857421875, "global_step": 112868, "epoch": 2687} {"train_loss": -6.497421741485596, "global_step": 112869, "epoch": 2687} {"train_loss": -6.585687637329102, "global_step": 112870, "epoch": 2687} {"train_loss": -6.486038684844971, "global_step": 112871, "epoch": 2687} {"train_loss": -6.552752494812012, "global_step": 112872, "epoch": 2687} {"train_loss": -6.542390823364258, "global_step": 112873, "epoch": 2687} {"train_loss": -6.522037029266357, "global_step": 112874, "epoch": 2687} {"train_loss": -6.442302703857422, "global_step": 112875, "epoch": 2687} {"train_loss": -6.478653430938721, "global_step": 112876, "epoch": 2687} {"train_loss": -6.461699485778809, "global_step": 112877, "epoch": 2687} {"train_loss": -6.417558670043945, "global_step": 112878, "epoch": 2687} {"train_loss": -6.498466968536377, "global_step": 112879, "epoch": 2687} {"train_loss": -6.4523725509643555, "global_step": 112880, "epoch": 2687} {"train_loss": -6.440537452697754, "global_step": 112881, "epoch": 2687} {"train_loss": -6.404604911804199, "global_step": 112882, "epoch": 2687} {"train_loss": -6.431674480438232, "global_step": 112883, "epoch": 2687} {"train_loss": -6.494612693786621, "global_step": 112884, "epoch": 2687} {"train_loss": -6.388002395629883, "global_step": 112885, "epoch": 2687} {"train_loss": -6.417751312255859, "global_step": 112886, "epoch": 2687} {"train_loss": -6.493429183959961, "global_step": 112887, "epoch": 2687} {"train_loss": -6.416606426239014, "global_step": 112888, "epoch": 2687} {"train_loss": -6.566426753997803, "global_step": 112889, "epoch": 2687} {"train_loss": -6.3185811042785645, "global_step": 112890, "epoch": 2687} {"train_loss": -6.460279941558838, "global_step": 112891, "epoch": 2687} {"train_loss": -6.431259632110596, "global_step": 112892, "epoch": 2687} {"train_loss": -6.327352523803711, "global_step": 112893, "epoch": 2687} {"train_loss": -6.450684547424316, "global_step": 112894, "epoch": 2687} {"train_loss": -6.459287450427101, "global_step": 112895, "epoch": 2687, "val_loss": 68171.7890625} {"train_loss": -6.417775630950928, "global_step": 112896, "epoch": 2688} {"train_loss": -6.568244934082031, "global_step": 112897, "epoch": 2688} {"train_loss": -6.5040202140808105, "global_step": 112898, "epoch": 2688} {"train_loss": -6.4123735427856445, "global_step": 112899, "epoch": 2688} {"train_loss": -6.398536205291748, "global_step": 112900, "epoch": 2688} {"train_loss": -6.476839065551758, "global_step": 112901, "epoch": 2688} {"train_loss": -6.545444965362549, "global_step": 112902, "epoch": 2688} {"train_loss": -6.570435047149658, "global_step": 112903, "epoch": 2688} {"train_loss": -6.505230903625488, "global_step": 112904, "epoch": 2688} {"train_loss": -6.5642595291137695, "global_step": 112905, "epoch": 2688} {"train_loss": -6.295578956604004, "global_step": 112906, "epoch": 2688} {"train_loss": -6.40364933013916, "global_step": 112907, "epoch": 2688} {"train_loss": -6.599837303161621, "global_step": 112908, "epoch": 2688} {"train_loss": -6.319297790527344, "global_step": 112909, "epoch": 2688} {"train_loss": -6.534353733062744, "global_step": 112910, "epoch": 2688} {"train_loss": -6.595261573791504, "global_step": 112911, "epoch": 2688} {"train_loss": -6.45311975479126, "global_step": 112912, "epoch": 2688} {"train_loss": -6.310464859008789, "global_step": 112913, "epoch": 2688} {"train_loss": -6.647857666015625, "global_step": 112914, "epoch": 2688} {"train_loss": -6.363675117492676, "global_step": 112915, "epoch": 2688} {"train_loss": -6.379333019256592, "global_step": 112916, "epoch": 2688} {"train_loss": -6.407676696777344, "global_step": 112917, "epoch": 2688} {"train_loss": -6.390298843383789, "global_step": 112918, "epoch": 2688} {"train_loss": -6.492481231689453, "global_step": 112919, "epoch": 2688} {"train_loss": -6.375635147094727, "global_step": 112920, "epoch": 2688} {"train_loss": -6.486375331878662, "global_step": 112921, "epoch": 2688} {"train_loss": -6.432662487030029, "global_step": 112922, "epoch": 2688} {"train_loss": -6.479959964752197, "global_step": 112923, "epoch": 2688} {"train_loss": -6.407533168792725, "global_step": 112924, "epoch": 2688} {"train_loss": -6.471490383148193, "global_step": 112925, "epoch": 2688} {"train_loss": -6.41175651550293, "global_step": 112926, "epoch": 2688} {"train_loss": -6.448790073394775, "global_step": 112927, "epoch": 2688} {"train_loss": -6.4029998779296875, "global_step": 112928, "epoch": 2688} {"train_loss": -6.401018142700195, "global_step": 112929, "epoch": 2688} {"train_loss": -6.517963409423828, "global_step": 112930, "epoch": 2688} {"train_loss": -6.475345611572266, "global_step": 112931, "epoch": 2688} {"train_loss": -6.501020908355713, "global_step": 112932, "epoch": 2688} {"train_loss": -6.682867527008057, "global_step": 112933, "epoch": 2688} {"train_loss": -6.3324360847473145, "global_step": 112934, "epoch": 2688} {"train_loss": -6.578657627105713, "global_step": 112935, "epoch": 2688} {"train_loss": -6.509547233581543, "global_step": 112936, "epoch": 2688} {"train_loss": -6.4652213255564375, "global_step": 112937, "epoch": 2688, "val_loss": 67887.7109375} {"train_loss": -6.458144187927246, "global_step": 112938, "epoch": 2689} {"train_loss": -6.539772033691406, "global_step": 112939, "epoch": 2689} {"train_loss": -6.504361152648926, "global_step": 112940, "epoch": 2689} {"train_loss": -6.544439792633057, "global_step": 112941, "epoch": 2689} {"train_loss": -6.504021644592285, "global_step": 112942, "epoch": 2689} {"train_loss": -6.536460876464844, "global_step": 112943, "epoch": 2689} {"train_loss": -6.478297710418701, "global_step": 112944, "epoch": 2689} {"train_loss": -6.497014045715332, "global_step": 112945, "epoch": 2689} {"train_loss": -6.5398101806640625, "global_step": 112946, "epoch": 2689} {"train_loss": -6.5214104652404785, "global_step": 112947, "epoch": 2689} {"train_loss": -6.481325149536133, "global_step": 112948, "epoch": 2689} {"train_loss": -6.46864652633667, "global_step": 112949, "epoch": 2689} {"train_loss": -6.426255226135254, "global_step": 112950, "epoch": 2689} {"train_loss": -6.483804702758789, "global_step": 112951, "epoch": 2689} {"train_loss": -6.577335357666016, "global_step": 112952, "epoch": 2689} {"train_loss": -6.503218650817871, "global_step": 112953, "epoch": 2689} {"train_loss": -6.555181503295898, "global_step": 112954, "epoch": 2689} {"train_loss": -6.465887546539307, "global_step": 112955, "epoch": 2689} {"train_loss": -6.403464317321777, "global_step": 112956, "epoch": 2689} {"train_loss": -6.431203365325928, "global_step": 112957, "epoch": 2689} {"train_loss": -6.616466522216797, "global_step": 112958, "epoch": 2689} {"train_loss": -6.331421375274658, "global_step": 112959, "epoch": 2689} {"train_loss": -6.309051513671875, "global_step": 112960, "epoch": 2689} {"train_loss": -6.383870601654053, "global_step": 112961, "epoch": 2689} {"train_loss": -6.350566864013672, "global_step": 112962, "epoch": 2689} {"train_loss": -6.28061580657959, "global_step": 112963, "epoch": 2689} {"train_loss": -6.534523010253906, "global_step": 112964, "epoch": 2689} {"train_loss": -6.474452018737793, "global_step": 112965, "epoch": 2689} {"train_loss": -6.413347244262695, "global_step": 112966, "epoch": 2689} {"train_loss": -6.468786716461182, "global_step": 112967, "epoch": 2689} {"train_loss": -6.299996376037598, "global_step": 112968, "epoch": 2689} {"train_loss": -6.5020952224731445, "global_step": 112969, "epoch": 2689} {"train_loss": -6.3634748458862305, "global_step": 112970, "epoch": 2689} {"train_loss": -6.287109851837158, "global_step": 112971, "epoch": 2689} {"train_loss": -6.391887187957764, "global_step": 112972, "epoch": 2689} {"train_loss": -6.278166770935059, "global_step": 112973, "epoch": 2689} {"train_loss": -6.2687668800354, "global_step": 112974, "epoch": 2689} {"train_loss": -6.403242588043213, "global_step": 112975, "epoch": 2689} {"train_loss": -6.395413875579834, "global_step": 112976, "epoch": 2689} {"train_loss": -6.458899974822998, "global_step": 112977, "epoch": 2689} {"train_loss": -6.447983741760254, "global_step": 112978, "epoch": 2689} {"train_loss": -6.444091558456421, "global_step": 112979, "epoch": 2689, "val_loss": 67724.9375} {"train_loss": -6.4465484619140625, "global_step": 112980, "epoch": 2690} {"train_loss": -6.441877365112305, "global_step": 112981, "epoch": 2690} {"train_loss": -6.432117462158203, "global_step": 112982, "epoch": 2690} {"train_loss": -6.483073711395264, "global_step": 112983, "epoch": 2690} {"train_loss": -6.480424880981445, "global_step": 112984, "epoch": 2690} {"train_loss": -6.555792808532715, "global_step": 112985, "epoch": 2690} {"train_loss": -6.357399940490723, "global_step": 112986, "epoch": 2690} {"train_loss": -6.483020782470703, "global_step": 112987, "epoch": 2690} {"train_loss": -6.371175289154053, "global_step": 112988, "epoch": 2690} {"train_loss": -6.4565534591674805, "global_step": 112989, "epoch": 2690} {"train_loss": -6.349452018737793, "global_step": 112990, "epoch": 2690} {"train_loss": -6.382899284362793, "global_step": 112991, "epoch": 2690} {"train_loss": -6.493472099304199, "global_step": 112992, "epoch": 2690} {"train_loss": -6.456057548522949, "global_step": 112993, "epoch": 2690} {"train_loss": -6.488894939422607, "global_step": 112994, "epoch": 2690} {"train_loss": -6.575568199157715, "global_step": 112995, "epoch": 2690} {"train_loss": -6.437243461608887, "global_step": 112996, "epoch": 2690} {"train_loss": -6.603106498718262, "global_step": 112997, "epoch": 2690} {"train_loss": -6.459396839141846, "global_step": 112998, "epoch": 2690} {"train_loss": -6.51845121383667, "global_step": 112999, "epoch": 2690} {"train_loss": -6.453560829162598, "global_step": 113000, "epoch": 2690} {"train_loss": -6.494000434875488, "global_step": 113001, "epoch": 2690} {"train_loss": -6.446008682250977, "global_step": 113002, "epoch": 2690} {"train_loss": -6.4640045166015625, "global_step": 113003, "epoch": 2690} {"train_loss": -6.446331024169922, "global_step": 113004, "epoch": 2690} {"train_loss": -6.503978252410889, "global_step": 113005, "epoch": 2690} {"train_loss": -6.435669898986816, "global_step": 113006, "epoch": 2690} {"train_loss": -6.483882904052734, "global_step": 113007, "epoch": 2690} {"train_loss": -6.567300796508789, "global_step": 113008, "epoch": 2690} {"train_loss": -6.439389228820801, "global_step": 113009, "epoch": 2690} {"train_loss": -6.550034523010254, "global_step": 113010, "epoch": 2690} {"train_loss": -6.428246974945068, "global_step": 113011, "epoch": 2690} {"train_loss": -6.402906894683838, "global_step": 113012, "epoch": 2690} {"train_loss": -6.403452396392822, "global_step": 113013, "epoch": 2690} {"train_loss": -6.567946434020996, "global_step": 113014, "epoch": 2690} {"train_loss": -6.4742751121521, "global_step": 113015, "epoch": 2690} {"train_loss": -6.427107334136963, "global_step": 113016, "epoch": 2690} {"train_loss": -6.320469856262207, "global_step": 113017, "epoch": 2690} {"train_loss": -6.396341800689697, "global_step": 113018, "epoch": 2690} {"train_loss": -6.568845748901367, "global_step": 113019, "epoch": 2690} {"train_loss": -6.422882556915283, "global_step": 113020, "epoch": 2690} {"train_loss": -6.459882168542771, "global_step": 113021, "epoch": 2690, "val_loss": 68045.59375} {"train_loss": -6.503657341003418, "global_step": 113022, "epoch": 2691} {"train_loss": -6.525549411773682, "global_step": 113023, "epoch": 2691} {"train_loss": -6.511748313903809, "global_step": 113024, "epoch": 2691} {"train_loss": -6.523065090179443, "global_step": 113025, "epoch": 2691} {"train_loss": -6.396936416625977, "global_step": 113026, "epoch": 2691} {"train_loss": -6.5376877784729, "global_step": 113027, "epoch": 2691} {"train_loss": -6.497637748718262, "global_step": 113028, "epoch": 2691} {"train_loss": -6.542903900146484, "global_step": 113029, "epoch": 2691} {"train_loss": -6.517740249633789, "global_step": 113030, "epoch": 2691} {"train_loss": -6.486912727355957, "global_step": 113031, "epoch": 2691} {"train_loss": -6.536349773406982, "global_step": 113032, "epoch": 2691} {"train_loss": -6.465911865234375, "global_step": 113033, "epoch": 2691} {"train_loss": -6.426675796508789, "global_step": 113034, "epoch": 2691} {"train_loss": -6.360598087310791, "global_step": 113035, "epoch": 2691} {"train_loss": -6.453059196472168, "global_step": 113036, "epoch": 2691} {"train_loss": -6.442384243011475, "global_step": 113037, "epoch": 2691} {"train_loss": -6.4660186767578125, "global_step": 113038, "epoch": 2691} {"train_loss": -6.399423599243164, "global_step": 113039, "epoch": 2691} {"train_loss": -6.367013931274414, "global_step": 113040, "epoch": 2691} {"train_loss": -6.439682960510254, "global_step": 113041, "epoch": 2691} {"train_loss": -6.4714250564575195, "global_step": 113042, "epoch": 2691} {"train_loss": -6.41809606552124, "global_step": 113043, "epoch": 2691} {"train_loss": -6.422422409057617, "global_step": 113044, "epoch": 2691} {"train_loss": -6.518829345703125, "global_step": 113045, "epoch": 2691} {"train_loss": -6.395785331726074, "global_step": 113046, "epoch": 2691} {"train_loss": -6.428149700164795, "global_step": 113047, "epoch": 2691} {"train_loss": -6.526088714599609, "global_step": 113048, "epoch": 2691} {"train_loss": -6.314128398895264, "global_step": 113049, "epoch": 2691} {"train_loss": -6.5442657470703125, "global_step": 113050, "epoch": 2691} {"train_loss": -6.4970855712890625, "global_step": 113051, "epoch": 2691} {"train_loss": -6.475460052490234, "global_step": 113052, "epoch": 2691} {"train_loss": -6.441025733947754, "global_step": 113053, "epoch": 2691} {"train_loss": -6.452635765075684, "global_step": 113054, "epoch": 2691} {"train_loss": -6.423957824707031, "global_step": 113055, "epoch": 2691} {"train_loss": -6.535172462463379, "global_step": 113056, "epoch": 2691} {"train_loss": -6.4076995849609375, "global_step": 113057, "epoch": 2691} {"train_loss": -6.398942947387695, "global_step": 113058, "epoch": 2691} {"train_loss": -6.3962578773498535, "global_step": 113059, "epoch": 2691} {"train_loss": -6.500168800354004, "global_step": 113060, "epoch": 2691} {"train_loss": -6.459782600402832, "global_step": 113061, "epoch": 2691} {"train_loss": -6.43480110168457, "global_step": 113062, "epoch": 2691} {"train_loss": -6.457854452587309, "global_step": 113063, "epoch": 2691, "val_loss": 67802.5078125} {"train_loss": -6.478713035583496, "global_step": 113064, "epoch": 2692} {"train_loss": -6.258266448974609, "global_step": 113065, "epoch": 2692} {"train_loss": -6.42317008972168, "global_step": 113066, "epoch": 2692} {"train_loss": -6.473404884338379, "global_step": 113067, "epoch": 2692} {"train_loss": -6.500907897949219, "global_step": 113068, "epoch": 2692} {"train_loss": -6.516387939453125, "global_step": 113069, "epoch": 2692} {"train_loss": -6.531461715698242, "global_step": 113070, "epoch": 2692} {"train_loss": -6.542225360870361, "global_step": 113071, "epoch": 2692} {"train_loss": -6.673702716827393, "global_step": 113072, "epoch": 2692} {"train_loss": -6.518427848815918, "global_step": 113073, "epoch": 2692} {"train_loss": -6.5389862060546875, "global_step": 113074, "epoch": 2692} {"train_loss": -6.5806169509887695, "global_step": 113075, "epoch": 2692} {"train_loss": -6.571781158447266, "global_step": 113076, "epoch": 2692} {"train_loss": -6.49848747253418, "global_step": 113077, "epoch": 2692} {"train_loss": -6.434190273284912, "global_step": 113078, "epoch": 2692} {"train_loss": -6.5634989738464355, "global_step": 113079, "epoch": 2692} {"train_loss": -6.525937080383301, "global_step": 113080, "epoch": 2692} {"train_loss": -6.543297290802002, "global_step": 113081, "epoch": 2692} {"train_loss": -6.656553268432617, "global_step": 113082, "epoch": 2692} {"train_loss": -6.53639030456543, "global_step": 113083, "epoch": 2692} {"train_loss": -6.500985145568848, "global_step": 113084, "epoch": 2692} {"train_loss": -6.382452964782715, "global_step": 113085, "epoch": 2692} {"train_loss": -6.387690544128418, "global_step": 113086, "epoch": 2692} {"train_loss": -6.485790252685547, "global_step": 113087, "epoch": 2692} {"train_loss": -6.428252696990967, "global_step": 113088, "epoch": 2692} {"train_loss": -6.43228006362915, "global_step": 113089, "epoch": 2692} {"train_loss": -6.510159492492676, "global_step": 113090, "epoch": 2692} {"train_loss": -6.360500335693359, "global_step": 113091, "epoch": 2692} {"train_loss": -6.391702651977539, "global_step": 113092, "epoch": 2692} {"train_loss": -6.4766645431518555, "global_step": 113093, "epoch": 2692} {"train_loss": -6.406368255615234, "global_step": 113094, "epoch": 2692} {"train_loss": -6.525651454925537, "global_step": 113095, "epoch": 2692} {"train_loss": -6.443095684051514, "global_step": 113096, "epoch": 2692} {"train_loss": -6.452758312225342, "global_step": 113097, "epoch": 2692} {"train_loss": -6.361607551574707, "global_step": 113098, "epoch": 2692} {"train_loss": -6.4536261558532715, "global_step": 113099, "epoch": 2692} {"train_loss": -6.399017333984375, "global_step": 113100, "epoch": 2692} {"train_loss": -6.46999454498291, "global_step": 113101, "epoch": 2692} {"train_loss": -6.413852691650391, "global_step": 113102, "epoch": 2692} {"train_loss": -6.415012359619141, "global_step": 113103, "epoch": 2692} {"train_loss": -6.427361011505127, "global_step": 113104, "epoch": 2692} {"train_loss": -6.475057976586478, "global_step": 113105, "epoch": 2692, "val_loss": 68030.7109375} {"train_loss": -6.45150089263916, "global_step": 113106, "epoch": 2693} {"train_loss": -6.3530097007751465, "global_step": 113107, "epoch": 2693} {"train_loss": -6.515726566314697, "global_step": 113108, "epoch": 2693} {"train_loss": -6.439487457275391, "global_step": 113109, "epoch": 2693} {"train_loss": -6.373365879058838, "global_step": 113110, "epoch": 2693} {"train_loss": -6.4734039306640625, "global_step": 113111, "epoch": 2693} {"train_loss": -6.195713043212891, "global_step": 113112, "epoch": 2693} {"train_loss": -6.3246026039123535, "global_step": 113113, "epoch": 2693} {"train_loss": -6.381669044494629, "global_step": 113114, "epoch": 2693} {"train_loss": -6.479292869567871, "global_step": 113115, "epoch": 2693} {"train_loss": -6.5550665855407715, "global_step": 113116, "epoch": 2693} {"train_loss": -6.409124374389648, "global_step": 113117, "epoch": 2693} {"train_loss": -6.4153852462768555, "global_step": 113118, "epoch": 2693} {"train_loss": -6.47500467300415, "global_step": 113119, "epoch": 2693} {"train_loss": -6.451326370239258, "global_step": 113120, "epoch": 2693} {"train_loss": -6.4193267822265625, "global_step": 113121, "epoch": 2693} {"train_loss": -6.445005893707275, "global_step": 113122, "epoch": 2693} {"train_loss": -6.448626518249512, "global_step": 113123, "epoch": 2693} {"train_loss": -6.435894012451172, "global_step": 113124, "epoch": 2693} {"train_loss": -6.494115352630615, "global_step": 113125, "epoch": 2693} {"train_loss": -6.48361349105835, "global_step": 113126, "epoch": 2693} {"train_loss": -6.476071357727051, "global_step": 113127, "epoch": 2693} {"train_loss": -6.499019622802734, "global_step": 113128, "epoch": 2693} {"train_loss": -6.517579078674316, "global_step": 113129, "epoch": 2693} {"train_loss": -6.38143253326416, "global_step": 113130, "epoch": 2693} {"train_loss": -6.368208885192871, "global_step": 113131, "epoch": 2693} {"train_loss": -6.424712181091309, "global_step": 113132, "epoch": 2693} {"train_loss": -6.5088396072387695, "global_step": 113133, "epoch": 2693} {"train_loss": -6.493220329284668, "global_step": 113134, "epoch": 2693} {"train_loss": -6.459719657897949, "global_step": 113135, "epoch": 2693} {"train_loss": -6.385028839111328, "global_step": 113136, "epoch": 2693} {"train_loss": -6.570281982421875, "global_step": 113137, "epoch": 2693} {"train_loss": -6.611255645751953, "global_step": 113138, "epoch": 2693} {"train_loss": -6.517940521240234, "global_step": 113139, "epoch": 2693} {"train_loss": -6.459546089172363, "global_step": 113140, "epoch": 2693} {"train_loss": -6.616061210632324, "global_step": 113141, "epoch": 2693} {"train_loss": -6.4348649978637695, "global_step": 113142, "epoch": 2693} {"train_loss": -6.418065071105957, "global_step": 113143, "epoch": 2693} {"train_loss": -6.548525333404541, "global_step": 113144, "epoch": 2693} {"train_loss": -6.475653648376465, "global_step": 113145, "epoch": 2693} {"train_loss": -6.440064430236816, "global_step": 113146, "epoch": 2693} {"train_loss": -6.454181852794829, "global_step": 113147, "epoch": 2693, "val_loss": 67908.7578125} {"train_loss": -6.482863426208496, "global_step": 113148, "epoch": 2694} {"train_loss": -6.379215240478516, "global_step": 113149, "epoch": 2694} {"train_loss": -6.44744873046875, "global_step": 113150, "epoch": 2694} {"train_loss": -6.483436584472656, "global_step": 113151, "epoch": 2694} {"train_loss": -6.500039100646973, "global_step": 113152, "epoch": 2694} {"train_loss": -6.3707380294799805, "global_step": 113153, "epoch": 2694} {"train_loss": -6.53859806060791, "global_step": 113154, "epoch": 2694} {"train_loss": -6.470433712005615, "global_step": 113155, "epoch": 2694} {"train_loss": -6.441718101501465, "global_step": 113156, "epoch": 2694} {"train_loss": -6.405731201171875, "global_step": 113157, "epoch": 2694} {"train_loss": -6.366817474365234, "global_step": 113158, "epoch": 2694} {"train_loss": -6.454838275909424, "global_step": 113159, "epoch": 2694} {"train_loss": -6.544888496398926, "global_step": 113160, "epoch": 2694} {"train_loss": -6.424776077270508, "global_step": 113161, "epoch": 2694} {"train_loss": -6.493719100952148, "global_step": 113162, "epoch": 2694} {"train_loss": -6.4173455238342285, "global_step": 113163, "epoch": 2694} {"train_loss": -6.458017826080322, "global_step": 113164, "epoch": 2694} {"train_loss": -6.528895378112793, "global_step": 113165, "epoch": 2694} {"train_loss": -6.498467922210693, "global_step": 113166, "epoch": 2694} {"train_loss": -6.4195051193237305, "global_step": 113167, "epoch": 2694} {"train_loss": -6.469838619232178, "global_step": 113168, "epoch": 2694} {"train_loss": -6.456933975219727, "global_step": 113169, "epoch": 2694} {"train_loss": -6.40940523147583, "global_step": 113170, "epoch": 2694} {"train_loss": -6.404375076293945, "global_step": 113171, "epoch": 2694} {"train_loss": -6.429021835327148, "global_step": 113172, "epoch": 2694} {"train_loss": -6.422491073608398, "global_step": 113173, "epoch": 2694} {"train_loss": -6.445588111877441, "global_step": 113174, "epoch": 2694} {"train_loss": -6.5049357414245605, "global_step": 113175, "epoch": 2694} {"train_loss": -6.58560037612915, "global_step": 113176, "epoch": 2694} {"train_loss": -6.492012023925781, "global_step": 113177, "epoch": 2694} {"train_loss": -6.529669284820557, "global_step": 113178, "epoch": 2694} {"train_loss": -6.467298984527588, "global_step": 113179, "epoch": 2694} {"train_loss": -6.356805801391602, "global_step": 113180, "epoch": 2694} {"train_loss": -6.44749641418457, "global_step": 113181, "epoch": 2694} {"train_loss": -6.551140785217285, "global_step": 113182, "epoch": 2694} {"train_loss": -6.340015888214111, "global_step": 113183, "epoch": 2694} {"train_loss": -6.465105056762695, "global_step": 113184, "epoch": 2694} {"train_loss": -6.496944427490234, "global_step": 113185, "epoch": 2694} {"train_loss": -6.370221138000488, "global_step": 113186, "epoch": 2694} {"train_loss": -6.470732688903809, "global_step": 113187, "epoch": 2694} {"train_loss": -6.457470417022705, "global_step": 113188, "epoch": 2694} {"train_loss": -6.458546377363659, "global_step": 113189, "epoch": 2694, "val_loss": 67840.6328125} {"train_loss": -6.485762596130371, "global_step": 113190, "epoch": 2695} {"train_loss": -6.503820419311523, "global_step": 113191, "epoch": 2695} {"train_loss": -6.454911708831787, "global_step": 113192, "epoch": 2695} {"train_loss": -6.385817527770996, "global_step": 113193, "epoch": 2695} {"train_loss": -6.417243957519531, "global_step": 113194, "epoch": 2695} {"train_loss": -6.4782209396362305, "global_step": 113195, "epoch": 2695} {"train_loss": -6.436766624450684, "global_step": 113196, "epoch": 2695} {"train_loss": -6.451132774353027, "global_step": 113197, "epoch": 2695} {"train_loss": -6.374299049377441, "global_step": 113198, "epoch": 2695} {"train_loss": -6.442237854003906, "global_step": 113199, "epoch": 2695} {"train_loss": -6.4862189292907715, "global_step": 113200, "epoch": 2695} {"train_loss": -6.3954362869262695, "global_step": 113201, "epoch": 2695} {"train_loss": -6.481361389160156, "global_step": 113202, "epoch": 2695} {"train_loss": -6.445511817932129, "global_step": 113203, "epoch": 2695} {"train_loss": -6.476626396179199, "global_step": 113204, "epoch": 2695} {"train_loss": -6.493956089019775, "global_step": 113205, "epoch": 2695} {"train_loss": -6.492539405822754, "global_step": 113206, "epoch": 2695} {"train_loss": -6.527339935302734, "global_step": 113207, "epoch": 2695} {"train_loss": -6.451476573944092, "global_step": 113208, "epoch": 2695} {"train_loss": -6.4248456954956055, "global_step": 113209, "epoch": 2695} {"train_loss": -6.422289848327637, "global_step": 113210, "epoch": 2695} {"train_loss": -6.488901138305664, "global_step": 113211, "epoch": 2695} {"train_loss": -6.495932579040527, "global_step": 113212, "epoch": 2695} {"train_loss": -6.4470062255859375, "global_step": 113213, "epoch": 2695} {"train_loss": -6.42165470123291, "global_step": 113214, "epoch": 2695} {"train_loss": -6.577362537384033, "global_step": 113215, "epoch": 2695} {"train_loss": -6.534045696258545, "global_step": 113216, "epoch": 2695} {"train_loss": -6.490095138549805, "global_step": 113217, "epoch": 2695} {"train_loss": -6.472034931182861, "global_step": 113218, "epoch": 2695} {"train_loss": -6.485875129699707, "global_step": 113219, "epoch": 2695} {"train_loss": -6.460219383239746, "global_step": 113220, "epoch": 2695} {"train_loss": -6.5209269523620605, "global_step": 113221, "epoch": 2695} {"train_loss": -6.4251837730407715, "global_step": 113222, "epoch": 2695} {"train_loss": -6.439141273498535, "global_step": 113223, "epoch": 2695} {"train_loss": -6.533606052398682, "global_step": 113224, "epoch": 2695} {"train_loss": -6.44647741317749, "global_step": 113225, "epoch": 2695} {"train_loss": -6.370160102844238, "global_step": 113226, "epoch": 2695} {"train_loss": -6.434696197509766, "global_step": 113227, "epoch": 2695} {"train_loss": -6.546643257141113, "global_step": 113228, "epoch": 2695} {"train_loss": -6.492116928100586, "global_step": 113229, "epoch": 2695} {"train_loss": -6.497745513916016, "global_step": 113230, "epoch": 2695} {"train_loss": -6.467946245556786, "global_step": 113231, "epoch": 2695, "val_loss": 67786.84375} {"train_loss": -6.456864833831787, "global_step": 113232, "epoch": 2696} {"train_loss": -6.505626678466797, "global_step": 113233, "epoch": 2696} {"train_loss": -6.45676326751709, "global_step": 113234, "epoch": 2696} {"train_loss": -6.48403263092041, "global_step": 113235, "epoch": 2696} {"train_loss": -6.4339799880981445, "global_step": 113236, "epoch": 2696} {"train_loss": -6.449216365814209, "global_step": 113237, "epoch": 2696} {"train_loss": -6.305404186248779, "global_step": 113238, "epoch": 2696} {"train_loss": -6.4808149337768555, "global_step": 113239, "epoch": 2696} {"train_loss": -6.320481777191162, "global_step": 113240, "epoch": 2696} {"train_loss": -6.407074451446533, "global_step": 113241, "epoch": 2696} {"train_loss": -6.475212574005127, "global_step": 113242, "epoch": 2696} {"train_loss": -6.425049781799316, "global_step": 113243, "epoch": 2696} {"train_loss": -6.279346942901611, "global_step": 113244, "epoch": 2696} {"train_loss": -6.4405670166015625, "global_step": 113245, "epoch": 2696} {"train_loss": -6.460072994232178, "global_step": 113246, "epoch": 2696} {"train_loss": -6.4174017906188965, "global_step": 113247, "epoch": 2696} {"train_loss": -6.435494422912598, "global_step": 113248, "epoch": 2696} {"train_loss": -6.541152000427246, "global_step": 113249, "epoch": 2696} {"train_loss": -6.5427470207214355, "global_step": 113250, "epoch": 2696} {"train_loss": -6.350378513336182, "global_step": 113251, "epoch": 2696} {"train_loss": -6.510951042175293, "global_step": 113252, "epoch": 2696} {"train_loss": -6.450838088989258, "global_step": 113253, "epoch": 2696} {"train_loss": -6.406549453735352, "global_step": 113254, "epoch": 2696} {"train_loss": -6.3992133140563965, "global_step": 113255, "epoch": 2696} {"train_loss": -6.2444658279418945, "global_step": 113256, "epoch": 2696} {"train_loss": -6.418094635009766, "global_step": 113257, "epoch": 2696} {"train_loss": -6.5531768798828125, "global_step": 113258, "epoch": 2696} {"train_loss": -6.356451034545898, "global_step": 113259, "epoch": 2696} {"train_loss": -6.337528228759766, "global_step": 113260, "epoch": 2696} {"train_loss": -6.424566745758057, "global_step": 113261, "epoch": 2696} {"train_loss": -6.3785576820373535, "global_step": 113262, "epoch": 2696} {"train_loss": -6.31043815612793, "global_step": 113263, "epoch": 2696} {"train_loss": -6.27480936050415, "global_step": 113264, "epoch": 2696} {"train_loss": -6.447098731994629, "global_step": 113265, "epoch": 2696} {"train_loss": -6.420985221862793, "global_step": 113266, "epoch": 2696} {"train_loss": -6.529534339904785, "global_step": 113267, "epoch": 2696} {"train_loss": -6.445881366729736, "global_step": 113268, "epoch": 2696} {"train_loss": -6.490485668182373, "global_step": 113269, "epoch": 2696} {"train_loss": -6.446168422698975, "global_step": 113270, "epoch": 2696} {"train_loss": -6.4333391189575195, "global_step": 113271, "epoch": 2696} {"train_loss": -6.385933876037598, "global_step": 113272, "epoch": 2696} {"train_loss": -6.426184415817261, "global_step": 113273, "epoch": 2696, "val_loss": 67981.1875} {"train_loss": -6.474082946777344, "global_step": 113274, "epoch": 2697} {"train_loss": -6.451389312744141, "global_step": 113275, "epoch": 2697} {"train_loss": -6.311841011047363, "global_step": 113276, "epoch": 2697} {"train_loss": -6.54307746887207, "global_step": 113277, "epoch": 2697} {"train_loss": -6.496445655822754, "global_step": 113278, "epoch": 2697} {"train_loss": -6.458827972412109, "global_step": 113279, "epoch": 2697} {"train_loss": -6.465744972229004, "global_step": 113280, "epoch": 2697} {"train_loss": -6.438270568847656, "global_step": 113281, "epoch": 2697} {"train_loss": -6.35916805267334, "global_step": 113282, "epoch": 2697} {"train_loss": -6.473832607269287, "global_step": 113283, "epoch": 2697} {"train_loss": -6.533638000488281, "global_step": 113284, "epoch": 2697} {"train_loss": -6.470595359802246, "global_step": 113285, "epoch": 2697} {"train_loss": -6.480927467346191, "global_step": 113286, "epoch": 2697} {"train_loss": -6.4924211502075195, "global_step": 113287, "epoch": 2697} {"train_loss": -6.469045639038086, "global_step": 113288, "epoch": 2697} {"train_loss": -6.544003486633301, "global_step": 113289, "epoch": 2697} {"train_loss": -6.534702301025391, "global_step": 113290, "epoch": 2697} {"train_loss": -6.419985771179199, "global_step": 113291, "epoch": 2697} {"train_loss": -6.398930549621582, "global_step": 113292, "epoch": 2697} {"train_loss": -6.519903182983398, "global_step": 113293, "epoch": 2697} {"train_loss": -6.406993389129639, "global_step": 113294, "epoch": 2697} {"train_loss": -6.388825416564941, "global_step": 113295, "epoch": 2697} {"train_loss": -6.3722639083862305, "global_step": 113296, "epoch": 2697} {"train_loss": -6.584811687469482, "global_step": 113297, "epoch": 2697} {"train_loss": -6.475379943847656, "global_step": 113298, "epoch": 2697} {"train_loss": -6.505221366882324, "global_step": 113299, "epoch": 2697} {"train_loss": -6.484710693359375, "global_step": 113300, "epoch": 2697} {"train_loss": -6.460868835449219, "global_step": 113301, "epoch": 2697} {"train_loss": -6.531237602233887, "global_step": 113302, "epoch": 2697} {"train_loss": -6.541983604431152, "global_step": 113303, "epoch": 2697} {"train_loss": -6.479378700256348, "global_step": 113304, "epoch": 2697} {"train_loss": -6.4692535400390625, "global_step": 113305, "epoch": 2697} {"train_loss": -6.433834552764893, "global_step": 113306, "epoch": 2697} {"train_loss": -6.5028910636901855, "global_step": 113307, "epoch": 2697} {"train_loss": -6.5540924072265625, "global_step": 113308, "epoch": 2697} {"train_loss": -6.462381362915039, "global_step": 113309, "epoch": 2697} {"train_loss": -6.5354132652282715, "global_step": 113310, "epoch": 2697} {"train_loss": -6.525886535644531, "global_step": 113311, "epoch": 2697} {"train_loss": -6.5244460105896, "global_step": 113312, "epoch": 2697} {"train_loss": -6.424671173095703, "global_step": 113313, "epoch": 2697} {"train_loss": -6.4789838790893555, "global_step": 113314, "epoch": 2697} {"train_loss": -6.475982552482968, "global_step": 113315, "epoch": 2697, "val_loss": 67860.4609375} {"train_loss": -6.506324291229248, "global_step": 113316, "epoch": 2698} {"train_loss": -6.523210048675537, "global_step": 113317, "epoch": 2698} {"train_loss": -6.444598197937012, "global_step": 113318, "epoch": 2698} {"train_loss": -6.574139595031738, "global_step": 113319, "epoch": 2698} {"train_loss": -6.33027982711792, "global_step": 113320, "epoch": 2698} {"train_loss": -6.326223373413086, "global_step": 113321, "epoch": 2698} {"train_loss": -6.553793907165527, "global_step": 113322, "epoch": 2698} {"train_loss": -6.374737739562988, "global_step": 113323, "epoch": 2698} {"train_loss": -6.454991340637207, "global_step": 113324, "epoch": 2698} {"train_loss": -6.460927963256836, "global_step": 113325, "epoch": 2698} {"train_loss": -6.357353687286377, "global_step": 113326, "epoch": 2698} {"train_loss": -6.412317752838135, "global_step": 113327, "epoch": 2698} {"train_loss": -6.3652544021606445, "global_step": 113328, "epoch": 2698} {"train_loss": -6.371452331542969, "global_step": 113329, "epoch": 2698} {"train_loss": -6.473631858825684, "global_step": 113330, "epoch": 2698} {"train_loss": -6.478477478027344, "global_step": 113331, "epoch": 2698} {"train_loss": -6.406210422515869, "global_step": 113332, "epoch": 2698} {"train_loss": -6.3596696853637695, "global_step": 113333, "epoch": 2698} {"train_loss": -6.375990867614746, "global_step": 113334, "epoch": 2698} {"train_loss": -6.311073303222656, "global_step": 113335, "epoch": 2698} {"train_loss": -6.444911479949951, "global_step": 113336, "epoch": 2698} {"train_loss": -6.404261589050293, "global_step": 113337, "epoch": 2698} {"train_loss": -6.39663553237915, "global_step": 113338, "epoch": 2698} {"train_loss": -6.3706464767456055, "global_step": 113339, "epoch": 2698} {"train_loss": -6.393836498260498, "global_step": 113340, "epoch": 2698} {"train_loss": -6.4473161697387695, "global_step": 113341, "epoch": 2698} {"train_loss": -6.563774108886719, "global_step": 113342, "epoch": 2698} {"train_loss": -6.443500995635986, "global_step": 113343, "epoch": 2698} {"train_loss": -6.461600303649902, "global_step": 113344, "epoch": 2698} {"train_loss": -6.458509922027588, "global_step": 113345, "epoch": 2698} {"train_loss": -6.329240798950195, "global_step": 113346, "epoch": 2698} {"train_loss": -6.588909149169922, "global_step": 113347, "epoch": 2698} {"train_loss": -6.421133995056152, "global_step": 113348, "epoch": 2698} {"train_loss": -6.4018754959106445, "global_step": 113349, "epoch": 2698} {"train_loss": -6.501930236816406, "global_step": 113350, "epoch": 2698} {"train_loss": -6.264063835144043, "global_step": 113351, "epoch": 2698} {"train_loss": -6.454872131347656, "global_step": 113352, "epoch": 2698} {"train_loss": -6.32969331741333, "global_step": 113353, "epoch": 2698} {"train_loss": -6.385512351989746, "global_step": 113354, "epoch": 2698} {"train_loss": -6.3842668533325195, "global_step": 113355, "epoch": 2698} {"train_loss": -6.3876800537109375, "global_step": 113356, "epoch": 2698} {"train_loss": -6.423072292691185, "global_step": 113357, "epoch": 2698, "val_loss": 68014.6484375} {"train_loss": -6.356486797332764, "global_step": 113358, "epoch": 2699} {"train_loss": -6.399126052856445, "global_step": 113359, "epoch": 2699} {"train_loss": -6.53476619720459, "global_step": 113360, "epoch": 2699} {"train_loss": -6.437959671020508, "global_step": 113361, "epoch": 2699} {"train_loss": -6.528422832489014, "global_step": 113362, "epoch": 2699} {"train_loss": -6.340154647827148, "global_step": 113363, "epoch": 2699} {"train_loss": -6.491264820098877, "global_step": 113364, "epoch": 2699} {"train_loss": -6.463028430938721, "global_step": 113365, "epoch": 2699} {"train_loss": -6.541015625, "global_step": 113366, "epoch": 2699} {"train_loss": -6.540065765380859, "global_step": 113367, "epoch": 2699} {"train_loss": -6.3072285652160645, "global_step": 113368, "epoch": 2699} {"train_loss": -6.485298156738281, "global_step": 113369, "epoch": 2699} {"train_loss": -6.590811252593994, "global_step": 113370, "epoch": 2699} {"train_loss": -6.501436233520508, "global_step": 113371, "epoch": 2699} {"train_loss": -6.391729354858398, "global_step": 113372, "epoch": 2699} {"train_loss": -6.393342971801758, "global_step": 113373, "epoch": 2699} {"train_loss": -6.54432487487793, "global_step": 113374, "epoch": 2699} {"train_loss": -6.515053749084473, "global_step": 113375, "epoch": 2699} {"train_loss": -6.590919494628906, "global_step": 113376, "epoch": 2699} {"train_loss": -6.563027381896973, "global_step": 113377, "epoch": 2699} {"train_loss": -6.461664199829102, "global_step": 113378, "epoch": 2699} {"train_loss": -6.576122760772705, "global_step": 113379, "epoch": 2699} {"train_loss": -6.407577991485596, "global_step": 113380, "epoch": 2699} {"train_loss": -6.498257637023926, "global_step": 113381, "epoch": 2699} {"train_loss": -6.575477600097656, "global_step": 113382, "epoch": 2699} {"train_loss": -6.639333724975586, "global_step": 113383, "epoch": 2699} {"train_loss": -6.493409156799316, "global_step": 113384, "epoch": 2699} {"train_loss": -6.469151973724365, "global_step": 113385, "epoch": 2699} {"train_loss": -6.439243316650391, "global_step": 113386, "epoch": 2699} {"train_loss": -6.466898441314697, "global_step": 113387, "epoch": 2699} {"train_loss": -6.343557357788086, "global_step": 113388, "epoch": 2699} {"train_loss": -6.44075870513916, "global_step": 113389, "epoch": 2699} {"train_loss": -6.431244850158691, "global_step": 113390, "epoch": 2699} {"train_loss": -6.4267778396606445, "global_step": 113391, "epoch": 2699} {"train_loss": -6.357174873352051, "global_step": 113392, "epoch": 2699} {"train_loss": -6.423741340637207, "global_step": 113393, "epoch": 2699} {"train_loss": -6.610036373138428, "global_step": 113394, "epoch": 2699} {"train_loss": -6.443143844604492, "global_step": 113395, "epoch": 2699} {"train_loss": -6.393871307373047, "global_step": 113396, "epoch": 2699} {"train_loss": -6.465676307678223, "global_step": 113397, "epoch": 2699} {"train_loss": -6.356293201446533, "global_step": 113398, "epoch": 2699} {"train_loss": -6.47197056951977, "global_step": 113399, "epoch": 2699, "val_loss": 67979.640625} {"train_loss": -6.374547481536865, "global_step": 113400, "epoch": 2700} {"train_loss": -6.440690994262695, "global_step": 113401, "epoch": 2700} {"train_loss": -6.473064422607422, "global_step": 113402, "epoch": 2700} {"train_loss": -6.364043235778809, "global_step": 113403, "epoch": 2700} {"train_loss": -6.424093723297119, "global_step": 113404, "epoch": 2700} {"train_loss": -6.374630451202393, "global_step": 113405, "epoch": 2700} {"train_loss": -6.404420852661133, "global_step": 113406, "epoch": 2700} {"train_loss": -6.424318790435791, "global_step": 113407, "epoch": 2700} {"train_loss": -6.337855339050293, "global_step": 113408, "epoch": 2700} {"train_loss": -6.413870811462402, "global_step": 113409, "epoch": 2700} {"train_loss": -6.576032638549805, "global_step": 113410, "epoch": 2700} {"train_loss": -6.4293718338012695, "global_step": 113411, "epoch": 2700} {"train_loss": -6.2942657470703125, "global_step": 113412, "epoch": 2700} {"train_loss": -6.325300216674805, "global_step": 113413, "epoch": 2700} {"train_loss": -6.352254867553711, "global_step": 113414, "epoch": 2700} {"train_loss": -6.506711006164551, "global_step": 113415, "epoch": 2700} {"train_loss": -6.479928970336914, "global_step": 113416, "epoch": 2700} {"train_loss": -6.407567024230957, "global_step": 113417, "epoch": 2700} {"train_loss": -6.484694480895996, "global_step": 113418, "epoch": 2700} {"train_loss": -6.330275535583496, "global_step": 113419, "epoch": 2700} {"train_loss": -6.364398956298828, "global_step": 113420, "epoch": 2700} {"train_loss": -6.344168663024902, "global_step": 113421, "epoch": 2700} {"train_loss": -6.360340118408203, "global_step": 113422, "epoch": 2700} {"train_loss": -6.457111358642578, "global_step": 113423, "epoch": 2700} {"train_loss": -6.330432891845703, "global_step": 113424, "epoch": 2700} {"train_loss": -6.48356294631958, "global_step": 113425, "epoch": 2700} {"train_loss": -6.510855674743652, "global_step": 113426, "epoch": 2700} {"train_loss": -6.551548957824707, "global_step": 113427, "epoch": 2700} {"train_loss": -6.429220676422119, "global_step": 113428, "epoch": 2700} {"train_loss": -6.433520317077637, "global_step": 113429, "epoch": 2700} {"train_loss": -6.431347846984863, "global_step": 113430, "epoch": 2700} {"train_loss": -6.55533504486084, "global_step": 113431, "epoch": 2700} {"train_loss": -6.390594005584717, "global_step": 113432, "epoch": 2700} {"train_loss": -6.436685562133789, "global_step": 113433, "epoch": 2700} {"train_loss": -6.423197269439697, "global_step": 113434, "epoch": 2700} {"train_loss": -6.540701866149902, "global_step": 113435, "epoch": 2700} {"train_loss": -6.4286603927612305, "global_step": 113436, "epoch": 2700} {"train_loss": -6.438282012939453, "global_step": 113437, "epoch": 2700} {"train_loss": -6.546668529510498, "global_step": 113438, "epoch": 2700} {"train_loss": -6.369100093841553, "global_step": 113439, "epoch": 2700} {"train_loss": -6.549073696136475, "global_step": 113440, "epoch": 2700} {"train_loss": -6.430280674071539, "global_step": 113441, "epoch": 2700, "train/sim_max_reward_0": 0.2498803093115323, "train/sim_max_reward_1": 0.9205885616401033, "train/sim_max_reward_2": 0.3267810263222026, "train/sim_max_reward_3": 0.14099714779276942, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9398769276035428, "test/sim_max_reward_4400000": 0.22299258070848305, "test/sim_max_reward_4400001": 0.1526769931448519, "test/sim_max_reward_4400002": 0.47923169653271125, "test/sim_max_reward_4400003": 0.4589651062426158, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9992305518550538, "test/sim_max_reward_4400006": 0.975007568190813, "test/sim_max_reward_4400007": 0.8501627985958349, "test/sim_max_reward_4400008": 0.29871175419621404, "test/sim_max_reward_4400009": 0.9189783004305362, "test/sim_max_reward_4400010": 0.2549382546094043, "test/sim_max_reward_4400011": 0.9169216487101394, "test/sim_max_reward_4400012": 0.7312053393762425, "test/sim_max_reward_4400013": 0.3489884113534679, "test/sim_max_reward_4400014": 0.5608563697218977, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.07299363358165041, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23376813805340596, "test/sim_max_reward_4400019": 0.9914738163174348, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.7587847549268503, "test/sim_max_reward_4400023": 0.9550838903518798, "test/sim_max_reward_4400024": 0.8957606618494394, "test/sim_max_reward_4400025": 0.254528731058646, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.07317763298104343, "test/sim_max_reward_4400028": 0.4641556322745853, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9459913679338832, "test/sim_max_reward_4400031": 0.8636744561057453, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7163493793676722, "test/sim_max_reward_4400034": 0.8690315250974296, "test/sim_max_reward_4400035": 0.7712076151712535, "test/sim_max_reward_4400036": 0.36388820106341824, "test/sim_max_reward_4400037": 0.9368876290599101, "test/sim_max_reward_4400038": 0.9693102100511584, "test/sim_max_reward_4400039": 0.952538132730297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.4936433379245112, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9119593783546808, "test/sim_max_reward_4400044": 0.8571027771811215, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.8608919924457477, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.9670222807328119, "test/sim_max_reward_4400049": 0.8928318617105168, "train/mean_score": 0.5963539954450251, "test/mean_score": 0.5542872933194716, "val_loss": 67758.328125} {"train_loss": -6.4631242752075195, "global_step": 113442, "epoch": 2701} {"train_loss": -6.52470588684082, "global_step": 113443, "epoch": 2701} {"train_loss": -6.488006591796875, "global_step": 113444, "epoch": 2701} {"train_loss": -6.605013847351074, "global_step": 113445, "epoch": 2701} {"train_loss": -6.570914268493652, "global_step": 113446, "epoch": 2701} {"train_loss": -6.466917514801025, "global_step": 113447, "epoch": 2701} {"train_loss": -6.520444869995117, "global_step": 113448, "epoch": 2701} {"train_loss": -6.468301773071289, "global_step": 113449, "epoch": 2701} {"train_loss": -6.381518363952637, "global_step": 113450, "epoch": 2701} {"train_loss": -6.564060211181641, "global_step": 113451, "epoch": 2701} {"train_loss": -6.45838737487793, "global_step": 113452, "epoch": 2701} {"train_loss": -6.42600679397583, "global_step": 113453, "epoch": 2701} {"train_loss": -6.541879177093506, "global_step": 113454, "epoch": 2701} {"train_loss": -6.448026657104492, "global_step": 113455, "epoch": 2701} {"train_loss": -6.443963050842285, "global_step": 113456, "epoch": 2701} {"train_loss": -6.355396270751953, "global_step": 113457, "epoch": 2701} {"train_loss": -6.482149124145508, "global_step": 113458, "epoch": 2701} {"train_loss": -6.558149337768555, "global_step": 113459, "epoch": 2701} {"train_loss": -6.441632270812988, "global_step": 113460, "epoch": 2701} {"train_loss": -6.502716064453125, "global_step": 113461, "epoch": 2701} {"train_loss": -6.393770217895508, "global_step": 113462, "epoch": 2701} {"train_loss": -6.482447147369385, "global_step": 113463, "epoch": 2701} {"train_loss": -6.322293758392334, "global_step": 113464, "epoch": 2701} {"train_loss": -6.487273216247559, "global_step": 113465, "epoch": 2701} {"train_loss": -6.488981246948242, "global_step": 113466, "epoch": 2701} {"train_loss": -6.598261833190918, "global_step": 113467, "epoch": 2701} {"train_loss": -6.493561267852783, "global_step": 113468, "epoch": 2701} {"train_loss": -6.430361270904541, "global_step": 113469, "epoch": 2701} {"train_loss": -6.521894454956055, "global_step": 113470, "epoch": 2701} {"train_loss": -6.433514595031738, "global_step": 113471, "epoch": 2701} {"train_loss": -6.604304313659668, "global_step": 113472, "epoch": 2701} {"train_loss": -6.361875534057617, "global_step": 113473, "epoch": 2701} {"train_loss": -6.505178451538086, "global_step": 113474, "epoch": 2701} {"train_loss": -6.493348121643066, "global_step": 113475, "epoch": 2701} {"train_loss": -6.375085830688477, "global_step": 113476, "epoch": 2701} {"train_loss": -6.467832565307617, "global_step": 113477, "epoch": 2701} {"train_loss": -6.4114179611206055, "global_step": 113478, "epoch": 2701} {"train_loss": -6.371089458465576, "global_step": 113479, "epoch": 2701} {"train_loss": -6.513307571411133, "global_step": 113480, "epoch": 2701} {"train_loss": -6.4596967697143555, "global_step": 113481, "epoch": 2701} {"train_loss": -6.459573268890381, "global_step": 113482, "epoch": 2701} {"train_loss": -6.468996751876104, "global_step": 113483, "epoch": 2701, "val_loss": 68223.3203125} {"train_loss": -6.412137031555176, "global_step": 113484, "epoch": 2702} {"train_loss": -6.6139326095581055, "global_step": 113485, "epoch": 2702} {"train_loss": -6.4045610427856445, "global_step": 113486, "epoch": 2702} {"train_loss": -6.484263896942139, "global_step": 113487, "epoch": 2702} {"train_loss": -6.454173564910889, "global_step": 113488, "epoch": 2702} {"train_loss": -6.49799919128418, "global_step": 113489, "epoch": 2702} {"train_loss": -6.456837177276611, "global_step": 113490, "epoch": 2702} {"train_loss": -6.475222587585449, "global_step": 113491, "epoch": 2702} {"train_loss": -6.497104644775391, "global_step": 113492, "epoch": 2702} {"train_loss": -6.5080060958862305, "global_step": 113493, "epoch": 2702} {"train_loss": -6.4102463722229, "global_step": 113494, "epoch": 2702} {"train_loss": -6.487113952636719, "global_step": 113495, "epoch": 2702} {"train_loss": -6.450522422790527, "global_step": 113496, "epoch": 2702} {"train_loss": -6.5066022872924805, "global_step": 113497, "epoch": 2702} {"train_loss": -6.474998474121094, "global_step": 113498, "epoch": 2702} {"train_loss": -6.489570140838623, "global_step": 113499, "epoch": 2702} {"train_loss": -6.510270118713379, "global_step": 113500, "epoch": 2702} {"train_loss": -6.395327091217041, "global_step": 113501, "epoch": 2702} {"train_loss": -6.493901252746582, "global_step": 113502, "epoch": 2702} {"train_loss": -6.423187255859375, "global_step": 113503, "epoch": 2702} {"train_loss": -6.531611442565918, "global_step": 113504, "epoch": 2702} {"train_loss": -6.4220733642578125, "global_step": 113505, "epoch": 2702} {"train_loss": -6.518529415130615, "global_step": 113506, "epoch": 2702} {"train_loss": -6.454909324645996, "global_step": 113507, "epoch": 2702} {"train_loss": -6.456169128417969, "global_step": 113508, "epoch": 2702} {"train_loss": -6.529102802276611, "global_step": 113509, "epoch": 2702} {"train_loss": -6.51612663269043, "global_step": 113510, "epoch": 2702} {"train_loss": -6.460552215576172, "global_step": 113511, "epoch": 2702} {"train_loss": -6.56857967376709, "global_step": 113512, "epoch": 2702} {"train_loss": -6.4386796951293945, "global_step": 113513, "epoch": 2702} {"train_loss": -6.474579811096191, "global_step": 113514, "epoch": 2702} {"train_loss": -6.390788555145264, "global_step": 113515, "epoch": 2702} {"train_loss": -6.377462863922119, "global_step": 113516, "epoch": 2702} {"train_loss": -6.503933906555176, "global_step": 113517, "epoch": 2702} {"train_loss": -6.584151744842529, "global_step": 113518, "epoch": 2702} {"train_loss": -6.543882846832275, "global_step": 113519, "epoch": 2702} {"train_loss": -6.447724342346191, "global_step": 113520, "epoch": 2702} {"train_loss": -6.482246398925781, "global_step": 113521, "epoch": 2702} {"train_loss": -6.445711135864258, "global_step": 113522, "epoch": 2702} {"train_loss": -6.38731575012207, "global_step": 113523, "epoch": 2702} {"train_loss": -6.5744218826293945, "global_step": 113524, "epoch": 2702} {"train_loss": -6.475785857155209, "global_step": 113525, "epoch": 2702, "val_loss": 67796.4609375} {"train_loss": -6.439141273498535, "global_step": 113526, "epoch": 2703} {"train_loss": -6.4431986808776855, "global_step": 113527, "epoch": 2703} {"train_loss": -6.5444440841674805, "global_step": 113528, "epoch": 2703} {"train_loss": -6.617162704467773, "global_step": 113529, "epoch": 2703} {"train_loss": -6.440346717834473, "global_step": 113530, "epoch": 2703} {"train_loss": -6.3703789710998535, "global_step": 113531, "epoch": 2703} {"train_loss": -6.464008331298828, "global_step": 113532, "epoch": 2703} {"train_loss": -6.466580867767334, "global_step": 113533, "epoch": 2703} {"train_loss": -6.459385871887207, "global_step": 113534, "epoch": 2703} {"train_loss": -6.372433662414551, "global_step": 113535, "epoch": 2703} {"train_loss": -6.432354927062988, "global_step": 113536, "epoch": 2703} {"train_loss": -6.381723403930664, "global_step": 113537, "epoch": 2703} {"train_loss": -6.339583396911621, "global_step": 113538, "epoch": 2703} {"train_loss": -6.452439308166504, "global_step": 113539, "epoch": 2703} {"train_loss": -6.491702079772949, "global_step": 113540, "epoch": 2703} {"train_loss": -6.4635210037231445, "global_step": 113541, "epoch": 2703} {"train_loss": -6.535387992858887, "global_step": 113542, "epoch": 2703} {"train_loss": -6.4771904945373535, "global_step": 113543, "epoch": 2703} {"train_loss": -6.550519943237305, "global_step": 113544, "epoch": 2703} {"train_loss": -6.469705104827881, "global_step": 113545, "epoch": 2703} {"train_loss": -6.404454231262207, "global_step": 113546, "epoch": 2703} {"train_loss": -6.396373748779297, "global_step": 113547, "epoch": 2703} {"train_loss": -6.570524215698242, "global_step": 113548, "epoch": 2703} {"train_loss": -6.469028472900391, "global_step": 113549, "epoch": 2703} {"train_loss": -6.456113815307617, "global_step": 113550, "epoch": 2703} {"train_loss": -6.430520057678223, "global_step": 113551, "epoch": 2703} {"train_loss": -6.482940196990967, "global_step": 113552, "epoch": 2703} {"train_loss": -6.517841815948486, "global_step": 113553, "epoch": 2703} {"train_loss": -6.581448554992676, "global_step": 113554, "epoch": 2703} {"train_loss": -6.43350887298584, "global_step": 113555, "epoch": 2703} {"train_loss": -6.470850944519043, "global_step": 113556, "epoch": 2703} {"train_loss": -6.468152046203613, "global_step": 113557, "epoch": 2703} {"train_loss": -6.4491119384765625, "global_step": 113558, "epoch": 2703} {"train_loss": -6.416931629180908, "global_step": 113559, "epoch": 2703} {"train_loss": -6.592772006988525, "global_step": 113560, "epoch": 2703} {"train_loss": -6.435464382171631, "global_step": 113561, "epoch": 2703} {"train_loss": -6.451625823974609, "global_step": 113562, "epoch": 2703} {"train_loss": -6.351462364196777, "global_step": 113563, "epoch": 2703} {"train_loss": -6.508259296417236, "global_step": 113564, "epoch": 2703} {"train_loss": -6.455832481384277, "global_step": 113565, "epoch": 2703} {"train_loss": -6.349932670593262, "global_step": 113566, "epoch": 2703} {"train_loss": -6.462516137531826, "global_step": 113567, "epoch": 2703, "val_loss": 67996.0625} {"train_loss": -6.541731834411621, "global_step": 113568, "epoch": 2704} {"train_loss": -6.401599884033203, "global_step": 113569, "epoch": 2704} {"train_loss": -6.366913318634033, "global_step": 113570, "epoch": 2704} {"train_loss": -6.44990873336792, "global_step": 113571, "epoch": 2704} {"train_loss": -6.448616981506348, "global_step": 113572, "epoch": 2704} {"train_loss": -6.332193374633789, "global_step": 113573, "epoch": 2704} {"train_loss": -6.4614739418029785, "global_step": 113574, "epoch": 2704} {"train_loss": -6.404512405395508, "global_step": 113575, "epoch": 2704} {"train_loss": -6.343650817871094, "global_step": 113576, "epoch": 2704} {"train_loss": -6.4380950927734375, "global_step": 113577, "epoch": 2704} {"train_loss": -6.5042877197265625, "global_step": 113578, "epoch": 2704} {"train_loss": -6.535504341125488, "global_step": 113579, "epoch": 2704} {"train_loss": -6.480973243713379, "global_step": 113580, "epoch": 2704} {"train_loss": -6.478114604949951, "global_step": 113581, "epoch": 2704} {"train_loss": -6.3421759605407715, "global_step": 113582, "epoch": 2704} {"train_loss": -6.49186897277832, "global_step": 113583, "epoch": 2704} {"train_loss": -6.524232864379883, "global_step": 113584, "epoch": 2704} {"train_loss": -6.478786468505859, "global_step": 113585, "epoch": 2704} {"train_loss": -6.545950889587402, "global_step": 113586, "epoch": 2704} {"train_loss": -6.52523136138916, "global_step": 113587, "epoch": 2704} {"train_loss": -6.344198226928711, "global_step": 113588, "epoch": 2704} {"train_loss": -6.4264373779296875, "global_step": 113589, "epoch": 2704} {"train_loss": -6.474368095397949, "global_step": 113590, "epoch": 2704} {"train_loss": -6.560459136962891, "global_step": 113591, "epoch": 2704} {"train_loss": -6.5078020095825195, "global_step": 113592, "epoch": 2704} {"train_loss": -6.450658798217773, "global_step": 113593, "epoch": 2704} {"train_loss": -6.445684909820557, "global_step": 113594, "epoch": 2704} {"train_loss": -6.591465950012207, "global_step": 113595, "epoch": 2704} {"train_loss": -6.417389869689941, "global_step": 113596, "epoch": 2704} {"train_loss": -6.445658206939697, "global_step": 113597, "epoch": 2704} {"train_loss": -6.519717693328857, "global_step": 113598, "epoch": 2704} {"train_loss": -6.51444149017334, "global_step": 113599, "epoch": 2704} {"train_loss": -6.447343826293945, "global_step": 113600, "epoch": 2704} {"train_loss": -6.544679641723633, "global_step": 113601, "epoch": 2704} {"train_loss": -6.513159275054932, "global_step": 113602, "epoch": 2704} {"train_loss": -6.453453063964844, "global_step": 113603, "epoch": 2704} {"train_loss": -6.458831787109375, "global_step": 113604, "epoch": 2704} {"train_loss": -6.514225006103516, "global_step": 113605, "epoch": 2704} {"train_loss": -6.412986755371094, "global_step": 113606, "epoch": 2704} {"train_loss": -6.483434200286865, "global_step": 113607, "epoch": 2704} {"train_loss": -6.514422416687012, "global_step": 113608, "epoch": 2704} {"train_loss": -6.4674842811766124, "global_step": 113609, "epoch": 2704, "val_loss": 67767.859375} {"train_loss": -6.442404747009277, "global_step": 113610, "epoch": 2705} {"train_loss": -6.498818397521973, "global_step": 113611, "epoch": 2705} {"train_loss": -6.510969161987305, "global_step": 113612, "epoch": 2705} {"train_loss": -6.513725280761719, "global_step": 113613, "epoch": 2705} {"train_loss": -6.541903495788574, "global_step": 113614, "epoch": 2705} {"train_loss": -6.459669589996338, "global_step": 113615, "epoch": 2705} {"train_loss": -6.518425941467285, "global_step": 113616, "epoch": 2705} {"train_loss": -6.431929588317871, "global_step": 113617, "epoch": 2705} {"train_loss": -6.417307376861572, "global_step": 113618, "epoch": 2705} {"train_loss": -6.456708908081055, "global_step": 113619, "epoch": 2705} {"train_loss": -6.380411148071289, "global_step": 113620, "epoch": 2705} {"train_loss": -6.416664123535156, "global_step": 113621, "epoch": 2705} {"train_loss": -6.567231178283691, "global_step": 113622, "epoch": 2705} {"train_loss": -6.458518981933594, "global_step": 113623, "epoch": 2705} {"train_loss": -6.46107292175293, "global_step": 113624, "epoch": 2705} {"train_loss": -6.426562309265137, "global_step": 113625, "epoch": 2705} {"train_loss": -6.409150123596191, "global_step": 113626, "epoch": 2705} {"train_loss": -6.530121803283691, "global_step": 113627, "epoch": 2705} {"train_loss": -6.406735420227051, "global_step": 113628, "epoch": 2705} {"train_loss": -6.438190460205078, "global_step": 113629, "epoch": 2705} {"train_loss": -6.482845783233643, "global_step": 113630, "epoch": 2705} {"train_loss": -6.388427734375, "global_step": 113631, "epoch": 2705} {"train_loss": -6.416632652282715, "global_step": 113632, "epoch": 2705} {"train_loss": -6.436572074890137, "global_step": 113633, "epoch": 2705} {"train_loss": -6.444715976715088, "global_step": 113634, "epoch": 2705} {"train_loss": -6.618611812591553, "global_step": 113635, "epoch": 2705} {"train_loss": -6.350550651550293, "global_step": 113636, "epoch": 2705} {"train_loss": -6.50164794921875, "global_step": 113637, "epoch": 2705} {"train_loss": -6.538033485412598, "global_step": 113638, "epoch": 2705} {"train_loss": -6.538480281829834, "global_step": 113639, "epoch": 2705} {"train_loss": -6.545173645019531, "global_step": 113640, "epoch": 2705} {"train_loss": -6.556666851043701, "global_step": 113641, "epoch": 2705} {"train_loss": -6.533166885375977, "global_step": 113642, "epoch": 2705} {"train_loss": -6.3413543701171875, "global_step": 113643, "epoch": 2705} {"train_loss": -6.433478832244873, "global_step": 113644, "epoch": 2705} {"train_loss": -6.415509223937988, "global_step": 113645, "epoch": 2705} {"train_loss": -6.542596817016602, "global_step": 113646, "epoch": 2705} {"train_loss": -6.526081562042236, "global_step": 113647, "epoch": 2705} {"train_loss": -6.515393257141113, "global_step": 113648, "epoch": 2705} {"train_loss": -6.52401876449585, "global_step": 113649, "epoch": 2705} {"train_loss": -6.5659589767456055, "global_step": 113650, "epoch": 2705} {"train_loss": -6.4752001875922796, "global_step": 113651, "epoch": 2705, "val_loss": 67901.4453125} {"train_loss": -6.473824501037598, "global_step": 113652, "epoch": 2706} {"train_loss": -6.481616020202637, "global_step": 113653, "epoch": 2706} {"train_loss": -6.522479057312012, "global_step": 113654, "epoch": 2706} {"train_loss": -6.481647968292236, "global_step": 113655, "epoch": 2706} {"train_loss": -6.482012748718262, "global_step": 113656, "epoch": 2706} {"train_loss": -6.556612014770508, "global_step": 113657, "epoch": 2706} {"train_loss": -6.438089370727539, "global_step": 113658, "epoch": 2706} {"train_loss": -6.416912078857422, "global_step": 113659, "epoch": 2706} {"train_loss": -6.541771411895752, "global_step": 113660, "epoch": 2706} {"train_loss": -6.463003158569336, "global_step": 113661, "epoch": 2706} {"train_loss": -6.547612190246582, "global_step": 113662, "epoch": 2706} {"train_loss": -6.4696855545043945, "global_step": 113663, "epoch": 2706} {"train_loss": -6.477572917938232, "global_step": 113664, "epoch": 2706} {"train_loss": -6.534053802490234, "global_step": 113665, "epoch": 2706} {"train_loss": -6.535804748535156, "global_step": 113666, "epoch": 2706} {"train_loss": -6.533611297607422, "global_step": 113667, "epoch": 2706} {"train_loss": -6.3940205574035645, "global_step": 113668, "epoch": 2706} {"train_loss": -6.535362243652344, "global_step": 113669, "epoch": 2706} {"train_loss": -6.382142066955566, "global_step": 113670, "epoch": 2706} {"train_loss": -6.460839748382568, "global_step": 113671, "epoch": 2706} {"train_loss": -6.539433479309082, "global_step": 113672, "epoch": 2706} {"train_loss": -6.544776916503906, "global_step": 113673, "epoch": 2706} {"train_loss": -6.557123184204102, "global_step": 113674, "epoch": 2706} {"train_loss": -6.472607612609863, "global_step": 113675, "epoch": 2706} {"train_loss": -6.498317718505859, "global_step": 113676, "epoch": 2706} {"train_loss": -6.49824333190918, "global_step": 113677, "epoch": 2706} {"train_loss": -6.473180770874023, "global_step": 113678, "epoch": 2706} {"train_loss": -6.405228614807129, "global_step": 113679, "epoch": 2706} {"train_loss": -6.401337623596191, "global_step": 113680, "epoch": 2706} {"train_loss": -6.481729507446289, "global_step": 113681, "epoch": 2706} {"train_loss": -6.492175102233887, "global_step": 113682, "epoch": 2706} {"train_loss": -6.473359107971191, "global_step": 113683, "epoch": 2706} {"train_loss": -6.471096038818359, "global_step": 113684, "epoch": 2706} {"train_loss": -6.408259391784668, "global_step": 113685, "epoch": 2706} {"train_loss": -6.386290073394775, "global_step": 113686, "epoch": 2706} {"train_loss": -6.373884201049805, "global_step": 113687, "epoch": 2706} {"train_loss": -6.3345489501953125, "global_step": 113688, "epoch": 2706} {"train_loss": -6.507830619812012, "global_step": 113689, "epoch": 2706} {"train_loss": -6.438019275665283, "global_step": 113690, "epoch": 2706} {"train_loss": -6.404971122741699, "global_step": 113691, "epoch": 2706} {"train_loss": -6.4277849197387695, "global_step": 113692, "epoch": 2706} {"train_loss": -6.469274202982585, "global_step": 113693, "epoch": 2706, "val_loss": 67975.8125} {"train_loss": -6.431438446044922, "global_step": 113694, "epoch": 2707} {"train_loss": -6.40850830078125, "global_step": 113695, "epoch": 2707} {"train_loss": -6.420159816741943, "global_step": 113696, "epoch": 2707} {"train_loss": -6.517019271850586, "global_step": 113697, "epoch": 2707} {"train_loss": -6.383053779602051, "global_step": 113698, "epoch": 2707} {"train_loss": -6.377236366271973, "global_step": 113699, "epoch": 2707} {"train_loss": -6.436589241027832, "global_step": 113700, "epoch": 2707} {"train_loss": -6.458063125610352, "global_step": 113701, "epoch": 2707} {"train_loss": -6.576875686645508, "global_step": 113702, "epoch": 2707} {"train_loss": -6.442902565002441, "global_step": 113703, "epoch": 2707} {"train_loss": -6.589517593383789, "global_step": 113704, "epoch": 2707} {"train_loss": -6.507889747619629, "global_step": 113705, "epoch": 2707} {"train_loss": -6.5594987869262695, "global_step": 113706, "epoch": 2707} {"train_loss": -6.516729354858398, "global_step": 113707, "epoch": 2707} {"train_loss": -6.581666469573975, "global_step": 113708, "epoch": 2707} {"train_loss": -6.575765609741211, "global_step": 113709, "epoch": 2707} {"train_loss": -6.568669319152832, "global_step": 113710, "epoch": 2707} {"train_loss": -6.45952033996582, "global_step": 113711, "epoch": 2707} {"train_loss": -6.394731044769287, "global_step": 113712, "epoch": 2707} {"train_loss": -6.442983150482178, "global_step": 113713, "epoch": 2707} {"train_loss": -6.479615211486816, "global_step": 113714, "epoch": 2707} {"train_loss": -6.443498611450195, "global_step": 113715, "epoch": 2707} {"train_loss": -6.498497486114502, "global_step": 113716, "epoch": 2707} {"train_loss": -6.491270065307617, "global_step": 113717, "epoch": 2707} {"train_loss": -6.436107635498047, "global_step": 113718, "epoch": 2707} {"train_loss": -6.3343505859375, "global_step": 113719, "epoch": 2707} {"train_loss": -6.398555755615234, "global_step": 113720, "epoch": 2707} {"train_loss": -6.436445713043213, "global_step": 113721, "epoch": 2707} {"train_loss": -6.480322360992432, "global_step": 113722, "epoch": 2707} {"train_loss": -6.480767250061035, "global_step": 113723, "epoch": 2707} {"train_loss": -6.409771919250488, "global_step": 113724, "epoch": 2707} {"train_loss": -6.285284996032715, "global_step": 113725, "epoch": 2707} {"train_loss": -6.508750915527344, "global_step": 113726, "epoch": 2707} {"train_loss": -6.44489049911499, "global_step": 113727, "epoch": 2707} {"train_loss": -6.454305648803711, "global_step": 113728, "epoch": 2707} {"train_loss": -6.498804092407227, "global_step": 113729, "epoch": 2707} {"train_loss": -6.351016044616699, "global_step": 113730, "epoch": 2707} {"train_loss": -6.461321830749512, "global_step": 113731, "epoch": 2707} {"train_loss": -6.5414838790893555, "global_step": 113732, "epoch": 2707} {"train_loss": -6.474675178527832, "global_step": 113733, "epoch": 2707} {"train_loss": -6.394121170043945, "global_step": 113734, "epoch": 2707} {"train_loss": -6.460459879466465, "global_step": 113735, "epoch": 2707, "val_loss": 68017.40625} {"train_loss": -6.370535373687744, "global_step": 113736, "epoch": 2708} {"train_loss": -6.516580104827881, "global_step": 113737, "epoch": 2708} {"train_loss": -6.521112442016602, "global_step": 113738, "epoch": 2708} {"train_loss": -6.417192459106445, "global_step": 113739, "epoch": 2708} {"train_loss": -6.5218706130981445, "global_step": 113740, "epoch": 2708} {"train_loss": -6.497082710266113, "global_step": 113741, "epoch": 2708} {"train_loss": -6.51109504699707, "global_step": 113742, "epoch": 2708} {"train_loss": -6.402477741241455, "global_step": 113743, "epoch": 2708} {"train_loss": -6.515789985656738, "global_step": 113744, "epoch": 2708} {"train_loss": -6.498777389526367, "global_step": 113745, "epoch": 2708} {"train_loss": -6.409791469573975, "global_step": 113746, "epoch": 2708} {"train_loss": -6.532136917114258, "global_step": 113747, "epoch": 2708} {"train_loss": -6.525468349456787, "global_step": 113748, "epoch": 2708} {"train_loss": -6.450610637664795, "global_step": 113749, "epoch": 2708} {"train_loss": -6.415282249450684, "global_step": 113750, "epoch": 2708} {"train_loss": -6.447695732116699, "global_step": 113751, "epoch": 2708} {"train_loss": -6.453392028808594, "global_step": 113752, "epoch": 2708} {"train_loss": -6.586526870727539, "global_step": 113753, "epoch": 2708} {"train_loss": -6.467638969421387, "global_step": 113754, "epoch": 2708} {"train_loss": -6.484565734863281, "global_step": 113755, "epoch": 2708} {"train_loss": -6.402592658996582, "global_step": 113756, "epoch": 2708} {"train_loss": -6.4754815101623535, "global_step": 113757, "epoch": 2708} {"train_loss": -6.447940826416016, "global_step": 113758, "epoch": 2708} {"train_loss": -6.398221969604492, "global_step": 113759, "epoch": 2708} {"train_loss": -6.505695819854736, "global_step": 113760, "epoch": 2708} {"train_loss": -6.494231700897217, "global_step": 113761, "epoch": 2708} {"train_loss": -6.477199077606201, "global_step": 113762, "epoch": 2708} {"train_loss": -6.465206146240234, "global_step": 113763, "epoch": 2708} {"train_loss": -6.438227653503418, "global_step": 113764, "epoch": 2708} {"train_loss": -6.342912673950195, "global_step": 113765, "epoch": 2708} {"train_loss": -6.529163837432861, "global_step": 113766, "epoch": 2708} {"train_loss": -6.573843955993652, "global_step": 113767, "epoch": 2708} {"train_loss": -6.3852996826171875, "global_step": 113768, "epoch": 2708} {"train_loss": -6.4893951416015625, "global_step": 113769, "epoch": 2708} {"train_loss": -6.407336235046387, "global_step": 113770, "epoch": 2708} {"train_loss": -6.557418346405029, "global_step": 113771, "epoch": 2708} {"train_loss": -6.40914249420166, "global_step": 113772, "epoch": 2708} {"train_loss": -6.543787002563477, "global_step": 113773, "epoch": 2708} {"train_loss": -6.565854072570801, "global_step": 113774, "epoch": 2708} {"train_loss": -6.47340202331543, "global_step": 113775, "epoch": 2708} {"train_loss": -6.450623035430908, "global_step": 113776, "epoch": 2708} {"train_loss": -6.4728811014266245, "global_step": 113777, "epoch": 2708, "val_loss": 67985.390625} {"train_loss": -6.585132598876953, "global_step": 113778, "epoch": 2709} {"train_loss": -6.523403167724609, "global_step": 113779, "epoch": 2709} {"train_loss": -6.377422332763672, "global_step": 113780, "epoch": 2709} {"train_loss": -6.577668190002441, "global_step": 113781, "epoch": 2709} {"train_loss": -6.601052284240723, "global_step": 113782, "epoch": 2709} {"train_loss": -6.434453964233398, "global_step": 113783, "epoch": 2709} {"train_loss": -6.612934112548828, "global_step": 113784, "epoch": 2709} {"train_loss": -6.4713897705078125, "global_step": 113785, "epoch": 2709} {"train_loss": -6.5976786613464355, "global_step": 113786, "epoch": 2709} {"train_loss": -6.549005031585693, "global_step": 113787, "epoch": 2709} {"train_loss": -6.464739799499512, "global_step": 113788, "epoch": 2709} {"train_loss": -6.538346290588379, "global_step": 113789, "epoch": 2709} {"train_loss": -6.3276262283325195, "global_step": 113790, "epoch": 2709} {"train_loss": -6.499792575836182, "global_step": 113791, "epoch": 2709} {"train_loss": -6.409029960632324, "global_step": 113792, "epoch": 2709} {"train_loss": -6.332388877868652, "global_step": 113793, "epoch": 2709} {"train_loss": -6.425950050354004, "global_step": 113794, "epoch": 2709} {"train_loss": -6.403663635253906, "global_step": 113795, "epoch": 2709} {"train_loss": -6.290537357330322, "global_step": 113796, "epoch": 2709} {"train_loss": -6.360158920288086, "global_step": 113797, "epoch": 2709} {"train_loss": -6.438554763793945, "global_step": 113798, "epoch": 2709} {"train_loss": -6.351563930511475, "global_step": 113799, "epoch": 2709} {"train_loss": -6.440511703491211, "global_step": 113800, "epoch": 2709} {"train_loss": -6.36981725692749, "global_step": 113801, "epoch": 2709} {"train_loss": -6.291630744934082, "global_step": 113802, "epoch": 2709} {"train_loss": -6.48371696472168, "global_step": 113803, "epoch": 2709} {"train_loss": -6.323178291320801, "global_step": 113804, "epoch": 2709} {"train_loss": -6.358794212341309, "global_step": 113805, "epoch": 2709} {"train_loss": -6.38871955871582, "global_step": 113806, "epoch": 2709} {"train_loss": -6.359737396240234, "global_step": 113807, "epoch": 2709} {"train_loss": -6.443545818328857, "global_step": 113808, "epoch": 2709} {"train_loss": -6.355266571044922, "global_step": 113809, "epoch": 2709} {"train_loss": -6.452034950256348, "global_step": 113810, "epoch": 2709} {"train_loss": -6.426034927368164, "global_step": 113811, "epoch": 2709} {"train_loss": -6.45855712890625, "global_step": 113812, "epoch": 2709} {"train_loss": -6.466607093811035, "global_step": 113813, "epoch": 2709} {"train_loss": -6.379508972167969, "global_step": 113814, "epoch": 2709} {"train_loss": -6.427774429321289, "global_step": 113815, "epoch": 2709} {"train_loss": -6.386328220367432, "global_step": 113816, "epoch": 2709} {"train_loss": -6.309507369995117, "global_step": 113817, "epoch": 2709} {"train_loss": -6.49254846572876, "global_step": 113818, "epoch": 2709} {"train_loss": -6.434028477895827, "global_step": 113819, "epoch": 2709, "val_loss": 67804.015625} {"train_loss": -6.3841352462768555, "global_step": 113820, "epoch": 2710} {"train_loss": -6.484959602355957, "global_step": 113821, "epoch": 2710} {"train_loss": -6.539735794067383, "global_step": 113822, "epoch": 2710} {"train_loss": -6.402942657470703, "global_step": 113823, "epoch": 2710} {"train_loss": -6.515239715576172, "global_step": 113824, "epoch": 2710} {"train_loss": -6.5177154541015625, "global_step": 113825, "epoch": 2710} {"train_loss": -6.583380699157715, "global_step": 113826, "epoch": 2710} {"train_loss": -6.442380905151367, "global_step": 113827, "epoch": 2710} {"train_loss": -6.42775821685791, "global_step": 113828, "epoch": 2710} {"train_loss": -6.4741058349609375, "global_step": 113829, "epoch": 2710} {"train_loss": -6.244295120239258, "global_step": 113830, "epoch": 2710} {"train_loss": -6.506032943725586, "global_step": 113831, "epoch": 2710} {"train_loss": -6.515970230102539, "global_step": 113832, "epoch": 2710} {"train_loss": -6.3191070556640625, "global_step": 113833, "epoch": 2710} {"train_loss": -6.400327682495117, "global_step": 113834, "epoch": 2710} {"train_loss": -6.4026408195495605, "global_step": 113835, "epoch": 2710} {"train_loss": -6.4234466552734375, "global_step": 113836, "epoch": 2710} {"train_loss": -6.49191427230835, "global_step": 113837, "epoch": 2710} {"train_loss": -6.304011344909668, "global_step": 113838, "epoch": 2710} {"train_loss": -6.425760269165039, "global_step": 113839, "epoch": 2710} {"train_loss": -6.416102409362793, "global_step": 113840, "epoch": 2710} {"train_loss": -6.36357307434082, "global_step": 113841, "epoch": 2710} {"train_loss": -6.477378845214844, "global_step": 113842, "epoch": 2710} {"train_loss": -6.399202823638916, "global_step": 113843, "epoch": 2710} {"train_loss": -6.278033256530762, "global_step": 113844, "epoch": 2710} {"train_loss": -6.330820083618164, "global_step": 113845, "epoch": 2710} {"train_loss": -6.268475532531738, "global_step": 113846, "epoch": 2710} {"train_loss": -6.369002342224121, "global_step": 113847, "epoch": 2710} {"train_loss": -6.405016899108887, "global_step": 113848, "epoch": 2710} {"train_loss": -6.323896408081055, "global_step": 113849, "epoch": 2710} {"train_loss": -6.48795223236084, "global_step": 113850, "epoch": 2710} {"train_loss": -6.436131477355957, "global_step": 113851, "epoch": 2710} {"train_loss": -6.541594505310059, "global_step": 113852, "epoch": 2710} {"train_loss": -6.497574806213379, "global_step": 113853, "epoch": 2710} {"train_loss": -6.456280708312988, "global_step": 113854, "epoch": 2710} {"train_loss": -6.35974645614624, "global_step": 113855, "epoch": 2710} {"train_loss": -6.408120632171631, "global_step": 113856, "epoch": 2710} {"train_loss": -6.481776237487793, "global_step": 113857, "epoch": 2710} {"train_loss": -6.4722580909729, "global_step": 113858, "epoch": 2710} {"train_loss": -6.494067192077637, "global_step": 113859, "epoch": 2710} {"train_loss": -6.450289249420166, "global_step": 113860, "epoch": 2710} {"train_loss": -6.425251858575003, "global_step": 113861, "epoch": 2710, "val_loss": 67841.765625} {"train_loss": -6.5007219314575195, "global_step": 113862, "epoch": 2711} {"train_loss": -6.427360534667969, "global_step": 113863, "epoch": 2711} {"train_loss": -6.451452732086182, "global_step": 113864, "epoch": 2711} {"train_loss": -6.5658769607543945, "global_step": 113865, "epoch": 2711} {"train_loss": -6.448522090911865, "global_step": 113866, "epoch": 2711} {"train_loss": -6.448925971984863, "global_step": 113867, "epoch": 2711} {"train_loss": -6.493398189544678, "global_step": 113868, "epoch": 2711} {"train_loss": -6.498281955718994, "global_step": 113869, "epoch": 2711} {"train_loss": -6.421410083770752, "global_step": 113870, "epoch": 2711} {"train_loss": -6.375590801239014, "global_step": 113871, "epoch": 2711} {"train_loss": -6.347100257873535, "global_step": 113872, "epoch": 2711} {"train_loss": -6.473519325256348, "global_step": 113873, "epoch": 2711} {"train_loss": -6.5265045166015625, "global_step": 113874, "epoch": 2711} {"train_loss": -6.388004302978516, "global_step": 113875, "epoch": 2711} {"train_loss": -6.552009582519531, "global_step": 113876, "epoch": 2711} {"train_loss": -6.460524559020996, "global_step": 113877, "epoch": 2711} {"train_loss": -6.358913421630859, "global_step": 113878, "epoch": 2711} {"train_loss": -6.498932361602783, "global_step": 113879, "epoch": 2711} {"train_loss": -6.37473726272583, "global_step": 113880, "epoch": 2711} {"train_loss": -6.396073341369629, "global_step": 113881, "epoch": 2711} {"train_loss": -6.673951148986816, "global_step": 113882, "epoch": 2711} {"train_loss": -6.436407566070557, "global_step": 113883, "epoch": 2711} {"train_loss": -6.533144474029541, "global_step": 113884, "epoch": 2711} {"train_loss": -6.49797248840332, "global_step": 113885, "epoch": 2711} {"train_loss": -6.443338394165039, "global_step": 113886, "epoch": 2711} {"train_loss": -6.6029510498046875, "global_step": 113887, "epoch": 2711} {"train_loss": -6.437500953674316, "global_step": 113888, "epoch": 2711} {"train_loss": -6.445338249206543, "global_step": 113889, "epoch": 2711} {"train_loss": -6.490401268005371, "global_step": 113890, "epoch": 2711} {"train_loss": -6.473825454711914, "global_step": 113891, "epoch": 2711} {"train_loss": -6.488138198852539, "global_step": 113892, "epoch": 2711} {"train_loss": -6.407644271850586, "global_step": 113893, "epoch": 2711} {"train_loss": -6.548872947692871, "global_step": 113894, "epoch": 2711} {"train_loss": -6.541810989379883, "global_step": 113895, "epoch": 2711} {"train_loss": -6.485047340393066, "global_step": 113896, "epoch": 2711} {"train_loss": -6.545490264892578, "global_step": 113897, "epoch": 2711} {"train_loss": -6.39776611328125, "global_step": 113898, "epoch": 2711} {"train_loss": -6.613862991333008, "global_step": 113899, "epoch": 2711} {"train_loss": -6.469649314880371, "global_step": 113900, "epoch": 2711} {"train_loss": -6.42186975479126, "global_step": 113901, "epoch": 2711} {"train_loss": -6.529735088348389, "global_step": 113902, "epoch": 2711} {"train_loss": -6.475058998380389, "global_step": 113903, "epoch": 2711, "val_loss": 67867.390625} {"train_loss": -6.52834415435791, "global_step": 113904, "epoch": 2712} {"train_loss": -6.471348285675049, "global_step": 113905, "epoch": 2712} {"train_loss": -6.515130519866943, "global_step": 113906, "epoch": 2712} {"train_loss": -6.555179119110107, "global_step": 113907, "epoch": 2712} {"train_loss": -6.5325117111206055, "global_step": 113908, "epoch": 2712} {"train_loss": -6.504306793212891, "global_step": 113909, "epoch": 2712} {"train_loss": -6.552803039550781, "global_step": 113910, "epoch": 2712} {"train_loss": -6.522027015686035, "global_step": 113911, "epoch": 2712} {"train_loss": -6.394160270690918, "global_step": 113912, "epoch": 2712} {"train_loss": -6.463006496429443, "global_step": 113913, "epoch": 2712} {"train_loss": -6.547616004943848, "global_step": 113914, "epoch": 2712} {"train_loss": -6.447269439697266, "global_step": 113915, "epoch": 2712} {"train_loss": -6.547136306762695, "global_step": 113916, "epoch": 2712} {"train_loss": -6.478039741516113, "global_step": 113917, "epoch": 2712} {"train_loss": -6.394848823547363, "global_step": 113918, "epoch": 2712} {"train_loss": -6.551440238952637, "global_step": 113919, "epoch": 2712} {"train_loss": -6.47221040725708, "global_step": 113920, "epoch": 2712} {"train_loss": -6.459475517272949, "global_step": 113921, "epoch": 2712} {"train_loss": -6.4641008377075195, "global_step": 113922, "epoch": 2712} {"train_loss": -6.621810436248779, "global_step": 113923, "epoch": 2712} {"train_loss": -6.530963897705078, "global_step": 113924, "epoch": 2712} {"train_loss": -6.426431179046631, "global_step": 113925, "epoch": 2712} {"train_loss": -6.570506572723389, "global_step": 113926, "epoch": 2712} {"train_loss": -6.4962334632873535, "global_step": 113927, "epoch": 2712} {"train_loss": -6.497333526611328, "global_step": 113928, "epoch": 2712} {"train_loss": -6.431638240814209, "global_step": 113929, "epoch": 2712} {"train_loss": -6.595307350158691, "global_step": 113930, "epoch": 2712} {"train_loss": -6.431916236877441, "global_step": 113931, "epoch": 2712} {"train_loss": -6.4263916015625, "global_step": 113932, "epoch": 2712} {"train_loss": -6.424439430236816, "global_step": 113933, "epoch": 2712} {"train_loss": -6.445760726928711, "global_step": 113934, "epoch": 2712} {"train_loss": -6.493069648742676, "global_step": 113935, "epoch": 2712} {"train_loss": -6.362727165222168, "global_step": 113936, "epoch": 2712} {"train_loss": -6.416562557220459, "global_step": 113937, "epoch": 2712} {"train_loss": -6.443781852722168, "global_step": 113938, "epoch": 2712} {"train_loss": -6.37127685546875, "global_step": 113939, "epoch": 2712} {"train_loss": -6.524107933044434, "global_step": 113940, "epoch": 2712} {"train_loss": -6.551888465881348, "global_step": 113941, "epoch": 2712} {"train_loss": -6.372876167297363, "global_step": 113942, "epoch": 2712} {"train_loss": -6.450565338134766, "global_step": 113943, "epoch": 2712} {"train_loss": -6.417410373687744, "global_step": 113944, "epoch": 2712} {"train_loss": -6.4800678207760765, "global_step": 113945, "epoch": 2712, "val_loss": 67853.6484375} {"train_loss": -6.451519966125488, "global_step": 113946, "epoch": 2713} {"train_loss": -6.430142879486084, "global_step": 113947, "epoch": 2713} {"train_loss": -6.427431583404541, "global_step": 113948, "epoch": 2713} {"train_loss": -6.524469375610352, "global_step": 113949, "epoch": 2713} {"train_loss": -6.419748306274414, "global_step": 113950, "epoch": 2713} {"train_loss": -6.497320175170898, "global_step": 113951, "epoch": 2713} {"train_loss": -6.43139123916626, "global_step": 113952, "epoch": 2713} {"train_loss": -6.459228038787842, "global_step": 113953, "epoch": 2713} {"train_loss": -6.618131637573242, "global_step": 113954, "epoch": 2713} {"train_loss": -6.3982439041137695, "global_step": 113955, "epoch": 2713} {"train_loss": -6.4546942710876465, "global_step": 113956, "epoch": 2713} {"train_loss": -6.428597450256348, "global_step": 113957, "epoch": 2713} {"train_loss": -6.477299690246582, "global_step": 113958, "epoch": 2713} {"train_loss": -6.543578147888184, "global_step": 113959, "epoch": 2713} {"train_loss": -6.452505588531494, "global_step": 113960, "epoch": 2713} {"train_loss": -6.4809465408325195, "global_step": 113961, "epoch": 2713} {"train_loss": -6.454129219055176, "global_step": 113962, "epoch": 2713} {"train_loss": -6.439330101013184, "global_step": 113963, "epoch": 2713} {"train_loss": -6.540602684020996, "global_step": 113964, "epoch": 2713} {"train_loss": -6.529231548309326, "global_step": 113965, "epoch": 2713} {"train_loss": -6.503807544708252, "global_step": 113966, "epoch": 2713} {"train_loss": -6.485848426818848, "global_step": 113967, "epoch": 2713} {"train_loss": -6.485498905181885, "global_step": 113968, "epoch": 2713} {"train_loss": -6.382925033569336, "global_step": 113969, "epoch": 2713} {"train_loss": -6.460263729095459, "global_step": 113970, "epoch": 2713} {"train_loss": -6.508727550506592, "global_step": 113971, "epoch": 2713} {"train_loss": -6.434235572814941, "global_step": 113972, "epoch": 2713} {"train_loss": -6.407179832458496, "global_step": 113973, "epoch": 2713} {"train_loss": -6.458223342895508, "global_step": 113974, "epoch": 2713} {"train_loss": -6.529518127441406, "global_step": 113975, "epoch": 2713} {"train_loss": -6.456548690795898, "global_step": 113976, "epoch": 2713} {"train_loss": -6.32597541809082, "global_step": 113977, "epoch": 2713} {"train_loss": -6.5256757736206055, "global_step": 113978, "epoch": 2713} {"train_loss": -6.495119094848633, "global_step": 113979, "epoch": 2713} {"train_loss": -6.453979015350342, "global_step": 113980, "epoch": 2713} {"train_loss": -6.439014434814453, "global_step": 113981, "epoch": 2713} {"train_loss": -6.500628471374512, "global_step": 113982, "epoch": 2713} {"train_loss": -6.545683860778809, "global_step": 113983, "epoch": 2713} {"train_loss": -6.565072536468506, "global_step": 113984, "epoch": 2713} {"train_loss": -6.437786102294922, "global_step": 113985, "epoch": 2713} {"train_loss": -6.441895484924316, "global_step": 113986, "epoch": 2713} {"train_loss": -6.470779055640811, "global_step": 113987, "epoch": 2713, "val_loss": 67802.9921875} {"train_loss": -6.449365615844727, "global_step": 113988, "epoch": 2714} {"train_loss": -6.441204071044922, "global_step": 113989, "epoch": 2714} {"train_loss": -6.515870094299316, "global_step": 113990, "epoch": 2714} {"train_loss": -6.474462509155273, "global_step": 113991, "epoch": 2714} {"train_loss": -6.602272033691406, "global_step": 113992, "epoch": 2714} {"train_loss": -6.455739974975586, "global_step": 113993, "epoch": 2714} {"train_loss": -6.49955940246582, "global_step": 113994, "epoch": 2714} {"train_loss": -6.4701080322265625, "global_step": 113995, "epoch": 2714} {"train_loss": -6.46815824508667, "global_step": 113996, "epoch": 2714} {"train_loss": -6.333889007568359, "global_step": 113997, "epoch": 2714} {"train_loss": -6.549866676330566, "global_step": 113998, "epoch": 2714} {"train_loss": -6.423247814178467, "global_step": 113999, "epoch": 2714} {"train_loss": -6.522327423095703, "global_step": 114000, "epoch": 2714} {"train_loss": -6.367995262145996, "global_step": 114001, "epoch": 2714} {"train_loss": -6.3880815505981445, "global_step": 114002, "epoch": 2714} {"train_loss": -6.501357078552246, "global_step": 114003, "epoch": 2714} {"train_loss": -6.397449970245361, "global_step": 114004, "epoch": 2714} {"train_loss": -6.315128326416016, "global_step": 114005, "epoch": 2714} {"train_loss": -6.444009780883789, "global_step": 114006, "epoch": 2714} {"train_loss": -6.435927391052246, "global_step": 114007, "epoch": 2714} {"train_loss": -6.44873046875, "global_step": 114008, "epoch": 2714} {"train_loss": -6.394340515136719, "global_step": 114009, "epoch": 2714} {"train_loss": -6.481032371520996, "global_step": 114010, "epoch": 2714} {"train_loss": -6.334424018859863, "global_step": 114011, "epoch": 2714} {"train_loss": -6.495599746704102, "global_step": 114012, "epoch": 2714} {"train_loss": -6.393699645996094, "global_step": 114013, "epoch": 2714} {"train_loss": -6.284131050109863, "global_step": 114014, "epoch": 2714} {"train_loss": -6.476107597351074, "global_step": 114015, "epoch": 2714} {"train_loss": -6.393270492553711, "global_step": 114016, "epoch": 2714} {"train_loss": -6.3778862953186035, "global_step": 114017, "epoch": 2714} {"train_loss": -6.42460823059082, "global_step": 114018, "epoch": 2714} {"train_loss": -6.435379981994629, "global_step": 114019, "epoch": 2714} {"train_loss": -6.4793620109558105, "global_step": 114020, "epoch": 2714} {"train_loss": -6.519207000732422, "global_step": 114021, "epoch": 2714} {"train_loss": -6.483275890350342, "global_step": 114022, "epoch": 2714} {"train_loss": -6.457701683044434, "global_step": 114023, "epoch": 2714} {"train_loss": -6.357837200164795, "global_step": 114024, "epoch": 2714} {"train_loss": -6.501919269561768, "global_step": 114025, "epoch": 2714} {"train_loss": -6.44483757019043, "global_step": 114026, "epoch": 2714} {"train_loss": -6.360716819763184, "global_step": 114027, "epoch": 2714} {"train_loss": -6.459298610687256, "global_step": 114028, "epoch": 2714} {"train_loss": -6.442197652090163, "global_step": 114029, "epoch": 2714, "val_loss": 67867.59375} {"train_loss": -6.4979753494262695, "global_step": 114030, "epoch": 2715} {"train_loss": -6.498417854309082, "global_step": 114031, "epoch": 2715} {"train_loss": -6.466607093811035, "global_step": 114032, "epoch": 2715} {"train_loss": -6.4342193603515625, "global_step": 114033, "epoch": 2715} {"train_loss": -6.604457855224609, "global_step": 114034, "epoch": 2715} {"train_loss": -6.552845478057861, "global_step": 114035, "epoch": 2715} {"train_loss": -6.518345832824707, "global_step": 114036, "epoch": 2715} {"train_loss": -6.401707649230957, "global_step": 114037, "epoch": 2715} {"train_loss": -6.546725273132324, "global_step": 114038, "epoch": 2715} {"train_loss": -6.460114479064941, "global_step": 114039, "epoch": 2715} {"train_loss": -6.508057594299316, "global_step": 114040, "epoch": 2715} {"train_loss": -6.493145942687988, "global_step": 114041, "epoch": 2715} {"train_loss": -6.570028305053711, "global_step": 114042, "epoch": 2715} {"train_loss": -6.556720733642578, "global_step": 114043, "epoch": 2715} {"train_loss": -6.541499137878418, "global_step": 114044, "epoch": 2715} {"train_loss": -6.5037841796875, "global_step": 114045, "epoch": 2715} {"train_loss": -6.538613319396973, "global_step": 114046, "epoch": 2715} {"train_loss": -6.500953674316406, "global_step": 114047, "epoch": 2715} {"train_loss": -6.576113700866699, "global_step": 114048, "epoch": 2715} {"train_loss": -6.428400993347168, "global_step": 114049, "epoch": 2715} {"train_loss": -6.321928977966309, "global_step": 114050, "epoch": 2715} {"train_loss": -6.391749382019043, "global_step": 114051, "epoch": 2715} {"train_loss": -6.398475646972656, "global_step": 114052, "epoch": 2715} {"train_loss": -6.469511985778809, "global_step": 114053, "epoch": 2715} {"train_loss": -6.403231620788574, "global_step": 114054, "epoch": 2715} {"train_loss": -6.392242431640625, "global_step": 114055, "epoch": 2715} {"train_loss": -6.3221635818481445, "global_step": 114056, "epoch": 2715} {"train_loss": -6.333966255187988, "global_step": 114057, "epoch": 2715} {"train_loss": -6.499786376953125, "global_step": 114058, "epoch": 2715} {"train_loss": -6.567752838134766, "global_step": 114059, "epoch": 2715} {"train_loss": -6.52478551864624, "global_step": 114060, "epoch": 2715} {"train_loss": -6.497072219848633, "global_step": 114061, "epoch": 2715} {"train_loss": -6.4996161460876465, "global_step": 114062, "epoch": 2715} {"train_loss": -6.328741073608398, "global_step": 114063, "epoch": 2715} {"train_loss": -6.494926929473877, "global_step": 114064, "epoch": 2715} {"train_loss": -6.514976501464844, "global_step": 114065, "epoch": 2715} {"train_loss": -6.4656267166137695, "global_step": 114066, "epoch": 2715} {"train_loss": -6.376677513122559, "global_step": 114067, "epoch": 2715} {"train_loss": -6.521933555603027, "global_step": 114068, "epoch": 2715} {"train_loss": -6.517720699310303, "global_step": 114069, "epoch": 2715} {"train_loss": -6.426502227783203, "global_step": 114070, "epoch": 2715} {"train_loss": -6.473503180912563, "global_step": 114071, "epoch": 2715, "val_loss": 67802.375} {"train_loss": -6.543895244598389, "global_step": 114072, "epoch": 2716} {"train_loss": -6.401730537414551, "global_step": 114073, "epoch": 2716} {"train_loss": -6.516749382019043, "global_step": 114074, "epoch": 2716} {"train_loss": -6.450918197631836, "global_step": 114075, "epoch": 2716} {"train_loss": -6.420161724090576, "global_step": 114076, "epoch": 2716} {"train_loss": -6.419493198394775, "global_step": 114077, "epoch": 2716} {"train_loss": -6.412379741668701, "global_step": 114078, "epoch": 2716} {"train_loss": -6.557168960571289, "global_step": 114079, "epoch": 2716} {"train_loss": -6.396758079528809, "global_step": 114080, "epoch": 2716} {"train_loss": -6.4736328125, "global_step": 114081, "epoch": 2716} {"train_loss": -6.433473587036133, "global_step": 114082, "epoch": 2716} {"train_loss": -6.429675102233887, "global_step": 114083, "epoch": 2716} {"train_loss": -6.4201884269714355, "global_step": 114084, "epoch": 2716} {"train_loss": -6.522510528564453, "global_step": 114085, "epoch": 2716} {"train_loss": -6.598865509033203, "global_step": 114086, "epoch": 2716} {"train_loss": -6.451313018798828, "global_step": 114087, "epoch": 2716} {"train_loss": -6.538732528686523, "global_step": 114088, "epoch": 2716} {"train_loss": -6.472058296203613, "global_step": 114089, "epoch": 2716} {"train_loss": -6.37571907043457, "global_step": 114090, "epoch": 2716} {"train_loss": -6.42298698425293, "global_step": 114091, "epoch": 2716} {"train_loss": -6.405856132507324, "global_step": 114092, "epoch": 2716} {"train_loss": -6.444057464599609, "global_step": 114093, "epoch": 2716} {"train_loss": -6.509031772613525, "global_step": 114094, "epoch": 2716} {"train_loss": -6.352048873901367, "global_step": 114095, "epoch": 2716} {"train_loss": -6.568212509155273, "global_step": 114096, "epoch": 2716} {"train_loss": -6.402093410491943, "global_step": 114097, "epoch": 2716} {"train_loss": -6.30845832824707, "global_step": 114098, "epoch": 2716} {"train_loss": -6.43805456161499, "global_step": 114099, "epoch": 2716} {"train_loss": -6.417349815368652, "global_step": 114100, "epoch": 2716} {"train_loss": -6.400871753692627, "global_step": 114101, "epoch": 2716} {"train_loss": -6.528491020202637, "global_step": 114102, "epoch": 2716} {"train_loss": -6.594264507293701, "global_step": 114103, "epoch": 2716} {"train_loss": -6.425508499145508, "global_step": 114104, "epoch": 2716} {"train_loss": -6.564482688903809, "global_step": 114105, "epoch": 2716} {"train_loss": -6.488918304443359, "global_step": 114106, "epoch": 2716} {"train_loss": -6.560451984405518, "global_step": 114107, "epoch": 2716} {"train_loss": -6.556341171264648, "global_step": 114108, "epoch": 2716} {"train_loss": -6.494112968444824, "global_step": 114109, "epoch": 2716} {"train_loss": -6.474332332611084, "global_step": 114110, "epoch": 2716} {"train_loss": -6.636744976043701, "global_step": 114111, "epoch": 2716} {"train_loss": -6.52567195892334, "global_step": 114112, "epoch": 2716} {"train_loss": -6.4720877352215, "global_step": 114113, "epoch": 2716, "val_loss": 67951.1015625} {"train_loss": -6.561882495880127, "global_step": 114114, "epoch": 2717} {"train_loss": -6.474796295166016, "global_step": 114115, "epoch": 2717} {"train_loss": -6.528566360473633, "global_step": 114116, "epoch": 2717} {"train_loss": -6.479101181030273, "global_step": 114117, "epoch": 2717} {"train_loss": -6.451345443725586, "global_step": 114118, "epoch": 2717} {"train_loss": -6.507772922515869, "global_step": 114119, "epoch": 2717} {"train_loss": -6.330410957336426, "global_step": 114120, "epoch": 2717} {"train_loss": -6.519269943237305, "global_step": 114121, "epoch": 2717} {"train_loss": -6.524487495422363, "global_step": 114122, "epoch": 2717} {"train_loss": -6.593125343322754, "global_step": 114123, "epoch": 2717} {"train_loss": -6.526562690734863, "global_step": 114124, "epoch": 2717} {"train_loss": -6.5743303298950195, "global_step": 114125, "epoch": 2717} {"train_loss": -6.505483150482178, "global_step": 114126, "epoch": 2717} {"train_loss": -6.566013813018799, "global_step": 114127, "epoch": 2717} {"train_loss": -6.47447395324707, "global_step": 114128, "epoch": 2717} {"train_loss": -6.431277275085449, "global_step": 114129, "epoch": 2717} {"train_loss": -6.52305793762207, "global_step": 114130, "epoch": 2717} {"train_loss": -6.396040916442871, "global_step": 114131, "epoch": 2717} {"train_loss": -6.4181365966796875, "global_step": 114132, "epoch": 2717} {"train_loss": -6.333266735076904, "global_step": 114133, "epoch": 2717} {"train_loss": -6.517850875854492, "global_step": 114134, "epoch": 2717} {"train_loss": -6.4598388671875, "global_step": 114135, "epoch": 2717} {"train_loss": -6.342015266418457, "global_step": 114136, "epoch": 2717} {"train_loss": -6.211050987243652, "global_step": 114137, "epoch": 2717} {"train_loss": -6.483091354370117, "global_step": 114138, "epoch": 2717} {"train_loss": -6.308892726898193, "global_step": 114139, "epoch": 2717} {"train_loss": -6.335987091064453, "global_step": 114140, "epoch": 2717} {"train_loss": -6.275507926940918, "global_step": 114141, "epoch": 2717} {"train_loss": -6.390806198120117, "global_step": 114142, "epoch": 2717} {"train_loss": -6.389777183532715, "global_step": 114143, "epoch": 2717} {"train_loss": -6.356744766235352, "global_step": 114144, "epoch": 2717} {"train_loss": -6.385695934295654, "global_step": 114145, "epoch": 2717} {"train_loss": -6.402833938598633, "global_step": 114146, "epoch": 2717} {"train_loss": -6.3360443115234375, "global_step": 114147, "epoch": 2717} {"train_loss": -6.4156365394592285, "global_step": 114148, "epoch": 2717} {"train_loss": -6.314000606536865, "global_step": 114149, "epoch": 2717} {"train_loss": -6.532373905181885, "global_step": 114150, "epoch": 2717} {"train_loss": -6.304572105407715, "global_step": 114151, "epoch": 2717} {"train_loss": -6.404077529907227, "global_step": 114152, "epoch": 2717} {"train_loss": -6.53383207321167, "global_step": 114153, "epoch": 2717} {"train_loss": -6.472259521484375, "global_step": 114154, "epoch": 2717} {"train_loss": -6.43503246988569, "global_step": 114155, "epoch": 2717, "val_loss": 67934.359375} {"train_loss": -6.451711177825928, "global_step": 114156, "epoch": 2718} {"train_loss": -6.473140716552734, "global_step": 114157, "epoch": 2718} {"train_loss": -6.407564163208008, "global_step": 114158, "epoch": 2718} {"train_loss": -6.457150459289551, "global_step": 114159, "epoch": 2718} {"train_loss": -6.419466972351074, "global_step": 114160, "epoch": 2718} {"train_loss": -6.595235824584961, "global_step": 114161, "epoch": 2718} {"train_loss": -6.420929908752441, "global_step": 114162, "epoch": 2718} {"train_loss": -6.445154666900635, "global_step": 114163, "epoch": 2718} {"train_loss": -6.455811023712158, "global_step": 114164, "epoch": 2718} {"train_loss": -6.474329471588135, "global_step": 114165, "epoch": 2718} {"train_loss": -6.466030120849609, "global_step": 114166, "epoch": 2718} {"train_loss": -6.456023216247559, "global_step": 114167, "epoch": 2718} {"train_loss": -6.394880294799805, "global_step": 114168, "epoch": 2718} {"train_loss": -6.485980033874512, "global_step": 114169, "epoch": 2718} {"train_loss": -6.448563575744629, "global_step": 114170, "epoch": 2718} {"train_loss": -6.5288405418396, "global_step": 114171, "epoch": 2718} {"train_loss": -6.474366188049316, "global_step": 114172, "epoch": 2718} {"train_loss": -6.44093132019043, "global_step": 114173, "epoch": 2718} {"train_loss": -6.43099308013916, "global_step": 114174, "epoch": 2718} {"train_loss": -6.478630542755127, "global_step": 114175, "epoch": 2718} {"train_loss": -6.421609401702881, "global_step": 114176, "epoch": 2718} {"train_loss": -6.523675918579102, "global_step": 114177, "epoch": 2718} {"train_loss": -6.509592533111572, "global_step": 114178, "epoch": 2718} {"train_loss": -6.61939001083374, "global_step": 114179, "epoch": 2718} {"train_loss": -6.478341579437256, "global_step": 114180, "epoch": 2718} {"train_loss": -6.489758491516113, "global_step": 114181, "epoch": 2718} {"train_loss": -6.688789367675781, "global_step": 114182, "epoch": 2718} {"train_loss": -6.513832092285156, "global_step": 114183, "epoch": 2718} {"train_loss": -6.477800369262695, "global_step": 114184, "epoch": 2718} {"train_loss": -6.494585990905762, "global_step": 114185, "epoch": 2718} {"train_loss": -6.470158100128174, "global_step": 114186, "epoch": 2718} {"train_loss": -6.414461135864258, "global_step": 114187, "epoch": 2718} {"train_loss": -6.444681167602539, "global_step": 114188, "epoch": 2718} {"train_loss": -6.401654243469238, "global_step": 114189, "epoch": 2718} {"train_loss": -6.572049617767334, "global_step": 114190, "epoch": 2718} {"train_loss": -6.375165939331055, "global_step": 114191, "epoch": 2718} {"train_loss": -6.636889457702637, "global_step": 114192, "epoch": 2718} {"train_loss": -6.55047607421875, "global_step": 114193, "epoch": 2718} {"train_loss": -6.461911201477051, "global_step": 114194, "epoch": 2718} {"train_loss": -6.505871772766113, "global_step": 114195, "epoch": 2718} {"train_loss": -6.549714088439941, "global_step": 114196, "epoch": 2718} {"train_loss": -6.481853882471721, "global_step": 114197, "epoch": 2718, "val_loss": 67938.109375} {"train_loss": -6.4963202476501465, "global_step": 114198, "epoch": 2719} {"train_loss": -6.506399154663086, "global_step": 114199, "epoch": 2719} {"train_loss": -6.501577377319336, "global_step": 114200, "epoch": 2719} {"train_loss": -6.571752071380615, "global_step": 114201, "epoch": 2719} {"train_loss": -6.439191818237305, "global_step": 114202, "epoch": 2719} {"train_loss": -6.4269514083862305, "global_step": 114203, "epoch": 2719} {"train_loss": -6.436221122741699, "global_step": 114204, "epoch": 2719} {"train_loss": -6.41623592376709, "global_step": 114205, "epoch": 2719} {"train_loss": -6.495858192443848, "global_step": 114206, "epoch": 2719} {"train_loss": -6.433821678161621, "global_step": 114207, "epoch": 2719} {"train_loss": -6.486767768859863, "global_step": 114208, "epoch": 2719} {"train_loss": -6.3915791511535645, "global_step": 114209, "epoch": 2719} {"train_loss": -6.5116167068481445, "global_step": 114210, "epoch": 2719} {"train_loss": -6.48560094833374, "global_step": 114211, "epoch": 2719} {"train_loss": -6.563912391662598, "global_step": 114212, "epoch": 2719} {"train_loss": -6.466612339019775, "global_step": 114213, "epoch": 2719} {"train_loss": -6.567824363708496, "global_step": 114214, "epoch": 2719} {"train_loss": -6.550943374633789, "global_step": 114215, "epoch": 2719} {"train_loss": -6.4488525390625, "global_step": 114216, "epoch": 2719} {"train_loss": -6.451611518859863, "global_step": 114217, "epoch": 2719} {"train_loss": -6.47998046875, "global_step": 114218, "epoch": 2719} {"train_loss": -6.573266506195068, "global_step": 114219, "epoch": 2719} {"train_loss": -6.404055118560791, "global_step": 114220, "epoch": 2719} {"train_loss": -6.546655178070068, "global_step": 114221, "epoch": 2719} {"train_loss": -6.586946487426758, "global_step": 114222, "epoch": 2719} {"train_loss": -6.499852180480957, "global_step": 114223, "epoch": 2719} {"train_loss": -6.6633219718933105, "global_step": 114224, "epoch": 2719} {"train_loss": -6.380192279815674, "global_step": 114225, "epoch": 2719} {"train_loss": -6.479169845581055, "global_step": 114226, "epoch": 2719} {"train_loss": -6.442951202392578, "global_step": 114227, "epoch": 2719} {"train_loss": -6.5052409172058105, "global_step": 114228, "epoch": 2719} {"train_loss": -6.500341415405273, "global_step": 114229, "epoch": 2719} {"train_loss": -6.59101676940918, "global_step": 114230, "epoch": 2719} {"train_loss": -6.673969268798828, "global_step": 114231, "epoch": 2719} {"train_loss": -6.490880966186523, "global_step": 114232, "epoch": 2719} {"train_loss": -6.482840538024902, "global_step": 114233, "epoch": 2719} {"train_loss": -6.580893516540527, "global_step": 114234, "epoch": 2719} {"train_loss": -6.427321434020996, "global_step": 114235, "epoch": 2719} {"train_loss": -6.4544291496276855, "global_step": 114236, "epoch": 2719} {"train_loss": -6.485295295715332, "global_step": 114237, "epoch": 2719} {"train_loss": -6.612595081329346, "global_step": 114238, "epoch": 2719} {"train_loss": -6.499637910297939, "global_step": 114239, "epoch": 2719, "val_loss": 67955.4140625} {"train_loss": -6.617897033691406, "global_step": 114240, "epoch": 2720} {"train_loss": -6.481470584869385, "global_step": 114241, "epoch": 2720} {"train_loss": -6.627571105957031, "global_step": 114242, "epoch": 2720} {"train_loss": -6.551340579986572, "global_step": 114243, "epoch": 2720} {"train_loss": -6.492625713348389, "global_step": 114244, "epoch": 2720} {"train_loss": -6.585759162902832, "global_step": 114245, "epoch": 2720} {"train_loss": -6.5473127365112305, "global_step": 114246, "epoch": 2720} {"train_loss": -6.491138935089111, "global_step": 114247, "epoch": 2720} {"train_loss": -6.563849925994873, "global_step": 114248, "epoch": 2720} {"train_loss": -6.529662609100342, "global_step": 114249, "epoch": 2720} {"train_loss": -6.505478858947754, "global_step": 114250, "epoch": 2720} {"train_loss": -6.481095314025879, "global_step": 114251, "epoch": 2720} {"train_loss": -6.539289951324463, "global_step": 114252, "epoch": 2720} {"train_loss": -6.412383079528809, "global_step": 114253, "epoch": 2720} {"train_loss": -6.435711860656738, "global_step": 114254, "epoch": 2720} {"train_loss": -6.515684127807617, "global_step": 114255, "epoch": 2720} {"train_loss": -6.532615661621094, "global_step": 114256, "epoch": 2720} {"train_loss": -6.533908843994141, "global_step": 114257, "epoch": 2720} {"train_loss": -6.557791709899902, "global_step": 114258, "epoch": 2720} {"train_loss": -6.467477798461914, "global_step": 114259, "epoch": 2720} {"train_loss": -6.483549118041992, "global_step": 114260, "epoch": 2720} {"train_loss": -6.563442230224609, "global_step": 114261, "epoch": 2720} {"train_loss": -6.411332130432129, "global_step": 114262, "epoch": 2720} {"train_loss": -6.41927433013916, "global_step": 114263, "epoch": 2720} {"train_loss": -6.4471755027771, "global_step": 114264, "epoch": 2720} {"train_loss": -6.453840732574463, "global_step": 114265, "epoch": 2720} {"train_loss": -6.54524564743042, "global_step": 114266, "epoch": 2720} {"train_loss": -6.5028839111328125, "global_step": 114267, "epoch": 2720} {"train_loss": -6.606478691101074, "global_step": 114268, "epoch": 2720} {"train_loss": -6.518674373626709, "global_step": 114269, "epoch": 2720} {"train_loss": -6.623126983642578, "global_step": 114270, "epoch": 2720} {"train_loss": -6.529674053192139, "global_step": 114271, "epoch": 2720} {"train_loss": -6.409610748291016, "global_step": 114272, "epoch": 2720} {"train_loss": -6.465214252471924, "global_step": 114273, "epoch": 2720} {"train_loss": -6.5017619132995605, "global_step": 114274, "epoch": 2720} {"train_loss": -6.451754570007324, "global_step": 114275, "epoch": 2720} {"train_loss": -6.28206729888916, "global_step": 114276, "epoch": 2720} {"train_loss": -6.45367956161499, "global_step": 114277, "epoch": 2720} {"train_loss": -6.45658016204834, "global_step": 114278, "epoch": 2720} {"train_loss": -6.514567852020264, "global_step": 114279, "epoch": 2720} {"train_loss": -6.4186835289001465, "global_step": 114280, "epoch": 2720} {"train_loss": -6.499533812204997, "global_step": 114281, "epoch": 2720, "val_loss": 67897.1640625} {"train_loss": -6.625675678253174, "global_step": 114282, "epoch": 2721} {"train_loss": -6.498391151428223, "global_step": 114283, "epoch": 2721} {"train_loss": -6.47446870803833, "global_step": 114284, "epoch": 2721} {"train_loss": -6.567946434020996, "global_step": 114285, "epoch": 2721} {"train_loss": -6.534544944763184, "global_step": 114286, "epoch": 2721} {"train_loss": -6.5416669845581055, "global_step": 114287, "epoch": 2721} {"train_loss": -6.536675930023193, "global_step": 114288, "epoch": 2721} {"train_loss": -6.4375152587890625, "global_step": 114289, "epoch": 2721} {"train_loss": -6.668072700500488, "global_step": 114290, "epoch": 2721} {"train_loss": -6.594607353210449, "global_step": 114291, "epoch": 2721} {"train_loss": -6.413693904876709, "global_step": 114292, "epoch": 2721} {"train_loss": -6.495726585388184, "global_step": 114293, "epoch": 2721} {"train_loss": -6.489712715148926, "global_step": 114294, "epoch": 2721} {"train_loss": -6.4580488204956055, "global_step": 114295, "epoch": 2721} {"train_loss": -6.358779430389404, "global_step": 114296, "epoch": 2721} {"train_loss": -6.5006866455078125, "global_step": 114297, "epoch": 2721} {"train_loss": -6.603278160095215, "global_step": 114298, "epoch": 2721} {"train_loss": -6.430201530456543, "global_step": 114299, "epoch": 2721} {"train_loss": -6.426811218261719, "global_step": 114300, "epoch": 2721} {"train_loss": -6.5489277839660645, "global_step": 114301, "epoch": 2721} {"train_loss": -6.449367046356201, "global_step": 114302, "epoch": 2721} {"train_loss": -6.505087852478027, "global_step": 114303, "epoch": 2721} {"train_loss": -6.4972429275512695, "global_step": 114304, "epoch": 2721} {"train_loss": -6.3925628662109375, "global_step": 114305, "epoch": 2721} {"train_loss": -6.467931270599365, "global_step": 114306, "epoch": 2721} {"train_loss": -6.38510799407959, "global_step": 114307, "epoch": 2721} {"train_loss": -6.403320789337158, "global_step": 114308, "epoch": 2721} {"train_loss": -6.374840259552002, "global_step": 114309, "epoch": 2721} {"train_loss": -6.434427738189697, "global_step": 114310, "epoch": 2721} {"train_loss": -6.434959411621094, "global_step": 114311, "epoch": 2721} {"train_loss": -6.4583330154418945, "global_step": 114312, "epoch": 2721} {"train_loss": -6.625608921051025, "global_step": 114313, "epoch": 2721} {"train_loss": -6.2562255859375, "global_step": 114314, "epoch": 2721} {"train_loss": -6.3729400634765625, "global_step": 114315, "epoch": 2721} {"train_loss": -6.458683967590332, "global_step": 114316, "epoch": 2721} {"train_loss": -6.377406597137451, "global_step": 114317, "epoch": 2721} {"train_loss": -6.489907264709473, "global_step": 114318, "epoch": 2721} {"train_loss": -6.50830078125, "global_step": 114319, "epoch": 2721} {"train_loss": -6.448182582855225, "global_step": 114320, "epoch": 2721} {"train_loss": -6.42342472076416, "global_step": 114321, "epoch": 2721} {"train_loss": -6.416571140289307, "global_step": 114322, "epoch": 2721} {"train_loss": -6.473603521074567, "global_step": 114323, "epoch": 2721, "val_loss": 67875.8125} {"train_loss": -6.586083889007568, "global_step": 114324, "epoch": 2722} {"train_loss": -6.509274959564209, "global_step": 114325, "epoch": 2722} {"train_loss": -6.423168182373047, "global_step": 114326, "epoch": 2722} {"train_loss": -6.506290435791016, "global_step": 114327, "epoch": 2722} {"train_loss": -6.4864630699157715, "global_step": 114328, "epoch": 2722} {"train_loss": -6.39569091796875, "global_step": 114329, "epoch": 2722} {"train_loss": -6.506041049957275, "global_step": 114330, "epoch": 2722} {"train_loss": -6.411301136016846, "global_step": 114331, "epoch": 2722} {"train_loss": -6.400702476501465, "global_step": 114332, "epoch": 2722} {"train_loss": -6.554867744445801, "global_step": 114333, "epoch": 2722} {"train_loss": -6.251427173614502, "global_step": 114334, "epoch": 2722} {"train_loss": -6.419145584106445, "global_step": 114335, "epoch": 2722} {"train_loss": -6.575032711029053, "global_step": 114336, "epoch": 2722} {"train_loss": -6.269551753997803, "global_step": 114337, "epoch": 2722} {"train_loss": -6.567569732666016, "global_step": 114338, "epoch": 2722} {"train_loss": -6.52541971206665, "global_step": 114339, "epoch": 2722} {"train_loss": -6.337064743041992, "global_step": 114340, "epoch": 2722} {"train_loss": -6.441153049468994, "global_step": 114341, "epoch": 2722} {"train_loss": -6.379039764404297, "global_step": 114342, "epoch": 2722} {"train_loss": -6.440072059631348, "global_step": 114343, "epoch": 2722} {"train_loss": -6.509577751159668, "global_step": 114344, "epoch": 2722} {"train_loss": -6.488387584686279, "global_step": 114345, "epoch": 2722} {"train_loss": -6.4997100830078125, "global_step": 114346, "epoch": 2722} {"train_loss": -6.503836631774902, "global_step": 114347, "epoch": 2722} {"train_loss": -6.4535231590271, "global_step": 114348, "epoch": 2722} {"train_loss": -6.353292465209961, "global_step": 114349, "epoch": 2722} {"train_loss": -6.364676475524902, "global_step": 114350, "epoch": 2722} {"train_loss": -6.515122413635254, "global_step": 114351, "epoch": 2722} {"train_loss": -6.434340953826904, "global_step": 114352, "epoch": 2722} {"train_loss": -6.352004051208496, "global_step": 114353, "epoch": 2722} {"train_loss": -6.437292098999023, "global_step": 114354, "epoch": 2722} {"train_loss": -6.40573263168335, "global_step": 114355, "epoch": 2722} {"train_loss": -6.306364059448242, "global_step": 114356, "epoch": 2722} {"train_loss": -6.407439708709717, "global_step": 114357, "epoch": 2722} {"train_loss": -6.360658168792725, "global_step": 114358, "epoch": 2722} {"train_loss": -6.53658390045166, "global_step": 114359, "epoch": 2722} {"train_loss": -6.369841575622559, "global_step": 114360, "epoch": 2722} {"train_loss": -6.393691062927246, "global_step": 114361, "epoch": 2722} {"train_loss": -6.382815361022949, "global_step": 114362, "epoch": 2722} {"train_loss": -6.529611587524414, "global_step": 114363, "epoch": 2722} {"train_loss": -6.419342994689941, "global_step": 114364, "epoch": 2722} {"train_loss": -6.439239729018438, "global_step": 114365, "epoch": 2722, "val_loss": 67776.046875} {"train_loss": -6.552035808563232, "global_step": 114366, "epoch": 2723} {"train_loss": -6.487326622009277, "global_step": 114367, "epoch": 2723} {"train_loss": -6.582732200622559, "global_step": 114368, "epoch": 2723} {"train_loss": -6.407533645629883, "global_step": 114369, "epoch": 2723} {"train_loss": -6.390401840209961, "global_step": 114370, "epoch": 2723} {"train_loss": -6.557632923126221, "global_step": 114371, "epoch": 2723} {"train_loss": -6.494879722595215, "global_step": 114372, "epoch": 2723} {"train_loss": -6.478585243225098, "global_step": 114373, "epoch": 2723} {"train_loss": -6.487790107727051, "global_step": 114374, "epoch": 2723} {"train_loss": -6.430556774139404, "global_step": 114375, "epoch": 2723} {"train_loss": -6.351337432861328, "global_step": 114376, "epoch": 2723} {"train_loss": -6.427708148956299, "global_step": 114377, "epoch": 2723} {"train_loss": -6.391819000244141, "global_step": 114378, "epoch": 2723} {"train_loss": -6.441832542419434, "global_step": 114379, "epoch": 2723} {"train_loss": -6.401333808898926, "global_step": 114380, "epoch": 2723} {"train_loss": -6.4523162841796875, "global_step": 114381, "epoch": 2723} {"train_loss": -6.499147891998291, "global_step": 114382, "epoch": 2723} {"train_loss": -6.448237419128418, "global_step": 114383, "epoch": 2723} {"train_loss": -6.443131446838379, "global_step": 114384, "epoch": 2723} {"train_loss": -6.408605098724365, "global_step": 114385, "epoch": 2723} {"train_loss": -6.482550621032715, "global_step": 114386, "epoch": 2723} {"train_loss": -6.4822869300842285, "global_step": 114387, "epoch": 2723} {"train_loss": -6.494746208190918, "global_step": 114388, "epoch": 2723} {"train_loss": -6.5203022956848145, "global_step": 114389, "epoch": 2723} {"train_loss": -6.53022575378418, "global_step": 114390, "epoch": 2723} {"train_loss": -6.517694473266602, "global_step": 114391, "epoch": 2723} {"train_loss": -6.440735816955566, "global_step": 114392, "epoch": 2723} {"train_loss": -6.4512939453125, "global_step": 114393, "epoch": 2723} {"train_loss": -6.575037002563477, "global_step": 114394, "epoch": 2723} {"train_loss": -6.361391067504883, "global_step": 114395, "epoch": 2723} {"train_loss": -6.509035110473633, "global_step": 114396, "epoch": 2723} {"train_loss": -6.573476314544678, "global_step": 114397, "epoch": 2723} {"train_loss": -6.511219024658203, "global_step": 114398, "epoch": 2723} {"train_loss": -6.558218002319336, "global_step": 114399, "epoch": 2723} {"train_loss": -6.5757155418396, "global_step": 114400, "epoch": 2723} {"train_loss": -6.586373329162598, "global_step": 114401, "epoch": 2723} {"train_loss": -6.521846771240234, "global_step": 114402, "epoch": 2723} {"train_loss": -6.419505596160889, "global_step": 114403, "epoch": 2723} {"train_loss": -6.5002827644348145, "global_step": 114404, "epoch": 2723} {"train_loss": -6.5724053382873535, "global_step": 114405, "epoch": 2723} {"train_loss": -6.576239585876465, "global_step": 114406, "epoch": 2723} {"train_loss": -6.485209658032372, "global_step": 114407, "epoch": 2723, "val_loss": 67967.0234375} {"train_loss": -6.616665363311768, "global_step": 114408, "epoch": 2724} {"train_loss": -6.566822052001953, "global_step": 114409, "epoch": 2724} {"train_loss": -6.4543962478637695, "global_step": 114410, "epoch": 2724} {"train_loss": -6.5368170738220215, "global_step": 114411, "epoch": 2724} {"train_loss": -6.532212257385254, "global_step": 114412, "epoch": 2724} {"train_loss": -6.434085845947266, "global_step": 114413, "epoch": 2724} {"train_loss": -6.426970958709717, "global_step": 114414, "epoch": 2724} {"train_loss": -6.449424743652344, "global_step": 114415, "epoch": 2724} {"train_loss": -6.403604507446289, "global_step": 114416, "epoch": 2724} {"train_loss": -6.526398658752441, "global_step": 114417, "epoch": 2724} {"train_loss": -6.417666435241699, "global_step": 114418, "epoch": 2724} {"train_loss": -6.337380409240723, "global_step": 114419, "epoch": 2724} {"train_loss": -6.383941650390625, "global_step": 114420, "epoch": 2724} {"train_loss": -6.361812591552734, "global_step": 114421, "epoch": 2724} {"train_loss": -6.2225542068481445, "global_step": 114422, "epoch": 2724} {"train_loss": -6.5076904296875, "global_step": 114423, "epoch": 2724} {"train_loss": -6.460324764251709, "global_step": 114424, "epoch": 2724} {"train_loss": -6.4380598068237305, "global_step": 114425, "epoch": 2724} {"train_loss": -6.382401466369629, "global_step": 114426, "epoch": 2724} {"train_loss": -6.368546485900879, "global_step": 114427, "epoch": 2724} {"train_loss": -6.489021301269531, "global_step": 114428, "epoch": 2724} {"train_loss": -6.43497371673584, "global_step": 114429, "epoch": 2724} {"train_loss": -6.340827941894531, "global_step": 114430, "epoch": 2724} {"train_loss": -6.402626037597656, "global_step": 114431, "epoch": 2724} {"train_loss": -6.425015449523926, "global_step": 114432, "epoch": 2724} {"train_loss": -6.425168514251709, "global_step": 114433, "epoch": 2724} {"train_loss": -6.476951599121094, "global_step": 114434, "epoch": 2724} {"train_loss": -6.483619213104248, "global_step": 114435, "epoch": 2724} {"train_loss": -6.492610931396484, "global_step": 114436, "epoch": 2724} {"train_loss": -6.543447494506836, "global_step": 114437, "epoch": 2724} {"train_loss": -6.506425380706787, "global_step": 114438, "epoch": 2724} {"train_loss": -6.592724800109863, "global_step": 114439, "epoch": 2724} {"train_loss": -6.524569034576416, "global_step": 114440, "epoch": 2724} {"train_loss": -6.469639778137207, "global_step": 114441, "epoch": 2724} {"train_loss": -6.403011322021484, "global_step": 114442, "epoch": 2724} {"train_loss": -6.367789268493652, "global_step": 114443, "epoch": 2724} {"train_loss": -6.418656349182129, "global_step": 114444, "epoch": 2724} {"train_loss": -6.538491249084473, "global_step": 114445, "epoch": 2724} {"train_loss": -6.398949146270752, "global_step": 114446, "epoch": 2724} {"train_loss": -6.365909576416016, "global_step": 114447, "epoch": 2724} {"train_loss": -6.49931526184082, "global_step": 114448, "epoch": 2724} {"train_loss": -6.4475117183866955, "global_step": 114449, "epoch": 2724, "val_loss": 67816.5390625} {"train_loss": -6.44661808013916, "global_step": 114450, "epoch": 2725} {"train_loss": -6.366084575653076, "global_step": 114451, "epoch": 2725} {"train_loss": -6.369109153747559, "global_step": 114452, "epoch": 2725} {"train_loss": -6.516736030578613, "global_step": 114453, "epoch": 2725} {"train_loss": -6.260336875915527, "global_step": 114454, "epoch": 2725} {"train_loss": -6.5037455558776855, "global_step": 114455, "epoch": 2725} {"train_loss": -6.346320152282715, "global_step": 114456, "epoch": 2725} {"train_loss": -6.361979961395264, "global_step": 114457, "epoch": 2725} {"train_loss": -6.528688430786133, "global_step": 114458, "epoch": 2725} {"train_loss": -6.413434028625488, "global_step": 114459, "epoch": 2725} {"train_loss": -6.332794189453125, "global_step": 114460, "epoch": 2725} {"train_loss": -6.388950824737549, "global_step": 114461, "epoch": 2725} {"train_loss": -6.377811431884766, "global_step": 114462, "epoch": 2725} {"train_loss": -6.367633819580078, "global_step": 114463, "epoch": 2725} {"train_loss": -6.437172889709473, "global_step": 114464, "epoch": 2725} {"train_loss": -6.563905715942383, "global_step": 114465, "epoch": 2725} {"train_loss": -6.511754989624023, "global_step": 114466, "epoch": 2725} {"train_loss": -6.435074806213379, "global_step": 114467, "epoch": 2725} {"train_loss": -6.3774824142456055, "global_step": 114468, "epoch": 2725} {"train_loss": -6.442413806915283, "global_step": 114469, "epoch": 2725} {"train_loss": -6.475227355957031, "global_step": 114470, "epoch": 2725} {"train_loss": -6.419886589050293, "global_step": 114471, "epoch": 2725} {"train_loss": -6.427162170410156, "global_step": 114472, "epoch": 2725} {"train_loss": -6.521409034729004, "global_step": 114473, "epoch": 2725} {"train_loss": -6.528811454772949, "global_step": 114474, "epoch": 2725} {"train_loss": -6.514003753662109, "global_step": 114475, "epoch": 2725} {"train_loss": -6.451442241668701, "global_step": 114476, "epoch": 2725} {"train_loss": -6.54819393157959, "global_step": 114477, "epoch": 2725} {"train_loss": -6.391369819641113, "global_step": 114478, "epoch": 2725} {"train_loss": -6.513781547546387, "global_step": 114479, "epoch": 2725} {"train_loss": -6.429052352905273, "global_step": 114480, "epoch": 2725} {"train_loss": -6.499544143676758, "global_step": 114481, "epoch": 2725} {"train_loss": -6.531970500946045, "global_step": 114482, "epoch": 2725} {"train_loss": -6.449807167053223, "global_step": 114483, "epoch": 2725} {"train_loss": -6.593866348266602, "global_step": 114484, "epoch": 2725} {"train_loss": -6.508694171905518, "global_step": 114485, "epoch": 2725} {"train_loss": -6.465671062469482, "global_step": 114486, "epoch": 2725} {"train_loss": -6.486443519592285, "global_step": 114487, "epoch": 2725} {"train_loss": -6.620649337768555, "global_step": 114488, "epoch": 2725} {"train_loss": -6.620438098907471, "global_step": 114489, "epoch": 2725} {"train_loss": -6.406976699829102, "global_step": 114490, "epoch": 2725} {"train_loss": -6.457284802482242, "global_step": 114491, "epoch": 2725, "val_loss": 67864.7109375} {"train_loss": -6.342988967895508, "global_step": 114492, "epoch": 2726} {"train_loss": -6.5414533615112305, "global_step": 114493, "epoch": 2726} {"train_loss": -6.519151210784912, "global_step": 114494, "epoch": 2726} {"train_loss": -6.428467750549316, "global_step": 114495, "epoch": 2726} {"train_loss": -6.535679817199707, "global_step": 114496, "epoch": 2726} {"train_loss": -6.523365497589111, "global_step": 114497, "epoch": 2726} {"train_loss": -6.393786430358887, "global_step": 114498, "epoch": 2726} {"train_loss": -6.497594833374023, "global_step": 114499, "epoch": 2726} {"train_loss": -6.450551986694336, "global_step": 114500, "epoch": 2726} {"train_loss": -6.463604927062988, "global_step": 114501, "epoch": 2726} {"train_loss": -6.509406089782715, "global_step": 114502, "epoch": 2726} {"train_loss": -6.4656853675842285, "global_step": 114503, "epoch": 2726} {"train_loss": -6.50816535949707, "global_step": 114504, "epoch": 2726} {"train_loss": -6.443636417388916, "global_step": 114505, "epoch": 2726} {"train_loss": -6.379295349121094, "global_step": 114506, "epoch": 2726} {"train_loss": -6.626139163970947, "global_step": 114507, "epoch": 2726} {"train_loss": -6.394821643829346, "global_step": 114508, "epoch": 2726} {"train_loss": -6.4348907470703125, "global_step": 114509, "epoch": 2726} {"train_loss": -6.41902494430542, "global_step": 114510, "epoch": 2726} {"train_loss": -6.307796478271484, "global_step": 114511, "epoch": 2726} {"train_loss": -6.444379806518555, "global_step": 114512, "epoch": 2726} {"train_loss": -6.466819763183594, "global_step": 114513, "epoch": 2726} {"train_loss": -6.339188575744629, "global_step": 114514, "epoch": 2726} {"train_loss": -6.546087741851807, "global_step": 114515, "epoch": 2726} {"train_loss": -6.4961700439453125, "global_step": 114516, "epoch": 2726} {"train_loss": -6.458586692810059, "global_step": 114517, "epoch": 2726} {"train_loss": -6.475563049316406, "global_step": 114518, "epoch": 2726} {"train_loss": -6.466483116149902, "global_step": 114519, "epoch": 2726} {"train_loss": -6.380867004394531, "global_step": 114520, "epoch": 2726} {"train_loss": -6.460463523864746, "global_step": 114521, "epoch": 2726} {"train_loss": -6.548583507537842, "global_step": 114522, "epoch": 2726} {"train_loss": -6.464620590209961, "global_step": 114523, "epoch": 2726} {"train_loss": -6.465143203735352, "global_step": 114524, "epoch": 2726} {"train_loss": -6.403628349304199, "global_step": 114525, "epoch": 2726} {"train_loss": -6.555612564086914, "global_step": 114526, "epoch": 2726} {"train_loss": -6.547463417053223, "global_step": 114527, "epoch": 2726} {"train_loss": -6.500821113586426, "global_step": 114528, "epoch": 2726} {"train_loss": -6.695797920227051, "global_step": 114529, "epoch": 2726} {"train_loss": -6.445857048034668, "global_step": 114530, "epoch": 2726} {"train_loss": -6.4690446853637695, "global_step": 114531, "epoch": 2726} {"train_loss": -6.48005485534668, "global_step": 114532, "epoch": 2726} {"train_loss": -6.471427758534749, "global_step": 114533, "epoch": 2726, "val_loss": 67950.6953125} {"train_loss": -6.343235015869141, "global_step": 114534, "epoch": 2727} {"train_loss": -6.52143669128418, "global_step": 114535, "epoch": 2727} {"train_loss": -6.414213180541992, "global_step": 114536, "epoch": 2727} {"train_loss": -6.518775463104248, "global_step": 114537, "epoch": 2727} {"train_loss": -6.466493129730225, "global_step": 114538, "epoch": 2727} {"train_loss": -6.6087446212768555, "global_step": 114539, "epoch": 2727} {"train_loss": -6.447604179382324, "global_step": 114540, "epoch": 2727} {"train_loss": -6.402352333068848, "global_step": 114541, "epoch": 2727} {"train_loss": -6.550882339477539, "global_step": 114542, "epoch": 2727} {"train_loss": -6.541766166687012, "global_step": 114543, "epoch": 2727} {"train_loss": -6.576850891113281, "global_step": 114544, "epoch": 2727} {"train_loss": -6.5055832862854, "global_step": 114545, "epoch": 2727} {"train_loss": -6.585014343261719, "global_step": 114546, "epoch": 2727} {"train_loss": -6.571127891540527, "global_step": 114547, "epoch": 2727} {"train_loss": -6.4904680252075195, "global_step": 114548, "epoch": 2727} {"train_loss": -6.512573719024658, "global_step": 114549, "epoch": 2727} {"train_loss": -6.404702186584473, "global_step": 114550, "epoch": 2727} {"train_loss": -6.506389617919922, "global_step": 114551, "epoch": 2727} {"train_loss": -6.542376518249512, "global_step": 114552, "epoch": 2727} {"train_loss": -6.546393871307373, "global_step": 114553, "epoch": 2727} {"train_loss": -6.348749160766602, "global_step": 114554, "epoch": 2727} {"train_loss": -6.4354939460754395, "global_step": 114555, "epoch": 2727} {"train_loss": -6.4188232421875, "global_step": 114556, "epoch": 2727} {"train_loss": -6.50305700302124, "global_step": 114557, "epoch": 2727} {"train_loss": -6.449797630310059, "global_step": 114558, "epoch": 2727} {"train_loss": -6.493252754211426, "global_step": 114559, "epoch": 2727} {"train_loss": -6.403099060058594, "global_step": 114560, "epoch": 2727} {"train_loss": -6.400078773498535, "global_step": 114561, "epoch": 2727} {"train_loss": -6.507613182067871, "global_step": 114562, "epoch": 2727} {"train_loss": -6.441061973571777, "global_step": 114563, "epoch": 2727} {"train_loss": -6.398684024810791, "global_step": 114564, "epoch": 2727} {"train_loss": -6.462160587310791, "global_step": 114565, "epoch": 2727} {"train_loss": -6.484594821929932, "global_step": 114566, "epoch": 2727} {"train_loss": -6.480771064758301, "global_step": 114567, "epoch": 2727} {"train_loss": -6.4660964012146, "global_step": 114568, "epoch": 2727} {"train_loss": -6.49850606918335, "global_step": 114569, "epoch": 2727} {"train_loss": -6.501113414764404, "global_step": 114570, "epoch": 2727} {"train_loss": -6.492762565612793, "global_step": 114571, "epoch": 2727} {"train_loss": -6.518562316894531, "global_step": 114572, "epoch": 2727} {"train_loss": -6.448497772216797, "global_step": 114573, "epoch": 2727} {"train_loss": -6.419840335845947, "global_step": 114574, "epoch": 2727} {"train_loss": -6.480593931107294, "global_step": 114575, "epoch": 2727, "val_loss": 67971.40625} {"train_loss": -6.373679161071777, "global_step": 114576, "epoch": 2728} {"train_loss": -6.354558944702148, "global_step": 114577, "epoch": 2728} {"train_loss": -6.539334297180176, "global_step": 114578, "epoch": 2728} {"train_loss": -6.435527324676514, "global_step": 114579, "epoch": 2728} {"train_loss": -6.48862361907959, "global_step": 114580, "epoch": 2728} {"train_loss": -6.459914207458496, "global_step": 114581, "epoch": 2728} {"train_loss": -6.479767799377441, "global_step": 114582, "epoch": 2728} {"train_loss": -6.623324871063232, "global_step": 114583, "epoch": 2728} {"train_loss": -6.449631690979004, "global_step": 114584, "epoch": 2728} {"train_loss": -6.42849063873291, "global_step": 114585, "epoch": 2728} {"train_loss": -6.420182228088379, "global_step": 114586, "epoch": 2728} {"train_loss": -6.553530693054199, "global_step": 114587, "epoch": 2728} {"train_loss": -6.49979305267334, "global_step": 114588, "epoch": 2728} {"train_loss": -6.617005348205566, "global_step": 114589, "epoch": 2728} {"train_loss": -6.477534294128418, "global_step": 114590, "epoch": 2728} {"train_loss": -6.518579483032227, "global_step": 114591, "epoch": 2728} {"train_loss": -6.57484245300293, "global_step": 114592, "epoch": 2728} {"train_loss": -6.552584648132324, "global_step": 114593, "epoch": 2728} {"train_loss": -6.4284796714782715, "global_step": 114594, "epoch": 2728} {"train_loss": -6.5377349853515625, "global_step": 114595, "epoch": 2728} {"train_loss": -6.480288505554199, "global_step": 114596, "epoch": 2728} {"train_loss": -6.351806163787842, "global_step": 114597, "epoch": 2728} {"train_loss": -6.483869552612305, "global_step": 114598, "epoch": 2728} {"train_loss": -6.464461326599121, "global_step": 114599, "epoch": 2728} {"train_loss": -6.403083801269531, "global_step": 114600, "epoch": 2728} {"train_loss": -6.413602828979492, "global_step": 114601, "epoch": 2728} {"train_loss": -6.400702476501465, "global_step": 114602, "epoch": 2728} {"train_loss": -6.480294227600098, "global_step": 114603, "epoch": 2728} {"train_loss": -6.402788162231445, "global_step": 114604, "epoch": 2728} {"train_loss": -6.441283226013184, "global_step": 114605, "epoch": 2728} {"train_loss": -6.449796676635742, "global_step": 114606, "epoch": 2728} {"train_loss": -6.496459007263184, "global_step": 114607, "epoch": 2728} {"train_loss": -6.392816543579102, "global_step": 114608, "epoch": 2728} {"train_loss": -6.399068355560303, "global_step": 114609, "epoch": 2728} {"train_loss": -6.413761615753174, "global_step": 114610, "epoch": 2728} {"train_loss": -6.525240898132324, "global_step": 114611, "epoch": 2728} {"train_loss": -6.5259528160095215, "global_step": 114612, "epoch": 2728} {"train_loss": -6.427604675292969, "global_step": 114613, "epoch": 2728} {"train_loss": -6.511435508728027, "global_step": 114614, "epoch": 2728} {"train_loss": -6.627972602844238, "global_step": 114615, "epoch": 2728} {"train_loss": -6.427689075469971, "global_step": 114616, "epoch": 2728} {"train_loss": -6.471972737993513, "global_step": 114617, "epoch": 2728, "val_loss": 67849.0078125} {"train_loss": -6.444925308227539, "global_step": 114618, "epoch": 2729} {"train_loss": -6.48127555847168, "global_step": 114619, "epoch": 2729} {"train_loss": -6.497809410095215, "global_step": 114620, "epoch": 2729} {"train_loss": -6.44268798828125, "global_step": 114621, "epoch": 2729} {"train_loss": -6.603137493133545, "global_step": 114622, "epoch": 2729} {"train_loss": -6.509495735168457, "global_step": 114623, "epoch": 2729} {"train_loss": -6.399453163146973, "global_step": 114624, "epoch": 2729} {"train_loss": -6.598056793212891, "global_step": 114625, "epoch": 2729} {"train_loss": -6.632294178009033, "global_step": 114626, "epoch": 2729} {"train_loss": -6.61817741394043, "global_step": 114627, "epoch": 2729} {"train_loss": -6.435323715209961, "global_step": 114628, "epoch": 2729} {"train_loss": -6.63928747177124, "global_step": 114629, "epoch": 2729} {"train_loss": -6.590349197387695, "global_step": 114630, "epoch": 2729} {"train_loss": -6.434321880340576, "global_step": 114631, "epoch": 2729} {"train_loss": -6.434493064880371, "global_step": 114632, "epoch": 2729} {"train_loss": -6.5390706062316895, "global_step": 114633, "epoch": 2729} {"train_loss": -6.552114486694336, "global_step": 114634, "epoch": 2729} {"train_loss": -6.41424036026001, "global_step": 114635, "epoch": 2729} {"train_loss": -6.4567155838012695, "global_step": 114636, "epoch": 2729} {"train_loss": -6.459454536437988, "global_step": 114637, "epoch": 2729} {"train_loss": -6.478425979614258, "global_step": 114638, "epoch": 2729} {"train_loss": -6.496991157531738, "global_step": 114639, "epoch": 2729} {"train_loss": -6.460869789123535, "global_step": 114640, "epoch": 2729} {"train_loss": -6.529193878173828, "global_step": 114641, "epoch": 2729} {"train_loss": -6.480751991271973, "global_step": 114642, "epoch": 2729} {"train_loss": -6.488725662231445, "global_step": 114643, "epoch": 2729} {"train_loss": -6.468356609344482, "global_step": 114644, "epoch": 2729} {"train_loss": -6.306436538696289, "global_step": 114645, "epoch": 2729} {"train_loss": -6.622650623321533, "global_step": 114646, "epoch": 2729} {"train_loss": -6.5362653732299805, "global_step": 114647, "epoch": 2729} {"train_loss": -6.50107479095459, "global_step": 114648, "epoch": 2729} {"train_loss": -6.3392791748046875, "global_step": 114649, "epoch": 2729} {"train_loss": -6.5249528884887695, "global_step": 114650, "epoch": 2729} {"train_loss": -6.580456256866455, "global_step": 114651, "epoch": 2729} {"train_loss": -6.570277690887451, "global_step": 114652, "epoch": 2729} {"train_loss": -6.615133285522461, "global_step": 114653, "epoch": 2729} {"train_loss": -6.3910627365112305, "global_step": 114654, "epoch": 2729} {"train_loss": -6.453289985656738, "global_step": 114655, "epoch": 2729} {"train_loss": -6.508403778076172, "global_step": 114656, "epoch": 2729} {"train_loss": -6.468048095703125, "global_step": 114657, "epoch": 2729} {"train_loss": -6.479661464691162, "global_step": 114658, "epoch": 2729} {"train_loss": -6.501884210677374, "global_step": 114659, "epoch": 2729, "val_loss": 67832.2578125} {"train_loss": -6.510950565338135, "global_step": 114660, "epoch": 2730} {"train_loss": -6.441305160522461, "global_step": 114661, "epoch": 2730} {"train_loss": -6.519711494445801, "global_step": 114662, "epoch": 2730} {"train_loss": -6.4659104347229, "global_step": 114663, "epoch": 2730} {"train_loss": -6.452408313751221, "global_step": 114664, "epoch": 2730} {"train_loss": -6.5157999992370605, "global_step": 114665, "epoch": 2730} {"train_loss": -6.490571022033691, "global_step": 114666, "epoch": 2730} {"train_loss": -6.539790153503418, "global_step": 114667, "epoch": 2730} {"train_loss": -6.445738792419434, "global_step": 114668, "epoch": 2730} {"train_loss": -6.34969425201416, "global_step": 114669, "epoch": 2730} {"train_loss": -6.4372968673706055, "global_step": 114670, "epoch": 2730} {"train_loss": -6.523118495941162, "global_step": 114671, "epoch": 2730} {"train_loss": -6.489156723022461, "global_step": 114672, "epoch": 2730} {"train_loss": -6.528524875640869, "global_step": 114673, "epoch": 2730} {"train_loss": -6.539031982421875, "global_step": 114674, "epoch": 2730} {"train_loss": -6.449679374694824, "global_step": 114675, "epoch": 2730} {"train_loss": -6.525637626647949, "global_step": 114676, "epoch": 2730} {"train_loss": -6.421355724334717, "global_step": 114677, "epoch": 2730} {"train_loss": -6.51288366317749, "global_step": 114678, "epoch": 2730} {"train_loss": -6.499821662902832, "global_step": 114679, "epoch": 2730} {"train_loss": -6.404767036437988, "global_step": 114680, "epoch": 2730} {"train_loss": -6.503408908843994, "global_step": 114681, "epoch": 2730} {"train_loss": -6.541378974914551, "global_step": 114682, "epoch": 2730} {"train_loss": -6.550236701965332, "global_step": 114683, "epoch": 2730} {"train_loss": -6.603884696960449, "global_step": 114684, "epoch": 2730} {"train_loss": -6.473798751831055, "global_step": 114685, "epoch": 2730} {"train_loss": -6.290821075439453, "global_step": 114686, "epoch": 2730} {"train_loss": -6.534313678741455, "global_step": 114687, "epoch": 2730} {"train_loss": -6.465500354766846, "global_step": 114688, "epoch": 2730} {"train_loss": -6.504893779754639, "global_step": 114689, "epoch": 2730} {"train_loss": -6.559953212738037, "global_step": 114690, "epoch": 2730} {"train_loss": -6.572120189666748, "global_step": 114691, "epoch": 2730} {"train_loss": -6.504042625427246, "global_step": 114692, "epoch": 2730} {"train_loss": -6.404641151428223, "global_step": 114693, "epoch": 2730} {"train_loss": -6.482964992523193, "global_step": 114694, "epoch": 2730} {"train_loss": -6.475944995880127, "global_step": 114695, "epoch": 2730} {"train_loss": -6.584400177001953, "global_step": 114696, "epoch": 2730} {"train_loss": -6.344897270202637, "global_step": 114697, "epoch": 2730} {"train_loss": -6.46126651763916, "global_step": 114698, "epoch": 2730} {"train_loss": -6.428006172180176, "global_step": 114699, "epoch": 2730} {"train_loss": -6.524226665496826, "global_step": 114700, "epoch": 2730} {"train_loss": -6.484986248470488, "global_step": 114701, "epoch": 2730, "val_loss": 67907.0859375} {"train_loss": -6.490075588226318, "global_step": 114702, "epoch": 2731} {"train_loss": -6.405089378356934, "global_step": 114703, "epoch": 2731} {"train_loss": -6.461856842041016, "global_step": 114704, "epoch": 2731} {"train_loss": -6.48913049697876, "global_step": 114705, "epoch": 2731} {"train_loss": -6.52140998840332, "global_step": 114706, "epoch": 2731} {"train_loss": -6.533840656280518, "global_step": 114707, "epoch": 2731} {"train_loss": -6.448205471038818, "global_step": 114708, "epoch": 2731} {"train_loss": -6.483205318450928, "global_step": 114709, "epoch": 2731} {"train_loss": -6.434283256530762, "global_step": 114710, "epoch": 2731} {"train_loss": -6.427646636962891, "global_step": 114711, "epoch": 2731} {"train_loss": -6.432443141937256, "global_step": 114712, "epoch": 2731} {"train_loss": -6.461508750915527, "global_step": 114713, "epoch": 2731} {"train_loss": -6.44957160949707, "global_step": 114714, "epoch": 2731} {"train_loss": -6.495552062988281, "global_step": 114715, "epoch": 2731} {"train_loss": -6.444817543029785, "global_step": 114716, "epoch": 2731} {"train_loss": -6.431268692016602, "global_step": 114717, "epoch": 2731} {"train_loss": -6.487417221069336, "global_step": 114718, "epoch": 2731} {"train_loss": -6.384421348571777, "global_step": 114719, "epoch": 2731} {"train_loss": -6.491545677185059, "global_step": 114720, "epoch": 2731} {"train_loss": -6.387373924255371, "global_step": 114721, "epoch": 2731} {"train_loss": -6.427512168884277, "global_step": 114722, "epoch": 2731} {"train_loss": -6.3904619216918945, "global_step": 114723, "epoch": 2731} {"train_loss": -6.401853084564209, "global_step": 114724, "epoch": 2731} {"train_loss": -6.413902759552002, "global_step": 114725, "epoch": 2731} {"train_loss": -6.295389175415039, "global_step": 114726, "epoch": 2731} {"train_loss": -6.408238410949707, "global_step": 114727, "epoch": 2731} {"train_loss": -6.420138359069824, "global_step": 114728, "epoch": 2731} {"train_loss": -6.44001579284668, "global_step": 114729, "epoch": 2731} {"train_loss": -6.370401382446289, "global_step": 114730, "epoch": 2731} {"train_loss": -6.508935451507568, "global_step": 114731, "epoch": 2731} {"train_loss": -6.4044575691223145, "global_step": 114732, "epoch": 2731} {"train_loss": -6.492986679077148, "global_step": 114733, "epoch": 2731} {"train_loss": -6.542569160461426, "global_step": 114734, "epoch": 2731} {"train_loss": -6.334304332733154, "global_step": 114735, "epoch": 2731} {"train_loss": -6.468179702758789, "global_step": 114736, "epoch": 2731} {"train_loss": -6.392102241516113, "global_step": 114737, "epoch": 2731} {"train_loss": -6.532496452331543, "global_step": 114738, "epoch": 2731} {"train_loss": -6.354185104370117, "global_step": 114739, "epoch": 2731} {"train_loss": -6.4214324951171875, "global_step": 114740, "epoch": 2731} {"train_loss": -6.4608564376831055, "global_step": 114741, "epoch": 2731} {"train_loss": -6.317673683166504, "global_step": 114742, "epoch": 2731} {"train_loss": -6.4375151452564054, "global_step": 114743, "epoch": 2731, "val_loss": 67694.9453125} {"train_loss": -6.476950168609619, "global_step": 114744, "epoch": 2732} {"train_loss": -6.368168830871582, "global_step": 114745, "epoch": 2732} {"train_loss": -6.449253559112549, "global_step": 114746, "epoch": 2732} {"train_loss": -6.445742607116699, "global_step": 114747, "epoch": 2732} {"train_loss": -6.458037376403809, "global_step": 114748, "epoch": 2732} {"train_loss": -6.501626014709473, "global_step": 114749, "epoch": 2732} {"train_loss": -6.433254241943359, "global_step": 114750, "epoch": 2732} {"train_loss": -6.562216758728027, "global_step": 114751, "epoch": 2732} {"train_loss": -6.467147350311279, "global_step": 114752, "epoch": 2732} {"train_loss": -6.4495015144348145, "global_step": 114753, "epoch": 2732} {"train_loss": -6.436573028564453, "global_step": 114754, "epoch": 2732} {"train_loss": -6.569267272949219, "global_step": 114755, "epoch": 2732} {"train_loss": -6.461001873016357, "global_step": 114756, "epoch": 2732} {"train_loss": -6.615727424621582, "global_step": 114757, "epoch": 2732} {"train_loss": -6.5081024169921875, "global_step": 114758, "epoch": 2732} {"train_loss": -6.554987907409668, "global_step": 114759, "epoch": 2732} {"train_loss": -6.491911888122559, "global_step": 114760, "epoch": 2732} {"train_loss": -6.499178886413574, "global_step": 114761, "epoch": 2732} {"train_loss": -6.447318077087402, "global_step": 114762, "epoch": 2732} {"train_loss": -6.500148773193359, "global_step": 114763, "epoch": 2732} {"train_loss": -6.388278007507324, "global_step": 114764, "epoch": 2732} {"train_loss": -6.470273971557617, "global_step": 114765, "epoch": 2732} {"train_loss": -6.387931823730469, "global_step": 114766, "epoch": 2732} {"train_loss": -6.5612382888793945, "global_step": 114767, "epoch": 2732} {"train_loss": -6.557058334350586, "global_step": 114768, "epoch": 2732} {"train_loss": -6.405401229858398, "global_step": 114769, "epoch": 2732} {"train_loss": -6.576423645019531, "global_step": 114770, "epoch": 2732} {"train_loss": -6.557610988616943, "global_step": 114771, "epoch": 2732} {"train_loss": -6.423041343688965, "global_step": 114772, "epoch": 2732} {"train_loss": -6.578819274902344, "global_step": 114773, "epoch": 2732} {"train_loss": -6.435983180999756, "global_step": 114774, "epoch": 2732} {"train_loss": -6.29527473449707, "global_step": 114775, "epoch": 2732} {"train_loss": -6.448023796081543, "global_step": 114776, "epoch": 2732} {"train_loss": -6.3549957275390625, "global_step": 114777, "epoch": 2732} {"train_loss": -6.453169822692871, "global_step": 114778, "epoch": 2732} {"train_loss": -6.562538146972656, "global_step": 114779, "epoch": 2732} {"train_loss": -6.418992042541504, "global_step": 114780, "epoch": 2732} {"train_loss": -6.372269153594971, "global_step": 114781, "epoch": 2732} {"train_loss": -6.450894355773926, "global_step": 114782, "epoch": 2732} {"train_loss": -6.419855117797852, "global_step": 114783, "epoch": 2732} {"train_loss": -6.457311630249023, "global_step": 114784, "epoch": 2732} {"train_loss": -6.469153029578073, "global_step": 114785, "epoch": 2732, "val_loss": 68004.59375} {"train_loss": -6.499778747558594, "global_step": 114786, "epoch": 2733} {"train_loss": -6.519384384155273, "global_step": 114787, "epoch": 2733} {"train_loss": -6.554866790771484, "global_step": 114788, "epoch": 2733} {"train_loss": -6.511836528778076, "global_step": 114789, "epoch": 2733} {"train_loss": -6.516266822814941, "global_step": 114790, "epoch": 2733} {"train_loss": -6.465348243713379, "global_step": 114791, "epoch": 2733} {"train_loss": -6.532088279724121, "global_step": 114792, "epoch": 2733} {"train_loss": -6.567795276641846, "global_step": 114793, "epoch": 2733} {"train_loss": -6.313948631286621, "global_step": 114794, "epoch": 2733} {"train_loss": -6.500125885009766, "global_step": 114795, "epoch": 2733} {"train_loss": -6.4842987060546875, "global_step": 114796, "epoch": 2733} {"train_loss": -6.520586967468262, "global_step": 114797, "epoch": 2733} {"train_loss": -6.4142165184021, "global_step": 114798, "epoch": 2733} {"train_loss": -6.523272514343262, "global_step": 114799, "epoch": 2733} {"train_loss": -6.627814292907715, "global_step": 114800, "epoch": 2733} {"train_loss": -6.521247863769531, "global_step": 114801, "epoch": 2733} {"train_loss": -6.483929634094238, "global_step": 114802, "epoch": 2733} {"train_loss": -6.5737810134887695, "global_step": 114803, "epoch": 2733} {"train_loss": -6.518707275390625, "global_step": 114804, "epoch": 2733} {"train_loss": -6.483852386474609, "global_step": 114805, "epoch": 2733} {"train_loss": -6.379362106323242, "global_step": 114806, "epoch": 2733} {"train_loss": -6.582018852233887, "global_step": 114807, "epoch": 2733} {"train_loss": -6.505660057067871, "global_step": 114808, "epoch": 2733} {"train_loss": -6.6088738441467285, "global_step": 114809, "epoch": 2733} {"train_loss": -6.614066123962402, "global_step": 114810, "epoch": 2733} {"train_loss": -6.418994903564453, "global_step": 114811, "epoch": 2733} {"train_loss": -6.419564247131348, "global_step": 114812, "epoch": 2733} {"train_loss": -6.521312713623047, "global_step": 114813, "epoch": 2733} {"train_loss": -6.501216888427734, "global_step": 114814, "epoch": 2733} {"train_loss": -6.514538764953613, "global_step": 114815, "epoch": 2733} {"train_loss": -6.544909477233887, "global_step": 114816, "epoch": 2733} {"train_loss": -6.520877838134766, "global_step": 114817, "epoch": 2733} {"train_loss": -6.495500564575195, "global_step": 114818, "epoch": 2733} {"train_loss": -6.558394432067871, "global_step": 114819, "epoch": 2733} {"train_loss": -6.536764621734619, "global_step": 114820, "epoch": 2733} {"train_loss": -6.458648681640625, "global_step": 114821, "epoch": 2733} {"train_loss": -6.442195415496826, "global_step": 114822, "epoch": 2733} {"train_loss": -6.505434989929199, "global_step": 114823, "epoch": 2733} {"train_loss": -6.425597667694092, "global_step": 114824, "epoch": 2733} {"train_loss": -6.503909587860107, "global_step": 114825, "epoch": 2733} {"train_loss": -6.454275131225586, "global_step": 114826, "epoch": 2733} {"train_loss": -6.5035834312438965, "global_step": 114827, "epoch": 2733, "val_loss": 67758.828125} {"train_loss": -6.461965084075928, "global_step": 114828, "epoch": 2734} {"train_loss": -6.554888725280762, "global_step": 114829, "epoch": 2734} {"train_loss": -6.5074944496154785, "global_step": 114830, "epoch": 2734} {"train_loss": -6.641117572784424, "global_step": 114831, "epoch": 2734} {"train_loss": -6.52357816696167, "global_step": 114832, "epoch": 2734} {"train_loss": -6.477404594421387, "global_step": 114833, "epoch": 2734} {"train_loss": -6.463009357452393, "global_step": 114834, "epoch": 2734} {"train_loss": -6.497994422912598, "global_step": 114835, "epoch": 2734} {"train_loss": -6.506838798522949, "global_step": 114836, "epoch": 2734} {"train_loss": -6.495732307434082, "global_step": 114837, "epoch": 2734} {"train_loss": -6.55499267578125, "global_step": 114838, "epoch": 2734} {"train_loss": -6.569644451141357, "global_step": 114839, "epoch": 2734} {"train_loss": -6.548153400421143, "global_step": 114840, "epoch": 2734} {"train_loss": -6.437473297119141, "global_step": 114841, "epoch": 2734} {"train_loss": -6.428711891174316, "global_step": 114842, "epoch": 2734} {"train_loss": -6.5021467208862305, "global_step": 114843, "epoch": 2734} {"train_loss": -6.472897052764893, "global_step": 114844, "epoch": 2734} {"train_loss": -6.329230308532715, "global_step": 114845, "epoch": 2734} {"train_loss": -6.529297828674316, "global_step": 114846, "epoch": 2734} {"train_loss": -6.400359153747559, "global_step": 114847, "epoch": 2734} {"train_loss": -6.50494384765625, "global_step": 114848, "epoch": 2734} {"train_loss": -6.477076530456543, "global_step": 114849, "epoch": 2734} {"train_loss": -6.387510776519775, "global_step": 114850, "epoch": 2734} {"train_loss": -6.488131999969482, "global_step": 114851, "epoch": 2734} {"train_loss": -6.511338233947754, "global_step": 114852, "epoch": 2734} {"train_loss": -6.4458489418029785, "global_step": 114853, "epoch": 2734} {"train_loss": -6.4983229637146, "global_step": 114854, "epoch": 2734} {"train_loss": -6.428565502166748, "global_step": 114855, "epoch": 2734} {"train_loss": -6.485939979553223, "global_step": 114856, "epoch": 2734} {"train_loss": -6.451295852661133, "global_step": 114857, "epoch": 2734} {"train_loss": -6.438762187957764, "global_step": 114858, "epoch": 2734} {"train_loss": -6.379947662353516, "global_step": 114859, "epoch": 2734} {"train_loss": -6.553906440734863, "global_step": 114860, "epoch": 2734} {"train_loss": -6.377650260925293, "global_step": 114861, "epoch": 2734} {"train_loss": -6.635867118835449, "global_step": 114862, "epoch": 2734} {"train_loss": -6.476367950439453, "global_step": 114863, "epoch": 2734} {"train_loss": -6.512380599975586, "global_step": 114864, "epoch": 2734} {"train_loss": -6.512104511260986, "global_step": 114865, "epoch": 2734} {"train_loss": -6.555913925170898, "global_step": 114866, "epoch": 2734} {"train_loss": -6.406458854675293, "global_step": 114867, "epoch": 2734} {"train_loss": -6.545622825622559, "global_step": 114868, "epoch": 2734} {"train_loss": -6.488588219597226, "global_step": 114869, "epoch": 2734, "val_loss": 67875.171875} {"train_loss": -6.444992542266846, "global_step": 114870, "epoch": 2735} {"train_loss": -6.409165382385254, "global_step": 114871, "epoch": 2735} {"train_loss": -6.41495418548584, "global_step": 114872, "epoch": 2735} {"train_loss": -6.437252998352051, "global_step": 114873, "epoch": 2735} {"train_loss": -6.3658127784729, "global_step": 114874, "epoch": 2735} {"train_loss": -6.523704528808594, "global_step": 114875, "epoch": 2735} {"train_loss": -6.34099006652832, "global_step": 114876, "epoch": 2735} {"train_loss": -6.535797595977783, "global_step": 114877, "epoch": 2735} {"train_loss": -6.5533366203308105, "global_step": 114878, "epoch": 2735} {"train_loss": -6.492349147796631, "global_step": 114879, "epoch": 2735} {"train_loss": -6.557675361633301, "global_step": 114880, "epoch": 2735} {"train_loss": -6.486814498901367, "global_step": 114881, "epoch": 2735} {"train_loss": -6.525043487548828, "global_step": 114882, "epoch": 2735} {"train_loss": -6.507552146911621, "global_step": 114883, "epoch": 2735} {"train_loss": -6.379028797149658, "global_step": 114884, "epoch": 2735} {"train_loss": -6.62054443359375, "global_step": 114885, "epoch": 2735} {"train_loss": -6.620979309082031, "global_step": 114886, "epoch": 2735} {"train_loss": -6.511051654815674, "global_step": 114887, "epoch": 2735} {"train_loss": -6.544647216796875, "global_step": 114888, "epoch": 2735} {"train_loss": -6.430097579956055, "global_step": 114889, "epoch": 2735} {"train_loss": -6.543502330780029, "global_step": 114890, "epoch": 2735} {"train_loss": -6.600840091705322, "global_step": 114891, "epoch": 2735} {"train_loss": -6.454221248626709, "global_step": 114892, "epoch": 2735} {"train_loss": -6.6495137214660645, "global_step": 114893, "epoch": 2735} {"train_loss": -6.402053356170654, "global_step": 114894, "epoch": 2735} {"train_loss": -6.356488227844238, "global_step": 114895, "epoch": 2735} {"train_loss": -6.542851448059082, "global_step": 114896, "epoch": 2735} {"train_loss": -6.410933494567871, "global_step": 114897, "epoch": 2735} {"train_loss": -6.522918701171875, "global_step": 114898, "epoch": 2735} {"train_loss": -6.536193370819092, "global_step": 114899, "epoch": 2735} {"train_loss": -6.539952278137207, "global_step": 114900, "epoch": 2735} {"train_loss": -6.410004615783691, "global_step": 114901, "epoch": 2735} {"train_loss": -6.42008113861084, "global_step": 114902, "epoch": 2735} {"train_loss": -6.316709041595459, "global_step": 114903, "epoch": 2735} {"train_loss": -6.428617477416992, "global_step": 114904, "epoch": 2735} {"train_loss": -6.367543697357178, "global_step": 114905, "epoch": 2735} {"train_loss": -6.494462966918945, "global_step": 114906, "epoch": 2735} {"train_loss": -6.485966682434082, "global_step": 114907, "epoch": 2735} {"train_loss": -6.417151927947998, "global_step": 114908, "epoch": 2735} {"train_loss": -6.51922607421875, "global_step": 114909, "epoch": 2735} {"train_loss": -6.3490142822265625, "global_step": 114910, "epoch": 2735} {"train_loss": -6.476311365763347, "global_step": 114911, "epoch": 2735, "val_loss": 68051.3984375} {"train_loss": -6.544666290283203, "global_step": 114912, "epoch": 2736} {"train_loss": -6.549045562744141, "global_step": 114913, "epoch": 2736} {"train_loss": -6.5028886795043945, "global_step": 114914, "epoch": 2736} {"train_loss": -6.424713134765625, "global_step": 114915, "epoch": 2736} {"train_loss": -6.386115550994873, "global_step": 114916, "epoch": 2736} {"train_loss": -6.478395462036133, "global_step": 114917, "epoch": 2736} {"train_loss": -6.475484371185303, "global_step": 114918, "epoch": 2736} {"train_loss": -6.434491157531738, "global_step": 114919, "epoch": 2736} {"train_loss": -6.359627723693848, "global_step": 114920, "epoch": 2736} {"train_loss": -6.52082633972168, "global_step": 114921, "epoch": 2736} {"train_loss": -6.429924964904785, "global_step": 114922, "epoch": 2736} {"train_loss": -6.435693264007568, "global_step": 114923, "epoch": 2736} {"train_loss": -6.4334306716918945, "global_step": 114924, "epoch": 2736} {"train_loss": -6.450428009033203, "global_step": 114925, "epoch": 2736} {"train_loss": -6.386634826660156, "global_step": 114926, "epoch": 2736} {"train_loss": -6.343807697296143, "global_step": 114927, "epoch": 2736} {"train_loss": -6.480420112609863, "global_step": 114928, "epoch": 2736} {"train_loss": -6.436407089233398, "global_step": 114929, "epoch": 2736} {"train_loss": -6.46024227142334, "global_step": 114930, "epoch": 2736} {"train_loss": -6.516419887542725, "global_step": 114931, "epoch": 2736} {"train_loss": -6.413550853729248, "global_step": 114932, "epoch": 2736} {"train_loss": -6.546327590942383, "global_step": 114933, "epoch": 2736} {"train_loss": -6.517528533935547, "global_step": 114934, "epoch": 2736} {"train_loss": -6.464717864990234, "global_step": 114935, "epoch": 2736} {"train_loss": -6.451927185058594, "global_step": 114936, "epoch": 2736} {"train_loss": -6.522461891174316, "global_step": 114937, "epoch": 2736} {"train_loss": -6.544102668762207, "global_step": 114938, "epoch": 2736} {"train_loss": -6.484323501586914, "global_step": 114939, "epoch": 2736} {"train_loss": -6.494263648986816, "global_step": 114940, "epoch": 2736} {"train_loss": -6.359124183654785, "global_step": 114941, "epoch": 2736} {"train_loss": -6.447910308837891, "global_step": 114942, "epoch": 2736} {"train_loss": -6.491644859313965, "global_step": 114943, "epoch": 2736} {"train_loss": -6.496157169342041, "global_step": 114944, "epoch": 2736} {"train_loss": -6.499845504760742, "global_step": 114945, "epoch": 2736} {"train_loss": -6.4456682205200195, "global_step": 114946, "epoch": 2736} {"train_loss": -6.367345809936523, "global_step": 114947, "epoch": 2736} {"train_loss": -6.623446941375732, "global_step": 114948, "epoch": 2736} {"train_loss": -6.447542190551758, "global_step": 114949, "epoch": 2736} {"train_loss": -6.484555244445801, "global_step": 114950, "epoch": 2736} {"train_loss": -6.41086483001709, "global_step": 114951, "epoch": 2736} {"train_loss": -6.462215423583984, "global_step": 114952, "epoch": 2736} {"train_loss": -6.466162443161011, "global_step": 114953, "epoch": 2736, "val_loss": 67810.4609375} {"train_loss": -6.564035415649414, "global_step": 114954, "epoch": 2737} {"train_loss": -6.509761810302734, "global_step": 114955, "epoch": 2737} {"train_loss": -6.559808731079102, "global_step": 114956, "epoch": 2737} {"train_loss": -6.541191101074219, "global_step": 114957, "epoch": 2737} {"train_loss": -6.437079429626465, "global_step": 114958, "epoch": 2737} {"train_loss": -6.567195892333984, "global_step": 114959, "epoch": 2737} {"train_loss": -6.499493598937988, "global_step": 114960, "epoch": 2737} {"train_loss": -6.481814384460449, "global_step": 114961, "epoch": 2737} {"train_loss": -6.47554874420166, "global_step": 114962, "epoch": 2737} {"train_loss": -6.298476696014404, "global_step": 114963, "epoch": 2737} {"train_loss": -6.369905471801758, "global_step": 114964, "epoch": 2737} {"train_loss": -6.368919849395752, "global_step": 114965, "epoch": 2737} {"train_loss": -6.442294120788574, "global_step": 114966, "epoch": 2737} {"train_loss": -6.455523490905762, "global_step": 114967, "epoch": 2737} {"train_loss": -6.550599575042725, "global_step": 114968, "epoch": 2737} {"train_loss": -6.492217063903809, "global_step": 114969, "epoch": 2737} {"train_loss": -6.423464775085449, "global_step": 114970, "epoch": 2737} {"train_loss": -6.542523384094238, "global_step": 114971, "epoch": 2737} {"train_loss": -6.371711730957031, "global_step": 114972, "epoch": 2737} {"train_loss": -6.381098747253418, "global_step": 114973, "epoch": 2737} {"train_loss": -6.44888162612915, "global_step": 114974, "epoch": 2737} {"train_loss": -6.41518497467041, "global_step": 114975, "epoch": 2737} {"train_loss": -6.444679260253906, "global_step": 114976, "epoch": 2737} {"train_loss": -6.462516784667969, "global_step": 114977, "epoch": 2737} {"train_loss": -6.454333305358887, "global_step": 114978, "epoch": 2737} {"train_loss": -6.5414581298828125, "global_step": 114979, "epoch": 2737} {"train_loss": -6.4882636070251465, "global_step": 114980, "epoch": 2737} {"train_loss": -6.527101516723633, "global_step": 114981, "epoch": 2737} {"train_loss": -6.495014667510986, "global_step": 114982, "epoch": 2737} {"train_loss": -6.578302383422852, "global_step": 114983, "epoch": 2737} {"train_loss": -6.488594055175781, "global_step": 114984, "epoch": 2737} {"train_loss": -6.459000587463379, "global_step": 114985, "epoch": 2737} {"train_loss": -6.537580490112305, "global_step": 114986, "epoch": 2737} {"train_loss": -6.606939315795898, "global_step": 114987, "epoch": 2737} {"train_loss": -6.535179138183594, "global_step": 114988, "epoch": 2737} {"train_loss": -6.601081371307373, "global_step": 114989, "epoch": 2737} {"train_loss": -6.496258735656738, "global_step": 114990, "epoch": 2737} {"train_loss": -6.52191162109375, "global_step": 114991, "epoch": 2737} {"train_loss": -6.515501022338867, "global_step": 114992, "epoch": 2737} {"train_loss": -6.516368389129639, "global_step": 114993, "epoch": 2737} {"train_loss": -6.415800094604492, "global_step": 114994, "epoch": 2737} {"train_loss": -6.48563764208839, "global_step": 114995, "epoch": 2737, "val_loss": 67798.859375} {"train_loss": -6.625087738037109, "global_step": 114996, "epoch": 2738} {"train_loss": -6.413324356079102, "global_step": 114997, "epoch": 2738} {"train_loss": -6.467947483062744, "global_step": 114998, "epoch": 2738} {"train_loss": -6.463894367218018, "global_step": 114999, "epoch": 2738} {"train_loss": -6.5309624671936035, "global_step": 115000, "epoch": 2738} {"train_loss": -6.540614128112793, "global_step": 115001, "epoch": 2738} {"train_loss": -6.586154460906982, "global_step": 115002, "epoch": 2738} {"train_loss": -6.4416327476501465, "global_step": 115003, "epoch": 2738} {"train_loss": -6.536499500274658, "global_step": 115004, "epoch": 2738} {"train_loss": -6.544918060302734, "global_step": 115005, "epoch": 2738} {"train_loss": -6.437614917755127, "global_step": 115006, "epoch": 2738} {"train_loss": -6.481868743896484, "global_step": 115007, "epoch": 2738} {"train_loss": -6.429380416870117, "global_step": 115008, "epoch": 2738} {"train_loss": -6.467430114746094, "global_step": 115009, "epoch": 2738} {"train_loss": -6.560018539428711, "global_step": 115010, "epoch": 2738} {"train_loss": -6.486638069152832, "global_step": 115011, "epoch": 2738} {"train_loss": -6.360313415527344, "global_step": 115012, "epoch": 2738} {"train_loss": -6.4506072998046875, "global_step": 115013, "epoch": 2738} {"train_loss": -6.279933929443359, "global_step": 115014, "epoch": 2738} {"train_loss": -6.574542999267578, "global_step": 115015, "epoch": 2738} {"train_loss": -6.429854393005371, "global_step": 115016, "epoch": 2738} {"train_loss": -6.49023962020874, "global_step": 115017, "epoch": 2738} {"train_loss": -6.5720953941345215, "global_step": 115018, "epoch": 2738} {"train_loss": -6.246821403503418, "global_step": 115019, "epoch": 2738} {"train_loss": -6.614809036254883, "global_step": 115020, "epoch": 2738} {"train_loss": -6.500585079193115, "global_step": 115021, "epoch": 2738} {"train_loss": -6.426060676574707, "global_step": 115022, "epoch": 2738} {"train_loss": -6.466792106628418, "global_step": 115023, "epoch": 2738} {"train_loss": -6.355579376220703, "global_step": 115024, "epoch": 2738} {"train_loss": -6.601582050323486, "global_step": 115025, "epoch": 2738} {"train_loss": -6.450699806213379, "global_step": 115026, "epoch": 2738} {"train_loss": -6.533084869384766, "global_step": 115027, "epoch": 2738} {"train_loss": -6.445243835449219, "global_step": 115028, "epoch": 2738} {"train_loss": -6.324731826782227, "global_step": 115029, "epoch": 2738} {"train_loss": -6.467019081115723, "global_step": 115030, "epoch": 2738} {"train_loss": -6.479485511779785, "global_step": 115031, "epoch": 2738} {"train_loss": -6.542010307312012, "global_step": 115032, "epoch": 2738} {"train_loss": -6.357524394989014, "global_step": 115033, "epoch": 2738} {"train_loss": -6.5848236083984375, "global_step": 115034, "epoch": 2738} {"train_loss": -6.451040267944336, "global_step": 115035, "epoch": 2738} {"train_loss": -6.471545219421387, "global_step": 115036, "epoch": 2738} {"train_loss": -6.474448737644014, "global_step": 115037, "epoch": 2738, "val_loss": 67972.0546875} {"train_loss": -6.528443336486816, "global_step": 115038, "epoch": 2739} {"train_loss": -6.55265998840332, "global_step": 115039, "epoch": 2739} {"train_loss": -6.445696830749512, "global_step": 115040, "epoch": 2739} {"train_loss": -6.557722091674805, "global_step": 115041, "epoch": 2739} {"train_loss": -6.524203300476074, "global_step": 115042, "epoch": 2739} {"train_loss": -6.396831512451172, "global_step": 115043, "epoch": 2739} {"train_loss": -6.410239219665527, "global_step": 115044, "epoch": 2739} {"train_loss": -6.329707145690918, "global_step": 115045, "epoch": 2739} {"train_loss": -6.311978340148926, "global_step": 115046, "epoch": 2739} {"train_loss": -6.326716423034668, "global_step": 115047, "epoch": 2739} {"train_loss": -6.413122177124023, "global_step": 115048, "epoch": 2739} {"train_loss": -6.5141801834106445, "global_step": 115049, "epoch": 2739} {"train_loss": -6.436689376831055, "global_step": 115050, "epoch": 2739} {"train_loss": -6.545346260070801, "global_step": 115051, "epoch": 2739} {"train_loss": -6.396020889282227, "global_step": 115052, "epoch": 2739} {"train_loss": -6.4520673751831055, "global_step": 115053, "epoch": 2739} {"train_loss": -6.451038360595703, "global_step": 115054, "epoch": 2739} {"train_loss": -6.349193572998047, "global_step": 115055, "epoch": 2739} {"train_loss": -6.497689723968506, "global_step": 115056, "epoch": 2739} {"train_loss": -6.34574556350708, "global_step": 115057, "epoch": 2739} {"train_loss": -6.554653644561768, "global_step": 115058, "epoch": 2739} {"train_loss": -6.4416022300720215, "global_step": 115059, "epoch": 2739} {"train_loss": -6.4019269943237305, "global_step": 115060, "epoch": 2739} {"train_loss": -6.42968225479126, "global_step": 115061, "epoch": 2739} {"train_loss": -6.317534923553467, "global_step": 115062, "epoch": 2739} {"train_loss": -6.473320960998535, "global_step": 115063, "epoch": 2739} {"train_loss": -6.233359336853027, "global_step": 115064, "epoch": 2739} {"train_loss": -6.533332824707031, "global_step": 115065, "epoch": 2739} {"train_loss": -6.3943986892700195, "global_step": 115066, "epoch": 2739} {"train_loss": -6.282123565673828, "global_step": 115067, "epoch": 2739} {"train_loss": -6.400847911834717, "global_step": 115068, "epoch": 2739} {"train_loss": -6.250824928283691, "global_step": 115069, "epoch": 2739} {"train_loss": -6.502279758453369, "global_step": 115070, "epoch": 2739} {"train_loss": -6.448236465454102, "global_step": 115071, "epoch": 2739} {"train_loss": -6.323385238647461, "global_step": 115072, "epoch": 2739} {"train_loss": -6.277736186981201, "global_step": 115073, "epoch": 2739} {"train_loss": -6.449700832366943, "global_step": 115074, "epoch": 2739} {"train_loss": -6.446270942687988, "global_step": 115075, "epoch": 2739} {"train_loss": -6.461709022521973, "global_step": 115076, "epoch": 2739} {"train_loss": -6.448960304260254, "global_step": 115077, "epoch": 2739} {"train_loss": -6.422484397888184, "global_step": 115078, "epoch": 2739} {"train_loss": -6.423984152930124, "global_step": 115079, "epoch": 2739, "val_loss": 67750.078125} {"train_loss": -6.358875274658203, "global_step": 115080, "epoch": 2740} {"train_loss": -6.5099897384643555, "global_step": 115081, "epoch": 2740} {"train_loss": -6.358683109283447, "global_step": 115082, "epoch": 2740} {"train_loss": -6.450397968292236, "global_step": 115083, "epoch": 2740} {"train_loss": -6.404529571533203, "global_step": 115084, "epoch": 2740} {"train_loss": -6.567558288574219, "global_step": 115085, "epoch": 2740} {"train_loss": -6.495380878448486, "global_step": 115086, "epoch": 2740} {"train_loss": -6.415024757385254, "global_step": 115087, "epoch": 2740} {"train_loss": -6.618376731872559, "global_step": 115088, "epoch": 2740} {"train_loss": -6.544611930847168, "global_step": 115089, "epoch": 2740} {"train_loss": -6.544323921203613, "global_step": 115090, "epoch": 2740} {"train_loss": -6.417942047119141, "global_step": 115091, "epoch": 2740} {"train_loss": -6.444458484649658, "global_step": 115092, "epoch": 2740} {"train_loss": -6.548509120941162, "global_step": 115093, "epoch": 2740} {"train_loss": -6.357926368713379, "global_step": 115094, "epoch": 2740} {"train_loss": -6.431179046630859, "global_step": 115095, "epoch": 2740} {"train_loss": -6.40739107131958, "global_step": 115096, "epoch": 2740} {"train_loss": -6.419754981994629, "global_step": 115097, "epoch": 2740} {"train_loss": -6.335484027862549, "global_step": 115098, "epoch": 2740} {"train_loss": -6.417468070983887, "global_step": 115099, "epoch": 2740} {"train_loss": -6.497714519500732, "global_step": 115100, "epoch": 2740} {"train_loss": -6.363008975982666, "global_step": 115101, "epoch": 2740} {"train_loss": -6.4173431396484375, "global_step": 115102, "epoch": 2740} {"train_loss": -6.407025337219238, "global_step": 115103, "epoch": 2740} {"train_loss": -6.419277191162109, "global_step": 115104, "epoch": 2740} {"train_loss": -6.535179615020752, "global_step": 115105, "epoch": 2740} {"train_loss": -6.449846267700195, "global_step": 115106, "epoch": 2740} {"train_loss": -6.4713544845581055, "global_step": 115107, "epoch": 2740} {"train_loss": -6.51536750793457, "global_step": 115108, "epoch": 2740} {"train_loss": -6.410800457000732, "global_step": 115109, "epoch": 2740} {"train_loss": -6.505446434020996, "global_step": 115110, "epoch": 2740} {"train_loss": -6.394802093505859, "global_step": 115111, "epoch": 2740} {"train_loss": -6.428988933563232, "global_step": 115112, "epoch": 2740} {"train_loss": -6.549527168273926, "global_step": 115113, "epoch": 2740} {"train_loss": -6.403469085693359, "global_step": 115114, "epoch": 2740} {"train_loss": -6.531335353851318, "global_step": 115115, "epoch": 2740} {"train_loss": -6.568282604217529, "global_step": 115116, "epoch": 2740} {"train_loss": -6.462859630584717, "global_step": 115117, "epoch": 2740} {"train_loss": -6.558284759521484, "global_step": 115118, "epoch": 2740} {"train_loss": -6.523421287536621, "global_step": 115119, "epoch": 2740} {"train_loss": -6.407822608947754, "global_step": 115120, "epoch": 2740} {"train_loss": -6.46333216485523, "global_step": 115121, "epoch": 2740, "val_loss": 67831.234375} {"train_loss": -6.530028343200684, "global_step": 115122, "epoch": 2741} {"train_loss": -6.494098663330078, "global_step": 115123, "epoch": 2741} {"train_loss": -6.4896697998046875, "global_step": 115124, "epoch": 2741} {"train_loss": -6.592597007751465, "global_step": 115125, "epoch": 2741} {"train_loss": -6.507280349731445, "global_step": 115126, "epoch": 2741} {"train_loss": -6.488038063049316, "global_step": 115127, "epoch": 2741} {"train_loss": -6.483233451843262, "global_step": 115128, "epoch": 2741} {"train_loss": -6.502100944519043, "global_step": 115129, "epoch": 2741} {"train_loss": -6.545940399169922, "global_step": 115130, "epoch": 2741} {"train_loss": -6.457935810089111, "global_step": 115131, "epoch": 2741} {"train_loss": -6.434695243835449, "global_step": 115132, "epoch": 2741} {"train_loss": -6.496967315673828, "global_step": 115133, "epoch": 2741} {"train_loss": -6.507327079772949, "global_step": 115134, "epoch": 2741} {"train_loss": -6.485594272613525, "global_step": 115135, "epoch": 2741} {"train_loss": -6.451692581176758, "global_step": 115136, "epoch": 2741} {"train_loss": -6.492620944976807, "global_step": 115137, "epoch": 2741} {"train_loss": -6.395843505859375, "global_step": 115138, "epoch": 2741} {"train_loss": -6.483396530151367, "global_step": 115139, "epoch": 2741} {"train_loss": -6.558869361877441, "global_step": 115140, "epoch": 2741} {"train_loss": -6.492944717407227, "global_step": 115141, "epoch": 2741} {"train_loss": -6.586190700531006, "global_step": 115142, "epoch": 2741} {"train_loss": -6.571712493896484, "global_step": 115143, "epoch": 2741} {"train_loss": -6.539445877075195, "global_step": 115144, "epoch": 2741} {"train_loss": -6.4214372634887695, "global_step": 115145, "epoch": 2741} {"train_loss": -6.476387023925781, "global_step": 115146, "epoch": 2741} {"train_loss": -6.509561538696289, "global_step": 115147, "epoch": 2741} {"train_loss": -6.432666778564453, "global_step": 115148, "epoch": 2741} {"train_loss": -6.511180877685547, "global_step": 115149, "epoch": 2741} {"train_loss": -6.521584987640381, "global_step": 115150, "epoch": 2741} {"train_loss": -6.432910919189453, "global_step": 115151, "epoch": 2741} {"train_loss": -6.492769718170166, "global_step": 115152, "epoch": 2741} {"train_loss": -6.474599361419678, "global_step": 115153, "epoch": 2741} {"train_loss": -6.54714822769165, "global_step": 115154, "epoch": 2741} {"train_loss": -6.5953264236450195, "global_step": 115155, "epoch": 2741} {"train_loss": -6.586525917053223, "global_step": 115156, "epoch": 2741} {"train_loss": -6.4399919509887695, "global_step": 115157, "epoch": 2741} {"train_loss": -6.412665367126465, "global_step": 115158, "epoch": 2741} {"train_loss": -6.44954776763916, "global_step": 115159, "epoch": 2741} {"train_loss": -6.513689041137695, "global_step": 115160, "epoch": 2741} {"train_loss": -6.549426078796387, "global_step": 115161, "epoch": 2741} {"train_loss": -6.388199806213379, "global_step": 115162, "epoch": 2741} {"train_loss": -6.493133658454532, "global_step": 115163, "epoch": 2741, "val_loss": 67875.7109375} {"train_loss": -6.57431697845459, "global_step": 115164, "epoch": 2742} {"train_loss": -6.368974685668945, "global_step": 115165, "epoch": 2742} {"train_loss": -6.511433124542236, "global_step": 115166, "epoch": 2742} {"train_loss": -6.476761817932129, "global_step": 115167, "epoch": 2742} {"train_loss": -6.489112854003906, "global_step": 115168, "epoch": 2742} {"train_loss": -6.565268516540527, "global_step": 115169, "epoch": 2742} {"train_loss": -6.445549964904785, "global_step": 115170, "epoch": 2742} {"train_loss": -6.415163993835449, "global_step": 115171, "epoch": 2742} {"train_loss": -6.531050682067871, "global_step": 115172, "epoch": 2742} {"train_loss": -6.4864044189453125, "global_step": 115173, "epoch": 2742} {"train_loss": -6.6398797035217285, "global_step": 115174, "epoch": 2742} {"train_loss": -6.5233049392700195, "global_step": 115175, "epoch": 2742} {"train_loss": -6.590956211090088, "global_step": 115176, "epoch": 2742} {"train_loss": -6.437087059020996, "global_step": 115177, "epoch": 2742} {"train_loss": -6.50083589553833, "global_step": 115178, "epoch": 2742} {"train_loss": -6.540492057800293, "global_step": 115179, "epoch": 2742} {"train_loss": -6.492936134338379, "global_step": 115180, "epoch": 2742} {"train_loss": -6.50538444519043, "global_step": 115181, "epoch": 2742} {"train_loss": -6.610986709594727, "global_step": 115182, "epoch": 2742} {"train_loss": -6.515739440917969, "global_step": 115183, "epoch": 2742} {"train_loss": -6.574628829956055, "global_step": 115184, "epoch": 2742} {"train_loss": -6.571813106536865, "global_step": 115185, "epoch": 2742} {"train_loss": -6.566936492919922, "global_step": 115186, "epoch": 2742} {"train_loss": -6.453058242797852, "global_step": 115187, "epoch": 2742} {"train_loss": -6.609546661376953, "global_step": 115188, "epoch": 2742} {"train_loss": -6.526324272155762, "global_step": 115189, "epoch": 2742} {"train_loss": -6.428888320922852, "global_step": 115190, "epoch": 2742} {"train_loss": -6.622858047485352, "global_step": 115191, "epoch": 2742} {"train_loss": -6.481198310852051, "global_step": 115192, "epoch": 2742} {"train_loss": -6.439749240875244, "global_step": 115193, "epoch": 2742} {"train_loss": -6.501531600952148, "global_step": 115194, "epoch": 2742} {"train_loss": -6.490079879760742, "global_step": 115195, "epoch": 2742} {"train_loss": -6.553936958312988, "global_step": 115196, "epoch": 2742} {"train_loss": -6.434565544128418, "global_step": 115197, "epoch": 2742} {"train_loss": -6.464814186096191, "global_step": 115198, "epoch": 2742} {"train_loss": -6.569845199584961, "global_step": 115199, "epoch": 2742} {"train_loss": -6.390024185180664, "global_step": 115200, "epoch": 2742} {"train_loss": -6.516358375549316, "global_step": 115201, "epoch": 2742} {"train_loss": -6.6011176109313965, "global_step": 115202, "epoch": 2742} {"train_loss": -6.622986316680908, "global_step": 115203, "epoch": 2742} {"train_loss": -6.435292720794678, "global_step": 115204, "epoch": 2742} {"train_loss": -6.51182678767613, "global_step": 115205, "epoch": 2742, "val_loss": 67840.2109375} {"train_loss": -6.64270544052124, "global_step": 115206, "epoch": 2743} {"train_loss": -6.447835922241211, "global_step": 115207, "epoch": 2743} {"train_loss": -6.544828414916992, "global_step": 115208, "epoch": 2743} {"train_loss": -6.6340532302856445, "global_step": 115209, "epoch": 2743} {"train_loss": -6.644528865814209, "global_step": 115210, "epoch": 2743} {"train_loss": -6.46557092666626, "global_step": 115211, "epoch": 2743} {"train_loss": -6.476152420043945, "global_step": 115212, "epoch": 2743} {"train_loss": -6.612436294555664, "global_step": 115213, "epoch": 2743} {"train_loss": -6.52923583984375, "global_step": 115214, "epoch": 2743} {"train_loss": -6.513930320739746, "global_step": 115215, "epoch": 2743} {"train_loss": -6.562982559204102, "global_step": 115216, "epoch": 2743} {"train_loss": -6.439401149749756, "global_step": 115217, "epoch": 2743} {"train_loss": -6.496057033538818, "global_step": 115218, "epoch": 2743} {"train_loss": -6.541353225708008, "global_step": 115219, "epoch": 2743} {"train_loss": -6.547391891479492, "global_step": 115220, "epoch": 2743} {"train_loss": -6.540011882781982, "global_step": 115221, "epoch": 2743} {"train_loss": -6.514925003051758, "global_step": 115222, "epoch": 2743} {"train_loss": -6.506763935089111, "global_step": 115223, "epoch": 2743} {"train_loss": -6.437939643859863, "global_step": 115224, "epoch": 2743} {"train_loss": -6.495985984802246, "global_step": 115225, "epoch": 2743} {"train_loss": -6.498809814453125, "global_step": 115226, "epoch": 2743} {"train_loss": -6.346319675445557, "global_step": 115227, "epoch": 2743} {"train_loss": -6.480380058288574, "global_step": 115228, "epoch": 2743} {"train_loss": -6.459546089172363, "global_step": 115229, "epoch": 2743} {"train_loss": -6.453171730041504, "global_step": 115230, "epoch": 2743} {"train_loss": -6.425305366516113, "global_step": 115231, "epoch": 2743} {"train_loss": -6.452844142913818, "global_step": 115232, "epoch": 2743} {"train_loss": -6.473811149597168, "global_step": 115233, "epoch": 2743} {"train_loss": -6.392605304718018, "global_step": 115234, "epoch": 2743} {"train_loss": -6.515636444091797, "global_step": 115235, "epoch": 2743} {"train_loss": -6.591691970825195, "global_step": 115236, "epoch": 2743} {"train_loss": -6.597415924072266, "global_step": 115237, "epoch": 2743} {"train_loss": -6.4642534255981445, "global_step": 115238, "epoch": 2743} {"train_loss": -6.551896095275879, "global_step": 115239, "epoch": 2743} {"train_loss": -6.537586212158203, "global_step": 115240, "epoch": 2743} {"train_loss": -6.4470062255859375, "global_step": 115241, "epoch": 2743} {"train_loss": -6.543506622314453, "global_step": 115242, "epoch": 2743} {"train_loss": -6.556461334228516, "global_step": 115243, "epoch": 2743} {"train_loss": -6.447143077850342, "global_step": 115244, "epoch": 2743} {"train_loss": -6.50063419342041, "global_step": 115245, "epoch": 2743} {"train_loss": -6.4420881271362305, "global_step": 115246, "epoch": 2743} {"train_loss": -6.504516998926799, "global_step": 115247, "epoch": 2743, "val_loss": 67893.265625} {"train_loss": -6.608452796936035, "global_step": 115248, "epoch": 2744} {"train_loss": -6.468384742736816, "global_step": 115249, "epoch": 2744} {"train_loss": -6.464966773986816, "global_step": 115250, "epoch": 2744} {"train_loss": -6.419217586517334, "global_step": 115251, "epoch": 2744} {"train_loss": -6.387181282043457, "global_step": 115252, "epoch": 2744} {"train_loss": -6.517091751098633, "global_step": 115253, "epoch": 2744} {"train_loss": -6.461143493652344, "global_step": 115254, "epoch": 2744} {"train_loss": -6.46949577331543, "global_step": 115255, "epoch": 2744} {"train_loss": -6.408038139343262, "global_step": 115256, "epoch": 2744} {"train_loss": -6.34232759475708, "global_step": 115257, "epoch": 2744} {"train_loss": -6.411747932434082, "global_step": 115258, "epoch": 2744} {"train_loss": -6.468114852905273, "global_step": 115259, "epoch": 2744} {"train_loss": -6.412644386291504, "global_step": 115260, "epoch": 2744} {"train_loss": -6.396417140960693, "global_step": 115261, "epoch": 2744} {"train_loss": -6.381415367126465, "global_step": 115262, "epoch": 2744} {"train_loss": -6.476751804351807, "global_step": 115263, "epoch": 2744} {"train_loss": -6.483610153198242, "global_step": 115264, "epoch": 2744} {"train_loss": -6.425278663635254, "global_step": 115265, "epoch": 2744} {"train_loss": -6.4029645919799805, "global_step": 115266, "epoch": 2744} {"train_loss": -6.4142165184021, "global_step": 115267, "epoch": 2744} {"train_loss": -6.453647613525391, "global_step": 115268, "epoch": 2744} {"train_loss": -6.409389019012451, "global_step": 115269, "epoch": 2744} {"train_loss": -6.516376495361328, "global_step": 115270, "epoch": 2744} {"train_loss": -6.471426963806152, "global_step": 115271, "epoch": 2744} {"train_loss": -6.495898723602295, "global_step": 115272, "epoch": 2744} {"train_loss": -6.447940826416016, "global_step": 115273, "epoch": 2744} {"train_loss": -6.465324878692627, "global_step": 115274, "epoch": 2744} {"train_loss": -6.492759704589844, "global_step": 115275, "epoch": 2744} {"train_loss": -6.445804595947266, "global_step": 115276, "epoch": 2744} {"train_loss": -6.436672210693359, "global_step": 115277, "epoch": 2744} {"train_loss": -6.511016368865967, "global_step": 115278, "epoch": 2744} {"train_loss": -6.378621578216553, "global_step": 115279, "epoch": 2744} {"train_loss": -6.5104594230651855, "global_step": 115280, "epoch": 2744} {"train_loss": -6.511612415313721, "global_step": 115281, "epoch": 2744} {"train_loss": -6.553135395050049, "global_step": 115282, "epoch": 2744} {"train_loss": -6.43355655670166, "global_step": 115283, "epoch": 2744} {"train_loss": -6.431801795959473, "global_step": 115284, "epoch": 2744} {"train_loss": -6.466571807861328, "global_step": 115285, "epoch": 2744} {"train_loss": -6.461005210876465, "global_step": 115286, "epoch": 2744} {"train_loss": -6.452445983886719, "global_step": 115287, "epoch": 2744} {"train_loss": -6.416677951812744, "global_step": 115288, "epoch": 2744} {"train_loss": -6.45151382400876, "global_step": 115289, "epoch": 2744, "val_loss": 67772.734375} {"train_loss": -6.619285583496094, "global_step": 115290, "epoch": 2745} {"train_loss": -6.4273271560668945, "global_step": 115291, "epoch": 2745} {"train_loss": -6.499573230743408, "global_step": 115292, "epoch": 2745} {"train_loss": -6.598878383636475, "global_step": 115293, "epoch": 2745} {"train_loss": -6.452205657958984, "global_step": 115294, "epoch": 2745} {"train_loss": -6.357043743133545, "global_step": 115295, "epoch": 2745} {"train_loss": -6.481809139251709, "global_step": 115296, "epoch": 2745} {"train_loss": -6.449338912963867, "global_step": 115297, "epoch": 2745} {"train_loss": -6.377565383911133, "global_step": 115298, "epoch": 2745} {"train_loss": -6.454679012298584, "global_step": 115299, "epoch": 2745} {"train_loss": -6.45877742767334, "global_step": 115300, "epoch": 2745} {"train_loss": -6.294960975646973, "global_step": 115301, "epoch": 2745} {"train_loss": -6.496204376220703, "global_step": 115302, "epoch": 2745} {"train_loss": -6.362722873687744, "global_step": 115303, "epoch": 2745} {"train_loss": -6.3915581703186035, "global_step": 115304, "epoch": 2745} {"train_loss": -6.32731819152832, "global_step": 115305, "epoch": 2745} {"train_loss": -6.368786334991455, "global_step": 115306, "epoch": 2745} {"train_loss": -6.413559436798096, "global_step": 115307, "epoch": 2745} {"train_loss": -6.486414909362793, "global_step": 115308, "epoch": 2745} {"train_loss": -6.375095367431641, "global_step": 115309, "epoch": 2745} {"train_loss": -6.3766398429870605, "global_step": 115310, "epoch": 2745} {"train_loss": -6.414772987365723, "global_step": 115311, "epoch": 2745} {"train_loss": -6.4274773597717285, "global_step": 115312, "epoch": 2745} {"train_loss": -6.526690483093262, "global_step": 115313, "epoch": 2745} {"train_loss": -6.492519378662109, "global_step": 115314, "epoch": 2745} {"train_loss": -6.469112396240234, "global_step": 115315, "epoch": 2745} {"train_loss": -6.387369155883789, "global_step": 115316, "epoch": 2745} {"train_loss": -6.352525234222412, "global_step": 115317, "epoch": 2745} {"train_loss": -6.486330032348633, "global_step": 115318, "epoch": 2745} {"train_loss": -6.525434494018555, "global_step": 115319, "epoch": 2745} {"train_loss": -6.441200256347656, "global_step": 115320, "epoch": 2745} {"train_loss": -6.509303092956543, "global_step": 115321, "epoch": 2745} {"train_loss": -6.4099860191345215, "global_step": 115322, "epoch": 2745} {"train_loss": -6.416630268096924, "global_step": 115323, "epoch": 2745} {"train_loss": -6.456228256225586, "global_step": 115324, "epoch": 2745} {"train_loss": -6.33915376663208, "global_step": 115325, "epoch": 2745} {"train_loss": -6.438719749450684, "global_step": 115326, "epoch": 2745} {"train_loss": -6.532033443450928, "global_step": 115327, "epoch": 2745} {"train_loss": -6.507796287536621, "global_step": 115328, "epoch": 2745} {"train_loss": -6.480419635772705, "global_step": 115329, "epoch": 2745} {"train_loss": -6.52933931350708, "global_step": 115330, "epoch": 2745} {"train_loss": -6.44240190869286, "global_step": 115331, "epoch": 2745, "val_loss": 67857.2265625} {"train_loss": -6.5071210861206055, "global_step": 115332, "epoch": 2746} {"train_loss": -6.519938945770264, "global_step": 115333, "epoch": 2746} {"train_loss": -6.530261993408203, "global_step": 115334, "epoch": 2746} {"train_loss": -6.531617641448975, "global_step": 115335, "epoch": 2746} {"train_loss": -6.453763484954834, "global_step": 115336, "epoch": 2746} {"train_loss": -6.606410980224609, "global_step": 115337, "epoch": 2746} {"train_loss": -6.376705169677734, "global_step": 115338, "epoch": 2746} {"train_loss": -6.555444717407227, "global_step": 115339, "epoch": 2746} {"train_loss": -6.494389533996582, "global_step": 115340, "epoch": 2746} {"train_loss": -6.558306694030762, "global_step": 115341, "epoch": 2746} {"train_loss": -6.497159957885742, "global_step": 115342, "epoch": 2746} {"train_loss": -6.467344284057617, "global_step": 115343, "epoch": 2746} {"train_loss": -6.541940689086914, "global_step": 115344, "epoch": 2746} {"train_loss": -6.474005222320557, "global_step": 115345, "epoch": 2746} {"train_loss": -6.467507362365723, "global_step": 115346, "epoch": 2746} {"train_loss": -6.441738128662109, "global_step": 115347, "epoch": 2746} {"train_loss": -6.423391819000244, "global_step": 115348, "epoch": 2746} {"train_loss": -6.422356128692627, "global_step": 115349, "epoch": 2746} {"train_loss": -6.491618633270264, "global_step": 115350, "epoch": 2746} {"train_loss": -6.463486194610596, "global_step": 115351, "epoch": 2746} {"train_loss": -6.528467178344727, "global_step": 115352, "epoch": 2746} {"train_loss": -6.45947265625, "global_step": 115353, "epoch": 2746} {"train_loss": -6.477337837219238, "global_step": 115354, "epoch": 2746} {"train_loss": -6.458813667297363, "global_step": 115355, "epoch": 2746} {"train_loss": -6.596877574920654, "global_step": 115356, "epoch": 2746} {"train_loss": -6.4260406494140625, "global_step": 115357, "epoch": 2746} {"train_loss": -6.424638748168945, "global_step": 115358, "epoch": 2746} {"train_loss": -6.4135026931762695, "global_step": 115359, "epoch": 2746} {"train_loss": -6.520208358764648, "global_step": 115360, "epoch": 2746} {"train_loss": -6.555915832519531, "global_step": 115361, "epoch": 2746} {"train_loss": -6.570187568664551, "global_step": 115362, "epoch": 2746} {"train_loss": -6.536770343780518, "global_step": 115363, "epoch": 2746} {"train_loss": -6.436459541320801, "global_step": 115364, "epoch": 2746} {"train_loss": -6.531916618347168, "global_step": 115365, "epoch": 2746} {"train_loss": -6.490436553955078, "global_step": 115366, "epoch": 2746} {"train_loss": -6.348378658294678, "global_step": 115367, "epoch": 2746} {"train_loss": -6.470328330993652, "global_step": 115368, "epoch": 2746} {"train_loss": -6.591095447540283, "global_step": 115369, "epoch": 2746} {"train_loss": -6.450723648071289, "global_step": 115370, "epoch": 2746} {"train_loss": -6.548626899719238, "global_step": 115371, "epoch": 2746} {"train_loss": -6.477280616760254, "global_step": 115372, "epoch": 2746} {"train_loss": -6.492925416855585, "global_step": 115373, "epoch": 2746, "val_loss": 67792.5859375} {"train_loss": -6.326405048370361, "global_step": 115374, "epoch": 2747} {"train_loss": -6.583627700805664, "global_step": 115375, "epoch": 2747} {"train_loss": -6.4240593910217285, "global_step": 115376, "epoch": 2747} {"train_loss": -6.521088123321533, "global_step": 115377, "epoch": 2747} {"train_loss": -6.539303779602051, "global_step": 115378, "epoch": 2747} {"train_loss": -6.447260856628418, "global_step": 115379, "epoch": 2747} {"train_loss": -6.541626930236816, "global_step": 115380, "epoch": 2747} {"train_loss": -6.496461868286133, "global_step": 115381, "epoch": 2747} {"train_loss": -6.394500732421875, "global_step": 115382, "epoch": 2747} {"train_loss": -6.53267765045166, "global_step": 115383, "epoch": 2747} {"train_loss": -6.500430107116699, "global_step": 115384, "epoch": 2747} {"train_loss": -6.550503730773926, "global_step": 115385, "epoch": 2747} {"train_loss": -6.61631965637207, "global_step": 115386, "epoch": 2747} {"train_loss": -6.606287956237793, "global_step": 115387, "epoch": 2747} {"train_loss": -6.561305522918701, "global_step": 115388, "epoch": 2747} {"train_loss": -6.439497947692871, "global_step": 115389, "epoch": 2747} {"train_loss": -6.588057041168213, "global_step": 115390, "epoch": 2747} {"train_loss": -6.549726486206055, "global_step": 115391, "epoch": 2747} {"train_loss": -6.47774600982666, "global_step": 115392, "epoch": 2747} {"train_loss": -6.591387748718262, "global_step": 115393, "epoch": 2747} {"train_loss": -6.584782600402832, "global_step": 115394, "epoch": 2747} {"train_loss": -6.552102088928223, "global_step": 115395, "epoch": 2747} {"train_loss": -6.495349884033203, "global_step": 115396, "epoch": 2747} {"train_loss": -6.469372749328613, "global_step": 115397, "epoch": 2747} {"train_loss": -6.598987102508545, "global_step": 115398, "epoch": 2747} {"train_loss": -6.466465950012207, "global_step": 115399, "epoch": 2747} {"train_loss": -6.643629550933838, "global_step": 115400, "epoch": 2747} {"train_loss": -6.463021755218506, "global_step": 115401, "epoch": 2747} {"train_loss": -6.515957355499268, "global_step": 115402, "epoch": 2747} {"train_loss": -6.571469783782959, "global_step": 115403, "epoch": 2747} {"train_loss": -6.598295211791992, "global_step": 115404, "epoch": 2747} {"train_loss": -6.372546672821045, "global_step": 115405, "epoch": 2747} {"train_loss": -6.471906661987305, "global_step": 115406, "epoch": 2747} {"train_loss": -6.40541934967041, "global_step": 115407, "epoch": 2747} {"train_loss": -6.527580738067627, "global_step": 115408, "epoch": 2747} {"train_loss": -6.539529323577881, "global_step": 115409, "epoch": 2747} {"train_loss": -6.30757474899292, "global_step": 115410, "epoch": 2747} {"train_loss": -6.469865798950195, "global_step": 115411, "epoch": 2747} {"train_loss": -6.47402286529541, "global_step": 115412, "epoch": 2747} {"train_loss": -6.338653564453125, "global_step": 115413, "epoch": 2747} {"train_loss": -6.490927219390869, "global_step": 115414, "epoch": 2747} {"train_loss": -6.501000517890567, "global_step": 115415, "epoch": 2747, "val_loss": 67880.875} {"train_loss": -6.386045455932617, "global_step": 115416, "epoch": 2748} {"train_loss": -6.435243129730225, "global_step": 115417, "epoch": 2748} {"train_loss": -6.412177085876465, "global_step": 115418, "epoch": 2748} {"train_loss": -6.4895782470703125, "global_step": 115419, "epoch": 2748} {"train_loss": -6.514598846435547, "global_step": 115420, "epoch": 2748} {"train_loss": -6.4427971839904785, "global_step": 115421, "epoch": 2748} {"train_loss": -6.480817794799805, "global_step": 115422, "epoch": 2748} {"train_loss": -6.554374694824219, "global_step": 115423, "epoch": 2748} {"train_loss": -6.4795732498168945, "global_step": 115424, "epoch": 2748} {"train_loss": -6.571150779724121, "global_step": 115425, "epoch": 2748} {"train_loss": -6.5331244468688965, "global_step": 115426, "epoch": 2748} {"train_loss": -6.4277544021606445, "global_step": 115427, "epoch": 2748} {"train_loss": -6.4128618240356445, "global_step": 115428, "epoch": 2748} {"train_loss": -6.403960227966309, "global_step": 115429, "epoch": 2748} {"train_loss": -6.456077575683594, "global_step": 115430, "epoch": 2748} {"train_loss": -6.486239433288574, "global_step": 115431, "epoch": 2748} {"train_loss": -6.370064735412598, "global_step": 115432, "epoch": 2748} {"train_loss": -6.534872055053711, "global_step": 115433, "epoch": 2748} {"train_loss": -6.371514320373535, "global_step": 115434, "epoch": 2748} {"train_loss": -6.545323848724365, "global_step": 115435, "epoch": 2748} {"train_loss": -6.584959983825684, "global_step": 115436, "epoch": 2748} {"train_loss": -6.438279151916504, "global_step": 115437, "epoch": 2748} {"train_loss": -6.584569931030273, "global_step": 115438, "epoch": 2748} {"train_loss": -6.463852882385254, "global_step": 115439, "epoch": 2748} {"train_loss": -6.4657979011535645, "global_step": 115440, "epoch": 2748} {"train_loss": -6.5277557373046875, "global_step": 115441, "epoch": 2748} {"train_loss": -6.473165512084961, "global_step": 115442, "epoch": 2748} {"train_loss": -6.496789932250977, "global_step": 115443, "epoch": 2748} {"train_loss": -6.566116809844971, "global_step": 115444, "epoch": 2748} {"train_loss": -6.497284889221191, "global_step": 115445, "epoch": 2748} {"train_loss": -6.334975719451904, "global_step": 115446, "epoch": 2748} {"train_loss": -6.392025947570801, "global_step": 115447, "epoch": 2748} {"train_loss": -6.472802639007568, "global_step": 115448, "epoch": 2748} {"train_loss": -6.538134574890137, "global_step": 115449, "epoch": 2748} {"train_loss": -6.512398719787598, "global_step": 115450, "epoch": 2748} {"train_loss": -6.404418468475342, "global_step": 115451, "epoch": 2748} {"train_loss": -6.46663236618042, "global_step": 115452, "epoch": 2748} {"train_loss": -6.430468559265137, "global_step": 115453, "epoch": 2748} {"train_loss": -6.465512752532959, "global_step": 115454, "epoch": 2748} {"train_loss": -6.587450981140137, "global_step": 115455, "epoch": 2748} {"train_loss": -6.62907600402832, "global_step": 115456, "epoch": 2748} {"train_loss": -6.478900580179124, "global_step": 115457, "epoch": 2748, "val_loss": 68076.859375} {"train_loss": -6.478303909301758, "global_step": 115458, "epoch": 2749} {"train_loss": -6.505837440490723, "global_step": 115459, "epoch": 2749} {"train_loss": -6.560885906219482, "global_step": 115460, "epoch": 2749} {"train_loss": -6.502309799194336, "global_step": 115461, "epoch": 2749} {"train_loss": -6.441743850708008, "global_step": 115462, "epoch": 2749} {"train_loss": -6.430726528167725, "global_step": 115463, "epoch": 2749} {"train_loss": -6.370981693267822, "global_step": 115464, "epoch": 2749} {"train_loss": -6.482449531555176, "global_step": 115465, "epoch": 2749} {"train_loss": -6.50815486907959, "global_step": 115466, "epoch": 2749} {"train_loss": -6.410609722137451, "global_step": 115467, "epoch": 2749} {"train_loss": -6.43748140335083, "global_step": 115468, "epoch": 2749} {"train_loss": -6.412770748138428, "global_step": 115469, "epoch": 2749} {"train_loss": -6.408044815063477, "global_step": 115470, "epoch": 2749} {"train_loss": -6.49353551864624, "global_step": 115471, "epoch": 2749} {"train_loss": -6.416934967041016, "global_step": 115472, "epoch": 2749} {"train_loss": -6.38616418838501, "global_step": 115473, "epoch": 2749} {"train_loss": -6.4878830909729, "global_step": 115474, "epoch": 2749} {"train_loss": -6.505375385284424, "global_step": 115475, "epoch": 2749} {"train_loss": -6.406431198120117, "global_step": 115476, "epoch": 2749} {"train_loss": -6.328900337219238, "global_step": 115477, "epoch": 2749} {"train_loss": -6.414421081542969, "global_step": 115478, "epoch": 2749} {"train_loss": -6.466758728027344, "global_step": 115479, "epoch": 2749} {"train_loss": -6.526323318481445, "global_step": 115480, "epoch": 2749} {"train_loss": -6.428073406219482, "global_step": 115481, "epoch": 2749} {"train_loss": -6.4709343910217285, "global_step": 115482, "epoch": 2749} {"train_loss": -6.452803611755371, "global_step": 115483, "epoch": 2749} {"train_loss": -6.492258071899414, "global_step": 115484, "epoch": 2749} {"train_loss": -6.534431457519531, "global_step": 115485, "epoch": 2749} {"train_loss": -6.615478515625, "global_step": 115486, "epoch": 2749} {"train_loss": -6.646908283233643, "global_step": 115487, "epoch": 2749} {"train_loss": -6.515614032745361, "global_step": 115488, "epoch": 2749} {"train_loss": -6.546514511108398, "global_step": 115489, "epoch": 2749} {"train_loss": -6.445888042449951, "global_step": 115490, "epoch": 2749} {"train_loss": -6.652610778808594, "global_step": 115491, "epoch": 2749} {"train_loss": -6.538305282592773, "global_step": 115492, "epoch": 2749} {"train_loss": -6.523139476776123, "global_step": 115493, "epoch": 2749} {"train_loss": -6.563460350036621, "global_step": 115494, "epoch": 2749} {"train_loss": -6.444713115692139, "global_step": 115495, "epoch": 2749} {"train_loss": -6.548805236816406, "global_step": 115496, "epoch": 2749} {"train_loss": -6.431783676147461, "global_step": 115497, "epoch": 2749} {"train_loss": -6.504110813140869, "global_step": 115498, "epoch": 2749} {"train_loss": -6.4807938280559725, "global_step": 115499, "epoch": 2749, "val_loss": 68065.546875} {"train_loss": -6.5427093505859375, "global_step": 115500, "epoch": 2750} {"train_loss": -6.573367595672607, "global_step": 115501, "epoch": 2750} {"train_loss": -6.453893184661865, "global_step": 115502, "epoch": 2750} {"train_loss": -6.373505592346191, "global_step": 115503, "epoch": 2750} {"train_loss": -6.315047264099121, "global_step": 115504, "epoch": 2750} {"train_loss": -6.454833507537842, "global_step": 115505, "epoch": 2750} {"train_loss": -6.429854393005371, "global_step": 115506, "epoch": 2750} {"train_loss": -6.382327079772949, "global_step": 115507, "epoch": 2750} {"train_loss": -6.571741104125977, "global_step": 115508, "epoch": 2750} {"train_loss": -6.498717784881592, "global_step": 115509, "epoch": 2750} {"train_loss": -6.517366409301758, "global_step": 115510, "epoch": 2750} {"train_loss": -6.466414451599121, "global_step": 115511, "epoch": 2750} {"train_loss": -6.468254089355469, "global_step": 115512, "epoch": 2750} {"train_loss": -6.526045799255371, "global_step": 115513, "epoch": 2750} {"train_loss": -6.3950958251953125, "global_step": 115514, "epoch": 2750} {"train_loss": -6.559856414794922, "global_step": 115515, "epoch": 2750} {"train_loss": -6.481804370880127, "global_step": 115516, "epoch": 2750} {"train_loss": -6.494019985198975, "global_step": 115517, "epoch": 2750} {"train_loss": -6.559873580932617, "global_step": 115518, "epoch": 2750} {"train_loss": -6.442246437072754, "global_step": 115519, "epoch": 2750} {"train_loss": -6.508213043212891, "global_step": 115520, "epoch": 2750} {"train_loss": -6.550063610076904, "global_step": 115521, "epoch": 2750} {"train_loss": -6.498335361480713, "global_step": 115522, "epoch": 2750} {"train_loss": -6.494503021240234, "global_step": 115523, "epoch": 2750} {"train_loss": -6.570451736450195, "global_step": 115524, "epoch": 2750} {"train_loss": -6.417945861816406, "global_step": 115525, "epoch": 2750} {"train_loss": -6.445146560668945, "global_step": 115526, "epoch": 2750} {"train_loss": -6.381680011749268, "global_step": 115527, "epoch": 2750} {"train_loss": -6.499671936035156, "global_step": 115528, "epoch": 2750} {"train_loss": -6.49934196472168, "global_step": 115529, "epoch": 2750} {"train_loss": -6.596159934997559, "global_step": 115530, "epoch": 2750} {"train_loss": -6.464759349822998, "global_step": 115531, "epoch": 2750} {"train_loss": -6.455770969390869, "global_step": 115532, "epoch": 2750} {"train_loss": -6.490175247192383, "global_step": 115533, "epoch": 2750} {"train_loss": -6.432602405548096, "global_step": 115534, "epoch": 2750} {"train_loss": -6.52044677734375, "global_step": 115535, "epoch": 2750} {"train_loss": -6.581797122955322, "global_step": 115536, "epoch": 2750} {"train_loss": -6.291924476623535, "global_step": 115537, "epoch": 2750} {"train_loss": -6.476442337036133, "global_step": 115538, "epoch": 2750} {"train_loss": -6.471351623535156, "global_step": 115539, "epoch": 2750} {"train_loss": -6.441159248352051, "global_step": 115540, "epoch": 2750} {"train_loss": -6.475903193155925, "global_step": 115541, "epoch": 2750, "train/sim_max_reward_0": 0.256612521467665, "train/sim_max_reward_1": 0.55863805091215, "train/sim_max_reward_2": 0.16017442646571556, "train/sim_max_reward_3": 0.9104945747083217, "train/sim_max_reward_4": 0.8538340429002963, "train/sim_max_reward_5": 0.20231058480045494, "test/sim_max_reward_4400000": 0.17604308110667538, "test/sim_max_reward_4400001": 0.8739554522301344, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.9805993531252679, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.1733948814999089, "test/sim_max_reward_4400006": 0.894227351299592, "test/sim_max_reward_4400007": 0.7888913830142531, "test/sim_max_reward_4400008": 0.2993942216872311, "test/sim_max_reward_4400009": 0.8501542413424864, "test/sim_max_reward_4400010": 0.2824373856479089, "test/sim_max_reward_4400011": 0.7279111568816362, "test/sim_max_reward_4400012": 0.9444427596399162, "test/sim_max_reward_4400013": 0.3742661810669653, "test/sim_max_reward_4400014": 0.9323022489616322, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.07801935213175977, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.26334585371101665, "test/sim_max_reward_4400019": 0.893990251350305, "test/sim_max_reward_4400020": 0.9948845789177895, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9616307027045495, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.5402833458756651, "test/sim_max_reward_4400025": 0.2485955102513722, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.06325581590800303, "test/sim_max_reward_4400028": 0.8649013935089628, "test/sim_max_reward_4400029": 0.9285445139422355, "test/sim_max_reward_4400030": 0.9536743246500836, "test/sim_max_reward_4400031": 0.9993383777039316, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7420120695263497, "test/sim_max_reward_4400034": 0.8784330070789332, "test/sim_max_reward_4400035": 0.408897261348048, "test/sim_max_reward_4400036": 0.9184942369453193, "test/sim_max_reward_4400037": 0.27017655610680025, "test/sim_max_reward_4400038": 0.2880308336102168, "test/sim_max_reward_4400039": 0.9644113746573816, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.980520366394073, "test/sim_max_reward_4400044": 0.7678894747923385, "test/sim_max_reward_4400045": 0.9827635809125184, "test/sim_max_reward_4400046": 0.873638871790585, "test/sim_max_reward_4400047": 0.950515887789207, "test/sim_max_reward_4400048": 0.952691149177366, "test/sim_max_reward_4400049": 0.946433284104561, "train/mean_score": 0.4903440335424339, "test/mean_score": 0.5706448744214085, "val_loss": 67789.1328125} {"train_loss": -6.486036777496338, "global_step": 115542, "epoch": 2751} {"train_loss": -6.493863105773926, "global_step": 115543, "epoch": 2751} {"train_loss": -6.345451354980469, "global_step": 115544, "epoch": 2751} {"train_loss": -6.434886932373047, "global_step": 115545, "epoch": 2751} {"train_loss": -6.445979118347168, "global_step": 115546, "epoch": 2751} {"train_loss": -6.387224197387695, "global_step": 115547, "epoch": 2751} {"train_loss": -6.43067741394043, "global_step": 115548, "epoch": 2751} {"train_loss": -6.392640113830566, "global_step": 115549, "epoch": 2751} {"train_loss": -6.5274739265441895, "global_step": 115550, "epoch": 2751} {"train_loss": -6.488164901733398, "global_step": 115551, "epoch": 2751} {"train_loss": -6.491580009460449, "global_step": 115552, "epoch": 2751} {"train_loss": -6.375799179077148, "global_step": 115553, "epoch": 2751} {"train_loss": -6.522391319274902, "global_step": 115554, "epoch": 2751} {"train_loss": -6.425713539123535, "global_step": 115555, "epoch": 2751} {"train_loss": -6.319979667663574, "global_step": 115556, "epoch": 2751} {"train_loss": -6.398275375366211, "global_step": 115557, "epoch": 2751} {"train_loss": -6.403599739074707, "global_step": 115558, "epoch": 2751} {"train_loss": -6.376424789428711, "global_step": 115559, "epoch": 2751} {"train_loss": -6.386609077453613, "global_step": 115560, "epoch": 2751} {"train_loss": -6.346452713012695, "global_step": 115561, "epoch": 2751} {"train_loss": -6.306735038757324, "global_step": 115562, "epoch": 2751} {"train_loss": -6.459046363830566, "global_step": 115563, "epoch": 2751} {"train_loss": -6.377199172973633, "global_step": 115564, "epoch": 2751} {"train_loss": -6.471710205078125, "global_step": 115565, "epoch": 2751} {"train_loss": -6.3963518142700195, "global_step": 115566, "epoch": 2751} {"train_loss": -6.496953010559082, "global_step": 115567, "epoch": 2751} {"train_loss": -6.395956039428711, "global_step": 115568, "epoch": 2751} {"train_loss": -6.594319820404053, "global_step": 115569, "epoch": 2751} {"train_loss": -6.482705116271973, "global_step": 115570, "epoch": 2751} {"train_loss": -6.533483505249023, "global_step": 115571, "epoch": 2751} {"train_loss": -6.503960609436035, "global_step": 115572, "epoch": 2751} {"train_loss": -6.469647407531738, "global_step": 115573, "epoch": 2751} {"train_loss": -6.631234169006348, "global_step": 115574, "epoch": 2751} {"train_loss": -6.394709587097168, "global_step": 115575, "epoch": 2751} {"train_loss": -6.461098670959473, "global_step": 115576, "epoch": 2751} {"train_loss": -6.610035419464111, "global_step": 115577, "epoch": 2751} {"train_loss": -6.374457836151123, "global_step": 115578, "epoch": 2751} {"train_loss": -6.409271240234375, "global_step": 115579, "epoch": 2751} {"train_loss": -6.428280353546143, "global_step": 115580, "epoch": 2751} {"train_loss": -6.325973033905029, "global_step": 115581, "epoch": 2751} {"train_loss": -6.474785804748535, "global_step": 115582, "epoch": 2751} {"train_loss": -6.439779928752354, "global_step": 115583, "epoch": 2751, "val_loss": 67970.4453125} {"train_loss": -6.46442174911499, "global_step": 115584, "epoch": 2752} {"train_loss": -6.511904716491699, "global_step": 115585, "epoch": 2752} {"train_loss": -6.379441738128662, "global_step": 115586, "epoch": 2752} {"train_loss": -6.4798264503479, "global_step": 115587, "epoch": 2752} {"train_loss": -6.4812116622924805, "global_step": 115588, "epoch": 2752} {"train_loss": -6.5029988288879395, "global_step": 115589, "epoch": 2752} {"train_loss": -6.475994110107422, "global_step": 115590, "epoch": 2752} {"train_loss": -6.484691143035889, "global_step": 115591, "epoch": 2752} {"train_loss": -6.5516204833984375, "global_step": 115592, "epoch": 2752} {"train_loss": -6.555855751037598, "global_step": 115593, "epoch": 2752} {"train_loss": -6.520238876342773, "global_step": 115594, "epoch": 2752} {"train_loss": -6.5535888671875, "global_step": 115595, "epoch": 2752} {"train_loss": -6.458062171936035, "global_step": 115596, "epoch": 2752} {"train_loss": -6.380182266235352, "global_step": 115597, "epoch": 2752} {"train_loss": -6.409943580627441, "global_step": 115598, "epoch": 2752} {"train_loss": -6.584342002868652, "global_step": 115599, "epoch": 2752} {"train_loss": -6.447628974914551, "global_step": 115600, "epoch": 2752} {"train_loss": -6.460772514343262, "global_step": 115601, "epoch": 2752} {"train_loss": -6.326298236846924, "global_step": 115602, "epoch": 2752} {"train_loss": -6.399430274963379, "global_step": 115603, "epoch": 2752} {"train_loss": -6.469760894775391, "global_step": 115604, "epoch": 2752} {"train_loss": -6.552443027496338, "global_step": 115605, "epoch": 2752} {"train_loss": -6.550402641296387, "global_step": 115606, "epoch": 2752} {"train_loss": -6.430770397186279, "global_step": 115607, "epoch": 2752} {"train_loss": -6.4586896896362305, "global_step": 115608, "epoch": 2752} {"train_loss": -6.493189334869385, "global_step": 115609, "epoch": 2752} {"train_loss": -6.388705730438232, "global_step": 115610, "epoch": 2752} {"train_loss": -6.540926456451416, "global_step": 115611, "epoch": 2752} {"train_loss": -6.537766456604004, "global_step": 115612, "epoch": 2752} {"train_loss": -6.409924507141113, "global_step": 115613, "epoch": 2752} {"train_loss": -6.546171188354492, "global_step": 115614, "epoch": 2752} {"train_loss": -6.48864221572876, "global_step": 115615, "epoch": 2752} {"train_loss": -6.576908111572266, "global_step": 115616, "epoch": 2752} {"train_loss": -6.450373649597168, "global_step": 115617, "epoch": 2752} {"train_loss": -6.5288615226745605, "global_step": 115618, "epoch": 2752} {"train_loss": -6.5333662033081055, "global_step": 115619, "epoch": 2752} {"train_loss": -6.5460662841796875, "global_step": 115620, "epoch": 2752} {"train_loss": -6.579521656036377, "global_step": 115621, "epoch": 2752} {"train_loss": -6.604719638824463, "global_step": 115622, "epoch": 2752} {"train_loss": -6.437997341156006, "global_step": 115623, "epoch": 2752} {"train_loss": -6.546195983886719, "global_step": 115624, "epoch": 2752} {"train_loss": -6.488001687186105, "global_step": 115625, "epoch": 2752, "val_loss": 68225.3359375} {"train_loss": -6.460626125335693, "global_step": 115626, "epoch": 2753} {"train_loss": -6.532968521118164, "global_step": 115627, "epoch": 2753} {"train_loss": -6.433797836303711, "global_step": 115628, "epoch": 2753} {"train_loss": -6.400880336761475, "global_step": 115629, "epoch": 2753} {"train_loss": -6.576911926269531, "global_step": 115630, "epoch": 2753} {"train_loss": -6.492678165435791, "global_step": 115631, "epoch": 2753} {"train_loss": -6.494393348693848, "global_step": 115632, "epoch": 2753} {"train_loss": -6.443902969360352, "global_step": 115633, "epoch": 2753} {"train_loss": -6.445572853088379, "global_step": 115634, "epoch": 2753} {"train_loss": -6.563935279846191, "global_step": 115635, "epoch": 2753} {"train_loss": -6.415187358856201, "global_step": 115636, "epoch": 2753} {"train_loss": -6.472986698150635, "global_step": 115637, "epoch": 2753} {"train_loss": -6.573543548583984, "global_step": 115638, "epoch": 2753} {"train_loss": -6.376426696777344, "global_step": 115639, "epoch": 2753} {"train_loss": -6.366250038146973, "global_step": 115640, "epoch": 2753} {"train_loss": -6.34432315826416, "global_step": 115641, "epoch": 2753} {"train_loss": -6.4260358810424805, "global_step": 115642, "epoch": 2753} {"train_loss": -6.454807281494141, "global_step": 115643, "epoch": 2753} {"train_loss": -6.392764091491699, "global_step": 115644, "epoch": 2753} {"train_loss": -6.470894813537598, "global_step": 115645, "epoch": 2753} {"train_loss": -6.552990913391113, "global_step": 115646, "epoch": 2753} {"train_loss": -6.469153881072998, "global_step": 115647, "epoch": 2753} {"train_loss": -6.515445709228516, "global_step": 115648, "epoch": 2753} {"train_loss": -6.457588195800781, "global_step": 115649, "epoch": 2753} {"train_loss": -6.447907447814941, "global_step": 115650, "epoch": 2753} {"train_loss": -6.54290771484375, "global_step": 115651, "epoch": 2753} {"train_loss": -6.437158584594727, "global_step": 115652, "epoch": 2753} {"train_loss": -6.513001918792725, "global_step": 115653, "epoch": 2753} {"train_loss": -6.593599319458008, "global_step": 115654, "epoch": 2753} {"train_loss": -6.565517425537109, "global_step": 115655, "epoch": 2753} {"train_loss": -6.608583927154541, "global_step": 115656, "epoch": 2753} {"train_loss": -6.472052574157715, "global_step": 115657, "epoch": 2753} {"train_loss": -6.563736915588379, "global_step": 115658, "epoch": 2753} {"train_loss": -6.570625305175781, "global_step": 115659, "epoch": 2753} {"train_loss": -6.586277008056641, "global_step": 115660, "epoch": 2753} {"train_loss": -6.5886359214782715, "global_step": 115661, "epoch": 2753} {"train_loss": -6.542260646820068, "global_step": 115662, "epoch": 2753} {"train_loss": -6.496035575866699, "global_step": 115663, "epoch": 2753} {"train_loss": -6.555054664611816, "global_step": 115664, "epoch": 2753} {"train_loss": -6.519799709320068, "global_step": 115665, "epoch": 2753} {"train_loss": -6.509678840637207, "global_step": 115666, "epoch": 2753} {"train_loss": -6.496625082833426, "global_step": 115667, "epoch": 2753, "val_loss": 67877.015625} {"train_loss": -6.663449287414551, "global_step": 115668, "epoch": 2754} {"train_loss": -6.405244827270508, "global_step": 115669, "epoch": 2754} {"train_loss": -6.667693138122559, "global_step": 115670, "epoch": 2754} {"train_loss": -6.56478214263916, "global_step": 115671, "epoch": 2754} {"train_loss": -6.506937026977539, "global_step": 115672, "epoch": 2754} {"train_loss": -6.574314117431641, "global_step": 115673, "epoch": 2754} {"train_loss": -6.432539939880371, "global_step": 115674, "epoch": 2754} {"train_loss": -6.507091999053955, "global_step": 115675, "epoch": 2754} {"train_loss": -6.501941204071045, "global_step": 115676, "epoch": 2754} {"train_loss": -6.520751953125, "global_step": 115677, "epoch": 2754} {"train_loss": -6.512449264526367, "global_step": 115678, "epoch": 2754} {"train_loss": -6.397282123565674, "global_step": 115679, "epoch": 2754} {"train_loss": -6.483264923095703, "global_step": 115680, "epoch": 2754} {"train_loss": -6.459787845611572, "global_step": 115681, "epoch": 2754} {"train_loss": -6.635088920593262, "global_step": 115682, "epoch": 2754} {"train_loss": -6.419277667999268, "global_step": 115683, "epoch": 2754} {"train_loss": -6.563945770263672, "global_step": 115684, "epoch": 2754} {"train_loss": -6.485678672790527, "global_step": 115685, "epoch": 2754} {"train_loss": -6.469761848449707, "global_step": 115686, "epoch": 2754} {"train_loss": -6.479923248291016, "global_step": 115687, "epoch": 2754} {"train_loss": -6.382474899291992, "global_step": 115688, "epoch": 2754} {"train_loss": -6.361835479736328, "global_step": 115689, "epoch": 2754} {"train_loss": -6.483606815338135, "global_step": 115690, "epoch": 2754} {"train_loss": -6.48554801940918, "global_step": 115691, "epoch": 2754} {"train_loss": -6.399158477783203, "global_step": 115692, "epoch": 2754} {"train_loss": -6.459224700927734, "global_step": 115693, "epoch": 2754} {"train_loss": -6.527407169342041, "global_step": 115694, "epoch": 2754} {"train_loss": -6.578046798706055, "global_step": 115695, "epoch": 2754} {"train_loss": -6.383935451507568, "global_step": 115696, "epoch": 2754} {"train_loss": -6.498568058013916, "global_step": 115697, "epoch": 2754} {"train_loss": -6.489969730377197, "global_step": 115698, "epoch": 2754} {"train_loss": -6.353160858154297, "global_step": 115699, "epoch": 2754} {"train_loss": -6.488691329956055, "global_step": 115700, "epoch": 2754} {"train_loss": -6.468655586242676, "global_step": 115701, "epoch": 2754} {"train_loss": -6.440821647644043, "global_step": 115702, "epoch": 2754} {"train_loss": -6.485085487365723, "global_step": 115703, "epoch": 2754} {"train_loss": -6.4506731033325195, "global_step": 115704, "epoch": 2754} {"train_loss": -6.485590934753418, "global_step": 115705, "epoch": 2754} {"train_loss": -6.45827054977417, "global_step": 115706, "epoch": 2754} {"train_loss": -6.509311676025391, "global_step": 115707, "epoch": 2754} {"train_loss": -6.5177507400512695, "global_step": 115708, "epoch": 2754} {"train_loss": -6.488322984604609, "global_step": 115709, "epoch": 2754, "val_loss": 67813.2890625} {"train_loss": -6.570903778076172, "global_step": 115710, "epoch": 2755} {"train_loss": -6.478384017944336, "global_step": 115711, "epoch": 2755} {"train_loss": -6.560122489929199, "global_step": 115712, "epoch": 2755} {"train_loss": -6.375382423400879, "global_step": 115713, "epoch": 2755} {"train_loss": -6.485267639160156, "global_step": 115714, "epoch": 2755} {"train_loss": -6.5077056884765625, "global_step": 115715, "epoch": 2755} {"train_loss": -6.534595489501953, "global_step": 115716, "epoch": 2755} {"train_loss": -6.417700290679932, "global_step": 115717, "epoch": 2755} {"train_loss": -6.560749053955078, "global_step": 115718, "epoch": 2755} {"train_loss": -6.397036075592041, "global_step": 115719, "epoch": 2755} {"train_loss": -6.468180179595947, "global_step": 115720, "epoch": 2755} {"train_loss": -6.507181167602539, "global_step": 115721, "epoch": 2755} {"train_loss": -6.3692545890808105, "global_step": 115722, "epoch": 2755} {"train_loss": -6.539234161376953, "global_step": 115723, "epoch": 2755} {"train_loss": -6.376641273498535, "global_step": 115724, "epoch": 2755} {"train_loss": -6.5116472244262695, "global_step": 115725, "epoch": 2755} {"train_loss": -6.479442596435547, "global_step": 115726, "epoch": 2755} {"train_loss": -6.4127936363220215, "global_step": 115727, "epoch": 2755} {"train_loss": -6.547749996185303, "global_step": 115728, "epoch": 2755} {"train_loss": -6.548946380615234, "global_step": 115729, "epoch": 2755} {"train_loss": -6.546660423278809, "global_step": 115730, "epoch": 2755} {"train_loss": -6.465575218200684, "global_step": 115731, "epoch": 2755} {"train_loss": -6.525873184204102, "global_step": 115732, "epoch": 2755} {"train_loss": -6.576050758361816, "global_step": 115733, "epoch": 2755} {"train_loss": -6.586698532104492, "global_step": 115734, "epoch": 2755} {"train_loss": -6.527353286743164, "global_step": 115735, "epoch": 2755} {"train_loss": -6.488414764404297, "global_step": 115736, "epoch": 2755} {"train_loss": -6.367893695831299, "global_step": 115737, "epoch": 2755} {"train_loss": -6.49790620803833, "global_step": 115738, "epoch": 2755} {"train_loss": -6.4855427742004395, "global_step": 115739, "epoch": 2755} {"train_loss": -6.548779487609863, "global_step": 115740, "epoch": 2755} {"train_loss": -6.527064323425293, "global_step": 115741, "epoch": 2755} {"train_loss": -6.4663848876953125, "global_step": 115742, "epoch": 2755} {"train_loss": -6.459347724914551, "global_step": 115743, "epoch": 2755} {"train_loss": -6.552487373352051, "global_step": 115744, "epoch": 2755} {"train_loss": -6.510822296142578, "global_step": 115745, "epoch": 2755} {"train_loss": -6.4760847091674805, "global_step": 115746, "epoch": 2755} {"train_loss": -6.564897537231445, "global_step": 115747, "epoch": 2755} {"train_loss": -6.555404186248779, "global_step": 115748, "epoch": 2755} {"train_loss": -6.570775985717773, "global_step": 115749, "epoch": 2755} {"train_loss": -6.511341094970703, "global_step": 115750, "epoch": 2755} {"train_loss": -6.499386844180879, "global_step": 115751, "epoch": 2755, "val_loss": 67896.7421875} {"train_loss": -6.542243957519531, "global_step": 115752, "epoch": 2756} {"train_loss": -6.472759246826172, "global_step": 115753, "epoch": 2756} {"train_loss": -6.625349998474121, "global_step": 115754, "epoch": 2756} {"train_loss": -6.4666852951049805, "global_step": 115755, "epoch": 2756} {"train_loss": -6.559029579162598, "global_step": 115756, "epoch": 2756} {"train_loss": -6.493954658508301, "global_step": 115757, "epoch": 2756} {"train_loss": -6.524118423461914, "global_step": 115758, "epoch": 2756} {"train_loss": -6.428692817687988, "global_step": 115759, "epoch": 2756} {"train_loss": -6.624597549438477, "global_step": 115760, "epoch": 2756} {"train_loss": -6.466976165771484, "global_step": 115761, "epoch": 2756} {"train_loss": -6.440647602081299, "global_step": 115762, "epoch": 2756} {"train_loss": -6.486194610595703, "global_step": 115763, "epoch": 2756} {"train_loss": -6.459651470184326, "global_step": 115764, "epoch": 2756} {"train_loss": -6.485563278198242, "global_step": 115765, "epoch": 2756} {"train_loss": -6.45459508895874, "global_step": 115766, "epoch": 2756} {"train_loss": -6.354555130004883, "global_step": 115767, "epoch": 2756} {"train_loss": -6.451575756072998, "global_step": 115768, "epoch": 2756} {"train_loss": -6.485293388366699, "global_step": 115769, "epoch": 2756} {"train_loss": -6.456251621246338, "global_step": 115770, "epoch": 2756} {"train_loss": -6.554634094238281, "global_step": 115771, "epoch": 2756} {"train_loss": -6.526336193084717, "global_step": 115772, "epoch": 2756} {"train_loss": -6.566312789916992, "global_step": 115773, "epoch": 2756} {"train_loss": -6.540736198425293, "global_step": 115774, "epoch": 2756} {"train_loss": -6.533745288848877, "global_step": 115775, "epoch": 2756} {"train_loss": -6.401793479919434, "global_step": 115776, "epoch": 2756} {"train_loss": -6.421113967895508, "global_step": 115777, "epoch": 2756} {"train_loss": -6.338277339935303, "global_step": 115778, "epoch": 2756} {"train_loss": -6.544719696044922, "global_step": 115779, "epoch": 2756} {"train_loss": -6.528353214263916, "global_step": 115780, "epoch": 2756} {"train_loss": -6.3981404304504395, "global_step": 115781, "epoch": 2756} {"train_loss": -6.520939350128174, "global_step": 115782, "epoch": 2756} {"train_loss": -6.434805870056152, "global_step": 115783, "epoch": 2756} {"train_loss": -6.452666282653809, "global_step": 115784, "epoch": 2756} {"train_loss": -6.496565341949463, "global_step": 115785, "epoch": 2756} {"train_loss": -6.438366889953613, "global_step": 115786, "epoch": 2756} {"train_loss": -6.51241397857666, "global_step": 115787, "epoch": 2756} {"train_loss": -6.528067588806152, "global_step": 115788, "epoch": 2756} {"train_loss": -6.442429542541504, "global_step": 115789, "epoch": 2756} {"train_loss": -6.520962715148926, "global_step": 115790, "epoch": 2756} {"train_loss": -6.453667640686035, "global_step": 115791, "epoch": 2756} {"train_loss": -6.499005317687988, "global_step": 115792, "epoch": 2756} {"train_loss": -6.484379915964036, "global_step": 115793, "epoch": 2756, "val_loss": 68008.2578125} {"train_loss": -6.459784507751465, "global_step": 115794, "epoch": 2757} {"train_loss": -6.479386806488037, "global_step": 115795, "epoch": 2757} {"train_loss": -6.458641052246094, "global_step": 115796, "epoch": 2757} {"train_loss": -6.4920334815979, "global_step": 115797, "epoch": 2757} {"train_loss": -6.535463809967041, "global_step": 115798, "epoch": 2757} {"train_loss": -6.477585792541504, "global_step": 115799, "epoch": 2757} {"train_loss": -6.583990573883057, "global_step": 115800, "epoch": 2757} {"train_loss": -6.497629642486572, "global_step": 115801, "epoch": 2757} {"train_loss": -6.497476577758789, "global_step": 115802, "epoch": 2757} {"train_loss": -6.5674591064453125, "global_step": 115803, "epoch": 2757} {"train_loss": -6.371797561645508, "global_step": 115804, "epoch": 2757} {"train_loss": -6.394382953643799, "global_step": 115805, "epoch": 2757} {"train_loss": -6.513369560241699, "global_step": 115806, "epoch": 2757} {"train_loss": -6.183503150939941, "global_step": 115807, "epoch": 2757} {"train_loss": -6.547357082366943, "global_step": 115808, "epoch": 2757} {"train_loss": -6.230611801147461, "global_step": 115809, "epoch": 2757} {"train_loss": -6.381625175476074, "global_step": 115810, "epoch": 2757} {"train_loss": -6.406217098236084, "global_step": 115811, "epoch": 2757} {"train_loss": -6.371530532836914, "global_step": 115812, "epoch": 2757} {"train_loss": -6.442098140716553, "global_step": 115813, "epoch": 2757} {"train_loss": -6.312817573547363, "global_step": 115814, "epoch": 2757} {"train_loss": -6.2953200340271, "global_step": 115815, "epoch": 2757} {"train_loss": -6.300228595733643, "global_step": 115816, "epoch": 2757} {"train_loss": -6.400785446166992, "global_step": 115817, "epoch": 2757} {"train_loss": -6.330766677856445, "global_step": 115818, "epoch": 2757} {"train_loss": -6.426639556884766, "global_step": 115819, "epoch": 2757} {"train_loss": -6.3678107261657715, "global_step": 115820, "epoch": 2757} {"train_loss": -6.525695323944092, "global_step": 115821, "epoch": 2757} {"train_loss": -6.433928966522217, "global_step": 115822, "epoch": 2757} {"train_loss": -6.413996696472168, "global_step": 115823, "epoch": 2757} {"train_loss": -6.415161609649658, "global_step": 115824, "epoch": 2757} {"train_loss": -6.369734287261963, "global_step": 115825, "epoch": 2757} {"train_loss": -6.478901386260986, "global_step": 115826, "epoch": 2757} {"train_loss": -6.427482604980469, "global_step": 115827, "epoch": 2757} {"train_loss": -6.575982093811035, "global_step": 115828, "epoch": 2757} {"train_loss": -6.584300994873047, "global_step": 115829, "epoch": 2757} {"train_loss": -6.459872245788574, "global_step": 115830, "epoch": 2757} {"train_loss": -6.4600677490234375, "global_step": 115831, "epoch": 2757} {"train_loss": -6.386225700378418, "global_step": 115832, "epoch": 2757} {"train_loss": -6.563127517700195, "global_step": 115833, "epoch": 2757} {"train_loss": -6.453880310058594, "global_step": 115834, "epoch": 2757} {"train_loss": -6.438925391151791, "global_step": 115835, "epoch": 2757, "val_loss": 67907.7890625} {"train_loss": -6.367652893066406, "global_step": 115836, "epoch": 2758} {"train_loss": -6.625822067260742, "global_step": 115837, "epoch": 2758} {"train_loss": -6.510486125946045, "global_step": 115838, "epoch": 2758} {"train_loss": -6.472293853759766, "global_step": 115839, "epoch": 2758} {"train_loss": -6.530733108520508, "global_step": 115840, "epoch": 2758} {"train_loss": -6.594660758972168, "global_step": 115841, "epoch": 2758} {"train_loss": -6.517667293548584, "global_step": 115842, "epoch": 2758} {"train_loss": -6.460031986236572, "global_step": 115843, "epoch": 2758} {"train_loss": -6.470868110656738, "global_step": 115844, "epoch": 2758} {"train_loss": -6.452677249908447, "global_step": 115845, "epoch": 2758} {"train_loss": -6.481377124786377, "global_step": 115846, "epoch": 2758} {"train_loss": -6.591728687286377, "global_step": 115847, "epoch": 2758} {"train_loss": -6.44674015045166, "global_step": 115848, "epoch": 2758} {"train_loss": -6.549338340759277, "global_step": 115849, "epoch": 2758} {"train_loss": -6.362970352172852, "global_step": 115850, "epoch": 2758} {"train_loss": -6.39141845703125, "global_step": 115851, "epoch": 2758} {"train_loss": -6.477949142456055, "global_step": 115852, "epoch": 2758} {"train_loss": -6.46451473236084, "global_step": 115853, "epoch": 2758} {"train_loss": -6.635825157165527, "global_step": 115854, "epoch": 2758} {"train_loss": -6.457003116607666, "global_step": 115855, "epoch": 2758} {"train_loss": -6.525721549987793, "global_step": 115856, "epoch": 2758} {"train_loss": -6.510224342346191, "global_step": 115857, "epoch": 2758} {"train_loss": -6.4786295890808105, "global_step": 115858, "epoch": 2758} {"train_loss": -6.577854633331299, "global_step": 115859, "epoch": 2758} {"train_loss": -6.54927396774292, "global_step": 115860, "epoch": 2758} {"train_loss": -6.359848976135254, "global_step": 115861, "epoch": 2758} {"train_loss": -6.510514259338379, "global_step": 115862, "epoch": 2758} {"train_loss": -6.486536979675293, "global_step": 115863, "epoch": 2758} {"train_loss": -6.5725250244140625, "global_step": 115864, "epoch": 2758} {"train_loss": -6.542115211486816, "global_step": 115865, "epoch": 2758} {"train_loss": -6.464201927185059, "global_step": 115866, "epoch": 2758} {"train_loss": -6.494710922241211, "global_step": 115867, "epoch": 2758} {"train_loss": -6.567185401916504, "global_step": 115868, "epoch": 2758} {"train_loss": -6.499593734741211, "global_step": 115869, "epoch": 2758} {"train_loss": -6.52540397644043, "global_step": 115870, "epoch": 2758} {"train_loss": -6.541388034820557, "global_step": 115871, "epoch": 2758} {"train_loss": -6.492168426513672, "global_step": 115872, "epoch": 2758} {"train_loss": -6.489175796508789, "global_step": 115873, "epoch": 2758} {"train_loss": -6.387449741363525, "global_step": 115874, "epoch": 2758} {"train_loss": -6.576028347015381, "global_step": 115875, "epoch": 2758} {"train_loss": -6.524378776550293, "global_step": 115876, "epoch": 2758} {"train_loss": -6.501423778988066, "global_step": 115877, "epoch": 2758, "val_loss": 67859.5078125} {"train_loss": -6.523037910461426, "global_step": 115878, "epoch": 2759} {"train_loss": -6.544321060180664, "global_step": 115879, "epoch": 2759} {"train_loss": -6.593213081359863, "global_step": 115880, "epoch": 2759} {"train_loss": -6.6180243492126465, "global_step": 115881, "epoch": 2759} {"train_loss": -6.462317943572998, "global_step": 115882, "epoch": 2759} {"train_loss": -6.460148811340332, "global_step": 115883, "epoch": 2759} {"train_loss": -6.5097246170043945, "global_step": 115884, "epoch": 2759} {"train_loss": -6.514812469482422, "global_step": 115885, "epoch": 2759} {"train_loss": -6.443947792053223, "global_step": 115886, "epoch": 2759} {"train_loss": -6.572154521942139, "global_step": 115887, "epoch": 2759} {"train_loss": -6.504822731018066, "global_step": 115888, "epoch": 2759} {"train_loss": -6.604058265686035, "global_step": 115889, "epoch": 2759} {"train_loss": -6.458524703979492, "global_step": 115890, "epoch": 2759} {"train_loss": -6.514921188354492, "global_step": 115891, "epoch": 2759} {"train_loss": -6.453762054443359, "global_step": 115892, "epoch": 2759} {"train_loss": -6.4779052734375, "global_step": 115893, "epoch": 2759} {"train_loss": -6.420341491699219, "global_step": 115894, "epoch": 2759} {"train_loss": -6.538909912109375, "global_step": 115895, "epoch": 2759} {"train_loss": -6.466617584228516, "global_step": 115896, "epoch": 2759} {"train_loss": -6.467937469482422, "global_step": 115897, "epoch": 2759} {"train_loss": -6.65247106552124, "global_step": 115898, "epoch": 2759} {"train_loss": -6.46665620803833, "global_step": 115899, "epoch": 2759} {"train_loss": -6.4906907081604, "global_step": 115900, "epoch": 2759} {"train_loss": -6.4168500900268555, "global_step": 115901, "epoch": 2759} {"train_loss": -6.550148963928223, "global_step": 115902, "epoch": 2759} {"train_loss": -6.467411518096924, "global_step": 115903, "epoch": 2759} {"train_loss": -6.436069011688232, "global_step": 115904, "epoch": 2759} {"train_loss": -6.561485290527344, "global_step": 115905, "epoch": 2759} {"train_loss": -6.450021743774414, "global_step": 115906, "epoch": 2759} {"train_loss": -6.407837867736816, "global_step": 115907, "epoch": 2759} {"train_loss": -6.548557281494141, "global_step": 115908, "epoch": 2759} {"train_loss": -6.411982536315918, "global_step": 115909, "epoch": 2759} {"train_loss": -6.407716751098633, "global_step": 115910, "epoch": 2759} {"train_loss": -6.451469898223877, "global_step": 115911, "epoch": 2759} {"train_loss": -6.422698974609375, "global_step": 115912, "epoch": 2759} {"train_loss": -6.456815242767334, "global_step": 115913, "epoch": 2759} {"train_loss": -6.407045364379883, "global_step": 115914, "epoch": 2759} {"train_loss": -6.453845977783203, "global_step": 115915, "epoch": 2759} {"train_loss": -6.435589790344238, "global_step": 115916, "epoch": 2759} {"train_loss": -6.511313438415527, "global_step": 115917, "epoch": 2759} {"train_loss": -6.564376354217529, "global_step": 115918, "epoch": 2759} {"train_loss": -6.491243498665946, "global_step": 115919, "epoch": 2759, "val_loss": 67983.1953125} {"train_loss": -6.493099689483643, "global_step": 115920, "epoch": 2760} {"train_loss": -6.440251350402832, "global_step": 115921, "epoch": 2760} {"train_loss": -6.418839454650879, "global_step": 115922, "epoch": 2760} {"train_loss": -6.563462734222412, "global_step": 115923, "epoch": 2760} {"train_loss": -6.376888275146484, "global_step": 115924, "epoch": 2760} {"train_loss": -6.563662528991699, "global_step": 115925, "epoch": 2760} {"train_loss": -6.571122646331787, "global_step": 115926, "epoch": 2760} {"train_loss": -6.439166069030762, "global_step": 115927, "epoch": 2760} {"train_loss": -6.54369592666626, "global_step": 115928, "epoch": 2760} {"train_loss": -6.584717273712158, "global_step": 115929, "epoch": 2760} {"train_loss": -6.412954330444336, "global_step": 115930, "epoch": 2760} {"train_loss": -6.55653715133667, "global_step": 115931, "epoch": 2760} {"train_loss": -6.497577667236328, "global_step": 115932, "epoch": 2760} {"train_loss": -6.523726940155029, "global_step": 115933, "epoch": 2760} {"train_loss": -6.465193748474121, "global_step": 115934, "epoch": 2760} {"train_loss": -6.537428379058838, "global_step": 115935, "epoch": 2760} {"train_loss": -6.517662048339844, "global_step": 115936, "epoch": 2760} {"train_loss": -6.549934387207031, "global_step": 115937, "epoch": 2760} {"train_loss": -6.490150451660156, "global_step": 115938, "epoch": 2760} {"train_loss": -6.478999137878418, "global_step": 115939, "epoch": 2760} {"train_loss": -6.472459316253662, "global_step": 115940, "epoch": 2760} {"train_loss": -6.377987384796143, "global_step": 115941, "epoch": 2760} {"train_loss": -6.528063774108887, "global_step": 115942, "epoch": 2760} {"train_loss": -6.307879447937012, "global_step": 115943, "epoch": 2760} {"train_loss": -6.572757244110107, "global_step": 115944, "epoch": 2760} {"train_loss": -6.4102020263671875, "global_step": 115945, "epoch": 2760} {"train_loss": -6.3917236328125, "global_step": 115946, "epoch": 2760} {"train_loss": -6.501615524291992, "global_step": 115947, "epoch": 2760} {"train_loss": -6.532029628753662, "global_step": 115948, "epoch": 2760} {"train_loss": -6.322771072387695, "global_step": 115949, "epoch": 2760} {"train_loss": -6.584273815155029, "global_step": 115950, "epoch": 2760} {"train_loss": -6.511192798614502, "global_step": 115951, "epoch": 2760} {"train_loss": -6.51807975769043, "global_step": 115952, "epoch": 2760} {"train_loss": -6.531338691711426, "global_step": 115953, "epoch": 2760} {"train_loss": -6.439700603485107, "global_step": 115954, "epoch": 2760} {"train_loss": -6.424704074859619, "global_step": 115955, "epoch": 2760} {"train_loss": -6.494164943695068, "global_step": 115956, "epoch": 2760} {"train_loss": -6.372797012329102, "global_step": 115957, "epoch": 2760} {"train_loss": -6.471587181091309, "global_step": 115958, "epoch": 2760} {"train_loss": -6.459347248077393, "global_step": 115959, "epoch": 2760} {"train_loss": -6.369541168212891, "global_step": 115960, "epoch": 2760} {"train_loss": -6.477556308110555, "global_step": 115961, "epoch": 2760, "val_loss": 67807.4375} {"train_loss": -6.449173927307129, "global_step": 115962, "epoch": 2761} {"train_loss": -6.385007858276367, "global_step": 115963, "epoch": 2761} {"train_loss": -6.34926700592041, "global_step": 115964, "epoch": 2761} {"train_loss": -6.465298652648926, "global_step": 115965, "epoch": 2761} {"train_loss": -6.664161205291748, "global_step": 115966, "epoch": 2761} {"train_loss": -6.416839599609375, "global_step": 115967, "epoch": 2761} {"train_loss": -6.349750518798828, "global_step": 115968, "epoch": 2761} {"train_loss": -6.477373123168945, "global_step": 115969, "epoch": 2761} {"train_loss": -6.4426116943359375, "global_step": 115970, "epoch": 2761} {"train_loss": -6.499637603759766, "global_step": 115971, "epoch": 2761} {"train_loss": -6.516887664794922, "global_step": 115972, "epoch": 2761} {"train_loss": -6.469169616699219, "global_step": 115973, "epoch": 2761} {"train_loss": -6.5564422607421875, "global_step": 115974, "epoch": 2761} {"train_loss": -6.565388202667236, "global_step": 115975, "epoch": 2761} {"train_loss": -6.490456581115723, "global_step": 115976, "epoch": 2761} {"train_loss": -6.517919063568115, "global_step": 115977, "epoch": 2761} {"train_loss": -6.4758524894714355, "global_step": 115978, "epoch": 2761} {"train_loss": -6.635180473327637, "global_step": 115979, "epoch": 2761} {"train_loss": -6.462019443511963, "global_step": 115980, "epoch": 2761} {"train_loss": -6.457587242126465, "global_step": 115981, "epoch": 2761} {"train_loss": -6.459192752838135, "global_step": 115982, "epoch": 2761} {"train_loss": -6.434055328369141, "global_step": 115983, "epoch": 2761} {"train_loss": -6.436980724334717, "global_step": 115984, "epoch": 2761} {"train_loss": -6.407107353210449, "global_step": 115985, "epoch": 2761} {"train_loss": -6.538938999176025, "global_step": 115986, "epoch": 2761} {"train_loss": -6.494562149047852, "global_step": 115987, "epoch": 2761} {"train_loss": -6.581907272338867, "global_step": 115988, "epoch": 2761} {"train_loss": -6.41270112991333, "global_step": 115989, "epoch": 2761} {"train_loss": -6.447890281677246, "global_step": 115990, "epoch": 2761} {"train_loss": -6.533341407775879, "global_step": 115991, "epoch": 2761} {"train_loss": -6.536637306213379, "global_step": 115992, "epoch": 2761} {"train_loss": -6.406721115112305, "global_step": 115993, "epoch": 2761} {"train_loss": -6.524648666381836, "global_step": 115994, "epoch": 2761} {"train_loss": -6.460880756378174, "global_step": 115995, "epoch": 2761} {"train_loss": -6.402052402496338, "global_step": 115996, "epoch": 2761} {"train_loss": -6.318374156951904, "global_step": 115997, "epoch": 2761} {"train_loss": -6.436212539672852, "global_step": 115998, "epoch": 2761} {"train_loss": -6.513121128082275, "global_step": 115999, "epoch": 2761} {"train_loss": -6.402011871337891, "global_step": 116000, "epoch": 2761} {"train_loss": -6.457087516784668, "global_step": 116001, "epoch": 2761} {"train_loss": -6.4051313400268555, "global_step": 116002, "epoch": 2761} {"train_loss": -6.46922288622175, "global_step": 116003, "epoch": 2761, "val_loss": 67777.578125} {"train_loss": -6.406308174133301, "global_step": 116004, "epoch": 2762} {"train_loss": -6.36778450012207, "global_step": 116005, "epoch": 2762} {"train_loss": -6.502503871917725, "global_step": 116006, "epoch": 2762} {"train_loss": -6.442004203796387, "global_step": 116007, "epoch": 2762} {"train_loss": -6.411927700042725, "global_step": 116008, "epoch": 2762} {"train_loss": -6.5555830001831055, "global_step": 116009, "epoch": 2762} {"train_loss": -6.596823215484619, "global_step": 116010, "epoch": 2762} {"train_loss": -6.5336833000183105, "global_step": 116011, "epoch": 2762} {"train_loss": -6.501269340515137, "global_step": 116012, "epoch": 2762} {"train_loss": -6.489805698394775, "global_step": 116013, "epoch": 2762} {"train_loss": -6.591106414794922, "global_step": 116014, "epoch": 2762} {"train_loss": -6.53119421005249, "global_step": 116015, "epoch": 2762} {"train_loss": -6.632645606994629, "global_step": 116016, "epoch": 2762} {"train_loss": -6.578433990478516, "global_step": 116017, "epoch": 2762} {"train_loss": -6.5172343254089355, "global_step": 116018, "epoch": 2762} {"train_loss": -6.453880310058594, "global_step": 116019, "epoch": 2762} {"train_loss": -6.401550769805908, "global_step": 116020, "epoch": 2762} {"train_loss": -6.606339454650879, "global_step": 116021, "epoch": 2762} {"train_loss": -6.553190231323242, "global_step": 116022, "epoch": 2762} {"train_loss": -6.544677257537842, "global_step": 116023, "epoch": 2762} {"train_loss": -6.529454231262207, "global_step": 116024, "epoch": 2762} {"train_loss": -6.569728374481201, "global_step": 116025, "epoch": 2762} {"train_loss": -6.446268081665039, "global_step": 116026, "epoch": 2762} {"train_loss": -6.635249137878418, "global_step": 116027, "epoch": 2762} {"train_loss": -6.43402099609375, "global_step": 116028, "epoch": 2762} {"train_loss": -6.481964111328125, "global_step": 116029, "epoch": 2762} {"train_loss": -6.4678120613098145, "global_step": 116030, "epoch": 2762} {"train_loss": -6.524054527282715, "global_step": 116031, "epoch": 2762} {"train_loss": -6.628088474273682, "global_step": 116032, "epoch": 2762} {"train_loss": -6.427286148071289, "global_step": 116033, "epoch": 2762} {"train_loss": -6.493927955627441, "global_step": 116034, "epoch": 2762} {"train_loss": -6.548123359680176, "global_step": 116035, "epoch": 2762} {"train_loss": -6.552422046661377, "global_step": 116036, "epoch": 2762} {"train_loss": -6.563096046447754, "global_step": 116037, "epoch": 2762} {"train_loss": -6.476190567016602, "global_step": 116038, "epoch": 2762} {"train_loss": -6.3993821144104, "global_step": 116039, "epoch": 2762} {"train_loss": -6.566679954528809, "global_step": 116040, "epoch": 2762} {"train_loss": -6.459529876708984, "global_step": 116041, "epoch": 2762} {"train_loss": -6.521603584289551, "global_step": 116042, "epoch": 2762} {"train_loss": -6.529675483703613, "global_step": 116043, "epoch": 2762} {"train_loss": -6.43497371673584, "global_step": 116044, "epoch": 2762} {"train_loss": -6.508246433167231, "global_step": 116045, "epoch": 2762, "val_loss": 68010.4609375} {"train_loss": -6.532096862792969, "global_step": 116046, "epoch": 2763} {"train_loss": -6.464320659637451, "global_step": 116047, "epoch": 2763} {"train_loss": -6.490065574645996, "global_step": 116048, "epoch": 2763} {"train_loss": -6.616652965545654, "global_step": 116049, "epoch": 2763} {"train_loss": -6.4876604080200195, "global_step": 116050, "epoch": 2763} {"train_loss": -6.52606725692749, "global_step": 116051, "epoch": 2763} {"train_loss": -6.582427978515625, "global_step": 116052, "epoch": 2763} {"train_loss": -6.488586902618408, "global_step": 116053, "epoch": 2763} {"train_loss": -6.534065246582031, "global_step": 116054, "epoch": 2763} {"train_loss": -6.582975387573242, "global_step": 116055, "epoch": 2763} {"train_loss": -6.549072742462158, "global_step": 116056, "epoch": 2763} {"train_loss": -6.351423263549805, "global_step": 116057, "epoch": 2763} {"train_loss": -6.364841461181641, "global_step": 116058, "epoch": 2763} {"train_loss": -6.546815872192383, "global_step": 116059, "epoch": 2763} {"train_loss": -6.3845438957214355, "global_step": 116060, "epoch": 2763} {"train_loss": -6.377309322357178, "global_step": 116061, "epoch": 2763} {"train_loss": -6.4259843826293945, "global_step": 116062, "epoch": 2763} {"train_loss": -6.323970794677734, "global_step": 116063, "epoch": 2763} {"train_loss": -6.5260467529296875, "global_step": 116064, "epoch": 2763} {"train_loss": -6.458586692810059, "global_step": 116065, "epoch": 2763} {"train_loss": -6.460901260375977, "global_step": 116066, "epoch": 2763} {"train_loss": -6.455617904663086, "global_step": 116067, "epoch": 2763} {"train_loss": -6.457993984222412, "global_step": 116068, "epoch": 2763} {"train_loss": -6.500257968902588, "global_step": 116069, "epoch": 2763} {"train_loss": -6.46746826171875, "global_step": 116070, "epoch": 2763} {"train_loss": -6.474750995635986, "global_step": 116071, "epoch": 2763} {"train_loss": -6.631962776184082, "global_step": 116072, "epoch": 2763} {"train_loss": -6.504267692565918, "global_step": 116073, "epoch": 2763} {"train_loss": -6.523914337158203, "global_step": 116074, "epoch": 2763} {"train_loss": -6.543941497802734, "global_step": 116075, "epoch": 2763} {"train_loss": -6.545072555541992, "global_step": 116076, "epoch": 2763} {"train_loss": -6.518721580505371, "global_step": 116077, "epoch": 2763} {"train_loss": -6.545546531677246, "global_step": 116078, "epoch": 2763} {"train_loss": -6.5467400550842285, "global_step": 116079, "epoch": 2763} {"train_loss": -6.484918594360352, "global_step": 116080, "epoch": 2763} {"train_loss": -6.523070812225342, "global_step": 116081, "epoch": 2763} {"train_loss": -6.529218673706055, "global_step": 116082, "epoch": 2763} {"train_loss": -6.380241394042969, "global_step": 116083, "epoch": 2763} {"train_loss": -6.432809352874756, "global_step": 116084, "epoch": 2763} {"train_loss": -6.492474555969238, "global_step": 116085, "epoch": 2763} {"train_loss": -6.462710380554199, "global_step": 116086, "epoch": 2763} {"train_loss": -6.4879849297659735, "global_step": 116087, "epoch": 2763, "val_loss": 67986.75} {"train_loss": -6.508874893188477, "global_step": 116088, "epoch": 2764} {"train_loss": -6.397500038146973, "global_step": 116089, "epoch": 2764} {"train_loss": -6.521900177001953, "global_step": 116090, "epoch": 2764} {"train_loss": -6.446688175201416, "global_step": 116091, "epoch": 2764} {"train_loss": -6.509206771850586, "global_step": 116092, "epoch": 2764} {"train_loss": -6.484964847564697, "global_step": 116093, "epoch": 2764} {"train_loss": -6.376806735992432, "global_step": 116094, "epoch": 2764} {"train_loss": -6.5620574951171875, "global_step": 116095, "epoch": 2764} {"train_loss": -6.542634010314941, "global_step": 116096, "epoch": 2764} {"train_loss": -6.473274230957031, "global_step": 116097, "epoch": 2764} {"train_loss": -6.478703498840332, "global_step": 116098, "epoch": 2764} {"train_loss": -6.489990711212158, "global_step": 116099, "epoch": 2764} {"train_loss": -6.448728561401367, "global_step": 116100, "epoch": 2764} {"train_loss": -6.48626708984375, "global_step": 116101, "epoch": 2764} {"train_loss": -6.450117111206055, "global_step": 116102, "epoch": 2764} {"train_loss": -6.581920623779297, "global_step": 116103, "epoch": 2764} {"train_loss": -6.45389461517334, "global_step": 116104, "epoch": 2764} {"train_loss": -6.355880260467529, "global_step": 116105, "epoch": 2764} {"train_loss": -6.4861063957214355, "global_step": 116106, "epoch": 2764} {"train_loss": -6.375699996948242, "global_step": 116107, "epoch": 2764} {"train_loss": -6.537553787231445, "global_step": 116108, "epoch": 2764} {"train_loss": -6.447964668273926, "global_step": 116109, "epoch": 2764} {"train_loss": -6.403165817260742, "global_step": 116110, "epoch": 2764} {"train_loss": -6.45127010345459, "global_step": 116111, "epoch": 2764} {"train_loss": -6.361374378204346, "global_step": 116112, "epoch": 2764} {"train_loss": -6.474484920501709, "global_step": 116113, "epoch": 2764} {"train_loss": -6.485019207000732, "global_step": 116114, "epoch": 2764} {"train_loss": -6.317309379577637, "global_step": 116115, "epoch": 2764} {"train_loss": -6.514534950256348, "global_step": 116116, "epoch": 2764} {"train_loss": -6.4748101234436035, "global_step": 116117, "epoch": 2764} {"train_loss": -6.506997108459473, "global_step": 116118, "epoch": 2764} {"train_loss": -6.399828910827637, "global_step": 116119, "epoch": 2764} {"train_loss": -6.611141204833984, "global_step": 116120, "epoch": 2764} {"train_loss": -6.535865783691406, "global_step": 116121, "epoch": 2764} {"train_loss": -6.366353988647461, "global_step": 116122, "epoch": 2764} {"train_loss": -6.46092414855957, "global_step": 116123, "epoch": 2764} {"train_loss": -6.413773536682129, "global_step": 116124, "epoch": 2764} {"train_loss": -6.411550521850586, "global_step": 116125, "epoch": 2764} {"train_loss": -6.455463409423828, "global_step": 116126, "epoch": 2764} {"train_loss": -6.376914978027344, "global_step": 116127, "epoch": 2764} {"train_loss": -6.49764347076416, "global_step": 116128, "epoch": 2764} {"train_loss": -6.459893328802926, "global_step": 116129, "epoch": 2764, "val_loss": 67917.7578125} {"train_loss": -6.527415752410889, "global_step": 116130, "epoch": 2765} {"train_loss": -6.714656829833984, "global_step": 116131, "epoch": 2765} {"train_loss": -6.530559539794922, "global_step": 116132, "epoch": 2765} {"train_loss": -6.504435062408447, "global_step": 116133, "epoch": 2765} {"train_loss": -6.533794403076172, "global_step": 116134, "epoch": 2765} {"train_loss": -6.5670390129089355, "global_step": 116135, "epoch": 2765} {"train_loss": -6.614022254943848, "global_step": 116136, "epoch": 2765} {"train_loss": -6.640201568603516, "global_step": 116137, "epoch": 2765} {"train_loss": -6.497032165527344, "global_step": 116138, "epoch": 2765} {"train_loss": -6.493393421173096, "global_step": 116139, "epoch": 2765} {"train_loss": -6.525739669799805, "global_step": 116140, "epoch": 2765} {"train_loss": -6.571715354919434, "global_step": 116141, "epoch": 2765} {"train_loss": -6.53264856338501, "global_step": 116142, "epoch": 2765} {"train_loss": -6.430347442626953, "global_step": 116143, "epoch": 2765} {"train_loss": -6.585340976715088, "global_step": 116144, "epoch": 2765} {"train_loss": -6.600869178771973, "global_step": 116145, "epoch": 2765} {"train_loss": -6.435413360595703, "global_step": 116146, "epoch": 2765} {"train_loss": -6.564683437347412, "global_step": 116147, "epoch": 2765} {"train_loss": -6.634227752685547, "global_step": 116148, "epoch": 2765} {"train_loss": -6.584872245788574, "global_step": 116149, "epoch": 2765} {"train_loss": -6.704709053039551, "global_step": 116150, "epoch": 2765} {"train_loss": -6.419023513793945, "global_step": 116151, "epoch": 2765} {"train_loss": -6.3601179122924805, "global_step": 116152, "epoch": 2765} {"train_loss": -6.619543552398682, "global_step": 116153, "epoch": 2765} {"train_loss": -6.47907829284668, "global_step": 116154, "epoch": 2765} {"train_loss": -6.445236682891846, "global_step": 116155, "epoch": 2765} {"train_loss": -6.5070648193359375, "global_step": 116156, "epoch": 2765} {"train_loss": -6.446893692016602, "global_step": 116157, "epoch": 2765} {"train_loss": -6.507587432861328, "global_step": 116158, "epoch": 2765} {"train_loss": -6.539098262786865, "global_step": 116159, "epoch": 2765} {"train_loss": -6.5451979637146, "global_step": 116160, "epoch": 2765} {"train_loss": -6.603070259094238, "global_step": 116161, "epoch": 2765} {"train_loss": -6.487293243408203, "global_step": 116162, "epoch": 2765} {"train_loss": -6.496817111968994, "global_step": 116163, "epoch": 2765} {"train_loss": -6.462248802185059, "global_step": 116164, "epoch": 2765} {"train_loss": -6.5618743896484375, "global_step": 116165, "epoch": 2765} {"train_loss": -6.440526962280273, "global_step": 116166, "epoch": 2765} {"train_loss": -6.512217998504639, "global_step": 116167, "epoch": 2765} {"train_loss": -6.532543659210205, "global_step": 116168, "epoch": 2765} {"train_loss": -6.578409194946289, "global_step": 116169, "epoch": 2765} {"train_loss": -6.559182167053223, "global_step": 116170, "epoch": 2765} {"train_loss": -6.533661717460269, "global_step": 116171, "epoch": 2765, "val_loss": 67836.1328125} {"train_loss": -6.400998115539551, "global_step": 116172, "epoch": 2766} {"train_loss": -6.465573787689209, "global_step": 116173, "epoch": 2766} {"train_loss": -6.482472896575928, "global_step": 116174, "epoch": 2766} {"train_loss": -6.483006477355957, "global_step": 116175, "epoch": 2766} {"train_loss": -6.495763301849365, "global_step": 116176, "epoch": 2766} {"train_loss": -6.505203723907471, "global_step": 116177, "epoch": 2766} {"train_loss": -6.463582992553711, "global_step": 116178, "epoch": 2766} {"train_loss": -6.588679313659668, "global_step": 116179, "epoch": 2766} {"train_loss": -6.466550827026367, "global_step": 116180, "epoch": 2766} {"train_loss": -6.323031425476074, "global_step": 116181, "epoch": 2766} {"train_loss": -6.481534481048584, "global_step": 116182, "epoch": 2766} {"train_loss": -6.370312690734863, "global_step": 116183, "epoch": 2766} {"train_loss": -6.436654090881348, "global_step": 116184, "epoch": 2766} {"train_loss": -6.46282434463501, "global_step": 116185, "epoch": 2766} {"train_loss": -6.51728630065918, "global_step": 116186, "epoch": 2766} {"train_loss": -6.519964218139648, "global_step": 116187, "epoch": 2766} {"train_loss": -6.586345195770264, "global_step": 116188, "epoch": 2766} {"train_loss": -6.4908294677734375, "global_step": 116189, "epoch": 2766} {"train_loss": -6.5470499992370605, "global_step": 116190, "epoch": 2766} {"train_loss": -6.3432722091674805, "global_step": 116191, "epoch": 2766} {"train_loss": -6.453970432281494, "global_step": 116192, "epoch": 2766} {"train_loss": -6.498565196990967, "global_step": 116193, "epoch": 2766} {"train_loss": -6.533262252807617, "global_step": 116194, "epoch": 2766} {"train_loss": -6.571399688720703, "global_step": 116195, "epoch": 2766} {"train_loss": -6.4822492599487305, "global_step": 116196, "epoch": 2766} {"train_loss": -6.479801177978516, "global_step": 116197, "epoch": 2766} {"train_loss": -6.438448429107666, "global_step": 116198, "epoch": 2766} {"train_loss": -6.47124719619751, "global_step": 116199, "epoch": 2766} {"train_loss": -6.464241981506348, "global_step": 116200, "epoch": 2766} {"train_loss": -6.421226501464844, "global_step": 116201, "epoch": 2766} {"train_loss": -6.400774002075195, "global_step": 116202, "epoch": 2766} {"train_loss": -6.486106872558594, "global_step": 116203, "epoch": 2766} {"train_loss": -6.387779235839844, "global_step": 116204, "epoch": 2766} {"train_loss": -6.5963311195373535, "global_step": 116205, "epoch": 2766} {"train_loss": -6.385040760040283, "global_step": 116206, "epoch": 2766} {"train_loss": -6.420143127441406, "global_step": 116207, "epoch": 2766} {"train_loss": -6.508309364318848, "global_step": 116208, "epoch": 2766} {"train_loss": -6.478941917419434, "global_step": 116209, "epoch": 2766} {"train_loss": -6.492681503295898, "global_step": 116210, "epoch": 2766} {"train_loss": -6.397600173950195, "global_step": 116211, "epoch": 2766} {"train_loss": -6.486629486083984, "global_step": 116212, "epoch": 2766} {"train_loss": -6.4714279515402655, "global_step": 116213, "epoch": 2766, "val_loss": 68040.375} {"train_loss": -6.423190116882324, "global_step": 116214, "epoch": 2767} {"train_loss": -6.498941421508789, "global_step": 116215, "epoch": 2767} {"train_loss": -6.479692459106445, "global_step": 116216, "epoch": 2767} {"train_loss": -6.460642337799072, "global_step": 116217, "epoch": 2767} {"train_loss": -6.453855037689209, "global_step": 116218, "epoch": 2767} {"train_loss": -6.415952205657959, "global_step": 116219, "epoch": 2767} {"train_loss": -6.540284633636475, "global_step": 116220, "epoch": 2767} {"train_loss": -6.533666133880615, "global_step": 116221, "epoch": 2767} {"train_loss": -6.443540573120117, "global_step": 116222, "epoch": 2767} {"train_loss": -6.563863754272461, "global_step": 116223, "epoch": 2767} {"train_loss": -6.576300621032715, "global_step": 116224, "epoch": 2767} {"train_loss": -6.515118598937988, "global_step": 116225, "epoch": 2767} {"train_loss": -6.510688781738281, "global_step": 116226, "epoch": 2767} {"train_loss": -6.503560543060303, "global_step": 116227, "epoch": 2767} {"train_loss": -6.517726421356201, "global_step": 116228, "epoch": 2767} {"train_loss": -6.4255523681640625, "global_step": 116229, "epoch": 2767} {"train_loss": -6.451481819152832, "global_step": 116230, "epoch": 2767} {"train_loss": -6.568050384521484, "global_step": 116231, "epoch": 2767} {"train_loss": -6.527817726135254, "global_step": 116232, "epoch": 2767} {"train_loss": -6.483730316162109, "global_step": 116233, "epoch": 2767} {"train_loss": -6.341544151306152, "global_step": 116234, "epoch": 2767} {"train_loss": -6.50803804397583, "global_step": 116235, "epoch": 2767} {"train_loss": -6.48709774017334, "global_step": 116236, "epoch": 2767} {"train_loss": -6.45922327041626, "global_step": 116237, "epoch": 2767} {"train_loss": -6.443875789642334, "global_step": 116238, "epoch": 2767} {"train_loss": -6.4852423667907715, "global_step": 116239, "epoch": 2767} {"train_loss": -6.432435989379883, "global_step": 116240, "epoch": 2767} {"train_loss": -6.50566291809082, "global_step": 116241, "epoch": 2767} {"train_loss": -6.469967842102051, "global_step": 116242, "epoch": 2767} {"train_loss": -6.443247318267822, "global_step": 116243, "epoch": 2767} {"train_loss": -6.484946250915527, "global_step": 116244, "epoch": 2767} {"train_loss": -6.623402118682861, "global_step": 116245, "epoch": 2767} {"train_loss": -6.503696918487549, "global_step": 116246, "epoch": 2767} {"train_loss": -6.388542652130127, "global_step": 116247, "epoch": 2767} {"train_loss": -6.627553939819336, "global_step": 116248, "epoch": 2767} {"train_loss": -6.532981872558594, "global_step": 116249, "epoch": 2767} {"train_loss": -6.5287580490112305, "global_step": 116250, "epoch": 2767} {"train_loss": -6.543086051940918, "global_step": 116251, "epoch": 2767} {"train_loss": -6.471083641052246, "global_step": 116252, "epoch": 2767} {"train_loss": -6.530961513519287, "global_step": 116253, "epoch": 2767} {"train_loss": -6.409291744232178, "global_step": 116254, "epoch": 2767} {"train_loss": -6.491545506886074, "global_step": 116255, "epoch": 2767, "val_loss": 67913.4921875} {"train_loss": -6.458863258361816, "global_step": 116256, "epoch": 2768} {"train_loss": -6.5249786376953125, "global_step": 116257, "epoch": 2768} {"train_loss": -6.536264896392822, "global_step": 116258, "epoch": 2768} {"train_loss": -6.632749557495117, "global_step": 116259, "epoch": 2768} {"train_loss": -6.565939903259277, "global_step": 116260, "epoch": 2768} {"train_loss": -6.636288642883301, "global_step": 116261, "epoch": 2768} {"train_loss": -6.574373245239258, "global_step": 116262, "epoch": 2768} {"train_loss": -6.4628729820251465, "global_step": 116263, "epoch": 2768} {"train_loss": -6.462525367736816, "global_step": 116264, "epoch": 2768} {"train_loss": -6.5377607345581055, "global_step": 116265, "epoch": 2768} {"train_loss": -6.543130874633789, "global_step": 116266, "epoch": 2768} {"train_loss": -6.389704704284668, "global_step": 116267, "epoch": 2768} {"train_loss": -6.52650260925293, "global_step": 116268, "epoch": 2768} {"train_loss": -6.542600631713867, "global_step": 116269, "epoch": 2768} {"train_loss": -6.406689643859863, "global_step": 116270, "epoch": 2768} {"train_loss": -6.519543647766113, "global_step": 116271, "epoch": 2768} {"train_loss": -6.476910591125488, "global_step": 116272, "epoch": 2768} {"train_loss": -6.547631740570068, "global_step": 116273, "epoch": 2768} {"train_loss": -6.433524131774902, "global_step": 116274, "epoch": 2768} {"train_loss": -6.546650409698486, "global_step": 116275, "epoch": 2768} {"train_loss": -6.485569477081299, "global_step": 116276, "epoch": 2768} {"train_loss": -6.519343376159668, "global_step": 116277, "epoch": 2768} {"train_loss": -6.6157355308532715, "global_step": 116278, "epoch": 2768} {"train_loss": -6.477386474609375, "global_step": 116279, "epoch": 2768} {"train_loss": -6.422760963439941, "global_step": 116280, "epoch": 2768} {"train_loss": -6.341754913330078, "global_step": 116281, "epoch": 2768} {"train_loss": -6.469038009643555, "global_step": 116282, "epoch": 2768} {"train_loss": -6.413714408874512, "global_step": 116283, "epoch": 2768} {"train_loss": -6.306361198425293, "global_step": 116284, "epoch": 2768} {"train_loss": -6.405237197875977, "global_step": 116285, "epoch": 2768} {"train_loss": -6.466582298278809, "global_step": 116286, "epoch": 2768} {"train_loss": -6.341032028198242, "global_step": 116287, "epoch": 2768} {"train_loss": -6.498954772949219, "global_step": 116288, "epoch": 2768} {"train_loss": -6.3698649406433105, "global_step": 116289, "epoch": 2768} {"train_loss": -6.563570976257324, "global_step": 116290, "epoch": 2768} {"train_loss": -6.609084606170654, "global_step": 116291, "epoch": 2768} {"train_loss": -6.546104431152344, "global_step": 116292, "epoch": 2768} {"train_loss": -6.4412689208984375, "global_step": 116293, "epoch": 2768} {"train_loss": -6.535521507263184, "global_step": 116294, "epoch": 2768} {"train_loss": -6.522181510925293, "global_step": 116295, "epoch": 2768} {"train_loss": -6.508474826812744, "global_step": 116296, "epoch": 2768} {"train_loss": -6.49399825504848, "global_step": 116297, "epoch": 2768, "val_loss": 67962.3046875} {"train_loss": -6.553077220916748, "global_step": 116298, "epoch": 2769} {"train_loss": -6.431541442871094, "global_step": 116299, "epoch": 2769} {"train_loss": -6.505876541137695, "global_step": 116300, "epoch": 2769} {"train_loss": -6.486098766326904, "global_step": 116301, "epoch": 2769} {"train_loss": -6.522122383117676, "global_step": 116302, "epoch": 2769} {"train_loss": -6.5314106941223145, "global_step": 116303, "epoch": 2769} {"train_loss": -6.484773635864258, "global_step": 116304, "epoch": 2769} {"train_loss": -6.433080196380615, "global_step": 116305, "epoch": 2769} {"train_loss": -6.52705192565918, "global_step": 116306, "epoch": 2769} {"train_loss": -6.53865385055542, "global_step": 116307, "epoch": 2769} {"train_loss": -6.600619316101074, "global_step": 116308, "epoch": 2769} {"train_loss": -6.5500874519348145, "global_step": 116309, "epoch": 2769} {"train_loss": -6.577861785888672, "global_step": 116310, "epoch": 2769} {"train_loss": -6.572075843811035, "global_step": 116311, "epoch": 2769} {"train_loss": -6.498679161071777, "global_step": 116312, "epoch": 2769} {"train_loss": -6.520000457763672, "global_step": 116313, "epoch": 2769} {"train_loss": -6.481997966766357, "global_step": 116314, "epoch": 2769} {"train_loss": -6.565739631652832, "global_step": 116315, "epoch": 2769} {"train_loss": -6.323347091674805, "global_step": 116316, "epoch": 2769} {"train_loss": -6.479945182800293, "global_step": 116317, "epoch": 2769} {"train_loss": -6.551708698272705, "global_step": 116318, "epoch": 2769} {"train_loss": -6.329381942749023, "global_step": 116319, "epoch": 2769} {"train_loss": -6.4270830154418945, "global_step": 116320, "epoch": 2769} {"train_loss": -6.543572425842285, "global_step": 116321, "epoch": 2769} {"train_loss": -6.3989152908325195, "global_step": 116322, "epoch": 2769} {"train_loss": -6.550581455230713, "global_step": 116323, "epoch": 2769} {"train_loss": -6.477295875549316, "global_step": 116324, "epoch": 2769} {"train_loss": -6.4163055419921875, "global_step": 116325, "epoch": 2769} {"train_loss": -6.584089279174805, "global_step": 116326, "epoch": 2769} {"train_loss": -6.574176788330078, "global_step": 116327, "epoch": 2769} {"train_loss": -6.543370723724365, "global_step": 116328, "epoch": 2769} {"train_loss": -6.539673328399658, "global_step": 116329, "epoch": 2769} {"train_loss": -6.488487243652344, "global_step": 116330, "epoch": 2769} {"train_loss": -6.43192195892334, "global_step": 116331, "epoch": 2769} {"train_loss": -6.465405464172363, "global_step": 116332, "epoch": 2769} {"train_loss": -6.480362415313721, "global_step": 116333, "epoch": 2769} {"train_loss": -6.581724166870117, "global_step": 116334, "epoch": 2769} {"train_loss": -6.438891887664795, "global_step": 116335, "epoch": 2769} {"train_loss": -6.551750183105469, "global_step": 116336, "epoch": 2769} {"train_loss": -6.6286821365356445, "global_step": 116337, "epoch": 2769} {"train_loss": -6.557456016540527, "global_step": 116338, "epoch": 2769} {"train_loss": -6.506055343718756, "global_step": 116339, "epoch": 2769, "val_loss": 67881.5546875} {"train_loss": -6.587704658508301, "global_step": 116340, "epoch": 2770} {"train_loss": -6.526973724365234, "global_step": 116341, "epoch": 2770} {"train_loss": -6.485405921936035, "global_step": 116342, "epoch": 2770} {"train_loss": -6.514615058898926, "global_step": 116343, "epoch": 2770} {"train_loss": -6.5811262130737305, "global_step": 116344, "epoch": 2770} {"train_loss": -6.564715385437012, "global_step": 116345, "epoch": 2770} {"train_loss": -6.487375259399414, "global_step": 116346, "epoch": 2770} {"train_loss": -6.4133076667785645, "global_step": 116347, "epoch": 2770} {"train_loss": -6.460231304168701, "global_step": 116348, "epoch": 2770} {"train_loss": -6.605910301208496, "global_step": 116349, "epoch": 2770} {"train_loss": -6.41866397857666, "global_step": 116350, "epoch": 2770} {"train_loss": -6.507762908935547, "global_step": 116351, "epoch": 2770} {"train_loss": -6.377300262451172, "global_step": 116352, "epoch": 2770} {"train_loss": -6.518263816833496, "global_step": 116353, "epoch": 2770} {"train_loss": -6.44639778137207, "global_step": 116354, "epoch": 2770} {"train_loss": -6.597578048706055, "global_step": 116355, "epoch": 2770} {"train_loss": -6.421121597290039, "global_step": 116356, "epoch": 2770} {"train_loss": -6.428936958312988, "global_step": 116357, "epoch": 2770} {"train_loss": -6.4608612060546875, "global_step": 116358, "epoch": 2770} {"train_loss": -6.459955215454102, "global_step": 116359, "epoch": 2770} {"train_loss": -6.57537317276001, "global_step": 116360, "epoch": 2770} {"train_loss": -6.590649127960205, "global_step": 116361, "epoch": 2770} {"train_loss": -6.459849834442139, "global_step": 116362, "epoch": 2770} {"train_loss": -6.465367794036865, "global_step": 116363, "epoch": 2770} {"train_loss": -6.468866348266602, "global_step": 116364, "epoch": 2770} {"train_loss": -6.481320858001709, "global_step": 116365, "epoch": 2770} {"train_loss": -6.520337104797363, "global_step": 116366, "epoch": 2770} {"train_loss": -6.5263671875, "global_step": 116367, "epoch": 2770} {"train_loss": -6.558406829833984, "global_step": 116368, "epoch": 2770} {"train_loss": -6.513801574707031, "global_step": 116369, "epoch": 2770} {"train_loss": -6.578505516052246, "global_step": 116370, "epoch": 2770} {"train_loss": -6.618947982788086, "global_step": 116371, "epoch": 2770} {"train_loss": -6.502870082855225, "global_step": 116372, "epoch": 2770} {"train_loss": -6.485546112060547, "global_step": 116373, "epoch": 2770} {"train_loss": -6.445178985595703, "global_step": 116374, "epoch": 2770} {"train_loss": -6.5861639976501465, "global_step": 116375, "epoch": 2770} {"train_loss": -6.496912956237793, "global_step": 116376, "epoch": 2770} {"train_loss": -6.511162281036377, "global_step": 116377, "epoch": 2770} {"train_loss": -6.471327781677246, "global_step": 116378, "epoch": 2770} {"train_loss": -6.446308135986328, "global_step": 116379, "epoch": 2770} {"train_loss": -6.554507732391357, "global_step": 116380, "epoch": 2770} {"train_loss": -6.503115653991699, "global_step": 116381, "epoch": 2770, "val_loss": 67831.6015625} {"train_loss": -6.432405948638916, "global_step": 116382, "epoch": 2771} {"train_loss": -6.3586812019348145, "global_step": 116383, "epoch": 2771} {"train_loss": -6.513388633728027, "global_step": 116384, "epoch": 2771} {"train_loss": -6.555993556976318, "global_step": 116385, "epoch": 2771} {"train_loss": -6.449499130249023, "global_step": 116386, "epoch": 2771} {"train_loss": -6.485878944396973, "global_step": 116387, "epoch": 2771} {"train_loss": -6.5104756355285645, "global_step": 116388, "epoch": 2771} {"train_loss": -6.626614570617676, "global_step": 116389, "epoch": 2771} {"train_loss": -6.563244819641113, "global_step": 116390, "epoch": 2771} {"train_loss": -6.556685924530029, "global_step": 116391, "epoch": 2771} {"train_loss": -6.590263366699219, "global_step": 116392, "epoch": 2771} {"train_loss": -6.440962791442871, "global_step": 116393, "epoch": 2771} {"train_loss": -6.488771438598633, "global_step": 116394, "epoch": 2771} {"train_loss": -6.46419620513916, "global_step": 116395, "epoch": 2771} {"train_loss": -6.527911186218262, "global_step": 116396, "epoch": 2771} {"train_loss": -6.386745452880859, "global_step": 116397, "epoch": 2771} {"train_loss": -6.463234901428223, "global_step": 116398, "epoch": 2771} {"train_loss": -6.494334697723389, "global_step": 116399, "epoch": 2771} {"train_loss": -6.462862014770508, "global_step": 116400, "epoch": 2771} {"train_loss": -6.475926876068115, "global_step": 116401, "epoch": 2771} {"train_loss": -6.48259162902832, "global_step": 116402, "epoch": 2771} {"train_loss": -6.498653888702393, "global_step": 116403, "epoch": 2771} {"train_loss": -6.5197248458862305, "global_step": 116404, "epoch": 2771} {"train_loss": -6.4405622482299805, "global_step": 116405, "epoch": 2771} {"train_loss": -6.5455522537231445, "global_step": 116406, "epoch": 2771} {"train_loss": -6.4710693359375, "global_step": 116407, "epoch": 2771} {"train_loss": -6.604859828948975, "global_step": 116408, "epoch": 2771} {"train_loss": -6.482990741729736, "global_step": 116409, "epoch": 2771} {"train_loss": -6.601991176605225, "global_step": 116410, "epoch": 2771} {"train_loss": -6.529824256896973, "global_step": 116411, "epoch": 2771} {"train_loss": -6.468020915985107, "global_step": 116412, "epoch": 2771} {"train_loss": -6.4847846031188965, "global_step": 116413, "epoch": 2771} {"train_loss": -6.550765514373779, "global_step": 116414, "epoch": 2771} {"train_loss": -6.555037498474121, "global_step": 116415, "epoch": 2771} {"train_loss": -6.45050573348999, "global_step": 116416, "epoch": 2771} {"train_loss": -6.520367622375488, "global_step": 116417, "epoch": 2771} {"train_loss": -6.562570571899414, "global_step": 116418, "epoch": 2771} {"train_loss": -6.495846748352051, "global_step": 116419, "epoch": 2771} {"train_loss": -6.59857702255249, "global_step": 116420, "epoch": 2771} {"train_loss": -6.470301628112793, "global_step": 116421, "epoch": 2771} {"train_loss": -6.607661247253418, "global_step": 116422, "epoch": 2771} {"train_loss": -6.509323812666393, "global_step": 116423, "epoch": 2771, "val_loss": 67914.703125} {"train_loss": -6.5658979415893555, "global_step": 116424, "epoch": 2772} {"train_loss": -6.567767143249512, "global_step": 116425, "epoch": 2772} {"train_loss": -6.556704521179199, "global_step": 116426, "epoch": 2772} {"train_loss": -6.497281074523926, "global_step": 116427, "epoch": 2772} {"train_loss": -6.590388298034668, "global_step": 116428, "epoch": 2772} {"train_loss": -6.424535751342773, "global_step": 116429, "epoch": 2772} {"train_loss": -6.443233489990234, "global_step": 116430, "epoch": 2772} {"train_loss": -6.4487762451171875, "global_step": 116431, "epoch": 2772} {"train_loss": -6.496091365814209, "global_step": 116432, "epoch": 2772} {"train_loss": -6.520435333251953, "global_step": 116433, "epoch": 2772} {"train_loss": -6.577199935913086, "global_step": 116434, "epoch": 2772} {"train_loss": -6.534310817718506, "global_step": 116435, "epoch": 2772} {"train_loss": -6.466883659362793, "global_step": 116436, "epoch": 2772} {"train_loss": -6.494260787963867, "global_step": 116437, "epoch": 2772} {"train_loss": -6.519855499267578, "global_step": 116438, "epoch": 2772} {"train_loss": -6.575306415557861, "global_step": 116439, "epoch": 2772} {"train_loss": -6.515927314758301, "global_step": 116440, "epoch": 2772} {"train_loss": -6.558148384094238, "global_step": 116441, "epoch": 2772} {"train_loss": -6.465076446533203, "global_step": 116442, "epoch": 2772} {"train_loss": -6.549114227294922, "global_step": 116443, "epoch": 2772} {"train_loss": -6.545031547546387, "global_step": 116444, "epoch": 2772} {"train_loss": -6.563175201416016, "global_step": 116445, "epoch": 2772} {"train_loss": -6.471367359161377, "global_step": 116446, "epoch": 2772} {"train_loss": -6.509272575378418, "global_step": 116447, "epoch": 2772} {"train_loss": -6.493363380432129, "global_step": 116448, "epoch": 2772} {"train_loss": -6.332803726196289, "global_step": 116449, "epoch": 2772} {"train_loss": -6.44950008392334, "global_step": 116450, "epoch": 2772} {"train_loss": -6.482210636138916, "global_step": 116451, "epoch": 2772} {"train_loss": -6.414101600646973, "global_step": 116452, "epoch": 2772} {"train_loss": -6.464849472045898, "global_step": 116453, "epoch": 2772} {"train_loss": -6.424298286437988, "global_step": 116454, "epoch": 2772} {"train_loss": -6.602021217346191, "global_step": 116455, "epoch": 2772} {"train_loss": -6.3153204917907715, "global_step": 116456, "epoch": 2772} {"train_loss": -6.4784464836120605, "global_step": 116457, "epoch": 2772} {"train_loss": -6.301483631134033, "global_step": 116458, "epoch": 2772} {"train_loss": -6.465702056884766, "global_step": 116459, "epoch": 2772} {"train_loss": -6.4668965339660645, "global_step": 116460, "epoch": 2772} {"train_loss": -6.493444919586182, "global_step": 116461, "epoch": 2772} {"train_loss": -6.549488544464111, "global_step": 116462, "epoch": 2772} {"train_loss": -6.395318031311035, "global_step": 116463, "epoch": 2772} {"train_loss": -6.535386085510254, "global_step": 116464, "epoch": 2772} {"train_loss": -6.491833323524112, "global_step": 116465, "epoch": 2772, "val_loss": 67852.4609375} {"train_loss": -6.371665000915527, "global_step": 116466, "epoch": 2773} {"train_loss": -6.600334167480469, "global_step": 116467, "epoch": 2773} {"train_loss": -6.578377723693848, "global_step": 116468, "epoch": 2773} {"train_loss": -6.572002410888672, "global_step": 116469, "epoch": 2773} {"train_loss": -6.645161151885986, "global_step": 116470, "epoch": 2773} {"train_loss": -6.5327630043029785, "global_step": 116471, "epoch": 2773} {"train_loss": -6.473089694976807, "global_step": 116472, "epoch": 2773} {"train_loss": -6.6123247146606445, "global_step": 116473, "epoch": 2773} {"train_loss": -6.449911117553711, "global_step": 116474, "epoch": 2773} {"train_loss": -6.524123191833496, "global_step": 116475, "epoch": 2773} {"train_loss": -6.408906936645508, "global_step": 116476, "epoch": 2773} {"train_loss": -6.542145729064941, "global_step": 116477, "epoch": 2773} {"train_loss": -6.539870262145996, "global_step": 116478, "epoch": 2773} {"train_loss": -6.44672966003418, "global_step": 116479, "epoch": 2773} {"train_loss": -6.464702606201172, "global_step": 116480, "epoch": 2773} {"train_loss": -6.445683479309082, "global_step": 116481, "epoch": 2773} {"train_loss": -6.575693130493164, "global_step": 116482, "epoch": 2773} {"train_loss": -6.506615161895752, "global_step": 116483, "epoch": 2773} {"train_loss": -6.522524356842041, "global_step": 116484, "epoch": 2773} {"train_loss": -6.5285749435424805, "global_step": 116485, "epoch": 2773} {"train_loss": -6.523818016052246, "global_step": 116486, "epoch": 2773} {"train_loss": -6.490194320678711, "global_step": 116487, "epoch": 2773} {"train_loss": -6.554229259490967, "global_step": 116488, "epoch": 2773} {"train_loss": -6.467700958251953, "global_step": 116489, "epoch": 2773} {"train_loss": -6.446741104125977, "global_step": 116490, "epoch": 2773} {"train_loss": -6.563371658325195, "global_step": 116491, "epoch": 2773} {"train_loss": -6.582018852233887, "global_step": 116492, "epoch": 2773} {"train_loss": -6.559715747833252, "global_step": 116493, "epoch": 2773} {"train_loss": -6.472038745880127, "global_step": 116494, "epoch": 2773} {"train_loss": -6.61696720123291, "global_step": 116495, "epoch": 2773} {"train_loss": -6.636258125305176, "global_step": 116496, "epoch": 2773} {"train_loss": -6.552341461181641, "global_step": 116497, "epoch": 2773} {"train_loss": -6.470562934875488, "global_step": 116498, "epoch": 2773} {"train_loss": -6.546504974365234, "global_step": 116499, "epoch": 2773} {"train_loss": -6.620551109313965, "global_step": 116500, "epoch": 2773} {"train_loss": -6.46502161026001, "global_step": 116501, "epoch": 2773} {"train_loss": -6.424635887145996, "global_step": 116502, "epoch": 2773} {"train_loss": -6.478631973266602, "global_step": 116503, "epoch": 2773} {"train_loss": -6.462087631225586, "global_step": 116504, "epoch": 2773} {"train_loss": -6.458759784698486, "global_step": 116505, "epoch": 2773} {"train_loss": -6.427609443664551, "global_step": 116506, "epoch": 2773} {"train_loss": -6.517257917495001, "global_step": 116507, "epoch": 2773, "val_loss": 68097.6484375} {"train_loss": -6.457784652709961, "global_step": 116508, "epoch": 2774} {"train_loss": -6.451600074768066, "global_step": 116509, "epoch": 2774} {"train_loss": -6.590830326080322, "global_step": 116510, "epoch": 2774} {"train_loss": -6.348975658416748, "global_step": 116511, "epoch": 2774} {"train_loss": -6.520724296569824, "global_step": 116512, "epoch": 2774} {"train_loss": -6.311500549316406, "global_step": 116513, "epoch": 2774} {"train_loss": -6.223240852355957, "global_step": 116514, "epoch": 2774} {"train_loss": -6.5700483322143555, "global_step": 116515, "epoch": 2774} {"train_loss": -6.185845851898193, "global_step": 116516, "epoch": 2774} {"train_loss": -6.3951416015625, "global_step": 116517, "epoch": 2774} {"train_loss": -6.350027084350586, "global_step": 116518, "epoch": 2774} {"train_loss": -6.358599662780762, "global_step": 116519, "epoch": 2774} {"train_loss": -6.310973167419434, "global_step": 116520, "epoch": 2774} {"train_loss": -6.284645080566406, "global_step": 116521, "epoch": 2774} {"train_loss": -6.365342617034912, "global_step": 116522, "epoch": 2774} {"train_loss": -6.363278388977051, "global_step": 116523, "epoch": 2774} {"train_loss": -6.392611980438232, "global_step": 116524, "epoch": 2774} {"train_loss": -6.31911039352417, "global_step": 116525, "epoch": 2774} {"train_loss": -6.225980758666992, "global_step": 116526, "epoch": 2774} {"train_loss": -6.364631652832031, "global_step": 116527, "epoch": 2774} {"train_loss": -6.281237602233887, "global_step": 116528, "epoch": 2774} {"train_loss": -6.388527870178223, "global_step": 116529, "epoch": 2774} {"train_loss": -6.3319854736328125, "global_step": 116530, "epoch": 2774} {"train_loss": -6.478652000427246, "global_step": 116531, "epoch": 2774} {"train_loss": -6.367115020751953, "global_step": 116532, "epoch": 2774} {"train_loss": -6.42434024810791, "global_step": 116533, "epoch": 2774} {"train_loss": -6.367234706878662, "global_step": 116534, "epoch": 2774} {"train_loss": -6.449031829833984, "global_step": 116535, "epoch": 2774} {"train_loss": -6.41489315032959, "global_step": 116536, "epoch": 2774} {"train_loss": -6.479079246520996, "global_step": 116537, "epoch": 2774} {"train_loss": -6.329302787780762, "global_step": 116538, "epoch": 2774} {"train_loss": -6.4803571701049805, "global_step": 116539, "epoch": 2774} {"train_loss": -6.417628288269043, "global_step": 116540, "epoch": 2774} {"train_loss": -6.392910003662109, "global_step": 116541, "epoch": 2774} {"train_loss": -6.374914169311523, "global_step": 116542, "epoch": 2774} {"train_loss": -6.4606547355651855, "global_step": 116543, "epoch": 2774} {"train_loss": -6.433962821960449, "global_step": 116544, "epoch": 2774} {"train_loss": -6.542390823364258, "global_step": 116545, "epoch": 2774} {"train_loss": -6.420310974121094, "global_step": 116546, "epoch": 2774} {"train_loss": -6.424715042114258, "global_step": 116547, "epoch": 2774} {"train_loss": -6.386051177978516, "global_step": 116548, "epoch": 2774} {"train_loss": -6.389471213022868, "global_step": 116549, "epoch": 2774, "val_loss": 67806.0390625} {"train_loss": -6.530179500579834, "global_step": 116550, "epoch": 2775} {"train_loss": -6.377963066101074, "global_step": 116551, "epoch": 2775} {"train_loss": -6.446906089782715, "global_step": 116552, "epoch": 2775} {"train_loss": -6.471384048461914, "global_step": 116553, "epoch": 2775} {"train_loss": -6.378767967224121, "global_step": 116554, "epoch": 2775} {"train_loss": -6.587549686431885, "global_step": 116555, "epoch": 2775} {"train_loss": -6.424755096435547, "global_step": 116556, "epoch": 2775} {"train_loss": -6.553114891052246, "global_step": 116557, "epoch": 2775} {"train_loss": -6.37874698638916, "global_step": 116558, "epoch": 2775} {"train_loss": -6.511744499206543, "global_step": 116559, "epoch": 2775} {"train_loss": -6.525712966918945, "global_step": 116560, "epoch": 2775} {"train_loss": -6.573968887329102, "global_step": 116561, "epoch": 2775} {"train_loss": -6.526044845581055, "global_step": 116562, "epoch": 2775} {"train_loss": -6.519749641418457, "global_step": 116563, "epoch": 2775} {"train_loss": -6.499154567718506, "global_step": 116564, "epoch": 2775} {"train_loss": -6.489937782287598, "global_step": 116565, "epoch": 2775} {"train_loss": -6.514564514160156, "global_step": 116566, "epoch": 2775} {"train_loss": -6.4536943435668945, "global_step": 116567, "epoch": 2775} {"train_loss": -6.574414253234863, "global_step": 116568, "epoch": 2775} {"train_loss": -6.467048168182373, "global_step": 116569, "epoch": 2775} {"train_loss": -6.572179794311523, "global_step": 116570, "epoch": 2775} {"train_loss": -6.476171493530273, "global_step": 116571, "epoch": 2775} {"train_loss": -6.514202117919922, "global_step": 116572, "epoch": 2775} {"train_loss": -6.571834087371826, "global_step": 116573, "epoch": 2775} {"train_loss": -6.626821041107178, "global_step": 116574, "epoch": 2775} {"train_loss": -6.463056564331055, "global_step": 116575, "epoch": 2775} {"train_loss": -6.64015531539917, "global_step": 116576, "epoch": 2775} {"train_loss": -6.493471145629883, "global_step": 116577, "epoch": 2775} {"train_loss": -6.549221038818359, "global_step": 116578, "epoch": 2775} {"train_loss": -6.497042655944824, "global_step": 116579, "epoch": 2775} {"train_loss": -6.579691410064697, "global_step": 116580, "epoch": 2775} {"train_loss": -6.582162857055664, "global_step": 116581, "epoch": 2775} {"train_loss": -6.536639213562012, "global_step": 116582, "epoch": 2775} {"train_loss": -6.604340076446533, "global_step": 116583, "epoch": 2775} {"train_loss": -6.527665138244629, "global_step": 116584, "epoch": 2775} {"train_loss": -6.609776496887207, "global_step": 116585, "epoch": 2775} {"train_loss": -6.520419597625732, "global_step": 116586, "epoch": 2775} {"train_loss": -6.457376480102539, "global_step": 116587, "epoch": 2775} {"train_loss": -6.445709705352783, "global_step": 116588, "epoch": 2775} {"train_loss": -6.479344367980957, "global_step": 116589, "epoch": 2775} {"train_loss": -6.597146034240723, "global_step": 116590, "epoch": 2775} {"train_loss": -6.517032963888986, "global_step": 116591, "epoch": 2775, "val_loss": 67902.7578125} {"train_loss": -6.54755973815918, "global_step": 116592, "epoch": 2776} {"train_loss": -6.532169342041016, "global_step": 116593, "epoch": 2776} {"train_loss": -6.443293571472168, "global_step": 116594, "epoch": 2776} {"train_loss": -6.5414204597473145, "global_step": 116595, "epoch": 2776} {"train_loss": -6.653249740600586, "global_step": 116596, "epoch": 2776} {"train_loss": -6.556292533874512, "global_step": 116597, "epoch": 2776} {"train_loss": -6.454346179962158, "global_step": 116598, "epoch": 2776} {"train_loss": -6.450584411621094, "global_step": 116599, "epoch": 2776} {"train_loss": -6.576054573059082, "global_step": 116600, "epoch": 2776} {"train_loss": -6.527483940124512, "global_step": 116601, "epoch": 2776} {"train_loss": -6.557185649871826, "global_step": 116602, "epoch": 2776} {"train_loss": -6.522671222686768, "global_step": 116603, "epoch": 2776} {"train_loss": -6.541380882263184, "global_step": 116604, "epoch": 2776} {"train_loss": -6.532038688659668, "global_step": 116605, "epoch": 2776} {"train_loss": -6.574164867401123, "global_step": 116606, "epoch": 2776} {"train_loss": -6.532446384429932, "global_step": 116607, "epoch": 2776} {"train_loss": -6.622670650482178, "global_step": 116608, "epoch": 2776} {"train_loss": -6.546191215515137, "global_step": 116609, "epoch": 2776} {"train_loss": -6.559887409210205, "global_step": 116610, "epoch": 2776} {"train_loss": -6.456727027893066, "global_step": 116611, "epoch": 2776} {"train_loss": -6.483438491821289, "global_step": 116612, "epoch": 2776} {"train_loss": -6.536137104034424, "global_step": 116613, "epoch": 2776} {"train_loss": -6.549897193908691, "global_step": 116614, "epoch": 2776} {"train_loss": -6.393677711486816, "global_step": 116615, "epoch": 2776} {"train_loss": -6.529370307922363, "global_step": 116616, "epoch": 2776} {"train_loss": -6.549476146697998, "global_step": 116617, "epoch": 2776} {"train_loss": -6.442319869995117, "global_step": 116618, "epoch": 2776} {"train_loss": -6.379325866699219, "global_step": 116619, "epoch": 2776} {"train_loss": -6.56759786605835, "global_step": 116620, "epoch": 2776} {"train_loss": -6.413791656494141, "global_step": 116621, "epoch": 2776} {"train_loss": -6.411638259887695, "global_step": 116622, "epoch": 2776} {"train_loss": -6.527865886688232, "global_step": 116623, "epoch": 2776} {"train_loss": -6.432592391967773, "global_step": 116624, "epoch": 2776} {"train_loss": -6.427319526672363, "global_step": 116625, "epoch": 2776} {"train_loss": -6.515703201293945, "global_step": 116626, "epoch": 2776} {"train_loss": -6.507481575012207, "global_step": 116627, "epoch": 2776} {"train_loss": -6.438823223114014, "global_step": 116628, "epoch": 2776} {"train_loss": -6.508166790008545, "global_step": 116629, "epoch": 2776} {"train_loss": -6.566662311553955, "global_step": 116630, "epoch": 2776} {"train_loss": -6.474626541137695, "global_step": 116631, "epoch": 2776} {"train_loss": -6.531820297241211, "global_step": 116632, "epoch": 2776} {"train_loss": -6.51299406233288, "global_step": 116633, "epoch": 2776, "val_loss": 68023.7578125} {"train_loss": -6.606328010559082, "global_step": 116634, "epoch": 2777} {"train_loss": -6.42836856842041, "global_step": 116635, "epoch": 2777} {"train_loss": -6.4762163162231445, "global_step": 116636, "epoch": 2777} {"train_loss": -6.500210285186768, "global_step": 116637, "epoch": 2777} {"train_loss": -6.540493965148926, "global_step": 116638, "epoch": 2777} {"train_loss": -6.453616142272949, "global_step": 116639, "epoch": 2777} {"train_loss": -6.449175834655762, "global_step": 116640, "epoch": 2777} {"train_loss": -6.534849166870117, "global_step": 116641, "epoch": 2777} {"train_loss": -6.469221115112305, "global_step": 116642, "epoch": 2777} {"train_loss": -6.557165622711182, "global_step": 116643, "epoch": 2777} {"train_loss": -6.482417106628418, "global_step": 116644, "epoch": 2777} {"train_loss": -6.5724287033081055, "global_step": 116645, "epoch": 2777} {"train_loss": -6.556013107299805, "global_step": 116646, "epoch": 2777} {"train_loss": -6.494599342346191, "global_step": 116647, "epoch": 2777} {"train_loss": -6.492224216461182, "global_step": 116648, "epoch": 2777} {"train_loss": -6.463160037994385, "global_step": 116649, "epoch": 2777} {"train_loss": -6.611966133117676, "global_step": 116650, "epoch": 2777} {"train_loss": -6.4752912521362305, "global_step": 116651, "epoch": 2777} {"train_loss": -6.4902663230896, "global_step": 116652, "epoch": 2777} {"train_loss": -6.5898332595825195, "global_step": 116653, "epoch": 2777} {"train_loss": -6.514770984649658, "global_step": 116654, "epoch": 2777} {"train_loss": -6.494708061218262, "global_step": 116655, "epoch": 2777} {"train_loss": -6.487293243408203, "global_step": 116656, "epoch": 2777} {"train_loss": -6.38961124420166, "global_step": 116657, "epoch": 2777} {"train_loss": -6.499271392822266, "global_step": 116658, "epoch": 2777} {"train_loss": -6.534332275390625, "global_step": 116659, "epoch": 2777} {"train_loss": -6.55813455581665, "global_step": 116660, "epoch": 2777} {"train_loss": -6.484978675842285, "global_step": 116661, "epoch": 2777} {"train_loss": -6.503252983093262, "global_step": 116662, "epoch": 2777} {"train_loss": -6.559657573699951, "global_step": 116663, "epoch": 2777} {"train_loss": -6.44842529296875, "global_step": 116664, "epoch": 2777} {"train_loss": -6.518098831176758, "global_step": 116665, "epoch": 2777} {"train_loss": -6.461696624755859, "global_step": 116666, "epoch": 2777} {"train_loss": -6.482867240905762, "global_step": 116667, "epoch": 2777} {"train_loss": -6.561606407165527, "global_step": 116668, "epoch": 2777} {"train_loss": -6.4337921142578125, "global_step": 116669, "epoch": 2777} {"train_loss": -6.47896146774292, "global_step": 116670, "epoch": 2777} {"train_loss": -6.397045612335205, "global_step": 116671, "epoch": 2777} {"train_loss": -6.5514678955078125, "global_step": 116672, "epoch": 2777} {"train_loss": -6.515811920166016, "global_step": 116673, "epoch": 2777} {"train_loss": -6.57621431350708, "global_step": 116674, "epoch": 2777} {"train_loss": -6.505585715884254, "global_step": 116675, "epoch": 2777, "val_loss": 68087.5546875} {"train_loss": -6.471211910247803, "global_step": 116676, "epoch": 2778} {"train_loss": -6.5240654945373535, "global_step": 116677, "epoch": 2778} {"train_loss": -6.537841320037842, "global_step": 116678, "epoch": 2778} {"train_loss": -6.524592399597168, "global_step": 116679, "epoch": 2778} {"train_loss": -6.532282829284668, "global_step": 116680, "epoch": 2778} {"train_loss": -6.592892169952393, "global_step": 116681, "epoch": 2778} {"train_loss": -6.51482629776001, "global_step": 116682, "epoch": 2778} {"train_loss": -6.463274955749512, "global_step": 116683, "epoch": 2778} {"train_loss": -6.5186262130737305, "global_step": 116684, "epoch": 2778} {"train_loss": -6.533159255981445, "global_step": 116685, "epoch": 2778} {"train_loss": -6.614212989807129, "global_step": 116686, "epoch": 2778} {"train_loss": -6.431454658508301, "global_step": 116687, "epoch": 2778} {"train_loss": -6.447134971618652, "global_step": 116688, "epoch": 2778} {"train_loss": -6.471566200256348, "global_step": 116689, "epoch": 2778} {"train_loss": -6.5389814376831055, "global_step": 116690, "epoch": 2778} {"train_loss": -6.537714004516602, "global_step": 116691, "epoch": 2778} {"train_loss": -6.603238105773926, "global_step": 116692, "epoch": 2778} {"train_loss": -6.464174270629883, "global_step": 116693, "epoch": 2778} {"train_loss": -6.453014850616455, "global_step": 116694, "epoch": 2778} {"train_loss": -6.48322868347168, "global_step": 116695, "epoch": 2778} {"train_loss": -6.533300876617432, "global_step": 116696, "epoch": 2778} {"train_loss": -6.648089408874512, "global_step": 116697, "epoch": 2778} {"train_loss": -6.472783088684082, "global_step": 116698, "epoch": 2778} {"train_loss": -6.51316499710083, "global_step": 116699, "epoch": 2778} {"train_loss": -6.593523025512695, "global_step": 116700, "epoch": 2778} {"train_loss": -6.462625026702881, "global_step": 116701, "epoch": 2778} {"train_loss": -6.508861064910889, "global_step": 116702, "epoch": 2778} {"train_loss": -6.587499618530273, "global_step": 116703, "epoch": 2778} {"train_loss": -6.521145820617676, "global_step": 116704, "epoch": 2778} {"train_loss": -6.363142013549805, "global_step": 116705, "epoch": 2778} {"train_loss": -6.464825630187988, "global_step": 116706, "epoch": 2778} {"train_loss": -6.495299339294434, "global_step": 116707, "epoch": 2778} {"train_loss": -6.480139255523682, "global_step": 116708, "epoch": 2778} {"train_loss": -6.58164119720459, "global_step": 116709, "epoch": 2778} {"train_loss": -6.460279941558838, "global_step": 116710, "epoch": 2778} {"train_loss": -6.579279899597168, "global_step": 116711, "epoch": 2778} {"train_loss": -6.621214866638184, "global_step": 116712, "epoch": 2778} {"train_loss": -6.37359619140625, "global_step": 116713, "epoch": 2778} {"train_loss": -6.484492301940918, "global_step": 116714, "epoch": 2778} {"train_loss": -6.475558280944824, "global_step": 116715, "epoch": 2778} {"train_loss": -6.441833019256592, "global_step": 116716, "epoch": 2778} {"train_loss": -6.507826021739414, "global_step": 116717, "epoch": 2778, "val_loss": 68040.1796875} {"train_loss": -6.4778947830200195, "global_step": 116718, "epoch": 2779} {"train_loss": -6.4673357009887695, "global_step": 116719, "epoch": 2779} {"train_loss": -6.427768707275391, "global_step": 116720, "epoch": 2779} {"train_loss": -6.493865013122559, "global_step": 116721, "epoch": 2779} {"train_loss": -6.442338943481445, "global_step": 116722, "epoch": 2779} {"train_loss": -6.573049068450928, "global_step": 116723, "epoch": 2779} {"train_loss": -6.434258460998535, "global_step": 116724, "epoch": 2779} {"train_loss": -6.519269943237305, "global_step": 116725, "epoch": 2779} {"train_loss": -6.4367780685424805, "global_step": 116726, "epoch": 2779} {"train_loss": -6.412672996520996, "global_step": 116727, "epoch": 2779} {"train_loss": -6.462510585784912, "global_step": 116728, "epoch": 2779} {"train_loss": -6.4779887199401855, "global_step": 116729, "epoch": 2779} {"train_loss": -6.469866752624512, "global_step": 116730, "epoch": 2779} {"train_loss": -6.490778923034668, "global_step": 116731, "epoch": 2779} {"train_loss": -6.471508026123047, "global_step": 116732, "epoch": 2779} {"train_loss": -6.308716773986816, "global_step": 116733, "epoch": 2779} {"train_loss": -6.408787250518799, "global_step": 116734, "epoch": 2779} {"train_loss": -6.425328254699707, "global_step": 116735, "epoch": 2779} {"train_loss": -6.392797946929932, "global_step": 116736, "epoch": 2779} {"train_loss": -6.534454345703125, "global_step": 116737, "epoch": 2779} {"train_loss": -6.4152021408081055, "global_step": 116738, "epoch": 2779} {"train_loss": -6.517563819885254, "global_step": 116739, "epoch": 2779} {"train_loss": -6.408843040466309, "global_step": 116740, "epoch": 2779} {"train_loss": -6.475620269775391, "global_step": 116741, "epoch": 2779} {"train_loss": -6.554220199584961, "global_step": 116742, "epoch": 2779} {"train_loss": -6.4651055335998535, "global_step": 116743, "epoch": 2779} {"train_loss": -6.5693464279174805, "global_step": 116744, "epoch": 2779} {"train_loss": -6.424391746520996, "global_step": 116745, "epoch": 2779} {"train_loss": -6.3884501457214355, "global_step": 116746, "epoch": 2779} {"train_loss": -6.3969621658325195, "global_step": 116747, "epoch": 2779} {"train_loss": -6.497229099273682, "global_step": 116748, "epoch": 2779} {"train_loss": -6.3744120597839355, "global_step": 116749, "epoch": 2779} {"train_loss": -6.383600234985352, "global_step": 116750, "epoch": 2779} {"train_loss": -6.482548713684082, "global_step": 116751, "epoch": 2779} {"train_loss": -6.546063423156738, "global_step": 116752, "epoch": 2779} {"train_loss": -6.552456378936768, "global_step": 116753, "epoch": 2779} {"train_loss": -6.45015287399292, "global_step": 116754, "epoch": 2779} {"train_loss": -6.498010635375977, "global_step": 116755, "epoch": 2779} {"train_loss": -6.422915935516357, "global_step": 116756, "epoch": 2779} {"train_loss": -6.548504829406738, "global_step": 116757, "epoch": 2779} {"train_loss": -6.528812408447266, "global_step": 116758, "epoch": 2779} {"train_loss": -6.465956710633778, "global_step": 116759, "epoch": 2779, "val_loss": 67950.8359375} {"train_loss": -6.47895622253418, "global_step": 116760, "epoch": 2780} {"train_loss": -6.447117328643799, "global_step": 116761, "epoch": 2780} {"train_loss": -6.365880012512207, "global_step": 116762, "epoch": 2780} {"train_loss": -6.385505199432373, "global_step": 116763, "epoch": 2780} {"train_loss": -6.455287933349609, "global_step": 116764, "epoch": 2780} {"train_loss": -6.534112930297852, "global_step": 116765, "epoch": 2780} {"train_loss": -6.43411111831665, "global_step": 116766, "epoch": 2780} {"train_loss": -6.443462371826172, "global_step": 116767, "epoch": 2780} {"train_loss": -6.441489219665527, "global_step": 116768, "epoch": 2780} {"train_loss": -6.601518630981445, "global_step": 116769, "epoch": 2780} {"train_loss": -6.540991306304932, "global_step": 116770, "epoch": 2780} {"train_loss": -6.362753391265869, "global_step": 116771, "epoch": 2780} {"train_loss": -6.577061176300049, "global_step": 116772, "epoch": 2780} {"train_loss": -6.467113971710205, "global_step": 116773, "epoch": 2780} {"train_loss": -6.434094429016113, "global_step": 116774, "epoch": 2780} {"train_loss": -6.574550628662109, "global_step": 116775, "epoch": 2780} {"train_loss": -6.497370719909668, "global_step": 116776, "epoch": 2780} {"train_loss": -6.505002021789551, "global_step": 116777, "epoch": 2780} {"train_loss": -6.631740093231201, "global_step": 116778, "epoch": 2780} {"train_loss": -6.522275924682617, "global_step": 116779, "epoch": 2780} {"train_loss": -6.488754749298096, "global_step": 116780, "epoch": 2780} {"train_loss": -6.521553039550781, "global_step": 116781, "epoch": 2780} {"train_loss": -6.41279935836792, "global_step": 116782, "epoch": 2780} {"train_loss": -6.437872886657715, "global_step": 116783, "epoch": 2780} {"train_loss": -6.544059753417969, "global_step": 116784, "epoch": 2780} {"train_loss": -6.474956035614014, "global_step": 116785, "epoch": 2780} {"train_loss": -6.4512858390808105, "global_step": 116786, "epoch": 2780} {"train_loss": -6.490454196929932, "global_step": 116787, "epoch": 2780} {"train_loss": -6.408679962158203, "global_step": 116788, "epoch": 2780} {"train_loss": -6.394916534423828, "global_step": 116789, "epoch": 2780} {"train_loss": -6.462060928344727, "global_step": 116790, "epoch": 2780} {"train_loss": -6.440629959106445, "global_step": 116791, "epoch": 2780} {"train_loss": -6.338840484619141, "global_step": 116792, "epoch": 2780} {"train_loss": -6.380533218383789, "global_step": 116793, "epoch": 2780} {"train_loss": -6.353049278259277, "global_step": 116794, "epoch": 2780} {"train_loss": -6.255316734313965, "global_step": 116795, "epoch": 2780} {"train_loss": -6.587333679199219, "global_step": 116796, "epoch": 2780} {"train_loss": -6.33754825592041, "global_step": 116797, "epoch": 2780} {"train_loss": -6.495604515075684, "global_step": 116798, "epoch": 2780} {"train_loss": -6.4401092529296875, "global_step": 116799, "epoch": 2780} {"train_loss": -6.455995559692383, "global_step": 116800, "epoch": 2780} {"train_loss": -6.459886789321899, "global_step": 116801, "epoch": 2780, "val_loss": 68304.6796875} {"train_loss": -6.312353134155273, "global_step": 116802, "epoch": 2781} {"train_loss": -6.364228248596191, "global_step": 116803, "epoch": 2781} {"train_loss": -6.454216957092285, "global_step": 116804, "epoch": 2781} {"train_loss": -6.510210037231445, "global_step": 116805, "epoch": 2781} {"train_loss": -6.463666915893555, "global_step": 116806, "epoch": 2781} {"train_loss": -6.403805732727051, "global_step": 116807, "epoch": 2781} {"train_loss": -6.299849033355713, "global_step": 116808, "epoch": 2781} {"train_loss": -6.452426910400391, "global_step": 116809, "epoch": 2781} {"train_loss": -6.528232574462891, "global_step": 116810, "epoch": 2781} {"train_loss": -6.389560699462891, "global_step": 116811, "epoch": 2781} {"train_loss": -6.490123748779297, "global_step": 116812, "epoch": 2781} {"train_loss": -6.2755255699157715, "global_step": 116813, "epoch": 2781} {"train_loss": -6.445468902587891, "global_step": 116814, "epoch": 2781} {"train_loss": -6.336474418640137, "global_step": 116815, "epoch": 2781} {"train_loss": -6.446124076843262, "global_step": 116816, "epoch": 2781} {"train_loss": -6.302570343017578, "global_step": 116817, "epoch": 2781} {"train_loss": -6.461979866027832, "global_step": 116818, "epoch": 2781} {"train_loss": -6.41152811050415, "global_step": 116819, "epoch": 2781} {"train_loss": -6.407221794128418, "global_step": 116820, "epoch": 2781} {"train_loss": -6.4375481605529785, "global_step": 116821, "epoch": 2781} {"train_loss": -6.472959518432617, "global_step": 116822, "epoch": 2781} {"train_loss": -6.452691078186035, "global_step": 116823, "epoch": 2781} {"train_loss": -6.492494583129883, "global_step": 116824, "epoch": 2781} {"train_loss": -6.293157577514648, "global_step": 116825, "epoch": 2781} {"train_loss": -6.4857072830200195, "global_step": 116826, "epoch": 2781} {"train_loss": -6.4809160232543945, "global_step": 116827, "epoch": 2781} {"train_loss": -6.271477699279785, "global_step": 116828, "epoch": 2781} {"train_loss": -6.5847368240356445, "global_step": 116829, "epoch": 2781} {"train_loss": -6.304206848144531, "global_step": 116830, "epoch": 2781} {"train_loss": -6.39820671081543, "global_step": 116831, "epoch": 2781} {"train_loss": -6.431621551513672, "global_step": 116832, "epoch": 2781} {"train_loss": -6.405561923980713, "global_step": 116833, "epoch": 2781} {"train_loss": -6.442619800567627, "global_step": 116834, "epoch": 2781} {"train_loss": -6.351767539978027, "global_step": 116835, "epoch": 2781} {"train_loss": -6.449749946594238, "global_step": 116836, "epoch": 2781} {"train_loss": -6.391435623168945, "global_step": 116837, "epoch": 2781} {"train_loss": -6.481786727905273, "global_step": 116838, "epoch": 2781} {"train_loss": -6.432332992553711, "global_step": 116839, "epoch": 2781} {"train_loss": -6.471785068511963, "global_step": 116840, "epoch": 2781} {"train_loss": -6.408970355987549, "global_step": 116841, "epoch": 2781} {"train_loss": -6.536993026733398, "global_step": 116842, "epoch": 2781} {"train_loss": -6.421021359307425, "global_step": 116843, "epoch": 2781, "val_loss": 67743.7578125} {"train_loss": -6.660586357116699, "global_step": 116844, "epoch": 2782} {"train_loss": -6.570021152496338, "global_step": 116845, "epoch": 2782} {"train_loss": -6.55234432220459, "global_step": 116846, "epoch": 2782} {"train_loss": -6.497909069061279, "global_step": 116847, "epoch": 2782} {"train_loss": -6.4362311363220215, "global_step": 116848, "epoch": 2782} {"train_loss": -6.597653388977051, "global_step": 116849, "epoch": 2782} {"train_loss": -6.586882591247559, "global_step": 116850, "epoch": 2782} {"train_loss": -6.584561824798584, "global_step": 116851, "epoch": 2782} {"train_loss": -6.476306438446045, "global_step": 116852, "epoch": 2782} {"train_loss": -6.483484268188477, "global_step": 116853, "epoch": 2782} {"train_loss": -6.583314895629883, "global_step": 116854, "epoch": 2782} {"train_loss": -6.462020397186279, "global_step": 116855, "epoch": 2782} {"train_loss": -6.542934417724609, "global_step": 116856, "epoch": 2782} {"train_loss": -6.496532440185547, "global_step": 116857, "epoch": 2782} {"train_loss": -6.523843288421631, "global_step": 116858, "epoch": 2782} {"train_loss": -6.48608922958374, "global_step": 116859, "epoch": 2782} {"train_loss": -6.614501476287842, "global_step": 116860, "epoch": 2782} {"train_loss": -6.561941146850586, "global_step": 116861, "epoch": 2782} {"train_loss": -6.551980018615723, "global_step": 116862, "epoch": 2782} {"train_loss": -6.446750640869141, "global_step": 116863, "epoch": 2782} {"train_loss": -6.456135272979736, "global_step": 116864, "epoch": 2782} {"train_loss": -6.528591156005859, "global_step": 116865, "epoch": 2782} {"train_loss": -6.593453407287598, "global_step": 116866, "epoch": 2782} {"train_loss": -6.57309627532959, "global_step": 116867, "epoch": 2782} {"train_loss": -6.464203834533691, "global_step": 116868, "epoch": 2782} {"train_loss": -6.493675708770752, "global_step": 116869, "epoch": 2782} {"train_loss": -6.544406890869141, "global_step": 116870, "epoch": 2782} {"train_loss": -6.469924449920654, "global_step": 116871, "epoch": 2782} {"train_loss": -6.537141799926758, "global_step": 116872, "epoch": 2782} {"train_loss": -6.563488006591797, "global_step": 116873, "epoch": 2782} {"train_loss": -6.481442451477051, "global_step": 116874, "epoch": 2782} {"train_loss": -6.567741870880127, "global_step": 116875, "epoch": 2782} {"train_loss": -6.477950096130371, "global_step": 116876, "epoch": 2782} {"train_loss": -6.607176303863525, "global_step": 116877, "epoch": 2782} {"train_loss": -6.482635498046875, "global_step": 116878, "epoch": 2782} {"train_loss": -6.517606258392334, "global_step": 116879, "epoch": 2782} {"train_loss": -6.395744323730469, "global_step": 116880, "epoch": 2782} {"train_loss": -6.346134185791016, "global_step": 116881, "epoch": 2782} {"train_loss": -6.531393051147461, "global_step": 116882, "epoch": 2782} {"train_loss": -6.570030212402344, "global_step": 116883, "epoch": 2782} {"train_loss": -6.507876396179199, "global_step": 116884, "epoch": 2782} {"train_loss": -6.521015825725737, "global_step": 116885, "epoch": 2782, "val_loss": 67801.9375} {"train_loss": -6.524754524230957, "global_step": 116886, "epoch": 2783} {"train_loss": -6.429682731628418, "global_step": 116887, "epoch": 2783} {"train_loss": -6.531661033630371, "global_step": 116888, "epoch": 2783} {"train_loss": -6.541179656982422, "global_step": 116889, "epoch": 2783} {"train_loss": -6.392421722412109, "global_step": 116890, "epoch": 2783} {"train_loss": -6.560806751251221, "global_step": 116891, "epoch": 2783} {"train_loss": -6.570680141448975, "global_step": 116892, "epoch": 2783} {"train_loss": -6.435924053192139, "global_step": 116893, "epoch": 2783} {"train_loss": -6.459776401519775, "global_step": 116894, "epoch": 2783} {"train_loss": -6.507322311401367, "global_step": 116895, "epoch": 2783} {"train_loss": -6.3717360496521, "global_step": 116896, "epoch": 2783} {"train_loss": -6.500347137451172, "global_step": 116897, "epoch": 2783} {"train_loss": -6.554194927215576, "global_step": 116898, "epoch": 2783} {"train_loss": -6.40775203704834, "global_step": 116899, "epoch": 2783} {"train_loss": -6.380155563354492, "global_step": 116900, "epoch": 2783} {"train_loss": -6.535574913024902, "global_step": 116901, "epoch": 2783} {"train_loss": -6.488325119018555, "global_step": 116902, "epoch": 2783} {"train_loss": -6.468491554260254, "global_step": 116903, "epoch": 2783} {"train_loss": -6.434671401977539, "global_step": 116904, "epoch": 2783} {"train_loss": -6.467128753662109, "global_step": 116905, "epoch": 2783} {"train_loss": -6.616300582885742, "global_step": 116906, "epoch": 2783} {"train_loss": -6.445063591003418, "global_step": 116907, "epoch": 2783} {"train_loss": -6.381044864654541, "global_step": 116908, "epoch": 2783} {"train_loss": -6.424961090087891, "global_step": 116909, "epoch": 2783} {"train_loss": -6.41171932220459, "global_step": 116910, "epoch": 2783} {"train_loss": -6.400411605834961, "global_step": 116911, "epoch": 2783} {"train_loss": -6.637171745300293, "global_step": 116912, "epoch": 2783} {"train_loss": -6.420375823974609, "global_step": 116913, "epoch": 2783} {"train_loss": -6.4903788566589355, "global_step": 116914, "epoch": 2783} {"train_loss": -6.503673553466797, "global_step": 116915, "epoch": 2783} {"train_loss": -6.464332103729248, "global_step": 116916, "epoch": 2783} {"train_loss": -6.572531223297119, "global_step": 116917, "epoch": 2783} {"train_loss": -6.501662731170654, "global_step": 116918, "epoch": 2783} {"train_loss": -6.490947723388672, "global_step": 116919, "epoch": 2783} {"train_loss": -6.555280685424805, "global_step": 116920, "epoch": 2783} {"train_loss": -6.392351150512695, "global_step": 116921, "epoch": 2783} {"train_loss": -6.545920372009277, "global_step": 116922, "epoch": 2783} {"train_loss": -6.5340118408203125, "global_step": 116923, "epoch": 2783} {"train_loss": -6.480294704437256, "global_step": 116924, "epoch": 2783} {"train_loss": -6.561722278594971, "global_step": 116925, "epoch": 2783} {"train_loss": -6.510364532470703, "global_step": 116926, "epoch": 2783} {"train_loss": -6.483001754397438, "global_step": 116927, "epoch": 2783, "val_loss": 68025.734375} {"train_loss": -6.501585960388184, "global_step": 116928, "epoch": 2784} {"train_loss": -6.515135765075684, "global_step": 116929, "epoch": 2784} {"train_loss": -6.558345794677734, "global_step": 116930, "epoch": 2784} {"train_loss": -6.545818328857422, "global_step": 116931, "epoch": 2784} {"train_loss": -6.436221122741699, "global_step": 116932, "epoch": 2784} {"train_loss": -6.542848587036133, "global_step": 116933, "epoch": 2784} {"train_loss": -6.501646041870117, "global_step": 116934, "epoch": 2784} {"train_loss": -6.511159896850586, "global_step": 116935, "epoch": 2784} {"train_loss": -6.478961944580078, "global_step": 116936, "epoch": 2784} {"train_loss": -6.5412139892578125, "global_step": 116937, "epoch": 2784} {"train_loss": -6.5019731521606445, "global_step": 116938, "epoch": 2784} {"train_loss": -6.502767562866211, "global_step": 116939, "epoch": 2784} {"train_loss": -6.557806015014648, "global_step": 116940, "epoch": 2784} {"train_loss": -6.627868175506592, "global_step": 116941, "epoch": 2784} {"train_loss": -6.533720970153809, "global_step": 116942, "epoch": 2784} {"train_loss": -6.402064323425293, "global_step": 116943, "epoch": 2784} {"train_loss": -6.537059783935547, "global_step": 116944, "epoch": 2784} {"train_loss": -6.489190101623535, "global_step": 116945, "epoch": 2784} {"train_loss": -6.495078086853027, "global_step": 116946, "epoch": 2784} {"train_loss": -6.486605167388916, "global_step": 116947, "epoch": 2784} {"train_loss": -6.469356060028076, "global_step": 116948, "epoch": 2784} {"train_loss": -6.503954887390137, "global_step": 116949, "epoch": 2784} {"train_loss": -6.470646381378174, "global_step": 116950, "epoch": 2784} {"train_loss": -6.483484745025635, "global_step": 116951, "epoch": 2784} {"train_loss": -6.573328971862793, "global_step": 116952, "epoch": 2784} {"train_loss": -6.396337032318115, "global_step": 116953, "epoch": 2784} {"train_loss": -6.456998825073242, "global_step": 116954, "epoch": 2784} {"train_loss": -6.507277488708496, "global_step": 116955, "epoch": 2784} {"train_loss": -6.346700668334961, "global_step": 116956, "epoch": 2784} {"train_loss": -6.423887252807617, "global_step": 116957, "epoch": 2784} {"train_loss": -6.44381046295166, "global_step": 116958, "epoch": 2784} {"train_loss": -6.471076011657715, "global_step": 116959, "epoch": 2784} {"train_loss": -6.541929244995117, "global_step": 116960, "epoch": 2784} {"train_loss": -6.449276924133301, "global_step": 116961, "epoch": 2784} {"train_loss": -6.529162406921387, "global_step": 116962, "epoch": 2784} {"train_loss": -6.375767707824707, "global_step": 116963, "epoch": 2784} {"train_loss": -6.446822166442871, "global_step": 116964, "epoch": 2784} {"train_loss": -6.598973751068115, "global_step": 116965, "epoch": 2784} {"train_loss": -6.333115100860596, "global_step": 116966, "epoch": 2784} {"train_loss": -6.504824638366699, "global_step": 116967, "epoch": 2784} {"train_loss": -6.401436805725098, "global_step": 116968, "epoch": 2784} {"train_loss": -6.486975442795527, "global_step": 116969, "epoch": 2784, "val_loss": 67962.4609375} {"train_loss": -6.430864334106445, "global_step": 116970, "epoch": 2785} {"train_loss": -6.486002445220947, "global_step": 116971, "epoch": 2785} {"train_loss": -6.427088737487793, "global_step": 116972, "epoch": 2785} {"train_loss": -6.503006935119629, "global_step": 116973, "epoch": 2785} {"train_loss": -6.333207130432129, "global_step": 116974, "epoch": 2785} {"train_loss": -6.566222190856934, "global_step": 116975, "epoch": 2785} {"train_loss": -6.48710298538208, "global_step": 116976, "epoch": 2785} {"train_loss": -6.488141059875488, "global_step": 116977, "epoch": 2785} {"train_loss": -6.514226913452148, "global_step": 116978, "epoch": 2785} {"train_loss": -6.525094032287598, "global_step": 116979, "epoch": 2785} {"train_loss": -6.515380859375, "global_step": 116980, "epoch": 2785} {"train_loss": -6.622071266174316, "global_step": 116981, "epoch": 2785} {"train_loss": -6.51145601272583, "global_step": 116982, "epoch": 2785} {"train_loss": -6.453925609588623, "global_step": 116983, "epoch": 2785} {"train_loss": -6.605878829956055, "global_step": 116984, "epoch": 2785} {"train_loss": -6.433808326721191, "global_step": 116985, "epoch": 2785} {"train_loss": -6.477560997009277, "global_step": 116986, "epoch": 2785} {"train_loss": -6.495125770568848, "global_step": 116987, "epoch": 2785} {"train_loss": -6.534246444702148, "global_step": 116988, "epoch": 2785} {"train_loss": -6.605029106140137, "global_step": 116989, "epoch": 2785} {"train_loss": -6.59895658493042, "global_step": 116990, "epoch": 2785} {"train_loss": -6.457420825958252, "global_step": 116991, "epoch": 2785} {"train_loss": -6.5714497566223145, "global_step": 116992, "epoch": 2785} {"train_loss": -6.522444725036621, "global_step": 116993, "epoch": 2785} {"train_loss": -6.60054874420166, "global_step": 116994, "epoch": 2785} {"train_loss": -6.52925968170166, "global_step": 116995, "epoch": 2785} {"train_loss": -6.542720794677734, "global_step": 116996, "epoch": 2785} {"train_loss": -6.511291980743408, "global_step": 116997, "epoch": 2785} {"train_loss": -6.504219055175781, "global_step": 116998, "epoch": 2785} {"train_loss": -6.459961414337158, "global_step": 116999, "epoch": 2785} {"train_loss": -6.459974765777588, "global_step": 117000, "epoch": 2785} {"train_loss": -6.463418960571289, "global_step": 117001, "epoch": 2785} {"train_loss": -6.584173202514648, "global_step": 117002, "epoch": 2785} {"train_loss": -6.527688503265381, "global_step": 117003, "epoch": 2785} {"train_loss": -6.641836166381836, "global_step": 117004, "epoch": 2785} {"train_loss": -6.5426249504089355, "global_step": 117005, "epoch": 2785} {"train_loss": -6.6203718185424805, "global_step": 117006, "epoch": 2785} {"train_loss": -6.5083394050598145, "global_step": 117007, "epoch": 2785} {"train_loss": -6.466519832611084, "global_step": 117008, "epoch": 2785} {"train_loss": -6.453258514404297, "global_step": 117009, "epoch": 2785} {"train_loss": -6.56756591796875, "global_step": 117010, "epoch": 2785} {"train_loss": -6.520323469525292, "global_step": 117011, "epoch": 2785, "val_loss": 68006.5625} {"train_loss": -6.472557544708252, "global_step": 117012, "epoch": 2786} {"train_loss": -6.405759811401367, "global_step": 117013, "epoch": 2786} {"train_loss": -6.475668430328369, "global_step": 117014, "epoch": 2786} {"train_loss": -6.402362823486328, "global_step": 117015, "epoch": 2786} {"train_loss": -6.516131401062012, "global_step": 117016, "epoch": 2786} {"train_loss": -6.7146687507629395, "global_step": 117017, "epoch": 2786} {"train_loss": -6.286557674407959, "global_step": 117018, "epoch": 2786} {"train_loss": -6.4952802658081055, "global_step": 117019, "epoch": 2786} {"train_loss": -6.551582336425781, "global_step": 117020, "epoch": 2786} {"train_loss": -6.57639217376709, "global_step": 117021, "epoch": 2786} {"train_loss": -6.53294563293457, "global_step": 117022, "epoch": 2786} {"train_loss": -6.585619926452637, "global_step": 117023, "epoch": 2786} {"train_loss": -6.6233811378479, "global_step": 117024, "epoch": 2786} {"train_loss": -6.486477851867676, "global_step": 117025, "epoch": 2786} {"train_loss": -6.488101959228516, "global_step": 117026, "epoch": 2786} {"train_loss": -6.621014595031738, "global_step": 117027, "epoch": 2786} {"train_loss": -6.551305770874023, "global_step": 117028, "epoch": 2786} {"train_loss": -6.574853897094727, "global_step": 117029, "epoch": 2786} {"train_loss": -6.600501537322998, "global_step": 117030, "epoch": 2786} {"train_loss": -6.59251594543457, "global_step": 117031, "epoch": 2786} {"train_loss": -6.485747337341309, "global_step": 117032, "epoch": 2786} {"train_loss": -6.590759754180908, "global_step": 117033, "epoch": 2786} {"train_loss": -6.470419406890869, "global_step": 117034, "epoch": 2786} {"train_loss": -6.544441223144531, "global_step": 117035, "epoch": 2786} {"train_loss": -6.466525077819824, "global_step": 117036, "epoch": 2786} {"train_loss": -6.528645992279053, "global_step": 117037, "epoch": 2786} {"train_loss": -6.603601455688477, "global_step": 117038, "epoch": 2786} {"train_loss": -6.605628967285156, "global_step": 117039, "epoch": 2786} {"train_loss": -6.453315734863281, "global_step": 117040, "epoch": 2786} {"train_loss": -6.5777106285095215, "global_step": 117041, "epoch": 2786} {"train_loss": -6.4754228591918945, "global_step": 117042, "epoch": 2786} {"train_loss": -6.386754989624023, "global_step": 117043, "epoch": 2786} {"train_loss": -6.481295108795166, "global_step": 117044, "epoch": 2786} {"train_loss": -6.495301246643066, "global_step": 117045, "epoch": 2786} {"train_loss": -6.504005432128906, "global_step": 117046, "epoch": 2786} {"train_loss": -6.545881271362305, "global_step": 117047, "epoch": 2786} {"train_loss": -6.516995429992676, "global_step": 117048, "epoch": 2786} {"train_loss": -6.5268120765686035, "global_step": 117049, "epoch": 2786} {"train_loss": -6.405884265899658, "global_step": 117050, "epoch": 2786} {"train_loss": -6.476332664489746, "global_step": 117051, "epoch": 2786} {"train_loss": -6.600647926330566, "global_step": 117052, "epoch": 2786} {"train_loss": -6.519739968436105, "global_step": 117053, "epoch": 2786, "val_loss": 68013.875} {"train_loss": -6.5637311935424805, "global_step": 117054, "epoch": 2787} {"train_loss": -6.472740173339844, "global_step": 117055, "epoch": 2787} {"train_loss": -6.573094844818115, "global_step": 117056, "epoch": 2787} {"train_loss": -6.55345344543457, "global_step": 117057, "epoch": 2787} {"train_loss": -6.500611782073975, "global_step": 117058, "epoch": 2787} {"train_loss": -6.53584098815918, "global_step": 117059, "epoch": 2787} {"train_loss": -6.431283950805664, "global_step": 117060, "epoch": 2787} {"train_loss": -6.508252143859863, "global_step": 117061, "epoch": 2787} {"train_loss": -6.461853504180908, "global_step": 117062, "epoch": 2787} {"train_loss": -6.582287788391113, "global_step": 117063, "epoch": 2787} {"train_loss": -6.39373779296875, "global_step": 117064, "epoch": 2787} {"train_loss": -6.406521797180176, "global_step": 117065, "epoch": 2787} {"train_loss": -6.473603248596191, "global_step": 117066, "epoch": 2787} {"train_loss": -6.488349914550781, "global_step": 117067, "epoch": 2787} {"train_loss": -6.326388359069824, "global_step": 117068, "epoch": 2787} {"train_loss": -6.43626594543457, "global_step": 117069, "epoch": 2787} {"train_loss": -6.372625827789307, "global_step": 117070, "epoch": 2787} {"train_loss": -6.348812580108643, "global_step": 117071, "epoch": 2787} {"train_loss": -6.414477348327637, "global_step": 117072, "epoch": 2787} {"train_loss": -6.531111717224121, "global_step": 117073, "epoch": 2787} {"train_loss": -6.459388732910156, "global_step": 117074, "epoch": 2787} {"train_loss": -6.425901412963867, "global_step": 117075, "epoch": 2787} {"train_loss": -6.36545991897583, "global_step": 117076, "epoch": 2787} {"train_loss": -6.39143705368042, "global_step": 117077, "epoch": 2787} {"train_loss": -6.428735733032227, "global_step": 117078, "epoch": 2787} {"train_loss": -6.354676246643066, "global_step": 117079, "epoch": 2787} {"train_loss": -6.457449913024902, "global_step": 117080, "epoch": 2787} {"train_loss": -6.294938087463379, "global_step": 117081, "epoch": 2787} {"train_loss": -6.4798173904418945, "global_step": 117082, "epoch": 2787} {"train_loss": -6.378850936889648, "global_step": 117083, "epoch": 2787} {"train_loss": -6.392001152038574, "global_step": 117084, "epoch": 2787} {"train_loss": -6.465461254119873, "global_step": 117085, "epoch": 2787} {"train_loss": -6.371170520782471, "global_step": 117086, "epoch": 2787} {"train_loss": -6.429376125335693, "global_step": 117087, "epoch": 2787} {"train_loss": -6.646486282348633, "global_step": 117088, "epoch": 2787} {"train_loss": -6.468166351318359, "global_step": 117089, "epoch": 2787} {"train_loss": -6.375011444091797, "global_step": 117090, "epoch": 2787} {"train_loss": -6.424263000488281, "global_step": 117091, "epoch": 2787} {"train_loss": -6.320061683654785, "global_step": 117092, "epoch": 2787} {"train_loss": -6.328867435455322, "global_step": 117093, "epoch": 2787} {"train_loss": -6.451836109161377, "global_step": 117094, "epoch": 2787} {"train_loss": -6.440578165508452, "global_step": 117095, "epoch": 2787, "val_loss": 68077.0546875} {"train_loss": -6.410275936126709, "global_step": 117096, "epoch": 2788} {"train_loss": -6.298357009887695, "global_step": 117097, "epoch": 2788} {"train_loss": -6.415050983428955, "global_step": 117098, "epoch": 2788} {"train_loss": -6.390789985656738, "global_step": 117099, "epoch": 2788} {"train_loss": -6.3429155349731445, "global_step": 117100, "epoch": 2788} {"train_loss": -6.54593563079834, "global_step": 117101, "epoch": 2788} {"train_loss": -6.380329132080078, "global_step": 117102, "epoch": 2788} {"train_loss": -6.434852123260498, "global_step": 117103, "epoch": 2788} {"train_loss": -6.391602516174316, "global_step": 117104, "epoch": 2788} {"train_loss": -6.52036714553833, "global_step": 117105, "epoch": 2788} {"train_loss": -6.354111194610596, "global_step": 117106, "epoch": 2788} {"train_loss": -6.482283592224121, "global_step": 117107, "epoch": 2788} {"train_loss": -6.467171669006348, "global_step": 117108, "epoch": 2788} {"train_loss": -6.393373489379883, "global_step": 117109, "epoch": 2788} {"train_loss": -6.387142658233643, "global_step": 117110, "epoch": 2788} {"train_loss": -6.356174468994141, "global_step": 117111, "epoch": 2788} {"train_loss": -6.50253438949585, "global_step": 117112, "epoch": 2788} {"train_loss": -6.61124324798584, "global_step": 117113, "epoch": 2788} {"train_loss": -6.461742877960205, "global_step": 117114, "epoch": 2788} {"train_loss": -6.4415388107299805, "global_step": 117115, "epoch": 2788} {"train_loss": -6.49967098236084, "global_step": 117116, "epoch": 2788} {"train_loss": -6.39576530456543, "global_step": 117117, "epoch": 2788} {"train_loss": -6.423820972442627, "global_step": 117118, "epoch": 2788} {"train_loss": -6.531146049499512, "global_step": 117119, "epoch": 2788} {"train_loss": -6.540437698364258, "global_step": 117120, "epoch": 2788} {"train_loss": -6.500575065612793, "global_step": 117121, "epoch": 2788} {"train_loss": -6.510674476623535, "global_step": 117122, "epoch": 2788} {"train_loss": -6.399742603302002, "global_step": 117123, "epoch": 2788} {"train_loss": -6.545783996582031, "global_step": 117124, "epoch": 2788} {"train_loss": -6.596230506896973, "global_step": 117125, "epoch": 2788} {"train_loss": -6.451145172119141, "global_step": 117126, "epoch": 2788} {"train_loss": -6.484330177307129, "global_step": 117127, "epoch": 2788} {"train_loss": -6.6404547691345215, "global_step": 117128, "epoch": 2788} {"train_loss": -6.472238540649414, "global_step": 117129, "epoch": 2788} {"train_loss": -6.66416072845459, "global_step": 117130, "epoch": 2788} {"train_loss": -6.4869384765625, "global_step": 117131, "epoch": 2788} {"train_loss": -6.465329647064209, "global_step": 117132, "epoch": 2788} {"train_loss": -6.642853260040283, "global_step": 117133, "epoch": 2788} {"train_loss": -6.417563438415527, "global_step": 117134, "epoch": 2788} {"train_loss": -6.4404473304748535, "global_step": 117135, "epoch": 2788} {"train_loss": -6.548806667327881, "global_step": 117136, "epoch": 2788} {"train_loss": -6.46965301604498, "global_step": 117137, "epoch": 2788, "val_loss": 68007.640625} {"train_loss": -6.556605339050293, "global_step": 117138, "epoch": 2789} {"train_loss": -6.530573844909668, "global_step": 117139, "epoch": 2789} {"train_loss": -6.679984092712402, "global_step": 117140, "epoch": 2789} {"train_loss": -6.434322834014893, "global_step": 117141, "epoch": 2789} {"train_loss": -6.628267765045166, "global_step": 117142, "epoch": 2789} {"train_loss": -6.707774639129639, "global_step": 117143, "epoch": 2789} {"train_loss": -6.624256134033203, "global_step": 117144, "epoch": 2789} {"train_loss": -6.599293231964111, "global_step": 117145, "epoch": 2789} {"train_loss": -6.491667747497559, "global_step": 117146, "epoch": 2789} {"train_loss": -6.5123443603515625, "global_step": 117147, "epoch": 2789} {"train_loss": -6.599120616912842, "global_step": 117148, "epoch": 2789} {"train_loss": -6.554637908935547, "global_step": 117149, "epoch": 2789} {"train_loss": -6.595911979675293, "global_step": 117150, "epoch": 2789} {"train_loss": -6.564138412475586, "global_step": 117151, "epoch": 2789} {"train_loss": -6.476352214813232, "global_step": 117152, "epoch": 2789} {"train_loss": -6.473133087158203, "global_step": 117153, "epoch": 2789} {"train_loss": -6.5507659912109375, "global_step": 117154, "epoch": 2789} {"train_loss": -6.524563789367676, "global_step": 117155, "epoch": 2789} {"train_loss": -6.644280433654785, "global_step": 117156, "epoch": 2789} {"train_loss": -6.537458419799805, "global_step": 117157, "epoch": 2789} {"train_loss": -6.599591255187988, "global_step": 117158, "epoch": 2789} {"train_loss": -6.525885105133057, "global_step": 117159, "epoch": 2789} {"train_loss": -6.517423629760742, "global_step": 117160, "epoch": 2789} {"train_loss": -6.525221347808838, "global_step": 117161, "epoch": 2789} {"train_loss": -6.608854293823242, "global_step": 117162, "epoch": 2789} {"train_loss": -6.5315070152282715, "global_step": 117163, "epoch": 2789} {"train_loss": -6.5096893310546875, "global_step": 117164, "epoch": 2789} {"train_loss": -6.4521164894104, "global_step": 117165, "epoch": 2789} {"train_loss": -6.5687174797058105, "global_step": 117166, "epoch": 2789} {"train_loss": -6.613038539886475, "global_step": 117167, "epoch": 2789} {"train_loss": -6.47977876663208, "global_step": 117168, "epoch": 2789} {"train_loss": -6.5645952224731445, "global_step": 117169, "epoch": 2789} {"train_loss": -6.5209059715271, "global_step": 117170, "epoch": 2789} {"train_loss": -6.5344953536987305, "global_step": 117171, "epoch": 2789} {"train_loss": -6.468503952026367, "global_step": 117172, "epoch": 2789} {"train_loss": -6.527544021606445, "global_step": 117173, "epoch": 2789} {"train_loss": -6.492999076843262, "global_step": 117174, "epoch": 2789} {"train_loss": -6.444517135620117, "global_step": 117175, "epoch": 2789} {"train_loss": -6.481129169464111, "global_step": 117176, "epoch": 2789} {"train_loss": -6.561221122741699, "global_step": 117177, "epoch": 2789} {"train_loss": -6.452665328979492, "global_step": 117178, "epoch": 2789} {"train_loss": -6.545485167276292, "global_step": 117179, "epoch": 2789, "val_loss": 67745.453125} {"train_loss": -6.479164123535156, "global_step": 117180, "epoch": 2790} {"train_loss": -6.555631637573242, "global_step": 117181, "epoch": 2790} {"train_loss": -6.536616802215576, "global_step": 117182, "epoch": 2790} {"train_loss": -6.391545295715332, "global_step": 117183, "epoch": 2790} {"train_loss": -6.59771728515625, "global_step": 117184, "epoch": 2790} {"train_loss": -6.635593414306641, "global_step": 117185, "epoch": 2790} {"train_loss": -6.4785237312316895, "global_step": 117186, "epoch": 2790} {"train_loss": -6.500252723693848, "global_step": 117187, "epoch": 2790} {"train_loss": -6.5137939453125, "global_step": 117188, "epoch": 2790} {"train_loss": -6.608716011047363, "global_step": 117189, "epoch": 2790} {"train_loss": -6.699332237243652, "global_step": 117190, "epoch": 2790} {"train_loss": -6.537104606628418, "global_step": 117191, "epoch": 2790} {"train_loss": -6.577123165130615, "global_step": 117192, "epoch": 2790} {"train_loss": -6.471821308135986, "global_step": 117193, "epoch": 2790} {"train_loss": -6.559464454650879, "global_step": 117194, "epoch": 2790} {"train_loss": -6.664693355560303, "global_step": 117195, "epoch": 2790} {"train_loss": -6.491523742675781, "global_step": 117196, "epoch": 2790} {"train_loss": -6.422896862030029, "global_step": 117197, "epoch": 2790} {"train_loss": -6.539521217346191, "global_step": 117198, "epoch": 2790} {"train_loss": -6.597112655639648, "global_step": 117199, "epoch": 2790} {"train_loss": -6.404787540435791, "global_step": 117200, "epoch": 2790} {"train_loss": -6.486815452575684, "global_step": 117201, "epoch": 2790} {"train_loss": -6.529782295227051, "global_step": 117202, "epoch": 2790} {"train_loss": -6.465232849121094, "global_step": 117203, "epoch": 2790} {"train_loss": -6.519704818725586, "global_step": 117204, "epoch": 2790} {"train_loss": -6.492091178894043, "global_step": 117205, "epoch": 2790} {"train_loss": -6.458738327026367, "global_step": 117206, "epoch": 2790} {"train_loss": -6.540829658508301, "global_step": 117207, "epoch": 2790} {"train_loss": -6.4495368003845215, "global_step": 117208, "epoch": 2790} {"train_loss": -6.526247024536133, "global_step": 117209, "epoch": 2790} {"train_loss": -6.601554870605469, "global_step": 117210, "epoch": 2790} {"train_loss": -6.486428737640381, "global_step": 117211, "epoch": 2790} {"train_loss": -6.497241973876953, "global_step": 117212, "epoch": 2790} {"train_loss": -6.4869608879089355, "global_step": 117213, "epoch": 2790} {"train_loss": -6.550754070281982, "global_step": 117214, "epoch": 2790} {"train_loss": -6.534091949462891, "global_step": 117215, "epoch": 2790} {"train_loss": -6.501376152038574, "global_step": 117216, "epoch": 2790} {"train_loss": -6.425878047943115, "global_step": 117217, "epoch": 2790} {"train_loss": -6.583164215087891, "global_step": 117218, "epoch": 2790} {"train_loss": -6.460506439208984, "global_step": 117219, "epoch": 2790} {"train_loss": -6.467436790466309, "global_step": 117220, "epoch": 2790} {"train_loss": -6.517186823345366, "global_step": 117221, "epoch": 2790, "val_loss": 68048.625} {"train_loss": -6.426159858703613, "global_step": 117222, "epoch": 2791} {"train_loss": -6.462423801422119, "global_step": 117223, "epoch": 2791} {"train_loss": -6.573503494262695, "global_step": 117224, "epoch": 2791} {"train_loss": -6.485671043395996, "global_step": 117225, "epoch": 2791} {"train_loss": -6.465364933013916, "global_step": 117226, "epoch": 2791} {"train_loss": -6.4431610107421875, "global_step": 117227, "epoch": 2791} {"train_loss": -6.46354341506958, "global_step": 117228, "epoch": 2791} {"train_loss": -6.499754905700684, "global_step": 117229, "epoch": 2791} {"train_loss": -6.403866767883301, "global_step": 117230, "epoch": 2791} {"train_loss": -6.504518508911133, "global_step": 117231, "epoch": 2791} {"train_loss": -6.449234962463379, "global_step": 117232, "epoch": 2791} {"train_loss": -6.5582194328308105, "global_step": 117233, "epoch": 2791} {"train_loss": -6.500309944152832, "global_step": 117234, "epoch": 2791} {"train_loss": -6.535558223724365, "global_step": 117235, "epoch": 2791} {"train_loss": -6.547576904296875, "global_step": 117236, "epoch": 2791} {"train_loss": -6.538907527923584, "global_step": 117237, "epoch": 2791} {"train_loss": -6.433496952056885, "global_step": 117238, "epoch": 2791} {"train_loss": -6.396814346313477, "global_step": 117239, "epoch": 2791} {"train_loss": -6.4681596755981445, "global_step": 117240, "epoch": 2791} {"train_loss": -6.4678850173950195, "global_step": 117241, "epoch": 2791} {"train_loss": -6.54297399520874, "global_step": 117242, "epoch": 2791} {"train_loss": -6.512179374694824, "global_step": 117243, "epoch": 2791} {"train_loss": -6.463475227355957, "global_step": 117244, "epoch": 2791} {"train_loss": -6.512778282165527, "global_step": 117245, "epoch": 2791} {"train_loss": -6.305767059326172, "global_step": 117246, "epoch": 2791} {"train_loss": -6.421664714813232, "global_step": 117247, "epoch": 2791} {"train_loss": -6.361459732055664, "global_step": 117248, "epoch": 2791} {"train_loss": -6.516080379486084, "global_step": 117249, "epoch": 2791} {"train_loss": -6.373139381408691, "global_step": 117250, "epoch": 2791} {"train_loss": -6.4006242752075195, "global_step": 117251, "epoch": 2791} {"train_loss": -6.47548246383667, "global_step": 117252, "epoch": 2791} {"train_loss": -6.506028652191162, "global_step": 117253, "epoch": 2791} {"train_loss": -6.511850833892822, "global_step": 117254, "epoch": 2791} {"train_loss": -6.445133686065674, "global_step": 117255, "epoch": 2791} {"train_loss": -6.490664958953857, "global_step": 117256, "epoch": 2791} {"train_loss": -6.502074241638184, "global_step": 117257, "epoch": 2791} {"train_loss": -6.4672417640686035, "global_step": 117258, "epoch": 2791} {"train_loss": -6.424241065979004, "global_step": 117259, "epoch": 2791} {"train_loss": -6.557905197143555, "global_step": 117260, "epoch": 2791} {"train_loss": -6.394117832183838, "global_step": 117261, "epoch": 2791} {"train_loss": -6.365294456481934, "global_step": 117262, "epoch": 2791} {"train_loss": -6.467355217252459, "global_step": 117263, "epoch": 2791, "val_loss": 68014.28125} {"train_loss": -6.469334602355957, "global_step": 117264, "epoch": 2792} {"train_loss": -6.513842582702637, "global_step": 117265, "epoch": 2792} {"train_loss": -6.494524955749512, "global_step": 117266, "epoch": 2792} {"train_loss": -6.5235419273376465, "global_step": 117267, "epoch": 2792} {"train_loss": -6.376494407653809, "global_step": 117268, "epoch": 2792} {"train_loss": -6.489006042480469, "global_step": 117269, "epoch": 2792} {"train_loss": -6.4749755859375, "global_step": 117270, "epoch": 2792} {"train_loss": -6.439318656921387, "global_step": 117271, "epoch": 2792} {"train_loss": -6.378064155578613, "global_step": 117272, "epoch": 2792} {"train_loss": -6.444519996643066, "global_step": 117273, "epoch": 2792} {"train_loss": -6.410457611083984, "global_step": 117274, "epoch": 2792} {"train_loss": -6.5551557540893555, "global_step": 117275, "epoch": 2792} {"train_loss": -6.443209648132324, "global_step": 117276, "epoch": 2792} {"train_loss": -6.363666534423828, "global_step": 117277, "epoch": 2792} {"train_loss": -6.637391090393066, "global_step": 117278, "epoch": 2792} {"train_loss": -6.498540878295898, "global_step": 117279, "epoch": 2792} {"train_loss": -6.453534126281738, "global_step": 117280, "epoch": 2792} {"train_loss": -6.463137626647949, "global_step": 117281, "epoch": 2792} {"train_loss": -6.492882251739502, "global_step": 117282, "epoch": 2792} {"train_loss": -6.496164798736572, "global_step": 117283, "epoch": 2792} {"train_loss": -6.471460342407227, "global_step": 117284, "epoch": 2792} {"train_loss": -6.394409656524658, "global_step": 117285, "epoch": 2792} {"train_loss": -6.497053146362305, "global_step": 117286, "epoch": 2792} {"train_loss": -6.505411148071289, "global_step": 117287, "epoch": 2792} {"train_loss": -6.532737731933594, "global_step": 117288, "epoch": 2792} {"train_loss": -6.541406631469727, "global_step": 117289, "epoch": 2792} {"train_loss": -6.398800373077393, "global_step": 117290, "epoch": 2792} {"train_loss": -6.563486576080322, "global_step": 117291, "epoch": 2792} {"train_loss": -6.416910648345947, "global_step": 117292, "epoch": 2792} {"train_loss": -6.515007019042969, "global_step": 117293, "epoch": 2792} {"train_loss": -6.558418273925781, "global_step": 117294, "epoch": 2792} {"train_loss": -6.511574745178223, "global_step": 117295, "epoch": 2792} {"train_loss": -6.368538856506348, "global_step": 117296, "epoch": 2792} {"train_loss": -6.498618125915527, "global_step": 117297, "epoch": 2792} {"train_loss": -6.570356369018555, "global_step": 117298, "epoch": 2792} {"train_loss": -6.483966827392578, "global_step": 117299, "epoch": 2792} {"train_loss": -6.578645706176758, "global_step": 117300, "epoch": 2792} {"train_loss": -6.467961311340332, "global_step": 117301, "epoch": 2792} {"train_loss": -6.511043071746826, "global_step": 117302, "epoch": 2792} {"train_loss": -6.392336368560791, "global_step": 117303, "epoch": 2792} {"train_loss": -6.450561046600342, "global_step": 117304, "epoch": 2792} {"train_loss": -6.480276607331776, "global_step": 117305, "epoch": 2792, "val_loss": 67848.8984375} {"train_loss": -6.56744384765625, "global_step": 117306, "epoch": 2793} {"train_loss": -6.462772369384766, "global_step": 117307, "epoch": 2793} {"train_loss": -6.527730941772461, "global_step": 117308, "epoch": 2793} {"train_loss": -6.512198448181152, "global_step": 117309, "epoch": 2793} {"train_loss": -6.53837776184082, "global_step": 117310, "epoch": 2793} {"train_loss": -6.567841529846191, "global_step": 117311, "epoch": 2793} {"train_loss": -6.495505332946777, "global_step": 117312, "epoch": 2793} {"train_loss": -6.4085588455200195, "global_step": 117313, "epoch": 2793} {"train_loss": -6.63730525970459, "global_step": 117314, "epoch": 2793} {"train_loss": -6.466513633728027, "global_step": 117315, "epoch": 2793} {"train_loss": -6.396236419677734, "global_step": 117316, "epoch": 2793} {"train_loss": -6.582316875457764, "global_step": 117317, "epoch": 2793} {"train_loss": -6.518133640289307, "global_step": 117318, "epoch": 2793} {"train_loss": -6.41987419128418, "global_step": 117319, "epoch": 2793} {"train_loss": -6.50269079208374, "global_step": 117320, "epoch": 2793} {"train_loss": -6.552128791809082, "global_step": 117321, "epoch": 2793} {"train_loss": -6.5233917236328125, "global_step": 117322, "epoch": 2793} {"train_loss": -6.458215713500977, "global_step": 117323, "epoch": 2793} {"train_loss": -6.40470027923584, "global_step": 117324, "epoch": 2793} {"train_loss": -6.4406585693359375, "global_step": 117325, "epoch": 2793} {"train_loss": -6.366730690002441, "global_step": 117326, "epoch": 2793} {"train_loss": -6.483275413513184, "global_step": 117327, "epoch": 2793} {"train_loss": -6.480392932891846, "global_step": 117328, "epoch": 2793} {"train_loss": -6.529808521270752, "global_step": 117329, "epoch": 2793} {"train_loss": -6.53469705581665, "global_step": 117330, "epoch": 2793} {"train_loss": -6.524561882019043, "global_step": 117331, "epoch": 2793} {"train_loss": -6.570977687835693, "global_step": 117332, "epoch": 2793} {"train_loss": -6.494878768920898, "global_step": 117333, "epoch": 2793} {"train_loss": -6.444666862487793, "global_step": 117334, "epoch": 2793} {"train_loss": -6.6423258781433105, "global_step": 117335, "epoch": 2793} {"train_loss": -6.502756118774414, "global_step": 117336, "epoch": 2793} {"train_loss": -6.419203281402588, "global_step": 117337, "epoch": 2793} {"train_loss": -6.639088153839111, "global_step": 117338, "epoch": 2793} {"train_loss": -6.419879913330078, "global_step": 117339, "epoch": 2793} {"train_loss": -6.413156986236572, "global_step": 117340, "epoch": 2793} {"train_loss": -6.490555763244629, "global_step": 117341, "epoch": 2793} {"train_loss": -6.569369316101074, "global_step": 117342, "epoch": 2793} {"train_loss": -6.489312171936035, "global_step": 117343, "epoch": 2793} {"train_loss": -6.492737293243408, "global_step": 117344, "epoch": 2793} {"train_loss": -6.568890571594238, "global_step": 117345, "epoch": 2793} {"train_loss": -6.567103385925293, "global_step": 117346, "epoch": 2793} {"train_loss": -6.502115238280523, "global_step": 117347, "epoch": 2793, "val_loss": 67793.21875} {"train_loss": -6.559828758239746, "global_step": 117348, "epoch": 2794} {"train_loss": -6.515571594238281, "global_step": 117349, "epoch": 2794} {"train_loss": -6.50174617767334, "global_step": 117350, "epoch": 2794} {"train_loss": -6.479551315307617, "global_step": 117351, "epoch": 2794} {"train_loss": -6.511240005493164, "global_step": 117352, "epoch": 2794} {"train_loss": -6.415473937988281, "global_step": 117353, "epoch": 2794} {"train_loss": -6.370266914367676, "global_step": 117354, "epoch": 2794} {"train_loss": -6.473738670349121, "global_step": 117355, "epoch": 2794} {"train_loss": -6.449024200439453, "global_step": 117356, "epoch": 2794} {"train_loss": -6.500011444091797, "global_step": 117357, "epoch": 2794} {"train_loss": -6.453989505767822, "global_step": 117358, "epoch": 2794} {"train_loss": -6.582240104675293, "global_step": 117359, "epoch": 2794} {"train_loss": -6.498950004577637, "global_step": 117360, "epoch": 2794} {"train_loss": -6.407452583312988, "global_step": 117361, "epoch": 2794} {"train_loss": -6.43617057800293, "global_step": 117362, "epoch": 2794} {"train_loss": -6.651576042175293, "global_step": 117363, "epoch": 2794} {"train_loss": -6.555619239807129, "global_step": 117364, "epoch": 2794} {"train_loss": -6.393420696258545, "global_step": 117365, "epoch": 2794} {"train_loss": -6.584897994995117, "global_step": 117366, "epoch": 2794} {"train_loss": -6.493020057678223, "global_step": 117367, "epoch": 2794} {"train_loss": -6.478494644165039, "global_step": 117368, "epoch": 2794} {"train_loss": -6.665058135986328, "global_step": 117369, "epoch": 2794} {"train_loss": -6.501579284667969, "global_step": 117370, "epoch": 2794} {"train_loss": -6.369560241699219, "global_step": 117371, "epoch": 2794} {"train_loss": -6.47629451751709, "global_step": 117372, "epoch": 2794} {"train_loss": -6.545694351196289, "global_step": 117373, "epoch": 2794} {"train_loss": -6.394655704498291, "global_step": 117374, "epoch": 2794} {"train_loss": -6.517757415771484, "global_step": 117375, "epoch": 2794} {"train_loss": -6.436221599578857, "global_step": 117376, "epoch": 2794} {"train_loss": -6.54744815826416, "global_step": 117377, "epoch": 2794} {"train_loss": -6.519266128540039, "global_step": 117378, "epoch": 2794} {"train_loss": -6.48325252532959, "global_step": 117379, "epoch": 2794} {"train_loss": -6.5359697341918945, "global_step": 117380, "epoch": 2794} {"train_loss": -6.478376388549805, "global_step": 117381, "epoch": 2794} {"train_loss": -6.43870735168457, "global_step": 117382, "epoch": 2794} {"train_loss": -6.584963321685791, "global_step": 117383, "epoch": 2794} {"train_loss": -6.375865936279297, "global_step": 117384, "epoch": 2794} {"train_loss": -6.427750587463379, "global_step": 117385, "epoch": 2794} {"train_loss": -6.448548316955566, "global_step": 117386, "epoch": 2794} {"train_loss": -6.484829425811768, "global_step": 117387, "epoch": 2794} {"train_loss": -6.470912933349609, "global_step": 117388, "epoch": 2794} {"train_loss": -6.4843307336171465, "global_step": 117389, "epoch": 2794, "val_loss": 68186.171875} {"train_loss": -6.4648590087890625, "global_step": 117390, "epoch": 2795} {"train_loss": -6.382959842681885, "global_step": 117391, "epoch": 2795} {"train_loss": -6.304342269897461, "global_step": 117392, "epoch": 2795} {"train_loss": -6.609431266784668, "global_step": 117393, "epoch": 2795} {"train_loss": -6.5238142013549805, "global_step": 117394, "epoch": 2795} {"train_loss": -6.379701614379883, "global_step": 117395, "epoch": 2795} {"train_loss": -6.303153991699219, "global_step": 117396, "epoch": 2795} {"train_loss": -6.554953575134277, "global_step": 117397, "epoch": 2795} {"train_loss": -6.436732769012451, "global_step": 117398, "epoch": 2795} {"train_loss": -6.4400434494018555, "global_step": 117399, "epoch": 2795} {"train_loss": -6.432635307312012, "global_step": 117400, "epoch": 2795} {"train_loss": -6.4097490310668945, "global_step": 117401, "epoch": 2795} {"train_loss": -6.390000820159912, "global_step": 117402, "epoch": 2795} {"train_loss": -6.444025993347168, "global_step": 117403, "epoch": 2795} {"train_loss": -6.369286060333252, "global_step": 117404, "epoch": 2795} {"train_loss": -6.424060344696045, "global_step": 117405, "epoch": 2795} {"train_loss": -6.535795211791992, "global_step": 117406, "epoch": 2795} {"train_loss": -6.3541178703308105, "global_step": 117407, "epoch": 2795} {"train_loss": -6.606674671173096, "global_step": 117408, "epoch": 2795} {"train_loss": -6.4279632568359375, "global_step": 117409, "epoch": 2795} {"train_loss": -6.552005290985107, "global_step": 117410, "epoch": 2795} {"train_loss": -6.426194190979004, "global_step": 117411, "epoch": 2795} {"train_loss": -6.43517541885376, "global_step": 117412, "epoch": 2795} {"train_loss": -6.46390438079834, "global_step": 117413, "epoch": 2795} {"train_loss": -6.465632915496826, "global_step": 117414, "epoch": 2795} {"train_loss": -6.507941722869873, "global_step": 117415, "epoch": 2795} {"train_loss": -6.4650421142578125, "global_step": 117416, "epoch": 2795} {"train_loss": -6.548266410827637, "global_step": 117417, "epoch": 2795} {"train_loss": -6.589216232299805, "global_step": 117418, "epoch": 2795} {"train_loss": -6.519219398498535, "global_step": 117419, "epoch": 2795} {"train_loss": -6.557964324951172, "global_step": 117420, "epoch": 2795} {"train_loss": -6.527748107910156, "global_step": 117421, "epoch": 2795} {"train_loss": -6.538078308105469, "global_step": 117422, "epoch": 2795} {"train_loss": -6.458739280700684, "global_step": 117423, "epoch": 2795} {"train_loss": -6.499905109405518, "global_step": 117424, "epoch": 2795} {"train_loss": -6.461858749389648, "global_step": 117425, "epoch": 2795} {"train_loss": -6.554567813873291, "global_step": 117426, "epoch": 2795} {"train_loss": -6.503941059112549, "global_step": 117427, "epoch": 2795} {"train_loss": -6.5382843017578125, "global_step": 117428, "epoch": 2795} {"train_loss": -6.55965518951416, "global_step": 117429, "epoch": 2795} {"train_loss": -6.452762126922607, "global_step": 117430, "epoch": 2795} {"train_loss": -6.476443608601888, "global_step": 117431, "epoch": 2795, "val_loss": 67900.8203125} {"train_loss": -6.47730827331543, "global_step": 117432, "epoch": 2796} {"train_loss": -6.596956729888916, "global_step": 117433, "epoch": 2796} {"train_loss": -6.619812488555908, "global_step": 117434, "epoch": 2796} {"train_loss": -6.580989837646484, "global_step": 117435, "epoch": 2796} {"train_loss": -6.500197410583496, "global_step": 117436, "epoch": 2796} {"train_loss": -6.52099084854126, "global_step": 117437, "epoch": 2796} {"train_loss": -6.460522651672363, "global_step": 117438, "epoch": 2796} {"train_loss": -6.538966655731201, "global_step": 117439, "epoch": 2796} {"train_loss": -6.658099174499512, "global_step": 117440, "epoch": 2796} {"train_loss": -6.503845691680908, "global_step": 117441, "epoch": 2796} {"train_loss": -6.415476322174072, "global_step": 117442, "epoch": 2796} {"train_loss": -6.453314781188965, "global_step": 117443, "epoch": 2796} {"train_loss": -6.497640609741211, "global_step": 117444, "epoch": 2796} {"train_loss": -6.4969587326049805, "global_step": 117445, "epoch": 2796} {"train_loss": -6.420647621154785, "global_step": 117446, "epoch": 2796} {"train_loss": -6.538727760314941, "global_step": 117447, "epoch": 2796} {"train_loss": -6.512383460998535, "global_step": 117448, "epoch": 2796} {"train_loss": -6.408705234527588, "global_step": 117449, "epoch": 2796} {"train_loss": -6.476559638977051, "global_step": 117450, "epoch": 2796} {"train_loss": -6.440844535827637, "global_step": 117451, "epoch": 2796} {"train_loss": -6.439099311828613, "global_step": 117452, "epoch": 2796} {"train_loss": -6.560403823852539, "global_step": 117453, "epoch": 2796} {"train_loss": -6.512322902679443, "global_step": 117454, "epoch": 2796} {"train_loss": -6.525310039520264, "global_step": 117455, "epoch": 2796} {"train_loss": -6.478909492492676, "global_step": 117456, "epoch": 2796} {"train_loss": -6.50444221496582, "global_step": 117457, "epoch": 2796} {"train_loss": -6.553455352783203, "global_step": 117458, "epoch": 2796} {"train_loss": -6.387057304382324, "global_step": 117459, "epoch": 2796} {"train_loss": -6.486018657684326, "global_step": 117460, "epoch": 2796} {"train_loss": -6.599452972412109, "global_step": 117461, "epoch": 2796} {"train_loss": -6.46973991394043, "global_step": 117462, "epoch": 2796} {"train_loss": -6.434150695800781, "global_step": 117463, "epoch": 2796} {"train_loss": -6.502255439758301, "global_step": 117464, "epoch": 2796} {"train_loss": -6.61448860168457, "global_step": 117465, "epoch": 2796} {"train_loss": -6.431012153625488, "global_step": 117466, "epoch": 2796} {"train_loss": -6.456827163696289, "global_step": 117467, "epoch": 2796} {"train_loss": -6.437899112701416, "global_step": 117468, "epoch": 2796} {"train_loss": -6.461021900177002, "global_step": 117469, "epoch": 2796} {"train_loss": -6.5320940017700195, "global_step": 117470, "epoch": 2796} {"train_loss": -6.668778419494629, "global_step": 117471, "epoch": 2796} {"train_loss": -6.498604774475098, "global_step": 117472, "epoch": 2796} {"train_loss": -6.504283859616234, "global_step": 117473, "epoch": 2796, "val_loss": 67737.4609375} {"train_loss": -6.551318168640137, "global_step": 117474, "epoch": 2797} {"train_loss": -6.537469863891602, "global_step": 117475, "epoch": 2797} {"train_loss": -6.535399436950684, "global_step": 117476, "epoch": 2797} {"train_loss": -6.571530818939209, "global_step": 117477, "epoch": 2797} {"train_loss": -6.502326488494873, "global_step": 117478, "epoch": 2797} {"train_loss": -6.50031852722168, "global_step": 117479, "epoch": 2797} {"train_loss": -6.537664413452148, "global_step": 117480, "epoch": 2797} {"train_loss": -6.439769268035889, "global_step": 117481, "epoch": 2797} {"train_loss": -6.453783988952637, "global_step": 117482, "epoch": 2797} {"train_loss": -6.4462571144104, "global_step": 117483, "epoch": 2797} {"train_loss": -6.448150634765625, "global_step": 117484, "epoch": 2797} {"train_loss": -6.60158634185791, "global_step": 117485, "epoch": 2797} {"train_loss": -6.520133018493652, "global_step": 117486, "epoch": 2797} {"train_loss": -6.6313347816467285, "global_step": 117487, "epoch": 2797} {"train_loss": -6.6742143630981445, "global_step": 117488, "epoch": 2797} {"train_loss": -6.4822282791137695, "global_step": 117489, "epoch": 2797} {"train_loss": -6.539796352386475, "global_step": 117490, "epoch": 2797} {"train_loss": -6.50724458694458, "global_step": 117491, "epoch": 2797} {"train_loss": -6.434779167175293, "global_step": 117492, "epoch": 2797} {"train_loss": -6.543865203857422, "global_step": 117493, "epoch": 2797} {"train_loss": -6.584056854248047, "global_step": 117494, "epoch": 2797} {"train_loss": -6.536952972412109, "global_step": 117495, "epoch": 2797} {"train_loss": -6.57877254486084, "global_step": 117496, "epoch": 2797} {"train_loss": -6.626996040344238, "global_step": 117497, "epoch": 2797} {"train_loss": -6.557661056518555, "global_step": 117498, "epoch": 2797} {"train_loss": -6.582398414611816, "global_step": 117499, "epoch": 2797} {"train_loss": -6.532778263092041, "global_step": 117500, "epoch": 2797} {"train_loss": -6.602755069732666, "global_step": 117501, "epoch": 2797} {"train_loss": -6.500666618347168, "global_step": 117502, "epoch": 2797} {"train_loss": -6.5188093185424805, "global_step": 117503, "epoch": 2797} {"train_loss": -6.655479431152344, "global_step": 117504, "epoch": 2797} {"train_loss": -6.565505027770996, "global_step": 117505, "epoch": 2797} {"train_loss": -6.598508834838867, "global_step": 117506, "epoch": 2797} {"train_loss": -6.610703468322754, "global_step": 117507, "epoch": 2797} {"train_loss": -6.642495632171631, "global_step": 117508, "epoch": 2797} {"train_loss": -6.475494384765625, "global_step": 117509, "epoch": 2797} {"train_loss": -6.574343681335449, "global_step": 117510, "epoch": 2797} {"train_loss": -6.403517723083496, "global_step": 117511, "epoch": 2797} {"train_loss": -6.533371448516846, "global_step": 117512, "epoch": 2797} {"train_loss": -6.62580680847168, "global_step": 117513, "epoch": 2797} {"train_loss": -6.566217422485352, "global_step": 117514, "epoch": 2797} {"train_loss": -6.544116724105108, "global_step": 117515, "epoch": 2797, "val_loss": 68032.546875} {"train_loss": -6.526145935058594, "global_step": 117516, "epoch": 2798} {"train_loss": -6.524478912353516, "global_step": 117517, "epoch": 2798} {"train_loss": -6.568886756896973, "global_step": 117518, "epoch": 2798} {"train_loss": -6.400328636169434, "global_step": 117519, "epoch": 2798} {"train_loss": -6.590070724487305, "global_step": 117520, "epoch": 2798} {"train_loss": -6.500275611877441, "global_step": 117521, "epoch": 2798} {"train_loss": -6.555647850036621, "global_step": 117522, "epoch": 2798} {"train_loss": -6.621786594390869, "global_step": 117523, "epoch": 2798} {"train_loss": -6.569287300109863, "global_step": 117524, "epoch": 2798} {"train_loss": -6.544161796569824, "global_step": 117525, "epoch": 2798} {"train_loss": -6.574406623840332, "global_step": 117526, "epoch": 2798} {"train_loss": -6.503602027893066, "global_step": 117527, "epoch": 2798} {"train_loss": -6.501585960388184, "global_step": 117528, "epoch": 2798} {"train_loss": -6.48606014251709, "global_step": 117529, "epoch": 2798} {"train_loss": -6.556480407714844, "global_step": 117530, "epoch": 2798} {"train_loss": -6.569211483001709, "global_step": 117531, "epoch": 2798} {"train_loss": -6.561739444732666, "global_step": 117532, "epoch": 2798} {"train_loss": -6.510195255279541, "global_step": 117533, "epoch": 2798} {"train_loss": -6.448887825012207, "global_step": 117534, "epoch": 2798} {"train_loss": -6.483588695526123, "global_step": 117535, "epoch": 2798} {"train_loss": -6.545419216156006, "global_step": 117536, "epoch": 2798} {"train_loss": -6.500894546508789, "global_step": 117537, "epoch": 2798} {"train_loss": -6.560382843017578, "global_step": 117538, "epoch": 2798} {"train_loss": -6.503167152404785, "global_step": 117539, "epoch": 2798} {"train_loss": -6.488902568817139, "global_step": 117540, "epoch": 2798} {"train_loss": -6.6023406982421875, "global_step": 117541, "epoch": 2798} {"train_loss": -6.510544776916504, "global_step": 117542, "epoch": 2798} {"train_loss": -6.487821578979492, "global_step": 117543, "epoch": 2798} {"train_loss": -6.456755638122559, "global_step": 117544, "epoch": 2798} {"train_loss": -6.532312393188477, "global_step": 117545, "epoch": 2798} {"train_loss": -6.640680313110352, "global_step": 117546, "epoch": 2798} {"train_loss": -6.586362361907959, "global_step": 117547, "epoch": 2798} {"train_loss": -6.484869003295898, "global_step": 117548, "epoch": 2798} {"train_loss": -6.512871742248535, "global_step": 117549, "epoch": 2798} {"train_loss": -6.526751518249512, "global_step": 117550, "epoch": 2798} {"train_loss": -6.463014602661133, "global_step": 117551, "epoch": 2798} {"train_loss": -6.475174427032471, "global_step": 117552, "epoch": 2798} {"train_loss": -6.4833197593688965, "global_step": 117553, "epoch": 2798} {"train_loss": -6.51894474029541, "global_step": 117554, "epoch": 2798} {"train_loss": -6.642754554748535, "global_step": 117555, "epoch": 2798} {"train_loss": -6.551564693450928, "global_step": 117556, "epoch": 2798} {"train_loss": -6.527090719767979, "global_step": 117557, "epoch": 2798, "val_loss": 67939.0703125} {"train_loss": -6.411309242248535, "global_step": 117558, "epoch": 2799} {"train_loss": -6.500094413757324, "global_step": 117559, "epoch": 2799} {"train_loss": -6.600907325744629, "global_step": 117560, "epoch": 2799} {"train_loss": -6.449280738830566, "global_step": 117561, "epoch": 2799} {"train_loss": -6.433104038238525, "global_step": 117562, "epoch": 2799} {"train_loss": -6.355237007141113, "global_step": 117563, "epoch": 2799} {"train_loss": -6.557119369506836, "global_step": 117564, "epoch": 2799} {"train_loss": -6.476686477661133, "global_step": 117565, "epoch": 2799} {"train_loss": -6.6282806396484375, "global_step": 117566, "epoch": 2799} {"train_loss": -6.413057327270508, "global_step": 117567, "epoch": 2799} {"train_loss": -6.450406074523926, "global_step": 117568, "epoch": 2799} {"train_loss": -6.476451873779297, "global_step": 117569, "epoch": 2799} {"train_loss": -6.525578498840332, "global_step": 117570, "epoch": 2799} {"train_loss": -6.490908622741699, "global_step": 117571, "epoch": 2799} {"train_loss": -6.5877366065979, "global_step": 117572, "epoch": 2799} {"train_loss": -6.549515724182129, "global_step": 117573, "epoch": 2799} {"train_loss": -6.424751281738281, "global_step": 117574, "epoch": 2799} {"train_loss": -6.501875877380371, "global_step": 117575, "epoch": 2799} {"train_loss": -6.660858154296875, "global_step": 117576, "epoch": 2799} {"train_loss": -6.440241813659668, "global_step": 117577, "epoch": 2799} {"train_loss": -6.483940601348877, "global_step": 117578, "epoch": 2799} {"train_loss": -6.410144805908203, "global_step": 117579, "epoch": 2799} {"train_loss": -6.4771623611450195, "global_step": 117580, "epoch": 2799} {"train_loss": -6.549093723297119, "global_step": 117581, "epoch": 2799} {"train_loss": -6.382338047027588, "global_step": 117582, "epoch": 2799} {"train_loss": -6.43274450302124, "global_step": 117583, "epoch": 2799} {"train_loss": -6.459364891052246, "global_step": 117584, "epoch": 2799} {"train_loss": -6.493903160095215, "global_step": 117585, "epoch": 2799} {"train_loss": -6.438961982727051, "global_step": 117586, "epoch": 2799} {"train_loss": -6.369568347930908, "global_step": 117587, "epoch": 2799} {"train_loss": -6.448602676391602, "global_step": 117588, "epoch": 2799} {"train_loss": -6.425796985626221, "global_step": 117589, "epoch": 2799} {"train_loss": -6.325693130493164, "global_step": 117590, "epoch": 2799} {"train_loss": -6.545659065246582, "global_step": 117591, "epoch": 2799} {"train_loss": -6.447094917297363, "global_step": 117592, "epoch": 2799} {"train_loss": -6.532085418701172, "global_step": 117593, "epoch": 2799} {"train_loss": -6.521180152893066, "global_step": 117594, "epoch": 2799} {"train_loss": -6.42692756652832, "global_step": 117595, "epoch": 2799} {"train_loss": -6.4392876625061035, "global_step": 117596, "epoch": 2799} {"train_loss": -6.425710678100586, "global_step": 117597, "epoch": 2799} {"train_loss": -6.59470272064209, "global_step": 117598, "epoch": 2799} {"train_loss": -6.479446694964454, "global_step": 117599, "epoch": 2799, "val_loss": 67863.625} {"train_loss": -6.399930477142334, "global_step": 117600, "epoch": 2800} {"train_loss": -6.5167083740234375, "global_step": 117601, "epoch": 2800} {"train_loss": -6.502712249755859, "global_step": 117602, "epoch": 2800} {"train_loss": -6.457813262939453, "global_step": 117603, "epoch": 2800} {"train_loss": -6.519960403442383, "global_step": 117604, "epoch": 2800} {"train_loss": -6.54406213760376, "global_step": 117605, "epoch": 2800} {"train_loss": -6.448692321777344, "global_step": 117606, "epoch": 2800} {"train_loss": -6.484324932098389, "global_step": 117607, "epoch": 2800} {"train_loss": -6.466437816619873, "global_step": 117608, "epoch": 2800} {"train_loss": -6.470678329467773, "global_step": 117609, "epoch": 2800} {"train_loss": -6.553874492645264, "global_step": 117610, "epoch": 2800} {"train_loss": -6.5981245040893555, "global_step": 117611, "epoch": 2800} {"train_loss": -6.274103164672852, "global_step": 117612, "epoch": 2800} {"train_loss": -6.520287036895752, "global_step": 117613, "epoch": 2800} {"train_loss": -6.460029602050781, "global_step": 117614, "epoch": 2800} {"train_loss": -6.3805131912231445, "global_step": 117615, "epoch": 2800} {"train_loss": -6.568646430969238, "global_step": 117616, "epoch": 2800} {"train_loss": -6.538973808288574, "global_step": 117617, "epoch": 2800} {"train_loss": -6.537132263183594, "global_step": 117618, "epoch": 2800} {"train_loss": -6.510894775390625, "global_step": 117619, "epoch": 2800} {"train_loss": -6.512487411499023, "global_step": 117620, "epoch": 2800} {"train_loss": -6.365268707275391, "global_step": 117621, "epoch": 2800} {"train_loss": -6.516668319702148, "global_step": 117622, "epoch": 2800} {"train_loss": -6.5402607917785645, "global_step": 117623, "epoch": 2800} {"train_loss": -6.476553916931152, "global_step": 117624, "epoch": 2800} {"train_loss": -6.45623779296875, "global_step": 117625, "epoch": 2800} {"train_loss": -6.5705766677856445, "global_step": 117626, "epoch": 2800} {"train_loss": -6.51615047454834, "global_step": 117627, "epoch": 2800} {"train_loss": -6.557490348815918, "global_step": 117628, "epoch": 2800} {"train_loss": -6.492582321166992, "global_step": 117629, "epoch": 2800} {"train_loss": -6.574971675872803, "global_step": 117630, "epoch": 2800} {"train_loss": -6.570111274719238, "global_step": 117631, "epoch": 2800} {"train_loss": -6.533559799194336, "global_step": 117632, "epoch": 2800} {"train_loss": -6.435049057006836, "global_step": 117633, "epoch": 2800} {"train_loss": -6.624808311462402, "global_step": 117634, "epoch": 2800} {"train_loss": -6.588640213012695, "global_step": 117635, "epoch": 2800} {"train_loss": -6.491397857666016, "global_step": 117636, "epoch": 2800} {"train_loss": -6.438595771789551, "global_step": 117637, "epoch": 2800} {"train_loss": -6.666125774383545, "global_step": 117638, "epoch": 2800} {"train_loss": -6.648530006408691, "global_step": 117639, "epoch": 2800} {"train_loss": -6.569123268127441, "global_step": 117640, "epoch": 2800} {"train_loss": -6.508433784757342, "global_step": 117641, "epoch": 2800, "train/sim_max_reward_0": 0.21716750400052112, "train/sim_max_reward_1": 0.9349013571360494, "train/sim_max_reward_2": 0.20377016980514745, "train/sim_max_reward_3": 0.11826400614257877, "train/sim_max_reward_4": 0.848663981620562, "train/sim_max_reward_5": 0.32483692443697276, "test/sim_max_reward_4400000": 0.1605795184710024, "test/sim_max_reward_4400001": 0.2557906304058492, "test/sim_max_reward_4400002": 0.916488203357587, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.8805336883486892, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.7980241650989771, "test/sim_max_reward_4400010": 0.1982909712375427, "test/sim_max_reward_4400011": 0.6638188078820932, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.8782287331036914, "test/sim_max_reward_4400014": 0.15396461409959308, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.21419986470646196, "test/sim_max_reward_4400019": 0.3010722544646577, "test/sim_max_reward_4400020": 2.3705804988365036e-05, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9734743852246575, "test/sim_max_reward_4400023": 0.9033519506286833, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.23822433317947245, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.030137235322054496, "test/sim_max_reward_4400028": 0.8312581499313195, "test/sim_max_reward_4400029": 0.902829764037413, "test/sim_max_reward_4400030": 0.9513824130263158, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.6628616191583458, "test/sim_max_reward_4400034": 0.7759756233913163, "test/sim_max_reward_4400035": 0.39387227398325436, "test/sim_max_reward_4400036": 0.7308084389100226, "test/sim_max_reward_4400037": 0.9662314729089553, "test/sim_max_reward_4400038": 0.9109502543794697, "test/sim_max_reward_4400039": 0.9859047390432284, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5658136545454064, "test/sim_max_reward_4400042": 0.4989970782770666, "test/sim_max_reward_4400043": 0.9495669474420357, "test/sim_max_reward_4400044": 0.8314515172378077, "test/sim_max_reward_4400045": 0.3913871250692102, "test/sim_max_reward_4400046": 0.9668702338640953, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.8899543974189843, "test/sim_max_reward_4400049": 0.8106051099834619, "train/mean_score": 0.4412673238569719, "test/mean_score": 0.5670563524894706, "val_loss": 67891.109375} {"train_loss": -6.474807262420654, "global_step": 117642, "epoch": 2801} {"train_loss": -6.506956100463867, "global_step": 117643, "epoch": 2801} {"train_loss": -6.483750343322754, "global_step": 117644, "epoch": 2801} {"train_loss": -6.587011337280273, "global_step": 117645, "epoch": 2801} {"train_loss": -6.565857410430908, "global_step": 117646, "epoch": 2801} {"train_loss": -6.404294967651367, "global_step": 117647, "epoch": 2801} {"train_loss": -6.638171672821045, "global_step": 117648, "epoch": 2801} {"train_loss": -6.545230865478516, "global_step": 117649, "epoch": 2801} {"train_loss": -6.580426216125488, "global_step": 117650, "epoch": 2801} {"train_loss": -6.651043891906738, "global_step": 117651, "epoch": 2801} {"train_loss": -6.545915126800537, "global_step": 117652, "epoch": 2801} {"train_loss": -6.571127891540527, "global_step": 117653, "epoch": 2801} {"train_loss": -6.471512794494629, "global_step": 117654, "epoch": 2801} {"train_loss": -6.6297783851623535, "global_step": 117655, "epoch": 2801} {"train_loss": -6.55225944519043, "global_step": 117656, "epoch": 2801} {"train_loss": -6.480138778686523, "global_step": 117657, "epoch": 2801} {"train_loss": -6.587122917175293, "global_step": 117658, "epoch": 2801} {"train_loss": -6.596536159515381, "global_step": 117659, "epoch": 2801} {"train_loss": -6.503474235534668, "global_step": 117660, "epoch": 2801} {"train_loss": -6.440497398376465, "global_step": 117661, "epoch": 2801} {"train_loss": -6.48994255065918, "global_step": 117662, "epoch": 2801} {"train_loss": -6.534891128540039, "global_step": 117663, "epoch": 2801} {"train_loss": -6.410231590270996, "global_step": 117664, "epoch": 2801} {"train_loss": -6.5328168869018555, "global_step": 117665, "epoch": 2801} {"train_loss": -6.319583892822266, "global_step": 117666, "epoch": 2801} {"train_loss": -6.331503391265869, "global_step": 117667, "epoch": 2801} {"train_loss": -6.442205429077148, "global_step": 117668, "epoch": 2801} {"train_loss": -6.428238868713379, "global_step": 117669, "epoch": 2801} {"train_loss": -6.491529941558838, "global_step": 117670, "epoch": 2801} {"train_loss": -6.42915678024292, "global_step": 117671, "epoch": 2801} {"train_loss": -6.394462585449219, "global_step": 117672, "epoch": 2801} {"train_loss": -6.554835319519043, "global_step": 117673, "epoch": 2801} {"train_loss": -6.430221080780029, "global_step": 117674, "epoch": 2801} {"train_loss": -6.527210712432861, "global_step": 117675, "epoch": 2801} {"train_loss": -6.3706865310668945, "global_step": 117676, "epoch": 2801} {"train_loss": -6.46858024597168, "global_step": 117677, "epoch": 2801} {"train_loss": -6.447056293487549, "global_step": 117678, "epoch": 2801} {"train_loss": -6.395442008972168, "global_step": 117679, "epoch": 2801} {"train_loss": -6.466979026794434, "global_step": 117680, "epoch": 2801} {"train_loss": -6.557588577270508, "global_step": 117681, "epoch": 2801} {"train_loss": -6.433789253234863, "global_step": 117682, "epoch": 2801} {"train_loss": -6.4949522245497935, "global_step": 117683, "epoch": 2801, "val_loss": 67659.4921875} {"train_loss": -6.605075359344482, "global_step": 117684, "epoch": 2802} {"train_loss": -6.599218368530273, "global_step": 117685, "epoch": 2802} {"train_loss": -6.37083625793457, "global_step": 117686, "epoch": 2802} {"train_loss": -6.421207427978516, "global_step": 117687, "epoch": 2802} {"train_loss": -6.434230327606201, "global_step": 117688, "epoch": 2802} {"train_loss": -6.517120361328125, "global_step": 117689, "epoch": 2802} {"train_loss": -6.419017314910889, "global_step": 117690, "epoch": 2802} {"train_loss": -6.425339698791504, "global_step": 117691, "epoch": 2802} {"train_loss": -6.485363960266113, "global_step": 117692, "epoch": 2802} {"train_loss": -6.481271266937256, "global_step": 117693, "epoch": 2802} {"train_loss": -6.520825386047363, "global_step": 117694, "epoch": 2802} {"train_loss": -6.469412803649902, "global_step": 117695, "epoch": 2802} {"train_loss": -6.504358291625977, "global_step": 117696, "epoch": 2802} {"train_loss": -6.42879581451416, "global_step": 117697, "epoch": 2802} {"train_loss": -6.532991409301758, "global_step": 117698, "epoch": 2802} {"train_loss": -6.451310634613037, "global_step": 117699, "epoch": 2802} {"train_loss": -6.635153770446777, "global_step": 117700, "epoch": 2802} {"train_loss": -6.306583881378174, "global_step": 117701, "epoch": 2802} {"train_loss": -6.61570930480957, "global_step": 117702, "epoch": 2802} {"train_loss": -6.408271789550781, "global_step": 117703, "epoch": 2802} {"train_loss": -6.52781867980957, "global_step": 117704, "epoch": 2802} {"train_loss": -6.557291030883789, "global_step": 117705, "epoch": 2802} {"train_loss": -6.541547775268555, "global_step": 117706, "epoch": 2802} {"train_loss": -6.46772575378418, "global_step": 117707, "epoch": 2802} {"train_loss": -6.423971176147461, "global_step": 117708, "epoch": 2802} {"train_loss": -6.592324256896973, "global_step": 117709, "epoch": 2802} {"train_loss": -6.477510929107666, "global_step": 117710, "epoch": 2802} {"train_loss": -6.448555946350098, "global_step": 117711, "epoch": 2802} {"train_loss": -6.526486396789551, "global_step": 117712, "epoch": 2802} {"train_loss": -6.483270645141602, "global_step": 117713, "epoch": 2802} {"train_loss": -6.574254035949707, "global_step": 117714, "epoch": 2802} {"train_loss": -6.60054874420166, "global_step": 117715, "epoch": 2802} {"train_loss": -6.509715557098389, "global_step": 117716, "epoch": 2802} {"train_loss": -6.578981876373291, "global_step": 117717, "epoch": 2802} {"train_loss": -6.4560041427612305, "global_step": 117718, "epoch": 2802} {"train_loss": -6.568419456481934, "global_step": 117719, "epoch": 2802} {"train_loss": -6.614315032958984, "global_step": 117720, "epoch": 2802} {"train_loss": -6.531225681304932, "global_step": 117721, "epoch": 2802} {"train_loss": -6.549022197723389, "global_step": 117722, "epoch": 2802} {"train_loss": -6.50407600402832, "global_step": 117723, "epoch": 2802} {"train_loss": -6.537982940673828, "global_step": 117724, "epoch": 2802} {"train_loss": -6.5067287513187955, "global_step": 117725, "epoch": 2802, "val_loss": 67818.7578125} {"train_loss": -6.6828718185424805, "global_step": 117726, "epoch": 2803} {"train_loss": -6.46821928024292, "global_step": 117727, "epoch": 2803} {"train_loss": -6.573754787445068, "global_step": 117728, "epoch": 2803} {"train_loss": -6.589325428009033, "global_step": 117729, "epoch": 2803} {"train_loss": -6.5369672775268555, "global_step": 117730, "epoch": 2803} {"train_loss": -6.522461414337158, "global_step": 117731, "epoch": 2803} {"train_loss": -6.5330376625061035, "global_step": 117732, "epoch": 2803} {"train_loss": -6.549163818359375, "global_step": 117733, "epoch": 2803} {"train_loss": -6.583365440368652, "global_step": 117734, "epoch": 2803} {"train_loss": -6.468704700469971, "global_step": 117735, "epoch": 2803} {"train_loss": -6.506723403930664, "global_step": 117736, "epoch": 2803} {"train_loss": -6.5681681632995605, "global_step": 117737, "epoch": 2803} {"train_loss": -6.588594436645508, "global_step": 117738, "epoch": 2803} {"train_loss": -6.602683067321777, "global_step": 117739, "epoch": 2803} {"train_loss": -6.486375331878662, "global_step": 117740, "epoch": 2803} {"train_loss": -6.519710063934326, "global_step": 117741, "epoch": 2803} {"train_loss": -6.495558738708496, "global_step": 117742, "epoch": 2803} {"train_loss": -6.52186393737793, "global_step": 117743, "epoch": 2803} {"train_loss": -6.442567825317383, "global_step": 117744, "epoch": 2803} {"train_loss": -6.538990020751953, "global_step": 117745, "epoch": 2803} {"train_loss": -6.5031843185424805, "global_step": 117746, "epoch": 2803} {"train_loss": -6.514537334442139, "global_step": 117747, "epoch": 2803} {"train_loss": -6.503575801849365, "global_step": 117748, "epoch": 2803} {"train_loss": -6.538884162902832, "global_step": 117749, "epoch": 2803} {"train_loss": -6.437172889709473, "global_step": 117750, "epoch": 2803} {"train_loss": -6.528814315795898, "global_step": 117751, "epoch": 2803} {"train_loss": -6.483066558837891, "global_step": 117752, "epoch": 2803} {"train_loss": -6.537098407745361, "global_step": 117753, "epoch": 2803} {"train_loss": -6.5718793869018555, "global_step": 117754, "epoch": 2803} {"train_loss": -6.522887229919434, "global_step": 117755, "epoch": 2803} {"train_loss": -6.638222694396973, "global_step": 117756, "epoch": 2803} {"train_loss": -6.627699851989746, "global_step": 117757, "epoch": 2803} {"train_loss": -6.583578109741211, "global_step": 117758, "epoch": 2803} {"train_loss": -6.584796905517578, "global_step": 117759, "epoch": 2803} {"train_loss": -6.626172065734863, "global_step": 117760, "epoch": 2803} {"train_loss": -6.528040885925293, "global_step": 117761, "epoch": 2803} {"train_loss": -6.469503402709961, "global_step": 117762, "epoch": 2803} {"train_loss": -6.70145320892334, "global_step": 117763, "epoch": 2803} {"train_loss": -6.638496398925781, "global_step": 117764, "epoch": 2803} {"train_loss": -6.543452262878418, "global_step": 117765, "epoch": 2803} {"train_loss": -6.434837341308594, "global_step": 117766, "epoch": 2803} {"train_loss": -6.545439958572388, "global_step": 117767, "epoch": 2803, "val_loss": 67749.71875} {"train_loss": -6.631418228149414, "global_step": 117768, "epoch": 2804} {"train_loss": -6.483555793762207, "global_step": 117769, "epoch": 2804} {"train_loss": -6.5734639167785645, "global_step": 117770, "epoch": 2804} {"train_loss": -6.5506415367126465, "global_step": 117771, "epoch": 2804} {"train_loss": -6.498055934906006, "global_step": 117772, "epoch": 2804} {"train_loss": -6.650968551635742, "global_step": 117773, "epoch": 2804} {"train_loss": -6.636781215667725, "global_step": 117774, "epoch": 2804} {"train_loss": -6.603503227233887, "global_step": 117775, "epoch": 2804} {"train_loss": -6.582618713378906, "global_step": 117776, "epoch": 2804} {"train_loss": -6.6741414070129395, "global_step": 117777, "epoch": 2804} {"train_loss": -6.513575553894043, "global_step": 117778, "epoch": 2804} {"train_loss": -6.611732482910156, "global_step": 117779, "epoch": 2804} {"train_loss": -6.522185325622559, "global_step": 117780, "epoch": 2804} {"train_loss": -6.456056118011475, "global_step": 117781, "epoch": 2804} {"train_loss": -6.612749099731445, "global_step": 117782, "epoch": 2804} {"train_loss": -6.421465873718262, "global_step": 117783, "epoch": 2804} {"train_loss": -6.454014778137207, "global_step": 117784, "epoch": 2804} {"train_loss": -6.564537525177002, "global_step": 117785, "epoch": 2804} {"train_loss": -6.5134782791137695, "global_step": 117786, "epoch": 2804} {"train_loss": -6.494067668914795, "global_step": 117787, "epoch": 2804} {"train_loss": -6.5186004638671875, "global_step": 117788, "epoch": 2804} {"train_loss": -6.535513877868652, "global_step": 117789, "epoch": 2804} {"train_loss": -6.545352935791016, "global_step": 117790, "epoch": 2804} {"train_loss": -6.470218658447266, "global_step": 117791, "epoch": 2804} {"train_loss": -6.572583198547363, "global_step": 117792, "epoch": 2804} {"train_loss": -6.528377532958984, "global_step": 117793, "epoch": 2804} {"train_loss": -6.414000988006592, "global_step": 117794, "epoch": 2804} {"train_loss": -6.522001266479492, "global_step": 117795, "epoch": 2804} {"train_loss": -6.4899139404296875, "global_step": 117796, "epoch": 2804} {"train_loss": -6.446535587310791, "global_step": 117797, "epoch": 2804} {"train_loss": -6.617762565612793, "global_step": 117798, "epoch": 2804} {"train_loss": -6.422224998474121, "global_step": 117799, "epoch": 2804} {"train_loss": -6.558996200561523, "global_step": 117800, "epoch": 2804} {"train_loss": -6.609492778778076, "global_step": 117801, "epoch": 2804} {"train_loss": -6.578590393066406, "global_step": 117802, "epoch": 2804} {"train_loss": -6.573616027832031, "global_step": 117803, "epoch": 2804} {"train_loss": -6.423384666442871, "global_step": 117804, "epoch": 2804} {"train_loss": -6.519872665405273, "global_step": 117805, "epoch": 2804} {"train_loss": -6.590185642242432, "global_step": 117806, "epoch": 2804} {"train_loss": -6.568720817565918, "global_step": 117807, "epoch": 2804} {"train_loss": -6.609512805938721, "global_step": 117808, "epoch": 2804} {"train_loss": -6.53875055767241, "global_step": 117809, "epoch": 2804, "val_loss": 67908.03125} {"train_loss": -6.559553146362305, "global_step": 117810, "epoch": 2805} {"train_loss": -6.447297096252441, "global_step": 117811, "epoch": 2805} {"train_loss": -6.665799140930176, "global_step": 117812, "epoch": 2805} {"train_loss": -6.544156074523926, "global_step": 117813, "epoch": 2805} {"train_loss": -6.505853176116943, "global_step": 117814, "epoch": 2805} {"train_loss": -6.525043964385986, "global_step": 117815, "epoch": 2805} {"train_loss": -6.504367828369141, "global_step": 117816, "epoch": 2805} {"train_loss": -6.542280197143555, "global_step": 117817, "epoch": 2805} {"train_loss": -6.550910472869873, "global_step": 117818, "epoch": 2805} {"train_loss": -6.568498611450195, "global_step": 117819, "epoch": 2805} {"train_loss": -6.500539779663086, "global_step": 117820, "epoch": 2805} {"train_loss": -6.482293128967285, "global_step": 117821, "epoch": 2805} {"train_loss": -6.6394805908203125, "global_step": 117822, "epoch": 2805} {"train_loss": -6.422882080078125, "global_step": 117823, "epoch": 2805} {"train_loss": -6.550073623657227, "global_step": 117824, "epoch": 2805} {"train_loss": -6.539297103881836, "global_step": 117825, "epoch": 2805} {"train_loss": -6.4876580238342285, "global_step": 117826, "epoch": 2805} {"train_loss": -6.665207862854004, "global_step": 117827, "epoch": 2805} {"train_loss": -6.608638286590576, "global_step": 117828, "epoch": 2805} {"train_loss": -6.553513526916504, "global_step": 117829, "epoch": 2805} {"train_loss": -6.617697715759277, "global_step": 117830, "epoch": 2805} {"train_loss": -6.58689022064209, "global_step": 117831, "epoch": 2805} {"train_loss": -6.618062973022461, "global_step": 117832, "epoch": 2805} {"train_loss": -6.394796848297119, "global_step": 117833, "epoch": 2805} {"train_loss": -6.526979446411133, "global_step": 117834, "epoch": 2805} {"train_loss": -6.571163177490234, "global_step": 117835, "epoch": 2805} {"train_loss": -6.458805084228516, "global_step": 117836, "epoch": 2805} {"train_loss": -6.474109649658203, "global_step": 117837, "epoch": 2805} {"train_loss": -6.539724826812744, "global_step": 117838, "epoch": 2805} {"train_loss": -6.50999641418457, "global_step": 117839, "epoch": 2805} {"train_loss": -6.561777591705322, "global_step": 117840, "epoch": 2805} {"train_loss": -6.523894786834717, "global_step": 117841, "epoch": 2805} {"train_loss": -6.527392387390137, "global_step": 117842, "epoch": 2805} {"train_loss": -6.442227363586426, "global_step": 117843, "epoch": 2805} {"train_loss": -6.581296920776367, "global_step": 117844, "epoch": 2805} {"train_loss": -6.477341175079346, "global_step": 117845, "epoch": 2805} {"train_loss": -6.554966926574707, "global_step": 117846, "epoch": 2805} {"train_loss": -6.53327751159668, "global_step": 117847, "epoch": 2805} {"train_loss": -6.516322135925293, "global_step": 117848, "epoch": 2805} {"train_loss": -6.52483606338501, "global_step": 117849, "epoch": 2805} {"train_loss": -6.4803242683410645, "global_step": 117850, "epoch": 2805} {"train_loss": -6.532361234937396, "global_step": 117851, "epoch": 2805, "val_loss": 67963.4296875} {"train_loss": -6.470547676086426, "global_step": 117852, "epoch": 2806} {"train_loss": -6.353140830993652, "global_step": 117853, "epoch": 2806} {"train_loss": -6.49177360534668, "global_step": 117854, "epoch": 2806} {"train_loss": -6.3882904052734375, "global_step": 117855, "epoch": 2806} {"train_loss": -6.385503768920898, "global_step": 117856, "epoch": 2806} {"train_loss": -6.469127655029297, "global_step": 117857, "epoch": 2806} {"train_loss": -6.4728264808654785, "global_step": 117858, "epoch": 2806} {"train_loss": -6.492148399353027, "global_step": 117859, "epoch": 2806} {"train_loss": -6.468658447265625, "global_step": 117860, "epoch": 2806} {"train_loss": -6.3918304443359375, "global_step": 117861, "epoch": 2806} {"train_loss": -6.558477401733398, "global_step": 117862, "epoch": 2806} {"train_loss": -6.608739852905273, "global_step": 117863, "epoch": 2806} {"train_loss": -6.474839210510254, "global_step": 117864, "epoch": 2806} {"train_loss": -6.605320930480957, "global_step": 117865, "epoch": 2806} {"train_loss": -6.456674098968506, "global_step": 117866, "epoch": 2806} {"train_loss": -6.55453634262085, "global_step": 117867, "epoch": 2806} {"train_loss": -6.52731466293335, "global_step": 117868, "epoch": 2806} {"train_loss": -6.550762176513672, "global_step": 117869, "epoch": 2806} {"train_loss": -6.570267677307129, "global_step": 117870, "epoch": 2806} {"train_loss": -6.532874584197998, "global_step": 117871, "epoch": 2806} {"train_loss": -6.537266731262207, "global_step": 117872, "epoch": 2806} {"train_loss": -6.651331901550293, "global_step": 117873, "epoch": 2806} {"train_loss": -6.532806396484375, "global_step": 117874, "epoch": 2806} {"train_loss": -6.539557933807373, "global_step": 117875, "epoch": 2806} {"train_loss": -6.562655925750732, "global_step": 117876, "epoch": 2806} {"train_loss": -6.537445068359375, "global_step": 117877, "epoch": 2806} {"train_loss": -6.612884044647217, "global_step": 117878, "epoch": 2806} {"train_loss": -6.5632643699646, "global_step": 117879, "epoch": 2806} {"train_loss": -6.5665388107299805, "global_step": 117880, "epoch": 2806} {"train_loss": -6.465550422668457, "global_step": 117881, "epoch": 2806} {"train_loss": -6.537835597991943, "global_step": 117882, "epoch": 2806} {"train_loss": -6.531813621520996, "global_step": 117883, "epoch": 2806} {"train_loss": -6.4441728591918945, "global_step": 117884, "epoch": 2806} {"train_loss": -6.532905101776123, "global_step": 117885, "epoch": 2806} {"train_loss": -6.507394790649414, "global_step": 117886, "epoch": 2806} {"train_loss": -6.529321670532227, "global_step": 117887, "epoch": 2806} {"train_loss": -6.508708477020264, "global_step": 117888, "epoch": 2806} {"train_loss": -6.535404205322266, "global_step": 117889, "epoch": 2806} {"train_loss": -6.5605950355529785, "global_step": 117890, "epoch": 2806} {"train_loss": -6.604672431945801, "global_step": 117891, "epoch": 2806} {"train_loss": -6.53358268737793, "global_step": 117892, "epoch": 2806} {"train_loss": -6.518169391722906, "global_step": 117893, "epoch": 2806, "val_loss": 67879.546875} {"train_loss": -6.523320198059082, "global_step": 117894, "epoch": 2807} {"train_loss": -6.531447410583496, "global_step": 117895, "epoch": 2807} {"train_loss": -6.6259613037109375, "global_step": 117896, "epoch": 2807} {"train_loss": -6.589351177215576, "global_step": 117897, "epoch": 2807} {"train_loss": -6.42169189453125, "global_step": 117898, "epoch": 2807} {"train_loss": -6.44127893447876, "global_step": 117899, "epoch": 2807} {"train_loss": -6.482349395751953, "global_step": 117900, "epoch": 2807} {"train_loss": -6.56427001953125, "global_step": 117901, "epoch": 2807} {"train_loss": -6.493269920349121, "global_step": 117902, "epoch": 2807} {"train_loss": -6.618417739868164, "global_step": 117903, "epoch": 2807} {"train_loss": -6.444643974304199, "global_step": 117904, "epoch": 2807} {"train_loss": -6.555681228637695, "global_step": 117905, "epoch": 2807} {"train_loss": -6.484103679656982, "global_step": 117906, "epoch": 2807} {"train_loss": -6.457603454589844, "global_step": 117907, "epoch": 2807} {"train_loss": -6.487638473510742, "global_step": 117908, "epoch": 2807} {"train_loss": -6.445869445800781, "global_step": 117909, "epoch": 2807} {"train_loss": -6.479091167449951, "global_step": 117910, "epoch": 2807} {"train_loss": -6.615212440490723, "global_step": 117911, "epoch": 2807} {"train_loss": -6.473382949829102, "global_step": 117912, "epoch": 2807} {"train_loss": -6.532680511474609, "global_step": 117913, "epoch": 2807} {"train_loss": -6.523617267608643, "global_step": 117914, "epoch": 2807} {"train_loss": -6.357239723205566, "global_step": 117915, "epoch": 2807} {"train_loss": -6.603788375854492, "global_step": 117916, "epoch": 2807} {"train_loss": -6.436415672302246, "global_step": 117917, "epoch": 2807} {"train_loss": -6.469293594360352, "global_step": 117918, "epoch": 2807} {"train_loss": -6.461362838745117, "global_step": 117919, "epoch": 2807} {"train_loss": -6.395841598510742, "global_step": 117920, "epoch": 2807} {"train_loss": -6.492595672607422, "global_step": 117921, "epoch": 2807} {"train_loss": -6.415327072143555, "global_step": 117922, "epoch": 2807} {"train_loss": -6.4033660888671875, "global_step": 117923, "epoch": 2807} {"train_loss": -6.394950866699219, "global_step": 117924, "epoch": 2807} {"train_loss": -6.451765537261963, "global_step": 117925, "epoch": 2807} {"train_loss": -6.637594699859619, "global_step": 117926, "epoch": 2807} {"train_loss": -6.471376419067383, "global_step": 117927, "epoch": 2807} {"train_loss": -6.38198184967041, "global_step": 117928, "epoch": 2807} {"train_loss": -6.503013610839844, "global_step": 117929, "epoch": 2807} {"train_loss": -6.466585159301758, "global_step": 117930, "epoch": 2807} {"train_loss": -6.429730415344238, "global_step": 117931, "epoch": 2807} {"train_loss": -6.53334379196167, "global_step": 117932, "epoch": 2807} {"train_loss": -6.503421783447266, "global_step": 117933, "epoch": 2807} {"train_loss": -6.409584999084473, "global_step": 117934, "epoch": 2807} {"train_loss": -6.490528992244175, "global_step": 117935, "epoch": 2807, "val_loss": 67952.8515625} {"train_loss": -6.489758014678955, "global_step": 117936, "epoch": 2808} {"train_loss": -6.562215805053711, "global_step": 117937, "epoch": 2808} {"train_loss": -6.618679523468018, "global_step": 117938, "epoch": 2808} {"train_loss": -6.624617576599121, "global_step": 117939, "epoch": 2808} {"train_loss": -6.548442840576172, "global_step": 117940, "epoch": 2808} {"train_loss": -6.4182281494140625, "global_step": 117941, "epoch": 2808} {"train_loss": -6.520820617675781, "global_step": 117942, "epoch": 2808} {"train_loss": -6.601022720336914, "global_step": 117943, "epoch": 2808} {"train_loss": -6.518668174743652, "global_step": 117944, "epoch": 2808} {"train_loss": -6.388130187988281, "global_step": 117945, "epoch": 2808} {"train_loss": -6.435828685760498, "global_step": 117946, "epoch": 2808} {"train_loss": -6.620807647705078, "global_step": 117947, "epoch": 2808} {"train_loss": -6.5193986892700195, "global_step": 117948, "epoch": 2808} {"train_loss": -6.504408836364746, "global_step": 117949, "epoch": 2808} {"train_loss": -6.509897232055664, "global_step": 117950, "epoch": 2808} {"train_loss": -6.688264846801758, "global_step": 117951, "epoch": 2808} {"train_loss": -6.5712432861328125, "global_step": 117952, "epoch": 2808} {"train_loss": -6.503582000732422, "global_step": 117953, "epoch": 2808} {"train_loss": -6.4231085777282715, "global_step": 117954, "epoch": 2808} {"train_loss": -6.647042274475098, "global_step": 117955, "epoch": 2808} {"train_loss": -6.504264831542969, "global_step": 117956, "epoch": 2808} {"train_loss": -6.4042816162109375, "global_step": 117957, "epoch": 2808} {"train_loss": -6.573060989379883, "global_step": 117958, "epoch": 2808} {"train_loss": -6.5470075607299805, "global_step": 117959, "epoch": 2808} {"train_loss": -6.6315412521362305, "global_step": 117960, "epoch": 2808} {"train_loss": -6.5475616455078125, "global_step": 117961, "epoch": 2808} {"train_loss": -6.57869815826416, "global_step": 117962, "epoch": 2808} {"train_loss": -6.500593185424805, "global_step": 117963, "epoch": 2808} {"train_loss": -6.400638580322266, "global_step": 117964, "epoch": 2808} {"train_loss": -6.550938606262207, "global_step": 117965, "epoch": 2808} {"train_loss": -6.605568885803223, "global_step": 117966, "epoch": 2808} {"train_loss": -6.609427452087402, "global_step": 117967, "epoch": 2808} {"train_loss": -6.609512805938721, "global_step": 117968, "epoch": 2808} {"train_loss": -6.543903350830078, "global_step": 117969, "epoch": 2808} {"train_loss": -6.487283706665039, "global_step": 117970, "epoch": 2808} {"train_loss": -6.551708221435547, "global_step": 117971, "epoch": 2808} {"train_loss": -6.4366044998168945, "global_step": 117972, "epoch": 2808} {"train_loss": -6.550445079803467, "global_step": 117973, "epoch": 2808} {"train_loss": -6.667621612548828, "global_step": 117974, "epoch": 2808} {"train_loss": -6.443453788757324, "global_step": 117975, "epoch": 2808} {"train_loss": -6.534773826599121, "global_step": 117976, "epoch": 2808} {"train_loss": -6.538011539550054, "global_step": 117977, "epoch": 2808, "val_loss": 68029.5078125} {"train_loss": -6.442577362060547, "global_step": 117978, "epoch": 2809} {"train_loss": -6.61012077331543, "global_step": 117979, "epoch": 2809} {"train_loss": -6.564558982849121, "global_step": 117980, "epoch": 2809} {"train_loss": -6.588695526123047, "global_step": 117981, "epoch": 2809} {"train_loss": -6.612180709838867, "global_step": 117982, "epoch": 2809} {"train_loss": -6.447270393371582, "global_step": 117983, "epoch": 2809} {"train_loss": -6.543936729431152, "global_step": 117984, "epoch": 2809} {"train_loss": -6.5820794105529785, "global_step": 117985, "epoch": 2809} {"train_loss": -6.5239996910095215, "global_step": 117986, "epoch": 2809} {"train_loss": -6.538832664489746, "global_step": 117987, "epoch": 2809} {"train_loss": -6.493951797485352, "global_step": 117988, "epoch": 2809} {"train_loss": -6.523736000061035, "global_step": 117989, "epoch": 2809} {"train_loss": -6.512908935546875, "global_step": 117990, "epoch": 2809} {"train_loss": -6.550699710845947, "global_step": 117991, "epoch": 2809} {"train_loss": -6.597481727600098, "global_step": 117992, "epoch": 2809} {"train_loss": -6.4638447761535645, "global_step": 117993, "epoch": 2809} {"train_loss": -6.5089898109436035, "global_step": 117994, "epoch": 2809} {"train_loss": -6.364728927612305, "global_step": 117995, "epoch": 2809} {"train_loss": -6.326532363891602, "global_step": 117996, "epoch": 2809} {"train_loss": -6.449607849121094, "global_step": 117997, "epoch": 2809} {"train_loss": -6.5119476318359375, "global_step": 117998, "epoch": 2809} {"train_loss": -6.37376594543457, "global_step": 117999, "epoch": 2809} {"train_loss": -6.444430351257324, "global_step": 118000, "epoch": 2809} {"train_loss": -6.398584842681885, "global_step": 118001, "epoch": 2809} {"train_loss": -6.437108993530273, "global_step": 118002, "epoch": 2809} {"train_loss": -6.487261772155762, "global_step": 118003, "epoch": 2809} {"train_loss": -6.349019527435303, "global_step": 118004, "epoch": 2809} {"train_loss": -6.375731945037842, "global_step": 118005, "epoch": 2809} {"train_loss": -6.407392501831055, "global_step": 118006, "epoch": 2809} {"train_loss": -6.376120567321777, "global_step": 118007, "epoch": 2809} {"train_loss": -6.511930465698242, "global_step": 118008, "epoch": 2809} {"train_loss": -6.476673603057861, "global_step": 118009, "epoch": 2809} {"train_loss": -6.515241622924805, "global_step": 118010, "epoch": 2809} {"train_loss": -6.540318965911865, "global_step": 118011, "epoch": 2809} {"train_loss": -6.355647087097168, "global_step": 118012, "epoch": 2809} {"train_loss": -6.547914028167725, "global_step": 118013, "epoch": 2809} {"train_loss": -6.457231521606445, "global_step": 118014, "epoch": 2809} {"train_loss": -6.502226829528809, "global_step": 118015, "epoch": 2809} {"train_loss": -6.595710754394531, "global_step": 118016, "epoch": 2809} {"train_loss": -6.590065002441406, "global_step": 118017, "epoch": 2809} {"train_loss": -6.465452194213867, "global_step": 118018, "epoch": 2809} {"train_loss": -6.490267435709636, "global_step": 118019, "epoch": 2809, "val_loss": 67785.15625} {"train_loss": -6.532644271850586, "global_step": 118020, "epoch": 2810} {"train_loss": -6.367142677307129, "global_step": 118021, "epoch": 2810} {"train_loss": -6.539275646209717, "global_step": 118022, "epoch": 2810} {"train_loss": -6.348752021789551, "global_step": 118023, "epoch": 2810} {"train_loss": -6.454407691955566, "global_step": 118024, "epoch": 2810} {"train_loss": -6.508180618286133, "global_step": 118025, "epoch": 2810} {"train_loss": -6.430266380310059, "global_step": 118026, "epoch": 2810} {"train_loss": -6.514408111572266, "global_step": 118027, "epoch": 2810} {"train_loss": -6.465256690979004, "global_step": 118028, "epoch": 2810} {"train_loss": -6.471042633056641, "global_step": 118029, "epoch": 2810} {"train_loss": -6.52979850769043, "global_step": 118030, "epoch": 2810} {"train_loss": -6.5464043617248535, "global_step": 118031, "epoch": 2810} {"train_loss": -6.548511505126953, "global_step": 118032, "epoch": 2810} {"train_loss": -6.584193706512451, "global_step": 118033, "epoch": 2810} {"train_loss": -6.556997299194336, "global_step": 118034, "epoch": 2810} {"train_loss": -6.445650100708008, "global_step": 118035, "epoch": 2810} {"train_loss": -6.5518999099731445, "global_step": 118036, "epoch": 2810} {"train_loss": -6.517529010772705, "global_step": 118037, "epoch": 2810} {"train_loss": -6.455045700073242, "global_step": 118038, "epoch": 2810} {"train_loss": -6.543092727661133, "global_step": 118039, "epoch": 2810} {"train_loss": -6.520567893981934, "global_step": 118040, "epoch": 2810} {"train_loss": -6.54921817779541, "global_step": 118041, "epoch": 2810} {"train_loss": -6.626596450805664, "global_step": 118042, "epoch": 2810} {"train_loss": -6.454030990600586, "global_step": 118043, "epoch": 2810} {"train_loss": -6.532301902770996, "global_step": 118044, "epoch": 2810} {"train_loss": -6.466280937194824, "global_step": 118045, "epoch": 2810} {"train_loss": -6.604394912719727, "global_step": 118046, "epoch": 2810} {"train_loss": -6.585812568664551, "global_step": 118047, "epoch": 2810} {"train_loss": -6.44123649597168, "global_step": 118048, "epoch": 2810} {"train_loss": -6.5162506103515625, "global_step": 118049, "epoch": 2810} {"train_loss": -6.500983238220215, "global_step": 118050, "epoch": 2810} {"train_loss": -6.563296318054199, "global_step": 118051, "epoch": 2810} {"train_loss": -6.548313140869141, "global_step": 118052, "epoch": 2810} {"train_loss": -6.477714538574219, "global_step": 118053, "epoch": 2810} {"train_loss": -6.494503974914551, "global_step": 118054, "epoch": 2810} {"train_loss": -6.512447357177734, "global_step": 118055, "epoch": 2810} {"train_loss": -6.473723411560059, "global_step": 118056, "epoch": 2810} {"train_loss": -6.586732864379883, "global_step": 118057, "epoch": 2810} {"train_loss": -6.519904136657715, "global_step": 118058, "epoch": 2810} {"train_loss": -6.454652309417725, "global_step": 118059, "epoch": 2810} {"train_loss": -6.570219993591309, "global_step": 118060, "epoch": 2810} {"train_loss": -6.512520721980503, "global_step": 118061, "epoch": 2810, "val_loss": 67893.3046875} {"train_loss": -6.5661420822143555, "global_step": 118062, "epoch": 2811} {"train_loss": -6.566924571990967, "global_step": 118063, "epoch": 2811} {"train_loss": -6.530030727386475, "global_step": 118064, "epoch": 2811} {"train_loss": -6.663486480712891, "global_step": 118065, "epoch": 2811} {"train_loss": -6.53773307800293, "global_step": 118066, "epoch": 2811} {"train_loss": -6.5959014892578125, "global_step": 118067, "epoch": 2811} {"train_loss": -6.6068034172058105, "global_step": 118068, "epoch": 2811} {"train_loss": -6.549569129943848, "global_step": 118069, "epoch": 2811} {"train_loss": -6.52579402923584, "global_step": 118070, "epoch": 2811} {"train_loss": -6.543625831604004, "global_step": 118071, "epoch": 2811} {"train_loss": -6.549211502075195, "global_step": 118072, "epoch": 2811} {"train_loss": -6.476992607116699, "global_step": 118073, "epoch": 2811} {"train_loss": -6.525703430175781, "global_step": 118074, "epoch": 2811} {"train_loss": -6.631301403045654, "global_step": 118075, "epoch": 2811} {"train_loss": -6.5595808029174805, "global_step": 118076, "epoch": 2811} {"train_loss": -6.4321746826171875, "global_step": 118077, "epoch": 2811} {"train_loss": -6.604168891906738, "global_step": 118078, "epoch": 2811} {"train_loss": -6.642269134521484, "global_step": 118079, "epoch": 2811} {"train_loss": -6.53663969039917, "global_step": 118080, "epoch": 2811} {"train_loss": -6.355718612670898, "global_step": 118081, "epoch": 2811} {"train_loss": -6.501855850219727, "global_step": 118082, "epoch": 2811} {"train_loss": -6.325040817260742, "global_step": 118083, "epoch": 2811} {"train_loss": -6.443242073059082, "global_step": 118084, "epoch": 2811} {"train_loss": -6.48757266998291, "global_step": 118085, "epoch": 2811} {"train_loss": -6.430510997772217, "global_step": 118086, "epoch": 2811} {"train_loss": -6.49360466003418, "global_step": 118087, "epoch": 2811} {"train_loss": -6.456783294677734, "global_step": 118088, "epoch": 2811} {"train_loss": -6.5788421630859375, "global_step": 118089, "epoch": 2811} {"train_loss": -6.424760341644287, "global_step": 118090, "epoch": 2811} {"train_loss": -6.473203659057617, "global_step": 118091, "epoch": 2811} {"train_loss": -6.463523864746094, "global_step": 118092, "epoch": 2811} {"train_loss": -6.465490341186523, "global_step": 118093, "epoch": 2811} {"train_loss": -6.515514373779297, "global_step": 118094, "epoch": 2811} {"train_loss": -6.6719160079956055, "global_step": 118095, "epoch": 2811} {"train_loss": -6.555830001831055, "global_step": 118096, "epoch": 2811} {"train_loss": -6.405692100524902, "global_step": 118097, "epoch": 2811} {"train_loss": -6.509664535522461, "global_step": 118098, "epoch": 2811} {"train_loss": -6.629271984100342, "global_step": 118099, "epoch": 2811} {"train_loss": -6.577667713165283, "global_step": 118100, "epoch": 2811} {"train_loss": -6.526955604553223, "global_step": 118101, "epoch": 2811} {"train_loss": -6.474189758300781, "global_step": 118102, "epoch": 2811} {"train_loss": -6.521965140388126, "global_step": 118103, "epoch": 2811, "val_loss": 67963.1640625} {"train_loss": -6.551633834838867, "global_step": 118104, "epoch": 2812} {"train_loss": -6.539009094238281, "global_step": 118105, "epoch": 2812} {"train_loss": -6.5780510902404785, "global_step": 118106, "epoch": 2812} {"train_loss": -6.53490686416626, "global_step": 118107, "epoch": 2812} {"train_loss": -6.570805549621582, "global_step": 118108, "epoch": 2812} {"train_loss": -6.463008880615234, "global_step": 118109, "epoch": 2812} {"train_loss": -6.456381797790527, "global_step": 118110, "epoch": 2812} {"train_loss": -6.4867844581604, "global_step": 118111, "epoch": 2812} {"train_loss": -6.483181953430176, "global_step": 118112, "epoch": 2812} {"train_loss": -6.579074859619141, "global_step": 118113, "epoch": 2812} {"train_loss": -6.456784725189209, "global_step": 118114, "epoch": 2812} {"train_loss": -6.575675964355469, "global_step": 118115, "epoch": 2812} {"train_loss": -6.607812881469727, "global_step": 118116, "epoch": 2812} {"train_loss": -6.459198951721191, "global_step": 118117, "epoch": 2812} {"train_loss": -6.444995880126953, "global_step": 118118, "epoch": 2812} {"train_loss": -6.392409324645996, "global_step": 118119, "epoch": 2812} {"train_loss": -6.573214054107666, "global_step": 118120, "epoch": 2812} {"train_loss": -6.483979225158691, "global_step": 118121, "epoch": 2812} {"train_loss": -6.3770246505737305, "global_step": 118122, "epoch": 2812} {"train_loss": -6.466296195983887, "global_step": 118123, "epoch": 2812} {"train_loss": -6.617368698120117, "global_step": 118124, "epoch": 2812} {"train_loss": -6.472705841064453, "global_step": 118125, "epoch": 2812} {"train_loss": -6.457634925842285, "global_step": 118126, "epoch": 2812} {"train_loss": -6.552230358123779, "global_step": 118127, "epoch": 2812} {"train_loss": -6.477794647216797, "global_step": 118128, "epoch": 2812} {"train_loss": -6.433337688446045, "global_step": 118129, "epoch": 2812} {"train_loss": -6.467586517333984, "global_step": 118130, "epoch": 2812} {"train_loss": -6.40023136138916, "global_step": 118131, "epoch": 2812} {"train_loss": -6.449210166931152, "global_step": 118132, "epoch": 2812} {"train_loss": -6.49818754196167, "global_step": 118133, "epoch": 2812} {"train_loss": -6.48874568939209, "global_step": 118134, "epoch": 2812} {"train_loss": -6.51888370513916, "global_step": 118135, "epoch": 2812} {"train_loss": -6.452495574951172, "global_step": 118136, "epoch": 2812} {"train_loss": -6.573219299316406, "global_step": 118137, "epoch": 2812} {"train_loss": -6.5210957527160645, "global_step": 118138, "epoch": 2812} {"train_loss": -6.518502235412598, "global_step": 118139, "epoch": 2812} {"train_loss": -6.473852157592773, "global_step": 118140, "epoch": 2812} {"train_loss": -6.490089416503906, "global_step": 118141, "epoch": 2812} {"train_loss": -6.548023223876953, "global_step": 118142, "epoch": 2812} {"train_loss": -6.539990425109863, "global_step": 118143, "epoch": 2812} {"train_loss": -6.46889591217041, "global_step": 118144, "epoch": 2812} {"train_loss": -6.4992764223189585, "global_step": 118145, "epoch": 2812, "val_loss": 67811.7578125} {"train_loss": -6.4603424072265625, "global_step": 118146, "epoch": 2813} {"train_loss": -6.431662082672119, "global_step": 118147, "epoch": 2813} {"train_loss": -6.6569037437438965, "global_step": 118148, "epoch": 2813} {"train_loss": -6.525073051452637, "global_step": 118149, "epoch": 2813} {"train_loss": -6.4291605949401855, "global_step": 118150, "epoch": 2813} {"train_loss": -6.605963706970215, "global_step": 118151, "epoch": 2813} {"train_loss": -6.456754207611084, "global_step": 118152, "epoch": 2813} {"train_loss": -6.492125988006592, "global_step": 118153, "epoch": 2813} {"train_loss": -6.647685527801514, "global_step": 118154, "epoch": 2813} {"train_loss": -6.448058128356934, "global_step": 118155, "epoch": 2813} {"train_loss": -6.504746437072754, "global_step": 118156, "epoch": 2813} {"train_loss": -6.458984375, "global_step": 118157, "epoch": 2813} {"train_loss": -6.407675743103027, "global_step": 118158, "epoch": 2813} {"train_loss": -6.587893486022949, "global_step": 118159, "epoch": 2813} {"train_loss": -6.432146072387695, "global_step": 118160, "epoch": 2813} {"train_loss": -6.356508731842041, "global_step": 118161, "epoch": 2813} {"train_loss": -6.479372501373291, "global_step": 118162, "epoch": 2813} {"train_loss": -6.397521495819092, "global_step": 118163, "epoch": 2813} {"train_loss": -6.520155906677246, "global_step": 118164, "epoch": 2813} {"train_loss": -6.485400676727295, "global_step": 118165, "epoch": 2813} {"train_loss": -6.497203350067139, "global_step": 118166, "epoch": 2813} {"train_loss": -6.43734073638916, "global_step": 118167, "epoch": 2813} {"train_loss": -6.444340705871582, "global_step": 118168, "epoch": 2813} {"train_loss": -6.50441837310791, "global_step": 118169, "epoch": 2813} {"train_loss": -6.46988582611084, "global_step": 118170, "epoch": 2813} {"train_loss": -6.548062324523926, "global_step": 118171, "epoch": 2813} {"train_loss": -6.482732772827148, "global_step": 118172, "epoch": 2813} {"train_loss": -6.406810283660889, "global_step": 118173, "epoch": 2813} {"train_loss": -6.530534267425537, "global_step": 118174, "epoch": 2813} {"train_loss": -6.515376091003418, "global_step": 118175, "epoch": 2813} {"train_loss": -6.491487503051758, "global_step": 118176, "epoch": 2813} {"train_loss": -6.488658905029297, "global_step": 118177, "epoch": 2813} {"train_loss": -6.602065086364746, "global_step": 118178, "epoch": 2813} {"train_loss": -6.635334014892578, "global_step": 118179, "epoch": 2813} {"train_loss": -6.567890167236328, "global_step": 118180, "epoch": 2813} {"train_loss": -6.3993659019470215, "global_step": 118181, "epoch": 2813} {"train_loss": -6.63223123550415, "global_step": 118182, "epoch": 2813} {"train_loss": -6.646808624267578, "global_step": 118183, "epoch": 2813} {"train_loss": -6.541218280792236, "global_step": 118184, "epoch": 2813} {"train_loss": -6.562716484069824, "global_step": 118185, "epoch": 2813} {"train_loss": -6.550681114196777, "global_step": 118186, "epoch": 2813} {"train_loss": -6.50986925760905, "global_step": 118187, "epoch": 2813, "val_loss": 67832.375} {"train_loss": -6.5350236892700195, "global_step": 118188, "epoch": 2814} {"train_loss": -6.560937881469727, "global_step": 118189, "epoch": 2814} {"train_loss": -6.576942443847656, "global_step": 118190, "epoch": 2814} {"train_loss": -6.5484514236450195, "global_step": 118191, "epoch": 2814} {"train_loss": -6.54218864440918, "global_step": 118192, "epoch": 2814} {"train_loss": -6.5014214515686035, "global_step": 118193, "epoch": 2814} {"train_loss": -6.543543815612793, "global_step": 118194, "epoch": 2814} {"train_loss": -6.551709175109863, "global_step": 118195, "epoch": 2814} {"train_loss": -6.532975673675537, "global_step": 118196, "epoch": 2814} {"train_loss": -6.423237323760986, "global_step": 118197, "epoch": 2814} {"train_loss": -6.458637714385986, "global_step": 118198, "epoch": 2814} {"train_loss": -6.594455718994141, "global_step": 118199, "epoch": 2814} {"train_loss": -6.478050231933594, "global_step": 118200, "epoch": 2814} {"train_loss": -6.57710599899292, "global_step": 118201, "epoch": 2814} {"train_loss": -6.538975715637207, "global_step": 118202, "epoch": 2814} {"train_loss": -6.41810941696167, "global_step": 118203, "epoch": 2814} {"train_loss": -6.544076919555664, "global_step": 118204, "epoch": 2814} {"train_loss": -6.448918342590332, "global_step": 118205, "epoch": 2814} {"train_loss": -6.468624114990234, "global_step": 118206, "epoch": 2814} {"train_loss": -6.563401222229004, "global_step": 118207, "epoch": 2814} {"train_loss": -6.483852386474609, "global_step": 118208, "epoch": 2814} {"train_loss": -6.531783103942871, "global_step": 118209, "epoch": 2814} {"train_loss": -6.5238237380981445, "global_step": 118210, "epoch": 2814} {"train_loss": -6.378286361694336, "global_step": 118211, "epoch": 2814} {"train_loss": -6.491981506347656, "global_step": 118212, "epoch": 2814} {"train_loss": -6.442169189453125, "global_step": 118213, "epoch": 2814} {"train_loss": -6.498905181884766, "global_step": 118214, "epoch": 2814} {"train_loss": -6.540143966674805, "global_step": 118215, "epoch": 2814} {"train_loss": -6.408374786376953, "global_step": 118216, "epoch": 2814} {"train_loss": -6.452732563018799, "global_step": 118217, "epoch": 2814} {"train_loss": -6.564311504364014, "global_step": 118218, "epoch": 2814} {"train_loss": -6.438952445983887, "global_step": 118219, "epoch": 2814} {"train_loss": -6.556815147399902, "global_step": 118220, "epoch": 2814} {"train_loss": -6.479787349700928, "global_step": 118221, "epoch": 2814} {"train_loss": -6.436758518218994, "global_step": 118222, "epoch": 2814} {"train_loss": -6.472963333129883, "global_step": 118223, "epoch": 2814} {"train_loss": -6.567258834838867, "global_step": 118224, "epoch": 2814} {"train_loss": -6.549297332763672, "global_step": 118225, "epoch": 2814} {"train_loss": -6.447231769561768, "global_step": 118226, "epoch": 2814} {"train_loss": -6.488797187805176, "global_step": 118227, "epoch": 2814} {"train_loss": -6.604833602905273, "global_step": 118228, "epoch": 2814} {"train_loss": -6.504837263198126, "global_step": 118229, "epoch": 2814, "val_loss": 68025.8359375} {"train_loss": -6.528748512268066, "global_step": 118230, "epoch": 2815} {"train_loss": -6.559936046600342, "global_step": 118231, "epoch": 2815} {"train_loss": -6.466094017028809, "global_step": 118232, "epoch": 2815} {"train_loss": -6.442917823791504, "global_step": 118233, "epoch": 2815} {"train_loss": -6.502651214599609, "global_step": 118234, "epoch": 2815} {"train_loss": -6.559332847595215, "global_step": 118235, "epoch": 2815} {"train_loss": -6.562387466430664, "global_step": 118236, "epoch": 2815} {"train_loss": -6.506625175476074, "global_step": 118237, "epoch": 2815} {"train_loss": -6.545866012573242, "global_step": 118238, "epoch": 2815} {"train_loss": -6.595667839050293, "global_step": 118239, "epoch": 2815} {"train_loss": -6.420133590698242, "global_step": 118240, "epoch": 2815} {"train_loss": -6.563802719116211, "global_step": 118241, "epoch": 2815} {"train_loss": -6.604944229125977, "global_step": 118242, "epoch": 2815} {"train_loss": -6.5244646072387695, "global_step": 118243, "epoch": 2815} {"train_loss": -6.532341003417969, "global_step": 118244, "epoch": 2815} {"train_loss": -6.609192848205566, "global_step": 118245, "epoch": 2815} {"train_loss": -6.533393383026123, "global_step": 118246, "epoch": 2815} {"train_loss": -6.453603267669678, "global_step": 118247, "epoch": 2815} {"train_loss": -6.441360950469971, "global_step": 118248, "epoch": 2815} {"train_loss": -6.579739570617676, "global_step": 118249, "epoch": 2815} {"train_loss": -6.565053939819336, "global_step": 118250, "epoch": 2815} {"train_loss": -6.548275947570801, "global_step": 118251, "epoch": 2815} {"train_loss": -6.668726444244385, "global_step": 118252, "epoch": 2815} {"train_loss": -6.539411544799805, "global_step": 118253, "epoch": 2815} {"train_loss": -6.651119232177734, "global_step": 118254, "epoch": 2815} {"train_loss": -6.479912757873535, "global_step": 118255, "epoch": 2815} {"train_loss": -6.579452037811279, "global_step": 118256, "epoch": 2815} {"train_loss": -6.50930118560791, "global_step": 118257, "epoch": 2815} {"train_loss": -6.398739814758301, "global_step": 118258, "epoch": 2815} {"train_loss": -6.591477870941162, "global_step": 118259, "epoch": 2815} {"train_loss": -6.613784313201904, "global_step": 118260, "epoch": 2815} {"train_loss": -6.41139030456543, "global_step": 118261, "epoch": 2815} {"train_loss": -6.531344890594482, "global_step": 118262, "epoch": 2815} {"train_loss": -6.554476737976074, "global_step": 118263, "epoch": 2815} {"train_loss": -6.5407915115356445, "global_step": 118264, "epoch": 2815} {"train_loss": -6.616985321044922, "global_step": 118265, "epoch": 2815} {"train_loss": -6.521956443786621, "global_step": 118266, "epoch": 2815} {"train_loss": -6.473034381866455, "global_step": 118267, "epoch": 2815} {"train_loss": -6.61332893371582, "global_step": 118268, "epoch": 2815} {"train_loss": -6.504131317138672, "global_step": 118269, "epoch": 2815} {"train_loss": -6.482588768005371, "global_step": 118270, "epoch": 2815} {"train_loss": -6.536018314815703, "global_step": 118271, "epoch": 2815, "val_loss": 67784.4453125} {"train_loss": -6.528353691101074, "global_step": 118272, "epoch": 2816} {"train_loss": -6.4770050048828125, "global_step": 118273, "epoch": 2816} {"train_loss": -6.658469200134277, "global_step": 118274, "epoch": 2816} {"train_loss": -6.502093315124512, "global_step": 118275, "epoch": 2816} {"train_loss": -6.453712463378906, "global_step": 118276, "epoch": 2816} {"train_loss": -6.471500396728516, "global_step": 118277, "epoch": 2816} {"train_loss": -6.487765312194824, "global_step": 118278, "epoch": 2816} {"train_loss": -6.365139007568359, "global_step": 118279, "epoch": 2816} {"train_loss": -6.642236709594727, "global_step": 118280, "epoch": 2816} {"train_loss": -6.348989486694336, "global_step": 118281, "epoch": 2816} {"train_loss": -6.464944362640381, "global_step": 118282, "epoch": 2816} {"train_loss": -6.524579048156738, "global_step": 118283, "epoch": 2816} {"train_loss": -6.627270698547363, "global_step": 118284, "epoch": 2816} {"train_loss": -6.532538414001465, "global_step": 118285, "epoch": 2816} {"train_loss": -6.549632549285889, "global_step": 118286, "epoch": 2816} {"train_loss": -6.465878009796143, "global_step": 118287, "epoch": 2816} {"train_loss": -6.473742485046387, "global_step": 118288, "epoch": 2816} {"train_loss": -6.5212602615356445, "global_step": 118289, "epoch": 2816} {"train_loss": -6.543187141418457, "global_step": 118290, "epoch": 2816} {"train_loss": -6.533185958862305, "global_step": 118291, "epoch": 2816} {"train_loss": -6.463041305541992, "global_step": 118292, "epoch": 2816} {"train_loss": -6.529781341552734, "global_step": 118293, "epoch": 2816} {"train_loss": -6.5532546043396, "global_step": 118294, "epoch": 2816} {"train_loss": -6.4293365478515625, "global_step": 118295, "epoch": 2816} {"train_loss": -6.4691572189331055, "global_step": 118296, "epoch": 2816} {"train_loss": -6.4537458419799805, "global_step": 118297, "epoch": 2816} {"train_loss": -6.469645977020264, "global_step": 118298, "epoch": 2816} {"train_loss": -6.417712211608887, "global_step": 118299, "epoch": 2816} {"train_loss": -6.352602005004883, "global_step": 118300, "epoch": 2816} {"train_loss": -6.444138526916504, "global_step": 118301, "epoch": 2816} {"train_loss": -6.544865131378174, "global_step": 118302, "epoch": 2816} {"train_loss": -6.4395036697387695, "global_step": 118303, "epoch": 2816} {"train_loss": -6.552573204040527, "global_step": 118304, "epoch": 2816} {"train_loss": -6.451657295227051, "global_step": 118305, "epoch": 2816} {"train_loss": -6.479862213134766, "global_step": 118306, "epoch": 2816} {"train_loss": -6.50861120223999, "global_step": 118307, "epoch": 2816} {"train_loss": -6.43853759765625, "global_step": 118308, "epoch": 2816} {"train_loss": -6.500212669372559, "global_step": 118309, "epoch": 2816} {"train_loss": -6.577864646911621, "global_step": 118310, "epoch": 2816} {"train_loss": -6.497206211090088, "global_step": 118311, "epoch": 2816} {"train_loss": -6.464245319366455, "global_step": 118312, "epoch": 2816} {"train_loss": -6.492988529659453, "global_step": 118313, "epoch": 2816, "val_loss": 68006.828125} {"train_loss": -6.471282958984375, "global_step": 118314, "epoch": 2817} {"train_loss": -6.4761962890625, "global_step": 118315, "epoch": 2817} {"train_loss": -6.558225631713867, "global_step": 118316, "epoch": 2817} {"train_loss": -6.553462028503418, "global_step": 118317, "epoch": 2817} {"train_loss": -6.48203706741333, "global_step": 118318, "epoch": 2817} {"train_loss": -6.410066604614258, "global_step": 118319, "epoch": 2817} {"train_loss": -6.5792388916015625, "global_step": 118320, "epoch": 2817} {"train_loss": -6.498051643371582, "global_step": 118321, "epoch": 2817} {"train_loss": -6.457263946533203, "global_step": 118322, "epoch": 2817} {"train_loss": -6.552676200866699, "global_step": 118323, "epoch": 2817} {"train_loss": -6.571446418762207, "global_step": 118324, "epoch": 2817} {"train_loss": -6.4695611000061035, "global_step": 118325, "epoch": 2817} {"train_loss": -6.499964714050293, "global_step": 118326, "epoch": 2817} {"train_loss": -6.565012454986572, "global_step": 118327, "epoch": 2817} {"train_loss": -6.55433464050293, "global_step": 118328, "epoch": 2817} {"train_loss": -6.4187331199646, "global_step": 118329, "epoch": 2817} {"train_loss": -6.528678894042969, "global_step": 118330, "epoch": 2817} {"train_loss": -6.549866199493408, "global_step": 118331, "epoch": 2817} {"train_loss": -6.690225601196289, "global_step": 118332, "epoch": 2817} {"train_loss": -6.53078031539917, "global_step": 118333, "epoch": 2817} {"train_loss": -6.480286598205566, "global_step": 118334, "epoch": 2817} {"train_loss": -6.617079734802246, "global_step": 118335, "epoch": 2817} {"train_loss": -6.435429573059082, "global_step": 118336, "epoch": 2817} {"train_loss": -6.497847557067871, "global_step": 118337, "epoch": 2817} {"train_loss": -6.640951156616211, "global_step": 118338, "epoch": 2817} {"train_loss": -6.452193260192871, "global_step": 118339, "epoch": 2817} {"train_loss": -6.544375419616699, "global_step": 118340, "epoch": 2817} {"train_loss": -6.6425981521606445, "global_step": 118341, "epoch": 2817} {"train_loss": -6.5767059326171875, "global_step": 118342, "epoch": 2817} {"train_loss": -6.5127692222595215, "global_step": 118343, "epoch": 2817} {"train_loss": -6.6016669273376465, "global_step": 118344, "epoch": 2817} {"train_loss": -6.539741039276123, "global_step": 118345, "epoch": 2817} {"train_loss": -6.455970764160156, "global_step": 118346, "epoch": 2817} {"train_loss": -6.71230936050415, "global_step": 118347, "epoch": 2817} {"train_loss": -6.562191009521484, "global_step": 118348, "epoch": 2817} {"train_loss": -6.473156929016113, "global_step": 118349, "epoch": 2817} {"train_loss": -6.600854873657227, "global_step": 118350, "epoch": 2817} {"train_loss": -6.605075836181641, "global_step": 118351, "epoch": 2817} {"train_loss": -6.551150321960449, "global_step": 118352, "epoch": 2817} {"train_loss": -6.476865768432617, "global_step": 118353, "epoch": 2817} {"train_loss": -6.574295997619629, "global_step": 118354, "epoch": 2817} {"train_loss": -6.536498251415434, "global_step": 118355, "epoch": 2817, "val_loss": 67955.7421875} {"train_loss": -6.541117191314697, "global_step": 118356, "epoch": 2818} {"train_loss": -6.481935024261475, "global_step": 118357, "epoch": 2818} {"train_loss": -6.525449275970459, "global_step": 118358, "epoch": 2818} {"train_loss": -6.592292785644531, "global_step": 118359, "epoch": 2818} {"train_loss": -6.551917552947998, "global_step": 118360, "epoch": 2818} {"train_loss": -6.636360168457031, "global_step": 118361, "epoch": 2818} {"train_loss": -6.486997127532959, "global_step": 118362, "epoch": 2818} {"train_loss": -6.487555503845215, "global_step": 118363, "epoch": 2818} {"train_loss": -6.438883304595947, "global_step": 118364, "epoch": 2818} {"train_loss": -6.5293288230896, "global_step": 118365, "epoch": 2818} {"train_loss": -6.488207817077637, "global_step": 118366, "epoch": 2818} {"train_loss": -6.536386489868164, "global_step": 118367, "epoch": 2818} {"train_loss": -6.55225944519043, "global_step": 118368, "epoch": 2818} {"train_loss": -6.465426445007324, "global_step": 118369, "epoch": 2818} {"train_loss": -6.669414520263672, "global_step": 118370, "epoch": 2818} {"train_loss": -6.55422830581665, "global_step": 118371, "epoch": 2818} {"train_loss": -6.474237442016602, "global_step": 118372, "epoch": 2818} {"train_loss": -6.553891181945801, "global_step": 118373, "epoch": 2818} {"train_loss": -6.466708183288574, "global_step": 118374, "epoch": 2818} {"train_loss": -6.706549644470215, "global_step": 118375, "epoch": 2818} {"train_loss": -6.497837066650391, "global_step": 118376, "epoch": 2818} {"train_loss": -6.446804046630859, "global_step": 118377, "epoch": 2818} {"train_loss": -6.396790504455566, "global_step": 118378, "epoch": 2818} {"train_loss": -6.591822147369385, "global_step": 118379, "epoch": 2818} {"train_loss": -6.511427879333496, "global_step": 118380, "epoch": 2818} {"train_loss": -6.590451717376709, "global_step": 118381, "epoch": 2818} {"train_loss": -6.5569610595703125, "global_step": 118382, "epoch": 2818} {"train_loss": -6.603536128997803, "global_step": 118383, "epoch": 2818} {"train_loss": -6.499115943908691, "global_step": 118384, "epoch": 2818} {"train_loss": -6.599208831787109, "global_step": 118385, "epoch": 2818} {"train_loss": -6.5822858810424805, "global_step": 118386, "epoch": 2818} {"train_loss": -6.468533992767334, "global_step": 118387, "epoch": 2818} {"train_loss": -6.550103187561035, "global_step": 118388, "epoch": 2818} {"train_loss": -6.529951095581055, "global_step": 118389, "epoch": 2818} {"train_loss": -6.443350315093994, "global_step": 118390, "epoch": 2818} {"train_loss": -6.433625221252441, "global_step": 118391, "epoch": 2818} {"train_loss": -6.596344947814941, "global_step": 118392, "epoch": 2818} {"train_loss": -6.5862650871276855, "global_step": 118393, "epoch": 2818} {"train_loss": -6.50551176071167, "global_step": 118394, "epoch": 2818} {"train_loss": -6.451542377471924, "global_step": 118395, "epoch": 2818} {"train_loss": -6.586601257324219, "global_step": 118396, "epoch": 2818} {"train_loss": -6.529537541525705, "global_step": 118397, "epoch": 2818, "val_loss": 68013.7421875} {"train_loss": -6.506519317626953, "global_step": 118398, "epoch": 2819} {"train_loss": -6.5049943923950195, "global_step": 118399, "epoch": 2819} {"train_loss": -6.426701545715332, "global_step": 118400, "epoch": 2819} {"train_loss": -6.4313812255859375, "global_step": 118401, "epoch": 2819} {"train_loss": -6.466855049133301, "global_step": 118402, "epoch": 2819} {"train_loss": -6.505527496337891, "global_step": 118403, "epoch": 2819} {"train_loss": -6.521023750305176, "global_step": 118404, "epoch": 2819} {"train_loss": -6.447878360748291, "global_step": 118405, "epoch": 2819} {"train_loss": -6.539044380187988, "global_step": 118406, "epoch": 2819} {"train_loss": -6.40819787979126, "global_step": 118407, "epoch": 2819} {"train_loss": -6.502161979675293, "global_step": 118408, "epoch": 2819} {"train_loss": -6.5961127281188965, "global_step": 118409, "epoch": 2819} {"train_loss": -6.588421821594238, "global_step": 118410, "epoch": 2819} {"train_loss": -6.485311508178711, "global_step": 118411, "epoch": 2819} {"train_loss": -6.466362953186035, "global_step": 118412, "epoch": 2819} {"train_loss": -6.505776405334473, "global_step": 118413, "epoch": 2819} {"train_loss": -6.460330009460449, "global_step": 118414, "epoch": 2819} {"train_loss": -6.502870082855225, "global_step": 118415, "epoch": 2819} {"train_loss": -6.60630989074707, "global_step": 118416, "epoch": 2819} {"train_loss": -6.53092098236084, "global_step": 118417, "epoch": 2819} {"train_loss": -6.576728343963623, "global_step": 118418, "epoch": 2819} {"train_loss": -6.417697906494141, "global_step": 118419, "epoch": 2819} {"train_loss": -6.619410514831543, "global_step": 118420, "epoch": 2819} {"train_loss": -6.454113483428955, "global_step": 118421, "epoch": 2819} {"train_loss": -6.574590682983398, "global_step": 118422, "epoch": 2819} {"train_loss": -6.502933979034424, "global_step": 118423, "epoch": 2819} {"train_loss": -6.557206153869629, "global_step": 118424, "epoch": 2819} {"train_loss": -6.597565650939941, "global_step": 118425, "epoch": 2819} {"train_loss": -6.457088470458984, "global_step": 118426, "epoch": 2819} {"train_loss": -6.567249298095703, "global_step": 118427, "epoch": 2819} {"train_loss": -6.520312309265137, "global_step": 118428, "epoch": 2819} {"train_loss": -6.400923728942871, "global_step": 118429, "epoch": 2819} {"train_loss": -6.454668998718262, "global_step": 118430, "epoch": 2819} {"train_loss": -6.461895942687988, "global_step": 118431, "epoch": 2819} {"train_loss": -6.46807336807251, "global_step": 118432, "epoch": 2819} {"train_loss": -6.577992916107178, "global_step": 118433, "epoch": 2819} {"train_loss": -6.54197883605957, "global_step": 118434, "epoch": 2819} {"train_loss": -6.488138198852539, "global_step": 118435, "epoch": 2819} {"train_loss": -6.462750434875488, "global_step": 118436, "epoch": 2819} {"train_loss": -6.47480583190918, "global_step": 118437, "epoch": 2819} {"train_loss": -6.425976753234863, "global_step": 118438, "epoch": 2819} {"train_loss": -6.502429349081857, "global_step": 118439, "epoch": 2819, "val_loss": 67802.015625} {"train_loss": -6.513602256774902, "global_step": 118440, "epoch": 2820} {"train_loss": -6.5051069259643555, "global_step": 118441, "epoch": 2820} {"train_loss": -6.480088233947754, "global_step": 118442, "epoch": 2820} {"train_loss": -6.5026092529296875, "global_step": 118443, "epoch": 2820} {"train_loss": -6.506503105163574, "global_step": 118444, "epoch": 2820} {"train_loss": -6.365245819091797, "global_step": 118445, "epoch": 2820} {"train_loss": -6.493141174316406, "global_step": 118446, "epoch": 2820} {"train_loss": -6.470287322998047, "global_step": 118447, "epoch": 2820} {"train_loss": -6.406196117401123, "global_step": 118448, "epoch": 2820} {"train_loss": -6.48094367980957, "global_step": 118449, "epoch": 2820} {"train_loss": -6.500655174255371, "global_step": 118450, "epoch": 2820} {"train_loss": -6.539878845214844, "global_step": 118451, "epoch": 2820} {"train_loss": -6.48098611831665, "global_step": 118452, "epoch": 2820} {"train_loss": -6.574547290802002, "global_step": 118453, "epoch": 2820} {"train_loss": -6.430582046508789, "global_step": 118454, "epoch": 2820} {"train_loss": -6.403159141540527, "global_step": 118455, "epoch": 2820} {"train_loss": -6.494108200073242, "global_step": 118456, "epoch": 2820} {"train_loss": -6.454154968261719, "global_step": 118457, "epoch": 2820} {"train_loss": -6.547188758850098, "global_step": 118458, "epoch": 2820} {"train_loss": -6.4903740882873535, "global_step": 118459, "epoch": 2820} {"train_loss": -6.651262283325195, "global_step": 118460, "epoch": 2820} {"train_loss": -6.594964981079102, "global_step": 118461, "epoch": 2820} {"train_loss": -6.539980888366699, "global_step": 118462, "epoch": 2820} {"train_loss": -6.499109268188477, "global_step": 118463, "epoch": 2820} {"train_loss": -6.472182273864746, "global_step": 118464, "epoch": 2820} {"train_loss": -6.545867919921875, "global_step": 118465, "epoch": 2820} {"train_loss": -6.600229263305664, "global_step": 118466, "epoch": 2820} {"train_loss": -6.421652793884277, "global_step": 118467, "epoch": 2820} {"train_loss": -6.412127494812012, "global_step": 118468, "epoch": 2820} {"train_loss": -6.498988628387451, "global_step": 118469, "epoch": 2820} {"train_loss": -6.5866899490356445, "global_step": 118470, "epoch": 2820} {"train_loss": -6.461272716522217, "global_step": 118471, "epoch": 2820} {"train_loss": -6.4102277755737305, "global_step": 118472, "epoch": 2820} {"train_loss": -6.255585193634033, "global_step": 118473, "epoch": 2820} {"train_loss": -6.520738124847412, "global_step": 118474, "epoch": 2820} {"train_loss": -6.4163360595703125, "global_step": 118475, "epoch": 2820} {"train_loss": -6.341801643371582, "global_step": 118476, "epoch": 2820} {"train_loss": -6.533679485321045, "global_step": 118477, "epoch": 2820} {"train_loss": -6.506121635437012, "global_step": 118478, "epoch": 2820} {"train_loss": -6.403680801391602, "global_step": 118479, "epoch": 2820} {"train_loss": -6.4228386878967285, "global_step": 118480, "epoch": 2820} {"train_loss": -6.47943317322504, "global_step": 118481, "epoch": 2820, "val_loss": 68147.078125} {"train_loss": -6.278435707092285, "global_step": 118482, "epoch": 2821} {"train_loss": -6.4389848709106445, "global_step": 118483, "epoch": 2821} {"train_loss": -6.464694976806641, "global_step": 118484, "epoch": 2821} {"train_loss": -6.3517961502075195, "global_step": 118485, "epoch": 2821} {"train_loss": -6.472777366638184, "global_step": 118486, "epoch": 2821} {"train_loss": -6.446699142456055, "global_step": 118487, "epoch": 2821} {"train_loss": -6.391160011291504, "global_step": 118488, "epoch": 2821} {"train_loss": -6.492058753967285, "global_step": 118489, "epoch": 2821} {"train_loss": -6.442465782165527, "global_step": 118490, "epoch": 2821} {"train_loss": -6.441335201263428, "global_step": 118491, "epoch": 2821} {"train_loss": -6.477181911468506, "global_step": 118492, "epoch": 2821} {"train_loss": -6.264705657958984, "global_step": 118493, "epoch": 2821} {"train_loss": -6.522974014282227, "global_step": 118494, "epoch": 2821} {"train_loss": -6.431512832641602, "global_step": 118495, "epoch": 2821} {"train_loss": -6.415036201477051, "global_step": 118496, "epoch": 2821} {"train_loss": -6.623473167419434, "global_step": 118497, "epoch": 2821} {"train_loss": -6.553019046783447, "global_step": 118498, "epoch": 2821} {"train_loss": -6.40395975112915, "global_step": 118499, "epoch": 2821} {"train_loss": -6.511323928833008, "global_step": 118500, "epoch": 2821} {"train_loss": -6.448051452636719, "global_step": 118501, "epoch": 2821} {"train_loss": -6.561949729919434, "global_step": 118502, "epoch": 2821} {"train_loss": -6.507043838500977, "global_step": 118503, "epoch": 2821} {"train_loss": -6.539187431335449, "global_step": 118504, "epoch": 2821} {"train_loss": -6.652688980102539, "global_step": 118505, "epoch": 2821} {"train_loss": -6.574933052062988, "global_step": 118506, "epoch": 2821} {"train_loss": -6.51796817779541, "global_step": 118507, "epoch": 2821} {"train_loss": -6.4807939529418945, "global_step": 118508, "epoch": 2821} {"train_loss": -6.54964542388916, "global_step": 118509, "epoch": 2821} {"train_loss": -6.579732418060303, "global_step": 118510, "epoch": 2821} {"train_loss": -6.48508358001709, "global_step": 118511, "epoch": 2821} {"train_loss": -6.5550031661987305, "global_step": 118512, "epoch": 2821} {"train_loss": -6.564051628112793, "global_step": 118513, "epoch": 2821} {"train_loss": -6.601180076599121, "global_step": 118514, "epoch": 2821} {"train_loss": -6.616887092590332, "global_step": 118515, "epoch": 2821} {"train_loss": -6.667035102844238, "global_step": 118516, "epoch": 2821} {"train_loss": -6.594473838806152, "global_step": 118517, "epoch": 2821} {"train_loss": -6.5859880447387695, "global_step": 118518, "epoch": 2821} {"train_loss": -6.4348225593566895, "global_step": 118519, "epoch": 2821} {"train_loss": -6.591588020324707, "global_step": 118520, "epoch": 2821} {"train_loss": -6.417311668395996, "global_step": 118521, "epoch": 2821} {"train_loss": -6.447884559631348, "global_step": 118522, "epoch": 2821} {"train_loss": -6.498899005708241, "global_step": 118523, "epoch": 2821, "val_loss": 67849.25} {"train_loss": -6.628014087677002, "global_step": 118524, "epoch": 2822} {"train_loss": -6.591776371002197, "global_step": 118525, "epoch": 2822} {"train_loss": -6.519986152648926, "global_step": 118526, "epoch": 2822} {"train_loss": -6.5017571449279785, "global_step": 118527, "epoch": 2822} {"train_loss": -6.54086971282959, "global_step": 118528, "epoch": 2822} {"train_loss": -6.637707710266113, "global_step": 118529, "epoch": 2822} {"train_loss": -6.571743011474609, "global_step": 118530, "epoch": 2822} {"train_loss": -6.588502883911133, "global_step": 118531, "epoch": 2822} {"train_loss": -6.587031841278076, "global_step": 118532, "epoch": 2822} {"train_loss": -6.564052581787109, "global_step": 118533, "epoch": 2822} {"train_loss": -6.502068519592285, "global_step": 118534, "epoch": 2822} {"train_loss": -6.518709182739258, "global_step": 118535, "epoch": 2822} {"train_loss": -6.630370140075684, "global_step": 118536, "epoch": 2822} {"train_loss": -6.498061656951904, "global_step": 118537, "epoch": 2822} {"train_loss": -6.470699787139893, "global_step": 118538, "epoch": 2822} {"train_loss": -6.447781562805176, "global_step": 118539, "epoch": 2822} {"train_loss": -6.626657485961914, "global_step": 118540, "epoch": 2822} {"train_loss": -6.5420451164245605, "global_step": 118541, "epoch": 2822} {"train_loss": -6.527162551879883, "global_step": 118542, "epoch": 2822} {"train_loss": -6.6202921867370605, "global_step": 118543, "epoch": 2822} {"train_loss": -6.4719719886779785, "global_step": 118544, "epoch": 2822} {"train_loss": -6.510242938995361, "global_step": 118545, "epoch": 2822} {"train_loss": -6.461185932159424, "global_step": 118546, "epoch": 2822} {"train_loss": -6.511027812957764, "global_step": 118547, "epoch": 2822} {"train_loss": -6.468891143798828, "global_step": 118548, "epoch": 2822} {"train_loss": -6.481514930725098, "global_step": 118549, "epoch": 2822} {"train_loss": -6.397673606872559, "global_step": 118550, "epoch": 2822} {"train_loss": -6.429328918457031, "global_step": 118551, "epoch": 2822} {"train_loss": -6.550502777099609, "global_step": 118552, "epoch": 2822} {"train_loss": -6.525843143463135, "global_step": 118553, "epoch": 2822} {"train_loss": -6.578214645385742, "global_step": 118554, "epoch": 2822} {"train_loss": -6.5045061111450195, "global_step": 118555, "epoch": 2822} {"train_loss": -6.4293742179870605, "global_step": 118556, "epoch": 2822} {"train_loss": -6.49129056930542, "global_step": 118557, "epoch": 2822} {"train_loss": -6.4916672706604, "global_step": 118558, "epoch": 2822} {"train_loss": -6.5303497314453125, "global_step": 118559, "epoch": 2822} {"train_loss": -6.557348728179932, "global_step": 118560, "epoch": 2822} {"train_loss": -6.558006286621094, "global_step": 118561, "epoch": 2822} {"train_loss": -6.55151891708374, "global_step": 118562, "epoch": 2822} {"train_loss": -6.383292198181152, "global_step": 118563, "epoch": 2822} {"train_loss": -6.594211101531982, "global_step": 118564, "epoch": 2822} {"train_loss": -6.526358717963809, "global_step": 118565, "epoch": 2822, "val_loss": 68040.0546875} {"train_loss": -6.591565132141113, "global_step": 118566, "epoch": 2823} {"train_loss": -6.496796131134033, "global_step": 118567, "epoch": 2823} {"train_loss": -6.455605506896973, "global_step": 118568, "epoch": 2823} {"train_loss": -6.469099998474121, "global_step": 118569, "epoch": 2823} {"train_loss": -6.717784404754639, "global_step": 118570, "epoch": 2823} {"train_loss": -6.457935333251953, "global_step": 118571, "epoch": 2823} {"train_loss": -6.474204063415527, "global_step": 118572, "epoch": 2823} {"train_loss": -6.564420223236084, "global_step": 118573, "epoch": 2823} {"train_loss": -6.495301246643066, "global_step": 118574, "epoch": 2823} {"train_loss": -6.515542507171631, "global_step": 118575, "epoch": 2823} {"train_loss": -6.669695854187012, "global_step": 118576, "epoch": 2823} {"train_loss": -6.629915714263916, "global_step": 118577, "epoch": 2823} {"train_loss": -6.4898786544799805, "global_step": 118578, "epoch": 2823} {"train_loss": -6.52079963684082, "global_step": 118579, "epoch": 2823} {"train_loss": -6.599164962768555, "global_step": 118580, "epoch": 2823} {"train_loss": -6.501734733581543, "global_step": 118581, "epoch": 2823} {"train_loss": -6.355710506439209, "global_step": 118582, "epoch": 2823} {"train_loss": -6.571776390075684, "global_step": 118583, "epoch": 2823} {"train_loss": -6.474989414215088, "global_step": 118584, "epoch": 2823} {"train_loss": -6.4155426025390625, "global_step": 118585, "epoch": 2823} {"train_loss": -6.581876754760742, "global_step": 118586, "epoch": 2823} {"train_loss": -6.537644863128662, "global_step": 118587, "epoch": 2823} {"train_loss": -6.544442653656006, "global_step": 118588, "epoch": 2823} {"train_loss": -6.508173942565918, "global_step": 118589, "epoch": 2823} {"train_loss": -6.526449203491211, "global_step": 118590, "epoch": 2823} {"train_loss": -6.523431777954102, "global_step": 118591, "epoch": 2823} {"train_loss": -6.509871482849121, "global_step": 118592, "epoch": 2823} {"train_loss": -6.484261989593506, "global_step": 118593, "epoch": 2823} {"train_loss": -6.511441230773926, "global_step": 118594, "epoch": 2823} {"train_loss": -6.458359718322754, "global_step": 118595, "epoch": 2823} {"train_loss": -6.614672660827637, "global_step": 118596, "epoch": 2823} {"train_loss": -6.493586540222168, "global_step": 118597, "epoch": 2823} {"train_loss": -6.5877227783203125, "global_step": 118598, "epoch": 2823} {"train_loss": -6.496569633483887, "global_step": 118599, "epoch": 2823} {"train_loss": -6.521636486053467, "global_step": 118600, "epoch": 2823} {"train_loss": -6.414858341217041, "global_step": 118601, "epoch": 2823} {"train_loss": -6.492923736572266, "global_step": 118602, "epoch": 2823} {"train_loss": -6.503429412841797, "global_step": 118603, "epoch": 2823} {"train_loss": -6.5797319412231445, "global_step": 118604, "epoch": 2823} {"train_loss": -6.508210182189941, "global_step": 118605, "epoch": 2823} {"train_loss": -6.380333423614502, "global_step": 118606, "epoch": 2823} {"train_loss": -6.518569106147403, "global_step": 118607, "epoch": 2823, "val_loss": 67994.484375} {"train_loss": -6.528399467468262, "global_step": 118608, "epoch": 2824} {"train_loss": -6.529152870178223, "global_step": 118609, "epoch": 2824} {"train_loss": -6.48182487487793, "global_step": 118610, "epoch": 2824} {"train_loss": -6.564596652984619, "global_step": 118611, "epoch": 2824} {"train_loss": -6.408834457397461, "global_step": 118612, "epoch": 2824} {"train_loss": -6.557576656341553, "global_step": 118613, "epoch": 2824} {"train_loss": -6.597883224487305, "global_step": 118614, "epoch": 2824} {"train_loss": -6.567030906677246, "global_step": 118615, "epoch": 2824} {"train_loss": -6.515393257141113, "global_step": 118616, "epoch": 2824} {"train_loss": -6.529155731201172, "global_step": 118617, "epoch": 2824} {"train_loss": -6.45982027053833, "global_step": 118618, "epoch": 2824} {"train_loss": -6.558812141418457, "global_step": 118619, "epoch": 2824} {"train_loss": -6.525899887084961, "global_step": 118620, "epoch": 2824} {"train_loss": -6.378551483154297, "global_step": 118621, "epoch": 2824} {"train_loss": -6.621102333068848, "global_step": 118622, "epoch": 2824} {"train_loss": -6.401771068572998, "global_step": 118623, "epoch": 2824} {"train_loss": -6.459446430206299, "global_step": 118624, "epoch": 2824} {"train_loss": -6.441720008850098, "global_step": 118625, "epoch": 2824} {"train_loss": -6.4519805908203125, "global_step": 118626, "epoch": 2824} {"train_loss": -6.5275373458862305, "global_step": 118627, "epoch": 2824} {"train_loss": -6.467883110046387, "global_step": 118628, "epoch": 2824} {"train_loss": -6.559295654296875, "global_step": 118629, "epoch": 2824} {"train_loss": -6.471931457519531, "global_step": 118630, "epoch": 2824} {"train_loss": -6.395792007446289, "global_step": 118631, "epoch": 2824} {"train_loss": -6.431307792663574, "global_step": 118632, "epoch": 2824} {"train_loss": -6.490294456481934, "global_step": 118633, "epoch": 2824} {"train_loss": -6.453812599182129, "global_step": 118634, "epoch": 2824} {"train_loss": -6.5517497062683105, "global_step": 118635, "epoch": 2824} {"train_loss": -6.400963306427002, "global_step": 118636, "epoch": 2824} {"train_loss": -6.583475589752197, "global_step": 118637, "epoch": 2824} {"train_loss": -6.46958065032959, "global_step": 118638, "epoch": 2824} {"train_loss": -6.502586841583252, "global_step": 118639, "epoch": 2824} {"train_loss": -6.495547294616699, "global_step": 118640, "epoch": 2824} {"train_loss": -6.414336204528809, "global_step": 118641, "epoch": 2824} {"train_loss": -6.526791095733643, "global_step": 118642, "epoch": 2824} {"train_loss": -6.402988433837891, "global_step": 118643, "epoch": 2824} {"train_loss": -6.539438247680664, "global_step": 118644, "epoch": 2824} {"train_loss": -6.476310729980469, "global_step": 118645, "epoch": 2824} {"train_loss": -6.5013427734375, "global_step": 118646, "epoch": 2824} {"train_loss": -6.5157880783081055, "global_step": 118647, "epoch": 2824} {"train_loss": -6.462045192718506, "global_step": 118648, "epoch": 2824} {"train_loss": -6.494129112788609, "global_step": 118649, "epoch": 2824, "val_loss": 68113.7265625} {"train_loss": -6.532939434051514, "global_step": 118650, "epoch": 2825} {"train_loss": -6.414993762969971, "global_step": 118651, "epoch": 2825} {"train_loss": -6.499697685241699, "global_step": 118652, "epoch": 2825} {"train_loss": -6.48316764831543, "global_step": 118653, "epoch": 2825} {"train_loss": -6.504167556762695, "global_step": 118654, "epoch": 2825} {"train_loss": -6.522690296173096, "global_step": 118655, "epoch": 2825} {"train_loss": -6.572059154510498, "global_step": 118656, "epoch": 2825} {"train_loss": -6.529340744018555, "global_step": 118657, "epoch": 2825} {"train_loss": -6.498048782348633, "global_step": 118658, "epoch": 2825} {"train_loss": -6.4162917137146, "global_step": 118659, "epoch": 2825} {"train_loss": -6.6371564865112305, "global_step": 118660, "epoch": 2825} {"train_loss": -6.644710540771484, "global_step": 118661, "epoch": 2825} {"train_loss": -6.532163143157959, "global_step": 118662, "epoch": 2825} {"train_loss": -6.420472145080566, "global_step": 118663, "epoch": 2825} {"train_loss": -6.5889434814453125, "global_step": 118664, "epoch": 2825} {"train_loss": -6.477860450744629, "global_step": 118665, "epoch": 2825} {"train_loss": -6.496490478515625, "global_step": 118666, "epoch": 2825} {"train_loss": -6.440587997436523, "global_step": 118667, "epoch": 2825} {"train_loss": -6.596367359161377, "global_step": 118668, "epoch": 2825} {"train_loss": -6.533608436584473, "global_step": 118669, "epoch": 2825} {"train_loss": -6.493178367614746, "global_step": 118670, "epoch": 2825} {"train_loss": -6.539670944213867, "global_step": 118671, "epoch": 2825} {"train_loss": -6.482513904571533, "global_step": 118672, "epoch": 2825} {"train_loss": -6.68779182434082, "global_step": 118673, "epoch": 2825} {"train_loss": -6.562163352966309, "global_step": 118674, "epoch": 2825} {"train_loss": -6.589848518371582, "global_step": 118675, "epoch": 2825} {"train_loss": -6.4806013107299805, "global_step": 118676, "epoch": 2825} {"train_loss": -6.564818382263184, "global_step": 118677, "epoch": 2825} {"train_loss": -6.5021772384643555, "global_step": 118678, "epoch": 2825} {"train_loss": -6.539736270904541, "global_step": 118679, "epoch": 2825} {"train_loss": -6.422026634216309, "global_step": 118680, "epoch": 2825} {"train_loss": -6.489012718200684, "global_step": 118681, "epoch": 2825} {"train_loss": -6.443865776062012, "global_step": 118682, "epoch": 2825} {"train_loss": -6.415736675262451, "global_step": 118683, "epoch": 2825} {"train_loss": -6.653693675994873, "global_step": 118684, "epoch": 2825} {"train_loss": -6.508864402770996, "global_step": 118685, "epoch": 2825} {"train_loss": -6.538334846496582, "global_step": 118686, "epoch": 2825} {"train_loss": -6.505802154541016, "global_step": 118687, "epoch": 2825} {"train_loss": -6.482778549194336, "global_step": 118688, "epoch": 2825} {"train_loss": -6.417123794555664, "global_step": 118689, "epoch": 2825} {"train_loss": -6.510256767272949, "global_step": 118690, "epoch": 2825} {"train_loss": -6.516475302832467, "global_step": 118691, "epoch": 2825, "val_loss": 67920.59375} {"train_loss": -6.456803798675537, "global_step": 118692, "epoch": 2826} {"train_loss": -6.502806186676025, "global_step": 118693, "epoch": 2826} {"train_loss": -6.516104698181152, "global_step": 118694, "epoch": 2826} {"train_loss": -6.496177673339844, "global_step": 118695, "epoch": 2826} {"train_loss": -6.505454063415527, "global_step": 118696, "epoch": 2826} {"train_loss": -6.412045478820801, "global_step": 118697, "epoch": 2826} {"train_loss": -6.442532062530518, "global_step": 118698, "epoch": 2826} {"train_loss": -6.482044219970703, "global_step": 118699, "epoch": 2826} {"train_loss": -6.546307563781738, "global_step": 118700, "epoch": 2826} {"train_loss": -6.573558807373047, "global_step": 118701, "epoch": 2826} {"train_loss": -6.606435775756836, "global_step": 118702, "epoch": 2826} {"train_loss": -6.355359077453613, "global_step": 118703, "epoch": 2826} {"train_loss": -6.52016544342041, "global_step": 118704, "epoch": 2826} {"train_loss": -6.450395107269287, "global_step": 118705, "epoch": 2826} {"train_loss": -6.458815574645996, "global_step": 118706, "epoch": 2826} {"train_loss": -6.533980846405029, "global_step": 118707, "epoch": 2826} {"train_loss": -6.529444217681885, "global_step": 118708, "epoch": 2826} {"train_loss": -6.51571798324585, "global_step": 118709, "epoch": 2826} {"train_loss": -6.427973747253418, "global_step": 118710, "epoch": 2826} {"train_loss": -6.398073673248291, "global_step": 118711, "epoch": 2826} {"train_loss": -6.40794563293457, "global_step": 118712, "epoch": 2826} {"train_loss": -6.431240081787109, "global_step": 118713, "epoch": 2826} {"train_loss": -6.396379470825195, "global_step": 118714, "epoch": 2826} {"train_loss": -6.3450751304626465, "global_step": 118715, "epoch": 2826} {"train_loss": -6.485535621643066, "global_step": 118716, "epoch": 2826} {"train_loss": -6.318787574768066, "global_step": 118717, "epoch": 2826} {"train_loss": -6.420072555541992, "global_step": 118718, "epoch": 2826} {"train_loss": -6.4151411056518555, "global_step": 118719, "epoch": 2826} {"train_loss": -6.499064922332764, "global_step": 118720, "epoch": 2826} {"train_loss": -6.463183879852295, "global_step": 118721, "epoch": 2826} {"train_loss": -6.453559875488281, "global_step": 118722, "epoch": 2826} {"train_loss": -6.497957229614258, "global_step": 118723, "epoch": 2826} {"train_loss": -6.542209148406982, "global_step": 118724, "epoch": 2826} {"train_loss": -6.420189380645752, "global_step": 118725, "epoch": 2826} {"train_loss": -6.49536657333374, "global_step": 118726, "epoch": 2826} {"train_loss": -6.341428279876709, "global_step": 118727, "epoch": 2826} {"train_loss": -6.459257125854492, "global_step": 118728, "epoch": 2826} {"train_loss": -6.532225608825684, "global_step": 118729, "epoch": 2826} {"train_loss": -6.449681758880615, "global_step": 118730, "epoch": 2826} {"train_loss": -6.512889862060547, "global_step": 118731, "epoch": 2826} {"train_loss": -6.41585636138916, "global_step": 118732, "epoch": 2826} {"train_loss": -6.462705226171584, "global_step": 118733, "epoch": 2826, "val_loss": 68097.3125} {"train_loss": -6.361757755279541, "global_step": 118734, "epoch": 2827} {"train_loss": -6.560657501220703, "global_step": 118735, "epoch": 2827} {"train_loss": -6.450794219970703, "global_step": 118736, "epoch": 2827} {"train_loss": -6.433883190155029, "global_step": 118737, "epoch": 2827} {"train_loss": -6.515588760375977, "global_step": 118738, "epoch": 2827} {"train_loss": -6.514596939086914, "global_step": 118739, "epoch": 2827} {"train_loss": -6.501897811889648, "global_step": 118740, "epoch": 2827} {"train_loss": -6.609762191772461, "global_step": 118741, "epoch": 2827} {"train_loss": -6.454226970672607, "global_step": 118742, "epoch": 2827} {"train_loss": -6.437900543212891, "global_step": 118743, "epoch": 2827} {"train_loss": -6.5223002433776855, "global_step": 118744, "epoch": 2827} {"train_loss": -6.468894958496094, "global_step": 118745, "epoch": 2827} {"train_loss": -6.553154945373535, "global_step": 118746, "epoch": 2827} {"train_loss": -6.458258628845215, "global_step": 118747, "epoch": 2827} {"train_loss": -6.490018844604492, "global_step": 118748, "epoch": 2827} {"train_loss": -6.541057586669922, "global_step": 118749, "epoch": 2827} {"train_loss": -6.479211330413818, "global_step": 118750, "epoch": 2827} {"train_loss": -6.515295028686523, "global_step": 118751, "epoch": 2827} {"train_loss": -6.349302291870117, "global_step": 118752, "epoch": 2827} {"train_loss": -6.566826820373535, "global_step": 118753, "epoch": 2827} {"train_loss": -6.372852325439453, "global_step": 118754, "epoch": 2827} {"train_loss": -6.470654487609863, "global_step": 118755, "epoch": 2827} {"train_loss": -6.578820705413818, "global_step": 118756, "epoch": 2827} {"train_loss": -6.447170257568359, "global_step": 118757, "epoch": 2827} {"train_loss": -6.427053451538086, "global_step": 118758, "epoch": 2827} {"train_loss": -6.267492294311523, "global_step": 118759, "epoch": 2827} {"train_loss": -6.608415603637695, "global_step": 118760, "epoch": 2827} {"train_loss": -6.484793186187744, "global_step": 118761, "epoch": 2827} {"train_loss": -6.558314323425293, "global_step": 118762, "epoch": 2827} {"train_loss": -6.363800048828125, "global_step": 118763, "epoch": 2827} {"train_loss": -6.506726264953613, "global_step": 118764, "epoch": 2827} {"train_loss": -6.4251604080200195, "global_step": 118765, "epoch": 2827} {"train_loss": -6.487682342529297, "global_step": 118766, "epoch": 2827} {"train_loss": -6.504552841186523, "global_step": 118767, "epoch": 2827} {"train_loss": -6.457770824432373, "global_step": 118768, "epoch": 2827} {"train_loss": -6.420314788818359, "global_step": 118769, "epoch": 2827} {"train_loss": -6.380544662475586, "global_step": 118770, "epoch": 2827} {"train_loss": -6.515727996826172, "global_step": 118771, "epoch": 2827} {"train_loss": -6.47479248046875, "global_step": 118772, "epoch": 2827} {"train_loss": -6.471664905548096, "global_step": 118773, "epoch": 2827} {"train_loss": -6.443894386291504, "global_step": 118774, "epoch": 2827} {"train_loss": -6.475736107145037, "global_step": 118775, "epoch": 2827, "val_loss": 68036.3125} {"train_loss": -6.545465469360352, "global_step": 118776, "epoch": 2828} {"train_loss": -6.493078708648682, "global_step": 118777, "epoch": 2828} {"train_loss": -6.522770881652832, "global_step": 118778, "epoch": 2828} {"train_loss": -6.460827827453613, "global_step": 118779, "epoch": 2828} {"train_loss": -6.414047718048096, "global_step": 118780, "epoch": 2828} {"train_loss": -6.633677959442139, "global_step": 118781, "epoch": 2828} {"train_loss": -6.59929084777832, "global_step": 118782, "epoch": 2828} {"train_loss": -6.451605796813965, "global_step": 118783, "epoch": 2828} {"train_loss": -6.442166805267334, "global_step": 118784, "epoch": 2828} {"train_loss": -6.555154800415039, "global_step": 118785, "epoch": 2828} {"train_loss": -6.47081184387207, "global_step": 118786, "epoch": 2828} {"train_loss": -6.63993501663208, "global_step": 118787, "epoch": 2828} {"train_loss": -6.696515083312988, "global_step": 118788, "epoch": 2828} {"train_loss": -6.556506156921387, "global_step": 118789, "epoch": 2828} {"train_loss": -6.5117692947387695, "global_step": 118790, "epoch": 2828} {"train_loss": -6.5195441246032715, "global_step": 118791, "epoch": 2828} {"train_loss": -6.550483226776123, "global_step": 118792, "epoch": 2828} {"train_loss": -6.583600044250488, "global_step": 118793, "epoch": 2828} {"train_loss": -6.437188148498535, "global_step": 118794, "epoch": 2828} {"train_loss": -6.416037559509277, "global_step": 118795, "epoch": 2828} {"train_loss": -6.623464584350586, "global_step": 118796, "epoch": 2828} {"train_loss": -6.631994724273682, "global_step": 118797, "epoch": 2828} {"train_loss": -6.6163434982299805, "global_step": 118798, "epoch": 2828} {"train_loss": -6.53220272064209, "global_step": 118799, "epoch": 2828} {"train_loss": -6.558564186096191, "global_step": 118800, "epoch": 2828} {"train_loss": -6.484313488006592, "global_step": 118801, "epoch": 2828} {"train_loss": -6.504006862640381, "global_step": 118802, "epoch": 2828} {"train_loss": -6.576137065887451, "global_step": 118803, "epoch": 2828} {"train_loss": -6.356443881988525, "global_step": 118804, "epoch": 2828} {"train_loss": -6.506458282470703, "global_step": 118805, "epoch": 2828} {"train_loss": -6.496729850769043, "global_step": 118806, "epoch": 2828} {"train_loss": -6.458800315856934, "global_step": 118807, "epoch": 2828} {"train_loss": -6.373523235321045, "global_step": 118808, "epoch": 2828} {"train_loss": -6.410312652587891, "global_step": 118809, "epoch": 2828} {"train_loss": -6.479335784912109, "global_step": 118810, "epoch": 2828} {"train_loss": -6.445076942443848, "global_step": 118811, "epoch": 2828} {"train_loss": -6.47029447555542, "global_step": 118812, "epoch": 2828} {"train_loss": -6.540404796600342, "global_step": 118813, "epoch": 2828} {"train_loss": -6.378576278686523, "global_step": 118814, "epoch": 2828} {"train_loss": -6.581429958343506, "global_step": 118815, "epoch": 2828} {"train_loss": -6.537449836730957, "global_step": 118816, "epoch": 2828} {"train_loss": -6.515570901689076, "global_step": 118817, "epoch": 2828, "val_loss": 67988.7109375} {"train_loss": -6.4646196365356445, "global_step": 118818, "epoch": 2829} {"train_loss": -6.525805473327637, "global_step": 118819, "epoch": 2829} {"train_loss": -6.4568305015563965, "global_step": 118820, "epoch": 2829} {"train_loss": -6.508340835571289, "global_step": 118821, "epoch": 2829} {"train_loss": -6.578114986419678, "global_step": 118822, "epoch": 2829} {"train_loss": -6.599739074707031, "global_step": 118823, "epoch": 2829} {"train_loss": -6.411321640014648, "global_step": 118824, "epoch": 2829} {"train_loss": -6.526065826416016, "global_step": 118825, "epoch": 2829} {"train_loss": -6.5010271072387695, "global_step": 118826, "epoch": 2829} {"train_loss": -6.573144912719727, "global_step": 118827, "epoch": 2829} {"train_loss": -6.548275470733643, "global_step": 118828, "epoch": 2829} {"train_loss": -6.489108085632324, "global_step": 118829, "epoch": 2829} {"train_loss": -6.603836536407471, "global_step": 118830, "epoch": 2829} {"train_loss": -6.442018508911133, "global_step": 118831, "epoch": 2829} {"train_loss": -6.563144207000732, "global_step": 118832, "epoch": 2829} {"train_loss": -6.448936939239502, "global_step": 118833, "epoch": 2829} {"train_loss": -6.517245292663574, "global_step": 118834, "epoch": 2829} {"train_loss": -6.468311309814453, "global_step": 118835, "epoch": 2829} {"train_loss": -6.544096946716309, "global_step": 118836, "epoch": 2829} {"train_loss": -6.637584686279297, "global_step": 118837, "epoch": 2829} {"train_loss": -6.510251522064209, "global_step": 118838, "epoch": 2829} {"train_loss": -6.509128570556641, "global_step": 118839, "epoch": 2829} {"train_loss": -6.443448066711426, "global_step": 118840, "epoch": 2829} {"train_loss": -6.482471466064453, "global_step": 118841, "epoch": 2829} {"train_loss": -6.572021484375, "global_step": 118842, "epoch": 2829} {"train_loss": -6.380829811096191, "global_step": 118843, "epoch": 2829} {"train_loss": -6.539624214172363, "global_step": 118844, "epoch": 2829} {"train_loss": -6.604737281799316, "global_step": 118845, "epoch": 2829} {"train_loss": -6.532455921173096, "global_step": 118846, "epoch": 2829} {"train_loss": -6.468288421630859, "global_step": 118847, "epoch": 2829} {"train_loss": -6.460731029510498, "global_step": 118848, "epoch": 2829} {"train_loss": -6.583245277404785, "global_step": 118849, "epoch": 2829} {"train_loss": -6.735675811767578, "global_step": 118850, "epoch": 2829} {"train_loss": -6.468595027923584, "global_step": 118851, "epoch": 2829} {"train_loss": -6.525826454162598, "global_step": 118852, "epoch": 2829} {"train_loss": -6.610480308532715, "global_step": 118853, "epoch": 2829} {"train_loss": -6.471142768859863, "global_step": 118854, "epoch": 2829} {"train_loss": -6.420891761779785, "global_step": 118855, "epoch": 2829} {"train_loss": -6.598226547241211, "global_step": 118856, "epoch": 2829} {"train_loss": -6.591171741485596, "global_step": 118857, "epoch": 2829} {"train_loss": -6.6208906173706055, "global_step": 118858, "epoch": 2829} {"train_loss": -6.523712907518659, "global_step": 118859, "epoch": 2829, "val_loss": 67966.6484375} {"train_loss": -6.665036201477051, "global_step": 118860, "epoch": 2830} {"train_loss": -6.513795375823975, "global_step": 118861, "epoch": 2830} {"train_loss": -6.582368850708008, "global_step": 118862, "epoch": 2830} {"train_loss": -6.577585220336914, "global_step": 118863, "epoch": 2830} {"train_loss": -6.495501518249512, "global_step": 118864, "epoch": 2830} {"train_loss": -6.4548187255859375, "global_step": 118865, "epoch": 2830} {"train_loss": -6.543407440185547, "global_step": 118866, "epoch": 2830} {"train_loss": -6.403903961181641, "global_step": 118867, "epoch": 2830} {"train_loss": -6.417006492614746, "global_step": 118868, "epoch": 2830} {"train_loss": -6.351752281188965, "global_step": 118869, "epoch": 2830} {"train_loss": -6.600550174713135, "global_step": 118870, "epoch": 2830} {"train_loss": -6.363674640655518, "global_step": 118871, "epoch": 2830} {"train_loss": -6.458884239196777, "global_step": 118872, "epoch": 2830} {"train_loss": -6.631436347961426, "global_step": 118873, "epoch": 2830} {"train_loss": -6.39227294921875, "global_step": 118874, "epoch": 2830} {"train_loss": -6.543817043304443, "global_step": 118875, "epoch": 2830} {"train_loss": -6.47644567489624, "global_step": 118876, "epoch": 2830} {"train_loss": -6.447397232055664, "global_step": 118877, "epoch": 2830} {"train_loss": -6.517173767089844, "global_step": 118878, "epoch": 2830} {"train_loss": -6.493145942687988, "global_step": 118879, "epoch": 2830} {"train_loss": -6.503641128540039, "global_step": 118880, "epoch": 2830} {"train_loss": -6.551801681518555, "global_step": 118881, "epoch": 2830} {"train_loss": -6.535574436187744, "global_step": 118882, "epoch": 2830} {"train_loss": -6.457372665405273, "global_step": 118883, "epoch": 2830} {"train_loss": -6.49434757232666, "global_step": 118884, "epoch": 2830} {"train_loss": -6.472869873046875, "global_step": 118885, "epoch": 2830} {"train_loss": -6.542271137237549, "global_step": 118886, "epoch": 2830} {"train_loss": -6.4246344566345215, "global_step": 118887, "epoch": 2830} {"train_loss": -6.589975357055664, "global_step": 118888, "epoch": 2830} {"train_loss": -6.405817031860352, "global_step": 118889, "epoch": 2830} {"train_loss": -6.354083061218262, "global_step": 118890, "epoch": 2830} {"train_loss": -6.470476150512695, "global_step": 118891, "epoch": 2830} {"train_loss": -6.362675666809082, "global_step": 118892, "epoch": 2830} {"train_loss": -6.410529136657715, "global_step": 118893, "epoch": 2830} {"train_loss": -6.423983573913574, "global_step": 118894, "epoch": 2830} {"train_loss": -6.457021236419678, "global_step": 118895, "epoch": 2830} {"train_loss": -6.598421096801758, "global_step": 118896, "epoch": 2830} {"train_loss": -6.519874572753906, "global_step": 118897, "epoch": 2830} {"train_loss": -6.470563888549805, "global_step": 118898, "epoch": 2830} {"train_loss": -6.639226913452148, "global_step": 118899, "epoch": 2830} {"train_loss": -6.489214897155762, "global_step": 118900, "epoch": 2830} {"train_loss": -6.488684688295637, "global_step": 118901, "epoch": 2830, "val_loss": 67863.59375} {"train_loss": -6.578117847442627, "global_step": 118902, "epoch": 2831} {"train_loss": -6.5162129402160645, "global_step": 118903, "epoch": 2831} {"train_loss": -6.429111480712891, "global_step": 118904, "epoch": 2831} {"train_loss": -6.488922595977783, "global_step": 118905, "epoch": 2831} {"train_loss": -6.531939506530762, "global_step": 118906, "epoch": 2831} {"train_loss": -6.435083389282227, "global_step": 118907, "epoch": 2831} {"train_loss": -6.6778154373168945, "global_step": 118908, "epoch": 2831} {"train_loss": -6.509057998657227, "global_step": 118909, "epoch": 2831} {"train_loss": -6.536651134490967, "global_step": 118910, "epoch": 2831} {"train_loss": -6.550754547119141, "global_step": 118911, "epoch": 2831} {"train_loss": -6.605496406555176, "global_step": 118912, "epoch": 2831} {"train_loss": -6.560663223266602, "global_step": 118913, "epoch": 2831} {"train_loss": -6.5012125968933105, "global_step": 118914, "epoch": 2831} {"train_loss": -6.5241379737854, "global_step": 118915, "epoch": 2831} {"train_loss": -6.482640266418457, "global_step": 118916, "epoch": 2831} {"train_loss": -6.57155704498291, "global_step": 118917, "epoch": 2831} {"train_loss": -6.430525779724121, "global_step": 118918, "epoch": 2831} {"train_loss": -6.40643835067749, "global_step": 118919, "epoch": 2831} {"train_loss": -6.402338027954102, "global_step": 118920, "epoch": 2831} {"train_loss": -6.590283393859863, "global_step": 118921, "epoch": 2831} {"train_loss": -6.529549598693848, "global_step": 118922, "epoch": 2831} {"train_loss": -6.455474376678467, "global_step": 118923, "epoch": 2831} {"train_loss": -6.542750358581543, "global_step": 118924, "epoch": 2831} {"train_loss": -6.4077558517456055, "global_step": 118925, "epoch": 2831} {"train_loss": -6.615113735198975, "global_step": 118926, "epoch": 2831} {"train_loss": -6.520786285400391, "global_step": 118927, "epoch": 2831} {"train_loss": -6.524951934814453, "global_step": 118928, "epoch": 2831} {"train_loss": -6.541993141174316, "global_step": 118929, "epoch": 2831} {"train_loss": -6.4432172775268555, "global_step": 118930, "epoch": 2831} {"train_loss": -6.461341857910156, "global_step": 118931, "epoch": 2831} {"train_loss": -6.549941062927246, "global_step": 118932, "epoch": 2831} {"train_loss": -6.571272373199463, "global_step": 118933, "epoch": 2831} {"train_loss": -6.605181694030762, "global_step": 118934, "epoch": 2831} {"train_loss": -6.558011054992676, "global_step": 118935, "epoch": 2831} {"train_loss": -6.5627899169921875, "global_step": 118936, "epoch": 2831} {"train_loss": -6.475362300872803, "global_step": 118937, "epoch": 2831} {"train_loss": -6.532812118530273, "global_step": 118938, "epoch": 2831} {"train_loss": -6.595324993133545, "global_step": 118939, "epoch": 2831} {"train_loss": -6.554652690887451, "global_step": 118940, "epoch": 2831} {"train_loss": -6.525943756103516, "global_step": 118941, "epoch": 2831} {"train_loss": -6.513752460479736, "global_step": 118942, "epoch": 2831} {"train_loss": -6.522621847334362, "global_step": 118943, "epoch": 2831, "val_loss": 67905.390625} {"train_loss": -6.425342559814453, "global_step": 118944, "epoch": 2832} {"train_loss": -6.452513694763184, "global_step": 118945, "epoch": 2832} {"train_loss": -6.450613975524902, "global_step": 118946, "epoch": 2832} {"train_loss": -6.595789909362793, "global_step": 118947, "epoch": 2832} {"train_loss": -6.4554643630981445, "global_step": 118948, "epoch": 2832} {"train_loss": -6.576227188110352, "global_step": 118949, "epoch": 2832} {"train_loss": -6.528680801391602, "global_step": 118950, "epoch": 2832} {"train_loss": -6.569845199584961, "global_step": 118951, "epoch": 2832} {"train_loss": -6.553885459899902, "global_step": 118952, "epoch": 2832} {"train_loss": -6.562868595123291, "global_step": 118953, "epoch": 2832} {"train_loss": -6.573404312133789, "global_step": 118954, "epoch": 2832} {"train_loss": -6.618650436401367, "global_step": 118955, "epoch": 2832} {"train_loss": -6.5500288009643555, "global_step": 118956, "epoch": 2832} {"train_loss": -6.460348606109619, "global_step": 118957, "epoch": 2832} {"train_loss": -6.399179935455322, "global_step": 118958, "epoch": 2832} {"train_loss": -6.545351028442383, "global_step": 118959, "epoch": 2832} {"train_loss": -6.511910438537598, "global_step": 118960, "epoch": 2832} {"train_loss": -6.507899761199951, "global_step": 118961, "epoch": 2832} {"train_loss": -6.623954772949219, "global_step": 118962, "epoch": 2832} {"train_loss": -6.5160746574401855, "global_step": 118963, "epoch": 2832} {"train_loss": -6.626713752746582, "global_step": 118964, "epoch": 2832} {"train_loss": -6.592564105987549, "global_step": 118965, "epoch": 2832} {"train_loss": -6.648001670837402, "global_step": 118966, "epoch": 2832} {"train_loss": -6.625749588012695, "global_step": 118967, "epoch": 2832} {"train_loss": -6.5330810546875, "global_step": 118968, "epoch": 2832} {"train_loss": -6.599486351013184, "global_step": 118969, "epoch": 2832} {"train_loss": -6.640276908874512, "global_step": 118970, "epoch": 2832} {"train_loss": -6.642389297485352, "global_step": 118971, "epoch": 2832} {"train_loss": -6.668216705322266, "global_step": 118972, "epoch": 2832} {"train_loss": -6.5177388191223145, "global_step": 118973, "epoch": 2832} {"train_loss": -6.608499050140381, "global_step": 118974, "epoch": 2832} {"train_loss": -6.465788841247559, "global_step": 118975, "epoch": 2832} {"train_loss": -6.6338043212890625, "global_step": 118976, "epoch": 2832} {"train_loss": -6.555516242980957, "global_step": 118977, "epoch": 2832} {"train_loss": -6.38947057723999, "global_step": 118978, "epoch": 2832} {"train_loss": -6.523349285125732, "global_step": 118979, "epoch": 2832} {"train_loss": -6.643155097961426, "global_step": 118980, "epoch": 2832} {"train_loss": -6.469208717346191, "global_step": 118981, "epoch": 2832} {"train_loss": -6.5007781982421875, "global_step": 118982, "epoch": 2832} {"train_loss": -6.633164405822754, "global_step": 118983, "epoch": 2832} {"train_loss": -6.570380210876465, "global_step": 118984, "epoch": 2832} {"train_loss": -6.551043782915388, "global_step": 118985, "epoch": 2832, "val_loss": 67818.828125} {"train_loss": -6.538789749145508, "global_step": 118986, "epoch": 2833} {"train_loss": -6.644643783569336, "global_step": 118987, "epoch": 2833} {"train_loss": -6.515448093414307, "global_step": 118988, "epoch": 2833} {"train_loss": -6.561554908752441, "global_step": 118989, "epoch": 2833} {"train_loss": -6.594603061676025, "global_step": 118990, "epoch": 2833} {"train_loss": -6.6210737228393555, "global_step": 118991, "epoch": 2833} {"train_loss": -6.59427547454834, "global_step": 118992, "epoch": 2833} {"train_loss": -6.562312126159668, "global_step": 118993, "epoch": 2833} {"train_loss": -6.588488578796387, "global_step": 118994, "epoch": 2833} {"train_loss": -6.555779457092285, "global_step": 118995, "epoch": 2833} {"train_loss": -6.529894828796387, "global_step": 118996, "epoch": 2833} {"train_loss": -6.632810592651367, "global_step": 118997, "epoch": 2833} {"train_loss": -6.501867294311523, "global_step": 118998, "epoch": 2833} {"train_loss": -6.64607572555542, "global_step": 118999, "epoch": 2833} {"train_loss": -6.5302839279174805, "global_step": 119000, "epoch": 2833} {"train_loss": -6.569462776184082, "global_step": 119001, "epoch": 2833} {"train_loss": -6.594351768493652, "global_step": 119002, "epoch": 2833} {"train_loss": -6.648408889770508, "global_step": 119003, "epoch": 2833} {"train_loss": -6.541468620300293, "global_step": 119004, "epoch": 2833} {"train_loss": -6.440374374389648, "global_step": 119005, "epoch": 2833} {"train_loss": -6.569809913635254, "global_step": 119006, "epoch": 2833} {"train_loss": -6.517591953277588, "global_step": 119007, "epoch": 2833} {"train_loss": -6.609787940979004, "global_step": 119008, "epoch": 2833} {"train_loss": -6.513227462768555, "global_step": 119009, "epoch": 2833} {"train_loss": -6.590316295623779, "global_step": 119010, "epoch": 2833} {"train_loss": -6.348813056945801, "global_step": 119011, "epoch": 2833} {"train_loss": -6.489980220794678, "global_step": 119012, "epoch": 2833} {"train_loss": -6.389509201049805, "global_step": 119013, "epoch": 2833} {"train_loss": -6.591336250305176, "global_step": 119014, "epoch": 2833} {"train_loss": -6.517728805541992, "global_step": 119015, "epoch": 2833} {"train_loss": -6.413352012634277, "global_step": 119016, "epoch": 2833} {"train_loss": -6.485600471496582, "global_step": 119017, "epoch": 2833} {"train_loss": -6.4568915367126465, "global_step": 119018, "epoch": 2833} {"train_loss": -6.334244728088379, "global_step": 119019, "epoch": 2833} {"train_loss": -6.446796894073486, "global_step": 119020, "epoch": 2833} {"train_loss": -6.370439052581787, "global_step": 119021, "epoch": 2833} {"train_loss": -6.465235710144043, "global_step": 119022, "epoch": 2833} {"train_loss": -6.4995222091674805, "global_step": 119023, "epoch": 2833} {"train_loss": -6.410683631896973, "global_step": 119024, "epoch": 2833} {"train_loss": -6.343167304992676, "global_step": 119025, "epoch": 2833} {"train_loss": -6.413417816162109, "global_step": 119026, "epoch": 2833} {"train_loss": -6.5143538656688875, "global_step": 119027, "epoch": 2833, "val_loss": 68003.5} {"train_loss": -6.511593341827393, "global_step": 119028, "epoch": 2834} {"train_loss": -6.380390644073486, "global_step": 119029, "epoch": 2834} {"train_loss": -6.386489391326904, "global_step": 119030, "epoch": 2834} {"train_loss": -6.373600006103516, "global_step": 119031, "epoch": 2834} {"train_loss": -6.292280197143555, "global_step": 119032, "epoch": 2834} {"train_loss": -6.408316612243652, "global_step": 119033, "epoch": 2834} {"train_loss": -6.458580493927002, "global_step": 119034, "epoch": 2834} {"train_loss": -6.54795503616333, "global_step": 119035, "epoch": 2834} {"train_loss": -6.394519805908203, "global_step": 119036, "epoch": 2834} {"train_loss": -6.468883037567139, "global_step": 119037, "epoch": 2834} {"train_loss": -6.501977443695068, "global_step": 119038, "epoch": 2834} {"train_loss": -6.481243133544922, "global_step": 119039, "epoch": 2834} {"train_loss": -6.5249433517456055, "global_step": 119040, "epoch": 2834} {"train_loss": -6.391232013702393, "global_step": 119041, "epoch": 2834} {"train_loss": -6.438714504241943, "global_step": 119042, "epoch": 2834} {"train_loss": -6.361851692199707, "global_step": 119043, "epoch": 2834} {"train_loss": -6.416993618011475, "global_step": 119044, "epoch": 2834} {"train_loss": -6.411191940307617, "global_step": 119045, "epoch": 2834} {"train_loss": -6.421743392944336, "global_step": 119046, "epoch": 2834} {"train_loss": -6.410895347595215, "global_step": 119047, "epoch": 2834} {"train_loss": -6.525605201721191, "global_step": 119048, "epoch": 2834} {"train_loss": -6.534516334533691, "global_step": 119049, "epoch": 2834} {"train_loss": -6.447761058807373, "global_step": 119050, "epoch": 2834} {"train_loss": -6.411467552185059, "global_step": 119051, "epoch": 2834} {"train_loss": -6.435276985168457, "global_step": 119052, "epoch": 2834} {"train_loss": -6.613047122955322, "global_step": 119053, "epoch": 2834} {"train_loss": -6.456496238708496, "global_step": 119054, "epoch": 2834} {"train_loss": -6.474546909332275, "global_step": 119055, "epoch": 2834} {"train_loss": -6.500701427459717, "global_step": 119056, "epoch": 2834} {"train_loss": -6.429647922515869, "global_step": 119057, "epoch": 2834} {"train_loss": -6.548185348510742, "global_step": 119058, "epoch": 2834} {"train_loss": -6.438883304595947, "global_step": 119059, "epoch": 2834} {"train_loss": -6.489322185516357, "global_step": 119060, "epoch": 2834} {"train_loss": -6.409885406494141, "global_step": 119061, "epoch": 2834} {"train_loss": -6.488908767700195, "global_step": 119062, "epoch": 2834} {"train_loss": -6.540884017944336, "global_step": 119063, "epoch": 2834} {"train_loss": -6.438775062561035, "global_step": 119064, "epoch": 2834} {"train_loss": -6.597797870635986, "global_step": 119065, "epoch": 2834} {"train_loss": -6.529829025268555, "global_step": 119066, "epoch": 2834} {"train_loss": -6.429196357727051, "global_step": 119067, "epoch": 2834} {"train_loss": -6.463708400726318, "global_step": 119068, "epoch": 2834} {"train_loss": -6.458717811675299, "global_step": 119069, "epoch": 2834, "val_loss": 67949.234375} {"train_loss": -6.5585784912109375, "global_step": 119070, "epoch": 2835} {"train_loss": -6.583402633666992, "global_step": 119071, "epoch": 2835} {"train_loss": -6.496196746826172, "global_step": 119072, "epoch": 2835} {"train_loss": -6.578415870666504, "global_step": 119073, "epoch": 2835} {"train_loss": -6.578012466430664, "global_step": 119074, "epoch": 2835} {"train_loss": -6.509793758392334, "global_step": 119075, "epoch": 2835} {"train_loss": -6.592317581176758, "global_step": 119076, "epoch": 2835} {"train_loss": -6.560348033905029, "global_step": 119077, "epoch": 2835} {"train_loss": -6.419515609741211, "global_step": 119078, "epoch": 2835} {"train_loss": -6.512557029724121, "global_step": 119079, "epoch": 2835} {"train_loss": -6.473308563232422, "global_step": 119080, "epoch": 2835} {"train_loss": -6.4178547859191895, "global_step": 119081, "epoch": 2835} {"train_loss": -6.521169662475586, "global_step": 119082, "epoch": 2835} {"train_loss": -6.600578784942627, "global_step": 119083, "epoch": 2835} {"train_loss": -6.621743202209473, "global_step": 119084, "epoch": 2835} {"train_loss": -6.514927387237549, "global_step": 119085, "epoch": 2835} {"train_loss": -6.503278732299805, "global_step": 119086, "epoch": 2835} {"train_loss": -6.615291595458984, "global_step": 119087, "epoch": 2835} {"train_loss": -6.584109306335449, "global_step": 119088, "epoch": 2835} {"train_loss": -6.595105171203613, "global_step": 119089, "epoch": 2835} {"train_loss": -6.542922019958496, "global_step": 119090, "epoch": 2835} {"train_loss": -6.503434658050537, "global_step": 119091, "epoch": 2835} {"train_loss": -6.456949710845947, "global_step": 119092, "epoch": 2835} {"train_loss": -6.522275924682617, "global_step": 119093, "epoch": 2835} {"train_loss": -6.654265403747559, "global_step": 119094, "epoch": 2835} {"train_loss": -6.59407901763916, "global_step": 119095, "epoch": 2835} {"train_loss": -6.503951072692871, "global_step": 119096, "epoch": 2835} {"train_loss": -6.551012992858887, "global_step": 119097, "epoch": 2835} {"train_loss": -6.561718940734863, "global_step": 119098, "epoch": 2835} {"train_loss": -6.491630554199219, "global_step": 119099, "epoch": 2835} {"train_loss": -6.576471328735352, "global_step": 119100, "epoch": 2835} {"train_loss": -6.490919589996338, "global_step": 119101, "epoch": 2835} {"train_loss": -6.574671268463135, "global_step": 119102, "epoch": 2835} {"train_loss": -6.544878959655762, "global_step": 119103, "epoch": 2835} {"train_loss": -6.663369178771973, "global_step": 119104, "epoch": 2835} {"train_loss": -6.44191837310791, "global_step": 119105, "epoch": 2835} {"train_loss": -6.527491569519043, "global_step": 119106, "epoch": 2835} {"train_loss": -6.515827178955078, "global_step": 119107, "epoch": 2835} {"train_loss": -6.596263885498047, "global_step": 119108, "epoch": 2835} {"train_loss": -6.428265571594238, "global_step": 119109, "epoch": 2835} {"train_loss": -6.567756175994873, "global_step": 119110, "epoch": 2835} {"train_loss": -6.542655150095622, "global_step": 119111, "epoch": 2835, "val_loss": 68031.859375} {"train_loss": -6.529997825622559, "global_step": 119112, "epoch": 2836} {"train_loss": -6.377861976623535, "global_step": 119113, "epoch": 2836} {"train_loss": -6.50159215927124, "global_step": 119114, "epoch": 2836} {"train_loss": -6.5280256271362305, "global_step": 119115, "epoch": 2836} {"train_loss": -6.560344219207764, "global_step": 119116, "epoch": 2836} {"train_loss": -6.620555400848389, "global_step": 119117, "epoch": 2836} {"train_loss": -6.582432270050049, "global_step": 119118, "epoch": 2836} {"train_loss": -6.439988136291504, "global_step": 119119, "epoch": 2836} {"train_loss": -6.681138038635254, "global_step": 119120, "epoch": 2836} {"train_loss": -6.576131343841553, "global_step": 119121, "epoch": 2836} {"train_loss": -6.664214611053467, "global_step": 119122, "epoch": 2836} {"train_loss": -6.580227375030518, "global_step": 119123, "epoch": 2836} {"train_loss": -6.652002334594727, "global_step": 119124, "epoch": 2836} {"train_loss": -6.596194267272949, "global_step": 119125, "epoch": 2836} {"train_loss": -6.596856117248535, "global_step": 119126, "epoch": 2836} {"train_loss": -6.595128059387207, "global_step": 119127, "epoch": 2836} {"train_loss": -6.568236827850342, "global_step": 119128, "epoch": 2836} {"train_loss": -6.48007869720459, "global_step": 119129, "epoch": 2836} {"train_loss": -6.539888381958008, "global_step": 119130, "epoch": 2836} {"train_loss": -6.583345413208008, "global_step": 119131, "epoch": 2836} {"train_loss": -6.46502685546875, "global_step": 119132, "epoch": 2836} {"train_loss": -6.385439395904541, "global_step": 119133, "epoch": 2836} {"train_loss": -6.56712532043457, "global_step": 119134, "epoch": 2836} {"train_loss": -6.578060150146484, "global_step": 119135, "epoch": 2836} {"train_loss": -6.420496940612793, "global_step": 119136, "epoch": 2836} {"train_loss": -6.546506881713867, "global_step": 119137, "epoch": 2836} {"train_loss": -6.636862754821777, "global_step": 119138, "epoch": 2836} {"train_loss": -6.541354179382324, "global_step": 119139, "epoch": 2836} {"train_loss": -6.486462593078613, "global_step": 119140, "epoch": 2836} {"train_loss": -6.570837020874023, "global_step": 119141, "epoch": 2836} {"train_loss": -6.471573829650879, "global_step": 119142, "epoch": 2836} {"train_loss": -6.404824733734131, "global_step": 119143, "epoch": 2836} {"train_loss": -6.53878116607666, "global_step": 119144, "epoch": 2836} {"train_loss": -6.6214399337768555, "global_step": 119145, "epoch": 2836} {"train_loss": -6.429513931274414, "global_step": 119146, "epoch": 2836} {"train_loss": -6.487964630126953, "global_step": 119147, "epoch": 2836} {"train_loss": -6.516875267028809, "global_step": 119148, "epoch": 2836} {"train_loss": -6.476391792297363, "global_step": 119149, "epoch": 2836} {"train_loss": -6.549289703369141, "global_step": 119150, "epoch": 2836} {"train_loss": -6.506053924560547, "global_step": 119151, "epoch": 2836} {"train_loss": -6.551272392272949, "global_step": 119152, "epoch": 2836} {"train_loss": -6.537882464272635, "global_step": 119153, "epoch": 2836, "val_loss": 68101.4140625} {"train_loss": -6.444379806518555, "global_step": 119154, "epoch": 2837} {"train_loss": -6.346452236175537, "global_step": 119155, "epoch": 2837} {"train_loss": -6.456282615661621, "global_step": 119156, "epoch": 2837} {"train_loss": -6.680312156677246, "global_step": 119157, "epoch": 2837} {"train_loss": -6.4660844802856445, "global_step": 119158, "epoch": 2837} {"train_loss": -6.547502517700195, "global_step": 119159, "epoch": 2837} {"train_loss": -6.491542816162109, "global_step": 119160, "epoch": 2837} {"train_loss": -6.536838531494141, "global_step": 119161, "epoch": 2837} {"train_loss": -6.420631408691406, "global_step": 119162, "epoch": 2837} {"train_loss": -6.4611897468566895, "global_step": 119163, "epoch": 2837} {"train_loss": -6.493595123291016, "global_step": 119164, "epoch": 2837} {"train_loss": -6.47318172454834, "global_step": 119165, "epoch": 2837} {"train_loss": -6.498466491699219, "global_step": 119166, "epoch": 2837} {"train_loss": -6.48372745513916, "global_step": 119167, "epoch": 2837} {"train_loss": -6.371888160705566, "global_step": 119168, "epoch": 2837} {"train_loss": -6.506448745727539, "global_step": 119169, "epoch": 2837} {"train_loss": -6.462739944458008, "global_step": 119170, "epoch": 2837} {"train_loss": -6.469227313995361, "global_step": 119171, "epoch": 2837} {"train_loss": -6.536007881164551, "global_step": 119172, "epoch": 2837} {"train_loss": -6.545244216918945, "global_step": 119173, "epoch": 2837} {"train_loss": -6.539342880249023, "global_step": 119174, "epoch": 2837} {"train_loss": -6.474347114562988, "global_step": 119175, "epoch": 2837} {"train_loss": -6.448357582092285, "global_step": 119176, "epoch": 2837} {"train_loss": -6.6323041915893555, "global_step": 119177, "epoch": 2837} {"train_loss": -6.508711814880371, "global_step": 119178, "epoch": 2837} {"train_loss": -6.5701212882995605, "global_step": 119179, "epoch": 2837} {"train_loss": -6.540737152099609, "global_step": 119180, "epoch": 2837} {"train_loss": -6.559943199157715, "global_step": 119181, "epoch": 2837} {"train_loss": -6.507063865661621, "global_step": 119182, "epoch": 2837} {"train_loss": -6.548314094543457, "global_step": 119183, "epoch": 2837} {"train_loss": -6.4317545890808105, "global_step": 119184, "epoch": 2837} {"train_loss": -6.662751197814941, "global_step": 119185, "epoch": 2837} {"train_loss": -6.4429826736450195, "global_step": 119186, "epoch": 2837} {"train_loss": -6.571113586425781, "global_step": 119187, "epoch": 2837} {"train_loss": -6.607639312744141, "global_step": 119188, "epoch": 2837} {"train_loss": -6.405029296875, "global_step": 119189, "epoch": 2837} {"train_loss": -6.42716121673584, "global_step": 119190, "epoch": 2837} {"train_loss": -6.498064994812012, "global_step": 119191, "epoch": 2837} {"train_loss": -6.467353820800781, "global_step": 119192, "epoch": 2837} {"train_loss": -6.501433372497559, "global_step": 119193, "epoch": 2837} {"train_loss": -6.342436790466309, "global_step": 119194, "epoch": 2837} {"train_loss": -6.49641878264291, "global_step": 119195, "epoch": 2837, "val_loss": 68162.671875} {"train_loss": -6.563131332397461, "global_step": 119196, "epoch": 2838} {"train_loss": -6.525891304016113, "global_step": 119197, "epoch": 2838} {"train_loss": -6.538299560546875, "global_step": 119198, "epoch": 2838} {"train_loss": -6.576421737670898, "global_step": 119199, "epoch": 2838} {"train_loss": -6.48976993560791, "global_step": 119200, "epoch": 2838} {"train_loss": -6.560686111450195, "global_step": 119201, "epoch": 2838} {"train_loss": -6.399379730224609, "global_step": 119202, "epoch": 2838} {"train_loss": -6.427210807800293, "global_step": 119203, "epoch": 2838} {"train_loss": -6.554000377655029, "global_step": 119204, "epoch": 2838} {"train_loss": -6.566497325897217, "global_step": 119205, "epoch": 2838} {"train_loss": -6.519412040710449, "global_step": 119206, "epoch": 2838} {"train_loss": -6.5044846534729, "global_step": 119207, "epoch": 2838} {"train_loss": -6.483713150024414, "global_step": 119208, "epoch": 2838} {"train_loss": -6.638676643371582, "global_step": 119209, "epoch": 2838} {"train_loss": -6.587652206420898, "global_step": 119210, "epoch": 2838} {"train_loss": -6.49938440322876, "global_step": 119211, "epoch": 2838} {"train_loss": -6.399693489074707, "global_step": 119212, "epoch": 2838} {"train_loss": -6.534734725952148, "global_step": 119213, "epoch": 2838} {"train_loss": -6.5218424797058105, "global_step": 119214, "epoch": 2838} {"train_loss": -6.509914398193359, "global_step": 119215, "epoch": 2838} {"train_loss": -6.544562339782715, "global_step": 119216, "epoch": 2838} {"train_loss": -6.661389350891113, "global_step": 119217, "epoch": 2838} {"train_loss": -6.554111957550049, "global_step": 119218, "epoch": 2838} {"train_loss": -6.493510723114014, "global_step": 119219, "epoch": 2838} {"train_loss": -6.59550666809082, "global_step": 119220, "epoch": 2838} {"train_loss": -6.45022439956665, "global_step": 119221, "epoch": 2838} {"train_loss": -6.57344388961792, "global_step": 119222, "epoch": 2838} {"train_loss": -6.545864105224609, "global_step": 119223, "epoch": 2838} {"train_loss": -6.680549621582031, "global_step": 119224, "epoch": 2838} {"train_loss": -6.474893569946289, "global_step": 119225, "epoch": 2838} {"train_loss": -6.609636306762695, "global_step": 119226, "epoch": 2838} {"train_loss": -6.577723503112793, "global_step": 119227, "epoch": 2838} {"train_loss": -6.550807952880859, "global_step": 119228, "epoch": 2838} {"train_loss": -6.4162797927856445, "global_step": 119229, "epoch": 2838} {"train_loss": -6.601126670837402, "global_step": 119230, "epoch": 2838} {"train_loss": -6.623866081237793, "global_step": 119231, "epoch": 2838} {"train_loss": -6.452281475067139, "global_step": 119232, "epoch": 2838} {"train_loss": -6.413793563842773, "global_step": 119233, "epoch": 2838} {"train_loss": -6.610646724700928, "global_step": 119234, "epoch": 2838} {"train_loss": -6.525464057922363, "global_step": 119235, "epoch": 2838} {"train_loss": -6.571620941162109, "global_step": 119236, "epoch": 2838} {"train_loss": -6.535347654705956, "global_step": 119237, "epoch": 2838, "val_loss": 67799.2734375} {"train_loss": -6.5994977951049805, "global_step": 119238, "epoch": 2839} {"train_loss": -6.60232400894165, "global_step": 119239, "epoch": 2839} {"train_loss": -6.652149200439453, "global_step": 119240, "epoch": 2839} {"train_loss": -6.511302947998047, "global_step": 119241, "epoch": 2839} {"train_loss": -6.5649495124816895, "global_step": 119242, "epoch": 2839} {"train_loss": -6.49323844909668, "global_step": 119243, "epoch": 2839} {"train_loss": -6.346928119659424, "global_step": 119244, "epoch": 2839} {"train_loss": -6.6628522872924805, "global_step": 119245, "epoch": 2839} {"train_loss": -6.449411392211914, "global_step": 119246, "epoch": 2839} {"train_loss": -6.489461898803711, "global_step": 119247, "epoch": 2839} {"train_loss": -6.503880500793457, "global_step": 119248, "epoch": 2839} {"train_loss": -6.524932861328125, "global_step": 119249, "epoch": 2839} {"train_loss": -6.575593948364258, "global_step": 119250, "epoch": 2839} {"train_loss": -6.588355541229248, "global_step": 119251, "epoch": 2839} {"train_loss": -6.530060768127441, "global_step": 119252, "epoch": 2839} {"train_loss": -6.5245771408081055, "global_step": 119253, "epoch": 2839} {"train_loss": -6.519268989562988, "global_step": 119254, "epoch": 2839} {"train_loss": -6.540424346923828, "global_step": 119255, "epoch": 2839} {"train_loss": -6.536346435546875, "global_step": 119256, "epoch": 2839} {"train_loss": -6.562228679656982, "global_step": 119257, "epoch": 2839} {"train_loss": -6.516254425048828, "global_step": 119258, "epoch": 2839} {"train_loss": -6.560163974761963, "global_step": 119259, "epoch": 2839} {"train_loss": -6.565410614013672, "global_step": 119260, "epoch": 2839} {"train_loss": -6.575933456420898, "global_step": 119261, "epoch": 2839} {"train_loss": -6.585886001586914, "global_step": 119262, "epoch": 2839} {"train_loss": -6.50050163269043, "global_step": 119263, "epoch": 2839} {"train_loss": -6.409625053405762, "global_step": 119264, "epoch": 2839} {"train_loss": -6.569149971008301, "global_step": 119265, "epoch": 2839} {"train_loss": -6.490221977233887, "global_step": 119266, "epoch": 2839} {"train_loss": -6.459223747253418, "global_step": 119267, "epoch": 2839} {"train_loss": -6.615571022033691, "global_step": 119268, "epoch": 2839} {"train_loss": -6.430129528045654, "global_step": 119269, "epoch": 2839} {"train_loss": -6.379556655883789, "global_step": 119270, "epoch": 2839} {"train_loss": -6.594668388366699, "global_step": 119271, "epoch": 2839} {"train_loss": -6.3821563720703125, "global_step": 119272, "epoch": 2839} {"train_loss": -6.415928363800049, "global_step": 119273, "epoch": 2839} {"train_loss": -6.468820571899414, "global_step": 119274, "epoch": 2839} {"train_loss": -6.475834846496582, "global_step": 119275, "epoch": 2839} {"train_loss": -6.467954635620117, "global_step": 119276, "epoch": 2839} {"train_loss": -6.534750938415527, "global_step": 119277, "epoch": 2839} {"train_loss": -6.392956256866455, "global_step": 119278, "epoch": 2839} {"train_loss": -6.515471231369745, "global_step": 119279, "epoch": 2839, "val_loss": 67763.609375} {"train_loss": -6.521561145782471, "global_step": 119280, "epoch": 2840} {"train_loss": -6.434380531311035, "global_step": 119281, "epoch": 2840} {"train_loss": -6.410294532775879, "global_step": 119282, "epoch": 2840} {"train_loss": -6.485419750213623, "global_step": 119283, "epoch": 2840} {"train_loss": -6.516371726989746, "global_step": 119284, "epoch": 2840} {"train_loss": -6.589306831359863, "global_step": 119285, "epoch": 2840} {"train_loss": -6.401484966278076, "global_step": 119286, "epoch": 2840} {"train_loss": -6.3569440841674805, "global_step": 119287, "epoch": 2840} {"train_loss": -6.5150227546691895, "global_step": 119288, "epoch": 2840} {"train_loss": -6.543789863586426, "global_step": 119289, "epoch": 2840} {"train_loss": -6.507072448730469, "global_step": 119290, "epoch": 2840} {"train_loss": -6.5504865646362305, "global_step": 119291, "epoch": 2840} {"train_loss": -6.556087970733643, "global_step": 119292, "epoch": 2840} {"train_loss": -6.496002197265625, "global_step": 119293, "epoch": 2840} {"train_loss": -6.543827533721924, "global_step": 119294, "epoch": 2840} {"train_loss": -6.519096374511719, "global_step": 119295, "epoch": 2840} {"train_loss": -6.556817531585693, "global_step": 119296, "epoch": 2840} {"train_loss": -6.579193592071533, "global_step": 119297, "epoch": 2840} {"train_loss": -6.516844749450684, "global_step": 119298, "epoch": 2840} {"train_loss": -6.43502140045166, "global_step": 119299, "epoch": 2840} {"train_loss": -6.433947563171387, "global_step": 119300, "epoch": 2840} {"train_loss": -6.469799995422363, "global_step": 119301, "epoch": 2840} {"train_loss": -6.63004207611084, "global_step": 119302, "epoch": 2840} {"train_loss": -6.505687713623047, "global_step": 119303, "epoch": 2840} {"train_loss": -6.577178478240967, "global_step": 119304, "epoch": 2840} {"train_loss": -6.53070068359375, "global_step": 119305, "epoch": 2840} {"train_loss": -6.471688270568848, "global_step": 119306, "epoch": 2840} {"train_loss": -6.651492118835449, "global_step": 119307, "epoch": 2840} {"train_loss": -6.603882789611816, "global_step": 119308, "epoch": 2840} {"train_loss": -6.506513595581055, "global_step": 119309, "epoch": 2840} {"train_loss": -6.524145603179932, "global_step": 119310, "epoch": 2840} {"train_loss": -6.442836761474609, "global_step": 119311, "epoch": 2840} {"train_loss": -6.568312644958496, "global_step": 119312, "epoch": 2840} {"train_loss": -6.519660949707031, "global_step": 119313, "epoch": 2840} {"train_loss": -6.6304240226745605, "global_step": 119314, "epoch": 2840} {"train_loss": -6.537517070770264, "global_step": 119315, "epoch": 2840} {"train_loss": -6.398046493530273, "global_step": 119316, "epoch": 2840} {"train_loss": -6.651474475860596, "global_step": 119317, "epoch": 2840} {"train_loss": -6.660343170166016, "global_step": 119318, "epoch": 2840} {"train_loss": -6.580198764801025, "global_step": 119319, "epoch": 2840} {"train_loss": -6.672457695007324, "global_step": 119320, "epoch": 2840} {"train_loss": -6.5263936292557485, "global_step": 119321, "epoch": 2840, "val_loss": 67919.6796875} {"train_loss": -6.531268119812012, "global_step": 119322, "epoch": 2841} {"train_loss": -6.5717315673828125, "global_step": 119323, "epoch": 2841} {"train_loss": -6.686107158660889, "global_step": 119324, "epoch": 2841} {"train_loss": -6.537571907043457, "global_step": 119325, "epoch": 2841} {"train_loss": -6.652249336242676, "global_step": 119326, "epoch": 2841} {"train_loss": -6.613053321838379, "global_step": 119327, "epoch": 2841} {"train_loss": -6.655328750610352, "global_step": 119328, "epoch": 2841} {"train_loss": -6.542028903961182, "global_step": 119329, "epoch": 2841} {"train_loss": -6.600625991821289, "global_step": 119330, "epoch": 2841} {"train_loss": -6.470089912414551, "global_step": 119331, "epoch": 2841} {"train_loss": -6.459527015686035, "global_step": 119332, "epoch": 2841} {"train_loss": -6.56731653213501, "global_step": 119333, "epoch": 2841} {"train_loss": -6.610623359680176, "global_step": 119334, "epoch": 2841} {"train_loss": -6.514777183532715, "global_step": 119335, "epoch": 2841} {"train_loss": -6.614385604858398, "global_step": 119336, "epoch": 2841} {"train_loss": -6.500510215759277, "global_step": 119337, "epoch": 2841} {"train_loss": -6.509941577911377, "global_step": 119338, "epoch": 2841} {"train_loss": -6.42880916595459, "global_step": 119339, "epoch": 2841} {"train_loss": -6.474836349487305, "global_step": 119340, "epoch": 2841} {"train_loss": -6.5668158531188965, "global_step": 119341, "epoch": 2841} {"train_loss": -6.500884532928467, "global_step": 119342, "epoch": 2841} {"train_loss": -6.502745628356934, "global_step": 119343, "epoch": 2841} {"train_loss": -6.4986677169799805, "global_step": 119344, "epoch": 2841} {"train_loss": -6.589522361755371, "global_step": 119345, "epoch": 2841} {"train_loss": -6.535107612609863, "global_step": 119346, "epoch": 2841} {"train_loss": -6.527215003967285, "global_step": 119347, "epoch": 2841} {"train_loss": -6.631473541259766, "global_step": 119348, "epoch": 2841} {"train_loss": -6.570728302001953, "global_step": 119349, "epoch": 2841} {"train_loss": -6.576717853546143, "global_step": 119350, "epoch": 2841} {"train_loss": -6.526052951812744, "global_step": 119351, "epoch": 2841} {"train_loss": -6.717686653137207, "global_step": 119352, "epoch": 2841} {"train_loss": -6.694016933441162, "global_step": 119353, "epoch": 2841} {"train_loss": -6.576438903808594, "global_step": 119354, "epoch": 2841} {"train_loss": -6.678119659423828, "global_step": 119355, "epoch": 2841} {"train_loss": -6.513376235961914, "global_step": 119356, "epoch": 2841} {"train_loss": -6.581817626953125, "global_step": 119357, "epoch": 2841} {"train_loss": -6.46586799621582, "global_step": 119358, "epoch": 2841} {"train_loss": -6.552706241607666, "global_step": 119359, "epoch": 2841} {"train_loss": -6.390918254852295, "global_step": 119360, "epoch": 2841} {"train_loss": -6.562828063964844, "global_step": 119361, "epoch": 2841} {"train_loss": -6.507575035095215, "global_step": 119362, "epoch": 2841} {"train_loss": -6.554444347109113, "global_step": 119363, "epoch": 2841, "val_loss": 68008.4140625} {"train_loss": -6.628639221191406, "global_step": 119364, "epoch": 2842} {"train_loss": -6.470766544342041, "global_step": 119365, "epoch": 2842} {"train_loss": -6.66841983795166, "global_step": 119366, "epoch": 2842} {"train_loss": -6.514071941375732, "global_step": 119367, "epoch": 2842} {"train_loss": -6.53919792175293, "global_step": 119368, "epoch": 2842} {"train_loss": -6.563508987426758, "global_step": 119369, "epoch": 2842} {"train_loss": -6.545751571655273, "global_step": 119370, "epoch": 2842} {"train_loss": -6.670645713806152, "global_step": 119371, "epoch": 2842} {"train_loss": -6.556070327758789, "global_step": 119372, "epoch": 2842} {"train_loss": -6.498623847961426, "global_step": 119373, "epoch": 2842} {"train_loss": -6.563493728637695, "global_step": 119374, "epoch": 2842} {"train_loss": -6.463342189788818, "global_step": 119375, "epoch": 2842} {"train_loss": -6.676708698272705, "global_step": 119376, "epoch": 2842} {"train_loss": -6.583368301391602, "global_step": 119377, "epoch": 2842} {"train_loss": -6.535882949829102, "global_step": 119378, "epoch": 2842} {"train_loss": -6.572175025939941, "global_step": 119379, "epoch": 2842} {"train_loss": -6.565801620483398, "global_step": 119380, "epoch": 2842} {"train_loss": -6.507503509521484, "global_step": 119381, "epoch": 2842} {"train_loss": -6.49371337890625, "global_step": 119382, "epoch": 2842} {"train_loss": -6.472787857055664, "global_step": 119383, "epoch": 2842} {"train_loss": -6.550470352172852, "global_step": 119384, "epoch": 2842} {"train_loss": -6.503083229064941, "global_step": 119385, "epoch": 2842} {"train_loss": -6.544194221496582, "global_step": 119386, "epoch": 2842} {"train_loss": -6.477636337280273, "global_step": 119387, "epoch": 2842} {"train_loss": -6.467480659484863, "global_step": 119388, "epoch": 2842} {"train_loss": -6.506049156188965, "global_step": 119389, "epoch": 2842} {"train_loss": -6.431314468383789, "global_step": 119390, "epoch": 2842} {"train_loss": -6.432808876037598, "global_step": 119391, "epoch": 2842} {"train_loss": -6.478140830993652, "global_step": 119392, "epoch": 2842} {"train_loss": -6.466409683227539, "global_step": 119393, "epoch": 2842} {"train_loss": -6.6125288009643555, "global_step": 119394, "epoch": 2842} {"train_loss": -6.559812068939209, "global_step": 119395, "epoch": 2842} {"train_loss": -6.424772262573242, "global_step": 119396, "epoch": 2842} {"train_loss": -6.442678928375244, "global_step": 119397, "epoch": 2842} {"train_loss": -6.478238582611084, "global_step": 119398, "epoch": 2842} {"train_loss": -6.4196085929870605, "global_step": 119399, "epoch": 2842} {"train_loss": -6.611793041229248, "global_step": 119400, "epoch": 2842} {"train_loss": -6.487054824829102, "global_step": 119401, "epoch": 2842} {"train_loss": -6.547256946563721, "global_step": 119402, "epoch": 2842} {"train_loss": -6.347905158996582, "global_step": 119403, "epoch": 2842} {"train_loss": -6.5721235275268555, "global_step": 119404, "epoch": 2842} {"train_loss": -6.521402858552479, "global_step": 119405, "epoch": 2842, "val_loss": 67745.78125} {"train_loss": -6.523323059082031, "global_step": 119406, "epoch": 2843} {"train_loss": -6.520527362823486, "global_step": 119407, "epoch": 2843} {"train_loss": -6.540674686431885, "global_step": 119408, "epoch": 2843} {"train_loss": -6.355263710021973, "global_step": 119409, "epoch": 2843} {"train_loss": -6.496323108673096, "global_step": 119410, "epoch": 2843} {"train_loss": -6.556112766265869, "global_step": 119411, "epoch": 2843} {"train_loss": -6.454464912414551, "global_step": 119412, "epoch": 2843} {"train_loss": -6.417173385620117, "global_step": 119413, "epoch": 2843} {"train_loss": -6.455608367919922, "global_step": 119414, "epoch": 2843} {"train_loss": -6.475149631500244, "global_step": 119415, "epoch": 2843} {"train_loss": -6.552376747131348, "global_step": 119416, "epoch": 2843} {"train_loss": -6.525758266448975, "global_step": 119417, "epoch": 2843} {"train_loss": -6.455411434173584, "global_step": 119418, "epoch": 2843} {"train_loss": -6.607351779937744, "global_step": 119419, "epoch": 2843} {"train_loss": -6.4612040519714355, "global_step": 119420, "epoch": 2843} {"train_loss": -6.487530708312988, "global_step": 119421, "epoch": 2843} {"train_loss": -6.548280239105225, "global_step": 119422, "epoch": 2843} {"train_loss": -6.432171821594238, "global_step": 119423, "epoch": 2843} {"train_loss": -6.4834184646606445, "global_step": 119424, "epoch": 2843} {"train_loss": -6.491700172424316, "global_step": 119425, "epoch": 2843} {"train_loss": -6.432064056396484, "global_step": 119426, "epoch": 2843} {"train_loss": -6.426589488983154, "global_step": 119427, "epoch": 2843} {"train_loss": -6.425457954406738, "global_step": 119428, "epoch": 2843} {"train_loss": -6.503833770751953, "global_step": 119429, "epoch": 2843} {"train_loss": -6.4365034103393555, "global_step": 119430, "epoch": 2843} {"train_loss": -6.4634108543396, "global_step": 119431, "epoch": 2843} {"train_loss": -6.486637115478516, "global_step": 119432, "epoch": 2843} {"train_loss": -6.506095886230469, "global_step": 119433, "epoch": 2843} {"train_loss": -6.473094463348389, "global_step": 119434, "epoch": 2843} {"train_loss": -6.483182907104492, "global_step": 119435, "epoch": 2843} {"train_loss": -6.497753143310547, "global_step": 119436, "epoch": 2843} {"train_loss": -6.3478217124938965, "global_step": 119437, "epoch": 2843} {"train_loss": -6.502703666687012, "global_step": 119438, "epoch": 2843} {"train_loss": -6.380350589752197, "global_step": 119439, "epoch": 2843} {"train_loss": -6.440642833709717, "global_step": 119440, "epoch": 2843} {"train_loss": -6.501482963562012, "global_step": 119441, "epoch": 2843} {"train_loss": -6.402471542358398, "global_step": 119442, "epoch": 2843} {"train_loss": -6.434948444366455, "global_step": 119443, "epoch": 2843} {"train_loss": -6.503933906555176, "global_step": 119444, "epoch": 2843} {"train_loss": -6.520146369934082, "global_step": 119445, "epoch": 2843} {"train_loss": -6.487075328826904, "global_step": 119446, "epoch": 2843} {"train_loss": -6.474410284133184, "global_step": 119447, "epoch": 2843, "val_loss": 67821.6796875} {"train_loss": -6.481493949890137, "global_step": 119448, "epoch": 2844} {"train_loss": -6.4826979637146, "global_step": 119449, "epoch": 2844} {"train_loss": -6.558128356933594, "global_step": 119450, "epoch": 2844} {"train_loss": -6.588647365570068, "global_step": 119451, "epoch": 2844} {"train_loss": -6.592750072479248, "global_step": 119452, "epoch": 2844} {"train_loss": -6.57164192199707, "global_step": 119453, "epoch": 2844} {"train_loss": -6.533296585083008, "global_step": 119454, "epoch": 2844} {"train_loss": -6.490999221801758, "global_step": 119455, "epoch": 2844} {"train_loss": -6.429369926452637, "global_step": 119456, "epoch": 2844} {"train_loss": -6.535122394561768, "global_step": 119457, "epoch": 2844} {"train_loss": -6.589898109436035, "global_step": 119458, "epoch": 2844} {"train_loss": -6.580222129821777, "global_step": 119459, "epoch": 2844} {"train_loss": -6.469649791717529, "global_step": 119460, "epoch": 2844} {"train_loss": -6.564819812774658, "global_step": 119461, "epoch": 2844} {"train_loss": -6.556962966918945, "global_step": 119462, "epoch": 2844} {"train_loss": -6.564393520355225, "global_step": 119463, "epoch": 2844} {"train_loss": -6.567325115203857, "global_step": 119464, "epoch": 2844} {"train_loss": -6.488289833068848, "global_step": 119465, "epoch": 2844} {"train_loss": -6.5218305587768555, "global_step": 119466, "epoch": 2844} {"train_loss": -6.480984687805176, "global_step": 119467, "epoch": 2844} {"train_loss": -6.492464065551758, "global_step": 119468, "epoch": 2844} {"train_loss": -6.531408309936523, "global_step": 119469, "epoch": 2844} {"train_loss": -6.573045253753662, "global_step": 119470, "epoch": 2844} {"train_loss": -6.519077301025391, "global_step": 119471, "epoch": 2844} {"train_loss": -6.504363059997559, "global_step": 119472, "epoch": 2844} {"train_loss": -6.5723419189453125, "global_step": 119473, "epoch": 2844} {"train_loss": -6.453464031219482, "global_step": 119474, "epoch": 2844} {"train_loss": -6.51501989364624, "global_step": 119475, "epoch": 2844} {"train_loss": -6.400819778442383, "global_step": 119476, "epoch": 2844} {"train_loss": -6.4783453941345215, "global_step": 119477, "epoch": 2844} {"train_loss": -6.482366561889648, "global_step": 119478, "epoch": 2844} {"train_loss": -6.559438705444336, "global_step": 119479, "epoch": 2844} {"train_loss": -6.403232574462891, "global_step": 119480, "epoch": 2844} {"train_loss": -6.314009666442871, "global_step": 119481, "epoch": 2844} {"train_loss": -6.543068885803223, "global_step": 119482, "epoch": 2844} {"train_loss": -6.399706840515137, "global_step": 119483, "epoch": 2844} {"train_loss": -6.620505332946777, "global_step": 119484, "epoch": 2844} {"train_loss": -6.422909259796143, "global_step": 119485, "epoch": 2844} {"train_loss": -6.569363594055176, "global_step": 119486, "epoch": 2844} {"train_loss": -6.556115627288818, "global_step": 119487, "epoch": 2844} {"train_loss": -6.511655330657959, "global_step": 119488, "epoch": 2844} {"train_loss": -6.512311072576614, "global_step": 119489, "epoch": 2844, "val_loss": 67993.0078125} {"train_loss": -6.55889892578125, "global_step": 119490, "epoch": 2845} {"train_loss": -6.497200965881348, "global_step": 119491, "epoch": 2845} {"train_loss": -6.457589149475098, "global_step": 119492, "epoch": 2845} {"train_loss": -6.511964797973633, "global_step": 119493, "epoch": 2845} {"train_loss": -6.486128807067871, "global_step": 119494, "epoch": 2845} {"train_loss": -6.65444278717041, "global_step": 119495, "epoch": 2845} {"train_loss": -6.5367560386657715, "global_step": 119496, "epoch": 2845} {"train_loss": -6.506928443908691, "global_step": 119497, "epoch": 2845} {"train_loss": -6.535586357116699, "global_step": 119498, "epoch": 2845} {"train_loss": -6.572440147399902, "global_step": 119499, "epoch": 2845} {"train_loss": -6.606123447418213, "global_step": 119500, "epoch": 2845} {"train_loss": -6.540219306945801, "global_step": 119501, "epoch": 2845} {"train_loss": -6.483410835266113, "global_step": 119502, "epoch": 2845} {"train_loss": -6.4572906494140625, "global_step": 119503, "epoch": 2845} {"train_loss": -6.462669372558594, "global_step": 119504, "epoch": 2845} {"train_loss": -6.468021869659424, "global_step": 119505, "epoch": 2845} {"train_loss": -6.524763107299805, "global_step": 119506, "epoch": 2845} {"train_loss": -6.573083877563477, "global_step": 119507, "epoch": 2845} {"train_loss": -6.554759502410889, "global_step": 119508, "epoch": 2845} {"train_loss": -6.458759307861328, "global_step": 119509, "epoch": 2845} {"train_loss": -6.429609775543213, "global_step": 119510, "epoch": 2845} {"train_loss": -6.544898986816406, "global_step": 119511, "epoch": 2845} {"train_loss": -6.590442657470703, "global_step": 119512, "epoch": 2845} {"train_loss": -6.5539164543151855, "global_step": 119513, "epoch": 2845} {"train_loss": -6.544970512390137, "global_step": 119514, "epoch": 2845} {"train_loss": -6.501163482666016, "global_step": 119515, "epoch": 2845} {"train_loss": -6.596932411193848, "global_step": 119516, "epoch": 2845} {"train_loss": -6.52592134475708, "global_step": 119517, "epoch": 2845} {"train_loss": -6.555413246154785, "global_step": 119518, "epoch": 2845} {"train_loss": -6.449516773223877, "global_step": 119519, "epoch": 2845} {"train_loss": -6.6306562423706055, "global_step": 119520, "epoch": 2845} {"train_loss": -6.519282817840576, "global_step": 119521, "epoch": 2845} {"train_loss": -6.507387161254883, "global_step": 119522, "epoch": 2845} {"train_loss": -6.549263000488281, "global_step": 119523, "epoch": 2845} {"train_loss": -6.441316604614258, "global_step": 119524, "epoch": 2845} {"train_loss": -6.530959129333496, "global_step": 119525, "epoch": 2845} {"train_loss": -6.4767045974731445, "global_step": 119526, "epoch": 2845} {"train_loss": -6.523686408996582, "global_step": 119527, "epoch": 2845} {"train_loss": -6.492507457733154, "global_step": 119528, "epoch": 2845} {"train_loss": -6.512187957763672, "global_step": 119529, "epoch": 2845} {"train_loss": -6.554998874664307, "global_step": 119530, "epoch": 2845} {"train_loss": -6.522231226875668, "global_step": 119531, "epoch": 2845, "val_loss": 68300.8359375} {"train_loss": -6.487496376037598, "global_step": 119532, "epoch": 2846} {"train_loss": -6.468742370605469, "global_step": 119533, "epoch": 2846} {"train_loss": -6.526996612548828, "global_step": 119534, "epoch": 2846} {"train_loss": -6.535874366760254, "global_step": 119535, "epoch": 2846} {"train_loss": -6.6528544425964355, "global_step": 119536, "epoch": 2846} {"train_loss": -6.608760833740234, "global_step": 119537, "epoch": 2846} {"train_loss": -6.478730201721191, "global_step": 119538, "epoch": 2846} {"train_loss": -6.6692986488342285, "global_step": 119539, "epoch": 2846} {"train_loss": -6.642092704772949, "global_step": 119540, "epoch": 2846} {"train_loss": -6.437912940979004, "global_step": 119541, "epoch": 2846} {"train_loss": -6.613708972930908, "global_step": 119542, "epoch": 2846} {"train_loss": -6.375555038452148, "global_step": 119543, "epoch": 2846} {"train_loss": -6.538774490356445, "global_step": 119544, "epoch": 2846} {"train_loss": -6.385906219482422, "global_step": 119545, "epoch": 2846} {"train_loss": -6.509357452392578, "global_step": 119546, "epoch": 2846} {"train_loss": -6.45292854309082, "global_step": 119547, "epoch": 2846} {"train_loss": -6.454887390136719, "global_step": 119548, "epoch": 2846} {"train_loss": -6.5905442237854, "global_step": 119549, "epoch": 2846} {"train_loss": -6.594429969787598, "global_step": 119550, "epoch": 2846} {"train_loss": -6.521312713623047, "global_step": 119551, "epoch": 2846} {"train_loss": -6.49478816986084, "global_step": 119552, "epoch": 2846} {"train_loss": -6.59967041015625, "global_step": 119553, "epoch": 2846} {"train_loss": -6.603645324707031, "global_step": 119554, "epoch": 2846} {"train_loss": -6.607031345367432, "global_step": 119555, "epoch": 2846} {"train_loss": -6.548426628112793, "global_step": 119556, "epoch": 2846} {"train_loss": -6.486525535583496, "global_step": 119557, "epoch": 2846} {"train_loss": -6.590768814086914, "global_step": 119558, "epoch": 2846} {"train_loss": -6.464458465576172, "global_step": 119559, "epoch": 2846} {"train_loss": -6.4252424240112305, "global_step": 119560, "epoch": 2846} {"train_loss": -6.595141410827637, "global_step": 119561, "epoch": 2846} {"train_loss": -6.448258876800537, "global_step": 119562, "epoch": 2846} {"train_loss": -6.5149078369140625, "global_step": 119563, "epoch": 2846} {"train_loss": -6.484772682189941, "global_step": 119564, "epoch": 2846} {"train_loss": -6.431764125823975, "global_step": 119565, "epoch": 2846} {"train_loss": -6.520081520080566, "global_step": 119566, "epoch": 2846} {"train_loss": -6.54463005065918, "global_step": 119567, "epoch": 2846} {"train_loss": -6.499344348907471, "global_step": 119568, "epoch": 2846} {"train_loss": -6.535904407501221, "global_step": 119569, "epoch": 2846} {"train_loss": -6.516160011291504, "global_step": 119570, "epoch": 2846} {"train_loss": -6.500612258911133, "global_step": 119571, "epoch": 2846} {"train_loss": -6.416871070861816, "global_step": 119572, "epoch": 2846} {"train_loss": -6.520462444850376, "global_step": 119573, "epoch": 2846, "val_loss": 67742.09375} {"train_loss": -6.5965423583984375, "global_step": 119574, "epoch": 2847} {"train_loss": -6.499063491821289, "global_step": 119575, "epoch": 2847} {"train_loss": -6.573302745819092, "global_step": 119576, "epoch": 2847} {"train_loss": -6.429621696472168, "global_step": 119577, "epoch": 2847} {"train_loss": -6.515244960784912, "global_step": 119578, "epoch": 2847} {"train_loss": -6.56640625, "global_step": 119579, "epoch": 2847} {"train_loss": -6.540463447570801, "global_step": 119580, "epoch": 2847} {"train_loss": -6.509610176086426, "global_step": 119581, "epoch": 2847} {"train_loss": -6.51245641708374, "global_step": 119582, "epoch": 2847} {"train_loss": -6.507454872131348, "global_step": 119583, "epoch": 2847} {"train_loss": -6.381192684173584, "global_step": 119584, "epoch": 2847} {"train_loss": -6.441129684448242, "global_step": 119585, "epoch": 2847} {"train_loss": -6.4617509841918945, "global_step": 119586, "epoch": 2847} {"train_loss": -6.414359092712402, "global_step": 119587, "epoch": 2847} {"train_loss": -6.495452880859375, "global_step": 119588, "epoch": 2847} {"train_loss": -6.446407794952393, "global_step": 119589, "epoch": 2847} {"train_loss": -6.45358943939209, "global_step": 119590, "epoch": 2847} {"train_loss": -6.565515518188477, "global_step": 119591, "epoch": 2847} {"train_loss": -6.506966590881348, "global_step": 119592, "epoch": 2847} {"train_loss": -6.527249336242676, "global_step": 119593, "epoch": 2847} {"train_loss": -6.450701713562012, "global_step": 119594, "epoch": 2847} {"train_loss": -6.557350158691406, "global_step": 119595, "epoch": 2847} {"train_loss": -6.504547119140625, "global_step": 119596, "epoch": 2847} {"train_loss": -6.521707534790039, "global_step": 119597, "epoch": 2847} {"train_loss": -6.539344787597656, "global_step": 119598, "epoch": 2847} {"train_loss": -6.470463752746582, "global_step": 119599, "epoch": 2847} {"train_loss": -6.474749565124512, "global_step": 119600, "epoch": 2847} {"train_loss": -6.569566249847412, "global_step": 119601, "epoch": 2847} {"train_loss": -6.482574462890625, "global_step": 119602, "epoch": 2847} {"train_loss": -6.415609359741211, "global_step": 119603, "epoch": 2847} {"train_loss": -6.4523820877075195, "global_step": 119604, "epoch": 2847} {"train_loss": -6.416903972625732, "global_step": 119605, "epoch": 2847} {"train_loss": -6.500730991363525, "global_step": 119606, "epoch": 2847} {"train_loss": -6.494333267211914, "global_step": 119607, "epoch": 2847} {"train_loss": -6.478582382202148, "global_step": 119608, "epoch": 2847} {"train_loss": -6.527249813079834, "global_step": 119609, "epoch": 2847} {"train_loss": -6.580413818359375, "global_step": 119610, "epoch": 2847} {"train_loss": -6.472800254821777, "global_step": 119611, "epoch": 2847} {"train_loss": -6.618386745452881, "global_step": 119612, "epoch": 2847} {"train_loss": -6.646960735321045, "global_step": 119613, "epoch": 2847} {"train_loss": -6.518346309661865, "global_step": 119614, "epoch": 2847} {"train_loss": -6.504998820168631, "global_step": 119615, "epoch": 2847, "val_loss": 67850.96875} {"train_loss": -6.395988464355469, "global_step": 119616, "epoch": 2848} {"train_loss": -6.458249568939209, "global_step": 119617, "epoch": 2848} {"train_loss": -6.703451156616211, "global_step": 119618, "epoch": 2848} {"train_loss": -6.540788650512695, "global_step": 119619, "epoch": 2848} {"train_loss": -6.576091289520264, "global_step": 119620, "epoch": 2848} {"train_loss": -6.640018939971924, "global_step": 119621, "epoch": 2848} {"train_loss": -6.549358367919922, "global_step": 119622, "epoch": 2848} {"train_loss": -6.479069709777832, "global_step": 119623, "epoch": 2848} {"train_loss": -6.6224260330200195, "global_step": 119624, "epoch": 2848} {"train_loss": -6.495206356048584, "global_step": 119625, "epoch": 2848} {"train_loss": -6.597763538360596, "global_step": 119626, "epoch": 2848} {"train_loss": -6.601605415344238, "global_step": 119627, "epoch": 2848} {"train_loss": -6.616883277893066, "global_step": 119628, "epoch": 2848} {"train_loss": -6.53964376449585, "global_step": 119629, "epoch": 2848} {"train_loss": -6.661037445068359, "global_step": 119630, "epoch": 2848} {"train_loss": -6.467903137207031, "global_step": 119631, "epoch": 2848} {"train_loss": -6.4995927810668945, "global_step": 119632, "epoch": 2848} {"train_loss": -6.589184761047363, "global_step": 119633, "epoch": 2848} {"train_loss": -6.548639297485352, "global_step": 119634, "epoch": 2848} {"train_loss": -6.652215003967285, "global_step": 119635, "epoch": 2848} {"train_loss": -6.583868026733398, "global_step": 119636, "epoch": 2848} {"train_loss": -6.5615434646606445, "global_step": 119637, "epoch": 2848} {"train_loss": -6.442708969116211, "global_step": 119638, "epoch": 2848} {"train_loss": -6.597890377044678, "global_step": 119639, "epoch": 2848} {"train_loss": -6.610896110534668, "global_step": 119640, "epoch": 2848} {"train_loss": -6.392449855804443, "global_step": 119641, "epoch": 2848} {"train_loss": -6.608829498291016, "global_step": 119642, "epoch": 2848} {"train_loss": -6.557415008544922, "global_step": 119643, "epoch": 2848} {"train_loss": -6.572945594787598, "global_step": 119644, "epoch": 2848} {"train_loss": -6.567144393920898, "global_step": 119645, "epoch": 2848} {"train_loss": -6.537546157836914, "global_step": 119646, "epoch": 2848} {"train_loss": -6.544639587402344, "global_step": 119647, "epoch": 2848} {"train_loss": -6.535114288330078, "global_step": 119648, "epoch": 2848} {"train_loss": -6.392749786376953, "global_step": 119649, "epoch": 2848} {"train_loss": -6.424328327178955, "global_step": 119650, "epoch": 2848} {"train_loss": -6.598867416381836, "global_step": 119651, "epoch": 2848} {"train_loss": -6.535109043121338, "global_step": 119652, "epoch": 2848} {"train_loss": -6.4476318359375, "global_step": 119653, "epoch": 2848} {"train_loss": -6.540568828582764, "global_step": 119654, "epoch": 2848} {"train_loss": -6.4931464195251465, "global_step": 119655, "epoch": 2848} {"train_loss": -6.479611873626709, "global_step": 119656, "epoch": 2848} {"train_loss": -6.545282386598133, "global_step": 119657, "epoch": 2848, "val_loss": 68000.4140625} {"train_loss": -6.534780979156494, "global_step": 119658, "epoch": 2849} {"train_loss": -6.510018348693848, "global_step": 119659, "epoch": 2849} {"train_loss": -6.630934715270996, "global_step": 119660, "epoch": 2849} {"train_loss": -6.4484968185424805, "global_step": 119661, "epoch": 2849} {"train_loss": -6.623088836669922, "global_step": 119662, "epoch": 2849} {"train_loss": -6.5887861251831055, "global_step": 119663, "epoch": 2849} {"train_loss": -6.513144493103027, "global_step": 119664, "epoch": 2849} {"train_loss": -6.679291248321533, "global_step": 119665, "epoch": 2849} {"train_loss": -6.58818244934082, "global_step": 119666, "epoch": 2849} {"train_loss": -6.511298656463623, "global_step": 119667, "epoch": 2849} {"train_loss": -6.473455429077148, "global_step": 119668, "epoch": 2849} {"train_loss": -6.536954402923584, "global_step": 119669, "epoch": 2849} {"train_loss": -6.468277931213379, "global_step": 119670, "epoch": 2849} {"train_loss": -6.455631256103516, "global_step": 119671, "epoch": 2849} {"train_loss": -6.494533061981201, "global_step": 119672, "epoch": 2849} {"train_loss": -6.531946659088135, "global_step": 119673, "epoch": 2849} {"train_loss": -6.44273567199707, "global_step": 119674, "epoch": 2849} {"train_loss": -6.492912292480469, "global_step": 119675, "epoch": 2849} {"train_loss": -6.455894470214844, "global_step": 119676, "epoch": 2849} {"train_loss": -6.432018280029297, "global_step": 119677, "epoch": 2849} {"train_loss": -6.464776039123535, "global_step": 119678, "epoch": 2849} {"train_loss": -6.4793701171875, "global_step": 119679, "epoch": 2849} {"train_loss": -6.540922164916992, "global_step": 119680, "epoch": 2849} {"train_loss": -6.495573043823242, "global_step": 119681, "epoch": 2849} {"train_loss": -6.48557186126709, "global_step": 119682, "epoch": 2849} {"train_loss": -6.62174129486084, "global_step": 119683, "epoch": 2849} {"train_loss": -6.560614585876465, "global_step": 119684, "epoch": 2849} {"train_loss": -6.461718559265137, "global_step": 119685, "epoch": 2849} {"train_loss": -6.48649787902832, "global_step": 119686, "epoch": 2849} {"train_loss": -6.457270622253418, "global_step": 119687, "epoch": 2849} {"train_loss": -6.5658159255981445, "global_step": 119688, "epoch": 2849} {"train_loss": -6.512853622436523, "global_step": 119689, "epoch": 2849} {"train_loss": -6.371222019195557, "global_step": 119690, "epoch": 2849} {"train_loss": -6.529170036315918, "global_step": 119691, "epoch": 2849} {"train_loss": -6.565553665161133, "global_step": 119692, "epoch": 2849} {"train_loss": -6.486479759216309, "global_step": 119693, "epoch": 2849} {"train_loss": -6.503856182098389, "global_step": 119694, "epoch": 2849} {"train_loss": -6.4427642822265625, "global_step": 119695, "epoch": 2849} {"train_loss": -6.489311695098877, "global_step": 119696, "epoch": 2849} {"train_loss": -6.500874996185303, "global_step": 119697, "epoch": 2849} {"train_loss": -6.501690864562988, "global_step": 119698, "epoch": 2849} {"train_loss": -6.509605873198736, "global_step": 119699, "epoch": 2849, "val_loss": 67952.0078125} {"train_loss": -6.433342456817627, "global_step": 119700, "epoch": 2850} {"train_loss": -6.5792236328125, "global_step": 119701, "epoch": 2850} {"train_loss": -6.363514423370361, "global_step": 119702, "epoch": 2850} {"train_loss": -6.477351188659668, "global_step": 119703, "epoch": 2850} {"train_loss": -6.600772857666016, "global_step": 119704, "epoch": 2850} {"train_loss": -6.488224029541016, "global_step": 119705, "epoch": 2850} {"train_loss": -6.487641334533691, "global_step": 119706, "epoch": 2850} {"train_loss": -6.525762557983398, "global_step": 119707, "epoch": 2850} {"train_loss": -6.528106689453125, "global_step": 119708, "epoch": 2850} {"train_loss": -6.561290740966797, "global_step": 119709, "epoch": 2850} {"train_loss": -6.510951995849609, "global_step": 119710, "epoch": 2850} {"train_loss": -6.4547648429870605, "global_step": 119711, "epoch": 2850} {"train_loss": -6.389358997344971, "global_step": 119712, "epoch": 2850} {"train_loss": -6.4418487548828125, "global_step": 119713, "epoch": 2850} {"train_loss": -6.639034271240234, "global_step": 119714, "epoch": 2850} {"train_loss": -6.387114524841309, "global_step": 119715, "epoch": 2850} {"train_loss": -6.560117721557617, "global_step": 119716, "epoch": 2850} {"train_loss": -6.452857971191406, "global_step": 119717, "epoch": 2850} {"train_loss": -6.4147138595581055, "global_step": 119718, "epoch": 2850} {"train_loss": -6.455421447753906, "global_step": 119719, "epoch": 2850} {"train_loss": -6.399947643280029, "global_step": 119720, "epoch": 2850} {"train_loss": -6.548383712768555, "global_step": 119721, "epoch": 2850} {"train_loss": -6.573211193084717, "global_step": 119722, "epoch": 2850} {"train_loss": -6.390928268432617, "global_step": 119723, "epoch": 2850} {"train_loss": -6.469901084899902, "global_step": 119724, "epoch": 2850} {"train_loss": -6.455063819885254, "global_step": 119725, "epoch": 2850} {"train_loss": -6.368638515472412, "global_step": 119726, "epoch": 2850} {"train_loss": -6.435457706451416, "global_step": 119727, "epoch": 2850} {"train_loss": -6.5400390625, "global_step": 119728, "epoch": 2850} {"train_loss": -6.469147682189941, "global_step": 119729, "epoch": 2850} {"train_loss": -6.451759338378906, "global_step": 119730, "epoch": 2850} {"train_loss": -6.508732795715332, "global_step": 119731, "epoch": 2850} {"train_loss": -6.456301689147949, "global_step": 119732, "epoch": 2850} {"train_loss": -6.548408508300781, "global_step": 119733, "epoch": 2850} {"train_loss": -6.508014678955078, "global_step": 119734, "epoch": 2850} {"train_loss": -6.411716461181641, "global_step": 119735, "epoch": 2850} {"train_loss": -6.484224319458008, "global_step": 119736, "epoch": 2850} {"train_loss": -6.417934417724609, "global_step": 119737, "epoch": 2850} {"train_loss": -6.584311485290527, "global_step": 119738, "epoch": 2850} {"train_loss": -6.424280166625977, "global_step": 119739, "epoch": 2850} {"train_loss": -6.570402145385742, "global_step": 119740, "epoch": 2850} {"train_loss": -6.480639889126732, "global_step": 119741, "epoch": 2850, "train/sim_max_reward_0": 0.23220940478901658, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.6882506376180456, "train/sim_max_reward_3": 0.12428885619496693, "train/sim_max_reward_4": 0.6457548999083974, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.9319565766707, "test/sim_max_reward_4400001": 0.9228566022880248, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.9442067959518221, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9828768069451234, "test/sim_max_reward_4400006": 0.9830346059803674, "test/sim_max_reward_4400007": 0.03563130485048696, "test/sim_max_reward_4400008": 0.3090890740366581, "test/sim_max_reward_4400009": 0.9690122899481964, "test/sim_max_reward_4400010": 0.24944975132069822, "test/sim_max_reward_4400011": 0.2205173616773945, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9197812686284523, "test/sim_max_reward_4400014": 0.23102422933586267, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.13791366732736285, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24791531491759136, "test/sim_max_reward_4400019": 0.866125952486802, "test/sim_max_reward_4400020": 3.7862001189071815e-05, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.18424677043138135, "test/sim_max_reward_4400023": 0.9111789150156762, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.24994939510384137, "test/sim_max_reward_4400026": 0.6329940432203052, "test/sim_max_reward_4400027": 0.03868228861000423, "test/sim_max_reward_4400028": 0.8769549095730838, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9951950456779787, "test/sim_max_reward_4400031": 0.9556449397905105, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.6479075433663931, "test/sim_max_reward_4400034": 0.9638365431159771, "test/sim_max_reward_4400035": 0.9964357921333004, "test/sim_max_reward_4400036": 0.3283761175711872, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.8812739872365793, "test/sim_max_reward_4400039": 0.9951866740872414, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8607890260585778, "test/sim_max_reward_4400042": 0.8916633497661697, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8184764269721299, "test/sim_max_reward_4400047": 0.9750772409555057, "test/sim_max_reward_4400048": 0.8819102451355577, "test/sim_max_reward_4400049": 0.8875130413595594, "train/mean_score": 0.48058142631210227, "test/mean_score": 0.5908376091009355, "val_loss": 68068.0078125} {"train_loss": -6.436550140380859, "global_step": 119742, "epoch": 2851} {"train_loss": -6.511823654174805, "global_step": 119743, "epoch": 2851} {"train_loss": -6.61577033996582, "global_step": 119744, "epoch": 2851} {"train_loss": -6.484358787536621, "global_step": 119745, "epoch": 2851} {"train_loss": -6.54496955871582, "global_step": 119746, "epoch": 2851} {"train_loss": -6.5475006103515625, "global_step": 119747, "epoch": 2851} {"train_loss": -6.492118835449219, "global_step": 119748, "epoch": 2851} {"train_loss": -6.560808181762695, "global_step": 119749, "epoch": 2851} {"train_loss": -6.5794501304626465, "global_step": 119750, "epoch": 2851} {"train_loss": -6.528901100158691, "global_step": 119751, "epoch": 2851} {"train_loss": -6.668170928955078, "global_step": 119752, "epoch": 2851} {"train_loss": -6.6058573722839355, "global_step": 119753, "epoch": 2851} {"train_loss": -6.421473503112793, "global_step": 119754, "epoch": 2851} {"train_loss": -6.531293869018555, "global_step": 119755, "epoch": 2851} {"train_loss": -6.67232084274292, "global_step": 119756, "epoch": 2851} {"train_loss": -6.707181930541992, "global_step": 119757, "epoch": 2851} {"train_loss": -6.482301712036133, "global_step": 119758, "epoch": 2851} {"train_loss": -6.555814743041992, "global_step": 119759, "epoch": 2851} {"train_loss": -6.561305999755859, "global_step": 119760, "epoch": 2851} {"train_loss": -6.437499046325684, "global_step": 119761, "epoch": 2851} {"train_loss": -6.516467094421387, "global_step": 119762, "epoch": 2851} {"train_loss": -6.522727012634277, "global_step": 119763, "epoch": 2851} {"train_loss": -6.466428279876709, "global_step": 119764, "epoch": 2851} {"train_loss": -6.627073287963867, "global_step": 119765, "epoch": 2851} {"train_loss": -6.55610466003418, "global_step": 119766, "epoch": 2851} {"train_loss": -6.526451110839844, "global_step": 119767, "epoch": 2851} {"train_loss": -6.524438858032227, "global_step": 119768, "epoch": 2851} {"train_loss": -6.492700099945068, "global_step": 119769, "epoch": 2851} {"train_loss": -6.587092876434326, "global_step": 119770, "epoch": 2851} {"train_loss": -6.485065937042236, "global_step": 119771, "epoch": 2851} {"train_loss": -6.586479187011719, "global_step": 119772, "epoch": 2851} {"train_loss": -6.522629737854004, "global_step": 119773, "epoch": 2851} {"train_loss": -6.567620277404785, "global_step": 119774, "epoch": 2851} {"train_loss": -6.5241475105285645, "global_step": 119775, "epoch": 2851} {"train_loss": -6.400089263916016, "global_step": 119776, "epoch": 2851} {"train_loss": -6.5457611083984375, "global_step": 119777, "epoch": 2851} {"train_loss": -6.5674285888671875, "global_step": 119778, "epoch": 2851} {"train_loss": -6.582124710083008, "global_step": 119779, "epoch": 2851} {"train_loss": -6.531106948852539, "global_step": 119780, "epoch": 2851} {"train_loss": -6.493556022644043, "global_step": 119781, "epoch": 2851} {"train_loss": -6.652993202209473, "global_step": 119782, "epoch": 2851} {"train_loss": -6.540862832750593, "global_step": 119783, "epoch": 2851, "val_loss": 67838.7578125} {"train_loss": -6.490924835205078, "global_step": 119784, "epoch": 2852} {"train_loss": -6.543535232543945, "global_step": 119785, "epoch": 2852} {"train_loss": -6.428091049194336, "global_step": 119786, "epoch": 2852} {"train_loss": -6.614229679107666, "global_step": 119787, "epoch": 2852} {"train_loss": -6.642972469329834, "global_step": 119788, "epoch": 2852} {"train_loss": -6.658246994018555, "global_step": 119789, "epoch": 2852} {"train_loss": -6.576672554016113, "global_step": 119790, "epoch": 2852} {"train_loss": -6.647316932678223, "global_step": 119791, "epoch": 2852} {"train_loss": -6.597706317901611, "global_step": 119792, "epoch": 2852} {"train_loss": -6.618085861206055, "global_step": 119793, "epoch": 2852} {"train_loss": -6.6639814376831055, "global_step": 119794, "epoch": 2852} {"train_loss": -6.52876091003418, "global_step": 119795, "epoch": 2852} {"train_loss": -6.615597724914551, "global_step": 119796, "epoch": 2852} {"train_loss": -6.47896146774292, "global_step": 119797, "epoch": 2852} {"train_loss": -6.636650085449219, "global_step": 119798, "epoch": 2852} {"train_loss": -6.510102272033691, "global_step": 119799, "epoch": 2852} {"train_loss": -6.62999153137207, "global_step": 119800, "epoch": 2852} {"train_loss": -6.5544514656066895, "global_step": 119801, "epoch": 2852} {"train_loss": -6.556761741638184, "global_step": 119802, "epoch": 2852} {"train_loss": -6.519996643066406, "global_step": 119803, "epoch": 2852} {"train_loss": -6.635310173034668, "global_step": 119804, "epoch": 2852} {"train_loss": -6.447917461395264, "global_step": 119805, "epoch": 2852} {"train_loss": -6.57945442199707, "global_step": 119806, "epoch": 2852} {"train_loss": -6.451448917388916, "global_step": 119807, "epoch": 2852} {"train_loss": -6.449443817138672, "global_step": 119808, "epoch": 2852} {"train_loss": -6.577177047729492, "global_step": 119809, "epoch": 2852} {"train_loss": -6.547995567321777, "global_step": 119810, "epoch": 2852} {"train_loss": -6.519129753112793, "global_step": 119811, "epoch": 2852} {"train_loss": -6.534071922302246, "global_step": 119812, "epoch": 2852} {"train_loss": -6.525430679321289, "global_step": 119813, "epoch": 2852} {"train_loss": -6.570560932159424, "global_step": 119814, "epoch": 2852} {"train_loss": -6.512660980224609, "global_step": 119815, "epoch": 2852} {"train_loss": -6.559185028076172, "global_step": 119816, "epoch": 2852} {"train_loss": -6.486034870147705, "global_step": 119817, "epoch": 2852} {"train_loss": -6.3962883949279785, "global_step": 119818, "epoch": 2852} {"train_loss": -6.535070896148682, "global_step": 119819, "epoch": 2852} {"train_loss": -6.370861530303955, "global_step": 119820, "epoch": 2852} {"train_loss": -6.481818199157715, "global_step": 119821, "epoch": 2852} {"train_loss": -6.518305778503418, "global_step": 119822, "epoch": 2852} {"train_loss": -6.427062511444092, "global_step": 119823, "epoch": 2852} {"train_loss": -6.581910133361816, "global_step": 119824, "epoch": 2852} {"train_loss": -6.543284688677106, "global_step": 119825, "epoch": 2852, "val_loss": 68129.3125} {"train_loss": -6.461204528808594, "global_step": 119826, "epoch": 2853} {"train_loss": -6.539108753204346, "global_step": 119827, "epoch": 2853} {"train_loss": -6.532186031341553, "global_step": 119828, "epoch": 2853} {"train_loss": -6.4968671798706055, "global_step": 119829, "epoch": 2853} {"train_loss": -6.562274932861328, "global_step": 119830, "epoch": 2853} {"train_loss": -6.4522786140441895, "global_step": 119831, "epoch": 2853} {"train_loss": -6.510604381561279, "global_step": 119832, "epoch": 2853} {"train_loss": -6.640353202819824, "global_step": 119833, "epoch": 2853} {"train_loss": -6.455875396728516, "global_step": 119834, "epoch": 2853} {"train_loss": -6.523612976074219, "global_step": 119835, "epoch": 2853} {"train_loss": -6.539958953857422, "global_step": 119836, "epoch": 2853} {"train_loss": -6.564655303955078, "global_step": 119837, "epoch": 2853} {"train_loss": -6.491548538208008, "global_step": 119838, "epoch": 2853} {"train_loss": -6.607353210449219, "global_step": 119839, "epoch": 2853} {"train_loss": -6.630424499511719, "global_step": 119840, "epoch": 2853} {"train_loss": -6.587255954742432, "global_step": 119841, "epoch": 2853} {"train_loss": -6.630687236785889, "global_step": 119842, "epoch": 2853} {"train_loss": -6.470610618591309, "global_step": 119843, "epoch": 2853} {"train_loss": -6.520852088928223, "global_step": 119844, "epoch": 2853} {"train_loss": -6.5706634521484375, "global_step": 119845, "epoch": 2853} {"train_loss": -6.419216632843018, "global_step": 119846, "epoch": 2853} {"train_loss": -6.513699531555176, "global_step": 119847, "epoch": 2853} {"train_loss": -6.475696086883545, "global_step": 119848, "epoch": 2853} {"train_loss": -6.618627548217773, "global_step": 119849, "epoch": 2853} {"train_loss": -6.45240592956543, "global_step": 119850, "epoch": 2853} {"train_loss": -6.407890319824219, "global_step": 119851, "epoch": 2853} {"train_loss": -6.501249313354492, "global_step": 119852, "epoch": 2853} {"train_loss": -6.479740142822266, "global_step": 119853, "epoch": 2853} {"train_loss": -6.457662105560303, "global_step": 119854, "epoch": 2853} {"train_loss": -6.457047462463379, "global_step": 119855, "epoch": 2853} {"train_loss": -6.4404730796813965, "global_step": 119856, "epoch": 2853} {"train_loss": -6.54608154296875, "global_step": 119857, "epoch": 2853} {"train_loss": -6.4889373779296875, "global_step": 119858, "epoch": 2853} {"train_loss": -6.571084022521973, "global_step": 119859, "epoch": 2853} {"train_loss": -6.517582893371582, "global_step": 119860, "epoch": 2853} {"train_loss": -6.471140384674072, "global_step": 119861, "epoch": 2853} {"train_loss": -6.5665178298950195, "global_step": 119862, "epoch": 2853} {"train_loss": -6.491049766540527, "global_step": 119863, "epoch": 2853} {"train_loss": -6.506707668304443, "global_step": 119864, "epoch": 2853} {"train_loss": -6.488459587097168, "global_step": 119865, "epoch": 2853} {"train_loss": -6.502300262451172, "global_step": 119866, "epoch": 2853} {"train_loss": -6.515411876496815, "global_step": 119867, "epoch": 2853, "val_loss": 68020.2890625} {"train_loss": -6.608190059661865, "global_step": 119868, "epoch": 2854} {"train_loss": -6.450645446777344, "global_step": 119869, "epoch": 2854} {"train_loss": -6.5022172927856445, "global_step": 119870, "epoch": 2854} {"train_loss": -6.369071960449219, "global_step": 119871, "epoch": 2854} {"train_loss": -6.600124359130859, "global_step": 119872, "epoch": 2854} {"train_loss": -6.568958282470703, "global_step": 119873, "epoch": 2854} {"train_loss": -6.635936737060547, "global_step": 119874, "epoch": 2854} {"train_loss": -6.585904121398926, "global_step": 119875, "epoch": 2854} {"train_loss": -6.444092273712158, "global_step": 119876, "epoch": 2854} {"train_loss": -6.428620338439941, "global_step": 119877, "epoch": 2854} {"train_loss": -6.534836769104004, "global_step": 119878, "epoch": 2854} {"train_loss": -6.471636772155762, "global_step": 119879, "epoch": 2854} {"train_loss": -6.396982192993164, "global_step": 119880, "epoch": 2854} {"train_loss": -6.496721267700195, "global_step": 119881, "epoch": 2854} {"train_loss": -6.460782051086426, "global_step": 119882, "epoch": 2854} {"train_loss": -6.416172981262207, "global_step": 119883, "epoch": 2854} {"train_loss": -6.308316230773926, "global_step": 119884, "epoch": 2854} {"train_loss": -6.599276065826416, "global_step": 119885, "epoch": 2854} {"train_loss": -6.370185852050781, "global_step": 119886, "epoch": 2854} {"train_loss": -6.327533721923828, "global_step": 119887, "epoch": 2854} {"train_loss": -6.476290702819824, "global_step": 119888, "epoch": 2854} {"train_loss": -6.2607269287109375, "global_step": 119889, "epoch": 2854} {"train_loss": -6.412887096405029, "global_step": 119890, "epoch": 2854} {"train_loss": -6.4097700119018555, "global_step": 119891, "epoch": 2854} {"train_loss": -6.300786018371582, "global_step": 119892, "epoch": 2854} {"train_loss": -6.237817287445068, "global_step": 119893, "epoch": 2854} {"train_loss": -6.498587608337402, "global_step": 119894, "epoch": 2854} {"train_loss": -6.257673740386963, "global_step": 119895, "epoch": 2854} {"train_loss": -6.364975929260254, "global_step": 119896, "epoch": 2854} {"train_loss": -6.428734302520752, "global_step": 119897, "epoch": 2854} {"train_loss": -6.398289680480957, "global_step": 119898, "epoch": 2854} {"train_loss": -6.484342098236084, "global_step": 119899, "epoch": 2854} {"train_loss": -6.480793476104736, "global_step": 119900, "epoch": 2854} {"train_loss": -6.4598846435546875, "global_step": 119901, "epoch": 2854} {"train_loss": -6.3581767082214355, "global_step": 119902, "epoch": 2854} {"train_loss": -6.415606498718262, "global_step": 119903, "epoch": 2854} {"train_loss": -6.5589799880981445, "global_step": 119904, "epoch": 2854} {"train_loss": -6.4834465980529785, "global_step": 119905, "epoch": 2854} {"train_loss": -6.490952491760254, "global_step": 119906, "epoch": 2854} {"train_loss": -6.497917652130127, "global_step": 119907, "epoch": 2854} {"train_loss": -6.544681072235107, "global_step": 119908, "epoch": 2854} {"train_loss": -6.452302739733741, "global_step": 119909, "epoch": 2854, "val_loss": 67901.21875} {"train_loss": -6.4812726974487305, "global_step": 119910, "epoch": 2855} {"train_loss": -6.416290283203125, "global_step": 119911, "epoch": 2855} {"train_loss": -6.557817459106445, "global_step": 119912, "epoch": 2855} {"train_loss": -6.624124526977539, "global_step": 119913, "epoch": 2855} {"train_loss": -6.535726547241211, "global_step": 119914, "epoch": 2855} {"train_loss": -6.588969707489014, "global_step": 119915, "epoch": 2855} {"train_loss": -6.547791481018066, "global_step": 119916, "epoch": 2855} {"train_loss": -6.589454650878906, "global_step": 119917, "epoch": 2855} {"train_loss": -6.6979079246521, "global_step": 119918, "epoch": 2855} {"train_loss": -6.62713623046875, "global_step": 119919, "epoch": 2855} {"train_loss": -6.521594047546387, "global_step": 119920, "epoch": 2855} {"train_loss": -6.689915180206299, "global_step": 119921, "epoch": 2855} {"train_loss": -6.550822734832764, "global_step": 119922, "epoch": 2855} {"train_loss": -6.559261798858643, "global_step": 119923, "epoch": 2855} {"train_loss": -6.739872455596924, "global_step": 119924, "epoch": 2855} {"train_loss": -6.522468566894531, "global_step": 119925, "epoch": 2855} {"train_loss": -6.605581760406494, "global_step": 119926, "epoch": 2855} {"train_loss": -6.505903244018555, "global_step": 119927, "epoch": 2855} {"train_loss": -6.592689037322998, "global_step": 119928, "epoch": 2855} {"train_loss": -6.565812110900879, "global_step": 119929, "epoch": 2855} {"train_loss": -6.610314846038818, "global_step": 119930, "epoch": 2855} {"train_loss": -6.574613571166992, "global_step": 119931, "epoch": 2855} {"train_loss": -6.500369071960449, "global_step": 119932, "epoch": 2855} {"train_loss": -6.621390342712402, "global_step": 119933, "epoch": 2855} {"train_loss": -6.6762590408325195, "global_step": 119934, "epoch": 2855} {"train_loss": -6.556201934814453, "global_step": 119935, "epoch": 2855} {"train_loss": -6.5621747970581055, "global_step": 119936, "epoch": 2855} {"train_loss": -6.6417083740234375, "global_step": 119937, "epoch": 2855} {"train_loss": -6.558404922485352, "global_step": 119938, "epoch": 2855} {"train_loss": -6.528820037841797, "global_step": 119939, "epoch": 2855} {"train_loss": -6.434473037719727, "global_step": 119940, "epoch": 2855} {"train_loss": -6.491919994354248, "global_step": 119941, "epoch": 2855} {"train_loss": -6.625207901000977, "global_step": 119942, "epoch": 2855} {"train_loss": -6.5880231857299805, "global_step": 119943, "epoch": 2855} {"train_loss": -6.57360315322876, "global_step": 119944, "epoch": 2855} {"train_loss": -6.61517333984375, "global_step": 119945, "epoch": 2855} {"train_loss": -6.605125427246094, "global_step": 119946, "epoch": 2855} {"train_loss": -6.501898765563965, "global_step": 119947, "epoch": 2855} {"train_loss": -6.515019416809082, "global_step": 119948, "epoch": 2855} {"train_loss": -6.642024993896484, "global_step": 119949, "epoch": 2855} {"train_loss": -6.61625862121582, "global_step": 119950, "epoch": 2855} {"train_loss": -6.575615394683111, "global_step": 119951, "epoch": 2855, "val_loss": 67994.4609375} {"train_loss": -6.594111919403076, "global_step": 119952, "epoch": 2856} {"train_loss": -6.540389060974121, "global_step": 119953, "epoch": 2856} {"train_loss": -6.58906888961792, "global_step": 119954, "epoch": 2856} {"train_loss": -6.578821182250977, "global_step": 119955, "epoch": 2856} {"train_loss": -6.580633640289307, "global_step": 119956, "epoch": 2856} {"train_loss": -6.602644443511963, "global_step": 119957, "epoch": 2856} {"train_loss": -6.605535507202148, "global_step": 119958, "epoch": 2856} {"train_loss": -6.635724067687988, "global_step": 119959, "epoch": 2856} {"train_loss": -6.560695171356201, "global_step": 119960, "epoch": 2856} {"train_loss": -6.540276050567627, "global_step": 119961, "epoch": 2856} {"train_loss": -6.627884864807129, "global_step": 119962, "epoch": 2856} {"train_loss": -6.672985553741455, "global_step": 119963, "epoch": 2856} {"train_loss": -6.582405090332031, "global_step": 119964, "epoch": 2856} {"train_loss": -6.572484016418457, "global_step": 119965, "epoch": 2856} {"train_loss": -6.548528671264648, "global_step": 119966, "epoch": 2856} {"train_loss": -6.6196441650390625, "global_step": 119967, "epoch": 2856} {"train_loss": -6.428874969482422, "global_step": 119968, "epoch": 2856} {"train_loss": -6.51912784576416, "global_step": 119969, "epoch": 2856} {"train_loss": -6.624971389770508, "global_step": 119970, "epoch": 2856} {"train_loss": -6.591419696807861, "global_step": 119971, "epoch": 2856} {"train_loss": -6.60609245300293, "global_step": 119972, "epoch": 2856} {"train_loss": -6.479009628295898, "global_step": 119973, "epoch": 2856} {"train_loss": -6.5699968338012695, "global_step": 119974, "epoch": 2856} {"train_loss": -6.5587663650512695, "global_step": 119975, "epoch": 2856} {"train_loss": -6.523703575134277, "global_step": 119976, "epoch": 2856} {"train_loss": -6.605515480041504, "global_step": 119977, "epoch": 2856} {"train_loss": -6.525737762451172, "global_step": 119978, "epoch": 2856} {"train_loss": -6.633406639099121, "global_step": 119979, "epoch": 2856} {"train_loss": -6.485909461975098, "global_step": 119980, "epoch": 2856} {"train_loss": -6.427570343017578, "global_step": 119981, "epoch": 2856} {"train_loss": -6.470552444458008, "global_step": 119982, "epoch": 2856} {"train_loss": -6.490030288696289, "global_step": 119983, "epoch": 2856} {"train_loss": -6.567323207855225, "global_step": 119984, "epoch": 2856} {"train_loss": -6.524130821228027, "global_step": 119985, "epoch": 2856} {"train_loss": -6.486232757568359, "global_step": 119986, "epoch": 2856} {"train_loss": -6.515913963317871, "global_step": 119987, "epoch": 2856} {"train_loss": -6.575433731079102, "global_step": 119988, "epoch": 2856} {"train_loss": -6.378548622131348, "global_step": 119989, "epoch": 2856} {"train_loss": -6.451709747314453, "global_step": 119990, "epoch": 2856} {"train_loss": -6.49387264251709, "global_step": 119991, "epoch": 2856} {"train_loss": -6.637990951538086, "global_step": 119992, "epoch": 2856} {"train_loss": -6.55046744573684, "global_step": 119993, "epoch": 2856, "val_loss": 68174.5078125} {"train_loss": -6.439790725708008, "global_step": 119994, "epoch": 2857} {"train_loss": -6.557460784912109, "global_step": 119995, "epoch": 2857} {"train_loss": -6.565035343170166, "global_step": 119996, "epoch": 2857} {"train_loss": -6.5307159423828125, "global_step": 119997, "epoch": 2857} {"train_loss": -6.484400272369385, "global_step": 119998, "epoch": 2857} {"train_loss": -6.527344703674316, "global_step": 119999, "epoch": 2857} {"train_loss": -6.538018226623535, "global_step": 120000, "epoch": 2857} {"train_loss": -6.515256404876709, "global_step": 120001, "epoch": 2857} {"train_loss": -6.542898178100586, "global_step": 120002, "epoch": 2857} {"train_loss": -6.398976802825928, "global_step": 120003, "epoch": 2857} {"train_loss": -6.489563941955566, "global_step": 120004, "epoch": 2857} {"train_loss": -6.6350321769714355, "global_step": 120005, "epoch": 2857} {"train_loss": -6.5487284660339355, "global_step": 120006, "epoch": 2857} {"train_loss": -6.424991130828857, "global_step": 120007, "epoch": 2857} {"train_loss": -6.590436935424805, "global_step": 120008, "epoch": 2857} {"train_loss": -6.452619552612305, "global_step": 120009, "epoch": 2857} {"train_loss": -6.534440040588379, "global_step": 120010, "epoch": 2857} {"train_loss": -6.5107011795043945, "global_step": 120011, "epoch": 2857} {"train_loss": -6.526226043701172, "global_step": 120012, "epoch": 2857} {"train_loss": -6.514077186584473, "global_step": 120013, "epoch": 2857} {"train_loss": -6.4524078369140625, "global_step": 120014, "epoch": 2857} {"train_loss": -6.494503021240234, "global_step": 120015, "epoch": 2857} {"train_loss": -6.401339530944824, "global_step": 120016, "epoch": 2857} {"train_loss": -6.537820816040039, "global_step": 120017, "epoch": 2857} {"train_loss": -6.569824695587158, "global_step": 120018, "epoch": 2857} {"train_loss": -6.563541889190674, "global_step": 120019, "epoch": 2857} {"train_loss": -6.620479583740234, "global_step": 120020, "epoch": 2857} {"train_loss": -6.4737396240234375, "global_step": 120021, "epoch": 2857} {"train_loss": -6.677229881286621, "global_step": 120022, "epoch": 2857} {"train_loss": -6.54945707321167, "global_step": 120023, "epoch": 2857} {"train_loss": -6.519697666168213, "global_step": 120024, "epoch": 2857} {"train_loss": -6.566061019897461, "global_step": 120025, "epoch": 2857} {"train_loss": -6.492404937744141, "global_step": 120026, "epoch": 2857} {"train_loss": -6.575364589691162, "global_step": 120027, "epoch": 2857} {"train_loss": -6.435202121734619, "global_step": 120028, "epoch": 2857} {"train_loss": -6.44583797454834, "global_step": 120029, "epoch": 2857} {"train_loss": -6.567508697509766, "global_step": 120030, "epoch": 2857} {"train_loss": -6.4429216384887695, "global_step": 120031, "epoch": 2857} {"train_loss": -6.515717029571533, "global_step": 120032, "epoch": 2857} {"train_loss": -6.6993865966796875, "global_step": 120033, "epoch": 2857} {"train_loss": -6.587357044219971, "global_step": 120034, "epoch": 2857} {"train_loss": -6.524671168554397, "global_step": 120035, "epoch": 2857, "val_loss": 68092.0859375} {"train_loss": -6.503028869628906, "global_step": 120036, "epoch": 2858} {"train_loss": -6.595979690551758, "global_step": 120037, "epoch": 2858} {"train_loss": -6.476940155029297, "global_step": 120038, "epoch": 2858} {"train_loss": -6.478760719299316, "global_step": 120039, "epoch": 2858} {"train_loss": -6.405548095703125, "global_step": 120040, "epoch": 2858} {"train_loss": -6.507023811340332, "global_step": 120041, "epoch": 2858} {"train_loss": -6.4888200759887695, "global_step": 120042, "epoch": 2858} {"train_loss": -6.530696868896484, "global_step": 120043, "epoch": 2858} {"train_loss": -6.511910915374756, "global_step": 120044, "epoch": 2858} {"train_loss": -6.433584213256836, "global_step": 120045, "epoch": 2858} {"train_loss": -6.51118803024292, "global_step": 120046, "epoch": 2858} {"train_loss": -6.438238143920898, "global_step": 120047, "epoch": 2858} {"train_loss": -6.553297996520996, "global_step": 120048, "epoch": 2858} {"train_loss": -6.6071391105651855, "global_step": 120049, "epoch": 2858} {"train_loss": -6.452549934387207, "global_step": 120050, "epoch": 2858} {"train_loss": -6.631751537322998, "global_step": 120051, "epoch": 2858} {"train_loss": -6.503005027770996, "global_step": 120052, "epoch": 2858} {"train_loss": -6.504735946655273, "global_step": 120053, "epoch": 2858} {"train_loss": -6.48970890045166, "global_step": 120054, "epoch": 2858} {"train_loss": -6.5709052085876465, "global_step": 120055, "epoch": 2858} {"train_loss": -6.52821683883667, "global_step": 120056, "epoch": 2858} {"train_loss": -6.519624710083008, "global_step": 120057, "epoch": 2858} {"train_loss": -6.643721580505371, "global_step": 120058, "epoch": 2858} {"train_loss": -6.543399810791016, "global_step": 120059, "epoch": 2858} {"train_loss": -6.6558027267456055, "global_step": 120060, "epoch": 2858} {"train_loss": -6.446004867553711, "global_step": 120061, "epoch": 2858} {"train_loss": -6.5608930587768555, "global_step": 120062, "epoch": 2858} {"train_loss": -6.467399597167969, "global_step": 120063, "epoch": 2858} {"train_loss": -6.544198036193848, "global_step": 120064, "epoch": 2858} {"train_loss": -6.596105098724365, "global_step": 120065, "epoch": 2858} {"train_loss": -6.566067695617676, "global_step": 120066, "epoch": 2858} {"train_loss": -6.608772277832031, "global_step": 120067, "epoch": 2858} {"train_loss": -6.509676456451416, "global_step": 120068, "epoch": 2858} {"train_loss": -6.584848403930664, "global_step": 120069, "epoch": 2858} {"train_loss": -6.509156703948975, "global_step": 120070, "epoch": 2858} {"train_loss": -6.457709789276123, "global_step": 120071, "epoch": 2858} {"train_loss": -6.566243648529053, "global_step": 120072, "epoch": 2858} {"train_loss": -6.537721633911133, "global_step": 120073, "epoch": 2858} {"train_loss": -6.522428512573242, "global_step": 120074, "epoch": 2858} {"train_loss": -6.411527633666992, "global_step": 120075, "epoch": 2858} {"train_loss": -6.548447608947754, "global_step": 120076, "epoch": 2858} {"train_loss": -6.522591431935628, "global_step": 120077, "epoch": 2858, "val_loss": 68290.9140625} {"train_loss": -6.483927249908447, "global_step": 120078, "epoch": 2859} {"train_loss": -6.589088439941406, "global_step": 120079, "epoch": 2859} {"train_loss": -6.383858680725098, "global_step": 120080, "epoch": 2859} {"train_loss": -6.5850653648376465, "global_step": 120081, "epoch": 2859} {"train_loss": -6.495704650878906, "global_step": 120082, "epoch": 2859} {"train_loss": -6.387628555297852, "global_step": 120083, "epoch": 2859} {"train_loss": -6.514474868774414, "global_step": 120084, "epoch": 2859} {"train_loss": -6.395939826965332, "global_step": 120085, "epoch": 2859} {"train_loss": -6.443387031555176, "global_step": 120086, "epoch": 2859} {"train_loss": -6.600436210632324, "global_step": 120087, "epoch": 2859} {"train_loss": -6.521014213562012, "global_step": 120088, "epoch": 2859} {"train_loss": -6.569547653198242, "global_step": 120089, "epoch": 2859} {"train_loss": -6.586050987243652, "global_step": 120090, "epoch": 2859} {"train_loss": -6.536555290222168, "global_step": 120091, "epoch": 2859} {"train_loss": -6.593860626220703, "global_step": 120092, "epoch": 2859} {"train_loss": -6.433940410614014, "global_step": 120093, "epoch": 2859} {"train_loss": -6.536367893218994, "global_step": 120094, "epoch": 2859} {"train_loss": -6.545053958892822, "global_step": 120095, "epoch": 2859} {"train_loss": -6.428602695465088, "global_step": 120096, "epoch": 2859} {"train_loss": -6.473634719848633, "global_step": 120097, "epoch": 2859} {"train_loss": -6.5492987632751465, "global_step": 120098, "epoch": 2859} {"train_loss": -6.539355278015137, "global_step": 120099, "epoch": 2859} {"train_loss": -6.618109226226807, "global_step": 120100, "epoch": 2859} {"train_loss": -6.421989440917969, "global_step": 120101, "epoch": 2859} {"train_loss": -6.596030235290527, "global_step": 120102, "epoch": 2859} {"train_loss": -6.470782279968262, "global_step": 120103, "epoch": 2859} {"train_loss": -6.263179302215576, "global_step": 120104, "epoch": 2859} {"train_loss": -6.497981071472168, "global_step": 120105, "epoch": 2859} {"train_loss": -6.3657121658325195, "global_step": 120106, "epoch": 2859} {"train_loss": -6.3785858154296875, "global_step": 120107, "epoch": 2859} {"train_loss": -6.5097198486328125, "global_step": 120108, "epoch": 2859} {"train_loss": -6.337275981903076, "global_step": 120109, "epoch": 2859} {"train_loss": -6.456389427185059, "global_step": 120110, "epoch": 2859} {"train_loss": -6.321508884429932, "global_step": 120111, "epoch": 2859} {"train_loss": -6.370349884033203, "global_step": 120112, "epoch": 2859} {"train_loss": -6.324834823608398, "global_step": 120113, "epoch": 2859} {"train_loss": -6.568342685699463, "global_step": 120114, "epoch": 2859} {"train_loss": -6.427667140960693, "global_step": 120115, "epoch": 2859} {"train_loss": -6.514338493347168, "global_step": 120116, "epoch": 2859} {"train_loss": -6.507604598999023, "global_step": 120117, "epoch": 2859} {"train_loss": -6.502649784088135, "global_step": 120118, "epoch": 2859} {"train_loss": -6.4796447186242965, "global_step": 120119, "epoch": 2859, "val_loss": 68050.34375} {"train_loss": -6.410234451293945, "global_step": 120120, "epoch": 2860} {"train_loss": -6.387892246246338, "global_step": 120121, "epoch": 2860} {"train_loss": -6.337759971618652, "global_step": 120122, "epoch": 2860} {"train_loss": -6.433261871337891, "global_step": 120123, "epoch": 2860} {"train_loss": -6.405137062072754, "global_step": 120124, "epoch": 2860} {"train_loss": -6.509663105010986, "global_step": 120125, "epoch": 2860} {"train_loss": -6.5268964767456055, "global_step": 120126, "epoch": 2860} {"train_loss": -6.478145599365234, "global_step": 120127, "epoch": 2860} {"train_loss": -6.549498558044434, "global_step": 120128, "epoch": 2860} {"train_loss": -6.502683162689209, "global_step": 120129, "epoch": 2860} {"train_loss": -6.562064170837402, "global_step": 120130, "epoch": 2860} {"train_loss": -6.6878132820129395, "global_step": 120131, "epoch": 2860} {"train_loss": -6.630949020385742, "global_step": 120132, "epoch": 2860} {"train_loss": -6.476001739501953, "global_step": 120133, "epoch": 2860} {"train_loss": -6.5395355224609375, "global_step": 120134, "epoch": 2860} {"train_loss": -6.676181793212891, "global_step": 120135, "epoch": 2860} {"train_loss": -6.5323486328125, "global_step": 120136, "epoch": 2860} {"train_loss": -6.685656547546387, "global_step": 120137, "epoch": 2860} {"train_loss": -6.552306175231934, "global_step": 120138, "epoch": 2860} {"train_loss": -6.611663818359375, "global_step": 120139, "epoch": 2860} {"train_loss": -6.536504745483398, "global_step": 120140, "epoch": 2860} {"train_loss": -6.5460100173950195, "global_step": 120141, "epoch": 2860} {"train_loss": -6.511245250701904, "global_step": 120142, "epoch": 2860} {"train_loss": -6.616020202636719, "global_step": 120143, "epoch": 2860} {"train_loss": -6.56196928024292, "global_step": 120144, "epoch": 2860} {"train_loss": -6.558634281158447, "global_step": 120145, "epoch": 2860} {"train_loss": -6.617745399475098, "global_step": 120146, "epoch": 2860} {"train_loss": -6.567694664001465, "global_step": 120147, "epoch": 2860} {"train_loss": -6.652741432189941, "global_step": 120148, "epoch": 2860} {"train_loss": -6.564960956573486, "global_step": 120149, "epoch": 2860} {"train_loss": -6.580013751983643, "global_step": 120150, "epoch": 2860} {"train_loss": -6.611571788787842, "global_step": 120151, "epoch": 2860} {"train_loss": -6.52476692199707, "global_step": 120152, "epoch": 2860} {"train_loss": -6.586192607879639, "global_step": 120153, "epoch": 2860} {"train_loss": -6.587347030639648, "global_step": 120154, "epoch": 2860} {"train_loss": -6.544264793395996, "global_step": 120155, "epoch": 2860} {"train_loss": -6.549684524536133, "global_step": 120156, "epoch": 2860} {"train_loss": -6.565701484680176, "global_step": 120157, "epoch": 2860} {"train_loss": -6.478438854217529, "global_step": 120158, "epoch": 2860} {"train_loss": -6.479863166809082, "global_step": 120159, "epoch": 2860} {"train_loss": -6.471324443817139, "global_step": 120160, "epoch": 2860} {"train_loss": -6.539725360416231, "global_step": 120161, "epoch": 2860, "val_loss": 68164.0234375} {"train_loss": -6.532012462615967, "global_step": 120162, "epoch": 2861} {"train_loss": -6.541136741638184, "global_step": 120163, "epoch": 2861} {"train_loss": -6.529268264770508, "global_step": 120164, "epoch": 2861} {"train_loss": -6.5496625900268555, "global_step": 120165, "epoch": 2861} {"train_loss": -6.478646278381348, "global_step": 120166, "epoch": 2861} {"train_loss": -6.518884181976318, "global_step": 120167, "epoch": 2861} {"train_loss": -6.505285263061523, "global_step": 120168, "epoch": 2861} {"train_loss": -6.450277805328369, "global_step": 120169, "epoch": 2861} {"train_loss": -6.5081987380981445, "global_step": 120170, "epoch": 2861} {"train_loss": -6.468764781951904, "global_step": 120171, "epoch": 2861} {"train_loss": -6.512868881225586, "global_step": 120172, "epoch": 2861} {"train_loss": -6.482549667358398, "global_step": 120173, "epoch": 2861} {"train_loss": -6.44686222076416, "global_step": 120174, "epoch": 2861} {"train_loss": -6.5251383781433105, "global_step": 120175, "epoch": 2861} {"train_loss": -6.3683671951293945, "global_step": 120176, "epoch": 2861} {"train_loss": -6.454070091247559, "global_step": 120177, "epoch": 2861} {"train_loss": -6.413106918334961, "global_step": 120178, "epoch": 2861} {"train_loss": -6.5592522621154785, "global_step": 120179, "epoch": 2861} {"train_loss": -6.612507343292236, "global_step": 120180, "epoch": 2861} {"train_loss": -6.595033645629883, "global_step": 120181, "epoch": 2861} {"train_loss": -6.582086086273193, "global_step": 120182, "epoch": 2861} {"train_loss": -6.5091962814331055, "global_step": 120183, "epoch": 2861} {"train_loss": -6.6029253005981445, "global_step": 120184, "epoch": 2861} {"train_loss": -6.461821556091309, "global_step": 120185, "epoch": 2861} {"train_loss": -6.661316871643066, "global_step": 120186, "epoch": 2861} {"train_loss": -6.4851555824279785, "global_step": 120187, "epoch": 2861} {"train_loss": -6.473907470703125, "global_step": 120188, "epoch": 2861} {"train_loss": -6.469703674316406, "global_step": 120189, "epoch": 2861} {"train_loss": -6.608753681182861, "global_step": 120190, "epoch": 2861} {"train_loss": -6.568210601806641, "global_step": 120191, "epoch": 2861} {"train_loss": -6.534001350402832, "global_step": 120192, "epoch": 2861} {"train_loss": -6.6330366134643555, "global_step": 120193, "epoch": 2861} {"train_loss": -6.569232940673828, "global_step": 120194, "epoch": 2861} {"train_loss": -6.394067764282227, "global_step": 120195, "epoch": 2861} {"train_loss": -6.520395278930664, "global_step": 120196, "epoch": 2861} {"train_loss": -6.531937599182129, "global_step": 120197, "epoch": 2861} {"train_loss": -6.5788350105285645, "global_step": 120198, "epoch": 2861} {"train_loss": -6.505333423614502, "global_step": 120199, "epoch": 2861} {"train_loss": -6.65110969543457, "global_step": 120200, "epoch": 2861} {"train_loss": -6.564799785614014, "global_step": 120201, "epoch": 2861} {"train_loss": -6.512302398681641, "global_step": 120202, "epoch": 2861} {"train_loss": -6.524302164713542, "global_step": 120203, "epoch": 2861, "val_loss": 67823.3515625} {"train_loss": -6.583372116088867, "global_step": 120204, "epoch": 2862} {"train_loss": -6.623884201049805, "global_step": 120205, "epoch": 2862} {"train_loss": -6.6190972328186035, "global_step": 120206, "epoch": 2862} {"train_loss": -6.649261474609375, "global_step": 120207, "epoch": 2862} {"train_loss": -6.593843460083008, "global_step": 120208, "epoch": 2862} {"train_loss": -6.544525146484375, "global_step": 120209, "epoch": 2862} {"train_loss": -6.514432907104492, "global_step": 120210, "epoch": 2862} {"train_loss": -6.512231826782227, "global_step": 120211, "epoch": 2862} {"train_loss": -6.429426193237305, "global_step": 120212, "epoch": 2862} {"train_loss": -6.535398483276367, "global_step": 120213, "epoch": 2862} {"train_loss": -6.625767707824707, "global_step": 120214, "epoch": 2862} {"train_loss": -6.583914756774902, "global_step": 120215, "epoch": 2862} {"train_loss": -6.5151801109313965, "global_step": 120216, "epoch": 2862} {"train_loss": -6.43366813659668, "global_step": 120217, "epoch": 2862} {"train_loss": -6.470194339752197, "global_step": 120218, "epoch": 2862} {"train_loss": -6.549560546875, "global_step": 120219, "epoch": 2862} {"train_loss": -6.444566249847412, "global_step": 120220, "epoch": 2862} {"train_loss": -6.58862829208374, "global_step": 120221, "epoch": 2862} {"train_loss": -6.577744960784912, "global_step": 120222, "epoch": 2862} {"train_loss": -6.5990495681762695, "global_step": 120223, "epoch": 2862} {"train_loss": -6.451076507568359, "global_step": 120224, "epoch": 2862} {"train_loss": -6.584954738616943, "global_step": 120225, "epoch": 2862} {"train_loss": -6.567152500152588, "global_step": 120226, "epoch": 2862} {"train_loss": -6.53921365737915, "global_step": 120227, "epoch": 2862} {"train_loss": -6.555633544921875, "global_step": 120228, "epoch": 2862} {"train_loss": -6.5926513671875, "global_step": 120229, "epoch": 2862} {"train_loss": -6.551070213317871, "global_step": 120230, "epoch": 2862} {"train_loss": -6.5040693283081055, "global_step": 120231, "epoch": 2862} {"train_loss": -6.567445755004883, "global_step": 120232, "epoch": 2862} {"train_loss": -6.323609828948975, "global_step": 120233, "epoch": 2862} {"train_loss": -6.575106620788574, "global_step": 120234, "epoch": 2862} {"train_loss": -6.493370532989502, "global_step": 120235, "epoch": 2862} {"train_loss": -6.61699104309082, "global_step": 120236, "epoch": 2862} {"train_loss": -6.464499473571777, "global_step": 120237, "epoch": 2862} {"train_loss": -6.485252380371094, "global_step": 120238, "epoch": 2862} {"train_loss": -6.667816162109375, "global_step": 120239, "epoch": 2862} {"train_loss": -6.507658958435059, "global_step": 120240, "epoch": 2862} {"train_loss": -6.4798784255981445, "global_step": 120241, "epoch": 2862} {"train_loss": -6.510644435882568, "global_step": 120242, "epoch": 2862} {"train_loss": -6.462350845336914, "global_step": 120243, "epoch": 2862} {"train_loss": -6.626215934753418, "global_step": 120244, "epoch": 2862} {"train_loss": -6.536944934300014, "global_step": 120245, "epoch": 2862, "val_loss": 67945.6171875} {"train_loss": -6.54239559173584, "global_step": 120246, "epoch": 2863} {"train_loss": -6.506192207336426, "global_step": 120247, "epoch": 2863} {"train_loss": -6.411608695983887, "global_step": 120248, "epoch": 2863} {"train_loss": -6.579736709594727, "global_step": 120249, "epoch": 2863} {"train_loss": -6.402866363525391, "global_step": 120250, "epoch": 2863} {"train_loss": -6.455537796020508, "global_step": 120251, "epoch": 2863} {"train_loss": -6.47083044052124, "global_step": 120252, "epoch": 2863} {"train_loss": -6.55000114440918, "global_step": 120253, "epoch": 2863} {"train_loss": -6.584676742553711, "global_step": 120254, "epoch": 2863} {"train_loss": -6.538599014282227, "global_step": 120255, "epoch": 2863} {"train_loss": -6.602031707763672, "global_step": 120256, "epoch": 2863} {"train_loss": -6.537909507751465, "global_step": 120257, "epoch": 2863} {"train_loss": -6.467902183532715, "global_step": 120258, "epoch": 2863} {"train_loss": -6.477593421936035, "global_step": 120259, "epoch": 2863} {"train_loss": -6.4461164474487305, "global_step": 120260, "epoch": 2863} {"train_loss": -6.463672161102295, "global_step": 120261, "epoch": 2863} {"train_loss": -6.552460670471191, "global_step": 120262, "epoch": 2863} {"train_loss": -6.444083213806152, "global_step": 120263, "epoch": 2863} {"train_loss": -6.506688117980957, "global_step": 120264, "epoch": 2863} {"train_loss": -6.526603698730469, "global_step": 120265, "epoch": 2863} {"train_loss": -6.508477687835693, "global_step": 120266, "epoch": 2863} {"train_loss": -6.539249420166016, "global_step": 120267, "epoch": 2863} {"train_loss": -6.438611030578613, "global_step": 120268, "epoch": 2863} {"train_loss": -6.523388862609863, "global_step": 120269, "epoch": 2863} {"train_loss": -6.620637893676758, "global_step": 120270, "epoch": 2863} {"train_loss": -6.567863464355469, "global_step": 120271, "epoch": 2863} {"train_loss": -6.472838401794434, "global_step": 120272, "epoch": 2863} {"train_loss": -6.525628089904785, "global_step": 120273, "epoch": 2863} {"train_loss": -6.691717624664307, "global_step": 120274, "epoch": 2863} {"train_loss": -6.529277324676514, "global_step": 120275, "epoch": 2863} {"train_loss": -6.508831977844238, "global_step": 120276, "epoch": 2863} {"train_loss": -6.495440483093262, "global_step": 120277, "epoch": 2863} {"train_loss": -6.556179046630859, "global_step": 120278, "epoch": 2863} {"train_loss": -6.5992112159729, "global_step": 120279, "epoch": 2863} {"train_loss": -6.411480903625488, "global_step": 120280, "epoch": 2863} {"train_loss": -6.600241184234619, "global_step": 120281, "epoch": 2863} {"train_loss": -6.387375354766846, "global_step": 120282, "epoch": 2863} {"train_loss": -6.544456481933594, "global_step": 120283, "epoch": 2863} {"train_loss": -6.521999835968018, "global_step": 120284, "epoch": 2863} {"train_loss": -6.575376510620117, "global_step": 120285, "epoch": 2863} {"train_loss": -6.52813720703125, "global_step": 120286, "epoch": 2863} {"train_loss": -6.519294647943406, "global_step": 120287, "epoch": 2863, "val_loss": 67993.7578125} {"train_loss": -6.645685195922852, "global_step": 120288, "epoch": 2864} {"train_loss": -6.497650146484375, "global_step": 120289, "epoch": 2864} {"train_loss": -6.491612911224365, "global_step": 120290, "epoch": 2864} {"train_loss": -6.4520721435546875, "global_step": 120291, "epoch": 2864} {"train_loss": -6.411901950836182, "global_step": 120292, "epoch": 2864} {"train_loss": -6.553138732910156, "global_step": 120293, "epoch": 2864} {"train_loss": -6.50905704498291, "global_step": 120294, "epoch": 2864} {"train_loss": -6.429994583129883, "global_step": 120295, "epoch": 2864} {"train_loss": -6.529223442077637, "global_step": 120296, "epoch": 2864} {"train_loss": -6.4035491943359375, "global_step": 120297, "epoch": 2864} {"train_loss": -6.476883888244629, "global_step": 120298, "epoch": 2864} {"train_loss": -6.620617866516113, "global_step": 120299, "epoch": 2864} {"train_loss": -6.504083633422852, "global_step": 120300, "epoch": 2864} {"train_loss": -6.520061492919922, "global_step": 120301, "epoch": 2864} {"train_loss": -6.509139060974121, "global_step": 120302, "epoch": 2864} {"train_loss": -6.541481018066406, "global_step": 120303, "epoch": 2864} {"train_loss": -6.48164176940918, "global_step": 120304, "epoch": 2864} {"train_loss": -6.456974983215332, "global_step": 120305, "epoch": 2864} {"train_loss": -6.600997447967529, "global_step": 120306, "epoch": 2864} {"train_loss": -6.60783576965332, "global_step": 120307, "epoch": 2864} {"train_loss": -6.551850318908691, "global_step": 120308, "epoch": 2864} {"train_loss": -6.622599124908447, "global_step": 120309, "epoch": 2864} {"train_loss": -6.503593921661377, "global_step": 120310, "epoch": 2864} {"train_loss": -6.541815757751465, "global_step": 120311, "epoch": 2864} {"train_loss": -6.610382080078125, "global_step": 120312, "epoch": 2864} {"train_loss": -6.534819602966309, "global_step": 120313, "epoch": 2864} {"train_loss": -6.553232192993164, "global_step": 120314, "epoch": 2864} {"train_loss": -6.624529838562012, "global_step": 120315, "epoch": 2864} {"train_loss": -6.515289306640625, "global_step": 120316, "epoch": 2864} {"train_loss": -6.453767776489258, "global_step": 120317, "epoch": 2864} {"train_loss": -6.375983238220215, "global_step": 120318, "epoch": 2864} {"train_loss": -6.602205276489258, "global_step": 120319, "epoch": 2864} {"train_loss": -6.486259460449219, "global_step": 120320, "epoch": 2864} {"train_loss": -6.423306465148926, "global_step": 120321, "epoch": 2864} {"train_loss": -6.4940080642700195, "global_step": 120322, "epoch": 2864} {"train_loss": -6.485197067260742, "global_step": 120323, "epoch": 2864} {"train_loss": -6.548171043395996, "global_step": 120324, "epoch": 2864} {"train_loss": -6.530951499938965, "global_step": 120325, "epoch": 2864} {"train_loss": -6.490315914154053, "global_step": 120326, "epoch": 2864} {"train_loss": -6.618573188781738, "global_step": 120327, "epoch": 2864} {"train_loss": -6.4843244552612305, "global_step": 120328, "epoch": 2864} {"train_loss": -6.519678013665335, "global_step": 120329, "epoch": 2864, "val_loss": 67812.7578125} {"train_loss": -6.516173839569092, "global_step": 120330, "epoch": 2865} {"train_loss": -6.598758697509766, "global_step": 120331, "epoch": 2865} {"train_loss": -6.508736610412598, "global_step": 120332, "epoch": 2865} {"train_loss": -6.642397403717041, "global_step": 120333, "epoch": 2865} {"train_loss": -6.560487747192383, "global_step": 120334, "epoch": 2865} {"train_loss": -6.648420810699463, "global_step": 120335, "epoch": 2865} {"train_loss": -6.634043216705322, "global_step": 120336, "epoch": 2865} {"train_loss": -6.596103668212891, "global_step": 120337, "epoch": 2865} {"train_loss": -6.575672626495361, "global_step": 120338, "epoch": 2865} {"train_loss": -6.65958833694458, "global_step": 120339, "epoch": 2865} {"train_loss": -6.614680290222168, "global_step": 120340, "epoch": 2865} {"train_loss": -6.557985782623291, "global_step": 120341, "epoch": 2865} {"train_loss": -6.595162391662598, "global_step": 120342, "epoch": 2865} {"train_loss": -6.601993560791016, "global_step": 120343, "epoch": 2865} {"train_loss": -6.622287750244141, "global_step": 120344, "epoch": 2865} {"train_loss": -6.604547500610352, "global_step": 120345, "epoch": 2865} {"train_loss": -6.555020332336426, "global_step": 120346, "epoch": 2865} {"train_loss": -6.589024066925049, "global_step": 120347, "epoch": 2865} {"train_loss": -6.483613014221191, "global_step": 120348, "epoch": 2865} {"train_loss": -6.557895183563232, "global_step": 120349, "epoch": 2865} {"train_loss": -6.537601470947266, "global_step": 120350, "epoch": 2865} {"train_loss": -6.519491195678711, "global_step": 120351, "epoch": 2865} {"train_loss": -6.4638166427612305, "global_step": 120352, "epoch": 2865} {"train_loss": -6.5907440185546875, "global_step": 120353, "epoch": 2865} {"train_loss": -6.539611339569092, "global_step": 120354, "epoch": 2865} {"train_loss": -6.4647440910339355, "global_step": 120355, "epoch": 2865} {"train_loss": -6.5330352783203125, "global_step": 120356, "epoch": 2865} {"train_loss": -6.5708088874816895, "global_step": 120357, "epoch": 2865} {"train_loss": -6.658196926116943, "global_step": 120358, "epoch": 2865} {"train_loss": -6.538374900817871, "global_step": 120359, "epoch": 2865} {"train_loss": -6.579800128936768, "global_step": 120360, "epoch": 2865} {"train_loss": -6.511830806732178, "global_step": 120361, "epoch": 2865} {"train_loss": -6.576094627380371, "global_step": 120362, "epoch": 2865} {"train_loss": -6.579953670501709, "global_step": 120363, "epoch": 2865} {"train_loss": -6.510434150695801, "global_step": 120364, "epoch": 2865} {"train_loss": -6.571477890014648, "global_step": 120365, "epoch": 2865} {"train_loss": -6.5488972663879395, "global_step": 120366, "epoch": 2865} {"train_loss": -6.653725624084473, "global_step": 120367, "epoch": 2865} {"train_loss": -6.472745895385742, "global_step": 120368, "epoch": 2865} {"train_loss": -6.533303260803223, "global_step": 120369, "epoch": 2865} {"train_loss": -6.533491134643555, "global_step": 120370, "epoch": 2865} {"train_loss": -6.565507411956787, "global_step": 120371, "epoch": 2865, "val_loss": 67826.7265625} {"train_loss": -6.556262969970703, "global_step": 120372, "epoch": 2866} {"train_loss": -6.379450798034668, "global_step": 120373, "epoch": 2866} {"train_loss": -6.433803081512451, "global_step": 120374, "epoch": 2866} {"train_loss": -6.5738654136657715, "global_step": 120375, "epoch": 2866} {"train_loss": -6.421709060668945, "global_step": 120376, "epoch": 2866} {"train_loss": -6.550942420959473, "global_step": 120377, "epoch": 2866} {"train_loss": -6.440463066101074, "global_step": 120378, "epoch": 2866} {"train_loss": -6.406437873840332, "global_step": 120379, "epoch": 2866} {"train_loss": -6.593498229980469, "global_step": 120380, "epoch": 2866} {"train_loss": -6.496851444244385, "global_step": 120381, "epoch": 2866} {"train_loss": -6.41134786605835, "global_step": 120382, "epoch": 2866} {"train_loss": -6.510808944702148, "global_step": 120383, "epoch": 2866} {"train_loss": -6.597053527832031, "global_step": 120384, "epoch": 2866} {"train_loss": -6.584629535675049, "global_step": 120385, "epoch": 2866} {"train_loss": -6.571026802062988, "global_step": 120386, "epoch": 2866} {"train_loss": -6.4671101570129395, "global_step": 120387, "epoch": 2866} {"train_loss": -6.405388832092285, "global_step": 120388, "epoch": 2866} {"train_loss": -6.4906535148620605, "global_step": 120389, "epoch": 2866} {"train_loss": -6.522679805755615, "global_step": 120390, "epoch": 2866} {"train_loss": -6.433259010314941, "global_step": 120391, "epoch": 2866} {"train_loss": -6.517352104187012, "global_step": 120392, "epoch": 2866} {"train_loss": -6.456497669219971, "global_step": 120393, "epoch": 2866} {"train_loss": -6.327695369720459, "global_step": 120394, "epoch": 2866} {"train_loss": -6.528923988342285, "global_step": 120395, "epoch": 2866} {"train_loss": -6.401032447814941, "global_step": 120396, "epoch": 2866} {"train_loss": -6.607303619384766, "global_step": 120397, "epoch": 2866} {"train_loss": -6.266834259033203, "global_step": 120398, "epoch": 2866} {"train_loss": -6.3883867263793945, "global_step": 120399, "epoch": 2866} {"train_loss": -6.432576656341553, "global_step": 120400, "epoch": 2866} {"train_loss": -6.365854263305664, "global_step": 120401, "epoch": 2866} {"train_loss": -6.591197967529297, "global_step": 120402, "epoch": 2866} {"train_loss": -6.3932695388793945, "global_step": 120403, "epoch": 2866} {"train_loss": -6.561285495758057, "global_step": 120404, "epoch": 2866} {"train_loss": -6.541682243347168, "global_step": 120405, "epoch": 2866} {"train_loss": -6.502306938171387, "global_step": 120406, "epoch": 2866} {"train_loss": -6.494569778442383, "global_step": 120407, "epoch": 2866} {"train_loss": -6.508411884307861, "global_step": 120408, "epoch": 2866} {"train_loss": -6.3816070556640625, "global_step": 120409, "epoch": 2866} {"train_loss": -6.428264617919922, "global_step": 120410, "epoch": 2866} {"train_loss": -6.510700225830078, "global_step": 120411, "epoch": 2866} {"train_loss": -6.300311088562012, "global_step": 120412, "epoch": 2866} {"train_loss": -6.470117478143601, "global_step": 120413, "epoch": 2866, "val_loss": 68425.296875} {"train_loss": -6.305953025817871, "global_step": 120414, "epoch": 2867} {"train_loss": -6.399596214294434, "global_step": 120415, "epoch": 2867} {"train_loss": -6.337337493896484, "global_step": 120416, "epoch": 2867} {"train_loss": -6.505342960357666, "global_step": 120417, "epoch": 2867} {"train_loss": -6.331001281738281, "global_step": 120418, "epoch": 2867} {"train_loss": -6.4190897941589355, "global_step": 120419, "epoch": 2867} {"train_loss": -6.269448280334473, "global_step": 120420, "epoch": 2867} {"train_loss": -6.363367557525635, "global_step": 120421, "epoch": 2867} {"train_loss": -6.471005439758301, "global_step": 120422, "epoch": 2867} {"train_loss": -6.407314300537109, "global_step": 120423, "epoch": 2867} {"train_loss": -6.365072250366211, "global_step": 120424, "epoch": 2867} {"train_loss": -6.4141693115234375, "global_step": 120425, "epoch": 2867} {"train_loss": -6.469878196716309, "global_step": 120426, "epoch": 2867} {"train_loss": -6.463377475738525, "global_step": 120427, "epoch": 2867} {"train_loss": -6.504459381103516, "global_step": 120428, "epoch": 2867} {"train_loss": -6.41472864151001, "global_step": 120429, "epoch": 2867} {"train_loss": -6.44476318359375, "global_step": 120430, "epoch": 2867} {"train_loss": -6.408318519592285, "global_step": 120431, "epoch": 2867} {"train_loss": -6.45702600479126, "global_step": 120432, "epoch": 2867} {"train_loss": -6.453965187072754, "global_step": 120433, "epoch": 2867} {"train_loss": -6.527633190155029, "global_step": 120434, "epoch": 2867} {"train_loss": -6.430846214294434, "global_step": 120435, "epoch": 2867} {"train_loss": -6.423763751983643, "global_step": 120436, "epoch": 2867} {"train_loss": -6.364010810852051, "global_step": 120437, "epoch": 2867} {"train_loss": -6.541611671447754, "global_step": 120438, "epoch": 2867} {"train_loss": -6.420938968658447, "global_step": 120439, "epoch": 2867} {"train_loss": -6.436748504638672, "global_step": 120440, "epoch": 2867} {"train_loss": -6.499123573303223, "global_step": 120441, "epoch": 2867} {"train_loss": -6.53692102432251, "global_step": 120442, "epoch": 2867} {"train_loss": -6.531375885009766, "global_step": 120443, "epoch": 2867} {"train_loss": -6.5012593269348145, "global_step": 120444, "epoch": 2867} {"train_loss": -6.549101829528809, "global_step": 120445, "epoch": 2867} {"train_loss": -6.463788986206055, "global_step": 120446, "epoch": 2867} {"train_loss": -6.587769508361816, "global_step": 120447, "epoch": 2867} {"train_loss": -6.357073783874512, "global_step": 120448, "epoch": 2867} {"train_loss": -6.550069332122803, "global_step": 120449, "epoch": 2867} {"train_loss": -6.4598069190979, "global_step": 120450, "epoch": 2867} {"train_loss": -6.614583969116211, "global_step": 120451, "epoch": 2867} {"train_loss": -6.456126689910889, "global_step": 120452, "epoch": 2867} {"train_loss": -6.475929260253906, "global_step": 120453, "epoch": 2867} {"train_loss": -6.593380451202393, "global_step": 120454, "epoch": 2867} {"train_loss": -6.454060247966221, "global_step": 120455, "epoch": 2867, "val_loss": 67918.6484375} {"train_loss": -6.5963616371154785, "global_step": 120456, "epoch": 2868} {"train_loss": -6.575098037719727, "global_step": 120457, "epoch": 2868} {"train_loss": -6.534567832946777, "global_step": 120458, "epoch": 2868} {"train_loss": -6.445777416229248, "global_step": 120459, "epoch": 2868} {"train_loss": -6.481984615325928, "global_step": 120460, "epoch": 2868} {"train_loss": -6.518559455871582, "global_step": 120461, "epoch": 2868} {"train_loss": -6.499083518981934, "global_step": 120462, "epoch": 2868} {"train_loss": -6.605849266052246, "global_step": 120463, "epoch": 2868} {"train_loss": -6.5279364585876465, "global_step": 120464, "epoch": 2868} {"train_loss": -6.662395000457764, "global_step": 120465, "epoch": 2868} {"train_loss": -6.5420756340026855, "global_step": 120466, "epoch": 2868} {"train_loss": -6.595465183258057, "global_step": 120467, "epoch": 2868} {"train_loss": -6.560153961181641, "global_step": 120468, "epoch": 2868} {"train_loss": -6.556173801422119, "global_step": 120469, "epoch": 2868} {"train_loss": -6.5420427322387695, "global_step": 120470, "epoch": 2868} {"train_loss": -6.590534687042236, "global_step": 120471, "epoch": 2868} {"train_loss": -6.512444496154785, "global_step": 120472, "epoch": 2868} {"train_loss": -6.6186676025390625, "global_step": 120473, "epoch": 2868} {"train_loss": -6.533453464508057, "global_step": 120474, "epoch": 2868} {"train_loss": -6.640898704528809, "global_step": 120475, "epoch": 2868} {"train_loss": -6.496916770935059, "global_step": 120476, "epoch": 2868} {"train_loss": -6.583024024963379, "global_step": 120477, "epoch": 2868} {"train_loss": -6.411078453063965, "global_step": 120478, "epoch": 2868} {"train_loss": -6.466719150543213, "global_step": 120479, "epoch": 2868} {"train_loss": -6.568921089172363, "global_step": 120480, "epoch": 2868} {"train_loss": -6.42629337310791, "global_step": 120481, "epoch": 2868} {"train_loss": -6.472597599029541, "global_step": 120482, "epoch": 2868} {"train_loss": -6.610551834106445, "global_step": 120483, "epoch": 2868} {"train_loss": -6.404891014099121, "global_step": 120484, "epoch": 2868} {"train_loss": -6.599712371826172, "global_step": 120485, "epoch": 2868} {"train_loss": -6.572479724884033, "global_step": 120486, "epoch": 2868} {"train_loss": -6.593289375305176, "global_step": 120487, "epoch": 2868} {"train_loss": -6.534367084503174, "global_step": 120488, "epoch": 2868} {"train_loss": -6.513528823852539, "global_step": 120489, "epoch": 2868} {"train_loss": -6.53971004486084, "global_step": 120490, "epoch": 2868} {"train_loss": -6.556604385375977, "global_step": 120491, "epoch": 2868} {"train_loss": -6.542865753173828, "global_step": 120492, "epoch": 2868} {"train_loss": -6.5026960372924805, "global_step": 120493, "epoch": 2868} {"train_loss": -6.440462112426758, "global_step": 120494, "epoch": 2868} {"train_loss": -6.610461235046387, "global_step": 120495, "epoch": 2868} {"train_loss": -6.563718795776367, "global_step": 120496, "epoch": 2868} {"train_loss": -6.544622421264648, "global_step": 120497, "epoch": 2868, "val_loss": 67880.7578125} {"train_loss": -6.642342567443848, "global_step": 120498, "epoch": 2869} {"train_loss": -6.601480484008789, "global_step": 120499, "epoch": 2869} {"train_loss": -6.479225158691406, "global_step": 120500, "epoch": 2869} {"train_loss": -6.565493106842041, "global_step": 120501, "epoch": 2869} {"train_loss": -6.586407661437988, "global_step": 120502, "epoch": 2869} {"train_loss": -6.593591213226318, "global_step": 120503, "epoch": 2869} {"train_loss": -6.509346961975098, "global_step": 120504, "epoch": 2869} {"train_loss": -6.5728373527526855, "global_step": 120505, "epoch": 2869} {"train_loss": -6.458807945251465, "global_step": 120506, "epoch": 2869} {"train_loss": -6.595038414001465, "global_step": 120507, "epoch": 2869} {"train_loss": -6.391711235046387, "global_step": 120508, "epoch": 2869} {"train_loss": -6.501879692077637, "global_step": 120509, "epoch": 2869} {"train_loss": -6.489582061767578, "global_step": 120510, "epoch": 2869} {"train_loss": -6.493130207061768, "global_step": 120511, "epoch": 2869} {"train_loss": -6.467820167541504, "global_step": 120512, "epoch": 2869} {"train_loss": -6.559806823730469, "global_step": 120513, "epoch": 2869} {"train_loss": -6.452610969543457, "global_step": 120514, "epoch": 2869} {"train_loss": -6.585291385650635, "global_step": 120515, "epoch": 2869} {"train_loss": -6.460142612457275, "global_step": 120516, "epoch": 2869} {"train_loss": -6.442944526672363, "global_step": 120517, "epoch": 2869} {"train_loss": -6.550185203552246, "global_step": 120518, "epoch": 2869} {"train_loss": -6.404847621917725, "global_step": 120519, "epoch": 2869} {"train_loss": -6.400191783905029, "global_step": 120520, "epoch": 2869} {"train_loss": -6.478751182556152, "global_step": 120521, "epoch": 2869} {"train_loss": -6.552505016326904, "global_step": 120522, "epoch": 2869} {"train_loss": -6.406033515930176, "global_step": 120523, "epoch": 2869} {"train_loss": -6.501908302307129, "global_step": 120524, "epoch": 2869} {"train_loss": -6.569211959838867, "global_step": 120525, "epoch": 2869} {"train_loss": -6.489564895629883, "global_step": 120526, "epoch": 2869} {"train_loss": -6.439477920532227, "global_step": 120527, "epoch": 2869} {"train_loss": -6.5470476150512695, "global_step": 120528, "epoch": 2869} {"train_loss": -6.55495548248291, "global_step": 120529, "epoch": 2869} {"train_loss": -6.695664882659912, "global_step": 120530, "epoch": 2869} {"train_loss": -6.554682731628418, "global_step": 120531, "epoch": 2869} {"train_loss": -6.652066230773926, "global_step": 120532, "epoch": 2869} {"train_loss": -6.631086826324463, "global_step": 120533, "epoch": 2869} {"train_loss": -6.4348907470703125, "global_step": 120534, "epoch": 2869} {"train_loss": -6.583160877227783, "global_step": 120535, "epoch": 2869} {"train_loss": -6.532330513000488, "global_step": 120536, "epoch": 2869} {"train_loss": -6.557498455047607, "global_step": 120537, "epoch": 2869} {"train_loss": -6.513827800750732, "global_step": 120538, "epoch": 2869} {"train_loss": -6.524217219579787, "global_step": 120539, "epoch": 2869, "val_loss": 67765.046875} {"train_loss": -6.629857063293457, "global_step": 120540, "epoch": 2870} {"train_loss": -6.573670387268066, "global_step": 120541, "epoch": 2870} {"train_loss": -6.541953086853027, "global_step": 120542, "epoch": 2870} {"train_loss": -6.577139854431152, "global_step": 120543, "epoch": 2870} {"train_loss": -6.407569885253906, "global_step": 120544, "epoch": 2870} {"train_loss": -6.4934282302856445, "global_step": 120545, "epoch": 2870} {"train_loss": -6.761363983154297, "global_step": 120546, "epoch": 2870} {"train_loss": -6.522703647613525, "global_step": 120547, "epoch": 2870} {"train_loss": -6.667302131652832, "global_step": 120548, "epoch": 2870} {"train_loss": -6.757272243499756, "global_step": 120549, "epoch": 2870} {"train_loss": -6.627721786499023, "global_step": 120550, "epoch": 2870} {"train_loss": -6.509059429168701, "global_step": 120551, "epoch": 2870} {"train_loss": -6.5450439453125, "global_step": 120552, "epoch": 2870} {"train_loss": -6.6264801025390625, "global_step": 120553, "epoch": 2870} {"train_loss": -6.5946526527404785, "global_step": 120554, "epoch": 2870} {"train_loss": -6.640092849731445, "global_step": 120555, "epoch": 2870} {"train_loss": -6.620223522186279, "global_step": 120556, "epoch": 2870} {"train_loss": -6.477733135223389, "global_step": 120557, "epoch": 2870} {"train_loss": -6.560909748077393, "global_step": 120558, "epoch": 2870} {"train_loss": -6.625658988952637, "global_step": 120559, "epoch": 2870} {"train_loss": -6.5549163818359375, "global_step": 120560, "epoch": 2870} {"train_loss": -6.3711161613464355, "global_step": 120561, "epoch": 2870} {"train_loss": -6.614508628845215, "global_step": 120562, "epoch": 2870} {"train_loss": -6.4459333419799805, "global_step": 120563, "epoch": 2870} {"train_loss": -6.474331855773926, "global_step": 120564, "epoch": 2870} {"train_loss": -6.593976974487305, "global_step": 120565, "epoch": 2870} {"train_loss": -6.485878944396973, "global_step": 120566, "epoch": 2870} {"train_loss": -6.620730876922607, "global_step": 120567, "epoch": 2870} {"train_loss": -6.596974849700928, "global_step": 120568, "epoch": 2870} {"train_loss": -6.507010459899902, "global_step": 120569, "epoch": 2870} {"train_loss": -6.5808820724487305, "global_step": 120570, "epoch": 2870} {"train_loss": -6.4685797691345215, "global_step": 120571, "epoch": 2870} {"train_loss": -6.345978736877441, "global_step": 120572, "epoch": 2870} {"train_loss": -6.574847221374512, "global_step": 120573, "epoch": 2870} {"train_loss": -6.622066497802734, "global_step": 120574, "epoch": 2870} {"train_loss": -6.534153461456299, "global_step": 120575, "epoch": 2870} {"train_loss": -6.5183634757995605, "global_step": 120576, "epoch": 2870} {"train_loss": -6.518888473510742, "global_step": 120577, "epoch": 2870} {"train_loss": -6.510923862457275, "global_step": 120578, "epoch": 2870} {"train_loss": -6.629693031311035, "global_step": 120579, "epoch": 2870} {"train_loss": -6.539745330810547, "global_step": 120580, "epoch": 2870} {"train_loss": -6.556211278552101, "global_step": 120581, "epoch": 2870, "val_loss": 67964.2421875} {"train_loss": -6.565338611602783, "global_step": 120582, "epoch": 2871} {"train_loss": -6.561790466308594, "global_step": 120583, "epoch": 2871} {"train_loss": -6.526660442352295, "global_step": 120584, "epoch": 2871} {"train_loss": -6.529516220092773, "global_step": 120585, "epoch": 2871} {"train_loss": -6.5111517906188965, "global_step": 120586, "epoch": 2871} {"train_loss": -6.607295036315918, "global_step": 120587, "epoch": 2871} {"train_loss": -6.57553768157959, "global_step": 120588, "epoch": 2871} {"train_loss": -6.627545356750488, "global_step": 120589, "epoch": 2871} {"train_loss": -6.636661529541016, "global_step": 120590, "epoch": 2871} {"train_loss": -6.688043594360352, "global_step": 120591, "epoch": 2871} {"train_loss": -6.528826713562012, "global_step": 120592, "epoch": 2871} {"train_loss": -6.504166126251221, "global_step": 120593, "epoch": 2871} {"train_loss": -6.614772796630859, "global_step": 120594, "epoch": 2871} {"train_loss": -6.501495838165283, "global_step": 120595, "epoch": 2871} {"train_loss": -6.5474934577941895, "global_step": 120596, "epoch": 2871} {"train_loss": -6.602569580078125, "global_step": 120597, "epoch": 2871} {"train_loss": -6.424515724182129, "global_step": 120598, "epoch": 2871} {"train_loss": -6.539630889892578, "global_step": 120599, "epoch": 2871} {"train_loss": -6.572888374328613, "global_step": 120600, "epoch": 2871} {"train_loss": -6.577932834625244, "global_step": 120601, "epoch": 2871} {"train_loss": -6.592732906341553, "global_step": 120602, "epoch": 2871} {"train_loss": -6.572453498840332, "global_step": 120603, "epoch": 2871} {"train_loss": -6.611351013183594, "global_step": 120604, "epoch": 2871} {"train_loss": -6.493048667907715, "global_step": 120605, "epoch": 2871} {"train_loss": -6.600392818450928, "global_step": 120606, "epoch": 2871} {"train_loss": -6.556829452514648, "global_step": 120607, "epoch": 2871} {"train_loss": -6.468010902404785, "global_step": 120608, "epoch": 2871} {"train_loss": -6.504355430603027, "global_step": 120609, "epoch": 2871} {"train_loss": -6.498529434204102, "global_step": 120610, "epoch": 2871} {"train_loss": -6.487677574157715, "global_step": 120611, "epoch": 2871} {"train_loss": -6.493194103240967, "global_step": 120612, "epoch": 2871} {"train_loss": -6.319963455200195, "global_step": 120613, "epoch": 2871} {"train_loss": -6.464707374572754, "global_step": 120614, "epoch": 2871} {"train_loss": -6.426402568817139, "global_step": 120615, "epoch": 2871} {"train_loss": -6.486034393310547, "global_step": 120616, "epoch": 2871} {"train_loss": -6.539448261260986, "global_step": 120617, "epoch": 2871} {"train_loss": -6.448750019073486, "global_step": 120618, "epoch": 2871} {"train_loss": -6.5224223136901855, "global_step": 120619, "epoch": 2871} {"train_loss": -6.454491138458252, "global_step": 120620, "epoch": 2871} {"train_loss": -6.410883903503418, "global_step": 120621, "epoch": 2871} {"train_loss": -6.5395917892456055, "global_step": 120622, "epoch": 2871} {"train_loss": -6.5277314867292136, "global_step": 120623, "epoch": 2871, "val_loss": 67890.7578125} {"train_loss": -6.5263166427612305, "global_step": 120624, "epoch": 2872} {"train_loss": -6.516047477722168, "global_step": 120625, "epoch": 2872} {"train_loss": -6.563112735748291, "global_step": 120626, "epoch": 2872} {"train_loss": -6.52754545211792, "global_step": 120627, "epoch": 2872} {"train_loss": -6.535625457763672, "global_step": 120628, "epoch": 2872} {"train_loss": -6.538600444793701, "global_step": 120629, "epoch": 2872} {"train_loss": -6.533319473266602, "global_step": 120630, "epoch": 2872} {"train_loss": -6.531947135925293, "global_step": 120631, "epoch": 2872} {"train_loss": -6.631237983703613, "global_step": 120632, "epoch": 2872} {"train_loss": -6.697653770446777, "global_step": 120633, "epoch": 2872} {"train_loss": -6.594681262969971, "global_step": 120634, "epoch": 2872} {"train_loss": -6.546255111694336, "global_step": 120635, "epoch": 2872} {"train_loss": -6.613803863525391, "global_step": 120636, "epoch": 2872} {"train_loss": -6.476747512817383, "global_step": 120637, "epoch": 2872} {"train_loss": -6.515610694885254, "global_step": 120638, "epoch": 2872} {"train_loss": -6.5187788009643555, "global_step": 120639, "epoch": 2872} {"train_loss": -6.613116264343262, "global_step": 120640, "epoch": 2872} {"train_loss": -6.612748146057129, "global_step": 120641, "epoch": 2872} {"train_loss": -6.590090751647949, "global_step": 120642, "epoch": 2872} {"train_loss": -6.4958815574646, "global_step": 120643, "epoch": 2872} {"train_loss": -6.615033149719238, "global_step": 120644, "epoch": 2872} {"train_loss": -6.496673583984375, "global_step": 120645, "epoch": 2872} {"train_loss": -6.456563472747803, "global_step": 120646, "epoch": 2872} {"train_loss": -6.522831916809082, "global_step": 120647, "epoch": 2872} {"train_loss": -6.458681106567383, "global_step": 120648, "epoch": 2872} {"train_loss": -6.5139994621276855, "global_step": 120649, "epoch": 2872} {"train_loss": -6.577810764312744, "global_step": 120650, "epoch": 2872} {"train_loss": -6.499650001525879, "global_step": 120651, "epoch": 2872} {"train_loss": -6.410555839538574, "global_step": 120652, "epoch": 2872} {"train_loss": -6.420814037322998, "global_step": 120653, "epoch": 2872} {"train_loss": -6.446532249450684, "global_step": 120654, "epoch": 2872} {"train_loss": -6.543704032897949, "global_step": 120655, "epoch": 2872} {"train_loss": -6.414879322052002, "global_step": 120656, "epoch": 2872} {"train_loss": -6.522929668426514, "global_step": 120657, "epoch": 2872} {"train_loss": -6.441924095153809, "global_step": 120658, "epoch": 2872} {"train_loss": -6.494309425354004, "global_step": 120659, "epoch": 2872} {"train_loss": -6.5241498947143555, "global_step": 120660, "epoch": 2872} {"train_loss": -6.4665703773498535, "global_step": 120661, "epoch": 2872} {"train_loss": -6.525976181030273, "global_step": 120662, "epoch": 2872} {"train_loss": -6.6247968673706055, "global_step": 120663, "epoch": 2872} {"train_loss": -6.389458179473877, "global_step": 120664, "epoch": 2872} {"train_loss": -6.524642478852045, "global_step": 120665, "epoch": 2872, "val_loss": 68010.09375} {"train_loss": -6.543917179107666, "global_step": 120666, "epoch": 2873} {"train_loss": -6.562520980834961, "global_step": 120667, "epoch": 2873} {"train_loss": -6.417576313018799, "global_step": 120668, "epoch": 2873} {"train_loss": -6.577237606048584, "global_step": 120669, "epoch": 2873} {"train_loss": -6.489052772521973, "global_step": 120670, "epoch": 2873} {"train_loss": -6.485479354858398, "global_step": 120671, "epoch": 2873} {"train_loss": -6.57924222946167, "global_step": 120672, "epoch": 2873} {"train_loss": -6.50742244720459, "global_step": 120673, "epoch": 2873} {"train_loss": -6.579400062561035, "global_step": 120674, "epoch": 2873} {"train_loss": -6.617664337158203, "global_step": 120675, "epoch": 2873} {"train_loss": -6.51692008972168, "global_step": 120676, "epoch": 2873} {"train_loss": -6.533718585968018, "global_step": 120677, "epoch": 2873} {"train_loss": -6.565602779388428, "global_step": 120678, "epoch": 2873} {"train_loss": -6.541646480560303, "global_step": 120679, "epoch": 2873} {"train_loss": -6.446414470672607, "global_step": 120680, "epoch": 2873} {"train_loss": -6.626053810119629, "global_step": 120681, "epoch": 2873} {"train_loss": -6.521832466125488, "global_step": 120682, "epoch": 2873} {"train_loss": -6.587863922119141, "global_step": 120683, "epoch": 2873} {"train_loss": -6.564148902893066, "global_step": 120684, "epoch": 2873} {"train_loss": -6.602609157562256, "global_step": 120685, "epoch": 2873} {"train_loss": -6.5561604499816895, "global_step": 120686, "epoch": 2873} {"train_loss": -6.499418258666992, "global_step": 120687, "epoch": 2873} {"train_loss": -6.467379570007324, "global_step": 120688, "epoch": 2873} {"train_loss": -6.639369487762451, "global_step": 120689, "epoch": 2873} {"train_loss": -6.611067771911621, "global_step": 120690, "epoch": 2873} {"train_loss": -6.692837238311768, "global_step": 120691, "epoch": 2873} {"train_loss": -6.51371431350708, "global_step": 120692, "epoch": 2873} {"train_loss": -6.486485004425049, "global_step": 120693, "epoch": 2873} {"train_loss": -6.545538425445557, "global_step": 120694, "epoch": 2873} {"train_loss": -6.397735595703125, "global_step": 120695, "epoch": 2873} {"train_loss": -6.55174446105957, "global_step": 120696, "epoch": 2873} {"train_loss": -6.479073524475098, "global_step": 120697, "epoch": 2873} {"train_loss": -6.561140060424805, "global_step": 120698, "epoch": 2873} {"train_loss": -6.578352928161621, "global_step": 120699, "epoch": 2873} {"train_loss": -6.6190996170043945, "global_step": 120700, "epoch": 2873} {"train_loss": -6.680792808532715, "global_step": 120701, "epoch": 2873} {"train_loss": -6.649068355560303, "global_step": 120702, "epoch": 2873} {"train_loss": -6.517919540405273, "global_step": 120703, "epoch": 2873} {"train_loss": -6.582670211791992, "global_step": 120704, "epoch": 2873} {"train_loss": -6.451696395874023, "global_step": 120705, "epoch": 2873} {"train_loss": -6.536046504974365, "global_step": 120706, "epoch": 2873} {"train_loss": -6.544970126379104, "global_step": 120707, "epoch": 2873, "val_loss": 68020.7578125} {"train_loss": -6.524956703186035, "global_step": 120708, "epoch": 2874} {"train_loss": -6.723047733306885, "global_step": 120709, "epoch": 2874} {"train_loss": -6.471764087677002, "global_step": 120710, "epoch": 2874} {"train_loss": -6.559466361999512, "global_step": 120711, "epoch": 2874} {"train_loss": -6.615230560302734, "global_step": 120712, "epoch": 2874} {"train_loss": -6.505444526672363, "global_step": 120713, "epoch": 2874} {"train_loss": -6.523991584777832, "global_step": 120714, "epoch": 2874} {"train_loss": -6.609914779663086, "global_step": 120715, "epoch": 2874} {"train_loss": -6.4849958419799805, "global_step": 120716, "epoch": 2874} {"train_loss": -6.473275184631348, "global_step": 120717, "epoch": 2874} {"train_loss": -6.494368553161621, "global_step": 120718, "epoch": 2874} {"train_loss": -6.4981489181518555, "global_step": 120719, "epoch": 2874} {"train_loss": -6.623773574829102, "global_step": 120720, "epoch": 2874} {"train_loss": -6.4378557205200195, "global_step": 120721, "epoch": 2874} {"train_loss": -6.454133033752441, "global_step": 120722, "epoch": 2874} {"train_loss": -6.604252815246582, "global_step": 120723, "epoch": 2874} {"train_loss": -6.548357963562012, "global_step": 120724, "epoch": 2874} {"train_loss": -6.556352138519287, "global_step": 120725, "epoch": 2874} {"train_loss": -6.497873306274414, "global_step": 120726, "epoch": 2874} {"train_loss": -6.582131385803223, "global_step": 120727, "epoch": 2874} {"train_loss": -6.516362190246582, "global_step": 120728, "epoch": 2874} {"train_loss": -6.532732963562012, "global_step": 120729, "epoch": 2874} {"train_loss": -6.5805439949035645, "global_step": 120730, "epoch": 2874} {"train_loss": -6.592172622680664, "global_step": 120731, "epoch": 2874} {"train_loss": -6.572890758514404, "global_step": 120732, "epoch": 2874} {"train_loss": -6.645999908447266, "global_step": 120733, "epoch": 2874} {"train_loss": -6.693708419799805, "global_step": 120734, "epoch": 2874} {"train_loss": -6.517864227294922, "global_step": 120735, "epoch": 2874} {"train_loss": -6.523462772369385, "global_step": 120736, "epoch": 2874} {"train_loss": -6.6139678955078125, "global_step": 120737, "epoch": 2874} {"train_loss": -6.593029022216797, "global_step": 120738, "epoch": 2874} {"train_loss": -6.508540153503418, "global_step": 120739, "epoch": 2874} {"train_loss": -6.685908317565918, "global_step": 120740, "epoch": 2874} {"train_loss": -6.587273120880127, "global_step": 120741, "epoch": 2874} {"train_loss": -6.595489501953125, "global_step": 120742, "epoch": 2874} {"train_loss": -6.526223659515381, "global_step": 120743, "epoch": 2874} {"train_loss": -6.6265130043029785, "global_step": 120744, "epoch": 2874} {"train_loss": -6.511863708496094, "global_step": 120745, "epoch": 2874} {"train_loss": -6.495212078094482, "global_step": 120746, "epoch": 2874} {"train_loss": -6.692363739013672, "global_step": 120747, "epoch": 2874} {"train_loss": -6.578017234802246, "global_step": 120748, "epoch": 2874} {"train_loss": -6.56132029351734, "global_step": 120749, "epoch": 2874, "val_loss": 67911.4609375} {"train_loss": -6.610051155090332, "global_step": 120750, "epoch": 2875} {"train_loss": -6.522253036499023, "global_step": 120751, "epoch": 2875} {"train_loss": -6.782552242279053, "global_step": 120752, "epoch": 2875} {"train_loss": -6.761429309844971, "global_step": 120753, "epoch": 2875} {"train_loss": -6.607903480529785, "global_step": 120754, "epoch": 2875} {"train_loss": -6.51511287689209, "global_step": 120755, "epoch": 2875} {"train_loss": -6.596001625061035, "global_step": 120756, "epoch": 2875} {"train_loss": -6.630241394042969, "global_step": 120757, "epoch": 2875} {"train_loss": -6.704594135284424, "global_step": 120758, "epoch": 2875} {"train_loss": -6.689847946166992, "global_step": 120759, "epoch": 2875} {"train_loss": -6.564497947692871, "global_step": 120760, "epoch": 2875} {"train_loss": -6.60410213470459, "global_step": 120761, "epoch": 2875} {"train_loss": -6.666755199432373, "global_step": 120762, "epoch": 2875} {"train_loss": -6.659409523010254, "global_step": 120763, "epoch": 2875} {"train_loss": -6.521611213684082, "global_step": 120764, "epoch": 2875} {"train_loss": -6.638912200927734, "global_step": 120765, "epoch": 2875} {"train_loss": -6.596668243408203, "global_step": 120766, "epoch": 2875} {"train_loss": -6.614514350891113, "global_step": 120767, "epoch": 2875} {"train_loss": -6.504283905029297, "global_step": 120768, "epoch": 2875} {"train_loss": -6.583279609680176, "global_step": 120769, "epoch": 2875} {"train_loss": -6.5364580154418945, "global_step": 120770, "epoch": 2875} {"train_loss": -6.563052177429199, "global_step": 120771, "epoch": 2875} {"train_loss": -6.564854145050049, "global_step": 120772, "epoch": 2875} {"train_loss": -6.573428153991699, "global_step": 120773, "epoch": 2875} {"train_loss": -6.522000312805176, "global_step": 120774, "epoch": 2875} {"train_loss": -6.583737373352051, "global_step": 120775, "epoch": 2875} {"train_loss": -6.524618625640869, "global_step": 120776, "epoch": 2875} {"train_loss": -6.507871627807617, "global_step": 120777, "epoch": 2875} {"train_loss": -6.515230178833008, "global_step": 120778, "epoch": 2875} {"train_loss": -6.631555080413818, "global_step": 120779, "epoch": 2875} {"train_loss": -6.494668006896973, "global_step": 120780, "epoch": 2875} {"train_loss": -6.641430854797363, "global_step": 120781, "epoch": 2875} {"train_loss": -6.401640892028809, "global_step": 120782, "epoch": 2875} {"train_loss": -6.446147918701172, "global_step": 120783, "epoch": 2875} {"train_loss": -6.474826812744141, "global_step": 120784, "epoch": 2875} {"train_loss": -6.48098087310791, "global_step": 120785, "epoch": 2875} {"train_loss": -6.487228870391846, "global_step": 120786, "epoch": 2875} {"train_loss": -6.561039924621582, "global_step": 120787, "epoch": 2875} {"train_loss": -6.469834804534912, "global_step": 120788, "epoch": 2875} {"train_loss": -6.553096294403076, "global_step": 120789, "epoch": 2875} {"train_loss": -6.442479133605957, "global_step": 120790, "epoch": 2875} {"train_loss": -6.56653660819644, "global_step": 120791, "epoch": 2875, "val_loss": 67996.9375} {"train_loss": -6.541811943054199, "global_step": 120792, "epoch": 2876} {"train_loss": -6.416706562042236, "global_step": 120793, "epoch": 2876} {"train_loss": -6.612252235412598, "global_step": 120794, "epoch": 2876} {"train_loss": -6.440873146057129, "global_step": 120795, "epoch": 2876} {"train_loss": -6.525024890899658, "global_step": 120796, "epoch": 2876} {"train_loss": -6.521927833557129, "global_step": 120797, "epoch": 2876} {"train_loss": -6.530296325683594, "global_step": 120798, "epoch": 2876} {"train_loss": -6.574603080749512, "global_step": 120799, "epoch": 2876} {"train_loss": -6.5309343338012695, "global_step": 120800, "epoch": 2876} {"train_loss": -6.426023006439209, "global_step": 120801, "epoch": 2876} {"train_loss": -6.599506378173828, "global_step": 120802, "epoch": 2876} {"train_loss": -6.363131523132324, "global_step": 120803, "epoch": 2876} {"train_loss": -6.520021915435791, "global_step": 120804, "epoch": 2876} {"train_loss": -6.488795280456543, "global_step": 120805, "epoch": 2876} {"train_loss": -6.577976226806641, "global_step": 120806, "epoch": 2876} {"train_loss": -6.58415412902832, "global_step": 120807, "epoch": 2876} {"train_loss": -6.422933578491211, "global_step": 120808, "epoch": 2876} {"train_loss": -6.476370334625244, "global_step": 120809, "epoch": 2876} {"train_loss": -6.4418487548828125, "global_step": 120810, "epoch": 2876} {"train_loss": -6.5935282707214355, "global_step": 120811, "epoch": 2876} {"train_loss": -6.56801700592041, "global_step": 120812, "epoch": 2876} {"train_loss": -6.532438278198242, "global_step": 120813, "epoch": 2876} {"train_loss": -6.573142051696777, "global_step": 120814, "epoch": 2876} {"train_loss": -6.594945907592773, "global_step": 120815, "epoch": 2876} {"train_loss": -6.499300479888916, "global_step": 120816, "epoch": 2876} {"train_loss": -6.574934005737305, "global_step": 120817, "epoch": 2876} {"train_loss": -6.631519794464111, "global_step": 120818, "epoch": 2876} {"train_loss": -6.503273010253906, "global_step": 120819, "epoch": 2876} {"train_loss": -6.543364524841309, "global_step": 120820, "epoch": 2876} {"train_loss": -6.488140106201172, "global_step": 120821, "epoch": 2876} {"train_loss": -6.422175407409668, "global_step": 120822, "epoch": 2876} {"train_loss": -6.559075832366943, "global_step": 120823, "epoch": 2876} {"train_loss": -6.460378170013428, "global_step": 120824, "epoch": 2876} {"train_loss": -6.503011703491211, "global_step": 120825, "epoch": 2876} {"train_loss": -6.561100482940674, "global_step": 120826, "epoch": 2876} {"train_loss": -6.49864387512207, "global_step": 120827, "epoch": 2876} {"train_loss": -6.568594932556152, "global_step": 120828, "epoch": 2876} {"train_loss": -6.455560684204102, "global_step": 120829, "epoch": 2876} {"train_loss": -6.575829029083252, "global_step": 120830, "epoch": 2876} {"train_loss": -6.498928070068359, "global_step": 120831, "epoch": 2876} {"train_loss": -6.534784317016602, "global_step": 120832, "epoch": 2876} {"train_loss": -6.522392704373314, "global_step": 120833, "epoch": 2876, "val_loss": 67764.4609375} {"train_loss": -6.352200984954834, "global_step": 120834, "epoch": 2877} {"train_loss": -6.614537239074707, "global_step": 120835, "epoch": 2877} {"train_loss": -6.557912826538086, "global_step": 120836, "epoch": 2877} {"train_loss": -6.618555545806885, "global_step": 120837, "epoch": 2877} {"train_loss": -6.553643226623535, "global_step": 120838, "epoch": 2877} {"train_loss": -6.571797847747803, "global_step": 120839, "epoch": 2877} {"train_loss": -6.61955451965332, "global_step": 120840, "epoch": 2877} {"train_loss": -6.59995174407959, "global_step": 120841, "epoch": 2877} {"train_loss": -6.522892951965332, "global_step": 120842, "epoch": 2877} {"train_loss": -6.572762489318848, "global_step": 120843, "epoch": 2877} {"train_loss": -6.6233625411987305, "global_step": 120844, "epoch": 2877} {"train_loss": -6.60943078994751, "global_step": 120845, "epoch": 2877} {"train_loss": -6.628482818603516, "global_step": 120846, "epoch": 2877} {"train_loss": -6.444609642028809, "global_step": 120847, "epoch": 2877} {"train_loss": -6.63171911239624, "global_step": 120848, "epoch": 2877} {"train_loss": -6.583312034606934, "global_step": 120849, "epoch": 2877} {"train_loss": -6.537548065185547, "global_step": 120850, "epoch": 2877} {"train_loss": -6.552381992340088, "global_step": 120851, "epoch": 2877} {"train_loss": -6.503669738769531, "global_step": 120852, "epoch": 2877} {"train_loss": -6.574751853942871, "global_step": 120853, "epoch": 2877} {"train_loss": -6.562520980834961, "global_step": 120854, "epoch": 2877} {"train_loss": -6.598948001861572, "global_step": 120855, "epoch": 2877} {"train_loss": -6.586690425872803, "global_step": 120856, "epoch": 2877} {"train_loss": -6.4803853034973145, "global_step": 120857, "epoch": 2877} {"train_loss": -6.582793712615967, "global_step": 120858, "epoch": 2877} {"train_loss": -6.589370250701904, "global_step": 120859, "epoch": 2877} {"train_loss": -6.5223493576049805, "global_step": 120860, "epoch": 2877} {"train_loss": -6.587721824645996, "global_step": 120861, "epoch": 2877} {"train_loss": -6.566561698913574, "global_step": 120862, "epoch": 2877} {"train_loss": -6.575702667236328, "global_step": 120863, "epoch": 2877} {"train_loss": -6.59842586517334, "global_step": 120864, "epoch": 2877} {"train_loss": -6.47683048248291, "global_step": 120865, "epoch": 2877} {"train_loss": -6.537352561950684, "global_step": 120866, "epoch": 2877} {"train_loss": -6.629022598266602, "global_step": 120867, "epoch": 2877} {"train_loss": -6.5246734619140625, "global_step": 120868, "epoch": 2877} {"train_loss": -6.55324649810791, "global_step": 120869, "epoch": 2877} {"train_loss": -6.364480018615723, "global_step": 120870, "epoch": 2877} {"train_loss": -6.373831748962402, "global_step": 120871, "epoch": 2877} {"train_loss": -6.403426170349121, "global_step": 120872, "epoch": 2877} {"train_loss": -6.310391426086426, "global_step": 120873, "epoch": 2877} {"train_loss": -6.587956428527832, "global_step": 120874, "epoch": 2877} {"train_loss": -6.541923795427595, "global_step": 120875, "epoch": 2877, "val_loss": 68225.1875} {"train_loss": -6.326306343078613, "global_step": 120876, "epoch": 2878} {"train_loss": -6.521455764770508, "global_step": 120877, "epoch": 2878} {"train_loss": -6.344182014465332, "global_step": 120878, "epoch": 2878} {"train_loss": -6.449334144592285, "global_step": 120879, "epoch": 2878} {"train_loss": -6.332033634185791, "global_step": 120880, "epoch": 2878} {"train_loss": -6.4344024658203125, "global_step": 120881, "epoch": 2878} {"train_loss": -6.473841667175293, "global_step": 120882, "epoch": 2878} {"train_loss": -6.217641830444336, "global_step": 120883, "epoch": 2878} {"train_loss": -6.512342929840088, "global_step": 120884, "epoch": 2878} {"train_loss": -6.313981056213379, "global_step": 120885, "epoch": 2878} {"train_loss": -6.462850570678711, "global_step": 120886, "epoch": 2878} {"train_loss": -6.424870491027832, "global_step": 120887, "epoch": 2878} {"train_loss": -6.536179542541504, "global_step": 120888, "epoch": 2878} {"train_loss": -6.3391265869140625, "global_step": 120889, "epoch": 2878} {"train_loss": -6.480558395385742, "global_step": 120890, "epoch": 2878} {"train_loss": -6.259363174438477, "global_step": 120891, "epoch": 2878} {"train_loss": -6.422072410583496, "global_step": 120892, "epoch": 2878} {"train_loss": -6.461597442626953, "global_step": 120893, "epoch": 2878} {"train_loss": -6.402963161468506, "global_step": 120894, "epoch": 2878} {"train_loss": -6.447601318359375, "global_step": 120895, "epoch": 2878} {"train_loss": -6.350190162658691, "global_step": 120896, "epoch": 2878} {"train_loss": -6.4619855880737305, "global_step": 120897, "epoch": 2878} {"train_loss": -6.53187370300293, "global_step": 120898, "epoch": 2878} {"train_loss": -6.422159194946289, "global_step": 120899, "epoch": 2878} {"train_loss": -6.567866325378418, "global_step": 120900, "epoch": 2878} {"train_loss": -6.485491752624512, "global_step": 120901, "epoch": 2878} {"train_loss": -6.456642150878906, "global_step": 120902, "epoch": 2878} {"train_loss": -6.438462734222412, "global_step": 120903, "epoch": 2878} {"train_loss": -6.481404781341553, "global_step": 120904, "epoch": 2878} {"train_loss": -6.50070333480835, "global_step": 120905, "epoch": 2878} {"train_loss": -6.397168159484863, "global_step": 120906, "epoch": 2878} {"train_loss": -6.553659915924072, "global_step": 120907, "epoch": 2878} {"train_loss": -6.54442834854126, "global_step": 120908, "epoch": 2878} {"train_loss": -6.394106864929199, "global_step": 120909, "epoch": 2878} {"train_loss": -6.517004489898682, "global_step": 120910, "epoch": 2878} {"train_loss": -6.623727321624756, "global_step": 120911, "epoch": 2878} {"train_loss": -6.702592372894287, "global_step": 120912, "epoch": 2878} {"train_loss": -6.520718097686768, "global_step": 120913, "epoch": 2878} {"train_loss": -6.55876350402832, "global_step": 120914, "epoch": 2878} {"train_loss": -6.622223854064941, "global_step": 120915, "epoch": 2878} {"train_loss": -6.564155101776123, "global_step": 120916, "epoch": 2878} {"train_loss": -6.462496303376698, "global_step": 120917, "epoch": 2878, "val_loss": 67983.90625} {"train_loss": -6.582298755645752, "global_step": 120918, "epoch": 2879} {"train_loss": -6.670419216156006, "global_step": 120919, "epoch": 2879} {"train_loss": -6.607715129852295, "global_step": 120920, "epoch": 2879} {"train_loss": -6.506298065185547, "global_step": 120921, "epoch": 2879} {"train_loss": -6.457491397857666, "global_step": 120922, "epoch": 2879} {"train_loss": -6.43709659576416, "global_step": 120923, "epoch": 2879} {"train_loss": -6.4507317543029785, "global_step": 120924, "epoch": 2879} {"train_loss": -6.642852783203125, "global_step": 120925, "epoch": 2879} {"train_loss": -6.580862998962402, "global_step": 120926, "epoch": 2879} {"train_loss": -6.53742790222168, "global_step": 120927, "epoch": 2879} {"train_loss": -6.609468936920166, "global_step": 120928, "epoch": 2879} {"train_loss": -6.5806708335876465, "global_step": 120929, "epoch": 2879} {"train_loss": -6.59903621673584, "global_step": 120930, "epoch": 2879} {"train_loss": -6.457305908203125, "global_step": 120931, "epoch": 2879} {"train_loss": -6.528604507446289, "global_step": 120932, "epoch": 2879} {"train_loss": -6.566944122314453, "global_step": 120933, "epoch": 2879} {"train_loss": -6.485476970672607, "global_step": 120934, "epoch": 2879} {"train_loss": -6.603750228881836, "global_step": 120935, "epoch": 2879} {"train_loss": -6.466338157653809, "global_step": 120936, "epoch": 2879} {"train_loss": -6.498394012451172, "global_step": 120937, "epoch": 2879} {"train_loss": -6.613508224487305, "global_step": 120938, "epoch": 2879} {"train_loss": -6.669759273529053, "global_step": 120939, "epoch": 2879} {"train_loss": -6.499079704284668, "global_step": 120940, "epoch": 2879} {"train_loss": -6.709406852722168, "global_step": 120941, "epoch": 2879} {"train_loss": -6.540304660797119, "global_step": 120942, "epoch": 2879} {"train_loss": -6.565301895141602, "global_step": 120943, "epoch": 2879} {"train_loss": -6.62532901763916, "global_step": 120944, "epoch": 2879} {"train_loss": -6.514273643493652, "global_step": 120945, "epoch": 2879} {"train_loss": -6.662364959716797, "global_step": 120946, "epoch": 2879} {"train_loss": -6.5960588455200195, "global_step": 120947, "epoch": 2879} {"train_loss": -6.570291996002197, "global_step": 120948, "epoch": 2879} {"train_loss": -6.600493907928467, "global_step": 120949, "epoch": 2879} {"train_loss": -6.524568557739258, "global_step": 120950, "epoch": 2879} {"train_loss": -6.382540702819824, "global_step": 120951, "epoch": 2879} {"train_loss": -6.5170183181762695, "global_step": 120952, "epoch": 2879} {"train_loss": -6.312069892883301, "global_step": 120953, "epoch": 2879} {"train_loss": -6.576232433319092, "global_step": 120954, "epoch": 2879} {"train_loss": -6.422133445739746, "global_step": 120955, "epoch": 2879} {"train_loss": -6.429026126861572, "global_step": 120956, "epoch": 2879} {"train_loss": -6.405861854553223, "global_step": 120957, "epoch": 2879} {"train_loss": -6.441526412963867, "global_step": 120958, "epoch": 2879} {"train_loss": -6.538311379296439, "global_step": 120959, "epoch": 2879, "val_loss": 68061.7890625} {"train_loss": -6.490041732788086, "global_step": 120960, "epoch": 2880} {"train_loss": -6.6014580726623535, "global_step": 120961, "epoch": 2880} {"train_loss": -6.51479434967041, "global_step": 120962, "epoch": 2880} {"train_loss": -6.577776908874512, "global_step": 120963, "epoch": 2880} {"train_loss": -6.501944541931152, "global_step": 120964, "epoch": 2880} {"train_loss": -6.468418121337891, "global_step": 120965, "epoch": 2880} {"train_loss": -6.487643241882324, "global_step": 120966, "epoch": 2880} {"train_loss": -6.517675399780273, "global_step": 120967, "epoch": 2880} {"train_loss": -6.495660781860352, "global_step": 120968, "epoch": 2880} {"train_loss": -6.577695846557617, "global_step": 120969, "epoch": 2880} {"train_loss": -6.539120674133301, "global_step": 120970, "epoch": 2880} {"train_loss": -6.570736885070801, "global_step": 120971, "epoch": 2880} {"train_loss": -6.533257484436035, "global_step": 120972, "epoch": 2880} {"train_loss": -6.458367347717285, "global_step": 120973, "epoch": 2880} {"train_loss": -6.609342575073242, "global_step": 120974, "epoch": 2880} {"train_loss": -6.45097541809082, "global_step": 120975, "epoch": 2880} {"train_loss": -6.70919132232666, "global_step": 120976, "epoch": 2880} {"train_loss": -6.635743141174316, "global_step": 120977, "epoch": 2880} {"train_loss": -6.673894882202148, "global_step": 120978, "epoch": 2880} {"train_loss": -6.602686882019043, "global_step": 120979, "epoch": 2880} {"train_loss": -6.573307037353516, "global_step": 120980, "epoch": 2880} {"train_loss": -6.598539352416992, "global_step": 120981, "epoch": 2880} {"train_loss": -6.583646774291992, "global_step": 120982, "epoch": 2880} {"train_loss": -6.517482757568359, "global_step": 120983, "epoch": 2880} {"train_loss": -6.624967575073242, "global_step": 120984, "epoch": 2880} {"train_loss": -6.50295352935791, "global_step": 120985, "epoch": 2880} {"train_loss": -6.562718391418457, "global_step": 120986, "epoch": 2880} {"train_loss": -6.540829658508301, "global_step": 120987, "epoch": 2880} {"train_loss": -6.546205520629883, "global_step": 120988, "epoch": 2880} {"train_loss": -6.471164703369141, "global_step": 120989, "epoch": 2880} {"train_loss": -6.634354591369629, "global_step": 120990, "epoch": 2880} {"train_loss": -6.547518253326416, "global_step": 120991, "epoch": 2880} {"train_loss": -6.567218780517578, "global_step": 120992, "epoch": 2880} {"train_loss": -6.500326156616211, "global_step": 120993, "epoch": 2880} {"train_loss": -6.661477565765381, "global_step": 120994, "epoch": 2880} {"train_loss": -6.482643127441406, "global_step": 120995, "epoch": 2880} {"train_loss": -6.585463047027588, "global_step": 120996, "epoch": 2880} {"train_loss": -6.61508846282959, "global_step": 120997, "epoch": 2880} {"train_loss": -6.556585788726807, "global_step": 120998, "epoch": 2880} {"train_loss": -6.627376556396484, "global_step": 120999, "epoch": 2880} {"train_loss": -6.608008861541748, "global_step": 121000, "epoch": 2880} {"train_loss": -6.563564243770781, "global_step": 121001, "epoch": 2880, "val_loss": 68049.8671875} {"train_loss": -6.575051307678223, "global_step": 121002, "epoch": 2881} {"train_loss": -6.547821044921875, "global_step": 121003, "epoch": 2881} {"train_loss": -6.547281742095947, "global_step": 121004, "epoch": 2881} {"train_loss": -6.381857395172119, "global_step": 121005, "epoch": 2881} {"train_loss": -6.57527494430542, "global_step": 121006, "epoch": 2881} {"train_loss": -6.610867977142334, "global_step": 121007, "epoch": 2881} {"train_loss": -6.426695346832275, "global_step": 121008, "epoch": 2881} {"train_loss": -6.49903678894043, "global_step": 121009, "epoch": 2881} {"train_loss": -6.632521629333496, "global_step": 121010, "epoch": 2881} {"train_loss": -6.474720478057861, "global_step": 121011, "epoch": 2881} {"train_loss": -6.604374885559082, "global_step": 121012, "epoch": 2881} {"train_loss": -6.649886608123779, "global_step": 121013, "epoch": 2881} {"train_loss": -6.678256034851074, "global_step": 121014, "epoch": 2881} {"train_loss": -6.593594551086426, "global_step": 121015, "epoch": 2881} {"train_loss": -6.6690216064453125, "global_step": 121016, "epoch": 2881} {"train_loss": -6.578383445739746, "global_step": 121017, "epoch": 2881} {"train_loss": -6.503820896148682, "global_step": 121018, "epoch": 2881} {"train_loss": -6.480156898498535, "global_step": 121019, "epoch": 2881} {"train_loss": -6.659099578857422, "global_step": 121020, "epoch": 2881} {"train_loss": -6.543241500854492, "global_step": 121021, "epoch": 2881} {"train_loss": -6.595026016235352, "global_step": 121022, "epoch": 2881} {"train_loss": -6.527680397033691, "global_step": 121023, "epoch": 2881} {"train_loss": -6.479442596435547, "global_step": 121024, "epoch": 2881} {"train_loss": -6.585844039916992, "global_step": 121025, "epoch": 2881} {"train_loss": -6.622985363006592, "global_step": 121026, "epoch": 2881} {"train_loss": -6.5399169921875, "global_step": 121027, "epoch": 2881} {"train_loss": -6.551932334899902, "global_step": 121028, "epoch": 2881} {"train_loss": -6.55665397644043, "global_step": 121029, "epoch": 2881} {"train_loss": -6.550536155700684, "global_step": 121030, "epoch": 2881} {"train_loss": -6.479649543762207, "global_step": 121031, "epoch": 2881} {"train_loss": -6.407865047454834, "global_step": 121032, "epoch": 2881} {"train_loss": -6.549170017242432, "global_step": 121033, "epoch": 2881} {"train_loss": -6.609169006347656, "global_step": 121034, "epoch": 2881} {"train_loss": -6.464790344238281, "global_step": 121035, "epoch": 2881} {"train_loss": -6.456171989440918, "global_step": 121036, "epoch": 2881} {"train_loss": -6.591131210327148, "global_step": 121037, "epoch": 2881} {"train_loss": -6.664968490600586, "global_step": 121038, "epoch": 2881} {"train_loss": -6.636876106262207, "global_step": 121039, "epoch": 2881} {"train_loss": -6.6239423751831055, "global_step": 121040, "epoch": 2881} {"train_loss": -6.453242301940918, "global_step": 121041, "epoch": 2881} {"train_loss": -6.581328868865967, "global_step": 121042, "epoch": 2881} {"train_loss": -6.5554613045283725, "global_step": 121043, "epoch": 2881, "val_loss": 68014.0078125} {"train_loss": -6.475499153137207, "global_step": 121044, "epoch": 2882} {"train_loss": -6.597501277923584, "global_step": 121045, "epoch": 2882} {"train_loss": -6.47994327545166, "global_step": 121046, "epoch": 2882} {"train_loss": -6.564288139343262, "global_step": 121047, "epoch": 2882} {"train_loss": -6.464916229248047, "global_step": 121048, "epoch": 2882} {"train_loss": -6.490986347198486, "global_step": 121049, "epoch": 2882} {"train_loss": -6.522827625274658, "global_step": 121050, "epoch": 2882} {"train_loss": -6.531730651855469, "global_step": 121051, "epoch": 2882} {"train_loss": -6.555016994476318, "global_step": 121052, "epoch": 2882} {"train_loss": -6.560635566711426, "global_step": 121053, "epoch": 2882} {"train_loss": -6.485795974731445, "global_step": 121054, "epoch": 2882} {"train_loss": -6.605836868286133, "global_step": 121055, "epoch": 2882} {"train_loss": -6.5705485343933105, "global_step": 121056, "epoch": 2882} {"train_loss": -6.629664421081543, "global_step": 121057, "epoch": 2882} {"train_loss": -6.512574195861816, "global_step": 121058, "epoch": 2882} {"train_loss": -6.640869617462158, "global_step": 121059, "epoch": 2882} {"train_loss": -6.428943634033203, "global_step": 121060, "epoch": 2882} {"train_loss": -6.469804286956787, "global_step": 121061, "epoch": 2882} {"train_loss": -6.566023826599121, "global_step": 121062, "epoch": 2882} {"train_loss": -6.649929046630859, "global_step": 121063, "epoch": 2882} {"train_loss": -6.5561137199401855, "global_step": 121064, "epoch": 2882} {"train_loss": -6.474716663360596, "global_step": 121065, "epoch": 2882} {"train_loss": -6.648059368133545, "global_step": 121066, "epoch": 2882} {"train_loss": -6.571024417877197, "global_step": 121067, "epoch": 2882} {"train_loss": -6.373463153839111, "global_step": 121068, "epoch": 2882} {"train_loss": -6.625707626342773, "global_step": 121069, "epoch": 2882} {"train_loss": -6.382132053375244, "global_step": 121070, "epoch": 2882} {"train_loss": -6.569399356842041, "global_step": 121071, "epoch": 2882} {"train_loss": -6.517040252685547, "global_step": 121072, "epoch": 2882} {"train_loss": -6.375444412231445, "global_step": 121073, "epoch": 2882} {"train_loss": -6.473734378814697, "global_step": 121074, "epoch": 2882} {"train_loss": -6.461233139038086, "global_step": 121075, "epoch": 2882} {"train_loss": -6.495373725891113, "global_step": 121076, "epoch": 2882} {"train_loss": -6.478590965270996, "global_step": 121077, "epoch": 2882} {"train_loss": -6.4791669845581055, "global_step": 121078, "epoch": 2882} {"train_loss": -6.4232635498046875, "global_step": 121079, "epoch": 2882} {"train_loss": -6.434776782989502, "global_step": 121080, "epoch": 2882} {"train_loss": -6.551456928253174, "global_step": 121081, "epoch": 2882} {"train_loss": -6.511386871337891, "global_step": 121082, "epoch": 2882} {"train_loss": -6.631894111633301, "global_step": 121083, "epoch": 2882} {"train_loss": -6.562854766845703, "global_step": 121084, "epoch": 2882} {"train_loss": -6.523060117449079, "global_step": 121085, "epoch": 2882, "val_loss": 68211.5390625} {"train_loss": -6.521235466003418, "global_step": 121086, "epoch": 2883} {"train_loss": -6.4853081703186035, "global_step": 121087, "epoch": 2883} {"train_loss": -6.459221839904785, "global_step": 121088, "epoch": 2883} {"train_loss": -6.595702171325684, "global_step": 121089, "epoch": 2883} {"train_loss": -6.537117004394531, "global_step": 121090, "epoch": 2883} {"train_loss": -6.543157577514648, "global_step": 121091, "epoch": 2883} {"train_loss": -6.597108840942383, "global_step": 121092, "epoch": 2883} {"train_loss": -6.4327521324157715, "global_step": 121093, "epoch": 2883} {"train_loss": -6.546138763427734, "global_step": 121094, "epoch": 2883} {"train_loss": -6.522526741027832, "global_step": 121095, "epoch": 2883} {"train_loss": -6.541106700897217, "global_step": 121096, "epoch": 2883} {"train_loss": -6.604189395904541, "global_step": 121097, "epoch": 2883} {"train_loss": -6.547490119934082, "global_step": 121098, "epoch": 2883} {"train_loss": -6.426194190979004, "global_step": 121099, "epoch": 2883} {"train_loss": -6.573694229125977, "global_step": 121100, "epoch": 2883} {"train_loss": -6.468875885009766, "global_step": 121101, "epoch": 2883} {"train_loss": -6.540639877319336, "global_step": 121102, "epoch": 2883} {"train_loss": -6.629365921020508, "global_step": 121103, "epoch": 2883} {"train_loss": -6.524470806121826, "global_step": 121104, "epoch": 2883} {"train_loss": -6.69429874420166, "global_step": 121105, "epoch": 2883} {"train_loss": -6.551619529724121, "global_step": 121106, "epoch": 2883} {"train_loss": -6.517294883728027, "global_step": 121107, "epoch": 2883} {"train_loss": -6.610141754150391, "global_step": 121108, "epoch": 2883} {"train_loss": -6.481217384338379, "global_step": 121109, "epoch": 2883} {"train_loss": -6.6608357429504395, "global_step": 121110, "epoch": 2883} {"train_loss": -6.6239118576049805, "global_step": 121111, "epoch": 2883} {"train_loss": -6.509818077087402, "global_step": 121112, "epoch": 2883} {"train_loss": -6.68040657043457, "global_step": 121113, "epoch": 2883} {"train_loss": -6.49202823638916, "global_step": 121114, "epoch": 2883} {"train_loss": -6.5958123207092285, "global_step": 121115, "epoch": 2883} {"train_loss": -6.550394058227539, "global_step": 121116, "epoch": 2883} {"train_loss": -6.420957088470459, "global_step": 121117, "epoch": 2883} {"train_loss": -6.551555633544922, "global_step": 121118, "epoch": 2883} {"train_loss": -6.440459728240967, "global_step": 121119, "epoch": 2883} {"train_loss": -6.458956241607666, "global_step": 121120, "epoch": 2883} {"train_loss": -6.512728691101074, "global_step": 121121, "epoch": 2883} {"train_loss": -6.4296417236328125, "global_step": 121122, "epoch": 2883} {"train_loss": -6.475120544433594, "global_step": 121123, "epoch": 2883} {"train_loss": -6.536897659301758, "global_step": 121124, "epoch": 2883} {"train_loss": -6.443140983581543, "global_step": 121125, "epoch": 2883} {"train_loss": -6.410158157348633, "global_step": 121126, "epoch": 2883} {"train_loss": -6.526611793608892, "global_step": 121127, "epoch": 2883, "val_loss": 67958.4765625} {"train_loss": -6.569901466369629, "global_step": 121128, "epoch": 2884} {"train_loss": -6.417604923248291, "global_step": 121129, "epoch": 2884} {"train_loss": -6.605757236480713, "global_step": 121130, "epoch": 2884} {"train_loss": -6.403702735900879, "global_step": 121131, "epoch": 2884} {"train_loss": -6.4388041496276855, "global_step": 121132, "epoch": 2884} {"train_loss": -6.444984436035156, "global_step": 121133, "epoch": 2884} {"train_loss": -6.425085544586182, "global_step": 121134, "epoch": 2884} {"train_loss": -6.428441047668457, "global_step": 121135, "epoch": 2884} {"train_loss": -6.371954441070557, "global_step": 121136, "epoch": 2884} {"train_loss": -6.379106044769287, "global_step": 121137, "epoch": 2884} {"train_loss": -6.320337772369385, "global_step": 121138, "epoch": 2884} {"train_loss": -6.459864616394043, "global_step": 121139, "epoch": 2884} {"train_loss": -6.394366264343262, "global_step": 121140, "epoch": 2884} {"train_loss": -6.3962082862854, "global_step": 121141, "epoch": 2884} {"train_loss": -6.252678871154785, "global_step": 121142, "epoch": 2884} {"train_loss": -6.499351501464844, "global_step": 121143, "epoch": 2884} {"train_loss": -6.572955131530762, "global_step": 121144, "epoch": 2884} {"train_loss": -6.469144821166992, "global_step": 121145, "epoch": 2884} {"train_loss": -6.500720977783203, "global_step": 121146, "epoch": 2884} {"train_loss": -6.611739158630371, "global_step": 121147, "epoch": 2884} {"train_loss": -6.542186737060547, "global_step": 121148, "epoch": 2884} {"train_loss": -6.590638160705566, "global_step": 121149, "epoch": 2884} {"train_loss": -6.556366920471191, "global_step": 121150, "epoch": 2884} {"train_loss": -6.562771797180176, "global_step": 121151, "epoch": 2884} {"train_loss": -6.618268966674805, "global_step": 121152, "epoch": 2884} {"train_loss": -6.570808410644531, "global_step": 121153, "epoch": 2884} {"train_loss": -6.576895713806152, "global_step": 121154, "epoch": 2884} {"train_loss": -6.588779449462891, "global_step": 121155, "epoch": 2884} {"train_loss": -6.575109958648682, "global_step": 121156, "epoch": 2884} {"train_loss": -6.618473052978516, "global_step": 121157, "epoch": 2884} {"train_loss": -6.63581657409668, "global_step": 121158, "epoch": 2884} {"train_loss": -6.651585102081299, "global_step": 121159, "epoch": 2884} {"train_loss": -6.5456671714782715, "global_step": 121160, "epoch": 2884} {"train_loss": -6.527239799499512, "global_step": 121161, "epoch": 2884} {"train_loss": -6.581182479858398, "global_step": 121162, "epoch": 2884} {"train_loss": -6.601805210113525, "global_step": 121163, "epoch": 2884} {"train_loss": -6.6206231117248535, "global_step": 121164, "epoch": 2884} {"train_loss": -6.681159019470215, "global_step": 121165, "epoch": 2884} {"train_loss": -6.584375381469727, "global_step": 121166, "epoch": 2884} {"train_loss": -6.643433570861816, "global_step": 121167, "epoch": 2884} {"train_loss": -6.582706928253174, "global_step": 121168, "epoch": 2884} {"train_loss": -6.524511768704369, "global_step": 121169, "epoch": 2884, "val_loss": 68078.609375} {"train_loss": -6.545925140380859, "global_step": 121170, "epoch": 2885} {"train_loss": -6.700199604034424, "global_step": 121171, "epoch": 2885} {"train_loss": -6.572165489196777, "global_step": 121172, "epoch": 2885} {"train_loss": -6.524704456329346, "global_step": 121173, "epoch": 2885} {"train_loss": -6.638058185577393, "global_step": 121174, "epoch": 2885} {"train_loss": -6.566266059875488, "global_step": 121175, "epoch": 2885} {"train_loss": -6.5139055252075195, "global_step": 121176, "epoch": 2885} {"train_loss": -6.530224800109863, "global_step": 121177, "epoch": 2885} {"train_loss": -6.5144195556640625, "global_step": 121178, "epoch": 2885} {"train_loss": -6.534429550170898, "global_step": 121179, "epoch": 2885} {"train_loss": -6.609213829040527, "global_step": 121180, "epoch": 2885} {"train_loss": -6.537193775177002, "global_step": 121181, "epoch": 2885} {"train_loss": -6.550520896911621, "global_step": 121182, "epoch": 2885} {"train_loss": -6.576717853546143, "global_step": 121183, "epoch": 2885} {"train_loss": -6.487649917602539, "global_step": 121184, "epoch": 2885} {"train_loss": -6.635293483734131, "global_step": 121185, "epoch": 2885} {"train_loss": -6.529034614562988, "global_step": 121186, "epoch": 2885} {"train_loss": -6.52011775970459, "global_step": 121187, "epoch": 2885} {"train_loss": -6.492917060852051, "global_step": 121188, "epoch": 2885} {"train_loss": -6.52735710144043, "global_step": 121189, "epoch": 2885} {"train_loss": -6.645633697509766, "global_step": 121190, "epoch": 2885} {"train_loss": -6.441291809082031, "global_step": 121191, "epoch": 2885} {"train_loss": -6.651397228240967, "global_step": 121192, "epoch": 2885} {"train_loss": -6.4683613777160645, "global_step": 121193, "epoch": 2885} {"train_loss": -6.440922260284424, "global_step": 121194, "epoch": 2885} {"train_loss": -6.486485004425049, "global_step": 121195, "epoch": 2885} {"train_loss": -6.5799360275268555, "global_step": 121196, "epoch": 2885} {"train_loss": -6.619068622589111, "global_step": 121197, "epoch": 2885} {"train_loss": -6.485346794128418, "global_step": 121198, "epoch": 2885} {"train_loss": -6.603542327880859, "global_step": 121199, "epoch": 2885} {"train_loss": -6.547642230987549, "global_step": 121200, "epoch": 2885} {"train_loss": -6.513065814971924, "global_step": 121201, "epoch": 2885} {"train_loss": -6.5480475425720215, "global_step": 121202, "epoch": 2885} {"train_loss": -6.629735946655273, "global_step": 121203, "epoch": 2885} {"train_loss": -6.60401725769043, "global_step": 121204, "epoch": 2885} {"train_loss": -6.419610977172852, "global_step": 121205, "epoch": 2885} {"train_loss": -6.345596790313721, "global_step": 121206, "epoch": 2885} {"train_loss": -6.4716691970825195, "global_step": 121207, "epoch": 2885} {"train_loss": -6.465631484985352, "global_step": 121208, "epoch": 2885} {"train_loss": -6.508747100830078, "global_step": 121209, "epoch": 2885} {"train_loss": -6.415006160736084, "global_step": 121210, "epoch": 2885} {"train_loss": -6.531985294251215, "global_step": 121211, "epoch": 2885, "val_loss": 67889.375} {"train_loss": -6.5484724044799805, "global_step": 121212, "epoch": 2886} {"train_loss": -6.3858866691589355, "global_step": 121213, "epoch": 2886} {"train_loss": -6.520884037017822, "global_step": 121214, "epoch": 2886} {"train_loss": -6.361440658569336, "global_step": 121215, "epoch": 2886} {"train_loss": -6.401854515075684, "global_step": 121216, "epoch": 2886} {"train_loss": -6.5356621742248535, "global_step": 121217, "epoch": 2886} {"train_loss": -6.33059024810791, "global_step": 121218, "epoch": 2886} {"train_loss": -6.467918872833252, "global_step": 121219, "epoch": 2886} {"train_loss": -6.394172668457031, "global_step": 121220, "epoch": 2886} {"train_loss": -6.56077766418457, "global_step": 121221, "epoch": 2886} {"train_loss": -6.504249095916748, "global_step": 121222, "epoch": 2886} {"train_loss": -6.614480018615723, "global_step": 121223, "epoch": 2886} {"train_loss": -6.421979904174805, "global_step": 121224, "epoch": 2886} {"train_loss": -6.496016025543213, "global_step": 121225, "epoch": 2886} {"train_loss": -6.518093109130859, "global_step": 121226, "epoch": 2886} {"train_loss": -6.457942008972168, "global_step": 121227, "epoch": 2886} {"train_loss": -6.54857873916626, "global_step": 121228, "epoch": 2886} {"train_loss": -6.506361484527588, "global_step": 121229, "epoch": 2886} {"train_loss": -6.4875874519348145, "global_step": 121230, "epoch": 2886} {"train_loss": -6.446469306945801, "global_step": 121231, "epoch": 2886} {"train_loss": -6.456587791442871, "global_step": 121232, "epoch": 2886} {"train_loss": -6.3815598487854, "global_step": 121233, "epoch": 2886} {"train_loss": -6.37885856628418, "global_step": 121234, "epoch": 2886} {"train_loss": -6.454342842102051, "global_step": 121235, "epoch": 2886} {"train_loss": -6.433078289031982, "global_step": 121236, "epoch": 2886} {"train_loss": -6.506529808044434, "global_step": 121237, "epoch": 2886} {"train_loss": -6.611354827880859, "global_step": 121238, "epoch": 2886} {"train_loss": -6.418475151062012, "global_step": 121239, "epoch": 2886} {"train_loss": -6.621820449829102, "global_step": 121240, "epoch": 2886} {"train_loss": -6.463410377502441, "global_step": 121241, "epoch": 2886} {"train_loss": -6.521059989929199, "global_step": 121242, "epoch": 2886} {"train_loss": -6.509946823120117, "global_step": 121243, "epoch": 2886} {"train_loss": -6.490487098693848, "global_step": 121244, "epoch": 2886} {"train_loss": -6.601390838623047, "global_step": 121245, "epoch": 2886} {"train_loss": -6.5709452629089355, "global_step": 121246, "epoch": 2886} {"train_loss": -6.551107406616211, "global_step": 121247, "epoch": 2886} {"train_loss": -6.561371326446533, "global_step": 121248, "epoch": 2886} {"train_loss": -6.51289176940918, "global_step": 121249, "epoch": 2886} {"train_loss": -6.577661514282227, "global_step": 121250, "epoch": 2886} {"train_loss": -6.565277099609375, "global_step": 121251, "epoch": 2886} {"train_loss": -6.485019683837891, "global_step": 121252, "epoch": 2886} {"train_loss": -6.49189187231518, "global_step": 121253, "epoch": 2886, "val_loss": 68208.140625} {"train_loss": -6.539067268371582, "global_step": 121254, "epoch": 2887} {"train_loss": -6.473224639892578, "global_step": 121255, "epoch": 2887} {"train_loss": -6.49641227722168, "global_step": 121256, "epoch": 2887} {"train_loss": -6.660702705383301, "global_step": 121257, "epoch": 2887} {"train_loss": -6.64317512512207, "global_step": 121258, "epoch": 2887} {"train_loss": -6.605051040649414, "global_step": 121259, "epoch": 2887} {"train_loss": -6.55987024307251, "global_step": 121260, "epoch": 2887} {"train_loss": -6.467589378356934, "global_step": 121261, "epoch": 2887} {"train_loss": -6.540121078491211, "global_step": 121262, "epoch": 2887} {"train_loss": -6.570652961730957, "global_step": 121263, "epoch": 2887} {"train_loss": -6.479342460632324, "global_step": 121264, "epoch": 2887} {"train_loss": -6.594675064086914, "global_step": 121265, "epoch": 2887} {"train_loss": -6.48771858215332, "global_step": 121266, "epoch": 2887} {"train_loss": -6.6582417488098145, "global_step": 121267, "epoch": 2887} {"train_loss": -6.533618450164795, "global_step": 121268, "epoch": 2887} {"train_loss": -6.459532737731934, "global_step": 121269, "epoch": 2887} {"train_loss": -6.621285438537598, "global_step": 121270, "epoch": 2887} {"train_loss": -6.5150909423828125, "global_step": 121271, "epoch": 2887} {"train_loss": -6.690382957458496, "global_step": 121272, "epoch": 2887} {"train_loss": -6.514719009399414, "global_step": 121273, "epoch": 2887} {"train_loss": -6.518857955932617, "global_step": 121274, "epoch": 2887} {"train_loss": -6.544490814208984, "global_step": 121275, "epoch": 2887} {"train_loss": -6.576655864715576, "global_step": 121276, "epoch": 2887} {"train_loss": -6.589389324188232, "global_step": 121277, "epoch": 2887} {"train_loss": -6.4926605224609375, "global_step": 121278, "epoch": 2887} {"train_loss": -6.53483772277832, "global_step": 121279, "epoch": 2887} {"train_loss": -6.534090042114258, "global_step": 121280, "epoch": 2887} {"train_loss": -6.638285160064697, "global_step": 121281, "epoch": 2887} {"train_loss": -6.591311454772949, "global_step": 121282, "epoch": 2887} {"train_loss": -6.664560317993164, "global_step": 121283, "epoch": 2887} {"train_loss": -6.5894927978515625, "global_step": 121284, "epoch": 2887} {"train_loss": -6.594673156738281, "global_step": 121285, "epoch": 2887} {"train_loss": -6.55075740814209, "global_step": 121286, "epoch": 2887} {"train_loss": -6.65203332901001, "global_step": 121287, "epoch": 2887} {"train_loss": -6.617229461669922, "global_step": 121288, "epoch": 2887} {"train_loss": -6.593326091766357, "global_step": 121289, "epoch": 2887} {"train_loss": -6.470788955688477, "global_step": 121290, "epoch": 2887} {"train_loss": -6.64009952545166, "global_step": 121291, "epoch": 2887} {"train_loss": -6.659952163696289, "global_step": 121292, "epoch": 2887} {"train_loss": -6.5673675537109375, "global_step": 121293, "epoch": 2887} {"train_loss": -6.670328617095947, "global_step": 121294, "epoch": 2887} {"train_loss": -6.571129605883644, "global_step": 121295, "epoch": 2887, "val_loss": 67951.6640625} {"train_loss": -6.527065753936768, "global_step": 121296, "epoch": 2888} {"train_loss": -6.630230903625488, "global_step": 121297, "epoch": 2888} {"train_loss": -6.5832695960998535, "global_step": 121298, "epoch": 2888} {"train_loss": -6.419405937194824, "global_step": 121299, "epoch": 2888} {"train_loss": -6.541360378265381, "global_step": 121300, "epoch": 2888} {"train_loss": -6.4595842361450195, "global_step": 121301, "epoch": 2888} {"train_loss": -6.499363899230957, "global_step": 121302, "epoch": 2888} {"train_loss": -6.505712509155273, "global_step": 121303, "epoch": 2888} {"train_loss": -6.510004997253418, "global_step": 121304, "epoch": 2888} {"train_loss": -6.62066125869751, "global_step": 121305, "epoch": 2888} {"train_loss": -6.544302940368652, "global_step": 121306, "epoch": 2888} {"train_loss": -6.658084869384766, "global_step": 121307, "epoch": 2888} {"train_loss": -6.55391788482666, "global_step": 121308, "epoch": 2888} {"train_loss": -6.507841110229492, "global_step": 121309, "epoch": 2888} {"train_loss": -6.489544868469238, "global_step": 121310, "epoch": 2888} {"train_loss": -6.430438995361328, "global_step": 121311, "epoch": 2888} {"train_loss": -6.5902814865112305, "global_step": 121312, "epoch": 2888} {"train_loss": -6.457988262176514, "global_step": 121313, "epoch": 2888} {"train_loss": -6.501775741577148, "global_step": 121314, "epoch": 2888} {"train_loss": -6.663751125335693, "global_step": 121315, "epoch": 2888} {"train_loss": -6.571732997894287, "global_step": 121316, "epoch": 2888} {"train_loss": -6.478207111358643, "global_step": 121317, "epoch": 2888} {"train_loss": -6.442848205566406, "global_step": 121318, "epoch": 2888} {"train_loss": -6.431929588317871, "global_step": 121319, "epoch": 2888} {"train_loss": -6.3902692794799805, "global_step": 121320, "epoch": 2888} {"train_loss": -6.465649127960205, "global_step": 121321, "epoch": 2888} {"train_loss": -6.578234672546387, "global_step": 121322, "epoch": 2888} {"train_loss": -6.418058395385742, "global_step": 121323, "epoch": 2888} {"train_loss": -6.590960502624512, "global_step": 121324, "epoch": 2888} {"train_loss": -6.482567310333252, "global_step": 121325, "epoch": 2888} {"train_loss": -6.574949264526367, "global_step": 121326, "epoch": 2888} {"train_loss": -6.549854278564453, "global_step": 121327, "epoch": 2888} {"train_loss": -6.45833158493042, "global_step": 121328, "epoch": 2888} {"train_loss": -6.614902496337891, "global_step": 121329, "epoch": 2888} {"train_loss": -6.506941795349121, "global_step": 121330, "epoch": 2888} {"train_loss": -6.606898307800293, "global_step": 121331, "epoch": 2888} {"train_loss": -6.59897518157959, "global_step": 121332, "epoch": 2888} {"train_loss": -6.487499713897705, "global_step": 121333, "epoch": 2888} {"train_loss": -6.516068458557129, "global_step": 121334, "epoch": 2888} {"train_loss": -6.543862342834473, "global_step": 121335, "epoch": 2888} {"train_loss": -6.502613067626953, "global_step": 121336, "epoch": 2888} {"train_loss": -6.527757406234741, "global_step": 121337, "epoch": 2888, "val_loss": 68032.5078125} {"train_loss": -6.521242618560791, "global_step": 121338, "epoch": 2889} {"train_loss": -6.554531574249268, "global_step": 121339, "epoch": 2889} {"train_loss": -6.550469398498535, "global_step": 121340, "epoch": 2889} {"train_loss": -6.443854331970215, "global_step": 121341, "epoch": 2889} {"train_loss": -6.585968017578125, "global_step": 121342, "epoch": 2889} {"train_loss": -6.570194721221924, "global_step": 121343, "epoch": 2889} {"train_loss": -6.464040756225586, "global_step": 121344, "epoch": 2889} {"train_loss": -6.466628551483154, "global_step": 121345, "epoch": 2889} {"train_loss": -6.669577598571777, "global_step": 121346, "epoch": 2889} {"train_loss": -6.536783218383789, "global_step": 121347, "epoch": 2889} {"train_loss": -6.581124305725098, "global_step": 121348, "epoch": 2889} {"train_loss": -6.5479278564453125, "global_step": 121349, "epoch": 2889} {"train_loss": -6.466395378112793, "global_step": 121350, "epoch": 2889} {"train_loss": -6.638862133026123, "global_step": 121351, "epoch": 2889} {"train_loss": -6.557559013366699, "global_step": 121352, "epoch": 2889} {"train_loss": -6.459311485290527, "global_step": 121353, "epoch": 2889} {"train_loss": -6.4624128341674805, "global_step": 121354, "epoch": 2889} {"train_loss": -6.367585182189941, "global_step": 121355, "epoch": 2889} {"train_loss": -6.438309192657471, "global_step": 121356, "epoch": 2889} {"train_loss": -6.488041877746582, "global_step": 121357, "epoch": 2889} {"train_loss": -6.450959205627441, "global_step": 121358, "epoch": 2889} {"train_loss": -6.403478145599365, "global_step": 121359, "epoch": 2889} {"train_loss": -6.535408973693848, "global_step": 121360, "epoch": 2889} {"train_loss": -6.462801456451416, "global_step": 121361, "epoch": 2889} {"train_loss": -6.541018486022949, "global_step": 121362, "epoch": 2889} {"train_loss": -6.588240623474121, "global_step": 121363, "epoch": 2889} {"train_loss": -6.5516204833984375, "global_step": 121364, "epoch": 2889} {"train_loss": -6.511991500854492, "global_step": 121365, "epoch": 2889} {"train_loss": -6.495519638061523, "global_step": 121366, "epoch": 2889} {"train_loss": -6.488908767700195, "global_step": 121367, "epoch": 2889} {"train_loss": -6.538119316101074, "global_step": 121368, "epoch": 2889} {"train_loss": -6.518219470977783, "global_step": 121369, "epoch": 2889} {"train_loss": -6.41195011138916, "global_step": 121370, "epoch": 2889} {"train_loss": -6.570281982421875, "global_step": 121371, "epoch": 2889} {"train_loss": -6.3721113204956055, "global_step": 121372, "epoch": 2889} {"train_loss": -6.681872367858887, "global_step": 121373, "epoch": 2889} {"train_loss": -6.479682445526123, "global_step": 121374, "epoch": 2889} {"train_loss": -6.550770282745361, "global_step": 121375, "epoch": 2889} {"train_loss": -6.544854164123535, "global_step": 121376, "epoch": 2889} {"train_loss": -6.457684516906738, "global_step": 121377, "epoch": 2889} {"train_loss": -6.62630033493042, "global_step": 121378, "epoch": 2889} {"train_loss": -6.517366738546462, "global_step": 121379, "epoch": 2889, "val_loss": 67903.8125} {"train_loss": -6.568054676055908, "global_step": 121380, "epoch": 2890} {"train_loss": -6.6099934577941895, "global_step": 121381, "epoch": 2890} {"train_loss": -6.638411521911621, "global_step": 121382, "epoch": 2890} {"train_loss": -6.594090461730957, "global_step": 121383, "epoch": 2890} {"train_loss": -6.54900598526001, "global_step": 121384, "epoch": 2890} {"train_loss": -6.629359245300293, "global_step": 121385, "epoch": 2890} {"train_loss": -6.538599491119385, "global_step": 121386, "epoch": 2890} {"train_loss": -6.563023567199707, "global_step": 121387, "epoch": 2890} {"train_loss": -6.52414608001709, "global_step": 121388, "epoch": 2890} {"train_loss": -6.540713310241699, "global_step": 121389, "epoch": 2890} {"train_loss": -6.557838439941406, "global_step": 121390, "epoch": 2890} {"train_loss": -6.564708232879639, "global_step": 121391, "epoch": 2890} {"train_loss": -6.586909294128418, "global_step": 121392, "epoch": 2890} {"train_loss": -6.507901191711426, "global_step": 121393, "epoch": 2890} {"train_loss": -6.440769195556641, "global_step": 121394, "epoch": 2890} {"train_loss": -6.588244438171387, "global_step": 121395, "epoch": 2890} {"train_loss": -6.49771785736084, "global_step": 121396, "epoch": 2890} {"train_loss": -6.540088176727295, "global_step": 121397, "epoch": 2890} {"train_loss": -6.495869159698486, "global_step": 121398, "epoch": 2890} {"train_loss": -6.601330757141113, "global_step": 121399, "epoch": 2890} {"train_loss": -6.6120123863220215, "global_step": 121400, "epoch": 2890} {"train_loss": -6.584815502166748, "global_step": 121401, "epoch": 2890} {"train_loss": -6.591949462890625, "global_step": 121402, "epoch": 2890} {"train_loss": -6.5633978843688965, "global_step": 121403, "epoch": 2890} {"train_loss": -6.602409362792969, "global_step": 121404, "epoch": 2890} {"train_loss": -6.500912666320801, "global_step": 121405, "epoch": 2890} {"train_loss": -6.460818767547607, "global_step": 121406, "epoch": 2890} {"train_loss": -6.524797439575195, "global_step": 121407, "epoch": 2890} {"train_loss": -6.652895927429199, "global_step": 121408, "epoch": 2890} {"train_loss": -6.592465400695801, "global_step": 121409, "epoch": 2890} {"train_loss": -6.409882545471191, "global_step": 121410, "epoch": 2890} {"train_loss": -6.565273284912109, "global_step": 121411, "epoch": 2890} {"train_loss": -6.46451997756958, "global_step": 121412, "epoch": 2890} {"train_loss": -6.543454170227051, "global_step": 121413, "epoch": 2890} {"train_loss": -6.539656639099121, "global_step": 121414, "epoch": 2890} {"train_loss": -6.551995277404785, "global_step": 121415, "epoch": 2890} {"train_loss": -6.548338413238525, "global_step": 121416, "epoch": 2890} {"train_loss": -6.466954231262207, "global_step": 121417, "epoch": 2890} {"train_loss": -6.553826332092285, "global_step": 121418, "epoch": 2890} {"train_loss": -6.509329319000244, "global_step": 121419, "epoch": 2890} {"train_loss": -6.555994033813477, "global_step": 121420, "epoch": 2890} {"train_loss": -6.547645761853173, "global_step": 121421, "epoch": 2890, "val_loss": 68114.515625} {"train_loss": -6.540724277496338, "global_step": 121422, "epoch": 2891} {"train_loss": -6.522200107574463, "global_step": 121423, "epoch": 2891} {"train_loss": -6.461647033691406, "global_step": 121424, "epoch": 2891} {"train_loss": -6.402925491333008, "global_step": 121425, "epoch": 2891} {"train_loss": -6.458500862121582, "global_step": 121426, "epoch": 2891} {"train_loss": -6.500537872314453, "global_step": 121427, "epoch": 2891} {"train_loss": -6.459623336791992, "global_step": 121428, "epoch": 2891} {"train_loss": -6.402728080749512, "global_step": 121429, "epoch": 2891} {"train_loss": -6.5226240158081055, "global_step": 121430, "epoch": 2891} {"train_loss": -6.631653785705566, "global_step": 121431, "epoch": 2891} {"train_loss": -6.479244232177734, "global_step": 121432, "epoch": 2891} {"train_loss": -6.43965482711792, "global_step": 121433, "epoch": 2891} {"train_loss": -6.590725898742676, "global_step": 121434, "epoch": 2891} {"train_loss": -6.5557074546813965, "global_step": 121435, "epoch": 2891} {"train_loss": -6.533158302307129, "global_step": 121436, "epoch": 2891} {"train_loss": -6.54256010055542, "global_step": 121437, "epoch": 2891} {"train_loss": -6.6224470138549805, "global_step": 121438, "epoch": 2891} {"train_loss": -6.5717997550964355, "global_step": 121439, "epoch": 2891} {"train_loss": -6.534814357757568, "global_step": 121440, "epoch": 2891} {"train_loss": -6.619966983795166, "global_step": 121441, "epoch": 2891} {"train_loss": -6.423866271972656, "global_step": 121442, "epoch": 2891} {"train_loss": -6.571890830993652, "global_step": 121443, "epoch": 2891} {"train_loss": -6.626567840576172, "global_step": 121444, "epoch": 2891} {"train_loss": -6.374785423278809, "global_step": 121445, "epoch": 2891} {"train_loss": -6.430639266967773, "global_step": 121446, "epoch": 2891} {"train_loss": -6.472289562225342, "global_step": 121447, "epoch": 2891} {"train_loss": -6.468915939331055, "global_step": 121448, "epoch": 2891} {"train_loss": -6.456590175628662, "global_step": 121449, "epoch": 2891} {"train_loss": -6.499477386474609, "global_step": 121450, "epoch": 2891} {"train_loss": -6.582612991333008, "global_step": 121451, "epoch": 2891} {"train_loss": -6.440553665161133, "global_step": 121452, "epoch": 2891} {"train_loss": -6.4886250495910645, "global_step": 121453, "epoch": 2891} {"train_loss": -6.436484336853027, "global_step": 121454, "epoch": 2891} {"train_loss": -6.522847652435303, "global_step": 121455, "epoch": 2891} {"train_loss": -6.490917205810547, "global_step": 121456, "epoch": 2891} {"train_loss": -6.593945503234863, "global_step": 121457, "epoch": 2891} {"train_loss": -6.472066879272461, "global_step": 121458, "epoch": 2891} {"train_loss": -6.576090335845947, "global_step": 121459, "epoch": 2891} {"train_loss": -6.499316692352295, "global_step": 121460, "epoch": 2891} {"train_loss": -6.596769332885742, "global_step": 121461, "epoch": 2891} {"train_loss": -6.488240718841553, "global_step": 121462, "epoch": 2891} {"train_loss": -6.512503044945853, "global_step": 121463, "epoch": 2891, "val_loss": 68265.6015625} {"train_loss": -6.5920844078063965, "global_step": 121464, "epoch": 2892} {"train_loss": -6.620558261871338, "global_step": 121465, "epoch": 2892} {"train_loss": -6.570107460021973, "global_step": 121466, "epoch": 2892} {"train_loss": -6.575141906738281, "global_step": 121467, "epoch": 2892} {"train_loss": -6.626723766326904, "global_step": 121468, "epoch": 2892} {"train_loss": -6.497936248779297, "global_step": 121469, "epoch": 2892} {"train_loss": -6.594479084014893, "global_step": 121470, "epoch": 2892} {"train_loss": -6.594745635986328, "global_step": 121471, "epoch": 2892} {"train_loss": -6.627615451812744, "global_step": 121472, "epoch": 2892} {"train_loss": -6.548032760620117, "global_step": 121473, "epoch": 2892} {"train_loss": -6.560486316680908, "global_step": 121474, "epoch": 2892} {"train_loss": -6.538143157958984, "global_step": 121475, "epoch": 2892} {"train_loss": -6.635824203491211, "global_step": 121476, "epoch": 2892} {"train_loss": -6.5970354080200195, "global_step": 121477, "epoch": 2892} {"train_loss": -6.537671089172363, "global_step": 121478, "epoch": 2892} {"train_loss": -6.676389694213867, "global_step": 121479, "epoch": 2892} {"train_loss": -6.649294853210449, "global_step": 121480, "epoch": 2892} {"train_loss": -6.450760841369629, "global_step": 121481, "epoch": 2892} {"train_loss": -6.5506439208984375, "global_step": 121482, "epoch": 2892} {"train_loss": -6.542757511138916, "global_step": 121483, "epoch": 2892} {"train_loss": -6.6120405197143555, "global_step": 121484, "epoch": 2892} {"train_loss": -6.642847061157227, "global_step": 121485, "epoch": 2892} {"train_loss": -6.538561820983887, "global_step": 121486, "epoch": 2892} {"train_loss": -6.520335674285889, "global_step": 121487, "epoch": 2892} {"train_loss": -6.578304767608643, "global_step": 121488, "epoch": 2892} {"train_loss": -6.511092185974121, "global_step": 121489, "epoch": 2892} {"train_loss": -6.420160293579102, "global_step": 121490, "epoch": 2892} {"train_loss": -6.4975972175598145, "global_step": 121491, "epoch": 2892} {"train_loss": -6.6911211013793945, "global_step": 121492, "epoch": 2892} {"train_loss": -6.6162004470825195, "global_step": 121493, "epoch": 2892} {"train_loss": -6.507817268371582, "global_step": 121494, "epoch": 2892} {"train_loss": -6.466804504394531, "global_step": 121495, "epoch": 2892} {"train_loss": -6.482973098754883, "global_step": 121496, "epoch": 2892} {"train_loss": -6.563451766967773, "global_step": 121497, "epoch": 2892} {"train_loss": -6.5213117599487305, "global_step": 121498, "epoch": 2892} {"train_loss": -6.567371368408203, "global_step": 121499, "epoch": 2892} {"train_loss": -6.51528787612915, "global_step": 121500, "epoch": 2892} {"train_loss": -6.56568717956543, "global_step": 121501, "epoch": 2892} {"train_loss": -6.596968650817871, "global_step": 121502, "epoch": 2892} {"train_loss": -6.45648717880249, "global_step": 121503, "epoch": 2892} {"train_loss": -6.550096035003662, "global_step": 121504, "epoch": 2892} {"train_loss": -6.5620303721654984, "global_step": 121505, "epoch": 2892, "val_loss": 68154.1015625} {"train_loss": -6.5082597732543945, "global_step": 121506, "epoch": 2893} {"train_loss": -6.584465503692627, "global_step": 121507, "epoch": 2893} {"train_loss": -6.559593200683594, "global_step": 121508, "epoch": 2893} {"train_loss": -6.621840476989746, "global_step": 121509, "epoch": 2893} {"train_loss": -6.637159824371338, "global_step": 121510, "epoch": 2893} {"train_loss": -6.613097190856934, "global_step": 121511, "epoch": 2893} {"train_loss": -6.571840763092041, "global_step": 121512, "epoch": 2893} {"train_loss": -6.620882987976074, "global_step": 121513, "epoch": 2893} {"train_loss": -6.59163761138916, "global_step": 121514, "epoch": 2893} {"train_loss": -6.496829986572266, "global_step": 121515, "epoch": 2893} {"train_loss": -6.51038932800293, "global_step": 121516, "epoch": 2893} {"train_loss": -6.599299907684326, "global_step": 121517, "epoch": 2893} {"train_loss": -6.630339622497559, "global_step": 121518, "epoch": 2893} {"train_loss": -6.476036548614502, "global_step": 121519, "epoch": 2893} {"train_loss": -6.527754783630371, "global_step": 121520, "epoch": 2893} {"train_loss": -6.4018235206604, "global_step": 121521, "epoch": 2893} {"train_loss": -6.504788875579834, "global_step": 121522, "epoch": 2893} {"train_loss": -6.475400447845459, "global_step": 121523, "epoch": 2893} {"train_loss": -6.528785705566406, "global_step": 121524, "epoch": 2893} {"train_loss": -6.534372329711914, "global_step": 121525, "epoch": 2893} {"train_loss": -6.547039985656738, "global_step": 121526, "epoch": 2893} {"train_loss": -6.536341667175293, "global_step": 121527, "epoch": 2893} {"train_loss": -6.541807174682617, "global_step": 121528, "epoch": 2893} {"train_loss": -6.6338791847229, "global_step": 121529, "epoch": 2893} {"train_loss": -6.410506248474121, "global_step": 121530, "epoch": 2893} {"train_loss": -6.574640274047852, "global_step": 121531, "epoch": 2893} {"train_loss": -6.5426025390625, "global_step": 121532, "epoch": 2893} {"train_loss": -6.581238269805908, "global_step": 121533, "epoch": 2893} {"train_loss": -6.489572048187256, "global_step": 121534, "epoch": 2893} {"train_loss": -6.524799346923828, "global_step": 121535, "epoch": 2893} {"train_loss": -6.7200798988342285, "global_step": 121536, "epoch": 2893} {"train_loss": -6.576562881469727, "global_step": 121537, "epoch": 2893} {"train_loss": -6.512598037719727, "global_step": 121538, "epoch": 2893} {"train_loss": -6.719719886779785, "global_step": 121539, "epoch": 2893} {"train_loss": -6.393362045288086, "global_step": 121540, "epoch": 2893} {"train_loss": -6.4635701179504395, "global_step": 121541, "epoch": 2893} {"train_loss": -6.556399345397949, "global_step": 121542, "epoch": 2893} {"train_loss": -6.39219856262207, "global_step": 121543, "epoch": 2893} {"train_loss": -6.3816118240356445, "global_step": 121544, "epoch": 2893} {"train_loss": -6.546055793762207, "global_step": 121545, "epoch": 2893} {"train_loss": -6.470344066619873, "global_step": 121546, "epoch": 2893} {"train_loss": -6.538940100442796, "global_step": 121547, "epoch": 2893, "val_loss": 67850.6484375} {"train_loss": -6.5813798904418945, "global_step": 121548, "epoch": 2894} {"train_loss": -6.583341598510742, "global_step": 121549, "epoch": 2894} {"train_loss": -6.6555328369140625, "global_step": 121550, "epoch": 2894} {"train_loss": -6.536500930786133, "global_step": 121551, "epoch": 2894} {"train_loss": -6.643138408660889, "global_step": 121552, "epoch": 2894} {"train_loss": -6.571996212005615, "global_step": 121553, "epoch": 2894} {"train_loss": -6.478739261627197, "global_step": 121554, "epoch": 2894} {"train_loss": -6.582635402679443, "global_step": 121555, "epoch": 2894} {"train_loss": -6.400082588195801, "global_step": 121556, "epoch": 2894} {"train_loss": -6.520977020263672, "global_step": 121557, "epoch": 2894} {"train_loss": -6.59990119934082, "global_step": 121558, "epoch": 2894} {"train_loss": -6.361673355102539, "global_step": 121559, "epoch": 2894} {"train_loss": -6.487856864929199, "global_step": 121560, "epoch": 2894} {"train_loss": -6.5318803787231445, "global_step": 121561, "epoch": 2894} {"train_loss": -6.502720832824707, "global_step": 121562, "epoch": 2894} {"train_loss": -6.52345085144043, "global_step": 121563, "epoch": 2894} {"train_loss": -6.510719299316406, "global_step": 121564, "epoch": 2894} {"train_loss": -6.501352787017822, "global_step": 121565, "epoch": 2894} {"train_loss": -6.578307628631592, "global_step": 121566, "epoch": 2894} {"train_loss": -6.555838108062744, "global_step": 121567, "epoch": 2894} {"train_loss": -6.458725929260254, "global_step": 121568, "epoch": 2894} {"train_loss": -6.500615119934082, "global_step": 121569, "epoch": 2894} {"train_loss": -6.579506874084473, "global_step": 121570, "epoch": 2894} {"train_loss": -6.5756072998046875, "global_step": 121571, "epoch": 2894} {"train_loss": -6.4811577796936035, "global_step": 121572, "epoch": 2894} {"train_loss": -6.487287521362305, "global_step": 121573, "epoch": 2894} {"train_loss": -6.491707801818848, "global_step": 121574, "epoch": 2894} {"train_loss": -6.5525102615356445, "global_step": 121575, "epoch": 2894} {"train_loss": -6.597928047180176, "global_step": 121576, "epoch": 2894} {"train_loss": -6.536648750305176, "global_step": 121577, "epoch": 2894} {"train_loss": -6.542675971984863, "global_step": 121578, "epoch": 2894} {"train_loss": -6.564548492431641, "global_step": 121579, "epoch": 2894} {"train_loss": -6.468765735626221, "global_step": 121580, "epoch": 2894} {"train_loss": -6.5233049392700195, "global_step": 121581, "epoch": 2894} {"train_loss": -6.6053242683410645, "global_step": 121582, "epoch": 2894} {"train_loss": -6.42885684967041, "global_step": 121583, "epoch": 2894} {"train_loss": -6.576182842254639, "global_step": 121584, "epoch": 2894} {"train_loss": -6.547036170959473, "global_step": 121585, "epoch": 2894} {"train_loss": -6.366476535797119, "global_step": 121586, "epoch": 2894} {"train_loss": -6.552643775939941, "global_step": 121587, "epoch": 2894} {"train_loss": -6.4598307609558105, "global_step": 121588, "epoch": 2894} {"train_loss": -6.52833290327163, "global_step": 121589, "epoch": 2894, "val_loss": 68065.6875} {"train_loss": -6.493630409240723, "global_step": 121590, "epoch": 2895} {"train_loss": -6.474532127380371, "global_step": 121591, "epoch": 2895} {"train_loss": -6.636805057525635, "global_step": 121592, "epoch": 2895} {"train_loss": -6.415512561798096, "global_step": 121593, "epoch": 2895} {"train_loss": -6.476347923278809, "global_step": 121594, "epoch": 2895} {"train_loss": -6.482943534851074, "global_step": 121595, "epoch": 2895} {"train_loss": -6.473269462585449, "global_step": 121596, "epoch": 2895} {"train_loss": -6.64303731918335, "global_step": 121597, "epoch": 2895} {"train_loss": -6.546571731567383, "global_step": 121598, "epoch": 2895} {"train_loss": -6.463412284851074, "global_step": 121599, "epoch": 2895} {"train_loss": -6.678111553192139, "global_step": 121600, "epoch": 2895} {"train_loss": -6.574713706970215, "global_step": 121601, "epoch": 2895} {"train_loss": -6.670074939727783, "global_step": 121602, "epoch": 2895} {"train_loss": -6.528447151184082, "global_step": 121603, "epoch": 2895} {"train_loss": -6.476142406463623, "global_step": 121604, "epoch": 2895} {"train_loss": -6.645390510559082, "global_step": 121605, "epoch": 2895} {"train_loss": -6.543093204498291, "global_step": 121606, "epoch": 2895} {"train_loss": -6.545933723449707, "global_step": 121607, "epoch": 2895} {"train_loss": -6.464069366455078, "global_step": 121608, "epoch": 2895} {"train_loss": -6.571904182434082, "global_step": 121609, "epoch": 2895} {"train_loss": -6.592966079711914, "global_step": 121610, "epoch": 2895} {"train_loss": -6.620834827423096, "global_step": 121611, "epoch": 2895} {"train_loss": -6.5936126708984375, "global_step": 121612, "epoch": 2895} {"train_loss": -6.586936950683594, "global_step": 121613, "epoch": 2895} {"train_loss": -6.434738636016846, "global_step": 121614, "epoch": 2895} {"train_loss": -6.605767250061035, "global_step": 121615, "epoch": 2895} {"train_loss": -6.579242706298828, "global_step": 121616, "epoch": 2895} {"train_loss": -6.583092212677002, "global_step": 121617, "epoch": 2895} {"train_loss": -6.5197906494140625, "global_step": 121618, "epoch": 2895} {"train_loss": -6.667658805847168, "global_step": 121619, "epoch": 2895} {"train_loss": -6.570523262023926, "global_step": 121620, "epoch": 2895} {"train_loss": -6.440239906311035, "global_step": 121621, "epoch": 2895} {"train_loss": -6.535732746124268, "global_step": 121622, "epoch": 2895} {"train_loss": -6.483986854553223, "global_step": 121623, "epoch": 2895} {"train_loss": -6.46740198135376, "global_step": 121624, "epoch": 2895} {"train_loss": -6.508826732635498, "global_step": 121625, "epoch": 2895} {"train_loss": -6.572713851928711, "global_step": 121626, "epoch": 2895} {"train_loss": -6.540151119232178, "global_step": 121627, "epoch": 2895} {"train_loss": -6.598066329956055, "global_step": 121628, "epoch": 2895} {"train_loss": -6.489362716674805, "global_step": 121629, "epoch": 2895} {"train_loss": -6.623133659362793, "global_step": 121630, "epoch": 2895} {"train_loss": -6.544966470627558, "global_step": 121631, "epoch": 2895, "val_loss": 67926.75} {"train_loss": -6.494473934173584, "global_step": 121632, "epoch": 2896} {"train_loss": -6.5018486976623535, "global_step": 121633, "epoch": 2896} {"train_loss": -6.443449974060059, "global_step": 121634, "epoch": 2896} {"train_loss": -6.337963104248047, "global_step": 121635, "epoch": 2896} {"train_loss": -6.4261651039123535, "global_step": 121636, "epoch": 2896} {"train_loss": -6.50932502746582, "global_step": 121637, "epoch": 2896} {"train_loss": -6.4820475578308105, "global_step": 121638, "epoch": 2896} {"train_loss": -6.563703536987305, "global_step": 121639, "epoch": 2896} {"train_loss": -6.529078483581543, "global_step": 121640, "epoch": 2896} {"train_loss": -6.497210502624512, "global_step": 121641, "epoch": 2896} {"train_loss": -6.544905185699463, "global_step": 121642, "epoch": 2896} {"train_loss": -6.59005069732666, "global_step": 121643, "epoch": 2896} {"train_loss": -6.544268608093262, "global_step": 121644, "epoch": 2896} {"train_loss": -6.670348167419434, "global_step": 121645, "epoch": 2896} {"train_loss": -6.551207542419434, "global_step": 121646, "epoch": 2896} {"train_loss": -6.530325889587402, "global_step": 121647, "epoch": 2896} {"train_loss": -6.542397975921631, "global_step": 121648, "epoch": 2896} {"train_loss": -6.566559314727783, "global_step": 121649, "epoch": 2896} {"train_loss": -6.603219032287598, "global_step": 121650, "epoch": 2896} {"train_loss": -6.535918712615967, "global_step": 121651, "epoch": 2896} {"train_loss": -6.653875350952148, "global_step": 121652, "epoch": 2896} {"train_loss": -6.729855537414551, "global_step": 121653, "epoch": 2896} {"train_loss": -6.509153366088867, "global_step": 121654, "epoch": 2896} {"train_loss": -6.572640419006348, "global_step": 121655, "epoch": 2896} {"train_loss": -6.548453330993652, "global_step": 121656, "epoch": 2896} {"train_loss": -6.674936294555664, "global_step": 121657, "epoch": 2896} {"train_loss": -6.548079490661621, "global_step": 121658, "epoch": 2896} {"train_loss": -6.568821907043457, "global_step": 121659, "epoch": 2896} {"train_loss": -6.664620399475098, "global_step": 121660, "epoch": 2896} {"train_loss": -6.660366535186768, "global_step": 121661, "epoch": 2896} {"train_loss": -6.571323394775391, "global_step": 121662, "epoch": 2896} {"train_loss": -6.592918872833252, "global_step": 121663, "epoch": 2896} {"train_loss": -6.5279951095581055, "global_step": 121664, "epoch": 2896} {"train_loss": -6.579351425170898, "global_step": 121665, "epoch": 2896} {"train_loss": -6.544695854187012, "global_step": 121666, "epoch": 2896} {"train_loss": -6.609803676605225, "global_step": 121667, "epoch": 2896} {"train_loss": -6.498155117034912, "global_step": 121668, "epoch": 2896} {"train_loss": -6.537008285522461, "global_step": 121669, "epoch": 2896} {"train_loss": -6.628377437591553, "global_step": 121670, "epoch": 2896} {"train_loss": -6.557722091674805, "global_step": 121671, "epoch": 2896} {"train_loss": -6.5684494972229, "global_step": 121672, "epoch": 2896} {"train_loss": -6.558322157178607, "global_step": 121673, "epoch": 2896, "val_loss": 67858.8046875} {"train_loss": -6.553890228271484, "global_step": 121674, "epoch": 2897} {"train_loss": -6.587737083435059, "global_step": 121675, "epoch": 2897} {"train_loss": -6.633617401123047, "global_step": 121676, "epoch": 2897} {"train_loss": -6.629770278930664, "global_step": 121677, "epoch": 2897} {"train_loss": -6.403639793395996, "global_step": 121678, "epoch": 2897} {"train_loss": -6.471254348754883, "global_step": 121679, "epoch": 2897} {"train_loss": -6.6754865646362305, "global_step": 121680, "epoch": 2897} {"train_loss": -6.6217522621154785, "global_step": 121681, "epoch": 2897} {"train_loss": -6.536970615386963, "global_step": 121682, "epoch": 2897} {"train_loss": -6.747654914855957, "global_step": 121683, "epoch": 2897} {"train_loss": -6.621606826782227, "global_step": 121684, "epoch": 2897} {"train_loss": -6.560085296630859, "global_step": 121685, "epoch": 2897} {"train_loss": -6.611288070678711, "global_step": 121686, "epoch": 2897} {"train_loss": -6.779221534729004, "global_step": 121687, "epoch": 2897} {"train_loss": -6.601203918457031, "global_step": 121688, "epoch": 2897} {"train_loss": -6.492981910705566, "global_step": 121689, "epoch": 2897} {"train_loss": -6.480890274047852, "global_step": 121690, "epoch": 2897} {"train_loss": -6.464432716369629, "global_step": 121691, "epoch": 2897} {"train_loss": -6.683481216430664, "global_step": 121692, "epoch": 2897} {"train_loss": -6.599358081817627, "global_step": 121693, "epoch": 2897} {"train_loss": -6.519537925720215, "global_step": 121694, "epoch": 2897} {"train_loss": -6.580860137939453, "global_step": 121695, "epoch": 2897} {"train_loss": -6.584727764129639, "global_step": 121696, "epoch": 2897} {"train_loss": -6.663814067840576, "global_step": 121697, "epoch": 2897} {"train_loss": -6.521941184997559, "global_step": 121698, "epoch": 2897} {"train_loss": -6.605929374694824, "global_step": 121699, "epoch": 2897} {"train_loss": -6.601898193359375, "global_step": 121700, "epoch": 2897} {"train_loss": -6.513280868530273, "global_step": 121701, "epoch": 2897} {"train_loss": -6.518133163452148, "global_step": 121702, "epoch": 2897} {"train_loss": -6.588108539581299, "global_step": 121703, "epoch": 2897} {"train_loss": -6.521130561828613, "global_step": 121704, "epoch": 2897} {"train_loss": -6.452096462249756, "global_step": 121705, "epoch": 2897} {"train_loss": -6.555356025695801, "global_step": 121706, "epoch": 2897} {"train_loss": -6.482107162475586, "global_step": 121707, "epoch": 2897} {"train_loss": -6.557834625244141, "global_step": 121708, "epoch": 2897} {"train_loss": -6.584808349609375, "global_step": 121709, "epoch": 2897} {"train_loss": -6.561188220977783, "global_step": 121710, "epoch": 2897} {"train_loss": -6.59512996673584, "global_step": 121711, "epoch": 2897} {"train_loss": -6.519031524658203, "global_step": 121712, "epoch": 2897} {"train_loss": -6.497912406921387, "global_step": 121713, "epoch": 2897} {"train_loss": -6.518439769744873, "global_step": 121714, "epoch": 2897} {"train_loss": -6.5692583946954635, "global_step": 121715, "epoch": 2897, "val_loss": 67936.3125} {"train_loss": -6.613036632537842, "global_step": 121716, "epoch": 2898} {"train_loss": -6.670037269592285, "global_step": 121717, "epoch": 2898} {"train_loss": -6.596864223480225, "global_step": 121718, "epoch": 2898} {"train_loss": -6.469857215881348, "global_step": 121719, "epoch": 2898} {"train_loss": -6.609821319580078, "global_step": 121720, "epoch": 2898} {"train_loss": -6.607631683349609, "global_step": 121721, "epoch": 2898} {"train_loss": -6.449203968048096, "global_step": 121722, "epoch": 2898} {"train_loss": -6.475446701049805, "global_step": 121723, "epoch": 2898} {"train_loss": -6.57017707824707, "global_step": 121724, "epoch": 2898} {"train_loss": -6.529972076416016, "global_step": 121725, "epoch": 2898} {"train_loss": -6.537747383117676, "global_step": 121726, "epoch": 2898} {"train_loss": -6.666372299194336, "global_step": 121727, "epoch": 2898} {"train_loss": -6.540050506591797, "global_step": 121728, "epoch": 2898} {"train_loss": -6.508279800415039, "global_step": 121729, "epoch": 2898} {"train_loss": -6.5440592765808105, "global_step": 121730, "epoch": 2898} {"train_loss": -6.488699913024902, "global_step": 121731, "epoch": 2898} {"train_loss": -6.528726577758789, "global_step": 121732, "epoch": 2898} {"train_loss": -6.59537410736084, "global_step": 121733, "epoch": 2898} {"train_loss": -6.490011215209961, "global_step": 121734, "epoch": 2898} {"train_loss": -6.631956100463867, "global_step": 121735, "epoch": 2898} {"train_loss": -6.570102691650391, "global_step": 121736, "epoch": 2898} {"train_loss": -6.572395324707031, "global_step": 121737, "epoch": 2898} {"train_loss": -6.551462173461914, "global_step": 121738, "epoch": 2898} {"train_loss": -6.592085361480713, "global_step": 121739, "epoch": 2898} {"train_loss": -6.62216854095459, "global_step": 121740, "epoch": 2898} {"train_loss": -6.606609344482422, "global_step": 121741, "epoch": 2898} {"train_loss": -6.509172439575195, "global_step": 121742, "epoch": 2898} {"train_loss": -6.3751959800720215, "global_step": 121743, "epoch": 2898} {"train_loss": -6.464631080627441, "global_step": 121744, "epoch": 2898} {"train_loss": -6.405780792236328, "global_step": 121745, "epoch": 2898} {"train_loss": -6.518939971923828, "global_step": 121746, "epoch": 2898} {"train_loss": -6.574488639831543, "global_step": 121747, "epoch": 2898} {"train_loss": -6.536680221557617, "global_step": 121748, "epoch": 2898} {"train_loss": -6.439756393432617, "global_step": 121749, "epoch": 2898} {"train_loss": -6.622358322143555, "global_step": 121750, "epoch": 2898} {"train_loss": -6.493748664855957, "global_step": 121751, "epoch": 2898} {"train_loss": -6.53369140625, "global_step": 121752, "epoch": 2898} {"train_loss": -6.596432685852051, "global_step": 121753, "epoch": 2898} {"train_loss": -6.499821662902832, "global_step": 121754, "epoch": 2898} {"train_loss": -6.498658180236816, "global_step": 121755, "epoch": 2898} {"train_loss": -6.60386323928833, "global_step": 121756, "epoch": 2898} {"train_loss": -6.541676873252506, "global_step": 121757, "epoch": 2898, "val_loss": 68120.453125} {"train_loss": -6.561215400695801, "global_step": 121758, "epoch": 2899} {"train_loss": -6.433286666870117, "global_step": 121759, "epoch": 2899} {"train_loss": -6.487069606781006, "global_step": 121760, "epoch": 2899} {"train_loss": -6.580209732055664, "global_step": 121761, "epoch": 2899} {"train_loss": -6.364880561828613, "global_step": 121762, "epoch": 2899} {"train_loss": -6.589221000671387, "global_step": 121763, "epoch": 2899} {"train_loss": -6.454207420349121, "global_step": 121764, "epoch": 2899} {"train_loss": -6.483546257019043, "global_step": 121765, "epoch": 2899} {"train_loss": -6.449102401733398, "global_step": 121766, "epoch": 2899} {"train_loss": -6.509570121765137, "global_step": 121767, "epoch": 2899} {"train_loss": -6.507026672363281, "global_step": 121768, "epoch": 2899} {"train_loss": -6.408109664916992, "global_step": 121769, "epoch": 2899} {"train_loss": -6.4008378982543945, "global_step": 121770, "epoch": 2899} {"train_loss": -6.50280237197876, "global_step": 121771, "epoch": 2899} {"train_loss": -6.4984941482543945, "global_step": 121772, "epoch": 2899} {"train_loss": -6.522314548492432, "global_step": 121773, "epoch": 2899} {"train_loss": -6.466089248657227, "global_step": 121774, "epoch": 2899} {"train_loss": -6.518891334533691, "global_step": 121775, "epoch": 2899} {"train_loss": -6.443450927734375, "global_step": 121776, "epoch": 2899} {"train_loss": -6.553662300109863, "global_step": 121777, "epoch": 2899} {"train_loss": -6.6241912841796875, "global_step": 121778, "epoch": 2899} {"train_loss": -6.553779602050781, "global_step": 121779, "epoch": 2899} {"train_loss": -6.586330890655518, "global_step": 121780, "epoch": 2899} {"train_loss": -6.38921594619751, "global_step": 121781, "epoch": 2899} {"train_loss": -6.556452751159668, "global_step": 121782, "epoch": 2899} {"train_loss": -6.490339279174805, "global_step": 121783, "epoch": 2899} {"train_loss": -6.5044779777526855, "global_step": 121784, "epoch": 2899} {"train_loss": -6.490755081176758, "global_step": 121785, "epoch": 2899} {"train_loss": -6.481289386749268, "global_step": 121786, "epoch": 2899} {"train_loss": -6.654835224151611, "global_step": 121787, "epoch": 2899} {"train_loss": -6.569231033325195, "global_step": 121788, "epoch": 2899} {"train_loss": -6.540581703186035, "global_step": 121789, "epoch": 2899} {"train_loss": -6.632713794708252, "global_step": 121790, "epoch": 2899} {"train_loss": -6.530463695526123, "global_step": 121791, "epoch": 2899} {"train_loss": -6.522116184234619, "global_step": 121792, "epoch": 2899} {"train_loss": -6.515955924987793, "global_step": 121793, "epoch": 2899} {"train_loss": -6.626326084136963, "global_step": 121794, "epoch": 2899} {"train_loss": -6.595898628234863, "global_step": 121795, "epoch": 2899} {"train_loss": -6.597340106964111, "global_step": 121796, "epoch": 2899} {"train_loss": -6.538012981414795, "global_step": 121797, "epoch": 2899} {"train_loss": -6.357685089111328, "global_step": 121798, "epoch": 2899} {"train_loss": -6.516317412966774, "global_step": 121799, "epoch": 2899, "val_loss": 68130.0859375} {"train_loss": -6.474637031555176, "global_step": 121800, "epoch": 2900} {"train_loss": -6.576468467712402, "global_step": 121801, "epoch": 2900} {"train_loss": -6.536778450012207, "global_step": 121802, "epoch": 2900} {"train_loss": -6.592159271240234, "global_step": 121803, "epoch": 2900} {"train_loss": -6.607905387878418, "global_step": 121804, "epoch": 2900} {"train_loss": -6.579850673675537, "global_step": 121805, "epoch": 2900} {"train_loss": -6.61916446685791, "global_step": 121806, "epoch": 2900} {"train_loss": -6.55427885055542, "global_step": 121807, "epoch": 2900} {"train_loss": -6.647855758666992, "global_step": 121808, "epoch": 2900} {"train_loss": -6.5095038414001465, "global_step": 121809, "epoch": 2900} {"train_loss": -6.578853607177734, "global_step": 121810, "epoch": 2900} {"train_loss": -6.487017631530762, "global_step": 121811, "epoch": 2900} {"train_loss": -6.512718677520752, "global_step": 121812, "epoch": 2900} {"train_loss": -6.602989196777344, "global_step": 121813, "epoch": 2900} {"train_loss": -6.662197113037109, "global_step": 121814, "epoch": 2900} {"train_loss": -6.594907760620117, "global_step": 121815, "epoch": 2900} {"train_loss": -6.536022663116455, "global_step": 121816, "epoch": 2900} {"train_loss": -6.636658668518066, "global_step": 121817, "epoch": 2900} {"train_loss": -6.562280654907227, "global_step": 121818, "epoch": 2900} {"train_loss": -6.494120121002197, "global_step": 121819, "epoch": 2900} {"train_loss": -6.408313751220703, "global_step": 121820, "epoch": 2900} {"train_loss": -6.450126647949219, "global_step": 121821, "epoch": 2900} {"train_loss": -6.497588634490967, "global_step": 121822, "epoch": 2900} {"train_loss": -6.325780868530273, "global_step": 121823, "epoch": 2900} {"train_loss": -6.591096878051758, "global_step": 121824, "epoch": 2900} {"train_loss": -6.595355033874512, "global_step": 121825, "epoch": 2900} {"train_loss": -6.557103157043457, "global_step": 121826, "epoch": 2900} {"train_loss": -6.488987922668457, "global_step": 121827, "epoch": 2900} {"train_loss": -6.546262741088867, "global_step": 121828, "epoch": 2900} {"train_loss": -6.468560695648193, "global_step": 121829, "epoch": 2900} {"train_loss": -6.499343395233154, "global_step": 121830, "epoch": 2900} {"train_loss": -6.52227783203125, "global_step": 121831, "epoch": 2900} {"train_loss": -6.534377574920654, "global_step": 121832, "epoch": 2900} {"train_loss": -6.379037380218506, "global_step": 121833, "epoch": 2900} {"train_loss": -6.519210338592529, "global_step": 121834, "epoch": 2900} {"train_loss": -6.543019771575928, "global_step": 121835, "epoch": 2900} {"train_loss": -6.548489093780518, "global_step": 121836, "epoch": 2900} {"train_loss": -6.497966766357422, "global_step": 121837, "epoch": 2900} {"train_loss": -6.544064044952393, "global_step": 121838, "epoch": 2900} {"train_loss": -6.512967586517334, "global_step": 121839, "epoch": 2900} {"train_loss": -6.666060924530029, "global_step": 121840, "epoch": 2900} {"train_loss": -6.537649472554524, "global_step": 121841, "epoch": 2900, "train/sim_max_reward_0": 0.22779803492161893, "train/sim_max_reward_1": 0.9916564384104385, "train/sim_max_reward_2": 0.2849433584943725, "train/sim_max_reward_3": 0.13980499072287828, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.7518108371743089, "test/sim_max_reward_4400000": 0.12956968883352202, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.19828649999001166, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.6750823966392919, "test/sim_max_reward_4400007": 0.9908759342603375, "test/sim_max_reward_4400008": 0.30688660170852217, "test/sim_max_reward_4400009": 0.827649189410467, "test/sim_max_reward_4400010": 0.9562051054246963, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.868789461504703, "test/sim_max_reward_4400013": 0.9988745200730933, "test/sim_max_reward_4400014": 0.2621048450777562, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.931626055659735, "test/sim_max_reward_4400017": 0.6988300337689325, "test/sim_max_reward_4400018": 0.2389037048203523, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.33321469134498943, "test/sim_max_reward_4400023": 0.9566523682533205, "test/sim_max_reward_4400024": 0.3070647661905653, "test/sim_max_reward_4400025": 0.26126306853268355, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.049183902883074566, "test/sim_max_reward_4400028": 0.8316081009629641, "test/sim_max_reward_4400029": 0.5649105091477467, "test/sim_max_reward_4400030": 0.8381348418673874, "test/sim_max_reward_4400031": 0.9441053186901306, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.21448095559460345, "test/sim_max_reward_4400034": 0.947190874896541, "test/sim_max_reward_4400035": 0.642428646539719, "test/sim_max_reward_4400036": 0.34471386360930584, "test/sim_max_reward_4400037": 0.905695470148823, "test/sim_max_reward_4400038": 0.9487066560712266, "test/sim_max_reward_4400039": 0.5667673650071502, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6174525338134838, "test/sim_max_reward_4400042": 0.9667133203734266, "test/sim_max_reward_4400043": 0.888542151335422, "test/sim_max_reward_4400044": 0.7294069370583663, "test/sim_max_reward_4400045": 0.9448619685816915, "test/sim_max_reward_4400046": 0.9491901219880788, "test/sim_max_reward_4400047": 0.8904775509422522, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.5660022766206029, "test/mean_score": 0.5254571085428319, "val_loss": 68098.9609375} {"train_loss": -6.545615196228027, "global_step": 121842, "epoch": 2901} {"train_loss": -6.6895036697387695, "global_step": 121843, "epoch": 2901} {"train_loss": -6.449981689453125, "global_step": 121844, "epoch": 2901} {"train_loss": -6.485909938812256, "global_step": 121845, "epoch": 2901} {"train_loss": -6.583209991455078, "global_step": 121846, "epoch": 2901} {"train_loss": -6.494413375854492, "global_step": 121847, "epoch": 2901} {"train_loss": -6.527167320251465, "global_step": 121848, "epoch": 2901} {"train_loss": -6.472963809967041, "global_step": 121849, "epoch": 2901} {"train_loss": -6.522971153259277, "global_step": 121850, "epoch": 2901} {"train_loss": -6.563626766204834, "global_step": 121851, "epoch": 2901} {"train_loss": -6.356604099273682, "global_step": 121852, "epoch": 2901} {"train_loss": -6.431010723114014, "global_step": 121853, "epoch": 2901} {"train_loss": -6.467754364013672, "global_step": 121854, "epoch": 2901} {"train_loss": -6.456945896148682, "global_step": 121855, "epoch": 2901} {"train_loss": -6.579827308654785, "global_step": 121856, "epoch": 2901} {"train_loss": -6.498391151428223, "global_step": 121857, "epoch": 2901} {"train_loss": -6.495388984680176, "global_step": 121858, "epoch": 2901} {"train_loss": -6.483798980712891, "global_step": 121859, "epoch": 2901} {"train_loss": -6.43197774887085, "global_step": 121860, "epoch": 2901} {"train_loss": -6.579825401306152, "global_step": 121861, "epoch": 2901} {"train_loss": -6.5684895515441895, "global_step": 121862, "epoch": 2901} {"train_loss": -6.517061710357666, "global_step": 121863, "epoch": 2901} {"train_loss": -6.576381683349609, "global_step": 121864, "epoch": 2901} {"train_loss": -6.4184417724609375, "global_step": 121865, "epoch": 2901} {"train_loss": -6.634846210479736, "global_step": 121866, "epoch": 2901} {"train_loss": -6.604631423950195, "global_step": 121867, "epoch": 2901} {"train_loss": -6.578766822814941, "global_step": 121868, "epoch": 2901} {"train_loss": -6.456207752227783, "global_step": 121869, "epoch": 2901} {"train_loss": -6.639303684234619, "global_step": 121870, "epoch": 2901} {"train_loss": -6.541290760040283, "global_step": 121871, "epoch": 2901} {"train_loss": -6.519606590270996, "global_step": 121872, "epoch": 2901} {"train_loss": -6.474298000335693, "global_step": 121873, "epoch": 2901} {"train_loss": -6.522465229034424, "global_step": 121874, "epoch": 2901} {"train_loss": -6.5284881591796875, "global_step": 121875, "epoch": 2901} {"train_loss": -6.538481712341309, "global_step": 121876, "epoch": 2901} {"train_loss": -6.496952533721924, "global_step": 121877, "epoch": 2901} {"train_loss": -6.582037925720215, "global_step": 121878, "epoch": 2901} {"train_loss": -6.616477966308594, "global_step": 121879, "epoch": 2901} {"train_loss": -6.447514057159424, "global_step": 121880, "epoch": 2901} {"train_loss": -6.611015796661377, "global_step": 121881, "epoch": 2901} {"train_loss": -6.5387163162231445, "global_step": 121882, "epoch": 2901} {"train_loss": -6.525149799528576, "global_step": 121883, "epoch": 2901, "val_loss": 68086.953125} {"train_loss": -6.544251918792725, "global_step": 121884, "epoch": 2902} {"train_loss": -6.64559268951416, "global_step": 121885, "epoch": 2902} {"train_loss": -6.574695587158203, "global_step": 121886, "epoch": 2902} {"train_loss": -6.637333869934082, "global_step": 121887, "epoch": 2902} {"train_loss": -6.449879169464111, "global_step": 121888, "epoch": 2902} {"train_loss": -6.45597505569458, "global_step": 121889, "epoch": 2902} {"train_loss": -6.613363742828369, "global_step": 121890, "epoch": 2902} {"train_loss": -6.6123127937316895, "global_step": 121891, "epoch": 2902} {"train_loss": -6.5958943367004395, "global_step": 121892, "epoch": 2902} {"train_loss": -6.482078552246094, "global_step": 121893, "epoch": 2902} {"train_loss": -6.675050258636475, "global_step": 121894, "epoch": 2902} {"train_loss": -6.496807098388672, "global_step": 121895, "epoch": 2902} {"train_loss": -6.472658157348633, "global_step": 121896, "epoch": 2902} {"train_loss": -6.54976224899292, "global_step": 121897, "epoch": 2902} {"train_loss": -6.616774559020996, "global_step": 121898, "epoch": 2902} {"train_loss": -6.579312324523926, "global_step": 121899, "epoch": 2902} {"train_loss": -6.57623291015625, "global_step": 121900, "epoch": 2902} {"train_loss": -6.5966267585754395, "global_step": 121901, "epoch": 2902} {"train_loss": -6.565220355987549, "global_step": 121902, "epoch": 2902} {"train_loss": -6.57198429107666, "global_step": 121903, "epoch": 2902} {"train_loss": -6.534474849700928, "global_step": 121904, "epoch": 2902} {"train_loss": -6.604169845581055, "global_step": 121905, "epoch": 2902} {"train_loss": -6.605674743652344, "global_step": 121906, "epoch": 2902} {"train_loss": -6.488336563110352, "global_step": 121907, "epoch": 2902} {"train_loss": -6.5674943923950195, "global_step": 121908, "epoch": 2902} {"train_loss": -6.670146942138672, "global_step": 121909, "epoch": 2902} {"train_loss": -6.680110454559326, "global_step": 121910, "epoch": 2902} {"train_loss": -6.631962776184082, "global_step": 121911, "epoch": 2902} {"train_loss": -6.644637584686279, "global_step": 121912, "epoch": 2902} {"train_loss": -6.5283002853393555, "global_step": 121913, "epoch": 2902} {"train_loss": -6.5469465255737305, "global_step": 121914, "epoch": 2902} {"train_loss": -6.551934242248535, "global_step": 121915, "epoch": 2902} {"train_loss": -6.507782459259033, "global_step": 121916, "epoch": 2902} {"train_loss": -6.564767360687256, "global_step": 121917, "epoch": 2902} {"train_loss": -6.603181838989258, "global_step": 121918, "epoch": 2902} {"train_loss": -6.594103813171387, "global_step": 121919, "epoch": 2902} {"train_loss": -6.5766401290893555, "global_step": 121920, "epoch": 2902} {"train_loss": -6.499300003051758, "global_step": 121921, "epoch": 2902} {"train_loss": -6.5385589599609375, "global_step": 121922, "epoch": 2902} {"train_loss": -6.545133590698242, "global_step": 121923, "epoch": 2902} {"train_loss": -6.637442588806152, "global_step": 121924, "epoch": 2902} {"train_loss": -6.568943069094703, "global_step": 121925, "epoch": 2902, "val_loss": 68061.1953125} {"train_loss": -6.613925457000732, "global_step": 121926, "epoch": 2903} {"train_loss": -6.688457489013672, "global_step": 121927, "epoch": 2903} {"train_loss": -6.62186861038208, "global_step": 121928, "epoch": 2903} {"train_loss": -6.521023750305176, "global_step": 121929, "epoch": 2903} {"train_loss": -6.547345161437988, "global_step": 121930, "epoch": 2903} {"train_loss": -6.627226829528809, "global_step": 121931, "epoch": 2903} {"train_loss": -6.513167381286621, "global_step": 121932, "epoch": 2903} {"train_loss": -6.5230560302734375, "global_step": 121933, "epoch": 2903} {"train_loss": -6.547436714172363, "global_step": 121934, "epoch": 2903} {"train_loss": -6.542649745941162, "global_step": 121935, "epoch": 2903} {"train_loss": -6.5581841468811035, "global_step": 121936, "epoch": 2903} {"train_loss": -6.652889728546143, "global_step": 121937, "epoch": 2903} {"train_loss": -6.501708984375, "global_step": 121938, "epoch": 2903} {"train_loss": -6.446982383728027, "global_step": 121939, "epoch": 2903} {"train_loss": -6.565828800201416, "global_step": 121940, "epoch": 2903} {"train_loss": -6.541321754455566, "global_step": 121941, "epoch": 2903} {"train_loss": -6.4664225578308105, "global_step": 121942, "epoch": 2903} {"train_loss": -6.567676544189453, "global_step": 121943, "epoch": 2903} {"train_loss": -6.6211700439453125, "global_step": 121944, "epoch": 2903} {"train_loss": -6.718113899230957, "global_step": 121945, "epoch": 2903} {"train_loss": -6.519527912139893, "global_step": 121946, "epoch": 2903} {"train_loss": -6.56048583984375, "global_step": 121947, "epoch": 2903} {"train_loss": -6.531559944152832, "global_step": 121948, "epoch": 2903} {"train_loss": -6.585788726806641, "global_step": 121949, "epoch": 2903} {"train_loss": -6.446526527404785, "global_step": 121950, "epoch": 2903} {"train_loss": -6.623818397521973, "global_step": 121951, "epoch": 2903} {"train_loss": -6.542435169219971, "global_step": 121952, "epoch": 2903} {"train_loss": -6.5023932456970215, "global_step": 121953, "epoch": 2903} {"train_loss": -6.536891937255859, "global_step": 121954, "epoch": 2903} {"train_loss": -6.753100395202637, "global_step": 121955, "epoch": 2903} {"train_loss": -6.5912017822265625, "global_step": 121956, "epoch": 2903} {"train_loss": -6.555047035217285, "global_step": 121957, "epoch": 2903} {"train_loss": -6.682265281677246, "global_step": 121958, "epoch": 2903} {"train_loss": -6.592784881591797, "global_step": 121959, "epoch": 2903} {"train_loss": -6.664554595947266, "global_step": 121960, "epoch": 2903} {"train_loss": -6.6320905685424805, "global_step": 121961, "epoch": 2903} {"train_loss": -6.666555881500244, "global_step": 121962, "epoch": 2903} {"train_loss": -6.618680000305176, "global_step": 121963, "epoch": 2903} {"train_loss": -6.648655891418457, "global_step": 121964, "epoch": 2903} {"train_loss": -6.561807632446289, "global_step": 121965, "epoch": 2903} {"train_loss": -6.621408462524414, "global_step": 121966, "epoch": 2903} {"train_loss": -6.58185194787525, "global_step": 121967, "epoch": 2903, "val_loss": 67859.6171875} {"train_loss": -6.708087921142578, "global_step": 121968, "epoch": 2904} {"train_loss": -6.537468433380127, "global_step": 121969, "epoch": 2904} {"train_loss": -6.567353248596191, "global_step": 121970, "epoch": 2904} {"train_loss": -6.6716132164001465, "global_step": 121971, "epoch": 2904} {"train_loss": -6.509983062744141, "global_step": 121972, "epoch": 2904} {"train_loss": -6.368244171142578, "global_step": 121973, "epoch": 2904} {"train_loss": -6.507165908813477, "global_step": 121974, "epoch": 2904} {"train_loss": -6.4925432205200195, "global_step": 121975, "epoch": 2904} {"train_loss": -6.506498336791992, "global_step": 121976, "epoch": 2904} {"train_loss": -6.65210485458374, "global_step": 121977, "epoch": 2904} {"train_loss": -6.519939422607422, "global_step": 121978, "epoch": 2904} {"train_loss": -6.530726432800293, "global_step": 121979, "epoch": 2904} {"train_loss": -6.590085029602051, "global_step": 121980, "epoch": 2904} {"train_loss": -6.3605570793151855, "global_step": 121981, "epoch": 2904} {"train_loss": -6.552890777587891, "global_step": 121982, "epoch": 2904} {"train_loss": -6.548802375793457, "global_step": 121983, "epoch": 2904} {"train_loss": -6.596856117248535, "global_step": 121984, "epoch": 2904} {"train_loss": -6.6486101150512695, "global_step": 121985, "epoch": 2904} {"train_loss": -6.6511454582214355, "global_step": 121986, "epoch": 2904} {"train_loss": -6.530761241912842, "global_step": 121987, "epoch": 2904} {"train_loss": -6.561105251312256, "global_step": 121988, "epoch": 2904} {"train_loss": -6.484124183654785, "global_step": 121989, "epoch": 2904} {"train_loss": -6.628121376037598, "global_step": 121990, "epoch": 2904} {"train_loss": -6.582218170166016, "global_step": 121991, "epoch": 2904} {"train_loss": -6.524520397186279, "global_step": 121992, "epoch": 2904} {"train_loss": -6.548801422119141, "global_step": 121993, "epoch": 2904} {"train_loss": -6.39961051940918, "global_step": 121994, "epoch": 2904} {"train_loss": -6.508366107940674, "global_step": 121995, "epoch": 2904} {"train_loss": -6.450342178344727, "global_step": 121996, "epoch": 2904} {"train_loss": -6.399673938751221, "global_step": 121997, "epoch": 2904} {"train_loss": -6.463814735412598, "global_step": 121998, "epoch": 2904} {"train_loss": -6.355836868286133, "global_step": 121999, "epoch": 2904} {"train_loss": -6.28881311416626, "global_step": 122000, "epoch": 2904} {"train_loss": -6.436126708984375, "global_step": 122001, "epoch": 2904} {"train_loss": -6.497066974639893, "global_step": 122002, "epoch": 2904} {"train_loss": -6.416257858276367, "global_step": 122003, "epoch": 2904} {"train_loss": -6.612947940826416, "global_step": 122004, "epoch": 2904} {"train_loss": -6.381708145141602, "global_step": 122005, "epoch": 2904} {"train_loss": -6.494637966156006, "global_step": 122006, "epoch": 2904} {"train_loss": -6.491244316101074, "global_step": 122007, "epoch": 2904} {"train_loss": -6.5395002365112305, "global_step": 122008, "epoch": 2904} {"train_loss": -6.512378681273687, "global_step": 122009, "epoch": 2904, "val_loss": 67925.3125} {"train_loss": -6.5092291831970215, "global_step": 122010, "epoch": 2905} {"train_loss": -6.494659900665283, "global_step": 122011, "epoch": 2905} {"train_loss": -6.530265808105469, "global_step": 122012, "epoch": 2905} {"train_loss": -6.590960502624512, "global_step": 122013, "epoch": 2905} {"train_loss": -6.436642646789551, "global_step": 122014, "epoch": 2905} {"train_loss": -6.526393890380859, "global_step": 122015, "epoch": 2905} {"train_loss": -6.550867557525635, "global_step": 122016, "epoch": 2905} {"train_loss": -6.580845355987549, "global_step": 122017, "epoch": 2905} {"train_loss": -6.56346321105957, "global_step": 122018, "epoch": 2905} {"train_loss": -6.502309799194336, "global_step": 122019, "epoch": 2905} {"train_loss": -6.5240325927734375, "global_step": 122020, "epoch": 2905} {"train_loss": -6.618257522583008, "global_step": 122021, "epoch": 2905} {"train_loss": -6.551224708557129, "global_step": 122022, "epoch": 2905} {"train_loss": -6.634820461273193, "global_step": 122023, "epoch": 2905} {"train_loss": -6.5117716789245605, "global_step": 122024, "epoch": 2905} {"train_loss": -6.531270503997803, "global_step": 122025, "epoch": 2905} {"train_loss": -6.5570068359375, "global_step": 122026, "epoch": 2905} {"train_loss": -6.667086601257324, "global_step": 122027, "epoch": 2905} {"train_loss": -6.493937969207764, "global_step": 122028, "epoch": 2905} {"train_loss": -6.539600372314453, "global_step": 122029, "epoch": 2905} {"train_loss": -6.546060562133789, "global_step": 122030, "epoch": 2905} {"train_loss": -6.525937080383301, "global_step": 122031, "epoch": 2905} {"train_loss": -6.542038917541504, "global_step": 122032, "epoch": 2905} {"train_loss": -6.422165870666504, "global_step": 122033, "epoch": 2905} {"train_loss": -6.503574848175049, "global_step": 122034, "epoch": 2905} {"train_loss": -6.5329132080078125, "global_step": 122035, "epoch": 2905} {"train_loss": -6.590944766998291, "global_step": 122036, "epoch": 2905} {"train_loss": -6.478402137756348, "global_step": 122037, "epoch": 2905} {"train_loss": -6.482611656188965, "global_step": 122038, "epoch": 2905} {"train_loss": -6.489893913269043, "global_step": 122039, "epoch": 2905} {"train_loss": -6.530913352966309, "global_step": 122040, "epoch": 2905} {"train_loss": -6.550874710083008, "global_step": 122041, "epoch": 2905} {"train_loss": -6.545132637023926, "global_step": 122042, "epoch": 2905} {"train_loss": -6.566954612731934, "global_step": 122043, "epoch": 2905} {"train_loss": -6.595961570739746, "global_step": 122044, "epoch": 2905} {"train_loss": -6.529565811157227, "global_step": 122045, "epoch": 2905} {"train_loss": -6.499388694763184, "global_step": 122046, "epoch": 2905} {"train_loss": -6.6205244064331055, "global_step": 122047, "epoch": 2905} {"train_loss": -6.54940128326416, "global_step": 122048, "epoch": 2905} {"train_loss": -6.533856391906738, "global_step": 122049, "epoch": 2905} {"train_loss": -6.442751407623291, "global_step": 122050, "epoch": 2905} {"train_loss": -6.536925054731823, "global_step": 122051, "epoch": 2905, "val_loss": 68122.9609375} {"train_loss": -6.579193115234375, "global_step": 122052, "epoch": 2906} {"train_loss": -6.485893249511719, "global_step": 122053, "epoch": 2906} {"train_loss": -6.569319248199463, "global_step": 122054, "epoch": 2906} {"train_loss": -6.4694929122924805, "global_step": 122055, "epoch": 2906} {"train_loss": -6.572566986083984, "global_step": 122056, "epoch": 2906} {"train_loss": -6.516494274139404, "global_step": 122057, "epoch": 2906} {"train_loss": -6.520078182220459, "global_step": 122058, "epoch": 2906} {"train_loss": -6.540294647216797, "global_step": 122059, "epoch": 2906} {"train_loss": -6.673295497894287, "global_step": 122060, "epoch": 2906} {"train_loss": -6.584246635437012, "global_step": 122061, "epoch": 2906} {"train_loss": -6.444087028503418, "global_step": 122062, "epoch": 2906} {"train_loss": -6.495108604431152, "global_step": 122063, "epoch": 2906} {"train_loss": -6.596172332763672, "global_step": 122064, "epoch": 2906} {"train_loss": -6.592951774597168, "global_step": 122065, "epoch": 2906} {"train_loss": -6.561983108520508, "global_step": 122066, "epoch": 2906} {"train_loss": -6.588810920715332, "global_step": 122067, "epoch": 2906} {"train_loss": -6.479283809661865, "global_step": 122068, "epoch": 2906} {"train_loss": -6.578953742980957, "global_step": 122069, "epoch": 2906} {"train_loss": -6.6916608810424805, "global_step": 122070, "epoch": 2906} {"train_loss": -6.602984428405762, "global_step": 122071, "epoch": 2906} {"train_loss": -6.542645454406738, "global_step": 122072, "epoch": 2906} {"train_loss": -6.621767997741699, "global_step": 122073, "epoch": 2906} {"train_loss": -6.618997573852539, "global_step": 122074, "epoch": 2906} {"train_loss": -6.521246433258057, "global_step": 122075, "epoch": 2906} {"train_loss": -6.51054573059082, "global_step": 122076, "epoch": 2906} {"train_loss": -6.60892915725708, "global_step": 122077, "epoch": 2906} {"train_loss": -6.620689392089844, "global_step": 122078, "epoch": 2906} {"train_loss": -6.637089729309082, "global_step": 122079, "epoch": 2906} {"train_loss": -6.579845428466797, "global_step": 122080, "epoch": 2906} {"train_loss": -6.551501274108887, "global_step": 122081, "epoch": 2906} {"train_loss": -6.568617820739746, "global_step": 122082, "epoch": 2906} {"train_loss": -6.439220428466797, "global_step": 122083, "epoch": 2906} {"train_loss": -6.582806587219238, "global_step": 122084, "epoch": 2906} {"train_loss": -6.499976634979248, "global_step": 122085, "epoch": 2906} {"train_loss": -6.424551486968994, "global_step": 122086, "epoch": 2906} {"train_loss": -6.68375301361084, "global_step": 122087, "epoch": 2906} {"train_loss": -6.494661331176758, "global_step": 122088, "epoch": 2906} {"train_loss": -6.5170769691467285, "global_step": 122089, "epoch": 2906} {"train_loss": -6.511716842651367, "global_step": 122090, "epoch": 2906} {"train_loss": -6.636646270751953, "global_step": 122091, "epoch": 2906} {"train_loss": -6.512929916381836, "global_step": 122092, "epoch": 2906} {"train_loss": -6.55507154691787, "global_step": 122093, "epoch": 2906, "val_loss": 68072.875} {"train_loss": -6.502022743225098, "global_step": 122094, "epoch": 2907} {"train_loss": -6.574352264404297, "global_step": 122095, "epoch": 2907} {"train_loss": -6.518116474151611, "global_step": 122096, "epoch": 2907} {"train_loss": -6.607739448547363, "global_step": 122097, "epoch": 2907} {"train_loss": -6.466133117675781, "global_step": 122098, "epoch": 2907} {"train_loss": -6.652506351470947, "global_step": 122099, "epoch": 2907} {"train_loss": -6.634221076965332, "global_step": 122100, "epoch": 2907} {"train_loss": -6.576456069946289, "global_step": 122101, "epoch": 2907} {"train_loss": -6.574199199676514, "global_step": 122102, "epoch": 2907} {"train_loss": -6.673844814300537, "global_step": 122103, "epoch": 2907} {"train_loss": -6.463544845581055, "global_step": 122104, "epoch": 2907} {"train_loss": -6.446993827819824, "global_step": 122105, "epoch": 2907} {"train_loss": -6.4214277267456055, "global_step": 122106, "epoch": 2907} {"train_loss": -6.455165863037109, "global_step": 122107, "epoch": 2907} {"train_loss": -6.539759635925293, "global_step": 122108, "epoch": 2907} {"train_loss": -6.521299362182617, "global_step": 122109, "epoch": 2907} {"train_loss": -6.502126693725586, "global_step": 122110, "epoch": 2907} {"train_loss": -6.634042739868164, "global_step": 122111, "epoch": 2907} {"train_loss": -6.4956440925598145, "global_step": 122112, "epoch": 2907} {"train_loss": -6.459567070007324, "global_step": 122113, "epoch": 2907} {"train_loss": -6.587610244750977, "global_step": 122114, "epoch": 2907} {"train_loss": -6.453422546386719, "global_step": 122115, "epoch": 2907} {"train_loss": -6.679069519042969, "global_step": 122116, "epoch": 2907} {"train_loss": -6.542351722717285, "global_step": 122117, "epoch": 2907} {"train_loss": -6.510832786560059, "global_step": 122118, "epoch": 2907} {"train_loss": -6.547285556793213, "global_step": 122119, "epoch": 2907} {"train_loss": -6.436026573181152, "global_step": 122120, "epoch": 2907} {"train_loss": -6.515002250671387, "global_step": 122121, "epoch": 2907} {"train_loss": -6.529362201690674, "global_step": 122122, "epoch": 2907} {"train_loss": -6.461026191711426, "global_step": 122123, "epoch": 2907} {"train_loss": -6.57402229309082, "global_step": 122124, "epoch": 2907} {"train_loss": -6.477202415466309, "global_step": 122125, "epoch": 2907} {"train_loss": -6.562751293182373, "global_step": 122126, "epoch": 2907} {"train_loss": -6.612125396728516, "global_step": 122127, "epoch": 2907} {"train_loss": -6.614853858947754, "global_step": 122128, "epoch": 2907} {"train_loss": -6.523702621459961, "global_step": 122129, "epoch": 2907} {"train_loss": -6.442953109741211, "global_step": 122130, "epoch": 2907} {"train_loss": -6.491034030914307, "global_step": 122131, "epoch": 2907} {"train_loss": -6.5242133140563965, "global_step": 122132, "epoch": 2907} {"train_loss": -6.5150861740112305, "global_step": 122133, "epoch": 2907} {"train_loss": -6.5486650466918945, "global_step": 122134, "epoch": 2907} {"train_loss": -6.533789078394572, "global_step": 122135, "epoch": 2907, "val_loss": 67809.9375} {"train_loss": -6.590278148651123, "global_step": 122136, "epoch": 2908} {"train_loss": -6.581748962402344, "global_step": 122137, "epoch": 2908} {"train_loss": -6.484235763549805, "global_step": 122138, "epoch": 2908} {"train_loss": -6.634489059448242, "global_step": 122139, "epoch": 2908} {"train_loss": -6.650688171386719, "global_step": 122140, "epoch": 2908} {"train_loss": -6.603375434875488, "global_step": 122141, "epoch": 2908} {"train_loss": -6.573864936828613, "global_step": 122142, "epoch": 2908} {"train_loss": -6.580600738525391, "global_step": 122143, "epoch": 2908} {"train_loss": -6.560140132904053, "global_step": 122144, "epoch": 2908} {"train_loss": -6.533666610717773, "global_step": 122145, "epoch": 2908} {"train_loss": -6.515401363372803, "global_step": 122146, "epoch": 2908} {"train_loss": -6.472820281982422, "global_step": 122147, "epoch": 2908} {"train_loss": -6.569417953491211, "global_step": 122148, "epoch": 2908} {"train_loss": -6.610084533691406, "global_step": 122149, "epoch": 2908} {"train_loss": -6.595647811889648, "global_step": 122150, "epoch": 2908} {"train_loss": -6.4870524406433105, "global_step": 122151, "epoch": 2908} {"train_loss": -6.589563369750977, "global_step": 122152, "epoch": 2908} {"train_loss": -6.622407913208008, "global_step": 122153, "epoch": 2908} {"train_loss": -6.615389823913574, "global_step": 122154, "epoch": 2908} {"train_loss": -6.69849967956543, "global_step": 122155, "epoch": 2908} {"train_loss": -6.535726547241211, "global_step": 122156, "epoch": 2908} {"train_loss": -6.638298034667969, "global_step": 122157, "epoch": 2908} {"train_loss": -6.575055122375488, "global_step": 122158, "epoch": 2908} {"train_loss": -6.476305961608887, "global_step": 122159, "epoch": 2908} {"train_loss": -6.627678871154785, "global_step": 122160, "epoch": 2908} {"train_loss": -6.599609851837158, "global_step": 122161, "epoch": 2908} {"train_loss": -6.564034461975098, "global_step": 122162, "epoch": 2908} {"train_loss": -6.508965492248535, "global_step": 122163, "epoch": 2908} {"train_loss": -6.529983997344971, "global_step": 122164, "epoch": 2908} {"train_loss": -6.649395942687988, "global_step": 122165, "epoch": 2908} {"train_loss": -6.608826160430908, "global_step": 122166, "epoch": 2908} {"train_loss": -6.581093788146973, "global_step": 122167, "epoch": 2908} {"train_loss": -6.479343414306641, "global_step": 122168, "epoch": 2908} {"train_loss": -6.578084945678711, "global_step": 122169, "epoch": 2908} {"train_loss": -6.605762481689453, "global_step": 122170, "epoch": 2908} {"train_loss": -6.557662487030029, "global_step": 122171, "epoch": 2908} {"train_loss": -6.657270431518555, "global_step": 122172, "epoch": 2908} {"train_loss": -6.540966987609863, "global_step": 122173, "epoch": 2908} {"train_loss": -6.504196643829346, "global_step": 122174, "epoch": 2908} {"train_loss": -6.486836910247803, "global_step": 122175, "epoch": 2908} {"train_loss": -6.37286376953125, "global_step": 122176, "epoch": 2908} {"train_loss": -6.568562360036941, "global_step": 122177, "epoch": 2908, "val_loss": 67956.7265625} {"train_loss": -6.49097204208374, "global_step": 122178, "epoch": 2909} {"train_loss": -6.417000770568848, "global_step": 122179, "epoch": 2909} {"train_loss": -6.716001033782959, "global_step": 122180, "epoch": 2909} {"train_loss": -6.535881996154785, "global_step": 122181, "epoch": 2909} {"train_loss": -6.542741775512695, "global_step": 122182, "epoch": 2909} {"train_loss": -6.59281587600708, "global_step": 122183, "epoch": 2909} {"train_loss": -6.607799530029297, "global_step": 122184, "epoch": 2909} {"train_loss": -6.685628414154053, "global_step": 122185, "epoch": 2909} {"train_loss": -6.399510860443115, "global_step": 122186, "epoch": 2909} {"train_loss": -6.625672817230225, "global_step": 122187, "epoch": 2909} {"train_loss": -6.564399719238281, "global_step": 122188, "epoch": 2909} {"train_loss": -6.663269996643066, "global_step": 122189, "epoch": 2909} {"train_loss": -6.643036842346191, "global_step": 122190, "epoch": 2909} {"train_loss": -6.519323348999023, "global_step": 122191, "epoch": 2909} {"train_loss": -6.747858047485352, "global_step": 122192, "epoch": 2909} {"train_loss": -6.50802755355835, "global_step": 122193, "epoch": 2909} {"train_loss": -6.677385330200195, "global_step": 122194, "epoch": 2909} {"train_loss": -6.548130989074707, "global_step": 122195, "epoch": 2909} {"train_loss": -6.635010719299316, "global_step": 122196, "epoch": 2909} {"train_loss": -6.471312522888184, "global_step": 122197, "epoch": 2909} {"train_loss": -6.409030437469482, "global_step": 122198, "epoch": 2909} {"train_loss": -6.658817768096924, "global_step": 122199, "epoch": 2909} {"train_loss": -6.5344390869140625, "global_step": 122200, "epoch": 2909} {"train_loss": -6.660818099975586, "global_step": 122201, "epoch": 2909} {"train_loss": -6.631806373596191, "global_step": 122202, "epoch": 2909} {"train_loss": -6.519954681396484, "global_step": 122203, "epoch": 2909} {"train_loss": -6.703839302062988, "global_step": 122204, "epoch": 2909} {"train_loss": -6.593139171600342, "global_step": 122205, "epoch": 2909} {"train_loss": -6.647850036621094, "global_step": 122206, "epoch": 2909} {"train_loss": -6.595319747924805, "global_step": 122207, "epoch": 2909} {"train_loss": -6.642583847045898, "global_step": 122208, "epoch": 2909} {"train_loss": -6.505632400512695, "global_step": 122209, "epoch": 2909} {"train_loss": -6.583345413208008, "global_step": 122210, "epoch": 2909} {"train_loss": -6.5726728439331055, "global_step": 122211, "epoch": 2909} {"train_loss": -6.619119644165039, "global_step": 122212, "epoch": 2909} {"train_loss": -6.643885612487793, "global_step": 122213, "epoch": 2909} {"train_loss": -6.564388751983643, "global_step": 122214, "epoch": 2909} {"train_loss": -6.595526695251465, "global_step": 122215, "epoch": 2909} {"train_loss": -6.548887252807617, "global_step": 122216, "epoch": 2909} {"train_loss": -6.594114303588867, "global_step": 122217, "epoch": 2909} {"train_loss": -6.584114074707031, "global_step": 122218, "epoch": 2909} {"train_loss": -6.586032492773874, "global_step": 122219, "epoch": 2909, "val_loss": 67989.0390625} {"train_loss": -6.535226821899414, "global_step": 122220, "epoch": 2910} {"train_loss": -6.393657207489014, "global_step": 122221, "epoch": 2910} {"train_loss": -6.607658386230469, "global_step": 122222, "epoch": 2910} {"train_loss": -6.556907653808594, "global_step": 122223, "epoch": 2910} {"train_loss": -6.398682594299316, "global_step": 122224, "epoch": 2910} {"train_loss": -6.510235786437988, "global_step": 122225, "epoch": 2910} {"train_loss": -6.507460594177246, "global_step": 122226, "epoch": 2910} {"train_loss": -6.535318851470947, "global_step": 122227, "epoch": 2910} {"train_loss": -6.496435642242432, "global_step": 122228, "epoch": 2910} {"train_loss": -6.433712959289551, "global_step": 122229, "epoch": 2910} {"train_loss": -6.570535659790039, "global_step": 122230, "epoch": 2910} {"train_loss": -6.649061679840088, "global_step": 122231, "epoch": 2910} {"train_loss": -6.503493309020996, "global_step": 122232, "epoch": 2910} {"train_loss": -6.589980125427246, "global_step": 122233, "epoch": 2910} {"train_loss": -6.5976457595825195, "global_step": 122234, "epoch": 2910} {"train_loss": -6.542737007141113, "global_step": 122235, "epoch": 2910} {"train_loss": -6.540074825286865, "global_step": 122236, "epoch": 2910} {"train_loss": -6.536370754241943, "global_step": 122237, "epoch": 2910} {"train_loss": -6.539026260375977, "global_step": 122238, "epoch": 2910} {"train_loss": -6.5489325523376465, "global_step": 122239, "epoch": 2910} {"train_loss": -6.578651428222656, "global_step": 122240, "epoch": 2910} {"train_loss": -6.487591743469238, "global_step": 122241, "epoch": 2910} {"train_loss": -6.573767185211182, "global_step": 122242, "epoch": 2910} {"train_loss": -6.526033401489258, "global_step": 122243, "epoch": 2910} {"train_loss": -6.507083892822266, "global_step": 122244, "epoch": 2910} {"train_loss": -6.581656455993652, "global_step": 122245, "epoch": 2910} {"train_loss": -6.522583961486816, "global_step": 122246, "epoch": 2910} {"train_loss": -6.625181198120117, "global_step": 122247, "epoch": 2910} {"train_loss": -6.593740463256836, "global_step": 122248, "epoch": 2910} {"train_loss": -6.535022735595703, "global_step": 122249, "epoch": 2910} {"train_loss": -6.529555320739746, "global_step": 122250, "epoch": 2910} {"train_loss": -6.626931190490723, "global_step": 122251, "epoch": 2910} {"train_loss": -6.448453903198242, "global_step": 122252, "epoch": 2910} {"train_loss": -6.596375465393066, "global_step": 122253, "epoch": 2910} {"train_loss": -6.559481143951416, "global_step": 122254, "epoch": 2910} {"train_loss": -6.535759925842285, "global_step": 122255, "epoch": 2910} {"train_loss": -6.5955810546875, "global_step": 122256, "epoch": 2910} {"train_loss": -6.6501054763793945, "global_step": 122257, "epoch": 2910} {"train_loss": -6.520853042602539, "global_step": 122258, "epoch": 2910} {"train_loss": -6.541033744812012, "global_step": 122259, "epoch": 2910} {"train_loss": -6.5431227684021, "global_step": 122260, "epoch": 2910} {"train_loss": -6.5417906783875965, "global_step": 122261, "epoch": 2910, "val_loss": 68005.328125} {"train_loss": -6.605521202087402, "global_step": 122262, "epoch": 2911} {"train_loss": -6.463726043701172, "global_step": 122263, "epoch": 2911} {"train_loss": -6.51726770401001, "global_step": 122264, "epoch": 2911} {"train_loss": -6.6698431968688965, "global_step": 122265, "epoch": 2911} {"train_loss": -6.4483489990234375, "global_step": 122266, "epoch": 2911} {"train_loss": -6.562807083129883, "global_step": 122267, "epoch": 2911} {"train_loss": -6.5282368659973145, "global_step": 122268, "epoch": 2911} {"train_loss": -6.501697540283203, "global_step": 122269, "epoch": 2911} {"train_loss": -6.43735408782959, "global_step": 122270, "epoch": 2911} {"train_loss": -6.450713634490967, "global_step": 122271, "epoch": 2911} {"train_loss": -6.649408340454102, "global_step": 122272, "epoch": 2911} {"train_loss": -6.505954742431641, "global_step": 122273, "epoch": 2911} {"train_loss": -6.447525501251221, "global_step": 122274, "epoch": 2911} {"train_loss": -6.598825454711914, "global_step": 122275, "epoch": 2911} {"train_loss": -6.728268623352051, "global_step": 122276, "epoch": 2911} {"train_loss": -6.434199810028076, "global_step": 122277, "epoch": 2911} {"train_loss": -6.355584144592285, "global_step": 122278, "epoch": 2911} {"train_loss": -6.4989423751831055, "global_step": 122279, "epoch": 2911} {"train_loss": -6.421389579772949, "global_step": 122280, "epoch": 2911} {"train_loss": -6.422842979431152, "global_step": 122281, "epoch": 2911} {"train_loss": -6.529767990112305, "global_step": 122282, "epoch": 2911} {"train_loss": -6.617382049560547, "global_step": 122283, "epoch": 2911} {"train_loss": -6.502039432525635, "global_step": 122284, "epoch": 2911} {"train_loss": -6.515695095062256, "global_step": 122285, "epoch": 2911} {"train_loss": -6.560927391052246, "global_step": 122286, "epoch": 2911} {"train_loss": -6.536439895629883, "global_step": 122287, "epoch": 2911} {"train_loss": -6.514590263366699, "global_step": 122288, "epoch": 2911} {"train_loss": -6.565890312194824, "global_step": 122289, "epoch": 2911} {"train_loss": -6.460564613342285, "global_step": 122290, "epoch": 2911} {"train_loss": -6.542215347290039, "global_step": 122291, "epoch": 2911} {"train_loss": -6.578503131866455, "global_step": 122292, "epoch": 2911} {"train_loss": -6.555853843688965, "global_step": 122293, "epoch": 2911} {"train_loss": -6.436711311340332, "global_step": 122294, "epoch": 2911} {"train_loss": -6.538937568664551, "global_step": 122295, "epoch": 2911} {"train_loss": -6.468588352203369, "global_step": 122296, "epoch": 2911} {"train_loss": -6.568044662475586, "global_step": 122297, "epoch": 2911} {"train_loss": -6.601243019104004, "global_step": 122298, "epoch": 2911} {"train_loss": -6.452911376953125, "global_step": 122299, "epoch": 2911} {"train_loss": -6.424797058105469, "global_step": 122300, "epoch": 2911} {"train_loss": -6.449967384338379, "global_step": 122301, "epoch": 2911} {"train_loss": -6.517465591430664, "global_step": 122302, "epoch": 2911} {"train_loss": -6.517251877557664, "global_step": 122303, "epoch": 2911, "val_loss": 68061.671875} {"train_loss": -6.471800327301025, "global_step": 122304, "epoch": 2912} {"train_loss": -6.441897392272949, "global_step": 122305, "epoch": 2912} {"train_loss": -6.610601902008057, "global_step": 122306, "epoch": 2912} {"train_loss": -6.490914821624756, "global_step": 122307, "epoch": 2912} {"train_loss": -6.473657608032227, "global_step": 122308, "epoch": 2912} {"train_loss": -6.607711315155029, "global_step": 122309, "epoch": 2912} {"train_loss": -6.444073677062988, "global_step": 122310, "epoch": 2912} {"train_loss": -6.512972354888916, "global_step": 122311, "epoch": 2912} {"train_loss": -6.691956520080566, "global_step": 122312, "epoch": 2912} {"train_loss": -6.445059776306152, "global_step": 122313, "epoch": 2912} {"train_loss": -6.541293144226074, "global_step": 122314, "epoch": 2912} {"train_loss": -6.578853607177734, "global_step": 122315, "epoch": 2912} {"train_loss": -6.576257705688477, "global_step": 122316, "epoch": 2912} {"train_loss": -6.531905174255371, "global_step": 122317, "epoch": 2912} {"train_loss": -6.640896797180176, "global_step": 122318, "epoch": 2912} {"train_loss": -6.565847396850586, "global_step": 122319, "epoch": 2912} {"train_loss": -6.518520355224609, "global_step": 122320, "epoch": 2912} {"train_loss": -6.535899639129639, "global_step": 122321, "epoch": 2912} {"train_loss": -6.5552825927734375, "global_step": 122322, "epoch": 2912} {"train_loss": -6.6227288246154785, "global_step": 122323, "epoch": 2912} {"train_loss": -6.585753440856934, "global_step": 122324, "epoch": 2912} {"train_loss": -6.626528263092041, "global_step": 122325, "epoch": 2912} {"train_loss": -6.3734564781188965, "global_step": 122326, "epoch": 2912} {"train_loss": -6.603975296020508, "global_step": 122327, "epoch": 2912} {"train_loss": -6.633793830871582, "global_step": 122328, "epoch": 2912} {"train_loss": -6.594442367553711, "global_step": 122329, "epoch": 2912} {"train_loss": -6.554150104522705, "global_step": 122330, "epoch": 2912} {"train_loss": -6.624451637268066, "global_step": 122331, "epoch": 2912} {"train_loss": -6.531597137451172, "global_step": 122332, "epoch": 2912} {"train_loss": -6.454390525817871, "global_step": 122333, "epoch": 2912} {"train_loss": -6.562679290771484, "global_step": 122334, "epoch": 2912} {"train_loss": -6.585786819458008, "global_step": 122335, "epoch": 2912} {"train_loss": -6.547014236450195, "global_step": 122336, "epoch": 2912} {"train_loss": -6.665355682373047, "global_step": 122337, "epoch": 2912} {"train_loss": -6.473288059234619, "global_step": 122338, "epoch": 2912} {"train_loss": -6.5360260009765625, "global_step": 122339, "epoch": 2912} {"train_loss": -6.627782821655273, "global_step": 122340, "epoch": 2912} {"train_loss": -6.584966659545898, "global_step": 122341, "epoch": 2912} {"train_loss": -6.63773250579834, "global_step": 122342, "epoch": 2912} {"train_loss": -6.581545829772949, "global_step": 122343, "epoch": 2912} {"train_loss": -6.525181770324707, "global_step": 122344, "epoch": 2912} {"train_loss": -6.555248725981939, "global_step": 122345, "epoch": 2912, "val_loss": 67982.4296875} {"train_loss": -6.5690155029296875, "global_step": 122346, "epoch": 2913} {"train_loss": -6.597947120666504, "global_step": 122347, "epoch": 2913} {"train_loss": -6.623372554779053, "global_step": 122348, "epoch": 2913} {"train_loss": -6.526177406311035, "global_step": 122349, "epoch": 2913} {"train_loss": -6.546758651733398, "global_step": 122350, "epoch": 2913} {"train_loss": -6.583866119384766, "global_step": 122351, "epoch": 2913} {"train_loss": -6.627777576446533, "global_step": 122352, "epoch": 2913} {"train_loss": -6.491274833679199, "global_step": 122353, "epoch": 2913} {"train_loss": -6.545485019683838, "global_step": 122354, "epoch": 2913} {"train_loss": -6.639507293701172, "global_step": 122355, "epoch": 2913} {"train_loss": -6.734889984130859, "global_step": 122356, "epoch": 2913} {"train_loss": -6.505873680114746, "global_step": 122357, "epoch": 2913} {"train_loss": -6.65733528137207, "global_step": 122358, "epoch": 2913} {"train_loss": -6.5764079093933105, "global_step": 122359, "epoch": 2913} {"train_loss": -6.498964309692383, "global_step": 122360, "epoch": 2913} {"train_loss": -6.548796653747559, "global_step": 122361, "epoch": 2913} {"train_loss": -6.5278730392456055, "global_step": 122362, "epoch": 2913} {"train_loss": -6.590599060058594, "global_step": 122363, "epoch": 2913} {"train_loss": -6.552259922027588, "global_step": 122364, "epoch": 2913} {"train_loss": -6.637448310852051, "global_step": 122365, "epoch": 2913} {"train_loss": -6.376189231872559, "global_step": 122366, "epoch": 2913} {"train_loss": -6.566546440124512, "global_step": 122367, "epoch": 2913} {"train_loss": -6.430418968200684, "global_step": 122368, "epoch": 2913} {"train_loss": -6.3924102783203125, "global_step": 122369, "epoch": 2913} {"train_loss": -6.515069007873535, "global_step": 122370, "epoch": 2913} {"train_loss": -6.370108604431152, "global_step": 122371, "epoch": 2913} {"train_loss": -6.541874408721924, "global_step": 122372, "epoch": 2913} {"train_loss": -6.388334274291992, "global_step": 122373, "epoch": 2913} {"train_loss": -6.416600227355957, "global_step": 122374, "epoch": 2913} {"train_loss": -6.478034973144531, "global_step": 122375, "epoch": 2913} {"train_loss": -6.597095966339111, "global_step": 122376, "epoch": 2913} {"train_loss": -6.366746425628662, "global_step": 122377, "epoch": 2913} {"train_loss": -6.442174911499023, "global_step": 122378, "epoch": 2913} {"train_loss": -6.590170383453369, "global_step": 122379, "epoch": 2913} {"train_loss": -6.510217189788818, "global_step": 122380, "epoch": 2913} {"train_loss": -6.542112827301025, "global_step": 122381, "epoch": 2913} {"train_loss": -6.464820861816406, "global_step": 122382, "epoch": 2913} {"train_loss": -6.507574558258057, "global_step": 122383, "epoch": 2913} {"train_loss": -6.446015357971191, "global_step": 122384, "epoch": 2913} {"train_loss": -6.507068634033203, "global_step": 122385, "epoch": 2913} {"train_loss": -6.463545322418213, "global_step": 122386, "epoch": 2913} {"train_loss": -6.523771410896664, "global_step": 122387, "epoch": 2913, "val_loss": 68291.3203125} {"train_loss": -6.503655433654785, "global_step": 122388, "epoch": 2914} {"train_loss": -6.468312740325928, "global_step": 122389, "epoch": 2914} {"train_loss": -6.497128009796143, "global_step": 122390, "epoch": 2914} {"train_loss": -6.528964042663574, "global_step": 122391, "epoch": 2914} {"train_loss": -6.530631065368652, "global_step": 122392, "epoch": 2914} {"train_loss": -6.407588958740234, "global_step": 122393, "epoch": 2914} {"train_loss": -6.574880599975586, "global_step": 122394, "epoch": 2914} {"train_loss": -6.444978713989258, "global_step": 122395, "epoch": 2914} {"train_loss": -6.487165927886963, "global_step": 122396, "epoch": 2914} {"train_loss": -6.49363374710083, "global_step": 122397, "epoch": 2914} {"train_loss": -6.442499160766602, "global_step": 122398, "epoch": 2914} {"train_loss": -6.318603515625, "global_step": 122399, "epoch": 2914} {"train_loss": -6.551746368408203, "global_step": 122400, "epoch": 2914} {"train_loss": -6.422689437866211, "global_step": 122401, "epoch": 2914} {"train_loss": -6.399276256561279, "global_step": 122402, "epoch": 2914} {"train_loss": -6.595711708068848, "global_step": 122403, "epoch": 2914} {"train_loss": -6.346795082092285, "global_step": 122404, "epoch": 2914} {"train_loss": -6.571963787078857, "global_step": 122405, "epoch": 2914} {"train_loss": -6.375160217285156, "global_step": 122406, "epoch": 2914} {"train_loss": -6.543069839477539, "global_step": 122407, "epoch": 2914} {"train_loss": -6.5233540534973145, "global_step": 122408, "epoch": 2914} {"train_loss": -6.431400775909424, "global_step": 122409, "epoch": 2914} {"train_loss": -6.503505706787109, "global_step": 122410, "epoch": 2914} {"train_loss": -6.503986835479736, "global_step": 122411, "epoch": 2914} {"train_loss": -6.492636680603027, "global_step": 122412, "epoch": 2914} {"train_loss": -6.466176986694336, "global_step": 122413, "epoch": 2914} {"train_loss": -6.640876770019531, "global_step": 122414, "epoch": 2914} {"train_loss": -6.511307716369629, "global_step": 122415, "epoch": 2914} {"train_loss": -6.497416019439697, "global_step": 122416, "epoch": 2914} {"train_loss": -6.60374641418457, "global_step": 122417, "epoch": 2914} {"train_loss": -6.605334281921387, "global_step": 122418, "epoch": 2914} {"train_loss": -6.675296783447266, "global_step": 122419, "epoch": 2914} {"train_loss": -6.612338066101074, "global_step": 122420, "epoch": 2914} {"train_loss": -6.656441688537598, "global_step": 122421, "epoch": 2914} {"train_loss": -6.557036399841309, "global_step": 122422, "epoch": 2914} {"train_loss": -6.423664093017578, "global_step": 122423, "epoch": 2914} {"train_loss": -6.62331485748291, "global_step": 122424, "epoch": 2914} {"train_loss": -6.587982177734375, "global_step": 122425, "epoch": 2914} {"train_loss": -6.561235427856445, "global_step": 122426, "epoch": 2914} {"train_loss": -6.542015552520752, "global_step": 122427, "epoch": 2914} {"train_loss": -6.556244850158691, "global_step": 122428, "epoch": 2914} {"train_loss": -6.5161001568748835, "global_step": 122429, "epoch": 2914, "val_loss": 67908.515625} {"train_loss": -6.5711846351623535, "global_step": 122430, "epoch": 2915} {"train_loss": -6.55360221862793, "global_step": 122431, "epoch": 2915} {"train_loss": -6.5438103675842285, "global_step": 122432, "epoch": 2915} {"train_loss": -6.50518798828125, "global_step": 122433, "epoch": 2915} {"train_loss": -6.482356548309326, "global_step": 122434, "epoch": 2915} {"train_loss": -6.588994979858398, "global_step": 122435, "epoch": 2915} {"train_loss": -6.682533264160156, "global_step": 122436, "epoch": 2915} {"train_loss": -6.531538009643555, "global_step": 122437, "epoch": 2915} {"train_loss": -6.568331718444824, "global_step": 122438, "epoch": 2915} {"train_loss": -6.665580749511719, "global_step": 122439, "epoch": 2915} {"train_loss": -6.693063259124756, "global_step": 122440, "epoch": 2915} {"train_loss": -6.585108280181885, "global_step": 122441, "epoch": 2915} {"train_loss": -6.5900468826293945, "global_step": 122442, "epoch": 2915} {"train_loss": -6.439302444458008, "global_step": 122443, "epoch": 2915} {"train_loss": -6.546429634094238, "global_step": 122444, "epoch": 2915} {"train_loss": -6.693863868713379, "global_step": 122445, "epoch": 2915} {"train_loss": -6.501568794250488, "global_step": 122446, "epoch": 2915} {"train_loss": -6.517313003540039, "global_step": 122447, "epoch": 2915} {"train_loss": -6.508368015289307, "global_step": 122448, "epoch": 2915} {"train_loss": -6.683154582977295, "global_step": 122449, "epoch": 2915} {"train_loss": -6.494474411010742, "global_step": 122450, "epoch": 2915} {"train_loss": -6.578469276428223, "global_step": 122451, "epoch": 2915} {"train_loss": -6.490155220031738, "global_step": 122452, "epoch": 2915} {"train_loss": -6.513604640960693, "global_step": 122453, "epoch": 2915} {"train_loss": -6.580962657928467, "global_step": 122454, "epoch": 2915} {"train_loss": -6.563912391662598, "global_step": 122455, "epoch": 2915} {"train_loss": -6.5342583656311035, "global_step": 122456, "epoch": 2915} {"train_loss": -6.525312423706055, "global_step": 122457, "epoch": 2915} {"train_loss": -6.657211780548096, "global_step": 122458, "epoch": 2915} {"train_loss": -6.712508678436279, "global_step": 122459, "epoch": 2915} {"train_loss": -6.427652359008789, "global_step": 122460, "epoch": 2915} {"train_loss": -6.601450443267822, "global_step": 122461, "epoch": 2915} {"train_loss": -6.633116722106934, "global_step": 122462, "epoch": 2915} {"train_loss": -6.59442138671875, "global_step": 122463, "epoch": 2915} {"train_loss": -6.533085823059082, "global_step": 122464, "epoch": 2915} {"train_loss": -6.498893737792969, "global_step": 122465, "epoch": 2915} {"train_loss": -6.5766496658325195, "global_step": 122466, "epoch": 2915} {"train_loss": -6.47907829284668, "global_step": 122467, "epoch": 2915} {"train_loss": -6.628244400024414, "global_step": 122468, "epoch": 2915} {"train_loss": -6.5879597663879395, "global_step": 122469, "epoch": 2915} {"train_loss": -6.57924747467041, "global_step": 122470, "epoch": 2915} {"train_loss": -6.566907360440209, "global_step": 122471, "epoch": 2915, "val_loss": 67757.2109375} {"train_loss": -6.540468692779541, "global_step": 122472, "epoch": 2916} {"train_loss": -6.5897722244262695, "global_step": 122473, "epoch": 2916} {"train_loss": -6.434287071228027, "global_step": 122474, "epoch": 2916} {"train_loss": -6.586236953735352, "global_step": 122475, "epoch": 2916} {"train_loss": -6.62832498550415, "global_step": 122476, "epoch": 2916} {"train_loss": -6.60184383392334, "global_step": 122477, "epoch": 2916} {"train_loss": -6.594293117523193, "global_step": 122478, "epoch": 2916} {"train_loss": -6.501649379730225, "global_step": 122479, "epoch": 2916} {"train_loss": -6.621608734130859, "global_step": 122480, "epoch": 2916} {"train_loss": -6.572075843811035, "global_step": 122481, "epoch": 2916} {"train_loss": -6.625187873840332, "global_step": 122482, "epoch": 2916} {"train_loss": -6.652835845947266, "global_step": 122483, "epoch": 2916} {"train_loss": -6.5409088134765625, "global_step": 122484, "epoch": 2916} {"train_loss": -6.565334796905518, "global_step": 122485, "epoch": 2916} {"train_loss": -6.486948013305664, "global_step": 122486, "epoch": 2916} {"train_loss": -6.626442909240723, "global_step": 122487, "epoch": 2916} {"train_loss": -6.569352149963379, "global_step": 122488, "epoch": 2916} {"train_loss": -6.602041244506836, "global_step": 122489, "epoch": 2916} {"train_loss": -6.736960411071777, "global_step": 122490, "epoch": 2916} {"train_loss": -6.5621747970581055, "global_step": 122491, "epoch": 2916} {"train_loss": -6.7764692306518555, "global_step": 122492, "epoch": 2916} {"train_loss": -6.607956409454346, "global_step": 122493, "epoch": 2916} {"train_loss": -6.477034091949463, "global_step": 122494, "epoch": 2916} {"train_loss": -6.564199924468994, "global_step": 122495, "epoch": 2916} {"train_loss": -6.491664886474609, "global_step": 122496, "epoch": 2916} {"train_loss": -6.6128058433532715, "global_step": 122497, "epoch": 2916} {"train_loss": -6.592809677124023, "global_step": 122498, "epoch": 2916} {"train_loss": -6.4806060791015625, "global_step": 122499, "epoch": 2916} {"train_loss": -6.536961078643799, "global_step": 122500, "epoch": 2916} {"train_loss": -6.585343360900879, "global_step": 122501, "epoch": 2916} {"train_loss": -6.578082084655762, "global_step": 122502, "epoch": 2916} {"train_loss": -6.586716651916504, "global_step": 122503, "epoch": 2916} {"train_loss": -6.658684730529785, "global_step": 122504, "epoch": 2916} {"train_loss": -6.548824787139893, "global_step": 122505, "epoch": 2916} {"train_loss": -6.582803249359131, "global_step": 122506, "epoch": 2916} {"train_loss": -6.3881516456604, "global_step": 122507, "epoch": 2916} {"train_loss": -6.504671573638916, "global_step": 122508, "epoch": 2916} {"train_loss": -6.461475372314453, "global_step": 122509, "epoch": 2916} {"train_loss": -6.422873497009277, "global_step": 122510, "epoch": 2916} {"train_loss": -6.5724101066589355, "global_step": 122511, "epoch": 2916} {"train_loss": -6.629744529724121, "global_step": 122512, "epoch": 2916} {"train_loss": -6.56726192292713, "global_step": 122513, "epoch": 2916, "val_loss": 68089.4375} {"train_loss": -6.5307207107543945, "global_step": 122514, "epoch": 2917} {"train_loss": -6.5730814933776855, "global_step": 122515, "epoch": 2917} {"train_loss": -6.597272872924805, "global_step": 122516, "epoch": 2917} {"train_loss": -6.600149154663086, "global_step": 122517, "epoch": 2917} {"train_loss": -6.636675834655762, "global_step": 122518, "epoch": 2917} {"train_loss": -6.531960964202881, "global_step": 122519, "epoch": 2917} {"train_loss": -6.5979814529418945, "global_step": 122520, "epoch": 2917} {"train_loss": -6.607381820678711, "global_step": 122521, "epoch": 2917} {"train_loss": -6.43430233001709, "global_step": 122522, "epoch": 2917} {"train_loss": -6.496417999267578, "global_step": 122523, "epoch": 2917} {"train_loss": -6.5602264404296875, "global_step": 122524, "epoch": 2917} {"train_loss": -6.337751388549805, "global_step": 122525, "epoch": 2917} {"train_loss": -6.642038822174072, "global_step": 122526, "epoch": 2917} {"train_loss": -6.587305545806885, "global_step": 122527, "epoch": 2917} {"train_loss": -6.523483753204346, "global_step": 122528, "epoch": 2917} {"train_loss": -6.545573711395264, "global_step": 122529, "epoch": 2917} {"train_loss": -6.343017578125, "global_step": 122530, "epoch": 2917} {"train_loss": -6.488190650939941, "global_step": 122531, "epoch": 2917} {"train_loss": -6.545902729034424, "global_step": 122532, "epoch": 2917} {"train_loss": -6.518030166625977, "global_step": 122533, "epoch": 2917} {"train_loss": -6.645704746246338, "global_step": 122534, "epoch": 2917} {"train_loss": -6.5286784172058105, "global_step": 122535, "epoch": 2917} {"train_loss": -6.534494400024414, "global_step": 122536, "epoch": 2917} {"train_loss": -6.530847549438477, "global_step": 122537, "epoch": 2917} {"train_loss": -6.703934669494629, "global_step": 122538, "epoch": 2917} {"train_loss": -6.471347808837891, "global_step": 122539, "epoch": 2917} {"train_loss": -6.433831691741943, "global_step": 122540, "epoch": 2917} {"train_loss": -6.500339984893799, "global_step": 122541, "epoch": 2917} {"train_loss": -6.496936798095703, "global_step": 122542, "epoch": 2917} {"train_loss": -6.57922887802124, "global_step": 122543, "epoch": 2917} {"train_loss": -6.547021865844727, "global_step": 122544, "epoch": 2917} {"train_loss": -6.573092460632324, "global_step": 122545, "epoch": 2917} {"train_loss": -6.605298042297363, "global_step": 122546, "epoch": 2917} {"train_loss": -6.522353172302246, "global_step": 122547, "epoch": 2917} {"train_loss": -6.605827331542969, "global_step": 122548, "epoch": 2917} {"train_loss": -6.560638427734375, "global_step": 122549, "epoch": 2917} {"train_loss": -6.571555137634277, "global_step": 122550, "epoch": 2917} {"train_loss": -6.527251720428467, "global_step": 122551, "epoch": 2917} {"train_loss": -6.613430976867676, "global_step": 122552, "epoch": 2917} {"train_loss": -6.684898376464844, "global_step": 122553, "epoch": 2917} {"train_loss": -6.624936103820801, "global_step": 122554, "epoch": 2917} {"train_loss": -6.552196059908185, "global_step": 122555, "epoch": 2917, "val_loss": 67976.28125} {"train_loss": -6.552947044372559, "global_step": 122556, "epoch": 2918} {"train_loss": -6.6522932052612305, "global_step": 122557, "epoch": 2918} {"train_loss": -6.451949119567871, "global_step": 122558, "epoch": 2918} {"train_loss": -6.5934648513793945, "global_step": 122559, "epoch": 2918} {"train_loss": -6.561690330505371, "global_step": 122560, "epoch": 2918} {"train_loss": -6.631839752197266, "global_step": 122561, "epoch": 2918} {"train_loss": -6.472904205322266, "global_step": 122562, "epoch": 2918} {"train_loss": -6.620282173156738, "global_step": 122563, "epoch": 2918} {"train_loss": -6.6363396644592285, "global_step": 122564, "epoch": 2918} {"train_loss": -6.533133506774902, "global_step": 122565, "epoch": 2918} {"train_loss": -6.6378865242004395, "global_step": 122566, "epoch": 2918} {"train_loss": -6.647914886474609, "global_step": 122567, "epoch": 2918} {"train_loss": -6.622415542602539, "global_step": 122568, "epoch": 2918} {"train_loss": -6.553460597991943, "global_step": 122569, "epoch": 2918} {"train_loss": -6.675909519195557, "global_step": 122570, "epoch": 2918} {"train_loss": -6.412270545959473, "global_step": 122571, "epoch": 2918} {"train_loss": -6.6269145011901855, "global_step": 122572, "epoch": 2918} {"train_loss": -6.682328224182129, "global_step": 122573, "epoch": 2918} {"train_loss": -6.478696823120117, "global_step": 122574, "epoch": 2918} {"train_loss": -6.601643085479736, "global_step": 122575, "epoch": 2918} {"train_loss": -6.597916603088379, "global_step": 122576, "epoch": 2918} {"train_loss": -6.5507283210754395, "global_step": 122577, "epoch": 2918} {"train_loss": -6.524194717407227, "global_step": 122578, "epoch": 2918} {"train_loss": -6.4906744956970215, "global_step": 122579, "epoch": 2918} {"train_loss": -6.362898826599121, "global_step": 122580, "epoch": 2918} {"train_loss": -6.524503707885742, "global_step": 122581, "epoch": 2918} {"train_loss": -6.342103958129883, "global_step": 122582, "epoch": 2918} {"train_loss": -6.475854873657227, "global_step": 122583, "epoch": 2918} {"train_loss": -6.516271591186523, "global_step": 122584, "epoch": 2918} {"train_loss": -6.402956008911133, "global_step": 122585, "epoch": 2918} {"train_loss": -6.386438846588135, "global_step": 122586, "epoch": 2918} {"train_loss": -6.484679222106934, "global_step": 122587, "epoch": 2918} {"train_loss": -6.477516174316406, "global_step": 122588, "epoch": 2918} {"train_loss": -6.566910743713379, "global_step": 122589, "epoch": 2918} {"train_loss": -6.374817848205566, "global_step": 122590, "epoch": 2918} {"train_loss": -6.493586540222168, "global_step": 122591, "epoch": 2918} {"train_loss": -6.532759189605713, "global_step": 122592, "epoch": 2918} {"train_loss": -6.336053848266602, "global_step": 122593, "epoch": 2918} {"train_loss": -6.607858657836914, "global_step": 122594, "epoch": 2918} {"train_loss": -6.498265266418457, "global_step": 122595, "epoch": 2918} {"train_loss": -6.59943962097168, "global_step": 122596, "epoch": 2918} {"train_loss": -6.529308069319952, "global_step": 122597, "epoch": 2918, "val_loss": 68156.125} {"train_loss": -6.444450378417969, "global_step": 122598, "epoch": 2919} {"train_loss": -6.441719055175781, "global_step": 122599, "epoch": 2919} {"train_loss": -6.488216876983643, "global_step": 122600, "epoch": 2919} {"train_loss": -6.4800519943237305, "global_step": 122601, "epoch": 2919} {"train_loss": -6.331812381744385, "global_step": 122602, "epoch": 2919} {"train_loss": -6.415428638458252, "global_step": 122603, "epoch": 2919} {"train_loss": -6.142903804779053, "global_step": 122604, "epoch": 2919} {"train_loss": -6.48641300201416, "global_step": 122605, "epoch": 2919} {"train_loss": -6.378785610198975, "global_step": 122606, "epoch": 2919} {"train_loss": -6.208214282989502, "global_step": 122607, "epoch": 2919} {"train_loss": -6.499273300170898, "global_step": 122608, "epoch": 2919} {"train_loss": -6.352463722229004, "global_step": 122609, "epoch": 2919} {"train_loss": -6.458765983581543, "global_step": 122610, "epoch": 2919} {"train_loss": -6.360054016113281, "global_step": 122611, "epoch": 2919} {"train_loss": -6.526414394378662, "global_step": 122612, "epoch": 2919} {"train_loss": -6.462503910064697, "global_step": 122613, "epoch": 2919} {"train_loss": -6.480579376220703, "global_step": 122614, "epoch": 2919} {"train_loss": -6.43402624130249, "global_step": 122615, "epoch": 2919} {"train_loss": -6.439571857452393, "global_step": 122616, "epoch": 2919} {"train_loss": -6.500143527984619, "global_step": 122617, "epoch": 2919} {"train_loss": -6.363708972930908, "global_step": 122618, "epoch": 2919} {"train_loss": -6.55900764465332, "global_step": 122619, "epoch": 2919} {"train_loss": -6.554694175720215, "global_step": 122620, "epoch": 2919} {"train_loss": -6.563625335693359, "global_step": 122621, "epoch": 2919} {"train_loss": -6.455081939697266, "global_step": 122622, "epoch": 2919} {"train_loss": -6.354296684265137, "global_step": 122623, "epoch": 2919} {"train_loss": -6.493658065795898, "global_step": 122624, "epoch": 2919} {"train_loss": -6.551354885101318, "global_step": 122625, "epoch": 2919} {"train_loss": -6.546842575073242, "global_step": 122626, "epoch": 2919} {"train_loss": -6.65000057220459, "global_step": 122627, "epoch": 2919} {"train_loss": -6.430858612060547, "global_step": 122628, "epoch": 2919} {"train_loss": -6.628047466278076, "global_step": 122629, "epoch": 2919} {"train_loss": -6.6714935302734375, "global_step": 122630, "epoch": 2919} {"train_loss": -6.455223083496094, "global_step": 122631, "epoch": 2919} {"train_loss": -6.552434921264648, "global_step": 122632, "epoch": 2919} {"train_loss": -6.573545455932617, "global_step": 122633, "epoch": 2919} {"train_loss": -6.445076942443848, "global_step": 122634, "epoch": 2919} {"train_loss": -6.468959808349609, "global_step": 122635, "epoch": 2919} {"train_loss": -6.516705513000488, "global_step": 122636, "epoch": 2919} {"train_loss": -6.331061363220215, "global_step": 122637, "epoch": 2919} {"train_loss": -6.532548427581787, "global_step": 122638, "epoch": 2919} {"train_loss": -6.463180962063017, "global_step": 122639, "epoch": 2919, "val_loss": 68064.3828125} {"train_loss": -6.4714274406433105, "global_step": 122640, "epoch": 2920} {"train_loss": -6.507022857666016, "global_step": 122641, "epoch": 2920} {"train_loss": -6.4895172119140625, "global_step": 122642, "epoch": 2920} {"train_loss": -6.493821144104004, "global_step": 122643, "epoch": 2920} {"train_loss": -6.462276935577393, "global_step": 122644, "epoch": 2920} {"train_loss": -6.457515716552734, "global_step": 122645, "epoch": 2920} {"train_loss": -6.52620792388916, "global_step": 122646, "epoch": 2920} {"train_loss": -6.568533420562744, "global_step": 122647, "epoch": 2920} {"train_loss": -6.529499053955078, "global_step": 122648, "epoch": 2920} {"train_loss": -6.5848588943481445, "global_step": 122649, "epoch": 2920} {"train_loss": -6.674140453338623, "global_step": 122650, "epoch": 2920} {"train_loss": -6.584534645080566, "global_step": 122651, "epoch": 2920} {"train_loss": -6.5190510749816895, "global_step": 122652, "epoch": 2920} {"train_loss": -6.522076606750488, "global_step": 122653, "epoch": 2920} {"train_loss": -6.5380659103393555, "global_step": 122654, "epoch": 2920} {"train_loss": -6.627854347229004, "global_step": 122655, "epoch": 2920} {"train_loss": -6.644293785095215, "global_step": 122656, "epoch": 2920} {"train_loss": -6.606370449066162, "global_step": 122657, "epoch": 2920} {"train_loss": -6.5353851318359375, "global_step": 122658, "epoch": 2920} {"train_loss": -6.643548488616943, "global_step": 122659, "epoch": 2920} {"train_loss": -6.572863578796387, "global_step": 122660, "epoch": 2920} {"train_loss": -6.542177200317383, "global_step": 122661, "epoch": 2920} {"train_loss": -6.695158004760742, "global_step": 122662, "epoch": 2920} {"train_loss": -6.567808628082275, "global_step": 122663, "epoch": 2920} {"train_loss": -6.585283279418945, "global_step": 122664, "epoch": 2920} {"train_loss": -6.507551193237305, "global_step": 122665, "epoch": 2920} {"train_loss": -6.484244346618652, "global_step": 122666, "epoch": 2920} {"train_loss": -6.475780963897705, "global_step": 122667, "epoch": 2920} {"train_loss": -6.490297317504883, "global_step": 122668, "epoch": 2920} {"train_loss": -6.547163963317871, "global_step": 122669, "epoch": 2920} {"train_loss": -6.476743698120117, "global_step": 122670, "epoch": 2920} {"train_loss": -6.597140789031982, "global_step": 122671, "epoch": 2920} {"train_loss": -6.459203720092773, "global_step": 122672, "epoch": 2920} {"train_loss": -6.61562442779541, "global_step": 122673, "epoch": 2920} {"train_loss": -6.582290172576904, "global_step": 122674, "epoch": 2920} {"train_loss": -6.4940290451049805, "global_step": 122675, "epoch": 2920} {"train_loss": -6.560113906860352, "global_step": 122676, "epoch": 2920} {"train_loss": -6.552275657653809, "global_step": 122677, "epoch": 2920} {"train_loss": -6.653627872467041, "global_step": 122678, "epoch": 2920} {"train_loss": -6.585988521575928, "global_step": 122679, "epoch": 2920} {"train_loss": -6.5997114181518555, "global_step": 122680, "epoch": 2920} {"train_loss": -6.550752480824788, "global_step": 122681, "epoch": 2920, "val_loss": 67859.0078125} {"train_loss": -6.636857986450195, "global_step": 122682, "epoch": 2921} {"train_loss": -6.505239486694336, "global_step": 122683, "epoch": 2921} {"train_loss": -6.642516613006592, "global_step": 122684, "epoch": 2921} {"train_loss": -6.643416404724121, "global_step": 122685, "epoch": 2921} {"train_loss": -6.579300403594971, "global_step": 122686, "epoch": 2921} {"train_loss": -6.595364093780518, "global_step": 122687, "epoch": 2921} {"train_loss": -6.6605634689331055, "global_step": 122688, "epoch": 2921} {"train_loss": -6.643529891967773, "global_step": 122689, "epoch": 2921} {"train_loss": -6.538846492767334, "global_step": 122690, "epoch": 2921} {"train_loss": -6.467761039733887, "global_step": 122691, "epoch": 2921} {"train_loss": -6.558911323547363, "global_step": 122692, "epoch": 2921} {"train_loss": -6.555071830749512, "global_step": 122693, "epoch": 2921} {"train_loss": -6.59577751159668, "global_step": 122694, "epoch": 2921} {"train_loss": -6.63632869720459, "global_step": 122695, "epoch": 2921} {"train_loss": -6.543631076812744, "global_step": 122696, "epoch": 2921} {"train_loss": -6.628406047821045, "global_step": 122697, "epoch": 2921} {"train_loss": -6.613676071166992, "global_step": 122698, "epoch": 2921} {"train_loss": -6.636198997497559, "global_step": 122699, "epoch": 2921} {"train_loss": -6.548103332519531, "global_step": 122700, "epoch": 2921} {"train_loss": -6.62161922454834, "global_step": 122701, "epoch": 2921} {"train_loss": -6.542181968688965, "global_step": 122702, "epoch": 2921} {"train_loss": -6.437469482421875, "global_step": 122703, "epoch": 2921} {"train_loss": -6.641435146331787, "global_step": 122704, "epoch": 2921} {"train_loss": -6.712630271911621, "global_step": 122705, "epoch": 2921} {"train_loss": -6.594829082489014, "global_step": 122706, "epoch": 2921} {"train_loss": -6.57807731628418, "global_step": 122707, "epoch": 2921} {"train_loss": -6.69072151184082, "global_step": 122708, "epoch": 2921} {"train_loss": -6.680335998535156, "global_step": 122709, "epoch": 2921} {"train_loss": -6.62156867980957, "global_step": 122710, "epoch": 2921} {"train_loss": -6.6091156005859375, "global_step": 122711, "epoch": 2921} {"train_loss": -6.551235198974609, "global_step": 122712, "epoch": 2921} {"train_loss": -6.650317192077637, "global_step": 122713, "epoch": 2921} {"train_loss": -6.608909606933594, "global_step": 122714, "epoch": 2921} {"train_loss": -6.541348934173584, "global_step": 122715, "epoch": 2921} {"train_loss": -6.600181579589844, "global_step": 122716, "epoch": 2921} {"train_loss": -6.619441986083984, "global_step": 122717, "epoch": 2921} {"train_loss": -6.492722034454346, "global_step": 122718, "epoch": 2921} {"train_loss": -6.650224208831787, "global_step": 122719, "epoch": 2921} {"train_loss": -6.38005256652832, "global_step": 122720, "epoch": 2921} {"train_loss": -6.597238063812256, "global_step": 122721, "epoch": 2921} {"train_loss": -6.524810791015625, "global_step": 122722, "epoch": 2921} {"train_loss": -6.588031405494327, "global_step": 122723, "epoch": 2921, "val_loss": 67913.703125} {"train_loss": -6.623777389526367, "global_step": 122724, "epoch": 2922} {"train_loss": -6.506547451019287, "global_step": 122725, "epoch": 2922} {"train_loss": -6.592058181762695, "global_step": 122726, "epoch": 2922} {"train_loss": -6.610047340393066, "global_step": 122727, "epoch": 2922} {"train_loss": -6.567007064819336, "global_step": 122728, "epoch": 2922} {"train_loss": -6.5490922927856445, "global_step": 122729, "epoch": 2922} {"train_loss": -6.5233354568481445, "global_step": 122730, "epoch": 2922} {"train_loss": -6.574827671051025, "global_step": 122731, "epoch": 2922} {"train_loss": -6.549807548522949, "global_step": 122732, "epoch": 2922} {"train_loss": -6.5804338455200195, "global_step": 122733, "epoch": 2922} {"train_loss": -6.51082181930542, "global_step": 122734, "epoch": 2922} {"train_loss": -6.516294002532959, "global_step": 122735, "epoch": 2922} {"train_loss": -6.545567512512207, "global_step": 122736, "epoch": 2922} {"train_loss": -6.49533748626709, "global_step": 122737, "epoch": 2922} {"train_loss": -6.557056427001953, "global_step": 122738, "epoch": 2922} {"train_loss": -6.516585350036621, "global_step": 122739, "epoch": 2922} {"train_loss": -6.3523712158203125, "global_step": 122740, "epoch": 2922} {"train_loss": -6.543911933898926, "global_step": 122741, "epoch": 2922} {"train_loss": -6.399592399597168, "global_step": 122742, "epoch": 2922} {"train_loss": -6.533485412597656, "global_step": 122743, "epoch": 2922} {"train_loss": -6.425175666809082, "global_step": 122744, "epoch": 2922} {"train_loss": -6.5421953201293945, "global_step": 122745, "epoch": 2922} {"train_loss": -6.414435386657715, "global_step": 122746, "epoch": 2922} {"train_loss": -6.534732818603516, "global_step": 122747, "epoch": 2922} {"train_loss": -6.497679710388184, "global_step": 122748, "epoch": 2922} {"train_loss": -6.5078253746032715, "global_step": 122749, "epoch": 2922} {"train_loss": -6.5354156494140625, "global_step": 122750, "epoch": 2922} {"train_loss": -6.4816999435424805, "global_step": 122751, "epoch": 2922} {"train_loss": -6.462804317474365, "global_step": 122752, "epoch": 2922} {"train_loss": -6.4663190841674805, "global_step": 122753, "epoch": 2922} {"train_loss": -6.461605072021484, "global_step": 122754, "epoch": 2922} {"train_loss": -6.522207260131836, "global_step": 122755, "epoch": 2922} {"train_loss": -6.325778484344482, "global_step": 122756, "epoch": 2922} {"train_loss": -6.519352436065674, "global_step": 122757, "epoch": 2922} {"train_loss": -6.522539138793945, "global_step": 122758, "epoch": 2922} {"train_loss": -6.470508575439453, "global_step": 122759, "epoch": 2922} {"train_loss": -6.466646671295166, "global_step": 122760, "epoch": 2922} {"train_loss": -6.48436975479126, "global_step": 122761, "epoch": 2922} {"train_loss": -6.574033260345459, "global_step": 122762, "epoch": 2922} {"train_loss": -6.673291206359863, "global_step": 122763, "epoch": 2922} {"train_loss": -6.529964447021484, "global_step": 122764, "epoch": 2922} {"train_loss": -6.515355314527239, "global_step": 122765, "epoch": 2922, "val_loss": 67965.2109375} {"train_loss": -6.580455303192139, "global_step": 122766, "epoch": 2923} {"train_loss": -6.593860626220703, "global_step": 122767, "epoch": 2923} {"train_loss": -6.57832145690918, "global_step": 122768, "epoch": 2923} {"train_loss": -6.608985900878906, "global_step": 122769, "epoch": 2923} {"train_loss": -6.542299747467041, "global_step": 122770, "epoch": 2923} {"train_loss": -6.580078125, "global_step": 122771, "epoch": 2923} {"train_loss": -6.566928863525391, "global_step": 122772, "epoch": 2923} {"train_loss": -6.600028991699219, "global_step": 122773, "epoch": 2923} {"train_loss": -6.461341381072998, "global_step": 122774, "epoch": 2923} {"train_loss": -6.525771141052246, "global_step": 122775, "epoch": 2923} {"train_loss": -6.570059776306152, "global_step": 122776, "epoch": 2923} {"train_loss": -6.6219072341918945, "global_step": 122777, "epoch": 2923} {"train_loss": -6.619500637054443, "global_step": 122778, "epoch": 2923} {"train_loss": -6.678194999694824, "global_step": 122779, "epoch": 2923} {"train_loss": -6.535952568054199, "global_step": 122780, "epoch": 2923} {"train_loss": -6.510319232940674, "global_step": 122781, "epoch": 2923} {"train_loss": -6.5736236572265625, "global_step": 122782, "epoch": 2923} {"train_loss": -6.466488361358643, "global_step": 122783, "epoch": 2923} {"train_loss": -6.463994979858398, "global_step": 122784, "epoch": 2923} {"train_loss": -6.549262046813965, "global_step": 122785, "epoch": 2923} {"train_loss": -6.55874490737915, "global_step": 122786, "epoch": 2923} {"train_loss": -6.576201438903809, "global_step": 122787, "epoch": 2923} {"train_loss": -6.523027420043945, "global_step": 122788, "epoch": 2923} {"train_loss": -6.482704162597656, "global_step": 122789, "epoch": 2923} {"train_loss": -6.540438175201416, "global_step": 122790, "epoch": 2923} {"train_loss": -6.66254997253418, "global_step": 122791, "epoch": 2923} {"train_loss": -6.513473987579346, "global_step": 122792, "epoch": 2923} {"train_loss": -6.608831405639648, "global_step": 122793, "epoch": 2923} {"train_loss": -6.613124847412109, "global_step": 122794, "epoch": 2923} {"train_loss": -6.630013465881348, "global_step": 122795, "epoch": 2923} {"train_loss": -6.638468265533447, "global_step": 122796, "epoch": 2923} {"train_loss": -6.46287727355957, "global_step": 122797, "epoch": 2923} {"train_loss": -6.659450531005859, "global_step": 122798, "epoch": 2923} {"train_loss": -6.57131814956665, "global_step": 122799, "epoch": 2923} {"train_loss": -6.633974075317383, "global_step": 122800, "epoch": 2923} {"train_loss": -6.653713226318359, "global_step": 122801, "epoch": 2923} {"train_loss": -6.610283851623535, "global_step": 122802, "epoch": 2923} {"train_loss": -6.626136302947998, "global_step": 122803, "epoch": 2923} {"train_loss": -6.577869415283203, "global_step": 122804, "epoch": 2923} {"train_loss": -6.57541036605835, "global_step": 122805, "epoch": 2923} {"train_loss": -6.43684196472168, "global_step": 122806, "epoch": 2923} {"train_loss": -6.570744843710036, "global_step": 122807, "epoch": 2923, "val_loss": 68107.265625} {"train_loss": -6.524941444396973, "global_step": 122808, "epoch": 2924} {"train_loss": -6.402551651000977, "global_step": 122809, "epoch": 2924} {"train_loss": -6.471014976501465, "global_step": 122810, "epoch": 2924} {"train_loss": -6.632004737854004, "global_step": 122811, "epoch": 2924} {"train_loss": -6.529162883758545, "global_step": 122812, "epoch": 2924} {"train_loss": -6.529547691345215, "global_step": 122813, "epoch": 2924} {"train_loss": -6.563472747802734, "global_step": 122814, "epoch": 2924} {"train_loss": -6.6637067794799805, "global_step": 122815, "epoch": 2924} {"train_loss": -6.537673473358154, "global_step": 122816, "epoch": 2924} {"train_loss": -6.537193298339844, "global_step": 122817, "epoch": 2924} {"train_loss": -6.531301975250244, "global_step": 122818, "epoch": 2924} {"train_loss": -6.648238182067871, "global_step": 122819, "epoch": 2924} {"train_loss": -6.566494464874268, "global_step": 122820, "epoch": 2924} {"train_loss": -6.574408531188965, "global_step": 122821, "epoch": 2924} {"train_loss": -6.483822822570801, "global_step": 122822, "epoch": 2924} {"train_loss": -6.654069423675537, "global_step": 122823, "epoch": 2924} {"train_loss": -6.549535751342773, "global_step": 122824, "epoch": 2924} {"train_loss": -6.487405776977539, "global_step": 122825, "epoch": 2924} {"train_loss": -6.473413467407227, "global_step": 122826, "epoch": 2924} {"train_loss": -6.507234573364258, "global_step": 122827, "epoch": 2924} {"train_loss": -6.395287990570068, "global_step": 122828, "epoch": 2924} {"train_loss": -6.4977126121521, "global_step": 122829, "epoch": 2924} {"train_loss": -6.425175666809082, "global_step": 122830, "epoch": 2924} {"train_loss": -6.4789557456970215, "global_step": 122831, "epoch": 2924} {"train_loss": -6.488852500915527, "global_step": 122832, "epoch": 2924} {"train_loss": -6.38175106048584, "global_step": 122833, "epoch": 2924} {"train_loss": -6.5362467765808105, "global_step": 122834, "epoch": 2924} {"train_loss": -6.564447402954102, "global_step": 122835, "epoch": 2924} {"train_loss": -6.53535795211792, "global_step": 122836, "epoch": 2924} {"train_loss": -6.405789852142334, "global_step": 122837, "epoch": 2924} {"train_loss": -6.502416133880615, "global_step": 122838, "epoch": 2924} {"train_loss": -6.556950569152832, "global_step": 122839, "epoch": 2924} {"train_loss": -6.504850387573242, "global_step": 122840, "epoch": 2924} {"train_loss": -6.587839603424072, "global_step": 122841, "epoch": 2924} {"train_loss": -6.632392883300781, "global_step": 122842, "epoch": 2924} {"train_loss": -6.606557846069336, "global_step": 122843, "epoch": 2924} {"train_loss": -6.65482234954834, "global_step": 122844, "epoch": 2924} {"train_loss": -6.503149509429932, "global_step": 122845, "epoch": 2924} {"train_loss": -6.6210808753967285, "global_step": 122846, "epoch": 2924} {"train_loss": -6.46012020111084, "global_step": 122847, "epoch": 2924} {"train_loss": -6.602753639221191, "global_step": 122848, "epoch": 2924} {"train_loss": -6.535086030051822, "global_step": 122849, "epoch": 2924, "val_loss": 67939.984375} {"train_loss": -6.5058817863464355, "global_step": 122850, "epoch": 2925} {"train_loss": -6.595245361328125, "global_step": 122851, "epoch": 2925} {"train_loss": -6.534272193908691, "global_step": 122852, "epoch": 2925} {"train_loss": -6.66572380065918, "global_step": 122853, "epoch": 2925} {"train_loss": -6.622054576873779, "global_step": 122854, "epoch": 2925} {"train_loss": -6.683209419250488, "global_step": 122855, "epoch": 2925} {"train_loss": -6.632106781005859, "global_step": 122856, "epoch": 2925} {"train_loss": -6.612509727478027, "global_step": 122857, "epoch": 2925} {"train_loss": -6.607170104980469, "global_step": 122858, "epoch": 2925} {"train_loss": -6.564266204833984, "global_step": 122859, "epoch": 2925} {"train_loss": -6.587197780609131, "global_step": 122860, "epoch": 2925} {"train_loss": -6.617348670959473, "global_step": 122861, "epoch": 2925} {"train_loss": -6.5703325271606445, "global_step": 122862, "epoch": 2925} {"train_loss": -6.519765377044678, "global_step": 122863, "epoch": 2925} {"train_loss": -6.674709320068359, "global_step": 122864, "epoch": 2925} {"train_loss": -6.56818151473999, "global_step": 122865, "epoch": 2925} {"train_loss": -6.484136581420898, "global_step": 122866, "epoch": 2925} {"train_loss": -6.610342025756836, "global_step": 122867, "epoch": 2925} {"train_loss": -6.5705413818359375, "global_step": 122868, "epoch": 2925} {"train_loss": -6.69033145904541, "global_step": 122869, "epoch": 2925} {"train_loss": -6.442421913146973, "global_step": 122870, "epoch": 2925} {"train_loss": -6.595757961273193, "global_step": 122871, "epoch": 2925} {"train_loss": -6.577487945556641, "global_step": 122872, "epoch": 2925} {"train_loss": -6.441618919372559, "global_step": 122873, "epoch": 2925} {"train_loss": -6.549797058105469, "global_step": 122874, "epoch": 2925} {"train_loss": -6.587478160858154, "global_step": 122875, "epoch": 2925} {"train_loss": -6.557413101196289, "global_step": 122876, "epoch": 2925} {"train_loss": -6.515444278717041, "global_step": 122877, "epoch": 2925} {"train_loss": -6.570899963378906, "global_step": 122878, "epoch": 2925} {"train_loss": -6.515380859375, "global_step": 122879, "epoch": 2925} {"train_loss": -6.512660026550293, "global_step": 122880, "epoch": 2925} {"train_loss": -6.412756443023682, "global_step": 122881, "epoch": 2925} {"train_loss": -6.666240692138672, "global_step": 122882, "epoch": 2925} {"train_loss": -6.441486358642578, "global_step": 122883, "epoch": 2925} {"train_loss": -6.433980464935303, "global_step": 122884, "epoch": 2925} {"train_loss": -6.454829692840576, "global_step": 122885, "epoch": 2925} {"train_loss": -6.491429328918457, "global_step": 122886, "epoch": 2925} {"train_loss": -6.534383773803711, "global_step": 122887, "epoch": 2925} {"train_loss": -6.472304344177246, "global_step": 122888, "epoch": 2925} {"train_loss": -6.543478965759277, "global_step": 122889, "epoch": 2925} {"train_loss": -6.457204818725586, "global_step": 122890, "epoch": 2925} {"train_loss": -6.548920937946865, "global_step": 122891, "epoch": 2925, "val_loss": 67751.4140625} {"train_loss": -6.505884647369385, "global_step": 122892, "epoch": 2926} {"train_loss": -6.413827896118164, "global_step": 122893, "epoch": 2926} {"train_loss": -6.5458197593688965, "global_step": 122894, "epoch": 2926} {"train_loss": -6.563876152038574, "global_step": 122895, "epoch": 2926} {"train_loss": -6.478362560272217, "global_step": 122896, "epoch": 2926} {"train_loss": -6.5653157234191895, "global_step": 122897, "epoch": 2926} {"train_loss": -6.487515449523926, "global_step": 122898, "epoch": 2926} {"train_loss": -6.564051628112793, "global_step": 122899, "epoch": 2926} {"train_loss": -6.48116397857666, "global_step": 122900, "epoch": 2926} {"train_loss": -6.476940155029297, "global_step": 122901, "epoch": 2926} {"train_loss": -6.529630661010742, "global_step": 122902, "epoch": 2926} {"train_loss": -6.462528705596924, "global_step": 122903, "epoch": 2926} {"train_loss": -6.495277404785156, "global_step": 122904, "epoch": 2926} {"train_loss": -6.566080570220947, "global_step": 122905, "epoch": 2926} {"train_loss": -6.589566707611084, "global_step": 122906, "epoch": 2926} {"train_loss": -6.57505989074707, "global_step": 122907, "epoch": 2926} {"train_loss": -6.633156776428223, "global_step": 122908, "epoch": 2926} {"train_loss": -6.628060340881348, "global_step": 122909, "epoch": 2926} {"train_loss": -6.522991180419922, "global_step": 122910, "epoch": 2926} {"train_loss": -6.502622604370117, "global_step": 122911, "epoch": 2926} {"train_loss": -6.55851936340332, "global_step": 122912, "epoch": 2926} {"train_loss": -6.460676193237305, "global_step": 122913, "epoch": 2926} {"train_loss": -6.527058124542236, "global_step": 122914, "epoch": 2926} {"train_loss": -6.462459564208984, "global_step": 122915, "epoch": 2926} {"train_loss": -6.430303573608398, "global_step": 122916, "epoch": 2926} {"train_loss": -6.552871227264404, "global_step": 122917, "epoch": 2926} {"train_loss": -6.562029838562012, "global_step": 122918, "epoch": 2926} {"train_loss": -6.507126808166504, "global_step": 122919, "epoch": 2926} {"train_loss": -6.573714256286621, "global_step": 122920, "epoch": 2926} {"train_loss": -6.4796600341796875, "global_step": 122921, "epoch": 2926} {"train_loss": -6.549156665802002, "global_step": 122922, "epoch": 2926} {"train_loss": -6.4124345779418945, "global_step": 122923, "epoch": 2926} {"train_loss": -6.545065879821777, "global_step": 122924, "epoch": 2926} {"train_loss": -6.583449363708496, "global_step": 122925, "epoch": 2926} {"train_loss": -6.488335132598877, "global_step": 122926, "epoch": 2926} {"train_loss": -6.38247013092041, "global_step": 122927, "epoch": 2926} {"train_loss": -6.365272521972656, "global_step": 122928, "epoch": 2926} {"train_loss": -6.5729498863220215, "global_step": 122929, "epoch": 2926} {"train_loss": -6.51934814453125, "global_step": 122930, "epoch": 2926} {"train_loss": -6.390969276428223, "global_step": 122931, "epoch": 2926} {"train_loss": -6.474328517913818, "global_step": 122932, "epoch": 2926} {"train_loss": -6.5097093014490035, "global_step": 122933, "epoch": 2926, "val_loss": 67852.71875} {"train_loss": -6.4694318771362305, "global_step": 122934, "epoch": 2927} {"train_loss": -6.545734405517578, "global_step": 122935, "epoch": 2927} {"train_loss": -6.542385101318359, "global_step": 122936, "epoch": 2927} {"train_loss": -6.492312431335449, "global_step": 122937, "epoch": 2927} {"train_loss": -6.551590919494629, "global_step": 122938, "epoch": 2927} {"train_loss": -6.562079429626465, "global_step": 122939, "epoch": 2927} {"train_loss": -6.650649070739746, "global_step": 122940, "epoch": 2927} {"train_loss": -6.445318222045898, "global_step": 122941, "epoch": 2927} {"train_loss": -6.539405822753906, "global_step": 122942, "epoch": 2927} {"train_loss": -6.5212225914001465, "global_step": 122943, "epoch": 2927} {"train_loss": -6.498909950256348, "global_step": 122944, "epoch": 2927} {"train_loss": -6.482816219329834, "global_step": 122945, "epoch": 2927} {"train_loss": -6.49625301361084, "global_step": 122946, "epoch": 2927} {"train_loss": -6.7114152908325195, "global_step": 122947, "epoch": 2927} {"train_loss": -6.681540012359619, "global_step": 122948, "epoch": 2927} {"train_loss": -6.6798481941223145, "global_step": 122949, "epoch": 2927} {"train_loss": -6.428497314453125, "global_step": 122950, "epoch": 2927} {"train_loss": -6.546629905700684, "global_step": 122951, "epoch": 2927} {"train_loss": -6.593891143798828, "global_step": 122952, "epoch": 2927} {"train_loss": -6.519045352935791, "global_step": 122953, "epoch": 2927} {"train_loss": -6.567105293273926, "global_step": 122954, "epoch": 2927} {"train_loss": -6.499868392944336, "global_step": 122955, "epoch": 2927} {"train_loss": -6.646760940551758, "global_step": 122956, "epoch": 2927} {"train_loss": -6.597765922546387, "global_step": 122957, "epoch": 2927} {"train_loss": -6.548758506774902, "global_step": 122958, "epoch": 2927} {"train_loss": -6.4707231521606445, "global_step": 122959, "epoch": 2927} {"train_loss": -6.511510848999023, "global_step": 122960, "epoch": 2927} {"train_loss": -6.443133354187012, "global_step": 122961, "epoch": 2927} {"train_loss": -6.428763389587402, "global_step": 122962, "epoch": 2927} {"train_loss": -6.44558048248291, "global_step": 122963, "epoch": 2927} {"train_loss": -6.548768520355225, "global_step": 122964, "epoch": 2927} {"train_loss": -6.527708053588867, "global_step": 122965, "epoch": 2927} {"train_loss": -6.6578898429870605, "global_step": 122966, "epoch": 2927} {"train_loss": -6.529975891113281, "global_step": 122967, "epoch": 2927} {"train_loss": -6.544315338134766, "global_step": 122968, "epoch": 2927} {"train_loss": -6.650170803070068, "global_step": 122969, "epoch": 2927} {"train_loss": -6.569281101226807, "global_step": 122970, "epoch": 2927} {"train_loss": -6.572855472564697, "global_step": 122971, "epoch": 2927} {"train_loss": -6.563628196716309, "global_step": 122972, "epoch": 2927} {"train_loss": -6.502910137176514, "global_step": 122973, "epoch": 2927} {"train_loss": -6.580428600311279, "global_step": 122974, "epoch": 2927} {"train_loss": -6.545804795764742, "global_step": 122975, "epoch": 2927, "val_loss": 68037.2734375} {"train_loss": -6.605589389801025, "global_step": 122976, "epoch": 2928} {"train_loss": -6.621269702911377, "global_step": 122977, "epoch": 2928} {"train_loss": -6.604715347290039, "global_step": 122978, "epoch": 2928} {"train_loss": -6.630840301513672, "global_step": 122979, "epoch": 2928} {"train_loss": -6.579801082611084, "global_step": 122980, "epoch": 2928} {"train_loss": -6.5495500564575195, "global_step": 122981, "epoch": 2928} {"train_loss": -6.552823066711426, "global_step": 122982, "epoch": 2928} {"train_loss": -6.432706832885742, "global_step": 122983, "epoch": 2928} {"train_loss": -6.512707710266113, "global_step": 122984, "epoch": 2928} {"train_loss": -6.6091461181640625, "global_step": 122985, "epoch": 2928} {"train_loss": -6.512384414672852, "global_step": 122986, "epoch": 2928} {"train_loss": -6.583783149719238, "global_step": 122987, "epoch": 2928} {"train_loss": -6.528739929199219, "global_step": 122988, "epoch": 2928} {"train_loss": -6.582339286804199, "global_step": 122989, "epoch": 2928} {"train_loss": -6.5185747146606445, "global_step": 122990, "epoch": 2928} {"train_loss": -6.393223762512207, "global_step": 122991, "epoch": 2928} {"train_loss": -6.547493934631348, "global_step": 122992, "epoch": 2928} {"train_loss": -6.451935768127441, "global_step": 122993, "epoch": 2928} {"train_loss": -6.518338680267334, "global_step": 122994, "epoch": 2928} {"train_loss": -6.468153476715088, "global_step": 122995, "epoch": 2928} {"train_loss": -6.5472917556762695, "global_step": 122996, "epoch": 2928} {"train_loss": -6.495717525482178, "global_step": 122997, "epoch": 2928} {"train_loss": -6.5599517822265625, "global_step": 122998, "epoch": 2928} {"train_loss": -6.561847686767578, "global_step": 122999, "epoch": 2928} {"train_loss": -6.471951484680176, "global_step": 123000, "epoch": 2928} {"train_loss": -6.438782691955566, "global_step": 123001, "epoch": 2928} {"train_loss": -6.407567024230957, "global_step": 123002, "epoch": 2928} {"train_loss": -6.526366233825684, "global_step": 123003, "epoch": 2928} {"train_loss": -6.486693382263184, "global_step": 123004, "epoch": 2928} {"train_loss": -6.461902618408203, "global_step": 123005, "epoch": 2928} {"train_loss": -6.491772651672363, "global_step": 123006, "epoch": 2928} {"train_loss": -6.564587593078613, "global_step": 123007, "epoch": 2928} {"train_loss": -6.325217247009277, "global_step": 123008, "epoch": 2928} {"train_loss": -6.5799641609191895, "global_step": 123009, "epoch": 2928} {"train_loss": -6.3235368728637695, "global_step": 123010, "epoch": 2928} {"train_loss": -6.59272575378418, "global_step": 123011, "epoch": 2928} {"train_loss": -6.317753791809082, "global_step": 123012, "epoch": 2928} {"train_loss": -6.540701866149902, "global_step": 123013, "epoch": 2928} {"train_loss": -6.572480201721191, "global_step": 123014, "epoch": 2928} {"train_loss": -6.541065216064453, "global_step": 123015, "epoch": 2928} {"train_loss": -6.505952835083008, "global_step": 123016, "epoch": 2928} {"train_loss": -6.517562400727045, "global_step": 123017, "epoch": 2928, "val_loss": 68071.8515625} {"train_loss": -6.636338710784912, "global_step": 123018, "epoch": 2929} {"train_loss": -6.500629425048828, "global_step": 123019, "epoch": 2929} {"train_loss": -6.609894752502441, "global_step": 123020, "epoch": 2929} {"train_loss": -6.566822528839111, "global_step": 123021, "epoch": 2929} {"train_loss": -6.767385482788086, "global_step": 123022, "epoch": 2929} {"train_loss": -6.468521595001221, "global_step": 123023, "epoch": 2929} {"train_loss": -6.458678245544434, "global_step": 123024, "epoch": 2929} {"train_loss": -6.418550491333008, "global_step": 123025, "epoch": 2929} {"train_loss": -6.489458084106445, "global_step": 123026, "epoch": 2929} {"train_loss": -6.486719131469727, "global_step": 123027, "epoch": 2929} {"train_loss": -6.533841133117676, "global_step": 123028, "epoch": 2929} {"train_loss": -6.5619354248046875, "global_step": 123029, "epoch": 2929} {"train_loss": -6.542693614959717, "global_step": 123030, "epoch": 2929} {"train_loss": -6.626881122589111, "global_step": 123031, "epoch": 2929} {"train_loss": -6.52175760269165, "global_step": 123032, "epoch": 2929} {"train_loss": -6.569248199462891, "global_step": 123033, "epoch": 2929} {"train_loss": -6.568093299865723, "global_step": 123034, "epoch": 2929} {"train_loss": -6.485617160797119, "global_step": 123035, "epoch": 2929} {"train_loss": -6.474963188171387, "global_step": 123036, "epoch": 2929} {"train_loss": -6.629418849945068, "global_step": 123037, "epoch": 2929} {"train_loss": -6.553497314453125, "global_step": 123038, "epoch": 2929} {"train_loss": -6.572500705718994, "global_step": 123039, "epoch": 2929} {"train_loss": -6.584373950958252, "global_step": 123040, "epoch": 2929} {"train_loss": -6.544958114624023, "global_step": 123041, "epoch": 2929} {"train_loss": -6.629810333251953, "global_step": 123042, "epoch": 2929} {"train_loss": -6.633066654205322, "global_step": 123043, "epoch": 2929} {"train_loss": -6.438028335571289, "global_step": 123044, "epoch": 2929} {"train_loss": -6.58003568649292, "global_step": 123045, "epoch": 2929} {"train_loss": -6.567420482635498, "global_step": 123046, "epoch": 2929} {"train_loss": -6.6338653564453125, "global_step": 123047, "epoch": 2929} {"train_loss": -6.700984954833984, "global_step": 123048, "epoch": 2929} {"train_loss": -6.586298942565918, "global_step": 123049, "epoch": 2929} {"train_loss": -6.592309951782227, "global_step": 123050, "epoch": 2929} {"train_loss": -6.48965311050415, "global_step": 123051, "epoch": 2929} {"train_loss": -6.5269317626953125, "global_step": 123052, "epoch": 2929} {"train_loss": -6.6651506423950195, "global_step": 123053, "epoch": 2929} {"train_loss": -6.509461402893066, "global_step": 123054, "epoch": 2929} {"train_loss": -6.668968677520752, "global_step": 123055, "epoch": 2929} {"train_loss": -6.674809455871582, "global_step": 123056, "epoch": 2929} {"train_loss": -6.640042304992676, "global_step": 123057, "epoch": 2929} {"train_loss": -6.604755401611328, "global_step": 123058, "epoch": 2929} {"train_loss": -6.569402399517241, "global_step": 123059, "epoch": 2929, "val_loss": 67781.75} {"train_loss": -6.502693176269531, "global_step": 123060, "epoch": 2930} {"train_loss": -6.670773506164551, "global_step": 123061, "epoch": 2930} {"train_loss": -6.470800876617432, "global_step": 123062, "epoch": 2930} {"train_loss": -6.557313919067383, "global_step": 123063, "epoch": 2930} {"train_loss": -6.599656105041504, "global_step": 123064, "epoch": 2930} {"train_loss": -6.576356887817383, "global_step": 123065, "epoch": 2930} {"train_loss": -6.579293251037598, "global_step": 123066, "epoch": 2930} {"train_loss": -6.476935386657715, "global_step": 123067, "epoch": 2930} {"train_loss": -6.531007766723633, "global_step": 123068, "epoch": 2930} {"train_loss": -6.587038993835449, "global_step": 123069, "epoch": 2930} {"train_loss": -6.610633373260498, "global_step": 123070, "epoch": 2930} {"train_loss": -6.488800048828125, "global_step": 123071, "epoch": 2930} {"train_loss": -6.5454020500183105, "global_step": 123072, "epoch": 2930} {"train_loss": -6.5979156494140625, "global_step": 123073, "epoch": 2930} {"train_loss": -6.467592239379883, "global_step": 123074, "epoch": 2930} {"train_loss": -6.575716972351074, "global_step": 123075, "epoch": 2930} {"train_loss": -6.550024032592773, "global_step": 123076, "epoch": 2930} {"train_loss": -6.544655799865723, "global_step": 123077, "epoch": 2930} {"train_loss": -6.516478538513184, "global_step": 123078, "epoch": 2930} {"train_loss": -6.56404972076416, "global_step": 123079, "epoch": 2930} {"train_loss": -6.592016696929932, "global_step": 123080, "epoch": 2930} {"train_loss": -6.562976837158203, "global_step": 123081, "epoch": 2930} {"train_loss": -6.632588863372803, "global_step": 123082, "epoch": 2930} {"train_loss": -6.575383186340332, "global_step": 123083, "epoch": 2930} {"train_loss": -6.57086181640625, "global_step": 123084, "epoch": 2930} {"train_loss": -6.5275702476501465, "global_step": 123085, "epoch": 2930} {"train_loss": -6.580233573913574, "global_step": 123086, "epoch": 2930} {"train_loss": -6.5548906326293945, "global_step": 123087, "epoch": 2930} {"train_loss": -6.564105033874512, "global_step": 123088, "epoch": 2930} {"train_loss": -6.401312828063965, "global_step": 123089, "epoch": 2930} {"train_loss": -6.539684295654297, "global_step": 123090, "epoch": 2930} {"train_loss": -6.579392910003662, "global_step": 123091, "epoch": 2930} {"train_loss": -6.603072166442871, "global_step": 123092, "epoch": 2930} {"train_loss": -6.678604602813721, "global_step": 123093, "epoch": 2930} {"train_loss": -6.623937129974365, "global_step": 123094, "epoch": 2930} {"train_loss": -6.636307239532471, "global_step": 123095, "epoch": 2930} {"train_loss": -6.598368167877197, "global_step": 123096, "epoch": 2930} {"train_loss": -6.6070990562438965, "global_step": 123097, "epoch": 2930} {"train_loss": -6.586206436157227, "global_step": 123098, "epoch": 2930} {"train_loss": -6.617785453796387, "global_step": 123099, "epoch": 2930} {"train_loss": -6.55581521987915, "global_step": 123100, "epoch": 2930} {"train_loss": -6.567067736671085, "global_step": 123101, "epoch": 2930, "val_loss": 68081.234375} {"train_loss": -6.517086982727051, "global_step": 123102, "epoch": 2931} {"train_loss": -6.600088119506836, "global_step": 123103, "epoch": 2931} {"train_loss": -6.609752655029297, "global_step": 123104, "epoch": 2931} {"train_loss": -6.683471202850342, "global_step": 123105, "epoch": 2931} {"train_loss": -6.617273330688477, "global_step": 123106, "epoch": 2931} {"train_loss": -6.585390090942383, "global_step": 123107, "epoch": 2931} {"train_loss": -6.59309720993042, "global_step": 123108, "epoch": 2931} {"train_loss": -6.5728440284729, "global_step": 123109, "epoch": 2931} {"train_loss": -6.684737205505371, "global_step": 123110, "epoch": 2931} {"train_loss": -6.585559844970703, "global_step": 123111, "epoch": 2931} {"train_loss": -6.466607093811035, "global_step": 123112, "epoch": 2931} {"train_loss": -6.594273090362549, "global_step": 123113, "epoch": 2931} {"train_loss": -6.553440570831299, "global_step": 123114, "epoch": 2931} {"train_loss": -6.534640312194824, "global_step": 123115, "epoch": 2931} {"train_loss": -6.5782670974731445, "global_step": 123116, "epoch": 2931} {"train_loss": -6.5781426429748535, "global_step": 123117, "epoch": 2931} {"train_loss": -6.564377784729004, "global_step": 123118, "epoch": 2931} {"train_loss": -6.550566673278809, "global_step": 123119, "epoch": 2931} {"train_loss": -6.613152503967285, "global_step": 123120, "epoch": 2931} {"train_loss": -6.55369234085083, "global_step": 123121, "epoch": 2931} {"train_loss": -6.544990539550781, "global_step": 123122, "epoch": 2931} {"train_loss": -6.573444366455078, "global_step": 123123, "epoch": 2931} {"train_loss": -6.556692123413086, "global_step": 123124, "epoch": 2931} {"train_loss": -6.599946975708008, "global_step": 123125, "epoch": 2931} {"train_loss": -6.567563056945801, "global_step": 123126, "epoch": 2931} {"train_loss": -6.554010391235352, "global_step": 123127, "epoch": 2931} {"train_loss": -6.541516304016113, "global_step": 123128, "epoch": 2931} {"train_loss": -6.577160358428955, "global_step": 123129, "epoch": 2931} {"train_loss": -6.561248779296875, "global_step": 123130, "epoch": 2931} {"train_loss": -6.549752235412598, "global_step": 123131, "epoch": 2931} {"train_loss": -6.673244953155518, "global_step": 123132, "epoch": 2931} {"train_loss": -6.5502519607543945, "global_step": 123133, "epoch": 2931} {"train_loss": -6.67633056640625, "global_step": 123134, "epoch": 2931} {"train_loss": -6.589852333068848, "global_step": 123135, "epoch": 2931} {"train_loss": -6.6004109382629395, "global_step": 123136, "epoch": 2931} {"train_loss": -6.396787643432617, "global_step": 123137, "epoch": 2931} {"train_loss": -6.533030986785889, "global_step": 123138, "epoch": 2931} {"train_loss": -6.588414192199707, "global_step": 123139, "epoch": 2931} {"train_loss": -6.506748199462891, "global_step": 123140, "epoch": 2931} {"train_loss": -6.5798492431640625, "global_step": 123141, "epoch": 2931} {"train_loss": -6.540035724639893, "global_step": 123142, "epoch": 2931} {"train_loss": -6.574050244830904, "global_step": 123143, "epoch": 2931, "val_loss": 68004.3046875} {"train_loss": -6.596322059631348, "global_step": 123144, "epoch": 2932} {"train_loss": -6.577057838439941, "global_step": 123145, "epoch": 2932} {"train_loss": -6.649580001831055, "global_step": 123146, "epoch": 2932} {"train_loss": -6.600997447967529, "global_step": 123147, "epoch": 2932} {"train_loss": -6.593945503234863, "global_step": 123148, "epoch": 2932} {"train_loss": -6.527555465698242, "global_step": 123149, "epoch": 2932} {"train_loss": -6.421034812927246, "global_step": 123150, "epoch": 2932} {"train_loss": -6.548838138580322, "global_step": 123151, "epoch": 2932} {"train_loss": -6.556731224060059, "global_step": 123152, "epoch": 2932} {"train_loss": -6.507937908172607, "global_step": 123153, "epoch": 2932} {"train_loss": -6.453771591186523, "global_step": 123154, "epoch": 2932} {"train_loss": -6.553555011749268, "global_step": 123155, "epoch": 2932} {"train_loss": -6.4884772300720215, "global_step": 123156, "epoch": 2932} {"train_loss": -6.410774230957031, "global_step": 123157, "epoch": 2932} {"train_loss": -6.502528190612793, "global_step": 123158, "epoch": 2932} {"train_loss": -6.429798603057861, "global_step": 123159, "epoch": 2932} {"train_loss": -6.492068290710449, "global_step": 123160, "epoch": 2932} {"train_loss": -6.523146629333496, "global_step": 123161, "epoch": 2932} {"train_loss": -6.538717269897461, "global_step": 123162, "epoch": 2932} {"train_loss": -6.570389747619629, "global_step": 123163, "epoch": 2932} {"train_loss": -6.538235664367676, "global_step": 123164, "epoch": 2932} {"train_loss": -6.606618881225586, "global_step": 123165, "epoch": 2932} {"train_loss": -6.480032920837402, "global_step": 123166, "epoch": 2932} {"train_loss": -6.406406402587891, "global_step": 123167, "epoch": 2932} {"train_loss": -6.579150199890137, "global_step": 123168, "epoch": 2932} {"train_loss": -6.5187201499938965, "global_step": 123169, "epoch": 2932} {"train_loss": -6.598453521728516, "global_step": 123170, "epoch": 2932} {"train_loss": -6.470822334289551, "global_step": 123171, "epoch": 2932} {"train_loss": -6.416037559509277, "global_step": 123172, "epoch": 2932} {"train_loss": -6.433318138122559, "global_step": 123173, "epoch": 2932} {"train_loss": -6.391819000244141, "global_step": 123174, "epoch": 2932} {"train_loss": -6.444894790649414, "global_step": 123175, "epoch": 2932} {"train_loss": -6.406913757324219, "global_step": 123176, "epoch": 2932} {"train_loss": -6.358550071716309, "global_step": 123177, "epoch": 2932} {"train_loss": -6.487347602844238, "global_step": 123178, "epoch": 2932} {"train_loss": -6.440570831298828, "global_step": 123179, "epoch": 2932} {"train_loss": -6.420722961425781, "global_step": 123180, "epoch": 2932} {"train_loss": -6.41213321685791, "global_step": 123181, "epoch": 2932} {"train_loss": -6.325376987457275, "global_step": 123182, "epoch": 2932} {"train_loss": -6.520589351654053, "global_step": 123183, "epoch": 2932} {"train_loss": -6.39164400100708, "global_step": 123184, "epoch": 2932} {"train_loss": -6.494123912992931, "global_step": 123185, "epoch": 2932, "val_loss": 68074.28125} {"train_loss": -6.517329216003418, "global_step": 123186, "epoch": 2933} {"train_loss": -6.483272075653076, "global_step": 123187, "epoch": 2933} {"train_loss": -6.522529602050781, "global_step": 123188, "epoch": 2933} {"train_loss": -6.523831367492676, "global_step": 123189, "epoch": 2933} {"train_loss": -6.6419477462768555, "global_step": 123190, "epoch": 2933} {"train_loss": -6.547273635864258, "global_step": 123191, "epoch": 2933} {"train_loss": -6.551061630249023, "global_step": 123192, "epoch": 2933} {"train_loss": -6.573242664337158, "global_step": 123193, "epoch": 2933} {"train_loss": -6.562356948852539, "global_step": 123194, "epoch": 2933} {"train_loss": -6.509291648864746, "global_step": 123195, "epoch": 2933} {"train_loss": -6.464910507202148, "global_step": 123196, "epoch": 2933} {"train_loss": -6.592598915100098, "global_step": 123197, "epoch": 2933} {"train_loss": -6.527748107910156, "global_step": 123198, "epoch": 2933} {"train_loss": -6.558176517486572, "global_step": 123199, "epoch": 2933} {"train_loss": -6.616303443908691, "global_step": 123200, "epoch": 2933} {"train_loss": -6.599740982055664, "global_step": 123201, "epoch": 2933} {"train_loss": -6.533974647521973, "global_step": 123202, "epoch": 2933} {"train_loss": -6.5706939697265625, "global_step": 123203, "epoch": 2933} {"train_loss": -6.569916725158691, "global_step": 123204, "epoch": 2933} {"train_loss": -6.6048173904418945, "global_step": 123205, "epoch": 2933} {"train_loss": -6.595478057861328, "global_step": 123206, "epoch": 2933} {"train_loss": -6.548728942871094, "global_step": 123207, "epoch": 2933} {"train_loss": -6.588234901428223, "global_step": 123208, "epoch": 2933} {"train_loss": -6.539305686950684, "global_step": 123209, "epoch": 2933} {"train_loss": -6.443350791931152, "global_step": 123210, "epoch": 2933} {"train_loss": -6.537086486816406, "global_step": 123211, "epoch": 2933} {"train_loss": -6.559856414794922, "global_step": 123212, "epoch": 2933} {"train_loss": -6.531368732452393, "global_step": 123213, "epoch": 2933} {"train_loss": -6.512096405029297, "global_step": 123214, "epoch": 2933} {"train_loss": -6.594030380249023, "global_step": 123215, "epoch": 2933} {"train_loss": -6.6164445877075195, "global_step": 123216, "epoch": 2933} {"train_loss": -6.752658843994141, "global_step": 123217, "epoch": 2933} {"train_loss": -6.518145561218262, "global_step": 123218, "epoch": 2933} {"train_loss": -6.542991638183594, "global_step": 123219, "epoch": 2933} {"train_loss": -6.511028289794922, "global_step": 123220, "epoch": 2933} {"train_loss": -6.5086669921875, "global_step": 123221, "epoch": 2933} {"train_loss": -6.578743934631348, "global_step": 123222, "epoch": 2933} {"train_loss": -6.56002140045166, "global_step": 123223, "epoch": 2933} {"train_loss": -6.546567916870117, "global_step": 123224, "epoch": 2933} {"train_loss": -6.693175315856934, "global_step": 123225, "epoch": 2933} {"train_loss": -6.532144069671631, "global_step": 123226, "epoch": 2933} {"train_loss": -6.560318254289173, "global_step": 123227, "epoch": 2933, "val_loss": 68046.8671875} {"train_loss": -6.623664379119873, "global_step": 123228, "epoch": 2934} {"train_loss": -6.657138347625732, "global_step": 123229, "epoch": 2934} {"train_loss": -6.649673938751221, "global_step": 123230, "epoch": 2934} {"train_loss": -6.538642883300781, "global_step": 123231, "epoch": 2934} {"train_loss": -6.632189750671387, "global_step": 123232, "epoch": 2934} {"train_loss": -6.506491184234619, "global_step": 123233, "epoch": 2934} {"train_loss": -6.47442626953125, "global_step": 123234, "epoch": 2934} {"train_loss": -6.528162956237793, "global_step": 123235, "epoch": 2934} {"train_loss": -6.56581449508667, "global_step": 123236, "epoch": 2934} {"train_loss": -6.640300750732422, "global_step": 123237, "epoch": 2934} {"train_loss": -6.659627437591553, "global_step": 123238, "epoch": 2934} {"train_loss": -6.611246109008789, "global_step": 123239, "epoch": 2934} {"train_loss": -6.64357328414917, "global_step": 123240, "epoch": 2934} {"train_loss": -6.6127543449401855, "global_step": 123241, "epoch": 2934} {"train_loss": -6.6158599853515625, "global_step": 123242, "epoch": 2934} {"train_loss": -6.651022911071777, "global_step": 123243, "epoch": 2934} {"train_loss": -6.591371536254883, "global_step": 123244, "epoch": 2934} {"train_loss": -6.664358139038086, "global_step": 123245, "epoch": 2934} {"train_loss": -6.600828170776367, "global_step": 123246, "epoch": 2934} {"train_loss": -6.534353256225586, "global_step": 123247, "epoch": 2934} {"train_loss": -6.586733341217041, "global_step": 123248, "epoch": 2934} {"train_loss": -6.450207710266113, "global_step": 123249, "epoch": 2934} {"train_loss": -6.522838592529297, "global_step": 123250, "epoch": 2934} {"train_loss": -6.610933303833008, "global_step": 123251, "epoch": 2934} {"train_loss": -6.614234924316406, "global_step": 123252, "epoch": 2934} {"train_loss": -6.523961067199707, "global_step": 123253, "epoch": 2934} {"train_loss": -6.605020523071289, "global_step": 123254, "epoch": 2934} {"train_loss": -6.488508224487305, "global_step": 123255, "epoch": 2934} {"train_loss": -6.403270721435547, "global_step": 123256, "epoch": 2934} {"train_loss": -6.463809013366699, "global_step": 123257, "epoch": 2934} {"train_loss": -6.491841793060303, "global_step": 123258, "epoch": 2934} {"train_loss": -6.457508087158203, "global_step": 123259, "epoch": 2934} {"train_loss": -6.5325517654418945, "global_step": 123260, "epoch": 2934} {"train_loss": -6.467153549194336, "global_step": 123261, "epoch": 2934} {"train_loss": -6.437985897064209, "global_step": 123262, "epoch": 2934} {"train_loss": -6.402639389038086, "global_step": 123263, "epoch": 2934} {"train_loss": -6.401431083679199, "global_step": 123264, "epoch": 2934} {"train_loss": -6.362457275390625, "global_step": 123265, "epoch": 2934} {"train_loss": -6.6438493728637695, "global_step": 123266, "epoch": 2934} {"train_loss": -6.565326690673828, "global_step": 123267, "epoch": 2934} {"train_loss": -6.453389644622803, "global_step": 123268, "epoch": 2934} {"train_loss": -6.549178713843936, "global_step": 123269, "epoch": 2934, "val_loss": 68131.375} {"train_loss": -6.437404632568359, "global_step": 123270, "epoch": 2935} {"train_loss": -6.607766151428223, "global_step": 123271, "epoch": 2935} {"train_loss": -6.488584518432617, "global_step": 123272, "epoch": 2935} {"train_loss": -6.456244945526123, "global_step": 123273, "epoch": 2935} {"train_loss": -6.573666572570801, "global_step": 123274, "epoch": 2935} {"train_loss": -6.509852409362793, "global_step": 123275, "epoch": 2935} {"train_loss": -6.478072166442871, "global_step": 123276, "epoch": 2935} {"train_loss": -6.638694763183594, "global_step": 123277, "epoch": 2935} {"train_loss": -6.526181221008301, "global_step": 123278, "epoch": 2935} {"train_loss": -6.562621116638184, "global_step": 123279, "epoch": 2935} {"train_loss": -6.469226837158203, "global_step": 123280, "epoch": 2935} {"train_loss": -6.469145774841309, "global_step": 123281, "epoch": 2935} {"train_loss": -6.6493964195251465, "global_step": 123282, "epoch": 2935} {"train_loss": -6.543564796447754, "global_step": 123283, "epoch": 2935} {"train_loss": -6.558262825012207, "global_step": 123284, "epoch": 2935} {"train_loss": -6.651603698730469, "global_step": 123285, "epoch": 2935} {"train_loss": -6.484493255615234, "global_step": 123286, "epoch": 2935} {"train_loss": -6.473186492919922, "global_step": 123287, "epoch": 2935} {"train_loss": -6.671473503112793, "global_step": 123288, "epoch": 2935} {"train_loss": -6.709333419799805, "global_step": 123289, "epoch": 2935} {"train_loss": -6.391848564147949, "global_step": 123290, "epoch": 2935} {"train_loss": -6.63230037689209, "global_step": 123291, "epoch": 2935} {"train_loss": -6.606017112731934, "global_step": 123292, "epoch": 2935} {"train_loss": -6.623500823974609, "global_step": 123293, "epoch": 2935} {"train_loss": -6.535233020782471, "global_step": 123294, "epoch": 2935} {"train_loss": -6.573013782501221, "global_step": 123295, "epoch": 2935} {"train_loss": -6.568565368652344, "global_step": 123296, "epoch": 2935} {"train_loss": -6.5587358474731445, "global_step": 123297, "epoch": 2935} {"train_loss": -6.372603416442871, "global_step": 123298, "epoch": 2935} {"train_loss": -6.602665424346924, "global_step": 123299, "epoch": 2935} {"train_loss": -6.715956687927246, "global_step": 123300, "epoch": 2935} {"train_loss": -6.497004508972168, "global_step": 123301, "epoch": 2935} {"train_loss": -6.476318359375, "global_step": 123302, "epoch": 2935} {"train_loss": -6.580448627471924, "global_step": 123303, "epoch": 2935} {"train_loss": -6.643551826477051, "global_step": 123304, "epoch": 2935} {"train_loss": -6.491433143615723, "global_step": 123305, "epoch": 2935} {"train_loss": -6.577699184417725, "global_step": 123306, "epoch": 2935} {"train_loss": -6.512796401977539, "global_step": 123307, "epoch": 2935} {"train_loss": -6.649199485778809, "global_step": 123308, "epoch": 2935} {"train_loss": -6.573431015014648, "global_step": 123309, "epoch": 2935} {"train_loss": -6.702231407165527, "global_step": 123310, "epoch": 2935} {"train_loss": -6.557847545260475, "global_step": 123311, "epoch": 2935, "val_loss": 68052.40625} {"train_loss": -6.614295959472656, "global_step": 123312, "epoch": 2936} {"train_loss": -6.628664016723633, "global_step": 123313, "epoch": 2936} {"train_loss": -6.594560623168945, "global_step": 123314, "epoch": 2936} {"train_loss": -6.544008255004883, "global_step": 123315, "epoch": 2936} {"train_loss": -6.548981189727783, "global_step": 123316, "epoch": 2936} {"train_loss": -6.486170291900635, "global_step": 123317, "epoch": 2936} {"train_loss": -6.484226703643799, "global_step": 123318, "epoch": 2936} {"train_loss": -6.522517204284668, "global_step": 123319, "epoch": 2936} {"train_loss": -6.688750267028809, "global_step": 123320, "epoch": 2936} {"train_loss": -6.470853328704834, "global_step": 123321, "epoch": 2936} {"train_loss": -6.560145854949951, "global_step": 123322, "epoch": 2936} {"train_loss": -6.536574363708496, "global_step": 123323, "epoch": 2936} {"train_loss": -6.5558319091796875, "global_step": 123324, "epoch": 2936} {"train_loss": -6.585124969482422, "global_step": 123325, "epoch": 2936} {"train_loss": -6.534689903259277, "global_step": 123326, "epoch": 2936} {"train_loss": -6.427713394165039, "global_step": 123327, "epoch": 2936} {"train_loss": -6.53925895690918, "global_step": 123328, "epoch": 2936} {"train_loss": -6.512598991394043, "global_step": 123329, "epoch": 2936} {"train_loss": -6.66535758972168, "global_step": 123330, "epoch": 2936} {"train_loss": -6.510884761810303, "global_step": 123331, "epoch": 2936} {"train_loss": -6.610550880432129, "global_step": 123332, "epoch": 2936} {"train_loss": -6.599849700927734, "global_step": 123333, "epoch": 2936} {"train_loss": -6.407968997955322, "global_step": 123334, "epoch": 2936} {"train_loss": -6.692946434020996, "global_step": 123335, "epoch": 2936} {"train_loss": -6.644805908203125, "global_step": 123336, "epoch": 2936} {"train_loss": -6.4514665603637695, "global_step": 123337, "epoch": 2936} {"train_loss": -6.6207451820373535, "global_step": 123338, "epoch": 2936} {"train_loss": -6.543132781982422, "global_step": 123339, "epoch": 2936} {"train_loss": -6.526910305023193, "global_step": 123340, "epoch": 2936} {"train_loss": -6.538628101348877, "global_step": 123341, "epoch": 2936} {"train_loss": -6.591243743896484, "global_step": 123342, "epoch": 2936} {"train_loss": -6.476441860198975, "global_step": 123343, "epoch": 2936} {"train_loss": -6.494535446166992, "global_step": 123344, "epoch": 2936} {"train_loss": -6.52577018737793, "global_step": 123345, "epoch": 2936} {"train_loss": -6.345850467681885, "global_step": 123346, "epoch": 2936} {"train_loss": -6.510941028594971, "global_step": 123347, "epoch": 2936} {"train_loss": -6.403560638427734, "global_step": 123348, "epoch": 2936} {"train_loss": -6.421733856201172, "global_step": 123349, "epoch": 2936} {"train_loss": -6.632768630981445, "global_step": 123350, "epoch": 2936} {"train_loss": -6.43031120300293, "global_step": 123351, "epoch": 2936} {"train_loss": -6.432050704956055, "global_step": 123352, "epoch": 2936} {"train_loss": -6.535592510586693, "global_step": 123353, "epoch": 2936, "val_loss": 68220.2421875} {"train_loss": -6.574172019958496, "global_step": 123354, "epoch": 2937} {"train_loss": -6.565514087677002, "global_step": 123355, "epoch": 2937} {"train_loss": -6.555628776550293, "global_step": 123356, "epoch": 2937} {"train_loss": -6.461338996887207, "global_step": 123357, "epoch": 2937} {"train_loss": -6.545907020568848, "global_step": 123358, "epoch": 2937} {"train_loss": -6.583737373352051, "global_step": 123359, "epoch": 2937} {"train_loss": -6.380337715148926, "global_step": 123360, "epoch": 2937} {"train_loss": -6.52508544921875, "global_step": 123361, "epoch": 2937} {"train_loss": -6.4518141746521, "global_step": 123362, "epoch": 2937} {"train_loss": -6.525843620300293, "global_step": 123363, "epoch": 2937} {"train_loss": -6.5997700691223145, "global_step": 123364, "epoch": 2937} {"train_loss": -6.593513488769531, "global_step": 123365, "epoch": 2937} {"train_loss": -6.632696151733398, "global_step": 123366, "epoch": 2937} {"train_loss": -6.556020736694336, "global_step": 123367, "epoch": 2937} {"train_loss": -6.513041973114014, "global_step": 123368, "epoch": 2937} {"train_loss": -6.676394462585449, "global_step": 123369, "epoch": 2937} {"train_loss": -6.536340713500977, "global_step": 123370, "epoch": 2937} {"train_loss": -6.6987833976745605, "global_step": 123371, "epoch": 2937} {"train_loss": -6.663790225982666, "global_step": 123372, "epoch": 2937} {"train_loss": -6.52314567565918, "global_step": 123373, "epoch": 2937} {"train_loss": -6.5345869064331055, "global_step": 123374, "epoch": 2937} {"train_loss": -6.4744110107421875, "global_step": 123375, "epoch": 2937} {"train_loss": -6.561193943023682, "global_step": 123376, "epoch": 2937} {"train_loss": -6.669867515563965, "global_step": 123377, "epoch": 2937} {"train_loss": -6.515420913696289, "global_step": 123378, "epoch": 2937} {"train_loss": -6.456308841705322, "global_step": 123379, "epoch": 2937} {"train_loss": -6.701104164123535, "global_step": 123380, "epoch": 2937} {"train_loss": -6.571444511413574, "global_step": 123381, "epoch": 2937} {"train_loss": -6.524996280670166, "global_step": 123382, "epoch": 2937} {"train_loss": -6.53754997253418, "global_step": 123383, "epoch": 2937} {"train_loss": -6.40537691116333, "global_step": 123384, "epoch": 2937} {"train_loss": -6.479769706726074, "global_step": 123385, "epoch": 2937} {"train_loss": -6.386013984680176, "global_step": 123386, "epoch": 2937} {"train_loss": -6.556911945343018, "global_step": 123387, "epoch": 2937} {"train_loss": -6.6197662353515625, "global_step": 123388, "epoch": 2937} {"train_loss": -6.50825834274292, "global_step": 123389, "epoch": 2937} {"train_loss": -6.548425674438477, "global_step": 123390, "epoch": 2937} {"train_loss": -6.360525131225586, "global_step": 123391, "epoch": 2937} {"train_loss": -6.611963748931885, "global_step": 123392, "epoch": 2937} {"train_loss": -6.375617027282715, "global_step": 123393, "epoch": 2937} {"train_loss": -6.539332866668701, "global_step": 123394, "epoch": 2937} {"train_loss": -6.538659890492757, "global_step": 123395, "epoch": 2937, "val_loss": 68168.9375} {"train_loss": -6.530681133270264, "global_step": 123396, "epoch": 2938} {"train_loss": -6.371982097625732, "global_step": 123397, "epoch": 2938} {"train_loss": -6.503899574279785, "global_step": 123398, "epoch": 2938} {"train_loss": -6.544677257537842, "global_step": 123399, "epoch": 2938} {"train_loss": -6.527963638305664, "global_step": 123400, "epoch": 2938} {"train_loss": -6.497142791748047, "global_step": 123401, "epoch": 2938} {"train_loss": -6.532886505126953, "global_step": 123402, "epoch": 2938} {"train_loss": -6.569856643676758, "global_step": 123403, "epoch": 2938} {"train_loss": -6.4811692237854, "global_step": 123404, "epoch": 2938} {"train_loss": -6.4989166259765625, "global_step": 123405, "epoch": 2938} {"train_loss": -6.518669605255127, "global_step": 123406, "epoch": 2938} {"train_loss": -6.487909317016602, "global_step": 123407, "epoch": 2938} {"train_loss": -6.461521625518799, "global_step": 123408, "epoch": 2938} {"train_loss": -6.494401931762695, "global_step": 123409, "epoch": 2938} {"train_loss": -6.611300468444824, "global_step": 123410, "epoch": 2938} {"train_loss": -6.637664318084717, "global_step": 123411, "epoch": 2938} {"train_loss": -6.646130561828613, "global_step": 123412, "epoch": 2938} {"train_loss": -6.47752571105957, "global_step": 123413, "epoch": 2938} {"train_loss": -6.465139389038086, "global_step": 123414, "epoch": 2938} {"train_loss": -6.540907382965088, "global_step": 123415, "epoch": 2938} {"train_loss": -6.6303558349609375, "global_step": 123416, "epoch": 2938} {"train_loss": -6.549120903015137, "global_step": 123417, "epoch": 2938} {"train_loss": -6.488577842712402, "global_step": 123418, "epoch": 2938} {"train_loss": -6.593453407287598, "global_step": 123419, "epoch": 2938} {"train_loss": -6.495652198791504, "global_step": 123420, "epoch": 2938} {"train_loss": -6.604764938354492, "global_step": 123421, "epoch": 2938} {"train_loss": -6.479099750518799, "global_step": 123422, "epoch": 2938} {"train_loss": -6.496044158935547, "global_step": 123423, "epoch": 2938} {"train_loss": -6.498552322387695, "global_step": 123424, "epoch": 2938} {"train_loss": -6.581353187561035, "global_step": 123425, "epoch": 2938} {"train_loss": -6.635837554931641, "global_step": 123426, "epoch": 2938} {"train_loss": -6.527087211608887, "global_step": 123427, "epoch": 2938} {"train_loss": -6.521120071411133, "global_step": 123428, "epoch": 2938} {"train_loss": -6.613212585449219, "global_step": 123429, "epoch": 2938} {"train_loss": -6.645866870880127, "global_step": 123430, "epoch": 2938} {"train_loss": -6.462595462799072, "global_step": 123431, "epoch": 2938} {"train_loss": -6.535572052001953, "global_step": 123432, "epoch": 2938} {"train_loss": -6.551606178283691, "global_step": 123433, "epoch": 2938} {"train_loss": -6.544900894165039, "global_step": 123434, "epoch": 2938} {"train_loss": -6.606266975402832, "global_step": 123435, "epoch": 2938} {"train_loss": -6.478925704956055, "global_step": 123436, "epoch": 2938} {"train_loss": -6.535421507699149, "global_step": 123437, "epoch": 2938, "val_loss": 67946.7265625} {"train_loss": -6.492543697357178, "global_step": 123438, "epoch": 2939} {"train_loss": -6.485689163208008, "global_step": 123439, "epoch": 2939} {"train_loss": -6.548842430114746, "global_step": 123440, "epoch": 2939} {"train_loss": -6.786279678344727, "global_step": 123441, "epoch": 2939} {"train_loss": -6.544896125793457, "global_step": 123442, "epoch": 2939} {"train_loss": -6.604650497436523, "global_step": 123443, "epoch": 2939} {"train_loss": -6.7277445793151855, "global_step": 123444, "epoch": 2939} {"train_loss": -6.522340774536133, "global_step": 123445, "epoch": 2939} {"train_loss": -6.64084529876709, "global_step": 123446, "epoch": 2939} {"train_loss": -6.5063066482543945, "global_step": 123447, "epoch": 2939} {"train_loss": -6.616204261779785, "global_step": 123448, "epoch": 2939} {"train_loss": -6.55332088470459, "global_step": 123449, "epoch": 2939} {"train_loss": -6.704651832580566, "global_step": 123450, "epoch": 2939} {"train_loss": -6.545720100402832, "global_step": 123451, "epoch": 2939} {"train_loss": -6.6697893142700195, "global_step": 123452, "epoch": 2939} {"train_loss": -6.664546489715576, "global_step": 123453, "epoch": 2939} {"train_loss": -6.542994499206543, "global_step": 123454, "epoch": 2939} {"train_loss": -6.569550514221191, "global_step": 123455, "epoch": 2939} {"train_loss": -6.60147762298584, "global_step": 123456, "epoch": 2939} {"train_loss": -6.689613342285156, "global_step": 123457, "epoch": 2939} {"train_loss": -6.678694725036621, "global_step": 123458, "epoch": 2939} {"train_loss": -6.6007819175720215, "global_step": 123459, "epoch": 2939} {"train_loss": -6.686979293823242, "global_step": 123460, "epoch": 2939} {"train_loss": -6.819869041442871, "global_step": 123461, "epoch": 2939} {"train_loss": -6.652551651000977, "global_step": 123462, "epoch": 2939} {"train_loss": -6.568190574645996, "global_step": 123463, "epoch": 2939} {"train_loss": -6.626280784606934, "global_step": 123464, "epoch": 2939} {"train_loss": -6.630916595458984, "global_step": 123465, "epoch": 2939} {"train_loss": -6.684103012084961, "global_step": 123466, "epoch": 2939} {"train_loss": -6.556034088134766, "global_step": 123467, "epoch": 2939} {"train_loss": -6.555693626403809, "global_step": 123468, "epoch": 2939} {"train_loss": -6.508908271789551, "global_step": 123469, "epoch": 2939} {"train_loss": -6.666167259216309, "global_step": 123470, "epoch": 2939} {"train_loss": -6.720186233520508, "global_step": 123471, "epoch": 2939} {"train_loss": -6.593137741088867, "global_step": 123472, "epoch": 2939} {"train_loss": -6.6024065017700195, "global_step": 123473, "epoch": 2939} {"train_loss": -6.590480804443359, "global_step": 123474, "epoch": 2939} {"train_loss": -6.579148292541504, "global_step": 123475, "epoch": 2939} {"train_loss": -6.660881042480469, "global_step": 123476, "epoch": 2939} {"train_loss": -6.603208065032959, "global_step": 123477, "epoch": 2939} {"train_loss": -6.5106048583984375, "global_step": 123478, "epoch": 2939} {"train_loss": -6.612451678230649, "global_step": 123479, "epoch": 2939, "val_loss": 68113.96875} {"train_loss": -6.569851875305176, "global_step": 123480, "epoch": 2940} {"train_loss": -6.576664924621582, "global_step": 123481, "epoch": 2940} {"train_loss": -6.646794319152832, "global_step": 123482, "epoch": 2940} {"train_loss": -6.632671356201172, "global_step": 123483, "epoch": 2940} {"train_loss": -6.601892471313477, "global_step": 123484, "epoch": 2940} {"train_loss": -6.470796585083008, "global_step": 123485, "epoch": 2940} {"train_loss": -6.46628999710083, "global_step": 123486, "epoch": 2940} {"train_loss": -6.620352745056152, "global_step": 123487, "epoch": 2940} {"train_loss": -6.511693954467773, "global_step": 123488, "epoch": 2940} {"train_loss": -6.60135555267334, "global_step": 123489, "epoch": 2940} {"train_loss": -6.635584831237793, "global_step": 123490, "epoch": 2940} {"train_loss": -6.532505035400391, "global_step": 123491, "epoch": 2940} {"train_loss": -6.548341751098633, "global_step": 123492, "epoch": 2940} {"train_loss": -6.54020357131958, "global_step": 123493, "epoch": 2940} {"train_loss": -6.491833209991455, "global_step": 123494, "epoch": 2940} {"train_loss": -6.660561561584473, "global_step": 123495, "epoch": 2940} {"train_loss": -6.605921745300293, "global_step": 123496, "epoch": 2940} {"train_loss": -6.574748992919922, "global_step": 123497, "epoch": 2940} {"train_loss": -6.566384315490723, "global_step": 123498, "epoch": 2940} {"train_loss": -6.422396183013916, "global_step": 123499, "epoch": 2940} {"train_loss": -6.534017086029053, "global_step": 123500, "epoch": 2940} {"train_loss": -6.565802097320557, "global_step": 123501, "epoch": 2940} {"train_loss": -6.647195339202881, "global_step": 123502, "epoch": 2940} {"train_loss": -6.539522647857666, "global_step": 123503, "epoch": 2940} {"train_loss": -6.541536331176758, "global_step": 123504, "epoch": 2940} {"train_loss": -6.567788124084473, "global_step": 123505, "epoch": 2940} {"train_loss": -6.54369592666626, "global_step": 123506, "epoch": 2940} {"train_loss": -6.533422470092773, "global_step": 123507, "epoch": 2940} {"train_loss": -6.5950164794921875, "global_step": 123508, "epoch": 2940} {"train_loss": -6.538747787475586, "global_step": 123509, "epoch": 2940} {"train_loss": -6.492588996887207, "global_step": 123510, "epoch": 2940} {"train_loss": -6.609478950500488, "global_step": 123511, "epoch": 2940} {"train_loss": -6.629570960998535, "global_step": 123512, "epoch": 2940} {"train_loss": -6.505105018615723, "global_step": 123513, "epoch": 2940} {"train_loss": -6.6591596603393555, "global_step": 123514, "epoch": 2940} {"train_loss": -6.590825080871582, "global_step": 123515, "epoch": 2940} {"train_loss": -6.522940635681152, "global_step": 123516, "epoch": 2940} {"train_loss": -6.592410087585449, "global_step": 123517, "epoch": 2940} {"train_loss": -6.5845746994018555, "global_step": 123518, "epoch": 2940} {"train_loss": -6.577935218811035, "global_step": 123519, "epoch": 2940} {"train_loss": -6.493762016296387, "global_step": 123520, "epoch": 2940} {"train_loss": -6.565916981015887, "global_step": 123521, "epoch": 2940, "val_loss": 67938.9375} {"train_loss": -6.581470489501953, "global_step": 123522, "epoch": 2941} {"train_loss": -6.513120174407959, "global_step": 123523, "epoch": 2941} {"train_loss": -6.565023422241211, "global_step": 123524, "epoch": 2941} {"train_loss": -6.671489238739014, "global_step": 123525, "epoch": 2941} {"train_loss": -6.541949272155762, "global_step": 123526, "epoch": 2941} {"train_loss": -6.575830459594727, "global_step": 123527, "epoch": 2941} {"train_loss": -6.634784698486328, "global_step": 123528, "epoch": 2941} {"train_loss": -6.575268268585205, "global_step": 123529, "epoch": 2941} {"train_loss": -6.623356819152832, "global_step": 123530, "epoch": 2941} {"train_loss": -6.599368095397949, "global_step": 123531, "epoch": 2941} {"train_loss": -6.493539810180664, "global_step": 123532, "epoch": 2941} {"train_loss": -6.500721454620361, "global_step": 123533, "epoch": 2941} {"train_loss": -6.4336700439453125, "global_step": 123534, "epoch": 2941} {"train_loss": -6.52517032623291, "global_step": 123535, "epoch": 2941} {"train_loss": -6.495394229888916, "global_step": 123536, "epoch": 2941} {"train_loss": -6.573808193206787, "global_step": 123537, "epoch": 2941} {"train_loss": -6.581676483154297, "global_step": 123538, "epoch": 2941} {"train_loss": -6.53965425491333, "global_step": 123539, "epoch": 2941} {"train_loss": -6.640571594238281, "global_step": 123540, "epoch": 2941} {"train_loss": -6.558796405792236, "global_step": 123541, "epoch": 2941} {"train_loss": -6.529458045959473, "global_step": 123542, "epoch": 2941} {"train_loss": -6.624113082885742, "global_step": 123543, "epoch": 2941} {"train_loss": -6.445334434509277, "global_step": 123544, "epoch": 2941} {"train_loss": -6.585697174072266, "global_step": 123545, "epoch": 2941} {"train_loss": -6.718184471130371, "global_step": 123546, "epoch": 2941} {"train_loss": -6.514177322387695, "global_step": 123547, "epoch": 2941} {"train_loss": -6.602393627166748, "global_step": 123548, "epoch": 2941} {"train_loss": -6.611996173858643, "global_step": 123549, "epoch": 2941} {"train_loss": -6.528234481811523, "global_step": 123550, "epoch": 2941} {"train_loss": -6.596061706542969, "global_step": 123551, "epoch": 2941} {"train_loss": -6.593487739562988, "global_step": 123552, "epoch": 2941} {"train_loss": -6.492454528808594, "global_step": 123553, "epoch": 2941} {"train_loss": -6.692065715789795, "global_step": 123554, "epoch": 2941} {"train_loss": -6.637177467346191, "global_step": 123555, "epoch": 2941} {"train_loss": -6.565561294555664, "global_step": 123556, "epoch": 2941} {"train_loss": -6.469111442565918, "global_step": 123557, "epoch": 2941} {"train_loss": -6.4997053146362305, "global_step": 123558, "epoch": 2941} {"train_loss": -6.673090934753418, "global_step": 123559, "epoch": 2941} {"train_loss": -6.576974868774414, "global_step": 123560, "epoch": 2941} {"train_loss": -6.640089511871338, "global_step": 123561, "epoch": 2941} {"train_loss": -6.56696891784668, "global_step": 123562, "epoch": 2941} {"train_loss": -6.570398364748273, "global_step": 123563, "epoch": 2941, "val_loss": 67932.0390625} {"train_loss": -6.5606889724731445, "global_step": 123564, "epoch": 2942} {"train_loss": -6.523962020874023, "global_step": 123565, "epoch": 2942} {"train_loss": -6.624713897705078, "global_step": 123566, "epoch": 2942} {"train_loss": -6.556814193725586, "global_step": 123567, "epoch": 2942} {"train_loss": -6.612703323364258, "global_step": 123568, "epoch": 2942} {"train_loss": -6.602994918823242, "global_step": 123569, "epoch": 2942} {"train_loss": -6.575720310211182, "global_step": 123570, "epoch": 2942} {"train_loss": -6.62960147857666, "global_step": 123571, "epoch": 2942} {"train_loss": -6.46626091003418, "global_step": 123572, "epoch": 2942} {"train_loss": -6.516297340393066, "global_step": 123573, "epoch": 2942} {"train_loss": -6.569313049316406, "global_step": 123574, "epoch": 2942} {"train_loss": -6.576343536376953, "global_step": 123575, "epoch": 2942} {"train_loss": -6.640158653259277, "global_step": 123576, "epoch": 2942} {"train_loss": -6.6258544921875, "global_step": 123577, "epoch": 2942} {"train_loss": -6.470724582672119, "global_step": 123578, "epoch": 2942} {"train_loss": -6.491021156311035, "global_step": 123579, "epoch": 2942} {"train_loss": -6.39284610748291, "global_step": 123580, "epoch": 2942} {"train_loss": -6.438962936401367, "global_step": 123581, "epoch": 2942} {"train_loss": -6.6787309646606445, "global_step": 123582, "epoch": 2942} {"train_loss": -6.4092607498168945, "global_step": 123583, "epoch": 2942} {"train_loss": -6.646914005279541, "global_step": 123584, "epoch": 2942} {"train_loss": -6.551452159881592, "global_step": 123585, "epoch": 2942} {"train_loss": -6.585824012756348, "global_step": 123586, "epoch": 2942} {"train_loss": -6.571088790893555, "global_step": 123587, "epoch": 2942} {"train_loss": -6.447063446044922, "global_step": 123588, "epoch": 2942} {"train_loss": -6.511351585388184, "global_step": 123589, "epoch": 2942} {"train_loss": -6.517312049865723, "global_step": 123590, "epoch": 2942} {"train_loss": -6.492801666259766, "global_step": 123591, "epoch": 2942} {"train_loss": -6.618536949157715, "global_step": 123592, "epoch": 2942} {"train_loss": -6.478371620178223, "global_step": 123593, "epoch": 2942} {"train_loss": -6.5702223777771, "global_step": 123594, "epoch": 2942} {"train_loss": -6.545261383056641, "global_step": 123595, "epoch": 2942} {"train_loss": -6.470877647399902, "global_step": 123596, "epoch": 2942} {"train_loss": -6.551165580749512, "global_step": 123597, "epoch": 2942} {"train_loss": -6.718271255493164, "global_step": 123598, "epoch": 2942} {"train_loss": -6.579855442047119, "global_step": 123599, "epoch": 2942} {"train_loss": -6.658114433288574, "global_step": 123600, "epoch": 2942} {"train_loss": -6.627337455749512, "global_step": 123601, "epoch": 2942} {"train_loss": -6.5901408195495605, "global_step": 123602, "epoch": 2942} {"train_loss": -6.5499372482299805, "global_step": 123603, "epoch": 2942} {"train_loss": -6.522471904754639, "global_step": 123604, "epoch": 2942} {"train_loss": -6.55717438743228, "global_step": 123605, "epoch": 2942, "val_loss": 68088.171875} {"train_loss": -6.640730857849121, "global_step": 123606, "epoch": 2943} {"train_loss": -6.5602312088012695, "global_step": 123607, "epoch": 2943} {"train_loss": -6.581592082977295, "global_step": 123608, "epoch": 2943} {"train_loss": -6.62662935256958, "global_step": 123609, "epoch": 2943} {"train_loss": -6.591418266296387, "global_step": 123610, "epoch": 2943} {"train_loss": -6.611611843109131, "global_step": 123611, "epoch": 2943} {"train_loss": -6.609262943267822, "global_step": 123612, "epoch": 2943} {"train_loss": -6.651061058044434, "global_step": 123613, "epoch": 2943} {"train_loss": -6.576615333557129, "global_step": 123614, "epoch": 2943} {"train_loss": -6.647982597351074, "global_step": 123615, "epoch": 2943} {"train_loss": -6.556558609008789, "global_step": 123616, "epoch": 2943} {"train_loss": -6.589393138885498, "global_step": 123617, "epoch": 2943} {"train_loss": -6.701796531677246, "global_step": 123618, "epoch": 2943} {"train_loss": -6.588457107543945, "global_step": 123619, "epoch": 2943} {"train_loss": -6.57102632522583, "global_step": 123620, "epoch": 2943} {"train_loss": -6.594561576843262, "global_step": 123621, "epoch": 2943} {"train_loss": -6.600865364074707, "global_step": 123622, "epoch": 2943} {"train_loss": -6.566377639770508, "global_step": 123623, "epoch": 2943} {"train_loss": -6.555673122406006, "global_step": 123624, "epoch": 2943} {"train_loss": -6.585453033447266, "global_step": 123625, "epoch": 2943} {"train_loss": -6.6123504638671875, "global_step": 123626, "epoch": 2943} {"train_loss": -6.607753753662109, "global_step": 123627, "epoch": 2943} {"train_loss": -6.4144673347473145, "global_step": 123628, "epoch": 2943} {"train_loss": -6.5070881843566895, "global_step": 123629, "epoch": 2943} {"train_loss": -6.5438103675842285, "global_step": 123630, "epoch": 2943} {"train_loss": -6.523157119750977, "global_step": 123631, "epoch": 2943} {"train_loss": -6.50543737411499, "global_step": 123632, "epoch": 2943} {"train_loss": -6.601447105407715, "global_step": 123633, "epoch": 2943} {"train_loss": -6.552660942077637, "global_step": 123634, "epoch": 2943} {"train_loss": -6.671828269958496, "global_step": 123635, "epoch": 2943} {"train_loss": -6.546026229858398, "global_step": 123636, "epoch": 2943} {"train_loss": -6.500316619873047, "global_step": 123637, "epoch": 2943} {"train_loss": -6.608150959014893, "global_step": 123638, "epoch": 2943} {"train_loss": -6.545657157897949, "global_step": 123639, "epoch": 2943} {"train_loss": -6.569072723388672, "global_step": 123640, "epoch": 2943} {"train_loss": -6.635859966278076, "global_step": 123641, "epoch": 2943} {"train_loss": -6.565796852111816, "global_step": 123642, "epoch": 2943} {"train_loss": -6.591740608215332, "global_step": 123643, "epoch": 2943} {"train_loss": -6.451512813568115, "global_step": 123644, "epoch": 2943} {"train_loss": -6.574399471282959, "global_step": 123645, "epoch": 2943} {"train_loss": -6.601737022399902, "global_step": 123646, "epoch": 2943} {"train_loss": -6.578561044874645, "global_step": 123647, "epoch": 2943, "val_loss": 67943.21875} {"train_loss": -6.649066925048828, "global_step": 123648, "epoch": 2944} {"train_loss": -6.673092365264893, "global_step": 123649, "epoch": 2944} {"train_loss": -6.617412090301514, "global_step": 123650, "epoch": 2944} {"train_loss": -6.635851860046387, "global_step": 123651, "epoch": 2944} {"train_loss": -6.643345832824707, "global_step": 123652, "epoch": 2944} {"train_loss": -6.651858329772949, "global_step": 123653, "epoch": 2944} {"train_loss": -6.514828681945801, "global_step": 123654, "epoch": 2944} {"train_loss": -6.457097053527832, "global_step": 123655, "epoch": 2944} {"train_loss": -6.667635917663574, "global_step": 123656, "epoch": 2944} {"train_loss": -6.643599033355713, "global_step": 123657, "epoch": 2944} {"train_loss": -6.5787200927734375, "global_step": 123658, "epoch": 2944} {"train_loss": -6.596629619598389, "global_step": 123659, "epoch": 2944} {"train_loss": -6.551640510559082, "global_step": 123660, "epoch": 2944} {"train_loss": -6.572266578674316, "global_step": 123661, "epoch": 2944} {"train_loss": -6.553099155426025, "global_step": 123662, "epoch": 2944} {"train_loss": -6.568580627441406, "global_step": 123663, "epoch": 2944} {"train_loss": -6.700550079345703, "global_step": 123664, "epoch": 2944} {"train_loss": -6.696910858154297, "global_step": 123665, "epoch": 2944} {"train_loss": -6.5284743309021, "global_step": 123666, "epoch": 2944} {"train_loss": -6.605385780334473, "global_step": 123667, "epoch": 2944} {"train_loss": -6.594167709350586, "global_step": 123668, "epoch": 2944} {"train_loss": -6.621549606323242, "global_step": 123669, "epoch": 2944} {"train_loss": -6.557640075683594, "global_step": 123670, "epoch": 2944} {"train_loss": -6.60827112197876, "global_step": 123671, "epoch": 2944} {"train_loss": -6.554080009460449, "global_step": 123672, "epoch": 2944} {"train_loss": -6.610927104949951, "global_step": 123673, "epoch": 2944} {"train_loss": -6.493244171142578, "global_step": 123674, "epoch": 2944} {"train_loss": -6.587738037109375, "global_step": 123675, "epoch": 2944} {"train_loss": -6.591526985168457, "global_step": 123676, "epoch": 2944} {"train_loss": -6.618488788604736, "global_step": 123677, "epoch": 2944} {"train_loss": -6.575284481048584, "global_step": 123678, "epoch": 2944} {"train_loss": -6.381953716278076, "global_step": 123679, "epoch": 2944} {"train_loss": -6.587606906890869, "global_step": 123680, "epoch": 2944} {"train_loss": -6.545843124389648, "global_step": 123681, "epoch": 2944} {"train_loss": -6.569144248962402, "global_step": 123682, "epoch": 2944} {"train_loss": -6.489055633544922, "global_step": 123683, "epoch": 2944} {"train_loss": -6.443678855895996, "global_step": 123684, "epoch": 2944} {"train_loss": -6.47506856918335, "global_step": 123685, "epoch": 2944} {"train_loss": -6.554022789001465, "global_step": 123686, "epoch": 2944} {"train_loss": -6.449864864349365, "global_step": 123687, "epoch": 2944} {"train_loss": -6.457270622253418, "global_step": 123688, "epoch": 2944} {"train_loss": -6.567995309829712, "global_step": 123689, "epoch": 2944, "val_loss": 68047.2578125} {"train_loss": -6.514686584472656, "global_step": 123690, "epoch": 2945} {"train_loss": -6.527706146240234, "global_step": 123691, "epoch": 2945} {"train_loss": -6.461350440979004, "global_step": 123692, "epoch": 2945} {"train_loss": -6.59481143951416, "global_step": 123693, "epoch": 2945} {"train_loss": -6.3607378005981445, "global_step": 123694, "epoch": 2945} {"train_loss": -6.444689750671387, "global_step": 123695, "epoch": 2945} {"train_loss": -6.474606513977051, "global_step": 123696, "epoch": 2945} {"train_loss": -6.513326644897461, "global_step": 123697, "epoch": 2945} {"train_loss": -6.436633586883545, "global_step": 123698, "epoch": 2945} {"train_loss": -6.4264984130859375, "global_step": 123699, "epoch": 2945} {"train_loss": -6.625679969787598, "global_step": 123700, "epoch": 2945} {"train_loss": -6.514492034912109, "global_step": 123701, "epoch": 2945} {"train_loss": -6.58062744140625, "global_step": 123702, "epoch": 2945} {"train_loss": -6.566632270812988, "global_step": 123703, "epoch": 2945} {"train_loss": -6.600201606750488, "global_step": 123704, "epoch": 2945} {"train_loss": -6.547863960266113, "global_step": 123705, "epoch": 2945} {"train_loss": -6.539039611816406, "global_step": 123706, "epoch": 2945} {"train_loss": -6.603071212768555, "global_step": 123707, "epoch": 2945} {"train_loss": -6.512762069702148, "global_step": 123708, "epoch": 2945} {"train_loss": -6.500215530395508, "global_step": 123709, "epoch": 2945} {"train_loss": -6.614264011383057, "global_step": 123710, "epoch": 2945} {"train_loss": -6.521037578582764, "global_step": 123711, "epoch": 2945} {"train_loss": -6.533193111419678, "global_step": 123712, "epoch": 2945} {"train_loss": -6.52103328704834, "global_step": 123713, "epoch": 2945} {"train_loss": -6.497775077819824, "global_step": 123714, "epoch": 2945} {"train_loss": -6.685541152954102, "global_step": 123715, "epoch": 2945} {"train_loss": -6.499213218688965, "global_step": 123716, "epoch": 2945} {"train_loss": -6.540802478790283, "global_step": 123717, "epoch": 2945} {"train_loss": -6.581439971923828, "global_step": 123718, "epoch": 2945} {"train_loss": -6.551796913146973, "global_step": 123719, "epoch": 2945} {"train_loss": -6.589954853057861, "global_step": 123720, "epoch": 2945} {"train_loss": -6.552586555480957, "global_step": 123721, "epoch": 2945} {"train_loss": -6.665554523468018, "global_step": 123722, "epoch": 2945} {"train_loss": -6.484911918640137, "global_step": 123723, "epoch": 2945} {"train_loss": -6.4900312423706055, "global_step": 123724, "epoch": 2945} {"train_loss": -6.574843406677246, "global_step": 123725, "epoch": 2945} {"train_loss": -6.563214302062988, "global_step": 123726, "epoch": 2945} {"train_loss": -6.577702522277832, "global_step": 123727, "epoch": 2945} {"train_loss": -6.554594039916992, "global_step": 123728, "epoch": 2945} {"train_loss": -6.679961204528809, "global_step": 123729, "epoch": 2945} {"train_loss": -6.637604236602783, "global_step": 123730, "epoch": 2945} {"train_loss": -6.5446933678218295, "global_step": 123731, "epoch": 2945, "val_loss": 68048.5546875} {"train_loss": -6.534152984619141, "global_step": 123732, "epoch": 2946} {"train_loss": -6.668578147888184, "global_step": 123733, "epoch": 2946} {"train_loss": -6.480085372924805, "global_step": 123734, "epoch": 2946} {"train_loss": -6.6498212814331055, "global_step": 123735, "epoch": 2946} {"train_loss": -6.561254024505615, "global_step": 123736, "epoch": 2946} {"train_loss": -6.678809642791748, "global_step": 123737, "epoch": 2946} {"train_loss": -6.706326484680176, "global_step": 123738, "epoch": 2946} {"train_loss": -6.550656795501709, "global_step": 123739, "epoch": 2946} {"train_loss": -6.614541053771973, "global_step": 123740, "epoch": 2946} {"train_loss": -6.6724324226379395, "global_step": 123741, "epoch": 2946} {"train_loss": -6.5133514404296875, "global_step": 123742, "epoch": 2946} {"train_loss": -6.569807529449463, "global_step": 123743, "epoch": 2946} {"train_loss": -6.695377349853516, "global_step": 123744, "epoch": 2946} {"train_loss": -6.657702445983887, "global_step": 123745, "epoch": 2946} {"train_loss": -6.664615631103516, "global_step": 123746, "epoch": 2946} {"train_loss": -6.679943561553955, "global_step": 123747, "epoch": 2946} {"train_loss": -6.670111656188965, "global_step": 123748, "epoch": 2946} {"train_loss": -6.568605422973633, "global_step": 123749, "epoch": 2946} {"train_loss": -6.49137020111084, "global_step": 123750, "epoch": 2946} {"train_loss": -6.550375938415527, "global_step": 123751, "epoch": 2946} {"train_loss": -6.5185160636901855, "global_step": 123752, "epoch": 2946} {"train_loss": -6.509488582611084, "global_step": 123753, "epoch": 2946} {"train_loss": -6.5514936447143555, "global_step": 123754, "epoch": 2946} {"train_loss": -6.536337852478027, "global_step": 123755, "epoch": 2946} {"train_loss": -6.555891513824463, "global_step": 123756, "epoch": 2946} {"train_loss": -6.5237884521484375, "global_step": 123757, "epoch": 2946} {"train_loss": -6.511542320251465, "global_step": 123758, "epoch": 2946} {"train_loss": -6.519525527954102, "global_step": 123759, "epoch": 2946} {"train_loss": -6.492031097412109, "global_step": 123760, "epoch": 2946} {"train_loss": -6.520650863647461, "global_step": 123761, "epoch": 2946} {"train_loss": -6.546175003051758, "global_step": 123762, "epoch": 2946} {"train_loss": -6.526608467102051, "global_step": 123763, "epoch": 2946} {"train_loss": -6.444294452667236, "global_step": 123764, "epoch": 2946} {"train_loss": -6.445672988891602, "global_step": 123765, "epoch": 2946} {"train_loss": -6.510899066925049, "global_step": 123766, "epoch": 2946} {"train_loss": -6.510387897491455, "global_step": 123767, "epoch": 2946} {"train_loss": -6.484475135803223, "global_step": 123768, "epoch": 2946} {"train_loss": -6.489879608154297, "global_step": 123769, "epoch": 2946} {"train_loss": -6.5308661460876465, "global_step": 123770, "epoch": 2946} {"train_loss": -6.4620361328125, "global_step": 123771, "epoch": 2946} {"train_loss": -6.576862335205078, "global_step": 123772, "epoch": 2946} {"train_loss": -6.560492640449887, "global_step": 123773, "epoch": 2946, "val_loss": 68231.8046875} {"train_loss": -6.524958610534668, "global_step": 123774, "epoch": 2947} {"train_loss": -6.557107448577881, "global_step": 123775, "epoch": 2947} {"train_loss": -6.538601398468018, "global_step": 123776, "epoch": 2947} {"train_loss": -6.578887939453125, "global_step": 123777, "epoch": 2947} {"train_loss": -6.560398101806641, "global_step": 123778, "epoch": 2947} {"train_loss": -6.536489486694336, "global_step": 123779, "epoch": 2947} {"train_loss": -6.588822364807129, "global_step": 123780, "epoch": 2947} {"train_loss": -6.401535987854004, "global_step": 123781, "epoch": 2947} {"train_loss": -6.419756889343262, "global_step": 123782, "epoch": 2947} {"train_loss": -6.441368103027344, "global_step": 123783, "epoch": 2947} {"train_loss": -6.471091270446777, "global_step": 123784, "epoch": 2947} {"train_loss": -6.63400936126709, "global_step": 123785, "epoch": 2947} {"train_loss": -6.553765296936035, "global_step": 123786, "epoch": 2947} {"train_loss": -6.596388816833496, "global_step": 123787, "epoch": 2947} {"train_loss": -6.588650703430176, "global_step": 123788, "epoch": 2947} {"train_loss": -6.572237968444824, "global_step": 123789, "epoch": 2947} {"train_loss": -6.652519226074219, "global_step": 123790, "epoch": 2947} {"train_loss": -6.634679794311523, "global_step": 123791, "epoch": 2947} {"train_loss": -6.650423049926758, "global_step": 123792, "epoch": 2947} {"train_loss": -6.724454879760742, "global_step": 123793, "epoch": 2947} {"train_loss": -6.574829578399658, "global_step": 123794, "epoch": 2947} {"train_loss": -6.731616973876953, "global_step": 123795, "epoch": 2947} {"train_loss": -6.550310134887695, "global_step": 123796, "epoch": 2947} {"train_loss": -6.564375877380371, "global_step": 123797, "epoch": 2947} {"train_loss": -6.498757839202881, "global_step": 123798, "epoch": 2947} {"train_loss": -6.555657386779785, "global_step": 123799, "epoch": 2947} {"train_loss": -6.6537580490112305, "global_step": 123800, "epoch": 2947} {"train_loss": -6.459160804748535, "global_step": 123801, "epoch": 2947} {"train_loss": -6.512433052062988, "global_step": 123802, "epoch": 2947} {"train_loss": -6.650723934173584, "global_step": 123803, "epoch": 2947} {"train_loss": -6.4077372550964355, "global_step": 123804, "epoch": 2947} {"train_loss": -6.544345855712891, "global_step": 123805, "epoch": 2947} {"train_loss": -6.567575931549072, "global_step": 123806, "epoch": 2947} {"train_loss": -6.549341678619385, "global_step": 123807, "epoch": 2947} {"train_loss": -6.574592590332031, "global_step": 123808, "epoch": 2947} {"train_loss": -6.594856262207031, "global_step": 123809, "epoch": 2947} {"train_loss": -6.599796295166016, "global_step": 123810, "epoch": 2947} {"train_loss": -6.50961971282959, "global_step": 123811, "epoch": 2947} {"train_loss": -6.595956325531006, "global_step": 123812, "epoch": 2947} {"train_loss": -6.479998588562012, "global_step": 123813, "epoch": 2947} {"train_loss": -6.585638999938965, "global_step": 123814, "epoch": 2947} {"train_loss": -6.559646878923688, "global_step": 123815, "epoch": 2947, "val_loss": 68129.421875} {"train_loss": -6.522984504699707, "global_step": 123816, "epoch": 2948} {"train_loss": -6.53362512588501, "global_step": 123817, "epoch": 2948} {"train_loss": -6.6575469970703125, "global_step": 123818, "epoch": 2948} {"train_loss": -6.649988174438477, "global_step": 123819, "epoch": 2948} {"train_loss": -6.667125225067139, "global_step": 123820, "epoch": 2948} {"train_loss": -6.6209330558776855, "global_step": 123821, "epoch": 2948} {"train_loss": -6.6158294677734375, "global_step": 123822, "epoch": 2948} {"train_loss": -6.54586124420166, "global_step": 123823, "epoch": 2948} {"train_loss": -6.531110763549805, "global_step": 123824, "epoch": 2948} {"train_loss": -6.558876991271973, "global_step": 123825, "epoch": 2948} {"train_loss": -6.575989723205566, "global_step": 123826, "epoch": 2948} {"train_loss": -6.504135608673096, "global_step": 123827, "epoch": 2948} {"train_loss": -6.556647300720215, "global_step": 123828, "epoch": 2948} {"train_loss": -6.491818428039551, "global_step": 123829, "epoch": 2948} {"train_loss": -6.585789680480957, "global_step": 123830, "epoch": 2948} {"train_loss": -6.488755226135254, "global_step": 123831, "epoch": 2948} {"train_loss": -6.559086799621582, "global_step": 123832, "epoch": 2948} {"train_loss": -6.641249656677246, "global_step": 123833, "epoch": 2948} {"train_loss": -6.573458671569824, "global_step": 123834, "epoch": 2948} {"train_loss": -6.603965759277344, "global_step": 123835, "epoch": 2948} {"train_loss": -6.503452301025391, "global_step": 123836, "epoch": 2948} {"train_loss": -6.654265403747559, "global_step": 123837, "epoch": 2948} {"train_loss": -6.539076328277588, "global_step": 123838, "epoch": 2948} {"train_loss": -6.580896854400635, "global_step": 123839, "epoch": 2948} {"train_loss": -6.5133957862854, "global_step": 123840, "epoch": 2948} {"train_loss": -6.601064682006836, "global_step": 123841, "epoch": 2948} {"train_loss": -6.4974164962768555, "global_step": 123842, "epoch": 2948} {"train_loss": -6.567165374755859, "global_step": 123843, "epoch": 2948} {"train_loss": -6.4417572021484375, "global_step": 123844, "epoch": 2948} {"train_loss": -6.571603298187256, "global_step": 123845, "epoch": 2948} {"train_loss": -6.492873191833496, "global_step": 123846, "epoch": 2948} {"train_loss": -6.531733989715576, "global_step": 123847, "epoch": 2948} {"train_loss": -6.487679481506348, "global_step": 123848, "epoch": 2948} {"train_loss": -6.594222545623779, "global_step": 123849, "epoch": 2948} {"train_loss": -6.572648048400879, "global_step": 123850, "epoch": 2948} {"train_loss": -6.509599685668945, "global_step": 123851, "epoch": 2948} {"train_loss": -6.652811527252197, "global_step": 123852, "epoch": 2948} {"train_loss": -6.542994976043701, "global_step": 123853, "epoch": 2948} {"train_loss": -6.617640495300293, "global_step": 123854, "epoch": 2948} {"train_loss": -6.712337493896484, "global_step": 123855, "epoch": 2948} {"train_loss": -6.407094955444336, "global_step": 123856, "epoch": 2948} {"train_loss": -6.563580706006005, "global_step": 123857, "epoch": 2948, "val_loss": 68068.875} {"train_loss": -6.572361469268799, "global_step": 123858, "epoch": 2949} {"train_loss": -6.5, "global_step": 123859, "epoch": 2949} {"train_loss": -6.6394829750061035, "global_step": 123860, "epoch": 2949} {"train_loss": -6.604347229003906, "global_step": 123861, "epoch": 2949} {"train_loss": -6.523996829986572, "global_step": 123862, "epoch": 2949} {"train_loss": -6.607206344604492, "global_step": 123863, "epoch": 2949} {"train_loss": -6.584151268005371, "global_step": 123864, "epoch": 2949} {"train_loss": -6.495250225067139, "global_step": 123865, "epoch": 2949} {"train_loss": -6.548027992248535, "global_step": 123866, "epoch": 2949} {"train_loss": -6.634251594543457, "global_step": 123867, "epoch": 2949} {"train_loss": -6.574488162994385, "global_step": 123868, "epoch": 2949} {"train_loss": -6.613457679748535, "global_step": 123869, "epoch": 2949} {"train_loss": -6.654199123382568, "global_step": 123870, "epoch": 2949} {"train_loss": -6.538909435272217, "global_step": 123871, "epoch": 2949} {"train_loss": -6.626985549926758, "global_step": 123872, "epoch": 2949} {"train_loss": -6.536418914794922, "global_step": 123873, "epoch": 2949} {"train_loss": -6.56768798828125, "global_step": 123874, "epoch": 2949} {"train_loss": -6.569403648376465, "global_step": 123875, "epoch": 2949} {"train_loss": -6.549171447753906, "global_step": 123876, "epoch": 2949} {"train_loss": -6.61737585067749, "global_step": 123877, "epoch": 2949} {"train_loss": -6.52241325378418, "global_step": 123878, "epoch": 2949} {"train_loss": -6.570434093475342, "global_step": 123879, "epoch": 2949} {"train_loss": -6.585233688354492, "global_step": 123880, "epoch": 2949} {"train_loss": -6.555974006652832, "global_step": 123881, "epoch": 2949} {"train_loss": -6.5528564453125, "global_step": 123882, "epoch": 2949} {"train_loss": -6.638247489929199, "global_step": 123883, "epoch": 2949} {"train_loss": -6.618619918823242, "global_step": 123884, "epoch": 2949} {"train_loss": -6.685773849487305, "global_step": 123885, "epoch": 2949} {"train_loss": -6.582120895385742, "global_step": 123886, "epoch": 2949} {"train_loss": -6.541563510894775, "global_step": 123887, "epoch": 2949} {"train_loss": -6.554744720458984, "global_step": 123888, "epoch": 2949} {"train_loss": -6.5622968673706055, "global_step": 123889, "epoch": 2949} {"train_loss": -6.476670742034912, "global_step": 123890, "epoch": 2949} {"train_loss": -6.550137042999268, "global_step": 123891, "epoch": 2949} {"train_loss": -6.539726257324219, "global_step": 123892, "epoch": 2949} {"train_loss": -6.59776496887207, "global_step": 123893, "epoch": 2949} {"train_loss": -6.643772125244141, "global_step": 123894, "epoch": 2949} {"train_loss": -6.548465728759766, "global_step": 123895, "epoch": 2949} {"train_loss": -6.597522735595703, "global_step": 123896, "epoch": 2949} {"train_loss": -6.599252223968506, "global_step": 123897, "epoch": 2949} {"train_loss": -6.729362487792969, "global_step": 123898, "epoch": 2949} {"train_loss": -6.58221359479995, "global_step": 123899, "epoch": 2949, "val_loss": 67992.2890625} {"train_loss": -6.574283123016357, "global_step": 123900, "epoch": 2950} {"train_loss": -6.607137680053711, "global_step": 123901, "epoch": 2950} {"train_loss": -6.688971519470215, "global_step": 123902, "epoch": 2950} {"train_loss": -6.640193939208984, "global_step": 123903, "epoch": 2950} {"train_loss": -6.614999771118164, "global_step": 123904, "epoch": 2950} {"train_loss": -6.673871040344238, "global_step": 123905, "epoch": 2950} {"train_loss": -6.70826530456543, "global_step": 123906, "epoch": 2950} {"train_loss": -6.701043605804443, "global_step": 123907, "epoch": 2950} {"train_loss": -6.616204261779785, "global_step": 123908, "epoch": 2950} {"train_loss": -6.688145160675049, "global_step": 123909, "epoch": 2950} {"train_loss": -6.64970588684082, "global_step": 123910, "epoch": 2950} {"train_loss": -6.615231037139893, "global_step": 123911, "epoch": 2950} {"train_loss": -6.492608547210693, "global_step": 123912, "epoch": 2950} {"train_loss": -6.569798469543457, "global_step": 123913, "epoch": 2950} {"train_loss": -6.634591102600098, "global_step": 123914, "epoch": 2950} {"train_loss": -6.534765720367432, "global_step": 123915, "epoch": 2950} {"train_loss": -6.530121803283691, "global_step": 123916, "epoch": 2950} {"train_loss": -6.62790584564209, "global_step": 123917, "epoch": 2950} {"train_loss": -6.598180294036865, "global_step": 123918, "epoch": 2950} {"train_loss": -6.572083473205566, "global_step": 123919, "epoch": 2950} {"train_loss": -6.512717247009277, "global_step": 123920, "epoch": 2950} {"train_loss": -6.447461128234863, "global_step": 123921, "epoch": 2950} {"train_loss": -6.568023681640625, "global_step": 123922, "epoch": 2950} {"train_loss": -6.510885238647461, "global_step": 123923, "epoch": 2950} {"train_loss": -6.600324630737305, "global_step": 123924, "epoch": 2950} {"train_loss": -6.683528423309326, "global_step": 123925, "epoch": 2950} {"train_loss": -6.501640796661377, "global_step": 123926, "epoch": 2950} {"train_loss": -6.604772567749023, "global_step": 123927, "epoch": 2950} {"train_loss": -6.536540985107422, "global_step": 123928, "epoch": 2950} {"train_loss": -6.487271308898926, "global_step": 123929, "epoch": 2950} {"train_loss": -6.4105119705200195, "global_step": 123930, "epoch": 2950} {"train_loss": -6.4618449211120605, "global_step": 123931, "epoch": 2950} {"train_loss": -6.556188583374023, "global_step": 123932, "epoch": 2950} {"train_loss": -6.600807189941406, "global_step": 123933, "epoch": 2950} {"train_loss": -6.570681095123291, "global_step": 123934, "epoch": 2950} {"train_loss": -6.546304702758789, "global_step": 123935, "epoch": 2950} {"train_loss": -6.529684066772461, "global_step": 123936, "epoch": 2950} {"train_loss": -6.61720085144043, "global_step": 123937, "epoch": 2950} {"train_loss": -6.525029182434082, "global_step": 123938, "epoch": 2950} {"train_loss": -6.444591045379639, "global_step": 123939, "epoch": 2950} {"train_loss": -6.487889289855957, "global_step": 123940, "epoch": 2950} {"train_loss": -6.57151046253386, "global_step": 123941, "epoch": 2950, "train/sim_max_reward_0": 0.199572159146473, "train/sim_max_reward_1": 0.8953967097878579, "train/sim_max_reward_2": 0.35323574596101137, "train/sim_max_reward_3": 0.1372635558745509, "train/sim_max_reward_4": 0.9840651225489221, "train/sim_max_reward_5": 0.9322152276654874, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.9241491819822267, "test/sim_max_reward_4400002": 0.37885133609121086, "test/sim_max_reward_4400003": 0.8267359574056347, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.7977921738384401, "test/sim_max_reward_4400006": 0.9916154452411491, "test/sim_max_reward_4400007": 0.9535714347525456, "test/sim_max_reward_4400008": 0.2990103009577125, "test/sim_max_reward_4400009": 0.9174585978549628, "test/sim_max_reward_4400010": 0.3265750947944026, "test/sim_max_reward_4400011": 0.25343261552134755, "test/sim_max_reward_4400012": 0.9657295906317854, "test/sim_max_reward_4400013": 0.404818800398275, "test/sim_max_reward_4400014": 0.7535559114411085, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0629841473402006, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2648723901975427, "test/sim_max_reward_4400019": 0.3185632199745616, "test/sim_max_reward_4400020": 2.0818467843931306e-05, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9761337068701204, "test/sim_max_reward_4400023": 0.9392835963875011, "test/sim_max_reward_4400024": 0.927416991518096, "test/sim_max_reward_4400025": 0.25981418453160066, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.04014455803554877, "test/sim_max_reward_4400028": 0.41488158416131765, "test/sim_max_reward_4400029": 0.46306452815858484, "test/sim_max_reward_4400030": 0.8909398861147337, "test/sim_max_reward_4400031": 0.9184008326672688, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.28340595081121417, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9392620090024218, "test/sim_max_reward_4400036": 0.3957923543997684, "test/sim_max_reward_4400037": 0.9442550183028233, "test/sim_max_reward_4400038": 0.9938067409366943, "test/sim_max_reward_4400039": 0.9354264487182592, "test/sim_max_reward_4400040": 0.472256937912015, "test/sim_max_reward_4400041": 0.8929050873950437, "test/sim_max_reward_4400042": 0.8006844756265541, "test/sim_max_reward_4400043": 0.9029417081693869, "test/sim_max_reward_4400044": 0.824148496136717, "test/sim_max_reward_4400045": 0.9758551045617656, "test/sim_max_reward_4400046": 0.8928047648811942, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.7575309521418275, "test/sim_max_reward_4400049": 0.9412373736975549, "train/mean_score": 0.5836247534973839, "test/mean_score": 0.6139072027680572, "val_loss": 68142.4453125} {"train_loss": -6.578446388244629, "global_step": 123942, "epoch": 2951} {"train_loss": -6.626065254211426, "global_step": 123943, "epoch": 2951} {"train_loss": -6.455289840698242, "global_step": 123944, "epoch": 2951} {"train_loss": -6.674885272979736, "global_step": 123945, "epoch": 2951} {"train_loss": -6.425184726715088, "global_step": 123946, "epoch": 2951} {"train_loss": -6.504309177398682, "global_step": 123947, "epoch": 2951} {"train_loss": -6.5344367027282715, "global_step": 123948, "epoch": 2951} {"train_loss": -6.529336929321289, "global_step": 123949, "epoch": 2951} {"train_loss": -6.583106994628906, "global_step": 123950, "epoch": 2951} {"train_loss": -6.579093933105469, "global_step": 123951, "epoch": 2951} {"train_loss": -6.592528820037842, "global_step": 123952, "epoch": 2951} {"train_loss": -6.491557598114014, "global_step": 123953, "epoch": 2951} {"train_loss": -6.6030049324035645, "global_step": 123954, "epoch": 2951} {"train_loss": -6.519916534423828, "global_step": 123955, "epoch": 2951} {"train_loss": -6.618730545043945, "global_step": 123956, "epoch": 2951} {"train_loss": -6.590673446655273, "global_step": 123957, "epoch": 2951} {"train_loss": -6.497235298156738, "global_step": 123958, "epoch": 2951} {"train_loss": -6.57614278793335, "global_step": 123959, "epoch": 2951} {"train_loss": -6.607158660888672, "global_step": 123960, "epoch": 2951} {"train_loss": -6.513492584228516, "global_step": 123961, "epoch": 2951} {"train_loss": -6.670815467834473, "global_step": 123962, "epoch": 2951} {"train_loss": -6.561223983764648, "global_step": 123963, "epoch": 2951} {"train_loss": -6.548218250274658, "global_step": 123964, "epoch": 2951} {"train_loss": -6.642801284790039, "global_step": 123965, "epoch": 2951} {"train_loss": -6.525754928588867, "global_step": 123966, "epoch": 2951} {"train_loss": -6.634840488433838, "global_step": 123967, "epoch": 2951} {"train_loss": -6.589970588684082, "global_step": 123968, "epoch": 2951} {"train_loss": -6.696300506591797, "global_step": 123969, "epoch": 2951} {"train_loss": -6.505022048950195, "global_step": 123970, "epoch": 2951} {"train_loss": -6.617792129516602, "global_step": 123971, "epoch": 2951} {"train_loss": -6.57547664642334, "global_step": 123972, "epoch": 2951} {"train_loss": -6.612586498260498, "global_step": 123973, "epoch": 2951} {"train_loss": -6.633971214294434, "global_step": 123974, "epoch": 2951} {"train_loss": -6.601103782653809, "global_step": 123975, "epoch": 2951} {"train_loss": -6.638164520263672, "global_step": 123976, "epoch": 2951} {"train_loss": -6.482419013977051, "global_step": 123977, "epoch": 2951} {"train_loss": -6.572242736816406, "global_step": 123978, "epoch": 2951} {"train_loss": -6.576712131500244, "global_step": 123979, "epoch": 2951} {"train_loss": -6.407845497131348, "global_step": 123980, "epoch": 2951} {"train_loss": -6.677602291107178, "global_step": 123981, "epoch": 2951} {"train_loss": -6.5595903396606445, "global_step": 123982, "epoch": 2951} {"train_loss": -6.571400619688488, "global_step": 123983, "epoch": 2951, "val_loss": 68071.2109375} {"train_loss": -6.658466339111328, "global_step": 123984, "epoch": 2952} {"train_loss": -6.618239402770996, "global_step": 123985, "epoch": 2952} {"train_loss": -6.538975715637207, "global_step": 123986, "epoch": 2952} {"train_loss": -6.591850280761719, "global_step": 123987, "epoch": 2952} {"train_loss": -6.5344953536987305, "global_step": 123988, "epoch": 2952} {"train_loss": -6.666401386260986, "global_step": 123989, "epoch": 2952} {"train_loss": -6.578238010406494, "global_step": 123990, "epoch": 2952} {"train_loss": -6.639147758483887, "global_step": 123991, "epoch": 2952} {"train_loss": -6.688197135925293, "global_step": 123992, "epoch": 2952} {"train_loss": -6.495387077331543, "global_step": 123993, "epoch": 2952} {"train_loss": -6.506152153015137, "global_step": 123994, "epoch": 2952} {"train_loss": -6.535948753356934, "global_step": 123995, "epoch": 2952} {"train_loss": -6.626727104187012, "global_step": 123996, "epoch": 2952} {"train_loss": -6.496356964111328, "global_step": 123997, "epoch": 2952} {"train_loss": -6.582673072814941, "global_step": 123998, "epoch": 2952} {"train_loss": -6.551784992218018, "global_step": 123999, "epoch": 2952} {"train_loss": -6.617317199707031, "global_step": 124000, "epoch": 2952} {"train_loss": -6.607831954956055, "global_step": 124001, "epoch": 2952} {"train_loss": -6.571894645690918, "global_step": 124002, "epoch": 2952} {"train_loss": -6.525223731994629, "global_step": 124003, "epoch": 2952} {"train_loss": -6.529862403869629, "global_step": 124004, "epoch": 2952} {"train_loss": -6.526391506195068, "global_step": 124005, "epoch": 2952} {"train_loss": -6.570511817932129, "global_step": 124006, "epoch": 2952} {"train_loss": -6.689387321472168, "global_step": 124007, "epoch": 2952} {"train_loss": -6.515203475952148, "global_step": 124008, "epoch": 2952} {"train_loss": -6.658210754394531, "global_step": 124009, "epoch": 2952} {"train_loss": -6.517432689666748, "global_step": 124010, "epoch": 2952} {"train_loss": -6.494282245635986, "global_step": 124011, "epoch": 2952} {"train_loss": -6.494009971618652, "global_step": 124012, "epoch": 2952} {"train_loss": -6.5304460525512695, "global_step": 124013, "epoch": 2952} {"train_loss": -6.51754093170166, "global_step": 124014, "epoch": 2952} {"train_loss": -6.587497234344482, "global_step": 124015, "epoch": 2952} {"train_loss": -6.600982666015625, "global_step": 124016, "epoch": 2952} {"train_loss": -6.4543046951293945, "global_step": 124017, "epoch": 2952} {"train_loss": -6.587329387664795, "global_step": 124018, "epoch": 2952} {"train_loss": -6.625833511352539, "global_step": 124019, "epoch": 2952} {"train_loss": -6.677596092224121, "global_step": 124020, "epoch": 2952} {"train_loss": -6.623381614685059, "global_step": 124021, "epoch": 2952} {"train_loss": -6.565528869628906, "global_step": 124022, "epoch": 2952} {"train_loss": -6.560014724731445, "global_step": 124023, "epoch": 2952} {"train_loss": -6.695827484130859, "global_step": 124024, "epoch": 2952} {"train_loss": -6.578908068793161, "global_step": 124025, "epoch": 2952, "val_loss": 68043.9375} {"train_loss": -6.523766040802002, "global_step": 124026, "epoch": 2953} {"train_loss": -6.682991981506348, "global_step": 124027, "epoch": 2953} {"train_loss": -6.613207817077637, "global_step": 124028, "epoch": 2953} {"train_loss": -6.658929347991943, "global_step": 124029, "epoch": 2953} {"train_loss": -6.576372146606445, "global_step": 124030, "epoch": 2953} {"train_loss": -6.719123840332031, "global_step": 124031, "epoch": 2953} {"train_loss": -6.6437788009643555, "global_step": 124032, "epoch": 2953} {"train_loss": -6.609310150146484, "global_step": 124033, "epoch": 2953} {"train_loss": -6.555572032928467, "global_step": 124034, "epoch": 2953} {"train_loss": -6.4736409187316895, "global_step": 124035, "epoch": 2953} {"train_loss": -6.580954074859619, "global_step": 124036, "epoch": 2953} {"train_loss": -6.594521522521973, "global_step": 124037, "epoch": 2953} {"train_loss": -6.635967254638672, "global_step": 124038, "epoch": 2953} {"train_loss": -6.488363742828369, "global_step": 124039, "epoch": 2953} {"train_loss": -6.656273365020752, "global_step": 124040, "epoch": 2953} {"train_loss": -6.640585899353027, "global_step": 124041, "epoch": 2953} {"train_loss": -6.589853286743164, "global_step": 124042, "epoch": 2953} {"train_loss": -6.4897942543029785, "global_step": 124043, "epoch": 2953} {"train_loss": -6.671976089477539, "global_step": 124044, "epoch": 2953} {"train_loss": -6.600652694702148, "global_step": 124045, "epoch": 2953} {"train_loss": -6.553505897521973, "global_step": 124046, "epoch": 2953} {"train_loss": -6.598767280578613, "global_step": 124047, "epoch": 2953} {"train_loss": -6.604470252990723, "global_step": 124048, "epoch": 2953} {"train_loss": -6.704235076904297, "global_step": 124049, "epoch": 2953} {"train_loss": -6.566232204437256, "global_step": 124050, "epoch": 2953} {"train_loss": -6.509633541107178, "global_step": 124051, "epoch": 2953} {"train_loss": -6.546422481536865, "global_step": 124052, "epoch": 2953} {"train_loss": -6.60117244720459, "global_step": 124053, "epoch": 2953} {"train_loss": -6.55837345123291, "global_step": 124054, "epoch": 2953} {"train_loss": -6.4600749015808105, "global_step": 124055, "epoch": 2953} {"train_loss": -6.636906623840332, "global_step": 124056, "epoch": 2953} {"train_loss": -6.663029670715332, "global_step": 124057, "epoch": 2953} {"train_loss": -6.601001739501953, "global_step": 124058, "epoch": 2953} {"train_loss": -6.619692325592041, "global_step": 124059, "epoch": 2953} {"train_loss": -6.619206428527832, "global_step": 124060, "epoch": 2953} {"train_loss": -6.583285331726074, "global_step": 124061, "epoch": 2953} {"train_loss": -6.507542133331299, "global_step": 124062, "epoch": 2953} {"train_loss": -6.643944263458252, "global_step": 124063, "epoch": 2953} {"train_loss": -6.55575704574585, "global_step": 124064, "epoch": 2953} {"train_loss": -6.611962795257568, "global_step": 124065, "epoch": 2953} {"train_loss": -6.605566024780273, "global_step": 124066, "epoch": 2953} {"train_loss": -6.59256420816694, "global_step": 124067, "epoch": 2953, "val_loss": 68214.53125} {"train_loss": -6.679864883422852, "global_step": 124068, "epoch": 2954} {"train_loss": -6.582680702209473, "global_step": 124069, "epoch": 2954} {"train_loss": -6.660708427429199, "global_step": 124070, "epoch": 2954} {"train_loss": -6.566189765930176, "global_step": 124071, "epoch": 2954} {"train_loss": -6.623924732208252, "global_step": 124072, "epoch": 2954} {"train_loss": -6.560093402862549, "global_step": 124073, "epoch": 2954} {"train_loss": -6.655536651611328, "global_step": 124074, "epoch": 2954} {"train_loss": -6.513845920562744, "global_step": 124075, "epoch": 2954} {"train_loss": -6.575068950653076, "global_step": 124076, "epoch": 2954} {"train_loss": -6.602087020874023, "global_step": 124077, "epoch": 2954} {"train_loss": -6.687675476074219, "global_step": 124078, "epoch": 2954} {"train_loss": -6.547787189483643, "global_step": 124079, "epoch": 2954} {"train_loss": -6.546972751617432, "global_step": 124080, "epoch": 2954} {"train_loss": -6.59970235824585, "global_step": 124081, "epoch": 2954} {"train_loss": -6.6259541511535645, "global_step": 124082, "epoch": 2954} {"train_loss": -6.584102153778076, "global_step": 124083, "epoch": 2954} {"train_loss": -6.59749698638916, "global_step": 124084, "epoch": 2954} {"train_loss": -6.5558624267578125, "global_step": 124085, "epoch": 2954} {"train_loss": -6.623686790466309, "global_step": 124086, "epoch": 2954} {"train_loss": -6.620505332946777, "global_step": 124087, "epoch": 2954} {"train_loss": -6.446165084838867, "global_step": 124088, "epoch": 2954} {"train_loss": -6.585880279541016, "global_step": 124089, "epoch": 2954} {"train_loss": -6.48551082611084, "global_step": 124090, "epoch": 2954} {"train_loss": -6.488681793212891, "global_step": 124091, "epoch": 2954} {"train_loss": -6.507688045501709, "global_step": 124092, "epoch": 2954} {"train_loss": -6.605710983276367, "global_step": 124093, "epoch": 2954} {"train_loss": -6.547819137573242, "global_step": 124094, "epoch": 2954} {"train_loss": -6.610435485839844, "global_step": 124095, "epoch": 2954} {"train_loss": -6.596461296081543, "global_step": 124096, "epoch": 2954} {"train_loss": -6.528919219970703, "global_step": 124097, "epoch": 2954} {"train_loss": -6.575104713439941, "global_step": 124098, "epoch": 2954} {"train_loss": -6.505377769470215, "global_step": 124099, "epoch": 2954} {"train_loss": -6.517333030700684, "global_step": 124100, "epoch": 2954} {"train_loss": -6.445847034454346, "global_step": 124101, "epoch": 2954} {"train_loss": -6.512801647186279, "global_step": 124102, "epoch": 2954} {"train_loss": -6.500048637390137, "global_step": 124103, "epoch": 2954} {"train_loss": -6.563292980194092, "global_step": 124104, "epoch": 2954} {"train_loss": -6.645155429840088, "global_step": 124105, "epoch": 2954} {"train_loss": -6.565855979919434, "global_step": 124106, "epoch": 2954} {"train_loss": -6.616145133972168, "global_step": 124107, "epoch": 2954} {"train_loss": -6.513955116271973, "global_step": 124108, "epoch": 2954} {"train_loss": -6.571718295415242, "global_step": 124109, "epoch": 2954, "val_loss": 68115.078125} {"train_loss": -6.63924503326416, "global_step": 124110, "epoch": 2955} {"train_loss": -6.634102821350098, "global_step": 124111, "epoch": 2955} {"train_loss": -6.573134422302246, "global_step": 124112, "epoch": 2955} {"train_loss": -6.671197414398193, "global_step": 124113, "epoch": 2955} {"train_loss": -6.528210639953613, "global_step": 124114, "epoch": 2955} {"train_loss": -6.6246514320373535, "global_step": 124115, "epoch": 2955} {"train_loss": -6.5335187911987305, "global_step": 124116, "epoch": 2955} {"train_loss": -6.598090171813965, "global_step": 124117, "epoch": 2955} {"train_loss": -6.595044136047363, "global_step": 124118, "epoch": 2955} {"train_loss": -6.6282525062561035, "global_step": 124119, "epoch": 2955} {"train_loss": -6.543374538421631, "global_step": 124120, "epoch": 2955} {"train_loss": -6.543642520904541, "global_step": 124121, "epoch": 2955} {"train_loss": -6.75166130065918, "global_step": 124122, "epoch": 2955} {"train_loss": -6.483679294586182, "global_step": 124123, "epoch": 2955} {"train_loss": -6.362842559814453, "global_step": 124124, "epoch": 2955} {"train_loss": -6.6140828132629395, "global_step": 124125, "epoch": 2955} {"train_loss": -6.545350551605225, "global_step": 124126, "epoch": 2955} {"train_loss": -6.611259460449219, "global_step": 124127, "epoch": 2955} {"train_loss": -6.582889080047607, "global_step": 124128, "epoch": 2955} {"train_loss": -6.409607410430908, "global_step": 124129, "epoch": 2955} {"train_loss": -6.585227012634277, "global_step": 124130, "epoch": 2955} {"train_loss": -6.502045631408691, "global_step": 124131, "epoch": 2955} {"train_loss": -6.501073837280273, "global_step": 124132, "epoch": 2955} {"train_loss": -6.404392242431641, "global_step": 124133, "epoch": 2955} {"train_loss": -6.581377983093262, "global_step": 124134, "epoch": 2955} {"train_loss": -6.320898532867432, "global_step": 124135, "epoch": 2955} {"train_loss": -6.551237106323242, "global_step": 124136, "epoch": 2955} {"train_loss": -6.477848529815674, "global_step": 124137, "epoch": 2955} {"train_loss": -6.446230411529541, "global_step": 124138, "epoch": 2955} {"train_loss": -6.56182861328125, "global_step": 124139, "epoch": 2955} {"train_loss": -6.482575416564941, "global_step": 124140, "epoch": 2955} {"train_loss": -6.598575115203857, "global_step": 124141, "epoch": 2955} {"train_loss": -6.542366981506348, "global_step": 124142, "epoch": 2955} {"train_loss": -6.559985160827637, "global_step": 124143, "epoch": 2955} {"train_loss": -6.530965805053711, "global_step": 124144, "epoch": 2955} {"train_loss": -6.486616134643555, "global_step": 124145, "epoch": 2955} {"train_loss": -6.626403331756592, "global_step": 124146, "epoch": 2955} {"train_loss": -6.449675559997559, "global_step": 124147, "epoch": 2955} {"train_loss": -6.538325309753418, "global_step": 124148, "epoch": 2955} {"train_loss": -6.397433280944824, "global_step": 124149, "epoch": 2955} {"train_loss": -6.488150596618652, "global_step": 124150, "epoch": 2955} {"train_loss": -6.539215121950422, "global_step": 124151, "epoch": 2955, "val_loss": 68197.2578125} {"train_loss": -6.375444412231445, "global_step": 124152, "epoch": 2956} {"train_loss": -6.484491348266602, "global_step": 124153, "epoch": 2956} {"train_loss": -6.498169898986816, "global_step": 124154, "epoch": 2956} {"train_loss": -6.5048112869262695, "global_step": 124155, "epoch": 2956} {"train_loss": -6.447606086730957, "global_step": 124156, "epoch": 2956} {"train_loss": -6.485177993774414, "global_step": 124157, "epoch": 2956} {"train_loss": -6.602259635925293, "global_step": 124158, "epoch": 2956} {"train_loss": -6.568635940551758, "global_step": 124159, "epoch": 2956} {"train_loss": -6.635684967041016, "global_step": 124160, "epoch": 2956} {"train_loss": -6.570410251617432, "global_step": 124161, "epoch": 2956} {"train_loss": -6.623662948608398, "global_step": 124162, "epoch": 2956} {"train_loss": -6.554841041564941, "global_step": 124163, "epoch": 2956} {"train_loss": -6.672884941101074, "global_step": 124164, "epoch": 2956} {"train_loss": -6.5560712814331055, "global_step": 124165, "epoch": 2956} {"train_loss": -6.730899810791016, "global_step": 124166, "epoch": 2956} {"train_loss": -6.547786712646484, "global_step": 124167, "epoch": 2956} {"train_loss": -6.574099063873291, "global_step": 124168, "epoch": 2956} {"train_loss": -6.684933662414551, "global_step": 124169, "epoch": 2956} {"train_loss": -6.5801191329956055, "global_step": 124170, "epoch": 2956} {"train_loss": -6.5874176025390625, "global_step": 124171, "epoch": 2956} {"train_loss": -6.677824020385742, "global_step": 124172, "epoch": 2956} {"train_loss": -6.667037487030029, "global_step": 124173, "epoch": 2956} {"train_loss": -6.6856279373168945, "global_step": 124174, "epoch": 2956} {"train_loss": -6.664332866668701, "global_step": 124175, "epoch": 2956} {"train_loss": -6.595959663391113, "global_step": 124176, "epoch": 2956} {"train_loss": -6.485764980316162, "global_step": 124177, "epoch": 2956} {"train_loss": -6.60868501663208, "global_step": 124178, "epoch": 2956} {"train_loss": -6.57814884185791, "global_step": 124179, "epoch": 2956} {"train_loss": -6.533860206604004, "global_step": 124180, "epoch": 2956} {"train_loss": -6.65759801864624, "global_step": 124181, "epoch": 2956} {"train_loss": -6.586796283721924, "global_step": 124182, "epoch": 2956} {"train_loss": -6.589990615844727, "global_step": 124183, "epoch": 2956} {"train_loss": -6.467954635620117, "global_step": 124184, "epoch": 2956} {"train_loss": -6.603531360626221, "global_step": 124185, "epoch": 2956} {"train_loss": -6.661871910095215, "global_step": 124186, "epoch": 2956} {"train_loss": -6.551059722900391, "global_step": 124187, "epoch": 2956} {"train_loss": -6.634108543395996, "global_step": 124188, "epoch": 2956} {"train_loss": -6.555544853210449, "global_step": 124189, "epoch": 2956} {"train_loss": -6.659481048583984, "global_step": 124190, "epoch": 2956} {"train_loss": -6.636916160583496, "global_step": 124191, "epoch": 2956} {"train_loss": -6.560140609741211, "global_step": 124192, "epoch": 2956} {"train_loss": -6.581044730686006, "global_step": 124193, "epoch": 2956, "val_loss": 68146.9140625} {"train_loss": -6.48756217956543, "global_step": 124194, "epoch": 2957} {"train_loss": -6.569751739501953, "global_step": 124195, "epoch": 2957} {"train_loss": -6.611644744873047, "global_step": 124196, "epoch": 2957} {"train_loss": -6.577101707458496, "global_step": 124197, "epoch": 2957} {"train_loss": -6.6412577629089355, "global_step": 124198, "epoch": 2957} {"train_loss": -6.41172981262207, "global_step": 124199, "epoch": 2957} {"train_loss": -6.5874433517456055, "global_step": 124200, "epoch": 2957} {"train_loss": -6.602750778198242, "global_step": 124201, "epoch": 2957} {"train_loss": -6.658561706542969, "global_step": 124202, "epoch": 2957} {"train_loss": -6.510980606079102, "global_step": 124203, "epoch": 2957} {"train_loss": -6.599460601806641, "global_step": 124204, "epoch": 2957} {"train_loss": -6.5126261711120605, "global_step": 124205, "epoch": 2957} {"train_loss": -6.662830352783203, "global_step": 124206, "epoch": 2957} {"train_loss": -6.609821796417236, "global_step": 124207, "epoch": 2957} {"train_loss": -6.60595703125, "global_step": 124208, "epoch": 2957} {"train_loss": -6.605910301208496, "global_step": 124209, "epoch": 2957} {"train_loss": -6.617214202880859, "global_step": 124210, "epoch": 2957} {"train_loss": -6.561619281768799, "global_step": 124211, "epoch": 2957} {"train_loss": -6.567723274230957, "global_step": 124212, "epoch": 2957} {"train_loss": -6.6294379234313965, "global_step": 124213, "epoch": 2957} {"train_loss": -6.585099220275879, "global_step": 124214, "epoch": 2957} {"train_loss": -6.585474967956543, "global_step": 124215, "epoch": 2957} {"train_loss": -6.598882675170898, "global_step": 124216, "epoch": 2957} {"train_loss": -6.552412509918213, "global_step": 124217, "epoch": 2957} {"train_loss": -6.570799827575684, "global_step": 124218, "epoch": 2957} {"train_loss": -6.462238788604736, "global_step": 124219, "epoch": 2957} {"train_loss": -6.641412734985352, "global_step": 124220, "epoch": 2957} {"train_loss": -6.565350532531738, "global_step": 124221, "epoch": 2957} {"train_loss": -6.4985432624816895, "global_step": 124222, "epoch": 2957} {"train_loss": -6.5432353019714355, "global_step": 124223, "epoch": 2957} {"train_loss": -6.547954559326172, "global_step": 124224, "epoch": 2957} {"train_loss": -6.624446868896484, "global_step": 124225, "epoch": 2957} {"train_loss": -6.546353816986084, "global_step": 124226, "epoch": 2957} {"train_loss": -6.650474548339844, "global_step": 124227, "epoch": 2957} {"train_loss": -6.410463333129883, "global_step": 124228, "epoch": 2957} {"train_loss": -6.619657516479492, "global_step": 124229, "epoch": 2957} {"train_loss": -6.602787971496582, "global_step": 124230, "epoch": 2957} {"train_loss": -6.666399955749512, "global_step": 124231, "epoch": 2957} {"train_loss": -6.59749698638916, "global_step": 124232, "epoch": 2957} {"train_loss": -6.526098251342773, "global_step": 124233, "epoch": 2957} {"train_loss": -6.57980489730835, "global_step": 124234, "epoch": 2957} {"train_loss": -6.575077374776204, "global_step": 124235, "epoch": 2957, "val_loss": 68438.7109375} {"train_loss": -6.461700439453125, "global_step": 124236, "epoch": 2958} {"train_loss": -6.673011779785156, "global_step": 124237, "epoch": 2958} {"train_loss": -6.623879909515381, "global_step": 124238, "epoch": 2958} {"train_loss": -6.579771518707275, "global_step": 124239, "epoch": 2958} {"train_loss": -6.640626907348633, "global_step": 124240, "epoch": 2958} {"train_loss": -6.57777738571167, "global_step": 124241, "epoch": 2958} {"train_loss": -6.495783805847168, "global_step": 124242, "epoch": 2958} {"train_loss": -6.599093437194824, "global_step": 124243, "epoch": 2958} {"train_loss": -6.491705894470215, "global_step": 124244, "epoch": 2958} {"train_loss": -6.632221698760986, "global_step": 124245, "epoch": 2958} {"train_loss": -6.521215438842773, "global_step": 124246, "epoch": 2958} {"train_loss": -6.563083648681641, "global_step": 124247, "epoch": 2958} {"train_loss": -6.623727798461914, "global_step": 124248, "epoch": 2958} {"train_loss": -6.495306015014648, "global_step": 124249, "epoch": 2958} {"train_loss": -6.596156597137451, "global_step": 124250, "epoch": 2958} {"train_loss": -6.534297466278076, "global_step": 124251, "epoch": 2958} {"train_loss": -6.585021018981934, "global_step": 124252, "epoch": 2958} {"train_loss": -6.581019878387451, "global_step": 124253, "epoch": 2958} {"train_loss": -6.549978256225586, "global_step": 124254, "epoch": 2958} {"train_loss": -6.600958347320557, "global_step": 124255, "epoch": 2958} {"train_loss": -6.46201229095459, "global_step": 124256, "epoch": 2958} {"train_loss": -6.5022382736206055, "global_step": 124257, "epoch": 2958} {"train_loss": -6.553046226501465, "global_step": 124258, "epoch": 2958} {"train_loss": -6.590504169464111, "global_step": 124259, "epoch": 2958} {"train_loss": -6.596073150634766, "global_step": 124260, "epoch": 2958} {"train_loss": -6.5319719314575195, "global_step": 124261, "epoch": 2958} {"train_loss": -6.6000752449035645, "global_step": 124262, "epoch": 2958} {"train_loss": -6.528306007385254, "global_step": 124263, "epoch": 2958} {"train_loss": -6.516786575317383, "global_step": 124264, "epoch": 2958} {"train_loss": -6.532860279083252, "global_step": 124265, "epoch": 2958} {"train_loss": -6.445552825927734, "global_step": 124266, "epoch": 2958} {"train_loss": -6.575328826904297, "global_step": 124267, "epoch": 2958} {"train_loss": -6.579975128173828, "global_step": 124268, "epoch": 2958} {"train_loss": -6.536648750305176, "global_step": 124269, "epoch": 2958} {"train_loss": -6.5226850509643555, "global_step": 124270, "epoch": 2958} {"train_loss": -6.455976486206055, "global_step": 124271, "epoch": 2958} {"train_loss": -6.460199356079102, "global_step": 124272, "epoch": 2958} {"train_loss": -6.589609146118164, "global_step": 124273, "epoch": 2958} {"train_loss": -6.6406989097595215, "global_step": 124274, "epoch": 2958} {"train_loss": -6.5634050369262695, "global_step": 124275, "epoch": 2958} {"train_loss": -6.564371109008789, "global_step": 124276, "epoch": 2958} {"train_loss": -6.558575550715129, "global_step": 124277, "epoch": 2958, "val_loss": 68214.375} {"train_loss": -6.481781005859375, "global_step": 124278, "epoch": 2959} {"train_loss": -6.664161682128906, "global_step": 124279, "epoch": 2959} {"train_loss": -6.503966331481934, "global_step": 124280, "epoch": 2959} {"train_loss": -6.573278903961182, "global_step": 124281, "epoch": 2959} {"train_loss": -6.557639122009277, "global_step": 124282, "epoch": 2959} {"train_loss": -6.532294273376465, "global_step": 124283, "epoch": 2959} {"train_loss": -6.540937423706055, "global_step": 124284, "epoch": 2959} {"train_loss": -6.569559097290039, "global_step": 124285, "epoch": 2959} {"train_loss": -6.463542938232422, "global_step": 124286, "epoch": 2959} {"train_loss": -6.432555198669434, "global_step": 124287, "epoch": 2959} {"train_loss": -6.394609451293945, "global_step": 124288, "epoch": 2959} {"train_loss": -6.522110939025879, "global_step": 124289, "epoch": 2959} {"train_loss": -6.526784896850586, "global_step": 124290, "epoch": 2959} {"train_loss": -6.46525764465332, "global_step": 124291, "epoch": 2959} {"train_loss": -6.486315727233887, "global_step": 124292, "epoch": 2959} {"train_loss": -6.480934143066406, "global_step": 124293, "epoch": 2959} {"train_loss": -6.3072099685668945, "global_step": 124294, "epoch": 2959} {"train_loss": -6.596977233886719, "global_step": 124295, "epoch": 2959} {"train_loss": -6.398731708526611, "global_step": 124296, "epoch": 2959} {"train_loss": -6.613836765289307, "global_step": 124297, "epoch": 2959} {"train_loss": -6.531939506530762, "global_step": 124298, "epoch": 2959} {"train_loss": -6.550112724304199, "global_step": 124299, "epoch": 2959} {"train_loss": -6.65255069732666, "global_step": 124300, "epoch": 2959} {"train_loss": -6.600393295288086, "global_step": 124301, "epoch": 2959} {"train_loss": -6.599767208099365, "global_step": 124302, "epoch": 2959} {"train_loss": -6.604457378387451, "global_step": 124303, "epoch": 2959} {"train_loss": -6.65449333190918, "global_step": 124304, "epoch": 2959} {"train_loss": -6.622097492218018, "global_step": 124305, "epoch": 2959} {"train_loss": -6.503657817840576, "global_step": 124306, "epoch": 2959} {"train_loss": -6.532805442810059, "global_step": 124307, "epoch": 2959} {"train_loss": -6.547319412231445, "global_step": 124308, "epoch": 2959} {"train_loss": -6.590412616729736, "global_step": 124309, "epoch": 2959} {"train_loss": -6.537579536437988, "global_step": 124310, "epoch": 2959} {"train_loss": -6.576390266418457, "global_step": 124311, "epoch": 2959} {"train_loss": -6.589939117431641, "global_step": 124312, "epoch": 2959} {"train_loss": -6.661109924316406, "global_step": 124313, "epoch": 2959} {"train_loss": -6.602688789367676, "global_step": 124314, "epoch": 2959} {"train_loss": -6.586853981018066, "global_step": 124315, "epoch": 2959} {"train_loss": -6.553648948669434, "global_step": 124316, "epoch": 2959} {"train_loss": -6.5680012702941895, "global_step": 124317, "epoch": 2959} {"train_loss": -6.608036994934082, "global_step": 124318, "epoch": 2959} {"train_loss": -6.547657285417829, "global_step": 124319, "epoch": 2959, "val_loss": 68093.53125} {"train_loss": -6.585392951965332, "global_step": 124320, "epoch": 2960} {"train_loss": -6.5507941246032715, "global_step": 124321, "epoch": 2960} {"train_loss": -6.537805557250977, "global_step": 124322, "epoch": 2960} {"train_loss": -6.609988212585449, "global_step": 124323, "epoch": 2960} {"train_loss": -6.373892784118652, "global_step": 124324, "epoch": 2960} {"train_loss": -6.567399024963379, "global_step": 124325, "epoch": 2960} {"train_loss": -6.554653167724609, "global_step": 124326, "epoch": 2960} {"train_loss": -6.44230318069458, "global_step": 124327, "epoch": 2960} {"train_loss": -6.571380138397217, "global_step": 124328, "epoch": 2960} {"train_loss": -6.693410396575928, "global_step": 124329, "epoch": 2960} {"train_loss": -6.665596008300781, "global_step": 124330, "epoch": 2960} {"train_loss": -6.590627193450928, "global_step": 124331, "epoch": 2960} {"train_loss": -6.532814025878906, "global_step": 124332, "epoch": 2960} {"train_loss": -6.533041954040527, "global_step": 124333, "epoch": 2960} {"train_loss": -6.613101959228516, "global_step": 124334, "epoch": 2960} {"train_loss": -6.578183650970459, "global_step": 124335, "epoch": 2960} {"train_loss": -6.547507286071777, "global_step": 124336, "epoch": 2960} {"train_loss": -6.58324670791626, "global_step": 124337, "epoch": 2960} {"train_loss": -6.628790378570557, "global_step": 124338, "epoch": 2960} {"train_loss": -6.587242603302002, "global_step": 124339, "epoch": 2960} {"train_loss": -6.534344673156738, "global_step": 124340, "epoch": 2960} {"train_loss": -6.495440483093262, "global_step": 124341, "epoch": 2960} {"train_loss": -6.614404678344727, "global_step": 124342, "epoch": 2960} {"train_loss": -6.486559867858887, "global_step": 124343, "epoch": 2960} {"train_loss": -6.612093925476074, "global_step": 124344, "epoch": 2960} {"train_loss": -6.627628803253174, "global_step": 124345, "epoch": 2960} {"train_loss": -6.515254974365234, "global_step": 124346, "epoch": 2960} {"train_loss": -6.61634635925293, "global_step": 124347, "epoch": 2960} {"train_loss": -6.677590847015381, "global_step": 124348, "epoch": 2960} {"train_loss": -6.4812822341918945, "global_step": 124349, "epoch": 2960} {"train_loss": -6.6914753913879395, "global_step": 124350, "epoch": 2960} {"train_loss": -6.5043182373046875, "global_step": 124351, "epoch": 2960} {"train_loss": -6.657594680786133, "global_step": 124352, "epoch": 2960} {"train_loss": -6.655784606933594, "global_step": 124353, "epoch": 2960} {"train_loss": -6.520046234130859, "global_step": 124354, "epoch": 2960} {"train_loss": -6.679655075073242, "global_step": 124355, "epoch": 2960} {"train_loss": -6.543642997741699, "global_step": 124356, "epoch": 2960} {"train_loss": -6.687871932983398, "global_step": 124357, "epoch": 2960} {"train_loss": -6.625484466552734, "global_step": 124358, "epoch": 2960} {"train_loss": -6.58001708984375, "global_step": 124359, "epoch": 2960} {"train_loss": -6.733506202697754, "global_step": 124360, "epoch": 2960} {"train_loss": -6.582224482581729, "global_step": 124361, "epoch": 2960, "val_loss": 67952.03125} {"train_loss": -6.656832218170166, "global_step": 124362, "epoch": 2961} {"train_loss": -6.628107070922852, "global_step": 124363, "epoch": 2961} {"train_loss": -6.495440483093262, "global_step": 124364, "epoch": 2961} {"train_loss": -6.712747573852539, "global_step": 124365, "epoch": 2961} {"train_loss": -6.638289928436279, "global_step": 124366, "epoch": 2961} {"train_loss": -6.536436080932617, "global_step": 124367, "epoch": 2961} {"train_loss": -6.516549110412598, "global_step": 124368, "epoch": 2961} {"train_loss": -6.5039143562316895, "global_step": 124369, "epoch": 2961} {"train_loss": -6.5406413078308105, "global_step": 124370, "epoch": 2961} {"train_loss": -6.603375434875488, "global_step": 124371, "epoch": 2961} {"train_loss": -6.676412582397461, "global_step": 124372, "epoch": 2961} {"train_loss": -6.524998664855957, "global_step": 124373, "epoch": 2961} {"train_loss": -6.505982398986816, "global_step": 124374, "epoch": 2961} {"train_loss": -6.5915117263793945, "global_step": 124375, "epoch": 2961} {"train_loss": -6.515008926391602, "global_step": 124376, "epoch": 2961} {"train_loss": -6.384759902954102, "global_step": 124377, "epoch": 2961} {"train_loss": -6.456754207611084, "global_step": 124378, "epoch": 2961} {"train_loss": -6.491506099700928, "global_step": 124379, "epoch": 2961} {"train_loss": -6.597809791564941, "global_step": 124380, "epoch": 2961} {"train_loss": -6.5151519775390625, "global_step": 124381, "epoch": 2961} {"train_loss": -6.601768493652344, "global_step": 124382, "epoch": 2961} {"train_loss": -6.494361877441406, "global_step": 124383, "epoch": 2961} {"train_loss": -6.532893180847168, "global_step": 124384, "epoch": 2961} {"train_loss": -6.480445861816406, "global_step": 124385, "epoch": 2961} {"train_loss": -6.644624710083008, "global_step": 124386, "epoch": 2961} {"train_loss": -6.482751369476318, "global_step": 124387, "epoch": 2961} {"train_loss": -6.6546101570129395, "global_step": 124388, "epoch": 2961} {"train_loss": -6.5904717445373535, "global_step": 124389, "epoch": 2961} {"train_loss": -6.544045448303223, "global_step": 124390, "epoch": 2961} {"train_loss": -6.492859840393066, "global_step": 124391, "epoch": 2961} {"train_loss": -6.457598686218262, "global_step": 124392, "epoch": 2961} {"train_loss": -6.516702651977539, "global_step": 124393, "epoch": 2961} {"train_loss": -6.506260395050049, "global_step": 124394, "epoch": 2961} {"train_loss": -6.6674957275390625, "global_step": 124395, "epoch": 2961} {"train_loss": -6.536661148071289, "global_step": 124396, "epoch": 2961} {"train_loss": -6.585101127624512, "global_step": 124397, "epoch": 2961} {"train_loss": -6.631441593170166, "global_step": 124398, "epoch": 2961} {"train_loss": -6.594917297363281, "global_step": 124399, "epoch": 2961} {"train_loss": -6.587637901306152, "global_step": 124400, "epoch": 2961} {"train_loss": -6.484857559204102, "global_step": 124401, "epoch": 2961} {"train_loss": -6.634218215942383, "global_step": 124402, "epoch": 2961} {"train_loss": -6.55595976965768, "global_step": 124403, "epoch": 2961, "val_loss": 67939.2109375} {"train_loss": -6.55916166305542, "global_step": 124404, "epoch": 2962} {"train_loss": -6.692986488342285, "global_step": 124405, "epoch": 2962} {"train_loss": -6.598777770996094, "global_step": 124406, "epoch": 2962} {"train_loss": -6.49346923828125, "global_step": 124407, "epoch": 2962} {"train_loss": -6.533455848693848, "global_step": 124408, "epoch": 2962} {"train_loss": -6.636322021484375, "global_step": 124409, "epoch": 2962} {"train_loss": -6.495541095733643, "global_step": 124410, "epoch": 2962} {"train_loss": -6.54420280456543, "global_step": 124411, "epoch": 2962} {"train_loss": -6.550936698913574, "global_step": 124412, "epoch": 2962} {"train_loss": -6.433749198913574, "global_step": 124413, "epoch": 2962} {"train_loss": -6.648571968078613, "global_step": 124414, "epoch": 2962} {"train_loss": -6.306727886199951, "global_step": 124415, "epoch": 2962} {"train_loss": -6.522831916809082, "global_step": 124416, "epoch": 2962} {"train_loss": -6.444117546081543, "global_step": 124417, "epoch": 2962} {"train_loss": -6.566390037536621, "global_step": 124418, "epoch": 2962} {"train_loss": -6.634883880615234, "global_step": 124419, "epoch": 2962} {"train_loss": -6.481484413146973, "global_step": 124420, "epoch": 2962} {"train_loss": -6.539181709289551, "global_step": 124421, "epoch": 2962} {"train_loss": -6.458065032958984, "global_step": 124422, "epoch": 2962} {"train_loss": -6.54640531539917, "global_step": 124423, "epoch": 2962} {"train_loss": -6.635924339294434, "global_step": 124424, "epoch": 2962} {"train_loss": -6.503680229187012, "global_step": 124425, "epoch": 2962} {"train_loss": -6.502947807312012, "global_step": 124426, "epoch": 2962} {"train_loss": -6.6020684242248535, "global_step": 124427, "epoch": 2962} {"train_loss": -6.516935348510742, "global_step": 124428, "epoch": 2962} {"train_loss": -6.502713203430176, "global_step": 124429, "epoch": 2962} {"train_loss": -6.481528282165527, "global_step": 124430, "epoch": 2962} {"train_loss": -6.471785545349121, "global_step": 124431, "epoch": 2962} {"train_loss": -6.709914207458496, "global_step": 124432, "epoch": 2962} {"train_loss": -6.560507774353027, "global_step": 124433, "epoch": 2962} {"train_loss": -6.441218376159668, "global_step": 124434, "epoch": 2962} {"train_loss": -6.64400577545166, "global_step": 124435, "epoch": 2962} {"train_loss": -6.59598445892334, "global_step": 124436, "epoch": 2962} {"train_loss": -6.444153308868408, "global_step": 124437, "epoch": 2962} {"train_loss": -6.460325717926025, "global_step": 124438, "epoch": 2962} {"train_loss": -6.439462184906006, "global_step": 124439, "epoch": 2962} {"train_loss": -6.478711128234863, "global_step": 124440, "epoch": 2962} {"train_loss": -6.496433734893799, "global_step": 124441, "epoch": 2962} {"train_loss": -6.513751029968262, "global_step": 124442, "epoch": 2962} {"train_loss": -6.528309345245361, "global_step": 124443, "epoch": 2962} {"train_loss": -6.554617881774902, "global_step": 124444, "epoch": 2962} {"train_loss": -6.532026052474976, "global_step": 124445, "epoch": 2962, "val_loss": 67919.9453125} {"train_loss": -6.643117427825928, "global_step": 124446, "epoch": 2963} {"train_loss": -6.505608558654785, "global_step": 124447, "epoch": 2963} {"train_loss": -6.543698787689209, "global_step": 124448, "epoch": 2963} {"train_loss": -6.618426322937012, "global_step": 124449, "epoch": 2963} {"train_loss": -6.614037036895752, "global_step": 124450, "epoch": 2963} {"train_loss": -6.5519819259643555, "global_step": 124451, "epoch": 2963} {"train_loss": -6.497950553894043, "global_step": 124452, "epoch": 2963} {"train_loss": -6.571868896484375, "global_step": 124453, "epoch": 2963} {"train_loss": -6.521134376525879, "global_step": 124454, "epoch": 2963} {"train_loss": -6.564236640930176, "global_step": 124455, "epoch": 2963} {"train_loss": -6.4376068115234375, "global_step": 124456, "epoch": 2963} {"train_loss": -6.5113372802734375, "global_step": 124457, "epoch": 2963} {"train_loss": -6.555943489074707, "global_step": 124458, "epoch": 2963} {"train_loss": -6.596238136291504, "global_step": 124459, "epoch": 2963} {"train_loss": -6.567552089691162, "global_step": 124460, "epoch": 2963} {"train_loss": -6.676522254943848, "global_step": 124461, "epoch": 2963} {"train_loss": -6.590016841888428, "global_step": 124462, "epoch": 2963} {"train_loss": -6.6275105476379395, "global_step": 124463, "epoch": 2963} {"train_loss": -6.602240562438965, "global_step": 124464, "epoch": 2963} {"train_loss": -6.537374496459961, "global_step": 124465, "epoch": 2963} {"train_loss": -6.594655990600586, "global_step": 124466, "epoch": 2963} {"train_loss": -6.483083724975586, "global_step": 124467, "epoch": 2963} {"train_loss": -6.577929496765137, "global_step": 124468, "epoch": 2963} {"train_loss": -6.639749050140381, "global_step": 124469, "epoch": 2963} {"train_loss": -6.457009315490723, "global_step": 124470, "epoch": 2963} {"train_loss": -6.624451637268066, "global_step": 124471, "epoch": 2963} {"train_loss": -6.517928123474121, "global_step": 124472, "epoch": 2963} {"train_loss": -6.605546474456787, "global_step": 124473, "epoch": 2963} {"train_loss": -6.670840740203857, "global_step": 124474, "epoch": 2963} {"train_loss": -6.574961185455322, "global_step": 124475, "epoch": 2963} {"train_loss": -6.523809432983398, "global_step": 124476, "epoch": 2963} {"train_loss": -6.540287017822266, "global_step": 124477, "epoch": 2963} {"train_loss": -6.608391761779785, "global_step": 124478, "epoch": 2963} {"train_loss": -6.511758804321289, "global_step": 124479, "epoch": 2963} {"train_loss": -6.530492305755615, "global_step": 124480, "epoch": 2963} {"train_loss": -6.512577056884766, "global_step": 124481, "epoch": 2963} {"train_loss": -6.464163780212402, "global_step": 124482, "epoch": 2963} {"train_loss": -6.603453636169434, "global_step": 124483, "epoch": 2963} {"train_loss": -6.587309837341309, "global_step": 124484, "epoch": 2963} {"train_loss": -6.540124893188477, "global_step": 124485, "epoch": 2963} {"train_loss": -6.6238484382629395, "global_step": 124486, "epoch": 2963} {"train_loss": -6.564420359475272, "global_step": 124487, "epoch": 2963, "val_loss": 68035.671875} {"train_loss": -6.550759315490723, "global_step": 124488, "epoch": 2964} {"train_loss": -6.496119499206543, "global_step": 124489, "epoch": 2964} {"train_loss": -6.559134006500244, "global_step": 124490, "epoch": 2964} {"train_loss": -6.5189595222473145, "global_step": 124491, "epoch": 2964} {"train_loss": -6.4639434814453125, "global_step": 124492, "epoch": 2964} {"train_loss": -6.650308609008789, "global_step": 124493, "epoch": 2964} {"train_loss": -6.619295597076416, "global_step": 124494, "epoch": 2964} {"train_loss": -6.515752792358398, "global_step": 124495, "epoch": 2964} {"train_loss": -6.5894269943237305, "global_step": 124496, "epoch": 2964} {"train_loss": -6.577663421630859, "global_step": 124497, "epoch": 2964} {"train_loss": -6.563224792480469, "global_step": 124498, "epoch": 2964} {"train_loss": -6.696000099182129, "global_step": 124499, "epoch": 2964} {"train_loss": -6.477013111114502, "global_step": 124500, "epoch": 2964} {"train_loss": -6.6506805419921875, "global_step": 124501, "epoch": 2964} {"train_loss": -6.601452350616455, "global_step": 124502, "epoch": 2964} {"train_loss": -6.603208541870117, "global_step": 124503, "epoch": 2964} {"train_loss": -6.486191272735596, "global_step": 124504, "epoch": 2964} {"train_loss": -6.538516998291016, "global_step": 124505, "epoch": 2964} {"train_loss": -6.623088836669922, "global_step": 124506, "epoch": 2964} {"train_loss": -6.554140567779541, "global_step": 124507, "epoch": 2964} {"train_loss": -6.644321441650391, "global_step": 124508, "epoch": 2964} {"train_loss": -6.529750347137451, "global_step": 124509, "epoch": 2964} {"train_loss": -6.54299259185791, "global_step": 124510, "epoch": 2964} {"train_loss": -6.5207929611206055, "global_step": 124511, "epoch": 2964} {"train_loss": -6.576827049255371, "global_step": 124512, "epoch": 2964} {"train_loss": -6.603233337402344, "global_step": 124513, "epoch": 2964} {"train_loss": -6.572171211242676, "global_step": 124514, "epoch": 2964} {"train_loss": -6.421532154083252, "global_step": 124515, "epoch": 2964} {"train_loss": -6.550514221191406, "global_step": 124516, "epoch": 2964} {"train_loss": -6.465959072113037, "global_step": 124517, "epoch": 2964} {"train_loss": -6.6192731857299805, "global_step": 124518, "epoch": 2964} {"train_loss": -6.488764762878418, "global_step": 124519, "epoch": 2964} {"train_loss": -6.532687187194824, "global_step": 124520, "epoch": 2964} {"train_loss": -6.526803970336914, "global_step": 124521, "epoch": 2964} {"train_loss": -6.471016883850098, "global_step": 124522, "epoch": 2964} {"train_loss": -6.49537467956543, "global_step": 124523, "epoch": 2964} {"train_loss": -6.56755256652832, "global_step": 124524, "epoch": 2964} {"train_loss": -6.515439987182617, "global_step": 124525, "epoch": 2964} {"train_loss": -6.583235740661621, "global_step": 124526, "epoch": 2964} {"train_loss": -6.643174171447754, "global_step": 124527, "epoch": 2964} {"train_loss": -6.655061721801758, "global_step": 124528, "epoch": 2964} {"train_loss": -6.556806870869228, "global_step": 124529, "epoch": 2964, "val_loss": 67918.828125} {"train_loss": -6.613951683044434, "global_step": 124530, "epoch": 2965} {"train_loss": -6.611255168914795, "global_step": 124531, "epoch": 2965} {"train_loss": -6.514920234680176, "global_step": 124532, "epoch": 2965} {"train_loss": -6.611404895782471, "global_step": 124533, "epoch": 2965} {"train_loss": -6.563371658325195, "global_step": 124534, "epoch": 2965} {"train_loss": -6.567946434020996, "global_step": 124535, "epoch": 2965} {"train_loss": -6.60448694229126, "global_step": 124536, "epoch": 2965} {"train_loss": -6.515857219696045, "global_step": 124537, "epoch": 2965} {"train_loss": -6.730128288269043, "global_step": 124538, "epoch": 2965} {"train_loss": -6.546719551086426, "global_step": 124539, "epoch": 2965} {"train_loss": -6.702517509460449, "global_step": 124540, "epoch": 2965} {"train_loss": -6.605733871459961, "global_step": 124541, "epoch": 2965} {"train_loss": -6.552694320678711, "global_step": 124542, "epoch": 2965} {"train_loss": -6.622067451477051, "global_step": 124543, "epoch": 2965} {"train_loss": -6.627764701843262, "global_step": 124544, "epoch": 2965} {"train_loss": -6.544332504272461, "global_step": 124545, "epoch": 2965} {"train_loss": -6.574617385864258, "global_step": 124546, "epoch": 2965} {"train_loss": -6.645524978637695, "global_step": 124547, "epoch": 2965} {"train_loss": -6.644728183746338, "global_step": 124548, "epoch": 2965} {"train_loss": -6.665478706359863, "global_step": 124549, "epoch": 2965} {"train_loss": -6.614389419555664, "global_step": 124550, "epoch": 2965} {"train_loss": -6.5278191566467285, "global_step": 124551, "epoch": 2965} {"train_loss": -6.539535045623779, "global_step": 124552, "epoch": 2965} {"train_loss": -6.498761177062988, "global_step": 124553, "epoch": 2965} {"train_loss": -6.673672199249268, "global_step": 124554, "epoch": 2965} {"train_loss": -6.554873466491699, "global_step": 124555, "epoch": 2965} {"train_loss": -6.523310661315918, "global_step": 124556, "epoch": 2965} {"train_loss": -6.603744029998779, "global_step": 124557, "epoch": 2965} {"train_loss": -6.54763650894165, "global_step": 124558, "epoch": 2965} {"train_loss": -6.653713226318359, "global_step": 124559, "epoch": 2965} {"train_loss": -6.538593292236328, "global_step": 124560, "epoch": 2965} {"train_loss": -6.659292221069336, "global_step": 124561, "epoch": 2965} {"train_loss": -6.694076061248779, "global_step": 124562, "epoch": 2965} {"train_loss": -6.435497283935547, "global_step": 124563, "epoch": 2965} {"train_loss": -6.548770904541016, "global_step": 124564, "epoch": 2965} {"train_loss": -6.603667259216309, "global_step": 124565, "epoch": 2965} {"train_loss": -6.661419868469238, "global_step": 124566, "epoch": 2965} {"train_loss": -6.63364315032959, "global_step": 124567, "epoch": 2965} {"train_loss": -6.571658134460449, "global_step": 124568, "epoch": 2965} {"train_loss": -6.602722644805908, "global_step": 124569, "epoch": 2965} {"train_loss": -6.638537406921387, "global_step": 124570, "epoch": 2965} {"train_loss": -6.594927980786278, "global_step": 124571, "epoch": 2965, "val_loss": 68047.8125} {"train_loss": -6.5598225593566895, "global_step": 124572, "epoch": 2966} {"train_loss": -6.549196243286133, "global_step": 124573, "epoch": 2966} {"train_loss": -6.592363357543945, "global_step": 124574, "epoch": 2966} {"train_loss": -6.518791198730469, "global_step": 124575, "epoch": 2966} {"train_loss": -6.651646614074707, "global_step": 124576, "epoch": 2966} {"train_loss": -6.633575439453125, "global_step": 124577, "epoch": 2966} {"train_loss": -6.652884006500244, "global_step": 124578, "epoch": 2966} {"train_loss": -6.538043022155762, "global_step": 124579, "epoch": 2966} {"train_loss": -6.620056629180908, "global_step": 124580, "epoch": 2966} {"train_loss": -6.564309120178223, "global_step": 124581, "epoch": 2966} {"train_loss": -6.610875129699707, "global_step": 124582, "epoch": 2966} {"train_loss": -6.63162899017334, "global_step": 124583, "epoch": 2966} {"train_loss": -6.5096235275268555, "global_step": 124584, "epoch": 2966} {"train_loss": -6.548398494720459, "global_step": 124585, "epoch": 2966} {"train_loss": -6.559355735778809, "global_step": 124586, "epoch": 2966} {"train_loss": -6.567090034484863, "global_step": 124587, "epoch": 2966} {"train_loss": -6.639327526092529, "global_step": 124588, "epoch": 2966} {"train_loss": -6.698309898376465, "global_step": 124589, "epoch": 2966} {"train_loss": -6.56717586517334, "global_step": 124590, "epoch": 2966} {"train_loss": -6.520943641662598, "global_step": 124591, "epoch": 2966} {"train_loss": -6.531138896942139, "global_step": 124592, "epoch": 2966} {"train_loss": -6.484514236450195, "global_step": 124593, "epoch": 2966} {"train_loss": -6.572909355163574, "global_step": 124594, "epoch": 2966} {"train_loss": -6.453505516052246, "global_step": 124595, "epoch": 2966} {"train_loss": -6.634105682373047, "global_step": 124596, "epoch": 2966} {"train_loss": -6.488418102264404, "global_step": 124597, "epoch": 2966} {"train_loss": -6.500059127807617, "global_step": 124598, "epoch": 2966} {"train_loss": -6.588595867156982, "global_step": 124599, "epoch": 2966} {"train_loss": -6.502078056335449, "global_step": 124600, "epoch": 2966} {"train_loss": -6.438294887542725, "global_step": 124601, "epoch": 2966} {"train_loss": -6.548583030700684, "global_step": 124602, "epoch": 2966} {"train_loss": -6.50278377532959, "global_step": 124603, "epoch": 2966} {"train_loss": -6.574501991271973, "global_step": 124604, "epoch": 2966} {"train_loss": -6.485358238220215, "global_step": 124605, "epoch": 2966} {"train_loss": -6.545649528503418, "global_step": 124606, "epoch": 2966} {"train_loss": -6.562585353851318, "global_step": 124607, "epoch": 2966} {"train_loss": -6.596258163452148, "global_step": 124608, "epoch": 2966} {"train_loss": -6.582474231719971, "global_step": 124609, "epoch": 2966} {"train_loss": -6.622225284576416, "global_step": 124610, "epoch": 2966} {"train_loss": -6.549988746643066, "global_step": 124611, "epoch": 2966} {"train_loss": -6.589097023010254, "global_step": 124612, "epoch": 2966} {"train_loss": -6.5645178726741245, "global_step": 124613, "epoch": 2966, "val_loss": 68224.3359375} {"train_loss": -6.514169692993164, "global_step": 124614, "epoch": 2967} {"train_loss": -6.470126628875732, "global_step": 124615, "epoch": 2967} {"train_loss": -6.670468807220459, "global_step": 124616, "epoch": 2967} {"train_loss": -6.539310455322266, "global_step": 124617, "epoch": 2967} {"train_loss": -6.524423599243164, "global_step": 124618, "epoch": 2967} {"train_loss": -6.553752422332764, "global_step": 124619, "epoch": 2967} {"train_loss": -6.500110626220703, "global_step": 124620, "epoch": 2967} {"train_loss": -6.556578636169434, "global_step": 124621, "epoch": 2967} {"train_loss": -6.5424699783325195, "global_step": 124622, "epoch": 2967} {"train_loss": -6.5974578857421875, "global_step": 124623, "epoch": 2967} {"train_loss": -6.525882720947266, "global_step": 124624, "epoch": 2967} {"train_loss": -6.643930435180664, "global_step": 124625, "epoch": 2967} {"train_loss": -6.6446943283081055, "global_step": 124626, "epoch": 2967} {"train_loss": -6.5282487869262695, "global_step": 124627, "epoch": 2967} {"train_loss": -6.708370685577393, "global_step": 124628, "epoch": 2967} {"train_loss": -6.694896221160889, "global_step": 124629, "epoch": 2967} {"train_loss": -6.599782466888428, "global_step": 124630, "epoch": 2967} {"train_loss": -6.5435991287231445, "global_step": 124631, "epoch": 2967} {"train_loss": -6.6326799392700195, "global_step": 124632, "epoch": 2967} {"train_loss": -6.702901840209961, "global_step": 124633, "epoch": 2967} {"train_loss": -6.611410140991211, "global_step": 124634, "epoch": 2967} {"train_loss": -6.605182647705078, "global_step": 124635, "epoch": 2967} {"train_loss": -6.594675064086914, "global_step": 124636, "epoch": 2967} {"train_loss": -6.473660469055176, "global_step": 124637, "epoch": 2967} {"train_loss": -6.510676383972168, "global_step": 124638, "epoch": 2967} {"train_loss": -6.620190620422363, "global_step": 124639, "epoch": 2967} {"train_loss": -6.618071556091309, "global_step": 124640, "epoch": 2967} {"train_loss": -6.5517377853393555, "global_step": 124641, "epoch": 2967} {"train_loss": -6.462194442749023, "global_step": 124642, "epoch": 2967} {"train_loss": -6.551682472229004, "global_step": 124643, "epoch": 2967} {"train_loss": -6.486706733703613, "global_step": 124644, "epoch": 2967} {"train_loss": -6.461787223815918, "global_step": 124645, "epoch": 2967} {"train_loss": -6.5630645751953125, "global_step": 124646, "epoch": 2967} {"train_loss": -6.495965003967285, "global_step": 124647, "epoch": 2967} {"train_loss": -6.491433143615723, "global_step": 124648, "epoch": 2967} {"train_loss": -6.500728607177734, "global_step": 124649, "epoch": 2967} {"train_loss": -6.6007466316223145, "global_step": 124650, "epoch": 2967} {"train_loss": -6.568391799926758, "global_step": 124651, "epoch": 2967} {"train_loss": -6.4824347496032715, "global_step": 124652, "epoch": 2967} {"train_loss": -6.6097612380981445, "global_step": 124653, "epoch": 2967} {"train_loss": -6.4850850105285645, "global_step": 124654, "epoch": 2967} {"train_loss": -6.56333757582165, "global_step": 124655, "epoch": 2967, "val_loss": 67973.515625} {"train_loss": -6.610891819000244, "global_step": 124656, "epoch": 2968} {"train_loss": -6.547324180603027, "global_step": 124657, "epoch": 2968} {"train_loss": -6.575145721435547, "global_step": 124658, "epoch": 2968} {"train_loss": -6.524917125701904, "global_step": 124659, "epoch": 2968} {"train_loss": -6.5713701248168945, "global_step": 124660, "epoch": 2968} {"train_loss": -6.527527809143066, "global_step": 124661, "epoch": 2968} {"train_loss": -6.5530500411987305, "global_step": 124662, "epoch": 2968} {"train_loss": -6.490758895874023, "global_step": 124663, "epoch": 2968} {"train_loss": -6.559421539306641, "global_step": 124664, "epoch": 2968} {"train_loss": -6.515562057495117, "global_step": 124665, "epoch": 2968} {"train_loss": -6.5907440185546875, "global_step": 124666, "epoch": 2968} {"train_loss": -6.5158162117004395, "global_step": 124667, "epoch": 2968} {"train_loss": -6.570975303649902, "global_step": 124668, "epoch": 2968} {"train_loss": -6.564087867736816, "global_step": 124669, "epoch": 2968} {"train_loss": -6.639420509338379, "global_step": 124670, "epoch": 2968} {"train_loss": -6.5296831130981445, "global_step": 124671, "epoch": 2968} {"train_loss": -6.614173889160156, "global_step": 124672, "epoch": 2968} {"train_loss": -6.490727424621582, "global_step": 124673, "epoch": 2968} {"train_loss": -6.688666343688965, "global_step": 124674, "epoch": 2968} {"train_loss": -6.574970245361328, "global_step": 124675, "epoch": 2968} {"train_loss": -6.613157272338867, "global_step": 124676, "epoch": 2968} {"train_loss": -6.617836952209473, "global_step": 124677, "epoch": 2968} {"train_loss": -6.529651165008545, "global_step": 124678, "epoch": 2968} {"train_loss": -6.640878677368164, "global_step": 124679, "epoch": 2968} {"train_loss": -6.531693458557129, "global_step": 124680, "epoch": 2968} {"train_loss": -6.608991622924805, "global_step": 124681, "epoch": 2968} {"train_loss": -6.6038007736206055, "global_step": 124682, "epoch": 2968} {"train_loss": -6.526956081390381, "global_step": 124683, "epoch": 2968} {"train_loss": -6.581284523010254, "global_step": 124684, "epoch": 2968} {"train_loss": -6.623387336730957, "global_step": 124685, "epoch": 2968} {"train_loss": -6.711826324462891, "global_step": 124686, "epoch": 2968} {"train_loss": -6.678332328796387, "global_step": 124687, "epoch": 2968} {"train_loss": -6.65528678894043, "global_step": 124688, "epoch": 2968} {"train_loss": -6.586224555969238, "global_step": 124689, "epoch": 2968} {"train_loss": -6.474037170410156, "global_step": 124690, "epoch": 2968} {"train_loss": -6.751013278961182, "global_step": 124691, "epoch": 2968} {"train_loss": -6.5565385818481445, "global_step": 124692, "epoch": 2968} {"train_loss": -6.623733043670654, "global_step": 124693, "epoch": 2968} {"train_loss": -6.512237548828125, "global_step": 124694, "epoch": 2968} {"train_loss": -6.502309322357178, "global_step": 124695, "epoch": 2968} {"train_loss": -6.55648136138916, "global_step": 124696, "epoch": 2968} {"train_loss": -6.575945138931274, "global_step": 124697, "epoch": 2968, "val_loss": 68177.21875} {"train_loss": -6.536992073059082, "global_step": 124698, "epoch": 2969} {"train_loss": -6.530834197998047, "global_step": 124699, "epoch": 2969} {"train_loss": -6.516633033752441, "global_step": 124700, "epoch": 2969} {"train_loss": -6.4228105545043945, "global_step": 124701, "epoch": 2969} {"train_loss": -6.522748947143555, "global_step": 124702, "epoch": 2969} {"train_loss": -6.474366188049316, "global_step": 124703, "epoch": 2969} {"train_loss": -6.615920066833496, "global_step": 124704, "epoch": 2969} {"train_loss": -6.594461917877197, "global_step": 124705, "epoch": 2969} {"train_loss": -6.395329475402832, "global_step": 124706, "epoch": 2969} {"train_loss": -6.499058246612549, "global_step": 124707, "epoch": 2969} {"train_loss": -6.490875720977783, "global_step": 124708, "epoch": 2969} {"train_loss": -6.529594421386719, "global_step": 124709, "epoch": 2969} {"train_loss": -6.577578544616699, "global_step": 124710, "epoch": 2969} {"train_loss": -6.547224044799805, "global_step": 124711, "epoch": 2969} {"train_loss": -6.613208770751953, "global_step": 124712, "epoch": 2969} {"train_loss": -6.562322616577148, "global_step": 124713, "epoch": 2969} {"train_loss": -6.617485523223877, "global_step": 124714, "epoch": 2969} {"train_loss": -6.680263519287109, "global_step": 124715, "epoch": 2969} {"train_loss": -6.48410701751709, "global_step": 124716, "epoch": 2969} {"train_loss": -6.586868762969971, "global_step": 124717, "epoch": 2969} {"train_loss": -6.603703498840332, "global_step": 124718, "epoch": 2969} {"train_loss": -6.57973575592041, "global_step": 124719, "epoch": 2969} {"train_loss": -6.567963123321533, "global_step": 124720, "epoch": 2969} {"train_loss": -6.484640121459961, "global_step": 124721, "epoch": 2969} {"train_loss": -6.578482627868652, "global_step": 124722, "epoch": 2969} {"train_loss": -6.53317928314209, "global_step": 124723, "epoch": 2969} {"train_loss": -6.63238525390625, "global_step": 124724, "epoch": 2969} {"train_loss": -6.508739471435547, "global_step": 124725, "epoch": 2969} {"train_loss": -6.508050441741943, "global_step": 124726, "epoch": 2969} {"train_loss": -6.649932861328125, "global_step": 124727, "epoch": 2969} {"train_loss": -6.636539936065674, "global_step": 124728, "epoch": 2969} {"train_loss": -6.496397972106934, "global_step": 124729, "epoch": 2969} {"train_loss": -6.522974967956543, "global_step": 124730, "epoch": 2969} {"train_loss": -6.511786460876465, "global_step": 124731, "epoch": 2969} {"train_loss": -6.607322692871094, "global_step": 124732, "epoch": 2969} {"train_loss": -6.572151184082031, "global_step": 124733, "epoch": 2969} {"train_loss": -6.442081928253174, "global_step": 124734, "epoch": 2969} {"train_loss": -6.653296947479248, "global_step": 124735, "epoch": 2969} {"train_loss": -6.518390655517578, "global_step": 124736, "epoch": 2969} {"train_loss": -6.468114852905273, "global_step": 124737, "epoch": 2969} {"train_loss": -6.576874732971191, "global_step": 124738, "epoch": 2969} {"train_loss": -6.549412375404721, "global_step": 124739, "epoch": 2969, "val_loss": 68035.7109375} {"train_loss": -6.507787704467773, "global_step": 124740, "epoch": 2970} {"train_loss": -6.62918758392334, "global_step": 124741, "epoch": 2970} {"train_loss": -6.488959312438965, "global_step": 124742, "epoch": 2970} {"train_loss": -6.596081733703613, "global_step": 124743, "epoch": 2970} {"train_loss": -6.577482223510742, "global_step": 124744, "epoch": 2970} {"train_loss": -6.511516571044922, "global_step": 124745, "epoch": 2970} {"train_loss": -6.639890670776367, "global_step": 124746, "epoch": 2970} {"train_loss": -6.595753192901611, "global_step": 124747, "epoch": 2970} {"train_loss": -6.453158378601074, "global_step": 124748, "epoch": 2970} {"train_loss": -6.504406929016113, "global_step": 124749, "epoch": 2970} {"train_loss": -6.68120002746582, "global_step": 124750, "epoch": 2970} {"train_loss": -6.611344814300537, "global_step": 124751, "epoch": 2970} {"train_loss": -6.546966075897217, "global_step": 124752, "epoch": 2970} {"train_loss": -6.509085178375244, "global_step": 124753, "epoch": 2970} {"train_loss": -6.54132080078125, "global_step": 124754, "epoch": 2970} {"train_loss": -6.441389560699463, "global_step": 124755, "epoch": 2970} {"train_loss": -6.506258010864258, "global_step": 124756, "epoch": 2970} {"train_loss": -6.648880958557129, "global_step": 124757, "epoch": 2970} {"train_loss": -6.582294464111328, "global_step": 124758, "epoch": 2970} {"train_loss": -6.5777506828308105, "global_step": 124759, "epoch": 2970} {"train_loss": -6.606575965881348, "global_step": 124760, "epoch": 2970} {"train_loss": -6.582884788513184, "global_step": 124761, "epoch": 2970} {"train_loss": -6.462615013122559, "global_step": 124762, "epoch": 2970} {"train_loss": -6.677319526672363, "global_step": 124763, "epoch": 2970} {"train_loss": -6.633776664733887, "global_step": 124764, "epoch": 2970} {"train_loss": -6.513517379760742, "global_step": 124765, "epoch": 2970} {"train_loss": -6.582599639892578, "global_step": 124766, "epoch": 2970} {"train_loss": -6.596996784210205, "global_step": 124767, "epoch": 2970} {"train_loss": -6.503824234008789, "global_step": 124768, "epoch": 2970} {"train_loss": -6.516086578369141, "global_step": 124769, "epoch": 2970} {"train_loss": -6.52557373046875, "global_step": 124770, "epoch": 2970} {"train_loss": -6.678309440612793, "global_step": 124771, "epoch": 2970} {"train_loss": -6.503844261169434, "global_step": 124772, "epoch": 2970} {"train_loss": -6.6355791091918945, "global_step": 124773, "epoch": 2970} {"train_loss": -6.570420742034912, "global_step": 124774, "epoch": 2970} {"train_loss": -6.476366996765137, "global_step": 124775, "epoch": 2970} {"train_loss": -6.591022491455078, "global_step": 124776, "epoch": 2970} {"train_loss": -6.563413143157959, "global_step": 124777, "epoch": 2970} {"train_loss": -6.490106582641602, "global_step": 124778, "epoch": 2970} {"train_loss": -6.4217681884765625, "global_step": 124779, "epoch": 2970} {"train_loss": -6.4183549880981445, "global_step": 124780, "epoch": 2970} {"train_loss": -6.5553310598645895, "global_step": 124781, "epoch": 2970, "val_loss": 68074.9921875} {"train_loss": -6.434907913208008, "global_step": 124782, "epoch": 2971} {"train_loss": -6.576944351196289, "global_step": 124783, "epoch": 2971} {"train_loss": -6.556366443634033, "global_step": 124784, "epoch": 2971} {"train_loss": -6.558869361877441, "global_step": 124785, "epoch": 2971} {"train_loss": -6.485324859619141, "global_step": 124786, "epoch": 2971} {"train_loss": -6.670949459075928, "global_step": 124787, "epoch": 2971} {"train_loss": -6.542993068695068, "global_step": 124788, "epoch": 2971} {"train_loss": -6.431110382080078, "global_step": 124789, "epoch": 2971} {"train_loss": -6.657210826873779, "global_step": 124790, "epoch": 2971} {"train_loss": -6.473994255065918, "global_step": 124791, "epoch": 2971} {"train_loss": -6.549171447753906, "global_step": 124792, "epoch": 2971} {"train_loss": -6.577750205993652, "global_step": 124793, "epoch": 2971} {"train_loss": -6.390909671783447, "global_step": 124794, "epoch": 2971} {"train_loss": -6.623358726501465, "global_step": 124795, "epoch": 2971} {"train_loss": -6.519102096557617, "global_step": 124796, "epoch": 2971} {"train_loss": -6.564942359924316, "global_step": 124797, "epoch": 2971} {"train_loss": -6.568392753601074, "global_step": 124798, "epoch": 2971} {"train_loss": -6.507835388183594, "global_step": 124799, "epoch": 2971} {"train_loss": -6.490006923675537, "global_step": 124800, "epoch": 2971} {"train_loss": -6.564754486083984, "global_step": 124801, "epoch": 2971} {"train_loss": -6.533813953399658, "global_step": 124802, "epoch": 2971} {"train_loss": -6.611332893371582, "global_step": 124803, "epoch": 2971} {"train_loss": -6.433335781097412, "global_step": 124804, "epoch": 2971} {"train_loss": -6.54722261428833, "global_step": 124805, "epoch": 2971} {"train_loss": -6.407747745513916, "global_step": 124806, "epoch": 2971} {"train_loss": -6.45051383972168, "global_step": 124807, "epoch": 2971} {"train_loss": -6.512020111083984, "global_step": 124808, "epoch": 2971} {"train_loss": -6.394863128662109, "global_step": 124809, "epoch": 2971} {"train_loss": -6.354464530944824, "global_step": 124810, "epoch": 2971} {"train_loss": -6.39891242980957, "global_step": 124811, "epoch": 2971} {"train_loss": -6.33524227142334, "global_step": 124812, "epoch": 2971} {"train_loss": -6.394006729125977, "global_step": 124813, "epoch": 2971} {"train_loss": -6.32769250869751, "global_step": 124814, "epoch": 2971} {"train_loss": -6.395020484924316, "global_step": 124815, "epoch": 2971} {"train_loss": -6.321723461151123, "global_step": 124816, "epoch": 2971} {"train_loss": -6.551845073699951, "global_step": 124817, "epoch": 2971} {"train_loss": -6.394781589508057, "global_step": 124818, "epoch": 2971} {"train_loss": -6.455395221710205, "global_step": 124819, "epoch": 2971} {"train_loss": -6.427651405334473, "global_step": 124820, "epoch": 2971} {"train_loss": -6.562089443206787, "global_step": 124821, "epoch": 2971} {"train_loss": -6.495296478271484, "global_step": 124822, "epoch": 2971} {"train_loss": -6.49017444111052, "global_step": 124823, "epoch": 2971, "val_loss": 68156.390625} {"train_loss": -6.505763053894043, "global_step": 124824, "epoch": 2972} {"train_loss": -6.438415050506592, "global_step": 124825, "epoch": 2972} {"train_loss": -6.517764091491699, "global_step": 124826, "epoch": 2972} {"train_loss": -6.540598392486572, "global_step": 124827, "epoch": 2972} {"train_loss": -6.505710601806641, "global_step": 124828, "epoch": 2972} {"train_loss": -6.612442493438721, "global_step": 124829, "epoch": 2972} {"train_loss": -6.655570030212402, "global_step": 124830, "epoch": 2972} {"train_loss": -6.596236228942871, "global_step": 124831, "epoch": 2972} {"train_loss": -6.58704948425293, "global_step": 124832, "epoch": 2972} {"train_loss": -6.647670269012451, "global_step": 124833, "epoch": 2972} {"train_loss": -6.475586891174316, "global_step": 124834, "epoch": 2972} {"train_loss": -6.520535945892334, "global_step": 124835, "epoch": 2972} {"train_loss": -6.563634872436523, "global_step": 124836, "epoch": 2972} {"train_loss": -6.6391682624816895, "global_step": 124837, "epoch": 2972} {"train_loss": -6.610752105712891, "global_step": 124838, "epoch": 2972} {"train_loss": -6.630466461181641, "global_step": 124839, "epoch": 2972} {"train_loss": -6.553656578063965, "global_step": 124840, "epoch": 2972} {"train_loss": -6.638188362121582, "global_step": 124841, "epoch": 2972} {"train_loss": -6.476221084594727, "global_step": 124842, "epoch": 2972} {"train_loss": -6.6800947189331055, "global_step": 124843, "epoch": 2972} {"train_loss": -6.81173038482666, "global_step": 124844, "epoch": 2972} {"train_loss": -6.658150672912598, "global_step": 124845, "epoch": 2972} {"train_loss": -6.593920707702637, "global_step": 124846, "epoch": 2972} {"train_loss": -6.712224006652832, "global_step": 124847, "epoch": 2972} {"train_loss": -6.640198230743408, "global_step": 124848, "epoch": 2972} {"train_loss": -6.680478572845459, "global_step": 124849, "epoch": 2972} {"train_loss": -6.614203453063965, "global_step": 124850, "epoch": 2972} {"train_loss": -6.551504135131836, "global_step": 124851, "epoch": 2972} {"train_loss": -6.594389915466309, "global_step": 124852, "epoch": 2972} {"train_loss": -6.585702419281006, "global_step": 124853, "epoch": 2972} {"train_loss": -6.628113746643066, "global_step": 124854, "epoch": 2972} {"train_loss": -6.535210609436035, "global_step": 124855, "epoch": 2972} {"train_loss": -6.655291557312012, "global_step": 124856, "epoch": 2972} {"train_loss": -6.550190448760986, "global_step": 124857, "epoch": 2972} {"train_loss": -6.52855110168457, "global_step": 124858, "epoch": 2972} {"train_loss": -6.596363067626953, "global_step": 124859, "epoch": 2972} {"train_loss": -6.543766975402832, "global_step": 124860, "epoch": 2972} {"train_loss": -6.610926628112793, "global_step": 124861, "epoch": 2972} {"train_loss": -6.718570709228516, "global_step": 124862, "epoch": 2972} {"train_loss": -6.661649703979492, "global_step": 124863, "epoch": 2972} {"train_loss": -6.45156192779541, "global_step": 124864, "epoch": 2972} {"train_loss": -6.591357174373808, "global_step": 124865, "epoch": 2972, "val_loss": 68048.703125} {"train_loss": -6.605685234069824, "global_step": 124866, "epoch": 2973} {"train_loss": -6.687316417694092, "global_step": 124867, "epoch": 2973} {"train_loss": -6.6462273597717285, "global_step": 124868, "epoch": 2973} {"train_loss": -6.595065116882324, "global_step": 124869, "epoch": 2973} {"train_loss": -6.628401756286621, "global_step": 124870, "epoch": 2973} {"train_loss": -6.60563850402832, "global_step": 124871, "epoch": 2973} {"train_loss": -6.633709907531738, "global_step": 124872, "epoch": 2973} {"train_loss": -6.608948707580566, "global_step": 124873, "epoch": 2973} {"train_loss": -6.57985782623291, "global_step": 124874, "epoch": 2973} {"train_loss": -6.624123573303223, "global_step": 124875, "epoch": 2973} {"train_loss": -6.610407829284668, "global_step": 124876, "epoch": 2973} {"train_loss": -6.617652416229248, "global_step": 124877, "epoch": 2973} {"train_loss": -6.656129837036133, "global_step": 124878, "epoch": 2973} {"train_loss": -6.608283996582031, "global_step": 124879, "epoch": 2973} {"train_loss": -6.510776519775391, "global_step": 124880, "epoch": 2973} {"train_loss": -6.512284278869629, "global_step": 124881, "epoch": 2973} {"train_loss": -6.682964324951172, "global_step": 124882, "epoch": 2973} {"train_loss": -6.657070636749268, "global_step": 124883, "epoch": 2973} {"train_loss": -6.621469974517822, "global_step": 124884, "epoch": 2973} {"train_loss": -6.514575004577637, "global_step": 124885, "epoch": 2973} {"train_loss": -6.652653694152832, "global_step": 124886, "epoch": 2973} {"train_loss": -6.552147388458252, "global_step": 124887, "epoch": 2973} {"train_loss": -6.67066764831543, "global_step": 124888, "epoch": 2973} {"train_loss": -6.608686447143555, "global_step": 124889, "epoch": 2973} {"train_loss": -6.668916702270508, "global_step": 124890, "epoch": 2973} {"train_loss": -6.6070380210876465, "global_step": 124891, "epoch": 2973} {"train_loss": -6.670774936676025, "global_step": 124892, "epoch": 2973} {"train_loss": -6.664707183837891, "global_step": 124893, "epoch": 2973} {"train_loss": -6.5318803787231445, "global_step": 124894, "epoch": 2973} {"train_loss": -6.454829216003418, "global_step": 124895, "epoch": 2973} {"train_loss": -6.654967308044434, "global_step": 124896, "epoch": 2973} {"train_loss": -6.473465919494629, "global_step": 124897, "epoch": 2973} {"train_loss": -6.528670310974121, "global_step": 124898, "epoch": 2973} {"train_loss": -6.495075702667236, "global_step": 124899, "epoch": 2973} {"train_loss": -6.568299293518066, "global_step": 124900, "epoch": 2973} {"train_loss": -6.6015625, "global_step": 124901, "epoch": 2973} {"train_loss": -6.612239837646484, "global_step": 124902, "epoch": 2973} {"train_loss": -6.45350456237793, "global_step": 124903, "epoch": 2973} {"train_loss": -6.62996768951416, "global_step": 124904, "epoch": 2973} {"train_loss": -6.554306983947754, "global_step": 124905, "epoch": 2973} {"train_loss": -6.633814811706543, "global_step": 124906, "epoch": 2973} {"train_loss": -6.597031570616222, "global_step": 124907, "epoch": 2973, "val_loss": 67956.53125} {"train_loss": -6.648541450500488, "global_step": 124908, "epoch": 2974} {"train_loss": -6.574936866760254, "global_step": 124909, "epoch": 2974} {"train_loss": -6.4611735343933105, "global_step": 124910, "epoch": 2974} {"train_loss": -6.537192344665527, "global_step": 124911, "epoch": 2974} {"train_loss": -6.49664831161499, "global_step": 124912, "epoch": 2974} {"train_loss": -6.5086140632629395, "global_step": 124913, "epoch": 2974} {"train_loss": -6.6469221115112305, "global_step": 124914, "epoch": 2974} {"train_loss": -6.5147576332092285, "global_step": 124915, "epoch": 2974} {"train_loss": -6.664011001586914, "global_step": 124916, "epoch": 2974} {"train_loss": -6.530429840087891, "global_step": 124917, "epoch": 2974} {"train_loss": -6.541010856628418, "global_step": 124918, "epoch": 2974} {"train_loss": -6.610095977783203, "global_step": 124919, "epoch": 2974} {"train_loss": -6.554381847381592, "global_step": 124920, "epoch": 2974} {"train_loss": -6.566375732421875, "global_step": 124921, "epoch": 2974} {"train_loss": -6.606705188751221, "global_step": 124922, "epoch": 2974} {"train_loss": -6.637605667114258, "global_step": 124923, "epoch": 2974} {"train_loss": -6.5941691398620605, "global_step": 124924, "epoch": 2974} {"train_loss": -6.503535747528076, "global_step": 124925, "epoch": 2974} {"train_loss": -6.667623519897461, "global_step": 124926, "epoch": 2974} {"train_loss": -6.5805864334106445, "global_step": 124927, "epoch": 2974} {"train_loss": -6.532498359680176, "global_step": 124928, "epoch": 2974} {"train_loss": -6.722947120666504, "global_step": 124929, "epoch": 2974} {"train_loss": -6.5763397216796875, "global_step": 124930, "epoch": 2974} {"train_loss": -6.661391258239746, "global_step": 124931, "epoch": 2974} {"train_loss": -6.715729713439941, "global_step": 124932, "epoch": 2974} {"train_loss": -6.641654014587402, "global_step": 124933, "epoch": 2974} {"train_loss": -6.60829496383667, "global_step": 124934, "epoch": 2974} {"train_loss": -6.546004772186279, "global_step": 124935, "epoch": 2974} {"train_loss": -6.625550270080566, "global_step": 124936, "epoch": 2974} {"train_loss": -6.4983134269714355, "global_step": 124937, "epoch": 2974} {"train_loss": -6.48629093170166, "global_step": 124938, "epoch": 2974} {"train_loss": -6.637956619262695, "global_step": 124939, "epoch": 2974} {"train_loss": -6.668474197387695, "global_step": 124940, "epoch": 2974} {"train_loss": -6.611137866973877, "global_step": 124941, "epoch": 2974} {"train_loss": -6.561746597290039, "global_step": 124942, "epoch": 2974} {"train_loss": -6.55971622467041, "global_step": 124943, "epoch": 2974} {"train_loss": -6.636086940765381, "global_step": 124944, "epoch": 2974} {"train_loss": -6.559211254119873, "global_step": 124945, "epoch": 2974} {"train_loss": -6.548586368560791, "global_step": 124946, "epoch": 2974} {"train_loss": -6.562124252319336, "global_step": 124947, "epoch": 2974} {"train_loss": -6.696147918701172, "global_step": 124948, "epoch": 2974} {"train_loss": -6.588286899384999, "global_step": 124949, "epoch": 2974, "val_loss": 68125.0625} {"train_loss": -6.593649387359619, "global_step": 124950, "epoch": 2975} {"train_loss": -6.4713945388793945, "global_step": 124951, "epoch": 2975} {"train_loss": -6.622118949890137, "global_step": 124952, "epoch": 2975} {"train_loss": -6.660460472106934, "global_step": 124953, "epoch": 2975} {"train_loss": -6.584851264953613, "global_step": 124954, "epoch": 2975} {"train_loss": -6.5292558670043945, "global_step": 124955, "epoch": 2975} {"train_loss": -6.577487945556641, "global_step": 124956, "epoch": 2975} {"train_loss": -6.509824752807617, "global_step": 124957, "epoch": 2975} {"train_loss": -6.609197616577148, "global_step": 124958, "epoch": 2975} {"train_loss": -6.68892765045166, "global_step": 124959, "epoch": 2975} {"train_loss": -6.595139503479004, "global_step": 124960, "epoch": 2975} {"train_loss": -6.595707893371582, "global_step": 124961, "epoch": 2975} {"train_loss": -6.651363849639893, "global_step": 124962, "epoch": 2975} {"train_loss": -6.607437610626221, "global_step": 124963, "epoch": 2975} {"train_loss": -6.536314964294434, "global_step": 124964, "epoch": 2975} {"train_loss": -6.6437087059021, "global_step": 124965, "epoch": 2975} {"train_loss": -6.561012268066406, "global_step": 124966, "epoch": 2975} {"train_loss": -6.622030735015869, "global_step": 124967, "epoch": 2975} {"train_loss": -6.591073513031006, "global_step": 124968, "epoch": 2975} {"train_loss": -6.554232120513916, "global_step": 124969, "epoch": 2975} {"train_loss": -6.611573696136475, "global_step": 124970, "epoch": 2975} {"train_loss": -6.55182409286499, "global_step": 124971, "epoch": 2975} {"train_loss": -6.5917205810546875, "global_step": 124972, "epoch": 2975} {"train_loss": -6.642135143280029, "global_step": 124973, "epoch": 2975} {"train_loss": -6.576937198638916, "global_step": 124974, "epoch": 2975} {"train_loss": -6.544782638549805, "global_step": 124975, "epoch": 2975} {"train_loss": -6.512424468994141, "global_step": 124976, "epoch": 2975} {"train_loss": -6.474234580993652, "global_step": 124977, "epoch": 2975} {"train_loss": -6.614269256591797, "global_step": 124978, "epoch": 2975} {"train_loss": -6.620100975036621, "global_step": 124979, "epoch": 2975} {"train_loss": -6.605804443359375, "global_step": 124980, "epoch": 2975} {"train_loss": -6.567838668823242, "global_step": 124981, "epoch": 2975} {"train_loss": -6.602505207061768, "global_step": 124982, "epoch": 2975} {"train_loss": -6.576640605926514, "global_step": 124983, "epoch": 2975} {"train_loss": -6.574808120727539, "global_step": 124984, "epoch": 2975} {"train_loss": -6.653317928314209, "global_step": 124985, "epoch": 2975} {"train_loss": -6.574687957763672, "global_step": 124986, "epoch": 2975} {"train_loss": -6.726394176483154, "global_step": 124987, "epoch": 2975} {"train_loss": -6.677684783935547, "global_step": 124988, "epoch": 2975} {"train_loss": -6.555347919464111, "global_step": 124989, "epoch": 2975} {"train_loss": -6.569237232208252, "global_step": 124990, "epoch": 2975} {"train_loss": -6.59091736021496, "global_step": 124991, "epoch": 2975, "val_loss": 67927.875} {"train_loss": -6.686129093170166, "global_step": 124992, "epoch": 2976} {"train_loss": -6.61314582824707, "global_step": 124993, "epoch": 2976} {"train_loss": -6.5346832275390625, "global_step": 124994, "epoch": 2976} {"train_loss": -6.7069597244262695, "global_step": 124995, "epoch": 2976} {"train_loss": -6.652396202087402, "global_step": 124996, "epoch": 2976} {"train_loss": -6.695339679718018, "global_step": 124997, "epoch": 2976} {"train_loss": -6.6660003662109375, "global_step": 124998, "epoch": 2976} {"train_loss": -6.623263835906982, "global_step": 124999, "epoch": 2976} {"train_loss": -6.659786224365234, "global_step": 125000, "epoch": 2976} {"train_loss": -6.580138683319092, "global_step": 125001, "epoch": 2976} {"train_loss": -6.6214470863342285, "global_step": 125002, "epoch": 2976} {"train_loss": -6.4353485107421875, "global_step": 125003, "epoch": 2976} {"train_loss": -6.657751560211182, "global_step": 125004, "epoch": 2976} {"train_loss": -6.692014217376709, "global_step": 125005, "epoch": 2976} {"train_loss": -6.512631416320801, "global_step": 125006, "epoch": 2976} {"train_loss": -6.545623779296875, "global_step": 125007, "epoch": 2976} {"train_loss": -6.4565839767456055, "global_step": 125008, "epoch": 2976} {"train_loss": -6.402085304260254, "global_step": 125009, "epoch": 2976} {"train_loss": -6.586817264556885, "global_step": 125010, "epoch": 2976} {"train_loss": -6.549625873565674, "global_step": 125011, "epoch": 2976} {"train_loss": -6.586285591125488, "global_step": 125012, "epoch": 2976} {"train_loss": -6.528985500335693, "global_step": 125013, "epoch": 2976} {"train_loss": -6.45554256439209, "global_step": 125014, "epoch": 2976} {"train_loss": -6.484454154968262, "global_step": 125015, "epoch": 2976} {"train_loss": -6.57289981842041, "global_step": 125016, "epoch": 2976} {"train_loss": -6.532448768615723, "global_step": 125017, "epoch": 2976} {"train_loss": -6.439383029937744, "global_step": 125018, "epoch": 2976} {"train_loss": -6.596683025360107, "global_step": 125019, "epoch": 2976} {"train_loss": -6.495471000671387, "global_step": 125020, "epoch": 2976} {"train_loss": -6.637894630432129, "global_step": 125021, "epoch": 2976} {"train_loss": -6.596393585205078, "global_step": 125022, "epoch": 2976} {"train_loss": -6.662339687347412, "global_step": 125023, "epoch": 2976} {"train_loss": -6.508322238922119, "global_step": 125024, "epoch": 2976} {"train_loss": -6.442779541015625, "global_step": 125025, "epoch": 2976} {"train_loss": -6.663017272949219, "global_step": 125026, "epoch": 2976} {"train_loss": -6.665835857391357, "global_step": 125027, "epoch": 2976} {"train_loss": -6.591301918029785, "global_step": 125028, "epoch": 2976} {"train_loss": -6.558529853820801, "global_step": 125029, "epoch": 2976} {"train_loss": -6.352972507476807, "global_step": 125030, "epoch": 2976} {"train_loss": -6.490114688873291, "global_step": 125031, "epoch": 2976} {"train_loss": -6.346656799316406, "global_step": 125032, "epoch": 2976} {"train_loss": -6.5614271731603715, "global_step": 125033, "epoch": 2976, "val_loss": 68216.875} {"train_loss": -6.505754470825195, "global_step": 125034, "epoch": 2977} {"train_loss": -6.68719482421875, "global_step": 125035, "epoch": 2977} {"train_loss": -6.588751316070557, "global_step": 125036, "epoch": 2977} {"train_loss": -6.428642749786377, "global_step": 125037, "epoch": 2977} {"train_loss": -6.528792858123779, "global_step": 125038, "epoch": 2977} {"train_loss": -6.5542497634887695, "global_step": 125039, "epoch": 2977} {"train_loss": -6.606671333312988, "global_step": 125040, "epoch": 2977} {"train_loss": -6.543919563293457, "global_step": 125041, "epoch": 2977} {"train_loss": -6.529646873474121, "global_step": 125042, "epoch": 2977} {"train_loss": -6.591078281402588, "global_step": 125043, "epoch": 2977} {"train_loss": -6.566350936889648, "global_step": 125044, "epoch": 2977} {"train_loss": -6.575108051300049, "global_step": 125045, "epoch": 2977} {"train_loss": -6.6364593505859375, "global_step": 125046, "epoch": 2977} {"train_loss": -6.581663131713867, "global_step": 125047, "epoch": 2977} {"train_loss": -6.749513626098633, "global_step": 125048, "epoch": 2977} {"train_loss": -6.597151279449463, "global_step": 125049, "epoch": 2977} {"train_loss": -6.628290176391602, "global_step": 125050, "epoch": 2977} {"train_loss": -6.6337080001831055, "global_step": 125051, "epoch": 2977} {"train_loss": -6.547861099243164, "global_step": 125052, "epoch": 2977} {"train_loss": -6.573806285858154, "global_step": 125053, "epoch": 2977} {"train_loss": -6.619683742523193, "global_step": 125054, "epoch": 2977} {"train_loss": -6.566359519958496, "global_step": 125055, "epoch": 2977} {"train_loss": -6.620465278625488, "global_step": 125056, "epoch": 2977} {"train_loss": -6.5543975830078125, "global_step": 125057, "epoch": 2977} {"train_loss": -6.644482612609863, "global_step": 125058, "epoch": 2977} {"train_loss": -6.636139869689941, "global_step": 125059, "epoch": 2977} {"train_loss": -6.586259841918945, "global_step": 125060, "epoch": 2977} {"train_loss": -6.56118106842041, "global_step": 125061, "epoch": 2977} {"train_loss": -6.537890911102295, "global_step": 125062, "epoch": 2977} {"train_loss": -6.499401092529297, "global_step": 125063, "epoch": 2977} {"train_loss": -6.549694061279297, "global_step": 125064, "epoch": 2977} {"train_loss": -6.448351860046387, "global_step": 125065, "epoch": 2977} {"train_loss": -6.414921283721924, "global_step": 125066, "epoch": 2977} {"train_loss": -6.4677205085754395, "global_step": 125067, "epoch": 2977} {"train_loss": -6.314545631408691, "global_step": 125068, "epoch": 2977} {"train_loss": -6.6158061027526855, "global_step": 125069, "epoch": 2977} {"train_loss": -6.539307594299316, "global_step": 125070, "epoch": 2977} {"train_loss": -6.465559005737305, "global_step": 125071, "epoch": 2977} {"train_loss": -6.570591926574707, "global_step": 125072, "epoch": 2977} {"train_loss": -6.503926753997803, "global_step": 125073, "epoch": 2977} {"train_loss": -6.618507385253906, "global_step": 125074, "epoch": 2977} {"train_loss": -6.559953224091303, "global_step": 125075, "epoch": 2977, "val_loss": 68049.9296875} {"train_loss": -6.48520565032959, "global_step": 125076, "epoch": 2978} {"train_loss": -6.5723185539245605, "global_step": 125077, "epoch": 2978} {"train_loss": -6.542868137359619, "global_step": 125078, "epoch": 2978} {"train_loss": -6.565546989440918, "global_step": 125079, "epoch": 2978} {"train_loss": -6.572887420654297, "global_step": 125080, "epoch": 2978} {"train_loss": -6.5106096267700195, "global_step": 125081, "epoch": 2978} {"train_loss": -6.438143253326416, "global_step": 125082, "epoch": 2978} {"train_loss": -6.523586273193359, "global_step": 125083, "epoch": 2978} {"train_loss": -6.534080505371094, "global_step": 125084, "epoch": 2978} {"train_loss": -6.640807151794434, "global_step": 125085, "epoch": 2978} {"train_loss": -6.495984077453613, "global_step": 125086, "epoch": 2978} {"train_loss": -6.486299991607666, "global_step": 125087, "epoch": 2978} {"train_loss": -6.511073112487793, "global_step": 125088, "epoch": 2978} {"train_loss": -6.5760626792907715, "global_step": 125089, "epoch": 2978} {"train_loss": -6.571652412414551, "global_step": 125090, "epoch": 2978} {"train_loss": -6.482447147369385, "global_step": 125091, "epoch": 2978} {"train_loss": -6.583345413208008, "global_step": 125092, "epoch": 2978} {"train_loss": -6.542805194854736, "global_step": 125093, "epoch": 2978} {"train_loss": -6.611734867095947, "global_step": 125094, "epoch": 2978} {"train_loss": -6.636828899383545, "global_step": 125095, "epoch": 2978} {"train_loss": -6.404360294342041, "global_step": 125096, "epoch": 2978} {"train_loss": -6.552439212799072, "global_step": 125097, "epoch": 2978} {"train_loss": -6.523675918579102, "global_step": 125098, "epoch": 2978} {"train_loss": -6.4896345138549805, "global_step": 125099, "epoch": 2978} {"train_loss": -6.624638557434082, "global_step": 125100, "epoch": 2978} {"train_loss": -6.479575157165527, "global_step": 125101, "epoch": 2978} {"train_loss": -6.527771472930908, "global_step": 125102, "epoch": 2978} {"train_loss": -6.619752883911133, "global_step": 125103, "epoch": 2978} {"train_loss": -6.566242218017578, "global_step": 125104, "epoch": 2978} {"train_loss": -6.600846290588379, "global_step": 125105, "epoch": 2978} {"train_loss": -6.531524181365967, "global_step": 125106, "epoch": 2978} {"train_loss": -6.513982772827148, "global_step": 125107, "epoch": 2978} {"train_loss": -6.638036727905273, "global_step": 125108, "epoch": 2978} {"train_loss": -6.659344673156738, "global_step": 125109, "epoch": 2978} {"train_loss": -6.568194389343262, "global_step": 125110, "epoch": 2978} {"train_loss": -6.664862155914307, "global_step": 125111, "epoch": 2978} {"train_loss": -6.649387359619141, "global_step": 125112, "epoch": 2978} {"train_loss": -6.545297622680664, "global_step": 125113, "epoch": 2978} {"train_loss": -6.675386428833008, "global_step": 125114, "epoch": 2978} {"train_loss": -6.5561418533325195, "global_step": 125115, "epoch": 2978} {"train_loss": -6.478106498718262, "global_step": 125116, "epoch": 2978} {"train_loss": -6.556631962458293, "global_step": 125117, "epoch": 2978, "val_loss": 67913.6015625} {"train_loss": -6.611187934875488, "global_step": 125118, "epoch": 2979} {"train_loss": -6.545953750610352, "global_step": 125119, "epoch": 2979} {"train_loss": -6.555011749267578, "global_step": 125120, "epoch": 2979} {"train_loss": -6.7142438888549805, "global_step": 125121, "epoch": 2979} {"train_loss": -6.768466472625732, "global_step": 125122, "epoch": 2979} {"train_loss": -6.688658714294434, "global_step": 125123, "epoch": 2979} {"train_loss": -6.568774700164795, "global_step": 125124, "epoch": 2979} {"train_loss": -6.609569072723389, "global_step": 125125, "epoch": 2979} {"train_loss": -6.559791564941406, "global_step": 125126, "epoch": 2979} {"train_loss": -6.62856388092041, "global_step": 125127, "epoch": 2979} {"train_loss": -6.5526909828186035, "global_step": 125128, "epoch": 2979} {"train_loss": -6.5940375328063965, "global_step": 125129, "epoch": 2979} {"train_loss": -6.585264205932617, "global_step": 125130, "epoch": 2979} {"train_loss": -6.703668594360352, "global_step": 125131, "epoch": 2979} {"train_loss": -6.488341331481934, "global_step": 125132, "epoch": 2979} {"train_loss": -6.712522506713867, "global_step": 125133, "epoch": 2979} {"train_loss": -6.602149963378906, "global_step": 125134, "epoch": 2979} {"train_loss": -6.578535079956055, "global_step": 125135, "epoch": 2979} {"train_loss": -6.637743949890137, "global_step": 125136, "epoch": 2979} {"train_loss": -6.670957565307617, "global_step": 125137, "epoch": 2979} {"train_loss": -6.626013278961182, "global_step": 125138, "epoch": 2979} {"train_loss": -6.577569007873535, "global_step": 125139, "epoch": 2979} {"train_loss": -6.554259300231934, "global_step": 125140, "epoch": 2979} {"train_loss": -6.701282501220703, "global_step": 125141, "epoch": 2979} {"train_loss": -6.628023147583008, "global_step": 125142, "epoch": 2979} {"train_loss": -6.604440212249756, "global_step": 125143, "epoch": 2979} {"train_loss": -6.678109169006348, "global_step": 125144, "epoch": 2979} {"train_loss": -6.639669418334961, "global_step": 125145, "epoch": 2979} {"train_loss": -6.678596496582031, "global_step": 125146, "epoch": 2979} {"train_loss": -6.51784610748291, "global_step": 125147, "epoch": 2979} {"train_loss": -6.617559909820557, "global_step": 125148, "epoch": 2979} {"train_loss": -6.522593975067139, "global_step": 125149, "epoch": 2979} {"train_loss": -6.609668731689453, "global_step": 125150, "epoch": 2979} {"train_loss": -6.558596134185791, "global_step": 125151, "epoch": 2979} {"train_loss": -6.6123809814453125, "global_step": 125152, "epoch": 2979} {"train_loss": -6.622420310974121, "global_step": 125153, "epoch": 2979} {"train_loss": -6.608332633972168, "global_step": 125154, "epoch": 2979} {"train_loss": -6.518064022064209, "global_step": 125155, "epoch": 2979} {"train_loss": -6.630177021026611, "global_step": 125156, "epoch": 2979} {"train_loss": -6.55959415435791, "global_step": 125157, "epoch": 2979} {"train_loss": -6.630650520324707, "global_step": 125158, "epoch": 2979} {"train_loss": -6.610814696266537, "global_step": 125159, "epoch": 2979, "val_loss": 68199.53125} {"train_loss": -6.618659019470215, "global_step": 125160, "epoch": 2980} {"train_loss": -6.617710590362549, "global_step": 125161, "epoch": 2980} {"train_loss": -6.657253742218018, "global_step": 125162, "epoch": 2980} {"train_loss": -6.497309684753418, "global_step": 125163, "epoch": 2980} {"train_loss": -6.471978187561035, "global_step": 125164, "epoch": 2980} {"train_loss": -6.395277500152588, "global_step": 125165, "epoch": 2980} {"train_loss": -6.55694580078125, "global_step": 125166, "epoch": 2980} {"train_loss": -6.54757833480835, "global_step": 125167, "epoch": 2980} {"train_loss": -6.537982940673828, "global_step": 125168, "epoch": 2980} {"train_loss": -6.448119163513184, "global_step": 125169, "epoch": 2980} {"train_loss": -6.492237091064453, "global_step": 125170, "epoch": 2980} {"train_loss": -6.497987747192383, "global_step": 125171, "epoch": 2980} {"train_loss": -6.537075996398926, "global_step": 125172, "epoch": 2980} {"train_loss": -6.5656819343566895, "global_step": 125173, "epoch": 2980} {"train_loss": -6.511882305145264, "global_step": 125174, "epoch": 2980} {"train_loss": -6.559610843658447, "global_step": 125175, "epoch": 2980} {"train_loss": -6.598756790161133, "global_step": 125176, "epoch": 2980} {"train_loss": -6.548479080200195, "global_step": 125177, "epoch": 2980} {"train_loss": -6.518938064575195, "global_step": 125178, "epoch": 2980} {"train_loss": -6.480704307556152, "global_step": 125179, "epoch": 2980} {"train_loss": -6.604833126068115, "global_step": 125180, "epoch": 2980} {"train_loss": -6.55885648727417, "global_step": 125181, "epoch": 2980} {"train_loss": -6.488334655761719, "global_step": 125182, "epoch": 2980} {"train_loss": -6.483869552612305, "global_step": 125183, "epoch": 2980} {"train_loss": -6.4839372634887695, "global_step": 125184, "epoch": 2980} {"train_loss": -6.555891036987305, "global_step": 125185, "epoch": 2980} {"train_loss": -6.438713550567627, "global_step": 125186, "epoch": 2980} {"train_loss": -6.572450637817383, "global_step": 125187, "epoch": 2980} {"train_loss": -6.529915809631348, "global_step": 125188, "epoch": 2980} {"train_loss": -6.490511417388916, "global_step": 125189, "epoch": 2980} {"train_loss": -6.523920059204102, "global_step": 125190, "epoch": 2980} {"train_loss": -6.451772689819336, "global_step": 125191, "epoch": 2980} {"train_loss": -6.633126258850098, "global_step": 125192, "epoch": 2980} {"train_loss": -6.536205768585205, "global_step": 125193, "epoch": 2980} {"train_loss": -6.41641902923584, "global_step": 125194, "epoch": 2980} {"train_loss": -6.573034286499023, "global_step": 125195, "epoch": 2980} {"train_loss": -6.5521721839904785, "global_step": 125196, "epoch": 2980} {"train_loss": -6.510636806488037, "global_step": 125197, "epoch": 2980} {"train_loss": -6.482505798339844, "global_step": 125198, "epoch": 2980} {"train_loss": -6.469055652618408, "global_step": 125199, "epoch": 2980} {"train_loss": -6.546177864074707, "global_step": 125200, "epoch": 2980} {"train_loss": -6.52726285798209, "global_step": 125201, "epoch": 2980, "val_loss": 67999.7265625} {"train_loss": -6.605045795440674, "global_step": 125202, "epoch": 2981} {"train_loss": -6.526037216186523, "global_step": 125203, "epoch": 2981} {"train_loss": -6.526324272155762, "global_step": 125204, "epoch": 2981} {"train_loss": -6.57681131362915, "global_step": 125205, "epoch": 2981} {"train_loss": -6.6523847579956055, "global_step": 125206, "epoch": 2981} {"train_loss": -6.489614963531494, "global_step": 125207, "epoch": 2981} {"train_loss": -6.632720947265625, "global_step": 125208, "epoch": 2981} {"train_loss": -6.627439498901367, "global_step": 125209, "epoch": 2981} {"train_loss": -6.5114521980285645, "global_step": 125210, "epoch": 2981} {"train_loss": -6.639928340911865, "global_step": 125211, "epoch": 2981} {"train_loss": -6.425340175628662, "global_step": 125212, "epoch": 2981} {"train_loss": -6.607263088226318, "global_step": 125213, "epoch": 2981} {"train_loss": -6.52255916595459, "global_step": 125214, "epoch": 2981} {"train_loss": -6.546623229980469, "global_step": 125215, "epoch": 2981} {"train_loss": -6.572725772857666, "global_step": 125216, "epoch": 2981} {"train_loss": -6.466350078582764, "global_step": 125217, "epoch": 2981} {"train_loss": -6.547488212585449, "global_step": 125218, "epoch": 2981} {"train_loss": -6.633993148803711, "global_step": 125219, "epoch": 2981} {"train_loss": -6.4792680740356445, "global_step": 125220, "epoch": 2981} {"train_loss": -6.691378593444824, "global_step": 125221, "epoch": 2981} {"train_loss": -6.535464286804199, "global_step": 125222, "epoch": 2981} {"train_loss": -6.507274627685547, "global_step": 125223, "epoch": 2981} {"train_loss": -6.675562381744385, "global_step": 125224, "epoch": 2981} {"train_loss": -6.411197662353516, "global_step": 125225, "epoch": 2981} {"train_loss": -6.511453628540039, "global_step": 125226, "epoch": 2981} {"train_loss": -6.5589494705200195, "global_step": 125227, "epoch": 2981} {"train_loss": -6.513123035430908, "global_step": 125228, "epoch": 2981} {"train_loss": -6.514108657836914, "global_step": 125229, "epoch": 2981} {"train_loss": -6.522607326507568, "global_step": 125230, "epoch": 2981} {"train_loss": -6.525164604187012, "global_step": 125231, "epoch": 2981} {"train_loss": -6.468250274658203, "global_step": 125232, "epoch": 2981} {"train_loss": -6.424537658691406, "global_step": 125233, "epoch": 2981} {"train_loss": -6.471457481384277, "global_step": 125234, "epoch": 2981} {"train_loss": -6.596077919006348, "global_step": 125235, "epoch": 2981} {"train_loss": -6.641200065612793, "global_step": 125236, "epoch": 2981} {"train_loss": -6.50653600692749, "global_step": 125237, "epoch": 2981} {"train_loss": -6.576432228088379, "global_step": 125238, "epoch": 2981} {"train_loss": -6.574713706970215, "global_step": 125239, "epoch": 2981} {"train_loss": -6.579166412353516, "global_step": 125240, "epoch": 2981} {"train_loss": -6.593730926513672, "global_step": 125241, "epoch": 2981} {"train_loss": -6.438831806182861, "global_step": 125242, "epoch": 2981} {"train_loss": -6.547333478927612, "global_step": 125243, "epoch": 2981, "val_loss": 67914.9140625} {"train_loss": -6.553245544433594, "global_step": 125244, "epoch": 2982} {"train_loss": -6.570878028869629, "global_step": 125245, "epoch": 2982} {"train_loss": -6.623732089996338, "global_step": 125246, "epoch": 2982} {"train_loss": -6.471906661987305, "global_step": 125247, "epoch": 2982} {"train_loss": -6.4544477462768555, "global_step": 125248, "epoch": 2982} {"train_loss": -6.5056939125061035, "global_step": 125249, "epoch": 2982} {"train_loss": -6.458191871643066, "global_step": 125250, "epoch": 2982} {"train_loss": -6.506113052368164, "global_step": 125251, "epoch": 2982} {"train_loss": -6.6179986000061035, "global_step": 125252, "epoch": 2982} {"train_loss": -6.479833126068115, "global_step": 125253, "epoch": 2982} {"train_loss": -6.546966075897217, "global_step": 125254, "epoch": 2982} {"train_loss": -6.4865922927856445, "global_step": 125255, "epoch": 2982} {"train_loss": -6.4734320640563965, "global_step": 125256, "epoch": 2982} {"train_loss": -6.473917007446289, "global_step": 125257, "epoch": 2982} {"train_loss": -6.470807075500488, "global_step": 125258, "epoch": 2982} {"train_loss": -6.555443286895752, "global_step": 125259, "epoch": 2982} {"train_loss": -6.538300514221191, "global_step": 125260, "epoch": 2982} {"train_loss": -6.578728199005127, "global_step": 125261, "epoch": 2982} {"train_loss": -6.57578182220459, "global_step": 125262, "epoch": 2982} {"train_loss": -6.538443565368652, "global_step": 125263, "epoch": 2982} {"train_loss": -6.565473556518555, "global_step": 125264, "epoch": 2982} {"train_loss": -6.609156608581543, "global_step": 125265, "epoch": 2982} {"train_loss": -6.506237983703613, "global_step": 125266, "epoch": 2982} {"train_loss": -6.535167217254639, "global_step": 125267, "epoch": 2982} {"train_loss": -6.584181785583496, "global_step": 125268, "epoch": 2982} {"train_loss": -6.5776262283325195, "global_step": 125269, "epoch": 2982} {"train_loss": -6.563977241516113, "global_step": 125270, "epoch": 2982} {"train_loss": -6.499086856842041, "global_step": 125271, "epoch": 2982} {"train_loss": -6.586006164550781, "global_step": 125272, "epoch": 2982} {"train_loss": -6.616950988769531, "global_step": 125273, "epoch": 2982} {"train_loss": -6.595327854156494, "global_step": 125274, "epoch": 2982} {"train_loss": -6.509812355041504, "global_step": 125275, "epoch": 2982} {"train_loss": -6.521310806274414, "global_step": 125276, "epoch": 2982} {"train_loss": -6.609869480133057, "global_step": 125277, "epoch": 2982} {"train_loss": -6.485333442687988, "global_step": 125278, "epoch": 2982} {"train_loss": -6.543190002441406, "global_step": 125279, "epoch": 2982} {"train_loss": -6.6354756355285645, "global_step": 125280, "epoch": 2982} {"train_loss": -6.481982231140137, "global_step": 125281, "epoch": 2982} {"train_loss": -6.562629699707031, "global_step": 125282, "epoch": 2982} {"train_loss": -6.565411567687988, "global_step": 125283, "epoch": 2982} {"train_loss": -6.467378616333008, "global_step": 125284, "epoch": 2982} {"train_loss": -6.5368416877019975, "global_step": 125285, "epoch": 2982, "val_loss": 68301.0078125} {"train_loss": -6.507908344268799, "global_step": 125286, "epoch": 2983} {"train_loss": -6.626210689544678, "global_step": 125287, "epoch": 2983} {"train_loss": -6.590170383453369, "global_step": 125288, "epoch": 2983} {"train_loss": -6.559115409851074, "global_step": 125289, "epoch": 2983} {"train_loss": -6.659705638885498, "global_step": 125290, "epoch": 2983} {"train_loss": -6.580910682678223, "global_step": 125291, "epoch": 2983} {"train_loss": -6.667705535888672, "global_step": 125292, "epoch": 2983} {"train_loss": -6.542923927307129, "global_step": 125293, "epoch": 2983} {"train_loss": -6.591672897338867, "global_step": 125294, "epoch": 2983} {"train_loss": -6.57011604309082, "global_step": 125295, "epoch": 2983} {"train_loss": -6.647153854370117, "global_step": 125296, "epoch": 2983} {"train_loss": -6.5166168212890625, "global_step": 125297, "epoch": 2983} {"train_loss": -6.591312885284424, "global_step": 125298, "epoch": 2983} {"train_loss": -6.533198356628418, "global_step": 125299, "epoch": 2983} {"train_loss": -6.444634437561035, "global_step": 125300, "epoch": 2983} {"train_loss": -6.526483058929443, "global_step": 125301, "epoch": 2983} {"train_loss": -6.755358695983887, "global_step": 125302, "epoch": 2983} {"train_loss": -6.545876502990723, "global_step": 125303, "epoch": 2983} {"train_loss": -6.589686870574951, "global_step": 125304, "epoch": 2983} {"train_loss": -6.691431999206543, "global_step": 125305, "epoch": 2983} {"train_loss": -6.437265396118164, "global_step": 125306, "epoch": 2983} {"train_loss": -6.5386247634887695, "global_step": 125307, "epoch": 2983} {"train_loss": -6.636186599731445, "global_step": 125308, "epoch": 2983} {"train_loss": -6.613455772399902, "global_step": 125309, "epoch": 2983} {"train_loss": -6.552166938781738, "global_step": 125310, "epoch": 2983} {"train_loss": -6.4993109703063965, "global_step": 125311, "epoch": 2983} {"train_loss": -6.616156578063965, "global_step": 125312, "epoch": 2983} {"train_loss": -6.666419982910156, "global_step": 125313, "epoch": 2983} {"train_loss": -6.581516265869141, "global_step": 125314, "epoch": 2983} {"train_loss": -6.50474739074707, "global_step": 125315, "epoch": 2983} {"train_loss": -6.574948310852051, "global_step": 125316, "epoch": 2983} {"train_loss": -6.507250785827637, "global_step": 125317, "epoch": 2983} {"train_loss": -6.517757415771484, "global_step": 125318, "epoch": 2983} {"train_loss": -6.627573490142822, "global_step": 125319, "epoch": 2983} {"train_loss": -6.491065979003906, "global_step": 125320, "epoch": 2983} {"train_loss": -6.488437175750732, "global_step": 125321, "epoch": 2983} {"train_loss": -6.654855728149414, "global_step": 125322, "epoch": 2983} {"train_loss": -6.512134552001953, "global_step": 125323, "epoch": 2983} {"train_loss": -6.558313369750977, "global_step": 125324, "epoch": 2983} {"train_loss": -6.591590404510498, "global_step": 125325, "epoch": 2983} {"train_loss": -6.595379829406738, "global_step": 125326, "epoch": 2983} {"train_loss": -6.5720171474275135, "global_step": 125327, "epoch": 2983, "val_loss": 68168.2578125} {"train_loss": -6.48491096496582, "global_step": 125328, "epoch": 2984} {"train_loss": -6.6088995933532715, "global_step": 125329, "epoch": 2984} {"train_loss": -6.476487159729004, "global_step": 125330, "epoch": 2984} {"train_loss": -6.50421142578125, "global_step": 125331, "epoch": 2984} {"train_loss": -6.555285930633545, "global_step": 125332, "epoch": 2984} {"train_loss": -6.548704147338867, "global_step": 125333, "epoch": 2984} {"train_loss": -6.547402858734131, "global_step": 125334, "epoch": 2984} {"train_loss": -6.670914173126221, "global_step": 125335, "epoch": 2984} {"train_loss": -6.4581708908081055, "global_step": 125336, "epoch": 2984} {"train_loss": -6.6094512939453125, "global_step": 125337, "epoch": 2984} {"train_loss": -6.547428607940674, "global_step": 125338, "epoch": 2984} {"train_loss": -6.57362174987793, "global_step": 125339, "epoch": 2984} {"train_loss": -6.5690507888793945, "global_step": 125340, "epoch": 2984} {"train_loss": -6.511903762817383, "global_step": 125341, "epoch": 2984} {"train_loss": -6.495295524597168, "global_step": 125342, "epoch": 2984} {"train_loss": -6.532788276672363, "global_step": 125343, "epoch": 2984} {"train_loss": -6.537887096405029, "global_step": 125344, "epoch": 2984} {"train_loss": -6.558622360229492, "global_step": 125345, "epoch": 2984} {"train_loss": -6.618552207946777, "global_step": 125346, "epoch": 2984} {"train_loss": -6.58252477645874, "global_step": 125347, "epoch": 2984} {"train_loss": -6.501359939575195, "global_step": 125348, "epoch": 2984} {"train_loss": -6.585008144378662, "global_step": 125349, "epoch": 2984} {"train_loss": -6.478107452392578, "global_step": 125350, "epoch": 2984} {"train_loss": -6.589466094970703, "global_step": 125351, "epoch": 2984} {"train_loss": -6.48738956451416, "global_step": 125352, "epoch": 2984} {"train_loss": -6.611003875732422, "global_step": 125353, "epoch": 2984} {"train_loss": -6.399998188018799, "global_step": 125354, "epoch": 2984} {"train_loss": -6.562127590179443, "global_step": 125355, "epoch": 2984} {"train_loss": -6.467574119567871, "global_step": 125356, "epoch": 2984} {"train_loss": -6.546195030212402, "global_step": 125357, "epoch": 2984} {"train_loss": -6.602766036987305, "global_step": 125358, "epoch": 2984} {"train_loss": -6.544674396514893, "global_step": 125359, "epoch": 2984} {"train_loss": -6.639514446258545, "global_step": 125360, "epoch": 2984} {"train_loss": -6.51035737991333, "global_step": 125361, "epoch": 2984} {"train_loss": -6.478940010070801, "global_step": 125362, "epoch": 2984} {"train_loss": -6.553870677947998, "global_step": 125363, "epoch": 2984} {"train_loss": -6.575014114379883, "global_step": 125364, "epoch": 2984} {"train_loss": -6.589869976043701, "global_step": 125365, "epoch": 2984} {"train_loss": -6.656238555908203, "global_step": 125366, "epoch": 2984} {"train_loss": -6.647823810577393, "global_step": 125367, "epoch": 2984} {"train_loss": -6.564873695373535, "global_step": 125368, "epoch": 2984} {"train_loss": -6.552805707568214, "global_step": 125369, "epoch": 2984, "val_loss": 67929.5078125} {"train_loss": -6.485072135925293, "global_step": 125370, "epoch": 2985} {"train_loss": -6.561020851135254, "global_step": 125371, "epoch": 2985} {"train_loss": -6.61591911315918, "global_step": 125372, "epoch": 2985} {"train_loss": -6.598115921020508, "global_step": 125373, "epoch": 2985} {"train_loss": -6.539621829986572, "global_step": 125374, "epoch": 2985} {"train_loss": -6.6144866943359375, "global_step": 125375, "epoch": 2985} {"train_loss": -6.688849449157715, "global_step": 125376, "epoch": 2985} {"train_loss": -6.659246444702148, "global_step": 125377, "epoch": 2985} {"train_loss": -6.585180282592773, "global_step": 125378, "epoch": 2985} {"train_loss": -6.568836212158203, "global_step": 125379, "epoch": 2985} {"train_loss": -6.525565147399902, "global_step": 125380, "epoch": 2985} {"train_loss": -6.687793254852295, "global_step": 125381, "epoch": 2985} {"train_loss": -6.592525959014893, "global_step": 125382, "epoch": 2985} {"train_loss": -6.6400861740112305, "global_step": 125383, "epoch": 2985} {"train_loss": -6.706377029418945, "global_step": 125384, "epoch": 2985} {"train_loss": -6.65794038772583, "global_step": 125385, "epoch": 2985} {"train_loss": -6.66868782043457, "global_step": 125386, "epoch": 2985} {"train_loss": -6.560057640075684, "global_step": 125387, "epoch": 2985} {"train_loss": -6.668530464172363, "global_step": 125388, "epoch": 2985} {"train_loss": -6.562670707702637, "global_step": 125389, "epoch": 2985} {"train_loss": -6.712036609649658, "global_step": 125390, "epoch": 2985} {"train_loss": -6.538975715637207, "global_step": 125391, "epoch": 2985} {"train_loss": -6.581287384033203, "global_step": 125392, "epoch": 2985} {"train_loss": -6.5858917236328125, "global_step": 125393, "epoch": 2985} {"train_loss": -6.609220504760742, "global_step": 125394, "epoch": 2985} {"train_loss": -6.663463115692139, "global_step": 125395, "epoch": 2985} {"train_loss": -6.560579299926758, "global_step": 125396, "epoch": 2985} {"train_loss": -6.619248390197754, "global_step": 125397, "epoch": 2985} {"train_loss": -6.640285491943359, "global_step": 125398, "epoch": 2985} {"train_loss": -6.53288459777832, "global_step": 125399, "epoch": 2985} {"train_loss": -6.558527946472168, "global_step": 125400, "epoch": 2985} {"train_loss": -6.625723838806152, "global_step": 125401, "epoch": 2985} {"train_loss": -6.360811233520508, "global_step": 125402, "epoch": 2985} {"train_loss": -6.634952545166016, "global_step": 125403, "epoch": 2985} {"train_loss": -6.4729485511779785, "global_step": 125404, "epoch": 2985} {"train_loss": -6.625767707824707, "global_step": 125405, "epoch": 2985} {"train_loss": -6.568903923034668, "global_step": 125406, "epoch": 2985} {"train_loss": -6.558101177215576, "global_step": 125407, "epoch": 2985} {"train_loss": -6.555257320404053, "global_step": 125408, "epoch": 2985} {"train_loss": -6.518712043762207, "global_step": 125409, "epoch": 2985} {"train_loss": -6.546242713928223, "global_step": 125410, "epoch": 2985} {"train_loss": -6.59020091238476, "global_step": 125411, "epoch": 2985, "val_loss": 68185.765625} {"train_loss": -6.517101287841797, "global_step": 125412, "epoch": 2986} {"train_loss": -6.540990829467773, "global_step": 125413, "epoch": 2986} {"train_loss": -6.56058406829834, "global_step": 125414, "epoch": 2986} {"train_loss": -6.564258575439453, "global_step": 125415, "epoch": 2986} {"train_loss": -6.538791179656982, "global_step": 125416, "epoch": 2986} {"train_loss": -6.565390586853027, "global_step": 125417, "epoch": 2986} {"train_loss": -6.642439365386963, "global_step": 125418, "epoch": 2986} {"train_loss": -6.310620307922363, "global_step": 125419, "epoch": 2986} {"train_loss": -6.504570007324219, "global_step": 125420, "epoch": 2986} {"train_loss": -6.486856937408447, "global_step": 125421, "epoch": 2986} {"train_loss": -6.39528751373291, "global_step": 125422, "epoch": 2986} {"train_loss": -6.580625534057617, "global_step": 125423, "epoch": 2986} {"train_loss": -6.4777374267578125, "global_step": 125424, "epoch": 2986} {"train_loss": -6.476441860198975, "global_step": 125425, "epoch": 2986} {"train_loss": -6.5432634353637695, "global_step": 125426, "epoch": 2986} {"train_loss": -6.455113410949707, "global_step": 125427, "epoch": 2986} {"train_loss": -6.511708736419678, "global_step": 125428, "epoch": 2986} {"train_loss": -6.436849117279053, "global_step": 125429, "epoch": 2986} {"train_loss": -6.541110992431641, "global_step": 125430, "epoch": 2986} {"train_loss": -6.5810770988464355, "global_step": 125431, "epoch": 2986} {"train_loss": -6.657616138458252, "global_step": 125432, "epoch": 2986} {"train_loss": -6.430562973022461, "global_step": 125433, "epoch": 2986} {"train_loss": -6.512651443481445, "global_step": 125434, "epoch": 2986} {"train_loss": -6.638531684875488, "global_step": 125435, "epoch": 2986} {"train_loss": -6.566333293914795, "global_step": 125436, "epoch": 2986} {"train_loss": -6.644902229309082, "global_step": 125437, "epoch": 2986} {"train_loss": -6.680867671966553, "global_step": 125438, "epoch": 2986} {"train_loss": -6.646501541137695, "global_step": 125439, "epoch": 2986} {"train_loss": -6.604665756225586, "global_step": 125440, "epoch": 2986} {"train_loss": -6.535483360290527, "global_step": 125441, "epoch": 2986} {"train_loss": -6.4806694984436035, "global_step": 125442, "epoch": 2986} {"train_loss": -6.50421142578125, "global_step": 125443, "epoch": 2986} {"train_loss": -6.607311725616455, "global_step": 125444, "epoch": 2986} {"train_loss": -6.612471103668213, "global_step": 125445, "epoch": 2986} {"train_loss": -6.561586380004883, "global_step": 125446, "epoch": 2986} {"train_loss": -6.545218467712402, "global_step": 125447, "epoch": 2986} {"train_loss": -6.521800518035889, "global_step": 125448, "epoch": 2986} {"train_loss": -6.521175861358643, "global_step": 125449, "epoch": 2986} {"train_loss": -6.5490803718566895, "global_step": 125450, "epoch": 2986} {"train_loss": -6.573629379272461, "global_step": 125451, "epoch": 2986} {"train_loss": -6.540328025817871, "global_step": 125452, "epoch": 2986} {"train_loss": -6.541474887302944, "global_step": 125453, "epoch": 2986, "val_loss": 68113.9609375} {"train_loss": -6.570703983306885, "global_step": 125454, "epoch": 2987} {"train_loss": -6.609604358673096, "global_step": 125455, "epoch": 2987} {"train_loss": -6.609046936035156, "global_step": 125456, "epoch": 2987} {"train_loss": -6.623236179351807, "global_step": 125457, "epoch": 2987} {"train_loss": -6.562094688415527, "global_step": 125458, "epoch": 2987} {"train_loss": -6.658254623413086, "global_step": 125459, "epoch": 2987} {"train_loss": -6.56791877746582, "global_step": 125460, "epoch": 2987} {"train_loss": -6.607658386230469, "global_step": 125461, "epoch": 2987} {"train_loss": -6.717914581298828, "global_step": 125462, "epoch": 2987} {"train_loss": -6.527383804321289, "global_step": 125463, "epoch": 2987} {"train_loss": -6.632477760314941, "global_step": 125464, "epoch": 2987} {"train_loss": -6.621722221374512, "global_step": 125465, "epoch": 2987} {"train_loss": -6.610007286071777, "global_step": 125466, "epoch": 2987} {"train_loss": -6.631430625915527, "global_step": 125467, "epoch": 2987} {"train_loss": -6.656613349914551, "global_step": 125468, "epoch": 2987} {"train_loss": -6.622783660888672, "global_step": 125469, "epoch": 2987} {"train_loss": -6.623159408569336, "global_step": 125470, "epoch": 2987} {"train_loss": -6.683551788330078, "global_step": 125471, "epoch": 2987} {"train_loss": -6.603436470031738, "global_step": 125472, "epoch": 2987} {"train_loss": -6.598282337188721, "global_step": 125473, "epoch": 2987} {"train_loss": -6.617367744445801, "global_step": 125474, "epoch": 2987} {"train_loss": -6.663620948791504, "global_step": 125475, "epoch": 2987} {"train_loss": -6.709977149963379, "global_step": 125476, "epoch": 2987} {"train_loss": -6.459835052490234, "global_step": 125477, "epoch": 2987} {"train_loss": -6.617956161499023, "global_step": 125478, "epoch": 2987} {"train_loss": -6.5785298347473145, "global_step": 125479, "epoch": 2987} {"train_loss": -6.55464506149292, "global_step": 125480, "epoch": 2987} {"train_loss": -6.577189922332764, "global_step": 125481, "epoch": 2987} {"train_loss": -6.554553031921387, "global_step": 125482, "epoch": 2987} {"train_loss": -6.641338348388672, "global_step": 125483, "epoch": 2987} {"train_loss": -6.548449516296387, "global_step": 125484, "epoch": 2987} {"train_loss": -6.5854291915893555, "global_step": 125485, "epoch": 2987} {"train_loss": -6.668529510498047, "global_step": 125486, "epoch": 2987} {"train_loss": -6.547299861907959, "global_step": 125487, "epoch": 2987} {"train_loss": -6.606448650360107, "global_step": 125488, "epoch": 2987} {"train_loss": -6.554635524749756, "global_step": 125489, "epoch": 2987} {"train_loss": -6.502911567687988, "global_step": 125490, "epoch": 2987} {"train_loss": -6.6230058670043945, "global_step": 125491, "epoch": 2987} {"train_loss": -6.677083969116211, "global_step": 125492, "epoch": 2987} {"train_loss": -6.550673007965088, "global_step": 125493, "epoch": 2987} {"train_loss": -6.487455368041992, "global_step": 125494, "epoch": 2987} {"train_loss": -6.599582581293015, "global_step": 125495, "epoch": 2987, "val_loss": 68137.3046875} {"train_loss": -6.605222702026367, "global_step": 125496, "epoch": 2988} {"train_loss": -6.653295516967773, "global_step": 125497, "epoch": 2988} {"train_loss": -6.594256401062012, "global_step": 125498, "epoch": 2988} {"train_loss": -6.693090915679932, "global_step": 125499, "epoch": 2988} {"train_loss": -6.542031288146973, "global_step": 125500, "epoch": 2988} {"train_loss": -6.726656436920166, "global_step": 125501, "epoch": 2988} {"train_loss": -6.621506690979004, "global_step": 125502, "epoch": 2988} {"train_loss": -6.5553131103515625, "global_step": 125503, "epoch": 2988} {"train_loss": -6.60835075378418, "global_step": 125504, "epoch": 2988} {"train_loss": -6.640419960021973, "global_step": 125505, "epoch": 2988} {"train_loss": -6.560194969177246, "global_step": 125506, "epoch": 2988} {"train_loss": -6.648780822753906, "global_step": 125507, "epoch": 2988} {"train_loss": -6.7060747146606445, "global_step": 125508, "epoch": 2988} {"train_loss": -6.650824546813965, "global_step": 125509, "epoch": 2988} {"train_loss": -6.589827060699463, "global_step": 125510, "epoch": 2988} {"train_loss": -6.608538627624512, "global_step": 125511, "epoch": 2988} {"train_loss": -6.562732219696045, "global_step": 125512, "epoch": 2988} {"train_loss": -6.70526123046875, "global_step": 125513, "epoch": 2988} {"train_loss": -6.581112861633301, "global_step": 125514, "epoch": 2988} {"train_loss": -6.509091377258301, "global_step": 125515, "epoch": 2988} {"train_loss": -6.700403213500977, "global_step": 125516, "epoch": 2988} {"train_loss": -6.480349063873291, "global_step": 125517, "epoch": 2988} {"train_loss": -6.430852890014648, "global_step": 125518, "epoch": 2988} {"train_loss": -6.5203962326049805, "global_step": 125519, "epoch": 2988} {"train_loss": -6.569704055786133, "global_step": 125520, "epoch": 2988} {"train_loss": -6.4618635177612305, "global_step": 125521, "epoch": 2988} {"train_loss": -6.781582355499268, "global_step": 125522, "epoch": 2988} {"train_loss": -6.616034030914307, "global_step": 125523, "epoch": 2988} {"train_loss": -6.685632705688477, "global_step": 125524, "epoch": 2988} {"train_loss": -6.585165977478027, "global_step": 125525, "epoch": 2988} {"train_loss": -6.566936016082764, "global_step": 125526, "epoch": 2988} {"train_loss": -6.371211528778076, "global_step": 125527, "epoch": 2988} {"train_loss": -6.527663230895996, "global_step": 125528, "epoch": 2988} {"train_loss": -6.529711723327637, "global_step": 125529, "epoch": 2988} {"train_loss": -6.553488731384277, "global_step": 125530, "epoch": 2988} {"train_loss": -6.5392303466796875, "global_step": 125531, "epoch": 2988} {"train_loss": -6.490772724151611, "global_step": 125532, "epoch": 2988} {"train_loss": -6.455716133117676, "global_step": 125533, "epoch": 2988} {"train_loss": -6.535862445831299, "global_step": 125534, "epoch": 2988} {"train_loss": -6.564050674438477, "global_step": 125535, "epoch": 2988} {"train_loss": -6.403576850891113, "global_step": 125536, "epoch": 2988} {"train_loss": -6.5775807698567705, "global_step": 125537, "epoch": 2988, "val_loss": 68252.96875} {"train_loss": -6.4785871505737305, "global_step": 125538, "epoch": 2989} {"train_loss": -6.619882583618164, "global_step": 125539, "epoch": 2989} {"train_loss": -6.514188289642334, "global_step": 125540, "epoch": 2989} {"train_loss": -6.4576921463012695, "global_step": 125541, "epoch": 2989} {"train_loss": -6.58221960067749, "global_step": 125542, "epoch": 2989} {"train_loss": -6.531291484832764, "global_step": 125543, "epoch": 2989} {"train_loss": -6.551167011260986, "global_step": 125544, "epoch": 2989} {"train_loss": -6.626800537109375, "global_step": 125545, "epoch": 2989} {"train_loss": -6.562104225158691, "global_step": 125546, "epoch": 2989} {"train_loss": -6.692659378051758, "global_step": 125547, "epoch": 2989} {"train_loss": -6.599817276000977, "global_step": 125548, "epoch": 2989} {"train_loss": -6.488553047180176, "global_step": 125549, "epoch": 2989} {"train_loss": -6.514411926269531, "global_step": 125550, "epoch": 2989} {"train_loss": -6.579464435577393, "global_step": 125551, "epoch": 2989} {"train_loss": -6.668704509735107, "global_step": 125552, "epoch": 2989} {"train_loss": -6.5477800369262695, "global_step": 125553, "epoch": 2989} {"train_loss": -6.620053768157959, "global_step": 125554, "epoch": 2989} {"train_loss": -6.590524673461914, "global_step": 125555, "epoch": 2989} {"train_loss": -6.630107879638672, "global_step": 125556, "epoch": 2989} {"train_loss": -6.559805870056152, "global_step": 125557, "epoch": 2989} {"train_loss": -6.584983825683594, "global_step": 125558, "epoch": 2989} {"train_loss": -6.54157829284668, "global_step": 125559, "epoch": 2989} {"train_loss": -6.709665775299072, "global_step": 125560, "epoch": 2989} {"train_loss": -6.555463790893555, "global_step": 125561, "epoch": 2989} {"train_loss": -6.468323707580566, "global_step": 125562, "epoch": 2989} {"train_loss": -6.617805480957031, "global_step": 125563, "epoch": 2989} {"train_loss": -6.51027774810791, "global_step": 125564, "epoch": 2989} {"train_loss": -6.585850715637207, "global_step": 125565, "epoch": 2989} {"train_loss": -6.617733478546143, "global_step": 125566, "epoch": 2989} {"train_loss": -6.548025131225586, "global_step": 125567, "epoch": 2989} {"train_loss": -6.543832778930664, "global_step": 125568, "epoch": 2989} {"train_loss": -6.505049228668213, "global_step": 125569, "epoch": 2989} {"train_loss": -6.487818717956543, "global_step": 125570, "epoch": 2989} {"train_loss": -6.60459041595459, "global_step": 125571, "epoch": 2989} {"train_loss": -6.572977066040039, "global_step": 125572, "epoch": 2989} {"train_loss": -6.662168502807617, "global_step": 125573, "epoch": 2989} {"train_loss": -6.582198143005371, "global_step": 125574, "epoch": 2989} {"train_loss": -6.483155250549316, "global_step": 125575, "epoch": 2989} {"train_loss": -6.63032865524292, "global_step": 125576, "epoch": 2989} {"train_loss": -6.665565490722656, "global_step": 125577, "epoch": 2989} {"train_loss": -6.525672435760498, "global_step": 125578, "epoch": 2989} {"train_loss": -6.571264312380836, "global_step": 125579, "epoch": 2989, "val_loss": 68025.109375} {"train_loss": -6.660866737365723, "global_step": 125580, "epoch": 2990} {"train_loss": -6.669185638427734, "global_step": 125581, "epoch": 2990} {"train_loss": -6.636745452880859, "global_step": 125582, "epoch": 2990} {"train_loss": -6.51516056060791, "global_step": 125583, "epoch": 2990} {"train_loss": -6.697498321533203, "global_step": 125584, "epoch": 2990} {"train_loss": -6.595863342285156, "global_step": 125585, "epoch": 2990} {"train_loss": -6.479597091674805, "global_step": 125586, "epoch": 2990} {"train_loss": -6.512301445007324, "global_step": 125587, "epoch": 2990} {"train_loss": -6.5124711990356445, "global_step": 125588, "epoch": 2990} {"train_loss": -6.520254135131836, "global_step": 125589, "epoch": 2990} {"train_loss": -6.519185543060303, "global_step": 125590, "epoch": 2990} {"train_loss": -6.465845108032227, "global_step": 125591, "epoch": 2990} {"train_loss": -6.631442070007324, "global_step": 125592, "epoch": 2990} {"train_loss": -6.643472194671631, "global_step": 125593, "epoch": 2990} {"train_loss": -6.530845642089844, "global_step": 125594, "epoch": 2990} {"train_loss": -6.524639129638672, "global_step": 125595, "epoch": 2990} {"train_loss": -6.481738090515137, "global_step": 125596, "epoch": 2990} {"train_loss": -6.502951622009277, "global_step": 125597, "epoch": 2990} {"train_loss": -6.642404079437256, "global_step": 125598, "epoch": 2990} {"train_loss": -6.544189929962158, "global_step": 125599, "epoch": 2990} {"train_loss": -6.603582382202148, "global_step": 125600, "epoch": 2990} {"train_loss": -6.561716079711914, "global_step": 125601, "epoch": 2990} {"train_loss": -6.543769359588623, "global_step": 125602, "epoch": 2990} {"train_loss": -6.59720516204834, "global_step": 125603, "epoch": 2990} {"train_loss": -6.584474086761475, "global_step": 125604, "epoch": 2990} {"train_loss": -6.556457996368408, "global_step": 125605, "epoch": 2990} {"train_loss": -6.578299522399902, "global_step": 125606, "epoch": 2990} {"train_loss": -6.559651851654053, "global_step": 125607, "epoch": 2990} {"train_loss": -6.721041202545166, "global_step": 125608, "epoch": 2990} {"train_loss": -6.697671413421631, "global_step": 125609, "epoch": 2990} {"train_loss": -6.659816265106201, "global_step": 125610, "epoch": 2990} {"train_loss": -6.672981262207031, "global_step": 125611, "epoch": 2990} {"train_loss": -6.508135795593262, "global_step": 125612, "epoch": 2990} {"train_loss": -6.698666572570801, "global_step": 125613, "epoch": 2990} {"train_loss": -6.499547004699707, "global_step": 125614, "epoch": 2990} {"train_loss": -6.626260757446289, "global_step": 125615, "epoch": 2990} {"train_loss": -6.55336856842041, "global_step": 125616, "epoch": 2990} {"train_loss": -6.501323699951172, "global_step": 125617, "epoch": 2990} {"train_loss": -6.681333541870117, "global_step": 125618, "epoch": 2990} {"train_loss": -6.600942134857178, "global_step": 125619, "epoch": 2990} {"train_loss": -6.505887985229492, "global_step": 125620, "epoch": 2990} {"train_loss": -6.5798758779253275, "global_step": 125621, "epoch": 2990, "val_loss": 68130.40625} {"train_loss": -6.617184638977051, "global_step": 125622, "epoch": 2991} {"train_loss": -6.515902042388916, "global_step": 125623, "epoch": 2991} {"train_loss": -6.493988037109375, "global_step": 125624, "epoch": 2991} {"train_loss": -6.63042688369751, "global_step": 125625, "epoch": 2991} {"train_loss": -6.660222053527832, "global_step": 125626, "epoch": 2991} {"train_loss": -6.5361785888671875, "global_step": 125627, "epoch": 2991} {"train_loss": -6.594531059265137, "global_step": 125628, "epoch": 2991} {"train_loss": -6.663654327392578, "global_step": 125629, "epoch": 2991} {"train_loss": -6.539219856262207, "global_step": 125630, "epoch": 2991} {"train_loss": -6.664393901824951, "global_step": 125631, "epoch": 2991} {"train_loss": -6.712961196899414, "global_step": 125632, "epoch": 2991} {"train_loss": -6.757134437561035, "global_step": 125633, "epoch": 2991} {"train_loss": -6.618549346923828, "global_step": 125634, "epoch": 2991} {"train_loss": -6.6714935302734375, "global_step": 125635, "epoch": 2991} {"train_loss": -6.60920524597168, "global_step": 125636, "epoch": 2991} {"train_loss": -6.566963195800781, "global_step": 125637, "epoch": 2991} {"train_loss": -6.7246479988098145, "global_step": 125638, "epoch": 2991} {"train_loss": -6.480737209320068, "global_step": 125639, "epoch": 2991} {"train_loss": -6.643636703491211, "global_step": 125640, "epoch": 2991} {"train_loss": -6.674909591674805, "global_step": 125641, "epoch": 2991} {"train_loss": -6.494877815246582, "global_step": 125642, "epoch": 2991} {"train_loss": -6.668954372406006, "global_step": 125643, "epoch": 2991} {"train_loss": -6.564478397369385, "global_step": 125644, "epoch": 2991} {"train_loss": -6.514430522918701, "global_step": 125645, "epoch": 2991} {"train_loss": -6.696073532104492, "global_step": 125646, "epoch": 2991} {"train_loss": -6.533215522766113, "global_step": 125647, "epoch": 2991} {"train_loss": -6.5082902908325195, "global_step": 125648, "epoch": 2991} {"train_loss": -6.60048770904541, "global_step": 125649, "epoch": 2991} {"train_loss": -6.673377990722656, "global_step": 125650, "epoch": 2991} {"train_loss": -6.500560283660889, "global_step": 125651, "epoch": 2991} {"train_loss": -6.633337497711182, "global_step": 125652, "epoch": 2991} {"train_loss": -6.658102989196777, "global_step": 125653, "epoch": 2991} {"train_loss": -6.527351379394531, "global_step": 125654, "epoch": 2991} {"train_loss": -6.692260265350342, "global_step": 125655, "epoch": 2991} {"train_loss": -6.461947441101074, "global_step": 125656, "epoch": 2991} {"train_loss": -6.669290542602539, "global_step": 125657, "epoch": 2991} {"train_loss": -6.503000259399414, "global_step": 125658, "epoch": 2991} {"train_loss": -6.670561790466309, "global_step": 125659, "epoch": 2991} {"train_loss": -6.699480056762695, "global_step": 125660, "epoch": 2991} {"train_loss": -6.517439365386963, "global_step": 125661, "epoch": 2991} {"train_loss": -6.686890125274658, "global_step": 125662, "epoch": 2991} {"train_loss": -6.605240220115299, "global_step": 125663, "epoch": 2991, "val_loss": 68066.2890625} {"train_loss": -6.760109901428223, "global_step": 125664, "epoch": 2992} {"train_loss": -6.629528522491455, "global_step": 125665, "epoch": 2992} {"train_loss": -6.577093124389648, "global_step": 125666, "epoch": 2992} {"train_loss": -6.657962799072266, "global_step": 125667, "epoch": 2992} {"train_loss": -6.563424587249756, "global_step": 125668, "epoch": 2992} {"train_loss": -6.631613254547119, "global_step": 125669, "epoch": 2992} {"train_loss": -6.625150203704834, "global_step": 125670, "epoch": 2992} {"train_loss": -6.528315544128418, "global_step": 125671, "epoch": 2992} {"train_loss": -6.535315036773682, "global_step": 125672, "epoch": 2992} {"train_loss": -6.593986511230469, "global_step": 125673, "epoch": 2992} {"train_loss": -6.605337142944336, "global_step": 125674, "epoch": 2992} {"train_loss": -6.485045909881592, "global_step": 125675, "epoch": 2992} {"train_loss": -6.482679843902588, "global_step": 125676, "epoch": 2992} {"train_loss": -6.4335479736328125, "global_step": 125677, "epoch": 2992} {"train_loss": -6.512955665588379, "global_step": 125678, "epoch": 2992} {"train_loss": -6.5508036613464355, "global_step": 125679, "epoch": 2992} {"train_loss": -6.573918342590332, "global_step": 125680, "epoch": 2992} {"train_loss": -6.530514717102051, "global_step": 125681, "epoch": 2992} {"train_loss": -6.491267204284668, "global_step": 125682, "epoch": 2992} {"train_loss": -6.537930488586426, "global_step": 125683, "epoch": 2992} {"train_loss": -6.709293365478516, "global_step": 125684, "epoch": 2992} {"train_loss": -6.520576477050781, "global_step": 125685, "epoch": 2992} {"train_loss": -6.613360404968262, "global_step": 125686, "epoch": 2992} {"train_loss": -6.565317630767822, "global_step": 125687, "epoch": 2992} {"train_loss": -6.600456237792969, "global_step": 125688, "epoch": 2992} {"train_loss": -6.598550796508789, "global_step": 125689, "epoch": 2992} {"train_loss": -6.68168830871582, "global_step": 125690, "epoch": 2992} {"train_loss": -6.464267253875732, "global_step": 125691, "epoch": 2992} {"train_loss": -6.552923679351807, "global_step": 125692, "epoch": 2992} {"train_loss": -6.618433952331543, "global_step": 125693, "epoch": 2992} {"train_loss": -6.568467617034912, "global_step": 125694, "epoch": 2992} {"train_loss": -6.64846134185791, "global_step": 125695, "epoch": 2992} {"train_loss": -6.587096691131592, "global_step": 125696, "epoch": 2992} {"train_loss": -6.60714864730835, "global_step": 125697, "epoch": 2992} {"train_loss": -6.60079288482666, "global_step": 125698, "epoch": 2992} {"train_loss": -6.581045150756836, "global_step": 125699, "epoch": 2992} {"train_loss": -6.626955509185791, "global_step": 125700, "epoch": 2992} {"train_loss": -6.655526161193848, "global_step": 125701, "epoch": 2992} {"train_loss": -6.693460464477539, "global_step": 125702, "epoch": 2992} {"train_loss": -6.662867069244385, "global_step": 125703, "epoch": 2992} {"train_loss": -6.587011337280273, "global_step": 125704, "epoch": 2992} {"train_loss": -6.587800786608741, "global_step": 125705, "epoch": 2992, "val_loss": 68086.9609375} {"train_loss": -6.654790878295898, "global_step": 125706, "epoch": 2993} {"train_loss": -6.577384948730469, "global_step": 125707, "epoch": 2993} {"train_loss": -6.5455546379089355, "global_step": 125708, "epoch": 2993} {"train_loss": -6.573117733001709, "global_step": 125709, "epoch": 2993} {"train_loss": -6.574253559112549, "global_step": 125710, "epoch": 2993} {"train_loss": -6.57813835144043, "global_step": 125711, "epoch": 2993} {"train_loss": -6.542536735534668, "global_step": 125712, "epoch": 2993} {"train_loss": -6.570799827575684, "global_step": 125713, "epoch": 2993} {"train_loss": -6.582858085632324, "global_step": 125714, "epoch": 2993} {"train_loss": -6.5053887367248535, "global_step": 125715, "epoch": 2993} {"train_loss": -6.670660972595215, "global_step": 125716, "epoch": 2993} {"train_loss": -6.619685173034668, "global_step": 125717, "epoch": 2993} {"train_loss": -6.468044281005859, "global_step": 125718, "epoch": 2993} {"train_loss": -6.569543838500977, "global_step": 125719, "epoch": 2993} {"train_loss": -6.551790237426758, "global_step": 125720, "epoch": 2993} {"train_loss": -6.615519046783447, "global_step": 125721, "epoch": 2993} {"train_loss": -6.452054500579834, "global_step": 125722, "epoch": 2993} {"train_loss": -6.562021255493164, "global_step": 125723, "epoch": 2993} {"train_loss": -6.53306770324707, "global_step": 125724, "epoch": 2993} {"train_loss": -6.488265514373779, "global_step": 125725, "epoch": 2993} {"train_loss": -6.586885452270508, "global_step": 125726, "epoch": 2993} {"train_loss": -6.4973039627075195, "global_step": 125727, "epoch": 2993} {"train_loss": -6.610352516174316, "global_step": 125728, "epoch": 2993} {"train_loss": -6.606087684631348, "global_step": 125729, "epoch": 2993} {"train_loss": -6.502176284790039, "global_step": 125730, "epoch": 2993} {"train_loss": -6.494239807128906, "global_step": 125731, "epoch": 2993} {"train_loss": -6.480040550231934, "global_step": 125732, "epoch": 2993} {"train_loss": -6.598584175109863, "global_step": 125733, "epoch": 2993} {"train_loss": -6.466620445251465, "global_step": 125734, "epoch": 2993} {"train_loss": -6.527797698974609, "global_step": 125735, "epoch": 2993} {"train_loss": -6.445333480834961, "global_step": 125736, "epoch": 2993} {"train_loss": -6.506086349487305, "global_step": 125737, "epoch": 2993} {"train_loss": -6.49307107925415, "global_step": 125738, "epoch": 2993} {"train_loss": -6.585805892944336, "global_step": 125739, "epoch": 2993} {"train_loss": -6.59507417678833, "global_step": 125740, "epoch": 2993} {"train_loss": -6.654107093811035, "global_step": 125741, "epoch": 2993} {"train_loss": -6.436004638671875, "global_step": 125742, "epoch": 2993} {"train_loss": -6.6831817626953125, "global_step": 125743, "epoch": 2993} {"train_loss": -6.505601406097412, "global_step": 125744, "epoch": 2993} {"train_loss": -6.510349750518799, "global_step": 125745, "epoch": 2993} {"train_loss": -6.5443220138549805, "global_step": 125746, "epoch": 2993} {"train_loss": -6.5511702582949685, "global_step": 125747, "epoch": 2993, "val_loss": 68061.1953125} {"train_loss": -6.558426856994629, "global_step": 125748, "epoch": 2994} {"train_loss": -6.6790242195129395, "global_step": 125749, "epoch": 2994} {"train_loss": -6.458281517028809, "global_step": 125750, "epoch": 2994} {"train_loss": -6.716428756713867, "global_step": 125751, "epoch": 2994} {"train_loss": -6.613960266113281, "global_step": 125752, "epoch": 2994} {"train_loss": -6.600164413452148, "global_step": 125753, "epoch": 2994} {"train_loss": -6.589665412902832, "global_step": 125754, "epoch": 2994} {"train_loss": -6.516566753387451, "global_step": 125755, "epoch": 2994} {"train_loss": -6.590867042541504, "global_step": 125756, "epoch": 2994} {"train_loss": -6.569913864135742, "global_step": 125757, "epoch": 2994} {"train_loss": -6.540581703186035, "global_step": 125758, "epoch": 2994} {"train_loss": -6.572482109069824, "global_step": 125759, "epoch": 2994} {"train_loss": -6.535191059112549, "global_step": 125760, "epoch": 2994} {"train_loss": -6.467848777770996, "global_step": 125761, "epoch": 2994} {"train_loss": -6.5807952880859375, "global_step": 125762, "epoch": 2994} {"train_loss": -6.637956619262695, "global_step": 125763, "epoch": 2994} {"train_loss": -6.546784400939941, "global_step": 125764, "epoch": 2994} {"train_loss": -6.456963539123535, "global_step": 125765, "epoch": 2994} {"train_loss": -6.6764631271362305, "global_step": 125766, "epoch": 2994} {"train_loss": -6.58560848236084, "global_step": 125767, "epoch": 2994} {"train_loss": -6.468490123748779, "global_step": 125768, "epoch": 2994} {"train_loss": -6.563581466674805, "global_step": 125769, "epoch": 2994} {"train_loss": -6.548378944396973, "global_step": 125770, "epoch": 2994} {"train_loss": -6.422811508178711, "global_step": 125771, "epoch": 2994} {"train_loss": -6.530954360961914, "global_step": 125772, "epoch": 2994} {"train_loss": -6.590749263763428, "global_step": 125773, "epoch": 2994} {"train_loss": -6.518640995025635, "global_step": 125774, "epoch": 2994} {"train_loss": -6.523327827453613, "global_step": 125775, "epoch": 2994} {"train_loss": -6.483415603637695, "global_step": 125776, "epoch": 2994} {"train_loss": -6.466916561126709, "global_step": 125777, "epoch": 2994} {"train_loss": -6.54265022277832, "global_step": 125778, "epoch": 2994} {"train_loss": -6.620413780212402, "global_step": 125779, "epoch": 2994} {"train_loss": -6.5447678565979, "global_step": 125780, "epoch": 2994} {"train_loss": -6.684231281280518, "global_step": 125781, "epoch": 2994} {"train_loss": -6.588781833648682, "global_step": 125782, "epoch": 2994} {"train_loss": -6.619058609008789, "global_step": 125783, "epoch": 2994} {"train_loss": -6.532391548156738, "global_step": 125784, "epoch": 2994} {"train_loss": -6.588700294494629, "global_step": 125785, "epoch": 2994} {"train_loss": -6.547739028930664, "global_step": 125786, "epoch": 2994} {"train_loss": -6.576941013336182, "global_step": 125787, "epoch": 2994} {"train_loss": -6.637055397033691, "global_step": 125788, "epoch": 2994} {"train_loss": -6.564316624686832, "global_step": 125789, "epoch": 2994, "val_loss": 68107.859375} {"train_loss": -6.573050498962402, "global_step": 125790, "epoch": 2995} {"train_loss": -6.559295654296875, "global_step": 125791, "epoch": 2995} {"train_loss": -6.457337379455566, "global_step": 125792, "epoch": 2995} {"train_loss": -6.632115364074707, "global_step": 125793, "epoch": 2995} {"train_loss": -6.535991191864014, "global_step": 125794, "epoch": 2995} {"train_loss": -6.55023717880249, "global_step": 125795, "epoch": 2995} {"train_loss": -6.609336853027344, "global_step": 125796, "epoch": 2995} {"train_loss": -6.570417404174805, "global_step": 125797, "epoch": 2995} {"train_loss": -6.656381607055664, "global_step": 125798, "epoch": 2995} {"train_loss": -6.569965362548828, "global_step": 125799, "epoch": 2995} {"train_loss": -6.532689094543457, "global_step": 125800, "epoch": 2995} {"train_loss": -6.689716815948486, "global_step": 125801, "epoch": 2995} {"train_loss": -6.458655834197998, "global_step": 125802, "epoch": 2995} {"train_loss": -6.592199325561523, "global_step": 125803, "epoch": 2995} {"train_loss": -6.498713970184326, "global_step": 125804, "epoch": 2995} {"train_loss": -6.6728973388671875, "global_step": 125805, "epoch": 2995} {"train_loss": -6.629235744476318, "global_step": 125806, "epoch": 2995} {"train_loss": -6.516639709472656, "global_step": 125807, "epoch": 2995} {"train_loss": -6.582143783569336, "global_step": 125808, "epoch": 2995} {"train_loss": -6.605868816375732, "global_step": 125809, "epoch": 2995} {"train_loss": -6.586568832397461, "global_step": 125810, "epoch": 2995} {"train_loss": -6.665392875671387, "global_step": 125811, "epoch": 2995} {"train_loss": -6.665950775146484, "global_step": 125812, "epoch": 2995} {"train_loss": -6.717148780822754, "global_step": 125813, "epoch": 2995} {"train_loss": -6.640108108520508, "global_step": 125814, "epoch": 2995} {"train_loss": -6.661752700805664, "global_step": 125815, "epoch": 2995} {"train_loss": -6.5978546142578125, "global_step": 125816, "epoch": 2995} {"train_loss": -6.657520294189453, "global_step": 125817, "epoch": 2995} {"train_loss": -6.717038154602051, "global_step": 125818, "epoch": 2995} {"train_loss": -6.652886390686035, "global_step": 125819, "epoch": 2995} {"train_loss": -6.596820831298828, "global_step": 125820, "epoch": 2995} {"train_loss": -6.526045799255371, "global_step": 125821, "epoch": 2995} {"train_loss": -6.5180206298828125, "global_step": 125822, "epoch": 2995} {"train_loss": -6.64860725402832, "global_step": 125823, "epoch": 2995} {"train_loss": -6.725186347961426, "global_step": 125824, "epoch": 2995} {"train_loss": -6.61641263961792, "global_step": 125825, "epoch": 2995} {"train_loss": -6.690537452697754, "global_step": 125826, "epoch": 2995} {"train_loss": -6.574131965637207, "global_step": 125827, "epoch": 2995} {"train_loss": -6.5579047203063965, "global_step": 125828, "epoch": 2995} {"train_loss": -6.525331497192383, "global_step": 125829, "epoch": 2995} {"train_loss": -6.5675787925720215, "global_step": 125830, "epoch": 2995} {"train_loss": -6.600148132869175, "global_step": 125831, "epoch": 2995, "val_loss": 68007.671875} {"train_loss": -6.557183265686035, "global_step": 125832, "epoch": 2996} {"train_loss": -6.638313293457031, "global_step": 125833, "epoch": 2996} {"train_loss": -6.68404483795166, "global_step": 125834, "epoch": 2996} {"train_loss": -6.603996753692627, "global_step": 125835, "epoch": 2996} {"train_loss": -6.561141490936279, "global_step": 125836, "epoch": 2996} {"train_loss": -6.674202919006348, "global_step": 125837, "epoch": 2996} {"train_loss": -6.49644660949707, "global_step": 125838, "epoch": 2996} {"train_loss": -6.507809162139893, "global_step": 125839, "epoch": 2996} {"train_loss": -6.647104740142822, "global_step": 125840, "epoch": 2996} {"train_loss": -6.665424346923828, "global_step": 125841, "epoch": 2996} {"train_loss": -6.526256084442139, "global_step": 125842, "epoch": 2996} {"train_loss": -6.610509872436523, "global_step": 125843, "epoch": 2996} {"train_loss": -6.47995662689209, "global_step": 125844, "epoch": 2996} {"train_loss": -6.604803085327148, "global_step": 125845, "epoch": 2996} {"train_loss": -6.452027320861816, "global_step": 125846, "epoch": 2996} {"train_loss": -6.506524085998535, "global_step": 125847, "epoch": 2996} {"train_loss": -6.54110050201416, "global_step": 125848, "epoch": 2996} {"train_loss": -6.37886381149292, "global_step": 125849, "epoch": 2996} {"train_loss": -6.582143783569336, "global_step": 125850, "epoch": 2996} {"train_loss": -6.444360733032227, "global_step": 125851, "epoch": 2996} {"train_loss": -6.544734001159668, "global_step": 125852, "epoch": 2996} {"train_loss": -6.523934364318848, "global_step": 125853, "epoch": 2996} {"train_loss": -6.572452545166016, "global_step": 125854, "epoch": 2996} {"train_loss": -6.631586074829102, "global_step": 125855, "epoch": 2996} {"train_loss": -6.378074645996094, "global_step": 125856, "epoch": 2996} {"train_loss": -6.545187950134277, "global_step": 125857, "epoch": 2996} {"train_loss": -6.48533296585083, "global_step": 125858, "epoch": 2996} {"train_loss": -6.432619094848633, "global_step": 125859, "epoch": 2996} {"train_loss": -6.576534271240234, "global_step": 125860, "epoch": 2996} {"train_loss": -6.468415260314941, "global_step": 125861, "epoch": 2996} {"train_loss": -6.394110202789307, "global_step": 125862, "epoch": 2996} {"train_loss": -6.512988567352295, "global_step": 125863, "epoch": 2996} {"train_loss": -6.5144758224487305, "global_step": 125864, "epoch": 2996} {"train_loss": -6.51236629486084, "global_step": 125865, "epoch": 2996} {"train_loss": -6.519536972045898, "global_step": 125866, "epoch": 2996} {"train_loss": -6.471905708312988, "global_step": 125867, "epoch": 2996} {"train_loss": -6.503447532653809, "global_step": 125868, "epoch": 2996} {"train_loss": -6.4985198974609375, "global_step": 125869, "epoch": 2996} {"train_loss": -6.418824195861816, "global_step": 125870, "epoch": 2996} {"train_loss": -6.579051971435547, "global_step": 125871, "epoch": 2996} {"train_loss": -6.552431106567383, "global_step": 125872, "epoch": 2996} {"train_loss": -6.531282810937791, "global_step": 125873, "epoch": 2996, "val_loss": 67847.0703125} {"train_loss": -6.675960540771484, "global_step": 125874, "epoch": 2997} {"train_loss": -6.552322864532471, "global_step": 125875, "epoch": 2997} {"train_loss": -6.608481407165527, "global_step": 125876, "epoch": 2997} {"train_loss": -6.548970699310303, "global_step": 125877, "epoch": 2997} {"train_loss": -6.531630992889404, "global_step": 125878, "epoch": 2997} {"train_loss": -6.448026657104492, "global_step": 125879, "epoch": 2997} {"train_loss": -6.59575080871582, "global_step": 125880, "epoch": 2997} {"train_loss": -6.642135143280029, "global_step": 125881, "epoch": 2997} {"train_loss": -6.556886672973633, "global_step": 125882, "epoch": 2997} {"train_loss": -6.5713791847229, "global_step": 125883, "epoch": 2997} {"train_loss": -6.501260757446289, "global_step": 125884, "epoch": 2997} {"train_loss": -6.639597415924072, "global_step": 125885, "epoch": 2997} {"train_loss": -6.686404228210449, "global_step": 125886, "epoch": 2997} {"train_loss": -6.650429725646973, "global_step": 125887, "epoch": 2997} {"train_loss": -6.640935897827148, "global_step": 125888, "epoch": 2997} {"train_loss": -6.672715187072754, "global_step": 125889, "epoch": 2997} {"train_loss": -6.549860000610352, "global_step": 125890, "epoch": 2997} {"train_loss": -6.56101131439209, "global_step": 125891, "epoch": 2997} {"train_loss": -6.561624050140381, "global_step": 125892, "epoch": 2997} {"train_loss": -6.480926513671875, "global_step": 125893, "epoch": 2997} {"train_loss": -6.593783378601074, "global_step": 125894, "epoch": 2997} {"train_loss": -6.497596740722656, "global_step": 125895, "epoch": 2997} {"train_loss": -6.510866165161133, "global_step": 125896, "epoch": 2997} {"train_loss": -6.548182010650635, "global_step": 125897, "epoch": 2997} {"train_loss": -6.385445594787598, "global_step": 125898, "epoch": 2997} {"train_loss": -6.533628463745117, "global_step": 125899, "epoch": 2997} {"train_loss": -6.576084136962891, "global_step": 125900, "epoch": 2997} {"train_loss": -6.47078800201416, "global_step": 125901, "epoch": 2997} {"train_loss": -6.549096584320068, "global_step": 125902, "epoch": 2997} {"train_loss": -6.481559753417969, "global_step": 125903, "epoch": 2997} {"train_loss": -6.596543312072754, "global_step": 125904, "epoch": 2997} {"train_loss": -6.4903459548950195, "global_step": 125905, "epoch": 2997} {"train_loss": -6.547686576843262, "global_step": 125906, "epoch": 2997} {"train_loss": -6.418770790100098, "global_step": 125907, "epoch": 2997} {"train_loss": -6.396404266357422, "global_step": 125908, "epoch": 2997} {"train_loss": -6.508874893188477, "global_step": 125909, "epoch": 2997} {"train_loss": -6.468286514282227, "global_step": 125910, "epoch": 2997} {"train_loss": -6.520130157470703, "global_step": 125911, "epoch": 2997} {"train_loss": -6.530120849609375, "global_step": 125912, "epoch": 2997} {"train_loss": -6.475592613220215, "global_step": 125913, "epoch": 2997} {"train_loss": -6.566022872924805, "global_step": 125914, "epoch": 2997} {"train_loss": -6.541199661436535, "global_step": 125915, "epoch": 2997, "val_loss": 68033.703125} {"train_loss": -6.645697116851807, "global_step": 125916, "epoch": 2998} {"train_loss": -6.461937427520752, "global_step": 125917, "epoch": 2998} {"train_loss": -6.606880187988281, "global_step": 125918, "epoch": 2998} {"train_loss": -6.607635021209717, "global_step": 125919, "epoch": 2998} {"train_loss": -6.46330451965332, "global_step": 125920, "epoch": 2998} {"train_loss": -6.643119812011719, "global_step": 125921, "epoch": 2998} {"train_loss": -6.63163948059082, "global_step": 125922, "epoch": 2998} {"train_loss": -6.598569393157959, "global_step": 125923, "epoch": 2998} {"train_loss": -6.548708915710449, "global_step": 125924, "epoch": 2998} {"train_loss": -6.618952751159668, "global_step": 125925, "epoch": 2998} {"train_loss": -6.6146392822265625, "global_step": 125926, "epoch": 2998} {"train_loss": -6.539675712585449, "global_step": 125927, "epoch": 2998} {"train_loss": -6.604367256164551, "global_step": 125928, "epoch": 2998} {"train_loss": -6.51311731338501, "global_step": 125929, "epoch": 2998} {"train_loss": -6.6571807861328125, "global_step": 125930, "epoch": 2998} {"train_loss": -6.6183061599731445, "global_step": 125931, "epoch": 2998} {"train_loss": -6.657236099243164, "global_step": 125932, "epoch": 2998} {"train_loss": -6.612295627593994, "global_step": 125933, "epoch": 2998} {"train_loss": -6.556540012359619, "global_step": 125934, "epoch": 2998} {"train_loss": -6.59926700592041, "global_step": 125935, "epoch": 2998} {"train_loss": -6.53889799118042, "global_step": 125936, "epoch": 2998} {"train_loss": -6.526798248291016, "global_step": 125937, "epoch": 2998} {"train_loss": -6.59634256362915, "global_step": 125938, "epoch": 2998} {"train_loss": -6.630611896514893, "global_step": 125939, "epoch": 2998} {"train_loss": -6.6095194816589355, "global_step": 125940, "epoch": 2998} {"train_loss": -6.683956623077393, "global_step": 125941, "epoch": 2998} {"train_loss": -6.556277275085449, "global_step": 125942, "epoch": 2998} {"train_loss": -6.677025318145752, "global_step": 125943, "epoch": 2998} {"train_loss": -6.755992889404297, "global_step": 125944, "epoch": 2998} {"train_loss": -6.595438480377197, "global_step": 125945, "epoch": 2998} {"train_loss": -6.564138412475586, "global_step": 125946, "epoch": 2998} {"train_loss": -6.679813385009766, "global_step": 125947, "epoch": 2998} {"train_loss": -6.582206726074219, "global_step": 125948, "epoch": 2998} {"train_loss": -6.479204177856445, "global_step": 125949, "epoch": 2998} {"train_loss": -6.657361030578613, "global_step": 125950, "epoch": 2998} {"train_loss": -6.617978096008301, "global_step": 125951, "epoch": 2998} {"train_loss": -6.630522727966309, "global_step": 125952, "epoch": 2998} {"train_loss": -6.479251861572266, "global_step": 125953, "epoch": 2998} {"train_loss": -6.4741339683532715, "global_step": 125954, "epoch": 2998} {"train_loss": -6.608366966247559, "global_step": 125955, "epoch": 2998} {"train_loss": -6.61732292175293, "global_step": 125956, "epoch": 2998} {"train_loss": -6.5951321352095835, "global_step": 125957, "epoch": 2998, "val_loss": 68044.5625} {"train_loss": -6.5153656005859375, "global_step": 125958, "epoch": 2999} {"train_loss": -6.589175224304199, "global_step": 125959, "epoch": 2999} {"train_loss": -6.502893447875977, "global_step": 125960, "epoch": 2999} {"train_loss": -6.657480239868164, "global_step": 125961, "epoch": 2999} {"train_loss": -6.559069633483887, "global_step": 125962, "epoch": 2999} {"train_loss": -6.53223180770874, "global_step": 125963, "epoch": 2999} {"train_loss": -6.593860626220703, "global_step": 125964, "epoch": 2999} {"train_loss": -6.581624984741211, "global_step": 125965, "epoch": 2999} {"train_loss": -6.531459808349609, "global_step": 125966, "epoch": 2999} {"train_loss": -6.6259307861328125, "global_step": 125967, "epoch": 2999} {"train_loss": -6.550662994384766, "global_step": 125968, "epoch": 2999} {"train_loss": -6.577929496765137, "global_step": 125969, "epoch": 2999} {"train_loss": -6.723270893096924, "global_step": 125970, "epoch": 2999} {"train_loss": -6.550333023071289, "global_step": 125971, "epoch": 2999} {"train_loss": -6.630340576171875, "global_step": 125972, "epoch": 2999} {"train_loss": -6.596117973327637, "global_step": 125973, "epoch": 2999} {"train_loss": -6.576831817626953, "global_step": 125974, "epoch": 2999} {"train_loss": -6.57679557800293, "global_step": 125975, "epoch": 2999} {"train_loss": -6.597334861755371, "global_step": 125976, "epoch": 2999} {"train_loss": -6.613533973693848, "global_step": 125977, "epoch": 2999} {"train_loss": -6.568516731262207, "global_step": 125978, "epoch": 2999} {"train_loss": -6.542136192321777, "global_step": 125979, "epoch": 2999} {"train_loss": -6.70560359954834, "global_step": 125980, "epoch": 2999} {"train_loss": -6.568272590637207, "global_step": 125981, "epoch": 2999} {"train_loss": -6.71395206451416, "global_step": 125982, "epoch": 2999} {"train_loss": -6.567852973937988, "global_step": 125983, "epoch": 2999} {"train_loss": -6.610411167144775, "global_step": 125984, "epoch": 2999} {"train_loss": -6.573148250579834, "global_step": 125985, "epoch": 2999} {"train_loss": -6.560746192932129, "global_step": 125986, "epoch": 2999} {"train_loss": -6.762569427490234, "global_step": 125987, "epoch": 2999} {"train_loss": -6.649188041687012, "global_step": 125988, "epoch": 2999} {"train_loss": -6.593912124633789, "global_step": 125989, "epoch": 2999} {"train_loss": -6.5856428146362305, "global_step": 125990, "epoch": 2999} {"train_loss": -6.600346565246582, "global_step": 125991, "epoch": 2999} {"train_loss": -6.638124942779541, "global_step": 125992, "epoch": 2999} {"train_loss": -6.580842018127441, "global_step": 125993, "epoch": 2999} {"train_loss": -6.537871360778809, "global_step": 125994, "epoch": 2999} {"train_loss": -6.595335006713867, "global_step": 125995, "epoch": 2999} {"train_loss": -6.590705394744873, "global_step": 125996, "epoch": 2999} {"train_loss": -6.526232719421387, "global_step": 125997, "epoch": 2999} {"train_loss": -6.6227569580078125, "global_step": 125998, "epoch": 2999} {"train_loss": -6.59669558207194, "global_step": 125999, "epoch": 2999, "val_loss": 68117.953125} {"train_loss": -6.566874980926514, "global_step": 126000, "epoch": 3000} {"train_loss": -6.648869514465332, "global_step": 126001, "epoch": 3000} {"train_loss": -6.37199068069458, "global_step": 126002, "epoch": 3000} {"train_loss": -6.4718451499938965, "global_step": 126003, "epoch": 3000} {"train_loss": -6.528621673583984, "global_step": 126004, "epoch": 3000} {"train_loss": -6.516593933105469, "global_step": 126005, "epoch": 3000} {"train_loss": -6.632311820983887, "global_step": 126006, "epoch": 3000} {"train_loss": -6.503974914550781, "global_step": 126007, "epoch": 3000} {"train_loss": -6.556453704833984, "global_step": 126008, "epoch": 3000} {"train_loss": -6.49686336517334, "global_step": 126009, "epoch": 3000} {"train_loss": -6.497158050537109, "global_step": 126010, "epoch": 3000} {"train_loss": -6.636661529541016, "global_step": 126011, "epoch": 3000} {"train_loss": -6.564624309539795, "global_step": 126012, "epoch": 3000} {"train_loss": -6.513416290283203, "global_step": 126013, "epoch": 3000} {"train_loss": -6.586282253265381, "global_step": 126014, "epoch": 3000} {"train_loss": -6.633777618408203, "global_step": 126015, "epoch": 3000} {"train_loss": -6.48609733581543, "global_step": 126016, "epoch": 3000} {"train_loss": -6.535017490386963, "global_step": 126017, "epoch": 3000} {"train_loss": -6.59100341796875, "global_step": 126018, "epoch": 3000} {"train_loss": -6.60663366317749, "global_step": 126019, "epoch": 3000} {"train_loss": -6.432844161987305, "global_step": 126020, "epoch": 3000} {"train_loss": -6.519711494445801, "global_step": 126021, "epoch": 3000} {"train_loss": -6.577927589416504, "global_step": 126022, "epoch": 3000} {"train_loss": -6.563719749450684, "global_step": 126023, "epoch": 3000} {"train_loss": -6.525623321533203, "global_step": 126024, "epoch": 3000} {"train_loss": -6.596319198608398, "global_step": 126025, "epoch": 3000} {"train_loss": -6.538365364074707, "global_step": 126026, "epoch": 3000} {"train_loss": -6.564398765563965, "global_step": 126027, "epoch": 3000} {"train_loss": -6.510893821716309, "global_step": 126028, "epoch": 3000} {"train_loss": -6.4727067947387695, "global_step": 126029, "epoch": 3000} {"train_loss": -6.5796027183532715, "global_step": 126030, "epoch": 3000} {"train_loss": -6.428535461425781, "global_step": 126031, "epoch": 3000} {"train_loss": -6.620080471038818, "global_step": 126032, "epoch": 3000} {"train_loss": -6.522292137145996, "global_step": 126033, "epoch": 3000} {"train_loss": -6.612974166870117, "global_step": 126034, "epoch": 3000} {"train_loss": -6.586808204650879, "global_step": 126035, "epoch": 3000} {"train_loss": -6.575089454650879, "global_step": 126036, "epoch": 3000} {"train_loss": -6.581606864929199, "global_step": 126037, "epoch": 3000} {"train_loss": -6.608080863952637, "global_step": 126038, "epoch": 3000} {"train_loss": -6.572194576263428, "global_step": 126039, "epoch": 3000} {"train_loss": -6.548623561859131, "global_step": 126040, "epoch": 3000} {"train_loss": -6.550491980143955, "global_step": 126041, "epoch": 3000, "train/sim_max_reward_0": 0.23830101162268982, "train/sim_max_reward_1": 0.9526540906587727, "train/sim_max_reward_2": 0.9973532073533206, "train/sim_max_reward_3": 0.8839277730793117, "train/sim_max_reward_4": 0.41070860280005833, "train/sim_max_reward_5": 0.8761826551509282, "test/sim_max_reward_4400000": 0.23856209912755294, "test/sim_max_reward_4400001": 0.2971914443624914, "test/sim_max_reward_4400002": 0.45923548533045855, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.17323397831662093, "test/sim_max_reward_4400006": 0.21073270934187016, "test/sim_max_reward_4400007": 0.9014056377383829, "test/sim_max_reward_4400008": 0.29947019504052086, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.23074912502050055, "test/sim_max_reward_4400011": 0.21247073311808978, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9059768262626035, "test/sim_max_reward_4400014": 0.7791366512556827, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2108447981985609, "test/sim_max_reward_4400019": 0.21521596993579345, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9319596003938139, "test/sim_max_reward_4400023": 0.6843866057564709, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.24725689610189575, "test/sim_max_reward_4400026": 0.7899794804881745, "test/sim_max_reward_4400027": 0.02167653619045905, "test/sim_max_reward_4400028": 0.5231947326448463, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9991858892780497, "test/sim_max_reward_4400031": 0.46437552263821624, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9961730364120599, "test/sim_max_reward_4400034": 0.9508513357691857, "test/sim_max_reward_4400035": 0.9481630010767951, "test/sim_max_reward_4400036": 0.3802964746022656, "test/sim_max_reward_4400037": 0.9903527249900574, "test/sim_max_reward_4400038": 0.9821321075657791, "test/sim_max_reward_4400039": 0.873150212896905, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6938650806333722, "test/sim_max_reward_4400042": 0.9998539766273074, "test/sim_max_reward_4400043": 0.9822821296623278, "test/sim_max_reward_4400044": 0.9864873187944346, "test/sim_max_reward_4400045": 0.8957538495523243, "test/sim_max_reward_4400046": 0.9060176776103122, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.8620492547257396, "test/sim_max_reward_4400049": 0.7351263498872062, "train/mean_score": 0.7265212234441801, "test/mean_score": 0.549044714066547, "val_loss": 67970.6015625} {"train_loss": -6.584566593170166, "global_step": 126042, "epoch": 3001} {"train_loss": -6.502388000488281, "global_step": 126043, "epoch": 3001} {"train_loss": -6.559626579284668, "global_step": 126044, "epoch": 3001} {"train_loss": -6.622040748596191, "global_step": 126045, "epoch": 3001} {"train_loss": -6.620221138000488, "global_step": 126046, "epoch": 3001} {"train_loss": -6.7213335037231445, "global_step": 126047, "epoch": 3001} {"train_loss": -6.72783088684082, "global_step": 126048, "epoch": 3001} {"train_loss": -6.660345077514648, "global_step": 126049, "epoch": 3001} {"train_loss": -6.464624404907227, "global_step": 126050, "epoch": 3001} {"train_loss": -6.540203094482422, "global_step": 126051, "epoch": 3001} {"train_loss": -6.704121112823486, "global_step": 126052, "epoch": 3001} {"train_loss": -6.57508659362793, "global_step": 126053, "epoch": 3001} {"train_loss": -6.679258823394775, "global_step": 126054, "epoch": 3001} {"train_loss": -6.637760162353516, "global_step": 126055, "epoch": 3001} {"train_loss": -6.67315673828125, "global_step": 126056, "epoch": 3001} {"train_loss": -6.543911933898926, "global_step": 126057, "epoch": 3001} {"train_loss": -6.649110794067383, "global_step": 126058, "epoch": 3001} {"train_loss": -6.554056167602539, "global_step": 126059, "epoch": 3001} {"train_loss": -6.491940498352051, "global_step": 126060, "epoch": 3001} {"train_loss": -6.717606544494629, "global_step": 126061, "epoch": 3001} {"train_loss": -6.497594833374023, "global_step": 126062, "epoch": 3001} {"train_loss": -6.671933174133301, "global_step": 126063, "epoch": 3001} {"train_loss": -6.628556251525879, "global_step": 126064, "epoch": 3001} {"train_loss": -6.506627082824707, "global_step": 126065, "epoch": 3001} {"train_loss": -6.548600673675537, "global_step": 126066, "epoch": 3001} {"train_loss": -6.490780830383301, "global_step": 126067, "epoch": 3001} {"train_loss": -6.600553035736084, "global_step": 126068, "epoch": 3001} {"train_loss": -6.52644157409668, "global_step": 126069, "epoch": 3001} {"train_loss": -6.497101306915283, "global_step": 126070, "epoch": 3001} {"train_loss": -6.585962295532227, "global_step": 126071, "epoch": 3001} {"train_loss": -6.469113349914551, "global_step": 126072, "epoch": 3001} {"train_loss": -6.6406426429748535, "global_step": 126073, "epoch": 3001} {"train_loss": -6.546931743621826, "global_step": 126074, "epoch": 3001} {"train_loss": -6.470037460327148, "global_step": 126075, "epoch": 3001} {"train_loss": -6.5762939453125, "global_step": 126076, "epoch": 3001} {"train_loss": -6.518677711486816, "global_step": 126077, "epoch": 3001} {"train_loss": -6.472414970397949, "global_step": 126078, "epoch": 3001} {"train_loss": -6.615339756011963, "global_step": 126079, "epoch": 3001} {"train_loss": -6.5054216384887695, "global_step": 126080, "epoch": 3001} {"train_loss": -6.538768768310547, "global_step": 126081, "epoch": 3001} {"train_loss": -6.5556745529174805, "global_step": 126082, "epoch": 3001} {"train_loss": -6.577421574365525, "global_step": 126083, "epoch": 3001, "val_loss": 68191.390625} {"train_loss": -6.432120323181152, "global_step": 126084, "epoch": 3002} {"train_loss": -6.557525157928467, "global_step": 126085, "epoch": 3002} {"train_loss": -6.540937423706055, "global_step": 126086, "epoch": 3002} {"train_loss": -6.593852519989014, "global_step": 126087, "epoch": 3002} {"train_loss": -6.515354156494141, "global_step": 126088, "epoch": 3002} {"train_loss": -6.452117919921875, "global_step": 126089, "epoch": 3002} {"train_loss": -6.563588619232178, "global_step": 126090, "epoch": 3002} {"train_loss": -6.480008125305176, "global_step": 126091, "epoch": 3002} {"train_loss": -6.675315856933594, "global_step": 126092, "epoch": 3002} {"train_loss": -6.5796098709106445, "global_step": 126093, "epoch": 3002} {"train_loss": -6.494070529937744, "global_step": 126094, "epoch": 3002} {"train_loss": -6.535780906677246, "global_step": 126095, "epoch": 3002} {"train_loss": -6.580278396606445, "global_step": 126096, "epoch": 3002} {"train_loss": -6.5955305099487305, "global_step": 126097, "epoch": 3002} {"train_loss": -6.664186477661133, "global_step": 126098, "epoch": 3002} {"train_loss": -6.551915168762207, "global_step": 126099, "epoch": 3002} {"train_loss": -6.664334297180176, "global_step": 126100, "epoch": 3002} {"train_loss": -6.668136119842529, "global_step": 126101, "epoch": 3002} {"train_loss": -6.622706890106201, "global_step": 126102, "epoch": 3002} {"train_loss": -6.552898406982422, "global_step": 126103, "epoch": 3002} {"train_loss": -6.620388031005859, "global_step": 126104, "epoch": 3002} {"train_loss": -6.571303367614746, "global_step": 126105, "epoch": 3002} {"train_loss": -6.559021949768066, "global_step": 126106, "epoch": 3002} {"train_loss": -6.550002098083496, "global_step": 126107, "epoch": 3002} {"train_loss": -6.725658416748047, "global_step": 126108, "epoch": 3002} {"train_loss": -6.572421550750732, "global_step": 126109, "epoch": 3002} {"train_loss": -6.66564416885376, "global_step": 126110, "epoch": 3002} {"train_loss": -6.600676536560059, "global_step": 126111, "epoch": 3002} {"train_loss": -6.538544178009033, "global_step": 126112, "epoch": 3002} {"train_loss": -6.777789115905762, "global_step": 126113, "epoch": 3002} {"train_loss": -6.685825824737549, "global_step": 126114, "epoch": 3002} {"train_loss": -6.579872131347656, "global_step": 126115, "epoch": 3002} {"train_loss": -6.614374160766602, "global_step": 126116, "epoch": 3002} {"train_loss": -6.663978099822998, "global_step": 126117, "epoch": 3002} {"train_loss": -6.653465270996094, "global_step": 126118, "epoch": 3002} {"train_loss": -6.625000953674316, "global_step": 126119, "epoch": 3002} {"train_loss": -6.593291282653809, "global_step": 126120, "epoch": 3002} {"train_loss": -6.58464241027832, "global_step": 126121, "epoch": 3002} {"train_loss": -6.639934539794922, "global_step": 126122, "epoch": 3002} {"train_loss": -6.534224510192871, "global_step": 126123, "epoch": 3002} {"train_loss": -6.519121170043945, "global_step": 126124, "epoch": 3002} {"train_loss": -6.5884388741992765, "global_step": 126125, "epoch": 3002, "val_loss": 68072.65625} {"train_loss": -6.548155784606934, "global_step": 126126, "epoch": 3003} {"train_loss": -6.634069442749023, "global_step": 126127, "epoch": 3003} {"train_loss": -6.553262710571289, "global_step": 126128, "epoch": 3003} {"train_loss": -6.5174455642700195, "global_step": 126129, "epoch": 3003} {"train_loss": -6.686709403991699, "global_step": 126130, "epoch": 3003} {"train_loss": -6.599276065826416, "global_step": 126131, "epoch": 3003} {"train_loss": -6.723544120788574, "global_step": 126132, "epoch": 3003} {"train_loss": -6.686769485473633, "global_step": 126133, "epoch": 3003} {"train_loss": -6.639615058898926, "global_step": 126134, "epoch": 3003} {"train_loss": -6.583749771118164, "global_step": 126135, "epoch": 3003} {"train_loss": -6.5573859214782715, "global_step": 126136, "epoch": 3003} {"train_loss": -6.601169586181641, "global_step": 126137, "epoch": 3003} {"train_loss": -6.744942665100098, "global_step": 126138, "epoch": 3003} {"train_loss": -6.7563886642456055, "global_step": 126139, "epoch": 3003} {"train_loss": -6.7751054763793945, "global_step": 126140, "epoch": 3003} {"train_loss": -6.698005199432373, "global_step": 126141, "epoch": 3003} {"train_loss": -6.620783805847168, "global_step": 126142, "epoch": 3003} {"train_loss": -6.631011962890625, "global_step": 126143, "epoch": 3003} {"train_loss": -6.553492546081543, "global_step": 126144, "epoch": 3003} {"train_loss": -6.548494338989258, "global_step": 126145, "epoch": 3003} {"train_loss": -6.532604694366455, "global_step": 126146, "epoch": 3003} {"train_loss": -6.36436128616333, "global_step": 126147, "epoch": 3003} {"train_loss": -6.6458024978637695, "global_step": 126148, "epoch": 3003} {"train_loss": -6.642361164093018, "global_step": 126149, "epoch": 3003} {"train_loss": -6.363776683807373, "global_step": 126150, "epoch": 3003} {"train_loss": -6.5260162353515625, "global_step": 126151, "epoch": 3003} {"train_loss": -6.561112880706787, "global_step": 126152, "epoch": 3003} {"train_loss": -6.286469459533691, "global_step": 126153, "epoch": 3003} {"train_loss": -6.721420764923096, "global_step": 126154, "epoch": 3003} {"train_loss": -6.403400897979736, "global_step": 126155, "epoch": 3003} {"train_loss": -6.591616153717041, "global_step": 126156, "epoch": 3003} {"train_loss": -6.5179548263549805, "global_step": 126157, "epoch": 3003} {"train_loss": -6.535497665405273, "global_step": 126158, "epoch": 3003} {"train_loss": -6.493562698364258, "global_step": 126159, "epoch": 3003} {"train_loss": -6.461979389190674, "global_step": 126160, "epoch": 3003} {"train_loss": -6.475064277648926, "global_step": 126161, "epoch": 3003} {"train_loss": -6.491147994995117, "global_step": 126162, "epoch": 3003} {"train_loss": -6.4364118576049805, "global_step": 126163, "epoch": 3003} {"train_loss": -6.4548115730285645, "global_step": 126164, "epoch": 3003} {"train_loss": -6.508613586425781, "global_step": 126165, "epoch": 3003} {"train_loss": -6.505954742431641, "global_step": 126166, "epoch": 3003} {"train_loss": -6.563097090948196, "global_step": 126167, "epoch": 3003, "val_loss": 68307.6484375} {"train_loss": -6.746413707733154, "global_step": 126168, "epoch": 3004} {"train_loss": -6.45743465423584, "global_step": 126169, "epoch": 3004} {"train_loss": -6.583278179168701, "global_step": 126170, "epoch": 3004} {"train_loss": -6.5706868171691895, "global_step": 126171, "epoch": 3004} {"train_loss": -6.505698204040527, "global_step": 126172, "epoch": 3004} {"train_loss": -6.542567729949951, "global_step": 126173, "epoch": 3004} {"train_loss": -6.642524719238281, "global_step": 126174, "epoch": 3004} {"train_loss": -6.5065531730651855, "global_step": 126175, "epoch": 3004} {"train_loss": -6.5585527420043945, "global_step": 126176, "epoch": 3004} {"train_loss": -6.601988792419434, "global_step": 126177, "epoch": 3004} {"train_loss": -6.604007720947266, "global_step": 126178, "epoch": 3004} {"train_loss": -6.648138046264648, "global_step": 126179, "epoch": 3004} {"train_loss": -6.496902942657471, "global_step": 126180, "epoch": 3004} {"train_loss": -6.459749221801758, "global_step": 126181, "epoch": 3004} {"train_loss": -6.6781535148620605, "global_step": 126182, "epoch": 3004} {"train_loss": -6.574797630310059, "global_step": 126183, "epoch": 3004} {"train_loss": -6.601873397827148, "global_step": 126184, "epoch": 3004} {"train_loss": -6.643429756164551, "global_step": 126185, "epoch": 3004} {"train_loss": -6.598339557647705, "global_step": 126186, "epoch": 3004} {"train_loss": -6.627938270568848, "global_step": 126187, "epoch": 3004} {"train_loss": -6.628490924835205, "global_step": 126188, "epoch": 3004} {"train_loss": -6.622347831726074, "global_step": 126189, "epoch": 3004} {"train_loss": -6.626237392425537, "global_step": 126190, "epoch": 3004} {"train_loss": -6.6024675369262695, "global_step": 126191, "epoch": 3004} {"train_loss": -6.5292253494262695, "global_step": 126192, "epoch": 3004} {"train_loss": -6.60145902633667, "global_step": 126193, "epoch": 3004} {"train_loss": -6.60140323638916, "global_step": 126194, "epoch": 3004} {"train_loss": -6.601312160491943, "global_step": 126195, "epoch": 3004} {"train_loss": -6.625789642333984, "global_step": 126196, "epoch": 3004} {"train_loss": -6.618119239807129, "global_step": 126197, "epoch": 3004} {"train_loss": -6.504481315612793, "global_step": 126198, "epoch": 3004} {"train_loss": -6.511385917663574, "global_step": 126199, "epoch": 3004} {"train_loss": -6.618912220001221, "global_step": 126200, "epoch": 3004} {"train_loss": -6.389715194702148, "global_step": 126201, "epoch": 3004} {"train_loss": -6.464566707611084, "global_step": 126202, "epoch": 3004} {"train_loss": -6.530903339385986, "global_step": 126203, "epoch": 3004} {"train_loss": -6.544745922088623, "global_step": 126204, "epoch": 3004} {"train_loss": -6.462467193603516, "global_step": 126205, "epoch": 3004} {"train_loss": -6.5618133544921875, "global_step": 126206, "epoch": 3004} {"train_loss": -6.4857892990112305, "global_step": 126207, "epoch": 3004} {"train_loss": -6.454093933105469, "global_step": 126208, "epoch": 3004} {"train_loss": -6.56709056808835, "global_step": 126209, "epoch": 3004, "val_loss": 68142.1328125} {"train_loss": -6.571978569030762, "global_step": 126210, "epoch": 3005} {"train_loss": -6.594696044921875, "global_step": 126211, "epoch": 3005} {"train_loss": -6.606672286987305, "global_step": 126212, "epoch": 3005} {"train_loss": -6.724875450134277, "global_step": 126213, "epoch": 3005} {"train_loss": -6.523947715759277, "global_step": 126214, "epoch": 3005} {"train_loss": -6.59603214263916, "global_step": 126215, "epoch": 3005} {"train_loss": -6.595081806182861, "global_step": 126216, "epoch": 3005} {"train_loss": -6.619426727294922, "global_step": 126217, "epoch": 3005} {"train_loss": -6.5390167236328125, "global_step": 126218, "epoch": 3005} {"train_loss": -6.606522560119629, "global_step": 126219, "epoch": 3005} {"train_loss": -6.500127792358398, "global_step": 126220, "epoch": 3005} {"train_loss": -6.598507881164551, "global_step": 126221, "epoch": 3005} {"train_loss": -6.734301567077637, "global_step": 126222, "epoch": 3005} {"train_loss": -6.438914775848389, "global_step": 126223, "epoch": 3005} {"train_loss": -6.498950004577637, "global_step": 126224, "epoch": 3005} {"train_loss": -6.517836570739746, "global_step": 126225, "epoch": 3005} {"train_loss": -6.504551887512207, "global_step": 126226, "epoch": 3005} {"train_loss": -6.503274917602539, "global_step": 126227, "epoch": 3005} {"train_loss": -6.515909194946289, "global_step": 126228, "epoch": 3005} {"train_loss": -6.422353744506836, "global_step": 126229, "epoch": 3005} {"train_loss": -6.541815757751465, "global_step": 126230, "epoch": 3005} {"train_loss": -6.489165306091309, "global_step": 126231, "epoch": 3005} {"train_loss": -6.416064739227295, "global_step": 126232, "epoch": 3005} {"train_loss": -6.507472991943359, "global_step": 126233, "epoch": 3005} {"train_loss": -6.622200965881348, "global_step": 126234, "epoch": 3005} {"train_loss": -6.506048202514648, "global_step": 126235, "epoch": 3005} {"train_loss": -6.5918378829956055, "global_step": 126236, "epoch": 3005} {"train_loss": -6.497335433959961, "global_step": 126237, "epoch": 3005} {"train_loss": -6.611148834228516, "global_step": 126238, "epoch": 3005} {"train_loss": -6.367135524749756, "global_step": 126239, "epoch": 3005} {"train_loss": -6.447403907775879, "global_step": 126240, "epoch": 3005} {"train_loss": -6.389196395874023, "global_step": 126241, "epoch": 3005} {"train_loss": -6.455958366394043, "global_step": 126242, "epoch": 3005} {"train_loss": -6.411428451538086, "global_step": 126243, "epoch": 3005} {"train_loss": -6.429264545440674, "global_step": 126244, "epoch": 3005} {"train_loss": -6.331848621368408, "global_step": 126245, "epoch": 3005} {"train_loss": -6.431622505187988, "global_step": 126246, "epoch": 3005} {"train_loss": -6.561655044555664, "global_step": 126247, "epoch": 3005} {"train_loss": -6.418493270874023, "global_step": 126248, "epoch": 3005} {"train_loss": -6.500934600830078, "global_step": 126249, "epoch": 3005} {"train_loss": -6.462281703948975, "global_step": 126250, "epoch": 3005} {"train_loss": -6.513423352014451, "global_step": 126251, "epoch": 3005, "val_loss": 68303.625} {"train_loss": -6.347463130950928, "global_step": 126252, "epoch": 3006} {"train_loss": -6.640253067016602, "global_step": 126253, "epoch": 3006} {"train_loss": -6.3707475662231445, "global_step": 126254, "epoch": 3006} {"train_loss": -6.644626617431641, "global_step": 126255, "epoch": 3006} {"train_loss": -6.397130012512207, "global_step": 126256, "epoch": 3006} {"train_loss": -6.4142069816589355, "global_step": 126257, "epoch": 3006} {"train_loss": -6.544084548950195, "global_step": 126258, "epoch": 3006} {"train_loss": -6.511638641357422, "global_step": 126259, "epoch": 3006} {"train_loss": -6.533353805541992, "global_step": 126260, "epoch": 3006} {"train_loss": -6.572946071624756, "global_step": 126261, "epoch": 3006} {"train_loss": -6.597264289855957, "global_step": 126262, "epoch": 3006} {"train_loss": -6.619500160217285, "global_step": 126263, "epoch": 3006} {"train_loss": -6.559442520141602, "global_step": 126264, "epoch": 3006} {"train_loss": -6.6065473556518555, "global_step": 126265, "epoch": 3006} {"train_loss": -6.461625576019287, "global_step": 126266, "epoch": 3006} {"train_loss": -6.500089168548584, "global_step": 126267, "epoch": 3006} {"train_loss": -6.612390518188477, "global_step": 126268, "epoch": 3006} {"train_loss": -6.624820709228516, "global_step": 126269, "epoch": 3006} {"train_loss": -6.6001386642456055, "global_step": 126270, "epoch": 3006} {"train_loss": -6.675040245056152, "global_step": 126271, "epoch": 3006} {"train_loss": -6.686861991882324, "global_step": 126272, "epoch": 3006} {"train_loss": -6.593560218811035, "global_step": 126273, "epoch": 3006} {"train_loss": -6.613868236541748, "global_step": 126274, "epoch": 3006} {"train_loss": -6.629649639129639, "global_step": 126275, "epoch": 3006} {"train_loss": -6.587379455566406, "global_step": 126276, "epoch": 3006} {"train_loss": -6.56677770614624, "global_step": 126277, "epoch": 3006} {"train_loss": -6.583308219909668, "global_step": 126278, "epoch": 3006} {"train_loss": -6.570891380310059, "global_step": 126279, "epoch": 3006} {"train_loss": -6.613184928894043, "global_step": 126280, "epoch": 3006} {"train_loss": -6.6996660232543945, "global_step": 126281, "epoch": 3006} {"train_loss": -6.556939601898193, "global_step": 126282, "epoch": 3006} {"train_loss": -6.54494571685791, "global_step": 126283, "epoch": 3006} {"train_loss": -6.611822128295898, "global_step": 126284, "epoch": 3006} {"train_loss": -6.598043441772461, "global_step": 126285, "epoch": 3006} {"train_loss": -6.490996360778809, "global_step": 126286, "epoch": 3006} {"train_loss": -6.567028999328613, "global_step": 126287, "epoch": 3006} {"train_loss": -6.5746612548828125, "global_step": 126288, "epoch": 3006} {"train_loss": -6.541355609893799, "global_step": 126289, "epoch": 3006} {"train_loss": -6.671482086181641, "global_step": 126290, "epoch": 3006} {"train_loss": -6.63055944442749, "global_step": 126291, "epoch": 3006} {"train_loss": -6.5844316482543945, "global_step": 126292, "epoch": 3006} {"train_loss": -6.574118988854544, "global_step": 126293, "epoch": 3006, "val_loss": 68043.5546875} {"train_loss": -6.598804950714111, "global_step": 126294, "epoch": 3007} {"train_loss": -6.71705436706543, "global_step": 126295, "epoch": 3007} {"train_loss": -6.603529930114746, "global_step": 126296, "epoch": 3007} {"train_loss": -6.5745930671691895, "global_step": 126297, "epoch": 3007} {"train_loss": -6.655194282531738, "global_step": 126298, "epoch": 3007} {"train_loss": -6.708215713500977, "global_step": 126299, "epoch": 3007} {"train_loss": -6.632535934448242, "global_step": 126300, "epoch": 3007} {"train_loss": -6.629914283752441, "global_step": 126301, "epoch": 3007} {"train_loss": -6.576719760894775, "global_step": 126302, "epoch": 3007} {"train_loss": -6.5689592361450195, "global_step": 126303, "epoch": 3007} {"train_loss": -6.652061462402344, "global_step": 126304, "epoch": 3007} {"train_loss": -6.538505554199219, "global_step": 126305, "epoch": 3007} {"train_loss": -6.648882865905762, "global_step": 126306, "epoch": 3007} {"train_loss": -6.65814208984375, "global_step": 126307, "epoch": 3007} {"train_loss": -6.604879379272461, "global_step": 126308, "epoch": 3007} {"train_loss": -6.520987510681152, "global_step": 126309, "epoch": 3007} {"train_loss": -6.586747169494629, "global_step": 126310, "epoch": 3007} {"train_loss": -6.433090686798096, "global_step": 126311, "epoch": 3007} {"train_loss": -6.600593090057373, "global_step": 126312, "epoch": 3007} {"train_loss": -6.533613204956055, "global_step": 126313, "epoch": 3007} {"train_loss": -6.43692684173584, "global_step": 126314, "epoch": 3007} {"train_loss": -6.642212390899658, "global_step": 126315, "epoch": 3007} {"train_loss": -6.5512824058532715, "global_step": 126316, "epoch": 3007} {"train_loss": -6.426877498626709, "global_step": 126317, "epoch": 3007} {"train_loss": -6.531711101531982, "global_step": 126318, "epoch": 3007} {"train_loss": -6.374029636383057, "global_step": 126319, "epoch": 3007} {"train_loss": -6.6250224113464355, "global_step": 126320, "epoch": 3007} {"train_loss": -6.557973861694336, "global_step": 126321, "epoch": 3007} {"train_loss": -6.528693675994873, "global_step": 126322, "epoch": 3007} {"train_loss": -6.5632243156433105, "global_step": 126323, "epoch": 3007} {"train_loss": -6.455376625061035, "global_step": 126324, "epoch": 3007} {"train_loss": -6.475508689880371, "global_step": 126325, "epoch": 3007} {"train_loss": -6.514523029327393, "global_step": 126326, "epoch": 3007} {"train_loss": -6.539946556091309, "global_step": 126327, "epoch": 3007} {"train_loss": -6.5719099044799805, "global_step": 126328, "epoch": 3007} {"train_loss": -6.6076250076293945, "global_step": 126329, "epoch": 3007} {"train_loss": -6.499444007873535, "global_step": 126330, "epoch": 3007} {"train_loss": -6.620824813842773, "global_step": 126331, "epoch": 3007} {"train_loss": -6.677546501159668, "global_step": 126332, "epoch": 3007} {"train_loss": -6.524168968200684, "global_step": 126333, "epoch": 3007} {"train_loss": -6.708826065063477, "global_step": 126334, "epoch": 3007} {"train_loss": -6.570537692024594, "global_step": 126335, "epoch": 3007, "val_loss": 68083.859375} {"train_loss": -6.622149467468262, "global_step": 126336, "epoch": 3008} {"train_loss": -6.690842151641846, "global_step": 126337, "epoch": 3008} {"train_loss": -6.532135009765625, "global_step": 126338, "epoch": 3008} {"train_loss": -6.58424186706543, "global_step": 126339, "epoch": 3008} {"train_loss": -6.579150199890137, "global_step": 126340, "epoch": 3008} {"train_loss": -6.586799621582031, "global_step": 126341, "epoch": 3008} {"train_loss": -6.571109294891357, "global_step": 126342, "epoch": 3008} {"train_loss": -6.614635467529297, "global_step": 126343, "epoch": 3008} {"train_loss": -6.599358081817627, "global_step": 126344, "epoch": 3008} {"train_loss": -6.599857330322266, "global_step": 126345, "epoch": 3008} {"train_loss": -6.6112141609191895, "global_step": 126346, "epoch": 3008} {"train_loss": -6.6415557861328125, "global_step": 126347, "epoch": 3008} {"train_loss": -6.638923168182373, "global_step": 126348, "epoch": 3008} {"train_loss": -6.562250137329102, "global_step": 126349, "epoch": 3008} {"train_loss": -6.593411445617676, "global_step": 126350, "epoch": 3008} {"train_loss": -6.566672325134277, "global_step": 126351, "epoch": 3008} {"train_loss": -6.584090232849121, "global_step": 126352, "epoch": 3008} {"train_loss": -6.596424102783203, "global_step": 126353, "epoch": 3008} {"train_loss": -6.678552627563477, "global_step": 126354, "epoch": 3008} {"train_loss": -6.679614067077637, "global_step": 126355, "epoch": 3008} {"train_loss": -6.71702766418457, "global_step": 126356, "epoch": 3008} {"train_loss": -6.641602516174316, "global_step": 126357, "epoch": 3008} {"train_loss": -6.548460960388184, "global_step": 126358, "epoch": 3008} {"train_loss": -6.621307373046875, "global_step": 126359, "epoch": 3008} {"train_loss": -6.555503845214844, "global_step": 126360, "epoch": 3008} {"train_loss": -6.720450401306152, "global_step": 126361, "epoch": 3008} {"train_loss": -6.57952880859375, "global_step": 126362, "epoch": 3008} {"train_loss": -6.701686859130859, "global_step": 126363, "epoch": 3008} {"train_loss": -6.7502851486206055, "global_step": 126364, "epoch": 3008} {"train_loss": -6.580021381378174, "global_step": 126365, "epoch": 3008} {"train_loss": -6.588481903076172, "global_step": 126366, "epoch": 3008} {"train_loss": -6.587743759155273, "global_step": 126367, "epoch": 3008} {"train_loss": -6.561100482940674, "global_step": 126368, "epoch": 3008} {"train_loss": -6.669771671295166, "global_step": 126369, "epoch": 3008} {"train_loss": -6.692295074462891, "global_step": 126370, "epoch": 3008} {"train_loss": -6.6722412109375, "global_step": 126371, "epoch": 3008} {"train_loss": -6.668117523193359, "global_step": 126372, "epoch": 3008} {"train_loss": -6.570562362670898, "global_step": 126373, "epoch": 3008} {"train_loss": -6.483583450317383, "global_step": 126374, "epoch": 3008} {"train_loss": -6.666146755218506, "global_step": 126375, "epoch": 3008} {"train_loss": -6.584046363830566, "global_step": 126376, "epoch": 3008} {"train_loss": -6.617611828304472, "global_step": 126377, "epoch": 3008, "val_loss": 68077.0859375} {"train_loss": -6.683475494384766, "global_step": 126378, "epoch": 3009} {"train_loss": -6.669886112213135, "global_step": 126379, "epoch": 3009} {"train_loss": -6.620195388793945, "global_step": 126380, "epoch": 3009} {"train_loss": -6.667366981506348, "global_step": 126381, "epoch": 3009} {"train_loss": -6.589446544647217, "global_step": 126382, "epoch": 3009} {"train_loss": -6.614763259887695, "global_step": 126383, "epoch": 3009} {"train_loss": -6.719104766845703, "global_step": 126384, "epoch": 3009} {"train_loss": -6.601348876953125, "global_step": 126385, "epoch": 3009} {"train_loss": -6.601772308349609, "global_step": 126386, "epoch": 3009} {"train_loss": -6.533547401428223, "global_step": 126387, "epoch": 3009} {"train_loss": -6.587075233459473, "global_step": 126388, "epoch": 3009} {"train_loss": -6.6682658195495605, "global_step": 126389, "epoch": 3009} {"train_loss": -6.681347370147705, "global_step": 126390, "epoch": 3009} {"train_loss": -6.650119781494141, "global_step": 126391, "epoch": 3009} {"train_loss": -6.607257843017578, "global_step": 126392, "epoch": 3009} {"train_loss": -6.657881736755371, "global_step": 126393, "epoch": 3009} {"train_loss": -6.622112274169922, "global_step": 126394, "epoch": 3009} {"train_loss": -6.557188510894775, "global_step": 126395, "epoch": 3009} {"train_loss": -6.579432487487793, "global_step": 126396, "epoch": 3009} {"train_loss": -6.702213287353516, "global_step": 126397, "epoch": 3009} {"train_loss": -6.562771797180176, "global_step": 126398, "epoch": 3009} {"train_loss": -6.635822772979736, "global_step": 126399, "epoch": 3009} {"train_loss": -6.633908271789551, "global_step": 126400, "epoch": 3009} {"train_loss": -6.779950141906738, "global_step": 126401, "epoch": 3009} {"train_loss": -6.593077182769775, "global_step": 126402, "epoch": 3009} {"train_loss": -6.661635398864746, "global_step": 126403, "epoch": 3009} {"train_loss": -6.561014175415039, "global_step": 126404, "epoch": 3009} {"train_loss": -6.646836280822754, "global_step": 126405, "epoch": 3009} {"train_loss": -6.531123161315918, "global_step": 126406, "epoch": 3009} {"train_loss": -6.643153190612793, "global_step": 126407, "epoch": 3009} {"train_loss": -6.466712951660156, "global_step": 126408, "epoch": 3009} {"train_loss": -6.512651443481445, "global_step": 126409, "epoch": 3009} {"train_loss": -6.722291946411133, "global_step": 126410, "epoch": 3009} {"train_loss": -6.478600025177002, "global_step": 126411, "epoch": 3009} {"train_loss": -6.640468120574951, "global_step": 126412, "epoch": 3009} {"train_loss": -6.352724552154541, "global_step": 126413, "epoch": 3009} {"train_loss": -6.555700302124023, "global_step": 126414, "epoch": 3009} {"train_loss": -6.670130729675293, "global_step": 126415, "epoch": 3009} {"train_loss": -6.36251163482666, "global_step": 126416, "epoch": 3009} {"train_loss": -6.526300430297852, "global_step": 126417, "epoch": 3009} {"train_loss": -6.461390495300293, "global_step": 126418, "epoch": 3009} {"train_loss": -6.59374281338283, "global_step": 126419, "epoch": 3009, "val_loss": 68075.859375} {"train_loss": -6.509951591491699, "global_step": 126420, "epoch": 3010} {"train_loss": -6.5335869789123535, "global_step": 126421, "epoch": 3010} {"train_loss": -6.556025505065918, "global_step": 126422, "epoch": 3010} {"train_loss": -6.504084587097168, "global_step": 126423, "epoch": 3010} {"train_loss": -6.528689861297607, "global_step": 126424, "epoch": 3010} {"train_loss": -6.54426383972168, "global_step": 126425, "epoch": 3010} {"train_loss": -6.533235549926758, "global_step": 126426, "epoch": 3010} {"train_loss": -6.562682151794434, "global_step": 126427, "epoch": 3010} {"train_loss": -6.474076271057129, "global_step": 126428, "epoch": 3010} {"train_loss": -6.495065689086914, "global_step": 126429, "epoch": 3010} {"train_loss": -6.552707195281982, "global_step": 126430, "epoch": 3010} {"train_loss": -6.536865234375, "global_step": 126431, "epoch": 3010} {"train_loss": -6.48813533782959, "global_step": 126432, "epoch": 3010} {"train_loss": -6.613978385925293, "global_step": 126433, "epoch": 3010} {"train_loss": -6.588160514831543, "global_step": 126434, "epoch": 3010} {"train_loss": -6.609353542327881, "global_step": 126435, "epoch": 3010} {"train_loss": -6.564302444458008, "global_step": 126436, "epoch": 3010} {"train_loss": -6.587714672088623, "global_step": 126437, "epoch": 3010} {"train_loss": -6.568034648895264, "global_step": 126438, "epoch": 3010} {"train_loss": -6.656668663024902, "global_step": 126439, "epoch": 3010} {"train_loss": -6.564951419830322, "global_step": 126440, "epoch": 3010} {"train_loss": -6.516984939575195, "global_step": 126441, "epoch": 3010} {"train_loss": -6.563570499420166, "global_step": 126442, "epoch": 3010} {"train_loss": -6.571721076965332, "global_step": 126443, "epoch": 3010} {"train_loss": -6.60538911819458, "global_step": 126444, "epoch": 3010} {"train_loss": -6.551125526428223, "global_step": 126445, "epoch": 3010} {"train_loss": -6.601503372192383, "global_step": 126446, "epoch": 3010} {"train_loss": -6.585599899291992, "global_step": 126447, "epoch": 3010} {"train_loss": -6.561784744262695, "global_step": 126448, "epoch": 3010} {"train_loss": -6.489823818206787, "global_step": 126449, "epoch": 3010} {"train_loss": -6.509682655334473, "global_step": 126450, "epoch": 3010} {"train_loss": -6.598710060119629, "global_step": 126451, "epoch": 3010} {"train_loss": -6.5762152671813965, "global_step": 126452, "epoch": 3010} {"train_loss": -6.535772323608398, "global_step": 126453, "epoch": 3010} {"train_loss": -6.542636871337891, "global_step": 126454, "epoch": 3010} {"train_loss": -6.5457353591918945, "global_step": 126455, "epoch": 3010} {"train_loss": -6.649966239929199, "global_step": 126456, "epoch": 3010} {"train_loss": -6.552529811859131, "global_step": 126457, "epoch": 3010} {"train_loss": -6.692629337310791, "global_step": 126458, "epoch": 3010} {"train_loss": -6.664958477020264, "global_step": 126459, "epoch": 3010} {"train_loss": -6.684171676635742, "global_step": 126460, "epoch": 3010} {"train_loss": -6.5643310546875, "global_step": 126461, "epoch": 3010, "val_loss": 68056.5546875} {"train_loss": -6.581106662750244, "global_step": 126462, "epoch": 3011} {"train_loss": -6.65602970123291, "global_step": 126463, "epoch": 3011} {"train_loss": -6.653716087341309, "global_step": 126464, "epoch": 3011} {"train_loss": -6.738685607910156, "global_step": 126465, "epoch": 3011} {"train_loss": -6.683697700500488, "global_step": 126466, "epoch": 3011} {"train_loss": -6.6359052658081055, "global_step": 126467, "epoch": 3011} {"train_loss": -6.614730358123779, "global_step": 126468, "epoch": 3011} {"train_loss": -6.641785621643066, "global_step": 126469, "epoch": 3011} {"train_loss": -6.570965766906738, "global_step": 126470, "epoch": 3011} {"train_loss": -6.631049633026123, "global_step": 126471, "epoch": 3011} {"train_loss": -6.5844621658325195, "global_step": 126472, "epoch": 3011} {"train_loss": -6.663356781005859, "global_step": 126473, "epoch": 3011} {"train_loss": -6.682035446166992, "global_step": 126474, "epoch": 3011} {"train_loss": -6.600761413574219, "global_step": 126475, "epoch": 3011} {"train_loss": -6.585410118103027, "global_step": 126476, "epoch": 3011} {"train_loss": -6.68682861328125, "global_step": 126477, "epoch": 3011} {"train_loss": -6.510674476623535, "global_step": 126478, "epoch": 3011} {"train_loss": -6.679837226867676, "global_step": 126479, "epoch": 3011} {"train_loss": -6.5983099937438965, "global_step": 126480, "epoch": 3011} {"train_loss": -6.610213279724121, "global_step": 126481, "epoch": 3011} {"train_loss": -6.649825096130371, "global_step": 126482, "epoch": 3011} {"train_loss": -6.503816604614258, "global_step": 126483, "epoch": 3011} {"train_loss": -6.6603169441223145, "global_step": 126484, "epoch": 3011} {"train_loss": -6.4527587890625, "global_step": 126485, "epoch": 3011} {"train_loss": -6.5805463790893555, "global_step": 126486, "epoch": 3011} {"train_loss": -6.644872665405273, "global_step": 126487, "epoch": 3011} {"train_loss": -6.628515243530273, "global_step": 126488, "epoch": 3011} {"train_loss": -6.69905424118042, "global_step": 126489, "epoch": 3011} {"train_loss": -6.51086950302124, "global_step": 126490, "epoch": 3011} {"train_loss": -6.595056533813477, "global_step": 126491, "epoch": 3011} {"train_loss": -6.544522762298584, "global_step": 126492, "epoch": 3011} {"train_loss": -6.575107097625732, "global_step": 126493, "epoch": 3011} {"train_loss": -6.511435508728027, "global_step": 126494, "epoch": 3011} {"train_loss": -6.589929580688477, "global_step": 126495, "epoch": 3011} {"train_loss": -6.536500453948975, "global_step": 126496, "epoch": 3011} {"train_loss": -6.5874128341674805, "global_step": 126497, "epoch": 3011} {"train_loss": -6.538968086242676, "global_step": 126498, "epoch": 3011} {"train_loss": -6.545909881591797, "global_step": 126499, "epoch": 3011} {"train_loss": -6.596617698669434, "global_step": 126500, "epoch": 3011} {"train_loss": -6.625619411468506, "global_step": 126501, "epoch": 3011} {"train_loss": -6.605363368988037, "global_step": 126502, "epoch": 3011} {"train_loss": -6.6059231871650335, "global_step": 126503, "epoch": 3011, "val_loss": 68055.3046875} {"train_loss": -6.590787410736084, "global_step": 126504, "epoch": 3012} {"train_loss": -6.530247688293457, "global_step": 126505, "epoch": 3012} {"train_loss": -6.521945476531982, "global_step": 126506, "epoch": 3012} {"train_loss": -6.60151481628418, "global_step": 126507, "epoch": 3012} {"train_loss": -6.52008056640625, "global_step": 126508, "epoch": 3012} {"train_loss": -6.620905876159668, "global_step": 126509, "epoch": 3012} {"train_loss": -6.593009948730469, "global_step": 126510, "epoch": 3012} {"train_loss": -6.475122451782227, "global_step": 126511, "epoch": 3012} {"train_loss": -6.615665912628174, "global_step": 126512, "epoch": 3012} {"train_loss": -6.597038269042969, "global_step": 126513, "epoch": 3012} {"train_loss": -6.609836578369141, "global_step": 126514, "epoch": 3012} {"train_loss": -6.529080390930176, "global_step": 126515, "epoch": 3012} {"train_loss": -6.57624626159668, "global_step": 126516, "epoch": 3012} {"train_loss": -6.6110429763793945, "global_step": 126517, "epoch": 3012} {"train_loss": -6.516663074493408, "global_step": 126518, "epoch": 3012} {"train_loss": -6.5702805519104, "global_step": 126519, "epoch": 3012} {"train_loss": -6.60447359085083, "global_step": 126520, "epoch": 3012} {"train_loss": -6.563004016876221, "global_step": 126521, "epoch": 3012} {"train_loss": -6.590484142303467, "global_step": 126522, "epoch": 3012} {"train_loss": -6.607255935668945, "global_step": 126523, "epoch": 3012} {"train_loss": -6.675622940063477, "global_step": 126524, "epoch": 3012} {"train_loss": -6.720024585723877, "global_step": 126525, "epoch": 3012} {"train_loss": -6.6430864334106445, "global_step": 126526, "epoch": 3012} {"train_loss": -6.689810752868652, "global_step": 126527, "epoch": 3012} {"train_loss": -6.5823869705200195, "global_step": 126528, "epoch": 3012} {"train_loss": -6.586089134216309, "global_step": 126529, "epoch": 3012} {"train_loss": -6.581772804260254, "global_step": 126530, "epoch": 3012} {"train_loss": -6.723962783813477, "global_step": 126531, "epoch": 3012} {"train_loss": -6.669795513153076, "global_step": 126532, "epoch": 3012} {"train_loss": -6.5903120040893555, "global_step": 126533, "epoch": 3012} {"train_loss": -6.706395149230957, "global_step": 126534, "epoch": 3012} {"train_loss": -6.711036682128906, "global_step": 126535, "epoch": 3012} {"train_loss": -6.588840484619141, "global_step": 126536, "epoch": 3012} {"train_loss": -6.586972236633301, "global_step": 126537, "epoch": 3012} {"train_loss": -6.563753604888916, "global_step": 126538, "epoch": 3012} {"train_loss": -6.672521114349365, "global_step": 126539, "epoch": 3012} {"train_loss": -6.613751411437988, "global_step": 126540, "epoch": 3012} {"train_loss": -6.659882545471191, "global_step": 126541, "epoch": 3012} {"train_loss": -6.651188850402832, "global_step": 126542, "epoch": 3012} {"train_loss": -6.746543884277344, "global_step": 126543, "epoch": 3012} {"train_loss": -6.703421592712402, "global_step": 126544, "epoch": 3012} {"train_loss": -6.613884619304112, "global_step": 126545, "epoch": 3012, "val_loss": 68016.484375} {"train_loss": -6.694925308227539, "global_step": 126546, "epoch": 3013} {"train_loss": -6.601056098937988, "global_step": 126547, "epoch": 3013} {"train_loss": -6.504796028137207, "global_step": 126548, "epoch": 3013} {"train_loss": -6.622506141662598, "global_step": 126549, "epoch": 3013} {"train_loss": -6.755037307739258, "global_step": 126550, "epoch": 3013} {"train_loss": -6.656964302062988, "global_step": 126551, "epoch": 3013} {"train_loss": -6.542768478393555, "global_step": 126552, "epoch": 3013} {"train_loss": -6.644891262054443, "global_step": 126553, "epoch": 3013} {"train_loss": -6.607583999633789, "global_step": 126554, "epoch": 3013} {"train_loss": -6.560464382171631, "global_step": 126555, "epoch": 3013} {"train_loss": -6.678249359130859, "global_step": 126556, "epoch": 3013} {"train_loss": -6.633727073669434, "global_step": 126557, "epoch": 3013} {"train_loss": -6.5981645584106445, "global_step": 126558, "epoch": 3013} {"train_loss": -6.573633193969727, "global_step": 126559, "epoch": 3013} {"train_loss": -6.622649192810059, "global_step": 126560, "epoch": 3013} {"train_loss": -6.566461086273193, "global_step": 126561, "epoch": 3013} {"train_loss": -6.634922981262207, "global_step": 126562, "epoch": 3013} {"train_loss": -6.671778678894043, "global_step": 126563, "epoch": 3013} {"train_loss": -6.468104839324951, "global_step": 126564, "epoch": 3013} {"train_loss": -6.629311561584473, "global_step": 126565, "epoch": 3013} {"train_loss": -6.566440582275391, "global_step": 126566, "epoch": 3013} {"train_loss": -6.474977493286133, "global_step": 126567, "epoch": 3013} {"train_loss": -6.487922668457031, "global_step": 126568, "epoch": 3013} {"train_loss": -6.471676826477051, "global_step": 126569, "epoch": 3013} {"train_loss": -6.655263423919678, "global_step": 126570, "epoch": 3013} {"train_loss": -6.471862316131592, "global_step": 126571, "epoch": 3013} {"train_loss": -6.501321792602539, "global_step": 126572, "epoch": 3013} {"train_loss": -6.603439807891846, "global_step": 126573, "epoch": 3013} {"train_loss": -6.507406711578369, "global_step": 126574, "epoch": 3013} {"train_loss": -6.631197452545166, "global_step": 126575, "epoch": 3013} {"train_loss": -6.461844444274902, "global_step": 126576, "epoch": 3013} {"train_loss": -6.631139278411865, "global_step": 126577, "epoch": 3013} {"train_loss": -6.489236831665039, "global_step": 126578, "epoch": 3013} {"train_loss": -6.662191390991211, "global_step": 126579, "epoch": 3013} {"train_loss": -6.600574493408203, "global_step": 126580, "epoch": 3013} {"train_loss": -6.530906677246094, "global_step": 126581, "epoch": 3013} {"train_loss": -6.617722034454346, "global_step": 126582, "epoch": 3013} {"train_loss": -6.54378604888916, "global_step": 126583, "epoch": 3013} {"train_loss": -6.504936695098877, "global_step": 126584, "epoch": 3013} {"train_loss": -6.654680252075195, "global_step": 126585, "epoch": 3013} {"train_loss": -6.658417224884033, "global_step": 126586, "epoch": 3013} {"train_loss": -6.5823641050429575, "global_step": 126587, "epoch": 3013, "val_loss": 68325.984375} {"train_loss": -6.528249740600586, "global_step": 126588, "epoch": 3014} {"train_loss": -6.621123313903809, "global_step": 126589, "epoch": 3014} {"train_loss": -6.528267860412598, "global_step": 126590, "epoch": 3014} {"train_loss": -6.5923662185668945, "global_step": 126591, "epoch": 3014} {"train_loss": -6.650579452514648, "global_step": 126592, "epoch": 3014} {"train_loss": -6.6400251388549805, "global_step": 126593, "epoch": 3014} {"train_loss": -6.623241424560547, "global_step": 126594, "epoch": 3014} {"train_loss": -6.727420806884766, "global_step": 126595, "epoch": 3014} {"train_loss": -6.679681301116943, "global_step": 126596, "epoch": 3014} {"train_loss": -6.4704999923706055, "global_step": 126597, "epoch": 3014} {"train_loss": -6.591860771179199, "global_step": 126598, "epoch": 3014} {"train_loss": -6.6768412590026855, "global_step": 126599, "epoch": 3014} {"train_loss": -6.644505977630615, "global_step": 126600, "epoch": 3014} {"train_loss": -6.619592666625977, "global_step": 126601, "epoch": 3014} {"train_loss": -6.629763126373291, "global_step": 126602, "epoch": 3014} {"train_loss": -6.5587615966796875, "global_step": 126603, "epoch": 3014} {"train_loss": -6.478633403778076, "global_step": 126604, "epoch": 3014} {"train_loss": -6.419862747192383, "global_step": 126605, "epoch": 3014} {"train_loss": -6.573200225830078, "global_step": 126606, "epoch": 3014} {"train_loss": -6.651943206787109, "global_step": 126607, "epoch": 3014} {"train_loss": -6.65047550201416, "global_step": 126608, "epoch": 3014} {"train_loss": -6.526752948760986, "global_step": 126609, "epoch": 3014} {"train_loss": -6.580503940582275, "global_step": 126610, "epoch": 3014} {"train_loss": -6.681478500366211, "global_step": 126611, "epoch": 3014} {"train_loss": -6.563511848449707, "global_step": 126612, "epoch": 3014} {"train_loss": -6.54754638671875, "global_step": 126613, "epoch": 3014} {"train_loss": -6.630816459655762, "global_step": 126614, "epoch": 3014} {"train_loss": -6.581628322601318, "global_step": 126615, "epoch": 3014} {"train_loss": -6.644468307495117, "global_step": 126616, "epoch": 3014} {"train_loss": -6.648268699645996, "global_step": 126617, "epoch": 3014} {"train_loss": -6.6791486740112305, "global_step": 126618, "epoch": 3014} {"train_loss": -6.56287145614624, "global_step": 126619, "epoch": 3014} {"train_loss": -6.599030017852783, "global_step": 126620, "epoch": 3014} {"train_loss": -6.519649505615234, "global_step": 126621, "epoch": 3014} {"train_loss": -6.600342750549316, "global_step": 126622, "epoch": 3014} {"train_loss": -6.508582592010498, "global_step": 126623, "epoch": 3014} {"train_loss": -6.541754722595215, "global_step": 126624, "epoch": 3014} {"train_loss": -6.545875549316406, "global_step": 126625, "epoch": 3014} {"train_loss": -6.540428161621094, "global_step": 126626, "epoch": 3014} {"train_loss": -6.618727207183838, "global_step": 126627, "epoch": 3014} {"train_loss": -6.733858585357666, "global_step": 126628, "epoch": 3014} {"train_loss": -6.593086776279268, "global_step": 126629, "epoch": 3014, "val_loss": 68105.8984375} {"train_loss": -6.6100687980651855, "global_step": 126630, "epoch": 3015} {"train_loss": -6.692331790924072, "global_step": 126631, "epoch": 3015} {"train_loss": -6.598654747009277, "global_step": 126632, "epoch": 3015} {"train_loss": -6.476810455322266, "global_step": 126633, "epoch": 3015} {"train_loss": -6.543551921844482, "global_step": 126634, "epoch": 3015} {"train_loss": -6.642418384552002, "global_step": 126635, "epoch": 3015} {"train_loss": -6.628992557525635, "global_step": 126636, "epoch": 3015} {"train_loss": -6.651256561279297, "global_step": 126637, "epoch": 3015} {"train_loss": -6.661787986755371, "global_step": 126638, "epoch": 3015} {"train_loss": -6.524260520935059, "global_step": 126639, "epoch": 3015} {"train_loss": -6.595743179321289, "global_step": 126640, "epoch": 3015} {"train_loss": -6.5948686599731445, "global_step": 126641, "epoch": 3015} {"train_loss": -6.515264511108398, "global_step": 126642, "epoch": 3015} {"train_loss": -6.65213680267334, "global_step": 126643, "epoch": 3015} {"train_loss": -6.583786964416504, "global_step": 126644, "epoch": 3015} {"train_loss": -6.564122200012207, "global_step": 126645, "epoch": 3015} {"train_loss": -6.582597732543945, "global_step": 126646, "epoch": 3015} {"train_loss": -6.607801914215088, "global_step": 126647, "epoch": 3015} {"train_loss": -6.634824752807617, "global_step": 126648, "epoch": 3015} {"train_loss": -6.516663551330566, "global_step": 126649, "epoch": 3015} {"train_loss": -6.580947399139404, "global_step": 126650, "epoch": 3015} {"train_loss": -6.602792739868164, "global_step": 126651, "epoch": 3015} {"train_loss": -6.547318458557129, "global_step": 126652, "epoch": 3015} {"train_loss": -6.560853004455566, "global_step": 126653, "epoch": 3015} {"train_loss": -6.723267078399658, "global_step": 126654, "epoch": 3015} {"train_loss": -6.708286285400391, "global_step": 126655, "epoch": 3015} {"train_loss": -6.436526775360107, "global_step": 126656, "epoch": 3015} {"train_loss": -6.642154693603516, "global_step": 126657, "epoch": 3015} {"train_loss": -6.602365493774414, "global_step": 126658, "epoch": 3015} {"train_loss": -6.647719860076904, "global_step": 126659, "epoch": 3015} {"train_loss": -6.566839218139648, "global_step": 126660, "epoch": 3015} {"train_loss": -6.479668617248535, "global_step": 126661, "epoch": 3015} {"train_loss": -6.5794453620910645, "global_step": 126662, "epoch": 3015} {"train_loss": -6.613759517669678, "global_step": 126663, "epoch": 3015} {"train_loss": -6.540395736694336, "global_step": 126664, "epoch": 3015} {"train_loss": -6.453502655029297, "global_step": 126665, "epoch": 3015} {"train_loss": -6.492127895355225, "global_step": 126666, "epoch": 3015} {"train_loss": -6.514954566955566, "global_step": 126667, "epoch": 3015} {"train_loss": -6.544558525085449, "global_step": 126668, "epoch": 3015} {"train_loss": -6.524302005767822, "global_step": 126669, "epoch": 3015} {"train_loss": -6.579225540161133, "global_step": 126670, "epoch": 3015} {"train_loss": -6.58091614359901, "global_step": 126671, "epoch": 3015, "val_loss": 68064.6484375} {"train_loss": -6.476702690124512, "global_step": 126672, "epoch": 3016} {"train_loss": -6.579610347747803, "global_step": 126673, "epoch": 3016} {"train_loss": -6.547740936279297, "global_step": 126674, "epoch": 3016} {"train_loss": -6.590940952301025, "global_step": 126675, "epoch": 3016} {"train_loss": -6.65116548538208, "global_step": 126676, "epoch": 3016} {"train_loss": -6.48362398147583, "global_step": 126677, "epoch": 3016} {"train_loss": -6.597552299499512, "global_step": 126678, "epoch": 3016} {"train_loss": -6.655710220336914, "global_step": 126679, "epoch": 3016} {"train_loss": -6.512789726257324, "global_step": 126680, "epoch": 3016} {"train_loss": -6.584748268127441, "global_step": 126681, "epoch": 3016} {"train_loss": -6.448712348937988, "global_step": 126682, "epoch": 3016} {"train_loss": -6.688657760620117, "global_step": 126683, "epoch": 3016} {"train_loss": -6.556963920593262, "global_step": 126684, "epoch": 3016} {"train_loss": -6.7434306144714355, "global_step": 126685, "epoch": 3016} {"train_loss": -6.703984260559082, "global_step": 126686, "epoch": 3016} {"train_loss": -6.678533554077148, "global_step": 126687, "epoch": 3016} {"train_loss": -6.558021545410156, "global_step": 126688, "epoch": 3016} {"train_loss": -6.724815368652344, "global_step": 126689, "epoch": 3016} {"train_loss": -6.626635551452637, "global_step": 126690, "epoch": 3016} {"train_loss": -6.54476261138916, "global_step": 126691, "epoch": 3016} {"train_loss": -6.51668643951416, "global_step": 126692, "epoch": 3016} {"train_loss": -6.520630836486816, "global_step": 126693, "epoch": 3016} {"train_loss": -6.724452018737793, "global_step": 126694, "epoch": 3016} {"train_loss": -6.625069618225098, "global_step": 126695, "epoch": 3016} {"train_loss": -6.6329545974731445, "global_step": 126696, "epoch": 3016} {"train_loss": -6.589166641235352, "global_step": 126697, "epoch": 3016} {"train_loss": -6.6516008377075195, "global_step": 126698, "epoch": 3016} {"train_loss": -6.570687294006348, "global_step": 126699, "epoch": 3016} {"train_loss": -6.7005391120910645, "global_step": 126700, "epoch": 3016} {"train_loss": -6.669170379638672, "global_step": 126701, "epoch": 3016} {"train_loss": -6.537100791931152, "global_step": 126702, "epoch": 3016} {"train_loss": -6.633866310119629, "global_step": 126703, "epoch": 3016} {"train_loss": -6.564761638641357, "global_step": 126704, "epoch": 3016} {"train_loss": -6.657299995422363, "global_step": 126705, "epoch": 3016} {"train_loss": -6.638151168823242, "global_step": 126706, "epoch": 3016} {"train_loss": -6.650725364685059, "global_step": 126707, "epoch": 3016} {"train_loss": -6.554956912994385, "global_step": 126708, "epoch": 3016} {"train_loss": -6.697615146636963, "global_step": 126709, "epoch": 3016} {"train_loss": -6.6953020095825195, "global_step": 126710, "epoch": 3016} {"train_loss": -6.545047760009766, "global_step": 126711, "epoch": 3016} {"train_loss": -6.539549827575684, "global_step": 126712, "epoch": 3016} {"train_loss": -6.607590084984189, "global_step": 126713, "epoch": 3016, "val_loss": 68011.015625} {"train_loss": -6.606716156005859, "global_step": 126714, "epoch": 3017} {"train_loss": -6.6093034744262695, "global_step": 126715, "epoch": 3017} {"train_loss": -6.557755947113037, "global_step": 126716, "epoch": 3017} {"train_loss": -6.664461612701416, "global_step": 126717, "epoch": 3017} {"train_loss": -6.579891204833984, "global_step": 126718, "epoch": 3017} {"train_loss": -6.7146759033203125, "global_step": 126719, "epoch": 3017} {"train_loss": -6.672919273376465, "global_step": 126720, "epoch": 3017} {"train_loss": -6.575565338134766, "global_step": 126721, "epoch": 3017} {"train_loss": -6.63505220413208, "global_step": 126722, "epoch": 3017} {"train_loss": -6.467944145202637, "global_step": 126723, "epoch": 3017} {"train_loss": -6.683088302612305, "global_step": 126724, "epoch": 3017} {"train_loss": -6.621189594268799, "global_step": 126725, "epoch": 3017} {"train_loss": -6.509951114654541, "global_step": 126726, "epoch": 3017} {"train_loss": -6.76243782043457, "global_step": 126727, "epoch": 3017} {"train_loss": -6.573534965515137, "global_step": 126728, "epoch": 3017} {"train_loss": -6.680057525634766, "global_step": 126729, "epoch": 3017} {"train_loss": -6.566158294677734, "global_step": 126730, "epoch": 3017} {"train_loss": -6.603130340576172, "global_step": 126731, "epoch": 3017} {"train_loss": -6.617833137512207, "global_step": 126732, "epoch": 3017} {"train_loss": -6.645754814147949, "global_step": 126733, "epoch": 3017} {"train_loss": -6.666138648986816, "global_step": 126734, "epoch": 3017} {"train_loss": -6.628824710845947, "global_step": 126735, "epoch": 3017} {"train_loss": -6.621980667114258, "global_step": 126736, "epoch": 3017} {"train_loss": -6.64332389831543, "global_step": 126737, "epoch": 3017} {"train_loss": -6.646643161773682, "global_step": 126738, "epoch": 3017} {"train_loss": -6.523175239562988, "global_step": 126739, "epoch": 3017} {"train_loss": -6.564505577087402, "global_step": 126740, "epoch": 3017} {"train_loss": -6.655751705169678, "global_step": 126741, "epoch": 3017} {"train_loss": -6.5006561279296875, "global_step": 126742, "epoch": 3017} {"train_loss": -6.753834247589111, "global_step": 126743, "epoch": 3017} {"train_loss": -6.599786281585693, "global_step": 126744, "epoch": 3017} {"train_loss": -6.510270595550537, "global_step": 126745, "epoch": 3017} {"train_loss": -6.507053375244141, "global_step": 126746, "epoch": 3017} {"train_loss": -6.558784484863281, "global_step": 126747, "epoch": 3017} {"train_loss": -6.592170715332031, "global_step": 126748, "epoch": 3017} {"train_loss": -6.499810218811035, "global_step": 126749, "epoch": 3017} {"train_loss": -6.480879783630371, "global_step": 126750, "epoch": 3017} {"train_loss": -6.5848469734191895, "global_step": 126751, "epoch": 3017} {"train_loss": -6.535037994384766, "global_step": 126752, "epoch": 3017} {"train_loss": -6.7881999015808105, "global_step": 126753, "epoch": 3017} {"train_loss": -6.618167877197266, "global_step": 126754, "epoch": 3017} {"train_loss": -6.605199234826224, "global_step": 126755, "epoch": 3017, "val_loss": 68166.4609375} {"train_loss": -6.639308929443359, "global_step": 126756, "epoch": 3018} {"train_loss": -6.633473873138428, "global_step": 126757, "epoch": 3018} {"train_loss": -6.598337650299072, "global_step": 126758, "epoch": 3018} {"train_loss": -6.603999614715576, "global_step": 126759, "epoch": 3018} {"train_loss": -6.623927593231201, "global_step": 126760, "epoch": 3018} {"train_loss": -6.648000717163086, "global_step": 126761, "epoch": 3018} {"train_loss": -6.598288059234619, "global_step": 126762, "epoch": 3018} {"train_loss": -6.5884809494018555, "global_step": 126763, "epoch": 3018} {"train_loss": -6.6077470779418945, "global_step": 126764, "epoch": 3018} {"train_loss": -6.642967224121094, "global_step": 126765, "epoch": 3018} {"train_loss": -6.656412124633789, "global_step": 126766, "epoch": 3018} {"train_loss": -6.678378582000732, "global_step": 126767, "epoch": 3018} {"train_loss": -6.59443473815918, "global_step": 126768, "epoch": 3018} {"train_loss": -6.5434160232543945, "global_step": 126769, "epoch": 3018} {"train_loss": -6.735754013061523, "global_step": 126770, "epoch": 3018} {"train_loss": -6.769798278808594, "global_step": 126771, "epoch": 3018} {"train_loss": -6.623705863952637, "global_step": 126772, "epoch": 3018} {"train_loss": -6.68866491317749, "global_step": 126773, "epoch": 3018} {"train_loss": -6.680367946624756, "global_step": 126774, "epoch": 3018} {"train_loss": -6.54556941986084, "global_step": 126775, "epoch": 3018} {"train_loss": -6.624421119689941, "global_step": 126776, "epoch": 3018} {"train_loss": -6.648437023162842, "global_step": 126777, "epoch": 3018} {"train_loss": -6.736872673034668, "global_step": 126778, "epoch": 3018} {"train_loss": -6.62269401550293, "global_step": 126779, "epoch": 3018} {"train_loss": -6.692288398742676, "global_step": 126780, "epoch": 3018} {"train_loss": -6.672449111938477, "global_step": 126781, "epoch": 3018} {"train_loss": -6.7541375160217285, "global_step": 126782, "epoch": 3018} {"train_loss": -6.715897083282471, "global_step": 126783, "epoch": 3018} {"train_loss": -6.557228088378906, "global_step": 126784, "epoch": 3018} {"train_loss": -6.530607223510742, "global_step": 126785, "epoch": 3018} {"train_loss": -6.582206726074219, "global_step": 126786, "epoch": 3018} {"train_loss": -6.716709136962891, "global_step": 126787, "epoch": 3018} {"train_loss": -6.710133075714111, "global_step": 126788, "epoch": 3018} {"train_loss": -6.600726127624512, "global_step": 126789, "epoch": 3018} {"train_loss": -6.661978244781494, "global_step": 126790, "epoch": 3018} {"train_loss": -6.612829685211182, "global_step": 126791, "epoch": 3018} {"train_loss": -6.59619140625, "global_step": 126792, "epoch": 3018} {"train_loss": -6.656278133392334, "global_step": 126793, "epoch": 3018} {"train_loss": -6.5976409912109375, "global_step": 126794, "epoch": 3018} {"train_loss": -6.551990509033203, "global_step": 126795, "epoch": 3018} {"train_loss": -6.546710014343262, "global_step": 126796, "epoch": 3018} {"train_loss": -6.6345091206686835, "global_step": 126797, "epoch": 3018, "val_loss": 68062.1171875} {"train_loss": -6.574814796447754, "global_step": 126798, "epoch": 3019} {"train_loss": -6.644368648529053, "global_step": 126799, "epoch": 3019} {"train_loss": -6.654019355773926, "global_step": 126800, "epoch": 3019} {"train_loss": -6.768197059631348, "global_step": 126801, "epoch": 3019} {"train_loss": -6.5942277908325195, "global_step": 126802, "epoch": 3019} {"train_loss": -6.565445899963379, "global_step": 126803, "epoch": 3019} {"train_loss": -6.522033214569092, "global_step": 126804, "epoch": 3019} {"train_loss": -6.596663475036621, "global_step": 126805, "epoch": 3019} {"train_loss": -6.687280178070068, "global_step": 126806, "epoch": 3019} {"train_loss": -6.698639869689941, "global_step": 126807, "epoch": 3019} {"train_loss": -6.636070251464844, "global_step": 126808, "epoch": 3019} {"train_loss": -6.67562198638916, "global_step": 126809, "epoch": 3019} {"train_loss": -6.567706108093262, "global_step": 126810, "epoch": 3019} {"train_loss": -6.646664619445801, "global_step": 126811, "epoch": 3019} {"train_loss": -6.496099948883057, "global_step": 126812, "epoch": 3019} {"train_loss": -6.580324172973633, "global_step": 126813, "epoch": 3019} {"train_loss": -6.718811988830566, "global_step": 126814, "epoch": 3019} {"train_loss": -6.571865081787109, "global_step": 126815, "epoch": 3019} {"train_loss": -6.541391849517822, "global_step": 126816, "epoch": 3019} {"train_loss": -6.5452728271484375, "global_step": 126817, "epoch": 3019} {"train_loss": -6.557245254516602, "global_step": 126818, "epoch": 3019} {"train_loss": -6.520801544189453, "global_step": 126819, "epoch": 3019} {"train_loss": -6.562961578369141, "global_step": 126820, "epoch": 3019} {"train_loss": -6.49469518661499, "global_step": 126821, "epoch": 3019} {"train_loss": -6.488195419311523, "global_step": 126822, "epoch": 3019} {"train_loss": -6.463380336761475, "global_step": 126823, "epoch": 3019} {"train_loss": -6.5563530921936035, "global_step": 126824, "epoch": 3019} {"train_loss": -6.547975540161133, "global_step": 126825, "epoch": 3019} {"train_loss": -6.59706449508667, "global_step": 126826, "epoch": 3019} {"train_loss": -6.662522315979004, "global_step": 126827, "epoch": 3019} {"train_loss": -6.4975786209106445, "global_step": 126828, "epoch": 3019} {"train_loss": -6.612150192260742, "global_step": 126829, "epoch": 3019} {"train_loss": -6.570223331451416, "global_step": 126830, "epoch": 3019} {"train_loss": -6.540199279785156, "global_step": 126831, "epoch": 3019} {"train_loss": -6.391934871673584, "global_step": 126832, "epoch": 3019} {"train_loss": -6.539455413818359, "global_step": 126833, "epoch": 3019} {"train_loss": -6.553162574768066, "global_step": 126834, "epoch": 3019} {"train_loss": -6.657861709594727, "global_step": 126835, "epoch": 3019} {"train_loss": -6.597137451171875, "global_step": 126836, "epoch": 3019} {"train_loss": -6.442523002624512, "global_step": 126837, "epoch": 3019} {"train_loss": -6.596750259399414, "global_step": 126838, "epoch": 3019} {"train_loss": -6.5758833431062245, "global_step": 126839, "epoch": 3019, "val_loss": 67880.7421875} {"train_loss": -6.580505847930908, "global_step": 126840, "epoch": 3020} {"train_loss": -6.620044708251953, "global_step": 126841, "epoch": 3020} {"train_loss": -6.520078659057617, "global_step": 126842, "epoch": 3020} {"train_loss": -6.535403251647949, "global_step": 126843, "epoch": 3020} {"train_loss": -6.682192325592041, "global_step": 126844, "epoch": 3020} {"train_loss": -6.510561466217041, "global_step": 126845, "epoch": 3020} {"train_loss": -6.64437198638916, "global_step": 126846, "epoch": 3020} {"train_loss": -6.625523090362549, "global_step": 126847, "epoch": 3020} {"train_loss": -6.48301887512207, "global_step": 126848, "epoch": 3020} {"train_loss": -6.659866809844971, "global_step": 126849, "epoch": 3020} {"train_loss": -6.550693511962891, "global_step": 126850, "epoch": 3020} {"train_loss": -6.5566511154174805, "global_step": 126851, "epoch": 3020} {"train_loss": -6.6875081062316895, "global_step": 126852, "epoch": 3020} {"train_loss": -6.537300109863281, "global_step": 126853, "epoch": 3020} {"train_loss": -6.458818435668945, "global_step": 126854, "epoch": 3020} {"train_loss": -6.645570755004883, "global_step": 126855, "epoch": 3020} {"train_loss": -6.616574287414551, "global_step": 126856, "epoch": 3020} {"train_loss": -6.473210334777832, "global_step": 126857, "epoch": 3020} {"train_loss": -6.4991841316223145, "global_step": 126858, "epoch": 3020} {"train_loss": -6.626134872436523, "global_step": 126859, "epoch": 3020} {"train_loss": -6.588854789733887, "global_step": 126860, "epoch": 3020} {"train_loss": -6.563746452331543, "global_step": 126861, "epoch": 3020} {"train_loss": -6.618272304534912, "global_step": 126862, "epoch": 3020} {"train_loss": -6.517356872558594, "global_step": 126863, "epoch": 3020} {"train_loss": -6.603785037994385, "global_step": 126864, "epoch": 3020} {"train_loss": -6.58849573135376, "global_step": 126865, "epoch": 3020} {"train_loss": -6.573982238769531, "global_step": 126866, "epoch": 3020} {"train_loss": -6.603598594665527, "global_step": 126867, "epoch": 3020} {"train_loss": -6.645050048828125, "global_step": 126868, "epoch": 3020} {"train_loss": -6.626877784729004, "global_step": 126869, "epoch": 3020} {"train_loss": -6.607832908630371, "global_step": 126870, "epoch": 3020} {"train_loss": -6.541097164154053, "global_step": 126871, "epoch": 3020} {"train_loss": -6.524601459503174, "global_step": 126872, "epoch": 3020} {"train_loss": -6.5815300941467285, "global_step": 126873, "epoch": 3020} {"train_loss": -6.5501909255981445, "global_step": 126874, "epoch": 3020} {"train_loss": -6.56934928894043, "global_step": 126875, "epoch": 3020} {"train_loss": -6.520383834838867, "global_step": 126876, "epoch": 3020} {"train_loss": -6.592498779296875, "global_step": 126877, "epoch": 3020} {"train_loss": -6.610836029052734, "global_step": 126878, "epoch": 3020} {"train_loss": -6.605999946594238, "global_step": 126879, "epoch": 3020} {"train_loss": -6.596290111541748, "global_step": 126880, "epoch": 3020} {"train_loss": -6.579132806687128, "global_step": 126881, "epoch": 3020, "val_loss": 68032.6796875} {"train_loss": -6.624179840087891, "global_step": 126882, "epoch": 3021} {"train_loss": -6.555413246154785, "global_step": 126883, "epoch": 3021} {"train_loss": -6.623863697052002, "global_step": 126884, "epoch": 3021} {"train_loss": -6.54216194152832, "global_step": 126885, "epoch": 3021} {"train_loss": -6.542412757873535, "global_step": 126886, "epoch": 3021} {"train_loss": -6.631472587585449, "global_step": 126887, "epoch": 3021} {"train_loss": -6.549726486206055, "global_step": 126888, "epoch": 3021} {"train_loss": -6.592894077301025, "global_step": 126889, "epoch": 3021} {"train_loss": -6.623743057250977, "global_step": 126890, "epoch": 3021} {"train_loss": -6.6022539138793945, "global_step": 126891, "epoch": 3021} {"train_loss": -6.608513355255127, "global_step": 126892, "epoch": 3021} {"train_loss": -6.605041980743408, "global_step": 126893, "epoch": 3021} {"train_loss": -6.635892391204834, "global_step": 126894, "epoch": 3021} {"train_loss": -6.614828586578369, "global_step": 126895, "epoch": 3021} {"train_loss": -6.593267440795898, "global_step": 126896, "epoch": 3021} {"train_loss": -6.5374345779418945, "global_step": 126897, "epoch": 3021} {"train_loss": -6.648209571838379, "global_step": 126898, "epoch": 3021} {"train_loss": -6.639368534088135, "global_step": 126899, "epoch": 3021} {"train_loss": -6.60001277923584, "global_step": 126900, "epoch": 3021} {"train_loss": -6.672061920166016, "global_step": 126901, "epoch": 3021} {"train_loss": -6.654534816741943, "global_step": 126902, "epoch": 3021} {"train_loss": -6.632097244262695, "global_step": 126903, "epoch": 3021} {"train_loss": -6.61152458190918, "global_step": 126904, "epoch": 3021} {"train_loss": -6.520852565765381, "global_step": 126905, "epoch": 3021} {"train_loss": -6.60374641418457, "global_step": 126906, "epoch": 3021} {"train_loss": -6.58518123626709, "global_step": 126907, "epoch": 3021} {"train_loss": -6.588695526123047, "global_step": 126908, "epoch": 3021} {"train_loss": -6.591608047485352, "global_step": 126909, "epoch": 3021} {"train_loss": -6.527716636657715, "global_step": 126910, "epoch": 3021} {"train_loss": -6.664294719696045, "global_step": 126911, "epoch": 3021} {"train_loss": -6.645593166351318, "global_step": 126912, "epoch": 3021} {"train_loss": -6.468658447265625, "global_step": 126913, "epoch": 3021} {"train_loss": -6.682106018066406, "global_step": 126914, "epoch": 3021} {"train_loss": -6.621502876281738, "global_step": 126915, "epoch": 3021} {"train_loss": -6.6681718826293945, "global_step": 126916, "epoch": 3021} {"train_loss": -6.621757507324219, "global_step": 126917, "epoch": 3021} {"train_loss": -6.663399696350098, "global_step": 126918, "epoch": 3021} {"train_loss": -6.67290735244751, "global_step": 126919, "epoch": 3021} {"train_loss": -6.631916046142578, "global_step": 126920, "epoch": 3021} {"train_loss": -6.546971321105957, "global_step": 126921, "epoch": 3021} {"train_loss": -6.531878471374512, "global_step": 126922, "epoch": 3021} {"train_loss": -6.602551903043475, "global_step": 126923, "epoch": 3021, "val_loss": 68134.7578125} {"train_loss": -6.686391830444336, "global_step": 126924, "epoch": 3022} {"train_loss": -6.637872695922852, "global_step": 126925, "epoch": 3022} {"train_loss": -6.673125743865967, "global_step": 126926, "epoch": 3022} {"train_loss": -6.726734638214111, "global_step": 126927, "epoch": 3022} {"train_loss": -6.531693935394287, "global_step": 126928, "epoch": 3022} {"train_loss": -6.679050445556641, "global_step": 126929, "epoch": 3022} {"train_loss": -6.58126163482666, "global_step": 126930, "epoch": 3022} {"train_loss": -6.629724025726318, "global_step": 126931, "epoch": 3022} {"train_loss": -6.545503616333008, "global_step": 126932, "epoch": 3022} {"train_loss": -6.687748432159424, "global_step": 126933, "epoch": 3022} {"train_loss": -6.653866767883301, "global_step": 126934, "epoch": 3022} {"train_loss": -6.640639781951904, "global_step": 126935, "epoch": 3022} {"train_loss": -6.6452436447143555, "global_step": 126936, "epoch": 3022} {"train_loss": -6.720303058624268, "global_step": 126937, "epoch": 3022} {"train_loss": -6.621090412139893, "global_step": 126938, "epoch": 3022} {"train_loss": -6.68720006942749, "global_step": 126939, "epoch": 3022} {"train_loss": -6.6114959716796875, "global_step": 126940, "epoch": 3022} {"train_loss": -6.536866188049316, "global_step": 126941, "epoch": 3022} {"train_loss": -6.690718650817871, "global_step": 126942, "epoch": 3022} {"train_loss": -6.61453104019165, "global_step": 126943, "epoch": 3022} {"train_loss": -6.622068405151367, "global_step": 126944, "epoch": 3022} {"train_loss": -6.63138484954834, "global_step": 126945, "epoch": 3022} {"train_loss": -6.473141670227051, "global_step": 126946, "epoch": 3022} {"train_loss": -6.622673988342285, "global_step": 126947, "epoch": 3022} {"train_loss": -6.695451736450195, "global_step": 126948, "epoch": 3022} {"train_loss": -6.544356822967529, "global_step": 126949, "epoch": 3022} {"train_loss": -6.588258743286133, "global_step": 126950, "epoch": 3022} {"train_loss": -6.760556221008301, "global_step": 126951, "epoch": 3022} {"train_loss": -6.626813888549805, "global_step": 126952, "epoch": 3022} {"train_loss": -6.579952239990234, "global_step": 126953, "epoch": 3022} {"train_loss": -6.562581539154053, "global_step": 126954, "epoch": 3022} {"train_loss": -6.634670734405518, "global_step": 126955, "epoch": 3022} {"train_loss": -6.467002868652344, "global_step": 126956, "epoch": 3022} {"train_loss": -6.5905303955078125, "global_step": 126957, "epoch": 3022} {"train_loss": -6.526389122009277, "global_step": 126958, "epoch": 3022} {"train_loss": -6.624063968658447, "global_step": 126959, "epoch": 3022} {"train_loss": -6.488360404968262, "global_step": 126960, "epoch": 3022} {"train_loss": -6.4197916984558105, "global_step": 126961, "epoch": 3022} {"train_loss": -6.533185005187988, "global_step": 126962, "epoch": 3022} {"train_loss": -6.463546276092529, "global_step": 126963, "epoch": 3022} {"train_loss": -6.368353843688965, "global_step": 126964, "epoch": 3022} {"train_loss": -6.597568375723703, "global_step": 126965, "epoch": 3022, "val_loss": 68749.3125} {"train_loss": -6.224298477172852, "global_step": 126966, "epoch": 3023} {"train_loss": -6.597962379455566, "global_step": 126967, "epoch": 3023} {"train_loss": -6.37237548828125, "global_step": 126968, "epoch": 3023} {"train_loss": -6.385568618774414, "global_step": 126969, "epoch": 3023} {"train_loss": -6.383364200592041, "global_step": 126970, "epoch": 3023} {"train_loss": -6.420494079589844, "global_step": 126971, "epoch": 3023} {"train_loss": -6.415643692016602, "global_step": 126972, "epoch": 3023} {"train_loss": -6.428577423095703, "global_step": 126973, "epoch": 3023} {"train_loss": -6.517300128936768, "global_step": 126974, "epoch": 3023} {"train_loss": -6.499246597290039, "global_step": 126975, "epoch": 3023} {"train_loss": -6.5076398849487305, "global_step": 126976, "epoch": 3023} {"train_loss": -6.591167449951172, "global_step": 126977, "epoch": 3023} {"train_loss": -6.4686174392700195, "global_step": 126978, "epoch": 3023} {"train_loss": -6.442191123962402, "global_step": 126979, "epoch": 3023} {"train_loss": -6.4684977531433105, "global_step": 126980, "epoch": 3023} {"train_loss": -6.639204978942871, "global_step": 126981, "epoch": 3023} {"train_loss": -6.5928754806518555, "global_step": 126982, "epoch": 3023} {"train_loss": -6.476950645446777, "global_step": 126983, "epoch": 3023} {"train_loss": -6.548045635223389, "global_step": 126984, "epoch": 3023} {"train_loss": -6.601853370666504, "global_step": 126985, "epoch": 3023} {"train_loss": -6.614858627319336, "global_step": 126986, "epoch": 3023} {"train_loss": -6.547998905181885, "global_step": 126987, "epoch": 3023} {"train_loss": -6.526336669921875, "global_step": 126988, "epoch": 3023} {"train_loss": -6.448558330535889, "global_step": 126989, "epoch": 3023} {"train_loss": -6.498002052307129, "global_step": 126990, "epoch": 3023} {"train_loss": -6.48476505279541, "global_step": 126991, "epoch": 3023} {"train_loss": -6.42624044418335, "global_step": 126992, "epoch": 3023} {"train_loss": -6.567570686340332, "global_step": 126993, "epoch": 3023} {"train_loss": -6.539434432983398, "global_step": 126994, "epoch": 3023} {"train_loss": -6.572309494018555, "global_step": 126995, "epoch": 3023} {"train_loss": -6.532293319702148, "global_step": 126996, "epoch": 3023} {"train_loss": -6.6649370193481445, "global_step": 126997, "epoch": 3023} {"train_loss": -6.563401222229004, "global_step": 126998, "epoch": 3023} {"train_loss": -6.581930160522461, "global_step": 126999, "epoch": 3023} {"train_loss": -6.636112213134766, "global_step": 127000, "epoch": 3023} {"train_loss": -6.551026344299316, "global_step": 127001, "epoch": 3023} {"train_loss": -6.601187705993652, "global_step": 127002, "epoch": 3023} {"train_loss": -6.54455041885376, "global_step": 127003, "epoch": 3023} {"train_loss": -6.573936462402344, "global_step": 127004, "epoch": 3023} {"train_loss": -6.6673688888549805, "global_step": 127005, "epoch": 3023} {"train_loss": -6.57452392578125, "global_step": 127006, "epoch": 3023} {"train_loss": -6.523220811571393, "global_step": 127007, "epoch": 3023, "val_loss": 68107.5859375} {"train_loss": -6.540380477905273, "global_step": 127008, "epoch": 3024} {"train_loss": -6.703405857086182, "global_step": 127009, "epoch": 3024} {"train_loss": -6.677080154418945, "global_step": 127010, "epoch": 3024} {"train_loss": -6.602729320526123, "global_step": 127011, "epoch": 3024} {"train_loss": -6.656974792480469, "global_step": 127012, "epoch": 3024} {"train_loss": -6.601827621459961, "global_step": 127013, "epoch": 3024} {"train_loss": -6.577559947967529, "global_step": 127014, "epoch": 3024} {"train_loss": -6.647623062133789, "global_step": 127015, "epoch": 3024} {"train_loss": -6.596116065979004, "global_step": 127016, "epoch": 3024} {"train_loss": -6.66732120513916, "global_step": 127017, "epoch": 3024} {"train_loss": -6.568969249725342, "global_step": 127018, "epoch": 3024} {"train_loss": -6.630161285400391, "global_step": 127019, "epoch": 3024} {"train_loss": -6.662346839904785, "global_step": 127020, "epoch": 3024} {"train_loss": -6.5594072341918945, "global_step": 127021, "epoch": 3024} {"train_loss": -6.450932502746582, "global_step": 127022, "epoch": 3024} {"train_loss": -6.563167095184326, "global_step": 127023, "epoch": 3024} {"train_loss": -6.590814590454102, "global_step": 127024, "epoch": 3024} {"train_loss": -6.497788906097412, "global_step": 127025, "epoch": 3024} {"train_loss": -6.651558876037598, "global_step": 127026, "epoch": 3024} {"train_loss": -6.577816009521484, "global_step": 127027, "epoch": 3024} {"train_loss": -6.643122673034668, "global_step": 127028, "epoch": 3024} {"train_loss": -6.666913986206055, "global_step": 127029, "epoch": 3024} {"train_loss": -6.480476379394531, "global_step": 127030, "epoch": 3024} {"train_loss": -6.672067165374756, "global_step": 127031, "epoch": 3024} {"train_loss": -6.581409454345703, "global_step": 127032, "epoch": 3024} {"train_loss": -6.625908851623535, "global_step": 127033, "epoch": 3024} {"train_loss": -6.704196453094482, "global_step": 127034, "epoch": 3024} {"train_loss": -6.6217474937438965, "global_step": 127035, "epoch": 3024} {"train_loss": -6.604905128479004, "global_step": 127036, "epoch": 3024} {"train_loss": -6.7117695808410645, "global_step": 127037, "epoch": 3024} {"train_loss": -6.721841812133789, "global_step": 127038, "epoch": 3024} {"train_loss": -6.699643135070801, "global_step": 127039, "epoch": 3024} {"train_loss": -6.583592414855957, "global_step": 127040, "epoch": 3024} {"train_loss": -6.425026893615723, "global_step": 127041, "epoch": 3024} {"train_loss": -6.574182510375977, "global_step": 127042, "epoch": 3024} {"train_loss": -6.638753890991211, "global_step": 127043, "epoch": 3024} {"train_loss": -6.624749660491943, "global_step": 127044, "epoch": 3024} {"train_loss": -6.646883010864258, "global_step": 127045, "epoch": 3024} {"train_loss": -6.660980224609375, "global_step": 127046, "epoch": 3024} {"train_loss": -6.699071407318115, "global_step": 127047, "epoch": 3024} {"train_loss": -6.725381374359131, "global_step": 127048, "epoch": 3024} {"train_loss": -6.6168953237079435, "global_step": 127049, "epoch": 3024, "val_loss": 68110.8828125} {"train_loss": -6.553221702575684, "global_step": 127050, "epoch": 3025} {"train_loss": -6.530860424041748, "global_step": 127051, "epoch": 3025} {"train_loss": -6.668269157409668, "global_step": 127052, "epoch": 3025} {"train_loss": -6.634308338165283, "global_step": 127053, "epoch": 3025} {"train_loss": -6.736067771911621, "global_step": 127054, "epoch": 3025} {"train_loss": -6.699594497680664, "global_step": 127055, "epoch": 3025} {"train_loss": -6.522998809814453, "global_step": 127056, "epoch": 3025} {"train_loss": -6.703020095825195, "global_step": 127057, "epoch": 3025} {"train_loss": -6.598999977111816, "global_step": 127058, "epoch": 3025} {"train_loss": -6.506752967834473, "global_step": 127059, "epoch": 3025} {"train_loss": -6.610106468200684, "global_step": 127060, "epoch": 3025} {"train_loss": -6.630549430847168, "global_step": 127061, "epoch": 3025} {"train_loss": -6.528080463409424, "global_step": 127062, "epoch": 3025} {"train_loss": -6.583940505981445, "global_step": 127063, "epoch": 3025} {"train_loss": -6.629668235778809, "global_step": 127064, "epoch": 3025} {"train_loss": -6.697603225708008, "global_step": 127065, "epoch": 3025} {"train_loss": -6.712904930114746, "global_step": 127066, "epoch": 3025} {"train_loss": -6.658475399017334, "global_step": 127067, "epoch": 3025} {"train_loss": -6.607536792755127, "global_step": 127068, "epoch": 3025} {"train_loss": -6.773063659667969, "global_step": 127069, "epoch": 3025} {"train_loss": -6.555669784545898, "global_step": 127070, "epoch": 3025} {"train_loss": -6.621399402618408, "global_step": 127071, "epoch": 3025} {"train_loss": -6.546701431274414, "global_step": 127072, "epoch": 3025} {"train_loss": -6.56500244140625, "global_step": 127073, "epoch": 3025} {"train_loss": -6.672676086425781, "global_step": 127074, "epoch": 3025} {"train_loss": -6.514856338500977, "global_step": 127075, "epoch": 3025} {"train_loss": -6.6160478591918945, "global_step": 127076, "epoch": 3025} {"train_loss": -6.62359619140625, "global_step": 127077, "epoch": 3025} {"train_loss": -6.550931453704834, "global_step": 127078, "epoch": 3025} {"train_loss": -6.621992111206055, "global_step": 127079, "epoch": 3025} {"train_loss": -6.665124893188477, "global_step": 127080, "epoch": 3025} {"train_loss": -6.6230573654174805, "global_step": 127081, "epoch": 3025} {"train_loss": -6.639918327331543, "global_step": 127082, "epoch": 3025} {"train_loss": -6.5575690269470215, "global_step": 127083, "epoch": 3025} {"train_loss": -6.631059646606445, "global_step": 127084, "epoch": 3025} {"train_loss": -6.572806358337402, "global_step": 127085, "epoch": 3025} {"train_loss": -6.573774337768555, "global_step": 127086, "epoch": 3025} {"train_loss": -6.559404373168945, "global_step": 127087, "epoch": 3025} {"train_loss": -6.667169570922852, "global_step": 127088, "epoch": 3025} {"train_loss": -6.526878833770752, "global_step": 127089, "epoch": 3025} {"train_loss": -6.615975379943848, "global_step": 127090, "epoch": 3025} {"train_loss": -6.610171431586856, "global_step": 127091, "epoch": 3025, "val_loss": 68061.984375} {"train_loss": -6.652699947357178, "global_step": 127092, "epoch": 3026} {"train_loss": -6.756043434143066, "global_step": 127093, "epoch": 3026} {"train_loss": -6.584125518798828, "global_step": 127094, "epoch": 3026} {"train_loss": -6.599592208862305, "global_step": 127095, "epoch": 3026} {"train_loss": -6.735477447509766, "global_step": 127096, "epoch": 3026} {"train_loss": -6.612309455871582, "global_step": 127097, "epoch": 3026} {"train_loss": -6.615209102630615, "global_step": 127098, "epoch": 3026} {"train_loss": -6.667196750640869, "global_step": 127099, "epoch": 3026} {"train_loss": -6.611663341522217, "global_step": 127100, "epoch": 3026} {"train_loss": -6.70011568069458, "global_step": 127101, "epoch": 3026} {"train_loss": -6.503384590148926, "global_step": 127102, "epoch": 3026} {"train_loss": -6.621979236602783, "global_step": 127103, "epoch": 3026} {"train_loss": -6.622987270355225, "global_step": 127104, "epoch": 3026} {"train_loss": -6.617410659790039, "global_step": 127105, "epoch": 3026} {"train_loss": -6.628054618835449, "global_step": 127106, "epoch": 3026} {"train_loss": -6.685841083526611, "global_step": 127107, "epoch": 3026} {"train_loss": -6.6377668380737305, "global_step": 127108, "epoch": 3026} {"train_loss": -6.673095226287842, "global_step": 127109, "epoch": 3026} {"train_loss": -6.761721611022949, "global_step": 127110, "epoch": 3026} {"train_loss": -6.612678527832031, "global_step": 127111, "epoch": 3026} {"train_loss": -6.579820156097412, "global_step": 127112, "epoch": 3026} {"train_loss": -6.603252410888672, "global_step": 127113, "epoch": 3026} {"train_loss": -6.664331436157227, "global_step": 127114, "epoch": 3026} {"train_loss": -6.623829364776611, "global_step": 127115, "epoch": 3026} {"train_loss": -6.596933364868164, "global_step": 127116, "epoch": 3026} {"train_loss": -6.6177568435668945, "global_step": 127117, "epoch": 3026} {"train_loss": -6.397841453552246, "global_step": 127118, "epoch": 3026} {"train_loss": -6.544600486755371, "global_step": 127119, "epoch": 3026} {"train_loss": -6.528902053833008, "global_step": 127120, "epoch": 3026} {"train_loss": -6.468183517456055, "global_step": 127121, "epoch": 3026} {"train_loss": -6.611472129821777, "global_step": 127122, "epoch": 3026} {"train_loss": -6.6391777992248535, "global_step": 127123, "epoch": 3026} {"train_loss": -6.6274333000183105, "global_step": 127124, "epoch": 3026} {"train_loss": -6.602055549621582, "global_step": 127125, "epoch": 3026} {"train_loss": -6.594496726989746, "global_step": 127126, "epoch": 3026} {"train_loss": -6.528141021728516, "global_step": 127127, "epoch": 3026} {"train_loss": -6.641002655029297, "global_step": 127128, "epoch": 3026} {"train_loss": -6.592947483062744, "global_step": 127129, "epoch": 3026} {"train_loss": -6.6372857093811035, "global_step": 127130, "epoch": 3026} {"train_loss": -6.555902481079102, "global_step": 127131, "epoch": 3026} {"train_loss": -6.585758209228516, "global_step": 127132, "epoch": 3026} {"train_loss": -6.613861049924578, "global_step": 127133, "epoch": 3026, "val_loss": 68263.609375} {"train_loss": -6.585089206695557, "global_step": 127134, "epoch": 3027} {"train_loss": -6.636403560638428, "global_step": 127135, "epoch": 3027} {"train_loss": -6.506985664367676, "global_step": 127136, "epoch": 3027} {"train_loss": -6.559467315673828, "global_step": 127137, "epoch": 3027} {"train_loss": -6.5525383949279785, "global_step": 127138, "epoch": 3027} {"train_loss": -6.6027631759643555, "global_step": 127139, "epoch": 3027} {"train_loss": -6.46420955657959, "global_step": 127140, "epoch": 3027} {"train_loss": -6.583595275878906, "global_step": 127141, "epoch": 3027} {"train_loss": -6.595632553100586, "global_step": 127142, "epoch": 3027} {"train_loss": -6.622467041015625, "global_step": 127143, "epoch": 3027} {"train_loss": -6.732496738433838, "global_step": 127144, "epoch": 3027} {"train_loss": -6.551393985748291, "global_step": 127145, "epoch": 3027} {"train_loss": -6.611527442932129, "global_step": 127146, "epoch": 3027} {"train_loss": -6.5951080322265625, "global_step": 127147, "epoch": 3027} {"train_loss": -6.637840270996094, "global_step": 127148, "epoch": 3027} {"train_loss": -6.678905963897705, "global_step": 127149, "epoch": 3027} {"train_loss": -6.605922222137451, "global_step": 127150, "epoch": 3027} {"train_loss": -6.558392524719238, "global_step": 127151, "epoch": 3027} {"train_loss": -6.655308246612549, "global_step": 127152, "epoch": 3027} {"train_loss": -6.757848739624023, "global_step": 127153, "epoch": 3027} {"train_loss": -6.5260515213012695, "global_step": 127154, "epoch": 3027} {"train_loss": -6.698945045471191, "global_step": 127155, "epoch": 3027} {"train_loss": -6.693890571594238, "global_step": 127156, "epoch": 3027} {"train_loss": -6.511622428894043, "global_step": 127157, "epoch": 3027} {"train_loss": -6.558754920959473, "global_step": 127158, "epoch": 3027} {"train_loss": -6.742292404174805, "global_step": 127159, "epoch": 3027} {"train_loss": -6.574975490570068, "global_step": 127160, "epoch": 3027} {"train_loss": -6.6654839515686035, "global_step": 127161, "epoch": 3027} {"train_loss": -6.526041507720947, "global_step": 127162, "epoch": 3027} {"train_loss": -6.599495887756348, "global_step": 127163, "epoch": 3027} {"train_loss": -6.647510528564453, "global_step": 127164, "epoch": 3027} {"train_loss": -6.602665901184082, "global_step": 127165, "epoch": 3027} {"train_loss": -6.504809856414795, "global_step": 127166, "epoch": 3027} {"train_loss": -6.5260844230651855, "global_step": 127167, "epoch": 3027} {"train_loss": -6.559837341308594, "global_step": 127168, "epoch": 3027} {"train_loss": -6.508378982543945, "global_step": 127169, "epoch": 3027} {"train_loss": -6.48455810546875, "global_step": 127170, "epoch": 3027} {"train_loss": -6.507011413574219, "global_step": 127171, "epoch": 3027} {"train_loss": -6.571961402893066, "global_step": 127172, "epoch": 3027} {"train_loss": -6.669961929321289, "global_step": 127173, "epoch": 3027} {"train_loss": -6.569545745849609, "global_step": 127174, "epoch": 3027} {"train_loss": -6.5921801044827415, "global_step": 127175, "epoch": 3027, "val_loss": 68082.75} {"train_loss": -6.662718772888184, "global_step": 127176, "epoch": 3028} {"train_loss": -6.551377296447754, "global_step": 127177, "epoch": 3028} {"train_loss": -6.672650337219238, "global_step": 127178, "epoch": 3028} {"train_loss": -6.696101188659668, "global_step": 127179, "epoch": 3028} {"train_loss": -6.5657758712768555, "global_step": 127180, "epoch": 3028} {"train_loss": -6.63957405090332, "global_step": 127181, "epoch": 3028} {"train_loss": -6.622618675231934, "global_step": 127182, "epoch": 3028} {"train_loss": -6.8060784339904785, "global_step": 127183, "epoch": 3028} {"train_loss": -6.505925178527832, "global_step": 127184, "epoch": 3028} {"train_loss": -6.68384313583374, "global_step": 127185, "epoch": 3028} {"train_loss": -6.540383338928223, "global_step": 127186, "epoch": 3028} {"train_loss": -6.600254535675049, "global_step": 127187, "epoch": 3028} {"train_loss": -6.640616416931152, "global_step": 127188, "epoch": 3028} {"train_loss": -6.462596893310547, "global_step": 127189, "epoch": 3028} {"train_loss": -6.513438701629639, "global_step": 127190, "epoch": 3028} {"train_loss": -6.5751166343688965, "global_step": 127191, "epoch": 3028} {"train_loss": -6.613086223602295, "global_step": 127192, "epoch": 3028} {"train_loss": -6.575766086578369, "global_step": 127193, "epoch": 3028} {"train_loss": -6.551189422607422, "global_step": 127194, "epoch": 3028} {"train_loss": -6.564431667327881, "global_step": 127195, "epoch": 3028} {"train_loss": -6.640379905700684, "global_step": 127196, "epoch": 3028} {"train_loss": -6.612466812133789, "global_step": 127197, "epoch": 3028} {"train_loss": -6.473818778991699, "global_step": 127198, "epoch": 3028} {"train_loss": -6.759017467498779, "global_step": 127199, "epoch": 3028} {"train_loss": -6.710488319396973, "global_step": 127200, "epoch": 3028} {"train_loss": -6.522903919219971, "global_step": 127201, "epoch": 3028} {"train_loss": -6.579898834228516, "global_step": 127202, "epoch": 3028} {"train_loss": -6.638355255126953, "global_step": 127203, "epoch": 3028} {"train_loss": -6.6720290184021, "global_step": 127204, "epoch": 3028} {"train_loss": -6.528800010681152, "global_step": 127205, "epoch": 3028} {"train_loss": -6.742969989776611, "global_step": 127206, "epoch": 3028} {"train_loss": -6.595077037811279, "global_step": 127207, "epoch": 3028} {"train_loss": -6.656863212585449, "global_step": 127208, "epoch": 3028} {"train_loss": -6.56715726852417, "global_step": 127209, "epoch": 3028} {"train_loss": -6.643402099609375, "global_step": 127210, "epoch": 3028} {"train_loss": -6.523646354675293, "global_step": 127211, "epoch": 3028} {"train_loss": -6.583010673522949, "global_step": 127212, "epoch": 3028} {"train_loss": -6.652268409729004, "global_step": 127213, "epoch": 3028} {"train_loss": -6.548861026763916, "global_step": 127214, "epoch": 3028} {"train_loss": -6.5729265213012695, "global_step": 127215, "epoch": 3028} {"train_loss": -6.562952995300293, "global_step": 127216, "epoch": 3028} {"train_loss": -6.604841232299805, "global_step": 127217, "epoch": 3028, "val_loss": 68034.8125} {"train_loss": -6.679853439331055, "global_step": 127218, "epoch": 3029} {"train_loss": -6.645431041717529, "global_step": 127219, "epoch": 3029} {"train_loss": -6.65596866607666, "global_step": 127220, "epoch": 3029} {"train_loss": -6.763674259185791, "global_step": 127221, "epoch": 3029} {"train_loss": -6.662306308746338, "global_step": 127222, "epoch": 3029} {"train_loss": -6.639540195465088, "global_step": 127223, "epoch": 3029} {"train_loss": -6.64004373550415, "global_step": 127224, "epoch": 3029} {"train_loss": -6.527098178863525, "global_step": 127225, "epoch": 3029} {"train_loss": -6.587105751037598, "global_step": 127226, "epoch": 3029} {"train_loss": -6.5739240646362305, "global_step": 127227, "epoch": 3029} {"train_loss": -6.669198036193848, "global_step": 127228, "epoch": 3029} {"train_loss": -6.600461006164551, "global_step": 127229, "epoch": 3029} {"train_loss": -6.593258857727051, "global_step": 127230, "epoch": 3029} {"train_loss": -6.682645797729492, "global_step": 127231, "epoch": 3029} {"train_loss": -6.644517421722412, "global_step": 127232, "epoch": 3029} {"train_loss": -6.703653335571289, "global_step": 127233, "epoch": 3029} {"train_loss": -6.491518974304199, "global_step": 127234, "epoch": 3029} {"train_loss": -6.507781028747559, "global_step": 127235, "epoch": 3029} {"train_loss": -6.72601318359375, "global_step": 127236, "epoch": 3029} {"train_loss": -6.667006969451904, "global_step": 127237, "epoch": 3029} {"train_loss": -6.637210845947266, "global_step": 127238, "epoch": 3029} {"train_loss": -6.6523261070251465, "global_step": 127239, "epoch": 3029} {"train_loss": -6.675131797790527, "global_step": 127240, "epoch": 3029} {"train_loss": -6.650051116943359, "global_step": 127241, "epoch": 3029} {"train_loss": -6.633975982666016, "global_step": 127242, "epoch": 3029} {"train_loss": -6.605844497680664, "global_step": 127243, "epoch": 3029} {"train_loss": -6.722080230712891, "global_step": 127244, "epoch": 3029} {"train_loss": -6.630171775817871, "global_step": 127245, "epoch": 3029} {"train_loss": -6.649738311767578, "global_step": 127246, "epoch": 3029} {"train_loss": -6.7248992919921875, "global_step": 127247, "epoch": 3029} {"train_loss": -6.682740211486816, "global_step": 127248, "epoch": 3029} {"train_loss": -6.706541061401367, "global_step": 127249, "epoch": 3029} {"train_loss": -6.712455749511719, "global_step": 127250, "epoch": 3029} {"train_loss": -6.777678489685059, "global_step": 127251, "epoch": 3029} {"train_loss": -6.624934673309326, "global_step": 127252, "epoch": 3029} {"train_loss": -6.623493194580078, "global_step": 127253, "epoch": 3029} {"train_loss": -6.677291393280029, "global_step": 127254, "epoch": 3029} {"train_loss": -6.584689140319824, "global_step": 127255, "epoch": 3029} {"train_loss": -6.672579765319824, "global_step": 127256, "epoch": 3029} {"train_loss": -6.615487098693848, "global_step": 127257, "epoch": 3029} {"train_loss": -6.488262176513672, "global_step": 127258, "epoch": 3029} {"train_loss": -6.644506704239618, "global_step": 127259, "epoch": 3029, "val_loss": 68259.6640625} {"train_loss": -6.709212303161621, "global_step": 127260, "epoch": 3030} {"train_loss": -6.4341349601745605, "global_step": 127261, "epoch": 3030} {"train_loss": -6.788841247558594, "global_step": 127262, "epoch": 3030} {"train_loss": -6.585175514221191, "global_step": 127263, "epoch": 3030} {"train_loss": -6.504769802093506, "global_step": 127264, "epoch": 3030} {"train_loss": -6.712538719177246, "global_step": 127265, "epoch": 3030} {"train_loss": -6.701285362243652, "global_step": 127266, "epoch": 3030} {"train_loss": -6.694746971130371, "global_step": 127267, "epoch": 3030} {"train_loss": -6.525996208190918, "global_step": 127268, "epoch": 3030} {"train_loss": -6.546820640563965, "global_step": 127269, "epoch": 3030} {"train_loss": -6.464272499084473, "global_step": 127270, "epoch": 3030} {"train_loss": -6.448611259460449, "global_step": 127271, "epoch": 3030} {"train_loss": -6.620884418487549, "global_step": 127272, "epoch": 3030} {"train_loss": -6.483254432678223, "global_step": 127273, "epoch": 3030} {"train_loss": -6.463894844055176, "global_step": 127274, "epoch": 3030} {"train_loss": -6.692009925842285, "global_step": 127275, "epoch": 3030} {"train_loss": -6.659082889556885, "global_step": 127276, "epoch": 3030} {"train_loss": -6.587996959686279, "global_step": 127277, "epoch": 3030} {"train_loss": -6.600951194763184, "global_step": 127278, "epoch": 3030} {"train_loss": -6.498564720153809, "global_step": 127279, "epoch": 3030} {"train_loss": -6.5631279945373535, "global_step": 127280, "epoch": 3030} {"train_loss": -6.354755401611328, "global_step": 127281, "epoch": 3030} {"train_loss": -6.556807518005371, "global_step": 127282, "epoch": 3030} {"train_loss": -6.556812763214111, "global_step": 127283, "epoch": 3030} {"train_loss": -6.597367763519287, "global_step": 127284, "epoch": 3030} {"train_loss": -6.637124061584473, "global_step": 127285, "epoch": 3030} {"train_loss": -6.483323574066162, "global_step": 127286, "epoch": 3030} {"train_loss": -6.551319122314453, "global_step": 127287, "epoch": 3030} {"train_loss": -6.4413652420043945, "global_step": 127288, "epoch": 3030} {"train_loss": -6.604452133178711, "global_step": 127289, "epoch": 3030} {"train_loss": -6.522985458374023, "global_step": 127290, "epoch": 3030} {"train_loss": -6.46277379989624, "global_step": 127291, "epoch": 3030} {"train_loss": -6.626309394836426, "global_step": 127292, "epoch": 3030} {"train_loss": -6.43499231338501, "global_step": 127293, "epoch": 3030} {"train_loss": -6.493259906768799, "global_step": 127294, "epoch": 3030} {"train_loss": -6.490929126739502, "global_step": 127295, "epoch": 3030} {"train_loss": -6.509474754333496, "global_step": 127296, "epoch": 3030} {"train_loss": -6.538117408752441, "global_step": 127297, "epoch": 3030} {"train_loss": -6.531657695770264, "global_step": 127298, "epoch": 3030} {"train_loss": -6.672317981719971, "global_step": 127299, "epoch": 3030} {"train_loss": -6.563738822937012, "global_step": 127300, "epoch": 3030} {"train_loss": -6.558407715388706, "global_step": 127301, "epoch": 3030, "val_loss": 68100.703125} {"train_loss": -6.568703651428223, "global_step": 127302, "epoch": 3031} {"train_loss": -6.4981231689453125, "global_step": 127303, "epoch": 3031} {"train_loss": -6.544027805328369, "global_step": 127304, "epoch": 3031} {"train_loss": -6.423209190368652, "global_step": 127305, "epoch": 3031} {"train_loss": -6.610346794128418, "global_step": 127306, "epoch": 3031} {"train_loss": -6.496675968170166, "global_step": 127307, "epoch": 3031} {"train_loss": -6.525005340576172, "global_step": 127308, "epoch": 3031} {"train_loss": -6.420514106750488, "global_step": 127309, "epoch": 3031} {"train_loss": -6.660357475280762, "global_step": 127310, "epoch": 3031} {"train_loss": -6.480186939239502, "global_step": 127311, "epoch": 3031} {"train_loss": -6.614690780639648, "global_step": 127312, "epoch": 3031} {"train_loss": -6.607245445251465, "global_step": 127313, "epoch": 3031} {"train_loss": -6.520791053771973, "global_step": 127314, "epoch": 3031} {"train_loss": -6.624457359313965, "global_step": 127315, "epoch": 3031} {"train_loss": -6.704163551330566, "global_step": 127316, "epoch": 3031} {"train_loss": -6.590747833251953, "global_step": 127317, "epoch": 3031} {"train_loss": -6.482539176940918, "global_step": 127318, "epoch": 3031} {"train_loss": -6.533247947692871, "global_step": 127319, "epoch": 3031} {"train_loss": -6.385663986206055, "global_step": 127320, "epoch": 3031} {"train_loss": -6.550705432891846, "global_step": 127321, "epoch": 3031} {"train_loss": -6.553907871246338, "global_step": 127322, "epoch": 3031} {"train_loss": -6.51807165145874, "global_step": 127323, "epoch": 3031} {"train_loss": -6.632288932800293, "global_step": 127324, "epoch": 3031} {"train_loss": -6.531332015991211, "global_step": 127325, "epoch": 3031} {"train_loss": -6.55643367767334, "global_step": 127326, "epoch": 3031} {"train_loss": -6.5886125564575195, "global_step": 127327, "epoch": 3031} {"train_loss": -6.544696807861328, "global_step": 127328, "epoch": 3031} {"train_loss": -6.648284912109375, "global_step": 127329, "epoch": 3031} {"train_loss": -6.477124214172363, "global_step": 127330, "epoch": 3031} {"train_loss": -6.590142726898193, "global_step": 127331, "epoch": 3031} {"train_loss": -6.574724197387695, "global_step": 127332, "epoch": 3031} {"train_loss": -6.601673126220703, "global_step": 127333, "epoch": 3031} {"train_loss": -6.505166530609131, "global_step": 127334, "epoch": 3031} {"train_loss": -6.674617767333984, "global_step": 127335, "epoch": 3031} {"train_loss": -6.65080451965332, "global_step": 127336, "epoch": 3031} {"train_loss": -6.501370429992676, "global_step": 127337, "epoch": 3031} {"train_loss": -6.671490669250488, "global_step": 127338, "epoch": 3031} {"train_loss": -6.473939895629883, "global_step": 127339, "epoch": 3031} {"train_loss": -6.5547637939453125, "global_step": 127340, "epoch": 3031} {"train_loss": -6.582769393920898, "global_step": 127341, "epoch": 3031} {"train_loss": -6.518837928771973, "global_step": 127342, "epoch": 3031} {"train_loss": -6.555983168738229, "global_step": 127343, "epoch": 3031, "val_loss": 68169.890625} {"train_loss": -6.60771369934082, "global_step": 127344, "epoch": 3032} {"train_loss": -6.636639595031738, "global_step": 127345, "epoch": 3032} {"train_loss": -6.6842041015625, "global_step": 127346, "epoch": 3032} {"train_loss": -6.535245895385742, "global_step": 127347, "epoch": 3032} {"train_loss": -6.647930145263672, "global_step": 127348, "epoch": 3032} {"train_loss": -6.678873062133789, "global_step": 127349, "epoch": 3032} {"train_loss": -6.73333740234375, "global_step": 127350, "epoch": 3032} {"train_loss": -6.425420761108398, "global_step": 127351, "epoch": 3032} {"train_loss": -6.6447834968566895, "global_step": 127352, "epoch": 3032} {"train_loss": -6.681563854217529, "global_step": 127353, "epoch": 3032} {"train_loss": -6.617110252380371, "global_step": 127354, "epoch": 3032} {"train_loss": -6.570765972137451, "global_step": 127355, "epoch": 3032} {"train_loss": -6.665360450744629, "global_step": 127356, "epoch": 3032} {"train_loss": -6.662539005279541, "global_step": 127357, "epoch": 3032} {"train_loss": -6.700745582580566, "global_step": 127358, "epoch": 3032} {"train_loss": -6.632734298706055, "global_step": 127359, "epoch": 3032} {"train_loss": -6.562073707580566, "global_step": 127360, "epoch": 3032} {"train_loss": -6.7123613357543945, "global_step": 127361, "epoch": 3032} {"train_loss": -6.652259826660156, "global_step": 127362, "epoch": 3032} {"train_loss": -6.486132621765137, "global_step": 127363, "epoch": 3032} {"train_loss": -6.6139373779296875, "global_step": 127364, "epoch": 3032} {"train_loss": -6.4516191482543945, "global_step": 127365, "epoch": 3032} {"train_loss": -6.541810989379883, "global_step": 127366, "epoch": 3032} {"train_loss": -6.576524257659912, "global_step": 127367, "epoch": 3032} {"train_loss": -6.450641632080078, "global_step": 127368, "epoch": 3032} {"train_loss": -6.58698844909668, "global_step": 127369, "epoch": 3032} {"train_loss": -6.719564437866211, "global_step": 127370, "epoch": 3032} {"train_loss": -6.5182671546936035, "global_step": 127371, "epoch": 3032} {"train_loss": -6.507179260253906, "global_step": 127372, "epoch": 3032} {"train_loss": -6.484321594238281, "global_step": 127373, "epoch": 3032} {"train_loss": -6.609373092651367, "global_step": 127374, "epoch": 3032} {"train_loss": -6.5620551109313965, "global_step": 127375, "epoch": 3032} {"train_loss": -6.542737007141113, "global_step": 127376, "epoch": 3032} {"train_loss": -6.5521016120910645, "global_step": 127377, "epoch": 3032} {"train_loss": -6.504294395446777, "global_step": 127378, "epoch": 3032} {"train_loss": -6.609630584716797, "global_step": 127379, "epoch": 3032} {"train_loss": -6.5051164627075195, "global_step": 127380, "epoch": 3032} {"train_loss": -6.57655143737793, "global_step": 127381, "epoch": 3032} {"train_loss": -6.571264266967773, "global_step": 127382, "epoch": 3032} {"train_loss": -6.553122520446777, "global_step": 127383, "epoch": 3032} {"train_loss": -6.500710487365723, "global_step": 127384, "epoch": 3032} {"train_loss": -6.585050480706351, "global_step": 127385, "epoch": 3032, "val_loss": 67995.015625} {"train_loss": -6.676628112792969, "global_step": 127386, "epoch": 3033} {"train_loss": -6.595386505126953, "global_step": 127387, "epoch": 3033} {"train_loss": -6.649941444396973, "global_step": 127388, "epoch": 3033} {"train_loss": -6.708152770996094, "global_step": 127389, "epoch": 3033} {"train_loss": -6.56929874420166, "global_step": 127390, "epoch": 3033} {"train_loss": -6.586920738220215, "global_step": 127391, "epoch": 3033} {"train_loss": -6.559688568115234, "global_step": 127392, "epoch": 3033} {"train_loss": -6.649543762207031, "global_step": 127393, "epoch": 3033} {"train_loss": -6.561023712158203, "global_step": 127394, "epoch": 3033} {"train_loss": -6.550189971923828, "global_step": 127395, "epoch": 3033} {"train_loss": -6.711977958679199, "global_step": 127396, "epoch": 3033} {"train_loss": -6.66440486907959, "global_step": 127397, "epoch": 3033} {"train_loss": -6.634518623352051, "global_step": 127398, "epoch": 3033} {"train_loss": -6.630350112915039, "global_step": 127399, "epoch": 3033} {"train_loss": -6.609631538391113, "global_step": 127400, "epoch": 3033} {"train_loss": -6.638675689697266, "global_step": 127401, "epoch": 3033} {"train_loss": -6.600688934326172, "global_step": 127402, "epoch": 3033} {"train_loss": -6.517982482910156, "global_step": 127403, "epoch": 3033} {"train_loss": -6.565810203552246, "global_step": 127404, "epoch": 3033} {"train_loss": -6.548127174377441, "global_step": 127405, "epoch": 3033} {"train_loss": -6.546651840209961, "global_step": 127406, "epoch": 3033} {"train_loss": -6.593393802642822, "global_step": 127407, "epoch": 3033} {"train_loss": -6.718355178833008, "global_step": 127408, "epoch": 3033} {"train_loss": -6.478954792022705, "global_step": 127409, "epoch": 3033} {"train_loss": -6.6386566162109375, "global_step": 127410, "epoch": 3033} {"train_loss": -6.501126289367676, "global_step": 127411, "epoch": 3033} {"train_loss": -6.567379951477051, "global_step": 127412, "epoch": 3033} {"train_loss": -6.386230945587158, "global_step": 127413, "epoch": 3033} {"train_loss": -6.635194301605225, "global_step": 127414, "epoch": 3033} {"train_loss": -6.4551191329956055, "global_step": 127415, "epoch": 3033} {"train_loss": -6.599085807800293, "global_step": 127416, "epoch": 3033} {"train_loss": -6.496286392211914, "global_step": 127417, "epoch": 3033} {"train_loss": -6.492755889892578, "global_step": 127418, "epoch": 3033} {"train_loss": -6.506642818450928, "global_step": 127419, "epoch": 3033} {"train_loss": -6.534172534942627, "global_step": 127420, "epoch": 3033} {"train_loss": -6.6399126052856445, "global_step": 127421, "epoch": 3033} {"train_loss": -6.587742805480957, "global_step": 127422, "epoch": 3033} {"train_loss": -6.47824239730835, "global_step": 127423, "epoch": 3033} {"train_loss": -6.513462543487549, "global_step": 127424, "epoch": 3033} {"train_loss": -6.4893083572387695, "global_step": 127425, "epoch": 3033} {"train_loss": -6.481663703918457, "global_step": 127426, "epoch": 3033} {"train_loss": -6.577167159035092, "global_step": 127427, "epoch": 3033, "val_loss": 67913.1796875} {"train_loss": -6.613722801208496, "global_step": 127428, "epoch": 3034} {"train_loss": -6.546613693237305, "global_step": 127429, "epoch": 3034} {"train_loss": -6.554572582244873, "global_step": 127430, "epoch": 3034} {"train_loss": -6.66387939453125, "global_step": 127431, "epoch": 3034} {"train_loss": -6.586589813232422, "global_step": 127432, "epoch": 3034} {"train_loss": -6.648369312286377, "global_step": 127433, "epoch": 3034} {"train_loss": -6.612870216369629, "global_step": 127434, "epoch": 3034} {"train_loss": -6.654668807983398, "global_step": 127435, "epoch": 3034} {"train_loss": -6.525492191314697, "global_step": 127436, "epoch": 3034} {"train_loss": -6.450155258178711, "global_step": 127437, "epoch": 3034} {"train_loss": -6.600776672363281, "global_step": 127438, "epoch": 3034} {"train_loss": -6.52664852142334, "global_step": 127439, "epoch": 3034} {"train_loss": -6.535531997680664, "global_step": 127440, "epoch": 3034} {"train_loss": -6.522646903991699, "global_step": 127441, "epoch": 3034} {"train_loss": -6.476500034332275, "global_step": 127442, "epoch": 3034} {"train_loss": -6.5579705238342285, "global_step": 127443, "epoch": 3034} {"train_loss": -6.627202033996582, "global_step": 127444, "epoch": 3034} {"train_loss": -6.600340843200684, "global_step": 127445, "epoch": 3034} {"train_loss": -6.663094520568848, "global_step": 127446, "epoch": 3034} {"train_loss": -6.524997234344482, "global_step": 127447, "epoch": 3034} {"train_loss": -6.668943405151367, "global_step": 127448, "epoch": 3034} {"train_loss": -6.549246311187744, "global_step": 127449, "epoch": 3034} {"train_loss": -6.4975690841674805, "global_step": 127450, "epoch": 3034} {"train_loss": -6.608419418334961, "global_step": 127451, "epoch": 3034} {"train_loss": -6.64309024810791, "global_step": 127452, "epoch": 3034} {"train_loss": -6.69498872756958, "global_step": 127453, "epoch": 3034} {"train_loss": -6.6213698387146, "global_step": 127454, "epoch": 3034} {"train_loss": -6.519536018371582, "global_step": 127455, "epoch": 3034} {"train_loss": -6.491089820861816, "global_step": 127456, "epoch": 3034} {"train_loss": -6.67063045501709, "global_step": 127457, "epoch": 3034} {"train_loss": -6.591987609863281, "global_step": 127458, "epoch": 3034} {"train_loss": -6.706284523010254, "global_step": 127459, "epoch": 3034} {"train_loss": -6.620429992675781, "global_step": 127460, "epoch": 3034} {"train_loss": -6.576796531677246, "global_step": 127461, "epoch": 3034} {"train_loss": -6.570594787597656, "global_step": 127462, "epoch": 3034} {"train_loss": -6.470941543579102, "global_step": 127463, "epoch": 3034} {"train_loss": -6.446732521057129, "global_step": 127464, "epoch": 3034} {"train_loss": -6.699040412902832, "global_step": 127465, "epoch": 3034} {"train_loss": -6.603135108947754, "global_step": 127466, "epoch": 3034} {"train_loss": -6.657410144805908, "global_step": 127467, "epoch": 3034} {"train_loss": -6.573225021362305, "global_step": 127468, "epoch": 3034} {"train_loss": -6.584886233011882, "global_step": 127469, "epoch": 3034, "val_loss": 68036.2578125} {"train_loss": -6.439367294311523, "global_step": 127470, "epoch": 3035} {"train_loss": -6.54437255859375, "global_step": 127471, "epoch": 3035} {"train_loss": -6.582453727722168, "global_step": 127472, "epoch": 3035} {"train_loss": -6.493123531341553, "global_step": 127473, "epoch": 3035} {"train_loss": -6.477198600769043, "global_step": 127474, "epoch": 3035} {"train_loss": -6.549979209899902, "global_step": 127475, "epoch": 3035} {"train_loss": -6.566978454589844, "global_step": 127476, "epoch": 3035} {"train_loss": -6.615076541900635, "global_step": 127477, "epoch": 3035} {"train_loss": -6.436441421508789, "global_step": 127478, "epoch": 3035} {"train_loss": -6.600954055786133, "global_step": 127479, "epoch": 3035} {"train_loss": -6.646306037902832, "global_step": 127480, "epoch": 3035} {"train_loss": -6.638400077819824, "global_step": 127481, "epoch": 3035} {"train_loss": -6.5702104568481445, "global_step": 127482, "epoch": 3035} {"train_loss": -6.525769233703613, "global_step": 127483, "epoch": 3035} {"train_loss": -6.642793655395508, "global_step": 127484, "epoch": 3035} {"train_loss": -6.623854637145996, "global_step": 127485, "epoch": 3035} {"train_loss": -6.667384624481201, "global_step": 127486, "epoch": 3035} {"train_loss": -6.599000930786133, "global_step": 127487, "epoch": 3035} {"train_loss": -6.6020989418029785, "global_step": 127488, "epoch": 3035} {"train_loss": -6.772675514221191, "global_step": 127489, "epoch": 3035} {"train_loss": -6.614192008972168, "global_step": 127490, "epoch": 3035} {"train_loss": -6.637568473815918, "global_step": 127491, "epoch": 3035} {"train_loss": -6.663363933563232, "global_step": 127492, "epoch": 3035} {"train_loss": -6.586658477783203, "global_step": 127493, "epoch": 3035} {"train_loss": -6.62490177154541, "global_step": 127494, "epoch": 3035} {"train_loss": -6.652065277099609, "global_step": 127495, "epoch": 3035} {"train_loss": -6.585031032562256, "global_step": 127496, "epoch": 3035} {"train_loss": -6.630248069763184, "global_step": 127497, "epoch": 3035} {"train_loss": -6.586867332458496, "global_step": 127498, "epoch": 3035} {"train_loss": -6.640629768371582, "global_step": 127499, "epoch": 3035} {"train_loss": -6.772050857543945, "global_step": 127500, "epoch": 3035} {"train_loss": -6.722290515899658, "global_step": 127501, "epoch": 3035} {"train_loss": -6.673030853271484, "global_step": 127502, "epoch": 3035} {"train_loss": -6.678891181945801, "global_step": 127503, "epoch": 3035} {"train_loss": -6.652060031890869, "global_step": 127504, "epoch": 3035} {"train_loss": -6.682871341705322, "global_step": 127505, "epoch": 3035} {"train_loss": -6.673892498016357, "global_step": 127506, "epoch": 3035} {"train_loss": -6.51353645324707, "global_step": 127507, "epoch": 3035} {"train_loss": -6.589809417724609, "global_step": 127508, "epoch": 3035} {"train_loss": -6.55000114440918, "global_step": 127509, "epoch": 3035} {"train_loss": -6.626377105712891, "global_step": 127510, "epoch": 3035} {"train_loss": -6.612379743939354, "global_step": 127511, "epoch": 3035, "val_loss": 68027.6328125} {"train_loss": -6.739124774932861, "global_step": 127512, "epoch": 3036} {"train_loss": -6.703137397766113, "global_step": 127513, "epoch": 3036} {"train_loss": -6.837535858154297, "global_step": 127514, "epoch": 3036} {"train_loss": -6.6318206787109375, "global_step": 127515, "epoch": 3036} {"train_loss": -6.600816249847412, "global_step": 127516, "epoch": 3036} {"train_loss": -6.640737533569336, "global_step": 127517, "epoch": 3036} {"train_loss": -6.737654685974121, "global_step": 127518, "epoch": 3036} {"train_loss": -6.650634288787842, "global_step": 127519, "epoch": 3036} {"train_loss": -6.599722385406494, "global_step": 127520, "epoch": 3036} {"train_loss": -6.581415176391602, "global_step": 127521, "epoch": 3036} {"train_loss": -6.637689590454102, "global_step": 127522, "epoch": 3036} {"train_loss": -6.671840190887451, "global_step": 127523, "epoch": 3036} {"train_loss": -6.636293888092041, "global_step": 127524, "epoch": 3036} {"train_loss": -6.660885334014893, "global_step": 127525, "epoch": 3036} {"train_loss": -6.700610160827637, "global_step": 127526, "epoch": 3036} {"train_loss": -6.572900772094727, "global_step": 127527, "epoch": 3036} {"train_loss": -6.598326683044434, "global_step": 127528, "epoch": 3036} {"train_loss": -6.644183158874512, "global_step": 127529, "epoch": 3036} {"train_loss": -6.672032356262207, "global_step": 127530, "epoch": 3036} {"train_loss": -6.685384750366211, "global_step": 127531, "epoch": 3036} {"train_loss": -6.620330810546875, "global_step": 127532, "epoch": 3036} {"train_loss": -6.683865070343018, "global_step": 127533, "epoch": 3036} {"train_loss": -6.748826026916504, "global_step": 127534, "epoch": 3036} {"train_loss": -6.539209365844727, "global_step": 127535, "epoch": 3036} {"train_loss": -6.609017848968506, "global_step": 127536, "epoch": 3036} {"train_loss": -6.623558044433594, "global_step": 127537, "epoch": 3036} {"train_loss": -6.6600189208984375, "global_step": 127538, "epoch": 3036} {"train_loss": -6.676692485809326, "global_step": 127539, "epoch": 3036} {"train_loss": -6.573420524597168, "global_step": 127540, "epoch": 3036} {"train_loss": -6.539417266845703, "global_step": 127541, "epoch": 3036} {"train_loss": -6.739311695098877, "global_step": 127542, "epoch": 3036} {"train_loss": -6.576362133026123, "global_step": 127543, "epoch": 3036} {"train_loss": -6.575249671936035, "global_step": 127544, "epoch": 3036} {"train_loss": -6.617424011230469, "global_step": 127545, "epoch": 3036} {"train_loss": -6.581198692321777, "global_step": 127546, "epoch": 3036} {"train_loss": -6.620231628417969, "global_step": 127547, "epoch": 3036} {"train_loss": -6.580784797668457, "global_step": 127548, "epoch": 3036} {"train_loss": -6.452178001403809, "global_step": 127549, "epoch": 3036} {"train_loss": -6.581658840179443, "global_step": 127550, "epoch": 3036} {"train_loss": -6.593611240386963, "global_step": 127551, "epoch": 3036} {"train_loss": -6.583474159240723, "global_step": 127552, "epoch": 3036} {"train_loss": -6.634730475289481, "global_step": 127553, "epoch": 3036, "val_loss": 68235.625} {"train_loss": -6.60166072845459, "global_step": 127554, "epoch": 3037} {"train_loss": -6.617500305175781, "global_step": 127555, "epoch": 3037} {"train_loss": -6.575578689575195, "global_step": 127556, "epoch": 3037} {"train_loss": -6.582624435424805, "global_step": 127557, "epoch": 3037} {"train_loss": -6.684562683105469, "global_step": 127558, "epoch": 3037} {"train_loss": -6.540671348571777, "global_step": 127559, "epoch": 3037} {"train_loss": -6.705205917358398, "global_step": 127560, "epoch": 3037} {"train_loss": -6.649365425109863, "global_step": 127561, "epoch": 3037} {"train_loss": -6.727737903594971, "global_step": 127562, "epoch": 3037} {"train_loss": -6.704898834228516, "global_step": 127563, "epoch": 3037} {"train_loss": -6.5655107498168945, "global_step": 127564, "epoch": 3037} {"train_loss": -6.764461517333984, "global_step": 127565, "epoch": 3037} {"train_loss": -6.655919075012207, "global_step": 127566, "epoch": 3037} {"train_loss": -6.613373756408691, "global_step": 127567, "epoch": 3037} {"train_loss": -6.767162322998047, "global_step": 127568, "epoch": 3037} {"train_loss": -6.599526405334473, "global_step": 127569, "epoch": 3037} {"train_loss": -6.625890731811523, "global_step": 127570, "epoch": 3037} {"train_loss": -6.701427459716797, "global_step": 127571, "epoch": 3037} {"train_loss": -6.562930107116699, "global_step": 127572, "epoch": 3037} {"train_loss": -6.637255668640137, "global_step": 127573, "epoch": 3037} {"train_loss": -6.54080057144165, "global_step": 127574, "epoch": 3037} {"train_loss": -6.524896621704102, "global_step": 127575, "epoch": 3037} {"train_loss": -6.666014671325684, "global_step": 127576, "epoch": 3037} {"train_loss": -6.61613655090332, "global_step": 127577, "epoch": 3037} {"train_loss": -6.557981967926025, "global_step": 127578, "epoch": 3037} {"train_loss": -6.644020080566406, "global_step": 127579, "epoch": 3037} {"train_loss": -6.682969093322754, "global_step": 127580, "epoch": 3037} {"train_loss": -6.637942314147949, "global_step": 127581, "epoch": 3037} {"train_loss": -6.489720821380615, "global_step": 127582, "epoch": 3037} {"train_loss": -6.521385192871094, "global_step": 127583, "epoch": 3037} {"train_loss": -6.679910659790039, "global_step": 127584, "epoch": 3037} {"train_loss": -6.63350248336792, "global_step": 127585, "epoch": 3037} {"train_loss": -6.667354106903076, "global_step": 127586, "epoch": 3037} {"train_loss": -6.531256675720215, "global_step": 127587, "epoch": 3037} {"train_loss": -6.700451850891113, "global_step": 127588, "epoch": 3037} {"train_loss": -6.556994915008545, "global_step": 127589, "epoch": 3037} {"train_loss": -6.549700736999512, "global_step": 127590, "epoch": 3037} {"train_loss": -6.601912975311279, "global_step": 127591, "epoch": 3037} {"train_loss": -6.544981956481934, "global_step": 127592, "epoch": 3037} {"train_loss": -6.570144176483154, "global_step": 127593, "epoch": 3037} {"train_loss": -6.676799297332764, "global_step": 127594, "epoch": 3037} {"train_loss": -6.621071951729911, "global_step": 127595, "epoch": 3037, "val_loss": 68279.375} {"train_loss": -6.612360000610352, "global_step": 127596, "epoch": 3038} {"train_loss": -6.6352643966674805, "global_step": 127597, "epoch": 3038} {"train_loss": -6.658557891845703, "global_step": 127598, "epoch": 3038} {"train_loss": -6.534642219543457, "global_step": 127599, "epoch": 3038} {"train_loss": -6.574234962463379, "global_step": 127600, "epoch": 3038} {"train_loss": -6.694448471069336, "global_step": 127601, "epoch": 3038} {"train_loss": -6.5198869705200195, "global_step": 127602, "epoch": 3038} {"train_loss": -6.591978073120117, "global_step": 127603, "epoch": 3038} {"train_loss": -6.712376594543457, "global_step": 127604, "epoch": 3038} {"train_loss": -6.6044602394104, "global_step": 127605, "epoch": 3038} {"train_loss": -6.555505275726318, "global_step": 127606, "epoch": 3038} {"train_loss": -6.511146068572998, "global_step": 127607, "epoch": 3038} {"train_loss": -6.571834564208984, "global_step": 127608, "epoch": 3038} {"train_loss": -6.591704368591309, "global_step": 127609, "epoch": 3038} {"train_loss": -6.675049304962158, "global_step": 127610, "epoch": 3038} {"train_loss": -6.574800491333008, "global_step": 127611, "epoch": 3038} {"train_loss": -6.570881366729736, "global_step": 127612, "epoch": 3038} {"train_loss": -6.602372646331787, "global_step": 127613, "epoch": 3038} {"train_loss": -6.5392303466796875, "global_step": 127614, "epoch": 3038} {"train_loss": -6.4468793869018555, "global_step": 127615, "epoch": 3038} {"train_loss": -6.571176528930664, "global_step": 127616, "epoch": 3038} {"train_loss": -6.755908966064453, "global_step": 127617, "epoch": 3038} {"train_loss": -6.662290573120117, "global_step": 127618, "epoch": 3038} {"train_loss": -6.514605522155762, "global_step": 127619, "epoch": 3038} {"train_loss": -6.52083683013916, "global_step": 127620, "epoch": 3038} {"train_loss": -6.494389533996582, "global_step": 127621, "epoch": 3038} {"train_loss": -6.6400017738342285, "global_step": 127622, "epoch": 3038} {"train_loss": -6.57196044921875, "global_step": 127623, "epoch": 3038} {"train_loss": -6.598856449127197, "global_step": 127624, "epoch": 3038} {"train_loss": -6.678666114807129, "global_step": 127625, "epoch": 3038} {"train_loss": -6.5114288330078125, "global_step": 127626, "epoch": 3038} {"train_loss": -6.604154586791992, "global_step": 127627, "epoch": 3038} {"train_loss": -6.592803001403809, "global_step": 127628, "epoch": 3038} {"train_loss": -6.678772926330566, "global_step": 127629, "epoch": 3038} {"train_loss": -6.699005603790283, "global_step": 127630, "epoch": 3038} {"train_loss": -6.64608097076416, "global_step": 127631, "epoch": 3038} {"train_loss": -6.702945232391357, "global_step": 127632, "epoch": 3038} {"train_loss": -6.6195173263549805, "global_step": 127633, "epoch": 3038} {"train_loss": -6.555442810058594, "global_step": 127634, "epoch": 3038} {"train_loss": -6.598923683166504, "global_step": 127635, "epoch": 3038} {"train_loss": -6.578099250793457, "global_step": 127636, "epoch": 3038} {"train_loss": -6.598807879856655, "global_step": 127637, "epoch": 3038, "val_loss": 68003.21875} {"train_loss": -6.715329170227051, "global_step": 127638, "epoch": 3039} {"train_loss": -6.695469856262207, "global_step": 127639, "epoch": 3039} {"train_loss": -6.612936973571777, "global_step": 127640, "epoch": 3039} {"train_loss": -6.709712982177734, "global_step": 127641, "epoch": 3039} {"train_loss": -6.677285194396973, "global_step": 127642, "epoch": 3039} {"train_loss": -6.611930847167969, "global_step": 127643, "epoch": 3039} {"train_loss": -6.627688407897949, "global_step": 127644, "epoch": 3039} {"train_loss": -6.559416770935059, "global_step": 127645, "epoch": 3039} {"train_loss": -6.6635236740112305, "global_step": 127646, "epoch": 3039} {"train_loss": -6.548183441162109, "global_step": 127647, "epoch": 3039} {"train_loss": -6.556927680969238, "global_step": 127648, "epoch": 3039} {"train_loss": -6.555844306945801, "global_step": 127649, "epoch": 3039} {"train_loss": -6.708288192749023, "global_step": 127650, "epoch": 3039} {"train_loss": -6.50200891494751, "global_step": 127651, "epoch": 3039} {"train_loss": -6.691053867340088, "global_step": 127652, "epoch": 3039} {"train_loss": -6.517669200897217, "global_step": 127653, "epoch": 3039} {"train_loss": -6.583465576171875, "global_step": 127654, "epoch": 3039} {"train_loss": -6.603631973266602, "global_step": 127655, "epoch": 3039} {"train_loss": -6.606233596801758, "global_step": 127656, "epoch": 3039} {"train_loss": -6.602160453796387, "global_step": 127657, "epoch": 3039} {"train_loss": -6.662789344787598, "global_step": 127658, "epoch": 3039} {"train_loss": -6.687313556671143, "global_step": 127659, "epoch": 3039} {"train_loss": -6.733610153198242, "global_step": 127660, "epoch": 3039} {"train_loss": -6.712868690490723, "global_step": 127661, "epoch": 3039} {"train_loss": -6.65122652053833, "global_step": 127662, "epoch": 3039} {"train_loss": -6.629714012145996, "global_step": 127663, "epoch": 3039} {"train_loss": -6.673521041870117, "global_step": 127664, "epoch": 3039} {"train_loss": -6.720231056213379, "global_step": 127665, "epoch": 3039} {"train_loss": -6.659071922302246, "global_step": 127666, "epoch": 3039} {"train_loss": -6.6588239669799805, "global_step": 127667, "epoch": 3039} {"train_loss": -6.617824554443359, "global_step": 127668, "epoch": 3039} {"train_loss": -6.570408821105957, "global_step": 127669, "epoch": 3039} {"train_loss": -6.579826831817627, "global_step": 127670, "epoch": 3039} {"train_loss": -6.508784294128418, "global_step": 127671, "epoch": 3039} {"train_loss": -6.318790912628174, "global_step": 127672, "epoch": 3039} {"train_loss": -6.543321132659912, "global_step": 127673, "epoch": 3039} {"train_loss": -6.68919563293457, "global_step": 127674, "epoch": 3039} {"train_loss": -6.535798072814941, "global_step": 127675, "epoch": 3039} {"train_loss": -6.5989603996276855, "global_step": 127676, "epoch": 3039} {"train_loss": -6.531899929046631, "global_step": 127677, "epoch": 3039} {"train_loss": -6.601104736328125, "global_step": 127678, "epoch": 3039} {"train_loss": -6.613824344816662, "global_step": 127679, "epoch": 3039, "val_loss": 67974.4921875} {"train_loss": -6.540319442749023, "global_step": 127680, "epoch": 3040} {"train_loss": -6.660024642944336, "global_step": 127681, "epoch": 3040} {"train_loss": -6.589451313018799, "global_step": 127682, "epoch": 3040} {"train_loss": -6.483281135559082, "global_step": 127683, "epoch": 3040} {"train_loss": -6.680661678314209, "global_step": 127684, "epoch": 3040} {"train_loss": -6.532415390014648, "global_step": 127685, "epoch": 3040} {"train_loss": -6.618459701538086, "global_step": 127686, "epoch": 3040} {"train_loss": -6.658322334289551, "global_step": 127687, "epoch": 3040} {"train_loss": -6.597651481628418, "global_step": 127688, "epoch": 3040} {"train_loss": -6.608193874359131, "global_step": 127689, "epoch": 3040} {"train_loss": -6.667520523071289, "global_step": 127690, "epoch": 3040} {"train_loss": -6.635491371154785, "global_step": 127691, "epoch": 3040} {"train_loss": -6.504573822021484, "global_step": 127692, "epoch": 3040} {"train_loss": -6.607137203216553, "global_step": 127693, "epoch": 3040} {"train_loss": -6.5704345703125, "global_step": 127694, "epoch": 3040} {"train_loss": -6.574981689453125, "global_step": 127695, "epoch": 3040} {"train_loss": -6.490395545959473, "global_step": 127696, "epoch": 3040} {"train_loss": -6.676082134246826, "global_step": 127697, "epoch": 3040} {"train_loss": -6.533218860626221, "global_step": 127698, "epoch": 3040} {"train_loss": -6.615001678466797, "global_step": 127699, "epoch": 3040} {"train_loss": -6.675994873046875, "global_step": 127700, "epoch": 3040} {"train_loss": -6.601632118225098, "global_step": 127701, "epoch": 3040} {"train_loss": -6.565818786621094, "global_step": 127702, "epoch": 3040} {"train_loss": -6.48806619644165, "global_step": 127703, "epoch": 3040} {"train_loss": -6.6787638664245605, "global_step": 127704, "epoch": 3040} {"train_loss": -6.471205234527588, "global_step": 127705, "epoch": 3040} {"train_loss": -6.593229293823242, "global_step": 127706, "epoch": 3040} {"train_loss": -6.682665824890137, "global_step": 127707, "epoch": 3040} {"train_loss": -6.487981796264648, "global_step": 127708, "epoch": 3040} {"train_loss": -6.733196258544922, "global_step": 127709, "epoch": 3040} {"train_loss": -6.517096996307373, "global_step": 127710, "epoch": 3040} {"train_loss": -6.538370609283447, "global_step": 127711, "epoch": 3040} {"train_loss": -6.586413383483887, "global_step": 127712, "epoch": 3040} {"train_loss": -6.504499435424805, "global_step": 127713, "epoch": 3040} {"train_loss": -6.5151753425598145, "global_step": 127714, "epoch": 3040} {"train_loss": -6.422131538391113, "global_step": 127715, "epoch": 3040} {"train_loss": -6.6416707038879395, "global_step": 127716, "epoch": 3040} {"train_loss": -6.4940409660339355, "global_step": 127717, "epoch": 3040} {"train_loss": -6.528599262237549, "global_step": 127718, "epoch": 3040} {"train_loss": -6.677960395812988, "global_step": 127719, "epoch": 3040} {"train_loss": -6.492639541625977, "global_step": 127720, "epoch": 3040} {"train_loss": -6.578262238275437, "global_step": 127721, "epoch": 3040, "val_loss": 67936.796875} {"train_loss": -6.424623489379883, "global_step": 127722, "epoch": 3041} {"train_loss": -6.597097396850586, "global_step": 127723, "epoch": 3041} {"train_loss": -6.568198204040527, "global_step": 127724, "epoch": 3041} {"train_loss": -6.587814807891846, "global_step": 127725, "epoch": 3041} {"train_loss": -6.631162166595459, "global_step": 127726, "epoch": 3041} {"train_loss": -6.461000442504883, "global_step": 127727, "epoch": 3041} {"train_loss": -6.619751930236816, "global_step": 127728, "epoch": 3041} {"train_loss": -6.570073127746582, "global_step": 127729, "epoch": 3041} {"train_loss": -6.614350318908691, "global_step": 127730, "epoch": 3041} {"train_loss": -6.692470550537109, "global_step": 127731, "epoch": 3041} {"train_loss": -6.532868385314941, "global_step": 127732, "epoch": 3041} {"train_loss": -6.673099517822266, "global_step": 127733, "epoch": 3041} {"train_loss": -6.60787296295166, "global_step": 127734, "epoch": 3041} {"train_loss": -6.639301300048828, "global_step": 127735, "epoch": 3041} {"train_loss": -6.694952964782715, "global_step": 127736, "epoch": 3041} {"train_loss": -6.572946071624756, "global_step": 127737, "epoch": 3041} {"train_loss": -6.5140204429626465, "global_step": 127738, "epoch": 3041} {"train_loss": -6.625295639038086, "global_step": 127739, "epoch": 3041} {"train_loss": -6.5405802726745605, "global_step": 127740, "epoch": 3041} {"train_loss": -6.519378662109375, "global_step": 127741, "epoch": 3041} {"train_loss": -6.6494832038879395, "global_step": 127742, "epoch": 3041} {"train_loss": -6.611185073852539, "global_step": 127743, "epoch": 3041} {"train_loss": -6.778897285461426, "global_step": 127744, "epoch": 3041} {"train_loss": -6.590441703796387, "global_step": 127745, "epoch": 3041} {"train_loss": -6.723413467407227, "global_step": 127746, "epoch": 3041} {"train_loss": -6.601441860198975, "global_step": 127747, "epoch": 3041} {"train_loss": -6.6456618309021, "global_step": 127748, "epoch": 3041} {"train_loss": -6.593044281005859, "global_step": 127749, "epoch": 3041} {"train_loss": -6.506752967834473, "global_step": 127750, "epoch": 3041} {"train_loss": -6.599093437194824, "global_step": 127751, "epoch": 3041} {"train_loss": -6.687963008880615, "global_step": 127752, "epoch": 3041} {"train_loss": -6.455148220062256, "global_step": 127753, "epoch": 3041} {"train_loss": -6.460304260253906, "global_step": 127754, "epoch": 3041} {"train_loss": -6.54598331451416, "global_step": 127755, "epoch": 3041} {"train_loss": -6.492693901062012, "global_step": 127756, "epoch": 3041} {"train_loss": -6.524378776550293, "global_step": 127757, "epoch": 3041} {"train_loss": -6.523776054382324, "global_step": 127758, "epoch": 3041} {"train_loss": -6.370489120483398, "global_step": 127759, "epoch": 3041} {"train_loss": -6.464158535003662, "global_step": 127760, "epoch": 3041} {"train_loss": -6.537411689758301, "global_step": 127761, "epoch": 3041} {"train_loss": -6.461786270141602, "global_step": 127762, "epoch": 3041} {"train_loss": -6.5720605963752385, "global_step": 127763, "epoch": 3041, "val_loss": 68283.03125} {"train_loss": -6.533381462097168, "global_step": 127764, "epoch": 3042} {"train_loss": -6.453967094421387, "global_step": 127765, "epoch": 3042} {"train_loss": -6.435294151306152, "global_step": 127766, "epoch": 3042} {"train_loss": -6.701422691345215, "global_step": 127767, "epoch": 3042} {"train_loss": -6.6219329833984375, "global_step": 127768, "epoch": 3042} {"train_loss": -6.536478042602539, "global_step": 127769, "epoch": 3042} {"train_loss": -6.499022483825684, "global_step": 127770, "epoch": 3042} {"train_loss": -6.586498260498047, "global_step": 127771, "epoch": 3042} {"train_loss": -6.491945743560791, "global_step": 127772, "epoch": 3042} {"train_loss": -6.601312637329102, "global_step": 127773, "epoch": 3042} {"train_loss": -6.530221939086914, "global_step": 127774, "epoch": 3042} {"train_loss": -6.639884948730469, "global_step": 127775, "epoch": 3042} {"train_loss": -6.558124542236328, "global_step": 127776, "epoch": 3042} {"train_loss": -6.593320369720459, "global_step": 127777, "epoch": 3042} {"train_loss": -6.381814956665039, "global_step": 127778, "epoch": 3042} {"train_loss": -6.511160850524902, "global_step": 127779, "epoch": 3042} {"train_loss": -6.589399337768555, "global_step": 127780, "epoch": 3042} {"train_loss": -6.528936862945557, "global_step": 127781, "epoch": 3042} {"train_loss": -6.45186710357666, "global_step": 127782, "epoch": 3042} {"train_loss": -6.511403560638428, "global_step": 127783, "epoch": 3042} {"train_loss": -6.365267753601074, "global_step": 127784, "epoch": 3042} {"train_loss": -6.476356506347656, "global_step": 127785, "epoch": 3042} {"train_loss": -6.502902984619141, "global_step": 127786, "epoch": 3042} {"train_loss": -6.423566818237305, "global_step": 127787, "epoch": 3042} {"train_loss": -6.569496154785156, "global_step": 127788, "epoch": 3042} {"train_loss": -6.484907150268555, "global_step": 127789, "epoch": 3042} {"train_loss": -6.591854572296143, "global_step": 127790, "epoch": 3042} {"train_loss": -6.470085620880127, "global_step": 127791, "epoch": 3042} {"train_loss": -6.610288619995117, "global_step": 127792, "epoch": 3042} {"train_loss": -6.468908786773682, "global_step": 127793, "epoch": 3042} {"train_loss": -6.503809928894043, "global_step": 127794, "epoch": 3042} {"train_loss": -6.562935829162598, "global_step": 127795, "epoch": 3042} {"train_loss": -6.547542572021484, "global_step": 127796, "epoch": 3042} {"train_loss": -6.481380939483643, "global_step": 127797, "epoch": 3042} {"train_loss": -6.542067527770996, "global_step": 127798, "epoch": 3042} {"train_loss": -6.700021743774414, "global_step": 127799, "epoch": 3042} {"train_loss": -6.608342170715332, "global_step": 127800, "epoch": 3042} {"train_loss": -6.609222412109375, "global_step": 127801, "epoch": 3042} {"train_loss": -6.582028388977051, "global_step": 127802, "epoch": 3042} {"train_loss": -6.691049575805664, "global_step": 127803, "epoch": 3042} {"train_loss": -6.616613388061523, "global_step": 127804, "epoch": 3042} {"train_loss": -6.543862320127941, "global_step": 127805, "epoch": 3042, "val_loss": 68211.78125} {"train_loss": -6.660161018371582, "global_step": 127806, "epoch": 3043} {"train_loss": -6.673901557922363, "global_step": 127807, "epoch": 3043} {"train_loss": -6.538267612457275, "global_step": 127808, "epoch": 3043} {"train_loss": -6.689388275146484, "global_step": 127809, "epoch": 3043} {"train_loss": -6.589483737945557, "global_step": 127810, "epoch": 3043} {"train_loss": -6.642692565917969, "global_step": 127811, "epoch": 3043} {"train_loss": -6.590165138244629, "global_step": 127812, "epoch": 3043} {"train_loss": -6.628487586975098, "global_step": 127813, "epoch": 3043} {"train_loss": -6.594061851501465, "global_step": 127814, "epoch": 3043} {"train_loss": -6.636202335357666, "global_step": 127815, "epoch": 3043} {"train_loss": -6.6257781982421875, "global_step": 127816, "epoch": 3043} {"train_loss": -6.657189846038818, "global_step": 127817, "epoch": 3043} {"train_loss": -6.5648908615112305, "global_step": 127818, "epoch": 3043} {"train_loss": -6.5513739585876465, "global_step": 127819, "epoch": 3043} {"train_loss": -6.750924587249756, "global_step": 127820, "epoch": 3043} {"train_loss": -6.599775791168213, "global_step": 127821, "epoch": 3043} {"train_loss": -6.55278205871582, "global_step": 127822, "epoch": 3043} {"train_loss": -6.423752784729004, "global_step": 127823, "epoch": 3043} {"train_loss": -6.687915325164795, "global_step": 127824, "epoch": 3043} {"train_loss": -6.607339859008789, "global_step": 127825, "epoch": 3043} {"train_loss": -6.480406284332275, "global_step": 127826, "epoch": 3043} {"train_loss": -6.509020805358887, "global_step": 127827, "epoch": 3043} {"train_loss": -6.565258979797363, "global_step": 127828, "epoch": 3043} {"train_loss": -6.5776166915893555, "global_step": 127829, "epoch": 3043} {"train_loss": -6.607052803039551, "global_step": 127830, "epoch": 3043} {"train_loss": -6.568886756896973, "global_step": 127831, "epoch": 3043} {"train_loss": -6.767444610595703, "global_step": 127832, "epoch": 3043} {"train_loss": -6.622466087341309, "global_step": 127833, "epoch": 3043} {"train_loss": -6.738630294799805, "global_step": 127834, "epoch": 3043} {"train_loss": -6.608818054199219, "global_step": 127835, "epoch": 3043} {"train_loss": -6.594262599945068, "global_step": 127836, "epoch": 3043} {"train_loss": -6.590091705322266, "global_step": 127837, "epoch": 3043} {"train_loss": -6.662798881530762, "global_step": 127838, "epoch": 3043} {"train_loss": -6.713864326477051, "global_step": 127839, "epoch": 3043} {"train_loss": -6.637381553649902, "global_step": 127840, "epoch": 3043} {"train_loss": -6.660186767578125, "global_step": 127841, "epoch": 3043} {"train_loss": -6.549866676330566, "global_step": 127842, "epoch": 3043} {"train_loss": -6.606515884399414, "global_step": 127843, "epoch": 3043} {"train_loss": -6.688063621520996, "global_step": 127844, "epoch": 3043} {"train_loss": -6.753591537475586, "global_step": 127845, "epoch": 3043} {"train_loss": -6.621349811553955, "global_step": 127846, "epoch": 3043} {"train_loss": -6.61777713185265, "global_step": 127847, "epoch": 3043, "val_loss": 68022.390625} {"train_loss": -6.687559127807617, "global_step": 127848, "epoch": 3044} {"train_loss": -6.507802963256836, "global_step": 127849, "epoch": 3044} {"train_loss": -6.72062873840332, "global_step": 127850, "epoch": 3044} {"train_loss": -6.577545166015625, "global_step": 127851, "epoch": 3044} {"train_loss": -6.616096019744873, "global_step": 127852, "epoch": 3044} {"train_loss": -6.564076900482178, "global_step": 127853, "epoch": 3044} {"train_loss": -6.65789794921875, "global_step": 127854, "epoch": 3044} {"train_loss": -6.60262393951416, "global_step": 127855, "epoch": 3044} {"train_loss": -6.6040520668029785, "global_step": 127856, "epoch": 3044} {"train_loss": -6.600278377532959, "global_step": 127857, "epoch": 3044} {"train_loss": -6.646252632141113, "global_step": 127858, "epoch": 3044} {"train_loss": -6.527829170227051, "global_step": 127859, "epoch": 3044} {"train_loss": -6.505840301513672, "global_step": 127860, "epoch": 3044} {"train_loss": -6.401124477386475, "global_step": 127861, "epoch": 3044} {"train_loss": -6.59873104095459, "global_step": 127862, "epoch": 3044} {"train_loss": -6.574691295623779, "global_step": 127863, "epoch": 3044} {"train_loss": -6.520472526550293, "global_step": 127864, "epoch": 3044} {"train_loss": -6.566070556640625, "global_step": 127865, "epoch": 3044} {"train_loss": -6.58352518081665, "global_step": 127866, "epoch": 3044} {"train_loss": -6.505695343017578, "global_step": 127867, "epoch": 3044} {"train_loss": -6.624648094177246, "global_step": 127868, "epoch": 3044} {"train_loss": -6.509918212890625, "global_step": 127869, "epoch": 3044} {"train_loss": -6.631279945373535, "global_step": 127870, "epoch": 3044} {"train_loss": -6.668149948120117, "global_step": 127871, "epoch": 3044} {"train_loss": -6.59896183013916, "global_step": 127872, "epoch": 3044} {"train_loss": -6.674449443817139, "global_step": 127873, "epoch": 3044} {"train_loss": -6.6527581214904785, "global_step": 127874, "epoch": 3044} {"train_loss": -6.64634370803833, "global_step": 127875, "epoch": 3044} {"train_loss": -6.752208709716797, "global_step": 127876, "epoch": 3044} {"train_loss": -6.497656345367432, "global_step": 127877, "epoch": 3044} {"train_loss": -6.508784294128418, "global_step": 127878, "epoch": 3044} {"train_loss": -6.519484043121338, "global_step": 127879, "epoch": 3044} {"train_loss": -6.5152387619018555, "global_step": 127880, "epoch": 3044} {"train_loss": -6.607964515686035, "global_step": 127881, "epoch": 3044} {"train_loss": -6.565915584564209, "global_step": 127882, "epoch": 3044} {"train_loss": -6.570706367492676, "global_step": 127883, "epoch": 3044} {"train_loss": -6.564493179321289, "global_step": 127884, "epoch": 3044} {"train_loss": -6.49028205871582, "global_step": 127885, "epoch": 3044} {"train_loss": -6.5345916748046875, "global_step": 127886, "epoch": 3044} {"train_loss": -6.507441997528076, "global_step": 127887, "epoch": 3044} {"train_loss": -6.605279445648193, "global_step": 127888, "epoch": 3044} {"train_loss": -6.582261176336379, "global_step": 127889, "epoch": 3044, "val_loss": 68302.9375} {"train_loss": -6.496565818786621, "global_step": 127890, "epoch": 3045} {"train_loss": -6.653710842132568, "global_step": 127891, "epoch": 3045} {"train_loss": -6.618288040161133, "global_step": 127892, "epoch": 3045} {"train_loss": -6.482475280761719, "global_step": 127893, "epoch": 3045} {"train_loss": -6.624621391296387, "global_step": 127894, "epoch": 3045} {"train_loss": -6.608443737030029, "global_step": 127895, "epoch": 3045} {"train_loss": -6.657114028930664, "global_step": 127896, "epoch": 3045} {"train_loss": -6.652529716491699, "global_step": 127897, "epoch": 3045} {"train_loss": -6.697395324707031, "global_step": 127898, "epoch": 3045} {"train_loss": -6.6010847091674805, "global_step": 127899, "epoch": 3045} {"train_loss": -6.566813945770264, "global_step": 127900, "epoch": 3045} {"train_loss": -6.546507835388184, "global_step": 127901, "epoch": 3045} {"train_loss": -6.544272422790527, "global_step": 127902, "epoch": 3045} {"train_loss": -6.4582390785217285, "global_step": 127903, "epoch": 3045} {"train_loss": -6.648061752319336, "global_step": 127904, "epoch": 3045} {"train_loss": -6.586842060089111, "global_step": 127905, "epoch": 3045} {"train_loss": -6.610713958740234, "global_step": 127906, "epoch": 3045} {"train_loss": -6.632020950317383, "global_step": 127907, "epoch": 3045} {"train_loss": -6.56101131439209, "global_step": 127908, "epoch": 3045} {"train_loss": -6.612296104431152, "global_step": 127909, "epoch": 3045} {"train_loss": -6.6998419761657715, "global_step": 127910, "epoch": 3045} {"train_loss": -6.5825910568237305, "global_step": 127911, "epoch": 3045} {"train_loss": -6.665951728820801, "global_step": 127912, "epoch": 3045} {"train_loss": -6.500139236450195, "global_step": 127913, "epoch": 3045} {"train_loss": -6.645030498504639, "global_step": 127914, "epoch": 3045} {"train_loss": -6.60967493057251, "global_step": 127915, "epoch": 3045} {"train_loss": -6.598407745361328, "global_step": 127916, "epoch": 3045} {"train_loss": -6.700368404388428, "global_step": 127917, "epoch": 3045} {"train_loss": -6.637617111206055, "global_step": 127918, "epoch": 3045} {"train_loss": -6.580957412719727, "global_step": 127919, "epoch": 3045} {"train_loss": -6.777663230895996, "global_step": 127920, "epoch": 3045} {"train_loss": -6.693816661834717, "global_step": 127921, "epoch": 3045} {"train_loss": -6.577120780944824, "global_step": 127922, "epoch": 3045} {"train_loss": -6.750463008880615, "global_step": 127923, "epoch": 3045} {"train_loss": -6.577024936676025, "global_step": 127924, "epoch": 3045} {"train_loss": -6.691277503967285, "global_step": 127925, "epoch": 3045} {"train_loss": -6.557129383087158, "global_step": 127926, "epoch": 3045} {"train_loss": -6.647510528564453, "global_step": 127927, "epoch": 3045} {"train_loss": -6.549878120422363, "global_step": 127928, "epoch": 3045} {"train_loss": -6.512265682220459, "global_step": 127929, "epoch": 3045} {"train_loss": -6.603442668914795, "global_step": 127930, "epoch": 3045} {"train_loss": -6.612517402285621, "global_step": 127931, "epoch": 3045, "val_loss": 68394.9140625} {"train_loss": -6.620800971984863, "global_step": 127932, "epoch": 3046} {"train_loss": -6.533143520355225, "global_step": 127933, "epoch": 3046} {"train_loss": -6.704488754272461, "global_step": 127934, "epoch": 3046} {"train_loss": -6.548299312591553, "global_step": 127935, "epoch": 3046} {"train_loss": -6.697513580322266, "global_step": 127936, "epoch": 3046} {"train_loss": -6.53212308883667, "global_step": 127937, "epoch": 3046} {"train_loss": -6.702635765075684, "global_step": 127938, "epoch": 3046} {"train_loss": -6.547363758087158, "global_step": 127939, "epoch": 3046} {"train_loss": -6.598142623901367, "global_step": 127940, "epoch": 3046} {"train_loss": -6.640473365783691, "global_step": 127941, "epoch": 3046} {"train_loss": -6.715551376342773, "global_step": 127942, "epoch": 3046} {"train_loss": -6.71502685546875, "global_step": 127943, "epoch": 3046} {"train_loss": -6.690202713012695, "global_step": 127944, "epoch": 3046} {"train_loss": -6.5566840171813965, "global_step": 127945, "epoch": 3046} {"train_loss": -6.6806769371032715, "global_step": 127946, "epoch": 3046} {"train_loss": -6.73160457611084, "global_step": 127947, "epoch": 3046} {"train_loss": -6.628073692321777, "global_step": 127948, "epoch": 3046} {"train_loss": -6.7397918701171875, "global_step": 127949, "epoch": 3046} {"train_loss": -6.622865676879883, "global_step": 127950, "epoch": 3046} {"train_loss": -6.644916534423828, "global_step": 127951, "epoch": 3046} {"train_loss": -6.7310709953308105, "global_step": 127952, "epoch": 3046} {"train_loss": -6.602207660675049, "global_step": 127953, "epoch": 3046} {"train_loss": -6.615052223205566, "global_step": 127954, "epoch": 3046} {"train_loss": -6.591794013977051, "global_step": 127955, "epoch": 3046} {"train_loss": -6.825101852416992, "global_step": 127956, "epoch": 3046} {"train_loss": -6.650616645812988, "global_step": 127957, "epoch": 3046} {"train_loss": -6.647871971130371, "global_step": 127958, "epoch": 3046} {"train_loss": -6.5260467529296875, "global_step": 127959, "epoch": 3046} {"train_loss": -6.617987632751465, "global_step": 127960, "epoch": 3046} {"train_loss": -6.614316940307617, "global_step": 127961, "epoch": 3046} {"train_loss": -6.601156234741211, "global_step": 127962, "epoch": 3046} {"train_loss": -6.685150623321533, "global_step": 127963, "epoch": 3046} {"train_loss": -6.63822078704834, "global_step": 127964, "epoch": 3046} {"train_loss": -6.516979217529297, "global_step": 127965, "epoch": 3046} {"train_loss": -6.578114032745361, "global_step": 127966, "epoch": 3046} {"train_loss": -6.614765644073486, "global_step": 127967, "epoch": 3046} {"train_loss": -6.499670505523682, "global_step": 127968, "epoch": 3046} {"train_loss": -6.66890811920166, "global_step": 127969, "epoch": 3046} {"train_loss": -6.554306507110596, "global_step": 127970, "epoch": 3046} {"train_loss": -6.5623979568481445, "global_step": 127971, "epoch": 3046} {"train_loss": -6.6356282234191895, "global_step": 127972, "epoch": 3046} {"train_loss": -6.631456897372291, "global_step": 127973, "epoch": 3046, "val_loss": 68135.7578125} {"train_loss": -6.4989013671875, "global_step": 127974, "epoch": 3047} {"train_loss": -6.726186752319336, "global_step": 127975, "epoch": 3047} {"train_loss": -6.572528839111328, "global_step": 127976, "epoch": 3047} {"train_loss": -6.55888032913208, "global_step": 127977, "epoch": 3047} {"train_loss": -6.53687047958374, "global_step": 127978, "epoch": 3047} {"train_loss": -6.672366619110107, "global_step": 127979, "epoch": 3047} {"train_loss": -6.674790859222412, "global_step": 127980, "epoch": 3047} {"train_loss": -6.644095420837402, "global_step": 127981, "epoch": 3047} {"train_loss": -6.461581230163574, "global_step": 127982, "epoch": 3047} {"train_loss": -6.667089462280273, "global_step": 127983, "epoch": 3047} {"train_loss": -6.530571460723877, "global_step": 127984, "epoch": 3047} {"train_loss": -6.569088935852051, "global_step": 127985, "epoch": 3047} {"train_loss": -6.520018100738525, "global_step": 127986, "epoch": 3047} {"train_loss": -6.510327339172363, "global_step": 127987, "epoch": 3047} {"train_loss": -6.584939956665039, "global_step": 127988, "epoch": 3047} {"train_loss": -6.573841571807861, "global_step": 127989, "epoch": 3047} {"train_loss": -6.576111316680908, "global_step": 127990, "epoch": 3047} {"train_loss": -6.553589820861816, "global_step": 127991, "epoch": 3047} {"train_loss": -6.512322425842285, "global_step": 127992, "epoch": 3047} {"train_loss": -6.513525009155273, "global_step": 127993, "epoch": 3047} {"train_loss": -6.508917331695557, "global_step": 127994, "epoch": 3047} {"train_loss": -6.606283187866211, "global_step": 127995, "epoch": 3047} {"train_loss": -6.521438121795654, "global_step": 127996, "epoch": 3047} {"train_loss": -6.597780227661133, "global_step": 127997, "epoch": 3047} {"train_loss": -6.513165473937988, "global_step": 127998, "epoch": 3047} {"train_loss": -6.543506622314453, "global_step": 127999, "epoch": 3047} {"train_loss": -6.535406112670898, "global_step": 128000, "epoch": 3047} {"train_loss": -6.587634086608887, "global_step": 128001, "epoch": 3047} {"train_loss": -6.570257186889648, "global_step": 128002, "epoch": 3047} {"train_loss": -6.6455230712890625, "global_step": 128003, "epoch": 3047} {"train_loss": -6.5430908203125, "global_step": 128004, "epoch": 3047} {"train_loss": -6.493975639343262, "global_step": 128005, "epoch": 3047} {"train_loss": -6.456874847412109, "global_step": 128006, "epoch": 3047} {"train_loss": -6.518043041229248, "global_step": 128007, "epoch": 3047} {"train_loss": -6.594825744628906, "global_step": 128008, "epoch": 3047} {"train_loss": -6.623027324676514, "global_step": 128009, "epoch": 3047} {"train_loss": -6.484513282775879, "global_step": 128010, "epoch": 3047} {"train_loss": -6.5046491622924805, "global_step": 128011, "epoch": 3047} {"train_loss": -6.682282447814941, "global_step": 128012, "epoch": 3047} {"train_loss": -6.590851783752441, "global_step": 128013, "epoch": 3047} {"train_loss": -6.57731294631958, "global_step": 128014, "epoch": 3047} {"train_loss": -6.567265624091739, "global_step": 128015, "epoch": 3047, "val_loss": 68073.0546875} {"train_loss": -6.568101406097412, "global_step": 128016, "epoch": 3048} {"train_loss": -6.641084671020508, "global_step": 128017, "epoch": 3048} {"train_loss": -6.580157279968262, "global_step": 128018, "epoch": 3048} {"train_loss": -6.703568935394287, "global_step": 128019, "epoch": 3048} {"train_loss": -6.620072364807129, "global_step": 128020, "epoch": 3048} {"train_loss": -6.686577796936035, "global_step": 128021, "epoch": 3048} {"train_loss": -6.524194717407227, "global_step": 128022, "epoch": 3048} {"train_loss": -6.591380596160889, "global_step": 128023, "epoch": 3048} {"train_loss": -6.535284996032715, "global_step": 128024, "epoch": 3048} {"train_loss": -6.6385498046875, "global_step": 128025, "epoch": 3048} {"train_loss": -6.626852989196777, "global_step": 128026, "epoch": 3048} {"train_loss": -6.61408805847168, "global_step": 128027, "epoch": 3048} {"train_loss": -6.6382598876953125, "global_step": 128028, "epoch": 3048} {"train_loss": -6.603644847869873, "global_step": 128029, "epoch": 3048} {"train_loss": -6.60658073425293, "global_step": 128030, "epoch": 3048} {"train_loss": -6.5358381271362305, "global_step": 128031, "epoch": 3048} {"train_loss": -6.5556230545043945, "global_step": 128032, "epoch": 3048} {"train_loss": -6.5167059898376465, "global_step": 128033, "epoch": 3048} {"train_loss": -6.569046497344971, "global_step": 128034, "epoch": 3048} {"train_loss": -6.624958038330078, "global_step": 128035, "epoch": 3048} {"train_loss": -6.57425594329834, "global_step": 128036, "epoch": 3048} {"train_loss": -6.5511932373046875, "global_step": 128037, "epoch": 3048} {"train_loss": -6.605875492095947, "global_step": 128038, "epoch": 3048} {"train_loss": -6.61430025100708, "global_step": 128039, "epoch": 3048} {"train_loss": -6.532862186431885, "global_step": 128040, "epoch": 3048} {"train_loss": -6.615726470947266, "global_step": 128041, "epoch": 3048} {"train_loss": -6.551520347595215, "global_step": 128042, "epoch": 3048} {"train_loss": -6.6460161209106445, "global_step": 128043, "epoch": 3048} {"train_loss": -6.589312553405762, "global_step": 128044, "epoch": 3048} {"train_loss": -6.545101165771484, "global_step": 128045, "epoch": 3048} {"train_loss": -6.574619770050049, "global_step": 128046, "epoch": 3048} {"train_loss": -6.554581165313721, "global_step": 128047, "epoch": 3048} {"train_loss": -6.671331882476807, "global_step": 128048, "epoch": 3048} {"train_loss": -6.676464080810547, "global_step": 128049, "epoch": 3048} {"train_loss": -6.645688056945801, "global_step": 128050, "epoch": 3048} {"train_loss": -6.65850305557251, "global_step": 128051, "epoch": 3048} {"train_loss": -6.504875183105469, "global_step": 128052, "epoch": 3048} {"train_loss": -6.656658172607422, "global_step": 128053, "epoch": 3048} {"train_loss": -6.592751502990723, "global_step": 128054, "epoch": 3048} {"train_loss": -6.531052112579346, "global_step": 128055, "epoch": 3048} {"train_loss": -6.705416679382324, "global_step": 128056, "epoch": 3048} {"train_loss": -6.599877073651268, "global_step": 128057, "epoch": 3048, "val_loss": 68127.0390625} {"train_loss": -6.718097686767578, "global_step": 128058, "epoch": 3049} {"train_loss": -6.7247161865234375, "global_step": 128059, "epoch": 3049} {"train_loss": -6.634395122528076, "global_step": 128060, "epoch": 3049} {"train_loss": -6.734760761260986, "global_step": 128061, "epoch": 3049} {"train_loss": -6.688760280609131, "global_step": 128062, "epoch": 3049} {"train_loss": -6.5834479331970215, "global_step": 128063, "epoch": 3049} {"train_loss": -6.625245094299316, "global_step": 128064, "epoch": 3049} {"train_loss": -6.538119792938232, "global_step": 128065, "epoch": 3049} {"train_loss": -6.7401814460754395, "global_step": 128066, "epoch": 3049} {"train_loss": -6.608284950256348, "global_step": 128067, "epoch": 3049} {"train_loss": -6.4854278564453125, "global_step": 128068, "epoch": 3049} {"train_loss": -6.717921733856201, "global_step": 128069, "epoch": 3049} {"train_loss": -6.528445243835449, "global_step": 128070, "epoch": 3049} {"train_loss": -6.428778648376465, "global_step": 128071, "epoch": 3049} {"train_loss": -6.505814552307129, "global_step": 128072, "epoch": 3049} {"train_loss": -6.527088642120361, "global_step": 128073, "epoch": 3049} {"train_loss": -6.508721351623535, "global_step": 128074, "epoch": 3049} {"train_loss": -6.3350934982299805, "global_step": 128075, "epoch": 3049} {"train_loss": -6.496162414550781, "global_step": 128076, "epoch": 3049} {"train_loss": -6.44450569152832, "global_step": 128077, "epoch": 3049} {"train_loss": -6.402928352355957, "global_step": 128078, "epoch": 3049} {"train_loss": -6.521331310272217, "global_step": 128079, "epoch": 3049} {"train_loss": -6.443922519683838, "global_step": 128080, "epoch": 3049} {"train_loss": -6.523730278015137, "global_step": 128081, "epoch": 3049} {"train_loss": -6.3266282081604, "global_step": 128082, "epoch": 3049} {"train_loss": -6.595096588134766, "global_step": 128083, "epoch": 3049} {"train_loss": -6.5446600914001465, "global_step": 128084, "epoch": 3049} {"train_loss": -6.499079704284668, "global_step": 128085, "epoch": 3049} {"train_loss": -6.574833869934082, "global_step": 128086, "epoch": 3049} {"train_loss": -6.617997646331787, "global_step": 128087, "epoch": 3049} {"train_loss": -6.4072675704956055, "global_step": 128088, "epoch": 3049} {"train_loss": -6.374392509460449, "global_step": 128089, "epoch": 3049} {"train_loss": -6.403692245483398, "global_step": 128090, "epoch": 3049} {"train_loss": -6.543506622314453, "global_step": 128091, "epoch": 3049} {"train_loss": -6.544239521026611, "global_step": 128092, "epoch": 3049} {"train_loss": -6.566052436828613, "global_step": 128093, "epoch": 3049} {"train_loss": -6.604400634765625, "global_step": 128094, "epoch": 3049} {"train_loss": -6.56777286529541, "global_step": 128095, "epoch": 3049} {"train_loss": -6.539097785949707, "global_step": 128096, "epoch": 3049} {"train_loss": -6.573617935180664, "global_step": 128097, "epoch": 3049} {"train_loss": -6.56658935546875, "global_step": 128098, "epoch": 3049} {"train_loss": -6.548336994080317, "global_step": 128099, "epoch": 3049, "val_loss": 68137.0703125} {"train_loss": -6.675981521606445, "global_step": 128100, "epoch": 3050} {"train_loss": -6.672765254974365, "global_step": 128101, "epoch": 3050} {"train_loss": -6.628365516662598, "global_step": 128102, "epoch": 3050} {"train_loss": -6.634850025177002, "global_step": 128103, "epoch": 3050} {"train_loss": -6.6146392822265625, "global_step": 128104, "epoch": 3050} {"train_loss": -6.631379127502441, "global_step": 128105, "epoch": 3050} {"train_loss": -6.634622573852539, "global_step": 128106, "epoch": 3050} {"train_loss": -6.634654998779297, "global_step": 128107, "epoch": 3050} {"train_loss": -6.609571933746338, "global_step": 128108, "epoch": 3050} {"train_loss": -6.628351211547852, "global_step": 128109, "epoch": 3050} {"train_loss": -6.597343444824219, "global_step": 128110, "epoch": 3050} {"train_loss": -6.6657257080078125, "global_step": 128111, "epoch": 3050} {"train_loss": -6.536159038543701, "global_step": 128112, "epoch": 3050} {"train_loss": -6.509238243103027, "global_step": 128113, "epoch": 3050} {"train_loss": -6.48701286315918, "global_step": 128114, "epoch": 3050} {"train_loss": -6.654036998748779, "global_step": 128115, "epoch": 3050} {"train_loss": -6.643039226531982, "global_step": 128116, "epoch": 3050} {"train_loss": -6.529121398925781, "global_step": 128117, "epoch": 3050} {"train_loss": -6.659490585327148, "global_step": 128118, "epoch": 3050} {"train_loss": -6.6801981925964355, "global_step": 128119, "epoch": 3050} {"train_loss": -6.539141654968262, "global_step": 128120, "epoch": 3050} {"train_loss": -6.624298572540283, "global_step": 128121, "epoch": 3050} {"train_loss": -6.636752128601074, "global_step": 128122, "epoch": 3050} {"train_loss": -6.612748146057129, "global_step": 128123, "epoch": 3050} {"train_loss": -6.518373489379883, "global_step": 128124, "epoch": 3050} {"train_loss": -6.618778228759766, "global_step": 128125, "epoch": 3050} {"train_loss": -6.625283241271973, "global_step": 128126, "epoch": 3050} {"train_loss": -6.57377290725708, "global_step": 128127, "epoch": 3050} {"train_loss": -6.645045280456543, "global_step": 128128, "epoch": 3050} {"train_loss": -6.614292621612549, "global_step": 128129, "epoch": 3050} {"train_loss": -6.589221954345703, "global_step": 128130, "epoch": 3050} {"train_loss": -6.462718963623047, "global_step": 128131, "epoch": 3050} {"train_loss": -6.470308303833008, "global_step": 128132, "epoch": 3050} {"train_loss": -6.529566764831543, "global_step": 128133, "epoch": 3050} {"train_loss": -6.48585319519043, "global_step": 128134, "epoch": 3050} {"train_loss": -6.6943511962890625, "global_step": 128135, "epoch": 3050} {"train_loss": -6.443199634552002, "global_step": 128136, "epoch": 3050} {"train_loss": -6.505672931671143, "global_step": 128137, "epoch": 3050} {"train_loss": -6.673341751098633, "global_step": 128138, "epoch": 3050} {"train_loss": -6.591992378234863, "global_step": 128139, "epoch": 3050} {"train_loss": -6.684990882873535, "global_step": 128140, "epoch": 3050} {"train_loss": -6.5941214220864435, "global_step": 128141, "epoch": 3050, "train/sim_max_reward_0": 0.2248642964532047, "train/sim_max_reward_1": 0.8647792999916744, "train/sim_max_reward_2": 0.2238738661216988, "train/sim_max_reward_3": 0.9758073220534746, "train/sim_max_reward_4": 0.8290878756855059, "train/sim_max_reward_5": 0.963253013316396, "test/sim_max_reward_4400000": 0.2037739787956672, "test/sim_max_reward_4400001": 0.24188712886198022, "test/sim_max_reward_4400002": 0.9999937029522091, "test/sim_max_reward_4400003": 0.8842025293544112, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.14198881497347304, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.31841908146981446, "test/sim_max_reward_4400009": 0.892129150088803, "test/sim_max_reward_4400010": 0.24326200043202048, "test/sim_max_reward_4400011": 0.128348482954899, "test/sim_max_reward_4400012": 0.8696754111642931, "test/sim_max_reward_4400013": 0.7438492981698122, "test/sim_max_reward_4400014": 0.8571605625722044, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.07659466523649004, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 0.23885549651123023, "test/sim_max_reward_4400019": 0.33670446103394713, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.2552306722293219, "test/sim_max_reward_4400023": 0.9025940989754793, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2521835567264707, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.003946981378860493, "test/sim_max_reward_4400028": 0.43664703386601467, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9707705408647612, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3952715889962966, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.40866175186089826, "test/sim_max_reward_4400036": 1.0, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115662287059329, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9763381979834713, "test/sim_max_reward_4400042": 0.5592364256452909, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9522818005322419, "test/sim_max_reward_4400045": 0.9128864584828087, "test/sim_max_reward_4400046": 0.8556875250874562, "test/sim_max_reward_4400047": 0.9622770627343726, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8980592284532672, "train/mean_score": 0.6802776122703257, "test/mean_score": 0.5180404078857948, "val_loss": 68057.6015625} {"train_loss": -6.640705108642578, "global_step": 128142, "epoch": 3051} {"train_loss": -6.663764953613281, "global_step": 128143, "epoch": 3051} {"train_loss": -6.607326030731201, "global_step": 128144, "epoch": 3051} {"train_loss": -6.478079319000244, "global_step": 128145, "epoch": 3051} {"train_loss": -6.669370651245117, "global_step": 128146, "epoch": 3051} {"train_loss": -6.46768045425415, "global_step": 128147, "epoch": 3051} {"train_loss": -6.647158145904541, "global_step": 128148, "epoch": 3051} {"train_loss": -6.641546249389648, "global_step": 128149, "epoch": 3051} {"train_loss": -6.657783031463623, "global_step": 128150, "epoch": 3051} {"train_loss": -6.588006973266602, "global_step": 128151, "epoch": 3051} {"train_loss": -6.621735572814941, "global_step": 128152, "epoch": 3051} {"train_loss": -6.532770156860352, "global_step": 128153, "epoch": 3051} {"train_loss": -6.622538089752197, "global_step": 128154, "epoch": 3051} {"train_loss": -6.633841514587402, "global_step": 128155, "epoch": 3051} {"train_loss": -6.562100410461426, "global_step": 128156, "epoch": 3051} {"train_loss": -6.666992664337158, "global_step": 128157, "epoch": 3051} {"train_loss": -6.6582722663879395, "global_step": 128158, "epoch": 3051} {"train_loss": -6.574516296386719, "global_step": 128159, "epoch": 3051} {"train_loss": -6.680211067199707, "global_step": 128160, "epoch": 3051} {"train_loss": -6.496081829071045, "global_step": 128161, "epoch": 3051} {"train_loss": -6.610198974609375, "global_step": 128162, "epoch": 3051} {"train_loss": -6.580799579620361, "global_step": 128163, "epoch": 3051} {"train_loss": -6.51607608795166, "global_step": 128164, "epoch": 3051} {"train_loss": -6.52549934387207, "global_step": 128165, "epoch": 3051} {"train_loss": -6.635250091552734, "global_step": 128166, "epoch": 3051} {"train_loss": -6.66243839263916, "global_step": 128167, "epoch": 3051} {"train_loss": -6.580297470092773, "global_step": 128168, "epoch": 3051} {"train_loss": -6.681937217712402, "global_step": 128169, "epoch": 3051} {"train_loss": -6.554477691650391, "global_step": 128170, "epoch": 3051} {"train_loss": -6.540964126586914, "global_step": 128171, "epoch": 3051} {"train_loss": -6.7169413566589355, "global_step": 128172, "epoch": 3051} {"train_loss": -6.6254191398620605, "global_step": 128173, "epoch": 3051} {"train_loss": -6.667806625366211, "global_step": 128174, "epoch": 3051} {"train_loss": -6.6528730392456055, "global_step": 128175, "epoch": 3051} {"train_loss": -6.713709831237793, "global_step": 128176, "epoch": 3051} {"train_loss": -6.481258869171143, "global_step": 128177, "epoch": 3051} {"train_loss": -6.5125226974487305, "global_step": 128178, "epoch": 3051} {"train_loss": -6.683284282684326, "global_step": 128179, "epoch": 3051} {"train_loss": -6.595722675323486, "global_step": 128180, "epoch": 3051} {"train_loss": -6.566642761230469, "global_step": 128181, "epoch": 3051} {"train_loss": -6.547163486480713, "global_step": 128182, "epoch": 3051} {"train_loss": -6.6061948253994895, "global_step": 128183, "epoch": 3051, "val_loss": 68203.3203125} {"train_loss": -6.6035051345825195, "global_step": 128184, "epoch": 3052} {"train_loss": -6.618241310119629, "global_step": 128185, "epoch": 3052} {"train_loss": -6.62827205657959, "global_step": 128186, "epoch": 3052} {"train_loss": -6.588373184204102, "global_step": 128187, "epoch": 3052} {"train_loss": -6.6758928298950195, "global_step": 128188, "epoch": 3052} {"train_loss": -6.700646877288818, "global_step": 128189, "epoch": 3052} {"train_loss": -6.662442684173584, "global_step": 128190, "epoch": 3052} {"train_loss": -6.605213165283203, "global_step": 128191, "epoch": 3052} {"train_loss": -6.74738883972168, "global_step": 128192, "epoch": 3052} {"train_loss": -6.633538722991943, "global_step": 128193, "epoch": 3052} {"train_loss": -6.733102798461914, "global_step": 128194, "epoch": 3052} {"train_loss": -6.714946746826172, "global_step": 128195, "epoch": 3052} {"train_loss": -6.753363609313965, "global_step": 128196, "epoch": 3052} {"train_loss": -6.684793949127197, "global_step": 128197, "epoch": 3052} {"train_loss": -6.671339988708496, "global_step": 128198, "epoch": 3052} {"train_loss": -6.679924488067627, "global_step": 128199, "epoch": 3052} {"train_loss": -6.699231147766113, "global_step": 128200, "epoch": 3052} {"train_loss": -6.67744779586792, "global_step": 128201, "epoch": 3052} {"train_loss": -6.618376731872559, "global_step": 128202, "epoch": 3052} {"train_loss": -6.669459819793701, "global_step": 128203, "epoch": 3052} {"train_loss": -6.547255039215088, "global_step": 128204, "epoch": 3052} {"train_loss": -6.653230667114258, "global_step": 128205, "epoch": 3052} {"train_loss": -6.68528938293457, "global_step": 128206, "epoch": 3052} {"train_loss": -6.700964450836182, "global_step": 128207, "epoch": 3052} {"train_loss": -6.432104587554932, "global_step": 128208, "epoch": 3052} {"train_loss": -6.479092121124268, "global_step": 128209, "epoch": 3052} {"train_loss": -6.560934543609619, "global_step": 128210, "epoch": 3052} {"train_loss": -6.671955108642578, "global_step": 128211, "epoch": 3052} {"train_loss": -6.486804962158203, "global_step": 128212, "epoch": 3052} {"train_loss": -6.557172775268555, "global_step": 128213, "epoch": 3052} {"train_loss": -6.610988140106201, "global_step": 128214, "epoch": 3052} {"train_loss": -6.585790634155273, "global_step": 128215, "epoch": 3052} {"train_loss": -6.661159992218018, "global_step": 128216, "epoch": 3052} {"train_loss": -6.659223556518555, "global_step": 128217, "epoch": 3052} {"train_loss": -6.591780185699463, "global_step": 128218, "epoch": 3052} {"train_loss": -6.600922584533691, "global_step": 128219, "epoch": 3052} {"train_loss": -6.512898921966553, "global_step": 128220, "epoch": 3052} {"train_loss": -6.684778213500977, "global_step": 128221, "epoch": 3052} {"train_loss": -6.581090927124023, "global_step": 128222, "epoch": 3052} {"train_loss": -6.623816013336182, "global_step": 128223, "epoch": 3052} {"train_loss": -6.569006443023682, "global_step": 128224, "epoch": 3052} {"train_loss": -6.631222179957798, "global_step": 128225, "epoch": 3052, "val_loss": 68226.5234375} {"train_loss": -6.780848979949951, "global_step": 128226, "epoch": 3053} {"train_loss": -6.580721855163574, "global_step": 128227, "epoch": 3053} {"train_loss": -6.544424057006836, "global_step": 128228, "epoch": 3053} {"train_loss": -6.608050346374512, "global_step": 128229, "epoch": 3053} {"train_loss": -6.59748649597168, "global_step": 128230, "epoch": 3053} {"train_loss": -6.722390174865723, "global_step": 128231, "epoch": 3053} {"train_loss": -6.528833389282227, "global_step": 128232, "epoch": 3053} {"train_loss": -6.585744380950928, "global_step": 128233, "epoch": 3053} {"train_loss": -6.543636322021484, "global_step": 128234, "epoch": 3053} {"train_loss": -6.675004959106445, "global_step": 128235, "epoch": 3053} {"train_loss": -6.610769748687744, "global_step": 128236, "epoch": 3053} {"train_loss": -6.485952377319336, "global_step": 128237, "epoch": 3053} {"train_loss": -6.478495121002197, "global_step": 128238, "epoch": 3053} {"train_loss": -6.725950241088867, "global_step": 128239, "epoch": 3053} {"train_loss": -6.5704665184021, "global_step": 128240, "epoch": 3053} {"train_loss": -6.306066036224365, "global_step": 128241, "epoch": 3053} {"train_loss": -6.628008842468262, "global_step": 128242, "epoch": 3053} {"train_loss": -6.503898620605469, "global_step": 128243, "epoch": 3053} {"train_loss": -6.765201091766357, "global_step": 128244, "epoch": 3053} {"train_loss": -6.546065330505371, "global_step": 128245, "epoch": 3053} {"train_loss": -6.520078659057617, "global_step": 128246, "epoch": 3053} {"train_loss": -6.463292121887207, "global_step": 128247, "epoch": 3053} {"train_loss": -6.538928031921387, "global_step": 128248, "epoch": 3053} {"train_loss": -6.536581993103027, "global_step": 128249, "epoch": 3053} {"train_loss": -6.467277526855469, "global_step": 128250, "epoch": 3053} {"train_loss": -6.582528591156006, "global_step": 128251, "epoch": 3053} {"train_loss": -6.704981327056885, "global_step": 128252, "epoch": 3053} {"train_loss": -6.60707950592041, "global_step": 128253, "epoch": 3053} {"train_loss": -6.628301620483398, "global_step": 128254, "epoch": 3053} {"train_loss": -6.589989185333252, "global_step": 128255, "epoch": 3053} {"train_loss": -6.531795501708984, "global_step": 128256, "epoch": 3053} {"train_loss": -6.652046203613281, "global_step": 128257, "epoch": 3053} {"train_loss": -6.635335922241211, "global_step": 128258, "epoch": 3053} {"train_loss": -6.6708173751831055, "global_step": 128259, "epoch": 3053} {"train_loss": -6.637237071990967, "global_step": 128260, "epoch": 3053} {"train_loss": -6.582983016967773, "global_step": 128261, "epoch": 3053} {"train_loss": -6.712172508239746, "global_step": 128262, "epoch": 3053} {"train_loss": -6.659405708312988, "global_step": 128263, "epoch": 3053} {"train_loss": -6.510366439819336, "global_step": 128264, "epoch": 3053} {"train_loss": -6.601865768432617, "global_step": 128265, "epoch": 3053} {"train_loss": -6.690192699432373, "global_step": 128266, "epoch": 3053} {"train_loss": -6.592794804345994, "global_step": 128267, "epoch": 3053, "val_loss": 68249.8671875} {"train_loss": -6.6452436447143555, "global_step": 128268, "epoch": 3054} {"train_loss": -6.507626533508301, "global_step": 128269, "epoch": 3054} {"train_loss": -6.564227104187012, "global_step": 128270, "epoch": 3054} {"train_loss": -6.71526575088501, "global_step": 128271, "epoch": 3054} {"train_loss": -6.682127952575684, "global_step": 128272, "epoch": 3054} {"train_loss": -6.5556321144104, "global_step": 128273, "epoch": 3054} {"train_loss": -6.556841850280762, "global_step": 128274, "epoch": 3054} {"train_loss": -6.579996585845947, "global_step": 128275, "epoch": 3054} {"train_loss": -6.634637355804443, "global_step": 128276, "epoch": 3054} {"train_loss": -6.607883930206299, "global_step": 128277, "epoch": 3054} {"train_loss": -6.599341869354248, "global_step": 128278, "epoch": 3054} {"train_loss": -6.625490188598633, "global_step": 128279, "epoch": 3054} {"train_loss": -6.537547588348389, "global_step": 128280, "epoch": 3054} {"train_loss": -6.612727165222168, "global_step": 128281, "epoch": 3054} {"train_loss": -6.618542671203613, "global_step": 128282, "epoch": 3054} {"train_loss": -6.51301383972168, "global_step": 128283, "epoch": 3054} {"train_loss": -6.667368412017822, "global_step": 128284, "epoch": 3054} {"train_loss": -6.600700378417969, "global_step": 128285, "epoch": 3054} {"train_loss": -6.569414138793945, "global_step": 128286, "epoch": 3054} {"train_loss": -6.680388927459717, "global_step": 128287, "epoch": 3054} {"train_loss": -6.542812347412109, "global_step": 128288, "epoch": 3054} {"train_loss": -6.565062522888184, "global_step": 128289, "epoch": 3054} {"train_loss": -6.6623148918151855, "global_step": 128290, "epoch": 3054} {"train_loss": -6.5377984046936035, "global_step": 128291, "epoch": 3054} {"train_loss": -6.636835098266602, "global_step": 128292, "epoch": 3054} {"train_loss": -6.554659843444824, "global_step": 128293, "epoch": 3054} {"train_loss": -6.536855697631836, "global_step": 128294, "epoch": 3054} {"train_loss": -6.548771381378174, "global_step": 128295, "epoch": 3054} {"train_loss": -6.635788917541504, "global_step": 128296, "epoch": 3054} {"train_loss": -6.563106536865234, "global_step": 128297, "epoch": 3054} {"train_loss": -6.600471019744873, "global_step": 128298, "epoch": 3054} {"train_loss": -6.698844909667969, "global_step": 128299, "epoch": 3054} {"train_loss": -6.729755878448486, "global_step": 128300, "epoch": 3054} {"train_loss": -6.641183853149414, "global_step": 128301, "epoch": 3054} {"train_loss": -6.593029022216797, "global_step": 128302, "epoch": 3054} {"train_loss": -6.611652374267578, "global_step": 128303, "epoch": 3054} {"train_loss": -6.570460796356201, "global_step": 128304, "epoch": 3054} {"train_loss": -6.691901206970215, "global_step": 128305, "epoch": 3054} {"train_loss": -6.6590070724487305, "global_step": 128306, "epoch": 3054} {"train_loss": -6.610458850860596, "global_step": 128307, "epoch": 3054} {"train_loss": -6.677463531494141, "global_step": 128308, "epoch": 3054} {"train_loss": -6.608896732330322, "global_step": 128309, "epoch": 3054, "val_loss": 67990.359375} {"train_loss": -6.670932769775391, "global_step": 128310, "epoch": 3055} {"train_loss": -6.770023822784424, "global_step": 128311, "epoch": 3055} {"train_loss": -6.539448261260986, "global_step": 128312, "epoch": 3055} {"train_loss": -6.613102436065674, "global_step": 128313, "epoch": 3055} {"train_loss": -6.7260050773620605, "global_step": 128314, "epoch": 3055} {"train_loss": -6.687535285949707, "global_step": 128315, "epoch": 3055} {"train_loss": -6.618646621704102, "global_step": 128316, "epoch": 3055} {"train_loss": -6.593527317047119, "global_step": 128317, "epoch": 3055} {"train_loss": -6.686927795410156, "global_step": 128318, "epoch": 3055} {"train_loss": -6.666123390197754, "global_step": 128319, "epoch": 3055} {"train_loss": -6.678487777709961, "global_step": 128320, "epoch": 3055} {"train_loss": -6.655529022216797, "global_step": 128321, "epoch": 3055} {"train_loss": -6.601506233215332, "global_step": 128322, "epoch": 3055} {"train_loss": -6.725306987762451, "global_step": 128323, "epoch": 3055} {"train_loss": -6.756067276000977, "global_step": 128324, "epoch": 3055} {"train_loss": -6.616091728210449, "global_step": 128325, "epoch": 3055} {"train_loss": -6.579999923706055, "global_step": 128326, "epoch": 3055} {"train_loss": -6.63045072555542, "global_step": 128327, "epoch": 3055} {"train_loss": -6.523221969604492, "global_step": 128328, "epoch": 3055} {"train_loss": -6.589459419250488, "global_step": 128329, "epoch": 3055} {"train_loss": -6.630442142486572, "global_step": 128330, "epoch": 3055} {"train_loss": -6.614723205566406, "global_step": 128331, "epoch": 3055} {"train_loss": -6.435824394226074, "global_step": 128332, "epoch": 3055} {"train_loss": -6.711899757385254, "global_step": 128333, "epoch": 3055} {"train_loss": -6.495964050292969, "global_step": 128334, "epoch": 3055} {"train_loss": -6.454873561859131, "global_step": 128335, "epoch": 3055} {"train_loss": -6.538937568664551, "global_step": 128336, "epoch": 3055} {"train_loss": -6.49491548538208, "global_step": 128337, "epoch": 3055} {"train_loss": -6.577709197998047, "global_step": 128338, "epoch": 3055} {"train_loss": -6.689189434051514, "global_step": 128339, "epoch": 3055} {"train_loss": -6.481242656707764, "global_step": 128340, "epoch": 3055} {"train_loss": -6.509011268615723, "global_step": 128341, "epoch": 3055} {"train_loss": -6.593114852905273, "global_step": 128342, "epoch": 3055} {"train_loss": -6.634818077087402, "global_step": 128343, "epoch": 3055} {"train_loss": -6.642405986785889, "global_step": 128344, "epoch": 3055} {"train_loss": -6.617002487182617, "global_step": 128345, "epoch": 3055} {"train_loss": -6.705409526824951, "global_step": 128346, "epoch": 3055} {"train_loss": -6.5235981941223145, "global_step": 128347, "epoch": 3055} {"train_loss": -6.6470136642456055, "global_step": 128348, "epoch": 3055} {"train_loss": -6.67592191696167, "global_step": 128349, "epoch": 3055} {"train_loss": -6.468440532684326, "global_step": 128350, "epoch": 3055} {"train_loss": -6.609801156180246, "global_step": 128351, "epoch": 3055, "val_loss": 68116.1796875} {"train_loss": -6.566102027893066, "global_step": 128352, "epoch": 3056} {"train_loss": -6.519269943237305, "global_step": 128353, "epoch": 3056} {"train_loss": -6.578927040100098, "global_step": 128354, "epoch": 3056} {"train_loss": -6.538877487182617, "global_step": 128355, "epoch": 3056} {"train_loss": -6.658571243286133, "global_step": 128356, "epoch": 3056} {"train_loss": -6.566671371459961, "global_step": 128357, "epoch": 3056} {"train_loss": -6.553073883056641, "global_step": 128358, "epoch": 3056} {"train_loss": -6.6545000076293945, "global_step": 128359, "epoch": 3056} {"train_loss": -6.533657073974609, "global_step": 128360, "epoch": 3056} {"train_loss": -6.7001142501831055, "global_step": 128361, "epoch": 3056} {"train_loss": -6.606576919555664, "global_step": 128362, "epoch": 3056} {"train_loss": -6.538066864013672, "global_step": 128363, "epoch": 3056} {"train_loss": -6.729313850402832, "global_step": 128364, "epoch": 3056} {"train_loss": -6.469337463378906, "global_step": 128365, "epoch": 3056} {"train_loss": -6.65355920791626, "global_step": 128366, "epoch": 3056} {"train_loss": -6.5763726234436035, "global_step": 128367, "epoch": 3056} {"train_loss": -6.612977027893066, "global_step": 128368, "epoch": 3056} {"train_loss": -6.586098670959473, "global_step": 128369, "epoch": 3056} {"train_loss": -6.598553657531738, "global_step": 128370, "epoch": 3056} {"train_loss": -6.463050365447998, "global_step": 128371, "epoch": 3056} {"train_loss": -6.572055816650391, "global_step": 128372, "epoch": 3056} {"train_loss": -6.700725555419922, "global_step": 128373, "epoch": 3056} {"train_loss": -6.619631767272949, "global_step": 128374, "epoch": 3056} {"train_loss": -6.557908535003662, "global_step": 128375, "epoch": 3056} {"train_loss": -6.657575607299805, "global_step": 128376, "epoch": 3056} {"train_loss": -6.739293575286865, "global_step": 128377, "epoch": 3056} {"train_loss": -6.681269645690918, "global_step": 128378, "epoch": 3056} {"train_loss": -6.577058792114258, "global_step": 128379, "epoch": 3056} {"train_loss": -6.679006576538086, "global_step": 128380, "epoch": 3056} {"train_loss": -6.60577392578125, "global_step": 128381, "epoch": 3056} {"train_loss": -6.609897136688232, "global_step": 128382, "epoch": 3056} {"train_loss": -6.6170573234558105, "global_step": 128383, "epoch": 3056} {"train_loss": -6.5139875411987305, "global_step": 128384, "epoch": 3056} {"train_loss": -6.752828121185303, "global_step": 128385, "epoch": 3056} {"train_loss": -6.685724258422852, "global_step": 128386, "epoch": 3056} {"train_loss": -6.636239051818848, "global_step": 128387, "epoch": 3056} {"train_loss": -6.698987007141113, "global_step": 128388, "epoch": 3056} {"train_loss": -6.66997766494751, "global_step": 128389, "epoch": 3056} {"train_loss": -6.555537223815918, "global_step": 128390, "epoch": 3056} {"train_loss": -6.68549919128418, "global_step": 128391, "epoch": 3056} {"train_loss": -6.578675270080566, "global_step": 128392, "epoch": 3056} {"train_loss": -6.614998896916707, "global_step": 128393, "epoch": 3056, "val_loss": 68016.59375} {"train_loss": -6.579080581665039, "global_step": 128394, "epoch": 3057} {"train_loss": -6.640522480010986, "global_step": 128395, "epoch": 3057} {"train_loss": -6.622834205627441, "global_step": 128396, "epoch": 3057} {"train_loss": -6.631814002990723, "global_step": 128397, "epoch": 3057} {"train_loss": -6.654085159301758, "global_step": 128398, "epoch": 3057} {"train_loss": -6.588797092437744, "global_step": 128399, "epoch": 3057} {"train_loss": -6.661715984344482, "global_step": 128400, "epoch": 3057} {"train_loss": -6.60045051574707, "global_step": 128401, "epoch": 3057} {"train_loss": -6.63822603225708, "global_step": 128402, "epoch": 3057} {"train_loss": -6.7412872314453125, "global_step": 128403, "epoch": 3057} {"train_loss": -6.590078353881836, "global_step": 128404, "epoch": 3057} {"train_loss": -6.624605178833008, "global_step": 128405, "epoch": 3057} {"train_loss": -6.72727108001709, "global_step": 128406, "epoch": 3057} {"train_loss": -6.597497463226318, "global_step": 128407, "epoch": 3057} {"train_loss": -6.637094497680664, "global_step": 128408, "epoch": 3057} {"train_loss": -6.6562652587890625, "global_step": 128409, "epoch": 3057} {"train_loss": -6.738739013671875, "global_step": 128410, "epoch": 3057} {"train_loss": -6.731052398681641, "global_step": 128411, "epoch": 3057} {"train_loss": -6.62973690032959, "global_step": 128412, "epoch": 3057} {"train_loss": -6.7269134521484375, "global_step": 128413, "epoch": 3057} {"train_loss": -6.582663536071777, "global_step": 128414, "epoch": 3057} {"train_loss": -6.627314567565918, "global_step": 128415, "epoch": 3057} {"train_loss": -6.761279106140137, "global_step": 128416, "epoch": 3057} {"train_loss": -6.57656192779541, "global_step": 128417, "epoch": 3057} {"train_loss": -6.601269245147705, "global_step": 128418, "epoch": 3057} {"train_loss": -6.663066864013672, "global_step": 128419, "epoch": 3057} {"train_loss": -6.656704425811768, "global_step": 128420, "epoch": 3057} {"train_loss": -6.5515618324279785, "global_step": 128421, "epoch": 3057} {"train_loss": -6.694524765014648, "global_step": 128422, "epoch": 3057} {"train_loss": -6.632648468017578, "global_step": 128423, "epoch": 3057} {"train_loss": -6.456847667694092, "global_step": 128424, "epoch": 3057} {"train_loss": -6.69110631942749, "global_step": 128425, "epoch": 3057} {"train_loss": -6.584418296813965, "global_step": 128426, "epoch": 3057} {"train_loss": -6.458190441131592, "global_step": 128427, "epoch": 3057} {"train_loss": -6.5125908851623535, "global_step": 128428, "epoch": 3057} {"train_loss": -6.580704212188721, "global_step": 128429, "epoch": 3057} {"train_loss": -6.531406402587891, "global_step": 128430, "epoch": 3057} {"train_loss": -6.590364456176758, "global_step": 128431, "epoch": 3057} {"train_loss": -6.2942423820495605, "global_step": 128432, "epoch": 3057} {"train_loss": -6.432966232299805, "global_step": 128433, "epoch": 3057} {"train_loss": -6.486695766448975, "global_step": 128434, "epoch": 3057} {"train_loss": -6.603745074499221, "global_step": 128435, "epoch": 3057, "val_loss": 68339.0} {"train_loss": -6.594178199768066, "global_step": 128436, "epoch": 3058} {"train_loss": -6.569792747497559, "global_step": 128437, "epoch": 3058} {"train_loss": -6.591669082641602, "global_step": 128438, "epoch": 3058} {"train_loss": -6.464879989624023, "global_step": 128439, "epoch": 3058} {"train_loss": -6.54160213470459, "global_step": 128440, "epoch": 3058} {"train_loss": -6.426733016967773, "global_step": 128441, "epoch": 3058} {"train_loss": -6.522021293640137, "global_step": 128442, "epoch": 3058} {"train_loss": -6.547135353088379, "global_step": 128443, "epoch": 3058} {"train_loss": -6.520059585571289, "global_step": 128444, "epoch": 3058} {"train_loss": -6.498861312866211, "global_step": 128445, "epoch": 3058} {"train_loss": -6.607308387756348, "global_step": 128446, "epoch": 3058} {"train_loss": -6.60526180267334, "global_step": 128447, "epoch": 3058} {"train_loss": -6.59992790222168, "global_step": 128448, "epoch": 3058} {"train_loss": -6.479464054107666, "global_step": 128449, "epoch": 3058} {"train_loss": -6.630857944488525, "global_step": 128450, "epoch": 3058} {"train_loss": -6.497069358825684, "global_step": 128451, "epoch": 3058} {"train_loss": -6.572766304016113, "global_step": 128452, "epoch": 3058} {"train_loss": -6.602105140686035, "global_step": 128453, "epoch": 3058} {"train_loss": -6.569666862487793, "global_step": 128454, "epoch": 3058} {"train_loss": -6.5295610427856445, "global_step": 128455, "epoch": 3058} {"train_loss": -6.482504367828369, "global_step": 128456, "epoch": 3058} {"train_loss": -6.6399827003479, "global_step": 128457, "epoch": 3058} {"train_loss": -6.506770133972168, "global_step": 128458, "epoch": 3058} {"train_loss": -6.461949825286865, "global_step": 128459, "epoch": 3058} {"train_loss": -6.467175483703613, "global_step": 128460, "epoch": 3058} {"train_loss": -6.618869781494141, "global_step": 128461, "epoch": 3058} {"train_loss": -6.618828773498535, "global_step": 128462, "epoch": 3058} {"train_loss": -6.547307968139648, "global_step": 128463, "epoch": 3058} {"train_loss": -6.626077175140381, "global_step": 128464, "epoch": 3058} {"train_loss": -6.543280601501465, "global_step": 128465, "epoch": 3058} {"train_loss": -6.47650671005249, "global_step": 128466, "epoch": 3058} {"train_loss": -6.611980438232422, "global_step": 128467, "epoch": 3058} {"train_loss": -6.594446182250977, "global_step": 128468, "epoch": 3058} {"train_loss": -6.608607292175293, "global_step": 128469, "epoch": 3058} {"train_loss": -6.579378128051758, "global_step": 128470, "epoch": 3058} {"train_loss": -6.599184989929199, "global_step": 128471, "epoch": 3058} {"train_loss": -6.664803504943848, "global_step": 128472, "epoch": 3058} {"train_loss": -6.521735191345215, "global_step": 128473, "epoch": 3058} {"train_loss": -6.646885871887207, "global_step": 128474, "epoch": 3058} {"train_loss": -6.663887977600098, "global_step": 128475, "epoch": 3058} {"train_loss": -6.595041275024414, "global_step": 128476, "epoch": 3058} {"train_loss": -6.564600592567807, "global_step": 128477, "epoch": 3058, "val_loss": 68140.625} {"train_loss": -6.575189590454102, "global_step": 128478, "epoch": 3059} {"train_loss": -6.522897243499756, "global_step": 128479, "epoch": 3059} {"train_loss": -6.574287414550781, "global_step": 128480, "epoch": 3059} {"train_loss": -6.673029899597168, "global_step": 128481, "epoch": 3059} {"train_loss": -6.666960716247559, "global_step": 128482, "epoch": 3059} {"train_loss": -6.5443196296691895, "global_step": 128483, "epoch": 3059} {"train_loss": -6.557931900024414, "global_step": 128484, "epoch": 3059} {"train_loss": -6.5348615646362305, "global_step": 128485, "epoch": 3059} {"train_loss": -6.5970540046691895, "global_step": 128486, "epoch": 3059} {"train_loss": -6.665820598602295, "global_step": 128487, "epoch": 3059} {"train_loss": -6.60179328918457, "global_step": 128488, "epoch": 3059} {"train_loss": -6.486684799194336, "global_step": 128489, "epoch": 3059} {"train_loss": -6.615321159362793, "global_step": 128490, "epoch": 3059} {"train_loss": -6.565369606018066, "global_step": 128491, "epoch": 3059} {"train_loss": -6.537768840789795, "global_step": 128492, "epoch": 3059} {"train_loss": -6.616071701049805, "global_step": 128493, "epoch": 3059} {"train_loss": -6.5013275146484375, "global_step": 128494, "epoch": 3059} {"train_loss": -6.615400314331055, "global_step": 128495, "epoch": 3059} {"train_loss": -6.4953460693359375, "global_step": 128496, "epoch": 3059} {"train_loss": -6.570106506347656, "global_step": 128497, "epoch": 3059} {"train_loss": -6.526764869689941, "global_step": 128498, "epoch": 3059} {"train_loss": -6.534535884857178, "global_step": 128499, "epoch": 3059} {"train_loss": -6.600864887237549, "global_step": 128500, "epoch": 3059} {"train_loss": -6.539602279663086, "global_step": 128501, "epoch": 3059} {"train_loss": -6.598886966705322, "global_step": 128502, "epoch": 3059} {"train_loss": -6.569463729858398, "global_step": 128503, "epoch": 3059} {"train_loss": -6.596181869506836, "global_step": 128504, "epoch": 3059} {"train_loss": -6.633117198944092, "global_step": 128505, "epoch": 3059} {"train_loss": -6.645613670349121, "global_step": 128506, "epoch": 3059} {"train_loss": -6.674007415771484, "global_step": 128507, "epoch": 3059} {"train_loss": -6.656439781188965, "global_step": 128508, "epoch": 3059} {"train_loss": -6.580048561096191, "global_step": 128509, "epoch": 3059} {"train_loss": -6.664636135101318, "global_step": 128510, "epoch": 3059} {"train_loss": -6.636043548583984, "global_step": 128511, "epoch": 3059} {"train_loss": -6.609004020690918, "global_step": 128512, "epoch": 3059} {"train_loss": -6.643585205078125, "global_step": 128513, "epoch": 3059} {"train_loss": -6.564354419708252, "global_step": 128514, "epoch": 3059} {"train_loss": -6.629512310028076, "global_step": 128515, "epoch": 3059} {"train_loss": -6.547101020812988, "global_step": 128516, "epoch": 3059} {"train_loss": -6.706061363220215, "global_step": 128517, "epoch": 3059} {"train_loss": -6.588133811950684, "global_step": 128518, "epoch": 3059} {"train_loss": -6.591134639013381, "global_step": 128519, "epoch": 3059, "val_loss": 67900.390625} {"train_loss": -6.627449989318848, "global_step": 128520, "epoch": 3060} {"train_loss": -6.670227527618408, "global_step": 128521, "epoch": 3060} {"train_loss": -6.5986857414245605, "global_step": 128522, "epoch": 3060} {"train_loss": -6.553601264953613, "global_step": 128523, "epoch": 3060} {"train_loss": -6.611075401306152, "global_step": 128524, "epoch": 3060} {"train_loss": -6.726746082305908, "global_step": 128525, "epoch": 3060} {"train_loss": -6.615573406219482, "global_step": 128526, "epoch": 3060} {"train_loss": -6.657986164093018, "global_step": 128527, "epoch": 3060} {"train_loss": -6.579641342163086, "global_step": 128528, "epoch": 3060} {"train_loss": -6.696987152099609, "global_step": 128529, "epoch": 3060} {"train_loss": -6.660434722900391, "global_step": 128530, "epoch": 3060} {"train_loss": -6.62434196472168, "global_step": 128531, "epoch": 3060} {"train_loss": -6.511014938354492, "global_step": 128532, "epoch": 3060} {"train_loss": -6.711653709411621, "global_step": 128533, "epoch": 3060} {"train_loss": -6.682224273681641, "global_step": 128534, "epoch": 3060} {"train_loss": -6.683157444000244, "global_step": 128535, "epoch": 3060} {"train_loss": -6.7085957527160645, "global_step": 128536, "epoch": 3060} {"train_loss": -6.567617416381836, "global_step": 128537, "epoch": 3060} {"train_loss": -6.6488237380981445, "global_step": 128538, "epoch": 3060} {"train_loss": -6.583608627319336, "global_step": 128539, "epoch": 3060} {"train_loss": -6.666712760925293, "global_step": 128540, "epoch": 3060} {"train_loss": -6.673487663269043, "global_step": 128541, "epoch": 3060} {"train_loss": -6.559025764465332, "global_step": 128542, "epoch": 3060} {"train_loss": -6.570000648498535, "global_step": 128543, "epoch": 3060} {"train_loss": -6.542983055114746, "global_step": 128544, "epoch": 3060} {"train_loss": -6.752985000610352, "global_step": 128545, "epoch": 3060} {"train_loss": -6.584413528442383, "global_step": 128546, "epoch": 3060} {"train_loss": -6.462339401245117, "global_step": 128547, "epoch": 3060} {"train_loss": -6.70150089263916, "global_step": 128548, "epoch": 3060} {"train_loss": -6.511148452758789, "global_step": 128549, "epoch": 3060} {"train_loss": -6.674931526184082, "global_step": 128550, "epoch": 3060} {"train_loss": -6.627158164978027, "global_step": 128551, "epoch": 3060} {"train_loss": -6.693740367889404, "global_step": 128552, "epoch": 3060} {"train_loss": -6.663743495941162, "global_step": 128553, "epoch": 3060} {"train_loss": -6.702144145965576, "global_step": 128554, "epoch": 3060} {"train_loss": -6.749654769897461, "global_step": 128555, "epoch": 3060} {"train_loss": -6.823614120483398, "global_step": 128556, "epoch": 3060} {"train_loss": -6.6465020179748535, "global_step": 128557, "epoch": 3060} {"train_loss": -6.667009353637695, "global_step": 128558, "epoch": 3060} {"train_loss": -6.735990047454834, "global_step": 128559, "epoch": 3060} {"train_loss": -6.750167369842529, "global_step": 128560, "epoch": 3060} {"train_loss": -6.647364457448323, "global_step": 128561, "epoch": 3060, "val_loss": 68141.984375} {"train_loss": -6.616085052490234, "global_step": 128562, "epoch": 3061} {"train_loss": -6.73040771484375, "global_step": 128563, "epoch": 3061} {"train_loss": -6.697010040283203, "global_step": 128564, "epoch": 3061} {"train_loss": -6.5928053855896, "global_step": 128565, "epoch": 3061} {"train_loss": -6.528628349304199, "global_step": 128566, "epoch": 3061} {"train_loss": -6.590991020202637, "global_step": 128567, "epoch": 3061} {"train_loss": -6.722641468048096, "global_step": 128568, "epoch": 3061} {"train_loss": -6.648074626922607, "global_step": 128569, "epoch": 3061} {"train_loss": -6.574563980102539, "global_step": 128570, "epoch": 3061} {"train_loss": -6.766798973083496, "global_step": 128571, "epoch": 3061} {"train_loss": -6.6374430656433105, "global_step": 128572, "epoch": 3061} {"train_loss": -6.480464935302734, "global_step": 128573, "epoch": 3061} {"train_loss": -6.599600791931152, "global_step": 128574, "epoch": 3061} {"train_loss": -6.606101036071777, "global_step": 128575, "epoch": 3061} {"train_loss": -6.530553340911865, "global_step": 128576, "epoch": 3061} {"train_loss": -6.616349220275879, "global_step": 128577, "epoch": 3061} {"train_loss": -6.586921215057373, "global_step": 128578, "epoch": 3061} {"train_loss": -6.53877067565918, "global_step": 128579, "epoch": 3061} {"train_loss": -6.586237907409668, "global_step": 128580, "epoch": 3061} {"train_loss": -6.726015567779541, "global_step": 128581, "epoch": 3061} {"train_loss": -6.607094764709473, "global_step": 128582, "epoch": 3061} {"train_loss": -6.593917369842529, "global_step": 128583, "epoch": 3061} {"train_loss": -6.534916877746582, "global_step": 128584, "epoch": 3061} {"train_loss": -6.6146745681762695, "global_step": 128585, "epoch": 3061} {"train_loss": -6.475005626678467, "global_step": 128586, "epoch": 3061} {"train_loss": -6.509744644165039, "global_step": 128587, "epoch": 3061} {"train_loss": -6.590965270996094, "global_step": 128588, "epoch": 3061} {"train_loss": -6.441278457641602, "global_step": 128589, "epoch": 3061} {"train_loss": -6.633146286010742, "global_step": 128590, "epoch": 3061} {"train_loss": -6.503091812133789, "global_step": 128591, "epoch": 3061} {"train_loss": -6.4992570877075195, "global_step": 128592, "epoch": 3061} {"train_loss": -6.582185745239258, "global_step": 128593, "epoch": 3061} {"train_loss": -6.576873302459717, "global_step": 128594, "epoch": 3061} {"train_loss": -6.519709587097168, "global_step": 128595, "epoch": 3061} {"train_loss": -6.478574752807617, "global_step": 128596, "epoch": 3061} {"train_loss": -6.611154079437256, "global_step": 128597, "epoch": 3061} {"train_loss": -6.558071136474609, "global_step": 128598, "epoch": 3061} {"train_loss": -6.578544616699219, "global_step": 128599, "epoch": 3061} {"train_loss": -6.6002068519592285, "global_step": 128600, "epoch": 3061} {"train_loss": -6.5565266609191895, "global_step": 128601, "epoch": 3061} {"train_loss": -6.484447479248047, "global_step": 128602, "epoch": 3061} {"train_loss": -6.584052528653826, "global_step": 128603, "epoch": 3061, "val_loss": 68118.96875} {"train_loss": -6.565862655639648, "global_step": 128604, "epoch": 3062} {"train_loss": -6.752338886260986, "global_step": 128605, "epoch": 3062} {"train_loss": -6.533123016357422, "global_step": 128606, "epoch": 3062} {"train_loss": -6.72163724899292, "global_step": 128607, "epoch": 3062} {"train_loss": -6.559743881225586, "global_step": 128608, "epoch": 3062} {"train_loss": -6.567255020141602, "global_step": 128609, "epoch": 3062} {"train_loss": -6.701022148132324, "global_step": 128610, "epoch": 3062} {"train_loss": -6.658607482910156, "global_step": 128611, "epoch": 3062} {"train_loss": -6.646367073059082, "global_step": 128612, "epoch": 3062} {"train_loss": -6.635659217834473, "global_step": 128613, "epoch": 3062} {"train_loss": -6.649312973022461, "global_step": 128614, "epoch": 3062} {"train_loss": -6.529860496520996, "global_step": 128615, "epoch": 3062} {"train_loss": -6.531756401062012, "global_step": 128616, "epoch": 3062} {"train_loss": -6.573502063751221, "global_step": 128617, "epoch": 3062} {"train_loss": -6.59774923324585, "global_step": 128618, "epoch": 3062} {"train_loss": -6.578315734863281, "global_step": 128619, "epoch": 3062} {"train_loss": -6.607306003570557, "global_step": 128620, "epoch": 3062} {"train_loss": -6.589555740356445, "global_step": 128621, "epoch": 3062} {"train_loss": -6.6458587646484375, "global_step": 128622, "epoch": 3062} {"train_loss": -6.603237152099609, "global_step": 128623, "epoch": 3062} {"train_loss": -6.613659858703613, "global_step": 128624, "epoch": 3062} {"train_loss": -6.638847827911377, "global_step": 128625, "epoch": 3062} {"train_loss": -6.674593925476074, "global_step": 128626, "epoch": 3062} {"train_loss": -6.687317848205566, "global_step": 128627, "epoch": 3062} {"train_loss": -6.670441627502441, "global_step": 128628, "epoch": 3062} {"train_loss": -6.611415863037109, "global_step": 128629, "epoch": 3062} {"train_loss": -6.706279754638672, "global_step": 128630, "epoch": 3062} {"train_loss": -6.722385883331299, "global_step": 128631, "epoch": 3062} {"train_loss": -6.579694747924805, "global_step": 128632, "epoch": 3062} {"train_loss": -6.581396102905273, "global_step": 128633, "epoch": 3062} {"train_loss": -6.601197242736816, "global_step": 128634, "epoch": 3062} {"train_loss": -6.593576431274414, "global_step": 128635, "epoch": 3062} {"train_loss": -6.675886154174805, "global_step": 128636, "epoch": 3062} {"train_loss": -6.541308403015137, "global_step": 128637, "epoch": 3062} {"train_loss": -6.582286834716797, "global_step": 128638, "epoch": 3062} {"train_loss": -6.624703407287598, "global_step": 128639, "epoch": 3062} {"train_loss": -6.445316314697266, "global_step": 128640, "epoch": 3062} {"train_loss": -6.608126640319824, "global_step": 128641, "epoch": 3062} {"train_loss": -6.614268779754639, "global_step": 128642, "epoch": 3062} {"train_loss": -6.452902793884277, "global_step": 128643, "epoch": 3062} {"train_loss": -6.617981910705566, "global_step": 128644, "epoch": 3062} {"train_loss": -6.611912454877581, "global_step": 128645, "epoch": 3062, "val_loss": 68211.3203125} {"train_loss": -6.658673286437988, "global_step": 128646, "epoch": 3063} {"train_loss": -6.642028331756592, "global_step": 128647, "epoch": 3063} {"train_loss": -6.468896389007568, "global_step": 128648, "epoch": 3063} {"train_loss": -6.590388298034668, "global_step": 128649, "epoch": 3063} {"train_loss": -6.586047649383545, "global_step": 128650, "epoch": 3063} {"train_loss": -6.560454368591309, "global_step": 128651, "epoch": 3063} {"train_loss": -6.561476707458496, "global_step": 128652, "epoch": 3063} {"train_loss": -6.486958026885986, "global_step": 128653, "epoch": 3063} {"train_loss": -6.644783020019531, "global_step": 128654, "epoch": 3063} {"train_loss": -6.5360002517700195, "global_step": 128655, "epoch": 3063} {"train_loss": -6.6709184646606445, "global_step": 128656, "epoch": 3063} {"train_loss": -6.634615898132324, "global_step": 128657, "epoch": 3063} {"train_loss": -6.534764289855957, "global_step": 128658, "epoch": 3063} {"train_loss": -6.563830852508545, "global_step": 128659, "epoch": 3063} {"train_loss": -6.48906946182251, "global_step": 128660, "epoch": 3063} {"train_loss": -6.594414710998535, "global_step": 128661, "epoch": 3063} {"train_loss": -6.592329025268555, "global_step": 128662, "epoch": 3063} {"train_loss": -6.567547798156738, "global_step": 128663, "epoch": 3063} {"train_loss": -6.579557418823242, "global_step": 128664, "epoch": 3063} {"train_loss": -6.623541831970215, "global_step": 128665, "epoch": 3063} {"train_loss": -6.55744743347168, "global_step": 128666, "epoch": 3063} {"train_loss": -6.559309959411621, "global_step": 128667, "epoch": 3063} {"train_loss": -6.6046576499938965, "global_step": 128668, "epoch": 3063} {"train_loss": -6.52772855758667, "global_step": 128669, "epoch": 3063} {"train_loss": -6.605713844299316, "global_step": 128670, "epoch": 3063} {"train_loss": -6.578971862792969, "global_step": 128671, "epoch": 3063} {"train_loss": -6.560135841369629, "global_step": 128672, "epoch": 3063} {"train_loss": -6.6156392097473145, "global_step": 128673, "epoch": 3063} {"train_loss": -6.454248905181885, "global_step": 128674, "epoch": 3063} {"train_loss": -6.593345642089844, "global_step": 128675, "epoch": 3063} {"train_loss": -6.604061603546143, "global_step": 128676, "epoch": 3063} {"train_loss": -6.560617446899414, "global_step": 128677, "epoch": 3063} {"train_loss": -6.669602870941162, "global_step": 128678, "epoch": 3063} {"train_loss": -6.562899589538574, "global_step": 128679, "epoch": 3063} {"train_loss": -6.4406418800354, "global_step": 128680, "epoch": 3063} {"train_loss": -6.642282009124756, "global_step": 128681, "epoch": 3063} {"train_loss": -6.4594197273254395, "global_step": 128682, "epoch": 3063} {"train_loss": -6.672790050506592, "global_step": 128683, "epoch": 3063} {"train_loss": -6.533177852630615, "global_step": 128684, "epoch": 3063} {"train_loss": -6.566847324371338, "global_step": 128685, "epoch": 3063} {"train_loss": -6.644674301147461, "global_step": 128686, "epoch": 3063} {"train_loss": -6.574735085169475, "global_step": 128687, "epoch": 3063, "val_loss": 68204.4453125} {"train_loss": -6.7046918869018555, "global_step": 128688, "epoch": 3064} {"train_loss": -6.493750095367432, "global_step": 128689, "epoch": 3064} {"train_loss": -6.605245590209961, "global_step": 128690, "epoch": 3064} {"train_loss": -6.474481582641602, "global_step": 128691, "epoch": 3064} {"train_loss": -6.378782272338867, "global_step": 128692, "epoch": 3064} {"train_loss": -6.681894302368164, "global_step": 128693, "epoch": 3064} {"train_loss": -6.558009147644043, "global_step": 128694, "epoch": 3064} {"train_loss": -6.472455024719238, "global_step": 128695, "epoch": 3064} {"train_loss": -6.529531478881836, "global_step": 128696, "epoch": 3064} {"train_loss": -6.547157287597656, "global_step": 128697, "epoch": 3064} {"train_loss": -6.502824783325195, "global_step": 128698, "epoch": 3064} {"train_loss": -6.621591567993164, "global_step": 128699, "epoch": 3064} {"train_loss": -6.477999687194824, "global_step": 128700, "epoch": 3064} {"train_loss": -6.588379859924316, "global_step": 128701, "epoch": 3064} {"train_loss": -6.644330978393555, "global_step": 128702, "epoch": 3064} {"train_loss": -6.596732139587402, "global_step": 128703, "epoch": 3064} {"train_loss": -6.503961563110352, "global_step": 128704, "epoch": 3064} {"train_loss": -6.4963226318359375, "global_step": 128705, "epoch": 3064} {"train_loss": -6.550278663635254, "global_step": 128706, "epoch": 3064} {"train_loss": -6.540905952453613, "global_step": 128707, "epoch": 3064} {"train_loss": -6.525793075561523, "global_step": 128708, "epoch": 3064} {"train_loss": -6.628459453582764, "global_step": 128709, "epoch": 3064} {"train_loss": -6.589937686920166, "global_step": 128710, "epoch": 3064} {"train_loss": -6.603928565979004, "global_step": 128711, "epoch": 3064} {"train_loss": -6.6421709060668945, "global_step": 128712, "epoch": 3064} {"train_loss": -6.451230049133301, "global_step": 128713, "epoch": 3064} {"train_loss": -6.49299955368042, "global_step": 128714, "epoch": 3064} {"train_loss": -6.472039222717285, "global_step": 128715, "epoch": 3064} {"train_loss": -6.6263532638549805, "global_step": 128716, "epoch": 3064} {"train_loss": -6.57065486907959, "global_step": 128717, "epoch": 3064} {"train_loss": -6.521820068359375, "global_step": 128718, "epoch": 3064} {"train_loss": -6.575191974639893, "global_step": 128719, "epoch": 3064} {"train_loss": -6.5562744140625, "global_step": 128720, "epoch": 3064} {"train_loss": -6.646758079528809, "global_step": 128721, "epoch": 3064} {"train_loss": -6.541557312011719, "global_step": 128722, "epoch": 3064} {"train_loss": -6.626300811767578, "global_step": 128723, "epoch": 3064} {"train_loss": -6.521578788757324, "global_step": 128724, "epoch": 3064} {"train_loss": -6.625253677368164, "global_step": 128725, "epoch": 3064} {"train_loss": -6.632251739501953, "global_step": 128726, "epoch": 3064} {"train_loss": -6.501021385192871, "global_step": 128727, "epoch": 3064} {"train_loss": -6.57449197769165, "global_step": 128728, "epoch": 3064} {"train_loss": -6.556954724448068, "global_step": 128729, "epoch": 3064, "val_loss": 68089.3125} {"train_loss": -6.608921051025391, "global_step": 128730, "epoch": 3065} {"train_loss": -6.557005882263184, "global_step": 128731, "epoch": 3065} {"train_loss": -6.491539478302002, "global_step": 128732, "epoch": 3065} {"train_loss": -6.578463077545166, "global_step": 128733, "epoch": 3065} {"train_loss": -6.650292873382568, "global_step": 128734, "epoch": 3065} {"train_loss": -6.601897239685059, "global_step": 128735, "epoch": 3065} {"train_loss": -6.455033302307129, "global_step": 128736, "epoch": 3065} {"train_loss": -6.537288665771484, "global_step": 128737, "epoch": 3065} {"train_loss": -6.495145320892334, "global_step": 128738, "epoch": 3065} {"train_loss": -6.622631072998047, "global_step": 128739, "epoch": 3065} {"train_loss": -6.66241979598999, "global_step": 128740, "epoch": 3065} {"train_loss": -6.515120506286621, "global_step": 128741, "epoch": 3065} {"train_loss": -6.576898097991943, "global_step": 128742, "epoch": 3065} {"train_loss": -6.647152900695801, "global_step": 128743, "epoch": 3065} {"train_loss": -6.51073694229126, "global_step": 128744, "epoch": 3065} {"train_loss": -6.554643154144287, "global_step": 128745, "epoch": 3065} {"train_loss": -6.6033148765563965, "global_step": 128746, "epoch": 3065} {"train_loss": -6.6461567878723145, "global_step": 128747, "epoch": 3065} {"train_loss": -6.56572961807251, "global_step": 128748, "epoch": 3065} {"train_loss": -6.6447601318359375, "global_step": 128749, "epoch": 3065} {"train_loss": -6.55131196975708, "global_step": 128750, "epoch": 3065} {"train_loss": -6.661462306976318, "global_step": 128751, "epoch": 3065} {"train_loss": -6.641051292419434, "global_step": 128752, "epoch": 3065} {"train_loss": -6.6602888107299805, "global_step": 128753, "epoch": 3065} {"train_loss": -6.650278091430664, "global_step": 128754, "epoch": 3065} {"train_loss": -6.707924842834473, "global_step": 128755, "epoch": 3065} {"train_loss": -6.741873741149902, "global_step": 128756, "epoch": 3065} {"train_loss": -6.612220764160156, "global_step": 128757, "epoch": 3065} {"train_loss": -6.684804916381836, "global_step": 128758, "epoch": 3065} {"train_loss": -6.611016273498535, "global_step": 128759, "epoch": 3065} {"train_loss": -6.652225494384766, "global_step": 128760, "epoch": 3065} {"train_loss": -6.642297744750977, "global_step": 128761, "epoch": 3065} {"train_loss": -6.611215114593506, "global_step": 128762, "epoch": 3065} {"train_loss": -6.650764465332031, "global_step": 128763, "epoch": 3065} {"train_loss": -6.68472957611084, "global_step": 128764, "epoch": 3065} {"train_loss": -6.60375452041626, "global_step": 128765, "epoch": 3065} {"train_loss": -6.641287326812744, "global_step": 128766, "epoch": 3065} {"train_loss": -6.596236228942871, "global_step": 128767, "epoch": 3065} {"train_loss": -6.533358573913574, "global_step": 128768, "epoch": 3065} {"train_loss": -6.652701377868652, "global_step": 128769, "epoch": 3065} {"train_loss": -6.570504188537598, "global_step": 128770, "epoch": 3065} {"train_loss": -6.608392386209397, "global_step": 128771, "epoch": 3065, "val_loss": 68053.0859375} {"train_loss": -6.529336929321289, "global_step": 128772, "epoch": 3066} {"train_loss": -6.620236396789551, "global_step": 128773, "epoch": 3066} {"train_loss": -6.750017166137695, "global_step": 128774, "epoch": 3066} {"train_loss": -6.661680221557617, "global_step": 128775, "epoch": 3066} {"train_loss": -6.660926818847656, "global_step": 128776, "epoch": 3066} {"train_loss": -6.719926834106445, "global_step": 128777, "epoch": 3066} {"train_loss": -6.666520595550537, "global_step": 128778, "epoch": 3066} {"train_loss": -6.607788562774658, "global_step": 128779, "epoch": 3066} {"train_loss": -6.602212905883789, "global_step": 128780, "epoch": 3066} {"train_loss": -6.613888263702393, "global_step": 128781, "epoch": 3066} {"train_loss": -6.766238212585449, "global_step": 128782, "epoch": 3066} {"train_loss": -6.685891628265381, "global_step": 128783, "epoch": 3066} {"train_loss": -6.691097259521484, "global_step": 128784, "epoch": 3066} {"train_loss": -6.592484474182129, "global_step": 128785, "epoch": 3066} {"train_loss": -6.699193000793457, "global_step": 128786, "epoch": 3066} {"train_loss": -6.609001159667969, "global_step": 128787, "epoch": 3066} {"train_loss": -6.6305036544799805, "global_step": 128788, "epoch": 3066} {"train_loss": -6.610013008117676, "global_step": 128789, "epoch": 3066} {"train_loss": -6.655091285705566, "global_step": 128790, "epoch": 3066} {"train_loss": -6.602538108825684, "global_step": 128791, "epoch": 3066} {"train_loss": -6.648691177368164, "global_step": 128792, "epoch": 3066} {"train_loss": -6.510801315307617, "global_step": 128793, "epoch": 3066} {"train_loss": -6.687722206115723, "global_step": 128794, "epoch": 3066} {"train_loss": -6.68564510345459, "global_step": 128795, "epoch": 3066} {"train_loss": -6.631426811218262, "global_step": 128796, "epoch": 3066} {"train_loss": -6.593906402587891, "global_step": 128797, "epoch": 3066} {"train_loss": -6.5780839920043945, "global_step": 128798, "epoch": 3066} {"train_loss": -6.606072425842285, "global_step": 128799, "epoch": 3066} {"train_loss": -6.656911849975586, "global_step": 128800, "epoch": 3066} {"train_loss": -6.525832176208496, "global_step": 128801, "epoch": 3066} {"train_loss": -6.7035112380981445, "global_step": 128802, "epoch": 3066} {"train_loss": -6.542900085449219, "global_step": 128803, "epoch": 3066} {"train_loss": -6.602839946746826, "global_step": 128804, "epoch": 3066} {"train_loss": -6.588308811187744, "global_step": 128805, "epoch": 3066} {"train_loss": -6.581337928771973, "global_step": 128806, "epoch": 3066} {"train_loss": -6.6554083824157715, "global_step": 128807, "epoch": 3066} {"train_loss": -6.581472396850586, "global_step": 128808, "epoch": 3066} {"train_loss": -6.671989917755127, "global_step": 128809, "epoch": 3066} {"train_loss": -6.402600288391113, "global_step": 128810, "epoch": 3066} {"train_loss": -6.420925140380859, "global_step": 128811, "epoch": 3066} {"train_loss": -6.607189178466797, "global_step": 128812, "epoch": 3066} {"train_loss": -6.619110220954532, "global_step": 128813, "epoch": 3066, "val_loss": 68091.6484375} {"train_loss": -6.600865364074707, "global_step": 128814, "epoch": 3067} {"train_loss": -6.615119457244873, "global_step": 128815, "epoch": 3067} {"train_loss": -6.532486915588379, "global_step": 128816, "epoch": 3067} {"train_loss": -6.651582717895508, "global_step": 128817, "epoch": 3067} {"train_loss": -6.557546615600586, "global_step": 128818, "epoch": 3067} {"train_loss": -6.677252769470215, "global_step": 128819, "epoch": 3067} {"train_loss": -6.6140265464782715, "global_step": 128820, "epoch": 3067} {"train_loss": -6.587385177612305, "global_step": 128821, "epoch": 3067} {"train_loss": -6.668403625488281, "global_step": 128822, "epoch": 3067} {"train_loss": -6.6337361335754395, "global_step": 128823, "epoch": 3067} {"train_loss": -6.670980453491211, "global_step": 128824, "epoch": 3067} {"train_loss": -6.653746128082275, "global_step": 128825, "epoch": 3067} {"train_loss": -6.657909393310547, "global_step": 128826, "epoch": 3067} {"train_loss": -6.636275768280029, "global_step": 128827, "epoch": 3067} {"train_loss": -6.523778915405273, "global_step": 128828, "epoch": 3067} {"train_loss": -6.7049360275268555, "global_step": 128829, "epoch": 3067} {"train_loss": -6.395648956298828, "global_step": 128830, "epoch": 3067} {"train_loss": -6.462812423706055, "global_step": 128831, "epoch": 3067} {"train_loss": -6.555210113525391, "global_step": 128832, "epoch": 3067} {"train_loss": -6.626662731170654, "global_step": 128833, "epoch": 3067} {"train_loss": -6.688800811767578, "global_step": 128834, "epoch": 3067} {"train_loss": -6.583774089813232, "global_step": 128835, "epoch": 3067} {"train_loss": -6.592768669128418, "global_step": 128836, "epoch": 3067} {"train_loss": -6.657095909118652, "global_step": 128837, "epoch": 3067} {"train_loss": -6.651174068450928, "global_step": 128838, "epoch": 3067} {"train_loss": -6.569616317749023, "global_step": 128839, "epoch": 3067} {"train_loss": -6.672496795654297, "global_step": 128840, "epoch": 3067} {"train_loss": -6.522983074188232, "global_step": 128841, "epoch": 3067} {"train_loss": -6.690084457397461, "global_step": 128842, "epoch": 3067} {"train_loss": -6.700504302978516, "global_step": 128843, "epoch": 3067} {"train_loss": -6.585916519165039, "global_step": 128844, "epoch": 3067} {"train_loss": -6.652427673339844, "global_step": 128845, "epoch": 3067} {"train_loss": -6.7622389793396, "global_step": 128846, "epoch": 3067} {"train_loss": -6.626355171203613, "global_step": 128847, "epoch": 3067} {"train_loss": -6.748542785644531, "global_step": 128848, "epoch": 3067} {"train_loss": -6.61685848236084, "global_step": 128849, "epoch": 3067} {"train_loss": -6.60958194732666, "global_step": 128850, "epoch": 3067} {"train_loss": -6.564805030822754, "global_step": 128851, "epoch": 3067} {"train_loss": -6.617865085601807, "global_step": 128852, "epoch": 3067} {"train_loss": -6.607568740844727, "global_step": 128853, "epoch": 3067} {"train_loss": -6.672499656677246, "global_step": 128854, "epoch": 3067} {"train_loss": -6.62295058795384, "global_step": 128855, "epoch": 3067, "val_loss": 68109.1640625} {"train_loss": -6.716805458068848, "global_step": 128856, "epoch": 3068} {"train_loss": -6.713954925537109, "global_step": 128857, "epoch": 3068} {"train_loss": -6.704781532287598, "global_step": 128858, "epoch": 3068} {"train_loss": -6.795974254608154, "global_step": 128859, "epoch": 3068} {"train_loss": -6.635223388671875, "global_step": 128860, "epoch": 3068} {"train_loss": -6.60735559463501, "global_step": 128861, "epoch": 3068} {"train_loss": -6.585977554321289, "global_step": 128862, "epoch": 3068} {"train_loss": -6.729454517364502, "global_step": 128863, "epoch": 3068} {"train_loss": -6.691370487213135, "global_step": 128864, "epoch": 3068} {"train_loss": -6.468851566314697, "global_step": 128865, "epoch": 3068} {"train_loss": -6.697337627410889, "global_step": 128866, "epoch": 3068} {"train_loss": -6.717225074768066, "global_step": 128867, "epoch": 3068} {"train_loss": -6.67547607421875, "global_step": 128868, "epoch": 3068} {"train_loss": -6.5957489013671875, "global_step": 128869, "epoch": 3068} {"train_loss": -6.551942825317383, "global_step": 128870, "epoch": 3068} {"train_loss": -6.607987403869629, "global_step": 128871, "epoch": 3068} {"train_loss": -6.56096076965332, "global_step": 128872, "epoch": 3068} {"train_loss": -6.523536682128906, "global_step": 128873, "epoch": 3068} {"train_loss": -6.571094036102295, "global_step": 128874, "epoch": 3068} {"train_loss": -6.654253005981445, "global_step": 128875, "epoch": 3068} {"train_loss": -6.584624290466309, "global_step": 128876, "epoch": 3068} {"train_loss": -6.602006912231445, "global_step": 128877, "epoch": 3068} {"train_loss": -6.576603889465332, "global_step": 128878, "epoch": 3068} {"train_loss": -6.6015849113464355, "global_step": 128879, "epoch": 3068} {"train_loss": -6.594934463500977, "global_step": 128880, "epoch": 3068} {"train_loss": -6.575308799743652, "global_step": 128881, "epoch": 3068} {"train_loss": -6.486736297607422, "global_step": 128882, "epoch": 3068} {"train_loss": -6.574256896972656, "global_step": 128883, "epoch": 3068} {"train_loss": -6.601348400115967, "global_step": 128884, "epoch": 3068} {"train_loss": -6.5062971115112305, "global_step": 128885, "epoch": 3068} {"train_loss": -6.641810417175293, "global_step": 128886, "epoch": 3068} {"train_loss": -6.468932628631592, "global_step": 128887, "epoch": 3068} {"train_loss": -6.675260066986084, "global_step": 128888, "epoch": 3068} {"train_loss": -6.616153717041016, "global_step": 128889, "epoch": 3068} {"train_loss": -6.603615760803223, "global_step": 128890, "epoch": 3068} {"train_loss": -6.780716896057129, "global_step": 128891, "epoch": 3068} {"train_loss": -6.6289191246032715, "global_step": 128892, "epoch": 3068} {"train_loss": -6.657015800476074, "global_step": 128893, "epoch": 3068} {"train_loss": -6.616416931152344, "global_step": 128894, "epoch": 3068} {"train_loss": -6.562620162963867, "global_step": 128895, "epoch": 3068} {"train_loss": -6.681097030639648, "global_step": 128896, "epoch": 3068} {"train_loss": -6.618271975290208, "global_step": 128897, "epoch": 3068, "val_loss": 68196.1640625} {"train_loss": -6.646533966064453, "global_step": 128898, "epoch": 3069} {"train_loss": -6.654475688934326, "global_step": 128899, "epoch": 3069} {"train_loss": -6.418611526489258, "global_step": 128900, "epoch": 3069} {"train_loss": -6.574188232421875, "global_step": 128901, "epoch": 3069} {"train_loss": -6.523441791534424, "global_step": 128902, "epoch": 3069} {"train_loss": -6.526286602020264, "global_step": 128903, "epoch": 3069} {"train_loss": -6.5967793464660645, "global_step": 128904, "epoch": 3069} {"train_loss": -6.596467018127441, "global_step": 128905, "epoch": 3069} {"train_loss": -6.464655876159668, "global_step": 128906, "epoch": 3069} {"train_loss": -6.608806133270264, "global_step": 128907, "epoch": 3069} {"train_loss": -6.60093879699707, "global_step": 128908, "epoch": 3069} {"train_loss": -6.545707702636719, "global_step": 128909, "epoch": 3069} {"train_loss": -6.630837440490723, "global_step": 128910, "epoch": 3069} {"train_loss": -6.657656669616699, "global_step": 128911, "epoch": 3069} {"train_loss": -6.687491416931152, "global_step": 128912, "epoch": 3069} {"train_loss": -6.586417198181152, "global_step": 128913, "epoch": 3069} {"train_loss": -6.713619709014893, "global_step": 128914, "epoch": 3069} {"train_loss": -6.437975883483887, "global_step": 128915, "epoch": 3069} {"train_loss": -6.5901970863342285, "global_step": 128916, "epoch": 3069} {"train_loss": -6.723812580108643, "global_step": 128917, "epoch": 3069} {"train_loss": -6.611040115356445, "global_step": 128918, "epoch": 3069} {"train_loss": -6.615453720092773, "global_step": 128919, "epoch": 3069} {"train_loss": -6.553891181945801, "global_step": 128920, "epoch": 3069} {"train_loss": -6.521315574645996, "global_step": 128921, "epoch": 3069} {"train_loss": -6.643845081329346, "global_step": 128922, "epoch": 3069} {"train_loss": -6.568781852722168, "global_step": 128923, "epoch": 3069} {"train_loss": -6.536556243896484, "global_step": 128924, "epoch": 3069} {"train_loss": -6.6109771728515625, "global_step": 128925, "epoch": 3069} {"train_loss": -6.6064252853393555, "global_step": 128926, "epoch": 3069} {"train_loss": -6.626282691955566, "global_step": 128927, "epoch": 3069} {"train_loss": -6.634943008422852, "global_step": 128928, "epoch": 3069} {"train_loss": -6.672758102416992, "global_step": 128929, "epoch": 3069} {"train_loss": -6.6025004386901855, "global_step": 128930, "epoch": 3069} {"train_loss": -6.693668365478516, "global_step": 128931, "epoch": 3069} {"train_loss": -6.625646114349365, "global_step": 128932, "epoch": 3069} {"train_loss": -6.5329909324646, "global_step": 128933, "epoch": 3069} {"train_loss": -6.635439872741699, "global_step": 128934, "epoch": 3069} {"train_loss": -6.696920394897461, "global_step": 128935, "epoch": 3069} {"train_loss": -6.689428806304932, "global_step": 128936, "epoch": 3069} {"train_loss": -6.591375827789307, "global_step": 128937, "epoch": 3069} {"train_loss": -6.558204174041748, "global_step": 128938, "epoch": 3069} {"train_loss": -6.598232734771002, "global_step": 128939, "epoch": 3069, "val_loss": 68098.484375} {"train_loss": -6.627706527709961, "global_step": 128940, "epoch": 3070} {"train_loss": -6.604020118713379, "global_step": 128941, "epoch": 3070} {"train_loss": -6.619421005249023, "global_step": 128942, "epoch": 3070} {"train_loss": -6.625948905944824, "global_step": 128943, "epoch": 3070} {"train_loss": -6.583704948425293, "global_step": 128944, "epoch": 3070} {"train_loss": -6.580165386199951, "global_step": 128945, "epoch": 3070} {"train_loss": -6.678289890289307, "global_step": 128946, "epoch": 3070} {"train_loss": -6.601828575134277, "global_step": 128947, "epoch": 3070} {"train_loss": -6.601317405700684, "global_step": 128948, "epoch": 3070} {"train_loss": -6.586623668670654, "global_step": 128949, "epoch": 3070} {"train_loss": -6.663191795349121, "global_step": 128950, "epoch": 3070} {"train_loss": -6.720149040222168, "global_step": 128951, "epoch": 3070} {"train_loss": -6.685683727264404, "global_step": 128952, "epoch": 3070} {"train_loss": -6.5290751457214355, "global_step": 128953, "epoch": 3070} {"train_loss": -6.681793212890625, "global_step": 128954, "epoch": 3070} {"train_loss": -6.664464473724365, "global_step": 128955, "epoch": 3070} {"train_loss": -6.720821380615234, "global_step": 128956, "epoch": 3070} {"train_loss": -6.6330671310424805, "global_step": 128957, "epoch": 3070} {"train_loss": -6.8025336265563965, "global_step": 128958, "epoch": 3070} {"train_loss": -6.755354404449463, "global_step": 128959, "epoch": 3070} {"train_loss": -6.65772819519043, "global_step": 128960, "epoch": 3070} {"train_loss": -6.391197204589844, "global_step": 128961, "epoch": 3070} {"train_loss": -6.586165428161621, "global_step": 128962, "epoch": 3070} {"train_loss": -6.620811462402344, "global_step": 128963, "epoch": 3070} {"train_loss": -6.62971830368042, "global_step": 128964, "epoch": 3070} {"train_loss": -6.624432563781738, "global_step": 128965, "epoch": 3070} {"train_loss": -6.6461639404296875, "global_step": 128966, "epoch": 3070} {"train_loss": -6.436017036437988, "global_step": 128967, "epoch": 3070} {"train_loss": -6.571194648742676, "global_step": 128968, "epoch": 3070} {"train_loss": -6.5696024894714355, "global_step": 128969, "epoch": 3070} {"train_loss": -6.572605133056641, "global_step": 128970, "epoch": 3070} {"train_loss": -6.649796485900879, "global_step": 128971, "epoch": 3070} {"train_loss": -6.449241638183594, "global_step": 128972, "epoch": 3070} {"train_loss": -6.620589733123779, "global_step": 128973, "epoch": 3070} {"train_loss": -6.503066539764404, "global_step": 128974, "epoch": 3070} {"train_loss": -6.651065349578857, "global_step": 128975, "epoch": 3070} {"train_loss": -6.662053108215332, "global_step": 128976, "epoch": 3070} {"train_loss": -6.650653839111328, "global_step": 128977, "epoch": 3070} {"train_loss": -6.729548931121826, "global_step": 128978, "epoch": 3070} {"train_loss": -6.529420852661133, "global_step": 128979, "epoch": 3070} {"train_loss": -6.658604145050049, "global_step": 128980, "epoch": 3070} {"train_loss": -6.621342431931269, "global_step": 128981, "epoch": 3070, "val_loss": 68163.4921875} {"train_loss": -6.6615095138549805, "global_step": 128982, "epoch": 3071} {"train_loss": -6.595600128173828, "global_step": 128983, "epoch": 3071} {"train_loss": -6.594697952270508, "global_step": 128984, "epoch": 3071} {"train_loss": -6.578890323638916, "global_step": 128985, "epoch": 3071} {"train_loss": -6.591183662414551, "global_step": 128986, "epoch": 3071} {"train_loss": -6.612570285797119, "global_step": 128987, "epoch": 3071} {"train_loss": -6.5389404296875, "global_step": 128988, "epoch": 3071} {"train_loss": -6.628826141357422, "global_step": 128989, "epoch": 3071} {"train_loss": -6.660625457763672, "global_step": 128990, "epoch": 3071} {"train_loss": -6.569181442260742, "global_step": 128991, "epoch": 3071} {"train_loss": -6.665539741516113, "global_step": 128992, "epoch": 3071} {"train_loss": -6.709907531738281, "global_step": 128993, "epoch": 3071} {"train_loss": -6.636008262634277, "global_step": 128994, "epoch": 3071} {"train_loss": -6.74194860458374, "global_step": 128995, "epoch": 3071} {"train_loss": -6.521399021148682, "global_step": 128996, "epoch": 3071} {"train_loss": -6.6393914222717285, "global_step": 128997, "epoch": 3071} {"train_loss": -6.886477470397949, "global_step": 128998, "epoch": 3071} {"train_loss": -6.547970294952393, "global_step": 128999, "epoch": 3071} {"train_loss": -6.660802841186523, "global_step": 129000, "epoch": 3071} {"train_loss": -6.666505813598633, "global_step": 129001, "epoch": 3071} {"train_loss": -6.763958930969238, "global_step": 129002, "epoch": 3071} {"train_loss": -6.73917293548584, "global_step": 129003, "epoch": 3071} {"train_loss": -6.67818546295166, "global_step": 129004, "epoch": 3071} {"train_loss": -6.647522449493408, "global_step": 129005, "epoch": 3071} {"train_loss": -6.634809494018555, "global_step": 129006, "epoch": 3071} {"train_loss": -6.773576259613037, "global_step": 129007, "epoch": 3071} {"train_loss": -6.58296012878418, "global_step": 129008, "epoch": 3071} {"train_loss": -6.519248962402344, "global_step": 129009, "epoch": 3071} {"train_loss": -6.460104942321777, "global_step": 129010, "epoch": 3071} {"train_loss": -6.629577159881592, "global_step": 129011, "epoch": 3071} {"train_loss": -6.734466075897217, "global_step": 129012, "epoch": 3071} {"train_loss": -6.615912914276123, "global_step": 129013, "epoch": 3071} {"train_loss": -6.71889591217041, "global_step": 129014, "epoch": 3071} {"train_loss": -6.636261940002441, "global_step": 129015, "epoch": 3071} {"train_loss": -6.671950817108154, "global_step": 129016, "epoch": 3071} {"train_loss": -6.476807594299316, "global_step": 129017, "epoch": 3071} {"train_loss": -6.647960662841797, "global_step": 129018, "epoch": 3071} {"train_loss": -6.642149925231934, "global_step": 129019, "epoch": 3071} {"train_loss": -6.6185431480407715, "global_step": 129020, "epoch": 3071} {"train_loss": -6.49038028717041, "global_step": 129021, "epoch": 3071} {"train_loss": -6.678839683532715, "global_step": 129022, "epoch": 3071} {"train_loss": -6.63408180645534, "global_step": 129023, "epoch": 3071, "val_loss": 68183.328125} {"train_loss": -6.657008647918701, "global_step": 129024, "epoch": 3072} {"train_loss": -6.626593112945557, "global_step": 129025, "epoch": 3072} {"train_loss": -6.5521979331970215, "global_step": 129026, "epoch": 3072} {"train_loss": -6.618748664855957, "global_step": 129027, "epoch": 3072} {"train_loss": -6.638039588928223, "global_step": 129028, "epoch": 3072} {"train_loss": -6.6286797523498535, "global_step": 129029, "epoch": 3072} {"train_loss": -6.663541793823242, "global_step": 129030, "epoch": 3072} {"train_loss": -6.655858993530273, "global_step": 129031, "epoch": 3072} {"train_loss": -6.568138122558594, "global_step": 129032, "epoch": 3072} {"train_loss": -6.548491477966309, "global_step": 129033, "epoch": 3072} {"train_loss": -6.5009613037109375, "global_step": 129034, "epoch": 3072} {"train_loss": -6.606882095336914, "global_step": 129035, "epoch": 3072} {"train_loss": -6.50468635559082, "global_step": 129036, "epoch": 3072} {"train_loss": -6.555850028991699, "global_step": 129037, "epoch": 3072} {"train_loss": -6.625455856323242, "global_step": 129038, "epoch": 3072} {"train_loss": -6.536178112030029, "global_step": 129039, "epoch": 3072} {"train_loss": -6.69864559173584, "global_step": 129040, "epoch": 3072} {"train_loss": -6.650516510009766, "global_step": 129041, "epoch": 3072} {"train_loss": -6.695051193237305, "global_step": 129042, "epoch": 3072} {"train_loss": -6.49395751953125, "global_step": 129043, "epoch": 3072} {"train_loss": -6.469893932342529, "global_step": 129044, "epoch": 3072} {"train_loss": -6.529723167419434, "global_step": 129045, "epoch": 3072} {"train_loss": -6.579251289367676, "global_step": 129046, "epoch": 3072} {"train_loss": -6.567525386810303, "global_step": 129047, "epoch": 3072} {"train_loss": -6.70509147644043, "global_step": 129048, "epoch": 3072} {"train_loss": -6.603279113769531, "global_step": 129049, "epoch": 3072} {"train_loss": -6.620314121246338, "global_step": 129050, "epoch": 3072} {"train_loss": -6.579704761505127, "global_step": 129051, "epoch": 3072} {"train_loss": -6.588479995727539, "global_step": 129052, "epoch": 3072} {"train_loss": -6.739300727844238, "global_step": 129053, "epoch": 3072} {"train_loss": -6.607861042022705, "global_step": 129054, "epoch": 3072} {"train_loss": -6.528421401977539, "global_step": 129055, "epoch": 3072} {"train_loss": -6.664442539215088, "global_step": 129056, "epoch": 3072} {"train_loss": -6.624532699584961, "global_step": 129057, "epoch": 3072} {"train_loss": -6.562557220458984, "global_step": 129058, "epoch": 3072} {"train_loss": -6.624751091003418, "global_step": 129059, "epoch": 3072} {"train_loss": -6.704583168029785, "global_step": 129060, "epoch": 3072} {"train_loss": -6.574665069580078, "global_step": 129061, "epoch": 3072} {"train_loss": -6.470872402191162, "global_step": 129062, "epoch": 3072} {"train_loss": -6.579805374145508, "global_step": 129063, "epoch": 3072} {"train_loss": -6.560564994812012, "global_step": 129064, "epoch": 3072} {"train_loss": -6.600797460192726, "global_step": 129065, "epoch": 3072, "val_loss": 68161.875} {"train_loss": -6.5818963050842285, "global_step": 129066, "epoch": 3073} {"train_loss": -6.628140926361084, "global_step": 129067, "epoch": 3073} {"train_loss": -6.51999568939209, "global_step": 129068, "epoch": 3073} {"train_loss": -6.553929805755615, "global_step": 129069, "epoch": 3073} {"train_loss": -6.629935264587402, "global_step": 129070, "epoch": 3073} {"train_loss": -6.394597053527832, "global_step": 129071, "epoch": 3073} {"train_loss": -6.680988311767578, "global_step": 129072, "epoch": 3073} {"train_loss": -6.465445518493652, "global_step": 129073, "epoch": 3073} {"train_loss": -6.623684883117676, "global_step": 129074, "epoch": 3073} {"train_loss": -6.688801288604736, "global_step": 129075, "epoch": 3073} {"train_loss": -6.641318321228027, "global_step": 129076, "epoch": 3073} {"train_loss": -6.5942206382751465, "global_step": 129077, "epoch": 3073} {"train_loss": -6.696384429931641, "global_step": 129078, "epoch": 3073} {"train_loss": -6.622920036315918, "global_step": 129079, "epoch": 3073} {"train_loss": -6.643209457397461, "global_step": 129080, "epoch": 3073} {"train_loss": -6.66334867477417, "global_step": 129081, "epoch": 3073} {"train_loss": -6.68126916885376, "global_step": 129082, "epoch": 3073} {"train_loss": -6.676831245422363, "global_step": 129083, "epoch": 3073} {"train_loss": -6.6392292976379395, "global_step": 129084, "epoch": 3073} {"train_loss": -6.545222282409668, "global_step": 129085, "epoch": 3073} {"train_loss": -6.650518417358398, "global_step": 129086, "epoch": 3073} {"train_loss": -6.647121429443359, "global_step": 129087, "epoch": 3073} {"train_loss": -6.648653507232666, "global_step": 129088, "epoch": 3073} {"train_loss": -6.647433280944824, "global_step": 129089, "epoch": 3073} {"train_loss": -6.643281936645508, "global_step": 129090, "epoch": 3073} {"train_loss": -6.542375564575195, "global_step": 129091, "epoch": 3073} {"train_loss": -6.5937676429748535, "global_step": 129092, "epoch": 3073} {"train_loss": -6.6113362312316895, "global_step": 129093, "epoch": 3073} {"train_loss": -6.554743766784668, "global_step": 129094, "epoch": 3073} {"train_loss": -6.6016669273376465, "global_step": 129095, "epoch": 3073} {"train_loss": -6.573631763458252, "global_step": 129096, "epoch": 3073} {"train_loss": -6.645516395568848, "global_step": 129097, "epoch": 3073} {"train_loss": -6.567467212677002, "global_step": 129098, "epoch": 3073} {"train_loss": -6.60557746887207, "global_step": 129099, "epoch": 3073} {"train_loss": -6.710068702697754, "global_step": 129100, "epoch": 3073} {"train_loss": -6.63825798034668, "global_step": 129101, "epoch": 3073} {"train_loss": -6.620150566101074, "global_step": 129102, "epoch": 3073} {"train_loss": -6.539051055908203, "global_step": 129103, "epoch": 3073} {"train_loss": -6.550232887268066, "global_step": 129104, "epoch": 3073} {"train_loss": -6.627824306488037, "global_step": 129105, "epoch": 3073} {"train_loss": -6.633387565612793, "global_step": 129106, "epoch": 3073} {"train_loss": -6.611022835686093, "global_step": 129107, "epoch": 3073, "val_loss": 68011.6015625} {"train_loss": -6.597303867340088, "global_step": 129108, "epoch": 3074} {"train_loss": -6.422243118286133, "global_step": 129109, "epoch": 3074} {"train_loss": -6.645778656005859, "global_step": 129110, "epoch": 3074} {"train_loss": -6.558481216430664, "global_step": 129111, "epoch": 3074} {"train_loss": -6.617805480957031, "global_step": 129112, "epoch": 3074} {"train_loss": -6.516709327697754, "global_step": 129113, "epoch": 3074} {"train_loss": -6.429663181304932, "global_step": 129114, "epoch": 3074} {"train_loss": -6.668692111968994, "global_step": 129115, "epoch": 3074} {"train_loss": -6.5434370040893555, "global_step": 129116, "epoch": 3074} {"train_loss": -6.544865608215332, "global_step": 129117, "epoch": 3074} {"train_loss": -6.592369556427002, "global_step": 129118, "epoch": 3074} {"train_loss": -6.474269866943359, "global_step": 129119, "epoch": 3074} {"train_loss": -6.634878635406494, "global_step": 129120, "epoch": 3074} {"train_loss": -6.567482948303223, "global_step": 129121, "epoch": 3074} {"train_loss": -6.592261791229248, "global_step": 129122, "epoch": 3074} {"train_loss": -6.703682899475098, "global_step": 129123, "epoch": 3074} {"train_loss": -6.543719291687012, "global_step": 129124, "epoch": 3074} {"train_loss": -6.692236423492432, "global_step": 129125, "epoch": 3074} {"train_loss": -6.418920516967773, "global_step": 129126, "epoch": 3074} {"train_loss": -6.552280426025391, "global_step": 129127, "epoch": 3074} {"train_loss": -6.56486701965332, "global_step": 129128, "epoch": 3074} {"train_loss": -6.420819282531738, "global_step": 129129, "epoch": 3074} {"train_loss": -6.62868070602417, "global_step": 129130, "epoch": 3074} {"train_loss": -6.474590301513672, "global_step": 129131, "epoch": 3074} {"train_loss": -6.645270347595215, "global_step": 129132, "epoch": 3074} {"train_loss": -6.511786460876465, "global_step": 129133, "epoch": 3074} {"train_loss": -6.511255741119385, "global_step": 129134, "epoch": 3074} {"train_loss": -6.612981796264648, "global_step": 129135, "epoch": 3074} {"train_loss": -6.488458633422852, "global_step": 129136, "epoch": 3074} {"train_loss": -6.621253490447998, "global_step": 129137, "epoch": 3074} {"train_loss": -6.471725940704346, "global_step": 129138, "epoch": 3074} {"train_loss": -6.6194047927856445, "global_step": 129139, "epoch": 3074} {"train_loss": -6.6241350173950195, "global_step": 129140, "epoch": 3074} {"train_loss": -6.5574188232421875, "global_step": 129141, "epoch": 3074} {"train_loss": -6.638848304748535, "global_step": 129142, "epoch": 3074} {"train_loss": -6.464395523071289, "global_step": 129143, "epoch": 3074} {"train_loss": -6.676723957061768, "global_step": 129144, "epoch": 3074} {"train_loss": -6.665700435638428, "global_step": 129145, "epoch": 3074} {"train_loss": -6.672560691833496, "global_step": 129146, "epoch": 3074} {"train_loss": -6.6032209396362305, "global_step": 129147, "epoch": 3074} {"train_loss": -6.686919212341309, "global_step": 129148, "epoch": 3074} {"train_loss": -6.574744883037749, "global_step": 129149, "epoch": 3074, "val_loss": 68198.9140625} {"train_loss": -6.527656555175781, "global_step": 129150, "epoch": 3075} {"train_loss": -6.543985843658447, "global_step": 129151, "epoch": 3075} {"train_loss": -6.68403959274292, "global_step": 129152, "epoch": 3075} {"train_loss": -6.545371055603027, "global_step": 129153, "epoch": 3075} {"train_loss": -6.631144046783447, "global_step": 129154, "epoch": 3075} {"train_loss": -6.487937927246094, "global_step": 129155, "epoch": 3075} {"train_loss": -6.6474151611328125, "global_step": 129156, "epoch": 3075} {"train_loss": -6.678445816040039, "global_step": 129157, "epoch": 3075} {"train_loss": -6.5255632400512695, "global_step": 129158, "epoch": 3075} {"train_loss": -6.722479820251465, "global_step": 129159, "epoch": 3075} {"train_loss": -6.666243553161621, "global_step": 129160, "epoch": 3075} {"train_loss": -6.70076847076416, "global_step": 129161, "epoch": 3075} {"train_loss": -6.489803314208984, "global_step": 129162, "epoch": 3075} {"train_loss": -6.488672256469727, "global_step": 129163, "epoch": 3075} {"train_loss": -6.529701232910156, "global_step": 129164, "epoch": 3075} {"train_loss": -6.512227535247803, "global_step": 129165, "epoch": 3075} {"train_loss": -6.560187339782715, "global_step": 129166, "epoch": 3075} {"train_loss": -6.5180816650390625, "global_step": 129167, "epoch": 3075} {"train_loss": -6.693205833435059, "global_step": 129168, "epoch": 3075} {"train_loss": -6.579380989074707, "global_step": 129169, "epoch": 3075} {"train_loss": -6.673223495483398, "global_step": 129170, "epoch": 3075} {"train_loss": -6.5482611656188965, "global_step": 129171, "epoch": 3075} {"train_loss": -6.67215633392334, "global_step": 129172, "epoch": 3075} {"train_loss": -6.613588333129883, "global_step": 129173, "epoch": 3075} {"train_loss": -6.6360626220703125, "global_step": 129174, "epoch": 3075} {"train_loss": -6.666378974914551, "global_step": 129175, "epoch": 3075} {"train_loss": -6.725490093231201, "global_step": 129176, "epoch": 3075} {"train_loss": -6.627750396728516, "global_step": 129177, "epoch": 3075} {"train_loss": -6.617934226989746, "global_step": 129178, "epoch": 3075} {"train_loss": -6.600964069366455, "global_step": 129179, "epoch": 3075} {"train_loss": -6.704571723937988, "global_step": 129180, "epoch": 3075} {"train_loss": -6.636233806610107, "global_step": 129181, "epoch": 3075} {"train_loss": -6.568542003631592, "global_step": 129182, "epoch": 3075} {"train_loss": -6.768557548522949, "global_step": 129183, "epoch": 3075} {"train_loss": -6.573729515075684, "global_step": 129184, "epoch": 3075} {"train_loss": -6.563507080078125, "global_step": 129185, "epoch": 3075} {"train_loss": -6.764155864715576, "global_step": 129186, "epoch": 3075} {"train_loss": -6.6072540283203125, "global_step": 129187, "epoch": 3075} {"train_loss": -6.691770076751709, "global_step": 129188, "epoch": 3075} {"train_loss": -6.717014312744141, "global_step": 129189, "epoch": 3075} {"train_loss": -6.671222686767578, "global_step": 129190, "epoch": 3075} {"train_loss": -6.617129711877732, "global_step": 129191, "epoch": 3075, "val_loss": 68391.609375} {"train_loss": -6.61075496673584, "global_step": 129192, "epoch": 3076} {"train_loss": -6.601099014282227, "global_step": 129193, "epoch": 3076} {"train_loss": -6.5414838790893555, "global_step": 129194, "epoch": 3076} {"train_loss": -6.6439619064331055, "global_step": 129195, "epoch": 3076} {"train_loss": -6.403339385986328, "global_step": 129196, "epoch": 3076} {"train_loss": -6.583362579345703, "global_step": 129197, "epoch": 3076} {"train_loss": -6.480731964111328, "global_step": 129198, "epoch": 3076} {"train_loss": -6.419079303741455, "global_step": 129199, "epoch": 3076} {"train_loss": -6.694264888763428, "global_step": 129200, "epoch": 3076} {"train_loss": -6.407972812652588, "global_step": 129201, "epoch": 3076} {"train_loss": -6.6629252433776855, "global_step": 129202, "epoch": 3076} {"train_loss": -6.45343017578125, "global_step": 129203, "epoch": 3076} {"train_loss": -6.467385292053223, "global_step": 129204, "epoch": 3076} {"train_loss": -6.535224914550781, "global_step": 129205, "epoch": 3076} {"train_loss": -6.534911155700684, "global_step": 129206, "epoch": 3076} {"train_loss": -6.531716823577881, "global_step": 129207, "epoch": 3076} {"train_loss": -6.652872085571289, "global_step": 129208, "epoch": 3076} {"train_loss": -6.476865768432617, "global_step": 129209, "epoch": 3076} {"train_loss": -6.596924304962158, "global_step": 129210, "epoch": 3076} {"train_loss": -6.652349472045898, "global_step": 129211, "epoch": 3076} {"train_loss": -6.544032573699951, "global_step": 129212, "epoch": 3076} {"train_loss": -6.662214279174805, "global_step": 129213, "epoch": 3076} {"train_loss": -6.577348709106445, "global_step": 129214, "epoch": 3076} {"train_loss": -6.6841301918029785, "global_step": 129215, "epoch": 3076} {"train_loss": -6.482133388519287, "global_step": 129216, "epoch": 3076} {"train_loss": -6.7268805503845215, "global_step": 129217, "epoch": 3076} {"train_loss": -6.571284294128418, "global_step": 129218, "epoch": 3076} {"train_loss": -6.698992729187012, "global_step": 129219, "epoch": 3076} {"train_loss": -6.697016716003418, "global_step": 129220, "epoch": 3076} {"train_loss": -6.5942840576171875, "global_step": 129221, "epoch": 3076} {"train_loss": -6.618807792663574, "global_step": 129222, "epoch": 3076} {"train_loss": -6.675032138824463, "global_step": 129223, "epoch": 3076} {"train_loss": -6.652838706970215, "global_step": 129224, "epoch": 3076} {"train_loss": -6.7385149002075195, "global_step": 129225, "epoch": 3076} {"train_loss": -6.642003059387207, "global_step": 129226, "epoch": 3076} {"train_loss": -6.609620094299316, "global_step": 129227, "epoch": 3076} {"train_loss": -6.617560386657715, "global_step": 129228, "epoch": 3076} {"train_loss": -6.612561225891113, "global_step": 129229, "epoch": 3076} {"train_loss": -6.735217571258545, "global_step": 129230, "epoch": 3076} {"train_loss": -6.610146999359131, "global_step": 129231, "epoch": 3076} {"train_loss": -6.6463775634765625, "global_step": 129232, "epoch": 3076} {"train_loss": -6.59318242754255, "global_step": 129233, "epoch": 3076, "val_loss": 68314.6875} {"train_loss": -6.565648078918457, "global_step": 129234, "epoch": 3077} {"train_loss": -6.74370002746582, "global_step": 129235, "epoch": 3077} {"train_loss": -6.436704158782959, "global_step": 129236, "epoch": 3077} {"train_loss": -6.5447869300842285, "global_step": 129237, "epoch": 3077} {"train_loss": -6.599148750305176, "global_step": 129238, "epoch": 3077} {"train_loss": -6.690808296203613, "global_step": 129239, "epoch": 3077} {"train_loss": -6.506739616394043, "global_step": 129240, "epoch": 3077} {"train_loss": -6.589359283447266, "global_step": 129241, "epoch": 3077} {"train_loss": -6.564896583557129, "global_step": 129242, "epoch": 3077} {"train_loss": -6.579526901245117, "global_step": 129243, "epoch": 3077} {"train_loss": -6.718279838562012, "global_step": 129244, "epoch": 3077} {"train_loss": -6.726588249206543, "global_step": 129245, "epoch": 3077} {"train_loss": -6.742133140563965, "global_step": 129246, "epoch": 3077} {"train_loss": -6.645898818969727, "global_step": 129247, "epoch": 3077} {"train_loss": -6.615817070007324, "global_step": 129248, "epoch": 3077} {"train_loss": -6.555093765258789, "global_step": 129249, "epoch": 3077} {"train_loss": -6.569856643676758, "global_step": 129250, "epoch": 3077} {"train_loss": -6.539702415466309, "global_step": 129251, "epoch": 3077} {"train_loss": -6.6882100105285645, "global_step": 129252, "epoch": 3077} {"train_loss": -6.666621208190918, "global_step": 129253, "epoch": 3077} {"train_loss": -6.631931304931641, "global_step": 129254, "epoch": 3077} {"train_loss": -6.6140618324279785, "global_step": 129255, "epoch": 3077} {"train_loss": -6.716364860534668, "global_step": 129256, "epoch": 3077} {"train_loss": -6.624095916748047, "global_step": 129257, "epoch": 3077} {"train_loss": -6.61613655090332, "global_step": 129258, "epoch": 3077} {"train_loss": -6.751952171325684, "global_step": 129259, "epoch": 3077} {"train_loss": -6.701082706451416, "global_step": 129260, "epoch": 3077} {"train_loss": -6.561961650848389, "global_step": 129261, "epoch": 3077} {"train_loss": -6.647147178649902, "global_step": 129262, "epoch": 3077} {"train_loss": -6.537505149841309, "global_step": 129263, "epoch": 3077} {"train_loss": -6.605319499969482, "global_step": 129264, "epoch": 3077} {"train_loss": -6.593820095062256, "global_step": 129265, "epoch": 3077} {"train_loss": -6.636412620544434, "global_step": 129266, "epoch": 3077} {"train_loss": -6.762722015380859, "global_step": 129267, "epoch": 3077} {"train_loss": -6.803072452545166, "global_step": 129268, "epoch": 3077} {"train_loss": -6.6787109375, "global_step": 129269, "epoch": 3077} {"train_loss": -6.633155345916748, "global_step": 129270, "epoch": 3077} {"train_loss": -6.661250114440918, "global_step": 129271, "epoch": 3077} {"train_loss": -6.5729875564575195, "global_step": 129272, "epoch": 3077} {"train_loss": -6.7021260261535645, "global_step": 129273, "epoch": 3077} {"train_loss": -6.498133659362793, "global_step": 129274, "epoch": 3077} {"train_loss": -6.6289560454232355, "global_step": 129275, "epoch": 3077, "val_loss": 67979.8984375} {"train_loss": -6.760984420776367, "global_step": 129276, "epoch": 3078} {"train_loss": -6.711102485656738, "global_step": 129277, "epoch": 3078} {"train_loss": -6.657055854797363, "global_step": 129278, "epoch": 3078} {"train_loss": -6.657936096191406, "global_step": 129279, "epoch": 3078} {"train_loss": -6.721490859985352, "global_step": 129280, "epoch": 3078} {"train_loss": -6.658995151519775, "global_step": 129281, "epoch": 3078} {"train_loss": -6.606878757476807, "global_step": 129282, "epoch": 3078} {"train_loss": -6.700963973999023, "global_step": 129283, "epoch": 3078} {"train_loss": -6.601229667663574, "global_step": 129284, "epoch": 3078} {"train_loss": -6.651646614074707, "global_step": 129285, "epoch": 3078} {"train_loss": -6.640573024749756, "global_step": 129286, "epoch": 3078} {"train_loss": -6.639621734619141, "global_step": 129287, "epoch": 3078} {"train_loss": -6.779958724975586, "global_step": 129288, "epoch": 3078} {"train_loss": -6.581271171569824, "global_step": 129289, "epoch": 3078} {"train_loss": -6.599969863891602, "global_step": 129290, "epoch": 3078} {"train_loss": -6.6657233238220215, "global_step": 129291, "epoch": 3078} {"train_loss": -6.690720558166504, "global_step": 129292, "epoch": 3078} {"train_loss": -6.570534706115723, "global_step": 129293, "epoch": 3078} {"train_loss": -6.684945583343506, "global_step": 129294, "epoch": 3078} {"train_loss": -6.458573341369629, "global_step": 129295, "epoch": 3078} {"train_loss": -6.593513011932373, "global_step": 129296, "epoch": 3078} {"train_loss": -6.719729423522949, "global_step": 129297, "epoch": 3078} {"train_loss": -6.786614418029785, "global_step": 129298, "epoch": 3078} {"train_loss": -6.571141719818115, "global_step": 129299, "epoch": 3078} {"train_loss": -6.572906494140625, "global_step": 129300, "epoch": 3078} {"train_loss": -6.68295955657959, "global_step": 129301, "epoch": 3078} {"train_loss": -6.64451265335083, "global_step": 129302, "epoch": 3078} {"train_loss": -6.571259021759033, "global_step": 129303, "epoch": 3078} {"train_loss": -6.660861968994141, "global_step": 129304, "epoch": 3078} {"train_loss": -6.650929927825928, "global_step": 129305, "epoch": 3078} {"train_loss": -6.617072105407715, "global_step": 129306, "epoch": 3078} {"train_loss": -6.597803115844727, "global_step": 129307, "epoch": 3078} {"train_loss": -6.729403972625732, "global_step": 129308, "epoch": 3078} {"train_loss": -6.642966270446777, "global_step": 129309, "epoch": 3078} {"train_loss": -6.624014854431152, "global_step": 129310, "epoch": 3078} {"train_loss": -6.557889938354492, "global_step": 129311, "epoch": 3078} {"train_loss": -6.5871429443359375, "global_step": 129312, "epoch": 3078} {"train_loss": -6.528616905212402, "global_step": 129313, "epoch": 3078} {"train_loss": -6.530744552612305, "global_step": 129314, "epoch": 3078} {"train_loss": -6.619111061096191, "global_step": 129315, "epoch": 3078} {"train_loss": -6.642853736877441, "global_step": 129316, "epoch": 3078} {"train_loss": -6.639555249895368, "global_step": 129317, "epoch": 3078, "val_loss": 68208.984375} {"train_loss": -6.611304759979248, "global_step": 129318, "epoch": 3079} {"train_loss": -6.67579460144043, "global_step": 129319, "epoch": 3079} {"train_loss": -6.683082103729248, "global_step": 129320, "epoch": 3079} {"train_loss": -6.68279504776001, "global_step": 129321, "epoch": 3079} {"train_loss": -6.673971652984619, "global_step": 129322, "epoch": 3079} {"train_loss": -6.711366176605225, "global_step": 129323, "epoch": 3079} {"train_loss": -6.5547332763671875, "global_step": 129324, "epoch": 3079} {"train_loss": -6.602451324462891, "global_step": 129325, "epoch": 3079} {"train_loss": -6.641438007354736, "global_step": 129326, "epoch": 3079} {"train_loss": -6.64363956451416, "global_step": 129327, "epoch": 3079} {"train_loss": -6.740287780761719, "global_step": 129328, "epoch": 3079} {"train_loss": -6.630832195281982, "global_step": 129329, "epoch": 3079} {"train_loss": -6.662385940551758, "global_step": 129330, "epoch": 3079} {"train_loss": -6.6674652099609375, "global_step": 129331, "epoch": 3079} {"train_loss": -6.674814701080322, "global_step": 129332, "epoch": 3079} {"train_loss": -6.666301727294922, "global_step": 129333, "epoch": 3079} {"train_loss": -6.649519920349121, "global_step": 129334, "epoch": 3079} {"train_loss": -6.574659824371338, "global_step": 129335, "epoch": 3079} {"train_loss": -6.516451835632324, "global_step": 129336, "epoch": 3079} {"train_loss": -6.643536567687988, "global_step": 129337, "epoch": 3079} {"train_loss": -6.5937299728393555, "global_step": 129338, "epoch": 3079} {"train_loss": -6.415375709533691, "global_step": 129339, "epoch": 3079} {"train_loss": -6.711679458618164, "global_step": 129340, "epoch": 3079} {"train_loss": -6.556758880615234, "global_step": 129341, "epoch": 3079} {"train_loss": -6.536179542541504, "global_step": 129342, "epoch": 3079} {"train_loss": -6.679352283477783, "global_step": 129343, "epoch": 3079} {"train_loss": -6.582895755767822, "global_step": 129344, "epoch": 3079} {"train_loss": -6.633389472961426, "global_step": 129345, "epoch": 3079} {"train_loss": -6.746406555175781, "global_step": 129346, "epoch": 3079} {"train_loss": -6.491908550262451, "global_step": 129347, "epoch": 3079} {"train_loss": -6.606548309326172, "global_step": 129348, "epoch": 3079} {"train_loss": -6.544633865356445, "global_step": 129349, "epoch": 3079} {"train_loss": -6.464835166931152, "global_step": 129350, "epoch": 3079} {"train_loss": -6.543749809265137, "global_step": 129351, "epoch": 3079} {"train_loss": -6.638411521911621, "global_step": 129352, "epoch": 3079} {"train_loss": -6.58432149887085, "global_step": 129353, "epoch": 3079} {"train_loss": -6.472897529602051, "global_step": 129354, "epoch": 3079} {"train_loss": -6.595058441162109, "global_step": 129355, "epoch": 3079} {"train_loss": -6.57675838470459, "global_step": 129356, "epoch": 3079} {"train_loss": -6.558437347412109, "global_step": 129357, "epoch": 3079} {"train_loss": -6.520231246948242, "global_step": 129358, "epoch": 3079} {"train_loss": -6.606858594076974, "global_step": 129359, "epoch": 3079, "val_loss": 67968.7265625} {"train_loss": -6.609702110290527, "global_step": 129360, "epoch": 3080} {"train_loss": -6.462635040283203, "global_step": 129361, "epoch": 3080} {"train_loss": -6.4525041580200195, "global_step": 129362, "epoch": 3080} {"train_loss": -6.548472881317139, "global_step": 129363, "epoch": 3080} {"train_loss": -6.448228359222412, "global_step": 129364, "epoch": 3080} {"train_loss": -6.607595920562744, "global_step": 129365, "epoch": 3080} {"train_loss": -6.344700813293457, "global_step": 129366, "epoch": 3080} {"train_loss": -6.486473083496094, "global_step": 129367, "epoch": 3080} {"train_loss": -6.534564971923828, "global_step": 129368, "epoch": 3080} {"train_loss": -6.538829803466797, "global_step": 129369, "epoch": 3080} {"train_loss": -6.56469202041626, "global_step": 129370, "epoch": 3080} {"train_loss": -6.625390529632568, "global_step": 129371, "epoch": 3080} {"train_loss": -6.4823527336120605, "global_step": 129372, "epoch": 3080} {"train_loss": -6.635144233703613, "global_step": 129373, "epoch": 3080} {"train_loss": -6.673367023468018, "global_step": 129374, "epoch": 3080} {"train_loss": -6.661536693572998, "global_step": 129375, "epoch": 3080} {"train_loss": -6.521956920623779, "global_step": 129376, "epoch": 3080} {"train_loss": -6.597440242767334, "global_step": 129377, "epoch": 3080} {"train_loss": -6.555525779724121, "global_step": 129378, "epoch": 3080} {"train_loss": -6.67501163482666, "global_step": 129379, "epoch": 3080} {"train_loss": -6.633637428283691, "global_step": 129380, "epoch": 3080} {"train_loss": -6.571972846984863, "global_step": 129381, "epoch": 3080} {"train_loss": -6.5866522789001465, "global_step": 129382, "epoch": 3080} {"train_loss": -6.665291786193848, "global_step": 129383, "epoch": 3080} {"train_loss": -6.619342803955078, "global_step": 129384, "epoch": 3080} {"train_loss": -6.6071600914001465, "global_step": 129385, "epoch": 3080} {"train_loss": -6.659729957580566, "global_step": 129386, "epoch": 3080} {"train_loss": -6.594935417175293, "global_step": 129387, "epoch": 3080} {"train_loss": -6.542751312255859, "global_step": 129388, "epoch": 3080} {"train_loss": -6.589885234832764, "global_step": 129389, "epoch": 3080} {"train_loss": -6.643924713134766, "global_step": 129390, "epoch": 3080} {"train_loss": -6.591100692749023, "global_step": 129391, "epoch": 3080} {"train_loss": -6.667512893676758, "global_step": 129392, "epoch": 3080} {"train_loss": -6.629321575164795, "global_step": 129393, "epoch": 3080} {"train_loss": -6.600584030151367, "global_step": 129394, "epoch": 3080} {"train_loss": -6.664386749267578, "global_step": 129395, "epoch": 3080} {"train_loss": -6.650079727172852, "global_step": 129396, "epoch": 3080} {"train_loss": -6.654676914215088, "global_step": 129397, "epoch": 3080} {"train_loss": -6.6778483390808105, "global_step": 129398, "epoch": 3080} {"train_loss": -6.641070365905762, "global_step": 129399, "epoch": 3080} {"train_loss": -6.736268997192383, "global_step": 129400, "epoch": 3080} {"train_loss": -6.593618052346366, "global_step": 129401, "epoch": 3080, "val_loss": 68284.2890625} {"train_loss": -6.8131561279296875, "global_step": 129402, "epoch": 3081} {"train_loss": -6.692617893218994, "global_step": 129403, "epoch": 3081} {"train_loss": -6.6988067626953125, "global_step": 129404, "epoch": 3081} {"train_loss": -6.597016334533691, "global_step": 129405, "epoch": 3081} {"train_loss": -6.631771564483643, "global_step": 129406, "epoch": 3081} {"train_loss": -6.723909378051758, "global_step": 129407, "epoch": 3081} {"train_loss": -6.626853942871094, "global_step": 129408, "epoch": 3081} {"train_loss": -6.560434341430664, "global_step": 129409, "epoch": 3081} {"train_loss": -6.615649223327637, "global_step": 129410, "epoch": 3081} {"train_loss": -6.706000328063965, "global_step": 129411, "epoch": 3081} {"train_loss": -6.587051868438721, "global_step": 129412, "epoch": 3081} {"train_loss": -6.585640907287598, "global_step": 129413, "epoch": 3081} {"train_loss": -6.525660514831543, "global_step": 129414, "epoch": 3081} {"train_loss": -6.697601795196533, "global_step": 129415, "epoch": 3081} {"train_loss": -6.494754791259766, "global_step": 129416, "epoch": 3081} {"train_loss": -6.673999786376953, "global_step": 129417, "epoch": 3081} {"train_loss": -6.6467509269714355, "global_step": 129418, "epoch": 3081} {"train_loss": -6.512598991394043, "global_step": 129419, "epoch": 3081} {"train_loss": -6.594231605529785, "global_step": 129420, "epoch": 3081} {"train_loss": -6.543898582458496, "global_step": 129421, "epoch": 3081} {"train_loss": -6.662561893463135, "global_step": 129422, "epoch": 3081} {"train_loss": -6.492831707000732, "global_step": 129423, "epoch": 3081} {"train_loss": -6.686858177185059, "global_step": 129424, "epoch": 3081} {"train_loss": -6.647367477416992, "global_step": 129425, "epoch": 3081} {"train_loss": -6.64866304397583, "global_step": 129426, "epoch": 3081} {"train_loss": -6.622725486755371, "global_step": 129427, "epoch": 3081} {"train_loss": -6.640898704528809, "global_step": 129428, "epoch": 3081} {"train_loss": -6.535501003265381, "global_step": 129429, "epoch": 3081} {"train_loss": -6.5624494552612305, "global_step": 129430, "epoch": 3081} {"train_loss": -6.513510704040527, "global_step": 129431, "epoch": 3081} {"train_loss": -6.694520950317383, "global_step": 129432, "epoch": 3081} {"train_loss": -6.648663520812988, "global_step": 129433, "epoch": 3081} {"train_loss": -6.519525527954102, "global_step": 129434, "epoch": 3081} {"train_loss": -6.637576103210449, "global_step": 129435, "epoch": 3081} {"train_loss": -6.5475754737854, "global_step": 129436, "epoch": 3081} {"train_loss": -6.521368026733398, "global_step": 129437, "epoch": 3081} {"train_loss": -6.603363037109375, "global_step": 129438, "epoch": 3081} {"train_loss": -6.653050899505615, "global_step": 129439, "epoch": 3081} {"train_loss": -6.596746921539307, "global_step": 129440, "epoch": 3081} {"train_loss": -6.507294654846191, "global_step": 129441, "epoch": 3081} {"train_loss": -6.640230178833008, "global_step": 129442, "epoch": 3081} {"train_loss": -6.611826942080543, "global_step": 129443, "epoch": 3081, "val_loss": 68182.40625} {"train_loss": -6.671021461486816, "global_step": 129444, "epoch": 3082} {"train_loss": -6.599615097045898, "global_step": 129445, "epoch": 3082} {"train_loss": -6.63449764251709, "global_step": 129446, "epoch": 3082} {"train_loss": -6.523890018463135, "global_step": 129447, "epoch": 3082} {"train_loss": -6.6585001945495605, "global_step": 129448, "epoch": 3082} {"train_loss": -6.630577087402344, "global_step": 129449, "epoch": 3082} {"train_loss": -6.521540641784668, "global_step": 129450, "epoch": 3082} {"train_loss": -6.688234806060791, "global_step": 129451, "epoch": 3082} {"train_loss": -6.751598358154297, "global_step": 129452, "epoch": 3082} {"train_loss": -6.677338600158691, "global_step": 129453, "epoch": 3082} {"train_loss": -6.625311851501465, "global_step": 129454, "epoch": 3082} {"train_loss": -6.728342056274414, "global_step": 129455, "epoch": 3082} {"train_loss": -6.614485263824463, "global_step": 129456, "epoch": 3082} {"train_loss": -6.621796607971191, "global_step": 129457, "epoch": 3082} {"train_loss": -6.57050085067749, "global_step": 129458, "epoch": 3082} {"train_loss": -6.590334892272949, "global_step": 129459, "epoch": 3082} {"train_loss": -6.60505485534668, "global_step": 129460, "epoch": 3082} {"train_loss": -6.443518161773682, "global_step": 129461, "epoch": 3082} {"train_loss": -6.565488815307617, "global_step": 129462, "epoch": 3082} {"train_loss": -6.533465385437012, "global_step": 129463, "epoch": 3082} {"train_loss": -6.627168655395508, "global_step": 129464, "epoch": 3082} {"train_loss": -6.440786361694336, "global_step": 129465, "epoch": 3082} {"train_loss": -6.5318708419799805, "global_step": 129466, "epoch": 3082} {"train_loss": -6.5007500648498535, "global_step": 129467, "epoch": 3082} {"train_loss": -6.50868034362793, "global_step": 129468, "epoch": 3082} {"train_loss": -6.634295463562012, "global_step": 129469, "epoch": 3082} {"train_loss": -6.6090288162231445, "global_step": 129470, "epoch": 3082} {"train_loss": -6.596128940582275, "global_step": 129471, "epoch": 3082} {"train_loss": -6.5791168212890625, "global_step": 129472, "epoch": 3082} {"train_loss": -6.569133758544922, "global_step": 129473, "epoch": 3082} {"train_loss": -6.547573089599609, "global_step": 129474, "epoch": 3082} {"train_loss": -6.605508804321289, "global_step": 129475, "epoch": 3082} {"train_loss": -6.590482234954834, "global_step": 129476, "epoch": 3082} {"train_loss": -6.602617263793945, "global_step": 129477, "epoch": 3082} {"train_loss": -6.587568283081055, "global_step": 129478, "epoch": 3082} {"train_loss": -6.6199493408203125, "global_step": 129479, "epoch": 3082} {"train_loss": -6.662341594696045, "global_step": 129480, "epoch": 3082} {"train_loss": -6.640007495880127, "global_step": 129481, "epoch": 3082} {"train_loss": -6.54704475402832, "global_step": 129482, "epoch": 3082} {"train_loss": -6.66957950592041, "global_step": 129483, "epoch": 3082} {"train_loss": -6.648634910583496, "global_step": 129484, "epoch": 3082} {"train_loss": -6.600795427958171, "global_step": 129485, "epoch": 3082, "val_loss": 68300.46875} {"train_loss": -6.598923683166504, "global_step": 129486, "epoch": 3083} {"train_loss": -6.698671340942383, "global_step": 129487, "epoch": 3083} {"train_loss": -6.6020026206970215, "global_step": 129488, "epoch": 3083} {"train_loss": -6.561351776123047, "global_step": 129489, "epoch": 3083} {"train_loss": -6.693421363830566, "global_step": 129490, "epoch": 3083} {"train_loss": -6.550351619720459, "global_step": 129491, "epoch": 3083} {"train_loss": -6.687623500823975, "global_step": 129492, "epoch": 3083} {"train_loss": -6.5795674324035645, "global_step": 129493, "epoch": 3083} {"train_loss": -6.750504016876221, "global_step": 129494, "epoch": 3083} {"train_loss": -6.750207901000977, "global_step": 129495, "epoch": 3083} {"train_loss": -6.549166679382324, "global_step": 129496, "epoch": 3083} {"train_loss": -6.669142723083496, "global_step": 129497, "epoch": 3083} {"train_loss": -6.6440582275390625, "global_step": 129498, "epoch": 3083} {"train_loss": -6.762284278869629, "global_step": 129499, "epoch": 3083} {"train_loss": -6.605541706085205, "global_step": 129500, "epoch": 3083} {"train_loss": -6.722832202911377, "global_step": 129501, "epoch": 3083} {"train_loss": -6.645023345947266, "global_step": 129502, "epoch": 3083} {"train_loss": -6.606168746948242, "global_step": 129503, "epoch": 3083} {"train_loss": -6.593308448791504, "global_step": 129504, "epoch": 3083} {"train_loss": -6.6277008056640625, "global_step": 129505, "epoch": 3083} {"train_loss": -6.574114799499512, "global_step": 129506, "epoch": 3083} {"train_loss": -6.602545261383057, "global_step": 129507, "epoch": 3083} {"train_loss": -6.632309436798096, "global_step": 129508, "epoch": 3083} {"train_loss": -6.690017223358154, "global_step": 129509, "epoch": 3083} {"train_loss": -6.594699859619141, "global_step": 129510, "epoch": 3083} {"train_loss": -6.716835021972656, "global_step": 129511, "epoch": 3083} {"train_loss": -6.593583106994629, "global_step": 129512, "epoch": 3083} {"train_loss": -6.520514488220215, "global_step": 129513, "epoch": 3083} {"train_loss": -6.733597755432129, "global_step": 129514, "epoch": 3083} {"train_loss": -6.56370735168457, "global_step": 129515, "epoch": 3083} {"train_loss": -6.528324604034424, "global_step": 129516, "epoch": 3083} {"train_loss": -6.522120475769043, "global_step": 129517, "epoch": 3083} {"train_loss": -6.627955913543701, "global_step": 129518, "epoch": 3083} {"train_loss": -6.41696834564209, "global_step": 129519, "epoch": 3083} {"train_loss": -6.592196464538574, "global_step": 129520, "epoch": 3083} {"train_loss": -6.549563407897949, "global_step": 129521, "epoch": 3083} {"train_loss": -6.5109028816223145, "global_step": 129522, "epoch": 3083} {"train_loss": -6.637377738952637, "global_step": 129523, "epoch": 3083} {"train_loss": -6.439199447631836, "global_step": 129524, "epoch": 3083} {"train_loss": -6.609735488891602, "global_step": 129525, "epoch": 3083} {"train_loss": -6.495090484619141, "global_step": 129526, "epoch": 3083} {"train_loss": -6.609373421896072, "global_step": 129527, "epoch": 3083, "val_loss": 68287.5859375} {"train_loss": -6.660640239715576, "global_step": 129528, "epoch": 3084} {"train_loss": -6.66103982925415, "global_step": 129529, "epoch": 3084} {"train_loss": -6.519914627075195, "global_step": 129530, "epoch": 3084} {"train_loss": -6.6526288986206055, "global_step": 129531, "epoch": 3084} {"train_loss": -6.592310905456543, "global_step": 129532, "epoch": 3084} {"train_loss": -6.577686309814453, "global_step": 129533, "epoch": 3084} {"train_loss": -6.61298942565918, "global_step": 129534, "epoch": 3084} {"train_loss": -6.562862396240234, "global_step": 129535, "epoch": 3084} {"train_loss": -6.639098167419434, "global_step": 129536, "epoch": 3084} {"train_loss": -6.554835319519043, "global_step": 129537, "epoch": 3084} {"train_loss": -6.690891265869141, "global_step": 129538, "epoch": 3084} {"train_loss": -6.528115272521973, "global_step": 129539, "epoch": 3084} {"train_loss": -6.607858657836914, "global_step": 129540, "epoch": 3084} {"train_loss": -6.5621747970581055, "global_step": 129541, "epoch": 3084} {"train_loss": -6.596512794494629, "global_step": 129542, "epoch": 3084} {"train_loss": -6.692726135253906, "global_step": 129543, "epoch": 3084} {"train_loss": -6.530611038208008, "global_step": 129544, "epoch": 3084} {"train_loss": -6.565903186798096, "global_step": 129545, "epoch": 3084} {"train_loss": -6.491941452026367, "global_step": 129546, "epoch": 3084} {"train_loss": -6.532629489898682, "global_step": 129547, "epoch": 3084} {"train_loss": -6.656832218170166, "global_step": 129548, "epoch": 3084} {"train_loss": -6.513889789581299, "global_step": 129549, "epoch": 3084} {"train_loss": -6.630877494812012, "global_step": 129550, "epoch": 3084} {"train_loss": -6.604703903198242, "global_step": 129551, "epoch": 3084} {"train_loss": -6.666719436645508, "global_step": 129552, "epoch": 3084} {"train_loss": -6.501421928405762, "global_step": 129553, "epoch": 3084} {"train_loss": -6.395835876464844, "global_step": 129554, "epoch": 3084} {"train_loss": -6.549664497375488, "global_step": 129555, "epoch": 3084} {"train_loss": -6.519555568695068, "global_step": 129556, "epoch": 3084} {"train_loss": -6.581905364990234, "global_step": 129557, "epoch": 3084} {"train_loss": -6.503678321838379, "global_step": 129558, "epoch": 3084} {"train_loss": -6.463995456695557, "global_step": 129559, "epoch": 3084} {"train_loss": -6.638435363769531, "global_step": 129560, "epoch": 3084} {"train_loss": -6.4889445304870605, "global_step": 129561, "epoch": 3084} {"train_loss": -6.570042133331299, "global_step": 129562, "epoch": 3084} {"train_loss": -6.626152992248535, "global_step": 129563, "epoch": 3084} {"train_loss": -6.636971473693848, "global_step": 129564, "epoch": 3084} {"train_loss": -6.628240585327148, "global_step": 129565, "epoch": 3084} {"train_loss": -6.611915588378906, "global_step": 129566, "epoch": 3084} {"train_loss": -6.6958513259887695, "global_step": 129567, "epoch": 3084} {"train_loss": -6.65919303894043, "global_step": 129568, "epoch": 3084} {"train_loss": -6.584496407281785, "global_step": 129569, "epoch": 3084, "val_loss": 68254.109375} {"train_loss": -6.720334053039551, "global_step": 129570, "epoch": 3085} {"train_loss": -6.563309669494629, "global_step": 129571, "epoch": 3085} {"train_loss": -6.675861358642578, "global_step": 129572, "epoch": 3085} {"train_loss": -6.686490535736084, "global_step": 129573, "epoch": 3085} {"train_loss": -6.607000350952148, "global_step": 129574, "epoch": 3085} {"train_loss": -6.627153396606445, "global_step": 129575, "epoch": 3085} {"train_loss": -6.783990859985352, "global_step": 129576, "epoch": 3085} {"train_loss": -6.6120100021362305, "global_step": 129577, "epoch": 3085} {"train_loss": -6.74635124206543, "global_step": 129578, "epoch": 3085} {"train_loss": -6.674542427062988, "global_step": 129579, "epoch": 3085} {"train_loss": -6.644100666046143, "global_step": 129580, "epoch": 3085} {"train_loss": -6.592013359069824, "global_step": 129581, "epoch": 3085} {"train_loss": -6.706523895263672, "global_step": 129582, "epoch": 3085} {"train_loss": -6.644148826599121, "global_step": 129583, "epoch": 3085} {"train_loss": -6.694589138031006, "global_step": 129584, "epoch": 3085} {"train_loss": -6.675542831420898, "global_step": 129585, "epoch": 3085} {"train_loss": -6.715246200561523, "global_step": 129586, "epoch": 3085} {"train_loss": -6.640012741088867, "global_step": 129587, "epoch": 3085} {"train_loss": -6.5758185386657715, "global_step": 129588, "epoch": 3085} {"train_loss": -6.663355827331543, "global_step": 129589, "epoch": 3085} {"train_loss": -6.662840843200684, "global_step": 129590, "epoch": 3085} {"train_loss": -6.66752815246582, "global_step": 129591, "epoch": 3085} {"train_loss": -6.609081745147705, "global_step": 129592, "epoch": 3085} {"train_loss": -6.5782551765441895, "global_step": 129593, "epoch": 3085} {"train_loss": -6.614208698272705, "global_step": 129594, "epoch": 3085} {"train_loss": -6.648808479309082, "global_step": 129595, "epoch": 3085} {"train_loss": -6.464833736419678, "global_step": 129596, "epoch": 3085} {"train_loss": -6.619411468505859, "global_step": 129597, "epoch": 3085} {"train_loss": -6.502124786376953, "global_step": 129598, "epoch": 3085} {"train_loss": -6.596220970153809, "global_step": 129599, "epoch": 3085} {"train_loss": -6.562875747680664, "global_step": 129600, "epoch": 3085} {"train_loss": -6.543395519256592, "global_step": 129601, "epoch": 3085} {"train_loss": -6.615306854248047, "global_step": 129602, "epoch": 3085} {"train_loss": -6.4033732414245605, "global_step": 129603, "epoch": 3085} {"train_loss": -6.502923965454102, "global_step": 129604, "epoch": 3085} {"train_loss": -6.5919599533081055, "global_step": 129605, "epoch": 3085} {"train_loss": -6.518815994262695, "global_step": 129606, "epoch": 3085} {"train_loss": -6.5139923095703125, "global_step": 129607, "epoch": 3085} {"train_loss": -6.658110618591309, "global_step": 129608, "epoch": 3085} {"train_loss": -6.6315226554870605, "global_step": 129609, "epoch": 3085} {"train_loss": -6.654382705688477, "global_step": 129610, "epoch": 3085} {"train_loss": -6.61850186756679, "global_step": 129611, "epoch": 3085, "val_loss": 68315.046875} {"train_loss": -6.556486129760742, "global_step": 129612, "epoch": 3086} {"train_loss": -6.632807731628418, "global_step": 129613, "epoch": 3086} {"train_loss": -6.5319061279296875, "global_step": 129614, "epoch": 3086} {"train_loss": -6.575075149536133, "global_step": 129615, "epoch": 3086} {"train_loss": -6.676076889038086, "global_step": 129616, "epoch": 3086} {"train_loss": -6.5511932373046875, "global_step": 129617, "epoch": 3086} {"train_loss": -6.596986770629883, "global_step": 129618, "epoch": 3086} {"train_loss": -6.620049476623535, "global_step": 129619, "epoch": 3086} {"train_loss": -6.470166206359863, "global_step": 129620, "epoch": 3086} {"train_loss": -6.641885757446289, "global_step": 129621, "epoch": 3086} {"train_loss": -6.638091087341309, "global_step": 129622, "epoch": 3086} {"train_loss": -6.592355728149414, "global_step": 129623, "epoch": 3086} {"train_loss": -6.6437296867370605, "global_step": 129624, "epoch": 3086} {"train_loss": -6.5095062255859375, "global_step": 129625, "epoch": 3086} {"train_loss": -6.564448356628418, "global_step": 129626, "epoch": 3086} {"train_loss": -6.590933799743652, "global_step": 129627, "epoch": 3086} {"train_loss": -6.537845611572266, "global_step": 129628, "epoch": 3086} {"train_loss": -6.57351016998291, "global_step": 129629, "epoch": 3086} {"train_loss": -6.684238433837891, "global_step": 129630, "epoch": 3086} {"train_loss": -6.7293314933776855, "global_step": 129631, "epoch": 3086} {"train_loss": -6.638607025146484, "global_step": 129632, "epoch": 3086} {"train_loss": -6.524970054626465, "global_step": 129633, "epoch": 3086} {"train_loss": -6.616218090057373, "global_step": 129634, "epoch": 3086} {"train_loss": -6.650244235992432, "global_step": 129635, "epoch": 3086} {"train_loss": -6.682923316955566, "global_step": 129636, "epoch": 3086} {"train_loss": -6.656793594360352, "global_step": 129637, "epoch": 3086} {"train_loss": -6.581315994262695, "global_step": 129638, "epoch": 3086} {"train_loss": -6.703494071960449, "global_step": 129639, "epoch": 3086} {"train_loss": -6.541680812835693, "global_step": 129640, "epoch": 3086} {"train_loss": -6.620129585266113, "global_step": 129641, "epoch": 3086} {"train_loss": -6.640355110168457, "global_step": 129642, "epoch": 3086} {"train_loss": -6.736080646514893, "global_step": 129643, "epoch": 3086} {"train_loss": -6.473092555999756, "global_step": 129644, "epoch": 3086} {"train_loss": -6.638816833496094, "global_step": 129645, "epoch": 3086} {"train_loss": -6.628515243530273, "global_step": 129646, "epoch": 3086} {"train_loss": -6.60952091217041, "global_step": 129647, "epoch": 3086} {"train_loss": -6.693313121795654, "global_step": 129648, "epoch": 3086} {"train_loss": -6.62655782699585, "global_step": 129649, "epoch": 3086} {"train_loss": -6.67414665222168, "global_step": 129650, "epoch": 3086} {"train_loss": -6.583458423614502, "global_step": 129651, "epoch": 3086} {"train_loss": -6.632262229919434, "global_step": 129652, "epoch": 3086} {"train_loss": -6.611633448373704, "global_step": 129653, "epoch": 3086, "val_loss": 68092.40625} {"train_loss": -6.687018871307373, "global_step": 129654, "epoch": 3087} {"train_loss": -6.550646781921387, "global_step": 129655, "epoch": 3087} {"train_loss": -6.658280372619629, "global_step": 129656, "epoch": 3087} {"train_loss": -6.495784759521484, "global_step": 129657, "epoch": 3087} {"train_loss": -6.674811840057373, "global_step": 129658, "epoch": 3087} {"train_loss": -6.606430530548096, "global_step": 129659, "epoch": 3087} {"train_loss": -6.636336326599121, "global_step": 129660, "epoch": 3087} {"train_loss": -6.623715877532959, "global_step": 129661, "epoch": 3087} {"train_loss": -6.628561496734619, "global_step": 129662, "epoch": 3087} {"train_loss": -6.6445536613464355, "global_step": 129663, "epoch": 3087} {"train_loss": -6.734769344329834, "global_step": 129664, "epoch": 3087} {"train_loss": -6.560345649719238, "global_step": 129665, "epoch": 3087} {"train_loss": -6.765937805175781, "global_step": 129666, "epoch": 3087} {"train_loss": -6.62188196182251, "global_step": 129667, "epoch": 3087} {"train_loss": -6.706564903259277, "global_step": 129668, "epoch": 3087} {"train_loss": -6.56828498840332, "global_step": 129669, "epoch": 3087} {"train_loss": -6.558612823486328, "global_step": 129670, "epoch": 3087} {"train_loss": -6.687231540679932, "global_step": 129671, "epoch": 3087} {"train_loss": -6.689294815063477, "global_step": 129672, "epoch": 3087} {"train_loss": -6.654069900512695, "global_step": 129673, "epoch": 3087} {"train_loss": -6.6949687004089355, "global_step": 129674, "epoch": 3087} {"train_loss": -6.649120330810547, "global_step": 129675, "epoch": 3087} {"train_loss": -6.7259063720703125, "global_step": 129676, "epoch": 3087} {"train_loss": -6.659069061279297, "global_step": 129677, "epoch": 3087} {"train_loss": -6.776485443115234, "global_step": 129678, "epoch": 3087} {"train_loss": -6.672895431518555, "global_step": 129679, "epoch": 3087} {"train_loss": -6.6636552810668945, "global_step": 129680, "epoch": 3087} {"train_loss": -6.619776248931885, "global_step": 129681, "epoch": 3087} {"train_loss": -6.619427680969238, "global_step": 129682, "epoch": 3087} {"train_loss": -6.61662483215332, "global_step": 129683, "epoch": 3087} {"train_loss": -6.6189985275268555, "global_step": 129684, "epoch": 3087} {"train_loss": -6.624327659606934, "global_step": 129685, "epoch": 3087} {"train_loss": -6.605234622955322, "global_step": 129686, "epoch": 3087} {"train_loss": -6.642627716064453, "global_step": 129687, "epoch": 3087} {"train_loss": -6.628713607788086, "global_step": 129688, "epoch": 3087} {"train_loss": -6.760759353637695, "global_step": 129689, "epoch": 3087} {"train_loss": -6.627490997314453, "global_step": 129690, "epoch": 3087} {"train_loss": -6.605834484100342, "global_step": 129691, "epoch": 3087} {"train_loss": -6.673681259155273, "global_step": 129692, "epoch": 3087} {"train_loss": -6.664072036743164, "global_step": 129693, "epoch": 3087} {"train_loss": -6.575029373168945, "global_step": 129694, "epoch": 3087} {"train_loss": -6.646323181333996, "global_step": 129695, "epoch": 3087, "val_loss": 68430.0546875} {"train_loss": -6.5326151847839355, "global_step": 129696, "epoch": 3088} {"train_loss": -6.589033603668213, "global_step": 129697, "epoch": 3088} {"train_loss": -6.656317710876465, "global_step": 129698, "epoch": 3088} {"train_loss": -6.674294471740723, "global_step": 129699, "epoch": 3088} {"train_loss": -6.731006145477295, "global_step": 129700, "epoch": 3088} {"train_loss": -6.630913734436035, "global_step": 129701, "epoch": 3088} {"train_loss": -6.708286285400391, "global_step": 129702, "epoch": 3088} {"train_loss": -6.633489608764648, "global_step": 129703, "epoch": 3088} {"train_loss": -6.60258674621582, "global_step": 129704, "epoch": 3088} {"train_loss": -6.561469078063965, "global_step": 129705, "epoch": 3088} {"train_loss": -6.6406450271606445, "global_step": 129706, "epoch": 3088} {"train_loss": -6.7917304039001465, "global_step": 129707, "epoch": 3088} {"train_loss": -6.645754814147949, "global_step": 129708, "epoch": 3088} {"train_loss": -6.699275016784668, "global_step": 129709, "epoch": 3088} {"train_loss": -6.746322154998779, "global_step": 129710, "epoch": 3088} {"train_loss": -6.686491966247559, "global_step": 129711, "epoch": 3088} {"train_loss": -6.6888017654418945, "global_step": 129712, "epoch": 3088} {"train_loss": -6.713351249694824, "global_step": 129713, "epoch": 3088} {"train_loss": -6.676541328430176, "global_step": 129714, "epoch": 3088} {"train_loss": -6.6046342849731445, "global_step": 129715, "epoch": 3088} {"train_loss": -6.51284122467041, "global_step": 129716, "epoch": 3088} {"train_loss": -6.692447662353516, "global_step": 129717, "epoch": 3088} {"train_loss": -6.723400115966797, "global_step": 129718, "epoch": 3088} {"train_loss": -6.566651344299316, "global_step": 129719, "epoch": 3088} {"train_loss": -6.614223480224609, "global_step": 129720, "epoch": 3088} {"train_loss": -6.652636528015137, "global_step": 129721, "epoch": 3088} {"train_loss": -6.611715316772461, "global_step": 129722, "epoch": 3088} {"train_loss": -6.520434379577637, "global_step": 129723, "epoch": 3088} {"train_loss": -6.599396705627441, "global_step": 129724, "epoch": 3088} {"train_loss": -6.686612129211426, "global_step": 129725, "epoch": 3088} {"train_loss": -6.420784950256348, "global_step": 129726, "epoch": 3088} {"train_loss": -6.590978622436523, "global_step": 129727, "epoch": 3088} {"train_loss": -6.6281538009643555, "global_step": 129728, "epoch": 3088} {"train_loss": -6.623104572296143, "global_step": 129729, "epoch": 3088} {"train_loss": -6.696710586547852, "global_step": 129730, "epoch": 3088} {"train_loss": -6.612512588500977, "global_step": 129731, "epoch": 3088} {"train_loss": -6.613577365875244, "global_step": 129732, "epoch": 3088} {"train_loss": -6.770630836486816, "global_step": 129733, "epoch": 3088} {"train_loss": -6.695978164672852, "global_step": 129734, "epoch": 3088} {"train_loss": -6.625968933105469, "global_step": 129735, "epoch": 3088} {"train_loss": -6.663724899291992, "global_step": 129736, "epoch": 3088} {"train_loss": -6.641338007790702, "global_step": 129737, "epoch": 3088, "val_loss": 68306.234375} {"train_loss": -6.684329032897949, "global_step": 129738, "epoch": 3089} {"train_loss": -6.630981922149658, "global_step": 129739, "epoch": 3089} {"train_loss": -6.567023277282715, "global_step": 129740, "epoch": 3089} {"train_loss": -6.618978023529053, "global_step": 129741, "epoch": 3089} {"train_loss": -6.636572360992432, "global_step": 129742, "epoch": 3089} {"train_loss": -6.601373672485352, "global_step": 129743, "epoch": 3089} {"train_loss": -6.579130172729492, "global_step": 129744, "epoch": 3089} {"train_loss": -6.686290740966797, "global_step": 129745, "epoch": 3089} {"train_loss": -6.744866847991943, "global_step": 129746, "epoch": 3089} {"train_loss": -6.613035678863525, "global_step": 129747, "epoch": 3089} {"train_loss": -6.566034317016602, "global_step": 129748, "epoch": 3089} {"train_loss": -6.6776227951049805, "global_step": 129749, "epoch": 3089} {"train_loss": -6.778835773468018, "global_step": 129750, "epoch": 3089} {"train_loss": -6.5598883628845215, "global_step": 129751, "epoch": 3089} {"train_loss": -6.622433662414551, "global_step": 129752, "epoch": 3089} {"train_loss": -6.476012229919434, "global_step": 129753, "epoch": 3089} {"train_loss": -6.634160995483398, "global_step": 129754, "epoch": 3089} {"train_loss": -6.541048049926758, "global_step": 129755, "epoch": 3089} {"train_loss": -6.525400638580322, "global_step": 129756, "epoch": 3089} {"train_loss": -6.657554626464844, "global_step": 129757, "epoch": 3089} {"train_loss": -6.435702323913574, "global_step": 129758, "epoch": 3089} {"train_loss": -6.648536682128906, "global_step": 129759, "epoch": 3089} {"train_loss": -6.613577365875244, "global_step": 129760, "epoch": 3089} {"train_loss": -6.539823532104492, "global_step": 129761, "epoch": 3089} {"train_loss": -6.670201301574707, "global_step": 129762, "epoch": 3089} {"train_loss": -6.599203109741211, "global_step": 129763, "epoch": 3089} {"train_loss": -6.412264823913574, "global_step": 129764, "epoch": 3089} {"train_loss": -6.766993045806885, "global_step": 129765, "epoch": 3089} {"train_loss": -6.555296421051025, "global_step": 129766, "epoch": 3089} {"train_loss": -6.603540420532227, "global_step": 129767, "epoch": 3089} {"train_loss": -6.503568649291992, "global_step": 129768, "epoch": 3089} {"train_loss": -6.590963363647461, "global_step": 129769, "epoch": 3089} {"train_loss": -6.634610176086426, "global_step": 129770, "epoch": 3089} {"train_loss": -6.602540493011475, "global_step": 129771, "epoch": 3089} {"train_loss": -6.635725021362305, "global_step": 129772, "epoch": 3089} {"train_loss": -6.611052989959717, "global_step": 129773, "epoch": 3089} {"train_loss": -6.611732482910156, "global_step": 129774, "epoch": 3089} {"train_loss": -6.704111099243164, "global_step": 129775, "epoch": 3089} {"train_loss": -6.701566219329834, "global_step": 129776, "epoch": 3089} {"train_loss": -6.498782634735107, "global_step": 129777, "epoch": 3089} {"train_loss": -6.7093329429626465, "global_step": 129778, "epoch": 3089} {"train_loss": -6.612592436018444, "global_step": 129779, "epoch": 3089, "val_loss": 68307.859375} {"train_loss": -6.548296928405762, "global_step": 129780, "epoch": 3090} {"train_loss": -6.7059173583984375, "global_step": 129781, "epoch": 3090} {"train_loss": -6.682794570922852, "global_step": 129782, "epoch": 3090} {"train_loss": -6.7143964767456055, "global_step": 129783, "epoch": 3090} {"train_loss": -6.6259870529174805, "global_step": 129784, "epoch": 3090} {"train_loss": -6.655747413635254, "global_step": 129785, "epoch": 3090} {"train_loss": -6.769157886505127, "global_step": 129786, "epoch": 3090} {"train_loss": -6.622591972351074, "global_step": 129787, "epoch": 3090} {"train_loss": -6.717293739318848, "global_step": 129788, "epoch": 3090} {"train_loss": -6.717558860778809, "global_step": 129789, "epoch": 3090} {"train_loss": -6.590666770935059, "global_step": 129790, "epoch": 3090} {"train_loss": -6.60373592376709, "global_step": 129791, "epoch": 3090} {"train_loss": -6.684441089630127, "global_step": 129792, "epoch": 3090} {"train_loss": -6.700559616088867, "global_step": 129793, "epoch": 3090} {"train_loss": -6.696874141693115, "global_step": 129794, "epoch": 3090} {"train_loss": -6.544684410095215, "global_step": 129795, "epoch": 3090} {"train_loss": -6.606083869934082, "global_step": 129796, "epoch": 3090} {"train_loss": -6.597458839416504, "global_step": 129797, "epoch": 3090} {"train_loss": -6.62679386138916, "global_step": 129798, "epoch": 3090} {"train_loss": -6.682551383972168, "global_step": 129799, "epoch": 3090} {"train_loss": -6.694584369659424, "global_step": 129800, "epoch": 3090} {"train_loss": -6.679318428039551, "global_step": 129801, "epoch": 3090} {"train_loss": -6.559289932250977, "global_step": 129802, "epoch": 3090} {"train_loss": -6.647217750549316, "global_step": 129803, "epoch": 3090} {"train_loss": -6.627232551574707, "global_step": 129804, "epoch": 3090} {"train_loss": -6.635004997253418, "global_step": 129805, "epoch": 3090} {"train_loss": -6.603309631347656, "global_step": 129806, "epoch": 3090} {"train_loss": -6.684790134429932, "global_step": 129807, "epoch": 3090} {"train_loss": -6.51216983795166, "global_step": 129808, "epoch": 3090} {"train_loss": -6.660233497619629, "global_step": 129809, "epoch": 3090} {"train_loss": -6.551255226135254, "global_step": 129810, "epoch": 3090} {"train_loss": -6.529753684997559, "global_step": 129811, "epoch": 3090} {"train_loss": -6.602785110473633, "global_step": 129812, "epoch": 3090} {"train_loss": -6.638692378997803, "global_step": 129813, "epoch": 3090} {"train_loss": -6.621310234069824, "global_step": 129814, "epoch": 3090} {"train_loss": -6.497532367706299, "global_step": 129815, "epoch": 3090} {"train_loss": -6.688065528869629, "global_step": 129816, "epoch": 3090} {"train_loss": -6.6546430587768555, "global_step": 129817, "epoch": 3090} {"train_loss": -6.809791564941406, "global_step": 129818, "epoch": 3090} {"train_loss": -6.638071060180664, "global_step": 129819, "epoch": 3090} {"train_loss": -6.550309181213379, "global_step": 129820, "epoch": 3090} {"train_loss": -6.63893909681411, "global_step": 129821, "epoch": 3090, "val_loss": 68159.375} {"train_loss": -6.572011947631836, "global_step": 129822, "epoch": 3091} {"train_loss": -6.700822830200195, "global_step": 129823, "epoch": 3091} {"train_loss": -6.536895751953125, "global_step": 129824, "epoch": 3091} {"train_loss": -6.587968349456787, "global_step": 129825, "epoch": 3091} {"train_loss": -6.742842674255371, "global_step": 129826, "epoch": 3091} {"train_loss": -6.55662202835083, "global_step": 129827, "epoch": 3091} {"train_loss": -6.541446685791016, "global_step": 129828, "epoch": 3091} {"train_loss": -6.720888137817383, "global_step": 129829, "epoch": 3091} {"train_loss": -6.619531154632568, "global_step": 129830, "epoch": 3091} {"train_loss": -6.783301830291748, "global_step": 129831, "epoch": 3091} {"train_loss": -6.678786754608154, "global_step": 129832, "epoch": 3091} {"train_loss": -6.513982772827148, "global_step": 129833, "epoch": 3091} {"train_loss": -6.715448379516602, "global_step": 129834, "epoch": 3091} {"train_loss": -6.620675086975098, "global_step": 129835, "epoch": 3091} {"train_loss": -6.593849182128906, "global_step": 129836, "epoch": 3091} {"train_loss": -6.6650567054748535, "global_step": 129837, "epoch": 3091} {"train_loss": -6.53070068359375, "global_step": 129838, "epoch": 3091} {"train_loss": -6.698749542236328, "global_step": 129839, "epoch": 3091} {"train_loss": -6.655261039733887, "global_step": 129840, "epoch": 3091} {"train_loss": -6.539499282836914, "global_step": 129841, "epoch": 3091} {"train_loss": -6.60640287399292, "global_step": 129842, "epoch": 3091} {"train_loss": -6.53825044631958, "global_step": 129843, "epoch": 3091} {"train_loss": -6.579484462738037, "global_step": 129844, "epoch": 3091} {"train_loss": -6.632070541381836, "global_step": 129845, "epoch": 3091} {"train_loss": -6.676851272583008, "global_step": 129846, "epoch": 3091} {"train_loss": -6.6486053466796875, "global_step": 129847, "epoch": 3091} {"train_loss": -6.5628228187561035, "global_step": 129848, "epoch": 3091} {"train_loss": -6.640671730041504, "global_step": 129849, "epoch": 3091} {"train_loss": -6.644667625427246, "global_step": 129850, "epoch": 3091} {"train_loss": -6.689253330230713, "global_step": 129851, "epoch": 3091} {"train_loss": -6.6330132484436035, "global_step": 129852, "epoch": 3091} {"train_loss": -6.747396469116211, "global_step": 129853, "epoch": 3091} {"train_loss": -6.60754919052124, "global_step": 129854, "epoch": 3091} {"train_loss": -6.4730424880981445, "global_step": 129855, "epoch": 3091} {"train_loss": -6.652848243713379, "global_step": 129856, "epoch": 3091} {"train_loss": -6.6600189208984375, "global_step": 129857, "epoch": 3091} {"train_loss": -6.671696662902832, "global_step": 129858, "epoch": 3091} {"train_loss": -6.587307453155518, "global_step": 129859, "epoch": 3091} {"train_loss": -6.645253658294678, "global_step": 129860, "epoch": 3091} {"train_loss": -6.585146427154541, "global_step": 129861, "epoch": 3091} {"train_loss": -6.579804420471191, "global_step": 129862, "epoch": 3091} {"train_loss": -6.621298438026791, "global_step": 129863, "epoch": 3091, "val_loss": 68147.4296875} {"train_loss": -6.654143333435059, "global_step": 129864, "epoch": 3092} {"train_loss": -6.596598148345947, "global_step": 129865, "epoch": 3092} {"train_loss": -6.558829307556152, "global_step": 129866, "epoch": 3092} {"train_loss": -6.70463752746582, "global_step": 129867, "epoch": 3092} {"train_loss": -6.673272132873535, "global_step": 129868, "epoch": 3092} {"train_loss": -6.764612197875977, "global_step": 129869, "epoch": 3092} {"train_loss": -6.6801533699035645, "global_step": 129870, "epoch": 3092} {"train_loss": -6.653893947601318, "global_step": 129871, "epoch": 3092} {"train_loss": -6.688334941864014, "global_step": 129872, "epoch": 3092} {"train_loss": -6.627368927001953, "global_step": 129873, "epoch": 3092} {"train_loss": -6.671728134155273, "global_step": 129874, "epoch": 3092} {"train_loss": -6.608027458190918, "global_step": 129875, "epoch": 3092} {"train_loss": -6.696545600891113, "global_step": 129876, "epoch": 3092} {"train_loss": -6.749162197113037, "global_step": 129877, "epoch": 3092} {"train_loss": -6.639761924743652, "global_step": 129878, "epoch": 3092} {"train_loss": -6.762454032897949, "global_step": 129879, "epoch": 3092} {"train_loss": -6.612022876739502, "global_step": 129880, "epoch": 3092} {"train_loss": -6.812236785888672, "global_step": 129881, "epoch": 3092} {"train_loss": -6.669985771179199, "global_step": 129882, "epoch": 3092} {"train_loss": -6.6012115478515625, "global_step": 129883, "epoch": 3092} {"train_loss": -6.649753570556641, "global_step": 129884, "epoch": 3092} {"train_loss": -6.8314666748046875, "global_step": 129885, "epoch": 3092} {"train_loss": -6.611667633056641, "global_step": 129886, "epoch": 3092} {"train_loss": -6.7364301681518555, "global_step": 129887, "epoch": 3092} {"train_loss": -6.663321018218994, "global_step": 129888, "epoch": 3092} {"train_loss": -6.73005485534668, "global_step": 129889, "epoch": 3092} {"train_loss": -6.666779518127441, "global_step": 129890, "epoch": 3092} {"train_loss": -6.657440185546875, "global_step": 129891, "epoch": 3092} {"train_loss": -6.775246620178223, "global_step": 129892, "epoch": 3092} {"train_loss": -6.68820858001709, "global_step": 129893, "epoch": 3092} {"train_loss": -6.608445167541504, "global_step": 129894, "epoch": 3092} {"train_loss": -6.623900890350342, "global_step": 129895, "epoch": 3092} {"train_loss": -6.670949935913086, "global_step": 129896, "epoch": 3092} {"train_loss": -6.7526750564575195, "global_step": 129897, "epoch": 3092} {"train_loss": -6.665091037750244, "global_step": 129898, "epoch": 3092} {"train_loss": -6.549090385437012, "global_step": 129899, "epoch": 3092} {"train_loss": -6.71975040435791, "global_step": 129900, "epoch": 3092} {"train_loss": -6.61055850982666, "global_step": 129901, "epoch": 3092} {"train_loss": -6.643824577331543, "global_step": 129902, "epoch": 3092} {"train_loss": -6.619630813598633, "global_step": 129903, "epoch": 3092} {"train_loss": -6.521087646484375, "global_step": 129904, "epoch": 3092} {"train_loss": -6.669635046096075, "global_step": 129905, "epoch": 3092, "val_loss": 68245.3515625} {"train_loss": -6.63663911819458, "global_step": 129906, "epoch": 3093} {"train_loss": -6.683152198791504, "global_step": 129907, "epoch": 3093} {"train_loss": -6.618134021759033, "global_step": 129908, "epoch": 3093} {"train_loss": -6.613375663757324, "global_step": 129909, "epoch": 3093} {"train_loss": -6.646222114562988, "global_step": 129910, "epoch": 3093} {"train_loss": -6.753748416900635, "global_step": 129911, "epoch": 3093} {"train_loss": -6.618117332458496, "global_step": 129912, "epoch": 3093} {"train_loss": -6.7154316902160645, "global_step": 129913, "epoch": 3093} {"train_loss": -6.67598819732666, "global_step": 129914, "epoch": 3093} {"train_loss": -6.6730523109436035, "global_step": 129915, "epoch": 3093} {"train_loss": -6.639547824859619, "global_step": 129916, "epoch": 3093} {"train_loss": -6.6326751708984375, "global_step": 129917, "epoch": 3093} {"train_loss": -6.644013404846191, "global_step": 129918, "epoch": 3093} {"train_loss": -6.6770429611206055, "global_step": 129919, "epoch": 3093} {"train_loss": -6.698700904846191, "global_step": 129920, "epoch": 3093} {"train_loss": -6.600813865661621, "global_step": 129921, "epoch": 3093} {"train_loss": -6.623793601989746, "global_step": 129922, "epoch": 3093} {"train_loss": -6.685832977294922, "global_step": 129923, "epoch": 3093} {"train_loss": -6.583321571350098, "global_step": 129924, "epoch": 3093} {"train_loss": -6.50649356842041, "global_step": 129925, "epoch": 3093} {"train_loss": -6.638733863830566, "global_step": 129926, "epoch": 3093} {"train_loss": -6.679746627807617, "global_step": 129927, "epoch": 3093} {"train_loss": -6.740632057189941, "global_step": 129928, "epoch": 3093} {"train_loss": -6.593613624572754, "global_step": 129929, "epoch": 3093} {"train_loss": -6.606698989868164, "global_step": 129930, "epoch": 3093} {"train_loss": -6.526213645935059, "global_step": 129931, "epoch": 3093} {"train_loss": -6.718445777893066, "global_step": 129932, "epoch": 3093} {"train_loss": -6.629034042358398, "global_step": 129933, "epoch": 3093} {"train_loss": -6.650831699371338, "global_step": 129934, "epoch": 3093} {"train_loss": -6.695880889892578, "global_step": 129935, "epoch": 3093} {"train_loss": -6.596560001373291, "global_step": 129936, "epoch": 3093} {"train_loss": -6.602867126464844, "global_step": 129937, "epoch": 3093} {"train_loss": -6.653115272521973, "global_step": 129938, "epoch": 3093} {"train_loss": -6.586154937744141, "global_step": 129939, "epoch": 3093} {"train_loss": -6.595297813415527, "global_step": 129940, "epoch": 3093} {"train_loss": -6.53819465637207, "global_step": 129941, "epoch": 3093} {"train_loss": -6.577550888061523, "global_step": 129942, "epoch": 3093} {"train_loss": -6.641207695007324, "global_step": 129943, "epoch": 3093} {"train_loss": -6.58328914642334, "global_step": 129944, "epoch": 3093} {"train_loss": -6.7190423011779785, "global_step": 129945, "epoch": 3093} {"train_loss": -6.551778793334961, "global_step": 129946, "epoch": 3093} {"train_loss": -6.634935095196679, "global_step": 129947, "epoch": 3093, "val_loss": 68445.0546875} {"train_loss": -6.721401214599609, "global_step": 129948, "epoch": 3094} {"train_loss": -6.606997013092041, "global_step": 129949, "epoch": 3094} {"train_loss": -6.607329368591309, "global_step": 129950, "epoch": 3094} {"train_loss": -6.555682182312012, "global_step": 129951, "epoch": 3094} {"train_loss": -6.584473133087158, "global_step": 129952, "epoch": 3094} {"train_loss": -6.652392864227295, "global_step": 129953, "epoch": 3094} {"train_loss": -6.435585021972656, "global_step": 129954, "epoch": 3094} {"train_loss": -6.62086820602417, "global_step": 129955, "epoch": 3094} {"train_loss": -6.548463344573975, "global_step": 129956, "epoch": 3094} {"train_loss": -6.665566444396973, "global_step": 129957, "epoch": 3094} {"train_loss": -6.732763290405273, "global_step": 129958, "epoch": 3094} {"train_loss": -6.616568565368652, "global_step": 129959, "epoch": 3094} {"train_loss": -6.5962395668029785, "global_step": 129960, "epoch": 3094} {"train_loss": -6.564640998840332, "global_step": 129961, "epoch": 3094} {"train_loss": -6.606415748596191, "global_step": 129962, "epoch": 3094} {"train_loss": -6.54833459854126, "global_step": 129963, "epoch": 3094} {"train_loss": -6.60488224029541, "global_step": 129964, "epoch": 3094} {"train_loss": -6.6784491539001465, "global_step": 129965, "epoch": 3094} {"train_loss": -6.66412353515625, "global_step": 129966, "epoch": 3094} {"train_loss": -6.600592613220215, "global_step": 129967, "epoch": 3094} {"train_loss": -6.703547477722168, "global_step": 129968, "epoch": 3094} {"train_loss": -6.636672496795654, "global_step": 129969, "epoch": 3094} {"train_loss": -6.715794563293457, "global_step": 129970, "epoch": 3094} {"train_loss": -6.705385208129883, "global_step": 129971, "epoch": 3094} {"train_loss": -6.500618934631348, "global_step": 129972, "epoch": 3094} {"train_loss": -6.5868144035339355, "global_step": 129973, "epoch": 3094} {"train_loss": -6.698038578033447, "global_step": 129974, "epoch": 3094} {"train_loss": -6.7147536277771, "global_step": 129975, "epoch": 3094} {"train_loss": -6.668278694152832, "global_step": 129976, "epoch": 3094} {"train_loss": -6.682103157043457, "global_step": 129977, "epoch": 3094} {"train_loss": -6.75367546081543, "global_step": 129978, "epoch": 3094} {"train_loss": -6.734325408935547, "global_step": 129979, "epoch": 3094} {"train_loss": -6.646000862121582, "global_step": 129980, "epoch": 3094} {"train_loss": -6.687255859375, "global_step": 129981, "epoch": 3094} {"train_loss": -6.734833717346191, "global_step": 129982, "epoch": 3094} {"train_loss": -6.575477600097656, "global_step": 129983, "epoch": 3094} {"train_loss": -6.658624649047852, "global_step": 129984, "epoch": 3094} {"train_loss": -6.496371746063232, "global_step": 129985, "epoch": 3094} {"train_loss": -6.629793643951416, "global_step": 129986, "epoch": 3094} {"train_loss": -6.549663543701172, "global_step": 129987, "epoch": 3094} {"train_loss": -6.4076032638549805, "global_step": 129988, "epoch": 3094} {"train_loss": -6.622297332400367, "global_step": 129989, "epoch": 3094, "val_loss": 68527.421875} {"train_loss": -6.56131649017334, "global_step": 129990, "epoch": 3095} {"train_loss": -6.503856658935547, "global_step": 129991, "epoch": 3095} {"train_loss": -6.613132476806641, "global_step": 129992, "epoch": 3095} {"train_loss": -6.488640785217285, "global_step": 129993, "epoch": 3095} {"train_loss": -6.477109909057617, "global_step": 129994, "epoch": 3095} {"train_loss": -6.515331268310547, "global_step": 129995, "epoch": 3095} {"train_loss": -6.6223602294921875, "global_step": 129996, "epoch": 3095} {"train_loss": -6.472823619842529, "global_step": 129997, "epoch": 3095} {"train_loss": -6.657619476318359, "global_step": 129998, "epoch": 3095} {"train_loss": -6.53151798248291, "global_step": 129999, "epoch": 3095} {"train_loss": -6.538641452789307, "global_step": 130000, "epoch": 3095} {"train_loss": -6.574738502502441, "global_step": 130001, "epoch": 3095} {"train_loss": -6.651310920715332, "global_step": 130002, "epoch": 3095} {"train_loss": -6.565377712249756, "global_step": 130003, "epoch": 3095} {"train_loss": -6.674915790557861, "global_step": 130004, "epoch": 3095} {"train_loss": -6.665222644805908, "global_step": 130005, "epoch": 3095} {"train_loss": -6.675689697265625, "global_step": 130006, "epoch": 3095} {"train_loss": -6.657137870788574, "global_step": 130007, "epoch": 3095} {"train_loss": -6.7275190353393555, "global_step": 130008, "epoch": 3095} {"train_loss": -6.640985012054443, "global_step": 130009, "epoch": 3095} {"train_loss": -6.582798004150391, "global_step": 130010, "epoch": 3095} {"train_loss": -6.604404449462891, "global_step": 130011, "epoch": 3095} {"train_loss": -6.674492835998535, "global_step": 130012, "epoch": 3095} {"train_loss": -6.6999711990356445, "global_step": 130013, "epoch": 3095} {"train_loss": -6.570906639099121, "global_step": 130014, "epoch": 3095} {"train_loss": -6.654987335205078, "global_step": 130015, "epoch": 3095} {"train_loss": -6.591479301452637, "global_step": 130016, "epoch": 3095} {"train_loss": -6.573750019073486, "global_step": 130017, "epoch": 3095} {"train_loss": -6.699221611022949, "global_step": 130018, "epoch": 3095} {"train_loss": -6.594281196594238, "global_step": 130019, "epoch": 3095} {"train_loss": -6.683197975158691, "global_step": 130020, "epoch": 3095} {"train_loss": -6.60513162612915, "global_step": 130021, "epoch": 3095} {"train_loss": -6.563810348510742, "global_step": 130022, "epoch": 3095} {"train_loss": -6.675995826721191, "global_step": 130023, "epoch": 3095} {"train_loss": -6.666947841644287, "global_step": 130024, "epoch": 3095} {"train_loss": -6.60020112991333, "global_step": 130025, "epoch": 3095} {"train_loss": -6.5961995124816895, "global_step": 130026, "epoch": 3095} {"train_loss": -6.604109764099121, "global_step": 130027, "epoch": 3095} {"train_loss": -6.686613082885742, "global_step": 130028, "epoch": 3095} {"train_loss": -6.666549205780029, "global_step": 130029, "epoch": 3095} {"train_loss": -6.587202072143555, "global_step": 130030, "epoch": 3095} {"train_loss": -6.61108272416251, "global_step": 130031, "epoch": 3095, "val_loss": 68202.1640625} {"train_loss": -6.497676849365234, "global_step": 130032, "epoch": 3096} {"train_loss": -6.620333671569824, "global_step": 130033, "epoch": 3096} {"train_loss": -6.647212028503418, "global_step": 130034, "epoch": 3096} {"train_loss": -6.58466911315918, "global_step": 130035, "epoch": 3096} {"train_loss": -6.740569114685059, "global_step": 130036, "epoch": 3096} {"train_loss": -6.695989608764648, "global_step": 130037, "epoch": 3096} {"train_loss": -6.657134056091309, "global_step": 130038, "epoch": 3096} {"train_loss": -6.733888626098633, "global_step": 130039, "epoch": 3096} {"train_loss": -6.628849983215332, "global_step": 130040, "epoch": 3096} {"train_loss": -6.649897575378418, "global_step": 130041, "epoch": 3096} {"train_loss": -6.651980876922607, "global_step": 130042, "epoch": 3096} {"train_loss": -6.569725513458252, "global_step": 130043, "epoch": 3096} {"train_loss": -6.5125532150268555, "global_step": 130044, "epoch": 3096} {"train_loss": -6.668513774871826, "global_step": 130045, "epoch": 3096} {"train_loss": -6.632179260253906, "global_step": 130046, "epoch": 3096} {"train_loss": -6.6969404220581055, "global_step": 130047, "epoch": 3096} {"train_loss": -6.638010025024414, "global_step": 130048, "epoch": 3096} {"train_loss": -6.538760185241699, "global_step": 130049, "epoch": 3096} {"train_loss": -6.591469764709473, "global_step": 130050, "epoch": 3096} {"train_loss": -6.656552314758301, "global_step": 130051, "epoch": 3096} {"train_loss": -6.537951469421387, "global_step": 130052, "epoch": 3096} {"train_loss": -6.610315799713135, "global_step": 130053, "epoch": 3096} {"train_loss": -6.639109134674072, "global_step": 130054, "epoch": 3096} {"train_loss": -6.582427978515625, "global_step": 130055, "epoch": 3096} {"train_loss": -6.712841033935547, "global_step": 130056, "epoch": 3096} {"train_loss": -6.725587368011475, "global_step": 130057, "epoch": 3096} {"train_loss": -6.6632890701293945, "global_step": 130058, "epoch": 3096} {"train_loss": -6.544851303100586, "global_step": 130059, "epoch": 3096} {"train_loss": -6.64378547668457, "global_step": 130060, "epoch": 3096} {"train_loss": -6.592016696929932, "global_step": 130061, "epoch": 3096} {"train_loss": -6.629871368408203, "global_step": 130062, "epoch": 3096} {"train_loss": -6.681502342224121, "global_step": 130063, "epoch": 3096} {"train_loss": -6.717310905456543, "global_step": 130064, "epoch": 3096} {"train_loss": -6.578518390655518, "global_step": 130065, "epoch": 3096} {"train_loss": -6.590631484985352, "global_step": 130066, "epoch": 3096} {"train_loss": -6.51387882232666, "global_step": 130067, "epoch": 3096} {"train_loss": -6.709532737731934, "global_step": 130068, "epoch": 3096} {"train_loss": -6.6212968826293945, "global_step": 130069, "epoch": 3096} {"train_loss": -6.524904727935791, "global_step": 130070, "epoch": 3096} {"train_loss": -6.623928070068359, "global_step": 130071, "epoch": 3096} {"train_loss": -6.548699378967285, "global_step": 130072, "epoch": 3096} {"train_loss": -6.624049515951247, "global_step": 130073, "epoch": 3096, "val_loss": 68180.1640625} {"train_loss": -6.595892429351807, "global_step": 130074, "epoch": 3097} {"train_loss": -6.708355903625488, "global_step": 130075, "epoch": 3097} {"train_loss": -6.558843612670898, "global_step": 130076, "epoch": 3097} {"train_loss": -6.599551677703857, "global_step": 130077, "epoch": 3097} {"train_loss": -6.653398036956787, "global_step": 130078, "epoch": 3097} {"train_loss": -6.699256420135498, "global_step": 130079, "epoch": 3097} {"train_loss": -6.574289321899414, "global_step": 130080, "epoch": 3097} {"train_loss": -6.54010009765625, "global_step": 130081, "epoch": 3097} {"train_loss": -6.64838981628418, "global_step": 130082, "epoch": 3097} {"train_loss": -6.719354629516602, "global_step": 130083, "epoch": 3097} {"train_loss": -6.7094316482543945, "global_step": 130084, "epoch": 3097} {"train_loss": -6.696136951446533, "global_step": 130085, "epoch": 3097} {"train_loss": -6.556875228881836, "global_step": 130086, "epoch": 3097} {"train_loss": -6.595303535461426, "global_step": 130087, "epoch": 3097} {"train_loss": -6.610710144042969, "global_step": 130088, "epoch": 3097} {"train_loss": -6.572021961212158, "global_step": 130089, "epoch": 3097} {"train_loss": -6.663975715637207, "global_step": 130090, "epoch": 3097} {"train_loss": -6.628073692321777, "global_step": 130091, "epoch": 3097} {"train_loss": -6.642560958862305, "global_step": 130092, "epoch": 3097} {"train_loss": -6.662154674530029, "global_step": 130093, "epoch": 3097} {"train_loss": -6.642759323120117, "global_step": 130094, "epoch": 3097} {"train_loss": -6.675956726074219, "global_step": 130095, "epoch": 3097} {"train_loss": -6.591612339019775, "global_step": 130096, "epoch": 3097} {"train_loss": -6.640414237976074, "global_step": 130097, "epoch": 3097} {"train_loss": -6.606429100036621, "global_step": 130098, "epoch": 3097} {"train_loss": -6.619616985321045, "global_step": 130099, "epoch": 3097} {"train_loss": -6.587921619415283, "global_step": 130100, "epoch": 3097} {"train_loss": -6.598141193389893, "global_step": 130101, "epoch": 3097} {"train_loss": -6.597594738006592, "global_step": 130102, "epoch": 3097} {"train_loss": -6.594642639160156, "global_step": 130103, "epoch": 3097} {"train_loss": -6.630054473876953, "global_step": 130104, "epoch": 3097} {"train_loss": -6.578502178192139, "global_step": 130105, "epoch": 3097} {"train_loss": -6.490277290344238, "global_step": 130106, "epoch": 3097} {"train_loss": -6.620064735412598, "global_step": 130107, "epoch": 3097} {"train_loss": -6.530756950378418, "global_step": 130108, "epoch": 3097} {"train_loss": -6.62886381149292, "global_step": 130109, "epoch": 3097} {"train_loss": -6.560297012329102, "global_step": 130110, "epoch": 3097} {"train_loss": -6.489844799041748, "global_step": 130111, "epoch": 3097} {"train_loss": -6.562685012817383, "global_step": 130112, "epoch": 3097} {"train_loss": -6.478353500366211, "global_step": 130113, "epoch": 3097} {"train_loss": -6.605554103851318, "global_step": 130114, "epoch": 3097} {"train_loss": -6.60930491629101, "global_step": 130115, "epoch": 3097, "val_loss": 68319.015625} {"train_loss": -6.622732162475586, "global_step": 130116, "epoch": 3098} {"train_loss": -6.463223457336426, "global_step": 130117, "epoch": 3098} {"train_loss": -6.6112847328186035, "global_step": 130118, "epoch": 3098} {"train_loss": -6.625200271606445, "global_step": 130119, "epoch": 3098} {"train_loss": -6.527223110198975, "global_step": 130120, "epoch": 3098} {"train_loss": -6.587859153747559, "global_step": 130121, "epoch": 3098} {"train_loss": -6.4755096435546875, "global_step": 130122, "epoch": 3098} {"train_loss": -6.570580959320068, "global_step": 130123, "epoch": 3098} {"train_loss": -6.609713077545166, "global_step": 130124, "epoch": 3098} {"train_loss": -6.569653511047363, "global_step": 130125, "epoch": 3098} {"train_loss": -6.577617168426514, "global_step": 130126, "epoch": 3098} {"train_loss": -6.512348175048828, "global_step": 130127, "epoch": 3098} {"train_loss": -6.595426082611084, "global_step": 130128, "epoch": 3098} {"train_loss": -6.560807228088379, "global_step": 130129, "epoch": 3098} {"train_loss": -6.6208109855651855, "global_step": 130130, "epoch": 3098} {"train_loss": -6.5547027587890625, "global_step": 130131, "epoch": 3098} {"train_loss": -6.674315929412842, "global_step": 130132, "epoch": 3098} {"train_loss": -6.617836952209473, "global_step": 130133, "epoch": 3098} {"train_loss": -6.583453178405762, "global_step": 130134, "epoch": 3098} {"train_loss": -6.6112060546875, "global_step": 130135, "epoch": 3098} {"train_loss": -6.600172996520996, "global_step": 130136, "epoch": 3098} {"train_loss": -6.688783645629883, "global_step": 130137, "epoch": 3098} {"train_loss": -6.640317916870117, "global_step": 130138, "epoch": 3098} {"train_loss": -6.615400791168213, "global_step": 130139, "epoch": 3098} {"train_loss": -6.5935540199279785, "global_step": 130140, "epoch": 3098} {"train_loss": -6.595000267028809, "global_step": 130141, "epoch": 3098} {"train_loss": -6.744892597198486, "global_step": 130142, "epoch": 3098} {"train_loss": -6.584628582000732, "global_step": 130143, "epoch": 3098} {"train_loss": -6.593226432800293, "global_step": 130144, "epoch": 3098} {"train_loss": -6.5362372398376465, "global_step": 130145, "epoch": 3098} {"train_loss": -6.783513069152832, "global_step": 130146, "epoch": 3098} {"train_loss": -6.702014923095703, "global_step": 130147, "epoch": 3098} {"train_loss": -6.603628158569336, "global_step": 130148, "epoch": 3098} {"train_loss": -6.647037506103516, "global_step": 130149, "epoch": 3098} {"train_loss": -6.706211090087891, "global_step": 130150, "epoch": 3098} {"train_loss": -6.493026256561279, "global_step": 130151, "epoch": 3098} {"train_loss": -6.733277320861816, "global_step": 130152, "epoch": 3098} {"train_loss": -6.6027374267578125, "global_step": 130153, "epoch": 3098} {"train_loss": -6.598959922790527, "global_step": 130154, "epoch": 3098} {"train_loss": -6.716320514678955, "global_step": 130155, "epoch": 3098} {"train_loss": -6.593935966491699, "global_step": 130156, "epoch": 3098} {"train_loss": -6.608482508432298, "global_step": 130157, "epoch": 3098, "val_loss": 68037.453125} {"train_loss": -6.700761795043945, "global_step": 130158, "epoch": 3099} {"train_loss": -6.634677886962891, "global_step": 130159, "epoch": 3099} {"train_loss": -6.627180099487305, "global_step": 130160, "epoch": 3099} {"train_loss": -6.608928680419922, "global_step": 130161, "epoch": 3099} {"train_loss": -6.658059120178223, "global_step": 130162, "epoch": 3099} {"train_loss": -6.576223850250244, "global_step": 130163, "epoch": 3099} {"train_loss": -6.625720024108887, "global_step": 130164, "epoch": 3099} {"train_loss": -6.479753017425537, "global_step": 130165, "epoch": 3099} {"train_loss": -6.762120246887207, "global_step": 130166, "epoch": 3099} {"train_loss": -6.504358291625977, "global_step": 130167, "epoch": 3099} {"train_loss": -6.609547138214111, "global_step": 130168, "epoch": 3099} {"train_loss": -6.6805267333984375, "global_step": 130169, "epoch": 3099} {"train_loss": -6.539703369140625, "global_step": 130170, "epoch": 3099} {"train_loss": -6.5121564865112305, "global_step": 130171, "epoch": 3099} {"train_loss": -6.6430983543396, "global_step": 130172, "epoch": 3099} {"train_loss": -6.641850471496582, "global_step": 130173, "epoch": 3099} {"train_loss": -6.530640602111816, "global_step": 130174, "epoch": 3099} {"train_loss": -6.605790138244629, "global_step": 130175, "epoch": 3099} {"train_loss": -6.446011066436768, "global_step": 130176, "epoch": 3099} {"train_loss": -6.501396179199219, "global_step": 130177, "epoch": 3099} {"train_loss": -6.676273822784424, "global_step": 130178, "epoch": 3099} {"train_loss": -6.541351318359375, "global_step": 130179, "epoch": 3099} {"train_loss": -6.599440097808838, "global_step": 130180, "epoch": 3099} {"train_loss": -6.638289451599121, "global_step": 130181, "epoch": 3099} {"train_loss": -6.597054481506348, "global_step": 130182, "epoch": 3099} {"train_loss": -6.4272003173828125, "global_step": 130183, "epoch": 3099} {"train_loss": -6.56718635559082, "global_step": 130184, "epoch": 3099} {"train_loss": -6.551849365234375, "global_step": 130185, "epoch": 3099} {"train_loss": -6.556870460510254, "global_step": 130186, "epoch": 3099} {"train_loss": -6.584142684936523, "global_step": 130187, "epoch": 3099} {"train_loss": -6.535243988037109, "global_step": 130188, "epoch": 3099} {"train_loss": -6.539299011230469, "global_step": 130189, "epoch": 3099} {"train_loss": -6.454559326171875, "global_step": 130190, "epoch": 3099} {"train_loss": -6.501633167266846, "global_step": 130191, "epoch": 3099} {"train_loss": -6.696393966674805, "global_step": 130192, "epoch": 3099} {"train_loss": -6.546508312225342, "global_step": 130193, "epoch": 3099} {"train_loss": -6.663910865783691, "global_step": 130194, "epoch": 3099} {"train_loss": -6.587324142456055, "global_step": 130195, "epoch": 3099} {"train_loss": -6.668376922607422, "global_step": 130196, "epoch": 3099} {"train_loss": -6.647916793823242, "global_step": 130197, "epoch": 3099} {"train_loss": -6.598163604736328, "global_step": 130198, "epoch": 3099} {"train_loss": -6.585811070033482, "global_step": 130199, "epoch": 3099, "val_loss": 68176.625} {"train_loss": -6.623271942138672, "global_step": 130200, "epoch": 3100} {"train_loss": -6.530484199523926, "global_step": 130201, "epoch": 3100} {"train_loss": -6.5105366706848145, "global_step": 130202, "epoch": 3100} {"train_loss": -6.529557228088379, "global_step": 130203, "epoch": 3100} {"train_loss": -6.649325370788574, "global_step": 130204, "epoch": 3100} {"train_loss": -6.663814544677734, "global_step": 130205, "epoch": 3100} {"train_loss": -6.441845893859863, "global_step": 130206, "epoch": 3100} {"train_loss": -6.646293640136719, "global_step": 130207, "epoch": 3100} {"train_loss": -6.616881370544434, "global_step": 130208, "epoch": 3100} {"train_loss": -6.579094886779785, "global_step": 130209, "epoch": 3100} {"train_loss": -6.608994007110596, "global_step": 130210, "epoch": 3100} {"train_loss": -6.637674808502197, "global_step": 130211, "epoch": 3100} {"train_loss": -6.677609920501709, "global_step": 130212, "epoch": 3100} {"train_loss": -6.581816673278809, "global_step": 130213, "epoch": 3100} {"train_loss": -6.6227216720581055, "global_step": 130214, "epoch": 3100} {"train_loss": -6.663083076477051, "global_step": 130215, "epoch": 3100} {"train_loss": -6.601416110992432, "global_step": 130216, "epoch": 3100} {"train_loss": -6.5494794845581055, "global_step": 130217, "epoch": 3100} {"train_loss": -6.675620079040527, "global_step": 130218, "epoch": 3100} {"train_loss": -6.614630699157715, "global_step": 130219, "epoch": 3100} {"train_loss": -6.56435489654541, "global_step": 130220, "epoch": 3100} {"train_loss": -6.66623067855835, "global_step": 130221, "epoch": 3100} {"train_loss": -6.587176322937012, "global_step": 130222, "epoch": 3100} {"train_loss": -6.583756446838379, "global_step": 130223, "epoch": 3100} {"train_loss": -6.639023780822754, "global_step": 130224, "epoch": 3100} {"train_loss": -6.669158935546875, "global_step": 130225, "epoch": 3100} {"train_loss": -6.656132698059082, "global_step": 130226, "epoch": 3100} {"train_loss": -6.709323883056641, "global_step": 130227, "epoch": 3100} {"train_loss": -6.632757663726807, "global_step": 130228, "epoch": 3100} {"train_loss": -6.66619873046875, "global_step": 130229, "epoch": 3100} {"train_loss": -6.602609157562256, "global_step": 130230, "epoch": 3100} {"train_loss": -6.736894607543945, "global_step": 130231, "epoch": 3100} {"train_loss": -6.57772159576416, "global_step": 130232, "epoch": 3100} {"train_loss": -6.740042209625244, "global_step": 130233, "epoch": 3100} {"train_loss": -6.543015480041504, "global_step": 130234, "epoch": 3100} {"train_loss": -6.516313552856445, "global_step": 130235, "epoch": 3100} {"train_loss": -6.607238292694092, "global_step": 130236, "epoch": 3100} {"train_loss": -6.592688083648682, "global_step": 130237, "epoch": 3100} {"train_loss": -6.675786972045898, "global_step": 130238, "epoch": 3100} {"train_loss": -6.647021293640137, "global_step": 130239, "epoch": 3100} {"train_loss": -6.509194374084473, "global_step": 130240, "epoch": 3100} {"train_loss": -6.61415924344744, "global_step": 130241, "epoch": 3100, "train/sim_max_reward_0": 0.1946793111195469, "train/sim_max_reward_1": 0.9722566579622712, "train/sim_max_reward_2": 0.8231191552543056, "train/sim_max_reward_3": 0.14039665844315144, "train/sim_max_reward_4": 0.9450449601898891, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.21194490907890526, "test/sim_max_reward_4400001": 0.4864935108735972, "test/sim_max_reward_4400002": 0.5489186097239923, "test/sim_max_reward_4400003": 0.0011118057723486202, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9958575221620808, "test/sim_max_reward_4400006": 0.9891953745021371, "test/sim_max_reward_4400007": 0.8359356264694785, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9914304848565257, "test/sim_max_reward_4400010": 0.20398728299624114, "test/sim_max_reward_4400011": 0.6342921833033464, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.2854350487937265, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24882377251316892, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.967834573331097, "test/sim_max_reward_4400021": 0.4694416208736121, "test/sim_max_reward_4400022": 0.9264109068580686, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.9676335533292066, "test/sim_max_reward_4400025": 0.26124865208770226, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.03398279828389774, "test/sim_max_reward_4400028": 0.40445454325367863, "test/sim_max_reward_4400029": 0.5568007056334737, "test/sim_max_reward_4400030": 0.9817289539131173, "test/sim_max_reward_4400031": 0.9739336277494587, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9162337162672701, "test/sim_max_reward_4400034": 0.8815072910419781, "test/sim_max_reward_4400035": 0.9173732333903483, "test/sim_max_reward_4400036": 0.3629087234588733, "test/sim_max_reward_4400037": 0.946641282593946, "test/sim_max_reward_4400038": 0.9321306502666982, "test/sim_max_reward_4400039": 0.8729388695770225, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9485026150652143, "test/sim_max_reward_4400042": 0.8971762664092221, "test/sim_max_reward_4400043": 0.9861234207230734, "test/sim_max_reward_4400044": 0.9825757022716235, "test/sim_max_reward_4400045": 0.8507647556745108, "test/sim_max_reward_4400046": 0.36513288306598946, "test/sim_max_reward_4400047": 0.9199398074067726, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.4433213021585293, "train/mean_score": 0.5447469170552253, "test/mean_score": 0.5733595632221209, "val_loss": 68237.390625} {"train_loss": -6.583774089813232, "global_step": 130242, "epoch": 3101} {"train_loss": -6.66181755065918, "global_step": 130243, "epoch": 3101} {"train_loss": -6.664348602294922, "global_step": 130244, "epoch": 3101} {"train_loss": -6.638525485992432, "global_step": 130245, "epoch": 3101} {"train_loss": -6.586942672729492, "global_step": 130246, "epoch": 3101} {"train_loss": -6.582683563232422, "global_step": 130247, "epoch": 3101} {"train_loss": -6.548113822937012, "global_step": 130248, "epoch": 3101} {"train_loss": -6.685434818267822, "global_step": 130249, "epoch": 3101} {"train_loss": -6.5354814529418945, "global_step": 130250, "epoch": 3101} {"train_loss": -6.720858573913574, "global_step": 130251, "epoch": 3101} {"train_loss": -6.521345138549805, "global_step": 130252, "epoch": 3101} {"train_loss": -6.66272497177124, "global_step": 130253, "epoch": 3101} {"train_loss": -6.642910957336426, "global_step": 130254, "epoch": 3101} {"train_loss": -6.656119346618652, "global_step": 130255, "epoch": 3101} {"train_loss": -6.575236797332764, "global_step": 130256, "epoch": 3101} {"train_loss": -6.576696395874023, "global_step": 130257, "epoch": 3101} {"train_loss": -6.5291643142700195, "global_step": 130258, "epoch": 3101} {"train_loss": -6.598639011383057, "global_step": 130259, "epoch": 3101} {"train_loss": -6.613012313842773, "global_step": 130260, "epoch": 3101} {"train_loss": -6.540559768676758, "global_step": 130261, "epoch": 3101} {"train_loss": -6.465356826782227, "global_step": 130262, "epoch": 3101} {"train_loss": -6.565771579742432, "global_step": 130263, "epoch": 3101} {"train_loss": -6.526276588439941, "global_step": 130264, "epoch": 3101} {"train_loss": -6.565382480621338, "global_step": 130265, "epoch": 3101} {"train_loss": -6.56294059753418, "global_step": 130266, "epoch": 3101} {"train_loss": -6.628570556640625, "global_step": 130267, "epoch": 3101} {"train_loss": -6.497332572937012, "global_step": 130268, "epoch": 3101} {"train_loss": -6.494452476501465, "global_step": 130269, "epoch": 3101} {"train_loss": -6.637730121612549, "global_step": 130270, "epoch": 3101} {"train_loss": -6.637075424194336, "global_step": 130271, "epoch": 3101} {"train_loss": -6.536298751831055, "global_step": 130272, "epoch": 3101} {"train_loss": -6.611047267913818, "global_step": 130273, "epoch": 3101} {"train_loss": -6.45207405090332, "global_step": 130274, "epoch": 3101} {"train_loss": -6.657596588134766, "global_step": 130275, "epoch": 3101} {"train_loss": -6.665737152099609, "global_step": 130276, "epoch": 3101} {"train_loss": -6.645621299743652, "global_step": 130277, "epoch": 3101} {"train_loss": -6.6996541023254395, "global_step": 130278, "epoch": 3101} {"train_loss": -6.609321594238281, "global_step": 130279, "epoch": 3101} {"train_loss": -6.645326614379883, "global_step": 130280, "epoch": 3101} {"train_loss": -6.579800128936768, "global_step": 130281, "epoch": 3101} {"train_loss": -6.719036102294922, "global_step": 130282, "epoch": 3101} {"train_loss": -6.5981544199444, "global_step": 130283, "epoch": 3101, "val_loss": 68154.0625} {"train_loss": -6.587420463562012, "global_step": 130284, "epoch": 3102} {"train_loss": -6.627590179443359, "global_step": 130285, "epoch": 3102} {"train_loss": -6.626773834228516, "global_step": 130286, "epoch": 3102} {"train_loss": -6.616586685180664, "global_step": 130287, "epoch": 3102} {"train_loss": -6.522974967956543, "global_step": 130288, "epoch": 3102} {"train_loss": -6.621480941772461, "global_step": 130289, "epoch": 3102} {"train_loss": -6.5694780349731445, "global_step": 130290, "epoch": 3102} {"train_loss": -6.567344665527344, "global_step": 130291, "epoch": 3102} {"train_loss": -6.671733379364014, "global_step": 130292, "epoch": 3102} {"train_loss": -6.629499435424805, "global_step": 130293, "epoch": 3102} {"train_loss": -6.561431884765625, "global_step": 130294, "epoch": 3102} {"train_loss": -6.7749223709106445, "global_step": 130295, "epoch": 3102} {"train_loss": -6.646392822265625, "global_step": 130296, "epoch": 3102} {"train_loss": -6.669232368469238, "global_step": 130297, "epoch": 3102} {"train_loss": -6.606889724731445, "global_step": 130298, "epoch": 3102} {"train_loss": -6.620072364807129, "global_step": 130299, "epoch": 3102} {"train_loss": -6.6788330078125, "global_step": 130300, "epoch": 3102} {"train_loss": -6.601518630981445, "global_step": 130301, "epoch": 3102} {"train_loss": -6.6354241371154785, "global_step": 130302, "epoch": 3102} {"train_loss": -6.595951080322266, "global_step": 130303, "epoch": 3102} {"train_loss": -6.6554975509643555, "global_step": 130304, "epoch": 3102} {"train_loss": -6.628345012664795, "global_step": 130305, "epoch": 3102} {"train_loss": -6.511831283569336, "global_step": 130306, "epoch": 3102} {"train_loss": -6.56510066986084, "global_step": 130307, "epoch": 3102} {"train_loss": -6.733342170715332, "global_step": 130308, "epoch": 3102} {"train_loss": -6.6689372062683105, "global_step": 130309, "epoch": 3102} {"train_loss": -6.607345104217529, "global_step": 130310, "epoch": 3102} {"train_loss": -6.5593485832214355, "global_step": 130311, "epoch": 3102} {"train_loss": -6.682806491851807, "global_step": 130312, "epoch": 3102} {"train_loss": -6.614642143249512, "global_step": 130313, "epoch": 3102} {"train_loss": -6.6589250564575195, "global_step": 130314, "epoch": 3102} {"train_loss": -6.708783149719238, "global_step": 130315, "epoch": 3102} {"train_loss": -6.695281982421875, "global_step": 130316, "epoch": 3102} {"train_loss": -6.636475563049316, "global_step": 130317, "epoch": 3102} {"train_loss": -6.672693252563477, "global_step": 130318, "epoch": 3102} {"train_loss": -6.536995887756348, "global_step": 130319, "epoch": 3102} {"train_loss": -6.679690837860107, "global_step": 130320, "epoch": 3102} {"train_loss": -6.671341419219971, "global_step": 130321, "epoch": 3102} {"train_loss": -6.78696346282959, "global_step": 130322, "epoch": 3102} {"train_loss": -6.747589588165283, "global_step": 130323, "epoch": 3102} {"train_loss": -6.665553569793701, "global_step": 130324, "epoch": 3102} {"train_loss": -6.636249723888579, "global_step": 130325, "epoch": 3102, "val_loss": 68080.0625} {"train_loss": -6.674047470092773, "global_step": 130326, "epoch": 3103} {"train_loss": -6.765324115753174, "global_step": 130327, "epoch": 3103} {"train_loss": -6.658718109130859, "global_step": 130328, "epoch": 3103} {"train_loss": -6.731333255767822, "global_step": 130329, "epoch": 3103} {"train_loss": -6.7695159912109375, "global_step": 130330, "epoch": 3103} {"train_loss": -6.6389923095703125, "global_step": 130331, "epoch": 3103} {"train_loss": -6.736767768859863, "global_step": 130332, "epoch": 3103} {"train_loss": -6.707757472991943, "global_step": 130333, "epoch": 3103} {"train_loss": -6.7144646644592285, "global_step": 130334, "epoch": 3103} {"train_loss": -6.696534633636475, "global_step": 130335, "epoch": 3103} {"train_loss": -6.678894519805908, "global_step": 130336, "epoch": 3103} {"train_loss": -6.637096405029297, "global_step": 130337, "epoch": 3103} {"train_loss": -6.670008659362793, "global_step": 130338, "epoch": 3103} {"train_loss": -6.696245193481445, "global_step": 130339, "epoch": 3103} {"train_loss": -6.751175880432129, "global_step": 130340, "epoch": 3103} {"train_loss": -6.811662197113037, "global_step": 130341, "epoch": 3103} {"train_loss": -6.66571044921875, "global_step": 130342, "epoch": 3103} {"train_loss": -6.685856819152832, "global_step": 130343, "epoch": 3103} {"train_loss": -6.657961845397949, "global_step": 130344, "epoch": 3103} {"train_loss": -6.621054172515869, "global_step": 130345, "epoch": 3103} {"train_loss": -6.559905529022217, "global_step": 130346, "epoch": 3103} {"train_loss": -6.714839935302734, "global_step": 130347, "epoch": 3103} {"train_loss": -6.576611042022705, "global_step": 130348, "epoch": 3103} {"train_loss": -6.626195907592773, "global_step": 130349, "epoch": 3103} {"train_loss": -6.582760334014893, "global_step": 130350, "epoch": 3103} {"train_loss": -6.70112943649292, "global_step": 130351, "epoch": 3103} {"train_loss": -6.5696306228637695, "global_step": 130352, "epoch": 3103} {"train_loss": -6.614187240600586, "global_step": 130353, "epoch": 3103} {"train_loss": -6.636969089508057, "global_step": 130354, "epoch": 3103} {"train_loss": -6.626978397369385, "global_step": 130355, "epoch": 3103} {"train_loss": -6.560324192047119, "global_step": 130356, "epoch": 3103} {"train_loss": -6.642065048217773, "global_step": 130357, "epoch": 3103} {"train_loss": -6.529192924499512, "global_step": 130358, "epoch": 3103} {"train_loss": -6.563413143157959, "global_step": 130359, "epoch": 3103} {"train_loss": -6.581630706787109, "global_step": 130360, "epoch": 3103} {"train_loss": -6.4531049728393555, "global_step": 130361, "epoch": 3103} {"train_loss": -6.620388507843018, "global_step": 130362, "epoch": 3103} {"train_loss": -6.5759806632995605, "global_step": 130363, "epoch": 3103} {"train_loss": -6.627508163452148, "global_step": 130364, "epoch": 3103} {"train_loss": -6.539185523986816, "global_step": 130365, "epoch": 3103} {"train_loss": -6.610280990600586, "global_step": 130366, "epoch": 3103} {"train_loss": -6.647532338187808, "global_step": 130367, "epoch": 3103, "val_loss": 68165.828125} {"train_loss": -6.562626361846924, "global_step": 130368, "epoch": 3104} {"train_loss": -6.623401641845703, "global_step": 130369, "epoch": 3104} {"train_loss": -6.657003402709961, "global_step": 130370, "epoch": 3104} {"train_loss": -6.583915710449219, "global_step": 130371, "epoch": 3104} {"train_loss": -6.624322891235352, "global_step": 130372, "epoch": 3104} {"train_loss": -6.573798179626465, "global_step": 130373, "epoch": 3104} {"train_loss": -6.604536056518555, "global_step": 130374, "epoch": 3104} {"train_loss": -6.576639652252197, "global_step": 130375, "epoch": 3104} {"train_loss": -6.635420799255371, "global_step": 130376, "epoch": 3104} {"train_loss": -6.708217144012451, "global_step": 130377, "epoch": 3104} {"train_loss": -6.608987331390381, "global_step": 130378, "epoch": 3104} {"train_loss": -6.6002421379089355, "global_step": 130379, "epoch": 3104} {"train_loss": -6.591250896453857, "global_step": 130380, "epoch": 3104} {"train_loss": -6.675464630126953, "global_step": 130381, "epoch": 3104} {"train_loss": -6.538295745849609, "global_step": 130382, "epoch": 3104} {"train_loss": -6.7153425216674805, "global_step": 130383, "epoch": 3104} {"train_loss": -6.734114646911621, "global_step": 130384, "epoch": 3104} {"train_loss": -6.517436504364014, "global_step": 130385, "epoch": 3104} {"train_loss": -6.596183776855469, "global_step": 130386, "epoch": 3104} {"train_loss": -6.654930114746094, "global_step": 130387, "epoch": 3104} {"train_loss": -6.5864667892456055, "global_step": 130388, "epoch": 3104} {"train_loss": -6.616682529449463, "global_step": 130389, "epoch": 3104} {"train_loss": -6.701295375823975, "global_step": 130390, "epoch": 3104} {"train_loss": -6.598442554473877, "global_step": 130391, "epoch": 3104} {"train_loss": -6.649706840515137, "global_step": 130392, "epoch": 3104} {"train_loss": -6.574071884155273, "global_step": 130393, "epoch": 3104} {"train_loss": -6.689866542816162, "global_step": 130394, "epoch": 3104} {"train_loss": -6.61808443069458, "global_step": 130395, "epoch": 3104} {"train_loss": -6.614504814147949, "global_step": 130396, "epoch": 3104} {"train_loss": -6.5868144035339355, "global_step": 130397, "epoch": 3104} {"train_loss": -6.656713485717773, "global_step": 130398, "epoch": 3104} {"train_loss": -6.63054084777832, "global_step": 130399, "epoch": 3104} {"train_loss": -6.684543132781982, "global_step": 130400, "epoch": 3104} {"train_loss": -6.594594478607178, "global_step": 130401, "epoch": 3104} {"train_loss": -6.525686264038086, "global_step": 130402, "epoch": 3104} {"train_loss": -6.652093410491943, "global_step": 130403, "epoch": 3104} {"train_loss": -6.6531662940979, "global_step": 130404, "epoch": 3104} {"train_loss": -6.5633320808410645, "global_step": 130405, "epoch": 3104} {"train_loss": -6.610360145568848, "global_step": 130406, "epoch": 3104} {"train_loss": -6.732367515563965, "global_step": 130407, "epoch": 3104} {"train_loss": -6.806281089782715, "global_step": 130408, "epoch": 3104} {"train_loss": -6.6291184425354, "global_step": 130409, "epoch": 3104, "val_loss": 68243.984375} {"train_loss": -6.719823837280273, "global_step": 130410, "epoch": 3105} {"train_loss": -6.668354034423828, "global_step": 130411, "epoch": 3105} {"train_loss": -6.6538896560668945, "global_step": 130412, "epoch": 3105} {"train_loss": -6.646143913269043, "global_step": 130413, "epoch": 3105} {"train_loss": -6.577485084533691, "global_step": 130414, "epoch": 3105} {"train_loss": -6.572396755218506, "global_step": 130415, "epoch": 3105} {"train_loss": -6.6521100997924805, "global_step": 130416, "epoch": 3105} {"train_loss": -6.650857448577881, "global_step": 130417, "epoch": 3105} {"train_loss": -6.690075397491455, "global_step": 130418, "epoch": 3105} {"train_loss": -6.539036750793457, "global_step": 130419, "epoch": 3105} {"train_loss": -6.61541223526001, "global_step": 130420, "epoch": 3105} {"train_loss": -6.6081461906433105, "global_step": 130421, "epoch": 3105} {"train_loss": -6.555506706237793, "global_step": 130422, "epoch": 3105} {"train_loss": -6.669528961181641, "global_step": 130423, "epoch": 3105} {"train_loss": -6.57205867767334, "global_step": 130424, "epoch": 3105} {"train_loss": -6.535022735595703, "global_step": 130425, "epoch": 3105} {"train_loss": -6.670022010803223, "global_step": 130426, "epoch": 3105} {"train_loss": -6.603209495544434, "global_step": 130427, "epoch": 3105} {"train_loss": -6.431227207183838, "global_step": 130428, "epoch": 3105} {"train_loss": -6.679140090942383, "global_step": 130429, "epoch": 3105} {"train_loss": -6.586144924163818, "global_step": 130430, "epoch": 3105} {"train_loss": -6.556370735168457, "global_step": 130431, "epoch": 3105} {"train_loss": -6.674132823944092, "global_step": 130432, "epoch": 3105} {"train_loss": -6.550507545471191, "global_step": 130433, "epoch": 3105} {"train_loss": -6.680240631103516, "global_step": 130434, "epoch": 3105} {"train_loss": -6.56593132019043, "global_step": 130435, "epoch": 3105} {"train_loss": -6.684379577636719, "global_step": 130436, "epoch": 3105} {"train_loss": -6.6369524002075195, "global_step": 130437, "epoch": 3105} {"train_loss": -6.668645858764648, "global_step": 130438, "epoch": 3105} {"train_loss": -6.678718566894531, "global_step": 130439, "epoch": 3105} {"train_loss": -6.574972152709961, "global_step": 130440, "epoch": 3105} {"train_loss": -6.509100914001465, "global_step": 130441, "epoch": 3105} {"train_loss": -6.784185886383057, "global_step": 130442, "epoch": 3105} {"train_loss": -6.605694770812988, "global_step": 130443, "epoch": 3105} {"train_loss": -6.693670272827148, "global_step": 130444, "epoch": 3105} {"train_loss": -6.617154121398926, "global_step": 130445, "epoch": 3105} {"train_loss": -6.6156182289123535, "global_step": 130446, "epoch": 3105} {"train_loss": -6.768214225769043, "global_step": 130447, "epoch": 3105} {"train_loss": -6.593121528625488, "global_step": 130448, "epoch": 3105} {"train_loss": -6.522701740264893, "global_step": 130449, "epoch": 3105} {"train_loss": -6.6278839111328125, "global_step": 130450, "epoch": 3105} {"train_loss": -6.618384463446481, "global_step": 130451, "epoch": 3105, "val_loss": 68193.015625} {"train_loss": -6.681694030761719, "global_step": 130452, "epoch": 3106} {"train_loss": -6.66954231262207, "global_step": 130453, "epoch": 3106} {"train_loss": -6.647055149078369, "global_step": 130454, "epoch": 3106} {"train_loss": -6.66812801361084, "global_step": 130455, "epoch": 3106} {"train_loss": -6.77925968170166, "global_step": 130456, "epoch": 3106} {"train_loss": -6.608708381652832, "global_step": 130457, "epoch": 3106} {"train_loss": -6.6810150146484375, "global_step": 130458, "epoch": 3106} {"train_loss": -6.704762935638428, "global_step": 130459, "epoch": 3106} {"train_loss": -6.667352676391602, "global_step": 130460, "epoch": 3106} {"train_loss": -6.6388068199157715, "global_step": 130461, "epoch": 3106} {"train_loss": -6.6418256759643555, "global_step": 130462, "epoch": 3106} {"train_loss": -6.559523582458496, "global_step": 130463, "epoch": 3106} {"train_loss": -6.740567207336426, "global_step": 130464, "epoch": 3106} {"train_loss": -6.72803258895874, "global_step": 130465, "epoch": 3106} {"train_loss": -6.746279239654541, "global_step": 130466, "epoch": 3106} {"train_loss": -6.641042709350586, "global_step": 130467, "epoch": 3106} {"train_loss": -6.683470726013184, "global_step": 130468, "epoch": 3106} {"train_loss": -6.726885795593262, "global_step": 130469, "epoch": 3106} {"train_loss": -6.6690874099731445, "global_step": 130470, "epoch": 3106} {"train_loss": -6.608196258544922, "global_step": 130471, "epoch": 3106} {"train_loss": -6.6472086906433105, "global_step": 130472, "epoch": 3106} {"train_loss": -6.643321990966797, "global_step": 130473, "epoch": 3106} {"train_loss": -6.779598236083984, "global_step": 130474, "epoch": 3106} {"train_loss": -6.718031883239746, "global_step": 130475, "epoch": 3106} {"train_loss": -6.690358638763428, "global_step": 130476, "epoch": 3106} {"train_loss": -6.642120361328125, "global_step": 130477, "epoch": 3106} {"train_loss": -6.69293737411499, "global_step": 130478, "epoch": 3106} {"train_loss": -6.687305450439453, "global_step": 130479, "epoch": 3106} {"train_loss": -6.736001014709473, "global_step": 130480, "epoch": 3106} {"train_loss": -6.712277412414551, "global_step": 130481, "epoch": 3106} {"train_loss": -6.597407341003418, "global_step": 130482, "epoch": 3106} {"train_loss": -6.696606159210205, "global_step": 130483, "epoch": 3106} {"train_loss": -6.569974899291992, "global_step": 130484, "epoch": 3106} {"train_loss": -6.663949012756348, "global_step": 130485, "epoch": 3106} {"train_loss": -6.5815558433532715, "global_step": 130486, "epoch": 3106} {"train_loss": -6.519711494445801, "global_step": 130487, "epoch": 3106} {"train_loss": -6.5256547927856445, "global_step": 130488, "epoch": 3106} {"train_loss": -6.728177070617676, "global_step": 130489, "epoch": 3106} {"train_loss": -6.556651592254639, "global_step": 130490, "epoch": 3106} {"train_loss": -6.605348110198975, "global_step": 130491, "epoch": 3106} {"train_loss": -6.567843914031982, "global_step": 130492, "epoch": 3106} {"train_loss": -6.657970507939656, "global_step": 130493, "epoch": 3106, "val_loss": 68114.71875} {"train_loss": -6.693082809448242, "global_step": 130494, "epoch": 3107} {"train_loss": -6.490485668182373, "global_step": 130495, "epoch": 3107} {"train_loss": -6.532359600067139, "global_step": 130496, "epoch": 3107} {"train_loss": -6.536416053771973, "global_step": 130497, "epoch": 3107} {"train_loss": -6.544353008270264, "global_step": 130498, "epoch": 3107} {"train_loss": -6.594637870788574, "global_step": 130499, "epoch": 3107} {"train_loss": -6.545162200927734, "global_step": 130500, "epoch": 3107} {"train_loss": -6.67359733581543, "global_step": 130501, "epoch": 3107} {"train_loss": -6.543688774108887, "global_step": 130502, "epoch": 3107} {"train_loss": -6.593929767608643, "global_step": 130503, "epoch": 3107} {"train_loss": -6.539649963378906, "global_step": 130504, "epoch": 3107} {"train_loss": -6.456873416900635, "global_step": 130505, "epoch": 3107} {"train_loss": -6.629347801208496, "global_step": 130506, "epoch": 3107} {"train_loss": -6.364156246185303, "global_step": 130507, "epoch": 3107} {"train_loss": -6.554386138916016, "global_step": 130508, "epoch": 3107} {"train_loss": -6.3624067306518555, "global_step": 130509, "epoch": 3107} {"train_loss": -6.5735554695129395, "global_step": 130510, "epoch": 3107} {"train_loss": -6.546245574951172, "global_step": 130511, "epoch": 3107} {"train_loss": -6.622065544128418, "global_step": 130512, "epoch": 3107} {"train_loss": -6.333970546722412, "global_step": 130513, "epoch": 3107} {"train_loss": -6.652009963989258, "global_step": 130514, "epoch": 3107} {"train_loss": -6.383597373962402, "global_step": 130515, "epoch": 3107} {"train_loss": -6.588563442230225, "global_step": 130516, "epoch": 3107} {"train_loss": -6.479855537414551, "global_step": 130517, "epoch": 3107} {"train_loss": -6.696120738983154, "global_step": 130518, "epoch": 3107} {"train_loss": -6.575811386108398, "global_step": 130519, "epoch": 3107} {"train_loss": -6.662693977355957, "global_step": 130520, "epoch": 3107} {"train_loss": -6.576160430908203, "global_step": 130521, "epoch": 3107} {"train_loss": -6.601899147033691, "global_step": 130522, "epoch": 3107} {"train_loss": -6.683189392089844, "global_step": 130523, "epoch": 3107} {"train_loss": -6.617201328277588, "global_step": 130524, "epoch": 3107} {"train_loss": -6.536674499511719, "global_step": 130525, "epoch": 3107} {"train_loss": -6.661263942718506, "global_step": 130526, "epoch": 3107} {"train_loss": -6.506044387817383, "global_step": 130527, "epoch": 3107} {"train_loss": -6.544008255004883, "global_step": 130528, "epoch": 3107} {"train_loss": -6.573014736175537, "global_step": 130529, "epoch": 3107} {"train_loss": -6.567567825317383, "global_step": 130530, "epoch": 3107} {"train_loss": -6.532273292541504, "global_step": 130531, "epoch": 3107} {"train_loss": -6.430544376373291, "global_step": 130532, "epoch": 3107} {"train_loss": -6.616569995880127, "global_step": 130533, "epoch": 3107} {"train_loss": -6.477801322937012, "global_step": 130534, "epoch": 3107} {"train_loss": -6.555742649804978, "global_step": 130535, "epoch": 3107, "val_loss": 68273.9375} {"train_loss": -6.654053688049316, "global_step": 130536, "epoch": 3108} {"train_loss": -6.542503833770752, "global_step": 130537, "epoch": 3108} {"train_loss": -6.651540756225586, "global_step": 130538, "epoch": 3108} {"train_loss": -6.581524848937988, "global_step": 130539, "epoch": 3108} {"train_loss": -6.715959548950195, "global_step": 130540, "epoch": 3108} {"train_loss": -6.637448310852051, "global_step": 130541, "epoch": 3108} {"train_loss": -6.680726051330566, "global_step": 130542, "epoch": 3108} {"train_loss": -6.607730865478516, "global_step": 130543, "epoch": 3108} {"train_loss": -6.675374984741211, "global_step": 130544, "epoch": 3108} {"train_loss": -6.628876686096191, "global_step": 130545, "epoch": 3108} {"train_loss": -6.676478385925293, "global_step": 130546, "epoch": 3108} {"train_loss": -6.666780471801758, "global_step": 130547, "epoch": 3108} {"train_loss": -6.590616703033447, "global_step": 130548, "epoch": 3108} {"train_loss": -6.660384178161621, "global_step": 130549, "epoch": 3108} {"train_loss": -6.647454261779785, "global_step": 130550, "epoch": 3108} {"train_loss": -6.696837902069092, "global_step": 130551, "epoch": 3108} {"train_loss": -6.82163143157959, "global_step": 130552, "epoch": 3108} {"train_loss": -6.6609039306640625, "global_step": 130553, "epoch": 3108} {"train_loss": -6.8517255783081055, "global_step": 130554, "epoch": 3108} {"train_loss": -6.66598653793335, "global_step": 130555, "epoch": 3108} {"train_loss": -6.6817851066589355, "global_step": 130556, "epoch": 3108} {"train_loss": -6.736578464508057, "global_step": 130557, "epoch": 3108} {"train_loss": -6.702908515930176, "global_step": 130558, "epoch": 3108} {"train_loss": -6.711080551147461, "global_step": 130559, "epoch": 3108} {"train_loss": -6.688740253448486, "global_step": 130560, "epoch": 3108} {"train_loss": -6.650972366333008, "global_step": 130561, "epoch": 3108} {"train_loss": -6.637714862823486, "global_step": 130562, "epoch": 3108} {"train_loss": -6.7354912757873535, "global_step": 130563, "epoch": 3108} {"train_loss": -6.585131645202637, "global_step": 130564, "epoch": 3108} {"train_loss": -6.661873817443848, "global_step": 130565, "epoch": 3108} {"train_loss": -6.708558082580566, "global_step": 130566, "epoch": 3108} {"train_loss": -6.693441867828369, "global_step": 130567, "epoch": 3108} {"train_loss": -6.690749168395996, "global_step": 130568, "epoch": 3108} {"train_loss": -6.814910888671875, "global_step": 130569, "epoch": 3108} {"train_loss": -6.679617881774902, "global_step": 130570, "epoch": 3108} {"train_loss": -6.606625556945801, "global_step": 130571, "epoch": 3108} {"train_loss": -6.59471321105957, "global_step": 130572, "epoch": 3108} {"train_loss": -6.632421970367432, "global_step": 130573, "epoch": 3108} {"train_loss": -6.627793788909912, "global_step": 130574, "epoch": 3108} {"train_loss": -6.7863874435424805, "global_step": 130575, "epoch": 3108} {"train_loss": -6.675771713256836, "global_step": 130576, "epoch": 3108} {"train_loss": -6.673707610084897, "global_step": 130577, "epoch": 3108, "val_loss": 67912.9140625} {"train_loss": -6.674129009246826, "global_step": 130578, "epoch": 3109} {"train_loss": -6.620302677154541, "global_step": 130579, "epoch": 3109} {"train_loss": -6.722431659698486, "global_step": 130580, "epoch": 3109} {"train_loss": -6.634772777557373, "global_step": 130581, "epoch": 3109} {"train_loss": -6.745434761047363, "global_step": 130582, "epoch": 3109} {"train_loss": -6.671472549438477, "global_step": 130583, "epoch": 3109} {"train_loss": -6.679469585418701, "global_step": 130584, "epoch": 3109} {"train_loss": -6.680655479431152, "global_step": 130585, "epoch": 3109} {"train_loss": -6.524568557739258, "global_step": 130586, "epoch": 3109} {"train_loss": -6.6053547859191895, "global_step": 130587, "epoch": 3109} {"train_loss": -6.691470146179199, "global_step": 130588, "epoch": 3109} {"train_loss": -6.587819576263428, "global_step": 130589, "epoch": 3109} {"train_loss": -6.600221633911133, "global_step": 130590, "epoch": 3109} {"train_loss": -6.696583271026611, "global_step": 130591, "epoch": 3109} {"train_loss": -6.710148811340332, "global_step": 130592, "epoch": 3109} {"train_loss": -6.620492458343506, "global_step": 130593, "epoch": 3109} {"train_loss": -6.690199851989746, "global_step": 130594, "epoch": 3109} {"train_loss": -6.627605438232422, "global_step": 130595, "epoch": 3109} {"train_loss": -6.577816009521484, "global_step": 130596, "epoch": 3109} {"train_loss": -6.576949596405029, "global_step": 130597, "epoch": 3109} {"train_loss": -6.585262298583984, "global_step": 130598, "epoch": 3109} {"train_loss": -6.622143745422363, "global_step": 130599, "epoch": 3109} {"train_loss": -6.591946601867676, "global_step": 130600, "epoch": 3109} {"train_loss": -6.716567039489746, "global_step": 130601, "epoch": 3109} {"train_loss": -6.565212726593018, "global_step": 130602, "epoch": 3109} {"train_loss": -6.565211296081543, "global_step": 130603, "epoch": 3109} {"train_loss": -6.626940727233887, "global_step": 130604, "epoch": 3109} {"train_loss": -6.571053504943848, "global_step": 130605, "epoch": 3109} {"train_loss": -6.43189811706543, "global_step": 130606, "epoch": 3109} {"train_loss": -6.597492218017578, "global_step": 130607, "epoch": 3109} {"train_loss": -6.5530500411987305, "global_step": 130608, "epoch": 3109} {"train_loss": -6.510043621063232, "global_step": 130609, "epoch": 3109} {"train_loss": -6.584895133972168, "global_step": 130610, "epoch": 3109} {"train_loss": -6.590539932250977, "global_step": 130611, "epoch": 3109} {"train_loss": -6.627591133117676, "global_step": 130612, "epoch": 3109} {"train_loss": -6.581247329711914, "global_step": 130613, "epoch": 3109} {"train_loss": -6.566116809844971, "global_step": 130614, "epoch": 3109} {"train_loss": -6.562388896942139, "global_step": 130615, "epoch": 3109} {"train_loss": -6.780044078826904, "global_step": 130616, "epoch": 3109} {"train_loss": -6.6717376708984375, "global_step": 130617, "epoch": 3109} {"train_loss": -6.582020282745361, "global_step": 130618, "epoch": 3109} {"train_loss": -6.621661833354405, "global_step": 130619, "epoch": 3109, "val_loss": 68263.515625} {"train_loss": -6.726539611816406, "global_step": 130620, "epoch": 3110} {"train_loss": -6.6346659660339355, "global_step": 130621, "epoch": 3110} {"train_loss": -6.542448997497559, "global_step": 130622, "epoch": 3110} {"train_loss": -6.569218635559082, "global_step": 130623, "epoch": 3110} {"train_loss": -6.566875457763672, "global_step": 130624, "epoch": 3110} {"train_loss": -6.635032653808594, "global_step": 130625, "epoch": 3110} {"train_loss": -6.727474212646484, "global_step": 130626, "epoch": 3110} {"train_loss": -6.4806718826293945, "global_step": 130627, "epoch": 3110} {"train_loss": -6.623166084289551, "global_step": 130628, "epoch": 3110} {"train_loss": -6.570687770843506, "global_step": 130629, "epoch": 3110} {"train_loss": -6.5553741455078125, "global_step": 130630, "epoch": 3110} {"train_loss": -6.534180641174316, "global_step": 130631, "epoch": 3110} {"train_loss": -6.579154968261719, "global_step": 130632, "epoch": 3110} {"train_loss": -6.484801769256592, "global_step": 130633, "epoch": 3110} {"train_loss": -6.373702049255371, "global_step": 130634, "epoch": 3110} {"train_loss": -6.597143650054932, "global_step": 130635, "epoch": 3110} {"train_loss": -6.4684247970581055, "global_step": 130636, "epoch": 3110} {"train_loss": -6.619207382202148, "global_step": 130637, "epoch": 3110} {"train_loss": -6.5763258934021, "global_step": 130638, "epoch": 3110} {"train_loss": -6.590364456176758, "global_step": 130639, "epoch": 3110} {"train_loss": -6.589770317077637, "global_step": 130640, "epoch": 3110} {"train_loss": -6.525775909423828, "global_step": 130641, "epoch": 3110} {"train_loss": -6.614024639129639, "global_step": 130642, "epoch": 3110} {"train_loss": -6.679043769836426, "global_step": 130643, "epoch": 3110} {"train_loss": -6.618828773498535, "global_step": 130644, "epoch": 3110} {"train_loss": -6.6849365234375, "global_step": 130645, "epoch": 3110} {"train_loss": -6.508942604064941, "global_step": 130646, "epoch": 3110} {"train_loss": -6.555332183837891, "global_step": 130647, "epoch": 3110} {"train_loss": -6.617655277252197, "global_step": 130648, "epoch": 3110} {"train_loss": -6.5903000831604, "global_step": 130649, "epoch": 3110} {"train_loss": -6.765613555908203, "global_step": 130650, "epoch": 3110} {"train_loss": -6.643064498901367, "global_step": 130651, "epoch": 3110} {"train_loss": -6.655674934387207, "global_step": 130652, "epoch": 3110} {"train_loss": -6.610044956207275, "global_step": 130653, "epoch": 3110} {"train_loss": -6.648347854614258, "global_step": 130654, "epoch": 3110} {"train_loss": -6.6828765869140625, "global_step": 130655, "epoch": 3110} {"train_loss": -6.452117919921875, "global_step": 130656, "epoch": 3110} {"train_loss": -6.566648483276367, "global_step": 130657, "epoch": 3110} {"train_loss": -6.7157440185546875, "global_step": 130658, "epoch": 3110} {"train_loss": -6.600955486297607, "global_step": 130659, "epoch": 3110} {"train_loss": -6.589180946350098, "global_step": 130660, "epoch": 3110} {"train_loss": -6.595278172265916, "global_step": 130661, "epoch": 3110, "val_loss": 68155.3359375} {"train_loss": -6.569780349731445, "global_step": 130662, "epoch": 3111} {"train_loss": -6.6443071365356445, "global_step": 130663, "epoch": 3111} {"train_loss": -6.68928861618042, "global_step": 130664, "epoch": 3111} {"train_loss": -6.577592372894287, "global_step": 130665, "epoch": 3111} {"train_loss": -6.543547630310059, "global_step": 130666, "epoch": 3111} {"train_loss": -6.5938520431518555, "global_step": 130667, "epoch": 3111} {"train_loss": -6.556578636169434, "global_step": 130668, "epoch": 3111} {"train_loss": -6.6134843826293945, "global_step": 130669, "epoch": 3111} {"train_loss": -6.6428937911987305, "global_step": 130670, "epoch": 3111} {"train_loss": -6.513384819030762, "global_step": 130671, "epoch": 3111} {"train_loss": -6.670368194580078, "global_step": 130672, "epoch": 3111} {"train_loss": -6.696926116943359, "global_step": 130673, "epoch": 3111} {"train_loss": -6.691198825836182, "global_step": 130674, "epoch": 3111} {"train_loss": -6.591927528381348, "global_step": 130675, "epoch": 3111} {"train_loss": -6.634990692138672, "global_step": 130676, "epoch": 3111} {"train_loss": -6.664588451385498, "global_step": 130677, "epoch": 3111} {"train_loss": -6.708472728729248, "global_step": 130678, "epoch": 3111} {"train_loss": -6.551060199737549, "global_step": 130679, "epoch": 3111} {"train_loss": -6.687154293060303, "global_step": 130680, "epoch": 3111} {"train_loss": -6.593447208404541, "global_step": 130681, "epoch": 3111} {"train_loss": -6.652691841125488, "global_step": 130682, "epoch": 3111} {"train_loss": -6.758452415466309, "global_step": 130683, "epoch": 3111} {"train_loss": -6.6062469482421875, "global_step": 130684, "epoch": 3111} {"train_loss": -6.67466926574707, "global_step": 130685, "epoch": 3111} {"train_loss": -6.779521942138672, "global_step": 130686, "epoch": 3111} {"train_loss": -6.768810272216797, "global_step": 130687, "epoch": 3111} {"train_loss": -6.67591667175293, "global_step": 130688, "epoch": 3111} {"train_loss": -6.794512748718262, "global_step": 130689, "epoch": 3111} {"train_loss": -6.703833103179932, "global_step": 130690, "epoch": 3111} {"train_loss": -6.704312324523926, "global_step": 130691, "epoch": 3111} {"train_loss": -6.698204040527344, "global_step": 130692, "epoch": 3111} {"train_loss": -6.645709991455078, "global_step": 130693, "epoch": 3111} {"train_loss": -6.623238563537598, "global_step": 130694, "epoch": 3111} {"train_loss": -6.61385440826416, "global_step": 130695, "epoch": 3111} {"train_loss": -6.73099422454834, "global_step": 130696, "epoch": 3111} {"train_loss": -6.586294174194336, "global_step": 130697, "epoch": 3111} {"train_loss": -6.628098487854004, "global_step": 130698, "epoch": 3111} {"train_loss": -6.504909515380859, "global_step": 130699, "epoch": 3111} {"train_loss": -6.591638565063477, "global_step": 130700, "epoch": 3111} {"train_loss": -6.494852542877197, "global_step": 130701, "epoch": 3111} {"train_loss": -6.5929765701293945, "global_step": 130702, "epoch": 3111} {"train_loss": -6.638269106547038, "global_step": 130703, "epoch": 3111, "val_loss": 68144.34375} {"train_loss": -6.6158976554870605, "global_step": 130704, "epoch": 3112} {"train_loss": -6.564004898071289, "global_step": 130705, "epoch": 3112} {"train_loss": -6.598625183105469, "global_step": 130706, "epoch": 3112} {"train_loss": -6.477241039276123, "global_step": 130707, "epoch": 3112} {"train_loss": -6.672238349914551, "global_step": 130708, "epoch": 3112} {"train_loss": -6.615615367889404, "global_step": 130709, "epoch": 3112} {"train_loss": -6.567525386810303, "global_step": 130710, "epoch": 3112} {"train_loss": -6.570241451263428, "global_step": 130711, "epoch": 3112} {"train_loss": -6.589353561401367, "global_step": 130712, "epoch": 3112} {"train_loss": -6.502828598022461, "global_step": 130713, "epoch": 3112} {"train_loss": -6.60090446472168, "global_step": 130714, "epoch": 3112} {"train_loss": -6.641458511352539, "global_step": 130715, "epoch": 3112} {"train_loss": -6.577234268188477, "global_step": 130716, "epoch": 3112} {"train_loss": -6.624267578125, "global_step": 130717, "epoch": 3112} {"train_loss": -6.630171298980713, "global_step": 130718, "epoch": 3112} {"train_loss": -6.7446489334106445, "global_step": 130719, "epoch": 3112} {"train_loss": -6.631092071533203, "global_step": 130720, "epoch": 3112} {"train_loss": -6.562897682189941, "global_step": 130721, "epoch": 3112} {"train_loss": -6.62991189956665, "global_step": 130722, "epoch": 3112} {"train_loss": -6.653505802154541, "global_step": 130723, "epoch": 3112} {"train_loss": -6.697455883026123, "global_step": 130724, "epoch": 3112} {"train_loss": -6.676972389221191, "global_step": 130725, "epoch": 3112} {"train_loss": -6.688936710357666, "global_step": 130726, "epoch": 3112} {"train_loss": -6.5401787757873535, "global_step": 130727, "epoch": 3112} {"train_loss": -6.703475475311279, "global_step": 130728, "epoch": 3112} {"train_loss": -6.663248062133789, "global_step": 130729, "epoch": 3112} {"train_loss": -6.631208419799805, "global_step": 130730, "epoch": 3112} {"train_loss": -6.6354289054870605, "global_step": 130731, "epoch": 3112} {"train_loss": -6.656991004943848, "global_step": 130732, "epoch": 3112} {"train_loss": -6.60076904296875, "global_step": 130733, "epoch": 3112} {"train_loss": -6.661748886108398, "global_step": 130734, "epoch": 3112} {"train_loss": -6.654844284057617, "global_step": 130735, "epoch": 3112} {"train_loss": -6.602000713348389, "global_step": 130736, "epoch": 3112} {"train_loss": -6.6453399658203125, "global_step": 130737, "epoch": 3112} {"train_loss": -6.699177265167236, "global_step": 130738, "epoch": 3112} {"train_loss": -6.670917987823486, "global_step": 130739, "epoch": 3112} {"train_loss": -6.473887920379639, "global_step": 130740, "epoch": 3112} {"train_loss": -6.763511657714844, "global_step": 130741, "epoch": 3112} {"train_loss": -6.479339599609375, "global_step": 130742, "epoch": 3112} {"train_loss": -6.561018943786621, "global_step": 130743, "epoch": 3112} {"train_loss": -6.668956279754639, "global_step": 130744, "epoch": 3112} {"train_loss": -6.621496643338885, "global_step": 130745, "epoch": 3112, "val_loss": 68202.0390625} {"train_loss": -6.566987991333008, "global_step": 130746, "epoch": 3113} {"train_loss": -6.7056169509887695, "global_step": 130747, "epoch": 3113} {"train_loss": -6.673255920410156, "global_step": 130748, "epoch": 3113} {"train_loss": -6.690437316894531, "global_step": 130749, "epoch": 3113} {"train_loss": -6.7109832763671875, "global_step": 130750, "epoch": 3113} {"train_loss": -6.718387603759766, "global_step": 130751, "epoch": 3113} {"train_loss": -6.595828533172607, "global_step": 130752, "epoch": 3113} {"train_loss": -6.587879180908203, "global_step": 130753, "epoch": 3113} {"train_loss": -6.650712490081787, "global_step": 130754, "epoch": 3113} {"train_loss": -6.678943634033203, "global_step": 130755, "epoch": 3113} {"train_loss": -6.644845008850098, "global_step": 130756, "epoch": 3113} {"train_loss": -6.728564262390137, "global_step": 130757, "epoch": 3113} {"train_loss": -6.652890682220459, "global_step": 130758, "epoch": 3113} {"train_loss": -6.630779266357422, "global_step": 130759, "epoch": 3113} {"train_loss": -6.623689651489258, "global_step": 130760, "epoch": 3113} {"train_loss": -6.533958435058594, "global_step": 130761, "epoch": 3113} {"train_loss": -6.73016357421875, "global_step": 130762, "epoch": 3113} {"train_loss": -6.667503356933594, "global_step": 130763, "epoch": 3113} {"train_loss": -6.674927234649658, "global_step": 130764, "epoch": 3113} {"train_loss": -6.792874336242676, "global_step": 130765, "epoch": 3113} {"train_loss": -6.626514911651611, "global_step": 130766, "epoch": 3113} {"train_loss": -6.722786903381348, "global_step": 130767, "epoch": 3113} {"train_loss": -6.736757755279541, "global_step": 130768, "epoch": 3113} {"train_loss": -6.693304061889648, "global_step": 130769, "epoch": 3113} {"train_loss": -6.629238605499268, "global_step": 130770, "epoch": 3113} {"train_loss": -6.559509754180908, "global_step": 130771, "epoch": 3113} {"train_loss": -6.610329627990723, "global_step": 130772, "epoch": 3113} {"train_loss": -6.611875057220459, "global_step": 130773, "epoch": 3113} {"train_loss": -6.681771755218506, "global_step": 130774, "epoch": 3113} {"train_loss": -6.604766368865967, "global_step": 130775, "epoch": 3113} {"train_loss": -6.649461269378662, "global_step": 130776, "epoch": 3113} {"train_loss": -6.629782676696777, "global_step": 130777, "epoch": 3113} {"train_loss": -6.6057891845703125, "global_step": 130778, "epoch": 3113} {"train_loss": -6.681760787963867, "global_step": 130779, "epoch": 3113} {"train_loss": -6.713876724243164, "global_step": 130780, "epoch": 3113} {"train_loss": -6.7381181716918945, "global_step": 130781, "epoch": 3113} {"train_loss": -6.5924296379089355, "global_step": 130782, "epoch": 3113} {"train_loss": -6.662940979003906, "global_step": 130783, "epoch": 3113} {"train_loss": -6.654644966125488, "global_step": 130784, "epoch": 3113} {"train_loss": -6.71597146987915, "global_step": 130785, "epoch": 3113} {"train_loss": -6.578906536102295, "global_step": 130786, "epoch": 3113} {"train_loss": -6.658235300154913, "global_step": 130787, "epoch": 3113, "val_loss": 68314.53125} {"train_loss": -6.603472709655762, "global_step": 130788, "epoch": 3114} {"train_loss": -6.655277252197266, "global_step": 130789, "epoch": 3114} {"train_loss": -6.527812480926514, "global_step": 130790, "epoch": 3114} {"train_loss": -6.609058380126953, "global_step": 130791, "epoch": 3114} {"train_loss": -6.646121025085449, "global_step": 130792, "epoch": 3114} {"train_loss": -6.6223907470703125, "global_step": 130793, "epoch": 3114} {"train_loss": -6.7204084396362305, "global_step": 130794, "epoch": 3114} {"train_loss": -6.644373416900635, "global_step": 130795, "epoch": 3114} {"train_loss": -6.699356555938721, "global_step": 130796, "epoch": 3114} {"train_loss": -6.660909652709961, "global_step": 130797, "epoch": 3114} {"train_loss": -6.619755744934082, "global_step": 130798, "epoch": 3114} {"train_loss": -6.696796417236328, "global_step": 130799, "epoch": 3114} {"train_loss": -6.688652038574219, "global_step": 130800, "epoch": 3114} {"train_loss": -6.568970680236816, "global_step": 130801, "epoch": 3114} {"train_loss": -6.742556571960449, "global_step": 130802, "epoch": 3114} {"train_loss": -6.714393615722656, "global_step": 130803, "epoch": 3114} {"train_loss": -6.628854751586914, "global_step": 130804, "epoch": 3114} {"train_loss": -6.679973125457764, "global_step": 130805, "epoch": 3114} {"train_loss": -6.652533054351807, "global_step": 130806, "epoch": 3114} {"train_loss": -6.640897750854492, "global_step": 130807, "epoch": 3114} {"train_loss": -6.618443012237549, "global_step": 130808, "epoch": 3114} {"train_loss": -6.683550834655762, "global_step": 130809, "epoch": 3114} {"train_loss": -6.697514057159424, "global_step": 130810, "epoch": 3114} {"train_loss": -6.549182891845703, "global_step": 130811, "epoch": 3114} {"train_loss": -6.570030689239502, "global_step": 130812, "epoch": 3114} {"train_loss": -6.566498279571533, "global_step": 130813, "epoch": 3114} {"train_loss": -6.589491844177246, "global_step": 130814, "epoch": 3114} {"train_loss": -6.691659450531006, "global_step": 130815, "epoch": 3114} {"train_loss": -6.6204729080200195, "global_step": 130816, "epoch": 3114} {"train_loss": -6.490355968475342, "global_step": 130817, "epoch": 3114} {"train_loss": -6.584348201751709, "global_step": 130818, "epoch": 3114} {"train_loss": -6.502017974853516, "global_step": 130819, "epoch": 3114} {"train_loss": -6.642515182495117, "global_step": 130820, "epoch": 3114} {"train_loss": -6.547800064086914, "global_step": 130821, "epoch": 3114} {"train_loss": -6.53460693359375, "global_step": 130822, "epoch": 3114} {"train_loss": -6.647859573364258, "global_step": 130823, "epoch": 3114} {"train_loss": -6.47463321685791, "global_step": 130824, "epoch": 3114} {"train_loss": -6.64646053314209, "global_step": 130825, "epoch": 3114} {"train_loss": -6.756092071533203, "global_step": 130826, "epoch": 3114} {"train_loss": -6.499232292175293, "global_step": 130827, "epoch": 3114} {"train_loss": -6.602512359619141, "global_step": 130828, "epoch": 3114} {"train_loss": -6.619093679246449, "global_step": 130829, "epoch": 3114, "val_loss": 68374.578125} {"train_loss": -6.500851154327393, "global_step": 130830, "epoch": 3115} {"train_loss": -6.750053882598877, "global_step": 130831, "epoch": 3115} {"train_loss": -6.5893659591674805, "global_step": 130832, "epoch": 3115} {"train_loss": -6.644268989562988, "global_step": 130833, "epoch": 3115} {"train_loss": -6.613410949707031, "global_step": 130834, "epoch": 3115} {"train_loss": -6.555763244628906, "global_step": 130835, "epoch": 3115} {"train_loss": -6.6947526931762695, "global_step": 130836, "epoch": 3115} {"train_loss": -6.580933570861816, "global_step": 130837, "epoch": 3115} {"train_loss": -6.622049331665039, "global_step": 130838, "epoch": 3115} {"train_loss": -6.513511657714844, "global_step": 130839, "epoch": 3115} {"train_loss": -6.638646602630615, "global_step": 130840, "epoch": 3115} {"train_loss": -6.737232208251953, "global_step": 130841, "epoch": 3115} {"train_loss": -6.6419806480407715, "global_step": 130842, "epoch": 3115} {"train_loss": -6.614188194274902, "global_step": 130843, "epoch": 3115} {"train_loss": -6.606686592102051, "global_step": 130844, "epoch": 3115} {"train_loss": -6.559664249420166, "global_step": 130845, "epoch": 3115} {"train_loss": -6.691776275634766, "global_step": 130846, "epoch": 3115} {"train_loss": -6.656208515167236, "global_step": 130847, "epoch": 3115} {"train_loss": -6.614599704742432, "global_step": 130848, "epoch": 3115} {"train_loss": -6.686078071594238, "global_step": 130849, "epoch": 3115} {"train_loss": -6.5641188621521, "global_step": 130850, "epoch": 3115} {"train_loss": -6.595175743103027, "global_step": 130851, "epoch": 3115} {"train_loss": -6.6386871337890625, "global_step": 130852, "epoch": 3115} {"train_loss": -6.604861736297607, "global_step": 130853, "epoch": 3115} {"train_loss": -6.6705851554870605, "global_step": 130854, "epoch": 3115} {"train_loss": -6.526298522949219, "global_step": 130855, "epoch": 3115} {"train_loss": -6.644103050231934, "global_step": 130856, "epoch": 3115} {"train_loss": -6.592006683349609, "global_step": 130857, "epoch": 3115} {"train_loss": -6.638272285461426, "global_step": 130858, "epoch": 3115} {"train_loss": -6.659353256225586, "global_step": 130859, "epoch": 3115} {"train_loss": -6.619868278503418, "global_step": 130860, "epoch": 3115} {"train_loss": -6.653832912445068, "global_step": 130861, "epoch": 3115} {"train_loss": -6.5465779304504395, "global_step": 130862, "epoch": 3115} {"train_loss": -6.5819854736328125, "global_step": 130863, "epoch": 3115} {"train_loss": -6.666095733642578, "global_step": 130864, "epoch": 3115} {"train_loss": -6.498146057128906, "global_step": 130865, "epoch": 3115} {"train_loss": -6.543517589569092, "global_step": 130866, "epoch": 3115} {"train_loss": -6.679337501525879, "global_step": 130867, "epoch": 3115} {"train_loss": -6.5430588722229, "global_step": 130868, "epoch": 3115} {"train_loss": -6.576584815979004, "global_step": 130869, "epoch": 3115} {"train_loss": -6.5345001220703125, "global_step": 130870, "epoch": 3115} {"train_loss": -6.608803476606097, "global_step": 130871, "epoch": 3115, "val_loss": 68030.6953125} {"train_loss": -6.5760087966918945, "global_step": 130872, "epoch": 3116} {"train_loss": -6.658683776855469, "global_step": 130873, "epoch": 3116} {"train_loss": -6.465928554534912, "global_step": 130874, "epoch": 3116} {"train_loss": -6.420936584472656, "global_step": 130875, "epoch": 3116} {"train_loss": -6.6269402503967285, "global_step": 130876, "epoch": 3116} {"train_loss": -6.335110664367676, "global_step": 130877, "epoch": 3116} {"train_loss": -6.593328475952148, "global_step": 130878, "epoch": 3116} {"train_loss": -6.520458698272705, "global_step": 130879, "epoch": 3116} {"train_loss": -6.558485984802246, "global_step": 130880, "epoch": 3116} {"train_loss": -6.4375481605529785, "global_step": 130881, "epoch": 3116} {"train_loss": -6.576909065246582, "global_step": 130882, "epoch": 3116} {"train_loss": -6.581443786621094, "global_step": 130883, "epoch": 3116} {"train_loss": -6.5477752685546875, "global_step": 130884, "epoch": 3116} {"train_loss": -6.607878684997559, "global_step": 130885, "epoch": 3116} {"train_loss": -6.366927146911621, "global_step": 130886, "epoch": 3116} {"train_loss": -6.502090930938721, "global_step": 130887, "epoch": 3116} {"train_loss": -6.425420761108398, "global_step": 130888, "epoch": 3116} {"train_loss": -6.495515823364258, "global_step": 130889, "epoch": 3116} {"train_loss": -6.412452697753906, "global_step": 130890, "epoch": 3116} {"train_loss": -6.516520023345947, "global_step": 130891, "epoch": 3116} {"train_loss": -6.483173370361328, "global_step": 130892, "epoch": 3116} {"train_loss": -6.576848030090332, "global_step": 130893, "epoch": 3116} {"train_loss": -6.468857765197754, "global_step": 130894, "epoch": 3116} {"train_loss": -6.440849781036377, "global_step": 130895, "epoch": 3116} {"train_loss": -6.488667964935303, "global_step": 130896, "epoch": 3116} {"train_loss": -6.476722717285156, "global_step": 130897, "epoch": 3116} {"train_loss": -6.505003452301025, "global_step": 130898, "epoch": 3116} {"train_loss": -6.458210468292236, "global_step": 130899, "epoch": 3116} {"train_loss": -6.496970176696777, "global_step": 130900, "epoch": 3116} {"train_loss": -6.481780052185059, "global_step": 130901, "epoch": 3116} {"train_loss": -6.560076713562012, "global_step": 130902, "epoch": 3116} {"train_loss": -6.619521617889404, "global_step": 130903, "epoch": 3116} {"train_loss": -6.674077987670898, "global_step": 130904, "epoch": 3116} {"train_loss": -6.580214977264404, "global_step": 130905, "epoch": 3116} {"train_loss": -6.6147871017456055, "global_step": 130906, "epoch": 3116} {"train_loss": -6.462784767150879, "global_step": 130907, "epoch": 3116} {"train_loss": -6.669440269470215, "global_step": 130908, "epoch": 3116} {"train_loss": -6.533754348754883, "global_step": 130909, "epoch": 3116} {"train_loss": -6.648775100708008, "global_step": 130910, "epoch": 3116} {"train_loss": -6.458866119384766, "global_step": 130911, "epoch": 3116} {"train_loss": -6.749443054199219, "global_step": 130912, "epoch": 3116} {"train_loss": -6.53190465200515, "global_step": 130913, "epoch": 3116, "val_loss": 68027.140625} {"train_loss": -6.6075005531311035, "global_step": 130914, "epoch": 3117} {"train_loss": -6.586038112640381, "global_step": 130915, "epoch": 3117} {"train_loss": -6.597664833068848, "global_step": 130916, "epoch": 3117} {"train_loss": -6.639850616455078, "global_step": 130917, "epoch": 3117} {"train_loss": -6.69127082824707, "global_step": 130918, "epoch": 3117} {"train_loss": -6.685606479644775, "global_step": 130919, "epoch": 3117} {"train_loss": -6.623745918273926, "global_step": 130920, "epoch": 3117} {"train_loss": -6.668275833129883, "global_step": 130921, "epoch": 3117} {"train_loss": -6.572264194488525, "global_step": 130922, "epoch": 3117} {"train_loss": -6.689233779907227, "global_step": 130923, "epoch": 3117} {"train_loss": -6.537363052368164, "global_step": 130924, "epoch": 3117} {"train_loss": -6.664567947387695, "global_step": 130925, "epoch": 3117} {"train_loss": -6.536711692810059, "global_step": 130926, "epoch": 3117} {"train_loss": -6.637766361236572, "global_step": 130927, "epoch": 3117} {"train_loss": -6.704602241516113, "global_step": 130928, "epoch": 3117} {"train_loss": -6.532644271850586, "global_step": 130929, "epoch": 3117} {"train_loss": -6.694796562194824, "global_step": 130930, "epoch": 3117} {"train_loss": -6.729035377502441, "global_step": 130931, "epoch": 3117} {"train_loss": -6.691408157348633, "global_step": 130932, "epoch": 3117} {"train_loss": -6.586426258087158, "global_step": 130933, "epoch": 3117} {"train_loss": -6.770654678344727, "global_step": 130934, "epoch": 3117} {"train_loss": -6.56450080871582, "global_step": 130935, "epoch": 3117} {"train_loss": -6.650763988494873, "global_step": 130936, "epoch": 3117} {"train_loss": -6.5697431564331055, "global_step": 130937, "epoch": 3117} {"train_loss": -6.636115074157715, "global_step": 130938, "epoch": 3117} {"train_loss": -6.675511360168457, "global_step": 130939, "epoch": 3117} {"train_loss": -6.681252479553223, "global_step": 130940, "epoch": 3117} {"train_loss": -6.765061378479004, "global_step": 130941, "epoch": 3117} {"train_loss": -6.664335250854492, "global_step": 130942, "epoch": 3117} {"train_loss": -6.69408655166626, "global_step": 130943, "epoch": 3117} {"train_loss": -6.723656177520752, "global_step": 130944, "epoch": 3117} {"train_loss": -6.7339606285095215, "global_step": 130945, "epoch": 3117} {"train_loss": -6.574239730834961, "global_step": 130946, "epoch": 3117} {"train_loss": -6.5755767822265625, "global_step": 130947, "epoch": 3117} {"train_loss": -6.66155481338501, "global_step": 130948, "epoch": 3117} {"train_loss": -6.697728157043457, "global_step": 130949, "epoch": 3117} {"train_loss": -6.762376308441162, "global_step": 130950, "epoch": 3117} {"train_loss": -6.662891387939453, "global_step": 130951, "epoch": 3117} {"train_loss": -6.771993637084961, "global_step": 130952, "epoch": 3117} {"train_loss": -6.458118438720703, "global_step": 130953, "epoch": 3117} {"train_loss": -6.715731620788574, "global_step": 130954, "epoch": 3117} {"train_loss": -6.649048646291097, "global_step": 130955, "epoch": 3117, "val_loss": 68212.46875} {"train_loss": -6.578192710876465, "global_step": 130956, "epoch": 3118} {"train_loss": -6.588600158691406, "global_step": 130957, "epoch": 3118} {"train_loss": -6.720373630523682, "global_step": 130958, "epoch": 3118} {"train_loss": -6.702149391174316, "global_step": 130959, "epoch": 3118} {"train_loss": -6.628383159637451, "global_step": 130960, "epoch": 3118} {"train_loss": -6.6016693115234375, "global_step": 130961, "epoch": 3118} {"train_loss": -6.6566162109375, "global_step": 130962, "epoch": 3118} {"train_loss": -6.647594451904297, "global_step": 130963, "epoch": 3118} {"train_loss": -6.747411727905273, "global_step": 130964, "epoch": 3118} {"train_loss": -6.719246864318848, "global_step": 130965, "epoch": 3118} {"train_loss": -6.612160682678223, "global_step": 130966, "epoch": 3118} {"train_loss": -6.7230424880981445, "global_step": 130967, "epoch": 3118} {"train_loss": -6.725768566131592, "global_step": 130968, "epoch": 3118} {"train_loss": -6.588826656341553, "global_step": 130969, "epoch": 3118} {"train_loss": -6.648498058319092, "global_step": 130970, "epoch": 3118} {"train_loss": -6.597899436950684, "global_step": 130971, "epoch": 3118} {"train_loss": -6.772995948791504, "global_step": 130972, "epoch": 3118} {"train_loss": -6.545200824737549, "global_step": 130973, "epoch": 3118} {"train_loss": -6.608165740966797, "global_step": 130974, "epoch": 3118} {"train_loss": -6.689591884613037, "global_step": 130975, "epoch": 3118} {"train_loss": -6.577147960662842, "global_step": 130976, "epoch": 3118} {"train_loss": -6.590161323547363, "global_step": 130977, "epoch": 3118} {"train_loss": -6.6334547996521, "global_step": 130978, "epoch": 3118} {"train_loss": -6.5560808181762695, "global_step": 130979, "epoch": 3118} {"train_loss": -6.634427070617676, "global_step": 130980, "epoch": 3118} {"train_loss": -6.702028274536133, "global_step": 130981, "epoch": 3118} {"train_loss": -6.567657470703125, "global_step": 130982, "epoch": 3118} {"train_loss": -6.663571357727051, "global_step": 130983, "epoch": 3118} {"train_loss": -6.6100754737854, "global_step": 130984, "epoch": 3118} {"train_loss": -6.662579536437988, "global_step": 130985, "epoch": 3118} {"train_loss": -6.702383041381836, "global_step": 130986, "epoch": 3118} {"train_loss": -6.687028884887695, "global_step": 130987, "epoch": 3118} {"train_loss": -6.718562126159668, "global_step": 130988, "epoch": 3118} {"train_loss": -6.679196834564209, "global_step": 130989, "epoch": 3118} {"train_loss": -6.710251331329346, "global_step": 130990, "epoch": 3118} {"train_loss": -6.569266319274902, "global_step": 130991, "epoch": 3118} {"train_loss": -6.775757789611816, "global_step": 130992, "epoch": 3118} {"train_loss": -6.630824565887451, "global_step": 130993, "epoch": 3118} {"train_loss": -6.522334098815918, "global_step": 130994, "epoch": 3118} {"train_loss": -6.649364471435547, "global_step": 130995, "epoch": 3118} {"train_loss": -6.5844526290893555, "global_step": 130996, "epoch": 3118} {"train_loss": -6.646562792005993, "global_step": 130997, "epoch": 3118, "val_loss": 68067.2421875} {"train_loss": -6.561509132385254, "global_step": 130998, "epoch": 3119} {"train_loss": -6.6381072998046875, "global_step": 130999, "epoch": 3119} {"train_loss": -6.682576656341553, "global_step": 131000, "epoch": 3119} {"train_loss": -6.54670524597168, "global_step": 131001, "epoch": 3119} {"train_loss": -6.522242069244385, "global_step": 131002, "epoch": 3119} {"train_loss": -6.686102867126465, "global_step": 131003, "epoch": 3119} {"train_loss": -6.662412166595459, "global_step": 131004, "epoch": 3119} {"train_loss": -6.534360885620117, "global_step": 131005, "epoch": 3119} {"train_loss": -6.72025203704834, "global_step": 131006, "epoch": 3119} {"train_loss": -6.599108695983887, "global_step": 131007, "epoch": 3119} {"train_loss": -6.457468032836914, "global_step": 131008, "epoch": 3119} {"train_loss": -6.670499801635742, "global_step": 131009, "epoch": 3119} {"train_loss": -6.615253448486328, "global_step": 131010, "epoch": 3119} {"train_loss": -6.626731872558594, "global_step": 131011, "epoch": 3119} {"train_loss": -6.6180877685546875, "global_step": 131012, "epoch": 3119} {"train_loss": -6.4608659744262695, "global_step": 131013, "epoch": 3119} {"train_loss": -6.736180305480957, "global_step": 131014, "epoch": 3119} {"train_loss": -6.537135124206543, "global_step": 131015, "epoch": 3119} {"train_loss": -6.396967887878418, "global_step": 131016, "epoch": 3119} {"train_loss": -6.622002124786377, "global_step": 131017, "epoch": 3119} {"train_loss": -6.531784534454346, "global_step": 131018, "epoch": 3119} {"train_loss": -6.5820841789245605, "global_step": 131019, "epoch": 3119} {"train_loss": -6.489326477050781, "global_step": 131020, "epoch": 3119} {"train_loss": -6.7064104080200195, "global_step": 131021, "epoch": 3119} {"train_loss": -6.452025413513184, "global_step": 131022, "epoch": 3119} {"train_loss": -6.623736381530762, "global_step": 131023, "epoch": 3119} {"train_loss": -6.582262992858887, "global_step": 131024, "epoch": 3119} {"train_loss": -6.587982654571533, "global_step": 131025, "epoch": 3119} {"train_loss": -6.4987969398498535, "global_step": 131026, "epoch": 3119} {"train_loss": -6.549350738525391, "global_step": 131027, "epoch": 3119} {"train_loss": -6.5875244140625, "global_step": 131028, "epoch": 3119} {"train_loss": -6.659271240234375, "global_step": 131029, "epoch": 3119} {"train_loss": -6.6145477294921875, "global_step": 131030, "epoch": 3119} {"train_loss": -6.600595951080322, "global_step": 131031, "epoch": 3119} {"train_loss": -6.690967559814453, "global_step": 131032, "epoch": 3119} {"train_loss": -6.601146697998047, "global_step": 131033, "epoch": 3119} {"train_loss": -6.546896934509277, "global_step": 131034, "epoch": 3119} {"train_loss": -6.597329139709473, "global_step": 131035, "epoch": 3119} {"train_loss": -6.575826644897461, "global_step": 131036, "epoch": 3119} {"train_loss": -6.720852851867676, "global_step": 131037, "epoch": 3119} {"train_loss": -6.582751274108887, "global_step": 131038, "epoch": 3119} {"train_loss": -6.591350623539516, "global_step": 131039, "epoch": 3119, "val_loss": 68068.8046875} {"train_loss": -6.641444206237793, "global_step": 131040, "epoch": 3120} {"train_loss": -6.540791034698486, "global_step": 131041, "epoch": 3120} {"train_loss": -6.639526844024658, "global_step": 131042, "epoch": 3120} {"train_loss": -6.726724147796631, "global_step": 131043, "epoch": 3120} {"train_loss": -6.7287092208862305, "global_step": 131044, "epoch": 3120} {"train_loss": -6.556793212890625, "global_step": 131045, "epoch": 3120} {"train_loss": -6.601014614105225, "global_step": 131046, "epoch": 3120} {"train_loss": -6.539849281311035, "global_step": 131047, "epoch": 3120} {"train_loss": -6.692332744598389, "global_step": 131048, "epoch": 3120} {"train_loss": -6.684802055358887, "global_step": 131049, "epoch": 3120} {"train_loss": -6.689874172210693, "global_step": 131050, "epoch": 3120} {"train_loss": -6.668729305267334, "global_step": 131051, "epoch": 3120} {"train_loss": -6.599393844604492, "global_step": 131052, "epoch": 3120} {"train_loss": -6.724931240081787, "global_step": 131053, "epoch": 3120} {"train_loss": -6.547281265258789, "global_step": 131054, "epoch": 3120} {"train_loss": -6.653799533843994, "global_step": 131055, "epoch": 3120} {"train_loss": -6.647897243499756, "global_step": 131056, "epoch": 3120} {"train_loss": -6.710908889770508, "global_step": 131057, "epoch": 3120} {"train_loss": -6.709293365478516, "global_step": 131058, "epoch": 3120} {"train_loss": -6.550653457641602, "global_step": 131059, "epoch": 3120} {"train_loss": -6.609626770019531, "global_step": 131060, "epoch": 3120} {"train_loss": -6.63970422744751, "global_step": 131061, "epoch": 3120} {"train_loss": -6.7093706130981445, "global_step": 131062, "epoch": 3120} {"train_loss": -6.589353561401367, "global_step": 131063, "epoch": 3120} {"train_loss": -6.657181739807129, "global_step": 131064, "epoch": 3120} {"train_loss": -6.769465923309326, "global_step": 131065, "epoch": 3120} {"train_loss": -6.658681869506836, "global_step": 131066, "epoch": 3120} {"train_loss": -6.701255798339844, "global_step": 131067, "epoch": 3120} {"train_loss": -6.65286922454834, "global_step": 131068, "epoch": 3120} {"train_loss": -6.687150478363037, "global_step": 131069, "epoch": 3120} {"train_loss": -6.567447662353516, "global_step": 131070, "epoch": 3120} {"train_loss": -6.543764114379883, "global_step": 131071, "epoch": 3120} {"train_loss": -6.718436241149902, "global_step": 131072, "epoch": 3120} {"train_loss": -6.607723236083984, "global_step": 131073, "epoch": 3120} {"train_loss": -6.491137504577637, "global_step": 131074, "epoch": 3120} {"train_loss": -6.556327819824219, "global_step": 131075, "epoch": 3120} {"train_loss": -6.702004432678223, "global_step": 131076, "epoch": 3120} {"train_loss": -6.421314239501953, "global_step": 131077, "epoch": 3120} {"train_loss": -6.633449077606201, "global_step": 131078, "epoch": 3120} {"train_loss": -6.513612270355225, "global_step": 131079, "epoch": 3120} {"train_loss": -6.631195545196533, "global_step": 131080, "epoch": 3120} {"train_loss": -6.633118300210862, "global_step": 131081, "epoch": 3120, "val_loss": 68041.2421875} {"train_loss": -6.554481506347656, "global_step": 131082, "epoch": 3121} {"train_loss": -6.449141502380371, "global_step": 131083, "epoch": 3121} {"train_loss": -6.679757595062256, "global_step": 131084, "epoch": 3121} {"train_loss": -6.650605201721191, "global_step": 131085, "epoch": 3121} {"train_loss": -6.519252777099609, "global_step": 131086, "epoch": 3121} {"train_loss": -6.653717994689941, "global_step": 131087, "epoch": 3121} {"train_loss": -6.638779640197754, "global_step": 131088, "epoch": 3121} {"train_loss": -6.6159467697143555, "global_step": 131089, "epoch": 3121} {"train_loss": -6.680582046508789, "global_step": 131090, "epoch": 3121} {"train_loss": -6.679625034332275, "global_step": 131091, "epoch": 3121} {"train_loss": -6.610435485839844, "global_step": 131092, "epoch": 3121} {"train_loss": -6.560718059539795, "global_step": 131093, "epoch": 3121} {"train_loss": -6.598691463470459, "global_step": 131094, "epoch": 3121} {"train_loss": -6.668205261230469, "global_step": 131095, "epoch": 3121} {"train_loss": -6.697381973266602, "global_step": 131096, "epoch": 3121} {"train_loss": -6.630516052246094, "global_step": 131097, "epoch": 3121} {"train_loss": -6.653622627258301, "global_step": 131098, "epoch": 3121} {"train_loss": -6.62884521484375, "global_step": 131099, "epoch": 3121} {"train_loss": -6.649256706237793, "global_step": 131100, "epoch": 3121} {"train_loss": -6.530180931091309, "global_step": 131101, "epoch": 3121} {"train_loss": -6.707215785980225, "global_step": 131102, "epoch": 3121} {"train_loss": -6.632058620452881, "global_step": 131103, "epoch": 3121} {"train_loss": -6.533614158630371, "global_step": 131104, "epoch": 3121} {"train_loss": -6.7181196212768555, "global_step": 131105, "epoch": 3121} {"train_loss": -6.621542453765869, "global_step": 131106, "epoch": 3121} {"train_loss": -6.707034111022949, "global_step": 131107, "epoch": 3121} {"train_loss": -6.664240837097168, "global_step": 131108, "epoch": 3121} {"train_loss": -6.583885192871094, "global_step": 131109, "epoch": 3121} {"train_loss": -6.658420085906982, "global_step": 131110, "epoch": 3121} {"train_loss": -6.691680908203125, "global_step": 131111, "epoch": 3121} {"train_loss": -6.6981048583984375, "global_step": 131112, "epoch": 3121} {"train_loss": -6.708889007568359, "global_step": 131113, "epoch": 3121} {"train_loss": -6.6732258796691895, "global_step": 131114, "epoch": 3121} {"train_loss": -6.716036319732666, "global_step": 131115, "epoch": 3121} {"train_loss": -6.677256107330322, "global_step": 131116, "epoch": 3121} {"train_loss": -6.622193336486816, "global_step": 131117, "epoch": 3121} {"train_loss": -6.591714859008789, "global_step": 131118, "epoch": 3121} {"train_loss": -6.58811092376709, "global_step": 131119, "epoch": 3121} {"train_loss": -6.605674743652344, "global_step": 131120, "epoch": 3121} {"train_loss": -6.680315017700195, "global_step": 131121, "epoch": 3121} {"train_loss": -6.627405166625977, "global_step": 131122, "epoch": 3121} {"train_loss": -6.63572553225926, "global_step": 131123, "epoch": 3121, "val_loss": 68168.6796875} {"train_loss": -6.6483659744262695, "global_step": 131124, "epoch": 3122} {"train_loss": -6.6926984786987305, "global_step": 131125, "epoch": 3122} {"train_loss": -6.733107566833496, "global_step": 131126, "epoch": 3122} {"train_loss": -6.510307312011719, "global_step": 131127, "epoch": 3122} {"train_loss": -6.671575546264648, "global_step": 131128, "epoch": 3122} {"train_loss": -6.561978340148926, "global_step": 131129, "epoch": 3122} {"train_loss": -6.62531852722168, "global_step": 131130, "epoch": 3122} {"train_loss": -6.680108070373535, "global_step": 131131, "epoch": 3122} {"train_loss": -6.690959930419922, "global_step": 131132, "epoch": 3122} {"train_loss": -6.651858329772949, "global_step": 131133, "epoch": 3122} {"train_loss": -6.693993091583252, "global_step": 131134, "epoch": 3122} {"train_loss": -6.701846122741699, "global_step": 131135, "epoch": 3122} {"train_loss": -6.512505054473877, "global_step": 131136, "epoch": 3122} {"train_loss": -6.593758583068848, "global_step": 131137, "epoch": 3122} {"train_loss": -6.562914848327637, "global_step": 131138, "epoch": 3122} {"train_loss": -6.695828437805176, "global_step": 131139, "epoch": 3122} {"train_loss": -6.7206130027771, "global_step": 131140, "epoch": 3122} {"train_loss": -6.680906772613525, "global_step": 131141, "epoch": 3122} {"train_loss": -6.588104724884033, "global_step": 131142, "epoch": 3122} {"train_loss": -6.720285415649414, "global_step": 131143, "epoch": 3122} {"train_loss": -6.623467445373535, "global_step": 131144, "epoch": 3122} {"train_loss": -6.637063503265381, "global_step": 131145, "epoch": 3122} {"train_loss": -6.620554447174072, "global_step": 131146, "epoch": 3122} {"train_loss": -6.6985578536987305, "global_step": 131147, "epoch": 3122} {"train_loss": -6.618386268615723, "global_step": 131148, "epoch": 3122} {"train_loss": -6.690521240234375, "global_step": 131149, "epoch": 3122} {"train_loss": -6.678303241729736, "global_step": 131150, "epoch": 3122} {"train_loss": -6.727024078369141, "global_step": 131151, "epoch": 3122} {"train_loss": -6.812372207641602, "global_step": 131152, "epoch": 3122} {"train_loss": -6.707094192504883, "global_step": 131153, "epoch": 3122} {"train_loss": -6.6959052085876465, "global_step": 131154, "epoch": 3122} {"train_loss": -6.645068168640137, "global_step": 131155, "epoch": 3122} {"train_loss": -6.747602462768555, "global_step": 131156, "epoch": 3122} {"train_loss": -6.662805557250977, "global_step": 131157, "epoch": 3122} {"train_loss": -6.705629348754883, "global_step": 131158, "epoch": 3122} {"train_loss": -6.655941009521484, "global_step": 131159, "epoch": 3122} {"train_loss": -6.543198108673096, "global_step": 131160, "epoch": 3122} {"train_loss": -6.660974502563477, "global_step": 131161, "epoch": 3122} {"train_loss": -6.615898132324219, "global_step": 131162, "epoch": 3122} {"train_loss": -6.697948455810547, "global_step": 131163, "epoch": 3122} {"train_loss": -6.670383453369141, "global_step": 131164, "epoch": 3122} {"train_loss": -6.657656533377511, "global_step": 131165, "epoch": 3122, "val_loss": 68126.171875} {"train_loss": -6.635071754455566, "global_step": 131166, "epoch": 3123} {"train_loss": -6.669187545776367, "global_step": 131167, "epoch": 3123} {"train_loss": -6.603777885437012, "global_step": 131168, "epoch": 3123} {"train_loss": -6.539159774780273, "global_step": 131169, "epoch": 3123} {"train_loss": -6.644139289855957, "global_step": 131170, "epoch": 3123} {"train_loss": -6.497663497924805, "global_step": 131171, "epoch": 3123} {"train_loss": -6.668558597564697, "global_step": 131172, "epoch": 3123} {"train_loss": -6.56818962097168, "global_step": 131173, "epoch": 3123} {"train_loss": -6.581593036651611, "global_step": 131174, "epoch": 3123} {"train_loss": -6.526915073394775, "global_step": 131175, "epoch": 3123} {"train_loss": -6.492948055267334, "global_step": 131176, "epoch": 3123} {"train_loss": -6.661484241485596, "global_step": 131177, "epoch": 3123} {"train_loss": -6.60905647277832, "global_step": 131178, "epoch": 3123} {"train_loss": -6.634212017059326, "global_step": 131179, "epoch": 3123} {"train_loss": -6.640987396240234, "global_step": 131180, "epoch": 3123} {"train_loss": -6.534970283508301, "global_step": 131181, "epoch": 3123} {"train_loss": -6.50408935546875, "global_step": 131182, "epoch": 3123} {"train_loss": -6.568881034851074, "global_step": 131183, "epoch": 3123} {"train_loss": -6.487156391143799, "global_step": 131184, "epoch": 3123} {"train_loss": -6.596237659454346, "global_step": 131185, "epoch": 3123} {"train_loss": -6.543971061706543, "global_step": 131186, "epoch": 3123} {"train_loss": -6.557485103607178, "global_step": 131187, "epoch": 3123} {"train_loss": -6.543453693389893, "global_step": 131188, "epoch": 3123} {"train_loss": -6.58491325378418, "global_step": 131189, "epoch": 3123} {"train_loss": -6.55271577835083, "global_step": 131190, "epoch": 3123} {"train_loss": -6.586243152618408, "global_step": 131191, "epoch": 3123} {"train_loss": -6.543587684631348, "global_step": 131192, "epoch": 3123} {"train_loss": -6.620673179626465, "global_step": 131193, "epoch": 3123} {"train_loss": -6.62359619140625, "global_step": 131194, "epoch": 3123} {"train_loss": -6.572139739990234, "global_step": 131195, "epoch": 3123} {"train_loss": -6.6561079025268555, "global_step": 131196, "epoch": 3123} {"train_loss": -6.678703308105469, "global_step": 131197, "epoch": 3123} {"train_loss": -6.721189498901367, "global_step": 131198, "epoch": 3123} {"train_loss": -6.635281085968018, "global_step": 131199, "epoch": 3123} {"train_loss": -6.516019821166992, "global_step": 131200, "epoch": 3123} {"train_loss": -6.7563018798828125, "global_step": 131201, "epoch": 3123} {"train_loss": -6.546901702880859, "global_step": 131202, "epoch": 3123} {"train_loss": -6.724940299987793, "global_step": 131203, "epoch": 3123} {"train_loss": -6.637618064880371, "global_step": 131204, "epoch": 3123} {"train_loss": -6.599809646606445, "global_step": 131205, "epoch": 3123} {"train_loss": -6.624656677246094, "global_step": 131206, "epoch": 3123} {"train_loss": -6.596538282576061, "global_step": 131207, "epoch": 3123, "val_loss": 68393.25} {"train_loss": -6.649750232696533, "global_step": 131208, "epoch": 3124} {"train_loss": -6.627092361450195, "global_step": 131209, "epoch": 3124} {"train_loss": -6.788299560546875, "global_step": 131210, "epoch": 3124} {"train_loss": -6.661938667297363, "global_step": 131211, "epoch": 3124} {"train_loss": -6.744332313537598, "global_step": 131212, "epoch": 3124} {"train_loss": -6.67246150970459, "global_step": 131213, "epoch": 3124} {"train_loss": -6.682547569274902, "global_step": 131214, "epoch": 3124} {"train_loss": -6.687594413757324, "global_step": 131215, "epoch": 3124} {"train_loss": -6.604524612426758, "global_step": 131216, "epoch": 3124} {"train_loss": -6.542102813720703, "global_step": 131217, "epoch": 3124} {"train_loss": -6.697962760925293, "global_step": 131218, "epoch": 3124} {"train_loss": -6.681310653686523, "global_step": 131219, "epoch": 3124} {"train_loss": -6.7013397216796875, "global_step": 131220, "epoch": 3124} {"train_loss": -6.549050807952881, "global_step": 131221, "epoch": 3124} {"train_loss": -6.602841377258301, "global_step": 131222, "epoch": 3124} {"train_loss": -6.666847229003906, "global_step": 131223, "epoch": 3124} {"train_loss": -6.615875244140625, "global_step": 131224, "epoch": 3124} {"train_loss": -6.697751522064209, "global_step": 131225, "epoch": 3124} {"train_loss": -6.514004230499268, "global_step": 131226, "epoch": 3124} {"train_loss": -6.652924537658691, "global_step": 131227, "epoch": 3124} {"train_loss": -6.586816787719727, "global_step": 131228, "epoch": 3124} {"train_loss": -6.628458023071289, "global_step": 131229, "epoch": 3124} {"train_loss": -6.607447624206543, "global_step": 131230, "epoch": 3124} {"train_loss": -6.662879467010498, "global_step": 131231, "epoch": 3124} {"train_loss": -6.748065948486328, "global_step": 131232, "epoch": 3124} {"train_loss": -6.593183517456055, "global_step": 131233, "epoch": 3124} {"train_loss": -6.675910949707031, "global_step": 131234, "epoch": 3124} {"train_loss": -6.778237342834473, "global_step": 131235, "epoch": 3124} {"train_loss": -6.624755382537842, "global_step": 131236, "epoch": 3124} {"train_loss": -6.7021965980529785, "global_step": 131237, "epoch": 3124} {"train_loss": -6.673515319824219, "global_step": 131238, "epoch": 3124} {"train_loss": -6.799110412597656, "global_step": 131239, "epoch": 3124} {"train_loss": -6.512131214141846, "global_step": 131240, "epoch": 3124} {"train_loss": -6.675273895263672, "global_step": 131241, "epoch": 3124} {"train_loss": -6.772607803344727, "global_step": 131242, "epoch": 3124} {"train_loss": -6.5868096351623535, "global_step": 131243, "epoch": 3124} {"train_loss": -6.660195350646973, "global_step": 131244, "epoch": 3124} {"train_loss": -6.6705427169799805, "global_step": 131245, "epoch": 3124} {"train_loss": -6.584591388702393, "global_step": 131246, "epoch": 3124} {"train_loss": -6.642741680145264, "global_step": 131247, "epoch": 3124} {"train_loss": -6.6843109130859375, "global_step": 131248, "epoch": 3124} {"train_loss": -6.654325541995821, "global_step": 131249, "epoch": 3124, "val_loss": 68287.5} {"train_loss": -6.672433376312256, "global_step": 131250, "epoch": 3125} {"train_loss": -6.565462112426758, "global_step": 131251, "epoch": 3125} {"train_loss": -6.470759391784668, "global_step": 131252, "epoch": 3125} {"train_loss": -6.613284111022949, "global_step": 131253, "epoch": 3125} {"train_loss": -6.574580192565918, "global_step": 131254, "epoch": 3125} {"train_loss": -6.450617790222168, "global_step": 131255, "epoch": 3125} {"train_loss": -6.6326494216918945, "global_step": 131256, "epoch": 3125} {"train_loss": -6.645698070526123, "global_step": 131257, "epoch": 3125} {"train_loss": -6.685429096221924, "global_step": 131258, "epoch": 3125} {"train_loss": -6.693470001220703, "global_step": 131259, "epoch": 3125} {"train_loss": -6.683346748352051, "global_step": 131260, "epoch": 3125} {"train_loss": -6.809211254119873, "global_step": 131261, "epoch": 3125} {"train_loss": -6.543788909912109, "global_step": 131262, "epoch": 3125} {"train_loss": -6.644865989685059, "global_step": 131263, "epoch": 3125} {"train_loss": -6.721512794494629, "global_step": 131264, "epoch": 3125} {"train_loss": -6.593104362487793, "global_step": 131265, "epoch": 3125} {"train_loss": -6.627452373504639, "global_step": 131266, "epoch": 3125} {"train_loss": -6.740090370178223, "global_step": 131267, "epoch": 3125} {"train_loss": -6.585293769836426, "global_step": 131268, "epoch": 3125} {"train_loss": -6.584379196166992, "global_step": 131269, "epoch": 3125} {"train_loss": -6.666677474975586, "global_step": 131270, "epoch": 3125} {"train_loss": -6.650899887084961, "global_step": 131271, "epoch": 3125} {"train_loss": -6.497628211975098, "global_step": 131272, "epoch": 3125} {"train_loss": -6.653367042541504, "global_step": 131273, "epoch": 3125} {"train_loss": -6.566525459289551, "global_step": 131274, "epoch": 3125} {"train_loss": -6.64569091796875, "global_step": 131275, "epoch": 3125} {"train_loss": -6.759747505187988, "global_step": 131276, "epoch": 3125} {"train_loss": -6.68202018737793, "global_step": 131277, "epoch": 3125} {"train_loss": -6.545215606689453, "global_step": 131278, "epoch": 3125} {"train_loss": -6.645708084106445, "global_step": 131279, "epoch": 3125} {"train_loss": -6.657292366027832, "global_step": 131280, "epoch": 3125} {"train_loss": -6.732117652893066, "global_step": 131281, "epoch": 3125} {"train_loss": -6.71686315536499, "global_step": 131282, "epoch": 3125} {"train_loss": -6.662700653076172, "global_step": 131283, "epoch": 3125} {"train_loss": -6.690201759338379, "global_step": 131284, "epoch": 3125} {"train_loss": -6.643526077270508, "global_step": 131285, "epoch": 3125} {"train_loss": -6.639732360839844, "global_step": 131286, "epoch": 3125} {"train_loss": -6.718212604522705, "global_step": 131287, "epoch": 3125} {"train_loss": -6.733372211456299, "global_step": 131288, "epoch": 3125} {"train_loss": -6.619900703430176, "global_step": 131289, "epoch": 3125} {"train_loss": -6.572224140167236, "global_step": 131290, "epoch": 3125} {"train_loss": -6.639539253144037, "global_step": 131291, "epoch": 3125, "val_loss": 68028.5625} {"train_loss": -6.728049278259277, "global_step": 131292, "epoch": 3126} {"train_loss": -6.684641361236572, "global_step": 131293, "epoch": 3126} {"train_loss": -6.649755477905273, "global_step": 131294, "epoch": 3126} {"train_loss": -6.577526092529297, "global_step": 131295, "epoch": 3126} {"train_loss": -6.641371726989746, "global_step": 131296, "epoch": 3126} {"train_loss": -6.684474468231201, "global_step": 131297, "epoch": 3126} {"train_loss": -6.585870742797852, "global_step": 131298, "epoch": 3126} {"train_loss": -6.682528972625732, "global_step": 131299, "epoch": 3126} {"train_loss": -6.722480773925781, "global_step": 131300, "epoch": 3126} {"train_loss": -6.682905197143555, "global_step": 131301, "epoch": 3126} {"train_loss": -6.671170711517334, "global_step": 131302, "epoch": 3126} {"train_loss": -6.606305122375488, "global_step": 131303, "epoch": 3126} {"train_loss": -6.60606575012207, "global_step": 131304, "epoch": 3126} {"train_loss": -6.546677589416504, "global_step": 131305, "epoch": 3126} {"train_loss": -6.611782073974609, "global_step": 131306, "epoch": 3126} {"train_loss": -6.589514255523682, "global_step": 131307, "epoch": 3126} {"train_loss": -6.616006851196289, "global_step": 131308, "epoch": 3126} {"train_loss": -6.529839515686035, "global_step": 131309, "epoch": 3126} {"train_loss": -6.676634311676025, "global_step": 131310, "epoch": 3126} {"train_loss": -6.494960784912109, "global_step": 131311, "epoch": 3126} {"train_loss": -6.69130802154541, "global_step": 131312, "epoch": 3126} {"train_loss": -6.46953010559082, "global_step": 131313, "epoch": 3126} {"train_loss": -6.57671594619751, "global_step": 131314, "epoch": 3126} {"train_loss": -6.603909492492676, "global_step": 131315, "epoch": 3126} {"train_loss": -6.74417781829834, "global_step": 131316, "epoch": 3126} {"train_loss": -6.673080921173096, "global_step": 131317, "epoch": 3126} {"train_loss": -6.502829074859619, "global_step": 131318, "epoch": 3126} {"train_loss": -6.705765247344971, "global_step": 131319, "epoch": 3126} {"train_loss": -6.656875133514404, "global_step": 131320, "epoch": 3126} {"train_loss": -6.597776889801025, "global_step": 131321, "epoch": 3126} {"train_loss": -6.621527671813965, "global_step": 131322, "epoch": 3126} {"train_loss": -6.5886359214782715, "global_step": 131323, "epoch": 3126} {"train_loss": -6.582850456237793, "global_step": 131324, "epoch": 3126} {"train_loss": -6.654863357543945, "global_step": 131325, "epoch": 3126} {"train_loss": -6.545716762542725, "global_step": 131326, "epoch": 3126} {"train_loss": -6.5706467628479, "global_step": 131327, "epoch": 3126} {"train_loss": -6.686927795410156, "global_step": 131328, "epoch": 3126} {"train_loss": -6.67188835144043, "global_step": 131329, "epoch": 3126} {"train_loss": -6.728133201599121, "global_step": 131330, "epoch": 3126} {"train_loss": -6.681632995605469, "global_step": 131331, "epoch": 3126} {"train_loss": -6.72414493560791, "global_step": 131332, "epoch": 3126} {"train_loss": -6.630382878439767, "global_step": 131333, "epoch": 3126, "val_loss": 68110.0078125} {"train_loss": -6.7425737380981445, "global_step": 131334, "epoch": 3127} {"train_loss": -6.652091979980469, "global_step": 131335, "epoch": 3127} {"train_loss": -6.695634841918945, "global_step": 131336, "epoch": 3127} {"train_loss": -6.656337738037109, "global_step": 131337, "epoch": 3127} {"train_loss": -6.636776924133301, "global_step": 131338, "epoch": 3127} {"train_loss": -6.682164669036865, "global_step": 131339, "epoch": 3127} {"train_loss": -6.614866733551025, "global_step": 131340, "epoch": 3127} {"train_loss": -6.60954475402832, "global_step": 131341, "epoch": 3127} {"train_loss": -6.605023384094238, "global_step": 131342, "epoch": 3127} {"train_loss": -6.795072555541992, "global_step": 131343, "epoch": 3127} {"train_loss": -6.699422836303711, "global_step": 131344, "epoch": 3127} {"train_loss": -6.716195106506348, "global_step": 131345, "epoch": 3127} {"train_loss": -6.70130729675293, "global_step": 131346, "epoch": 3127} {"train_loss": -6.6307878494262695, "global_step": 131347, "epoch": 3127} {"train_loss": -6.747738838195801, "global_step": 131348, "epoch": 3127} {"train_loss": -6.707221031188965, "global_step": 131349, "epoch": 3127} {"train_loss": -6.667289733886719, "global_step": 131350, "epoch": 3127} {"train_loss": -6.644296646118164, "global_step": 131351, "epoch": 3127} {"train_loss": -6.64341402053833, "global_step": 131352, "epoch": 3127} {"train_loss": -6.655515670776367, "global_step": 131353, "epoch": 3127} {"train_loss": -6.493500709533691, "global_step": 131354, "epoch": 3127} {"train_loss": -6.658512115478516, "global_step": 131355, "epoch": 3127} {"train_loss": -6.704180717468262, "global_step": 131356, "epoch": 3127} {"train_loss": -6.629900932312012, "global_step": 131357, "epoch": 3127} {"train_loss": -6.558218002319336, "global_step": 131358, "epoch": 3127} {"train_loss": -6.660926818847656, "global_step": 131359, "epoch": 3127} {"train_loss": -6.621950149536133, "global_step": 131360, "epoch": 3127} {"train_loss": -6.559941291809082, "global_step": 131361, "epoch": 3127} {"train_loss": -6.602648735046387, "global_step": 131362, "epoch": 3127} {"train_loss": -6.61921501159668, "global_step": 131363, "epoch": 3127} {"train_loss": -6.57838249206543, "global_step": 131364, "epoch": 3127} {"train_loss": -6.6437225341796875, "global_step": 131365, "epoch": 3127} {"train_loss": -6.671444892883301, "global_step": 131366, "epoch": 3127} {"train_loss": -6.642719268798828, "global_step": 131367, "epoch": 3127} {"train_loss": -6.687888145446777, "global_step": 131368, "epoch": 3127} {"train_loss": -6.631530284881592, "global_step": 131369, "epoch": 3127} {"train_loss": -6.631033897399902, "global_step": 131370, "epoch": 3127} {"train_loss": -6.634899139404297, "global_step": 131371, "epoch": 3127} {"train_loss": -6.48278284072876, "global_step": 131372, "epoch": 3127} {"train_loss": -6.613714694976807, "global_step": 131373, "epoch": 3127} {"train_loss": -6.594750881195068, "global_step": 131374, "epoch": 3127} {"train_loss": -6.644450380688622, "global_step": 131375, "epoch": 3127, "val_loss": 68217.7734375} {"train_loss": -6.651391983032227, "global_step": 131376, "epoch": 3128} {"train_loss": -6.558279037475586, "global_step": 131377, "epoch": 3128} {"train_loss": -6.52876091003418, "global_step": 131378, "epoch": 3128} {"train_loss": -6.60825252532959, "global_step": 131379, "epoch": 3128} {"train_loss": -6.617075443267822, "global_step": 131380, "epoch": 3128} {"train_loss": -6.721209526062012, "global_step": 131381, "epoch": 3128} {"train_loss": -6.7329230308532715, "global_step": 131382, "epoch": 3128} {"train_loss": -6.625253200531006, "global_step": 131383, "epoch": 3128} {"train_loss": -6.6634063720703125, "global_step": 131384, "epoch": 3128} {"train_loss": -6.606306552886963, "global_step": 131385, "epoch": 3128} {"train_loss": -6.717618942260742, "global_step": 131386, "epoch": 3128} {"train_loss": -6.618589401245117, "global_step": 131387, "epoch": 3128} {"train_loss": -6.725305557250977, "global_step": 131388, "epoch": 3128} {"train_loss": -6.672050952911377, "global_step": 131389, "epoch": 3128} {"train_loss": -6.694153785705566, "global_step": 131390, "epoch": 3128} {"train_loss": -6.759062767028809, "global_step": 131391, "epoch": 3128} {"train_loss": -6.7042107582092285, "global_step": 131392, "epoch": 3128} {"train_loss": -6.701876163482666, "global_step": 131393, "epoch": 3128} {"train_loss": -6.632076740264893, "global_step": 131394, "epoch": 3128} {"train_loss": -6.696502208709717, "global_step": 131395, "epoch": 3128} {"train_loss": -6.627302169799805, "global_step": 131396, "epoch": 3128} {"train_loss": -6.723090648651123, "global_step": 131397, "epoch": 3128} {"train_loss": -6.740722179412842, "global_step": 131398, "epoch": 3128} {"train_loss": -6.545832633972168, "global_step": 131399, "epoch": 3128} {"train_loss": -6.598893165588379, "global_step": 131400, "epoch": 3128} {"train_loss": -6.66684627532959, "global_step": 131401, "epoch": 3128} {"train_loss": -6.598427772521973, "global_step": 131402, "epoch": 3128} {"train_loss": -6.530221462249756, "global_step": 131403, "epoch": 3128} {"train_loss": -6.596982479095459, "global_step": 131404, "epoch": 3128} {"train_loss": -6.6846089363098145, "global_step": 131405, "epoch": 3128} {"train_loss": -6.571582794189453, "global_step": 131406, "epoch": 3128} {"train_loss": -6.764008045196533, "global_step": 131407, "epoch": 3128} {"train_loss": -6.6659746170043945, "global_step": 131408, "epoch": 3128} {"train_loss": -6.69251012802124, "global_step": 131409, "epoch": 3128} {"train_loss": -6.536179065704346, "global_step": 131410, "epoch": 3128} {"train_loss": -6.642642974853516, "global_step": 131411, "epoch": 3128} {"train_loss": -6.67214298248291, "global_step": 131412, "epoch": 3128} {"train_loss": -6.79253625869751, "global_step": 131413, "epoch": 3128} {"train_loss": -6.7089762687683105, "global_step": 131414, "epoch": 3128} {"train_loss": -6.736557960510254, "global_step": 131415, "epoch": 3128} {"train_loss": -6.758116245269775, "global_step": 131416, "epoch": 3128} {"train_loss": -6.662011714208694, "global_step": 131417, "epoch": 3128, "val_loss": 68153.296875} {"train_loss": -6.623032569885254, "global_step": 131418, "epoch": 3129} {"train_loss": -6.628307342529297, "global_step": 131419, "epoch": 3129} {"train_loss": -6.687854766845703, "global_step": 131420, "epoch": 3129} {"train_loss": -6.710616111755371, "global_step": 131421, "epoch": 3129} {"train_loss": -6.677534580230713, "global_step": 131422, "epoch": 3129} {"train_loss": -6.664680480957031, "global_step": 131423, "epoch": 3129} {"train_loss": -6.751172065734863, "global_step": 131424, "epoch": 3129} {"train_loss": -6.680018424987793, "global_step": 131425, "epoch": 3129} {"train_loss": -6.655193328857422, "global_step": 131426, "epoch": 3129} {"train_loss": -6.635710716247559, "global_step": 131427, "epoch": 3129} {"train_loss": -6.808909893035889, "global_step": 131428, "epoch": 3129} {"train_loss": -6.628053665161133, "global_step": 131429, "epoch": 3129} {"train_loss": -6.638373374938965, "global_step": 131430, "epoch": 3129} {"train_loss": -6.609667778015137, "global_step": 131431, "epoch": 3129} {"train_loss": -6.711517333984375, "global_step": 131432, "epoch": 3129} {"train_loss": -6.567427158355713, "global_step": 131433, "epoch": 3129} {"train_loss": -6.616971015930176, "global_step": 131434, "epoch": 3129} {"train_loss": -6.544036865234375, "global_step": 131435, "epoch": 3129} {"train_loss": -6.6465253829956055, "global_step": 131436, "epoch": 3129} {"train_loss": -6.659095764160156, "global_step": 131437, "epoch": 3129} {"train_loss": -6.641641139984131, "global_step": 131438, "epoch": 3129} {"train_loss": -6.652498245239258, "global_step": 131439, "epoch": 3129} {"train_loss": -6.659626483917236, "global_step": 131440, "epoch": 3129} {"train_loss": -6.7046098709106445, "global_step": 131441, "epoch": 3129} {"train_loss": -6.557569980621338, "global_step": 131442, "epoch": 3129} {"train_loss": -6.595485210418701, "global_step": 131443, "epoch": 3129} {"train_loss": -6.591208457946777, "global_step": 131444, "epoch": 3129} {"train_loss": -6.752237796783447, "global_step": 131445, "epoch": 3129} {"train_loss": -6.68414306640625, "global_step": 131446, "epoch": 3129} {"train_loss": -6.647865295410156, "global_step": 131447, "epoch": 3129} {"train_loss": -6.490992546081543, "global_step": 131448, "epoch": 3129} {"train_loss": -6.7324538230896, "global_step": 131449, "epoch": 3129} {"train_loss": -6.572437286376953, "global_step": 131450, "epoch": 3129} {"train_loss": -6.5276689529418945, "global_step": 131451, "epoch": 3129} {"train_loss": -6.57960844039917, "global_step": 131452, "epoch": 3129} {"train_loss": -6.459853172302246, "global_step": 131453, "epoch": 3129} {"train_loss": -6.524336814880371, "global_step": 131454, "epoch": 3129} {"train_loss": -6.396697044372559, "global_step": 131455, "epoch": 3129} {"train_loss": -6.576684951782227, "global_step": 131456, "epoch": 3129} {"train_loss": -6.639389991760254, "global_step": 131457, "epoch": 3129} {"train_loss": -6.406599044799805, "global_step": 131458, "epoch": 3129} {"train_loss": -6.624513342266991, "global_step": 131459, "epoch": 3129, "val_loss": 68529.7890625} {"train_loss": -6.60194206237793, "global_step": 131460, "epoch": 3130} {"train_loss": -6.594230651855469, "global_step": 131461, "epoch": 3130} {"train_loss": -6.639196395874023, "global_step": 131462, "epoch": 3130} {"train_loss": -6.651797294616699, "global_step": 131463, "epoch": 3130} {"train_loss": -6.647253036499023, "global_step": 131464, "epoch": 3130} {"train_loss": -6.485131740570068, "global_step": 131465, "epoch": 3130} {"train_loss": -6.5896077156066895, "global_step": 131466, "epoch": 3130} {"train_loss": -6.472550392150879, "global_step": 131467, "epoch": 3130} {"train_loss": -6.647914886474609, "global_step": 131468, "epoch": 3130} {"train_loss": -6.632944107055664, "global_step": 131469, "epoch": 3130} {"train_loss": -6.590762615203857, "global_step": 131470, "epoch": 3130} {"train_loss": -6.5226969718933105, "global_step": 131471, "epoch": 3130} {"train_loss": -6.394091606140137, "global_step": 131472, "epoch": 3130} {"train_loss": -6.642058372497559, "global_step": 131473, "epoch": 3130} {"train_loss": -6.508579254150391, "global_step": 131474, "epoch": 3130} {"train_loss": -6.6405792236328125, "global_step": 131475, "epoch": 3130} {"train_loss": -6.641411781311035, "global_step": 131476, "epoch": 3130} {"train_loss": -6.670072555541992, "global_step": 131477, "epoch": 3130} {"train_loss": -6.5356597900390625, "global_step": 131478, "epoch": 3130} {"train_loss": -6.541469097137451, "global_step": 131479, "epoch": 3130} {"train_loss": -6.4934983253479, "global_step": 131480, "epoch": 3130} {"train_loss": -6.567416191101074, "global_step": 131481, "epoch": 3130} {"train_loss": -6.575313568115234, "global_step": 131482, "epoch": 3130} {"train_loss": -6.483241558074951, "global_step": 131483, "epoch": 3130} {"train_loss": -6.662671089172363, "global_step": 131484, "epoch": 3130} {"train_loss": -6.609246253967285, "global_step": 131485, "epoch": 3130} {"train_loss": -6.714058876037598, "global_step": 131486, "epoch": 3130} {"train_loss": -6.59800910949707, "global_step": 131487, "epoch": 3130} {"train_loss": -6.67410945892334, "global_step": 131488, "epoch": 3130} {"train_loss": -6.687335968017578, "global_step": 131489, "epoch": 3130} {"train_loss": -6.727142333984375, "global_step": 131490, "epoch": 3130} {"train_loss": -6.572211265563965, "global_step": 131491, "epoch": 3130} {"train_loss": -6.624401092529297, "global_step": 131492, "epoch": 3130} {"train_loss": -6.7387518882751465, "global_step": 131493, "epoch": 3130} {"train_loss": -6.78128719329834, "global_step": 131494, "epoch": 3130} {"train_loss": -6.717606067657471, "global_step": 131495, "epoch": 3130} {"train_loss": -6.563375473022461, "global_step": 131496, "epoch": 3130} {"train_loss": -6.695971488952637, "global_step": 131497, "epoch": 3130} {"train_loss": -6.527495384216309, "global_step": 131498, "epoch": 3130} {"train_loss": -6.7030720710754395, "global_step": 131499, "epoch": 3130} {"train_loss": -6.744818687438965, "global_step": 131500, "epoch": 3130} {"train_loss": -6.6104528449830555, "global_step": 131501, "epoch": 3130, "val_loss": 68071.9921875} {"train_loss": -6.666015148162842, "global_step": 131502, "epoch": 3131} {"train_loss": -6.599226951599121, "global_step": 131503, "epoch": 3131} {"train_loss": -6.620721340179443, "global_step": 131504, "epoch": 3131} {"train_loss": -6.541738033294678, "global_step": 131505, "epoch": 3131} {"train_loss": -6.641166687011719, "global_step": 131506, "epoch": 3131} {"train_loss": -6.5902838706970215, "global_step": 131507, "epoch": 3131} {"train_loss": -6.530535697937012, "global_step": 131508, "epoch": 3131} {"train_loss": -6.6716508865356445, "global_step": 131509, "epoch": 3131} {"train_loss": -6.562396049499512, "global_step": 131510, "epoch": 3131} {"train_loss": -6.585188865661621, "global_step": 131511, "epoch": 3131} {"train_loss": -6.626913070678711, "global_step": 131512, "epoch": 3131} {"train_loss": -6.5614423751831055, "global_step": 131513, "epoch": 3131} {"train_loss": -6.528409481048584, "global_step": 131514, "epoch": 3131} {"train_loss": -6.594160079956055, "global_step": 131515, "epoch": 3131} {"train_loss": -6.690235137939453, "global_step": 131516, "epoch": 3131} {"train_loss": -6.595180511474609, "global_step": 131517, "epoch": 3131} {"train_loss": -6.6720428466796875, "global_step": 131518, "epoch": 3131} {"train_loss": -6.7274370193481445, "global_step": 131519, "epoch": 3131} {"train_loss": -6.73785924911499, "global_step": 131520, "epoch": 3131} {"train_loss": -6.609105110168457, "global_step": 131521, "epoch": 3131} {"train_loss": -6.651172161102295, "global_step": 131522, "epoch": 3131} {"train_loss": -6.70272159576416, "global_step": 131523, "epoch": 3131} {"train_loss": -6.453508377075195, "global_step": 131524, "epoch": 3131} {"train_loss": -6.588543891906738, "global_step": 131525, "epoch": 3131} {"train_loss": -6.639966011047363, "global_step": 131526, "epoch": 3131} {"train_loss": -6.535700798034668, "global_step": 131527, "epoch": 3131} {"train_loss": -6.595980167388916, "global_step": 131528, "epoch": 3131} {"train_loss": -6.672354698181152, "global_step": 131529, "epoch": 3131} {"train_loss": -6.5088701248168945, "global_step": 131530, "epoch": 3131} {"train_loss": -6.544814109802246, "global_step": 131531, "epoch": 3131} {"train_loss": -6.605276584625244, "global_step": 131532, "epoch": 3131} {"train_loss": -6.4663777351379395, "global_step": 131533, "epoch": 3131} {"train_loss": -6.6370062828063965, "global_step": 131534, "epoch": 3131} {"train_loss": -6.516120910644531, "global_step": 131535, "epoch": 3131} {"train_loss": -6.513210773468018, "global_step": 131536, "epoch": 3131} {"train_loss": -6.470768451690674, "global_step": 131537, "epoch": 3131} {"train_loss": -6.517049312591553, "global_step": 131538, "epoch": 3131} {"train_loss": -6.588008880615234, "global_step": 131539, "epoch": 3131} {"train_loss": -6.560717582702637, "global_step": 131540, "epoch": 3131} {"train_loss": -6.369915008544922, "global_step": 131541, "epoch": 3131} {"train_loss": -6.649531364440918, "global_step": 131542, "epoch": 3131} {"train_loss": -6.58465854326884, "global_step": 131543, "epoch": 3131, "val_loss": 68530.2578125} {"train_loss": -6.454797267913818, "global_step": 131544, "epoch": 3132} {"train_loss": -6.547622203826904, "global_step": 131545, "epoch": 3132} {"train_loss": -6.563232421875, "global_step": 131546, "epoch": 3132} {"train_loss": -6.438392639160156, "global_step": 131547, "epoch": 3132} {"train_loss": -6.602497100830078, "global_step": 131548, "epoch": 3132} {"train_loss": -6.6223649978637695, "global_step": 131549, "epoch": 3132} {"train_loss": -6.527405261993408, "global_step": 131550, "epoch": 3132} {"train_loss": -6.6156134605407715, "global_step": 131551, "epoch": 3132} {"train_loss": -6.720730304718018, "global_step": 131552, "epoch": 3132} {"train_loss": -6.580868721008301, "global_step": 131553, "epoch": 3132} {"train_loss": -6.610354423522949, "global_step": 131554, "epoch": 3132} {"train_loss": -6.555665969848633, "global_step": 131555, "epoch": 3132} {"train_loss": -6.540230751037598, "global_step": 131556, "epoch": 3132} {"train_loss": -6.597078323364258, "global_step": 131557, "epoch": 3132} {"train_loss": -6.545389175415039, "global_step": 131558, "epoch": 3132} {"train_loss": -6.615067005157471, "global_step": 131559, "epoch": 3132} {"train_loss": -6.577442169189453, "global_step": 131560, "epoch": 3132} {"train_loss": -6.605467796325684, "global_step": 131561, "epoch": 3132} {"train_loss": -6.718064308166504, "global_step": 131562, "epoch": 3132} {"train_loss": -6.559989929199219, "global_step": 131563, "epoch": 3132} {"train_loss": -6.532558917999268, "global_step": 131564, "epoch": 3132} {"train_loss": -6.577546119689941, "global_step": 131565, "epoch": 3132} {"train_loss": -6.621384143829346, "global_step": 131566, "epoch": 3132} {"train_loss": -6.53704833984375, "global_step": 131567, "epoch": 3132} {"train_loss": -6.599257946014404, "global_step": 131568, "epoch": 3132} {"train_loss": -6.712530136108398, "global_step": 131569, "epoch": 3132} {"train_loss": -6.548955917358398, "global_step": 131570, "epoch": 3132} {"train_loss": -6.605996131896973, "global_step": 131571, "epoch": 3132} {"train_loss": -6.674994468688965, "global_step": 131572, "epoch": 3132} {"train_loss": -6.671989440917969, "global_step": 131573, "epoch": 3132} {"train_loss": -6.630537033081055, "global_step": 131574, "epoch": 3132} {"train_loss": -6.6495041847229, "global_step": 131575, "epoch": 3132} {"train_loss": -6.714468002319336, "global_step": 131576, "epoch": 3132} {"train_loss": -6.582525253295898, "global_step": 131577, "epoch": 3132} {"train_loss": -6.690126895904541, "global_step": 131578, "epoch": 3132} {"train_loss": -6.633296489715576, "global_step": 131579, "epoch": 3132} {"train_loss": -6.551295280456543, "global_step": 131580, "epoch": 3132} {"train_loss": -6.555624008178711, "global_step": 131581, "epoch": 3132} {"train_loss": -6.696244716644287, "global_step": 131582, "epoch": 3132} {"train_loss": -6.667182922363281, "global_step": 131583, "epoch": 3132} {"train_loss": -6.711345672607422, "global_step": 131584, "epoch": 3132} {"train_loss": -6.602704911004929, "global_step": 131585, "epoch": 3132, "val_loss": 68168.1015625} {"train_loss": -6.636535167694092, "global_step": 131586, "epoch": 3133} {"train_loss": -6.621344566345215, "global_step": 131587, "epoch": 3133} {"train_loss": -6.625741004943848, "global_step": 131588, "epoch": 3133} {"train_loss": -6.715054988861084, "global_step": 131589, "epoch": 3133} {"train_loss": -6.577767372131348, "global_step": 131590, "epoch": 3133} {"train_loss": -6.644675254821777, "global_step": 131591, "epoch": 3133} {"train_loss": -6.668505668640137, "global_step": 131592, "epoch": 3133} {"train_loss": -6.58913516998291, "global_step": 131593, "epoch": 3133} {"train_loss": -6.577040672302246, "global_step": 131594, "epoch": 3133} {"train_loss": -6.690131187438965, "global_step": 131595, "epoch": 3133} {"train_loss": -6.7143449783325195, "global_step": 131596, "epoch": 3133} {"train_loss": -6.685199737548828, "global_step": 131597, "epoch": 3133} {"train_loss": -6.6486663818359375, "global_step": 131598, "epoch": 3133} {"train_loss": -6.709832191467285, "global_step": 131599, "epoch": 3133} {"train_loss": -6.49444580078125, "global_step": 131600, "epoch": 3133} {"train_loss": -6.574521064758301, "global_step": 131601, "epoch": 3133} {"train_loss": -6.574037075042725, "global_step": 131602, "epoch": 3133} {"train_loss": -6.622218132019043, "global_step": 131603, "epoch": 3133} {"train_loss": -6.6834716796875, "global_step": 131604, "epoch": 3133} {"train_loss": -6.4830827713012695, "global_step": 131605, "epoch": 3133} {"train_loss": -6.622235298156738, "global_step": 131606, "epoch": 3133} {"train_loss": -6.650060653686523, "global_step": 131607, "epoch": 3133} {"train_loss": -6.64312744140625, "global_step": 131608, "epoch": 3133} {"train_loss": -6.707728862762451, "global_step": 131609, "epoch": 3133} {"train_loss": -6.6397385597229, "global_step": 131610, "epoch": 3133} {"train_loss": -6.567330360412598, "global_step": 131611, "epoch": 3133} {"train_loss": -6.6243462562561035, "global_step": 131612, "epoch": 3133} {"train_loss": -6.675972938537598, "global_step": 131613, "epoch": 3133} {"train_loss": -6.74577522277832, "global_step": 131614, "epoch": 3133} {"train_loss": -6.746960163116455, "global_step": 131615, "epoch": 3133} {"train_loss": -6.62208890914917, "global_step": 131616, "epoch": 3133} {"train_loss": -6.641899585723877, "global_step": 131617, "epoch": 3133} {"train_loss": -6.69365119934082, "global_step": 131618, "epoch": 3133} {"train_loss": -6.6880598068237305, "global_step": 131619, "epoch": 3133} {"train_loss": -6.672368049621582, "global_step": 131620, "epoch": 3133} {"train_loss": -6.838309288024902, "global_step": 131621, "epoch": 3133} {"train_loss": -6.728992462158203, "global_step": 131622, "epoch": 3133} {"train_loss": -6.687224388122559, "global_step": 131623, "epoch": 3133} {"train_loss": -6.740633487701416, "global_step": 131624, "epoch": 3133} {"train_loss": -6.702847480773926, "global_step": 131625, "epoch": 3133} {"train_loss": -6.855496883392334, "global_step": 131626, "epoch": 3133} {"train_loss": -6.660299017315819, "global_step": 131627, "epoch": 3133, "val_loss": 68071.3671875} {"train_loss": -6.752135276794434, "global_step": 131628, "epoch": 3134} {"train_loss": -6.630983352661133, "global_step": 131629, "epoch": 3134} {"train_loss": -6.637119293212891, "global_step": 131630, "epoch": 3134} {"train_loss": -6.722083568572998, "global_step": 131631, "epoch": 3134} {"train_loss": -6.700366973876953, "global_step": 131632, "epoch": 3134} {"train_loss": -6.760074138641357, "global_step": 131633, "epoch": 3134} {"train_loss": -6.553906440734863, "global_step": 131634, "epoch": 3134} {"train_loss": -6.629058837890625, "global_step": 131635, "epoch": 3134} {"train_loss": -6.646146297454834, "global_step": 131636, "epoch": 3134} {"train_loss": -6.658928871154785, "global_step": 131637, "epoch": 3134} {"train_loss": -6.745284080505371, "global_step": 131638, "epoch": 3134} {"train_loss": -6.674704551696777, "global_step": 131639, "epoch": 3134} {"train_loss": -6.583743095397949, "global_step": 131640, "epoch": 3134} {"train_loss": -6.640543460845947, "global_step": 131641, "epoch": 3134} {"train_loss": -6.560153007507324, "global_step": 131642, "epoch": 3134} {"train_loss": -6.648988723754883, "global_step": 131643, "epoch": 3134} {"train_loss": -6.710960865020752, "global_step": 131644, "epoch": 3134} {"train_loss": -6.564342498779297, "global_step": 131645, "epoch": 3134} {"train_loss": -6.62392520904541, "global_step": 131646, "epoch": 3134} {"train_loss": -6.5542402267456055, "global_step": 131647, "epoch": 3134} {"train_loss": -6.572719573974609, "global_step": 131648, "epoch": 3134} {"train_loss": -6.603148460388184, "global_step": 131649, "epoch": 3134} {"train_loss": -6.589750289916992, "global_step": 131650, "epoch": 3134} {"train_loss": -6.6361985206604, "global_step": 131651, "epoch": 3134} {"train_loss": -6.637998104095459, "global_step": 131652, "epoch": 3134} {"train_loss": -6.584761142730713, "global_step": 131653, "epoch": 3134} {"train_loss": -6.6388773918151855, "global_step": 131654, "epoch": 3134} {"train_loss": -6.59962272644043, "global_step": 131655, "epoch": 3134} {"train_loss": -6.66087532043457, "global_step": 131656, "epoch": 3134} {"train_loss": -6.635483741760254, "global_step": 131657, "epoch": 3134} {"train_loss": -6.631041526794434, "global_step": 131658, "epoch": 3134} {"train_loss": -6.621819019317627, "global_step": 131659, "epoch": 3134} {"train_loss": -6.616504669189453, "global_step": 131660, "epoch": 3134} {"train_loss": -6.674531936645508, "global_step": 131661, "epoch": 3134} {"train_loss": -6.634535312652588, "global_step": 131662, "epoch": 3134} {"train_loss": -6.417139053344727, "global_step": 131663, "epoch": 3134} {"train_loss": -6.648950576782227, "global_step": 131664, "epoch": 3134} {"train_loss": -6.564723491668701, "global_step": 131665, "epoch": 3134} {"train_loss": -6.655714988708496, "global_step": 131666, "epoch": 3134} {"train_loss": -6.607257843017578, "global_step": 131667, "epoch": 3134} {"train_loss": -6.55275821685791, "global_step": 131668, "epoch": 3134} {"train_loss": -6.630187477384295, "global_step": 131669, "epoch": 3134, "val_loss": 68223.171875} {"train_loss": -6.777182579040527, "global_step": 131670, "epoch": 3135} {"train_loss": -6.693878650665283, "global_step": 131671, "epoch": 3135} {"train_loss": -6.671536445617676, "global_step": 131672, "epoch": 3135} {"train_loss": -6.6936492919921875, "global_step": 131673, "epoch": 3135} {"train_loss": -6.599886894226074, "global_step": 131674, "epoch": 3135} {"train_loss": -6.702017784118652, "global_step": 131675, "epoch": 3135} {"train_loss": -6.593106269836426, "global_step": 131676, "epoch": 3135} {"train_loss": -6.619728088378906, "global_step": 131677, "epoch": 3135} {"train_loss": -6.726217269897461, "global_step": 131678, "epoch": 3135} {"train_loss": -6.654499053955078, "global_step": 131679, "epoch": 3135} {"train_loss": -6.613912105560303, "global_step": 131680, "epoch": 3135} {"train_loss": -6.630712985992432, "global_step": 131681, "epoch": 3135} {"train_loss": -6.66929817199707, "global_step": 131682, "epoch": 3135} {"train_loss": -6.628006458282471, "global_step": 131683, "epoch": 3135} {"train_loss": -6.674829959869385, "global_step": 131684, "epoch": 3135} {"train_loss": -6.604465484619141, "global_step": 131685, "epoch": 3135} {"train_loss": -6.619823455810547, "global_step": 131686, "epoch": 3135} {"train_loss": -6.68831729888916, "global_step": 131687, "epoch": 3135} {"train_loss": -6.648392677307129, "global_step": 131688, "epoch": 3135} {"train_loss": -6.689664363861084, "global_step": 131689, "epoch": 3135} {"train_loss": -6.557056427001953, "global_step": 131690, "epoch": 3135} {"train_loss": -6.614062309265137, "global_step": 131691, "epoch": 3135} {"train_loss": -6.695553779602051, "global_step": 131692, "epoch": 3135} {"train_loss": -6.707148551940918, "global_step": 131693, "epoch": 3135} {"train_loss": -6.647017955780029, "global_step": 131694, "epoch": 3135} {"train_loss": -6.683180809020996, "global_step": 131695, "epoch": 3135} {"train_loss": -6.67763614654541, "global_step": 131696, "epoch": 3135} {"train_loss": -6.707719802856445, "global_step": 131697, "epoch": 3135} {"train_loss": -6.61968469619751, "global_step": 131698, "epoch": 3135} {"train_loss": -6.716493129730225, "global_step": 131699, "epoch": 3135} {"train_loss": -6.616039276123047, "global_step": 131700, "epoch": 3135} {"train_loss": -6.596147060394287, "global_step": 131701, "epoch": 3135} {"train_loss": -6.629945278167725, "global_step": 131702, "epoch": 3135} {"train_loss": -6.729098320007324, "global_step": 131703, "epoch": 3135} {"train_loss": -6.710841178894043, "global_step": 131704, "epoch": 3135} {"train_loss": -6.567441940307617, "global_step": 131705, "epoch": 3135} {"train_loss": -6.714735984802246, "global_step": 131706, "epoch": 3135} {"train_loss": -6.6022748947143555, "global_step": 131707, "epoch": 3135} {"train_loss": -6.521205425262451, "global_step": 131708, "epoch": 3135} {"train_loss": -6.548108100891113, "global_step": 131709, "epoch": 3135} {"train_loss": -6.587089538574219, "global_step": 131710, "epoch": 3135} {"train_loss": -6.649197464897519, "global_step": 131711, "epoch": 3135, "val_loss": 68075.015625} {"train_loss": -6.72452449798584, "global_step": 131712, "epoch": 3136} {"train_loss": -6.596466541290283, "global_step": 131713, "epoch": 3136} {"train_loss": -6.631318092346191, "global_step": 131714, "epoch": 3136} {"train_loss": -6.628133296966553, "global_step": 131715, "epoch": 3136} {"train_loss": -6.648465156555176, "global_step": 131716, "epoch": 3136} {"train_loss": -6.640870094299316, "global_step": 131717, "epoch": 3136} {"train_loss": -6.509762763977051, "global_step": 131718, "epoch": 3136} {"train_loss": -6.643476486206055, "global_step": 131719, "epoch": 3136} {"train_loss": -6.606456756591797, "global_step": 131720, "epoch": 3136} {"train_loss": -6.741079330444336, "global_step": 131721, "epoch": 3136} {"train_loss": -6.706775665283203, "global_step": 131722, "epoch": 3136} {"train_loss": -6.596766471862793, "global_step": 131723, "epoch": 3136} {"train_loss": -6.579603672027588, "global_step": 131724, "epoch": 3136} {"train_loss": -6.609584808349609, "global_step": 131725, "epoch": 3136} {"train_loss": -6.676698684692383, "global_step": 131726, "epoch": 3136} {"train_loss": -6.679430961608887, "global_step": 131727, "epoch": 3136} {"train_loss": -6.679928779602051, "global_step": 131728, "epoch": 3136} {"train_loss": -6.648608207702637, "global_step": 131729, "epoch": 3136} {"train_loss": -6.752049446105957, "global_step": 131730, "epoch": 3136} {"train_loss": -6.576540946960449, "global_step": 131731, "epoch": 3136} {"train_loss": -6.657167434692383, "global_step": 131732, "epoch": 3136} {"train_loss": -6.72251033782959, "global_step": 131733, "epoch": 3136} {"train_loss": -6.637637138366699, "global_step": 131734, "epoch": 3136} {"train_loss": -6.712128162384033, "global_step": 131735, "epoch": 3136} {"train_loss": -6.65470552444458, "global_step": 131736, "epoch": 3136} {"train_loss": -6.644871711730957, "global_step": 131737, "epoch": 3136} {"train_loss": -6.672194004058838, "global_step": 131738, "epoch": 3136} {"train_loss": -6.702632904052734, "global_step": 131739, "epoch": 3136} {"train_loss": -6.581912040710449, "global_step": 131740, "epoch": 3136} {"train_loss": -6.734601974487305, "global_step": 131741, "epoch": 3136} {"train_loss": -6.715489387512207, "global_step": 131742, "epoch": 3136} {"train_loss": -6.588656425476074, "global_step": 131743, "epoch": 3136} {"train_loss": -6.661428928375244, "global_step": 131744, "epoch": 3136} {"train_loss": -6.744640350341797, "global_step": 131745, "epoch": 3136} {"train_loss": -6.5849833488464355, "global_step": 131746, "epoch": 3136} {"train_loss": -6.575933933258057, "global_step": 131747, "epoch": 3136} {"train_loss": -6.60628604888916, "global_step": 131748, "epoch": 3136} {"train_loss": -6.660552024841309, "global_step": 131749, "epoch": 3136} {"train_loss": -6.642133712768555, "global_step": 131750, "epoch": 3136} {"train_loss": -6.76875114440918, "global_step": 131751, "epoch": 3136} {"train_loss": -6.692539215087891, "global_step": 131752, "epoch": 3136} {"train_loss": -6.655346756889706, "global_step": 131753, "epoch": 3136, "val_loss": 68218.796875} {"train_loss": -6.650501251220703, "global_step": 131754, "epoch": 3137} {"train_loss": -6.677407264709473, "global_step": 131755, "epoch": 3137} {"train_loss": -6.7131195068359375, "global_step": 131756, "epoch": 3137} {"train_loss": -6.716022491455078, "global_step": 131757, "epoch": 3137} {"train_loss": -6.609920024871826, "global_step": 131758, "epoch": 3137} {"train_loss": -6.656201362609863, "global_step": 131759, "epoch": 3137} {"train_loss": -6.647733211517334, "global_step": 131760, "epoch": 3137} {"train_loss": -6.574576377868652, "global_step": 131761, "epoch": 3137} {"train_loss": -6.655281066894531, "global_step": 131762, "epoch": 3137} {"train_loss": -6.632464408874512, "global_step": 131763, "epoch": 3137} {"train_loss": -6.640161991119385, "global_step": 131764, "epoch": 3137} {"train_loss": -6.748779773712158, "global_step": 131765, "epoch": 3137} {"train_loss": -6.689639091491699, "global_step": 131766, "epoch": 3137} {"train_loss": -6.4841532707214355, "global_step": 131767, "epoch": 3137} {"train_loss": -6.679072380065918, "global_step": 131768, "epoch": 3137} {"train_loss": -6.614222526550293, "global_step": 131769, "epoch": 3137} {"train_loss": -6.645509719848633, "global_step": 131770, "epoch": 3137} {"train_loss": -6.534642696380615, "global_step": 131771, "epoch": 3137} {"train_loss": -6.600795269012451, "global_step": 131772, "epoch": 3137} {"train_loss": -6.675633430480957, "global_step": 131773, "epoch": 3137} {"train_loss": -6.626578330993652, "global_step": 131774, "epoch": 3137} {"train_loss": -6.661774158477783, "global_step": 131775, "epoch": 3137} {"train_loss": -6.709835052490234, "global_step": 131776, "epoch": 3137} {"train_loss": -6.478184700012207, "global_step": 131777, "epoch": 3137} {"train_loss": -6.60615348815918, "global_step": 131778, "epoch": 3137} {"train_loss": -6.577751159667969, "global_step": 131779, "epoch": 3137} {"train_loss": -6.686071395874023, "global_step": 131780, "epoch": 3137} {"train_loss": -6.676678657531738, "global_step": 131781, "epoch": 3137} {"train_loss": -6.567776679992676, "global_step": 131782, "epoch": 3137} {"train_loss": -6.733924865722656, "global_step": 131783, "epoch": 3137} {"train_loss": -6.470204830169678, "global_step": 131784, "epoch": 3137} {"train_loss": -6.642340183258057, "global_step": 131785, "epoch": 3137} {"train_loss": -6.647046089172363, "global_step": 131786, "epoch": 3137} {"train_loss": -6.606971263885498, "global_step": 131787, "epoch": 3137} {"train_loss": -6.506982326507568, "global_step": 131788, "epoch": 3137} {"train_loss": -6.586469650268555, "global_step": 131789, "epoch": 3137} {"train_loss": -6.71682071685791, "global_step": 131790, "epoch": 3137} {"train_loss": -6.491429328918457, "global_step": 131791, "epoch": 3137} {"train_loss": -6.548091888427734, "global_step": 131792, "epoch": 3137} {"train_loss": -6.681801795959473, "global_step": 131793, "epoch": 3137} {"train_loss": -6.627373218536377, "global_step": 131794, "epoch": 3137} {"train_loss": -6.626921585627964, "global_step": 131795, "epoch": 3137, "val_loss": 68062.671875} {"train_loss": -6.584787845611572, "global_step": 131796, "epoch": 3138} {"train_loss": -6.647754669189453, "global_step": 131797, "epoch": 3138} {"train_loss": -6.683802604675293, "global_step": 131798, "epoch": 3138} {"train_loss": -6.692364692687988, "global_step": 131799, "epoch": 3138} {"train_loss": -6.626317024230957, "global_step": 131800, "epoch": 3138} {"train_loss": -6.589676856994629, "global_step": 131801, "epoch": 3138} {"train_loss": -6.571067810058594, "global_step": 131802, "epoch": 3138} {"train_loss": -6.500756740570068, "global_step": 131803, "epoch": 3138} {"train_loss": -6.596797943115234, "global_step": 131804, "epoch": 3138} {"train_loss": -6.599639415740967, "global_step": 131805, "epoch": 3138} {"train_loss": -6.564867973327637, "global_step": 131806, "epoch": 3138} {"train_loss": -6.590376853942871, "global_step": 131807, "epoch": 3138} {"train_loss": -6.64413595199585, "global_step": 131808, "epoch": 3138} {"train_loss": -6.621254920959473, "global_step": 131809, "epoch": 3138} {"train_loss": -6.682295799255371, "global_step": 131810, "epoch": 3138} {"train_loss": -6.548709869384766, "global_step": 131811, "epoch": 3138} {"train_loss": -6.649327278137207, "global_step": 131812, "epoch": 3138} {"train_loss": -6.534825325012207, "global_step": 131813, "epoch": 3138} {"train_loss": -6.5544657707214355, "global_step": 131814, "epoch": 3138} {"train_loss": -6.658666610717773, "global_step": 131815, "epoch": 3138} {"train_loss": -6.627978801727295, "global_step": 131816, "epoch": 3138} {"train_loss": -6.678727626800537, "global_step": 131817, "epoch": 3138} {"train_loss": -6.777199745178223, "global_step": 131818, "epoch": 3138} {"train_loss": -6.546489715576172, "global_step": 131819, "epoch": 3138} {"train_loss": -6.647894859313965, "global_step": 131820, "epoch": 3138} {"train_loss": -6.61519718170166, "global_step": 131821, "epoch": 3138} {"train_loss": -6.6419572830200195, "global_step": 131822, "epoch": 3138} {"train_loss": -6.807744979858398, "global_step": 131823, "epoch": 3138} {"train_loss": -6.685643196105957, "global_step": 131824, "epoch": 3138} {"train_loss": -6.587754726409912, "global_step": 131825, "epoch": 3138} {"train_loss": -6.616758346557617, "global_step": 131826, "epoch": 3138} {"train_loss": -6.72662353515625, "global_step": 131827, "epoch": 3138} {"train_loss": -6.658387184143066, "global_step": 131828, "epoch": 3138} {"train_loss": -6.68447208404541, "global_step": 131829, "epoch": 3138} {"train_loss": -6.6662678718566895, "global_step": 131830, "epoch": 3138} {"train_loss": -6.76698112487793, "global_step": 131831, "epoch": 3138} {"train_loss": -6.5508832931518555, "global_step": 131832, "epoch": 3138} {"train_loss": -6.645397186279297, "global_step": 131833, "epoch": 3138} {"train_loss": -6.612094879150391, "global_step": 131834, "epoch": 3138} {"train_loss": -6.555297374725342, "global_step": 131835, "epoch": 3138} {"train_loss": -6.6759443283081055, "global_step": 131836, "epoch": 3138} {"train_loss": -6.629989782969157, "global_step": 131837, "epoch": 3138, "val_loss": 68387.6875} {"train_loss": -6.515230178833008, "global_step": 131838, "epoch": 3139} {"train_loss": -6.742897033691406, "global_step": 131839, "epoch": 3139} {"train_loss": -6.541478157043457, "global_step": 131840, "epoch": 3139} {"train_loss": -6.6446638107299805, "global_step": 131841, "epoch": 3139} {"train_loss": -6.581995964050293, "global_step": 131842, "epoch": 3139} {"train_loss": -6.588104724884033, "global_step": 131843, "epoch": 3139} {"train_loss": -6.633724212646484, "global_step": 131844, "epoch": 3139} {"train_loss": -6.482994079589844, "global_step": 131845, "epoch": 3139} {"train_loss": -6.49818754196167, "global_step": 131846, "epoch": 3139} {"train_loss": -6.656972408294678, "global_step": 131847, "epoch": 3139} {"train_loss": -6.510540962219238, "global_step": 131848, "epoch": 3139} {"train_loss": -6.544468879699707, "global_step": 131849, "epoch": 3139} {"train_loss": -6.643092155456543, "global_step": 131850, "epoch": 3139} {"train_loss": -6.492768287658691, "global_step": 131851, "epoch": 3139} {"train_loss": -6.523464202880859, "global_step": 131852, "epoch": 3139} {"train_loss": -6.465503692626953, "global_step": 131853, "epoch": 3139} {"train_loss": -6.462207794189453, "global_step": 131854, "epoch": 3139} {"train_loss": -6.512044429779053, "global_step": 131855, "epoch": 3139} {"train_loss": -6.540703773498535, "global_step": 131856, "epoch": 3139} {"train_loss": -6.6013712882995605, "global_step": 131857, "epoch": 3139} {"train_loss": -6.756396293640137, "global_step": 131858, "epoch": 3139} {"train_loss": -6.5627593994140625, "global_step": 131859, "epoch": 3139} {"train_loss": -6.575589179992676, "global_step": 131860, "epoch": 3139} {"train_loss": -6.549125671386719, "global_step": 131861, "epoch": 3139} {"train_loss": -6.525531768798828, "global_step": 131862, "epoch": 3139} {"train_loss": -6.613575458526611, "global_step": 131863, "epoch": 3139} {"train_loss": -6.674347400665283, "global_step": 131864, "epoch": 3139} {"train_loss": -6.675471782684326, "global_step": 131865, "epoch": 3139} {"train_loss": -6.655747890472412, "global_step": 131866, "epoch": 3139} {"train_loss": -6.641862869262695, "global_step": 131867, "epoch": 3139} {"train_loss": -6.694027900695801, "global_step": 131868, "epoch": 3139} {"train_loss": -6.64776611328125, "global_step": 131869, "epoch": 3139} {"train_loss": -6.595242500305176, "global_step": 131870, "epoch": 3139} {"train_loss": -6.548117637634277, "global_step": 131871, "epoch": 3139} {"train_loss": -6.710709571838379, "global_step": 131872, "epoch": 3139} {"train_loss": -6.756561279296875, "global_step": 131873, "epoch": 3139} {"train_loss": -6.663474082946777, "global_step": 131874, "epoch": 3139} {"train_loss": -6.610775947570801, "global_step": 131875, "epoch": 3139} {"train_loss": -6.712080955505371, "global_step": 131876, "epoch": 3139} {"train_loss": -6.770227432250977, "global_step": 131877, "epoch": 3139} {"train_loss": -6.691805839538574, "global_step": 131878, "epoch": 3139} {"train_loss": -6.6080383119129, "global_step": 131879, "epoch": 3139, "val_loss": 68127.8984375} {"train_loss": -6.69428825378418, "global_step": 131880, "epoch": 3140} {"train_loss": -6.6743574142456055, "global_step": 131881, "epoch": 3140} {"train_loss": -6.741237640380859, "global_step": 131882, "epoch": 3140} {"train_loss": -6.567732810974121, "global_step": 131883, "epoch": 3140} {"train_loss": -6.676441669464111, "global_step": 131884, "epoch": 3140} {"train_loss": -6.684443473815918, "global_step": 131885, "epoch": 3140} {"train_loss": -6.6320271492004395, "global_step": 131886, "epoch": 3140} {"train_loss": -6.743220329284668, "global_step": 131887, "epoch": 3140} {"train_loss": -6.762526512145996, "global_step": 131888, "epoch": 3140} {"train_loss": -6.632162570953369, "global_step": 131889, "epoch": 3140} {"train_loss": -6.638463973999023, "global_step": 131890, "epoch": 3140} {"train_loss": -6.646993637084961, "global_step": 131891, "epoch": 3140} {"train_loss": -6.653348922729492, "global_step": 131892, "epoch": 3140} {"train_loss": -6.671586513519287, "global_step": 131893, "epoch": 3140} {"train_loss": -6.587584495544434, "global_step": 131894, "epoch": 3140} {"train_loss": -6.6692633628845215, "global_step": 131895, "epoch": 3140} {"train_loss": -6.563653469085693, "global_step": 131896, "epoch": 3140} {"train_loss": -6.656002998352051, "global_step": 131897, "epoch": 3140} {"train_loss": -6.698759078979492, "global_step": 131898, "epoch": 3140} {"train_loss": -6.811357498168945, "global_step": 131899, "epoch": 3140} {"train_loss": -6.796030521392822, "global_step": 131900, "epoch": 3140} {"train_loss": -6.688222885131836, "global_step": 131901, "epoch": 3140} {"train_loss": -6.673770904541016, "global_step": 131902, "epoch": 3140} {"train_loss": -6.61768913269043, "global_step": 131903, "epoch": 3140} {"train_loss": -6.643461227416992, "global_step": 131904, "epoch": 3140} {"train_loss": -6.783604145050049, "global_step": 131905, "epoch": 3140} {"train_loss": -6.5902509689331055, "global_step": 131906, "epoch": 3140} {"train_loss": -6.674154758453369, "global_step": 131907, "epoch": 3140} {"train_loss": -6.606073379516602, "global_step": 131908, "epoch": 3140} {"train_loss": -6.620240688323975, "global_step": 131909, "epoch": 3140} {"train_loss": -6.687904357910156, "global_step": 131910, "epoch": 3140} {"train_loss": -6.690560817718506, "global_step": 131911, "epoch": 3140} {"train_loss": -6.660525321960449, "global_step": 131912, "epoch": 3140} {"train_loss": -6.747183799743652, "global_step": 131913, "epoch": 3140} {"train_loss": -6.779336929321289, "global_step": 131914, "epoch": 3140} {"train_loss": -6.641642093658447, "global_step": 131915, "epoch": 3140} {"train_loss": -6.652676582336426, "global_step": 131916, "epoch": 3140} {"train_loss": -6.5392608642578125, "global_step": 131917, "epoch": 3140} {"train_loss": -6.550329685211182, "global_step": 131918, "epoch": 3140} {"train_loss": -6.5827813148498535, "global_step": 131919, "epoch": 3140} {"train_loss": -6.492762565612793, "global_step": 131920, "epoch": 3140} {"train_loss": -6.658510571434384, "global_step": 131921, "epoch": 3140, "val_loss": 68165.84375} {"train_loss": -6.613767623901367, "global_step": 131922, "epoch": 3141} {"train_loss": -6.464393615722656, "global_step": 131923, "epoch": 3141} {"train_loss": -6.476974010467529, "global_step": 131924, "epoch": 3141} {"train_loss": -6.549617767333984, "global_step": 131925, "epoch": 3141} {"train_loss": -6.594440937042236, "global_step": 131926, "epoch": 3141} {"train_loss": -6.635500431060791, "global_step": 131927, "epoch": 3141} {"train_loss": -6.44549560546875, "global_step": 131928, "epoch": 3141} {"train_loss": -6.735057353973389, "global_step": 131929, "epoch": 3141} {"train_loss": -6.640191078186035, "global_step": 131930, "epoch": 3141} {"train_loss": -6.788374900817871, "global_step": 131931, "epoch": 3141} {"train_loss": -6.570888519287109, "global_step": 131932, "epoch": 3141} {"train_loss": -6.60556697845459, "global_step": 131933, "epoch": 3141} {"train_loss": -6.592441082000732, "global_step": 131934, "epoch": 3141} {"train_loss": -6.576517105102539, "global_step": 131935, "epoch": 3141} {"train_loss": -6.635260581970215, "global_step": 131936, "epoch": 3141} {"train_loss": -6.680729866027832, "global_step": 131937, "epoch": 3141} {"train_loss": -6.607234954833984, "global_step": 131938, "epoch": 3141} {"train_loss": -6.576930046081543, "global_step": 131939, "epoch": 3141} {"train_loss": -6.741457462310791, "global_step": 131940, "epoch": 3141} {"train_loss": -6.713250160217285, "global_step": 131941, "epoch": 3141} {"train_loss": -6.699272632598877, "global_step": 131942, "epoch": 3141} {"train_loss": -6.612748146057129, "global_step": 131943, "epoch": 3141} {"train_loss": -6.620790958404541, "global_step": 131944, "epoch": 3141} {"train_loss": -6.541280746459961, "global_step": 131945, "epoch": 3141} {"train_loss": -6.739734649658203, "global_step": 131946, "epoch": 3141} {"train_loss": -6.624464988708496, "global_step": 131947, "epoch": 3141} {"train_loss": -6.577648162841797, "global_step": 131948, "epoch": 3141} {"train_loss": -6.640753269195557, "global_step": 131949, "epoch": 3141} {"train_loss": -6.547205924987793, "global_step": 131950, "epoch": 3141} {"train_loss": -6.505425930023193, "global_step": 131951, "epoch": 3141} {"train_loss": -6.548524856567383, "global_step": 131952, "epoch": 3141} {"train_loss": -6.4821929931640625, "global_step": 131953, "epoch": 3141} {"train_loss": -6.710320949554443, "global_step": 131954, "epoch": 3141} {"train_loss": -6.465291500091553, "global_step": 131955, "epoch": 3141} {"train_loss": -6.401409149169922, "global_step": 131956, "epoch": 3141} {"train_loss": -6.548519134521484, "global_step": 131957, "epoch": 3141} {"train_loss": -6.531827926635742, "global_step": 131958, "epoch": 3141} {"train_loss": -6.6746110916137695, "global_step": 131959, "epoch": 3141} {"train_loss": -6.389832019805908, "global_step": 131960, "epoch": 3141} {"train_loss": -6.640726089477539, "global_step": 131961, "epoch": 3141} {"train_loss": -6.595968723297119, "global_step": 131962, "epoch": 3141} {"train_loss": -6.593135141191029, "global_step": 131963, "epoch": 3141, "val_loss": 68258.9140625} {"train_loss": -6.547422885894775, "global_step": 131964, "epoch": 3142} {"train_loss": -6.725310325622559, "global_step": 131965, "epoch": 3142} {"train_loss": -6.619943141937256, "global_step": 131966, "epoch": 3142} {"train_loss": -6.56514310836792, "global_step": 131967, "epoch": 3142} {"train_loss": -6.495107650756836, "global_step": 131968, "epoch": 3142} {"train_loss": -6.586241245269775, "global_step": 131969, "epoch": 3142} {"train_loss": -6.607518196105957, "global_step": 131970, "epoch": 3142} {"train_loss": -6.610381126403809, "global_step": 131971, "epoch": 3142} {"train_loss": -6.750564098358154, "global_step": 131972, "epoch": 3142} {"train_loss": -6.590939521789551, "global_step": 131973, "epoch": 3142} {"train_loss": -6.636091232299805, "global_step": 131974, "epoch": 3142} {"train_loss": -6.68265962600708, "global_step": 131975, "epoch": 3142} {"train_loss": -6.696206092834473, "global_step": 131976, "epoch": 3142} {"train_loss": -6.649019718170166, "global_step": 131977, "epoch": 3142} {"train_loss": -6.60073184967041, "global_step": 131978, "epoch": 3142} {"train_loss": -6.627774238586426, "global_step": 131979, "epoch": 3142} {"train_loss": -6.56710958480835, "global_step": 131980, "epoch": 3142} {"train_loss": -6.6538286209106445, "global_step": 131981, "epoch": 3142} {"train_loss": -6.718410491943359, "global_step": 131982, "epoch": 3142} {"train_loss": -6.6320037841796875, "global_step": 131983, "epoch": 3142} {"train_loss": -6.58583927154541, "global_step": 131984, "epoch": 3142} {"train_loss": -6.652717590332031, "global_step": 131985, "epoch": 3142} {"train_loss": -6.614526748657227, "global_step": 131986, "epoch": 3142} {"train_loss": -6.528323173522949, "global_step": 131987, "epoch": 3142} {"train_loss": -6.696948528289795, "global_step": 131988, "epoch": 3142} {"train_loss": -6.741926670074463, "global_step": 131989, "epoch": 3142} {"train_loss": -6.725234031677246, "global_step": 131990, "epoch": 3142} {"train_loss": -6.620974063873291, "global_step": 131991, "epoch": 3142} {"train_loss": -6.734269142150879, "global_step": 131992, "epoch": 3142} {"train_loss": -6.691150188446045, "global_step": 131993, "epoch": 3142} {"train_loss": -6.776220798492432, "global_step": 131994, "epoch": 3142} {"train_loss": -6.597805023193359, "global_step": 131995, "epoch": 3142} {"train_loss": -6.6586103439331055, "global_step": 131996, "epoch": 3142} {"train_loss": -6.660404205322266, "global_step": 131997, "epoch": 3142} {"train_loss": -6.5270280838012695, "global_step": 131998, "epoch": 3142} {"train_loss": -6.7015380859375, "global_step": 131999, "epoch": 3142} {"train_loss": -6.561417102813721, "global_step": 132000, "epoch": 3142} {"train_loss": -6.662528038024902, "global_step": 132001, "epoch": 3142} {"train_loss": -6.614134311676025, "global_step": 132002, "epoch": 3142} {"train_loss": -6.718414306640625, "global_step": 132003, "epoch": 3142} {"train_loss": -6.709115982055664, "global_step": 132004, "epoch": 3142} {"train_loss": -6.642123267764137, "global_step": 132005, "epoch": 3142, "val_loss": 68245.359375} {"train_loss": -6.561239719390869, "global_step": 132006, "epoch": 3143} {"train_loss": -6.611783981323242, "global_step": 132007, "epoch": 3143} {"train_loss": -6.606780052185059, "global_step": 132008, "epoch": 3143} {"train_loss": -6.716098785400391, "global_step": 132009, "epoch": 3143} {"train_loss": -6.555737495422363, "global_step": 132010, "epoch": 3143} {"train_loss": -6.622593879699707, "global_step": 132011, "epoch": 3143} {"train_loss": -6.684812545776367, "global_step": 132012, "epoch": 3143} {"train_loss": -6.67244815826416, "global_step": 132013, "epoch": 3143} {"train_loss": -6.656692981719971, "global_step": 132014, "epoch": 3143} {"train_loss": -6.634335994720459, "global_step": 132015, "epoch": 3143} {"train_loss": -6.667977809906006, "global_step": 132016, "epoch": 3143} {"train_loss": -6.537493705749512, "global_step": 132017, "epoch": 3143} {"train_loss": -6.682153701782227, "global_step": 132018, "epoch": 3143} {"train_loss": -6.662992477416992, "global_step": 132019, "epoch": 3143} {"train_loss": -6.680133819580078, "global_step": 132020, "epoch": 3143} {"train_loss": -6.793336868286133, "global_step": 132021, "epoch": 3143} {"train_loss": -6.763821601867676, "global_step": 132022, "epoch": 3143} {"train_loss": -6.676076889038086, "global_step": 132023, "epoch": 3143} {"train_loss": -6.8121538162231445, "global_step": 132024, "epoch": 3143} {"train_loss": -6.614812850952148, "global_step": 132025, "epoch": 3143} {"train_loss": -6.718125343322754, "global_step": 132026, "epoch": 3143} {"train_loss": -6.731244087219238, "global_step": 132027, "epoch": 3143} {"train_loss": -6.674675941467285, "global_step": 132028, "epoch": 3143} {"train_loss": -6.535037994384766, "global_step": 132029, "epoch": 3143} {"train_loss": -6.766539573669434, "global_step": 132030, "epoch": 3143} {"train_loss": -6.51298713684082, "global_step": 132031, "epoch": 3143} {"train_loss": -6.545747756958008, "global_step": 132032, "epoch": 3143} {"train_loss": -6.690745830535889, "global_step": 132033, "epoch": 3143} {"train_loss": -6.7317705154418945, "global_step": 132034, "epoch": 3143} {"train_loss": -6.666655540466309, "global_step": 132035, "epoch": 3143} {"train_loss": -6.660141944885254, "global_step": 132036, "epoch": 3143} {"train_loss": -6.603775978088379, "global_step": 132037, "epoch": 3143} {"train_loss": -6.736425876617432, "global_step": 132038, "epoch": 3143} {"train_loss": -6.66154146194458, "global_step": 132039, "epoch": 3143} {"train_loss": -6.563725471496582, "global_step": 132040, "epoch": 3143} {"train_loss": -6.602267742156982, "global_step": 132041, "epoch": 3143} {"train_loss": -6.681535720825195, "global_step": 132042, "epoch": 3143} {"train_loss": -6.659365653991699, "global_step": 132043, "epoch": 3143} {"train_loss": -6.762690544128418, "global_step": 132044, "epoch": 3143} {"train_loss": -6.6670026779174805, "global_step": 132045, "epoch": 3143} {"train_loss": -6.705427169799805, "global_step": 132046, "epoch": 3143} {"train_loss": -6.6608482883090065, "global_step": 132047, "epoch": 3143, "val_loss": 68198.984375} {"train_loss": -6.753017902374268, "global_step": 132048, "epoch": 3144} {"train_loss": -6.649641036987305, "global_step": 132049, "epoch": 3144} {"train_loss": -6.681815147399902, "global_step": 132050, "epoch": 3144} {"train_loss": -6.545163631439209, "global_step": 132051, "epoch": 3144} {"train_loss": -6.738910675048828, "global_step": 132052, "epoch": 3144} {"train_loss": -6.772365093231201, "global_step": 132053, "epoch": 3144} {"train_loss": -6.752159595489502, "global_step": 132054, "epoch": 3144} {"train_loss": -6.594281196594238, "global_step": 132055, "epoch": 3144} {"train_loss": -6.615452289581299, "global_step": 132056, "epoch": 3144} {"train_loss": -6.6668853759765625, "global_step": 132057, "epoch": 3144} {"train_loss": -6.553799152374268, "global_step": 132058, "epoch": 3144} {"train_loss": -6.631888389587402, "global_step": 132059, "epoch": 3144} {"train_loss": -6.641942977905273, "global_step": 132060, "epoch": 3144} {"train_loss": -6.5268449783325195, "global_step": 132061, "epoch": 3144} {"train_loss": -6.626054763793945, "global_step": 132062, "epoch": 3144} {"train_loss": -6.483508110046387, "global_step": 132063, "epoch": 3144} {"train_loss": -6.486455917358398, "global_step": 132064, "epoch": 3144} {"train_loss": -6.528584957122803, "global_step": 132065, "epoch": 3144} {"train_loss": -6.518346786499023, "global_step": 132066, "epoch": 3144} {"train_loss": -6.6313042640686035, "global_step": 132067, "epoch": 3144} {"train_loss": -6.532072067260742, "global_step": 132068, "epoch": 3144} {"train_loss": -6.600614547729492, "global_step": 132069, "epoch": 3144} {"train_loss": -6.615556240081787, "global_step": 132070, "epoch": 3144} {"train_loss": -6.728240013122559, "global_step": 132071, "epoch": 3144} {"train_loss": -6.613398551940918, "global_step": 132072, "epoch": 3144} {"train_loss": -6.537168502807617, "global_step": 132073, "epoch": 3144} {"train_loss": -6.60727071762085, "global_step": 132074, "epoch": 3144} {"train_loss": -6.604297637939453, "global_step": 132075, "epoch": 3144} {"train_loss": -6.556732177734375, "global_step": 132076, "epoch": 3144} {"train_loss": -6.638314723968506, "global_step": 132077, "epoch": 3144} {"train_loss": -6.683423042297363, "global_step": 132078, "epoch": 3144} {"train_loss": -6.652151107788086, "global_step": 132079, "epoch": 3144} {"train_loss": -6.643335342407227, "global_step": 132080, "epoch": 3144} {"train_loss": -6.627447128295898, "global_step": 132081, "epoch": 3144} {"train_loss": -6.698117256164551, "global_step": 132082, "epoch": 3144} {"train_loss": -6.55374002456665, "global_step": 132083, "epoch": 3144} {"train_loss": -6.586865425109863, "global_step": 132084, "epoch": 3144} {"train_loss": -6.48789644241333, "global_step": 132085, "epoch": 3144} {"train_loss": -6.6453537940979, "global_step": 132086, "epoch": 3144} {"train_loss": -6.610682487487793, "global_step": 132087, "epoch": 3144} {"train_loss": -6.627165794372559, "global_step": 132088, "epoch": 3144} {"train_loss": -6.61859739394415, "global_step": 132089, "epoch": 3144, "val_loss": 68115.15625} {"train_loss": -6.60774040222168, "global_step": 132090, "epoch": 3145} {"train_loss": -6.660164833068848, "global_step": 132091, "epoch": 3145} {"train_loss": -6.707719326019287, "global_step": 132092, "epoch": 3145} {"train_loss": -6.677142143249512, "global_step": 132093, "epoch": 3145} {"train_loss": -6.5575408935546875, "global_step": 132094, "epoch": 3145} {"train_loss": -6.653181076049805, "global_step": 132095, "epoch": 3145} {"train_loss": -6.614847183227539, "global_step": 132096, "epoch": 3145} {"train_loss": -6.62912654876709, "global_step": 132097, "epoch": 3145} {"train_loss": -6.706943988800049, "global_step": 132098, "epoch": 3145} {"train_loss": -6.616075038909912, "global_step": 132099, "epoch": 3145} {"train_loss": -6.695399284362793, "global_step": 132100, "epoch": 3145} {"train_loss": -6.766592979431152, "global_step": 132101, "epoch": 3145} {"train_loss": -6.730813980102539, "global_step": 132102, "epoch": 3145} {"train_loss": -6.670064926147461, "global_step": 132103, "epoch": 3145} {"train_loss": -6.544282913208008, "global_step": 132104, "epoch": 3145} {"train_loss": -6.729781150817871, "global_step": 132105, "epoch": 3145} {"train_loss": -6.685917854309082, "global_step": 132106, "epoch": 3145} {"train_loss": -6.605218887329102, "global_step": 132107, "epoch": 3145} {"train_loss": -6.596282958984375, "global_step": 132108, "epoch": 3145} {"train_loss": -6.65006685256958, "global_step": 132109, "epoch": 3145} {"train_loss": -6.666402816772461, "global_step": 132110, "epoch": 3145} {"train_loss": -6.724652290344238, "global_step": 132111, "epoch": 3145} {"train_loss": -6.700512409210205, "global_step": 132112, "epoch": 3145} {"train_loss": -6.75216007232666, "global_step": 132113, "epoch": 3145} {"train_loss": -6.634130477905273, "global_step": 132114, "epoch": 3145} {"train_loss": -6.691653251647949, "global_step": 132115, "epoch": 3145} {"train_loss": -6.644329071044922, "global_step": 132116, "epoch": 3145} {"train_loss": -6.657206058502197, "global_step": 132117, "epoch": 3145} {"train_loss": -6.640776634216309, "global_step": 132118, "epoch": 3145} {"train_loss": -6.635990142822266, "global_step": 132119, "epoch": 3145} {"train_loss": -6.594933032989502, "global_step": 132120, "epoch": 3145} {"train_loss": -6.696000099182129, "global_step": 132121, "epoch": 3145} {"train_loss": -6.5934157371521, "global_step": 132122, "epoch": 3145} {"train_loss": -6.711548328399658, "global_step": 132123, "epoch": 3145} {"train_loss": -6.562995910644531, "global_step": 132124, "epoch": 3145} {"train_loss": -6.681706428527832, "global_step": 132125, "epoch": 3145} {"train_loss": -6.602382659912109, "global_step": 132126, "epoch": 3145} {"train_loss": -6.771529674530029, "global_step": 132127, "epoch": 3145} {"train_loss": -6.646034240722656, "global_step": 132128, "epoch": 3145} {"train_loss": -6.66681432723999, "global_step": 132129, "epoch": 3145} {"train_loss": -6.558231830596924, "global_step": 132130, "epoch": 3145} {"train_loss": -6.656948112306141, "global_step": 132131, "epoch": 3145, "val_loss": 68288.3984375} {"train_loss": -6.540574073791504, "global_step": 132132, "epoch": 3146} {"train_loss": -6.618723392486572, "global_step": 132133, "epoch": 3146} {"train_loss": -6.776175498962402, "global_step": 132134, "epoch": 3146} {"train_loss": -6.605998992919922, "global_step": 132135, "epoch": 3146} {"train_loss": -6.710353851318359, "global_step": 132136, "epoch": 3146} {"train_loss": -6.552999973297119, "global_step": 132137, "epoch": 3146} {"train_loss": -6.680844783782959, "global_step": 132138, "epoch": 3146} {"train_loss": -6.710663795471191, "global_step": 132139, "epoch": 3146} {"train_loss": -6.606196403503418, "global_step": 132140, "epoch": 3146} {"train_loss": -6.558518409729004, "global_step": 132141, "epoch": 3146} {"train_loss": -6.672906875610352, "global_step": 132142, "epoch": 3146} {"train_loss": -6.6984663009643555, "global_step": 132143, "epoch": 3146} {"train_loss": -6.68953275680542, "global_step": 132144, "epoch": 3146} {"train_loss": -6.688774108886719, "global_step": 132145, "epoch": 3146} {"train_loss": -6.578969955444336, "global_step": 132146, "epoch": 3146} {"train_loss": -6.722138404846191, "global_step": 132147, "epoch": 3146} {"train_loss": -6.829052448272705, "global_step": 132148, "epoch": 3146} {"train_loss": -6.629280090332031, "global_step": 132149, "epoch": 3146} {"train_loss": -6.711739540100098, "global_step": 132150, "epoch": 3146} {"train_loss": -6.677738189697266, "global_step": 132151, "epoch": 3146} {"train_loss": -6.705263137817383, "global_step": 132152, "epoch": 3146} {"train_loss": -6.717217922210693, "global_step": 132153, "epoch": 3146} {"train_loss": -6.6517839431762695, "global_step": 132154, "epoch": 3146} {"train_loss": -6.675518989562988, "global_step": 132155, "epoch": 3146} {"train_loss": -6.673285484313965, "global_step": 132156, "epoch": 3146} {"train_loss": -6.618801116943359, "global_step": 132157, "epoch": 3146} {"train_loss": -6.677606582641602, "global_step": 132158, "epoch": 3146} {"train_loss": -6.653182029724121, "global_step": 132159, "epoch": 3146} {"train_loss": -6.650866508483887, "global_step": 132160, "epoch": 3146} {"train_loss": -6.641612529754639, "global_step": 132161, "epoch": 3146} {"train_loss": -6.6109724044799805, "global_step": 132162, "epoch": 3146} {"train_loss": -6.650069236755371, "global_step": 132163, "epoch": 3146} {"train_loss": -6.50820255279541, "global_step": 132164, "epoch": 3146} {"train_loss": -6.62713098526001, "global_step": 132165, "epoch": 3146} {"train_loss": -6.5986433029174805, "global_step": 132166, "epoch": 3146} {"train_loss": -6.623590469360352, "global_step": 132167, "epoch": 3146} {"train_loss": -6.63046407699585, "global_step": 132168, "epoch": 3146} {"train_loss": -6.643575668334961, "global_step": 132169, "epoch": 3146} {"train_loss": -6.598361968994141, "global_step": 132170, "epoch": 3146} {"train_loss": -6.616986274719238, "global_step": 132171, "epoch": 3146} {"train_loss": -6.689409255981445, "global_step": 132172, "epoch": 3146} {"train_loss": -6.650083076386225, "global_step": 132173, "epoch": 3146, "val_loss": 68153.09375} {"train_loss": -6.628241539001465, "global_step": 132174, "epoch": 3147} {"train_loss": -6.682316780090332, "global_step": 132175, "epoch": 3147} {"train_loss": -6.559817790985107, "global_step": 132176, "epoch": 3147} {"train_loss": -6.746221542358398, "global_step": 132177, "epoch": 3147} {"train_loss": -6.650867938995361, "global_step": 132178, "epoch": 3147} {"train_loss": -6.623734474182129, "global_step": 132179, "epoch": 3147} {"train_loss": -6.574672698974609, "global_step": 132180, "epoch": 3147} {"train_loss": -6.744605541229248, "global_step": 132181, "epoch": 3147} {"train_loss": -6.5062255859375, "global_step": 132182, "epoch": 3147} {"train_loss": -6.678271293640137, "global_step": 132183, "epoch": 3147} {"train_loss": -6.491475582122803, "global_step": 132184, "epoch": 3147} {"train_loss": -6.720890045166016, "global_step": 132185, "epoch": 3147} {"train_loss": -6.516933441162109, "global_step": 132186, "epoch": 3147} {"train_loss": -6.68087100982666, "global_step": 132187, "epoch": 3147} {"train_loss": -6.640819549560547, "global_step": 132188, "epoch": 3147} {"train_loss": -6.718077182769775, "global_step": 132189, "epoch": 3147} {"train_loss": -6.587769031524658, "global_step": 132190, "epoch": 3147} {"train_loss": -6.626063823699951, "global_step": 132191, "epoch": 3147} {"train_loss": -6.561418533325195, "global_step": 132192, "epoch": 3147} {"train_loss": -6.662107944488525, "global_step": 132193, "epoch": 3147} {"train_loss": -6.608346939086914, "global_step": 132194, "epoch": 3147} {"train_loss": -6.7131547927856445, "global_step": 132195, "epoch": 3147} {"train_loss": -6.56226110458374, "global_step": 132196, "epoch": 3147} {"train_loss": -6.638247966766357, "global_step": 132197, "epoch": 3147} {"train_loss": -6.655246734619141, "global_step": 132198, "epoch": 3147} {"train_loss": -6.46612548828125, "global_step": 132199, "epoch": 3147} {"train_loss": -6.6269426345825195, "global_step": 132200, "epoch": 3147} {"train_loss": -6.690546989440918, "global_step": 132201, "epoch": 3147} {"train_loss": -6.605659484863281, "global_step": 132202, "epoch": 3147} {"train_loss": -6.594611167907715, "global_step": 132203, "epoch": 3147} {"train_loss": -6.605198383331299, "global_step": 132204, "epoch": 3147} {"train_loss": -6.590579986572266, "global_step": 132205, "epoch": 3147} {"train_loss": -6.589377403259277, "global_step": 132206, "epoch": 3147} {"train_loss": -6.619294166564941, "global_step": 132207, "epoch": 3147} {"train_loss": -6.707127571105957, "global_step": 132208, "epoch": 3147} {"train_loss": -6.745609283447266, "global_step": 132209, "epoch": 3147} {"train_loss": -6.570701599121094, "global_step": 132210, "epoch": 3147} {"train_loss": -6.630122184753418, "global_step": 132211, "epoch": 3147} {"train_loss": -6.635541915893555, "global_step": 132212, "epoch": 3147} {"train_loss": -6.752471923828125, "global_step": 132213, "epoch": 3147} {"train_loss": -6.578006744384766, "global_step": 132214, "epoch": 3147} {"train_loss": -6.631678093047369, "global_step": 132215, "epoch": 3147, "val_loss": 68168.046875} {"train_loss": -6.750653266906738, "global_step": 132216, "epoch": 3148} {"train_loss": -6.580808162689209, "global_step": 132217, "epoch": 3148} {"train_loss": -6.5825090408325195, "global_step": 132218, "epoch": 3148} {"train_loss": -6.685758113861084, "global_step": 132219, "epoch": 3148} {"train_loss": -6.743494033813477, "global_step": 132220, "epoch": 3148} {"train_loss": -6.624781608581543, "global_step": 132221, "epoch": 3148} {"train_loss": -6.724066734313965, "global_step": 132222, "epoch": 3148} {"train_loss": -6.6482014656066895, "global_step": 132223, "epoch": 3148} {"train_loss": -6.654898643493652, "global_step": 132224, "epoch": 3148} {"train_loss": -6.699610710144043, "global_step": 132225, "epoch": 3148} {"train_loss": -6.787136077880859, "global_step": 132226, "epoch": 3148} {"train_loss": -6.662662506103516, "global_step": 132227, "epoch": 3148} {"train_loss": -6.852740287780762, "global_step": 132228, "epoch": 3148} {"train_loss": -6.850391864776611, "global_step": 132229, "epoch": 3148} {"train_loss": -6.648669719696045, "global_step": 132230, "epoch": 3148} {"train_loss": -6.708471298217773, "global_step": 132231, "epoch": 3148} {"train_loss": -6.816257476806641, "global_step": 132232, "epoch": 3148} {"train_loss": -6.693097114562988, "global_step": 132233, "epoch": 3148} {"train_loss": -6.617738723754883, "global_step": 132234, "epoch": 3148} {"train_loss": -6.729875564575195, "global_step": 132235, "epoch": 3148} {"train_loss": -6.785560607910156, "global_step": 132236, "epoch": 3148} {"train_loss": -6.747706890106201, "global_step": 132237, "epoch": 3148} {"train_loss": -6.6186299324035645, "global_step": 132238, "epoch": 3148} {"train_loss": -6.786272048950195, "global_step": 132239, "epoch": 3148} {"train_loss": -6.552684783935547, "global_step": 132240, "epoch": 3148} {"train_loss": -6.622457504272461, "global_step": 132241, "epoch": 3148} {"train_loss": -6.541035175323486, "global_step": 132242, "epoch": 3148} {"train_loss": -6.689730167388916, "global_step": 132243, "epoch": 3148} {"train_loss": -6.706066131591797, "global_step": 132244, "epoch": 3148} {"train_loss": -6.5332932472229, "global_step": 132245, "epoch": 3148} {"train_loss": -6.505390644073486, "global_step": 132246, "epoch": 3148} {"train_loss": -6.731953144073486, "global_step": 132247, "epoch": 3148} {"train_loss": -6.550865650177002, "global_step": 132248, "epoch": 3148} {"train_loss": -6.60396671295166, "global_step": 132249, "epoch": 3148} {"train_loss": -6.636401176452637, "global_step": 132250, "epoch": 3148} {"train_loss": -6.51810359954834, "global_step": 132251, "epoch": 3148} {"train_loss": -6.638466835021973, "global_step": 132252, "epoch": 3148} {"train_loss": -6.579618453979492, "global_step": 132253, "epoch": 3148} {"train_loss": -6.518204689025879, "global_step": 132254, "epoch": 3148} {"train_loss": -6.54645299911499, "global_step": 132255, "epoch": 3148} {"train_loss": -6.669777870178223, "global_step": 132256, "epoch": 3148} {"train_loss": -6.663399423871722, "global_step": 132257, "epoch": 3148, "val_loss": 68181.0390625} {"train_loss": -6.568102836608887, "global_step": 132258, "epoch": 3149} {"train_loss": -6.595789432525635, "global_step": 132259, "epoch": 3149} {"train_loss": -6.669922828674316, "global_step": 132260, "epoch": 3149} {"train_loss": -6.583146095275879, "global_step": 132261, "epoch": 3149} {"train_loss": -6.653661251068115, "global_step": 132262, "epoch": 3149} {"train_loss": -6.714174270629883, "global_step": 132263, "epoch": 3149} {"train_loss": -6.60690975189209, "global_step": 132264, "epoch": 3149} {"train_loss": -6.725561141967773, "global_step": 132265, "epoch": 3149} {"train_loss": -6.6666646003723145, "global_step": 132266, "epoch": 3149} {"train_loss": -6.63863468170166, "global_step": 132267, "epoch": 3149} {"train_loss": -6.619744300842285, "global_step": 132268, "epoch": 3149} {"train_loss": -6.561812877655029, "global_step": 132269, "epoch": 3149} {"train_loss": -6.732349395751953, "global_step": 132270, "epoch": 3149} {"train_loss": -6.372735023498535, "global_step": 132271, "epoch": 3149} {"train_loss": -6.614408493041992, "global_step": 132272, "epoch": 3149} {"train_loss": -6.644857883453369, "global_step": 132273, "epoch": 3149} {"train_loss": -6.622669219970703, "global_step": 132274, "epoch": 3149} {"train_loss": -6.616229057312012, "global_step": 132275, "epoch": 3149} {"train_loss": -6.563785552978516, "global_step": 132276, "epoch": 3149} {"train_loss": -6.595644950866699, "global_step": 132277, "epoch": 3149} {"train_loss": -6.529914855957031, "global_step": 132278, "epoch": 3149} {"train_loss": -6.531219959259033, "global_step": 132279, "epoch": 3149} {"train_loss": -6.501187324523926, "global_step": 132280, "epoch": 3149} {"train_loss": -6.508265972137451, "global_step": 132281, "epoch": 3149} {"train_loss": -6.584303379058838, "global_step": 132282, "epoch": 3149} {"train_loss": -6.543531894683838, "global_step": 132283, "epoch": 3149} {"train_loss": -6.652528762817383, "global_step": 132284, "epoch": 3149} {"train_loss": -6.5376787185668945, "global_step": 132285, "epoch": 3149} {"train_loss": -6.614673614501953, "global_step": 132286, "epoch": 3149} {"train_loss": -6.608131408691406, "global_step": 132287, "epoch": 3149} {"train_loss": -6.600075721740723, "global_step": 132288, "epoch": 3149} {"train_loss": -6.540223121643066, "global_step": 132289, "epoch": 3149} {"train_loss": -6.70540714263916, "global_step": 132290, "epoch": 3149} {"train_loss": -6.5669474601745605, "global_step": 132291, "epoch": 3149} {"train_loss": -6.697949409484863, "global_step": 132292, "epoch": 3149} {"train_loss": -6.689830780029297, "global_step": 132293, "epoch": 3149} {"train_loss": -6.616896152496338, "global_step": 132294, "epoch": 3149} {"train_loss": -6.580580711364746, "global_step": 132295, "epoch": 3149} {"train_loss": -6.6366777420043945, "global_step": 132296, "epoch": 3149} {"train_loss": -6.645607948303223, "global_step": 132297, "epoch": 3149} {"train_loss": -6.596713066101074, "global_step": 132298, "epoch": 3149} {"train_loss": -6.604484558105469, "global_step": 132299, "epoch": 3149, "val_loss": 68092.6640625} {"train_loss": -6.714986801147461, "global_step": 132300, "epoch": 3150} {"train_loss": -6.572414398193359, "global_step": 132301, "epoch": 3150} {"train_loss": -6.560547351837158, "global_step": 132302, "epoch": 3150} {"train_loss": -6.547043800354004, "global_step": 132303, "epoch": 3150} {"train_loss": -6.465620994567871, "global_step": 132304, "epoch": 3150} {"train_loss": -6.653242111206055, "global_step": 132305, "epoch": 3150} {"train_loss": -6.528468132019043, "global_step": 132306, "epoch": 3150} {"train_loss": -6.520279884338379, "global_step": 132307, "epoch": 3150} {"train_loss": -6.603677272796631, "global_step": 132308, "epoch": 3150} {"train_loss": -6.489165306091309, "global_step": 132309, "epoch": 3150} {"train_loss": -6.657831192016602, "global_step": 132310, "epoch": 3150} {"train_loss": -6.636322975158691, "global_step": 132311, "epoch": 3150} {"train_loss": -6.632413864135742, "global_step": 132312, "epoch": 3150} {"train_loss": -6.492249965667725, "global_step": 132313, "epoch": 3150} {"train_loss": -6.546158790588379, "global_step": 132314, "epoch": 3150} {"train_loss": -6.641740322113037, "global_step": 132315, "epoch": 3150} {"train_loss": -6.48834753036499, "global_step": 132316, "epoch": 3150} {"train_loss": -6.606286525726318, "global_step": 132317, "epoch": 3150} {"train_loss": -6.5562825202941895, "global_step": 132318, "epoch": 3150} {"train_loss": -6.555830001831055, "global_step": 132319, "epoch": 3150} {"train_loss": -6.5925469398498535, "global_step": 132320, "epoch": 3150} {"train_loss": -6.622666358947754, "global_step": 132321, "epoch": 3150} {"train_loss": -6.5580668449401855, "global_step": 132322, "epoch": 3150} {"train_loss": -6.587808609008789, "global_step": 132323, "epoch": 3150} {"train_loss": -6.698027610778809, "global_step": 132324, "epoch": 3150} {"train_loss": -6.697951316833496, "global_step": 132325, "epoch": 3150} {"train_loss": -6.661258697509766, "global_step": 132326, "epoch": 3150} {"train_loss": -6.704580783843994, "global_step": 132327, "epoch": 3150} {"train_loss": -6.602352142333984, "global_step": 132328, "epoch": 3150} {"train_loss": -6.5637640953063965, "global_step": 132329, "epoch": 3150} {"train_loss": -6.605813980102539, "global_step": 132330, "epoch": 3150} {"train_loss": -6.622364521026611, "global_step": 132331, "epoch": 3150} {"train_loss": -6.57399320602417, "global_step": 132332, "epoch": 3150} {"train_loss": -6.630641937255859, "global_step": 132333, "epoch": 3150} {"train_loss": -6.646154403686523, "global_step": 132334, "epoch": 3150} {"train_loss": -6.683335781097412, "global_step": 132335, "epoch": 3150} {"train_loss": -6.531527996063232, "global_step": 132336, "epoch": 3150} {"train_loss": -6.590018272399902, "global_step": 132337, "epoch": 3150} {"train_loss": -6.64346981048584, "global_step": 132338, "epoch": 3150} {"train_loss": -6.571531295776367, "global_step": 132339, "epoch": 3150} {"train_loss": -6.613524913787842, "global_step": 132340, "epoch": 3150} {"train_loss": -6.598805336725144, "global_step": 132341, "epoch": 3150, "train/sim_max_reward_0": 0.2277670979474764, "train/sim_max_reward_1": 0.9318143731355671, "train/sim_max_reward_2": 0.8700727683767786, "train/sim_max_reward_3": 0.13980677261293006, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.7636066424556662, "test/sim_max_reward_4400000": 0.16299763004485188, "test/sim_max_reward_4400001": 0.9312742356573868, "test/sim_max_reward_4400002": 0.0650138123189437, "test/sim_max_reward_4400003": 0.7587291803219223, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.22953166682106146, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.8089329177600388, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9706350876875782, "test/sim_max_reward_4400010": 0.18530584153895596, "test/sim_max_reward_4400011": 0.9622505542824692, "test/sim_max_reward_4400012": 0.9664192847051244, "test/sim_max_reward_4400013": 0.4018280212733311, "test/sim_max_reward_4400014": 0.2688198629580473, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.9516468739239704, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.21398623659709604, "test/sim_max_reward_4400019": 0.9470899370462655, "test/sim_max_reward_4400020": 0.006451390510546223, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.9517206594378974, "test/sim_max_reward_4400024": 0.8528482925128624, "test/sim_max_reward_4400025": 0.2642275757768461, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.02177773244325553, "test/sim_max_reward_4400028": 0.6892682015177579, "test/sim_max_reward_4400029": 0.9448763246975886, "test/sim_max_reward_4400030": 0.8744812676115998, "test/sim_max_reward_4400031": 0.8004085786799109, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9289868430179199, "test/sim_max_reward_4400034": 0.9750992839527746, "test/sim_max_reward_4400035": 0.40106174642514086, "test/sim_max_reward_4400036": 0.4114497151268088, "test/sim_max_reward_4400037": 0.9503710576649845, "test/sim_max_reward_4400038": 0.9943314954004434, "test/sim_max_reward_4400039": 0.8600399604048921, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7381424704903589, "test/sim_max_reward_4400042": 0.646505275306856, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.997840962874169, "test/sim_max_reward_4400045": 0.9513989124273193, "test/sim_max_reward_4400046": 0.9549694481695712, "test/sim_max_reward_4400047": 0.9911842507675093, "test/sim_max_reward_4400048": 0.9215328598923861, "test/sim_max_reward_4400049": 0.9073282032567002, "train/mean_score": 0.6555112757547364, "test/mean_score": 0.6126131480366592, "val_loss": 68341.2890625} {"train_loss": -6.616840362548828, "global_step": 132342, "epoch": 3151} {"train_loss": -6.558967590332031, "global_step": 132343, "epoch": 3151} {"train_loss": -6.640293121337891, "global_step": 132344, "epoch": 3151} {"train_loss": -6.4788079261779785, "global_step": 132345, "epoch": 3151} {"train_loss": -6.630805015563965, "global_step": 132346, "epoch": 3151} {"train_loss": -6.397950649261475, "global_step": 132347, "epoch": 3151} {"train_loss": -6.661774635314941, "global_step": 132348, "epoch": 3151} {"train_loss": -6.214500427246094, "global_step": 132349, "epoch": 3151} {"train_loss": -6.552690505981445, "global_step": 132350, "epoch": 3151} {"train_loss": -6.543094158172607, "global_step": 132351, "epoch": 3151} {"train_loss": -6.561517715454102, "global_step": 132352, "epoch": 3151} {"train_loss": -6.537288665771484, "global_step": 132353, "epoch": 3151} {"train_loss": -6.552815914154053, "global_step": 132354, "epoch": 3151} {"train_loss": -6.64639949798584, "global_step": 132355, "epoch": 3151} {"train_loss": -6.653884410858154, "global_step": 132356, "epoch": 3151} {"train_loss": -6.620285987854004, "global_step": 132357, "epoch": 3151} {"train_loss": -6.565827369689941, "global_step": 132358, "epoch": 3151} {"train_loss": -6.713788032531738, "global_step": 132359, "epoch": 3151} {"train_loss": -6.672880172729492, "global_step": 132360, "epoch": 3151} {"train_loss": -6.673932075500488, "global_step": 132361, "epoch": 3151} {"train_loss": -6.529325008392334, "global_step": 132362, "epoch": 3151} {"train_loss": -6.624331474304199, "global_step": 132363, "epoch": 3151} {"train_loss": -6.544775009155273, "global_step": 132364, "epoch": 3151} {"train_loss": -6.464637279510498, "global_step": 132365, "epoch": 3151} {"train_loss": -6.562205791473389, "global_step": 132366, "epoch": 3151} {"train_loss": -6.651618957519531, "global_step": 132367, "epoch": 3151} {"train_loss": -6.6687164306640625, "global_step": 132368, "epoch": 3151} {"train_loss": -6.650356769561768, "global_step": 132369, "epoch": 3151} {"train_loss": -6.574977874755859, "global_step": 132370, "epoch": 3151} {"train_loss": -6.7010016441345215, "global_step": 132371, "epoch": 3151} {"train_loss": -6.685245990753174, "global_step": 132372, "epoch": 3151} {"train_loss": -6.675878524780273, "global_step": 132373, "epoch": 3151} {"train_loss": -6.744316101074219, "global_step": 132374, "epoch": 3151} {"train_loss": -6.703679084777832, "global_step": 132375, "epoch": 3151} {"train_loss": -6.770500183105469, "global_step": 132376, "epoch": 3151} {"train_loss": -6.5576252937316895, "global_step": 132377, "epoch": 3151} {"train_loss": -6.649205207824707, "global_step": 132378, "epoch": 3151} {"train_loss": -6.690093040466309, "global_step": 132379, "epoch": 3151} {"train_loss": -6.646389007568359, "global_step": 132380, "epoch": 3151} {"train_loss": -6.659570693969727, "global_step": 132381, "epoch": 3151} {"train_loss": -6.64261531829834, "global_step": 132382, "epoch": 3151} {"train_loss": -6.608948968705677, "global_step": 132383, "epoch": 3151, "val_loss": 68231.671875} {"train_loss": -6.565010070800781, "global_step": 132384, "epoch": 3152} {"train_loss": -6.689845561981201, "global_step": 132385, "epoch": 3152} {"train_loss": -6.584913730621338, "global_step": 132386, "epoch": 3152} {"train_loss": -6.6772074699401855, "global_step": 132387, "epoch": 3152} {"train_loss": -6.652865409851074, "global_step": 132388, "epoch": 3152} {"train_loss": -6.638372421264648, "global_step": 132389, "epoch": 3152} {"train_loss": -6.597859859466553, "global_step": 132390, "epoch": 3152} {"train_loss": -6.650176048278809, "global_step": 132391, "epoch": 3152} {"train_loss": -6.616987228393555, "global_step": 132392, "epoch": 3152} {"train_loss": -6.595364093780518, "global_step": 132393, "epoch": 3152} {"train_loss": -6.675266742706299, "global_step": 132394, "epoch": 3152} {"train_loss": -6.626242637634277, "global_step": 132395, "epoch": 3152} {"train_loss": -6.660190582275391, "global_step": 132396, "epoch": 3152} {"train_loss": -6.558530807495117, "global_step": 132397, "epoch": 3152} {"train_loss": -6.6589179039001465, "global_step": 132398, "epoch": 3152} {"train_loss": -6.595376014709473, "global_step": 132399, "epoch": 3152} {"train_loss": -6.66679573059082, "global_step": 132400, "epoch": 3152} {"train_loss": -6.65499210357666, "global_step": 132401, "epoch": 3152} {"train_loss": -6.679555892944336, "global_step": 132402, "epoch": 3152} {"train_loss": -6.619325637817383, "global_step": 132403, "epoch": 3152} {"train_loss": -6.6721062660217285, "global_step": 132404, "epoch": 3152} {"train_loss": -6.696203231811523, "global_step": 132405, "epoch": 3152} {"train_loss": -6.628137588500977, "global_step": 132406, "epoch": 3152} {"train_loss": -6.557880878448486, "global_step": 132407, "epoch": 3152} {"train_loss": -6.776797294616699, "global_step": 132408, "epoch": 3152} {"train_loss": -6.61079216003418, "global_step": 132409, "epoch": 3152} {"train_loss": -6.569479942321777, "global_step": 132410, "epoch": 3152} {"train_loss": -6.585962772369385, "global_step": 132411, "epoch": 3152} {"train_loss": -6.600890159606934, "global_step": 132412, "epoch": 3152} {"train_loss": -6.752202987670898, "global_step": 132413, "epoch": 3152} {"train_loss": -6.729273796081543, "global_step": 132414, "epoch": 3152} {"train_loss": -6.562289237976074, "global_step": 132415, "epoch": 3152} {"train_loss": -6.800710678100586, "global_step": 132416, "epoch": 3152} {"train_loss": -6.695562362670898, "global_step": 132417, "epoch": 3152} {"train_loss": -6.65125846862793, "global_step": 132418, "epoch": 3152} {"train_loss": -6.774745941162109, "global_step": 132419, "epoch": 3152} {"train_loss": -6.782657623291016, "global_step": 132420, "epoch": 3152} {"train_loss": -6.677032470703125, "global_step": 132421, "epoch": 3152} {"train_loss": -6.724667549133301, "global_step": 132422, "epoch": 3152} {"train_loss": -6.763232707977295, "global_step": 132423, "epoch": 3152} {"train_loss": -6.524410724639893, "global_step": 132424, "epoch": 3152} {"train_loss": -6.651966946465628, "global_step": 132425, "epoch": 3152, "val_loss": 68257.03125} {"train_loss": -6.660099983215332, "global_step": 132426, "epoch": 3153} {"train_loss": -6.715031623840332, "global_step": 132427, "epoch": 3153} {"train_loss": -6.740812301635742, "global_step": 132428, "epoch": 3153} {"train_loss": -6.710894584655762, "global_step": 132429, "epoch": 3153} {"train_loss": -6.632830619812012, "global_step": 132430, "epoch": 3153} {"train_loss": -6.638582229614258, "global_step": 132431, "epoch": 3153} {"train_loss": -6.694241523742676, "global_step": 132432, "epoch": 3153} {"train_loss": -6.725518226623535, "global_step": 132433, "epoch": 3153} {"train_loss": -6.683873176574707, "global_step": 132434, "epoch": 3153} {"train_loss": -6.697835922241211, "global_step": 132435, "epoch": 3153} {"train_loss": -6.763478755950928, "global_step": 132436, "epoch": 3153} {"train_loss": -6.505588531494141, "global_step": 132437, "epoch": 3153} {"train_loss": -6.68544864654541, "global_step": 132438, "epoch": 3153} {"train_loss": -6.591218948364258, "global_step": 132439, "epoch": 3153} {"train_loss": -6.730058670043945, "global_step": 132440, "epoch": 3153} {"train_loss": -6.715235710144043, "global_step": 132441, "epoch": 3153} {"train_loss": -6.574214935302734, "global_step": 132442, "epoch": 3153} {"train_loss": -6.699557781219482, "global_step": 132443, "epoch": 3153} {"train_loss": -6.681207656860352, "global_step": 132444, "epoch": 3153} {"train_loss": -6.643301010131836, "global_step": 132445, "epoch": 3153} {"train_loss": -6.713033676147461, "global_step": 132446, "epoch": 3153} {"train_loss": -6.59989070892334, "global_step": 132447, "epoch": 3153} {"train_loss": -6.590218544006348, "global_step": 132448, "epoch": 3153} {"train_loss": -6.525022983551025, "global_step": 132449, "epoch": 3153} {"train_loss": -6.666008949279785, "global_step": 132450, "epoch": 3153} {"train_loss": -6.593307971954346, "global_step": 132451, "epoch": 3153} {"train_loss": -6.576999664306641, "global_step": 132452, "epoch": 3153} {"train_loss": -6.733002185821533, "global_step": 132453, "epoch": 3153} {"train_loss": -6.543342590332031, "global_step": 132454, "epoch": 3153} {"train_loss": -6.6626081466674805, "global_step": 132455, "epoch": 3153} {"train_loss": -6.647612571716309, "global_step": 132456, "epoch": 3153} {"train_loss": -6.512364864349365, "global_step": 132457, "epoch": 3153} {"train_loss": -6.539185523986816, "global_step": 132458, "epoch": 3153} {"train_loss": -6.653951644897461, "global_step": 132459, "epoch": 3153} {"train_loss": -6.5896992683410645, "global_step": 132460, "epoch": 3153} {"train_loss": -6.71254825592041, "global_step": 132461, "epoch": 3153} {"train_loss": -6.724809169769287, "global_step": 132462, "epoch": 3153} {"train_loss": -6.620129585266113, "global_step": 132463, "epoch": 3153} {"train_loss": -6.771747589111328, "global_step": 132464, "epoch": 3153} {"train_loss": -6.7591776847839355, "global_step": 132465, "epoch": 3153} {"train_loss": -6.642420291900635, "global_step": 132466, "epoch": 3153} {"train_loss": -6.653910375776745, "global_step": 132467, "epoch": 3153, "val_loss": 68151.3046875} {"train_loss": -6.582232475280762, "global_step": 132468, "epoch": 3154} {"train_loss": -6.643057823181152, "global_step": 132469, "epoch": 3154} {"train_loss": -6.775038242340088, "global_step": 132470, "epoch": 3154} {"train_loss": -6.646322250366211, "global_step": 132471, "epoch": 3154} {"train_loss": -6.627565383911133, "global_step": 132472, "epoch": 3154} {"train_loss": -6.704774379730225, "global_step": 132473, "epoch": 3154} {"train_loss": -6.641860485076904, "global_step": 132474, "epoch": 3154} {"train_loss": -6.599224090576172, "global_step": 132475, "epoch": 3154} {"train_loss": -6.687692165374756, "global_step": 132476, "epoch": 3154} {"train_loss": -6.620884418487549, "global_step": 132477, "epoch": 3154} {"train_loss": -6.656712055206299, "global_step": 132478, "epoch": 3154} {"train_loss": -6.633304595947266, "global_step": 132479, "epoch": 3154} {"train_loss": -6.554832458496094, "global_step": 132480, "epoch": 3154} {"train_loss": -6.660004615783691, "global_step": 132481, "epoch": 3154} {"train_loss": -6.626582622528076, "global_step": 132482, "epoch": 3154} {"train_loss": -6.721555709838867, "global_step": 132483, "epoch": 3154} {"train_loss": -6.726768493652344, "global_step": 132484, "epoch": 3154} {"train_loss": -6.520378589630127, "global_step": 132485, "epoch": 3154} {"train_loss": -6.641668319702148, "global_step": 132486, "epoch": 3154} {"train_loss": -6.632175445556641, "global_step": 132487, "epoch": 3154} {"train_loss": -6.59342622756958, "global_step": 132488, "epoch": 3154} {"train_loss": -6.69775390625, "global_step": 132489, "epoch": 3154} {"train_loss": -6.603708744049072, "global_step": 132490, "epoch": 3154} {"train_loss": -6.59339714050293, "global_step": 132491, "epoch": 3154} {"train_loss": -6.557066917419434, "global_step": 132492, "epoch": 3154} {"train_loss": -6.674449920654297, "global_step": 132493, "epoch": 3154} {"train_loss": -6.583741188049316, "global_step": 132494, "epoch": 3154} {"train_loss": -6.657161712646484, "global_step": 132495, "epoch": 3154} {"train_loss": -6.616732597351074, "global_step": 132496, "epoch": 3154} {"train_loss": -6.663479804992676, "global_step": 132497, "epoch": 3154} {"train_loss": -6.724447727203369, "global_step": 132498, "epoch": 3154} {"train_loss": -6.522960662841797, "global_step": 132499, "epoch": 3154} {"train_loss": -6.564784526824951, "global_step": 132500, "epoch": 3154} {"train_loss": -6.69915771484375, "global_step": 132501, "epoch": 3154} {"train_loss": -6.684305667877197, "global_step": 132502, "epoch": 3154} {"train_loss": -6.668275833129883, "global_step": 132503, "epoch": 3154} {"train_loss": -6.735448837280273, "global_step": 132504, "epoch": 3154} {"train_loss": -6.722066402435303, "global_step": 132505, "epoch": 3154} {"train_loss": -6.682591438293457, "global_step": 132506, "epoch": 3154} {"train_loss": -6.657768249511719, "global_step": 132507, "epoch": 3154} {"train_loss": -6.769403457641602, "global_step": 132508, "epoch": 3154} {"train_loss": -6.648163840884254, "global_step": 132509, "epoch": 3154, "val_loss": 68304.96875} {"train_loss": -6.746866226196289, "global_step": 132510, "epoch": 3155} {"train_loss": -6.656217098236084, "global_step": 132511, "epoch": 3155} {"train_loss": -6.736401557922363, "global_step": 132512, "epoch": 3155} {"train_loss": -6.708404064178467, "global_step": 132513, "epoch": 3155} {"train_loss": -6.609763145446777, "global_step": 132514, "epoch": 3155} {"train_loss": -6.640564918518066, "global_step": 132515, "epoch": 3155} {"train_loss": -6.695666313171387, "global_step": 132516, "epoch": 3155} {"train_loss": -6.783844947814941, "global_step": 132517, "epoch": 3155} {"train_loss": -6.638298034667969, "global_step": 132518, "epoch": 3155} {"train_loss": -6.839102745056152, "global_step": 132519, "epoch": 3155} {"train_loss": -6.662138938903809, "global_step": 132520, "epoch": 3155} {"train_loss": -6.595179080963135, "global_step": 132521, "epoch": 3155} {"train_loss": -6.725222110748291, "global_step": 132522, "epoch": 3155} {"train_loss": -6.791103839874268, "global_step": 132523, "epoch": 3155} {"train_loss": -6.650160789489746, "global_step": 132524, "epoch": 3155} {"train_loss": -6.776285171508789, "global_step": 132525, "epoch": 3155} {"train_loss": -6.692325115203857, "global_step": 132526, "epoch": 3155} {"train_loss": -6.62651252746582, "global_step": 132527, "epoch": 3155} {"train_loss": -6.575488090515137, "global_step": 132528, "epoch": 3155} {"train_loss": -6.64167594909668, "global_step": 132529, "epoch": 3155} {"train_loss": -6.638294696807861, "global_step": 132530, "epoch": 3155} {"train_loss": -6.685066223144531, "global_step": 132531, "epoch": 3155} {"train_loss": -6.56675910949707, "global_step": 132532, "epoch": 3155} {"train_loss": -6.69005823135376, "global_step": 132533, "epoch": 3155} {"train_loss": -6.715076923370361, "global_step": 132534, "epoch": 3155} {"train_loss": -6.525187015533447, "global_step": 132535, "epoch": 3155} {"train_loss": -6.7143049240112305, "global_step": 132536, "epoch": 3155} {"train_loss": -6.602771759033203, "global_step": 132537, "epoch": 3155} {"train_loss": -6.506019115447998, "global_step": 132538, "epoch": 3155} {"train_loss": -6.715503692626953, "global_step": 132539, "epoch": 3155} {"train_loss": -6.6507368087768555, "global_step": 132540, "epoch": 3155} {"train_loss": -6.701472282409668, "global_step": 132541, "epoch": 3155} {"train_loss": -6.659265041351318, "global_step": 132542, "epoch": 3155} {"train_loss": -6.668896675109863, "global_step": 132543, "epoch": 3155} {"train_loss": -6.660510540008545, "global_step": 132544, "epoch": 3155} {"train_loss": -6.601483345031738, "global_step": 132545, "epoch": 3155} {"train_loss": -6.630650520324707, "global_step": 132546, "epoch": 3155} {"train_loss": -6.647383689880371, "global_step": 132547, "epoch": 3155} {"train_loss": -6.655361175537109, "global_step": 132548, "epoch": 3155} {"train_loss": -6.687335014343262, "global_step": 132549, "epoch": 3155} {"train_loss": -6.5549702644348145, "global_step": 132550, "epoch": 3155} {"train_loss": -6.66477556455703, "global_step": 132551, "epoch": 3155, "val_loss": 68344.6953125} {"train_loss": -6.725800514221191, "global_step": 132552, "epoch": 3156} {"train_loss": -6.721418380737305, "global_step": 132553, "epoch": 3156} {"train_loss": -6.649473667144775, "global_step": 132554, "epoch": 3156} {"train_loss": -6.701711654663086, "global_step": 132555, "epoch": 3156} {"train_loss": -6.664361476898193, "global_step": 132556, "epoch": 3156} {"train_loss": -6.6165008544921875, "global_step": 132557, "epoch": 3156} {"train_loss": -6.713761329650879, "global_step": 132558, "epoch": 3156} {"train_loss": -6.701326847076416, "global_step": 132559, "epoch": 3156} {"train_loss": -6.662453651428223, "global_step": 132560, "epoch": 3156} {"train_loss": -6.735105991363525, "global_step": 132561, "epoch": 3156} {"train_loss": -6.646604537963867, "global_step": 132562, "epoch": 3156} {"train_loss": -6.665494918823242, "global_step": 132563, "epoch": 3156} {"train_loss": -6.504549980163574, "global_step": 132564, "epoch": 3156} {"train_loss": -6.706180572509766, "global_step": 132565, "epoch": 3156} {"train_loss": -6.704316139221191, "global_step": 132566, "epoch": 3156} {"train_loss": -6.749152660369873, "global_step": 132567, "epoch": 3156} {"train_loss": -6.7087202072143555, "global_step": 132568, "epoch": 3156} {"train_loss": -6.710184097290039, "global_step": 132569, "epoch": 3156} {"train_loss": -6.629062652587891, "global_step": 132570, "epoch": 3156} {"train_loss": -6.662148952484131, "global_step": 132571, "epoch": 3156} {"train_loss": -6.596284866333008, "global_step": 132572, "epoch": 3156} {"train_loss": -6.678656578063965, "global_step": 132573, "epoch": 3156} {"train_loss": -6.657864570617676, "global_step": 132574, "epoch": 3156} {"train_loss": -6.6768798828125, "global_step": 132575, "epoch": 3156} {"train_loss": -6.642675399780273, "global_step": 132576, "epoch": 3156} {"train_loss": -6.750831604003906, "global_step": 132577, "epoch": 3156} {"train_loss": -6.566348552703857, "global_step": 132578, "epoch": 3156} {"train_loss": -6.716407299041748, "global_step": 132579, "epoch": 3156} {"train_loss": -6.65721321105957, "global_step": 132580, "epoch": 3156} {"train_loss": -6.587289810180664, "global_step": 132581, "epoch": 3156} {"train_loss": -6.582818984985352, "global_step": 132582, "epoch": 3156} {"train_loss": -6.658940315246582, "global_step": 132583, "epoch": 3156} {"train_loss": -6.637550354003906, "global_step": 132584, "epoch": 3156} {"train_loss": -6.543422698974609, "global_step": 132585, "epoch": 3156} {"train_loss": -6.565851211547852, "global_step": 132586, "epoch": 3156} {"train_loss": -6.523427963256836, "global_step": 132587, "epoch": 3156} {"train_loss": -6.511643886566162, "global_step": 132588, "epoch": 3156} {"train_loss": -6.671670913696289, "global_step": 132589, "epoch": 3156} {"train_loss": -6.602625370025635, "global_step": 132590, "epoch": 3156} {"train_loss": -6.632109642028809, "global_step": 132591, "epoch": 3156} {"train_loss": -6.655883312225342, "global_step": 132592, "epoch": 3156} {"train_loss": -6.648718856629872, "global_step": 132593, "epoch": 3156, "val_loss": 68191.953125} {"train_loss": -6.556212425231934, "global_step": 132594, "epoch": 3157} {"train_loss": -6.540111541748047, "global_step": 132595, "epoch": 3157} {"train_loss": -6.618444442749023, "global_step": 132596, "epoch": 3157} {"train_loss": -6.498438835144043, "global_step": 132597, "epoch": 3157} {"train_loss": -6.639911651611328, "global_step": 132598, "epoch": 3157} {"train_loss": -6.511821269989014, "global_step": 132599, "epoch": 3157} {"train_loss": -6.673659324645996, "global_step": 132600, "epoch": 3157} {"train_loss": -6.586179733276367, "global_step": 132601, "epoch": 3157} {"train_loss": -6.523845672607422, "global_step": 132602, "epoch": 3157} {"train_loss": -6.577796936035156, "global_step": 132603, "epoch": 3157} {"train_loss": -6.517392158508301, "global_step": 132604, "epoch": 3157} {"train_loss": -6.561781883239746, "global_step": 132605, "epoch": 3157} {"train_loss": -6.538774013519287, "global_step": 132606, "epoch": 3157} {"train_loss": -6.570599555969238, "global_step": 132607, "epoch": 3157} {"train_loss": -6.524106025695801, "global_step": 132608, "epoch": 3157} {"train_loss": -6.622587203979492, "global_step": 132609, "epoch": 3157} {"train_loss": -6.613539218902588, "global_step": 132610, "epoch": 3157} {"train_loss": -6.716104030609131, "global_step": 132611, "epoch": 3157} {"train_loss": -6.637420654296875, "global_step": 132612, "epoch": 3157} {"train_loss": -6.518833637237549, "global_step": 132613, "epoch": 3157} {"train_loss": -6.712765693664551, "global_step": 132614, "epoch": 3157} {"train_loss": -6.528812885284424, "global_step": 132615, "epoch": 3157} {"train_loss": -6.649879455566406, "global_step": 132616, "epoch": 3157} {"train_loss": -6.431596279144287, "global_step": 132617, "epoch": 3157} {"train_loss": -6.741141319274902, "global_step": 132618, "epoch": 3157} {"train_loss": -6.626273155212402, "global_step": 132619, "epoch": 3157} {"train_loss": -6.737271308898926, "global_step": 132620, "epoch": 3157} {"train_loss": -6.640528202056885, "global_step": 132621, "epoch": 3157} {"train_loss": -6.625613212585449, "global_step": 132622, "epoch": 3157} {"train_loss": -6.642626762390137, "global_step": 132623, "epoch": 3157} {"train_loss": -6.652559757232666, "global_step": 132624, "epoch": 3157} {"train_loss": -6.753063201904297, "global_step": 132625, "epoch": 3157} {"train_loss": -6.656487941741943, "global_step": 132626, "epoch": 3157} {"train_loss": -6.643420219421387, "global_step": 132627, "epoch": 3157} {"train_loss": -6.729930877685547, "global_step": 132628, "epoch": 3157} {"train_loss": -6.663640975952148, "global_step": 132629, "epoch": 3157} {"train_loss": -6.699015140533447, "global_step": 132630, "epoch": 3157} {"train_loss": -6.731584548950195, "global_step": 132631, "epoch": 3157} {"train_loss": -6.693666458129883, "global_step": 132632, "epoch": 3157} {"train_loss": -6.644219875335693, "global_step": 132633, "epoch": 3157} {"train_loss": -6.60020112991333, "global_step": 132634, "epoch": 3157} {"train_loss": -6.618136428651356, "global_step": 132635, "epoch": 3157, "val_loss": 68033.6484375} {"train_loss": -6.472816467285156, "global_step": 132636, "epoch": 3158} {"train_loss": -6.7009077072143555, "global_step": 132637, "epoch": 3158} {"train_loss": -6.713385581970215, "global_step": 132638, "epoch": 3158} {"train_loss": -6.637691497802734, "global_step": 132639, "epoch": 3158} {"train_loss": -6.61885404586792, "global_step": 132640, "epoch": 3158} {"train_loss": -6.692212104797363, "global_step": 132641, "epoch": 3158} {"train_loss": -6.536107063293457, "global_step": 132642, "epoch": 3158} {"train_loss": -6.613353729248047, "global_step": 132643, "epoch": 3158} {"train_loss": -6.556579113006592, "global_step": 132644, "epoch": 3158} {"train_loss": -6.6769700050354, "global_step": 132645, "epoch": 3158} {"train_loss": -6.573622703552246, "global_step": 132646, "epoch": 3158} {"train_loss": -6.751730918884277, "global_step": 132647, "epoch": 3158} {"train_loss": -6.4694976806640625, "global_step": 132648, "epoch": 3158} {"train_loss": -6.590144634246826, "global_step": 132649, "epoch": 3158} {"train_loss": -6.436346054077148, "global_step": 132650, "epoch": 3158} {"train_loss": -6.494149208068848, "global_step": 132651, "epoch": 3158} {"train_loss": -6.529062271118164, "global_step": 132652, "epoch": 3158} {"train_loss": -6.459568023681641, "global_step": 132653, "epoch": 3158} {"train_loss": -6.650751113891602, "global_step": 132654, "epoch": 3158} {"train_loss": -6.428051948547363, "global_step": 132655, "epoch": 3158} {"train_loss": -6.670095443725586, "global_step": 132656, "epoch": 3158} {"train_loss": -6.5217180252075195, "global_step": 132657, "epoch": 3158} {"train_loss": -6.609689235687256, "global_step": 132658, "epoch": 3158} {"train_loss": -6.558446884155273, "global_step": 132659, "epoch": 3158} {"train_loss": -6.696478843688965, "global_step": 132660, "epoch": 3158} {"train_loss": -6.5603556632995605, "global_step": 132661, "epoch": 3158} {"train_loss": -6.647360324859619, "global_step": 132662, "epoch": 3158} {"train_loss": -6.533639907836914, "global_step": 132663, "epoch": 3158} {"train_loss": -6.582395553588867, "global_step": 132664, "epoch": 3158} {"train_loss": -6.606668472290039, "global_step": 132665, "epoch": 3158} {"train_loss": -6.713276386260986, "global_step": 132666, "epoch": 3158} {"train_loss": -6.595339775085449, "global_step": 132667, "epoch": 3158} {"train_loss": -6.752323150634766, "global_step": 132668, "epoch": 3158} {"train_loss": -6.680310249328613, "global_step": 132669, "epoch": 3158} {"train_loss": -6.557544708251953, "global_step": 132670, "epoch": 3158} {"train_loss": -6.6547017097473145, "global_step": 132671, "epoch": 3158} {"train_loss": -6.571902751922607, "global_step": 132672, "epoch": 3158} {"train_loss": -6.612791061401367, "global_step": 132673, "epoch": 3158} {"train_loss": -6.593904495239258, "global_step": 132674, "epoch": 3158} {"train_loss": -6.644618988037109, "global_step": 132675, "epoch": 3158} {"train_loss": -6.6094865798950195, "global_step": 132676, "epoch": 3158} {"train_loss": -6.598452193396432, "global_step": 132677, "epoch": 3158, "val_loss": 68232.46875} {"train_loss": -6.680171489715576, "global_step": 132678, "epoch": 3159} {"train_loss": -6.665966987609863, "global_step": 132679, "epoch": 3159} {"train_loss": -6.603046894073486, "global_step": 132680, "epoch": 3159} {"train_loss": -6.640483379364014, "global_step": 132681, "epoch": 3159} {"train_loss": -6.61593770980835, "global_step": 132682, "epoch": 3159} {"train_loss": -6.6757097244262695, "global_step": 132683, "epoch": 3159} {"train_loss": -6.575895309448242, "global_step": 132684, "epoch": 3159} {"train_loss": -6.622251510620117, "global_step": 132685, "epoch": 3159} {"train_loss": -6.692551136016846, "global_step": 132686, "epoch": 3159} {"train_loss": -6.513395309448242, "global_step": 132687, "epoch": 3159} {"train_loss": -6.696264266967773, "global_step": 132688, "epoch": 3159} {"train_loss": -6.573669910430908, "global_step": 132689, "epoch": 3159} {"train_loss": -6.670370101928711, "global_step": 132690, "epoch": 3159} {"train_loss": -6.613198757171631, "global_step": 132691, "epoch": 3159} {"train_loss": -6.527183532714844, "global_step": 132692, "epoch": 3159} {"train_loss": -6.4901509284973145, "global_step": 132693, "epoch": 3159} {"train_loss": -6.57070255279541, "global_step": 132694, "epoch": 3159} {"train_loss": -6.643987655639648, "global_step": 132695, "epoch": 3159} {"train_loss": -6.564800262451172, "global_step": 132696, "epoch": 3159} {"train_loss": -6.688677787780762, "global_step": 132697, "epoch": 3159} {"train_loss": -6.642668724060059, "global_step": 132698, "epoch": 3159} {"train_loss": -6.646800518035889, "global_step": 132699, "epoch": 3159} {"train_loss": -6.645055770874023, "global_step": 132700, "epoch": 3159} {"train_loss": -6.625779151916504, "global_step": 132701, "epoch": 3159} {"train_loss": -6.659692764282227, "global_step": 132702, "epoch": 3159} {"train_loss": -6.506460189819336, "global_step": 132703, "epoch": 3159} {"train_loss": -6.653656482696533, "global_step": 132704, "epoch": 3159} {"train_loss": -6.684017181396484, "global_step": 132705, "epoch": 3159} {"train_loss": -6.747392177581787, "global_step": 132706, "epoch": 3159} {"train_loss": -6.627333164215088, "global_step": 132707, "epoch": 3159} {"train_loss": -6.670775413513184, "global_step": 132708, "epoch": 3159} {"train_loss": -6.653993129730225, "global_step": 132709, "epoch": 3159} {"train_loss": -6.70295524597168, "global_step": 132710, "epoch": 3159} {"train_loss": -6.682031631469727, "global_step": 132711, "epoch": 3159} {"train_loss": -6.5430097579956055, "global_step": 132712, "epoch": 3159} {"train_loss": -6.608027458190918, "global_step": 132713, "epoch": 3159} {"train_loss": -6.597805976867676, "global_step": 132714, "epoch": 3159} {"train_loss": -6.634324550628662, "global_step": 132715, "epoch": 3159} {"train_loss": -6.749139308929443, "global_step": 132716, "epoch": 3159} {"train_loss": -6.615067481994629, "global_step": 132717, "epoch": 3159} {"train_loss": -6.600993633270264, "global_step": 132718, "epoch": 3159} {"train_loss": -6.631302334013439, "global_step": 132719, "epoch": 3159, "val_loss": 68150.78125} {"train_loss": -6.583733558654785, "global_step": 132720, "epoch": 3160} {"train_loss": -6.6668782234191895, "global_step": 132721, "epoch": 3160} {"train_loss": -6.685181617736816, "global_step": 132722, "epoch": 3160} {"train_loss": -6.516260147094727, "global_step": 132723, "epoch": 3160} {"train_loss": -6.658308029174805, "global_step": 132724, "epoch": 3160} {"train_loss": -6.541768550872803, "global_step": 132725, "epoch": 3160} {"train_loss": -6.691545009613037, "global_step": 132726, "epoch": 3160} {"train_loss": -6.550203323364258, "global_step": 132727, "epoch": 3160} {"train_loss": -6.725719451904297, "global_step": 132728, "epoch": 3160} {"train_loss": -6.55994176864624, "global_step": 132729, "epoch": 3160} {"train_loss": -6.58962345123291, "global_step": 132730, "epoch": 3160} {"train_loss": -6.644277572631836, "global_step": 132731, "epoch": 3160} {"train_loss": -6.624974250793457, "global_step": 132732, "epoch": 3160} {"train_loss": -6.765223503112793, "global_step": 132733, "epoch": 3160} {"train_loss": -6.5481767654418945, "global_step": 132734, "epoch": 3160} {"train_loss": -6.655300140380859, "global_step": 132735, "epoch": 3160} {"train_loss": -6.702828407287598, "global_step": 132736, "epoch": 3160} {"train_loss": -6.725916385650635, "global_step": 132737, "epoch": 3160} {"train_loss": -6.661339282989502, "global_step": 132738, "epoch": 3160} {"train_loss": -6.764368534088135, "global_step": 132739, "epoch": 3160} {"train_loss": -6.587777137756348, "global_step": 132740, "epoch": 3160} {"train_loss": -6.742773532867432, "global_step": 132741, "epoch": 3160} {"train_loss": -6.626211643218994, "global_step": 132742, "epoch": 3160} {"train_loss": -6.6937971115112305, "global_step": 132743, "epoch": 3160} {"train_loss": -6.689438819885254, "global_step": 132744, "epoch": 3160} {"train_loss": -6.703843593597412, "global_step": 132745, "epoch": 3160} {"train_loss": -6.705220699310303, "global_step": 132746, "epoch": 3160} {"train_loss": -6.6416521072387695, "global_step": 132747, "epoch": 3160} {"train_loss": -6.690525054931641, "global_step": 132748, "epoch": 3160} {"train_loss": -6.6705121994018555, "global_step": 132749, "epoch": 3160} {"train_loss": -6.690154075622559, "global_step": 132750, "epoch": 3160} {"train_loss": -6.803771495819092, "global_step": 132751, "epoch": 3160} {"train_loss": -6.732530117034912, "global_step": 132752, "epoch": 3160} {"train_loss": -6.811863422393799, "global_step": 132753, "epoch": 3160} {"train_loss": -6.7053704261779785, "global_step": 132754, "epoch": 3160} {"train_loss": -6.776925563812256, "global_step": 132755, "epoch": 3160} {"train_loss": -6.694671630859375, "global_step": 132756, "epoch": 3160} {"train_loss": -6.652284622192383, "global_step": 132757, "epoch": 3160} {"train_loss": -6.815049648284912, "global_step": 132758, "epoch": 3160} {"train_loss": -6.626175403594971, "global_step": 132759, "epoch": 3160} {"train_loss": -6.618982315063477, "global_step": 132760, "epoch": 3160} {"train_loss": -6.671389579772949, "global_step": 132761, "epoch": 3160, "val_loss": 68335.53125} {"train_loss": -6.648612022399902, "global_step": 132762, "epoch": 3161} {"train_loss": -6.641226768493652, "global_step": 132763, "epoch": 3161} {"train_loss": -6.6189398765563965, "global_step": 132764, "epoch": 3161} {"train_loss": -6.636046886444092, "global_step": 132765, "epoch": 3161} {"train_loss": -6.663236141204834, "global_step": 132766, "epoch": 3161} {"train_loss": -6.635164260864258, "global_step": 132767, "epoch": 3161} {"train_loss": -6.567239761352539, "global_step": 132768, "epoch": 3161} {"train_loss": -6.579639434814453, "global_step": 132769, "epoch": 3161} {"train_loss": -6.728736877441406, "global_step": 132770, "epoch": 3161} {"train_loss": -6.722001075744629, "global_step": 132771, "epoch": 3161} {"train_loss": -6.70079231262207, "global_step": 132772, "epoch": 3161} {"train_loss": -6.606733322143555, "global_step": 132773, "epoch": 3161} {"train_loss": -6.571613311767578, "global_step": 132774, "epoch": 3161} {"train_loss": -6.773366928100586, "global_step": 132775, "epoch": 3161} {"train_loss": -6.868381500244141, "global_step": 132776, "epoch": 3161} {"train_loss": -6.705719947814941, "global_step": 132777, "epoch": 3161} {"train_loss": -6.714234352111816, "global_step": 132778, "epoch": 3161} {"train_loss": -6.650936126708984, "global_step": 132779, "epoch": 3161} {"train_loss": -6.713370323181152, "global_step": 132780, "epoch": 3161} {"train_loss": -6.545418739318848, "global_step": 132781, "epoch": 3161} {"train_loss": -6.675168037414551, "global_step": 132782, "epoch": 3161} {"train_loss": -6.658550262451172, "global_step": 132783, "epoch": 3161} {"train_loss": -6.730800628662109, "global_step": 132784, "epoch": 3161} {"train_loss": -6.599821090698242, "global_step": 132785, "epoch": 3161} {"train_loss": -6.69761323928833, "global_step": 132786, "epoch": 3161} {"train_loss": -6.666839599609375, "global_step": 132787, "epoch": 3161} {"train_loss": -6.690617561340332, "global_step": 132788, "epoch": 3161} {"train_loss": -6.644714832305908, "global_step": 132789, "epoch": 3161} {"train_loss": -6.495461463928223, "global_step": 132790, "epoch": 3161} {"train_loss": -6.560770511627197, "global_step": 132791, "epoch": 3161} {"train_loss": -6.669342994689941, "global_step": 132792, "epoch": 3161} {"train_loss": -6.621587753295898, "global_step": 132793, "epoch": 3161} {"train_loss": -6.636646270751953, "global_step": 132794, "epoch": 3161} {"train_loss": -6.612444877624512, "global_step": 132795, "epoch": 3161} {"train_loss": -6.75766134262085, "global_step": 132796, "epoch": 3161} {"train_loss": -6.525784492492676, "global_step": 132797, "epoch": 3161} {"train_loss": -6.575048446655273, "global_step": 132798, "epoch": 3161} {"train_loss": -6.655559062957764, "global_step": 132799, "epoch": 3161} {"train_loss": -6.634654521942139, "global_step": 132800, "epoch": 3161} {"train_loss": -6.582457542419434, "global_step": 132801, "epoch": 3161} {"train_loss": -6.503391742706299, "global_step": 132802, "epoch": 3161} {"train_loss": -6.644490855080741, "global_step": 132803, "epoch": 3161, "val_loss": 68353.2890625} {"train_loss": -6.410484313964844, "global_step": 132804, "epoch": 3162} {"train_loss": -6.546293258666992, "global_step": 132805, "epoch": 3162} {"train_loss": -6.583174705505371, "global_step": 132806, "epoch": 3162} {"train_loss": -6.486526966094971, "global_step": 132807, "epoch": 3162} {"train_loss": -6.546025276184082, "global_step": 132808, "epoch": 3162} {"train_loss": -6.477419853210449, "global_step": 132809, "epoch": 3162} {"train_loss": -6.592044830322266, "global_step": 132810, "epoch": 3162} {"train_loss": -6.383866310119629, "global_step": 132811, "epoch": 3162} {"train_loss": -6.603160858154297, "global_step": 132812, "epoch": 3162} {"train_loss": -6.559939861297607, "global_step": 132813, "epoch": 3162} {"train_loss": -6.543545722961426, "global_step": 132814, "epoch": 3162} {"train_loss": -6.424942970275879, "global_step": 132815, "epoch": 3162} {"train_loss": -6.712818622589111, "global_step": 132816, "epoch": 3162} {"train_loss": -6.533124923706055, "global_step": 132817, "epoch": 3162} {"train_loss": -6.451119422912598, "global_step": 132818, "epoch": 3162} {"train_loss": -6.647222995758057, "global_step": 132819, "epoch": 3162} {"train_loss": -6.513469696044922, "global_step": 132820, "epoch": 3162} {"train_loss": -6.501204490661621, "global_step": 132821, "epoch": 3162} {"train_loss": -6.503618240356445, "global_step": 132822, "epoch": 3162} {"train_loss": -6.571630001068115, "global_step": 132823, "epoch": 3162} {"train_loss": -6.472809791564941, "global_step": 132824, "epoch": 3162} {"train_loss": -6.6204609870910645, "global_step": 132825, "epoch": 3162} {"train_loss": -6.566451072692871, "global_step": 132826, "epoch": 3162} {"train_loss": -6.552255153656006, "global_step": 132827, "epoch": 3162} {"train_loss": -6.536741256713867, "global_step": 132828, "epoch": 3162} {"train_loss": -6.683661460876465, "global_step": 132829, "epoch": 3162} {"train_loss": -6.590653419494629, "global_step": 132830, "epoch": 3162} {"train_loss": -6.637223243713379, "global_step": 132831, "epoch": 3162} {"train_loss": -6.605706214904785, "global_step": 132832, "epoch": 3162} {"train_loss": -6.688225746154785, "global_step": 132833, "epoch": 3162} {"train_loss": -6.696468353271484, "global_step": 132834, "epoch": 3162} {"train_loss": -6.645783424377441, "global_step": 132835, "epoch": 3162} {"train_loss": -6.632074356079102, "global_step": 132836, "epoch": 3162} {"train_loss": -6.731203556060791, "global_step": 132837, "epoch": 3162} {"train_loss": -6.6070661544799805, "global_step": 132838, "epoch": 3162} {"train_loss": -6.690235614776611, "global_step": 132839, "epoch": 3162} {"train_loss": -6.640292167663574, "global_step": 132840, "epoch": 3162} {"train_loss": -6.685380935668945, "global_step": 132841, "epoch": 3162} {"train_loss": -6.826679229736328, "global_step": 132842, "epoch": 3162} {"train_loss": -6.6829047203063965, "global_step": 132843, "epoch": 3162} {"train_loss": -6.803001403808594, "global_step": 132844, "epoch": 3162} {"train_loss": -6.593705336252849, "global_step": 132845, "epoch": 3162, "val_loss": 68101.875} {"train_loss": -6.715460777282715, "global_step": 132846, "epoch": 3163} {"train_loss": -6.7635345458984375, "global_step": 132847, "epoch": 3163} {"train_loss": -6.697882652282715, "global_step": 132848, "epoch": 3163} {"train_loss": -6.667119026184082, "global_step": 132849, "epoch": 3163} {"train_loss": -6.6654205322265625, "global_step": 132850, "epoch": 3163} {"train_loss": -6.5760297775268555, "global_step": 132851, "epoch": 3163} {"train_loss": -6.813240051269531, "global_step": 132852, "epoch": 3163} {"train_loss": -6.72928524017334, "global_step": 132853, "epoch": 3163} {"train_loss": -6.7315263748168945, "global_step": 132854, "epoch": 3163} {"train_loss": -6.608276844024658, "global_step": 132855, "epoch": 3163} {"train_loss": -6.724542617797852, "global_step": 132856, "epoch": 3163} {"train_loss": -6.737168312072754, "global_step": 132857, "epoch": 3163} {"train_loss": -6.648894786834717, "global_step": 132858, "epoch": 3163} {"train_loss": -6.632613182067871, "global_step": 132859, "epoch": 3163} {"train_loss": -6.750938415527344, "global_step": 132860, "epoch": 3163} {"train_loss": -6.639162540435791, "global_step": 132861, "epoch": 3163} {"train_loss": -6.77603006362915, "global_step": 132862, "epoch": 3163} {"train_loss": -6.5172038078308105, "global_step": 132863, "epoch": 3163} {"train_loss": -6.603065490722656, "global_step": 132864, "epoch": 3163} {"train_loss": -6.583033561706543, "global_step": 132865, "epoch": 3163} {"train_loss": -6.584825038909912, "global_step": 132866, "epoch": 3163} {"train_loss": -6.690004348754883, "global_step": 132867, "epoch": 3163} {"train_loss": -6.673968315124512, "global_step": 132868, "epoch": 3163} {"train_loss": -6.634690284729004, "global_step": 132869, "epoch": 3163} {"train_loss": -6.728689670562744, "global_step": 132870, "epoch": 3163} {"train_loss": -6.76753044128418, "global_step": 132871, "epoch": 3163} {"train_loss": -6.698332786560059, "global_step": 132872, "epoch": 3163} {"train_loss": -6.811946868896484, "global_step": 132873, "epoch": 3163} {"train_loss": -6.745427131652832, "global_step": 132874, "epoch": 3163} {"train_loss": -6.6140947341918945, "global_step": 132875, "epoch": 3163} {"train_loss": -6.649354934692383, "global_step": 132876, "epoch": 3163} {"train_loss": -6.69449520111084, "global_step": 132877, "epoch": 3163} {"train_loss": -6.757743835449219, "global_step": 132878, "epoch": 3163} {"train_loss": -6.738218307495117, "global_step": 132879, "epoch": 3163} {"train_loss": -6.684477806091309, "global_step": 132880, "epoch": 3163} {"train_loss": -6.812198162078857, "global_step": 132881, "epoch": 3163} {"train_loss": -6.693140029907227, "global_step": 132882, "epoch": 3163} {"train_loss": -6.6935858726501465, "global_step": 132883, "epoch": 3163} {"train_loss": -6.676729679107666, "global_step": 132884, "epoch": 3163} {"train_loss": -6.7396955490112305, "global_step": 132885, "epoch": 3163} {"train_loss": -6.776595115661621, "global_step": 132886, "epoch": 3163} {"train_loss": -6.6906590688796275, "global_step": 132887, "epoch": 3163, "val_loss": 68280.125} {"train_loss": -6.737660884857178, "global_step": 132888, "epoch": 3164} {"train_loss": -6.652897834777832, "global_step": 132889, "epoch": 3164} {"train_loss": -6.73232364654541, "global_step": 132890, "epoch": 3164} {"train_loss": -6.787316799163818, "global_step": 132891, "epoch": 3164} {"train_loss": -6.772759437561035, "global_step": 132892, "epoch": 3164} {"train_loss": -6.712920665740967, "global_step": 132893, "epoch": 3164} {"train_loss": -6.634065628051758, "global_step": 132894, "epoch": 3164} {"train_loss": -6.685296058654785, "global_step": 132895, "epoch": 3164} {"train_loss": -6.70603084564209, "global_step": 132896, "epoch": 3164} {"train_loss": -6.6882853507995605, "global_step": 132897, "epoch": 3164} {"train_loss": -6.536397933959961, "global_step": 132898, "epoch": 3164} {"train_loss": -6.483945846557617, "global_step": 132899, "epoch": 3164} {"train_loss": -6.757546901702881, "global_step": 132900, "epoch": 3164} {"train_loss": -6.611937999725342, "global_step": 132901, "epoch": 3164} {"train_loss": -6.642326354980469, "global_step": 132902, "epoch": 3164} {"train_loss": -6.596020698547363, "global_step": 132903, "epoch": 3164} {"train_loss": -6.642956733703613, "global_step": 132904, "epoch": 3164} {"train_loss": -6.569388389587402, "global_step": 132905, "epoch": 3164} {"train_loss": -6.672144889831543, "global_step": 132906, "epoch": 3164} {"train_loss": -6.676800727844238, "global_step": 132907, "epoch": 3164} {"train_loss": -6.624022960662842, "global_step": 132908, "epoch": 3164} {"train_loss": -6.606035232543945, "global_step": 132909, "epoch": 3164} {"train_loss": -6.550833225250244, "global_step": 132910, "epoch": 3164} {"train_loss": -6.6679840087890625, "global_step": 132911, "epoch": 3164} {"train_loss": -6.679338455200195, "global_step": 132912, "epoch": 3164} {"train_loss": -6.676309585571289, "global_step": 132913, "epoch": 3164} {"train_loss": -6.573163986206055, "global_step": 132914, "epoch": 3164} {"train_loss": -6.546353340148926, "global_step": 132915, "epoch": 3164} {"train_loss": -6.532754898071289, "global_step": 132916, "epoch": 3164} {"train_loss": -6.705687522888184, "global_step": 132917, "epoch": 3164} {"train_loss": -6.670543670654297, "global_step": 132918, "epoch": 3164} {"train_loss": -6.699018478393555, "global_step": 132919, "epoch": 3164} {"train_loss": -6.723503112792969, "global_step": 132920, "epoch": 3164} {"train_loss": -6.632328987121582, "global_step": 132921, "epoch": 3164} {"train_loss": -6.695145606994629, "global_step": 132922, "epoch": 3164} {"train_loss": -6.70345401763916, "global_step": 132923, "epoch": 3164} {"train_loss": -6.70304012298584, "global_step": 132924, "epoch": 3164} {"train_loss": -6.702238082885742, "global_step": 132925, "epoch": 3164} {"train_loss": -6.734878063201904, "global_step": 132926, "epoch": 3164} {"train_loss": -6.659870624542236, "global_step": 132927, "epoch": 3164} {"train_loss": -6.693137168884277, "global_step": 132928, "epoch": 3164} {"train_loss": -6.6632566679091685, "global_step": 132929, "epoch": 3164, "val_loss": 68152.109375} {"train_loss": -6.613915920257568, "global_step": 132930, "epoch": 3165} {"train_loss": -6.792912483215332, "global_step": 132931, "epoch": 3165} {"train_loss": -6.641547679901123, "global_step": 132932, "epoch": 3165} {"train_loss": -6.780159950256348, "global_step": 132933, "epoch": 3165} {"train_loss": -6.795511722564697, "global_step": 132934, "epoch": 3165} {"train_loss": -6.750025749206543, "global_step": 132935, "epoch": 3165} {"train_loss": -6.724093437194824, "global_step": 132936, "epoch": 3165} {"train_loss": -6.613338470458984, "global_step": 132937, "epoch": 3165} {"train_loss": -6.560031890869141, "global_step": 132938, "epoch": 3165} {"train_loss": -6.675505638122559, "global_step": 132939, "epoch": 3165} {"train_loss": -6.612748146057129, "global_step": 132940, "epoch": 3165} {"train_loss": -6.687695503234863, "global_step": 132941, "epoch": 3165} {"train_loss": -6.665651321411133, "global_step": 132942, "epoch": 3165} {"train_loss": -6.515657424926758, "global_step": 132943, "epoch": 3165} {"train_loss": -6.578533172607422, "global_step": 132944, "epoch": 3165} {"train_loss": -6.634943008422852, "global_step": 132945, "epoch": 3165} {"train_loss": -6.634500026702881, "global_step": 132946, "epoch": 3165} {"train_loss": -6.608145713806152, "global_step": 132947, "epoch": 3165} {"train_loss": -6.60623836517334, "global_step": 132948, "epoch": 3165} {"train_loss": -6.557305335998535, "global_step": 132949, "epoch": 3165} {"train_loss": -6.524589538574219, "global_step": 132950, "epoch": 3165} {"train_loss": -6.512856483459473, "global_step": 132951, "epoch": 3165} {"train_loss": -6.607944011688232, "global_step": 132952, "epoch": 3165} {"train_loss": -6.641563415527344, "global_step": 132953, "epoch": 3165} {"train_loss": -6.602740287780762, "global_step": 132954, "epoch": 3165} {"train_loss": -6.664584636688232, "global_step": 132955, "epoch": 3165} {"train_loss": -6.636078834533691, "global_step": 132956, "epoch": 3165} {"train_loss": -6.526162147521973, "global_step": 132957, "epoch": 3165} {"train_loss": -6.622062683105469, "global_step": 132958, "epoch": 3165} {"train_loss": -6.571540832519531, "global_step": 132959, "epoch": 3165} {"train_loss": -6.739314079284668, "global_step": 132960, "epoch": 3165} {"train_loss": -6.6128034591674805, "global_step": 132961, "epoch": 3165} {"train_loss": -6.6377458572387695, "global_step": 132962, "epoch": 3165} {"train_loss": -6.637221336364746, "global_step": 132963, "epoch": 3165} {"train_loss": -6.667449951171875, "global_step": 132964, "epoch": 3165} {"train_loss": -6.676766872406006, "global_step": 132965, "epoch": 3165} {"train_loss": -6.487004280090332, "global_step": 132966, "epoch": 3165} {"train_loss": -6.686923980712891, "global_step": 132967, "epoch": 3165} {"train_loss": -6.684171676635742, "global_step": 132968, "epoch": 3165} {"train_loss": -6.674272537231445, "global_step": 132969, "epoch": 3165} {"train_loss": -6.658053398132324, "global_step": 132970, "epoch": 3165} {"train_loss": -6.635201624461582, "global_step": 132971, "epoch": 3165, "val_loss": 68408.921875} {"train_loss": -6.674880027770996, "global_step": 132972, "epoch": 3166} {"train_loss": -6.6925811767578125, "global_step": 132973, "epoch": 3166} {"train_loss": -6.582268714904785, "global_step": 132974, "epoch": 3166} {"train_loss": -6.577938556671143, "global_step": 132975, "epoch": 3166} {"train_loss": -6.676418781280518, "global_step": 132976, "epoch": 3166} {"train_loss": -6.5496416091918945, "global_step": 132977, "epoch": 3166} {"train_loss": -6.729030132293701, "global_step": 132978, "epoch": 3166} {"train_loss": -6.489646911621094, "global_step": 132979, "epoch": 3166} {"train_loss": -6.494561195373535, "global_step": 132980, "epoch": 3166} {"train_loss": -6.480295181274414, "global_step": 132981, "epoch": 3166} {"train_loss": -6.714061260223389, "global_step": 132982, "epoch": 3166} {"train_loss": -6.614956855773926, "global_step": 132983, "epoch": 3166} {"train_loss": -6.625370025634766, "global_step": 132984, "epoch": 3166} {"train_loss": -6.509054183959961, "global_step": 132985, "epoch": 3166} {"train_loss": -6.658072471618652, "global_step": 132986, "epoch": 3166} {"train_loss": -6.708530426025391, "global_step": 132987, "epoch": 3166} {"train_loss": -6.717252254486084, "global_step": 132988, "epoch": 3166} {"train_loss": -6.629765033721924, "global_step": 132989, "epoch": 3166} {"train_loss": -6.668583869934082, "global_step": 132990, "epoch": 3166} {"train_loss": -6.621763229370117, "global_step": 132991, "epoch": 3166} {"train_loss": -6.61517333984375, "global_step": 132992, "epoch": 3166} {"train_loss": -6.598235607147217, "global_step": 132993, "epoch": 3166} {"train_loss": -6.547187328338623, "global_step": 132994, "epoch": 3166} {"train_loss": -6.781782150268555, "global_step": 132995, "epoch": 3166} {"train_loss": -6.6041669845581055, "global_step": 132996, "epoch": 3166} {"train_loss": -6.724216461181641, "global_step": 132997, "epoch": 3166} {"train_loss": -6.644743919372559, "global_step": 132998, "epoch": 3166} {"train_loss": -6.785550594329834, "global_step": 132999, "epoch": 3166} {"train_loss": -6.765513896942139, "global_step": 133000, "epoch": 3166} {"train_loss": -6.566875457763672, "global_step": 133001, "epoch": 3166} {"train_loss": -6.672737121582031, "global_step": 133002, "epoch": 3166} {"train_loss": -6.750293731689453, "global_step": 133003, "epoch": 3166} {"train_loss": -6.643460273742676, "global_step": 133004, "epoch": 3166} {"train_loss": -6.659067153930664, "global_step": 133005, "epoch": 3166} {"train_loss": -6.7088823318481445, "global_step": 133006, "epoch": 3166} {"train_loss": -6.714018821716309, "global_step": 133007, "epoch": 3166} {"train_loss": -6.7376275062561035, "global_step": 133008, "epoch": 3166} {"train_loss": -6.632129669189453, "global_step": 133009, "epoch": 3166} {"train_loss": -6.679832458496094, "global_step": 133010, "epoch": 3166} {"train_loss": -6.589740753173828, "global_step": 133011, "epoch": 3166} {"train_loss": -6.719793319702148, "global_step": 133012, "epoch": 3166} {"train_loss": -6.647016968045916, "global_step": 133013, "epoch": 3166, "val_loss": 68176.609375} {"train_loss": -6.6645073890686035, "global_step": 133014, "epoch": 3167} {"train_loss": -6.77113676071167, "global_step": 133015, "epoch": 3167} {"train_loss": -6.667287826538086, "global_step": 133016, "epoch": 3167} {"train_loss": -6.6653900146484375, "global_step": 133017, "epoch": 3167} {"train_loss": -6.7637505531311035, "global_step": 133018, "epoch": 3167} {"train_loss": -6.765018463134766, "global_step": 133019, "epoch": 3167} {"train_loss": -6.725752830505371, "global_step": 133020, "epoch": 3167} {"train_loss": -6.653049468994141, "global_step": 133021, "epoch": 3167} {"train_loss": -6.67500114440918, "global_step": 133022, "epoch": 3167} {"train_loss": -6.678094863891602, "global_step": 133023, "epoch": 3167} {"train_loss": -6.63820743560791, "global_step": 133024, "epoch": 3167} {"train_loss": -6.608991622924805, "global_step": 133025, "epoch": 3167} {"train_loss": -6.683411598205566, "global_step": 133026, "epoch": 3167} {"train_loss": -6.701123237609863, "global_step": 133027, "epoch": 3167} {"train_loss": -6.664874076843262, "global_step": 133028, "epoch": 3167} {"train_loss": -6.60524320602417, "global_step": 133029, "epoch": 3167} {"train_loss": -6.799044609069824, "global_step": 133030, "epoch": 3167} {"train_loss": -6.720598220825195, "global_step": 133031, "epoch": 3167} {"train_loss": -6.593523025512695, "global_step": 133032, "epoch": 3167} {"train_loss": -6.760366916656494, "global_step": 133033, "epoch": 3167} {"train_loss": -6.470696449279785, "global_step": 133034, "epoch": 3167} {"train_loss": -6.625009536743164, "global_step": 133035, "epoch": 3167} {"train_loss": -6.671051025390625, "global_step": 133036, "epoch": 3167} {"train_loss": -6.354427814483643, "global_step": 133037, "epoch": 3167} {"train_loss": -6.6390461921691895, "global_step": 133038, "epoch": 3167} {"train_loss": -6.523860931396484, "global_step": 133039, "epoch": 3167} {"train_loss": -6.572794437408447, "global_step": 133040, "epoch": 3167} {"train_loss": -6.658560752868652, "global_step": 133041, "epoch": 3167} {"train_loss": -6.456366539001465, "global_step": 133042, "epoch": 3167} {"train_loss": -6.537448883056641, "global_step": 133043, "epoch": 3167} {"train_loss": -6.502767562866211, "global_step": 133044, "epoch": 3167} {"train_loss": -6.482154846191406, "global_step": 133045, "epoch": 3167} {"train_loss": -6.5242156982421875, "global_step": 133046, "epoch": 3167} {"train_loss": -6.604890823364258, "global_step": 133047, "epoch": 3167} {"train_loss": -6.478545665740967, "global_step": 133048, "epoch": 3167} {"train_loss": -6.71159553527832, "global_step": 133049, "epoch": 3167} {"train_loss": -6.645755767822266, "global_step": 133050, "epoch": 3167} {"train_loss": -6.544027805328369, "global_step": 133051, "epoch": 3167} {"train_loss": -6.643301010131836, "global_step": 133052, "epoch": 3167} {"train_loss": -6.628074645996094, "global_step": 133053, "epoch": 3167} {"train_loss": -6.647270679473877, "global_step": 133054, "epoch": 3167} {"train_loss": -6.6253208092280795, "global_step": 133055, "epoch": 3167, "val_loss": 68049.28125} {"train_loss": -6.619551658630371, "global_step": 133056, "epoch": 3168} {"train_loss": -6.638773441314697, "global_step": 133057, "epoch": 3168} {"train_loss": -6.556457996368408, "global_step": 133058, "epoch": 3168} {"train_loss": -6.584701061248779, "global_step": 133059, "epoch": 3168} {"train_loss": -6.51265811920166, "global_step": 133060, "epoch": 3168} {"train_loss": -6.627101898193359, "global_step": 133061, "epoch": 3168} {"train_loss": -6.542538642883301, "global_step": 133062, "epoch": 3168} {"train_loss": -6.73630428314209, "global_step": 133063, "epoch": 3168} {"train_loss": -6.520146369934082, "global_step": 133064, "epoch": 3168} {"train_loss": -6.662210464477539, "global_step": 133065, "epoch": 3168} {"train_loss": -6.6959004402160645, "global_step": 133066, "epoch": 3168} {"train_loss": -6.756620407104492, "global_step": 133067, "epoch": 3168} {"train_loss": -6.702689170837402, "global_step": 133068, "epoch": 3168} {"train_loss": -6.631659984588623, "global_step": 133069, "epoch": 3168} {"train_loss": -6.647727966308594, "global_step": 133070, "epoch": 3168} {"train_loss": -6.623581886291504, "global_step": 133071, "epoch": 3168} {"train_loss": -6.633847236633301, "global_step": 133072, "epoch": 3168} {"train_loss": -6.692053318023682, "global_step": 133073, "epoch": 3168} {"train_loss": -6.690775394439697, "global_step": 133074, "epoch": 3168} {"train_loss": -6.751190185546875, "global_step": 133075, "epoch": 3168} {"train_loss": -6.7304582595825195, "global_step": 133076, "epoch": 3168} {"train_loss": -6.711372375488281, "global_step": 133077, "epoch": 3168} {"train_loss": -6.7919511795043945, "global_step": 133078, "epoch": 3168} {"train_loss": -6.703729152679443, "global_step": 133079, "epoch": 3168} {"train_loss": -6.6555256843566895, "global_step": 133080, "epoch": 3168} {"train_loss": -6.729267120361328, "global_step": 133081, "epoch": 3168} {"train_loss": -6.6560139656066895, "global_step": 133082, "epoch": 3168} {"train_loss": -6.611197471618652, "global_step": 133083, "epoch": 3168} {"train_loss": -6.7759013175964355, "global_step": 133084, "epoch": 3168} {"train_loss": -6.745154857635498, "global_step": 133085, "epoch": 3168} {"train_loss": -6.631058692932129, "global_step": 133086, "epoch": 3168} {"train_loss": -6.681580066680908, "global_step": 133087, "epoch": 3168} {"train_loss": -6.714931488037109, "global_step": 133088, "epoch": 3168} {"train_loss": -6.694750785827637, "global_step": 133089, "epoch": 3168} {"train_loss": -6.713475704193115, "global_step": 133090, "epoch": 3168} {"train_loss": -6.680185317993164, "global_step": 133091, "epoch": 3168} {"train_loss": -6.709282875061035, "global_step": 133092, "epoch": 3168} {"train_loss": -6.746940612792969, "global_step": 133093, "epoch": 3168} {"train_loss": -6.686945915222168, "global_step": 133094, "epoch": 3168} {"train_loss": -6.675106525421143, "global_step": 133095, "epoch": 3168} {"train_loss": -6.679984092712402, "global_step": 133096, "epoch": 3168} {"train_loss": -6.6750956035795665, "global_step": 133097, "epoch": 3168, "val_loss": 68326.84375} {"train_loss": -6.783731937408447, "global_step": 133098, "epoch": 3169} {"train_loss": -6.776834011077881, "global_step": 133099, "epoch": 3169} {"train_loss": -6.713354110717773, "global_step": 133100, "epoch": 3169} {"train_loss": -6.626607418060303, "global_step": 133101, "epoch": 3169} {"train_loss": -6.7380475997924805, "global_step": 133102, "epoch": 3169} {"train_loss": -6.653642654418945, "global_step": 133103, "epoch": 3169} {"train_loss": -6.5808515548706055, "global_step": 133104, "epoch": 3169} {"train_loss": -6.54386568069458, "global_step": 133105, "epoch": 3169} {"train_loss": -6.6245527267456055, "global_step": 133106, "epoch": 3169} {"train_loss": -6.543910980224609, "global_step": 133107, "epoch": 3169} {"train_loss": -6.48279333114624, "global_step": 133108, "epoch": 3169} {"train_loss": -6.722080230712891, "global_step": 133109, "epoch": 3169} {"train_loss": -6.518028259277344, "global_step": 133110, "epoch": 3169} {"train_loss": -6.584689140319824, "global_step": 133111, "epoch": 3169} {"train_loss": -6.606260299682617, "global_step": 133112, "epoch": 3169} {"train_loss": -6.535018444061279, "global_step": 133113, "epoch": 3169} {"train_loss": -6.712764263153076, "global_step": 133114, "epoch": 3169} {"train_loss": -6.563259601593018, "global_step": 133115, "epoch": 3169} {"train_loss": -6.627470016479492, "global_step": 133116, "epoch": 3169} {"train_loss": -6.611367225646973, "global_step": 133117, "epoch": 3169} {"train_loss": -6.602571487426758, "global_step": 133118, "epoch": 3169} {"train_loss": -6.547497272491455, "global_step": 133119, "epoch": 3169} {"train_loss": -6.419256210327148, "global_step": 133120, "epoch": 3169} {"train_loss": -6.603740692138672, "global_step": 133121, "epoch": 3169} {"train_loss": -6.572528839111328, "global_step": 133122, "epoch": 3169} {"train_loss": -6.604068756103516, "global_step": 133123, "epoch": 3169} {"train_loss": -6.397787570953369, "global_step": 133124, "epoch": 3169} {"train_loss": -6.5344038009643555, "global_step": 133125, "epoch": 3169} {"train_loss": -6.588447093963623, "global_step": 133126, "epoch": 3169} {"train_loss": -6.4751787185668945, "global_step": 133127, "epoch": 3169} {"train_loss": -6.631167888641357, "global_step": 133128, "epoch": 3169} {"train_loss": -6.572362422943115, "global_step": 133129, "epoch": 3169} {"train_loss": -6.541678428649902, "global_step": 133130, "epoch": 3169} {"train_loss": -6.548201560974121, "global_step": 133131, "epoch": 3169} {"train_loss": -6.5848565101623535, "global_step": 133132, "epoch": 3169} {"train_loss": -6.632350921630859, "global_step": 133133, "epoch": 3169} {"train_loss": -6.637572765350342, "global_step": 133134, "epoch": 3169} {"train_loss": -6.628478050231934, "global_step": 133135, "epoch": 3169} {"train_loss": -6.553951263427734, "global_step": 133136, "epoch": 3169} {"train_loss": -6.643996715545654, "global_step": 133137, "epoch": 3169} {"train_loss": -6.61679744720459, "global_step": 133138, "epoch": 3169} {"train_loss": -6.600590172268095, "global_step": 133139, "epoch": 3169, "val_loss": 68306.46875} {"train_loss": -6.723119735717773, "global_step": 133140, "epoch": 3170} {"train_loss": -6.682519435882568, "global_step": 133141, "epoch": 3170} {"train_loss": -6.700055122375488, "global_step": 133142, "epoch": 3170} {"train_loss": -6.538854122161865, "global_step": 133143, "epoch": 3170} {"train_loss": -6.696268081665039, "global_step": 133144, "epoch": 3170} {"train_loss": -6.585381031036377, "global_step": 133145, "epoch": 3170} {"train_loss": -6.636638641357422, "global_step": 133146, "epoch": 3170} {"train_loss": -6.686583518981934, "global_step": 133147, "epoch": 3170} {"train_loss": -6.579816818237305, "global_step": 133148, "epoch": 3170} {"train_loss": -6.6400146484375, "global_step": 133149, "epoch": 3170} {"train_loss": -6.690530776977539, "global_step": 133150, "epoch": 3170} {"train_loss": -6.657712936401367, "global_step": 133151, "epoch": 3170} {"train_loss": -6.689999580383301, "global_step": 133152, "epoch": 3170} {"train_loss": -6.662115097045898, "global_step": 133153, "epoch": 3170} {"train_loss": -6.768713474273682, "global_step": 133154, "epoch": 3170} {"train_loss": -6.783015251159668, "global_step": 133155, "epoch": 3170} {"train_loss": -6.704324245452881, "global_step": 133156, "epoch": 3170} {"train_loss": -6.743752956390381, "global_step": 133157, "epoch": 3170} {"train_loss": -6.649304389953613, "global_step": 133158, "epoch": 3170} {"train_loss": -6.538699150085449, "global_step": 133159, "epoch": 3170} {"train_loss": -6.64249324798584, "global_step": 133160, "epoch": 3170} {"train_loss": -6.6313371658325195, "global_step": 133161, "epoch": 3170} {"train_loss": -6.6353535652160645, "global_step": 133162, "epoch": 3170} {"train_loss": -6.736188888549805, "global_step": 133163, "epoch": 3170} {"train_loss": -6.732353210449219, "global_step": 133164, "epoch": 3170} {"train_loss": -6.701143264770508, "global_step": 133165, "epoch": 3170} {"train_loss": -6.671027183532715, "global_step": 133166, "epoch": 3170} {"train_loss": -6.779813766479492, "global_step": 133167, "epoch": 3170} {"train_loss": -6.681723594665527, "global_step": 133168, "epoch": 3170} {"train_loss": -6.755674362182617, "global_step": 133169, "epoch": 3170} {"train_loss": -6.729057312011719, "global_step": 133170, "epoch": 3170} {"train_loss": -6.633113861083984, "global_step": 133171, "epoch": 3170} {"train_loss": -6.675553798675537, "global_step": 133172, "epoch": 3170} {"train_loss": -6.655274868011475, "global_step": 133173, "epoch": 3170} {"train_loss": -6.809682369232178, "global_step": 133174, "epoch": 3170} {"train_loss": -6.77186393737793, "global_step": 133175, "epoch": 3170} {"train_loss": -6.668299674987793, "global_step": 133176, "epoch": 3170} {"train_loss": -6.632207870483398, "global_step": 133177, "epoch": 3170} {"train_loss": -6.780857563018799, "global_step": 133178, "epoch": 3170} {"train_loss": -6.533171653747559, "global_step": 133179, "epoch": 3170} {"train_loss": -6.553780555725098, "global_step": 133180, "epoch": 3170} {"train_loss": -6.679061424164545, "global_step": 133181, "epoch": 3170, "val_loss": 68177.734375} {"train_loss": -6.8042426109313965, "global_step": 133182, "epoch": 3171} {"train_loss": -6.659825801849365, "global_step": 133183, "epoch": 3171} {"train_loss": -6.663251876831055, "global_step": 133184, "epoch": 3171} {"train_loss": -6.761295795440674, "global_step": 133185, "epoch": 3171} {"train_loss": -6.573897361755371, "global_step": 133186, "epoch": 3171} {"train_loss": -6.754611492156982, "global_step": 133187, "epoch": 3171} {"train_loss": -6.699335098266602, "global_step": 133188, "epoch": 3171} {"train_loss": -6.707050323486328, "global_step": 133189, "epoch": 3171} {"train_loss": -6.803421974182129, "global_step": 133190, "epoch": 3171} {"train_loss": -6.725910663604736, "global_step": 133191, "epoch": 3171} {"train_loss": -6.743956565856934, "global_step": 133192, "epoch": 3171} {"train_loss": -6.640296459197998, "global_step": 133193, "epoch": 3171} {"train_loss": -6.7474236488342285, "global_step": 133194, "epoch": 3171} {"train_loss": -6.724693298339844, "global_step": 133195, "epoch": 3171} {"train_loss": -6.619977951049805, "global_step": 133196, "epoch": 3171} {"train_loss": -6.741764068603516, "global_step": 133197, "epoch": 3171} {"train_loss": -6.656523704528809, "global_step": 133198, "epoch": 3171} {"train_loss": -6.611590385437012, "global_step": 133199, "epoch": 3171} {"train_loss": -6.663947105407715, "global_step": 133200, "epoch": 3171} {"train_loss": -6.629001140594482, "global_step": 133201, "epoch": 3171} {"train_loss": -6.660196781158447, "global_step": 133202, "epoch": 3171} {"train_loss": -6.686000823974609, "global_step": 133203, "epoch": 3171} {"train_loss": -6.7380290031433105, "global_step": 133204, "epoch": 3171} {"train_loss": -6.715219497680664, "global_step": 133205, "epoch": 3171} {"train_loss": -6.63973331451416, "global_step": 133206, "epoch": 3171} {"train_loss": -6.674513339996338, "global_step": 133207, "epoch": 3171} {"train_loss": -6.735259056091309, "global_step": 133208, "epoch": 3171} {"train_loss": -6.745611190795898, "global_step": 133209, "epoch": 3171} {"train_loss": -6.6990251541137695, "global_step": 133210, "epoch": 3171} {"train_loss": -6.631494522094727, "global_step": 133211, "epoch": 3171} {"train_loss": -6.647796630859375, "global_step": 133212, "epoch": 3171} {"train_loss": -6.594771385192871, "global_step": 133213, "epoch": 3171} {"train_loss": -6.798776626586914, "global_step": 133214, "epoch": 3171} {"train_loss": -6.5458083152771, "global_step": 133215, "epoch": 3171} {"train_loss": -6.674313068389893, "global_step": 133216, "epoch": 3171} {"train_loss": -6.572449684143066, "global_step": 133217, "epoch": 3171} {"train_loss": -6.63328218460083, "global_step": 133218, "epoch": 3171} {"train_loss": -6.664549827575684, "global_step": 133219, "epoch": 3171} {"train_loss": -6.6710405349731445, "global_step": 133220, "epoch": 3171} {"train_loss": -6.724283218383789, "global_step": 133221, "epoch": 3171} {"train_loss": -6.6789870262146, "global_step": 133222, "epoch": 3171} {"train_loss": -6.68408066885812, "global_step": 133223, "epoch": 3171, "val_loss": 68135.984375} {"train_loss": -6.706137657165527, "global_step": 133224, "epoch": 3172} {"train_loss": -6.601733207702637, "global_step": 133225, "epoch": 3172} {"train_loss": -6.685433864593506, "global_step": 133226, "epoch": 3172} {"train_loss": -6.72647762298584, "global_step": 133227, "epoch": 3172} {"train_loss": -6.778202056884766, "global_step": 133228, "epoch": 3172} {"train_loss": -6.735941410064697, "global_step": 133229, "epoch": 3172} {"train_loss": -6.722770690917969, "global_step": 133230, "epoch": 3172} {"train_loss": -6.659850120544434, "global_step": 133231, "epoch": 3172} {"train_loss": -6.728693962097168, "global_step": 133232, "epoch": 3172} {"train_loss": -6.684330940246582, "global_step": 133233, "epoch": 3172} {"train_loss": -6.675680160522461, "global_step": 133234, "epoch": 3172} {"train_loss": -6.627096176147461, "global_step": 133235, "epoch": 3172} {"train_loss": -6.725355625152588, "global_step": 133236, "epoch": 3172} {"train_loss": -6.779288291931152, "global_step": 133237, "epoch": 3172} {"train_loss": -6.536065101623535, "global_step": 133238, "epoch": 3172} {"train_loss": -6.631566047668457, "global_step": 133239, "epoch": 3172} {"train_loss": -6.72789192199707, "global_step": 133240, "epoch": 3172} {"train_loss": -6.777935981750488, "global_step": 133241, "epoch": 3172} {"train_loss": -6.690608978271484, "global_step": 133242, "epoch": 3172} {"train_loss": -6.705816745758057, "global_step": 133243, "epoch": 3172} {"train_loss": -6.71951961517334, "global_step": 133244, "epoch": 3172} {"train_loss": -6.696062088012695, "global_step": 133245, "epoch": 3172} {"train_loss": -6.814895153045654, "global_step": 133246, "epoch": 3172} {"train_loss": -6.771726131439209, "global_step": 133247, "epoch": 3172} {"train_loss": -6.71495246887207, "global_step": 133248, "epoch": 3172} {"train_loss": -6.640865325927734, "global_step": 133249, "epoch": 3172} {"train_loss": -6.653456687927246, "global_step": 133250, "epoch": 3172} {"train_loss": -6.646539688110352, "global_step": 133251, "epoch": 3172} {"train_loss": -6.69891357421875, "global_step": 133252, "epoch": 3172} {"train_loss": -6.6339311599731445, "global_step": 133253, "epoch": 3172} {"train_loss": -6.7601470947265625, "global_step": 133254, "epoch": 3172} {"train_loss": -6.70128059387207, "global_step": 133255, "epoch": 3172} {"train_loss": -6.58517599105835, "global_step": 133256, "epoch": 3172} {"train_loss": -6.759633541107178, "global_step": 133257, "epoch": 3172} {"train_loss": -6.630116939544678, "global_step": 133258, "epoch": 3172} {"train_loss": -6.638140678405762, "global_step": 133259, "epoch": 3172} {"train_loss": -6.614727973937988, "global_step": 133260, "epoch": 3172} {"train_loss": -6.674312591552734, "global_step": 133261, "epoch": 3172} {"train_loss": -6.754157066345215, "global_step": 133262, "epoch": 3172} {"train_loss": -6.605762958526611, "global_step": 133263, "epoch": 3172} {"train_loss": -6.68599796295166, "global_step": 133264, "epoch": 3172} {"train_loss": -6.6911321594601585, "global_step": 133265, "epoch": 3172, "val_loss": 68297.6640625} {"train_loss": -6.85297966003418, "global_step": 133266, "epoch": 3173} {"train_loss": -6.635408401489258, "global_step": 133267, "epoch": 3173} {"train_loss": -6.669732093811035, "global_step": 133268, "epoch": 3173} {"train_loss": -6.749600887298584, "global_step": 133269, "epoch": 3173} {"train_loss": -6.653853416442871, "global_step": 133270, "epoch": 3173} {"train_loss": -6.7300004959106445, "global_step": 133271, "epoch": 3173} {"train_loss": -6.6952714920043945, "global_step": 133272, "epoch": 3173} {"train_loss": -6.74031925201416, "global_step": 133273, "epoch": 3173} {"train_loss": -6.658243179321289, "global_step": 133274, "epoch": 3173} {"train_loss": -6.744138717651367, "global_step": 133275, "epoch": 3173} {"train_loss": -6.695793628692627, "global_step": 133276, "epoch": 3173} {"train_loss": -6.595762252807617, "global_step": 133277, "epoch": 3173} {"train_loss": -6.683105945587158, "global_step": 133278, "epoch": 3173} {"train_loss": -6.630762100219727, "global_step": 133279, "epoch": 3173} {"train_loss": -6.561819553375244, "global_step": 133280, "epoch": 3173} {"train_loss": -6.700678825378418, "global_step": 133281, "epoch": 3173} {"train_loss": -6.6935577392578125, "global_step": 133282, "epoch": 3173} {"train_loss": -6.631877422332764, "global_step": 133283, "epoch": 3173} {"train_loss": -6.78355598449707, "global_step": 133284, "epoch": 3173} {"train_loss": -6.683505058288574, "global_step": 133285, "epoch": 3173} {"train_loss": -6.629188537597656, "global_step": 133286, "epoch": 3173} {"train_loss": -6.649519920349121, "global_step": 133287, "epoch": 3173} {"train_loss": -6.718784809112549, "global_step": 133288, "epoch": 3173} {"train_loss": -6.639655590057373, "global_step": 133289, "epoch": 3173} {"train_loss": -6.676243782043457, "global_step": 133290, "epoch": 3173} {"train_loss": -6.608440399169922, "global_step": 133291, "epoch": 3173} {"train_loss": -6.630515098571777, "global_step": 133292, "epoch": 3173} {"train_loss": -6.720427513122559, "global_step": 133293, "epoch": 3173} {"train_loss": -6.650678634643555, "global_step": 133294, "epoch": 3173} {"train_loss": -6.515664100646973, "global_step": 133295, "epoch": 3173} {"train_loss": -6.724571704864502, "global_step": 133296, "epoch": 3173} {"train_loss": -6.557628631591797, "global_step": 133297, "epoch": 3173} {"train_loss": -6.65115213394165, "global_step": 133298, "epoch": 3173} {"train_loss": -6.605038642883301, "global_step": 133299, "epoch": 3173} {"train_loss": -6.544699668884277, "global_step": 133300, "epoch": 3173} {"train_loss": -6.600213050842285, "global_step": 133301, "epoch": 3173} {"train_loss": -6.734295845031738, "global_step": 133302, "epoch": 3173} {"train_loss": -6.606222152709961, "global_step": 133303, "epoch": 3173} {"train_loss": -6.547990322113037, "global_step": 133304, "epoch": 3173} {"train_loss": -6.740424633026123, "global_step": 133305, "epoch": 3173} {"train_loss": -6.715710163116455, "global_step": 133306, "epoch": 3173} {"train_loss": -6.663428181693668, "global_step": 133307, "epoch": 3173, "val_loss": 68065.0078125} {"train_loss": -6.656060218811035, "global_step": 133308, "epoch": 3174} {"train_loss": -6.732378959655762, "global_step": 133309, "epoch": 3174} {"train_loss": -6.53565788269043, "global_step": 133310, "epoch": 3174} {"train_loss": -6.729397296905518, "global_step": 133311, "epoch": 3174} {"train_loss": -6.737125396728516, "global_step": 133312, "epoch": 3174} {"train_loss": -6.709867477416992, "global_step": 133313, "epoch": 3174} {"train_loss": -6.718716621398926, "global_step": 133314, "epoch": 3174} {"train_loss": -6.871626853942871, "global_step": 133315, "epoch": 3174} {"train_loss": -6.647995948791504, "global_step": 133316, "epoch": 3174} {"train_loss": -6.642900466918945, "global_step": 133317, "epoch": 3174} {"train_loss": -6.704972743988037, "global_step": 133318, "epoch": 3174} {"train_loss": -6.719697952270508, "global_step": 133319, "epoch": 3174} {"train_loss": -6.614691257476807, "global_step": 133320, "epoch": 3174} {"train_loss": -6.748036861419678, "global_step": 133321, "epoch": 3174} {"train_loss": -6.656437873840332, "global_step": 133322, "epoch": 3174} {"train_loss": -6.646274089813232, "global_step": 133323, "epoch": 3174} {"train_loss": -6.664493083953857, "global_step": 133324, "epoch": 3174} {"train_loss": -6.61673641204834, "global_step": 133325, "epoch": 3174} {"train_loss": -6.687232971191406, "global_step": 133326, "epoch": 3174} {"train_loss": -6.8373918533325195, "global_step": 133327, "epoch": 3174} {"train_loss": -6.739640235900879, "global_step": 133328, "epoch": 3174} {"train_loss": -6.681489944458008, "global_step": 133329, "epoch": 3174} {"train_loss": -6.758640289306641, "global_step": 133330, "epoch": 3174} {"train_loss": -6.75675106048584, "global_step": 133331, "epoch": 3174} {"train_loss": -6.653804779052734, "global_step": 133332, "epoch": 3174} {"train_loss": -6.732048988342285, "global_step": 133333, "epoch": 3174} {"train_loss": -6.679298400878906, "global_step": 133334, "epoch": 3174} {"train_loss": -6.769864082336426, "global_step": 133335, "epoch": 3174} {"train_loss": -6.705455780029297, "global_step": 133336, "epoch": 3174} {"train_loss": -6.635125160217285, "global_step": 133337, "epoch": 3174} {"train_loss": -6.723925590515137, "global_step": 133338, "epoch": 3174} {"train_loss": -6.66038179397583, "global_step": 133339, "epoch": 3174} {"train_loss": -6.653559684753418, "global_step": 133340, "epoch": 3174} {"train_loss": -6.700166702270508, "global_step": 133341, "epoch": 3174} {"train_loss": -6.705583095550537, "global_step": 133342, "epoch": 3174} {"train_loss": -6.672435760498047, "global_step": 133343, "epoch": 3174} {"train_loss": -6.6006598472595215, "global_step": 133344, "epoch": 3174} {"train_loss": -6.652585029602051, "global_step": 133345, "epoch": 3174} {"train_loss": -6.61509370803833, "global_step": 133346, "epoch": 3174} {"train_loss": -6.6536359786987305, "global_step": 133347, "epoch": 3174} {"train_loss": -6.706673622131348, "global_step": 133348, "epoch": 3174} {"train_loss": -6.688752469562349, "global_step": 133349, "epoch": 3174, "val_loss": 68135.4921875} {"train_loss": -6.741252899169922, "global_step": 133350, "epoch": 3175} {"train_loss": -6.59654426574707, "global_step": 133351, "epoch": 3175} {"train_loss": -6.692039489746094, "global_step": 133352, "epoch": 3175} {"train_loss": -6.7317399978637695, "global_step": 133353, "epoch": 3175} {"train_loss": -6.525180816650391, "global_step": 133354, "epoch": 3175} {"train_loss": -6.593195915222168, "global_step": 133355, "epoch": 3175} {"train_loss": -6.670145511627197, "global_step": 133356, "epoch": 3175} {"train_loss": -6.713879585266113, "global_step": 133357, "epoch": 3175} {"train_loss": -6.71970796585083, "global_step": 133358, "epoch": 3175} {"train_loss": -6.643311500549316, "global_step": 133359, "epoch": 3175} {"train_loss": -6.767894744873047, "global_step": 133360, "epoch": 3175} {"train_loss": -6.624353408813477, "global_step": 133361, "epoch": 3175} {"train_loss": -6.667351722717285, "global_step": 133362, "epoch": 3175} {"train_loss": -6.832634925842285, "global_step": 133363, "epoch": 3175} {"train_loss": -6.654483795166016, "global_step": 133364, "epoch": 3175} {"train_loss": -6.7441558837890625, "global_step": 133365, "epoch": 3175} {"train_loss": -6.663818359375, "global_step": 133366, "epoch": 3175} {"train_loss": -6.640239715576172, "global_step": 133367, "epoch": 3175} {"train_loss": -6.69976806640625, "global_step": 133368, "epoch": 3175} {"train_loss": -6.600409984588623, "global_step": 133369, "epoch": 3175} {"train_loss": -6.592742919921875, "global_step": 133370, "epoch": 3175} {"train_loss": -6.592536926269531, "global_step": 133371, "epoch": 3175} {"train_loss": -6.667107582092285, "global_step": 133372, "epoch": 3175} {"train_loss": -6.600683212280273, "global_step": 133373, "epoch": 3175} {"train_loss": -6.65812873840332, "global_step": 133374, "epoch": 3175} {"train_loss": -6.694650650024414, "global_step": 133375, "epoch": 3175} {"train_loss": -6.659920692443848, "global_step": 133376, "epoch": 3175} {"train_loss": -6.716304779052734, "global_step": 133377, "epoch": 3175} {"train_loss": -6.6884613037109375, "global_step": 133378, "epoch": 3175} {"train_loss": -6.634671688079834, "global_step": 133379, "epoch": 3175} {"train_loss": -6.537817001342773, "global_step": 133380, "epoch": 3175} {"train_loss": -6.542749404907227, "global_step": 133381, "epoch": 3175} {"train_loss": -6.624182224273682, "global_step": 133382, "epoch": 3175} {"train_loss": -6.584229946136475, "global_step": 133383, "epoch": 3175} {"train_loss": -6.692987442016602, "global_step": 133384, "epoch": 3175} {"train_loss": -6.679749488830566, "global_step": 133385, "epoch": 3175} {"train_loss": -6.578563690185547, "global_step": 133386, "epoch": 3175} {"train_loss": -6.595540523529053, "global_step": 133387, "epoch": 3175} {"train_loss": -6.735299110412598, "global_step": 133388, "epoch": 3175} {"train_loss": -6.736213684082031, "global_step": 133389, "epoch": 3175} {"train_loss": -6.747315883636475, "global_step": 133390, "epoch": 3175} {"train_loss": -6.662270591372535, "global_step": 133391, "epoch": 3175, "val_loss": 68376.828125} {"train_loss": -6.696773052215576, "global_step": 133392, "epoch": 3176} {"train_loss": -6.687034606933594, "global_step": 133393, "epoch": 3176} {"train_loss": -6.612836837768555, "global_step": 133394, "epoch": 3176} {"train_loss": -6.800698280334473, "global_step": 133395, "epoch": 3176} {"train_loss": -6.6826348304748535, "global_step": 133396, "epoch": 3176} {"train_loss": -6.599704742431641, "global_step": 133397, "epoch": 3176} {"train_loss": -6.692507266998291, "global_step": 133398, "epoch": 3176} {"train_loss": -6.621651649475098, "global_step": 133399, "epoch": 3176} {"train_loss": -6.700685501098633, "global_step": 133400, "epoch": 3176} {"train_loss": -6.7063775062561035, "global_step": 133401, "epoch": 3176} {"train_loss": -6.689647674560547, "global_step": 133402, "epoch": 3176} {"train_loss": -6.58172607421875, "global_step": 133403, "epoch": 3176} {"train_loss": -6.552171230316162, "global_step": 133404, "epoch": 3176} {"train_loss": -6.599535942077637, "global_step": 133405, "epoch": 3176} {"train_loss": -6.682257652282715, "global_step": 133406, "epoch": 3176} {"train_loss": -6.608269691467285, "global_step": 133407, "epoch": 3176} {"train_loss": -6.611701965332031, "global_step": 133408, "epoch": 3176} {"train_loss": -6.708256244659424, "global_step": 133409, "epoch": 3176} {"train_loss": -6.698755264282227, "global_step": 133410, "epoch": 3176} {"train_loss": -6.580266952514648, "global_step": 133411, "epoch": 3176} {"train_loss": -6.647211074829102, "global_step": 133412, "epoch": 3176} {"train_loss": -6.655313491821289, "global_step": 133413, "epoch": 3176} {"train_loss": -6.600123882293701, "global_step": 133414, "epoch": 3176} {"train_loss": -6.63477897644043, "global_step": 133415, "epoch": 3176} {"train_loss": -6.592681407928467, "global_step": 133416, "epoch": 3176} {"train_loss": -6.577013969421387, "global_step": 133417, "epoch": 3176} {"train_loss": -6.622333526611328, "global_step": 133418, "epoch": 3176} {"train_loss": -6.519542694091797, "global_step": 133419, "epoch": 3176} {"train_loss": -6.598433971405029, "global_step": 133420, "epoch": 3176} {"train_loss": -6.596644401550293, "global_step": 133421, "epoch": 3176} {"train_loss": -6.608656406402588, "global_step": 133422, "epoch": 3176} {"train_loss": -6.54069709777832, "global_step": 133423, "epoch": 3176} {"train_loss": -6.537879943847656, "global_step": 133424, "epoch": 3176} {"train_loss": -6.511605739593506, "global_step": 133425, "epoch": 3176} {"train_loss": -6.6005635261535645, "global_step": 133426, "epoch": 3176} {"train_loss": -6.652997970581055, "global_step": 133427, "epoch": 3176} {"train_loss": -6.571659088134766, "global_step": 133428, "epoch": 3176} {"train_loss": -6.674073219299316, "global_step": 133429, "epoch": 3176} {"train_loss": -6.773097038269043, "global_step": 133430, "epoch": 3176} {"train_loss": -6.538725852966309, "global_step": 133431, "epoch": 3176} {"train_loss": -6.603215217590332, "global_step": 133432, "epoch": 3176} {"train_loss": -6.625089917864118, "global_step": 133433, "epoch": 3176, "val_loss": 68342.4609375} {"train_loss": -6.6916117668151855, "global_step": 133434, "epoch": 3177} {"train_loss": -6.638197898864746, "global_step": 133435, "epoch": 3177} {"train_loss": -6.589934349060059, "global_step": 133436, "epoch": 3177} {"train_loss": -6.49092960357666, "global_step": 133437, "epoch": 3177} {"train_loss": -6.572278022766113, "global_step": 133438, "epoch": 3177} {"train_loss": -6.699965000152588, "global_step": 133439, "epoch": 3177} {"train_loss": -6.507935523986816, "global_step": 133440, "epoch": 3177} {"train_loss": -6.628483772277832, "global_step": 133441, "epoch": 3177} {"train_loss": -6.5177741050720215, "global_step": 133442, "epoch": 3177} {"train_loss": -6.540096282958984, "global_step": 133443, "epoch": 3177} {"train_loss": -6.672528266906738, "global_step": 133444, "epoch": 3177} {"train_loss": -6.493227958679199, "global_step": 133445, "epoch": 3177} {"train_loss": -6.67041015625, "global_step": 133446, "epoch": 3177} {"train_loss": -6.581859588623047, "global_step": 133447, "epoch": 3177} {"train_loss": -6.698661804199219, "global_step": 133448, "epoch": 3177} {"train_loss": -6.490089416503906, "global_step": 133449, "epoch": 3177} {"train_loss": -6.6868720054626465, "global_step": 133450, "epoch": 3177} {"train_loss": -6.652239799499512, "global_step": 133451, "epoch": 3177} {"train_loss": -6.61741828918457, "global_step": 133452, "epoch": 3177} {"train_loss": -6.634842872619629, "global_step": 133453, "epoch": 3177} {"train_loss": -6.558396339416504, "global_step": 133454, "epoch": 3177} {"train_loss": -6.641762733459473, "global_step": 133455, "epoch": 3177} {"train_loss": -6.591390132904053, "global_step": 133456, "epoch": 3177} {"train_loss": -6.6548614501953125, "global_step": 133457, "epoch": 3177} {"train_loss": -6.652897834777832, "global_step": 133458, "epoch": 3177} {"train_loss": -6.693277359008789, "global_step": 133459, "epoch": 3177} {"train_loss": -6.553647041320801, "global_step": 133460, "epoch": 3177} {"train_loss": -6.685487747192383, "global_step": 133461, "epoch": 3177} {"train_loss": -6.390476226806641, "global_step": 133462, "epoch": 3177} {"train_loss": -6.60097599029541, "global_step": 133463, "epoch": 3177} {"train_loss": -6.542762279510498, "global_step": 133464, "epoch": 3177} {"train_loss": -6.532724380493164, "global_step": 133465, "epoch": 3177} {"train_loss": -6.424325942993164, "global_step": 133466, "epoch": 3177} {"train_loss": -6.683662414550781, "global_step": 133467, "epoch": 3177} {"train_loss": -6.65085506439209, "global_step": 133468, "epoch": 3177} {"train_loss": -6.637577056884766, "global_step": 133469, "epoch": 3177} {"train_loss": -6.677231788635254, "global_step": 133470, "epoch": 3177} {"train_loss": -6.6353888511657715, "global_step": 133471, "epoch": 3177} {"train_loss": -6.62635612487793, "global_step": 133472, "epoch": 3177} {"train_loss": -6.629466533660889, "global_step": 133473, "epoch": 3177} {"train_loss": -6.667484283447266, "global_step": 133474, "epoch": 3177} {"train_loss": -6.606141862415132, "global_step": 133475, "epoch": 3177, "val_loss": 68287.96875} {"train_loss": -6.682526588439941, "global_step": 133476, "epoch": 3178} {"train_loss": -6.70456075668335, "global_step": 133477, "epoch": 3178} {"train_loss": -6.6639838218688965, "global_step": 133478, "epoch": 3178} {"train_loss": -6.677626609802246, "global_step": 133479, "epoch": 3178} {"train_loss": -6.749367713928223, "global_step": 133480, "epoch": 3178} {"train_loss": -6.634777069091797, "global_step": 133481, "epoch": 3178} {"train_loss": -6.72552490234375, "global_step": 133482, "epoch": 3178} {"train_loss": -6.719688415527344, "global_step": 133483, "epoch": 3178} {"train_loss": -6.698313236236572, "global_step": 133484, "epoch": 3178} {"train_loss": -6.661699295043945, "global_step": 133485, "epoch": 3178} {"train_loss": -6.771892547607422, "global_step": 133486, "epoch": 3178} {"train_loss": -6.717306137084961, "global_step": 133487, "epoch": 3178} {"train_loss": -6.727426528930664, "global_step": 133488, "epoch": 3178} {"train_loss": -6.569613933563232, "global_step": 133489, "epoch": 3178} {"train_loss": -6.68818998336792, "global_step": 133490, "epoch": 3178} {"train_loss": -6.661331653594971, "global_step": 133491, "epoch": 3178} {"train_loss": -6.797179698944092, "global_step": 133492, "epoch": 3178} {"train_loss": -6.745118141174316, "global_step": 133493, "epoch": 3178} {"train_loss": -6.6511054039001465, "global_step": 133494, "epoch": 3178} {"train_loss": -6.598381996154785, "global_step": 133495, "epoch": 3178} {"train_loss": -6.7422261238098145, "global_step": 133496, "epoch": 3178} {"train_loss": -6.716825008392334, "global_step": 133497, "epoch": 3178} {"train_loss": -6.648646831512451, "global_step": 133498, "epoch": 3178} {"train_loss": -6.62717342376709, "global_step": 133499, "epoch": 3178} {"train_loss": -6.745169162750244, "global_step": 133500, "epoch": 3178} {"train_loss": -6.7525954246521, "global_step": 133501, "epoch": 3178} {"train_loss": -6.759408473968506, "global_step": 133502, "epoch": 3178} {"train_loss": -6.711492538452148, "global_step": 133503, "epoch": 3178} {"train_loss": -6.58525276184082, "global_step": 133504, "epoch": 3178} {"train_loss": -6.638592720031738, "global_step": 133505, "epoch": 3178} {"train_loss": -6.656101226806641, "global_step": 133506, "epoch": 3178} {"train_loss": -6.727900505065918, "global_step": 133507, "epoch": 3178} {"train_loss": -6.691379547119141, "global_step": 133508, "epoch": 3178} {"train_loss": -6.669161319732666, "global_step": 133509, "epoch": 3178} {"train_loss": -6.668582916259766, "global_step": 133510, "epoch": 3178} {"train_loss": -6.713269233703613, "global_step": 133511, "epoch": 3178} {"train_loss": -6.620797157287598, "global_step": 133512, "epoch": 3178} {"train_loss": -6.617098808288574, "global_step": 133513, "epoch": 3178} {"train_loss": -6.711483955383301, "global_step": 133514, "epoch": 3178} {"train_loss": -6.5460615158081055, "global_step": 133515, "epoch": 3178} {"train_loss": -6.634174823760986, "global_step": 133516, "epoch": 3178} {"train_loss": -6.687566337131319, "global_step": 133517, "epoch": 3178, "val_loss": 68308.0859375} {"train_loss": -6.7429962158203125, "global_step": 133518, "epoch": 3179} {"train_loss": -6.732283592224121, "global_step": 133519, "epoch": 3179} {"train_loss": -6.724165916442871, "global_step": 133520, "epoch": 3179} {"train_loss": -6.699716567993164, "global_step": 133521, "epoch": 3179} {"train_loss": -6.676929473876953, "global_step": 133522, "epoch": 3179} {"train_loss": -6.738760948181152, "global_step": 133523, "epoch": 3179} {"train_loss": -6.6313276290893555, "global_step": 133524, "epoch": 3179} {"train_loss": -6.716794967651367, "global_step": 133525, "epoch": 3179} {"train_loss": -6.700646877288818, "global_step": 133526, "epoch": 3179} {"train_loss": -6.6192169189453125, "global_step": 133527, "epoch": 3179} {"train_loss": -6.655780792236328, "global_step": 133528, "epoch": 3179} {"train_loss": -6.793679714202881, "global_step": 133529, "epoch": 3179} {"train_loss": -6.680088520050049, "global_step": 133530, "epoch": 3179} {"train_loss": -6.643185615539551, "global_step": 133531, "epoch": 3179} {"train_loss": -6.739786148071289, "global_step": 133532, "epoch": 3179} {"train_loss": -6.56046199798584, "global_step": 133533, "epoch": 3179} {"train_loss": -6.617951393127441, "global_step": 133534, "epoch": 3179} {"train_loss": -6.614068031311035, "global_step": 133535, "epoch": 3179} {"train_loss": -6.720314025878906, "global_step": 133536, "epoch": 3179} {"train_loss": -6.7022385597229, "global_step": 133537, "epoch": 3179} {"train_loss": -6.7471771240234375, "global_step": 133538, "epoch": 3179} {"train_loss": -6.5957465171813965, "global_step": 133539, "epoch": 3179} {"train_loss": -6.694104194641113, "global_step": 133540, "epoch": 3179} {"train_loss": -6.718992233276367, "global_step": 133541, "epoch": 3179} {"train_loss": -6.766522407531738, "global_step": 133542, "epoch": 3179} {"train_loss": -6.563302040100098, "global_step": 133543, "epoch": 3179} {"train_loss": -6.587386131286621, "global_step": 133544, "epoch": 3179} {"train_loss": -6.660741329193115, "global_step": 133545, "epoch": 3179} {"train_loss": -6.697144508361816, "global_step": 133546, "epoch": 3179} {"train_loss": -6.571982383728027, "global_step": 133547, "epoch": 3179} {"train_loss": -6.722295761108398, "global_step": 133548, "epoch": 3179} {"train_loss": -6.566941738128662, "global_step": 133549, "epoch": 3179} {"train_loss": -6.625057220458984, "global_step": 133550, "epoch": 3179} {"train_loss": -6.491817474365234, "global_step": 133551, "epoch": 3179} {"train_loss": -6.602936267852783, "global_step": 133552, "epoch": 3179} {"train_loss": -6.686846733093262, "global_step": 133553, "epoch": 3179} {"train_loss": -6.565036773681641, "global_step": 133554, "epoch": 3179} {"train_loss": -6.538019180297852, "global_step": 133555, "epoch": 3179} {"train_loss": -6.622017860412598, "global_step": 133556, "epoch": 3179} {"train_loss": -6.62155818939209, "global_step": 133557, "epoch": 3179} {"train_loss": -6.436153411865234, "global_step": 133558, "epoch": 3179} {"train_loss": -6.653469312758673, "global_step": 133559, "epoch": 3179, "val_loss": 68231.890625} {"train_loss": -6.546564102172852, "global_step": 133560, "epoch": 3180} {"train_loss": -6.7543487548828125, "global_step": 133561, "epoch": 3180} {"train_loss": -6.624782085418701, "global_step": 133562, "epoch": 3180} {"train_loss": -6.66643762588501, "global_step": 133563, "epoch": 3180} {"train_loss": -6.6089277267456055, "global_step": 133564, "epoch": 3180} {"train_loss": -6.616388320922852, "global_step": 133565, "epoch": 3180} {"train_loss": -6.659401893615723, "global_step": 133566, "epoch": 3180} {"train_loss": -6.706149101257324, "global_step": 133567, "epoch": 3180} {"train_loss": -6.659185409545898, "global_step": 133568, "epoch": 3180} {"train_loss": -6.7112932205200195, "global_step": 133569, "epoch": 3180} {"train_loss": -6.672024726867676, "global_step": 133570, "epoch": 3180} {"train_loss": -6.672599792480469, "global_step": 133571, "epoch": 3180} {"train_loss": -6.632551670074463, "global_step": 133572, "epoch": 3180} {"train_loss": -6.549217224121094, "global_step": 133573, "epoch": 3180} {"train_loss": -6.619104862213135, "global_step": 133574, "epoch": 3180} {"train_loss": -6.714443206787109, "global_step": 133575, "epoch": 3180} {"train_loss": -6.488549709320068, "global_step": 133576, "epoch": 3180} {"train_loss": -6.621807098388672, "global_step": 133577, "epoch": 3180} {"train_loss": -6.648963928222656, "global_step": 133578, "epoch": 3180} {"train_loss": -6.621817111968994, "global_step": 133579, "epoch": 3180} {"train_loss": -6.603854656219482, "global_step": 133580, "epoch": 3180} {"train_loss": -6.591428756713867, "global_step": 133581, "epoch": 3180} {"train_loss": -6.5605669021606445, "global_step": 133582, "epoch": 3180} {"train_loss": -6.621007919311523, "global_step": 133583, "epoch": 3180} {"train_loss": -6.580100059509277, "global_step": 133584, "epoch": 3180} {"train_loss": -6.585577964782715, "global_step": 133585, "epoch": 3180} {"train_loss": -6.610160827636719, "global_step": 133586, "epoch": 3180} {"train_loss": -6.665432929992676, "global_step": 133587, "epoch": 3180} {"train_loss": -6.649036407470703, "global_step": 133588, "epoch": 3180} {"train_loss": -6.628116130828857, "global_step": 133589, "epoch": 3180} {"train_loss": -6.528491973876953, "global_step": 133590, "epoch": 3180} {"train_loss": -6.643611907958984, "global_step": 133591, "epoch": 3180} {"train_loss": -6.635777950286865, "global_step": 133592, "epoch": 3180} {"train_loss": -6.6922478675842285, "global_step": 133593, "epoch": 3180} {"train_loss": -6.630590915679932, "global_step": 133594, "epoch": 3180} {"train_loss": -6.683684349060059, "global_step": 133595, "epoch": 3180} {"train_loss": -6.648875713348389, "global_step": 133596, "epoch": 3180} {"train_loss": -6.5417561531066895, "global_step": 133597, "epoch": 3180} {"train_loss": -6.52956485748291, "global_step": 133598, "epoch": 3180} {"train_loss": -6.555802345275879, "global_step": 133599, "epoch": 3180} {"train_loss": -6.65397834777832, "global_step": 133600, "epoch": 3180} {"train_loss": -6.627771173204694, "global_step": 133601, "epoch": 3180, "val_loss": 68383.7890625} {"train_loss": -6.614049911499023, "global_step": 133602, "epoch": 3181} {"train_loss": -6.691567420959473, "global_step": 133603, "epoch": 3181} {"train_loss": -6.613881587982178, "global_step": 133604, "epoch": 3181} {"train_loss": -6.635890007019043, "global_step": 133605, "epoch": 3181} {"train_loss": -6.563648223876953, "global_step": 133606, "epoch": 3181} {"train_loss": -6.65565299987793, "global_step": 133607, "epoch": 3181} {"train_loss": -6.723254680633545, "global_step": 133608, "epoch": 3181} {"train_loss": -6.644421577453613, "global_step": 133609, "epoch": 3181} {"train_loss": -6.677054405212402, "global_step": 133610, "epoch": 3181} {"train_loss": -6.7010111808776855, "global_step": 133611, "epoch": 3181} {"train_loss": -6.67449951171875, "global_step": 133612, "epoch": 3181} {"train_loss": -6.706435203552246, "global_step": 133613, "epoch": 3181} {"train_loss": -6.709027290344238, "global_step": 133614, "epoch": 3181} {"train_loss": -6.691118240356445, "global_step": 133615, "epoch": 3181} {"train_loss": -6.644573211669922, "global_step": 133616, "epoch": 3181} {"train_loss": -6.7909746170043945, "global_step": 133617, "epoch": 3181} {"train_loss": -6.689083099365234, "global_step": 133618, "epoch": 3181} {"train_loss": -6.609472274780273, "global_step": 133619, "epoch": 3181} {"train_loss": -6.687687397003174, "global_step": 133620, "epoch": 3181} {"train_loss": -6.613127708435059, "global_step": 133621, "epoch": 3181} {"train_loss": -6.573779106140137, "global_step": 133622, "epoch": 3181} {"train_loss": -6.662838935852051, "global_step": 133623, "epoch": 3181} {"train_loss": -6.763764381408691, "global_step": 133624, "epoch": 3181} {"train_loss": -6.7749810218811035, "global_step": 133625, "epoch": 3181} {"train_loss": -6.813662052154541, "global_step": 133626, "epoch": 3181} {"train_loss": -6.727235794067383, "global_step": 133627, "epoch": 3181} {"train_loss": -6.69300651550293, "global_step": 133628, "epoch": 3181} {"train_loss": -6.634912490844727, "global_step": 133629, "epoch": 3181} {"train_loss": -6.785902976989746, "global_step": 133630, "epoch": 3181} {"train_loss": -6.7176971435546875, "global_step": 133631, "epoch": 3181} {"train_loss": -6.83254337310791, "global_step": 133632, "epoch": 3181} {"train_loss": -6.729337692260742, "global_step": 133633, "epoch": 3181} {"train_loss": -6.704165458679199, "global_step": 133634, "epoch": 3181} {"train_loss": -6.518405437469482, "global_step": 133635, "epoch": 3181} {"train_loss": -6.706300735473633, "global_step": 133636, "epoch": 3181} {"train_loss": -6.614686012268066, "global_step": 133637, "epoch": 3181} {"train_loss": -6.7038493156433105, "global_step": 133638, "epoch": 3181} {"train_loss": -6.52606725692749, "global_step": 133639, "epoch": 3181} {"train_loss": -6.783807754516602, "global_step": 133640, "epoch": 3181} {"train_loss": -6.6871442794799805, "global_step": 133641, "epoch": 3181} {"train_loss": -6.569218635559082, "global_step": 133642, "epoch": 3181} {"train_loss": -6.679455053238642, "global_step": 133643, "epoch": 3181, "val_loss": 68244.984375} {"train_loss": -6.525522232055664, "global_step": 133644, "epoch": 3182} {"train_loss": -6.544064044952393, "global_step": 133645, "epoch": 3182} {"train_loss": -6.706255912780762, "global_step": 133646, "epoch": 3182} {"train_loss": -6.622414588928223, "global_step": 133647, "epoch": 3182} {"train_loss": -6.653195858001709, "global_step": 133648, "epoch": 3182} {"train_loss": -6.615110874176025, "global_step": 133649, "epoch": 3182} {"train_loss": -6.632619857788086, "global_step": 133650, "epoch": 3182} {"train_loss": -6.728089332580566, "global_step": 133651, "epoch": 3182} {"train_loss": -6.766068935394287, "global_step": 133652, "epoch": 3182} {"train_loss": -6.644414901733398, "global_step": 133653, "epoch": 3182} {"train_loss": -6.4707536697387695, "global_step": 133654, "epoch": 3182} {"train_loss": -6.655477523803711, "global_step": 133655, "epoch": 3182} {"train_loss": -6.700930118560791, "global_step": 133656, "epoch": 3182} {"train_loss": -6.610374450683594, "global_step": 133657, "epoch": 3182} {"train_loss": -6.744081974029541, "global_step": 133658, "epoch": 3182} {"train_loss": -6.545339584350586, "global_step": 133659, "epoch": 3182} {"train_loss": -6.809622287750244, "global_step": 133660, "epoch": 3182} {"train_loss": -6.6399102210998535, "global_step": 133661, "epoch": 3182} {"train_loss": -6.712253570556641, "global_step": 133662, "epoch": 3182} {"train_loss": -6.699151992797852, "global_step": 133663, "epoch": 3182} {"train_loss": -6.696220397949219, "global_step": 133664, "epoch": 3182} {"train_loss": -6.833006858825684, "global_step": 133665, "epoch": 3182} {"train_loss": -6.6295576095581055, "global_step": 133666, "epoch": 3182} {"train_loss": -6.621854305267334, "global_step": 133667, "epoch": 3182} {"train_loss": -6.638287544250488, "global_step": 133668, "epoch": 3182} {"train_loss": -6.755481719970703, "global_step": 133669, "epoch": 3182} {"train_loss": -6.738255977630615, "global_step": 133670, "epoch": 3182} {"train_loss": -6.669581413269043, "global_step": 133671, "epoch": 3182} {"train_loss": -6.763922214508057, "global_step": 133672, "epoch": 3182} {"train_loss": -6.55816650390625, "global_step": 133673, "epoch": 3182} {"train_loss": -6.711861610412598, "global_step": 133674, "epoch": 3182} {"train_loss": -6.6226654052734375, "global_step": 133675, "epoch": 3182} {"train_loss": -6.596750259399414, "global_step": 133676, "epoch": 3182} {"train_loss": -6.767917633056641, "global_step": 133677, "epoch": 3182} {"train_loss": -6.549375534057617, "global_step": 133678, "epoch": 3182} {"train_loss": -6.815624237060547, "global_step": 133679, "epoch": 3182} {"train_loss": -6.67444372177124, "global_step": 133680, "epoch": 3182} {"train_loss": -6.572992324829102, "global_step": 133681, "epoch": 3182} {"train_loss": -6.657746315002441, "global_step": 133682, "epoch": 3182} {"train_loss": -6.609657287597656, "global_step": 133683, "epoch": 3182} {"train_loss": -6.647420883178711, "global_step": 133684, "epoch": 3182} {"train_loss": -6.662445022946312, "global_step": 133685, "epoch": 3182, "val_loss": 68241.515625} {"train_loss": -6.70847225189209, "global_step": 133686, "epoch": 3183} {"train_loss": -6.668035984039307, "global_step": 133687, "epoch": 3183} {"train_loss": -6.689886093139648, "global_step": 133688, "epoch": 3183} {"train_loss": -6.639402389526367, "global_step": 133689, "epoch": 3183} {"train_loss": -6.694169044494629, "global_step": 133690, "epoch": 3183} {"train_loss": -6.719432353973389, "global_step": 133691, "epoch": 3183} {"train_loss": -6.6855621337890625, "global_step": 133692, "epoch": 3183} {"train_loss": -6.645323753356934, "global_step": 133693, "epoch": 3183} {"train_loss": -6.5876641273498535, "global_step": 133694, "epoch": 3183} {"train_loss": -6.62088680267334, "global_step": 133695, "epoch": 3183} {"train_loss": -6.641915321350098, "global_step": 133696, "epoch": 3183} {"train_loss": -6.745456695556641, "global_step": 133697, "epoch": 3183} {"train_loss": -6.757378578186035, "global_step": 133698, "epoch": 3183} {"train_loss": -6.708555221557617, "global_step": 133699, "epoch": 3183} {"train_loss": -6.675588607788086, "global_step": 133700, "epoch": 3183} {"train_loss": -6.70748233795166, "global_step": 133701, "epoch": 3183} {"train_loss": -6.705699920654297, "global_step": 133702, "epoch": 3183} {"train_loss": -6.551492691040039, "global_step": 133703, "epoch": 3183} {"train_loss": -6.7375054359436035, "global_step": 133704, "epoch": 3183} {"train_loss": -6.642690181732178, "global_step": 133705, "epoch": 3183} {"train_loss": -6.5553765296936035, "global_step": 133706, "epoch": 3183} {"train_loss": -6.68817138671875, "global_step": 133707, "epoch": 3183} {"train_loss": -6.583788871765137, "global_step": 133708, "epoch": 3183} {"train_loss": -6.66566276550293, "global_step": 133709, "epoch": 3183} {"train_loss": -6.662101745605469, "global_step": 133710, "epoch": 3183} {"train_loss": -6.523078918457031, "global_step": 133711, "epoch": 3183} {"train_loss": -6.721320152282715, "global_step": 133712, "epoch": 3183} {"train_loss": -6.738117218017578, "global_step": 133713, "epoch": 3183} {"train_loss": -6.591953277587891, "global_step": 133714, "epoch": 3183} {"train_loss": -6.578573226928711, "global_step": 133715, "epoch": 3183} {"train_loss": -6.624444961547852, "global_step": 133716, "epoch": 3183} {"train_loss": -6.577635765075684, "global_step": 133717, "epoch": 3183} {"train_loss": -6.530726432800293, "global_step": 133718, "epoch": 3183} {"train_loss": -6.7057952880859375, "global_step": 133719, "epoch": 3183} {"train_loss": -6.600396633148193, "global_step": 133720, "epoch": 3183} {"train_loss": -6.619715690612793, "global_step": 133721, "epoch": 3183} {"train_loss": -6.66745138168335, "global_step": 133722, "epoch": 3183} {"train_loss": -6.740230560302734, "global_step": 133723, "epoch": 3183} {"train_loss": -6.642844200134277, "global_step": 133724, "epoch": 3183} {"train_loss": -6.611500263214111, "global_step": 133725, "epoch": 3183} {"train_loss": -6.70871639251709, "global_step": 133726, "epoch": 3183} {"train_loss": -6.657929636183239, "global_step": 133727, "epoch": 3183, "val_loss": 68449.28125} {"train_loss": -6.558103084564209, "global_step": 133728, "epoch": 3184} {"train_loss": -6.714150905609131, "global_step": 133729, "epoch": 3184} {"train_loss": -6.819222450256348, "global_step": 133730, "epoch": 3184} {"train_loss": -6.701274871826172, "global_step": 133731, "epoch": 3184} {"train_loss": -6.639881610870361, "global_step": 133732, "epoch": 3184} {"train_loss": -6.634183883666992, "global_step": 133733, "epoch": 3184} {"train_loss": -6.639069557189941, "global_step": 133734, "epoch": 3184} {"train_loss": -6.5692853927612305, "global_step": 133735, "epoch": 3184} {"train_loss": -6.543801307678223, "global_step": 133736, "epoch": 3184} {"train_loss": -6.689473628997803, "global_step": 133737, "epoch": 3184} {"train_loss": -6.625869274139404, "global_step": 133738, "epoch": 3184} {"train_loss": -6.681866645812988, "global_step": 133739, "epoch": 3184} {"train_loss": -6.602812767028809, "global_step": 133740, "epoch": 3184} {"train_loss": -6.720765590667725, "global_step": 133741, "epoch": 3184} {"train_loss": -6.620595932006836, "global_step": 133742, "epoch": 3184} {"train_loss": -6.6206817626953125, "global_step": 133743, "epoch": 3184} {"train_loss": -6.583014488220215, "global_step": 133744, "epoch": 3184} {"train_loss": -6.649240493774414, "global_step": 133745, "epoch": 3184} {"train_loss": -6.69538688659668, "global_step": 133746, "epoch": 3184} {"train_loss": -6.7013468742370605, "global_step": 133747, "epoch": 3184} {"train_loss": -6.639309883117676, "global_step": 133748, "epoch": 3184} {"train_loss": -6.691188812255859, "global_step": 133749, "epoch": 3184} {"train_loss": -6.636224269866943, "global_step": 133750, "epoch": 3184} {"train_loss": -6.596747875213623, "global_step": 133751, "epoch": 3184} {"train_loss": -6.683287143707275, "global_step": 133752, "epoch": 3184} {"train_loss": -6.776176452636719, "global_step": 133753, "epoch": 3184} {"train_loss": -6.723782539367676, "global_step": 133754, "epoch": 3184} {"train_loss": -6.7277936935424805, "global_step": 133755, "epoch": 3184} {"train_loss": -6.640038013458252, "global_step": 133756, "epoch": 3184} {"train_loss": -6.761656284332275, "global_step": 133757, "epoch": 3184} {"train_loss": -6.667054176330566, "global_step": 133758, "epoch": 3184} {"train_loss": -6.658299922943115, "global_step": 133759, "epoch": 3184} {"train_loss": -6.694102764129639, "global_step": 133760, "epoch": 3184} {"train_loss": -6.713228702545166, "global_step": 133761, "epoch": 3184} {"train_loss": -6.692690372467041, "global_step": 133762, "epoch": 3184} {"train_loss": -6.567199230194092, "global_step": 133763, "epoch": 3184} {"train_loss": -6.63288688659668, "global_step": 133764, "epoch": 3184} {"train_loss": -6.689852714538574, "global_step": 133765, "epoch": 3184} {"train_loss": -6.609952449798584, "global_step": 133766, "epoch": 3184} {"train_loss": -6.6145405769348145, "global_step": 133767, "epoch": 3184} {"train_loss": -6.683509826660156, "global_step": 133768, "epoch": 3184} {"train_loss": -6.660128014428275, "global_step": 133769, "epoch": 3184, "val_loss": 68374.578125} {"train_loss": -6.637703895568848, "global_step": 133770, "epoch": 3185} {"train_loss": -6.722641944885254, "global_step": 133771, "epoch": 3185} {"train_loss": -6.594886779785156, "global_step": 133772, "epoch": 3185} {"train_loss": -6.543423652648926, "global_step": 133773, "epoch": 3185} {"train_loss": -6.664353370666504, "global_step": 133774, "epoch": 3185} {"train_loss": -6.512262344360352, "global_step": 133775, "epoch": 3185} {"train_loss": -6.739497184753418, "global_step": 133776, "epoch": 3185} {"train_loss": -6.563958168029785, "global_step": 133777, "epoch": 3185} {"train_loss": -6.623932838439941, "global_step": 133778, "epoch": 3185} {"train_loss": -6.676944732666016, "global_step": 133779, "epoch": 3185} {"train_loss": -6.594759941101074, "global_step": 133780, "epoch": 3185} {"train_loss": -6.7218122482299805, "global_step": 133781, "epoch": 3185} {"train_loss": -6.5885009765625, "global_step": 133782, "epoch": 3185} {"train_loss": -6.578119277954102, "global_step": 133783, "epoch": 3185} {"train_loss": -6.492513656616211, "global_step": 133784, "epoch": 3185} {"train_loss": -6.681926727294922, "global_step": 133785, "epoch": 3185} {"train_loss": -6.619169235229492, "global_step": 133786, "epoch": 3185} {"train_loss": -6.754356384277344, "global_step": 133787, "epoch": 3185} {"train_loss": -6.720698833465576, "global_step": 133788, "epoch": 3185} {"train_loss": -6.569181442260742, "global_step": 133789, "epoch": 3185} {"train_loss": -6.779964923858643, "global_step": 133790, "epoch": 3185} {"train_loss": -6.565482139587402, "global_step": 133791, "epoch": 3185} {"train_loss": -6.687007904052734, "global_step": 133792, "epoch": 3185} {"train_loss": -6.690740585327148, "global_step": 133793, "epoch": 3185} {"train_loss": -6.644750118255615, "global_step": 133794, "epoch": 3185} {"train_loss": -6.747931957244873, "global_step": 133795, "epoch": 3185} {"train_loss": -6.5743889808654785, "global_step": 133796, "epoch": 3185} {"train_loss": -6.678684234619141, "global_step": 133797, "epoch": 3185} {"train_loss": -6.687259197235107, "global_step": 133798, "epoch": 3185} {"train_loss": -6.547131061553955, "global_step": 133799, "epoch": 3185} {"train_loss": -6.64543342590332, "global_step": 133800, "epoch": 3185} {"train_loss": -6.74301815032959, "global_step": 133801, "epoch": 3185} {"train_loss": -6.571815013885498, "global_step": 133802, "epoch": 3185} {"train_loss": -6.697833061218262, "global_step": 133803, "epoch": 3185} {"train_loss": -6.65349006652832, "global_step": 133804, "epoch": 3185} {"train_loss": -6.664416313171387, "global_step": 133805, "epoch": 3185} {"train_loss": -6.5876922607421875, "global_step": 133806, "epoch": 3185} {"train_loss": -6.623724937438965, "global_step": 133807, "epoch": 3185} {"train_loss": -6.596445083618164, "global_step": 133808, "epoch": 3185} {"train_loss": -6.584589958190918, "global_step": 133809, "epoch": 3185} {"train_loss": -6.444210052490234, "global_step": 133810, "epoch": 3185} {"train_loss": -6.634732904888335, "global_step": 133811, "epoch": 3185, "val_loss": 68277.046875} {"train_loss": -6.669472694396973, "global_step": 133812, "epoch": 3186} {"train_loss": -6.679496765136719, "global_step": 133813, "epoch": 3186} {"train_loss": -6.688033103942871, "global_step": 133814, "epoch": 3186} {"train_loss": -6.721780776977539, "global_step": 133815, "epoch": 3186} {"train_loss": -6.6166229248046875, "global_step": 133816, "epoch": 3186} {"train_loss": -6.756046295166016, "global_step": 133817, "epoch": 3186} {"train_loss": -6.733899116516113, "global_step": 133818, "epoch": 3186} {"train_loss": -6.676877498626709, "global_step": 133819, "epoch": 3186} {"train_loss": -6.75921106338501, "global_step": 133820, "epoch": 3186} {"train_loss": -6.583481311798096, "global_step": 133821, "epoch": 3186} {"train_loss": -6.5989227294921875, "global_step": 133822, "epoch": 3186} {"train_loss": -6.74368953704834, "global_step": 133823, "epoch": 3186} {"train_loss": -6.669075965881348, "global_step": 133824, "epoch": 3186} {"train_loss": -6.738934516906738, "global_step": 133825, "epoch": 3186} {"train_loss": -6.630413055419922, "global_step": 133826, "epoch": 3186} {"train_loss": -6.64108943939209, "global_step": 133827, "epoch": 3186} {"train_loss": -6.621956825256348, "global_step": 133828, "epoch": 3186} {"train_loss": -6.658987522125244, "global_step": 133829, "epoch": 3186} {"train_loss": -6.623022079467773, "global_step": 133830, "epoch": 3186} {"train_loss": -6.6038408279418945, "global_step": 133831, "epoch": 3186} {"train_loss": -6.63065767288208, "global_step": 133832, "epoch": 3186} {"train_loss": -6.498507499694824, "global_step": 133833, "epoch": 3186} {"train_loss": -6.745657920837402, "global_step": 133834, "epoch": 3186} {"train_loss": -6.578815460205078, "global_step": 133835, "epoch": 3186} {"train_loss": -6.540592193603516, "global_step": 133836, "epoch": 3186} {"train_loss": -6.772424697875977, "global_step": 133837, "epoch": 3186} {"train_loss": -6.557891845703125, "global_step": 133838, "epoch": 3186} {"train_loss": -6.629764080047607, "global_step": 133839, "epoch": 3186} {"train_loss": -6.535667419433594, "global_step": 133840, "epoch": 3186} {"train_loss": -6.563575744628906, "global_step": 133841, "epoch": 3186} {"train_loss": -6.686141014099121, "global_step": 133842, "epoch": 3186} {"train_loss": -6.660160064697266, "global_step": 133843, "epoch": 3186} {"train_loss": -6.6728339195251465, "global_step": 133844, "epoch": 3186} {"train_loss": -6.636213779449463, "global_step": 133845, "epoch": 3186} {"train_loss": -6.699734687805176, "global_step": 133846, "epoch": 3186} {"train_loss": -6.60584020614624, "global_step": 133847, "epoch": 3186} {"train_loss": -6.582803726196289, "global_step": 133848, "epoch": 3186} {"train_loss": -6.568354606628418, "global_step": 133849, "epoch": 3186} {"train_loss": -6.478009223937988, "global_step": 133850, "epoch": 3186} {"train_loss": -6.580634593963623, "global_step": 133851, "epoch": 3186} {"train_loss": -6.437613010406494, "global_step": 133852, "epoch": 3186} {"train_loss": -6.632894243512835, "global_step": 133853, "epoch": 3186, "val_loss": 68570.5} {"train_loss": -6.632429122924805, "global_step": 133854, "epoch": 3187} {"train_loss": -6.520296573638916, "global_step": 133855, "epoch": 3187} {"train_loss": -6.610459327697754, "global_step": 133856, "epoch": 3187} {"train_loss": -6.607165336608887, "global_step": 133857, "epoch": 3187} {"train_loss": -6.604368209838867, "global_step": 133858, "epoch": 3187} {"train_loss": -6.495318412780762, "global_step": 133859, "epoch": 3187} {"train_loss": -6.566657543182373, "global_step": 133860, "epoch": 3187} {"train_loss": -6.54580020904541, "global_step": 133861, "epoch": 3187} {"train_loss": -6.595468521118164, "global_step": 133862, "epoch": 3187} {"train_loss": -6.60697078704834, "global_step": 133863, "epoch": 3187} {"train_loss": -6.6278157234191895, "global_step": 133864, "epoch": 3187} {"train_loss": -6.649637699127197, "global_step": 133865, "epoch": 3187} {"train_loss": -6.673878192901611, "global_step": 133866, "epoch": 3187} {"train_loss": -6.621090888977051, "global_step": 133867, "epoch": 3187} {"train_loss": -6.4984049797058105, "global_step": 133868, "epoch": 3187} {"train_loss": -6.755255699157715, "global_step": 133869, "epoch": 3187} {"train_loss": -6.617093086242676, "global_step": 133870, "epoch": 3187} {"train_loss": -6.530200958251953, "global_step": 133871, "epoch": 3187} {"train_loss": -6.708379745483398, "global_step": 133872, "epoch": 3187} {"train_loss": -6.573719501495361, "global_step": 133873, "epoch": 3187} {"train_loss": -6.570682525634766, "global_step": 133874, "epoch": 3187} {"train_loss": -6.724028587341309, "global_step": 133875, "epoch": 3187} {"train_loss": -6.670053958892822, "global_step": 133876, "epoch": 3187} {"train_loss": -6.59765100479126, "global_step": 133877, "epoch": 3187} {"train_loss": -6.515231132507324, "global_step": 133878, "epoch": 3187} {"train_loss": -6.681818008422852, "global_step": 133879, "epoch": 3187} {"train_loss": -6.7053022384643555, "global_step": 133880, "epoch": 3187} {"train_loss": -6.546579360961914, "global_step": 133881, "epoch": 3187} {"train_loss": -6.596034049987793, "global_step": 133882, "epoch": 3187} {"train_loss": -6.459977626800537, "global_step": 133883, "epoch": 3187} {"train_loss": -6.612159729003906, "global_step": 133884, "epoch": 3187} {"train_loss": -6.688243865966797, "global_step": 133885, "epoch": 3187} {"train_loss": -6.548933029174805, "global_step": 133886, "epoch": 3187} {"train_loss": -6.652029991149902, "global_step": 133887, "epoch": 3187} {"train_loss": -6.659121513366699, "global_step": 133888, "epoch": 3187} {"train_loss": -6.620247840881348, "global_step": 133889, "epoch": 3187} {"train_loss": -6.76811408996582, "global_step": 133890, "epoch": 3187} {"train_loss": -6.641085624694824, "global_step": 133891, "epoch": 3187} {"train_loss": -6.689290523529053, "global_step": 133892, "epoch": 3187} {"train_loss": -6.651477336883545, "global_step": 133893, "epoch": 3187} {"train_loss": -6.650330543518066, "global_step": 133894, "epoch": 3187} {"train_loss": -6.618147974922543, "global_step": 133895, "epoch": 3187, "val_loss": 68128.8671875} {"train_loss": -6.730077266693115, "global_step": 133896, "epoch": 3188} {"train_loss": -6.636876106262207, "global_step": 133897, "epoch": 3188} {"train_loss": -6.657701015472412, "global_step": 133898, "epoch": 3188} {"train_loss": -6.657725811004639, "global_step": 133899, "epoch": 3188} {"train_loss": -6.671665191650391, "global_step": 133900, "epoch": 3188} {"train_loss": -6.521796226501465, "global_step": 133901, "epoch": 3188} {"train_loss": -6.604584693908691, "global_step": 133902, "epoch": 3188} {"train_loss": -6.600001335144043, "global_step": 133903, "epoch": 3188} {"train_loss": -6.8235015869140625, "global_step": 133904, "epoch": 3188} {"train_loss": -6.601486682891846, "global_step": 133905, "epoch": 3188} {"train_loss": -6.611901760101318, "global_step": 133906, "epoch": 3188} {"train_loss": -6.618413925170898, "global_step": 133907, "epoch": 3188} {"train_loss": -6.717119216918945, "global_step": 133908, "epoch": 3188} {"train_loss": -6.756964683532715, "global_step": 133909, "epoch": 3188} {"train_loss": -6.522340774536133, "global_step": 133910, "epoch": 3188} {"train_loss": -6.73415994644165, "global_step": 133911, "epoch": 3188} {"train_loss": -6.678229331970215, "global_step": 133912, "epoch": 3188} {"train_loss": -6.730360507965088, "global_step": 133913, "epoch": 3188} {"train_loss": -6.59258508682251, "global_step": 133914, "epoch": 3188} {"train_loss": -6.698192119598389, "global_step": 133915, "epoch": 3188} {"train_loss": -6.7226057052612305, "global_step": 133916, "epoch": 3188} {"train_loss": -6.654048919677734, "global_step": 133917, "epoch": 3188} {"train_loss": -6.70548677444458, "global_step": 133918, "epoch": 3188} {"train_loss": -6.748721122741699, "global_step": 133919, "epoch": 3188} {"train_loss": -6.675954818725586, "global_step": 133920, "epoch": 3188} {"train_loss": -6.68887996673584, "global_step": 133921, "epoch": 3188} {"train_loss": -6.6000165939331055, "global_step": 133922, "epoch": 3188} {"train_loss": -6.645179748535156, "global_step": 133923, "epoch": 3188} {"train_loss": -6.5988993644714355, "global_step": 133924, "epoch": 3188} {"train_loss": -6.677255153656006, "global_step": 133925, "epoch": 3188} {"train_loss": -6.749892234802246, "global_step": 133926, "epoch": 3188} {"train_loss": -6.659112930297852, "global_step": 133927, "epoch": 3188} {"train_loss": -6.563494682312012, "global_step": 133928, "epoch": 3188} {"train_loss": -6.793082237243652, "global_step": 133929, "epoch": 3188} {"train_loss": -6.619062423706055, "global_step": 133930, "epoch": 3188} {"train_loss": -6.550972938537598, "global_step": 133931, "epoch": 3188} {"train_loss": -6.7635393142700195, "global_step": 133932, "epoch": 3188} {"train_loss": -6.528995513916016, "global_step": 133933, "epoch": 3188} {"train_loss": -6.544425964355469, "global_step": 133934, "epoch": 3188} {"train_loss": -6.7690253257751465, "global_step": 133935, "epoch": 3188} {"train_loss": -6.4504194259643555, "global_step": 133936, "epoch": 3188} {"train_loss": -6.655263719104585, "global_step": 133937, "epoch": 3188, "val_loss": 68305.53125} {"train_loss": -6.655643463134766, "global_step": 133938, "epoch": 3189} {"train_loss": -6.5560503005981445, "global_step": 133939, "epoch": 3189} {"train_loss": -6.599759101867676, "global_step": 133940, "epoch": 3189} {"train_loss": -6.574250221252441, "global_step": 133941, "epoch": 3189} {"train_loss": -6.5995097160339355, "global_step": 133942, "epoch": 3189} {"train_loss": -6.649603366851807, "global_step": 133943, "epoch": 3189} {"train_loss": -6.555000305175781, "global_step": 133944, "epoch": 3189} {"train_loss": -6.649384498596191, "global_step": 133945, "epoch": 3189} {"train_loss": -6.611013412475586, "global_step": 133946, "epoch": 3189} {"train_loss": -6.611510753631592, "global_step": 133947, "epoch": 3189} {"train_loss": -6.739809036254883, "global_step": 133948, "epoch": 3189} {"train_loss": -6.658082008361816, "global_step": 133949, "epoch": 3189} {"train_loss": -6.641146659851074, "global_step": 133950, "epoch": 3189} {"train_loss": -6.712019920349121, "global_step": 133951, "epoch": 3189} {"train_loss": -6.685424327850342, "global_step": 133952, "epoch": 3189} {"train_loss": -6.64202356338501, "global_step": 133953, "epoch": 3189} {"train_loss": -6.65949821472168, "global_step": 133954, "epoch": 3189} {"train_loss": -6.61770486831665, "global_step": 133955, "epoch": 3189} {"train_loss": -6.742090702056885, "global_step": 133956, "epoch": 3189} {"train_loss": -6.6335859298706055, "global_step": 133957, "epoch": 3189} {"train_loss": -6.619970321655273, "global_step": 133958, "epoch": 3189} {"train_loss": -6.618671417236328, "global_step": 133959, "epoch": 3189} {"train_loss": -6.611756324768066, "global_step": 133960, "epoch": 3189} {"train_loss": -6.618839740753174, "global_step": 133961, "epoch": 3189} {"train_loss": -6.676536560058594, "global_step": 133962, "epoch": 3189} {"train_loss": -6.71266508102417, "global_step": 133963, "epoch": 3189} {"train_loss": -6.692768096923828, "global_step": 133964, "epoch": 3189} {"train_loss": -6.631704330444336, "global_step": 133965, "epoch": 3189} {"train_loss": -6.656861782073975, "global_step": 133966, "epoch": 3189} {"train_loss": -6.663246154785156, "global_step": 133967, "epoch": 3189} {"train_loss": -6.655667781829834, "global_step": 133968, "epoch": 3189} {"train_loss": -6.57059383392334, "global_step": 133969, "epoch": 3189} {"train_loss": -6.761979103088379, "global_step": 133970, "epoch": 3189} {"train_loss": -6.701188087463379, "global_step": 133971, "epoch": 3189} {"train_loss": -6.766509056091309, "global_step": 133972, "epoch": 3189} {"train_loss": -6.673772811889648, "global_step": 133973, "epoch": 3189} {"train_loss": -6.786167144775391, "global_step": 133974, "epoch": 3189} {"train_loss": -6.6346235275268555, "global_step": 133975, "epoch": 3189} {"train_loss": -6.652850151062012, "global_step": 133976, "epoch": 3189} {"train_loss": -6.64383602142334, "global_step": 133977, "epoch": 3189} {"train_loss": -6.775882244110107, "global_step": 133978, "epoch": 3189} {"train_loss": -6.6601299331301735, "global_step": 133979, "epoch": 3189, "val_loss": 68108.7265625} {"train_loss": -6.716856479644775, "global_step": 133980, "epoch": 3190} {"train_loss": -6.782898902893066, "global_step": 133981, "epoch": 3190} {"train_loss": -6.748894214630127, "global_step": 133982, "epoch": 3190} {"train_loss": -6.644717216491699, "global_step": 133983, "epoch": 3190} {"train_loss": -6.666357040405273, "global_step": 133984, "epoch": 3190} {"train_loss": -6.614410400390625, "global_step": 133985, "epoch": 3190} {"train_loss": -6.615515232086182, "global_step": 133986, "epoch": 3190} {"train_loss": -6.695132255554199, "global_step": 133987, "epoch": 3190} {"train_loss": -6.662493705749512, "global_step": 133988, "epoch": 3190} {"train_loss": -6.645476341247559, "global_step": 133989, "epoch": 3190} {"train_loss": -6.680212020874023, "global_step": 133990, "epoch": 3190} {"train_loss": -6.708423137664795, "global_step": 133991, "epoch": 3190} {"train_loss": -6.758507251739502, "global_step": 133992, "epoch": 3190} {"train_loss": -6.623162269592285, "global_step": 133993, "epoch": 3190} {"train_loss": -6.512521743774414, "global_step": 133994, "epoch": 3190} {"train_loss": -6.716033935546875, "global_step": 133995, "epoch": 3190} {"train_loss": -6.688068389892578, "global_step": 133996, "epoch": 3190} {"train_loss": -6.6581711769104, "global_step": 133997, "epoch": 3190} {"train_loss": -6.539437770843506, "global_step": 133998, "epoch": 3190} {"train_loss": -6.654841423034668, "global_step": 133999, "epoch": 3190} {"train_loss": -6.707611083984375, "global_step": 134000, "epoch": 3190} {"train_loss": -6.582507133483887, "global_step": 134001, "epoch": 3190} {"train_loss": -6.588968276977539, "global_step": 134002, "epoch": 3190} {"train_loss": -6.736328125, "global_step": 134003, "epoch": 3190} {"train_loss": -6.704631805419922, "global_step": 134004, "epoch": 3190} {"train_loss": -6.6724324226379395, "global_step": 134005, "epoch": 3190} {"train_loss": -6.626194953918457, "global_step": 134006, "epoch": 3190} {"train_loss": -6.6043291091918945, "global_step": 134007, "epoch": 3190} {"train_loss": -6.7812581062316895, "global_step": 134008, "epoch": 3190} {"train_loss": -6.625353813171387, "global_step": 134009, "epoch": 3190} {"train_loss": -6.737388610839844, "global_step": 134010, "epoch": 3190} {"train_loss": -6.6653947830200195, "global_step": 134011, "epoch": 3190} {"train_loss": -6.749601364135742, "global_step": 134012, "epoch": 3190} {"train_loss": -6.671813011169434, "global_step": 134013, "epoch": 3190} {"train_loss": -6.619946002960205, "global_step": 134014, "epoch": 3190} {"train_loss": -6.662668704986572, "global_step": 134015, "epoch": 3190} {"train_loss": -6.765924453735352, "global_step": 134016, "epoch": 3190} {"train_loss": -6.6696977615356445, "global_step": 134017, "epoch": 3190} {"train_loss": -6.692495822906494, "global_step": 134018, "epoch": 3190} {"train_loss": -6.693314552307129, "global_step": 134019, "epoch": 3190} {"train_loss": -6.685136795043945, "global_step": 134020, "epoch": 3190} {"train_loss": -6.671768892379034, "global_step": 134021, "epoch": 3190, "val_loss": 68016.3984375} {"train_loss": -6.503809928894043, "global_step": 134022, "epoch": 3191} {"train_loss": -6.662837505340576, "global_step": 134023, "epoch": 3191} {"train_loss": -6.666121006011963, "global_step": 134024, "epoch": 3191} {"train_loss": -6.772055149078369, "global_step": 134025, "epoch": 3191} {"train_loss": -6.64915657043457, "global_step": 134026, "epoch": 3191} {"train_loss": -6.6909990310668945, "global_step": 134027, "epoch": 3191} {"train_loss": -6.656879425048828, "global_step": 134028, "epoch": 3191} {"train_loss": -6.664206504821777, "global_step": 134029, "epoch": 3191} {"train_loss": -6.755807876586914, "global_step": 134030, "epoch": 3191} {"train_loss": -6.759894847869873, "global_step": 134031, "epoch": 3191} {"train_loss": -6.59388542175293, "global_step": 134032, "epoch": 3191} {"train_loss": -6.61546516418457, "global_step": 134033, "epoch": 3191} {"train_loss": -6.616874694824219, "global_step": 134034, "epoch": 3191} {"train_loss": -6.892904281616211, "global_step": 134035, "epoch": 3191} {"train_loss": -6.71638298034668, "global_step": 134036, "epoch": 3191} {"train_loss": -6.747853755950928, "global_step": 134037, "epoch": 3191} {"train_loss": -6.629892826080322, "global_step": 134038, "epoch": 3191} {"train_loss": -6.807161331176758, "global_step": 134039, "epoch": 3191} {"train_loss": -6.707174301147461, "global_step": 134040, "epoch": 3191} {"train_loss": -6.650849342346191, "global_step": 134041, "epoch": 3191} {"train_loss": -6.586510181427002, "global_step": 134042, "epoch": 3191} {"train_loss": -6.699263572692871, "global_step": 134043, "epoch": 3191} {"train_loss": -6.63218879699707, "global_step": 134044, "epoch": 3191} {"train_loss": -6.726825714111328, "global_step": 134045, "epoch": 3191} {"train_loss": -6.72010612487793, "global_step": 134046, "epoch": 3191} {"train_loss": -6.5985822677612305, "global_step": 134047, "epoch": 3191} {"train_loss": -6.752049446105957, "global_step": 134048, "epoch": 3191} {"train_loss": -6.589284420013428, "global_step": 134049, "epoch": 3191} {"train_loss": -6.627374649047852, "global_step": 134050, "epoch": 3191} {"train_loss": -6.531167984008789, "global_step": 134051, "epoch": 3191} {"train_loss": -6.587111473083496, "global_step": 134052, "epoch": 3191} {"train_loss": -6.639142990112305, "global_step": 134053, "epoch": 3191} {"train_loss": -6.7287092208862305, "global_step": 134054, "epoch": 3191} {"train_loss": -6.706498146057129, "global_step": 134055, "epoch": 3191} {"train_loss": -6.6000165939331055, "global_step": 134056, "epoch": 3191} {"train_loss": -6.690267562866211, "global_step": 134057, "epoch": 3191} {"train_loss": -6.587107181549072, "global_step": 134058, "epoch": 3191} {"train_loss": -6.654438495635986, "global_step": 134059, "epoch": 3191} {"train_loss": -6.654999256134033, "global_step": 134060, "epoch": 3191} {"train_loss": -6.663262367248535, "global_step": 134061, "epoch": 3191} {"train_loss": -6.701632976531982, "global_step": 134062, "epoch": 3191} {"train_loss": -6.668218419665382, "global_step": 134063, "epoch": 3191, "val_loss": 68388.03125} {"train_loss": -6.6504058837890625, "global_step": 134064, "epoch": 3192} {"train_loss": -6.665494918823242, "global_step": 134065, "epoch": 3192} {"train_loss": -6.609563827514648, "global_step": 134066, "epoch": 3192} {"train_loss": -6.653439044952393, "global_step": 134067, "epoch": 3192} {"train_loss": -6.656900405883789, "global_step": 134068, "epoch": 3192} {"train_loss": -6.659599304199219, "global_step": 134069, "epoch": 3192} {"train_loss": -6.739651203155518, "global_step": 134070, "epoch": 3192} {"train_loss": -6.673431873321533, "global_step": 134071, "epoch": 3192} {"train_loss": -6.655117034912109, "global_step": 134072, "epoch": 3192} {"train_loss": -6.647069454193115, "global_step": 134073, "epoch": 3192} {"train_loss": -6.681256294250488, "global_step": 134074, "epoch": 3192} {"train_loss": -6.665477752685547, "global_step": 134075, "epoch": 3192} {"train_loss": -6.676941871643066, "global_step": 134076, "epoch": 3192} {"train_loss": -6.680810451507568, "global_step": 134077, "epoch": 3192} {"train_loss": -6.727802753448486, "global_step": 134078, "epoch": 3192} {"train_loss": -6.69130277633667, "global_step": 134079, "epoch": 3192} {"train_loss": -6.6084794998168945, "global_step": 134080, "epoch": 3192} {"train_loss": -6.670663833618164, "global_step": 134081, "epoch": 3192} {"train_loss": -6.621503829956055, "global_step": 134082, "epoch": 3192} {"train_loss": -6.692471027374268, "global_step": 134083, "epoch": 3192} {"train_loss": -6.695664405822754, "global_step": 134084, "epoch": 3192} {"train_loss": -6.756220817565918, "global_step": 134085, "epoch": 3192} {"train_loss": -6.613552093505859, "global_step": 134086, "epoch": 3192} {"train_loss": -6.655670166015625, "global_step": 134087, "epoch": 3192} {"train_loss": -6.6469035148620605, "global_step": 134088, "epoch": 3192} {"train_loss": -6.644215106964111, "global_step": 134089, "epoch": 3192} {"train_loss": -6.661553859710693, "global_step": 134090, "epoch": 3192} {"train_loss": -6.580094337463379, "global_step": 134091, "epoch": 3192} {"train_loss": -6.548683166503906, "global_step": 134092, "epoch": 3192} {"train_loss": -6.64310359954834, "global_step": 134093, "epoch": 3192} {"train_loss": -6.648133277893066, "global_step": 134094, "epoch": 3192} {"train_loss": -6.697351455688477, "global_step": 134095, "epoch": 3192} {"train_loss": -6.649696350097656, "global_step": 134096, "epoch": 3192} {"train_loss": -6.792250156402588, "global_step": 134097, "epoch": 3192} {"train_loss": -6.655562400817871, "global_step": 134098, "epoch": 3192} {"train_loss": -6.629009246826172, "global_step": 134099, "epoch": 3192} {"train_loss": -6.7298688888549805, "global_step": 134100, "epoch": 3192} {"train_loss": -6.665616989135742, "global_step": 134101, "epoch": 3192} {"train_loss": -6.654965400695801, "global_step": 134102, "epoch": 3192} {"train_loss": -6.64703369140625, "global_step": 134103, "epoch": 3192} {"train_loss": -6.757823467254639, "global_step": 134104, "epoch": 3192} {"train_loss": -6.66722499756586, "global_step": 134105, "epoch": 3192, "val_loss": 68369.53125} {"train_loss": -6.778755187988281, "global_step": 134106, "epoch": 3193} {"train_loss": -6.6703057289123535, "global_step": 134107, "epoch": 3193} {"train_loss": -6.758700370788574, "global_step": 134108, "epoch": 3193} {"train_loss": -6.813505172729492, "global_step": 134109, "epoch": 3193} {"train_loss": -6.776712417602539, "global_step": 134110, "epoch": 3193} {"train_loss": -6.610967636108398, "global_step": 134111, "epoch": 3193} {"train_loss": -6.810662269592285, "global_step": 134112, "epoch": 3193} {"train_loss": -6.545104026794434, "global_step": 134113, "epoch": 3193} {"train_loss": -6.606902599334717, "global_step": 134114, "epoch": 3193} {"train_loss": -6.6590752601623535, "global_step": 134115, "epoch": 3193} {"train_loss": -6.621404647827148, "global_step": 134116, "epoch": 3193} {"train_loss": -6.691802024841309, "global_step": 134117, "epoch": 3193} {"train_loss": -6.671314239501953, "global_step": 134118, "epoch": 3193} {"train_loss": -6.553632736206055, "global_step": 134119, "epoch": 3193} {"train_loss": -6.674777507781982, "global_step": 134120, "epoch": 3193} {"train_loss": -6.604643821716309, "global_step": 134121, "epoch": 3193} {"train_loss": -6.649234771728516, "global_step": 134122, "epoch": 3193} {"train_loss": -6.666404724121094, "global_step": 134123, "epoch": 3193} {"train_loss": -6.605869293212891, "global_step": 134124, "epoch": 3193} {"train_loss": -6.744824409484863, "global_step": 134125, "epoch": 3193} {"train_loss": -6.570436954498291, "global_step": 134126, "epoch": 3193} {"train_loss": -6.730763912200928, "global_step": 134127, "epoch": 3193} {"train_loss": -6.648889064788818, "global_step": 134128, "epoch": 3193} {"train_loss": -6.792749404907227, "global_step": 134129, "epoch": 3193} {"train_loss": -6.515322685241699, "global_step": 134130, "epoch": 3193} {"train_loss": -6.686894416809082, "global_step": 134131, "epoch": 3193} {"train_loss": -6.600131034851074, "global_step": 134132, "epoch": 3193} {"train_loss": -6.659773826599121, "global_step": 134133, "epoch": 3193} {"train_loss": -6.668946266174316, "global_step": 134134, "epoch": 3193} {"train_loss": -6.69210147857666, "global_step": 134135, "epoch": 3193} {"train_loss": -6.654412269592285, "global_step": 134136, "epoch": 3193} {"train_loss": -6.675065994262695, "global_step": 134137, "epoch": 3193} {"train_loss": -6.679544448852539, "global_step": 134138, "epoch": 3193} {"train_loss": -6.598443031311035, "global_step": 134139, "epoch": 3193} {"train_loss": -6.677678108215332, "global_step": 134140, "epoch": 3193} {"train_loss": -6.654387474060059, "global_step": 134141, "epoch": 3193} {"train_loss": -6.546817302703857, "global_step": 134142, "epoch": 3193} {"train_loss": -6.589493751525879, "global_step": 134143, "epoch": 3193} {"train_loss": -6.683653831481934, "global_step": 134144, "epoch": 3193} {"train_loss": -6.699897766113281, "global_step": 134145, "epoch": 3193} {"train_loss": -6.7557244300842285, "global_step": 134146, "epoch": 3193} {"train_loss": -6.663076502936227, "global_step": 134147, "epoch": 3193, "val_loss": 68315.953125} {"train_loss": -6.704730033874512, "global_step": 134148, "epoch": 3194} {"train_loss": -6.656691551208496, "global_step": 134149, "epoch": 3194} {"train_loss": -6.723485946655273, "global_step": 134150, "epoch": 3194} {"train_loss": -6.619173049926758, "global_step": 134151, "epoch": 3194} {"train_loss": -6.65508508682251, "global_step": 134152, "epoch": 3194} {"train_loss": -6.626237392425537, "global_step": 134153, "epoch": 3194} {"train_loss": -6.710236549377441, "global_step": 134154, "epoch": 3194} {"train_loss": -6.785147666931152, "global_step": 134155, "epoch": 3194} {"train_loss": -6.670427322387695, "global_step": 134156, "epoch": 3194} {"train_loss": -6.68028450012207, "global_step": 134157, "epoch": 3194} {"train_loss": -6.88002347946167, "global_step": 134158, "epoch": 3194} {"train_loss": -6.7176923751831055, "global_step": 134159, "epoch": 3194} {"train_loss": -6.704812049865723, "global_step": 134160, "epoch": 3194} {"train_loss": -6.716629981994629, "global_step": 134161, "epoch": 3194} {"train_loss": -6.7606987953186035, "global_step": 134162, "epoch": 3194} {"train_loss": -6.689386367797852, "global_step": 134163, "epoch": 3194} {"train_loss": -6.739630222320557, "global_step": 134164, "epoch": 3194} {"train_loss": -6.859615802764893, "global_step": 134165, "epoch": 3194} {"train_loss": -6.607882022857666, "global_step": 134166, "epoch": 3194} {"train_loss": -6.81790828704834, "global_step": 134167, "epoch": 3194} {"train_loss": -6.5792131423950195, "global_step": 134168, "epoch": 3194} {"train_loss": -6.711580276489258, "global_step": 134169, "epoch": 3194} {"train_loss": -6.70704984664917, "global_step": 134170, "epoch": 3194} {"train_loss": -6.687055587768555, "global_step": 134171, "epoch": 3194} {"train_loss": -6.613450527191162, "global_step": 134172, "epoch": 3194} {"train_loss": -6.730184555053711, "global_step": 134173, "epoch": 3194} {"train_loss": -6.811718463897705, "global_step": 134174, "epoch": 3194} {"train_loss": -6.710619926452637, "global_step": 134175, "epoch": 3194} {"train_loss": -6.735453128814697, "global_step": 134176, "epoch": 3194} {"train_loss": -6.640151500701904, "global_step": 134177, "epoch": 3194} {"train_loss": -6.669563293457031, "global_step": 134178, "epoch": 3194} {"train_loss": -6.624719142913818, "global_step": 134179, "epoch": 3194} {"train_loss": -6.7278218269348145, "global_step": 134180, "epoch": 3194} {"train_loss": -6.676968574523926, "global_step": 134181, "epoch": 3194} {"train_loss": -6.601039409637451, "global_step": 134182, "epoch": 3194} {"train_loss": -6.718355655670166, "global_step": 134183, "epoch": 3194} {"train_loss": -6.780937194824219, "global_step": 134184, "epoch": 3194} {"train_loss": -6.805882453918457, "global_step": 134185, "epoch": 3194} {"train_loss": -6.668266773223877, "global_step": 134186, "epoch": 3194} {"train_loss": -6.532049179077148, "global_step": 134187, "epoch": 3194} {"train_loss": -6.74498176574707, "global_step": 134188, "epoch": 3194} {"train_loss": -6.6990870634714765, "global_step": 134189, "epoch": 3194, "val_loss": 68300.7890625} {"train_loss": -6.56137752532959, "global_step": 134190, "epoch": 3195} {"train_loss": -6.818641662597656, "global_step": 134191, "epoch": 3195} {"train_loss": -6.482216835021973, "global_step": 134192, "epoch": 3195} {"train_loss": -6.703094482421875, "global_step": 134193, "epoch": 3195} {"train_loss": -6.607545852661133, "global_step": 134194, "epoch": 3195} {"train_loss": -6.711470603942871, "global_step": 134195, "epoch": 3195} {"train_loss": -6.761838912963867, "global_step": 134196, "epoch": 3195} {"train_loss": -6.681789398193359, "global_step": 134197, "epoch": 3195} {"train_loss": -6.662825584411621, "global_step": 134198, "epoch": 3195} {"train_loss": -6.715538501739502, "global_step": 134199, "epoch": 3195} {"train_loss": -6.577393531799316, "global_step": 134200, "epoch": 3195} {"train_loss": -6.719889163970947, "global_step": 134201, "epoch": 3195} {"train_loss": -6.672985076904297, "global_step": 134202, "epoch": 3195} {"train_loss": -6.667797088623047, "global_step": 134203, "epoch": 3195} {"train_loss": -6.436014175415039, "global_step": 134204, "epoch": 3195} {"train_loss": -6.65826416015625, "global_step": 134205, "epoch": 3195} {"train_loss": -6.56938362121582, "global_step": 134206, "epoch": 3195} {"train_loss": -6.4668731689453125, "global_step": 134207, "epoch": 3195} {"train_loss": -6.653936386108398, "global_step": 134208, "epoch": 3195} {"train_loss": -6.614734649658203, "global_step": 134209, "epoch": 3195} {"train_loss": -6.6184797286987305, "global_step": 134210, "epoch": 3195} {"train_loss": -6.542566776275635, "global_step": 134211, "epoch": 3195} {"train_loss": -6.55760383605957, "global_step": 134212, "epoch": 3195} {"train_loss": -6.561058044433594, "global_step": 134213, "epoch": 3195} {"train_loss": -6.565940856933594, "global_step": 134214, "epoch": 3195} {"train_loss": -6.669798851013184, "global_step": 134215, "epoch": 3195} {"train_loss": -6.643128395080566, "global_step": 134216, "epoch": 3195} {"train_loss": -6.655440330505371, "global_step": 134217, "epoch": 3195} {"train_loss": -6.622171401977539, "global_step": 134218, "epoch": 3195} {"train_loss": -6.5903167724609375, "global_step": 134219, "epoch": 3195} {"train_loss": -6.739144325256348, "global_step": 134220, "epoch": 3195} {"train_loss": -6.638616561889648, "global_step": 134221, "epoch": 3195} {"train_loss": -6.62023401260376, "global_step": 134222, "epoch": 3195} {"train_loss": -6.672263145446777, "global_step": 134223, "epoch": 3195} {"train_loss": -6.771388053894043, "global_step": 134224, "epoch": 3195} {"train_loss": -6.696315765380859, "global_step": 134225, "epoch": 3195} {"train_loss": -6.569356918334961, "global_step": 134226, "epoch": 3195} {"train_loss": -6.659472942352295, "global_step": 134227, "epoch": 3195} {"train_loss": -6.638665199279785, "global_step": 134228, "epoch": 3195} {"train_loss": -6.605418682098389, "global_step": 134229, "epoch": 3195} {"train_loss": -6.662501335144043, "global_step": 134230, "epoch": 3195} {"train_loss": -6.63510925429208, "global_step": 134231, "epoch": 3195, "val_loss": 68262.0078125} {"train_loss": -6.641205787658691, "global_step": 134232, "epoch": 3196} {"train_loss": -6.693704605102539, "global_step": 134233, "epoch": 3196} {"train_loss": -6.668064117431641, "global_step": 134234, "epoch": 3196} {"train_loss": -6.602878570556641, "global_step": 134235, "epoch": 3196} {"train_loss": -6.747738361358643, "global_step": 134236, "epoch": 3196} {"train_loss": -6.593869686126709, "global_step": 134237, "epoch": 3196} {"train_loss": -6.643738746643066, "global_step": 134238, "epoch": 3196} {"train_loss": -6.694554328918457, "global_step": 134239, "epoch": 3196} {"train_loss": -6.777581691741943, "global_step": 134240, "epoch": 3196} {"train_loss": -6.590348243713379, "global_step": 134241, "epoch": 3196} {"train_loss": -6.645207405090332, "global_step": 134242, "epoch": 3196} {"train_loss": -6.570314407348633, "global_step": 134243, "epoch": 3196} {"train_loss": -6.717708587646484, "global_step": 134244, "epoch": 3196} {"train_loss": -6.657426834106445, "global_step": 134245, "epoch": 3196} {"train_loss": -6.60572624206543, "global_step": 134246, "epoch": 3196} {"train_loss": -6.65684700012207, "global_step": 134247, "epoch": 3196} {"train_loss": -6.602357864379883, "global_step": 134248, "epoch": 3196} {"train_loss": -6.65102481842041, "global_step": 134249, "epoch": 3196} {"train_loss": -6.54625940322876, "global_step": 134250, "epoch": 3196} {"train_loss": -6.523842811584473, "global_step": 134251, "epoch": 3196} {"train_loss": -6.679295063018799, "global_step": 134252, "epoch": 3196} {"train_loss": -6.4662981033325195, "global_step": 134253, "epoch": 3196} {"train_loss": -6.601354598999023, "global_step": 134254, "epoch": 3196} {"train_loss": -6.719154357910156, "global_step": 134255, "epoch": 3196} {"train_loss": -6.592466354370117, "global_step": 134256, "epoch": 3196} {"train_loss": -6.629362106323242, "global_step": 134257, "epoch": 3196} {"train_loss": -6.604653358459473, "global_step": 134258, "epoch": 3196} {"train_loss": -6.744143486022949, "global_step": 134259, "epoch": 3196} {"train_loss": -6.623635292053223, "global_step": 134260, "epoch": 3196} {"train_loss": -6.6145501136779785, "global_step": 134261, "epoch": 3196} {"train_loss": -6.654097557067871, "global_step": 134262, "epoch": 3196} {"train_loss": -6.5799665451049805, "global_step": 134263, "epoch": 3196} {"train_loss": -6.659472465515137, "global_step": 134264, "epoch": 3196} {"train_loss": -6.728323936462402, "global_step": 134265, "epoch": 3196} {"train_loss": -6.652263641357422, "global_step": 134266, "epoch": 3196} {"train_loss": -6.731761932373047, "global_step": 134267, "epoch": 3196} {"train_loss": -6.635435104370117, "global_step": 134268, "epoch": 3196} {"train_loss": -6.625812530517578, "global_step": 134269, "epoch": 3196} {"train_loss": -6.78087043762207, "global_step": 134270, "epoch": 3196} {"train_loss": -6.671502113342285, "global_step": 134271, "epoch": 3196} {"train_loss": -6.724249839782715, "global_step": 134272, "epoch": 3196} {"train_loss": -6.646883919125512, "global_step": 134273, "epoch": 3196, "val_loss": 68375.5078125} {"train_loss": -6.714421272277832, "global_step": 134274, "epoch": 3197} {"train_loss": -6.812570095062256, "global_step": 134275, "epoch": 3197} {"train_loss": -6.573011875152588, "global_step": 134276, "epoch": 3197} {"train_loss": -6.703402519226074, "global_step": 134277, "epoch": 3197} {"train_loss": -6.716499328613281, "global_step": 134278, "epoch": 3197} {"train_loss": -6.570908546447754, "global_step": 134279, "epoch": 3197} {"train_loss": -6.455203056335449, "global_step": 134280, "epoch": 3197} {"train_loss": -6.765822410583496, "global_step": 134281, "epoch": 3197} {"train_loss": -6.703831672668457, "global_step": 134282, "epoch": 3197} {"train_loss": -6.562522888183594, "global_step": 134283, "epoch": 3197} {"train_loss": -6.562308311462402, "global_step": 134284, "epoch": 3197} {"train_loss": -6.501679420471191, "global_step": 134285, "epoch": 3197} {"train_loss": -6.549832820892334, "global_step": 134286, "epoch": 3197} {"train_loss": -6.680924892425537, "global_step": 134287, "epoch": 3197} {"train_loss": -6.560272216796875, "global_step": 134288, "epoch": 3197} {"train_loss": -6.491212844848633, "global_step": 134289, "epoch": 3197} {"train_loss": -6.6143798828125, "global_step": 134290, "epoch": 3197} {"train_loss": -6.67669153213501, "global_step": 134291, "epoch": 3197} {"train_loss": -6.66881799697876, "global_step": 134292, "epoch": 3197} {"train_loss": -6.57355260848999, "global_step": 134293, "epoch": 3197} {"train_loss": -6.619682312011719, "global_step": 134294, "epoch": 3197} {"train_loss": -6.663771152496338, "global_step": 134295, "epoch": 3197} {"train_loss": -6.531609535217285, "global_step": 134296, "epoch": 3197} {"train_loss": -6.623344421386719, "global_step": 134297, "epoch": 3197} {"train_loss": -6.537675857543945, "global_step": 134298, "epoch": 3197} {"train_loss": -6.667132377624512, "global_step": 134299, "epoch": 3197} {"train_loss": -6.6286540031433105, "global_step": 134300, "epoch": 3197} {"train_loss": -6.589193344116211, "global_step": 134301, "epoch": 3197} {"train_loss": -6.563158988952637, "global_step": 134302, "epoch": 3197} {"train_loss": -6.71110725402832, "global_step": 134303, "epoch": 3197} {"train_loss": -6.68601131439209, "global_step": 134304, "epoch": 3197} {"train_loss": -6.665067672729492, "global_step": 134305, "epoch": 3197} {"train_loss": -6.726743698120117, "global_step": 134306, "epoch": 3197} {"train_loss": -6.7937846183776855, "global_step": 134307, "epoch": 3197} {"train_loss": -6.601178169250488, "global_step": 134308, "epoch": 3197} {"train_loss": -6.651514053344727, "global_step": 134309, "epoch": 3197} {"train_loss": -6.723150730133057, "global_step": 134310, "epoch": 3197} {"train_loss": -6.606490135192871, "global_step": 134311, "epoch": 3197} {"train_loss": -6.578813076019287, "global_step": 134312, "epoch": 3197} {"train_loss": -6.699795722961426, "global_step": 134313, "epoch": 3197} {"train_loss": -6.597247123718262, "global_step": 134314, "epoch": 3197} {"train_loss": -6.633013010025024, "global_step": 134315, "epoch": 3197, "val_loss": 68198.46875} {"train_loss": -6.5795488357543945, "global_step": 134316, "epoch": 3198} {"train_loss": -6.628795623779297, "global_step": 134317, "epoch": 3198} {"train_loss": -6.645697593688965, "global_step": 134318, "epoch": 3198} {"train_loss": -6.771627426147461, "global_step": 134319, "epoch": 3198} {"train_loss": -6.648085594177246, "global_step": 134320, "epoch": 3198} {"train_loss": -6.751368999481201, "global_step": 134321, "epoch": 3198} {"train_loss": -6.529681205749512, "global_step": 134322, "epoch": 3198} {"train_loss": -6.7175445556640625, "global_step": 134323, "epoch": 3198} {"train_loss": -6.686481952667236, "global_step": 134324, "epoch": 3198} {"train_loss": -6.65859317779541, "global_step": 134325, "epoch": 3198} {"train_loss": -6.624682426452637, "global_step": 134326, "epoch": 3198} {"train_loss": -6.693304061889648, "global_step": 134327, "epoch": 3198} {"train_loss": -6.643472194671631, "global_step": 134328, "epoch": 3198} {"train_loss": -6.708184242248535, "global_step": 134329, "epoch": 3198} {"train_loss": -6.706952095031738, "global_step": 134330, "epoch": 3198} {"train_loss": -6.750871658325195, "global_step": 134331, "epoch": 3198} {"train_loss": -6.655940055847168, "global_step": 134332, "epoch": 3198} {"train_loss": -6.6079487800598145, "global_step": 134333, "epoch": 3198} {"train_loss": -6.716052532196045, "global_step": 134334, "epoch": 3198} {"train_loss": -6.680769920349121, "global_step": 134335, "epoch": 3198} {"train_loss": -6.634055137634277, "global_step": 134336, "epoch": 3198} {"train_loss": -6.694862365722656, "global_step": 134337, "epoch": 3198} {"train_loss": -6.728578090667725, "global_step": 134338, "epoch": 3198} {"train_loss": -6.729210376739502, "global_step": 134339, "epoch": 3198} {"train_loss": -6.5056023597717285, "global_step": 134340, "epoch": 3198} {"train_loss": -6.686945915222168, "global_step": 134341, "epoch": 3198} {"train_loss": -6.5923309326171875, "global_step": 134342, "epoch": 3198} {"train_loss": -6.6504435539245605, "global_step": 134343, "epoch": 3198} {"train_loss": -6.568452835083008, "global_step": 134344, "epoch": 3198} {"train_loss": -6.656423091888428, "global_step": 134345, "epoch": 3198} {"train_loss": -6.673182487487793, "global_step": 134346, "epoch": 3198} {"train_loss": -6.691369533538818, "global_step": 134347, "epoch": 3198} {"train_loss": -6.6592183113098145, "global_step": 134348, "epoch": 3198} {"train_loss": -6.622380256652832, "global_step": 134349, "epoch": 3198} {"train_loss": -6.724269866943359, "global_step": 134350, "epoch": 3198} {"train_loss": -6.6845855712890625, "global_step": 134351, "epoch": 3198} {"train_loss": -6.746617317199707, "global_step": 134352, "epoch": 3198} {"train_loss": -6.655256271362305, "global_step": 134353, "epoch": 3198} {"train_loss": -6.680593490600586, "global_step": 134354, "epoch": 3198} {"train_loss": -6.6516265869140625, "global_step": 134355, "epoch": 3198} {"train_loss": -6.784693717956543, "global_step": 134356, "epoch": 3198} {"train_loss": -6.668612184978667, "global_step": 134357, "epoch": 3198, "val_loss": 68208.703125} {"train_loss": -6.726106643676758, "global_step": 134358, "epoch": 3199} {"train_loss": -6.735564231872559, "global_step": 134359, "epoch": 3199} {"train_loss": -6.639919281005859, "global_step": 134360, "epoch": 3199} {"train_loss": -6.619964599609375, "global_step": 134361, "epoch": 3199} {"train_loss": -6.62930965423584, "global_step": 134362, "epoch": 3199} {"train_loss": -6.5961408615112305, "global_step": 134363, "epoch": 3199} {"train_loss": -6.743844032287598, "global_step": 134364, "epoch": 3199} {"train_loss": -6.625889778137207, "global_step": 134365, "epoch": 3199} {"train_loss": -6.639225959777832, "global_step": 134366, "epoch": 3199} {"train_loss": -6.632030010223389, "global_step": 134367, "epoch": 3199} {"train_loss": -6.620000839233398, "global_step": 134368, "epoch": 3199} {"train_loss": -6.698797225952148, "global_step": 134369, "epoch": 3199} {"train_loss": -6.594278335571289, "global_step": 134370, "epoch": 3199} {"train_loss": -6.617256164550781, "global_step": 134371, "epoch": 3199} {"train_loss": -6.747345924377441, "global_step": 134372, "epoch": 3199} {"train_loss": -6.618136405944824, "global_step": 134373, "epoch": 3199} {"train_loss": -6.609744548797607, "global_step": 134374, "epoch": 3199} {"train_loss": -6.642192840576172, "global_step": 134375, "epoch": 3199} {"train_loss": -6.585808753967285, "global_step": 134376, "epoch": 3199} {"train_loss": -6.624567985534668, "global_step": 134377, "epoch": 3199} {"train_loss": -6.713687896728516, "global_step": 134378, "epoch": 3199} {"train_loss": -6.642148971557617, "global_step": 134379, "epoch": 3199} {"train_loss": -6.528547286987305, "global_step": 134380, "epoch": 3199} {"train_loss": -6.734309196472168, "global_step": 134381, "epoch": 3199} {"train_loss": -6.667954444885254, "global_step": 134382, "epoch": 3199} {"train_loss": -6.603830337524414, "global_step": 134383, "epoch": 3199} {"train_loss": -6.6930460929870605, "global_step": 134384, "epoch": 3199} {"train_loss": -6.571257591247559, "global_step": 134385, "epoch": 3199} {"train_loss": -6.555376052856445, "global_step": 134386, "epoch": 3199} {"train_loss": -6.687644958496094, "global_step": 134387, "epoch": 3199} {"train_loss": -6.593039035797119, "global_step": 134388, "epoch": 3199} {"train_loss": -6.694390296936035, "global_step": 134389, "epoch": 3199} {"train_loss": -6.674951553344727, "global_step": 134390, "epoch": 3199} {"train_loss": -6.423709869384766, "global_step": 134391, "epoch": 3199} {"train_loss": -6.685039520263672, "global_step": 134392, "epoch": 3199} {"train_loss": -6.588289260864258, "global_step": 134393, "epoch": 3199} {"train_loss": -6.614306449890137, "global_step": 134394, "epoch": 3199} {"train_loss": -6.718572616577148, "global_step": 134395, "epoch": 3199} {"train_loss": -6.748887062072754, "global_step": 134396, "epoch": 3199} {"train_loss": -6.653586387634277, "global_step": 134397, "epoch": 3199} {"train_loss": -6.748269557952881, "global_step": 134398, "epoch": 3199} {"train_loss": -6.648499874841599, "global_step": 134399, "epoch": 3199, "val_loss": 68377.1015625} {"train_loss": -6.684635162353516, "global_step": 134400, "epoch": 3200} {"train_loss": -6.686225891113281, "global_step": 134401, "epoch": 3200} {"train_loss": -6.688336372375488, "global_step": 134402, "epoch": 3200} {"train_loss": -6.683589935302734, "global_step": 134403, "epoch": 3200} {"train_loss": -6.652706146240234, "global_step": 134404, "epoch": 3200} {"train_loss": -6.659460067749023, "global_step": 134405, "epoch": 3200} {"train_loss": -6.719801425933838, "global_step": 134406, "epoch": 3200} {"train_loss": -6.71211051940918, "global_step": 134407, "epoch": 3200} {"train_loss": -6.742269992828369, "global_step": 134408, "epoch": 3200} {"train_loss": -6.70913028717041, "global_step": 134409, "epoch": 3200} {"train_loss": -6.823185443878174, "global_step": 134410, "epoch": 3200} {"train_loss": -6.733950614929199, "global_step": 134411, "epoch": 3200} {"train_loss": -6.703125953674316, "global_step": 134412, "epoch": 3200} {"train_loss": -6.46364164352417, "global_step": 134413, "epoch": 3200} {"train_loss": -6.769407272338867, "global_step": 134414, "epoch": 3200} {"train_loss": -6.748276710510254, "global_step": 134415, "epoch": 3200} {"train_loss": -6.6457839012146, "global_step": 134416, "epoch": 3200} {"train_loss": -6.734993934631348, "global_step": 134417, "epoch": 3200} {"train_loss": -6.766111850738525, "global_step": 134418, "epoch": 3200} {"train_loss": -6.708987236022949, "global_step": 134419, "epoch": 3200} {"train_loss": -6.8132476806640625, "global_step": 134420, "epoch": 3200} {"train_loss": -6.757261276245117, "global_step": 134421, "epoch": 3200} {"train_loss": -6.721861362457275, "global_step": 134422, "epoch": 3200} {"train_loss": -6.6655097007751465, "global_step": 134423, "epoch": 3200} {"train_loss": -6.729753017425537, "global_step": 134424, "epoch": 3200} {"train_loss": -6.749172210693359, "global_step": 134425, "epoch": 3200} {"train_loss": -6.673606872558594, "global_step": 134426, "epoch": 3200} {"train_loss": -6.759457588195801, "global_step": 134427, "epoch": 3200} {"train_loss": -6.702731132507324, "global_step": 134428, "epoch": 3200} {"train_loss": -6.745238780975342, "global_step": 134429, "epoch": 3200} {"train_loss": -6.723743438720703, "global_step": 134430, "epoch": 3200} {"train_loss": -6.720039367675781, "global_step": 134431, "epoch": 3200} {"train_loss": -6.693968296051025, "global_step": 134432, "epoch": 3200} {"train_loss": -6.6856913566589355, "global_step": 134433, "epoch": 3200} {"train_loss": -6.724792957305908, "global_step": 134434, "epoch": 3200} {"train_loss": -6.687854766845703, "global_step": 134435, "epoch": 3200} {"train_loss": -6.741360664367676, "global_step": 134436, "epoch": 3200} {"train_loss": -6.756017684936523, "global_step": 134437, "epoch": 3200} {"train_loss": -6.6553544998168945, "global_step": 134438, "epoch": 3200} {"train_loss": -6.628835678100586, "global_step": 134439, "epoch": 3200} {"train_loss": -6.532569885253906, "global_step": 134440, "epoch": 3200} {"train_loss": -6.705284981500535, "global_step": 134441, "epoch": 3200, "train/sim_max_reward_0": 0.20340448517424478, "train/sim_max_reward_1": 0.9290960594357686, "train/sim_max_reward_2": 0.9560359631498039, "train/sim_max_reward_3": 0.1327386480096774, "train/sim_max_reward_4": 0.4471668870762479, "train/sim_max_reward_5": 0.9926658497395391, "test/sim_max_reward_4400000": 0.28924463135179246, "test/sim_max_reward_4400001": 0.12397815573135028, "test/sim_max_reward_4400002": 0.9829310004229825, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9379939660883505, "test/sim_max_reward_4400006": 0.9942406933336423, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9760678895080152, "test/sim_max_reward_4400010": 0.9141551957969087, "test/sim_max_reward_4400011": 0.29669556062965213, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9753283127563481, "test/sim_max_reward_4400014": 0.15934003712029607, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.04707449642786001, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23179749038705133, "test/sim_max_reward_4400019": 0.5802674666412975, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.3223558289361299, "test/sim_max_reward_4400023": 0.8077122624610735, "test/sim_max_reward_4400024": 0.9671621701259144, "test/sim_max_reward_4400025": 0.2601135234862481, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.082028171649879, "test/sim_max_reward_4400028": 0.39960512533983905, "test/sim_max_reward_4400029": 0.4974638006309321, "test/sim_max_reward_4400030": 0.9978369701624931, "test/sim_max_reward_4400031": 0.9120903615962241, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9893236144609222, "test/sim_max_reward_4400034": 0.9555858346976116, "test/sim_max_reward_4400035": 0.6206621936968534, "test/sim_max_reward_4400036": 0.32618734173795194, "test/sim_max_reward_4400037": 0.8893405438441363, "test/sim_max_reward_4400038": 0.9365835773748172, "test/sim_max_reward_4400039": 0.9850204460342821, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9396872089856212, "test/sim_max_reward_4400042": 0.9133450808842388, "test/sim_max_reward_4400043": 0.9888872531288185, "test/sim_max_reward_4400044": 0.7933993745500292, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8624959573468829, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.9681667095536395, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.6101846487642136, "test/mean_score": 0.5767033843739876, "val_loss": 68236.5703125} {"train_loss": -6.770196914672852, "global_step": 134442, "epoch": 3201} {"train_loss": -6.529440879821777, "global_step": 134443, "epoch": 3201} {"train_loss": -6.822690963745117, "global_step": 134444, "epoch": 3201} {"train_loss": -6.595759391784668, "global_step": 134445, "epoch": 3201} {"train_loss": -6.5975494384765625, "global_step": 134446, "epoch": 3201} {"train_loss": -6.748490810394287, "global_step": 134447, "epoch": 3201} {"train_loss": -6.398393630981445, "global_step": 134448, "epoch": 3201} {"train_loss": -6.616687774658203, "global_step": 134449, "epoch": 3201} {"train_loss": -6.561336517333984, "global_step": 134450, "epoch": 3201} {"train_loss": -6.650887489318848, "global_step": 134451, "epoch": 3201} {"train_loss": -6.614632606506348, "global_step": 134452, "epoch": 3201} {"train_loss": -6.579738616943359, "global_step": 134453, "epoch": 3201} {"train_loss": -6.52298641204834, "global_step": 134454, "epoch": 3201} {"train_loss": -6.611356258392334, "global_step": 134455, "epoch": 3201} {"train_loss": -6.651324272155762, "global_step": 134456, "epoch": 3201} {"train_loss": -6.596534729003906, "global_step": 134457, "epoch": 3201} {"train_loss": -6.671810150146484, "global_step": 134458, "epoch": 3201} {"train_loss": -6.627551078796387, "global_step": 134459, "epoch": 3201} {"train_loss": -6.664240837097168, "global_step": 134460, "epoch": 3201} {"train_loss": -6.684968948364258, "global_step": 134461, "epoch": 3201} {"train_loss": -6.566826820373535, "global_step": 134462, "epoch": 3201} {"train_loss": -6.681069850921631, "global_step": 134463, "epoch": 3201} {"train_loss": -6.685611248016357, "global_step": 134464, "epoch": 3201} {"train_loss": -6.692978382110596, "global_step": 134465, "epoch": 3201} {"train_loss": -6.551080226898193, "global_step": 134466, "epoch": 3201} {"train_loss": -6.688663959503174, "global_step": 134467, "epoch": 3201} {"train_loss": -6.650437355041504, "global_step": 134468, "epoch": 3201} {"train_loss": -6.628221035003662, "global_step": 134469, "epoch": 3201} {"train_loss": -6.727155685424805, "global_step": 134470, "epoch": 3201} {"train_loss": -6.682376861572266, "global_step": 134471, "epoch": 3201} {"train_loss": -6.541609764099121, "global_step": 134472, "epoch": 3201} {"train_loss": -6.548022270202637, "global_step": 134473, "epoch": 3201} {"train_loss": -6.654088020324707, "global_step": 134474, "epoch": 3201} {"train_loss": -6.778168678283691, "global_step": 134475, "epoch": 3201} {"train_loss": -6.559966087341309, "global_step": 134476, "epoch": 3201} {"train_loss": -6.737547397613525, "global_step": 134477, "epoch": 3201} {"train_loss": -6.652459144592285, "global_step": 134478, "epoch": 3201} {"train_loss": -6.735511302947998, "global_step": 134479, "epoch": 3201} {"train_loss": -6.576605796813965, "global_step": 134480, "epoch": 3201} {"train_loss": -6.657499313354492, "global_step": 134481, "epoch": 3201} {"train_loss": -6.532506942749023, "global_step": 134482, "epoch": 3201} {"train_loss": -6.6367647761390325, "global_step": 134483, "epoch": 3201, "val_loss": 68371.6640625} {"train_loss": -6.641075134277344, "global_step": 134484, "epoch": 3202} {"train_loss": -6.807099342346191, "global_step": 134485, "epoch": 3202} {"train_loss": -6.483325481414795, "global_step": 134486, "epoch": 3202} {"train_loss": -6.454934120178223, "global_step": 134487, "epoch": 3202} {"train_loss": -6.646420478820801, "global_step": 134488, "epoch": 3202} {"train_loss": -6.508116722106934, "global_step": 134489, "epoch": 3202} {"train_loss": -6.654151916503906, "global_step": 134490, "epoch": 3202} {"train_loss": -6.546136856079102, "global_step": 134491, "epoch": 3202} {"train_loss": -6.504899024963379, "global_step": 134492, "epoch": 3202} {"train_loss": -6.668148994445801, "global_step": 134493, "epoch": 3202} {"train_loss": -6.424698829650879, "global_step": 134494, "epoch": 3202} {"train_loss": -6.578584671020508, "global_step": 134495, "epoch": 3202} {"train_loss": -6.405686855316162, "global_step": 134496, "epoch": 3202} {"train_loss": -6.513683319091797, "global_step": 134497, "epoch": 3202} {"train_loss": -6.485567092895508, "global_step": 134498, "epoch": 3202} {"train_loss": -6.70867919921875, "global_step": 134499, "epoch": 3202} {"train_loss": -6.507277488708496, "global_step": 134500, "epoch": 3202} {"train_loss": -6.824154853820801, "global_step": 134501, "epoch": 3202} {"train_loss": -6.541311264038086, "global_step": 134502, "epoch": 3202} {"train_loss": -6.666352272033691, "global_step": 134503, "epoch": 3202} {"train_loss": -6.570187568664551, "global_step": 134504, "epoch": 3202} {"train_loss": -6.622646808624268, "global_step": 134505, "epoch": 3202} {"train_loss": -6.597997188568115, "global_step": 134506, "epoch": 3202} {"train_loss": -6.619722366333008, "global_step": 134507, "epoch": 3202} {"train_loss": -6.631845951080322, "global_step": 134508, "epoch": 3202} {"train_loss": -6.661026954650879, "global_step": 134509, "epoch": 3202} {"train_loss": -6.524028778076172, "global_step": 134510, "epoch": 3202} {"train_loss": -6.719050884246826, "global_step": 134511, "epoch": 3202} {"train_loss": -6.553343296051025, "global_step": 134512, "epoch": 3202} {"train_loss": -6.621159076690674, "global_step": 134513, "epoch": 3202} {"train_loss": -6.628138542175293, "global_step": 134514, "epoch": 3202} {"train_loss": -6.608724594116211, "global_step": 134515, "epoch": 3202} {"train_loss": -6.615814208984375, "global_step": 134516, "epoch": 3202} {"train_loss": -6.621969223022461, "global_step": 134517, "epoch": 3202} {"train_loss": -6.664698123931885, "global_step": 134518, "epoch": 3202} {"train_loss": -6.606960773468018, "global_step": 134519, "epoch": 3202} {"train_loss": -6.617674827575684, "global_step": 134520, "epoch": 3202} {"train_loss": -6.505340576171875, "global_step": 134521, "epoch": 3202} {"train_loss": -6.648967742919922, "global_step": 134522, "epoch": 3202} {"train_loss": -6.5927252769470215, "global_step": 134523, "epoch": 3202} {"train_loss": -6.628182411193848, "global_step": 134524, "epoch": 3202} {"train_loss": -6.598842155365717, "global_step": 134525, "epoch": 3202, "val_loss": 68020.2734375} {"train_loss": -6.659769535064697, "global_step": 134526, "epoch": 3203} {"train_loss": -6.695886611938477, "global_step": 134527, "epoch": 3203} {"train_loss": -6.565008163452148, "global_step": 134528, "epoch": 3203} {"train_loss": -6.638892650604248, "global_step": 134529, "epoch": 3203} {"train_loss": -6.579831123352051, "global_step": 134530, "epoch": 3203} {"train_loss": -6.647421836853027, "global_step": 134531, "epoch": 3203} {"train_loss": -6.668615341186523, "global_step": 134532, "epoch": 3203} {"train_loss": -6.596540451049805, "global_step": 134533, "epoch": 3203} {"train_loss": -6.6820855140686035, "global_step": 134534, "epoch": 3203} {"train_loss": -6.435323238372803, "global_step": 134535, "epoch": 3203} {"train_loss": -6.567334175109863, "global_step": 134536, "epoch": 3203} {"train_loss": -6.546749114990234, "global_step": 134537, "epoch": 3203} {"train_loss": -6.437236785888672, "global_step": 134538, "epoch": 3203} {"train_loss": -6.5890069007873535, "global_step": 134539, "epoch": 3203} {"train_loss": -6.552151679992676, "global_step": 134540, "epoch": 3203} {"train_loss": -6.679431915283203, "global_step": 134541, "epoch": 3203} {"train_loss": -6.620391845703125, "global_step": 134542, "epoch": 3203} {"train_loss": -6.530302047729492, "global_step": 134543, "epoch": 3203} {"train_loss": -6.624762535095215, "global_step": 134544, "epoch": 3203} {"train_loss": -6.652096271514893, "global_step": 134545, "epoch": 3203} {"train_loss": -6.548545837402344, "global_step": 134546, "epoch": 3203} {"train_loss": -6.617336273193359, "global_step": 134547, "epoch": 3203} {"train_loss": -6.684714317321777, "global_step": 134548, "epoch": 3203} {"train_loss": -6.597208499908447, "global_step": 134549, "epoch": 3203} {"train_loss": -6.554169654846191, "global_step": 134550, "epoch": 3203} {"train_loss": -6.592254638671875, "global_step": 134551, "epoch": 3203} {"train_loss": -6.614464282989502, "global_step": 134552, "epoch": 3203} {"train_loss": -6.591626167297363, "global_step": 134553, "epoch": 3203} {"train_loss": -6.640237808227539, "global_step": 134554, "epoch": 3203} {"train_loss": -6.615622043609619, "global_step": 134555, "epoch": 3203} {"train_loss": -6.646761894226074, "global_step": 134556, "epoch": 3203} {"train_loss": -6.592728614807129, "global_step": 134557, "epoch": 3203} {"train_loss": -6.611114501953125, "global_step": 134558, "epoch": 3203} {"train_loss": -6.621469497680664, "global_step": 134559, "epoch": 3203} {"train_loss": -6.542577266693115, "global_step": 134560, "epoch": 3203} {"train_loss": -6.732166290283203, "global_step": 134561, "epoch": 3203} {"train_loss": -6.642025947570801, "global_step": 134562, "epoch": 3203} {"train_loss": -6.600696563720703, "global_step": 134563, "epoch": 3203} {"train_loss": -6.630842685699463, "global_step": 134564, "epoch": 3203} {"train_loss": -6.673645973205566, "global_step": 134565, "epoch": 3203} {"train_loss": -6.623071193695068, "global_step": 134566, "epoch": 3203} {"train_loss": -6.609448432922363, "global_step": 134567, "epoch": 3203, "val_loss": 68317.6796875} {"train_loss": -6.701364517211914, "global_step": 134568, "epoch": 3204} {"train_loss": -6.582721710205078, "global_step": 134569, "epoch": 3204} {"train_loss": -6.6449127197265625, "global_step": 134570, "epoch": 3204} {"train_loss": -6.589219093322754, "global_step": 134571, "epoch": 3204} {"train_loss": -6.691179275512695, "global_step": 134572, "epoch": 3204} {"train_loss": -6.646315574645996, "global_step": 134573, "epoch": 3204} {"train_loss": -6.60683536529541, "global_step": 134574, "epoch": 3204} {"train_loss": -6.585509777069092, "global_step": 134575, "epoch": 3204} {"train_loss": -6.548605918884277, "global_step": 134576, "epoch": 3204} {"train_loss": -6.510718822479248, "global_step": 134577, "epoch": 3204} {"train_loss": -6.566051483154297, "global_step": 134578, "epoch": 3204} {"train_loss": -6.591455459594727, "global_step": 134579, "epoch": 3204} {"train_loss": -6.751287937164307, "global_step": 134580, "epoch": 3204} {"train_loss": -6.635714530944824, "global_step": 134581, "epoch": 3204} {"train_loss": -6.718067169189453, "global_step": 134582, "epoch": 3204} {"train_loss": -6.632954120635986, "global_step": 134583, "epoch": 3204} {"train_loss": -6.64531135559082, "global_step": 134584, "epoch": 3204} {"train_loss": -6.681964874267578, "global_step": 134585, "epoch": 3204} {"train_loss": -6.6792402267456055, "global_step": 134586, "epoch": 3204} {"train_loss": -6.599172115325928, "global_step": 134587, "epoch": 3204} {"train_loss": -6.683859825134277, "global_step": 134588, "epoch": 3204} {"train_loss": -6.673153877258301, "global_step": 134589, "epoch": 3204} {"train_loss": -6.6203460693359375, "global_step": 134590, "epoch": 3204} {"train_loss": -6.579934120178223, "global_step": 134591, "epoch": 3204} {"train_loss": -6.543801307678223, "global_step": 134592, "epoch": 3204} {"train_loss": -6.641457557678223, "global_step": 134593, "epoch": 3204} {"train_loss": -6.651037693023682, "global_step": 134594, "epoch": 3204} {"train_loss": -6.629439353942871, "global_step": 134595, "epoch": 3204} {"train_loss": -6.5367889404296875, "global_step": 134596, "epoch": 3204} {"train_loss": -6.624059677124023, "global_step": 134597, "epoch": 3204} {"train_loss": -6.5850300788879395, "global_step": 134598, "epoch": 3204} {"train_loss": -6.705086708068848, "global_step": 134599, "epoch": 3204} {"train_loss": -6.624971866607666, "global_step": 134600, "epoch": 3204} {"train_loss": -6.50661563873291, "global_step": 134601, "epoch": 3204} {"train_loss": -6.735925674438477, "global_step": 134602, "epoch": 3204} {"train_loss": -6.656652450561523, "global_step": 134603, "epoch": 3204} {"train_loss": -6.595611572265625, "global_step": 134604, "epoch": 3204} {"train_loss": -6.678290367126465, "global_step": 134605, "epoch": 3204} {"train_loss": -6.548371315002441, "global_step": 134606, "epoch": 3204} {"train_loss": -6.7048444747924805, "global_step": 134607, "epoch": 3204} {"train_loss": -6.597034454345703, "global_step": 134608, "epoch": 3204} {"train_loss": -6.6285191377003985, "global_step": 134609, "epoch": 3204, "val_loss": 68167.8046875} {"train_loss": -6.673630714416504, "global_step": 134610, "epoch": 3205} {"train_loss": -6.570748329162598, "global_step": 134611, "epoch": 3205} {"train_loss": -6.717769145965576, "global_step": 134612, "epoch": 3205} {"train_loss": -6.825264930725098, "global_step": 134613, "epoch": 3205} {"train_loss": -6.676369667053223, "global_step": 134614, "epoch": 3205} {"train_loss": -6.63553524017334, "global_step": 134615, "epoch": 3205} {"train_loss": -6.701907157897949, "global_step": 134616, "epoch": 3205} {"train_loss": -6.719259738922119, "global_step": 134617, "epoch": 3205} {"train_loss": -6.675199508666992, "global_step": 134618, "epoch": 3205} {"train_loss": -6.750688552856445, "global_step": 134619, "epoch": 3205} {"train_loss": -6.651700019836426, "global_step": 134620, "epoch": 3205} {"train_loss": -6.657351493835449, "global_step": 134621, "epoch": 3205} {"train_loss": -6.809063911437988, "global_step": 134622, "epoch": 3205} {"train_loss": -6.6808905601501465, "global_step": 134623, "epoch": 3205} {"train_loss": -6.779655456542969, "global_step": 134624, "epoch": 3205} {"train_loss": -6.696969509124756, "global_step": 134625, "epoch": 3205} {"train_loss": -6.679114818572998, "global_step": 134626, "epoch": 3205} {"train_loss": -6.777118682861328, "global_step": 134627, "epoch": 3205} {"train_loss": -6.648388385772705, "global_step": 134628, "epoch": 3205} {"train_loss": -6.623185157775879, "global_step": 134629, "epoch": 3205} {"train_loss": -6.761857032775879, "global_step": 134630, "epoch": 3205} {"train_loss": -6.7861127853393555, "global_step": 134631, "epoch": 3205} {"train_loss": -6.664080619812012, "global_step": 134632, "epoch": 3205} {"train_loss": -6.655160903930664, "global_step": 134633, "epoch": 3205} {"train_loss": -6.531577110290527, "global_step": 134634, "epoch": 3205} {"train_loss": -6.5006890296936035, "global_step": 134635, "epoch": 3205} {"train_loss": -6.726839542388916, "global_step": 134636, "epoch": 3205} {"train_loss": -6.732354640960693, "global_step": 134637, "epoch": 3205} {"train_loss": -6.669022083282471, "global_step": 134638, "epoch": 3205} {"train_loss": -6.703333854675293, "global_step": 134639, "epoch": 3205} {"train_loss": -6.684315204620361, "global_step": 134640, "epoch": 3205} {"train_loss": -6.727080345153809, "global_step": 134641, "epoch": 3205} {"train_loss": -6.702643871307373, "global_step": 134642, "epoch": 3205} {"train_loss": -6.582207679748535, "global_step": 134643, "epoch": 3205} {"train_loss": -6.648846626281738, "global_step": 134644, "epoch": 3205} {"train_loss": -6.606570720672607, "global_step": 134645, "epoch": 3205} {"train_loss": -6.672894477844238, "global_step": 134646, "epoch": 3205} {"train_loss": -6.6731038093566895, "global_step": 134647, "epoch": 3205} {"train_loss": -6.701962471008301, "global_step": 134648, "epoch": 3205} {"train_loss": -6.707991600036621, "global_step": 134649, "epoch": 3205} {"train_loss": -6.676783084869385, "global_step": 134650, "epoch": 3205} {"train_loss": -6.68482045900254, "global_step": 134651, "epoch": 3205, "val_loss": 68271.4375} {"train_loss": -6.718704700469971, "global_step": 134652, "epoch": 3206} {"train_loss": -6.547914505004883, "global_step": 134653, "epoch": 3206} {"train_loss": -6.694296360015869, "global_step": 134654, "epoch": 3206} {"train_loss": -6.627572059631348, "global_step": 134655, "epoch": 3206} {"train_loss": -6.6097412109375, "global_step": 134656, "epoch": 3206} {"train_loss": -6.792394638061523, "global_step": 134657, "epoch": 3206} {"train_loss": -6.847037315368652, "global_step": 134658, "epoch": 3206} {"train_loss": -6.704006195068359, "global_step": 134659, "epoch": 3206} {"train_loss": -6.716352462768555, "global_step": 134660, "epoch": 3206} {"train_loss": -6.705495834350586, "global_step": 134661, "epoch": 3206} {"train_loss": -6.66019868850708, "global_step": 134662, "epoch": 3206} {"train_loss": -6.737360000610352, "global_step": 134663, "epoch": 3206} {"train_loss": -6.750331878662109, "global_step": 134664, "epoch": 3206} {"train_loss": -6.625060081481934, "global_step": 134665, "epoch": 3206} {"train_loss": -6.735257625579834, "global_step": 134666, "epoch": 3206} {"train_loss": -6.741733074188232, "global_step": 134667, "epoch": 3206} {"train_loss": -6.614494323730469, "global_step": 134668, "epoch": 3206} {"train_loss": -6.647635459899902, "global_step": 134669, "epoch": 3206} {"train_loss": -6.552617073059082, "global_step": 134670, "epoch": 3206} {"train_loss": -6.698850631713867, "global_step": 134671, "epoch": 3206} {"train_loss": -6.748720169067383, "global_step": 134672, "epoch": 3206} {"train_loss": -6.6467132568359375, "global_step": 134673, "epoch": 3206} {"train_loss": -6.701043128967285, "global_step": 134674, "epoch": 3206} {"train_loss": -6.779521465301514, "global_step": 134675, "epoch": 3206} {"train_loss": -6.682177543640137, "global_step": 134676, "epoch": 3206} {"train_loss": -6.667203903198242, "global_step": 134677, "epoch": 3206} {"train_loss": -6.7668962478637695, "global_step": 134678, "epoch": 3206} {"train_loss": -6.642139434814453, "global_step": 134679, "epoch": 3206} {"train_loss": -6.63837194442749, "global_step": 134680, "epoch": 3206} {"train_loss": -6.6640543937683105, "global_step": 134681, "epoch": 3206} {"train_loss": -6.616780757904053, "global_step": 134682, "epoch": 3206} {"train_loss": -6.7942962646484375, "global_step": 134683, "epoch": 3206} {"train_loss": -6.630609512329102, "global_step": 134684, "epoch": 3206} {"train_loss": -6.7499518394470215, "global_step": 134685, "epoch": 3206} {"train_loss": -6.608854293823242, "global_step": 134686, "epoch": 3206} {"train_loss": -6.599675178527832, "global_step": 134687, "epoch": 3206} {"train_loss": -6.668606281280518, "global_step": 134688, "epoch": 3206} {"train_loss": -6.6009745597839355, "global_step": 134689, "epoch": 3206} {"train_loss": -6.585240364074707, "global_step": 134690, "epoch": 3206} {"train_loss": -6.737282752990723, "global_step": 134691, "epoch": 3206} {"train_loss": -6.673986434936523, "global_step": 134692, "epoch": 3206} {"train_loss": -6.683320374715896, "global_step": 134693, "epoch": 3206, "val_loss": 68527.3203125} {"train_loss": -6.700640678405762, "global_step": 134694, "epoch": 3207} {"train_loss": -6.7462873458862305, "global_step": 134695, "epoch": 3207} {"train_loss": -6.740501403808594, "global_step": 134696, "epoch": 3207} {"train_loss": -6.712238788604736, "global_step": 134697, "epoch": 3207} {"train_loss": -6.6661152839660645, "global_step": 134698, "epoch": 3207} {"train_loss": -6.736303806304932, "global_step": 134699, "epoch": 3207} {"train_loss": -6.691794395446777, "global_step": 134700, "epoch": 3207} {"train_loss": -6.566303253173828, "global_step": 134701, "epoch": 3207} {"train_loss": -6.566195487976074, "global_step": 134702, "epoch": 3207} {"train_loss": -6.652352333068848, "global_step": 134703, "epoch": 3207} {"train_loss": -6.659392356872559, "global_step": 134704, "epoch": 3207} {"train_loss": -6.756425857543945, "global_step": 134705, "epoch": 3207} {"train_loss": -6.657258987426758, "global_step": 134706, "epoch": 3207} {"train_loss": -6.6255574226379395, "global_step": 134707, "epoch": 3207} {"train_loss": -6.751012325286865, "global_step": 134708, "epoch": 3207} {"train_loss": -6.717870712280273, "global_step": 134709, "epoch": 3207} {"train_loss": -6.711082458496094, "global_step": 134710, "epoch": 3207} {"train_loss": -6.794353008270264, "global_step": 134711, "epoch": 3207} {"train_loss": -6.73879337310791, "global_step": 134712, "epoch": 3207} {"train_loss": -6.760746002197266, "global_step": 134713, "epoch": 3207} {"train_loss": -6.626523017883301, "global_step": 134714, "epoch": 3207} {"train_loss": -6.68633508682251, "global_step": 134715, "epoch": 3207} {"train_loss": -6.662387371063232, "global_step": 134716, "epoch": 3207} {"train_loss": -6.671937465667725, "global_step": 134717, "epoch": 3207} {"train_loss": -6.76942777633667, "global_step": 134718, "epoch": 3207} {"train_loss": -6.609164237976074, "global_step": 134719, "epoch": 3207} {"train_loss": -6.641071796417236, "global_step": 134720, "epoch": 3207} {"train_loss": -6.706093788146973, "global_step": 134721, "epoch": 3207} {"train_loss": -6.651541709899902, "global_step": 134722, "epoch": 3207} {"train_loss": -6.699136734008789, "global_step": 134723, "epoch": 3207} {"train_loss": -6.755017280578613, "global_step": 134724, "epoch": 3207} {"train_loss": -6.632309913635254, "global_step": 134725, "epoch": 3207} {"train_loss": -6.661812782287598, "global_step": 134726, "epoch": 3207} {"train_loss": -6.757678031921387, "global_step": 134727, "epoch": 3207} {"train_loss": -6.666286468505859, "global_step": 134728, "epoch": 3207} {"train_loss": -6.798111438751221, "global_step": 134729, "epoch": 3207} {"train_loss": -6.637711524963379, "global_step": 134730, "epoch": 3207} {"train_loss": -6.629175662994385, "global_step": 134731, "epoch": 3207} {"train_loss": -6.653873443603516, "global_step": 134732, "epoch": 3207} {"train_loss": -6.617332458496094, "global_step": 134733, "epoch": 3207} {"train_loss": -6.609479904174805, "global_step": 134734, "epoch": 3207} {"train_loss": -6.683039415450323, "global_step": 134735, "epoch": 3207, "val_loss": 68439.5859375} {"train_loss": -6.65628719329834, "global_step": 134736, "epoch": 3208} {"train_loss": -6.704155445098877, "global_step": 134737, "epoch": 3208} {"train_loss": -6.692241191864014, "global_step": 134738, "epoch": 3208} {"train_loss": -6.707559585571289, "global_step": 134739, "epoch": 3208} {"train_loss": -6.791862487792969, "global_step": 134740, "epoch": 3208} {"train_loss": -6.592452049255371, "global_step": 134741, "epoch": 3208} {"train_loss": -6.593191623687744, "global_step": 134742, "epoch": 3208} {"train_loss": -6.624794960021973, "global_step": 134743, "epoch": 3208} {"train_loss": -6.616337776184082, "global_step": 134744, "epoch": 3208} {"train_loss": -6.674744606018066, "global_step": 134745, "epoch": 3208} {"train_loss": -6.5283308029174805, "global_step": 134746, "epoch": 3208} {"train_loss": -6.713220596313477, "global_step": 134747, "epoch": 3208} {"train_loss": -6.674686908721924, "global_step": 134748, "epoch": 3208} {"train_loss": -6.598109245300293, "global_step": 134749, "epoch": 3208} {"train_loss": -6.6646270751953125, "global_step": 134750, "epoch": 3208} {"train_loss": -6.609091281890869, "global_step": 134751, "epoch": 3208} {"train_loss": -6.626771926879883, "global_step": 134752, "epoch": 3208} {"train_loss": -6.789191722869873, "global_step": 134753, "epoch": 3208} {"train_loss": -6.669057369232178, "global_step": 134754, "epoch": 3208} {"train_loss": -6.703161239624023, "global_step": 134755, "epoch": 3208} {"train_loss": -6.6500654220581055, "global_step": 134756, "epoch": 3208} {"train_loss": -6.744139671325684, "global_step": 134757, "epoch": 3208} {"train_loss": -6.629344940185547, "global_step": 134758, "epoch": 3208} {"train_loss": -6.721564292907715, "global_step": 134759, "epoch": 3208} {"train_loss": -6.692552089691162, "global_step": 134760, "epoch": 3208} {"train_loss": -6.640149116516113, "global_step": 134761, "epoch": 3208} {"train_loss": -6.671441078186035, "global_step": 134762, "epoch": 3208} {"train_loss": -6.530481338500977, "global_step": 134763, "epoch": 3208} {"train_loss": -6.644199371337891, "global_step": 134764, "epoch": 3208} {"train_loss": -6.713766098022461, "global_step": 134765, "epoch": 3208} {"train_loss": -6.7004570960998535, "global_step": 134766, "epoch": 3208} {"train_loss": -6.731863021850586, "global_step": 134767, "epoch": 3208} {"train_loss": -6.634324073791504, "global_step": 134768, "epoch": 3208} {"train_loss": -6.735935211181641, "global_step": 134769, "epoch": 3208} {"train_loss": -6.585906028747559, "global_step": 134770, "epoch": 3208} {"train_loss": -6.665214538574219, "global_step": 134771, "epoch": 3208} {"train_loss": -6.677893161773682, "global_step": 134772, "epoch": 3208} {"train_loss": -6.693904876708984, "global_step": 134773, "epoch": 3208} {"train_loss": -6.7117919921875, "global_step": 134774, "epoch": 3208} {"train_loss": -6.756467819213867, "global_step": 134775, "epoch": 3208} {"train_loss": -6.619232177734375, "global_step": 134776, "epoch": 3208} {"train_loss": -6.664975847516741, "global_step": 134777, "epoch": 3208, "val_loss": 68261.2109375} {"train_loss": -6.7567291259765625, "global_step": 134778, "epoch": 3209} {"train_loss": -6.653166770935059, "global_step": 134779, "epoch": 3209} {"train_loss": -6.643892288208008, "global_step": 134780, "epoch": 3209} {"train_loss": -6.65138578414917, "global_step": 134781, "epoch": 3209} {"train_loss": -6.701279640197754, "global_step": 134782, "epoch": 3209} {"train_loss": -6.536038398742676, "global_step": 134783, "epoch": 3209} {"train_loss": -6.669432640075684, "global_step": 134784, "epoch": 3209} {"train_loss": -6.7338361740112305, "global_step": 134785, "epoch": 3209} {"train_loss": -6.63289737701416, "global_step": 134786, "epoch": 3209} {"train_loss": -6.640198707580566, "global_step": 134787, "epoch": 3209} {"train_loss": -6.637320518493652, "global_step": 134788, "epoch": 3209} {"train_loss": -6.575922966003418, "global_step": 134789, "epoch": 3209} {"train_loss": -6.782062530517578, "global_step": 134790, "epoch": 3209} {"train_loss": -6.612625598907471, "global_step": 134791, "epoch": 3209} {"train_loss": -6.737851619720459, "global_step": 134792, "epoch": 3209} {"train_loss": -6.668519020080566, "global_step": 134793, "epoch": 3209} {"train_loss": -6.628871917724609, "global_step": 134794, "epoch": 3209} {"train_loss": -6.674473285675049, "global_step": 134795, "epoch": 3209} {"train_loss": -6.643564701080322, "global_step": 134796, "epoch": 3209} {"train_loss": -6.765791416168213, "global_step": 134797, "epoch": 3209} {"train_loss": -6.724699974060059, "global_step": 134798, "epoch": 3209} {"train_loss": -6.80677604675293, "global_step": 134799, "epoch": 3209} {"train_loss": -6.6803507804870605, "global_step": 134800, "epoch": 3209} {"train_loss": -6.632708549499512, "global_step": 134801, "epoch": 3209} {"train_loss": -6.691802501678467, "global_step": 134802, "epoch": 3209} {"train_loss": -6.647456169128418, "global_step": 134803, "epoch": 3209} {"train_loss": -6.623311996459961, "global_step": 134804, "epoch": 3209} {"train_loss": -6.642318248748779, "global_step": 134805, "epoch": 3209} {"train_loss": -6.693484306335449, "global_step": 134806, "epoch": 3209} {"train_loss": -6.658926963806152, "global_step": 134807, "epoch": 3209} {"train_loss": -6.71483039855957, "global_step": 134808, "epoch": 3209} {"train_loss": -6.703885078430176, "global_step": 134809, "epoch": 3209} {"train_loss": -6.591302871704102, "global_step": 134810, "epoch": 3209} {"train_loss": -6.660286903381348, "global_step": 134811, "epoch": 3209} {"train_loss": -6.6496357917785645, "global_step": 134812, "epoch": 3209} {"train_loss": -6.658352851867676, "global_step": 134813, "epoch": 3209} {"train_loss": -6.650357246398926, "global_step": 134814, "epoch": 3209} {"train_loss": -6.593508720397949, "global_step": 134815, "epoch": 3209} {"train_loss": -6.738231182098389, "global_step": 134816, "epoch": 3209} {"train_loss": -6.547384262084961, "global_step": 134817, "epoch": 3209} {"train_loss": -6.714537143707275, "global_step": 134818, "epoch": 3209} {"train_loss": -6.670381443841117, "global_step": 134819, "epoch": 3209, "val_loss": 68224.7578125} {"train_loss": -6.643864154815674, "global_step": 134820, "epoch": 3210} {"train_loss": -6.6643266677856445, "global_step": 134821, "epoch": 3210} {"train_loss": -6.747535705566406, "global_step": 134822, "epoch": 3210} {"train_loss": -6.724034786224365, "global_step": 134823, "epoch": 3210} {"train_loss": -6.644460201263428, "global_step": 134824, "epoch": 3210} {"train_loss": -6.549169540405273, "global_step": 134825, "epoch": 3210} {"train_loss": -6.514036178588867, "global_step": 134826, "epoch": 3210} {"train_loss": -6.692469596862793, "global_step": 134827, "epoch": 3210} {"train_loss": -6.626086235046387, "global_step": 134828, "epoch": 3210} {"train_loss": -6.566011905670166, "global_step": 134829, "epoch": 3210} {"train_loss": -6.754008769989014, "global_step": 134830, "epoch": 3210} {"train_loss": -6.605673313140869, "global_step": 134831, "epoch": 3210} {"train_loss": -6.575965404510498, "global_step": 134832, "epoch": 3210} {"train_loss": -6.793851375579834, "global_step": 134833, "epoch": 3210} {"train_loss": -6.613185882568359, "global_step": 134834, "epoch": 3210} {"train_loss": -6.626679420471191, "global_step": 134835, "epoch": 3210} {"train_loss": -6.670731067657471, "global_step": 134836, "epoch": 3210} {"train_loss": -6.628442287445068, "global_step": 134837, "epoch": 3210} {"train_loss": -6.723795413970947, "global_step": 134838, "epoch": 3210} {"train_loss": -6.585480690002441, "global_step": 134839, "epoch": 3210} {"train_loss": -6.681204795837402, "global_step": 134840, "epoch": 3210} {"train_loss": -6.678608417510986, "global_step": 134841, "epoch": 3210} {"train_loss": -6.619253158569336, "global_step": 134842, "epoch": 3210} {"train_loss": -6.732527732849121, "global_step": 134843, "epoch": 3210} {"train_loss": -6.6432952880859375, "global_step": 134844, "epoch": 3210} {"train_loss": -6.732565879821777, "global_step": 134845, "epoch": 3210} {"train_loss": -6.825043678283691, "global_step": 134846, "epoch": 3210} {"train_loss": -6.69935417175293, "global_step": 134847, "epoch": 3210} {"train_loss": -6.755847930908203, "global_step": 134848, "epoch": 3210} {"train_loss": -6.6693620681762695, "global_step": 134849, "epoch": 3210} {"train_loss": -6.71577262878418, "global_step": 134850, "epoch": 3210} {"train_loss": -6.724529266357422, "global_step": 134851, "epoch": 3210} {"train_loss": -6.630777359008789, "global_step": 134852, "epoch": 3210} {"train_loss": -6.613025188446045, "global_step": 134853, "epoch": 3210} {"train_loss": -6.706459999084473, "global_step": 134854, "epoch": 3210} {"train_loss": -6.659406661987305, "global_step": 134855, "epoch": 3210} {"train_loss": -6.790672302246094, "global_step": 134856, "epoch": 3210} {"train_loss": -6.815699577331543, "global_step": 134857, "epoch": 3210} {"train_loss": -6.704814910888672, "global_step": 134858, "epoch": 3210} {"train_loss": -6.73554801940918, "global_step": 134859, "epoch": 3210} {"train_loss": -6.660455226898193, "global_step": 134860, "epoch": 3210} {"train_loss": -6.675258693240938, "global_step": 134861, "epoch": 3210, "val_loss": 68301.8984375} {"train_loss": -6.797257423400879, "global_step": 134862, "epoch": 3211} {"train_loss": -6.735330104827881, "global_step": 134863, "epoch": 3211} {"train_loss": -6.658632278442383, "global_step": 134864, "epoch": 3211} {"train_loss": -6.650829315185547, "global_step": 134865, "epoch": 3211} {"train_loss": -6.753591537475586, "global_step": 134866, "epoch": 3211} {"train_loss": -6.677933216094971, "global_step": 134867, "epoch": 3211} {"train_loss": -6.686923980712891, "global_step": 134868, "epoch": 3211} {"train_loss": -6.7081074714660645, "global_step": 134869, "epoch": 3211} {"train_loss": -6.707342147827148, "global_step": 134870, "epoch": 3211} {"train_loss": -6.536945819854736, "global_step": 134871, "epoch": 3211} {"train_loss": -6.710082054138184, "global_step": 134872, "epoch": 3211} {"train_loss": -6.602140426635742, "global_step": 134873, "epoch": 3211} {"train_loss": -6.592344760894775, "global_step": 134874, "epoch": 3211} {"train_loss": -6.6314191818237305, "global_step": 134875, "epoch": 3211} {"train_loss": -6.501487731933594, "global_step": 134876, "epoch": 3211} {"train_loss": -6.505499362945557, "global_step": 134877, "epoch": 3211} {"train_loss": -6.550969123840332, "global_step": 134878, "epoch": 3211} {"train_loss": -6.4970526695251465, "global_step": 134879, "epoch": 3211} {"train_loss": -6.6058268547058105, "global_step": 134880, "epoch": 3211} {"train_loss": -6.4141693115234375, "global_step": 134881, "epoch": 3211} {"train_loss": -6.581053733825684, "global_step": 134882, "epoch": 3211} {"train_loss": -6.561394691467285, "global_step": 134883, "epoch": 3211} {"train_loss": -6.607548713684082, "global_step": 134884, "epoch": 3211} {"train_loss": -6.59245491027832, "global_step": 134885, "epoch": 3211} {"train_loss": -6.609331130981445, "global_step": 134886, "epoch": 3211} {"train_loss": -6.498992919921875, "global_step": 134887, "epoch": 3211} {"train_loss": -6.6058125495910645, "global_step": 134888, "epoch": 3211} {"train_loss": -6.447726249694824, "global_step": 134889, "epoch": 3211} {"train_loss": -6.506480693817139, "global_step": 134890, "epoch": 3211} {"train_loss": -6.640529632568359, "global_step": 134891, "epoch": 3211} {"train_loss": -6.562979221343994, "global_step": 134892, "epoch": 3211} {"train_loss": -6.529779434204102, "global_step": 134893, "epoch": 3211} {"train_loss": -6.560477256774902, "global_step": 134894, "epoch": 3211} {"train_loss": -6.661469459533691, "global_step": 134895, "epoch": 3211} {"train_loss": -6.541880130767822, "global_step": 134896, "epoch": 3211} {"train_loss": -6.637240409851074, "global_step": 134897, "epoch": 3211} {"train_loss": -6.67213249206543, "global_step": 134898, "epoch": 3211} {"train_loss": -6.551009654998779, "global_step": 134899, "epoch": 3211} {"train_loss": -6.659210205078125, "global_step": 134900, "epoch": 3211} {"train_loss": -6.618847370147705, "global_step": 134901, "epoch": 3211} {"train_loss": -6.598452091217041, "global_step": 134902, "epoch": 3211} {"train_loss": -6.606562591734386, "global_step": 134903, "epoch": 3211, "val_loss": 68190.5078125} {"train_loss": -6.735716819763184, "global_step": 134904, "epoch": 3212} {"train_loss": -6.673693656921387, "global_step": 134905, "epoch": 3212} {"train_loss": -6.6190571784973145, "global_step": 134906, "epoch": 3212} {"train_loss": -6.650993347167969, "global_step": 134907, "epoch": 3212} {"train_loss": -6.7715864181518555, "global_step": 134908, "epoch": 3212} {"train_loss": -6.797823905944824, "global_step": 134909, "epoch": 3212} {"train_loss": -6.712967872619629, "global_step": 134910, "epoch": 3212} {"train_loss": -6.728088855743408, "global_step": 134911, "epoch": 3212} {"train_loss": -6.738307952880859, "global_step": 134912, "epoch": 3212} {"train_loss": -6.691516876220703, "global_step": 134913, "epoch": 3212} {"train_loss": -6.693037033081055, "global_step": 134914, "epoch": 3212} {"train_loss": -6.7724432945251465, "global_step": 134915, "epoch": 3212} {"train_loss": -6.679593086242676, "global_step": 134916, "epoch": 3212} {"train_loss": -6.751672744750977, "global_step": 134917, "epoch": 3212} {"train_loss": -6.655688762664795, "global_step": 134918, "epoch": 3212} {"train_loss": -6.725080966949463, "global_step": 134919, "epoch": 3212} {"train_loss": -6.66706657409668, "global_step": 134920, "epoch": 3212} {"train_loss": -6.720893859863281, "global_step": 134921, "epoch": 3212} {"train_loss": -6.7429609298706055, "global_step": 134922, "epoch": 3212} {"train_loss": -6.828611850738525, "global_step": 134923, "epoch": 3212} {"train_loss": -6.720308303833008, "global_step": 134924, "epoch": 3212} {"train_loss": -6.645287036895752, "global_step": 134925, "epoch": 3212} {"train_loss": -6.750482082366943, "global_step": 134926, "epoch": 3212} {"train_loss": -6.671309947967529, "global_step": 134927, "epoch": 3212} {"train_loss": -6.6046857833862305, "global_step": 134928, "epoch": 3212} {"train_loss": -6.675701141357422, "global_step": 134929, "epoch": 3212} {"train_loss": -6.743428707122803, "global_step": 134930, "epoch": 3212} {"train_loss": -6.616630554199219, "global_step": 134931, "epoch": 3212} {"train_loss": -6.651872634887695, "global_step": 134932, "epoch": 3212} {"train_loss": -6.7389068603515625, "global_step": 134933, "epoch": 3212} {"train_loss": -6.638365745544434, "global_step": 134934, "epoch": 3212} {"train_loss": -6.722332954406738, "global_step": 134935, "epoch": 3212} {"train_loss": -6.749720573425293, "global_step": 134936, "epoch": 3212} {"train_loss": -6.617931842803955, "global_step": 134937, "epoch": 3212} {"train_loss": -6.790970802307129, "global_step": 134938, "epoch": 3212} {"train_loss": -6.623806476593018, "global_step": 134939, "epoch": 3212} {"train_loss": -6.710544586181641, "global_step": 134940, "epoch": 3212} {"train_loss": -6.650979042053223, "global_step": 134941, "epoch": 3212} {"train_loss": -6.494229316711426, "global_step": 134942, "epoch": 3212} {"train_loss": -6.540866374969482, "global_step": 134943, "epoch": 3212} {"train_loss": -6.705351829528809, "global_step": 134944, "epoch": 3212} {"train_loss": -6.68967452503386, "global_step": 134945, "epoch": 3212, "val_loss": 68317.96875} {"train_loss": -6.548661231994629, "global_step": 134946, "epoch": 3213} {"train_loss": -6.749475002288818, "global_step": 134947, "epoch": 3213} {"train_loss": -6.6080732345581055, "global_step": 134948, "epoch": 3213} {"train_loss": -6.745244026184082, "global_step": 134949, "epoch": 3213} {"train_loss": -6.582210540771484, "global_step": 134950, "epoch": 3213} {"train_loss": -6.698177814483643, "global_step": 134951, "epoch": 3213} {"train_loss": -6.698272705078125, "global_step": 134952, "epoch": 3213} {"train_loss": -6.614289283752441, "global_step": 134953, "epoch": 3213} {"train_loss": -6.719763278961182, "global_step": 134954, "epoch": 3213} {"train_loss": -6.633551597595215, "global_step": 134955, "epoch": 3213} {"train_loss": -6.605678081512451, "global_step": 134956, "epoch": 3213} {"train_loss": -6.7218403816223145, "global_step": 134957, "epoch": 3213} {"train_loss": -6.563751220703125, "global_step": 134958, "epoch": 3213} {"train_loss": -6.619147300720215, "global_step": 134959, "epoch": 3213} {"train_loss": -6.629632949829102, "global_step": 134960, "epoch": 3213} {"train_loss": -6.6282148361206055, "global_step": 134961, "epoch": 3213} {"train_loss": -6.604915142059326, "global_step": 134962, "epoch": 3213} {"train_loss": -6.72256326675415, "global_step": 134963, "epoch": 3213} {"train_loss": -6.601449012756348, "global_step": 134964, "epoch": 3213} {"train_loss": -6.556893825531006, "global_step": 134965, "epoch": 3213} {"train_loss": -6.51420783996582, "global_step": 134966, "epoch": 3213} {"train_loss": -6.632715225219727, "global_step": 134967, "epoch": 3213} {"train_loss": -6.7333855628967285, "global_step": 134968, "epoch": 3213} {"train_loss": -6.64588737487793, "global_step": 134969, "epoch": 3213} {"train_loss": -6.666762351989746, "global_step": 134970, "epoch": 3213} {"train_loss": -6.68691349029541, "global_step": 134971, "epoch": 3213} {"train_loss": -6.559264183044434, "global_step": 134972, "epoch": 3213} {"train_loss": -6.6599273681640625, "global_step": 134973, "epoch": 3213} {"train_loss": -6.654770374298096, "global_step": 134974, "epoch": 3213} {"train_loss": -6.567300796508789, "global_step": 134975, "epoch": 3213} {"train_loss": -6.541750907897949, "global_step": 134976, "epoch": 3213} {"train_loss": -6.703249931335449, "global_step": 134977, "epoch": 3213} {"train_loss": -6.601714611053467, "global_step": 134978, "epoch": 3213} {"train_loss": -6.63607931137085, "global_step": 134979, "epoch": 3213} {"train_loss": -6.549222946166992, "global_step": 134980, "epoch": 3213} {"train_loss": -6.663547039031982, "global_step": 134981, "epoch": 3213} {"train_loss": -6.611059188842773, "global_step": 134982, "epoch": 3213} {"train_loss": -6.526237487792969, "global_step": 134983, "epoch": 3213} {"train_loss": -6.702930450439453, "global_step": 134984, "epoch": 3213} {"train_loss": -6.722790241241455, "global_step": 134985, "epoch": 3213} {"train_loss": -6.649252414703369, "global_step": 134986, "epoch": 3213} {"train_loss": -6.635295413789295, "global_step": 134987, "epoch": 3213, "val_loss": 68184.6953125} {"train_loss": -6.597762107849121, "global_step": 134988, "epoch": 3214} {"train_loss": -6.594106674194336, "global_step": 134989, "epoch": 3214} {"train_loss": -6.704296112060547, "global_step": 134990, "epoch": 3214} {"train_loss": -6.6629133224487305, "global_step": 134991, "epoch": 3214} {"train_loss": -6.5884480476379395, "global_step": 134992, "epoch": 3214} {"train_loss": -6.59046745300293, "global_step": 134993, "epoch": 3214} {"train_loss": -6.503791809082031, "global_step": 134994, "epoch": 3214} {"train_loss": -6.675551414489746, "global_step": 134995, "epoch": 3214} {"train_loss": -6.610968589782715, "global_step": 134996, "epoch": 3214} {"train_loss": -6.644685745239258, "global_step": 134997, "epoch": 3214} {"train_loss": -6.61594295501709, "global_step": 134998, "epoch": 3214} {"train_loss": -6.694156646728516, "global_step": 134999, "epoch": 3214} {"train_loss": -6.692975997924805, "global_step": 135000, "epoch": 3214} {"train_loss": -6.628715515136719, "global_step": 135001, "epoch": 3214} {"train_loss": -6.817270755767822, "global_step": 135002, "epoch": 3214} {"train_loss": -6.598505973815918, "global_step": 135003, "epoch": 3214} {"train_loss": -6.74693489074707, "global_step": 135004, "epoch": 3214} {"train_loss": -6.728302955627441, "global_step": 135005, "epoch": 3214} {"train_loss": -6.745570659637451, "global_step": 135006, "epoch": 3214} {"train_loss": -6.684692859649658, "global_step": 135007, "epoch": 3214} {"train_loss": -6.7192301750183105, "global_step": 135008, "epoch": 3214} {"train_loss": -6.732827186584473, "global_step": 135009, "epoch": 3214} {"train_loss": -6.654659748077393, "global_step": 135010, "epoch": 3214} {"train_loss": -6.556443214416504, "global_step": 135011, "epoch": 3214} {"train_loss": -6.650002479553223, "global_step": 135012, "epoch": 3214} {"train_loss": -6.646442413330078, "global_step": 135013, "epoch": 3214} {"train_loss": -6.674136161804199, "global_step": 135014, "epoch": 3214} {"train_loss": -6.7373762130737305, "global_step": 135015, "epoch": 3214} {"train_loss": -6.685426712036133, "global_step": 135016, "epoch": 3214} {"train_loss": -6.79550313949585, "global_step": 135017, "epoch": 3214} {"train_loss": -6.809274673461914, "global_step": 135018, "epoch": 3214} {"train_loss": -6.771889686584473, "global_step": 135019, "epoch": 3214} {"train_loss": -6.712558269500732, "global_step": 135020, "epoch": 3214} {"train_loss": -6.66976261138916, "global_step": 135021, "epoch": 3214} {"train_loss": -6.7945051193237305, "global_step": 135022, "epoch": 3214} {"train_loss": -6.63405704498291, "global_step": 135023, "epoch": 3214} {"train_loss": -6.686875343322754, "global_step": 135024, "epoch": 3214} {"train_loss": -6.797726154327393, "global_step": 135025, "epoch": 3214} {"train_loss": -6.699944496154785, "global_step": 135026, "epoch": 3214} {"train_loss": -6.745316505432129, "global_step": 135027, "epoch": 3214} {"train_loss": -6.753287315368652, "global_step": 135028, "epoch": 3214} {"train_loss": -6.682952472141811, "global_step": 135029, "epoch": 3214, "val_loss": 68174.7890625} {"train_loss": -6.602399826049805, "global_step": 135030, "epoch": 3215} {"train_loss": -6.75030517578125, "global_step": 135031, "epoch": 3215} {"train_loss": -6.725255966186523, "global_step": 135032, "epoch": 3215} {"train_loss": -6.749401569366455, "global_step": 135033, "epoch": 3215} {"train_loss": -6.804584503173828, "global_step": 135034, "epoch": 3215} {"train_loss": -6.821475982666016, "global_step": 135035, "epoch": 3215} {"train_loss": -6.64776611328125, "global_step": 135036, "epoch": 3215} {"train_loss": -6.747749328613281, "global_step": 135037, "epoch": 3215} {"train_loss": -6.838935852050781, "global_step": 135038, "epoch": 3215} {"train_loss": -6.6976823806762695, "global_step": 135039, "epoch": 3215} {"train_loss": -6.7031660079956055, "global_step": 135040, "epoch": 3215} {"train_loss": -6.7123703956604, "global_step": 135041, "epoch": 3215} {"train_loss": -6.837096214294434, "global_step": 135042, "epoch": 3215} {"train_loss": -6.83696174621582, "global_step": 135043, "epoch": 3215} {"train_loss": -6.705814838409424, "global_step": 135044, "epoch": 3215} {"train_loss": -6.789855003356934, "global_step": 135045, "epoch": 3215} {"train_loss": -6.719615936279297, "global_step": 135046, "epoch": 3215} {"train_loss": -6.717935562133789, "global_step": 135047, "epoch": 3215} {"train_loss": -6.712026596069336, "global_step": 135048, "epoch": 3215} {"train_loss": -6.497012138366699, "global_step": 135049, "epoch": 3215} {"train_loss": -6.736699104309082, "global_step": 135050, "epoch": 3215} {"train_loss": -6.662688255310059, "global_step": 135051, "epoch": 3215} {"train_loss": -6.658038139343262, "global_step": 135052, "epoch": 3215} {"train_loss": -6.67859411239624, "global_step": 135053, "epoch": 3215} {"train_loss": -6.721161842346191, "global_step": 135054, "epoch": 3215} {"train_loss": -6.7440032958984375, "global_step": 135055, "epoch": 3215} {"train_loss": -6.683008670806885, "global_step": 135056, "epoch": 3215} {"train_loss": -6.719939231872559, "global_step": 135057, "epoch": 3215} {"train_loss": -6.5077714920043945, "global_step": 135058, "epoch": 3215} {"train_loss": -6.570683479309082, "global_step": 135059, "epoch": 3215} {"train_loss": -6.700277805328369, "global_step": 135060, "epoch": 3215} {"train_loss": -6.490415573120117, "global_step": 135061, "epoch": 3215} {"train_loss": -6.617431640625, "global_step": 135062, "epoch": 3215} {"train_loss": -6.611432075500488, "global_step": 135063, "epoch": 3215} {"train_loss": -6.428549766540527, "global_step": 135064, "epoch": 3215} {"train_loss": -6.638723850250244, "global_step": 135065, "epoch": 3215} {"train_loss": -6.575749397277832, "global_step": 135066, "epoch": 3215} {"train_loss": -6.586555480957031, "global_step": 135067, "epoch": 3215} {"train_loss": -6.551455020904541, "global_step": 135068, "epoch": 3215} {"train_loss": -6.582489013671875, "global_step": 135069, "epoch": 3215} {"train_loss": -6.6635966300964355, "global_step": 135070, "epoch": 3215} {"train_loss": -6.674504348209926, "global_step": 135071, "epoch": 3215, "val_loss": 68160.078125} {"train_loss": -6.694929122924805, "global_step": 135072, "epoch": 3216} {"train_loss": -6.71513032913208, "global_step": 135073, "epoch": 3216} {"train_loss": -6.6323652267456055, "global_step": 135074, "epoch": 3216} {"train_loss": -6.664566516876221, "global_step": 135075, "epoch": 3216} {"train_loss": -6.664872646331787, "global_step": 135076, "epoch": 3216} {"train_loss": -6.688291549682617, "global_step": 135077, "epoch": 3216} {"train_loss": -6.770075798034668, "global_step": 135078, "epoch": 3216} {"train_loss": -6.696222305297852, "global_step": 135079, "epoch": 3216} {"train_loss": -6.7779951095581055, "global_step": 135080, "epoch": 3216} {"train_loss": -6.680183410644531, "global_step": 135081, "epoch": 3216} {"train_loss": -6.592079162597656, "global_step": 135082, "epoch": 3216} {"train_loss": -6.685352802276611, "global_step": 135083, "epoch": 3216} {"train_loss": -6.841604232788086, "global_step": 135084, "epoch": 3216} {"train_loss": -6.6808247566223145, "global_step": 135085, "epoch": 3216} {"train_loss": -6.631646633148193, "global_step": 135086, "epoch": 3216} {"train_loss": -6.698856830596924, "global_step": 135087, "epoch": 3216} {"train_loss": -6.7852911949157715, "global_step": 135088, "epoch": 3216} {"train_loss": -6.756796836853027, "global_step": 135089, "epoch": 3216} {"train_loss": -6.736404895782471, "global_step": 135090, "epoch": 3216} {"train_loss": -6.6646599769592285, "global_step": 135091, "epoch": 3216} {"train_loss": -6.78139591217041, "global_step": 135092, "epoch": 3216} {"train_loss": -6.612330436706543, "global_step": 135093, "epoch": 3216} {"train_loss": -6.582149505615234, "global_step": 135094, "epoch": 3216} {"train_loss": -6.636805534362793, "global_step": 135095, "epoch": 3216} {"train_loss": -6.742835998535156, "global_step": 135096, "epoch": 3216} {"train_loss": -6.5871686935424805, "global_step": 135097, "epoch": 3216} {"train_loss": -6.569867134094238, "global_step": 135098, "epoch": 3216} {"train_loss": -6.6851115226745605, "global_step": 135099, "epoch": 3216} {"train_loss": -6.543661594390869, "global_step": 135100, "epoch": 3216} {"train_loss": -6.646091461181641, "global_step": 135101, "epoch": 3216} {"train_loss": -6.5856032371521, "global_step": 135102, "epoch": 3216} {"train_loss": -6.3994574546813965, "global_step": 135103, "epoch": 3216} {"train_loss": -6.640256881713867, "global_step": 135104, "epoch": 3216} {"train_loss": -6.57820987701416, "global_step": 135105, "epoch": 3216} {"train_loss": -6.600618362426758, "global_step": 135106, "epoch": 3216} {"train_loss": -6.704723358154297, "global_step": 135107, "epoch": 3216} {"train_loss": -6.553314208984375, "global_step": 135108, "epoch": 3216} {"train_loss": -6.739964485168457, "global_step": 135109, "epoch": 3216} {"train_loss": -6.5192108154296875, "global_step": 135110, "epoch": 3216} {"train_loss": -6.698674201965332, "global_step": 135111, "epoch": 3216} {"train_loss": -6.552640914916992, "global_step": 135112, "epoch": 3216} {"train_loss": -6.6571991784232, "global_step": 135113, "epoch": 3216, "val_loss": 68185.921875} {"train_loss": -6.604195594787598, "global_step": 135114, "epoch": 3217} {"train_loss": -6.59578800201416, "global_step": 135115, "epoch": 3217} {"train_loss": -6.555299282073975, "global_step": 135116, "epoch": 3217} {"train_loss": -6.604350566864014, "global_step": 135117, "epoch": 3217} {"train_loss": -6.7539591789245605, "global_step": 135118, "epoch": 3217} {"train_loss": -6.552887916564941, "global_step": 135119, "epoch": 3217} {"train_loss": -6.67648458480835, "global_step": 135120, "epoch": 3217} {"train_loss": -6.594098091125488, "global_step": 135121, "epoch": 3217} {"train_loss": -6.622115612030029, "global_step": 135122, "epoch": 3217} {"train_loss": -6.631343841552734, "global_step": 135123, "epoch": 3217} {"train_loss": -6.687135696411133, "global_step": 135124, "epoch": 3217} {"train_loss": -6.576135635375977, "global_step": 135125, "epoch": 3217} {"train_loss": -6.610795974731445, "global_step": 135126, "epoch": 3217} {"train_loss": -6.634201526641846, "global_step": 135127, "epoch": 3217} {"train_loss": -6.729690074920654, "global_step": 135128, "epoch": 3217} {"train_loss": -6.595518112182617, "global_step": 135129, "epoch": 3217} {"train_loss": -6.601243019104004, "global_step": 135130, "epoch": 3217} {"train_loss": -6.598204612731934, "global_step": 135131, "epoch": 3217} {"train_loss": -6.632322311401367, "global_step": 135132, "epoch": 3217} {"train_loss": -6.6139373779296875, "global_step": 135133, "epoch": 3217} {"train_loss": -6.517321586608887, "global_step": 135134, "epoch": 3217} {"train_loss": -6.66234016418457, "global_step": 135135, "epoch": 3217} {"train_loss": -6.612232208251953, "global_step": 135136, "epoch": 3217} {"train_loss": -6.689310073852539, "global_step": 135137, "epoch": 3217} {"train_loss": -6.68709659576416, "global_step": 135138, "epoch": 3217} {"train_loss": -6.673827171325684, "global_step": 135139, "epoch": 3217} {"train_loss": -6.48100471496582, "global_step": 135140, "epoch": 3217} {"train_loss": -6.632495403289795, "global_step": 135141, "epoch": 3217} {"train_loss": -6.564043045043945, "global_step": 135142, "epoch": 3217} {"train_loss": -6.721556663513184, "global_step": 135143, "epoch": 3217} {"train_loss": -6.606854438781738, "global_step": 135144, "epoch": 3217} {"train_loss": -6.591870307922363, "global_step": 135145, "epoch": 3217} {"train_loss": -6.684744358062744, "global_step": 135146, "epoch": 3217} {"train_loss": -6.622174263000488, "global_step": 135147, "epoch": 3217} {"train_loss": -6.660920143127441, "global_step": 135148, "epoch": 3217} {"train_loss": -6.615336894989014, "global_step": 135149, "epoch": 3217} {"train_loss": -6.673252105712891, "global_step": 135150, "epoch": 3217} {"train_loss": -6.6310625076293945, "global_step": 135151, "epoch": 3217} {"train_loss": -6.807325839996338, "global_step": 135152, "epoch": 3217} {"train_loss": -6.56729793548584, "global_step": 135153, "epoch": 3217} {"train_loss": -6.645334243774414, "global_step": 135154, "epoch": 3217} {"train_loss": -6.6290737220219205, "global_step": 135155, "epoch": 3217, "val_loss": 68269.4296875} {"train_loss": -6.448347091674805, "global_step": 135156, "epoch": 3218} {"train_loss": -6.725689888000488, "global_step": 135157, "epoch": 3218} {"train_loss": -6.524895668029785, "global_step": 135158, "epoch": 3218} {"train_loss": -6.726346969604492, "global_step": 135159, "epoch": 3218} {"train_loss": -6.54897403717041, "global_step": 135160, "epoch": 3218} {"train_loss": -6.461624622344971, "global_step": 135161, "epoch": 3218} {"train_loss": -6.6019673347473145, "global_step": 135162, "epoch": 3218} {"train_loss": -6.595616340637207, "global_step": 135163, "epoch": 3218} {"train_loss": -6.704117774963379, "global_step": 135164, "epoch": 3218} {"train_loss": -6.539166450500488, "global_step": 135165, "epoch": 3218} {"train_loss": -6.703537940979004, "global_step": 135166, "epoch": 3218} {"train_loss": -6.4784440994262695, "global_step": 135167, "epoch": 3218} {"train_loss": -6.636205673217773, "global_step": 135168, "epoch": 3218} {"train_loss": -6.5962677001953125, "global_step": 135169, "epoch": 3218} {"train_loss": -6.6923980712890625, "global_step": 135170, "epoch": 3218} {"train_loss": -6.521256446838379, "global_step": 135171, "epoch": 3218} {"train_loss": -6.638906478881836, "global_step": 135172, "epoch": 3218} {"train_loss": -6.811172008514404, "global_step": 135173, "epoch": 3218} {"train_loss": -6.696902751922607, "global_step": 135174, "epoch": 3218} {"train_loss": -6.645272731781006, "global_step": 135175, "epoch": 3218} {"train_loss": -6.766109466552734, "global_step": 135176, "epoch": 3218} {"train_loss": -6.672471046447754, "global_step": 135177, "epoch": 3218} {"train_loss": -6.631924629211426, "global_step": 135178, "epoch": 3218} {"train_loss": -6.696352958679199, "global_step": 135179, "epoch": 3218} {"train_loss": -6.780102729797363, "global_step": 135180, "epoch": 3218} {"train_loss": -6.715434551239014, "global_step": 135181, "epoch": 3218} {"train_loss": -6.766993045806885, "global_step": 135182, "epoch": 3218} {"train_loss": -6.75321102142334, "global_step": 135183, "epoch": 3218} {"train_loss": -6.692601203918457, "global_step": 135184, "epoch": 3218} {"train_loss": -6.583612442016602, "global_step": 135185, "epoch": 3218} {"train_loss": -6.686706066131592, "global_step": 135186, "epoch": 3218} {"train_loss": -6.696966171264648, "global_step": 135187, "epoch": 3218} {"train_loss": -6.692943096160889, "global_step": 135188, "epoch": 3218} {"train_loss": -6.578176498413086, "global_step": 135189, "epoch": 3218} {"train_loss": -6.755668640136719, "global_step": 135190, "epoch": 3218} {"train_loss": -6.687077045440674, "global_step": 135191, "epoch": 3218} {"train_loss": -6.7577104568481445, "global_step": 135192, "epoch": 3218} {"train_loss": -6.740362644195557, "global_step": 135193, "epoch": 3218} {"train_loss": -6.709310531616211, "global_step": 135194, "epoch": 3218} {"train_loss": -6.752908229827881, "global_step": 135195, "epoch": 3218} {"train_loss": -6.746905326843262, "global_step": 135196, "epoch": 3218} {"train_loss": -6.663650932766142, "global_step": 135197, "epoch": 3218, "val_loss": 68117.203125} {"train_loss": -6.6997833251953125, "global_step": 135198, "epoch": 3219} {"train_loss": -6.668333053588867, "global_step": 135199, "epoch": 3219} {"train_loss": -6.734563827514648, "global_step": 135200, "epoch": 3219} {"train_loss": -6.723773002624512, "global_step": 135201, "epoch": 3219} {"train_loss": -6.782796859741211, "global_step": 135202, "epoch": 3219} {"train_loss": -6.633953094482422, "global_step": 135203, "epoch": 3219} {"train_loss": -6.808178901672363, "global_step": 135204, "epoch": 3219} {"train_loss": -6.685519218444824, "global_step": 135205, "epoch": 3219} {"train_loss": -6.597022533416748, "global_step": 135206, "epoch": 3219} {"train_loss": -6.695921897888184, "global_step": 135207, "epoch": 3219} {"train_loss": -6.807528972625732, "global_step": 135208, "epoch": 3219} {"train_loss": -6.668821811676025, "global_step": 135209, "epoch": 3219} {"train_loss": -6.698573112487793, "global_step": 135210, "epoch": 3219} {"train_loss": -6.6418776512146, "global_step": 135211, "epoch": 3219} {"train_loss": -6.6545023918151855, "global_step": 135212, "epoch": 3219} {"train_loss": -6.750574111938477, "global_step": 135213, "epoch": 3219} {"train_loss": -6.606683254241943, "global_step": 135214, "epoch": 3219} {"train_loss": -6.695644855499268, "global_step": 135215, "epoch": 3219} {"train_loss": -6.711830139160156, "global_step": 135216, "epoch": 3219} {"train_loss": -6.749455451965332, "global_step": 135217, "epoch": 3219} {"train_loss": -6.750124931335449, "global_step": 135218, "epoch": 3219} {"train_loss": -6.678772926330566, "global_step": 135219, "epoch": 3219} {"train_loss": -6.698740005493164, "global_step": 135220, "epoch": 3219} {"train_loss": -6.681025981903076, "global_step": 135221, "epoch": 3219} {"train_loss": -6.75462532043457, "global_step": 135222, "epoch": 3219} {"train_loss": -6.8509626388549805, "global_step": 135223, "epoch": 3219} {"train_loss": -6.758644104003906, "global_step": 135224, "epoch": 3219} {"train_loss": -6.530077934265137, "global_step": 135225, "epoch": 3219} {"train_loss": -6.646780014038086, "global_step": 135226, "epoch": 3219} {"train_loss": -6.635701656341553, "global_step": 135227, "epoch": 3219} {"train_loss": -6.681408882141113, "global_step": 135228, "epoch": 3219} {"train_loss": -6.676552772521973, "global_step": 135229, "epoch": 3219} {"train_loss": -6.686710357666016, "global_step": 135230, "epoch": 3219} {"train_loss": -6.6312336921691895, "global_step": 135231, "epoch": 3219} {"train_loss": -6.710589408874512, "global_step": 135232, "epoch": 3219} {"train_loss": -6.480419158935547, "global_step": 135233, "epoch": 3219} {"train_loss": -6.797183990478516, "global_step": 135234, "epoch": 3219} {"train_loss": -6.721757411956787, "global_step": 135235, "epoch": 3219} {"train_loss": -6.689752578735352, "global_step": 135236, "epoch": 3219} {"train_loss": -6.562278747558594, "global_step": 135237, "epoch": 3219} {"train_loss": -6.654808044433594, "global_step": 135238, "epoch": 3219} {"train_loss": -6.687379416965303, "global_step": 135239, "epoch": 3219, "val_loss": 68384.625} {"train_loss": -6.59017276763916, "global_step": 135240, "epoch": 3220} {"train_loss": -6.632950305938721, "global_step": 135241, "epoch": 3220} {"train_loss": -6.750976085662842, "global_step": 135242, "epoch": 3220} {"train_loss": -6.549015998840332, "global_step": 135243, "epoch": 3220} {"train_loss": -6.554567337036133, "global_step": 135244, "epoch": 3220} {"train_loss": -6.684176445007324, "global_step": 135245, "epoch": 3220} {"train_loss": -6.652545928955078, "global_step": 135246, "epoch": 3220} {"train_loss": -6.678290843963623, "global_step": 135247, "epoch": 3220} {"train_loss": -6.583134651184082, "global_step": 135248, "epoch": 3220} {"train_loss": -6.686158657073975, "global_step": 135249, "epoch": 3220} {"train_loss": -6.644746780395508, "global_step": 135250, "epoch": 3220} {"train_loss": -6.672177314758301, "global_step": 135251, "epoch": 3220} {"train_loss": -6.668190956115723, "global_step": 135252, "epoch": 3220} {"train_loss": -6.605053424835205, "global_step": 135253, "epoch": 3220} {"train_loss": -6.624258041381836, "global_step": 135254, "epoch": 3220} {"train_loss": -6.5419440269470215, "global_step": 135255, "epoch": 3220} {"train_loss": -6.623016834259033, "global_step": 135256, "epoch": 3220} {"train_loss": -6.575182914733887, "global_step": 135257, "epoch": 3220} {"train_loss": -6.598656177520752, "global_step": 135258, "epoch": 3220} {"train_loss": -6.651719570159912, "global_step": 135259, "epoch": 3220} {"train_loss": -6.716127395629883, "global_step": 135260, "epoch": 3220} {"train_loss": -6.782989978790283, "global_step": 135261, "epoch": 3220} {"train_loss": -6.64661169052124, "global_step": 135262, "epoch": 3220} {"train_loss": -6.637534141540527, "global_step": 135263, "epoch": 3220} {"train_loss": -6.755317687988281, "global_step": 135264, "epoch": 3220} {"train_loss": -6.685972690582275, "global_step": 135265, "epoch": 3220} {"train_loss": -6.680850505828857, "global_step": 135266, "epoch": 3220} {"train_loss": -6.704195022583008, "global_step": 135267, "epoch": 3220} {"train_loss": -6.723736763000488, "global_step": 135268, "epoch": 3220} {"train_loss": -6.694347381591797, "global_step": 135269, "epoch": 3220} {"train_loss": -6.693519592285156, "global_step": 135270, "epoch": 3220} {"train_loss": -6.6747236251831055, "global_step": 135271, "epoch": 3220} {"train_loss": -6.682612419128418, "global_step": 135272, "epoch": 3220} {"train_loss": -6.717443466186523, "global_step": 135273, "epoch": 3220} {"train_loss": -6.7356414794921875, "global_step": 135274, "epoch": 3220} {"train_loss": -6.759267807006836, "global_step": 135275, "epoch": 3220} {"train_loss": -6.692658424377441, "global_step": 135276, "epoch": 3220} {"train_loss": -6.733389854431152, "global_step": 135277, "epoch": 3220} {"train_loss": -6.662900924682617, "global_step": 135278, "epoch": 3220} {"train_loss": -6.670607566833496, "global_step": 135279, "epoch": 3220} {"train_loss": -6.686216354370117, "global_step": 135280, "epoch": 3220} {"train_loss": -6.666004952930269, "global_step": 135281, "epoch": 3220, "val_loss": 68294.0390625} {"train_loss": -6.749086380004883, "global_step": 135282, "epoch": 3221} {"train_loss": -6.626047134399414, "global_step": 135283, "epoch": 3221} {"train_loss": -6.753314018249512, "global_step": 135284, "epoch": 3221} {"train_loss": -6.634347915649414, "global_step": 135285, "epoch": 3221} {"train_loss": -6.724152565002441, "global_step": 135286, "epoch": 3221} {"train_loss": -6.808704376220703, "global_step": 135287, "epoch": 3221} {"train_loss": -6.7585039138793945, "global_step": 135288, "epoch": 3221} {"train_loss": -6.681081295013428, "global_step": 135289, "epoch": 3221} {"train_loss": -6.711597442626953, "global_step": 135290, "epoch": 3221} {"train_loss": -6.734315395355225, "global_step": 135291, "epoch": 3221} {"train_loss": -6.681794166564941, "global_step": 135292, "epoch": 3221} {"train_loss": -6.692379951477051, "global_step": 135293, "epoch": 3221} {"train_loss": -6.7567009925842285, "global_step": 135294, "epoch": 3221} {"train_loss": -6.688836097717285, "global_step": 135295, "epoch": 3221} {"train_loss": -6.7279767990112305, "global_step": 135296, "epoch": 3221} {"train_loss": -6.655466556549072, "global_step": 135297, "epoch": 3221} {"train_loss": -6.7057318687438965, "global_step": 135298, "epoch": 3221} {"train_loss": -6.637272834777832, "global_step": 135299, "epoch": 3221} {"train_loss": -6.778130054473877, "global_step": 135300, "epoch": 3221} {"train_loss": -6.761967658996582, "global_step": 135301, "epoch": 3221} {"train_loss": -6.748466491699219, "global_step": 135302, "epoch": 3221} {"train_loss": -6.669464588165283, "global_step": 135303, "epoch": 3221} {"train_loss": -6.800941467285156, "global_step": 135304, "epoch": 3221} {"train_loss": -6.7608418464660645, "global_step": 135305, "epoch": 3221} {"train_loss": -6.753760814666748, "global_step": 135306, "epoch": 3221} {"train_loss": -6.629539966583252, "global_step": 135307, "epoch": 3221} {"train_loss": -6.760641098022461, "global_step": 135308, "epoch": 3221} {"train_loss": -6.679854393005371, "global_step": 135309, "epoch": 3221} {"train_loss": -6.626068592071533, "global_step": 135310, "epoch": 3221} {"train_loss": -6.787824630737305, "global_step": 135311, "epoch": 3221} {"train_loss": -6.787994384765625, "global_step": 135312, "epoch": 3221} {"train_loss": -6.7000956535339355, "global_step": 135313, "epoch": 3221} {"train_loss": -6.725987434387207, "global_step": 135314, "epoch": 3221} {"train_loss": -6.638855934143066, "global_step": 135315, "epoch": 3221} {"train_loss": -6.650528430938721, "global_step": 135316, "epoch": 3221} {"train_loss": -6.649467945098877, "global_step": 135317, "epoch": 3221} {"train_loss": -6.789385795593262, "global_step": 135318, "epoch": 3221} {"train_loss": -6.606723308563232, "global_step": 135319, "epoch": 3221} {"train_loss": -6.726178169250488, "global_step": 135320, "epoch": 3221} {"train_loss": -6.706238746643066, "global_step": 135321, "epoch": 3221} {"train_loss": -6.746744155883789, "global_step": 135322, "epoch": 3221} {"train_loss": -6.710037515276954, "global_step": 135323, "epoch": 3221, "val_loss": 68247.4375} {"train_loss": -6.695850372314453, "global_step": 135324, "epoch": 3222} {"train_loss": -6.627273082733154, "global_step": 135325, "epoch": 3222} {"train_loss": -6.747296333312988, "global_step": 135326, "epoch": 3222} {"train_loss": -6.777096271514893, "global_step": 135327, "epoch": 3222} {"train_loss": -6.7261271476745605, "global_step": 135328, "epoch": 3222} {"train_loss": -6.675302505493164, "global_step": 135329, "epoch": 3222} {"train_loss": -6.674557685852051, "global_step": 135330, "epoch": 3222} {"train_loss": -6.7140045166015625, "global_step": 135331, "epoch": 3222} {"train_loss": -6.744755744934082, "global_step": 135332, "epoch": 3222} {"train_loss": -6.656482219696045, "global_step": 135333, "epoch": 3222} {"train_loss": -6.804866790771484, "global_step": 135334, "epoch": 3222} {"train_loss": -6.718517303466797, "global_step": 135335, "epoch": 3222} {"train_loss": -6.737372398376465, "global_step": 135336, "epoch": 3222} {"train_loss": -6.665131568908691, "global_step": 135337, "epoch": 3222} {"train_loss": -6.726813793182373, "global_step": 135338, "epoch": 3222} {"train_loss": -6.720050811767578, "global_step": 135339, "epoch": 3222} {"train_loss": -6.720468521118164, "global_step": 135340, "epoch": 3222} {"train_loss": -6.778428554534912, "global_step": 135341, "epoch": 3222} {"train_loss": -6.634709358215332, "global_step": 135342, "epoch": 3222} {"train_loss": -6.740946292877197, "global_step": 135343, "epoch": 3222} {"train_loss": -6.57438850402832, "global_step": 135344, "epoch": 3222} {"train_loss": -6.587027072906494, "global_step": 135345, "epoch": 3222} {"train_loss": -6.661471366882324, "global_step": 135346, "epoch": 3222} {"train_loss": -6.760477542877197, "global_step": 135347, "epoch": 3222} {"train_loss": -6.652998924255371, "global_step": 135348, "epoch": 3222} {"train_loss": -6.744932174682617, "global_step": 135349, "epoch": 3222} {"train_loss": -6.6380510330200195, "global_step": 135350, "epoch": 3222} {"train_loss": -6.755698204040527, "global_step": 135351, "epoch": 3222} {"train_loss": -6.635127067565918, "global_step": 135352, "epoch": 3222} {"train_loss": -6.6354875564575195, "global_step": 135353, "epoch": 3222} {"train_loss": -6.745196342468262, "global_step": 135354, "epoch": 3222} {"train_loss": -6.79632568359375, "global_step": 135355, "epoch": 3222} {"train_loss": -6.709222793579102, "global_step": 135356, "epoch": 3222} {"train_loss": -6.689884185791016, "global_step": 135357, "epoch": 3222} {"train_loss": -6.784689903259277, "global_step": 135358, "epoch": 3222} {"train_loss": -6.744145393371582, "global_step": 135359, "epoch": 3222} {"train_loss": -6.740818977355957, "global_step": 135360, "epoch": 3222} {"train_loss": -6.717764854431152, "global_step": 135361, "epoch": 3222} {"train_loss": -6.566927909851074, "global_step": 135362, "epoch": 3222} {"train_loss": -6.799871921539307, "global_step": 135363, "epoch": 3222} {"train_loss": -6.6248674392700195, "global_step": 135364, "epoch": 3222} {"train_loss": -6.704348473321824, "global_step": 135365, "epoch": 3222, "val_loss": 68263.8828125} {"train_loss": -6.743446350097656, "global_step": 135366, "epoch": 3223} {"train_loss": -6.757566928863525, "global_step": 135367, "epoch": 3223} {"train_loss": -6.608274936676025, "global_step": 135368, "epoch": 3223} {"train_loss": -6.650848388671875, "global_step": 135369, "epoch": 3223} {"train_loss": -6.783797264099121, "global_step": 135370, "epoch": 3223} {"train_loss": -6.685279846191406, "global_step": 135371, "epoch": 3223} {"train_loss": -6.687866687774658, "global_step": 135372, "epoch": 3223} {"train_loss": -6.556586265563965, "global_step": 135373, "epoch": 3223} {"train_loss": -6.636309623718262, "global_step": 135374, "epoch": 3223} {"train_loss": -6.620915412902832, "global_step": 135375, "epoch": 3223} {"train_loss": -6.524272918701172, "global_step": 135376, "epoch": 3223} {"train_loss": -6.737452507019043, "global_step": 135377, "epoch": 3223} {"train_loss": -6.626855850219727, "global_step": 135378, "epoch": 3223} {"train_loss": -6.575637340545654, "global_step": 135379, "epoch": 3223} {"train_loss": -6.612574577331543, "global_step": 135380, "epoch": 3223} {"train_loss": -6.646442413330078, "global_step": 135381, "epoch": 3223} {"train_loss": -6.767834663391113, "global_step": 135382, "epoch": 3223} {"train_loss": -6.7215142250061035, "global_step": 135383, "epoch": 3223} {"train_loss": -6.708807945251465, "global_step": 135384, "epoch": 3223} {"train_loss": -6.730238914489746, "global_step": 135385, "epoch": 3223} {"train_loss": -6.6562724113464355, "global_step": 135386, "epoch": 3223} {"train_loss": -6.680459976196289, "global_step": 135387, "epoch": 3223} {"train_loss": -6.637679100036621, "global_step": 135388, "epoch": 3223} {"train_loss": -6.652047157287598, "global_step": 135389, "epoch": 3223} {"train_loss": -6.629680633544922, "global_step": 135390, "epoch": 3223} {"train_loss": -6.709902763366699, "global_step": 135391, "epoch": 3223} {"train_loss": -6.804933547973633, "global_step": 135392, "epoch": 3223} {"train_loss": -6.674243450164795, "global_step": 135393, "epoch": 3223} {"train_loss": -6.536772727966309, "global_step": 135394, "epoch": 3223} {"train_loss": -6.665956497192383, "global_step": 135395, "epoch": 3223} {"train_loss": -6.722108840942383, "global_step": 135396, "epoch": 3223} {"train_loss": -6.64164924621582, "global_step": 135397, "epoch": 3223} {"train_loss": -6.668752670288086, "global_step": 135398, "epoch": 3223} {"train_loss": -6.719270706176758, "global_step": 135399, "epoch": 3223} {"train_loss": -6.783697128295898, "global_step": 135400, "epoch": 3223} {"train_loss": -6.581629753112793, "global_step": 135401, "epoch": 3223} {"train_loss": -6.64569616317749, "global_step": 135402, "epoch": 3223} {"train_loss": -6.722589015960693, "global_step": 135403, "epoch": 3223} {"train_loss": -6.709346294403076, "global_step": 135404, "epoch": 3223} {"train_loss": -6.737547874450684, "global_step": 135405, "epoch": 3223} {"train_loss": -6.586347579956055, "global_step": 135406, "epoch": 3223} {"train_loss": -6.669610102971395, "global_step": 135407, "epoch": 3223, "val_loss": 68203.171875} {"train_loss": -6.578534126281738, "global_step": 135408, "epoch": 3224} {"train_loss": -6.565426826477051, "global_step": 135409, "epoch": 3224} {"train_loss": -6.679710865020752, "global_step": 135410, "epoch": 3224} {"train_loss": -6.6993913650512695, "global_step": 135411, "epoch": 3224} {"train_loss": -6.6015520095825195, "global_step": 135412, "epoch": 3224} {"train_loss": -6.548116683959961, "global_step": 135413, "epoch": 3224} {"train_loss": -6.590515613555908, "global_step": 135414, "epoch": 3224} {"train_loss": -6.628026962280273, "global_step": 135415, "epoch": 3224} {"train_loss": -6.596768379211426, "global_step": 135416, "epoch": 3224} {"train_loss": -6.653322219848633, "global_step": 135417, "epoch": 3224} {"train_loss": -6.610831260681152, "global_step": 135418, "epoch": 3224} {"train_loss": -6.578183174133301, "global_step": 135419, "epoch": 3224} {"train_loss": -6.655344009399414, "global_step": 135420, "epoch": 3224} {"train_loss": -6.670063018798828, "global_step": 135421, "epoch": 3224} {"train_loss": -6.646900177001953, "global_step": 135422, "epoch": 3224} {"train_loss": -6.630923271179199, "global_step": 135423, "epoch": 3224} {"train_loss": -6.640284538269043, "global_step": 135424, "epoch": 3224} {"train_loss": -6.612278938293457, "global_step": 135425, "epoch": 3224} {"train_loss": -6.667417526245117, "global_step": 135426, "epoch": 3224} {"train_loss": -6.612001419067383, "global_step": 135427, "epoch": 3224} {"train_loss": -6.615348815917969, "global_step": 135428, "epoch": 3224} {"train_loss": -6.786666393280029, "global_step": 135429, "epoch": 3224} {"train_loss": -6.51042366027832, "global_step": 135430, "epoch": 3224} {"train_loss": -6.715897560119629, "global_step": 135431, "epoch": 3224} {"train_loss": -6.629491806030273, "global_step": 135432, "epoch": 3224} {"train_loss": -6.65275239944458, "global_step": 135433, "epoch": 3224} {"train_loss": -6.628863334655762, "global_step": 135434, "epoch": 3224} {"train_loss": -6.570583343505859, "global_step": 135435, "epoch": 3224} {"train_loss": -6.809138298034668, "global_step": 135436, "epoch": 3224} {"train_loss": -6.67936897277832, "global_step": 135437, "epoch": 3224} {"train_loss": -6.683441162109375, "global_step": 135438, "epoch": 3224} {"train_loss": -6.626650333404541, "global_step": 135439, "epoch": 3224} {"train_loss": -6.715692520141602, "global_step": 135440, "epoch": 3224} {"train_loss": -6.676478385925293, "global_step": 135441, "epoch": 3224} {"train_loss": -6.638004779815674, "global_step": 135442, "epoch": 3224} {"train_loss": -6.736159324645996, "global_step": 135443, "epoch": 3224} {"train_loss": -6.617097854614258, "global_step": 135444, "epoch": 3224} {"train_loss": -6.651871204376221, "global_step": 135445, "epoch": 3224} {"train_loss": -6.63810920715332, "global_step": 135446, "epoch": 3224} {"train_loss": -6.640390396118164, "global_step": 135447, "epoch": 3224} {"train_loss": -6.6841583251953125, "global_step": 135448, "epoch": 3224} {"train_loss": -6.6434731142861505, "global_step": 135449, "epoch": 3224, "val_loss": 68144.0390625} {"train_loss": -6.677496910095215, "global_step": 135450, "epoch": 3225} {"train_loss": -6.626458644866943, "global_step": 135451, "epoch": 3225} {"train_loss": -6.714542388916016, "global_step": 135452, "epoch": 3225} {"train_loss": -6.624563217163086, "global_step": 135453, "epoch": 3225} {"train_loss": -6.680512428283691, "global_step": 135454, "epoch": 3225} {"train_loss": -6.729606628417969, "global_step": 135455, "epoch": 3225} {"train_loss": -6.741018772125244, "global_step": 135456, "epoch": 3225} {"train_loss": -6.7884979248046875, "global_step": 135457, "epoch": 3225} {"train_loss": -6.6898884773254395, "global_step": 135458, "epoch": 3225} {"train_loss": -6.640560150146484, "global_step": 135459, "epoch": 3225} {"train_loss": -6.667119026184082, "global_step": 135460, "epoch": 3225} {"train_loss": -6.6886420249938965, "global_step": 135461, "epoch": 3225} {"train_loss": -6.749226093292236, "global_step": 135462, "epoch": 3225} {"train_loss": -6.829098701477051, "global_step": 135463, "epoch": 3225} {"train_loss": -6.748801231384277, "global_step": 135464, "epoch": 3225} {"train_loss": -6.803075790405273, "global_step": 135465, "epoch": 3225} {"train_loss": -6.706306457519531, "global_step": 135466, "epoch": 3225} {"train_loss": -6.729844093322754, "global_step": 135467, "epoch": 3225} {"train_loss": -6.76851224899292, "global_step": 135468, "epoch": 3225} {"train_loss": -6.707742691040039, "global_step": 135469, "epoch": 3225} {"train_loss": -6.655317306518555, "global_step": 135470, "epoch": 3225} {"train_loss": -6.765635013580322, "global_step": 135471, "epoch": 3225} {"train_loss": -6.607706069946289, "global_step": 135472, "epoch": 3225} {"train_loss": -6.717348098754883, "global_step": 135473, "epoch": 3225} {"train_loss": -6.757412910461426, "global_step": 135474, "epoch": 3225} {"train_loss": -6.613832950592041, "global_step": 135475, "epoch": 3225} {"train_loss": -6.636445045471191, "global_step": 135476, "epoch": 3225} {"train_loss": -6.807004928588867, "global_step": 135477, "epoch": 3225} {"train_loss": -6.792046070098877, "global_step": 135478, "epoch": 3225} {"train_loss": -6.7428436279296875, "global_step": 135479, "epoch": 3225} {"train_loss": -6.685234069824219, "global_step": 135480, "epoch": 3225} {"train_loss": -6.6654205322265625, "global_step": 135481, "epoch": 3225} {"train_loss": -6.673152446746826, "global_step": 135482, "epoch": 3225} {"train_loss": -6.6090989112854, "global_step": 135483, "epoch": 3225} {"train_loss": -6.670858383178711, "global_step": 135484, "epoch": 3225} {"train_loss": -6.7015228271484375, "global_step": 135485, "epoch": 3225} {"train_loss": -6.671666145324707, "global_step": 135486, "epoch": 3225} {"train_loss": -6.771139144897461, "global_step": 135487, "epoch": 3225} {"train_loss": -6.583970069885254, "global_step": 135488, "epoch": 3225} {"train_loss": -6.710188865661621, "global_step": 135489, "epoch": 3225} {"train_loss": -6.701821327209473, "global_step": 135490, "epoch": 3225} {"train_loss": -6.70222696803865, "global_step": 135491, "epoch": 3225, "val_loss": 68241.8046875} {"train_loss": -6.652242660522461, "global_step": 135492, "epoch": 3226} {"train_loss": -6.765547752380371, "global_step": 135493, "epoch": 3226} {"train_loss": -6.685117244720459, "global_step": 135494, "epoch": 3226} {"train_loss": -6.711861610412598, "global_step": 135495, "epoch": 3226} {"train_loss": -6.749730110168457, "global_step": 135496, "epoch": 3226} {"train_loss": -6.678166389465332, "global_step": 135497, "epoch": 3226} {"train_loss": -6.677853107452393, "global_step": 135498, "epoch": 3226} {"train_loss": -6.718020439147949, "global_step": 135499, "epoch": 3226} {"train_loss": -6.645315170288086, "global_step": 135500, "epoch": 3226} {"train_loss": -6.612444877624512, "global_step": 135501, "epoch": 3226} {"train_loss": -6.640931129455566, "global_step": 135502, "epoch": 3226} {"train_loss": -6.785964012145996, "global_step": 135503, "epoch": 3226} {"train_loss": -6.7682695388793945, "global_step": 135504, "epoch": 3226} {"train_loss": -6.639050483703613, "global_step": 135505, "epoch": 3226} {"train_loss": -6.767611503601074, "global_step": 135506, "epoch": 3226} {"train_loss": -6.730965614318848, "global_step": 135507, "epoch": 3226} {"train_loss": -6.684545516967773, "global_step": 135508, "epoch": 3226} {"train_loss": -6.676058769226074, "global_step": 135509, "epoch": 3226} {"train_loss": -6.711511135101318, "global_step": 135510, "epoch": 3226} {"train_loss": -6.767238616943359, "global_step": 135511, "epoch": 3226} {"train_loss": -6.662116050720215, "global_step": 135512, "epoch": 3226} {"train_loss": -6.670642852783203, "global_step": 135513, "epoch": 3226} {"train_loss": -6.777194023132324, "global_step": 135514, "epoch": 3226} {"train_loss": -6.690254211425781, "global_step": 135515, "epoch": 3226} {"train_loss": -6.700319766998291, "global_step": 135516, "epoch": 3226} {"train_loss": -6.794433116912842, "global_step": 135517, "epoch": 3226} {"train_loss": -6.6628007888793945, "global_step": 135518, "epoch": 3226} {"train_loss": -6.689372539520264, "global_step": 135519, "epoch": 3226} {"train_loss": -6.762550354003906, "global_step": 135520, "epoch": 3226} {"train_loss": -6.767182350158691, "global_step": 135521, "epoch": 3226} {"train_loss": -6.7441182136535645, "global_step": 135522, "epoch": 3226} {"train_loss": -6.726536273956299, "global_step": 135523, "epoch": 3226} {"train_loss": -6.626916408538818, "global_step": 135524, "epoch": 3226} {"train_loss": -6.630203723907471, "global_step": 135525, "epoch": 3226} {"train_loss": -6.62159538269043, "global_step": 135526, "epoch": 3226} {"train_loss": -6.664817810058594, "global_step": 135527, "epoch": 3226} {"train_loss": -6.657244682312012, "global_step": 135528, "epoch": 3226} {"train_loss": -6.758332252502441, "global_step": 135529, "epoch": 3226} {"train_loss": -6.728785514831543, "global_step": 135530, "epoch": 3226} {"train_loss": -6.624871730804443, "global_step": 135531, "epoch": 3226} {"train_loss": -6.603763103485107, "global_step": 135532, "epoch": 3226} {"train_loss": -6.695824316569737, "global_step": 135533, "epoch": 3226, "val_loss": 68183.0234375} {"train_loss": -6.6160688400268555, "global_step": 135534, "epoch": 3227} {"train_loss": -6.7038774490356445, "global_step": 135535, "epoch": 3227} {"train_loss": -6.723134994506836, "global_step": 135536, "epoch": 3227} {"train_loss": -6.777083396911621, "global_step": 135537, "epoch": 3227} {"train_loss": -6.5882158279418945, "global_step": 135538, "epoch": 3227} {"train_loss": -6.790999412536621, "global_step": 135539, "epoch": 3227} {"train_loss": -6.709632873535156, "global_step": 135540, "epoch": 3227} {"train_loss": -6.6725006103515625, "global_step": 135541, "epoch": 3227} {"train_loss": -6.743374824523926, "global_step": 135542, "epoch": 3227} {"train_loss": -6.660690784454346, "global_step": 135543, "epoch": 3227} {"train_loss": -6.7070512771606445, "global_step": 135544, "epoch": 3227} {"train_loss": -6.676541328430176, "global_step": 135545, "epoch": 3227} {"train_loss": -6.638799667358398, "global_step": 135546, "epoch": 3227} {"train_loss": -6.716957092285156, "global_step": 135547, "epoch": 3227} {"train_loss": -6.583037853240967, "global_step": 135548, "epoch": 3227} {"train_loss": -6.522480010986328, "global_step": 135549, "epoch": 3227} {"train_loss": -6.623082160949707, "global_step": 135550, "epoch": 3227} {"train_loss": -6.7225165367126465, "global_step": 135551, "epoch": 3227} {"train_loss": -6.712524890899658, "global_step": 135552, "epoch": 3227} {"train_loss": -6.691622257232666, "global_step": 135553, "epoch": 3227} {"train_loss": -6.6224212646484375, "global_step": 135554, "epoch": 3227} {"train_loss": -6.726601600646973, "global_step": 135555, "epoch": 3227} {"train_loss": -6.610710144042969, "global_step": 135556, "epoch": 3227} {"train_loss": -6.720121383666992, "global_step": 135557, "epoch": 3227} {"train_loss": -6.773916244506836, "global_step": 135558, "epoch": 3227} {"train_loss": -6.763009071350098, "global_step": 135559, "epoch": 3227} {"train_loss": -6.6679768562316895, "global_step": 135560, "epoch": 3227} {"train_loss": -6.717440605163574, "global_step": 135561, "epoch": 3227} {"train_loss": -6.646787643432617, "global_step": 135562, "epoch": 3227} {"train_loss": -6.720580101013184, "global_step": 135563, "epoch": 3227} {"train_loss": -6.749273300170898, "global_step": 135564, "epoch": 3227} {"train_loss": -6.81921911239624, "global_step": 135565, "epoch": 3227} {"train_loss": -6.710629463195801, "global_step": 135566, "epoch": 3227} {"train_loss": -6.657642364501953, "global_step": 135567, "epoch": 3227} {"train_loss": -6.679844856262207, "global_step": 135568, "epoch": 3227} {"train_loss": -6.68602180480957, "global_step": 135569, "epoch": 3227} {"train_loss": -6.595556259155273, "global_step": 135570, "epoch": 3227} {"train_loss": -6.602949619293213, "global_step": 135571, "epoch": 3227} {"train_loss": -6.585484027862549, "global_step": 135572, "epoch": 3227} {"train_loss": -6.717148303985596, "global_step": 135573, "epoch": 3227} {"train_loss": -6.594442367553711, "global_step": 135574, "epoch": 3227} {"train_loss": -6.6811864376068115, "global_step": 135575, "epoch": 3227, "val_loss": 68319.9375} {"train_loss": -6.636680603027344, "global_step": 135576, "epoch": 3228} {"train_loss": -6.650291919708252, "global_step": 135577, "epoch": 3228} {"train_loss": -6.815642356872559, "global_step": 135578, "epoch": 3228} {"train_loss": -6.7317214012146, "global_step": 135579, "epoch": 3228} {"train_loss": -6.667659282684326, "global_step": 135580, "epoch": 3228} {"train_loss": -6.6395463943481445, "global_step": 135581, "epoch": 3228} {"train_loss": -6.669419288635254, "global_step": 135582, "epoch": 3228} {"train_loss": -6.7717485427856445, "global_step": 135583, "epoch": 3228} {"train_loss": -6.680856704711914, "global_step": 135584, "epoch": 3228} {"train_loss": -6.630005359649658, "global_step": 135585, "epoch": 3228} {"train_loss": -6.733528137207031, "global_step": 135586, "epoch": 3228} {"train_loss": -6.650494575500488, "global_step": 135587, "epoch": 3228} {"train_loss": -6.756608963012695, "global_step": 135588, "epoch": 3228} {"train_loss": -6.650218963623047, "global_step": 135589, "epoch": 3228} {"train_loss": -6.605531215667725, "global_step": 135590, "epoch": 3228} {"train_loss": -6.548601150512695, "global_step": 135591, "epoch": 3228} {"train_loss": -6.785521507263184, "global_step": 135592, "epoch": 3228} {"train_loss": -6.661705017089844, "global_step": 135593, "epoch": 3228} {"train_loss": -6.554012775421143, "global_step": 135594, "epoch": 3228} {"train_loss": -6.782454490661621, "global_step": 135595, "epoch": 3228} {"train_loss": -6.8265252113342285, "global_step": 135596, "epoch": 3228} {"train_loss": -6.724221229553223, "global_step": 135597, "epoch": 3228} {"train_loss": -6.604598045349121, "global_step": 135598, "epoch": 3228} {"train_loss": -6.694594383239746, "global_step": 135599, "epoch": 3228} {"train_loss": -6.804903984069824, "global_step": 135600, "epoch": 3228} {"train_loss": -6.678881645202637, "global_step": 135601, "epoch": 3228} {"train_loss": -6.585134983062744, "global_step": 135602, "epoch": 3228} {"train_loss": -6.609706878662109, "global_step": 135603, "epoch": 3228} {"train_loss": -6.580972194671631, "global_step": 135604, "epoch": 3228} {"train_loss": -6.6142578125, "global_step": 135605, "epoch": 3228} {"train_loss": -6.690978050231934, "global_step": 135606, "epoch": 3228} {"train_loss": -6.731612205505371, "global_step": 135607, "epoch": 3228} {"train_loss": -6.661150932312012, "global_step": 135608, "epoch": 3228} {"train_loss": -6.773994445800781, "global_step": 135609, "epoch": 3228} {"train_loss": -6.703993320465088, "global_step": 135610, "epoch": 3228} {"train_loss": -6.754096031188965, "global_step": 135611, "epoch": 3228} {"train_loss": -6.543440341949463, "global_step": 135612, "epoch": 3228} {"train_loss": -6.725301742553711, "global_step": 135613, "epoch": 3228} {"train_loss": -6.637060642242432, "global_step": 135614, "epoch": 3228} {"train_loss": -6.723866939544678, "global_step": 135615, "epoch": 3228} {"train_loss": -6.767876148223877, "global_step": 135616, "epoch": 3228} {"train_loss": -6.685563235055833, "global_step": 135617, "epoch": 3228, "val_loss": 68413.3515625} {"train_loss": -6.63604736328125, "global_step": 135618, "epoch": 3229} {"train_loss": -6.688715934753418, "global_step": 135619, "epoch": 3229} {"train_loss": -6.561624526977539, "global_step": 135620, "epoch": 3229} {"train_loss": -6.5796403884887695, "global_step": 135621, "epoch": 3229} {"train_loss": -6.697308540344238, "global_step": 135622, "epoch": 3229} {"train_loss": -6.707063674926758, "global_step": 135623, "epoch": 3229} {"train_loss": -6.589315414428711, "global_step": 135624, "epoch": 3229} {"train_loss": -6.656761169433594, "global_step": 135625, "epoch": 3229} {"train_loss": -6.704413414001465, "global_step": 135626, "epoch": 3229} {"train_loss": -6.812646865844727, "global_step": 135627, "epoch": 3229} {"train_loss": -6.583649635314941, "global_step": 135628, "epoch": 3229} {"train_loss": -6.670875072479248, "global_step": 135629, "epoch": 3229} {"train_loss": -6.7150373458862305, "global_step": 135630, "epoch": 3229} {"train_loss": -6.619399070739746, "global_step": 135631, "epoch": 3229} {"train_loss": -6.7025346755981445, "global_step": 135632, "epoch": 3229} {"train_loss": -6.733516693115234, "global_step": 135633, "epoch": 3229} {"train_loss": -6.558969497680664, "global_step": 135634, "epoch": 3229} {"train_loss": -6.595574855804443, "global_step": 135635, "epoch": 3229} {"train_loss": -6.6236796379089355, "global_step": 135636, "epoch": 3229} {"train_loss": -6.679379463195801, "global_step": 135637, "epoch": 3229} {"train_loss": -6.651294708251953, "global_step": 135638, "epoch": 3229} {"train_loss": -6.680803298950195, "global_step": 135639, "epoch": 3229} {"train_loss": -6.705899715423584, "global_step": 135640, "epoch": 3229} {"train_loss": -6.780120849609375, "global_step": 135641, "epoch": 3229} {"train_loss": -6.717408180236816, "global_step": 135642, "epoch": 3229} {"train_loss": -6.698841094970703, "global_step": 135643, "epoch": 3229} {"train_loss": -6.766411781311035, "global_step": 135644, "epoch": 3229} {"train_loss": -6.677512168884277, "global_step": 135645, "epoch": 3229} {"train_loss": -6.608586311340332, "global_step": 135646, "epoch": 3229} {"train_loss": -6.595770835876465, "global_step": 135647, "epoch": 3229} {"train_loss": -6.586583137512207, "global_step": 135648, "epoch": 3229} {"train_loss": -6.677701473236084, "global_step": 135649, "epoch": 3229} {"train_loss": -6.649863243103027, "global_step": 135650, "epoch": 3229} {"train_loss": -6.611832618713379, "global_step": 135651, "epoch": 3229} {"train_loss": -6.790921211242676, "global_step": 135652, "epoch": 3229} {"train_loss": -6.811748504638672, "global_step": 135653, "epoch": 3229} {"train_loss": -6.698343276977539, "global_step": 135654, "epoch": 3229} {"train_loss": -6.724963665008545, "global_step": 135655, "epoch": 3229} {"train_loss": -6.744129657745361, "global_step": 135656, "epoch": 3229} {"train_loss": -6.690568447113037, "global_step": 135657, "epoch": 3229} {"train_loss": -6.716300010681152, "global_step": 135658, "epoch": 3229} {"train_loss": -6.676172914959135, "global_step": 135659, "epoch": 3229, "val_loss": 68349.6328125} {"train_loss": -6.744993686676025, "global_step": 135660, "epoch": 3230} {"train_loss": -6.703977584838867, "global_step": 135661, "epoch": 3230} {"train_loss": -6.684114933013916, "global_step": 135662, "epoch": 3230} {"train_loss": -6.634304046630859, "global_step": 135663, "epoch": 3230} {"train_loss": -6.764621734619141, "global_step": 135664, "epoch": 3230} {"train_loss": -6.71599006652832, "global_step": 135665, "epoch": 3230} {"train_loss": -6.574197769165039, "global_step": 135666, "epoch": 3230} {"train_loss": -6.587161540985107, "global_step": 135667, "epoch": 3230} {"train_loss": -6.6459856033325195, "global_step": 135668, "epoch": 3230} {"train_loss": -6.860816478729248, "global_step": 135669, "epoch": 3230} {"train_loss": -6.669860363006592, "global_step": 135670, "epoch": 3230} {"train_loss": -6.843054294586182, "global_step": 135671, "epoch": 3230} {"train_loss": -6.71628475189209, "global_step": 135672, "epoch": 3230} {"train_loss": -6.61692476272583, "global_step": 135673, "epoch": 3230} {"train_loss": -6.696488380432129, "global_step": 135674, "epoch": 3230} {"train_loss": -6.722240447998047, "global_step": 135675, "epoch": 3230} {"train_loss": -6.636558532714844, "global_step": 135676, "epoch": 3230} {"train_loss": -6.757973670959473, "global_step": 135677, "epoch": 3230} {"train_loss": -6.617591381072998, "global_step": 135678, "epoch": 3230} {"train_loss": -6.662609577178955, "global_step": 135679, "epoch": 3230} {"train_loss": -6.65726900100708, "global_step": 135680, "epoch": 3230} {"train_loss": -6.802165508270264, "global_step": 135681, "epoch": 3230} {"train_loss": -6.7281951904296875, "global_step": 135682, "epoch": 3230} {"train_loss": -6.589631080627441, "global_step": 135683, "epoch": 3230} {"train_loss": -6.708776473999023, "global_step": 135684, "epoch": 3230} {"train_loss": -6.672300338745117, "global_step": 135685, "epoch": 3230} {"train_loss": -6.607487201690674, "global_step": 135686, "epoch": 3230} {"train_loss": -6.681196212768555, "global_step": 135687, "epoch": 3230} {"train_loss": -6.697917461395264, "global_step": 135688, "epoch": 3230} {"train_loss": -6.6237640380859375, "global_step": 135689, "epoch": 3230} {"train_loss": -6.761926651000977, "global_step": 135690, "epoch": 3230} {"train_loss": -6.663710594177246, "global_step": 135691, "epoch": 3230} {"train_loss": -6.680612087249756, "global_step": 135692, "epoch": 3230} {"train_loss": -6.781947135925293, "global_step": 135693, "epoch": 3230} {"train_loss": -6.67586612701416, "global_step": 135694, "epoch": 3230} {"train_loss": -6.703876495361328, "global_step": 135695, "epoch": 3230} {"train_loss": -6.693475246429443, "global_step": 135696, "epoch": 3230} {"train_loss": -6.697953224182129, "global_step": 135697, "epoch": 3230} {"train_loss": -6.656424522399902, "global_step": 135698, "epoch": 3230} {"train_loss": -6.754720211029053, "global_step": 135699, "epoch": 3230} {"train_loss": -6.648952484130859, "global_step": 135700, "epoch": 3230} {"train_loss": -6.690238918576922, "global_step": 135701, "epoch": 3230, "val_loss": 68334.828125} {"train_loss": -6.738071441650391, "global_step": 135702, "epoch": 3231} {"train_loss": -6.712028980255127, "global_step": 135703, "epoch": 3231} {"train_loss": -6.6339263916015625, "global_step": 135704, "epoch": 3231} {"train_loss": -6.699463844299316, "global_step": 135705, "epoch": 3231} {"train_loss": -6.744912147521973, "global_step": 135706, "epoch": 3231} {"train_loss": -6.7125372886657715, "global_step": 135707, "epoch": 3231} {"train_loss": -6.71368408203125, "global_step": 135708, "epoch": 3231} {"train_loss": -6.701038360595703, "global_step": 135709, "epoch": 3231} {"train_loss": -6.735724449157715, "global_step": 135710, "epoch": 3231} {"train_loss": -6.714354038238525, "global_step": 135711, "epoch": 3231} {"train_loss": -6.65665864944458, "global_step": 135712, "epoch": 3231} {"train_loss": -6.662599563598633, "global_step": 135713, "epoch": 3231} {"train_loss": -6.702940940856934, "global_step": 135714, "epoch": 3231} {"train_loss": -6.715917587280273, "global_step": 135715, "epoch": 3231} {"train_loss": -6.611651420593262, "global_step": 135716, "epoch": 3231} {"train_loss": -6.7417073249816895, "global_step": 135717, "epoch": 3231} {"train_loss": -6.622043609619141, "global_step": 135718, "epoch": 3231} {"train_loss": -6.588064193725586, "global_step": 135719, "epoch": 3231} {"train_loss": -6.672183990478516, "global_step": 135720, "epoch": 3231} {"train_loss": -6.649012565612793, "global_step": 135721, "epoch": 3231} {"train_loss": -6.658637046813965, "global_step": 135722, "epoch": 3231} {"train_loss": -6.699051380157471, "global_step": 135723, "epoch": 3231} {"train_loss": -6.554101467132568, "global_step": 135724, "epoch": 3231} {"train_loss": -6.754430294036865, "global_step": 135725, "epoch": 3231} {"train_loss": -6.681099891662598, "global_step": 135726, "epoch": 3231} {"train_loss": -6.656402587890625, "global_step": 135727, "epoch": 3231} {"train_loss": -6.676662921905518, "global_step": 135728, "epoch": 3231} {"train_loss": -6.773322105407715, "global_step": 135729, "epoch": 3231} {"train_loss": -6.6819915771484375, "global_step": 135730, "epoch": 3231} {"train_loss": -6.673529624938965, "global_step": 135731, "epoch": 3231} {"train_loss": -6.79396915435791, "global_step": 135732, "epoch": 3231} {"train_loss": -6.634012222290039, "global_step": 135733, "epoch": 3231} {"train_loss": -6.735561847686768, "global_step": 135734, "epoch": 3231} {"train_loss": -6.742375373840332, "global_step": 135735, "epoch": 3231} {"train_loss": -6.64553689956665, "global_step": 135736, "epoch": 3231} {"train_loss": -6.674469947814941, "global_step": 135737, "epoch": 3231} {"train_loss": -6.742328643798828, "global_step": 135738, "epoch": 3231} {"train_loss": -6.661628246307373, "global_step": 135739, "epoch": 3231} {"train_loss": -6.742847442626953, "global_step": 135740, "epoch": 3231} {"train_loss": -6.657192230224609, "global_step": 135741, "epoch": 3231} {"train_loss": -6.788286209106445, "global_step": 135742, "epoch": 3231} {"train_loss": -6.694320837656657, "global_step": 135743, "epoch": 3231, "val_loss": 68269.03125} {"train_loss": -6.760834217071533, "global_step": 135744, "epoch": 3232} {"train_loss": -6.691024303436279, "global_step": 135745, "epoch": 3232} {"train_loss": -6.648833751678467, "global_step": 135746, "epoch": 3232} {"train_loss": -6.725167274475098, "global_step": 135747, "epoch": 3232} {"train_loss": -6.670014381408691, "global_step": 135748, "epoch": 3232} {"train_loss": -6.675593376159668, "global_step": 135749, "epoch": 3232} {"train_loss": -6.720078468322754, "global_step": 135750, "epoch": 3232} {"train_loss": -6.603724956512451, "global_step": 135751, "epoch": 3232} {"train_loss": -6.6750335693359375, "global_step": 135752, "epoch": 3232} {"train_loss": -6.682962417602539, "global_step": 135753, "epoch": 3232} {"train_loss": -6.655381202697754, "global_step": 135754, "epoch": 3232} {"train_loss": -6.655429840087891, "global_step": 135755, "epoch": 3232} {"train_loss": -6.559292793273926, "global_step": 135756, "epoch": 3232} {"train_loss": -6.755473613739014, "global_step": 135757, "epoch": 3232} {"train_loss": -6.4825439453125, "global_step": 135758, "epoch": 3232} {"train_loss": -6.679372787475586, "global_step": 135759, "epoch": 3232} {"train_loss": -6.563741683959961, "global_step": 135760, "epoch": 3232} {"train_loss": -6.573134422302246, "global_step": 135761, "epoch": 3232} {"train_loss": -6.626605987548828, "global_step": 135762, "epoch": 3232} {"train_loss": -6.677990913391113, "global_step": 135763, "epoch": 3232} {"train_loss": -6.6666364669799805, "global_step": 135764, "epoch": 3232} {"train_loss": -6.675524711608887, "global_step": 135765, "epoch": 3232} {"train_loss": -6.625088691711426, "global_step": 135766, "epoch": 3232} {"train_loss": -6.569660663604736, "global_step": 135767, "epoch": 3232} {"train_loss": -6.5760908126831055, "global_step": 135768, "epoch": 3232} {"train_loss": -6.622654914855957, "global_step": 135769, "epoch": 3232} {"train_loss": -6.645207405090332, "global_step": 135770, "epoch": 3232} {"train_loss": -6.479246616363525, "global_step": 135771, "epoch": 3232} {"train_loss": -6.624683380126953, "global_step": 135772, "epoch": 3232} {"train_loss": -6.585336208343506, "global_step": 135773, "epoch": 3232} {"train_loss": -6.655755996704102, "global_step": 135774, "epoch": 3232} {"train_loss": -6.710980415344238, "global_step": 135775, "epoch": 3232} {"train_loss": -6.769604682922363, "global_step": 135776, "epoch": 3232} {"train_loss": -6.691194534301758, "global_step": 135777, "epoch": 3232} {"train_loss": -6.608498573303223, "global_step": 135778, "epoch": 3232} {"train_loss": -6.681460380554199, "global_step": 135779, "epoch": 3232} {"train_loss": -6.727663993835449, "global_step": 135780, "epoch": 3232} {"train_loss": -6.630948066711426, "global_step": 135781, "epoch": 3232} {"train_loss": -6.574816703796387, "global_step": 135782, "epoch": 3232} {"train_loss": -6.585498809814453, "global_step": 135783, "epoch": 3232} {"train_loss": -6.64985466003418, "global_step": 135784, "epoch": 3232} {"train_loss": -6.643017519088018, "global_step": 135785, "epoch": 3232, "val_loss": 68352.6953125} {"train_loss": -6.621053695678711, "global_step": 135786, "epoch": 3233} {"train_loss": -6.701750755310059, "global_step": 135787, "epoch": 3233} {"train_loss": -6.826451301574707, "global_step": 135788, "epoch": 3233} {"train_loss": -6.6571502685546875, "global_step": 135789, "epoch": 3233} {"train_loss": -6.703249454498291, "global_step": 135790, "epoch": 3233} {"train_loss": -6.627715110778809, "global_step": 135791, "epoch": 3233} {"train_loss": -6.618010997772217, "global_step": 135792, "epoch": 3233} {"train_loss": -6.83261775970459, "global_step": 135793, "epoch": 3233} {"train_loss": -6.773618698120117, "global_step": 135794, "epoch": 3233} {"train_loss": -6.65717077255249, "global_step": 135795, "epoch": 3233} {"train_loss": -6.679504871368408, "global_step": 135796, "epoch": 3233} {"train_loss": -6.720587730407715, "global_step": 135797, "epoch": 3233} {"train_loss": -6.580561637878418, "global_step": 135798, "epoch": 3233} {"train_loss": -6.611854553222656, "global_step": 135799, "epoch": 3233} {"train_loss": -6.768502235412598, "global_step": 135800, "epoch": 3233} {"train_loss": -6.725959777832031, "global_step": 135801, "epoch": 3233} {"train_loss": -6.746732711791992, "global_step": 135802, "epoch": 3233} {"train_loss": -6.631449222564697, "global_step": 135803, "epoch": 3233} {"train_loss": -6.685661315917969, "global_step": 135804, "epoch": 3233} {"train_loss": -6.721162796020508, "global_step": 135805, "epoch": 3233} {"train_loss": -6.745893478393555, "global_step": 135806, "epoch": 3233} {"train_loss": -6.662775039672852, "global_step": 135807, "epoch": 3233} {"train_loss": -6.7050065994262695, "global_step": 135808, "epoch": 3233} {"train_loss": -6.667860984802246, "global_step": 135809, "epoch": 3233} {"train_loss": -6.650713920593262, "global_step": 135810, "epoch": 3233} {"train_loss": -6.672250270843506, "global_step": 135811, "epoch": 3233} {"train_loss": -6.615902900695801, "global_step": 135812, "epoch": 3233} {"train_loss": -6.744467258453369, "global_step": 135813, "epoch": 3233} {"train_loss": -6.634512901306152, "global_step": 135814, "epoch": 3233} {"train_loss": -6.749807357788086, "global_step": 135815, "epoch": 3233} {"train_loss": -6.714720249176025, "global_step": 135816, "epoch": 3233} {"train_loss": -6.770520210266113, "global_step": 135817, "epoch": 3233} {"train_loss": -6.629458427429199, "global_step": 135818, "epoch": 3233} {"train_loss": -6.742201805114746, "global_step": 135819, "epoch": 3233} {"train_loss": -6.731316089630127, "global_step": 135820, "epoch": 3233} {"train_loss": -6.613211631774902, "global_step": 135821, "epoch": 3233} {"train_loss": -6.67307186126709, "global_step": 135822, "epoch": 3233} {"train_loss": -6.618532180786133, "global_step": 135823, "epoch": 3233} {"train_loss": -6.570670127868652, "global_step": 135824, "epoch": 3233} {"train_loss": -6.69057035446167, "global_step": 135825, "epoch": 3233} {"train_loss": -6.635929107666016, "global_step": 135826, "epoch": 3233} {"train_loss": -6.684178352355957, "global_step": 135827, "epoch": 3233, "val_loss": 68414.953125} {"train_loss": -6.735123157501221, "global_step": 135828, "epoch": 3234} {"train_loss": -6.608094215393066, "global_step": 135829, "epoch": 3234} {"train_loss": -6.68940544128418, "global_step": 135830, "epoch": 3234} {"train_loss": -6.762605667114258, "global_step": 135831, "epoch": 3234} {"train_loss": -6.611342430114746, "global_step": 135832, "epoch": 3234} {"train_loss": -6.610953330993652, "global_step": 135833, "epoch": 3234} {"train_loss": -6.589870929718018, "global_step": 135834, "epoch": 3234} {"train_loss": -6.637187957763672, "global_step": 135835, "epoch": 3234} {"train_loss": -6.741361618041992, "global_step": 135836, "epoch": 3234} {"train_loss": -6.736055374145508, "global_step": 135837, "epoch": 3234} {"train_loss": -6.748424530029297, "global_step": 135838, "epoch": 3234} {"train_loss": -6.659691333770752, "global_step": 135839, "epoch": 3234} {"train_loss": -6.589433670043945, "global_step": 135840, "epoch": 3234} {"train_loss": -6.763833522796631, "global_step": 135841, "epoch": 3234} {"train_loss": -6.657449245452881, "global_step": 135842, "epoch": 3234} {"train_loss": -6.648266792297363, "global_step": 135843, "epoch": 3234} {"train_loss": -6.759214878082275, "global_step": 135844, "epoch": 3234} {"train_loss": -6.579109191894531, "global_step": 135845, "epoch": 3234} {"train_loss": -6.728171348571777, "global_step": 135846, "epoch": 3234} {"train_loss": -6.669207572937012, "global_step": 135847, "epoch": 3234} {"train_loss": -6.579886436462402, "global_step": 135848, "epoch": 3234} {"train_loss": -6.704687118530273, "global_step": 135849, "epoch": 3234} {"train_loss": -6.796414375305176, "global_step": 135850, "epoch": 3234} {"train_loss": -6.631241321563721, "global_step": 135851, "epoch": 3234} {"train_loss": -6.725139617919922, "global_step": 135852, "epoch": 3234} {"train_loss": -6.703572750091553, "global_step": 135853, "epoch": 3234} {"train_loss": -6.635629653930664, "global_step": 135854, "epoch": 3234} {"train_loss": -6.726334571838379, "global_step": 135855, "epoch": 3234} {"train_loss": -6.570573806762695, "global_step": 135856, "epoch": 3234} {"train_loss": -6.87308406829834, "global_step": 135857, "epoch": 3234} {"train_loss": -6.691572189331055, "global_step": 135858, "epoch": 3234} {"train_loss": -6.649557113647461, "global_step": 135859, "epoch": 3234} {"train_loss": -6.631082534790039, "global_step": 135860, "epoch": 3234} {"train_loss": -6.709341526031494, "global_step": 135861, "epoch": 3234} {"train_loss": -6.790770053863525, "global_step": 135862, "epoch": 3234} {"train_loss": -6.694530010223389, "global_step": 135863, "epoch": 3234} {"train_loss": -6.7036027908325195, "global_step": 135864, "epoch": 3234} {"train_loss": -6.645114421844482, "global_step": 135865, "epoch": 3234} {"train_loss": -6.622056484222412, "global_step": 135866, "epoch": 3234} {"train_loss": -6.608390808105469, "global_step": 135867, "epoch": 3234} {"train_loss": -6.711882591247559, "global_step": 135868, "epoch": 3234} {"train_loss": -6.683717557362148, "global_step": 135869, "epoch": 3234, "val_loss": 68198.796875} {"train_loss": -6.811247825622559, "global_step": 135870, "epoch": 3235} {"train_loss": -6.634363174438477, "global_step": 135871, "epoch": 3235} {"train_loss": -6.651698589324951, "global_step": 135872, "epoch": 3235} {"train_loss": -6.69690465927124, "global_step": 135873, "epoch": 3235} {"train_loss": -6.684906482696533, "global_step": 135874, "epoch": 3235} {"train_loss": -6.692123889923096, "global_step": 135875, "epoch": 3235} {"train_loss": -6.764211654663086, "global_step": 135876, "epoch": 3235} {"train_loss": -6.789260387420654, "global_step": 135877, "epoch": 3235} {"train_loss": -6.6060075759887695, "global_step": 135878, "epoch": 3235} {"train_loss": -6.797593116760254, "global_step": 135879, "epoch": 3235} {"train_loss": -6.724060535430908, "global_step": 135880, "epoch": 3235} {"train_loss": -6.751328468322754, "global_step": 135881, "epoch": 3235} {"train_loss": -6.744900703430176, "global_step": 135882, "epoch": 3235} {"train_loss": -6.530410289764404, "global_step": 135883, "epoch": 3235} {"train_loss": -6.735065460205078, "global_step": 135884, "epoch": 3235} {"train_loss": -6.613880157470703, "global_step": 135885, "epoch": 3235} {"train_loss": -6.533154010772705, "global_step": 135886, "epoch": 3235} {"train_loss": -6.58186149597168, "global_step": 135887, "epoch": 3235} {"train_loss": -6.591187477111816, "global_step": 135888, "epoch": 3235} {"train_loss": -6.678061485290527, "global_step": 135889, "epoch": 3235} {"train_loss": -6.559652328491211, "global_step": 135890, "epoch": 3235} {"train_loss": -6.491682529449463, "global_step": 135891, "epoch": 3235} {"train_loss": -6.578126430511475, "global_step": 135892, "epoch": 3235} {"train_loss": -6.653044700622559, "global_step": 135893, "epoch": 3235} {"train_loss": -6.661624908447266, "global_step": 135894, "epoch": 3235} {"train_loss": -6.593284606933594, "global_step": 135895, "epoch": 3235} {"train_loss": -6.576073169708252, "global_step": 135896, "epoch": 3235} {"train_loss": -6.6782331466674805, "global_step": 135897, "epoch": 3235} {"train_loss": -6.637476444244385, "global_step": 135898, "epoch": 3235} {"train_loss": -6.6770734786987305, "global_step": 135899, "epoch": 3235} {"train_loss": -6.664614677429199, "global_step": 135900, "epoch": 3235} {"train_loss": -6.5873870849609375, "global_step": 135901, "epoch": 3235} {"train_loss": -6.6611247062683105, "global_step": 135902, "epoch": 3235} {"train_loss": -6.630547523498535, "global_step": 135903, "epoch": 3235} {"train_loss": -6.686326026916504, "global_step": 135904, "epoch": 3235} {"train_loss": -6.6914963722229, "global_step": 135905, "epoch": 3235} {"train_loss": -6.677138328552246, "global_step": 135906, "epoch": 3235} {"train_loss": -6.6060028076171875, "global_step": 135907, "epoch": 3235} {"train_loss": -6.722194671630859, "global_step": 135908, "epoch": 3235} {"train_loss": -6.685896873474121, "global_step": 135909, "epoch": 3235} {"train_loss": -6.658390045166016, "global_step": 135910, "epoch": 3235} {"train_loss": -6.660103366488502, "global_step": 135911, "epoch": 3235, "val_loss": 68385.15625} {"train_loss": -6.621349811553955, "global_step": 135912, "epoch": 3236} {"train_loss": -6.7263078689575195, "global_step": 135913, "epoch": 3236} {"train_loss": -6.716556549072266, "global_step": 135914, "epoch": 3236} {"train_loss": -6.619205474853516, "global_step": 135915, "epoch": 3236} {"train_loss": -6.6803789138793945, "global_step": 135916, "epoch": 3236} {"train_loss": -6.658911228179932, "global_step": 135917, "epoch": 3236} {"train_loss": -6.705986022949219, "global_step": 135918, "epoch": 3236} {"train_loss": -6.726374626159668, "global_step": 135919, "epoch": 3236} {"train_loss": -6.68173360824585, "global_step": 135920, "epoch": 3236} {"train_loss": -6.765091896057129, "global_step": 135921, "epoch": 3236} {"train_loss": -6.677152633666992, "global_step": 135922, "epoch": 3236} {"train_loss": -6.595221519470215, "global_step": 135923, "epoch": 3236} {"train_loss": -6.594728469848633, "global_step": 135924, "epoch": 3236} {"train_loss": -6.6274309158325195, "global_step": 135925, "epoch": 3236} {"train_loss": -6.625293731689453, "global_step": 135926, "epoch": 3236} {"train_loss": -6.678227424621582, "global_step": 135927, "epoch": 3236} {"train_loss": -6.646778583526611, "global_step": 135928, "epoch": 3236} {"train_loss": -6.534317970275879, "global_step": 135929, "epoch": 3236} {"train_loss": -6.696014404296875, "global_step": 135930, "epoch": 3236} {"train_loss": -6.607392311096191, "global_step": 135931, "epoch": 3236} {"train_loss": -6.535488128662109, "global_step": 135932, "epoch": 3236} {"train_loss": -6.653215408325195, "global_step": 135933, "epoch": 3236} {"train_loss": -6.6208600997924805, "global_step": 135934, "epoch": 3236} {"train_loss": -6.774710655212402, "global_step": 135935, "epoch": 3236} {"train_loss": -6.528195381164551, "global_step": 135936, "epoch": 3236} {"train_loss": -6.681093215942383, "global_step": 135937, "epoch": 3236} {"train_loss": -6.623188495635986, "global_step": 135938, "epoch": 3236} {"train_loss": -6.7052764892578125, "global_step": 135939, "epoch": 3236} {"train_loss": -6.685451030731201, "global_step": 135940, "epoch": 3236} {"train_loss": -6.703279495239258, "global_step": 135941, "epoch": 3236} {"train_loss": -6.674881935119629, "global_step": 135942, "epoch": 3236} {"train_loss": -6.72107458114624, "global_step": 135943, "epoch": 3236} {"train_loss": -6.622308731079102, "global_step": 135944, "epoch": 3236} {"train_loss": -6.569183349609375, "global_step": 135945, "epoch": 3236} {"train_loss": -6.774724006652832, "global_step": 135946, "epoch": 3236} {"train_loss": -6.600537300109863, "global_step": 135947, "epoch": 3236} {"train_loss": -6.6070685386657715, "global_step": 135948, "epoch": 3236} {"train_loss": -6.606955051422119, "global_step": 135949, "epoch": 3236} {"train_loss": -6.585620403289795, "global_step": 135950, "epoch": 3236} {"train_loss": -6.676608085632324, "global_step": 135951, "epoch": 3236} {"train_loss": -6.726759910583496, "global_step": 135952, "epoch": 3236} {"train_loss": -6.656874327432542, "global_step": 135953, "epoch": 3236, "val_loss": 68312.234375} {"train_loss": -6.71453332901001, "global_step": 135954, "epoch": 3237} {"train_loss": -6.7370405197143555, "global_step": 135955, "epoch": 3237} {"train_loss": -6.724452018737793, "global_step": 135956, "epoch": 3237} {"train_loss": -6.697813987731934, "global_step": 135957, "epoch": 3237} {"train_loss": -6.772675514221191, "global_step": 135958, "epoch": 3237} {"train_loss": -6.736449241638184, "global_step": 135959, "epoch": 3237} {"train_loss": -6.699494361877441, "global_step": 135960, "epoch": 3237} {"train_loss": -6.67405366897583, "global_step": 135961, "epoch": 3237} {"train_loss": -6.619874954223633, "global_step": 135962, "epoch": 3237} {"train_loss": -6.795736312866211, "global_step": 135963, "epoch": 3237} {"train_loss": -6.65839958190918, "global_step": 135964, "epoch": 3237} {"train_loss": -6.700699806213379, "global_step": 135965, "epoch": 3237} {"train_loss": -6.633285999298096, "global_step": 135966, "epoch": 3237} {"train_loss": -6.599961757659912, "global_step": 135967, "epoch": 3237} {"train_loss": -6.687527656555176, "global_step": 135968, "epoch": 3237} {"train_loss": -6.476378440856934, "global_step": 135969, "epoch": 3237} {"train_loss": -6.618782043457031, "global_step": 135970, "epoch": 3237} {"train_loss": -6.724907875061035, "global_step": 135971, "epoch": 3237} {"train_loss": -6.711904048919678, "global_step": 135972, "epoch": 3237} {"train_loss": -6.519723892211914, "global_step": 135973, "epoch": 3237} {"train_loss": -6.647455215454102, "global_step": 135974, "epoch": 3237} {"train_loss": -6.700979709625244, "global_step": 135975, "epoch": 3237} {"train_loss": -6.671841621398926, "global_step": 135976, "epoch": 3237} {"train_loss": -6.780949592590332, "global_step": 135977, "epoch": 3237} {"train_loss": -6.614547252655029, "global_step": 135978, "epoch": 3237} {"train_loss": -6.7213134765625, "global_step": 135979, "epoch": 3237} {"train_loss": -6.631091117858887, "global_step": 135980, "epoch": 3237} {"train_loss": -6.536492824554443, "global_step": 135981, "epoch": 3237} {"train_loss": -6.73390007019043, "global_step": 135982, "epoch": 3237} {"train_loss": -6.58061408996582, "global_step": 135983, "epoch": 3237} {"train_loss": -6.709068775177002, "global_step": 135984, "epoch": 3237} {"train_loss": -6.644675254821777, "global_step": 135985, "epoch": 3237} {"train_loss": -6.72367525100708, "global_step": 135986, "epoch": 3237} {"train_loss": -6.725624084472656, "global_step": 135987, "epoch": 3237} {"train_loss": -6.664641380310059, "global_step": 135988, "epoch": 3237} {"train_loss": -6.534911155700684, "global_step": 135989, "epoch": 3237} {"train_loss": -6.745509624481201, "global_step": 135990, "epoch": 3237} {"train_loss": -6.574112415313721, "global_step": 135991, "epoch": 3237} {"train_loss": -6.651407241821289, "global_step": 135992, "epoch": 3237} {"train_loss": -6.6501359939575195, "global_step": 135993, "epoch": 3237} {"train_loss": -6.678225517272949, "global_step": 135994, "epoch": 3237} {"train_loss": -6.668985525767009, "global_step": 135995, "epoch": 3237, "val_loss": 68183.7109375} {"train_loss": -6.627737045288086, "global_step": 135996, "epoch": 3238} {"train_loss": -6.615804672241211, "global_step": 135997, "epoch": 3238} {"train_loss": -6.548647403717041, "global_step": 135998, "epoch": 3238} {"train_loss": -6.743407249450684, "global_step": 135999, "epoch": 3238} {"train_loss": -6.646262168884277, "global_step": 136000, "epoch": 3238} {"train_loss": -6.6695637702941895, "global_step": 136001, "epoch": 3238} {"train_loss": -6.632089614868164, "global_step": 136002, "epoch": 3238} {"train_loss": -6.600677013397217, "global_step": 136003, "epoch": 3238} {"train_loss": -6.726035118103027, "global_step": 136004, "epoch": 3238} {"train_loss": -6.740771770477295, "global_step": 136005, "epoch": 3238} {"train_loss": -6.738704681396484, "global_step": 136006, "epoch": 3238} {"train_loss": -6.640538215637207, "global_step": 136007, "epoch": 3238} {"train_loss": -6.561314582824707, "global_step": 136008, "epoch": 3238} {"train_loss": -6.673781394958496, "global_step": 136009, "epoch": 3238} {"train_loss": -6.667018890380859, "global_step": 136010, "epoch": 3238} {"train_loss": -6.625877380371094, "global_step": 136011, "epoch": 3238} {"train_loss": -6.756870746612549, "global_step": 136012, "epoch": 3238} {"train_loss": -6.633681297302246, "global_step": 136013, "epoch": 3238} {"train_loss": -6.750856876373291, "global_step": 136014, "epoch": 3238} {"train_loss": -6.692966461181641, "global_step": 136015, "epoch": 3238} {"train_loss": -6.667255401611328, "global_step": 136016, "epoch": 3238} {"train_loss": -6.625039577484131, "global_step": 136017, "epoch": 3238} {"train_loss": -6.728115558624268, "global_step": 136018, "epoch": 3238} {"train_loss": -6.68221378326416, "global_step": 136019, "epoch": 3238} {"train_loss": -6.69170618057251, "global_step": 136020, "epoch": 3238} {"train_loss": -6.620766639709473, "global_step": 136021, "epoch": 3238} {"train_loss": -6.703417778015137, "global_step": 136022, "epoch": 3238} {"train_loss": -6.572029113769531, "global_step": 136023, "epoch": 3238} {"train_loss": -6.569498538970947, "global_step": 136024, "epoch": 3238} {"train_loss": -6.706396579742432, "global_step": 136025, "epoch": 3238} {"train_loss": -6.668606281280518, "global_step": 136026, "epoch": 3238} {"train_loss": -6.6498637199401855, "global_step": 136027, "epoch": 3238} {"train_loss": -6.640044212341309, "global_step": 136028, "epoch": 3238} {"train_loss": -6.708785533905029, "global_step": 136029, "epoch": 3238} {"train_loss": -6.559630393981934, "global_step": 136030, "epoch": 3238} {"train_loss": -6.545254230499268, "global_step": 136031, "epoch": 3238} {"train_loss": -6.615578651428223, "global_step": 136032, "epoch": 3238} {"train_loss": -6.659972667694092, "global_step": 136033, "epoch": 3238} {"train_loss": -6.579401016235352, "global_step": 136034, "epoch": 3238} {"train_loss": -6.647886276245117, "global_step": 136035, "epoch": 3238} {"train_loss": -6.748831272125244, "global_step": 136036, "epoch": 3238} {"train_loss": -6.655558279582432, "global_step": 136037, "epoch": 3238, "val_loss": 68222.5859375} {"train_loss": -6.722930908203125, "global_step": 136038, "epoch": 3239} {"train_loss": -6.57757568359375, "global_step": 136039, "epoch": 3239} {"train_loss": -6.622788429260254, "global_step": 136040, "epoch": 3239} {"train_loss": -6.58425235748291, "global_step": 136041, "epoch": 3239} {"train_loss": -6.677695274353027, "global_step": 136042, "epoch": 3239} {"train_loss": -6.61475944519043, "global_step": 136043, "epoch": 3239} {"train_loss": -6.656895637512207, "global_step": 136044, "epoch": 3239} {"train_loss": -6.6355485916137695, "global_step": 136045, "epoch": 3239} {"train_loss": -6.712146282196045, "global_step": 136046, "epoch": 3239} {"train_loss": -6.7232160568237305, "global_step": 136047, "epoch": 3239} {"train_loss": -6.699965953826904, "global_step": 136048, "epoch": 3239} {"train_loss": -6.708754539489746, "global_step": 136049, "epoch": 3239} {"train_loss": -6.688928127288818, "global_step": 136050, "epoch": 3239} {"train_loss": -6.656044960021973, "global_step": 136051, "epoch": 3239} {"train_loss": -6.683213233947754, "global_step": 136052, "epoch": 3239} {"train_loss": -6.742245674133301, "global_step": 136053, "epoch": 3239} {"train_loss": -6.668309211730957, "global_step": 136054, "epoch": 3239} {"train_loss": -6.708403587341309, "global_step": 136055, "epoch": 3239} {"train_loss": -6.730742931365967, "global_step": 136056, "epoch": 3239} {"train_loss": -6.618043899536133, "global_step": 136057, "epoch": 3239} {"train_loss": -6.700305938720703, "global_step": 136058, "epoch": 3239} {"train_loss": -6.680750370025635, "global_step": 136059, "epoch": 3239} {"train_loss": -6.622480392456055, "global_step": 136060, "epoch": 3239} {"train_loss": -6.612972736358643, "global_step": 136061, "epoch": 3239} {"train_loss": -6.556368350982666, "global_step": 136062, "epoch": 3239} {"train_loss": -6.641149044036865, "global_step": 136063, "epoch": 3239} {"train_loss": -6.698792934417725, "global_step": 136064, "epoch": 3239} {"train_loss": -6.762383460998535, "global_step": 136065, "epoch": 3239} {"train_loss": -6.581144332885742, "global_step": 136066, "epoch": 3239} {"train_loss": -6.537668228149414, "global_step": 136067, "epoch": 3239} {"train_loss": -6.582743167877197, "global_step": 136068, "epoch": 3239} {"train_loss": -6.483193874359131, "global_step": 136069, "epoch": 3239} {"train_loss": -6.724612236022949, "global_step": 136070, "epoch": 3239} {"train_loss": -6.684510707855225, "global_step": 136071, "epoch": 3239} {"train_loss": -6.480722427368164, "global_step": 136072, "epoch": 3239} {"train_loss": -6.648480415344238, "global_step": 136073, "epoch": 3239} {"train_loss": -6.623750686645508, "global_step": 136074, "epoch": 3239} {"train_loss": -6.522771835327148, "global_step": 136075, "epoch": 3239} {"train_loss": -6.619237899780273, "global_step": 136076, "epoch": 3239} {"train_loss": -6.698631286621094, "global_step": 136077, "epoch": 3239} {"train_loss": -6.60526180267334, "global_step": 136078, "epoch": 3239} {"train_loss": -6.646559488205683, "global_step": 136079, "epoch": 3239, "val_loss": 68386.890625} {"train_loss": -6.673456192016602, "global_step": 136080, "epoch": 3240} {"train_loss": -6.634708404541016, "global_step": 136081, "epoch": 3240} {"train_loss": -6.632152557373047, "global_step": 136082, "epoch": 3240} {"train_loss": -6.644687652587891, "global_step": 136083, "epoch": 3240} {"train_loss": -6.6489763259887695, "global_step": 136084, "epoch": 3240} {"train_loss": -6.6418352127075195, "global_step": 136085, "epoch": 3240} {"train_loss": -6.584390640258789, "global_step": 136086, "epoch": 3240} {"train_loss": -6.637596130371094, "global_step": 136087, "epoch": 3240} {"train_loss": -6.606184959411621, "global_step": 136088, "epoch": 3240} {"train_loss": -6.634405136108398, "global_step": 136089, "epoch": 3240} {"train_loss": -6.599100112915039, "global_step": 136090, "epoch": 3240} {"train_loss": -6.6418304443359375, "global_step": 136091, "epoch": 3240} {"train_loss": -6.679583549499512, "global_step": 136092, "epoch": 3240} {"train_loss": -6.4496588706970215, "global_step": 136093, "epoch": 3240} {"train_loss": -6.681879997253418, "global_step": 136094, "epoch": 3240} {"train_loss": -6.794515132904053, "global_step": 136095, "epoch": 3240} {"train_loss": -6.6836466789245605, "global_step": 136096, "epoch": 3240} {"train_loss": -6.703298568725586, "global_step": 136097, "epoch": 3240} {"train_loss": -6.738399505615234, "global_step": 136098, "epoch": 3240} {"train_loss": -6.606126308441162, "global_step": 136099, "epoch": 3240} {"train_loss": -6.728195667266846, "global_step": 136100, "epoch": 3240} {"train_loss": -6.637851715087891, "global_step": 136101, "epoch": 3240} {"train_loss": -6.711697578430176, "global_step": 136102, "epoch": 3240} {"train_loss": -6.690134525299072, "global_step": 136103, "epoch": 3240} {"train_loss": -6.696185111999512, "global_step": 136104, "epoch": 3240} {"train_loss": -6.708564281463623, "global_step": 136105, "epoch": 3240} {"train_loss": -6.592695236206055, "global_step": 136106, "epoch": 3240} {"train_loss": -6.648569107055664, "global_step": 136107, "epoch": 3240} {"train_loss": -6.722156524658203, "global_step": 136108, "epoch": 3240} {"train_loss": -6.659282684326172, "global_step": 136109, "epoch": 3240} {"train_loss": -6.689362049102783, "global_step": 136110, "epoch": 3240} {"train_loss": -6.567786693572998, "global_step": 136111, "epoch": 3240} {"train_loss": -6.698999404907227, "global_step": 136112, "epoch": 3240} {"train_loss": -6.646300315856934, "global_step": 136113, "epoch": 3240} {"train_loss": -6.602359294891357, "global_step": 136114, "epoch": 3240} {"train_loss": -6.627761363983154, "global_step": 136115, "epoch": 3240} {"train_loss": -6.601912021636963, "global_step": 136116, "epoch": 3240} {"train_loss": -6.644479274749756, "global_step": 136117, "epoch": 3240} {"train_loss": -6.5820770263671875, "global_step": 136118, "epoch": 3240} {"train_loss": -6.711756706237793, "global_step": 136119, "epoch": 3240} {"train_loss": -6.6075005531311035, "global_step": 136120, "epoch": 3240} {"train_loss": -6.651455549966721, "global_step": 136121, "epoch": 3240, "val_loss": 68328.0546875} {"train_loss": -6.740926265716553, "global_step": 136122, "epoch": 3241} {"train_loss": -6.636031627655029, "global_step": 136123, "epoch": 3241} {"train_loss": -6.648240089416504, "global_step": 136124, "epoch": 3241} {"train_loss": -6.69194221496582, "global_step": 136125, "epoch": 3241} {"train_loss": -6.609699726104736, "global_step": 136126, "epoch": 3241} {"train_loss": -6.698022842407227, "global_step": 136127, "epoch": 3241} {"train_loss": -6.716391563415527, "global_step": 136128, "epoch": 3241} {"train_loss": -6.680761337280273, "global_step": 136129, "epoch": 3241} {"train_loss": -6.7106122970581055, "global_step": 136130, "epoch": 3241} {"train_loss": -6.654912948608398, "global_step": 136131, "epoch": 3241} {"train_loss": -6.741888999938965, "global_step": 136132, "epoch": 3241} {"train_loss": -6.808786392211914, "global_step": 136133, "epoch": 3241} {"train_loss": -6.688027381896973, "global_step": 136134, "epoch": 3241} {"train_loss": -6.870286464691162, "global_step": 136135, "epoch": 3241} {"train_loss": -6.729406833648682, "global_step": 136136, "epoch": 3241} {"train_loss": -6.677056312561035, "global_step": 136137, "epoch": 3241} {"train_loss": -6.754868984222412, "global_step": 136138, "epoch": 3241} {"train_loss": -6.776611328125, "global_step": 136139, "epoch": 3241} {"train_loss": -6.730782985687256, "global_step": 136140, "epoch": 3241} {"train_loss": -6.69605827331543, "global_step": 136141, "epoch": 3241} {"train_loss": -6.664124488830566, "global_step": 136142, "epoch": 3241} {"train_loss": -6.673296928405762, "global_step": 136143, "epoch": 3241} {"train_loss": -6.72943115234375, "global_step": 136144, "epoch": 3241} {"train_loss": -6.737949371337891, "global_step": 136145, "epoch": 3241} {"train_loss": -6.737044811248779, "global_step": 136146, "epoch": 3241} {"train_loss": -6.7734575271606445, "global_step": 136147, "epoch": 3241} {"train_loss": -6.704807758331299, "global_step": 136148, "epoch": 3241} {"train_loss": -6.678016662597656, "global_step": 136149, "epoch": 3241} {"train_loss": -6.704261302947998, "global_step": 136150, "epoch": 3241} {"train_loss": -6.746917724609375, "global_step": 136151, "epoch": 3241} {"train_loss": -6.80872917175293, "global_step": 136152, "epoch": 3241} {"train_loss": -6.668756008148193, "global_step": 136153, "epoch": 3241} {"train_loss": -6.625635147094727, "global_step": 136154, "epoch": 3241} {"train_loss": -6.806844711303711, "global_step": 136155, "epoch": 3241} {"train_loss": -6.71074104309082, "global_step": 136156, "epoch": 3241} {"train_loss": -6.576600074768066, "global_step": 136157, "epoch": 3241} {"train_loss": -6.662516117095947, "global_step": 136158, "epoch": 3241} {"train_loss": -6.794002532958984, "global_step": 136159, "epoch": 3241} {"train_loss": -6.779065132141113, "global_step": 136160, "epoch": 3241} {"train_loss": -6.669427871704102, "global_step": 136161, "epoch": 3241} {"train_loss": -6.6276116371154785, "global_step": 136162, "epoch": 3241} {"train_loss": -6.710966189702352, "global_step": 136163, "epoch": 3241, "val_loss": 68383.9921875} {"train_loss": -6.659852981567383, "global_step": 136164, "epoch": 3242} {"train_loss": -6.61728048324585, "global_step": 136165, "epoch": 3242} {"train_loss": -6.714622497558594, "global_step": 136166, "epoch": 3242} {"train_loss": -6.670546531677246, "global_step": 136167, "epoch": 3242} {"train_loss": -6.654157638549805, "global_step": 136168, "epoch": 3242} {"train_loss": -6.649024963378906, "global_step": 136169, "epoch": 3242} {"train_loss": -6.8212571144104, "global_step": 136170, "epoch": 3242} {"train_loss": -6.658184051513672, "global_step": 136171, "epoch": 3242} {"train_loss": -6.687376022338867, "global_step": 136172, "epoch": 3242} {"train_loss": -6.715611457824707, "global_step": 136173, "epoch": 3242} {"train_loss": -6.686969757080078, "global_step": 136174, "epoch": 3242} {"train_loss": -6.710805892944336, "global_step": 136175, "epoch": 3242} {"train_loss": -6.702590465545654, "global_step": 136176, "epoch": 3242} {"train_loss": -6.712353229522705, "global_step": 136177, "epoch": 3242} {"train_loss": -6.679975509643555, "global_step": 136178, "epoch": 3242} {"train_loss": -6.711356163024902, "global_step": 136179, "epoch": 3242} {"train_loss": -6.687573432922363, "global_step": 136180, "epoch": 3242} {"train_loss": -6.684128284454346, "global_step": 136181, "epoch": 3242} {"train_loss": -6.603200435638428, "global_step": 136182, "epoch": 3242} {"train_loss": -6.771914482116699, "global_step": 136183, "epoch": 3242} {"train_loss": -6.591121196746826, "global_step": 136184, "epoch": 3242} {"train_loss": -6.652831077575684, "global_step": 136185, "epoch": 3242} {"train_loss": -6.6698431968688965, "global_step": 136186, "epoch": 3242} {"train_loss": -6.689235210418701, "global_step": 136187, "epoch": 3242} {"train_loss": -6.551609992980957, "global_step": 136188, "epoch": 3242} {"train_loss": -6.824490547180176, "global_step": 136189, "epoch": 3242} {"train_loss": -6.600834846496582, "global_step": 136190, "epoch": 3242} {"train_loss": -6.735245704650879, "global_step": 136191, "epoch": 3242} {"train_loss": -6.747758388519287, "global_step": 136192, "epoch": 3242} {"train_loss": -6.629472255706787, "global_step": 136193, "epoch": 3242} {"train_loss": -6.5813798904418945, "global_step": 136194, "epoch": 3242} {"train_loss": -6.642023086547852, "global_step": 136195, "epoch": 3242} {"train_loss": -6.739021301269531, "global_step": 136196, "epoch": 3242} {"train_loss": -6.673336982727051, "global_step": 136197, "epoch": 3242} {"train_loss": -6.613187313079834, "global_step": 136198, "epoch": 3242} {"train_loss": -6.7169389724731445, "global_step": 136199, "epoch": 3242} {"train_loss": -6.630551815032959, "global_step": 136200, "epoch": 3242} {"train_loss": -6.800835609436035, "global_step": 136201, "epoch": 3242} {"train_loss": -6.530295372009277, "global_step": 136202, "epoch": 3242} {"train_loss": -6.554868698120117, "global_step": 136203, "epoch": 3242} {"train_loss": -6.724572658538818, "global_step": 136204, "epoch": 3242} {"train_loss": -6.673271826335362, "global_step": 136205, "epoch": 3242, "val_loss": 68437.6484375} {"train_loss": -6.598864555358887, "global_step": 136206, "epoch": 3243} {"train_loss": -6.635226726531982, "global_step": 136207, "epoch": 3243} {"train_loss": -6.610141754150391, "global_step": 136208, "epoch": 3243} {"train_loss": -6.771124839782715, "global_step": 136209, "epoch": 3243} {"train_loss": -6.5353217124938965, "global_step": 136210, "epoch": 3243} {"train_loss": -6.6379923820495605, "global_step": 136211, "epoch": 3243} {"train_loss": -6.725241184234619, "global_step": 136212, "epoch": 3243} {"train_loss": -6.579872131347656, "global_step": 136213, "epoch": 3243} {"train_loss": -6.68248176574707, "global_step": 136214, "epoch": 3243} {"train_loss": -6.605181694030762, "global_step": 136215, "epoch": 3243} {"train_loss": -6.616612434387207, "global_step": 136216, "epoch": 3243} {"train_loss": -6.677644729614258, "global_step": 136217, "epoch": 3243} {"train_loss": -6.673613548278809, "global_step": 136218, "epoch": 3243} {"train_loss": -6.715906143188477, "global_step": 136219, "epoch": 3243} {"train_loss": -6.637855052947998, "global_step": 136220, "epoch": 3243} {"train_loss": -6.678704738616943, "global_step": 136221, "epoch": 3243} {"train_loss": -6.795151710510254, "global_step": 136222, "epoch": 3243} {"train_loss": -6.759635925292969, "global_step": 136223, "epoch": 3243} {"train_loss": -6.763950347900391, "global_step": 136224, "epoch": 3243} {"train_loss": -6.852643966674805, "global_step": 136225, "epoch": 3243} {"train_loss": -6.6214070320129395, "global_step": 136226, "epoch": 3243} {"train_loss": -6.582786560058594, "global_step": 136227, "epoch": 3243} {"train_loss": -6.665684700012207, "global_step": 136228, "epoch": 3243} {"train_loss": -6.47488260269165, "global_step": 136229, "epoch": 3243} {"train_loss": -6.791337013244629, "global_step": 136230, "epoch": 3243} {"train_loss": -6.851189613342285, "global_step": 136231, "epoch": 3243} {"train_loss": -6.622095108032227, "global_step": 136232, "epoch": 3243} {"train_loss": -6.78004264831543, "global_step": 136233, "epoch": 3243} {"train_loss": -6.643032073974609, "global_step": 136234, "epoch": 3243} {"train_loss": -6.710873603820801, "global_step": 136235, "epoch": 3243} {"train_loss": -6.726194381713867, "global_step": 136236, "epoch": 3243} {"train_loss": -6.719090461730957, "global_step": 136237, "epoch": 3243} {"train_loss": -6.747129440307617, "global_step": 136238, "epoch": 3243} {"train_loss": -6.709653377532959, "global_step": 136239, "epoch": 3243} {"train_loss": -6.610245704650879, "global_step": 136240, "epoch": 3243} {"train_loss": -6.7598114013671875, "global_step": 136241, "epoch": 3243} {"train_loss": -6.619647026062012, "global_step": 136242, "epoch": 3243} {"train_loss": -6.672968864440918, "global_step": 136243, "epoch": 3243} {"train_loss": -6.64011287689209, "global_step": 136244, "epoch": 3243} {"train_loss": -6.69083309173584, "global_step": 136245, "epoch": 3243} {"train_loss": -6.625095367431641, "global_step": 136246, "epoch": 3243} {"train_loss": -6.676080737795148, "global_step": 136247, "epoch": 3243, "val_loss": 68126.1171875} {"train_loss": -6.707341194152832, "global_step": 136248, "epoch": 3244} {"train_loss": -6.664089679718018, "global_step": 136249, "epoch": 3244} {"train_loss": -6.617757797241211, "global_step": 136250, "epoch": 3244} {"train_loss": -6.583423137664795, "global_step": 136251, "epoch": 3244} {"train_loss": -6.689723014831543, "global_step": 136252, "epoch": 3244} {"train_loss": -6.713687419891357, "global_step": 136253, "epoch": 3244} {"train_loss": -6.742520332336426, "global_step": 136254, "epoch": 3244} {"train_loss": -6.648691177368164, "global_step": 136255, "epoch": 3244} {"train_loss": -6.681982040405273, "global_step": 136256, "epoch": 3244} {"train_loss": -6.652777671813965, "global_step": 136257, "epoch": 3244} {"train_loss": -6.696889400482178, "global_step": 136258, "epoch": 3244} {"train_loss": -6.801448822021484, "global_step": 136259, "epoch": 3244} {"train_loss": -6.641543388366699, "global_step": 136260, "epoch": 3244} {"train_loss": -6.620499610900879, "global_step": 136261, "epoch": 3244} {"train_loss": -6.686455249786377, "global_step": 136262, "epoch": 3244} {"train_loss": -6.633835792541504, "global_step": 136263, "epoch": 3244} {"train_loss": -6.816857814788818, "global_step": 136264, "epoch": 3244} {"train_loss": -6.555079460144043, "global_step": 136265, "epoch": 3244} {"train_loss": -6.68586540222168, "global_step": 136266, "epoch": 3244} {"train_loss": -6.705733299255371, "global_step": 136267, "epoch": 3244} {"train_loss": -6.593100070953369, "global_step": 136268, "epoch": 3244} {"train_loss": -6.6245222091674805, "global_step": 136269, "epoch": 3244} {"train_loss": -6.539185523986816, "global_step": 136270, "epoch": 3244} {"train_loss": -6.672296524047852, "global_step": 136271, "epoch": 3244} {"train_loss": -6.595219612121582, "global_step": 136272, "epoch": 3244} {"train_loss": -6.7263641357421875, "global_step": 136273, "epoch": 3244} {"train_loss": -6.449832916259766, "global_step": 136274, "epoch": 3244} {"train_loss": -6.514186859130859, "global_step": 136275, "epoch": 3244} {"train_loss": -6.561367988586426, "global_step": 136276, "epoch": 3244} {"train_loss": -6.527002811431885, "global_step": 136277, "epoch": 3244} {"train_loss": -6.564720153808594, "global_step": 136278, "epoch": 3244} {"train_loss": -6.45640754699707, "global_step": 136279, "epoch": 3244} {"train_loss": -6.583621025085449, "global_step": 136280, "epoch": 3244} {"train_loss": -6.460111141204834, "global_step": 136281, "epoch": 3244} {"train_loss": -6.7356343269348145, "global_step": 136282, "epoch": 3244} {"train_loss": -6.515718460083008, "global_step": 136283, "epoch": 3244} {"train_loss": -6.574675559997559, "global_step": 136284, "epoch": 3244} {"train_loss": -6.608788967132568, "global_step": 136285, "epoch": 3244} {"train_loss": -6.660927772521973, "global_step": 136286, "epoch": 3244} {"train_loss": -6.640532493591309, "global_step": 136287, "epoch": 3244} {"train_loss": -6.566545486450195, "global_step": 136288, "epoch": 3244} {"train_loss": -6.626836776733398, "global_step": 136289, "epoch": 3244, "val_loss": 68240.765625} {"train_loss": -6.6310014724731445, "global_step": 136290, "epoch": 3245} {"train_loss": -6.6957316398620605, "global_step": 136291, "epoch": 3245} {"train_loss": -6.603266716003418, "global_step": 136292, "epoch": 3245} {"train_loss": -6.6185455322265625, "global_step": 136293, "epoch": 3245} {"train_loss": -6.530150890350342, "global_step": 136294, "epoch": 3245} {"train_loss": -6.623671531677246, "global_step": 136295, "epoch": 3245} {"train_loss": -6.5826921463012695, "global_step": 136296, "epoch": 3245} {"train_loss": -6.6053924560546875, "global_step": 136297, "epoch": 3245} {"train_loss": -6.609901428222656, "global_step": 136298, "epoch": 3245} {"train_loss": -6.44338846206665, "global_step": 136299, "epoch": 3245} {"train_loss": -6.626454830169678, "global_step": 136300, "epoch": 3245} {"train_loss": -6.491888046264648, "global_step": 136301, "epoch": 3245} {"train_loss": -6.532393932342529, "global_step": 136302, "epoch": 3245} {"train_loss": -6.608419418334961, "global_step": 136303, "epoch": 3245} {"train_loss": -6.569618225097656, "global_step": 136304, "epoch": 3245} {"train_loss": -6.543194770812988, "global_step": 136305, "epoch": 3245} {"train_loss": -6.578034400939941, "global_step": 136306, "epoch": 3245} {"train_loss": -6.680871963500977, "global_step": 136307, "epoch": 3245} {"train_loss": -6.628751754760742, "global_step": 136308, "epoch": 3245} {"train_loss": -6.560155868530273, "global_step": 136309, "epoch": 3245} {"train_loss": -6.529976844787598, "global_step": 136310, "epoch": 3245} {"train_loss": -6.771105766296387, "global_step": 136311, "epoch": 3245} {"train_loss": -6.697587013244629, "global_step": 136312, "epoch": 3245} {"train_loss": -6.6978654861450195, "global_step": 136313, "epoch": 3245} {"train_loss": -6.557802677154541, "global_step": 136314, "epoch": 3245} {"train_loss": -6.684226989746094, "global_step": 136315, "epoch": 3245} {"train_loss": -6.660282135009766, "global_step": 136316, "epoch": 3245} {"train_loss": -6.673025131225586, "global_step": 136317, "epoch": 3245} {"train_loss": -6.610698699951172, "global_step": 136318, "epoch": 3245} {"train_loss": -6.584315776824951, "global_step": 136319, "epoch": 3245} {"train_loss": -6.7273664474487305, "global_step": 136320, "epoch": 3245} {"train_loss": -6.617722034454346, "global_step": 136321, "epoch": 3245} {"train_loss": -6.608508110046387, "global_step": 136322, "epoch": 3245} {"train_loss": -6.6239213943481445, "global_step": 136323, "epoch": 3245} {"train_loss": -6.769497871398926, "global_step": 136324, "epoch": 3245} {"train_loss": -6.730789661407471, "global_step": 136325, "epoch": 3245} {"train_loss": -6.71251106262207, "global_step": 136326, "epoch": 3245} {"train_loss": -6.7048845291137695, "global_step": 136327, "epoch": 3245} {"train_loss": -6.759132385253906, "global_step": 136328, "epoch": 3245} {"train_loss": -6.663235187530518, "global_step": 136329, "epoch": 3245} {"train_loss": -6.6542253494262695, "global_step": 136330, "epoch": 3245} {"train_loss": -6.632061867486863, "global_step": 136331, "epoch": 3245, "val_loss": 68306.75} {"train_loss": -6.692759037017822, "global_step": 136332, "epoch": 3246} {"train_loss": -6.632282257080078, "global_step": 136333, "epoch": 3246} {"train_loss": -6.698455333709717, "global_step": 136334, "epoch": 3246} {"train_loss": -6.775017738342285, "global_step": 136335, "epoch": 3246} {"train_loss": -6.643853187561035, "global_step": 136336, "epoch": 3246} {"train_loss": -6.737018585205078, "global_step": 136337, "epoch": 3246} {"train_loss": -6.711635589599609, "global_step": 136338, "epoch": 3246} {"train_loss": -6.62685489654541, "global_step": 136339, "epoch": 3246} {"train_loss": -6.746578216552734, "global_step": 136340, "epoch": 3246} {"train_loss": -6.777891159057617, "global_step": 136341, "epoch": 3246} {"train_loss": -6.668148994445801, "global_step": 136342, "epoch": 3246} {"train_loss": -6.735161304473877, "global_step": 136343, "epoch": 3246} {"train_loss": -6.807476997375488, "global_step": 136344, "epoch": 3246} {"train_loss": -6.783725738525391, "global_step": 136345, "epoch": 3246} {"train_loss": -6.835418224334717, "global_step": 136346, "epoch": 3246} {"train_loss": -6.797469139099121, "global_step": 136347, "epoch": 3246} {"train_loss": -6.669797897338867, "global_step": 136348, "epoch": 3246} {"train_loss": -6.6767401695251465, "global_step": 136349, "epoch": 3246} {"train_loss": -6.695829391479492, "global_step": 136350, "epoch": 3246} {"train_loss": -6.674638748168945, "global_step": 136351, "epoch": 3246} {"train_loss": -6.60986852645874, "global_step": 136352, "epoch": 3246} {"train_loss": -6.631464004516602, "global_step": 136353, "epoch": 3246} {"train_loss": -6.745676040649414, "global_step": 136354, "epoch": 3246} {"train_loss": -6.611310958862305, "global_step": 136355, "epoch": 3246} {"train_loss": -6.643258094787598, "global_step": 136356, "epoch": 3246} {"train_loss": -6.667145729064941, "global_step": 136357, "epoch": 3246} {"train_loss": -6.663139343261719, "global_step": 136358, "epoch": 3246} {"train_loss": -6.6346211433410645, "global_step": 136359, "epoch": 3246} {"train_loss": -6.701556205749512, "global_step": 136360, "epoch": 3246} {"train_loss": -6.7034220695495605, "global_step": 136361, "epoch": 3246} {"train_loss": -6.705106258392334, "global_step": 136362, "epoch": 3246} {"train_loss": -6.725142478942871, "global_step": 136363, "epoch": 3246} {"train_loss": -6.666311264038086, "global_step": 136364, "epoch": 3246} {"train_loss": -6.646483421325684, "global_step": 136365, "epoch": 3246} {"train_loss": -6.702259540557861, "global_step": 136366, "epoch": 3246} {"train_loss": -6.809013366699219, "global_step": 136367, "epoch": 3246} {"train_loss": -6.677725315093994, "global_step": 136368, "epoch": 3246} {"train_loss": -6.637040138244629, "global_step": 136369, "epoch": 3246} {"train_loss": -6.623867988586426, "global_step": 136370, "epoch": 3246} {"train_loss": -6.78193473815918, "global_step": 136371, "epoch": 3246} {"train_loss": -6.561007976531982, "global_step": 136372, "epoch": 3246} {"train_loss": -6.693558136622111, "global_step": 136373, "epoch": 3246, "val_loss": 68349.6640625} {"train_loss": -6.685395240783691, "global_step": 136374, "epoch": 3247} {"train_loss": -6.7423601150512695, "global_step": 136375, "epoch": 3247} {"train_loss": -6.580562591552734, "global_step": 136376, "epoch": 3247} {"train_loss": -6.6011433601379395, "global_step": 136377, "epoch": 3247} {"train_loss": -6.650171279907227, "global_step": 136378, "epoch": 3247} {"train_loss": -6.574075222015381, "global_step": 136379, "epoch": 3247} {"train_loss": -6.5440897941589355, "global_step": 136380, "epoch": 3247} {"train_loss": -6.663723945617676, "global_step": 136381, "epoch": 3247} {"train_loss": -6.478051662445068, "global_step": 136382, "epoch": 3247} {"train_loss": -6.656553268432617, "global_step": 136383, "epoch": 3247} {"train_loss": -6.521419048309326, "global_step": 136384, "epoch": 3247} {"train_loss": -6.57135009765625, "global_step": 136385, "epoch": 3247} {"train_loss": -6.5941314697265625, "global_step": 136386, "epoch": 3247} {"train_loss": -6.580519676208496, "global_step": 136387, "epoch": 3247} {"train_loss": -6.783101558685303, "global_step": 136388, "epoch": 3247} {"train_loss": -6.571308135986328, "global_step": 136389, "epoch": 3247} {"train_loss": -6.673699378967285, "global_step": 136390, "epoch": 3247} {"train_loss": -6.470526695251465, "global_step": 136391, "epoch": 3247} {"train_loss": -6.63765811920166, "global_step": 136392, "epoch": 3247} {"train_loss": -6.666800498962402, "global_step": 136393, "epoch": 3247} {"train_loss": -6.618894577026367, "global_step": 136394, "epoch": 3247} {"train_loss": -6.542973518371582, "global_step": 136395, "epoch": 3247} {"train_loss": -6.527187347412109, "global_step": 136396, "epoch": 3247} {"train_loss": -6.627965450286865, "global_step": 136397, "epoch": 3247} {"train_loss": -6.434788227081299, "global_step": 136398, "epoch": 3247} {"train_loss": -6.579030990600586, "global_step": 136399, "epoch": 3247} {"train_loss": -6.613094806671143, "global_step": 136400, "epoch": 3247} {"train_loss": -6.651184558868408, "global_step": 136401, "epoch": 3247} {"train_loss": -6.524049282073975, "global_step": 136402, "epoch": 3247} {"train_loss": -6.741335868835449, "global_step": 136403, "epoch": 3247} {"train_loss": -6.525600910186768, "global_step": 136404, "epoch": 3247} {"train_loss": -6.549808025360107, "global_step": 136405, "epoch": 3247} {"train_loss": -6.601986885070801, "global_step": 136406, "epoch": 3247} {"train_loss": -6.69130802154541, "global_step": 136407, "epoch": 3247} {"train_loss": -6.572941303253174, "global_step": 136408, "epoch": 3247} {"train_loss": -6.663370132446289, "global_step": 136409, "epoch": 3247} {"train_loss": -6.681838035583496, "global_step": 136410, "epoch": 3247} {"train_loss": -6.627633571624756, "global_step": 136411, "epoch": 3247} {"train_loss": -6.720998764038086, "global_step": 136412, "epoch": 3247} {"train_loss": -6.6200666427612305, "global_step": 136413, "epoch": 3247} {"train_loss": -6.659174919128418, "global_step": 136414, "epoch": 3247} {"train_loss": -6.616005227679298, "global_step": 136415, "epoch": 3247, "val_loss": 68329.125} {"train_loss": -6.661999225616455, "global_step": 136416, "epoch": 3248} {"train_loss": -6.723723411560059, "global_step": 136417, "epoch": 3248} {"train_loss": -6.652583599090576, "global_step": 136418, "epoch": 3248} {"train_loss": -6.680141925811768, "global_step": 136419, "epoch": 3248} {"train_loss": -6.698789119720459, "global_step": 136420, "epoch": 3248} {"train_loss": -6.671972751617432, "global_step": 136421, "epoch": 3248} {"train_loss": -6.655406951904297, "global_step": 136422, "epoch": 3248} {"train_loss": -6.650389194488525, "global_step": 136423, "epoch": 3248} {"train_loss": -6.63984489440918, "global_step": 136424, "epoch": 3248} {"train_loss": -6.692758560180664, "global_step": 136425, "epoch": 3248} {"train_loss": -6.7722344398498535, "global_step": 136426, "epoch": 3248} {"train_loss": -6.638152122497559, "global_step": 136427, "epoch": 3248} {"train_loss": -6.732457160949707, "global_step": 136428, "epoch": 3248} {"train_loss": -6.7112627029418945, "global_step": 136429, "epoch": 3248} {"train_loss": -6.8268585205078125, "global_step": 136430, "epoch": 3248} {"train_loss": -6.738129615783691, "global_step": 136431, "epoch": 3248} {"train_loss": -6.675815582275391, "global_step": 136432, "epoch": 3248} {"train_loss": -6.685746192932129, "global_step": 136433, "epoch": 3248} {"train_loss": -6.856047630310059, "global_step": 136434, "epoch": 3248} {"train_loss": -6.732485771179199, "global_step": 136435, "epoch": 3248} {"train_loss": -6.670350074768066, "global_step": 136436, "epoch": 3248} {"train_loss": -6.673703193664551, "global_step": 136437, "epoch": 3248} {"train_loss": -6.692380905151367, "global_step": 136438, "epoch": 3248} {"train_loss": -6.6992340087890625, "global_step": 136439, "epoch": 3248} {"train_loss": -6.697168350219727, "global_step": 136440, "epoch": 3248} {"train_loss": -6.618551254272461, "global_step": 136441, "epoch": 3248} {"train_loss": -6.7349395751953125, "global_step": 136442, "epoch": 3248} {"train_loss": -6.780794143676758, "global_step": 136443, "epoch": 3248} {"train_loss": -6.690187454223633, "global_step": 136444, "epoch": 3248} {"train_loss": -6.654280662536621, "global_step": 136445, "epoch": 3248} {"train_loss": -6.7235212326049805, "global_step": 136446, "epoch": 3248} {"train_loss": -6.680471897125244, "global_step": 136447, "epoch": 3248} {"train_loss": -6.751991271972656, "global_step": 136448, "epoch": 3248} {"train_loss": -6.552218437194824, "global_step": 136449, "epoch": 3248} {"train_loss": -6.710395812988281, "global_step": 136450, "epoch": 3248} {"train_loss": -6.74345064163208, "global_step": 136451, "epoch": 3248} {"train_loss": -6.652979850769043, "global_step": 136452, "epoch": 3248} {"train_loss": -6.685281753540039, "global_step": 136453, "epoch": 3248} {"train_loss": -6.677305221557617, "global_step": 136454, "epoch": 3248} {"train_loss": -6.696280002593994, "global_step": 136455, "epoch": 3248} {"train_loss": -6.7132158279418945, "global_step": 136456, "epoch": 3248} {"train_loss": -6.6988493374415805, "global_step": 136457, "epoch": 3248, "val_loss": 68169.7578125} {"train_loss": -6.799066543579102, "global_step": 136458, "epoch": 3249} {"train_loss": -6.6855010986328125, "global_step": 136459, "epoch": 3249} {"train_loss": -6.730480670928955, "global_step": 136460, "epoch": 3249} {"train_loss": -6.599520683288574, "global_step": 136461, "epoch": 3249} {"train_loss": -6.766063213348389, "global_step": 136462, "epoch": 3249} {"train_loss": -6.663065433502197, "global_step": 136463, "epoch": 3249} {"train_loss": -6.693596363067627, "global_step": 136464, "epoch": 3249} {"train_loss": -6.62653923034668, "global_step": 136465, "epoch": 3249} {"train_loss": -6.654346466064453, "global_step": 136466, "epoch": 3249} {"train_loss": -6.81353235244751, "global_step": 136467, "epoch": 3249} {"train_loss": -6.739801406860352, "global_step": 136468, "epoch": 3249} {"train_loss": -6.702912330627441, "global_step": 136469, "epoch": 3249} {"train_loss": -6.65401029586792, "global_step": 136470, "epoch": 3249} {"train_loss": -6.668811321258545, "global_step": 136471, "epoch": 3249} {"train_loss": -6.78267765045166, "global_step": 136472, "epoch": 3249} {"train_loss": -6.743956565856934, "global_step": 136473, "epoch": 3249} {"train_loss": -6.612631797790527, "global_step": 136474, "epoch": 3249} {"train_loss": -6.78636360168457, "global_step": 136475, "epoch": 3249} {"train_loss": -6.6714935302734375, "global_step": 136476, "epoch": 3249} {"train_loss": -6.65916633605957, "global_step": 136477, "epoch": 3249} {"train_loss": -6.5994415283203125, "global_step": 136478, "epoch": 3249} {"train_loss": -6.607737064361572, "global_step": 136479, "epoch": 3249} {"train_loss": -6.731118679046631, "global_step": 136480, "epoch": 3249} {"train_loss": -6.73945426940918, "global_step": 136481, "epoch": 3249} {"train_loss": -6.639766693115234, "global_step": 136482, "epoch": 3249} {"train_loss": -6.629152297973633, "global_step": 136483, "epoch": 3249} {"train_loss": -6.763664245605469, "global_step": 136484, "epoch": 3249} {"train_loss": -6.70859432220459, "global_step": 136485, "epoch": 3249} {"train_loss": -6.5532121658325195, "global_step": 136486, "epoch": 3249} {"train_loss": -6.751478672027588, "global_step": 136487, "epoch": 3249} {"train_loss": -6.682207107543945, "global_step": 136488, "epoch": 3249} {"train_loss": -6.740856170654297, "global_step": 136489, "epoch": 3249} {"train_loss": -6.636885643005371, "global_step": 136490, "epoch": 3249} {"train_loss": -6.717504978179932, "global_step": 136491, "epoch": 3249} {"train_loss": -6.666886806488037, "global_step": 136492, "epoch": 3249} {"train_loss": -6.652761459350586, "global_step": 136493, "epoch": 3249} {"train_loss": -6.764249801635742, "global_step": 136494, "epoch": 3249} {"train_loss": -6.689476490020752, "global_step": 136495, "epoch": 3249} {"train_loss": -6.653321266174316, "global_step": 136496, "epoch": 3249} {"train_loss": -6.668337821960449, "global_step": 136497, "epoch": 3249} {"train_loss": -6.6483025550842285, "global_step": 136498, "epoch": 3249} {"train_loss": -6.688796542939686, "global_step": 136499, "epoch": 3249, "val_loss": 68200.921875} {"train_loss": -6.651344299316406, "global_step": 136500, "epoch": 3250} {"train_loss": -6.718867778778076, "global_step": 136501, "epoch": 3250} {"train_loss": -6.622269153594971, "global_step": 136502, "epoch": 3250} {"train_loss": -6.605912208557129, "global_step": 136503, "epoch": 3250} {"train_loss": -6.679450988769531, "global_step": 136504, "epoch": 3250} {"train_loss": -6.6342058181762695, "global_step": 136505, "epoch": 3250} {"train_loss": -6.619235515594482, "global_step": 136506, "epoch": 3250} {"train_loss": -6.6114115715026855, "global_step": 136507, "epoch": 3250} {"train_loss": -6.545294284820557, "global_step": 136508, "epoch": 3250} {"train_loss": -6.702425956726074, "global_step": 136509, "epoch": 3250} {"train_loss": -6.678404331207275, "global_step": 136510, "epoch": 3250} {"train_loss": -6.578995704650879, "global_step": 136511, "epoch": 3250} {"train_loss": -6.7171525955200195, "global_step": 136512, "epoch": 3250} {"train_loss": -6.749286651611328, "global_step": 136513, "epoch": 3250} {"train_loss": -6.605978965759277, "global_step": 136514, "epoch": 3250} {"train_loss": -6.686079502105713, "global_step": 136515, "epoch": 3250} {"train_loss": -6.665668487548828, "global_step": 136516, "epoch": 3250} {"train_loss": -6.77598762512207, "global_step": 136517, "epoch": 3250} {"train_loss": -6.672540664672852, "global_step": 136518, "epoch": 3250} {"train_loss": -6.797419548034668, "global_step": 136519, "epoch": 3250} {"train_loss": -6.760258197784424, "global_step": 136520, "epoch": 3250} {"train_loss": -6.683338165283203, "global_step": 136521, "epoch": 3250} {"train_loss": -6.743537902832031, "global_step": 136522, "epoch": 3250} {"train_loss": -6.679686546325684, "global_step": 136523, "epoch": 3250} {"train_loss": -6.746444225311279, "global_step": 136524, "epoch": 3250} {"train_loss": -6.647263526916504, "global_step": 136525, "epoch": 3250} {"train_loss": -6.706502914428711, "global_step": 136526, "epoch": 3250} {"train_loss": -6.698428630828857, "global_step": 136527, "epoch": 3250} {"train_loss": -6.648741245269775, "global_step": 136528, "epoch": 3250} {"train_loss": -6.735721588134766, "global_step": 136529, "epoch": 3250} {"train_loss": -6.730039596557617, "global_step": 136530, "epoch": 3250} {"train_loss": -6.731986045837402, "global_step": 136531, "epoch": 3250} {"train_loss": -6.742956638336182, "global_step": 136532, "epoch": 3250} {"train_loss": -6.642427444458008, "global_step": 136533, "epoch": 3250} {"train_loss": -6.6648101806640625, "global_step": 136534, "epoch": 3250} {"train_loss": -6.735620975494385, "global_step": 136535, "epoch": 3250} {"train_loss": -6.691710472106934, "global_step": 136536, "epoch": 3250} {"train_loss": -6.762063980102539, "global_step": 136537, "epoch": 3250} {"train_loss": -6.69325590133667, "global_step": 136538, "epoch": 3250} {"train_loss": -6.704413414001465, "global_step": 136539, "epoch": 3250} {"train_loss": -6.626246452331543, "global_step": 136540, "epoch": 3250} {"train_loss": -6.686068023954119, "global_step": 136541, "epoch": 3250, "train/sim_max_reward_0": 0.20508641829773827, "train/sim_max_reward_1": 0.33997221553012424, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.13180328336407116, "train/sim_max_reward_4": 0.9556080638547026, "train/sim_max_reward_5": 0.9733341227817571, "test/sim_max_reward_4400000": 0.2847494594582787, "test/sim_max_reward_4400001": 0.3528363837702585, "test/sim_max_reward_4400002": 0.33159426319455376, "test/sim_max_reward_4400003": 0.6060836256326322, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.7181894792007005, "test/sim_max_reward_4400006": 0.976671821976959, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.2972401013426885, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.8524732146831709, "test/sim_max_reward_4400011": 0.07343031947342361, "test/sim_max_reward_4400012": 0.9889791625039447, "test/sim_max_reward_4400013": 0.973147332514967, "test/sim_max_reward_4400014": 0.918890583532324, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.9020906790169132, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2305625708176389, "test/sim_max_reward_4400019": 0.6700590974625477, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9554244380823702, "test/sim_max_reward_4400023": 0.6115379872701573, "test/sim_max_reward_4400024": 0.7980037397308248, "test/sim_max_reward_4400025": 0.253599877516172, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0651500835659677, "test/sim_max_reward_4400028": 0.3969195667341994, "test/sim_max_reward_4400029": 0.5294672583130051, "test/sim_max_reward_4400030": 0.958712428402669, "test/sim_max_reward_4400031": 0.9720201965455276, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.6497834297824621, "test/sim_max_reward_4400034": 0.8649773151034027, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.4455569365664512, "test/sim_max_reward_4400037": 0.22856090016175656, "test/sim_max_reward_4400038": 0.948341134791778, "test/sim_max_reward_4400039": 0.9850666805674594, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9358113140123324, "test/sim_max_reward_4400042": 0.6235221585829979, "test/sim_max_reward_4400043": 0.9845206919564908, "test/sim_max_reward_4400044": 0.9560521530320768, "test/sim_max_reward_4400045": 0.4484151550111841, "test/sim_max_reward_4400046": 0.4465036540148962, "test/sim_max_reward_4400047": 0.9927606933270651, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.9662616677606165, "train/mean_score": 0.6009673506380656, "test/mean_score": 0.5533439477157353, "val_loss": 68243.3203125} {"train_loss": -6.712345123291016, "global_step": 136542, "epoch": 3251} {"train_loss": -6.6354546546936035, "global_step": 136543, "epoch": 3251} {"train_loss": -6.694827556610107, "global_step": 136544, "epoch": 3251} {"train_loss": -6.623661518096924, "global_step": 136545, "epoch": 3251} {"train_loss": -6.633625030517578, "global_step": 136546, "epoch": 3251} {"train_loss": -6.755064964294434, "global_step": 136547, "epoch": 3251} {"train_loss": -6.734846591949463, "global_step": 136548, "epoch": 3251} {"train_loss": -6.7957024574279785, "global_step": 136549, "epoch": 3251} {"train_loss": -6.737188339233398, "global_step": 136550, "epoch": 3251} {"train_loss": -6.739581108093262, "global_step": 136551, "epoch": 3251} {"train_loss": -6.76773738861084, "global_step": 136552, "epoch": 3251} {"train_loss": -6.669429779052734, "global_step": 136553, "epoch": 3251} {"train_loss": -6.823795318603516, "global_step": 136554, "epoch": 3251} {"train_loss": -6.8199052810668945, "global_step": 136555, "epoch": 3251} {"train_loss": -6.697601318359375, "global_step": 136556, "epoch": 3251} {"train_loss": -6.649406909942627, "global_step": 136557, "epoch": 3251} {"train_loss": -6.825038909912109, "global_step": 136558, "epoch": 3251} {"train_loss": -6.58902645111084, "global_step": 136559, "epoch": 3251} {"train_loss": -6.644941806793213, "global_step": 136560, "epoch": 3251} {"train_loss": -6.740994930267334, "global_step": 136561, "epoch": 3251} {"train_loss": -6.771537780761719, "global_step": 136562, "epoch": 3251} {"train_loss": -6.7012410163879395, "global_step": 136563, "epoch": 3251} {"train_loss": -6.661017417907715, "global_step": 136564, "epoch": 3251} {"train_loss": -6.794454574584961, "global_step": 136565, "epoch": 3251} {"train_loss": -6.789612293243408, "global_step": 136566, "epoch": 3251} {"train_loss": -6.699713230133057, "global_step": 136567, "epoch": 3251} {"train_loss": -6.753094673156738, "global_step": 136568, "epoch": 3251} {"train_loss": -6.791712284088135, "global_step": 136569, "epoch": 3251} {"train_loss": -6.6801629066467285, "global_step": 136570, "epoch": 3251} {"train_loss": -6.774453639984131, "global_step": 136571, "epoch": 3251} {"train_loss": -6.617282867431641, "global_step": 136572, "epoch": 3251} {"train_loss": -6.6997904777526855, "global_step": 136573, "epoch": 3251} {"train_loss": -6.830967903137207, "global_step": 136574, "epoch": 3251} {"train_loss": -6.729803085327148, "global_step": 136575, "epoch": 3251} {"train_loss": -6.692551612854004, "global_step": 136576, "epoch": 3251} {"train_loss": -6.646924018859863, "global_step": 136577, "epoch": 3251} {"train_loss": -6.696068286895752, "global_step": 136578, "epoch": 3251} {"train_loss": -6.796909809112549, "global_step": 136579, "epoch": 3251} {"train_loss": -6.604785442352295, "global_step": 136580, "epoch": 3251} {"train_loss": -6.597412109375, "global_step": 136581, "epoch": 3251} {"train_loss": -6.753081798553467, "global_step": 136582, "epoch": 3251} {"train_loss": -6.713641632170904, "global_step": 136583, "epoch": 3251, "val_loss": 68340.3359375} {"train_loss": -6.713518142700195, "global_step": 136584, "epoch": 3252} {"train_loss": -6.66948127746582, "global_step": 136585, "epoch": 3252} {"train_loss": -6.698545455932617, "global_step": 136586, "epoch": 3252} {"train_loss": -6.836981296539307, "global_step": 136587, "epoch": 3252} {"train_loss": -6.654967308044434, "global_step": 136588, "epoch": 3252} {"train_loss": -6.654460430145264, "global_step": 136589, "epoch": 3252} {"train_loss": -6.678729057312012, "global_step": 136590, "epoch": 3252} {"train_loss": -6.717058181762695, "global_step": 136591, "epoch": 3252} {"train_loss": -6.645936965942383, "global_step": 136592, "epoch": 3252} {"train_loss": -6.684720516204834, "global_step": 136593, "epoch": 3252} {"train_loss": -6.753567218780518, "global_step": 136594, "epoch": 3252} {"train_loss": -6.602599620819092, "global_step": 136595, "epoch": 3252} {"train_loss": -6.6770172119140625, "global_step": 136596, "epoch": 3252} {"train_loss": -6.758586883544922, "global_step": 136597, "epoch": 3252} {"train_loss": -6.710295677185059, "global_step": 136598, "epoch": 3252} {"train_loss": -6.633813858032227, "global_step": 136599, "epoch": 3252} {"train_loss": -6.610256195068359, "global_step": 136600, "epoch": 3252} {"train_loss": -6.661311149597168, "global_step": 136601, "epoch": 3252} {"train_loss": -6.716089248657227, "global_step": 136602, "epoch": 3252} {"train_loss": -6.78615665435791, "global_step": 136603, "epoch": 3252} {"train_loss": -6.6909027099609375, "global_step": 136604, "epoch": 3252} {"train_loss": -6.709359169006348, "global_step": 136605, "epoch": 3252} {"train_loss": -6.654366493225098, "global_step": 136606, "epoch": 3252} {"train_loss": -6.662788391113281, "global_step": 136607, "epoch": 3252} {"train_loss": -6.668737411499023, "global_step": 136608, "epoch": 3252} {"train_loss": -6.7326860427856445, "global_step": 136609, "epoch": 3252} {"train_loss": -6.656938552856445, "global_step": 136610, "epoch": 3252} {"train_loss": -6.767153739929199, "global_step": 136611, "epoch": 3252} {"train_loss": -6.635103225708008, "global_step": 136612, "epoch": 3252} {"train_loss": -6.747436046600342, "global_step": 136613, "epoch": 3252} {"train_loss": -6.7591681480407715, "global_step": 136614, "epoch": 3252} {"train_loss": -6.477736473083496, "global_step": 136615, "epoch": 3252} {"train_loss": -6.656404972076416, "global_step": 136616, "epoch": 3252} {"train_loss": -6.673859596252441, "global_step": 136617, "epoch": 3252} {"train_loss": -6.666424751281738, "global_step": 136618, "epoch": 3252} {"train_loss": -6.723186492919922, "global_step": 136619, "epoch": 3252} {"train_loss": -6.688539505004883, "global_step": 136620, "epoch": 3252} {"train_loss": -6.582951545715332, "global_step": 136621, "epoch": 3252} {"train_loss": -6.65755033493042, "global_step": 136622, "epoch": 3252} {"train_loss": -6.560720920562744, "global_step": 136623, "epoch": 3252} {"train_loss": -6.683473587036133, "global_step": 136624, "epoch": 3252} {"train_loss": -6.683735609054565, "global_step": 136625, "epoch": 3252, "val_loss": 68541.390625} {"train_loss": -6.705491065979004, "global_step": 136626, "epoch": 3253} {"train_loss": -6.782227516174316, "global_step": 136627, "epoch": 3253} {"train_loss": -6.761404991149902, "global_step": 136628, "epoch": 3253} {"train_loss": -6.684932708740234, "global_step": 136629, "epoch": 3253} {"train_loss": -6.686860084533691, "global_step": 136630, "epoch": 3253} {"train_loss": -6.75834846496582, "global_step": 136631, "epoch": 3253} {"train_loss": -6.733583450317383, "global_step": 136632, "epoch": 3253} {"train_loss": -6.682636260986328, "global_step": 136633, "epoch": 3253} {"train_loss": -6.65467643737793, "global_step": 136634, "epoch": 3253} {"train_loss": -6.649029731750488, "global_step": 136635, "epoch": 3253} {"train_loss": -6.794816970825195, "global_step": 136636, "epoch": 3253} {"train_loss": -6.6351776123046875, "global_step": 136637, "epoch": 3253} {"train_loss": -6.734547138214111, "global_step": 136638, "epoch": 3253} {"train_loss": -6.6884074211120605, "global_step": 136639, "epoch": 3253} {"train_loss": -6.676996231079102, "global_step": 136640, "epoch": 3253} {"train_loss": -6.713078498840332, "global_step": 136641, "epoch": 3253} {"train_loss": -6.667610168457031, "global_step": 136642, "epoch": 3253} {"train_loss": -6.695127964019775, "global_step": 136643, "epoch": 3253} {"train_loss": -6.691956520080566, "global_step": 136644, "epoch": 3253} {"train_loss": -6.650719165802002, "global_step": 136645, "epoch": 3253} {"train_loss": -6.658540725708008, "global_step": 136646, "epoch": 3253} {"train_loss": -6.732235908508301, "global_step": 136647, "epoch": 3253} {"train_loss": -6.650686264038086, "global_step": 136648, "epoch": 3253} {"train_loss": -6.814580917358398, "global_step": 136649, "epoch": 3253} {"train_loss": -6.674490928649902, "global_step": 136650, "epoch": 3253} {"train_loss": -6.6608781814575195, "global_step": 136651, "epoch": 3253} {"train_loss": -6.702328681945801, "global_step": 136652, "epoch": 3253} {"train_loss": -6.659846782684326, "global_step": 136653, "epoch": 3253} {"train_loss": -6.658913612365723, "global_step": 136654, "epoch": 3253} {"train_loss": -6.799102783203125, "global_step": 136655, "epoch": 3253} {"train_loss": -6.614825248718262, "global_step": 136656, "epoch": 3253} {"train_loss": -6.604388236999512, "global_step": 136657, "epoch": 3253} {"train_loss": -6.695523738861084, "global_step": 136658, "epoch": 3253} {"train_loss": -6.641350746154785, "global_step": 136659, "epoch": 3253} {"train_loss": -6.545050621032715, "global_step": 136660, "epoch": 3253} {"train_loss": -6.592180252075195, "global_step": 136661, "epoch": 3253} {"train_loss": -6.496566295623779, "global_step": 136662, "epoch": 3253} {"train_loss": -6.568187713623047, "global_step": 136663, "epoch": 3253} {"train_loss": -6.678206920623779, "global_step": 136664, "epoch": 3253} {"train_loss": -6.727529525756836, "global_step": 136665, "epoch": 3253} {"train_loss": -6.626926898956299, "global_step": 136666, "epoch": 3253} {"train_loss": -6.67947869073777, "global_step": 136667, "epoch": 3253, "val_loss": 68192.1953125} {"train_loss": -6.617864608764648, "global_step": 136668, "epoch": 3254} {"train_loss": -6.621969223022461, "global_step": 136669, "epoch": 3254} {"train_loss": -6.603832244873047, "global_step": 136670, "epoch": 3254} {"train_loss": -6.56715202331543, "global_step": 136671, "epoch": 3254} {"train_loss": -6.745292663574219, "global_step": 136672, "epoch": 3254} {"train_loss": -6.677107810974121, "global_step": 136673, "epoch": 3254} {"train_loss": -6.6153883934021, "global_step": 136674, "epoch": 3254} {"train_loss": -6.68589448928833, "global_step": 136675, "epoch": 3254} {"train_loss": -6.625511169433594, "global_step": 136676, "epoch": 3254} {"train_loss": -6.574895858764648, "global_step": 136677, "epoch": 3254} {"train_loss": -6.551377773284912, "global_step": 136678, "epoch": 3254} {"train_loss": -6.730113983154297, "global_step": 136679, "epoch": 3254} {"train_loss": -6.7119140625, "global_step": 136680, "epoch": 3254} {"train_loss": -6.603790283203125, "global_step": 136681, "epoch": 3254} {"train_loss": -6.717658519744873, "global_step": 136682, "epoch": 3254} {"train_loss": -6.647743225097656, "global_step": 136683, "epoch": 3254} {"train_loss": -6.783378601074219, "global_step": 136684, "epoch": 3254} {"train_loss": -6.667129993438721, "global_step": 136685, "epoch": 3254} {"train_loss": -6.737142086029053, "global_step": 136686, "epoch": 3254} {"train_loss": -6.756208419799805, "global_step": 136687, "epoch": 3254} {"train_loss": -6.737121105194092, "global_step": 136688, "epoch": 3254} {"train_loss": -6.729568958282471, "global_step": 136689, "epoch": 3254} {"train_loss": -6.701416015625, "global_step": 136690, "epoch": 3254} {"train_loss": -6.636995315551758, "global_step": 136691, "epoch": 3254} {"train_loss": -6.751791000366211, "global_step": 136692, "epoch": 3254} {"train_loss": -6.744528770446777, "global_step": 136693, "epoch": 3254} {"train_loss": -6.670666217803955, "global_step": 136694, "epoch": 3254} {"train_loss": -6.743915557861328, "global_step": 136695, "epoch": 3254} {"train_loss": -6.601617813110352, "global_step": 136696, "epoch": 3254} {"train_loss": -6.561798572540283, "global_step": 136697, "epoch": 3254} {"train_loss": -6.529420852661133, "global_step": 136698, "epoch": 3254} {"train_loss": -6.652402877807617, "global_step": 136699, "epoch": 3254} {"train_loss": -6.618488788604736, "global_step": 136700, "epoch": 3254} {"train_loss": -6.613905429840088, "global_step": 136701, "epoch": 3254} {"train_loss": -6.647039890289307, "global_step": 136702, "epoch": 3254} {"train_loss": -6.597685813903809, "global_step": 136703, "epoch": 3254} {"train_loss": -6.552367210388184, "global_step": 136704, "epoch": 3254} {"train_loss": -6.585649490356445, "global_step": 136705, "epoch": 3254} {"train_loss": -6.6032891273498535, "global_step": 136706, "epoch": 3254} {"train_loss": -6.690577030181885, "global_step": 136707, "epoch": 3254} {"train_loss": -6.581352233886719, "global_step": 136708, "epoch": 3254} {"train_loss": -6.654554344358898, "global_step": 136709, "epoch": 3254, "val_loss": 68270.5625} {"train_loss": -6.664939880371094, "global_step": 136710, "epoch": 3255} {"train_loss": -6.645979404449463, "global_step": 136711, "epoch": 3255} {"train_loss": -6.691854000091553, "global_step": 136712, "epoch": 3255} {"train_loss": -6.5624237060546875, "global_step": 136713, "epoch": 3255} {"train_loss": -6.635563850402832, "global_step": 136714, "epoch": 3255} {"train_loss": -6.6017961502075195, "global_step": 136715, "epoch": 3255} {"train_loss": -6.725474834442139, "global_step": 136716, "epoch": 3255} {"train_loss": -6.615348815917969, "global_step": 136717, "epoch": 3255} {"train_loss": -6.653101444244385, "global_step": 136718, "epoch": 3255} {"train_loss": -6.685136318206787, "global_step": 136719, "epoch": 3255} {"train_loss": -6.673733711242676, "global_step": 136720, "epoch": 3255} {"train_loss": -6.631498336791992, "global_step": 136721, "epoch": 3255} {"train_loss": -6.638174057006836, "global_step": 136722, "epoch": 3255} {"train_loss": -6.624898433685303, "global_step": 136723, "epoch": 3255} {"train_loss": -6.673490047454834, "global_step": 136724, "epoch": 3255} {"train_loss": -6.662485599517822, "global_step": 136725, "epoch": 3255} {"train_loss": -6.705572605133057, "global_step": 136726, "epoch": 3255} {"train_loss": -6.690967082977295, "global_step": 136727, "epoch": 3255} {"train_loss": -6.700498580932617, "global_step": 136728, "epoch": 3255} {"train_loss": -6.709303855895996, "global_step": 136729, "epoch": 3255} {"train_loss": -6.7464494705200195, "global_step": 136730, "epoch": 3255} {"train_loss": -6.712799072265625, "global_step": 136731, "epoch": 3255} {"train_loss": -6.720761299133301, "global_step": 136732, "epoch": 3255} {"train_loss": -6.626886367797852, "global_step": 136733, "epoch": 3255} {"train_loss": -6.6841630935668945, "global_step": 136734, "epoch": 3255} {"train_loss": -6.736169338226318, "global_step": 136735, "epoch": 3255} {"train_loss": -6.691523551940918, "global_step": 136736, "epoch": 3255} {"train_loss": -6.746578216552734, "global_step": 136737, "epoch": 3255} {"train_loss": -6.685430526733398, "global_step": 136738, "epoch": 3255} {"train_loss": -6.611142158508301, "global_step": 136739, "epoch": 3255} {"train_loss": -6.745689392089844, "global_step": 136740, "epoch": 3255} {"train_loss": -6.725556373596191, "global_step": 136741, "epoch": 3255} {"train_loss": -6.711591720581055, "global_step": 136742, "epoch": 3255} {"train_loss": -6.827202796936035, "global_step": 136743, "epoch": 3255} {"train_loss": -6.666203498840332, "global_step": 136744, "epoch": 3255} {"train_loss": -6.68816614151001, "global_step": 136745, "epoch": 3255} {"train_loss": -6.68263053894043, "global_step": 136746, "epoch": 3255} {"train_loss": -6.706602096557617, "global_step": 136747, "epoch": 3255} {"train_loss": -6.719541549682617, "global_step": 136748, "epoch": 3255} {"train_loss": -6.7799811363220215, "global_step": 136749, "epoch": 3255} {"train_loss": -6.686315536499023, "global_step": 136750, "epoch": 3255} {"train_loss": -6.687728030341012, "global_step": 136751, "epoch": 3255, "val_loss": 68284.8515625} {"train_loss": -6.707309722900391, "global_step": 136752, "epoch": 3256} {"train_loss": -6.756572723388672, "global_step": 136753, "epoch": 3256} {"train_loss": -6.792940139770508, "global_step": 136754, "epoch": 3256} {"train_loss": -6.723428726196289, "global_step": 136755, "epoch": 3256} {"train_loss": -6.800644874572754, "global_step": 136756, "epoch": 3256} {"train_loss": -6.713269233703613, "global_step": 136757, "epoch": 3256} {"train_loss": -6.809972286224365, "global_step": 136758, "epoch": 3256} {"train_loss": -6.75332498550415, "global_step": 136759, "epoch": 3256} {"train_loss": -6.847467422485352, "global_step": 136760, "epoch": 3256} {"train_loss": -6.687953472137451, "global_step": 136761, "epoch": 3256} {"train_loss": -6.758928298950195, "global_step": 136762, "epoch": 3256} {"train_loss": -6.7746124267578125, "global_step": 136763, "epoch": 3256} {"train_loss": -6.745676040649414, "global_step": 136764, "epoch": 3256} {"train_loss": -6.777500152587891, "global_step": 136765, "epoch": 3256} {"train_loss": -6.746686935424805, "global_step": 136766, "epoch": 3256} {"train_loss": -6.750665664672852, "global_step": 136767, "epoch": 3256} {"train_loss": -6.7154011726379395, "global_step": 136768, "epoch": 3256} {"train_loss": -6.821950912475586, "global_step": 136769, "epoch": 3256} {"train_loss": -6.726763725280762, "global_step": 136770, "epoch": 3256} {"train_loss": -6.687819957733154, "global_step": 136771, "epoch": 3256} {"train_loss": -6.850172996520996, "global_step": 136772, "epoch": 3256} {"train_loss": -6.760048866271973, "global_step": 136773, "epoch": 3256} {"train_loss": -6.719344615936279, "global_step": 136774, "epoch": 3256} {"train_loss": -6.80922794342041, "global_step": 136775, "epoch": 3256} {"train_loss": -6.641980171203613, "global_step": 136776, "epoch": 3256} {"train_loss": -6.707205295562744, "global_step": 136777, "epoch": 3256} {"train_loss": -6.691198825836182, "global_step": 136778, "epoch": 3256} {"train_loss": -6.688995838165283, "global_step": 136779, "epoch": 3256} {"train_loss": -6.710779190063477, "global_step": 136780, "epoch": 3256} {"train_loss": -6.797152519226074, "global_step": 136781, "epoch": 3256} {"train_loss": -6.702202796936035, "global_step": 136782, "epoch": 3256} {"train_loss": -6.653098106384277, "global_step": 136783, "epoch": 3256} {"train_loss": -6.6342997550964355, "global_step": 136784, "epoch": 3256} {"train_loss": -6.709268569946289, "global_step": 136785, "epoch": 3256} {"train_loss": -6.8983917236328125, "global_step": 136786, "epoch": 3256} {"train_loss": -6.715404987335205, "global_step": 136787, "epoch": 3256} {"train_loss": -6.681676864624023, "global_step": 136788, "epoch": 3256} {"train_loss": -6.699220657348633, "global_step": 136789, "epoch": 3256} {"train_loss": -6.650218963623047, "global_step": 136790, "epoch": 3256} {"train_loss": -6.813876152038574, "global_step": 136791, "epoch": 3256} {"train_loss": -6.701021194458008, "global_step": 136792, "epoch": 3256} {"train_loss": -6.739483152117048, "global_step": 136793, "epoch": 3256, "val_loss": 68451.390625} {"train_loss": -6.611590385437012, "global_step": 136794, "epoch": 3257} {"train_loss": -6.640700340270996, "global_step": 136795, "epoch": 3257} {"train_loss": -6.769686698913574, "global_step": 136796, "epoch": 3257} {"train_loss": -6.60672664642334, "global_step": 136797, "epoch": 3257} {"train_loss": -6.620884418487549, "global_step": 136798, "epoch": 3257} {"train_loss": -6.708540916442871, "global_step": 136799, "epoch": 3257} {"train_loss": -6.61995267868042, "global_step": 136800, "epoch": 3257} {"train_loss": -6.4681396484375, "global_step": 136801, "epoch": 3257} {"train_loss": -6.6875810623168945, "global_step": 136802, "epoch": 3257} {"train_loss": -6.583536624908447, "global_step": 136803, "epoch": 3257} {"train_loss": -6.655405044555664, "global_step": 136804, "epoch": 3257} {"train_loss": -6.761283874511719, "global_step": 136805, "epoch": 3257} {"train_loss": -6.6397247314453125, "global_step": 136806, "epoch": 3257} {"train_loss": -6.659605026245117, "global_step": 136807, "epoch": 3257} {"train_loss": -6.640835762023926, "global_step": 136808, "epoch": 3257} {"train_loss": -6.749945163726807, "global_step": 136809, "epoch": 3257} {"train_loss": -6.713126182556152, "global_step": 136810, "epoch": 3257} {"train_loss": -6.659335613250732, "global_step": 136811, "epoch": 3257} {"train_loss": -6.789417266845703, "global_step": 136812, "epoch": 3257} {"train_loss": -6.752298355102539, "global_step": 136813, "epoch": 3257} {"train_loss": -6.702047348022461, "global_step": 136814, "epoch": 3257} {"train_loss": -6.772861003875732, "global_step": 136815, "epoch": 3257} {"train_loss": -6.622681617736816, "global_step": 136816, "epoch": 3257} {"train_loss": -6.739432334899902, "global_step": 136817, "epoch": 3257} {"train_loss": -6.64577579498291, "global_step": 136818, "epoch": 3257} {"train_loss": -6.648378849029541, "global_step": 136819, "epoch": 3257} {"train_loss": -6.695283889770508, "global_step": 136820, "epoch": 3257} {"train_loss": -6.761297702789307, "global_step": 136821, "epoch": 3257} {"train_loss": -6.650974273681641, "global_step": 136822, "epoch": 3257} {"train_loss": -6.683770179748535, "global_step": 136823, "epoch": 3257} {"train_loss": -6.766730785369873, "global_step": 136824, "epoch": 3257} {"train_loss": -6.614865779876709, "global_step": 136825, "epoch": 3257} {"train_loss": -6.633833885192871, "global_step": 136826, "epoch": 3257} {"train_loss": -6.831592559814453, "global_step": 136827, "epoch": 3257} {"train_loss": -6.7004899978637695, "global_step": 136828, "epoch": 3257} {"train_loss": -6.670106887817383, "global_step": 136829, "epoch": 3257} {"train_loss": -6.679246425628662, "global_step": 136830, "epoch": 3257} {"train_loss": -6.608569145202637, "global_step": 136831, "epoch": 3257} {"train_loss": -6.710965156555176, "global_step": 136832, "epoch": 3257} {"train_loss": -6.750310897827148, "global_step": 136833, "epoch": 3257} {"train_loss": -6.695634841918945, "global_step": 136834, "epoch": 3257} {"train_loss": -6.681740079607282, "global_step": 136835, "epoch": 3257, "val_loss": 68445.734375} {"train_loss": -6.660906791687012, "global_step": 136836, "epoch": 3258} {"train_loss": -6.7838134765625, "global_step": 136837, "epoch": 3258} {"train_loss": -6.627665996551514, "global_step": 136838, "epoch": 3258} {"train_loss": -6.668463706970215, "global_step": 136839, "epoch": 3258} {"train_loss": -6.71490478515625, "global_step": 136840, "epoch": 3258} {"train_loss": -6.7099504470825195, "global_step": 136841, "epoch": 3258} {"train_loss": -6.641719818115234, "global_step": 136842, "epoch": 3258} {"train_loss": -6.768612861633301, "global_step": 136843, "epoch": 3258} {"train_loss": -6.667394161224365, "global_step": 136844, "epoch": 3258} {"train_loss": -6.678707122802734, "global_step": 136845, "epoch": 3258} {"train_loss": -6.7804388999938965, "global_step": 136846, "epoch": 3258} {"train_loss": -6.605949878692627, "global_step": 136847, "epoch": 3258} {"train_loss": -6.683163642883301, "global_step": 136848, "epoch": 3258} {"train_loss": -6.5698981285095215, "global_step": 136849, "epoch": 3258} {"train_loss": -6.698300838470459, "global_step": 136850, "epoch": 3258} {"train_loss": -6.651028156280518, "global_step": 136851, "epoch": 3258} {"train_loss": -6.68480110168457, "global_step": 136852, "epoch": 3258} {"train_loss": -6.687154769897461, "global_step": 136853, "epoch": 3258} {"train_loss": -6.68418550491333, "global_step": 136854, "epoch": 3258} {"train_loss": -6.63358211517334, "global_step": 136855, "epoch": 3258} {"train_loss": -6.594086647033691, "global_step": 136856, "epoch": 3258} {"train_loss": -6.685939311981201, "global_step": 136857, "epoch": 3258} {"train_loss": -6.7801713943481445, "global_step": 136858, "epoch": 3258} {"train_loss": -6.566360950469971, "global_step": 136859, "epoch": 3258} {"train_loss": -6.662829399108887, "global_step": 136860, "epoch": 3258} {"train_loss": -6.644706726074219, "global_step": 136861, "epoch": 3258} {"train_loss": -6.604279518127441, "global_step": 136862, "epoch": 3258} {"train_loss": -6.603637218475342, "global_step": 136863, "epoch": 3258} {"train_loss": -6.685749530792236, "global_step": 136864, "epoch": 3258} {"train_loss": -6.72867488861084, "global_step": 136865, "epoch": 3258} {"train_loss": -6.70613956451416, "global_step": 136866, "epoch": 3258} {"train_loss": -6.667080879211426, "global_step": 136867, "epoch": 3258} {"train_loss": -6.734333038330078, "global_step": 136868, "epoch": 3258} {"train_loss": -6.699563980102539, "global_step": 136869, "epoch": 3258} {"train_loss": -6.658134460449219, "global_step": 136870, "epoch": 3258} {"train_loss": -6.604784965515137, "global_step": 136871, "epoch": 3258} {"train_loss": -6.676873207092285, "global_step": 136872, "epoch": 3258} {"train_loss": -6.699995994567871, "global_step": 136873, "epoch": 3258} {"train_loss": -6.788738250732422, "global_step": 136874, "epoch": 3258} {"train_loss": -6.70068883895874, "global_step": 136875, "epoch": 3258} {"train_loss": -6.630932807922363, "global_step": 136876, "epoch": 3258} {"train_loss": -6.678425709406535, "global_step": 136877, "epoch": 3258, "val_loss": 68182.5546875} {"train_loss": -6.701333999633789, "global_step": 136878, "epoch": 3259} {"train_loss": -6.7278313636779785, "global_step": 136879, "epoch": 3259} {"train_loss": -6.803670883178711, "global_step": 136880, "epoch": 3259} {"train_loss": -6.725896835327148, "global_step": 136881, "epoch": 3259} {"train_loss": -6.6717424392700195, "global_step": 136882, "epoch": 3259} {"train_loss": -6.765403747558594, "global_step": 136883, "epoch": 3259} {"train_loss": -6.802550315856934, "global_step": 136884, "epoch": 3259} {"train_loss": -6.693097114562988, "global_step": 136885, "epoch": 3259} {"train_loss": -6.701585292816162, "global_step": 136886, "epoch": 3259} {"train_loss": -6.782468795776367, "global_step": 136887, "epoch": 3259} {"train_loss": -6.683965682983398, "global_step": 136888, "epoch": 3259} {"train_loss": -6.731708526611328, "global_step": 136889, "epoch": 3259} {"train_loss": -6.778806686401367, "global_step": 136890, "epoch": 3259} {"train_loss": -6.719226837158203, "global_step": 136891, "epoch": 3259} {"train_loss": -6.814128398895264, "global_step": 136892, "epoch": 3259} {"train_loss": -6.77310037612915, "global_step": 136893, "epoch": 3259} {"train_loss": -6.843626976013184, "global_step": 136894, "epoch": 3259} {"train_loss": -6.766043663024902, "global_step": 136895, "epoch": 3259} {"train_loss": -6.63682746887207, "global_step": 136896, "epoch": 3259} {"train_loss": -6.692841529846191, "global_step": 136897, "epoch": 3259} {"train_loss": -6.661045074462891, "global_step": 136898, "epoch": 3259} {"train_loss": -6.689210891723633, "global_step": 136899, "epoch": 3259} {"train_loss": -6.705510139465332, "global_step": 136900, "epoch": 3259} {"train_loss": -6.674818992614746, "global_step": 136901, "epoch": 3259} {"train_loss": -6.6362738609313965, "global_step": 136902, "epoch": 3259} {"train_loss": -6.748372554779053, "global_step": 136903, "epoch": 3259} {"train_loss": -6.7153706550598145, "global_step": 136904, "epoch": 3259} {"train_loss": -6.638008117675781, "global_step": 136905, "epoch": 3259} {"train_loss": -6.7487616539001465, "global_step": 136906, "epoch": 3259} {"train_loss": -6.795012950897217, "global_step": 136907, "epoch": 3259} {"train_loss": -6.714694976806641, "global_step": 136908, "epoch": 3259} {"train_loss": -6.676322937011719, "global_step": 136909, "epoch": 3259} {"train_loss": -6.7716522216796875, "global_step": 136910, "epoch": 3259} {"train_loss": -6.567236423492432, "global_step": 136911, "epoch": 3259} {"train_loss": -6.763023853302002, "global_step": 136912, "epoch": 3259} {"train_loss": -6.782999515533447, "global_step": 136913, "epoch": 3259} {"train_loss": -6.642483711242676, "global_step": 136914, "epoch": 3259} {"train_loss": -6.657641410827637, "global_step": 136915, "epoch": 3259} {"train_loss": -6.651274681091309, "global_step": 136916, "epoch": 3259} {"train_loss": -6.734360218048096, "global_step": 136917, "epoch": 3259} {"train_loss": -6.864006996154785, "global_step": 136918, "epoch": 3259} {"train_loss": -6.721232641310919, "global_step": 136919, "epoch": 3259, "val_loss": 68119.625} {"train_loss": -6.813778877258301, "global_step": 136920, "epoch": 3260} {"train_loss": -6.822397232055664, "global_step": 136921, "epoch": 3260} {"train_loss": -6.851140022277832, "global_step": 136922, "epoch": 3260} {"train_loss": -6.780759811401367, "global_step": 136923, "epoch": 3260} {"train_loss": -6.731951713562012, "global_step": 136924, "epoch": 3260} {"train_loss": -6.708784103393555, "global_step": 136925, "epoch": 3260} {"train_loss": -6.756038665771484, "global_step": 136926, "epoch": 3260} {"train_loss": -6.828821182250977, "global_step": 136927, "epoch": 3260} {"train_loss": -6.6258440017700195, "global_step": 136928, "epoch": 3260} {"train_loss": -6.716896057128906, "global_step": 136929, "epoch": 3260} {"train_loss": -6.75632381439209, "global_step": 136930, "epoch": 3260} {"train_loss": -6.75306510925293, "global_step": 136931, "epoch": 3260} {"train_loss": -6.6954851150512695, "global_step": 136932, "epoch": 3260} {"train_loss": -6.765433311462402, "global_step": 136933, "epoch": 3260} {"train_loss": -6.772335052490234, "global_step": 136934, "epoch": 3260} {"train_loss": -6.658165454864502, "global_step": 136935, "epoch": 3260} {"train_loss": -6.791759967803955, "global_step": 136936, "epoch": 3260} {"train_loss": -6.770449161529541, "global_step": 136937, "epoch": 3260} {"train_loss": -6.715287208557129, "global_step": 136938, "epoch": 3260} {"train_loss": -6.744093418121338, "global_step": 136939, "epoch": 3260} {"train_loss": -6.706480026245117, "global_step": 136940, "epoch": 3260} {"train_loss": -6.577411651611328, "global_step": 136941, "epoch": 3260} {"train_loss": -6.653365135192871, "global_step": 136942, "epoch": 3260} {"train_loss": -6.677386283874512, "global_step": 136943, "epoch": 3260} {"train_loss": -6.622052192687988, "global_step": 136944, "epoch": 3260} {"train_loss": -6.595576286315918, "global_step": 136945, "epoch": 3260} {"train_loss": -6.589995384216309, "global_step": 136946, "epoch": 3260} {"train_loss": -6.6931962966918945, "global_step": 136947, "epoch": 3260} {"train_loss": -6.611112594604492, "global_step": 136948, "epoch": 3260} {"train_loss": -6.696413040161133, "global_step": 136949, "epoch": 3260} {"train_loss": -6.681185245513916, "global_step": 136950, "epoch": 3260} {"train_loss": -6.730836868286133, "global_step": 136951, "epoch": 3260} {"train_loss": -6.625896453857422, "global_step": 136952, "epoch": 3260} {"train_loss": -6.593412399291992, "global_step": 136953, "epoch": 3260} {"train_loss": -6.6945319175720215, "global_step": 136954, "epoch": 3260} {"train_loss": -6.778232574462891, "global_step": 136955, "epoch": 3260} {"train_loss": -6.607178688049316, "global_step": 136956, "epoch": 3260} {"train_loss": -6.714852809906006, "global_step": 136957, "epoch": 3260} {"train_loss": -6.60009765625, "global_step": 136958, "epoch": 3260} {"train_loss": -6.728255271911621, "global_step": 136959, "epoch": 3260} {"train_loss": -6.777677536010742, "global_step": 136960, "epoch": 3260} {"train_loss": -6.7075060322171165, "global_step": 136961, "epoch": 3260, "val_loss": 68281.3125} {"train_loss": -6.779473304748535, "global_step": 136962, "epoch": 3261} {"train_loss": -6.648440837860107, "global_step": 136963, "epoch": 3261} {"train_loss": -6.742697715759277, "global_step": 136964, "epoch": 3261} {"train_loss": -6.695093631744385, "global_step": 136965, "epoch": 3261} {"train_loss": -6.684591770172119, "global_step": 136966, "epoch": 3261} {"train_loss": -6.617212295532227, "global_step": 136967, "epoch": 3261} {"train_loss": -6.708743572235107, "global_step": 136968, "epoch": 3261} {"train_loss": -6.626163482666016, "global_step": 136969, "epoch": 3261} {"train_loss": -6.714942932128906, "global_step": 136970, "epoch": 3261} {"train_loss": -6.763143539428711, "global_step": 136971, "epoch": 3261} {"train_loss": -6.828167915344238, "global_step": 136972, "epoch": 3261} {"train_loss": -6.661838531494141, "global_step": 136973, "epoch": 3261} {"train_loss": -6.775035858154297, "global_step": 136974, "epoch": 3261} {"train_loss": -6.767496585845947, "global_step": 136975, "epoch": 3261} {"train_loss": -6.689054012298584, "global_step": 136976, "epoch": 3261} {"train_loss": -6.752110004425049, "global_step": 136977, "epoch": 3261} {"train_loss": -6.797558784484863, "global_step": 136978, "epoch": 3261} {"train_loss": -6.808534622192383, "global_step": 136979, "epoch": 3261} {"train_loss": -6.6183180809021, "global_step": 136980, "epoch": 3261} {"train_loss": -6.687640190124512, "global_step": 136981, "epoch": 3261} {"train_loss": -6.709628582000732, "global_step": 136982, "epoch": 3261} {"train_loss": -6.754602909088135, "global_step": 136983, "epoch": 3261} {"train_loss": -6.711679458618164, "global_step": 136984, "epoch": 3261} {"train_loss": -6.731640815734863, "global_step": 136985, "epoch": 3261} {"train_loss": -6.769092559814453, "global_step": 136986, "epoch": 3261} {"train_loss": -6.71751594543457, "global_step": 136987, "epoch": 3261} {"train_loss": -6.736703872680664, "global_step": 136988, "epoch": 3261} {"train_loss": -6.606889724731445, "global_step": 136989, "epoch": 3261} {"train_loss": -6.622262477874756, "global_step": 136990, "epoch": 3261} {"train_loss": -6.743814468383789, "global_step": 136991, "epoch": 3261} {"train_loss": -6.793938636779785, "global_step": 136992, "epoch": 3261} {"train_loss": -6.608362197875977, "global_step": 136993, "epoch": 3261} {"train_loss": -6.679953575134277, "global_step": 136994, "epoch": 3261} {"train_loss": -6.731346130371094, "global_step": 136995, "epoch": 3261} {"train_loss": -6.681501388549805, "global_step": 136996, "epoch": 3261} {"train_loss": -6.666938781738281, "global_step": 136997, "epoch": 3261} {"train_loss": -6.7989959716796875, "global_step": 136998, "epoch": 3261} {"train_loss": -6.711861610412598, "global_step": 136999, "epoch": 3261} {"train_loss": -6.637440204620361, "global_step": 137000, "epoch": 3261} {"train_loss": -6.670895099639893, "global_step": 137001, "epoch": 3261} {"train_loss": -6.782422065734863, "global_step": 137002, "epoch": 3261} {"train_loss": -6.714286304655529, "global_step": 137003, "epoch": 3261, "val_loss": 68273.1484375} {"train_loss": -6.660667419433594, "global_step": 137004, "epoch": 3262} {"train_loss": -6.749633312225342, "global_step": 137005, "epoch": 3262} {"train_loss": -6.767481803894043, "global_step": 137006, "epoch": 3262} {"train_loss": -6.772706985473633, "global_step": 137007, "epoch": 3262} {"train_loss": -6.6754279136657715, "global_step": 137008, "epoch": 3262} {"train_loss": -6.749248504638672, "global_step": 137009, "epoch": 3262} {"train_loss": -6.674138069152832, "global_step": 137010, "epoch": 3262} {"train_loss": -6.786169052124023, "global_step": 137011, "epoch": 3262} {"train_loss": -6.680815696716309, "global_step": 137012, "epoch": 3262} {"train_loss": -6.772558212280273, "global_step": 137013, "epoch": 3262} {"train_loss": -6.75596809387207, "global_step": 137014, "epoch": 3262} {"train_loss": -6.714198112487793, "global_step": 137015, "epoch": 3262} {"train_loss": -6.622167110443115, "global_step": 137016, "epoch": 3262} {"train_loss": -6.710887908935547, "global_step": 137017, "epoch": 3262} {"train_loss": -6.670869827270508, "global_step": 137018, "epoch": 3262} {"train_loss": -6.607378005981445, "global_step": 137019, "epoch": 3262} {"train_loss": -6.627688884735107, "global_step": 137020, "epoch": 3262} {"train_loss": -6.699700355529785, "global_step": 137021, "epoch": 3262} {"train_loss": -6.678399085998535, "global_step": 137022, "epoch": 3262} {"train_loss": -6.684773921966553, "global_step": 137023, "epoch": 3262} {"train_loss": -6.630544662475586, "global_step": 137024, "epoch": 3262} {"train_loss": -6.62941837310791, "global_step": 137025, "epoch": 3262} {"train_loss": -6.652682304382324, "global_step": 137026, "epoch": 3262} {"train_loss": -6.657461166381836, "global_step": 137027, "epoch": 3262} {"train_loss": -6.737507343292236, "global_step": 137028, "epoch": 3262} {"train_loss": -6.663253307342529, "global_step": 137029, "epoch": 3262} {"train_loss": -6.663992881774902, "global_step": 137030, "epoch": 3262} {"train_loss": -6.611100196838379, "global_step": 137031, "epoch": 3262} {"train_loss": -6.733838081359863, "global_step": 137032, "epoch": 3262} {"train_loss": -6.673056602478027, "global_step": 137033, "epoch": 3262} {"train_loss": -6.620421886444092, "global_step": 137034, "epoch": 3262} {"train_loss": -6.7319817543029785, "global_step": 137035, "epoch": 3262} {"train_loss": -6.609472751617432, "global_step": 137036, "epoch": 3262} {"train_loss": -6.7491774559021, "global_step": 137037, "epoch": 3262} {"train_loss": -6.676522731781006, "global_step": 137038, "epoch": 3262} {"train_loss": -6.568943500518799, "global_step": 137039, "epoch": 3262} {"train_loss": -6.7701568603515625, "global_step": 137040, "epoch": 3262} {"train_loss": -6.679452896118164, "global_step": 137041, "epoch": 3262} {"train_loss": -6.765554428100586, "global_step": 137042, "epoch": 3262} {"train_loss": -6.636468887329102, "global_step": 137043, "epoch": 3262} {"train_loss": -6.629892349243164, "global_step": 137044, "epoch": 3262} {"train_loss": -6.686447756631034, "global_step": 137045, "epoch": 3262, "val_loss": 68298.4140625} {"train_loss": -6.589847564697266, "global_step": 137046, "epoch": 3263} {"train_loss": -6.7470703125, "global_step": 137047, "epoch": 3263} {"train_loss": -6.609961986541748, "global_step": 137048, "epoch": 3263} {"train_loss": -6.692920207977295, "global_step": 137049, "epoch": 3263} {"train_loss": -6.706607818603516, "global_step": 137050, "epoch": 3263} {"train_loss": -6.60788631439209, "global_step": 137051, "epoch": 3263} {"train_loss": -6.723523139953613, "global_step": 137052, "epoch": 3263} {"train_loss": -6.615849494934082, "global_step": 137053, "epoch": 3263} {"train_loss": -6.779708385467529, "global_step": 137054, "epoch": 3263} {"train_loss": -6.795185089111328, "global_step": 137055, "epoch": 3263} {"train_loss": -6.617198944091797, "global_step": 137056, "epoch": 3263} {"train_loss": -6.7115631103515625, "global_step": 137057, "epoch": 3263} {"train_loss": -6.691660404205322, "global_step": 137058, "epoch": 3263} {"train_loss": -6.741914749145508, "global_step": 137059, "epoch": 3263} {"train_loss": -6.707174777984619, "global_step": 137060, "epoch": 3263} {"train_loss": -6.665657997131348, "global_step": 137061, "epoch": 3263} {"train_loss": -6.7305803298950195, "global_step": 137062, "epoch": 3263} {"train_loss": -6.800564765930176, "global_step": 137063, "epoch": 3263} {"train_loss": -6.7523298263549805, "global_step": 137064, "epoch": 3263} {"train_loss": -6.6836748123168945, "global_step": 137065, "epoch": 3263} {"train_loss": -6.712265968322754, "global_step": 137066, "epoch": 3263} {"train_loss": -6.596022605895996, "global_step": 137067, "epoch": 3263} {"train_loss": -6.715511798858643, "global_step": 137068, "epoch": 3263} {"train_loss": -6.62699556350708, "global_step": 137069, "epoch": 3263} {"train_loss": -6.6342644691467285, "global_step": 137070, "epoch": 3263} {"train_loss": -6.86478328704834, "global_step": 137071, "epoch": 3263} {"train_loss": -6.725728511810303, "global_step": 137072, "epoch": 3263} {"train_loss": -6.660141468048096, "global_step": 137073, "epoch": 3263} {"train_loss": -6.6001129150390625, "global_step": 137074, "epoch": 3263} {"train_loss": -6.706722259521484, "global_step": 137075, "epoch": 3263} {"train_loss": -6.617990493774414, "global_step": 137076, "epoch": 3263} {"train_loss": -6.763439178466797, "global_step": 137077, "epoch": 3263} {"train_loss": -6.657762050628662, "global_step": 137078, "epoch": 3263} {"train_loss": -6.683874130249023, "global_step": 137079, "epoch": 3263} {"train_loss": -6.689723968505859, "global_step": 137080, "epoch": 3263} {"train_loss": -6.660292625427246, "global_step": 137081, "epoch": 3263} {"train_loss": -6.705435752868652, "global_step": 137082, "epoch": 3263} {"train_loss": -6.694602012634277, "global_step": 137083, "epoch": 3263} {"train_loss": -6.783456802368164, "global_step": 137084, "epoch": 3263} {"train_loss": -6.5864787101745605, "global_step": 137085, "epoch": 3263} {"train_loss": -6.816160202026367, "global_step": 137086, "epoch": 3263} {"train_loss": -6.6970331101190474, "global_step": 137087, "epoch": 3263, "val_loss": 68192.1328125} {"train_loss": -6.8586835861206055, "global_step": 137088, "epoch": 3264} {"train_loss": -6.787689208984375, "global_step": 137089, "epoch": 3264} {"train_loss": -6.7263102531433105, "global_step": 137090, "epoch": 3264} {"train_loss": -6.710875511169434, "global_step": 137091, "epoch": 3264} {"train_loss": -6.747990608215332, "global_step": 137092, "epoch": 3264} {"train_loss": -6.637345314025879, "global_step": 137093, "epoch": 3264} {"train_loss": -6.90410041809082, "global_step": 137094, "epoch": 3264} {"train_loss": -6.764247417449951, "global_step": 137095, "epoch": 3264} {"train_loss": -6.689242362976074, "global_step": 137096, "epoch": 3264} {"train_loss": -6.665271759033203, "global_step": 137097, "epoch": 3264} {"train_loss": -6.772004127502441, "global_step": 137098, "epoch": 3264} {"train_loss": -6.688920974731445, "global_step": 137099, "epoch": 3264} {"train_loss": -6.706350326538086, "global_step": 137100, "epoch": 3264} {"train_loss": -6.8256025314331055, "global_step": 137101, "epoch": 3264} {"train_loss": -6.625565528869629, "global_step": 137102, "epoch": 3264} {"train_loss": -6.605782985687256, "global_step": 137103, "epoch": 3264} {"train_loss": -6.740915298461914, "global_step": 137104, "epoch": 3264} {"train_loss": -6.7426910400390625, "global_step": 137105, "epoch": 3264} {"train_loss": -6.636314868927002, "global_step": 137106, "epoch": 3264} {"train_loss": -6.779629707336426, "global_step": 137107, "epoch": 3264} {"train_loss": -6.63408899307251, "global_step": 137108, "epoch": 3264} {"train_loss": -6.676187515258789, "global_step": 137109, "epoch": 3264} {"train_loss": -6.671281337738037, "global_step": 137110, "epoch": 3264} {"train_loss": -6.697985649108887, "global_step": 137111, "epoch": 3264} {"train_loss": -6.713420391082764, "global_step": 137112, "epoch": 3264} {"train_loss": -6.5865583419799805, "global_step": 137113, "epoch": 3264} {"train_loss": -6.533349990844727, "global_step": 137114, "epoch": 3264} {"train_loss": -6.595423698425293, "global_step": 137115, "epoch": 3264} {"train_loss": -6.664772033691406, "global_step": 137116, "epoch": 3264} {"train_loss": -6.618852615356445, "global_step": 137117, "epoch": 3264} {"train_loss": -6.571254253387451, "global_step": 137118, "epoch": 3264} {"train_loss": -6.707286834716797, "global_step": 137119, "epoch": 3264} {"train_loss": -6.594560623168945, "global_step": 137120, "epoch": 3264} {"train_loss": -6.558542251586914, "global_step": 137121, "epoch": 3264} {"train_loss": -6.6070756912231445, "global_step": 137122, "epoch": 3264} {"train_loss": -6.647424221038818, "global_step": 137123, "epoch": 3264} {"train_loss": -6.711848258972168, "global_step": 137124, "epoch": 3264} {"train_loss": -6.678936004638672, "global_step": 137125, "epoch": 3264} {"train_loss": -6.63734769821167, "global_step": 137126, "epoch": 3264} {"train_loss": -6.692220687866211, "global_step": 137127, "epoch": 3264} {"train_loss": -6.702458381652832, "global_step": 137128, "epoch": 3264} {"train_loss": -6.686163152967181, "global_step": 137129, "epoch": 3264, "val_loss": 68253.9609375} {"train_loss": -6.669706344604492, "global_step": 137130, "epoch": 3265} {"train_loss": -6.6984100341796875, "global_step": 137131, "epoch": 3265} {"train_loss": -6.618117332458496, "global_step": 137132, "epoch": 3265} {"train_loss": -6.765813827514648, "global_step": 137133, "epoch": 3265} {"train_loss": -6.793831825256348, "global_step": 137134, "epoch": 3265} {"train_loss": -6.748729705810547, "global_step": 137135, "epoch": 3265} {"train_loss": -6.672697067260742, "global_step": 137136, "epoch": 3265} {"train_loss": -6.735371112823486, "global_step": 137137, "epoch": 3265} {"train_loss": -6.7780375480651855, "global_step": 137138, "epoch": 3265} {"train_loss": -6.730167388916016, "global_step": 137139, "epoch": 3265} {"train_loss": -6.716643333435059, "global_step": 137140, "epoch": 3265} {"train_loss": -6.764764785766602, "global_step": 137141, "epoch": 3265} {"train_loss": -6.6931352615356445, "global_step": 137142, "epoch": 3265} {"train_loss": -6.784419059753418, "global_step": 137143, "epoch": 3265} {"train_loss": -6.773345470428467, "global_step": 137144, "epoch": 3265} {"train_loss": -6.719266891479492, "global_step": 137145, "epoch": 3265} {"train_loss": -6.641472339630127, "global_step": 137146, "epoch": 3265} {"train_loss": -6.641225814819336, "global_step": 137147, "epoch": 3265} {"train_loss": -6.717249870300293, "global_step": 137148, "epoch": 3265} {"train_loss": -6.486814975738525, "global_step": 137149, "epoch": 3265} {"train_loss": -6.6630096435546875, "global_step": 137150, "epoch": 3265} {"train_loss": -6.6398234367370605, "global_step": 137151, "epoch": 3265} {"train_loss": -6.546239852905273, "global_step": 137152, "epoch": 3265} {"train_loss": -6.775175094604492, "global_step": 137153, "epoch": 3265} {"train_loss": -6.656808376312256, "global_step": 137154, "epoch": 3265} {"train_loss": -6.773425102233887, "global_step": 137155, "epoch": 3265} {"train_loss": -6.67213249206543, "global_step": 137156, "epoch": 3265} {"train_loss": -6.671303749084473, "global_step": 137157, "epoch": 3265} {"train_loss": -6.72955322265625, "global_step": 137158, "epoch": 3265} {"train_loss": -6.658985137939453, "global_step": 137159, "epoch": 3265} {"train_loss": -6.622837543487549, "global_step": 137160, "epoch": 3265} {"train_loss": -6.736556053161621, "global_step": 137161, "epoch": 3265} {"train_loss": -6.672738075256348, "global_step": 137162, "epoch": 3265} {"train_loss": -6.706801414489746, "global_step": 137163, "epoch": 3265} {"train_loss": -6.6204328536987305, "global_step": 137164, "epoch": 3265} {"train_loss": -6.680160999298096, "global_step": 137165, "epoch": 3265} {"train_loss": -6.799508094787598, "global_step": 137166, "epoch": 3265} {"train_loss": -6.633222579956055, "global_step": 137167, "epoch": 3265} {"train_loss": -6.856884479522705, "global_step": 137168, "epoch": 3265} {"train_loss": -6.571375846862793, "global_step": 137169, "epoch": 3265} {"train_loss": -6.636726379394531, "global_step": 137170, "epoch": 3265} {"train_loss": -6.696680659339542, "global_step": 137171, "epoch": 3265, "val_loss": 68398.9453125} {"train_loss": -6.61494779586792, "global_step": 137172, "epoch": 3266} {"train_loss": -6.560730934143066, "global_step": 137173, "epoch": 3266} {"train_loss": -6.629701614379883, "global_step": 137174, "epoch": 3266} {"train_loss": -6.727629661560059, "global_step": 137175, "epoch": 3266} {"train_loss": -6.709331512451172, "global_step": 137176, "epoch": 3266} {"train_loss": -6.629781723022461, "global_step": 137177, "epoch": 3266} {"train_loss": -6.641404151916504, "global_step": 137178, "epoch": 3266} {"train_loss": -6.654600620269775, "global_step": 137179, "epoch": 3266} {"train_loss": -6.6135077476501465, "global_step": 137180, "epoch": 3266} {"train_loss": -6.585784912109375, "global_step": 137181, "epoch": 3266} {"train_loss": -6.678966522216797, "global_step": 137182, "epoch": 3266} {"train_loss": -6.49708366394043, "global_step": 137183, "epoch": 3266} {"train_loss": -6.494167327880859, "global_step": 137184, "epoch": 3266} {"train_loss": -6.659202575683594, "global_step": 137185, "epoch": 3266} {"train_loss": -6.601524829864502, "global_step": 137186, "epoch": 3266} {"train_loss": -6.564539909362793, "global_step": 137187, "epoch": 3266} {"train_loss": -6.727415561676025, "global_step": 137188, "epoch": 3266} {"train_loss": -6.721445083618164, "global_step": 137189, "epoch": 3266} {"train_loss": -6.791252613067627, "global_step": 137190, "epoch": 3266} {"train_loss": -6.633859157562256, "global_step": 137191, "epoch": 3266} {"train_loss": -6.700071811676025, "global_step": 137192, "epoch": 3266} {"train_loss": -6.576658248901367, "global_step": 137193, "epoch": 3266} {"train_loss": -6.609203338623047, "global_step": 137194, "epoch": 3266} {"train_loss": -6.663539886474609, "global_step": 137195, "epoch": 3266} {"train_loss": -6.517674446105957, "global_step": 137196, "epoch": 3266} {"train_loss": -6.737302303314209, "global_step": 137197, "epoch": 3266} {"train_loss": -6.534302234649658, "global_step": 137198, "epoch": 3266} {"train_loss": -6.559035301208496, "global_step": 137199, "epoch": 3266} {"train_loss": -6.553439140319824, "global_step": 137200, "epoch": 3266} {"train_loss": -6.559530258178711, "global_step": 137201, "epoch": 3266} {"train_loss": -6.495998382568359, "global_step": 137202, "epoch": 3266} {"train_loss": -6.642852306365967, "global_step": 137203, "epoch": 3266} {"train_loss": -6.538416862487793, "global_step": 137204, "epoch": 3266} {"train_loss": -6.715841293334961, "global_step": 137205, "epoch": 3266} {"train_loss": -6.646151542663574, "global_step": 137206, "epoch": 3266} {"train_loss": -6.629591941833496, "global_step": 137207, "epoch": 3266} {"train_loss": -6.714384078979492, "global_step": 137208, "epoch": 3266} {"train_loss": -6.676797866821289, "global_step": 137209, "epoch": 3266} {"train_loss": -6.7123494148254395, "global_step": 137210, "epoch": 3266} {"train_loss": -6.765605926513672, "global_step": 137211, "epoch": 3266} {"train_loss": -6.562701225280762, "global_step": 137212, "epoch": 3266} {"train_loss": -6.631600118818737, "global_step": 137213, "epoch": 3266, "val_loss": 68519.3125} {"train_loss": -6.666082859039307, "global_step": 137214, "epoch": 3267} {"train_loss": -6.692817687988281, "global_step": 137215, "epoch": 3267} {"train_loss": -6.731422424316406, "global_step": 137216, "epoch": 3267} {"train_loss": -6.614250183105469, "global_step": 137217, "epoch": 3267} {"train_loss": -6.631683349609375, "global_step": 137218, "epoch": 3267} {"train_loss": -6.719564914703369, "global_step": 137219, "epoch": 3267} {"train_loss": -6.713647365570068, "global_step": 137220, "epoch": 3267} {"train_loss": -6.68141508102417, "global_step": 137221, "epoch": 3267} {"train_loss": -6.734031677246094, "global_step": 137222, "epoch": 3267} {"train_loss": -6.667433738708496, "global_step": 137223, "epoch": 3267} {"train_loss": -6.684928894042969, "global_step": 137224, "epoch": 3267} {"train_loss": -6.764464855194092, "global_step": 137225, "epoch": 3267} {"train_loss": -6.750783920288086, "global_step": 137226, "epoch": 3267} {"train_loss": -6.595999717712402, "global_step": 137227, "epoch": 3267} {"train_loss": -6.752783298492432, "global_step": 137228, "epoch": 3267} {"train_loss": -6.635161399841309, "global_step": 137229, "epoch": 3267} {"train_loss": -6.670095443725586, "global_step": 137230, "epoch": 3267} {"train_loss": -6.775373458862305, "global_step": 137231, "epoch": 3267} {"train_loss": -6.751547813415527, "global_step": 137232, "epoch": 3267} {"train_loss": -6.813494682312012, "global_step": 137233, "epoch": 3267} {"train_loss": -6.667679309844971, "global_step": 137234, "epoch": 3267} {"train_loss": -6.593686103820801, "global_step": 137235, "epoch": 3267} {"train_loss": -6.729013442993164, "global_step": 137236, "epoch": 3267} {"train_loss": -6.749115943908691, "global_step": 137237, "epoch": 3267} {"train_loss": -6.7388715744018555, "global_step": 137238, "epoch": 3267} {"train_loss": -6.768033027648926, "global_step": 137239, "epoch": 3267} {"train_loss": -6.736725807189941, "global_step": 137240, "epoch": 3267} {"train_loss": -6.8017425537109375, "global_step": 137241, "epoch": 3267} {"train_loss": -6.777744293212891, "global_step": 137242, "epoch": 3267} {"train_loss": -6.6565680503845215, "global_step": 137243, "epoch": 3267} {"train_loss": -6.722430229187012, "global_step": 137244, "epoch": 3267} {"train_loss": -6.672883033752441, "global_step": 137245, "epoch": 3267} {"train_loss": -6.70991849899292, "global_step": 137246, "epoch": 3267} {"train_loss": -6.699148178100586, "global_step": 137247, "epoch": 3267} {"train_loss": -6.6230597496032715, "global_step": 137248, "epoch": 3267} {"train_loss": -6.536085605621338, "global_step": 137249, "epoch": 3267} {"train_loss": -6.7752838134765625, "global_step": 137250, "epoch": 3267} {"train_loss": -6.612510681152344, "global_step": 137251, "epoch": 3267} {"train_loss": -6.5919647216796875, "global_step": 137252, "epoch": 3267} {"train_loss": -6.750369071960449, "global_step": 137253, "epoch": 3267} {"train_loss": -6.576041221618652, "global_step": 137254, "epoch": 3267} {"train_loss": -6.693677277792068, "global_step": 137255, "epoch": 3267, "val_loss": 68459.9921875} {"train_loss": -6.605471134185791, "global_step": 137256, "epoch": 3268} {"train_loss": -6.5474934577941895, "global_step": 137257, "epoch": 3268} {"train_loss": -6.694138526916504, "global_step": 137258, "epoch": 3268} {"train_loss": -6.5446248054504395, "global_step": 137259, "epoch": 3268} {"train_loss": -6.498392105102539, "global_step": 137260, "epoch": 3268} {"train_loss": -6.515251159667969, "global_step": 137261, "epoch": 3268} {"train_loss": -6.513369083404541, "global_step": 137262, "epoch": 3268} {"train_loss": -6.627078056335449, "global_step": 137263, "epoch": 3268} {"train_loss": -6.616733551025391, "global_step": 137264, "epoch": 3268} {"train_loss": -6.592004299163818, "global_step": 137265, "epoch": 3268} {"train_loss": -6.656715393066406, "global_step": 137266, "epoch": 3268} {"train_loss": -6.591296195983887, "global_step": 137267, "epoch": 3268} {"train_loss": -6.656554698944092, "global_step": 137268, "epoch": 3268} {"train_loss": -6.635364055633545, "global_step": 137269, "epoch": 3268} {"train_loss": -6.7488017082214355, "global_step": 137270, "epoch": 3268} {"train_loss": -6.693777084350586, "global_step": 137271, "epoch": 3268} {"train_loss": -6.772487640380859, "global_step": 137272, "epoch": 3268} {"train_loss": -6.673237323760986, "global_step": 137273, "epoch": 3268} {"train_loss": -6.577634334564209, "global_step": 137274, "epoch": 3268} {"train_loss": -6.813800811767578, "global_step": 137275, "epoch": 3268} {"train_loss": -6.558537483215332, "global_step": 137276, "epoch": 3268} {"train_loss": -6.622071266174316, "global_step": 137277, "epoch": 3268} {"train_loss": -6.752781867980957, "global_step": 137278, "epoch": 3268} {"train_loss": -6.660272598266602, "global_step": 137279, "epoch": 3268} {"train_loss": -6.713364601135254, "global_step": 137280, "epoch": 3268} {"train_loss": -6.718262672424316, "global_step": 137281, "epoch": 3268} {"train_loss": -6.753046989440918, "global_step": 137282, "epoch": 3268} {"train_loss": -6.705717086791992, "global_step": 137283, "epoch": 3268} {"train_loss": -6.72385835647583, "global_step": 137284, "epoch": 3268} {"train_loss": -6.554465293884277, "global_step": 137285, "epoch": 3268} {"train_loss": -6.753769874572754, "global_step": 137286, "epoch": 3268} {"train_loss": -6.611187934875488, "global_step": 137287, "epoch": 3268} {"train_loss": -6.6688032150268555, "global_step": 137288, "epoch": 3268} {"train_loss": -6.6532368659973145, "global_step": 137289, "epoch": 3268} {"train_loss": -6.6733503341674805, "global_step": 137290, "epoch": 3268} {"train_loss": -6.6172261238098145, "global_step": 137291, "epoch": 3268} {"train_loss": -6.7293853759765625, "global_step": 137292, "epoch": 3268} {"train_loss": -6.720884323120117, "global_step": 137293, "epoch": 3268} {"train_loss": -6.715200901031494, "global_step": 137294, "epoch": 3268} {"train_loss": -6.670136451721191, "global_step": 137295, "epoch": 3268} {"train_loss": -6.70758056640625, "global_step": 137296, "epoch": 3268} {"train_loss": -6.657985562369937, "global_step": 137297, "epoch": 3268, "val_loss": 68638.6171875} {"train_loss": -6.6355791091918945, "global_step": 137298, "epoch": 3269} {"train_loss": -6.506854057312012, "global_step": 137299, "epoch": 3269} {"train_loss": -6.7031474113464355, "global_step": 137300, "epoch": 3269} {"train_loss": -6.712190628051758, "global_step": 137301, "epoch": 3269} {"train_loss": -6.712522029876709, "global_step": 137302, "epoch": 3269} {"train_loss": -6.636643886566162, "global_step": 137303, "epoch": 3269} {"train_loss": -6.649120330810547, "global_step": 137304, "epoch": 3269} {"train_loss": -6.67119026184082, "global_step": 137305, "epoch": 3269} {"train_loss": -6.767867565155029, "global_step": 137306, "epoch": 3269} {"train_loss": -6.734920978546143, "global_step": 137307, "epoch": 3269} {"train_loss": -6.619619369506836, "global_step": 137308, "epoch": 3269} {"train_loss": -6.625415325164795, "global_step": 137309, "epoch": 3269} {"train_loss": -6.741456508636475, "global_step": 137310, "epoch": 3269} {"train_loss": -6.609270095825195, "global_step": 137311, "epoch": 3269} {"train_loss": -6.692117214202881, "global_step": 137312, "epoch": 3269} {"train_loss": -6.56346321105957, "global_step": 137313, "epoch": 3269} {"train_loss": -6.666085720062256, "global_step": 137314, "epoch": 3269} {"train_loss": -6.705538749694824, "global_step": 137315, "epoch": 3269} {"train_loss": -6.739212512969971, "global_step": 137316, "epoch": 3269} {"train_loss": -6.63987922668457, "global_step": 137317, "epoch": 3269} {"train_loss": -6.535545825958252, "global_step": 137318, "epoch": 3269} {"train_loss": -6.679344177246094, "global_step": 137319, "epoch": 3269} {"train_loss": -6.645284652709961, "global_step": 137320, "epoch": 3269} {"train_loss": -6.761416435241699, "global_step": 137321, "epoch": 3269} {"train_loss": -6.616691589355469, "global_step": 137322, "epoch": 3269} {"train_loss": -6.644715785980225, "global_step": 137323, "epoch": 3269} {"train_loss": -6.679558277130127, "global_step": 137324, "epoch": 3269} {"train_loss": -6.529061794281006, "global_step": 137325, "epoch": 3269} {"train_loss": -6.59152889251709, "global_step": 137326, "epoch": 3269} {"train_loss": -6.78908634185791, "global_step": 137327, "epoch": 3269} {"train_loss": -6.735886096954346, "global_step": 137328, "epoch": 3269} {"train_loss": -6.792353630065918, "global_step": 137329, "epoch": 3269} {"train_loss": -6.595909118652344, "global_step": 137330, "epoch": 3269} {"train_loss": -6.690443515777588, "global_step": 137331, "epoch": 3269} {"train_loss": -6.655097007751465, "global_step": 137332, "epoch": 3269} {"train_loss": -6.705537796020508, "global_step": 137333, "epoch": 3269} {"train_loss": -6.606664180755615, "global_step": 137334, "epoch": 3269} {"train_loss": -6.625861167907715, "global_step": 137335, "epoch": 3269} {"train_loss": -6.679043292999268, "global_step": 137336, "epoch": 3269} {"train_loss": -6.712231636047363, "global_step": 137337, "epoch": 3269} {"train_loss": -6.694518566131592, "global_step": 137338, "epoch": 3269} {"train_loss": -6.667338757287888, "global_step": 137339, "epoch": 3269, "val_loss": 68413.6875} {"train_loss": -6.599484920501709, "global_step": 137340, "epoch": 3270} {"train_loss": -6.566618919372559, "global_step": 137341, "epoch": 3270} {"train_loss": -6.690607070922852, "global_step": 137342, "epoch": 3270} {"train_loss": -6.787389755249023, "global_step": 137343, "epoch": 3270} {"train_loss": -6.77894926071167, "global_step": 137344, "epoch": 3270} {"train_loss": -6.5601606369018555, "global_step": 137345, "epoch": 3270} {"train_loss": -6.654728889465332, "global_step": 137346, "epoch": 3270} {"train_loss": -6.651266098022461, "global_step": 137347, "epoch": 3270} {"train_loss": -6.679416179656982, "global_step": 137348, "epoch": 3270} {"train_loss": -6.762189865112305, "global_step": 137349, "epoch": 3270} {"train_loss": -6.675854682922363, "global_step": 137350, "epoch": 3270} {"train_loss": -6.640711784362793, "global_step": 137351, "epoch": 3270} {"train_loss": -6.595898151397705, "global_step": 137352, "epoch": 3270} {"train_loss": -6.621136665344238, "global_step": 137353, "epoch": 3270} {"train_loss": -6.524714469909668, "global_step": 137354, "epoch": 3270} {"train_loss": -6.655817031860352, "global_step": 137355, "epoch": 3270} {"train_loss": -6.70970344543457, "global_step": 137356, "epoch": 3270} {"train_loss": -6.651451110839844, "global_step": 137357, "epoch": 3270} {"train_loss": -6.646839618682861, "global_step": 137358, "epoch": 3270} {"train_loss": -6.679549217224121, "global_step": 137359, "epoch": 3270} {"train_loss": -6.652411460876465, "global_step": 137360, "epoch": 3270} {"train_loss": -6.705825328826904, "global_step": 137361, "epoch": 3270} {"train_loss": -6.682567596435547, "global_step": 137362, "epoch": 3270} {"train_loss": -6.749650001525879, "global_step": 137363, "epoch": 3270} {"train_loss": -6.575463771820068, "global_step": 137364, "epoch": 3270} {"train_loss": -6.7160186767578125, "global_step": 137365, "epoch": 3270} {"train_loss": -6.625688552856445, "global_step": 137366, "epoch": 3270} {"train_loss": -6.612253189086914, "global_step": 137367, "epoch": 3270} {"train_loss": -6.555340766906738, "global_step": 137368, "epoch": 3270} {"train_loss": -6.711369514465332, "global_step": 137369, "epoch": 3270} {"train_loss": -6.723468780517578, "global_step": 137370, "epoch": 3270} {"train_loss": -6.6602654457092285, "global_step": 137371, "epoch": 3270} {"train_loss": -6.6615214347839355, "global_step": 137372, "epoch": 3270} {"train_loss": -6.71631383895874, "global_step": 137373, "epoch": 3270} {"train_loss": -6.710542678833008, "global_step": 137374, "epoch": 3270} {"train_loss": -6.68994140625, "global_step": 137375, "epoch": 3270} {"train_loss": -6.787223815917969, "global_step": 137376, "epoch": 3270} {"train_loss": -6.632236480712891, "global_step": 137377, "epoch": 3270} {"train_loss": -6.787395477294922, "global_step": 137378, "epoch": 3270} {"train_loss": -6.751910209655762, "global_step": 137379, "epoch": 3270} {"train_loss": -6.7068190574646, "global_step": 137380, "epoch": 3270} {"train_loss": -6.673941476004464, "global_step": 137381, "epoch": 3270, "val_loss": 68254.0234375} {"train_loss": -6.680894374847412, "global_step": 137382, "epoch": 3271} {"train_loss": -6.694528579711914, "global_step": 137383, "epoch": 3271} {"train_loss": -6.722495079040527, "global_step": 137384, "epoch": 3271} {"train_loss": -6.7464141845703125, "global_step": 137385, "epoch": 3271} {"train_loss": -6.725890159606934, "global_step": 137386, "epoch": 3271} {"train_loss": -6.811261177062988, "global_step": 137387, "epoch": 3271} {"train_loss": -6.6995625495910645, "global_step": 137388, "epoch": 3271} {"train_loss": -6.721529483795166, "global_step": 137389, "epoch": 3271} {"train_loss": -6.754118919372559, "global_step": 137390, "epoch": 3271} {"train_loss": -6.740901947021484, "global_step": 137391, "epoch": 3271} {"train_loss": -6.671428680419922, "global_step": 137392, "epoch": 3271} {"train_loss": -6.820988655090332, "global_step": 137393, "epoch": 3271} {"train_loss": -6.804867267608643, "global_step": 137394, "epoch": 3271} {"train_loss": -6.691113471984863, "global_step": 137395, "epoch": 3271} {"train_loss": -6.735751628875732, "global_step": 137396, "epoch": 3271} {"train_loss": -6.6351094245910645, "global_step": 137397, "epoch": 3271} {"train_loss": -6.653831481933594, "global_step": 137398, "epoch": 3271} {"train_loss": -6.6233062744140625, "global_step": 137399, "epoch": 3271} {"train_loss": -6.698089599609375, "global_step": 137400, "epoch": 3271} {"train_loss": -6.659768104553223, "global_step": 137401, "epoch": 3271} {"train_loss": -6.652387619018555, "global_step": 137402, "epoch": 3271} {"train_loss": -6.6164116859436035, "global_step": 137403, "epoch": 3271} {"train_loss": -6.625566005706787, "global_step": 137404, "epoch": 3271} {"train_loss": -6.607405662536621, "global_step": 137405, "epoch": 3271} {"train_loss": -6.621697902679443, "global_step": 137406, "epoch": 3271} {"train_loss": -6.814009666442871, "global_step": 137407, "epoch": 3271} {"train_loss": -6.649389743804932, "global_step": 137408, "epoch": 3271} {"train_loss": -6.610015869140625, "global_step": 137409, "epoch": 3271} {"train_loss": -6.7220001220703125, "global_step": 137410, "epoch": 3271} {"train_loss": -6.566152572631836, "global_step": 137411, "epoch": 3271} {"train_loss": -6.672298431396484, "global_step": 137412, "epoch": 3271} {"train_loss": -6.605462074279785, "global_step": 137413, "epoch": 3271} {"train_loss": -6.605438709259033, "global_step": 137414, "epoch": 3271} {"train_loss": -6.669731140136719, "global_step": 137415, "epoch": 3271} {"train_loss": -6.624911308288574, "global_step": 137416, "epoch": 3271} {"train_loss": -6.740912914276123, "global_step": 137417, "epoch": 3271} {"train_loss": -6.577103614807129, "global_step": 137418, "epoch": 3271} {"train_loss": -6.590219497680664, "global_step": 137419, "epoch": 3271} {"train_loss": -6.703011512756348, "global_step": 137420, "epoch": 3271} {"train_loss": -6.636740207672119, "global_step": 137421, "epoch": 3271} {"train_loss": -6.776577949523926, "global_step": 137422, "epoch": 3271} {"train_loss": -6.682938848223005, "global_step": 137423, "epoch": 3271, "val_loss": 68245.484375} {"train_loss": -6.666675567626953, "global_step": 137424, "epoch": 3272} {"train_loss": -6.794015884399414, "global_step": 137425, "epoch": 3272} {"train_loss": -6.689056396484375, "global_step": 137426, "epoch": 3272} {"train_loss": -6.636891841888428, "global_step": 137427, "epoch": 3272} {"train_loss": -6.653801918029785, "global_step": 137428, "epoch": 3272} {"train_loss": -6.777327537536621, "global_step": 137429, "epoch": 3272} {"train_loss": -6.576747417449951, "global_step": 137430, "epoch": 3272} {"train_loss": -6.608860969543457, "global_step": 137431, "epoch": 3272} {"train_loss": -6.515716075897217, "global_step": 137432, "epoch": 3272} {"train_loss": -6.698134422302246, "global_step": 137433, "epoch": 3272} {"train_loss": -6.7848711013793945, "global_step": 137434, "epoch": 3272} {"train_loss": -6.643579959869385, "global_step": 137435, "epoch": 3272} {"train_loss": -6.798279762268066, "global_step": 137436, "epoch": 3272} {"train_loss": -6.6888203620910645, "global_step": 137437, "epoch": 3272} {"train_loss": -6.758292198181152, "global_step": 137438, "epoch": 3272} {"train_loss": -6.849152565002441, "global_step": 137439, "epoch": 3272} {"train_loss": -6.669344425201416, "global_step": 137440, "epoch": 3272} {"train_loss": -6.728219032287598, "global_step": 137441, "epoch": 3272} {"train_loss": -6.8138427734375, "global_step": 137442, "epoch": 3272} {"train_loss": -6.624222755432129, "global_step": 137443, "epoch": 3272} {"train_loss": -6.765429496765137, "global_step": 137444, "epoch": 3272} {"train_loss": -6.705011367797852, "global_step": 137445, "epoch": 3272} {"train_loss": -6.636192321777344, "global_step": 137446, "epoch": 3272} {"train_loss": -6.763829231262207, "global_step": 137447, "epoch": 3272} {"train_loss": -6.6582255363464355, "global_step": 137448, "epoch": 3272} {"train_loss": -6.741329193115234, "global_step": 137449, "epoch": 3272} {"train_loss": -6.798609733581543, "global_step": 137450, "epoch": 3272} {"train_loss": -6.6548380851745605, "global_step": 137451, "epoch": 3272} {"train_loss": -6.661479949951172, "global_step": 137452, "epoch": 3272} {"train_loss": -6.784017562866211, "global_step": 137453, "epoch": 3272} {"train_loss": -6.741399765014648, "global_step": 137454, "epoch": 3272} {"train_loss": -6.723446846008301, "global_step": 137455, "epoch": 3272} {"train_loss": -6.686138153076172, "global_step": 137456, "epoch": 3272} {"train_loss": -6.697423934936523, "global_step": 137457, "epoch": 3272} {"train_loss": -6.6829833984375, "global_step": 137458, "epoch": 3272} {"train_loss": -6.71715784072876, "global_step": 137459, "epoch": 3272} {"train_loss": -6.809096336364746, "global_step": 137460, "epoch": 3272} {"train_loss": -6.827040195465088, "global_step": 137461, "epoch": 3272} {"train_loss": -6.723141670227051, "global_step": 137462, "epoch": 3272} {"train_loss": -6.771216869354248, "global_step": 137463, "epoch": 3272} {"train_loss": -6.7159247398376465, "global_step": 137464, "epoch": 3272} {"train_loss": -6.716266813732329, "global_step": 137465, "epoch": 3272, "val_loss": 68274.75} {"train_loss": -6.736061096191406, "global_step": 137466, "epoch": 3273} {"train_loss": -6.796566963195801, "global_step": 137467, "epoch": 3273} {"train_loss": -6.652084827423096, "global_step": 137468, "epoch": 3273} {"train_loss": -6.808679580688477, "global_step": 137469, "epoch": 3273} {"train_loss": -6.817584991455078, "global_step": 137470, "epoch": 3273} {"train_loss": -6.685356140136719, "global_step": 137471, "epoch": 3273} {"train_loss": -6.778964042663574, "global_step": 137472, "epoch": 3273} {"train_loss": -6.794703483581543, "global_step": 137473, "epoch": 3273} {"train_loss": -6.7742390632629395, "global_step": 137474, "epoch": 3273} {"train_loss": -6.889153480529785, "global_step": 137475, "epoch": 3273} {"train_loss": -6.783225059509277, "global_step": 137476, "epoch": 3273} {"train_loss": -6.6521220207214355, "global_step": 137477, "epoch": 3273} {"train_loss": -6.759616374969482, "global_step": 137478, "epoch": 3273} {"train_loss": -6.677875518798828, "global_step": 137479, "epoch": 3273} {"train_loss": -6.725502014160156, "global_step": 137480, "epoch": 3273} {"train_loss": -6.61579704284668, "global_step": 137481, "epoch": 3273} {"train_loss": -6.75239896774292, "global_step": 137482, "epoch": 3273} {"train_loss": -6.761485576629639, "global_step": 137483, "epoch": 3273} {"train_loss": -6.801531791687012, "global_step": 137484, "epoch": 3273} {"train_loss": -6.744372844696045, "global_step": 137485, "epoch": 3273} {"train_loss": -6.7835187911987305, "global_step": 137486, "epoch": 3273} {"train_loss": -6.571034908294678, "global_step": 137487, "epoch": 3273} {"train_loss": -6.661311149597168, "global_step": 137488, "epoch": 3273} {"train_loss": -6.79172420501709, "global_step": 137489, "epoch": 3273} {"train_loss": -6.782759666442871, "global_step": 137490, "epoch": 3273} {"train_loss": -6.720335006713867, "global_step": 137491, "epoch": 3273} {"train_loss": -6.713694095611572, "global_step": 137492, "epoch": 3273} {"train_loss": -6.697233200073242, "global_step": 137493, "epoch": 3273} {"train_loss": -6.66996955871582, "global_step": 137494, "epoch": 3273} {"train_loss": -6.696335792541504, "global_step": 137495, "epoch": 3273} {"train_loss": -6.712832450866699, "global_step": 137496, "epoch": 3273} {"train_loss": -6.8065996170043945, "global_step": 137497, "epoch": 3273} {"train_loss": -6.65108585357666, "global_step": 137498, "epoch": 3273} {"train_loss": -6.694391250610352, "global_step": 137499, "epoch": 3273} {"train_loss": -6.672452926635742, "global_step": 137500, "epoch": 3273} {"train_loss": -6.6009907722473145, "global_step": 137501, "epoch": 3273} {"train_loss": -6.630537509918213, "global_step": 137502, "epoch": 3273} {"train_loss": -6.662140846252441, "global_step": 137503, "epoch": 3273} {"train_loss": -6.6271209716796875, "global_step": 137504, "epoch": 3273} {"train_loss": -6.564449787139893, "global_step": 137505, "epoch": 3273} {"train_loss": -6.660464763641357, "global_step": 137506, "epoch": 3273} {"train_loss": -6.714698916389828, "global_step": 137507, "epoch": 3273, "val_loss": 68407.328125} {"train_loss": -6.554841041564941, "global_step": 137508, "epoch": 3274} {"train_loss": -6.642396926879883, "global_step": 137509, "epoch": 3274} {"train_loss": -6.375584602355957, "global_step": 137510, "epoch": 3274} {"train_loss": -6.680080413818359, "global_step": 137511, "epoch": 3274} {"train_loss": -6.60325813293457, "global_step": 137512, "epoch": 3274} {"train_loss": -6.560159683227539, "global_step": 137513, "epoch": 3274} {"train_loss": -6.668473243713379, "global_step": 137514, "epoch": 3274} {"train_loss": -6.541170597076416, "global_step": 137515, "epoch": 3274} {"train_loss": -6.755983829498291, "global_step": 137516, "epoch": 3274} {"train_loss": -6.5495171546936035, "global_step": 137517, "epoch": 3274} {"train_loss": -6.6635026931762695, "global_step": 137518, "epoch": 3274} {"train_loss": -6.601310729980469, "global_step": 137519, "epoch": 3274} {"train_loss": -6.552156448364258, "global_step": 137520, "epoch": 3274} {"train_loss": -6.537441253662109, "global_step": 137521, "epoch": 3274} {"train_loss": -6.736978530883789, "global_step": 137522, "epoch": 3274} {"train_loss": -6.536359786987305, "global_step": 137523, "epoch": 3274} {"train_loss": -6.66090202331543, "global_step": 137524, "epoch": 3274} {"train_loss": -6.617057800292969, "global_step": 137525, "epoch": 3274} {"train_loss": -6.563327789306641, "global_step": 137526, "epoch": 3274} {"train_loss": -6.49686336517334, "global_step": 137527, "epoch": 3274} {"train_loss": -6.7824506759643555, "global_step": 137528, "epoch": 3274} {"train_loss": -6.723175525665283, "global_step": 137529, "epoch": 3274} {"train_loss": -6.777431488037109, "global_step": 137530, "epoch": 3274} {"train_loss": -6.849431037902832, "global_step": 137531, "epoch": 3274} {"train_loss": -6.558332443237305, "global_step": 137532, "epoch": 3274} {"train_loss": -6.661054611206055, "global_step": 137533, "epoch": 3274} {"train_loss": -6.717146396636963, "global_step": 137534, "epoch": 3274} {"train_loss": -6.686390399932861, "global_step": 137535, "epoch": 3274} {"train_loss": -6.783921241760254, "global_step": 137536, "epoch": 3274} {"train_loss": -6.521121025085449, "global_step": 137537, "epoch": 3274} {"train_loss": -6.696659088134766, "global_step": 137538, "epoch": 3274} {"train_loss": -6.636680603027344, "global_step": 137539, "epoch": 3274} {"train_loss": -6.760034561157227, "global_step": 137540, "epoch": 3274} {"train_loss": -6.68271541595459, "global_step": 137541, "epoch": 3274} {"train_loss": -6.739232063293457, "global_step": 137542, "epoch": 3274} {"train_loss": -6.675618648529053, "global_step": 137543, "epoch": 3274} {"train_loss": -6.641873836517334, "global_step": 137544, "epoch": 3274} {"train_loss": -6.800835132598877, "global_step": 137545, "epoch": 3274} {"train_loss": -6.678501605987549, "global_step": 137546, "epoch": 3274} {"train_loss": -6.755524635314941, "global_step": 137547, "epoch": 3274} {"train_loss": -6.793410301208496, "global_step": 137548, "epoch": 3274} {"train_loss": -6.656644378389631, "global_step": 137549, "epoch": 3274, "val_loss": 68214.03125} {"train_loss": -6.713884353637695, "global_step": 137550, "epoch": 3275} {"train_loss": -6.611774444580078, "global_step": 137551, "epoch": 3275} {"train_loss": -6.742563247680664, "global_step": 137552, "epoch": 3275} {"train_loss": -6.627830505371094, "global_step": 137553, "epoch": 3275} {"train_loss": -6.717666149139404, "global_step": 137554, "epoch": 3275} {"train_loss": -6.826658248901367, "global_step": 137555, "epoch": 3275} {"train_loss": -6.761940002441406, "global_step": 137556, "epoch": 3275} {"train_loss": -6.6522955894470215, "global_step": 137557, "epoch": 3275} {"train_loss": -6.447422981262207, "global_step": 137558, "epoch": 3275} {"train_loss": -6.677585601806641, "global_step": 137559, "epoch": 3275} {"train_loss": -6.678944110870361, "global_step": 137560, "epoch": 3275} {"train_loss": -6.663446426391602, "global_step": 137561, "epoch": 3275} {"train_loss": -6.644936561584473, "global_step": 137562, "epoch": 3275} {"train_loss": -6.689777374267578, "global_step": 137563, "epoch": 3275} {"train_loss": -6.5041584968566895, "global_step": 137564, "epoch": 3275} {"train_loss": -6.695335388183594, "global_step": 137565, "epoch": 3275} {"train_loss": -6.710381984710693, "global_step": 137566, "epoch": 3275} {"train_loss": -6.75279426574707, "global_step": 137567, "epoch": 3275} {"train_loss": -6.703529357910156, "global_step": 137568, "epoch": 3275} {"train_loss": -6.702049732208252, "global_step": 137569, "epoch": 3275} {"train_loss": -6.639245510101318, "global_step": 137570, "epoch": 3275} {"train_loss": -6.666194915771484, "global_step": 137571, "epoch": 3275} {"train_loss": -6.662872314453125, "global_step": 137572, "epoch": 3275} {"train_loss": -6.797560691833496, "global_step": 137573, "epoch": 3275} {"train_loss": -6.631977081298828, "global_step": 137574, "epoch": 3275} {"train_loss": -6.7896881103515625, "global_step": 137575, "epoch": 3275} {"train_loss": -6.635891914367676, "global_step": 137576, "epoch": 3275} {"train_loss": -6.616454601287842, "global_step": 137577, "epoch": 3275} {"train_loss": -6.642395496368408, "global_step": 137578, "epoch": 3275} {"train_loss": -6.654506683349609, "global_step": 137579, "epoch": 3275} {"train_loss": -6.767764091491699, "global_step": 137580, "epoch": 3275} {"train_loss": -6.67512845993042, "global_step": 137581, "epoch": 3275} {"train_loss": -6.538527965545654, "global_step": 137582, "epoch": 3275} {"train_loss": -6.655125141143799, "global_step": 137583, "epoch": 3275} {"train_loss": -6.6296796798706055, "global_step": 137584, "epoch": 3275} {"train_loss": -6.709063529968262, "global_step": 137585, "epoch": 3275} {"train_loss": -6.7272539138793945, "global_step": 137586, "epoch": 3275} {"train_loss": -6.70836877822876, "global_step": 137587, "epoch": 3275} {"train_loss": -6.769028663635254, "global_step": 137588, "epoch": 3275} {"train_loss": -6.749236106872559, "global_step": 137589, "epoch": 3275} {"train_loss": -6.857236862182617, "global_step": 137590, "epoch": 3275} {"train_loss": -6.685932477315267, "global_step": 137591, "epoch": 3275, "val_loss": 68157.578125} {"train_loss": -6.704953670501709, "global_step": 137592, "epoch": 3276} {"train_loss": -6.764521598815918, "global_step": 137593, "epoch": 3276} {"train_loss": -6.803110122680664, "global_step": 137594, "epoch": 3276} {"train_loss": -6.686906814575195, "global_step": 137595, "epoch": 3276} {"train_loss": -6.909519195556641, "global_step": 137596, "epoch": 3276} {"train_loss": -6.738197326660156, "global_step": 137597, "epoch": 3276} {"train_loss": -6.73468542098999, "global_step": 137598, "epoch": 3276} {"train_loss": -6.777443885803223, "global_step": 137599, "epoch": 3276} {"train_loss": -6.737458229064941, "global_step": 137600, "epoch": 3276} {"train_loss": -6.6947174072265625, "global_step": 137601, "epoch": 3276} {"train_loss": -6.784079074859619, "global_step": 137602, "epoch": 3276} {"train_loss": -6.752093315124512, "global_step": 137603, "epoch": 3276} {"train_loss": -6.77390193939209, "global_step": 137604, "epoch": 3276} {"train_loss": -6.723745822906494, "global_step": 137605, "epoch": 3276} {"train_loss": -6.729758262634277, "global_step": 137606, "epoch": 3276} {"train_loss": -6.72965145111084, "global_step": 137607, "epoch": 3276} {"train_loss": -6.773445129394531, "global_step": 137608, "epoch": 3276} {"train_loss": -6.679283142089844, "global_step": 137609, "epoch": 3276} {"train_loss": -6.627993106842041, "global_step": 137610, "epoch": 3276} {"train_loss": -6.786746025085449, "global_step": 137611, "epoch": 3276} {"train_loss": -6.700251579284668, "global_step": 137612, "epoch": 3276} {"train_loss": -6.562931060791016, "global_step": 137613, "epoch": 3276} {"train_loss": -6.780290603637695, "global_step": 137614, "epoch": 3276} {"train_loss": -6.680185317993164, "global_step": 137615, "epoch": 3276} {"train_loss": -6.76779842376709, "global_step": 137616, "epoch": 3276} {"train_loss": -6.742007255554199, "global_step": 137617, "epoch": 3276} {"train_loss": -6.76924467086792, "global_step": 137618, "epoch": 3276} {"train_loss": -6.736172676086426, "global_step": 137619, "epoch": 3276} {"train_loss": -6.608614921569824, "global_step": 137620, "epoch": 3276} {"train_loss": -6.639086723327637, "global_step": 137621, "epoch": 3276} {"train_loss": -6.731317520141602, "global_step": 137622, "epoch": 3276} {"train_loss": -6.812459945678711, "global_step": 137623, "epoch": 3276} {"train_loss": -6.648747444152832, "global_step": 137624, "epoch": 3276} {"train_loss": -6.694911003112793, "global_step": 137625, "epoch": 3276} {"train_loss": -6.69349479675293, "global_step": 137626, "epoch": 3276} {"train_loss": -6.770932197570801, "global_step": 137627, "epoch": 3276} {"train_loss": -6.7140302658081055, "global_step": 137628, "epoch": 3276} {"train_loss": -6.791807174682617, "global_step": 137629, "epoch": 3276} {"train_loss": -6.8499979972839355, "global_step": 137630, "epoch": 3276} {"train_loss": -6.675769805908203, "global_step": 137631, "epoch": 3276} {"train_loss": -6.629791736602783, "global_step": 137632, "epoch": 3276} {"train_loss": -6.7285877750033425, "global_step": 137633, "epoch": 3276, "val_loss": 68366.4921875} {"train_loss": -6.73430061340332, "global_step": 137634, "epoch": 3277} {"train_loss": -6.706153392791748, "global_step": 137635, "epoch": 3277} {"train_loss": -6.790524959564209, "global_step": 137636, "epoch": 3277} {"train_loss": -6.781244277954102, "global_step": 137637, "epoch": 3277} {"train_loss": -6.730515480041504, "global_step": 137638, "epoch": 3277} {"train_loss": -6.7542643547058105, "global_step": 137639, "epoch": 3277} {"train_loss": -6.768678188323975, "global_step": 137640, "epoch": 3277} {"train_loss": -6.670499801635742, "global_step": 137641, "epoch": 3277} {"train_loss": -6.687065601348877, "global_step": 137642, "epoch": 3277} {"train_loss": -6.794745445251465, "global_step": 137643, "epoch": 3277} {"train_loss": -6.713581085205078, "global_step": 137644, "epoch": 3277} {"train_loss": -6.69217586517334, "global_step": 137645, "epoch": 3277} {"train_loss": -6.8168721199035645, "global_step": 137646, "epoch": 3277} {"train_loss": -6.84042501449585, "global_step": 137647, "epoch": 3277} {"train_loss": -6.769129753112793, "global_step": 137648, "epoch": 3277} {"train_loss": -6.797608375549316, "global_step": 137649, "epoch": 3277} {"train_loss": -6.766453742980957, "global_step": 137650, "epoch": 3277} {"train_loss": -6.800344944000244, "global_step": 137651, "epoch": 3277} {"train_loss": -6.6567487716674805, "global_step": 137652, "epoch": 3277} {"train_loss": -6.703555583953857, "global_step": 137653, "epoch": 3277} {"train_loss": -6.720163345336914, "global_step": 137654, "epoch": 3277} {"train_loss": -6.795456409454346, "global_step": 137655, "epoch": 3277} {"train_loss": -6.634026050567627, "global_step": 137656, "epoch": 3277} {"train_loss": -6.8073625564575195, "global_step": 137657, "epoch": 3277} {"train_loss": -6.702281951904297, "global_step": 137658, "epoch": 3277} {"train_loss": -6.7901411056518555, "global_step": 137659, "epoch": 3277} {"train_loss": -6.790992736816406, "global_step": 137660, "epoch": 3277} {"train_loss": -6.6118483543396, "global_step": 137661, "epoch": 3277} {"train_loss": -6.790273666381836, "global_step": 137662, "epoch": 3277} {"train_loss": -6.780585289001465, "global_step": 137663, "epoch": 3277} {"train_loss": -6.667166709899902, "global_step": 137664, "epoch": 3277} {"train_loss": -6.857937812805176, "global_step": 137665, "epoch": 3277} {"train_loss": -6.7558698654174805, "global_step": 137666, "epoch": 3277} {"train_loss": -6.739274978637695, "global_step": 137667, "epoch": 3277} {"train_loss": -6.815007209777832, "global_step": 137668, "epoch": 3277} {"train_loss": -6.795455455780029, "global_step": 137669, "epoch": 3277} {"train_loss": -6.59885311126709, "global_step": 137670, "epoch": 3277} {"train_loss": -6.742246627807617, "global_step": 137671, "epoch": 3277} {"train_loss": -6.7129807472229, "global_step": 137672, "epoch": 3277} {"train_loss": -6.571266174316406, "global_step": 137673, "epoch": 3277} {"train_loss": -6.631404876708984, "global_step": 137674, "epoch": 3277} {"train_loss": -6.737250066938854, "global_step": 137675, "epoch": 3277, "val_loss": 68295.671875} {"train_loss": -6.7899580001831055, "global_step": 137676, "epoch": 3278} {"train_loss": -6.547233581542969, "global_step": 137677, "epoch": 3278} {"train_loss": -6.7065019607543945, "global_step": 137678, "epoch": 3278} {"train_loss": -6.627584457397461, "global_step": 137679, "epoch": 3278} {"train_loss": -6.672579288482666, "global_step": 137680, "epoch": 3278} {"train_loss": -6.651686668395996, "global_step": 137681, "epoch": 3278} {"train_loss": -6.610625267028809, "global_step": 137682, "epoch": 3278} {"train_loss": -6.697751522064209, "global_step": 137683, "epoch": 3278} {"train_loss": -6.6305694580078125, "global_step": 137684, "epoch": 3278} {"train_loss": -6.779808521270752, "global_step": 137685, "epoch": 3278} {"train_loss": -6.678826332092285, "global_step": 137686, "epoch": 3278} {"train_loss": -6.646539688110352, "global_step": 137687, "epoch": 3278} {"train_loss": -6.660530090332031, "global_step": 137688, "epoch": 3278} {"train_loss": -6.734187126159668, "global_step": 137689, "epoch": 3278} {"train_loss": -6.628287315368652, "global_step": 137690, "epoch": 3278} {"train_loss": -6.726810932159424, "global_step": 137691, "epoch": 3278} {"train_loss": -6.639872074127197, "global_step": 137692, "epoch": 3278} {"train_loss": -6.604160308837891, "global_step": 137693, "epoch": 3278} {"train_loss": -6.7423295974731445, "global_step": 137694, "epoch": 3278} {"train_loss": -6.693198204040527, "global_step": 137695, "epoch": 3278} {"train_loss": -6.6902875900268555, "global_step": 137696, "epoch": 3278} {"train_loss": -6.599950313568115, "global_step": 137697, "epoch": 3278} {"train_loss": -6.749298572540283, "global_step": 137698, "epoch": 3278} {"train_loss": -6.646334171295166, "global_step": 137699, "epoch": 3278} {"train_loss": -6.557447910308838, "global_step": 137700, "epoch": 3278} {"train_loss": -6.572056770324707, "global_step": 137701, "epoch": 3278} {"train_loss": -6.611482620239258, "global_step": 137702, "epoch": 3278} {"train_loss": -6.490708351135254, "global_step": 137703, "epoch": 3278} {"train_loss": -6.613228797912598, "global_step": 137704, "epoch": 3278} {"train_loss": -6.649744987487793, "global_step": 137705, "epoch": 3278} {"train_loss": -6.700412750244141, "global_step": 137706, "epoch": 3278} {"train_loss": -6.763688564300537, "global_step": 137707, "epoch": 3278} {"train_loss": -6.5784125328063965, "global_step": 137708, "epoch": 3278} {"train_loss": -6.683259010314941, "global_step": 137709, "epoch": 3278} {"train_loss": -6.639652252197266, "global_step": 137710, "epoch": 3278} {"train_loss": -6.670550346374512, "global_step": 137711, "epoch": 3278} {"train_loss": -6.746948719024658, "global_step": 137712, "epoch": 3278} {"train_loss": -6.576807975769043, "global_step": 137713, "epoch": 3278} {"train_loss": -6.49955940246582, "global_step": 137714, "epoch": 3278} {"train_loss": -6.593075752258301, "global_step": 137715, "epoch": 3278} {"train_loss": -6.727760314941406, "global_step": 137716, "epoch": 3278} {"train_loss": -6.652006217411587, "global_step": 137717, "epoch": 3278, "val_loss": 68312.8828125} {"train_loss": -6.585104942321777, "global_step": 137718, "epoch": 3279} {"train_loss": -6.643457889556885, "global_step": 137719, "epoch": 3279} {"train_loss": -6.779487609863281, "global_step": 137720, "epoch": 3279} {"train_loss": -6.748874187469482, "global_step": 137721, "epoch": 3279} {"train_loss": -6.572254657745361, "global_step": 137722, "epoch": 3279} {"train_loss": -6.744412422180176, "global_step": 137723, "epoch": 3279} {"train_loss": -6.571103572845459, "global_step": 137724, "epoch": 3279} {"train_loss": -6.643655776977539, "global_step": 137725, "epoch": 3279} {"train_loss": -6.684017658233643, "global_step": 137726, "epoch": 3279} {"train_loss": -6.643725872039795, "global_step": 137727, "epoch": 3279} {"train_loss": -6.7024431228637695, "global_step": 137728, "epoch": 3279} {"train_loss": -6.576374530792236, "global_step": 137729, "epoch": 3279} {"train_loss": -6.635751247406006, "global_step": 137730, "epoch": 3279} {"train_loss": -6.700790882110596, "global_step": 137731, "epoch": 3279} {"train_loss": -6.727329730987549, "global_step": 137732, "epoch": 3279} {"train_loss": -6.773900985717773, "global_step": 137733, "epoch": 3279} {"train_loss": -6.634923934936523, "global_step": 137734, "epoch": 3279} {"train_loss": -6.556641578674316, "global_step": 137735, "epoch": 3279} {"train_loss": -6.582620620727539, "global_step": 137736, "epoch": 3279} {"train_loss": -6.5704851150512695, "global_step": 137737, "epoch": 3279} {"train_loss": -6.807577610015869, "global_step": 137738, "epoch": 3279} {"train_loss": -6.548348426818848, "global_step": 137739, "epoch": 3279} {"train_loss": -6.664541721343994, "global_step": 137740, "epoch": 3279} {"train_loss": -6.549063682556152, "global_step": 137741, "epoch": 3279} {"train_loss": -6.730849266052246, "global_step": 137742, "epoch": 3279} {"train_loss": -6.624815464019775, "global_step": 137743, "epoch": 3279} {"train_loss": -6.6832170486450195, "global_step": 137744, "epoch": 3279} {"train_loss": -6.68514347076416, "global_step": 137745, "epoch": 3279} {"train_loss": -6.648181438446045, "global_step": 137746, "epoch": 3279} {"train_loss": -6.72158145904541, "global_step": 137747, "epoch": 3279} {"train_loss": -6.666767597198486, "global_step": 137748, "epoch": 3279} {"train_loss": -6.75294303894043, "global_step": 137749, "epoch": 3279} {"train_loss": -6.658947944641113, "global_step": 137750, "epoch": 3279} {"train_loss": -6.710219860076904, "global_step": 137751, "epoch": 3279} {"train_loss": -6.657723426818848, "global_step": 137752, "epoch": 3279} {"train_loss": -6.529107093811035, "global_step": 137753, "epoch": 3279} {"train_loss": -6.557011604309082, "global_step": 137754, "epoch": 3279} {"train_loss": -6.6469011306762695, "global_step": 137755, "epoch": 3279} {"train_loss": -6.579056262969971, "global_step": 137756, "epoch": 3279} {"train_loss": -6.497148513793945, "global_step": 137757, "epoch": 3279} {"train_loss": -6.689952850341797, "global_step": 137758, "epoch": 3279} {"train_loss": -6.651292358125959, "global_step": 137759, "epoch": 3279, "val_loss": 68526.96875} {"train_loss": -6.677756309509277, "global_step": 137760, "epoch": 3280} {"train_loss": -6.762032985687256, "global_step": 137761, "epoch": 3280} {"train_loss": -6.64970064163208, "global_step": 137762, "epoch": 3280} {"train_loss": -6.698390483856201, "global_step": 137763, "epoch": 3280} {"train_loss": -6.689690589904785, "global_step": 137764, "epoch": 3280} {"train_loss": -6.737853050231934, "global_step": 137765, "epoch": 3280} {"train_loss": -6.591443061828613, "global_step": 137766, "epoch": 3280} {"train_loss": -6.725930690765381, "global_step": 137767, "epoch": 3280} {"train_loss": -6.659633159637451, "global_step": 137768, "epoch": 3280} {"train_loss": -6.722082138061523, "global_step": 137769, "epoch": 3280} {"train_loss": -6.594344139099121, "global_step": 137770, "epoch": 3280} {"train_loss": -6.651166915893555, "global_step": 137771, "epoch": 3280} {"train_loss": -6.7121477127075195, "global_step": 137772, "epoch": 3280} {"train_loss": -6.701804161071777, "global_step": 137773, "epoch": 3280} {"train_loss": -6.632112979888916, "global_step": 137774, "epoch": 3280} {"train_loss": -6.710139274597168, "global_step": 137775, "epoch": 3280} {"train_loss": -6.713781356811523, "global_step": 137776, "epoch": 3280} {"train_loss": -6.797759056091309, "global_step": 137777, "epoch": 3280} {"train_loss": -6.56687068939209, "global_step": 137778, "epoch": 3280} {"train_loss": -6.577104568481445, "global_step": 137779, "epoch": 3280} {"train_loss": -6.757302284240723, "global_step": 137780, "epoch": 3280} {"train_loss": -6.771768569946289, "global_step": 137781, "epoch": 3280} {"train_loss": -6.713593482971191, "global_step": 137782, "epoch": 3280} {"train_loss": -6.696950912475586, "global_step": 137783, "epoch": 3280} {"train_loss": -6.79714298248291, "global_step": 137784, "epoch": 3280} {"train_loss": -6.6655731201171875, "global_step": 137785, "epoch": 3280} {"train_loss": -6.655577659606934, "global_step": 137786, "epoch": 3280} {"train_loss": -6.802467346191406, "global_step": 137787, "epoch": 3280} {"train_loss": -6.663207054138184, "global_step": 137788, "epoch": 3280} {"train_loss": -6.72731876373291, "global_step": 137789, "epoch": 3280} {"train_loss": -6.769989490509033, "global_step": 137790, "epoch": 3280} {"train_loss": -6.59027099609375, "global_step": 137791, "epoch": 3280} {"train_loss": -6.540183067321777, "global_step": 137792, "epoch": 3280} {"train_loss": -6.748287677764893, "global_step": 137793, "epoch": 3280} {"train_loss": -6.6677117347717285, "global_step": 137794, "epoch": 3280} {"train_loss": -6.766112804412842, "global_step": 137795, "epoch": 3280} {"train_loss": -6.764863967895508, "global_step": 137796, "epoch": 3280} {"train_loss": -6.582001209259033, "global_step": 137797, "epoch": 3280} {"train_loss": -6.691332817077637, "global_step": 137798, "epoch": 3280} {"train_loss": -6.5910210609436035, "global_step": 137799, "epoch": 3280} {"train_loss": -6.576632499694824, "global_step": 137800, "epoch": 3280} {"train_loss": -6.683703740437825, "global_step": 137801, "epoch": 3280, "val_loss": 68528.578125} {"train_loss": -6.470693111419678, "global_step": 137802, "epoch": 3281} {"train_loss": -6.73995304107666, "global_step": 137803, "epoch": 3281} {"train_loss": -6.630577087402344, "global_step": 137804, "epoch": 3281} {"train_loss": -6.463397026062012, "global_step": 137805, "epoch": 3281} {"train_loss": -6.701338768005371, "global_step": 137806, "epoch": 3281} {"train_loss": -6.5299835205078125, "global_step": 137807, "epoch": 3281} {"train_loss": -6.598755836486816, "global_step": 137808, "epoch": 3281} {"train_loss": -6.654907703399658, "global_step": 137809, "epoch": 3281} {"train_loss": -6.464812278747559, "global_step": 137810, "epoch": 3281} {"train_loss": -6.630477428436279, "global_step": 137811, "epoch": 3281} {"train_loss": -6.564986228942871, "global_step": 137812, "epoch": 3281} {"train_loss": -6.61013126373291, "global_step": 137813, "epoch": 3281} {"train_loss": -6.694652557373047, "global_step": 137814, "epoch": 3281} {"train_loss": -6.591958999633789, "global_step": 137815, "epoch": 3281} {"train_loss": -6.674925804138184, "global_step": 137816, "epoch": 3281} {"train_loss": -6.710304260253906, "global_step": 137817, "epoch": 3281} {"train_loss": -6.687998294830322, "global_step": 137818, "epoch": 3281} {"train_loss": -6.560667991638184, "global_step": 137819, "epoch": 3281} {"train_loss": -6.684001922607422, "global_step": 137820, "epoch": 3281} {"train_loss": -6.697147369384766, "global_step": 137821, "epoch": 3281} {"train_loss": -6.625629901885986, "global_step": 137822, "epoch": 3281} {"train_loss": -6.676037788391113, "global_step": 137823, "epoch": 3281} {"train_loss": -6.6591033935546875, "global_step": 137824, "epoch": 3281} {"train_loss": -6.634100914001465, "global_step": 137825, "epoch": 3281} {"train_loss": -6.588409423828125, "global_step": 137826, "epoch": 3281} {"train_loss": -6.692558288574219, "global_step": 137827, "epoch": 3281} {"train_loss": -6.658946990966797, "global_step": 137828, "epoch": 3281} {"train_loss": -6.661158084869385, "global_step": 137829, "epoch": 3281} {"train_loss": -6.69651460647583, "global_step": 137830, "epoch": 3281} {"train_loss": -6.665543556213379, "global_step": 137831, "epoch": 3281} {"train_loss": -6.679351329803467, "global_step": 137832, "epoch": 3281} {"train_loss": -6.665175437927246, "global_step": 137833, "epoch": 3281} {"train_loss": -6.662338733673096, "global_step": 137834, "epoch": 3281} {"train_loss": -6.630172252655029, "global_step": 137835, "epoch": 3281} {"train_loss": -6.691108703613281, "global_step": 137836, "epoch": 3281} {"train_loss": -6.666778564453125, "global_step": 137837, "epoch": 3281} {"train_loss": -6.573083877563477, "global_step": 137838, "epoch": 3281} {"train_loss": -6.733084678649902, "global_step": 137839, "epoch": 3281} {"train_loss": -6.674116611480713, "global_step": 137840, "epoch": 3281} {"train_loss": -6.6235504150390625, "global_step": 137841, "epoch": 3281} {"train_loss": -6.758028030395508, "global_step": 137842, "epoch": 3281} {"train_loss": -6.640814088639759, "global_step": 137843, "epoch": 3281, "val_loss": 68380.7734375} {"train_loss": -6.766445159912109, "global_step": 137844, "epoch": 3282} {"train_loss": -6.646985054016113, "global_step": 137845, "epoch": 3282} {"train_loss": -6.821078777313232, "global_step": 137846, "epoch": 3282} {"train_loss": -6.726944923400879, "global_step": 137847, "epoch": 3282} {"train_loss": -6.717116832733154, "global_step": 137848, "epoch": 3282} {"train_loss": -6.652922630310059, "global_step": 137849, "epoch": 3282} {"train_loss": -6.776538848876953, "global_step": 137850, "epoch": 3282} {"train_loss": -6.7042107582092285, "global_step": 137851, "epoch": 3282} {"train_loss": -6.745026588439941, "global_step": 137852, "epoch": 3282} {"train_loss": -6.704493045806885, "global_step": 137853, "epoch": 3282} {"train_loss": -6.630664825439453, "global_step": 137854, "epoch": 3282} {"train_loss": -6.785984039306641, "global_step": 137855, "epoch": 3282} {"train_loss": -6.679423809051514, "global_step": 137856, "epoch": 3282} {"train_loss": -6.7015838623046875, "global_step": 137857, "epoch": 3282} {"train_loss": -6.759842395782471, "global_step": 137858, "epoch": 3282} {"train_loss": -6.654587268829346, "global_step": 137859, "epoch": 3282} {"train_loss": -6.7088117599487305, "global_step": 137860, "epoch": 3282} {"train_loss": -6.649628639221191, "global_step": 137861, "epoch": 3282} {"train_loss": -6.674238204956055, "global_step": 137862, "epoch": 3282} {"train_loss": -6.817224025726318, "global_step": 137863, "epoch": 3282} {"train_loss": -6.7317585945129395, "global_step": 137864, "epoch": 3282} {"train_loss": -6.714756965637207, "global_step": 137865, "epoch": 3282} {"train_loss": -6.671761512756348, "global_step": 137866, "epoch": 3282} {"train_loss": -6.813750267028809, "global_step": 137867, "epoch": 3282} {"train_loss": -6.804831027984619, "global_step": 137868, "epoch": 3282} {"train_loss": -6.69398307800293, "global_step": 137869, "epoch": 3282} {"train_loss": -6.685843467712402, "global_step": 137870, "epoch": 3282} {"train_loss": -6.736852645874023, "global_step": 137871, "epoch": 3282} {"train_loss": -6.796423435211182, "global_step": 137872, "epoch": 3282} {"train_loss": -6.653338432312012, "global_step": 137873, "epoch": 3282} {"train_loss": -6.619821548461914, "global_step": 137874, "epoch": 3282} {"train_loss": -6.686673641204834, "global_step": 137875, "epoch": 3282} {"train_loss": -6.736300468444824, "global_step": 137876, "epoch": 3282} {"train_loss": -6.637347221374512, "global_step": 137877, "epoch": 3282} {"train_loss": -6.688814640045166, "global_step": 137878, "epoch": 3282} {"train_loss": -6.726723670959473, "global_step": 137879, "epoch": 3282} {"train_loss": -6.80582332611084, "global_step": 137880, "epoch": 3282} {"train_loss": -6.680200576782227, "global_step": 137881, "epoch": 3282} {"train_loss": -6.746765613555908, "global_step": 137882, "epoch": 3282} {"train_loss": -6.819820404052734, "global_step": 137883, "epoch": 3282} {"train_loss": -6.6986494064331055, "global_step": 137884, "epoch": 3282} {"train_loss": -6.718821616399856, "global_step": 137885, "epoch": 3282, "val_loss": 68416.9609375} {"train_loss": -6.682104587554932, "global_step": 137886, "epoch": 3283} {"train_loss": -6.661009788513184, "global_step": 137887, "epoch": 3283} {"train_loss": -6.69768762588501, "global_step": 137888, "epoch": 3283} {"train_loss": -6.662432670593262, "global_step": 137889, "epoch": 3283} {"train_loss": -6.7938690185546875, "global_step": 137890, "epoch": 3283} {"train_loss": -6.724364280700684, "global_step": 137891, "epoch": 3283} {"train_loss": -6.628815650939941, "global_step": 137892, "epoch": 3283} {"train_loss": -6.535408973693848, "global_step": 137893, "epoch": 3283} {"train_loss": -6.756100654602051, "global_step": 137894, "epoch": 3283} {"train_loss": -6.713367462158203, "global_step": 137895, "epoch": 3283} {"train_loss": -6.681035995483398, "global_step": 137896, "epoch": 3283} {"train_loss": -6.759374141693115, "global_step": 137897, "epoch": 3283} {"train_loss": -6.608778476715088, "global_step": 137898, "epoch": 3283} {"train_loss": -6.720301151275635, "global_step": 137899, "epoch": 3283} {"train_loss": -6.8025689125061035, "global_step": 137900, "epoch": 3283} {"train_loss": -6.760037422180176, "global_step": 137901, "epoch": 3283} {"train_loss": -6.641176700592041, "global_step": 137902, "epoch": 3283} {"train_loss": -6.5709757804870605, "global_step": 137903, "epoch": 3283} {"train_loss": -6.633856296539307, "global_step": 137904, "epoch": 3283} {"train_loss": -6.720393180847168, "global_step": 137905, "epoch": 3283} {"train_loss": -6.704427719116211, "global_step": 137906, "epoch": 3283} {"train_loss": -6.610751152038574, "global_step": 137907, "epoch": 3283} {"train_loss": -6.658119201660156, "global_step": 137908, "epoch": 3283} {"train_loss": -6.729207992553711, "global_step": 137909, "epoch": 3283} {"train_loss": -6.7002153396606445, "global_step": 137910, "epoch": 3283} {"train_loss": -6.724857330322266, "global_step": 137911, "epoch": 3283} {"train_loss": -6.726127624511719, "global_step": 137912, "epoch": 3283} {"train_loss": -6.770673751831055, "global_step": 137913, "epoch": 3283} {"train_loss": -6.76373291015625, "global_step": 137914, "epoch": 3283} {"train_loss": -6.732662200927734, "global_step": 137915, "epoch": 3283} {"train_loss": -6.796572208404541, "global_step": 137916, "epoch": 3283} {"train_loss": -6.828028678894043, "global_step": 137917, "epoch": 3283} {"train_loss": -6.751720428466797, "global_step": 137918, "epoch": 3283} {"train_loss": -6.609285831451416, "global_step": 137919, "epoch": 3283} {"train_loss": -6.727189064025879, "global_step": 137920, "epoch": 3283} {"train_loss": -6.800521373748779, "global_step": 137921, "epoch": 3283} {"train_loss": -6.7336812019348145, "global_step": 137922, "epoch": 3283} {"train_loss": -6.70394229888916, "global_step": 137923, "epoch": 3283} {"train_loss": -6.775837421417236, "global_step": 137924, "epoch": 3283} {"train_loss": -6.68942403793335, "global_step": 137925, "epoch": 3283} {"train_loss": -6.705615520477295, "global_step": 137926, "epoch": 3283} {"train_loss": -6.708397411164784, "global_step": 137927, "epoch": 3283, "val_loss": 68363.8359375} {"train_loss": -6.772420883178711, "global_step": 137928, "epoch": 3284} {"train_loss": -6.6572771072387695, "global_step": 137929, "epoch": 3284} {"train_loss": -6.69666051864624, "global_step": 137930, "epoch": 3284} {"train_loss": -6.545530319213867, "global_step": 137931, "epoch": 3284} {"train_loss": -6.696660041809082, "global_step": 137932, "epoch": 3284} {"train_loss": -6.717324733734131, "global_step": 137933, "epoch": 3284} {"train_loss": -6.687558174133301, "global_step": 137934, "epoch": 3284} {"train_loss": -6.7184038162231445, "global_step": 137935, "epoch": 3284} {"train_loss": -6.6005353927612305, "global_step": 137936, "epoch": 3284} {"train_loss": -6.722360610961914, "global_step": 137937, "epoch": 3284} {"train_loss": -6.720780372619629, "global_step": 137938, "epoch": 3284} {"train_loss": -6.716852188110352, "global_step": 137939, "epoch": 3284} {"train_loss": -6.805906295776367, "global_step": 137940, "epoch": 3284} {"train_loss": -6.7218780517578125, "global_step": 137941, "epoch": 3284} {"train_loss": -6.676012992858887, "global_step": 137942, "epoch": 3284} {"train_loss": -6.698565483093262, "global_step": 137943, "epoch": 3284} {"train_loss": -6.733991622924805, "global_step": 137944, "epoch": 3284} {"train_loss": -6.68248176574707, "global_step": 137945, "epoch": 3284} {"train_loss": -6.661529541015625, "global_step": 137946, "epoch": 3284} {"train_loss": -6.668747901916504, "global_step": 137947, "epoch": 3284} {"train_loss": -6.712000846862793, "global_step": 137948, "epoch": 3284} {"train_loss": -6.643747329711914, "global_step": 137949, "epoch": 3284} {"train_loss": -6.578108310699463, "global_step": 137950, "epoch": 3284} {"train_loss": -6.687047004699707, "global_step": 137951, "epoch": 3284} {"train_loss": -6.749675273895264, "global_step": 137952, "epoch": 3284} {"train_loss": -6.582773208618164, "global_step": 137953, "epoch": 3284} {"train_loss": -6.57770299911499, "global_step": 137954, "epoch": 3284} {"train_loss": -6.585379123687744, "global_step": 137955, "epoch": 3284} {"train_loss": -6.575307846069336, "global_step": 137956, "epoch": 3284} {"train_loss": -6.737459182739258, "global_step": 137957, "epoch": 3284} {"train_loss": -6.518249034881592, "global_step": 137958, "epoch": 3284} {"train_loss": -6.643689155578613, "global_step": 137959, "epoch": 3284} {"train_loss": -6.705635070800781, "global_step": 137960, "epoch": 3284} {"train_loss": -6.626143455505371, "global_step": 137961, "epoch": 3284} {"train_loss": -6.583097457885742, "global_step": 137962, "epoch": 3284} {"train_loss": -6.531588077545166, "global_step": 137963, "epoch": 3284} {"train_loss": -6.697420120239258, "global_step": 137964, "epoch": 3284} {"train_loss": -6.511760711669922, "global_step": 137965, "epoch": 3284} {"train_loss": -6.61932897567749, "global_step": 137966, "epoch": 3284} {"train_loss": -6.645439147949219, "global_step": 137967, "epoch": 3284} {"train_loss": -6.571743965148926, "global_step": 137968, "epoch": 3284} {"train_loss": -6.655582348505656, "global_step": 137969, "epoch": 3284, "val_loss": 68105.5703125} {"train_loss": -6.559599876403809, "global_step": 137970, "epoch": 3285} {"train_loss": -6.631289005279541, "global_step": 137971, "epoch": 3285} {"train_loss": -6.57663631439209, "global_step": 137972, "epoch": 3285} {"train_loss": -6.621601104736328, "global_step": 137973, "epoch": 3285} {"train_loss": -6.671326160430908, "global_step": 137974, "epoch": 3285} {"train_loss": -6.51377534866333, "global_step": 137975, "epoch": 3285} {"train_loss": -6.5705766677856445, "global_step": 137976, "epoch": 3285} {"train_loss": -6.679272651672363, "global_step": 137977, "epoch": 3285} {"train_loss": -6.739865303039551, "global_step": 137978, "epoch": 3285} {"train_loss": -6.587540626525879, "global_step": 137979, "epoch": 3285} {"train_loss": -6.6205573081970215, "global_step": 137980, "epoch": 3285} {"train_loss": -6.749298572540283, "global_step": 137981, "epoch": 3285} {"train_loss": -6.683619022369385, "global_step": 137982, "epoch": 3285} {"train_loss": -6.644252777099609, "global_step": 137983, "epoch": 3285} {"train_loss": -6.74547004699707, "global_step": 137984, "epoch": 3285} {"train_loss": -6.674216270446777, "global_step": 137985, "epoch": 3285} {"train_loss": -6.671176433563232, "global_step": 137986, "epoch": 3285} {"train_loss": -6.711198806762695, "global_step": 137987, "epoch": 3285} {"train_loss": -6.6815667152404785, "global_step": 137988, "epoch": 3285} {"train_loss": -6.668981552124023, "global_step": 137989, "epoch": 3285} {"train_loss": -6.679887771606445, "global_step": 137990, "epoch": 3285} {"train_loss": -6.726492404937744, "global_step": 137991, "epoch": 3285} {"train_loss": -6.735731601715088, "global_step": 137992, "epoch": 3285} {"train_loss": -6.7397871017456055, "global_step": 137993, "epoch": 3285} {"train_loss": -6.849431037902832, "global_step": 137994, "epoch": 3285} {"train_loss": -6.752152442932129, "global_step": 137995, "epoch": 3285} {"train_loss": -6.74066162109375, "global_step": 137996, "epoch": 3285} {"train_loss": -6.782027721405029, "global_step": 137997, "epoch": 3285} {"train_loss": -6.702727317810059, "global_step": 137998, "epoch": 3285} {"train_loss": -6.842050075531006, "global_step": 137999, "epoch": 3285} {"train_loss": -6.708728313446045, "global_step": 138000, "epoch": 3285} {"train_loss": -6.694225311279297, "global_step": 138001, "epoch": 3285} {"train_loss": -6.802350997924805, "global_step": 138002, "epoch": 3285} {"train_loss": -6.650204181671143, "global_step": 138003, "epoch": 3285} {"train_loss": -6.63151741027832, "global_step": 138004, "epoch": 3285} {"train_loss": -6.693569660186768, "global_step": 138005, "epoch": 3285} {"train_loss": -6.612190246582031, "global_step": 138006, "epoch": 3285} {"train_loss": -6.6807169914245605, "global_step": 138007, "epoch": 3285} {"train_loss": -6.670099258422852, "global_step": 138008, "epoch": 3285} {"train_loss": -6.644688606262207, "global_step": 138009, "epoch": 3285} {"train_loss": -6.629097938537598, "global_step": 138010, "epoch": 3285} {"train_loss": -6.683756623949323, "global_step": 138011, "epoch": 3285, "val_loss": 68358.4296875} {"train_loss": -6.660694599151611, "global_step": 138012, "epoch": 3286} {"train_loss": -6.710757255554199, "global_step": 138013, "epoch": 3286} {"train_loss": -6.579154014587402, "global_step": 138014, "epoch": 3286} {"train_loss": -6.675508499145508, "global_step": 138015, "epoch": 3286} {"train_loss": -6.712686538696289, "global_step": 138016, "epoch": 3286} {"train_loss": -6.65646505355835, "global_step": 138017, "epoch": 3286} {"train_loss": -6.721769332885742, "global_step": 138018, "epoch": 3286} {"train_loss": -6.676065921783447, "global_step": 138019, "epoch": 3286} {"train_loss": -6.700477123260498, "global_step": 138020, "epoch": 3286} {"train_loss": -6.766393184661865, "global_step": 138021, "epoch": 3286} {"train_loss": -6.751075744628906, "global_step": 138022, "epoch": 3286} {"train_loss": -6.659046173095703, "global_step": 138023, "epoch": 3286} {"train_loss": -6.791008949279785, "global_step": 138024, "epoch": 3286} {"train_loss": -6.653470039367676, "global_step": 138025, "epoch": 3286} {"train_loss": -6.713362693786621, "global_step": 138026, "epoch": 3286} {"train_loss": -6.797518730163574, "global_step": 138027, "epoch": 3286} {"train_loss": -6.688997268676758, "global_step": 138028, "epoch": 3286} {"train_loss": -6.7669878005981445, "global_step": 138029, "epoch": 3286} {"train_loss": -6.7777276039123535, "global_step": 138030, "epoch": 3286} {"train_loss": -6.5919084548950195, "global_step": 138031, "epoch": 3286} {"train_loss": -6.585243225097656, "global_step": 138032, "epoch": 3286} {"train_loss": -6.749357223510742, "global_step": 138033, "epoch": 3286} {"train_loss": -6.721128463745117, "global_step": 138034, "epoch": 3286} {"train_loss": -6.770415782928467, "global_step": 138035, "epoch": 3286} {"train_loss": -6.711843013763428, "global_step": 138036, "epoch": 3286} {"train_loss": -6.702083587646484, "global_step": 138037, "epoch": 3286} {"train_loss": -6.7268195152282715, "global_step": 138038, "epoch": 3286} {"train_loss": -6.720608711242676, "global_step": 138039, "epoch": 3286} {"train_loss": -6.733926773071289, "global_step": 138040, "epoch": 3286} {"train_loss": -6.720495700836182, "global_step": 138041, "epoch": 3286} {"train_loss": -6.793779373168945, "global_step": 138042, "epoch": 3286} {"train_loss": -6.70821475982666, "global_step": 138043, "epoch": 3286} {"train_loss": -6.760545253753662, "global_step": 138044, "epoch": 3286} {"train_loss": -6.742869853973389, "global_step": 138045, "epoch": 3286} {"train_loss": -6.741313934326172, "global_step": 138046, "epoch": 3286} {"train_loss": -6.753202438354492, "global_step": 138047, "epoch": 3286} {"train_loss": -6.699249744415283, "global_step": 138048, "epoch": 3286} {"train_loss": -6.742161273956299, "global_step": 138049, "epoch": 3286} {"train_loss": -6.634171009063721, "global_step": 138050, "epoch": 3286} {"train_loss": -6.741276741027832, "global_step": 138051, "epoch": 3286} {"train_loss": -6.655338287353516, "global_step": 138052, "epoch": 3286} {"train_loss": -6.708968684786842, "global_step": 138053, "epoch": 3286, "val_loss": 68165.5546875} {"train_loss": -6.638437271118164, "global_step": 138054, "epoch": 3287} {"train_loss": -6.640615463256836, "global_step": 138055, "epoch": 3287} {"train_loss": -6.691039562225342, "global_step": 138056, "epoch": 3287} {"train_loss": -6.575361728668213, "global_step": 138057, "epoch": 3287} {"train_loss": -6.672574520111084, "global_step": 138058, "epoch": 3287} {"train_loss": -6.779058456420898, "global_step": 138059, "epoch": 3287} {"train_loss": -6.745730400085449, "global_step": 138060, "epoch": 3287} {"train_loss": -6.783304214477539, "global_step": 138061, "epoch": 3287} {"train_loss": -6.802298069000244, "global_step": 138062, "epoch": 3287} {"train_loss": -6.644641399383545, "global_step": 138063, "epoch": 3287} {"train_loss": -6.7977752685546875, "global_step": 138064, "epoch": 3287} {"train_loss": -6.740100860595703, "global_step": 138065, "epoch": 3287} {"train_loss": -6.658373832702637, "global_step": 138066, "epoch": 3287} {"train_loss": -6.763694763183594, "global_step": 138067, "epoch": 3287} {"train_loss": -6.59468936920166, "global_step": 138068, "epoch": 3287} {"train_loss": -6.754465103149414, "global_step": 138069, "epoch": 3287} {"train_loss": -6.717494487762451, "global_step": 138070, "epoch": 3287} {"train_loss": -6.682143211364746, "global_step": 138071, "epoch": 3287} {"train_loss": -6.641810417175293, "global_step": 138072, "epoch": 3287} {"train_loss": -6.624855995178223, "global_step": 138073, "epoch": 3287} {"train_loss": -6.6870927810668945, "global_step": 138074, "epoch": 3287} {"train_loss": -6.606498718261719, "global_step": 138075, "epoch": 3287} {"train_loss": -6.713870048522949, "global_step": 138076, "epoch": 3287} {"train_loss": -6.503173828125, "global_step": 138077, "epoch": 3287} {"train_loss": -6.7175211906433105, "global_step": 138078, "epoch": 3287} {"train_loss": -6.58360481262207, "global_step": 138079, "epoch": 3287} {"train_loss": -6.670706272125244, "global_step": 138080, "epoch": 3287} {"train_loss": -6.676473617553711, "global_step": 138081, "epoch": 3287} {"train_loss": -6.6911091804504395, "global_step": 138082, "epoch": 3287} {"train_loss": -6.679095268249512, "global_step": 138083, "epoch": 3287} {"train_loss": -6.555727958679199, "global_step": 138084, "epoch": 3287} {"train_loss": -6.694540023803711, "global_step": 138085, "epoch": 3287} {"train_loss": -6.666254997253418, "global_step": 138086, "epoch": 3287} {"train_loss": -6.579520225524902, "global_step": 138087, "epoch": 3287} {"train_loss": -6.691049575805664, "global_step": 138088, "epoch": 3287} {"train_loss": -6.6761064529418945, "global_step": 138089, "epoch": 3287} {"train_loss": -6.658108711242676, "global_step": 138090, "epoch": 3287} {"train_loss": -6.685959815979004, "global_step": 138091, "epoch": 3287} {"train_loss": -6.656264781951904, "global_step": 138092, "epoch": 3287} {"train_loss": -6.727179050445557, "global_step": 138093, "epoch": 3287} {"train_loss": -6.663555145263672, "global_step": 138094, "epoch": 3287} {"train_loss": -6.676033587682815, "global_step": 138095, "epoch": 3287, "val_loss": 68426.46875} {"train_loss": -6.697405815124512, "global_step": 138096, "epoch": 3288} {"train_loss": -6.616302490234375, "global_step": 138097, "epoch": 3288} {"train_loss": -6.748455047607422, "global_step": 138098, "epoch": 3288} {"train_loss": -6.801374435424805, "global_step": 138099, "epoch": 3288} {"train_loss": -6.824002265930176, "global_step": 138100, "epoch": 3288} {"train_loss": -6.730884075164795, "global_step": 138101, "epoch": 3288} {"train_loss": -6.723333835601807, "global_step": 138102, "epoch": 3288} {"train_loss": -6.742768287658691, "global_step": 138103, "epoch": 3288} {"train_loss": -6.767282962799072, "global_step": 138104, "epoch": 3288} {"train_loss": -6.7692718505859375, "global_step": 138105, "epoch": 3288} {"train_loss": -6.763546943664551, "global_step": 138106, "epoch": 3288} {"train_loss": -6.751383304595947, "global_step": 138107, "epoch": 3288} {"train_loss": -6.838976860046387, "global_step": 138108, "epoch": 3288} {"train_loss": -6.694092750549316, "global_step": 138109, "epoch": 3288} {"train_loss": -6.783003330230713, "global_step": 138110, "epoch": 3288} {"train_loss": -6.719991683959961, "global_step": 138111, "epoch": 3288} {"train_loss": -6.826067924499512, "global_step": 138112, "epoch": 3288} {"train_loss": -6.577487945556641, "global_step": 138113, "epoch": 3288} {"train_loss": -6.698268890380859, "global_step": 138114, "epoch": 3288} {"train_loss": -6.6664910316467285, "global_step": 138115, "epoch": 3288} {"train_loss": -6.637333393096924, "global_step": 138116, "epoch": 3288} {"train_loss": -6.70950984954834, "global_step": 138117, "epoch": 3288} {"train_loss": -6.689243316650391, "global_step": 138118, "epoch": 3288} {"train_loss": -6.718064308166504, "global_step": 138119, "epoch": 3288} {"train_loss": -6.60417366027832, "global_step": 138120, "epoch": 3288} {"train_loss": -6.648115158081055, "global_step": 138121, "epoch": 3288} {"train_loss": -6.663917541503906, "global_step": 138122, "epoch": 3288} {"train_loss": -6.735798358917236, "global_step": 138123, "epoch": 3288} {"train_loss": -6.634832859039307, "global_step": 138124, "epoch": 3288} {"train_loss": -6.58234977722168, "global_step": 138125, "epoch": 3288} {"train_loss": -6.780484676361084, "global_step": 138126, "epoch": 3288} {"train_loss": -6.613055229187012, "global_step": 138127, "epoch": 3288} {"train_loss": -6.706022262573242, "global_step": 138128, "epoch": 3288} {"train_loss": -6.6895341873168945, "global_step": 138129, "epoch": 3288} {"train_loss": -6.651823043823242, "global_step": 138130, "epoch": 3288} {"train_loss": -6.733578681945801, "global_step": 138131, "epoch": 3288} {"train_loss": -6.775484085083008, "global_step": 138132, "epoch": 3288} {"train_loss": -6.68653678894043, "global_step": 138133, "epoch": 3288} {"train_loss": -6.6590118408203125, "global_step": 138134, "epoch": 3288} {"train_loss": -6.730795860290527, "global_step": 138135, "epoch": 3288} {"train_loss": -6.549299240112305, "global_step": 138136, "epoch": 3288} {"train_loss": -6.705541031701224, "global_step": 138137, "epoch": 3288, "val_loss": 68476.6953125} {"train_loss": -6.685199737548828, "global_step": 138138, "epoch": 3289} {"train_loss": -6.794135093688965, "global_step": 138139, "epoch": 3289} {"train_loss": -6.721508026123047, "global_step": 138140, "epoch": 3289} {"train_loss": -6.6996965408325195, "global_step": 138141, "epoch": 3289} {"train_loss": -6.671848297119141, "global_step": 138142, "epoch": 3289} {"train_loss": -6.655984878540039, "global_step": 138143, "epoch": 3289} {"train_loss": -6.722127914428711, "global_step": 138144, "epoch": 3289} {"train_loss": -6.791469097137451, "global_step": 138145, "epoch": 3289} {"train_loss": -6.720013618469238, "global_step": 138146, "epoch": 3289} {"train_loss": -6.692391395568848, "global_step": 138147, "epoch": 3289} {"train_loss": -6.808868408203125, "global_step": 138148, "epoch": 3289} {"train_loss": -6.853987693786621, "global_step": 138149, "epoch": 3289} {"train_loss": -6.753009796142578, "global_step": 138150, "epoch": 3289} {"train_loss": -6.749419212341309, "global_step": 138151, "epoch": 3289} {"train_loss": -6.725640296936035, "global_step": 138152, "epoch": 3289} {"train_loss": -6.706762313842773, "global_step": 138153, "epoch": 3289} {"train_loss": -6.757732391357422, "global_step": 138154, "epoch": 3289} {"train_loss": -6.796123027801514, "global_step": 138155, "epoch": 3289} {"train_loss": -6.776368141174316, "global_step": 138156, "epoch": 3289} {"train_loss": -6.754949569702148, "global_step": 138157, "epoch": 3289} {"train_loss": -6.8002519607543945, "global_step": 138158, "epoch": 3289} {"train_loss": -6.742765426635742, "global_step": 138159, "epoch": 3289} {"train_loss": -6.681235313415527, "global_step": 138160, "epoch": 3289} {"train_loss": -6.699782371520996, "global_step": 138161, "epoch": 3289} {"train_loss": -6.683147430419922, "global_step": 138162, "epoch": 3289} {"train_loss": -6.6552839279174805, "global_step": 138163, "epoch": 3289} {"train_loss": -6.826386451721191, "global_step": 138164, "epoch": 3289} {"train_loss": -6.71796989440918, "global_step": 138165, "epoch": 3289} {"train_loss": -6.610718727111816, "global_step": 138166, "epoch": 3289} {"train_loss": -6.688850402832031, "global_step": 138167, "epoch": 3289} {"train_loss": -6.699644088745117, "global_step": 138168, "epoch": 3289} {"train_loss": -6.76391077041626, "global_step": 138169, "epoch": 3289} {"train_loss": -6.691514015197754, "global_step": 138170, "epoch": 3289} {"train_loss": -6.660970687866211, "global_step": 138171, "epoch": 3289} {"train_loss": -6.660451889038086, "global_step": 138172, "epoch": 3289} {"train_loss": -6.649623870849609, "global_step": 138173, "epoch": 3289} {"train_loss": -6.711181640625, "global_step": 138174, "epoch": 3289} {"train_loss": -6.771737575531006, "global_step": 138175, "epoch": 3289} {"train_loss": -6.712985038757324, "global_step": 138176, "epoch": 3289} {"train_loss": -6.6166887283325195, "global_step": 138177, "epoch": 3289} {"train_loss": -6.741788387298584, "global_step": 138178, "epoch": 3289} {"train_loss": -6.721246957778931, "global_step": 138179, "epoch": 3289, "val_loss": 68232.5546875} {"train_loss": -6.777180194854736, "global_step": 138180, "epoch": 3290} {"train_loss": -6.714077949523926, "global_step": 138181, "epoch": 3290} {"train_loss": -6.736702919006348, "global_step": 138182, "epoch": 3290} {"train_loss": -6.663787841796875, "global_step": 138183, "epoch": 3290} {"train_loss": -6.753691673278809, "global_step": 138184, "epoch": 3290} {"train_loss": -6.774420261383057, "global_step": 138185, "epoch": 3290} {"train_loss": -6.6969146728515625, "global_step": 138186, "epoch": 3290} {"train_loss": -6.725511074066162, "global_step": 138187, "epoch": 3290} {"train_loss": -6.684183120727539, "global_step": 138188, "epoch": 3290} {"train_loss": -6.670297622680664, "global_step": 138189, "epoch": 3290} {"train_loss": -6.694754600524902, "global_step": 138190, "epoch": 3290} {"train_loss": -6.714119911193848, "global_step": 138191, "epoch": 3290} {"train_loss": -6.783334732055664, "global_step": 138192, "epoch": 3290} {"train_loss": -6.703086853027344, "global_step": 138193, "epoch": 3290} {"train_loss": -6.67658805847168, "global_step": 138194, "epoch": 3290} {"train_loss": -6.779078483581543, "global_step": 138195, "epoch": 3290} {"train_loss": -6.704409599304199, "global_step": 138196, "epoch": 3290} {"train_loss": -6.61167049407959, "global_step": 138197, "epoch": 3290} {"train_loss": -6.728055953979492, "global_step": 138198, "epoch": 3290} {"train_loss": -6.659590721130371, "global_step": 138199, "epoch": 3290} {"train_loss": -6.779886722564697, "global_step": 138200, "epoch": 3290} {"train_loss": -6.719325065612793, "global_step": 138201, "epoch": 3290} {"train_loss": -6.606754302978516, "global_step": 138202, "epoch": 3290} {"train_loss": -6.694543361663818, "global_step": 138203, "epoch": 3290} {"train_loss": -6.787909507751465, "global_step": 138204, "epoch": 3290} {"train_loss": -6.77764892578125, "global_step": 138205, "epoch": 3290} {"train_loss": -6.682253837585449, "global_step": 138206, "epoch": 3290} {"train_loss": -6.58524227142334, "global_step": 138207, "epoch": 3290} {"train_loss": -6.733782768249512, "global_step": 138208, "epoch": 3290} {"train_loss": -6.52572774887085, "global_step": 138209, "epoch": 3290} {"train_loss": -6.699371337890625, "global_step": 138210, "epoch": 3290} {"train_loss": -6.504457950592041, "global_step": 138211, "epoch": 3290} {"train_loss": -6.480831623077393, "global_step": 138212, "epoch": 3290} {"train_loss": -6.762580871582031, "global_step": 138213, "epoch": 3290} {"train_loss": -6.625485420227051, "global_step": 138214, "epoch": 3290} {"train_loss": -6.593502998352051, "global_step": 138215, "epoch": 3290} {"train_loss": -6.585209846496582, "global_step": 138216, "epoch": 3290} {"train_loss": -6.625347137451172, "global_step": 138217, "epoch": 3290} {"train_loss": -6.5502448081970215, "global_step": 138218, "epoch": 3290} {"train_loss": -6.616422176361084, "global_step": 138219, "epoch": 3290} {"train_loss": -6.676110744476318, "global_step": 138220, "epoch": 3290} {"train_loss": -6.678072089240665, "global_step": 138221, "epoch": 3290, "val_loss": 68424.0625} {"train_loss": -6.760092735290527, "global_step": 138222, "epoch": 3291} {"train_loss": -6.611775875091553, "global_step": 138223, "epoch": 3291} {"train_loss": -6.632269382476807, "global_step": 138224, "epoch": 3291} {"train_loss": -6.691287994384766, "global_step": 138225, "epoch": 3291} {"train_loss": -6.516445159912109, "global_step": 138226, "epoch": 3291} {"train_loss": -6.610976219177246, "global_step": 138227, "epoch": 3291} {"train_loss": -6.621311187744141, "global_step": 138228, "epoch": 3291} {"train_loss": -6.66497802734375, "global_step": 138229, "epoch": 3291} {"train_loss": -6.725954055786133, "global_step": 138230, "epoch": 3291} {"train_loss": -6.615265846252441, "global_step": 138231, "epoch": 3291} {"train_loss": -6.6387224197387695, "global_step": 138232, "epoch": 3291} {"train_loss": -6.641869068145752, "global_step": 138233, "epoch": 3291} {"train_loss": -6.660036563873291, "global_step": 138234, "epoch": 3291} {"train_loss": -6.768007278442383, "global_step": 138235, "epoch": 3291} {"train_loss": -6.667977809906006, "global_step": 138236, "epoch": 3291} {"train_loss": -6.828728675842285, "global_step": 138237, "epoch": 3291} {"train_loss": -6.786717891693115, "global_step": 138238, "epoch": 3291} {"train_loss": -6.772210121154785, "global_step": 138239, "epoch": 3291} {"train_loss": -6.68357515335083, "global_step": 138240, "epoch": 3291} {"train_loss": -6.678521633148193, "global_step": 138241, "epoch": 3291} {"train_loss": -6.667492866516113, "global_step": 138242, "epoch": 3291} {"train_loss": -6.725111961364746, "global_step": 138243, "epoch": 3291} {"train_loss": -6.594805717468262, "global_step": 138244, "epoch": 3291} {"train_loss": -6.570497512817383, "global_step": 138245, "epoch": 3291} {"train_loss": -6.642650604248047, "global_step": 138246, "epoch": 3291} {"train_loss": -6.60621452331543, "global_step": 138247, "epoch": 3291} {"train_loss": -6.654322624206543, "global_step": 138248, "epoch": 3291} {"train_loss": -6.653312683105469, "global_step": 138249, "epoch": 3291} {"train_loss": -6.804939270019531, "global_step": 138250, "epoch": 3291} {"train_loss": -6.7243523597717285, "global_step": 138251, "epoch": 3291} {"train_loss": -6.706892967224121, "global_step": 138252, "epoch": 3291} {"train_loss": -6.647284030914307, "global_step": 138253, "epoch": 3291} {"train_loss": -6.730320930480957, "global_step": 138254, "epoch": 3291} {"train_loss": -6.647449493408203, "global_step": 138255, "epoch": 3291} {"train_loss": -6.78651762008667, "global_step": 138256, "epoch": 3291} {"train_loss": -6.702374458312988, "global_step": 138257, "epoch": 3291} {"train_loss": -6.634021282196045, "global_step": 138258, "epoch": 3291} {"train_loss": -6.702969551086426, "global_step": 138259, "epoch": 3291} {"train_loss": -6.6650004386901855, "global_step": 138260, "epoch": 3291} {"train_loss": -6.739545822143555, "global_step": 138261, "epoch": 3291} {"train_loss": -6.760936737060547, "global_step": 138262, "epoch": 3291} {"train_loss": -6.682425680614653, "global_step": 138263, "epoch": 3291, "val_loss": 68067.3203125} {"train_loss": -6.602452278137207, "global_step": 138264, "epoch": 3292} {"train_loss": -6.6538310050964355, "global_step": 138265, "epoch": 3292} {"train_loss": -6.7469282150268555, "global_step": 138266, "epoch": 3292} {"train_loss": -6.7988691329956055, "global_step": 138267, "epoch": 3292} {"train_loss": -6.729200839996338, "global_step": 138268, "epoch": 3292} {"train_loss": -6.61622428894043, "global_step": 138269, "epoch": 3292} {"train_loss": -6.788259029388428, "global_step": 138270, "epoch": 3292} {"train_loss": -6.6583428382873535, "global_step": 138271, "epoch": 3292} {"train_loss": -6.719884395599365, "global_step": 138272, "epoch": 3292} {"train_loss": -6.777871608734131, "global_step": 138273, "epoch": 3292} {"train_loss": -6.697306156158447, "global_step": 138274, "epoch": 3292} {"train_loss": -6.810695648193359, "global_step": 138275, "epoch": 3292} {"train_loss": -6.6926798820495605, "global_step": 138276, "epoch": 3292} {"train_loss": -6.645479202270508, "global_step": 138277, "epoch": 3292} {"train_loss": -6.6797566413879395, "global_step": 138278, "epoch": 3292} {"train_loss": -6.717751502990723, "global_step": 138279, "epoch": 3292} {"train_loss": -6.685790061950684, "global_step": 138280, "epoch": 3292} {"train_loss": -6.738837718963623, "global_step": 138281, "epoch": 3292} {"train_loss": -6.633642196655273, "global_step": 138282, "epoch": 3292} {"train_loss": -6.535776138305664, "global_step": 138283, "epoch": 3292} {"train_loss": -6.638894081115723, "global_step": 138284, "epoch": 3292} {"train_loss": -6.494032382965088, "global_step": 138285, "epoch": 3292} {"train_loss": -6.520535469055176, "global_step": 138286, "epoch": 3292} {"train_loss": -6.604334354400635, "global_step": 138287, "epoch": 3292} {"train_loss": -6.500799179077148, "global_step": 138288, "epoch": 3292} {"train_loss": -6.5410966873168945, "global_step": 138289, "epoch": 3292} {"train_loss": -6.411858558654785, "global_step": 138290, "epoch": 3292} {"train_loss": -6.572279453277588, "global_step": 138291, "epoch": 3292} {"train_loss": -6.521826267242432, "global_step": 138292, "epoch": 3292} {"train_loss": -6.560871124267578, "global_step": 138293, "epoch": 3292} {"train_loss": -6.519609451293945, "global_step": 138294, "epoch": 3292} {"train_loss": -6.703824043273926, "global_step": 138295, "epoch": 3292} {"train_loss": -6.578083038330078, "global_step": 138296, "epoch": 3292} {"train_loss": -6.654088020324707, "global_step": 138297, "epoch": 3292} {"train_loss": -6.604268550872803, "global_step": 138298, "epoch": 3292} {"train_loss": -6.715182304382324, "global_step": 138299, "epoch": 3292} {"train_loss": -6.651599884033203, "global_step": 138300, "epoch": 3292} {"train_loss": -6.704744338989258, "global_step": 138301, "epoch": 3292} {"train_loss": -6.720640659332275, "global_step": 138302, "epoch": 3292} {"train_loss": -6.639021873474121, "global_step": 138303, "epoch": 3292} {"train_loss": -6.618192672729492, "global_step": 138304, "epoch": 3292} {"train_loss": -6.644302004859561, "global_step": 138305, "epoch": 3292, "val_loss": 68230.109375} {"train_loss": -6.7333502769470215, "global_step": 138306, "epoch": 3293} {"train_loss": -6.738198280334473, "global_step": 138307, "epoch": 3293} {"train_loss": -6.663295745849609, "global_step": 138308, "epoch": 3293} {"train_loss": -6.732515811920166, "global_step": 138309, "epoch": 3293} {"train_loss": -6.74582576751709, "global_step": 138310, "epoch": 3293} {"train_loss": -6.718440055847168, "global_step": 138311, "epoch": 3293} {"train_loss": -6.731531143188477, "global_step": 138312, "epoch": 3293} {"train_loss": -6.681138038635254, "global_step": 138313, "epoch": 3293} {"train_loss": -6.663967132568359, "global_step": 138314, "epoch": 3293} {"train_loss": -6.729014873504639, "global_step": 138315, "epoch": 3293} {"train_loss": -6.797939300537109, "global_step": 138316, "epoch": 3293} {"train_loss": -6.704067707061768, "global_step": 138317, "epoch": 3293} {"train_loss": -6.772756576538086, "global_step": 138318, "epoch": 3293} {"train_loss": -6.764166831970215, "global_step": 138319, "epoch": 3293} {"train_loss": -6.687082290649414, "global_step": 138320, "epoch": 3293} {"train_loss": -6.764658451080322, "global_step": 138321, "epoch": 3293} {"train_loss": -6.73734188079834, "global_step": 138322, "epoch": 3293} {"train_loss": -6.760506629943848, "global_step": 138323, "epoch": 3293} {"train_loss": -6.788644313812256, "global_step": 138324, "epoch": 3293} {"train_loss": -6.6804046630859375, "global_step": 138325, "epoch": 3293} {"train_loss": -6.692846298217773, "global_step": 138326, "epoch": 3293} {"train_loss": -6.872334957122803, "global_step": 138327, "epoch": 3293} {"train_loss": -6.759660243988037, "global_step": 138328, "epoch": 3293} {"train_loss": -6.8909101486206055, "global_step": 138329, "epoch": 3293} {"train_loss": -6.8226447105407715, "global_step": 138330, "epoch": 3293} {"train_loss": -6.788638591766357, "global_step": 138331, "epoch": 3293} {"train_loss": -6.686183929443359, "global_step": 138332, "epoch": 3293} {"train_loss": -6.811507701873779, "global_step": 138333, "epoch": 3293} {"train_loss": -6.75508975982666, "global_step": 138334, "epoch": 3293} {"train_loss": -6.694645404815674, "global_step": 138335, "epoch": 3293} {"train_loss": -6.740415573120117, "global_step": 138336, "epoch": 3293} {"train_loss": -6.793992042541504, "global_step": 138337, "epoch": 3293} {"train_loss": -6.67274284362793, "global_step": 138338, "epoch": 3293} {"train_loss": -6.741703510284424, "global_step": 138339, "epoch": 3293} {"train_loss": -6.722576141357422, "global_step": 138340, "epoch": 3293} {"train_loss": -6.747128486633301, "global_step": 138341, "epoch": 3293} {"train_loss": -6.759619235992432, "global_step": 138342, "epoch": 3293} {"train_loss": -6.627833366394043, "global_step": 138343, "epoch": 3293} {"train_loss": -6.789709091186523, "global_step": 138344, "epoch": 3293} {"train_loss": -6.737272262573242, "global_step": 138345, "epoch": 3293} {"train_loss": -6.757076263427734, "global_step": 138346, "epoch": 3293} {"train_loss": -6.745255038851783, "global_step": 138347, "epoch": 3293, "val_loss": 68178.4921875} {"train_loss": -6.8094282150268555, "global_step": 138348, "epoch": 3294} {"train_loss": -6.747459411621094, "global_step": 138349, "epoch": 3294} {"train_loss": -6.813214302062988, "global_step": 138350, "epoch": 3294} {"train_loss": -6.800312042236328, "global_step": 138351, "epoch": 3294} {"train_loss": -6.7106475830078125, "global_step": 138352, "epoch": 3294} {"train_loss": -6.82034969329834, "global_step": 138353, "epoch": 3294} {"train_loss": -6.740736484527588, "global_step": 138354, "epoch": 3294} {"train_loss": -6.742557525634766, "global_step": 138355, "epoch": 3294} {"train_loss": -6.691702842712402, "global_step": 138356, "epoch": 3294} {"train_loss": -6.783632278442383, "global_step": 138357, "epoch": 3294} {"train_loss": -6.738114356994629, "global_step": 138358, "epoch": 3294} {"train_loss": -6.777700424194336, "global_step": 138359, "epoch": 3294} {"train_loss": -6.755102157592773, "global_step": 138360, "epoch": 3294} {"train_loss": -6.663932800292969, "global_step": 138361, "epoch": 3294} {"train_loss": -6.76692008972168, "global_step": 138362, "epoch": 3294} {"train_loss": -6.787574291229248, "global_step": 138363, "epoch": 3294} {"train_loss": -6.674699306488037, "global_step": 138364, "epoch": 3294} {"train_loss": -6.766080856323242, "global_step": 138365, "epoch": 3294} {"train_loss": -6.609201908111572, "global_step": 138366, "epoch": 3294} {"train_loss": -6.7266926765441895, "global_step": 138367, "epoch": 3294} {"train_loss": -6.754443645477295, "global_step": 138368, "epoch": 3294} {"train_loss": -6.728378772735596, "global_step": 138369, "epoch": 3294} {"train_loss": -6.794195175170898, "global_step": 138370, "epoch": 3294} {"train_loss": -6.770737648010254, "global_step": 138371, "epoch": 3294} {"train_loss": -6.724483489990234, "global_step": 138372, "epoch": 3294} {"train_loss": -6.573221206665039, "global_step": 138373, "epoch": 3294} {"train_loss": -6.689167022705078, "global_step": 138374, "epoch": 3294} {"train_loss": -6.692917346954346, "global_step": 138375, "epoch": 3294} {"train_loss": -6.618744850158691, "global_step": 138376, "epoch": 3294} {"train_loss": -6.589096546173096, "global_step": 138377, "epoch": 3294} {"train_loss": -6.701061248779297, "global_step": 138378, "epoch": 3294} {"train_loss": -6.7421369552612305, "global_step": 138379, "epoch": 3294} {"train_loss": -6.593256950378418, "global_step": 138380, "epoch": 3294} {"train_loss": -6.687831878662109, "global_step": 138381, "epoch": 3294} {"train_loss": -6.755846977233887, "global_step": 138382, "epoch": 3294} {"train_loss": -6.7841081619262695, "global_step": 138383, "epoch": 3294} {"train_loss": -6.7381720542907715, "global_step": 138384, "epoch": 3294} {"train_loss": -6.708420753479004, "global_step": 138385, "epoch": 3294} {"train_loss": -6.663398742675781, "global_step": 138386, "epoch": 3294} {"train_loss": -6.5907697677612305, "global_step": 138387, "epoch": 3294} {"train_loss": -6.734096527099609, "global_step": 138388, "epoch": 3294} {"train_loss": -6.721374954496111, "global_step": 138389, "epoch": 3294, "val_loss": 68294.2890625} {"train_loss": -6.564001083374023, "global_step": 138390, "epoch": 3295} {"train_loss": -6.797519683837891, "global_step": 138391, "epoch": 3295} {"train_loss": -6.687185764312744, "global_step": 138392, "epoch": 3295} {"train_loss": -6.6897735595703125, "global_step": 138393, "epoch": 3295} {"train_loss": -6.672081470489502, "global_step": 138394, "epoch": 3295} {"train_loss": -6.591835021972656, "global_step": 138395, "epoch": 3295} {"train_loss": -6.719962120056152, "global_step": 138396, "epoch": 3295} {"train_loss": -6.798937797546387, "global_step": 138397, "epoch": 3295} {"train_loss": -6.676119327545166, "global_step": 138398, "epoch": 3295} {"train_loss": -6.646180152893066, "global_step": 138399, "epoch": 3295} {"train_loss": -6.663130283355713, "global_step": 138400, "epoch": 3295} {"train_loss": -6.69782829284668, "global_step": 138401, "epoch": 3295} {"train_loss": -6.692334175109863, "global_step": 138402, "epoch": 3295} {"train_loss": -6.677089214324951, "global_step": 138403, "epoch": 3295} {"train_loss": -6.6325178146362305, "global_step": 138404, "epoch": 3295} {"train_loss": -6.603827476501465, "global_step": 138405, "epoch": 3295} {"train_loss": -6.730600357055664, "global_step": 138406, "epoch": 3295} {"train_loss": -6.704891204833984, "global_step": 138407, "epoch": 3295} {"train_loss": -6.686944484710693, "global_step": 138408, "epoch": 3295} {"train_loss": -6.6935343742370605, "global_step": 138409, "epoch": 3295} {"train_loss": -6.733325958251953, "global_step": 138410, "epoch": 3295} {"train_loss": -6.648171901702881, "global_step": 138411, "epoch": 3295} {"train_loss": -6.729888916015625, "global_step": 138412, "epoch": 3295} {"train_loss": -6.660213947296143, "global_step": 138413, "epoch": 3295} {"train_loss": -6.653799533843994, "global_step": 138414, "epoch": 3295} {"train_loss": -6.7068891525268555, "global_step": 138415, "epoch": 3295} {"train_loss": -6.674482345581055, "global_step": 138416, "epoch": 3295} {"train_loss": -6.711085319519043, "global_step": 138417, "epoch": 3295} {"train_loss": -6.680746078491211, "global_step": 138418, "epoch": 3295} {"train_loss": -6.70689582824707, "global_step": 138419, "epoch": 3295} {"train_loss": -6.703949451446533, "global_step": 138420, "epoch": 3295} {"train_loss": -6.713879108428955, "global_step": 138421, "epoch": 3295} {"train_loss": -6.795190334320068, "global_step": 138422, "epoch": 3295} {"train_loss": -6.65424919128418, "global_step": 138423, "epoch": 3295} {"train_loss": -6.661759376525879, "global_step": 138424, "epoch": 3295} {"train_loss": -6.796052932739258, "global_step": 138425, "epoch": 3295} {"train_loss": -6.733853340148926, "global_step": 138426, "epoch": 3295} {"train_loss": -6.69862699508667, "global_step": 138427, "epoch": 3295} {"train_loss": -6.717390060424805, "global_step": 138428, "epoch": 3295} {"train_loss": -6.637956619262695, "global_step": 138429, "epoch": 3295} {"train_loss": -6.569643497467041, "global_step": 138430, "epoch": 3295} {"train_loss": -6.684972070512318, "global_step": 138431, "epoch": 3295, "val_loss": 68328.1015625} {"train_loss": -6.662553787231445, "global_step": 138432, "epoch": 3296} {"train_loss": -6.643514633178711, "global_step": 138433, "epoch": 3296} {"train_loss": -6.674673080444336, "global_step": 138434, "epoch": 3296} {"train_loss": -6.682554244995117, "global_step": 138435, "epoch": 3296} {"train_loss": -6.616158485412598, "global_step": 138436, "epoch": 3296} {"train_loss": -6.723414421081543, "global_step": 138437, "epoch": 3296} {"train_loss": -6.753208160400391, "global_step": 138438, "epoch": 3296} {"train_loss": -6.604527950286865, "global_step": 138439, "epoch": 3296} {"train_loss": -6.794137001037598, "global_step": 138440, "epoch": 3296} {"train_loss": -6.563659191131592, "global_step": 138441, "epoch": 3296} {"train_loss": -6.652154922485352, "global_step": 138442, "epoch": 3296} {"train_loss": -6.682070732116699, "global_step": 138443, "epoch": 3296} {"train_loss": -6.803251266479492, "global_step": 138444, "epoch": 3296} {"train_loss": -6.79443883895874, "global_step": 138445, "epoch": 3296} {"train_loss": -6.677545547485352, "global_step": 138446, "epoch": 3296} {"train_loss": -6.695611000061035, "global_step": 138447, "epoch": 3296} {"train_loss": -6.655217170715332, "global_step": 138448, "epoch": 3296} {"train_loss": -6.719787120819092, "global_step": 138449, "epoch": 3296} {"train_loss": -6.6994757652282715, "global_step": 138450, "epoch": 3296} {"train_loss": -6.602790832519531, "global_step": 138451, "epoch": 3296} {"train_loss": -6.7230377197265625, "global_step": 138452, "epoch": 3296} {"train_loss": -6.671512603759766, "global_step": 138453, "epoch": 3296} {"train_loss": -6.751603126525879, "global_step": 138454, "epoch": 3296} {"train_loss": -6.6550703048706055, "global_step": 138455, "epoch": 3296} {"train_loss": -6.709514617919922, "global_step": 138456, "epoch": 3296} {"train_loss": -6.72011661529541, "global_step": 138457, "epoch": 3296} {"train_loss": -6.757983207702637, "global_step": 138458, "epoch": 3296} {"train_loss": -6.750782012939453, "global_step": 138459, "epoch": 3296} {"train_loss": -6.600702285766602, "global_step": 138460, "epoch": 3296} {"train_loss": -6.689609527587891, "global_step": 138461, "epoch": 3296} {"train_loss": -6.681533336639404, "global_step": 138462, "epoch": 3296} {"train_loss": -6.666017532348633, "global_step": 138463, "epoch": 3296} {"train_loss": -6.740513801574707, "global_step": 138464, "epoch": 3296} {"train_loss": -6.667231559753418, "global_step": 138465, "epoch": 3296} {"train_loss": -6.709609508514404, "global_step": 138466, "epoch": 3296} {"train_loss": -6.741389274597168, "global_step": 138467, "epoch": 3296} {"train_loss": -6.812797546386719, "global_step": 138468, "epoch": 3296} {"train_loss": -6.659211158752441, "global_step": 138469, "epoch": 3296} {"train_loss": -6.616329669952393, "global_step": 138470, "epoch": 3296} {"train_loss": -6.730767250061035, "global_step": 138471, "epoch": 3296} {"train_loss": -6.63190221786499, "global_step": 138472, "epoch": 3296} {"train_loss": -6.693794193721953, "global_step": 138473, "epoch": 3296, "val_loss": 68229.34375} {"train_loss": -6.7637619972229, "global_step": 138474, "epoch": 3297} {"train_loss": -6.794842720031738, "global_step": 138475, "epoch": 3297} {"train_loss": -6.733259201049805, "global_step": 138476, "epoch": 3297} {"train_loss": -6.672842025756836, "global_step": 138477, "epoch": 3297} {"train_loss": -6.646226406097412, "global_step": 138478, "epoch": 3297} {"train_loss": -6.683416366577148, "global_step": 138479, "epoch": 3297} {"train_loss": -6.765684604644775, "global_step": 138480, "epoch": 3297} {"train_loss": -6.702549934387207, "global_step": 138481, "epoch": 3297} {"train_loss": -6.879387855529785, "global_step": 138482, "epoch": 3297} {"train_loss": -6.890074253082275, "global_step": 138483, "epoch": 3297} {"train_loss": -6.795050621032715, "global_step": 138484, "epoch": 3297} {"train_loss": -6.716900825500488, "global_step": 138485, "epoch": 3297} {"train_loss": -6.733617782592773, "global_step": 138486, "epoch": 3297} {"train_loss": -6.71980094909668, "global_step": 138487, "epoch": 3297} {"train_loss": -6.767897605895996, "global_step": 138488, "epoch": 3297} {"train_loss": -6.714454650878906, "global_step": 138489, "epoch": 3297} {"train_loss": -6.736782550811768, "global_step": 138490, "epoch": 3297} {"train_loss": -6.74330472946167, "global_step": 138491, "epoch": 3297} {"train_loss": -6.7351393699646, "global_step": 138492, "epoch": 3297} {"train_loss": -6.738617897033691, "global_step": 138493, "epoch": 3297} {"train_loss": -6.756547451019287, "global_step": 138494, "epoch": 3297} {"train_loss": -6.687443733215332, "global_step": 138495, "epoch": 3297} {"train_loss": -6.762465953826904, "global_step": 138496, "epoch": 3297} {"train_loss": -6.822950839996338, "global_step": 138497, "epoch": 3297} {"train_loss": -6.75881290435791, "global_step": 138498, "epoch": 3297} {"train_loss": -6.794543743133545, "global_step": 138499, "epoch": 3297} {"train_loss": -6.654109954833984, "global_step": 138500, "epoch": 3297} {"train_loss": -6.711795806884766, "global_step": 138501, "epoch": 3297} {"train_loss": -6.692526817321777, "global_step": 138502, "epoch": 3297} {"train_loss": -6.809257507324219, "global_step": 138503, "epoch": 3297} {"train_loss": -6.634907245635986, "global_step": 138504, "epoch": 3297} {"train_loss": -6.642573833465576, "global_step": 138505, "epoch": 3297} {"train_loss": -6.674118995666504, "global_step": 138506, "epoch": 3297} {"train_loss": -6.647216320037842, "global_step": 138507, "epoch": 3297} {"train_loss": -6.634361743927002, "global_step": 138508, "epoch": 3297} {"train_loss": -6.774991035461426, "global_step": 138509, "epoch": 3297} {"train_loss": -6.731074810028076, "global_step": 138510, "epoch": 3297} {"train_loss": -6.759805679321289, "global_step": 138511, "epoch": 3297} {"train_loss": -6.836239814758301, "global_step": 138512, "epoch": 3297} {"train_loss": -6.640586853027344, "global_step": 138513, "epoch": 3297} {"train_loss": -6.735032558441162, "global_step": 138514, "epoch": 3297} {"train_loss": -6.73321178981236, "global_step": 138515, "epoch": 3297, "val_loss": 68255.03125} {"train_loss": -6.719365119934082, "global_step": 138516, "epoch": 3298} {"train_loss": -6.718489170074463, "global_step": 138517, "epoch": 3298} {"train_loss": -6.728134632110596, "global_step": 138518, "epoch": 3298} {"train_loss": -6.753173828125, "global_step": 138519, "epoch": 3298} {"train_loss": -6.826228141784668, "global_step": 138520, "epoch": 3298} {"train_loss": -6.736396789550781, "global_step": 138521, "epoch": 3298} {"train_loss": -6.751296043395996, "global_step": 138522, "epoch": 3298} {"train_loss": -6.628779411315918, "global_step": 138523, "epoch": 3298} {"train_loss": -6.7599945068359375, "global_step": 138524, "epoch": 3298} {"train_loss": -6.701994895935059, "global_step": 138525, "epoch": 3298} {"train_loss": -6.797036170959473, "global_step": 138526, "epoch": 3298} {"train_loss": -6.6904802322387695, "global_step": 138527, "epoch": 3298} {"train_loss": -6.696489334106445, "global_step": 138528, "epoch": 3298} {"train_loss": -6.7601318359375, "global_step": 138529, "epoch": 3298} {"train_loss": -6.729668140411377, "global_step": 138530, "epoch": 3298} {"train_loss": -6.646390914916992, "global_step": 138531, "epoch": 3298} {"train_loss": -6.799582481384277, "global_step": 138532, "epoch": 3298} {"train_loss": -6.752499580383301, "global_step": 138533, "epoch": 3298} {"train_loss": -6.819685935974121, "global_step": 138534, "epoch": 3298} {"train_loss": -6.776731014251709, "global_step": 138535, "epoch": 3298} {"train_loss": -6.733092308044434, "global_step": 138536, "epoch": 3298} {"train_loss": -6.673160552978516, "global_step": 138537, "epoch": 3298} {"train_loss": -6.933484077453613, "global_step": 138538, "epoch": 3298} {"train_loss": -6.6589460372924805, "global_step": 138539, "epoch": 3298} {"train_loss": -6.767926216125488, "global_step": 138540, "epoch": 3298} {"train_loss": -6.654191017150879, "global_step": 138541, "epoch": 3298} {"train_loss": -6.801772117614746, "global_step": 138542, "epoch": 3298} {"train_loss": -6.709399223327637, "global_step": 138543, "epoch": 3298} {"train_loss": -6.7575225830078125, "global_step": 138544, "epoch": 3298} {"train_loss": -6.751665115356445, "global_step": 138545, "epoch": 3298} {"train_loss": -6.809996128082275, "global_step": 138546, "epoch": 3298} {"train_loss": -6.770665645599365, "global_step": 138547, "epoch": 3298} {"train_loss": -6.7645063400268555, "global_step": 138548, "epoch": 3298} {"train_loss": -6.718602180480957, "global_step": 138549, "epoch": 3298} {"train_loss": -6.674403190612793, "global_step": 138550, "epoch": 3298} {"train_loss": -6.790618896484375, "global_step": 138551, "epoch": 3298} {"train_loss": -6.709717750549316, "global_step": 138552, "epoch": 3298} {"train_loss": -6.697904586791992, "global_step": 138553, "epoch": 3298} {"train_loss": -6.692319869995117, "global_step": 138554, "epoch": 3298} {"train_loss": -6.677768230438232, "global_step": 138555, "epoch": 3298} {"train_loss": -6.635809898376465, "global_step": 138556, "epoch": 3298} {"train_loss": -6.734677314758301, "global_step": 138557, "epoch": 3298, "val_loss": 68341.9453125} {"train_loss": -6.6682915687561035, "global_step": 138558, "epoch": 3299} {"train_loss": -6.72261905670166, "global_step": 138559, "epoch": 3299} {"train_loss": -6.761448860168457, "global_step": 138560, "epoch": 3299} {"train_loss": -6.742447376251221, "global_step": 138561, "epoch": 3299} {"train_loss": -6.811238765716553, "global_step": 138562, "epoch": 3299} {"train_loss": -6.715739727020264, "global_step": 138563, "epoch": 3299} {"train_loss": -6.843790054321289, "global_step": 138564, "epoch": 3299} {"train_loss": -6.740577220916748, "global_step": 138565, "epoch": 3299} {"train_loss": -6.68741512298584, "global_step": 138566, "epoch": 3299} {"train_loss": -6.752642631530762, "global_step": 138567, "epoch": 3299} {"train_loss": -6.6223273277282715, "global_step": 138568, "epoch": 3299} {"train_loss": -6.631463050842285, "global_step": 138569, "epoch": 3299} {"train_loss": -6.834436416625977, "global_step": 138570, "epoch": 3299} {"train_loss": -6.639751434326172, "global_step": 138571, "epoch": 3299} {"train_loss": -6.7353620529174805, "global_step": 138572, "epoch": 3299} {"train_loss": -6.744657516479492, "global_step": 138573, "epoch": 3299} {"train_loss": -6.76580810546875, "global_step": 138574, "epoch": 3299} {"train_loss": -6.708637714385986, "global_step": 138575, "epoch": 3299} {"train_loss": -6.8097333908081055, "global_step": 138576, "epoch": 3299} {"train_loss": -6.641199111938477, "global_step": 138577, "epoch": 3299} {"train_loss": -6.683614730834961, "global_step": 138578, "epoch": 3299} {"train_loss": -6.666689395904541, "global_step": 138579, "epoch": 3299} {"train_loss": -6.6568379402160645, "global_step": 138580, "epoch": 3299} {"train_loss": -6.711651802062988, "global_step": 138581, "epoch": 3299} {"train_loss": -6.680014610290527, "global_step": 138582, "epoch": 3299} {"train_loss": -6.782710552215576, "global_step": 138583, "epoch": 3299} {"train_loss": -6.7361369132995605, "global_step": 138584, "epoch": 3299} {"train_loss": -6.608366012573242, "global_step": 138585, "epoch": 3299} {"train_loss": -6.702223777770996, "global_step": 138586, "epoch": 3299} {"train_loss": -6.636120319366455, "global_step": 138587, "epoch": 3299} {"train_loss": -6.709429740905762, "global_step": 138588, "epoch": 3299} {"train_loss": -6.830386161804199, "global_step": 138589, "epoch": 3299} {"train_loss": -6.74269962310791, "global_step": 138590, "epoch": 3299} {"train_loss": -6.693841934204102, "global_step": 138591, "epoch": 3299} {"train_loss": -6.691125869750977, "global_step": 138592, "epoch": 3299} {"train_loss": -6.698535919189453, "global_step": 138593, "epoch": 3299} {"train_loss": -6.743498802185059, "global_step": 138594, "epoch": 3299} {"train_loss": -6.726645469665527, "global_step": 138595, "epoch": 3299} {"train_loss": -6.605071067810059, "global_step": 138596, "epoch": 3299} {"train_loss": -6.641875743865967, "global_step": 138597, "epoch": 3299} {"train_loss": -6.571972370147705, "global_step": 138598, "epoch": 3299} {"train_loss": -6.707856814066569, "global_step": 138599, "epoch": 3299, "val_loss": 68553.109375} {"train_loss": -6.674676895141602, "global_step": 138600, "epoch": 3300} {"train_loss": -6.537207126617432, "global_step": 138601, "epoch": 3300} {"train_loss": -6.576127529144287, "global_step": 138602, "epoch": 3300} {"train_loss": -6.462991714477539, "global_step": 138603, "epoch": 3300} {"train_loss": -6.603069305419922, "global_step": 138604, "epoch": 3300} {"train_loss": -6.534002304077148, "global_step": 138605, "epoch": 3300} {"train_loss": -6.612065315246582, "global_step": 138606, "epoch": 3300} {"train_loss": -6.7079877853393555, "global_step": 138607, "epoch": 3300} {"train_loss": -6.59312629699707, "global_step": 138608, "epoch": 3300} {"train_loss": -6.629971504211426, "global_step": 138609, "epoch": 3300} {"train_loss": -6.730637550354004, "global_step": 138610, "epoch": 3300} {"train_loss": -6.692202568054199, "global_step": 138611, "epoch": 3300} {"train_loss": -6.707518577575684, "global_step": 138612, "epoch": 3300} {"train_loss": -6.690822601318359, "global_step": 138613, "epoch": 3300} {"train_loss": -6.740259170532227, "global_step": 138614, "epoch": 3300} {"train_loss": -6.701749801635742, "global_step": 138615, "epoch": 3300} {"train_loss": -6.612420082092285, "global_step": 138616, "epoch": 3300} {"train_loss": -6.50927734375, "global_step": 138617, "epoch": 3300} {"train_loss": -6.715040683746338, "global_step": 138618, "epoch": 3300} {"train_loss": -6.6414361000061035, "global_step": 138619, "epoch": 3300} {"train_loss": -6.760334491729736, "global_step": 138620, "epoch": 3300} {"train_loss": -6.698943614959717, "global_step": 138621, "epoch": 3300} {"train_loss": -6.623733043670654, "global_step": 138622, "epoch": 3300} {"train_loss": -6.735282897949219, "global_step": 138623, "epoch": 3300} {"train_loss": -6.877793312072754, "global_step": 138624, "epoch": 3300} {"train_loss": -6.657050132751465, "global_step": 138625, "epoch": 3300} {"train_loss": -6.664860725402832, "global_step": 138626, "epoch": 3300} {"train_loss": -6.650332450866699, "global_step": 138627, "epoch": 3300} {"train_loss": -6.725030899047852, "global_step": 138628, "epoch": 3300} {"train_loss": -6.636706352233887, "global_step": 138629, "epoch": 3300} {"train_loss": -6.633612632751465, "global_step": 138630, "epoch": 3300} {"train_loss": -6.671100616455078, "global_step": 138631, "epoch": 3300} {"train_loss": -6.734821319580078, "global_step": 138632, "epoch": 3300} {"train_loss": -6.830136299133301, "global_step": 138633, "epoch": 3300} {"train_loss": -6.650726795196533, "global_step": 138634, "epoch": 3300} {"train_loss": -6.691625595092773, "global_step": 138635, "epoch": 3300} {"train_loss": -6.72409725189209, "global_step": 138636, "epoch": 3300} {"train_loss": -6.5901689529418945, "global_step": 138637, "epoch": 3300} {"train_loss": -6.676428318023682, "global_step": 138638, "epoch": 3300} {"train_loss": -6.663539886474609, "global_step": 138639, "epoch": 3300} {"train_loss": -6.691195964813232, "global_step": 138640, "epoch": 3300} {"train_loss": -6.665634756996518, "global_step": 138641, "epoch": 3300, "train/sim_max_reward_0": 0.995716195592291, "train/sim_max_reward_1": 0.8662432545558606, "train/sim_max_reward_2": 0.5435532573761753, "train/sim_max_reward_3": 0.11637661641771709, "train/sim_max_reward_4": 0.8393806906651134, "train/sim_max_reward_5": 0.5728659157521601, "test/sim_max_reward_4400000": 0.152111812965604, "test/sim_max_reward_4400001": 0.9726244279150079, "test/sim_max_reward_4400002": 0.5064599294229143, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.24330384182391251, "test/sim_max_reward_4400006": 0.8485446869411153, "test/sim_max_reward_4400007": 0.8293250600458945, "test/sim_max_reward_4400008": 0.3024973809876018, "test/sim_max_reward_4400009": 0.8648453580484126, "test/sim_max_reward_4400010": 0.2696871430228578, "test/sim_max_reward_4400011": 0.28492834994602656, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9365185753403751, "test/sim_max_reward_4400014": 0.9150998434652491, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.14035674665017608, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24491191414734426, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9481319087516111, "test/sim_max_reward_4400023": 0.8755067472238683, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.2706434816527314, "test/sim_max_reward_4400026": 0.8305606803592521, "test/sim_max_reward_4400027": 0.0057004877544381966, "test/sim_max_reward_4400028": 0.9446043231350296, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.8916504593583371, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8314790931942434, "test/sim_max_reward_4400034": 0.8409282202530801, "test/sim_max_reward_4400035": 0.558794723382371, "test/sim_max_reward_4400036": 0.3970524917190837, "test/sim_max_reward_4400037": 0.9276053635380459, "test/sim_max_reward_4400038": 0.9918766244067525, "test/sim_max_reward_4400039": 0.7981806115589057, "test/sim_max_reward_4400040": 0.9403131774995629, "test/sim_max_reward_4400041": 0.9666735556957075, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.8794043370533683, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8140806692411636, "test/sim_max_reward_4400047": 0.9408624498884808, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.857149878485649, "train/mean_score": 0.6556893217265529, "test/mean_score": 0.592735028130751, "val_loss": 68187.28125} {"train_loss": -6.718726634979248, "global_step": 138642, "epoch": 3301} {"train_loss": -6.813600540161133, "global_step": 138643, "epoch": 3301} {"train_loss": -6.704416275024414, "global_step": 138644, "epoch": 3301} {"train_loss": -6.726202011108398, "global_step": 138645, "epoch": 3301} {"train_loss": -6.752904891967773, "global_step": 138646, "epoch": 3301} {"train_loss": -6.852971076965332, "global_step": 138647, "epoch": 3301} {"train_loss": -6.712586879730225, "global_step": 138648, "epoch": 3301} {"train_loss": -6.720076560974121, "global_step": 138649, "epoch": 3301} {"train_loss": -6.771984577178955, "global_step": 138650, "epoch": 3301} {"train_loss": -6.727688789367676, "global_step": 138651, "epoch": 3301} {"train_loss": -6.830470561981201, "global_step": 138652, "epoch": 3301} {"train_loss": -6.653745174407959, "global_step": 138653, "epoch": 3301} {"train_loss": -6.696872711181641, "global_step": 138654, "epoch": 3301} {"train_loss": -6.656909942626953, "global_step": 138655, "epoch": 3301} {"train_loss": -6.702971458435059, "global_step": 138656, "epoch": 3301} {"train_loss": -6.766408920288086, "global_step": 138657, "epoch": 3301} {"train_loss": -6.746631622314453, "global_step": 138658, "epoch": 3301} {"train_loss": -6.7497782707214355, "global_step": 138659, "epoch": 3301} {"train_loss": -6.817202091217041, "global_step": 138660, "epoch": 3301} {"train_loss": -6.676357746124268, "global_step": 138661, "epoch": 3301} {"train_loss": -6.722267150878906, "global_step": 138662, "epoch": 3301} {"train_loss": -6.692163467407227, "global_step": 138663, "epoch": 3301} {"train_loss": -6.63743257522583, "global_step": 138664, "epoch": 3301} {"train_loss": -6.653369903564453, "global_step": 138665, "epoch": 3301} {"train_loss": -6.595541954040527, "global_step": 138666, "epoch": 3301} {"train_loss": -6.755223751068115, "global_step": 138667, "epoch": 3301} {"train_loss": -6.774621486663818, "global_step": 138668, "epoch": 3301} {"train_loss": -6.644623756408691, "global_step": 138669, "epoch": 3301} {"train_loss": -6.804089069366455, "global_step": 138670, "epoch": 3301} {"train_loss": -6.688249588012695, "global_step": 138671, "epoch": 3301} {"train_loss": -6.715819358825684, "global_step": 138672, "epoch": 3301} {"train_loss": -6.655675888061523, "global_step": 138673, "epoch": 3301} {"train_loss": -6.823871612548828, "global_step": 138674, "epoch": 3301} {"train_loss": -6.795597553253174, "global_step": 138675, "epoch": 3301} {"train_loss": -6.63463830947876, "global_step": 138676, "epoch": 3301} {"train_loss": -6.693187713623047, "global_step": 138677, "epoch": 3301} {"train_loss": -6.55833625793457, "global_step": 138678, "epoch": 3301} {"train_loss": -6.565089225769043, "global_step": 138679, "epoch": 3301} {"train_loss": -6.615758419036865, "global_step": 138680, "epoch": 3301} {"train_loss": -6.739920616149902, "global_step": 138681, "epoch": 3301} {"train_loss": -6.710036754608154, "global_step": 138682, "epoch": 3301} {"train_loss": -6.710104329245431, "global_step": 138683, "epoch": 3301, "val_loss": 68648.40625} {"train_loss": -6.6736741065979, "global_step": 138684, "epoch": 3302} {"train_loss": -6.627283096313477, "global_step": 138685, "epoch": 3302} {"train_loss": -6.669506549835205, "global_step": 138686, "epoch": 3302} {"train_loss": -6.694571018218994, "global_step": 138687, "epoch": 3302} {"train_loss": -6.600128173828125, "global_step": 138688, "epoch": 3302} {"train_loss": -6.671070575714111, "global_step": 138689, "epoch": 3302} {"train_loss": -6.561087131500244, "global_step": 138690, "epoch": 3302} {"train_loss": -6.67820405960083, "global_step": 138691, "epoch": 3302} {"train_loss": -6.647688865661621, "global_step": 138692, "epoch": 3302} {"train_loss": -6.667087554931641, "global_step": 138693, "epoch": 3302} {"train_loss": -6.702632427215576, "global_step": 138694, "epoch": 3302} {"train_loss": -6.73203182220459, "global_step": 138695, "epoch": 3302} {"train_loss": -6.662207126617432, "global_step": 138696, "epoch": 3302} {"train_loss": -6.778120040893555, "global_step": 138697, "epoch": 3302} {"train_loss": -6.575656890869141, "global_step": 138698, "epoch": 3302} {"train_loss": -6.635863304138184, "global_step": 138699, "epoch": 3302} {"train_loss": -6.711268424987793, "global_step": 138700, "epoch": 3302} {"train_loss": -6.714533805847168, "global_step": 138701, "epoch": 3302} {"train_loss": -6.714044094085693, "global_step": 138702, "epoch": 3302} {"train_loss": -6.816530227661133, "global_step": 138703, "epoch": 3302} {"train_loss": -6.796240329742432, "global_step": 138704, "epoch": 3302} {"train_loss": -6.784144401550293, "global_step": 138705, "epoch": 3302} {"train_loss": -6.685266971588135, "global_step": 138706, "epoch": 3302} {"train_loss": -6.693994522094727, "global_step": 138707, "epoch": 3302} {"train_loss": -6.674150466918945, "global_step": 138708, "epoch": 3302} {"train_loss": -6.7654266357421875, "global_step": 138709, "epoch": 3302} {"train_loss": -6.746128082275391, "global_step": 138710, "epoch": 3302} {"train_loss": -6.706166744232178, "global_step": 138711, "epoch": 3302} {"train_loss": -6.745722770690918, "global_step": 138712, "epoch": 3302} {"train_loss": -6.689039707183838, "global_step": 138713, "epoch": 3302} {"train_loss": -6.738512992858887, "global_step": 138714, "epoch": 3302} {"train_loss": -6.740014553070068, "global_step": 138715, "epoch": 3302} {"train_loss": -6.7258477210998535, "global_step": 138716, "epoch": 3302} {"train_loss": -6.7001495361328125, "global_step": 138717, "epoch": 3302} {"train_loss": -6.653783798217773, "global_step": 138718, "epoch": 3302} {"train_loss": -6.678412437438965, "global_step": 138719, "epoch": 3302} {"train_loss": -6.752269744873047, "global_step": 138720, "epoch": 3302} {"train_loss": -6.720822334289551, "global_step": 138721, "epoch": 3302} {"train_loss": -6.658590316772461, "global_step": 138722, "epoch": 3302} {"train_loss": -6.7627787590026855, "global_step": 138723, "epoch": 3302} {"train_loss": -6.656880855560303, "global_step": 138724, "epoch": 3302} {"train_loss": -6.697630428132557, "global_step": 138725, "epoch": 3302, "val_loss": 68254.7421875} {"train_loss": -6.769570350646973, "global_step": 138726, "epoch": 3303} {"train_loss": -6.785196304321289, "global_step": 138727, "epoch": 3303} {"train_loss": -6.625166893005371, "global_step": 138728, "epoch": 3303} {"train_loss": -6.718448638916016, "global_step": 138729, "epoch": 3303} {"train_loss": -6.7774529457092285, "global_step": 138730, "epoch": 3303} {"train_loss": -6.8617048263549805, "global_step": 138731, "epoch": 3303} {"train_loss": -6.737295150756836, "global_step": 138732, "epoch": 3303} {"train_loss": -6.7144670486450195, "global_step": 138733, "epoch": 3303} {"train_loss": -6.638654708862305, "global_step": 138734, "epoch": 3303} {"train_loss": -6.577080249786377, "global_step": 138735, "epoch": 3303} {"train_loss": -6.67034912109375, "global_step": 138736, "epoch": 3303} {"train_loss": -6.604951858520508, "global_step": 138737, "epoch": 3303} {"train_loss": -6.672076225280762, "global_step": 138738, "epoch": 3303} {"train_loss": -6.727181911468506, "global_step": 138739, "epoch": 3303} {"train_loss": -6.677284240722656, "global_step": 138740, "epoch": 3303} {"train_loss": -6.6777849197387695, "global_step": 138741, "epoch": 3303} {"train_loss": -6.780368328094482, "global_step": 138742, "epoch": 3303} {"train_loss": -6.729518413543701, "global_step": 138743, "epoch": 3303} {"train_loss": -6.636408805847168, "global_step": 138744, "epoch": 3303} {"train_loss": -6.808140754699707, "global_step": 138745, "epoch": 3303} {"train_loss": -6.6414947509765625, "global_step": 138746, "epoch": 3303} {"train_loss": -6.659940242767334, "global_step": 138747, "epoch": 3303} {"train_loss": -6.685264587402344, "global_step": 138748, "epoch": 3303} {"train_loss": -6.804284572601318, "global_step": 138749, "epoch": 3303} {"train_loss": -6.676600456237793, "global_step": 138750, "epoch": 3303} {"train_loss": -6.690948009490967, "global_step": 138751, "epoch": 3303} {"train_loss": -6.682622909545898, "global_step": 138752, "epoch": 3303} {"train_loss": -6.672911643981934, "global_step": 138753, "epoch": 3303} {"train_loss": -6.640724182128906, "global_step": 138754, "epoch": 3303} {"train_loss": -6.785423278808594, "global_step": 138755, "epoch": 3303} {"train_loss": -6.677050590515137, "global_step": 138756, "epoch": 3303} {"train_loss": -6.689450263977051, "global_step": 138757, "epoch": 3303} {"train_loss": -6.677792072296143, "global_step": 138758, "epoch": 3303} {"train_loss": -6.713498115539551, "global_step": 138759, "epoch": 3303} {"train_loss": -6.740938186645508, "global_step": 138760, "epoch": 3303} {"train_loss": -6.688777923583984, "global_step": 138761, "epoch": 3303} {"train_loss": -6.716954231262207, "global_step": 138762, "epoch": 3303} {"train_loss": -6.703697681427002, "global_step": 138763, "epoch": 3303} {"train_loss": -6.797504901885986, "global_step": 138764, "epoch": 3303} {"train_loss": -6.7437896728515625, "global_step": 138765, "epoch": 3303} {"train_loss": -6.7961812019348145, "global_step": 138766, "epoch": 3303} {"train_loss": -6.708869162059965, "global_step": 138767, "epoch": 3303, "val_loss": 68303.8515625} {"train_loss": -6.612213134765625, "global_step": 138768, "epoch": 3304} {"train_loss": -6.766012668609619, "global_step": 138769, "epoch": 3304} {"train_loss": -6.732405662536621, "global_step": 138770, "epoch": 3304} {"train_loss": -6.751646995544434, "global_step": 138771, "epoch": 3304} {"train_loss": -6.790543079376221, "global_step": 138772, "epoch": 3304} {"train_loss": -6.757508277893066, "global_step": 138773, "epoch": 3304} {"train_loss": -6.784830093383789, "global_step": 138774, "epoch": 3304} {"train_loss": -6.879159450531006, "global_step": 138775, "epoch": 3304} {"train_loss": -6.677495956420898, "global_step": 138776, "epoch": 3304} {"train_loss": -6.726207733154297, "global_step": 138777, "epoch": 3304} {"train_loss": -6.744683265686035, "global_step": 138778, "epoch": 3304} {"train_loss": -6.789346694946289, "global_step": 138779, "epoch": 3304} {"train_loss": -6.670550346374512, "global_step": 138780, "epoch": 3304} {"train_loss": -6.703001022338867, "global_step": 138781, "epoch": 3304} {"train_loss": -6.773630142211914, "global_step": 138782, "epoch": 3304} {"train_loss": -6.725236892700195, "global_step": 138783, "epoch": 3304} {"train_loss": -6.83648681640625, "global_step": 138784, "epoch": 3304} {"train_loss": -6.833558082580566, "global_step": 138785, "epoch": 3304} {"train_loss": -6.842931270599365, "global_step": 138786, "epoch": 3304} {"train_loss": -6.714419364929199, "global_step": 138787, "epoch": 3304} {"train_loss": -6.723886489868164, "global_step": 138788, "epoch": 3304} {"train_loss": -6.654609680175781, "global_step": 138789, "epoch": 3304} {"train_loss": -6.725519180297852, "global_step": 138790, "epoch": 3304} {"train_loss": -6.648152828216553, "global_step": 138791, "epoch": 3304} {"train_loss": -6.755795955657959, "global_step": 138792, "epoch": 3304} {"train_loss": -6.703004837036133, "global_step": 138793, "epoch": 3304} {"train_loss": -6.6827592849731445, "global_step": 138794, "epoch": 3304} {"train_loss": -6.700366497039795, "global_step": 138795, "epoch": 3304} {"train_loss": -6.677955150604248, "global_step": 138796, "epoch": 3304} {"train_loss": -6.622156620025635, "global_step": 138797, "epoch": 3304} {"train_loss": -6.652560234069824, "global_step": 138798, "epoch": 3304} {"train_loss": -6.6424055099487305, "global_step": 138799, "epoch": 3304} {"train_loss": -6.70632266998291, "global_step": 138800, "epoch": 3304} {"train_loss": -6.593478202819824, "global_step": 138801, "epoch": 3304} {"train_loss": -6.620516777038574, "global_step": 138802, "epoch": 3304} {"train_loss": -6.746257305145264, "global_step": 138803, "epoch": 3304} {"train_loss": -6.561011791229248, "global_step": 138804, "epoch": 3304} {"train_loss": -6.6608686447143555, "global_step": 138805, "epoch": 3304} {"train_loss": -6.665688514709473, "global_step": 138806, "epoch": 3304} {"train_loss": -6.624855041503906, "global_step": 138807, "epoch": 3304} {"train_loss": -6.650348663330078, "global_step": 138808, "epoch": 3304} {"train_loss": -6.708912792659941, "global_step": 138809, "epoch": 3304, "val_loss": 68224.4921875} {"train_loss": -6.6825432777404785, "global_step": 138810, "epoch": 3305} {"train_loss": -6.673804759979248, "global_step": 138811, "epoch": 3305} {"train_loss": -6.733513832092285, "global_step": 138812, "epoch": 3305} {"train_loss": -6.671988487243652, "global_step": 138813, "epoch": 3305} {"train_loss": -6.608194351196289, "global_step": 138814, "epoch": 3305} {"train_loss": -6.702603816986084, "global_step": 138815, "epoch": 3305} {"train_loss": -6.64058780670166, "global_step": 138816, "epoch": 3305} {"train_loss": -6.622186660766602, "global_step": 138817, "epoch": 3305} {"train_loss": -6.788013458251953, "global_step": 138818, "epoch": 3305} {"train_loss": -6.749096870422363, "global_step": 138819, "epoch": 3305} {"train_loss": -6.594998836517334, "global_step": 138820, "epoch": 3305} {"train_loss": -6.64699649810791, "global_step": 138821, "epoch": 3305} {"train_loss": -6.714572429656982, "global_step": 138822, "epoch": 3305} {"train_loss": -6.7253031730651855, "global_step": 138823, "epoch": 3305} {"train_loss": -6.7419328689575195, "global_step": 138824, "epoch": 3305} {"train_loss": -6.6621856689453125, "global_step": 138825, "epoch": 3305} {"train_loss": -6.641095161437988, "global_step": 138826, "epoch": 3305} {"train_loss": -6.7138261795043945, "global_step": 138827, "epoch": 3305} {"train_loss": -6.578311920166016, "global_step": 138828, "epoch": 3305} {"train_loss": -6.644115447998047, "global_step": 138829, "epoch": 3305} {"train_loss": -6.67990255355835, "global_step": 138830, "epoch": 3305} {"train_loss": -6.4921674728393555, "global_step": 138831, "epoch": 3305} {"train_loss": -6.70346212387085, "global_step": 138832, "epoch": 3305} {"train_loss": -6.45430850982666, "global_step": 138833, "epoch": 3305} {"train_loss": -6.516513824462891, "global_step": 138834, "epoch": 3305} {"train_loss": -6.618108749389648, "global_step": 138835, "epoch": 3305} {"train_loss": -6.564275741577148, "global_step": 138836, "epoch": 3305} {"train_loss": -6.679800033569336, "global_step": 138837, "epoch": 3305} {"train_loss": -6.76212215423584, "global_step": 138838, "epoch": 3305} {"train_loss": -6.654847145080566, "global_step": 138839, "epoch": 3305} {"train_loss": -6.52154541015625, "global_step": 138840, "epoch": 3305} {"train_loss": -6.541411876678467, "global_step": 138841, "epoch": 3305} {"train_loss": -6.641136169433594, "global_step": 138842, "epoch": 3305} {"train_loss": -6.584847450256348, "global_step": 138843, "epoch": 3305} {"train_loss": -6.581830978393555, "global_step": 138844, "epoch": 3305} {"train_loss": -6.636260986328125, "global_step": 138845, "epoch": 3305} {"train_loss": -6.70152473449707, "global_step": 138846, "epoch": 3305} {"train_loss": -6.809450149536133, "global_step": 138847, "epoch": 3305} {"train_loss": -6.744172096252441, "global_step": 138848, "epoch": 3305} {"train_loss": -6.744269371032715, "global_step": 138849, "epoch": 3305} {"train_loss": -6.760602951049805, "global_step": 138850, "epoch": 3305} {"train_loss": -6.659065030869984, "global_step": 138851, "epoch": 3305, "val_loss": 68324.8671875} {"train_loss": -6.637479782104492, "global_step": 138852, "epoch": 3306} {"train_loss": -6.646755695343018, "global_step": 138853, "epoch": 3306} {"train_loss": -6.546049118041992, "global_step": 138854, "epoch": 3306} {"train_loss": -6.616909980773926, "global_step": 138855, "epoch": 3306} {"train_loss": -6.801052570343018, "global_step": 138856, "epoch": 3306} {"train_loss": -6.6269426345825195, "global_step": 138857, "epoch": 3306} {"train_loss": -6.678836822509766, "global_step": 138858, "epoch": 3306} {"train_loss": -6.751469135284424, "global_step": 138859, "epoch": 3306} {"train_loss": -6.73313570022583, "global_step": 138860, "epoch": 3306} {"train_loss": -6.752734184265137, "global_step": 138861, "epoch": 3306} {"train_loss": -6.783980369567871, "global_step": 138862, "epoch": 3306} {"train_loss": -6.828124046325684, "global_step": 138863, "epoch": 3306} {"train_loss": -6.575167179107666, "global_step": 138864, "epoch": 3306} {"train_loss": -6.654870986938477, "global_step": 138865, "epoch": 3306} {"train_loss": -6.786416530609131, "global_step": 138866, "epoch": 3306} {"train_loss": -6.749154090881348, "global_step": 138867, "epoch": 3306} {"train_loss": -6.752185821533203, "global_step": 138868, "epoch": 3306} {"train_loss": -6.83323860168457, "global_step": 138869, "epoch": 3306} {"train_loss": -6.719979286193848, "global_step": 138870, "epoch": 3306} {"train_loss": -6.6822919845581055, "global_step": 138871, "epoch": 3306} {"train_loss": -6.830355167388916, "global_step": 138872, "epoch": 3306} {"train_loss": -6.796898365020752, "global_step": 138873, "epoch": 3306} {"train_loss": -6.679162979125977, "global_step": 138874, "epoch": 3306} {"train_loss": -6.7509050369262695, "global_step": 138875, "epoch": 3306} {"train_loss": -6.756279945373535, "global_step": 138876, "epoch": 3306} {"train_loss": -6.751609802246094, "global_step": 138877, "epoch": 3306} {"train_loss": -6.682309150695801, "global_step": 138878, "epoch": 3306} {"train_loss": -6.649046421051025, "global_step": 138879, "epoch": 3306} {"train_loss": -6.6988115310668945, "global_step": 138880, "epoch": 3306} {"train_loss": -6.637092113494873, "global_step": 138881, "epoch": 3306} {"train_loss": -6.664178848266602, "global_step": 138882, "epoch": 3306} {"train_loss": -6.644355773925781, "global_step": 138883, "epoch": 3306} {"train_loss": -6.693697929382324, "global_step": 138884, "epoch": 3306} {"train_loss": -6.6935014724731445, "global_step": 138885, "epoch": 3306} {"train_loss": -6.794187068939209, "global_step": 138886, "epoch": 3306} {"train_loss": -6.638969421386719, "global_step": 138887, "epoch": 3306} {"train_loss": -6.681236267089844, "global_step": 138888, "epoch": 3306} {"train_loss": -6.697384834289551, "global_step": 138889, "epoch": 3306} {"train_loss": -6.608137130737305, "global_step": 138890, "epoch": 3306} {"train_loss": -6.702672958374023, "global_step": 138891, "epoch": 3306} {"train_loss": -6.637983322143555, "global_step": 138892, "epoch": 3306} {"train_loss": -6.7024985040937155, "global_step": 138893, "epoch": 3306, "val_loss": 68478.390625} {"train_loss": -6.780184745788574, "global_step": 138894, "epoch": 3307} {"train_loss": -6.788274765014648, "global_step": 138895, "epoch": 3307} {"train_loss": -6.772809982299805, "global_step": 138896, "epoch": 3307} {"train_loss": -6.586652755737305, "global_step": 138897, "epoch": 3307} {"train_loss": -6.6947736740112305, "global_step": 138898, "epoch": 3307} {"train_loss": -6.785834312438965, "global_step": 138899, "epoch": 3307} {"train_loss": -6.656580448150635, "global_step": 138900, "epoch": 3307} {"train_loss": -6.6522111892700195, "global_step": 138901, "epoch": 3307} {"train_loss": -6.662114143371582, "global_step": 138902, "epoch": 3307} {"train_loss": -6.763895511627197, "global_step": 138903, "epoch": 3307} {"train_loss": -6.807553768157959, "global_step": 138904, "epoch": 3307} {"train_loss": -6.6789631843566895, "global_step": 138905, "epoch": 3307} {"train_loss": -6.6818718910217285, "global_step": 138906, "epoch": 3307} {"train_loss": -6.68013858795166, "global_step": 138907, "epoch": 3307} {"train_loss": -6.726442337036133, "global_step": 138908, "epoch": 3307} {"train_loss": -6.76696252822876, "global_step": 138909, "epoch": 3307} {"train_loss": -6.651636123657227, "global_step": 138910, "epoch": 3307} {"train_loss": -6.636777400970459, "global_step": 138911, "epoch": 3307} {"train_loss": -6.702834606170654, "global_step": 138912, "epoch": 3307} {"train_loss": -6.679235458374023, "global_step": 138913, "epoch": 3307} {"train_loss": -6.696392059326172, "global_step": 138914, "epoch": 3307} {"train_loss": -6.564541816711426, "global_step": 138915, "epoch": 3307} {"train_loss": -6.752147197723389, "global_step": 138916, "epoch": 3307} {"train_loss": -6.578266620635986, "global_step": 138917, "epoch": 3307} {"train_loss": -6.636599540710449, "global_step": 138918, "epoch": 3307} {"train_loss": -6.868663787841797, "global_step": 138919, "epoch": 3307} {"train_loss": -6.671274185180664, "global_step": 138920, "epoch": 3307} {"train_loss": -6.719633102416992, "global_step": 138921, "epoch": 3307} {"train_loss": -6.677330493927002, "global_step": 138922, "epoch": 3307} {"train_loss": -6.666047096252441, "global_step": 138923, "epoch": 3307} {"train_loss": -6.707460880279541, "global_step": 138924, "epoch": 3307} {"train_loss": -6.687431812286377, "global_step": 138925, "epoch": 3307} {"train_loss": -6.753592491149902, "global_step": 138926, "epoch": 3307} {"train_loss": -6.6569600105285645, "global_step": 138927, "epoch": 3307} {"train_loss": -6.696633338928223, "global_step": 138928, "epoch": 3307} {"train_loss": -6.672781467437744, "global_step": 138929, "epoch": 3307} {"train_loss": -6.7895283699035645, "global_step": 138930, "epoch": 3307} {"train_loss": -6.692385673522949, "global_step": 138931, "epoch": 3307} {"train_loss": -6.628143310546875, "global_step": 138932, "epoch": 3307} {"train_loss": -6.72889518737793, "global_step": 138933, "epoch": 3307} {"train_loss": -6.657446384429932, "global_step": 138934, "epoch": 3307} {"train_loss": -6.700866608392625, "global_step": 138935, "epoch": 3307, "val_loss": 68461.6484375} {"train_loss": -6.612834453582764, "global_step": 138936, "epoch": 3308} {"train_loss": -6.743067264556885, "global_step": 138937, "epoch": 3308} {"train_loss": -6.761358261108398, "global_step": 138938, "epoch": 3308} {"train_loss": -6.563681602478027, "global_step": 138939, "epoch": 3308} {"train_loss": -6.636052131652832, "global_step": 138940, "epoch": 3308} {"train_loss": -6.700011253356934, "global_step": 138941, "epoch": 3308} {"train_loss": -6.712510585784912, "global_step": 138942, "epoch": 3308} {"train_loss": -6.771933555603027, "global_step": 138943, "epoch": 3308} {"train_loss": -6.635937690734863, "global_step": 138944, "epoch": 3308} {"train_loss": -6.641838073730469, "global_step": 138945, "epoch": 3308} {"train_loss": -6.551905632019043, "global_step": 138946, "epoch": 3308} {"train_loss": -6.609671592712402, "global_step": 138947, "epoch": 3308} {"train_loss": -6.475274085998535, "global_step": 138948, "epoch": 3308} {"train_loss": -6.61287260055542, "global_step": 138949, "epoch": 3308} {"train_loss": -6.712325572967529, "global_step": 138950, "epoch": 3308} {"train_loss": -6.645352840423584, "global_step": 138951, "epoch": 3308} {"train_loss": -6.69912052154541, "global_step": 138952, "epoch": 3308} {"train_loss": -6.642928600311279, "global_step": 138953, "epoch": 3308} {"train_loss": -6.63063907623291, "global_step": 138954, "epoch": 3308} {"train_loss": -6.7587995529174805, "global_step": 138955, "epoch": 3308} {"train_loss": -6.687286376953125, "global_step": 138956, "epoch": 3308} {"train_loss": -6.508688926696777, "global_step": 138957, "epoch": 3308} {"train_loss": -6.647026062011719, "global_step": 138958, "epoch": 3308} {"train_loss": -6.652249813079834, "global_step": 138959, "epoch": 3308} {"train_loss": -6.663725852966309, "global_step": 138960, "epoch": 3308} {"train_loss": -6.728287220001221, "global_step": 138961, "epoch": 3308} {"train_loss": -6.674612045288086, "global_step": 138962, "epoch": 3308} {"train_loss": -6.764520645141602, "global_step": 138963, "epoch": 3308} {"train_loss": -6.689986228942871, "global_step": 138964, "epoch": 3308} {"train_loss": -6.793542861938477, "global_step": 138965, "epoch": 3308} {"train_loss": -6.84809684753418, "global_step": 138966, "epoch": 3308} {"train_loss": -6.7401909828186035, "global_step": 138967, "epoch": 3308} {"train_loss": -6.735603332519531, "global_step": 138968, "epoch": 3308} {"train_loss": -6.643754005432129, "global_step": 138969, "epoch": 3308} {"train_loss": -6.663063049316406, "global_step": 138970, "epoch": 3308} {"train_loss": -6.641605377197266, "global_step": 138971, "epoch": 3308} {"train_loss": -6.819769859313965, "global_step": 138972, "epoch": 3308} {"train_loss": -6.747049808502197, "global_step": 138973, "epoch": 3308} {"train_loss": -6.747474670410156, "global_step": 138974, "epoch": 3308} {"train_loss": -6.597865581512451, "global_step": 138975, "epoch": 3308} {"train_loss": -6.779674530029297, "global_step": 138976, "epoch": 3308} {"train_loss": -6.680780740011306, "global_step": 138977, "epoch": 3308, "val_loss": 68319.671875} {"train_loss": -6.761528968811035, "global_step": 138978, "epoch": 3309} {"train_loss": -6.7071943283081055, "global_step": 138979, "epoch": 3309} {"train_loss": -6.703044891357422, "global_step": 138980, "epoch": 3309} {"train_loss": -6.695451259613037, "global_step": 138981, "epoch": 3309} {"train_loss": -6.68209171295166, "global_step": 138982, "epoch": 3309} {"train_loss": -6.750225067138672, "global_step": 138983, "epoch": 3309} {"train_loss": -6.753523826599121, "global_step": 138984, "epoch": 3309} {"train_loss": -6.731980323791504, "global_step": 138985, "epoch": 3309} {"train_loss": -6.8379316329956055, "global_step": 138986, "epoch": 3309} {"train_loss": -6.660671234130859, "global_step": 138987, "epoch": 3309} {"train_loss": -6.6054887771606445, "global_step": 138988, "epoch": 3309} {"train_loss": -6.756076812744141, "global_step": 138989, "epoch": 3309} {"train_loss": -6.731614112854004, "global_step": 138990, "epoch": 3309} {"train_loss": -6.657827854156494, "global_step": 138991, "epoch": 3309} {"train_loss": -6.729328632354736, "global_step": 138992, "epoch": 3309} {"train_loss": -6.743230819702148, "global_step": 138993, "epoch": 3309} {"train_loss": -6.7025299072265625, "global_step": 138994, "epoch": 3309} {"train_loss": -6.642250061035156, "global_step": 138995, "epoch": 3309} {"train_loss": -6.709150314331055, "global_step": 138996, "epoch": 3309} {"train_loss": -6.693706512451172, "global_step": 138997, "epoch": 3309} {"train_loss": -6.844688415527344, "global_step": 138998, "epoch": 3309} {"train_loss": -6.721809387207031, "global_step": 138999, "epoch": 3309} {"train_loss": -6.75368595123291, "global_step": 139000, "epoch": 3309} {"train_loss": -6.788670539855957, "global_step": 139001, "epoch": 3309} {"train_loss": -6.6731109619140625, "global_step": 139002, "epoch": 3309} {"train_loss": -6.785677433013916, "global_step": 139003, "epoch": 3309} {"train_loss": -6.8321380615234375, "global_step": 139004, "epoch": 3309} {"train_loss": -6.7694196701049805, "global_step": 139005, "epoch": 3309} {"train_loss": -6.756775856018066, "global_step": 139006, "epoch": 3309} {"train_loss": -6.609192848205566, "global_step": 139007, "epoch": 3309} {"train_loss": -6.719170570373535, "global_step": 139008, "epoch": 3309} {"train_loss": -6.765162467956543, "global_step": 139009, "epoch": 3309} {"train_loss": -6.664263725280762, "global_step": 139010, "epoch": 3309} {"train_loss": -6.777496337890625, "global_step": 139011, "epoch": 3309} {"train_loss": -6.766916751861572, "global_step": 139012, "epoch": 3309} {"train_loss": -6.650420188903809, "global_step": 139013, "epoch": 3309} {"train_loss": -6.804629325866699, "global_step": 139014, "epoch": 3309} {"train_loss": -6.672212600708008, "global_step": 139015, "epoch": 3309} {"train_loss": -6.728063583374023, "global_step": 139016, "epoch": 3309} {"train_loss": -6.714385986328125, "global_step": 139017, "epoch": 3309} {"train_loss": -6.577436923980713, "global_step": 139018, "epoch": 3309} {"train_loss": -6.722431773231143, "global_step": 139019, "epoch": 3309, "val_loss": 68197.625} {"train_loss": -6.6953654289245605, "global_step": 139020, "epoch": 3310} {"train_loss": -6.570602893829346, "global_step": 139021, "epoch": 3310} {"train_loss": -6.621200084686279, "global_step": 139022, "epoch": 3310} {"train_loss": -6.565044403076172, "global_step": 139023, "epoch": 3310} {"train_loss": -6.6550798416137695, "global_step": 139024, "epoch": 3310} {"train_loss": -6.788393974304199, "global_step": 139025, "epoch": 3310} {"train_loss": -6.67325496673584, "global_step": 139026, "epoch": 3310} {"train_loss": -6.757251739501953, "global_step": 139027, "epoch": 3310} {"train_loss": -6.757122993469238, "global_step": 139028, "epoch": 3310} {"train_loss": -6.701555252075195, "global_step": 139029, "epoch": 3310} {"train_loss": -6.694975852966309, "global_step": 139030, "epoch": 3310} {"train_loss": -6.787930488586426, "global_step": 139031, "epoch": 3310} {"train_loss": -6.787667274475098, "global_step": 139032, "epoch": 3310} {"train_loss": -6.6240386962890625, "global_step": 139033, "epoch": 3310} {"train_loss": -6.632917881011963, "global_step": 139034, "epoch": 3310} {"train_loss": -6.686652183532715, "global_step": 139035, "epoch": 3310} {"train_loss": -6.708160877227783, "global_step": 139036, "epoch": 3310} {"train_loss": -6.763815879821777, "global_step": 139037, "epoch": 3310} {"train_loss": -6.724641799926758, "global_step": 139038, "epoch": 3310} {"train_loss": -6.816626071929932, "global_step": 139039, "epoch": 3310} {"train_loss": -6.64357852935791, "global_step": 139040, "epoch": 3310} {"train_loss": -6.742833137512207, "global_step": 139041, "epoch": 3310} {"train_loss": -6.757079124450684, "global_step": 139042, "epoch": 3310} {"train_loss": -6.603668689727783, "global_step": 139043, "epoch": 3310} {"train_loss": -6.813758850097656, "global_step": 139044, "epoch": 3310} {"train_loss": -6.663552284240723, "global_step": 139045, "epoch": 3310} {"train_loss": -6.693918228149414, "global_step": 139046, "epoch": 3310} {"train_loss": -6.715703010559082, "global_step": 139047, "epoch": 3310} {"train_loss": -6.768014907836914, "global_step": 139048, "epoch": 3310} {"train_loss": -6.6739397048950195, "global_step": 139049, "epoch": 3310} {"train_loss": -6.682598114013672, "global_step": 139050, "epoch": 3310} {"train_loss": -6.618131160736084, "global_step": 139051, "epoch": 3310} {"train_loss": -6.673291206359863, "global_step": 139052, "epoch": 3310} {"train_loss": -6.623706817626953, "global_step": 139053, "epoch": 3310} {"train_loss": -6.781723976135254, "global_step": 139054, "epoch": 3310} {"train_loss": -6.804727554321289, "global_step": 139055, "epoch": 3310} {"train_loss": -6.7790961265563965, "global_step": 139056, "epoch": 3310} {"train_loss": -6.739610195159912, "global_step": 139057, "epoch": 3310} {"train_loss": -6.689794063568115, "global_step": 139058, "epoch": 3310} {"train_loss": -6.76265811920166, "global_step": 139059, "epoch": 3310} {"train_loss": -6.761430740356445, "global_step": 139060, "epoch": 3310} {"train_loss": -6.707464047840664, "global_step": 139061, "epoch": 3310, "val_loss": 68405.59375} {"train_loss": -6.736376762390137, "global_step": 139062, "epoch": 3311} {"train_loss": -6.744272708892822, "global_step": 139063, "epoch": 3311} {"train_loss": -6.826916694641113, "global_step": 139064, "epoch": 3311} {"train_loss": -6.715245723724365, "global_step": 139065, "epoch": 3311} {"train_loss": -6.738511562347412, "global_step": 139066, "epoch": 3311} {"train_loss": -6.846462249755859, "global_step": 139067, "epoch": 3311} {"train_loss": -6.628871440887451, "global_step": 139068, "epoch": 3311} {"train_loss": -6.729955196380615, "global_step": 139069, "epoch": 3311} {"train_loss": -6.775163173675537, "global_step": 139070, "epoch": 3311} {"train_loss": -6.862912654876709, "global_step": 139071, "epoch": 3311} {"train_loss": -6.812851905822754, "global_step": 139072, "epoch": 3311} {"train_loss": -6.776686668395996, "global_step": 139073, "epoch": 3311} {"train_loss": -6.784134864807129, "global_step": 139074, "epoch": 3311} {"train_loss": -6.8621649742126465, "global_step": 139075, "epoch": 3311} {"train_loss": -6.718371391296387, "global_step": 139076, "epoch": 3311} {"train_loss": -6.729580879211426, "global_step": 139077, "epoch": 3311} {"train_loss": -6.693195343017578, "global_step": 139078, "epoch": 3311} {"train_loss": -6.69456672668457, "global_step": 139079, "epoch": 3311} {"train_loss": -6.806288719177246, "global_step": 139080, "epoch": 3311} {"train_loss": -6.68443489074707, "global_step": 139081, "epoch": 3311} {"train_loss": -6.710638046264648, "global_step": 139082, "epoch": 3311} {"train_loss": -6.669012069702148, "global_step": 139083, "epoch": 3311} {"train_loss": -6.7206220626831055, "global_step": 139084, "epoch": 3311} {"train_loss": -6.793426513671875, "global_step": 139085, "epoch": 3311} {"train_loss": -6.818696975708008, "global_step": 139086, "epoch": 3311} {"train_loss": -6.779195785522461, "global_step": 139087, "epoch": 3311} {"train_loss": -6.870097637176514, "global_step": 139088, "epoch": 3311} {"train_loss": -6.675682067871094, "global_step": 139089, "epoch": 3311} {"train_loss": -6.77497673034668, "global_step": 139090, "epoch": 3311} {"train_loss": -6.782534599304199, "global_step": 139091, "epoch": 3311} {"train_loss": -6.700510025024414, "global_step": 139092, "epoch": 3311} {"train_loss": -6.729583263397217, "global_step": 139093, "epoch": 3311} {"train_loss": -6.706364154815674, "global_step": 139094, "epoch": 3311} {"train_loss": -6.784999847412109, "global_step": 139095, "epoch": 3311} {"train_loss": -6.819887161254883, "global_step": 139096, "epoch": 3311} {"train_loss": -6.731139659881592, "global_step": 139097, "epoch": 3311} {"train_loss": -6.692160606384277, "global_step": 139098, "epoch": 3311} {"train_loss": -6.675178527832031, "global_step": 139099, "epoch": 3311} {"train_loss": -6.594731330871582, "global_step": 139100, "epoch": 3311} {"train_loss": -6.704767227172852, "global_step": 139101, "epoch": 3311} {"train_loss": -6.718785285949707, "global_step": 139102, "epoch": 3311} {"train_loss": -6.744306121553693, "global_step": 139103, "epoch": 3311, "val_loss": 68373.78125} {"train_loss": -6.5765180587768555, "global_step": 139104, "epoch": 3312} {"train_loss": -6.67300271987915, "global_step": 139105, "epoch": 3312} {"train_loss": -6.551785469055176, "global_step": 139106, "epoch": 3312} {"train_loss": -6.487635612487793, "global_step": 139107, "epoch": 3312} {"train_loss": -6.710576057434082, "global_step": 139108, "epoch": 3312} {"train_loss": -6.585957050323486, "global_step": 139109, "epoch": 3312} {"train_loss": -6.6134796142578125, "global_step": 139110, "epoch": 3312} {"train_loss": -6.5831146240234375, "global_step": 139111, "epoch": 3312} {"train_loss": -6.763181209564209, "global_step": 139112, "epoch": 3312} {"train_loss": -6.617402076721191, "global_step": 139113, "epoch": 3312} {"train_loss": -6.73097038269043, "global_step": 139114, "epoch": 3312} {"train_loss": -6.720419883728027, "global_step": 139115, "epoch": 3312} {"train_loss": -6.558338165283203, "global_step": 139116, "epoch": 3312} {"train_loss": -6.716658592224121, "global_step": 139117, "epoch": 3312} {"train_loss": -6.646331787109375, "global_step": 139118, "epoch": 3312} {"train_loss": -6.701657772064209, "global_step": 139119, "epoch": 3312} {"train_loss": -6.568288326263428, "global_step": 139120, "epoch": 3312} {"train_loss": -6.710978984832764, "global_step": 139121, "epoch": 3312} {"train_loss": -6.587375164031982, "global_step": 139122, "epoch": 3312} {"train_loss": -6.686761856079102, "global_step": 139123, "epoch": 3312} {"train_loss": -6.596460819244385, "global_step": 139124, "epoch": 3312} {"train_loss": -6.582136154174805, "global_step": 139125, "epoch": 3312} {"train_loss": -6.683218479156494, "global_step": 139126, "epoch": 3312} {"train_loss": -6.651093482971191, "global_step": 139127, "epoch": 3312} {"train_loss": -6.527416229248047, "global_step": 139128, "epoch": 3312} {"train_loss": -6.469171524047852, "global_step": 139129, "epoch": 3312} {"train_loss": -6.727973937988281, "global_step": 139130, "epoch": 3312} {"train_loss": -6.598564624786377, "global_step": 139131, "epoch": 3312} {"train_loss": -6.709717750549316, "global_step": 139132, "epoch": 3312} {"train_loss": -6.4949822425842285, "global_step": 139133, "epoch": 3312} {"train_loss": -6.50191068649292, "global_step": 139134, "epoch": 3312} {"train_loss": -6.674452304840088, "global_step": 139135, "epoch": 3312} {"train_loss": -6.692661762237549, "global_step": 139136, "epoch": 3312} {"train_loss": -6.676030158996582, "global_step": 139137, "epoch": 3312} {"train_loss": -6.6983184814453125, "global_step": 139138, "epoch": 3312} {"train_loss": -6.699512481689453, "global_step": 139139, "epoch": 3312} {"train_loss": -6.753451824188232, "global_step": 139140, "epoch": 3312} {"train_loss": -6.56803035736084, "global_step": 139141, "epoch": 3312} {"train_loss": -6.71521520614624, "global_step": 139142, "epoch": 3312} {"train_loss": -6.759808540344238, "global_step": 139143, "epoch": 3312} {"train_loss": -6.691364288330078, "global_step": 139144, "epoch": 3312} {"train_loss": -6.640999419348581, "global_step": 139145, "epoch": 3312, "val_loss": 68298.421875} {"train_loss": -6.629033088684082, "global_step": 139146, "epoch": 3313} {"train_loss": -6.738690376281738, "global_step": 139147, "epoch": 3313} {"train_loss": -6.692368507385254, "global_step": 139148, "epoch": 3313} {"train_loss": -6.69287109375, "global_step": 139149, "epoch": 3313} {"train_loss": -6.6466474533081055, "global_step": 139150, "epoch": 3313} {"train_loss": -6.637096405029297, "global_step": 139151, "epoch": 3313} {"train_loss": -6.693214416503906, "global_step": 139152, "epoch": 3313} {"train_loss": -6.719423294067383, "global_step": 139153, "epoch": 3313} {"train_loss": -6.698202610015869, "global_step": 139154, "epoch": 3313} {"train_loss": -6.754375457763672, "global_step": 139155, "epoch": 3313} {"train_loss": -6.729644775390625, "global_step": 139156, "epoch": 3313} {"train_loss": -6.64149284362793, "global_step": 139157, "epoch": 3313} {"train_loss": -6.7465715408325195, "global_step": 139158, "epoch": 3313} {"train_loss": -6.715049743652344, "global_step": 139159, "epoch": 3313} {"train_loss": -6.877932548522949, "global_step": 139160, "epoch": 3313} {"train_loss": -6.495569229125977, "global_step": 139161, "epoch": 3313} {"train_loss": -6.80447244644165, "global_step": 139162, "epoch": 3313} {"train_loss": -6.671045303344727, "global_step": 139163, "epoch": 3313} {"train_loss": -6.474643707275391, "global_step": 139164, "epoch": 3313} {"train_loss": -6.692522048950195, "global_step": 139165, "epoch": 3313} {"train_loss": -6.794405460357666, "global_step": 139166, "epoch": 3313} {"train_loss": -6.712169647216797, "global_step": 139167, "epoch": 3313} {"train_loss": -6.705405235290527, "global_step": 139168, "epoch": 3313} {"train_loss": -6.569973468780518, "global_step": 139169, "epoch": 3313} {"train_loss": -6.694096088409424, "global_step": 139170, "epoch": 3313} {"train_loss": -6.60689640045166, "global_step": 139171, "epoch": 3313} {"train_loss": -6.666078090667725, "global_step": 139172, "epoch": 3313} {"train_loss": -6.725492477416992, "global_step": 139173, "epoch": 3313} {"train_loss": -6.6228766441345215, "global_step": 139174, "epoch": 3313} {"train_loss": -6.631272315979004, "global_step": 139175, "epoch": 3313} {"train_loss": -6.692819595336914, "global_step": 139176, "epoch": 3313} {"train_loss": -6.861894130706787, "global_step": 139177, "epoch": 3313} {"train_loss": -6.674421310424805, "global_step": 139178, "epoch": 3313} {"train_loss": -6.682003974914551, "global_step": 139179, "epoch": 3313} {"train_loss": -6.686793327331543, "global_step": 139180, "epoch": 3313} {"train_loss": -6.70121955871582, "global_step": 139181, "epoch": 3313} {"train_loss": -6.690914154052734, "global_step": 139182, "epoch": 3313} {"train_loss": -6.649669170379639, "global_step": 139183, "epoch": 3313} {"train_loss": -6.743442058563232, "global_step": 139184, "epoch": 3313} {"train_loss": -6.664794445037842, "global_step": 139185, "epoch": 3313} {"train_loss": -6.626088619232178, "global_step": 139186, "epoch": 3313} {"train_loss": -6.688090415227981, "global_step": 139187, "epoch": 3313, "val_loss": 68323.46875} {"train_loss": -6.7110748291015625, "global_step": 139188, "epoch": 3314} {"train_loss": -6.739257335662842, "global_step": 139189, "epoch": 3314} {"train_loss": -6.711201190948486, "global_step": 139190, "epoch": 3314} {"train_loss": -6.735414981842041, "global_step": 139191, "epoch": 3314} {"train_loss": -6.718409538269043, "global_step": 139192, "epoch": 3314} {"train_loss": -6.672634124755859, "global_step": 139193, "epoch": 3314} {"train_loss": -6.714959144592285, "global_step": 139194, "epoch": 3314} {"train_loss": -6.616674423217773, "global_step": 139195, "epoch": 3314} {"train_loss": -6.712718963623047, "global_step": 139196, "epoch": 3314} {"train_loss": -6.7063446044921875, "global_step": 139197, "epoch": 3314} {"train_loss": -6.809429168701172, "global_step": 139198, "epoch": 3314} {"train_loss": -6.747645854949951, "global_step": 139199, "epoch": 3314} {"train_loss": -6.656497001647949, "global_step": 139200, "epoch": 3314} {"train_loss": -6.72455358505249, "global_step": 139201, "epoch": 3314} {"train_loss": -6.73699951171875, "global_step": 139202, "epoch": 3314} {"train_loss": -6.794181823730469, "global_step": 139203, "epoch": 3314} {"train_loss": -6.832437992095947, "global_step": 139204, "epoch": 3314} {"train_loss": -6.630862236022949, "global_step": 139205, "epoch": 3314} {"train_loss": -6.754131317138672, "global_step": 139206, "epoch": 3314} {"train_loss": -6.756925582885742, "global_step": 139207, "epoch": 3314} {"train_loss": -6.648190498352051, "global_step": 139208, "epoch": 3314} {"train_loss": -6.766844749450684, "global_step": 139209, "epoch": 3314} {"train_loss": -6.610755920410156, "global_step": 139210, "epoch": 3314} {"train_loss": -6.823511123657227, "global_step": 139211, "epoch": 3314} {"train_loss": -6.692450523376465, "global_step": 139212, "epoch": 3314} {"train_loss": -6.662744522094727, "global_step": 139213, "epoch": 3314} {"train_loss": -6.9452714920043945, "global_step": 139214, "epoch": 3314} {"train_loss": -6.7855610847473145, "global_step": 139215, "epoch": 3314} {"train_loss": -6.702925682067871, "global_step": 139216, "epoch": 3314} {"train_loss": -6.685421943664551, "global_step": 139217, "epoch": 3314} {"train_loss": -6.737724781036377, "global_step": 139218, "epoch": 3314} {"train_loss": -6.7924957275390625, "global_step": 139219, "epoch": 3314} {"train_loss": -6.7054033279418945, "global_step": 139220, "epoch": 3314} {"train_loss": -6.6235270500183105, "global_step": 139221, "epoch": 3314} {"train_loss": -6.665071487426758, "global_step": 139222, "epoch": 3314} {"train_loss": -6.743990421295166, "global_step": 139223, "epoch": 3314} {"train_loss": -6.551056861877441, "global_step": 139224, "epoch": 3314} {"train_loss": -6.6375627517700195, "global_step": 139225, "epoch": 3314} {"train_loss": -6.535157203674316, "global_step": 139226, "epoch": 3314} {"train_loss": -6.590471267700195, "global_step": 139227, "epoch": 3314} {"train_loss": -6.677613258361816, "global_step": 139228, "epoch": 3314} {"train_loss": -6.702787070047288, "global_step": 139229, "epoch": 3314, "val_loss": 68469.453125} {"train_loss": -6.624356269836426, "global_step": 139230, "epoch": 3315} {"train_loss": -6.578624725341797, "global_step": 139231, "epoch": 3315} {"train_loss": -6.612689018249512, "global_step": 139232, "epoch": 3315} {"train_loss": -6.726888179779053, "global_step": 139233, "epoch": 3315} {"train_loss": -6.591099739074707, "global_step": 139234, "epoch": 3315} {"train_loss": -6.621840000152588, "global_step": 139235, "epoch": 3315} {"train_loss": -6.639153957366943, "global_step": 139236, "epoch": 3315} {"train_loss": -6.650617599487305, "global_step": 139237, "epoch": 3315} {"train_loss": -6.795011520385742, "global_step": 139238, "epoch": 3315} {"train_loss": -6.642831802368164, "global_step": 139239, "epoch": 3315} {"train_loss": -6.595147609710693, "global_step": 139240, "epoch": 3315} {"train_loss": -6.6590471267700195, "global_step": 139241, "epoch": 3315} {"train_loss": -6.6764326095581055, "global_step": 139242, "epoch": 3315} {"train_loss": -6.744818687438965, "global_step": 139243, "epoch": 3315} {"train_loss": -6.754123687744141, "global_step": 139244, "epoch": 3315} {"train_loss": -6.77641487121582, "global_step": 139245, "epoch": 3315} {"train_loss": -6.720822334289551, "global_step": 139246, "epoch": 3315} {"train_loss": -6.714689254760742, "global_step": 139247, "epoch": 3315} {"train_loss": -6.713205337524414, "global_step": 139248, "epoch": 3315} {"train_loss": -6.699739933013916, "global_step": 139249, "epoch": 3315} {"train_loss": -6.769476413726807, "global_step": 139250, "epoch": 3315} {"train_loss": -6.660676956176758, "global_step": 139251, "epoch": 3315} {"train_loss": -6.738168239593506, "global_step": 139252, "epoch": 3315} {"train_loss": -6.721445083618164, "global_step": 139253, "epoch": 3315} {"train_loss": -6.652863502502441, "global_step": 139254, "epoch": 3315} {"train_loss": -6.570441246032715, "global_step": 139255, "epoch": 3315} {"train_loss": -6.726154327392578, "global_step": 139256, "epoch": 3315} {"train_loss": -6.71454381942749, "global_step": 139257, "epoch": 3315} {"train_loss": -6.833335876464844, "global_step": 139258, "epoch": 3315} {"train_loss": -6.7520751953125, "global_step": 139259, "epoch": 3315} {"train_loss": -6.650973796844482, "global_step": 139260, "epoch": 3315} {"train_loss": -6.7799601554870605, "global_step": 139261, "epoch": 3315} {"train_loss": -6.70644474029541, "global_step": 139262, "epoch": 3315} {"train_loss": -6.791376113891602, "global_step": 139263, "epoch": 3315} {"train_loss": -6.650019645690918, "global_step": 139264, "epoch": 3315} {"train_loss": -6.745964050292969, "global_step": 139265, "epoch": 3315} {"train_loss": -6.849884033203125, "global_step": 139266, "epoch": 3315} {"train_loss": -6.732264518737793, "global_step": 139267, "epoch": 3315} {"train_loss": -6.765536308288574, "global_step": 139268, "epoch": 3315} {"train_loss": -6.754147052764893, "global_step": 139269, "epoch": 3315} {"train_loss": -6.77852725982666, "global_step": 139270, "epoch": 3315} {"train_loss": -6.702128376279559, "global_step": 139271, "epoch": 3315, "val_loss": 68340.7109375} {"train_loss": -6.603941440582275, "global_step": 139272, "epoch": 3316} {"train_loss": -6.849024772644043, "global_step": 139273, "epoch": 3316} {"train_loss": -6.779997825622559, "global_step": 139274, "epoch": 3316} {"train_loss": -6.879366874694824, "global_step": 139275, "epoch": 3316} {"train_loss": -6.649120330810547, "global_step": 139276, "epoch": 3316} {"train_loss": -6.755268096923828, "global_step": 139277, "epoch": 3316} {"train_loss": -6.69175910949707, "global_step": 139278, "epoch": 3316} {"train_loss": -6.693289756774902, "global_step": 139279, "epoch": 3316} {"train_loss": -6.66770076751709, "global_step": 139280, "epoch": 3316} {"train_loss": -6.645133972167969, "global_step": 139281, "epoch": 3316} {"train_loss": -6.77473258972168, "global_step": 139282, "epoch": 3316} {"train_loss": -6.660942077636719, "global_step": 139283, "epoch": 3316} {"train_loss": -6.735170364379883, "global_step": 139284, "epoch": 3316} {"train_loss": -6.722629070281982, "global_step": 139285, "epoch": 3316} {"train_loss": -6.687283039093018, "global_step": 139286, "epoch": 3316} {"train_loss": -6.696332931518555, "global_step": 139287, "epoch": 3316} {"train_loss": -6.708349227905273, "global_step": 139288, "epoch": 3316} {"train_loss": -6.661880016326904, "global_step": 139289, "epoch": 3316} {"train_loss": -6.65330171585083, "global_step": 139290, "epoch": 3316} {"train_loss": -6.649211883544922, "global_step": 139291, "epoch": 3316} {"train_loss": -6.66367769241333, "global_step": 139292, "epoch": 3316} {"train_loss": -6.6207122802734375, "global_step": 139293, "epoch": 3316} {"train_loss": -6.645448684692383, "global_step": 139294, "epoch": 3316} {"train_loss": -6.670421600341797, "global_step": 139295, "epoch": 3316} {"train_loss": -6.730762958526611, "global_step": 139296, "epoch": 3316} {"train_loss": -6.594030857086182, "global_step": 139297, "epoch": 3316} {"train_loss": -6.656959533691406, "global_step": 139298, "epoch": 3316} {"train_loss": -6.688425540924072, "global_step": 139299, "epoch": 3316} {"train_loss": -6.620769500732422, "global_step": 139300, "epoch": 3316} {"train_loss": -6.731927871704102, "global_step": 139301, "epoch": 3316} {"train_loss": -6.698092460632324, "global_step": 139302, "epoch": 3316} {"train_loss": -6.703620910644531, "global_step": 139303, "epoch": 3316} {"train_loss": -6.70976448059082, "global_step": 139304, "epoch": 3316} {"train_loss": -6.585980415344238, "global_step": 139305, "epoch": 3316} {"train_loss": -6.578526496887207, "global_step": 139306, "epoch": 3316} {"train_loss": -6.585475921630859, "global_step": 139307, "epoch": 3316} {"train_loss": -6.582160949707031, "global_step": 139308, "epoch": 3316} {"train_loss": -6.687055587768555, "global_step": 139309, "epoch": 3316} {"train_loss": -6.610803604125977, "global_step": 139310, "epoch": 3316} {"train_loss": -6.600689888000488, "global_step": 139311, "epoch": 3316} {"train_loss": -6.567814826965332, "global_step": 139312, "epoch": 3316} {"train_loss": -6.675589958826701, "global_step": 139313, "epoch": 3316, "val_loss": 68349.828125} {"train_loss": -6.699803352355957, "global_step": 139314, "epoch": 3317} {"train_loss": -6.625732421875, "global_step": 139315, "epoch": 3317} {"train_loss": -6.695993423461914, "global_step": 139316, "epoch": 3317} {"train_loss": -6.680517196655273, "global_step": 139317, "epoch": 3317} {"train_loss": -6.776281356811523, "global_step": 139318, "epoch": 3317} {"train_loss": -6.691051483154297, "global_step": 139319, "epoch": 3317} {"train_loss": -6.6753644943237305, "global_step": 139320, "epoch": 3317} {"train_loss": -6.709598541259766, "global_step": 139321, "epoch": 3317} {"train_loss": -6.666064262390137, "global_step": 139322, "epoch": 3317} {"train_loss": -6.687515735626221, "global_step": 139323, "epoch": 3317} {"train_loss": -6.635621070861816, "global_step": 139324, "epoch": 3317} {"train_loss": -6.709187030792236, "global_step": 139325, "epoch": 3317} {"train_loss": -6.68098258972168, "global_step": 139326, "epoch": 3317} {"train_loss": -6.842029094696045, "global_step": 139327, "epoch": 3317} {"train_loss": -6.685967922210693, "global_step": 139328, "epoch": 3317} {"train_loss": -6.6401591300964355, "global_step": 139329, "epoch": 3317} {"train_loss": -6.67106819152832, "global_step": 139330, "epoch": 3317} {"train_loss": -6.765091419219971, "global_step": 139331, "epoch": 3317} {"train_loss": -6.73546028137207, "global_step": 139332, "epoch": 3317} {"train_loss": -6.758262634277344, "global_step": 139333, "epoch": 3317} {"train_loss": -6.784502029418945, "global_step": 139334, "epoch": 3317} {"train_loss": -6.667160987854004, "global_step": 139335, "epoch": 3317} {"train_loss": -6.704927444458008, "global_step": 139336, "epoch": 3317} {"train_loss": -6.78237771987915, "global_step": 139337, "epoch": 3317} {"train_loss": -6.7135009765625, "global_step": 139338, "epoch": 3317} {"train_loss": -6.788782119750977, "global_step": 139339, "epoch": 3317} {"train_loss": -6.793866157531738, "global_step": 139340, "epoch": 3317} {"train_loss": -6.711857318878174, "global_step": 139341, "epoch": 3317} {"train_loss": -6.666942119598389, "global_step": 139342, "epoch": 3317} {"train_loss": -6.804634094238281, "global_step": 139343, "epoch": 3317} {"train_loss": -6.675933837890625, "global_step": 139344, "epoch": 3317} {"train_loss": -6.680667877197266, "global_step": 139345, "epoch": 3317} {"train_loss": -6.656674861907959, "global_step": 139346, "epoch": 3317} {"train_loss": -6.687848091125488, "global_step": 139347, "epoch": 3317} {"train_loss": -6.631260395050049, "global_step": 139348, "epoch": 3317} {"train_loss": -6.606266975402832, "global_step": 139349, "epoch": 3317} {"train_loss": -6.726635456085205, "global_step": 139350, "epoch": 3317} {"train_loss": -6.599175453186035, "global_step": 139351, "epoch": 3317} {"train_loss": -6.567852973937988, "global_step": 139352, "epoch": 3317} {"train_loss": -6.529478073120117, "global_step": 139353, "epoch": 3317} {"train_loss": -6.5432000160217285, "global_step": 139354, "epoch": 3317} {"train_loss": -6.688357307797387, "global_step": 139355, "epoch": 3317, "val_loss": 68423.7265625} {"train_loss": -6.724770545959473, "global_step": 139356, "epoch": 3318} {"train_loss": -6.6603684425354, "global_step": 139357, "epoch": 3318} {"train_loss": -6.677509307861328, "global_step": 139358, "epoch": 3318} {"train_loss": -6.660947799682617, "global_step": 139359, "epoch": 3318} {"train_loss": -6.7206525802612305, "global_step": 139360, "epoch": 3318} {"train_loss": -6.619682312011719, "global_step": 139361, "epoch": 3318} {"train_loss": -6.70292854309082, "global_step": 139362, "epoch": 3318} {"train_loss": -6.750855922698975, "global_step": 139363, "epoch": 3318} {"train_loss": -6.656742095947266, "global_step": 139364, "epoch": 3318} {"train_loss": -6.6969804763793945, "global_step": 139365, "epoch": 3318} {"train_loss": -6.601349830627441, "global_step": 139366, "epoch": 3318} {"train_loss": -6.755770683288574, "global_step": 139367, "epoch": 3318} {"train_loss": -6.633271217346191, "global_step": 139368, "epoch": 3318} {"train_loss": -6.623557090759277, "global_step": 139369, "epoch": 3318} {"train_loss": -6.703883171081543, "global_step": 139370, "epoch": 3318} {"train_loss": -6.68110990524292, "global_step": 139371, "epoch": 3318} {"train_loss": -6.738327980041504, "global_step": 139372, "epoch": 3318} {"train_loss": -6.7466936111450195, "global_step": 139373, "epoch": 3318} {"train_loss": -6.806896686553955, "global_step": 139374, "epoch": 3318} {"train_loss": -6.733222961425781, "global_step": 139375, "epoch": 3318} {"train_loss": -6.7614898681640625, "global_step": 139376, "epoch": 3318} {"train_loss": -6.694066524505615, "global_step": 139377, "epoch": 3318} {"train_loss": -6.683260917663574, "global_step": 139378, "epoch": 3318} {"train_loss": -6.749666690826416, "global_step": 139379, "epoch": 3318} {"train_loss": -6.697516441345215, "global_step": 139380, "epoch": 3318} {"train_loss": -6.7276458740234375, "global_step": 139381, "epoch": 3318} {"train_loss": -6.749423503875732, "global_step": 139382, "epoch": 3318} {"train_loss": -6.677923202514648, "global_step": 139383, "epoch": 3318} {"train_loss": -6.754766941070557, "global_step": 139384, "epoch": 3318} {"train_loss": -6.731501579284668, "global_step": 139385, "epoch": 3318} {"train_loss": -6.733023643493652, "global_step": 139386, "epoch": 3318} {"train_loss": -6.740689277648926, "global_step": 139387, "epoch": 3318} {"train_loss": -6.822482109069824, "global_step": 139388, "epoch": 3318} {"train_loss": -6.739911079406738, "global_step": 139389, "epoch": 3318} {"train_loss": -6.861315727233887, "global_step": 139390, "epoch": 3318} {"train_loss": -6.712769985198975, "global_step": 139391, "epoch": 3318} {"train_loss": -6.695038795471191, "global_step": 139392, "epoch": 3318} {"train_loss": -6.7159295082092285, "global_step": 139393, "epoch": 3318} {"train_loss": -6.6417083740234375, "global_step": 139394, "epoch": 3318} {"train_loss": -6.650796890258789, "global_step": 139395, "epoch": 3318} {"train_loss": -6.838583946228027, "global_step": 139396, "epoch": 3318} {"train_loss": -6.714093480791364, "global_step": 139397, "epoch": 3318, "val_loss": 68342.5078125} {"train_loss": -6.756161689758301, "global_step": 139398, "epoch": 3319} {"train_loss": -6.832940101623535, "global_step": 139399, "epoch": 3319} {"train_loss": -6.779706954956055, "global_step": 139400, "epoch": 3319} {"train_loss": -6.6587629318237305, "global_step": 139401, "epoch": 3319} {"train_loss": -6.748870849609375, "global_step": 139402, "epoch": 3319} {"train_loss": -6.731047630310059, "global_step": 139403, "epoch": 3319} {"train_loss": -6.842280864715576, "global_step": 139404, "epoch": 3319} {"train_loss": -6.6230998039245605, "global_step": 139405, "epoch": 3319} {"train_loss": -6.8241682052612305, "global_step": 139406, "epoch": 3319} {"train_loss": -6.702129364013672, "global_step": 139407, "epoch": 3319} {"train_loss": -6.762540817260742, "global_step": 139408, "epoch": 3319} {"train_loss": -6.74800968170166, "global_step": 139409, "epoch": 3319} {"train_loss": -6.782635688781738, "global_step": 139410, "epoch": 3319} {"train_loss": -6.766100883483887, "global_step": 139411, "epoch": 3319} {"train_loss": -6.838000297546387, "global_step": 139412, "epoch": 3319} {"train_loss": -6.742175102233887, "global_step": 139413, "epoch": 3319} {"train_loss": -6.806243896484375, "global_step": 139414, "epoch": 3319} {"train_loss": -6.694224834442139, "global_step": 139415, "epoch": 3319} {"train_loss": -6.697124481201172, "global_step": 139416, "epoch": 3319} {"train_loss": -6.776361465454102, "global_step": 139417, "epoch": 3319} {"train_loss": -6.674619674682617, "global_step": 139418, "epoch": 3319} {"train_loss": -6.696585178375244, "global_step": 139419, "epoch": 3319} {"train_loss": -6.642999172210693, "global_step": 139420, "epoch": 3319} {"train_loss": -6.632971286773682, "global_step": 139421, "epoch": 3319} {"train_loss": -6.7849440574646, "global_step": 139422, "epoch": 3319} {"train_loss": -6.524019718170166, "global_step": 139423, "epoch": 3319} {"train_loss": -6.644709587097168, "global_step": 139424, "epoch": 3319} {"train_loss": -6.587517261505127, "global_step": 139425, "epoch": 3319} {"train_loss": -6.556450366973877, "global_step": 139426, "epoch": 3319} {"train_loss": -6.635720252990723, "global_step": 139427, "epoch": 3319} {"train_loss": -6.464433670043945, "global_step": 139428, "epoch": 3319} {"train_loss": -6.697630405426025, "global_step": 139429, "epoch": 3319} {"train_loss": -6.513998508453369, "global_step": 139430, "epoch": 3319} {"train_loss": -6.634241104125977, "global_step": 139431, "epoch": 3319} {"train_loss": -6.6160502433776855, "global_step": 139432, "epoch": 3319} {"train_loss": -6.649632453918457, "global_step": 139433, "epoch": 3319} {"train_loss": -6.679455757141113, "global_step": 139434, "epoch": 3319} {"train_loss": -6.529699325561523, "global_step": 139435, "epoch": 3319} {"train_loss": -6.678727149963379, "global_step": 139436, "epoch": 3319} {"train_loss": -6.6377668380737305, "global_step": 139437, "epoch": 3319} {"train_loss": -6.755640029907227, "global_step": 139438, "epoch": 3319} {"train_loss": -6.69167483420599, "global_step": 139439, "epoch": 3319, "val_loss": 68325.328125} {"train_loss": -6.6862311363220215, "global_step": 139440, "epoch": 3320} {"train_loss": -6.638896465301514, "global_step": 139441, "epoch": 3320} {"train_loss": -6.669718265533447, "global_step": 139442, "epoch": 3320} {"train_loss": -6.650745868682861, "global_step": 139443, "epoch": 3320} {"train_loss": -6.665749549865723, "global_step": 139444, "epoch": 3320} {"train_loss": -6.5681915283203125, "global_step": 139445, "epoch": 3320} {"train_loss": -6.713301658630371, "global_step": 139446, "epoch": 3320} {"train_loss": -6.764076232910156, "global_step": 139447, "epoch": 3320} {"train_loss": -6.7527689933776855, "global_step": 139448, "epoch": 3320} {"train_loss": -6.698846340179443, "global_step": 139449, "epoch": 3320} {"train_loss": -6.556057929992676, "global_step": 139450, "epoch": 3320} {"train_loss": -6.796511650085449, "global_step": 139451, "epoch": 3320} {"train_loss": -6.627363204956055, "global_step": 139452, "epoch": 3320} {"train_loss": -6.72722864151001, "global_step": 139453, "epoch": 3320} {"train_loss": -6.8529815673828125, "global_step": 139454, "epoch": 3320} {"train_loss": -6.59144401550293, "global_step": 139455, "epoch": 3320} {"train_loss": -6.5906267166137695, "global_step": 139456, "epoch": 3320} {"train_loss": -6.659564018249512, "global_step": 139457, "epoch": 3320} {"train_loss": -6.645964622497559, "global_step": 139458, "epoch": 3320} {"train_loss": -6.646025657653809, "global_step": 139459, "epoch": 3320} {"train_loss": -6.710119247436523, "global_step": 139460, "epoch": 3320} {"train_loss": -6.725594520568848, "global_step": 139461, "epoch": 3320} {"train_loss": -6.654158592224121, "global_step": 139462, "epoch": 3320} {"train_loss": -6.738003730773926, "global_step": 139463, "epoch": 3320} {"train_loss": -6.732318878173828, "global_step": 139464, "epoch": 3320} {"train_loss": -6.8318281173706055, "global_step": 139465, "epoch": 3320} {"train_loss": -6.617487907409668, "global_step": 139466, "epoch": 3320} {"train_loss": -6.7680816650390625, "global_step": 139467, "epoch": 3320} {"train_loss": -6.709319114685059, "global_step": 139468, "epoch": 3320} {"train_loss": -6.7198991775512695, "global_step": 139469, "epoch": 3320} {"train_loss": -6.6718549728393555, "global_step": 139470, "epoch": 3320} {"train_loss": -6.724178314208984, "global_step": 139471, "epoch": 3320} {"train_loss": -6.806020736694336, "global_step": 139472, "epoch": 3320} {"train_loss": -6.728132247924805, "global_step": 139473, "epoch": 3320} {"train_loss": -6.687504768371582, "global_step": 139474, "epoch": 3320} {"train_loss": -6.676770210266113, "global_step": 139475, "epoch": 3320} {"train_loss": -6.7394890785217285, "global_step": 139476, "epoch": 3320} {"train_loss": -6.632745742797852, "global_step": 139477, "epoch": 3320} {"train_loss": -6.597099304199219, "global_step": 139478, "epoch": 3320} {"train_loss": -6.850780487060547, "global_step": 139479, "epoch": 3320} {"train_loss": -6.483306884765625, "global_step": 139480, "epoch": 3320} {"train_loss": -6.6904843761807395, "global_step": 139481, "epoch": 3320, "val_loss": 68320.640625} {"train_loss": -6.686986446380615, "global_step": 139482, "epoch": 3321} {"train_loss": -6.634278774261475, "global_step": 139483, "epoch": 3321} {"train_loss": -6.711309432983398, "global_step": 139484, "epoch": 3321} {"train_loss": -6.694465637207031, "global_step": 139485, "epoch": 3321} {"train_loss": -6.641594409942627, "global_step": 139486, "epoch": 3321} {"train_loss": -6.651623725891113, "global_step": 139487, "epoch": 3321} {"train_loss": -6.707427978515625, "global_step": 139488, "epoch": 3321} {"train_loss": -6.634063243865967, "global_step": 139489, "epoch": 3321} {"train_loss": -6.729526996612549, "global_step": 139490, "epoch": 3321} {"train_loss": -6.733613014221191, "global_step": 139491, "epoch": 3321} {"train_loss": -6.504326343536377, "global_step": 139492, "epoch": 3321} {"train_loss": -6.788532257080078, "global_step": 139493, "epoch": 3321} {"train_loss": -6.6530256271362305, "global_step": 139494, "epoch": 3321} {"train_loss": -6.747565269470215, "global_step": 139495, "epoch": 3321} {"train_loss": -6.7163920402526855, "global_step": 139496, "epoch": 3321} {"train_loss": -6.653521537780762, "global_step": 139497, "epoch": 3321} {"train_loss": -6.68093729019165, "global_step": 139498, "epoch": 3321} {"train_loss": -6.662860870361328, "global_step": 139499, "epoch": 3321} {"train_loss": -6.744336128234863, "global_step": 139500, "epoch": 3321} {"train_loss": -6.7257819175720215, "global_step": 139501, "epoch": 3321} {"train_loss": -6.742359161376953, "global_step": 139502, "epoch": 3321} {"train_loss": -6.605622291564941, "global_step": 139503, "epoch": 3321} {"train_loss": -6.6048784255981445, "global_step": 139504, "epoch": 3321} {"train_loss": -6.65792179107666, "global_step": 139505, "epoch": 3321} {"train_loss": -6.708765506744385, "global_step": 139506, "epoch": 3321} {"train_loss": -6.600881099700928, "global_step": 139507, "epoch": 3321} {"train_loss": -6.782256126403809, "global_step": 139508, "epoch": 3321} {"train_loss": -6.71210241317749, "global_step": 139509, "epoch": 3321} {"train_loss": -6.70646858215332, "global_step": 139510, "epoch": 3321} {"train_loss": -6.692139625549316, "global_step": 139511, "epoch": 3321} {"train_loss": -6.768499851226807, "global_step": 139512, "epoch": 3321} {"train_loss": -6.623626708984375, "global_step": 139513, "epoch": 3321} {"train_loss": -6.776151657104492, "global_step": 139514, "epoch": 3321} {"train_loss": -6.727720260620117, "global_step": 139515, "epoch": 3321} {"train_loss": -6.798255920410156, "global_step": 139516, "epoch": 3321} {"train_loss": -6.790651321411133, "global_step": 139517, "epoch": 3321} {"train_loss": -6.736262321472168, "global_step": 139518, "epoch": 3321} {"train_loss": -6.718072891235352, "global_step": 139519, "epoch": 3321} {"train_loss": -6.785623550415039, "global_step": 139520, "epoch": 3321} {"train_loss": -6.670223236083984, "global_step": 139521, "epoch": 3321} {"train_loss": -6.730569362640381, "global_step": 139522, "epoch": 3321} {"train_loss": -6.700323331923712, "global_step": 139523, "epoch": 3321, "val_loss": 68149.640625} {"train_loss": -6.708878993988037, "global_step": 139524, "epoch": 3322} {"train_loss": -6.771955490112305, "global_step": 139525, "epoch": 3322} {"train_loss": -6.720898628234863, "global_step": 139526, "epoch": 3322} {"train_loss": -6.805152893066406, "global_step": 139527, "epoch": 3322} {"train_loss": -6.677643299102783, "global_step": 139528, "epoch": 3322} {"train_loss": -6.792928218841553, "global_step": 139529, "epoch": 3322} {"train_loss": -6.8410749435424805, "global_step": 139530, "epoch": 3322} {"train_loss": -6.77474308013916, "global_step": 139531, "epoch": 3322} {"train_loss": -6.787750244140625, "global_step": 139532, "epoch": 3322} {"train_loss": -6.744830131530762, "global_step": 139533, "epoch": 3322} {"train_loss": -6.734655380249023, "global_step": 139534, "epoch": 3322} {"train_loss": -6.658356666564941, "global_step": 139535, "epoch": 3322} {"train_loss": -6.74984073638916, "global_step": 139536, "epoch": 3322} {"train_loss": -6.810977935791016, "global_step": 139537, "epoch": 3322} {"train_loss": -6.628252029418945, "global_step": 139538, "epoch": 3322} {"train_loss": -6.563259124755859, "global_step": 139539, "epoch": 3322} {"train_loss": -6.749163627624512, "global_step": 139540, "epoch": 3322} {"train_loss": -6.61619758605957, "global_step": 139541, "epoch": 3322} {"train_loss": -6.740057468414307, "global_step": 139542, "epoch": 3322} {"train_loss": -6.6965413093566895, "global_step": 139543, "epoch": 3322} {"train_loss": -6.675838470458984, "global_step": 139544, "epoch": 3322} {"train_loss": -6.783048629760742, "global_step": 139545, "epoch": 3322} {"train_loss": -6.83091402053833, "global_step": 139546, "epoch": 3322} {"train_loss": -6.463884353637695, "global_step": 139547, "epoch": 3322} {"train_loss": -6.627953052520752, "global_step": 139548, "epoch": 3322} {"train_loss": -6.645371437072754, "global_step": 139549, "epoch": 3322} {"train_loss": -6.534468650817871, "global_step": 139550, "epoch": 3322} {"train_loss": -6.742803573608398, "global_step": 139551, "epoch": 3322} {"train_loss": -6.755553722381592, "global_step": 139552, "epoch": 3322} {"train_loss": -6.635928630828857, "global_step": 139553, "epoch": 3322} {"train_loss": -6.777419090270996, "global_step": 139554, "epoch": 3322} {"train_loss": -6.540361404418945, "global_step": 139555, "epoch": 3322} {"train_loss": -6.645907402038574, "global_step": 139556, "epoch": 3322} {"train_loss": -6.66229248046875, "global_step": 139557, "epoch": 3322} {"train_loss": -6.764210224151611, "global_step": 139558, "epoch": 3322} {"train_loss": -6.74554967880249, "global_step": 139559, "epoch": 3322} {"train_loss": -6.723816871643066, "global_step": 139560, "epoch": 3322} {"train_loss": -6.708620071411133, "global_step": 139561, "epoch": 3322} {"train_loss": -6.7533392906188965, "global_step": 139562, "epoch": 3322} {"train_loss": -6.697416305541992, "global_step": 139563, "epoch": 3322} {"train_loss": -6.6840643882751465, "global_step": 139564, "epoch": 3322} {"train_loss": -6.709451641355242, "global_step": 139565, "epoch": 3322, "val_loss": 68273.3828125} {"train_loss": -6.697933197021484, "global_step": 139566, "epoch": 3323} {"train_loss": -6.698925018310547, "global_step": 139567, "epoch": 3323} {"train_loss": -6.748566627502441, "global_step": 139568, "epoch": 3323} {"train_loss": -6.651288032531738, "global_step": 139569, "epoch": 3323} {"train_loss": -6.812979698181152, "global_step": 139570, "epoch": 3323} {"train_loss": -6.671381950378418, "global_step": 139571, "epoch": 3323} {"train_loss": -6.79939079284668, "global_step": 139572, "epoch": 3323} {"train_loss": -6.523799419403076, "global_step": 139573, "epoch": 3323} {"train_loss": -6.772480487823486, "global_step": 139574, "epoch": 3323} {"train_loss": -6.666667461395264, "global_step": 139575, "epoch": 3323} {"train_loss": -6.716503620147705, "global_step": 139576, "epoch": 3323} {"train_loss": -6.525775909423828, "global_step": 139577, "epoch": 3323} {"train_loss": -6.690176486968994, "global_step": 139578, "epoch": 3323} {"train_loss": -6.741708755493164, "global_step": 139579, "epoch": 3323} {"train_loss": -6.808844566345215, "global_step": 139580, "epoch": 3323} {"train_loss": -6.730627059936523, "global_step": 139581, "epoch": 3323} {"train_loss": -6.769448280334473, "global_step": 139582, "epoch": 3323} {"train_loss": -6.8414411544799805, "global_step": 139583, "epoch": 3323} {"train_loss": -6.823299407958984, "global_step": 139584, "epoch": 3323} {"train_loss": -6.777856826782227, "global_step": 139585, "epoch": 3323} {"train_loss": -6.669978141784668, "global_step": 139586, "epoch": 3323} {"train_loss": -6.778400421142578, "global_step": 139587, "epoch": 3323} {"train_loss": -6.697607040405273, "global_step": 139588, "epoch": 3323} {"train_loss": -6.776494979858398, "global_step": 139589, "epoch": 3323} {"train_loss": -6.717231750488281, "global_step": 139590, "epoch": 3323} {"train_loss": -6.806402206420898, "global_step": 139591, "epoch": 3323} {"train_loss": -6.728794097900391, "global_step": 139592, "epoch": 3323} {"train_loss": -6.752474784851074, "global_step": 139593, "epoch": 3323} {"train_loss": -6.7452898025512695, "global_step": 139594, "epoch": 3323} {"train_loss": -6.663120746612549, "global_step": 139595, "epoch": 3323} {"train_loss": -6.742311477661133, "global_step": 139596, "epoch": 3323} {"train_loss": -6.587705612182617, "global_step": 139597, "epoch": 3323} {"train_loss": -6.76962423324585, "global_step": 139598, "epoch": 3323} {"train_loss": -6.816750526428223, "global_step": 139599, "epoch": 3323} {"train_loss": -6.723361015319824, "global_step": 139600, "epoch": 3323} {"train_loss": -6.6431989669799805, "global_step": 139601, "epoch": 3323} {"train_loss": -6.5860137939453125, "global_step": 139602, "epoch": 3323} {"train_loss": -6.822219371795654, "global_step": 139603, "epoch": 3323} {"train_loss": -6.732440948486328, "global_step": 139604, "epoch": 3323} {"train_loss": -6.802019119262695, "global_step": 139605, "epoch": 3323} {"train_loss": -6.678133010864258, "global_step": 139606, "epoch": 3323} {"train_loss": -6.723531348364694, "global_step": 139607, "epoch": 3323, "val_loss": 68451.0078125} {"train_loss": -6.641130447387695, "global_step": 139608, "epoch": 3324} {"train_loss": -6.629561424255371, "global_step": 139609, "epoch": 3324} {"train_loss": -6.713741779327393, "global_step": 139610, "epoch": 3324} {"train_loss": -6.684810638427734, "global_step": 139611, "epoch": 3324} {"train_loss": -6.700218200683594, "global_step": 139612, "epoch": 3324} {"train_loss": -6.715509414672852, "global_step": 139613, "epoch": 3324} {"train_loss": -6.627747058868408, "global_step": 139614, "epoch": 3324} {"train_loss": -6.559426784515381, "global_step": 139615, "epoch": 3324} {"train_loss": -6.716108322143555, "global_step": 139616, "epoch": 3324} {"train_loss": -6.718017578125, "global_step": 139617, "epoch": 3324} {"train_loss": -6.51132869720459, "global_step": 139618, "epoch": 3324} {"train_loss": -6.6984052658081055, "global_step": 139619, "epoch": 3324} {"train_loss": -6.6519341468811035, "global_step": 139620, "epoch": 3324} {"train_loss": -6.670357704162598, "global_step": 139621, "epoch": 3324} {"train_loss": -6.70786190032959, "global_step": 139622, "epoch": 3324} {"train_loss": -6.66726016998291, "global_step": 139623, "epoch": 3324} {"train_loss": -6.749336242675781, "global_step": 139624, "epoch": 3324} {"train_loss": -6.693211555480957, "global_step": 139625, "epoch": 3324} {"train_loss": -6.647356033325195, "global_step": 139626, "epoch": 3324} {"train_loss": -6.683311462402344, "global_step": 139627, "epoch": 3324} {"train_loss": -6.7681121826171875, "global_step": 139628, "epoch": 3324} {"train_loss": -6.692404270172119, "global_step": 139629, "epoch": 3324} {"train_loss": -6.755999565124512, "global_step": 139630, "epoch": 3324} {"train_loss": -6.664813041687012, "global_step": 139631, "epoch": 3324} {"train_loss": -6.570977210998535, "global_step": 139632, "epoch": 3324} {"train_loss": -6.747537612915039, "global_step": 139633, "epoch": 3324} {"train_loss": -6.709346771240234, "global_step": 139634, "epoch": 3324} {"train_loss": -6.717122554779053, "global_step": 139635, "epoch": 3324} {"train_loss": -6.591803073883057, "global_step": 139636, "epoch": 3324} {"train_loss": -6.640573501586914, "global_step": 139637, "epoch": 3324} {"train_loss": -6.738492012023926, "global_step": 139638, "epoch": 3324} {"train_loss": -6.621003150939941, "global_step": 139639, "epoch": 3324} {"train_loss": -6.61421012878418, "global_step": 139640, "epoch": 3324} {"train_loss": -6.687143802642822, "global_step": 139641, "epoch": 3324} {"train_loss": -6.708138942718506, "global_step": 139642, "epoch": 3324} {"train_loss": -6.635889530181885, "global_step": 139643, "epoch": 3324} {"train_loss": -6.632052421569824, "global_step": 139644, "epoch": 3324} {"train_loss": -6.5519118309021, "global_step": 139645, "epoch": 3324} {"train_loss": -6.684540748596191, "global_step": 139646, "epoch": 3324} {"train_loss": -6.672521591186523, "global_step": 139647, "epoch": 3324} {"train_loss": -6.8280134201049805, "global_step": 139648, "epoch": 3324} {"train_loss": -6.671747128168742, "global_step": 139649, "epoch": 3324, "val_loss": 68406.234375} {"train_loss": -6.780294418334961, "global_step": 139650, "epoch": 3325} {"train_loss": -6.714854717254639, "global_step": 139651, "epoch": 3325} {"train_loss": -6.721229553222656, "global_step": 139652, "epoch": 3325} {"train_loss": -6.7135796546936035, "global_step": 139653, "epoch": 3325} {"train_loss": -6.824252605438232, "global_step": 139654, "epoch": 3325} {"train_loss": -6.778218746185303, "global_step": 139655, "epoch": 3325} {"train_loss": -6.823840141296387, "global_step": 139656, "epoch": 3325} {"train_loss": -6.633940696716309, "global_step": 139657, "epoch": 3325} {"train_loss": -6.809174060821533, "global_step": 139658, "epoch": 3325} {"train_loss": -6.660463333129883, "global_step": 139659, "epoch": 3325} {"train_loss": -6.762620449066162, "global_step": 139660, "epoch": 3325} {"train_loss": -6.740355491638184, "global_step": 139661, "epoch": 3325} {"train_loss": -6.700704574584961, "global_step": 139662, "epoch": 3325} {"train_loss": -6.824272632598877, "global_step": 139663, "epoch": 3325} {"train_loss": -6.768118381500244, "global_step": 139664, "epoch": 3325} {"train_loss": -6.6772661209106445, "global_step": 139665, "epoch": 3325} {"train_loss": -6.780279159545898, "global_step": 139666, "epoch": 3325} {"train_loss": -6.752158164978027, "global_step": 139667, "epoch": 3325} {"train_loss": -6.7270355224609375, "global_step": 139668, "epoch": 3325} {"train_loss": -6.80965518951416, "global_step": 139669, "epoch": 3325} {"train_loss": -6.700370788574219, "global_step": 139670, "epoch": 3325} {"train_loss": -6.883251190185547, "global_step": 139671, "epoch": 3325} {"train_loss": -6.740177154541016, "global_step": 139672, "epoch": 3325} {"train_loss": -6.797721862792969, "global_step": 139673, "epoch": 3325} {"train_loss": -6.836947917938232, "global_step": 139674, "epoch": 3325} {"train_loss": -6.776780128479004, "global_step": 139675, "epoch": 3325} {"train_loss": -6.817737102508545, "global_step": 139676, "epoch": 3325} {"train_loss": -6.8153181076049805, "global_step": 139677, "epoch": 3325} {"train_loss": -6.766919136047363, "global_step": 139678, "epoch": 3325} {"train_loss": -6.719212532043457, "global_step": 139679, "epoch": 3325} {"train_loss": -6.703325271606445, "global_step": 139680, "epoch": 3325} {"train_loss": -6.674145698547363, "global_step": 139681, "epoch": 3325} {"train_loss": -6.753270149230957, "global_step": 139682, "epoch": 3325} {"train_loss": -6.752103328704834, "global_step": 139683, "epoch": 3325} {"train_loss": -6.668506145477295, "global_step": 139684, "epoch": 3325} {"train_loss": -6.660068035125732, "global_step": 139685, "epoch": 3325} {"train_loss": -6.766550064086914, "global_step": 139686, "epoch": 3325} {"train_loss": -6.646435260772705, "global_step": 139687, "epoch": 3325} {"train_loss": -6.710783004760742, "global_step": 139688, "epoch": 3325} {"train_loss": -6.786334037780762, "global_step": 139689, "epoch": 3325} {"train_loss": -6.761323928833008, "global_step": 139690, "epoch": 3325} {"train_loss": -6.746348528634934, "global_step": 139691, "epoch": 3325, "val_loss": 68139.015625} {"train_loss": -6.7841620445251465, "global_step": 139692, "epoch": 3326} {"train_loss": -6.833270072937012, "global_step": 139693, "epoch": 3326} {"train_loss": -6.824893951416016, "global_step": 139694, "epoch": 3326} {"train_loss": -6.718723773956299, "global_step": 139695, "epoch": 3326} {"train_loss": -6.759809494018555, "global_step": 139696, "epoch": 3326} {"train_loss": -6.794661521911621, "global_step": 139697, "epoch": 3326} {"train_loss": -6.779721260070801, "global_step": 139698, "epoch": 3326} {"train_loss": -6.775336265563965, "global_step": 139699, "epoch": 3326} {"train_loss": -6.67503547668457, "global_step": 139700, "epoch": 3326} {"train_loss": -6.58485221862793, "global_step": 139701, "epoch": 3326} {"train_loss": -6.761617660522461, "global_step": 139702, "epoch": 3326} {"train_loss": -6.729907512664795, "global_step": 139703, "epoch": 3326} {"train_loss": -6.802170753479004, "global_step": 139704, "epoch": 3326} {"train_loss": -6.755846977233887, "global_step": 139705, "epoch": 3326} {"train_loss": -6.781272888183594, "global_step": 139706, "epoch": 3326} {"train_loss": -6.806254863739014, "global_step": 139707, "epoch": 3326} {"train_loss": -6.682055473327637, "global_step": 139708, "epoch": 3326} {"train_loss": -6.5922627449035645, "global_step": 139709, "epoch": 3326} {"train_loss": -6.72243070602417, "global_step": 139710, "epoch": 3326} {"train_loss": -6.828385353088379, "global_step": 139711, "epoch": 3326} {"train_loss": -6.677668571472168, "global_step": 139712, "epoch": 3326} {"train_loss": -6.756938934326172, "global_step": 139713, "epoch": 3326} {"train_loss": -6.702267646789551, "global_step": 139714, "epoch": 3326} {"train_loss": -6.753383159637451, "global_step": 139715, "epoch": 3326} {"train_loss": -6.669673442840576, "global_step": 139716, "epoch": 3326} {"train_loss": -6.764436721801758, "global_step": 139717, "epoch": 3326} {"train_loss": -6.741394996643066, "global_step": 139718, "epoch": 3326} {"train_loss": -6.663937568664551, "global_step": 139719, "epoch": 3326} {"train_loss": -6.863106727600098, "global_step": 139720, "epoch": 3326} {"train_loss": -6.686963081359863, "global_step": 139721, "epoch": 3326} {"train_loss": -6.751997947692871, "global_step": 139722, "epoch": 3326} {"train_loss": -6.708309173583984, "global_step": 139723, "epoch": 3326} {"train_loss": -6.781217098236084, "global_step": 139724, "epoch": 3326} {"train_loss": -6.797065734863281, "global_step": 139725, "epoch": 3326} {"train_loss": -6.660078048706055, "global_step": 139726, "epoch": 3326} {"train_loss": -6.782057762145996, "global_step": 139727, "epoch": 3326} {"train_loss": -6.758851051330566, "global_step": 139728, "epoch": 3326} {"train_loss": -6.773561477661133, "global_step": 139729, "epoch": 3326} {"train_loss": -6.703638076782227, "global_step": 139730, "epoch": 3326} {"train_loss": -6.735622406005859, "global_step": 139731, "epoch": 3326} {"train_loss": -6.8148980140686035, "global_step": 139732, "epoch": 3326} {"train_loss": -6.746273483548846, "global_step": 139733, "epoch": 3326, "val_loss": 68439.0390625} {"train_loss": -6.788771152496338, "global_step": 139734, "epoch": 3327} {"train_loss": -6.793186187744141, "global_step": 139735, "epoch": 3327} {"train_loss": -6.758423328399658, "global_step": 139736, "epoch": 3327} {"train_loss": -6.728184700012207, "global_step": 139737, "epoch": 3327} {"train_loss": -6.840606212615967, "global_step": 139738, "epoch": 3327} {"train_loss": -6.77337121963501, "global_step": 139739, "epoch": 3327} {"train_loss": -6.7399187088012695, "global_step": 139740, "epoch": 3327} {"train_loss": -6.802887916564941, "global_step": 139741, "epoch": 3327} {"train_loss": -6.551202297210693, "global_step": 139742, "epoch": 3327} {"train_loss": -6.770822525024414, "global_step": 139743, "epoch": 3327} {"train_loss": -6.6701531410217285, "global_step": 139744, "epoch": 3327} {"train_loss": -6.757956504821777, "global_step": 139745, "epoch": 3327} {"train_loss": -6.7375898361206055, "global_step": 139746, "epoch": 3327} {"train_loss": -6.798251152038574, "global_step": 139747, "epoch": 3327} {"train_loss": -6.628010272979736, "global_step": 139748, "epoch": 3327} {"train_loss": -6.701474666595459, "global_step": 139749, "epoch": 3327} {"train_loss": -6.798840522766113, "global_step": 139750, "epoch": 3327} {"train_loss": -6.6646246910095215, "global_step": 139751, "epoch": 3327} {"train_loss": -6.697082996368408, "global_step": 139752, "epoch": 3327} {"train_loss": -6.771076202392578, "global_step": 139753, "epoch": 3327} {"train_loss": -6.680602073669434, "global_step": 139754, "epoch": 3327} {"train_loss": -6.622768402099609, "global_step": 139755, "epoch": 3327} {"train_loss": -6.60935115814209, "global_step": 139756, "epoch": 3327} {"train_loss": -6.730835437774658, "global_step": 139757, "epoch": 3327} {"train_loss": -6.714200973510742, "global_step": 139758, "epoch": 3327} {"train_loss": -6.7678351402282715, "global_step": 139759, "epoch": 3327} {"train_loss": -6.658066749572754, "global_step": 139760, "epoch": 3327} {"train_loss": -6.657544136047363, "global_step": 139761, "epoch": 3327} {"train_loss": -6.678866863250732, "global_step": 139762, "epoch": 3327} {"train_loss": -6.568939208984375, "global_step": 139763, "epoch": 3327} {"train_loss": -6.753810882568359, "global_step": 139764, "epoch": 3327} {"train_loss": -6.622900009155273, "global_step": 139765, "epoch": 3327} {"train_loss": -6.5941267013549805, "global_step": 139766, "epoch": 3327} {"train_loss": -6.603774070739746, "global_step": 139767, "epoch": 3327} {"train_loss": -6.72188663482666, "global_step": 139768, "epoch": 3327} {"train_loss": -6.655069828033447, "global_step": 139769, "epoch": 3327} {"train_loss": -6.707147121429443, "global_step": 139770, "epoch": 3327} {"train_loss": -6.6740875244140625, "global_step": 139771, "epoch": 3327} {"train_loss": -6.6086039543151855, "global_step": 139772, "epoch": 3327} {"train_loss": -6.699161529541016, "global_step": 139773, "epoch": 3327} {"train_loss": -6.599632263183594, "global_step": 139774, "epoch": 3327} {"train_loss": -6.702778532391503, "global_step": 139775, "epoch": 3327, "val_loss": 68398.3828125} {"train_loss": -6.693303108215332, "global_step": 139776, "epoch": 3328} {"train_loss": -6.72714900970459, "global_step": 139777, "epoch": 3328} {"train_loss": -6.692038536071777, "global_step": 139778, "epoch": 3328} {"train_loss": -6.67033576965332, "global_step": 139779, "epoch": 3328} {"train_loss": -6.725909233093262, "global_step": 139780, "epoch": 3328} {"train_loss": -6.728208541870117, "global_step": 139781, "epoch": 3328} {"train_loss": -6.715810775756836, "global_step": 139782, "epoch": 3328} {"train_loss": -6.715357303619385, "global_step": 139783, "epoch": 3328} {"train_loss": -6.773898124694824, "global_step": 139784, "epoch": 3328} {"train_loss": -6.743705749511719, "global_step": 139785, "epoch": 3328} {"train_loss": -6.872027397155762, "global_step": 139786, "epoch": 3328} {"train_loss": -6.724968433380127, "global_step": 139787, "epoch": 3328} {"train_loss": -6.66998291015625, "global_step": 139788, "epoch": 3328} {"train_loss": -6.6484246253967285, "global_step": 139789, "epoch": 3328} {"train_loss": -6.632867813110352, "global_step": 139790, "epoch": 3328} {"train_loss": -6.8227081298828125, "global_step": 139791, "epoch": 3328} {"train_loss": -6.628106117248535, "global_step": 139792, "epoch": 3328} {"train_loss": -6.624439239501953, "global_step": 139793, "epoch": 3328} {"train_loss": -6.660384654998779, "global_step": 139794, "epoch": 3328} {"train_loss": -6.570032119750977, "global_step": 139795, "epoch": 3328} {"train_loss": -6.727621555328369, "global_step": 139796, "epoch": 3328} {"train_loss": -6.6552557945251465, "global_step": 139797, "epoch": 3328} {"train_loss": -6.766509056091309, "global_step": 139798, "epoch": 3328} {"train_loss": -6.754854202270508, "global_step": 139799, "epoch": 3328} {"train_loss": -6.598228454589844, "global_step": 139800, "epoch": 3328} {"train_loss": -6.7252197265625, "global_step": 139801, "epoch": 3328} {"train_loss": -6.644531726837158, "global_step": 139802, "epoch": 3328} {"train_loss": -6.7111968994140625, "global_step": 139803, "epoch": 3328} {"train_loss": -6.601639270782471, "global_step": 139804, "epoch": 3328} {"train_loss": -6.63290548324585, "global_step": 139805, "epoch": 3328} {"train_loss": -6.535074710845947, "global_step": 139806, "epoch": 3328} {"train_loss": -6.753795623779297, "global_step": 139807, "epoch": 3328} {"train_loss": -6.703839302062988, "global_step": 139808, "epoch": 3328} {"train_loss": -6.791059970855713, "global_step": 139809, "epoch": 3328} {"train_loss": -6.602419376373291, "global_step": 139810, "epoch": 3328} {"train_loss": -6.7470221519470215, "global_step": 139811, "epoch": 3328} {"train_loss": -6.703314781188965, "global_step": 139812, "epoch": 3328} {"train_loss": -6.626010894775391, "global_step": 139813, "epoch": 3328} {"train_loss": -6.733262538909912, "global_step": 139814, "epoch": 3328} {"train_loss": -6.599349021911621, "global_step": 139815, "epoch": 3328} {"train_loss": -6.677204132080078, "global_step": 139816, "epoch": 3328} {"train_loss": -6.690166813986642, "global_step": 139817, "epoch": 3328, "val_loss": 68442.1796875} {"train_loss": -6.762833595275879, "global_step": 139818, "epoch": 3329} {"train_loss": -6.620105743408203, "global_step": 139819, "epoch": 3329} {"train_loss": -6.750971794128418, "global_step": 139820, "epoch": 3329} {"train_loss": -6.560222625732422, "global_step": 139821, "epoch": 3329} {"train_loss": -6.707329750061035, "global_step": 139822, "epoch": 3329} {"train_loss": -6.564689636230469, "global_step": 139823, "epoch": 3329} {"train_loss": -6.584873199462891, "global_step": 139824, "epoch": 3329} {"train_loss": -6.766705513000488, "global_step": 139825, "epoch": 3329} {"train_loss": -6.769641399383545, "global_step": 139826, "epoch": 3329} {"train_loss": -6.75580358505249, "global_step": 139827, "epoch": 3329} {"train_loss": -6.822906970977783, "global_step": 139828, "epoch": 3329} {"train_loss": -6.719272613525391, "global_step": 139829, "epoch": 3329} {"train_loss": -6.614554405212402, "global_step": 139830, "epoch": 3329} {"train_loss": -6.726467609405518, "global_step": 139831, "epoch": 3329} {"train_loss": -6.5977373123168945, "global_step": 139832, "epoch": 3329} {"train_loss": -6.750261306762695, "global_step": 139833, "epoch": 3329} {"train_loss": -6.695499420166016, "global_step": 139834, "epoch": 3329} {"train_loss": -6.684182167053223, "global_step": 139835, "epoch": 3329} {"train_loss": -6.874774932861328, "global_step": 139836, "epoch": 3329} {"train_loss": -6.730919361114502, "global_step": 139837, "epoch": 3329} {"train_loss": -6.673999786376953, "global_step": 139838, "epoch": 3329} {"train_loss": -6.74110221862793, "global_step": 139839, "epoch": 3329} {"train_loss": -6.691367149353027, "global_step": 139840, "epoch": 3329} {"train_loss": -6.690491676330566, "global_step": 139841, "epoch": 3329} {"train_loss": -6.762135982513428, "global_step": 139842, "epoch": 3329} {"train_loss": -6.888147354125977, "global_step": 139843, "epoch": 3329} {"train_loss": -6.792303562164307, "global_step": 139844, "epoch": 3329} {"train_loss": -6.842867851257324, "global_step": 139845, "epoch": 3329} {"train_loss": -6.674391269683838, "global_step": 139846, "epoch": 3329} {"train_loss": -6.6880292892456055, "global_step": 139847, "epoch": 3329} {"train_loss": -6.6789045333862305, "global_step": 139848, "epoch": 3329} {"train_loss": -6.70164680480957, "global_step": 139849, "epoch": 3329} {"train_loss": -6.762962341308594, "global_step": 139850, "epoch": 3329} {"train_loss": -6.6971282958984375, "global_step": 139851, "epoch": 3329} {"train_loss": -6.707479000091553, "global_step": 139852, "epoch": 3329} {"train_loss": -6.724408149719238, "global_step": 139853, "epoch": 3329} {"train_loss": -6.729837894439697, "global_step": 139854, "epoch": 3329} {"train_loss": -6.6884684562683105, "global_step": 139855, "epoch": 3329} {"train_loss": -6.642904281616211, "global_step": 139856, "epoch": 3329} {"train_loss": -6.73868989944458, "global_step": 139857, "epoch": 3329} {"train_loss": -6.795949935913086, "global_step": 139858, "epoch": 3329} {"train_loss": -6.717305308296567, "global_step": 139859, "epoch": 3329, "val_loss": 68335.9375} {"train_loss": -6.756180286407471, "global_step": 139860, "epoch": 3330} {"train_loss": -6.766888618469238, "global_step": 139861, "epoch": 3330} {"train_loss": -6.741886138916016, "global_step": 139862, "epoch": 3330} {"train_loss": -6.787842750549316, "global_step": 139863, "epoch": 3330} {"train_loss": -6.777948379516602, "global_step": 139864, "epoch": 3330} {"train_loss": -6.709495544433594, "global_step": 139865, "epoch": 3330} {"train_loss": -6.805080413818359, "global_step": 139866, "epoch": 3330} {"train_loss": -6.80679988861084, "global_step": 139867, "epoch": 3330} {"train_loss": -6.772602081298828, "global_step": 139868, "epoch": 3330} {"train_loss": -6.698184490203857, "global_step": 139869, "epoch": 3330} {"train_loss": -6.83757209777832, "global_step": 139870, "epoch": 3330} {"train_loss": -6.759321689605713, "global_step": 139871, "epoch": 3330} {"train_loss": -6.663664817810059, "global_step": 139872, "epoch": 3330} {"train_loss": -6.764443397521973, "global_step": 139873, "epoch": 3330} {"train_loss": -6.710908889770508, "global_step": 139874, "epoch": 3330} {"train_loss": -6.881040573120117, "global_step": 139875, "epoch": 3330} {"train_loss": -6.7545905113220215, "global_step": 139876, "epoch": 3330} {"train_loss": -6.786174774169922, "global_step": 139877, "epoch": 3330} {"train_loss": -6.742674827575684, "global_step": 139878, "epoch": 3330} {"train_loss": -6.732346534729004, "global_step": 139879, "epoch": 3330} {"train_loss": -6.597529411315918, "global_step": 139880, "epoch": 3330} {"train_loss": -6.66749382019043, "global_step": 139881, "epoch": 3330} {"train_loss": -6.682443618774414, "global_step": 139882, "epoch": 3330} {"train_loss": -6.733136177062988, "global_step": 139883, "epoch": 3330} {"train_loss": -6.726467132568359, "global_step": 139884, "epoch": 3330} {"train_loss": -6.687841415405273, "global_step": 139885, "epoch": 3330} {"train_loss": -6.707932472229004, "global_step": 139886, "epoch": 3330} {"train_loss": -6.710940361022949, "global_step": 139887, "epoch": 3330} {"train_loss": -6.719743251800537, "global_step": 139888, "epoch": 3330} {"train_loss": -6.700839042663574, "global_step": 139889, "epoch": 3330} {"train_loss": -6.727723121643066, "global_step": 139890, "epoch": 3330} {"train_loss": -6.631188869476318, "global_step": 139891, "epoch": 3330} {"train_loss": -6.60228967666626, "global_step": 139892, "epoch": 3330} {"train_loss": -6.63719367980957, "global_step": 139893, "epoch": 3330} {"train_loss": -6.598426342010498, "global_step": 139894, "epoch": 3330} {"train_loss": -6.558277130126953, "global_step": 139895, "epoch": 3330} {"train_loss": -6.618339538574219, "global_step": 139896, "epoch": 3330} {"train_loss": -6.640758991241455, "global_step": 139897, "epoch": 3330} {"train_loss": -6.572844505310059, "global_step": 139898, "epoch": 3330} {"train_loss": -6.698203086853027, "global_step": 139899, "epoch": 3330} {"train_loss": -6.746585845947266, "global_step": 139900, "epoch": 3330} {"train_loss": -6.71178488504319, "global_step": 139901, "epoch": 3330, "val_loss": 68394.84375} {"train_loss": -6.570856094360352, "global_step": 139902, "epoch": 3331} {"train_loss": -6.711147308349609, "global_step": 139903, "epoch": 3331} {"train_loss": -6.643167495727539, "global_step": 139904, "epoch": 3331} {"train_loss": -6.549581527709961, "global_step": 139905, "epoch": 3331} {"train_loss": -6.666064739227295, "global_step": 139906, "epoch": 3331} {"train_loss": -6.594457149505615, "global_step": 139907, "epoch": 3331} {"train_loss": -6.709472179412842, "global_step": 139908, "epoch": 3331} {"train_loss": -6.618282794952393, "global_step": 139909, "epoch": 3331} {"train_loss": -6.664757251739502, "global_step": 139910, "epoch": 3331} {"train_loss": -6.707779884338379, "global_step": 139911, "epoch": 3331} {"train_loss": -6.654426574707031, "global_step": 139912, "epoch": 3331} {"train_loss": -6.756427764892578, "global_step": 139913, "epoch": 3331} {"train_loss": -6.657875061035156, "global_step": 139914, "epoch": 3331} {"train_loss": -6.660443305969238, "global_step": 139915, "epoch": 3331} {"train_loss": -6.672112464904785, "global_step": 139916, "epoch": 3331} {"train_loss": -6.79198694229126, "global_step": 139917, "epoch": 3331} {"train_loss": -6.695644378662109, "global_step": 139918, "epoch": 3331} {"train_loss": -6.728236198425293, "global_step": 139919, "epoch": 3331} {"train_loss": -6.677783012390137, "global_step": 139920, "epoch": 3331} {"train_loss": -6.789610862731934, "global_step": 139921, "epoch": 3331} {"train_loss": -6.666101455688477, "global_step": 139922, "epoch": 3331} {"train_loss": -6.732754707336426, "global_step": 139923, "epoch": 3331} {"train_loss": -6.654338836669922, "global_step": 139924, "epoch": 3331} {"train_loss": -6.70994234085083, "global_step": 139925, "epoch": 3331} {"train_loss": -6.7243242263793945, "global_step": 139926, "epoch": 3331} {"train_loss": -6.674289703369141, "global_step": 139927, "epoch": 3331} {"train_loss": -6.685212135314941, "global_step": 139928, "epoch": 3331} {"train_loss": -6.710942268371582, "global_step": 139929, "epoch": 3331} {"train_loss": -6.6800642013549805, "global_step": 139930, "epoch": 3331} {"train_loss": -6.842965602874756, "global_step": 139931, "epoch": 3331} {"train_loss": -6.536684513092041, "global_step": 139932, "epoch": 3331} {"train_loss": -6.674405097961426, "global_step": 139933, "epoch": 3331} {"train_loss": -6.682086944580078, "global_step": 139934, "epoch": 3331} {"train_loss": -6.6618332862854, "global_step": 139935, "epoch": 3331} {"train_loss": -6.788730621337891, "global_step": 139936, "epoch": 3331} {"train_loss": -6.623940467834473, "global_step": 139937, "epoch": 3331} {"train_loss": -6.557969093322754, "global_step": 139938, "epoch": 3331} {"train_loss": -6.673197269439697, "global_step": 139939, "epoch": 3331} {"train_loss": -6.4726033210754395, "global_step": 139940, "epoch": 3331} {"train_loss": -6.707606792449951, "global_step": 139941, "epoch": 3331} {"train_loss": -6.584786415100098, "global_step": 139942, "epoch": 3331} {"train_loss": -6.672806966872442, "global_step": 139943, "epoch": 3331, "val_loss": 68214.40625} {"train_loss": -6.7495222091674805, "global_step": 139944, "epoch": 3332} {"train_loss": -6.627622127532959, "global_step": 139945, "epoch": 3332} {"train_loss": -6.772584915161133, "global_step": 139946, "epoch": 3332} {"train_loss": -6.619391441345215, "global_step": 139947, "epoch": 3332} {"train_loss": -6.757959365844727, "global_step": 139948, "epoch": 3332} {"train_loss": -6.625343322753906, "global_step": 139949, "epoch": 3332} {"train_loss": -6.763106822967529, "global_step": 139950, "epoch": 3332} {"train_loss": -6.508199691772461, "global_step": 139951, "epoch": 3332} {"train_loss": -6.698067665100098, "global_step": 139952, "epoch": 3332} {"train_loss": -6.804582595825195, "global_step": 139953, "epoch": 3332} {"train_loss": -6.634137153625488, "global_step": 139954, "epoch": 3332} {"train_loss": -6.73732852935791, "global_step": 139955, "epoch": 3332} {"train_loss": -6.512377738952637, "global_step": 139956, "epoch": 3332} {"train_loss": -6.652286052703857, "global_step": 139957, "epoch": 3332} {"train_loss": -6.692619323730469, "global_step": 139958, "epoch": 3332} {"train_loss": -6.662055969238281, "global_step": 139959, "epoch": 3332} {"train_loss": -6.637242317199707, "global_step": 139960, "epoch": 3332} {"train_loss": -6.749575138092041, "global_step": 139961, "epoch": 3332} {"train_loss": -6.7258477210998535, "global_step": 139962, "epoch": 3332} {"train_loss": -6.679386138916016, "global_step": 139963, "epoch": 3332} {"train_loss": -6.729630947113037, "global_step": 139964, "epoch": 3332} {"train_loss": -6.64763069152832, "global_step": 139965, "epoch": 3332} {"train_loss": -6.7602081298828125, "global_step": 139966, "epoch": 3332} {"train_loss": -6.760285377502441, "global_step": 139967, "epoch": 3332} {"train_loss": -6.774979591369629, "global_step": 139968, "epoch": 3332} {"train_loss": -6.7043328285217285, "global_step": 139969, "epoch": 3332} {"train_loss": -6.775399684906006, "global_step": 139970, "epoch": 3332} {"train_loss": -6.711050033569336, "global_step": 139971, "epoch": 3332} {"train_loss": -6.772525787353516, "global_step": 139972, "epoch": 3332} {"train_loss": -6.8549089431762695, "global_step": 139973, "epoch": 3332} {"train_loss": -6.796140193939209, "global_step": 139974, "epoch": 3332} {"train_loss": -6.791760444641113, "global_step": 139975, "epoch": 3332} {"train_loss": -6.809444904327393, "global_step": 139976, "epoch": 3332} {"train_loss": -6.8281354904174805, "global_step": 139977, "epoch": 3332} {"train_loss": -6.797395706176758, "global_step": 139978, "epoch": 3332} {"train_loss": -6.8306989669799805, "global_step": 139979, "epoch": 3332} {"train_loss": -6.765063285827637, "global_step": 139980, "epoch": 3332} {"train_loss": -6.830415725708008, "global_step": 139981, "epoch": 3332} {"train_loss": -6.793522834777832, "global_step": 139982, "epoch": 3332} {"train_loss": -6.723649024963379, "global_step": 139983, "epoch": 3332} {"train_loss": -6.612865447998047, "global_step": 139984, "epoch": 3332} {"train_loss": -6.724717855453491, "global_step": 139985, "epoch": 3332, "val_loss": 68216.015625} {"train_loss": -6.75474739074707, "global_step": 139986, "epoch": 3333} {"train_loss": -6.752695083618164, "global_step": 139987, "epoch": 3333} {"train_loss": -6.824225902557373, "global_step": 139988, "epoch": 3333} {"train_loss": -6.850934982299805, "global_step": 139989, "epoch": 3333} {"train_loss": -6.784116744995117, "global_step": 139990, "epoch": 3333} {"train_loss": -6.7286529541015625, "global_step": 139991, "epoch": 3333} {"train_loss": -6.787655830383301, "global_step": 139992, "epoch": 3333} {"train_loss": -6.7634992599487305, "global_step": 139993, "epoch": 3333} {"train_loss": -6.871997833251953, "global_step": 139994, "epoch": 3333} {"train_loss": -6.712385177612305, "global_step": 139995, "epoch": 3333} {"train_loss": -6.797826290130615, "global_step": 139996, "epoch": 3333} {"train_loss": -6.775981903076172, "global_step": 139997, "epoch": 3333} {"train_loss": -6.680220603942871, "global_step": 139998, "epoch": 3333} {"train_loss": -6.879481315612793, "global_step": 139999, "epoch": 3333} {"train_loss": -6.612070083618164, "global_step": 140000, "epoch": 3333} {"train_loss": -6.729640960693359, "global_step": 140001, "epoch": 3333} {"train_loss": -6.834421157836914, "global_step": 140002, "epoch": 3333} {"train_loss": -6.739997863769531, "global_step": 140003, "epoch": 3333} {"train_loss": -6.725401878356934, "global_step": 140004, "epoch": 3333} {"train_loss": -6.891997337341309, "global_step": 140005, "epoch": 3333} {"train_loss": -6.746086597442627, "global_step": 140006, "epoch": 3333} {"train_loss": -6.757204532623291, "global_step": 140007, "epoch": 3333} {"train_loss": -6.771062850952148, "global_step": 140008, "epoch": 3333} {"train_loss": -6.763065814971924, "global_step": 140009, "epoch": 3333} {"train_loss": -6.726956844329834, "global_step": 140010, "epoch": 3333} {"train_loss": -6.7145280838012695, "global_step": 140011, "epoch": 3333} {"train_loss": -6.748501777648926, "global_step": 140012, "epoch": 3333} {"train_loss": -6.905648231506348, "global_step": 140013, "epoch": 3333} {"train_loss": -6.744217872619629, "global_step": 140014, "epoch": 3333} {"train_loss": -6.796876907348633, "global_step": 140015, "epoch": 3333} {"train_loss": -6.705476760864258, "global_step": 140016, "epoch": 3333} {"train_loss": -6.863836288452148, "global_step": 140017, "epoch": 3333} {"train_loss": -6.758152484893799, "global_step": 140018, "epoch": 3333} {"train_loss": -6.813680648803711, "global_step": 140019, "epoch": 3333} {"train_loss": -6.812994480133057, "global_step": 140020, "epoch": 3333} {"train_loss": -6.730175018310547, "global_step": 140021, "epoch": 3333} {"train_loss": -6.865143775939941, "global_step": 140022, "epoch": 3333} {"train_loss": -6.691070556640625, "global_step": 140023, "epoch": 3333} {"train_loss": -6.708471298217773, "global_step": 140024, "epoch": 3333} {"train_loss": -6.66731071472168, "global_step": 140025, "epoch": 3333} {"train_loss": -6.792552471160889, "global_step": 140026, "epoch": 3333} {"train_loss": -6.773642346972511, "global_step": 140027, "epoch": 3333, "val_loss": 68509.1875} {"train_loss": -6.728762626647949, "global_step": 140028, "epoch": 3334} {"train_loss": -6.779452800750732, "global_step": 140029, "epoch": 3334} {"train_loss": -6.758962631225586, "global_step": 140030, "epoch": 3334} {"train_loss": -6.711938858032227, "global_step": 140031, "epoch": 3334} {"train_loss": -6.808937072753906, "global_step": 140032, "epoch": 3334} {"train_loss": -6.703510284423828, "global_step": 140033, "epoch": 3334} {"train_loss": -6.786539077758789, "global_step": 140034, "epoch": 3334} {"train_loss": -6.811248779296875, "global_step": 140035, "epoch": 3334} {"train_loss": -6.735381126403809, "global_step": 140036, "epoch": 3334} {"train_loss": -6.778853416442871, "global_step": 140037, "epoch": 3334} {"train_loss": -6.72945499420166, "global_step": 140038, "epoch": 3334} {"train_loss": -6.779326438903809, "global_step": 140039, "epoch": 3334} {"train_loss": -6.792762756347656, "global_step": 140040, "epoch": 3334} {"train_loss": -6.64304256439209, "global_step": 140041, "epoch": 3334} {"train_loss": -6.7519378662109375, "global_step": 140042, "epoch": 3334} {"train_loss": -6.637423038482666, "global_step": 140043, "epoch": 3334} {"train_loss": -6.747140884399414, "global_step": 140044, "epoch": 3334} {"train_loss": -6.6948394775390625, "global_step": 140045, "epoch": 3334} {"train_loss": -6.734757900238037, "global_step": 140046, "epoch": 3334} {"train_loss": -6.716815948486328, "global_step": 140047, "epoch": 3334} {"train_loss": -6.6182169914245605, "global_step": 140048, "epoch": 3334} {"train_loss": -6.808564186096191, "global_step": 140049, "epoch": 3334} {"train_loss": -6.645168304443359, "global_step": 140050, "epoch": 3334} {"train_loss": -6.5769267082214355, "global_step": 140051, "epoch": 3334} {"train_loss": -6.695530891418457, "global_step": 140052, "epoch": 3334} {"train_loss": -6.517596244812012, "global_step": 140053, "epoch": 3334} {"train_loss": -6.746244430541992, "global_step": 140054, "epoch": 3334} {"train_loss": -6.530913829803467, "global_step": 140055, "epoch": 3334} {"train_loss": -6.50108528137207, "global_step": 140056, "epoch": 3334} {"train_loss": -6.603165626525879, "global_step": 140057, "epoch": 3334} {"train_loss": -6.689800262451172, "global_step": 140058, "epoch": 3334} {"train_loss": -6.566892623901367, "global_step": 140059, "epoch": 3334} {"train_loss": -6.557318687438965, "global_step": 140060, "epoch": 3334} {"train_loss": -6.579155921936035, "global_step": 140061, "epoch": 3334} {"train_loss": -6.695627689361572, "global_step": 140062, "epoch": 3334} {"train_loss": -6.779180526733398, "global_step": 140063, "epoch": 3334} {"train_loss": -6.603837966918945, "global_step": 140064, "epoch": 3334} {"train_loss": -6.6826677322387695, "global_step": 140065, "epoch": 3334} {"train_loss": -6.675568580627441, "global_step": 140066, "epoch": 3334} {"train_loss": -6.6069841384887695, "global_step": 140067, "epoch": 3334} {"train_loss": -6.594271183013916, "global_step": 140068, "epoch": 3334} {"train_loss": -6.683726481028965, "global_step": 140069, "epoch": 3334, "val_loss": 68286.5546875} {"train_loss": -6.6956634521484375, "global_step": 140070, "epoch": 3335} {"train_loss": -6.716703414916992, "global_step": 140071, "epoch": 3335} {"train_loss": -6.642199516296387, "global_step": 140072, "epoch": 3335} {"train_loss": -6.769369125366211, "global_step": 140073, "epoch": 3335} {"train_loss": -6.6305036544799805, "global_step": 140074, "epoch": 3335} {"train_loss": -6.727826118469238, "global_step": 140075, "epoch": 3335} {"train_loss": -6.701648712158203, "global_step": 140076, "epoch": 3335} {"train_loss": -6.781703948974609, "global_step": 140077, "epoch": 3335} {"train_loss": -6.734968185424805, "global_step": 140078, "epoch": 3335} {"train_loss": -6.681359767913818, "global_step": 140079, "epoch": 3335} {"train_loss": -6.620778560638428, "global_step": 140080, "epoch": 3335} {"train_loss": -6.662010192871094, "global_step": 140081, "epoch": 3335} {"train_loss": -6.736321449279785, "global_step": 140082, "epoch": 3335} {"train_loss": -6.806587219238281, "global_step": 140083, "epoch": 3335} {"train_loss": -6.720700263977051, "global_step": 140084, "epoch": 3335} {"train_loss": -6.8311662673950195, "global_step": 140085, "epoch": 3335} {"train_loss": -6.668067455291748, "global_step": 140086, "epoch": 3335} {"train_loss": -6.67819881439209, "global_step": 140087, "epoch": 3335} {"train_loss": -6.619903564453125, "global_step": 140088, "epoch": 3335} {"train_loss": -6.749952793121338, "global_step": 140089, "epoch": 3335} {"train_loss": -6.6531171798706055, "global_step": 140090, "epoch": 3335} {"train_loss": -6.737086296081543, "global_step": 140091, "epoch": 3335} {"train_loss": -6.593899250030518, "global_step": 140092, "epoch": 3335} {"train_loss": -6.471259117126465, "global_step": 140093, "epoch": 3335} {"train_loss": -6.68610954284668, "global_step": 140094, "epoch": 3335} {"train_loss": -6.618060111999512, "global_step": 140095, "epoch": 3335} {"train_loss": -6.596225261688232, "global_step": 140096, "epoch": 3335} {"train_loss": -6.685896873474121, "global_step": 140097, "epoch": 3335} {"train_loss": -6.6517438888549805, "global_step": 140098, "epoch": 3335} {"train_loss": -6.765796661376953, "global_step": 140099, "epoch": 3335} {"train_loss": -6.750273704528809, "global_step": 140100, "epoch": 3335} {"train_loss": -6.734296798706055, "global_step": 140101, "epoch": 3335} {"train_loss": -6.581066131591797, "global_step": 140102, "epoch": 3335} {"train_loss": -6.676361083984375, "global_step": 140103, "epoch": 3335} {"train_loss": -6.703020095825195, "global_step": 140104, "epoch": 3335} {"train_loss": -6.7510576248168945, "global_step": 140105, "epoch": 3335} {"train_loss": -6.632493019104004, "global_step": 140106, "epoch": 3335} {"train_loss": -6.671257495880127, "global_step": 140107, "epoch": 3335} {"train_loss": -6.795023441314697, "global_step": 140108, "epoch": 3335} {"train_loss": -6.717127799987793, "global_step": 140109, "epoch": 3335} {"train_loss": -6.764950752258301, "global_step": 140110, "epoch": 3335} {"train_loss": -6.693896804537092, "global_step": 140111, "epoch": 3335, "val_loss": 68523.03125} {"train_loss": -6.718203067779541, "global_step": 140112, "epoch": 3336} {"train_loss": -6.870970726013184, "global_step": 140113, "epoch": 3336} {"train_loss": -6.613162994384766, "global_step": 140114, "epoch": 3336} {"train_loss": -6.784209728240967, "global_step": 140115, "epoch": 3336} {"train_loss": -6.72387170791626, "global_step": 140116, "epoch": 3336} {"train_loss": -6.7362189292907715, "global_step": 140117, "epoch": 3336} {"train_loss": -6.765403747558594, "global_step": 140118, "epoch": 3336} {"train_loss": -6.7970685958862305, "global_step": 140119, "epoch": 3336} {"train_loss": -6.829227447509766, "global_step": 140120, "epoch": 3336} {"train_loss": -6.720868110656738, "global_step": 140121, "epoch": 3336} {"train_loss": -6.774581432342529, "global_step": 140122, "epoch": 3336} {"train_loss": -6.8003411293029785, "global_step": 140123, "epoch": 3336} {"train_loss": -6.777884006500244, "global_step": 140124, "epoch": 3336} {"train_loss": -6.733747482299805, "global_step": 140125, "epoch": 3336} {"train_loss": -6.685705184936523, "global_step": 140126, "epoch": 3336} {"train_loss": -6.563169002532959, "global_step": 140127, "epoch": 3336} {"train_loss": -6.740058898925781, "global_step": 140128, "epoch": 3336} {"train_loss": -6.672422885894775, "global_step": 140129, "epoch": 3336} {"train_loss": -6.687970161437988, "global_step": 140130, "epoch": 3336} {"train_loss": -6.632724285125732, "global_step": 140131, "epoch": 3336} {"train_loss": -6.662662982940674, "global_step": 140132, "epoch": 3336} {"train_loss": -6.798944473266602, "global_step": 140133, "epoch": 3336} {"train_loss": -6.742404937744141, "global_step": 140134, "epoch": 3336} {"train_loss": -6.80567741394043, "global_step": 140135, "epoch": 3336} {"train_loss": -6.701122760772705, "global_step": 140136, "epoch": 3336} {"train_loss": -6.682553768157959, "global_step": 140137, "epoch": 3336} {"train_loss": -6.670927047729492, "global_step": 140138, "epoch": 3336} {"train_loss": -6.734295845031738, "global_step": 140139, "epoch": 3336} {"train_loss": -6.656952381134033, "global_step": 140140, "epoch": 3336} {"train_loss": -6.648608207702637, "global_step": 140141, "epoch": 3336} {"train_loss": -6.614932060241699, "global_step": 140142, "epoch": 3336} {"train_loss": -6.673834800720215, "global_step": 140143, "epoch": 3336} {"train_loss": -6.777217864990234, "global_step": 140144, "epoch": 3336} {"train_loss": -6.835277557373047, "global_step": 140145, "epoch": 3336} {"train_loss": -6.725368022918701, "global_step": 140146, "epoch": 3336} {"train_loss": -6.773251533508301, "global_step": 140147, "epoch": 3336} {"train_loss": -6.602585792541504, "global_step": 140148, "epoch": 3336} {"train_loss": -6.744139194488525, "global_step": 140149, "epoch": 3336} {"train_loss": -6.86027717590332, "global_step": 140150, "epoch": 3336} {"train_loss": -6.684069633483887, "global_step": 140151, "epoch": 3336} {"train_loss": -6.669915199279785, "global_step": 140152, "epoch": 3336} {"train_loss": -6.725072009222848, "global_step": 140153, "epoch": 3336, "val_loss": 68254.0703125} {"train_loss": -6.773305892944336, "global_step": 140154, "epoch": 3337} {"train_loss": -6.786347389221191, "global_step": 140155, "epoch": 3337} {"train_loss": -6.676843643188477, "global_step": 140156, "epoch": 3337} {"train_loss": -6.68776798248291, "global_step": 140157, "epoch": 3337} {"train_loss": -6.787685871124268, "global_step": 140158, "epoch": 3337} {"train_loss": -6.6501312255859375, "global_step": 140159, "epoch": 3337} {"train_loss": -6.563920021057129, "global_step": 140160, "epoch": 3337} {"train_loss": -6.6943817138671875, "global_step": 140161, "epoch": 3337} {"train_loss": -6.466288089752197, "global_step": 140162, "epoch": 3337} {"train_loss": -6.674853324890137, "global_step": 140163, "epoch": 3337} {"train_loss": -6.763338088989258, "global_step": 140164, "epoch": 3337} {"train_loss": -6.614206314086914, "global_step": 140165, "epoch": 3337} {"train_loss": -6.665292263031006, "global_step": 140166, "epoch": 3337} {"train_loss": -6.697977066040039, "global_step": 140167, "epoch": 3337} {"train_loss": -6.716611862182617, "global_step": 140168, "epoch": 3337} {"train_loss": -6.724173545837402, "global_step": 140169, "epoch": 3337} {"train_loss": -6.775570392608643, "global_step": 140170, "epoch": 3337} {"train_loss": -6.667338848114014, "global_step": 140171, "epoch": 3337} {"train_loss": -6.638726234436035, "global_step": 140172, "epoch": 3337} {"train_loss": -6.723941802978516, "global_step": 140173, "epoch": 3337} {"train_loss": -6.708919048309326, "global_step": 140174, "epoch": 3337} {"train_loss": -6.666776657104492, "global_step": 140175, "epoch": 3337} {"train_loss": -6.684295177459717, "global_step": 140176, "epoch": 3337} {"train_loss": -6.709830284118652, "global_step": 140177, "epoch": 3337} {"train_loss": -6.646893501281738, "global_step": 140178, "epoch": 3337} {"train_loss": -6.706515789031982, "global_step": 140179, "epoch": 3337} {"train_loss": -6.677498817443848, "global_step": 140180, "epoch": 3337} {"train_loss": -6.642557144165039, "global_step": 140181, "epoch": 3337} {"train_loss": -6.748902797698975, "global_step": 140182, "epoch": 3337} {"train_loss": -6.7251482009887695, "global_step": 140183, "epoch": 3337} {"train_loss": -6.577641010284424, "global_step": 140184, "epoch": 3337} {"train_loss": -6.751224994659424, "global_step": 140185, "epoch": 3337} {"train_loss": -6.538820266723633, "global_step": 140186, "epoch": 3337} {"train_loss": -6.692850112915039, "global_step": 140187, "epoch": 3337} {"train_loss": -6.696165084838867, "global_step": 140188, "epoch": 3337} {"train_loss": -6.772228240966797, "global_step": 140189, "epoch": 3337} {"train_loss": -6.684196472167969, "global_step": 140190, "epoch": 3337} {"train_loss": -6.774387836456299, "global_step": 140191, "epoch": 3337} {"train_loss": -6.67203426361084, "global_step": 140192, "epoch": 3337} {"train_loss": -6.647696018218994, "global_step": 140193, "epoch": 3337} {"train_loss": -6.7278008460998535, "global_step": 140194, "epoch": 3337} {"train_loss": -6.690440972646077, "global_step": 140195, "epoch": 3337, "val_loss": 68289.1640625} {"train_loss": -6.741695404052734, "global_step": 140196, "epoch": 3338} {"train_loss": -6.630113124847412, "global_step": 140197, "epoch": 3338} {"train_loss": -6.794243812561035, "global_step": 140198, "epoch": 3338} {"train_loss": -6.751517295837402, "global_step": 140199, "epoch": 3338} {"train_loss": -6.728482246398926, "global_step": 140200, "epoch": 3338} {"train_loss": -6.743194580078125, "global_step": 140201, "epoch": 3338} {"train_loss": -6.75048303604126, "global_step": 140202, "epoch": 3338} {"train_loss": -6.734655380249023, "global_step": 140203, "epoch": 3338} {"train_loss": -6.781402111053467, "global_step": 140204, "epoch": 3338} {"train_loss": -6.763835906982422, "global_step": 140205, "epoch": 3338} {"train_loss": -6.77046012878418, "global_step": 140206, "epoch": 3338} {"train_loss": -6.824436187744141, "global_step": 140207, "epoch": 3338} {"train_loss": -6.7958664894104, "global_step": 140208, "epoch": 3338} {"train_loss": -6.710125923156738, "global_step": 140209, "epoch": 3338} {"train_loss": -6.8359150886535645, "global_step": 140210, "epoch": 3338} {"train_loss": -6.778154373168945, "global_step": 140211, "epoch": 3338} {"train_loss": -6.82296895980835, "global_step": 140212, "epoch": 3338} {"train_loss": -6.798525810241699, "global_step": 140213, "epoch": 3338} {"train_loss": -6.887762546539307, "global_step": 140214, "epoch": 3338} {"train_loss": -6.7984771728515625, "global_step": 140215, "epoch": 3338} {"train_loss": -6.776184558868408, "global_step": 140216, "epoch": 3338} {"train_loss": -6.688850402832031, "global_step": 140217, "epoch": 3338} {"train_loss": -6.702672958374023, "global_step": 140218, "epoch": 3338} {"train_loss": -6.678910255432129, "global_step": 140219, "epoch": 3338} {"train_loss": -6.870436191558838, "global_step": 140220, "epoch": 3338} {"train_loss": -6.813358306884766, "global_step": 140221, "epoch": 3338} {"train_loss": -6.79750919342041, "global_step": 140222, "epoch": 3338} {"train_loss": -6.779915809631348, "global_step": 140223, "epoch": 3338} {"train_loss": -6.77176570892334, "global_step": 140224, "epoch": 3338} {"train_loss": -6.770958423614502, "global_step": 140225, "epoch": 3338} {"train_loss": -6.8105268478393555, "global_step": 140226, "epoch": 3338} {"train_loss": -6.765618324279785, "global_step": 140227, "epoch": 3338} {"train_loss": -6.566519260406494, "global_step": 140228, "epoch": 3338} {"train_loss": -6.867546558380127, "global_step": 140229, "epoch": 3338} {"train_loss": -6.729615688323975, "global_step": 140230, "epoch": 3338} {"train_loss": -6.725738525390625, "global_step": 140231, "epoch": 3338} {"train_loss": -6.673487186431885, "global_step": 140232, "epoch": 3338} {"train_loss": -6.749880313873291, "global_step": 140233, "epoch": 3338} {"train_loss": -6.722119331359863, "global_step": 140234, "epoch": 3338} {"train_loss": -6.6637725830078125, "global_step": 140235, "epoch": 3338} {"train_loss": -6.793964385986328, "global_step": 140236, "epoch": 3338} {"train_loss": -6.757672877538772, "global_step": 140237, "epoch": 3338, "val_loss": 68459.3046875} {"train_loss": -6.847896575927734, "global_step": 140238, "epoch": 3339} {"train_loss": -6.776901721954346, "global_step": 140239, "epoch": 3339} {"train_loss": -6.574955940246582, "global_step": 140240, "epoch": 3339} {"train_loss": -6.771689414978027, "global_step": 140241, "epoch": 3339} {"train_loss": -6.754438400268555, "global_step": 140242, "epoch": 3339} {"train_loss": -6.678855895996094, "global_step": 140243, "epoch": 3339} {"train_loss": -6.854905128479004, "global_step": 140244, "epoch": 3339} {"train_loss": -6.73763370513916, "global_step": 140245, "epoch": 3339} {"train_loss": -6.820221900939941, "global_step": 140246, "epoch": 3339} {"train_loss": -6.701405048370361, "global_step": 140247, "epoch": 3339} {"train_loss": -6.699286937713623, "global_step": 140248, "epoch": 3339} {"train_loss": -6.723698616027832, "global_step": 140249, "epoch": 3339} {"train_loss": -6.675458908081055, "global_step": 140250, "epoch": 3339} {"train_loss": -6.8170342445373535, "global_step": 140251, "epoch": 3339} {"train_loss": -6.720585823059082, "global_step": 140252, "epoch": 3339} {"train_loss": -6.679239273071289, "global_step": 140253, "epoch": 3339} {"train_loss": -6.711228847503662, "global_step": 140254, "epoch": 3339} {"train_loss": -6.6983747482299805, "global_step": 140255, "epoch": 3339} {"train_loss": -6.717723846435547, "global_step": 140256, "epoch": 3339} {"train_loss": -6.7100934982299805, "global_step": 140257, "epoch": 3339} {"train_loss": -6.775554180145264, "global_step": 140258, "epoch": 3339} {"train_loss": -6.5822296142578125, "global_step": 140259, "epoch": 3339} {"train_loss": -6.7642974853515625, "global_step": 140260, "epoch": 3339} {"train_loss": -6.826593399047852, "global_step": 140261, "epoch": 3339} {"train_loss": -6.8124189376831055, "global_step": 140262, "epoch": 3339} {"train_loss": -6.813836097717285, "global_step": 140263, "epoch": 3339} {"train_loss": -6.720551013946533, "global_step": 140264, "epoch": 3339} {"train_loss": -6.683326244354248, "global_step": 140265, "epoch": 3339} {"train_loss": -6.753418922424316, "global_step": 140266, "epoch": 3339} {"train_loss": -6.68803596496582, "global_step": 140267, "epoch": 3339} {"train_loss": -6.684176445007324, "global_step": 140268, "epoch": 3339} {"train_loss": -6.728316307067871, "global_step": 140269, "epoch": 3339} {"train_loss": -6.704843044281006, "global_step": 140270, "epoch": 3339} {"train_loss": -6.718196392059326, "global_step": 140271, "epoch": 3339} {"train_loss": -6.702152252197266, "global_step": 140272, "epoch": 3339} {"train_loss": -6.645329475402832, "global_step": 140273, "epoch": 3339} {"train_loss": -6.4821696281433105, "global_step": 140274, "epoch": 3339} {"train_loss": -6.597062110900879, "global_step": 140275, "epoch": 3339} {"train_loss": -6.589508056640625, "global_step": 140276, "epoch": 3339} {"train_loss": -6.6905412673950195, "global_step": 140277, "epoch": 3339} {"train_loss": -6.4716644287109375, "global_step": 140278, "epoch": 3339} {"train_loss": -6.7115122590746195, "global_step": 140279, "epoch": 3339, "val_loss": 68205.6015625} {"train_loss": -6.773571014404297, "global_step": 140280, "epoch": 3340} {"train_loss": -6.672797203063965, "global_step": 140281, "epoch": 3340} {"train_loss": -6.690511703491211, "global_step": 140282, "epoch": 3340} {"train_loss": -6.797466278076172, "global_step": 140283, "epoch": 3340} {"train_loss": -6.794708251953125, "global_step": 140284, "epoch": 3340} {"train_loss": -6.6680169105529785, "global_step": 140285, "epoch": 3340} {"train_loss": -6.715639114379883, "global_step": 140286, "epoch": 3340} {"train_loss": -6.77144718170166, "global_step": 140287, "epoch": 3340} {"train_loss": -6.720434665679932, "global_step": 140288, "epoch": 3340} {"train_loss": -6.665214538574219, "global_step": 140289, "epoch": 3340} {"train_loss": -6.660000801086426, "global_step": 140290, "epoch": 3340} {"train_loss": -6.702788829803467, "global_step": 140291, "epoch": 3340} {"train_loss": -6.6477813720703125, "global_step": 140292, "epoch": 3340} {"train_loss": -6.813239097595215, "global_step": 140293, "epoch": 3340} {"train_loss": -6.715599060058594, "global_step": 140294, "epoch": 3340} {"train_loss": -6.784931182861328, "global_step": 140295, "epoch": 3340} {"train_loss": -6.684548854827881, "global_step": 140296, "epoch": 3340} {"train_loss": -6.782798767089844, "global_step": 140297, "epoch": 3340} {"train_loss": -6.735387802124023, "global_step": 140298, "epoch": 3340} {"train_loss": -6.707000732421875, "global_step": 140299, "epoch": 3340} {"train_loss": -6.717520236968994, "global_step": 140300, "epoch": 3340} {"train_loss": -6.736578941345215, "global_step": 140301, "epoch": 3340} {"train_loss": -6.774665832519531, "global_step": 140302, "epoch": 3340} {"train_loss": -6.725947380065918, "global_step": 140303, "epoch": 3340} {"train_loss": -6.777349472045898, "global_step": 140304, "epoch": 3340} {"train_loss": -6.74101448059082, "global_step": 140305, "epoch": 3340} {"train_loss": -6.727324485778809, "global_step": 140306, "epoch": 3340} {"train_loss": -6.765054225921631, "global_step": 140307, "epoch": 3340} {"train_loss": -6.724207878112793, "global_step": 140308, "epoch": 3340} {"train_loss": -6.710895538330078, "global_step": 140309, "epoch": 3340} {"train_loss": -6.710659027099609, "global_step": 140310, "epoch": 3340} {"train_loss": -6.658209800720215, "global_step": 140311, "epoch": 3340} {"train_loss": -6.658731460571289, "global_step": 140312, "epoch": 3340} {"train_loss": -6.760955810546875, "global_step": 140313, "epoch": 3340} {"train_loss": -6.691213130950928, "global_step": 140314, "epoch": 3340} {"train_loss": -6.728096961975098, "global_step": 140315, "epoch": 3340} {"train_loss": -6.702146530151367, "global_step": 140316, "epoch": 3340} {"train_loss": -6.780092716217041, "global_step": 140317, "epoch": 3340} {"train_loss": -6.655359268188477, "global_step": 140318, "epoch": 3340} {"train_loss": -6.713937759399414, "global_step": 140319, "epoch": 3340} {"train_loss": -6.748237133026123, "global_step": 140320, "epoch": 3340} {"train_loss": -6.7280451229640414, "global_step": 140321, "epoch": 3340, "val_loss": 68499.2421875} {"train_loss": -6.688966751098633, "global_step": 140322, "epoch": 3341} {"train_loss": -6.816323280334473, "global_step": 140323, "epoch": 3341} {"train_loss": -6.747245788574219, "global_step": 140324, "epoch": 3341} {"train_loss": -6.739727020263672, "global_step": 140325, "epoch": 3341} {"train_loss": -6.700231552124023, "global_step": 140326, "epoch": 3341} {"train_loss": -6.7118330001831055, "global_step": 140327, "epoch": 3341} {"train_loss": -6.755732536315918, "global_step": 140328, "epoch": 3341} {"train_loss": -6.666844367980957, "global_step": 140329, "epoch": 3341} {"train_loss": -6.697795867919922, "global_step": 140330, "epoch": 3341} {"train_loss": -6.7459235191345215, "global_step": 140331, "epoch": 3341} {"train_loss": -6.796003341674805, "global_step": 140332, "epoch": 3341} {"train_loss": -6.742084503173828, "global_step": 140333, "epoch": 3341} {"train_loss": -6.667545795440674, "global_step": 140334, "epoch": 3341} {"train_loss": -6.655322074890137, "global_step": 140335, "epoch": 3341} {"train_loss": -6.813997268676758, "global_step": 140336, "epoch": 3341} {"train_loss": -6.669301986694336, "global_step": 140337, "epoch": 3341} {"train_loss": -6.65589714050293, "global_step": 140338, "epoch": 3341} {"train_loss": -6.776313304901123, "global_step": 140339, "epoch": 3341} {"train_loss": -6.758795738220215, "global_step": 140340, "epoch": 3341} {"train_loss": -6.6201491355896, "global_step": 140341, "epoch": 3341} {"train_loss": -6.713805198669434, "global_step": 140342, "epoch": 3341} {"train_loss": -6.740543365478516, "global_step": 140343, "epoch": 3341} {"train_loss": -6.7428154945373535, "global_step": 140344, "epoch": 3341} {"train_loss": -6.6862263679504395, "global_step": 140345, "epoch": 3341} {"train_loss": -6.699938774108887, "global_step": 140346, "epoch": 3341} {"train_loss": -6.774657249450684, "global_step": 140347, "epoch": 3341} {"train_loss": -6.566097736358643, "global_step": 140348, "epoch": 3341} {"train_loss": -6.741907119750977, "global_step": 140349, "epoch": 3341} {"train_loss": -6.807219982147217, "global_step": 140350, "epoch": 3341} {"train_loss": -6.826222896575928, "global_step": 140351, "epoch": 3341} {"train_loss": -6.671814918518066, "global_step": 140352, "epoch": 3341} {"train_loss": -6.631343364715576, "global_step": 140353, "epoch": 3341} {"train_loss": -6.776887893676758, "global_step": 140354, "epoch": 3341} {"train_loss": -6.697943687438965, "global_step": 140355, "epoch": 3341} {"train_loss": -6.864612579345703, "global_step": 140356, "epoch": 3341} {"train_loss": -6.823063373565674, "global_step": 140357, "epoch": 3341} {"train_loss": -6.68669319152832, "global_step": 140358, "epoch": 3341} {"train_loss": -6.8120527267456055, "global_step": 140359, "epoch": 3341} {"train_loss": -6.6955108642578125, "global_step": 140360, "epoch": 3341} {"train_loss": -6.655134201049805, "global_step": 140361, "epoch": 3341} {"train_loss": -6.7169189453125, "global_step": 140362, "epoch": 3341} {"train_loss": -6.722580932435536, "global_step": 140363, "epoch": 3341, "val_loss": 68388.984375} {"train_loss": -6.793291091918945, "global_step": 140364, "epoch": 3342} {"train_loss": -6.699001312255859, "global_step": 140365, "epoch": 3342} {"train_loss": -6.663689613342285, "global_step": 140366, "epoch": 3342} {"train_loss": -6.808418273925781, "global_step": 140367, "epoch": 3342} {"train_loss": -6.601144790649414, "global_step": 140368, "epoch": 3342} {"train_loss": -6.645733833312988, "global_step": 140369, "epoch": 3342} {"train_loss": -6.64373779296875, "global_step": 140370, "epoch": 3342} {"train_loss": -6.620759010314941, "global_step": 140371, "epoch": 3342} {"train_loss": -6.637554168701172, "global_step": 140372, "epoch": 3342} {"train_loss": -6.6224565505981445, "global_step": 140373, "epoch": 3342} {"train_loss": -6.673737049102783, "global_step": 140374, "epoch": 3342} {"train_loss": -6.666918754577637, "global_step": 140375, "epoch": 3342} {"train_loss": -6.7811279296875, "global_step": 140376, "epoch": 3342} {"train_loss": -6.579970359802246, "global_step": 140377, "epoch": 3342} {"train_loss": -6.582149505615234, "global_step": 140378, "epoch": 3342} {"train_loss": -6.6320061683654785, "global_step": 140379, "epoch": 3342} {"train_loss": -6.681698799133301, "global_step": 140380, "epoch": 3342} {"train_loss": -6.7218804359436035, "global_step": 140381, "epoch": 3342} {"train_loss": -6.729435920715332, "global_step": 140382, "epoch": 3342} {"train_loss": -6.613944053649902, "global_step": 140383, "epoch": 3342} {"train_loss": -6.5772809982299805, "global_step": 140384, "epoch": 3342} {"train_loss": -6.710669994354248, "global_step": 140385, "epoch": 3342} {"train_loss": -6.674736976623535, "global_step": 140386, "epoch": 3342} {"train_loss": -6.694714069366455, "global_step": 140387, "epoch": 3342} {"train_loss": -6.587095260620117, "global_step": 140388, "epoch": 3342} {"train_loss": -6.6005377769470215, "global_step": 140389, "epoch": 3342} {"train_loss": -6.6904473304748535, "global_step": 140390, "epoch": 3342} {"train_loss": -6.516751766204834, "global_step": 140391, "epoch": 3342} {"train_loss": -6.684700012207031, "global_step": 140392, "epoch": 3342} {"train_loss": -6.54753303527832, "global_step": 140393, "epoch": 3342} {"train_loss": -6.636845588684082, "global_step": 140394, "epoch": 3342} {"train_loss": -6.560540199279785, "global_step": 140395, "epoch": 3342} {"train_loss": -6.600878715515137, "global_step": 140396, "epoch": 3342} {"train_loss": -6.633914947509766, "global_step": 140397, "epoch": 3342} {"train_loss": -6.56387996673584, "global_step": 140398, "epoch": 3342} {"train_loss": -6.707798480987549, "global_step": 140399, "epoch": 3342} {"train_loss": -6.607505798339844, "global_step": 140400, "epoch": 3342} {"train_loss": -6.722406387329102, "global_step": 140401, "epoch": 3342} {"train_loss": -6.549294948577881, "global_step": 140402, "epoch": 3342} {"train_loss": -6.800726890563965, "global_step": 140403, "epoch": 3342} {"train_loss": -6.615059852600098, "global_step": 140404, "epoch": 3342} {"train_loss": -6.650612865175519, "global_step": 140405, "epoch": 3342, "val_loss": 68128.28125} {"train_loss": -6.524005889892578, "global_step": 140406, "epoch": 3343} {"train_loss": -6.714186191558838, "global_step": 140407, "epoch": 3343} {"train_loss": -6.66262149810791, "global_step": 140408, "epoch": 3343} {"train_loss": -6.663094520568848, "global_step": 140409, "epoch": 3343} {"train_loss": -6.61526346206665, "global_step": 140410, "epoch": 3343} {"train_loss": -6.698814392089844, "global_step": 140411, "epoch": 3343} {"train_loss": -6.640734672546387, "global_step": 140412, "epoch": 3343} {"train_loss": -6.678039073944092, "global_step": 140413, "epoch": 3343} {"train_loss": -6.713757514953613, "global_step": 140414, "epoch": 3343} {"train_loss": -6.716692924499512, "global_step": 140415, "epoch": 3343} {"train_loss": -6.61775016784668, "global_step": 140416, "epoch": 3343} {"train_loss": -6.810276985168457, "global_step": 140417, "epoch": 3343} {"train_loss": -6.732231616973877, "global_step": 140418, "epoch": 3343} {"train_loss": -6.656239032745361, "global_step": 140419, "epoch": 3343} {"train_loss": -6.705150604248047, "global_step": 140420, "epoch": 3343} {"train_loss": -6.7060627937316895, "global_step": 140421, "epoch": 3343} {"train_loss": -6.728738784790039, "global_step": 140422, "epoch": 3343} {"train_loss": -6.802417755126953, "global_step": 140423, "epoch": 3343} {"train_loss": -6.65830135345459, "global_step": 140424, "epoch": 3343} {"train_loss": -6.700407028198242, "global_step": 140425, "epoch": 3343} {"train_loss": -6.693305969238281, "global_step": 140426, "epoch": 3343} {"train_loss": -6.698074817657471, "global_step": 140427, "epoch": 3343} {"train_loss": -6.765153884887695, "global_step": 140428, "epoch": 3343} {"train_loss": -6.625134468078613, "global_step": 140429, "epoch": 3343} {"train_loss": -6.661301136016846, "global_step": 140430, "epoch": 3343} {"train_loss": -6.808103561401367, "global_step": 140431, "epoch": 3343} {"train_loss": -6.727108955383301, "global_step": 140432, "epoch": 3343} {"train_loss": -6.794198989868164, "global_step": 140433, "epoch": 3343} {"train_loss": -6.775163650512695, "global_step": 140434, "epoch": 3343} {"train_loss": -6.777848243713379, "global_step": 140435, "epoch": 3343} {"train_loss": -6.781847953796387, "global_step": 140436, "epoch": 3343} {"train_loss": -6.643238067626953, "global_step": 140437, "epoch": 3343} {"train_loss": -6.799849510192871, "global_step": 140438, "epoch": 3343} {"train_loss": -6.807195663452148, "global_step": 140439, "epoch": 3343} {"train_loss": -6.691638946533203, "global_step": 140440, "epoch": 3343} {"train_loss": -6.840338706970215, "global_step": 140441, "epoch": 3343} {"train_loss": -6.7960124015808105, "global_step": 140442, "epoch": 3343} {"train_loss": -6.7431559562683105, "global_step": 140443, "epoch": 3343} {"train_loss": -6.750405788421631, "global_step": 140444, "epoch": 3343} {"train_loss": -6.708234786987305, "global_step": 140445, "epoch": 3343} {"train_loss": -6.745965957641602, "global_step": 140446, "epoch": 3343} {"train_loss": -6.7188686075664705, "global_step": 140447, "epoch": 3343, "val_loss": 68263.421875} {"train_loss": -6.8817291259765625, "global_step": 140448, "epoch": 3344} {"train_loss": -6.578578948974609, "global_step": 140449, "epoch": 3344} {"train_loss": -6.659929275512695, "global_step": 140450, "epoch": 3344} {"train_loss": -6.726828575134277, "global_step": 140451, "epoch": 3344} {"train_loss": -6.740511894226074, "global_step": 140452, "epoch": 3344} {"train_loss": -6.670505046844482, "global_step": 140453, "epoch": 3344} {"train_loss": -6.711422920227051, "global_step": 140454, "epoch": 3344} {"train_loss": -6.7505412101745605, "global_step": 140455, "epoch": 3344} {"train_loss": -6.7748260498046875, "global_step": 140456, "epoch": 3344} {"train_loss": -6.788714408874512, "global_step": 140457, "epoch": 3344} {"train_loss": -6.748266696929932, "global_step": 140458, "epoch": 3344} {"train_loss": -6.7256011962890625, "global_step": 140459, "epoch": 3344} {"train_loss": -6.854565620422363, "global_step": 140460, "epoch": 3344} {"train_loss": -6.703780651092529, "global_step": 140461, "epoch": 3344} {"train_loss": -6.739651679992676, "global_step": 140462, "epoch": 3344} {"train_loss": -6.760625839233398, "global_step": 140463, "epoch": 3344} {"train_loss": -6.8415021896362305, "global_step": 140464, "epoch": 3344} {"train_loss": -6.776332378387451, "global_step": 140465, "epoch": 3344} {"train_loss": -6.760289669036865, "global_step": 140466, "epoch": 3344} {"train_loss": -6.7103753089904785, "global_step": 140467, "epoch": 3344} {"train_loss": -6.748006343841553, "global_step": 140468, "epoch": 3344} {"train_loss": -6.704581260681152, "global_step": 140469, "epoch": 3344} {"train_loss": -6.717677116394043, "global_step": 140470, "epoch": 3344} {"train_loss": -6.826464653015137, "global_step": 140471, "epoch": 3344} {"train_loss": -6.751680374145508, "global_step": 140472, "epoch": 3344} {"train_loss": -6.872835159301758, "global_step": 140473, "epoch": 3344} {"train_loss": -6.728824138641357, "global_step": 140474, "epoch": 3344} {"train_loss": -6.927256107330322, "global_step": 140475, "epoch": 3344} {"train_loss": -6.773914337158203, "global_step": 140476, "epoch": 3344} {"train_loss": -6.717952251434326, "global_step": 140477, "epoch": 3344} {"train_loss": -6.789595603942871, "global_step": 140478, "epoch": 3344} {"train_loss": -6.755029678344727, "global_step": 140479, "epoch": 3344} {"train_loss": -6.710217475891113, "global_step": 140480, "epoch": 3344} {"train_loss": -6.803900718688965, "global_step": 140481, "epoch": 3344} {"train_loss": -6.638613700866699, "global_step": 140482, "epoch": 3344} {"train_loss": -6.692427158355713, "global_step": 140483, "epoch": 3344} {"train_loss": -6.745251655578613, "global_step": 140484, "epoch": 3344} {"train_loss": -6.655536651611328, "global_step": 140485, "epoch": 3344} {"train_loss": -6.719006538391113, "global_step": 140486, "epoch": 3344} {"train_loss": -6.7337799072265625, "global_step": 140487, "epoch": 3344} {"train_loss": -6.658919334411621, "global_step": 140488, "epoch": 3344} {"train_loss": -6.745920987356277, "global_step": 140489, "epoch": 3344, "val_loss": 68408.484375} {"train_loss": -6.784728050231934, "global_step": 140490, "epoch": 3345} {"train_loss": -6.762360095977783, "global_step": 140491, "epoch": 3345} {"train_loss": -6.7634382247924805, "global_step": 140492, "epoch": 3345} {"train_loss": -6.69649600982666, "global_step": 140493, "epoch": 3345} {"train_loss": -6.659111499786377, "global_step": 140494, "epoch": 3345} {"train_loss": -6.651227951049805, "global_step": 140495, "epoch": 3345} {"train_loss": -6.856164932250977, "global_step": 140496, "epoch": 3345} {"train_loss": -6.487649917602539, "global_step": 140497, "epoch": 3345} {"train_loss": -6.702873229980469, "global_step": 140498, "epoch": 3345} {"train_loss": -6.754616737365723, "global_step": 140499, "epoch": 3345} {"train_loss": -6.545604705810547, "global_step": 140500, "epoch": 3345} {"train_loss": -6.671487808227539, "global_step": 140501, "epoch": 3345} {"train_loss": -6.776926040649414, "global_step": 140502, "epoch": 3345} {"train_loss": -6.7029194831848145, "global_step": 140503, "epoch": 3345} {"train_loss": -6.705450057983398, "global_step": 140504, "epoch": 3345} {"train_loss": -6.6332926750183105, "global_step": 140505, "epoch": 3345} {"train_loss": -6.710433006286621, "global_step": 140506, "epoch": 3345} {"train_loss": -6.686404228210449, "global_step": 140507, "epoch": 3345} {"train_loss": -6.814430236816406, "global_step": 140508, "epoch": 3345} {"train_loss": -6.705428123474121, "global_step": 140509, "epoch": 3345} {"train_loss": -6.572542190551758, "global_step": 140510, "epoch": 3345} {"train_loss": -6.715470314025879, "global_step": 140511, "epoch": 3345} {"train_loss": -6.591609954833984, "global_step": 140512, "epoch": 3345} {"train_loss": -6.818953514099121, "global_step": 140513, "epoch": 3345} {"train_loss": -6.682266712188721, "global_step": 140514, "epoch": 3345} {"train_loss": -6.726339340209961, "global_step": 140515, "epoch": 3345} {"train_loss": -6.649781227111816, "global_step": 140516, "epoch": 3345} {"train_loss": -6.767455101013184, "global_step": 140517, "epoch": 3345} {"train_loss": -6.559120178222656, "global_step": 140518, "epoch": 3345} {"train_loss": -6.6952619552612305, "global_step": 140519, "epoch": 3345} {"train_loss": -6.635631561279297, "global_step": 140520, "epoch": 3345} {"train_loss": -6.679230690002441, "global_step": 140521, "epoch": 3345} {"train_loss": -6.556935787200928, "global_step": 140522, "epoch": 3345} {"train_loss": -6.760283470153809, "global_step": 140523, "epoch": 3345} {"train_loss": -6.729912757873535, "global_step": 140524, "epoch": 3345} {"train_loss": -6.670236587524414, "global_step": 140525, "epoch": 3345} {"train_loss": -6.465226173400879, "global_step": 140526, "epoch": 3345} {"train_loss": -6.793713569641113, "global_step": 140527, "epoch": 3345} {"train_loss": -6.637389183044434, "global_step": 140528, "epoch": 3345} {"train_loss": -6.624018669128418, "global_step": 140529, "epoch": 3345} {"train_loss": -6.633688449859619, "global_step": 140530, "epoch": 3345} {"train_loss": -6.682521820068359, "global_step": 140531, "epoch": 3345, "val_loss": 68181.140625} {"train_loss": -6.683477401733398, "global_step": 140532, "epoch": 3346} {"train_loss": -6.64487886428833, "global_step": 140533, "epoch": 3346} {"train_loss": -6.696173667907715, "global_step": 140534, "epoch": 3346} {"train_loss": -6.692549705505371, "global_step": 140535, "epoch": 3346} {"train_loss": -6.691844940185547, "global_step": 140536, "epoch": 3346} {"train_loss": -6.646823883056641, "global_step": 140537, "epoch": 3346} {"train_loss": -6.832963943481445, "global_step": 140538, "epoch": 3346} {"train_loss": -6.809313774108887, "global_step": 140539, "epoch": 3346} {"train_loss": -6.7019171714782715, "global_step": 140540, "epoch": 3346} {"train_loss": -6.780120372772217, "global_step": 140541, "epoch": 3346} {"train_loss": -6.710021495819092, "global_step": 140542, "epoch": 3346} {"train_loss": -6.761154651641846, "global_step": 140543, "epoch": 3346} {"train_loss": -6.733653545379639, "global_step": 140544, "epoch": 3346} {"train_loss": -6.698096752166748, "global_step": 140545, "epoch": 3346} {"train_loss": -6.715902328491211, "global_step": 140546, "epoch": 3346} {"train_loss": -6.7243242263793945, "global_step": 140547, "epoch": 3346} {"train_loss": -6.649003982543945, "global_step": 140548, "epoch": 3346} {"train_loss": -6.789939880371094, "global_step": 140549, "epoch": 3346} {"train_loss": -6.737499713897705, "global_step": 140550, "epoch": 3346} {"train_loss": -6.712522506713867, "global_step": 140551, "epoch": 3346} {"train_loss": -6.715215682983398, "global_step": 140552, "epoch": 3346} {"train_loss": -6.820971488952637, "global_step": 140553, "epoch": 3346} {"train_loss": -6.75123929977417, "global_step": 140554, "epoch": 3346} {"train_loss": -6.710850715637207, "global_step": 140555, "epoch": 3346} {"train_loss": -6.758023262023926, "global_step": 140556, "epoch": 3346} {"train_loss": -6.800467491149902, "global_step": 140557, "epoch": 3346} {"train_loss": -6.716104984283447, "global_step": 140558, "epoch": 3346} {"train_loss": -6.715429782867432, "global_step": 140559, "epoch": 3346} {"train_loss": -6.746556282043457, "global_step": 140560, "epoch": 3346} {"train_loss": -6.640625, "global_step": 140561, "epoch": 3346} {"train_loss": -6.753485679626465, "global_step": 140562, "epoch": 3346} {"train_loss": -6.762677192687988, "global_step": 140563, "epoch": 3346} {"train_loss": -6.546409606933594, "global_step": 140564, "epoch": 3346} {"train_loss": -6.8381218910217285, "global_step": 140565, "epoch": 3346} {"train_loss": -6.736320495605469, "global_step": 140566, "epoch": 3346} {"train_loss": -6.720189094543457, "global_step": 140567, "epoch": 3346} {"train_loss": -6.662747383117676, "global_step": 140568, "epoch": 3346} {"train_loss": -6.682204246520996, "global_step": 140569, "epoch": 3346} {"train_loss": -6.634434700012207, "global_step": 140570, "epoch": 3346} {"train_loss": -6.703334808349609, "global_step": 140571, "epoch": 3346} {"train_loss": -6.830927848815918, "global_step": 140572, "epoch": 3346} {"train_loss": -6.72477836835952, "global_step": 140573, "epoch": 3346, "val_loss": 68265.765625} {"train_loss": -6.798727512359619, "global_step": 140574, "epoch": 3347} {"train_loss": -6.72843074798584, "global_step": 140575, "epoch": 3347} {"train_loss": -6.7744269371032715, "global_step": 140576, "epoch": 3347} {"train_loss": -6.655247211456299, "global_step": 140577, "epoch": 3347} {"train_loss": -6.700594902038574, "global_step": 140578, "epoch": 3347} {"train_loss": -6.731748104095459, "global_step": 140579, "epoch": 3347} {"train_loss": -6.761025428771973, "global_step": 140580, "epoch": 3347} {"train_loss": -6.664628982543945, "global_step": 140581, "epoch": 3347} {"train_loss": -6.668399333953857, "global_step": 140582, "epoch": 3347} {"train_loss": -6.750910758972168, "global_step": 140583, "epoch": 3347} {"train_loss": -6.6703200340271, "global_step": 140584, "epoch": 3347} {"train_loss": -6.728564262390137, "global_step": 140585, "epoch": 3347} {"train_loss": -6.718180179595947, "global_step": 140586, "epoch": 3347} {"train_loss": -6.819091796875, "global_step": 140587, "epoch": 3347} {"train_loss": -6.6560163497924805, "global_step": 140588, "epoch": 3347} {"train_loss": -6.808789253234863, "global_step": 140589, "epoch": 3347} {"train_loss": -6.693915367126465, "global_step": 140590, "epoch": 3347} {"train_loss": -6.777803421020508, "global_step": 140591, "epoch": 3347} {"train_loss": -6.679906845092773, "global_step": 140592, "epoch": 3347} {"train_loss": -6.577101707458496, "global_step": 140593, "epoch": 3347} {"train_loss": -6.64708948135376, "global_step": 140594, "epoch": 3347} {"train_loss": -6.818173885345459, "global_step": 140595, "epoch": 3347} {"train_loss": -6.7433552742004395, "global_step": 140596, "epoch": 3347} {"train_loss": -6.738109111785889, "global_step": 140597, "epoch": 3347} {"train_loss": -6.674990653991699, "global_step": 140598, "epoch": 3347} {"train_loss": -6.761302947998047, "global_step": 140599, "epoch": 3347} {"train_loss": -6.631430149078369, "global_step": 140600, "epoch": 3347} {"train_loss": -6.71287727355957, "global_step": 140601, "epoch": 3347} {"train_loss": -6.68453311920166, "global_step": 140602, "epoch": 3347} {"train_loss": -6.658700942993164, "global_step": 140603, "epoch": 3347} {"train_loss": -6.738226413726807, "global_step": 140604, "epoch": 3347} {"train_loss": -6.715675354003906, "global_step": 140605, "epoch": 3347} {"train_loss": -6.682182312011719, "global_step": 140606, "epoch": 3347} {"train_loss": -6.712155342102051, "global_step": 140607, "epoch": 3347} {"train_loss": -6.751527309417725, "global_step": 140608, "epoch": 3347} {"train_loss": -6.661433219909668, "global_step": 140609, "epoch": 3347} {"train_loss": -6.726419448852539, "global_step": 140610, "epoch": 3347} {"train_loss": -6.749080657958984, "global_step": 140611, "epoch": 3347} {"train_loss": -6.698329925537109, "global_step": 140612, "epoch": 3347} {"train_loss": -6.63650369644165, "global_step": 140613, "epoch": 3347} {"train_loss": -6.731218338012695, "global_step": 140614, "epoch": 3347} {"train_loss": -6.71339784349714, "global_step": 140615, "epoch": 3347, "val_loss": 68387.7265625} {"train_loss": -6.697449684143066, "global_step": 140616, "epoch": 3348} {"train_loss": -6.629294395446777, "global_step": 140617, "epoch": 3348} {"train_loss": -6.778528213500977, "global_step": 140618, "epoch": 3348} {"train_loss": -6.682994842529297, "global_step": 140619, "epoch": 3348} {"train_loss": -6.7576375007629395, "global_step": 140620, "epoch": 3348} {"train_loss": -6.759879112243652, "global_step": 140621, "epoch": 3348} {"train_loss": -6.697251796722412, "global_step": 140622, "epoch": 3348} {"train_loss": -6.69257926940918, "global_step": 140623, "epoch": 3348} {"train_loss": -6.659211158752441, "global_step": 140624, "epoch": 3348} {"train_loss": -6.631422519683838, "global_step": 140625, "epoch": 3348} {"train_loss": -6.77766227722168, "global_step": 140626, "epoch": 3348} {"train_loss": -6.506194114685059, "global_step": 140627, "epoch": 3348} {"train_loss": -6.719403266906738, "global_step": 140628, "epoch": 3348} {"train_loss": -6.684032440185547, "global_step": 140629, "epoch": 3348} {"train_loss": -6.683680057525635, "global_step": 140630, "epoch": 3348} {"train_loss": -6.739804744720459, "global_step": 140631, "epoch": 3348} {"train_loss": -6.717641353607178, "global_step": 140632, "epoch": 3348} {"train_loss": -6.666266441345215, "global_step": 140633, "epoch": 3348} {"train_loss": -6.681084632873535, "global_step": 140634, "epoch": 3348} {"train_loss": -6.779325485229492, "global_step": 140635, "epoch": 3348} {"train_loss": -6.772439956665039, "global_step": 140636, "epoch": 3348} {"train_loss": -6.708731174468994, "global_step": 140637, "epoch": 3348} {"train_loss": -6.742298603057861, "global_step": 140638, "epoch": 3348} {"train_loss": -6.760787487030029, "global_step": 140639, "epoch": 3348} {"train_loss": -6.694177150726318, "global_step": 140640, "epoch": 3348} {"train_loss": -6.617475509643555, "global_step": 140641, "epoch": 3348} {"train_loss": -6.708517074584961, "global_step": 140642, "epoch": 3348} {"train_loss": -6.810275077819824, "global_step": 140643, "epoch": 3348} {"train_loss": -6.80763053894043, "global_step": 140644, "epoch": 3348} {"train_loss": -6.737753868103027, "global_step": 140645, "epoch": 3348} {"train_loss": -6.749007225036621, "global_step": 140646, "epoch": 3348} {"train_loss": -6.68511962890625, "global_step": 140647, "epoch": 3348} {"train_loss": -6.792539596557617, "global_step": 140648, "epoch": 3348} {"train_loss": -6.645570278167725, "global_step": 140649, "epoch": 3348} {"train_loss": -6.674120903015137, "global_step": 140650, "epoch": 3348} {"train_loss": -6.656039237976074, "global_step": 140651, "epoch": 3348} {"train_loss": -6.6580610275268555, "global_step": 140652, "epoch": 3348} {"train_loss": -6.741584777832031, "global_step": 140653, "epoch": 3348} {"train_loss": -6.662350177764893, "global_step": 140654, "epoch": 3348} {"train_loss": -6.678727149963379, "global_step": 140655, "epoch": 3348} {"train_loss": -6.513466835021973, "global_step": 140656, "epoch": 3348} {"train_loss": -6.697630371366229, "global_step": 140657, "epoch": 3348, "val_loss": 68156.9765625} {"train_loss": -6.7102766036987305, "global_step": 140658, "epoch": 3349} {"train_loss": -6.61883544921875, "global_step": 140659, "epoch": 3349} {"train_loss": -6.57693338394165, "global_step": 140660, "epoch": 3349} {"train_loss": -6.67165994644165, "global_step": 140661, "epoch": 3349} {"train_loss": -6.627192497253418, "global_step": 140662, "epoch": 3349} {"train_loss": -6.672417640686035, "global_step": 140663, "epoch": 3349} {"train_loss": -6.553413391113281, "global_step": 140664, "epoch": 3349} {"train_loss": -6.661676406860352, "global_step": 140665, "epoch": 3349} {"train_loss": -6.623047351837158, "global_step": 140666, "epoch": 3349} {"train_loss": -6.73280143737793, "global_step": 140667, "epoch": 3349} {"train_loss": -6.523015975952148, "global_step": 140668, "epoch": 3349} {"train_loss": -6.675472259521484, "global_step": 140669, "epoch": 3349} {"train_loss": -6.714829444885254, "global_step": 140670, "epoch": 3349} {"train_loss": -6.663193702697754, "global_step": 140671, "epoch": 3349} {"train_loss": -6.784067153930664, "global_step": 140672, "epoch": 3349} {"train_loss": -6.816651821136475, "global_step": 140673, "epoch": 3349} {"train_loss": -6.83207893371582, "global_step": 140674, "epoch": 3349} {"train_loss": -6.676036834716797, "global_step": 140675, "epoch": 3349} {"train_loss": -6.7009382247924805, "global_step": 140676, "epoch": 3349} {"train_loss": -6.780267238616943, "global_step": 140677, "epoch": 3349} {"train_loss": -6.7466020584106445, "global_step": 140678, "epoch": 3349} {"train_loss": -6.705233573913574, "global_step": 140679, "epoch": 3349} {"train_loss": -6.752084255218506, "global_step": 140680, "epoch": 3349} {"train_loss": -6.768052101135254, "global_step": 140681, "epoch": 3349} {"train_loss": -6.750847339630127, "global_step": 140682, "epoch": 3349} {"train_loss": -6.766651153564453, "global_step": 140683, "epoch": 3349} {"train_loss": -6.74428653717041, "global_step": 140684, "epoch": 3349} {"train_loss": -6.804939270019531, "global_step": 140685, "epoch": 3349} {"train_loss": -6.6784772872924805, "global_step": 140686, "epoch": 3349} {"train_loss": -6.836001873016357, "global_step": 140687, "epoch": 3349} {"train_loss": -6.672666072845459, "global_step": 140688, "epoch": 3349} {"train_loss": -6.658286094665527, "global_step": 140689, "epoch": 3349} {"train_loss": -6.8205037117004395, "global_step": 140690, "epoch": 3349} {"train_loss": -6.730107307434082, "global_step": 140691, "epoch": 3349} {"train_loss": -6.776640892028809, "global_step": 140692, "epoch": 3349} {"train_loss": -6.7150726318359375, "global_step": 140693, "epoch": 3349} {"train_loss": -6.752138137817383, "global_step": 140694, "epoch": 3349} {"train_loss": -6.7504963874816895, "global_step": 140695, "epoch": 3349} {"train_loss": -6.787067413330078, "global_step": 140696, "epoch": 3349} {"train_loss": -6.807429313659668, "global_step": 140697, "epoch": 3349} {"train_loss": -6.654537200927734, "global_step": 140698, "epoch": 3349} {"train_loss": -6.713281120572772, "global_step": 140699, "epoch": 3349, "val_loss": 68302.5859375} {"train_loss": -6.826393127441406, "global_step": 140700, "epoch": 3350} {"train_loss": -6.747368812561035, "global_step": 140701, "epoch": 3350} {"train_loss": -6.739389419555664, "global_step": 140702, "epoch": 3350} {"train_loss": -6.7876996994018555, "global_step": 140703, "epoch": 3350} {"train_loss": -6.73702335357666, "global_step": 140704, "epoch": 3350} {"train_loss": -6.844215393066406, "global_step": 140705, "epoch": 3350} {"train_loss": -6.888085842132568, "global_step": 140706, "epoch": 3350} {"train_loss": -6.831042766571045, "global_step": 140707, "epoch": 3350} {"train_loss": -6.631159782409668, "global_step": 140708, "epoch": 3350} {"train_loss": -6.779227256774902, "global_step": 140709, "epoch": 3350} {"train_loss": -6.8355889320373535, "global_step": 140710, "epoch": 3350} {"train_loss": -6.727448463439941, "global_step": 140711, "epoch": 3350} {"train_loss": -6.740264892578125, "global_step": 140712, "epoch": 3350} {"train_loss": -6.792403221130371, "global_step": 140713, "epoch": 3350} {"train_loss": -6.732676029205322, "global_step": 140714, "epoch": 3350} {"train_loss": -6.6933698654174805, "global_step": 140715, "epoch": 3350} {"train_loss": -6.8162431716918945, "global_step": 140716, "epoch": 3350} {"train_loss": -6.8267316818237305, "global_step": 140717, "epoch": 3350} {"train_loss": -6.782932758331299, "global_step": 140718, "epoch": 3350} {"train_loss": -6.869558334350586, "global_step": 140719, "epoch": 3350} {"train_loss": -6.869440078735352, "global_step": 140720, "epoch": 3350} {"train_loss": -6.69771671295166, "global_step": 140721, "epoch": 3350} {"train_loss": -6.681107521057129, "global_step": 140722, "epoch": 3350} {"train_loss": -6.724032402038574, "global_step": 140723, "epoch": 3350} {"train_loss": -6.721768856048584, "global_step": 140724, "epoch": 3350} {"train_loss": -6.793440818786621, "global_step": 140725, "epoch": 3350} {"train_loss": -6.725668430328369, "global_step": 140726, "epoch": 3350} {"train_loss": -6.786998748779297, "global_step": 140727, "epoch": 3350} {"train_loss": -6.639726638793945, "global_step": 140728, "epoch": 3350} {"train_loss": -6.704387664794922, "global_step": 140729, "epoch": 3350} {"train_loss": -6.786354064941406, "global_step": 140730, "epoch": 3350} {"train_loss": -6.746702194213867, "global_step": 140731, "epoch": 3350} {"train_loss": -6.645164489746094, "global_step": 140732, "epoch": 3350} {"train_loss": -6.643393516540527, "global_step": 140733, "epoch": 3350} {"train_loss": -6.714365005493164, "global_step": 140734, "epoch": 3350} {"train_loss": -6.618539810180664, "global_step": 140735, "epoch": 3350} {"train_loss": -6.8078789710998535, "global_step": 140736, "epoch": 3350} {"train_loss": -6.80782413482666, "global_step": 140737, "epoch": 3350} {"train_loss": -6.74876594543457, "global_step": 140738, "epoch": 3350} {"train_loss": -6.763514041900635, "global_step": 140739, "epoch": 3350} {"train_loss": -6.665267467498779, "global_step": 140740, "epoch": 3350} {"train_loss": -6.752392814272926, "global_step": 140741, "epoch": 3350, "train/sim_max_reward_0": 0.25126761522136243, "train/sim_max_reward_1": 0.9606691653892782, "train/sim_max_reward_2": 0.8486006848334149, "train/sim_max_reward_3": 0.13640744665501064, "train/sim_max_reward_4": 0.3747319662792676, "train/sim_max_reward_5": 0.9537509504611447, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.9582959289557019, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.9328813258634858, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9677398336680028, "test/sim_max_reward_4400006": 0.9951183064190614, "test/sim_max_reward_4400007": 0.7950991733261762, "test/sim_max_reward_4400008": 0.3225476971404502, "test/sim_max_reward_4400009": 0.9230414396076342, "test/sim_max_reward_4400010": 0.19132785552094603, "test/sim_max_reward_4400011": 0.9640407892438053, "test/sim_max_reward_4400012": 0.4474731593618791, "test/sim_max_reward_4400013": 0.9091458603443882, "test/sim_max_reward_4400014": 0.8463441191995623, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.02331500586364236, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2826013415496205, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9436415510481161, "test/sim_max_reward_4400023": 0.9894400642683387, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.257599141315955, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.046811346236765014, "test/sim_max_reward_4400028": 0.8247576897716132, "test/sim_max_reward_4400029": 0.030933876777263468, "test/sim_max_reward_4400030": 0.9401703252091971, "test/sim_max_reward_4400031": 0.9923952791259255, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9641273621138652, "test/sim_max_reward_4400034": 0.9852725461496533, "test/sim_max_reward_4400035": 0.9546792732562781, "test/sim_max_reward_4400036": 0.33115834113577725, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.7530061327801801, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9031337739002822, "test/sim_max_reward_4400042": 0.0914772122687692, "test/sim_max_reward_4400043": 0.8104287891083084, "test/sim_max_reward_4400044": 0.9987299221807334, "test/sim_max_reward_4400045": 0.7943307187213278, "test/sim_max_reward_4400046": 0.9359371405688444, "test/sim_max_reward_4400047": 0.9547121995212319, "test/sim_max_reward_4400048": 0.9951941147746266, "test/sim_max_reward_4400049": 0.7433899992050655, "train/mean_score": 0.5875713048065797, "test/mean_score": 0.6083491466200311, "val_loss": 68495.21875} {"train_loss": -6.695950031280518, "global_step": 140742, "epoch": 3351} {"train_loss": -6.74761962890625, "global_step": 140743, "epoch": 3351} {"train_loss": -6.655528545379639, "global_step": 140744, "epoch": 3351} {"train_loss": -6.699856281280518, "global_step": 140745, "epoch": 3351} {"train_loss": -6.679070472717285, "global_step": 140746, "epoch": 3351} {"train_loss": -6.561929702758789, "global_step": 140747, "epoch": 3351} {"train_loss": -6.656714916229248, "global_step": 140748, "epoch": 3351} {"train_loss": -6.566326141357422, "global_step": 140749, "epoch": 3351} {"train_loss": -6.699589729309082, "global_step": 140750, "epoch": 3351} {"train_loss": -6.684609889984131, "global_step": 140751, "epoch": 3351} {"train_loss": -6.647237300872803, "global_step": 140752, "epoch": 3351} {"train_loss": -6.786121368408203, "global_step": 140753, "epoch": 3351} {"train_loss": -6.586464881896973, "global_step": 140754, "epoch": 3351} {"train_loss": -6.603816032409668, "global_step": 140755, "epoch": 3351} {"train_loss": -6.739519119262695, "global_step": 140756, "epoch": 3351} {"train_loss": -6.646547317504883, "global_step": 140757, "epoch": 3351} {"train_loss": -6.673052787780762, "global_step": 140758, "epoch": 3351} {"train_loss": -6.681883335113525, "global_step": 140759, "epoch": 3351} {"train_loss": -6.693008899688721, "global_step": 140760, "epoch": 3351} {"train_loss": -6.646544933319092, "global_step": 140761, "epoch": 3351} {"train_loss": -6.70228385925293, "global_step": 140762, "epoch": 3351} {"train_loss": -6.5543718338012695, "global_step": 140763, "epoch": 3351} {"train_loss": -6.603247165679932, "global_step": 140764, "epoch": 3351} {"train_loss": -6.638643264770508, "global_step": 140765, "epoch": 3351} {"train_loss": -6.649104595184326, "global_step": 140766, "epoch": 3351} {"train_loss": -6.649412631988525, "global_step": 140767, "epoch": 3351} {"train_loss": -6.603094577789307, "global_step": 140768, "epoch": 3351} {"train_loss": -6.591164588928223, "global_step": 140769, "epoch": 3351} {"train_loss": -6.597221374511719, "global_step": 140770, "epoch": 3351} {"train_loss": -6.637914657592773, "global_step": 140771, "epoch": 3351} {"train_loss": -6.753291606903076, "global_step": 140772, "epoch": 3351} {"train_loss": -6.605010986328125, "global_step": 140773, "epoch": 3351} {"train_loss": -6.509293556213379, "global_step": 140774, "epoch": 3351} {"train_loss": -6.644023895263672, "global_step": 140775, "epoch": 3351} {"train_loss": -6.601650238037109, "global_step": 140776, "epoch": 3351} {"train_loss": -6.6205949783325195, "global_step": 140777, "epoch": 3351} {"train_loss": -6.624688148498535, "global_step": 140778, "epoch": 3351} {"train_loss": -6.6313934326171875, "global_step": 140779, "epoch": 3351} {"train_loss": -6.586130142211914, "global_step": 140780, "epoch": 3351} {"train_loss": -6.5738325119018555, "global_step": 140781, "epoch": 3351} {"train_loss": -6.7061967849731445, "global_step": 140782, "epoch": 3351} {"train_loss": -6.646274055753436, "global_step": 140783, "epoch": 3351, "val_loss": 68351.03125} {"train_loss": -6.688233852386475, "global_step": 140784, "epoch": 3352} {"train_loss": -6.595909595489502, "global_step": 140785, "epoch": 3352} {"train_loss": -6.598937034606934, "global_step": 140786, "epoch": 3352} {"train_loss": -6.704286575317383, "global_step": 140787, "epoch": 3352} {"train_loss": -6.682084560394287, "global_step": 140788, "epoch": 3352} {"train_loss": -6.749809265136719, "global_step": 140789, "epoch": 3352} {"train_loss": -6.731314659118652, "global_step": 140790, "epoch": 3352} {"train_loss": -6.668666839599609, "global_step": 140791, "epoch": 3352} {"train_loss": -6.689979076385498, "global_step": 140792, "epoch": 3352} {"train_loss": -6.663718223571777, "global_step": 140793, "epoch": 3352} {"train_loss": -6.737937927246094, "global_step": 140794, "epoch": 3352} {"train_loss": -6.707948684692383, "global_step": 140795, "epoch": 3352} {"train_loss": -6.687512397766113, "global_step": 140796, "epoch": 3352} {"train_loss": -6.767154693603516, "global_step": 140797, "epoch": 3352} {"train_loss": -6.788729667663574, "global_step": 140798, "epoch": 3352} {"train_loss": -6.705833911895752, "global_step": 140799, "epoch": 3352} {"train_loss": -6.798244476318359, "global_step": 140800, "epoch": 3352} {"train_loss": -6.741721153259277, "global_step": 140801, "epoch": 3352} {"train_loss": -6.822845935821533, "global_step": 140802, "epoch": 3352} {"train_loss": -6.683384895324707, "global_step": 140803, "epoch": 3352} {"train_loss": -6.691350936889648, "global_step": 140804, "epoch": 3352} {"train_loss": -6.789344310760498, "global_step": 140805, "epoch": 3352} {"train_loss": -6.814669132232666, "global_step": 140806, "epoch": 3352} {"train_loss": -6.777307510375977, "global_step": 140807, "epoch": 3352} {"train_loss": -6.73875093460083, "global_step": 140808, "epoch": 3352} {"train_loss": -6.863527297973633, "global_step": 140809, "epoch": 3352} {"train_loss": -6.7063140869140625, "global_step": 140810, "epoch": 3352} {"train_loss": -6.772497177124023, "global_step": 140811, "epoch": 3352} {"train_loss": -6.7666521072387695, "global_step": 140812, "epoch": 3352} {"train_loss": -6.675511360168457, "global_step": 140813, "epoch": 3352} {"train_loss": -6.814400672912598, "global_step": 140814, "epoch": 3352} {"train_loss": -6.810543060302734, "global_step": 140815, "epoch": 3352} {"train_loss": -6.754484176635742, "global_step": 140816, "epoch": 3352} {"train_loss": -6.773716449737549, "global_step": 140817, "epoch": 3352} {"train_loss": -6.758191108703613, "global_step": 140818, "epoch": 3352} {"train_loss": -6.786221504211426, "global_step": 140819, "epoch": 3352} {"train_loss": -6.851951599121094, "global_step": 140820, "epoch": 3352} {"train_loss": -6.806957244873047, "global_step": 140821, "epoch": 3352} {"train_loss": -6.69480037689209, "global_step": 140822, "epoch": 3352} {"train_loss": -6.683876991271973, "global_step": 140823, "epoch": 3352} {"train_loss": -6.726561546325684, "global_step": 140824, "epoch": 3352} {"train_loss": -6.7392667929331465, "global_step": 140825, "epoch": 3352, "val_loss": 68519.40625} {"train_loss": -6.585720062255859, "global_step": 140826, "epoch": 3353} {"train_loss": -6.709364891052246, "global_step": 140827, "epoch": 3353} {"train_loss": -6.565497398376465, "global_step": 140828, "epoch": 3353} {"train_loss": -6.656707763671875, "global_step": 140829, "epoch": 3353} {"train_loss": -6.574349403381348, "global_step": 140830, "epoch": 3353} {"train_loss": -6.644036293029785, "global_step": 140831, "epoch": 3353} {"train_loss": -6.673126220703125, "global_step": 140832, "epoch": 3353} {"train_loss": -6.662206649780273, "global_step": 140833, "epoch": 3353} {"train_loss": -6.868903160095215, "global_step": 140834, "epoch": 3353} {"train_loss": -6.72066068649292, "global_step": 140835, "epoch": 3353} {"train_loss": -6.77650260925293, "global_step": 140836, "epoch": 3353} {"train_loss": -6.7372636795043945, "global_step": 140837, "epoch": 3353} {"train_loss": -6.717663764953613, "global_step": 140838, "epoch": 3353} {"train_loss": -6.725010871887207, "global_step": 140839, "epoch": 3353} {"train_loss": -6.743562698364258, "global_step": 140840, "epoch": 3353} {"train_loss": -6.83787727355957, "global_step": 140841, "epoch": 3353} {"train_loss": -6.785895824432373, "global_step": 140842, "epoch": 3353} {"train_loss": -6.733786582946777, "global_step": 140843, "epoch": 3353} {"train_loss": -6.7754058837890625, "global_step": 140844, "epoch": 3353} {"train_loss": -6.777364730834961, "global_step": 140845, "epoch": 3353} {"train_loss": -6.825029373168945, "global_step": 140846, "epoch": 3353} {"train_loss": -6.699197292327881, "global_step": 140847, "epoch": 3353} {"train_loss": -6.743349075317383, "global_step": 140848, "epoch": 3353} {"train_loss": -6.785096645355225, "global_step": 140849, "epoch": 3353} {"train_loss": -6.670154571533203, "global_step": 140850, "epoch": 3353} {"train_loss": -6.739315032958984, "global_step": 140851, "epoch": 3353} {"train_loss": -6.700029373168945, "global_step": 140852, "epoch": 3353} {"train_loss": -6.7815775871276855, "global_step": 140853, "epoch": 3353} {"train_loss": -6.725366115570068, "global_step": 140854, "epoch": 3353} {"train_loss": -6.782256603240967, "global_step": 140855, "epoch": 3353} {"train_loss": -6.850307464599609, "global_step": 140856, "epoch": 3353} {"train_loss": -6.762419700622559, "global_step": 140857, "epoch": 3353} {"train_loss": -6.772377967834473, "global_step": 140858, "epoch": 3353} {"train_loss": -6.820084571838379, "global_step": 140859, "epoch": 3353} {"train_loss": -6.785282135009766, "global_step": 140860, "epoch": 3353} {"train_loss": -6.718622207641602, "global_step": 140861, "epoch": 3353} {"train_loss": -6.772418975830078, "global_step": 140862, "epoch": 3353} {"train_loss": -6.789927005767822, "global_step": 140863, "epoch": 3353} {"train_loss": -6.674886703491211, "global_step": 140864, "epoch": 3353} {"train_loss": -6.755406379699707, "global_step": 140865, "epoch": 3353} {"train_loss": -6.7422404289245605, "global_step": 140866, "epoch": 3353} {"train_loss": -6.735454809098017, "global_step": 140867, "epoch": 3353, "val_loss": 68353.125} {"train_loss": -6.7288289070129395, "global_step": 140868, "epoch": 3354} {"train_loss": -6.721597671508789, "global_step": 140869, "epoch": 3354} {"train_loss": -6.785045623779297, "global_step": 140870, "epoch": 3354} {"train_loss": -6.772233009338379, "global_step": 140871, "epoch": 3354} {"train_loss": -6.7807793617248535, "global_step": 140872, "epoch": 3354} {"train_loss": -6.794354438781738, "global_step": 140873, "epoch": 3354} {"train_loss": -6.798765182495117, "global_step": 140874, "epoch": 3354} {"train_loss": -6.783432483673096, "global_step": 140875, "epoch": 3354} {"train_loss": -6.823750019073486, "global_step": 140876, "epoch": 3354} {"train_loss": -6.745732307434082, "global_step": 140877, "epoch": 3354} {"train_loss": -6.776991844177246, "global_step": 140878, "epoch": 3354} {"train_loss": -6.786406517028809, "global_step": 140879, "epoch": 3354} {"train_loss": -6.754451751708984, "global_step": 140880, "epoch": 3354} {"train_loss": -6.665363788604736, "global_step": 140881, "epoch": 3354} {"train_loss": -6.760644912719727, "global_step": 140882, "epoch": 3354} {"train_loss": -6.8567914962768555, "global_step": 140883, "epoch": 3354} {"train_loss": -6.773702144622803, "global_step": 140884, "epoch": 3354} {"train_loss": -6.66716194152832, "global_step": 140885, "epoch": 3354} {"train_loss": -6.69888162612915, "global_step": 140886, "epoch": 3354} {"train_loss": -6.564946174621582, "global_step": 140887, "epoch": 3354} {"train_loss": -6.6788740158081055, "global_step": 140888, "epoch": 3354} {"train_loss": -6.684613227844238, "global_step": 140889, "epoch": 3354} {"train_loss": -6.577437400817871, "global_step": 140890, "epoch": 3354} {"train_loss": -6.712215423583984, "global_step": 140891, "epoch": 3354} {"train_loss": -6.596894264221191, "global_step": 140892, "epoch": 3354} {"train_loss": -6.6887617111206055, "global_step": 140893, "epoch": 3354} {"train_loss": -6.684601783752441, "global_step": 140894, "epoch": 3354} {"train_loss": -6.561667442321777, "global_step": 140895, "epoch": 3354} {"train_loss": -6.671362400054932, "global_step": 140896, "epoch": 3354} {"train_loss": -6.503535270690918, "global_step": 140897, "epoch": 3354} {"train_loss": -6.6590118408203125, "global_step": 140898, "epoch": 3354} {"train_loss": -6.6170806884765625, "global_step": 140899, "epoch": 3354} {"train_loss": -6.592702388763428, "global_step": 140900, "epoch": 3354} {"train_loss": -6.53125524520874, "global_step": 140901, "epoch": 3354} {"train_loss": -6.539742469787598, "global_step": 140902, "epoch": 3354} {"train_loss": -6.54216194152832, "global_step": 140903, "epoch": 3354} {"train_loss": -6.664795398712158, "global_step": 140904, "epoch": 3354} {"train_loss": -6.559521675109863, "global_step": 140905, "epoch": 3354} {"train_loss": -6.648744583129883, "global_step": 140906, "epoch": 3354} {"train_loss": -6.6193342208862305, "global_step": 140907, "epoch": 3354} {"train_loss": -6.6880412101745605, "global_step": 140908, "epoch": 3354} {"train_loss": -6.684285561243693, "global_step": 140909, "epoch": 3354, "val_loss": 68235.2578125} {"train_loss": -6.739650726318359, "global_step": 140910, "epoch": 3355} {"train_loss": -6.697472095489502, "global_step": 140911, "epoch": 3355} {"train_loss": -6.5465779304504395, "global_step": 140912, "epoch": 3355} {"train_loss": -6.770114898681641, "global_step": 140913, "epoch": 3355} {"train_loss": -6.767824172973633, "global_step": 140914, "epoch": 3355} {"train_loss": -6.616901874542236, "global_step": 140915, "epoch": 3355} {"train_loss": -6.625919342041016, "global_step": 140916, "epoch": 3355} {"train_loss": -6.758996963500977, "global_step": 140917, "epoch": 3355} {"train_loss": -6.714539527893066, "global_step": 140918, "epoch": 3355} {"train_loss": -6.700703144073486, "global_step": 140919, "epoch": 3355} {"train_loss": -6.643307209014893, "global_step": 140920, "epoch": 3355} {"train_loss": -6.561276435852051, "global_step": 140921, "epoch": 3355} {"train_loss": -6.669004440307617, "global_step": 140922, "epoch": 3355} {"train_loss": -6.670963287353516, "global_step": 140923, "epoch": 3355} {"train_loss": -6.768088340759277, "global_step": 140924, "epoch": 3355} {"train_loss": -6.656636714935303, "global_step": 140925, "epoch": 3355} {"train_loss": -6.691679954528809, "global_step": 140926, "epoch": 3355} {"train_loss": -6.709812164306641, "global_step": 140927, "epoch": 3355} {"train_loss": -6.693398952484131, "global_step": 140928, "epoch": 3355} {"train_loss": -6.6922526359558105, "global_step": 140929, "epoch": 3355} {"train_loss": -6.677167892456055, "global_step": 140930, "epoch": 3355} {"train_loss": -6.743109226226807, "global_step": 140931, "epoch": 3355} {"train_loss": -6.714815139770508, "global_step": 140932, "epoch": 3355} {"train_loss": -6.647584915161133, "global_step": 140933, "epoch": 3355} {"train_loss": -6.769420146942139, "global_step": 140934, "epoch": 3355} {"train_loss": -6.792919635772705, "global_step": 140935, "epoch": 3355} {"train_loss": -6.718897819519043, "global_step": 140936, "epoch": 3355} {"train_loss": -6.779562473297119, "global_step": 140937, "epoch": 3355} {"train_loss": -6.782276153564453, "global_step": 140938, "epoch": 3355} {"train_loss": -6.708000183105469, "global_step": 140939, "epoch": 3355} {"train_loss": -6.80426025390625, "global_step": 140940, "epoch": 3355} {"train_loss": -6.72646427154541, "global_step": 140941, "epoch": 3355} {"train_loss": -6.803839206695557, "global_step": 140942, "epoch": 3355} {"train_loss": -6.756597518920898, "global_step": 140943, "epoch": 3355} {"train_loss": -6.545198917388916, "global_step": 140944, "epoch": 3355} {"train_loss": -6.699117183685303, "global_step": 140945, "epoch": 3355} {"train_loss": -6.6171393394470215, "global_step": 140946, "epoch": 3355} {"train_loss": -6.718188285827637, "global_step": 140947, "epoch": 3355} {"train_loss": -6.693163871765137, "global_step": 140948, "epoch": 3355} {"train_loss": -6.717538833618164, "global_step": 140949, "epoch": 3355} {"train_loss": -6.758332252502441, "global_step": 140950, "epoch": 3355} {"train_loss": -6.701652220317295, "global_step": 140951, "epoch": 3355, "val_loss": 68151.96875} {"train_loss": -6.708252429962158, "global_step": 140952, "epoch": 3356} {"train_loss": -6.729846954345703, "global_step": 140953, "epoch": 3356} {"train_loss": -6.665655612945557, "global_step": 140954, "epoch": 3356} {"train_loss": -6.685388565063477, "global_step": 140955, "epoch": 3356} {"train_loss": -6.682867050170898, "global_step": 140956, "epoch": 3356} {"train_loss": -6.609755039215088, "global_step": 140957, "epoch": 3356} {"train_loss": -6.823657035827637, "global_step": 140958, "epoch": 3356} {"train_loss": -6.688544273376465, "global_step": 140959, "epoch": 3356} {"train_loss": -6.634160041809082, "global_step": 140960, "epoch": 3356} {"train_loss": -6.686737060546875, "global_step": 140961, "epoch": 3356} {"train_loss": -6.700447082519531, "global_step": 140962, "epoch": 3356} {"train_loss": -6.74085807800293, "global_step": 140963, "epoch": 3356} {"train_loss": -6.792662143707275, "global_step": 140964, "epoch": 3356} {"train_loss": -6.784712791442871, "global_step": 140965, "epoch": 3356} {"train_loss": -6.752249717712402, "global_step": 140966, "epoch": 3356} {"train_loss": -6.658321380615234, "global_step": 140967, "epoch": 3356} {"train_loss": -6.672771453857422, "global_step": 140968, "epoch": 3356} {"train_loss": -6.799507141113281, "global_step": 140969, "epoch": 3356} {"train_loss": -6.6304802894592285, "global_step": 140970, "epoch": 3356} {"train_loss": -6.5880022048950195, "global_step": 140971, "epoch": 3356} {"train_loss": -6.687090873718262, "global_step": 140972, "epoch": 3356} {"train_loss": -6.620840072631836, "global_step": 140973, "epoch": 3356} {"train_loss": -6.721470355987549, "global_step": 140974, "epoch": 3356} {"train_loss": -6.7126359939575195, "global_step": 140975, "epoch": 3356} {"train_loss": -6.716403961181641, "global_step": 140976, "epoch": 3356} {"train_loss": -6.688260078430176, "global_step": 140977, "epoch": 3356} {"train_loss": -6.784771919250488, "global_step": 140978, "epoch": 3356} {"train_loss": -6.846415996551514, "global_step": 140979, "epoch": 3356} {"train_loss": -6.781637191772461, "global_step": 140980, "epoch": 3356} {"train_loss": -6.685966968536377, "global_step": 140981, "epoch": 3356} {"train_loss": -6.664263725280762, "global_step": 140982, "epoch": 3356} {"train_loss": -6.6123151779174805, "global_step": 140983, "epoch": 3356} {"train_loss": -6.735462188720703, "global_step": 140984, "epoch": 3356} {"train_loss": -6.684272289276123, "global_step": 140985, "epoch": 3356} {"train_loss": -6.621366024017334, "global_step": 140986, "epoch": 3356} {"train_loss": -6.606124401092529, "global_step": 140987, "epoch": 3356} {"train_loss": -6.755441188812256, "global_step": 140988, "epoch": 3356} {"train_loss": -6.683753967285156, "global_step": 140989, "epoch": 3356} {"train_loss": -6.774450778961182, "global_step": 140990, "epoch": 3356} {"train_loss": -6.73325777053833, "global_step": 140991, "epoch": 3356} {"train_loss": -6.698618412017822, "global_step": 140992, "epoch": 3356} {"train_loss": -6.704656896137056, "global_step": 140993, "epoch": 3356, "val_loss": 68456.453125} {"train_loss": -6.723941326141357, "global_step": 140994, "epoch": 3357} {"train_loss": -6.70197868347168, "global_step": 140995, "epoch": 3357} {"train_loss": -6.7441864013671875, "global_step": 140996, "epoch": 3357} {"train_loss": -6.743697166442871, "global_step": 140997, "epoch": 3357} {"train_loss": -6.608721733093262, "global_step": 140998, "epoch": 3357} {"train_loss": -6.81082010269165, "global_step": 140999, "epoch": 3357} {"train_loss": -6.815064907073975, "global_step": 141000, "epoch": 3357} {"train_loss": -6.717009544372559, "global_step": 141001, "epoch": 3357} {"train_loss": -6.774758815765381, "global_step": 141002, "epoch": 3357} {"train_loss": -6.7517170906066895, "global_step": 141003, "epoch": 3357} {"train_loss": -6.717341423034668, "global_step": 141004, "epoch": 3357} {"train_loss": -6.870815753936768, "global_step": 141005, "epoch": 3357} {"train_loss": -6.827741622924805, "global_step": 141006, "epoch": 3357} {"train_loss": -6.817965030670166, "global_step": 141007, "epoch": 3357} {"train_loss": -6.678229331970215, "global_step": 141008, "epoch": 3357} {"train_loss": -6.788636207580566, "global_step": 141009, "epoch": 3357} {"train_loss": -6.718084812164307, "global_step": 141010, "epoch": 3357} {"train_loss": -6.769448280334473, "global_step": 141011, "epoch": 3357} {"train_loss": -6.746818542480469, "global_step": 141012, "epoch": 3357} {"train_loss": -6.713435173034668, "global_step": 141013, "epoch": 3357} {"train_loss": -6.7108612060546875, "global_step": 141014, "epoch": 3357} {"train_loss": -6.774330139160156, "global_step": 141015, "epoch": 3357} {"train_loss": -6.785483360290527, "global_step": 141016, "epoch": 3357} {"train_loss": -6.606858253479004, "global_step": 141017, "epoch": 3357} {"train_loss": -6.841927528381348, "global_step": 141018, "epoch": 3357} {"train_loss": -6.687597274780273, "global_step": 141019, "epoch": 3357} {"train_loss": -6.738396644592285, "global_step": 141020, "epoch": 3357} {"train_loss": -6.584184646606445, "global_step": 141021, "epoch": 3357} {"train_loss": -6.672329902648926, "global_step": 141022, "epoch": 3357} {"train_loss": -6.685924530029297, "global_step": 141023, "epoch": 3357} {"train_loss": -6.668695449829102, "global_step": 141024, "epoch": 3357} {"train_loss": -6.581939220428467, "global_step": 141025, "epoch": 3357} {"train_loss": -6.672276496887207, "global_step": 141026, "epoch": 3357} {"train_loss": -6.709387302398682, "global_step": 141027, "epoch": 3357} {"train_loss": -6.6062822341918945, "global_step": 141028, "epoch": 3357} {"train_loss": -6.685394287109375, "global_step": 141029, "epoch": 3357} {"train_loss": -6.716857433319092, "global_step": 141030, "epoch": 3357} {"train_loss": -6.821959495544434, "global_step": 141031, "epoch": 3357} {"train_loss": -6.604879379272461, "global_step": 141032, "epoch": 3357} {"train_loss": -6.78740119934082, "global_step": 141033, "epoch": 3357} {"train_loss": -6.703797340393066, "global_step": 141034, "epoch": 3357} {"train_loss": -6.72615875516619, "global_step": 141035, "epoch": 3357, "val_loss": 68353.25} {"train_loss": -6.773993015289307, "global_step": 141036, "epoch": 3358} {"train_loss": -6.747503757476807, "global_step": 141037, "epoch": 3358} {"train_loss": -6.83184289932251, "global_step": 141038, "epoch": 3358} {"train_loss": -6.918095588684082, "global_step": 141039, "epoch": 3358} {"train_loss": -6.841581344604492, "global_step": 141040, "epoch": 3358} {"train_loss": -6.840749263763428, "global_step": 141041, "epoch": 3358} {"train_loss": -6.871916770935059, "global_step": 141042, "epoch": 3358} {"train_loss": -6.753963947296143, "global_step": 141043, "epoch": 3358} {"train_loss": -6.731704235076904, "global_step": 141044, "epoch": 3358} {"train_loss": -6.751272201538086, "global_step": 141045, "epoch": 3358} {"train_loss": -6.7254228591918945, "global_step": 141046, "epoch": 3358} {"train_loss": -6.722722053527832, "global_step": 141047, "epoch": 3358} {"train_loss": -6.717278480529785, "global_step": 141048, "epoch": 3358} {"train_loss": -6.734686851501465, "global_step": 141049, "epoch": 3358} {"train_loss": -6.687471389770508, "global_step": 141050, "epoch": 3358} {"train_loss": -6.849503040313721, "global_step": 141051, "epoch": 3358} {"train_loss": -6.727424621582031, "global_step": 141052, "epoch": 3358} {"train_loss": -6.791399002075195, "global_step": 141053, "epoch": 3358} {"train_loss": -6.657890319824219, "global_step": 141054, "epoch": 3358} {"train_loss": -6.749407768249512, "global_step": 141055, "epoch": 3358} {"train_loss": -6.8251729011535645, "global_step": 141056, "epoch": 3358} {"train_loss": -6.572542190551758, "global_step": 141057, "epoch": 3358} {"train_loss": -6.690485000610352, "global_step": 141058, "epoch": 3358} {"train_loss": -6.670995712280273, "global_step": 141059, "epoch": 3358} {"train_loss": -6.612025260925293, "global_step": 141060, "epoch": 3358} {"train_loss": -6.732117652893066, "global_step": 141061, "epoch": 3358} {"train_loss": -6.742489337921143, "global_step": 141062, "epoch": 3358} {"train_loss": -6.7530012130737305, "global_step": 141063, "epoch": 3358} {"train_loss": -6.713793754577637, "global_step": 141064, "epoch": 3358} {"train_loss": -6.729551315307617, "global_step": 141065, "epoch": 3358} {"train_loss": -6.6042914390563965, "global_step": 141066, "epoch": 3358} {"train_loss": -6.795641899108887, "global_step": 141067, "epoch": 3358} {"train_loss": -6.746551990509033, "global_step": 141068, "epoch": 3358} {"train_loss": -6.672259330749512, "global_step": 141069, "epoch": 3358} {"train_loss": -6.746986389160156, "global_step": 141070, "epoch": 3358} {"train_loss": -6.591884136199951, "global_step": 141071, "epoch": 3358} {"train_loss": -6.8148674964904785, "global_step": 141072, "epoch": 3358} {"train_loss": -6.610468864440918, "global_step": 141073, "epoch": 3358} {"train_loss": -6.670493125915527, "global_step": 141074, "epoch": 3358} {"train_loss": -6.640556335449219, "global_step": 141075, "epoch": 3358} {"train_loss": -6.632821083068848, "global_step": 141076, "epoch": 3358} {"train_loss": -6.7312255132766, "global_step": 141077, "epoch": 3358, "val_loss": 68413.3125} {"train_loss": -6.626835823059082, "global_step": 141078, "epoch": 3359} {"train_loss": -6.68362283706665, "global_step": 141079, "epoch": 3359} {"train_loss": -6.659076690673828, "global_step": 141080, "epoch": 3359} {"train_loss": -6.668235778808594, "global_step": 141081, "epoch": 3359} {"train_loss": -6.864485740661621, "global_step": 141082, "epoch": 3359} {"train_loss": -6.546923637390137, "global_step": 141083, "epoch": 3359} {"train_loss": -6.645599365234375, "global_step": 141084, "epoch": 3359} {"train_loss": -6.7771196365356445, "global_step": 141085, "epoch": 3359} {"train_loss": -6.6948041915893555, "global_step": 141086, "epoch": 3359} {"train_loss": -6.797239303588867, "global_step": 141087, "epoch": 3359} {"train_loss": -6.636833190917969, "global_step": 141088, "epoch": 3359} {"train_loss": -6.80565071105957, "global_step": 141089, "epoch": 3359} {"train_loss": -6.771438121795654, "global_step": 141090, "epoch": 3359} {"train_loss": -6.748414993286133, "global_step": 141091, "epoch": 3359} {"train_loss": -6.807120323181152, "global_step": 141092, "epoch": 3359} {"train_loss": -6.771944999694824, "global_step": 141093, "epoch": 3359} {"train_loss": -6.764246940612793, "global_step": 141094, "epoch": 3359} {"train_loss": -6.597041130065918, "global_step": 141095, "epoch": 3359} {"train_loss": -6.774086952209473, "global_step": 141096, "epoch": 3359} {"train_loss": -6.661276817321777, "global_step": 141097, "epoch": 3359} {"train_loss": -6.5480637550354, "global_step": 141098, "epoch": 3359} {"train_loss": -6.676344394683838, "global_step": 141099, "epoch": 3359} {"train_loss": -6.657343864440918, "global_step": 141100, "epoch": 3359} {"train_loss": -6.560751438140869, "global_step": 141101, "epoch": 3359} {"train_loss": -6.695181369781494, "global_step": 141102, "epoch": 3359} {"train_loss": -6.6218695640563965, "global_step": 141103, "epoch": 3359} {"train_loss": -6.648334980010986, "global_step": 141104, "epoch": 3359} {"train_loss": -6.734957695007324, "global_step": 141105, "epoch": 3359} {"train_loss": -6.87625789642334, "global_step": 141106, "epoch": 3359} {"train_loss": -6.70905065536499, "global_step": 141107, "epoch": 3359} {"train_loss": -6.652413368225098, "global_step": 141108, "epoch": 3359} {"train_loss": -6.65891695022583, "global_step": 141109, "epoch": 3359} {"train_loss": -6.664417266845703, "global_step": 141110, "epoch": 3359} {"train_loss": -6.838901519775391, "global_step": 141111, "epoch": 3359} {"train_loss": -6.778518199920654, "global_step": 141112, "epoch": 3359} {"train_loss": -6.6474928855896, "global_step": 141113, "epoch": 3359} {"train_loss": -6.7177605628967285, "global_step": 141114, "epoch": 3359} {"train_loss": -6.654253005981445, "global_step": 141115, "epoch": 3359} {"train_loss": -6.65253210067749, "global_step": 141116, "epoch": 3359} {"train_loss": -6.728359222412109, "global_step": 141117, "epoch": 3359} {"train_loss": -6.716855049133301, "global_step": 141118, "epoch": 3359} {"train_loss": -6.700676611491612, "global_step": 141119, "epoch": 3359, "val_loss": 68212.921875} {"train_loss": -6.750478267669678, "global_step": 141120, "epoch": 3360} {"train_loss": -6.7762250900268555, "global_step": 141121, "epoch": 3360} {"train_loss": -6.740627288818359, "global_step": 141122, "epoch": 3360} {"train_loss": -6.73653507232666, "global_step": 141123, "epoch": 3360} {"train_loss": -6.560499668121338, "global_step": 141124, "epoch": 3360} {"train_loss": -6.678441047668457, "global_step": 141125, "epoch": 3360} {"train_loss": -6.637933731079102, "global_step": 141126, "epoch": 3360} {"train_loss": -6.557618618011475, "global_step": 141127, "epoch": 3360} {"train_loss": -6.715205192565918, "global_step": 141128, "epoch": 3360} {"train_loss": -6.661972999572754, "global_step": 141129, "epoch": 3360} {"train_loss": -6.656249046325684, "global_step": 141130, "epoch": 3360} {"train_loss": -6.754310607910156, "global_step": 141131, "epoch": 3360} {"train_loss": -6.787350654602051, "global_step": 141132, "epoch": 3360} {"train_loss": -6.7012858390808105, "global_step": 141133, "epoch": 3360} {"train_loss": -6.6381988525390625, "global_step": 141134, "epoch": 3360} {"train_loss": -6.634223937988281, "global_step": 141135, "epoch": 3360} {"train_loss": -6.689950942993164, "global_step": 141136, "epoch": 3360} {"train_loss": -6.778111457824707, "global_step": 141137, "epoch": 3360} {"train_loss": -6.587153434753418, "global_step": 141138, "epoch": 3360} {"train_loss": -6.6700286865234375, "global_step": 141139, "epoch": 3360} {"train_loss": -6.70503568649292, "global_step": 141140, "epoch": 3360} {"train_loss": -6.808685779571533, "global_step": 141141, "epoch": 3360} {"train_loss": -6.7569403648376465, "global_step": 141142, "epoch": 3360} {"train_loss": -6.710906028747559, "global_step": 141143, "epoch": 3360} {"train_loss": -6.736936092376709, "global_step": 141144, "epoch": 3360} {"train_loss": -6.647863864898682, "global_step": 141145, "epoch": 3360} {"train_loss": -6.7151641845703125, "global_step": 141146, "epoch": 3360} {"train_loss": -6.639677047729492, "global_step": 141147, "epoch": 3360} {"train_loss": -6.753778457641602, "global_step": 141148, "epoch": 3360} {"train_loss": -6.639570236206055, "global_step": 141149, "epoch": 3360} {"train_loss": -6.7336835861206055, "global_step": 141150, "epoch": 3360} {"train_loss": -6.6970438957214355, "global_step": 141151, "epoch": 3360} {"train_loss": -6.599237442016602, "global_step": 141152, "epoch": 3360} {"train_loss": -6.812944412231445, "global_step": 141153, "epoch": 3360} {"train_loss": -6.769669532775879, "global_step": 141154, "epoch": 3360} {"train_loss": -6.756588459014893, "global_step": 141155, "epoch": 3360} {"train_loss": -6.762889862060547, "global_step": 141156, "epoch": 3360} {"train_loss": -6.786594867706299, "global_step": 141157, "epoch": 3360} {"train_loss": -6.728893280029297, "global_step": 141158, "epoch": 3360} {"train_loss": -6.868691444396973, "global_step": 141159, "epoch": 3360} {"train_loss": -6.743661880493164, "global_step": 141160, "epoch": 3360} {"train_loss": -6.711377632050287, "global_step": 141161, "epoch": 3360, "val_loss": 68249.9140625} {"train_loss": -6.725061416625977, "global_step": 141162, "epoch": 3361} {"train_loss": -6.614269256591797, "global_step": 141163, "epoch": 3361} {"train_loss": -6.744279861450195, "global_step": 141164, "epoch": 3361} {"train_loss": -6.789977550506592, "global_step": 141165, "epoch": 3361} {"train_loss": -6.674698352813721, "global_step": 141166, "epoch": 3361} {"train_loss": -6.643939971923828, "global_step": 141167, "epoch": 3361} {"train_loss": -6.6817169189453125, "global_step": 141168, "epoch": 3361} {"train_loss": -6.740853309631348, "global_step": 141169, "epoch": 3361} {"train_loss": -6.655639171600342, "global_step": 141170, "epoch": 3361} {"train_loss": -6.814949989318848, "global_step": 141171, "epoch": 3361} {"train_loss": -6.769170761108398, "global_step": 141172, "epoch": 3361} {"train_loss": -6.712839603424072, "global_step": 141173, "epoch": 3361} {"train_loss": -6.686655044555664, "global_step": 141174, "epoch": 3361} {"train_loss": -6.720147132873535, "global_step": 141175, "epoch": 3361} {"train_loss": -6.744017601013184, "global_step": 141176, "epoch": 3361} {"train_loss": -6.72686767578125, "global_step": 141177, "epoch": 3361} {"train_loss": -6.876579284667969, "global_step": 141178, "epoch": 3361} {"train_loss": -6.759693145751953, "global_step": 141179, "epoch": 3361} {"train_loss": -6.726780891418457, "global_step": 141180, "epoch": 3361} {"train_loss": -6.832158088684082, "global_step": 141181, "epoch": 3361} {"train_loss": -6.825048446655273, "global_step": 141182, "epoch": 3361} {"train_loss": -6.835826873779297, "global_step": 141183, "epoch": 3361} {"train_loss": -6.774069786071777, "global_step": 141184, "epoch": 3361} {"train_loss": -6.827592849731445, "global_step": 141185, "epoch": 3361} {"train_loss": -6.685154914855957, "global_step": 141186, "epoch": 3361} {"train_loss": -6.788458824157715, "global_step": 141187, "epoch": 3361} {"train_loss": -6.8358659744262695, "global_step": 141188, "epoch": 3361} {"train_loss": -6.830477714538574, "global_step": 141189, "epoch": 3361} {"train_loss": -6.848278045654297, "global_step": 141190, "epoch": 3361} {"train_loss": -6.876168251037598, "global_step": 141191, "epoch": 3361} {"train_loss": -6.767329216003418, "global_step": 141192, "epoch": 3361} {"train_loss": -6.898385047912598, "global_step": 141193, "epoch": 3361} {"train_loss": -6.752093315124512, "global_step": 141194, "epoch": 3361} {"train_loss": -6.664688587188721, "global_step": 141195, "epoch": 3361} {"train_loss": -6.881209373474121, "global_step": 141196, "epoch": 3361} {"train_loss": -6.7743096351623535, "global_step": 141197, "epoch": 3361} {"train_loss": -6.801962375640869, "global_step": 141198, "epoch": 3361} {"train_loss": -6.740935325622559, "global_step": 141199, "epoch": 3361} {"train_loss": -6.711556911468506, "global_step": 141200, "epoch": 3361} {"train_loss": -6.686903953552246, "global_step": 141201, "epoch": 3361} {"train_loss": -6.638225555419922, "global_step": 141202, "epoch": 3361} {"train_loss": -6.757871321269444, "global_step": 141203, "epoch": 3361, "val_loss": 68386.015625} {"train_loss": -6.623089790344238, "global_step": 141204, "epoch": 3362} {"train_loss": -6.789999485015869, "global_step": 141205, "epoch": 3362} {"train_loss": -6.77426815032959, "global_step": 141206, "epoch": 3362} {"train_loss": -6.669104099273682, "global_step": 141207, "epoch": 3362} {"train_loss": -6.807609558105469, "global_step": 141208, "epoch": 3362} {"train_loss": -6.64886474609375, "global_step": 141209, "epoch": 3362} {"train_loss": -6.739266872406006, "global_step": 141210, "epoch": 3362} {"train_loss": -6.700794219970703, "global_step": 141211, "epoch": 3362} {"train_loss": -6.669079780578613, "global_step": 141212, "epoch": 3362} {"train_loss": -6.768755912780762, "global_step": 141213, "epoch": 3362} {"train_loss": -6.662508487701416, "global_step": 141214, "epoch": 3362} {"train_loss": -6.508762359619141, "global_step": 141215, "epoch": 3362} {"train_loss": -6.763245105743408, "global_step": 141216, "epoch": 3362} {"train_loss": -6.807844161987305, "global_step": 141217, "epoch": 3362} {"train_loss": -6.603601932525635, "global_step": 141218, "epoch": 3362} {"train_loss": -6.704819679260254, "global_step": 141219, "epoch": 3362} {"train_loss": -6.677187442779541, "global_step": 141220, "epoch": 3362} {"train_loss": -6.669730186462402, "global_step": 141221, "epoch": 3362} {"train_loss": -6.73020601272583, "global_step": 141222, "epoch": 3362} {"train_loss": -6.733625411987305, "global_step": 141223, "epoch": 3362} {"train_loss": -6.77901554107666, "global_step": 141224, "epoch": 3362} {"train_loss": -6.61946439743042, "global_step": 141225, "epoch": 3362} {"train_loss": -6.713372230529785, "global_step": 141226, "epoch": 3362} {"train_loss": -6.714193820953369, "global_step": 141227, "epoch": 3362} {"train_loss": -6.639339923858643, "global_step": 141228, "epoch": 3362} {"train_loss": -6.652932167053223, "global_step": 141229, "epoch": 3362} {"train_loss": -6.674685478210449, "global_step": 141230, "epoch": 3362} {"train_loss": -6.664815902709961, "global_step": 141231, "epoch": 3362} {"train_loss": -6.5845537185668945, "global_step": 141232, "epoch": 3362} {"train_loss": -6.573480606079102, "global_step": 141233, "epoch": 3362} {"train_loss": -6.695291042327881, "global_step": 141234, "epoch": 3362} {"train_loss": -6.651577949523926, "global_step": 141235, "epoch": 3362} {"train_loss": -6.718829154968262, "global_step": 141236, "epoch": 3362} {"train_loss": -6.668049335479736, "global_step": 141237, "epoch": 3362} {"train_loss": -6.7844038009643555, "global_step": 141238, "epoch": 3362} {"train_loss": -6.801116943359375, "global_step": 141239, "epoch": 3362} {"train_loss": -6.636361122131348, "global_step": 141240, "epoch": 3362} {"train_loss": -6.781278610229492, "global_step": 141241, "epoch": 3362} {"train_loss": -6.743020534515381, "global_step": 141242, "epoch": 3362} {"train_loss": -6.697275638580322, "global_step": 141243, "epoch": 3362} {"train_loss": -6.712288856506348, "global_step": 141244, "epoch": 3362} {"train_loss": -6.69734331539699, "global_step": 141245, "epoch": 3362, "val_loss": 68345.4140625} {"train_loss": -6.715165138244629, "global_step": 141246, "epoch": 3363} {"train_loss": -6.737163543701172, "global_step": 141247, "epoch": 3363} {"train_loss": -6.8302812576293945, "global_step": 141248, "epoch": 3363} {"train_loss": -6.736968994140625, "global_step": 141249, "epoch": 3363} {"train_loss": -6.638091087341309, "global_step": 141250, "epoch": 3363} {"train_loss": -6.662117004394531, "global_step": 141251, "epoch": 3363} {"train_loss": -6.763047695159912, "global_step": 141252, "epoch": 3363} {"train_loss": -6.842798709869385, "global_step": 141253, "epoch": 3363} {"train_loss": -6.686556816101074, "global_step": 141254, "epoch": 3363} {"train_loss": -6.810834884643555, "global_step": 141255, "epoch": 3363} {"train_loss": -6.742161273956299, "global_step": 141256, "epoch": 3363} {"train_loss": -6.7295732498168945, "global_step": 141257, "epoch": 3363} {"train_loss": -6.80601692199707, "global_step": 141258, "epoch": 3363} {"train_loss": -6.837094306945801, "global_step": 141259, "epoch": 3363} {"train_loss": -6.715417861938477, "global_step": 141260, "epoch": 3363} {"train_loss": -6.753251075744629, "global_step": 141261, "epoch": 3363} {"train_loss": -6.7573370933532715, "global_step": 141262, "epoch": 3363} {"train_loss": -6.73411750793457, "global_step": 141263, "epoch": 3363} {"train_loss": -6.730301856994629, "global_step": 141264, "epoch": 3363} {"train_loss": -6.8136186599731445, "global_step": 141265, "epoch": 3363} {"train_loss": -6.7998480796813965, "global_step": 141266, "epoch": 3363} {"train_loss": -6.84830904006958, "global_step": 141267, "epoch": 3363} {"train_loss": -6.797752380371094, "global_step": 141268, "epoch": 3363} {"train_loss": -6.791290283203125, "global_step": 141269, "epoch": 3363} {"train_loss": -6.732371807098389, "global_step": 141270, "epoch": 3363} {"train_loss": -6.79396390914917, "global_step": 141271, "epoch": 3363} {"train_loss": -6.58867073059082, "global_step": 141272, "epoch": 3363} {"train_loss": -6.704975128173828, "global_step": 141273, "epoch": 3363} {"train_loss": -6.616235256195068, "global_step": 141274, "epoch": 3363} {"train_loss": -6.54075813293457, "global_step": 141275, "epoch": 3363} {"train_loss": -6.668872356414795, "global_step": 141276, "epoch": 3363} {"train_loss": -6.549286365509033, "global_step": 141277, "epoch": 3363} {"train_loss": -6.715308666229248, "global_step": 141278, "epoch": 3363} {"train_loss": -6.6834893226623535, "global_step": 141279, "epoch": 3363} {"train_loss": -6.607746601104736, "global_step": 141280, "epoch": 3363} {"train_loss": -6.724596977233887, "global_step": 141281, "epoch": 3363} {"train_loss": -6.627358436584473, "global_step": 141282, "epoch": 3363} {"train_loss": -6.69235372543335, "global_step": 141283, "epoch": 3363} {"train_loss": -6.717378616333008, "global_step": 141284, "epoch": 3363} {"train_loss": -6.723433017730713, "global_step": 141285, "epoch": 3363} {"train_loss": -6.68167781829834, "global_step": 141286, "epoch": 3363} {"train_loss": -6.722221181506202, "global_step": 141287, "epoch": 3363, "val_loss": 68382.7578125} {"train_loss": -6.673996448516846, "global_step": 141288, "epoch": 3364} {"train_loss": -6.852207183837891, "global_step": 141289, "epoch": 3364} {"train_loss": -6.761188983917236, "global_step": 141290, "epoch": 3364} {"train_loss": -6.5751848220825195, "global_step": 141291, "epoch": 3364} {"train_loss": -6.712139129638672, "global_step": 141292, "epoch": 3364} {"train_loss": -6.781661510467529, "global_step": 141293, "epoch": 3364} {"train_loss": -6.650686264038086, "global_step": 141294, "epoch": 3364} {"train_loss": -6.799260139465332, "global_step": 141295, "epoch": 3364} {"train_loss": -6.7509307861328125, "global_step": 141296, "epoch": 3364} {"train_loss": -6.6673126220703125, "global_step": 141297, "epoch": 3364} {"train_loss": -6.679765701293945, "global_step": 141298, "epoch": 3364} {"train_loss": -6.70001220703125, "global_step": 141299, "epoch": 3364} {"train_loss": -6.637342929840088, "global_step": 141300, "epoch": 3364} {"train_loss": -6.762837886810303, "global_step": 141301, "epoch": 3364} {"train_loss": -6.7653703689575195, "global_step": 141302, "epoch": 3364} {"train_loss": -6.663455963134766, "global_step": 141303, "epoch": 3364} {"train_loss": -6.714415550231934, "global_step": 141304, "epoch": 3364} {"train_loss": -6.629299163818359, "global_step": 141305, "epoch": 3364} {"train_loss": -6.596912384033203, "global_step": 141306, "epoch": 3364} {"train_loss": -6.615775108337402, "global_step": 141307, "epoch": 3364} {"train_loss": -6.606175422668457, "global_step": 141308, "epoch": 3364} {"train_loss": -6.572409152984619, "global_step": 141309, "epoch": 3364} {"train_loss": -6.619419574737549, "global_step": 141310, "epoch": 3364} {"train_loss": -6.641327857971191, "global_step": 141311, "epoch": 3364} {"train_loss": -6.735286235809326, "global_step": 141312, "epoch": 3364} {"train_loss": -6.694661617279053, "global_step": 141313, "epoch": 3364} {"train_loss": -6.673532009124756, "global_step": 141314, "epoch": 3364} {"train_loss": -6.719189643859863, "global_step": 141315, "epoch": 3364} {"train_loss": -6.674374103546143, "global_step": 141316, "epoch": 3364} {"train_loss": -6.727151393890381, "global_step": 141317, "epoch": 3364} {"train_loss": -6.638150215148926, "global_step": 141318, "epoch": 3364} {"train_loss": -6.669856071472168, "global_step": 141319, "epoch": 3364} {"train_loss": -6.662962913513184, "global_step": 141320, "epoch": 3364} {"train_loss": -6.6620259284973145, "global_step": 141321, "epoch": 3364} {"train_loss": -6.646111011505127, "global_step": 141322, "epoch": 3364} {"train_loss": -6.5885772705078125, "global_step": 141323, "epoch": 3364} {"train_loss": -6.651790142059326, "global_step": 141324, "epoch": 3364} {"train_loss": -6.631700038909912, "global_step": 141325, "epoch": 3364} {"train_loss": -6.707806587219238, "global_step": 141326, "epoch": 3364} {"train_loss": -6.8219099044799805, "global_step": 141327, "epoch": 3364} {"train_loss": -6.522895336151123, "global_step": 141328, "epoch": 3364} {"train_loss": -6.6794370128994895, "global_step": 141329, "epoch": 3364, "val_loss": 68280.484375} {"train_loss": -6.727187156677246, "global_step": 141330, "epoch": 3365} {"train_loss": -6.670680522918701, "global_step": 141331, "epoch": 3365} {"train_loss": -6.6285834312438965, "global_step": 141332, "epoch": 3365} {"train_loss": -6.6620988845825195, "global_step": 141333, "epoch": 3365} {"train_loss": -6.749560356140137, "global_step": 141334, "epoch": 3365} {"train_loss": -6.776092529296875, "global_step": 141335, "epoch": 3365} {"train_loss": -6.750479698181152, "global_step": 141336, "epoch": 3365} {"train_loss": -6.69932746887207, "global_step": 141337, "epoch": 3365} {"train_loss": -6.796024322509766, "global_step": 141338, "epoch": 3365} {"train_loss": -6.828721046447754, "global_step": 141339, "epoch": 3365} {"train_loss": -6.824932098388672, "global_step": 141340, "epoch": 3365} {"train_loss": -6.840917110443115, "global_step": 141341, "epoch": 3365} {"train_loss": -6.7534637451171875, "global_step": 141342, "epoch": 3365} {"train_loss": -6.710643291473389, "global_step": 141343, "epoch": 3365} {"train_loss": -6.802691459655762, "global_step": 141344, "epoch": 3365} {"train_loss": -6.776204586029053, "global_step": 141345, "epoch": 3365} {"train_loss": -6.6765336990356445, "global_step": 141346, "epoch": 3365} {"train_loss": -6.832642555236816, "global_step": 141347, "epoch": 3365} {"train_loss": -6.79335355758667, "global_step": 141348, "epoch": 3365} {"train_loss": -6.828397274017334, "global_step": 141349, "epoch": 3365} {"train_loss": -6.822540283203125, "global_step": 141350, "epoch": 3365} {"train_loss": -6.756994247436523, "global_step": 141351, "epoch": 3365} {"train_loss": -6.8151164054870605, "global_step": 141352, "epoch": 3365} {"train_loss": -6.690513610839844, "global_step": 141353, "epoch": 3365} {"train_loss": -6.6701436042785645, "global_step": 141354, "epoch": 3365} {"train_loss": -6.776407241821289, "global_step": 141355, "epoch": 3365} {"train_loss": -6.826075553894043, "global_step": 141356, "epoch": 3365} {"train_loss": -6.753656387329102, "global_step": 141357, "epoch": 3365} {"train_loss": -6.707538604736328, "global_step": 141358, "epoch": 3365} {"train_loss": -6.749810218811035, "global_step": 141359, "epoch": 3365} {"train_loss": -6.713149070739746, "global_step": 141360, "epoch": 3365} {"train_loss": -6.779871940612793, "global_step": 141361, "epoch": 3365} {"train_loss": -6.895969390869141, "global_step": 141362, "epoch": 3365} {"train_loss": -6.741168975830078, "global_step": 141363, "epoch": 3365} {"train_loss": -6.756281852722168, "global_step": 141364, "epoch": 3365} {"train_loss": -6.558561325073242, "global_step": 141365, "epoch": 3365} {"train_loss": -6.564852237701416, "global_step": 141366, "epoch": 3365} {"train_loss": -6.76326847076416, "global_step": 141367, "epoch": 3365} {"train_loss": -6.750853061676025, "global_step": 141368, "epoch": 3365} {"train_loss": -6.652978897094727, "global_step": 141369, "epoch": 3365} {"train_loss": -6.80833101272583, "global_step": 141370, "epoch": 3365} {"train_loss": -6.747443233217512, "global_step": 141371, "epoch": 3365, "val_loss": 68308.2109375} {"train_loss": -6.7776031494140625, "global_step": 141372, "epoch": 3366} {"train_loss": -6.735997676849365, "global_step": 141373, "epoch": 3366} {"train_loss": -6.800939559936523, "global_step": 141374, "epoch": 3366} {"train_loss": -6.805817604064941, "global_step": 141375, "epoch": 3366} {"train_loss": -6.704257965087891, "global_step": 141376, "epoch": 3366} {"train_loss": -6.806999206542969, "global_step": 141377, "epoch": 3366} {"train_loss": -6.77967643737793, "global_step": 141378, "epoch": 3366} {"train_loss": -6.772466659545898, "global_step": 141379, "epoch": 3366} {"train_loss": -6.734523773193359, "global_step": 141380, "epoch": 3366} {"train_loss": -6.813765525817871, "global_step": 141381, "epoch": 3366} {"train_loss": -6.707978248596191, "global_step": 141382, "epoch": 3366} {"train_loss": -6.830190658569336, "global_step": 141383, "epoch": 3366} {"train_loss": -6.739448070526123, "global_step": 141384, "epoch": 3366} {"train_loss": -6.731003284454346, "global_step": 141385, "epoch": 3366} {"train_loss": -6.868671894073486, "global_step": 141386, "epoch": 3366} {"train_loss": -6.736419677734375, "global_step": 141387, "epoch": 3366} {"train_loss": -6.780206680297852, "global_step": 141388, "epoch": 3366} {"train_loss": -6.771385669708252, "global_step": 141389, "epoch": 3366} {"train_loss": -6.783071041107178, "global_step": 141390, "epoch": 3366} {"train_loss": -6.664228439331055, "global_step": 141391, "epoch": 3366} {"train_loss": -6.780511856079102, "global_step": 141392, "epoch": 3366} {"train_loss": -6.7456746101379395, "global_step": 141393, "epoch": 3366} {"train_loss": -6.727628231048584, "global_step": 141394, "epoch": 3366} {"train_loss": -6.744841575622559, "global_step": 141395, "epoch": 3366} {"train_loss": -6.796067714691162, "global_step": 141396, "epoch": 3366} {"train_loss": -6.740206718444824, "global_step": 141397, "epoch": 3366} {"train_loss": -6.835142135620117, "global_step": 141398, "epoch": 3366} {"train_loss": -6.780797004699707, "global_step": 141399, "epoch": 3366} {"train_loss": -6.845541954040527, "global_step": 141400, "epoch": 3366} {"train_loss": -6.849320411682129, "global_step": 141401, "epoch": 3366} {"train_loss": -6.754234313964844, "global_step": 141402, "epoch": 3366} {"train_loss": -6.781574726104736, "global_step": 141403, "epoch": 3366} {"train_loss": -6.993506908416748, "global_step": 141404, "epoch": 3366} {"train_loss": -6.744974136352539, "global_step": 141405, "epoch": 3366} {"train_loss": -6.762124538421631, "global_step": 141406, "epoch": 3366} {"train_loss": -6.908550262451172, "global_step": 141407, "epoch": 3366} {"train_loss": -6.75702428817749, "global_step": 141408, "epoch": 3366} {"train_loss": -6.7483978271484375, "global_step": 141409, "epoch": 3366} {"train_loss": -6.854580879211426, "global_step": 141410, "epoch": 3366} {"train_loss": -6.760998725891113, "global_step": 141411, "epoch": 3366} {"train_loss": -6.857105255126953, "global_step": 141412, "epoch": 3366} {"train_loss": -6.783599353971935, "global_step": 141413, "epoch": 3366, "val_loss": 68361.1328125} {"train_loss": -6.7426252365112305, "global_step": 141414, "epoch": 3367} {"train_loss": -6.810009002685547, "global_step": 141415, "epoch": 3367} {"train_loss": -6.839168548583984, "global_step": 141416, "epoch": 3367} {"train_loss": -6.795555114746094, "global_step": 141417, "epoch": 3367} {"train_loss": -6.908560752868652, "global_step": 141418, "epoch": 3367} {"train_loss": -6.749852180480957, "global_step": 141419, "epoch": 3367} {"train_loss": -6.891477584838867, "global_step": 141420, "epoch": 3367} {"train_loss": -6.859043121337891, "global_step": 141421, "epoch": 3367} {"train_loss": -6.764410495758057, "global_step": 141422, "epoch": 3367} {"train_loss": -6.751040935516357, "global_step": 141423, "epoch": 3367} {"train_loss": -6.883394718170166, "global_step": 141424, "epoch": 3367} {"train_loss": -6.629268646240234, "global_step": 141425, "epoch": 3367} {"train_loss": -6.8749799728393555, "global_step": 141426, "epoch": 3367} {"train_loss": -6.803313255310059, "global_step": 141427, "epoch": 3367} {"train_loss": -6.641748905181885, "global_step": 141428, "epoch": 3367} {"train_loss": -6.769040107727051, "global_step": 141429, "epoch": 3367} {"train_loss": -6.714215278625488, "global_step": 141430, "epoch": 3367} {"train_loss": -6.854759216308594, "global_step": 141431, "epoch": 3367} {"train_loss": -6.658844470977783, "global_step": 141432, "epoch": 3367} {"train_loss": -6.753382682800293, "global_step": 141433, "epoch": 3367} {"train_loss": -6.807861804962158, "global_step": 141434, "epoch": 3367} {"train_loss": -6.689871311187744, "global_step": 141435, "epoch": 3367} {"train_loss": -6.813358306884766, "global_step": 141436, "epoch": 3367} {"train_loss": -6.741644859313965, "global_step": 141437, "epoch": 3367} {"train_loss": -6.7643537521362305, "global_step": 141438, "epoch": 3367} {"train_loss": -6.737430572509766, "global_step": 141439, "epoch": 3367} {"train_loss": -6.797192573547363, "global_step": 141440, "epoch": 3367} {"train_loss": -6.842794418334961, "global_step": 141441, "epoch": 3367} {"train_loss": -6.804080009460449, "global_step": 141442, "epoch": 3367} {"train_loss": -6.690839767456055, "global_step": 141443, "epoch": 3367} {"train_loss": -6.773210048675537, "global_step": 141444, "epoch": 3367} {"train_loss": -6.703400135040283, "global_step": 141445, "epoch": 3367} {"train_loss": -6.728209495544434, "global_step": 141446, "epoch": 3367} {"train_loss": -6.709908485412598, "global_step": 141447, "epoch": 3367} {"train_loss": -6.789813995361328, "global_step": 141448, "epoch": 3367} {"train_loss": -6.706354141235352, "global_step": 141449, "epoch": 3367} {"train_loss": -6.640514373779297, "global_step": 141450, "epoch": 3367} {"train_loss": -6.670957565307617, "global_step": 141451, "epoch": 3367} {"train_loss": -6.782352924346924, "global_step": 141452, "epoch": 3367} {"train_loss": -6.665549278259277, "global_step": 141453, "epoch": 3367} {"train_loss": -6.722185134887695, "global_step": 141454, "epoch": 3367} {"train_loss": -6.7615423656645275, "global_step": 141455, "epoch": 3367, "val_loss": 68322.2578125} {"train_loss": -6.816926002502441, "global_step": 141456, "epoch": 3368} {"train_loss": -6.744472026824951, "global_step": 141457, "epoch": 3368} {"train_loss": -6.591513633728027, "global_step": 141458, "epoch": 3368} {"train_loss": -6.635607719421387, "global_step": 141459, "epoch": 3368} {"train_loss": -6.730382442474365, "global_step": 141460, "epoch": 3368} {"train_loss": -6.753240585327148, "global_step": 141461, "epoch": 3368} {"train_loss": -6.58016300201416, "global_step": 141462, "epoch": 3368} {"train_loss": -6.738549709320068, "global_step": 141463, "epoch": 3368} {"train_loss": -6.707836151123047, "global_step": 141464, "epoch": 3368} {"train_loss": -6.589909553527832, "global_step": 141465, "epoch": 3368} {"train_loss": -6.638679504394531, "global_step": 141466, "epoch": 3368} {"train_loss": -6.6698479652404785, "global_step": 141467, "epoch": 3368} {"train_loss": -6.653563976287842, "global_step": 141468, "epoch": 3368} {"train_loss": -6.556684494018555, "global_step": 141469, "epoch": 3368} {"train_loss": -6.677003860473633, "global_step": 141470, "epoch": 3368} {"train_loss": -6.603951454162598, "global_step": 141471, "epoch": 3368} {"train_loss": -6.75822114944458, "global_step": 141472, "epoch": 3368} {"train_loss": -6.73127555847168, "global_step": 141473, "epoch": 3368} {"train_loss": -6.70411491394043, "global_step": 141474, "epoch": 3368} {"train_loss": -6.782704830169678, "global_step": 141475, "epoch": 3368} {"train_loss": -6.759215354919434, "global_step": 141476, "epoch": 3368} {"train_loss": -6.688249588012695, "global_step": 141477, "epoch": 3368} {"train_loss": -6.651268005371094, "global_step": 141478, "epoch": 3368} {"train_loss": -6.627009391784668, "global_step": 141479, "epoch": 3368} {"train_loss": -6.579492092132568, "global_step": 141480, "epoch": 3368} {"train_loss": -6.676828861236572, "global_step": 141481, "epoch": 3368} {"train_loss": -6.6825666427612305, "global_step": 141482, "epoch": 3368} {"train_loss": -6.660986423492432, "global_step": 141483, "epoch": 3368} {"train_loss": -6.689826965332031, "global_step": 141484, "epoch": 3368} {"train_loss": -6.720945835113525, "global_step": 141485, "epoch": 3368} {"train_loss": -6.791566848754883, "global_step": 141486, "epoch": 3368} {"train_loss": -6.742221832275391, "global_step": 141487, "epoch": 3368} {"train_loss": -6.6210856437683105, "global_step": 141488, "epoch": 3368} {"train_loss": -6.73032283782959, "global_step": 141489, "epoch": 3368} {"train_loss": -6.704724311828613, "global_step": 141490, "epoch": 3368} {"train_loss": -6.659307479858398, "global_step": 141491, "epoch": 3368} {"train_loss": -6.751237392425537, "global_step": 141492, "epoch": 3368} {"train_loss": -6.658906936645508, "global_step": 141493, "epoch": 3368} {"train_loss": -6.743636131286621, "global_step": 141494, "epoch": 3368} {"train_loss": -6.711632251739502, "global_step": 141495, "epoch": 3368} {"train_loss": -6.698655128479004, "global_step": 141496, "epoch": 3368} {"train_loss": -6.689225230898176, "global_step": 141497, "epoch": 3368, "val_loss": 68114.1640625} {"train_loss": -6.8115105628967285, "global_step": 141498, "epoch": 3369} {"train_loss": -6.790314674377441, "global_step": 141499, "epoch": 3369} {"train_loss": -6.692853927612305, "global_step": 141500, "epoch": 3369} {"train_loss": -6.668515205383301, "global_step": 141501, "epoch": 3369} {"train_loss": -6.892564296722412, "global_step": 141502, "epoch": 3369} {"train_loss": -6.613804817199707, "global_step": 141503, "epoch": 3369} {"train_loss": -6.744930267333984, "global_step": 141504, "epoch": 3369} {"train_loss": -6.6636528968811035, "global_step": 141505, "epoch": 3369} {"train_loss": -6.76939582824707, "global_step": 141506, "epoch": 3369} {"train_loss": -6.6928629875183105, "global_step": 141507, "epoch": 3369} {"train_loss": -6.790063858032227, "global_step": 141508, "epoch": 3369} {"train_loss": -6.793954372406006, "global_step": 141509, "epoch": 3369} {"train_loss": -6.763051986694336, "global_step": 141510, "epoch": 3369} {"train_loss": -6.775574207305908, "global_step": 141511, "epoch": 3369} {"train_loss": -6.743228435516357, "global_step": 141512, "epoch": 3369} {"train_loss": -6.791880130767822, "global_step": 141513, "epoch": 3369} {"train_loss": -6.706411361694336, "global_step": 141514, "epoch": 3369} {"train_loss": -6.673023223876953, "global_step": 141515, "epoch": 3369} {"train_loss": -6.71989631652832, "global_step": 141516, "epoch": 3369} {"train_loss": -6.75569486618042, "global_step": 141517, "epoch": 3369} {"train_loss": -6.763808250427246, "global_step": 141518, "epoch": 3369} {"train_loss": -6.6327595710754395, "global_step": 141519, "epoch": 3369} {"train_loss": -6.807987213134766, "global_step": 141520, "epoch": 3369} {"train_loss": -6.735207557678223, "global_step": 141521, "epoch": 3369} {"train_loss": -6.745440483093262, "global_step": 141522, "epoch": 3369} {"train_loss": -6.755068778991699, "global_step": 141523, "epoch": 3369} {"train_loss": -6.735264778137207, "global_step": 141524, "epoch": 3369} {"train_loss": -6.710967063903809, "global_step": 141525, "epoch": 3369} {"train_loss": -6.701145172119141, "global_step": 141526, "epoch": 3369} {"train_loss": -6.732439041137695, "global_step": 141527, "epoch": 3369} {"train_loss": -6.794680595397949, "global_step": 141528, "epoch": 3369} {"train_loss": -6.603261947631836, "global_step": 141529, "epoch": 3369} {"train_loss": -6.829286575317383, "global_step": 141530, "epoch": 3369} {"train_loss": -6.77499532699585, "global_step": 141531, "epoch": 3369} {"train_loss": -6.823063850402832, "global_step": 141532, "epoch": 3369} {"train_loss": -6.706766605377197, "global_step": 141533, "epoch": 3369} {"train_loss": -6.666382789611816, "global_step": 141534, "epoch": 3369} {"train_loss": -6.733918190002441, "global_step": 141535, "epoch": 3369} {"train_loss": -6.81821870803833, "global_step": 141536, "epoch": 3369} {"train_loss": -6.735020637512207, "global_step": 141537, "epoch": 3369} {"train_loss": -6.682577610015869, "global_step": 141538, "epoch": 3369} {"train_loss": -6.74049957593282, "global_step": 141539, "epoch": 3369, "val_loss": 68325.796875} {"train_loss": -6.6824564933776855, "global_step": 141540, "epoch": 3370} {"train_loss": -6.856066703796387, "global_step": 141541, "epoch": 3370} {"train_loss": -6.745749473571777, "global_step": 141542, "epoch": 3370} {"train_loss": -6.805608749389648, "global_step": 141543, "epoch": 3370} {"train_loss": -6.708413124084473, "global_step": 141544, "epoch": 3370} {"train_loss": -6.782214164733887, "global_step": 141545, "epoch": 3370} {"train_loss": -6.705732345581055, "global_step": 141546, "epoch": 3370} {"train_loss": -6.72866678237915, "global_step": 141547, "epoch": 3370} {"train_loss": -6.7148542404174805, "global_step": 141548, "epoch": 3370} {"train_loss": -6.74586296081543, "global_step": 141549, "epoch": 3370} {"train_loss": -6.690879821777344, "global_step": 141550, "epoch": 3370} {"train_loss": -6.672486305236816, "global_step": 141551, "epoch": 3370} {"train_loss": -6.587497711181641, "global_step": 141552, "epoch": 3370} {"train_loss": -6.791501998901367, "global_step": 141553, "epoch": 3370} {"train_loss": -6.711758613586426, "global_step": 141554, "epoch": 3370} {"train_loss": -6.723567962646484, "global_step": 141555, "epoch": 3370} {"train_loss": -6.725586414337158, "global_step": 141556, "epoch": 3370} {"train_loss": -6.627989292144775, "global_step": 141557, "epoch": 3370} {"train_loss": -6.774575233459473, "global_step": 141558, "epoch": 3370} {"train_loss": -6.745630264282227, "global_step": 141559, "epoch": 3370} {"train_loss": -6.740002632141113, "global_step": 141560, "epoch": 3370} {"train_loss": -6.718535423278809, "global_step": 141561, "epoch": 3370} {"train_loss": -6.741236209869385, "global_step": 141562, "epoch": 3370} {"train_loss": -6.742595672607422, "global_step": 141563, "epoch": 3370} {"train_loss": -6.70375394821167, "global_step": 141564, "epoch": 3370} {"train_loss": -6.683223724365234, "global_step": 141565, "epoch": 3370} {"train_loss": -6.904570579528809, "global_step": 141566, "epoch": 3370} {"train_loss": -6.707674980163574, "global_step": 141567, "epoch": 3370} {"train_loss": -6.709871768951416, "global_step": 141568, "epoch": 3370} {"train_loss": -6.768975734710693, "global_step": 141569, "epoch": 3370} {"train_loss": -6.754827976226807, "global_step": 141570, "epoch": 3370} {"train_loss": -6.7619099617004395, "global_step": 141571, "epoch": 3370} {"train_loss": -6.597506046295166, "global_step": 141572, "epoch": 3370} {"train_loss": -6.800831317901611, "global_step": 141573, "epoch": 3370} {"train_loss": -6.782844543457031, "global_step": 141574, "epoch": 3370} {"train_loss": -6.740884780883789, "global_step": 141575, "epoch": 3370} {"train_loss": -6.743391990661621, "global_step": 141576, "epoch": 3370} {"train_loss": -6.684159278869629, "global_step": 141577, "epoch": 3370} {"train_loss": -6.788183212280273, "global_step": 141578, "epoch": 3370} {"train_loss": -6.740877628326416, "global_step": 141579, "epoch": 3370} {"train_loss": -6.792162895202637, "global_step": 141580, "epoch": 3370} {"train_loss": -6.732460600989206, "global_step": 141581, "epoch": 3370, "val_loss": 68473.609375} {"train_loss": -6.75773286819458, "global_step": 141582, "epoch": 3371} {"train_loss": -6.721916198730469, "global_step": 141583, "epoch": 3371} {"train_loss": -6.8403191566467285, "global_step": 141584, "epoch": 3371} {"train_loss": -6.5695037841796875, "global_step": 141585, "epoch": 3371} {"train_loss": -6.794390678405762, "global_step": 141586, "epoch": 3371} {"train_loss": -6.632490158081055, "global_step": 141587, "epoch": 3371} {"train_loss": -6.680852890014648, "global_step": 141588, "epoch": 3371} {"train_loss": -6.779061317443848, "global_step": 141589, "epoch": 3371} {"train_loss": -6.608911514282227, "global_step": 141590, "epoch": 3371} {"train_loss": -6.646892070770264, "global_step": 141591, "epoch": 3371} {"train_loss": -6.759385585784912, "global_step": 141592, "epoch": 3371} {"train_loss": -6.906489372253418, "global_step": 141593, "epoch": 3371} {"train_loss": -6.82429313659668, "global_step": 141594, "epoch": 3371} {"train_loss": -6.6363654136657715, "global_step": 141595, "epoch": 3371} {"train_loss": -6.680939674377441, "global_step": 141596, "epoch": 3371} {"train_loss": -6.587794303894043, "global_step": 141597, "epoch": 3371} {"train_loss": -6.517838478088379, "global_step": 141598, "epoch": 3371} {"train_loss": -6.712360382080078, "global_step": 141599, "epoch": 3371} {"train_loss": -6.698674201965332, "global_step": 141600, "epoch": 3371} {"train_loss": -6.661256790161133, "global_step": 141601, "epoch": 3371} {"train_loss": -6.563949108123779, "global_step": 141602, "epoch": 3371} {"train_loss": -6.699003219604492, "global_step": 141603, "epoch": 3371} {"train_loss": -6.686075210571289, "global_step": 141604, "epoch": 3371} {"train_loss": -6.625596523284912, "global_step": 141605, "epoch": 3371} {"train_loss": -6.5177507400512695, "global_step": 141606, "epoch": 3371} {"train_loss": -6.597889423370361, "global_step": 141607, "epoch": 3371} {"train_loss": -6.520408630371094, "global_step": 141608, "epoch": 3371} {"train_loss": -6.494053840637207, "global_step": 141609, "epoch": 3371} {"train_loss": -6.5299506187438965, "global_step": 141610, "epoch": 3371} {"train_loss": -6.56735897064209, "global_step": 141611, "epoch": 3371} {"train_loss": -6.556753158569336, "global_step": 141612, "epoch": 3371} {"train_loss": -6.588086128234863, "global_step": 141613, "epoch": 3371} {"train_loss": -6.412811279296875, "global_step": 141614, "epoch": 3371} {"train_loss": -6.632146835327148, "global_step": 141615, "epoch": 3371} {"train_loss": -6.563535213470459, "global_step": 141616, "epoch": 3371} {"train_loss": -6.717768669128418, "global_step": 141617, "epoch": 3371} {"train_loss": -6.616253852844238, "global_step": 141618, "epoch": 3371} {"train_loss": -6.520062446594238, "global_step": 141619, "epoch": 3371} {"train_loss": -6.601886749267578, "global_step": 141620, "epoch": 3371} {"train_loss": -6.567648887634277, "global_step": 141621, "epoch": 3371} {"train_loss": -6.431192398071289, "global_step": 141622, "epoch": 3371} {"train_loss": -6.6325809842064265, "global_step": 141623, "epoch": 3371, "val_loss": 68436.21875} {"train_loss": -6.699348449707031, "global_step": 141624, "epoch": 3372} {"train_loss": -6.522106647491455, "global_step": 141625, "epoch": 3372} {"train_loss": -6.68775749206543, "global_step": 141626, "epoch": 3372} {"train_loss": -6.533140182495117, "global_step": 141627, "epoch": 3372} {"train_loss": -6.50809907913208, "global_step": 141628, "epoch": 3372} {"train_loss": -6.577388763427734, "global_step": 141629, "epoch": 3372} {"train_loss": -6.731810569763184, "global_step": 141630, "epoch": 3372} {"train_loss": -6.661865234375, "global_step": 141631, "epoch": 3372} {"train_loss": -6.634608745574951, "global_step": 141632, "epoch": 3372} {"train_loss": -6.65583610534668, "global_step": 141633, "epoch": 3372} {"train_loss": -6.536994934082031, "global_step": 141634, "epoch": 3372} {"train_loss": -6.667871475219727, "global_step": 141635, "epoch": 3372} {"train_loss": -6.6962666511535645, "global_step": 141636, "epoch": 3372} {"train_loss": -6.707272052764893, "global_step": 141637, "epoch": 3372} {"train_loss": -6.758493900299072, "global_step": 141638, "epoch": 3372} {"train_loss": -6.7567338943481445, "global_step": 141639, "epoch": 3372} {"train_loss": -6.6292901039123535, "global_step": 141640, "epoch": 3372} {"train_loss": -6.639901161193848, "global_step": 141641, "epoch": 3372} {"train_loss": -6.717278957366943, "global_step": 141642, "epoch": 3372} {"train_loss": -6.787073612213135, "global_step": 141643, "epoch": 3372} {"train_loss": -6.750594139099121, "global_step": 141644, "epoch": 3372} {"train_loss": -6.737467288970947, "global_step": 141645, "epoch": 3372} {"train_loss": -6.827569007873535, "global_step": 141646, "epoch": 3372} {"train_loss": -6.730697154998779, "global_step": 141647, "epoch": 3372} {"train_loss": -6.677469253540039, "global_step": 141648, "epoch": 3372} {"train_loss": -6.741477012634277, "global_step": 141649, "epoch": 3372} {"train_loss": -6.694635391235352, "global_step": 141650, "epoch": 3372} {"train_loss": -6.653173446655273, "global_step": 141651, "epoch": 3372} {"train_loss": -6.787350654602051, "global_step": 141652, "epoch": 3372} {"train_loss": -6.680973052978516, "global_step": 141653, "epoch": 3372} {"train_loss": -6.675273895263672, "global_step": 141654, "epoch": 3372} {"train_loss": -6.753544807434082, "global_step": 141655, "epoch": 3372} {"train_loss": -6.757503509521484, "global_step": 141656, "epoch": 3372} {"train_loss": -6.730297565460205, "global_step": 141657, "epoch": 3372} {"train_loss": -6.756936073303223, "global_step": 141658, "epoch": 3372} {"train_loss": -6.648629665374756, "global_step": 141659, "epoch": 3372} {"train_loss": -6.694928169250488, "global_step": 141660, "epoch": 3372} {"train_loss": -6.693388938903809, "global_step": 141661, "epoch": 3372} {"train_loss": -6.690788745880127, "global_step": 141662, "epoch": 3372} {"train_loss": -6.584677219390869, "global_step": 141663, "epoch": 3372} {"train_loss": -6.665225028991699, "global_step": 141664, "epoch": 3372} {"train_loss": -6.686408826283047, "global_step": 141665, "epoch": 3372, "val_loss": 68233.4140625} {"train_loss": -6.714609146118164, "global_step": 141666, "epoch": 3373} {"train_loss": -6.693244457244873, "global_step": 141667, "epoch": 3373} {"train_loss": -6.759200096130371, "global_step": 141668, "epoch": 3373} {"train_loss": -6.790920257568359, "global_step": 141669, "epoch": 3373} {"train_loss": -6.802953720092773, "global_step": 141670, "epoch": 3373} {"train_loss": -6.746068000793457, "global_step": 141671, "epoch": 3373} {"train_loss": -6.778948783874512, "global_step": 141672, "epoch": 3373} {"train_loss": -6.755795001983643, "global_step": 141673, "epoch": 3373} {"train_loss": -6.819174289703369, "global_step": 141674, "epoch": 3373} {"train_loss": -6.715397834777832, "global_step": 141675, "epoch": 3373} {"train_loss": -6.83443546295166, "global_step": 141676, "epoch": 3373} {"train_loss": -6.790574073791504, "global_step": 141677, "epoch": 3373} {"train_loss": -6.867597579956055, "global_step": 141678, "epoch": 3373} {"train_loss": -6.792074203491211, "global_step": 141679, "epoch": 3373} {"train_loss": -6.785981178283691, "global_step": 141680, "epoch": 3373} {"train_loss": -6.812466621398926, "global_step": 141681, "epoch": 3373} {"train_loss": -6.691079139709473, "global_step": 141682, "epoch": 3373} {"train_loss": -6.776215076446533, "global_step": 141683, "epoch": 3373} {"train_loss": -6.744126319885254, "global_step": 141684, "epoch": 3373} {"train_loss": -6.877865791320801, "global_step": 141685, "epoch": 3373} {"train_loss": -6.792688846588135, "global_step": 141686, "epoch": 3373} {"train_loss": -6.738880634307861, "global_step": 141687, "epoch": 3373} {"train_loss": -6.755687713623047, "global_step": 141688, "epoch": 3373} {"train_loss": -6.728346824645996, "global_step": 141689, "epoch": 3373} {"train_loss": -6.8707194328308105, "global_step": 141690, "epoch": 3373} {"train_loss": -6.846689224243164, "global_step": 141691, "epoch": 3373} {"train_loss": -6.750912666320801, "global_step": 141692, "epoch": 3373} {"train_loss": -6.748774528503418, "global_step": 141693, "epoch": 3373} {"train_loss": -6.780856132507324, "global_step": 141694, "epoch": 3373} {"train_loss": -6.804414749145508, "global_step": 141695, "epoch": 3373} {"train_loss": -6.763498783111572, "global_step": 141696, "epoch": 3373} {"train_loss": -6.778801918029785, "global_step": 141697, "epoch": 3373} {"train_loss": -6.602095127105713, "global_step": 141698, "epoch": 3373} {"train_loss": -6.819586753845215, "global_step": 141699, "epoch": 3373} {"train_loss": -6.882748126983643, "global_step": 141700, "epoch": 3373} {"train_loss": -6.630548477172852, "global_step": 141701, "epoch": 3373} {"train_loss": -6.844121932983398, "global_step": 141702, "epoch": 3373} {"train_loss": -6.700956344604492, "global_step": 141703, "epoch": 3373} {"train_loss": -6.725017547607422, "global_step": 141704, "epoch": 3373} {"train_loss": -6.816540241241455, "global_step": 141705, "epoch": 3373} {"train_loss": -6.68155574798584, "global_step": 141706, "epoch": 3373} {"train_loss": -6.768379234132313, "global_step": 141707, "epoch": 3373, "val_loss": 68193.3203125} {"train_loss": -6.664541244506836, "global_step": 141708, "epoch": 3374} {"train_loss": -6.5714874267578125, "global_step": 141709, "epoch": 3374} {"train_loss": -6.797845840454102, "global_step": 141710, "epoch": 3374} {"train_loss": -6.696629524230957, "global_step": 141711, "epoch": 3374} {"train_loss": -6.645101547241211, "global_step": 141712, "epoch": 3374} {"train_loss": -6.748288154602051, "global_step": 141713, "epoch": 3374} {"train_loss": -6.674619674682617, "global_step": 141714, "epoch": 3374} {"train_loss": -6.704400539398193, "global_step": 141715, "epoch": 3374} {"train_loss": -6.62877082824707, "global_step": 141716, "epoch": 3374} {"train_loss": -6.683487892150879, "global_step": 141717, "epoch": 3374} {"train_loss": -6.708909034729004, "global_step": 141718, "epoch": 3374} {"train_loss": -6.717236518859863, "global_step": 141719, "epoch": 3374} {"train_loss": -6.583949565887451, "global_step": 141720, "epoch": 3374} {"train_loss": -6.698731422424316, "global_step": 141721, "epoch": 3374} {"train_loss": -6.76539421081543, "global_step": 141722, "epoch": 3374} {"train_loss": -6.689111709594727, "global_step": 141723, "epoch": 3374} {"train_loss": -6.653613567352295, "global_step": 141724, "epoch": 3374} {"train_loss": -6.640682220458984, "global_step": 141725, "epoch": 3374} {"train_loss": -6.699664115905762, "global_step": 141726, "epoch": 3374} {"train_loss": -6.709105491638184, "global_step": 141727, "epoch": 3374} {"train_loss": -6.788424491882324, "global_step": 141728, "epoch": 3374} {"train_loss": -6.655643463134766, "global_step": 141729, "epoch": 3374} {"train_loss": -6.682201862335205, "global_step": 141730, "epoch": 3374} {"train_loss": -6.752875804901123, "global_step": 141731, "epoch": 3374} {"train_loss": -6.631741523742676, "global_step": 141732, "epoch": 3374} {"train_loss": -6.741631984710693, "global_step": 141733, "epoch": 3374} {"train_loss": -6.719069957733154, "global_step": 141734, "epoch": 3374} {"train_loss": -6.724855422973633, "global_step": 141735, "epoch": 3374} {"train_loss": -6.62930965423584, "global_step": 141736, "epoch": 3374} {"train_loss": -6.700237274169922, "global_step": 141737, "epoch": 3374} {"train_loss": -6.620872974395752, "global_step": 141738, "epoch": 3374} {"train_loss": -6.7148871421813965, "global_step": 141739, "epoch": 3374} {"train_loss": -6.720251083374023, "global_step": 141740, "epoch": 3374} {"train_loss": -6.697951316833496, "global_step": 141741, "epoch": 3374} {"train_loss": -6.758481979370117, "global_step": 141742, "epoch": 3374} {"train_loss": -6.578649997711182, "global_step": 141743, "epoch": 3374} {"train_loss": -6.743313312530518, "global_step": 141744, "epoch": 3374} {"train_loss": -6.685473442077637, "global_step": 141745, "epoch": 3374} {"train_loss": -6.680392265319824, "global_step": 141746, "epoch": 3374} {"train_loss": -6.6174540519714355, "global_step": 141747, "epoch": 3374} {"train_loss": -6.723410606384277, "global_step": 141748, "epoch": 3374} {"train_loss": -6.690012000855946, "global_step": 141749, "epoch": 3374, "val_loss": 68200.46875} {"train_loss": -6.750400066375732, "global_step": 141750, "epoch": 3375} {"train_loss": -6.677974224090576, "global_step": 141751, "epoch": 3375} {"train_loss": -6.672217845916748, "global_step": 141752, "epoch": 3375} {"train_loss": -6.627008438110352, "global_step": 141753, "epoch": 3375} {"train_loss": -6.767536640167236, "global_step": 141754, "epoch": 3375} {"train_loss": -6.789043426513672, "global_step": 141755, "epoch": 3375} {"train_loss": -6.711030960083008, "global_step": 141756, "epoch": 3375} {"train_loss": -6.663212776184082, "global_step": 141757, "epoch": 3375} {"train_loss": -6.777345657348633, "global_step": 141758, "epoch": 3375} {"train_loss": -6.717751502990723, "global_step": 141759, "epoch": 3375} {"train_loss": -6.75167989730835, "global_step": 141760, "epoch": 3375} {"train_loss": -6.70225715637207, "global_step": 141761, "epoch": 3375} {"train_loss": -6.708664417266846, "global_step": 141762, "epoch": 3375} {"train_loss": -6.762086868286133, "global_step": 141763, "epoch": 3375} {"train_loss": -6.605501651763916, "global_step": 141764, "epoch": 3375} {"train_loss": -6.701437473297119, "global_step": 141765, "epoch": 3375} {"train_loss": -6.674398899078369, "global_step": 141766, "epoch": 3375} {"train_loss": -6.813296318054199, "global_step": 141767, "epoch": 3375} {"train_loss": -6.646501064300537, "global_step": 141768, "epoch": 3375} {"train_loss": -6.860909938812256, "global_step": 141769, "epoch": 3375} {"train_loss": -6.790896415710449, "global_step": 141770, "epoch": 3375} {"train_loss": -6.771001815795898, "global_step": 141771, "epoch": 3375} {"train_loss": -6.771082878112793, "global_step": 141772, "epoch": 3375} {"train_loss": -6.748198509216309, "global_step": 141773, "epoch": 3375} {"train_loss": -6.859153747558594, "global_step": 141774, "epoch": 3375} {"train_loss": -6.786855220794678, "global_step": 141775, "epoch": 3375} {"train_loss": -6.823088645935059, "global_step": 141776, "epoch": 3375} {"train_loss": -6.736724376678467, "global_step": 141777, "epoch": 3375} {"train_loss": -6.662577152252197, "global_step": 141778, "epoch": 3375} {"train_loss": -6.742513179779053, "global_step": 141779, "epoch": 3375} {"train_loss": -6.770796775817871, "global_step": 141780, "epoch": 3375} {"train_loss": -6.703393459320068, "global_step": 141781, "epoch": 3375} {"train_loss": -6.762998580932617, "global_step": 141782, "epoch": 3375} {"train_loss": -6.6699018478393555, "global_step": 141783, "epoch": 3375} {"train_loss": -6.7517218589782715, "global_step": 141784, "epoch": 3375} {"train_loss": -6.767493724822998, "global_step": 141785, "epoch": 3375} {"train_loss": -6.622147560119629, "global_step": 141786, "epoch": 3375} {"train_loss": -6.693234443664551, "global_step": 141787, "epoch": 3375} {"train_loss": -6.631661891937256, "global_step": 141788, "epoch": 3375} {"train_loss": -6.842023849487305, "global_step": 141789, "epoch": 3375} {"train_loss": -6.750818252563477, "global_step": 141790, "epoch": 3375} {"train_loss": -6.732486066364107, "global_step": 141791, "epoch": 3375, "val_loss": 68398.671875} {"train_loss": -6.836824417114258, "global_step": 141792, "epoch": 3376} {"train_loss": -6.722463607788086, "global_step": 141793, "epoch": 3376} {"train_loss": -6.723295211791992, "global_step": 141794, "epoch": 3376} {"train_loss": -6.715015888214111, "global_step": 141795, "epoch": 3376} {"train_loss": -6.715602397918701, "global_step": 141796, "epoch": 3376} {"train_loss": -6.764203071594238, "global_step": 141797, "epoch": 3376} {"train_loss": -6.700198650360107, "global_step": 141798, "epoch": 3376} {"train_loss": -6.671200752258301, "global_step": 141799, "epoch": 3376} {"train_loss": -6.771035194396973, "global_step": 141800, "epoch": 3376} {"train_loss": -6.636280536651611, "global_step": 141801, "epoch": 3376} {"train_loss": -6.713131427764893, "global_step": 141802, "epoch": 3376} {"train_loss": -6.633584499359131, "global_step": 141803, "epoch": 3376} {"train_loss": -6.562507629394531, "global_step": 141804, "epoch": 3376} {"train_loss": -6.7202606201171875, "global_step": 141805, "epoch": 3376} {"train_loss": -6.525193214416504, "global_step": 141806, "epoch": 3376} {"train_loss": -6.748777866363525, "global_step": 141807, "epoch": 3376} {"train_loss": -6.773241996765137, "global_step": 141808, "epoch": 3376} {"train_loss": -6.664686679840088, "global_step": 141809, "epoch": 3376} {"train_loss": -6.716987133026123, "global_step": 141810, "epoch": 3376} {"train_loss": -6.675544738769531, "global_step": 141811, "epoch": 3376} {"train_loss": -6.886042594909668, "global_step": 141812, "epoch": 3376} {"train_loss": -6.65177059173584, "global_step": 141813, "epoch": 3376} {"train_loss": -6.823559761047363, "global_step": 141814, "epoch": 3376} {"train_loss": -6.768857002258301, "global_step": 141815, "epoch": 3376} {"train_loss": -6.728376388549805, "global_step": 141816, "epoch": 3376} {"train_loss": -6.745077133178711, "global_step": 141817, "epoch": 3376} {"train_loss": -6.692685127258301, "global_step": 141818, "epoch": 3376} {"train_loss": -6.611742973327637, "global_step": 141819, "epoch": 3376} {"train_loss": -6.680835723876953, "global_step": 141820, "epoch": 3376} {"train_loss": -6.730067729949951, "global_step": 141821, "epoch": 3376} {"train_loss": -6.7019805908203125, "global_step": 141822, "epoch": 3376} {"train_loss": -6.708110809326172, "global_step": 141823, "epoch": 3376} {"train_loss": -6.770522117614746, "global_step": 141824, "epoch": 3376} {"train_loss": -6.718324661254883, "global_step": 141825, "epoch": 3376} {"train_loss": -6.660379409790039, "global_step": 141826, "epoch": 3376} {"train_loss": -6.716838836669922, "global_step": 141827, "epoch": 3376} {"train_loss": -6.70960807800293, "global_step": 141828, "epoch": 3376} {"train_loss": -6.733279228210449, "global_step": 141829, "epoch": 3376} {"train_loss": -6.718032360076904, "global_step": 141830, "epoch": 3376} {"train_loss": -6.7348103523254395, "global_step": 141831, "epoch": 3376} {"train_loss": -6.6551690101623535, "global_step": 141832, "epoch": 3376} {"train_loss": -6.7114386558532715, "global_step": 141833, "epoch": 3376, "val_loss": 68424.4921875} {"train_loss": -6.685656547546387, "global_step": 141834, "epoch": 3377} {"train_loss": -6.7702484130859375, "global_step": 141835, "epoch": 3377} {"train_loss": -6.7436699867248535, "global_step": 141836, "epoch": 3377} {"train_loss": -6.702438831329346, "global_step": 141837, "epoch": 3377} {"train_loss": -6.832466125488281, "global_step": 141838, "epoch": 3377} {"train_loss": -6.736146926879883, "global_step": 141839, "epoch": 3377} {"train_loss": -6.889129638671875, "global_step": 141840, "epoch": 3377} {"train_loss": -6.748266696929932, "global_step": 141841, "epoch": 3377} {"train_loss": -6.794343948364258, "global_step": 141842, "epoch": 3377} {"train_loss": -6.826250076293945, "global_step": 141843, "epoch": 3377} {"train_loss": -6.820738792419434, "global_step": 141844, "epoch": 3377} {"train_loss": -6.79727029800415, "global_step": 141845, "epoch": 3377} {"train_loss": -6.801896095275879, "global_step": 141846, "epoch": 3377} {"train_loss": -6.774582862854004, "global_step": 141847, "epoch": 3377} {"train_loss": -6.812295913696289, "global_step": 141848, "epoch": 3377} {"train_loss": -6.713446140289307, "global_step": 141849, "epoch": 3377} {"train_loss": -6.678653240203857, "global_step": 141850, "epoch": 3377} {"train_loss": -6.651134967803955, "global_step": 141851, "epoch": 3377} {"train_loss": -6.770124912261963, "global_step": 141852, "epoch": 3377} {"train_loss": -6.669492721557617, "global_step": 141853, "epoch": 3377} {"train_loss": -6.857476234436035, "global_step": 141854, "epoch": 3377} {"train_loss": -6.677720069885254, "global_step": 141855, "epoch": 3377} {"train_loss": -6.678778648376465, "global_step": 141856, "epoch": 3377} {"train_loss": -6.759490966796875, "global_step": 141857, "epoch": 3377} {"train_loss": -6.672292709350586, "global_step": 141858, "epoch": 3377} {"train_loss": -6.679933071136475, "global_step": 141859, "epoch": 3377} {"train_loss": -6.820713996887207, "global_step": 141860, "epoch": 3377} {"train_loss": -6.650726318359375, "global_step": 141861, "epoch": 3377} {"train_loss": -6.785057067871094, "global_step": 141862, "epoch": 3377} {"train_loss": -6.816683769226074, "global_step": 141863, "epoch": 3377} {"train_loss": -6.720703125, "global_step": 141864, "epoch": 3377} {"train_loss": -6.800992965698242, "global_step": 141865, "epoch": 3377} {"train_loss": -6.782340049743652, "global_step": 141866, "epoch": 3377} {"train_loss": -6.71227502822876, "global_step": 141867, "epoch": 3377} {"train_loss": -6.821799278259277, "global_step": 141868, "epoch": 3377} {"train_loss": -6.793649673461914, "global_step": 141869, "epoch": 3377} {"train_loss": -6.762997627258301, "global_step": 141870, "epoch": 3377} {"train_loss": -6.841965675354004, "global_step": 141871, "epoch": 3377} {"train_loss": -6.6431708335876465, "global_step": 141872, "epoch": 3377} {"train_loss": -6.679123878479004, "global_step": 141873, "epoch": 3377} {"train_loss": -6.777336120605469, "global_step": 141874, "epoch": 3377} {"train_loss": -6.754123971575782, "global_step": 141875, "epoch": 3377, "val_loss": 68457.5390625} {"train_loss": -6.794273853302002, "global_step": 141876, "epoch": 3378} {"train_loss": -6.732460021972656, "global_step": 141877, "epoch": 3378} {"train_loss": -6.738602161407471, "global_step": 141878, "epoch": 3378} {"train_loss": -6.78237247467041, "global_step": 141879, "epoch": 3378} {"train_loss": -6.802459716796875, "global_step": 141880, "epoch": 3378} {"train_loss": -6.782320022583008, "global_step": 141881, "epoch": 3378} {"train_loss": -6.816339492797852, "global_step": 141882, "epoch": 3378} {"train_loss": -6.7385735511779785, "global_step": 141883, "epoch": 3378} {"train_loss": -6.724438667297363, "global_step": 141884, "epoch": 3378} {"train_loss": -6.732368469238281, "global_step": 141885, "epoch": 3378} {"train_loss": -6.775027275085449, "global_step": 141886, "epoch": 3378} {"train_loss": -6.83720588684082, "global_step": 141887, "epoch": 3378} {"train_loss": -6.778717994689941, "global_step": 141888, "epoch": 3378} {"train_loss": -6.77437162399292, "global_step": 141889, "epoch": 3378} {"train_loss": -6.71345329284668, "global_step": 141890, "epoch": 3378} {"train_loss": -6.78308629989624, "global_step": 141891, "epoch": 3378} {"train_loss": -6.7722625732421875, "global_step": 141892, "epoch": 3378} {"train_loss": -6.778395652770996, "global_step": 141893, "epoch": 3378} {"train_loss": -6.844736099243164, "global_step": 141894, "epoch": 3378} {"train_loss": -6.718372821807861, "global_step": 141895, "epoch": 3378} {"train_loss": -6.759592533111572, "global_step": 141896, "epoch": 3378} {"train_loss": -6.76582670211792, "global_step": 141897, "epoch": 3378} {"train_loss": -6.6571044921875, "global_step": 141898, "epoch": 3378} {"train_loss": -6.835371494293213, "global_step": 141899, "epoch": 3378} {"train_loss": -6.6636962890625, "global_step": 141900, "epoch": 3378} {"train_loss": -6.7494964599609375, "global_step": 141901, "epoch": 3378} {"train_loss": -6.7265543937683105, "global_step": 141902, "epoch": 3378} {"train_loss": -6.872829437255859, "global_step": 141903, "epoch": 3378} {"train_loss": -6.7355217933654785, "global_step": 141904, "epoch": 3378} {"train_loss": -6.801031112670898, "global_step": 141905, "epoch": 3378} {"train_loss": -6.680787563323975, "global_step": 141906, "epoch": 3378} {"train_loss": -6.615798473358154, "global_step": 141907, "epoch": 3378} {"train_loss": -6.722510814666748, "global_step": 141908, "epoch": 3378} {"train_loss": -6.7816362380981445, "global_step": 141909, "epoch": 3378} {"train_loss": -6.790097713470459, "global_step": 141910, "epoch": 3378} {"train_loss": -6.837599754333496, "global_step": 141911, "epoch": 3378} {"train_loss": -6.848729133605957, "global_step": 141912, "epoch": 3378} {"train_loss": -6.7165937423706055, "global_step": 141913, "epoch": 3378} {"train_loss": -6.63485050201416, "global_step": 141914, "epoch": 3378} {"train_loss": -6.824690341949463, "global_step": 141915, "epoch": 3378} {"train_loss": -6.843809604644775, "global_step": 141916, "epoch": 3378} {"train_loss": -6.766004937035697, "global_step": 141917, "epoch": 3378, "val_loss": 68323.5546875} {"train_loss": -6.870123386383057, "global_step": 141918, "epoch": 3379} {"train_loss": -6.73692512512207, "global_step": 141919, "epoch": 3379} {"train_loss": -6.782768726348877, "global_step": 141920, "epoch": 3379} {"train_loss": -6.688912391662598, "global_step": 141921, "epoch": 3379} {"train_loss": -6.695717811584473, "global_step": 141922, "epoch": 3379} {"train_loss": -6.698089599609375, "global_step": 141923, "epoch": 3379} {"train_loss": -6.924611568450928, "global_step": 141924, "epoch": 3379} {"train_loss": -6.720102310180664, "global_step": 141925, "epoch": 3379} {"train_loss": -6.79741096496582, "global_step": 141926, "epoch": 3379} {"train_loss": -6.690781116485596, "global_step": 141927, "epoch": 3379} {"train_loss": -6.617619514465332, "global_step": 141928, "epoch": 3379} {"train_loss": -6.7594523429870605, "global_step": 141929, "epoch": 3379} {"train_loss": -6.633902549743652, "global_step": 141930, "epoch": 3379} {"train_loss": -6.689661502838135, "global_step": 141931, "epoch": 3379} {"train_loss": -6.632007598876953, "global_step": 141932, "epoch": 3379} {"train_loss": -6.686942100524902, "global_step": 141933, "epoch": 3379} {"train_loss": -6.861280918121338, "global_step": 141934, "epoch": 3379} {"train_loss": -6.678359031677246, "global_step": 141935, "epoch": 3379} {"train_loss": -6.654836654663086, "global_step": 141936, "epoch": 3379} {"train_loss": -6.674751281738281, "global_step": 141937, "epoch": 3379} {"train_loss": -6.683806419372559, "global_step": 141938, "epoch": 3379} {"train_loss": -6.72304630279541, "global_step": 141939, "epoch": 3379} {"train_loss": -6.631304740905762, "global_step": 141940, "epoch": 3379} {"train_loss": -6.831522464752197, "global_step": 141941, "epoch": 3379} {"train_loss": -6.726891994476318, "global_step": 141942, "epoch": 3379} {"train_loss": -6.7553911209106445, "global_step": 141943, "epoch": 3379} {"train_loss": -6.676188945770264, "global_step": 141944, "epoch": 3379} {"train_loss": -6.755451202392578, "global_step": 141945, "epoch": 3379} {"train_loss": -6.721335411071777, "global_step": 141946, "epoch": 3379} {"train_loss": -6.7373504638671875, "global_step": 141947, "epoch": 3379} {"train_loss": -6.791555881500244, "global_step": 141948, "epoch": 3379} {"train_loss": -6.775933742523193, "global_step": 141949, "epoch": 3379} {"train_loss": -6.708424091339111, "global_step": 141950, "epoch": 3379} {"train_loss": -6.760791778564453, "global_step": 141951, "epoch": 3379} {"train_loss": -6.677376747131348, "global_step": 141952, "epoch": 3379} {"train_loss": -6.739336013793945, "global_step": 141953, "epoch": 3379} {"train_loss": -6.780473709106445, "global_step": 141954, "epoch": 3379} {"train_loss": -6.798679351806641, "global_step": 141955, "epoch": 3379} {"train_loss": -6.742263317108154, "global_step": 141956, "epoch": 3379} {"train_loss": -6.816425323486328, "global_step": 141957, "epoch": 3379} {"train_loss": -6.721774578094482, "global_step": 141958, "epoch": 3379} {"train_loss": -6.731301773162115, "global_step": 141959, "epoch": 3379, "val_loss": 68462.609375} {"train_loss": -6.658020496368408, "global_step": 141960, "epoch": 3380} {"train_loss": -6.667623043060303, "global_step": 141961, "epoch": 3380} {"train_loss": -6.7501912117004395, "global_step": 141962, "epoch": 3380} {"train_loss": -6.828167915344238, "global_step": 141963, "epoch": 3380} {"train_loss": -6.840980529785156, "global_step": 141964, "epoch": 3380} {"train_loss": -6.772855758666992, "global_step": 141965, "epoch": 3380} {"train_loss": -6.667766094207764, "global_step": 141966, "epoch": 3380} {"train_loss": -6.828860282897949, "global_step": 141967, "epoch": 3380} {"train_loss": -6.597163200378418, "global_step": 141968, "epoch": 3380} {"train_loss": -6.803179740905762, "global_step": 141969, "epoch": 3380} {"train_loss": -6.746705532073975, "global_step": 141970, "epoch": 3380} {"train_loss": -6.668344497680664, "global_step": 141971, "epoch": 3380} {"train_loss": -6.830638408660889, "global_step": 141972, "epoch": 3380} {"train_loss": -6.6922831535339355, "global_step": 141973, "epoch": 3380} {"train_loss": -6.764796733856201, "global_step": 141974, "epoch": 3380} {"train_loss": -6.770807266235352, "global_step": 141975, "epoch": 3380} {"train_loss": -6.6729021072387695, "global_step": 141976, "epoch": 3380} {"train_loss": -6.728427886962891, "global_step": 141977, "epoch": 3380} {"train_loss": -6.829089641571045, "global_step": 141978, "epoch": 3380} {"train_loss": -6.8135175704956055, "global_step": 141979, "epoch": 3380} {"train_loss": -6.814260959625244, "global_step": 141980, "epoch": 3380} {"train_loss": -6.8443989753723145, "global_step": 141981, "epoch": 3380} {"train_loss": -6.7390923500061035, "global_step": 141982, "epoch": 3380} {"train_loss": -6.663555145263672, "global_step": 141983, "epoch": 3380} {"train_loss": -6.91180419921875, "global_step": 141984, "epoch": 3380} {"train_loss": -6.842192649841309, "global_step": 141985, "epoch": 3380} {"train_loss": -6.827142238616943, "global_step": 141986, "epoch": 3380} {"train_loss": -6.687919616699219, "global_step": 141987, "epoch": 3380} {"train_loss": -6.675065040588379, "global_step": 141988, "epoch": 3380} {"train_loss": -6.661995887756348, "global_step": 141989, "epoch": 3380} {"train_loss": -6.826888561248779, "global_step": 141990, "epoch": 3380} {"train_loss": -6.788061141967773, "global_step": 141991, "epoch": 3380} {"train_loss": -6.700170516967773, "global_step": 141992, "epoch": 3380} {"train_loss": -6.777387619018555, "global_step": 141993, "epoch": 3380} {"train_loss": -6.731559753417969, "global_step": 141994, "epoch": 3380} {"train_loss": -6.756051063537598, "global_step": 141995, "epoch": 3380} {"train_loss": -6.764595985412598, "global_step": 141996, "epoch": 3380} {"train_loss": -6.736967086791992, "global_step": 141997, "epoch": 3380} {"train_loss": -6.78558349609375, "global_step": 141998, "epoch": 3380} {"train_loss": -6.696392059326172, "global_step": 141999, "epoch": 3380} {"train_loss": -6.650669097900391, "global_step": 142000, "epoch": 3380} {"train_loss": -6.7515677611033125, "global_step": 142001, "epoch": 3380, "val_loss": 68443.9453125} {"train_loss": -6.824224472045898, "global_step": 142002, "epoch": 3381} {"train_loss": -6.639692306518555, "global_step": 142003, "epoch": 3381} {"train_loss": -6.693385124206543, "global_step": 142004, "epoch": 3381} {"train_loss": -6.754134178161621, "global_step": 142005, "epoch": 3381} {"train_loss": -6.754931449890137, "global_step": 142006, "epoch": 3381} {"train_loss": -6.664502143859863, "global_step": 142007, "epoch": 3381} {"train_loss": -6.78614616394043, "global_step": 142008, "epoch": 3381} {"train_loss": -6.775182723999023, "global_step": 142009, "epoch": 3381} {"train_loss": -6.724692344665527, "global_step": 142010, "epoch": 3381} {"train_loss": -6.865579605102539, "global_step": 142011, "epoch": 3381} {"train_loss": -6.701903343200684, "global_step": 142012, "epoch": 3381} {"train_loss": -6.650577545166016, "global_step": 142013, "epoch": 3381} {"train_loss": -6.857975482940674, "global_step": 142014, "epoch": 3381} {"train_loss": -6.737624645233154, "global_step": 142015, "epoch": 3381} {"train_loss": -6.6960883140563965, "global_step": 142016, "epoch": 3381} {"train_loss": -6.823223114013672, "global_step": 142017, "epoch": 3381} {"train_loss": -6.669337272644043, "global_step": 142018, "epoch": 3381} {"train_loss": -6.60702657699585, "global_step": 142019, "epoch": 3381} {"train_loss": -6.725639343261719, "global_step": 142020, "epoch": 3381} {"train_loss": -6.699517726898193, "global_step": 142021, "epoch": 3381} {"train_loss": -6.600548267364502, "global_step": 142022, "epoch": 3381} {"train_loss": -6.7016215324401855, "global_step": 142023, "epoch": 3381} {"train_loss": -6.747168064117432, "global_step": 142024, "epoch": 3381} {"train_loss": -6.72791862487793, "global_step": 142025, "epoch": 3381} {"train_loss": -6.761765003204346, "global_step": 142026, "epoch": 3381} {"train_loss": -6.5823283195495605, "global_step": 142027, "epoch": 3381} {"train_loss": -6.7648468017578125, "global_step": 142028, "epoch": 3381} {"train_loss": -6.76202392578125, "global_step": 142029, "epoch": 3381} {"train_loss": -6.778369903564453, "global_step": 142030, "epoch": 3381} {"train_loss": -6.712851524353027, "global_step": 142031, "epoch": 3381} {"train_loss": -6.740511417388916, "global_step": 142032, "epoch": 3381} {"train_loss": -6.784048080444336, "global_step": 142033, "epoch": 3381} {"train_loss": -6.775750160217285, "global_step": 142034, "epoch": 3381} {"train_loss": -6.724863529205322, "global_step": 142035, "epoch": 3381} {"train_loss": -6.73386287689209, "global_step": 142036, "epoch": 3381} {"train_loss": -6.734577178955078, "global_step": 142037, "epoch": 3381} {"train_loss": -6.755055904388428, "global_step": 142038, "epoch": 3381} {"train_loss": -6.694218158721924, "global_step": 142039, "epoch": 3381} {"train_loss": -6.766178131103516, "global_step": 142040, "epoch": 3381} {"train_loss": -6.737298488616943, "global_step": 142041, "epoch": 3381} {"train_loss": -6.616499900817871, "global_step": 142042, "epoch": 3381} {"train_loss": -6.728419144948323, "global_step": 142043, "epoch": 3381, "val_loss": 68368.1640625} {"train_loss": -6.786538124084473, "global_step": 142044, "epoch": 3382} {"train_loss": -6.709941864013672, "global_step": 142045, "epoch": 3382} {"train_loss": -6.82740592956543, "global_step": 142046, "epoch": 3382} {"train_loss": -6.728564262390137, "global_step": 142047, "epoch": 3382} {"train_loss": -6.729736328125, "global_step": 142048, "epoch": 3382} {"train_loss": -6.709484100341797, "global_step": 142049, "epoch": 3382} {"train_loss": -6.742466926574707, "global_step": 142050, "epoch": 3382} {"train_loss": -6.704465866088867, "global_step": 142051, "epoch": 3382} {"train_loss": -6.777841091156006, "global_step": 142052, "epoch": 3382} {"train_loss": -6.667636394500732, "global_step": 142053, "epoch": 3382} {"train_loss": -6.665009021759033, "global_step": 142054, "epoch": 3382} {"train_loss": -6.694684982299805, "global_step": 142055, "epoch": 3382} {"train_loss": -6.686864852905273, "global_step": 142056, "epoch": 3382} {"train_loss": -6.758918762207031, "global_step": 142057, "epoch": 3382} {"train_loss": -6.796295166015625, "global_step": 142058, "epoch": 3382} {"train_loss": -6.675970077514648, "global_step": 142059, "epoch": 3382} {"train_loss": -6.722367763519287, "global_step": 142060, "epoch": 3382} {"train_loss": -6.67585563659668, "global_step": 142061, "epoch": 3382} {"train_loss": -6.771801948547363, "global_step": 142062, "epoch": 3382} {"train_loss": -6.614802360534668, "global_step": 142063, "epoch": 3382} {"train_loss": -6.705202102661133, "global_step": 142064, "epoch": 3382} {"train_loss": -6.6193342208862305, "global_step": 142065, "epoch": 3382} {"train_loss": -6.6740288734436035, "global_step": 142066, "epoch": 3382} {"train_loss": -6.726513385772705, "global_step": 142067, "epoch": 3382} {"train_loss": -6.663822174072266, "global_step": 142068, "epoch": 3382} {"train_loss": -6.784270286560059, "global_step": 142069, "epoch": 3382} {"train_loss": -6.723721981048584, "global_step": 142070, "epoch": 3382} {"train_loss": -6.736349582672119, "global_step": 142071, "epoch": 3382} {"train_loss": -6.687803268432617, "global_step": 142072, "epoch": 3382} {"train_loss": -6.676878929138184, "global_step": 142073, "epoch": 3382} {"train_loss": -6.698209762573242, "global_step": 142074, "epoch": 3382} {"train_loss": -6.8040361404418945, "global_step": 142075, "epoch": 3382} {"train_loss": -6.72312593460083, "global_step": 142076, "epoch": 3382} {"train_loss": -6.7696332931518555, "global_step": 142077, "epoch": 3382} {"train_loss": -6.7187299728393555, "global_step": 142078, "epoch": 3382} {"train_loss": -6.740050792694092, "global_step": 142079, "epoch": 3382} {"train_loss": -6.676225662231445, "global_step": 142080, "epoch": 3382} {"train_loss": -6.724575042724609, "global_step": 142081, "epoch": 3382} {"train_loss": -6.787835121154785, "global_step": 142082, "epoch": 3382} {"train_loss": -6.7853779792785645, "global_step": 142083, "epoch": 3382} {"train_loss": -6.83699369430542, "global_step": 142084, "epoch": 3382} {"train_loss": -6.724503789629255, "global_step": 142085, "epoch": 3382, "val_loss": 68566.484375} {"train_loss": -6.844964981079102, "global_step": 142086, "epoch": 3383} {"train_loss": -6.7286376953125, "global_step": 142087, "epoch": 3383} {"train_loss": -6.7981061935424805, "global_step": 142088, "epoch": 3383} {"train_loss": -6.739673137664795, "global_step": 142089, "epoch": 3383} {"train_loss": -6.716324329376221, "global_step": 142090, "epoch": 3383} {"train_loss": -6.847548007965088, "global_step": 142091, "epoch": 3383} {"train_loss": -6.739478588104248, "global_step": 142092, "epoch": 3383} {"train_loss": -6.666939735412598, "global_step": 142093, "epoch": 3383} {"train_loss": -6.809685707092285, "global_step": 142094, "epoch": 3383} {"train_loss": -6.828951835632324, "global_step": 142095, "epoch": 3383} {"train_loss": -6.736014366149902, "global_step": 142096, "epoch": 3383} {"train_loss": -6.825626850128174, "global_step": 142097, "epoch": 3383} {"train_loss": -6.824489593505859, "global_step": 142098, "epoch": 3383} {"train_loss": -6.771527290344238, "global_step": 142099, "epoch": 3383} {"train_loss": -6.729683876037598, "global_step": 142100, "epoch": 3383} {"train_loss": -6.678500175476074, "global_step": 142101, "epoch": 3383} {"train_loss": -6.776614189147949, "global_step": 142102, "epoch": 3383} {"train_loss": -6.803314208984375, "global_step": 142103, "epoch": 3383} {"train_loss": -6.711620807647705, "global_step": 142104, "epoch": 3383} {"train_loss": -6.795769691467285, "global_step": 142105, "epoch": 3383} {"train_loss": -6.739215850830078, "global_step": 142106, "epoch": 3383} {"train_loss": -6.727916240692139, "global_step": 142107, "epoch": 3383} {"train_loss": -6.606250762939453, "global_step": 142108, "epoch": 3383} {"train_loss": -6.663583755493164, "global_step": 142109, "epoch": 3383} {"train_loss": -6.755922794342041, "global_step": 142110, "epoch": 3383} {"train_loss": -6.653075218200684, "global_step": 142111, "epoch": 3383} {"train_loss": -6.750085830688477, "global_step": 142112, "epoch": 3383} {"train_loss": -6.686687469482422, "global_step": 142113, "epoch": 3383} {"train_loss": -6.587084770202637, "global_step": 142114, "epoch": 3383} {"train_loss": -6.669657230377197, "global_step": 142115, "epoch": 3383} {"train_loss": -6.587424278259277, "global_step": 142116, "epoch": 3383} {"train_loss": -6.484991550445557, "global_step": 142117, "epoch": 3383} {"train_loss": -6.666266441345215, "global_step": 142118, "epoch": 3383} {"train_loss": -6.45481014251709, "global_step": 142119, "epoch": 3383} {"train_loss": -6.641622543334961, "global_step": 142120, "epoch": 3383} {"train_loss": -6.505841255187988, "global_step": 142121, "epoch": 3383} {"train_loss": -6.655451774597168, "global_step": 142122, "epoch": 3383} {"train_loss": -6.42158317565918, "global_step": 142123, "epoch": 3383} {"train_loss": -6.742541790008545, "global_step": 142124, "epoch": 3383} {"train_loss": -6.531227111816406, "global_step": 142125, "epoch": 3383} {"train_loss": -6.825006484985352, "global_step": 142126, "epoch": 3383} {"train_loss": -6.694236437479655, "global_step": 142127, "epoch": 3383, "val_loss": 68320.3046875} {"train_loss": -6.770042419433594, "global_step": 142128, "epoch": 3384} {"train_loss": -6.569405555725098, "global_step": 142129, "epoch": 3384} {"train_loss": -6.645137786865234, "global_step": 142130, "epoch": 3384} {"train_loss": -6.460419654846191, "global_step": 142131, "epoch": 3384} {"train_loss": -6.6763081550598145, "global_step": 142132, "epoch": 3384} {"train_loss": -6.580256462097168, "global_step": 142133, "epoch": 3384} {"train_loss": -6.523312568664551, "global_step": 142134, "epoch": 3384} {"train_loss": -6.6459245681762695, "global_step": 142135, "epoch": 3384} {"train_loss": -6.695130348205566, "global_step": 142136, "epoch": 3384} {"train_loss": -6.697081565856934, "global_step": 142137, "epoch": 3384} {"train_loss": -6.578615188598633, "global_step": 142138, "epoch": 3384} {"train_loss": -6.643074989318848, "global_step": 142139, "epoch": 3384} {"train_loss": -6.650128364562988, "global_step": 142140, "epoch": 3384} {"train_loss": -6.651482582092285, "global_step": 142141, "epoch": 3384} {"train_loss": -6.735045909881592, "global_step": 142142, "epoch": 3384} {"train_loss": -6.737199783325195, "global_step": 142143, "epoch": 3384} {"train_loss": -6.62733793258667, "global_step": 142144, "epoch": 3384} {"train_loss": -6.665269374847412, "global_step": 142145, "epoch": 3384} {"train_loss": -6.64444637298584, "global_step": 142146, "epoch": 3384} {"train_loss": -6.740865230560303, "global_step": 142147, "epoch": 3384} {"train_loss": -6.763099670410156, "global_step": 142148, "epoch": 3384} {"train_loss": -6.8011860847473145, "global_step": 142149, "epoch": 3384} {"train_loss": -6.739217758178711, "global_step": 142150, "epoch": 3384} {"train_loss": -6.7701334953308105, "global_step": 142151, "epoch": 3384} {"train_loss": -6.680294036865234, "global_step": 142152, "epoch": 3384} {"train_loss": -6.697596549987793, "global_step": 142153, "epoch": 3384} {"train_loss": -6.764854431152344, "global_step": 142154, "epoch": 3384} {"train_loss": -6.744600296020508, "global_step": 142155, "epoch": 3384} {"train_loss": -6.721332550048828, "global_step": 142156, "epoch": 3384} {"train_loss": -6.707638740539551, "global_step": 142157, "epoch": 3384} {"train_loss": -6.754478454589844, "global_step": 142158, "epoch": 3384} {"train_loss": -6.715642929077148, "global_step": 142159, "epoch": 3384} {"train_loss": -6.760527610778809, "global_step": 142160, "epoch": 3384} {"train_loss": -6.815905570983887, "global_step": 142161, "epoch": 3384} {"train_loss": -6.724237442016602, "global_step": 142162, "epoch": 3384} {"train_loss": -6.736384391784668, "global_step": 142163, "epoch": 3384} {"train_loss": -6.734657287597656, "global_step": 142164, "epoch": 3384} {"train_loss": -6.861249923706055, "global_step": 142165, "epoch": 3384} {"train_loss": -6.747010707855225, "global_step": 142166, "epoch": 3384} {"train_loss": -6.7856903076171875, "global_step": 142167, "epoch": 3384} {"train_loss": -6.72526216506958, "global_step": 142168, "epoch": 3384} {"train_loss": -6.701733464286441, "global_step": 142169, "epoch": 3384, "val_loss": 68175.4375} {"train_loss": -6.621389865875244, "global_step": 142170, "epoch": 3385} {"train_loss": -6.6895904541015625, "global_step": 142171, "epoch": 3385} {"train_loss": -6.768118858337402, "global_step": 142172, "epoch": 3385} {"train_loss": -6.6981401443481445, "global_step": 142173, "epoch": 3385} {"train_loss": -6.8420000076293945, "global_step": 142174, "epoch": 3385} {"train_loss": -6.801264762878418, "global_step": 142175, "epoch": 3385} {"train_loss": -6.8466691970825195, "global_step": 142176, "epoch": 3385} {"train_loss": -6.855384826660156, "global_step": 142177, "epoch": 3385} {"train_loss": -6.734857082366943, "global_step": 142178, "epoch": 3385} {"train_loss": -6.812171936035156, "global_step": 142179, "epoch": 3385} {"train_loss": -6.883824348449707, "global_step": 142180, "epoch": 3385} {"train_loss": -6.774815082550049, "global_step": 142181, "epoch": 3385} {"train_loss": -6.779892921447754, "global_step": 142182, "epoch": 3385} {"train_loss": -6.720479488372803, "global_step": 142183, "epoch": 3385} {"train_loss": -6.753600120544434, "global_step": 142184, "epoch": 3385} {"train_loss": -6.883942127227783, "global_step": 142185, "epoch": 3385} {"train_loss": -6.718177795410156, "global_step": 142186, "epoch": 3385} {"train_loss": -6.724742889404297, "global_step": 142187, "epoch": 3385} {"train_loss": -6.8551435470581055, "global_step": 142188, "epoch": 3385} {"train_loss": -6.7279558181762695, "global_step": 142189, "epoch": 3385} {"train_loss": -6.674938201904297, "global_step": 142190, "epoch": 3385} {"train_loss": -6.6525444984436035, "global_step": 142191, "epoch": 3385} {"train_loss": -6.8907670974731445, "global_step": 142192, "epoch": 3385} {"train_loss": -6.776991844177246, "global_step": 142193, "epoch": 3385} {"train_loss": -6.796236038208008, "global_step": 142194, "epoch": 3385} {"train_loss": -6.75742244720459, "global_step": 142195, "epoch": 3385} {"train_loss": -6.793702125549316, "global_step": 142196, "epoch": 3385} {"train_loss": -6.827108383178711, "global_step": 142197, "epoch": 3385} {"train_loss": -6.7571563720703125, "global_step": 142198, "epoch": 3385} {"train_loss": -6.763640403747559, "global_step": 142199, "epoch": 3385} {"train_loss": -6.748540878295898, "global_step": 142200, "epoch": 3385} {"train_loss": -6.6963019371032715, "global_step": 142201, "epoch": 3385} {"train_loss": -6.80204963684082, "global_step": 142202, "epoch": 3385} {"train_loss": -6.8428053855896, "global_step": 142203, "epoch": 3385} {"train_loss": -6.6748199462890625, "global_step": 142204, "epoch": 3385} {"train_loss": -6.71142053604126, "global_step": 142205, "epoch": 3385} {"train_loss": -6.756138324737549, "global_step": 142206, "epoch": 3385} {"train_loss": -6.730406761169434, "global_step": 142207, "epoch": 3385} {"train_loss": -6.707834720611572, "global_step": 142208, "epoch": 3385} {"train_loss": -6.827778339385986, "global_step": 142209, "epoch": 3385} {"train_loss": -6.591233253479004, "global_step": 142210, "epoch": 3385} {"train_loss": -6.7623197464715865, "global_step": 142211, "epoch": 3385, "val_loss": 68501.8046875} {"train_loss": -6.781466484069824, "global_step": 142212, "epoch": 3386} {"train_loss": -6.6334638595581055, "global_step": 142213, "epoch": 3386} {"train_loss": -6.732634544372559, "global_step": 142214, "epoch": 3386} {"train_loss": -6.771917343139648, "global_step": 142215, "epoch": 3386} {"train_loss": -6.7543182373046875, "global_step": 142216, "epoch": 3386} {"train_loss": -6.8427414894104, "global_step": 142217, "epoch": 3386} {"train_loss": -6.675870895385742, "global_step": 142218, "epoch": 3386} {"train_loss": -6.697014331817627, "global_step": 142219, "epoch": 3386} {"train_loss": -6.70725679397583, "global_step": 142220, "epoch": 3386} {"train_loss": -6.734281063079834, "global_step": 142221, "epoch": 3386} {"train_loss": -6.830805778503418, "global_step": 142222, "epoch": 3386} {"train_loss": -6.7342023849487305, "global_step": 142223, "epoch": 3386} {"train_loss": -6.728728294372559, "global_step": 142224, "epoch": 3386} {"train_loss": -6.735186576843262, "global_step": 142225, "epoch": 3386} {"train_loss": -6.630441188812256, "global_step": 142226, "epoch": 3386} {"train_loss": -6.658871650695801, "global_step": 142227, "epoch": 3386} {"train_loss": -6.654542922973633, "global_step": 142228, "epoch": 3386} {"train_loss": -6.701684951782227, "global_step": 142229, "epoch": 3386} {"train_loss": -6.733940124511719, "global_step": 142230, "epoch": 3386} {"train_loss": -6.639352321624756, "global_step": 142231, "epoch": 3386} {"train_loss": -6.814102649688721, "global_step": 142232, "epoch": 3386} {"train_loss": -6.606870174407959, "global_step": 142233, "epoch": 3386} {"train_loss": -6.566501617431641, "global_step": 142234, "epoch": 3386} {"train_loss": -6.678356170654297, "global_step": 142235, "epoch": 3386} {"train_loss": -6.588781833648682, "global_step": 142236, "epoch": 3386} {"train_loss": -6.738317966461182, "global_step": 142237, "epoch": 3386} {"train_loss": -6.6789021492004395, "global_step": 142238, "epoch": 3386} {"train_loss": -6.738254547119141, "global_step": 142239, "epoch": 3386} {"train_loss": -6.707305908203125, "global_step": 142240, "epoch": 3386} {"train_loss": -6.676689147949219, "global_step": 142241, "epoch": 3386} {"train_loss": -6.789158821105957, "global_step": 142242, "epoch": 3386} {"train_loss": -6.676368713378906, "global_step": 142243, "epoch": 3386} {"train_loss": -6.665295600891113, "global_step": 142244, "epoch": 3386} {"train_loss": -6.743351459503174, "global_step": 142245, "epoch": 3386} {"train_loss": -6.798539161682129, "global_step": 142246, "epoch": 3386} {"train_loss": -6.764073371887207, "global_step": 142247, "epoch": 3386} {"train_loss": -6.7495880126953125, "global_step": 142248, "epoch": 3386} {"train_loss": -6.805733680725098, "global_step": 142249, "epoch": 3386} {"train_loss": -6.751479148864746, "global_step": 142250, "epoch": 3386} {"train_loss": -6.721839904785156, "global_step": 142251, "epoch": 3386} {"train_loss": -6.675398826599121, "global_step": 142252, "epoch": 3386} {"train_loss": -6.712883915219988, "global_step": 142253, "epoch": 3386, "val_loss": 68282.171875} {"train_loss": -6.798338890075684, "global_step": 142254, "epoch": 3387} {"train_loss": -6.7790961265563965, "global_step": 142255, "epoch": 3387} {"train_loss": -6.745002746582031, "global_step": 142256, "epoch": 3387} {"train_loss": -6.688239097595215, "global_step": 142257, "epoch": 3387} {"train_loss": -6.79249382019043, "global_step": 142258, "epoch": 3387} {"train_loss": -6.758719444274902, "global_step": 142259, "epoch": 3387} {"train_loss": -6.889289379119873, "global_step": 142260, "epoch": 3387} {"train_loss": -6.834566116333008, "global_step": 142261, "epoch": 3387} {"train_loss": -6.894051551818848, "global_step": 142262, "epoch": 3387} {"train_loss": -6.753445625305176, "global_step": 142263, "epoch": 3387} {"train_loss": -6.8159027099609375, "global_step": 142264, "epoch": 3387} {"train_loss": -6.863339900970459, "global_step": 142265, "epoch": 3387} {"train_loss": -6.893808364868164, "global_step": 142266, "epoch": 3387} {"train_loss": -6.698177337646484, "global_step": 142267, "epoch": 3387} {"train_loss": -6.822932243347168, "global_step": 142268, "epoch": 3387} {"train_loss": -6.7818145751953125, "global_step": 142269, "epoch": 3387} {"train_loss": -6.681130409240723, "global_step": 142270, "epoch": 3387} {"train_loss": -6.642939567565918, "global_step": 142271, "epoch": 3387} {"train_loss": -6.672834873199463, "global_step": 142272, "epoch": 3387} {"train_loss": -6.676886558532715, "global_step": 142273, "epoch": 3387} {"train_loss": -6.692111968994141, "global_step": 142274, "epoch": 3387} {"train_loss": -6.6872406005859375, "global_step": 142275, "epoch": 3387} {"train_loss": -6.823244094848633, "global_step": 142276, "epoch": 3387} {"train_loss": -6.651415824890137, "global_step": 142277, "epoch": 3387} {"train_loss": -6.8197174072265625, "global_step": 142278, "epoch": 3387} {"train_loss": -6.744545936584473, "global_step": 142279, "epoch": 3387} {"train_loss": -6.7814741134643555, "global_step": 142280, "epoch": 3387} {"train_loss": -6.760067939758301, "global_step": 142281, "epoch": 3387} {"train_loss": -6.730724811553955, "global_step": 142282, "epoch": 3387} {"train_loss": -6.622782230377197, "global_step": 142283, "epoch": 3387} {"train_loss": -6.806591987609863, "global_step": 142284, "epoch": 3387} {"train_loss": -6.599432945251465, "global_step": 142285, "epoch": 3387} {"train_loss": -6.690995216369629, "global_step": 142286, "epoch": 3387} {"train_loss": -6.771803855895996, "global_step": 142287, "epoch": 3387} {"train_loss": -6.68428897857666, "global_step": 142288, "epoch": 3387} {"train_loss": -6.767601490020752, "global_step": 142289, "epoch": 3387} {"train_loss": -6.6251749992370605, "global_step": 142290, "epoch": 3387} {"train_loss": -6.751789093017578, "global_step": 142291, "epoch": 3387} {"train_loss": -6.725163459777832, "global_step": 142292, "epoch": 3387} {"train_loss": -6.619937419891357, "global_step": 142293, "epoch": 3387} {"train_loss": -6.709956645965576, "global_step": 142294, "epoch": 3387} {"train_loss": -6.740512189410982, "global_step": 142295, "epoch": 3387, "val_loss": 68447.0859375} {"train_loss": -6.588650703430176, "global_step": 142296, "epoch": 3388} {"train_loss": -6.664118766784668, "global_step": 142297, "epoch": 3388} {"train_loss": -6.767848014831543, "global_step": 142298, "epoch": 3388} {"train_loss": -6.628084182739258, "global_step": 142299, "epoch": 3388} {"train_loss": -6.804418563842773, "global_step": 142300, "epoch": 3388} {"train_loss": -6.6504974365234375, "global_step": 142301, "epoch": 3388} {"train_loss": -6.51055908203125, "global_step": 142302, "epoch": 3388} {"train_loss": -6.758890151977539, "global_step": 142303, "epoch": 3388} {"train_loss": -6.597990036010742, "global_step": 142304, "epoch": 3388} {"train_loss": -6.70747184753418, "global_step": 142305, "epoch": 3388} {"train_loss": -6.600941181182861, "global_step": 142306, "epoch": 3388} {"train_loss": -6.7401885986328125, "global_step": 142307, "epoch": 3388} {"train_loss": -6.677802085876465, "global_step": 142308, "epoch": 3388} {"train_loss": -6.604379653930664, "global_step": 142309, "epoch": 3388} {"train_loss": -6.860719680786133, "global_step": 142310, "epoch": 3388} {"train_loss": -6.713700294494629, "global_step": 142311, "epoch": 3388} {"train_loss": -6.790948867797852, "global_step": 142312, "epoch": 3388} {"train_loss": -6.803680419921875, "global_step": 142313, "epoch": 3388} {"train_loss": -6.756636619567871, "global_step": 142314, "epoch": 3388} {"train_loss": -6.768502235412598, "global_step": 142315, "epoch": 3388} {"train_loss": -6.745461463928223, "global_step": 142316, "epoch": 3388} {"train_loss": -6.574856281280518, "global_step": 142317, "epoch": 3388} {"train_loss": -6.767077445983887, "global_step": 142318, "epoch": 3388} {"train_loss": -6.714529991149902, "global_step": 142319, "epoch": 3388} {"train_loss": -6.709127426147461, "global_step": 142320, "epoch": 3388} {"train_loss": -6.752022743225098, "global_step": 142321, "epoch": 3388} {"train_loss": -6.8190765380859375, "global_step": 142322, "epoch": 3388} {"train_loss": -6.793252944946289, "global_step": 142323, "epoch": 3388} {"train_loss": -6.830211639404297, "global_step": 142324, "epoch": 3388} {"train_loss": -6.801583290100098, "global_step": 142325, "epoch": 3388} {"train_loss": -6.765149116516113, "global_step": 142326, "epoch": 3388} {"train_loss": -6.788702011108398, "global_step": 142327, "epoch": 3388} {"train_loss": -6.779225826263428, "global_step": 142328, "epoch": 3388} {"train_loss": -6.820746898651123, "global_step": 142329, "epoch": 3388} {"train_loss": -6.8113627433776855, "global_step": 142330, "epoch": 3388} {"train_loss": -6.647781848907471, "global_step": 142331, "epoch": 3388} {"train_loss": -6.897356986999512, "global_step": 142332, "epoch": 3388} {"train_loss": -6.828951835632324, "global_step": 142333, "epoch": 3388} {"train_loss": -6.778215408325195, "global_step": 142334, "epoch": 3388} {"train_loss": -6.759878158569336, "global_step": 142335, "epoch": 3388} {"train_loss": -6.809018611907959, "global_step": 142336, "epoch": 3388} {"train_loss": -6.736774626232329, "global_step": 142337, "epoch": 3388, "val_loss": 68437.1328125} {"train_loss": -6.737112045288086, "global_step": 142338, "epoch": 3389} {"train_loss": -6.790790557861328, "global_step": 142339, "epoch": 3389} {"train_loss": -6.701390266418457, "global_step": 142340, "epoch": 3389} {"train_loss": -6.597851276397705, "global_step": 142341, "epoch": 3389} {"train_loss": -6.592507362365723, "global_step": 142342, "epoch": 3389} {"train_loss": -6.623392105102539, "global_step": 142343, "epoch": 3389} {"train_loss": -6.53352165222168, "global_step": 142344, "epoch": 3389} {"train_loss": -6.665553092956543, "global_step": 142345, "epoch": 3389} {"train_loss": -6.626352310180664, "global_step": 142346, "epoch": 3389} {"train_loss": -6.711030960083008, "global_step": 142347, "epoch": 3389} {"train_loss": -6.803313255310059, "global_step": 142348, "epoch": 3389} {"train_loss": -6.712964057922363, "global_step": 142349, "epoch": 3389} {"train_loss": -6.595975875854492, "global_step": 142350, "epoch": 3389} {"train_loss": -6.565847396850586, "global_step": 142351, "epoch": 3389} {"train_loss": -6.782243728637695, "global_step": 142352, "epoch": 3389} {"train_loss": -6.712320804595947, "global_step": 142353, "epoch": 3389} {"train_loss": -6.676574230194092, "global_step": 142354, "epoch": 3389} {"train_loss": -6.749514579772949, "global_step": 142355, "epoch": 3389} {"train_loss": -6.762792587280273, "global_step": 142356, "epoch": 3389} {"train_loss": -6.735177040100098, "global_step": 142357, "epoch": 3389} {"train_loss": -6.7349748611450195, "global_step": 142358, "epoch": 3389} {"train_loss": -6.694211959838867, "global_step": 142359, "epoch": 3389} {"train_loss": -6.662696361541748, "global_step": 142360, "epoch": 3389} {"train_loss": -6.729482173919678, "global_step": 142361, "epoch": 3389} {"train_loss": -6.771522045135498, "global_step": 142362, "epoch": 3389} {"train_loss": -6.716363906860352, "global_step": 142363, "epoch": 3389} {"train_loss": -6.633876800537109, "global_step": 142364, "epoch": 3389} {"train_loss": -6.912425994873047, "global_step": 142365, "epoch": 3389} {"train_loss": -6.703202247619629, "global_step": 142366, "epoch": 3389} {"train_loss": -6.709443092346191, "global_step": 142367, "epoch": 3389} {"train_loss": -6.785203456878662, "global_step": 142368, "epoch": 3389} {"train_loss": -6.4878644943237305, "global_step": 142369, "epoch": 3389} {"train_loss": -6.647549152374268, "global_step": 142370, "epoch": 3389} {"train_loss": -6.505693435668945, "global_step": 142371, "epoch": 3389} {"train_loss": -6.607885837554932, "global_step": 142372, "epoch": 3389} {"train_loss": -6.816567420959473, "global_step": 142373, "epoch": 3389} {"train_loss": -6.548506259918213, "global_step": 142374, "epoch": 3389} {"train_loss": -6.612001419067383, "global_step": 142375, "epoch": 3389} {"train_loss": -6.643011569976807, "global_step": 142376, "epoch": 3389} {"train_loss": -6.631204605102539, "global_step": 142377, "epoch": 3389} {"train_loss": -6.640681266784668, "global_step": 142378, "epoch": 3389} {"train_loss": -6.674765246255057, "global_step": 142379, "epoch": 3389, "val_loss": 68514.875} {"train_loss": -6.781638145446777, "global_step": 142380, "epoch": 3390} {"train_loss": -6.555093765258789, "global_step": 142381, "epoch": 3390} {"train_loss": -6.716259002685547, "global_step": 142382, "epoch": 3390} {"train_loss": -6.645869255065918, "global_step": 142383, "epoch": 3390} {"train_loss": -6.697751045227051, "global_step": 142384, "epoch": 3390} {"train_loss": -6.779068946838379, "global_step": 142385, "epoch": 3390} {"train_loss": -6.704017639160156, "global_step": 142386, "epoch": 3390} {"train_loss": -6.865972995758057, "global_step": 142387, "epoch": 3390} {"train_loss": -6.7987141609191895, "global_step": 142388, "epoch": 3390} {"train_loss": -6.673644065856934, "global_step": 142389, "epoch": 3390} {"train_loss": -6.792489051818848, "global_step": 142390, "epoch": 3390} {"train_loss": -6.74996280670166, "global_step": 142391, "epoch": 3390} {"train_loss": -6.725844383239746, "global_step": 142392, "epoch": 3390} {"train_loss": -6.801923751831055, "global_step": 142393, "epoch": 3390} {"train_loss": -6.74402379989624, "global_step": 142394, "epoch": 3390} {"train_loss": -6.744014739990234, "global_step": 142395, "epoch": 3390} {"train_loss": -6.7435760498046875, "global_step": 142396, "epoch": 3390} {"train_loss": -6.665040969848633, "global_step": 142397, "epoch": 3390} {"train_loss": -6.772674083709717, "global_step": 142398, "epoch": 3390} {"train_loss": -6.597881317138672, "global_step": 142399, "epoch": 3390} {"train_loss": -6.720341682434082, "global_step": 142400, "epoch": 3390} {"train_loss": -6.756762504577637, "global_step": 142401, "epoch": 3390} {"train_loss": -6.837822914123535, "global_step": 142402, "epoch": 3390} {"train_loss": -6.71343994140625, "global_step": 142403, "epoch": 3390} {"train_loss": -6.828416347503662, "global_step": 142404, "epoch": 3390} {"train_loss": -6.749192237854004, "global_step": 142405, "epoch": 3390} {"train_loss": -6.819612979888916, "global_step": 142406, "epoch": 3390} {"train_loss": -6.550387859344482, "global_step": 142407, "epoch": 3390} {"train_loss": -6.729190826416016, "global_step": 142408, "epoch": 3390} {"train_loss": -6.74570369720459, "global_step": 142409, "epoch": 3390} {"train_loss": -6.656623840332031, "global_step": 142410, "epoch": 3390} {"train_loss": -6.768589019775391, "global_step": 142411, "epoch": 3390} {"train_loss": -6.581504821777344, "global_step": 142412, "epoch": 3390} {"train_loss": -6.740965366363525, "global_step": 142413, "epoch": 3390} {"train_loss": -6.732113361358643, "global_step": 142414, "epoch": 3390} {"train_loss": -6.794058799743652, "global_step": 142415, "epoch": 3390} {"train_loss": -6.695754051208496, "global_step": 142416, "epoch": 3390} {"train_loss": -6.834664821624756, "global_step": 142417, "epoch": 3390} {"train_loss": -6.756949424743652, "global_step": 142418, "epoch": 3390} {"train_loss": -6.800641059875488, "global_step": 142419, "epoch": 3390} {"train_loss": -6.740924835205078, "global_step": 142420, "epoch": 3390} {"train_loss": -6.733414161772955, "global_step": 142421, "epoch": 3390, "val_loss": 68410.7421875} {"train_loss": -6.763332366943359, "global_step": 142422, "epoch": 3391} {"train_loss": -6.709195613861084, "global_step": 142423, "epoch": 3391} {"train_loss": -6.710809707641602, "global_step": 142424, "epoch": 3391} {"train_loss": -6.717992782592773, "global_step": 142425, "epoch": 3391} {"train_loss": -6.756167411804199, "global_step": 142426, "epoch": 3391} {"train_loss": -6.722630023956299, "global_step": 142427, "epoch": 3391} {"train_loss": -6.808287620544434, "global_step": 142428, "epoch": 3391} {"train_loss": -6.808290004730225, "global_step": 142429, "epoch": 3391} {"train_loss": -6.818894386291504, "global_step": 142430, "epoch": 3391} {"train_loss": -6.8032121658325195, "global_step": 142431, "epoch": 3391} {"train_loss": -6.681184768676758, "global_step": 142432, "epoch": 3391} {"train_loss": -6.758155345916748, "global_step": 142433, "epoch": 3391} {"train_loss": -6.8971171379089355, "global_step": 142434, "epoch": 3391} {"train_loss": -6.780832290649414, "global_step": 142435, "epoch": 3391} {"train_loss": -6.754022598266602, "global_step": 142436, "epoch": 3391} {"train_loss": -6.893409252166748, "global_step": 142437, "epoch": 3391} {"train_loss": -6.774007797241211, "global_step": 142438, "epoch": 3391} {"train_loss": -6.8559160232543945, "global_step": 142439, "epoch": 3391} {"train_loss": -6.722879886627197, "global_step": 142440, "epoch": 3391} {"train_loss": -6.83865213394165, "global_step": 142441, "epoch": 3391} {"train_loss": -6.795234680175781, "global_step": 142442, "epoch": 3391} {"train_loss": -6.701343536376953, "global_step": 142443, "epoch": 3391} {"train_loss": -6.623645782470703, "global_step": 142444, "epoch": 3391} {"train_loss": -6.916481971740723, "global_step": 142445, "epoch": 3391} {"train_loss": -6.767568111419678, "global_step": 142446, "epoch": 3391} {"train_loss": -6.816502571105957, "global_step": 142447, "epoch": 3391} {"train_loss": -6.783884048461914, "global_step": 142448, "epoch": 3391} {"train_loss": -6.695652008056641, "global_step": 142449, "epoch": 3391} {"train_loss": -6.8093719482421875, "global_step": 142450, "epoch": 3391} {"train_loss": -6.57987117767334, "global_step": 142451, "epoch": 3391} {"train_loss": -6.740230083465576, "global_step": 142452, "epoch": 3391} {"train_loss": -6.748608589172363, "global_step": 142453, "epoch": 3391} {"train_loss": -6.678497314453125, "global_step": 142454, "epoch": 3391} {"train_loss": -6.58099889755249, "global_step": 142455, "epoch": 3391} {"train_loss": -6.53228759765625, "global_step": 142456, "epoch": 3391} {"train_loss": -6.744912147521973, "global_step": 142457, "epoch": 3391} {"train_loss": -6.718752861022949, "global_step": 142458, "epoch": 3391} {"train_loss": -6.5899658203125, "global_step": 142459, "epoch": 3391} {"train_loss": -6.70026969909668, "global_step": 142460, "epoch": 3391} {"train_loss": -6.690183639526367, "global_step": 142461, "epoch": 3391} {"train_loss": -6.628120422363281, "global_step": 142462, "epoch": 3391} {"train_loss": -6.7398878165653775, "global_step": 142463, "epoch": 3391, "val_loss": 68423.34375} {"train_loss": -6.7515997886657715, "global_step": 142464, "epoch": 3392} {"train_loss": -6.6560564041137695, "global_step": 142465, "epoch": 3392} {"train_loss": -6.762230396270752, "global_step": 142466, "epoch": 3392} {"train_loss": -6.701811790466309, "global_step": 142467, "epoch": 3392} {"train_loss": -6.763062000274658, "global_step": 142468, "epoch": 3392} {"train_loss": -6.655786514282227, "global_step": 142469, "epoch": 3392} {"train_loss": -6.7042622566223145, "global_step": 142470, "epoch": 3392} {"train_loss": -6.66496467590332, "global_step": 142471, "epoch": 3392} {"train_loss": -6.855465888977051, "global_step": 142472, "epoch": 3392} {"train_loss": -6.61759090423584, "global_step": 142473, "epoch": 3392} {"train_loss": -6.673577308654785, "global_step": 142474, "epoch": 3392} {"train_loss": -6.69478702545166, "global_step": 142475, "epoch": 3392} {"train_loss": -6.674948215484619, "global_step": 142476, "epoch": 3392} {"train_loss": -6.8841705322265625, "global_step": 142477, "epoch": 3392} {"train_loss": -6.615601539611816, "global_step": 142478, "epoch": 3392} {"train_loss": -6.768892288208008, "global_step": 142479, "epoch": 3392} {"train_loss": -6.758449554443359, "global_step": 142480, "epoch": 3392} {"train_loss": -6.875637054443359, "global_step": 142481, "epoch": 3392} {"train_loss": -6.704808712005615, "global_step": 142482, "epoch": 3392} {"train_loss": -6.875182151794434, "global_step": 142483, "epoch": 3392} {"train_loss": -6.859224796295166, "global_step": 142484, "epoch": 3392} {"train_loss": -6.766814231872559, "global_step": 142485, "epoch": 3392} {"train_loss": -6.733048915863037, "global_step": 142486, "epoch": 3392} {"train_loss": -6.677814483642578, "global_step": 142487, "epoch": 3392} {"train_loss": -6.824390411376953, "global_step": 142488, "epoch": 3392} {"train_loss": -6.6783037185668945, "global_step": 142489, "epoch": 3392} {"train_loss": -6.736008644104004, "global_step": 142490, "epoch": 3392} {"train_loss": -6.7310895919799805, "global_step": 142491, "epoch": 3392} {"train_loss": -6.747835636138916, "global_step": 142492, "epoch": 3392} {"train_loss": -6.723424911499023, "global_step": 142493, "epoch": 3392} {"train_loss": -6.686720848083496, "global_step": 142494, "epoch": 3392} {"train_loss": -6.674677848815918, "global_step": 142495, "epoch": 3392} {"train_loss": -6.8184075355529785, "global_step": 142496, "epoch": 3392} {"train_loss": -6.704319000244141, "global_step": 142497, "epoch": 3392} {"train_loss": -6.785266876220703, "global_step": 142498, "epoch": 3392} {"train_loss": -6.835188388824463, "global_step": 142499, "epoch": 3392} {"train_loss": -6.786921501159668, "global_step": 142500, "epoch": 3392} {"train_loss": -6.738210678100586, "global_step": 142501, "epoch": 3392} {"train_loss": -6.7223663330078125, "global_step": 142502, "epoch": 3392} {"train_loss": -6.815274715423584, "global_step": 142503, "epoch": 3392} {"train_loss": -6.762233734130859, "global_step": 142504, "epoch": 3392} {"train_loss": -6.744225626900082, "global_step": 142505, "epoch": 3392, "val_loss": 68429.984375} {"train_loss": -6.836160659790039, "global_step": 142506, "epoch": 3393} {"train_loss": -6.805793762207031, "global_step": 142507, "epoch": 3393} {"train_loss": -6.722837448120117, "global_step": 142508, "epoch": 3393} {"train_loss": -6.839900493621826, "global_step": 142509, "epoch": 3393} {"train_loss": -6.700624465942383, "global_step": 142510, "epoch": 3393} {"train_loss": -6.793217182159424, "global_step": 142511, "epoch": 3393} {"train_loss": -6.659893989562988, "global_step": 142512, "epoch": 3393} {"train_loss": -6.6091203689575195, "global_step": 142513, "epoch": 3393} {"train_loss": -6.724276542663574, "global_step": 142514, "epoch": 3393} {"train_loss": -6.698241233825684, "global_step": 142515, "epoch": 3393} {"train_loss": -6.645009994506836, "global_step": 142516, "epoch": 3393} {"train_loss": -6.727919578552246, "global_step": 142517, "epoch": 3393} {"train_loss": -6.627816200256348, "global_step": 142518, "epoch": 3393} {"train_loss": -6.716804504394531, "global_step": 142519, "epoch": 3393} {"train_loss": -6.608830451965332, "global_step": 142520, "epoch": 3393} {"train_loss": -6.719757080078125, "global_step": 142521, "epoch": 3393} {"train_loss": -6.742815017700195, "global_step": 142522, "epoch": 3393} {"train_loss": -6.680440902709961, "global_step": 142523, "epoch": 3393} {"train_loss": -6.811930179595947, "global_step": 142524, "epoch": 3393} {"train_loss": -6.724792957305908, "global_step": 142525, "epoch": 3393} {"train_loss": -6.776642799377441, "global_step": 142526, "epoch": 3393} {"train_loss": -6.748726844787598, "global_step": 142527, "epoch": 3393} {"train_loss": -6.760596752166748, "global_step": 142528, "epoch": 3393} {"train_loss": -6.75749397277832, "global_step": 142529, "epoch": 3393} {"train_loss": -6.694629192352295, "global_step": 142530, "epoch": 3393} {"train_loss": -6.81369161605835, "global_step": 142531, "epoch": 3393} {"train_loss": -6.677350997924805, "global_step": 142532, "epoch": 3393} {"train_loss": -6.585413932800293, "global_step": 142533, "epoch": 3393} {"train_loss": -6.7310051918029785, "global_step": 142534, "epoch": 3393} {"train_loss": -6.746046543121338, "global_step": 142535, "epoch": 3393} {"train_loss": -6.723941802978516, "global_step": 142536, "epoch": 3393} {"train_loss": -6.848371505737305, "global_step": 142537, "epoch": 3393} {"train_loss": -6.639315605163574, "global_step": 142538, "epoch": 3393} {"train_loss": -6.714605331420898, "global_step": 142539, "epoch": 3393} {"train_loss": -6.742379188537598, "global_step": 142540, "epoch": 3393} {"train_loss": -6.709328651428223, "global_step": 142541, "epoch": 3393} {"train_loss": -6.728646278381348, "global_step": 142542, "epoch": 3393} {"train_loss": -6.79283332824707, "global_step": 142543, "epoch": 3393} {"train_loss": -6.667291164398193, "global_step": 142544, "epoch": 3393} {"train_loss": -6.808349609375, "global_step": 142545, "epoch": 3393} {"train_loss": -6.8350019454956055, "global_step": 142546, "epoch": 3393} {"train_loss": -6.732453141893659, "global_step": 142547, "epoch": 3393, "val_loss": 68313.2109375} {"train_loss": -6.799675941467285, "global_step": 142548, "epoch": 3394} {"train_loss": -6.828683376312256, "global_step": 142549, "epoch": 3394} {"train_loss": -6.7781877517700195, "global_step": 142550, "epoch": 3394} {"train_loss": -6.742285251617432, "global_step": 142551, "epoch": 3394} {"train_loss": -6.745414733886719, "global_step": 142552, "epoch": 3394} {"train_loss": -6.851168632507324, "global_step": 142553, "epoch": 3394} {"train_loss": -6.790860652923584, "global_step": 142554, "epoch": 3394} {"train_loss": -6.830617904663086, "global_step": 142555, "epoch": 3394} {"train_loss": -6.677635192871094, "global_step": 142556, "epoch": 3394} {"train_loss": -6.821930408477783, "global_step": 142557, "epoch": 3394} {"train_loss": -6.751721382141113, "global_step": 142558, "epoch": 3394} {"train_loss": -6.681567668914795, "global_step": 142559, "epoch": 3394} {"train_loss": -6.7213335037231445, "global_step": 142560, "epoch": 3394} {"train_loss": -6.732330322265625, "global_step": 142561, "epoch": 3394} {"train_loss": -6.712680816650391, "global_step": 142562, "epoch": 3394} {"train_loss": -6.642570495605469, "global_step": 142563, "epoch": 3394} {"train_loss": -6.6904096603393555, "global_step": 142564, "epoch": 3394} {"train_loss": -6.758490562438965, "global_step": 142565, "epoch": 3394} {"train_loss": -6.637890815734863, "global_step": 142566, "epoch": 3394} {"train_loss": -6.634373664855957, "global_step": 142567, "epoch": 3394} {"train_loss": -6.681182861328125, "global_step": 142568, "epoch": 3394} {"train_loss": -6.698060989379883, "global_step": 142569, "epoch": 3394} {"train_loss": -6.749595642089844, "global_step": 142570, "epoch": 3394} {"train_loss": -6.671173572540283, "global_step": 142571, "epoch": 3394} {"train_loss": -6.739645004272461, "global_step": 142572, "epoch": 3394} {"train_loss": -6.755794048309326, "global_step": 142573, "epoch": 3394} {"train_loss": -6.624370098114014, "global_step": 142574, "epoch": 3394} {"train_loss": -6.717947959899902, "global_step": 142575, "epoch": 3394} {"train_loss": -6.814735412597656, "global_step": 142576, "epoch": 3394} {"train_loss": -6.6256422996521, "global_step": 142577, "epoch": 3394} {"train_loss": -6.776534557342529, "global_step": 142578, "epoch": 3394} {"train_loss": -6.745574951171875, "global_step": 142579, "epoch": 3394} {"train_loss": -6.650825023651123, "global_step": 142580, "epoch": 3394} {"train_loss": -6.720481872558594, "global_step": 142581, "epoch": 3394} {"train_loss": -6.753256797790527, "global_step": 142582, "epoch": 3394} {"train_loss": -6.730716705322266, "global_step": 142583, "epoch": 3394} {"train_loss": -6.75588846206665, "global_step": 142584, "epoch": 3394} {"train_loss": -6.729585647583008, "global_step": 142585, "epoch": 3394} {"train_loss": -6.744777202606201, "global_step": 142586, "epoch": 3394} {"train_loss": -6.735411167144775, "global_step": 142587, "epoch": 3394} {"train_loss": -6.693361282348633, "global_step": 142588, "epoch": 3394} {"train_loss": -6.732526654288883, "global_step": 142589, "epoch": 3394, "val_loss": 68499.1484375} {"train_loss": -6.749629020690918, "global_step": 142590, "epoch": 3395} {"train_loss": -6.627378463745117, "global_step": 142591, "epoch": 3395} {"train_loss": -6.763949394226074, "global_step": 142592, "epoch": 3395} {"train_loss": -6.687600612640381, "global_step": 142593, "epoch": 3395} {"train_loss": -6.703266143798828, "global_step": 142594, "epoch": 3395} {"train_loss": -6.656223297119141, "global_step": 142595, "epoch": 3395} {"train_loss": -6.683520317077637, "global_step": 142596, "epoch": 3395} {"train_loss": -6.820762634277344, "global_step": 142597, "epoch": 3395} {"train_loss": -6.731818199157715, "global_step": 142598, "epoch": 3395} {"train_loss": -6.730743885040283, "global_step": 142599, "epoch": 3395} {"train_loss": -6.617651462554932, "global_step": 142600, "epoch": 3395} {"train_loss": -6.717884063720703, "global_step": 142601, "epoch": 3395} {"train_loss": -6.687325954437256, "global_step": 142602, "epoch": 3395} {"train_loss": -6.567312240600586, "global_step": 142603, "epoch": 3395} {"train_loss": -6.675577163696289, "global_step": 142604, "epoch": 3395} {"train_loss": -6.6890869140625, "global_step": 142605, "epoch": 3395} {"train_loss": -6.637139320373535, "global_step": 142606, "epoch": 3395} {"train_loss": -6.680028915405273, "global_step": 142607, "epoch": 3395} {"train_loss": -6.643274307250977, "global_step": 142608, "epoch": 3395} {"train_loss": -6.726759910583496, "global_step": 142609, "epoch": 3395} {"train_loss": -6.457907676696777, "global_step": 142610, "epoch": 3395} {"train_loss": -6.654777526855469, "global_step": 142611, "epoch": 3395} {"train_loss": -6.661635398864746, "global_step": 142612, "epoch": 3395} {"train_loss": -6.6657867431640625, "global_step": 142613, "epoch": 3395} {"train_loss": -6.616714954376221, "global_step": 142614, "epoch": 3395} {"train_loss": -6.512112617492676, "global_step": 142615, "epoch": 3395} {"train_loss": -6.625399589538574, "global_step": 142616, "epoch": 3395} {"train_loss": -6.492814064025879, "global_step": 142617, "epoch": 3395} {"train_loss": -6.745298862457275, "global_step": 142618, "epoch": 3395} {"train_loss": -6.537473678588867, "global_step": 142619, "epoch": 3395} {"train_loss": -6.614086151123047, "global_step": 142620, "epoch": 3395} {"train_loss": -6.627511024475098, "global_step": 142621, "epoch": 3395} {"train_loss": -6.5342302322387695, "global_step": 142622, "epoch": 3395} {"train_loss": -6.694931983947754, "global_step": 142623, "epoch": 3395} {"train_loss": -6.6111931800842285, "global_step": 142624, "epoch": 3395} {"train_loss": -6.684962272644043, "global_step": 142625, "epoch": 3395} {"train_loss": -6.619548797607422, "global_step": 142626, "epoch": 3395} {"train_loss": -6.68611478805542, "global_step": 142627, "epoch": 3395} {"train_loss": -6.573054790496826, "global_step": 142628, "epoch": 3395} {"train_loss": -6.680675506591797, "global_step": 142629, "epoch": 3395} {"train_loss": -6.644738674163818, "global_step": 142630, "epoch": 3395} {"train_loss": -6.655033145632062, "global_step": 142631, "epoch": 3395, "val_loss": 68334.2578125} {"train_loss": -6.562617778778076, "global_step": 142632, "epoch": 3396} {"train_loss": -6.557195663452148, "global_step": 142633, "epoch": 3396} {"train_loss": -6.772993564605713, "global_step": 142634, "epoch": 3396} {"train_loss": -6.72210168838501, "global_step": 142635, "epoch": 3396} {"train_loss": -6.788134574890137, "global_step": 142636, "epoch": 3396} {"train_loss": -6.603854179382324, "global_step": 142637, "epoch": 3396} {"train_loss": -6.840985298156738, "global_step": 142638, "epoch": 3396} {"train_loss": -6.809906959533691, "global_step": 142639, "epoch": 3396} {"train_loss": -6.727065086364746, "global_step": 142640, "epoch": 3396} {"train_loss": -6.79417610168457, "global_step": 142641, "epoch": 3396} {"train_loss": -6.6703314781188965, "global_step": 142642, "epoch": 3396} {"train_loss": -6.617964744567871, "global_step": 142643, "epoch": 3396} {"train_loss": -6.6117730140686035, "global_step": 142644, "epoch": 3396} {"train_loss": -6.758706092834473, "global_step": 142645, "epoch": 3396} {"train_loss": -6.860209941864014, "global_step": 142646, "epoch": 3396} {"train_loss": -6.6777448654174805, "global_step": 142647, "epoch": 3396} {"train_loss": -6.492107391357422, "global_step": 142648, "epoch": 3396} {"train_loss": -6.728711128234863, "global_step": 142649, "epoch": 3396} {"train_loss": -6.745006561279297, "global_step": 142650, "epoch": 3396} {"train_loss": -6.840762615203857, "global_step": 142651, "epoch": 3396} {"train_loss": -6.82949686050415, "global_step": 142652, "epoch": 3396} {"train_loss": -6.812405586242676, "global_step": 142653, "epoch": 3396} {"train_loss": -6.824071884155273, "global_step": 142654, "epoch": 3396} {"train_loss": -6.786669731140137, "global_step": 142655, "epoch": 3396} {"train_loss": -6.850612640380859, "global_step": 142656, "epoch": 3396} {"train_loss": -6.830383777618408, "global_step": 142657, "epoch": 3396} {"train_loss": -6.69113302230835, "global_step": 142658, "epoch": 3396} {"train_loss": -6.778485298156738, "global_step": 142659, "epoch": 3396} {"train_loss": -6.8445048332214355, "global_step": 142660, "epoch": 3396} {"train_loss": -6.7066240310668945, "global_step": 142661, "epoch": 3396} {"train_loss": -6.753244876861572, "global_step": 142662, "epoch": 3396} {"train_loss": -6.80931282043457, "global_step": 142663, "epoch": 3396} {"train_loss": -6.793940544128418, "global_step": 142664, "epoch": 3396} {"train_loss": -6.707710266113281, "global_step": 142665, "epoch": 3396} {"train_loss": -6.713984489440918, "global_step": 142666, "epoch": 3396} {"train_loss": -6.844667434692383, "global_step": 142667, "epoch": 3396} {"train_loss": -6.721364974975586, "global_step": 142668, "epoch": 3396} {"train_loss": -6.639373302459717, "global_step": 142669, "epoch": 3396} {"train_loss": -6.7186431884765625, "global_step": 142670, "epoch": 3396} {"train_loss": -6.767959117889404, "global_step": 142671, "epoch": 3396} {"train_loss": -6.730626106262207, "global_step": 142672, "epoch": 3396} {"train_loss": -6.739222185952323, "global_step": 142673, "epoch": 3396, "val_loss": 68448.53125} {"train_loss": -6.697197437286377, "global_step": 142674, "epoch": 3397} {"train_loss": -6.908557891845703, "global_step": 142675, "epoch": 3397} {"train_loss": -6.688359260559082, "global_step": 142676, "epoch": 3397} {"train_loss": -6.834376811981201, "global_step": 142677, "epoch": 3397} {"train_loss": -6.775320053100586, "global_step": 142678, "epoch": 3397} {"train_loss": -6.730944633483887, "global_step": 142679, "epoch": 3397} {"train_loss": -6.759500026702881, "global_step": 142680, "epoch": 3397} {"train_loss": -6.624801158905029, "global_step": 142681, "epoch": 3397} {"train_loss": -6.629481792449951, "global_step": 142682, "epoch": 3397} {"train_loss": -6.59356164932251, "global_step": 142683, "epoch": 3397} {"train_loss": -6.590497016906738, "global_step": 142684, "epoch": 3397} {"train_loss": -6.647037029266357, "global_step": 142685, "epoch": 3397} {"train_loss": -6.718697547912598, "global_step": 142686, "epoch": 3397} {"train_loss": -6.673793792724609, "global_step": 142687, "epoch": 3397} {"train_loss": -6.753236770629883, "global_step": 142688, "epoch": 3397} {"train_loss": -6.679771423339844, "global_step": 142689, "epoch": 3397} {"train_loss": -6.742286682128906, "global_step": 142690, "epoch": 3397} {"train_loss": -6.598209381103516, "global_step": 142691, "epoch": 3397} {"train_loss": -6.73675537109375, "global_step": 142692, "epoch": 3397} {"train_loss": -6.592960834503174, "global_step": 142693, "epoch": 3397} {"train_loss": -6.757979393005371, "global_step": 142694, "epoch": 3397} {"train_loss": -6.6841583251953125, "global_step": 142695, "epoch": 3397} {"train_loss": -6.762892723083496, "global_step": 142696, "epoch": 3397} {"train_loss": -6.70090389251709, "global_step": 142697, "epoch": 3397} {"train_loss": -6.66401481628418, "global_step": 142698, "epoch": 3397} {"train_loss": -6.737828254699707, "global_step": 142699, "epoch": 3397} {"train_loss": -6.733880996704102, "global_step": 142700, "epoch": 3397} {"train_loss": -6.786128997802734, "global_step": 142701, "epoch": 3397} {"train_loss": -6.775487899780273, "global_step": 142702, "epoch": 3397} {"train_loss": -6.792547225952148, "global_step": 142703, "epoch": 3397} {"train_loss": -6.767911911010742, "global_step": 142704, "epoch": 3397} {"train_loss": -6.833075523376465, "global_step": 142705, "epoch": 3397} {"train_loss": -6.888336181640625, "global_step": 142706, "epoch": 3397} {"train_loss": -6.777308940887451, "global_step": 142707, "epoch": 3397} {"train_loss": -6.7820634841918945, "global_step": 142708, "epoch": 3397} {"train_loss": -6.771958827972412, "global_step": 142709, "epoch": 3397} {"train_loss": -6.777224540710449, "global_step": 142710, "epoch": 3397} {"train_loss": -6.777750492095947, "global_step": 142711, "epoch": 3397} {"train_loss": -6.741694450378418, "global_step": 142712, "epoch": 3397} {"train_loss": -6.78411865234375, "global_step": 142713, "epoch": 3397} {"train_loss": -6.7251129150390625, "global_step": 142714, "epoch": 3397} {"train_loss": -6.73224477540879, "global_step": 142715, "epoch": 3397, "val_loss": 68345.5390625} {"train_loss": -6.751969337463379, "global_step": 142716, "epoch": 3398} {"train_loss": -6.845709323883057, "global_step": 142717, "epoch": 3398} {"train_loss": -6.665665626525879, "global_step": 142718, "epoch": 3398} {"train_loss": -6.732869625091553, "global_step": 142719, "epoch": 3398} {"train_loss": -6.834981441497803, "global_step": 142720, "epoch": 3398} {"train_loss": -6.773207664489746, "global_step": 142721, "epoch": 3398} {"train_loss": -6.757145881652832, "global_step": 142722, "epoch": 3398} {"train_loss": -6.803016185760498, "global_step": 142723, "epoch": 3398} {"train_loss": -6.774257183074951, "global_step": 142724, "epoch": 3398} {"train_loss": -6.73002290725708, "global_step": 142725, "epoch": 3398} {"train_loss": -6.831165790557861, "global_step": 142726, "epoch": 3398} {"train_loss": -6.653370380401611, "global_step": 142727, "epoch": 3398} {"train_loss": -6.7847065925598145, "global_step": 142728, "epoch": 3398} {"train_loss": -6.759255886077881, "global_step": 142729, "epoch": 3398} {"train_loss": -6.6906609535217285, "global_step": 142730, "epoch": 3398} {"train_loss": -6.653782367706299, "global_step": 142731, "epoch": 3398} {"train_loss": -6.81654167175293, "global_step": 142732, "epoch": 3398} {"train_loss": -6.836477279663086, "global_step": 142733, "epoch": 3398} {"train_loss": -6.765659809112549, "global_step": 142734, "epoch": 3398} {"train_loss": -6.656081199645996, "global_step": 142735, "epoch": 3398} {"train_loss": -6.724686145782471, "global_step": 142736, "epoch": 3398} {"train_loss": -6.591818809509277, "global_step": 142737, "epoch": 3398} {"train_loss": -6.8292436599731445, "global_step": 142738, "epoch": 3398} {"train_loss": -6.700571060180664, "global_step": 142739, "epoch": 3398} {"train_loss": -6.750107765197754, "global_step": 142740, "epoch": 3398} {"train_loss": -6.911753177642822, "global_step": 142741, "epoch": 3398} {"train_loss": -6.812741279602051, "global_step": 142742, "epoch": 3398} {"train_loss": -6.862217903137207, "global_step": 142743, "epoch": 3398} {"train_loss": -6.7174787521362305, "global_step": 142744, "epoch": 3398} {"train_loss": -6.76149320602417, "global_step": 142745, "epoch": 3398} {"train_loss": -6.7572126388549805, "global_step": 142746, "epoch": 3398} {"train_loss": -6.785397529602051, "global_step": 142747, "epoch": 3398} {"train_loss": -6.809168815612793, "global_step": 142748, "epoch": 3398} {"train_loss": -6.750204563140869, "global_step": 142749, "epoch": 3398} {"train_loss": -6.700432777404785, "global_step": 142750, "epoch": 3398} {"train_loss": -6.848091125488281, "global_step": 142751, "epoch": 3398} {"train_loss": -6.709253311157227, "global_step": 142752, "epoch": 3398} {"train_loss": -6.868885040283203, "global_step": 142753, "epoch": 3398} {"train_loss": -6.801761627197266, "global_step": 142754, "epoch": 3398} {"train_loss": -6.801884651184082, "global_step": 142755, "epoch": 3398} {"train_loss": -6.656044006347656, "global_step": 142756, "epoch": 3398} {"train_loss": -6.7619720186506, "global_step": 142757, "epoch": 3398, "val_loss": 68297.890625} {"train_loss": -6.625101089477539, "global_step": 142758, "epoch": 3399} {"train_loss": -6.849423408508301, "global_step": 142759, "epoch": 3399} {"train_loss": -6.78989315032959, "global_step": 142760, "epoch": 3399} {"train_loss": -6.67775821685791, "global_step": 142761, "epoch": 3399} {"train_loss": -6.874709606170654, "global_step": 142762, "epoch": 3399} {"train_loss": -6.734841823577881, "global_step": 142763, "epoch": 3399} {"train_loss": -6.82820987701416, "global_step": 142764, "epoch": 3399} {"train_loss": -6.795492172241211, "global_step": 142765, "epoch": 3399} {"train_loss": -6.910301208496094, "global_step": 142766, "epoch": 3399} {"train_loss": -6.805860996246338, "global_step": 142767, "epoch": 3399} {"train_loss": -6.783466339111328, "global_step": 142768, "epoch": 3399} {"train_loss": -6.840828895568848, "global_step": 142769, "epoch": 3399} {"train_loss": -6.8368449211120605, "global_step": 142770, "epoch": 3399} {"train_loss": -6.881956577301025, "global_step": 142771, "epoch": 3399} {"train_loss": -6.83170223236084, "global_step": 142772, "epoch": 3399} {"train_loss": -6.794126033782959, "global_step": 142773, "epoch": 3399} {"train_loss": -6.712995529174805, "global_step": 142774, "epoch": 3399} {"train_loss": -6.858136177062988, "global_step": 142775, "epoch": 3399} {"train_loss": -6.749508857727051, "global_step": 142776, "epoch": 3399} {"train_loss": -6.704353332519531, "global_step": 142777, "epoch": 3399} {"train_loss": -6.750035285949707, "global_step": 142778, "epoch": 3399} {"train_loss": -6.79948091506958, "global_step": 142779, "epoch": 3399} {"train_loss": -6.848380088806152, "global_step": 142780, "epoch": 3399} {"train_loss": -6.7277679443359375, "global_step": 142781, "epoch": 3399} {"train_loss": -6.735418319702148, "global_step": 142782, "epoch": 3399} {"train_loss": -6.788397789001465, "global_step": 142783, "epoch": 3399} {"train_loss": -6.836306095123291, "global_step": 142784, "epoch": 3399} {"train_loss": -6.7580366134643555, "global_step": 142785, "epoch": 3399} {"train_loss": -6.800374984741211, "global_step": 142786, "epoch": 3399} {"train_loss": -6.806456565856934, "global_step": 142787, "epoch": 3399} {"train_loss": -6.795191287994385, "global_step": 142788, "epoch": 3399} {"train_loss": -6.881888389587402, "global_step": 142789, "epoch": 3399} {"train_loss": -6.7389326095581055, "global_step": 142790, "epoch": 3399} {"train_loss": -6.829399585723877, "global_step": 142791, "epoch": 3399} {"train_loss": -6.813658237457275, "global_step": 142792, "epoch": 3399} {"train_loss": -6.926176071166992, "global_step": 142793, "epoch": 3399} {"train_loss": -6.895373344421387, "global_step": 142794, "epoch": 3399} {"train_loss": -6.824593544006348, "global_step": 142795, "epoch": 3399} {"train_loss": -6.891963481903076, "global_step": 142796, "epoch": 3399} {"train_loss": -6.866147994995117, "global_step": 142797, "epoch": 3399} {"train_loss": -6.787110328674316, "global_step": 142798, "epoch": 3399} {"train_loss": -6.802179109482538, "global_step": 142799, "epoch": 3399, "val_loss": 68340.421875} {"train_loss": -6.7475972175598145, "global_step": 142800, "epoch": 3400} {"train_loss": -6.859636306762695, "global_step": 142801, "epoch": 3400} {"train_loss": -6.742800235748291, "global_step": 142802, "epoch": 3400} {"train_loss": -6.631643295288086, "global_step": 142803, "epoch": 3400} {"train_loss": -6.709629058837891, "global_step": 142804, "epoch": 3400} {"train_loss": -6.674657821655273, "global_step": 142805, "epoch": 3400} {"train_loss": -6.651937007904053, "global_step": 142806, "epoch": 3400} {"train_loss": -6.671736717224121, "global_step": 142807, "epoch": 3400} {"train_loss": -6.659808158874512, "global_step": 142808, "epoch": 3400} {"train_loss": -6.716353416442871, "global_step": 142809, "epoch": 3400} {"train_loss": -6.779912948608398, "global_step": 142810, "epoch": 3400} {"train_loss": -6.556042671203613, "global_step": 142811, "epoch": 3400} {"train_loss": -6.675098896026611, "global_step": 142812, "epoch": 3400} {"train_loss": -6.706755638122559, "global_step": 142813, "epoch": 3400} {"train_loss": -6.688891410827637, "global_step": 142814, "epoch": 3400} {"train_loss": -6.588417053222656, "global_step": 142815, "epoch": 3400} {"train_loss": -6.607761383056641, "global_step": 142816, "epoch": 3400} {"train_loss": -6.717370510101318, "global_step": 142817, "epoch": 3400} {"train_loss": -6.617926120758057, "global_step": 142818, "epoch": 3400} {"train_loss": -6.6908979415893555, "global_step": 142819, "epoch": 3400} {"train_loss": -6.736005783081055, "global_step": 142820, "epoch": 3400} {"train_loss": -6.646061420440674, "global_step": 142821, "epoch": 3400} {"train_loss": -6.730696678161621, "global_step": 142822, "epoch": 3400} {"train_loss": -6.73982572555542, "global_step": 142823, "epoch": 3400} {"train_loss": -6.714784145355225, "global_step": 142824, "epoch": 3400} {"train_loss": -6.695156574249268, "global_step": 142825, "epoch": 3400} {"train_loss": -6.7336883544921875, "global_step": 142826, "epoch": 3400} {"train_loss": -6.738186836242676, "global_step": 142827, "epoch": 3400} {"train_loss": -6.719873428344727, "global_step": 142828, "epoch": 3400} {"train_loss": -6.782054901123047, "global_step": 142829, "epoch": 3400} {"train_loss": -6.680584907531738, "global_step": 142830, "epoch": 3400} {"train_loss": -6.705048561096191, "global_step": 142831, "epoch": 3400} {"train_loss": -6.572336196899414, "global_step": 142832, "epoch": 3400} {"train_loss": -6.741374492645264, "global_step": 142833, "epoch": 3400} {"train_loss": -6.699867248535156, "global_step": 142834, "epoch": 3400} {"train_loss": -6.685596466064453, "global_step": 142835, "epoch": 3400} {"train_loss": -6.647416591644287, "global_step": 142836, "epoch": 3400} {"train_loss": -6.717085361480713, "global_step": 142837, "epoch": 3400} {"train_loss": -6.822851181030273, "global_step": 142838, "epoch": 3400} {"train_loss": -6.642911434173584, "global_step": 142839, "epoch": 3400} {"train_loss": -6.708797454833984, "global_step": 142840, "epoch": 3400} {"train_loss": -6.696263971782866, "global_step": 142841, "epoch": 3400, "train/sim_max_reward_0": 0.2297030353333489, "train/sim_max_reward_1": 0.8830319610072829, "train/sim_max_reward_2": 0.9443073033473282, "train/sim_max_reward_3": 0.145606489130597, "train/sim_max_reward_4": 0.9759495187979118, "train/sim_max_reward_5": 0.9338950422461101, "test/sim_max_reward_4400000": 0.23511099316841919, "test/sim_max_reward_4400001": 0.9117769670942761, "test/sim_max_reward_4400002": 0.9377048415426761, "test/sim_max_reward_4400003": 0.8575863998870421, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.8320127973578257, "test/sim_max_reward_4400006": 0.9485285007349246, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30598765432324165, "test/sim_max_reward_4400009": 0.87155809195563, "test/sim_max_reward_4400010": 0.20280800067282584, "test/sim_max_reward_4400011": 0.1028196415934442, "test/sim_max_reward_4400012": 0.8212965244057758, "test/sim_max_reward_4400013": 0.9246753496655832, "test/sim_max_reward_4400014": 0.9058505561053481, "test/sim_max_reward_4400015": 0.06162064860028479, "test/sim_max_reward_4400016": 0.04696137266702151, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2652665283778357, "test/sim_max_reward_4400019": 0.24559352465552084, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.224713139785731, "test/sim_max_reward_4400023": 0.9180197121527064, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.23707622015013005, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.9420767471914357, "test/sim_max_reward_4400029": 0.8025752959547007, "test/sim_max_reward_4400030": 0.9146764878942149, "test/sim_max_reward_4400031": 0.9748908262544236, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7231483087656917, "test/sim_max_reward_4400034": 0.9542261765287409, "test/sim_max_reward_4400035": 0.8380465516096317, "test/sim_max_reward_4400036": 0.6047091238592504, "test/sim_max_reward_4400037": 0.9866429078597742, "test/sim_max_reward_4400038": 0.9854958582046655, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8886372074155708, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.9344379325749383, "test/sim_max_reward_4400044": 0.9487566845508876, "test/sim_max_reward_4400045": 0.9459279935811955, "test/sim_max_reward_4400046": 0.9131717519011201, "test/sim_max_reward_4400047": 0.9781605157380329, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8295581742628939, "train/mean_score": 0.6854155583104298, "test/mean_score": 0.5518770582369055, "val_loss": 68557.109375} {"train_loss": -6.715464115142822, "global_step": 142842, "epoch": 3401} {"train_loss": -6.801294326782227, "global_step": 142843, "epoch": 3401} {"train_loss": -6.576274394989014, "global_step": 142844, "epoch": 3401} {"train_loss": -6.6762590408325195, "global_step": 142845, "epoch": 3401} {"train_loss": -6.6568803787231445, "global_step": 142846, "epoch": 3401} {"train_loss": -6.621312141418457, "global_step": 142847, "epoch": 3401} {"train_loss": -6.738715648651123, "global_step": 142848, "epoch": 3401} {"train_loss": -6.776668548583984, "global_step": 142849, "epoch": 3401} {"train_loss": -6.754488945007324, "global_step": 142850, "epoch": 3401} {"train_loss": -6.699843406677246, "global_step": 142851, "epoch": 3401} {"train_loss": -6.739299774169922, "global_step": 142852, "epoch": 3401} {"train_loss": -6.893883228302002, "global_step": 142853, "epoch": 3401} {"train_loss": -6.591238021850586, "global_step": 142854, "epoch": 3401} {"train_loss": -6.7098236083984375, "global_step": 142855, "epoch": 3401} {"train_loss": -6.665069103240967, "global_step": 142856, "epoch": 3401} {"train_loss": -6.731371879577637, "global_step": 142857, "epoch": 3401} {"train_loss": -6.8085784912109375, "global_step": 142858, "epoch": 3401} {"train_loss": -6.618983268737793, "global_step": 142859, "epoch": 3401} {"train_loss": -6.718430995941162, "global_step": 142860, "epoch": 3401} {"train_loss": -6.61297607421875, "global_step": 142861, "epoch": 3401} {"train_loss": -6.680181503295898, "global_step": 142862, "epoch": 3401} {"train_loss": -6.760717391967773, "global_step": 142863, "epoch": 3401} {"train_loss": -6.59679651260376, "global_step": 142864, "epoch": 3401} {"train_loss": -6.627365589141846, "global_step": 142865, "epoch": 3401} {"train_loss": -6.768004894256592, "global_step": 142866, "epoch": 3401} {"train_loss": -6.644278526306152, "global_step": 142867, "epoch": 3401} {"train_loss": -6.719043731689453, "global_step": 142868, "epoch": 3401} {"train_loss": -6.613431930541992, "global_step": 142869, "epoch": 3401} {"train_loss": -6.616368770599365, "global_step": 142870, "epoch": 3401} {"train_loss": -6.747072696685791, "global_step": 142871, "epoch": 3401} {"train_loss": -6.638260841369629, "global_step": 142872, "epoch": 3401} {"train_loss": -6.742812156677246, "global_step": 142873, "epoch": 3401} {"train_loss": -6.726435661315918, "global_step": 142874, "epoch": 3401} {"train_loss": -6.724143028259277, "global_step": 142875, "epoch": 3401} {"train_loss": -6.788061141967773, "global_step": 142876, "epoch": 3401} {"train_loss": -6.747786521911621, "global_step": 142877, "epoch": 3401} {"train_loss": -6.670095443725586, "global_step": 142878, "epoch": 3401} {"train_loss": -6.7382049560546875, "global_step": 142879, "epoch": 3401} {"train_loss": -6.751137733459473, "global_step": 142880, "epoch": 3401} {"train_loss": -6.829824447631836, "global_step": 142881, "epoch": 3401} {"train_loss": -6.842296123504639, "global_step": 142882, "epoch": 3401} {"train_loss": -6.709565946034023, "global_step": 142883, "epoch": 3401, "val_loss": 68346.6640625} {"train_loss": -6.773516654968262, "global_step": 142884, "epoch": 3402} {"train_loss": -6.7987236976623535, "global_step": 142885, "epoch": 3402} {"train_loss": -6.907959938049316, "global_step": 142886, "epoch": 3402} {"train_loss": -6.913675308227539, "global_step": 142887, "epoch": 3402} {"train_loss": -6.830135822296143, "global_step": 142888, "epoch": 3402} {"train_loss": -6.807494163513184, "global_step": 142889, "epoch": 3402} {"train_loss": -6.793601989746094, "global_step": 142890, "epoch": 3402} {"train_loss": -6.8711090087890625, "global_step": 142891, "epoch": 3402} {"train_loss": -6.808838844299316, "global_step": 142892, "epoch": 3402} {"train_loss": -6.731807708740234, "global_step": 142893, "epoch": 3402} {"train_loss": -6.843405723571777, "global_step": 142894, "epoch": 3402} {"train_loss": -6.779819488525391, "global_step": 142895, "epoch": 3402} {"train_loss": -6.878382682800293, "global_step": 142896, "epoch": 3402} {"train_loss": -6.750617027282715, "global_step": 142897, "epoch": 3402} {"train_loss": -6.699987411499023, "global_step": 142898, "epoch": 3402} {"train_loss": -6.796114921569824, "global_step": 142899, "epoch": 3402} {"train_loss": -6.7437286376953125, "global_step": 142900, "epoch": 3402} {"train_loss": -6.827847480773926, "global_step": 142901, "epoch": 3402} {"train_loss": -6.700667381286621, "global_step": 142902, "epoch": 3402} {"train_loss": -6.763412952423096, "global_step": 142903, "epoch": 3402} {"train_loss": -6.707332611083984, "global_step": 142904, "epoch": 3402} {"train_loss": -6.612067222595215, "global_step": 142905, "epoch": 3402} {"train_loss": -6.727119445800781, "global_step": 142906, "epoch": 3402} {"train_loss": -6.7024688720703125, "global_step": 142907, "epoch": 3402} {"train_loss": -6.672615051269531, "global_step": 142908, "epoch": 3402} {"train_loss": -6.644946098327637, "global_step": 142909, "epoch": 3402} {"train_loss": -6.676482200622559, "global_step": 142910, "epoch": 3402} {"train_loss": -6.648324012756348, "global_step": 142911, "epoch": 3402} {"train_loss": -6.674358367919922, "global_step": 142912, "epoch": 3402} {"train_loss": -6.621854782104492, "global_step": 142913, "epoch": 3402} {"train_loss": -6.715225696563721, "global_step": 142914, "epoch": 3402} {"train_loss": -6.684232711791992, "global_step": 142915, "epoch": 3402} {"train_loss": -6.732390403747559, "global_step": 142916, "epoch": 3402} {"train_loss": -6.649857044219971, "global_step": 142917, "epoch": 3402} {"train_loss": -6.55567741394043, "global_step": 142918, "epoch": 3402} {"train_loss": -6.792254447937012, "global_step": 142919, "epoch": 3402} {"train_loss": -6.679835319519043, "global_step": 142920, "epoch": 3402} {"train_loss": -6.6925458908081055, "global_step": 142921, "epoch": 3402} {"train_loss": -6.714877605438232, "global_step": 142922, "epoch": 3402} {"train_loss": -6.693462371826172, "global_step": 142923, "epoch": 3402} {"train_loss": -6.791444778442383, "global_step": 142924, "epoch": 3402} {"train_loss": -6.74323110353379, "global_step": 142925, "epoch": 3402, "val_loss": 68505.5} {"train_loss": -6.74123477935791, "global_step": 142926, "epoch": 3403} {"train_loss": -6.755270004272461, "global_step": 142927, "epoch": 3403} {"train_loss": -6.820533752441406, "global_step": 142928, "epoch": 3403} {"train_loss": -6.770693778991699, "global_step": 142929, "epoch": 3403} {"train_loss": -6.731393814086914, "global_step": 142930, "epoch": 3403} {"train_loss": -6.671563625335693, "global_step": 142931, "epoch": 3403} {"train_loss": -6.775561332702637, "global_step": 142932, "epoch": 3403} {"train_loss": -6.819292068481445, "global_step": 142933, "epoch": 3403} {"train_loss": -6.847132682800293, "global_step": 142934, "epoch": 3403} {"train_loss": -6.887598037719727, "global_step": 142935, "epoch": 3403} {"train_loss": -6.736546993255615, "global_step": 142936, "epoch": 3403} {"train_loss": -6.846296310424805, "global_step": 142937, "epoch": 3403} {"train_loss": -6.77802848815918, "global_step": 142938, "epoch": 3403} {"train_loss": -6.803413391113281, "global_step": 142939, "epoch": 3403} {"train_loss": -6.724225044250488, "global_step": 142940, "epoch": 3403} {"train_loss": -6.8283586502075195, "global_step": 142941, "epoch": 3403} {"train_loss": -6.697098731994629, "global_step": 142942, "epoch": 3403} {"train_loss": -6.799054145812988, "global_step": 142943, "epoch": 3403} {"train_loss": -6.7201972007751465, "global_step": 142944, "epoch": 3403} {"train_loss": -6.861443996429443, "global_step": 142945, "epoch": 3403} {"train_loss": -6.695897102355957, "global_step": 142946, "epoch": 3403} {"train_loss": -6.852147102355957, "global_step": 142947, "epoch": 3403} {"train_loss": -6.731600284576416, "global_step": 142948, "epoch": 3403} {"train_loss": -6.782524108886719, "global_step": 142949, "epoch": 3403} {"train_loss": -6.809531211853027, "global_step": 142950, "epoch": 3403} {"train_loss": -6.697302341461182, "global_step": 142951, "epoch": 3403} {"train_loss": -6.751623630523682, "global_step": 142952, "epoch": 3403} {"train_loss": -6.764742851257324, "global_step": 142953, "epoch": 3403} {"train_loss": -6.737864017486572, "global_step": 142954, "epoch": 3403} {"train_loss": -6.671283721923828, "global_step": 142955, "epoch": 3403} {"train_loss": -6.813116073608398, "global_step": 142956, "epoch": 3403} {"train_loss": -6.655849456787109, "global_step": 142957, "epoch": 3403} {"train_loss": -6.733661651611328, "global_step": 142958, "epoch": 3403} {"train_loss": -6.64593505859375, "global_step": 142959, "epoch": 3403} {"train_loss": -6.662660598754883, "global_step": 142960, "epoch": 3403} {"train_loss": -6.634085655212402, "global_step": 142961, "epoch": 3403} {"train_loss": -6.705137729644775, "global_step": 142962, "epoch": 3403} {"train_loss": -6.734050750732422, "global_step": 142963, "epoch": 3403} {"train_loss": -6.503395080566406, "global_step": 142964, "epoch": 3403} {"train_loss": -6.730683326721191, "global_step": 142965, "epoch": 3403} {"train_loss": -6.5633344650268555, "global_step": 142966, "epoch": 3403} {"train_loss": -6.740621975490025, "global_step": 142967, "epoch": 3403, "val_loss": 68325.140625} {"train_loss": -6.71013069152832, "global_step": 142968, "epoch": 3404} {"train_loss": -6.639005661010742, "global_step": 142969, "epoch": 3404} {"train_loss": -6.785376071929932, "global_step": 142970, "epoch": 3404} {"train_loss": -6.651154518127441, "global_step": 142971, "epoch": 3404} {"train_loss": -6.682218551635742, "global_step": 142972, "epoch": 3404} {"train_loss": -6.71182918548584, "global_step": 142973, "epoch": 3404} {"train_loss": -6.779450416564941, "global_step": 142974, "epoch": 3404} {"train_loss": -6.835603713989258, "global_step": 142975, "epoch": 3404} {"train_loss": -6.574273109436035, "global_step": 142976, "epoch": 3404} {"train_loss": -6.689862251281738, "global_step": 142977, "epoch": 3404} {"train_loss": -6.807027816772461, "global_step": 142978, "epoch": 3404} {"train_loss": -6.737339973449707, "global_step": 142979, "epoch": 3404} {"train_loss": -6.675737380981445, "global_step": 142980, "epoch": 3404} {"train_loss": -6.809358596801758, "global_step": 142981, "epoch": 3404} {"train_loss": -6.7509379386901855, "global_step": 142982, "epoch": 3404} {"train_loss": -6.7568745613098145, "global_step": 142983, "epoch": 3404} {"train_loss": -6.755834579467773, "global_step": 142984, "epoch": 3404} {"train_loss": -6.776315212249756, "global_step": 142985, "epoch": 3404} {"train_loss": -6.6920952796936035, "global_step": 142986, "epoch": 3404} {"train_loss": -6.862213134765625, "global_step": 142987, "epoch": 3404} {"train_loss": -6.739968299865723, "global_step": 142988, "epoch": 3404} {"train_loss": -6.720129489898682, "global_step": 142989, "epoch": 3404} {"train_loss": -6.769899845123291, "global_step": 142990, "epoch": 3404} {"train_loss": -6.755127906799316, "global_step": 142991, "epoch": 3404} {"train_loss": -6.764025688171387, "global_step": 142992, "epoch": 3404} {"train_loss": -6.8491902351379395, "global_step": 142993, "epoch": 3404} {"train_loss": -6.668476104736328, "global_step": 142994, "epoch": 3404} {"train_loss": -6.731383323669434, "global_step": 142995, "epoch": 3404} {"train_loss": -6.817129135131836, "global_step": 142996, "epoch": 3404} {"train_loss": -6.8245849609375, "global_step": 142997, "epoch": 3404} {"train_loss": -6.72840690612793, "global_step": 142998, "epoch": 3404} {"train_loss": -6.737410068511963, "global_step": 142999, "epoch": 3404} {"train_loss": -6.718502044677734, "global_step": 143000, "epoch": 3404} {"train_loss": -6.825490474700928, "global_step": 143001, "epoch": 3404} {"train_loss": -6.716183662414551, "global_step": 143002, "epoch": 3404} {"train_loss": -6.736438751220703, "global_step": 143003, "epoch": 3404} {"train_loss": -6.740209579467773, "global_step": 143004, "epoch": 3404} {"train_loss": -6.708250045776367, "global_step": 143005, "epoch": 3404} {"train_loss": -6.711480617523193, "global_step": 143006, "epoch": 3404} {"train_loss": -6.793930530548096, "global_step": 143007, "epoch": 3404} {"train_loss": -6.783899784088135, "global_step": 143008, "epoch": 3404} {"train_loss": -6.74802185240246, "global_step": 143009, "epoch": 3404, "val_loss": 68355.6640625} {"train_loss": -6.758147239685059, "global_step": 143010, "epoch": 3405} {"train_loss": -6.802064895629883, "global_step": 143011, "epoch": 3405} {"train_loss": -6.835980415344238, "global_step": 143012, "epoch": 3405} {"train_loss": -6.667061805725098, "global_step": 143013, "epoch": 3405} {"train_loss": -6.774309158325195, "global_step": 143014, "epoch": 3405} {"train_loss": -6.686984062194824, "global_step": 143015, "epoch": 3405} {"train_loss": -6.77016544342041, "global_step": 143016, "epoch": 3405} {"train_loss": -6.779424667358398, "global_step": 143017, "epoch": 3405} {"train_loss": -6.776616096496582, "global_step": 143018, "epoch": 3405} {"train_loss": -6.81380558013916, "global_step": 143019, "epoch": 3405} {"train_loss": -6.755096435546875, "global_step": 143020, "epoch": 3405} {"train_loss": -6.84706974029541, "global_step": 143021, "epoch": 3405} {"train_loss": -6.810116767883301, "global_step": 143022, "epoch": 3405} {"train_loss": -6.806013584136963, "global_step": 143023, "epoch": 3405} {"train_loss": -6.798560619354248, "global_step": 143024, "epoch": 3405} {"train_loss": -6.7557573318481445, "global_step": 143025, "epoch": 3405} {"train_loss": -6.7912774085998535, "global_step": 143026, "epoch": 3405} {"train_loss": -6.872450828552246, "global_step": 143027, "epoch": 3405} {"train_loss": -6.820643901824951, "global_step": 143028, "epoch": 3405} {"train_loss": -6.812204360961914, "global_step": 143029, "epoch": 3405} {"train_loss": -6.711498260498047, "global_step": 143030, "epoch": 3405} {"train_loss": -6.839683532714844, "global_step": 143031, "epoch": 3405} {"train_loss": -6.846536636352539, "global_step": 143032, "epoch": 3405} {"train_loss": -6.842015266418457, "global_step": 143033, "epoch": 3405} {"train_loss": -6.776442050933838, "global_step": 143034, "epoch": 3405} {"train_loss": -6.93036413192749, "global_step": 143035, "epoch": 3405} {"train_loss": -6.841854095458984, "global_step": 143036, "epoch": 3405} {"train_loss": -6.751951694488525, "global_step": 143037, "epoch": 3405} {"train_loss": -6.73716926574707, "global_step": 143038, "epoch": 3405} {"train_loss": -6.788193702697754, "global_step": 143039, "epoch": 3405} {"train_loss": -6.6648173332214355, "global_step": 143040, "epoch": 3405} {"train_loss": -6.716823577880859, "global_step": 143041, "epoch": 3405} {"train_loss": -6.7050065994262695, "global_step": 143042, "epoch": 3405} {"train_loss": -6.886283874511719, "global_step": 143043, "epoch": 3405} {"train_loss": -6.804121017456055, "global_step": 143044, "epoch": 3405} {"train_loss": -6.734450817108154, "global_step": 143045, "epoch": 3405} {"train_loss": -6.770125389099121, "global_step": 143046, "epoch": 3405} {"train_loss": -6.6981892585754395, "global_step": 143047, "epoch": 3405} {"train_loss": -6.6772050857543945, "global_step": 143048, "epoch": 3405} {"train_loss": -6.7830352783203125, "global_step": 143049, "epoch": 3405} {"train_loss": -6.72397518157959, "global_step": 143050, "epoch": 3405} {"train_loss": -6.7787763845352895, "global_step": 143051, "epoch": 3405, "val_loss": 68436.765625} {"train_loss": -6.68808650970459, "global_step": 143052, "epoch": 3406} {"train_loss": -6.7782206535339355, "global_step": 143053, "epoch": 3406} {"train_loss": -6.741083145141602, "global_step": 143054, "epoch": 3406} {"train_loss": -6.84033727645874, "global_step": 143055, "epoch": 3406} {"train_loss": -6.708437919616699, "global_step": 143056, "epoch": 3406} {"train_loss": -6.844160079956055, "global_step": 143057, "epoch": 3406} {"train_loss": -6.76640510559082, "global_step": 143058, "epoch": 3406} {"train_loss": -6.797395706176758, "global_step": 143059, "epoch": 3406} {"train_loss": -6.628166198730469, "global_step": 143060, "epoch": 3406} {"train_loss": -6.717187404632568, "global_step": 143061, "epoch": 3406} {"train_loss": -6.656487464904785, "global_step": 143062, "epoch": 3406} {"train_loss": -6.811319828033447, "global_step": 143063, "epoch": 3406} {"train_loss": -6.822689056396484, "global_step": 143064, "epoch": 3406} {"train_loss": -6.844175338745117, "global_step": 143065, "epoch": 3406} {"train_loss": -6.824169158935547, "global_step": 143066, "epoch": 3406} {"train_loss": -6.77160120010376, "global_step": 143067, "epoch": 3406} {"train_loss": -6.836402416229248, "global_step": 143068, "epoch": 3406} {"train_loss": -6.8373517990112305, "global_step": 143069, "epoch": 3406} {"train_loss": -6.716238498687744, "global_step": 143070, "epoch": 3406} {"train_loss": -6.666652202606201, "global_step": 143071, "epoch": 3406} {"train_loss": -6.4786882400512695, "global_step": 143072, "epoch": 3406} {"train_loss": -6.721158027648926, "global_step": 143073, "epoch": 3406} {"train_loss": -6.676508903503418, "global_step": 143074, "epoch": 3406} {"train_loss": -6.718461990356445, "global_step": 143075, "epoch": 3406} {"train_loss": -6.830872058868408, "global_step": 143076, "epoch": 3406} {"train_loss": -6.698291778564453, "global_step": 143077, "epoch": 3406} {"train_loss": -6.738499641418457, "global_step": 143078, "epoch": 3406} {"train_loss": -6.654947280883789, "global_step": 143079, "epoch": 3406} {"train_loss": -6.757199287414551, "global_step": 143080, "epoch": 3406} {"train_loss": -6.899736404418945, "global_step": 143081, "epoch": 3406} {"train_loss": -6.74454927444458, "global_step": 143082, "epoch": 3406} {"train_loss": -6.554147720336914, "global_step": 143083, "epoch": 3406} {"train_loss": -6.716065883636475, "global_step": 143084, "epoch": 3406} {"train_loss": -6.657983779907227, "global_step": 143085, "epoch": 3406} {"train_loss": -6.7157487869262695, "global_step": 143086, "epoch": 3406} {"train_loss": -6.723873138427734, "global_step": 143087, "epoch": 3406} {"train_loss": -6.781349182128906, "global_step": 143088, "epoch": 3406} {"train_loss": -6.667233467102051, "global_step": 143089, "epoch": 3406} {"train_loss": -6.748607635498047, "global_step": 143090, "epoch": 3406} {"train_loss": -6.768802165985107, "global_step": 143091, "epoch": 3406} {"train_loss": -6.700071334838867, "global_step": 143092, "epoch": 3406} {"train_loss": -6.739669357027326, "global_step": 143093, "epoch": 3406, "val_loss": 68583.6640625} {"train_loss": -6.773857116699219, "global_step": 143094, "epoch": 3407} {"train_loss": -6.638092041015625, "global_step": 143095, "epoch": 3407} {"train_loss": -6.79987907409668, "global_step": 143096, "epoch": 3407} {"train_loss": -6.818395614624023, "global_step": 143097, "epoch": 3407} {"train_loss": -6.817488670349121, "global_step": 143098, "epoch": 3407} {"train_loss": -6.76481819152832, "global_step": 143099, "epoch": 3407} {"train_loss": -6.835588455200195, "global_step": 143100, "epoch": 3407} {"train_loss": -6.853314399719238, "global_step": 143101, "epoch": 3407} {"train_loss": -6.785919666290283, "global_step": 143102, "epoch": 3407} {"train_loss": -6.856017112731934, "global_step": 143103, "epoch": 3407} {"train_loss": -6.729249954223633, "global_step": 143104, "epoch": 3407} {"train_loss": -6.815090656280518, "global_step": 143105, "epoch": 3407} {"train_loss": -6.743954658508301, "global_step": 143106, "epoch": 3407} {"train_loss": -6.7692975997924805, "global_step": 143107, "epoch": 3407} {"train_loss": -6.7660675048828125, "global_step": 143108, "epoch": 3407} {"train_loss": -6.662048816680908, "global_step": 143109, "epoch": 3407} {"train_loss": -6.871725082397461, "global_step": 143110, "epoch": 3407} {"train_loss": -6.736679553985596, "global_step": 143111, "epoch": 3407} {"train_loss": -6.853532791137695, "global_step": 143112, "epoch": 3407} {"train_loss": -6.880495548248291, "global_step": 143113, "epoch": 3407} {"train_loss": -6.904903888702393, "global_step": 143114, "epoch": 3407} {"train_loss": -6.715413570404053, "global_step": 143115, "epoch": 3407} {"train_loss": -6.699284076690674, "global_step": 143116, "epoch": 3407} {"train_loss": -6.813859462738037, "global_step": 143117, "epoch": 3407} {"train_loss": -6.74603796005249, "global_step": 143118, "epoch": 3407} {"train_loss": -6.726153373718262, "global_step": 143119, "epoch": 3407} {"train_loss": -6.827942848205566, "global_step": 143120, "epoch": 3407} {"train_loss": -6.618113994598389, "global_step": 143121, "epoch": 3407} {"train_loss": -6.75006103515625, "global_step": 143122, "epoch": 3407} {"train_loss": -6.7413129806518555, "global_step": 143123, "epoch": 3407} {"train_loss": -6.687079906463623, "global_step": 143124, "epoch": 3407} {"train_loss": -6.753774166107178, "global_step": 143125, "epoch": 3407} {"train_loss": -6.627993106842041, "global_step": 143126, "epoch": 3407} {"train_loss": -6.6785078048706055, "global_step": 143127, "epoch": 3407} {"train_loss": -6.645934104919434, "global_step": 143128, "epoch": 3407} {"train_loss": -6.655596733093262, "global_step": 143129, "epoch": 3407} {"train_loss": -6.734775066375732, "global_step": 143130, "epoch": 3407} {"train_loss": -6.651464462280273, "global_step": 143131, "epoch": 3407} {"train_loss": -6.711972236633301, "global_step": 143132, "epoch": 3407} {"train_loss": -6.715816974639893, "global_step": 143133, "epoch": 3407} {"train_loss": -6.674498081207275, "global_step": 143134, "epoch": 3407} {"train_loss": -6.753147329602923, "global_step": 143135, "epoch": 3407, "val_loss": 68434.71875} {"train_loss": -6.676341533660889, "global_step": 143136, "epoch": 3408} {"train_loss": -6.817225456237793, "global_step": 143137, "epoch": 3408} {"train_loss": -6.897124290466309, "global_step": 143138, "epoch": 3408} {"train_loss": -6.641390323638916, "global_step": 143139, "epoch": 3408} {"train_loss": -6.6901984214782715, "global_step": 143140, "epoch": 3408} {"train_loss": -6.8602752685546875, "global_step": 143141, "epoch": 3408} {"train_loss": -6.723701000213623, "global_step": 143142, "epoch": 3408} {"train_loss": -6.57839298248291, "global_step": 143143, "epoch": 3408} {"train_loss": -6.813187599182129, "global_step": 143144, "epoch": 3408} {"train_loss": -6.794018745422363, "global_step": 143145, "epoch": 3408} {"train_loss": -6.828812599182129, "global_step": 143146, "epoch": 3408} {"train_loss": -6.813069820404053, "global_step": 143147, "epoch": 3408} {"train_loss": -6.809635162353516, "global_step": 143148, "epoch": 3408} {"train_loss": -6.749960422515869, "global_step": 143149, "epoch": 3408} {"train_loss": -6.836269378662109, "global_step": 143150, "epoch": 3408} {"train_loss": -6.760666847229004, "global_step": 143151, "epoch": 3408} {"train_loss": -6.76725435256958, "global_step": 143152, "epoch": 3408} {"train_loss": -6.786890506744385, "global_step": 143153, "epoch": 3408} {"train_loss": -6.699059009552002, "global_step": 143154, "epoch": 3408} {"train_loss": -6.6453986167907715, "global_step": 143155, "epoch": 3408} {"train_loss": -6.809719562530518, "global_step": 143156, "epoch": 3408} {"train_loss": -6.737266540527344, "global_step": 143157, "epoch": 3408} {"train_loss": -6.696416854858398, "global_step": 143158, "epoch": 3408} {"train_loss": -6.685615539550781, "global_step": 143159, "epoch": 3408} {"train_loss": -6.843428611755371, "global_step": 143160, "epoch": 3408} {"train_loss": -6.809995651245117, "global_step": 143161, "epoch": 3408} {"train_loss": -6.759994029998779, "global_step": 143162, "epoch": 3408} {"train_loss": -6.830766677856445, "global_step": 143163, "epoch": 3408} {"train_loss": -6.877416610717773, "global_step": 143164, "epoch": 3408} {"train_loss": -6.916348457336426, "global_step": 143165, "epoch": 3408} {"train_loss": -6.786110877990723, "global_step": 143166, "epoch": 3408} {"train_loss": -6.781851291656494, "global_step": 143167, "epoch": 3408} {"train_loss": -6.811248779296875, "global_step": 143168, "epoch": 3408} {"train_loss": -6.752532482147217, "global_step": 143169, "epoch": 3408} {"train_loss": -6.690127849578857, "global_step": 143170, "epoch": 3408} {"train_loss": -6.678107261657715, "global_step": 143171, "epoch": 3408} {"train_loss": -6.7883710861206055, "global_step": 143172, "epoch": 3408} {"train_loss": -6.702486515045166, "global_step": 143173, "epoch": 3408} {"train_loss": -6.7409162521362305, "global_step": 143174, "epoch": 3408} {"train_loss": -6.74293327331543, "global_step": 143175, "epoch": 3408} {"train_loss": -6.616925239562988, "global_step": 143176, "epoch": 3408} {"train_loss": -6.759760697682698, "global_step": 143177, "epoch": 3408, "val_loss": 68879.0078125} {"train_loss": -6.434329032897949, "global_step": 143178, "epoch": 3409} {"train_loss": -6.700827598571777, "global_step": 143179, "epoch": 3409} {"train_loss": -6.687763214111328, "global_step": 143180, "epoch": 3409} {"train_loss": -6.5977067947387695, "global_step": 143181, "epoch": 3409} {"train_loss": -6.529390811920166, "global_step": 143182, "epoch": 3409} {"train_loss": -6.579100608825684, "global_step": 143183, "epoch": 3409} {"train_loss": -6.7926836013793945, "global_step": 143184, "epoch": 3409} {"train_loss": -6.423997402191162, "global_step": 143185, "epoch": 3409} {"train_loss": -6.6570000648498535, "global_step": 143186, "epoch": 3409} {"train_loss": -6.596689224243164, "global_step": 143187, "epoch": 3409} {"train_loss": -6.597021102905273, "global_step": 143188, "epoch": 3409} {"train_loss": -6.687824726104736, "global_step": 143189, "epoch": 3409} {"train_loss": -6.6437668800354, "global_step": 143190, "epoch": 3409} {"train_loss": -6.5493950843811035, "global_step": 143191, "epoch": 3409} {"train_loss": -6.745849609375, "global_step": 143192, "epoch": 3409} {"train_loss": -6.643144607543945, "global_step": 143193, "epoch": 3409} {"train_loss": -6.7252302169799805, "global_step": 143194, "epoch": 3409} {"train_loss": -6.701936721801758, "global_step": 143195, "epoch": 3409} {"train_loss": -6.651474952697754, "global_step": 143196, "epoch": 3409} {"train_loss": -6.744483947753906, "global_step": 143197, "epoch": 3409} {"train_loss": -6.7518310546875, "global_step": 143198, "epoch": 3409} {"train_loss": -6.633340358734131, "global_step": 143199, "epoch": 3409} {"train_loss": -6.719012260437012, "global_step": 143200, "epoch": 3409} {"train_loss": -6.697989463806152, "global_step": 143201, "epoch": 3409} {"train_loss": -6.67428731918335, "global_step": 143202, "epoch": 3409} {"train_loss": -6.743062973022461, "global_step": 143203, "epoch": 3409} {"train_loss": -6.6046142578125, "global_step": 143204, "epoch": 3409} {"train_loss": -6.773408889770508, "global_step": 143205, "epoch": 3409} {"train_loss": -6.73520565032959, "global_step": 143206, "epoch": 3409} {"train_loss": -6.8367414474487305, "global_step": 143207, "epoch": 3409} {"train_loss": -6.7909088134765625, "global_step": 143208, "epoch": 3409} {"train_loss": -6.812919616699219, "global_step": 143209, "epoch": 3409} {"train_loss": -6.79080867767334, "global_step": 143210, "epoch": 3409} {"train_loss": -6.775992393493652, "global_step": 143211, "epoch": 3409} {"train_loss": -6.785135269165039, "global_step": 143212, "epoch": 3409} {"train_loss": -6.730853080749512, "global_step": 143213, "epoch": 3409} {"train_loss": -6.822732925415039, "global_step": 143214, "epoch": 3409} {"train_loss": -6.751019477844238, "global_step": 143215, "epoch": 3409} {"train_loss": -6.754345893859863, "global_step": 143216, "epoch": 3409} {"train_loss": -6.8170695304870605, "global_step": 143217, "epoch": 3409} {"train_loss": -6.669126510620117, "global_step": 143218, "epoch": 3409} {"train_loss": -6.693251575742449, "global_step": 143219, "epoch": 3409, "val_loss": 68324.375} {"train_loss": -6.812788963317871, "global_step": 143220, "epoch": 3410} {"train_loss": -6.812108516693115, "global_step": 143221, "epoch": 3410} {"train_loss": -6.79030704498291, "global_step": 143222, "epoch": 3410} {"train_loss": -6.813298225402832, "global_step": 143223, "epoch": 3410} {"train_loss": -6.746356010437012, "global_step": 143224, "epoch": 3410} {"train_loss": -6.769939422607422, "global_step": 143225, "epoch": 3410} {"train_loss": -6.8299946784973145, "global_step": 143226, "epoch": 3410} {"train_loss": -6.686347961425781, "global_step": 143227, "epoch": 3410} {"train_loss": -6.7115631103515625, "global_step": 143228, "epoch": 3410} {"train_loss": -6.830783843994141, "global_step": 143229, "epoch": 3410} {"train_loss": -6.803083896636963, "global_step": 143230, "epoch": 3410} {"train_loss": -6.8908305168151855, "global_step": 143231, "epoch": 3410} {"train_loss": -6.8903303146362305, "global_step": 143232, "epoch": 3410} {"train_loss": -6.779163360595703, "global_step": 143233, "epoch": 3410} {"train_loss": -6.7823076248168945, "global_step": 143234, "epoch": 3410} {"train_loss": -6.8578267097473145, "global_step": 143235, "epoch": 3410} {"train_loss": -6.740324974060059, "global_step": 143236, "epoch": 3410} {"train_loss": -6.82588529586792, "global_step": 143237, "epoch": 3410} {"train_loss": -6.7766876220703125, "global_step": 143238, "epoch": 3410} {"train_loss": -6.617771625518799, "global_step": 143239, "epoch": 3410} {"train_loss": -6.753449440002441, "global_step": 143240, "epoch": 3410} {"train_loss": -6.6498565673828125, "global_step": 143241, "epoch": 3410} {"train_loss": -6.712517738342285, "global_step": 143242, "epoch": 3410} {"train_loss": -6.70426607131958, "global_step": 143243, "epoch": 3410} {"train_loss": -6.666101455688477, "global_step": 143244, "epoch": 3410} {"train_loss": -6.684471607208252, "global_step": 143245, "epoch": 3410} {"train_loss": -6.658273696899414, "global_step": 143246, "epoch": 3410} {"train_loss": -6.720278263092041, "global_step": 143247, "epoch": 3410} {"train_loss": -6.636078834533691, "global_step": 143248, "epoch": 3410} {"train_loss": -6.6689453125, "global_step": 143249, "epoch": 3410} {"train_loss": -6.705316543579102, "global_step": 143250, "epoch": 3410} {"train_loss": -6.63978910446167, "global_step": 143251, "epoch": 3410} {"train_loss": -6.811436653137207, "global_step": 143252, "epoch": 3410} {"train_loss": -6.688596248626709, "global_step": 143253, "epoch": 3410} {"train_loss": -6.684922218322754, "global_step": 143254, "epoch": 3410} {"train_loss": -6.711838722229004, "global_step": 143255, "epoch": 3410} {"train_loss": -6.706633567810059, "global_step": 143256, "epoch": 3410} {"train_loss": -6.8408203125, "global_step": 143257, "epoch": 3410} {"train_loss": -6.795297622680664, "global_step": 143258, "epoch": 3410} {"train_loss": -6.771264553070068, "global_step": 143259, "epoch": 3410} {"train_loss": -6.763115406036377, "global_step": 143260, "epoch": 3410} {"train_loss": -6.749321494783674, "global_step": 143261, "epoch": 3410, "val_loss": 68521.859375} {"train_loss": -6.729550361633301, "global_step": 143262, "epoch": 3411} {"train_loss": -6.664545059204102, "global_step": 143263, "epoch": 3411} {"train_loss": -6.65181827545166, "global_step": 143264, "epoch": 3411} {"train_loss": -6.756686210632324, "global_step": 143265, "epoch": 3411} {"train_loss": -6.713168621063232, "global_step": 143266, "epoch": 3411} {"train_loss": -6.804035663604736, "global_step": 143267, "epoch": 3411} {"train_loss": -6.813636779785156, "global_step": 143268, "epoch": 3411} {"train_loss": -6.792829513549805, "global_step": 143269, "epoch": 3411} {"train_loss": -6.769718170166016, "global_step": 143270, "epoch": 3411} {"train_loss": -6.766977310180664, "global_step": 143271, "epoch": 3411} {"train_loss": -6.6169304847717285, "global_step": 143272, "epoch": 3411} {"train_loss": -6.760804653167725, "global_step": 143273, "epoch": 3411} {"train_loss": -6.816515922546387, "global_step": 143274, "epoch": 3411} {"train_loss": -6.720958709716797, "global_step": 143275, "epoch": 3411} {"train_loss": -6.745347023010254, "global_step": 143276, "epoch": 3411} {"train_loss": -6.783480167388916, "global_step": 143277, "epoch": 3411} {"train_loss": -6.754892349243164, "global_step": 143278, "epoch": 3411} {"train_loss": -6.914466857910156, "global_step": 143279, "epoch": 3411} {"train_loss": -6.745230197906494, "global_step": 143280, "epoch": 3411} {"train_loss": -6.7766008377075195, "global_step": 143281, "epoch": 3411} {"train_loss": -6.766806125640869, "global_step": 143282, "epoch": 3411} {"train_loss": -6.8168206214904785, "global_step": 143283, "epoch": 3411} {"train_loss": -6.659049987792969, "global_step": 143284, "epoch": 3411} {"train_loss": -6.733094692230225, "global_step": 143285, "epoch": 3411} {"train_loss": -6.681792736053467, "global_step": 143286, "epoch": 3411} {"train_loss": -6.752006530761719, "global_step": 143287, "epoch": 3411} {"train_loss": -6.768396377563477, "global_step": 143288, "epoch": 3411} {"train_loss": -6.796189308166504, "global_step": 143289, "epoch": 3411} {"train_loss": -6.622012615203857, "global_step": 143290, "epoch": 3411} {"train_loss": -6.850976467132568, "global_step": 143291, "epoch": 3411} {"train_loss": -6.835402965545654, "global_step": 143292, "epoch": 3411} {"train_loss": -6.805648326873779, "global_step": 143293, "epoch": 3411} {"train_loss": -6.8239874839782715, "global_step": 143294, "epoch": 3411} {"train_loss": -6.832126617431641, "global_step": 143295, "epoch": 3411} {"train_loss": -6.655050754547119, "global_step": 143296, "epoch": 3411} {"train_loss": -6.763140678405762, "global_step": 143297, "epoch": 3411} {"train_loss": -6.723714351654053, "global_step": 143298, "epoch": 3411} {"train_loss": -6.738579273223877, "global_step": 143299, "epoch": 3411} {"train_loss": -6.877132415771484, "global_step": 143300, "epoch": 3411} {"train_loss": -6.752247333526611, "global_step": 143301, "epoch": 3411} {"train_loss": -6.794811248779297, "global_step": 143302, "epoch": 3411} {"train_loss": -6.761277914047241, "global_step": 143303, "epoch": 3411, "val_loss": 68474.6484375} {"train_loss": -6.756475448608398, "global_step": 143304, "epoch": 3412} {"train_loss": -6.806281566619873, "global_step": 143305, "epoch": 3412} {"train_loss": -6.828179836273193, "global_step": 143306, "epoch": 3412} {"train_loss": -6.803225517272949, "global_step": 143307, "epoch": 3412} {"train_loss": -6.601397514343262, "global_step": 143308, "epoch": 3412} {"train_loss": -6.796514511108398, "global_step": 143309, "epoch": 3412} {"train_loss": -6.801471710205078, "global_step": 143310, "epoch": 3412} {"train_loss": -6.741518020629883, "global_step": 143311, "epoch": 3412} {"train_loss": -6.749757766723633, "global_step": 143312, "epoch": 3412} {"train_loss": -6.7860260009765625, "global_step": 143313, "epoch": 3412} {"train_loss": -6.780240058898926, "global_step": 143314, "epoch": 3412} {"train_loss": -6.719613075256348, "global_step": 143315, "epoch": 3412} {"train_loss": -6.73140811920166, "global_step": 143316, "epoch": 3412} {"train_loss": -6.688684463500977, "global_step": 143317, "epoch": 3412} {"train_loss": -6.776585578918457, "global_step": 143318, "epoch": 3412} {"train_loss": -6.740837097167969, "global_step": 143319, "epoch": 3412} {"train_loss": -6.797956466674805, "global_step": 143320, "epoch": 3412} {"train_loss": -6.801504135131836, "global_step": 143321, "epoch": 3412} {"train_loss": -6.739946365356445, "global_step": 143322, "epoch": 3412} {"train_loss": -6.670124530792236, "global_step": 143323, "epoch": 3412} {"train_loss": -6.78021240234375, "global_step": 143324, "epoch": 3412} {"train_loss": -6.822641372680664, "global_step": 143325, "epoch": 3412} {"train_loss": -6.610700607299805, "global_step": 143326, "epoch": 3412} {"train_loss": -6.6370954513549805, "global_step": 143327, "epoch": 3412} {"train_loss": -6.7807135581970215, "global_step": 143328, "epoch": 3412} {"train_loss": -6.680374622344971, "global_step": 143329, "epoch": 3412} {"train_loss": -6.601961135864258, "global_step": 143330, "epoch": 3412} {"train_loss": -6.6686811447143555, "global_step": 143331, "epoch": 3412} {"train_loss": -6.668717384338379, "global_step": 143332, "epoch": 3412} {"train_loss": -6.618335723876953, "global_step": 143333, "epoch": 3412} {"train_loss": -6.723710060119629, "global_step": 143334, "epoch": 3412} {"train_loss": -6.757047653198242, "global_step": 143335, "epoch": 3412} {"train_loss": -6.820857048034668, "global_step": 143336, "epoch": 3412} {"train_loss": -6.681635856628418, "global_step": 143337, "epoch": 3412} {"train_loss": -6.581819534301758, "global_step": 143338, "epoch": 3412} {"train_loss": -6.857295989990234, "global_step": 143339, "epoch": 3412} {"train_loss": -6.591113090515137, "global_step": 143340, "epoch": 3412} {"train_loss": -6.609967231750488, "global_step": 143341, "epoch": 3412} {"train_loss": -6.854601860046387, "global_step": 143342, "epoch": 3412} {"train_loss": -6.750774383544922, "global_step": 143343, "epoch": 3412} {"train_loss": -6.710176467895508, "global_step": 143344, "epoch": 3412} {"train_loss": -6.727061192194621, "global_step": 143345, "epoch": 3412, "val_loss": 68648.234375} {"train_loss": -6.657448768615723, "global_step": 143346, "epoch": 3413} {"train_loss": -6.610116958618164, "global_step": 143347, "epoch": 3413} {"train_loss": -6.768670558929443, "global_step": 143348, "epoch": 3413} {"train_loss": -6.647998809814453, "global_step": 143349, "epoch": 3413} {"train_loss": -6.830848217010498, "global_step": 143350, "epoch": 3413} {"train_loss": -6.612096309661865, "global_step": 143351, "epoch": 3413} {"train_loss": -6.777130126953125, "global_step": 143352, "epoch": 3413} {"train_loss": -6.747820854187012, "global_step": 143353, "epoch": 3413} {"train_loss": -6.712674140930176, "global_step": 143354, "epoch": 3413} {"train_loss": -6.779667854309082, "global_step": 143355, "epoch": 3413} {"train_loss": -6.725522994995117, "global_step": 143356, "epoch": 3413} {"train_loss": -6.701062202453613, "global_step": 143357, "epoch": 3413} {"train_loss": -6.683430194854736, "global_step": 143358, "epoch": 3413} {"train_loss": -6.87017822265625, "global_step": 143359, "epoch": 3413} {"train_loss": -6.774288177490234, "global_step": 143360, "epoch": 3413} {"train_loss": -6.651916980743408, "global_step": 143361, "epoch": 3413} {"train_loss": -6.772727966308594, "global_step": 143362, "epoch": 3413} {"train_loss": -6.710468292236328, "global_step": 143363, "epoch": 3413} {"train_loss": -6.630911350250244, "global_step": 143364, "epoch": 3413} {"train_loss": -6.70081901550293, "global_step": 143365, "epoch": 3413} {"train_loss": -6.745083808898926, "global_step": 143366, "epoch": 3413} {"train_loss": -6.660087585449219, "global_step": 143367, "epoch": 3413} {"train_loss": -6.707087993621826, "global_step": 143368, "epoch": 3413} {"train_loss": -6.662972450256348, "global_step": 143369, "epoch": 3413} {"train_loss": -6.830643653869629, "global_step": 143370, "epoch": 3413} {"train_loss": -6.664003372192383, "global_step": 143371, "epoch": 3413} {"train_loss": -6.747825622558594, "global_step": 143372, "epoch": 3413} {"train_loss": -6.80432653427124, "global_step": 143373, "epoch": 3413} {"train_loss": -6.773713111877441, "global_step": 143374, "epoch": 3413} {"train_loss": -6.467396259307861, "global_step": 143375, "epoch": 3413} {"train_loss": -6.634668350219727, "global_step": 143376, "epoch": 3413} {"train_loss": -6.5970306396484375, "global_step": 143377, "epoch": 3413} {"train_loss": -6.5551347732543945, "global_step": 143378, "epoch": 3413} {"train_loss": -6.685345649719238, "global_step": 143379, "epoch": 3413} {"train_loss": -6.642927646636963, "global_step": 143380, "epoch": 3413} {"train_loss": -6.703518867492676, "global_step": 143381, "epoch": 3413} {"train_loss": -6.637969017028809, "global_step": 143382, "epoch": 3413} {"train_loss": -6.633766174316406, "global_step": 143383, "epoch": 3413} {"train_loss": -6.6519269943237305, "global_step": 143384, "epoch": 3413} {"train_loss": -6.644599437713623, "global_step": 143385, "epoch": 3413} {"train_loss": -6.76264762878418, "global_step": 143386, "epoch": 3413} {"train_loss": -6.695035923094976, "global_step": 143387, "epoch": 3413, "val_loss": 68386.9140625} {"train_loss": -6.656417369842529, "global_step": 143388, "epoch": 3414} {"train_loss": -6.725269794464111, "global_step": 143389, "epoch": 3414} {"train_loss": -6.51216459274292, "global_step": 143390, "epoch": 3414} {"train_loss": -6.712820053100586, "global_step": 143391, "epoch": 3414} {"train_loss": -6.624229431152344, "global_step": 143392, "epoch": 3414} {"train_loss": -6.717278003692627, "global_step": 143393, "epoch": 3414} {"train_loss": -6.675037384033203, "global_step": 143394, "epoch": 3414} {"train_loss": -6.72420597076416, "global_step": 143395, "epoch": 3414} {"train_loss": -6.666801452636719, "global_step": 143396, "epoch": 3414} {"train_loss": -6.710748672485352, "global_step": 143397, "epoch": 3414} {"train_loss": -6.581816673278809, "global_step": 143398, "epoch": 3414} {"train_loss": -6.703568935394287, "global_step": 143399, "epoch": 3414} {"train_loss": -6.729095458984375, "global_step": 143400, "epoch": 3414} {"train_loss": -6.716297149658203, "global_step": 143401, "epoch": 3414} {"train_loss": -6.654201030731201, "global_step": 143402, "epoch": 3414} {"train_loss": -6.613832473754883, "global_step": 143403, "epoch": 3414} {"train_loss": -6.787154674530029, "global_step": 143404, "epoch": 3414} {"train_loss": -6.660922050476074, "global_step": 143405, "epoch": 3414} {"train_loss": -6.71656608581543, "global_step": 143406, "epoch": 3414} {"train_loss": -6.770877838134766, "global_step": 143407, "epoch": 3414} {"train_loss": -6.761898994445801, "global_step": 143408, "epoch": 3414} {"train_loss": -6.899092674255371, "global_step": 143409, "epoch": 3414} {"train_loss": -6.768566131591797, "global_step": 143410, "epoch": 3414} {"train_loss": -6.88431978225708, "global_step": 143411, "epoch": 3414} {"train_loss": -6.778714179992676, "global_step": 143412, "epoch": 3414} {"train_loss": -6.761049270629883, "global_step": 143413, "epoch": 3414} {"train_loss": -6.933834075927734, "global_step": 143414, "epoch": 3414} {"train_loss": -6.705522537231445, "global_step": 143415, "epoch": 3414} {"train_loss": -6.834902763366699, "global_step": 143416, "epoch": 3414} {"train_loss": -6.7349534034729, "global_step": 143417, "epoch": 3414} {"train_loss": -6.724582672119141, "global_step": 143418, "epoch": 3414} {"train_loss": -6.733304023742676, "global_step": 143419, "epoch": 3414} {"train_loss": -6.824624061584473, "global_step": 143420, "epoch": 3414} {"train_loss": -6.719187259674072, "global_step": 143421, "epoch": 3414} {"train_loss": -6.654893398284912, "global_step": 143422, "epoch": 3414} {"train_loss": -6.7675089836120605, "global_step": 143423, "epoch": 3414} {"train_loss": -6.74718713760376, "global_step": 143424, "epoch": 3414} {"train_loss": -6.774970054626465, "global_step": 143425, "epoch": 3414} {"train_loss": -6.9176740646362305, "global_step": 143426, "epoch": 3414} {"train_loss": -6.901671886444092, "global_step": 143427, "epoch": 3414} {"train_loss": -6.844322204589844, "global_step": 143428, "epoch": 3414} {"train_loss": -6.739796956380208, "global_step": 143429, "epoch": 3414, "val_loss": 68217.0625} {"train_loss": -6.835211753845215, "global_step": 143430, "epoch": 3415} {"train_loss": -6.804301738739014, "global_step": 143431, "epoch": 3415} {"train_loss": -6.7957916259765625, "global_step": 143432, "epoch": 3415} {"train_loss": -6.8143310546875, "global_step": 143433, "epoch": 3415} {"train_loss": -6.777618408203125, "global_step": 143434, "epoch": 3415} {"train_loss": -6.846662998199463, "global_step": 143435, "epoch": 3415} {"train_loss": -6.8357462882995605, "global_step": 143436, "epoch": 3415} {"train_loss": -6.849118709564209, "global_step": 143437, "epoch": 3415} {"train_loss": -6.806484222412109, "global_step": 143438, "epoch": 3415} {"train_loss": -6.858160018920898, "global_step": 143439, "epoch": 3415} {"train_loss": -6.924836158752441, "global_step": 143440, "epoch": 3415} {"train_loss": -6.751058578491211, "global_step": 143441, "epoch": 3415} {"train_loss": -6.845609664916992, "global_step": 143442, "epoch": 3415} {"train_loss": -6.700910568237305, "global_step": 143443, "epoch": 3415} {"train_loss": -6.756320953369141, "global_step": 143444, "epoch": 3415} {"train_loss": -6.904216766357422, "global_step": 143445, "epoch": 3415} {"train_loss": -6.877803325653076, "global_step": 143446, "epoch": 3415} {"train_loss": -6.8133697509765625, "global_step": 143447, "epoch": 3415} {"train_loss": -6.7301130294799805, "global_step": 143448, "epoch": 3415} {"train_loss": -6.829108238220215, "global_step": 143449, "epoch": 3415} {"train_loss": -6.795971870422363, "global_step": 143450, "epoch": 3415} {"train_loss": -6.8611650466918945, "global_step": 143451, "epoch": 3415} {"train_loss": -6.671943664550781, "global_step": 143452, "epoch": 3415} {"train_loss": -6.76246976852417, "global_step": 143453, "epoch": 3415} {"train_loss": -6.764135360717773, "global_step": 143454, "epoch": 3415} {"train_loss": -6.664604187011719, "global_step": 143455, "epoch": 3415} {"train_loss": -6.791028022766113, "global_step": 143456, "epoch": 3415} {"train_loss": -6.726812362670898, "global_step": 143457, "epoch": 3415} {"train_loss": -6.817052841186523, "global_step": 143458, "epoch": 3415} {"train_loss": -6.701010704040527, "global_step": 143459, "epoch": 3415} {"train_loss": -6.806203842163086, "global_step": 143460, "epoch": 3415} {"train_loss": -6.941728591918945, "global_step": 143461, "epoch": 3415} {"train_loss": -6.760959625244141, "global_step": 143462, "epoch": 3415} {"train_loss": -6.865968704223633, "global_step": 143463, "epoch": 3415} {"train_loss": -6.880109786987305, "global_step": 143464, "epoch": 3415} {"train_loss": -6.794882774353027, "global_step": 143465, "epoch": 3415} {"train_loss": -6.706271171569824, "global_step": 143466, "epoch": 3415} {"train_loss": -6.82762336730957, "global_step": 143467, "epoch": 3415} {"train_loss": -6.6465840339660645, "global_step": 143468, "epoch": 3415} {"train_loss": -6.732748508453369, "global_step": 143469, "epoch": 3415} {"train_loss": -6.874253273010254, "global_step": 143470, "epoch": 3415} {"train_loss": -6.796593643370128, "global_step": 143471, "epoch": 3415, "val_loss": 68437.9375} {"train_loss": -6.853001594543457, "global_step": 143472, "epoch": 3416} {"train_loss": -6.796006202697754, "global_step": 143473, "epoch": 3416} {"train_loss": -6.833325386047363, "global_step": 143474, "epoch": 3416} {"train_loss": -6.8747358322143555, "global_step": 143475, "epoch": 3416} {"train_loss": -6.748735427856445, "global_step": 143476, "epoch": 3416} {"train_loss": -6.758771896362305, "global_step": 143477, "epoch": 3416} {"train_loss": -6.8924760818481445, "global_step": 143478, "epoch": 3416} {"train_loss": -6.732985496520996, "global_step": 143479, "epoch": 3416} {"train_loss": -6.758049964904785, "global_step": 143480, "epoch": 3416} {"train_loss": -6.819762706756592, "global_step": 143481, "epoch": 3416} {"train_loss": -6.751879692077637, "global_step": 143482, "epoch": 3416} {"train_loss": -6.828800201416016, "global_step": 143483, "epoch": 3416} {"train_loss": -6.788243770599365, "global_step": 143484, "epoch": 3416} {"train_loss": -6.721345901489258, "global_step": 143485, "epoch": 3416} {"train_loss": -6.903497695922852, "global_step": 143486, "epoch": 3416} {"train_loss": -6.875190734863281, "global_step": 143487, "epoch": 3416} {"train_loss": -6.834908485412598, "global_step": 143488, "epoch": 3416} {"train_loss": -6.770689964294434, "global_step": 143489, "epoch": 3416} {"train_loss": -6.833191871643066, "global_step": 143490, "epoch": 3416} {"train_loss": -6.789726257324219, "global_step": 143491, "epoch": 3416} {"train_loss": -6.787936210632324, "global_step": 143492, "epoch": 3416} {"train_loss": -6.699878692626953, "global_step": 143493, "epoch": 3416} {"train_loss": -6.659369468688965, "global_step": 143494, "epoch": 3416} {"train_loss": -6.756954193115234, "global_step": 143495, "epoch": 3416} {"train_loss": -6.713868141174316, "global_step": 143496, "epoch": 3416} {"train_loss": -6.822918891906738, "global_step": 143497, "epoch": 3416} {"train_loss": -6.740866661071777, "global_step": 143498, "epoch": 3416} {"train_loss": -6.704479694366455, "global_step": 143499, "epoch": 3416} {"train_loss": -6.717891693115234, "global_step": 143500, "epoch": 3416} {"train_loss": -6.691388130187988, "global_step": 143501, "epoch": 3416} {"train_loss": -6.604642868041992, "global_step": 143502, "epoch": 3416} {"train_loss": -6.705202102661133, "global_step": 143503, "epoch": 3416} {"train_loss": -6.854793548583984, "global_step": 143504, "epoch": 3416} {"train_loss": -6.846467971801758, "global_step": 143505, "epoch": 3416} {"train_loss": -6.750801086425781, "global_step": 143506, "epoch": 3416} {"train_loss": -6.817773818969727, "global_step": 143507, "epoch": 3416} {"train_loss": -6.7737298011779785, "global_step": 143508, "epoch": 3416} {"train_loss": -6.7424750328063965, "global_step": 143509, "epoch": 3416} {"train_loss": -6.708500385284424, "global_step": 143510, "epoch": 3416} {"train_loss": -6.7426605224609375, "global_step": 143511, "epoch": 3416} {"train_loss": -6.766828536987305, "global_step": 143512, "epoch": 3416} {"train_loss": -6.7750701904296875, "global_step": 143513, "epoch": 3416, "val_loss": 68358.9140625} {"train_loss": -6.78529167175293, "global_step": 143514, "epoch": 3417} {"train_loss": -6.803750038146973, "global_step": 143515, "epoch": 3417} {"train_loss": -6.760605812072754, "global_step": 143516, "epoch": 3417} {"train_loss": -6.908622741699219, "global_step": 143517, "epoch": 3417} {"train_loss": -6.795759201049805, "global_step": 143518, "epoch": 3417} {"train_loss": -6.694725513458252, "global_step": 143519, "epoch": 3417} {"train_loss": -6.8931660652160645, "global_step": 143520, "epoch": 3417} {"train_loss": -6.764031410217285, "global_step": 143521, "epoch": 3417} {"train_loss": -6.731291770935059, "global_step": 143522, "epoch": 3417} {"train_loss": -6.878325462341309, "global_step": 143523, "epoch": 3417} {"train_loss": -6.825650215148926, "global_step": 143524, "epoch": 3417} {"train_loss": -6.695840835571289, "global_step": 143525, "epoch": 3417} {"train_loss": -6.796938896179199, "global_step": 143526, "epoch": 3417} {"train_loss": -6.923131942749023, "global_step": 143527, "epoch": 3417} {"train_loss": -6.811802864074707, "global_step": 143528, "epoch": 3417} {"train_loss": -6.678348541259766, "global_step": 143529, "epoch": 3417} {"train_loss": -6.636476993560791, "global_step": 143530, "epoch": 3417} {"train_loss": -6.847264289855957, "global_step": 143531, "epoch": 3417} {"train_loss": -6.721118927001953, "global_step": 143532, "epoch": 3417} {"train_loss": -6.717092514038086, "global_step": 143533, "epoch": 3417} {"train_loss": -6.816928863525391, "global_step": 143534, "epoch": 3417} {"train_loss": -6.830535411834717, "global_step": 143535, "epoch": 3417} {"train_loss": -6.765363693237305, "global_step": 143536, "epoch": 3417} {"train_loss": -6.730717658996582, "global_step": 143537, "epoch": 3417} {"train_loss": -6.758606910705566, "global_step": 143538, "epoch": 3417} {"train_loss": -6.794395923614502, "global_step": 143539, "epoch": 3417} {"train_loss": -6.755059242248535, "global_step": 143540, "epoch": 3417} {"train_loss": -6.687150001525879, "global_step": 143541, "epoch": 3417} {"train_loss": -6.679672718048096, "global_step": 143542, "epoch": 3417} {"train_loss": -6.787221908569336, "global_step": 143543, "epoch": 3417} {"train_loss": -6.642411231994629, "global_step": 143544, "epoch": 3417} {"train_loss": -6.657037734985352, "global_step": 143545, "epoch": 3417} {"train_loss": -6.7956156730651855, "global_step": 143546, "epoch": 3417} {"train_loss": -6.565793037414551, "global_step": 143547, "epoch": 3417} {"train_loss": -6.688392639160156, "global_step": 143548, "epoch": 3417} {"train_loss": -6.68990421295166, "global_step": 143549, "epoch": 3417} {"train_loss": -6.727449417114258, "global_step": 143550, "epoch": 3417} {"train_loss": -6.746734619140625, "global_step": 143551, "epoch": 3417} {"train_loss": -6.828815460205078, "global_step": 143552, "epoch": 3417} {"train_loss": -6.665068626403809, "global_step": 143553, "epoch": 3417} {"train_loss": -6.733417510986328, "global_step": 143554, "epoch": 3417} {"train_loss": -6.755605992816744, "global_step": 143555, "epoch": 3417, "val_loss": 68671.0546875} {"train_loss": -6.668740272521973, "global_step": 143556, "epoch": 3418} {"train_loss": -6.68977165222168, "global_step": 143557, "epoch": 3418} {"train_loss": -6.733956813812256, "global_step": 143558, "epoch": 3418} {"train_loss": -6.5856122970581055, "global_step": 143559, "epoch": 3418} {"train_loss": -6.765348434448242, "global_step": 143560, "epoch": 3418} {"train_loss": -6.625959873199463, "global_step": 143561, "epoch": 3418} {"train_loss": -6.718865394592285, "global_step": 143562, "epoch": 3418} {"train_loss": -6.810859680175781, "global_step": 143563, "epoch": 3418} {"train_loss": -6.701415061950684, "global_step": 143564, "epoch": 3418} {"train_loss": -6.721283912658691, "global_step": 143565, "epoch": 3418} {"train_loss": -6.684479713439941, "global_step": 143566, "epoch": 3418} {"train_loss": -6.758028030395508, "global_step": 143567, "epoch": 3418} {"train_loss": -6.745100975036621, "global_step": 143568, "epoch": 3418} {"train_loss": -6.829793453216553, "global_step": 143569, "epoch": 3418} {"train_loss": -6.867404937744141, "global_step": 143570, "epoch": 3418} {"train_loss": -6.648563861846924, "global_step": 143571, "epoch": 3418} {"train_loss": -6.706464767456055, "global_step": 143572, "epoch": 3418} {"train_loss": -6.823796272277832, "global_step": 143573, "epoch": 3418} {"train_loss": -6.815583229064941, "global_step": 143574, "epoch": 3418} {"train_loss": -6.737700462341309, "global_step": 143575, "epoch": 3418} {"train_loss": -6.772150993347168, "global_step": 143576, "epoch": 3418} {"train_loss": -6.82517147064209, "global_step": 143577, "epoch": 3418} {"train_loss": -6.8538618087768555, "global_step": 143578, "epoch": 3418} {"train_loss": -6.762395858764648, "global_step": 143579, "epoch": 3418} {"train_loss": -6.698668003082275, "global_step": 143580, "epoch": 3418} {"train_loss": -6.6915154457092285, "global_step": 143581, "epoch": 3418} {"train_loss": -6.6961774826049805, "global_step": 143582, "epoch": 3418} {"train_loss": -6.701292037963867, "global_step": 143583, "epoch": 3418} {"train_loss": -6.705626487731934, "global_step": 143584, "epoch": 3418} {"train_loss": -6.681445121765137, "global_step": 143585, "epoch": 3418} {"train_loss": -6.800693511962891, "global_step": 143586, "epoch": 3418} {"train_loss": -6.639017105102539, "global_step": 143587, "epoch": 3418} {"train_loss": -6.775386810302734, "global_step": 143588, "epoch": 3418} {"train_loss": -6.690678596496582, "global_step": 143589, "epoch": 3418} {"train_loss": -6.759626388549805, "global_step": 143590, "epoch": 3418} {"train_loss": -6.76917839050293, "global_step": 143591, "epoch": 3418} {"train_loss": -6.774350643157959, "global_step": 143592, "epoch": 3418} {"train_loss": -6.757803440093994, "global_step": 143593, "epoch": 3418} {"train_loss": -6.760709762573242, "global_step": 143594, "epoch": 3418} {"train_loss": -6.756025791168213, "global_step": 143595, "epoch": 3418} {"train_loss": -6.814684867858887, "global_step": 143596, "epoch": 3418} {"train_loss": -6.739489260173979, "global_step": 143597, "epoch": 3418, "val_loss": 68395.515625} {"train_loss": -6.801732540130615, "global_step": 143598, "epoch": 3419} {"train_loss": -6.87965202331543, "global_step": 143599, "epoch": 3419} {"train_loss": -6.787580966949463, "global_step": 143600, "epoch": 3419} {"train_loss": -6.760419845581055, "global_step": 143601, "epoch": 3419} {"train_loss": -6.73993444442749, "global_step": 143602, "epoch": 3419} {"train_loss": -6.756731033325195, "global_step": 143603, "epoch": 3419} {"train_loss": -6.739112854003906, "global_step": 143604, "epoch": 3419} {"train_loss": -6.84364128112793, "global_step": 143605, "epoch": 3419} {"train_loss": -6.8731842041015625, "global_step": 143606, "epoch": 3419} {"train_loss": -6.782227039337158, "global_step": 143607, "epoch": 3419} {"train_loss": -6.9054412841796875, "global_step": 143608, "epoch": 3419} {"train_loss": -6.710929870605469, "global_step": 143609, "epoch": 3419} {"train_loss": -6.895946502685547, "global_step": 143610, "epoch": 3419} {"train_loss": -6.764991760253906, "global_step": 143611, "epoch": 3419} {"train_loss": -6.803949356079102, "global_step": 143612, "epoch": 3419} {"train_loss": -6.841416358947754, "global_step": 143613, "epoch": 3419} {"train_loss": -6.826592445373535, "global_step": 143614, "epoch": 3419} {"train_loss": -6.824239730834961, "global_step": 143615, "epoch": 3419} {"train_loss": -6.730597496032715, "global_step": 143616, "epoch": 3419} {"train_loss": -6.7526750564575195, "global_step": 143617, "epoch": 3419} {"train_loss": -6.840481758117676, "global_step": 143618, "epoch": 3419} {"train_loss": -6.624715328216553, "global_step": 143619, "epoch": 3419} {"train_loss": -6.872133731842041, "global_step": 143620, "epoch": 3419} {"train_loss": -6.793087005615234, "global_step": 143621, "epoch": 3419} {"train_loss": -6.694567680358887, "global_step": 143622, "epoch": 3419} {"train_loss": -6.754256248474121, "global_step": 143623, "epoch": 3419} {"train_loss": -6.76279354095459, "global_step": 143624, "epoch": 3419} {"train_loss": -6.7912492752075195, "global_step": 143625, "epoch": 3419} {"train_loss": -6.817706108093262, "global_step": 143626, "epoch": 3419} {"train_loss": -6.725560665130615, "global_step": 143627, "epoch": 3419} {"train_loss": -6.760597229003906, "global_step": 143628, "epoch": 3419} {"train_loss": -6.756956100463867, "global_step": 143629, "epoch": 3419} {"train_loss": -6.741764545440674, "global_step": 143630, "epoch": 3419} {"train_loss": -6.752453327178955, "global_step": 143631, "epoch": 3419} {"train_loss": -6.824062347412109, "global_step": 143632, "epoch": 3419} {"train_loss": -6.759276866912842, "global_step": 143633, "epoch": 3419} {"train_loss": -6.7389326095581055, "global_step": 143634, "epoch": 3419} {"train_loss": -6.835169315338135, "global_step": 143635, "epoch": 3419} {"train_loss": -6.711066722869873, "global_step": 143636, "epoch": 3419} {"train_loss": -6.803917407989502, "global_step": 143637, "epoch": 3419} {"train_loss": -6.702558517456055, "global_step": 143638, "epoch": 3419} {"train_loss": -6.779638233638945, "global_step": 143639, "epoch": 3419, "val_loss": 68233.875} {"train_loss": -6.881997585296631, "global_step": 143640, "epoch": 3420} {"train_loss": -6.694144248962402, "global_step": 143641, "epoch": 3420} {"train_loss": -6.787810325622559, "global_step": 143642, "epoch": 3420} {"train_loss": -6.747814655303955, "global_step": 143643, "epoch": 3420} {"train_loss": -6.763571739196777, "global_step": 143644, "epoch": 3420} {"train_loss": -6.831356525421143, "global_step": 143645, "epoch": 3420} {"train_loss": -6.795029640197754, "global_step": 143646, "epoch": 3420} {"train_loss": -6.744488716125488, "global_step": 143647, "epoch": 3420} {"train_loss": -6.827242374420166, "global_step": 143648, "epoch": 3420} {"train_loss": -6.88163948059082, "global_step": 143649, "epoch": 3420} {"train_loss": -6.955994606018066, "global_step": 143650, "epoch": 3420} {"train_loss": -6.865854263305664, "global_step": 143651, "epoch": 3420} {"train_loss": -6.668323516845703, "global_step": 143652, "epoch": 3420} {"train_loss": -6.6470947265625, "global_step": 143653, "epoch": 3420} {"train_loss": -6.6731438636779785, "global_step": 143654, "epoch": 3420} {"train_loss": -6.770254135131836, "global_step": 143655, "epoch": 3420} {"train_loss": -6.6998982429504395, "global_step": 143656, "epoch": 3420} {"train_loss": -6.792301177978516, "global_step": 143657, "epoch": 3420} {"train_loss": -6.8326826095581055, "global_step": 143658, "epoch": 3420} {"train_loss": -6.789575576782227, "global_step": 143659, "epoch": 3420} {"train_loss": -6.821301460266113, "global_step": 143660, "epoch": 3420} {"train_loss": -6.701631546020508, "global_step": 143661, "epoch": 3420} {"train_loss": -6.74714469909668, "global_step": 143662, "epoch": 3420} {"train_loss": -6.673469066619873, "global_step": 143663, "epoch": 3420} {"train_loss": -6.856664657592773, "global_step": 143664, "epoch": 3420} {"train_loss": -6.799001216888428, "global_step": 143665, "epoch": 3420} {"train_loss": -6.749083518981934, "global_step": 143666, "epoch": 3420} {"train_loss": -6.738380432128906, "global_step": 143667, "epoch": 3420} {"train_loss": -6.72556734085083, "global_step": 143668, "epoch": 3420} {"train_loss": -6.698362350463867, "global_step": 143669, "epoch": 3420} {"train_loss": -6.780492782592773, "global_step": 143670, "epoch": 3420} {"train_loss": -6.739406585693359, "global_step": 143671, "epoch": 3420} {"train_loss": -6.74664306640625, "global_step": 143672, "epoch": 3420} {"train_loss": -6.690572738647461, "global_step": 143673, "epoch": 3420} {"train_loss": -6.713875770568848, "global_step": 143674, "epoch": 3420} {"train_loss": -6.758547782897949, "global_step": 143675, "epoch": 3420} {"train_loss": -6.877681255340576, "global_step": 143676, "epoch": 3420} {"train_loss": -6.792987823486328, "global_step": 143677, "epoch": 3420} {"train_loss": -6.758972644805908, "global_step": 143678, "epoch": 3420} {"train_loss": -6.8052568435668945, "global_step": 143679, "epoch": 3420} {"train_loss": -6.685091972351074, "global_step": 143680, "epoch": 3420} {"train_loss": -6.7672741413116455, "global_step": 143681, "epoch": 3420, "val_loss": 68376.0078125} {"train_loss": -6.77691650390625, "global_step": 143682, "epoch": 3421} {"train_loss": -6.787718296051025, "global_step": 143683, "epoch": 3421} {"train_loss": -6.743494987487793, "global_step": 143684, "epoch": 3421} {"train_loss": -6.895465850830078, "global_step": 143685, "epoch": 3421} {"train_loss": -6.666197776794434, "global_step": 143686, "epoch": 3421} {"train_loss": -6.740199089050293, "global_step": 143687, "epoch": 3421} {"train_loss": -6.83740234375, "global_step": 143688, "epoch": 3421} {"train_loss": -6.7169389724731445, "global_step": 143689, "epoch": 3421} {"train_loss": -6.673751354217529, "global_step": 143690, "epoch": 3421} {"train_loss": -6.681288719177246, "global_step": 143691, "epoch": 3421} {"train_loss": -6.709650993347168, "global_step": 143692, "epoch": 3421} {"train_loss": -6.81113862991333, "global_step": 143693, "epoch": 3421} {"train_loss": -6.792085647583008, "global_step": 143694, "epoch": 3421} {"train_loss": -6.8730549812316895, "global_step": 143695, "epoch": 3421} {"train_loss": -6.830695629119873, "global_step": 143696, "epoch": 3421} {"train_loss": -6.734972953796387, "global_step": 143697, "epoch": 3421} {"train_loss": -6.787024974822998, "global_step": 143698, "epoch": 3421} {"train_loss": -6.794345378875732, "global_step": 143699, "epoch": 3421} {"train_loss": -6.675675392150879, "global_step": 143700, "epoch": 3421} {"train_loss": -6.778305530548096, "global_step": 143701, "epoch": 3421} {"train_loss": -6.726830005645752, "global_step": 143702, "epoch": 3421} {"train_loss": -6.8318586349487305, "global_step": 143703, "epoch": 3421} {"train_loss": -6.900954723358154, "global_step": 143704, "epoch": 3421} {"train_loss": -6.719894886016846, "global_step": 143705, "epoch": 3421} {"train_loss": -6.811187744140625, "global_step": 143706, "epoch": 3421} {"train_loss": -6.837116241455078, "global_step": 143707, "epoch": 3421} {"train_loss": -6.7786865234375, "global_step": 143708, "epoch": 3421} {"train_loss": -6.817212104797363, "global_step": 143709, "epoch": 3421} {"train_loss": -6.742931365966797, "global_step": 143710, "epoch": 3421} {"train_loss": -6.7106032371521, "global_step": 143711, "epoch": 3421} {"train_loss": -6.806339263916016, "global_step": 143712, "epoch": 3421} {"train_loss": -6.8093132972717285, "global_step": 143713, "epoch": 3421} {"train_loss": -6.759137153625488, "global_step": 143714, "epoch": 3421} {"train_loss": -6.749880313873291, "global_step": 143715, "epoch": 3421} {"train_loss": -6.752904415130615, "global_step": 143716, "epoch": 3421} {"train_loss": -6.638047218322754, "global_step": 143717, "epoch": 3421} {"train_loss": -6.726713180541992, "global_step": 143718, "epoch": 3421} {"train_loss": -6.716004371643066, "global_step": 143719, "epoch": 3421} {"train_loss": -6.7378339767456055, "global_step": 143720, "epoch": 3421} {"train_loss": -6.647990703582764, "global_step": 143721, "epoch": 3421} {"train_loss": -6.627074241638184, "global_step": 143722, "epoch": 3421} {"train_loss": -6.762044849849882, "global_step": 143723, "epoch": 3421, "val_loss": 68445.0078125} {"train_loss": -6.71975040435791, "global_step": 143724, "epoch": 3422} {"train_loss": -6.880451202392578, "global_step": 143725, "epoch": 3422} {"train_loss": -6.682036876678467, "global_step": 143726, "epoch": 3422} {"train_loss": -6.718716621398926, "global_step": 143727, "epoch": 3422} {"train_loss": -6.743862628936768, "global_step": 143728, "epoch": 3422} {"train_loss": -6.72693395614624, "global_step": 143729, "epoch": 3422} {"train_loss": -6.770096778869629, "global_step": 143730, "epoch": 3422} {"train_loss": -6.739668846130371, "global_step": 143731, "epoch": 3422} {"train_loss": -6.768075466156006, "global_step": 143732, "epoch": 3422} {"train_loss": -6.708242893218994, "global_step": 143733, "epoch": 3422} {"train_loss": -6.789694786071777, "global_step": 143734, "epoch": 3422} {"train_loss": -6.606891632080078, "global_step": 143735, "epoch": 3422} {"train_loss": -6.646047592163086, "global_step": 143736, "epoch": 3422} {"train_loss": -6.759889602661133, "global_step": 143737, "epoch": 3422} {"train_loss": -6.697274208068848, "global_step": 143738, "epoch": 3422} {"train_loss": -6.764570713043213, "global_step": 143739, "epoch": 3422} {"train_loss": -6.805929183959961, "global_step": 143740, "epoch": 3422} {"train_loss": -6.653016090393066, "global_step": 143741, "epoch": 3422} {"train_loss": -6.693763732910156, "global_step": 143742, "epoch": 3422} {"train_loss": -6.728050708770752, "global_step": 143743, "epoch": 3422} {"train_loss": -6.797626972198486, "global_step": 143744, "epoch": 3422} {"train_loss": -6.818336009979248, "global_step": 143745, "epoch": 3422} {"train_loss": -6.6650590896606445, "global_step": 143746, "epoch": 3422} {"train_loss": -6.548445701599121, "global_step": 143747, "epoch": 3422} {"train_loss": -6.725851058959961, "global_step": 143748, "epoch": 3422} {"train_loss": -6.705265998840332, "global_step": 143749, "epoch": 3422} {"train_loss": -6.624577522277832, "global_step": 143750, "epoch": 3422} {"train_loss": -6.789535999298096, "global_step": 143751, "epoch": 3422} {"train_loss": -6.731964111328125, "global_step": 143752, "epoch": 3422} {"train_loss": -6.652603626251221, "global_step": 143753, "epoch": 3422} {"train_loss": -6.728826522827148, "global_step": 143754, "epoch": 3422} {"train_loss": -6.65692138671875, "global_step": 143755, "epoch": 3422} {"train_loss": -6.772022247314453, "global_step": 143756, "epoch": 3422} {"train_loss": -6.768594264984131, "global_step": 143757, "epoch": 3422} {"train_loss": -6.6562819480896, "global_step": 143758, "epoch": 3422} {"train_loss": -6.696997165679932, "global_step": 143759, "epoch": 3422} {"train_loss": -6.656837463378906, "global_step": 143760, "epoch": 3422} {"train_loss": -6.645259857177734, "global_step": 143761, "epoch": 3422} {"train_loss": -6.474529266357422, "global_step": 143762, "epoch": 3422} {"train_loss": -6.497800827026367, "global_step": 143763, "epoch": 3422} {"train_loss": -6.713928699493408, "global_step": 143764, "epoch": 3422} {"train_loss": -6.700273036956787, "global_step": 143765, "epoch": 3422, "val_loss": 68500.8046875} {"train_loss": -6.6117706298828125, "global_step": 143766, "epoch": 3423} {"train_loss": -6.600658893585205, "global_step": 143767, "epoch": 3423} {"train_loss": -6.514926910400391, "global_step": 143768, "epoch": 3423} {"train_loss": -6.822377681732178, "global_step": 143769, "epoch": 3423} {"train_loss": -6.6263813972473145, "global_step": 143770, "epoch": 3423} {"train_loss": -6.650768280029297, "global_step": 143771, "epoch": 3423} {"train_loss": -6.708105087280273, "global_step": 143772, "epoch": 3423} {"train_loss": -6.631775856018066, "global_step": 143773, "epoch": 3423} {"train_loss": -6.686426162719727, "global_step": 143774, "epoch": 3423} {"train_loss": -6.783803462982178, "global_step": 143775, "epoch": 3423} {"train_loss": -6.798334121704102, "global_step": 143776, "epoch": 3423} {"train_loss": -6.887403964996338, "global_step": 143777, "epoch": 3423} {"train_loss": -6.830535888671875, "global_step": 143778, "epoch": 3423} {"train_loss": -6.7149248123168945, "global_step": 143779, "epoch": 3423} {"train_loss": -6.736604690551758, "global_step": 143780, "epoch": 3423} {"train_loss": -6.766610622406006, "global_step": 143781, "epoch": 3423} {"train_loss": -6.836611270904541, "global_step": 143782, "epoch": 3423} {"train_loss": -6.806048393249512, "global_step": 143783, "epoch": 3423} {"train_loss": -6.790508270263672, "global_step": 143784, "epoch": 3423} {"train_loss": -6.74626350402832, "global_step": 143785, "epoch": 3423} {"train_loss": -6.897456645965576, "global_step": 143786, "epoch": 3423} {"train_loss": -6.838972568511963, "global_step": 143787, "epoch": 3423} {"train_loss": -6.820985794067383, "global_step": 143788, "epoch": 3423} {"train_loss": -6.878785133361816, "global_step": 143789, "epoch": 3423} {"train_loss": -6.812277317047119, "global_step": 143790, "epoch": 3423} {"train_loss": -6.849386215209961, "global_step": 143791, "epoch": 3423} {"train_loss": -6.834737777709961, "global_step": 143792, "epoch": 3423} {"train_loss": -6.773890495300293, "global_step": 143793, "epoch": 3423} {"train_loss": -6.810067176818848, "global_step": 143794, "epoch": 3423} {"train_loss": -6.764291286468506, "global_step": 143795, "epoch": 3423} {"train_loss": -6.735054016113281, "global_step": 143796, "epoch": 3423} {"train_loss": -6.8201799392700195, "global_step": 143797, "epoch": 3423} {"train_loss": -6.6851091384887695, "global_step": 143798, "epoch": 3423} {"train_loss": -6.828469276428223, "global_step": 143799, "epoch": 3423} {"train_loss": -6.831859588623047, "global_step": 143800, "epoch": 3423} {"train_loss": -6.665787696838379, "global_step": 143801, "epoch": 3423} {"train_loss": -6.644014835357666, "global_step": 143802, "epoch": 3423} {"train_loss": -6.844622611999512, "global_step": 143803, "epoch": 3423} {"train_loss": -6.776082992553711, "global_step": 143804, "epoch": 3423} {"train_loss": -6.732646942138672, "global_step": 143805, "epoch": 3423} {"train_loss": -6.785804748535156, "global_step": 143806, "epoch": 3423} {"train_loss": -6.761068344116211, "global_step": 143807, "epoch": 3423, "val_loss": 68294.421875} {"train_loss": -6.643716812133789, "global_step": 143808, "epoch": 3424} {"train_loss": -6.8425726890563965, "global_step": 143809, "epoch": 3424} {"train_loss": -6.711300373077393, "global_step": 143810, "epoch": 3424} {"train_loss": -6.886188507080078, "global_step": 143811, "epoch": 3424} {"train_loss": -6.786772727966309, "global_step": 143812, "epoch": 3424} {"train_loss": -6.7906880378723145, "global_step": 143813, "epoch": 3424} {"train_loss": -6.8440704345703125, "global_step": 143814, "epoch": 3424} {"train_loss": -6.756893157958984, "global_step": 143815, "epoch": 3424} {"train_loss": -6.637125492095947, "global_step": 143816, "epoch": 3424} {"train_loss": -6.841884136199951, "global_step": 143817, "epoch": 3424} {"train_loss": -6.819916725158691, "global_step": 143818, "epoch": 3424} {"train_loss": -6.69650411605835, "global_step": 143819, "epoch": 3424} {"train_loss": -6.833423137664795, "global_step": 143820, "epoch": 3424} {"train_loss": -6.778407573699951, "global_step": 143821, "epoch": 3424} {"train_loss": -6.772113800048828, "global_step": 143822, "epoch": 3424} {"train_loss": -6.7560553550720215, "global_step": 143823, "epoch": 3424} {"train_loss": -6.847490310668945, "global_step": 143824, "epoch": 3424} {"train_loss": -6.9004411697387695, "global_step": 143825, "epoch": 3424} {"train_loss": -6.727296352386475, "global_step": 143826, "epoch": 3424} {"train_loss": -6.691675186157227, "global_step": 143827, "epoch": 3424} {"train_loss": -6.700730323791504, "global_step": 143828, "epoch": 3424} {"train_loss": -6.763911247253418, "global_step": 143829, "epoch": 3424} {"train_loss": -6.763768196105957, "global_step": 143830, "epoch": 3424} {"train_loss": -6.740486145019531, "global_step": 143831, "epoch": 3424} {"train_loss": -6.787016868591309, "global_step": 143832, "epoch": 3424} {"train_loss": -6.752567768096924, "global_step": 143833, "epoch": 3424} {"train_loss": -6.681604862213135, "global_step": 143834, "epoch": 3424} {"train_loss": -6.667506217956543, "global_step": 143835, "epoch": 3424} {"train_loss": -6.859261512756348, "global_step": 143836, "epoch": 3424} {"train_loss": -6.600911617279053, "global_step": 143837, "epoch": 3424} {"train_loss": -6.675348281860352, "global_step": 143838, "epoch": 3424} {"train_loss": -6.704833507537842, "global_step": 143839, "epoch": 3424} {"train_loss": -6.6059889793396, "global_step": 143840, "epoch": 3424} {"train_loss": -6.810960292816162, "global_step": 143841, "epoch": 3424} {"train_loss": -6.598091125488281, "global_step": 143842, "epoch": 3424} {"train_loss": -6.650884628295898, "global_step": 143843, "epoch": 3424} {"train_loss": -6.739520072937012, "global_step": 143844, "epoch": 3424} {"train_loss": -6.6143598556518555, "global_step": 143845, "epoch": 3424} {"train_loss": -6.733648300170898, "global_step": 143846, "epoch": 3424} {"train_loss": -6.693256855010986, "global_step": 143847, "epoch": 3424} {"train_loss": -6.661397933959961, "global_step": 143848, "epoch": 3424} {"train_loss": -6.739081098919823, "global_step": 143849, "epoch": 3424, "val_loss": 68434.609375} {"train_loss": -6.758540153503418, "global_step": 143850, "epoch": 3425} {"train_loss": -6.878955841064453, "global_step": 143851, "epoch": 3425} {"train_loss": -6.690240859985352, "global_step": 143852, "epoch": 3425} {"train_loss": -6.836531639099121, "global_step": 143853, "epoch": 3425} {"train_loss": -6.789860725402832, "global_step": 143854, "epoch": 3425} {"train_loss": -6.765303611755371, "global_step": 143855, "epoch": 3425} {"train_loss": -6.740998268127441, "global_step": 143856, "epoch": 3425} {"train_loss": -6.791722297668457, "global_step": 143857, "epoch": 3425} {"train_loss": -6.690651893615723, "global_step": 143858, "epoch": 3425} {"train_loss": -6.804172039031982, "global_step": 143859, "epoch": 3425} {"train_loss": -6.784904479980469, "global_step": 143860, "epoch": 3425} {"train_loss": -6.697632789611816, "global_step": 143861, "epoch": 3425} {"train_loss": -6.811491012573242, "global_step": 143862, "epoch": 3425} {"train_loss": -6.774023056030273, "global_step": 143863, "epoch": 3425} {"train_loss": -6.744974136352539, "global_step": 143864, "epoch": 3425} {"train_loss": -6.868133544921875, "global_step": 143865, "epoch": 3425} {"train_loss": -6.8529815673828125, "global_step": 143866, "epoch": 3425} {"train_loss": -6.720104217529297, "global_step": 143867, "epoch": 3425} {"train_loss": -6.76870059967041, "global_step": 143868, "epoch": 3425} {"train_loss": -6.777456283569336, "global_step": 143869, "epoch": 3425} {"train_loss": -6.7494001388549805, "global_step": 143870, "epoch": 3425} {"train_loss": -6.770021438598633, "global_step": 143871, "epoch": 3425} {"train_loss": -6.717823028564453, "global_step": 143872, "epoch": 3425} {"train_loss": -6.686443328857422, "global_step": 143873, "epoch": 3425} {"train_loss": -6.647674083709717, "global_step": 143874, "epoch": 3425} {"train_loss": -6.608933448791504, "global_step": 143875, "epoch": 3425} {"train_loss": -6.7799201011657715, "global_step": 143876, "epoch": 3425} {"train_loss": -6.626830101013184, "global_step": 143877, "epoch": 3425} {"train_loss": -6.730954647064209, "global_step": 143878, "epoch": 3425} {"train_loss": -6.6461381912231445, "global_step": 143879, "epoch": 3425} {"train_loss": -6.689870834350586, "global_step": 143880, "epoch": 3425} {"train_loss": -6.761260986328125, "global_step": 143881, "epoch": 3425} {"train_loss": -6.748552322387695, "global_step": 143882, "epoch": 3425} {"train_loss": -6.7510986328125, "global_step": 143883, "epoch": 3425} {"train_loss": -6.714482307434082, "global_step": 143884, "epoch": 3425} {"train_loss": -6.73093843460083, "global_step": 143885, "epoch": 3425} {"train_loss": -6.733164310455322, "global_step": 143886, "epoch": 3425} {"train_loss": -6.845091819763184, "global_step": 143887, "epoch": 3425} {"train_loss": -6.714266777038574, "global_step": 143888, "epoch": 3425} {"train_loss": -6.655121326446533, "global_step": 143889, "epoch": 3425} {"train_loss": -6.817739486694336, "global_step": 143890, "epoch": 3425} {"train_loss": -6.7499233313969205, "global_step": 143891, "epoch": 3425, "val_loss": 68319.921875} {"train_loss": -6.724189758300781, "global_step": 143892, "epoch": 3426} {"train_loss": -6.750823497772217, "global_step": 143893, "epoch": 3426} {"train_loss": -6.790067672729492, "global_step": 143894, "epoch": 3426} {"train_loss": -6.807102680206299, "global_step": 143895, "epoch": 3426} {"train_loss": -6.739373207092285, "global_step": 143896, "epoch": 3426} {"train_loss": -6.768847465515137, "global_step": 143897, "epoch": 3426} {"train_loss": -6.722353458404541, "global_step": 143898, "epoch": 3426} {"train_loss": -6.8319091796875, "global_step": 143899, "epoch": 3426} {"train_loss": -6.667167663574219, "global_step": 143900, "epoch": 3426} {"train_loss": -6.601832866668701, "global_step": 143901, "epoch": 3426} {"train_loss": -6.685410976409912, "global_step": 143902, "epoch": 3426} {"train_loss": -6.825920581817627, "global_step": 143903, "epoch": 3426} {"train_loss": -6.624520301818848, "global_step": 143904, "epoch": 3426} {"train_loss": -6.71315860748291, "global_step": 143905, "epoch": 3426} {"train_loss": -6.658989906311035, "global_step": 143906, "epoch": 3426} {"train_loss": -6.704748630523682, "global_step": 143907, "epoch": 3426} {"train_loss": -6.558627128601074, "global_step": 143908, "epoch": 3426} {"train_loss": -6.747488975524902, "global_step": 143909, "epoch": 3426} {"train_loss": -6.656597137451172, "global_step": 143910, "epoch": 3426} {"train_loss": -6.74229097366333, "global_step": 143911, "epoch": 3426} {"train_loss": -6.790894508361816, "global_step": 143912, "epoch": 3426} {"train_loss": -6.744176387786865, "global_step": 143913, "epoch": 3426} {"train_loss": -6.731078147888184, "global_step": 143914, "epoch": 3426} {"train_loss": -6.62722110748291, "global_step": 143915, "epoch": 3426} {"train_loss": -6.6135969161987305, "global_step": 143916, "epoch": 3426} {"train_loss": -6.7014055252075195, "global_step": 143917, "epoch": 3426} {"train_loss": -6.687979698181152, "global_step": 143918, "epoch": 3426} {"train_loss": -6.737513065338135, "global_step": 143919, "epoch": 3426} {"train_loss": -6.781495094299316, "global_step": 143920, "epoch": 3426} {"train_loss": -6.63308048248291, "global_step": 143921, "epoch": 3426} {"train_loss": -6.7902421951293945, "global_step": 143922, "epoch": 3426} {"train_loss": -6.601661682128906, "global_step": 143923, "epoch": 3426} {"train_loss": -6.687300682067871, "global_step": 143924, "epoch": 3426} {"train_loss": -6.756321907043457, "global_step": 143925, "epoch": 3426} {"train_loss": -6.784994125366211, "global_step": 143926, "epoch": 3426} {"train_loss": -6.776670932769775, "global_step": 143927, "epoch": 3426} {"train_loss": -6.801210403442383, "global_step": 143928, "epoch": 3426} {"train_loss": -6.834695816040039, "global_step": 143929, "epoch": 3426} {"train_loss": -6.749870777130127, "global_step": 143930, "epoch": 3426} {"train_loss": -6.691411972045898, "global_step": 143931, "epoch": 3426} {"train_loss": -6.767104148864746, "global_step": 143932, "epoch": 3426} {"train_loss": -6.725937480018253, "global_step": 143933, "epoch": 3426, "val_loss": 68343.1640625} {"train_loss": -6.767355442047119, "global_step": 143934, "epoch": 3427} {"train_loss": -6.734531402587891, "global_step": 143935, "epoch": 3427} {"train_loss": -6.68010950088501, "global_step": 143936, "epoch": 3427} {"train_loss": -6.646766662597656, "global_step": 143937, "epoch": 3427} {"train_loss": -6.686963081359863, "global_step": 143938, "epoch": 3427} {"train_loss": -6.773768424987793, "global_step": 143939, "epoch": 3427} {"train_loss": -6.6537628173828125, "global_step": 143940, "epoch": 3427} {"train_loss": -6.761888027191162, "global_step": 143941, "epoch": 3427} {"train_loss": -6.6629838943481445, "global_step": 143942, "epoch": 3427} {"train_loss": -6.694361686706543, "global_step": 143943, "epoch": 3427} {"train_loss": -6.664584159851074, "global_step": 143944, "epoch": 3427} {"train_loss": -6.658864974975586, "global_step": 143945, "epoch": 3427} {"train_loss": -6.728970050811768, "global_step": 143946, "epoch": 3427} {"train_loss": -6.5757155418396, "global_step": 143947, "epoch": 3427} {"train_loss": -6.829920768737793, "global_step": 143948, "epoch": 3427} {"train_loss": -6.747964859008789, "global_step": 143949, "epoch": 3427} {"train_loss": -6.656416416168213, "global_step": 143950, "epoch": 3427} {"train_loss": -6.752488136291504, "global_step": 143951, "epoch": 3427} {"train_loss": -6.721108436584473, "global_step": 143952, "epoch": 3427} {"train_loss": -6.757407188415527, "global_step": 143953, "epoch": 3427} {"train_loss": -6.6204142570495605, "global_step": 143954, "epoch": 3427} {"train_loss": -6.6975507736206055, "global_step": 143955, "epoch": 3427} {"train_loss": -6.799167633056641, "global_step": 143956, "epoch": 3427} {"train_loss": -6.673563003540039, "global_step": 143957, "epoch": 3427} {"train_loss": -6.665804386138916, "global_step": 143958, "epoch": 3427} {"train_loss": -6.804323673248291, "global_step": 143959, "epoch": 3427} {"train_loss": -6.692641258239746, "global_step": 143960, "epoch": 3427} {"train_loss": -6.723604202270508, "global_step": 143961, "epoch": 3427} {"train_loss": -6.768700122833252, "global_step": 143962, "epoch": 3427} {"train_loss": -6.7631988525390625, "global_step": 143963, "epoch": 3427} {"train_loss": -6.695220947265625, "global_step": 143964, "epoch": 3427} {"train_loss": -6.745325088500977, "global_step": 143965, "epoch": 3427} {"train_loss": -6.752439022064209, "global_step": 143966, "epoch": 3427} {"train_loss": -6.662275314331055, "global_step": 143967, "epoch": 3427} {"train_loss": -6.782388210296631, "global_step": 143968, "epoch": 3427} {"train_loss": -6.722540378570557, "global_step": 143969, "epoch": 3427} {"train_loss": -6.760522365570068, "global_step": 143970, "epoch": 3427} {"train_loss": -6.705774784088135, "global_step": 143971, "epoch": 3427} {"train_loss": -6.649013042449951, "global_step": 143972, "epoch": 3427} {"train_loss": -6.777440071105957, "global_step": 143973, "epoch": 3427} {"train_loss": -6.821094989776611, "global_step": 143974, "epoch": 3427} {"train_loss": -6.71938909803118, "global_step": 143975, "epoch": 3427, "val_loss": 68306.1015625} {"train_loss": -6.713041305541992, "global_step": 143976, "epoch": 3428} {"train_loss": -6.773841857910156, "global_step": 143977, "epoch": 3428} {"train_loss": -6.777759552001953, "global_step": 143978, "epoch": 3428} {"train_loss": -6.681886196136475, "global_step": 143979, "epoch": 3428} {"train_loss": -6.73062801361084, "global_step": 143980, "epoch": 3428} {"train_loss": -6.782264709472656, "global_step": 143981, "epoch": 3428} {"train_loss": -6.79947566986084, "global_step": 143982, "epoch": 3428} {"train_loss": -6.881613731384277, "global_step": 143983, "epoch": 3428} {"train_loss": -6.696181297302246, "global_step": 143984, "epoch": 3428} {"train_loss": -6.853651523590088, "global_step": 143985, "epoch": 3428} {"train_loss": -6.649989604949951, "global_step": 143986, "epoch": 3428} {"train_loss": -6.7010908126831055, "global_step": 143987, "epoch": 3428} {"train_loss": -6.765801429748535, "global_step": 143988, "epoch": 3428} {"train_loss": -6.710305213928223, "global_step": 143989, "epoch": 3428} {"train_loss": -6.858557224273682, "global_step": 143990, "epoch": 3428} {"train_loss": -6.8664140701293945, "global_step": 143991, "epoch": 3428} {"train_loss": -6.714388370513916, "global_step": 143992, "epoch": 3428} {"train_loss": -6.817305564880371, "global_step": 143993, "epoch": 3428} {"train_loss": -6.734261512756348, "global_step": 143994, "epoch": 3428} {"train_loss": -6.779634475708008, "global_step": 143995, "epoch": 3428} {"train_loss": -6.7472052574157715, "global_step": 143996, "epoch": 3428} {"train_loss": -6.841754913330078, "global_step": 143997, "epoch": 3428} {"train_loss": -6.822412967681885, "global_step": 143998, "epoch": 3428} {"train_loss": -6.75631856918335, "global_step": 143999, "epoch": 3428} {"train_loss": -6.765398025512695, "global_step": 144000, "epoch": 3428} {"train_loss": -6.665155410766602, "global_step": 144001, "epoch": 3428} {"train_loss": -6.728172302246094, "global_step": 144002, "epoch": 3428} {"train_loss": -6.798213005065918, "global_step": 144003, "epoch": 3428} {"train_loss": -6.743365287780762, "global_step": 144004, "epoch": 3428} {"train_loss": -6.774843215942383, "global_step": 144005, "epoch": 3428} {"train_loss": -6.718608379364014, "global_step": 144006, "epoch": 3428} {"train_loss": -6.779489040374756, "global_step": 144007, "epoch": 3428} {"train_loss": -6.793912887573242, "global_step": 144008, "epoch": 3428} {"train_loss": -6.764434814453125, "global_step": 144009, "epoch": 3428} {"train_loss": -6.932312488555908, "global_step": 144010, "epoch": 3428} {"train_loss": -6.817049980163574, "global_step": 144011, "epoch": 3428} {"train_loss": -6.814582824707031, "global_step": 144012, "epoch": 3428} {"train_loss": -6.901073455810547, "global_step": 144013, "epoch": 3428} {"train_loss": -6.833322525024414, "global_step": 144014, "epoch": 3428} {"train_loss": -6.781251430511475, "global_step": 144015, "epoch": 3428} {"train_loss": -6.7457990646362305, "global_step": 144016, "epoch": 3428} {"train_loss": -6.774605660211472, "global_step": 144017, "epoch": 3428, "val_loss": 68457.2109375} {"train_loss": -6.837255477905273, "global_step": 144018, "epoch": 3429} {"train_loss": -6.835276126861572, "global_step": 144019, "epoch": 3429} {"train_loss": -6.800637245178223, "global_step": 144020, "epoch": 3429} {"train_loss": -6.870235443115234, "global_step": 144021, "epoch": 3429} {"train_loss": -6.6881632804870605, "global_step": 144022, "epoch": 3429} {"train_loss": -6.700660705566406, "global_step": 144023, "epoch": 3429} {"train_loss": -6.806874752044678, "global_step": 144024, "epoch": 3429} {"train_loss": -6.608428955078125, "global_step": 144025, "epoch": 3429} {"train_loss": -6.744603157043457, "global_step": 144026, "epoch": 3429} {"train_loss": -6.836370468139648, "global_step": 144027, "epoch": 3429} {"train_loss": -6.843977928161621, "global_step": 144028, "epoch": 3429} {"train_loss": -6.792095184326172, "global_step": 144029, "epoch": 3429} {"train_loss": -6.784986972808838, "global_step": 144030, "epoch": 3429} {"train_loss": -6.9395647048950195, "global_step": 144031, "epoch": 3429} {"train_loss": -6.662965774536133, "global_step": 144032, "epoch": 3429} {"train_loss": -6.523293972015381, "global_step": 144033, "epoch": 3429} {"train_loss": -6.66611385345459, "global_step": 144034, "epoch": 3429} {"train_loss": -6.801766395568848, "global_step": 144035, "epoch": 3429} {"train_loss": -6.6964921951293945, "global_step": 144036, "epoch": 3429} {"train_loss": -6.687716484069824, "global_step": 144037, "epoch": 3429} {"train_loss": -6.806118965148926, "global_step": 144038, "epoch": 3429} {"train_loss": -6.606581687927246, "global_step": 144039, "epoch": 3429} {"train_loss": -6.72965669631958, "global_step": 144040, "epoch": 3429} {"train_loss": -6.682415008544922, "global_step": 144041, "epoch": 3429} {"train_loss": -6.755564212799072, "global_step": 144042, "epoch": 3429} {"train_loss": -6.846818447113037, "global_step": 144043, "epoch": 3429} {"train_loss": -6.699737071990967, "global_step": 144044, "epoch": 3429} {"train_loss": -6.788560390472412, "global_step": 144045, "epoch": 3429} {"train_loss": -6.675368309020996, "global_step": 144046, "epoch": 3429} {"train_loss": -6.64324426651001, "global_step": 144047, "epoch": 3429} {"train_loss": -6.750530242919922, "global_step": 144048, "epoch": 3429} {"train_loss": -6.868025302886963, "global_step": 144049, "epoch": 3429} {"train_loss": -6.790905952453613, "global_step": 144050, "epoch": 3429} {"train_loss": -6.705373287200928, "global_step": 144051, "epoch": 3429} {"train_loss": -6.81958532333374, "global_step": 144052, "epoch": 3429} {"train_loss": -6.704022407531738, "global_step": 144053, "epoch": 3429} {"train_loss": -6.762724876403809, "global_step": 144054, "epoch": 3429} {"train_loss": -6.692241668701172, "global_step": 144055, "epoch": 3429} {"train_loss": -6.7054643630981445, "global_step": 144056, "epoch": 3429} {"train_loss": -6.717609882354736, "global_step": 144057, "epoch": 3429} {"train_loss": -6.557757377624512, "global_step": 144058, "epoch": 3429} {"train_loss": -6.742764518374488, "global_step": 144059, "epoch": 3429, "val_loss": 68537.421875} {"train_loss": -6.5783891677856445, "global_step": 144060, "epoch": 3430} {"train_loss": -6.650567054748535, "global_step": 144061, "epoch": 3430} {"train_loss": -6.830280303955078, "global_step": 144062, "epoch": 3430} {"train_loss": -6.676403999328613, "global_step": 144063, "epoch": 3430} {"train_loss": -6.76835823059082, "global_step": 144064, "epoch": 3430} {"train_loss": -6.79144287109375, "global_step": 144065, "epoch": 3430} {"train_loss": -6.764834880828857, "global_step": 144066, "epoch": 3430} {"train_loss": -6.811933994293213, "global_step": 144067, "epoch": 3430} {"train_loss": -6.769007205963135, "global_step": 144068, "epoch": 3430} {"train_loss": -6.823805809020996, "global_step": 144069, "epoch": 3430} {"train_loss": -6.7489118576049805, "global_step": 144070, "epoch": 3430} {"train_loss": -6.822909355163574, "global_step": 144071, "epoch": 3430} {"train_loss": -6.75567626953125, "global_step": 144072, "epoch": 3430} {"train_loss": -6.715538024902344, "global_step": 144073, "epoch": 3430} {"train_loss": -6.701900482177734, "global_step": 144074, "epoch": 3430} {"train_loss": -6.791983604431152, "global_step": 144075, "epoch": 3430} {"train_loss": -6.751397132873535, "global_step": 144076, "epoch": 3430} {"train_loss": -6.7848639488220215, "global_step": 144077, "epoch": 3430} {"train_loss": -6.807534694671631, "global_step": 144078, "epoch": 3430} {"train_loss": -6.791737079620361, "global_step": 144079, "epoch": 3430} {"train_loss": -6.704070568084717, "global_step": 144080, "epoch": 3430} {"train_loss": -6.776308059692383, "global_step": 144081, "epoch": 3430} {"train_loss": -6.890041828155518, "global_step": 144082, "epoch": 3430} {"train_loss": -6.721593856811523, "global_step": 144083, "epoch": 3430} {"train_loss": -6.803375244140625, "global_step": 144084, "epoch": 3430} {"train_loss": -6.717337608337402, "global_step": 144085, "epoch": 3430} {"train_loss": -6.7054643630981445, "global_step": 144086, "epoch": 3430} {"train_loss": -6.5687713623046875, "global_step": 144087, "epoch": 3430} {"train_loss": -6.7014007568359375, "global_step": 144088, "epoch": 3430} {"train_loss": -6.673496723175049, "global_step": 144089, "epoch": 3430} {"train_loss": -6.65138053894043, "global_step": 144090, "epoch": 3430} {"train_loss": -6.725593566894531, "global_step": 144091, "epoch": 3430} {"train_loss": -6.744733810424805, "global_step": 144092, "epoch": 3430} {"train_loss": -6.726625442504883, "global_step": 144093, "epoch": 3430} {"train_loss": -6.768930912017822, "global_step": 144094, "epoch": 3430} {"train_loss": -6.746038913726807, "global_step": 144095, "epoch": 3430} {"train_loss": -6.630364894866943, "global_step": 144096, "epoch": 3430} {"train_loss": -6.851718902587891, "global_step": 144097, "epoch": 3430} {"train_loss": -6.6704816818237305, "global_step": 144098, "epoch": 3430} {"train_loss": -6.7486724853515625, "global_step": 144099, "epoch": 3430} {"train_loss": -6.719831943511963, "global_step": 144100, "epoch": 3430} {"train_loss": -6.738812435240972, "global_step": 144101, "epoch": 3430, "val_loss": 68275.796875} {"train_loss": -6.700943946838379, "global_step": 144102, "epoch": 3431} {"train_loss": -6.64731502532959, "global_step": 144103, "epoch": 3431} {"train_loss": -6.814655780792236, "global_step": 144104, "epoch": 3431} {"train_loss": -6.768453598022461, "global_step": 144105, "epoch": 3431} {"train_loss": -6.743788719177246, "global_step": 144106, "epoch": 3431} {"train_loss": -6.843144416809082, "global_step": 144107, "epoch": 3431} {"train_loss": -6.710396766662598, "global_step": 144108, "epoch": 3431} {"train_loss": -6.70236873626709, "global_step": 144109, "epoch": 3431} {"train_loss": -6.745753288269043, "global_step": 144110, "epoch": 3431} {"train_loss": -6.830704212188721, "global_step": 144111, "epoch": 3431} {"train_loss": -6.87058687210083, "global_step": 144112, "epoch": 3431} {"train_loss": -6.784362316131592, "global_step": 144113, "epoch": 3431} {"train_loss": -6.796092987060547, "global_step": 144114, "epoch": 3431} {"train_loss": -6.724830627441406, "global_step": 144115, "epoch": 3431} {"train_loss": -6.901797294616699, "global_step": 144116, "epoch": 3431} {"train_loss": -6.851728916168213, "global_step": 144117, "epoch": 3431} {"train_loss": -6.888089656829834, "global_step": 144118, "epoch": 3431} {"train_loss": -6.892996788024902, "global_step": 144119, "epoch": 3431} {"train_loss": -6.826839447021484, "global_step": 144120, "epoch": 3431} {"train_loss": -6.832472801208496, "global_step": 144121, "epoch": 3431} {"train_loss": -6.729104995727539, "global_step": 144122, "epoch": 3431} {"train_loss": -6.803106784820557, "global_step": 144123, "epoch": 3431} {"train_loss": -6.809939861297607, "global_step": 144124, "epoch": 3431} {"train_loss": -6.831465244293213, "global_step": 144125, "epoch": 3431} {"train_loss": -6.8009538650512695, "global_step": 144126, "epoch": 3431} {"train_loss": -6.780096530914307, "global_step": 144127, "epoch": 3431} {"train_loss": -6.803051471710205, "global_step": 144128, "epoch": 3431} {"train_loss": -6.710749626159668, "global_step": 144129, "epoch": 3431} {"train_loss": -6.852445125579834, "global_step": 144130, "epoch": 3431} {"train_loss": -6.738292217254639, "global_step": 144131, "epoch": 3431} {"train_loss": -6.734558582305908, "global_step": 144132, "epoch": 3431} {"train_loss": -6.700711727142334, "global_step": 144133, "epoch": 3431} {"train_loss": -6.579141616821289, "global_step": 144134, "epoch": 3431} {"train_loss": -6.820115089416504, "global_step": 144135, "epoch": 3431} {"train_loss": -6.658413887023926, "global_step": 144136, "epoch": 3431} {"train_loss": -6.715016841888428, "global_step": 144137, "epoch": 3431} {"train_loss": -6.7304463386535645, "global_step": 144138, "epoch": 3431} {"train_loss": -6.550623893737793, "global_step": 144139, "epoch": 3431} {"train_loss": -6.609282493591309, "global_step": 144140, "epoch": 3431} {"train_loss": -6.63868522644043, "global_step": 144141, "epoch": 3431} {"train_loss": -6.630731582641602, "global_step": 144142, "epoch": 3431} {"train_loss": -6.756740604128156, "global_step": 144143, "epoch": 3431, "val_loss": 68588.96875} {"train_loss": -6.7542877197265625, "global_step": 144144, "epoch": 3432} {"train_loss": -6.628864288330078, "global_step": 144145, "epoch": 3432} {"train_loss": -6.6073760986328125, "global_step": 144146, "epoch": 3432} {"train_loss": -6.765203475952148, "global_step": 144147, "epoch": 3432} {"train_loss": -6.641997814178467, "global_step": 144148, "epoch": 3432} {"train_loss": -6.587800025939941, "global_step": 144149, "epoch": 3432} {"train_loss": -6.554105758666992, "global_step": 144150, "epoch": 3432} {"train_loss": -6.800278663635254, "global_step": 144151, "epoch": 3432} {"train_loss": -6.504447937011719, "global_step": 144152, "epoch": 3432} {"train_loss": -6.771603107452393, "global_step": 144153, "epoch": 3432} {"train_loss": -6.640058994293213, "global_step": 144154, "epoch": 3432} {"train_loss": -6.654449462890625, "global_step": 144155, "epoch": 3432} {"train_loss": -6.603452682495117, "global_step": 144156, "epoch": 3432} {"train_loss": -6.669332504272461, "global_step": 144157, "epoch": 3432} {"train_loss": -6.739748001098633, "global_step": 144158, "epoch": 3432} {"train_loss": -6.704431056976318, "global_step": 144159, "epoch": 3432} {"train_loss": -6.691617012023926, "global_step": 144160, "epoch": 3432} {"train_loss": -6.848970890045166, "global_step": 144161, "epoch": 3432} {"train_loss": -6.6210222244262695, "global_step": 144162, "epoch": 3432} {"train_loss": -6.82172966003418, "global_step": 144163, "epoch": 3432} {"train_loss": -6.661025524139404, "global_step": 144164, "epoch": 3432} {"train_loss": -6.692238807678223, "global_step": 144165, "epoch": 3432} {"train_loss": -6.792770862579346, "global_step": 144166, "epoch": 3432} {"train_loss": -6.7299041748046875, "global_step": 144167, "epoch": 3432} {"train_loss": -6.72062349319458, "global_step": 144168, "epoch": 3432} {"train_loss": -6.7311296463012695, "global_step": 144169, "epoch": 3432} {"train_loss": -6.871731281280518, "global_step": 144170, "epoch": 3432} {"train_loss": -6.764363765716553, "global_step": 144171, "epoch": 3432} {"train_loss": -6.808484077453613, "global_step": 144172, "epoch": 3432} {"train_loss": -6.8014421463012695, "global_step": 144173, "epoch": 3432} {"train_loss": -6.749755859375, "global_step": 144174, "epoch": 3432} {"train_loss": -6.764334201812744, "global_step": 144175, "epoch": 3432} {"train_loss": -6.706559181213379, "global_step": 144176, "epoch": 3432} {"train_loss": -6.760563373565674, "global_step": 144177, "epoch": 3432} {"train_loss": -6.695817947387695, "global_step": 144178, "epoch": 3432} {"train_loss": -6.788758277893066, "global_step": 144179, "epoch": 3432} {"train_loss": -6.83251428604126, "global_step": 144180, "epoch": 3432} {"train_loss": -6.7672882080078125, "global_step": 144181, "epoch": 3432} {"train_loss": -6.766125679016113, "global_step": 144182, "epoch": 3432} {"train_loss": -6.765460014343262, "global_step": 144183, "epoch": 3432} {"train_loss": -6.730629920959473, "global_step": 144184, "epoch": 3432} {"train_loss": -6.719157854715983, "global_step": 144185, "epoch": 3432, "val_loss": 68352.6484375} {"train_loss": -6.769003391265869, "global_step": 144186, "epoch": 3433} {"train_loss": -6.839313983917236, "global_step": 144187, "epoch": 3433} {"train_loss": -6.703962802886963, "global_step": 144188, "epoch": 3433} {"train_loss": -6.8137359619140625, "global_step": 144189, "epoch": 3433} {"train_loss": -6.71280574798584, "global_step": 144190, "epoch": 3433} {"train_loss": -6.731050491333008, "global_step": 144191, "epoch": 3433} {"train_loss": -6.772294998168945, "global_step": 144192, "epoch": 3433} {"train_loss": -6.74196195602417, "global_step": 144193, "epoch": 3433} {"train_loss": -6.747140884399414, "global_step": 144194, "epoch": 3433} {"train_loss": -6.646911144256592, "global_step": 144195, "epoch": 3433} {"train_loss": -6.705682754516602, "global_step": 144196, "epoch": 3433} {"train_loss": -6.7536516189575195, "global_step": 144197, "epoch": 3433} {"train_loss": -6.604907989501953, "global_step": 144198, "epoch": 3433} {"train_loss": -6.731507301330566, "global_step": 144199, "epoch": 3433} {"train_loss": -6.611159324645996, "global_step": 144200, "epoch": 3433} {"train_loss": -6.749752044677734, "global_step": 144201, "epoch": 3433} {"train_loss": -6.700702667236328, "global_step": 144202, "epoch": 3433} {"train_loss": -6.701634883880615, "global_step": 144203, "epoch": 3433} {"train_loss": -6.7690935134887695, "global_step": 144204, "epoch": 3433} {"train_loss": -6.667413711547852, "global_step": 144205, "epoch": 3433} {"train_loss": -6.718587875366211, "global_step": 144206, "epoch": 3433} {"train_loss": -6.7580180168151855, "global_step": 144207, "epoch": 3433} {"train_loss": -6.732813835144043, "global_step": 144208, "epoch": 3433} {"train_loss": -6.592960357666016, "global_step": 144209, "epoch": 3433} {"train_loss": -6.799310207366943, "global_step": 144210, "epoch": 3433} {"train_loss": -6.656006813049316, "global_step": 144211, "epoch": 3433} {"train_loss": -6.739896774291992, "global_step": 144212, "epoch": 3433} {"train_loss": -6.620882987976074, "global_step": 144213, "epoch": 3433} {"train_loss": -6.792400360107422, "global_step": 144214, "epoch": 3433} {"train_loss": -6.674783706665039, "global_step": 144215, "epoch": 3433} {"train_loss": -6.629948616027832, "global_step": 144216, "epoch": 3433} {"train_loss": -6.835562229156494, "global_step": 144217, "epoch": 3433} {"train_loss": -6.729727745056152, "global_step": 144218, "epoch": 3433} {"train_loss": -6.769135475158691, "global_step": 144219, "epoch": 3433} {"train_loss": -6.7501630783081055, "global_step": 144220, "epoch": 3433} {"train_loss": -6.735055446624756, "global_step": 144221, "epoch": 3433} {"train_loss": -6.831042289733887, "global_step": 144222, "epoch": 3433} {"train_loss": -6.758793354034424, "global_step": 144223, "epoch": 3433} {"train_loss": -6.749976634979248, "global_step": 144224, "epoch": 3433} {"train_loss": -6.767215251922607, "global_step": 144225, "epoch": 3433} {"train_loss": -6.688228607177734, "global_step": 144226, "epoch": 3433} {"train_loss": -6.726365747905913, "global_step": 144227, "epoch": 3433, "val_loss": 68458.734375} {"train_loss": -6.734234809875488, "global_step": 144228, "epoch": 3434} {"train_loss": -6.773930072784424, "global_step": 144229, "epoch": 3434} {"train_loss": -6.853841304779053, "global_step": 144230, "epoch": 3434} {"train_loss": -6.6263041496276855, "global_step": 144231, "epoch": 3434} {"train_loss": -6.8061676025390625, "global_step": 144232, "epoch": 3434} {"train_loss": -6.695479393005371, "global_step": 144233, "epoch": 3434} {"train_loss": -6.718199729919434, "global_step": 144234, "epoch": 3434} {"train_loss": -6.8318634033203125, "global_step": 144235, "epoch": 3434} {"train_loss": -6.709863662719727, "global_step": 144236, "epoch": 3434} {"train_loss": -6.7491865158081055, "global_step": 144237, "epoch": 3434} {"train_loss": -6.711529731750488, "global_step": 144238, "epoch": 3434} {"train_loss": -6.672223091125488, "global_step": 144239, "epoch": 3434} {"train_loss": -6.789696216583252, "global_step": 144240, "epoch": 3434} {"train_loss": -6.748437881469727, "global_step": 144241, "epoch": 3434} {"train_loss": -6.796648979187012, "global_step": 144242, "epoch": 3434} {"train_loss": -6.833682060241699, "global_step": 144243, "epoch": 3434} {"train_loss": -6.77162504196167, "global_step": 144244, "epoch": 3434} {"train_loss": -6.702399253845215, "global_step": 144245, "epoch": 3434} {"train_loss": -6.7617950439453125, "global_step": 144246, "epoch": 3434} {"train_loss": -6.740496635437012, "global_step": 144247, "epoch": 3434} {"train_loss": -6.805468559265137, "global_step": 144248, "epoch": 3434} {"train_loss": -6.678854465484619, "global_step": 144249, "epoch": 3434} {"train_loss": -6.766098499298096, "global_step": 144250, "epoch": 3434} {"train_loss": -6.882767677307129, "global_step": 144251, "epoch": 3434} {"train_loss": -6.738752365112305, "global_step": 144252, "epoch": 3434} {"train_loss": -6.698292255401611, "global_step": 144253, "epoch": 3434} {"train_loss": -6.867623329162598, "global_step": 144254, "epoch": 3434} {"train_loss": -6.805723667144775, "global_step": 144255, "epoch": 3434} {"train_loss": -6.809226036071777, "global_step": 144256, "epoch": 3434} {"train_loss": -6.825146675109863, "global_step": 144257, "epoch": 3434} {"train_loss": -6.814043045043945, "global_step": 144258, "epoch": 3434} {"train_loss": -6.886861801147461, "global_step": 144259, "epoch": 3434} {"train_loss": -6.835518836975098, "global_step": 144260, "epoch": 3434} {"train_loss": -6.714374542236328, "global_step": 144261, "epoch": 3434} {"train_loss": -6.807154655456543, "global_step": 144262, "epoch": 3434} {"train_loss": -6.862469673156738, "global_step": 144263, "epoch": 3434} {"train_loss": -6.715108871459961, "global_step": 144264, "epoch": 3434} {"train_loss": -6.816516399383545, "global_step": 144265, "epoch": 3434} {"train_loss": -6.680395126342773, "global_step": 144266, "epoch": 3434} {"train_loss": -6.745532035827637, "global_step": 144267, "epoch": 3434} {"train_loss": -6.763584136962891, "global_step": 144268, "epoch": 3434} {"train_loss": -6.768559285572597, "global_step": 144269, "epoch": 3434, "val_loss": 68454.984375} {"train_loss": -6.761867523193359, "global_step": 144270, "epoch": 3435} {"train_loss": -6.879832744598389, "global_step": 144271, "epoch": 3435} {"train_loss": -6.721062660217285, "global_step": 144272, "epoch": 3435} {"train_loss": -6.82515287399292, "global_step": 144273, "epoch": 3435} {"train_loss": -6.5908637046813965, "global_step": 144274, "epoch": 3435} {"train_loss": -6.694412708282471, "global_step": 144275, "epoch": 3435} {"train_loss": -6.653510093688965, "global_step": 144276, "epoch": 3435} {"train_loss": -6.720252990722656, "global_step": 144277, "epoch": 3435} {"train_loss": -6.809366703033447, "global_step": 144278, "epoch": 3435} {"train_loss": -6.633533477783203, "global_step": 144279, "epoch": 3435} {"train_loss": -6.755069732666016, "global_step": 144280, "epoch": 3435} {"train_loss": -6.640576362609863, "global_step": 144281, "epoch": 3435} {"train_loss": -6.747631549835205, "global_step": 144282, "epoch": 3435} {"train_loss": -6.791006088256836, "global_step": 144283, "epoch": 3435} {"train_loss": -6.693599700927734, "global_step": 144284, "epoch": 3435} {"train_loss": -6.768838882446289, "global_step": 144285, "epoch": 3435} {"train_loss": -6.690645217895508, "global_step": 144286, "epoch": 3435} {"train_loss": -6.693972110748291, "global_step": 144287, "epoch": 3435} {"train_loss": -6.884125709533691, "global_step": 144288, "epoch": 3435} {"train_loss": -6.781745910644531, "global_step": 144289, "epoch": 3435} {"train_loss": -6.897276878356934, "global_step": 144290, "epoch": 3435} {"train_loss": -6.703056812286377, "global_step": 144291, "epoch": 3435} {"train_loss": -6.762935161590576, "global_step": 144292, "epoch": 3435} {"train_loss": -6.850068092346191, "global_step": 144293, "epoch": 3435} {"train_loss": -6.77492618560791, "global_step": 144294, "epoch": 3435} {"train_loss": -6.669517517089844, "global_step": 144295, "epoch": 3435} {"train_loss": -6.808479309082031, "global_step": 144296, "epoch": 3435} {"train_loss": -6.903831481933594, "global_step": 144297, "epoch": 3435} {"train_loss": -6.8083720207214355, "global_step": 144298, "epoch": 3435} {"train_loss": -6.862155914306641, "global_step": 144299, "epoch": 3435} {"train_loss": -6.767696380615234, "global_step": 144300, "epoch": 3435} {"train_loss": -6.805665016174316, "global_step": 144301, "epoch": 3435} {"train_loss": -6.8112993240356445, "global_step": 144302, "epoch": 3435} {"train_loss": -6.640280723571777, "global_step": 144303, "epoch": 3435} {"train_loss": -6.798675060272217, "global_step": 144304, "epoch": 3435} {"train_loss": -6.858560562133789, "global_step": 144305, "epoch": 3435} {"train_loss": -6.773582458496094, "global_step": 144306, "epoch": 3435} {"train_loss": -6.803203582763672, "global_step": 144307, "epoch": 3435} {"train_loss": -6.820461273193359, "global_step": 144308, "epoch": 3435} {"train_loss": -6.770825386047363, "global_step": 144309, "epoch": 3435} {"train_loss": -6.872093200683594, "global_step": 144310, "epoch": 3435} {"train_loss": -6.769670384270804, "global_step": 144311, "epoch": 3435, "val_loss": 68343.8046875} {"train_loss": -6.930124759674072, "global_step": 144312, "epoch": 3436} {"train_loss": -6.79217004776001, "global_step": 144313, "epoch": 3436} {"train_loss": -6.859709739685059, "global_step": 144314, "epoch": 3436} {"train_loss": -6.833151817321777, "global_step": 144315, "epoch": 3436} {"train_loss": -6.876529693603516, "global_step": 144316, "epoch": 3436} {"train_loss": -6.76508903503418, "global_step": 144317, "epoch": 3436} {"train_loss": -6.929050445556641, "global_step": 144318, "epoch": 3436} {"train_loss": -6.909258842468262, "global_step": 144319, "epoch": 3436} {"train_loss": -6.725612640380859, "global_step": 144320, "epoch": 3436} {"train_loss": -6.776851654052734, "global_step": 144321, "epoch": 3436} {"train_loss": -6.809544563293457, "global_step": 144322, "epoch": 3436} {"train_loss": -6.845134735107422, "global_step": 144323, "epoch": 3436} {"train_loss": -6.84998893737793, "global_step": 144324, "epoch": 3436} {"train_loss": -6.88303804397583, "global_step": 144325, "epoch": 3436} {"train_loss": -6.736166000366211, "global_step": 144326, "epoch": 3436} {"train_loss": -6.775674819946289, "global_step": 144327, "epoch": 3436} {"train_loss": -6.723883628845215, "global_step": 144328, "epoch": 3436} {"train_loss": -6.689072608947754, "global_step": 144329, "epoch": 3436} {"train_loss": -6.77305269241333, "global_step": 144330, "epoch": 3436} {"train_loss": -6.863317012786865, "global_step": 144331, "epoch": 3436} {"train_loss": -6.947094917297363, "global_step": 144332, "epoch": 3436} {"train_loss": -6.8599443435668945, "global_step": 144333, "epoch": 3436} {"train_loss": -6.905958652496338, "global_step": 144334, "epoch": 3436} {"train_loss": -6.892561435699463, "global_step": 144335, "epoch": 3436} {"train_loss": -6.833601951599121, "global_step": 144336, "epoch": 3436} {"train_loss": -6.76524543762207, "global_step": 144337, "epoch": 3436} {"train_loss": -6.7415361404418945, "global_step": 144338, "epoch": 3436} {"train_loss": -6.817873477935791, "global_step": 144339, "epoch": 3436} {"train_loss": -6.886442184448242, "global_step": 144340, "epoch": 3436} {"train_loss": -6.771579742431641, "global_step": 144341, "epoch": 3436} {"train_loss": -6.591209411621094, "global_step": 144342, "epoch": 3436} {"train_loss": -6.753537178039551, "global_step": 144343, "epoch": 3436} {"train_loss": -6.750383377075195, "global_step": 144344, "epoch": 3436} {"train_loss": -6.577516555786133, "global_step": 144345, "epoch": 3436} {"train_loss": -6.731749534606934, "global_step": 144346, "epoch": 3436} {"train_loss": -6.688729286193848, "global_step": 144347, "epoch": 3436} {"train_loss": -6.58723258972168, "global_step": 144348, "epoch": 3436} {"train_loss": -6.659000396728516, "global_step": 144349, "epoch": 3436} {"train_loss": -6.646161079406738, "global_step": 144350, "epoch": 3436} {"train_loss": -6.797562599182129, "global_step": 144351, "epoch": 3436} {"train_loss": -6.730227470397949, "global_step": 144352, "epoch": 3436} {"train_loss": -6.780669007982526, "global_step": 144353, "epoch": 3436, "val_loss": 68707.1640625} {"train_loss": -6.7016754150390625, "global_step": 144354, "epoch": 3437} {"train_loss": -6.744460105895996, "global_step": 144355, "epoch": 3437} {"train_loss": -6.731176853179932, "global_step": 144356, "epoch": 3437} {"train_loss": -6.756268501281738, "global_step": 144357, "epoch": 3437} {"train_loss": -6.681675434112549, "global_step": 144358, "epoch": 3437} {"train_loss": -6.704326629638672, "global_step": 144359, "epoch": 3437} {"train_loss": -6.655023097991943, "global_step": 144360, "epoch": 3437} {"train_loss": -6.720334053039551, "global_step": 144361, "epoch": 3437} {"train_loss": -6.578728675842285, "global_step": 144362, "epoch": 3437} {"train_loss": -6.687921524047852, "global_step": 144363, "epoch": 3437} {"train_loss": -6.6281304359436035, "global_step": 144364, "epoch": 3437} {"train_loss": -6.656291961669922, "global_step": 144365, "epoch": 3437} {"train_loss": -6.695131301879883, "global_step": 144366, "epoch": 3437} {"train_loss": -6.630241870880127, "global_step": 144367, "epoch": 3437} {"train_loss": -6.717929840087891, "global_step": 144368, "epoch": 3437} {"train_loss": -6.752671241760254, "global_step": 144369, "epoch": 3437} {"train_loss": -6.643521785736084, "global_step": 144370, "epoch": 3437} {"train_loss": -6.748664379119873, "global_step": 144371, "epoch": 3437} {"train_loss": -6.823671340942383, "global_step": 144372, "epoch": 3437} {"train_loss": -6.7615966796875, "global_step": 144373, "epoch": 3437} {"train_loss": -6.794322490692139, "global_step": 144374, "epoch": 3437} {"train_loss": -6.748490333557129, "global_step": 144375, "epoch": 3437} {"train_loss": -6.838937282562256, "global_step": 144376, "epoch": 3437} {"train_loss": -6.6902289390563965, "global_step": 144377, "epoch": 3437} {"train_loss": -6.790943145751953, "global_step": 144378, "epoch": 3437} {"train_loss": -6.77424430847168, "global_step": 144379, "epoch": 3437} {"train_loss": -6.706695556640625, "global_step": 144380, "epoch": 3437} {"train_loss": -6.749903202056885, "global_step": 144381, "epoch": 3437} {"train_loss": -6.79090690612793, "global_step": 144382, "epoch": 3437} {"train_loss": -6.696766376495361, "global_step": 144383, "epoch": 3437} {"train_loss": -6.727568626403809, "global_step": 144384, "epoch": 3437} {"train_loss": -6.628064155578613, "global_step": 144385, "epoch": 3437} {"train_loss": -6.710956573486328, "global_step": 144386, "epoch": 3437} {"train_loss": -6.625560283660889, "global_step": 144387, "epoch": 3437} {"train_loss": -6.720972537994385, "global_step": 144388, "epoch": 3437} {"train_loss": -6.729621410369873, "global_step": 144389, "epoch": 3437} {"train_loss": -6.726393222808838, "global_step": 144390, "epoch": 3437} {"train_loss": -6.6914567947387695, "global_step": 144391, "epoch": 3437} {"train_loss": -6.513033866882324, "global_step": 144392, "epoch": 3437} {"train_loss": -6.7152605056762695, "global_step": 144393, "epoch": 3437} {"train_loss": -6.670538902282715, "global_step": 144394, "epoch": 3437} {"train_loss": -6.711580719266619, "global_step": 144395, "epoch": 3437, "val_loss": 68439.640625} {"train_loss": -6.754613876342773, "global_step": 144396, "epoch": 3438} {"train_loss": -6.661073207855225, "global_step": 144397, "epoch": 3438} {"train_loss": -6.707223892211914, "global_step": 144398, "epoch": 3438} {"train_loss": -6.7006096839904785, "global_step": 144399, "epoch": 3438} {"train_loss": -6.545864105224609, "global_step": 144400, "epoch": 3438} {"train_loss": -6.763223648071289, "global_step": 144401, "epoch": 3438} {"train_loss": -6.663327693939209, "global_step": 144402, "epoch": 3438} {"train_loss": -6.594843864440918, "global_step": 144403, "epoch": 3438} {"train_loss": -6.724206924438477, "global_step": 144404, "epoch": 3438} {"train_loss": -6.7287187576293945, "global_step": 144405, "epoch": 3438} {"train_loss": -6.7108635902404785, "global_step": 144406, "epoch": 3438} {"train_loss": -6.697139739990234, "global_step": 144407, "epoch": 3438} {"train_loss": -6.679108619689941, "global_step": 144408, "epoch": 3438} {"train_loss": -6.607374668121338, "global_step": 144409, "epoch": 3438} {"train_loss": -6.683698654174805, "global_step": 144410, "epoch": 3438} {"train_loss": -6.733737945556641, "global_step": 144411, "epoch": 3438} {"train_loss": -6.689055442810059, "global_step": 144412, "epoch": 3438} {"train_loss": -6.712267875671387, "global_step": 144413, "epoch": 3438} {"train_loss": -6.5781402587890625, "global_step": 144414, "epoch": 3438} {"train_loss": -6.702880382537842, "global_step": 144415, "epoch": 3438} {"train_loss": -6.716054916381836, "global_step": 144416, "epoch": 3438} {"train_loss": -6.605382919311523, "global_step": 144417, "epoch": 3438} {"train_loss": -6.700653553009033, "global_step": 144418, "epoch": 3438} {"train_loss": -6.770793914794922, "global_step": 144419, "epoch": 3438} {"train_loss": -6.763811111450195, "global_step": 144420, "epoch": 3438} {"train_loss": -6.702391624450684, "global_step": 144421, "epoch": 3438} {"train_loss": -6.599884033203125, "global_step": 144422, "epoch": 3438} {"train_loss": -6.75261116027832, "global_step": 144423, "epoch": 3438} {"train_loss": -6.819456577301025, "global_step": 144424, "epoch": 3438} {"train_loss": -6.843484878540039, "global_step": 144425, "epoch": 3438} {"train_loss": -6.791301727294922, "global_step": 144426, "epoch": 3438} {"train_loss": -6.716377258300781, "global_step": 144427, "epoch": 3438} {"train_loss": -6.741779804229736, "global_step": 144428, "epoch": 3438} {"train_loss": -6.750722408294678, "global_step": 144429, "epoch": 3438} {"train_loss": -6.769375801086426, "global_step": 144430, "epoch": 3438} {"train_loss": -6.778790473937988, "global_step": 144431, "epoch": 3438} {"train_loss": -6.831975936889648, "global_step": 144432, "epoch": 3438} {"train_loss": -6.813289165496826, "global_step": 144433, "epoch": 3438} {"train_loss": -6.8292155265808105, "global_step": 144434, "epoch": 3438} {"train_loss": -6.786351203918457, "global_step": 144435, "epoch": 3438} {"train_loss": -6.691208362579346, "global_step": 144436, "epoch": 3438} {"train_loss": -6.720093397867112, "global_step": 144437, "epoch": 3438, "val_loss": 68410.2734375} {"train_loss": -6.778020858764648, "global_step": 144438, "epoch": 3439} {"train_loss": -6.866474151611328, "global_step": 144439, "epoch": 3439} {"train_loss": -6.700944423675537, "global_step": 144440, "epoch": 3439} {"train_loss": -6.800893306732178, "global_step": 144441, "epoch": 3439} {"train_loss": -6.7259745597839355, "global_step": 144442, "epoch": 3439} {"train_loss": -6.677145004272461, "global_step": 144443, "epoch": 3439} {"train_loss": -6.778759002685547, "global_step": 144444, "epoch": 3439} {"train_loss": -6.723194122314453, "global_step": 144445, "epoch": 3439} {"train_loss": -6.750638008117676, "global_step": 144446, "epoch": 3439} {"train_loss": -6.921778678894043, "global_step": 144447, "epoch": 3439} {"train_loss": -6.741094589233398, "global_step": 144448, "epoch": 3439} {"train_loss": -6.72679328918457, "global_step": 144449, "epoch": 3439} {"train_loss": -6.843811988830566, "global_step": 144450, "epoch": 3439} {"train_loss": -6.870330810546875, "global_step": 144451, "epoch": 3439} {"train_loss": -6.797269821166992, "global_step": 144452, "epoch": 3439} {"train_loss": -6.777427673339844, "global_step": 144453, "epoch": 3439} {"train_loss": -6.783923149108887, "global_step": 144454, "epoch": 3439} {"train_loss": -6.727019309997559, "global_step": 144455, "epoch": 3439} {"train_loss": -6.775596618652344, "global_step": 144456, "epoch": 3439} {"train_loss": -6.684328556060791, "global_step": 144457, "epoch": 3439} {"train_loss": -6.729825019836426, "global_step": 144458, "epoch": 3439} {"train_loss": -6.852752208709717, "global_step": 144459, "epoch": 3439} {"train_loss": -6.645617485046387, "global_step": 144460, "epoch": 3439} {"train_loss": -6.77943229675293, "global_step": 144461, "epoch": 3439} {"train_loss": -6.73500919342041, "global_step": 144462, "epoch": 3439} {"train_loss": -6.551664352416992, "global_step": 144463, "epoch": 3439} {"train_loss": -6.8667497634887695, "global_step": 144464, "epoch": 3439} {"train_loss": -6.653535842895508, "global_step": 144465, "epoch": 3439} {"train_loss": -6.7532758712768555, "global_step": 144466, "epoch": 3439} {"train_loss": -6.720339775085449, "global_step": 144467, "epoch": 3439} {"train_loss": -6.603966236114502, "global_step": 144468, "epoch": 3439} {"train_loss": -6.8685173988342285, "global_step": 144469, "epoch": 3439} {"train_loss": -6.711922645568848, "global_step": 144470, "epoch": 3439} {"train_loss": -6.807419300079346, "global_step": 144471, "epoch": 3439} {"train_loss": -6.702993869781494, "global_step": 144472, "epoch": 3439} {"train_loss": -6.848824501037598, "global_step": 144473, "epoch": 3439} {"train_loss": -6.717165946960449, "global_step": 144474, "epoch": 3439} {"train_loss": -6.6400041580200195, "global_step": 144475, "epoch": 3439} {"train_loss": -6.74765157699585, "global_step": 144476, "epoch": 3439} {"train_loss": -6.777602195739746, "global_step": 144477, "epoch": 3439} {"train_loss": -6.736601829528809, "global_step": 144478, "epoch": 3439} {"train_loss": -6.751708859489078, "global_step": 144479, "epoch": 3439, "val_loss": 68231.90625} {"train_loss": -6.802788734436035, "global_step": 144480, "epoch": 3440} {"train_loss": -6.729320526123047, "global_step": 144481, "epoch": 3440} {"train_loss": -6.747222423553467, "global_step": 144482, "epoch": 3440} {"train_loss": -6.76518440246582, "global_step": 144483, "epoch": 3440} {"train_loss": -6.715217113494873, "global_step": 144484, "epoch": 3440} {"train_loss": -6.663243293762207, "global_step": 144485, "epoch": 3440} {"train_loss": -6.847570419311523, "global_step": 144486, "epoch": 3440} {"train_loss": -6.798114776611328, "global_step": 144487, "epoch": 3440} {"train_loss": -6.705031394958496, "global_step": 144488, "epoch": 3440} {"train_loss": -6.671926021575928, "global_step": 144489, "epoch": 3440} {"train_loss": -6.682385444641113, "global_step": 144490, "epoch": 3440} {"train_loss": -6.762111663818359, "global_step": 144491, "epoch": 3440} {"train_loss": -6.843151569366455, "global_step": 144492, "epoch": 3440} {"train_loss": -6.74839448928833, "global_step": 144493, "epoch": 3440} {"train_loss": -6.817421913146973, "global_step": 144494, "epoch": 3440} {"train_loss": -6.776686191558838, "global_step": 144495, "epoch": 3440} {"train_loss": -6.783973693847656, "global_step": 144496, "epoch": 3440} {"train_loss": -6.842267036437988, "global_step": 144497, "epoch": 3440} {"train_loss": -6.778571128845215, "global_step": 144498, "epoch": 3440} {"train_loss": -6.77839994430542, "global_step": 144499, "epoch": 3440} {"train_loss": -6.819942474365234, "global_step": 144500, "epoch": 3440} {"train_loss": -6.719363212585449, "global_step": 144501, "epoch": 3440} {"train_loss": -6.813047409057617, "global_step": 144502, "epoch": 3440} {"train_loss": -6.7816243171691895, "global_step": 144503, "epoch": 3440} {"train_loss": -6.779915809631348, "global_step": 144504, "epoch": 3440} {"train_loss": -6.641233921051025, "global_step": 144505, "epoch": 3440} {"train_loss": -6.689986228942871, "global_step": 144506, "epoch": 3440} {"train_loss": -6.8782243728637695, "global_step": 144507, "epoch": 3440} {"train_loss": -6.729927062988281, "global_step": 144508, "epoch": 3440} {"train_loss": -6.68546199798584, "global_step": 144509, "epoch": 3440} {"train_loss": -6.757479667663574, "global_step": 144510, "epoch": 3440} {"train_loss": -6.807639122009277, "global_step": 144511, "epoch": 3440} {"train_loss": -6.776894569396973, "global_step": 144512, "epoch": 3440} {"train_loss": -6.836626052856445, "global_step": 144513, "epoch": 3440} {"train_loss": -6.649848937988281, "global_step": 144514, "epoch": 3440} {"train_loss": -6.679023742675781, "global_step": 144515, "epoch": 3440} {"train_loss": -6.782525062561035, "global_step": 144516, "epoch": 3440} {"train_loss": -6.635309219360352, "global_step": 144517, "epoch": 3440} {"train_loss": -6.79484748840332, "global_step": 144518, "epoch": 3440} {"train_loss": -6.887378692626953, "global_step": 144519, "epoch": 3440} {"train_loss": -6.80836820602417, "global_step": 144520, "epoch": 3440} {"train_loss": -6.761098384857178, "global_step": 144521, "epoch": 3440, "val_loss": 68587.7734375} {"train_loss": -6.7404680252075195, "global_step": 144522, "epoch": 3441} {"train_loss": -6.778933525085449, "global_step": 144523, "epoch": 3441} {"train_loss": -6.711659908294678, "global_step": 144524, "epoch": 3441} {"train_loss": -6.718451499938965, "global_step": 144525, "epoch": 3441} {"train_loss": -6.754952430725098, "global_step": 144526, "epoch": 3441} {"train_loss": -6.62796688079834, "global_step": 144527, "epoch": 3441} {"train_loss": -6.773502349853516, "global_step": 144528, "epoch": 3441} {"train_loss": -6.856765270233154, "global_step": 144529, "epoch": 3441} {"train_loss": -6.750614166259766, "global_step": 144530, "epoch": 3441} {"train_loss": -6.752145290374756, "global_step": 144531, "epoch": 3441} {"train_loss": -6.657418251037598, "global_step": 144532, "epoch": 3441} {"train_loss": -6.705281734466553, "global_step": 144533, "epoch": 3441} {"train_loss": -6.774534702301025, "global_step": 144534, "epoch": 3441} {"train_loss": -6.657459259033203, "global_step": 144535, "epoch": 3441} {"train_loss": -6.753357887268066, "global_step": 144536, "epoch": 3441} {"train_loss": -6.702399253845215, "global_step": 144537, "epoch": 3441} {"train_loss": -6.711574554443359, "global_step": 144538, "epoch": 3441} {"train_loss": -6.7578887939453125, "global_step": 144539, "epoch": 3441} {"train_loss": -6.706411361694336, "global_step": 144540, "epoch": 3441} {"train_loss": -6.757080554962158, "global_step": 144541, "epoch": 3441} {"train_loss": -6.72283411026001, "global_step": 144542, "epoch": 3441} {"train_loss": -6.682047367095947, "global_step": 144543, "epoch": 3441} {"train_loss": -6.822990417480469, "global_step": 144544, "epoch": 3441} {"train_loss": -6.677506446838379, "global_step": 144545, "epoch": 3441} {"train_loss": -6.683002948760986, "global_step": 144546, "epoch": 3441} {"train_loss": -6.711325645446777, "global_step": 144547, "epoch": 3441} {"train_loss": -6.859328269958496, "global_step": 144548, "epoch": 3441} {"train_loss": -6.695310592651367, "global_step": 144549, "epoch": 3441} {"train_loss": -6.7190752029418945, "global_step": 144550, "epoch": 3441} {"train_loss": -6.7201104164123535, "global_step": 144551, "epoch": 3441} {"train_loss": -6.8556671142578125, "global_step": 144552, "epoch": 3441} {"train_loss": -6.76505184173584, "global_step": 144553, "epoch": 3441} {"train_loss": -6.812155723571777, "global_step": 144554, "epoch": 3441} {"train_loss": -6.731297492980957, "global_step": 144555, "epoch": 3441} {"train_loss": -6.724582672119141, "global_step": 144556, "epoch": 3441} {"train_loss": -6.791140556335449, "global_step": 144557, "epoch": 3441} {"train_loss": -6.722141265869141, "global_step": 144558, "epoch": 3441} {"train_loss": -6.6631011962890625, "global_step": 144559, "epoch": 3441} {"train_loss": -6.65407657623291, "global_step": 144560, "epoch": 3441} {"train_loss": -6.734580039978027, "global_step": 144561, "epoch": 3441} {"train_loss": -6.920770168304443, "global_step": 144562, "epoch": 3441} {"train_loss": -6.740960268747239, "global_step": 144563, "epoch": 3441, "val_loss": 68100.265625} {"train_loss": -6.8163557052612305, "global_step": 144564, "epoch": 3442} {"train_loss": -6.68935489654541, "global_step": 144565, "epoch": 3442} {"train_loss": -6.712442874908447, "global_step": 144566, "epoch": 3442} {"train_loss": -6.755908489227295, "global_step": 144567, "epoch": 3442} {"train_loss": -6.6478166580200195, "global_step": 144568, "epoch": 3442} {"train_loss": -6.86302375793457, "global_step": 144569, "epoch": 3442} {"train_loss": -6.742744445800781, "global_step": 144570, "epoch": 3442} {"train_loss": -6.737748146057129, "global_step": 144571, "epoch": 3442} {"train_loss": -6.728717803955078, "global_step": 144572, "epoch": 3442} {"train_loss": -6.802972793579102, "global_step": 144573, "epoch": 3442} {"train_loss": -6.722679138183594, "global_step": 144574, "epoch": 3442} {"train_loss": -6.839017391204834, "global_step": 144575, "epoch": 3442} {"train_loss": -6.78041934967041, "global_step": 144576, "epoch": 3442} {"train_loss": -6.727174758911133, "global_step": 144577, "epoch": 3442} {"train_loss": -6.671053409576416, "global_step": 144578, "epoch": 3442} {"train_loss": -6.6546711921691895, "global_step": 144579, "epoch": 3442} {"train_loss": -6.84907865524292, "global_step": 144580, "epoch": 3442} {"train_loss": -6.69882869720459, "global_step": 144581, "epoch": 3442} {"train_loss": -6.831775665283203, "global_step": 144582, "epoch": 3442} {"train_loss": -6.714776515960693, "global_step": 144583, "epoch": 3442} {"train_loss": -6.796023368835449, "global_step": 144584, "epoch": 3442} {"train_loss": -6.6137237548828125, "global_step": 144585, "epoch": 3442} {"train_loss": -6.813231468200684, "global_step": 144586, "epoch": 3442} {"train_loss": -6.666797161102295, "global_step": 144587, "epoch": 3442} {"train_loss": -6.658410549163818, "global_step": 144588, "epoch": 3442} {"train_loss": -6.864038944244385, "global_step": 144589, "epoch": 3442} {"train_loss": -6.718148231506348, "global_step": 144590, "epoch": 3442} {"train_loss": -6.746950626373291, "global_step": 144591, "epoch": 3442} {"train_loss": -6.710960388183594, "global_step": 144592, "epoch": 3442} {"train_loss": -6.830349445343018, "global_step": 144593, "epoch": 3442} {"train_loss": -6.817081451416016, "global_step": 144594, "epoch": 3442} {"train_loss": -6.661803245544434, "global_step": 144595, "epoch": 3442} {"train_loss": -6.718398571014404, "global_step": 144596, "epoch": 3442} {"train_loss": -6.691545009613037, "global_step": 144597, "epoch": 3442} {"train_loss": -6.80908727645874, "global_step": 144598, "epoch": 3442} {"train_loss": -6.715597629547119, "global_step": 144599, "epoch": 3442} {"train_loss": -6.721161842346191, "global_step": 144600, "epoch": 3442} {"train_loss": -6.800536155700684, "global_step": 144601, "epoch": 3442} {"train_loss": -6.7020769119262695, "global_step": 144602, "epoch": 3442} {"train_loss": -6.794607162475586, "global_step": 144603, "epoch": 3442} {"train_loss": -6.71401309967041, "global_step": 144604, "epoch": 3442} {"train_loss": -6.7418229920523505, "global_step": 144605, "epoch": 3442, "val_loss": 68445.21875} {"train_loss": -6.676614761352539, "global_step": 144606, "epoch": 3443} {"train_loss": -6.758624076843262, "global_step": 144607, "epoch": 3443} {"train_loss": -6.733660697937012, "global_step": 144608, "epoch": 3443} {"train_loss": -6.6454386711120605, "global_step": 144609, "epoch": 3443} {"train_loss": -6.751291751861572, "global_step": 144610, "epoch": 3443} {"train_loss": -6.788434982299805, "global_step": 144611, "epoch": 3443} {"train_loss": -6.729792594909668, "global_step": 144612, "epoch": 3443} {"train_loss": -6.639236927032471, "global_step": 144613, "epoch": 3443} {"train_loss": -6.768690586090088, "global_step": 144614, "epoch": 3443} {"train_loss": -6.758237838745117, "global_step": 144615, "epoch": 3443} {"train_loss": -6.714818477630615, "global_step": 144616, "epoch": 3443} {"train_loss": -6.781454086303711, "global_step": 144617, "epoch": 3443} {"train_loss": -6.71851921081543, "global_step": 144618, "epoch": 3443} {"train_loss": -6.782243728637695, "global_step": 144619, "epoch": 3443} {"train_loss": -6.800436973571777, "global_step": 144620, "epoch": 3443} {"train_loss": -6.763009071350098, "global_step": 144621, "epoch": 3443} {"train_loss": -6.809841632843018, "global_step": 144622, "epoch": 3443} {"train_loss": -6.802995681762695, "global_step": 144623, "epoch": 3443} {"train_loss": -6.723695755004883, "global_step": 144624, "epoch": 3443} {"train_loss": -6.798352241516113, "global_step": 144625, "epoch": 3443} {"train_loss": -6.850277423858643, "global_step": 144626, "epoch": 3443} {"train_loss": -6.6565117835998535, "global_step": 144627, "epoch": 3443} {"train_loss": -6.761782646179199, "global_step": 144628, "epoch": 3443} {"train_loss": -6.737761497497559, "global_step": 144629, "epoch": 3443} {"train_loss": -6.750505447387695, "global_step": 144630, "epoch": 3443} {"train_loss": -6.749730587005615, "global_step": 144631, "epoch": 3443} {"train_loss": -6.706071853637695, "global_step": 144632, "epoch": 3443} {"train_loss": -6.800997734069824, "global_step": 144633, "epoch": 3443} {"train_loss": -6.899256706237793, "global_step": 144634, "epoch": 3443} {"train_loss": -6.856725692749023, "global_step": 144635, "epoch": 3443} {"train_loss": -6.760165214538574, "global_step": 144636, "epoch": 3443} {"train_loss": -6.907716274261475, "global_step": 144637, "epoch": 3443} {"train_loss": -6.68568229675293, "global_step": 144638, "epoch": 3443} {"train_loss": -6.756614685058594, "global_step": 144639, "epoch": 3443} {"train_loss": -6.792960166931152, "global_step": 144640, "epoch": 3443} {"train_loss": -6.71599817276001, "global_step": 144641, "epoch": 3443} {"train_loss": -6.816580772399902, "global_step": 144642, "epoch": 3443} {"train_loss": -6.746739864349365, "global_step": 144643, "epoch": 3443} {"train_loss": -6.886512279510498, "global_step": 144644, "epoch": 3443} {"train_loss": -6.839638710021973, "global_step": 144645, "epoch": 3443} {"train_loss": -6.777716159820557, "global_step": 144646, "epoch": 3443} {"train_loss": -6.764344737643287, "global_step": 144647, "epoch": 3443, "val_loss": 68418.0} {"train_loss": -6.786068916320801, "global_step": 144648, "epoch": 3444} {"train_loss": -6.806816577911377, "global_step": 144649, "epoch": 3444} {"train_loss": -6.789798736572266, "global_step": 144650, "epoch": 3444} {"train_loss": -6.784800052642822, "global_step": 144651, "epoch": 3444} {"train_loss": -6.7585673332214355, "global_step": 144652, "epoch": 3444} {"train_loss": -6.809767723083496, "global_step": 144653, "epoch": 3444} {"train_loss": -6.898290634155273, "global_step": 144654, "epoch": 3444} {"train_loss": -6.640783786773682, "global_step": 144655, "epoch": 3444} {"train_loss": -6.915510177612305, "global_step": 144656, "epoch": 3444} {"train_loss": -6.794033050537109, "global_step": 144657, "epoch": 3444} {"train_loss": -6.748698711395264, "global_step": 144658, "epoch": 3444} {"train_loss": -6.858828067779541, "global_step": 144659, "epoch": 3444} {"train_loss": -6.725895881652832, "global_step": 144660, "epoch": 3444} {"train_loss": -6.789829254150391, "global_step": 144661, "epoch": 3444} {"train_loss": -6.815661430358887, "global_step": 144662, "epoch": 3444} {"train_loss": -6.748658180236816, "global_step": 144663, "epoch": 3444} {"train_loss": -6.670414447784424, "global_step": 144664, "epoch": 3444} {"train_loss": -6.860020637512207, "global_step": 144665, "epoch": 3444} {"train_loss": -6.801127910614014, "global_step": 144666, "epoch": 3444} {"train_loss": -6.69665002822876, "global_step": 144667, "epoch": 3444} {"train_loss": -6.738096237182617, "global_step": 144668, "epoch": 3444} {"train_loss": -6.700160980224609, "global_step": 144669, "epoch": 3444} {"train_loss": -6.7077226638793945, "global_step": 144670, "epoch": 3444} {"train_loss": -6.840443134307861, "global_step": 144671, "epoch": 3444} {"train_loss": -6.875473976135254, "global_step": 144672, "epoch": 3444} {"train_loss": -6.823160171508789, "global_step": 144673, "epoch": 3444} {"train_loss": -6.804680824279785, "global_step": 144674, "epoch": 3444} {"train_loss": -6.77954626083374, "global_step": 144675, "epoch": 3444} {"train_loss": -6.769304275512695, "global_step": 144676, "epoch": 3444} {"train_loss": -6.879743576049805, "global_step": 144677, "epoch": 3444} {"train_loss": -6.7763214111328125, "global_step": 144678, "epoch": 3444} {"train_loss": -6.872208595275879, "global_step": 144679, "epoch": 3444} {"train_loss": -6.801222801208496, "global_step": 144680, "epoch": 3444} {"train_loss": -6.799251556396484, "global_step": 144681, "epoch": 3444} {"train_loss": -6.673447608947754, "global_step": 144682, "epoch": 3444} {"train_loss": -6.70986270904541, "global_step": 144683, "epoch": 3444} {"train_loss": -6.8288679122924805, "global_step": 144684, "epoch": 3444} {"train_loss": -6.632903099060059, "global_step": 144685, "epoch": 3444} {"train_loss": -6.757201671600342, "global_step": 144686, "epoch": 3444} {"train_loss": -6.835773944854736, "global_step": 144687, "epoch": 3444} {"train_loss": -6.704883575439453, "global_step": 144688, "epoch": 3444} {"train_loss": -6.779894136247181, "global_step": 144689, "epoch": 3444, "val_loss": 68447.7578125} {"train_loss": -6.797155380249023, "global_step": 144690, "epoch": 3445} {"train_loss": -6.840553283691406, "global_step": 144691, "epoch": 3445} {"train_loss": -6.816612243652344, "global_step": 144692, "epoch": 3445} {"train_loss": -6.816716194152832, "global_step": 144693, "epoch": 3445} {"train_loss": -6.781960487365723, "global_step": 144694, "epoch": 3445} {"train_loss": -6.752425193786621, "global_step": 144695, "epoch": 3445} {"train_loss": -6.761506080627441, "global_step": 144696, "epoch": 3445} {"train_loss": -6.844823837280273, "global_step": 144697, "epoch": 3445} {"train_loss": -6.7178778648376465, "global_step": 144698, "epoch": 3445} {"train_loss": -6.631608486175537, "global_step": 144699, "epoch": 3445} {"train_loss": -6.893161773681641, "global_step": 144700, "epoch": 3445} {"train_loss": -6.808262825012207, "global_step": 144701, "epoch": 3445} {"train_loss": -6.6987504959106445, "global_step": 144702, "epoch": 3445} {"train_loss": -6.828651428222656, "global_step": 144703, "epoch": 3445} {"train_loss": -6.89045524597168, "global_step": 144704, "epoch": 3445} {"train_loss": -6.750335693359375, "global_step": 144705, "epoch": 3445} {"train_loss": -6.697270393371582, "global_step": 144706, "epoch": 3445} {"train_loss": -6.614569187164307, "global_step": 144707, "epoch": 3445} {"train_loss": -6.711154937744141, "global_step": 144708, "epoch": 3445} {"train_loss": -6.679024696350098, "global_step": 144709, "epoch": 3445} {"train_loss": -6.745316982269287, "global_step": 144710, "epoch": 3445} {"train_loss": -6.699877738952637, "global_step": 144711, "epoch": 3445} {"train_loss": -6.68233060836792, "global_step": 144712, "epoch": 3445} {"train_loss": -6.736980438232422, "global_step": 144713, "epoch": 3445} {"train_loss": -6.690553665161133, "global_step": 144714, "epoch": 3445} {"train_loss": -6.560097694396973, "global_step": 144715, "epoch": 3445} {"train_loss": -6.697505950927734, "global_step": 144716, "epoch": 3445} {"train_loss": -6.697793483734131, "global_step": 144717, "epoch": 3445} {"train_loss": -6.667610168457031, "global_step": 144718, "epoch": 3445} {"train_loss": -6.634064674377441, "global_step": 144719, "epoch": 3445} {"train_loss": -6.731997966766357, "global_step": 144720, "epoch": 3445} {"train_loss": -6.740695476531982, "global_step": 144721, "epoch": 3445} {"train_loss": -6.662027835845947, "global_step": 144722, "epoch": 3445} {"train_loss": -6.689428329467773, "global_step": 144723, "epoch": 3445} {"train_loss": -6.7045793533325195, "global_step": 144724, "epoch": 3445} {"train_loss": -6.682627201080322, "global_step": 144725, "epoch": 3445} {"train_loss": -6.667139053344727, "global_step": 144726, "epoch": 3445} {"train_loss": -6.596626281738281, "global_step": 144727, "epoch": 3445} {"train_loss": -6.806219100952148, "global_step": 144728, "epoch": 3445} {"train_loss": -6.814232349395752, "global_step": 144729, "epoch": 3445} {"train_loss": -6.635544300079346, "global_step": 144730, "epoch": 3445} {"train_loss": -6.727747803642636, "global_step": 144731, "epoch": 3445, "val_loss": 68315.1640625} {"train_loss": -6.805971145629883, "global_step": 144732, "epoch": 3446} {"train_loss": -6.760840892791748, "global_step": 144733, "epoch": 3446} {"train_loss": -6.837937831878662, "global_step": 144734, "epoch": 3446} {"train_loss": -6.841421127319336, "global_step": 144735, "epoch": 3446} {"train_loss": -6.720629692077637, "global_step": 144736, "epoch": 3446} {"train_loss": -6.742781639099121, "global_step": 144737, "epoch": 3446} {"train_loss": -6.770354747772217, "global_step": 144738, "epoch": 3446} {"train_loss": -6.794891834259033, "global_step": 144739, "epoch": 3446} {"train_loss": -6.838715553283691, "global_step": 144740, "epoch": 3446} {"train_loss": -6.80458927154541, "global_step": 144741, "epoch": 3446} {"train_loss": -6.825588226318359, "global_step": 144742, "epoch": 3446} {"train_loss": -6.700242042541504, "global_step": 144743, "epoch": 3446} {"train_loss": -6.7817769050598145, "global_step": 144744, "epoch": 3446} {"train_loss": -6.826057434082031, "global_step": 144745, "epoch": 3446} {"train_loss": -6.742184162139893, "global_step": 144746, "epoch": 3446} {"train_loss": -6.841333866119385, "global_step": 144747, "epoch": 3446} {"train_loss": -6.7670135498046875, "global_step": 144748, "epoch": 3446} {"train_loss": -6.817924499511719, "global_step": 144749, "epoch": 3446} {"train_loss": -6.736931800842285, "global_step": 144750, "epoch": 3446} {"train_loss": -6.903403282165527, "global_step": 144751, "epoch": 3446} {"train_loss": -6.856167793273926, "global_step": 144752, "epoch": 3446} {"train_loss": -6.871703624725342, "global_step": 144753, "epoch": 3446} {"train_loss": -6.72943115234375, "global_step": 144754, "epoch": 3446} {"train_loss": -6.752554416656494, "global_step": 144755, "epoch": 3446} {"train_loss": -6.8290839195251465, "global_step": 144756, "epoch": 3446} {"train_loss": -6.797482490539551, "global_step": 144757, "epoch": 3446} {"train_loss": -6.760847091674805, "global_step": 144758, "epoch": 3446} {"train_loss": -6.7532548904418945, "global_step": 144759, "epoch": 3446} {"train_loss": -6.710489273071289, "global_step": 144760, "epoch": 3446} {"train_loss": -6.693974494934082, "global_step": 144761, "epoch": 3446} {"train_loss": -6.837867736816406, "global_step": 144762, "epoch": 3446} {"train_loss": -6.821591377258301, "global_step": 144763, "epoch": 3446} {"train_loss": -6.862349987030029, "global_step": 144764, "epoch": 3446} {"train_loss": -6.847861289978027, "global_step": 144765, "epoch": 3446} {"train_loss": -6.63379430770874, "global_step": 144766, "epoch": 3446} {"train_loss": -6.890501976013184, "global_step": 144767, "epoch": 3446} {"train_loss": -6.699122905731201, "global_step": 144768, "epoch": 3446} {"train_loss": -6.680376052856445, "global_step": 144769, "epoch": 3446} {"train_loss": -6.702549934387207, "global_step": 144770, "epoch": 3446} {"train_loss": -6.781919479370117, "global_step": 144771, "epoch": 3446} {"train_loss": -6.846087455749512, "global_step": 144772, "epoch": 3446} {"train_loss": -6.782097237450736, "global_step": 144773, "epoch": 3446, "val_loss": 68419.9375} {"train_loss": -6.8444719314575195, "global_step": 144774, "epoch": 3447} {"train_loss": -6.733233451843262, "global_step": 144775, "epoch": 3447} {"train_loss": -6.7099127769470215, "global_step": 144776, "epoch": 3447} {"train_loss": -6.71785306930542, "global_step": 144777, "epoch": 3447} {"train_loss": -6.825611114501953, "global_step": 144778, "epoch": 3447} {"train_loss": -6.69727897644043, "global_step": 144779, "epoch": 3447} {"train_loss": -6.730842590332031, "global_step": 144780, "epoch": 3447} {"train_loss": -6.649972915649414, "global_step": 144781, "epoch": 3447} {"train_loss": -6.637266159057617, "global_step": 144782, "epoch": 3447} {"train_loss": -6.564740180969238, "global_step": 144783, "epoch": 3447} {"train_loss": -6.628260612487793, "global_step": 144784, "epoch": 3447} {"train_loss": -6.706202983856201, "global_step": 144785, "epoch": 3447} {"train_loss": -6.713936805725098, "global_step": 144786, "epoch": 3447} {"train_loss": -6.69561767578125, "global_step": 144787, "epoch": 3447} {"train_loss": -6.712251663208008, "global_step": 144788, "epoch": 3447} {"train_loss": -6.63492488861084, "global_step": 144789, "epoch": 3447} {"train_loss": -6.67427921295166, "global_step": 144790, "epoch": 3447} {"train_loss": -6.718602180480957, "global_step": 144791, "epoch": 3447} {"train_loss": -6.6713480949401855, "global_step": 144792, "epoch": 3447} {"train_loss": -6.748087406158447, "global_step": 144793, "epoch": 3447} {"train_loss": -6.7215166091918945, "global_step": 144794, "epoch": 3447} {"train_loss": -6.740653991699219, "global_step": 144795, "epoch": 3447} {"train_loss": -6.730467796325684, "global_step": 144796, "epoch": 3447} {"train_loss": -6.751811981201172, "global_step": 144797, "epoch": 3447} {"train_loss": -6.750019073486328, "global_step": 144798, "epoch": 3447} {"train_loss": -6.723561763763428, "global_step": 144799, "epoch": 3447} {"train_loss": -6.821451663970947, "global_step": 144800, "epoch": 3447} {"train_loss": -6.764176368713379, "global_step": 144801, "epoch": 3447} {"train_loss": -6.658251762390137, "global_step": 144802, "epoch": 3447} {"train_loss": -6.74119758605957, "global_step": 144803, "epoch": 3447} {"train_loss": -6.800081253051758, "global_step": 144804, "epoch": 3447} {"train_loss": -6.668384552001953, "global_step": 144805, "epoch": 3447} {"train_loss": -6.751333236694336, "global_step": 144806, "epoch": 3447} {"train_loss": -6.777987957000732, "global_step": 144807, "epoch": 3447} {"train_loss": -6.756657600402832, "global_step": 144808, "epoch": 3447} {"train_loss": -6.686161994934082, "global_step": 144809, "epoch": 3447} {"train_loss": -6.840229511260986, "global_step": 144810, "epoch": 3447} {"train_loss": -6.752045154571533, "global_step": 144811, "epoch": 3447} {"train_loss": -6.859962463378906, "global_step": 144812, "epoch": 3447} {"train_loss": -6.845330238342285, "global_step": 144813, "epoch": 3447} {"train_loss": -6.7822747230529785, "global_step": 144814, "epoch": 3447} {"train_loss": -6.732705207098098, "global_step": 144815, "epoch": 3447, "val_loss": 68324.3984375} {"train_loss": -6.760924816131592, "global_step": 144816, "epoch": 3448} {"train_loss": -6.883782386779785, "global_step": 144817, "epoch": 3448} {"train_loss": -6.816580772399902, "global_step": 144818, "epoch": 3448} {"train_loss": -6.838537216186523, "global_step": 144819, "epoch": 3448} {"train_loss": -6.8410563468933105, "global_step": 144820, "epoch": 3448} {"train_loss": -6.754544258117676, "global_step": 144821, "epoch": 3448} {"train_loss": -6.76043176651001, "global_step": 144822, "epoch": 3448} {"train_loss": -6.68842887878418, "global_step": 144823, "epoch": 3448} {"train_loss": -6.609706878662109, "global_step": 144824, "epoch": 3448} {"train_loss": -6.891427040100098, "global_step": 144825, "epoch": 3448} {"train_loss": -6.695234298706055, "global_step": 144826, "epoch": 3448} {"train_loss": -6.715290069580078, "global_step": 144827, "epoch": 3448} {"train_loss": -6.8196282386779785, "global_step": 144828, "epoch": 3448} {"train_loss": -6.753132343292236, "global_step": 144829, "epoch": 3448} {"train_loss": -6.697543621063232, "global_step": 144830, "epoch": 3448} {"train_loss": -6.83449649810791, "global_step": 144831, "epoch": 3448} {"train_loss": -6.829662322998047, "global_step": 144832, "epoch": 3448} {"train_loss": -6.7969651222229, "global_step": 144833, "epoch": 3448} {"train_loss": -6.773429870605469, "global_step": 144834, "epoch": 3448} {"train_loss": -6.757761001586914, "global_step": 144835, "epoch": 3448} {"train_loss": -6.692095756530762, "global_step": 144836, "epoch": 3448} {"train_loss": -6.587127685546875, "global_step": 144837, "epoch": 3448} {"train_loss": -6.838155746459961, "global_step": 144838, "epoch": 3448} {"train_loss": -6.760032653808594, "global_step": 144839, "epoch": 3448} {"train_loss": -6.761537551879883, "global_step": 144840, "epoch": 3448} {"train_loss": -6.836293697357178, "global_step": 144841, "epoch": 3448} {"train_loss": -6.838217735290527, "global_step": 144842, "epoch": 3448} {"train_loss": -6.793445587158203, "global_step": 144843, "epoch": 3448} {"train_loss": -6.840765476226807, "global_step": 144844, "epoch": 3448} {"train_loss": -6.832724571228027, "global_step": 144845, "epoch": 3448} {"train_loss": -6.725000858306885, "global_step": 144846, "epoch": 3448} {"train_loss": -6.709841728210449, "global_step": 144847, "epoch": 3448} {"train_loss": -6.785508155822754, "global_step": 144848, "epoch": 3448} {"train_loss": -6.916585922241211, "global_step": 144849, "epoch": 3448} {"train_loss": -6.789532661437988, "global_step": 144850, "epoch": 3448} {"train_loss": -6.825347900390625, "global_step": 144851, "epoch": 3448} {"train_loss": -6.858660697937012, "global_step": 144852, "epoch": 3448} {"train_loss": -6.63484001159668, "global_step": 144853, "epoch": 3448} {"train_loss": -6.707540512084961, "global_step": 144854, "epoch": 3448} {"train_loss": -6.710062503814697, "global_step": 144855, "epoch": 3448} {"train_loss": -6.833547592163086, "global_step": 144856, "epoch": 3448} {"train_loss": -6.775529872803461, "global_step": 144857, "epoch": 3448, "val_loss": 68493.109375} {"train_loss": -6.72210693359375, "global_step": 144858, "epoch": 3449} {"train_loss": -6.730005264282227, "global_step": 144859, "epoch": 3449} {"train_loss": -6.716691017150879, "global_step": 144860, "epoch": 3449} {"train_loss": -6.547428131103516, "global_step": 144861, "epoch": 3449} {"train_loss": -6.817405700683594, "global_step": 144862, "epoch": 3449} {"train_loss": -6.680557727813721, "global_step": 144863, "epoch": 3449} {"train_loss": -6.709615230560303, "global_step": 144864, "epoch": 3449} {"train_loss": -6.709470272064209, "global_step": 144865, "epoch": 3449} {"train_loss": -6.6343231201171875, "global_step": 144866, "epoch": 3449} {"train_loss": -6.7392048835754395, "global_step": 144867, "epoch": 3449} {"train_loss": -6.655230522155762, "global_step": 144868, "epoch": 3449} {"train_loss": -6.782975196838379, "global_step": 144869, "epoch": 3449} {"train_loss": -6.724560737609863, "global_step": 144870, "epoch": 3449} {"train_loss": -6.772814750671387, "global_step": 144871, "epoch": 3449} {"train_loss": -6.691310882568359, "global_step": 144872, "epoch": 3449} {"train_loss": -6.782650470733643, "global_step": 144873, "epoch": 3449} {"train_loss": -6.679286956787109, "global_step": 144874, "epoch": 3449} {"train_loss": -6.711170196533203, "global_step": 144875, "epoch": 3449} {"train_loss": -6.695369720458984, "global_step": 144876, "epoch": 3449} {"train_loss": -6.823007583618164, "global_step": 144877, "epoch": 3449} {"train_loss": -6.827140808105469, "global_step": 144878, "epoch": 3449} {"train_loss": -6.841442108154297, "global_step": 144879, "epoch": 3449} {"train_loss": -6.681180953979492, "global_step": 144880, "epoch": 3449} {"train_loss": -6.7938432693481445, "global_step": 144881, "epoch": 3449} {"train_loss": -6.787374496459961, "global_step": 144882, "epoch": 3449} {"train_loss": -6.756928443908691, "global_step": 144883, "epoch": 3449} {"train_loss": -6.795451641082764, "global_step": 144884, "epoch": 3449} {"train_loss": -6.7802019119262695, "global_step": 144885, "epoch": 3449} {"train_loss": -6.792848587036133, "global_step": 144886, "epoch": 3449} {"train_loss": -6.753489017486572, "global_step": 144887, "epoch": 3449} {"train_loss": -6.73712158203125, "global_step": 144888, "epoch": 3449} {"train_loss": -6.787319183349609, "global_step": 144889, "epoch": 3449} {"train_loss": -6.789666175842285, "global_step": 144890, "epoch": 3449} {"train_loss": -6.786738395690918, "global_step": 144891, "epoch": 3449} {"train_loss": -6.732892036437988, "global_step": 144892, "epoch": 3449} {"train_loss": -6.781863689422607, "global_step": 144893, "epoch": 3449} {"train_loss": -6.672451496124268, "global_step": 144894, "epoch": 3449} {"train_loss": -6.793107986450195, "global_step": 144895, "epoch": 3449} {"train_loss": -6.6793928146362305, "global_step": 144896, "epoch": 3449} {"train_loss": -6.556733131408691, "global_step": 144897, "epoch": 3449} {"train_loss": -6.662250518798828, "global_step": 144898, "epoch": 3449} {"train_loss": -6.7343996706463045, "global_step": 144899, "epoch": 3449, "val_loss": 68317.1640625} {"train_loss": -6.684840202331543, "global_step": 144900, "epoch": 3450} {"train_loss": -6.686501502990723, "global_step": 144901, "epoch": 3450} {"train_loss": -6.489416122436523, "global_step": 144902, "epoch": 3450} {"train_loss": -6.651557922363281, "global_step": 144903, "epoch": 3450} {"train_loss": -6.724956512451172, "global_step": 144904, "epoch": 3450} {"train_loss": -6.80251407623291, "global_step": 144905, "epoch": 3450} {"train_loss": -6.628575325012207, "global_step": 144906, "epoch": 3450} {"train_loss": -6.717510223388672, "global_step": 144907, "epoch": 3450} {"train_loss": -6.70233154296875, "global_step": 144908, "epoch": 3450} {"train_loss": -6.678174018859863, "global_step": 144909, "epoch": 3450} {"train_loss": -6.597728729248047, "global_step": 144910, "epoch": 3450} {"train_loss": -6.77008056640625, "global_step": 144911, "epoch": 3450} {"train_loss": -6.7538909912109375, "global_step": 144912, "epoch": 3450} {"train_loss": -6.701472282409668, "global_step": 144913, "epoch": 3450} {"train_loss": -6.772347450256348, "global_step": 144914, "epoch": 3450} {"train_loss": -6.686209678649902, "global_step": 144915, "epoch": 3450} {"train_loss": -6.820032596588135, "global_step": 144916, "epoch": 3450} {"train_loss": -6.738033294677734, "global_step": 144917, "epoch": 3450} {"train_loss": -6.775101184844971, "global_step": 144918, "epoch": 3450} {"train_loss": -6.793098449707031, "global_step": 144919, "epoch": 3450} {"train_loss": -6.799870491027832, "global_step": 144920, "epoch": 3450} {"train_loss": -6.715461730957031, "global_step": 144921, "epoch": 3450} {"train_loss": -6.725201606750488, "global_step": 144922, "epoch": 3450} {"train_loss": -6.718189716339111, "global_step": 144923, "epoch": 3450} {"train_loss": -6.8138532638549805, "global_step": 144924, "epoch": 3450} {"train_loss": -6.799626350402832, "global_step": 144925, "epoch": 3450} {"train_loss": -6.839016437530518, "global_step": 144926, "epoch": 3450} {"train_loss": -6.688755035400391, "global_step": 144927, "epoch": 3450} {"train_loss": -6.6373677253723145, "global_step": 144928, "epoch": 3450} {"train_loss": -6.81039571762085, "global_step": 144929, "epoch": 3450} {"train_loss": -6.776086807250977, "global_step": 144930, "epoch": 3450} {"train_loss": -6.6104888916015625, "global_step": 144931, "epoch": 3450} {"train_loss": -6.7414350509643555, "global_step": 144932, "epoch": 3450} {"train_loss": -6.75185489654541, "global_step": 144933, "epoch": 3450} {"train_loss": -6.58954381942749, "global_step": 144934, "epoch": 3450} {"train_loss": -6.842805862426758, "global_step": 144935, "epoch": 3450} {"train_loss": -6.520528316497803, "global_step": 144936, "epoch": 3450} {"train_loss": -6.74916934967041, "global_step": 144937, "epoch": 3450} {"train_loss": -6.6577863693237305, "global_step": 144938, "epoch": 3450} {"train_loss": -6.568313121795654, "global_step": 144939, "epoch": 3450} {"train_loss": -6.679886817932129, "global_step": 144940, "epoch": 3450} {"train_loss": -6.712167297090803, "global_step": 144941, "epoch": 3450, "train/sim_max_reward_0": 0.23008729878325151, "train/sim_max_reward_1": 0.7544780466845221, "train/sim_max_reward_2": 0.3688236802620569, "train/sim_max_reward_3": 0.13280642813739538, "train/sim_max_reward_4": 0.990195029388121, "train/sim_max_reward_5": 0.976318788078656, "test/sim_max_reward_4400000": 0.16995232881502695, "test/sim_max_reward_4400001": 0.45367311035102487, "test/sim_max_reward_4400002": 0.7639588846085202, "test/sim_max_reward_4400003": 0.9546258206104569, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9245283373712819, "test/sim_max_reward_4400006": 0.9655088271939323, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3237068975279194, "test/sim_max_reward_4400009": 0.9022544740816193, "test/sim_max_reward_4400010": 0.2074389093392638, "test/sim_max_reward_4400011": 0.19645174317826583, "test/sim_max_reward_4400012": 0.5801886926721038, "test/sim_max_reward_4400013": 0.8047325558072568, "test/sim_max_reward_4400014": 0.9242172271172411, "test/sim_max_reward_4400015": 0.07105622720699607, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.22763672189131914, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.944178705717484, "test/sim_max_reward_4400023": 0.9964706898464081, "test/sim_max_reward_4400024": 0.7604586046978256, "test/sim_max_reward_4400025": 0.25555554919651957, "test/sim_max_reward_4400026": 0.00031686768367666734, "test/sim_max_reward_4400027": 0.03888383670673406, "test/sim_max_reward_4400028": 0.75688751901085, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9753952216577529, "test/sim_max_reward_4400031": 0.9392124178783616, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9060231629579962, "test/sim_max_reward_4400034": 0.8763541198800087, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.9422257890839449, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.27948825857431026, "test/sim_max_reward_4400039": 0.9951435658331917, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8571258712949407, "test/sim_max_reward_4400042": 0.9877860851690076, "test/sim_max_reward_4400043": 0.9595162648547574, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9560626538188018, "test/sim_max_reward_4400046": 0.8478562358417431, "test/sim_max_reward_4400047": 0.9685112787624167, "test/sim_max_reward_4400048": 0.7340983419882561, "test/sim_max_reward_4400049": 0.9690586424845957, "train/mean_score": 0.5754515452223339, "test/mean_score": 0.5777954054217141, "val_loss": 68455.6640625} {"train_loss": -6.752455711364746, "global_step": 144942, "epoch": 3451} {"train_loss": -6.6637983322143555, "global_step": 144943, "epoch": 3451} {"train_loss": -6.755084991455078, "global_step": 144944, "epoch": 3451} {"train_loss": -6.837395191192627, "global_step": 144945, "epoch": 3451} {"train_loss": -6.677639961242676, "global_step": 144946, "epoch": 3451} {"train_loss": -6.816463470458984, "global_step": 144947, "epoch": 3451} {"train_loss": -6.759086608886719, "global_step": 144948, "epoch": 3451} {"train_loss": -6.801810264587402, "global_step": 144949, "epoch": 3451} {"train_loss": -6.723065376281738, "global_step": 144950, "epoch": 3451} {"train_loss": -6.724404335021973, "global_step": 144951, "epoch": 3451} {"train_loss": -6.605530738830566, "global_step": 144952, "epoch": 3451} {"train_loss": -6.810870170593262, "global_step": 144953, "epoch": 3451} {"train_loss": -6.670778274536133, "global_step": 144954, "epoch": 3451} {"train_loss": -6.686936378479004, "global_step": 144955, "epoch": 3451} {"train_loss": -6.829954624176025, "global_step": 144956, "epoch": 3451} {"train_loss": -6.69330358505249, "global_step": 144957, "epoch": 3451} {"train_loss": -6.857683181762695, "global_step": 144958, "epoch": 3451} {"train_loss": -6.808477401733398, "global_step": 144959, "epoch": 3451} {"train_loss": -6.67935848236084, "global_step": 144960, "epoch": 3451} {"train_loss": -6.789702892303467, "global_step": 144961, "epoch": 3451} {"train_loss": -6.768882751464844, "global_step": 144962, "epoch": 3451} {"train_loss": -6.817330360412598, "global_step": 144963, "epoch": 3451} {"train_loss": -6.783330917358398, "global_step": 144964, "epoch": 3451} {"train_loss": -6.855774879455566, "global_step": 144965, "epoch": 3451} {"train_loss": -6.78801155090332, "global_step": 144966, "epoch": 3451} {"train_loss": -6.756978988647461, "global_step": 144967, "epoch": 3451} {"train_loss": -6.726981163024902, "global_step": 144968, "epoch": 3451} {"train_loss": -6.891681671142578, "global_step": 144969, "epoch": 3451} {"train_loss": -6.830657958984375, "global_step": 144970, "epoch": 3451} {"train_loss": -6.826854705810547, "global_step": 144971, "epoch": 3451} {"train_loss": -6.7645769119262695, "global_step": 144972, "epoch": 3451} {"train_loss": -6.760140419006348, "global_step": 144973, "epoch": 3451} {"train_loss": -6.820748329162598, "global_step": 144974, "epoch": 3451} {"train_loss": -6.593384265899658, "global_step": 144975, "epoch": 3451} {"train_loss": -6.73319673538208, "global_step": 144976, "epoch": 3451} {"train_loss": -6.829556941986084, "global_step": 144977, "epoch": 3451} {"train_loss": -6.812711715698242, "global_step": 144978, "epoch": 3451} {"train_loss": -6.786332130432129, "global_step": 144979, "epoch": 3451} {"train_loss": -6.827000617980957, "global_step": 144980, "epoch": 3451} {"train_loss": -6.702096939086914, "global_step": 144981, "epoch": 3451} {"train_loss": -6.774547576904297, "global_step": 144982, "epoch": 3451} {"train_loss": -6.764306613377163, "global_step": 144983, "epoch": 3451, "val_loss": 68344.3125} {"train_loss": -6.769752502441406, "global_step": 144984, "epoch": 3452} {"train_loss": -6.797679901123047, "global_step": 144985, "epoch": 3452} {"train_loss": -6.762986183166504, "global_step": 144986, "epoch": 3452} {"train_loss": -6.768499374389648, "global_step": 144987, "epoch": 3452} {"train_loss": -6.862943649291992, "global_step": 144988, "epoch": 3452} {"train_loss": -6.76499080657959, "global_step": 144989, "epoch": 3452} {"train_loss": -6.713559150695801, "global_step": 144990, "epoch": 3452} {"train_loss": -6.810779571533203, "global_step": 144991, "epoch": 3452} {"train_loss": -6.745922088623047, "global_step": 144992, "epoch": 3452} {"train_loss": -6.710325717926025, "global_step": 144993, "epoch": 3452} {"train_loss": -6.774135112762451, "global_step": 144994, "epoch": 3452} {"train_loss": -6.566555976867676, "global_step": 144995, "epoch": 3452} {"train_loss": -6.739449977874756, "global_step": 144996, "epoch": 3452} {"train_loss": -6.779702186584473, "global_step": 144997, "epoch": 3452} {"train_loss": -6.550678730010986, "global_step": 144998, "epoch": 3452} {"train_loss": -6.724087715148926, "global_step": 144999, "epoch": 3452} {"train_loss": -6.631974220275879, "global_step": 145000, "epoch": 3452} {"train_loss": -6.77932596206665, "global_step": 145001, "epoch": 3452} {"train_loss": -6.648202896118164, "global_step": 145002, "epoch": 3452} {"train_loss": -6.725627899169922, "global_step": 145003, "epoch": 3452} {"train_loss": -6.690397262573242, "global_step": 145004, "epoch": 3452} {"train_loss": -6.673533916473389, "global_step": 145005, "epoch": 3452} {"train_loss": -6.759429931640625, "global_step": 145006, "epoch": 3452} {"train_loss": -6.580217361450195, "global_step": 145007, "epoch": 3452} {"train_loss": -6.620141506195068, "global_step": 145008, "epoch": 3452} {"train_loss": -6.760100364685059, "global_step": 145009, "epoch": 3452} {"train_loss": -6.751500606536865, "global_step": 145010, "epoch": 3452} {"train_loss": -6.772394180297852, "global_step": 145011, "epoch": 3452} {"train_loss": -6.701083183288574, "global_step": 145012, "epoch": 3452} {"train_loss": -6.730697154998779, "global_step": 145013, "epoch": 3452} {"train_loss": -6.69964075088501, "global_step": 145014, "epoch": 3452} {"train_loss": -6.680890083312988, "global_step": 145015, "epoch": 3452} {"train_loss": -6.684876918792725, "global_step": 145016, "epoch": 3452} {"train_loss": -6.700688362121582, "global_step": 145017, "epoch": 3452} {"train_loss": -6.6599016189575195, "global_step": 145018, "epoch": 3452} {"train_loss": -6.674735069274902, "global_step": 145019, "epoch": 3452} {"train_loss": -6.736453533172607, "global_step": 145020, "epoch": 3452} {"train_loss": -6.716764450073242, "global_step": 145021, "epoch": 3452} {"train_loss": -6.67004919052124, "global_step": 145022, "epoch": 3452} {"train_loss": -6.727405548095703, "global_step": 145023, "epoch": 3452} {"train_loss": -6.713160037994385, "global_step": 145024, "epoch": 3452} {"train_loss": -6.716919660568237, "global_step": 145025, "epoch": 3452, "val_loss": 68100.765625} {"train_loss": -6.821915626525879, "global_step": 145026, "epoch": 3453} {"train_loss": -6.764690399169922, "global_step": 145027, "epoch": 3453} {"train_loss": -6.719254016876221, "global_step": 145028, "epoch": 3453} {"train_loss": -6.6598711013793945, "global_step": 145029, "epoch": 3453} {"train_loss": -6.754284858703613, "global_step": 145030, "epoch": 3453} {"train_loss": -6.7799835205078125, "global_step": 145031, "epoch": 3453} {"train_loss": -6.796817779541016, "global_step": 145032, "epoch": 3453} {"train_loss": -6.848426818847656, "global_step": 145033, "epoch": 3453} {"train_loss": -6.821067810058594, "global_step": 145034, "epoch": 3453} {"train_loss": -6.845209121704102, "global_step": 145035, "epoch": 3453} {"train_loss": -6.835371971130371, "global_step": 145036, "epoch": 3453} {"train_loss": -6.887661933898926, "global_step": 145037, "epoch": 3453} {"train_loss": -6.827994346618652, "global_step": 145038, "epoch": 3453} {"train_loss": -6.8617987632751465, "global_step": 145039, "epoch": 3453} {"train_loss": -6.817901611328125, "global_step": 145040, "epoch": 3453} {"train_loss": -6.827153205871582, "global_step": 145041, "epoch": 3453} {"train_loss": -6.857059478759766, "global_step": 145042, "epoch": 3453} {"train_loss": -6.879594326019287, "global_step": 145043, "epoch": 3453} {"train_loss": -6.834616661071777, "global_step": 145044, "epoch": 3453} {"train_loss": -6.866399765014648, "global_step": 145045, "epoch": 3453} {"train_loss": -6.8047380447387695, "global_step": 145046, "epoch": 3453} {"train_loss": -6.775999069213867, "global_step": 145047, "epoch": 3453} {"train_loss": -6.750536918640137, "global_step": 145048, "epoch": 3453} {"train_loss": -6.772207260131836, "global_step": 145049, "epoch": 3453} {"train_loss": -6.707863807678223, "global_step": 145050, "epoch": 3453} {"train_loss": -6.694280624389648, "global_step": 145051, "epoch": 3453} {"train_loss": -6.827334403991699, "global_step": 145052, "epoch": 3453} {"train_loss": -6.7029290199279785, "global_step": 145053, "epoch": 3453} {"train_loss": -6.771778106689453, "global_step": 145054, "epoch": 3453} {"train_loss": -6.7622880935668945, "global_step": 145055, "epoch": 3453} {"train_loss": -6.715936660766602, "global_step": 145056, "epoch": 3453} {"train_loss": -6.774844169616699, "global_step": 145057, "epoch": 3453} {"train_loss": -6.735696792602539, "global_step": 145058, "epoch": 3453} {"train_loss": -6.746581554412842, "global_step": 145059, "epoch": 3453} {"train_loss": -6.890199661254883, "global_step": 145060, "epoch": 3453} {"train_loss": -6.531563758850098, "global_step": 145061, "epoch": 3453} {"train_loss": -6.572113990783691, "global_step": 145062, "epoch": 3453} {"train_loss": -6.794519424438477, "global_step": 145063, "epoch": 3453} {"train_loss": -6.689150810241699, "global_step": 145064, "epoch": 3453} {"train_loss": -6.6952056884765625, "global_step": 145065, "epoch": 3453} {"train_loss": -6.702463150024414, "global_step": 145066, "epoch": 3453} {"train_loss": -6.772364979698544, "global_step": 145067, "epoch": 3453, "val_loss": 68459.9140625} {"train_loss": -6.685378074645996, "global_step": 145068, "epoch": 3454} {"train_loss": -6.613123416900635, "global_step": 145069, "epoch": 3454} {"train_loss": -6.7801713943481445, "global_step": 145070, "epoch": 3454} {"train_loss": -6.832789421081543, "global_step": 145071, "epoch": 3454} {"train_loss": -6.736237525939941, "global_step": 145072, "epoch": 3454} {"train_loss": -6.7023468017578125, "global_step": 145073, "epoch": 3454} {"train_loss": -6.796201705932617, "global_step": 145074, "epoch": 3454} {"train_loss": -6.80479621887207, "global_step": 145075, "epoch": 3454} {"train_loss": -6.630072593688965, "global_step": 145076, "epoch": 3454} {"train_loss": -6.845955848693848, "global_step": 145077, "epoch": 3454} {"train_loss": -6.769085884094238, "global_step": 145078, "epoch": 3454} {"train_loss": -6.772725582122803, "global_step": 145079, "epoch": 3454} {"train_loss": -6.744468688964844, "global_step": 145080, "epoch": 3454} {"train_loss": -6.724033355712891, "global_step": 145081, "epoch": 3454} {"train_loss": -6.8036298751831055, "global_step": 145082, "epoch": 3454} {"train_loss": -6.725218772888184, "global_step": 145083, "epoch": 3454} {"train_loss": -6.81901741027832, "global_step": 145084, "epoch": 3454} {"train_loss": -6.709626197814941, "global_step": 145085, "epoch": 3454} {"train_loss": -6.83634090423584, "global_step": 145086, "epoch": 3454} {"train_loss": -6.834027290344238, "global_step": 145087, "epoch": 3454} {"train_loss": -6.751875877380371, "global_step": 145088, "epoch": 3454} {"train_loss": -6.924318313598633, "global_step": 145089, "epoch": 3454} {"train_loss": -6.659511566162109, "global_step": 145090, "epoch": 3454} {"train_loss": -6.762666702270508, "global_step": 145091, "epoch": 3454} {"train_loss": -6.653360843658447, "global_step": 145092, "epoch": 3454} {"train_loss": -6.634531021118164, "global_step": 145093, "epoch": 3454} {"train_loss": -6.748178958892822, "global_step": 145094, "epoch": 3454} {"train_loss": -6.692594528198242, "global_step": 145095, "epoch": 3454} {"train_loss": -6.630486488342285, "global_step": 145096, "epoch": 3454} {"train_loss": -6.832542419433594, "global_step": 145097, "epoch": 3454} {"train_loss": -6.621621131896973, "global_step": 145098, "epoch": 3454} {"train_loss": -6.744106769561768, "global_step": 145099, "epoch": 3454} {"train_loss": -6.667267799377441, "global_step": 145100, "epoch": 3454} {"train_loss": -6.719886302947998, "global_step": 145101, "epoch": 3454} {"train_loss": -6.728764533996582, "global_step": 145102, "epoch": 3454} {"train_loss": -6.657898902893066, "global_step": 145103, "epoch": 3454} {"train_loss": -6.729849815368652, "global_step": 145104, "epoch": 3454} {"train_loss": -6.553900718688965, "global_step": 145105, "epoch": 3454} {"train_loss": -6.675018310546875, "global_step": 145106, "epoch": 3454} {"train_loss": -6.585309982299805, "global_step": 145107, "epoch": 3454} {"train_loss": -6.738585948944092, "global_step": 145108, "epoch": 3454} {"train_loss": -6.724593889145624, "global_step": 145109, "epoch": 3454, "val_loss": 68865.828125} {"train_loss": -6.557121276855469, "global_step": 145110, "epoch": 3455} {"train_loss": -6.702426910400391, "global_step": 145111, "epoch": 3455} {"train_loss": -6.610851287841797, "global_step": 145112, "epoch": 3455} {"train_loss": -6.765746116638184, "global_step": 145113, "epoch": 3455} {"train_loss": -6.534279823303223, "global_step": 145114, "epoch": 3455} {"train_loss": -6.661449909210205, "global_step": 145115, "epoch": 3455} {"train_loss": -6.585309028625488, "global_step": 145116, "epoch": 3455} {"train_loss": -6.707755088806152, "global_step": 145117, "epoch": 3455} {"train_loss": -6.652570724487305, "global_step": 145118, "epoch": 3455} {"train_loss": -6.674288272857666, "global_step": 145119, "epoch": 3455} {"train_loss": -6.550217628479004, "global_step": 145120, "epoch": 3455} {"train_loss": -6.58823299407959, "global_step": 145121, "epoch": 3455} {"train_loss": -6.732704162597656, "global_step": 145122, "epoch": 3455} {"train_loss": -6.7061262130737305, "global_step": 145123, "epoch": 3455} {"train_loss": -6.659484386444092, "global_step": 145124, "epoch": 3455} {"train_loss": -6.668459892272949, "global_step": 145125, "epoch": 3455} {"train_loss": -6.704084396362305, "global_step": 145126, "epoch": 3455} {"train_loss": -6.670108795166016, "global_step": 145127, "epoch": 3455} {"train_loss": -6.620743274688721, "global_step": 145128, "epoch": 3455} {"train_loss": -6.722881317138672, "global_step": 145129, "epoch": 3455} {"train_loss": -6.699089527130127, "global_step": 145130, "epoch": 3455} {"train_loss": -6.671927452087402, "global_step": 145131, "epoch": 3455} {"train_loss": -6.654336929321289, "global_step": 145132, "epoch": 3455} {"train_loss": -6.618917942047119, "global_step": 145133, "epoch": 3455} {"train_loss": -6.657479286193848, "global_step": 145134, "epoch": 3455} {"train_loss": -6.807902812957764, "global_step": 145135, "epoch": 3455} {"train_loss": -6.707144260406494, "global_step": 145136, "epoch": 3455} {"train_loss": -6.70163631439209, "global_step": 145137, "epoch": 3455} {"train_loss": -6.6148576736450195, "global_step": 145138, "epoch": 3455} {"train_loss": -6.822076797485352, "global_step": 145139, "epoch": 3455} {"train_loss": -6.743458271026611, "global_step": 145140, "epoch": 3455} {"train_loss": -6.744181156158447, "global_step": 145141, "epoch": 3455} {"train_loss": -6.712222576141357, "global_step": 145142, "epoch": 3455} {"train_loss": -6.80816125869751, "global_step": 145143, "epoch": 3455} {"train_loss": -6.753334999084473, "global_step": 145144, "epoch": 3455} {"train_loss": -6.78269100189209, "global_step": 145145, "epoch": 3455} {"train_loss": -6.837946891784668, "global_step": 145146, "epoch": 3455} {"train_loss": -6.800031661987305, "global_step": 145147, "epoch": 3455} {"train_loss": -6.856345176696777, "global_step": 145148, "epoch": 3455} {"train_loss": -6.830556869506836, "global_step": 145149, "epoch": 3455} {"train_loss": -6.683877944946289, "global_step": 145150, "epoch": 3455} {"train_loss": -6.701208455221994, "global_step": 145151, "epoch": 3455, "val_loss": 68348.1875} {"train_loss": -6.719420433044434, "global_step": 145152, "epoch": 3456} {"train_loss": -6.8690643310546875, "global_step": 145153, "epoch": 3456} {"train_loss": -6.706747055053711, "global_step": 145154, "epoch": 3456} {"train_loss": -6.529895782470703, "global_step": 145155, "epoch": 3456} {"train_loss": -6.67656135559082, "global_step": 145156, "epoch": 3456} {"train_loss": -6.725316524505615, "global_step": 145157, "epoch": 3456} {"train_loss": -6.833709716796875, "global_step": 145158, "epoch": 3456} {"train_loss": -6.756269454956055, "global_step": 145159, "epoch": 3456} {"train_loss": -6.73799991607666, "global_step": 145160, "epoch": 3456} {"train_loss": -6.703086853027344, "global_step": 145161, "epoch": 3456} {"train_loss": -6.743549346923828, "global_step": 145162, "epoch": 3456} {"train_loss": -6.713773727416992, "global_step": 145163, "epoch": 3456} {"train_loss": -6.755727291107178, "global_step": 145164, "epoch": 3456} {"train_loss": -6.612890243530273, "global_step": 145165, "epoch": 3456} {"train_loss": -6.719764709472656, "global_step": 145166, "epoch": 3456} {"train_loss": -6.618274688720703, "global_step": 145167, "epoch": 3456} {"train_loss": -6.7808074951171875, "global_step": 145168, "epoch": 3456} {"train_loss": -6.795541763305664, "global_step": 145169, "epoch": 3456} {"train_loss": -6.90989875793457, "global_step": 145170, "epoch": 3456} {"train_loss": -6.749250411987305, "global_step": 145171, "epoch": 3456} {"train_loss": -6.729366302490234, "global_step": 145172, "epoch": 3456} {"train_loss": -6.755500793457031, "global_step": 145173, "epoch": 3456} {"train_loss": -6.783949851989746, "global_step": 145174, "epoch": 3456} {"train_loss": -6.909340858459473, "global_step": 145175, "epoch": 3456} {"train_loss": -6.854339122772217, "global_step": 145176, "epoch": 3456} {"train_loss": -6.6876678466796875, "global_step": 145177, "epoch": 3456} {"train_loss": -6.818482398986816, "global_step": 145178, "epoch": 3456} {"train_loss": -6.6935625076293945, "global_step": 145179, "epoch": 3456} {"train_loss": -6.695169925689697, "global_step": 145180, "epoch": 3456} {"train_loss": -6.748942852020264, "global_step": 145181, "epoch": 3456} {"train_loss": -6.766230583190918, "global_step": 145182, "epoch": 3456} {"train_loss": -6.933626174926758, "global_step": 145183, "epoch": 3456} {"train_loss": -6.774325847625732, "global_step": 145184, "epoch": 3456} {"train_loss": -6.7561116218566895, "global_step": 145185, "epoch": 3456} {"train_loss": -6.873104095458984, "global_step": 145186, "epoch": 3456} {"train_loss": -6.761785507202148, "global_step": 145187, "epoch": 3456} {"train_loss": -6.856992721557617, "global_step": 145188, "epoch": 3456} {"train_loss": -6.867925643920898, "global_step": 145189, "epoch": 3456} {"train_loss": -6.784835338592529, "global_step": 145190, "epoch": 3456} {"train_loss": -6.883571624755859, "global_step": 145191, "epoch": 3456} {"train_loss": -6.937167167663574, "global_step": 145192, "epoch": 3456} {"train_loss": -6.770789714086623, "global_step": 145193, "epoch": 3456, "val_loss": 68348.8515625} {"train_loss": -6.791200160980225, "global_step": 145194, "epoch": 3457} {"train_loss": -6.7892327308654785, "global_step": 145195, "epoch": 3457} {"train_loss": -6.861650466918945, "global_step": 145196, "epoch": 3457} {"train_loss": -6.836381912231445, "global_step": 145197, "epoch": 3457} {"train_loss": -6.790278434753418, "global_step": 145198, "epoch": 3457} {"train_loss": -6.786602973937988, "global_step": 145199, "epoch": 3457} {"train_loss": -6.923266410827637, "global_step": 145200, "epoch": 3457} {"train_loss": -6.8137736320495605, "global_step": 145201, "epoch": 3457} {"train_loss": -6.855940818786621, "global_step": 145202, "epoch": 3457} {"train_loss": -6.934478282928467, "global_step": 145203, "epoch": 3457} {"train_loss": -6.847869873046875, "global_step": 145204, "epoch": 3457} {"train_loss": -6.721895694732666, "global_step": 145205, "epoch": 3457} {"train_loss": -6.816050052642822, "global_step": 145206, "epoch": 3457} {"train_loss": -6.844465255737305, "global_step": 145207, "epoch": 3457} {"train_loss": -6.837018966674805, "global_step": 145208, "epoch": 3457} {"train_loss": -6.820428848266602, "global_step": 145209, "epoch": 3457} {"train_loss": -6.823877334594727, "global_step": 145210, "epoch": 3457} {"train_loss": -6.8718791007995605, "global_step": 145211, "epoch": 3457} {"train_loss": -6.877320766448975, "global_step": 145212, "epoch": 3457} {"train_loss": -6.752131938934326, "global_step": 145213, "epoch": 3457} {"train_loss": -6.854987144470215, "global_step": 145214, "epoch": 3457} {"train_loss": -6.864776611328125, "global_step": 145215, "epoch": 3457} {"train_loss": -6.83009147644043, "global_step": 145216, "epoch": 3457} {"train_loss": -6.6782732009887695, "global_step": 145217, "epoch": 3457} {"train_loss": -6.896963119506836, "global_step": 145218, "epoch": 3457} {"train_loss": -6.710097312927246, "global_step": 145219, "epoch": 3457} {"train_loss": -6.805026054382324, "global_step": 145220, "epoch": 3457} {"train_loss": -6.686561107635498, "global_step": 145221, "epoch": 3457} {"train_loss": -6.816186904907227, "global_step": 145222, "epoch": 3457} {"train_loss": -6.745330810546875, "global_step": 145223, "epoch": 3457} {"train_loss": -6.853244781494141, "global_step": 145224, "epoch": 3457} {"train_loss": -6.831116676330566, "global_step": 145225, "epoch": 3457} {"train_loss": -6.834427833557129, "global_step": 145226, "epoch": 3457} {"train_loss": -6.793600082397461, "global_step": 145227, "epoch": 3457} {"train_loss": -6.826045513153076, "global_step": 145228, "epoch": 3457} {"train_loss": -6.818098545074463, "global_step": 145229, "epoch": 3457} {"train_loss": -6.703917503356934, "global_step": 145230, "epoch": 3457} {"train_loss": -6.687048435211182, "global_step": 145231, "epoch": 3457} {"train_loss": -6.668597221374512, "global_step": 145232, "epoch": 3457} {"train_loss": -6.767740249633789, "global_step": 145233, "epoch": 3457} {"train_loss": -6.7070088386535645, "global_step": 145234, "epoch": 3457} {"train_loss": -6.805033275059292, "global_step": 145235, "epoch": 3457, "val_loss": 68311.4921875} {"train_loss": -6.840295314788818, "global_step": 145236, "epoch": 3458} {"train_loss": -6.661088943481445, "global_step": 145237, "epoch": 3458} {"train_loss": -6.773773193359375, "global_step": 145238, "epoch": 3458} {"train_loss": -6.644798278808594, "global_step": 145239, "epoch": 3458} {"train_loss": -6.774108409881592, "global_step": 145240, "epoch": 3458} {"train_loss": -6.805488109588623, "global_step": 145241, "epoch": 3458} {"train_loss": -6.604160308837891, "global_step": 145242, "epoch": 3458} {"train_loss": -6.838929176330566, "global_step": 145243, "epoch": 3458} {"train_loss": -6.6303582191467285, "global_step": 145244, "epoch": 3458} {"train_loss": -6.794573783874512, "global_step": 145245, "epoch": 3458} {"train_loss": -6.770058631896973, "global_step": 145246, "epoch": 3458} {"train_loss": -6.647319793701172, "global_step": 145247, "epoch": 3458} {"train_loss": -6.758773326873779, "global_step": 145248, "epoch": 3458} {"train_loss": -6.7635908126831055, "global_step": 145249, "epoch": 3458} {"train_loss": -6.855410575866699, "global_step": 145250, "epoch": 3458} {"train_loss": -6.719507694244385, "global_step": 145251, "epoch": 3458} {"train_loss": -6.717773914337158, "global_step": 145252, "epoch": 3458} {"train_loss": -6.781260013580322, "global_step": 145253, "epoch": 3458} {"train_loss": -6.725950241088867, "global_step": 145254, "epoch": 3458} {"train_loss": -6.8148956298828125, "global_step": 145255, "epoch": 3458} {"train_loss": -6.767999649047852, "global_step": 145256, "epoch": 3458} {"train_loss": -6.848943710327148, "global_step": 145257, "epoch": 3458} {"train_loss": -6.721900939941406, "global_step": 145258, "epoch": 3458} {"train_loss": -6.718914031982422, "global_step": 145259, "epoch": 3458} {"train_loss": -6.714728832244873, "global_step": 145260, "epoch": 3458} {"train_loss": -6.759400844573975, "global_step": 145261, "epoch": 3458} {"train_loss": -6.742484092712402, "global_step": 145262, "epoch": 3458} {"train_loss": -6.892676830291748, "global_step": 145263, "epoch": 3458} {"train_loss": -6.846108913421631, "global_step": 145264, "epoch": 3458} {"train_loss": -6.81026554107666, "global_step": 145265, "epoch": 3458} {"train_loss": -6.775161266326904, "global_step": 145266, "epoch": 3458} {"train_loss": -6.8230299949646, "global_step": 145267, "epoch": 3458} {"train_loss": -6.8530473709106445, "global_step": 145268, "epoch": 3458} {"train_loss": -6.8572821617126465, "global_step": 145269, "epoch": 3458} {"train_loss": -6.713581085205078, "global_step": 145270, "epoch": 3458} {"train_loss": -6.724369049072266, "global_step": 145271, "epoch": 3458} {"train_loss": -6.7182512283325195, "global_step": 145272, "epoch": 3458} {"train_loss": -6.783975601196289, "global_step": 145273, "epoch": 3458} {"train_loss": -6.813968658447266, "global_step": 145274, "epoch": 3458} {"train_loss": -6.906612396240234, "global_step": 145275, "epoch": 3458} {"train_loss": -6.7659196853637695, "global_step": 145276, "epoch": 3458} {"train_loss": -6.766776334671747, "global_step": 145277, "epoch": 3458, "val_loss": 68470.671875} {"train_loss": -6.744081974029541, "global_step": 145278, "epoch": 3459} {"train_loss": -6.666765213012695, "global_step": 145279, "epoch": 3459} {"train_loss": -6.799410343170166, "global_step": 145280, "epoch": 3459} {"train_loss": -6.81397008895874, "global_step": 145281, "epoch": 3459} {"train_loss": -6.854472637176514, "global_step": 145282, "epoch": 3459} {"train_loss": -6.7778167724609375, "global_step": 145283, "epoch": 3459} {"train_loss": -6.792991638183594, "global_step": 145284, "epoch": 3459} {"train_loss": -6.778156280517578, "global_step": 145285, "epoch": 3459} {"train_loss": -6.736006736755371, "global_step": 145286, "epoch": 3459} {"train_loss": -6.805514335632324, "global_step": 145287, "epoch": 3459} {"train_loss": -6.745107173919678, "global_step": 145288, "epoch": 3459} {"train_loss": -6.808968544006348, "global_step": 145289, "epoch": 3459} {"train_loss": -6.8319902420043945, "global_step": 145290, "epoch": 3459} {"train_loss": -6.832164764404297, "global_step": 145291, "epoch": 3459} {"train_loss": -6.762166500091553, "global_step": 145292, "epoch": 3459} {"train_loss": -6.772026062011719, "global_step": 145293, "epoch": 3459} {"train_loss": -6.5794782638549805, "global_step": 145294, "epoch": 3459} {"train_loss": -6.866246223449707, "global_step": 145295, "epoch": 3459} {"train_loss": -6.76970100402832, "global_step": 145296, "epoch": 3459} {"train_loss": -6.6670942306518555, "global_step": 145297, "epoch": 3459} {"train_loss": -6.71803092956543, "global_step": 145298, "epoch": 3459} {"train_loss": -6.659845352172852, "global_step": 145299, "epoch": 3459} {"train_loss": -6.727373123168945, "global_step": 145300, "epoch": 3459} {"train_loss": -6.511590957641602, "global_step": 145301, "epoch": 3459} {"train_loss": -6.721716403961182, "global_step": 145302, "epoch": 3459} {"train_loss": -6.736777305603027, "global_step": 145303, "epoch": 3459} {"train_loss": -6.471182823181152, "global_step": 145304, "epoch": 3459} {"train_loss": -6.857222557067871, "global_step": 145305, "epoch": 3459} {"train_loss": -6.712084770202637, "global_step": 145306, "epoch": 3459} {"train_loss": -6.679922103881836, "global_step": 145307, "epoch": 3459} {"train_loss": -6.642675876617432, "global_step": 145308, "epoch": 3459} {"train_loss": -6.699192523956299, "global_step": 145309, "epoch": 3459} {"train_loss": -6.767314910888672, "global_step": 145310, "epoch": 3459} {"train_loss": -6.601764678955078, "global_step": 145311, "epoch": 3459} {"train_loss": -6.72081184387207, "global_step": 145312, "epoch": 3459} {"train_loss": -6.71193790435791, "global_step": 145313, "epoch": 3459} {"train_loss": -6.733917236328125, "global_step": 145314, "epoch": 3459} {"train_loss": -6.787182807922363, "global_step": 145315, "epoch": 3459} {"train_loss": -6.638298988342285, "global_step": 145316, "epoch": 3459} {"train_loss": -6.582034111022949, "global_step": 145317, "epoch": 3459} {"train_loss": -6.729576110839844, "global_step": 145318, "epoch": 3459} {"train_loss": -6.724755968366351, "global_step": 145319, "epoch": 3459, "val_loss": 68377.671875} {"train_loss": -6.702488899230957, "global_step": 145320, "epoch": 3460} {"train_loss": -6.654253959655762, "global_step": 145321, "epoch": 3460} {"train_loss": -6.56334114074707, "global_step": 145322, "epoch": 3460} {"train_loss": -6.674481391906738, "global_step": 145323, "epoch": 3460} {"train_loss": -6.706603050231934, "global_step": 145324, "epoch": 3460} {"train_loss": -6.7505412101745605, "global_step": 145325, "epoch": 3460} {"train_loss": -6.675154685974121, "global_step": 145326, "epoch": 3460} {"train_loss": -6.778071403503418, "global_step": 145327, "epoch": 3460} {"train_loss": -6.745021343231201, "global_step": 145328, "epoch": 3460} {"train_loss": -6.6818695068359375, "global_step": 145329, "epoch": 3460} {"train_loss": -6.706746578216553, "global_step": 145330, "epoch": 3460} {"train_loss": -6.754528045654297, "global_step": 145331, "epoch": 3460} {"train_loss": -6.660547256469727, "global_step": 145332, "epoch": 3460} {"train_loss": -6.7256760597229, "global_step": 145333, "epoch": 3460} {"train_loss": -6.5815277099609375, "global_step": 145334, "epoch": 3460} {"train_loss": -6.828350067138672, "global_step": 145335, "epoch": 3460} {"train_loss": -6.750335693359375, "global_step": 145336, "epoch": 3460} {"train_loss": -6.793994426727295, "global_step": 145337, "epoch": 3460} {"train_loss": -6.8239030838012695, "global_step": 145338, "epoch": 3460} {"train_loss": -6.564357280731201, "global_step": 145339, "epoch": 3460} {"train_loss": -6.719176292419434, "global_step": 145340, "epoch": 3460} {"train_loss": -6.604246139526367, "global_step": 145341, "epoch": 3460} {"train_loss": -6.805069923400879, "global_step": 145342, "epoch": 3460} {"train_loss": -6.641045093536377, "global_step": 145343, "epoch": 3460} {"train_loss": -6.730499744415283, "global_step": 145344, "epoch": 3460} {"train_loss": -6.807989597320557, "global_step": 145345, "epoch": 3460} {"train_loss": -6.726323127746582, "global_step": 145346, "epoch": 3460} {"train_loss": -6.768242835998535, "global_step": 145347, "epoch": 3460} {"train_loss": -6.785807132720947, "global_step": 145348, "epoch": 3460} {"train_loss": -6.771759510040283, "global_step": 145349, "epoch": 3460} {"train_loss": -6.786434650421143, "global_step": 145350, "epoch": 3460} {"train_loss": -6.82235050201416, "global_step": 145351, "epoch": 3460} {"train_loss": -6.7992706298828125, "global_step": 145352, "epoch": 3460} {"train_loss": -6.737631797790527, "global_step": 145353, "epoch": 3460} {"train_loss": -6.776419639587402, "global_step": 145354, "epoch": 3460} {"train_loss": -6.896483421325684, "global_step": 145355, "epoch": 3460} {"train_loss": -6.801220893859863, "global_step": 145356, "epoch": 3460} {"train_loss": -6.763280391693115, "global_step": 145357, "epoch": 3460} {"train_loss": -6.802089691162109, "global_step": 145358, "epoch": 3460} {"train_loss": -6.894852638244629, "global_step": 145359, "epoch": 3460} {"train_loss": -6.920297622680664, "global_step": 145360, "epoch": 3460} {"train_loss": -6.744272811072213, "global_step": 145361, "epoch": 3460, "val_loss": 68287.109375} {"train_loss": -6.716578483581543, "global_step": 145362, "epoch": 3461} {"train_loss": -6.69747257232666, "global_step": 145363, "epoch": 3461} {"train_loss": -6.761717796325684, "global_step": 145364, "epoch": 3461} {"train_loss": -6.881507873535156, "global_step": 145365, "epoch": 3461} {"train_loss": -6.772841453552246, "global_step": 145366, "epoch": 3461} {"train_loss": -6.65224552154541, "global_step": 145367, "epoch": 3461} {"train_loss": -6.8643999099731445, "global_step": 145368, "epoch": 3461} {"train_loss": -6.696175575256348, "global_step": 145369, "epoch": 3461} {"train_loss": -6.738689422607422, "global_step": 145370, "epoch": 3461} {"train_loss": -6.817598342895508, "global_step": 145371, "epoch": 3461} {"train_loss": -6.7668681144714355, "global_step": 145372, "epoch": 3461} {"train_loss": -6.771732330322266, "global_step": 145373, "epoch": 3461} {"train_loss": -6.787464618682861, "global_step": 145374, "epoch": 3461} {"train_loss": -6.81596565246582, "global_step": 145375, "epoch": 3461} {"train_loss": -6.8245849609375, "global_step": 145376, "epoch": 3461} {"train_loss": -6.855931758880615, "global_step": 145377, "epoch": 3461} {"train_loss": -6.722293853759766, "global_step": 145378, "epoch": 3461} {"train_loss": -6.720434188842773, "global_step": 145379, "epoch": 3461} {"train_loss": -6.821263313293457, "global_step": 145380, "epoch": 3461} {"train_loss": -6.826379776000977, "global_step": 145381, "epoch": 3461} {"train_loss": -6.882564544677734, "global_step": 145382, "epoch": 3461} {"train_loss": -6.783081531524658, "global_step": 145383, "epoch": 3461} {"train_loss": -6.844537734985352, "global_step": 145384, "epoch": 3461} {"train_loss": -6.8738908767700195, "global_step": 145385, "epoch": 3461} {"train_loss": -6.844277381896973, "global_step": 145386, "epoch": 3461} {"train_loss": -6.717310905456543, "global_step": 145387, "epoch": 3461} {"train_loss": -6.802689552307129, "global_step": 145388, "epoch": 3461} {"train_loss": -6.824466228485107, "global_step": 145389, "epoch": 3461} {"train_loss": -6.821571350097656, "global_step": 145390, "epoch": 3461} {"train_loss": -6.742818832397461, "global_step": 145391, "epoch": 3461} {"train_loss": -6.885148048400879, "global_step": 145392, "epoch": 3461} {"train_loss": -6.755139350891113, "global_step": 145393, "epoch": 3461} {"train_loss": -6.903621673583984, "global_step": 145394, "epoch": 3461} {"train_loss": -6.719586372375488, "global_step": 145395, "epoch": 3461} {"train_loss": -6.894202709197998, "global_step": 145396, "epoch": 3461} {"train_loss": -6.7473249435424805, "global_step": 145397, "epoch": 3461} {"train_loss": -6.873216152191162, "global_step": 145398, "epoch": 3461} {"train_loss": -6.791033744812012, "global_step": 145399, "epoch": 3461} {"train_loss": -6.8309454917907715, "global_step": 145400, "epoch": 3461} {"train_loss": -6.837737560272217, "global_step": 145401, "epoch": 3461} {"train_loss": -6.733423709869385, "global_step": 145402, "epoch": 3461} {"train_loss": -6.7967979453858876, "global_step": 145403, "epoch": 3461, "val_loss": 68444.3984375} {"train_loss": -6.809276103973389, "global_step": 145404, "epoch": 3462} {"train_loss": -6.848973274230957, "global_step": 145405, "epoch": 3462} {"train_loss": -6.735555648803711, "global_step": 145406, "epoch": 3462} {"train_loss": -6.665533065795898, "global_step": 145407, "epoch": 3462} {"train_loss": -6.869049072265625, "global_step": 145408, "epoch": 3462} {"train_loss": -6.687164306640625, "global_step": 145409, "epoch": 3462} {"train_loss": -6.857155799865723, "global_step": 145410, "epoch": 3462} {"train_loss": -6.784950256347656, "global_step": 145411, "epoch": 3462} {"train_loss": -6.731362342834473, "global_step": 145412, "epoch": 3462} {"train_loss": -6.743319034576416, "global_step": 145413, "epoch": 3462} {"train_loss": -6.748705863952637, "global_step": 145414, "epoch": 3462} {"train_loss": -6.7622456550598145, "global_step": 145415, "epoch": 3462} {"train_loss": -6.722071647644043, "global_step": 145416, "epoch": 3462} {"train_loss": -6.732351303100586, "global_step": 145417, "epoch": 3462} {"train_loss": -6.6436944007873535, "global_step": 145418, "epoch": 3462} {"train_loss": -6.730686187744141, "global_step": 145419, "epoch": 3462} {"train_loss": -6.779967784881592, "global_step": 145420, "epoch": 3462} {"train_loss": -6.724664688110352, "global_step": 145421, "epoch": 3462} {"train_loss": -6.813939094543457, "global_step": 145422, "epoch": 3462} {"train_loss": -6.758764266967773, "global_step": 145423, "epoch": 3462} {"train_loss": -6.815418243408203, "global_step": 145424, "epoch": 3462} {"train_loss": -6.790102481842041, "global_step": 145425, "epoch": 3462} {"train_loss": -6.704839706420898, "global_step": 145426, "epoch": 3462} {"train_loss": -6.773815155029297, "global_step": 145427, "epoch": 3462} {"train_loss": -6.762050628662109, "global_step": 145428, "epoch": 3462} {"train_loss": -6.749137878417969, "global_step": 145429, "epoch": 3462} {"train_loss": -6.701700210571289, "global_step": 145430, "epoch": 3462} {"train_loss": -6.7149338722229, "global_step": 145431, "epoch": 3462} {"train_loss": -6.742892742156982, "global_step": 145432, "epoch": 3462} {"train_loss": -6.72054386138916, "global_step": 145433, "epoch": 3462} {"train_loss": -6.889120101928711, "global_step": 145434, "epoch": 3462} {"train_loss": -6.810357570648193, "global_step": 145435, "epoch": 3462} {"train_loss": -6.706146717071533, "global_step": 145436, "epoch": 3462} {"train_loss": -6.853544235229492, "global_step": 145437, "epoch": 3462} {"train_loss": -6.740555763244629, "global_step": 145438, "epoch": 3462} {"train_loss": -6.814589977264404, "global_step": 145439, "epoch": 3462} {"train_loss": -6.734989166259766, "global_step": 145440, "epoch": 3462} {"train_loss": -6.602074146270752, "global_step": 145441, "epoch": 3462} {"train_loss": -6.774325370788574, "global_step": 145442, "epoch": 3462} {"train_loss": -6.730217933654785, "global_step": 145443, "epoch": 3462} {"train_loss": -6.668004512786865, "global_step": 145444, "epoch": 3462} {"train_loss": -6.758234205700102, "global_step": 145445, "epoch": 3462, "val_loss": 68276.5859375} {"train_loss": -6.728841304779053, "global_step": 145446, "epoch": 3463} {"train_loss": -6.712454319000244, "global_step": 145447, "epoch": 3463} {"train_loss": -6.658757209777832, "global_step": 145448, "epoch": 3463} {"train_loss": -6.575052261352539, "global_step": 145449, "epoch": 3463} {"train_loss": -6.849432945251465, "global_step": 145450, "epoch": 3463} {"train_loss": -6.812314510345459, "global_step": 145451, "epoch": 3463} {"train_loss": -6.678478240966797, "global_step": 145452, "epoch": 3463} {"train_loss": -6.775269031524658, "global_step": 145453, "epoch": 3463} {"train_loss": -6.530092239379883, "global_step": 145454, "epoch": 3463} {"train_loss": -6.705931663513184, "global_step": 145455, "epoch": 3463} {"train_loss": -6.533203125, "global_step": 145456, "epoch": 3463} {"train_loss": -6.659824848175049, "global_step": 145457, "epoch": 3463} {"train_loss": -6.708375930786133, "global_step": 145458, "epoch": 3463} {"train_loss": -6.74553918838501, "global_step": 145459, "epoch": 3463} {"train_loss": -6.7707929611206055, "global_step": 145460, "epoch": 3463} {"train_loss": -6.722265243530273, "global_step": 145461, "epoch": 3463} {"train_loss": -6.792261123657227, "global_step": 145462, "epoch": 3463} {"train_loss": -6.817112922668457, "global_step": 145463, "epoch": 3463} {"train_loss": -6.73339319229126, "global_step": 145464, "epoch": 3463} {"train_loss": -6.776089191436768, "global_step": 145465, "epoch": 3463} {"train_loss": -6.73294734954834, "global_step": 145466, "epoch": 3463} {"train_loss": -6.750697135925293, "global_step": 145467, "epoch": 3463} {"train_loss": -6.769637584686279, "global_step": 145468, "epoch": 3463} {"train_loss": -6.654878616333008, "global_step": 145469, "epoch": 3463} {"train_loss": -6.6887922286987305, "global_step": 145470, "epoch": 3463} {"train_loss": -6.6794281005859375, "global_step": 145471, "epoch": 3463} {"train_loss": -6.765957832336426, "global_step": 145472, "epoch": 3463} {"train_loss": -6.688846588134766, "global_step": 145473, "epoch": 3463} {"train_loss": -6.797884941101074, "global_step": 145474, "epoch": 3463} {"train_loss": -6.579110145568848, "global_step": 145475, "epoch": 3463} {"train_loss": -6.717503547668457, "global_step": 145476, "epoch": 3463} {"train_loss": -6.7523884773254395, "global_step": 145477, "epoch": 3463} {"train_loss": -6.746748924255371, "global_step": 145478, "epoch": 3463} {"train_loss": -6.6684417724609375, "global_step": 145479, "epoch": 3463} {"train_loss": -6.790220737457275, "global_step": 145480, "epoch": 3463} {"train_loss": -6.745051860809326, "global_step": 145481, "epoch": 3463} {"train_loss": -6.718022346496582, "global_step": 145482, "epoch": 3463} {"train_loss": -6.652119159698486, "global_step": 145483, "epoch": 3463} {"train_loss": -6.723118782043457, "global_step": 145484, "epoch": 3463} {"train_loss": -6.702901363372803, "global_step": 145485, "epoch": 3463} {"train_loss": -6.802985191345215, "global_step": 145486, "epoch": 3463} {"train_loss": -6.721645911534627, "global_step": 145487, "epoch": 3463, "val_loss": 68218.3046875} {"train_loss": -6.744358062744141, "global_step": 145488, "epoch": 3464} {"train_loss": -6.761488437652588, "global_step": 145489, "epoch": 3464} {"train_loss": -6.62937068939209, "global_step": 145490, "epoch": 3464} {"train_loss": -6.7900495529174805, "global_step": 145491, "epoch": 3464} {"train_loss": -6.855782508850098, "global_step": 145492, "epoch": 3464} {"train_loss": -6.625535011291504, "global_step": 145493, "epoch": 3464} {"train_loss": -6.88126277923584, "global_step": 145494, "epoch": 3464} {"train_loss": -6.763005256652832, "global_step": 145495, "epoch": 3464} {"train_loss": -6.724612712860107, "global_step": 145496, "epoch": 3464} {"train_loss": -6.883782863616943, "global_step": 145497, "epoch": 3464} {"train_loss": -6.797924995422363, "global_step": 145498, "epoch": 3464} {"train_loss": -6.867768287658691, "global_step": 145499, "epoch": 3464} {"train_loss": -6.617681980133057, "global_step": 145500, "epoch": 3464} {"train_loss": -6.687007904052734, "global_step": 145501, "epoch": 3464} {"train_loss": -6.777705192565918, "global_step": 145502, "epoch": 3464} {"train_loss": -6.6363115310668945, "global_step": 145503, "epoch": 3464} {"train_loss": -6.884193420410156, "global_step": 145504, "epoch": 3464} {"train_loss": -6.765722751617432, "global_step": 145505, "epoch": 3464} {"train_loss": -6.764686584472656, "global_step": 145506, "epoch": 3464} {"train_loss": -6.824461936950684, "global_step": 145507, "epoch": 3464} {"train_loss": -6.840296745300293, "global_step": 145508, "epoch": 3464} {"train_loss": -6.718729019165039, "global_step": 145509, "epoch": 3464} {"train_loss": -6.812570571899414, "global_step": 145510, "epoch": 3464} {"train_loss": -6.8425397872924805, "global_step": 145511, "epoch": 3464} {"train_loss": -6.972884178161621, "global_step": 145512, "epoch": 3464} {"train_loss": -6.756674766540527, "global_step": 145513, "epoch": 3464} {"train_loss": -6.718719959259033, "global_step": 145514, "epoch": 3464} {"train_loss": -6.8456220626831055, "global_step": 145515, "epoch": 3464} {"train_loss": -6.651086330413818, "global_step": 145516, "epoch": 3464} {"train_loss": -6.800295829772949, "global_step": 145517, "epoch": 3464} {"train_loss": -6.7178144454956055, "global_step": 145518, "epoch": 3464} {"train_loss": -6.864739418029785, "global_step": 145519, "epoch": 3464} {"train_loss": -6.850157260894775, "global_step": 145520, "epoch": 3464} {"train_loss": -6.920383930206299, "global_step": 145521, "epoch": 3464} {"train_loss": -6.8000946044921875, "global_step": 145522, "epoch": 3464} {"train_loss": -6.833111763000488, "global_step": 145523, "epoch": 3464} {"train_loss": -6.742215156555176, "global_step": 145524, "epoch": 3464} {"train_loss": -6.910884380340576, "global_step": 145525, "epoch": 3464} {"train_loss": -6.8739471435546875, "global_step": 145526, "epoch": 3464} {"train_loss": -6.814340591430664, "global_step": 145527, "epoch": 3464} {"train_loss": -6.8051934242248535, "global_step": 145528, "epoch": 3464} {"train_loss": -6.791153385525658, "global_step": 145529, "epoch": 3464, "val_loss": 68270.2265625} {"train_loss": -6.8998894691467285, "global_step": 145530, "epoch": 3465} {"train_loss": -6.837360858917236, "global_step": 145531, "epoch": 3465} {"train_loss": -6.811407089233398, "global_step": 145532, "epoch": 3465} {"train_loss": -6.79324197769165, "global_step": 145533, "epoch": 3465} {"train_loss": -6.80844783782959, "global_step": 145534, "epoch": 3465} {"train_loss": -6.918760299682617, "global_step": 145535, "epoch": 3465} {"train_loss": -6.910784721374512, "global_step": 145536, "epoch": 3465} {"train_loss": -6.829195022583008, "global_step": 145537, "epoch": 3465} {"train_loss": -6.933321475982666, "global_step": 145538, "epoch": 3465} {"train_loss": -6.707054615020752, "global_step": 145539, "epoch": 3465} {"train_loss": -6.721288204193115, "global_step": 145540, "epoch": 3465} {"train_loss": -6.85282039642334, "global_step": 145541, "epoch": 3465} {"train_loss": -6.819790363311768, "global_step": 145542, "epoch": 3465} {"train_loss": -6.68385124206543, "global_step": 145543, "epoch": 3465} {"train_loss": -6.701991081237793, "global_step": 145544, "epoch": 3465} {"train_loss": -6.846502780914307, "global_step": 145545, "epoch": 3465} {"train_loss": -6.789377212524414, "global_step": 145546, "epoch": 3465} {"train_loss": -6.845166206359863, "global_step": 145547, "epoch": 3465} {"train_loss": -6.655653953552246, "global_step": 145548, "epoch": 3465} {"train_loss": -6.760538101196289, "global_step": 145549, "epoch": 3465} {"train_loss": -6.8318772315979, "global_step": 145550, "epoch": 3465} {"train_loss": -6.761898994445801, "global_step": 145551, "epoch": 3465} {"train_loss": -6.794429302215576, "global_step": 145552, "epoch": 3465} {"train_loss": -6.643818378448486, "global_step": 145553, "epoch": 3465} {"train_loss": -6.661868095397949, "global_step": 145554, "epoch": 3465} {"train_loss": -6.80729866027832, "global_step": 145555, "epoch": 3465} {"train_loss": -6.743107795715332, "global_step": 145556, "epoch": 3465} {"train_loss": -6.821879863739014, "global_step": 145557, "epoch": 3465} {"train_loss": -6.834817886352539, "global_step": 145558, "epoch": 3465} {"train_loss": -6.8255133628845215, "global_step": 145559, "epoch": 3465} {"train_loss": -6.6885762214660645, "global_step": 145560, "epoch": 3465} {"train_loss": -6.639369964599609, "global_step": 145561, "epoch": 3465} {"train_loss": -6.761774063110352, "global_step": 145562, "epoch": 3465} {"train_loss": -6.733953475952148, "global_step": 145563, "epoch": 3465} {"train_loss": -6.827602386474609, "global_step": 145564, "epoch": 3465} {"train_loss": -6.706896781921387, "global_step": 145565, "epoch": 3465} {"train_loss": -6.862454891204834, "global_step": 145566, "epoch": 3465} {"train_loss": -6.822384357452393, "global_step": 145567, "epoch": 3465} {"train_loss": -6.699553489685059, "global_step": 145568, "epoch": 3465} {"train_loss": -6.84989595413208, "global_step": 145569, "epoch": 3465} {"train_loss": -6.785636901855469, "global_step": 145570, "epoch": 3465} {"train_loss": -6.784233604158674, "global_step": 145571, "epoch": 3465, "val_loss": 68281.3125} {"train_loss": -6.696657180786133, "global_step": 145572, "epoch": 3466} {"train_loss": -6.927349090576172, "global_step": 145573, "epoch": 3466} {"train_loss": -6.8968353271484375, "global_step": 145574, "epoch": 3466} {"train_loss": -6.814896106719971, "global_step": 145575, "epoch": 3466} {"train_loss": -6.7543439865112305, "global_step": 145576, "epoch": 3466} {"train_loss": -6.704649925231934, "global_step": 145577, "epoch": 3466} {"train_loss": -6.806758403778076, "global_step": 145578, "epoch": 3466} {"train_loss": -6.710687637329102, "global_step": 145579, "epoch": 3466} {"train_loss": -6.866046905517578, "global_step": 145580, "epoch": 3466} {"train_loss": -6.749900817871094, "global_step": 145581, "epoch": 3466} {"train_loss": -6.818326950073242, "global_step": 145582, "epoch": 3466} {"train_loss": -6.806299686431885, "global_step": 145583, "epoch": 3466} {"train_loss": -6.8312201499938965, "global_step": 145584, "epoch": 3466} {"train_loss": -6.771074295043945, "global_step": 145585, "epoch": 3466} {"train_loss": -6.891045570373535, "global_step": 145586, "epoch": 3466} {"train_loss": -6.821441173553467, "global_step": 145587, "epoch": 3466} {"train_loss": -6.793021202087402, "global_step": 145588, "epoch": 3466} {"train_loss": -6.843904495239258, "global_step": 145589, "epoch": 3466} {"train_loss": -6.740775108337402, "global_step": 145590, "epoch": 3466} {"train_loss": -6.781589984893799, "global_step": 145591, "epoch": 3466} {"train_loss": -6.795527458190918, "global_step": 145592, "epoch": 3466} {"train_loss": -6.719992160797119, "global_step": 145593, "epoch": 3466} {"train_loss": -6.875456809997559, "global_step": 145594, "epoch": 3466} {"train_loss": -6.693575859069824, "global_step": 145595, "epoch": 3466} {"train_loss": -6.77134895324707, "global_step": 145596, "epoch": 3466} {"train_loss": -6.843600273132324, "global_step": 145597, "epoch": 3466} {"train_loss": -6.629223823547363, "global_step": 145598, "epoch": 3466} {"train_loss": -6.765186309814453, "global_step": 145599, "epoch": 3466} {"train_loss": -6.683120250701904, "global_step": 145600, "epoch": 3466} {"train_loss": -6.810271263122559, "global_step": 145601, "epoch": 3466} {"train_loss": -6.825963020324707, "global_step": 145602, "epoch": 3466} {"train_loss": -6.677089691162109, "global_step": 145603, "epoch": 3466} {"train_loss": -6.860992431640625, "global_step": 145604, "epoch": 3466} {"train_loss": -6.74622917175293, "global_step": 145605, "epoch": 3466} {"train_loss": -6.798387050628662, "global_step": 145606, "epoch": 3466} {"train_loss": -6.720372676849365, "global_step": 145607, "epoch": 3466} {"train_loss": -6.627820014953613, "global_step": 145608, "epoch": 3466} {"train_loss": -6.855587959289551, "global_step": 145609, "epoch": 3466} {"train_loss": -6.766089916229248, "global_step": 145610, "epoch": 3466} {"train_loss": -6.7123613357543945, "global_step": 145611, "epoch": 3466} {"train_loss": -6.84223747253418, "global_step": 145612, "epoch": 3466} {"train_loss": -6.780921107246762, "global_step": 145613, "epoch": 3466, "val_loss": 68510.2890625} {"train_loss": -6.8368706703186035, "global_step": 145614, "epoch": 3467} {"train_loss": -6.792030334472656, "global_step": 145615, "epoch": 3467} {"train_loss": -6.849870681762695, "global_step": 145616, "epoch": 3467} {"train_loss": -6.710935592651367, "global_step": 145617, "epoch": 3467} {"train_loss": -6.8009796142578125, "global_step": 145618, "epoch": 3467} {"train_loss": -6.856186389923096, "global_step": 145619, "epoch": 3467} {"train_loss": -6.8943376541137695, "global_step": 145620, "epoch": 3467} {"train_loss": -6.793577194213867, "global_step": 145621, "epoch": 3467} {"train_loss": -6.735601902008057, "global_step": 145622, "epoch": 3467} {"train_loss": -6.847390174865723, "global_step": 145623, "epoch": 3467} {"train_loss": -6.7175397872924805, "global_step": 145624, "epoch": 3467} {"train_loss": -6.712619304656982, "global_step": 145625, "epoch": 3467} {"train_loss": -6.7848334312438965, "global_step": 145626, "epoch": 3467} {"train_loss": -6.724784851074219, "global_step": 145627, "epoch": 3467} {"train_loss": -6.689439296722412, "global_step": 145628, "epoch": 3467} {"train_loss": -6.6839141845703125, "global_step": 145629, "epoch": 3467} {"train_loss": -6.691448211669922, "global_step": 145630, "epoch": 3467} {"train_loss": -6.679518699645996, "global_step": 145631, "epoch": 3467} {"train_loss": -6.619815826416016, "global_step": 145632, "epoch": 3467} {"train_loss": -6.754086971282959, "global_step": 145633, "epoch": 3467} {"train_loss": -6.530811309814453, "global_step": 145634, "epoch": 3467} {"train_loss": -6.640050888061523, "global_step": 145635, "epoch": 3467} {"train_loss": -6.746210098266602, "global_step": 145636, "epoch": 3467} {"train_loss": -6.673110008239746, "global_step": 145637, "epoch": 3467} {"train_loss": -6.768668174743652, "global_step": 145638, "epoch": 3467} {"train_loss": -6.6530866622924805, "global_step": 145639, "epoch": 3467} {"train_loss": -6.668158531188965, "global_step": 145640, "epoch": 3467} {"train_loss": -6.667876720428467, "global_step": 145641, "epoch": 3467} {"train_loss": -6.603607177734375, "global_step": 145642, "epoch": 3467} {"train_loss": -6.705112457275391, "global_step": 145643, "epoch": 3467} {"train_loss": -6.8342976570129395, "global_step": 145644, "epoch": 3467} {"train_loss": -6.7259111404418945, "global_step": 145645, "epoch": 3467} {"train_loss": -6.7365031242370605, "global_step": 145646, "epoch": 3467} {"train_loss": -6.747723579406738, "global_step": 145647, "epoch": 3467} {"train_loss": -6.754504680633545, "global_step": 145648, "epoch": 3467} {"train_loss": -6.737425804138184, "global_step": 145649, "epoch": 3467} {"train_loss": -6.680486679077148, "global_step": 145650, "epoch": 3467} {"train_loss": -6.708857536315918, "global_step": 145651, "epoch": 3467} {"train_loss": -6.713783264160156, "global_step": 145652, "epoch": 3467} {"train_loss": -6.750786781311035, "global_step": 145653, "epoch": 3467} {"train_loss": -6.880864143371582, "global_step": 145654, "epoch": 3467} {"train_loss": -6.736345166251773, "global_step": 145655, "epoch": 3467, "val_loss": 68456.46875} {"train_loss": -6.719438552856445, "global_step": 145656, "epoch": 3468} {"train_loss": -6.786848068237305, "global_step": 145657, "epoch": 3468} {"train_loss": -6.736010551452637, "global_step": 145658, "epoch": 3468} {"train_loss": -6.794898509979248, "global_step": 145659, "epoch": 3468} {"train_loss": -6.559114456176758, "global_step": 145660, "epoch": 3468} {"train_loss": -6.724722862243652, "global_step": 145661, "epoch": 3468} {"train_loss": -6.740067958831787, "global_step": 145662, "epoch": 3468} {"train_loss": -6.6138458251953125, "global_step": 145663, "epoch": 3468} {"train_loss": -6.829058647155762, "global_step": 145664, "epoch": 3468} {"train_loss": -6.622087478637695, "global_step": 145665, "epoch": 3468} {"train_loss": -6.676962852478027, "global_step": 145666, "epoch": 3468} {"train_loss": -6.7543816566467285, "global_step": 145667, "epoch": 3468} {"train_loss": -6.696032524108887, "global_step": 145668, "epoch": 3468} {"train_loss": -6.829294204711914, "global_step": 145669, "epoch": 3468} {"train_loss": -6.677744388580322, "global_step": 145670, "epoch": 3468} {"train_loss": -6.875253677368164, "global_step": 145671, "epoch": 3468} {"train_loss": -6.783919811248779, "global_step": 145672, "epoch": 3468} {"train_loss": -6.773575305938721, "global_step": 145673, "epoch": 3468} {"train_loss": -6.733325958251953, "global_step": 145674, "epoch": 3468} {"train_loss": -6.739147186279297, "global_step": 145675, "epoch": 3468} {"train_loss": -6.79356575012207, "global_step": 145676, "epoch": 3468} {"train_loss": -6.773563385009766, "global_step": 145677, "epoch": 3468} {"train_loss": -6.837456226348877, "global_step": 145678, "epoch": 3468} {"train_loss": -6.631198883056641, "global_step": 145679, "epoch": 3468} {"train_loss": -6.784343719482422, "global_step": 145680, "epoch": 3468} {"train_loss": -6.751344680786133, "global_step": 145681, "epoch": 3468} {"train_loss": -6.743719100952148, "global_step": 145682, "epoch": 3468} {"train_loss": -6.653931140899658, "global_step": 145683, "epoch": 3468} {"train_loss": -6.773245334625244, "global_step": 145684, "epoch": 3468} {"train_loss": -6.783562183380127, "global_step": 145685, "epoch": 3468} {"train_loss": -6.877859592437744, "global_step": 145686, "epoch": 3468} {"train_loss": -6.791157245635986, "global_step": 145687, "epoch": 3468} {"train_loss": -6.864026069641113, "global_step": 145688, "epoch": 3468} {"train_loss": -6.871214866638184, "global_step": 145689, "epoch": 3468} {"train_loss": -6.775646209716797, "global_step": 145690, "epoch": 3468} {"train_loss": -6.811525344848633, "global_step": 145691, "epoch": 3468} {"train_loss": -6.702383995056152, "global_step": 145692, "epoch": 3468} {"train_loss": -6.742083549499512, "global_step": 145693, "epoch": 3468} {"train_loss": -6.808516502380371, "global_step": 145694, "epoch": 3468} {"train_loss": -6.730922698974609, "global_step": 145695, "epoch": 3468} {"train_loss": -6.802436351776123, "global_step": 145696, "epoch": 3468} {"train_loss": -6.7565995170956565, "global_step": 145697, "epoch": 3468, "val_loss": 68382.7734375} {"train_loss": -6.758116722106934, "global_step": 145698, "epoch": 3469} {"train_loss": -6.769986152648926, "global_step": 145699, "epoch": 3469} {"train_loss": -6.767043113708496, "global_step": 145700, "epoch": 3469} {"train_loss": -6.841362953186035, "global_step": 145701, "epoch": 3469} {"train_loss": -6.632009506225586, "global_step": 145702, "epoch": 3469} {"train_loss": -6.671906471252441, "global_step": 145703, "epoch": 3469} {"train_loss": -6.769874572753906, "global_step": 145704, "epoch": 3469} {"train_loss": -6.785815238952637, "global_step": 145705, "epoch": 3469} {"train_loss": -6.699284553527832, "global_step": 145706, "epoch": 3469} {"train_loss": -6.785901069641113, "global_step": 145707, "epoch": 3469} {"train_loss": -6.747378349304199, "global_step": 145708, "epoch": 3469} {"train_loss": -6.829741477966309, "global_step": 145709, "epoch": 3469} {"train_loss": -6.907479286193848, "global_step": 145710, "epoch": 3469} {"train_loss": -6.783243179321289, "global_step": 145711, "epoch": 3469} {"train_loss": -6.801339149475098, "global_step": 145712, "epoch": 3469} {"train_loss": -6.6731343269348145, "global_step": 145713, "epoch": 3469} {"train_loss": -6.673505783081055, "global_step": 145714, "epoch": 3469} {"train_loss": -6.848923206329346, "global_step": 145715, "epoch": 3469} {"train_loss": -6.764492034912109, "global_step": 145716, "epoch": 3469} {"train_loss": -6.704277992248535, "global_step": 145717, "epoch": 3469} {"train_loss": -6.7900543212890625, "global_step": 145718, "epoch": 3469} {"train_loss": -6.718470573425293, "global_step": 145719, "epoch": 3469} {"train_loss": -6.7499918937683105, "global_step": 145720, "epoch": 3469} {"train_loss": -6.8389129638671875, "global_step": 145721, "epoch": 3469} {"train_loss": -6.657169342041016, "global_step": 145722, "epoch": 3469} {"train_loss": -6.785173416137695, "global_step": 145723, "epoch": 3469} {"train_loss": -6.774401664733887, "global_step": 145724, "epoch": 3469} {"train_loss": -6.698848724365234, "global_step": 145725, "epoch": 3469} {"train_loss": -6.76804256439209, "global_step": 145726, "epoch": 3469} {"train_loss": -6.759088516235352, "global_step": 145727, "epoch": 3469} {"train_loss": -6.802180767059326, "global_step": 145728, "epoch": 3469} {"train_loss": -6.624485015869141, "global_step": 145729, "epoch": 3469} {"train_loss": -6.602872848510742, "global_step": 145730, "epoch": 3469} {"train_loss": -6.851553916931152, "global_step": 145731, "epoch": 3469} {"train_loss": -6.696389198303223, "global_step": 145732, "epoch": 3469} {"train_loss": -6.693874359130859, "global_step": 145733, "epoch": 3469} {"train_loss": -6.787613868713379, "global_step": 145734, "epoch": 3469} {"train_loss": -6.839545249938965, "global_step": 145735, "epoch": 3469} {"train_loss": -6.871277332305908, "global_step": 145736, "epoch": 3469} {"train_loss": -6.917153835296631, "global_step": 145737, "epoch": 3469} {"train_loss": -6.7657365798950195, "global_step": 145738, "epoch": 3469} {"train_loss": -6.7615840548560735, "global_step": 145739, "epoch": 3469, "val_loss": 68463.6640625} {"train_loss": -6.854020118713379, "global_step": 145740, "epoch": 3470} {"train_loss": -6.788005828857422, "global_step": 145741, "epoch": 3470} {"train_loss": -6.938980579376221, "global_step": 145742, "epoch": 3470} {"train_loss": -6.794886112213135, "global_step": 145743, "epoch": 3470} {"train_loss": -6.813385009765625, "global_step": 145744, "epoch": 3470} {"train_loss": -6.791916847229004, "global_step": 145745, "epoch": 3470} {"train_loss": -6.953444004058838, "global_step": 145746, "epoch": 3470} {"train_loss": -6.73939323425293, "global_step": 145747, "epoch": 3470} {"train_loss": -6.752298355102539, "global_step": 145748, "epoch": 3470} {"train_loss": -6.818603515625, "global_step": 145749, "epoch": 3470} {"train_loss": -6.847625732421875, "global_step": 145750, "epoch": 3470} {"train_loss": -6.758076190948486, "global_step": 145751, "epoch": 3470} {"train_loss": -6.8058552742004395, "global_step": 145752, "epoch": 3470} {"train_loss": -6.7688446044921875, "global_step": 145753, "epoch": 3470} {"train_loss": -6.803919792175293, "global_step": 145754, "epoch": 3470} {"train_loss": -6.958828926086426, "global_step": 145755, "epoch": 3470} {"train_loss": -6.884912490844727, "global_step": 145756, "epoch": 3470} {"train_loss": -6.877422332763672, "global_step": 145757, "epoch": 3470} {"train_loss": -6.830517768859863, "global_step": 145758, "epoch": 3470} {"train_loss": -6.757854461669922, "global_step": 145759, "epoch": 3470} {"train_loss": -6.873560905456543, "global_step": 145760, "epoch": 3470} {"train_loss": -6.739470481872559, "global_step": 145761, "epoch": 3470} {"train_loss": -6.886482238769531, "global_step": 145762, "epoch": 3470} {"train_loss": -6.811964988708496, "global_step": 145763, "epoch": 3470} {"train_loss": -6.883965015411377, "global_step": 145764, "epoch": 3470} {"train_loss": -6.849237442016602, "global_step": 145765, "epoch": 3470} {"train_loss": -6.819684982299805, "global_step": 145766, "epoch": 3470} {"train_loss": -6.771975517272949, "global_step": 145767, "epoch": 3470} {"train_loss": -6.773131370544434, "global_step": 145768, "epoch": 3470} {"train_loss": -6.9601616859436035, "global_step": 145769, "epoch": 3470} {"train_loss": -6.82887077331543, "global_step": 145770, "epoch": 3470} {"train_loss": -6.904033660888672, "global_step": 145771, "epoch": 3470} {"train_loss": -6.808892250061035, "global_step": 145772, "epoch": 3470} {"train_loss": -6.750453948974609, "global_step": 145773, "epoch": 3470} {"train_loss": -6.8417558670043945, "global_step": 145774, "epoch": 3470} {"train_loss": -6.770014762878418, "global_step": 145775, "epoch": 3470} {"train_loss": -6.754999160766602, "global_step": 145776, "epoch": 3470} {"train_loss": -6.786611557006836, "global_step": 145777, "epoch": 3470} {"train_loss": -6.779664039611816, "global_step": 145778, "epoch": 3470} {"train_loss": -6.7291178703308105, "global_step": 145779, "epoch": 3470} {"train_loss": -6.738454818725586, "global_step": 145780, "epoch": 3470} {"train_loss": -6.816992271514166, "global_step": 145781, "epoch": 3470, "val_loss": 68359.515625} {"train_loss": -6.606490135192871, "global_step": 145782, "epoch": 3471} {"train_loss": -6.7588629722595215, "global_step": 145783, "epoch": 3471} {"train_loss": -6.863578796386719, "global_step": 145784, "epoch": 3471} {"train_loss": -6.71923303604126, "global_step": 145785, "epoch": 3471} {"train_loss": -6.811675548553467, "global_step": 145786, "epoch": 3471} {"train_loss": -6.7080583572387695, "global_step": 145787, "epoch": 3471} {"train_loss": -6.647356033325195, "global_step": 145788, "epoch": 3471} {"train_loss": -6.890631675720215, "global_step": 145789, "epoch": 3471} {"train_loss": -6.698794364929199, "global_step": 145790, "epoch": 3471} {"train_loss": -6.763230323791504, "global_step": 145791, "epoch": 3471} {"train_loss": -6.704034328460693, "global_step": 145792, "epoch": 3471} {"train_loss": -6.724124908447266, "global_step": 145793, "epoch": 3471} {"train_loss": -6.77205228805542, "global_step": 145794, "epoch": 3471} {"train_loss": -6.764381408691406, "global_step": 145795, "epoch": 3471} {"train_loss": -6.84420919418335, "global_step": 145796, "epoch": 3471} {"train_loss": -6.652164936065674, "global_step": 145797, "epoch": 3471} {"train_loss": -6.746058940887451, "global_step": 145798, "epoch": 3471} {"train_loss": -6.773636341094971, "global_step": 145799, "epoch": 3471} {"train_loss": -6.793065071105957, "global_step": 145800, "epoch": 3471} {"train_loss": -6.822144508361816, "global_step": 145801, "epoch": 3471} {"train_loss": -6.837895393371582, "global_step": 145802, "epoch": 3471} {"train_loss": -6.765541076660156, "global_step": 145803, "epoch": 3471} {"train_loss": -6.76776123046875, "global_step": 145804, "epoch": 3471} {"train_loss": -6.704074382781982, "global_step": 145805, "epoch": 3471} {"train_loss": -6.801603317260742, "global_step": 145806, "epoch": 3471} {"train_loss": -6.808992385864258, "global_step": 145807, "epoch": 3471} {"train_loss": -6.72784423828125, "global_step": 145808, "epoch": 3471} {"train_loss": -6.762171268463135, "global_step": 145809, "epoch": 3471} {"train_loss": -6.84592342376709, "global_step": 145810, "epoch": 3471} {"train_loss": -6.773007869720459, "global_step": 145811, "epoch": 3471} {"train_loss": -6.683459758758545, "global_step": 145812, "epoch": 3471} {"train_loss": -6.847352981567383, "global_step": 145813, "epoch": 3471} {"train_loss": -6.612794399261475, "global_step": 145814, "epoch": 3471} {"train_loss": -6.649497985839844, "global_step": 145815, "epoch": 3471} {"train_loss": -6.805764675140381, "global_step": 145816, "epoch": 3471} {"train_loss": -6.703050136566162, "global_step": 145817, "epoch": 3471} {"train_loss": -6.875683784484863, "global_step": 145818, "epoch": 3471} {"train_loss": -6.778755187988281, "global_step": 145819, "epoch": 3471} {"train_loss": -6.687578201293945, "global_step": 145820, "epoch": 3471} {"train_loss": -6.768685340881348, "global_step": 145821, "epoch": 3471} {"train_loss": -6.736679553985596, "global_step": 145822, "epoch": 3471} {"train_loss": -6.756200597399757, "global_step": 145823, "epoch": 3471, "val_loss": 68528.25} {"train_loss": -6.867757797241211, "global_step": 145824, "epoch": 3472} {"train_loss": -6.850523948669434, "global_step": 145825, "epoch": 3472} {"train_loss": -6.82508659362793, "global_step": 145826, "epoch": 3472} {"train_loss": -6.734277248382568, "global_step": 145827, "epoch": 3472} {"train_loss": -6.760509490966797, "global_step": 145828, "epoch": 3472} {"train_loss": -6.9548492431640625, "global_step": 145829, "epoch": 3472} {"train_loss": -6.649178504943848, "global_step": 145830, "epoch": 3472} {"train_loss": -6.745583534240723, "global_step": 145831, "epoch": 3472} {"train_loss": -6.767426490783691, "global_step": 145832, "epoch": 3472} {"train_loss": -6.770788192749023, "global_step": 145833, "epoch": 3472} {"train_loss": -6.850696086883545, "global_step": 145834, "epoch": 3472} {"train_loss": -6.769316673278809, "global_step": 145835, "epoch": 3472} {"train_loss": -6.754546642303467, "global_step": 145836, "epoch": 3472} {"train_loss": -6.871003150939941, "global_step": 145837, "epoch": 3472} {"train_loss": -6.725368022918701, "global_step": 145838, "epoch": 3472} {"train_loss": -6.756253242492676, "global_step": 145839, "epoch": 3472} {"train_loss": -6.831034183502197, "global_step": 145840, "epoch": 3472} {"train_loss": -6.874907970428467, "global_step": 145841, "epoch": 3472} {"train_loss": -6.754775047302246, "global_step": 145842, "epoch": 3472} {"train_loss": -6.814152717590332, "global_step": 145843, "epoch": 3472} {"train_loss": -6.811165809631348, "global_step": 145844, "epoch": 3472} {"train_loss": -6.79135799407959, "global_step": 145845, "epoch": 3472} {"train_loss": -6.903713226318359, "global_step": 145846, "epoch": 3472} {"train_loss": -6.802013874053955, "global_step": 145847, "epoch": 3472} {"train_loss": -6.709782600402832, "global_step": 145848, "epoch": 3472} {"train_loss": -6.902101516723633, "global_step": 145849, "epoch": 3472} {"train_loss": -6.773788928985596, "global_step": 145850, "epoch": 3472} {"train_loss": -6.8556623458862305, "global_step": 145851, "epoch": 3472} {"train_loss": -6.853221893310547, "global_step": 145852, "epoch": 3472} {"train_loss": -6.768633842468262, "global_step": 145853, "epoch": 3472} {"train_loss": -6.783899307250977, "global_step": 145854, "epoch": 3472} {"train_loss": -6.779895782470703, "global_step": 145855, "epoch": 3472} {"train_loss": -6.72985315322876, "global_step": 145856, "epoch": 3472} {"train_loss": -6.7411603927612305, "global_step": 145857, "epoch": 3472} {"train_loss": -6.752062797546387, "global_step": 145858, "epoch": 3472} {"train_loss": -6.760678291320801, "global_step": 145859, "epoch": 3472} {"train_loss": -6.687286853790283, "global_step": 145860, "epoch": 3472} {"train_loss": -6.745954990386963, "global_step": 145861, "epoch": 3472} {"train_loss": -6.808588981628418, "global_step": 145862, "epoch": 3472} {"train_loss": -6.791632652282715, "global_step": 145863, "epoch": 3472} {"train_loss": -6.758382797241211, "global_step": 145864, "epoch": 3472} {"train_loss": -6.791768755231585, "global_step": 145865, "epoch": 3472, "val_loss": 68414.2109375} {"train_loss": -6.702812194824219, "global_step": 145866, "epoch": 3473} {"train_loss": -6.624680519104004, "global_step": 145867, "epoch": 3473} {"train_loss": -6.74691915512085, "global_step": 145868, "epoch": 3473} {"train_loss": -6.507122039794922, "global_step": 145869, "epoch": 3473} {"train_loss": -6.723165035247803, "global_step": 145870, "epoch": 3473} {"train_loss": -6.655791282653809, "global_step": 145871, "epoch": 3473} {"train_loss": -6.540513038635254, "global_step": 145872, "epoch": 3473} {"train_loss": -6.721802234649658, "global_step": 145873, "epoch": 3473} {"train_loss": -6.614945411682129, "global_step": 145874, "epoch": 3473} {"train_loss": -6.713162899017334, "global_step": 145875, "epoch": 3473} {"train_loss": -6.676595687866211, "global_step": 145876, "epoch": 3473} {"train_loss": -6.6499457359313965, "global_step": 145877, "epoch": 3473} {"train_loss": -6.73250675201416, "global_step": 145878, "epoch": 3473} {"train_loss": -6.745550632476807, "global_step": 145879, "epoch": 3473} {"train_loss": -6.6989874839782715, "global_step": 145880, "epoch": 3473} {"train_loss": -6.768914222717285, "global_step": 145881, "epoch": 3473} {"train_loss": -6.685516357421875, "global_step": 145882, "epoch": 3473} {"train_loss": -6.626684188842773, "global_step": 145883, "epoch": 3473} {"train_loss": -6.729729652404785, "global_step": 145884, "epoch": 3473} {"train_loss": -6.757002830505371, "global_step": 145885, "epoch": 3473} {"train_loss": -6.716520309448242, "global_step": 145886, "epoch": 3473} {"train_loss": -6.818727970123291, "global_step": 145887, "epoch": 3473} {"train_loss": -6.658649921417236, "global_step": 145888, "epoch": 3473} {"train_loss": -6.816025733947754, "global_step": 145889, "epoch": 3473} {"train_loss": -6.794958591461182, "global_step": 145890, "epoch": 3473} {"train_loss": -6.6456379890441895, "global_step": 145891, "epoch": 3473} {"train_loss": -6.912309646606445, "global_step": 145892, "epoch": 3473} {"train_loss": -6.749422073364258, "global_step": 145893, "epoch": 3473} {"train_loss": -6.6524858474731445, "global_step": 145894, "epoch": 3473} {"train_loss": -6.790956020355225, "global_step": 145895, "epoch": 3473} {"train_loss": -6.703266143798828, "global_step": 145896, "epoch": 3473} {"train_loss": -6.7470703125, "global_step": 145897, "epoch": 3473} {"train_loss": -6.7756195068359375, "global_step": 145898, "epoch": 3473} {"train_loss": -6.841367721557617, "global_step": 145899, "epoch": 3473} {"train_loss": -6.762453079223633, "global_step": 145900, "epoch": 3473} {"train_loss": -6.638545036315918, "global_step": 145901, "epoch": 3473} {"train_loss": -6.846473693847656, "global_step": 145902, "epoch": 3473} {"train_loss": -6.6933159828186035, "global_step": 145903, "epoch": 3473} {"train_loss": -6.75852632522583, "global_step": 145904, "epoch": 3473} {"train_loss": -6.747798919677734, "global_step": 145905, "epoch": 3473} {"train_loss": -6.80735969543457, "global_step": 145906, "epoch": 3473} {"train_loss": -6.719591856002808, "global_step": 145907, "epoch": 3473, "val_loss": 68588.421875} {"train_loss": -6.765750885009766, "global_step": 145908, "epoch": 3474} {"train_loss": -6.770092964172363, "global_step": 145909, "epoch": 3474} {"train_loss": -6.800812244415283, "global_step": 145910, "epoch": 3474} {"train_loss": -6.669757843017578, "global_step": 145911, "epoch": 3474} {"train_loss": -6.885349750518799, "global_step": 145912, "epoch": 3474} {"train_loss": -6.732427597045898, "global_step": 145913, "epoch": 3474} {"train_loss": -6.607995986938477, "global_step": 145914, "epoch": 3474} {"train_loss": -6.786259651184082, "global_step": 145915, "epoch": 3474} {"train_loss": -6.675985336303711, "global_step": 145916, "epoch": 3474} {"train_loss": -6.672519683837891, "global_step": 145917, "epoch": 3474} {"train_loss": -6.710748195648193, "global_step": 145918, "epoch": 3474} {"train_loss": -6.823345184326172, "global_step": 145919, "epoch": 3474} {"train_loss": -6.711808204650879, "global_step": 145920, "epoch": 3474} {"train_loss": -6.789350509643555, "global_step": 145921, "epoch": 3474} {"train_loss": -6.753127098083496, "global_step": 145922, "epoch": 3474} {"train_loss": -6.748587608337402, "global_step": 145923, "epoch": 3474} {"train_loss": -6.757241725921631, "global_step": 145924, "epoch": 3474} {"train_loss": -6.771509170532227, "global_step": 145925, "epoch": 3474} {"train_loss": -6.722918510437012, "global_step": 145926, "epoch": 3474} {"train_loss": -6.763538360595703, "global_step": 145927, "epoch": 3474} {"train_loss": -6.639933109283447, "global_step": 145928, "epoch": 3474} {"train_loss": -6.763869285583496, "global_step": 145929, "epoch": 3474} {"train_loss": -6.637758255004883, "global_step": 145930, "epoch": 3474} {"train_loss": -6.738003730773926, "global_step": 145931, "epoch": 3474} {"train_loss": -6.5844221115112305, "global_step": 145932, "epoch": 3474} {"train_loss": -6.6462249755859375, "global_step": 145933, "epoch": 3474} {"train_loss": -6.726924896240234, "global_step": 145934, "epoch": 3474} {"train_loss": -6.570346832275391, "global_step": 145935, "epoch": 3474} {"train_loss": -6.8231282234191895, "global_step": 145936, "epoch": 3474} {"train_loss": -6.564435958862305, "global_step": 145937, "epoch": 3474} {"train_loss": -6.694947242736816, "global_step": 145938, "epoch": 3474} {"train_loss": -6.780686378479004, "global_step": 145939, "epoch": 3474} {"train_loss": -6.6709465980529785, "global_step": 145940, "epoch": 3474} {"train_loss": -6.852239608764648, "global_step": 145941, "epoch": 3474} {"train_loss": -6.656896591186523, "global_step": 145942, "epoch": 3474} {"train_loss": -6.745258331298828, "global_step": 145943, "epoch": 3474} {"train_loss": -6.690709114074707, "global_step": 145944, "epoch": 3474} {"train_loss": -6.729977607727051, "global_step": 145945, "epoch": 3474} {"train_loss": -6.836496353149414, "global_step": 145946, "epoch": 3474} {"train_loss": -6.8033246994018555, "global_step": 145947, "epoch": 3474} {"train_loss": -6.755783557891846, "global_step": 145948, "epoch": 3474} {"train_loss": -6.730550958996727, "global_step": 145949, "epoch": 3474, "val_loss": 68256.078125} {"train_loss": -6.750304698944092, "global_step": 145950, "epoch": 3475} {"train_loss": -6.850193977355957, "global_step": 145951, "epoch": 3475} {"train_loss": -6.637019634246826, "global_step": 145952, "epoch": 3475} {"train_loss": -6.62794828414917, "global_step": 145953, "epoch": 3475} {"train_loss": -6.775379657745361, "global_step": 145954, "epoch": 3475} {"train_loss": -6.616869926452637, "global_step": 145955, "epoch": 3475} {"train_loss": -6.915976524353027, "global_step": 145956, "epoch": 3475} {"train_loss": -6.779219627380371, "global_step": 145957, "epoch": 3475} {"train_loss": -6.701542854309082, "global_step": 145958, "epoch": 3475} {"train_loss": -6.8192901611328125, "global_step": 145959, "epoch": 3475} {"train_loss": -6.682568073272705, "global_step": 145960, "epoch": 3475} {"train_loss": -6.852605819702148, "global_step": 145961, "epoch": 3475} {"train_loss": -6.759055137634277, "global_step": 145962, "epoch": 3475} {"train_loss": -6.67928409576416, "global_step": 145963, "epoch": 3475} {"train_loss": -6.673591613769531, "global_step": 145964, "epoch": 3475} {"train_loss": -6.829058647155762, "global_step": 145965, "epoch": 3475} {"train_loss": -6.793566703796387, "global_step": 145966, "epoch": 3475} {"train_loss": -6.708994388580322, "global_step": 145967, "epoch": 3475} {"train_loss": -6.669377326965332, "global_step": 145968, "epoch": 3475} {"train_loss": -6.878681182861328, "global_step": 145969, "epoch": 3475} {"train_loss": -6.656219482421875, "global_step": 145970, "epoch": 3475} {"train_loss": -6.82841682434082, "global_step": 145971, "epoch": 3475} {"train_loss": -6.794097423553467, "global_step": 145972, "epoch": 3475} {"train_loss": -6.785882472991943, "global_step": 145973, "epoch": 3475} {"train_loss": -6.747868537902832, "global_step": 145974, "epoch": 3475} {"train_loss": -6.813307285308838, "global_step": 145975, "epoch": 3475} {"train_loss": -6.761598587036133, "global_step": 145976, "epoch": 3475} {"train_loss": -6.791044235229492, "global_step": 145977, "epoch": 3475} {"train_loss": -6.7068681716918945, "global_step": 145978, "epoch": 3475} {"train_loss": -6.82273006439209, "global_step": 145979, "epoch": 3475} {"train_loss": -6.732452392578125, "global_step": 145980, "epoch": 3475} {"train_loss": -6.812352180480957, "global_step": 145981, "epoch": 3475} {"train_loss": -6.861475467681885, "global_step": 145982, "epoch": 3475} {"train_loss": -6.873319625854492, "global_step": 145983, "epoch": 3475} {"train_loss": -6.896063804626465, "global_step": 145984, "epoch": 3475} {"train_loss": -6.829315185546875, "global_step": 145985, "epoch": 3475} {"train_loss": -6.724969863891602, "global_step": 145986, "epoch": 3475} {"train_loss": -6.791487216949463, "global_step": 145987, "epoch": 3475} {"train_loss": -6.730032920837402, "global_step": 145988, "epoch": 3475} {"train_loss": -6.818179130554199, "global_step": 145989, "epoch": 3475} {"train_loss": -6.898106575012207, "global_step": 145990, "epoch": 3475} {"train_loss": -6.7747107573917935, "global_step": 145991, "epoch": 3475, "val_loss": 68185.7421875} {"train_loss": -6.884776592254639, "global_step": 145992, "epoch": 3476} {"train_loss": -6.817086219787598, "global_step": 145993, "epoch": 3476} {"train_loss": -6.687451362609863, "global_step": 145994, "epoch": 3476} {"train_loss": -6.815360069274902, "global_step": 145995, "epoch": 3476} {"train_loss": -6.783926963806152, "global_step": 145996, "epoch": 3476} {"train_loss": -6.833328723907471, "global_step": 145997, "epoch": 3476} {"train_loss": -6.81843900680542, "global_step": 145998, "epoch": 3476} {"train_loss": -6.773899078369141, "global_step": 145999, "epoch": 3476} {"train_loss": -6.8275556564331055, "global_step": 146000, "epoch": 3476} {"train_loss": -6.747635841369629, "global_step": 146001, "epoch": 3476} {"train_loss": -6.85163688659668, "global_step": 146002, "epoch": 3476} {"train_loss": -6.685908317565918, "global_step": 146003, "epoch": 3476} {"train_loss": -6.703998565673828, "global_step": 146004, "epoch": 3476} {"train_loss": -6.671333312988281, "global_step": 146005, "epoch": 3476} {"train_loss": -6.692498683929443, "global_step": 146006, "epoch": 3476} {"train_loss": -6.853533744812012, "global_step": 146007, "epoch": 3476} {"train_loss": -6.789813995361328, "global_step": 146008, "epoch": 3476} {"train_loss": -6.615784168243408, "global_step": 146009, "epoch": 3476} {"train_loss": -6.713400840759277, "global_step": 146010, "epoch": 3476} {"train_loss": -6.7151336669921875, "global_step": 146011, "epoch": 3476} {"train_loss": -6.705420017242432, "global_step": 146012, "epoch": 3476} {"train_loss": -6.790676116943359, "global_step": 146013, "epoch": 3476} {"train_loss": -6.623820781707764, "global_step": 146014, "epoch": 3476} {"train_loss": -6.774615287780762, "global_step": 146015, "epoch": 3476} {"train_loss": -6.632697105407715, "global_step": 146016, "epoch": 3476} {"train_loss": -6.707175254821777, "global_step": 146017, "epoch": 3476} {"train_loss": -6.732609272003174, "global_step": 146018, "epoch": 3476} {"train_loss": -6.560117721557617, "global_step": 146019, "epoch": 3476} {"train_loss": -6.723076820373535, "global_step": 146020, "epoch": 3476} {"train_loss": -6.630245685577393, "global_step": 146021, "epoch": 3476} {"train_loss": -6.668877124786377, "global_step": 146022, "epoch": 3476} {"train_loss": -6.791415214538574, "global_step": 146023, "epoch": 3476} {"train_loss": -6.881756782531738, "global_step": 146024, "epoch": 3476} {"train_loss": -6.8265275955200195, "global_step": 146025, "epoch": 3476} {"train_loss": -6.779694080352783, "global_step": 146026, "epoch": 3476} {"train_loss": -6.779699325561523, "global_step": 146027, "epoch": 3476} {"train_loss": -6.674102783203125, "global_step": 146028, "epoch": 3476} {"train_loss": -6.820956707000732, "global_step": 146029, "epoch": 3476} {"train_loss": -6.792111873626709, "global_step": 146030, "epoch": 3476} {"train_loss": -6.826897144317627, "global_step": 146031, "epoch": 3476} {"train_loss": -6.74044132232666, "global_step": 146032, "epoch": 3476} {"train_loss": -6.749951782680693, "global_step": 146033, "epoch": 3476, "val_loss": 68334.34375} {"train_loss": -6.882743835449219, "global_step": 146034, "epoch": 3477} {"train_loss": -6.7972540855407715, "global_step": 146035, "epoch": 3477} {"train_loss": -6.749286651611328, "global_step": 146036, "epoch": 3477} {"train_loss": -6.742961883544922, "global_step": 146037, "epoch": 3477} {"train_loss": -6.814617156982422, "global_step": 146038, "epoch": 3477} {"train_loss": -6.90201473236084, "global_step": 146039, "epoch": 3477} {"train_loss": -6.740710258483887, "global_step": 146040, "epoch": 3477} {"train_loss": -6.848512172698975, "global_step": 146041, "epoch": 3477} {"train_loss": -6.85001277923584, "global_step": 146042, "epoch": 3477} {"train_loss": -6.656118869781494, "global_step": 146043, "epoch": 3477} {"train_loss": -6.908758163452148, "global_step": 146044, "epoch": 3477} {"train_loss": -6.7978410720825195, "global_step": 146045, "epoch": 3477} {"train_loss": -6.829981803894043, "global_step": 146046, "epoch": 3477} {"train_loss": -6.885568618774414, "global_step": 146047, "epoch": 3477} {"train_loss": -6.916468620300293, "global_step": 146048, "epoch": 3477} {"train_loss": -6.7925825119018555, "global_step": 146049, "epoch": 3477} {"train_loss": -6.848903656005859, "global_step": 146050, "epoch": 3477} {"train_loss": -6.742301940917969, "global_step": 146051, "epoch": 3477} {"train_loss": -6.812503814697266, "global_step": 146052, "epoch": 3477} {"train_loss": -6.8640336990356445, "global_step": 146053, "epoch": 3477} {"train_loss": -6.866947650909424, "global_step": 146054, "epoch": 3477} {"train_loss": -6.770337104797363, "global_step": 146055, "epoch": 3477} {"train_loss": -6.894419193267822, "global_step": 146056, "epoch": 3477} {"train_loss": -6.858628273010254, "global_step": 146057, "epoch": 3477} {"train_loss": -6.747306823730469, "global_step": 146058, "epoch": 3477} {"train_loss": -6.752964019775391, "global_step": 146059, "epoch": 3477} {"train_loss": -6.826542854309082, "global_step": 146060, "epoch": 3477} {"train_loss": -6.80663537979126, "global_step": 146061, "epoch": 3477} {"train_loss": -6.976535797119141, "global_step": 146062, "epoch": 3477} {"train_loss": -6.840502738952637, "global_step": 146063, "epoch": 3477} {"train_loss": -6.7288007736206055, "global_step": 146064, "epoch": 3477} {"train_loss": -6.704375267028809, "global_step": 146065, "epoch": 3477} {"train_loss": -6.829944133758545, "global_step": 146066, "epoch": 3477} {"train_loss": -6.830931663513184, "global_step": 146067, "epoch": 3477} {"train_loss": -6.8043365478515625, "global_step": 146068, "epoch": 3477} {"train_loss": -6.793411731719971, "global_step": 146069, "epoch": 3477} {"train_loss": -6.721811294555664, "global_step": 146070, "epoch": 3477} {"train_loss": -6.840070724487305, "global_step": 146071, "epoch": 3477} {"train_loss": -6.821493148803711, "global_step": 146072, "epoch": 3477} {"train_loss": -6.839922904968262, "global_step": 146073, "epoch": 3477} {"train_loss": -6.849522590637207, "global_step": 146074, "epoch": 3477} {"train_loss": -6.81551768666222, "global_step": 146075, "epoch": 3477, "val_loss": 68523.828125} {"train_loss": -6.721146583557129, "global_step": 146076, "epoch": 3478} {"train_loss": -6.699183940887451, "global_step": 146077, "epoch": 3478} {"train_loss": -6.845231056213379, "global_step": 146078, "epoch": 3478} {"train_loss": -6.736083030700684, "global_step": 146079, "epoch": 3478} {"train_loss": -6.71850061416626, "global_step": 146080, "epoch": 3478} {"train_loss": -6.830671787261963, "global_step": 146081, "epoch": 3478} {"train_loss": -6.766817092895508, "global_step": 146082, "epoch": 3478} {"train_loss": -6.678533554077148, "global_step": 146083, "epoch": 3478} {"train_loss": -6.759366989135742, "global_step": 146084, "epoch": 3478} {"train_loss": -6.728603363037109, "global_step": 146085, "epoch": 3478} {"train_loss": -6.69205379486084, "global_step": 146086, "epoch": 3478} {"train_loss": -6.810337066650391, "global_step": 146087, "epoch": 3478} {"train_loss": -6.805642127990723, "global_step": 146088, "epoch": 3478} {"train_loss": -6.740348815917969, "global_step": 146089, "epoch": 3478} {"train_loss": -6.779841899871826, "global_step": 146090, "epoch": 3478} {"train_loss": -6.746277809143066, "global_step": 146091, "epoch": 3478} {"train_loss": -6.773121356964111, "global_step": 146092, "epoch": 3478} {"train_loss": -6.749503135681152, "global_step": 146093, "epoch": 3478} {"train_loss": -6.75476598739624, "global_step": 146094, "epoch": 3478} {"train_loss": -6.82462215423584, "global_step": 146095, "epoch": 3478} {"train_loss": -6.763909339904785, "global_step": 146096, "epoch": 3478} {"train_loss": -6.852665901184082, "global_step": 146097, "epoch": 3478} {"train_loss": -6.674781322479248, "global_step": 146098, "epoch": 3478} {"train_loss": -6.8418073654174805, "global_step": 146099, "epoch": 3478} {"train_loss": -6.863893032073975, "global_step": 146100, "epoch": 3478} {"train_loss": -6.824457168579102, "global_step": 146101, "epoch": 3478} {"train_loss": -6.907839775085449, "global_step": 146102, "epoch": 3478} {"train_loss": -6.8518877029418945, "global_step": 146103, "epoch": 3478} {"train_loss": -6.7913055419921875, "global_step": 146104, "epoch": 3478} {"train_loss": -6.778474807739258, "global_step": 146105, "epoch": 3478} {"train_loss": -6.769951343536377, "global_step": 146106, "epoch": 3478} {"train_loss": -6.831467628479004, "global_step": 146107, "epoch": 3478} {"train_loss": -6.899083614349365, "global_step": 146108, "epoch": 3478} {"train_loss": -6.762327194213867, "global_step": 146109, "epoch": 3478} {"train_loss": -6.9528398513793945, "global_step": 146110, "epoch": 3478} {"train_loss": -6.908277988433838, "global_step": 146111, "epoch": 3478} {"train_loss": -6.80139684677124, "global_step": 146112, "epoch": 3478} {"train_loss": -6.823050498962402, "global_step": 146113, "epoch": 3478} {"train_loss": -6.794370651245117, "global_step": 146114, "epoch": 3478} {"train_loss": -6.815616607666016, "global_step": 146115, "epoch": 3478} {"train_loss": -6.831718444824219, "global_step": 146116, "epoch": 3478} {"train_loss": -6.793196678161621, "global_step": 146117, "epoch": 3478, "val_loss": 68348.640625} {"train_loss": -6.865473747253418, "global_step": 146118, "epoch": 3479} {"train_loss": -6.787352561950684, "global_step": 146119, "epoch": 3479} {"train_loss": -6.729220867156982, "global_step": 146120, "epoch": 3479} {"train_loss": -6.839607238769531, "global_step": 146121, "epoch": 3479} {"train_loss": -6.792135238647461, "global_step": 146122, "epoch": 3479} {"train_loss": -6.785346031188965, "global_step": 146123, "epoch": 3479} {"train_loss": -6.737548828125, "global_step": 146124, "epoch": 3479} {"train_loss": -6.772451877593994, "global_step": 146125, "epoch": 3479} {"train_loss": -6.734378814697266, "global_step": 146126, "epoch": 3479} {"train_loss": -6.732669830322266, "global_step": 146127, "epoch": 3479} {"train_loss": -6.819164276123047, "global_step": 146128, "epoch": 3479} {"train_loss": -6.722419738769531, "global_step": 146129, "epoch": 3479} {"train_loss": -6.657097816467285, "global_step": 146130, "epoch": 3479} {"train_loss": -6.658416748046875, "global_step": 146131, "epoch": 3479} {"train_loss": -6.621641159057617, "global_step": 146132, "epoch": 3479} {"train_loss": -6.63994026184082, "global_step": 146133, "epoch": 3479} {"train_loss": -6.759478569030762, "global_step": 146134, "epoch": 3479} {"train_loss": -6.857646942138672, "global_step": 146135, "epoch": 3479} {"train_loss": -6.653681755065918, "global_step": 146136, "epoch": 3479} {"train_loss": -6.685770034790039, "global_step": 146137, "epoch": 3479} {"train_loss": -6.787543773651123, "global_step": 146138, "epoch": 3479} {"train_loss": -6.737004280090332, "global_step": 146139, "epoch": 3479} {"train_loss": -6.66609525680542, "global_step": 146140, "epoch": 3479} {"train_loss": -6.81620979309082, "global_step": 146141, "epoch": 3479} {"train_loss": -6.816519737243652, "global_step": 146142, "epoch": 3479} {"train_loss": -6.642553329467773, "global_step": 146143, "epoch": 3479} {"train_loss": -6.698208808898926, "global_step": 146144, "epoch": 3479} {"train_loss": -6.70926570892334, "global_step": 146145, "epoch": 3479} {"train_loss": -6.736807823181152, "global_step": 146146, "epoch": 3479} {"train_loss": -6.866184234619141, "global_step": 146147, "epoch": 3479} {"train_loss": -6.814630508422852, "global_step": 146148, "epoch": 3479} {"train_loss": -6.787844657897949, "global_step": 146149, "epoch": 3479} {"train_loss": -6.722269535064697, "global_step": 146150, "epoch": 3479} {"train_loss": -6.645144939422607, "global_step": 146151, "epoch": 3479} {"train_loss": -6.732116222381592, "global_step": 146152, "epoch": 3479} {"train_loss": -6.817958354949951, "global_step": 146153, "epoch": 3479} {"train_loss": -6.750050067901611, "global_step": 146154, "epoch": 3479} {"train_loss": -6.763134002685547, "global_step": 146155, "epoch": 3479} {"train_loss": -6.810266494750977, "global_step": 146156, "epoch": 3479} {"train_loss": -6.809113502502441, "global_step": 146157, "epoch": 3479} {"train_loss": -6.723703384399414, "global_step": 146158, "epoch": 3479} {"train_loss": -6.74958932967413, "global_step": 146159, "epoch": 3479, "val_loss": 68584.359375} {"train_loss": -6.778440952301025, "global_step": 146160, "epoch": 3480} {"train_loss": -6.811633586883545, "global_step": 146161, "epoch": 3480} {"train_loss": -6.71408748626709, "global_step": 146162, "epoch": 3480} {"train_loss": -6.815886497497559, "global_step": 146163, "epoch": 3480} {"train_loss": -6.822500705718994, "global_step": 146164, "epoch": 3480} {"train_loss": -6.8317036628723145, "global_step": 146165, "epoch": 3480} {"train_loss": -6.810910224914551, "global_step": 146166, "epoch": 3480} {"train_loss": -6.7532453536987305, "global_step": 146167, "epoch": 3480} {"train_loss": -6.876150131225586, "global_step": 146168, "epoch": 3480} {"train_loss": -6.743852615356445, "global_step": 146169, "epoch": 3480} {"train_loss": -6.893304824829102, "global_step": 146170, "epoch": 3480} {"train_loss": -6.930408000946045, "global_step": 146171, "epoch": 3480} {"train_loss": -6.915889739990234, "global_step": 146172, "epoch": 3480} {"train_loss": -6.833224296569824, "global_step": 146173, "epoch": 3480} {"train_loss": -6.862722396850586, "global_step": 146174, "epoch": 3480} {"train_loss": -6.904176712036133, "global_step": 146175, "epoch": 3480} {"train_loss": -6.942791938781738, "global_step": 146176, "epoch": 3480} {"train_loss": -6.904997825622559, "global_step": 146177, "epoch": 3480} {"train_loss": -6.818936824798584, "global_step": 146178, "epoch": 3480} {"train_loss": -6.773839950561523, "global_step": 146179, "epoch": 3480} {"train_loss": -6.7709059715271, "global_step": 146180, "epoch": 3480} {"train_loss": -6.803800582885742, "global_step": 146181, "epoch": 3480} {"train_loss": -6.679128646850586, "global_step": 146182, "epoch": 3480} {"train_loss": -6.700137138366699, "global_step": 146183, "epoch": 3480} {"train_loss": -6.619660377502441, "global_step": 146184, "epoch": 3480} {"train_loss": -6.838690757751465, "global_step": 146185, "epoch": 3480} {"train_loss": -6.861018180847168, "global_step": 146186, "epoch": 3480} {"train_loss": -6.816036224365234, "global_step": 146187, "epoch": 3480} {"train_loss": -6.851090431213379, "global_step": 146188, "epoch": 3480} {"train_loss": -6.773595809936523, "global_step": 146189, "epoch": 3480} {"train_loss": -6.795618057250977, "global_step": 146190, "epoch": 3480} {"train_loss": -6.875578880310059, "global_step": 146191, "epoch": 3480} {"train_loss": -6.764011383056641, "global_step": 146192, "epoch": 3480} {"train_loss": -6.795043468475342, "global_step": 146193, "epoch": 3480} {"train_loss": -6.905304908752441, "global_step": 146194, "epoch": 3480} {"train_loss": -6.8933539390563965, "global_step": 146195, "epoch": 3480} {"train_loss": -6.808925628662109, "global_step": 146196, "epoch": 3480} {"train_loss": -6.833754539489746, "global_step": 146197, "epoch": 3480} {"train_loss": -6.820245265960693, "global_step": 146198, "epoch": 3480} {"train_loss": -6.8160319328308105, "global_step": 146199, "epoch": 3480} {"train_loss": -6.816405773162842, "global_step": 146200, "epoch": 3480} {"train_loss": -6.8161693300519675, "global_step": 146201, "epoch": 3480, "val_loss": 68354.0859375} {"train_loss": -6.834573745727539, "global_step": 146202, "epoch": 3481} {"train_loss": -6.81471586227417, "global_step": 146203, "epoch": 3481} {"train_loss": -6.8561577796936035, "global_step": 146204, "epoch": 3481} {"train_loss": -6.907190322875977, "global_step": 146205, "epoch": 3481} {"train_loss": -6.809125900268555, "global_step": 146206, "epoch": 3481} {"train_loss": -6.832912445068359, "global_step": 146207, "epoch": 3481} {"train_loss": -6.824288845062256, "global_step": 146208, "epoch": 3481} {"train_loss": -6.751168251037598, "global_step": 146209, "epoch": 3481} {"train_loss": -6.935931205749512, "global_step": 146210, "epoch": 3481} {"train_loss": -6.760426998138428, "global_step": 146211, "epoch": 3481} {"train_loss": -6.666294097900391, "global_step": 146212, "epoch": 3481} {"train_loss": -6.793604850769043, "global_step": 146213, "epoch": 3481} {"train_loss": -6.736993789672852, "global_step": 146214, "epoch": 3481} {"train_loss": -6.831674575805664, "global_step": 146215, "epoch": 3481} {"train_loss": -6.821218013763428, "global_step": 146216, "epoch": 3481} {"train_loss": -6.8520917892456055, "global_step": 146217, "epoch": 3481} {"train_loss": -6.859208106994629, "global_step": 146218, "epoch": 3481} {"train_loss": -6.815598487854004, "global_step": 146219, "epoch": 3481} {"train_loss": -6.780474662780762, "global_step": 146220, "epoch": 3481} {"train_loss": -6.668245792388916, "global_step": 146221, "epoch": 3481} {"train_loss": -6.693090438842773, "global_step": 146222, "epoch": 3481} {"train_loss": -6.704967498779297, "global_step": 146223, "epoch": 3481} {"train_loss": -6.687240123748779, "global_step": 146224, "epoch": 3481} {"train_loss": -6.683244705200195, "global_step": 146225, "epoch": 3481} {"train_loss": -6.859333038330078, "global_step": 146226, "epoch": 3481} {"train_loss": -6.765478134155273, "global_step": 146227, "epoch": 3481} {"train_loss": -6.737048149108887, "global_step": 146228, "epoch": 3481} {"train_loss": -6.8037309646606445, "global_step": 146229, "epoch": 3481} {"train_loss": -6.74685525894165, "global_step": 146230, "epoch": 3481} {"train_loss": -6.69650936126709, "global_step": 146231, "epoch": 3481} {"train_loss": -6.755349159240723, "global_step": 146232, "epoch": 3481} {"train_loss": -6.787766456604004, "global_step": 146233, "epoch": 3481} {"train_loss": -6.845067024230957, "global_step": 146234, "epoch": 3481} {"train_loss": -6.726601600646973, "global_step": 146235, "epoch": 3481} {"train_loss": -6.784592151641846, "global_step": 146236, "epoch": 3481} {"train_loss": -6.729530334472656, "global_step": 146237, "epoch": 3481} {"train_loss": -6.754242420196533, "global_step": 146238, "epoch": 3481} {"train_loss": -6.850729942321777, "global_step": 146239, "epoch": 3481} {"train_loss": -6.732149600982666, "global_step": 146240, "epoch": 3481} {"train_loss": -6.6113386154174805, "global_step": 146241, "epoch": 3481} {"train_loss": -6.66967248916626, "global_step": 146242, "epoch": 3481} {"train_loss": -6.775992643265497, "global_step": 146243, "epoch": 3481, "val_loss": 68330.484375} {"train_loss": -6.592104434967041, "global_step": 146244, "epoch": 3482} {"train_loss": -6.767816543579102, "global_step": 146245, "epoch": 3482} {"train_loss": -6.701803684234619, "global_step": 146246, "epoch": 3482} {"train_loss": -6.689648151397705, "global_step": 146247, "epoch": 3482} {"train_loss": -6.729522228240967, "global_step": 146248, "epoch": 3482} {"train_loss": -6.789012908935547, "global_step": 146249, "epoch": 3482} {"train_loss": -6.786017894744873, "global_step": 146250, "epoch": 3482} {"train_loss": -6.7686567306518555, "global_step": 146251, "epoch": 3482} {"train_loss": -6.742999076843262, "global_step": 146252, "epoch": 3482} {"train_loss": -6.560672760009766, "global_step": 146253, "epoch": 3482} {"train_loss": -6.719900131225586, "global_step": 146254, "epoch": 3482} {"train_loss": -6.801529884338379, "global_step": 146255, "epoch": 3482} {"train_loss": -6.69321346282959, "global_step": 146256, "epoch": 3482} {"train_loss": -6.594884872436523, "global_step": 146257, "epoch": 3482} {"train_loss": -6.741477012634277, "global_step": 146258, "epoch": 3482} {"train_loss": -6.836512565612793, "global_step": 146259, "epoch": 3482} {"train_loss": -6.706945419311523, "global_step": 146260, "epoch": 3482} {"train_loss": -6.740571022033691, "global_step": 146261, "epoch": 3482} {"train_loss": -6.755571365356445, "global_step": 146262, "epoch": 3482} {"train_loss": -6.702844619750977, "global_step": 146263, "epoch": 3482} {"train_loss": -6.642126083374023, "global_step": 146264, "epoch": 3482} {"train_loss": -6.829500198364258, "global_step": 146265, "epoch": 3482} {"train_loss": -6.793558120727539, "global_step": 146266, "epoch": 3482} {"train_loss": -6.891916275024414, "global_step": 146267, "epoch": 3482} {"train_loss": -6.74072265625, "global_step": 146268, "epoch": 3482} {"train_loss": -6.692324638366699, "global_step": 146269, "epoch": 3482} {"train_loss": -6.88092041015625, "global_step": 146270, "epoch": 3482} {"train_loss": -6.680161476135254, "global_step": 146271, "epoch": 3482} {"train_loss": -6.736207962036133, "global_step": 146272, "epoch": 3482} {"train_loss": -6.727604389190674, "global_step": 146273, "epoch": 3482} {"train_loss": -6.775380611419678, "global_step": 146274, "epoch": 3482} {"train_loss": -6.8450703620910645, "global_step": 146275, "epoch": 3482} {"train_loss": -6.786416053771973, "global_step": 146276, "epoch": 3482} {"train_loss": -6.857083320617676, "global_step": 146277, "epoch": 3482} {"train_loss": -6.831839084625244, "global_step": 146278, "epoch": 3482} {"train_loss": -6.915950298309326, "global_step": 146279, "epoch": 3482} {"train_loss": -6.704578399658203, "global_step": 146280, "epoch": 3482} {"train_loss": -6.800324440002441, "global_step": 146281, "epoch": 3482} {"train_loss": -6.787697792053223, "global_step": 146282, "epoch": 3482} {"train_loss": -6.734526634216309, "global_step": 146283, "epoch": 3482} {"train_loss": -6.58774995803833, "global_step": 146284, "epoch": 3482} {"train_loss": -6.746558564049857, "global_step": 146285, "epoch": 3482, "val_loss": 68456.0234375} {"train_loss": -6.791820526123047, "global_step": 146286, "epoch": 3483} {"train_loss": -6.458438396453857, "global_step": 146287, "epoch": 3483} {"train_loss": -6.635285377502441, "global_step": 146288, "epoch": 3483} {"train_loss": -6.697772026062012, "global_step": 146289, "epoch": 3483} {"train_loss": -6.567516326904297, "global_step": 146290, "epoch": 3483} {"train_loss": -6.656010627746582, "global_step": 146291, "epoch": 3483} {"train_loss": -6.670140266418457, "global_step": 146292, "epoch": 3483} {"train_loss": -6.50330924987793, "global_step": 146293, "epoch": 3483} {"train_loss": -6.6146345138549805, "global_step": 146294, "epoch": 3483} {"train_loss": -6.684579849243164, "global_step": 146295, "epoch": 3483} {"train_loss": -6.7065277099609375, "global_step": 146296, "epoch": 3483} {"train_loss": -6.5281877517700195, "global_step": 146297, "epoch": 3483} {"train_loss": -6.666470527648926, "global_step": 146298, "epoch": 3483} {"train_loss": -6.694882392883301, "global_step": 146299, "epoch": 3483} {"train_loss": -6.7380900382995605, "global_step": 146300, "epoch": 3483} {"train_loss": -6.640275955200195, "global_step": 146301, "epoch": 3483} {"train_loss": -6.709007263183594, "global_step": 146302, "epoch": 3483} {"train_loss": -6.708744049072266, "global_step": 146303, "epoch": 3483} {"train_loss": -6.637023448944092, "global_step": 146304, "epoch": 3483} {"train_loss": -6.721529006958008, "global_step": 146305, "epoch": 3483} {"train_loss": -6.772012710571289, "global_step": 146306, "epoch": 3483} {"train_loss": -6.778468132019043, "global_step": 146307, "epoch": 3483} {"train_loss": -6.757911205291748, "global_step": 146308, "epoch": 3483} {"train_loss": -6.768519878387451, "global_step": 146309, "epoch": 3483} {"train_loss": -6.798248291015625, "global_step": 146310, "epoch": 3483} {"train_loss": -6.753264904022217, "global_step": 146311, "epoch": 3483} {"train_loss": -6.712100982666016, "global_step": 146312, "epoch": 3483} {"train_loss": -6.736371040344238, "global_step": 146313, "epoch": 3483} {"train_loss": -6.823970794677734, "global_step": 146314, "epoch": 3483} {"train_loss": -6.6523518562316895, "global_step": 146315, "epoch": 3483} {"train_loss": -6.864701271057129, "global_step": 146316, "epoch": 3483} {"train_loss": -6.888062953948975, "global_step": 146317, "epoch": 3483} {"train_loss": -6.832033157348633, "global_step": 146318, "epoch": 3483} {"train_loss": -6.708539962768555, "global_step": 146319, "epoch": 3483} {"train_loss": -6.663895606994629, "global_step": 146320, "epoch": 3483} {"train_loss": -6.84405517578125, "global_step": 146321, "epoch": 3483} {"train_loss": -6.705070495605469, "global_step": 146322, "epoch": 3483} {"train_loss": -6.73214864730835, "global_step": 146323, "epoch": 3483} {"train_loss": -6.870184898376465, "global_step": 146324, "epoch": 3483} {"train_loss": -6.593425750732422, "global_step": 146325, "epoch": 3483} {"train_loss": -6.71558952331543, "global_step": 146326, "epoch": 3483} {"train_loss": -6.70718731198992, "global_step": 146327, "epoch": 3483, "val_loss": 68523.6875} {"train_loss": -6.614118576049805, "global_step": 146328, "epoch": 3484} {"train_loss": -6.776444911956787, "global_step": 146329, "epoch": 3484} {"train_loss": -6.601944923400879, "global_step": 146330, "epoch": 3484} {"train_loss": -6.72354793548584, "global_step": 146331, "epoch": 3484} {"train_loss": -6.681374549865723, "global_step": 146332, "epoch": 3484} {"train_loss": -6.714253902435303, "global_step": 146333, "epoch": 3484} {"train_loss": -6.702362537384033, "global_step": 146334, "epoch": 3484} {"train_loss": -6.59225606918335, "global_step": 146335, "epoch": 3484} {"train_loss": -6.799808979034424, "global_step": 146336, "epoch": 3484} {"train_loss": -6.807281494140625, "global_step": 146337, "epoch": 3484} {"train_loss": -6.713240623474121, "global_step": 146338, "epoch": 3484} {"train_loss": -6.7490620613098145, "global_step": 146339, "epoch": 3484} {"train_loss": -6.678211212158203, "global_step": 146340, "epoch": 3484} {"train_loss": -6.804991722106934, "global_step": 146341, "epoch": 3484} {"train_loss": -6.738480567932129, "global_step": 146342, "epoch": 3484} {"train_loss": -6.7285475730896, "global_step": 146343, "epoch": 3484} {"train_loss": -6.784749984741211, "global_step": 146344, "epoch": 3484} {"train_loss": -6.8340678215026855, "global_step": 146345, "epoch": 3484} {"train_loss": -6.756195545196533, "global_step": 146346, "epoch": 3484} {"train_loss": -6.839649200439453, "global_step": 146347, "epoch": 3484} {"train_loss": -6.764553546905518, "global_step": 146348, "epoch": 3484} {"train_loss": -6.835301399230957, "global_step": 146349, "epoch": 3484} {"train_loss": -6.728588104248047, "global_step": 146350, "epoch": 3484} {"train_loss": -6.644329071044922, "global_step": 146351, "epoch": 3484} {"train_loss": -6.8249735832214355, "global_step": 146352, "epoch": 3484} {"train_loss": -6.805996894836426, "global_step": 146353, "epoch": 3484} {"train_loss": -6.8033342361450195, "global_step": 146354, "epoch": 3484} {"train_loss": -6.795275688171387, "global_step": 146355, "epoch": 3484} {"train_loss": -6.798586845397949, "global_step": 146356, "epoch": 3484} {"train_loss": -6.787426471710205, "global_step": 146357, "epoch": 3484} {"train_loss": -6.736173152923584, "global_step": 146358, "epoch": 3484} {"train_loss": -6.770883560180664, "global_step": 146359, "epoch": 3484} {"train_loss": -6.721759796142578, "global_step": 146360, "epoch": 3484} {"train_loss": -6.70075798034668, "global_step": 146361, "epoch": 3484} {"train_loss": -6.837614059448242, "global_step": 146362, "epoch": 3484} {"train_loss": -6.740468978881836, "global_step": 146363, "epoch": 3484} {"train_loss": -6.847710609436035, "global_step": 146364, "epoch": 3484} {"train_loss": -6.819219589233398, "global_step": 146365, "epoch": 3484} {"train_loss": -6.775116920471191, "global_step": 146366, "epoch": 3484} {"train_loss": -6.8997931480407715, "global_step": 146367, "epoch": 3484} {"train_loss": -6.76242208480835, "global_step": 146368, "epoch": 3484} {"train_loss": -6.7567593937828425, "global_step": 146369, "epoch": 3484, "val_loss": 68281.8203125} {"train_loss": -6.894889831542969, "global_step": 146370, "epoch": 3485} {"train_loss": -6.844862937927246, "global_step": 146371, "epoch": 3485} {"train_loss": -6.858925819396973, "global_step": 146372, "epoch": 3485} {"train_loss": -6.8186726570129395, "global_step": 146373, "epoch": 3485} {"train_loss": -6.77891731262207, "global_step": 146374, "epoch": 3485} {"train_loss": -6.863964557647705, "global_step": 146375, "epoch": 3485} {"train_loss": -6.739787578582764, "global_step": 146376, "epoch": 3485} {"train_loss": -6.68300724029541, "global_step": 146377, "epoch": 3485} {"train_loss": -6.753487586975098, "global_step": 146378, "epoch": 3485} {"train_loss": -6.8119096755981445, "global_step": 146379, "epoch": 3485} {"train_loss": -6.899786949157715, "global_step": 146380, "epoch": 3485} {"train_loss": -6.70656156539917, "global_step": 146381, "epoch": 3485} {"train_loss": -6.856497764587402, "global_step": 146382, "epoch": 3485} {"train_loss": -6.69505500793457, "global_step": 146383, "epoch": 3485} {"train_loss": -6.770323753356934, "global_step": 146384, "epoch": 3485} {"train_loss": -6.7740325927734375, "global_step": 146385, "epoch": 3485} {"train_loss": -6.802718162536621, "global_step": 146386, "epoch": 3485} {"train_loss": -6.863554954528809, "global_step": 146387, "epoch": 3485} {"train_loss": -6.823047637939453, "global_step": 146388, "epoch": 3485} {"train_loss": -6.869114398956299, "global_step": 146389, "epoch": 3485} {"train_loss": -6.849560737609863, "global_step": 146390, "epoch": 3485} {"train_loss": -6.875527858734131, "global_step": 146391, "epoch": 3485} {"train_loss": -6.78259801864624, "global_step": 146392, "epoch": 3485} {"train_loss": -6.731349945068359, "global_step": 146393, "epoch": 3485} {"train_loss": -6.768767356872559, "global_step": 146394, "epoch": 3485} {"train_loss": -6.899509429931641, "global_step": 146395, "epoch": 3485} {"train_loss": -6.894550800323486, "global_step": 146396, "epoch": 3485} {"train_loss": -6.742262840270996, "global_step": 146397, "epoch": 3485} {"train_loss": -6.85852575302124, "global_step": 146398, "epoch": 3485} {"train_loss": -6.908168315887451, "global_step": 146399, "epoch": 3485} {"train_loss": -6.76633358001709, "global_step": 146400, "epoch": 3485} {"train_loss": -6.827366828918457, "global_step": 146401, "epoch": 3485} {"train_loss": -6.787503719329834, "global_step": 146402, "epoch": 3485} {"train_loss": -6.826415538787842, "global_step": 146403, "epoch": 3485} {"train_loss": -6.892955303192139, "global_step": 146404, "epoch": 3485} {"train_loss": -6.917651176452637, "global_step": 146405, "epoch": 3485} {"train_loss": -6.586146354675293, "global_step": 146406, "epoch": 3485} {"train_loss": -6.828936576843262, "global_step": 146407, "epoch": 3485} {"train_loss": -6.820382595062256, "global_step": 146408, "epoch": 3485} {"train_loss": -6.787314414978027, "global_step": 146409, "epoch": 3485} {"train_loss": -6.7812604904174805, "global_step": 146410, "epoch": 3485} {"train_loss": -6.81043096951076, "global_step": 146411, "epoch": 3485, "val_loss": 68477.2734375} {"train_loss": -6.731113910675049, "global_step": 146412, "epoch": 3486} {"train_loss": -6.791675090789795, "global_step": 146413, "epoch": 3486} {"train_loss": -6.767045974731445, "global_step": 146414, "epoch": 3486} {"train_loss": -6.904202461242676, "global_step": 146415, "epoch": 3486} {"train_loss": -6.826003074645996, "global_step": 146416, "epoch": 3486} {"train_loss": -6.799793720245361, "global_step": 146417, "epoch": 3486} {"train_loss": -6.838710784912109, "global_step": 146418, "epoch": 3486} {"train_loss": -6.77069091796875, "global_step": 146419, "epoch": 3486} {"train_loss": -6.826183795928955, "global_step": 146420, "epoch": 3486} {"train_loss": -6.747744560241699, "global_step": 146421, "epoch": 3486} {"train_loss": -6.824167251586914, "global_step": 146422, "epoch": 3486} {"train_loss": -6.790539264678955, "global_step": 146423, "epoch": 3486} {"train_loss": -6.706306457519531, "global_step": 146424, "epoch": 3486} {"train_loss": -6.775966644287109, "global_step": 146425, "epoch": 3486} {"train_loss": -6.810491561889648, "global_step": 146426, "epoch": 3486} {"train_loss": -6.7510294914245605, "global_step": 146427, "epoch": 3486} {"train_loss": -6.7377471923828125, "global_step": 146428, "epoch": 3486} {"train_loss": -6.841376304626465, "global_step": 146429, "epoch": 3486} {"train_loss": -6.846008777618408, "global_step": 146430, "epoch": 3486} {"train_loss": -6.786643028259277, "global_step": 146431, "epoch": 3486} {"train_loss": -6.84888219833374, "global_step": 146432, "epoch": 3486} {"train_loss": -6.8002777099609375, "global_step": 146433, "epoch": 3486} {"train_loss": -6.692368507385254, "global_step": 146434, "epoch": 3486} {"train_loss": -6.749885559082031, "global_step": 146435, "epoch": 3486} {"train_loss": -6.766324996948242, "global_step": 146436, "epoch": 3486} {"train_loss": -6.792100429534912, "global_step": 146437, "epoch": 3486} {"train_loss": -6.894458770751953, "global_step": 146438, "epoch": 3486} {"train_loss": -6.745487213134766, "global_step": 146439, "epoch": 3486} {"train_loss": -6.760134696960449, "global_step": 146440, "epoch": 3486} {"train_loss": -6.784517765045166, "global_step": 146441, "epoch": 3486} {"train_loss": -6.729830265045166, "global_step": 146442, "epoch": 3486} {"train_loss": -6.643885612487793, "global_step": 146443, "epoch": 3486} {"train_loss": -6.6925859451293945, "global_step": 146444, "epoch": 3486} {"train_loss": -6.706806659698486, "global_step": 146445, "epoch": 3486} {"train_loss": -6.583773136138916, "global_step": 146446, "epoch": 3486} {"train_loss": -6.73465633392334, "global_step": 146447, "epoch": 3486} {"train_loss": -6.743638038635254, "global_step": 146448, "epoch": 3486} {"train_loss": -6.693515777587891, "global_step": 146449, "epoch": 3486} {"train_loss": -6.895097732543945, "global_step": 146450, "epoch": 3486} {"train_loss": -6.796041965484619, "global_step": 146451, "epoch": 3486} {"train_loss": -6.690250873565674, "global_step": 146452, "epoch": 3486} {"train_loss": -6.769354547773089, "global_step": 146453, "epoch": 3486, "val_loss": 68628.171875} {"train_loss": -6.723671913146973, "global_step": 146454, "epoch": 3487} {"train_loss": -6.789011478424072, "global_step": 146455, "epoch": 3487} {"train_loss": -6.748101234436035, "global_step": 146456, "epoch": 3487} {"train_loss": -6.782840728759766, "global_step": 146457, "epoch": 3487} {"train_loss": -6.708451271057129, "global_step": 146458, "epoch": 3487} {"train_loss": -6.802687644958496, "global_step": 146459, "epoch": 3487} {"train_loss": -6.740079402923584, "global_step": 146460, "epoch": 3487} {"train_loss": -6.816093444824219, "global_step": 146461, "epoch": 3487} {"train_loss": -6.759575843811035, "global_step": 146462, "epoch": 3487} {"train_loss": -6.706741809844971, "global_step": 146463, "epoch": 3487} {"train_loss": -6.673863887786865, "global_step": 146464, "epoch": 3487} {"train_loss": -6.710419654846191, "global_step": 146465, "epoch": 3487} {"train_loss": -6.83490514755249, "global_step": 146466, "epoch": 3487} {"train_loss": -6.7412943840026855, "global_step": 146467, "epoch": 3487} {"train_loss": -6.644198894500732, "global_step": 146468, "epoch": 3487} {"train_loss": -6.720048427581787, "global_step": 146469, "epoch": 3487} {"train_loss": -6.6397809982299805, "global_step": 146470, "epoch": 3487} {"train_loss": -6.658408164978027, "global_step": 146471, "epoch": 3487} {"train_loss": -6.891690254211426, "global_step": 146472, "epoch": 3487} {"train_loss": -6.76563024520874, "global_step": 146473, "epoch": 3487} {"train_loss": -6.73158073425293, "global_step": 146474, "epoch": 3487} {"train_loss": -6.664540767669678, "global_step": 146475, "epoch": 3487} {"train_loss": -6.762689590454102, "global_step": 146476, "epoch": 3487} {"train_loss": -6.809362411499023, "global_step": 146477, "epoch": 3487} {"train_loss": -6.748992919921875, "global_step": 146478, "epoch": 3487} {"train_loss": -6.8726911544799805, "global_step": 146479, "epoch": 3487} {"train_loss": -6.776605606079102, "global_step": 146480, "epoch": 3487} {"train_loss": -6.696408748626709, "global_step": 146481, "epoch": 3487} {"train_loss": -6.625648021697998, "global_step": 146482, "epoch": 3487} {"train_loss": -6.716787815093994, "global_step": 146483, "epoch": 3487} {"train_loss": -6.746393203735352, "global_step": 146484, "epoch": 3487} {"train_loss": -6.779362201690674, "global_step": 146485, "epoch": 3487} {"train_loss": -6.841165542602539, "global_step": 146486, "epoch": 3487} {"train_loss": -6.818631172180176, "global_step": 146487, "epoch": 3487} {"train_loss": -6.805207252502441, "global_step": 146488, "epoch": 3487} {"train_loss": -6.700780868530273, "global_step": 146489, "epoch": 3487} {"train_loss": -6.815591812133789, "global_step": 146490, "epoch": 3487} {"train_loss": -6.799415588378906, "global_step": 146491, "epoch": 3487} {"train_loss": -6.859711170196533, "global_step": 146492, "epoch": 3487} {"train_loss": -6.77020263671875, "global_step": 146493, "epoch": 3487} {"train_loss": -6.796606063842773, "global_step": 146494, "epoch": 3487} {"train_loss": -6.757708118075416, "global_step": 146495, "epoch": 3487, "val_loss": 68414.109375} {"train_loss": -6.792285919189453, "global_step": 146496, "epoch": 3488} {"train_loss": -6.909995079040527, "global_step": 146497, "epoch": 3488} {"train_loss": -6.744172096252441, "global_step": 146498, "epoch": 3488} {"train_loss": -6.829798698425293, "global_step": 146499, "epoch": 3488} {"train_loss": -6.794897079467773, "global_step": 146500, "epoch": 3488} {"train_loss": -6.815971374511719, "global_step": 146501, "epoch": 3488} {"train_loss": -6.82366418838501, "global_step": 146502, "epoch": 3488} {"train_loss": -6.871457099914551, "global_step": 146503, "epoch": 3488} {"train_loss": -6.806053638458252, "global_step": 146504, "epoch": 3488} {"train_loss": -6.791734218597412, "global_step": 146505, "epoch": 3488} {"train_loss": -6.8115153312683105, "global_step": 146506, "epoch": 3488} {"train_loss": -6.8127055168151855, "global_step": 146507, "epoch": 3488} {"train_loss": -6.809318542480469, "global_step": 146508, "epoch": 3488} {"train_loss": -6.853644847869873, "global_step": 146509, "epoch": 3488} {"train_loss": -6.792407035827637, "global_step": 146510, "epoch": 3488} {"train_loss": -6.797488212585449, "global_step": 146511, "epoch": 3488} {"train_loss": -6.80942440032959, "global_step": 146512, "epoch": 3488} {"train_loss": -6.889573097229004, "global_step": 146513, "epoch": 3488} {"train_loss": -6.699383735656738, "global_step": 146514, "epoch": 3488} {"train_loss": -6.754602909088135, "global_step": 146515, "epoch": 3488} {"train_loss": -6.78596305847168, "global_step": 146516, "epoch": 3488} {"train_loss": -6.79288387298584, "global_step": 146517, "epoch": 3488} {"train_loss": -6.8258185386657715, "global_step": 146518, "epoch": 3488} {"train_loss": -6.806928634643555, "global_step": 146519, "epoch": 3488} {"train_loss": -6.7527642250061035, "global_step": 146520, "epoch": 3488} {"train_loss": -6.837011337280273, "global_step": 146521, "epoch": 3488} {"train_loss": -6.825479507446289, "global_step": 146522, "epoch": 3488} {"train_loss": -6.871699810028076, "global_step": 146523, "epoch": 3488} {"train_loss": -6.861581802368164, "global_step": 146524, "epoch": 3488} {"train_loss": -6.773454666137695, "global_step": 146525, "epoch": 3488} {"train_loss": -6.708235740661621, "global_step": 146526, "epoch": 3488} {"train_loss": -6.812589168548584, "global_step": 146527, "epoch": 3488} {"train_loss": -6.853087425231934, "global_step": 146528, "epoch": 3488} {"train_loss": -6.794863700866699, "global_step": 146529, "epoch": 3488} {"train_loss": -6.8319172859191895, "global_step": 146530, "epoch": 3488} {"train_loss": -6.812020301818848, "global_step": 146531, "epoch": 3488} {"train_loss": -6.514770984649658, "global_step": 146532, "epoch": 3488} {"train_loss": -6.76171875, "global_step": 146533, "epoch": 3488} {"train_loss": -6.5617194175720215, "global_step": 146534, "epoch": 3488} {"train_loss": -6.483185768127441, "global_step": 146535, "epoch": 3488} {"train_loss": -6.735476016998291, "global_step": 146536, "epoch": 3488} {"train_loss": -6.778123980476742, "global_step": 146537, "epoch": 3488, "val_loss": 68406.5859375} {"train_loss": -6.693065643310547, "global_step": 146538, "epoch": 3489} {"train_loss": -6.696958541870117, "global_step": 146539, "epoch": 3489} {"train_loss": -6.690832614898682, "global_step": 146540, "epoch": 3489} {"train_loss": -6.662297248840332, "global_step": 146541, "epoch": 3489} {"train_loss": -6.586953163146973, "global_step": 146542, "epoch": 3489} {"train_loss": -6.664955139160156, "global_step": 146543, "epoch": 3489} {"train_loss": -6.701315402984619, "global_step": 146544, "epoch": 3489} {"train_loss": -6.673766613006592, "global_step": 146545, "epoch": 3489} {"train_loss": -6.678132057189941, "global_step": 146546, "epoch": 3489} {"train_loss": -6.705898761749268, "global_step": 146547, "epoch": 3489} {"train_loss": -6.694331169128418, "global_step": 146548, "epoch": 3489} {"train_loss": -6.711113929748535, "global_step": 146549, "epoch": 3489} {"train_loss": -6.748539924621582, "global_step": 146550, "epoch": 3489} {"train_loss": -6.735251426696777, "global_step": 146551, "epoch": 3489} {"train_loss": -6.686226844787598, "global_step": 146552, "epoch": 3489} {"train_loss": -6.765100002288818, "global_step": 146553, "epoch": 3489} {"train_loss": -6.647580146789551, "global_step": 146554, "epoch": 3489} {"train_loss": -6.7010626792907715, "global_step": 146555, "epoch": 3489} {"train_loss": -6.720508575439453, "global_step": 146556, "epoch": 3489} {"train_loss": -6.7790117263793945, "global_step": 146557, "epoch": 3489} {"train_loss": -6.734269142150879, "global_step": 146558, "epoch": 3489} {"train_loss": -6.733050346374512, "global_step": 146559, "epoch": 3489} {"train_loss": -6.609064102172852, "global_step": 146560, "epoch": 3489} {"train_loss": -6.628346920013428, "global_step": 146561, "epoch": 3489} {"train_loss": -6.706596374511719, "global_step": 146562, "epoch": 3489} {"train_loss": -6.700632095336914, "global_step": 146563, "epoch": 3489} {"train_loss": -6.842979431152344, "global_step": 146564, "epoch": 3489} {"train_loss": -6.755771636962891, "global_step": 146565, "epoch": 3489} {"train_loss": -6.796838760375977, "global_step": 146566, "epoch": 3489} {"train_loss": -6.645224571228027, "global_step": 146567, "epoch": 3489} {"train_loss": -6.714524269104004, "global_step": 146568, "epoch": 3489} {"train_loss": -6.781756401062012, "global_step": 146569, "epoch": 3489} {"train_loss": -6.605658531188965, "global_step": 146570, "epoch": 3489} {"train_loss": -6.745382785797119, "global_step": 146571, "epoch": 3489} {"train_loss": -6.718326568603516, "global_step": 146572, "epoch": 3489} {"train_loss": -6.574893474578857, "global_step": 146573, "epoch": 3489} {"train_loss": -6.693850040435791, "global_step": 146574, "epoch": 3489} {"train_loss": -6.6134724617004395, "global_step": 146575, "epoch": 3489} {"train_loss": -6.714844703674316, "global_step": 146576, "epoch": 3489} {"train_loss": -6.716724395751953, "global_step": 146577, "epoch": 3489} {"train_loss": -6.673482894897461, "global_step": 146578, "epoch": 3489} {"train_loss": -6.699467307045346, "global_step": 146579, "epoch": 3489, "val_loss": 68440.1328125} {"train_loss": -6.707040309906006, "global_step": 146580, "epoch": 3490} {"train_loss": -6.8221330642700195, "global_step": 146581, "epoch": 3490} {"train_loss": -6.76807165145874, "global_step": 146582, "epoch": 3490} {"train_loss": -6.853407859802246, "global_step": 146583, "epoch": 3490} {"train_loss": -6.685594081878662, "global_step": 146584, "epoch": 3490} {"train_loss": -6.752678871154785, "global_step": 146585, "epoch": 3490} {"train_loss": -6.706760406494141, "global_step": 146586, "epoch": 3490} {"train_loss": -6.735367774963379, "global_step": 146587, "epoch": 3490} {"train_loss": -6.701381683349609, "global_step": 146588, "epoch": 3490} {"train_loss": -6.7230916023254395, "global_step": 146589, "epoch": 3490} {"train_loss": -6.779441833496094, "global_step": 146590, "epoch": 3490} {"train_loss": -6.6761250495910645, "global_step": 146591, "epoch": 3490} {"train_loss": -6.756203651428223, "global_step": 146592, "epoch": 3490} {"train_loss": -6.6820292472839355, "global_step": 146593, "epoch": 3490} {"train_loss": -6.698404312133789, "global_step": 146594, "epoch": 3490} {"train_loss": -6.701992034912109, "global_step": 146595, "epoch": 3490} {"train_loss": -6.787406921386719, "global_step": 146596, "epoch": 3490} {"train_loss": -6.7803120613098145, "global_step": 146597, "epoch": 3490} {"train_loss": -6.695949554443359, "global_step": 146598, "epoch": 3490} {"train_loss": -6.728598117828369, "global_step": 146599, "epoch": 3490} {"train_loss": -6.772378444671631, "global_step": 146600, "epoch": 3490} {"train_loss": -6.726037979125977, "global_step": 146601, "epoch": 3490} {"train_loss": -6.740453720092773, "global_step": 146602, "epoch": 3490} {"train_loss": -6.7867817878723145, "global_step": 146603, "epoch": 3490} {"train_loss": -6.823836803436279, "global_step": 146604, "epoch": 3490} {"train_loss": -6.88640022277832, "global_step": 146605, "epoch": 3490} {"train_loss": -6.811809539794922, "global_step": 146606, "epoch": 3490} {"train_loss": -6.841546535491943, "global_step": 146607, "epoch": 3490} {"train_loss": -6.830193519592285, "global_step": 146608, "epoch": 3490} {"train_loss": -6.645437717437744, "global_step": 146609, "epoch": 3490} {"train_loss": -6.743906021118164, "global_step": 146610, "epoch": 3490} {"train_loss": -6.666060447692871, "global_step": 146611, "epoch": 3490} {"train_loss": -6.807474136352539, "global_step": 146612, "epoch": 3490} {"train_loss": -6.848372936248779, "global_step": 146613, "epoch": 3490} {"train_loss": -6.843050003051758, "global_step": 146614, "epoch": 3490} {"train_loss": -6.715663909912109, "global_step": 146615, "epoch": 3490} {"train_loss": -6.7602386474609375, "global_step": 146616, "epoch": 3490} {"train_loss": -6.739521503448486, "global_step": 146617, "epoch": 3490} {"train_loss": -6.633388042449951, "global_step": 146618, "epoch": 3490} {"train_loss": -6.784613609313965, "global_step": 146619, "epoch": 3490} {"train_loss": -6.8051605224609375, "global_step": 146620, "epoch": 3490} {"train_loss": -6.753741752533686, "global_step": 146621, "epoch": 3490, "val_loss": 68339.3125} {"train_loss": -6.91370153427124, "global_step": 146622, "epoch": 3491} {"train_loss": -6.594112396240234, "global_step": 146623, "epoch": 3491} {"train_loss": -6.737609386444092, "global_step": 146624, "epoch": 3491} {"train_loss": -6.822927474975586, "global_step": 146625, "epoch": 3491} {"train_loss": -6.710464000701904, "global_step": 146626, "epoch": 3491} {"train_loss": -6.812470436096191, "global_step": 146627, "epoch": 3491} {"train_loss": -6.713313102722168, "global_step": 146628, "epoch": 3491} {"train_loss": -6.767410755157471, "global_step": 146629, "epoch": 3491} {"train_loss": -6.774140357971191, "global_step": 146630, "epoch": 3491} {"train_loss": -6.792900562286377, "global_step": 146631, "epoch": 3491} {"train_loss": -6.85487699508667, "global_step": 146632, "epoch": 3491} {"train_loss": -6.830732345581055, "global_step": 146633, "epoch": 3491} {"train_loss": -6.714905738830566, "global_step": 146634, "epoch": 3491} {"train_loss": -6.810462951660156, "global_step": 146635, "epoch": 3491} {"train_loss": -6.855123996734619, "global_step": 146636, "epoch": 3491} {"train_loss": -6.69880485534668, "global_step": 146637, "epoch": 3491} {"train_loss": -6.825531959533691, "global_step": 146638, "epoch": 3491} {"train_loss": -6.797430515289307, "global_step": 146639, "epoch": 3491} {"train_loss": -6.77421760559082, "global_step": 146640, "epoch": 3491} {"train_loss": -6.851656436920166, "global_step": 146641, "epoch": 3491} {"train_loss": -6.799310684204102, "global_step": 146642, "epoch": 3491} {"train_loss": -6.787047386169434, "global_step": 146643, "epoch": 3491} {"train_loss": -6.862618446350098, "global_step": 146644, "epoch": 3491} {"train_loss": -6.756461143493652, "global_step": 146645, "epoch": 3491} {"train_loss": -6.876860618591309, "global_step": 146646, "epoch": 3491} {"train_loss": -6.924113750457764, "global_step": 146647, "epoch": 3491} {"train_loss": -6.753347396850586, "global_step": 146648, "epoch": 3491} {"train_loss": -6.8610076904296875, "global_step": 146649, "epoch": 3491} {"train_loss": -6.770643711090088, "global_step": 146650, "epoch": 3491} {"train_loss": -6.761806488037109, "global_step": 146651, "epoch": 3491} {"train_loss": -6.920166969299316, "global_step": 146652, "epoch": 3491} {"train_loss": -6.758349418640137, "global_step": 146653, "epoch": 3491} {"train_loss": -6.875514030456543, "global_step": 146654, "epoch": 3491} {"train_loss": -6.907085418701172, "global_step": 146655, "epoch": 3491} {"train_loss": -6.877824306488037, "global_step": 146656, "epoch": 3491} {"train_loss": -6.826092720031738, "global_step": 146657, "epoch": 3491} {"train_loss": -6.814809322357178, "global_step": 146658, "epoch": 3491} {"train_loss": -6.852568626403809, "global_step": 146659, "epoch": 3491} {"train_loss": -6.8601975440979, "global_step": 146660, "epoch": 3491} {"train_loss": -6.8517632484436035, "global_step": 146661, "epoch": 3491} {"train_loss": -6.78053092956543, "global_step": 146662, "epoch": 3491} {"train_loss": -6.806455260231381, "global_step": 146663, "epoch": 3491, "val_loss": 68288.125} {"train_loss": -6.879079818725586, "global_step": 146664, "epoch": 3492} {"train_loss": -6.891693592071533, "global_step": 146665, "epoch": 3492} {"train_loss": -6.752711772918701, "global_step": 146666, "epoch": 3492} {"train_loss": -6.7454833984375, "global_step": 146667, "epoch": 3492} {"train_loss": -6.761569976806641, "global_step": 146668, "epoch": 3492} {"train_loss": -6.845867156982422, "global_step": 146669, "epoch": 3492} {"train_loss": -6.842898368835449, "global_step": 146670, "epoch": 3492} {"train_loss": -6.737051010131836, "global_step": 146671, "epoch": 3492} {"train_loss": -6.887986183166504, "global_step": 146672, "epoch": 3492} {"train_loss": -6.798308849334717, "global_step": 146673, "epoch": 3492} {"train_loss": -6.782479286193848, "global_step": 146674, "epoch": 3492} {"train_loss": -6.819867134094238, "global_step": 146675, "epoch": 3492} {"train_loss": -6.740314483642578, "global_step": 146676, "epoch": 3492} {"train_loss": -6.777996063232422, "global_step": 146677, "epoch": 3492} {"train_loss": -6.818574905395508, "global_step": 146678, "epoch": 3492} {"train_loss": -6.621335029602051, "global_step": 146679, "epoch": 3492} {"train_loss": -6.7355217933654785, "global_step": 146680, "epoch": 3492} {"train_loss": -6.715828895568848, "global_step": 146681, "epoch": 3492} {"train_loss": -6.787328720092773, "global_step": 146682, "epoch": 3492} {"train_loss": -6.8141584396362305, "global_step": 146683, "epoch": 3492} {"train_loss": -6.699237823486328, "global_step": 146684, "epoch": 3492} {"train_loss": -6.792891979217529, "global_step": 146685, "epoch": 3492} {"train_loss": -6.8324995040893555, "global_step": 146686, "epoch": 3492} {"train_loss": -6.761069297790527, "global_step": 146687, "epoch": 3492} {"train_loss": -6.8178486824035645, "global_step": 146688, "epoch": 3492} {"train_loss": -6.796711444854736, "global_step": 146689, "epoch": 3492} {"train_loss": -6.808143138885498, "global_step": 146690, "epoch": 3492} {"train_loss": -6.8982038497924805, "global_step": 146691, "epoch": 3492} {"train_loss": -6.773978233337402, "global_step": 146692, "epoch": 3492} {"train_loss": -6.805551052093506, "global_step": 146693, "epoch": 3492} {"train_loss": -6.6689252853393555, "global_step": 146694, "epoch": 3492} {"train_loss": -6.841945171356201, "global_step": 146695, "epoch": 3492} {"train_loss": -6.778888702392578, "global_step": 146696, "epoch": 3492} {"train_loss": -6.733348369598389, "global_step": 146697, "epoch": 3492} {"train_loss": -6.744019031524658, "global_step": 146698, "epoch": 3492} {"train_loss": -6.7471160888671875, "global_step": 146699, "epoch": 3492} {"train_loss": -6.705599784851074, "global_step": 146700, "epoch": 3492} {"train_loss": -6.760691165924072, "global_step": 146701, "epoch": 3492} {"train_loss": -6.714293479919434, "global_step": 146702, "epoch": 3492} {"train_loss": -6.818408012390137, "global_step": 146703, "epoch": 3492} {"train_loss": -6.66419792175293, "global_step": 146704, "epoch": 3492} {"train_loss": -6.778173878079369, "global_step": 146705, "epoch": 3492, "val_loss": 68335.5859375} {"train_loss": -6.714910507202148, "global_step": 146706, "epoch": 3493} {"train_loss": -6.740013122558594, "global_step": 146707, "epoch": 3493} {"train_loss": -6.868598937988281, "global_step": 146708, "epoch": 3493} {"train_loss": -6.803396224975586, "global_step": 146709, "epoch": 3493} {"train_loss": -6.870973587036133, "global_step": 146710, "epoch": 3493} {"train_loss": -6.758053302764893, "global_step": 146711, "epoch": 3493} {"train_loss": -6.826502799987793, "global_step": 146712, "epoch": 3493} {"train_loss": -6.8106160163879395, "global_step": 146713, "epoch": 3493} {"train_loss": -6.775856018066406, "global_step": 146714, "epoch": 3493} {"train_loss": -6.7599945068359375, "global_step": 146715, "epoch": 3493} {"train_loss": -6.712034225463867, "global_step": 146716, "epoch": 3493} {"train_loss": -6.8423357009887695, "global_step": 146717, "epoch": 3493} {"train_loss": -6.80790901184082, "global_step": 146718, "epoch": 3493} {"train_loss": -6.858062744140625, "global_step": 146719, "epoch": 3493} {"train_loss": -6.785135269165039, "global_step": 146720, "epoch": 3493} {"train_loss": -6.780697822570801, "global_step": 146721, "epoch": 3493} {"train_loss": -6.826723098754883, "global_step": 146722, "epoch": 3493} {"train_loss": -6.809361934661865, "global_step": 146723, "epoch": 3493} {"train_loss": -6.758991241455078, "global_step": 146724, "epoch": 3493} {"train_loss": -6.833097457885742, "global_step": 146725, "epoch": 3493} {"train_loss": -6.898584842681885, "global_step": 146726, "epoch": 3493} {"train_loss": -6.844470977783203, "global_step": 146727, "epoch": 3493} {"train_loss": -6.856630802154541, "global_step": 146728, "epoch": 3493} {"train_loss": -6.7907938957214355, "global_step": 146729, "epoch": 3493} {"train_loss": -6.729884147644043, "global_step": 146730, "epoch": 3493} {"train_loss": -6.726944446563721, "global_step": 146731, "epoch": 3493} {"train_loss": -6.757657527923584, "global_step": 146732, "epoch": 3493} {"train_loss": -6.805385589599609, "global_step": 146733, "epoch": 3493} {"train_loss": -6.794733047485352, "global_step": 146734, "epoch": 3493} {"train_loss": -6.796946048736572, "global_step": 146735, "epoch": 3493} {"train_loss": -6.707863807678223, "global_step": 146736, "epoch": 3493} {"train_loss": -6.799020767211914, "global_step": 146737, "epoch": 3493} {"train_loss": -6.768765926361084, "global_step": 146738, "epoch": 3493} {"train_loss": -6.816440105438232, "global_step": 146739, "epoch": 3493} {"train_loss": -6.765227317810059, "global_step": 146740, "epoch": 3493} {"train_loss": -6.6840667724609375, "global_step": 146741, "epoch": 3493} {"train_loss": -6.720834732055664, "global_step": 146742, "epoch": 3493} {"train_loss": -6.746766090393066, "global_step": 146743, "epoch": 3493} {"train_loss": -6.739837169647217, "global_step": 146744, "epoch": 3493} {"train_loss": -6.774514198303223, "global_step": 146745, "epoch": 3493} {"train_loss": -6.572310447692871, "global_step": 146746, "epoch": 3493} {"train_loss": -6.780556383587065, "global_step": 146747, "epoch": 3493, "val_loss": 68447.2734375} {"train_loss": -6.790523529052734, "global_step": 146748, "epoch": 3494} {"train_loss": -6.759456157684326, "global_step": 146749, "epoch": 3494} {"train_loss": -6.781309127807617, "global_step": 146750, "epoch": 3494} {"train_loss": -6.816819667816162, "global_step": 146751, "epoch": 3494} {"train_loss": -6.833019733428955, "global_step": 146752, "epoch": 3494} {"train_loss": -6.893309593200684, "global_step": 146753, "epoch": 3494} {"train_loss": -6.783283233642578, "global_step": 146754, "epoch": 3494} {"train_loss": -6.751596927642822, "global_step": 146755, "epoch": 3494} {"train_loss": -6.785719871520996, "global_step": 146756, "epoch": 3494} {"train_loss": -6.889871597290039, "global_step": 146757, "epoch": 3494} {"train_loss": -6.834015369415283, "global_step": 146758, "epoch": 3494} {"train_loss": -6.7181620597839355, "global_step": 146759, "epoch": 3494} {"train_loss": -6.645087242126465, "global_step": 146760, "epoch": 3494} {"train_loss": -6.816239356994629, "global_step": 146761, "epoch": 3494} {"train_loss": -6.706901550292969, "global_step": 146762, "epoch": 3494} {"train_loss": -6.752167701721191, "global_step": 146763, "epoch": 3494} {"train_loss": -6.679413795471191, "global_step": 146764, "epoch": 3494} {"train_loss": -6.692120552062988, "global_step": 146765, "epoch": 3494} {"train_loss": -6.813045978546143, "global_step": 146766, "epoch": 3494} {"train_loss": -6.739316463470459, "global_step": 146767, "epoch": 3494} {"train_loss": -6.714915752410889, "global_step": 146768, "epoch": 3494} {"train_loss": -6.6912384033203125, "global_step": 146769, "epoch": 3494} {"train_loss": -6.810681343078613, "global_step": 146770, "epoch": 3494} {"train_loss": -6.7715606689453125, "global_step": 146771, "epoch": 3494} {"train_loss": -6.7739667892456055, "global_step": 146772, "epoch": 3494} {"train_loss": -6.848641395568848, "global_step": 146773, "epoch": 3494} {"train_loss": -6.991753578186035, "global_step": 146774, "epoch": 3494} {"train_loss": -6.773326396942139, "global_step": 146775, "epoch": 3494} {"train_loss": -6.750317096710205, "global_step": 146776, "epoch": 3494} {"train_loss": -6.897391319274902, "global_step": 146777, "epoch": 3494} {"train_loss": -6.79138708114624, "global_step": 146778, "epoch": 3494} {"train_loss": -6.70717191696167, "global_step": 146779, "epoch": 3494} {"train_loss": -6.806992053985596, "global_step": 146780, "epoch": 3494} {"train_loss": -6.845623016357422, "global_step": 146781, "epoch": 3494} {"train_loss": -6.794769287109375, "global_step": 146782, "epoch": 3494} {"train_loss": -6.744065284729004, "global_step": 146783, "epoch": 3494} {"train_loss": -6.783013820648193, "global_step": 146784, "epoch": 3494} {"train_loss": -6.765103816986084, "global_step": 146785, "epoch": 3494} {"train_loss": -6.753826141357422, "global_step": 146786, "epoch": 3494} {"train_loss": -6.668270587921143, "global_step": 146787, "epoch": 3494} {"train_loss": -6.7460832595825195, "global_step": 146788, "epoch": 3494} {"train_loss": -6.77837594350179, "global_step": 146789, "epoch": 3494, "val_loss": 68528.8203125} {"train_loss": -6.752633094787598, "global_step": 146790, "epoch": 3495} {"train_loss": -6.855012893676758, "global_step": 146791, "epoch": 3495} {"train_loss": -6.6941399574279785, "global_step": 146792, "epoch": 3495} {"train_loss": -6.737700462341309, "global_step": 146793, "epoch": 3495} {"train_loss": -6.663212776184082, "global_step": 146794, "epoch": 3495} {"train_loss": -6.69051456451416, "global_step": 146795, "epoch": 3495} {"train_loss": -6.780128002166748, "global_step": 146796, "epoch": 3495} {"train_loss": -6.601250648498535, "global_step": 146797, "epoch": 3495} {"train_loss": -6.597830772399902, "global_step": 146798, "epoch": 3495} {"train_loss": -6.742287635803223, "global_step": 146799, "epoch": 3495} {"train_loss": -6.731926918029785, "global_step": 146800, "epoch": 3495} {"train_loss": -6.703105926513672, "global_step": 146801, "epoch": 3495} {"train_loss": -6.777487754821777, "global_step": 146802, "epoch": 3495} {"train_loss": -6.761262893676758, "global_step": 146803, "epoch": 3495} {"train_loss": -6.865561008453369, "global_step": 146804, "epoch": 3495} {"train_loss": -6.766685485839844, "global_step": 146805, "epoch": 3495} {"train_loss": -6.590084075927734, "global_step": 146806, "epoch": 3495} {"train_loss": -6.836559295654297, "global_step": 146807, "epoch": 3495} {"train_loss": -6.675110340118408, "global_step": 146808, "epoch": 3495} {"train_loss": -6.582742691040039, "global_step": 146809, "epoch": 3495} {"train_loss": -6.725164413452148, "global_step": 146810, "epoch": 3495} {"train_loss": -6.626065254211426, "global_step": 146811, "epoch": 3495} {"train_loss": -6.645074844360352, "global_step": 146812, "epoch": 3495} {"train_loss": -6.58120059967041, "global_step": 146813, "epoch": 3495} {"train_loss": -6.720610618591309, "global_step": 146814, "epoch": 3495} {"train_loss": -6.684170722961426, "global_step": 146815, "epoch": 3495} {"train_loss": -6.810644149780273, "global_step": 146816, "epoch": 3495} {"train_loss": -6.6809000968933105, "global_step": 146817, "epoch": 3495} {"train_loss": -6.661635398864746, "global_step": 146818, "epoch": 3495} {"train_loss": -6.765124797821045, "global_step": 146819, "epoch": 3495} {"train_loss": -6.6845550537109375, "global_step": 146820, "epoch": 3495} {"train_loss": -6.67866325378418, "global_step": 146821, "epoch": 3495} {"train_loss": -6.691018581390381, "global_step": 146822, "epoch": 3495} {"train_loss": -6.663991451263428, "global_step": 146823, "epoch": 3495} {"train_loss": -6.709691047668457, "global_step": 146824, "epoch": 3495} {"train_loss": -6.713628768920898, "global_step": 146825, "epoch": 3495} {"train_loss": -6.6535234451293945, "global_step": 146826, "epoch": 3495} {"train_loss": -6.7194366455078125, "global_step": 146827, "epoch": 3495} {"train_loss": -6.6894683837890625, "global_step": 146828, "epoch": 3495} {"train_loss": -6.517998695373535, "global_step": 146829, "epoch": 3495} {"train_loss": -6.6762800216674805, "global_step": 146830, "epoch": 3495} {"train_loss": -6.698897668293545, "global_step": 146831, "epoch": 3495, "val_loss": 68708.984375} {"train_loss": -6.611793518066406, "global_step": 146832, "epoch": 3496} {"train_loss": -6.6894121170043945, "global_step": 146833, "epoch": 3496} {"train_loss": -6.604379653930664, "global_step": 146834, "epoch": 3496} {"train_loss": -6.697169303894043, "global_step": 146835, "epoch": 3496} {"train_loss": -6.611159324645996, "global_step": 146836, "epoch": 3496} {"train_loss": -6.738960266113281, "global_step": 146837, "epoch": 3496} {"train_loss": -6.628324508666992, "global_step": 146838, "epoch": 3496} {"train_loss": -6.703189849853516, "global_step": 146839, "epoch": 3496} {"train_loss": -6.839146614074707, "global_step": 146840, "epoch": 3496} {"train_loss": -6.709281921386719, "global_step": 146841, "epoch": 3496} {"train_loss": -6.7867326736450195, "global_step": 146842, "epoch": 3496} {"train_loss": -6.6386213302612305, "global_step": 146843, "epoch": 3496} {"train_loss": -6.674161911010742, "global_step": 146844, "epoch": 3496} {"train_loss": -6.6619415283203125, "global_step": 146845, "epoch": 3496} {"train_loss": -6.786359786987305, "global_step": 146846, "epoch": 3496} {"train_loss": -6.577342987060547, "global_step": 146847, "epoch": 3496} {"train_loss": -6.664705276489258, "global_step": 146848, "epoch": 3496} {"train_loss": -6.7810163497924805, "global_step": 146849, "epoch": 3496} {"train_loss": -6.656436443328857, "global_step": 146850, "epoch": 3496} {"train_loss": -6.774741172790527, "global_step": 146851, "epoch": 3496} {"train_loss": -6.721683502197266, "global_step": 146852, "epoch": 3496} {"train_loss": -6.7064995765686035, "global_step": 146853, "epoch": 3496} {"train_loss": -6.732506275177002, "global_step": 146854, "epoch": 3496} {"train_loss": -6.7174296379089355, "global_step": 146855, "epoch": 3496} {"train_loss": -6.749564170837402, "global_step": 146856, "epoch": 3496} {"train_loss": -6.879421234130859, "global_step": 146857, "epoch": 3496} {"train_loss": -6.599036693572998, "global_step": 146858, "epoch": 3496} {"train_loss": -6.819368362426758, "global_step": 146859, "epoch": 3496} {"train_loss": -6.734913349151611, "global_step": 146860, "epoch": 3496} {"train_loss": -6.688365936279297, "global_step": 146861, "epoch": 3496} {"train_loss": -6.817312240600586, "global_step": 146862, "epoch": 3496} {"train_loss": -6.852104187011719, "global_step": 146863, "epoch": 3496} {"train_loss": -6.782332420349121, "global_step": 146864, "epoch": 3496} {"train_loss": -6.799344062805176, "global_step": 146865, "epoch": 3496} {"train_loss": -6.745814323425293, "global_step": 146866, "epoch": 3496} {"train_loss": -6.730764865875244, "global_step": 146867, "epoch": 3496} {"train_loss": -6.789390563964844, "global_step": 146868, "epoch": 3496} {"train_loss": -6.765993118286133, "global_step": 146869, "epoch": 3496} {"train_loss": -6.70330810546875, "global_step": 146870, "epoch": 3496} {"train_loss": -6.8841471672058105, "global_step": 146871, "epoch": 3496} {"train_loss": -6.8037543296813965, "global_step": 146872, "epoch": 3496} {"train_loss": -6.729883784339542, "global_step": 146873, "epoch": 3496, "val_loss": 68399.1640625} {"train_loss": -6.751281261444092, "global_step": 146874, "epoch": 3497} {"train_loss": -6.754127025604248, "global_step": 146875, "epoch": 3497} {"train_loss": -6.707757949829102, "global_step": 146876, "epoch": 3497} {"train_loss": -6.810520172119141, "global_step": 146877, "epoch": 3497} {"train_loss": -6.838921546936035, "global_step": 146878, "epoch": 3497} {"train_loss": -6.9460601806640625, "global_step": 146879, "epoch": 3497} {"train_loss": -6.786991119384766, "global_step": 146880, "epoch": 3497} {"train_loss": -6.94140625, "global_step": 146881, "epoch": 3497} {"train_loss": -7.001437187194824, "global_step": 146882, "epoch": 3497} {"train_loss": -6.961045265197754, "global_step": 146883, "epoch": 3497} {"train_loss": -6.910866737365723, "global_step": 146884, "epoch": 3497} {"train_loss": -6.948163032531738, "global_step": 146885, "epoch": 3497} {"train_loss": -6.937054634094238, "global_step": 146886, "epoch": 3497} {"train_loss": -6.936922073364258, "global_step": 146887, "epoch": 3497} {"train_loss": -6.93215274810791, "global_step": 146888, "epoch": 3497} {"train_loss": -6.7244977951049805, "global_step": 146889, "epoch": 3497} {"train_loss": -6.775726795196533, "global_step": 146890, "epoch": 3497} {"train_loss": -6.791191101074219, "global_step": 146891, "epoch": 3497} {"train_loss": -6.793161392211914, "global_step": 146892, "epoch": 3497} {"train_loss": -6.9708452224731445, "global_step": 146893, "epoch": 3497} {"train_loss": -6.845735549926758, "global_step": 146894, "epoch": 3497} {"train_loss": -6.892849922180176, "global_step": 146895, "epoch": 3497} {"train_loss": -6.879428863525391, "global_step": 146896, "epoch": 3497} {"train_loss": -6.741105079650879, "global_step": 146897, "epoch": 3497} {"train_loss": -6.777807235717773, "global_step": 146898, "epoch": 3497} {"train_loss": -6.882196426391602, "global_step": 146899, "epoch": 3497} {"train_loss": -6.800606727600098, "global_step": 146900, "epoch": 3497} {"train_loss": -6.763180732727051, "global_step": 146901, "epoch": 3497} {"train_loss": -6.928953647613525, "global_step": 146902, "epoch": 3497} {"train_loss": -6.761153697967529, "global_step": 146903, "epoch": 3497} {"train_loss": -6.76707649230957, "global_step": 146904, "epoch": 3497} {"train_loss": -6.841208457946777, "global_step": 146905, "epoch": 3497} {"train_loss": -6.673415184020996, "global_step": 146906, "epoch": 3497} {"train_loss": -6.68529748916626, "global_step": 146907, "epoch": 3497} {"train_loss": -6.78471565246582, "global_step": 146908, "epoch": 3497} {"train_loss": -6.720938682556152, "global_step": 146909, "epoch": 3497} {"train_loss": -6.7350969314575195, "global_step": 146910, "epoch": 3497} {"train_loss": -6.704951286315918, "global_step": 146911, "epoch": 3497} {"train_loss": -6.722621917724609, "global_step": 146912, "epoch": 3497} {"train_loss": -6.698720455169678, "global_step": 146913, "epoch": 3497} {"train_loss": -6.730877876281738, "global_step": 146914, "epoch": 3497} {"train_loss": -6.818210885638282, "global_step": 146915, "epoch": 3497, "val_loss": 68432.296875} {"train_loss": -6.77991247177124, "global_step": 146916, "epoch": 3498} {"train_loss": -6.753493309020996, "global_step": 146917, "epoch": 3498} {"train_loss": -6.777264595031738, "global_step": 146918, "epoch": 3498} {"train_loss": -6.798589706420898, "global_step": 146919, "epoch": 3498} {"train_loss": -6.785432815551758, "global_step": 146920, "epoch": 3498} {"train_loss": -6.810771942138672, "global_step": 146921, "epoch": 3498} {"train_loss": -6.748435020446777, "global_step": 146922, "epoch": 3498} {"train_loss": -6.769659996032715, "global_step": 146923, "epoch": 3498} {"train_loss": -6.732901573181152, "global_step": 146924, "epoch": 3498} {"train_loss": -6.7351975440979, "global_step": 146925, "epoch": 3498} {"train_loss": -6.665441036224365, "global_step": 146926, "epoch": 3498} {"train_loss": -6.717539310455322, "global_step": 146927, "epoch": 3498} {"train_loss": -6.924091339111328, "global_step": 146928, "epoch": 3498} {"train_loss": -6.825640678405762, "global_step": 146929, "epoch": 3498} {"train_loss": -6.860775947570801, "global_step": 146930, "epoch": 3498} {"train_loss": -6.693937301635742, "global_step": 146931, "epoch": 3498} {"train_loss": -6.607439041137695, "global_step": 146932, "epoch": 3498} {"train_loss": -6.81943941116333, "global_step": 146933, "epoch": 3498} {"train_loss": -6.7540998458862305, "global_step": 146934, "epoch": 3498} {"train_loss": -6.740508556365967, "global_step": 146935, "epoch": 3498} {"train_loss": -6.745048999786377, "global_step": 146936, "epoch": 3498} {"train_loss": -6.73484468460083, "global_step": 146937, "epoch": 3498} {"train_loss": -6.761556148529053, "global_step": 146938, "epoch": 3498} {"train_loss": -6.749205589294434, "global_step": 146939, "epoch": 3498} {"train_loss": -6.779929161071777, "global_step": 146940, "epoch": 3498} {"train_loss": -6.819058418273926, "global_step": 146941, "epoch": 3498} {"train_loss": -6.767119407653809, "global_step": 146942, "epoch": 3498} {"train_loss": -6.872103214263916, "global_step": 146943, "epoch": 3498} {"train_loss": -6.8716888427734375, "global_step": 146944, "epoch": 3498} {"train_loss": -6.839194297790527, "global_step": 146945, "epoch": 3498} {"train_loss": -6.865243911743164, "global_step": 146946, "epoch": 3498} {"train_loss": -6.813540935516357, "global_step": 146947, "epoch": 3498} {"train_loss": -6.909796714782715, "global_step": 146948, "epoch": 3498} {"train_loss": -6.814601898193359, "global_step": 146949, "epoch": 3498} {"train_loss": -6.868031978607178, "global_step": 146950, "epoch": 3498} {"train_loss": -6.891611576080322, "global_step": 146951, "epoch": 3498} {"train_loss": -6.8152360916137695, "global_step": 146952, "epoch": 3498} {"train_loss": -6.85896635055542, "global_step": 146953, "epoch": 3498} {"train_loss": -6.88099479675293, "global_step": 146954, "epoch": 3498} {"train_loss": -6.748508930206299, "global_step": 146955, "epoch": 3498} {"train_loss": -6.8855299949646, "global_step": 146956, "epoch": 3498} {"train_loss": -6.794020368939354, "global_step": 146957, "epoch": 3498, "val_loss": 68291.3515625} {"train_loss": -6.740853786468506, "global_step": 146958, "epoch": 3499} {"train_loss": -6.727272987365723, "global_step": 146959, "epoch": 3499} {"train_loss": -6.787960052490234, "global_step": 146960, "epoch": 3499} {"train_loss": -6.804222106933594, "global_step": 146961, "epoch": 3499} {"train_loss": -6.853860855102539, "global_step": 146962, "epoch": 3499} {"train_loss": -6.859370231628418, "global_step": 146963, "epoch": 3499} {"train_loss": -6.79630184173584, "global_step": 146964, "epoch": 3499} {"train_loss": -6.8119096755981445, "global_step": 146965, "epoch": 3499} {"train_loss": -6.827517986297607, "global_step": 146966, "epoch": 3499} {"train_loss": -6.788393974304199, "global_step": 146967, "epoch": 3499} {"train_loss": -6.735304832458496, "global_step": 146968, "epoch": 3499} {"train_loss": -6.863219261169434, "global_step": 146969, "epoch": 3499} {"train_loss": -6.806236267089844, "global_step": 146970, "epoch": 3499} {"train_loss": -6.8099894523620605, "global_step": 146971, "epoch": 3499} {"train_loss": -6.884371757507324, "global_step": 146972, "epoch": 3499} {"train_loss": -6.792627334594727, "global_step": 146973, "epoch": 3499} {"train_loss": -6.808690547943115, "global_step": 146974, "epoch": 3499} {"train_loss": -6.909690856933594, "global_step": 146975, "epoch": 3499} {"train_loss": -6.779502868652344, "global_step": 146976, "epoch": 3499} {"train_loss": -6.816851615905762, "global_step": 146977, "epoch": 3499} {"train_loss": -6.828479766845703, "global_step": 146978, "epoch": 3499} {"train_loss": -6.856682777404785, "global_step": 146979, "epoch": 3499} {"train_loss": -6.894180774688721, "global_step": 146980, "epoch": 3499} {"train_loss": -6.819979190826416, "global_step": 146981, "epoch": 3499} {"train_loss": -6.980518341064453, "global_step": 146982, "epoch": 3499} {"train_loss": -6.8037004470825195, "global_step": 146983, "epoch": 3499} {"train_loss": -6.8261237144470215, "global_step": 146984, "epoch": 3499} {"train_loss": -6.76065731048584, "global_step": 146985, "epoch": 3499} {"train_loss": -6.773836135864258, "global_step": 146986, "epoch": 3499} {"train_loss": -6.884883403778076, "global_step": 146987, "epoch": 3499} {"train_loss": -6.79654598236084, "global_step": 146988, "epoch": 3499} {"train_loss": -6.712307453155518, "global_step": 146989, "epoch": 3499} {"train_loss": -6.914701461791992, "global_step": 146990, "epoch": 3499} {"train_loss": -6.644753456115723, "global_step": 146991, "epoch": 3499} {"train_loss": -6.834164619445801, "global_step": 146992, "epoch": 3499} {"train_loss": -6.761075019836426, "global_step": 146993, "epoch": 3499} {"train_loss": -6.879094123840332, "global_step": 146994, "epoch": 3499} {"train_loss": -6.902243614196777, "global_step": 146995, "epoch": 3499} {"train_loss": -6.853146553039551, "global_step": 146996, "epoch": 3499} {"train_loss": -6.72363805770874, "global_step": 146997, "epoch": 3499} {"train_loss": -6.798535346984863, "global_step": 146998, "epoch": 3499} {"train_loss": -6.816289867673602, "global_step": 146999, "epoch": 3499, "val_loss": 68367.6875} {"train_loss": -6.761670112609863, "global_step": 147000, "epoch": 3500} {"train_loss": -6.9028730392456055, "global_step": 147001, "epoch": 3500} {"train_loss": -6.8844451904296875, "global_step": 147002, "epoch": 3500} {"train_loss": -6.825222969055176, "global_step": 147003, "epoch": 3500} {"train_loss": -6.766239643096924, "global_step": 147004, "epoch": 3500} {"train_loss": -6.862215042114258, "global_step": 147005, "epoch": 3500} {"train_loss": -6.93954610824585, "global_step": 147006, "epoch": 3500} {"train_loss": -6.74167537689209, "global_step": 147007, "epoch": 3500} {"train_loss": -6.774535655975342, "global_step": 147008, "epoch": 3500} {"train_loss": -6.892919540405273, "global_step": 147009, "epoch": 3500} {"train_loss": -6.725837230682373, "global_step": 147010, "epoch": 3500} {"train_loss": -6.851694107055664, "global_step": 147011, "epoch": 3500} {"train_loss": -6.749808311462402, "global_step": 147012, "epoch": 3500} {"train_loss": -6.857834339141846, "global_step": 147013, "epoch": 3500} {"train_loss": -6.911016464233398, "global_step": 147014, "epoch": 3500} {"train_loss": -6.8400983810424805, "global_step": 147015, "epoch": 3500} {"train_loss": -6.97313117980957, "global_step": 147016, "epoch": 3500} {"train_loss": -6.827105522155762, "global_step": 147017, "epoch": 3500} {"train_loss": -6.838251113891602, "global_step": 147018, "epoch": 3500} {"train_loss": -6.7418060302734375, "global_step": 147019, "epoch": 3500} {"train_loss": -6.764575004577637, "global_step": 147020, "epoch": 3500} {"train_loss": -6.832702159881592, "global_step": 147021, "epoch": 3500} {"train_loss": -6.701554298400879, "global_step": 147022, "epoch": 3500} {"train_loss": -6.864965438842773, "global_step": 147023, "epoch": 3500} {"train_loss": -6.861767292022705, "global_step": 147024, "epoch": 3500} {"train_loss": -6.81561279296875, "global_step": 147025, "epoch": 3500} {"train_loss": -6.84005880355835, "global_step": 147026, "epoch": 3500} {"train_loss": -6.633690357208252, "global_step": 147027, "epoch": 3500} {"train_loss": -6.8366217613220215, "global_step": 147028, "epoch": 3500} {"train_loss": -6.778521537780762, "global_step": 147029, "epoch": 3500} {"train_loss": -6.6213884353637695, "global_step": 147030, "epoch": 3500} {"train_loss": -6.716738224029541, "global_step": 147031, "epoch": 3500} {"train_loss": -6.714658737182617, "global_step": 147032, "epoch": 3500} {"train_loss": -6.778687000274658, "global_step": 147033, "epoch": 3500} {"train_loss": -6.787655830383301, "global_step": 147034, "epoch": 3500} {"train_loss": -6.779332637786865, "global_step": 147035, "epoch": 3500} {"train_loss": -6.81662654876709, "global_step": 147036, "epoch": 3500} {"train_loss": -6.731325149536133, "global_step": 147037, "epoch": 3500} {"train_loss": -6.782589435577393, "global_step": 147038, "epoch": 3500} {"train_loss": -6.740549087524414, "global_step": 147039, "epoch": 3500} {"train_loss": -6.849399566650391, "global_step": 147040, "epoch": 3500} {"train_loss": -6.803605863026211, "global_step": 147041, "epoch": 3500, "train/sim_max_reward_0": 0.27521680607084753, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.593194811025944, "train/sim_max_reward_3": 0.9770891460628192, "train/sim_max_reward_4": 0.3995967908021155, "train/sim_max_reward_5": 0.8921578482773432, "test/sim_max_reward_4400000": 0.20831312672379493, "test/sim_max_reward_4400001": 0.20050353661400597, "test/sim_max_reward_4400002": 0.7103440214456636, "test/sim_max_reward_4400003": 0.9288937776040791, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3098082674223084, "test/sim_max_reward_4400006": 0.9464533221045496, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.31962191400936696, "test/sim_max_reward_4400009": 0.8136561622925905, "test/sim_max_reward_4400010": 0.19543754820184422, "test/sim_max_reward_4400011": 0.217627935804186, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9896244822059218, "test/sim_max_reward_4400014": 0.1519252124706197, "test/sim_max_reward_4400015": 0.15845498083026294, "test/sim_max_reward_4400016": 0.15605780584304113, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24725151854167213, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9641116507331968, "test/sim_max_reward_4400023": 0.9573169015141907, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.25801899823615526, "test/sim_max_reward_4400026": 0.12327332219666962, "test/sim_max_reward_4400027": 0.042720857389532095, "test/sim_max_reward_4400028": 0.9212627590590887, "test/sim_max_reward_4400029": 0.8464417302744464, "test/sim_max_reward_4400030": 0.9349788637462002, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9206944577063203, "test/sim_max_reward_4400034": 0.9940941811006709, "test/sim_max_reward_4400035": 0.6786698007009557, "test/sim_max_reward_4400036": 0.3316667195754094, "test/sim_max_reward_4400037": 0.9694459411928859, "test/sim_max_reward_4400038": 0.9957449608951134, "test/sim_max_reward_4400039": 0.9507270877177495, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9917355113117599, "test/sim_max_reward_4400042": 0.9458607223240129, "test/sim_max_reward_4400043": 0.9760239448070268, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.958140273713099, "test/sim_max_reward_4400046": 0.33256357782279766, "test/sim_max_reward_4400047": 0.9800493371234844, "test/sim_max_reward_4400048": 0.10006159658084686, "test/sim_max_reward_4400049": 0.9804491781158913, "train/mean_score": 0.6895425670398448, "test/mean_score": 0.5455954577750655, "val_loss": 68364.9375} {"train_loss": -6.793783664703369, "global_step": 147042, "epoch": 3501} {"train_loss": -6.8890485763549805, "global_step": 147043, "epoch": 3501} {"train_loss": -6.8740925788879395, "global_step": 147044, "epoch": 3501} {"train_loss": -6.908651351928711, "global_step": 147045, "epoch": 3501} {"train_loss": -6.799003601074219, "global_step": 147046, "epoch": 3501} {"train_loss": -6.747287750244141, "global_step": 147047, "epoch": 3501} {"train_loss": -6.86460018157959, "global_step": 147048, "epoch": 3501} {"train_loss": -6.841883659362793, "global_step": 147049, "epoch": 3501} {"train_loss": -6.750575542449951, "global_step": 147050, "epoch": 3501} {"train_loss": -6.7609663009643555, "global_step": 147051, "epoch": 3501} {"train_loss": -6.84177303314209, "global_step": 147052, "epoch": 3501} {"train_loss": -6.821437835693359, "global_step": 147053, "epoch": 3501} {"train_loss": -6.773097991943359, "global_step": 147054, "epoch": 3501} {"train_loss": -6.8129425048828125, "global_step": 147055, "epoch": 3501} {"train_loss": -6.698324203491211, "global_step": 147056, "epoch": 3501} {"train_loss": -6.826509475708008, "global_step": 147057, "epoch": 3501} {"train_loss": -6.697780609130859, "global_step": 147058, "epoch": 3501} {"train_loss": -6.603510856628418, "global_step": 147059, "epoch": 3501} {"train_loss": -6.72189474105835, "global_step": 147060, "epoch": 3501} {"train_loss": -6.567734718322754, "global_step": 147061, "epoch": 3501} {"train_loss": -6.740453720092773, "global_step": 147062, "epoch": 3501} {"train_loss": -6.796622276306152, "global_step": 147063, "epoch": 3501} {"train_loss": -6.627531051635742, "global_step": 147064, "epoch": 3501} {"train_loss": -6.8281755447387695, "global_step": 147065, "epoch": 3501} {"train_loss": -6.721118927001953, "global_step": 147066, "epoch": 3501} {"train_loss": -6.78279447555542, "global_step": 147067, "epoch": 3501} {"train_loss": -6.726505279541016, "global_step": 147068, "epoch": 3501} {"train_loss": -6.612104415893555, "global_step": 147069, "epoch": 3501} {"train_loss": -6.69895076751709, "global_step": 147070, "epoch": 3501} {"train_loss": -6.777515888214111, "global_step": 147071, "epoch": 3501} {"train_loss": -6.66763162612915, "global_step": 147072, "epoch": 3501} {"train_loss": -6.83968448638916, "global_step": 147073, "epoch": 3501} {"train_loss": -6.771719932556152, "global_step": 147074, "epoch": 3501} {"train_loss": -6.680564880371094, "global_step": 147075, "epoch": 3501} {"train_loss": -6.692697525024414, "global_step": 147076, "epoch": 3501} {"train_loss": -6.779246807098389, "global_step": 147077, "epoch": 3501} {"train_loss": -6.79259729385376, "global_step": 147078, "epoch": 3501} {"train_loss": -6.764955520629883, "global_step": 147079, "epoch": 3501} {"train_loss": -6.806048393249512, "global_step": 147080, "epoch": 3501} {"train_loss": -6.653531074523926, "global_step": 147081, "epoch": 3501} {"train_loss": -6.926516056060791, "global_step": 147082, "epoch": 3501} {"train_loss": -6.763102077302479, "global_step": 147083, "epoch": 3501, "val_loss": 68359.875} {"train_loss": -6.731862545013428, "global_step": 147084, "epoch": 3502} {"train_loss": -6.807013988494873, "global_step": 147085, "epoch": 3502} {"train_loss": -6.788809776306152, "global_step": 147086, "epoch": 3502} {"train_loss": -6.506206512451172, "global_step": 147087, "epoch": 3502} {"train_loss": -6.806850910186768, "global_step": 147088, "epoch": 3502} {"train_loss": -6.823366165161133, "global_step": 147089, "epoch": 3502} {"train_loss": -6.770478248596191, "global_step": 147090, "epoch": 3502} {"train_loss": -6.8187575340271, "global_step": 147091, "epoch": 3502} {"train_loss": -6.7275471687316895, "global_step": 147092, "epoch": 3502} {"train_loss": -6.6738457679748535, "global_step": 147093, "epoch": 3502} {"train_loss": -6.707418441772461, "global_step": 147094, "epoch": 3502} {"train_loss": -6.7569475173950195, "global_step": 147095, "epoch": 3502} {"train_loss": -6.809831619262695, "global_step": 147096, "epoch": 3502} {"train_loss": -6.751307964324951, "global_step": 147097, "epoch": 3502} {"train_loss": -6.783725738525391, "global_step": 147098, "epoch": 3502} {"train_loss": -6.737421035766602, "global_step": 147099, "epoch": 3502} {"train_loss": -6.5428876876831055, "global_step": 147100, "epoch": 3502} {"train_loss": -6.715343952178955, "global_step": 147101, "epoch": 3502} {"train_loss": -6.702401638031006, "global_step": 147102, "epoch": 3502} {"train_loss": -6.757421970367432, "global_step": 147103, "epoch": 3502} {"train_loss": -6.781159400939941, "global_step": 147104, "epoch": 3502} {"train_loss": -6.58648681640625, "global_step": 147105, "epoch": 3502} {"train_loss": -6.676113128662109, "global_step": 147106, "epoch": 3502} {"train_loss": -6.738485336303711, "global_step": 147107, "epoch": 3502} {"train_loss": -6.614105224609375, "global_step": 147108, "epoch": 3502} {"train_loss": -6.838879108428955, "global_step": 147109, "epoch": 3502} {"train_loss": -6.7565388679504395, "global_step": 147110, "epoch": 3502} {"train_loss": -6.852222442626953, "global_step": 147111, "epoch": 3502} {"train_loss": -6.779604911804199, "global_step": 147112, "epoch": 3502} {"train_loss": -6.718505859375, "global_step": 147113, "epoch": 3502} {"train_loss": -6.8400797843933105, "global_step": 147114, "epoch": 3502} {"train_loss": -6.847771644592285, "global_step": 147115, "epoch": 3502} {"train_loss": -6.778060436248779, "global_step": 147116, "epoch": 3502} {"train_loss": -6.763672351837158, "global_step": 147117, "epoch": 3502} {"train_loss": -6.705819129943848, "global_step": 147118, "epoch": 3502} {"train_loss": -6.776836395263672, "global_step": 147119, "epoch": 3502} {"train_loss": -6.724072456359863, "global_step": 147120, "epoch": 3502} {"train_loss": -6.791766166687012, "global_step": 147121, "epoch": 3502} {"train_loss": -6.69722843170166, "global_step": 147122, "epoch": 3502} {"train_loss": -6.806449890136719, "global_step": 147123, "epoch": 3502} {"train_loss": -6.622615814208984, "global_step": 147124, "epoch": 3502} {"train_loss": -6.742438123339698, "global_step": 147125, "epoch": 3502, "val_loss": 68509.1796875} {"train_loss": -6.764864444732666, "global_step": 147126, "epoch": 3503} {"train_loss": -6.704107284545898, "global_step": 147127, "epoch": 3503} {"train_loss": -6.835498809814453, "global_step": 147128, "epoch": 3503} {"train_loss": -6.812123775482178, "global_step": 147129, "epoch": 3503} {"train_loss": -6.849544525146484, "global_step": 147130, "epoch": 3503} {"train_loss": -6.79924201965332, "global_step": 147131, "epoch": 3503} {"train_loss": -6.713316440582275, "global_step": 147132, "epoch": 3503} {"train_loss": -6.815914630889893, "global_step": 147133, "epoch": 3503} {"train_loss": -6.917469024658203, "global_step": 147134, "epoch": 3503} {"train_loss": -6.807881832122803, "global_step": 147135, "epoch": 3503} {"train_loss": -6.731966018676758, "global_step": 147136, "epoch": 3503} {"train_loss": -6.662411689758301, "global_step": 147137, "epoch": 3503} {"train_loss": -6.793558597564697, "global_step": 147138, "epoch": 3503} {"train_loss": -6.759505271911621, "global_step": 147139, "epoch": 3503} {"train_loss": -6.749293804168701, "global_step": 147140, "epoch": 3503} {"train_loss": -6.832492828369141, "global_step": 147141, "epoch": 3503} {"train_loss": -6.853255271911621, "global_step": 147142, "epoch": 3503} {"train_loss": -6.851250648498535, "global_step": 147143, "epoch": 3503} {"train_loss": -6.825341701507568, "global_step": 147144, "epoch": 3503} {"train_loss": -6.790390491485596, "global_step": 147145, "epoch": 3503} {"train_loss": -6.78079891204834, "global_step": 147146, "epoch": 3503} {"train_loss": -6.741373538970947, "global_step": 147147, "epoch": 3503} {"train_loss": -6.776432037353516, "global_step": 147148, "epoch": 3503} {"train_loss": -6.846643924713135, "global_step": 147149, "epoch": 3503} {"train_loss": -6.892545700073242, "global_step": 147150, "epoch": 3503} {"train_loss": -6.779901027679443, "global_step": 147151, "epoch": 3503} {"train_loss": -6.779908180236816, "global_step": 147152, "epoch": 3503} {"train_loss": -6.689535140991211, "global_step": 147153, "epoch": 3503} {"train_loss": -6.852239608764648, "global_step": 147154, "epoch": 3503} {"train_loss": -6.7879462242126465, "global_step": 147155, "epoch": 3503} {"train_loss": -6.855069160461426, "global_step": 147156, "epoch": 3503} {"train_loss": -6.70681095123291, "global_step": 147157, "epoch": 3503} {"train_loss": -6.832649230957031, "global_step": 147158, "epoch": 3503} {"train_loss": -6.822388172149658, "global_step": 147159, "epoch": 3503} {"train_loss": -6.838320732116699, "global_step": 147160, "epoch": 3503} {"train_loss": -6.684241771697998, "global_step": 147161, "epoch": 3503} {"train_loss": -6.824254989624023, "global_step": 147162, "epoch": 3503} {"train_loss": -6.811917304992676, "global_step": 147163, "epoch": 3503} {"train_loss": -6.668584823608398, "global_step": 147164, "epoch": 3503} {"train_loss": -6.850292205810547, "global_step": 147165, "epoch": 3503} {"train_loss": -6.724365234375, "global_step": 147166, "epoch": 3503} {"train_loss": -6.791169325510661, "global_step": 147167, "epoch": 3503, "val_loss": 68473.421875} {"train_loss": -6.835765838623047, "global_step": 147168, "epoch": 3504} {"train_loss": -6.821344375610352, "global_step": 147169, "epoch": 3504} {"train_loss": -6.752011299133301, "global_step": 147170, "epoch": 3504} {"train_loss": -6.740165710449219, "global_step": 147171, "epoch": 3504} {"train_loss": -6.793149471282959, "global_step": 147172, "epoch": 3504} {"train_loss": -6.855930328369141, "global_step": 147173, "epoch": 3504} {"train_loss": -6.825860023498535, "global_step": 147174, "epoch": 3504} {"train_loss": -6.898961067199707, "global_step": 147175, "epoch": 3504} {"train_loss": -6.845134735107422, "global_step": 147176, "epoch": 3504} {"train_loss": -6.8338212966918945, "global_step": 147177, "epoch": 3504} {"train_loss": -6.906657695770264, "global_step": 147178, "epoch": 3504} {"train_loss": -6.749642372131348, "global_step": 147179, "epoch": 3504} {"train_loss": -6.821385383605957, "global_step": 147180, "epoch": 3504} {"train_loss": -6.764126777648926, "global_step": 147181, "epoch": 3504} {"train_loss": -6.8115434646606445, "global_step": 147182, "epoch": 3504} {"train_loss": -6.793423175811768, "global_step": 147183, "epoch": 3504} {"train_loss": -6.656367301940918, "global_step": 147184, "epoch": 3504} {"train_loss": -6.9382524490356445, "global_step": 147185, "epoch": 3504} {"train_loss": -6.836804389953613, "global_step": 147186, "epoch": 3504} {"train_loss": -6.777724266052246, "global_step": 147187, "epoch": 3504} {"train_loss": -6.904638767242432, "global_step": 147188, "epoch": 3504} {"train_loss": -6.668858528137207, "global_step": 147189, "epoch": 3504} {"train_loss": -6.853900909423828, "global_step": 147190, "epoch": 3504} {"train_loss": -6.784843444824219, "global_step": 147191, "epoch": 3504} {"train_loss": -6.740577220916748, "global_step": 147192, "epoch": 3504} {"train_loss": -6.731154918670654, "global_step": 147193, "epoch": 3504} {"train_loss": -6.726970672607422, "global_step": 147194, "epoch": 3504} {"train_loss": -6.677708625793457, "global_step": 147195, "epoch": 3504} {"train_loss": -6.7509002685546875, "global_step": 147196, "epoch": 3504} {"train_loss": -6.751015663146973, "global_step": 147197, "epoch": 3504} {"train_loss": -6.7038726806640625, "global_step": 147198, "epoch": 3504} {"train_loss": -6.842639446258545, "global_step": 147199, "epoch": 3504} {"train_loss": -6.695429801940918, "global_step": 147200, "epoch": 3504} {"train_loss": -6.602386474609375, "global_step": 147201, "epoch": 3504} {"train_loss": -6.730149269104004, "global_step": 147202, "epoch": 3504} {"train_loss": -6.567795276641846, "global_step": 147203, "epoch": 3504} {"train_loss": -6.742105484008789, "global_step": 147204, "epoch": 3504} {"train_loss": -6.762274265289307, "global_step": 147205, "epoch": 3504} {"train_loss": -6.687166213989258, "global_step": 147206, "epoch": 3504} {"train_loss": -6.840595245361328, "global_step": 147207, "epoch": 3504} {"train_loss": -6.688287734985352, "global_step": 147208, "epoch": 3504} {"train_loss": -6.772106238773891, "global_step": 147209, "epoch": 3504, "val_loss": 68534.875} {"train_loss": -6.755293846130371, "global_step": 147210, "epoch": 3505} {"train_loss": -6.774711608886719, "global_step": 147211, "epoch": 3505} {"train_loss": -6.71798038482666, "global_step": 147212, "epoch": 3505} {"train_loss": -6.744321823120117, "global_step": 147213, "epoch": 3505} {"train_loss": -6.883963584899902, "global_step": 147214, "epoch": 3505} {"train_loss": -6.850027084350586, "global_step": 147215, "epoch": 3505} {"train_loss": -6.668286323547363, "global_step": 147216, "epoch": 3505} {"train_loss": -6.783426284790039, "global_step": 147217, "epoch": 3505} {"train_loss": -6.76711368560791, "global_step": 147218, "epoch": 3505} {"train_loss": -6.800161361694336, "global_step": 147219, "epoch": 3505} {"train_loss": -6.73686408996582, "global_step": 147220, "epoch": 3505} {"train_loss": -6.76783561706543, "global_step": 147221, "epoch": 3505} {"train_loss": -6.761991024017334, "global_step": 147222, "epoch": 3505} {"train_loss": -6.783378601074219, "global_step": 147223, "epoch": 3505} {"train_loss": -6.783294200897217, "global_step": 147224, "epoch": 3505} {"train_loss": -6.751524448394775, "global_step": 147225, "epoch": 3505} {"train_loss": -6.866131782531738, "global_step": 147226, "epoch": 3505} {"train_loss": -6.738590240478516, "global_step": 147227, "epoch": 3505} {"train_loss": -6.711933135986328, "global_step": 147228, "epoch": 3505} {"train_loss": -6.692111015319824, "global_step": 147229, "epoch": 3505} {"train_loss": -6.915679931640625, "global_step": 147230, "epoch": 3505} {"train_loss": -6.896759986877441, "global_step": 147231, "epoch": 3505} {"train_loss": -6.90070104598999, "global_step": 147232, "epoch": 3505} {"train_loss": -6.7411932945251465, "global_step": 147233, "epoch": 3505} {"train_loss": -6.923462867736816, "global_step": 147234, "epoch": 3505} {"train_loss": -6.811361312866211, "global_step": 147235, "epoch": 3505} {"train_loss": -6.737663269042969, "global_step": 147236, "epoch": 3505} {"train_loss": -6.854561805725098, "global_step": 147237, "epoch": 3505} {"train_loss": -6.775900840759277, "global_step": 147238, "epoch": 3505} {"train_loss": -6.802375793457031, "global_step": 147239, "epoch": 3505} {"train_loss": -6.797381401062012, "global_step": 147240, "epoch": 3505} {"train_loss": -7.004140377044678, "global_step": 147241, "epoch": 3505} {"train_loss": -6.90837287902832, "global_step": 147242, "epoch": 3505} {"train_loss": -6.9277143478393555, "global_step": 147243, "epoch": 3505} {"train_loss": -6.822294235229492, "global_step": 147244, "epoch": 3505} {"train_loss": -6.740175247192383, "global_step": 147245, "epoch": 3505} {"train_loss": -6.922380447387695, "global_step": 147246, "epoch": 3505} {"train_loss": -6.716339588165283, "global_step": 147247, "epoch": 3505} {"train_loss": -6.764863967895508, "global_step": 147248, "epoch": 3505} {"train_loss": -6.775522708892822, "global_step": 147249, "epoch": 3505} {"train_loss": -6.824345588684082, "global_step": 147250, "epoch": 3505} {"train_loss": -6.8038185551053, "global_step": 147251, "epoch": 3505, "val_loss": 68251.6796875} {"train_loss": -6.97585916519165, "global_step": 147252, "epoch": 3506} {"train_loss": -6.782009124755859, "global_step": 147253, "epoch": 3506} {"train_loss": -6.867240905761719, "global_step": 147254, "epoch": 3506} {"train_loss": -6.76906681060791, "global_step": 147255, "epoch": 3506} {"train_loss": -6.674069881439209, "global_step": 147256, "epoch": 3506} {"train_loss": -6.873941421508789, "global_step": 147257, "epoch": 3506} {"train_loss": -6.792107582092285, "global_step": 147258, "epoch": 3506} {"train_loss": -6.7265305519104, "global_step": 147259, "epoch": 3506} {"train_loss": -6.692545413970947, "global_step": 147260, "epoch": 3506} {"train_loss": -6.782947540283203, "global_step": 147261, "epoch": 3506} {"train_loss": -6.774528503417969, "global_step": 147262, "epoch": 3506} {"train_loss": -6.642683982849121, "global_step": 147263, "epoch": 3506} {"train_loss": -6.777069091796875, "global_step": 147264, "epoch": 3506} {"train_loss": -6.77882194519043, "global_step": 147265, "epoch": 3506} {"train_loss": -6.731215953826904, "global_step": 147266, "epoch": 3506} {"train_loss": -6.802277088165283, "global_step": 147267, "epoch": 3506} {"train_loss": -6.722655773162842, "global_step": 147268, "epoch": 3506} {"train_loss": -6.757246971130371, "global_step": 147269, "epoch": 3506} {"train_loss": -6.731106281280518, "global_step": 147270, "epoch": 3506} {"train_loss": -6.754873752593994, "global_step": 147271, "epoch": 3506} {"train_loss": -6.7429094314575195, "global_step": 147272, "epoch": 3506} {"train_loss": -6.708192348480225, "global_step": 147273, "epoch": 3506} {"train_loss": -6.640551567077637, "global_step": 147274, "epoch": 3506} {"train_loss": -6.7131123542785645, "global_step": 147275, "epoch": 3506} {"train_loss": -6.4999098777771, "global_step": 147276, "epoch": 3506} {"train_loss": -6.719114303588867, "global_step": 147277, "epoch": 3506} {"train_loss": -6.688262939453125, "global_step": 147278, "epoch": 3506} {"train_loss": -6.68303918838501, "global_step": 147279, "epoch": 3506} {"train_loss": -6.697873115539551, "global_step": 147280, "epoch": 3506} {"train_loss": -6.5725016593933105, "global_step": 147281, "epoch": 3506} {"train_loss": -6.760443687438965, "global_step": 147282, "epoch": 3506} {"train_loss": -6.699880123138428, "global_step": 147283, "epoch": 3506} {"train_loss": -6.682013511657715, "global_step": 147284, "epoch": 3506} {"train_loss": -6.694334983825684, "global_step": 147285, "epoch": 3506} {"train_loss": -6.705456733703613, "global_step": 147286, "epoch": 3506} {"train_loss": -6.640958786010742, "global_step": 147287, "epoch": 3506} {"train_loss": -6.735240936279297, "global_step": 147288, "epoch": 3506} {"train_loss": -6.671708583831787, "global_step": 147289, "epoch": 3506} {"train_loss": -6.778842926025391, "global_step": 147290, "epoch": 3506} {"train_loss": -6.809482097625732, "global_step": 147291, "epoch": 3506} {"train_loss": -6.672159194946289, "global_step": 147292, "epoch": 3506} {"train_loss": -6.729823498498826, "global_step": 147293, "epoch": 3506, "val_loss": 68387.5859375} {"train_loss": -6.74652624130249, "global_step": 147294, "epoch": 3507} {"train_loss": -6.65894889831543, "global_step": 147295, "epoch": 3507} {"train_loss": -6.643668174743652, "global_step": 147296, "epoch": 3507} {"train_loss": -6.630917549133301, "global_step": 147297, "epoch": 3507} {"train_loss": -6.703183174133301, "global_step": 147298, "epoch": 3507} {"train_loss": -6.717949390411377, "global_step": 147299, "epoch": 3507} {"train_loss": -6.803424835205078, "global_step": 147300, "epoch": 3507} {"train_loss": -6.638326168060303, "global_step": 147301, "epoch": 3507} {"train_loss": -6.8354997634887695, "global_step": 147302, "epoch": 3507} {"train_loss": -6.7343525886535645, "global_step": 147303, "epoch": 3507} {"train_loss": -6.833209037780762, "global_step": 147304, "epoch": 3507} {"train_loss": -6.822732925415039, "global_step": 147305, "epoch": 3507} {"train_loss": -6.710637092590332, "global_step": 147306, "epoch": 3507} {"train_loss": -6.887102127075195, "global_step": 147307, "epoch": 3507} {"train_loss": -6.74957275390625, "global_step": 147308, "epoch": 3507} {"train_loss": -6.71614933013916, "global_step": 147309, "epoch": 3507} {"train_loss": -6.770902633666992, "global_step": 147310, "epoch": 3507} {"train_loss": -6.840859889984131, "global_step": 147311, "epoch": 3507} {"train_loss": -6.806961536407471, "global_step": 147312, "epoch": 3507} {"train_loss": -6.814543724060059, "global_step": 147313, "epoch": 3507} {"train_loss": -6.61982536315918, "global_step": 147314, "epoch": 3507} {"train_loss": -6.8119683265686035, "global_step": 147315, "epoch": 3507} {"train_loss": -6.791407585144043, "global_step": 147316, "epoch": 3507} {"train_loss": -6.752046585083008, "global_step": 147317, "epoch": 3507} {"train_loss": -6.800422668457031, "global_step": 147318, "epoch": 3507} {"train_loss": -6.702373027801514, "global_step": 147319, "epoch": 3507} {"train_loss": -6.767378807067871, "global_step": 147320, "epoch": 3507} {"train_loss": -6.651046276092529, "global_step": 147321, "epoch": 3507} {"train_loss": -6.726673126220703, "global_step": 147322, "epoch": 3507} {"train_loss": -6.697500228881836, "global_step": 147323, "epoch": 3507} {"train_loss": -6.679126739501953, "global_step": 147324, "epoch": 3507} {"train_loss": -6.819097518920898, "global_step": 147325, "epoch": 3507} {"train_loss": -6.696206092834473, "global_step": 147326, "epoch": 3507} {"train_loss": -6.641087532043457, "global_step": 147327, "epoch": 3507} {"train_loss": -6.853827476501465, "global_step": 147328, "epoch": 3507} {"train_loss": -6.728157043457031, "global_step": 147329, "epoch": 3507} {"train_loss": -6.897946834564209, "global_step": 147330, "epoch": 3507} {"train_loss": -6.664012432098389, "global_step": 147331, "epoch": 3507} {"train_loss": -6.78574275970459, "global_step": 147332, "epoch": 3507} {"train_loss": -6.67429256439209, "global_step": 147333, "epoch": 3507} {"train_loss": -6.780839920043945, "global_step": 147334, "epoch": 3507} {"train_loss": -6.74549134572347, "global_step": 147335, "epoch": 3507, "val_loss": 68486.5703125} {"train_loss": -6.800260543823242, "global_step": 147336, "epoch": 3508} {"train_loss": -6.642292499542236, "global_step": 147337, "epoch": 3508} {"train_loss": -6.858205795288086, "global_step": 147338, "epoch": 3508} {"train_loss": -6.824804782867432, "global_step": 147339, "epoch": 3508} {"train_loss": -6.79578971862793, "global_step": 147340, "epoch": 3508} {"train_loss": -6.849801063537598, "global_step": 147341, "epoch": 3508} {"train_loss": -6.737170219421387, "global_step": 147342, "epoch": 3508} {"train_loss": -6.767985820770264, "global_step": 147343, "epoch": 3508} {"train_loss": -6.769904136657715, "global_step": 147344, "epoch": 3508} {"train_loss": -6.713761329650879, "global_step": 147345, "epoch": 3508} {"train_loss": -6.826797008514404, "global_step": 147346, "epoch": 3508} {"train_loss": -6.746664047241211, "global_step": 147347, "epoch": 3508} {"train_loss": -6.755492210388184, "global_step": 147348, "epoch": 3508} {"train_loss": -6.825590133666992, "global_step": 147349, "epoch": 3508} {"train_loss": -6.906043529510498, "global_step": 147350, "epoch": 3508} {"train_loss": -6.751272201538086, "global_step": 147351, "epoch": 3508} {"train_loss": -6.787562370300293, "global_step": 147352, "epoch": 3508} {"train_loss": -6.827210903167725, "global_step": 147353, "epoch": 3508} {"train_loss": -6.786880016326904, "global_step": 147354, "epoch": 3508} {"train_loss": -6.890743255615234, "global_step": 147355, "epoch": 3508} {"train_loss": -6.8141279220581055, "global_step": 147356, "epoch": 3508} {"train_loss": -6.862831115722656, "global_step": 147357, "epoch": 3508} {"train_loss": -6.8399858474731445, "global_step": 147358, "epoch": 3508} {"train_loss": -6.713029384613037, "global_step": 147359, "epoch": 3508} {"train_loss": -6.7587785720825195, "global_step": 147360, "epoch": 3508} {"train_loss": -6.779301166534424, "global_step": 147361, "epoch": 3508} {"train_loss": -6.8409223556518555, "global_step": 147362, "epoch": 3508} {"train_loss": -6.675384521484375, "global_step": 147363, "epoch": 3508} {"train_loss": -6.781389236450195, "global_step": 147364, "epoch": 3508} {"train_loss": -6.802717208862305, "global_step": 147365, "epoch": 3508} {"train_loss": -6.690106391906738, "global_step": 147366, "epoch": 3508} {"train_loss": -6.725917816162109, "global_step": 147367, "epoch": 3508} {"train_loss": -6.61855411529541, "global_step": 147368, "epoch": 3508} {"train_loss": -6.909672737121582, "global_step": 147369, "epoch": 3508} {"train_loss": -6.831181049346924, "global_step": 147370, "epoch": 3508} {"train_loss": -6.763644218444824, "global_step": 147371, "epoch": 3508} {"train_loss": -6.705806732177734, "global_step": 147372, "epoch": 3508} {"train_loss": -6.775500297546387, "global_step": 147373, "epoch": 3508} {"train_loss": -6.868354797363281, "global_step": 147374, "epoch": 3508} {"train_loss": -6.8289690017700195, "global_step": 147375, "epoch": 3508} {"train_loss": -6.842199325561523, "global_step": 147376, "epoch": 3508} {"train_loss": -6.7880465757279165, "global_step": 147377, "epoch": 3508, "val_loss": 68295.8203125} {"train_loss": -6.835089683532715, "global_step": 147378, "epoch": 3509} {"train_loss": -6.8567986488342285, "global_step": 147379, "epoch": 3509} {"train_loss": -6.81545877456665, "global_step": 147380, "epoch": 3509} {"train_loss": -6.814852714538574, "global_step": 147381, "epoch": 3509} {"train_loss": -6.779117584228516, "global_step": 147382, "epoch": 3509} {"train_loss": -6.893232345581055, "global_step": 147383, "epoch": 3509} {"train_loss": -6.615947246551514, "global_step": 147384, "epoch": 3509} {"train_loss": -6.7736334800720215, "global_step": 147385, "epoch": 3509} {"train_loss": -6.809328556060791, "global_step": 147386, "epoch": 3509} {"train_loss": -6.712553977966309, "global_step": 147387, "epoch": 3509} {"train_loss": -6.761692047119141, "global_step": 147388, "epoch": 3509} {"train_loss": -6.756219387054443, "global_step": 147389, "epoch": 3509} {"train_loss": -6.658161163330078, "global_step": 147390, "epoch": 3509} {"train_loss": -6.855637550354004, "global_step": 147391, "epoch": 3509} {"train_loss": -6.740574359893799, "global_step": 147392, "epoch": 3509} {"train_loss": -6.678490161895752, "global_step": 147393, "epoch": 3509} {"train_loss": -6.807052135467529, "global_step": 147394, "epoch": 3509} {"train_loss": -6.6932806968688965, "global_step": 147395, "epoch": 3509} {"train_loss": -6.761327266693115, "global_step": 147396, "epoch": 3509} {"train_loss": -6.768862247467041, "global_step": 147397, "epoch": 3509} {"train_loss": -6.713212013244629, "global_step": 147398, "epoch": 3509} {"train_loss": -6.911042213439941, "global_step": 147399, "epoch": 3509} {"train_loss": -6.717840194702148, "global_step": 147400, "epoch": 3509} {"train_loss": -6.75015926361084, "global_step": 147401, "epoch": 3509} {"train_loss": -6.83437442779541, "global_step": 147402, "epoch": 3509} {"train_loss": -6.83758544921875, "global_step": 147403, "epoch": 3509} {"train_loss": -6.816269397735596, "global_step": 147404, "epoch": 3509} {"train_loss": -6.883200645446777, "global_step": 147405, "epoch": 3509} {"train_loss": -6.720403671264648, "global_step": 147406, "epoch": 3509} {"train_loss": -6.686412811279297, "global_step": 147407, "epoch": 3509} {"train_loss": -6.639324188232422, "global_step": 147408, "epoch": 3509} {"train_loss": -6.876766681671143, "global_step": 147409, "epoch": 3509} {"train_loss": -6.787004470825195, "global_step": 147410, "epoch": 3509} {"train_loss": -6.83203649520874, "global_step": 147411, "epoch": 3509} {"train_loss": -6.7552337646484375, "global_step": 147412, "epoch": 3509} {"train_loss": -6.7249755859375, "global_step": 147413, "epoch": 3509} {"train_loss": -6.777745246887207, "global_step": 147414, "epoch": 3509} {"train_loss": -6.871562957763672, "global_step": 147415, "epoch": 3509} {"train_loss": -6.81557559967041, "global_step": 147416, "epoch": 3509} {"train_loss": -6.78286075592041, "global_step": 147417, "epoch": 3509} {"train_loss": -6.787169456481934, "global_step": 147418, "epoch": 3509} {"train_loss": -6.778784002576556, "global_step": 147419, "epoch": 3509, "val_loss": 68272.375} {"train_loss": -6.893915176391602, "global_step": 147420, "epoch": 3510} {"train_loss": -6.78655481338501, "global_step": 147421, "epoch": 3510} {"train_loss": -6.857120513916016, "global_step": 147422, "epoch": 3510} {"train_loss": -6.8322906494140625, "global_step": 147423, "epoch": 3510} {"train_loss": -6.71495246887207, "global_step": 147424, "epoch": 3510} {"train_loss": -6.80043363571167, "global_step": 147425, "epoch": 3510} {"train_loss": -6.807581901550293, "global_step": 147426, "epoch": 3510} {"train_loss": -6.7270894050598145, "global_step": 147427, "epoch": 3510} {"train_loss": -6.908940315246582, "global_step": 147428, "epoch": 3510} {"train_loss": -6.6869916915893555, "global_step": 147429, "epoch": 3510} {"train_loss": -6.781312465667725, "global_step": 147430, "epoch": 3510} {"train_loss": -6.745051383972168, "global_step": 147431, "epoch": 3510} {"train_loss": -6.681232929229736, "global_step": 147432, "epoch": 3510} {"train_loss": -6.810486793518066, "global_step": 147433, "epoch": 3510} {"train_loss": -6.565693378448486, "global_step": 147434, "epoch": 3510} {"train_loss": -6.923092842102051, "global_step": 147435, "epoch": 3510} {"train_loss": -6.726314067840576, "global_step": 147436, "epoch": 3510} {"train_loss": -6.6894450187683105, "global_step": 147437, "epoch": 3510} {"train_loss": -6.839519500732422, "global_step": 147438, "epoch": 3510} {"train_loss": -6.712770462036133, "global_step": 147439, "epoch": 3510} {"train_loss": -6.874053001403809, "global_step": 147440, "epoch": 3510} {"train_loss": -6.764922142028809, "global_step": 147441, "epoch": 3510} {"train_loss": -6.920165061950684, "global_step": 147442, "epoch": 3510} {"train_loss": -6.819366455078125, "global_step": 147443, "epoch": 3510} {"train_loss": -6.741161346435547, "global_step": 147444, "epoch": 3510} {"train_loss": -6.804587364196777, "global_step": 147445, "epoch": 3510} {"train_loss": -6.695174217224121, "global_step": 147446, "epoch": 3510} {"train_loss": -6.834577560424805, "global_step": 147447, "epoch": 3510} {"train_loss": -6.809299468994141, "global_step": 147448, "epoch": 3510} {"train_loss": -6.830634593963623, "global_step": 147449, "epoch": 3510} {"train_loss": -6.807591438293457, "global_step": 147450, "epoch": 3510} {"train_loss": -6.773053169250488, "global_step": 147451, "epoch": 3510} {"train_loss": -6.71943473815918, "global_step": 147452, "epoch": 3510} {"train_loss": -6.6870598793029785, "global_step": 147453, "epoch": 3510} {"train_loss": -6.8053789138793945, "global_step": 147454, "epoch": 3510} {"train_loss": -6.781106948852539, "global_step": 147455, "epoch": 3510} {"train_loss": -6.6854248046875, "global_step": 147456, "epoch": 3510} {"train_loss": -6.732396125793457, "global_step": 147457, "epoch": 3510} {"train_loss": -6.735733509063721, "global_step": 147458, "epoch": 3510} {"train_loss": -6.860066890716553, "global_step": 147459, "epoch": 3510} {"train_loss": -6.7401604652404785, "global_step": 147460, "epoch": 3510} {"train_loss": -6.776433990115211, "global_step": 147461, "epoch": 3510, "val_loss": 68358.0390625} {"train_loss": -6.7716474533081055, "global_step": 147462, "epoch": 3511} {"train_loss": -6.778738975524902, "global_step": 147463, "epoch": 3511} {"train_loss": -6.718757629394531, "global_step": 147464, "epoch": 3511} {"train_loss": -6.769350051879883, "global_step": 147465, "epoch": 3511} {"train_loss": -6.730792045593262, "global_step": 147466, "epoch": 3511} {"train_loss": -6.792472839355469, "global_step": 147467, "epoch": 3511} {"train_loss": -6.7416510581970215, "global_step": 147468, "epoch": 3511} {"train_loss": -6.78430700302124, "global_step": 147469, "epoch": 3511} {"train_loss": -6.821047782897949, "global_step": 147470, "epoch": 3511} {"train_loss": -6.683184623718262, "global_step": 147471, "epoch": 3511} {"train_loss": -6.8085198402404785, "global_step": 147472, "epoch": 3511} {"train_loss": -6.856801986694336, "global_step": 147473, "epoch": 3511} {"train_loss": -6.766596794128418, "global_step": 147474, "epoch": 3511} {"train_loss": -6.8076019287109375, "global_step": 147475, "epoch": 3511} {"train_loss": -6.8093485832214355, "global_step": 147476, "epoch": 3511} {"train_loss": -6.828470706939697, "global_step": 147477, "epoch": 3511} {"train_loss": -6.821387767791748, "global_step": 147478, "epoch": 3511} {"train_loss": -6.837285041809082, "global_step": 147479, "epoch": 3511} {"train_loss": -6.811570167541504, "global_step": 147480, "epoch": 3511} {"train_loss": -6.810840606689453, "global_step": 147481, "epoch": 3511} {"train_loss": -6.844744682312012, "global_step": 147482, "epoch": 3511} {"train_loss": -6.762381076812744, "global_step": 147483, "epoch": 3511} {"train_loss": -6.776206016540527, "global_step": 147484, "epoch": 3511} {"train_loss": -6.639278411865234, "global_step": 147485, "epoch": 3511} {"train_loss": -6.843376159667969, "global_step": 147486, "epoch": 3511} {"train_loss": -6.836946487426758, "global_step": 147487, "epoch": 3511} {"train_loss": -6.751941680908203, "global_step": 147488, "epoch": 3511} {"train_loss": -6.841740608215332, "global_step": 147489, "epoch": 3511} {"train_loss": -6.798462867736816, "global_step": 147490, "epoch": 3511} {"train_loss": -6.813896179199219, "global_step": 147491, "epoch": 3511} {"train_loss": -6.803743362426758, "global_step": 147492, "epoch": 3511} {"train_loss": -6.827160835266113, "global_step": 147493, "epoch": 3511} {"train_loss": -6.879292011260986, "global_step": 147494, "epoch": 3511} {"train_loss": -6.8321685791015625, "global_step": 147495, "epoch": 3511} {"train_loss": -6.881865978240967, "global_step": 147496, "epoch": 3511} {"train_loss": -6.870844841003418, "global_step": 147497, "epoch": 3511} {"train_loss": -6.830706596374512, "global_step": 147498, "epoch": 3511} {"train_loss": -6.759105205535889, "global_step": 147499, "epoch": 3511} {"train_loss": -6.810985565185547, "global_step": 147500, "epoch": 3511} {"train_loss": -6.832404613494873, "global_step": 147501, "epoch": 3511} {"train_loss": -6.7759246826171875, "global_step": 147502, "epoch": 3511} {"train_loss": -6.796758106776646, "global_step": 147503, "epoch": 3511, "val_loss": 68392.609375} {"train_loss": -6.692392349243164, "global_step": 147504, "epoch": 3512} {"train_loss": -6.880794525146484, "global_step": 147505, "epoch": 3512} {"train_loss": -6.87631368637085, "global_step": 147506, "epoch": 3512} {"train_loss": -6.851858139038086, "global_step": 147507, "epoch": 3512} {"train_loss": -6.7733259201049805, "global_step": 147508, "epoch": 3512} {"train_loss": -6.835600852966309, "global_step": 147509, "epoch": 3512} {"train_loss": -6.830273628234863, "global_step": 147510, "epoch": 3512} {"train_loss": -6.798579216003418, "global_step": 147511, "epoch": 3512} {"train_loss": -6.499007225036621, "global_step": 147512, "epoch": 3512} {"train_loss": -6.844032287597656, "global_step": 147513, "epoch": 3512} {"train_loss": -6.875140190124512, "global_step": 147514, "epoch": 3512} {"train_loss": -6.767724990844727, "global_step": 147515, "epoch": 3512} {"train_loss": -6.807645797729492, "global_step": 147516, "epoch": 3512} {"train_loss": -6.756886005401611, "global_step": 147517, "epoch": 3512} {"train_loss": -6.71369743347168, "global_step": 147518, "epoch": 3512} {"train_loss": -6.749933242797852, "global_step": 147519, "epoch": 3512} {"train_loss": -6.765430450439453, "global_step": 147520, "epoch": 3512} {"train_loss": -6.753662109375, "global_step": 147521, "epoch": 3512} {"train_loss": -6.862995147705078, "global_step": 147522, "epoch": 3512} {"train_loss": -6.7540082931518555, "global_step": 147523, "epoch": 3512} {"train_loss": -6.77602481842041, "global_step": 147524, "epoch": 3512} {"train_loss": -6.743597030639648, "global_step": 147525, "epoch": 3512} {"train_loss": -6.8101959228515625, "global_step": 147526, "epoch": 3512} {"train_loss": -6.830376625061035, "global_step": 147527, "epoch": 3512} {"train_loss": -6.695186614990234, "global_step": 147528, "epoch": 3512} {"train_loss": -6.844205379486084, "global_step": 147529, "epoch": 3512} {"train_loss": -6.821389198303223, "global_step": 147530, "epoch": 3512} {"train_loss": -6.76116943359375, "global_step": 147531, "epoch": 3512} {"train_loss": -6.840264320373535, "global_step": 147532, "epoch": 3512} {"train_loss": -6.727954864501953, "global_step": 147533, "epoch": 3512} {"train_loss": -6.8093743324279785, "global_step": 147534, "epoch": 3512} {"train_loss": -6.626644134521484, "global_step": 147535, "epoch": 3512} {"train_loss": -6.842109680175781, "global_step": 147536, "epoch": 3512} {"train_loss": -6.821074485778809, "global_step": 147537, "epoch": 3512} {"train_loss": -6.678511619567871, "global_step": 147538, "epoch": 3512} {"train_loss": -6.867975234985352, "global_step": 147539, "epoch": 3512} {"train_loss": -6.706478118896484, "global_step": 147540, "epoch": 3512} {"train_loss": -6.758914947509766, "global_step": 147541, "epoch": 3512} {"train_loss": -6.7738776206970215, "global_step": 147542, "epoch": 3512} {"train_loss": -6.830897808074951, "global_step": 147543, "epoch": 3512} {"train_loss": -6.696750640869141, "global_step": 147544, "epoch": 3512} {"train_loss": -6.777887537365868, "global_step": 147545, "epoch": 3512, "val_loss": 68345.8046875} {"train_loss": -6.779876708984375, "global_step": 147546, "epoch": 3513} {"train_loss": -6.733562469482422, "global_step": 147547, "epoch": 3513} {"train_loss": -6.823803901672363, "global_step": 147548, "epoch": 3513} {"train_loss": -6.778140068054199, "global_step": 147549, "epoch": 3513} {"train_loss": -6.690587997436523, "global_step": 147550, "epoch": 3513} {"train_loss": -6.757976531982422, "global_step": 147551, "epoch": 3513} {"train_loss": -6.724214553833008, "global_step": 147552, "epoch": 3513} {"train_loss": -6.855108261108398, "global_step": 147553, "epoch": 3513} {"train_loss": -6.745351791381836, "global_step": 147554, "epoch": 3513} {"train_loss": -6.685476303100586, "global_step": 147555, "epoch": 3513} {"train_loss": -6.780104160308838, "global_step": 147556, "epoch": 3513} {"train_loss": -6.626786231994629, "global_step": 147557, "epoch": 3513} {"train_loss": -6.87701940536499, "global_step": 147558, "epoch": 3513} {"train_loss": -6.737753868103027, "global_step": 147559, "epoch": 3513} {"train_loss": -6.820889472961426, "global_step": 147560, "epoch": 3513} {"train_loss": -6.809967041015625, "global_step": 147561, "epoch": 3513} {"train_loss": -6.76791524887085, "global_step": 147562, "epoch": 3513} {"train_loss": -6.750942707061768, "global_step": 147563, "epoch": 3513} {"train_loss": -6.707505226135254, "global_step": 147564, "epoch": 3513} {"train_loss": -6.7703447341918945, "global_step": 147565, "epoch": 3513} {"train_loss": -6.743261814117432, "global_step": 147566, "epoch": 3513} {"train_loss": -6.6102294921875, "global_step": 147567, "epoch": 3513} {"train_loss": -6.9335246086120605, "global_step": 147568, "epoch": 3513} {"train_loss": -6.853440284729004, "global_step": 147569, "epoch": 3513} {"train_loss": -6.757796287536621, "global_step": 147570, "epoch": 3513} {"train_loss": -6.807033538818359, "global_step": 147571, "epoch": 3513} {"train_loss": -6.811798095703125, "global_step": 147572, "epoch": 3513} {"train_loss": -6.751588821411133, "global_step": 147573, "epoch": 3513} {"train_loss": -6.869237899780273, "global_step": 147574, "epoch": 3513} {"train_loss": -6.758687496185303, "global_step": 147575, "epoch": 3513} {"train_loss": -6.846301078796387, "global_step": 147576, "epoch": 3513} {"train_loss": -6.909329891204834, "global_step": 147577, "epoch": 3513} {"train_loss": -6.865808486938477, "global_step": 147578, "epoch": 3513} {"train_loss": -6.819754600524902, "global_step": 147579, "epoch": 3513} {"train_loss": -6.8052473068237305, "global_step": 147580, "epoch": 3513} {"train_loss": -6.784049987792969, "global_step": 147581, "epoch": 3513} {"train_loss": -6.792457580566406, "global_step": 147582, "epoch": 3513} {"train_loss": -6.68858528137207, "global_step": 147583, "epoch": 3513} {"train_loss": -6.76022481918335, "global_step": 147584, "epoch": 3513} {"train_loss": -6.687557220458984, "global_step": 147585, "epoch": 3513} {"train_loss": -6.789144039154053, "global_step": 147586, "epoch": 3513} {"train_loss": -6.777188017254784, "global_step": 147587, "epoch": 3513, "val_loss": 68073.734375} {"train_loss": -6.882752418518066, "global_step": 147588, "epoch": 3514} {"train_loss": -6.745035648345947, "global_step": 147589, "epoch": 3514} {"train_loss": -6.735527992248535, "global_step": 147590, "epoch": 3514} {"train_loss": -6.821606636047363, "global_step": 147591, "epoch": 3514} {"train_loss": -6.837352752685547, "global_step": 147592, "epoch": 3514} {"train_loss": -6.848597526550293, "global_step": 147593, "epoch": 3514} {"train_loss": -6.8223676681518555, "global_step": 147594, "epoch": 3514} {"train_loss": -6.888579845428467, "global_step": 147595, "epoch": 3514} {"train_loss": -6.813223361968994, "global_step": 147596, "epoch": 3514} {"train_loss": -6.886089324951172, "global_step": 147597, "epoch": 3514} {"train_loss": -6.870121002197266, "global_step": 147598, "epoch": 3514} {"train_loss": -6.832535266876221, "global_step": 147599, "epoch": 3514} {"train_loss": -6.866033554077148, "global_step": 147600, "epoch": 3514} {"train_loss": -6.893956184387207, "global_step": 147601, "epoch": 3514} {"train_loss": -6.933743476867676, "global_step": 147602, "epoch": 3514} {"train_loss": -6.841341495513916, "global_step": 147603, "epoch": 3514} {"train_loss": -6.8049821853637695, "global_step": 147604, "epoch": 3514} {"train_loss": -6.8712029457092285, "global_step": 147605, "epoch": 3514} {"train_loss": -6.897710800170898, "global_step": 147606, "epoch": 3514} {"train_loss": -6.846270561218262, "global_step": 147607, "epoch": 3514} {"train_loss": -6.8817572593688965, "global_step": 147608, "epoch": 3514} {"train_loss": -6.813956260681152, "global_step": 147609, "epoch": 3514} {"train_loss": -6.7471795082092285, "global_step": 147610, "epoch": 3514} {"train_loss": -6.822553634643555, "global_step": 147611, "epoch": 3514} {"train_loss": -6.717677116394043, "global_step": 147612, "epoch": 3514} {"train_loss": -6.824576377868652, "global_step": 147613, "epoch": 3514} {"train_loss": -6.754155158996582, "global_step": 147614, "epoch": 3514} {"train_loss": -6.881978988647461, "global_step": 147615, "epoch": 3514} {"train_loss": -6.753589630126953, "global_step": 147616, "epoch": 3514} {"train_loss": -6.720663070678711, "global_step": 147617, "epoch": 3514} {"train_loss": -6.767798900604248, "global_step": 147618, "epoch": 3514} {"train_loss": -6.713144302368164, "global_step": 147619, "epoch": 3514} {"train_loss": -6.781422138214111, "global_step": 147620, "epoch": 3514} {"train_loss": -6.7373247146606445, "global_step": 147621, "epoch": 3514} {"train_loss": -6.711437225341797, "global_step": 147622, "epoch": 3514} {"train_loss": -6.782696723937988, "global_step": 147623, "epoch": 3514} {"train_loss": -6.782011985778809, "global_step": 147624, "epoch": 3514} {"train_loss": -6.903938293457031, "global_step": 147625, "epoch": 3514} {"train_loss": -6.690182685852051, "global_step": 147626, "epoch": 3514} {"train_loss": -6.7098565101623535, "global_step": 147627, "epoch": 3514} {"train_loss": -6.837708473205566, "global_step": 147628, "epoch": 3514} {"train_loss": -6.810632682981945, "global_step": 147629, "epoch": 3514, "val_loss": 68338.4921875} {"train_loss": -6.848691940307617, "global_step": 147630, "epoch": 3515} {"train_loss": -6.911333084106445, "global_step": 147631, "epoch": 3515} {"train_loss": -6.778239727020264, "global_step": 147632, "epoch": 3515} {"train_loss": -6.8700408935546875, "global_step": 147633, "epoch": 3515} {"train_loss": -6.832878589630127, "global_step": 147634, "epoch": 3515} {"train_loss": -6.735337257385254, "global_step": 147635, "epoch": 3515} {"train_loss": -6.766249656677246, "global_step": 147636, "epoch": 3515} {"train_loss": -6.902578353881836, "global_step": 147637, "epoch": 3515} {"train_loss": -6.843082427978516, "global_step": 147638, "epoch": 3515} {"train_loss": -6.840034484863281, "global_step": 147639, "epoch": 3515} {"train_loss": -6.79707145690918, "global_step": 147640, "epoch": 3515} {"train_loss": -6.873791694641113, "global_step": 147641, "epoch": 3515} {"train_loss": -6.844898223876953, "global_step": 147642, "epoch": 3515} {"train_loss": -6.785286903381348, "global_step": 147643, "epoch": 3515} {"train_loss": -6.863578796386719, "global_step": 147644, "epoch": 3515} {"train_loss": -6.786834239959717, "global_step": 147645, "epoch": 3515} {"train_loss": -6.81926155090332, "global_step": 147646, "epoch": 3515} {"train_loss": -6.77227783203125, "global_step": 147647, "epoch": 3515} {"train_loss": -6.762058734893799, "global_step": 147648, "epoch": 3515} {"train_loss": -6.870552062988281, "global_step": 147649, "epoch": 3515} {"train_loss": -6.785292625427246, "global_step": 147650, "epoch": 3515} {"train_loss": -6.837002277374268, "global_step": 147651, "epoch": 3515} {"train_loss": -6.767149448394775, "global_step": 147652, "epoch": 3515} {"train_loss": -6.819356918334961, "global_step": 147653, "epoch": 3515} {"train_loss": -6.83854866027832, "global_step": 147654, "epoch": 3515} {"train_loss": -6.786233901977539, "global_step": 147655, "epoch": 3515} {"train_loss": -6.726225852966309, "global_step": 147656, "epoch": 3515} {"train_loss": -6.614627838134766, "global_step": 147657, "epoch": 3515} {"train_loss": -6.80315637588501, "global_step": 147658, "epoch": 3515} {"train_loss": -6.816431999206543, "global_step": 147659, "epoch": 3515} {"train_loss": -6.741983890533447, "global_step": 147660, "epoch": 3515} {"train_loss": -6.805202960968018, "global_step": 147661, "epoch": 3515} {"train_loss": -6.909657955169678, "global_step": 147662, "epoch": 3515} {"train_loss": -6.894763946533203, "global_step": 147663, "epoch": 3515} {"train_loss": -6.850053787231445, "global_step": 147664, "epoch": 3515} {"train_loss": -6.760598659515381, "global_step": 147665, "epoch": 3515} {"train_loss": -6.761765480041504, "global_step": 147666, "epoch": 3515} {"train_loss": -6.799077033996582, "global_step": 147667, "epoch": 3515} {"train_loss": -6.765658378601074, "global_step": 147668, "epoch": 3515} {"train_loss": -6.680532932281494, "global_step": 147669, "epoch": 3515} {"train_loss": -6.7672119140625, "global_step": 147670, "epoch": 3515} {"train_loss": -6.800304185776484, "global_step": 147671, "epoch": 3515, "val_loss": 68661.0} {"train_loss": -6.539179801940918, "global_step": 147672, "epoch": 3516} {"train_loss": -6.847469329833984, "global_step": 147673, "epoch": 3516} {"train_loss": -6.661315441131592, "global_step": 147674, "epoch": 3516} {"train_loss": -6.756081581115723, "global_step": 147675, "epoch": 3516} {"train_loss": -6.745894432067871, "global_step": 147676, "epoch": 3516} {"train_loss": -6.565472602844238, "global_step": 147677, "epoch": 3516} {"train_loss": -6.712366580963135, "global_step": 147678, "epoch": 3516} {"train_loss": -6.679644584655762, "global_step": 147679, "epoch": 3516} {"train_loss": -6.669454574584961, "global_step": 147680, "epoch": 3516} {"train_loss": -6.69830322265625, "global_step": 147681, "epoch": 3516} {"train_loss": -6.746393203735352, "global_step": 147682, "epoch": 3516} {"train_loss": -6.6232147216796875, "global_step": 147683, "epoch": 3516} {"train_loss": -6.806651592254639, "global_step": 147684, "epoch": 3516} {"train_loss": -6.701971054077148, "global_step": 147685, "epoch": 3516} {"train_loss": -6.806524276733398, "global_step": 147686, "epoch": 3516} {"train_loss": -6.828248023986816, "global_step": 147687, "epoch": 3516} {"train_loss": -6.715150356292725, "global_step": 147688, "epoch": 3516} {"train_loss": -6.727382183074951, "global_step": 147689, "epoch": 3516} {"train_loss": -6.665461540222168, "global_step": 147690, "epoch": 3516} {"train_loss": -6.837161064147949, "global_step": 147691, "epoch": 3516} {"train_loss": -6.786056995391846, "global_step": 147692, "epoch": 3516} {"train_loss": -6.783337116241455, "global_step": 147693, "epoch": 3516} {"train_loss": -6.759183883666992, "global_step": 147694, "epoch": 3516} {"train_loss": -6.720829010009766, "global_step": 147695, "epoch": 3516} {"train_loss": -6.791402816772461, "global_step": 147696, "epoch": 3516} {"train_loss": -6.799009323120117, "global_step": 147697, "epoch": 3516} {"train_loss": -6.773109436035156, "global_step": 147698, "epoch": 3516} {"train_loss": -6.866412162780762, "global_step": 147699, "epoch": 3516} {"train_loss": -6.888306140899658, "global_step": 147700, "epoch": 3516} {"train_loss": -6.677606582641602, "global_step": 147701, "epoch": 3516} {"train_loss": -6.780520915985107, "global_step": 147702, "epoch": 3516} {"train_loss": -6.820867538452148, "global_step": 147703, "epoch": 3516} {"train_loss": -6.813956260681152, "global_step": 147704, "epoch": 3516} {"train_loss": -6.84871768951416, "global_step": 147705, "epoch": 3516} {"train_loss": -6.745560646057129, "global_step": 147706, "epoch": 3516} {"train_loss": -6.822701930999756, "global_step": 147707, "epoch": 3516} {"train_loss": -6.740601539611816, "global_step": 147708, "epoch": 3516} {"train_loss": -6.828121662139893, "global_step": 147709, "epoch": 3516} {"train_loss": -6.872523784637451, "global_step": 147710, "epoch": 3516} {"train_loss": -6.833029747009277, "global_step": 147711, "epoch": 3516} {"train_loss": -6.711674690246582, "global_step": 147712, "epoch": 3516} {"train_loss": -6.75782501129877, "global_step": 147713, "epoch": 3516, "val_loss": 68446.9375} {"train_loss": -6.8398213386535645, "global_step": 147714, "epoch": 3517} {"train_loss": -6.770108222961426, "global_step": 147715, "epoch": 3517} {"train_loss": -6.7615647315979, "global_step": 147716, "epoch": 3517} {"train_loss": -6.816926002502441, "global_step": 147717, "epoch": 3517} {"train_loss": -6.808629989624023, "global_step": 147718, "epoch": 3517} {"train_loss": -6.820182800292969, "global_step": 147719, "epoch": 3517} {"train_loss": -6.897427558898926, "global_step": 147720, "epoch": 3517} {"train_loss": -6.856746673583984, "global_step": 147721, "epoch": 3517} {"train_loss": -6.847695350646973, "global_step": 147722, "epoch": 3517} {"train_loss": -6.836780548095703, "global_step": 147723, "epoch": 3517} {"train_loss": -6.853799819946289, "global_step": 147724, "epoch": 3517} {"train_loss": -6.795169830322266, "global_step": 147725, "epoch": 3517} {"train_loss": -6.830169677734375, "global_step": 147726, "epoch": 3517} {"train_loss": -6.856736183166504, "global_step": 147727, "epoch": 3517} {"train_loss": -6.734747886657715, "global_step": 147728, "epoch": 3517} {"train_loss": -6.828962326049805, "global_step": 147729, "epoch": 3517} {"train_loss": -6.768348693847656, "global_step": 147730, "epoch": 3517} {"train_loss": -6.689067840576172, "global_step": 147731, "epoch": 3517} {"train_loss": -6.579337120056152, "global_step": 147732, "epoch": 3517} {"train_loss": -6.731989860534668, "global_step": 147733, "epoch": 3517} {"train_loss": -6.729496002197266, "global_step": 147734, "epoch": 3517} {"train_loss": -6.765650749206543, "global_step": 147735, "epoch": 3517} {"train_loss": -6.698368549346924, "global_step": 147736, "epoch": 3517} {"train_loss": -6.727057933807373, "global_step": 147737, "epoch": 3517} {"train_loss": -6.79439640045166, "global_step": 147738, "epoch": 3517} {"train_loss": -6.842105865478516, "global_step": 147739, "epoch": 3517} {"train_loss": -6.847447395324707, "global_step": 147740, "epoch": 3517} {"train_loss": -6.733633041381836, "global_step": 147741, "epoch": 3517} {"train_loss": -6.900790214538574, "global_step": 147742, "epoch": 3517} {"train_loss": -6.7670440673828125, "global_step": 147743, "epoch": 3517} {"train_loss": -6.727309226989746, "global_step": 147744, "epoch": 3517} {"train_loss": -6.7308244705200195, "global_step": 147745, "epoch": 3517} {"train_loss": -6.788478851318359, "global_step": 147746, "epoch": 3517} {"train_loss": -6.840785503387451, "global_step": 147747, "epoch": 3517} {"train_loss": -6.774825096130371, "global_step": 147748, "epoch": 3517} {"train_loss": -6.864234924316406, "global_step": 147749, "epoch": 3517} {"train_loss": -6.688657760620117, "global_step": 147750, "epoch": 3517} {"train_loss": -6.81702995300293, "global_step": 147751, "epoch": 3517} {"train_loss": -6.75502872467041, "global_step": 147752, "epoch": 3517} {"train_loss": -6.697141170501709, "global_step": 147753, "epoch": 3517} {"train_loss": -6.794425010681152, "global_step": 147754, "epoch": 3517} {"train_loss": -6.784920431318737, "global_step": 147755, "epoch": 3517, "val_loss": 68360.3359375} {"train_loss": -6.8654584884643555, "global_step": 147756, "epoch": 3518} {"train_loss": -6.846226692199707, "global_step": 147757, "epoch": 3518} {"train_loss": -6.811641693115234, "global_step": 147758, "epoch": 3518} {"train_loss": -6.851290702819824, "global_step": 147759, "epoch": 3518} {"train_loss": -6.856758117675781, "global_step": 147760, "epoch": 3518} {"train_loss": -6.90354585647583, "global_step": 147761, "epoch": 3518} {"train_loss": -6.9186692237854, "global_step": 147762, "epoch": 3518} {"train_loss": -6.768686294555664, "global_step": 147763, "epoch": 3518} {"train_loss": -6.875251770019531, "global_step": 147764, "epoch": 3518} {"train_loss": -6.767545223236084, "global_step": 147765, "epoch": 3518} {"train_loss": -6.842320442199707, "global_step": 147766, "epoch": 3518} {"train_loss": -6.828191757202148, "global_step": 147767, "epoch": 3518} {"train_loss": -6.784489631652832, "global_step": 147768, "epoch": 3518} {"train_loss": -6.778748035430908, "global_step": 147769, "epoch": 3518} {"train_loss": -6.809553146362305, "global_step": 147770, "epoch": 3518} {"train_loss": -6.946314811706543, "global_step": 147771, "epoch": 3518} {"train_loss": -6.663980007171631, "global_step": 147772, "epoch": 3518} {"train_loss": -6.790643215179443, "global_step": 147773, "epoch": 3518} {"train_loss": -6.879166603088379, "global_step": 147774, "epoch": 3518} {"train_loss": -6.901180267333984, "global_step": 147775, "epoch": 3518} {"train_loss": -6.825883865356445, "global_step": 147776, "epoch": 3518} {"train_loss": -6.750948429107666, "global_step": 147777, "epoch": 3518} {"train_loss": -6.7750959396362305, "global_step": 147778, "epoch": 3518} {"train_loss": -6.791169166564941, "global_step": 147779, "epoch": 3518} {"train_loss": -6.798356056213379, "global_step": 147780, "epoch": 3518} {"train_loss": -6.858213424682617, "global_step": 147781, "epoch": 3518} {"train_loss": -6.737402439117432, "global_step": 147782, "epoch": 3518} {"train_loss": -6.807552337646484, "global_step": 147783, "epoch": 3518} {"train_loss": -6.795041084289551, "global_step": 147784, "epoch": 3518} {"train_loss": -6.681436538696289, "global_step": 147785, "epoch": 3518} {"train_loss": -6.905979156494141, "global_step": 147786, "epoch": 3518} {"train_loss": -6.68890380859375, "global_step": 147787, "epoch": 3518} {"train_loss": -6.868206977844238, "global_step": 147788, "epoch": 3518} {"train_loss": -6.766155242919922, "global_step": 147789, "epoch": 3518} {"train_loss": -6.846279144287109, "global_step": 147790, "epoch": 3518} {"train_loss": -6.811236381530762, "global_step": 147791, "epoch": 3518} {"train_loss": -6.771852493286133, "global_step": 147792, "epoch": 3518} {"train_loss": -6.804377555847168, "global_step": 147793, "epoch": 3518} {"train_loss": -6.7905802726745605, "global_step": 147794, "epoch": 3518} {"train_loss": -6.774722099304199, "global_step": 147795, "epoch": 3518} {"train_loss": -6.753011226654053, "global_step": 147796, "epoch": 3518} {"train_loss": -6.810325826917376, "global_step": 147797, "epoch": 3518, "val_loss": 68423.8828125} {"train_loss": -6.797840595245361, "global_step": 147798, "epoch": 3519} {"train_loss": -6.9645819664001465, "global_step": 147799, "epoch": 3519} {"train_loss": -6.66930627822876, "global_step": 147800, "epoch": 3519} {"train_loss": -6.866001605987549, "global_step": 147801, "epoch": 3519} {"train_loss": -6.9115071296691895, "global_step": 147802, "epoch": 3519} {"train_loss": -6.839322090148926, "global_step": 147803, "epoch": 3519} {"train_loss": -6.780614376068115, "global_step": 147804, "epoch": 3519} {"train_loss": -6.856700897216797, "global_step": 147805, "epoch": 3519} {"train_loss": -6.867883682250977, "global_step": 147806, "epoch": 3519} {"train_loss": -6.891277313232422, "global_step": 147807, "epoch": 3519} {"train_loss": -6.835695266723633, "global_step": 147808, "epoch": 3519} {"train_loss": -6.729033470153809, "global_step": 147809, "epoch": 3519} {"train_loss": -6.705765247344971, "global_step": 147810, "epoch": 3519} {"train_loss": -6.775477409362793, "global_step": 147811, "epoch": 3519} {"train_loss": -6.753582954406738, "global_step": 147812, "epoch": 3519} {"train_loss": -6.756922721862793, "global_step": 147813, "epoch": 3519} {"train_loss": -6.765202522277832, "global_step": 147814, "epoch": 3519} {"train_loss": -6.811552047729492, "global_step": 147815, "epoch": 3519} {"train_loss": -6.794585227966309, "global_step": 147816, "epoch": 3519} {"train_loss": -6.71077823638916, "global_step": 147817, "epoch": 3519} {"train_loss": -6.819565773010254, "global_step": 147818, "epoch": 3519} {"train_loss": -6.737865924835205, "global_step": 147819, "epoch": 3519} {"train_loss": -6.805563926696777, "global_step": 147820, "epoch": 3519} {"train_loss": -6.802021503448486, "global_step": 147821, "epoch": 3519} {"train_loss": -6.779541015625, "global_step": 147822, "epoch": 3519} {"train_loss": -6.716065883636475, "global_step": 147823, "epoch": 3519} {"train_loss": -6.923686981201172, "global_step": 147824, "epoch": 3519} {"train_loss": -6.901119232177734, "global_step": 147825, "epoch": 3519} {"train_loss": -6.813051223754883, "global_step": 147826, "epoch": 3519} {"train_loss": -6.7629499435424805, "global_step": 147827, "epoch": 3519} {"train_loss": -6.83270263671875, "global_step": 147828, "epoch": 3519} {"train_loss": -6.726118087768555, "global_step": 147829, "epoch": 3519} {"train_loss": -6.761749267578125, "global_step": 147830, "epoch": 3519} {"train_loss": -6.687037467956543, "global_step": 147831, "epoch": 3519} {"train_loss": -6.858790397644043, "global_step": 147832, "epoch": 3519} {"train_loss": -6.735910415649414, "global_step": 147833, "epoch": 3519} {"train_loss": -6.666478157043457, "global_step": 147834, "epoch": 3519} {"train_loss": -6.8270697593688965, "global_step": 147835, "epoch": 3519} {"train_loss": -6.81005859375, "global_step": 147836, "epoch": 3519} {"train_loss": -6.855201721191406, "global_step": 147837, "epoch": 3519} {"train_loss": -6.8272504806518555, "global_step": 147838, "epoch": 3519} {"train_loss": -6.798183043797811, "global_step": 147839, "epoch": 3519, "val_loss": 68528.2109375} {"train_loss": -6.851529598236084, "global_step": 147840, "epoch": 3520} {"train_loss": -6.815176963806152, "global_step": 147841, "epoch": 3520} {"train_loss": -6.8796868324279785, "global_step": 147842, "epoch": 3520} {"train_loss": -6.873318672180176, "global_step": 147843, "epoch": 3520} {"train_loss": -6.869025230407715, "global_step": 147844, "epoch": 3520} {"train_loss": -6.79055118560791, "global_step": 147845, "epoch": 3520} {"train_loss": -6.765413284301758, "global_step": 147846, "epoch": 3520} {"train_loss": -6.825530529022217, "global_step": 147847, "epoch": 3520} {"train_loss": -6.78089714050293, "global_step": 147848, "epoch": 3520} {"train_loss": -6.713670253753662, "global_step": 147849, "epoch": 3520} {"train_loss": -6.612117767333984, "global_step": 147850, "epoch": 3520} {"train_loss": -6.512009620666504, "global_step": 147851, "epoch": 3520} {"train_loss": -6.80426025390625, "global_step": 147852, "epoch": 3520} {"train_loss": -6.745625972747803, "global_step": 147853, "epoch": 3520} {"train_loss": -6.651640892028809, "global_step": 147854, "epoch": 3520} {"train_loss": -6.77291202545166, "global_step": 147855, "epoch": 3520} {"train_loss": -6.648409366607666, "global_step": 147856, "epoch": 3520} {"train_loss": -6.705533027648926, "global_step": 147857, "epoch": 3520} {"train_loss": -6.831794738769531, "global_step": 147858, "epoch": 3520} {"train_loss": -6.690436840057373, "global_step": 147859, "epoch": 3520} {"train_loss": -6.750733375549316, "global_step": 147860, "epoch": 3520} {"train_loss": -6.764225959777832, "global_step": 147861, "epoch": 3520} {"train_loss": -6.634426116943359, "global_step": 147862, "epoch": 3520} {"train_loss": -6.71164608001709, "global_step": 147863, "epoch": 3520} {"train_loss": -6.800511360168457, "global_step": 147864, "epoch": 3520} {"train_loss": -6.694612503051758, "global_step": 147865, "epoch": 3520} {"train_loss": -6.735622406005859, "global_step": 147866, "epoch": 3520} {"train_loss": -6.7885541915893555, "global_step": 147867, "epoch": 3520} {"train_loss": -6.817482948303223, "global_step": 147868, "epoch": 3520} {"train_loss": -6.787807464599609, "global_step": 147869, "epoch": 3520} {"train_loss": -6.796356678009033, "global_step": 147870, "epoch": 3520} {"train_loss": -6.751991271972656, "global_step": 147871, "epoch": 3520} {"train_loss": -6.835879802703857, "global_step": 147872, "epoch": 3520} {"train_loss": -6.76064395904541, "global_step": 147873, "epoch": 3520} {"train_loss": -6.7607574462890625, "global_step": 147874, "epoch": 3520} {"train_loss": -6.867033004760742, "global_step": 147875, "epoch": 3520} {"train_loss": -6.8619489669799805, "global_step": 147876, "epoch": 3520} {"train_loss": -6.782576084136963, "global_step": 147877, "epoch": 3520} {"train_loss": -6.805967330932617, "global_step": 147878, "epoch": 3520} {"train_loss": -6.773524284362793, "global_step": 147879, "epoch": 3520} {"train_loss": -6.728756904602051, "global_step": 147880, "epoch": 3520} {"train_loss": -6.763792855398996, "global_step": 147881, "epoch": 3520, "val_loss": 68481.8671875} {"train_loss": -6.900219440460205, "global_step": 147882, "epoch": 3521} {"train_loss": -6.844682693481445, "global_step": 147883, "epoch": 3521} {"train_loss": -6.866046905517578, "global_step": 147884, "epoch": 3521} {"train_loss": -6.797573089599609, "global_step": 147885, "epoch": 3521} {"train_loss": -6.8506903648376465, "global_step": 147886, "epoch": 3521} {"train_loss": -6.893082141876221, "global_step": 147887, "epoch": 3521} {"train_loss": -6.8306498527526855, "global_step": 147888, "epoch": 3521} {"train_loss": -6.904794692993164, "global_step": 147889, "epoch": 3521} {"train_loss": -6.939671039581299, "global_step": 147890, "epoch": 3521} {"train_loss": -6.799319267272949, "global_step": 147891, "epoch": 3521} {"train_loss": -6.890471458435059, "global_step": 147892, "epoch": 3521} {"train_loss": -6.880478858947754, "global_step": 147893, "epoch": 3521} {"train_loss": -6.883344650268555, "global_step": 147894, "epoch": 3521} {"train_loss": -6.800808906555176, "global_step": 147895, "epoch": 3521} {"train_loss": -6.748501777648926, "global_step": 147896, "epoch": 3521} {"train_loss": -6.859231948852539, "global_step": 147897, "epoch": 3521} {"train_loss": -6.736049652099609, "global_step": 147898, "epoch": 3521} {"train_loss": -6.816040992736816, "global_step": 147899, "epoch": 3521} {"train_loss": -6.726153373718262, "global_step": 147900, "epoch": 3521} {"train_loss": -6.782900810241699, "global_step": 147901, "epoch": 3521} {"train_loss": -6.811453819274902, "global_step": 147902, "epoch": 3521} {"train_loss": -6.814572334289551, "global_step": 147903, "epoch": 3521} {"train_loss": -6.87543249130249, "global_step": 147904, "epoch": 3521} {"train_loss": -6.823331356048584, "global_step": 147905, "epoch": 3521} {"train_loss": -6.794747352600098, "global_step": 147906, "epoch": 3521} {"train_loss": -6.819910526275635, "global_step": 147907, "epoch": 3521} {"train_loss": -6.840086936950684, "global_step": 147908, "epoch": 3521} {"train_loss": -6.88718318939209, "global_step": 147909, "epoch": 3521} {"train_loss": -6.964707374572754, "global_step": 147910, "epoch": 3521} {"train_loss": -6.800485134124756, "global_step": 147911, "epoch": 3521} {"train_loss": -6.921295642852783, "global_step": 147912, "epoch": 3521} {"train_loss": -6.841163635253906, "global_step": 147913, "epoch": 3521} {"train_loss": -6.8303985595703125, "global_step": 147914, "epoch": 3521} {"train_loss": -6.870290756225586, "global_step": 147915, "epoch": 3521} {"train_loss": -6.802539348602295, "global_step": 147916, "epoch": 3521} {"train_loss": -6.854885101318359, "global_step": 147917, "epoch": 3521} {"train_loss": -6.811888217926025, "global_step": 147918, "epoch": 3521} {"train_loss": -6.846590518951416, "global_step": 147919, "epoch": 3521} {"train_loss": -6.770799160003662, "global_step": 147920, "epoch": 3521} {"train_loss": -6.823962688446045, "global_step": 147921, "epoch": 3521} {"train_loss": -6.779364585876465, "global_step": 147922, "epoch": 3521} {"train_loss": -6.836385068439302, "global_step": 147923, "epoch": 3521, "val_loss": 68386.5625} {"train_loss": -6.770243167877197, "global_step": 147924, "epoch": 3522} {"train_loss": -6.809896945953369, "global_step": 147925, "epoch": 3522} {"train_loss": -6.706925392150879, "global_step": 147926, "epoch": 3522} {"train_loss": -6.724933624267578, "global_step": 147927, "epoch": 3522} {"train_loss": -6.831420421600342, "global_step": 147928, "epoch": 3522} {"train_loss": -6.760555267333984, "global_step": 147929, "epoch": 3522} {"train_loss": -6.7975664138793945, "global_step": 147930, "epoch": 3522} {"train_loss": -6.7020392417907715, "global_step": 147931, "epoch": 3522} {"train_loss": -6.816566467285156, "global_step": 147932, "epoch": 3522} {"train_loss": -6.755340099334717, "global_step": 147933, "epoch": 3522} {"train_loss": -6.790210247039795, "global_step": 147934, "epoch": 3522} {"train_loss": -6.763036251068115, "global_step": 147935, "epoch": 3522} {"train_loss": -6.877309799194336, "global_step": 147936, "epoch": 3522} {"train_loss": -6.740912437438965, "global_step": 147937, "epoch": 3522} {"train_loss": -6.769347667694092, "global_step": 147938, "epoch": 3522} {"train_loss": -6.817073822021484, "global_step": 147939, "epoch": 3522} {"train_loss": -6.927950382232666, "global_step": 147940, "epoch": 3522} {"train_loss": -6.872126579284668, "global_step": 147941, "epoch": 3522} {"train_loss": -6.746188163757324, "global_step": 147942, "epoch": 3522} {"train_loss": -6.868470668792725, "global_step": 147943, "epoch": 3522} {"train_loss": -6.823958396911621, "global_step": 147944, "epoch": 3522} {"train_loss": -6.852919578552246, "global_step": 147945, "epoch": 3522} {"train_loss": -6.756504058837891, "global_step": 147946, "epoch": 3522} {"train_loss": -6.882809638977051, "global_step": 147947, "epoch": 3522} {"train_loss": -6.783239364624023, "global_step": 147948, "epoch": 3522} {"train_loss": -6.740630149841309, "global_step": 147949, "epoch": 3522} {"train_loss": -6.78848123550415, "global_step": 147950, "epoch": 3522} {"train_loss": -6.696933746337891, "global_step": 147951, "epoch": 3522} {"train_loss": -6.769144535064697, "global_step": 147952, "epoch": 3522} {"train_loss": -6.718235015869141, "global_step": 147953, "epoch": 3522} {"train_loss": -6.746715545654297, "global_step": 147954, "epoch": 3522} {"train_loss": -6.835548400878906, "global_step": 147955, "epoch": 3522} {"train_loss": -6.7017974853515625, "global_step": 147956, "epoch": 3522} {"train_loss": -6.687948703765869, "global_step": 147957, "epoch": 3522} {"train_loss": -6.6602606773376465, "global_step": 147958, "epoch": 3522} {"train_loss": -6.638521194458008, "global_step": 147959, "epoch": 3522} {"train_loss": -6.7436699867248535, "global_step": 147960, "epoch": 3522} {"train_loss": -6.674310207366943, "global_step": 147961, "epoch": 3522} {"train_loss": -6.810596466064453, "global_step": 147962, "epoch": 3522} {"train_loss": -6.716543197631836, "global_step": 147963, "epoch": 3522} {"train_loss": -6.609193801879883, "global_step": 147964, "epoch": 3522} {"train_loss": -6.765893266314552, "global_step": 147965, "epoch": 3522, "val_loss": 68329.9609375} {"train_loss": -6.678499698638916, "global_step": 147966, "epoch": 3523} {"train_loss": -6.787035942077637, "global_step": 147967, "epoch": 3523} {"train_loss": -6.797276020050049, "global_step": 147968, "epoch": 3523} {"train_loss": -6.784113883972168, "global_step": 147969, "epoch": 3523} {"train_loss": -6.949342727661133, "global_step": 147970, "epoch": 3523} {"train_loss": -6.786572456359863, "global_step": 147971, "epoch": 3523} {"train_loss": -6.811185359954834, "global_step": 147972, "epoch": 3523} {"train_loss": -6.756765365600586, "global_step": 147973, "epoch": 3523} {"train_loss": -6.740968704223633, "global_step": 147974, "epoch": 3523} {"train_loss": -6.738883018493652, "global_step": 147975, "epoch": 3523} {"train_loss": -6.82054328918457, "global_step": 147976, "epoch": 3523} {"train_loss": -6.8683576583862305, "global_step": 147977, "epoch": 3523} {"train_loss": -6.687872886657715, "global_step": 147978, "epoch": 3523} {"train_loss": -6.853239059448242, "global_step": 147979, "epoch": 3523} {"train_loss": -6.7902936935424805, "global_step": 147980, "epoch": 3523} {"train_loss": -6.685157299041748, "global_step": 147981, "epoch": 3523} {"train_loss": -6.762421131134033, "global_step": 147982, "epoch": 3523} {"train_loss": -6.688920974731445, "global_step": 147983, "epoch": 3523} {"train_loss": -6.808019638061523, "global_step": 147984, "epoch": 3523} {"train_loss": -6.688518524169922, "global_step": 147985, "epoch": 3523} {"train_loss": -6.676623344421387, "global_step": 147986, "epoch": 3523} {"train_loss": -6.706512928009033, "global_step": 147987, "epoch": 3523} {"train_loss": -6.715956687927246, "global_step": 147988, "epoch": 3523} {"train_loss": -6.785140514373779, "global_step": 147989, "epoch": 3523} {"train_loss": -6.823846340179443, "global_step": 147990, "epoch": 3523} {"train_loss": -6.72749137878418, "global_step": 147991, "epoch": 3523} {"train_loss": -6.901500701904297, "global_step": 147992, "epoch": 3523} {"train_loss": -6.577075481414795, "global_step": 147993, "epoch": 3523} {"train_loss": -6.692553520202637, "global_step": 147994, "epoch": 3523} {"train_loss": -6.5941619873046875, "global_step": 147995, "epoch": 3523} {"train_loss": -6.697458267211914, "global_step": 147996, "epoch": 3523} {"train_loss": -6.905672073364258, "global_step": 147997, "epoch": 3523} {"train_loss": -6.8105621337890625, "global_step": 147998, "epoch": 3523} {"train_loss": -6.677565574645996, "global_step": 147999, "epoch": 3523} {"train_loss": -6.645787715911865, "global_step": 148000, "epoch": 3523} {"train_loss": -6.707391738891602, "global_step": 148001, "epoch": 3523} {"train_loss": -6.66502571105957, "global_step": 148002, "epoch": 3523} {"train_loss": -6.789799690246582, "global_step": 148003, "epoch": 3523} {"train_loss": -6.639044284820557, "global_step": 148004, "epoch": 3523} {"train_loss": -6.64096736907959, "global_step": 148005, "epoch": 3523} {"train_loss": -6.797142028808594, "global_step": 148006, "epoch": 3523} {"train_loss": -6.7467407158442905, "global_step": 148007, "epoch": 3523, "val_loss": 68472.03125} {"train_loss": -6.75801944732666, "global_step": 148008, "epoch": 3524} {"train_loss": -6.730129718780518, "global_step": 148009, "epoch": 3524} {"train_loss": -6.851161479949951, "global_step": 148010, "epoch": 3524} {"train_loss": -6.690354824066162, "global_step": 148011, "epoch": 3524} {"train_loss": -6.653630256652832, "global_step": 148012, "epoch": 3524} {"train_loss": -6.807677268981934, "global_step": 148013, "epoch": 3524} {"train_loss": -6.777594566345215, "global_step": 148014, "epoch": 3524} {"train_loss": -6.789828300476074, "global_step": 148015, "epoch": 3524} {"train_loss": -6.911975860595703, "global_step": 148016, "epoch": 3524} {"train_loss": -6.733292579650879, "global_step": 148017, "epoch": 3524} {"train_loss": -6.749096870422363, "global_step": 148018, "epoch": 3524} {"train_loss": -6.813791275024414, "global_step": 148019, "epoch": 3524} {"train_loss": -6.859580039978027, "global_step": 148020, "epoch": 3524} {"train_loss": -6.805376052856445, "global_step": 148021, "epoch": 3524} {"train_loss": -6.830369472503662, "global_step": 148022, "epoch": 3524} {"train_loss": -6.750540733337402, "global_step": 148023, "epoch": 3524} {"train_loss": -6.811736106872559, "global_step": 148024, "epoch": 3524} {"train_loss": -6.854964256286621, "global_step": 148025, "epoch": 3524} {"train_loss": -6.847787857055664, "global_step": 148026, "epoch": 3524} {"train_loss": -6.742425918579102, "global_step": 148027, "epoch": 3524} {"train_loss": -6.733429908752441, "global_step": 148028, "epoch": 3524} {"train_loss": -6.75704288482666, "global_step": 148029, "epoch": 3524} {"train_loss": -6.782990455627441, "global_step": 148030, "epoch": 3524} {"train_loss": -6.847177028656006, "global_step": 148031, "epoch": 3524} {"train_loss": -6.88850212097168, "global_step": 148032, "epoch": 3524} {"train_loss": -6.752823352813721, "global_step": 148033, "epoch": 3524} {"train_loss": -6.7999067306518555, "global_step": 148034, "epoch": 3524} {"train_loss": -6.8166093826293945, "global_step": 148035, "epoch": 3524} {"train_loss": -6.811997890472412, "global_step": 148036, "epoch": 3524} {"train_loss": -6.838491916656494, "global_step": 148037, "epoch": 3524} {"train_loss": -6.7620439529418945, "global_step": 148038, "epoch": 3524} {"train_loss": -6.798861026763916, "global_step": 148039, "epoch": 3524} {"train_loss": -6.919032096862793, "global_step": 148040, "epoch": 3524} {"train_loss": -6.928045749664307, "global_step": 148041, "epoch": 3524} {"train_loss": -6.750998497009277, "global_step": 148042, "epoch": 3524} {"train_loss": -6.786840438842773, "global_step": 148043, "epoch": 3524} {"train_loss": -6.859038829803467, "global_step": 148044, "epoch": 3524} {"train_loss": -6.7701029777526855, "global_step": 148045, "epoch": 3524} {"train_loss": -6.914423942565918, "global_step": 148046, "epoch": 3524} {"train_loss": -6.8276801109313965, "global_step": 148047, "epoch": 3524} {"train_loss": -6.829037666320801, "global_step": 148048, "epoch": 3524} {"train_loss": -6.803549096697853, "global_step": 148049, "epoch": 3524, "val_loss": 68343.7734375} {"train_loss": -6.927130222320557, "global_step": 148050, "epoch": 3525} {"train_loss": -6.810365676879883, "global_step": 148051, "epoch": 3525} {"train_loss": -6.766979694366455, "global_step": 148052, "epoch": 3525} {"train_loss": -6.843451976776123, "global_step": 148053, "epoch": 3525} {"train_loss": -6.881024360656738, "global_step": 148054, "epoch": 3525} {"train_loss": -6.75875186920166, "global_step": 148055, "epoch": 3525} {"train_loss": -6.804529190063477, "global_step": 148056, "epoch": 3525} {"train_loss": -6.798433303833008, "global_step": 148057, "epoch": 3525} {"train_loss": -6.7336931228637695, "global_step": 148058, "epoch": 3525} {"train_loss": -6.920804023742676, "global_step": 148059, "epoch": 3525} {"train_loss": -6.706695079803467, "global_step": 148060, "epoch": 3525} {"train_loss": -6.716358184814453, "global_step": 148061, "epoch": 3525} {"train_loss": -6.806215286254883, "global_step": 148062, "epoch": 3525} {"train_loss": -6.669268608093262, "global_step": 148063, "epoch": 3525} {"train_loss": -6.731254577636719, "global_step": 148064, "epoch": 3525} {"train_loss": -6.7716064453125, "global_step": 148065, "epoch": 3525} {"train_loss": -6.7254228591918945, "global_step": 148066, "epoch": 3525} {"train_loss": -6.841941833496094, "global_step": 148067, "epoch": 3525} {"train_loss": -6.804354667663574, "global_step": 148068, "epoch": 3525} {"train_loss": -6.701714515686035, "global_step": 148069, "epoch": 3525} {"train_loss": -6.787535667419434, "global_step": 148070, "epoch": 3525} {"train_loss": -6.754952430725098, "global_step": 148071, "epoch": 3525} {"train_loss": -6.8166680335998535, "global_step": 148072, "epoch": 3525} {"train_loss": -6.62173318862915, "global_step": 148073, "epoch": 3525} {"train_loss": -6.822114944458008, "global_step": 148074, "epoch": 3525} {"train_loss": -6.707974433898926, "global_step": 148075, "epoch": 3525} {"train_loss": -6.791816234588623, "global_step": 148076, "epoch": 3525} {"train_loss": -6.850837707519531, "global_step": 148077, "epoch": 3525} {"train_loss": -6.705318450927734, "global_step": 148078, "epoch": 3525} {"train_loss": -6.710451602935791, "global_step": 148079, "epoch": 3525} {"train_loss": -6.682602882385254, "global_step": 148080, "epoch": 3525} {"train_loss": -6.8135905265808105, "global_step": 148081, "epoch": 3525} {"train_loss": -6.7264838218688965, "global_step": 148082, "epoch": 3525} {"train_loss": -6.6787004470825195, "global_step": 148083, "epoch": 3525} {"train_loss": -6.820691108703613, "global_step": 148084, "epoch": 3525} {"train_loss": -6.75926399230957, "global_step": 148085, "epoch": 3525} {"train_loss": -6.664236068725586, "global_step": 148086, "epoch": 3525} {"train_loss": -6.794927597045898, "global_step": 148087, "epoch": 3525} {"train_loss": -6.700277805328369, "global_step": 148088, "epoch": 3525} {"train_loss": -6.809505462646484, "global_step": 148089, "epoch": 3525} {"train_loss": -6.80023193359375, "global_step": 148090, "epoch": 3525} {"train_loss": -6.768657900038219, "global_step": 148091, "epoch": 3525, "val_loss": 68299.9140625} {"train_loss": -6.667713165283203, "global_step": 148092, "epoch": 3526} {"train_loss": -6.68251371383667, "global_step": 148093, "epoch": 3526} {"train_loss": -6.722541809082031, "global_step": 148094, "epoch": 3526} {"train_loss": -6.700444221496582, "global_step": 148095, "epoch": 3526} {"train_loss": -6.67092227935791, "global_step": 148096, "epoch": 3526} {"train_loss": -6.728771209716797, "global_step": 148097, "epoch": 3526} {"train_loss": -6.736299514770508, "global_step": 148098, "epoch": 3526} {"train_loss": -6.817868232727051, "global_step": 148099, "epoch": 3526} {"train_loss": -6.721710681915283, "global_step": 148100, "epoch": 3526} {"train_loss": -6.753126621246338, "global_step": 148101, "epoch": 3526} {"train_loss": -6.802783966064453, "global_step": 148102, "epoch": 3526} {"train_loss": -6.795200347900391, "global_step": 148103, "epoch": 3526} {"train_loss": -6.7761640548706055, "global_step": 148104, "epoch": 3526} {"train_loss": -6.812045097351074, "global_step": 148105, "epoch": 3526} {"train_loss": -6.743354797363281, "global_step": 148106, "epoch": 3526} {"train_loss": -6.726056098937988, "global_step": 148107, "epoch": 3526} {"train_loss": -6.825397491455078, "global_step": 148108, "epoch": 3526} {"train_loss": -6.83592414855957, "global_step": 148109, "epoch": 3526} {"train_loss": -6.659824848175049, "global_step": 148110, "epoch": 3526} {"train_loss": -6.844000816345215, "global_step": 148111, "epoch": 3526} {"train_loss": -6.948287487030029, "global_step": 148112, "epoch": 3526} {"train_loss": -6.810162544250488, "global_step": 148113, "epoch": 3526} {"train_loss": -6.877390384674072, "global_step": 148114, "epoch": 3526} {"train_loss": -6.819477081298828, "global_step": 148115, "epoch": 3526} {"train_loss": -6.744791507720947, "global_step": 148116, "epoch": 3526} {"train_loss": -6.891969203948975, "global_step": 148117, "epoch": 3526} {"train_loss": -6.944925308227539, "global_step": 148118, "epoch": 3526} {"train_loss": -6.839984893798828, "global_step": 148119, "epoch": 3526} {"train_loss": -6.779623031616211, "global_step": 148120, "epoch": 3526} {"train_loss": -6.820030689239502, "global_step": 148121, "epoch": 3526} {"train_loss": -6.735294342041016, "global_step": 148122, "epoch": 3526} {"train_loss": -6.7904276847839355, "global_step": 148123, "epoch": 3526} {"train_loss": -6.7254958152771, "global_step": 148124, "epoch": 3526} {"train_loss": -6.739712238311768, "global_step": 148125, "epoch": 3526} {"train_loss": -6.801416873931885, "global_step": 148126, "epoch": 3526} {"train_loss": -6.691099166870117, "global_step": 148127, "epoch": 3526} {"train_loss": -6.790227890014648, "global_step": 148128, "epoch": 3526} {"train_loss": -6.752366065979004, "global_step": 148129, "epoch": 3526} {"train_loss": -6.666818618774414, "global_step": 148130, "epoch": 3526} {"train_loss": -6.871579647064209, "global_step": 148131, "epoch": 3526} {"train_loss": -6.840548515319824, "global_step": 148132, "epoch": 3526} {"train_loss": -6.780157509304228, "global_step": 148133, "epoch": 3526, "val_loss": 68353.390625} {"train_loss": -6.697800636291504, "global_step": 148134, "epoch": 3527} {"train_loss": -6.812778472900391, "global_step": 148135, "epoch": 3527} {"train_loss": -6.784971714019775, "global_step": 148136, "epoch": 3527} {"train_loss": -6.714200973510742, "global_step": 148137, "epoch": 3527} {"train_loss": -6.800636291503906, "global_step": 148138, "epoch": 3527} {"train_loss": -6.830211639404297, "global_step": 148139, "epoch": 3527} {"train_loss": -6.7797698974609375, "global_step": 148140, "epoch": 3527} {"train_loss": -6.794788360595703, "global_step": 148141, "epoch": 3527} {"train_loss": -6.802525520324707, "global_step": 148142, "epoch": 3527} {"train_loss": -6.914459228515625, "global_step": 148143, "epoch": 3527} {"train_loss": -6.814231872558594, "global_step": 148144, "epoch": 3527} {"train_loss": -6.892148971557617, "global_step": 148145, "epoch": 3527} {"train_loss": -6.940962314605713, "global_step": 148146, "epoch": 3527} {"train_loss": -6.805690765380859, "global_step": 148147, "epoch": 3527} {"train_loss": -6.839519023895264, "global_step": 148148, "epoch": 3527} {"train_loss": -6.762561321258545, "global_step": 148149, "epoch": 3527} {"train_loss": -6.894583225250244, "global_step": 148150, "epoch": 3527} {"train_loss": -6.811323165893555, "global_step": 148151, "epoch": 3527} {"train_loss": -6.86110782623291, "global_step": 148152, "epoch": 3527} {"train_loss": -6.760509967803955, "global_step": 148153, "epoch": 3527} {"train_loss": -6.862435817718506, "global_step": 148154, "epoch": 3527} {"train_loss": -6.8455705642700195, "global_step": 148155, "epoch": 3527} {"train_loss": -6.835630893707275, "global_step": 148156, "epoch": 3527} {"train_loss": -6.96260404586792, "global_step": 148157, "epoch": 3527} {"train_loss": -6.794206142425537, "global_step": 148158, "epoch": 3527} {"train_loss": -6.875598907470703, "global_step": 148159, "epoch": 3527} {"train_loss": -6.841372013092041, "global_step": 148160, "epoch": 3527} {"train_loss": -6.821640968322754, "global_step": 148161, "epoch": 3527} {"train_loss": -6.834839344024658, "global_step": 148162, "epoch": 3527} {"train_loss": -6.863581657409668, "global_step": 148163, "epoch": 3527} {"train_loss": -6.766556739807129, "global_step": 148164, "epoch": 3527} {"train_loss": -6.856337547302246, "global_step": 148165, "epoch": 3527} {"train_loss": -6.850711345672607, "global_step": 148166, "epoch": 3527} {"train_loss": -6.903693199157715, "global_step": 148167, "epoch": 3527} {"train_loss": -6.869871139526367, "global_step": 148168, "epoch": 3527} {"train_loss": -6.888810634613037, "global_step": 148169, "epoch": 3527} {"train_loss": -6.8395795822143555, "global_step": 148170, "epoch": 3527} {"train_loss": -6.725594997406006, "global_step": 148171, "epoch": 3527} {"train_loss": -6.7834858894348145, "global_step": 148172, "epoch": 3527} {"train_loss": -6.952629089355469, "global_step": 148173, "epoch": 3527} {"train_loss": -6.871608734130859, "global_step": 148174, "epoch": 3527} {"train_loss": -6.833965539932251, "global_step": 148175, "epoch": 3527, "val_loss": 68488.0390625} {"train_loss": -6.84920597076416, "global_step": 148176, "epoch": 3528} {"train_loss": -6.856995105743408, "global_step": 148177, "epoch": 3528} {"train_loss": -6.909725666046143, "global_step": 148178, "epoch": 3528} {"train_loss": -6.952780246734619, "global_step": 148179, "epoch": 3528} {"train_loss": -6.861454010009766, "global_step": 148180, "epoch": 3528} {"train_loss": -6.854979515075684, "global_step": 148181, "epoch": 3528} {"train_loss": -6.859825134277344, "global_step": 148182, "epoch": 3528} {"train_loss": -6.755041122436523, "global_step": 148183, "epoch": 3528} {"train_loss": -6.832096099853516, "global_step": 148184, "epoch": 3528} {"train_loss": -6.884410858154297, "global_step": 148185, "epoch": 3528} {"train_loss": -6.815889835357666, "global_step": 148186, "epoch": 3528} {"train_loss": -6.871394157409668, "global_step": 148187, "epoch": 3528} {"train_loss": -6.80692195892334, "global_step": 148188, "epoch": 3528} {"train_loss": -6.797292709350586, "global_step": 148189, "epoch": 3528} {"train_loss": -6.709062576293945, "global_step": 148190, "epoch": 3528} {"train_loss": -6.844699859619141, "global_step": 148191, "epoch": 3528} {"train_loss": -6.7276387214660645, "global_step": 148192, "epoch": 3528} {"train_loss": -6.675624370574951, "global_step": 148193, "epoch": 3528} {"train_loss": -6.844096660614014, "global_step": 148194, "epoch": 3528} {"train_loss": -6.645855903625488, "global_step": 148195, "epoch": 3528} {"train_loss": -6.7903032302856445, "global_step": 148196, "epoch": 3528} {"train_loss": -6.7405805587768555, "global_step": 148197, "epoch": 3528} {"train_loss": -6.723611831665039, "global_step": 148198, "epoch": 3528} {"train_loss": -6.744948387145996, "global_step": 148199, "epoch": 3528} {"train_loss": -6.703299045562744, "global_step": 148200, "epoch": 3528} {"train_loss": -6.748958587646484, "global_step": 148201, "epoch": 3528} {"train_loss": -6.653554916381836, "global_step": 148202, "epoch": 3528} {"train_loss": -6.763365745544434, "global_step": 148203, "epoch": 3528} {"train_loss": -6.856503486633301, "global_step": 148204, "epoch": 3528} {"train_loss": -6.653531551361084, "global_step": 148205, "epoch": 3528} {"train_loss": -6.7959442138671875, "global_step": 148206, "epoch": 3528} {"train_loss": -6.70065450668335, "global_step": 148207, "epoch": 3528} {"train_loss": -6.725823402404785, "global_step": 148208, "epoch": 3528} {"train_loss": -6.704856872558594, "global_step": 148209, "epoch": 3528} {"train_loss": -6.733541488647461, "global_step": 148210, "epoch": 3528} {"train_loss": -6.732964038848877, "global_step": 148211, "epoch": 3528} {"train_loss": -6.639051914215088, "global_step": 148212, "epoch": 3528} {"train_loss": -6.693596839904785, "global_step": 148213, "epoch": 3528} {"train_loss": -6.826972961425781, "global_step": 148214, "epoch": 3528} {"train_loss": -6.710781097412109, "global_step": 148215, "epoch": 3528} {"train_loss": -6.706882953643799, "global_step": 148216, "epoch": 3528} {"train_loss": -6.7734552792140414, "global_step": 148217, "epoch": 3528, "val_loss": 68327.71875} {"train_loss": -6.742424011230469, "global_step": 148218, "epoch": 3529} {"train_loss": -6.745166778564453, "global_step": 148219, "epoch": 3529} {"train_loss": -6.8485565185546875, "global_step": 148220, "epoch": 3529} {"train_loss": -6.69754695892334, "global_step": 148221, "epoch": 3529} {"train_loss": -6.734992504119873, "global_step": 148222, "epoch": 3529} {"train_loss": -6.62335729598999, "global_step": 148223, "epoch": 3529} {"train_loss": -6.735272407531738, "global_step": 148224, "epoch": 3529} {"train_loss": -6.693770408630371, "global_step": 148225, "epoch": 3529} {"train_loss": -6.587157249450684, "global_step": 148226, "epoch": 3529} {"train_loss": -6.823043346405029, "global_step": 148227, "epoch": 3529} {"train_loss": -6.630687236785889, "global_step": 148228, "epoch": 3529} {"train_loss": -6.700100898742676, "global_step": 148229, "epoch": 3529} {"train_loss": -6.613243103027344, "global_step": 148230, "epoch": 3529} {"train_loss": -6.703564167022705, "global_step": 148231, "epoch": 3529} {"train_loss": -6.751189708709717, "global_step": 148232, "epoch": 3529} {"train_loss": -6.683542251586914, "global_step": 148233, "epoch": 3529} {"train_loss": -6.6531829833984375, "global_step": 148234, "epoch": 3529} {"train_loss": -6.712970733642578, "global_step": 148235, "epoch": 3529} {"train_loss": -6.517244815826416, "global_step": 148236, "epoch": 3529} {"train_loss": -6.679668426513672, "global_step": 148237, "epoch": 3529} {"train_loss": -6.683170318603516, "global_step": 148238, "epoch": 3529} {"train_loss": -6.651435375213623, "global_step": 148239, "epoch": 3529} {"train_loss": -6.637637138366699, "global_step": 148240, "epoch": 3529} {"train_loss": -6.587084770202637, "global_step": 148241, "epoch": 3529} {"train_loss": -6.6635541915893555, "global_step": 148242, "epoch": 3529} {"train_loss": -6.699464797973633, "global_step": 148243, "epoch": 3529} {"train_loss": -6.758808612823486, "global_step": 148244, "epoch": 3529} {"train_loss": -6.506135940551758, "global_step": 148245, "epoch": 3529} {"train_loss": -6.705777168273926, "global_step": 148246, "epoch": 3529} {"train_loss": -6.706008434295654, "global_step": 148247, "epoch": 3529} {"train_loss": -6.797360420227051, "global_step": 148248, "epoch": 3529} {"train_loss": -6.713220596313477, "global_step": 148249, "epoch": 3529} {"train_loss": -6.753695011138916, "global_step": 148250, "epoch": 3529} {"train_loss": -6.797830581665039, "global_step": 148251, "epoch": 3529} {"train_loss": -6.815923690795898, "global_step": 148252, "epoch": 3529} {"train_loss": -6.807441234588623, "global_step": 148253, "epoch": 3529} {"train_loss": -6.7876763343811035, "global_step": 148254, "epoch": 3529} {"train_loss": -6.780577659606934, "global_step": 148255, "epoch": 3529} {"train_loss": -6.744821548461914, "global_step": 148256, "epoch": 3529} {"train_loss": -6.694938659667969, "global_step": 148257, "epoch": 3529} {"train_loss": -6.743617057800293, "global_step": 148258, "epoch": 3529} {"train_loss": -6.7044942151932485, "global_step": 148259, "epoch": 3529, "val_loss": 68322.421875} {"train_loss": -6.79086971282959, "global_step": 148260, "epoch": 3530} {"train_loss": -6.766632080078125, "global_step": 148261, "epoch": 3530} {"train_loss": -6.832793235778809, "global_step": 148262, "epoch": 3530} {"train_loss": -6.65870475769043, "global_step": 148263, "epoch": 3530} {"train_loss": -6.895326614379883, "global_step": 148264, "epoch": 3530} {"train_loss": -6.93722677230835, "global_step": 148265, "epoch": 3530} {"train_loss": -6.745589256286621, "global_step": 148266, "epoch": 3530} {"train_loss": -6.790067672729492, "global_step": 148267, "epoch": 3530} {"train_loss": -6.796688079833984, "global_step": 148268, "epoch": 3530} {"train_loss": -6.798548698425293, "global_step": 148269, "epoch": 3530} {"train_loss": -6.841555595397949, "global_step": 148270, "epoch": 3530} {"train_loss": -6.792837142944336, "global_step": 148271, "epoch": 3530} {"train_loss": -6.821429252624512, "global_step": 148272, "epoch": 3530} {"train_loss": -6.836615562438965, "global_step": 148273, "epoch": 3530} {"train_loss": -6.933252334594727, "global_step": 148274, "epoch": 3530} {"train_loss": -6.748913764953613, "global_step": 148275, "epoch": 3530} {"train_loss": -6.848289489746094, "global_step": 148276, "epoch": 3530} {"train_loss": -6.747468948364258, "global_step": 148277, "epoch": 3530} {"train_loss": -6.8234663009643555, "global_step": 148278, "epoch": 3530} {"train_loss": -6.710188865661621, "global_step": 148279, "epoch": 3530} {"train_loss": -6.8369059562683105, "global_step": 148280, "epoch": 3530} {"train_loss": -6.692049980163574, "global_step": 148281, "epoch": 3530} {"train_loss": -6.8567070960998535, "global_step": 148282, "epoch": 3530} {"train_loss": -6.827219009399414, "global_step": 148283, "epoch": 3530} {"train_loss": -6.781811714172363, "global_step": 148284, "epoch": 3530} {"train_loss": -6.876810550689697, "global_step": 148285, "epoch": 3530} {"train_loss": -6.8463640213012695, "global_step": 148286, "epoch": 3530} {"train_loss": -6.813906669616699, "global_step": 148287, "epoch": 3530} {"train_loss": -6.766505718231201, "global_step": 148288, "epoch": 3530} {"train_loss": -6.881036758422852, "global_step": 148289, "epoch": 3530} {"train_loss": -6.950037956237793, "global_step": 148290, "epoch": 3530} {"train_loss": -6.796916961669922, "global_step": 148291, "epoch": 3530} {"train_loss": -6.8852410316467285, "global_step": 148292, "epoch": 3530} {"train_loss": -6.933886528015137, "global_step": 148293, "epoch": 3530} {"train_loss": -6.941010475158691, "global_step": 148294, "epoch": 3530} {"train_loss": -6.925997734069824, "global_step": 148295, "epoch": 3530} {"train_loss": -6.977001190185547, "global_step": 148296, "epoch": 3530} {"train_loss": -6.883265495300293, "global_step": 148297, "epoch": 3530} {"train_loss": -6.771847724914551, "global_step": 148298, "epoch": 3530} {"train_loss": -6.7944440841674805, "global_step": 148299, "epoch": 3530} {"train_loss": -6.909282684326172, "global_step": 148300, "epoch": 3530} {"train_loss": -6.831234761646816, "global_step": 148301, "epoch": 3530, "val_loss": 68464.859375} {"train_loss": -6.8016252517700195, "global_step": 148302, "epoch": 3531} {"train_loss": -6.87764835357666, "global_step": 148303, "epoch": 3531} {"train_loss": -6.813570976257324, "global_step": 148304, "epoch": 3531} {"train_loss": -6.868072509765625, "global_step": 148305, "epoch": 3531} {"train_loss": -6.80292272567749, "global_step": 148306, "epoch": 3531} {"train_loss": -6.791807651519775, "global_step": 148307, "epoch": 3531} {"train_loss": -6.891051292419434, "global_step": 148308, "epoch": 3531} {"train_loss": -6.79086971282959, "global_step": 148309, "epoch": 3531} {"train_loss": -6.927516937255859, "global_step": 148310, "epoch": 3531} {"train_loss": -6.718712329864502, "global_step": 148311, "epoch": 3531} {"train_loss": -6.716766834259033, "global_step": 148312, "epoch": 3531} {"train_loss": -6.793447494506836, "global_step": 148313, "epoch": 3531} {"train_loss": -6.827629566192627, "global_step": 148314, "epoch": 3531} {"train_loss": -6.801052570343018, "global_step": 148315, "epoch": 3531} {"train_loss": -6.811086654663086, "global_step": 148316, "epoch": 3531} {"train_loss": -6.780454635620117, "global_step": 148317, "epoch": 3531} {"train_loss": -6.822339057922363, "global_step": 148318, "epoch": 3531} {"train_loss": -6.860833644866943, "global_step": 148319, "epoch": 3531} {"train_loss": -6.756848335266113, "global_step": 148320, "epoch": 3531} {"train_loss": -6.839700698852539, "global_step": 148321, "epoch": 3531} {"train_loss": -6.884551048278809, "global_step": 148322, "epoch": 3531} {"train_loss": -6.861229419708252, "global_step": 148323, "epoch": 3531} {"train_loss": -6.881583213806152, "global_step": 148324, "epoch": 3531} {"train_loss": -6.775612831115723, "global_step": 148325, "epoch": 3531} {"train_loss": -6.850189685821533, "global_step": 148326, "epoch": 3531} {"train_loss": -6.774470329284668, "global_step": 148327, "epoch": 3531} {"train_loss": -6.796635150909424, "global_step": 148328, "epoch": 3531} {"train_loss": -6.824951171875, "global_step": 148329, "epoch": 3531} {"train_loss": -6.840018272399902, "global_step": 148330, "epoch": 3531} {"train_loss": -6.736379623413086, "global_step": 148331, "epoch": 3531} {"train_loss": -6.918921947479248, "global_step": 148332, "epoch": 3531} {"train_loss": -6.726038932800293, "global_step": 148333, "epoch": 3531} {"train_loss": -6.868844509124756, "global_step": 148334, "epoch": 3531} {"train_loss": -6.876810550689697, "global_step": 148335, "epoch": 3531} {"train_loss": -6.815564155578613, "global_step": 148336, "epoch": 3531} {"train_loss": -6.832375526428223, "global_step": 148337, "epoch": 3531} {"train_loss": -6.88852596282959, "global_step": 148338, "epoch": 3531} {"train_loss": -6.895155906677246, "global_step": 148339, "epoch": 3531} {"train_loss": -6.800346851348877, "global_step": 148340, "epoch": 3531} {"train_loss": -6.84187126159668, "global_step": 148341, "epoch": 3531} {"train_loss": -6.868704795837402, "global_step": 148342, "epoch": 3531} {"train_loss": -6.826654241198585, "global_step": 148343, "epoch": 3531, "val_loss": 68382.390625} {"train_loss": -6.953299522399902, "global_step": 148344, "epoch": 3532} {"train_loss": -6.796156883239746, "global_step": 148345, "epoch": 3532} {"train_loss": -6.807498931884766, "global_step": 148346, "epoch": 3532} {"train_loss": -6.883853435516357, "global_step": 148347, "epoch": 3532} {"train_loss": -6.846451759338379, "global_step": 148348, "epoch": 3532} {"train_loss": -6.709262847900391, "global_step": 148349, "epoch": 3532} {"train_loss": -6.863541603088379, "global_step": 148350, "epoch": 3532} {"train_loss": -6.838688373565674, "global_step": 148351, "epoch": 3532} {"train_loss": -6.792153358459473, "global_step": 148352, "epoch": 3532} {"train_loss": -6.930891513824463, "global_step": 148353, "epoch": 3532} {"train_loss": -6.823202133178711, "global_step": 148354, "epoch": 3532} {"train_loss": -6.868903636932373, "global_step": 148355, "epoch": 3532} {"train_loss": -6.800222873687744, "global_step": 148356, "epoch": 3532} {"train_loss": -6.784521579742432, "global_step": 148357, "epoch": 3532} {"train_loss": -6.835746765136719, "global_step": 148358, "epoch": 3532} {"train_loss": -6.865602493286133, "global_step": 148359, "epoch": 3532} {"train_loss": -6.8193745613098145, "global_step": 148360, "epoch": 3532} {"train_loss": -6.84377384185791, "global_step": 148361, "epoch": 3532} {"train_loss": -6.749178886413574, "global_step": 148362, "epoch": 3532} {"train_loss": -6.848511695861816, "global_step": 148363, "epoch": 3532} {"train_loss": -6.914850234985352, "global_step": 148364, "epoch": 3532} {"train_loss": -6.856185436248779, "global_step": 148365, "epoch": 3532} {"train_loss": -6.844425678253174, "global_step": 148366, "epoch": 3532} {"train_loss": -6.836630821228027, "global_step": 148367, "epoch": 3532} {"train_loss": -6.819628715515137, "global_step": 148368, "epoch": 3532} {"train_loss": -6.853933334350586, "global_step": 148369, "epoch": 3532} {"train_loss": -6.762581825256348, "global_step": 148370, "epoch": 3532} {"train_loss": -6.733864784240723, "global_step": 148371, "epoch": 3532} {"train_loss": -6.854931831359863, "global_step": 148372, "epoch": 3532} {"train_loss": -6.582456111907959, "global_step": 148373, "epoch": 3532} {"train_loss": -6.796567440032959, "global_step": 148374, "epoch": 3532} {"train_loss": -6.7562971115112305, "global_step": 148375, "epoch": 3532} {"train_loss": -6.745905876159668, "global_step": 148376, "epoch": 3532} {"train_loss": -6.731561183929443, "global_step": 148377, "epoch": 3532} {"train_loss": -6.73978328704834, "global_step": 148378, "epoch": 3532} {"train_loss": -6.7412004470825195, "global_step": 148379, "epoch": 3532} {"train_loss": -6.803646564483643, "global_step": 148380, "epoch": 3532} {"train_loss": -6.856886863708496, "global_step": 148381, "epoch": 3532} {"train_loss": -6.794233798980713, "global_step": 148382, "epoch": 3532} {"train_loss": -6.849210739135742, "global_step": 148383, "epoch": 3532} {"train_loss": -6.798823356628418, "global_step": 148384, "epoch": 3532} {"train_loss": -6.8145379566010975, "global_step": 148385, "epoch": 3532, "val_loss": 68308.921875} {"train_loss": -6.945406913757324, "global_step": 148386, "epoch": 3533} {"train_loss": -6.872603416442871, "global_step": 148387, "epoch": 3533} {"train_loss": -6.805514812469482, "global_step": 148388, "epoch": 3533} {"train_loss": -6.893775939941406, "global_step": 148389, "epoch": 3533} {"train_loss": -6.834349155426025, "global_step": 148390, "epoch": 3533} {"train_loss": -6.803768157958984, "global_step": 148391, "epoch": 3533} {"train_loss": -6.878565788269043, "global_step": 148392, "epoch": 3533} {"train_loss": -6.840505599975586, "global_step": 148393, "epoch": 3533} {"train_loss": -6.804335594177246, "global_step": 148394, "epoch": 3533} {"train_loss": -6.846892833709717, "global_step": 148395, "epoch": 3533} {"train_loss": -6.886087417602539, "global_step": 148396, "epoch": 3533} {"train_loss": -6.88759708404541, "global_step": 148397, "epoch": 3533} {"train_loss": -6.846547603607178, "global_step": 148398, "epoch": 3533} {"train_loss": -6.854779243469238, "global_step": 148399, "epoch": 3533} {"train_loss": -6.887997627258301, "global_step": 148400, "epoch": 3533} {"train_loss": -6.833155155181885, "global_step": 148401, "epoch": 3533} {"train_loss": -6.695971488952637, "global_step": 148402, "epoch": 3533} {"train_loss": -6.913406848907471, "global_step": 148403, "epoch": 3533} {"train_loss": -6.896881580352783, "global_step": 148404, "epoch": 3533} {"train_loss": -6.836867332458496, "global_step": 148405, "epoch": 3533} {"train_loss": -6.701074600219727, "global_step": 148406, "epoch": 3533} {"train_loss": -6.711887359619141, "global_step": 148407, "epoch": 3533} {"train_loss": -6.806902885437012, "global_step": 148408, "epoch": 3533} {"train_loss": -6.7138566970825195, "global_step": 148409, "epoch": 3533} {"train_loss": -6.729972839355469, "global_step": 148410, "epoch": 3533} {"train_loss": -6.794729232788086, "global_step": 148411, "epoch": 3533} {"train_loss": -6.6242475509643555, "global_step": 148412, "epoch": 3533} {"train_loss": -6.686044216156006, "global_step": 148413, "epoch": 3533} {"train_loss": -6.743106365203857, "global_step": 148414, "epoch": 3533} {"train_loss": -6.66640043258667, "global_step": 148415, "epoch": 3533} {"train_loss": -6.752039909362793, "global_step": 148416, "epoch": 3533} {"train_loss": -6.536085605621338, "global_step": 148417, "epoch": 3533} {"train_loss": -6.758636474609375, "global_step": 148418, "epoch": 3533} {"train_loss": -6.603358268737793, "global_step": 148419, "epoch": 3533} {"train_loss": -6.752018451690674, "global_step": 148420, "epoch": 3533} {"train_loss": -6.600481986999512, "global_step": 148421, "epoch": 3533} {"train_loss": -6.755244255065918, "global_step": 148422, "epoch": 3533} {"train_loss": -6.66545295715332, "global_step": 148423, "epoch": 3533} {"train_loss": -6.742579936981201, "global_step": 148424, "epoch": 3533} {"train_loss": -6.862378120422363, "global_step": 148425, "epoch": 3533} {"train_loss": -6.6744561195373535, "global_step": 148426, "epoch": 3533} {"train_loss": -6.780001129422869, "global_step": 148427, "epoch": 3533, "val_loss": 68608.171875} {"train_loss": -6.679499626159668, "global_step": 148428, "epoch": 3534} {"train_loss": -6.848217487335205, "global_step": 148429, "epoch": 3534} {"train_loss": -6.77337646484375, "global_step": 148430, "epoch": 3534} {"train_loss": -6.794289588928223, "global_step": 148431, "epoch": 3534} {"train_loss": -6.781952857971191, "global_step": 148432, "epoch": 3534} {"train_loss": -6.752497673034668, "global_step": 148433, "epoch": 3534} {"train_loss": -6.779836654663086, "global_step": 148434, "epoch": 3534} {"train_loss": -6.663836479187012, "global_step": 148435, "epoch": 3534} {"train_loss": -6.834138870239258, "global_step": 148436, "epoch": 3534} {"train_loss": -6.788427829742432, "global_step": 148437, "epoch": 3534} {"train_loss": -6.680776596069336, "global_step": 148438, "epoch": 3534} {"train_loss": -6.859700679779053, "global_step": 148439, "epoch": 3534} {"train_loss": -6.754723072052002, "global_step": 148440, "epoch": 3534} {"train_loss": -6.9390058517456055, "global_step": 148441, "epoch": 3534} {"train_loss": -6.746313095092773, "global_step": 148442, "epoch": 3534} {"train_loss": -6.711682319641113, "global_step": 148443, "epoch": 3534} {"train_loss": -6.868135452270508, "global_step": 148444, "epoch": 3534} {"train_loss": -6.739584922790527, "global_step": 148445, "epoch": 3534} {"train_loss": -6.931061267852783, "global_step": 148446, "epoch": 3534} {"train_loss": -6.778692245483398, "global_step": 148447, "epoch": 3534} {"train_loss": -6.792491912841797, "global_step": 148448, "epoch": 3534} {"train_loss": -6.77407169342041, "global_step": 148449, "epoch": 3534} {"train_loss": -6.9224700927734375, "global_step": 148450, "epoch": 3534} {"train_loss": -6.831071853637695, "global_step": 148451, "epoch": 3534} {"train_loss": -6.8328351974487305, "global_step": 148452, "epoch": 3534} {"train_loss": -6.768029689788818, "global_step": 148453, "epoch": 3534} {"train_loss": -6.785139083862305, "global_step": 148454, "epoch": 3534} {"train_loss": -6.881091117858887, "global_step": 148455, "epoch": 3534} {"train_loss": -6.696433067321777, "global_step": 148456, "epoch": 3534} {"train_loss": -6.890681743621826, "global_step": 148457, "epoch": 3534} {"train_loss": -6.790085315704346, "global_step": 148458, "epoch": 3534} {"train_loss": -6.959896087646484, "global_step": 148459, "epoch": 3534} {"train_loss": -6.854674339294434, "global_step": 148460, "epoch": 3534} {"train_loss": -6.841203689575195, "global_step": 148461, "epoch": 3534} {"train_loss": -6.796951770782471, "global_step": 148462, "epoch": 3534} {"train_loss": -6.728201866149902, "global_step": 148463, "epoch": 3534} {"train_loss": -6.756615161895752, "global_step": 148464, "epoch": 3534} {"train_loss": -6.681421279907227, "global_step": 148465, "epoch": 3534} {"train_loss": -6.670970916748047, "global_step": 148466, "epoch": 3534} {"train_loss": -6.769946575164795, "global_step": 148467, "epoch": 3534} {"train_loss": -6.749489784240723, "global_step": 148468, "epoch": 3534} {"train_loss": -6.791147379648118, "global_step": 148469, "epoch": 3534, "val_loss": 68455.5859375} {"train_loss": -6.823088645935059, "global_step": 148470, "epoch": 3535} {"train_loss": -6.710045337677002, "global_step": 148471, "epoch": 3535} {"train_loss": -6.823008060455322, "global_step": 148472, "epoch": 3535} {"train_loss": -6.986379623413086, "global_step": 148473, "epoch": 3535} {"train_loss": -6.784460544586182, "global_step": 148474, "epoch": 3535} {"train_loss": -6.773926258087158, "global_step": 148475, "epoch": 3535} {"train_loss": -6.654385089874268, "global_step": 148476, "epoch": 3535} {"train_loss": -6.69180965423584, "global_step": 148477, "epoch": 3535} {"train_loss": -6.846697807312012, "global_step": 148478, "epoch": 3535} {"train_loss": -6.762009143829346, "global_step": 148479, "epoch": 3535} {"train_loss": -6.741673469543457, "global_step": 148480, "epoch": 3535} {"train_loss": -6.783872604370117, "global_step": 148481, "epoch": 3535} {"train_loss": -6.598629951477051, "global_step": 148482, "epoch": 3535} {"train_loss": -6.6928606033325195, "global_step": 148483, "epoch": 3535} {"train_loss": -6.600969314575195, "global_step": 148484, "epoch": 3535} {"train_loss": -6.830178737640381, "global_step": 148485, "epoch": 3535} {"train_loss": -6.774456977844238, "global_step": 148486, "epoch": 3535} {"train_loss": -6.876812934875488, "global_step": 148487, "epoch": 3535} {"train_loss": -6.786832809448242, "global_step": 148488, "epoch": 3535} {"train_loss": -6.7111358642578125, "global_step": 148489, "epoch": 3535} {"train_loss": -6.631162643432617, "global_step": 148490, "epoch": 3535} {"train_loss": -6.825132846832275, "global_step": 148491, "epoch": 3535} {"train_loss": -6.747097492218018, "global_step": 148492, "epoch": 3535} {"train_loss": -6.786983013153076, "global_step": 148493, "epoch": 3535} {"train_loss": -6.741925239562988, "global_step": 148494, "epoch": 3535} {"train_loss": -6.674504280090332, "global_step": 148495, "epoch": 3535} {"train_loss": -6.715860366821289, "global_step": 148496, "epoch": 3535} {"train_loss": -6.6780290603637695, "global_step": 148497, "epoch": 3535} {"train_loss": -6.732422828674316, "global_step": 148498, "epoch": 3535} {"train_loss": -6.76502799987793, "global_step": 148499, "epoch": 3535} {"train_loss": -6.6900482177734375, "global_step": 148500, "epoch": 3535} {"train_loss": -6.731051445007324, "global_step": 148501, "epoch": 3535} {"train_loss": -6.677647590637207, "global_step": 148502, "epoch": 3535} {"train_loss": -6.746688365936279, "global_step": 148503, "epoch": 3535} {"train_loss": -6.717022895812988, "global_step": 148504, "epoch": 3535} {"train_loss": -6.757943630218506, "global_step": 148505, "epoch": 3535} {"train_loss": -6.845729827880859, "global_step": 148506, "epoch": 3535} {"train_loss": -6.660079002380371, "global_step": 148507, "epoch": 3535} {"train_loss": -6.814788341522217, "global_step": 148508, "epoch": 3535} {"train_loss": -6.806313514709473, "global_step": 148509, "epoch": 3535} {"train_loss": -6.685016632080078, "global_step": 148510, "epoch": 3535} {"train_loss": -6.748408987408593, "global_step": 148511, "epoch": 3535, "val_loss": 68379.859375} {"train_loss": -6.777889251708984, "global_step": 148512, "epoch": 3536} {"train_loss": -6.739551067352295, "global_step": 148513, "epoch": 3536} {"train_loss": -6.737229347229004, "global_step": 148514, "epoch": 3536} {"train_loss": -6.741565704345703, "global_step": 148515, "epoch": 3536} {"train_loss": -6.734617233276367, "global_step": 148516, "epoch": 3536} {"train_loss": -6.827528953552246, "global_step": 148517, "epoch": 3536} {"train_loss": -6.773283958435059, "global_step": 148518, "epoch": 3536} {"train_loss": -6.6894211769104, "global_step": 148519, "epoch": 3536} {"train_loss": -6.930437088012695, "global_step": 148520, "epoch": 3536} {"train_loss": -6.794655799865723, "global_step": 148521, "epoch": 3536} {"train_loss": -6.665708541870117, "global_step": 148522, "epoch": 3536} {"train_loss": -6.766922950744629, "global_step": 148523, "epoch": 3536} {"train_loss": -6.780804634094238, "global_step": 148524, "epoch": 3536} {"train_loss": -6.829410076141357, "global_step": 148525, "epoch": 3536} {"train_loss": -6.894179344177246, "global_step": 148526, "epoch": 3536} {"train_loss": -6.768923759460449, "global_step": 148527, "epoch": 3536} {"train_loss": -6.676139831542969, "global_step": 148528, "epoch": 3536} {"train_loss": -6.7713189125061035, "global_step": 148529, "epoch": 3536} {"train_loss": -6.791469573974609, "global_step": 148530, "epoch": 3536} {"train_loss": -6.709963798522949, "global_step": 148531, "epoch": 3536} {"train_loss": -6.776060581207275, "global_step": 148532, "epoch": 3536} {"train_loss": -6.801854133605957, "global_step": 148533, "epoch": 3536} {"train_loss": -6.759214401245117, "global_step": 148534, "epoch": 3536} {"train_loss": -6.867194175720215, "global_step": 148535, "epoch": 3536} {"train_loss": -6.699851036071777, "global_step": 148536, "epoch": 3536} {"train_loss": -6.761140823364258, "global_step": 148537, "epoch": 3536} {"train_loss": -6.833709239959717, "global_step": 148538, "epoch": 3536} {"train_loss": -6.750091075897217, "global_step": 148539, "epoch": 3536} {"train_loss": -6.907009124755859, "global_step": 148540, "epoch": 3536} {"train_loss": -6.810044765472412, "global_step": 148541, "epoch": 3536} {"train_loss": -6.704432487487793, "global_step": 148542, "epoch": 3536} {"train_loss": -6.8371686935424805, "global_step": 148543, "epoch": 3536} {"train_loss": -6.804388999938965, "global_step": 148544, "epoch": 3536} {"train_loss": -6.7931718826293945, "global_step": 148545, "epoch": 3536} {"train_loss": -6.767080307006836, "global_step": 148546, "epoch": 3536} {"train_loss": -6.853124618530273, "global_step": 148547, "epoch": 3536} {"train_loss": -6.7458038330078125, "global_step": 148548, "epoch": 3536} {"train_loss": -6.815117835998535, "global_step": 148549, "epoch": 3536} {"train_loss": -6.782113552093506, "global_step": 148550, "epoch": 3536} {"train_loss": -6.756936073303223, "global_step": 148551, "epoch": 3536} {"train_loss": -6.954636096954346, "global_step": 148552, "epoch": 3536} {"train_loss": -6.784398771467663, "global_step": 148553, "epoch": 3536, "val_loss": 68405.7109375} {"train_loss": -6.788722515106201, "global_step": 148554, "epoch": 3537} {"train_loss": -6.782829284667969, "global_step": 148555, "epoch": 3537} {"train_loss": -6.808509349822998, "global_step": 148556, "epoch": 3537} {"train_loss": -6.755311012268066, "global_step": 148557, "epoch": 3537} {"train_loss": -6.791341781616211, "global_step": 148558, "epoch": 3537} {"train_loss": -6.746360778808594, "global_step": 148559, "epoch": 3537} {"train_loss": -6.854918479919434, "global_step": 148560, "epoch": 3537} {"train_loss": -6.715765953063965, "global_step": 148561, "epoch": 3537} {"train_loss": -6.798201560974121, "global_step": 148562, "epoch": 3537} {"train_loss": -6.826221466064453, "global_step": 148563, "epoch": 3537} {"train_loss": -6.732290267944336, "global_step": 148564, "epoch": 3537} {"train_loss": -6.717485427856445, "global_step": 148565, "epoch": 3537} {"train_loss": -6.694604873657227, "global_step": 148566, "epoch": 3537} {"train_loss": -6.737043380737305, "global_step": 148567, "epoch": 3537} {"train_loss": -6.729930400848389, "global_step": 148568, "epoch": 3537} {"train_loss": -6.578925132751465, "global_step": 148569, "epoch": 3537} {"train_loss": -6.791562080383301, "global_step": 148570, "epoch": 3537} {"train_loss": -6.665018558502197, "global_step": 148571, "epoch": 3537} {"train_loss": -6.75257682800293, "global_step": 148572, "epoch": 3537} {"train_loss": -6.816371440887451, "global_step": 148573, "epoch": 3537} {"train_loss": -6.6658616065979, "global_step": 148574, "epoch": 3537} {"train_loss": -6.7357025146484375, "global_step": 148575, "epoch": 3537} {"train_loss": -6.735741138458252, "global_step": 148576, "epoch": 3537} {"train_loss": -6.711232662200928, "global_step": 148577, "epoch": 3537} {"train_loss": -6.711005210876465, "global_step": 148578, "epoch": 3537} {"train_loss": -6.809913635253906, "global_step": 148579, "epoch": 3537} {"train_loss": -6.823847770690918, "global_step": 148580, "epoch": 3537} {"train_loss": -6.862113952636719, "global_step": 148581, "epoch": 3537} {"train_loss": -6.766392707824707, "global_step": 148582, "epoch": 3537} {"train_loss": -6.820854187011719, "global_step": 148583, "epoch": 3537} {"train_loss": -6.828575134277344, "global_step": 148584, "epoch": 3537} {"train_loss": -6.875858783721924, "global_step": 148585, "epoch": 3537} {"train_loss": -6.7872514724731445, "global_step": 148586, "epoch": 3537} {"train_loss": -6.797886371612549, "global_step": 148587, "epoch": 3537} {"train_loss": -6.823599815368652, "global_step": 148588, "epoch": 3537} {"train_loss": -6.730318069458008, "global_step": 148589, "epoch": 3537} {"train_loss": -6.876647472381592, "global_step": 148590, "epoch": 3537} {"train_loss": -6.950308322906494, "global_step": 148591, "epoch": 3537} {"train_loss": -6.892853736877441, "global_step": 148592, "epoch": 3537} {"train_loss": -6.819008827209473, "global_step": 148593, "epoch": 3537} {"train_loss": -6.831514358520508, "global_step": 148594, "epoch": 3537} {"train_loss": -6.781700565701439, "global_step": 148595, "epoch": 3537, "val_loss": 68536.1953125} {"train_loss": -6.836503505706787, "global_step": 148596, "epoch": 3538} {"train_loss": -6.872403144836426, "global_step": 148597, "epoch": 3538} {"train_loss": -6.873719215393066, "global_step": 148598, "epoch": 3538} {"train_loss": -6.856330871582031, "global_step": 148599, "epoch": 3538} {"train_loss": -6.892479419708252, "global_step": 148600, "epoch": 3538} {"train_loss": -6.887470722198486, "global_step": 148601, "epoch": 3538} {"train_loss": -6.941167831420898, "global_step": 148602, "epoch": 3538} {"train_loss": -6.861742973327637, "global_step": 148603, "epoch": 3538} {"train_loss": -6.847410678863525, "global_step": 148604, "epoch": 3538} {"train_loss": -6.869266033172607, "global_step": 148605, "epoch": 3538} {"train_loss": -6.920214653015137, "global_step": 148606, "epoch": 3538} {"train_loss": -6.842404365539551, "global_step": 148607, "epoch": 3538} {"train_loss": -6.815314292907715, "global_step": 148608, "epoch": 3538} {"train_loss": -6.826694011688232, "global_step": 148609, "epoch": 3538} {"train_loss": -6.757371425628662, "global_step": 148610, "epoch": 3538} {"train_loss": -6.767485618591309, "global_step": 148611, "epoch": 3538} {"train_loss": -6.895390510559082, "global_step": 148612, "epoch": 3538} {"train_loss": -6.944310665130615, "global_step": 148613, "epoch": 3538} {"train_loss": -6.902194499969482, "global_step": 148614, "epoch": 3538} {"train_loss": -7.017484664916992, "global_step": 148615, "epoch": 3538} {"train_loss": -6.776957035064697, "global_step": 148616, "epoch": 3538} {"train_loss": -6.769470691680908, "global_step": 148617, "epoch": 3538} {"train_loss": -6.741698741912842, "global_step": 148618, "epoch": 3538} {"train_loss": -6.729310035705566, "global_step": 148619, "epoch": 3538} {"train_loss": -6.771993637084961, "global_step": 148620, "epoch": 3538} {"train_loss": -6.817181587219238, "global_step": 148621, "epoch": 3538} {"train_loss": -6.804901123046875, "global_step": 148622, "epoch": 3538} {"train_loss": -6.799742698669434, "global_step": 148623, "epoch": 3538} {"train_loss": -6.8202009201049805, "global_step": 148624, "epoch": 3538} {"train_loss": -6.876028060913086, "global_step": 148625, "epoch": 3538} {"train_loss": -6.788568496704102, "global_step": 148626, "epoch": 3538} {"train_loss": -6.800314903259277, "global_step": 148627, "epoch": 3538} {"train_loss": -6.854205131530762, "global_step": 148628, "epoch": 3538} {"train_loss": -6.728171348571777, "global_step": 148629, "epoch": 3538} {"train_loss": -6.754968643188477, "global_step": 148630, "epoch": 3538} {"train_loss": -6.91099739074707, "global_step": 148631, "epoch": 3538} {"train_loss": -6.818829536437988, "global_step": 148632, "epoch": 3538} {"train_loss": -6.82203483581543, "global_step": 148633, "epoch": 3538} {"train_loss": -6.813342094421387, "global_step": 148634, "epoch": 3538} {"train_loss": -6.736087799072266, "global_step": 148635, "epoch": 3538} {"train_loss": -6.832766532897949, "global_step": 148636, "epoch": 3538} {"train_loss": -6.836193697793143, "global_step": 148637, "epoch": 3538, "val_loss": 68430.1328125} {"train_loss": -6.7451581954956055, "global_step": 148638, "epoch": 3539} {"train_loss": -6.944431781768799, "global_step": 148639, "epoch": 3539} {"train_loss": -6.954444885253906, "global_step": 148640, "epoch": 3539} {"train_loss": -6.850161552429199, "global_step": 148641, "epoch": 3539} {"train_loss": -6.815196990966797, "global_step": 148642, "epoch": 3539} {"train_loss": -6.761620998382568, "global_step": 148643, "epoch": 3539} {"train_loss": -6.841580390930176, "global_step": 148644, "epoch": 3539} {"train_loss": -6.901874542236328, "global_step": 148645, "epoch": 3539} {"train_loss": -6.9300007820129395, "global_step": 148646, "epoch": 3539} {"train_loss": -6.9025983810424805, "global_step": 148647, "epoch": 3539} {"train_loss": -6.825765609741211, "global_step": 148648, "epoch": 3539} {"train_loss": -6.873133659362793, "global_step": 148649, "epoch": 3539} {"train_loss": -6.882467269897461, "global_step": 148650, "epoch": 3539} {"train_loss": -6.8637375831604, "global_step": 148651, "epoch": 3539} {"train_loss": -6.989166259765625, "global_step": 148652, "epoch": 3539} {"train_loss": -6.869952201843262, "global_step": 148653, "epoch": 3539} {"train_loss": -6.792681694030762, "global_step": 148654, "epoch": 3539} {"train_loss": -6.782639503479004, "global_step": 148655, "epoch": 3539} {"train_loss": -6.804416179656982, "global_step": 148656, "epoch": 3539} {"train_loss": -6.761247634887695, "global_step": 148657, "epoch": 3539} {"train_loss": -6.90432596206665, "global_step": 148658, "epoch": 3539} {"train_loss": -6.852371692657471, "global_step": 148659, "epoch": 3539} {"train_loss": -6.872447967529297, "global_step": 148660, "epoch": 3539} {"train_loss": -6.898214340209961, "global_step": 148661, "epoch": 3539} {"train_loss": -6.865935325622559, "global_step": 148662, "epoch": 3539} {"train_loss": -6.841433525085449, "global_step": 148663, "epoch": 3539} {"train_loss": -6.870626926422119, "global_step": 148664, "epoch": 3539} {"train_loss": -6.82501220703125, "global_step": 148665, "epoch": 3539} {"train_loss": -6.878244876861572, "global_step": 148666, "epoch": 3539} {"train_loss": -6.885438919067383, "global_step": 148667, "epoch": 3539} {"train_loss": -6.803616523742676, "global_step": 148668, "epoch": 3539} {"train_loss": -6.759445667266846, "global_step": 148669, "epoch": 3539} {"train_loss": -6.874358654022217, "global_step": 148670, "epoch": 3539} {"train_loss": -6.740389347076416, "global_step": 148671, "epoch": 3539} {"train_loss": -6.793758392333984, "global_step": 148672, "epoch": 3539} {"train_loss": -6.793191909790039, "global_step": 148673, "epoch": 3539} {"train_loss": -6.872539520263672, "global_step": 148674, "epoch": 3539} {"train_loss": -6.922584533691406, "global_step": 148675, "epoch": 3539} {"train_loss": -6.838905334472656, "global_step": 148676, "epoch": 3539} {"train_loss": -6.842593193054199, "global_step": 148677, "epoch": 3539} {"train_loss": -6.690621376037598, "global_step": 148678, "epoch": 3539} {"train_loss": -6.844233967009044, "global_step": 148679, "epoch": 3539, "val_loss": 68273.40625} {"train_loss": -6.769869804382324, "global_step": 148680, "epoch": 3540} {"train_loss": -6.750097274780273, "global_step": 148681, "epoch": 3540} {"train_loss": -6.855777263641357, "global_step": 148682, "epoch": 3540} {"train_loss": -6.8637895584106445, "global_step": 148683, "epoch": 3540} {"train_loss": -6.7657790184021, "global_step": 148684, "epoch": 3540} {"train_loss": -6.817523956298828, "global_step": 148685, "epoch": 3540} {"train_loss": -6.689816474914551, "global_step": 148686, "epoch": 3540} {"train_loss": -6.711007118225098, "global_step": 148687, "epoch": 3540} {"train_loss": -6.8961567878723145, "global_step": 148688, "epoch": 3540} {"train_loss": -6.59840726852417, "global_step": 148689, "epoch": 3540} {"train_loss": -6.93162202835083, "global_step": 148690, "epoch": 3540} {"train_loss": -6.670670509338379, "global_step": 148691, "epoch": 3540} {"train_loss": -6.566725730895996, "global_step": 148692, "epoch": 3540} {"train_loss": -6.744028091430664, "global_step": 148693, "epoch": 3540} {"train_loss": -6.713959693908691, "global_step": 148694, "epoch": 3540} {"train_loss": -6.7273969650268555, "global_step": 148695, "epoch": 3540} {"train_loss": -6.79290771484375, "global_step": 148696, "epoch": 3540} {"train_loss": -6.818351745605469, "global_step": 148697, "epoch": 3540} {"train_loss": -6.817925453186035, "global_step": 148698, "epoch": 3540} {"train_loss": -6.754472255706787, "global_step": 148699, "epoch": 3540} {"train_loss": -6.812578201293945, "global_step": 148700, "epoch": 3540} {"train_loss": -6.7525529861450195, "global_step": 148701, "epoch": 3540} {"train_loss": -6.830958366394043, "global_step": 148702, "epoch": 3540} {"train_loss": -6.729250907897949, "global_step": 148703, "epoch": 3540} {"train_loss": -6.79112434387207, "global_step": 148704, "epoch": 3540} {"train_loss": -6.769598007202148, "global_step": 148705, "epoch": 3540} {"train_loss": -6.679298400878906, "global_step": 148706, "epoch": 3540} {"train_loss": -6.8529253005981445, "global_step": 148707, "epoch": 3540} {"train_loss": -6.894656181335449, "global_step": 148708, "epoch": 3540} {"train_loss": -6.734449863433838, "global_step": 148709, "epoch": 3540} {"train_loss": -6.847530364990234, "global_step": 148710, "epoch": 3540} {"train_loss": -6.8605217933654785, "global_step": 148711, "epoch": 3540} {"train_loss": -6.749789714813232, "global_step": 148712, "epoch": 3540} {"train_loss": -6.8135528564453125, "global_step": 148713, "epoch": 3540} {"train_loss": -6.790625095367432, "global_step": 148714, "epoch": 3540} {"train_loss": -6.7697672843933105, "global_step": 148715, "epoch": 3540} {"train_loss": -6.826389312744141, "global_step": 148716, "epoch": 3540} {"train_loss": -6.859891891479492, "global_step": 148717, "epoch": 3540} {"train_loss": -6.8266520500183105, "global_step": 148718, "epoch": 3540} {"train_loss": -6.770968437194824, "global_step": 148719, "epoch": 3540} {"train_loss": -6.780795574188232, "global_step": 148720, "epoch": 3540} {"train_loss": -6.78313456262861, "global_step": 148721, "epoch": 3540, "val_loss": 68269.4140625} {"train_loss": -6.87015962600708, "global_step": 148722, "epoch": 3541} {"train_loss": -6.6456804275512695, "global_step": 148723, "epoch": 3541} {"train_loss": -6.635588645935059, "global_step": 148724, "epoch": 3541} {"train_loss": -6.83448600769043, "global_step": 148725, "epoch": 3541} {"train_loss": -6.749122142791748, "global_step": 148726, "epoch": 3541} {"train_loss": -6.602329254150391, "global_step": 148727, "epoch": 3541} {"train_loss": -6.784249782562256, "global_step": 148728, "epoch": 3541} {"train_loss": -6.551923751831055, "global_step": 148729, "epoch": 3541} {"train_loss": -6.748776435852051, "global_step": 148730, "epoch": 3541} {"train_loss": -6.752655029296875, "global_step": 148731, "epoch": 3541} {"train_loss": -6.515921115875244, "global_step": 148732, "epoch": 3541} {"train_loss": -6.693488597869873, "global_step": 148733, "epoch": 3541} {"train_loss": -6.781213760375977, "global_step": 148734, "epoch": 3541} {"train_loss": -6.698368072509766, "global_step": 148735, "epoch": 3541} {"train_loss": -6.860459327697754, "global_step": 148736, "epoch": 3541} {"train_loss": -6.7208251953125, "global_step": 148737, "epoch": 3541} {"train_loss": -6.838975429534912, "global_step": 148738, "epoch": 3541} {"train_loss": -6.666719436645508, "global_step": 148739, "epoch": 3541} {"train_loss": -6.80142879486084, "global_step": 148740, "epoch": 3541} {"train_loss": -6.534823417663574, "global_step": 148741, "epoch": 3541} {"train_loss": -6.771876335144043, "global_step": 148742, "epoch": 3541} {"train_loss": -6.772336483001709, "global_step": 148743, "epoch": 3541} {"train_loss": -6.7925519943237305, "global_step": 148744, "epoch": 3541} {"train_loss": -6.800281524658203, "global_step": 148745, "epoch": 3541} {"train_loss": -6.718996047973633, "global_step": 148746, "epoch": 3541} {"train_loss": -6.748637676239014, "global_step": 148747, "epoch": 3541} {"train_loss": -6.651033401489258, "global_step": 148748, "epoch": 3541} {"train_loss": -6.775771141052246, "global_step": 148749, "epoch": 3541} {"train_loss": -6.77258825302124, "global_step": 148750, "epoch": 3541} {"train_loss": -6.751387596130371, "global_step": 148751, "epoch": 3541} {"train_loss": -6.86747932434082, "global_step": 148752, "epoch": 3541} {"train_loss": -6.767393112182617, "global_step": 148753, "epoch": 3541} {"train_loss": -6.854186058044434, "global_step": 148754, "epoch": 3541} {"train_loss": -6.898028373718262, "global_step": 148755, "epoch": 3541} {"train_loss": -6.868617534637451, "global_step": 148756, "epoch": 3541} {"train_loss": -6.685494899749756, "global_step": 148757, "epoch": 3541} {"train_loss": -6.836921691894531, "global_step": 148758, "epoch": 3541} {"train_loss": -6.790700912475586, "global_step": 148759, "epoch": 3541} {"train_loss": -6.866397857666016, "global_step": 148760, "epoch": 3541} {"train_loss": -6.818961143493652, "global_step": 148761, "epoch": 3541} {"train_loss": -6.817136287689209, "global_step": 148762, "epoch": 3541} {"train_loss": -6.751655839738392, "global_step": 148763, "epoch": 3541, "val_loss": 68345.875} {"train_loss": -6.825673580169678, "global_step": 148764, "epoch": 3542} {"train_loss": -6.828834533691406, "global_step": 148765, "epoch": 3542} {"train_loss": -6.7823662757873535, "global_step": 148766, "epoch": 3542} {"train_loss": -6.772103786468506, "global_step": 148767, "epoch": 3542} {"train_loss": -6.881120681762695, "global_step": 148768, "epoch": 3542} {"train_loss": -6.760480880737305, "global_step": 148769, "epoch": 3542} {"train_loss": -6.805304527282715, "global_step": 148770, "epoch": 3542} {"train_loss": -6.761870384216309, "global_step": 148771, "epoch": 3542} {"train_loss": -6.770708084106445, "global_step": 148772, "epoch": 3542} {"train_loss": -6.706906795501709, "global_step": 148773, "epoch": 3542} {"train_loss": -6.6626787185668945, "global_step": 148774, "epoch": 3542} {"train_loss": -6.819104194641113, "global_step": 148775, "epoch": 3542} {"train_loss": -6.762056350708008, "global_step": 148776, "epoch": 3542} {"train_loss": -6.714122295379639, "global_step": 148777, "epoch": 3542} {"train_loss": -6.84611701965332, "global_step": 148778, "epoch": 3542} {"train_loss": -6.655279159545898, "global_step": 148779, "epoch": 3542} {"train_loss": -6.765790939331055, "global_step": 148780, "epoch": 3542} {"train_loss": -6.739946365356445, "global_step": 148781, "epoch": 3542} {"train_loss": -6.827995300292969, "global_step": 148782, "epoch": 3542} {"train_loss": -6.740342140197754, "global_step": 148783, "epoch": 3542} {"train_loss": -6.819096088409424, "global_step": 148784, "epoch": 3542} {"train_loss": -6.730574131011963, "global_step": 148785, "epoch": 3542} {"train_loss": -6.808427810668945, "global_step": 148786, "epoch": 3542} {"train_loss": -6.881414413452148, "global_step": 148787, "epoch": 3542} {"train_loss": -6.818652629852295, "global_step": 148788, "epoch": 3542} {"train_loss": -6.695274353027344, "global_step": 148789, "epoch": 3542} {"train_loss": -6.68201208114624, "global_step": 148790, "epoch": 3542} {"train_loss": -6.924195289611816, "global_step": 148791, "epoch": 3542} {"train_loss": -6.797611236572266, "global_step": 148792, "epoch": 3542} {"train_loss": -6.726489543914795, "global_step": 148793, "epoch": 3542} {"train_loss": -6.87790584564209, "global_step": 148794, "epoch": 3542} {"train_loss": -6.756606101989746, "global_step": 148795, "epoch": 3542} {"train_loss": -6.774094581604004, "global_step": 148796, "epoch": 3542} {"train_loss": -6.787258148193359, "global_step": 148797, "epoch": 3542} {"train_loss": -6.76106071472168, "global_step": 148798, "epoch": 3542} {"train_loss": -6.855798721313477, "global_step": 148799, "epoch": 3542} {"train_loss": -6.868560791015625, "global_step": 148800, "epoch": 3542} {"train_loss": -6.713500022888184, "global_step": 148801, "epoch": 3542} {"train_loss": -6.718725681304932, "global_step": 148802, "epoch": 3542} {"train_loss": -6.850788116455078, "global_step": 148803, "epoch": 3542} {"train_loss": -6.661284446716309, "global_step": 148804, "epoch": 3542} {"train_loss": -6.7809486502692815, "global_step": 148805, "epoch": 3542, "val_loss": 68432.8515625} {"train_loss": -6.689009666442871, "global_step": 148806, "epoch": 3543} {"train_loss": -6.75482702255249, "global_step": 148807, "epoch": 3543} {"train_loss": -6.791309833526611, "global_step": 148808, "epoch": 3543} {"train_loss": -6.718761920928955, "global_step": 148809, "epoch": 3543} {"train_loss": -6.824011325836182, "global_step": 148810, "epoch": 3543} {"train_loss": -6.772989273071289, "global_step": 148811, "epoch": 3543} {"train_loss": -6.898415565490723, "global_step": 148812, "epoch": 3543} {"train_loss": -6.706964492797852, "global_step": 148813, "epoch": 3543} {"train_loss": -6.795910835266113, "global_step": 148814, "epoch": 3543} {"train_loss": -6.702337265014648, "global_step": 148815, "epoch": 3543} {"train_loss": -6.612618923187256, "global_step": 148816, "epoch": 3543} {"train_loss": -6.737104415893555, "global_step": 148817, "epoch": 3543} {"train_loss": -6.769028663635254, "global_step": 148818, "epoch": 3543} {"train_loss": -6.746518611907959, "global_step": 148819, "epoch": 3543} {"train_loss": -6.792049407958984, "global_step": 148820, "epoch": 3543} {"train_loss": -6.739264488220215, "global_step": 148821, "epoch": 3543} {"train_loss": -6.756858825683594, "global_step": 148822, "epoch": 3543} {"train_loss": -6.724093437194824, "global_step": 148823, "epoch": 3543} {"train_loss": -6.776149272918701, "global_step": 148824, "epoch": 3543} {"train_loss": -6.779865264892578, "global_step": 148825, "epoch": 3543} {"train_loss": -6.746905326843262, "global_step": 148826, "epoch": 3543} {"train_loss": -6.839372634887695, "global_step": 148827, "epoch": 3543} {"train_loss": -6.848034858703613, "global_step": 148828, "epoch": 3543} {"train_loss": -6.762399673461914, "global_step": 148829, "epoch": 3543} {"train_loss": -6.661598205566406, "global_step": 148830, "epoch": 3543} {"train_loss": -6.756379127502441, "global_step": 148831, "epoch": 3543} {"train_loss": -6.795557498931885, "global_step": 148832, "epoch": 3543} {"train_loss": -6.842206001281738, "global_step": 148833, "epoch": 3543} {"train_loss": -6.839014530181885, "global_step": 148834, "epoch": 3543} {"train_loss": -6.789121627807617, "global_step": 148835, "epoch": 3543} {"train_loss": -6.8135151863098145, "global_step": 148836, "epoch": 3543} {"train_loss": -6.709085464477539, "global_step": 148837, "epoch": 3543} {"train_loss": -6.760289192199707, "global_step": 148838, "epoch": 3543} {"train_loss": -6.584519386291504, "global_step": 148839, "epoch": 3543} {"train_loss": -6.767214775085449, "global_step": 148840, "epoch": 3543} {"train_loss": -6.689391136169434, "global_step": 148841, "epoch": 3543} {"train_loss": -6.700351715087891, "global_step": 148842, "epoch": 3543} {"train_loss": -6.895943641662598, "global_step": 148843, "epoch": 3543} {"train_loss": -6.7690277099609375, "global_step": 148844, "epoch": 3543} {"train_loss": -6.675985813140869, "global_step": 148845, "epoch": 3543} {"train_loss": -6.757053375244141, "global_step": 148846, "epoch": 3543} {"train_loss": -6.757746741885231, "global_step": 148847, "epoch": 3543, "val_loss": 68395.3984375} {"train_loss": -6.755613803863525, "global_step": 148848, "epoch": 3544} {"train_loss": -6.75827693939209, "global_step": 148849, "epoch": 3544} {"train_loss": -6.689503192901611, "global_step": 148850, "epoch": 3544} {"train_loss": -6.8760786056518555, "global_step": 148851, "epoch": 3544} {"train_loss": -6.7528228759765625, "global_step": 148852, "epoch": 3544} {"train_loss": -6.7403130531311035, "global_step": 148853, "epoch": 3544} {"train_loss": -6.654419898986816, "global_step": 148854, "epoch": 3544} {"train_loss": -6.73570442199707, "global_step": 148855, "epoch": 3544} {"train_loss": -6.598166465759277, "global_step": 148856, "epoch": 3544} {"train_loss": -6.716817378997803, "global_step": 148857, "epoch": 3544} {"train_loss": -6.654858589172363, "global_step": 148858, "epoch": 3544} {"train_loss": -6.664035797119141, "global_step": 148859, "epoch": 3544} {"train_loss": -6.7500481605529785, "global_step": 148860, "epoch": 3544} {"train_loss": -6.758387565612793, "global_step": 148861, "epoch": 3544} {"train_loss": -6.776593208312988, "global_step": 148862, "epoch": 3544} {"train_loss": -6.662906169891357, "global_step": 148863, "epoch": 3544} {"train_loss": -6.777538299560547, "global_step": 148864, "epoch": 3544} {"train_loss": -6.777669906616211, "global_step": 148865, "epoch": 3544} {"train_loss": -6.821410655975342, "global_step": 148866, "epoch": 3544} {"train_loss": -6.805339336395264, "global_step": 148867, "epoch": 3544} {"train_loss": -6.687459945678711, "global_step": 148868, "epoch": 3544} {"train_loss": -6.824702739715576, "global_step": 148869, "epoch": 3544} {"train_loss": -6.735170364379883, "global_step": 148870, "epoch": 3544} {"train_loss": -6.782821178436279, "global_step": 148871, "epoch": 3544} {"train_loss": -6.681977272033691, "global_step": 148872, "epoch": 3544} {"train_loss": -6.8813934326171875, "global_step": 148873, "epoch": 3544} {"train_loss": -6.7748003005981445, "global_step": 148874, "epoch": 3544} {"train_loss": -6.7299089431762695, "global_step": 148875, "epoch": 3544} {"train_loss": -6.840651988983154, "global_step": 148876, "epoch": 3544} {"train_loss": -6.854741096496582, "global_step": 148877, "epoch": 3544} {"train_loss": -6.733867645263672, "global_step": 148878, "epoch": 3544} {"train_loss": -6.819408416748047, "global_step": 148879, "epoch": 3544} {"train_loss": -6.777054786682129, "global_step": 148880, "epoch": 3544} {"train_loss": -6.814655780792236, "global_step": 148881, "epoch": 3544} {"train_loss": -6.715318202972412, "global_step": 148882, "epoch": 3544} {"train_loss": -6.825292587280273, "global_step": 148883, "epoch": 3544} {"train_loss": -6.831484794616699, "global_step": 148884, "epoch": 3544} {"train_loss": -6.87523078918457, "global_step": 148885, "epoch": 3544} {"train_loss": -6.822658538818359, "global_step": 148886, "epoch": 3544} {"train_loss": -6.734443664550781, "global_step": 148887, "epoch": 3544} {"train_loss": -6.809613227844238, "global_step": 148888, "epoch": 3544} {"train_loss": -6.766779717944917, "global_step": 148889, "epoch": 3544, "val_loss": 68577.9453125} {"train_loss": -6.792842388153076, "global_step": 148890, "epoch": 3545} {"train_loss": -6.82914924621582, "global_step": 148891, "epoch": 3545} {"train_loss": -6.713228702545166, "global_step": 148892, "epoch": 3545} {"train_loss": -6.699742794036865, "global_step": 148893, "epoch": 3545} {"train_loss": -6.748898029327393, "global_step": 148894, "epoch": 3545} {"train_loss": -6.863410949707031, "global_step": 148895, "epoch": 3545} {"train_loss": -6.723145484924316, "global_step": 148896, "epoch": 3545} {"train_loss": -6.7458343505859375, "global_step": 148897, "epoch": 3545} {"train_loss": -6.873534202575684, "global_step": 148898, "epoch": 3545} {"train_loss": -6.65383768081665, "global_step": 148899, "epoch": 3545} {"train_loss": -6.832881927490234, "global_step": 148900, "epoch": 3545} {"train_loss": -6.7501726150512695, "global_step": 148901, "epoch": 3545} {"train_loss": -6.755084991455078, "global_step": 148902, "epoch": 3545} {"train_loss": -6.755779266357422, "global_step": 148903, "epoch": 3545} {"train_loss": -6.780509948730469, "global_step": 148904, "epoch": 3545} {"train_loss": -6.698871612548828, "global_step": 148905, "epoch": 3545} {"train_loss": -6.773972511291504, "global_step": 148906, "epoch": 3545} {"train_loss": -6.632645130157471, "global_step": 148907, "epoch": 3545} {"train_loss": -6.720499038696289, "global_step": 148908, "epoch": 3545} {"train_loss": -6.702669620513916, "global_step": 148909, "epoch": 3545} {"train_loss": -6.528707027435303, "global_step": 148910, "epoch": 3545} {"train_loss": -6.690208435058594, "global_step": 148911, "epoch": 3545} {"train_loss": -6.625433444976807, "global_step": 148912, "epoch": 3545} {"train_loss": -6.702122688293457, "global_step": 148913, "epoch": 3545} {"train_loss": -6.562236785888672, "global_step": 148914, "epoch": 3545} {"train_loss": -6.566965579986572, "global_step": 148915, "epoch": 3545} {"train_loss": -6.734915733337402, "global_step": 148916, "epoch": 3545} {"train_loss": -6.7154693603515625, "global_step": 148917, "epoch": 3545} {"train_loss": -6.783176898956299, "global_step": 148918, "epoch": 3545} {"train_loss": -6.704028129577637, "global_step": 148919, "epoch": 3545} {"train_loss": -6.7779693603515625, "global_step": 148920, "epoch": 3545} {"train_loss": -6.804361820220947, "global_step": 148921, "epoch": 3545} {"train_loss": -6.630987167358398, "global_step": 148922, "epoch": 3545} {"train_loss": -6.708451271057129, "global_step": 148923, "epoch": 3545} {"train_loss": -6.7029266357421875, "global_step": 148924, "epoch": 3545} {"train_loss": -6.731349945068359, "global_step": 148925, "epoch": 3545} {"train_loss": -6.69305944442749, "global_step": 148926, "epoch": 3545} {"train_loss": -6.9303998947143555, "global_step": 148927, "epoch": 3545} {"train_loss": -6.787766456604004, "global_step": 148928, "epoch": 3545} {"train_loss": -6.709496021270752, "global_step": 148929, "epoch": 3545} {"train_loss": -6.840672492980957, "global_step": 148930, "epoch": 3545} {"train_loss": -6.730908405213129, "global_step": 148931, "epoch": 3545, "val_loss": 68396.7734375} {"train_loss": -6.79172420501709, "global_step": 148932, "epoch": 3546} {"train_loss": -6.773820877075195, "global_step": 148933, "epoch": 3546} {"train_loss": -6.769076824188232, "global_step": 148934, "epoch": 3546} {"train_loss": -6.748177528381348, "global_step": 148935, "epoch": 3546} {"train_loss": -6.780179977416992, "global_step": 148936, "epoch": 3546} {"train_loss": -6.803993225097656, "global_step": 148937, "epoch": 3546} {"train_loss": -6.843808174133301, "global_step": 148938, "epoch": 3546} {"train_loss": -6.818389892578125, "global_step": 148939, "epoch": 3546} {"train_loss": -6.750919342041016, "global_step": 148940, "epoch": 3546} {"train_loss": -6.8665876388549805, "global_step": 148941, "epoch": 3546} {"train_loss": -6.869951248168945, "global_step": 148942, "epoch": 3546} {"train_loss": -6.842046737670898, "global_step": 148943, "epoch": 3546} {"train_loss": -6.857211112976074, "global_step": 148944, "epoch": 3546} {"train_loss": -6.823001861572266, "global_step": 148945, "epoch": 3546} {"train_loss": -6.77021598815918, "global_step": 148946, "epoch": 3546} {"train_loss": -6.767691135406494, "global_step": 148947, "epoch": 3546} {"train_loss": -6.7423481941223145, "global_step": 148948, "epoch": 3546} {"train_loss": -6.736752510070801, "global_step": 148949, "epoch": 3546} {"train_loss": -6.846554279327393, "global_step": 148950, "epoch": 3546} {"train_loss": -6.802347660064697, "global_step": 148951, "epoch": 3546} {"train_loss": -6.837642669677734, "global_step": 148952, "epoch": 3546} {"train_loss": -6.831966400146484, "global_step": 148953, "epoch": 3546} {"train_loss": -6.806554794311523, "global_step": 148954, "epoch": 3546} {"train_loss": -6.8616838455200195, "global_step": 148955, "epoch": 3546} {"train_loss": -6.864623069763184, "global_step": 148956, "epoch": 3546} {"train_loss": -6.828695774078369, "global_step": 148957, "epoch": 3546} {"train_loss": -6.835675239562988, "global_step": 148958, "epoch": 3546} {"train_loss": -6.76137638092041, "global_step": 148959, "epoch": 3546} {"train_loss": -6.9294586181640625, "global_step": 148960, "epoch": 3546} {"train_loss": -6.7918009757995605, "global_step": 148961, "epoch": 3546} {"train_loss": -6.841728210449219, "global_step": 148962, "epoch": 3546} {"train_loss": -6.738887786865234, "global_step": 148963, "epoch": 3546} {"train_loss": -6.7940168380737305, "global_step": 148964, "epoch": 3546} {"train_loss": -6.892110824584961, "global_step": 148965, "epoch": 3546} {"train_loss": -6.847207069396973, "global_step": 148966, "epoch": 3546} {"train_loss": -6.748313903808594, "global_step": 148967, "epoch": 3546} {"train_loss": -6.79160213470459, "global_step": 148968, "epoch": 3546} {"train_loss": -6.817379951477051, "global_step": 148969, "epoch": 3546} {"train_loss": -6.742664337158203, "global_step": 148970, "epoch": 3546} {"train_loss": -6.822512626647949, "global_step": 148971, "epoch": 3546} {"train_loss": -6.774850845336914, "global_step": 148972, "epoch": 3546} {"train_loss": -6.8099915981292725, "global_step": 148973, "epoch": 3546, "val_loss": 68481.578125} {"train_loss": -6.830092430114746, "global_step": 148974, "epoch": 3547} {"train_loss": -6.824610710144043, "global_step": 148975, "epoch": 3547} {"train_loss": -6.851248741149902, "global_step": 148976, "epoch": 3547} {"train_loss": -6.816876411437988, "global_step": 148977, "epoch": 3547} {"train_loss": -6.8752665519714355, "global_step": 148978, "epoch": 3547} {"train_loss": -6.886091232299805, "global_step": 148979, "epoch": 3547} {"train_loss": -6.843911170959473, "global_step": 148980, "epoch": 3547} {"train_loss": -6.74176025390625, "global_step": 148981, "epoch": 3547} {"train_loss": -6.834954261779785, "global_step": 148982, "epoch": 3547} {"train_loss": -6.867289066314697, "global_step": 148983, "epoch": 3547} {"train_loss": -6.805522918701172, "global_step": 148984, "epoch": 3547} {"train_loss": -6.926070213317871, "global_step": 148985, "epoch": 3547} {"train_loss": -6.716796398162842, "global_step": 148986, "epoch": 3547} {"train_loss": -6.814165115356445, "global_step": 148987, "epoch": 3547} {"train_loss": -6.907998085021973, "global_step": 148988, "epoch": 3547} {"train_loss": -6.773656845092773, "global_step": 148989, "epoch": 3547} {"train_loss": -7.017287254333496, "global_step": 148990, "epoch": 3547} {"train_loss": -6.850011825561523, "global_step": 148991, "epoch": 3547} {"train_loss": -6.840240001678467, "global_step": 148992, "epoch": 3547} {"train_loss": -6.745868682861328, "global_step": 148993, "epoch": 3547} {"train_loss": -6.810049533843994, "global_step": 148994, "epoch": 3547} {"train_loss": -6.744441032409668, "global_step": 148995, "epoch": 3547} {"train_loss": -6.90093994140625, "global_step": 148996, "epoch": 3547} {"train_loss": -6.813928604125977, "global_step": 148997, "epoch": 3547} {"train_loss": -6.896940231323242, "global_step": 148998, "epoch": 3547} {"train_loss": -6.713875770568848, "global_step": 148999, "epoch": 3547} {"train_loss": -6.841934680938721, "global_step": 149000, "epoch": 3547} {"train_loss": -6.704963684082031, "global_step": 149001, "epoch": 3547} {"train_loss": -6.798868179321289, "global_step": 149002, "epoch": 3547} {"train_loss": -6.79202938079834, "global_step": 149003, "epoch": 3547} {"train_loss": -6.611428260803223, "global_step": 149004, "epoch": 3547} {"train_loss": -6.855215549468994, "global_step": 149005, "epoch": 3547} {"train_loss": -6.719732284545898, "global_step": 149006, "epoch": 3547} {"train_loss": -6.704617023468018, "global_step": 149007, "epoch": 3547} {"train_loss": -6.786345481872559, "global_step": 149008, "epoch": 3547} {"train_loss": -6.707756042480469, "global_step": 149009, "epoch": 3547} {"train_loss": -6.909882545471191, "global_step": 149010, "epoch": 3547} {"train_loss": -6.637526512145996, "global_step": 149011, "epoch": 3547} {"train_loss": -6.846229553222656, "global_step": 149012, "epoch": 3547} {"train_loss": -6.688420295715332, "global_step": 149013, "epoch": 3547} {"train_loss": -6.678178310394287, "global_step": 149014, "epoch": 3547} {"train_loss": -6.801847707657587, "global_step": 149015, "epoch": 3547, "val_loss": 68307.6953125} {"train_loss": -6.71491813659668, "global_step": 149016, "epoch": 3548} {"train_loss": -6.7198381423950195, "global_step": 149017, "epoch": 3548} {"train_loss": -6.783604621887207, "global_step": 149018, "epoch": 3548} {"train_loss": -6.776798248291016, "global_step": 149019, "epoch": 3548} {"train_loss": -6.6797285079956055, "global_step": 149020, "epoch": 3548} {"train_loss": -6.74086856842041, "global_step": 149021, "epoch": 3548} {"train_loss": -6.676125526428223, "global_step": 149022, "epoch": 3548} {"train_loss": -6.8152546882629395, "global_step": 149023, "epoch": 3548} {"train_loss": -6.691874027252197, "global_step": 149024, "epoch": 3548} {"train_loss": -6.7288360595703125, "global_step": 149025, "epoch": 3548} {"train_loss": -6.747790336608887, "global_step": 149026, "epoch": 3548} {"train_loss": -6.684867858886719, "global_step": 149027, "epoch": 3548} {"train_loss": -6.715705871582031, "global_step": 149028, "epoch": 3548} {"train_loss": -6.847875595092773, "global_step": 149029, "epoch": 3548} {"train_loss": -6.736101150512695, "global_step": 149030, "epoch": 3548} {"train_loss": -6.851716995239258, "global_step": 149031, "epoch": 3548} {"train_loss": -6.689940452575684, "global_step": 149032, "epoch": 3548} {"train_loss": -6.854104518890381, "global_step": 149033, "epoch": 3548} {"train_loss": -6.737387657165527, "global_step": 149034, "epoch": 3548} {"train_loss": -6.688022613525391, "global_step": 149035, "epoch": 3548} {"train_loss": -6.86789608001709, "global_step": 149036, "epoch": 3548} {"train_loss": -6.624025344848633, "global_step": 149037, "epoch": 3548} {"train_loss": -6.859313011169434, "global_step": 149038, "epoch": 3548} {"train_loss": -6.815495491027832, "global_step": 149039, "epoch": 3548} {"train_loss": -6.730227947235107, "global_step": 149040, "epoch": 3548} {"train_loss": -6.755603313446045, "global_step": 149041, "epoch": 3548} {"train_loss": -6.733323097229004, "global_step": 149042, "epoch": 3548} {"train_loss": -6.9103922843933105, "global_step": 149043, "epoch": 3548} {"train_loss": -6.655440330505371, "global_step": 149044, "epoch": 3548} {"train_loss": -6.826935768127441, "global_step": 149045, "epoch": 3548} {"train_loss": -6.736922264099121, "global_step": 149046, "epoch": 3548} {"train_loss": -6.706979274749756, "global_step": 149047, "epoch": 3548} {"train_loss": -6.755390644073486, "global_step": 149048, "epoch": 3548} {"train_loss": -6.7307634353637695, "global_step": 149049, "epoch": 3548} {"train_loss": -6.754560470581055, "global_step": 149050, "epoch": 3548} {"train_loss": -6.866422653198242, "global_step": 149051, "epoch": 3548} {"train_loss": -6.692142486572266, "global_step": 149052, "epoch": 3548} {"train_loss": -6.748254776000977, "global_step": 149053, "epoch": 3548} {"train_loss": -6.689383506774902, "global_step": 149054, "epoch": 3548} {"train_loss": -6.8654656410217285, "global_step": 149055, "epoch": 3548} {"train_loss": -6.74947452545166, "global_step": 149056, "epoch": 3548} {"train_loss": -6.75472921416873, "global_step": 149057, "epoch": 3548, "val_loss": 68348.453125} {"train_loss": -6.860159873962402, "global_step": 149058, "epoch": 3549} {"train_loss": -6.769749164581299, "global_step": 149059, "epoch": 3549} {"train_loss": -6.678591728210449, "global_step": 149060, "epoch": 3549} {"train_loss": -6.670166969299316, "global_step": 149061, "epoch": 3549} {"train_loss": -6.8669114112854, "global_step": 149062, "epoch": 3549} {"train_loss": -6.857429504394531, "global_step": 149063, "epoch": 3549} {"train_loss": -6.672092437744141, "global_step": 149064, "epoch": 3549} {"train_loss": -6.795879364013672, "global_step": 149065, "epoch": 3549} {"train_loss": -6.861739158630371, "global_step": 149066, "epoch": 3549} {"train_loss": -6.813163757324219, "global_step": 149067, "epoch": 3549} {"train_loss": -6.78475284576416, "global_step": 149068, "epoch": 3549} {"train_loss": -6.918480396270752, "global_step": 149069, "epoch": 3549} {"train_loss": -6.872154235839844, "global_step": 149070, "epoch": 3549} {"train_loss": -6.813918113708496, "global_step": 149071, "epoch": 3549} {"train_loss": -6.917598247528076, "global_step": 149072, "epoch": 3549} {"train_loss": -6.750826835632324, "global_step": 149073, "epoch": 3549} {"train_loss": -6.778883934020996, "global_step": 149074, "epoch": 3549} {"train_loss": -6.758798599243164, "global_step": 149075, "epoch": 3549} {"train_loss": -6.826800346374512, "global_step": 149076, "epoch": 3549} {"train_loss": -6.911539554595947, "global_step": 149077, "epoch": 3549} {"train_loss": -6.78441047668457, "global_step": 149078, "epoch": 3549} {"train_loss": -6.800541877746582, "global_step": 149079, "epoch": 3549} {"train_loss": -6.800116062164307, "global_step": 149080, "epoch": 3549} {"train_loss": -6.844399929046631, "global_step": 149081, "epoch": 3549} {"train_loss": -6.835731029510498, "global_step": 149082, "epoch": 3549} {"train_loss": -6.939703941345215, "global_step": 149083, "epoch": 3549} {"train_loss": -6.755850791931152, "global_step": 149084, "epoch": 3549} {"train_loss": -6.904025077819824, "global_step": 149085, "epoch": 3549} {"train_loss": -6.883365154266357, "global_step": 149086, "epoch": 3549} {"train_loss": -6.853232383728027, "global_step": 149087, "epoch": 3549} {"train_loss": -6.795039176940918, "global_step": 149088, "epoch": 3549} {"train_loss": -6.797908782958984, "global_step": 149089, "epoch": 3549} {"train_loss": -6.858044624328613, "global_step": 149090, "epoch": 3549} {"train_loss": -6.804394721984863, "global_step": 149091, "epoch": 3549} {"train_loss": -6.73388671875, "global_step": 149092, "epoch": 3549} {"train_loss": -6.861660957336426, "global_step": 149093, "epoch": 3549} {"train_loss": -6.7729668617248535, "global_step": 149094, "epoch": 3549} {"train_loss": -6.899749755859375, "global_step": 149095, "epoch": 3549} {"train_loss": -6.847357749938965, "global_step": 149096, "epoch": 3549} {"train_loss": -6.846348762512207, "global_step": 149097, "epoch": 3549} {"train_loss": -6.719676971435547, "global_step": 149098, "epoch": 3549} {"train_loss": -6.815831104914348, "global_step": 149099, "epoch": 3549, "val_loss": 68258.0546875} {"train_loss": -6.796189308166504, "global_step": 149100, "epoch": 3550} {"train_loss": -6.754555702209473, "global_step": 149101, "epoch": 3550} {"train_loss": -6.79044246673584, "global_step": 149102, "epoch": 3550} {"train_loss": -6.762363433837891, "global_step": 149103, "epoch": 3550} {"train_loss": -6.820364952087402, "global_step": 149104, "epoch": 3550} {"train_loss": -6.751241683959961, "global_step": 149105, "epoch": 3550} {"train_loss": -6.827488422393799, "global_step": 149106, "epoch": 3550} {"train_loss": -6.8399248123168945, "global_step": 149107, "epoch": 3550} {"train_loss": -6.7616071701049805, "global_step": 149108, "epoch": 3550} {"train_loss": -6.789830684661865, "global_step": 149109, "epoch": 3550} {"train_loss": -6.9052839279174805, "global_step": 149110, "epoch": 3550} {"train_loss": -6.8733367919921875, "global_step": 149111, "epoch": 3550} {"train_loss": -6.69950008392334, "global_step": 149112, "epoch": 3550} {"train_loss": -6.88819694519043, "global_step": 149113, "epoch": 3550} {"train_loss": -6.765789985656738, "global_step": 149114, "epoch": 3550} {"train_loss": -6.655117988586426, "global_step": 149115, "epoch": 3550} {"train_loss": -6.781775951385498, "global_step": 149116, "epoch": 3550} {"train_loss": -6.701974391937256, "global_step": 149117, "epoch": 3550} {"train_loss": -6.807479381561279, "global_step": 149118, "epoch": 3550} {"train_loss": -6.639039993286133, "global_step": 149119, "epoch": 3550} {"train_loss": -6.840956687927246, "global_step": 149120, "epoch": 3550} {"train_loss": -6.695102691650391, "global_step": 149121, "epoch": 3550} {"train_loss": -6.821296691894531, "global_step": 149122, "epoch": 3550} {"train_loss": -6.910041809082031, "global_step": 149123, "epoch": 3550} {"train_loss": -6.716324806213379, "global_step": 149124, "epoch": 3550} {"train_loss": -6.702478885650635, "global_step": 149125, "epoch": 3550} {"train_loss": -6.769126892089844, "global_step": 149126, "epoch": 3550} {"train_loss": -6.705725193023682, "global_step": 149127, "epoch": 3550} {"train_loss": -6.836512088775635, "global_step": 149128, "epoch": 3550} {"train_loss": -6.8106279373168945, "global_step": 149129, "epoch": 3550} {"train_loss": -6.739346027374268, "global_step": 149130, "epoch": 3550} {"train_loss": -6.6956377029418945, "global_step": 149131, "epoch": 3550} {"train_loss": -6.795220375061035, "global_step": 149132, "epoch": 3550} {"train_loss": -6.650697708129883, "global_step": 149133, "epoch": 3550} {"train_loss": -6.88132381439209, "global_step": 149134, "epoch": 3550} {"train_loss": -6.772568702697754, "global_step": 149135, "epoch": 3550} {"train_loss": -6.712337017059326, "global_step": 149136, "epoch": 3550} {"train_loss": -6.771003723144531, "global_step": 149137, "epoch": 3550} {"train_loss": -6.786961078643799, "global_step": 149138, "epoch": 3550} {"train_loss": -6.799057483673096, "global_step": 149139, "epoch": 3550} {"train_loss": -6.740485191345215, "global_step": 149140, "epoch": 3550} {"train_loss": -6.776196740922474, "global_step": 149141, "epoch": 3550, "train/sim_max_reward_0": 0.2206844243529268, "train/sim_max_reward_1": 0.26714573115208984, "train/sim_max_reward_2": 0.26341766396545147, "train/sim_max_reward_3": 0.9637021537236086, "train/sim_max_reward_4": 0.40713399109659465, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.19843256953086388, "test/sim_max_reward_4400001": 0.8718387709861215, "test/sim_max_reward_4400002": 0.3519347671223452, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9271462904517792, "test/sim_max_reward_4400007": 0.8629093629882798, "test/sim_max_reward_4400008": 0.31741963561360215, "test/sim_max_reward_4400009": 0.9437185996238573, "test/sim_max_reward_4400010": 0.36257558330348383, "test/sim_max_reward_4400011": 0.08300850891307628, "test/sim_max_reward_4400012": 0.8456703077987567, "test/sim_max_reward_4400013": 0.4392414531993333, "test/sim_max_reward_4400014": 0.3666686817456986, "test/sim_max_reward_4400015": 0.13393092723391883, "test/sim_max_reward_4400016": 0.07905455157458312, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23724633203848167, "test/sim_max_reward_4400019": 0.5579976952229702, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9472667263038238, "test/sim_max_reward_4400023": 0.9993602850940773, "test/sim_max_reward_4400024": 0.9749934376209353, "test/sim_max_reward_4400025": 0.26376556870219386, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.07013657605221003, "test/sim_max_reward_4400028": 0.6192719982554412, "test/sim_max_reward_4400029": 0.941094415271659, "test/sim_max_reward_4400030": 0.9474415004903184, "test/sim_max_reward_4400031": 0.3853251262983415, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.993859138799289, "test/sim_max_reward_4400034": 0.6709906023748105, "test/sim_max_reward_4400035": 0.4163503158935367, "test/sim_max_reward_4400036": 0.3976273207080227, "test/sim_max_reward_4400037": 0.9182920937481563, "test/sim_max_reward_4400038": 0.7836738244782557, "test/sim_max_reward_4400039": 0.8576481116275786, "test/sim_max_reward_4400040": 0.3525021522127686, "test/sim_max_reward_4400041": 0.987106784592495, "test/sim_max_reward_4400042": 0.7132819070438671, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.8770826736473744, "test/sim_max_reward_4400045": 0.9453120452237369, "test/sim_max_reward_4400046": 0.8993463661449952, "test/sim_max_reward_4400047": 0.9655379479551209, "test/sim_max_reward_4400048": 0.06009032261258787, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.5203473273817786, "test/mean_score": 0.5607876221774528, "val_loss": 68434.609375} {"train_loss": -6.735653400421143, "global_step": 149142, "epoch": 3551} {"train_loss": -6.834951877593994, "global_step": 149143, "epoch": 3551} {"train_loss": -6.851653575897217, "global_step": 149144, "epoch": 3551} {"train_loss": -6.896366119384766, "global_step": 149145, "epoch": 3551} {"train_loss": -6.881929397583008, "global_step": 149146, "epoch": 3551} {"train_loss": -6.847872734069824, "global_step": 149147, "epoch": 3551} {"train_loss": -6.7880144119262695, "global_step": 149148, "epoch": 3551} {"train_loss": -6.824372291564941, "global_step": 149149, "epoch": 3551} {"train_loss": -6.869278430938721, "global_step": 149150, "epoch": 3551} {"train_loss": -6.795656204223633, "global_step": 149151, "epoch": 3551} {"train_loss": -6.856152057647705, "global_step": 149152, "epoch": 3551} {"train_loss": -6.783935546875, "global_step": 149153, "epoch": 3551} {"train_loss": -6.802809715270996, "global_step": 149154, "epoch": 3551} {"train_loss": -6.70294189453125, "global_step": 149155, "epoch": 3551} {"train_loss": -6.788297176361084, "global_step": 149156, "epoch": 3551} {"train_loss": -6.861692428588867, "global_step": 149157, "epoch": 3551} {"train_loss": -6.712303161621094, "global_step": 149158, "epoch": 3551} {"train_loss": -6.857872009277344, "global_step": 149159, "epoch": 3551} {"train_loss": -6.86958122253418, "global_step": 149160, "epoch": 3551} {"train_loss": -6.736331939697266, "global_step": 149161, "epoch": 3551} {"train_loss": -6.750832557678223, "global_step": 149162, "epoch": 3551} {"train_loss": -6.875493049621582, "global_step": 149163, "epoch": 3551} {"train_loss": -6.831313133239746, "global_step": 149164, "epoch": 3551} {"train_loss": -6.8917036056518555, "global_step": 149165, "epoch": 3551} {"train_loss": -6.802691459655762, "global_step": 149166, "epoch": 3551} {"train_loss": -6.793027877807617, "global_step": 149167, "epoch": 3551} {"train_loss": -6.902016639709473, "global_step": 149168, "epoch": 3551} {"train_loss": -6.683480262756348, "global_step": 149169, "epoch": 3551} {"train_loss": -6.975236415863037, "global_step": 149170, "epoch": 3551} {"train_loss": -6.8751373291015625, "global_step": 149171, "epoch": 3551} {"train_loss": -6.903428554534912, "global_step": 149172, "epoch": 3551} {"train_loss": -6.877779960632324, "global_step": 149173, "epoch": 3551} {"train_loss": -6.896805286407471, "global_step": 149174, "epoch": 3551} {"train_loss": -6.818576812744141, "global_step": 149175, "epoch": 3551} {"train_loss": -6.813814163208008, "global_step": 149176, "epoch": 3551} {"train_loss": -6.833623886108398, "global_step": 149177, "epoch": 3551} {"train_loss": -6.8727312088012695, "global_step": 149178, "epoch": 3551} {"train_loss": -6.724382400512695, "global_step": 149179, "epoch": 3551} {"train_loss": -6.874251365661621, "global_step": 149180, "epoch": 3551} {"train_loss": -6.882241249084473, "global_step": 149181, "epoch": 3551} {"train_loss": -6.845308303833008, "global_step": 149182, "epoch": 3551} {"train_loss": -6.827998104549589, "global_step": 149183, "epoch": 3551, "val_loss": 68453.6953125} {"train_loss": -6.8808488845825195, "global_step": 149184, "epoch": 3552} {"train_loss": -6.838663101196289, "global_step": 149185, "epoch": 3552} {"train_loss": -6.79966926574707, "global_step": 149186, "epoch": 3552} {"train_loss": -6.7639994621276855, "global_step": 149187, "epoch": 3552} {"train_loss": -6.897510528564453, "global_step": 149188, "epoch": 3552} {"train_loss": -6.808262348175049, "global_step": 149189, "epoch": 3552} {"train_loss": -6.745588302612305, "global_step": 149190, "epoch": 3552} {"train_loss": -6.785898208618164, "global_step": 149191, "epoch": 3552} {"train_loss": -6.789534568786621, "global_step": 149192, "epoch": 3552} {"train_loss": -6.856945991516113, "global_step": 149193, "epoch": 3552} {"train_loss": -6.910586833953857, "global_step": 149194, "epoch": 3552} {"train_loss": -6.776445388793945, "global_step": 149195, "epoch": 3552} {"train_loss": -6.709558963775635, "global_step": 149196, "epoch": 3552} {"train_loss": -6.859772682189941, "global_step": 149197, "epoch": 3552} {"train_loss": -6.744146823883057, "global_step": 149198, "epoch": 3552} {"train_loss": -6.838133811950684, "global_step": 149199, "epoch": 3552} {"train_loss": -6.816762924194336, "global_step": 149200, "epoch": 3552} {"train_loss": -6.812262535095215, "global_step": 149201, "epoch": 3552} {"train_loss": -6.778633117675781, "global_step": 149202, "epoch": 3552} {"train_loss": -6.792479038238525, "global_step": 149203, "epoch": 3552} {"train_loss": -6.773877143859863, "global_step": 149204, "epoch": 3552} {"train_loss": -6.81788444519043, "global_step": 149205, "epoch": 3552} {"train_loss": -6.845647811889648, "global_step": 149206, "epoch": 3552} {"train_loss": -6.7343034744262695, "global_step": 149207, "epoch": 3552} {"train_loss": -6.745172500610352, "global_step": 149208, "epoch": 3552} {"train_loss": -6.680872440338135, "global_step": 149209, "epoch": 3552} {"train_loss": -6.671154022216797, "global_step": 149210, "epoch": 3552} {"train_loss": -6.783502578735352, "global_step": 149211, "epoch": 3552} {"train_loss": -6.778543472290039, "global_step": 149212, "epoch": 3552} {"train_loss": -6.73490047454834, "global_step": 149213, "epoch": 3552} {"train_loss": -6.818194389343262, "global_step": 149214, "epoch": 3552} {"train_loss": -6.7823286056518555, "global_step": 149215, "epoch": 3552} {"train_loss": -6.8556904792785645, "global_step": 149216, "epoch": 3552} {"train_loss": -6.816317558288574, "global_step": 149217, "epoch": 3552} {"train_loss": -6.84776496887207, "global_step": 149218, "epoch": 3552} {"train_loss": -6.789211750030518, "global_step": 149219, "epoch": 3552} {"train_loss": -6.781457901000977, "global_step": 149220, "epoch": 3552} {"train_loss": -6.861379623413086, "global_step": 149221, "epoch": 3552} {"train_loss": -6.699466705322266, "global_step": 149222, "epoch": 3552} {"train_loss": -6.830907821655273, "global_step": 149223, "epoch": 3552} {"train_loss": -6.854067802429199, "global_step": 149224, "epoch": 3552} {"train_loss": -6.7978398232232955, "global_step": 149225, "epoch": 3552, "val_loss": 68588.390625} {"train_loss": -6.863587856292725, "global_step": 149226, "epoch": 3553} {"train_loss": -6.859743118286133, "global_step": 149227, "epoch": 3553} {"train_loss": -6.765588283538818, "global_step": 149228, "epoch": 3553} {"train_loss": -6.815320014953613, "global_step": 149229, "epoch": 3553} {"train_loss": -6.73020601272583, "global_step": 149230, "epoch": 3553} {"train_loss": -6.837610721588135, "global_step": 149231, "epoch": 3553} {"train_loss": -6.7498626708984375, "global_step": 149232, "epoch": 3553} {"train_loss": -6.796375274658203, "global_step": 149233, "epoch": 3553} {"train_loss": -6.87409782409668, "global_step": 149234, "epoch": 3553} {"train_loss": -6.840822219848633, "global_step": 149235, "epoch": 3553} {"train_loss": -6.850033760070801, "global_step": 149236, "epoch": 3553} {"train_loss": -6.772317409515381, "global_step": 149237, "epoch": 3553} {"train_loss": -6.848241806030273, "global_step": 149238, "epoch": 3553} {"train_loss": -6.792793273925781, "global_step": 149239, "epoch": 3553} {"train_loss": -6.676242828369141, "global_step": 149240, "epoch": 3553} {"train_loss": -6.844841003417969, "global_step": 149241, "epoch": 3553} {"train_loss": -6.823866844177246, "global_step": 149242, "epoch": 3553} {"train_loss": -6.861614227294922, "global_step": 149243, "epoch": 3553} {"train_loss": -6.8625922203063965, "global_step": 149244, "epoch": 3553} {"train_loss": -6.802219390869141, "global_step": 149245, "epoch": 3553} {"train_loss": -6.851484298706055, "global_step": 149246, "epoch": 3553} {"train_loss": -6.7637176513671875, "global_step": 149247, "epoch": 3553} {"train_loss": -6.782586097717285, "global_step": 149248, "epoch": 3553} {"train_loss": -6.76395845413208, "global_step": 149249, "epoch": 3553} {"train_loss": -6.771801471710205, "global_step": 149250, "epoch": 3553} {"train_loss": -6.811483383178711, "global_step": 149251, "epoch": 3553} {"train_loss": -6.838953018188477, "global_step": 149252, "epoch": 3553} {"train_loss": -6.695976734161377, "global_step": 149253, "epoch": 3553} {"train_loss": -6.666062831878662, "global_step": 149254, "epoch": 3553} {"train_loss": -6.802513122558594, "global_step": 149255, "epoch": 3553} {"train_loss": -6.779719352722168, "global_step": 149256, "epoch": 3553} {"train_loss": -6.718189239501953, "global_step": 149257, "epoch": 3553} {"train_loss": -6.85455322265625, "global_step": 149258, "epoch": 3553} {"train_loss": -6.839550018310547, "global_step": 149259, "epoch": 3553} {"train_loss": -6.794430732727051, "global_step": 149260, "epoch": 3553} {"train_loss": -6.848354339599609, "global_step": 149261, "epoch": 3553} {"train_loss": -6.925515174865723, "global_step": 149262, "epoch": 3553} {"train_loss": -6.770375728607178, "global_step": 149263, "epoch": 3553} {"train_loss": -6.788565158843994, "global_step": 149264, "epoch": 3553} {"train_loss": -6.892641067504883, "global_step": 149265, "epoch": 3553} {"train_loss": -6.769442081451416, "global_step": 149266, "epoch": 3553} {"train_loss": -6.806537525994437, "global_step": 149267, "epoch": 3553, "val_loss": 68423.9375} {"train_loss": -6.83515739440918, "global_step": 149268, "epoch": 3554} {"train_loss": -6.76217794418335, "global_step": 149269, "epoch": 3554} {"train_loss": -6.830795764923096, "global_step": 149270, "epoch": 3554} {"train_loss": -6.912261009216309, "global_step": 149271, "epoch": 3554} {"train_loss": -6.866023063659668, "global_step": 149272, "epoch": 3554} {"train_loss": -6.676353454589844, "global_step": 149273, "epoch": 3554} {"train_loss": -6.732229709625244, "global_step": 149274, "epoch": 3554} {"train_loss": -6.771975517272949, "global_step": 149275, "epoch": 3554} {"train_loss": -6.846804141998291, "global_step": 149276, "epoch": 3554} {"train_loss": -6.901301860809326, "global_step": 149277, "epoch": 3554} {"train_loss": -6.888010025024414, "global_step": 149278, "epoch": 3554} {"train_loss": -6.8560943603515625, "global_step": 149279, "epoch": 3554} {"train_loss": -6.792837142944336, "global_step": 149280, "epoch": 3554} {"train_loss": -6.759730339050293, "global_step": 149281, "epoch": 3554} {"train_loss": -6.78090238571167, "global_step": 149282, "epoch": 3554} {"train_loss": -6.85706090927124, "global_step": 149283, "epoch": 3554} {"train_loss": -6.881650924682617, "global_step": 149284, "epoch": 3554} {"train_loss": -6.805778503417969, "global_step": 149285, "epoch": 3554} {"train_loss": -6.816282272338867, "global_step": 149286, "epoch": 3554} {"train_loss": -6.786643028259277, "global_step": 149287, "epoch": 3554} {"train_loss": -6.835911750793457, "global_step": 149288, "epoch": 3554} {"train_loss": -6.770602226257324, "global_step": 149289, "epoch": 3554} {"train_loss": -6.8293352127075195, "global_step": 149290, "epoch": 3554} {"train_loss": -6.843484878540039, "global_step": 149291, "epoch": 3554} {"train_loss": -6.89266300201416, "global_step": 149292, "epoch": 3554} {"train_loss": -6.876594066619873, "global_step": 149293, "epoch": 3554} {"train_loss": -6.771105766296387, "global_step": 149294, "epoch": 3554} {"train_loss": -6.776192665100098, "global_step": 149295, "epoch": 3554} {"train_loss": -6.756900787353516, "global_step": 149296, "epoch": 3554} {"train_loss": -6.892483234405518, "global_step": 149297, "epoch": 3554} {"train_loss": -6.807747840881348, "global_step": 149298, "epoch": 3554} {"train_loss": -6.748739719390869, "global_step": 149299, "epoch": 3554} {"train_loss": -6.809695243835449, "global_step": 149300, "epoch": 3554} {"train_loss": -6.890766143798828, "global_step": 149301, "epoch": 3554} {"train_loss": -6.815851211547852, "global_step": 149302, "epoch": 3554} {"train_loss": -6.848165512084961, "global_step": 149303, "epoch": 3554} {"train_loss": -6.787938117980957, "global_step": 149304, "epoch": 3554} {"train_loss": -6.860958576202393, "global_step": 149305, "epoch": 3554} {"train_loss": -6.738015651702881, "global_step": 149306, "epoch": 3554} {"train_loss": -6.733242034912109, "global_step": 149307, "epoch": 3554} {"train_loss": -6.906420707702637, "global_step": 149308, "epoch": 3554} {"train_loss": -6.819939488456363, "global_step": 149309, "epoch": 3554, "val_loss": 68637.0625} {"train_loss": -6.773392677307129, "global_step": 149310, "epoch": 3555} {"train_loss": -6.842437744140625, "global_step": 149311, "epoch": 3555} {"train_loss": -6.84068489074707, "global_step": 149312, "epoch": 3555} {"train_loss": -6.799586296081543, "global_step": 149313, "epoch": 3555} {"train_loss": -6.764537811279297, "global_step": 149314, "epoch": 3555} {"train_loss": -6.716225624084473, "global_step": 149315, "epoch": 3555} {"train_loss": -6.715406894683838, "global_step": 149316, "epoch": 3555} {"train_loss": -6.750077247619629, "global_step": 149317, "epoch": 3555} {"train_loss": -6.7380242347717285, "global_step": 149318, "epoch": 3555} {"train_loss": -6.800329208374023, "global_step": 149319, "epoch": 3555} {"train_loss": -6.863772392272949, "global_step": 149320, "epoch": 3555} {"train_loss": -6.860209941864014, "global_step": 149321, "epoch": 3555} {"train_loss": -6.740722179412842, "global_step": 149322, "epoch": 3555} {"train_loss": -6.832763671875, "global_step": 149323, "epoch": 3555} {"train_loss": -6.874446868896484, "global_step": 149324, "epoch": 3555} {"train_loss": -6.701320648193359, "global_step": 149325, "epoch": 3555} {"train_loss": -6.839076995849609, "global_step": 149326, "epoch": 3555} {"train_loss": -6.756755352020264, "global_step": 149327, "epoch": 3555} {"train_loss": -6.846308708190918, "global_step": 149328, "epoch": 3555} {"train_loss": -6.772378444671631, "global_step": 149329, "epoch": 3555} {"train_loss": -6.75386905670166, "global_step": 149330, "epoch": 3555} {"train_loss": -6.690167427062988, "global_step": 149331, "epoch": 3555} {"train_loss": -6.856051445007324, "global_step": 149332, "epoch": 3555} {"train_loss": -6.772004127502441, "global_step": 149333, "epoch": 3555} {"train_loss": -6.804657459259033, "global_step": 149334, "epoch": 3555} {"train_loss": -6.732790470123291, "global_step": 149335, "epoch": 3555} {"train_loss": -6.721349716186523, "global_step": 149336, "epoch": 3555} {"train_loss": -6.870060920715332, "global_step": 149337, "epoch": 3555} {"train_loss": -6.841259002685547, "global_step": 149338, "epoch": 3555} {"train_loss": -6.798863887786865, "global_step": 149339, "epoch": 3555} {"train_loss": -6.744046211242676, "global_step": 149340, "epoch": 3555} {"train_loss": -6.863217830657959, "global_step": 149341, "epoch": 3555} {"train_loss": -6.754935264587402, "global_step": 149342, "epoch": 3555} {"train_loss": -6.6623406410217285, "global_step": 149343, "epoch": 3555} {"train_loss": -6.782219409942627, "global_step": 149344, "epoch": 3555} {"train_loss": -6.6544084548950195, "global_step": 149345, "epoch": 3555} {"train_loss": -6.762558937072754, "global_step": 149346, "epoch": 3555} {"train_loss": -6.779521942138672, "global_step": 149347, "epoch": 3555} {"train_loss": -6.781252861022949, "global_step": 149348, "epoch": 3555} {"train_loss": -6.708651065826416, "global_step": 149349, "epoch": 3555} {"train_loss": -6.646397590637207, "global_step": 149350, "epoch": 3555} {"train_loss": -6.778427282969157, "global_step": 149351, "epoch": 3555, "val_loss": 68210.4921875} {"train_loss": -6.73651123046875, "global_step": 149352, "epoch": 3556} {"train_loss": -6.719337463378906, "global_step": 149353, "epoch": 3556} {"train_loss": -6.7697529792785645, "global_step": 149354, "epoch": 3556} {"train_loss": -6.706392288208008, "global_step": 149355, "epoch": 3556} {"train_loss": -6.783446311950684, "global_step": 149356, "epoch": 3556} {"train_loss": -6.679315567016602, "global_step": 149357, "epoch": 3556} {"train_loss": -6.825016021728516, "global_step": 149358, "epoch": 3556} {"train_loss": -6.778294563293457, "global_step": 149359, "epoch": 3556} {"train_loss": -6.698733329772949, "global_step": 149360, "epoch": 3556} {"train_loss": -6.862578868865967, "global_step": 149361, "epoch": 3556} {"train_loss": -6.712640285491943, "global_step": 149362, "epoch": 3556} {"train_loss": -6.75023078918457, "global_step": 149363, "epoch": 3556} {"train_loss": -6.6651129722595215, "global_step": 149364, "epoch": 3556} {"train_loss": -6.709583282470703, "global_step": 149365, "epoch": 3556} {"train_loss": -6.692817687988281, "global_step": 149366, "epoch": 3556} {"train_loss": -6.651406764984131, "global_step": 149367, "epoch": 3556} {"train_loss": -6.705053329467773, "global_step": 149368, "epoch": 3556} {"train_loss": -6.748407363891602, "global_step": 149369, "epoch": 3556} {"train_loss": -6.71163272857666, "global_step": 149370, "epoch": 3556} {"train_loss": -6.78102970123291, "global_step": 149371, "epoch": 3556} {"train_loss": -6.754904747009277, "global_step": 149372, "epoch": 3556} {"train_loss": -6.690793991088867, "global_step": 149373, "epoch": 3556} {"train_loss": -6.806129455566406, "global_step": 149374, "epoch": 3556} {"train_loss": -6.667151927947998, "global_step": 149375, "epoch": 3556} {"train_loss": -6.797208309173584, "global_step": 149376, "epoch": 3556} {"train_loss": -6.834506988525391, "global_step": 149377, "epoch": 3556} {"train_loss": -6.85012149810791, "global_step": 149378, "epoch": 3556} {"train_loss": -6.720119953155518, "global_step": 149379, "epoch": 3556} {"train_loss": -6.722193717956543, "global_step": 149380, "epoch": 3556} {"train_loss": -6.72146463394165, "global_step": 149381, "epoch": 3556} {"train_loss": -6.703671932220459, "global_step": 149382, "epoch": 3556} {"train_loss": -6.757244110107422, "global_step": 149383, "epoch": 3556} {"train_loss": -6.744068622589111, "global_step": 149384, "epoch": 3556} {"train_loss": -6.830718517303467, "global_step": 149385, "epoch": 3556} {"train_loss": -6.768742561340332, "global_step": 149386, "epoch": 3556} {"train_loss": -6.696254253387451, "global_step": 149387, "epoch": 3556} {"train_loss": -6.806478023529053, "global_step": 149388, "epoch": 3556} {"train_loss": -6.766661643981934, "global_step": 149389, "epoch": 3556} {"train_loss": -6.831273078918457, "global_step": 149390, "epoch": 3556} {"train_loss": -6.894459247589111, "global_step": 149391, "epoch": 3556} {"train_loss": -6.790112495422363, "global_step": 149392, "epoch": 3556} {"train_loss": -6.752928370521182, "global_step": 149393, "epoch": 3556, "val_loss": 68418.0234375} {"train_loss": -6.838578224182129, "global_step": 149394, "epoch": 3557} {"train_loss": -6.811642646789551, "global_step": 149395, "epoch": 3557} {"train_loss": -6.856348991394043, "global_step": 149396, "epoch": 3557} {"train_loss": -6.813177108764648, "global_step": 149397, "epoch": 3557} {"train_loss": -6.771779537200928, "global_step": 149398, "epoch": 3557} {"train_loss": -6.759391784667969, "global_step": 149399, "epoch": 3557} {"train_loss": -6.842410087585449, "global_step": 149400, "epoch": 3557} {"train_loss": -6.852005481719971, "global_step": 149401, "epoch": 3557} {"train_loss": -6.8088836669921875, "global_step": 149402, "epoch": 3557} {"train_loss": -6.744744300842285, "global_step": 149403, "epoch": 3557} {"train_loss": -6.864208221435547, "global_step": 149404, "epoch": 3557} {"train_loss": -6.809166431427002, "global_step": 149405, "epoch": 3557} {"train_loss": -6.932971000671387, "global_step": 149406, "epoch": 3557} {"train_loss": -6.838688850402832, "global_step": 149407, "epoch": 3557} {"train_loss": -6.862322807312012, "global_step": 149408, "epoch": 3557} {"train_loss": -6.893068313598633, "global_step": 149409, "epoch": 3557} {"train_loss": -6.847680568695068, "global_step": 149410, "epoch": 3557} {"train_loss": -6.7986555099487305, "global_step": 149411, "epoch": 3557} {"train_loss": -6.82198429107666, "global_step": 149412, "epoch": 3557} {"train_loss": -6.661637306213379, "global_step": 149413, "epoch": 3557} {"train_loss": -6.832505226135254, "global_step": 149414, "epoch": 3557} {"train_loss": -6.75247859954834, "global_step": 149415, "epoch": 3557} {"train_loss": -6.809340476989746, "global_step": 149416, "epoch": 3557} {"train_loss": -6.7704668045043945, "global_step": 149417, "epoch": 3557} {"train_loss": -6.757287979125977, "global_step": 149418, "epoch": 3557} {"train_loss": -6.83439302444458, "global_step": 149419, "epoch": 3557} {"train_loss": -6.8970184326171875, "global_step": 149420, "epoch": 3557} {"train_loss": -6.849959373474121, "global_step": 149421, "epoch": 3557} {"train_loss": -6.731098651885986, "global_step": 149422, "epoch": 3557} {"train_loss": -6.928469181060791, "global_step": 149423, "epoch": 3557} {"train_loss": -6.881421089172363, "global_step": 149424, "epoch": 3557} {"train_loss": -6.928845405578613, "global_step": 149425, "epoch": 3557} {"train_loss": -6.830600261688232, "global_step": 149426, "epoch": 3557} {"train_loss": -6.777251720428467, "global_step": 149427, "epoch": 3557} {"train_loss": -6.778547286987305, "global_step": 149428, "epoch": 3557} {"train_loss": -6.802802562713623, "global_step": 149429, "epoch": 3557} {"train_loss": -6.844122886657715, "global_step": 149430, "epoch": 3557} {"train_loss": -6.819332122802734, "global_step": 149431, "epoch": 3557} {"train_loss": -6.931357383728027, "global_step": 149432, "epoch": 3557} {"train_loss": -6.854897975921631, "global_step": 149433, "epoch": 3557} {"train_loss": -6.860824108123779, "global_step": 149434, "epoch": 3557} {"train_loss": -6.826183046613421, "global_step": 149435, "epoch": 3557, "val_loss": 68340.171875} {"train_loss": -6.877535820007324, "global_step": 149436, "epoch": 3558} {"train_loss": -6.887834548950195, "global_step": 149437, "epoch": 3558} {"train_loss": -6.921070575714111, "global_step": 149438, "epoch": 3558} {"train_loss": -6.790063858032227, "global_step": 149439, "epoch": 3558} {"train_loss": -6.766056060791016, "global_step": 149440, "epoch": 3558} {"train_loss": -6.873856544494629, "global_step": 149441, "epoch": 3558} {"train_loss": -6.979564666748047, "global_step": 149442, "epoch": 3558} {"train_loss": -6.826392650604248, "global_step": 149443, "epoch": 3558} {"train_loss": -6.852823257446289, "global_step": 149444, "epoch": 3558} {"train_loss": -6.958247184753418, "global_step": 149445, "epoch": 3558} {"train_loss": -6.858869552612305, "global_step": 149446, "epoch": 3558} {"train_loss": -6.788120269775391, "global_step": 149447, "epoch": 3558} {"train_loss": -6.8614888191223145, "global_step": 149448, "epoch": 3558} {"train_loss": -6.776412010192871, "global_step": 149449, "epoch": 3558} {"train_loss": -6.84194278717041, "global_step": 149450, "epoch": 3558} {"train_loss": -6.868049621582031, "global_step": 149451, "epoch": 3558} {"train_loss": -6.905419826507568, "global_step": 149452, "epoch": 3558} {"train_loss": -6.782872200012207, "global_step": 149453, "epoch": 3558} {"train_loss": -6.911037445068359, "global_step": 149454, "epoch": 3558} {"train_loss": -6.805169105529785, "global_step": 149455, "epoch": 3558} {"train_loss": -6.890842914581299, "global_step": 149456, "epoch": 3558} {"train_loss": -6.785560607910156, "global_step": 149457, "epoch": 3558} {"train_loss": -6.827197551727295, "global_step": 149458, "epoch": 3558} {"train_loss": -6.8560791015625, "global_step": 149459, "epoch": 3558} {"train_loss": -6.8506598472595215, "global_step": 149460, "epoch": 3558} {"train_loss": -6.792794227600098, "global_step": 149461, "epoch": 3558} {"train_loss": -6.686332702636719, "global_step": 149462, "epoch": 3558} {"train_loss": -6.81181526184082, "global_step": 149463, "epoch": 3558} {"train_loss": -6.694454193115234, "global_step": 149464, "epoch": 3558} {"train_loss": -6.795937538146973, "global_step": 149465, "epoch": 3558} {"train_loss": -6.743298053741455, "global_step": 149466, "epoch": 3558} {"train_loss": -6.74519157409668, "global_step": 149467, "epoch": 3558} {"train_loss": -6.764665603637695, "global_step": 149468, "epoch": 3558} {"train_loss": -6.782402038574219, "global_step": 149469, "epoch": 3558} {"train_loss": -6.773159980773926, "global_step": 149470, "epoch": 3558} {"train_loss": -6.747197151184082, "global_step": 149471, "epoch": 3558} {"train_loss": -6.7944111824035645, "global_step": 149472, "epoch": 3558} {"train_loss": -6.718833923339844, "global_step": 149473, "epoch": 3558} {"train_loss": -6.749912261962891, "global_step": 149474, "epoch": 3558} {"train_loss": -6.741353988647461, "global_step": 149475, "epoch": 3558} {"train_loss": -6.755319595336914, "global_step": 149476, "epoch": 3558} {"train_loss": -6.813545045398531, "global_step": 149477, "epoch": 3558, "val_loss": 68588.921875} {"train_loss": -6.716711521148682, "global_step": 149478, "epoch": 3559} {"train_loss": -6.837405204772949, "global_step": 149479, "epoch": 3559} {"train_loss": -6.656621932983398, "global_step": 149480, "epoch": 3559} {"train_loss": -6.751904487609863, "global_step": 149481, "epoch": 3559} {"train_loss": -6.7806396484375, "global_step": 149482, "epoch": 3559} {"train_loss": -6.82485294342041, "global_step": 149483, "epoch": 3559} {"train_loss": -6.73138427734375, "global_step": 149484, "epoch": 3559} {"train_loss": -6.719898223876953, "global_step": 149485, "epoch": 3559} {"train_loss": -6.759784698486328, "global_step": 149486, "epoch": 3559} {"train_loss": -6.617286205291748, "global_step": 149487, "epoch": 3559} {"train_loss": -6.7119855880737305, "global_step": 149488, "epoch": 3559} {"train_loss": -6.696532726287842, "global_step": 149489, "epoch": 3559} {"train_loss": -6.660749912261963, "global_step": 149490, "epoch": 3559} {"train_loss": -6.710824489593506, "global_step": 149491, "epoch": 3559} {"train_loss": -6.737794876098633, "global_step": 149492, "epoch": 3559} {"train_loss": -6.742060661315918, "global_step": 149493, "epoch": 3559} {"train_loss": -6.658432483673096, "global_step": 149494, "epoch": 3559} {"train_loss": -6.698578834533691, "global_step": 149495, "epoch": 3559} {"train_loss": -6.629543781280518, "global_step": 149496, "epoch": 3559} {"train_loss": -6.73989200592041, "global_step": 149497, "epoch": 3559} {"train_loss": -6.8238019943237305, "global_step": 149498, "epoch": 3559} {"train_loss": -6.688355445861816, "global_step": 149499, "epoch": 3559} {"train_loss": -6.813671588897705, "global_step": 149500, "epoch": 3559} {"train_loss": -6.853214740753174, "global_step": 149501, "epoch": 3559} {"train_loss": -6.774864196777344, "global_step": 149502, "epoch": 3559} {"train_loss": -6.819268226623535, "global_step": 149503, "epoch": 3559} {"train_loss": -6.819584846496582, "global_step": 149504, "epoch": 3559} {"train_loss": -6.790653705596924, "global_step": 149505, "epoch": 3559} {"train_loss": -6.784940719604492, "global_step": 149506, "epoch": 3559} {"train_loss": -6.874342918395996, "global_step": 149507, "epoch": 3559} {"train_loss": -6.792455673217773, "global_step": 149508, "epoch": 3559} {"train_loss": -6.695435523986816, "global_step": 149509, "epoch": 3559} {"train_loss": -6.856783866882324, "global_step": 149510, "epoch": 3559} {"train_loss": -6.947674751281738, "global_step": 149511, "epoch": 3559} {"train_loss": -6.7844953536987305, "global_step": 149512, "epoch": 3559} {"train_loss": -6.8014326095581055, "global_step": 149513, "epoch": 3559} {"train_loss": -6.84381103515625, "global_step": 149514, "epoch": 3559} {"train_loss": -6.79909610748291, "global_step": 149515, "epoch": 3559} {"train_loss": -6.835505485534668, "global_step": 149516, "epoch": 3559} {"train_loss": -6.798247337341309, "global_step": 149517, "epoch": 3559} {"train_loss": -6.862296104431152, "global_step": 149518, "epoch": 3559} {"train_loss": -6.769569340206328, "global_step": 149519, "epoch": 3559, "val_loss": 68375.3203125} {"train_loss": -6.765570163726807, "global_step": 149520, "epoch": 3560} {"train_loss": -6.938632965087891, "global_step": 149521, "epoch": 3560} {"train_loss": -6.818256378173828, "global_step": 149522, "epoch": 3560} {"train_loss": -6.918856620788574, "global_step": 149523, "epoch": 3560} {"train_loss": -6.881648063659668, "global_step": 149524, "epoch": 3560} {"train_loss": -6.736882209777832, "global_step": 149525, "epoch": 3560} {"train_loss": -6.90125846862793, "global_step": 149526, "epoch": 3560} {"train_loss": -6.850656509399414, "global_step": 149527, "epoch": 3560} {"train_loss": -6.845853805541992, "global_step": 149528, "epoch": 3560} {"train_loss": -6.898754119873047, "global_step": 149529, "epoch": 3560} {"train_loss": -6.9040374755859375, "global_step": 149530, "epoch": 3560} {"train_loss": -6.849481582641602, "global_step": 149531, "epoch": 3560} {"train_loss": -6.927401065826416, "global_step": 149532, "epoch": 3560} {"train_loss": -6.90778112411499, "global_step": 149533, "epoch": 3560} {"train_loss": -6.825187683105469, "global_step": 149534, "epoch": 3560} {"train_loss": -6.767045974731445, "global_step": 149535, "epoch": 3560} {"train_loss": -6.785020351409912, "global_step": 149536, "epoch": 3560} {"train_loss": -6.815123081207275, "global_step": 149537, "epoch": 3560} {"train_loss": -6.805492401123047, "global_step": 149538, "epoch": 3560} {"train_loss": -6.886656761169434, "global_step": 149539, "epoch": 3560} {"train_loss": -6.899317741394043, "global_step": 149540, "epoch": 3560} {"train_loss": -6.84293270111084, "global_step": 149541, "epoch": 3560} {"train_loss": -6.963634490966797, "global_step": 149542, "epoch": 3560} {"train_loss": -6.849426746368408, "global_step": 149543, "epoch": 3560} {"train_loss": -6.894169807434082, "global_step": 149544, "epoch": 3560} {"train_loss": -6.88276481628418, "global_step": 149545, "epoch": 3560} {"train_loss": -6.854496002197266, "global_step": 149546, "epoch": 3560} {"train_loss": -6.838767051696777, "global_step": 149547, "epoch": 3560} {"train_loss": -6.788631439208984, "global_step": 149548, "epoch": 3560} {"train_loss": -6.780486106872559, "global_step": 149549, "epoch": 3560} {"train_loss": -6.783330917358398, "global_step": 149550, "epoch": 3560} {"train_loss": -6.825868606567383, "global_step": 149551, "epoch": 3560} {"train_loss": -6.677671432495117, "global_step": 149552, "epoch": 3560} {"train_loss": -6.851637840270996, "global_step": 149553, "epoch": 3560} {"train_loss": -6.681431770324707, "global_step": 149554, "epoch": 3560} {"train_loss": -6.734042167663574, "global_step": 149555, "epoch": 3560} {"train_loss": -6.796000957489014, "global_step": 149556, "epoch": 3560} {"train_loss": -6.802952766418457, "global_step": 149557, "epoch": 3560} {"train_loss": -6.733478546142578, "global_step": 149558, "epoch": 3560} {"train_loss": -6.848498344421387, "global_step": 149559, "epoch": 3560} {"train_loss": -6.72367000579834, "global_step": 149560, "epoch": 3560} {"train_loss": -6.8274347214471724, "global_step": 149561, "epoch": 3560, "val_loss": 68262.8125} {"train_loss": -6.833675384521484, "global_step": 149562, "epoch": 3561} {"train_loss": -6.919565200805664, "global_step": 149563, "epoch": 3561} {"train_loss": -6.821271896362305, "global_step": 149564, "epoch": 3561} {"train_loss": -6.860535621643066, "global_step": 149565, "epoch": 3561} {"train_loss": -6.732364654541016, "global_step": 149566, "epoch": 3561} {"train_loss": -6.8365397453308105, "global_step": 149567, "epoch": 3561} {"train_loss": -6.849550247192383, "global_step": 149568, "epoch": 3561} {"train_loss": -6.7996978759765625, "global_step": 149569, "epoch": 3561} {"train_loss": -6.801027297973633, "global_step": 149570, "epoch": 3561} {"train_loss": -6.818959712982178, "global_step": 149571, "epoch": 3561} {"train_loss": -6.766719818115234, "global_step": 149572, "epoch": 3561} {"train_loss": -6.801871299743652, "global_step": 149573, "epoch": 3561} {"train_loss": -6.793894290924072, "global_step": 149574, "epoch": 3561} {"train_loss": -6.80879020690918, "global_step": 149575, "epoch": 3561} {"train_loss": -6.756000995635986, "global_step": 149576, "epoch": 3561} {"train_loss": -6.798855781555176, "global_step": 149577, "epoch": 3561} {"train_loss": -6.893497943878174, "global_step": 149578, "epoch": 3561} {"train_loss": -6.816808700561523, "global_step": 149579, "epoch": 3561} {"train_loss": -6.855273723602295, "global_step": 149580, "epoch": 3561} {"train_loss": -6.7247490882873535, "global_step": 149581, "epoch": 3561} {"train_loss": -6.840993881225586, "global_step": 149582, "epoch": 3561} {"train_loss": -6.866282939910889, "global_step": 149583, "epoch": 3561} {"train_loss": -6.684549331665039, "global_step": 149584, "epoch": 3561} {"train_loss": -6.672133445739746, "global_step": 149585, "epoch": 3561} {"train_loss": -6.689849853515625, "global_step": 149586, "epoch": 3561} {"train_loss": -6.6231536865234375, "global_step": 149587, "epoch": 3561} {"train_loss": -6.765006065368652, "global_step": 149588, "epoch": 3561} {"train_loss": -6.74936580657959, "global_step": 149589, "epoch": 3561} {"train_loss": -6.760587215423584, "global_step": 149590, "epoch": 3561} {"train_loss": -6.704706192016602, "global_step": 149591, "epoch": 3561} {"train_loss": -6.7825140953063965, "global_step": 149592, "epoch": 3561} {"train_loss": -6.730977535247803, "global_step": 149593, "epoch": 3561} {"train_loss": -6.700091361999512, "global_step": 149594, "epoch": 3561} {"train_loss": -6.652655601501465, "global_step": 149595, "epoch": 3561} {"train_loss": -6.729318618774414, "global_step": 149596, "epoch": 3561} {"train_loss": -6.692447662353516, "global_step": 149597, "epoch": 3561} {"train_loss": -6.6485443115234375, "global_step": 149598, "epoch": 3561} {"train_loss": -6.749557018280029, "global_step": 149599, "epoch": 3561} {"train_loss": -6.687793731689453, "global_step": 149600, "epoch": 3561} {"train_loss": -6.700370788574219, "global_step": 149601, "epoch": 3561} {"train_loss": -6.701630115509033, "global_step": 149602, "epoch": 3561} {"train_loss": -6.766462019511631, "global_step": 149603, "epoch": 3561, "val_loss": 68438.1875} {"train_loss": -6.734665870666504, "global_step": 149604, "epoch": 3562} {"train_loss": -6.760532855987549, "global_step": 149605, "epoch": 3562} {"train_loss": -6.729945182800293, "global_step": 149606, "epoch": 3562} {"train_loss": -6.823517322540283, "global_step": 149607, "epoch": 3562} {"train_loss": -6.7001190185546875, "global_step": 149608, "epoch": 3562} {"train_loss": -6.829760551452637, "global_step": 149609, "epoch": 3562} {"train_loss": -6.773327827453613, "global_step": 149610, "epoch": 3562} {"train_loss": -6.833932876586914, "global_step": 149611, "epoch": 3562} {"train_loss": -6.774590492248535, "global_step": 149612, "epoch": 3562} {"train_loss": -6.84305477142334, "global_step": 149613, "epoch": 3562} {"train_loss": -6.806097507476807, "global_step": 149614, "epoch": 3562} {"train_loss": -6.851385593414307, "global_step": 149615, "epoch": 3562} {"train_loss": -6.7723069190979, "global_step": 149616, "epoch": 3562} {"train_loss": -6.720113754272461, "global_step": 149617, "epoch": 3562} {"train_loss": -6.792026996612549, "global_step": 149618, "epoch": 3562} {"train_loss": -6.899005889892578, "global_step": 149619, "epoch": 3562} {"train_loss": -6.74658203125, "global_step": 149620, "epoch": 3562} {"train_loss": -6.842441558837891, "global_step": 149621, "epoch": 3562} {"train_loss": -6.9050164222717285, "global_step": 149622, "epoch": 3562} {"train_loss": -6.881556510925293, "global_step": 149623, "epoch": 3562} {"train_loss": -6.899949073791504, "global_step": 149624, "epoch": 3562} {"train_loss": -6.783854007720947, "global_step": 149625, "epoch": 3562} {"train_loss": -6.737822532653809, "global_step": 149626, "epoch": 3562} {"train_loss": -6.858066082000732, "global_step": 149627, "epoch": 3562} {"train_loss": -6.7511305809021, "global_step": 149628, "epoch": 3562} {"train_loss": -6.873446464538574, "global_step": 149629, "epoch": 3562} {"train_loss": -6.848236083984375, "global_step": 149630, "epoch": 3562} {"train_loss": -6.861625671386719, "global_step": 149631, "epoch": 3562} {"train_loss": -6.887823104858398, "global_step": 149632, "epoch": 3562} {"train_loss": -6.834115505218506, "global_step": 149633, "epoch": 3562} {"train_loss": -6.802303314208984, "global_step": 149634, "epoch": 3562} {"train_loss": -6.809216022491455, "global_step": 149635, "epoch": 3562} {"train_loss": -6.848567962646484, "global_step": 149636, "epoch": 3562} {"train_loss": -6.827455520629883, "global_step": 149637, "epoch": 3562} {"train_loss": -6.841177940368652, "global_step": 149638, "epoch": 3562} {"train_loss": -6.851435661315918, "global_step": 149639, "epoch": 3562} {"train_loss": -6.811368942260742, "global_step": 149640, "epoch": 3562} {"train_loss": -6.900559425354004, "global_step": 149641, "epoch": 3562} {"train_loss": -6.934009075164795, "global_step": 149642, "epoch": 3562} {"train_loss": -6.880621910095215, "global_step": 149643, "epoch": 3562} {"train_loss": -6.872800827026367, "global_step": 149644, "epoch": 3562} {"train_loss": -6.823955535888672, "global_step": 149645, "epoch": 3562, "val_loss": 68299.953125} {"train_loss": -6.9033989906311035, "global_step": 149646, "epoch": 3563} {"train_loss": -6.776582717895508, "global_step": 149647, "epoch": 3563} {"train_loss": -6.799936771392822, "global_step": 149648, "epoch": 3563} {"train_loss": -6.780531883239746, "global_step": 149649, "epoch": 3563} {"train_loss": -6.760343551635742, "global_step": 149650, "epoch": 3563} {"train_loss": -6.791146278381348, "global_step": 149651, "epoch": 3563} {"train_loss": -6.7934417724609375, "global_step": 149652, "epoch": 3563} {"train_loss": -6.684014320373535, "global_step": 149653, "epoch": 3563} {"train_loss": -6.767696380615234, "global_step": 149654, "epoch": 3563} {"train_loss": -6.696732997894287, "global_step": 149655, "epoch": 3563} {"train_loss": -6.75730562210083, "global_step": 149656, "epoch": 3563} {"train_loss": -6.68250846862793, "global_step": 149657, "epoch": 3563} {"train_loss": -6.852900505065918, "global_step": 149658, "epoch": 3563} {"train_loss": -6.851029396057129, "global_step": 149659, "epoch": 3563} {"train_loss": -6.885673522949219, "global_step": 149660, "epoch": 3563} {"train_loss": -6.675817012786865, "global_step": 149661, "epoch": 3563} {"train_loss": -6.832559108734131, "global_step": 149662, "epoch": 3563} {"train_loss": -6.740461349487305, "global_step": 149663, "epoch": 3563} {"train_loss": -6.640501976013184, "global_step": 149664, "epoch": 3563} {"train_loss": -6.750123977661133, "global_step": 149665, "epoch": 3563} {"train_loss": -6.791226863861084, "global_step": 149666, "epoch": 3563} {"train_loss": -6.788175582885742, "global_step": 149667, "epoch": 3563} {"train_loss": -6.737122058868408, "global_step": 149668, "epoch": 3563} {"train_loss": -6.674187660217285, "global_step": 149669, "epoch": 3563} {"train_loss": -6.667922019958496, "global_step": 149670, "epoch": 3563} {"train_loss": -6.883724689483643, "global_step": 149671, "epoch": 3563} {"train_loss": -6.759350776672363, "global_step": 149672, "epoch": 3563} {"train_loss": -6.7198333740234375, "global_step": 149673, "epoch": 3563} {"train_loss": -6.741917610168457, "global_step": 149674, "epoch": 3563} {"train_loss": -6.764031410217285, "global_step": 149675, "epoch": 3563} {"train_loss": -6.813262939453125, "global_step": 149676, "epoch": 3563} {"train_loss": -6.814536094665527, "global_step": 149677, "epoch": 3563} {"train_loss": -6.762779235839844, "global_step": 149678, "epoch": 3563} {"train_loss": -6.787888526916504, "global_step": 149679, "epoch": 3563} {"train_loss": -6.841031551361084, "global_step": 149680, "epoch": 3563} {"train_loss": -6.74534273147583, "global_step": 149681, "epoch": 3563} {"train_loss": -6.799182415008545, "global_step": 149682, "epoch": 3563} {"train_loss": -6.765645980834961, "global_step": 149683, "epoch": 3563} {"train_loss": -6.699737548828125, "global_step": 149684, "epoch": 3563} {"train_loss": -6.749934673309326, "global_step": 149685, "epoch": 3563} {"train_loss": -6.763566017150879, "global_step": 149686, "epoch": 3563} {"train_loss": -6.7686520758129305, "global_step": 149687, "epoch": 3563, "val_loss": 68540.9375} {"train_loss": -6.789177894592285, "global_step": 149688, "epoch": 3564} {"train_loss": -6.799535751342773, "global_step": 149689, "epoch": 3564} {"train_loss": -6.805599212646484, "global_step": 149690, "epoch": 3564} {"train_loss": -6.844718933105469, "global_step": 149691, "epoch": 3564} {"train_loss": -6.809642314910889, "global_step": 149692, "epoch": 3564} {"train_loss": -6.697022914886475, "global_step": 149693, "epoch": 3564} {"train_loss": -6.868691444396973, "global_step": 149694, "epoch": 3564} {"train_loss": -6.7586493492126465, "global_step": 149695, "epoch": 3564} {"train_loss": -6.8726959228515625, "global_step": 149696, "epoch": 3564} {"train_loss": -6.773481845855713, "global_step": 149697, "epoch": 3564} {"train_loss": -6.814481735229492, "global_step": 149698, "epoch": 3564} {"train_loss": -6.791585445404053, "global_step": 149699, "epoch": 3564} {"train_loss": -6.83104133605957, "global_step": 149700, "epoch": 3564} {"train_loss": -6.789237976074219, "global_step": 149701, "epoch": 3564} {"train_loss": -6.893847942352295, "global_step": 149702, "epoch": 3564} {"train_loss": -6.700138092041016, "global_step": 149703, "epoch": 3564} {"train_loss": -6.848596572875977, "global_step": 149704, "epoch": 3564} {"train_loss": -6.835762023925781, "global_step": 149705, "epoch": 3564} {"train_loss": -6.714284896850586, "global_step": 149706, "epoch": 3564} {"train_loss": -6.848176956176758, "global_step": 149707, "epoch": 3564} {"train_loss": -6.783082008361816, "global_step": 149708, "epoch": 3564} {"train_loss": -6.78865385055542, "global_step": 149709, "epoch": 3564} {"train_loss": -6.7253570556640625, "global_step": 149710, "epoch": 3564} {"train_loss": -6.719281196594238, "global_step": 149711, "epoch": 3564} {"train_loss": -6.808722019195557, "global_step": 149712, "epoch": 3564} {"train_loss": -6.698927879333496, "global_step": 149713, "epoch": 3564} {"train_loss": -6.858076095581055, "global_step": 149714, "epoch": 3564} {"train_loss": -6.6310529708862305, "global_step": 149715, "epoch": 3564} {"train_loss": -6.654910087585449, "global_step": 149716, "epoch": 3564} {"train_loss": -6.741665840148926, "global_step": 149717, "epoch": 3564} {"train_loss": -6.848985195159912, "global_step": 149718, "epoch": 3564} {"train_loss": -6.766863822937012, "global_step": 149719, "epoch": 3564} {"train_loss": -6.718868255615234, "global_step": 149720, "epoch": 3564} {"train_loss": -6.794193267822266, "global_step": 149721, "epoch": 3564} {"train_loss": -6.796489715576172, "global_step": 149722, "epoch": 3564} {"train_loss": -6.779379844665527, "global_step": 149723, "epoch": 3564} {"train_loss": -6.702769756317139, "global_step": 149724, "epoch": 3564} {"train_loss": -6.788698196411133, "global_step": 149725, "epoch": 3564} {"train_loss": -6.736809253692627, "global_step": 149726, "epoch": 3564} {"train_loss": -6.780086517333984, "global_step": 149727, "epoch": 3564} {"train_loss": -6.8483476638793945, "global_step": 149728, "epoch": 3564} {"train_loss": -6.783878689720517, "global_step": 149729, "epoch": 3564, "val_loss": 68595.3828125} {"train_loss": -6.763389587402344, "global_step": 149730, "epoch": 3565} {"train_loss": -6.812263488769531, "global_step": 149731, "epoch": 3565} {"train_loss": -6.776021480560303, "global_step": 149732, "epoch": 3565} {"train_loss": -6.785506248474121, "global_step": 149733, "epoch": 3565} {"train_loss": -6.748476028442383, "global_step": 149734, "epoch": 3565} {"train_loss": -6.909921169281006, "global_step": 149735, "epoch": 3565} {"train_loss": -6.805394172668457, "global_step": 149736, "epoch": 3565} {"train_loss": -6.8092145919799805, "global_step": 149737, "epoch": 3565} {"train_loss": -6.77971076965332, "global_step": 149738, "epoch": 3565} {"train_loss": -6.819770812988281, "global_step": 149739, "epoch": 3565} {"train_loss": -6.802707195281982, "global_step": 149740, "epoch": 3565} {"train_loss": -6.837460517883301, "global_step": 149741, "epoch": 3565} {"train_loss": -6.8187408447265625, "global_step": 149742, "epoch": 3565} {"train_loss": -6.821362018585205, "global_step": 149743, "epoch": 3565} {"train_loss": -6.85209321975708, "global_step": 149744, "epoch": 3565} {"train_loss": -6.791902542114258, "global_step": 149745, "epoch": 3565} {"train_loss": -6.866545677185059, "global_step": 149746, "epoch": 3565} {"train_loss": -6.923469066619873, "global_step": 149747, "epoch": 3565} {"train_loss": -6.8023505210876465, "global_step": 149748, "epoch": 3565} {"train_loss": -6.76859712600708, "global_step": 149749, "epoch": 3565} {"train_loss": -6.780398368835449, "global_step": 149750, "epoch": 3565} {"train_loss": -6.844642162322998, "global_step": 149751, "epoch": 3565} {"train_loss": -6.826857566833496, "global_step": 149752, "epoch": 3565} {"train_loss": -6.767364025115967, "global_step": 149753, "epoch": 3565} {"train_loss": -6.741551876068115, "global_step": 149754, "epoch": 3565} {"train_loss": -6.763402938842773, "global_step": 149755, "epoch": 3565} {"train_loss": -6.841240882873535, "global_step": 149756, "epoch": 3565} {"train_loss": -6.829041481018066, "global_step": 149757, "epoch": 3565} {"train_loss": -6.828508377075195, "global_step": 149758, "epoch": 3565} {"train_loss": -6.885336875915527, "global_step": 149759, "epoch": 3565} {"train_loss": -6.817206859588623, "global_step": 149760, "epoch": 3565} {"train_loss": -6.769072532653809, "global_step": 149761, "epoch": 3565} {"train_loss": -6.797050476074219, "global_step": 149762, "epoch": 3565} {"train_loss": -6.8656158447265625, "global_step": 149763, "epoch": 3565} {"train_loss": -6.744287967681885, "global_step": 149764, "epoch": 3565} {"train_loss": -6.7386322021484375, "global_step": 149765, "epoch": 3565} {"train_loss": -6.769979476928711, "global_step": 149766, "epoch": 3565} {"train_loss": -6.7717719078063965, "global_step": 149767, "epoch": 3565} {"train_loss": -6.736629486083984, "global_step": 149768, "epoch": 3565} {"train_loss": -6.8579301834106445, "global_step": 149769, "epoch": 3565} {"train_loss": -6.803208351135254, "global_step": 149770, "epoch": 3565} {"train_loss": -6.809034551892962, "global_step": 149771, "epoch": 3565, "val_loss": 68561.484375} {"train_loss": -6.797013282775879, "global_step": 149772, "epoch": 3566} {"train_loss": -6.731635093688965, "global_step": 149773, "epoch": 3566} {"train_loss": -6.769015312194824, "global_step": 149774, "epoch": 3566} {"train_loss": -6.695520877838135, "global_step": 149775, "epoch": 3566} {"train_loss": -6.75862455368042, "global_step": 149776, "epoch": 3566} {"train_loss": -6.638031959533691, "global_step": 149777, "epoch": 3566} {"train_loss": -6.767183303833008, "global_step": 149778, "epoch": 3566} {"train_loss": -6.752205848693848, "global_step": 149779, "epoch": 3566} {"train_loss": -6.751579284667969, "global_step": 149780, "epoch": 3566} {"train_loss": -6.843079566955566, "global_step": 149781, "epoch": 3566} {"train_loss": -6.751400947570801, "global_step": 149782, "epoch": 3566} {"train_loss": -6.774659633636475, "global_step": 149783, "epoch": 3566} {"train_loss": -6.85051965713501, "global_step": 149784, "epoch": 3566} {"train_loss": -6.767492294311523, "global_step": 149785, "epoch": 3566} {"train_loss": -6.8573994636535645, "global_step": 149786, "epoch": 3566} {"train_loss": -6.764001846313477, "global_step": 149787, "epoch": 3566} {"train_loss": -6.836203575134277, "global_step": 149788, "epoch": 3566} {"train_loss": -6.8549299240112305, "global_step": 149789, "epoch": 3566} {"train_loss": -6.838788986206055, "global_step": 149790, "epoch": 3566} {"train_loss": -6.757810592651367, "global_step": 149791, "epoch": 3566} {"train_loss": -6.613516330718994, "global_step": 149792, "epoch": 3566} {"train_loss": -6.862502574920654, "global_step": 149793, "epoch": 3566} {"train_loss": -6.803853511810303, "global_step": 149794, "epoch": 3566} {"train_loss": -6.83519172668457, "global_step": 149795, "epoch": 3566} {"train_loss": -6.810232639312744, "global_step": 149796, "epoch": 3566} {"train_loss": -6.834468841552734, "global_step": 149797, "epoch": 3566} {"train_loss": -6.871931552886963, "global_step": 149798, "epoch": 3566} {"train_loss": -6.8096923828125, "global_step": 149799, "epoch": 3566} {"train_loss": -6.779008865356445, "global_step": 149800, "epoch": 3566} {"train_loss": -6.834883689880371, "global_step": 149801, "epoch": 3566} {"train_loss": -6.837887763977051, "global_step": 149802, "epoch": 3566} {"train_loss": -6.7579755783081055, "global_step": 149803, "epoch": 3566} {"train_loss": -6.847404956817627, "global_step": 149804, "epoch": 3566} {"train_loss": -6.916505336761475, "global_step": 149805, "epoch": 3566} {"train_loss": -6.7999420166015625, "global_step": 149806, "epoch": 3566} {"train_loss": -6.762917518615723, "global_step": 149807, "epoch": 3566} {"train_loss": -6.7176618576049805, "global_step": 149808, "epoch": 3566} {"train_loss": -6.780515670776367, "global_step": 149809, "epoch": 3566} {"train_loss": -6.784792900085449, "global_step": 149810, "epoch": 3566} {"train_loss": -6.839230537414551, "global_step": 149811, "epoch": 3566} {"train_loss": -6.917889595031738, "global_step": 149812, "epoch": 3566} {"train_loss": -6.796293383552914, "global_step": 149813, "epoch": 3566, "val_loss": 68433.9140625} {"train_loss": -6.781590461730957, "global_step": 149814, "epoch": 3567} {"train_loss": -6.849729537963867, "global_step": 149815, "epoch": 3567} {"train_loss": -6.8769211769104, "global_step": 149816, "epoch": 3567} {"train_loss": -6.855843544006348, "global_step": 149817, "epoch": 3567} {"train_loss": -6.876584053039551, "global_step": 149818, "epoch": 3567} {"train_loss": -6.8080902099609375, "global_step": 149819, "epoch": 3567} {"train_loss": -6.8011369705200195, "global_step": 149820, "epoch": 3567} {"train_loss": -6.782670021057129, "global_step": 149821, "epoch": 3567} {"train_loss": -6.8552751541137695, "global_step": 149822, "epoch": 3567} {"train_loss": -6.881200790405273, "global_step": 149823, "epoch": 3567} {"train_loss": -6.7038116455078125, "global_step": 149824, "epoch": 3567} {"train_loss": -6.756735801696777, "global_step": 149825, "epoch": 3567} {"train_loss": -6.905592918395996, "global_step": 149826, "epoch": 3567} {"train_loss": -6.865330219268799, "global_step": 149827, "epoch": 3567} {"train_loss": -6.90792989730835, "global_step": 149828, "epoch": 3567} {"train_loss": -6.896943092346191, "global_step": 149829, "epoch": 3567} {"train_loss": -6.92326545715332, "global_step": 149830, "epoch": 3567} {"train_loss": -6.942653179168701, "global_step": 149831, "epoch": 3567} {"train_loss": -6.824153423309326, "global_step": 149832, "epoch": 3567} {"train_loss": -6.937147617340088, "global_step": 149833, "epoch": 3567} {"train_loss": -6.927581787109375, "global_step": 149834, "epoch": 3567} {"train_loss": -6.8425493240356445, "global_step": 149835, "epoch": 3567} {"train_loss": -6.96993350982666, "global_step": 149836, "epoch": 3567} {"train_loss": -6.830864906311035, "global_step": 149837, "epoch": 3567} {"train_loss": -6.911711692810059, "global_step": 149838, "epoch": 3567} {"train_loss": -6.745428085327148, "global_step": 149839, "epoch": 3567} {"train_loss": -6.943717956542969, "global_step": 149840, "epoch": 3567} {"train_loss": -6.939257621765137, "global_step": 149841, "epoch": 3567} {"train_loss": -6.865769386291504, "global_step": 149842, "epoch": 3567} {"train_loss": -6.891714572906494, "global_step": 149843, "epoch": 3567} {"train_loss": -6.925729274749756, "global_step": 149844, "epoch": 3567} {"train_loss": -6.84774112701416, "global_step": 149845, "epoch": 3567} {"train_loss": -6.861954689025879, "global_step": 149846, "epoch": 3567} {"train_loss": -6.785515785217285, "global_step": 149847, "epoch": 3567} {"train_loss": -6.800994396209717, "global_step": 149848, "epoch": 3567} {"train_loss": -6.970457077026367, "global_step": 149849, "epoch": 3567} {"train_loss": -6.788139820098877, "global_step": 149850, "epoch": 3567} {"train_loss": -6.831920146942139, "global_step": 149851, "epoch": 3567} {"train_loss": -6.784646511077881, "global_step": 149852, "epoch": 3567} {"train_loss": -6.8264923095703125, "global_step": 149853, "epoch": 3567} {"train_loss": -6.875515460968018, "global_step": 149854, "epoch": 3567} {"train_loss": -6.860135929925101, "global_step": 149855, "epoch": 3567, "val_loss": 68345.40625} {"train_loss": -6.754292011260986, "global_step": 149856, "epoch": 3568} {"train_loss": -6.7837629318237305, "global_step": 149857, "epoch": 3568} {"train_loss": -6.911382675170898, "global_step": 149858, "epoch": 3568} {"train_loss": -6.7443647384643555, "global_step": 149859, "epoch": 3568} {"train_loss": -6.752956390380859, "global_step": 149860, "epoch": 3568} {"train_loss": -6.934186935424805, "global_step": 149861, "epoch": 3568} {"train_loss": -6.797528266906738, "global_step": 149862, "epoch": 3568} {"train_loss": -6.790702819824219, "global_step": 149863, "epoch": 3568} {"train_loss": -6.829193592071533, "global_step": 149864, "epoch": 3568} {"train_loss": -6.761970520019531, "global_step": 149865, "epoch": 3568} {"train_loss": -6.854307174682617, "global_step": 149866, "epoch": 3568} {"train_loss": -6.872287750244141, "global_step": 149867, "epoch": 3568} {"train_loss": -6.760881423950195, "global_step": 149868, "epoch": 3568} {"train_loss": -6.805826663970947, "global_step": 149869, "epoch": 3568} {"train_loss": -6.927848815917969, "global_step": 149870, "epoch": 3568} {"train_loss": -6.837765693664551, "global_step": 149871, "epoch": 3568} {"train_loss": -6.854091167449951, "global_step": 149872, "epoch": 3568} {"train_loss": -6.797806739807129, "global_step": 149873, "epoch": 3568} {"train_loss": -6.774700164794922, "global_step": 149874, "epoch": 3568} {"train_loss": -6.697910308837891, "global_step": 149875, "epoch": 3568} {"train_loss": -6.779197692871094, "global_step": 149876, "epoch": 3568} {"train_loss": -6.820557594299316, "global_step": 149877, "epoch": 3568} {"train_loss": -6.748695373535156, "global_step": 149878, "epoch": 3568} {"train_loss": -6.666040420532227, "global_step": 149879, "epoch": 3568} {"train_loss": -6.786954879760742, "global_step": 149880, "epoch": 3568} {"train_loss": -6.713062286376953, "global_step": 149881, "epoch": 3568} {"train_loss": -6.615294933319092, "global_step": 149882, "epoch": 3568} {"train_loss": -6.921588897705078, "global_step": 149883, "epoch": 3568} {"train_loss": -6.70347785949707, "global_step": 149884, "epoch": 3568} {"train_loss": -6.719206809997559, "global_step": 149885, "epoch": 3568} {"train_loss": -6.717375755310059, "global_step": 149886, "epoch": 3568} {"train_loss": -6.75499153137207, "global_step": 149887, "epoch": 3568} {"train_loss": -6.751940727233887, "global_step": 149888, "epoch": 3568} {"train_loss": -6.737977504730225, "global_step": 149889, "epoch": 3568} {"train_loss": -6.762082099914551, "global_step": 149890, "epoch": 3568} {"train_loss": -6.772487640380859, "global_step": 149891, "epoch": 3568} {"train_loss": -6.692461967468262, "global_step": 149892, "epoch": 3568} {"train_loss": -6.817601203918457, "global_step": 149893, "epoch": 3568} {"train_loss": -6.8455705642700195, "global_step": 149894, "epoch": 3568} {"train_loss": -6.828683853149414, "global_step": 149895, "epoch": 3568} {"train_loss": -6.7865471839904785, "global_step": 149896, "epoch": 3568} {"train_loss": -6.785627705710275, "global_step": 149897, "epoch": 3568, "val_loss": 68410.578125} {"train_loss": -6.757786273956299, "global_step": 149898, "epoch": 3569} {"train_loss": -6.791111946105957, "global_step": 149899, "epoch": 3569} {"train_loss": -6.812392711639404, "global_step": 149900, "epoch": 3569} {"train_loss": -6.816925048828125, "global_step": 149901, "epoch": 3569} {"train_loss": -6.857852935791016, "global_step": 149902, "epoch": 3569} {"train_loss": -6.923422813415527, "global_step": 149903, "epoch": 3569} {"train_loss": -6.707000732421875, "global_step": 149904, "epoch": 3569} {"train_loss": -6.766834259033203, "global_step": 149905, "epoch": 3569} {"train_loss": -6.819902420043945, "global_step": 149906, "epoch": 3569} {"train_loss": -6.786924362182617, "global_step": 149907, "epoch": 3569} {"train_loss": -6.696558952331543, "global_step": 149908, "epoch": 3569} {"train_loss": -6.8030500411987305, "global_step": 149909, "epoch": 3569} {"train_loss": -6.623969078063965, "global_step": 149910, "epoch": 3569} {"train_loss": -6.871528625488281, "global_step": 149911, "epoch": 3569} {"train_loss": -6.725523471832275, "global_step": 149912, "epoch": 3569} {"train_loss": -6.708476543426514, "global_step": 149913, "epoch": 3569} {"train_loss": -6.741316795349121, "global_step": 149914, "epoch": 3569} {"train_loss": -6.72275447845459, "global_step": 149915, "epoch": 3569} {"train_loss": -6.7446489334106445, "global_step": 149916, "epoch": 3569} {"train_loss": -6.70850944519043, "global_step": 149917, "epoch": 3569} {"train_loss": -6.8617095947265625, "global_step": 149918, "epoch": 3569} {"train_loss": -6.724562644958496, "global_step": 149919, "epoch": 3569} {"train_loss": -6.720678329467773, "global_step": 149920, "epoch": 3569} {"train_loss": -6.745945930480957, "global_step": 149921, "epoch": 3569} {"train_loss": -6.787763595581055, "global_step": 149922, "epoch": 3569} {"train_loss": -6.909523010253906, "global_step": 149923, "epoch": 3569} {"train_loss": -6.775060653686523, "global_step": 149924, "epoch": 3569} {"train_loss": -6.719186782836914, "global_step": 149925, "epoch": 3569} {"train_loss": -6.838726043701172, "global_step": 149926, "epoch": 3569} {"train_loss": -6.680192947387695, "global_step": 149927, "epoch": 3569} {"train_loss": -6.86083459854126, "global_step": 149928, "epoch": 3569} {"train_loss": -6.6854753494262695, "global_step": 149929, "epoch": 3569} {"train_loss": -6.795873641967773, "global_step": 149930, "epoch": 3569} {"train_loss": -6.7478790283203125, "global_step": 149931, "epoch": 3569} {"train_loss": -6.823166847229004, "global_step": 149932, "epoch": 3569} {"train_loss": -6.87266731262207, "global_step": 149933, "epoch": 3569} {"train_loss": -6.7397613525390625, "global_step": 149934, "epoch": 3569} {"train_loss": -6.803162574768066, "global_step": 149935, "epoch": 3569} {"train_loss": -6.827866077423096, "global_step": 149936, "epoch": 3569} {"train_loss": -6.926301002502441, "global_step": 149937, "epoch": 3569} {"train_loss": -6.850649833679199, "global_step": 149938, "epoch": 3569} {"train_loss": -6.784128143673851, "global_step": 149939, "epoch": 3569, "val_loss": 68656.03125} {"train_loss": -6.916195869445801, "global_step": 149940, "epoch": 3570} {"train_loss": -6.75964879989624, "global_step": 149941, "epoch": 3570} {"train_loss": -6.926321029663086, "global_step": 149942, "epoch": 3570} {"train_loss": -6.80936861038208, "global_step": 149943, "epoch": 3570} {"train_loss": -6.750326633453369, "global_step": 149944, "epoch": 3570} {"train_loss": -7.0013427734375, "global_step": 149945, "epoch": 3570} {"train_loss": -6.841994285583496, "global_step": 149946, "epoch": 3570} {"train_loss": -6.799776554107666, "global_step": 149947, "epoch": 3570} {"train_loss": -6.8498735427856445, "global_step": 149948, "epoch": 3570} {"train_loss": -6.829277992248535, "global_step": 149949, "epoch": 3570} {"train_loss": -6.823180198669434, "global_step": 149950, "epoch": 3570} {"train_loss": -6.7922515869140625, "global_step": 149951, "epoch": 3570} {"train_loss": -6.827490329742432, "global_step": 149952, "epoch": 3570} {"train_loss": -6.871415138244629, "global_step": 149953, "epoch": 3570} {"train_loss": -6.822893142700195, "global_step": 149954, "epoch": 3570} {"train_loss": -6.80743408203125, "global_step": 149955, "epoch": 3570} {"train_loss": -6.854013442993164, "global_step": 149956, "epoch": 3570} {"train_loss": -6.943687438964844, "global_step": 149957, "epoch": 3570} {"train_loss": -6.806631088256836, "global_step": 149958, "epoch": 3570} {"train_loss": -6.867084503173828, "global_step": 149959, "epoch": 3570} {"train_loss": -6.837845802307129, "global_step": 149960, "epoch": 3570} {"train_loss": -6.814742565155029, "global_step": 149961, "epoch": 3570} {"train_loss": -6.826842308044434, "global_step": 149962, "epoch": 3570} {"train_loss": -6.834671974182129, "global_step": 149963, "epoch": 3570} {"train_loss": -7.001980304718018, "global_step": 149964, "epoch": 3570} {"train_loss": -6.886685848236084, "global_step": 149965, "epoch": 3570} {"train_loss": -6.948113918304443, "global_step": 149966, "epoch": 3570} {"train_loss": -6.823562145233154, "global_step": 149967, "epoch": 3570} {"train_loss": -6.835925579071045, "global_step": 149968, "epoch": 3570} {"train_loss": -6.801303386688232, "global_step": 149969, "epoch": 3570} {"train_loss": -6.910378456115723, "global_step": 149970, "epoch": 3570} {"train_loss": -6.877194404602051, "global_step": 149971, "epoch": 3570} {"train_loss": -6.828587055206299, "global_step": 149972, "epoch": 3570} {"train_loss": -6.815308570861816, "global_step": 149973, "epoch": 3570} {"train_loss": -6.864168643951416, "global_step": 149974, "epoch": 3570} {"train_loss": -6.988530158996582, "global_step": 149975, "epoch": 3570} {"train_loss": -6.883688449859619, "global_step": 149976, "epoch": 3570} {"train_loss": -6.730996131896973, "global_step": 149977, "epoch": 3570} {"train_loss": -6.80567741394043, "global_step": 149978, "epoch": 3570} {"train_loss": -6.809789657592773, "global_step": 149979, "epoch": 3570} {"train_loss": -6.870519638061523, "global_step": 149980, "epoch": 3570} {"train_loss": -6.849344730377197, "global_step": 149981, "epoch": 3570, "val_loss": 68349.6875} {"train_loss": -6.776039123535156, "global_step": 149982, "epoch": 3571} {"train_loss": -6.81526517868042, "global_step": 149983, "epoch": 3571} {"train_loss": -6.788664817810059, "global_step": 149984, "epoch": 3571} {"train_loss": -6.740656852722168, "global_step": 149985, "epoch": 3571} {"train_loss": -6.897493839263916, "global_step": 149986, "epoch": 3571} {"train_loss": -6.873371124267578, "global_step": 149987, "epoch": 3571} {"train_loss": -6.819300174713135, "global_step": 149988, "epoch": 3571} {"train_loss": -6.766534328460693, "global_step": 149989, "epoch": 3571} {"train_loss": -6.863164901733398, "global_step": 149990, "epoch": 3571} {"train_loss": -6.70317268371582, "global_step": 149991, "epoch": 3571} {"train_loss": -6.845812797546387, "global_step": 149992, "epoch": 3571} {"train_loss": -6.864266395568848, "global_step": 149993, "epoch": 3571} {"train_loss": -6.7505292892456055, "global_step": 149994, "epoch": 3571} {"train_loss": -6.772224426269531, "global_step": 149995, "epoch": 3571} {"train_loss": -6.819109916687012, "global_step": 149996, "epoch": 3571} {"train_loss": -6.767496585845947, "global_step": 149997, "epoch": 3571} {"train_loss": -6.901116371154785, "global_step": 149998, "epoch": 3571} {"train_loss": -6.808363437652588, "global_step": 149999, "epoch": 3571} {"train_loss": -6.841217041015625, "global_step": 150000, "epoch": 3571} {"train_loss": -6.7744245529174805, "global_step": 150001, "epoch": 3571} {"train_loss": -6.693633556365967, "global_step": 150002, "epoch": 3571} {"train_loss": -6.846310615539551, "global_step": 150003, "epoch": 3571} {"train_loss": -6.7789506912231445, "global_step": 150004, "epoch": 3571} {"train_loss": -6.733821392059326, "global_step": 150005, "epoch": 3571} {"train_loss": -6.780345439910889, "global_step": 150006, "epoch": 3571} {"train_loss": -6.882138252258301, "global_step": 150007, "epoch": 3571} {"train_loss": -6.735459327697754, "global_step": 150008, "epoch": 3571} {"train_loss": -6.908042907714844, "global_step": 150009, "epoch": 3571} {"train_loss": -6.770971298217773, "global_step": 150010, "epoch": 3571} {"train_loss": -6.783402919769287, "global_step": 150011, "epoch": 3571} {"train_loss": -6.790036678314209, "global_step": 150012, "epoch": 3571} {"train_loss": -6.793795585632324, "global_step": 150013, "epoch": 3571} {"train_loss": -6.726230621337891, "global_step": 150014, "epoch": 3571} {"train_loss": -6.795815467834473, "global_step": 150015, "epoch": 3571} {"train_loss": -6.64115047454834, "global_step": 150016, "epoch": 3571} {"train_loss": -6.723657131195068, "global_step": 150017, "epoch": 3571} {"train_loss": -6.568481922149658, "global_step": 150018, "epoch": 3571} {"train_loss": -6.683610439300537, "global_step": 150019, "epoch": 3571} {"train_loss": -6.657871723175049, "global_step": 150020, "epoch": 3571} {"train_loss": -6.443042755126953, "global_step": 150021, "epoch": 3571} {"train_loss": -6.789751052856445, "global_step": 150022, "epoch": 3571} {"train_loss": -6.766643285751343, "global_step": 150023, "epoch": 3571, "val_loss": 68510.1953125} {"train_loss": -6.706359386444092, "global_step": 150024, "epoch": 3572} {"train_loss": -6.717157363891602, "global_step": 150025, "epoch": 3572} {"train_loss": -6.628478527069092, "global_step": 150026, "epoch": 3572} {"train_loss": -6.738197326660156, "global_step": 150027, "epoch": 3572} {"train_loss": -6.759156227111816, "global_step": 150028, "epoch": 3572} {"train_loss": -6.750412464141846, "global_step": 150029, "epoch": 3572} {"train_loss": -6.720479965209961, "global_step": 150030, "epoch": 3572} {"train_loss": -6.708673000335693, "global_step": 150031, "epoch": 3572} {"train_loss": -6.829672813415527, "global_step": 150032, "epoch": 3572} {"train_loss": -6.836141586303711, "global_step": 150033, "epoch": 3572} {"train_loss": -6.81696891784668, "global_step": 150034, "epoch": 3572} {"train_loss": -6.69655704498291, "global_step": 150035, "epoch": 3572} {"train_loss": -6.786404609680176, "global_step": 150036, "epoch": 3572} {"train_loss": -6.735884666442871, "global_step": 150037, "epoch": 3572} {"train_loss": -6.799140453338623, "global_step": 150038, "epoch": 3572} {"train_loss": -6.877674102783203, "global_step": 150039, "epoch": 3572} {"train_loss": -6.805566310882568, "global_step": 150040, "epoch": 3572} {"train_loss": -6.755786418914795, "global_step": 150041, "epoch": 3572} {"train_loss": -6.788918972015381, "global_step": 150042, "epoch": 3572} {"train_loss": -6.82960319519043, "global_step": 150043, "epoch": 3572} {"train_loss": -6.834505081176758, "global_step": 150044, "epoch": 3572} {"train_loss": -6.77677059173584, "global_step": 150045, "epoch": 3572} {"train_loss": -6.826013565063477, "global_step": 150046, "epoch": 3572} {"train_loss": -6.815517902374268, "global_step": 150047, "epoch": 3572} {"train_loss": -6.985889434814453, "global_step": 150048, "epoch": 3572} {"train_loss": -6.764833450317383, "global_step": 150049, "epoch": 3572} {"train_loss": -6.716718673706055, "global_step": 150050, "epoch": 3572} {"train_loss": -6.854525566101074, "global_step": 150051, "epoch": 3572} {"train_loss": -6.897000312805176, "global_step": 150052, "epoch": 3572} {"train_loss": -6.811312675476074, "global_step": 150053, "epoch": 3572} {"train_loss": -6.86099910736084, "global_step": 150054, "epoch": 3572} {"train_loss": -6.9415998458862305, "global_step": 150055, "epoch": 3572} {"train_loss": -6.787459373474121, "global_step": 150056, "epoch": 3572} {"train_loss": -6.898435592651367, "global_step": 150057, "epoch": 3572} {"train_loss": -6.916766166687012, "global_step": 150058, "epoch": 3572} {"train_loss": -6.800128936767578, "global_step": 150059, "epoch": 3572} {"train_loss": -6.759983062744141, "global_step": 150060, "epoch": 3572} {"train_loss": -6.988704204559326, "global_step": 150061, "epoch": 3572} {"train_loss": -6.82927131652832, "global_step": 150062, "epoch": 3572} {"train_loss": -6.820309638977051, "global_step": 150063, "epoch": 3572} {"train_loss": -6.91895866394043, "global_step": 150064, "epoch": 3572} {"train_loss": -6.807499669847035, "global_step": 150065, "epoch": 3572, "val_loss": 68387.4921875} {"train_loss": -6.965076446533203, "global_step": 150066, "epoch": 3573} {"train_loss": -6.90728235244751, "global_step": 150067, "epoch": 3573} {"train_loss": -6.780245304107666, "global_step": 150068, "epoch": 3573} {"train_loss": -6.833430290222168, "global_step": 150069, "epoch": 3573} {"train_loss": -6.811643600463867, "global_step": 150070, "epoch": 3573} {"train_loss": -6.8411545753479, "global_step": 150071, "epoch": 3573} {"train_loss": -6.727719306945801, "global_step": 150072, "epoch": 3573} {"train_loss": -6.790304183959961, "global_step": 150073, "epoch": 3573} {"train_loss": -6.666390419006348, "global_step": 150074, "epoch": 3573} {"train_loss": -6.792896270751953, "global_step": 150075, "epoch": 3573} {"train_loss": -6.717618942260742, "global_step": 150076, "epoch": 3573} {"train_loss": -6.90584659576416, "global_step": 150077, "epoch": 3573} {"train_loss": -6.842534065246582, "global_step": 150078, "epoch": 3573} {"train_loss": -6.934699058532715, "global_step": 150079, "epoch": 3573} {"train_loss": -6.869765281677246, "global_step": 150080, "epoch": 3573} {"train_loss": -6.822076797485352, "global_step": 150081, "epoch": 3573} {"train_loss": -6.818435192108154, "global_step": 150082, "epoch": 3573} {"train_loss": -6.71460485458374, "global_step": 150083, "epoch": 3573} {"train_loss": -6.797183990478516, "global_step": 150084, "epoch": 3573} {"train_loss": -6.797098636627197, "global_step": 150085, "epoch": 3573} {"train_loss": -6.7543511390686035, "global_step": 150086, "epoch": 3573} {"train_loss": -6.789282321929932, "global_step": 150087, "epoch": 3573} {"train_loss": -6.755863189697266, "global_step": 150088, "epoch": 3573} {"train_loss": -6.820632457733154, "global_step": 150089, "epoch": 3573} {"train_loss": -6.757109642028809, "global_step": 150090, "epoch": 3573} {"train_loss": -6.809581756591797, "global_step": 150091, "epoch": 3573} {"train_loss": -6.823915481567383, "global_step": 150092, "epoch": 3573} {"train_loss": -6.832223892211914, "global_step": 150093, "epoch": 3573} {"train_loss": -6.805713176727295, "global_step": 150094, "epoch": 3573} {"train_loss": -6.801044464111328, "global_step": 150095, "epoch": 3573} {"train_loss": -6.768891334533691, "global_step": 150096, "epoch": 3573} {"train_loss": -6.838543891906738, "global_step": 150097, "epoch": 3573} {"train_loss": -6.856813430786133, "global_step": 150098, "epoch": 3573} {"train_loss": -6.686134338378906, "global_step": 150099, "epoch": 3573} {"train_loss": -6.87753963470459, "global_step": 150100, "epoch": 3573} {"train_loss": -6.807502269744873, "global_step": 150101, "epoch": 3573} {"train_loss": -6.769317626953125, "global_step": 150102, "epoch": 3573} {"train_loss": -6.852267265319824, "global_step": 150103, "epoch": 3573} {"train_loss": -6.7674689292907715, "global_step": 150104, "epoch": 3573} {"train_loss": -6.758014678955078, "global_step": 150105, "epoch": 3573} {"train_loss": -6.820592403411865, "global_step": 150106, "epoch": 3573} {"train_loss": -6.8098315965561635, "global_step": 150107, "epoch": 3573, "val_loss": 68312.609375} {"train_loss": -6.937966823577881, "global_step": 150108, "epoch": 3574} {"train_loss": -6.921060085296631, "global_step": 150109, "epoch": 3574} {"train_loss": -6.894077301025391, "global_step": 150110, "epoch": 3574} {"train_loss": -6.814052581787109, "global_step": 150111, "epoch": 3574} {"train_loss": -6.933643817901611, "global_step": 150112, "epoch": 3574} {"train_loss": -6.84272575378418, "global_step": 150113, "epoch": 3574} {"train_loss": -6.692572593688965, "global_step": 150114, "epoch": 3574} {"train_loss": -6.898073196411133, "global_step": 150115, "epoch": 3574} {"train_loss": -6.872318267822266, "global_step": 150116, "epoch": 3574} {"train_loss": -6.612722873687744, "global_step": 150117, "epoch": 3574} {"train_loss": -6.7049665451049805, "global_step": 150118, "epoch": 3574} {"train_loss": -6.6955671310424805, "global_step": 150119, "epoch": 3574} {"train_loss": -6.814982891082764, "global_step": 150120, "epoch": 3574} {"train_loss": -6.781035423278809, "global_step": 150121, "epoch": 3574} {"train_loss": -6.684842109680176, "global_step": 150122, "epoch": 3574} {"train_loss": -6.678262233734131, "global_step": 150123, "epoch": 3574} {"train_loss": -6.635350227355957, "global_step": 150124, "epoch": 3574} {"train_loss": -6.68435001373291, "global_step": 150125, "epoch": 3574} {"train_loss": -6.721980094909668, "global_step": 150126, "epoch": 3574} {"train_loss": -6.656095504760742, "global_step": 150127, "epoch": 3574} {"train_loss": -6.750572204589844, "global_step": 150128, "epoch": 3574} {"train_loss": -6.79880952835083, "global_step": 150129, "epoch": 3574} {"train_loss": -6.708639621734619, "global_step": 150130, "epoch": 3574} {"train_loss": -6.769620895385742, "global_step": 150131, "epoch": 3574} {"train_loss": -6.686922550201416, "global_step": 150132, "epoch": 3574} {"train_loss": -6.7966413497924805, "global_step": 150133, "epoch": 3574} {"train_loss": -6.8798112869262695, "global_step": 150134, "epoch": 3574} {"train_loss": -6.804751396179199, "global_step": 150135, "epoch": 3574} {"train_loss": -6.869734764099121, "global_step": 150136, "epoch": 3574} {"train_loss": -6.818758487701416, "global_step": 150137, "epoch": 3574} {"train_loss": -6.783895015716553, "global_step": 150138, "epoch": 3574} {"train_loss": -6.714581489562988, "global_step": 150139, "epoch": 3574} {"train_loss": -6.766493320465088, "global_step": 150140, "epoch": 3574} {"train_loss": -6.823927879333496, "global_step": 150141, "epoch": 3574} {"train_loss": -6.776459693908691, "global_step": 150142, "epoch": 3574} {"train_loss": -6.81187629699707, "global_step": 150143, "epoch": 3574} {"train_loss": -6.811841011047363, "global_step": 150144, "epoch": 3574} {"train_loss": -6.850533485412598, "global_step": 150145, "epoch": 3574} {"train_loss": -6.7646918296813965, "global_step": 150146, "epoch": 3574} {"train_loss": -6.830352306365967, "global_step": 150147, "epoch": 3574} {"train_loss": -6.678796291351318, "global_step": 150148, "epoch": 3574} {"train_loss": -6.780880087897891, "global_step": 150149, "epoch": 3574, "val_loss": 68552.234375} {"train_loss": -6.82745361328125, "global_step": 150150, "epoch": 3575} {"train_loss": -6.846534729003906, "global_step": 150151, "epoch": 3575} {"train_loss": -6.8680219650268555, "global_step": 150152, "epoch": 3575} {"train_loss": -6.827288627624512, "global_step": 150153, "epoch": 3575} {"train_loss": -6.886904239654541, "global_step": 150154, "epoch": 3575} {"train_loss": -6.847957611083984, "global_step": 150155, "epoch": 3575} {"train_loss": -6.816898345947266, "global_step": 150156, "epoch": 3575} {"train_loss": -6.849633693695068, "global_step": 150157, "epoch": 3575} {"train_loss": -6.795448303222656, "global_step": 150158, "epoch": 3575} {"train_loss": -6.901228427886963, "global_step": 150159, "epoch": 3575} {"train_loss": -6.847224235534668, "global_step": 150160, "epoch": 3575} {"train_loss": -6.750830173492432, "global_step": 150161, "epoch": 3575} {"train_loss": -6.868471622467041, "global_step": 150162, "epoch": 3575} {"train_loss": -6.8664727210998535, "global_step": 150163, "epoch": 3575} {"train_loss": -6.7285966873168945, "global_step": 150164, "epoch": 3575} {"train_loss": -6.839458465576172, "global_step": 150165, "epoch": 3575} {"train_loss": -6.785483360290527, "global_step": 150166, "epoch": 3575} {"train_loss": -6.693810939788818, "global_step": 150167, "epoch": 3575} {"train_loss": -6.872826099395752, "global_step": 150168, "epoch": 3575} {"train_loss": -6.750208854675293, "global_step": 150169, "epoch": 3575} {"train_loss": -6.778833389282227, "global_step": 150170, "epoch": 3575} {"train_loss": -6.815887451171875, "global_step": 150171, "epoch": 3575} {"train_loss": -6.703271865844727, "global_step": 150172, "epoch": 3575} {"train_loss": -6.759087562561035, "global_step": 150173, "epoch": 3575} {"train_loss": -6.703129768371582, "global_step": 150174, "epoch": 3575} {"train_loss": -6.866511821746826, "global_step": 150175, "epoch": 3575} {"train_loss": -6.842632293701172, "global_step": 150176, "epoch": 3575} {"train_loss": -6.787207126617432, "global_step": 150177, "epoch": 3575} {"train_loss": -6.761085033416748, "global_step": 150178, "epoch": 3575} {"train_loss": -6.872533321380615, "global_step": 150179, "epoch": 3575} {"train_loss": -6.6823296546936035, "global_step": 150180, "epoch": 3575} {"train_loss": -6.831995964050293, "global_step": 150181, "epoch": 3575} {"train_loss": -6.905289649963379, "global_step": 150182, "epoch": 3575} {"train_loss": -6.795098781585693, "global_step": 150183, "epoch": 3575} {"train_loss": -6.754644393920898, "global_step": 150184, "epoch": 3575} {"train_loss": -6.753261089324951, "global_step": 150185, "epoch": 3575} {"train_loss": -6.823313236236572, "global_step": 150186, "epoch": 3575} {"train_loss": -6.761009216308594, "global_step": 150187, "epoch": 3575} {"train_loss": -6.868326187133789, "global_step": 150188, "epoch": 3575} {"train_loss": -6.834892749786377, "global_step": 150189, "epoch": 3575} {"train_loss": -6.972896575927734, "global_step": 150190, "epoch": 3575} {"train_loss": -6.814844210942586, "global_step": 150191, "epoch": 3575, "val_loss": 68379.8671875} {"train_loss": -6.877321720123291, "global_step": 150192, "epoch": 3576} {"train_loss": -6.872947692871094, "global_step": 150193, "epoch": 3576} {"train_loss": -6.888449668884277, "global_step": 150194, "epoch": 3576} {"train_loss": -6.861839294433594, "global_step": 150195, "epoch": 3576} {"train_loss": -6.859472274780273, "global_step": 150196, "epoch": 3576} {"train_loss": -6.870061874389648, "global_step": 150197, "epoch": 3576} {"train_loss": -6.881684303283691, "global_step": 150198, "epoch": 3576} {"train_loss": -6.855330944061279, "global_step": 150199, "epoch": 3576} {"train_loss": -6.867905139923096, "global_step": 150200, "epoch": 3576} {"train_loss": -6.912412643432617, "global_step": 150201, "epoch": 3576} {"train_loss": -6.788995265960693, "global_step": 150202, "epoch": 3576} {"train_loss": -6.876175880432129, "global_step": 150203, "epoch": 3576} {"train_loss": -6.908321380615234, "global_step": 150204, "epoch": 3576} {"train_loss": -6.94135856628418, "global_step": 150205, "epoch": 3576} {"train_loss": -6.90574836730957, "global_step": 150206, "epoch": 3576} {"train_loss": -6.903321266174316, "global_step": 150207, "epoch": 3576} {"train_loss": -6.87205696105957, "global_step": 150208, "epoch": 3576} {"train_loss": -6.843630790710449, "global_step": 150209, "epoch": 3576} {"train_loss": -6.995448112487793, "global_step": 150210, "epoch": 3576} {"train_loss": -6.825111389160156, "global_step": 150211, "epoch": 3576} {"train_loss": -6.847141742706299, "global_step": 150212, "epoch": 3576} {"train_loss": -6.768733024597168, "global_step": 150213, "epoch": 3576} {"train_loss": -6.800420761108398, "global_step": 150214, "epoch": 3576} {"train_loss": -6.819530487060547, "global_step": 150215, "epoch": 3576} {"train_loss": -6.728131294250488, "global_step": 150216, "epoch": 3576} {"train_loss": -6.79065465927124, "global_step": 150217, "epoch": 3576} {"train_loss": -6.746129035949707, "global_step": 150218, "epoch": 3576} {"train_loss": -6.705395221710205, "global_step": 150219, "epoch": 3576} {"train_loss": -6.689262390136719, "global_step": 150220, "epoch": 3576} {"train_loss": -6.764697074890137, "global_step": 150221, "epoch": 3576} {"train_loss": -6.763611793518066, "global_step": 150222, "epoch": 3576} {"train_loss": -6.717439651489258, "global_step": 150223, "epoch": 3576} {"train_loss": -6.921962738037109, "global_step": 150224, "epoch": 3576} {"train_loss": -6.785621643066406, "global_step": 150225, "epoch": 3576} {"train_loss": -6.597426891326904, "global_step": 150226, "epoch": 3576} {"train_loss": -6.7841339111328125, "global_step": 150227, "epoch": 3576} {"train_loss": -6.683164596557617, "global_step": 150228, "epoch": 3576} {"train_loss": -6.755737781524658, "global_step": 150229, "epoch": 3576} {"train_loss": -6.779608726501465, "global_step": 150230, "epoch": 3576} {"train_loss": -6.742034435272217, "global_step": 150231, "epoch": 3576} {"train_loss": -6.752292156219482, "global_step": 150232, "epoch": 3576} {"train_loss": -6.8148161343165805, "global_step": 150233, "epoch": 3576, "val_loss": 68504.1015625} {"train_loss": -6.758131980895996, "global_step": 150234, "epoch": 3577} {"train_loss": -6.757999897003174, "global_step": 150235, "epoch": 3577} {"train_loss": -6.799433708190918, "global_step": 150236, "epoch": 3577} {"train_loss": -6.705706596374512, "global_step": 150237, "epoch": 3577} {"train_loss": -6.875382423400879, "global_step": 150238, "epoch": 3577} {"train_loss": -6.781489372253418, "global_step": 150239, "epoch": 3577} {"train_loss": -6.707266330718994, "global_step": 150240, "epoch": 3577} {"train_loss": -6.7306084632873535, "global_step": 150241, "epoch": 3577} {"train_loss": -6.768275260925293, "global_step": 150242, "epoch": 3577} {"train_loss": -6.817811012268066, "global_step": 150243, "epoch": 3577} {"train_loss": -6.80780553817749, "global_step": 150244, "epoch": 3577} {"train_loss": -6.726029396057129, "global_step": 150245, "epoch": 3577} {"train_loss": -6.753967761993408, "global_step": 150246, "epoch": 3577} {"train_loss": -6.7595624923706055, "global_step": 150247, "epoch": 3577} {"train_loss": -6.834850311279297, "global_step": 150248, "epoch": 3577} {"train_loss": -6.754486083984375, "global_step": 150249, "epoch": 3577} {"train_loss": -6.813703536987305, "global_step": 150250, "epoch": 3577} {"train_loss": -6.731714725494385, "global_step": 150251, "epoch": 3577} {"train_loss": -6.8524274826049805, "global_step": 150252, "epoch": 3577} {"train_loss": -6.645596504211426, "global_step": 150253, "epoch": 3577} {"train_loss": -6.771451950073242, "global_step": 150254, "epoch": 3577} {"train_loss": -6.777240753173828, "global_step": 150255, "epoch": 3577} {"train_loss": -6.794424057006836, "global_step": 150256, "epoch": 3577} {"train_loss": -6.846004486083984, "global_step": 150257, "epoch": 3577} {"train_loss": -6.689225673675537, "global_step": 150258, "epoch": 3577} {"train_loss": -6.6980085372924805, "global_step": 150259, "epoch": 3577} {"train_loss": -6.772008895874023, "global_step": 150260, "epoch": 3577} {"train_loss": -6.673078536987305, "global_step": 150261, "epoch": 3577} {"train_loss": -6.812921524047852, "global_step": 150262, "epoch": 3577} {"train_loss": -6.6829681396484375, "global_step": 150263, "epoch": 3577} {"train_loss": -6.67978572845459, "global_step": 150264, "epoch": 3577} {"train_loss": -6.845342636108398, "global_step": 150265, "epoch": 3577} {"train_loss": -6.624614715576172, "global_step": 150266, "epoch": 3577} {"train_loss": -6.842046737670898, "global_step": 150267, "epoch": 3577} {"train_loss": -6.691328525543213, "global_step": 150268, "epoch": 3577} {"train_loss": -6.759815216064453, "global_step": 150269, "epoch": 3577} {"train_loss": -6.807704925537109, "global_step": 150270, "epoch": 3577} {"train_loss": -6.720992088317871, "global_step": 150271, "epoch": 3577} {"train_loss": -6.801820755004883, "global_step": 150272, "epoch": 3577} {"train_loss": -6.838793754577637, "global_step": 150273, "epoch": 3577} {"train_loss": -6.734668731689453, "global_step": 150274, "epoch": 3577} {"train_loss": -6.763755151203701, "global_step": 150275, "epoch": 3577, "val_loss": 68511.234375} {"train_loss": -6.781488418579102, "global_step": 150276, "epoch": 3578} {"train_loss": -6.862792491912842, "global_step": 150277, "epoch": 3578} {"train_loss": -6.77311897277832, "global_step": 150278, "epoch": 3578} {"train_loss": -6.830557823181152, "global_step": 150279, "epoch": 3578} {"train_loss": -6.910737037658691, "global_step": 150280, "epoch": 3578} {"train_loss": -6.846719741821289, "global_step": 150281, "epoch": 3578} {"train_loss": -6.864764213562012, "global_step": 150282, "epoch": 3578} {"train_loss": -6.908838272094727, "global_step": 150283, "epoch": 3578} {"train_loss": -6.784100532531738, "global_step": 150284, "epoch": 3578} {"train_loss": -6.796008110046387, "global_step": 150285, "epoch": 3578} {"train_loss": -6.820004940032959, "global_step": 150286, "epoch": 3578} {"train_loss": -6.86136531829834, "global_step": 150287, "epoch": 3578} {"train_loss": -6.8881659507751465, "global_step": 150288, "epoch": 3578} {"train_loss": -6.790701866149902, "global_step": 150289, "epoch": 3578} {"train_loss": -6.772600173950195, "global_step": 150290, "epoch": 3578} {"train_loss": -6.824481964111328, "global_step": 150291, "epoch": 3578} {"train_loss": -6.906721115112305, "global_step": 150292, "epoch": 3578} {"train_loss": -6.946056365966797, "global_step": 150293, "epoch": 3578} {"train_loss": -6.845298767089844, "global_step": 150294, "epoch": 3578} {"train_loss": -6.803525924682617, "global_step": 150295, "epoch": 3578} {"train_loss": -6.714526176452637, "global_step": 150296, "epoch": 3578} {"train_loss": -6.745852470397949, "global_step": 150297, "epoch": 3578} {"train_loss": -6.909263610839844, "global_step": 150298, "epoch": 3578} {"train_loss": -6.687697410583496, "global_step": 150299, "epoch": 3578} {"train_loss": -6.742493152618408, "global_step": 150300, "epoch": 3578} {"train_loss": -6.798670768737793, "global_step": 150301, "epoch": 3578} {"train_loss": -6.710938453674316, "global_step": 150302, "epoch": 3578} {"train_loss": -6.800172805786133, "global_step": 150303, "epoch": 3578} {"train_loss": -6.89137077331543, "global_step": 150304, "epoch": 3578} {"train_loss": -6.755959510803223, "global_step": 150305, "epoch": 3578} {"train_loss": -6.786718368530273, "global_step": 150306, "epoch": 3578} {"train_loss": -6.73531436920166, "global_step": 150307, "epoch": 3578} {"train_loss": -6.652701377868652, "global_step": 150308, "epoch": 3578} {"train_loss": -6.76730489730835, "global_step": 150309, "epoch": 3578} {"train_loss": -6.756847858428955, "global_step": 150310, "epoch": 3578} {"train_loss": -6.791522026062012, "global_step": 150311, "epoch": 3578} {"train_loss": -6.738909721374512, "global_step": 150312, "epoch": 3578} {"train_loss": -6.649712562561035, "global_step": 150313, "epoch": 3578} {"train_loss": -6.823520660400391, "global_step": 150314, "epoch": 3578} {"train_loss": -6.715311050415039, "global_step": 150315, "epoch": 3578} {"train_loss": -6.6727728843688965, "global_step": 150316, "epoch": 3578} {"train_loss": -6.795771689642043, "global_step": 150317, "epoch": 3578, "val_loss": 68515.609375} {"train_loss": -6.820929527282715, "global_step": 150318, "epoch": 3579} {"train_loss": -6.743758201599121, "global_step": 150319, "epoch": 3579} {"train_loss": -6.780653953552246, "global_step": 150320, "epoch": 3579} {"train_loss": -6.800755500793457, "global_step": 150321, "epoch": 3579} {"train_loss": -6.714115142822266, "global_step": 150322, "epoch": 3579} {"train_loss": -6.704292297363281, "global_step": 150323, "epoch": 3579} {"train_loss": -6.809413909912109, "global_step": 150324, "epoch": 3579} {"train_loss": -6.652680397033691, "global_step": 150325, "epoch": 3579} {"train_loss": -6.874956130981445, "global_step": 150326, "epoch": 3579} {"train_loss": -6.666840553283691, "global_step": 150327, "epoch": 3579} {"train_loss": -6.708083152770996, "global_step": 150328, "epoch": 3579} {"train_loss": -6.706527233123779, "global_step": 150329, "epoch": 3579} {"train_loss": -6.782186508178711, "global_step": 150330, "epoch": 3579} {"train_loss": -6.744448661804199, "global_step": 150331, "epoch": 3579} {"train_loss": -6.860162734985352, "global_step": 150332, "epoch": 3579} {"train_loss": -6.90228271484375, "global_step": 150333, "epoch": 3579} {"train_loss": -6.816793918609619, "global_step": 150334, "epoch": 3579} {"train_loss": -6.934647560119629, "global_step": 150335, "epoch": 3579} {"train_loss": -6.864933490753174, "global_step": 150336, "epoch": 3579} {"train_loss": -6.772212028503418, "global_step": 150337, "epoch": 3579} {"train_loss": -6.817045211791992, "global_step": 150338, "epoch": 3579} {"train_loss": -6.853567123413086, "global_step": 150339, "epoch": 3579} {"train_loss": -6.933265686035156, "global_step": 150340, "epoch": 3579} {"train_loss": -6.875430107116699, "global_step": 150341, "epoch": 3579} {"train_loss": -6.822158336639404, "global_step": 150342, "epoch": 3579} {"train_loss": -6.862366676330566, "global_step": 150343, "epoch": 3579} {"train_loss": -6.888352870941162, "global_step": 150344, "epoch": 3579} {"train_loss": -6.854194641113281, "global_step": 150345, "epoch": 3579} {"train_loss": -6.776440620422363, "global_step": 150346, "epoch": 3579} {"train_loss": -6.845149993896484, "global_step": 150347, "epoch": 3579} {"train_loss": -6.824069499969482, "global_step": 150348, "epoch": 3579} {"train_loss": -6.950011730194092, "global_step": 150349, "epoch": 3579} {"train_loss": -6.9477033615112305, "global_step": 150350, "epoch": 3579} {"train_loss": -6.721320152282715, "global_step": 150351, "epoch": 3579} {"train_loss": -6.741605758666992, "global_step": 150352, "epoch": 3579} {"train_loss": -6.928615570068359, "global_step": 150353, "epoch": 3579} {"train_loss": -6.900662422180176, "global_step": 150354, "epoch": 3579} {"train_loss": -6.832034111022949, "global_step": 150355, "epoch": 3579} {"train_loss": -6.820158958435059, "global_step": 150356, "epoch": 3579} {"train_loss": -6.776553630828857, "global_step": 150357, "epoch": 3579} {"train_loss": -6.880010604858398, "global_step": 150358, "epoch": 3579} {"train_loss": -6.814474877857027, "global_step": 150359, "epoch": 3579, "val_loss": 68476.75} {"train_loss": -6.702054500579834, "global_step": 150360, "epoch": 3580} {"train_loss": -6.871369361877441, "global_step": 150361, "epoch": 3580} {"train_loss": -6.975077152252197, "global_step": 150362, "epoch": 3580} {"train_loss": -6.807573318481445, "global_step": 150363, "epoch": 3580} {"train_loss": -6.7876129150390625, "global_step": 150364, "epoch": 3580} {"train_loss": -6.8779520988464355, "global_step": 150365, "epoch": 3580} {"train_loss": -6.8934221267700195, "global_step": 150366, "epoch": 3580} {"train_loss": -6.843376636505127, "global_step": 150367, "epoch": 3580} {"train_loss": -6.871748924255371, "global_step": 150368, "epoch": 3580} {"train_loss": -6.799075126647949, "global_step": 150369, "epoch": 3580} {"train_loss": -6.838739395141602, "global_step": 150370, "epoch": 3580} {"train_loss": -6.798519611358643, "global_step": 150371, "epoch": 3580} {"train_loss": -6.930527210235596, "global_step": 150372, "epoch": 3580} {"train_loss": -6.978216171264648, "global_step": 150373, "epoch": 3580} {"train_loss": -6.958660125732422, "global_step": 150374, "epoch": 3580} {"train_loss": -6.794927597045898, "global_step": 150375, "epoch": 3580} {"train_loss": -6.912773132324219, "global_step": 150376, "epoch": 3580} {"train_loss": -6.822124481201172, "global_step": 150377, "epoch": 3580} {"train_loss": -6.788260459899902, "global_step": 150378, "epoch": 3580} {"train_loss": -6.910002708435059, "global_step": 150379, "epoch": 3580} {"train_loss": -6.730320930480957, "global_step": 150380, "epoch": 3580} {"train_loss": -6.739630699157715, "global_step": 150381, "epoch": 3580} {"train_loss": -6.7948503494262695, "global_step": 150382, "epoch": 3580} {"train_loss": -6.862898826599121, "global_step": 150383, "epoch": 3580} {"train_loss": -6.82282018661499, "global_step": 150384, "epoch": 3580} {"train_loss": -6.857326030731201, "global_step": 150385, "epoch": 3580} {"train_loss": -6.873685359954834, "global_step": 150386, "epoch": 3580} {"train_loss": -6.8809814453125, "global_step": 150387, "epoch": 3580} {"train_loss": -6.849182605743408, "global_step": 150388, "epoch": 3580} {"train_loss": -6.803264141082764, "global_step": 150389, "epoch": 3580} {"train_loss": -6.719202995300293, "global_step": 150390, "epoch": 3580} {"train_loss": -6.831210136413574, "global_step": 150391, "epoch": 3580} {"train_loss": -6.825995922088623, "global_step": 150392, "epoch": 3580} {"train_loss": -6.743327617645264, "global_step": 150393, "epoch": 3580} {"train_loss": -6.874347686767578, "global_step": 150394, "epoch": 3580} {"train_loss": -6.917337894439697, "global_step": 150395, "epoch": 3580} {"train_loss": -6.9270453453063965, "global_step": 150396, "epoch": 3580} {"train_loss": -6.8572492599487305, "global_step": 150397, "epoch": 3580} {"train_loss": -6.89009428024292, "global_step": 150398, "epoch": 3580} {"train_loss": -6.951440811157227, "global_step": 150399, "epoch": 3580} {"train_loss": -6.91452693939209, "global_step": 150400, "epoch": 3580} {"train_loss": -6.851915189198086, "global_step": 150401, "epoch": 3580, "val_loss": 68492.9375} {"train_loss": -6.781553268432617, "global_step": 150402, "epoch": 3581} {"train_loss": -6.801828384399414, "global_step": 150403, "epoch": 3581} {"train_loss": -6.893726825714111, "global_step": 150404, "epoch": 3581} {"train_loss": -6.9034104347229, "global_step": 150405, "epoch": 3581} {"train_loss": -6.805468559265137, "global_step": 150406, "epoch": 3581} {"train_loss": -6.925684452056885, "global_step": 150407, "epoch": 3581} {"train_loss": -6.851005554199219, "global_step": 150408, "epoch": 3581} {"train_loss": -6.8443403244018555, "global_step": 150409, "epoch": 3581} {"train_loss": -6.820691108703613, "global_step": 150410, "epoch": 3581} {"train_loss": -6.897459506988525, "global_step": 150411, "epoch": 3581} {"train_loss": -6.700747489929199, "global_step": 150412, "epoch": 3581} {"train_loss": -6.810702323913574, "global_step": 150413, "epoch": 3581} {"train_loss": -6.723291397094727, "global_step": 150414, "epoch": 3581} {"train_loss": -6.6948394775390625, "global_step": 150415, "epoch": 3581} {"train_loss": -6.938261032104492, "global_step": 150416, "epoch": 3581} {"train_loss": -6.788403034210205, "global_step": 150417, "epoch": 3581} {"train_loss": -6.763933181762695, "global_step": 150418, "epoch": 3581} {"train_loss": -6.753984451293945, "global_step": 150419, "epoch": 3581} {"train_loss": -6.788177490234375, "global_step": 150420, "epoch": 3581} {"train_loss": -6.833984851837158, "global_step": 150421, "epoch": 3581} {"train_loss": -6.68842887878418, "global_step": 150422, "epoch": 3581} {"train_loss": -6.791109085083008, "global_step": 150423, "epoch": 3581} {"train_loss": -6.903350353240967, "global_step": 150424, "epoch": 3581} {"train_loss": -6.971811294555664, "global_step": 150425, "epoch": 3581} {"train_loss": -6.869898319244385, "global_step": 150426, "epoch": 3581} {"train_loss": -6.87091064453125, "global_step": 150427, "epoch": 3581} {"train_loss": -6.788744926452637, "global_step": 150428, "epoch": 3581} {"train_loss": -6.832700729370117, "global_step": 150429, "epoch": 3581} {"train_loss": -6.886347770690918, "global_step": 150430, "epoch": 3581} {"train_loss": -6.895904541015625, "global_step": 150431, "epoch": 3581} {"train_loss": -6.7491655349731445, "global_step": 150432, "epoch": 3581} {"train_loss": -6.854008674621582, "global_step": 150433, "epoch": 3581} {"train_loss": -6.745881080627441, "global_step": 150434, "epoch": 3581} {"train_loss": -6.772675514221191, "global_step": 150435, "epoch": 3581} {"train_loss": -6.773746490478516, "global_step": 150436, "epoch": 3581} {"train_loss": -6.834980010986328, "global_step": 150437, "epoch": 3581} {"train_loss": -6.800647735595703, "global_step": 150438, "epoch": 3581} {"train_loss": -6.763691425323486, "global_step": 150439, "epoch": 3581} {"train_loss": -6.818300247192383, "global_step": 150440, "epoch": 3581} {"train_loss": -6.797711372375488, "global_step": 150441, "epoch": 3581} {"train_loss": -6.831427574157715, "global_step": 150442, "epoch": 3581} {"train_loss": -6.81660735039484, "global_step": 150443, "epoch": 3581, "val_loss": 68303.2421875} {"train_loss": -6.861010551452637, "global_step": 150444, "epoch": 3582} {"train_loss": -6.8844499588012695, "global_step": 150445, "epoch": 3582} {"train_loss": -6.863391876220703, "global_step": 150446, "epoch": 3582} {"train_loss": -6.839850425720215, "global_step": 150447, "epoch": 3582} {"train_loss": -6.936346054077148, "global_step": 150448, "epoch": 3582} {"train_loss": -6.787623405456543, "global_step": 150449, "epoch": 3582} {"train_loss": -6.893795967102051, "global_step": 150450, "epoch": 3582} {"train_loss": -6.808826923370361, "global_step": 150451, "epoch": 3582} {"train_loss": -6.927838325500488, "global_step": 150452, "epoch": 3582} {"train_loss": -6.904391288757324, "global_step": 150453, "epoch": 3582} {"train_loss": -6.861713409423828, "global_step": 150454, "epoch": 3582} {"train_loss": -6.771368026733398, "global_step": 150455, "epoch": 3582} {"train_loss": -6.894147872924805, "global_step": 150456, "epoch": 3582} {"train_loss": -6.839603424072266, "global_step": 150457, "epoch": 3582} {"train_loss": -6.787314414978027, "global_step": 150458, "epoch": 3582} {"train_loss": -6.626378059387207, "global_step": 150459, "epoch": 3582} {"train_loss": -6.614553451538086, "global_step": 150460, "epoch": 3582} {"train_loss": -6.8004841804504395, "global_step": 150461, "epoch": 3582} {"train_loss": -6.727799892425537, "global_step": 150462, "epoch": 3582} {"train_loss": -6.763120651245117, "global_step": 150463, "epoch": 3582} {"train_loss": -6.856711387634277, "global_step": 150464, "epoch": 3582} {"train_loss": -6.8186235427856445, "global_step": 150465, "epoch": 3582} {"train_loss": -6.788708209991455, "global_step": 150466, "epoch": 3582} {"train_loss": -6.770289421081543, "global_step": 150467, "epoch": 3582} {"train_loss": -6.721135139465332, "global_step": 150468, "epoch": 3582} {"train_loss": -6.807859420776367, "global_step": 150469, "epoch": 3582} {"train_loss": -6.649542331695557, "global_step": 150470, "epoch": 3582} {"train_loss": -6.873092174530029, "global_step": 150471, "epoch": 3582} {"train_loss": -6.793583869934082, "global_step": 150472, "epoch": 3582} {"train_loss": -6.789540767669678, "global_step": 150473, "epoch": 3582} {"train_loss": -6.933886528015137, "global_step": 150474, "epoch": 3582} {"train_loss": -6.77942419052124, "global_step": 150475, "epoch": 3582} {"train_loss": -6.724093437194824, "global_step": 150476, "epoch": 3582} {"train_loss": -6.828625679016113, "global_step": 150477, "epoch": 3582} {"train_loss": -6.757748603820801, "global_step": 150478, "epoch": 3582} {"train_loss": -6.833322048187256, "global_step": 150479, "epoch": 3582} {"train_loss": -6.896729946136475, "global_step": 150480, "epoch": 3582} {"train_loss": -6.931928634643555, "global_step": 150481, "epoch": 3582} {"train_loss": -6.79576301574707, "global_step": 150482, "epoch": 3582} {"train_loss": -6.849177360534668, "global_step": 150483, "epoch": 3582} {"train_loss": -6.732550621032715, "global_step": 150484, "epoch": 3582} {"train_loss": -6.813196420669556, "global_step": 150485, "epoch": 3582, "val_loss": 68851.8359375} {"train_loss": -6.664375305175781, "global_step": 150486, "epoch": 3583} {"train_loss": -6.933013916015625, "global_step": 150487, "epoch": 3583} {"train_loss": -6.734902858734131, "global_step": 150488, "epoch": 3583} {"train_loss": -6.708277702331543, "global_step": 150489, "epoch": 3583} {"train_loss": -6.787806034088135, "global_step": 150490, "epoch": 3583} {"train_loss": -6.824773788452148, "global_step": 150491, "epoch": 3583} {"train_loss": -6.762683868408203, "global_step": 150492, "epoch": 3583} {"train_loss": -6.772062301635742, "global_step": 150493, "epoch": 3583} {"train_loss": -6.849006652832031, "global_step": 150494, "epoch": 3583} {"train_loss": -6.6947922706604, "global_step": 150495, "epoch": 3583} {"train_loss": -6.824186325073242, "global_step": 150496, "epoch": 3583} {"train_loss": -6.801460266113281, "global_step": 150497, "epoch": 3583} {"train_loss": -6.7686967849731445, "global_step": 150498, "epoch": 3583} {"train_loss": -6.839346885681152, "global_step": 150499, "epoch": 3583} {"train_loss": -6.704631805419922, "global_step": 150500, "epoch": 3583} {"train_loss": -6.822970867156982, "global_step": 150501, "epoch": 3583} {"train_loss": -6.854088306427002, "global_step": 150502, "epoch": 3583} {"train_loss": -6.834428787231445, "global_step": 150503, "epoch": 3583} {"train_loss": -6.73185396194458, "global_step": 150504, "epoch": 3583} {"train_loss": -6.880712509155273, "global_step": 150505, "epoch": 3583} {"train_loss": -6.7298784255981445, "global_step": 150506, "epoch": 3583} {"train_loss": -6.853573799133301, "global_step": 150507, "epoch": 3583} {"train_loss": -6.88155460357666, "global_step": 150508, "epoch": 3583} {"train_loss": -6.788357257843018, "global_step": 150509, "epoch": 3583} {"train_loss": -6.790543556213379, "global_step": 150510, "epoch": 3583} {"train_loss": -6.834658145904541, "global_step": 150511, "epoch": 3583} {"train_loss": -6.724360942840576, "global_step": 150512, "epoch": 3583} {"train_loss": -6.811366081237793, "global_step": 150513, "epoch": 3583} {"train_loss": -6.868788242340088, "global_step": 150514, "epoch": 3583} {"train_loss": -6.77687931060791, "global_step": 150515, "epoch": 3583} {"train_loss": -6.866093635559082, "global_step": 150516, "epoch": 3583} {"train_loss": -6.860219955444336, "global_step": 150517, "epoch": 3583} {"train_loss": -6.7166972160339355, "global_step": 150518, "epoch": 3583} {"train_loss": -6.862923622131348, "global_step": 150519, "epoch": 3583} {"train_loss": -6.934345722198486, "global_step": 150520, "epoch": 3583} {"train_loss": -6.932324409484863, "global_step": 150521, "epoch": 3583} {"train_loss": -6.762740135192871, "global_step": 150522, "epoch": 3583} {"train_loss": -6.8357391357421875, "global_step": 150523, "epoch": 3583} {"train_loss": -6.902884483337402, "global_step": 150524, "epoch": 3583} {"train_loss": -6.79322624206543, "global_step": 150525, "epoch": 3583} {"train_loss": -6.909106731414795, "global_step": 150526, "epoch": 3583} {"train_loss": -6.810548407690866, "global_step": 150527, "epoch": 3583, "val_loss": 68480.90625} {"train_loss": -6.802799224853516, "global_step": 150528, "epoch": 3584} {"train_loss": -6.9508585929870605, "global_step": 150529, "epoch": 3584} {"train_loss": -6.856966018676758, "global_step": 150530, "epoch": 3584} {"train_loss": -6.820697784423828, "global_step": 150531, "epoch": 3584} {"train_loss": -6.847193717956543, "global_step": 150532, "epoch": 3584} {"train_loss": -6.896880626678467, "global_step": 150533, "epoch": 3584} {"train_loss": -6.8034467697143555, "global_step": 150534, "epoch": 3584} {"train_loss": -6.682981491088867, "global_step": 150535, "epoch": 3584} {"train_loss": -6.8359503746032715, "global_step": 150536, "epoch": 3584} {"train_loss": -6.806866645812988, "global_step": 150537, "epoch": 3584} {"train_loss": -6.817098617553711, "global_step": 150538, "epoch": 3584} {"train_loss": -6.770730972290039, "global_step": 150539, "epoch": 3584} {"train_loss": -6.818138122558594, "global_step": 150540, "epoch": 3584} {"train_loss": -6.79124641418457, "global_step": 150541, "epoch": 3584} {"train_loss": -6.8484930992126465, "global_step": 150542, "epoch": 3584} {"train_loss": -6.779589653015137, "global_step": 150543, "epoch": 3584} {"train_loss": -6.945923805236816, "global_step": 150544, "epoch": 3584} {"train_loss": -6.863887786865234, "global_step": 150545, "epoch": 3584} {"train_loss": -6.84688138961792, "global_step": 150546, "epoch": 3584} {"train_loss": -6.893404006958008, "global_step": 150547, "epoch": 3584} {"train_loss": -6.840249538421631, "global_step": 150548, "epoch": 3584} {"train_loss": -6.919677257537842, "global_step": 150549, "epoch": 3584} {"train_loss": -6.8335723876953125, "global_step": 150550, "epoch": 3584} {"train_loss": -7.009611129760742, "global_step": 150551, "epoch": 3584} {"train_loss": -6.828084468841553, "global_step": 150552, "epoch": 3584} {"train_loss": -6.794949531555176, "global_step": 150553, "epoch": 3584} {"train_loss": -6.854928016662598, "global_step": 150554, "epoch": 3584} {"train_loss": -6.861626625061035, "global_step": 150555, "epoch": 3584} {"train_loss": -6.913238525390625, "global_step": 150556, "epoch": 3584} {"train_loss": -6.779720306396484, "global_step": 150557, "epoch": 3584} {"train_loss": -6.735692024230957, "global_step": 150558, "epoch": 3584} {"train_loss": -6.875093460083008, "global_step": 150559, "epoch": 3584} {"train_loss": -6.865093231201172, "global_step": 150560, "epoch": 3584} {"train_loss": -6.7212605476379395, "global_step": 150561, "epoch": 3584} {"train_loss": -6.893260955810547, "global_step": 150562, "epoch": 3584} {"train_loss": -6.744335651397705, "global_step": 150563, "epoch": 3584} {"train_loss": -6.83998966217041, "global_step": 150564, "epoch": 3584} {"train_loss": -6.784472942352295, "global_step": 150565, "epoch": 3584} {"train_loss": -6.854048252105713, "global_step": 150566, "epoch": 3584} {"train_loss": -6.752845764160156, "global_step": 150567, "epoch": 3584} {"train_loss": -6.843184471130371, "global_step": 150568, "epoch": 3584} {"train_loss": -6.834373178936186, "global_step": 150569, "epoch": 3584, "val_loss": 68323.484375} {"train_loss": -6.8493876457214355, "global_step": 150570, "epoch": 3585} {"train_loss": -6.7509613037109375, "global_step": 150571, "epoch": 3585} {"train_loss": -6.797449111938477, "global_step": 150572, "epoch": 3585} {"train_loss": -6.808894157409668, "global_step": 150573, "epoch": 3585} {"train_loss": -6.81979513168335, "global_step": 150574, "epoch": 3585} {"train_loss": -6.880928039550781, "global_step": 150575, "epoch": 3585} {"train_loss": -6.7468366622924805, "global_step": 150576, "epoch": 3585} {"train_loss": -6.822439670562744, "global_step": 150577, "epoch": 3585} {"train_loss": -6.658751487731934, "global_step": 150578, "epoch": 3585} {"train_loss": -6.881525039672852, "global_step": 150579, "epoch": 3585} {"train_loss": -6.763376235961914, "global_step": 150580, "epoch": 3585} {"train_loss": -6.732420444488525, "global_step": 150581, "epoch": 3585} {"train_loss": -6.859661102294922, "global_step": 150582, "epoch": 3585} {"train_loss": -6.766300201416016, "global_step": 150583, "epoch": 3585} {"train_loss": -6.645601272583008, "global_step": 150584, "epoch": 3585} {"train_loss": -6.753170013427734, "global_step": 150585, "epoch": 3585} {"train_loss": -6.646645545959473, "global_step": 150586, "epoch": 3585} {"train_loss": -6.796119689941406, "global_step": 150587, "epoch": 3585} {"train_loss": -6.7274603843688965, "global_step": 150588, "epoch": 3585} {"train_loss": -6.730406284332275, "global_step": 150589, "epoch": 3585} {"train_loss": -6.757952690124512, "global_step": 150590, "epoch": 3585} {"train_loss": -6.753997325897217, "global_step": 150591, "epoch": 3585} {"train_loss": -6.839506149291992, "global_step": 150592, "epoch": 3585} {"train_loss": -6.831109523773193, "global_step": 150593, "epoch": 3585} {"train_loss": -6.962234020233154, "global_step": 150594, "epoch": 3585} {"train_loss": -6.773472785949707, "global_step": 150595, "epoch": 3585} {"train_loss": -6.832547664642334, "global_step": 150596, "epoch": 3585} {"train_loss": -6.7308669090271, "global_step": 150597, "epoch": 3585} {"train_loss": -6.904407501220703, "global_step": 150598, "epoch": 3585} {"train_loss": -6.74553918838501, "global_step": 150599, "epoch": 3585} {"train_loss": -6.823862552642822, "global_step": 150600, "epoch": 3585} {"train_loss": -6.878956317901611, "global_step": 150601, "epoch": 3585} {"train_loss": -6.753271102905273, "global_step": 150602, "epoch": 3585} {"train_loss": -6.831430912017822, "global_step": 150603, "epoch": 3585} {"train_loss": -6.697926044464111, "global_step": 150604, "epoch": 3585} {"train_loss": -6.95145320892334, "global_step": 150605, "epoch": 3585} {"train_loss": -6.737263202667236, "global_step": 150606, "epoch": 3585} {"train_loss": -6.761720657348633, "global_step": 150607, "epoch": 3585} {"train_loss": -6.964740753173828, "global_step": 150608, "epoch": 3585} {"train_loss": -6.781195640563965, "global_step": 150609, "epoch": 3585} {"train_loss": -6.871577262878418, "global_step": 150610, "epoch": 3585} {"train_loss": -6.796927009310041, "global_step": 150611, "epoch": 3585, "val_loss": 68487.671875} {"train_loss": -6.737360954284668, "global_step": 150612, "epoch": 3586} {"train_loss": -6.941234588623047, "global_step": 150613, "epoch": 3586} {"train_loss": -6.806666374206543, "global_step": 150614, "epoch": 3586} {"train_loss": -6.790440559387207, "global_step": 150615, "epoch": 3586} {"train_loss": -6.900943279266357, "global_step": 150616, "epoch": 3586} {"train_loss": -6.8372650146484375, "global_step": 150617, "epoch": 3586} {"train_loss": -6.85209846496582, "global_step": 150618, "epoch": 3586} {"train_loss": -6.669679641723633, "global_step": 150619, "epoch": 3586} {"train_loss": -6.895953178405762, "global_step": 150620, "epoch": 3586} {"train_loss": -6.711690902709961, "global_step": 150621, "epoch": 3586} {"train_loss": -6.753798007965088, "global_step": 150622, "epoch": 3586} {"train_loss": -6.773656845092773, "global_step": 150623, "epoch": 3586} {"train_loss": -6.779470443725586, "global_step": 150624, "epoch": 3586} {"train_loss": -6.805930137634277, "global_step": 150625, "epoch": 3586} {"train_loss": -6.7655181884765625, "global_step": 150626, "epoch": 3586} {"train_loss": -6.795886039733887, "global_step": 150627, "epoch": 3586} {"train_loss": -6.78609561920166, "global_step": 150628, "epoch": 3586} {"train_loss": -6.884385108947754, "global_step": 150629, "epoch": 3586} {"train_loss": -6.885042190551758, "global_step": 150630, "epoch": 3586} {"train_loss": -6.741263389587402, "global_step": 150631, "epoch": 3586} {"train_loss": -6.894747734069824, "global_step": 150632, "epoch": 3586} {"train_loss": -6.880335807800293, "global_step": 150633, "epoch": 3586} {"train_loss": -6.849575996398926, "global_step": 150634, "epoch": 3586} {"train_loss": -6.851866722106934, "global_step": 150635, "epoch": 3586} {"train_loss": -6.817639350891113, "global_step": 150636, "epoch": 3586} {"train_loss": -6.811428070068359, "global_step": 150637, "epoch": 3586} {"train_loss": -6.785545349121094, "global_step": 150638, "epoch": 3586} {"train_loss": -6.869489669799805, "global_step": 150639, "epoch": 3586} {"train_loss": -6.947010040283203, "global_step": 150640, "epoch": 3586} {"train_loss": -6.756586074829102, "global_step": 150641, "epoch": 3586} {"train_loss": -6.8750457763671875, "global_step": 150642, "epoch": 3586} {"train_loss": -6.941996097564697, "global_step": 150643, "epoch": 3586} {"train_loss": -6.981704235076904, "global_step": 150644, "epoch": 3586} {"train_loss": -6.934649467468262, "global_step": 150645, "epoch": 3586} {"train_loss": -6.850894451141357, "global_step": 150646, "epoch": 3586} {"train_loss": -6.822527885437012, "global_step": 150647, "epoch": 3586} {"train_loss": -6.895515441894531, "global_step": 150648, "epoch": 3586} {"train_loss": -6.75570011138916, "global_step": 150649, "epoch": 3586} {"train_loss": -6.916004657745361, "global_step": 150650, "epoch": 3586} {"train_loss": -6.967916965484619, "global_step": 150651, "epoch": 3586} {"train_loss": -6.861910820007324, "global_step": 150652, "epoch": 3586} {"train_loss": -6.842341207322621, "global_step": 150653, "epoch": 3586, "val_loss": 68326.609375} {"train_loss": -6.850337505340576, "global_step": 150654, "epoch": 3587} {"train_loss": -6.98515510559082, "global_step": 150655, "epoch": 3587} {"train_loss": -6.859618186950684, "global_step": 150656, "epoch": 3587} {"train_loss": -6.770544528961182, "global_step": 150657, "epoch": 3587} {"train_loss": -6.9589362144470215, "global_step": 150658, "epoch": 3587} {"train_loss": -6.768489360809326, "global_step": 150659, "epoch": 3587} {"train_loss": -6.842096328735352, "global_step": 150660, "epoch": 3587} {"train_loss": -6.852289199829102, "global_step": 150661, "epoch": 3587} {"train_loss": -6.764832019805908, "global_step": 150662, "epoch": 3587} {"train_loss": -6.849468231201172, "global_step": 150663, "epoch": 3587} {"train_loss": -6.824404716491699, "global_step": 150664, "epoch": 3587} {"train_loss": -6.77445125579834, "global_step": 150665, "epoch": 3587} {"train_loss": -6.7918596267700195, "global_step": 150666, "epoch": 3587} {"train_loss": -6.820796012878418, "global_step": 150667, "epoch": 3587} {"train_loss": -6.927923202514648, "global_step": 150668, "epoch": 3587} {"train_loss": -6.793087005615234, "global_step": 150669, "epoch": 3587} {"train_loss": -6.828526496887207, "global_step": 150670, "epoch": 3587} {"train_loss": -6.850252151489258, "global_step": 150671, "epoch": 3587} {"train_loss": -6.897247314453125, "global_step": 150672, "epoch": 3587} {"train_loss": -6.901727676391602, "global_step": 150673, "epoch": 3587} {"train_loss": -6.8204193115234375, "global_step": 150674, "epoch": 3587} {"train_loss": -6.7685675621032715, "global_step": 150675, "epoch": 3587} {"train_loss": -6.820677757263184, "global_step": 150676, "epoch": 3587} {"train_loss": -6.800863742828369, "global_step": 150677, "epoch": 3587} {"train_loss": -6.827893257141113, "global_step": 150678, "epoch": 3587} {"train_loss": -6.835838794708252, "global_step": 150679, "epoch": 3587} {"train_loss": -6.756093502044678, "global_step": 150680, "epoch": 3587} {"train_loss": -6.831336975097656, "global_step": 150681, "epoch": 3587} {"train_loss": -6.837552070617676, "global_step": 150682, "epoch": 3587} {"train_loss": -6.705875396728516, "global_step": 150683, "epoch": 3587} {"train_loss": -6.735742568969727, "global_step": 150684, "epoch": 3587} {"train_loss": -6.797277450561523, "global_step": 150685, "epoch": 3587} {"train_loss": -6.78566837310791, "global_step": 150686, "epoch": 3587} {"train_loss": -6.73573112487793, "global_step": 150687, "epoch": 3587} {"train_loss": -6.748085975646973, "global_step": 150688, "epoch": 3587} {"train_loss": -6.7884063720703125, "global_step": 150689, "epoch": 3587} {"train_loss": -6.759253025054932, "global_step": 150690, "epoch": 3587} {"train_loss": -6.692298889160156, "global_step": 150691, "epoch": 3587} {"train_loss": -6.778421401977539, "global_step": 150692, "epoch": 3587} {"train_loss": -6.7471795082092285, "global_step": 150693, "epoch": 3587} {"train_loss": -6.803676128387451, "global_step": 150694, "epoch": 3587} {"train_loss": -6.809385152090163, "global_step": 150695, "epoch": 3587, "val_loss": 68396.9453125} {"train_loss": -6.805266857147217, "global_step": 150696, "epoch": 3588} {"train_loss": -6.722240447998047, "global_step": 150697, "epoch": 3588} {"train_loss": -6.840888023376465, "global_step": 150698, "epoch": 3588} {"train_loss": -6.714935779571533, "global_step": 150699, "epoch": 3588} {"train_loss": -6.739782333374023, "global_step": 150700, "epoch": 3588} {"train_loss": -6.642111778259277, "global_step": 150701, "epoch": 3588} {"train_loss": -6.7744879722595215, "global_step": 150702, "epoch": 3588} {"train_loss": -6.42794132232666, "global_step": 150703, "epoch": 3588} {"train_loss": -6.817639350891113, "global_step": 150704, "epoch": 3588} {"train_loss": -6.589109420776367, "global_step": 150705, "epoch": 3588} {"train_loss": -6.751422882080078, "global_step": 150706, "epoch": 3588} {"train_loss": -6.5789594650268555, "global_step": 150707, "epoch": 3588} {"train_loss": -6.7622857093811035, "global_step": 150708, "epoch": 3588} {"train_loss": -6.792101860046387, "global_step": 150709, "epoch": 3588} {"train_loss": -6.672780990600586, "global_step": 150710, "epoch": 3588} {"train_loss": -6.722753524780273, "global_step": 150711, "epoch": 3588} {"train_loss": -6.758365631103516, "global_step": 150712, "epoch": 3588} {"train_loss": -6.760006904602051, "global_step": 150713, "epoch": 3588} {"train_loss": -6.683437347412109, "global_step": 150714, "epoch": 3588} {"train_loss": -6.7308549880981445, "global_step": 150715, "epoch": 3588} {"train_loss": -6.686124801635742, "global_step": 150716, "epoch": 3588} {"train_loss": -6.652023792266846, "global_step": 150717, "epoch": 3588} {"train_loss": -6.775102615356445, "global_step": 150718, "epoch": 3588} {"train_loss": -6.7996673583984375, "global_step": 150719, "epoch": 3588} {"train_loss": -6.714714050292969, "global_step": 150720, "epoch": 3588} {"train_loss": -6.813265800476074, "global_step": 150721, "epoch": 3588} {"train_loss": -6.604535102844238, "global_step": 150722, "epoch": 3588} {"train_loss": -6.77894401550293, "global_step": 150723, "epoch": 3588} {"train_loss": -6.756682872772217, "global_step": 150724, "epoch": 3588} {"train_loss": -6.782829761505127, "global_step": 150725, "epoch": 3588} {"train_loss": -6.7603888511657715, "global_step": 150726, "epoch": 3588} {"train_loss": -6.7528076171875, "global_step": 150727, "epoch": 3588} {"train_loss": -6.714694976806641, "global_step": 150728, "epoch": 3588} {"train_loss": -6.794835567474365, "global_step": 150729, "epoch": 3588} {"train_loss": -6.750515937805176, "global_step": 150730, "epoch": 3588} {"train_loss": -6.69956636428833, "global_step": 150731, "epoch": 3588} {"train_loss": -6.84128475189209, "global_step": 150732, "epoch": 3588} {"train_loss": -6.722906589508057, "global_step": 150733, "epoch": 3588} {"train_loss": -6.8207244873046875, "global_step": 150734, "epoch": 3588} {"train_loss": -6.682644367218018, "global_step": 150735, "epoch": 3588} {"train_loss": -6.753946304321289, "global_step": 150736, "epoch": 3588} {"train_loss": -6.729804300126576, "global_step": 150737, "epoch": 3588, "val_loss": 68597.1875} {"train_loss": -6.689620494842529, "global_step": 150738, "epoch": 3589} {"train_loss": -6.695640563964844, "global_step": 150739, "epoch": 3589} {"train_loss": -6.698143005371094, "global_step": 150740, "epoch": 3589} {"train_loss": -6.680737495422363, "global_step": 150741, "epoch": 3589} {"train_loss": -6.769686698913574, "global_step": 150742, "epoch": 3589} {"train_loss": -6.757770538330078, "global_step": 150743, "epoch": 3589} {"train_loss": -6.763232707977295, "global_step": 150744, "epoch": 3589} {"train_loss": -6.76831579208374, "global_step": 150745, "epoch": 3589} {"train_loss": -6.78377628326416, "global_step": 150746, "epoch": 3589} {"train_loss": -6.849315643310547, "global_step": 150747, "epoch": 3589} {"train_loss": -6.800131797790527, "global_step": 150748, "epoch": 3589} {"train_loss": -6.772276878356934, "global_step": 150749, "epoch": 3589} {"train_loss": -6.714791297912598, "global_step": 150750, "epoch": 3589} {"train_loss": -6.863736152648926, "global_step": 150751, "epoch": 3589} {"train_loss": -6.839535713195801, "global_step": 150752, "epoch": 3589} {"train_loss": -6.744747161865234, "global_step": 150753, "epoch": 3589} {"train_loss": -6.900464057922363, "global_step": 150754, "epoch": 3589} {"train_loss": -6.800508499145508, "global_step": 150755, "epoch": 3589} {"train_loss": -6.8178815841674805, "global_step": 150756, "epoch": 3589} {"train_loss": -6.7776312828063965, "global_step": 150757, "epoch": 3589} {"train_loss": -6.874213218688965, "global_step": 150758, "epoch": 3589} {"train_loss": -6.707175254821777, "global_step": 150759, "epoch": 3589} {"train_loss": -6.788666725158691, "global_step": 150760, "epoch": 3589} {"train_loss": -6.836822032928467, "global_step": 150761, "epoch": 3589} {"train_loss": -6.696167469024658, "global_step": 150762, "epoch": 3589} {"train_loss": -6.756069183349609, "global_step": 150763, "epoch": 3589} {"train_loss": -6.949518203735352, "global_step": 150764, "epoch": 3589} {"train_loss": -6.828907012939453, "global_step": 150765, "epoch": 3589} {"train_loss": -6.860341548919678, "global_step": 150766, "epoch": 3589} {"train_loss": -6.809082984924316, "global_step": 150767, "epoch": 3589} {"train_loss": -6.824040412902832, "global_step": 150768, "epoch": 3589} {"train_loss": -6.888069152832031, "global_step": 150769, "epoch": 3589} {"train_loss": -6.848610877990723, "global_step": 150770, "epoch": 3589} {"train_loss": -6.73061466217041, "global_step": 150771, "epoch": 3589} {"train_loss": -6.845404148101807, "global_step": 150772, "epoch": 3589} {"train_loss": -6.804973602294922, "global_step": 150773, "epoch": 3589} {"train_loss": -6.93251895904541, "global_step": 150774, "epoch": 3589} {"train_loss": -6.808354377746582, "global_step": 150775, "epoch": 3589} {"train_loss": -6.846796989440918, "global_step": 150776, "epoch": 3589} {"train_loss": -6.922560691833496, "global_step": 150777, "epoch": 3589} {"train_loss": -6.807945251464844, "global_step": 150778, "epoch": 3589} {"train_loss": -6.799170641672044, "global_step": 150779, "epoch": 3589, "val_loss": 68248.5390625} {"train_loss": -6.917148113250732, "global_step": 150780, "epoch": 3590} {"train_loss": -6.869480133056641, "global_step": 150781, "epoch": 3590} {"train_loss": -6.7667951583862305, "global_step": 150782, "epoch": 3590} {"train_loss": -6.774971961975098, "global_step": 150783, "epoch": 3590} {"train_loss": -6.939627647399902, "global_step": 150784, "epoch": 3590} {"train_loss": -6.836479663848877, "global_step": 150785, "epoch": 3590} {"train_loss": -6.788649082183838, "global_step": 150786, "epoch": 3590} {"train_loss": -6.879745006561279, "global_step": 150787, "epoch": 3590} {"train_loss": -6.92300271987915, "global_step": 150788, "epoch": 3590} {"train_loss": -6.863262176513672, "global_step": 150789, "epoch": 3590} {"train_loss": -6.8600616455078125, "global_step": 150790, "epoch": 3590} {"train_loss": -6.840541839599609, "global_step": 150791, "epoch": 3590} {"train_loss": -6.845172882080078, "global_step": 150792, "epoch": 3590} {"train_loss": -6.774655342102051, "global_step": 150793, "epoch": 3590} {"train_loss": -6.863255977630615, "global_step": 150794, "epoch": 3590} {"train_loss": -6.855952739715576, "global_step": 150795, "epoch": 3590} {"train_loss": -6.813864707946777, "global_step": 150796, "epoch": 3590} {"train_loss": -6.761529922485352, "global_step": 150797, "epoch": 3590} {"train_loss": -6.806814670562744, "global_step": 150798, "epoch": 3590} {"train_loss": -6.889187812805176, "global_step": 150799, "epoch": 3590} {"train_loss": -6.807887554168701, "global_step": 150800, "epoch": 3590} {"train_loss": -6.850752353668213, "global_step": 150801, "epoch": 3590} {"train_loss": -6.919929504394531, "global_step": 150802, "epoch": 3590} {"train_loss": -6.963789463043213, "global_step": 150803, "epoch": 3590} {"train_loss": -6.828976631164551, "global_step": 150804, "epoch": 3590} {"train_loss": -6.839803695678711, "global_step": 150805, "epoch": 3590} {"train_loss": -6.769535064697266, "global_step": 150806, "epoch": 3590} {"train_loss": -6.748134136199951, "global_step": 150807, "epoch": 3590} {"train_loss": -6.7733154296875, "global_step": 150808, "epoch": 3590} {"train_loss": -6.707300662994385, "global_step": 150809, "epoch": 3590} {"train_loss": -6.723675727844238, "global_step": 150810, "epoch": 3590} {"train_loss": -6.8630571365356445, "global_step": 150811, "epoch": 3590} {"train_loss": -6.949443817138672, "global_step": 150812, "epoch": 3590} {"train_loss": -6.698143005371094, "global_step": 150813, "epoch": 3590} {"train_loss": -6.869637489318848, "global_step": 150814, "epoch": 3590} {"train_loss": -6.874073505401611, "global_step": 150815, "epoch": 3590} {"train_loss": -6.854582786560059, "global_step": 150816, "epoch": 3590} {"train_loss": -6.865359306335449, "global_step": 150817, "epoch": 3590} {"train_loss": -6.825816631317139, "global_step": 150818, "epoch": 3590} {"train_loss": -6.913002014160156, "global_step": 150819, "epoch": 3590} {"train_loss": -6.799431800842285, "global_step": 150820, "epoch": 3590} {"train_loss": -6.837477082297916, "global_step": 150821, "epoch": 3590, "val_loss": 68501.9765625} {"train_loss": -6.780616760253906, "global_step": 150822, "epoch": 3591} {"train_loss": -6.823398590087891, "global_step": 150823, "epoch": 3591} {"train_loss": -6.7659382820129395, "global_step": 150824, "epoch": 3591} {"train_loss": -6.871809005737305, "global_step": 150825, "epoch": 3591} {"train_loss": -6.641411781311035, "global_step": 150826, "epoch": 3591} {"train_loss": -6.857294082641602, "global_step": 150827, "epoch": 3591} {"train_loss": -6.849742889404297, "global_step": 150828, "epoch": 3591} {"train_loss": -6.855045318603516, "global_step": 150829, "epoch": 3591} {"train_loss": -6.886818885803223, "global_step": 150830, "epoch": 3591} {"train_loss": -6.8858771324157715, "global_step": 150831, "epoch": 3591} {"train_loss": -6.87312126159668, "global_step": 150832, "epoch": 3591} {"train_loss": -6.837495803833008, "global_step": 150833, "epoch": 3591} {"train_loss": -6.8129072189331055, "global_step": 150834, "epoch": 3591} {"train_loss": -6.805202484130859, "global_step": 150835, "epoch": 3591} {"train_loss": -7.014222621917725, "global_step": 150836, "epoch": 3591} {"train_loss": -6.904290199279785, "global_step": 150837, "epoch": 3591} {"train_loss": -6.773863792419434, "global_step": 150838, "epoch": 3591} {"train_loss": -6.861847400665283, "global_step": 150839, "epoch": 3591} {"train_loss": -6.819273471832275, "global_step": 150840, "epoch": 3591} {"train_loss": -6.832642555236816, "global_step": 150841, "epoch": 3591} {"train_loss": -6.693294525146484, "global_step": 150842, "epoch": 3591} {"train_loss": -6.818053245544434, "global_step": 150843, "epoch": 3591} {"train_loss": -6.874035835266113, "global_step": 150844, "epoch": 3591} {"train_loss": -6.737324237823486, "global_step": 150845, "epoch": 3591} {"train_loss": -6.877864837646484, "global_step": 150846, "epoch": 3591} {"train_loss": -6.909767150878906, "global_step": 150847, "epoch": 3591} {"train_loss": -6.878289699554443, "global_step": 150848, "epoch": 3591} {"train_loss": -6.904835224151611, "global_step": 150849, "epoch": 3591} {"train_loss": -6.913743019104004, "global_step": 150850, "epoch": 3591} {"train_loss": -6.8212175369262695, "global_step": 150851, "epoch": 3591} {"train_loss": -6.810563564300537, "global_step": 150852, "epoch": 3591} {"train_loss": -6.883967876434326, "global_step": 150853, "epoch": 3591} {"train_loss": -6.820823669433594, "global_step": 150854, "epoch": 3591} {"train_loss": -6.853177070617676, "global_step": 150855, "epoch": 3591} {"train_loss": -6.8099212646484375, "global_step": 150856, "epoch": 3591} {"train_loss": -6.825578212738037, "global_step": 150857, "epoch": 3591} {"train_loss": -6.915563583374023, "global_step": 150858, "epoch": 3591} {"train_loss": -6.752463340759277, "global_step": 150859, "epoch": 3591} {"train_loss": -6.801976680755615, "global_step": 150860, "epoch": 3591} {"train_loss": -6.792168617248535, "global_step": 150861, "epoch": 3591} {"train_loss": -6.823403358459473, "global_step": 150862, "epoch": 3591} {"train_loss": -6.836328063692365, "global_step": 150863, "epoch": 3591, "val_loss": 68508.8671875} {"train_loss": -6.917768478393555, "global_step": 150864, "epoch": 3592} {"train_loss": -6.8420329093933105, "global_step": 150865, "epoch": 3592} {"train_loss": -6.847308158874512, "global_step": 150866, "epoch": 3592} {"train_loss": -6.841753005981445, "global_step": 150867, "epoch": 3592} {"train_loss": -6.82374382019043, "global_step": 150868, "epoch": 3592} {"train_loss": -6.836878299713135, "global_step": 150869, "epoch": 3592} {"train_loss": -6.7989654541015625, "global_step": 150870, "epoch": 3592} {"train_loss": -6.842691421508789, "global_step": 150871, "epoch": 3592} {"train_loss": -6.791663646697998, "global_step": 150872, "epoch": 3592} {"train_loss": -6.6966047286987305, "global_step": 150873, "epoch": 3592} {"train_loss": -6.694772720336914, "global_step": 150874, "epoch": 3592} {"train_loss": -6.8298845291137695, "global_step": 150875, "epoch": 3592} {"train_loss": -6.763463020324707, "global_step": 150876, "epoch": 3592} {"train_loss": -6.765037536621094, "global_step": 150877, "epoch": 3592} {"train_loss": -6.7777252197265625, "global_step": 150878, "epoch": 3592} {"train_loss": -6.800797462463379, "global_step": 150879, "epoch": 3592} {"train_loss": -6.768971920013428, "global_step": 150880, "epoch": 3592} {"train_loss": -6.918201923370361, "global_step": 150881, "epoch": 3592} {"train_loss": -6.7459564208984375, "global_step": 150882, "epoch": 3592} {"train_loss": -6.766324043273926, "global_step": 150883, "epoch": 3592} {"train_loss": -6.8854169845581055, "global_step": 150884, "epoch": 3592} {"train_loss": -6.7686543464660645, "global_step": 150885, "epoch": 3592} {"train_loss": -6.741053104400635, "global_step": 150886, "epoch": 3592} {"train_loss": -6.836441993713379, "global_step": 150887, "epoch": 3592} {"train_loss": -6.848067760467529, "global_step": 150888, "epoch": 3592} {"train_loss": -6.790076732635498, "global_step": 150889, "epoch": 3592} {"train_loss": -6.831974983215332, "global_step": 150890, "epoch": 3592} {"train_loss": -6.857745170593262, "global_step": 150891, "epoch": 3592} {"train_loss": -6.780219554901123, "global_step": 150892, "epoch": 3592} {"train_loss": -6.808959484100342, "global_step": 150893, "epoch": 3592} {"train_loss": -6.80775785446167, "global_step": 150894, "epoch": 3592} {"train_loss": -6.795740127563477, "global_step": 150895, "epoch": 3592} {"train_loss": -6.764754295349121, "global_step": 150896, "epoch": 3592} {"train_loss": -6.8178277015686035, "global_step": 150897, "epoch": 3592} {"train_loss": -6.837512969970703, "global_step": 150898, "epoch": 3592} {"train_loss": -6.694485664367676, "global_step": 150899, "epoch": 3592} {"train_loss": -6.766440391540527, "global_step": 150900, "epoch": 3592} {"train_loss": -6.873333930969238, "global_step": 150901, "epoch": 3592} {"train_loss": -6.693239212036133, "global_step": 150902, "epoch": 3592} {"train_loss": -6.874593734741211, "global_step": 150903, "epoch": 3592} {"train_loss": -6.792004585266113, "global_step": 150904, "epoch": 3592} {"train_loss": -6.800964434941609, "global_step": 150905, "epoch": 3592, "val_loss": 68503.2578125} {"train_loss": -6.684497833251953, "global_step": 150906, "epoch": 3593} {"train_loss": -6.871931076049805, "global_step": 150907, "epoch": 3593} {"train_loss": -6.8817596435546875, "global_step": 150908, "epoch": 3593} {"train_loss": -6.801815032958984, "global_step": 150909, "epoch": 3593} {"train_loss": -6.805144309997559, "global_step": 150910, "epoch": 3593} {"train_loss": -6.822619438171387, "global_step": 150911, "epoch": 3593} {"train_loss": -6.69618034362793, "global_step": 150912, "epoch": 3593} {"train_loss": -6.907233715057373, "global_step": 150913, "epoch": 3593} {"train_loss": -6.8766889572143555, "global_step": 150914, "epoch": 3593} {"train_loss": -6.848397254943848, "global_step": 150915, "epoch": 3593} {"train_loss": -6.907086372375488, "global_step": 150916, "epoch": 3593} {"train_loss": -6.777153491973877, "global_step": 150917, "epoch": 3593} {"train_loss": -6.700763702392578, "global_step": 150918, "epoch": 3593} {"train_loss": -6.8590006828308105, "global_step": 150919, "epoch": 3593} {"train_loss": -6.825270652770996, "global_step": 150920, "epoch": 3593} {"train_loss": -6.87931489944458, "global_step": 150921, "epoch": 3593} {"train_loss": -6.789379119873047, "global_step": 150922, "epoch": 3593} {"train_loss": -6.807345390319824, "global_step": 150923, "epoch": 3593} {"train_loss": -6.938817024230957, "global_step": 150924, "epoch": 3593} {"train_loss": -6.726965427398682, "global_step": 150925, "epoch": 3593} {"train_loss": -6.818758964538574, "global_step": 150926, "epoch": 3593} {"train_loss": -6.770908355712891, "global_step": 150927, "epoch": 3593} {"train_loss": -6.706840515136719, "global_step": 150928, "epoch": 3593} {"train_loss": -6.752659797668457, "global_step": 150929, "epoch": 3593} {"train_loss": -6.775946617126465, "global_step": 150930, "epoch": 3593} {"train_loss": -6.803197860717773, "global_step": 150931, "epoch": 3593} {"train_loss": -6.844393730163574, "global_step": 150932, "epoch": 3593} {"train_loss": -6.773697853088379, "global_step": 150933, "epoch": 3593} {"train_loss": -6.827999114990234, "global_step": 150934, "epoch": 3593} {"train_loss": -6.718085765838623, "global_step": 150935, "epoch": 3593} {"train_loss": -6.707516193389893, "global_step": 150936, "epoch": 3593} {"train_loss": -6.7759857177734375, "global_step": 150937, "epoch": 3593} {"train_loss": -6.8602294921875, "global_step": 150938, "epoch": 3593} {"train_loss": -6.834261894226074, "global_step": 150939, "epoch": 3593} {"train_loss": -6.697317600250244, "global_step": 150940, "epoch": 3593} {"train_loss": -6.855958938598633, "global_step": 150941, "epoch": 3593} {"train_loss": -6.831764221191406, "global_step": 150942, "epoch": 3593} {"train_loss": -6.864612579345703, "global_step": 150943, "epoch": 3593} {"train_loss": -6.706109046936035, "global_step": 150944, "epoch": 3593} {"train_loss": -6.688249588012695, "global_step": 150945, "epoch": 3593} {"train_loss": -6.919654369354248, "global_step": 150946, "epoch": 3593} {"train_loss": -6.8023171084267755, "global_step": 150947, "epoch": 3593, "val_loss": 68491.6796875} {"train_loss": -6.768352508544922, "global_step": 150948, "epoch": 3594} {"train_loss": -6.820404052734375, "global_step": 150949, "epoch": 3594} {"train_loss": -6.719756126403809, "global_step": 150950, "epoch": 3594} {"train_loss": -6.722531318664551, "global_step": 150951, "epoch": 3594} {"train_loss": -6.721282482147217, "global_step": 150952, "epoch": 3594} {"train_loss": -6.821842193603516, "global_step": 150953, "epoch": 3594} {"train_loss": -6.845065116882324, "global_step": 150954, "epoch": 3594} {"train_loss": -6.746611595153809, "global_step": 150955, "epoch": 3594} {"train_loss": -6.706449508666992, "global_step": 150956, "epoch": 3594} {"train_loss": -6.940832138061523, "global_step": 150957, "epoch": 3594} {"train_loss": -6.702644348144531, "global_step": 150958, "epoch": 3594} {"train_loss": -6.799299240112305, "global_step": 150959, "epoch": 3594} {"train_loss": -6.804854393005371, "global_step": 150960, "epoch": 3594} {"train_loss": -6.640952110290527, "global_step": 150961, "epoch": 3594} {"train_loss": -6.823208808898926, "global_step": 150962, "epoch": 3594} {"train_loss": -6.758489608764648, "global_step": 150963, "epoch": 3594} {"train_loss": -6.740185737609863, "global_step": 150964, "epoch": 3594} {"train_loss": -6.887030124664307, "global_step": 150965, "epoch": 3594} {"train_loss": -6.799992561340332, "global_step": 150966, "epoch": 3594} {"train_loss": -6.770663261413574, "global_step": 150967, "epoch": 3594} {"train_loss": -6.785670757293701, "global_step": 150968, "epoch": 3594} {"train_loss": -6.832425117492676, "global_step": 150969, "epoch": 3594} {"train_loss": -6.827402114868164, "global_step": 150970, "epoch": 3594} {"train_loss": -6.795814514160156, "global_step": 150971, "epoch": 3594} {"train_loss": -6.837309837341309, "global_step": 150972, "epoch": 3594} {"train_loss": -6.774091720581055, "global_step": 150973, "epoch": 3594} {"train_loss": -6.834875583648682, "global_step": 150974, "epoch": 3594} {"train_loss": -6.777996063232422, "global_step": 150975, "epoch": 3594} {"train_loss": -6.906376838684082, "global_step": 150976, "epoch": 3594} {"train_loss": -6.898908615112305, "global_step": 150977, "epoch": 3594} {"train_loss": -6.784932613372803, "global_step": 150978, "epoch": 3594} {"train_loss": -6.781668186187744, "global_step": 150979, "epoch": 3594} {"train_loss": -6.900572776794434, "global_step": 150980, "epoch": 3594} {"train_loss": -6.734343528747559, "global_step": 150981, "epoch": 3594} {"train_loss": -6.695746421813965, "global_step": 150982, "epoch": 3594} {"train_loss": -6.75502872467041, "global_step": 150983, "epoch": 3594} {"train_loss": -6.730491638183594, "global_step": 150984, "epoch": 3594} {"train_loss": -6.726215839385986, "global_step": 150985, "epoch": 3594} {"train_loss": -6.833165168762207, "global_step": 150986, "epoch": 3594} {"train_loss": -6.667960166931152, "global_step": 150987, "epoch": 3594} {"train_loss": -6.6376953125, "global_step": 150988, "epoch": 3594} {"train_loss": -6.783336037681217, "global_step": 150989, "epoch": 3594, "val_loss": 68392.3046875} {"train_loss": -6.774360179901123, "global_step": 150990, "epoch": 3595} {"train_loss": -6.81452751159668, "global_step": 150991, "epoch": 3595} {"train_loss": -6.832064628601074, "global_step": 150992, "epoch": 3595} {"train_loss": -6.643877029418945, "global_step": 150993, "epoch": 3595} {"train_loss": -6.738409042358398, "global_step": 150994, "epoch": 3595} {"train_loss": -6.805232524871826, "global_step": 150995, "epoch": 3595} {"train_loss": -6.8101654052734375, "global_step": 150996, "epoch": 3595} {"train_loss": -6.733588695526123, "global_step": 150997, "epoch": 3595} {"train_loss": -6.765376091003418, "global_step": 150998, "epoch": 3595} {"train_loss": -6.697373867034912, "global_step": 150999, "epoch": 3595} {"train_loss": -6.857544422149658, "global_step": 151000, "epoch": 3595} {"train_loss": -6.7870707511901855, "global_step": 151001, "epoch": 3595} {"train_loss": -6.848666667938232, "global_step": 151002, "epoch": 3595} {"train_loss": -6.826606750488281, "global_step": 151003, "epoch": 3595} {"train_loss": -6.700413703918457, "global_step": 151004, "epoch": 3595} {"train_loss": -6.847029685974121, "global_step": 151005, "epoch": 3595} {"train_loss": -6.692304611206055, "global_step": 151006, "epoch": 3595} {"train_loss": -6.760943412780762, "global_step": 151007, "epoch": 3595} {"train_loss": -6.826382637023926, "global_step": 151008, "epoch": 3595} {"train_loss": -6.79374361038208, "global_step": 151009, "epoch": 3595} {"train_loss": -6.7959699630737305, "global_step": 151010, "epoch": 3595} {"train_loss": -6.718862533569336, "global_step": 151011, "epoch": 3595} {"train_loss": -6.891566753387451, "global_step": 151012, "epoch": 3595} {"train_loss": -6.705097198486328, "global_step": 151013, "epoch": 3595} {"train_loss": -6.750174522399902, "global_step": 151014, "epoch": 3595} {"train_loss": -6.764660835266113, "global_step": 151015, "epoch": 3595} {"train_loss": -6.801327705383301, "global_step": 151016, "epoch": 3595} {"train_loss": -6.790976047515869, "global_step": 151017, "epoch": 3595} {"train_loss": -6.701501846313477, "global_step": 151018, "epoch": 3595} {"train_loss": -6.834468841552734, "global_step": 151019, "epoch": 3595} {"train_loss": -6.886277198791504, "global_step": 151020, "epoch": 3595} {"train_loss": -6.714879512786865, "global_step": 151021, "epoch": 3595} {"train_loss": -6.7388200759887695, "global_step": 151022, "epoch": 3595} {"train_loss": -6.793456077575684, "global_step": 151023, "epoch": 3595} {"train_loss": -6.873661041259766, "global_step": 151024, "epoch": 3595} {"train_loss": -6.750276565551758, "global_step": 151025, "epoch": 3595} {"train_loss": -6.870258331298828, "global_step": 151026, "epoch": 3595} {"train_loss": -6.869575500488281, "global_step": 151027, "epoch": 3595} {"train_loss": -6.817117691040039, "global_step": 151028, "epoch": 3595} {"train_loss": -6.939797878265381, "global_step": 151029, "epoch": 3595} {"train_loss": -6.8385114669799805, "global_step": 151030, "epoch": 3595} {"train_loss": -6.791366259256999, "global_step": 151031, "epoch": 3595, "val_loss": 68389.2421875} {"train_loss": -6.819247245788574, "global_step": 151032, "epoch": 3596} {"train_loss": -6.868383884429932, "global_step": 151033, "epoch": 3596} {"train_loss": -6.891388416290283, "global_step": 151034, "epoch": 3596} {"train_loss": -6.856075286865234, "global_step": 151035, "epoch": 3596} {"train_loss": -6.937917232513428, "global_step": 151036, "epoch": 3596} {"train_loss": -6.851885795593262, "global_step": 151037, "epoch": 3596} {"train_loss": -6.9108662605285645, "global_step": 151038, "epoch": 3596} {"train_loss": -6.861405849456787, "global_step": 151039, "epoch": 3596} {"train_loss": -6.999979496002197, "global_step": 151040, "epoch": 3596} {"train_loss": -6.851744174957275, "global_step": 151041, "epoch": 3596} {"train_loss": -6.965397834777832, "global_step": 151042, "epoch": 3596} {"train_loss": -6.868160247802734, "global_step": 151043, "epoch": 3596} {"train_loss": -6.8509063720703125, "global_step": 151044, "epoch": 3596} {"train_loss": -6.822295188903809, "global_step": 151045, "epoch": 3596} {"train_loss": -6.84832763671875, "global_step": 151046, "epoch": 3596} {"train_loss": -6.820684432983398, "global_step": 151047, "epoch": 3596} {"train_loss": -6.720052242279053, "global_step": 151048, "epoch": 3596} {"train_loss": -6.846048831939697, "global_step": 151049, "epoch": 3596} {"train_loss": -6.864648818969727, "global_step": 151050, "epoch": 3596} {"train_loss": -6.825008392333984, "global_step": 151051, "epoch": 3596} {"train_loss": -6.795452117919922, "global_step": 151052, "epoch": 3596} {"train_loss": -6.768719673156738, "global_step": 151053, "epoch": 3596} {"train_loss": -6.954642295837402, "global_step": 151054, "epoch": 3596} {"train_loss": -6.845340728759766, "global_step": 151055, "epoch": 3596} {"train_loss": -6.8109941482543945, "global_step": 151056, "epoch": 3596} {"train_loss": -6.960186004638672, "global_step": 151057, "epoch": 3596} {"train_loss": -6.938153266906738, "global_step": 151058, "epoch": 3596} {"train_loss": -6.902370452880859, "global_step": 151059, "epoch": 3596} {"train_loss": -6.905304431915283, "global_step": 151060, "epoch": 3596} {"train_loss": -6.85622501373291, "global_step": 151061, "epoch": 3596} {"train_loss": -6.764310836791992, "global_step": 151062, "epoch": 3596} {"train_loss": -6.781350135803223, "global_step": 151063, "epoch": 3596} {"train_loss": -6.937112808227539, "global_step": 151064, "epoch": 3596} {"train_loss": -6.801912307739258, "global_step": 151065, "epoch": 3596} {"train_loss": -6.91940975189209, "global_step": 151066, "epoch": 3596} {"train_loss": -6.6699538230896, "global_step": 151067, "epoch": 3596} {"train_loss": -6.844668388366699, "global_step": 151068, "epoch": 3596} {"train_loss": -6.800138473510742, "global_step": 151069, "epoch": 3596} {"train_loss": -6.777414798736572, "global_step": 151070, "epoch": 3596} {"train_loss": -6.803754806518555, "global_step": 151071, "epoch": 3596} {"train_loss": -6.751162528991699, "global_step": 151072, "epoch": 3596} {"train_loss": -6.85103398277646, "global_step": 151073, "epoch": 3596, "val_loss": 68367.0859375} {"train_loss": -6.776260852813721, "global_step": 151074, "epoch": 3597} {"train_loss": -6.86945104598999, "global_step": 151075, "epoch": 3597} {"train_loss": -6.899974346160889, "global_step": 151076, "epoch": 3597} {"train_loss": -6.773069858551025, "global_step": 151077, "epoch": 3597} {"train_loss": -6.76900577545166, "global_step": 151078, "epoch": 3597} {"train_loss": -6.722731590270996, "global_step": 151079, "epoch": 3597} {"train_loss": -6.885846138000488, "global_step": 151080, "epoch": 3597} {"train_loss": -6.840525150299072, "global_step": 151081, "epoch": 3597} {"train_loss": -6.759274482727051, "global_step": 151082, "epoch": 3597} {"train_loss": -6.818431854248047, "global_step": 151083, "epoch": 3597} {"train_loss": -6.771461009979248, "global_step": 151084, "epoch": 3597} {"train_loss": -6.853130340576172, "global_step": 151085, "epoch": 3597} {"train_loss": -6.684772968292236, "global_step": 151086, "epoch": 3597} {"train_loss": -6.742463111877441, "global_step": 151087, "epoch": 3597} {"train_loss": -6.839910507202148, "global_step": 151088, "epoch": 3597} {"train_loss": -6.835569381713867, "global_step": 151089, "epoch": 3597} {"train_loss": -6.795114040374756, "global_step": 151090, "epoch": 3597} {"train_loss": -6.7415361404418945, "global_step": 151091, "epoch": 3597} {"train_loss": -6.830134391784668, "global_step": 151092, "epoch": 3597} {"train_loss": -6.79411506652832, "global_step": 151093, "epoch": 3597} {"train_loss": -6.821911334991455, "global_step": 151094, "epoch": 3597} {"train_loss": -6.78016471862793, "global_step": 151095, "epoch": 3597} {"train_loss": -6.783791542053223, "global_step": 151096, "epoch": 3597} {"train_loss": -6.819169044494629, "global_step": 151097, "epoch": 3597} {"train_loss": -6.745379447937012, "global_step": 151098, "epoch": 3597} {"train_loss": -6.745943546295166, "global_step": 151099, "epoch": 3597} {"train_loss": -6.84279727935791, "global_step": 151100, "epoch": 3597} {"train_loss": -6.80746603012085, "global_step": 151101, "epoch": 3597} {"train_loss": -6.759413719177246, "global_step": 151102, "epoch": 3597} {"train_loss": -6.823424339294434, "global_step": 151103, "epoch": 3597} {"train_loss": -6.7550225257873535, "global_step": 151104, "epoch": 3597} {"train_loss": -6.888286590576172, "global_step": 151105, "epoch": 3597} {"train_loss": -6.863706588745117, "global_step": 151106, "epoch": 3597} {"train_loss": -6.810224533081055, "global_step": 151107, "epoch": 3597} {"train_loss": -6.899114608764648, "global_step": 151108, "epoch": 3597} {"train_loss": -6.789658546447754, "global_step": 151109, "epoch": 3597} {"train_loss": -6.788039684295654, "global_step": 151110, "epoch": 3597} {"train_loss": -6.6454973220825195, "global_step": 151111, "epoch": 3597} {"train_loss": -6.724730491638184, "global_step": 151112, "epoch": 3597} {"train_loss": -6.919370651245117, "global_step": 151113, "epoch": 3597} {"train_loss": -6.679498672485352, "global_step": 151114, "epoch": 3597} {"train_loss": -6.797907250268119, "global_step": 151115, "epoch": 3597, "val_loss": 68747.7578125} {"train_loss": -6.677890777587891, "global_step": 151116, "epoch": 3598} {"train_loss": -6.834196090698242, "global_step": 151117, "epoch": 3598} {"train_loss": -6.926497459411621, "global_step": 151118, "epoch": 3598} {"train_loss": -6.778841972351074, "global_step": 151119, "epoch": 3598} {"train_loss": -6.774712562561035, "global_step": 151120, "epoch": 3598} {"train_loss": -6.794425964355469, "global_step": 151121, "epoch": 3598} {"train_loss": -6.774681568145752, "global_step": 151122, "epoch": 3598} {"train_loss": -6.801536560058594, "global_step": 151123, "epoch": 3598} {"train_loss": -6.851034641265869, "global_step": 151124, "epoch": 3598} {"train_loss": -6.834562301635742, "global_step": 151125, "epoch": 3598} {"train_loss": -6.86631965637207, "global_step": 151126, "epoch": 3598} {"train_loss": -6.647928714752197, "global_step": 151127, "epoch": 3598} {"train_loss": -6.764266014099121, "global_step": 151128, "epoch": 3598} {"train_loss": -6.795520782470703, "global_step": 151129, "epoch": 3598} {"train_loss": -6.814907073974609, "global_step": 151130, "epoch": 3598} {"train_loss": -6.802826881408691, "global_step": 151131, "epoch": 3598} {"train_loss": -6.886319637298584, "global_step": 151132, "epoch": 3598} {"train_loss": -6.8705525398254395, "global_step": 151133, "epoch": 3598} {"train_loss": -6.992990493774414, "global_step": 151134, "epoch": 3598} {"train_loss": -6.837723731994629, "global_step": 151135, "epoch": 3598} {"train_loss": -6.877671241760254, "global_step": 151136, "epoch": 3598} {"train_loss": -6.800559997558594, "global_step": 151137, "epoch": 3598} {"train_loss": -6.94532585144043, "global_step": 151138, "epoch": 3598} {"train_loss": -6.754171371459961, "global_step": 151139, "epoch": 3598} {"train_loss": -6.8206377029418945, "global_step": 151140, "epoch": 3598} {"train_loss": -6.699894428253174, "global_step": 151141, "epoch": 3598} {"train_loss": -6.792285919189453, "global_step": 151142, "epoch": 3598} {"train_loss": -6.685511112213135, "global_step": 151143, "epoch": 3598} {"train_loss": -6.820866107940674, "global_step": 151144, "epoch": 3598} {"train_loss": -6.786461353302002, "global_step": 151145, "epoch": 3598} {"train_loss": -6.779599666595459, "global_step": 151146, "epoch": 3598} {"train_loss": -6.807456016540527, "global_step": 151147, "epoch": 3598} {"train_loss": -6.61207389831543, "global_step": 151148, "epoch": 3598} {"train_loss": -6.7073540687561035, "global_step": 151149, "epoch": 3598} {"train_loss": -6.823704719543457, "global_step": 151150, "epoch": 3598} {"train_loss": -6.7643327713012695, "global_step": 151151, "epoch": 3598} {"train_loss": -6.74183464050293, "global_step": 151152, "epoch": 3598} {"train_loss": -6.840795993804932, "global_step": 151153, "epoch": 3598} {"train_loss": -6.839453220367432, "global_step": 151154, "epoch": 3598} {"train_loss": -6.792971134185791, "global_step": 151155, "epoch": 3598} {"train_loss": -6.775721073150635, "global_step": 151156, "epoch": 3598} {"train_loss": -6.801085472106934, "global_step": 151157, "epoch": 3598, "val_loss": 68701.3828125} {"train_loss": -6.836461067199707, "global_step": 151158, "epoch": 3599} {"train_loss": -6.772254943847656, "global_step": 151159, "epoch": 3599} {"train_loss": -6.85402250289917, "global_step": 151160, "epoch": 3599} {"train_loss": -6.838401794433594, "global_step": 151161, "epoch": 3599} {"train_loss": -6.823790550231934, "global_step": 151162, "epoch": 3599} {"train_loss": -6.734794616699219, "global_step": 151163, "epoch": 3599} {"train_loss": -6.874734878540039, "global_step": 151164, "epoch": 3599} {"train_loss": -6.864203453063965, "global_step": 151165, "epoch": 3599} {"train_loss": -6.8498454093933105, "global_step": 151166, "epoch": 3599} {"train_loss": -6.861094951629639, "global_step": 151167, "epoch": 3599} {"train_loss": -6.867978096008301, "global_step": 151168, "epoch": 3599} {"train_loss": -6.93209171295166, "global_step": 151169, "epoch": 3599} {"train_loss": -6.82131290435791, "global_step": 151170, "epoch": 3599} {"train_loss": -6.858885765075684, "global_step": 151171, "epoch": 3599} {"train_loss": -6.764747619628906, "global_step": 151172, "epoch": 3599} {"train_loss": -6.894179344177246, "global_step": 151173, "epoch": 3599} {"train_loss": -6.860304832458496, "global_step": 151174, "epoch": 3599} {"train_loss": -6.81675910949707, "global_step": 151175, "epoch": 3599} {"train_loss": -6.731540679931641, "global_step": 151176, "epoch": 3599} {"train_loss": -6.811138153076172, "global_step": 151177, "epoch": 3599} {"train_loss": -6.920767784118652, "global_step": 151178, "epoch": 3599} {"train_loss": -6.817352294921875, "global_step": 151179, "epoch": 3599} {"train_loss": -6.9255757331848145, "global_step": 151180, "epoch": 3599} {"train_loss": -6.792057514190674, "global_step": 151181, "epoch": 3599} {"train_loss": -6.840206623077393, "global_step": 151182, "epoch": 3599} {"train_loss": -6.74841833114624, "global_step": 151183, "epoch": 3599} {"train_loss": -6.868753910064697, "global_step": 151184, "epoch": 3599} {"train_loss": -6.811612129211426, "global_step": 151185, "epoch": 3599} {"train_loss": -6.87824821472168, "global_step": 151186, "epoch": 3599} {"train_loss": -6.862220764160156, "global_step": 151187, "epoch": 3599} {"train_loss": -6.893307685852051, "global_step": 151188, "epoch": 3599} {"train_loss": -6.773662090301514, "global_step": 151189, "epoch": 3599} {"train_loss": -6.867722511291504, "global_step": 151190, "epoch": 3599} {"train_loss": -6.9072794914245605, "global_step": 151191, "epoch": 3599} {"train_loss": -6.834397792816162, "global_step": 151192, "epoch": 3599} {"train_loss": -6.883029460906982, "global_step": 151193, "epoch": 3599} {"train_loss": -6.884930610656738, "global_step": 151194, "epoch": 3599} {"train_loss": -6.805036544799805, "global_step": 151195, "epoch": 3599} {"train_loss": -6.973889350891113, "global_step": 151196, "epoch": 3599} {"train_loss": -6.834722518920898, "global_step": 151197, "epoch": 3599} {"train_loss": -6.902456283569336, "global_step": 151198, "epoch": 3599} {"train_loss": -6.8468634855179555, "global_step": 151199, "epoch": 3599, "val_loss": 68443.6484375} {"train_loss": -6.791127681732178, "global_step": 151200, "epoch": 3600} {"train_loss": -6.818902969360352, "global_step": 151201, "epoch": 3600} {"train_loss": -6.769556999206543, "global_step": 151202, "epoch": 3600} {"train_loss": -6.819838523864746, "global_step": 151203, "epoch": 3600} {"train_loss": -6.798198699951172, "global_step": 151204, "epoch": 3600} {"train_loss": -6.8417205810546875, "global_step": 151205, "epoch": 3600} {"train_loss": -6.7301435470581055, "global_step": 151206, "epoch": 3600} {"train_loss": -6.807447910308838, "global_step": 151207, "epoch": 3600} {"train_loss": -6.766499042510986, "global_step": 151208, "epoch": 3600} {"train_loss": -6.770695209503174, "global_step": 151209, "epoch": 3600} {"train_loss": -6.874444484710693, "global_step": 151210, "epoch": 3600} {"train_loss": -6.847312927246094, "global_step": 151211, "epoch": 3600} {"train_loss": -6.849035739898682, "global_step": 151212, "epoch": 3600} {"train_loss": -6.878798961639404, "global_step": 151213, "epoch": 3600} {"train_loss": -6.903749465942383, "global_step": 151214, "epoch": 3600} {"train_loss": -6.911012649536133, "global_step": 151215, "epoch": 3600} {"train_loss": -6.782271385192871, "global_step": 151216, "epoch": 3600} {"train_loss": -6.855204105377197, "global_step": 151217, "epoch": 3600} {"train_loss": -6.873293876647949, "global_step": 151218, "epoch": 3600} {"train_loss": -6.765566825866699, "global_step": 151219, "epoch": 3600} {"train_loss": -6.79963493347168, "global_step": 151220, "epoch": 3600} {"train_loss": -6.864163398742676, "global_step": 151221, "epoch": 3600} {"train_loss": -6.76236629486084, "global_step": 151222, "epoch": 3600} {"train_loss": -6.719603061676025, "global_step": 151223, "epoch": 3600} {"train_loss": -6.867579460144043, "global_step": 151224, "epoch": 3600} {"train_loss": -6.856472969055176, "global_step": 151225, "epoch": 3600} {"train_loss": -6.888455867767334, "global_step": 151226, "epoch": 3600} {"train_loss": -6.891563415527344, "global_step": 151227, "epoch": 3600} {"train_loss": -6.833939552307129, "global_step": 151228, "epoch": 3600} {"train_loss": -6.804948806762695, "global_step": 151229, "epoch": 3600} {"train_loss": -6.912938117980957, "global_step": 151230, "epoch": 3600} {"train_loss": -6.808084487915039, "global_step": 151231, "epoch": 3600} {"train_loss": -6.889233589172363, "global_step": 151232, "epoch": 3600} {"train_loss": -6.819238662719727, "global_step": 151233, "epoch": 3600} {"train_loss": -6.921352386474609, "global_step": 151234, "epoch": 3600} {"train_loss": -6.847588062286377, "global_step": 151235, "epoch": 3600} {"train_loss": -6.929251670837402, "global_step": 151236, "epoch": 3600} {"train_loss": -6.867743968963623, "global_step": 151237, "epoch": 3600} {"train_loss": -6.763428211212158, "global_step": 151238, "epoch": 3600} {"train_loss": -6.833829879760742, "global_step": 151239, "epoch": 3600} {"train_loss": -6.904733180999756, "global_step": 151240, "epoch": 3600} {"train_loss": -6.831564619427636, "global_step": 151241, "epoch": 3600, "train/sim_max_reward_0": 0.6504444901756982, "train/sim_max_reward_1": 0.9368731153997962, "train/sim_max_reward_2": 0.6308977659839872, "train/sim_max_reward_3": 0.12948057410417446, "train/sim_max_reward_4": 0.47575377140347186, "train/sim_max_reward_5": 0.8062135307363463, "test/sim_max_reward_4400000": 0.3117710009205282, "test/sim_max_reward_4400001": 0.9642232716279483, "test/sim_max_reward_4400002": 0.3408802161805403, "test/sim_max_reward_4400003": 0.9555845105721376, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.987760306559018, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.30405914742112583, "test/sim_max_reward_4400009": 0.8782143204471891, "test/sim_max_reward_4400010": 0.9204546808313172, "test/sim_max_reward_4400011": 0.07858523552055459, "test/sim_max_reward_4400012": 0.9721106771644353, "test/sim_max_reward_4400013": 0.8894037919987559, "test/sim_max_reward_4400014": 0.9842987464586402, "test/sim_max_reward_4400015": 0.992743024657877, "test/sim_max_reward_4400016": 0.10443910322931796, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.25847256298775756, "test/sim_max_reward_4400019": 0.002815644177284741, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.31748376108648907, "test/sim_max_reward_4400023": 0.9338589530641191, "test/sim_max_reward_4400024": 0.9685336344655091, "test/sim_max_reward_4400025": 0.25659628820057645, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.011793835871726142, "test/sim_max_reward_4400028": 0.9806353846632669, "test/sim_max_reward_4400029": 0.7079038322904095, "test/sim_max_reward_4400030": 0.9016903981897109, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9948991383168833, "test/sim_max_reward_4400034": 0.9184277200388965, "test/sim_max_reward_4400035": 0.39615151322251047, "test/sim_max_reward_4400036": 0.4032598211592142, "test/sim_max_reward_4400037": 0.9308848626336154, "test/sim_max_reward_4400038": 0.9504456765932122, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.81494098520961, "test/sim_max_reward_4400042": 0.888419597574043, "test/sim_max_reward_4400043": 0.9269093689230751, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9699004948936684, "test/sim_max_reward_4400046": 0.8681109187604896, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.9540180572839927, "train/mean_score": 0.6049438746339124, "test/mean_score": 0.6102824147835133, "val_loss": 68425.3125} {"train_loss": -6.905396461486816, "global_step": 151242, "epoch": 3601} {"train_loss": -6.669523239135742, "global_step": 151243, "epoch": 3601} {"train_loss": -6.8879714012146, "global_step": 151244, "epoch": 3601} {"train_loss": -6.743443489074707, "global_step": 151245, "epoch": 3601} {"train_loss": -6.836694717407227, "global_step": 151246, "epoch": 3601} {"train_loss": -6.696202278137207, "global_step": 151247, "epoch": 3601} {"train_loss": -6.57579231262207, "global_step": 151248, "epoch": 3601} {"train_loss": -6.581943511962891, "global_step": 151249, "epoch": 3601} {"train_loss": -6.663713455200195, "global_step": 151250, "epoch": 3601} {"train_loss": -6.646365165710449, "global_step": 151251, "epoch": 3601} {"train_loss": -6.721485614776611, "global_step": 151252, "epoch": 3601} {"train_loss": -6.615290641784668, "global_step": 151253, "epoch": 3601} {"train_loss": -6.619304656982422, "global_step": 151254, "epoch": 3601} {"train_loss": -6.628627777099609, "global_step": 151255, "epoch": 3601} {"train_loss": -6.540399551391602, "global_step": 151256, "epoch": 3601} {"train_loss": -6.714290142059326, "global_step": 151257, "epoch": 3601} {"train_loss": -6.698660850524902, "global_step": 151258, "epoch": 3601} {"train_loss": -6.736187934875488, "global_step": 151259, "epoch": 3601} {"train_loss": -6.6937785148620605, "global_step": 151260, "epoch": 3601} {"train_loss": -6.598393440246582, "global_step": 151261, "epoch": 3601} {"train_loss": -6.7368388175964355, "global_step": 151262, "epoch": 3601} {"train_loss": -6.649312973022461, "global_step": 151263, "epoch": 3601} {"train_loss": -6.730558395385742, "global_step": 151264, "epoch": 3601} {"train_loss": -6.7119035720825195, "global_step": 151265, "epoch": 3601} {"train_loss": -6.74429178237915, "global_step": 151266, "epoch": 3601} {"train_loss": -6.706634521484375, "global_step": 151267, "epoch": 3601} {"train_loss": -6.677243232727051, "global_step": 151268, "epoch": 3601} {"train_loss": -6.777139663696289, "global_step": 151269, "epoch": 3601} {"train_loss": -6.7508544921875, "global_step": 151270, "epoch": 3601} {"train_loss": -6.879329681396484, "global_step": 151271, "epoch": 3601} {"train_loss": -6.80362606048584, "global_step": 151272, "epoch": 3601} {"train_loss": -6.77786922454834, "global_step": 151273, "epoch": 3601} {"train_loss": -6.791360855102539, "global_step": 151274, "epoch": 3601} {"train_loss": -6.8246588706970215, "global_step": 151275, "epoch": 3601} {"train_loss": -6.667551040649414, "global_step": 151276, "epoch": 3601} {"train_loss": -6.896023750305176, "global_step": 151277, "epoch": 3601} {"train_loss": -6.8110151290893555, "global_step": 151278, "epoch": 3601} {"train_loss": -6.797604084014893, "global_step": 151279, "epoch": 3601} {"train_loss": -6.889744758605957, "global_step": 151280, "epoch": 3601} {"train_loss": -6.840151786804199, "global_step": 151281, "epoch": 3601} {"train_loss": -6.910490036010742, "global_step": 151282, "epoch": 3601} {"train_loss": -6.73756574449085, "global_step": 151283, "epoch": 3601, "val_loss": 68476.609375} {"train_loss": -6.776811122894287, "global_step": 151284, "epoch": 3602} {"train_loss": -6.9057769775390625, "global_step": 151285, "epoch": 3602} {"train_loss": -6.935273170471191, "global_step": 151286, "epoch": 3602} {"train_loss": -6.792109489440918, "global_step": 151287, "epoch": 3602} {"train_loss": -6.995121955871582, "global_step": 151288, "epoch": 3602} {"train_loss": -6.929976940155029, "global_step": 151289, "epoch": 3602} {"train_loss": -6.919711112976074, "global_step": 151290, "epoch": 3602} {"train_loss": -6.882521629333496, "global_step": 151291, "epoch": 3602} {"train_loss": -6.821978569030762, "global_step": 151292, "epoch": 3602} {"train_loss": -6.810336589813232, "global_step": 151293, "epoch": 3602} {"train_loss": -6.770061016082764, "global_step": 151294, "epoch": 3602} {"train_loss": -6.817286491394043, "global_step": 151295, "epoch": 3602} {"train_loss": -6.7865142822265625, "global_step": 151296, "epoch": 3602} {"train_loss": -6.796545028686523, "global_step": 151297, "epoch": 3602} {"train_loss": -6.74308967590332, "global_step": 151298, "epoch": 3602} {"train_loss": -6.861835479736328, "global_step": 151299, "epoch": 3602} {"train_loss": -6.918115615844727, "global_step": 151300, "epoch": 3602} {"train_loss": -6.764963626861572, "global_step": 151301, "epoch": 3602} {"train_loss": -6.770476341247559, "global_step": 151302, "epoch": 3602} {"train_loss": -6.626376152038574, "global_step": 151303, "epoch": 3602} {"train_loss": -6.809205532073975, "global_step": 151304, "epoch": 3602} {"train_loss": -6.816455841064453, "global_step": 151305, "epoch": 3602} {"train_loss": -6.800357818603516, "global_step": 151306, "epoch": 3602} {"train_loss": -6.740303039550781, "global_step": 151307, "epoch": 3602} {"train_loss": -6.868108749389648, "global_step": 151308, "epoch": 3602} {"train_loss": -6.8978166580200195, "global_step": 151309, "epoch": 3602} {"train_loss": -6.7922749519348145, "global_step": 151310, "epoch": 3602} {"train_loss": -6.884466171264648, "global_step": 151311, "epoch": 3602} {"train_loss": -6.753713607788086, "global_step": 151312, "epoch": 3602} {"train_loss": -6.828341484069824, "global_step": 151313, "epoch": 3602} {"train_loss": -6.8260178565979, "global_step": 151314, "epoch": 3602} {"train_loss": -6.772904396057129, "global_step": 151315, "epoch": 3602} {"train_loss": -6.73646354675293, "global_step": 151316, "epoch": 3602} {"train_loss": -6.8758063316345215, "global_step": 151317, "epoch": 3602} {"train_loss": -6.801380634307861, "global_step": 151318, "epoch": 3602} {"train_loss": -6.826724052429199, "global_step": 151319, "epoch": 3602} {"train_loss": -6.772815704345703, "global_step": 151320, "epoch": 3602} {"train_loss": -6.922076225280762, "global_step": 151321, "epoch": 3602} {"train_loss": -6.782559394836426, "global_step": 151322, "epoch": 3602} {"train_loss": -6.763958930969238, "global_step": 151323, "epoch": 3602} {"train_loss": -6.943408966064453, "global_step": 151324, "epoch": 3602} {"train_loss": -6.825043383098784, "global_step": 151325, "epoch": 3602, "val_loss": 68319.6953125} {"train_loss": -6.79934549331665, "global_step": 151326, "epoch": 3603} {"train_loss": -6.91251802444458, "global_step": 151327, "epoch": 3603} {"train_loss": -6.813844680786133, "global_step": 151328, "epoch": 3603} {"train_loss": -6.837772369384766, "global_step": 151329, "epoch": 3603} {"train_loss": -6.886645317077637, "global_step": 151330, "epoch": 3603} {"train_loss": -6.848659038543701, "global_step": 151331, "epoch": 3603} {"train_loss": -6.788000106811523, "global_step": 151332, "epoch": 3603} {"train_loss": -6.8741960525512695, "global_step": 151333, "epoch": 3603} {"train_loss": -6.806269645690918, "global_step": 151334, "epoch": 3603} {"train_loss": -6.770005226135254, "global_step": 151335, "epoch": 3603} {"train_loss": -6.770330429077148, "global_step": 151336, "epoch": 3603} {"train_loss": -6.904965400695801, "global_step": 151337, "epoch": 3603} {"train_loss": -6.760008811950684, "global_step": 151338, "epoch": 3603} {"train_loss": -6.855162620544434, "global_step": 151339, "epoch": 3603} {"train_loss": -6.861323356628418, "global_step": 151340, "epoch": 3603} {"train_loss": -6.727474212646484, "global_step": 151341, "epoch": 3603} {"train_loss": -6.893525123596191, "global_step": 151342, "epoch": 3603} {"train_loss": -6.747557640075684, "global_step": 151343, "epoch": 3603} {"train_loss": -6.935605525970459, "global_step": 151344, "epoch": 3603} {"train_loss": -6.863740921020508, "global_step": 151345, "epoch": 3603} {"train_loss": -6.752429008483887, "global_step": 151346, "epoch": 3603} {"train_loss": -6.878769874572754, "global_step": 151347, "epoch": 3603} {"train_loss": -6.781464099884033, "global_step": 151348, "epoch": 3603} {"train_loss": -6.788844108581543, "global_step": 151349, "epoch": 3603} {"train_loss": -6.815892219543457, "global_step": 151350, "epoch": 3603} {"train_loss": -6.85958194732666, "global_step": 151351, "epoch": 3603} {"train_loss": -6.833802223205566, "global_step": 151352, "epoch": 3603} {"train_loss": -6.916176795959473, "global_step": 151353, "epoch": 3603} {"train_loss": -6.8304443359375, "global_step": 151354, "epoch": 3603} {"train_loss": -6.808384895324707, "global_step": 151355, "epoch": 3603} {"train_loss": -6.738437652587891, "global_step": 151356, "epoch": 3603} {"train_loss": -6.875922203063965, "global_step": 151357, "epoch": 3603} {"train_loss": -6.833542823791504, "global_step": 151358, "epoch": 3603} {"train_loss": -6.893144607543945, "global_step": 151359, "epoch": 3603} {"train_loss": -6.810543537139893, "global_step": 151360, "epoch": 3603} {"train_loss": -6.879161357879639, "global_step": 151361, "epoch": 3603} {"train_loss": -6.8147430419921875, "global_step": 151362, "epoch": 3603} {"train_loss": -6.841836452484131, "global_step": 151363, "epoch": 3603} {"train_loss": -6.904018878936768, "global_step": 151364, "epoch": 3603} {"train_loss": -6.867673873901367, "global_step": 151365, "epoch": 3603} {"train_loss": -6.9257659912109375, "global_step": 151366, "epoch": 3603} {"train_loss": -6.839679967789423, "global_step": 151367, "epoch": 3603, "val_loss": 68380.6953125} {"train_loss": -6.963605880737305, "global_step": 151368, "epoch": 3604} {"train_loss": -6.949517726898193, "global_step": 151369, "epoch": 3604} {"train_loss": -6.830621242523193, "global_step": 151370, "epoch": 3604} {"train_loss": -6.809561252593994, "global_step": 151371, "epoch": 3604} {"train_loss": -6.82238245010376, "global_step": 151372, "epoch": 3604} {"train_loss": -6.878255367279053, "global_step": 151373, "epoch": 3604} {"train_loss": -6.9226226806640625, "global_step": 151374, "epoch": 3604} {"train_loss": -6.8306884765625, "global_step": 151375, "epoch": 3604} {"train_loss": -6.8347320556640625, "global_step": 151376, "epoch": 3604} {"train_loss": -6.824497699737549, "global_step": 151377, "epoch": 3604} {"train_loss": -6.826493263244629, "global_step": 151378, "epoch": 3604} {"train_loss": -6.6816301345825195, "global_step": 151379, "epoch": 3604} {"train_loss": -6.79347038269043, "global_step": 151380, "epoch": 3604} {"train_loss": -6.92390775680542, "global_step": 151381, "epoch": 3604} {"train_loss": -6.903301239013672, "global_step": 151382, "epoch": 3604} {"train_loss": -6.910339832305908, "global_step": 151383, "epoch": 3604} {"train_loss": -6.921192646026611, "global_step": 151384, "epoch": 3604} {"train_loss": -6.882569313049316, "global_step": 151385, "epoch": 3604} {"train_loss": -6.7089338302612305, "global_step": 151386, "epoch": 3604} {"train_loss": -6.778696060180664, "global_step": 151387, "epoch": 3604} {"train_loss": -6.8760576248168945, "global_step": 151388, "epoch": 3604} {"train_loss": -6.848200798034668, "global_step": 151389, "epoch": 3604} {"train_loss": -6.9116058349609375, "global_step": 151390, "epoch": 3604} {"train_loss": -6.957342147827148, "global_step": 151391, "epoch": 3604} {"train_loss": -6.896128177642822, "global_step": 151392, "epoch": 3604} {"train_loss": -6.840593338012695, "global_step": 151393, "epoch": 3604} {"train_loss": -6.630331039428711, "global_step": 151394, "epoch": 3604} {"train_loss": -6.83880615234375, "global_step": 151395, "epoch": 3604} {"train_loss": -6.901400566101074, "global_step": 151396, "epoch": 3604} {"train_loss": -6.888568878173828, "global_step": 151397, "epoch": 3604} {"train_loss": -6.845823287963867, "global_step": 151398, "epoch": 3604} {"train_loss": -6.894451141357422, "global_step": 151399, "epoch": 3604} {"train_loss": -6.902606964111328, "global_step": 151400, "epoch": 3604} {"train_loss": -6.918169021606445, "global_step": 151401, "epoch": 3604} {"train_loss": -6.969301223754883, "global_step": 151402, "epoch": 3604} {"train_loss": -6.805244445800781, "global_step": 151403, "epoch": 3604} {"train_loss": -6.838249206542969, "global_step": 151404, "epoch": 3604} {"train_loss": -6.787809371948242, "global_step": 151405, "epoch": 3604} {"train_loss": -6.724409580230713, "global_step": 151406, "epoch": 3604} {"train_loss": -6.792686939239502, "global_step": 151407, "epoch": 3604} {"train_loss": -6.794702529907227, "global_step": 151408, "epoch": 3604} {"train_loss": -6.848970027196975, "global_step": 151409, "epoch": 3604, "val_loss": 68435.984375} {"train_loss": -6.666061878204346, "global_step": 151410, "epoch": 3605} {"train_loss": -6.781612396240234, "global_step": 151411, "epoch": 3605} {"train_loss": -6.692967414855957, "global_step": 151412, "epoch": 3605} {"train_loss": -6.695940017700195, "global_step": 151413, "epoch": 3605} {"train_loss": -6.709819793701172, "global_step": 151414, "epoch": 3605} {"train_loss": -6.675703048706055, "global_step": 151415, "epoch": 3605} {"train_loss": -6.6924543380737305, "global_step": 151416, "epoch": 3605} {"train_loss": -6.789358139038086, "global_step": 151417, "epoch": 3605} {"train_loss": -6.789004802703857, "global_step": 151418, "epoch": 3605} {"train_loss": -6.564027786254883, "global_step": 151419, "epoch": 3605} {"train_loss": -6.704952716827393, "global_step": 151420, "epoch": 3605} {"train_loss": -6.670751571655273, "global_step": 151421, "epoch": 3605} {"train_loss": -6.758511066436768, "global_step": 151422, "epoch": 3605} {"train_loss": -6.661561965942383, "global_step": 151423, "epoch": 3605} {"train_loss": -6.762158393859863, "global_step": 151424, "epoch": 3605} {"train_loss": -6.652766227722168, "global_step": 151425, "epoch": 3605} {"train_loss": -6.773555755615234, "global_step": 151426, "epoch": 3605} {"train_loss": -6.667451858520508, "global_step": 151427, "epoch": 3605} {"train_loss": -6.750014305114746, "global_step": 151428, "epoch": 3605} {"train_loss": -6.597113132476807, "global_step": 151429, "epoch": 3605} {"train_loss": -6.7914509773254395, "global_step": 151430, "epoch": 3605} {"train_loss": -6.737578392028809, "global_step": 151431, "epoch": 3605} {"train_loss": -6.835344314575195, "global_step": 151432, "epoch": 3605} {"train_loss": -6.710948944091797, "global_step": 151433, "epoch": 3605} {"train_loss": -6.722599029541016, "global_step": 151434, "epoch": 3605} {"train_loss": -6.773618698120117, "global_step": 151435, "epoch": 3605} {"train_loss": -6.915764331817627, "global_step": 151436, "epoch": 3605} {"train_loss": -6.752577781677246, "global_step": 151437, "epoch": 3605} {"train_loss": -6.751517295837402, "global_step": 151438, "epoch": 3605} {"train_loss": -6.726742267608643, "global_step": 151439, "epoch": 3605} {"train_loss": -6.718411445617676, "global_step": 151440, "epoch": 3605} {"train_loss": -6.807788848876953, "global_step": 151441, "epoch": 3605} {"train_loss": -6.821384429931641, "global_step": 151442, "epoch": 3605} {"train_loss": -6.819323539733887, "global_step": 151443, "epoch": 3605} {"train_loss": -6.817483901977539, "global_step": 151444, "epoch": 3605} {"train_loss": -6.74436092376709, "global_step": 151445, "epoch": 3605} {"train_loss": -6.894807815551758, "global_step": 151446, "epoch": 3605} {"train_loss": -6.66221809387207, "global_step": 151447, "epoch": 3605} {"train_loss": -6.767958641052246, "global_step": 151448, "epoch": 3605} {"train_loss": -6.628767490386963, "global_step": 151449, "epoch": 3605} {"train_loss": -6.823390960693359, "global_step": 151450, "epoch": 3605} {"train_loss": -6.738427400588989, "global_step": 151451, "epoch": 3605, "val_loss": 68546.03125} {"train_loss": -6.852787494659424, "global_step": 151452, "epoch": 3606} {"train_loss": -6.625223636627197, "global_step": 151453, "epoch": 3606} {"train_loss": -6.790186882019043, "global_step": 151454, "epoch": 3606} {"train_loss": -6.682604789733887, "global_step": 151455, "epoch": 3606} {"train_loss": -6.834231376647949, "global_step": 151456, "epoch": 3606} {"train_loss": -6.787886619567871, "global_step": 151457, "epoch": 3606} {"train_loss": -6.784299373626709, "global_step": 151458, "epoch": 3606} {"train_loss": -6.799215316772461, "global_step": 151459, "epoch": 3606} {"train_loss": -6.790154457092285, "global_step": 151460, "epoch": 3606} {"train_loss": -6.752457141876221, "global_step": 151461, "epoch": 3606} {"train_loss": -6.8633713722229, "global_step": 151462, "epoch": 3606} {"train_loss": -6.664223670959473, "global_step": 151463, "epoch": 3606} {"train_loss": -6.884342670440674, "global_step": 151464, "epoch": 3606} {"train_loss": -6.864681243896484, "global_step": 151465, "epoch": 3606} {"train_loss": -6.767371654510498, "global_step": 151466, "epoch": 3606} {"train_loss": -6.796659469604492, "global_step": 151467, "epoch": 3606} {"train_loss": -6.8054070472717285, "global_step": 151468, "epoch": 3606} {"train_loss": -6.6818623542785645, "global_step": 151469, "epoch": 3606} {"train_loss": -6.7175140380859375, "global_step": 151470, "epoch": 3606} {"train_loss": -6.79088830947876, "global_step": 151471, "epoch": 3606} {"train_loss": -6.743314266204834, "global_step": 151472, "epoch": 3606} {"train_loss": -6.774651527404785, "global_step": 151473, "epoch": 3606} {"train_loss": -6.733144760131836, "global_step": 151474, "epoch": 3606} {"train_loss": -6.8581156730651855, "global_step": 151475, "epoch": 3606} {"train_loss": -6.750267505645752, "global_step": 151476, "epoch": 3606} {"train_loss": -6.809422016143799, "global_step": 151477, "epoch": 3606} {"train_loss": -6.758413314819336, "global_step": 151478, "epoch": 3606} {"train_loss": -6.746750831604004, "global_step": 151479, "epoch": 3606} {"train_loss": -6.81173849105835, "global_step": 151480, "epoch": 3606} {"train_loss": -6.7696685791015625, "global_step": 151481, "epoch": 3606} {"train_loss": -6.775291919708252, "global_step": 151482, "epoch": 3606} {"train_loss": -6.678687572479248, "global_step": 151483, "epoch": 3606} {"train_loss": -6.721370220184326, "global_step": 151484, "epoch": 3606} {"train_loss": -6.738381862640381, "global_step": 151485, "epoch": 3606} {"train_loss": -6.712587356567383, "global_step": 151486, "epoch": 3606} {"train_loss": -6.728937149047852, "global_step": 151487, "epoch": 3606} {"train_loss": -6.895819664001465, "global_step": 151488, "epoch": 3606} {"train_loss": -6.784889221191406, "global_step": 151489, "epoch": 3606} {"train_loss": -6.800705432891846, "global_step": 151490, "epoch": 3606} {"train_loss": -6.77714729309082, "global_step": 151491, "epoch": 3606} {"train_loss": -6.773294925689697, "global_step": 151492, "epoch": 3606} {"train_loss": -6.772564922060285, "global_step": 151493, "epoch": 3606, "val_loss": 68365.3515625} {"train_loss": -6.786145210266113, "global_step": 151494, "epoch": 3607} {"train_loss": -6.819945812225342, "global_step": 151495, "epoch": 3607} {"train_loss": -6.831636428833008, "global_step": 151496, "epoch": 3607} {"train_loss": -6.915270805358887, "global_step": 151497, "epoch": 3607} {"train_loss": -6.874533176422119, "global_step": 151498, "epoch": 3607} {"train_loss": -6.90906286239624, "global_step": 151499, "epoch": 3607} {"train_loss": -6.8386030197143555, "global_step": 151500, "epoch": 3607} {"train_loss": -6.818489074707031, "global_step": 151501, "epoch": 3607} {"train_loss": -6.7982587814331055, "global_step": 151502, "epoch": 3607} {"train_loss": -6.815361499786377, "global_step": 151503, "epoch": 3607} {"train_loss": -6.932372093200684, "global_step": 151504, "epoch": 3607} {"train_loss": -6.816841125488281, "global_step": 151505, "epoch": 3607} {"train_loss": -6.889522552490234, "global_step": 151506, "epoch": 3607} {"train_loss": -6.882611274719238, "global_step": 151507, "epoch": 3607} {"train_loss": -6.867770195007324, "global_step": 151508, "epoch": 3607} {"train_loss": -7.000484943389893, "global_step": 151509, "epoch": 3607} {"train_loss": -6.80690336227417, "global_step": 151510, "epoch": 3607} {"train_loss": -6.911430358886719, "global_step": 151511, "epoch": 3607} {"train_loss": -6.86849308013916, "global_step": 151512, "epoch": 3607} {"train_loss": -6.78968620300293, "global_step": 151513, "epoch": 3607} {"train_loss": -6.800742149353027, "global_step": 151514, "epoch": 3607} {"train_loss": -6.908730506896973, "global_step": 151515, "epoch": 3607} {"train_loss": -6.838615417480469, "global_step": 151516, "epoch": 3607} {"train_loss": -6.856045722961426, "global_step": 151517, "epoch": 3607} {"train_loss": -6.845484733581543, "global_step": 151518, "epoch": 3607} {"train_loss": -6.8054094314575195, "global_step": 151519, "epoch": 3607} {"train_loss": -6.918909072875977, "global_step": 151520, "epoch": 3607} {"train_loss": -6.753643035888672, "global_step": 151521, "epoch": 3607} {"train_loss": -6.933651924133301, "global_step": 151522, "epoch": 3607} {"train_loss": -6.977685451507568, "global_step": 151523, "epoch": 3607} {"train_loss": -6.771024703979492, "global_step": 151524, "epoch": 3607} {"train_loss": -6.786322593688965, "global_step": 151525, "epoch": 3607} {"train_loss": -6.805273056030273, "global_step": 151526, "epoch": 3607} {"train_loss": -6.908791542053223, "global_step": 151527, "epoch": 3607} {"train_loss": -6.876898765563965, "global_step": 151528, "epoch": 3607} {"train_loss": -6.821262836456299, "global_step": 151529, "epoch": 3607} {"train_loss": -7.03930139541626, "global_step": 151530, "epoch": 3607} {"train_loss": -6.82426643371582, "global_step": 151531, "epoch": 3607} {"train_loss": -6.818055629730225, "global_step": 151532, "epoch": 3607} {"train_loss": -6.866413116455078, "global_step": 151533, "epoch": 3607} {"train_loss": -6.792273998260498, "global_step": 151534, "epoch": 3607} {"train_loss": -6.856086923962548, "global_step": 151535, "epoch": 3607, "val_loss": 68290.3125} {"train_loss": -6.847543239593506, "global_step": 151536, "epoch": 3608} {"train_loss": -6.939894199371338, "global_step": 151537, "epoch": 3608} {"train_loss": -6.924311637878418, "global_step": 151538, "epoch": 3608} {"train_loss": -6.778680801391602, "global_step": 151539, "epoch": 3608} {"train_loss": -6.848315238952637, "global_step": 151540, "epoch": 3608} {"train_loss": -6.940707683563232, "global_step": 151541, "epoch": 3608} {"train_loss": -7.0283589363098145, "global_step": 151542, "epoch": 3608} {"train_loss": -6.765538215637207, "global_step": 151543, "epoch": 3608} {"train_loss": -7.015506267547607, "global_step": 151544, "epoch": 3608} {"train_loss": -7.007525444030762, "global_step": 151545, "epoch": 3608} {"train_loss": -6.798372268676758, "global_step": 151546, "epoch": 3608} {"train_loss": -6.841277599334717, "global_step": 151547, "epoch": 3608} {"train_loss": -6.86337423324585, "global_step": 151548, "epoch": 3608} {"train_loss": -6.7985005378723145, "global_step": 151549, "epoch": 3608} {"train_loss": -6.9112677574157715, "global_step": 151550, "epoch": 3608} {"train_loss": -6.872917175292969, "global_step": 151551, "epoch": 3608} {"train_loss": -6.780123710632324, "global_step": 151552, "epoch": 3608} {"train_loss": -6.797268867492676, "global_step": 151553, "epoch": 3608} {"train_loss": -6.861591339111328, "global_step": 151554, "epoch": 3608} {"train_loss": -6.922441482543945, "global_step": 151555, "epoch": 3608} {"train_loss": -6.850896835327148, "global_step": 151556, "epoch": 3608} {"train_loss": -6.780385971069336, "global_step": 151557, "epoch": 3608} {"train_loss": -6.820284843444824, "global_step": 151558, "epoch": 3608} {"train_loss": -6.902324676513672, "global_step": 151559, "epoch": 3608} {"train_loss": -6.7612528800964355, "global_step": 151560, "epoch": 3608} {"train_loss": -6.764409065246582, "global_step": 151561, "epoch": 3608} {"train_loss": -6.83438777923584, "global_step": 151562, "epoch": 3608} {"train_loss": -6.881750583648682, "global_step": 151563, "epoch": 3608} {"train_loss": -6.789063930511475, "global_step": 151564, "epoch": 3608} {"train_loss": -6.83930778503418, "global_step": 151565, "epoch": 3608} {"train_loss": -6.717950344085693, "global_step": 151566, "epoch": 3608} {"train_loss": -6.822473526000977, "global_step": 151567, "epoch": 3608} {"train_loss": -6.757711410522461, "global_step": 151568, "epoch": 3608} {"train_loss": -6.907585620880127, "global_step": 151569, "epoch": 3608} {"train_loss": -6.878507614135742, "global_step": 151570, "epoch": 3608} {"train_loss": -6.748756408691406, "global_step": 151571, "epoch": 3608} {"train_loss": -6.8333353996276855, "global_step": 151572, "epoch": 3608} {"train_loss": -6.807850360870361, "global_step": 151573, "epoch": 3608} {"train_loss": -6.76359748840332, "global_step": 151574, "epoch": 3608} {"train_loss": -6.907090187072754, "global_step": 151575, "epoch": 3608} {"train_loss": -6.988903522491455, "global_step": 151576, "epoch": 3608} {"train_loss": -6.850942202976772, "global_step": 151577, "epoch": 3608, "val_loss": 68497.1328125} {"train_loss": -6.799928665161133, "global_step": 151578, "epoch": 3609} {"train_loss": -6.926182270050049, "global_step": 151579, "epoch": 3609} {"train_loss": -6.806178092956543, "global_step": 151580, "epoch": 3609} {"train_loss": -6.782570838928223, "global_step": 151581, "epoch": 3609} {"train_loss": -6.894712924957275, "global_step": 151582, "epoch": 3609} {"train_loss": -6.877066612243652, "global_step": 151583, "epoch": 3609} {"train_loss": -6.855731010437012, "global_step": 151584, "epoch": 3609} {"train_loss": -6.842001914978027, "global_step": 151585, "epoch": 3609} {"train_loss": -6.906853675842285, "global_step": 151586, "epoch": 3609} {"train_loss": -6.871140480041504, "global_step": 151587, "epoch": 3609} {"train_loss": -7.0346150398254395, "global_step": 151588, "epoch": 3609} {"train_loss": -6.804665565490723, "global_step": 151589, "epoch": 3609} {"train_loss": -6.814296245574951, "global_step": 151590, "epoch": 3609} {"train_loss": -6.889046669006348, "global_step": 151591, "epoch": 3609} {"train_loss": -6.979994297027588, "global_step": 151592, "epoch": 3609} {"train_loss": -6.755439758300781, "global_step": 151593, "epoch": 3609} {"train_loss": -6.912644863128662, "global_step": 151594, "epoch": 3609} {"train_loss": -6.823971748352051, "global_step": 151595, "epoch": 3609} {"train_loss": -6.819853782653809, "global_step": 151596, "epoch": 3609} {"train_loss": -6.859532833099365, "global_step": 151597, "epoch": 3609} {"train_loss": -6.827066421508789, "global_step": 151598, "epoch": 3609} {"train_loss": -6.857639312744141, "global_step": 151599, "epoch": 3609} {"train_loss": -6.847414970397949, "global_step": 151600, "epoch": 3609} {"train_loss": -6.885738849639893, "global_step": 151601, "epoch": 3609} {"train_loss": -6.8478827476501465, "global_step": 151602, "epoch": 3609} {"train_loss": -6.762125015258789, "global_step": 151603, "epoch": 3609} {"train_loss": -6.856922149658203, "global_step": 151604, "epoch": 3609} {"train_loss": -6.872706413269043, "global_step": 151605, "epoch": 3609} {"train_loss": -6.831452369689941, "global_step": 151606, "epoch": 3609} {"train_loss": -6.784567356109619, "global_step": 151607, "epoch": 3609} {"train_loss": -6.737082004547119, "global_step": 151608, "epoch": 3609} {"train_loss": -6.744931697845459, "global_step": 151609, "epoch": 3609} {"train_loss": -6.845137596130371, "global_step": 151610, "epoch": 3609} {"train_loss": -6.849161148071289, "global_step": 151611, "epoch": 3609} {"train_loss": -6.756892681121826, "global_step": 151612, "epoch": 3609} {"train_loss": -6.81895637512207, "global_step": 151613, "epoch": 3609} {"train_loss": -6.789455413818359, "global_step": 151614, "epoch": 3609} {"train_loss": -6.802029132843018, "global_step": 151615, "epoch": 3609} {"train_loss": -6.923126220703125, "global_step": 151616, "epoch": 3609} {"train_loss": -6.739264965057373, "global_step": 151617, "epoch": 3609} {"train_loss": -6.819754600524902, "global_step": 151618, "epoch": 3609} {"train_loss": -6.840201877412342, "global_step": 151619, "epoch": 3609, "val_loss": 68452.9296875} {"train_loss": -6.801164627075195, "global_step": 151620, "epoch": 3610} {"train_loss": -6.687735557556152, "global_step": 151621, "epoch": 3610} {"train_loss": -7.043569564819336, "global_step": 151622, "epoch": 3610} {"train_loss": -6.794932842254639, "global_step": 151623, "epoch": 3610} {"train_loss": -6.675139427185059, "global_step": 151624, "epoch": 3610} {"train_loss": -6.790897369384766, "global_step": 151625, "epoch": 3610} {"train_loss": -6.8229522705078125, "global_step": 151626, "epoch": 3610} {"train_loss": -6.778755187988281, "global_step": 151627, "epoch": 3610} {"train_loss": -6.812483787536621, "global_step": 151628, "epoch": 3610} {"train_loss": -6.879917144775391, "global_step": 151629, "epoch": 3610} {"train_loss": -6.762068748474121, "global_step": 151630, "epoch": 3610} {"train_loss": -6.764164924621582, "global_step": 151631, "epoch": 3610} {"train_loss": -6.798078536987305, "global_step": 151632, "epoch": 3610} {"train_loss": -6.709596633911133, "global_step": 151633, "epoch": 3610} {"train_loss": -6.740597724914551, "global_step": 151634, "epoch": 3610} {"train_loss": -6.777153015136719, "global_step": 151635, "epoch": 3610} {"train_loss": -6.7745208740234375, "global_step": 151636, "epoch": 3610} {"train_loss": -6.71385383605957, "global_step": 151637, "epoch": 3610} {"train_loss": -6.647165298461914, "global_step": 151638, "epoch": 3610} {"train_loss": -6.75474739074707, "global_step": 151639, "epoch": 3610} {"train_loss": -6.881498336791992, "global_step": 151640, "epoch": 3610} {"train_loss": -6.808297157287598, "global_step": 151641, "epoch": 3610} {"train_loss": -6.82928466796875, "global_step": 151642, "epoch": 3610} {"train_loss": -6.880515098571777, "global_step": 151643, "epoch": 3610} {"train_loss": -6.777983665466309, "global_step": 151644, "epoch": 3610} {"train_loss": -6.869001865386963, "global_step": 151645, "epoch": 3610} {"train_loss": -6.78847599029541, "global_step": 151646, "epoch": 3610} {"train_loss": -6.827178955078125, "global_step": 151647, "epoch": 3610} {"train_loss": -6.84785795211792, "global_step": 151648, "epoch": 3610} {"train_loss": -6.678417205810547, "global_step": 151649, "epoch": 3610} {"train_loss": -6.793802261352539, "global_step": 151650, "epoch": 3610} {"train_loss": -6.813871383666992, "global_step": 151651, "epoch": 3610} {"train_loss": -6.884739875793457, "global_step": 151652, "epoch": 3610} {"train_loss": -6.704258441925049, "global_step": 151653, "epoch": 3610} {"train_loss": -6.677671432495117, "global_step": 151654, "epoch": 3610} {"train_loss": -6.776504039764404, "global_step": 151655, "epoch": 3610} {"train_loss": -6.6629438400268555, "global_step": 151656, "epoch": 3610} {"train_loss": -6.75044059753418, "global_step": 151657, "epoch": 3610} {"train_loss": -6.732285499572754, "global_step": 151658, "epoch": 3610} {"train_loss": -6.636875152587891, "global_step": 151659, "epoch": 3610} {"train_loss": -6.832494735717773, "global_step": 151660, "epoch": 3610} {"train_loss": -6.780228387741816, "global_step": 151661, "epoch": 3610, "val_loss": 68511.9140625} {"train_loss": -6.933823585510254, "global_step": 151662, "epoch": 3611} {"train_loss": -6.7614569664001465, "global_step": 151663, "epoch": 3611} {"train_loss": -6.8182373046875, "global_step": 151664, "epoch": 3611} {"train_loss": -6.876259803771973, "global_step": 151665, "epoch": 3611} {"train_loss": -6.743629455566406, "global_step": 151666, "epoch": 3611} {"train_loss": -6.691067695617676, "global_step": 151667, "epoch": 3611} {"train_loss": -6.771083354949951, "global_step": 151668, "epoch": 3611} {"train_loss": -6.710192680358887, "global_step": 151669, "epoch": 3611} {"train_loss": -6.7013773918151855, "global_step": 151670, "epoch": 3611} {"train_loss": -6.822457313537598, "global_step": 151671, "epoch": 3611} {"train_loss": -6.740670204162598, "global_step": 151672, "epoch": 3611} {"train_loss": -6.767581939697266, "global_step": 151673, "epoch": 3611} {"train_loss": -6.76253604888916, "global_step": 151674, "epoch": 3611} {"train_loss": -6.746100425720215, "global_step": 151675, "epoch": 3611} {"train_loss": -6.803810119628906, "global_step": 151676, "epoch": 3611} {"train_loss": -6.716273307800293, "global_step": 151677, "epoch": 3611} {"train_loss": -6.787551403045654, "global_step": 151678, "epoch": 3611} {"train_loss": -6.920562744140625, "global_step": 151679, "epoch": 3611} {"train_loss": -6.833599090576172, "global_step": 151680, "epoch": 3611} {"train_loss": -6.7468695640563965, "global_step": 151681, "epoch": 3611} {"train_loss": -6.793497562408447, "global_step": 151682, "epoch": 3611} {"train_loss": -6.762609004974365, "global_step": 151683, "epoch": 3611} {"train_loss": -6.82464599609375, "global_step": 151684, "epoch": 3611} {"train_loss": -6.814004898071289, "global_step": 151685, "epoch": 3611} {"train_loss": -6.883295059204102, "global_step": 151686, "epoch": 3611} {"train_loss": -6.773848533630371, "global_step": 151687, "epoch": 3611} {"train_loss": -6.8688836097717285, "global_step": 151688, "epoch": 3611} {"train_loss": -6.790146350860596, "global_step": 151689, "epoch": 3611} {"train_loss": -6.816187858581543, "global_step": 151690, "epoch": 3611} {"train_loss": -6.92427921295166, "global_step": 151691, "epoch": 3611} {"train_loss": -6.782186031341553, "global_step": 151692, "epoch": 3611} {"train_loss": -6.93968391418457, "global_step": 151693, "epoch": 3611} {"train_loss": -6.840778350830078, "global_step": 151694, "epoch": 3611} {"train_loss": -6.878385066986084, "global_step": 151695, "epoch": 3611} {"train_loss": -6.77769136428833, "global_step": 151696, "epoch": 3611} {"train_loss": -6.847033500671387, "global_step": 151697, "epoch": 3611} {"train_loss": -6.786133766174316, "global_step": 151698, "epoch": 3611} {"train_loss": -6.9046759605407715, "global_step": 151699, "epoch": 3611} {"train_loss": -6.772176742553711, "global_step": 151700, "epoch": 3611} {"train_loss": -6.765963554382324, "global_step": 151701, "epoch": 3611} {"train_loss": -6.920496940612793, "global_step": 151702, "epoch": 3611} {"train_loss": -6.8074556191762285, "global_step": 151703, "epoch": 3611, "val_loss": 68496.96875} {"train_loss": -6.914371967315674, "global_step": 151704, "epoch": 3612} {"train_loss": -6.903307914733887, "global_step": 151705, "epoch": 3612} {"train_loss": -6.838429927825928, "global_step": 151706, "epoch": 3612} {"train_loss": -6.908778190612793, "global_step": 151707, "epoch": 3612} {"train_loss": -6.827762126922607, "global_step": 151708, "epoch": 3612} {"train_loss": -6.924915313720703, "global_step": 151709, "epoch": 3612} {"train_loss": -6.966360092163086, "global_step": 151710, "epoch": 3612} {"train_loss": -6.807572364807129, "global_step": 151711, "epoch": 3612} {"train_loss": -6.891902923583984, "global_step": 151712, "epoch": 3612} {"train_loss": -6.905278205871582, "global_step": 151713, "epoch": 3612} {"train_loss": -6.882940292358398, "global_step": 151714, "epoch": 3612} {"train_loss": -6.823554515838623, "global_step": 151715, "epoch": 3612} {"train_loss": -6.798685073852539, "global_step": 151716, "epoch": 3612} {"train_loss": -6.822657585144043, "global_step": 151717, "epoch": 3612} {"train_loss": -6.873509407043457, "global_step": 151718, "epoch": 3612} {"train_loss": -6.804982662200928, "global_step": 151719, "epoch": 3612} {"train_loss": -6.859260559082031, "global_step": 151720, "epoch": 3612} {"train_loss": -6.788069248199463, "global_step": 151721, "epoch": 3612} {"train_loss": -6.721208572387695, "global_step": 151722, "epoch": 3612} {"train_loss": -6.757835388183594, "global_step": 151723, "epoch": 3612} {"train_loss": -6.742758274078369, "global_step": 151724, "epoch": 3612} {"train_loss": -6.861654281616211, "global_step": 151725, "epoch": 3612} {"train_loss": -6.780179977416992, "global_step": 151726, "epoch": 3612} {"train_loss": -6.823204040527344, "global_step": 151727, "epoch": 3612} {"train_loss": -6.806330680847168, "global_step": 151728, "epoch": 3612} {"train_loss": -6.817570686340332, "global_step": 151729, "epoch": 3612} {"train_loss": -6.725336074829102, "global_step": 151730, "epoch": 3612} {"train_loss": -6.708951950073242, "global_step": 151731, "epoch": 3612} {"train_loss": -6.804634094238281, "global_step": 151732, "epoch": 3612} {"train_loss": -6.841053485870361, "global_step": 151733, "epoch": 3612} {"train_loss": -6.835677146911621, "global_step": 151734, "epoch": 3612} {"train_loss": -6.794622898101807, "global_step": 151735, "epoch": 3612} {"train_loss": -6.833868980407715, "global_step": 151736, "epoch": 3612} {"train_loss": -6.797247409820557, "global_step": 151737, "epoch": 3612} {"train_loss": -6.803403377532959, "global_step": 151738, "epoch": 3612} {"train_loss": -6.81250524520874, "global_step": 151739, "epoch": 3612} {"train_loss": -6.697702407836914, "global_step": 151740, "epoch": 3612} {"train_loss": -6.780577659606934, "global_step": 151741, "epoch": 3612} {"train_loss": -6.787589073181152, "global_step": 151742, "epoch": 3612} {"train_loss": -6.830362796783447, "global_step": 151743, "epoch": 3612} {"train_loss": -6.7858195304870605, "global_step": 151744, "epoch": 3612} {"train_loss": -6.820505017325992, "global_step": 151745, "epoch": 3612, "val_loss": 68406.2578125} {"train_loss": -6.828070640563965, "global_step": 151746, "epoch": 3613} {"train_loss": -6.760306358337402, "global_step": 151747, "epoch": 3613} {"train_loss": -6.77964973449707, "global_step": 151748, "epoch": 3613} {"train_loss": -6.820199012756348, "global_step": 151749, "epoch": 3613} {"train_loss": -6.759825706481934, "global_step": 151750, "epoch": 3613} {"train_loss": -6.77847146987915, "global_step": 151751, "epoch": 3613} {"train_loss": -6.912275314331055, "global_step": 151752, "epoch": 3613} {"train_loss": -6.764729976654053, "global_step": 151753, "epoch": 3613} {"train_loss": -6.711583137512207, "global_step": 151754, "epoch": 3613} {"train_loss": -6.890294551849365, "global_step": 151755, "epoch": 3613} {"train_loss": -6.7351250648498535, "global_step": 151756, "epoch": 3613} {"train_loss": -6.877669334411621, "global_step": 151757, "epoch": 3613} {"train_loss": -6.921018123626709, "global_step": 151758, "epoch": 3613} {"train_loss": -6.726475715637207, "global_step": 151759, "epoch": 3613} {"train_loss": -6.842667579650879, "global_step": 151760, "epoch": 3613} {"train_loss": -6.815642833709717, "global_step": 151761, "epoch": 3613} {"train_loss": -6.942542552947998, "global_step": 151762, "epoch": 3613} {"train_loss": -6.848834037780762, "global_step": 151763, "epoch": 3613} {"train_loss": -6.754929542541504, "global_step": 151764, "epoch": 3613} {"train_loss": -6.86380672454834, "global_step": 151765, "epoch": 3613} {"train_loss": -6.8185906410217285, "global_step": 151766, "epoch": 3613} {"train_loss": -7.040909767150879, "global_step": 151767, "epoch": 3613} {"train_loss": -6.832008361816406, "global_step": 151768, "epoch": 3613} {"train_loss": -6.832143783569336, "global_step": 151769, "epoch": 3613} {"train_loss": -6.82161283493042, "global_step": 151770, "epoch": 3613} {"train_loss": -6.783537864685059, "global_step": 151771, "epoch": 3613} {"train_loss": -6.825344085693359, "global_step": 151772, "epoch": 3613} {"train_loss": -6.884349822998047, "global_step": 151773, "epoch": 3613} {"train_loss": -6.894329071044922, "global_step": 151774, "epoch": 3613} {"train_loss": -6.763625144958496, "global_step": 151775, "epoch": 3613} {"train_loss": -6.937774658203125, "global_step": 151776, "epoch": 3613} {"train_loss": -6.821939468383789, "global_step": 151777, "epoch": 3613} {"train_loss": -6.820993423461914, "global_step": 151778, "epoch": 3613} {"train_loss": -6.9054274559021, "global_step": 151779, "epoch": 3613} {"train_loss": -6.852864742279053, "global_step": 151780, "epoch": 3613} {"train_loss": -6.832802772521973, "global_step": 151781, "epoch": 3613} {"train_loss": -6.885012626647949, "global_step": 151782, "epoch": 3613} {"train_loss": -6.881710052490234, "global_step": 151783, "epoch": 3613} {"train_loss": -6.8189873695373535, "global_step": 151784, "epoch": 3613} {"train_loss": -6.816619873046875, "global_step": 151785, "epoch": 3613} {"train_loss": -6.869967460632324, "global_step": 151786, "epoch": 3613} {"train_loss": -6.83520675840832, "global_step": 151787, "epoch": 3613, "val_loss": 68395.9140625} {"train_loss": -6.877101898193359, "global_step": 151788, "epoch": 3614} {"train_loss": -6.911603927612305, "global_step": 151789, "epoch": 3614} {"train_loss": -6.854143142700195, "global_step": 151790, "epoch": 3614} {"train_loss": -6.96587610244751, "global_step": 151791, "epoch": 3614} {"train_loss": -6.844865798950195, "global_step": 151792, "epoch": 3614} {"train_loss": -6.889578819274902, "global_step": 151793, "epoch": 3614} {"train_loss": -6.918401718139648, "global_step": 151794, "epoch": 3614} {"train_loss": -6.883629322052002, "global_step": 151795, "epoch": 3614} {"train_loss": -6.723928451538086, "global_step": 151796, "epoch": 3614} {"train_loss": -6.805398941040039, "global_step": 151797, "epoch": 3614} {"train_loss": -6.8967790603637695, "global_step": 151798, "epoch": 3614} {"train_loss": -6.708939552307129, "global_step": 151799, "epoch": 3614} {"train_loss": -6.805373191833496, "global_step": 151800, "epoch": 3614} {"train_loss": -6.928136825561523, "global_step": 151801, "epoch": 3614} {"train_loss": -6.726390361785889, "global_step": 151802, "epoch": 3614} {"train_loss": -6.7469587326049805, "global_step": 151803, "epoch": 3614} {"train_loss": -6.8165602684021, "global_step": 151804, "epoch": 3614} {"train_loss": -6.801743507385254, "global_step": 151805, "epoch": 3614} {"train_loss": -6.789405822753906, "global_step": 151806, "epoch": 3614} {"train_loss": -6.866767883300781, "global_step": 151807, "epoch": 3614} {"train_loss": -6.841512680053711, "global_step": 151808, "epoch": 3614} {"train_loss": -6.838330268859863, "global_step": 151809, "epoch": 3614} {"train_loss": -6.693350791931152, "global_step": 151810, "epoch": 3614} {"train_loss": -6.8304219245910645, "global_step": 151811, "epoch": 3614} {"train_loss": -6.744183540344238, "global_step": 151812, "epoch": 3614} {"train_loss": -6.722198009490967, "global_step": 151813, "epoch": 3614} {"train_loss": -6.8849711418151855, "global_step": 151814, "epoch": 3614} {"train_loss": -6.7874555587768555, "global_step": 151815, "epoch": 3614} {"train_loss": -6.775449752807617, "global_step": 151816, "epoch": 3614} {"train_loss": -6.823822498321533, "global_step": 151817, "epoch": 3614} {"train_loss": -6.7601823806762695, "global_step": 151818, "epoch": 3614} {"train_loss": -6.824383735656738, "global_step": 151819, "epoch": 3614} {"train_loss": -6.831742763519287, "global_step": 151820, "epoch": 3614} {"train_loss": -6.729638576507568, "global_step": 151821, "epoch": 3614} {"train_loss": -6.687479496002197, "global_step": 151822, "epoch": 3614} {"train_loss": -6.797628879547119, "global_step": 151823, "epoch": 3614} {"train_loss": -6.8159685134887695, "global_step": 151824, "epoch": 3614} {"train_loss": -6.894078254699707, "global_step": 151825, "epoch": 3614} {"train_loss": -6.787328243255615, "global_step": 151826, "epoch": 3614} {"train_loss": -6.847808837890625, "global_step": 151827, "epoch": 3614} {"train_loss": -6.894216537475586, "global_step": 151828, "epoch": 3614} {"train_loss": -6.81885568300883, "global_step": 151829, "epoch": 3614, "val_loss": 68333.2421875} {"train_loss": -6.868152618408203, "global_step": 151830, "epoch": 3615} {"train_loss": -6.915980815887451, "global_step": 151831, "epoch": 3615} {"train_loss": -6.841296195983887, "global_step": 151832, "epoch": 3615} {"train_loss": -6.925478935241699, "global_step": 151833, "epoch": 3615} {"train_loss": -6.831911087036133, "global_step": 151834, "epoch": 3615} {"train_loss": -6.726367950439453, "global_step": 151835, "epoch": 3615} {"train_loss": -6.879084587097168, "global_step": 151836, "epoch": 3615} {"train_loss": -6.883216381072998, "global_step": 151837, "epoch": 3615} {"train_loss": -6.825159549713135, "global_step": 151838, "epoch": 3615} {"train_loss": -6.8026018142700195, "global_step": 151839, "epoch": 3615} {"train_loss": -6.8285369873046875, "global_step": 151840, "epoch": 3615} {"train_loss": -6.795086860656738, "global_step": 151841, "epoch": 3615} {"train_loss": -6.835044860839844, "global_step": 151842, "epoch": 3615} {"train_loss": -6.749884605407715, "global_step": 151843, "epoch": 3615} {"train_loss": -6.798455238342285, "global_step": 151844, "epoch": 3615} {"train_loss": -6.800332069396973, "global_step": 151845, "epoch": 3615} {"train_loss": -6.742519855499268, "global_step": 151846, "epoch": 3615} {"train_loss": -6.727298259735107, "global_step": 151847, "epoch": 3615} {"train_loss": -6.784399032592773, "global_step": 151848, "epoch": 3615} {"train_loss": -6.887456893920898, "global_step": 151849, "epoch": 3615} {"train_loss": -6.831485748291016, "global_step": 151850, "epoch": 3615} {"train_loss": -6.8677496910095215, "global_step": 151851, "epoch": 3615} {"train_loss": -6.73746919631958, "global_step": 151852, "epoch": 3615} {"train_loss": -6.913552284240723, "global_step": 151853, "epoch": 3615} {"train_loss": -6.863706588745117, "global_step": 151854, "epoch": 3615} {"train_loss": -6.903453826904297, "global_step": 151855, "epoch": 3615} {"train_loss": -6.962850570678711, "global_step": 151856, "epoch": 3615} {"train_loss": -6.816340446472168, "global_step": 151857, "epoch": 3615} {"train_loss": -6.864439487457275, "global_step": 151858, "epoch": 3615} {"train_loss": -6.954866886138916, "global_step": 151859, "epoch": 3615} {"train_loss": -6.9569621086120605, "global_step": 151860, "epoch": 3615} {"train_loss": -6.875001430511475, "global_step": 151861, "epoch": 3615} {"train_loss": -6.970904350280762, "global_step": 151862, "epoch": 3615} {"train_loss": -6.838047504425049, "global_step": 151863, "epoch": 3615} {"train_loss": -6.844245910644531, "global_step": 151864, "epoch": 3615} {"train_loss": -6.877050399780273, "global_step": 151865, "epoch": 3615} {"train_loss": -6.922158241271973, "global_step": 151866, "epoch": 3615} {"train_loss": -6.7481889724731445, "global_step": 151867, "epoch": 3615} {"train_loss": -6.848023414611816, "global_step": 151868, "epoch": 3615} {"train_loss": -6.8923869132995605, "global_step": 151869, "epoch": 3615} {"train_loss": -6.795817852020264, "global_step": 151870, "epoch": 3615} {"train_loss": -6.846419720422654, "global_step": 151871, "epoch": 3615, "val_loss": 68557.6015625} {"train_loss": -6.951570510864258, "global_step": 151872, "epoch": 3616} {"train_loss": -6.862067699432373, "global_step": 151873, "epoch": 3616} {"train_loss": -6.967659950256348, "global_step": 151874, "epoch": 3616} {"train_loss": -6.753721714019775, "global_step": 151875, "epoch": 3616} {"train_loss": -6.805238246917725, "global_step": 151876, "epoch": 3616} {"train_loss": -7.003983497619629, "global_step": 151877, "epoch": 3616} {"train_loss": -6.828848361968994, "global_step": 151878, "epoch": 3616} {"train_loss": -6.842318534851074, "global_step": 151879, "epoch": 3616} {"train_loss": -6.855023384094238, "global_step": 151880, "epoch": 3616} {"train_loss": -6.8677473068237305, "global_step": 151881, "epoch": 3616} {"train_loss": -6.885305404663086, "global_step": 151882, "epoch": 3616} {"train_loss": -6.790407180786133, "global_step": 151883, "epoch": 3616} {"train_loss": -6.8089094161987305, "global_step": 151884, "epoch": 3616} {"train_loss": -6.828327178955078, "global_step": 151885, "epoch": 3616} {"train_loss": -6.8269267082214355, "global_step": 151886, "epoch": 3616} {"train_loss": -6.768050670623779, "global_step": 151887, "epoch": 3616} {"train_loss": -6.872251510620117, "global_step": 151888, "epoch": 3616} {"train_loss": -6.606897830963135, "global_step": 151889, "epoch": 3616} {"train_loss": -6.645927429199219, "global_step": 151890, "epoch": 3616} {"train_loss": -6.845491886138916, "global_step": 151891, "epoch": 3616} {"train_loss": -6.676070690155029, "global_step": 151892, "epoch": 3616} {"train_loss": -6.836827278137207, "global_step": 151893, "epoch": 3616} {"train_loss": -6.8270416259765625, "global_step": 151894, "epoch": 3616} {"train_loss": -6.906466960906982, "global_step": 151895, "epoch": 3616} {"train_loss": -6.739536762237549, "global_step": 151896, "epoch": 3616} {"train_loss": -6.833376407623291, "global_step": 151897, "epoch": 3616} {"train_loss": -6.840221881866455, "global_step": 151898, "epoch": 3616} {"train_loss": -6.815206527709961, "global_step": 151899, "epoch": 3616} {"train_loss": -6.834437370300293, "global_step": 151900, "epoch": 3616} {"train_loss": -6.741111755371094, "global_step": 151901, "epoch": 3616} {"train_loss": -6.756371021270752, "global_step": 151902, "epoch": 3616} {"train_loss": -6.728644371032715, "global_step": 151903, "epoch": 3616} {"train_loss": -6.870209217071533, "global_step": 151904, "epoch": 3616} {"train_loss": -6.854092597961426, "global_step": 151905, "epoch": 3616} {"train_loss": -6.707293510437012, "global_step": 151906, "epoch": 3616} {"train_loss": -6.861857891082764, "global_step": 151907, "epoch": 3616} {"train_loss": -6.821518421173096, "global_step": 151908, "epoch": 3616} {"train_loss": -6.845911026000977, "global_step": 151909, "epoch": 3616} {"train_loss": -6.928502082824707, "global_step": 151910, "epoch": 3616} {"train_loss": -6.802261829376221, "global_step": 151911, "epoch": 3616} {"train_loss": -6.907364845275879, "global_step": 151912, "epoch": 3616} {"train_loss": -6.825520481382098, "global_step": 151913, "epoch": 3616, "val_loss": 68478.8984375} {"train_loss": -6.850662708282471, "global_step": 151914, "epoch": 3617} {"train_loss": -6.81912899017334, "global_step": 151915, "epoch": 3617} {"train_loss": -6.8383402824401855, "global_step": 151916, "epoch": 3617} {"train_loss": -6.797979831695557, "global_step": 151917, "epoch": 3617} {"train_loss": -6.887678623199463, "global_step": 151918, "epoch": 3617} {"train_loss": -6.712460994720459, "global_step": 151919, "epoch": 3617} {"train_loss": -6.835970401763916, "global_step": 151920, "epoch": 3617} {"train_loss": -6.833094596862793, "global_step": 151921, "epoch": 3617} {"train_loss": -6.823834419250488, "global_step": 151922, "epoch": 3617} {"train_loss": -6.896235466003418, "global_step": 151923, "epoch": 3617} {"train_loss": -6.822328567504883, "global_step": 151924, "epoch": 3617} {"train_loss": -6.908517837524414, "global_step": 151925, "epoch": 3617} {"train_loss": -6.954018592834473, "global_step": 151926, "epoch": 3617} {"train_loss": -6.960050582885742, "global_step": 151927, "epoch": 3617} {"train_loss": -6.8115925788879395, "global_step": 151928, "epoch": 3617} {"train_loss": -6.898829460144043, "global_step": 151929, "epoch": 3617} {"train_loss": -6.830079078674316, "global_step": 151930, "epoch": 3617} {"train_loss": -6.8500261306762695, "global_step": 151931, "epoch": 3617} {"train_loss": -6.844316005706787, "global_step": 151932, "epoch": 3617} {"train_loss": -6.737053871154785, "global_step": 151933, "epoch": 3617} {"train_loss": -6.767241477966309, "global_step": 151934, "epoch": 3617} {"train_loss": -6.79775333404541, "global_step": 151935, "epoch": 3617} {"train_loss": -6.799622535705566, "global_step": 151936, "epoch": 3617} {"train_loss": -6.82058048248291, "global_step": 151937, "epoch": 3617} {"train_loss": -6.821326732635498, "global_step": 151938, "epoch": 3617} {"train_loss": -6.891932487487793, "global_step": 151939, "epoch": 3617} {"train_loss": -6.839700698852539, "global_step": 151940, "epoch": 3617} {"train_loss": -6.848260879516602, "global_step": 151941, "epoch": 3617} {"train_loss": -6.83524227142334, "global_step": 151942, "epoch": 3617} {"train_loss": -6.753105163574219, "global_step": 151943, "epoch": 3617} {"train_loss": -6.8537702560424805, "global_step": 151944, "epoch": 3617} {"train_loss": -6.7522125244140625, "global_step": 151945, "epoch": 3617} {"train_loss": -6.778762340545654, "global_step": 151946, "epoch": 3617} {"train_loss": -6.7706804275512695, "global_step": 151947, "epoch": 3617} {"train_loss": -6.8071746826171875, "global_step": 151948, "epoch": 3617} {"train_loss": -6.874014377593994, "global_step": 151949, "epoch": 3617} {"train_loss": -6.7463178634643555, "global_step": 151950, "epoch": 3617} {"train_loss": -6.810675144195557, "global_step": 151951, "epoch": 3617} {"train_loss": -6.8563432693481445, "global_step": 151952, "epoch": 3617} {"train_loss": -6.887385368347168, "global_step": 151953, "epoch": 3617} {"train_loss": -6.8099212646484375, "global_step": 151954, "epoch": 3617} {"train_loss": -6.832889783950079, "global_step": 151955, "epoch": 3617, "val_loss": 68551.8359375} {"train_loss": -6.881587982177734, "global_step": 151956, "epoch": 3618} {"train_loss": -6.770730018615723, "global_step": 151957, "epoch": 3618} {"train_loss": -6.78209114074707, "global_step": 151958, "epoch": 3618} {"train_loss": -6.831580638885498, "global_step": 151959, "epoch": 3618} {"train_loss": -6.791034698486328, "global_step": 151960, "epoch": 3618} {"train_loss": -6.904853820800781, "global_step": 151961, "epoch": 3618} {"train_loss": -6.726192474365234, "global_step": 151962, "epoch": 3618} {"train_loss": -6.841714382171631, "global_step": 151963, "epoch": 3618} {"train_loss": -6.83539342880249, "global_step": 151964, "epoch": 3618} {"train_loss": -6.842310428619385, "global_step": 151965, "epoch": 3618} {"train_loss": -6.824525833129883, "global_step": 151966, "epoch": 3618} {"train_loss": -6.8607940673828125, "global_step": 151967, "epoch": 3618} {"train_loss": -6.881470680236816, "global_step": 151968, "epoch": 3618} {"train_loss": -6.780096530914307, "global_step": 151969, "epoch": 3618} {"train_loss": -6.9242844581604, "global_step": 151970, "epoch": 3618} {"train_loss": -6.943239212036133, "global_step": 151971, "epoch": 3618} {"train_loss": -6.909552097320557, "global_step": 151972, "epoch": 3618} {"train_loss": -6.850604057312012, "global_step": 151973, "epoch": 3618} {"train_loss": -6.854460716247559, "global_step": 151974, "epoch": 3618} {"train_loss": -6.908388137817383, "global_step": 151975, "epoch": 3618} {"train_loss": -6.8728132247924805, "global_step": 151976, "epoch": 3618} {"train_loss": -6.905829429626465, "global_step": 151977, "epoch": 3618} {"train_loss": -6.793797492980957, "global_step": 151978, "epoch": 3618} {"train_loss": -6.809861183166504, "global_step": 151979, "epoch": 3618} {"train_loss": -6.756166458129883, "global_step": 151980, "epoch": 3618} {"train_loss": -6.710000038146973, "global_step": 151981, "epoch": 3618} {"train_loss": -6.7970170974731445, "global_step": 151982, "epoch": 3618} {"train_loss": -6.773490905761719, "global_step": 151983, "epoch": 3618} {"train_loss": -6.823897361755371, "global_step": 151984, "epoch": 3618} {"train_loss": -6.644863128662109, "global_step": 151985, "epoch": 3618} {"train_loss": -6.727035045623779, "global_step": 151986, "epoch": 3618} {"train_loss": -6.695182800292969, "global_step": 151987, "epoch": 3618} {"train_loss": -6.669708251953125, "global_step": 151988, "epoch": 3618} {"train_loss": -6.758561611175537, "global_step": 151989, "epoch": 3618} {"train_loss": -6.612857818603516, "global_step": 151990, "epoch": 3618} {"train_loss": -6.736789703369141, "global_step": 151991, "epoch": 3618} {"train_loss": -6.711292266845703, "global_step": 151992, "epoch": 3618} {"train_loss": -6.751490592956543, "global_step": 151993, "epoch": 3618} {"train_loss": -6.706566333770752, "global_step": 151994, "epoch": 3618} {"train_loss": -6.835347652435303, "global_step": 151995, "epoch": 3618} {"train_loss": -6.823859691619873, "global_step": 151996, "epoch": 3618} {"train_loss": -6.800273656845093, "global_step": 151997, "epoch": 3618, "val_loss": 68369.109375} {"train_loss": -6.775200843811035, "global_step": 151998, "epoch": 3619} {"train_loss": -6.693573951721191, "global_step": 151999, "epoch": 3619} {"train_loss": -6.836194038391113, "global_step": 152000, "epoch": 3619} {"train_loss": -6.846141815185547, "global_step": 152001, "epoch": 3619} {"train_loss": -6.7673492431640625, "global_step": 152002, "epoch": 3619} {"train_loss": -6.747927665710449, "global_step": 152003, "epoch": 3619} {"train_loss": -6.948502063751221, "global_step": 152004, "epoch": 3619} {"train_loss": -6.726201057434082, "global_step": 152005, "epoch": 3619} {"train_loss": -6.825051307678223, "global_step": 152006, "epoch": 3619} {"train_loss": -6.6845879554748535, "global_step": 152007, "epoch": 3619} {"train_loss": -6.958858013153076, "global_step": 152008, "epoch": 3619} {"train_loss": -6.895908355712891, "global_step": 152009, "epoch": 3619} {"train_loss": -6.837672233581543, "global_step": 152010, "epoch": 3619} {"train_loss": -6.842342853546143, "global_step": 152011, "epoch": 3619} {"train_loss": -6.843360424041748, "global_step": 152012, "epoch": 3619} {"train_loss": -6.8002166748046875, "global_step": 152013, "epoch": 3619} {"train_loss": -6.812417984008789, "global_step": 152014, "epoch": 3619} {"train_loss": -6.939125061035156, "global_step": 152015, "epoch": 3619} {"train_loss": -6.880003452301025, "global_step": 152016, "epoch": 3619} {"train_loss": -6.777407646179199, "global_step": 152017, "epoch": 3619} {"train_loss": -6.811641693115234, "global_step": 152018, "epoch": 3619} {"train_loss": -6.767059803009033, "global_step": 152019, "epoch": 3619} {"train_loss": -6.806406021118164, "global_step": 152020, "epoch": 3619} {"train_loss": -6.694424152374268, "global_step": 152021, "epoch": 3619} {"train_loss": -6.816787242889404, "global_step": 152022, "epoch": 3619} {"train_loss": -6.775153160095215, "global_step": 152023, "epoch": 3619} {"train_loss": -6.7075090408325195, "global_step": 152024, "epoch": 3619} {"train_loss": -6.736731052398682, "global_step": 152025, "epoch": 3619} {"train_loss": -6.750591278076172, "global_step": 152026, "epoch": 3619} {"train_loss": -6.871186256408691, "global_step": 152027, "epoch": 3619} {"train_loss": -6.76668643951416, "global_step": 152028, "epoch": 3619} {"train_loss": -6.7704315185546875, "global_step": 152029, "epoch": 3619} {"train_loss": -6.79496431350708, "global_step": 152030, "epoch": 3619} {"train_loss": -6.703395843505859, "global_step": 152031, "epoch": 3619} {"train_loss": -6.754542350769043, "global_step": 152032, "epoch": 3619} {"train_loss": -6.838367462158203, "global_step": 152033, "epoch": 3619} {"train_loss": -6.9204254150390625, "global_step": 152034, "epoch": 3619} {"train_loss": -6.842130661010742, "global_step": 152035, "epoch": 3619} {"train_loss": -6.882925033569336, "global_step": 152036, "epoch": 3619} {"train_loss": -6.682036399841309, "global_step": 152037, "epoch": 3619} {"train_loss": -6.792046070098877, "global_step": 152038, "epoch": 3619} {"train_loss": -6.802998917443412, "global_step": 152039, "epoch": 3619, "val_loss": 68578.046875} {"train_loss": -6.689323425292969, "global_step": 152040, "epoch": 3620} {"train_loss": -6.7613067626953125, "global_step": 152041, "epoch": 3620} {"train_loss": -6.776811122894287, "global_step": 152042, "epoch": 3620} {"train_loss": -6.7276082038879395, "global_step": 152043, "epoch": 3620} {"train_loss": -6.92025899887085, "global_step": 152044, "epoch": 3620} {"train_loss": -6.809334754943848, "global_step": 152045, "epoch": 3620} {"train_loss": -6.8442535400390625, "global_step": 152046, "epoch": 3620} {"train_loss": -6.717092514038086, "global_step": 152047, "epoch": 3620} {"train_loss": -6.74086856842041, "global_step": 152048, "epoch": 3620} {"train_loss": -6.790075302124023, "global_step": 152049, "epoch": 3620} {"train_loss": -6.763288974761963, "global_step": 152050, "epoch": 3620} {"train_loss": -6.885829925537109, "global_step": 152051, "epoch": 3620} {"train_loss": -6.878808975219727, "global_step": 152052, "epoch": 3620} {"train_loss": -6.818550109863281, "global_step": 152053, "epoch": 3620} {"train_loss": -6.8527398109436035, "global_step": 152054, "epoch": 3620} {"train_loss": -6.791135311126709, "global_step": 152055, "epoch": 3620} {"train_loss": -6.752353668212891, "global_step": 152056, "epoch": 3620} {"train_loss": -6.755777359008789, "global_step": 152057, "epoch": 3620} {"train_loss": -6.909283638000488, "global_step": 152058, "epoch": 3620} {"train_loss": -6.776622772216797, "global_step": 152059, "epoch": 3620} {"train_loss": -6.875083923339844, "global_step": 152060, "epoch": 3620} {"train_loss": -6.79158353805542, "global_step": 152061, "epoch": 3620} {"train_loss": -6.877742767333984, "global_step": 152062, "epoch": 3620} {"train_loss": -6.79835319519043, "global_step": 152063, "epoch": 3620} {"train_loss": -6.834752082824707, "global_step": 152064, "epoch": 3620} {"train_loss": -6.839323997497559, "global_step": 152065, "epoch": 3620} {"train_loss": -6.836721420288086, "global_step": 152066, "epoch": 3620} {"train_loss": -6.785321235656738, "global_step": 152067, "epoch": 3620} {"train_loss": -6.7708258628845215, "global_step": 152068, "epoch": 3620} {"train_loss": -6.730517387390137, "global_step": 152069, "epoch": 3620} {"train_loss": -6.83592414855957, "global_step": 152070, "epoch": 3620} {"train_loss": -6.733908653259277, "global_step": 152071, "epoch": 3620} {"train_loss": -6.665172100067139, "global_step": 152072, "epoch": 3620} {"train_loss": -6.716519355773926, "global_step": 152073, "epoch": 3620} {"train_loss": -6.778885841369629, "global_step": 152074, "epoch": 3620} {"train_loss": -6.720350742340088, "global_step": 152075, "epoch": 3620} {"train_loss": -6.817185401916504, "global_step": 152076, "epoch": 3620} {"train_loss": -6.61930513381958, "global_step": 152077, "epoch": 3620} {"train_loss": -6.926828384399414, "global_step": 152078, "epoch": 3620} {"train_loss": -6.888484001159668, "global_step": 152079, "epoch": 3620} {"train_loss": -6.707943916320801, "global_step": 152080, "epoch": 3620} {"train_loss": -6.790182261239915, "global_step": 152081, "epoch": 3620, "val_loss": 68471.0390625} {"train_loss": -6.747623920440674, "global_step": 152082, "epoch": 3621} {"train_loss": -6.877597808837891, "global_step": 152083, "epoch": 3621} {"train_loss": -6.784282684326172, "global_step": 152084, "epoch": 3621} {"train_loss": -6.858237266540527, "global_step": 152085, "epoch": 3621} {"train_loss": -6.812514781951904, "global_step": 152086, "epoch": 3621} {"train_loss": -6.737109661102295, "global_step": 152087, "epoch": 3621} {"train_loss": -6.631081581115723, "global_step": 152088, "epoch": 3621} {"train_loss": -6.79838752746582, "global_step": 152089, "epoch": 3621} {"train_loss": -6.737735271453857, "global_step": 152090, "epoch": 3621} {"train_loss": -6.707727432250977, "global_step": 152091, "epoch": 3621} {"train_loss": -6.8453688621521, "global_step": 152092, "epoch": 3621} {"train_loss": -6.835549354553223, "global_step": 152093, "epoch": 3621} {"train_loss": -6.694675922393799, "global_step": 152094, "epoch": 3621} {"train_loss": -6.805914878845215, "global_step": 152095, "epoch": 3621} {"train_loss": -6.841523170471191, "global_step": 152096, "epoch": 3621} {"train_loss": -6.782711029052734, "global_step": 152097, "epoch": 3621} {"train_loss": -6.860842704772949, "global_step": 152098, "epoch": 3621} {"train_loss": -6.809293746948242, "global_step": 152099, "epoch": 3621} {"train_loss": -6.820544242858887, "global_step": 152100, "epoch": 3621} {"train_loss": -6.9357476234436035, "global_step": 152101, "epoch": 3621} {"train_loss": -6.855312347412109, "global_step": 152102, "epoch": 3621} {"train_loss": -6.730794429779053, "global_step": 152103, "epoch": 3621} {"train_loss": -6.849732398986816, "global_step": 152104, "epoch": 3621} {"train_loss": -6.7547926902771, "global_step": 152105, "epoch": 3621} {"train_loss": -6.743863105773926, "global_step": 152106, "epoch": 3621} {"train_loss": -6.865417003631592, "global_step": 152107, "epoch": 3621} {"train_loss": -6.888108730316162, "global_step": 152108, "epoch": 3621} {"train_loss": -6.8605146408081055, "global_step": 152109, "epoch": 3621} {"train_loss": -6.863595008850098, "global_step": 152110, "epoch": 3621} {"train_loss": -6.847633361816406, "global_step": 152111, "epoch": 3621} {"train_loss": -6.91167688369751, "global_step": 152112, "epoch": 3621} {"train_loss": -6.95207405090332, "global_step": 152113, "epoch": 3621} {"train_loss": -6.880777359008789, "global_step": 152114, "epoch": 3621} {"train_loss": -6.836365222930908, "global_step": 152115, "epoch": 3621} {"train_loss": -6.843194961547852, "global_step": 152116, "epoch": 3621} {"train_loss": -6.739315032958984, "global_step": 152117, "epoch": 3621} {"train_loss": -6.816039085388184, "global_step": 152118, "epoch": 3621} {"train_loss": -6.924311637878418, "global_step": 152119, "epoch": 3621} {"train_loss": -6.747617721557617, "global_step": 152120, "epoch": 3621} {"train_loss": -6.705682754516602, "global_step": 152121, "epoch": 3621} {"train_loss": -6.828673362731934, "global_step": 152122, "epoch": 3621} {"train_loss": -6.812424409957159, "global_step": 152123, "epoch": 3621, "val_loss": 68493.140625} {"train_loss": -6.839241027832031, "global_step": 152124, "epoch": 3622} {"train_loss": -6.938047409057617, "global_step": 152125, "epoch": 3622} {"train_loss": -6.909430027008057, "global_step": 152126, "epoch": 3622} {"train_loss": -6.836116790771484, "global_step": 152127, "epoch": 3622} {"train_loss": -6.821305274963379, "global_step": 152128, "epoch": 3622} {"train_loss": -6.806834697723389, "global_step": 152129, "epoch": 3622} {"train_loss": -6.803041458129883, "global_step": 152130, "epoch": 3622} {"train_loss": -6.774257659912109, "global_step": 152131, "epoch": 3622} {"train_loss": -6.850587368011475, "global_step": 152132, "epoch": 3622} {"train_loss": -6.791711330413818, "global_step": 152133, "epoch": 3622} {"train_loss": -6.859024524688721, "global_step": 152134, "epoch": 3622} {"train_loss": -6.754421234130859, "global_step": 152135, "epoch": 3622} {"train_loss": -6.844515800476074, "global_step": 152136, "epoch": 3622} {"train_loss": -6.715526580810547, "global_step": 152137, "epoch": 3622} {"train_loss": -6.960060119628906, "global_step": 152138, "epoch": 3622} {"train_loss": -6.9200263023376465, "global_step": 152139, "epoch": 3622} {"train_loss": -6.925785064697266, "global_step": 152140, "epoch": 3622} {"train_loss": -6.828144073486328, "global_step": 152141, "epoch": 3622} {"train_loss": -6.938020706176758, "global_step": 152142, "epoch": 3622} {"train_loss": -6.87379264831543, "global_step": 152143, "epoch": 3622} {"train_loss": -6.890613555908203, "global_step": 152144, "epoch": 3622} {"train_loss": -6.888880729675293, "global_step": 152145, "epoch": 3622} {"train_loss": -6.89255428314209, "global_step": 152146, "epoch": 3622} {"train_loss": -6.851884365081787, "global_step": 152147, "epoch": 3622} {"train_loss": -6.909903526306152, "global_step": 152148, "epoch": 3622} {"train_loss": -6.767324447631836, "global_step": 152149, "epoch": 3622} {"train_loss": -6.907067775726318, "global_step": 152150, "epoch": 3622} {"train_loss": -6.7043681144714355, "global_step": 152151, "epoch": 3622} {"train_loss": -6.943475246429443, "global_step": 152152, "epoch": 3622} {"train_loss": -6.864741325378418, "global_step": 152153, "epoch": 3622} {"train_loss": -6.92512321472168, "global_step": 152154, "epoch": 3622} {"train_loss": -6.885087013244629, "global_step": 152155, "epoch": 3622} {"train_loss": -6.825386047363281, "global_step": 152156, "epoch": 3622} {"train_loss": -6.923426628112793, "global_step": 152157, "epoch": 3622} {"train_loss": -6.851499557495117, "global_step": 152158, "epoch": 3622} {"train_loss": -6.786332130432129, "global_step": 152159, "epoch": 3622} {"train_loss": -6.841887474060059, "global_step": 152160, "epoch": 3622} {"train_loss": -6.841246604919434, "global_step": 152161, "epoch": 3622} {"train_loss": -6.583106994628906, "global_step": 152162, "epoch": 3622} {"train_loss": -6.851988792419434, "global_step": 152163, "epoch": 3622} {"train_loss": -6.820731163024902, "global_step": 152164, "epoch": 3622} {"train_loss": -6.84679008665539, "global_step": 152165, "epoch": 3622, "val_loss": 68407.1015625} {"train_loss": -6.8494133949279785, "global_step": 152166, "epoch": 3623} {"train_loss": -6.698023796081543, "global_step": 152167, "epoch": 3623} {"train_loss": -6.814420223236084, "global_step": 152168, "epoch": 3623} {"train_loss": -6.777121543884277, "global_step": 152169, "epoch": 3623} {"train_loss": -6.739206314086914, "global_step": 152170, "epoch": 3623} {"train_loss": -6.861863136291504, "global_step": 152171, "epoch": 3623} {"train_loss": -6.679699897766113, "global_step": 152172, "epoch": 3623} {"train_loss": -6.608438014984131, "global_step": 152173, "epoch": 3623} {"train_loss": -6.848894119262695, "global_step": 152174, "epoch": 3623} {"train_loss": -6.642951965332031, "global_step": 152175, "epoch": 3623} {"train_loss": -6.679740905761719, "global_step": 152176, "epoch": 3623} {"train_loss": -6.7565765380859375, "global_step": 152177, "epoch": 3623} {"train_loss": -6.722079753875732, "global_step": 152178, "epoch": 3623} {"train_loss": -6.715338230133057, "global_step": 152179, "epoch": 3623} {"train_loss": -6.73492431640625, "global_step": 152180, "epoch": 3623} {"train_loss": -6.762887954711914, "global_step": 152181, "epoch": 3623} {"train_loss": -6.827040672302246, "global_step": 152182, "epoch": 3623} {"train_loss": -6.793179035186768, "global_step": 152183, "epoch": 3623} {"train_loss": -6.793652534484863, "global_step": 152184, "epoch": 3623} {"train_loss": -6.769443988800049, "global_step": 152185, "epoch": 3623} {"train_loss": -6.857485771179199, "global_step": 152186, "epoch": 3623} {"train_loss": -6.854080677032471, "global_step": 152187, "epoch": 3623} {"train_loss": -6.736636161804199, "global_step": 152188, "epoch": 3623} {"train_loss": -6.886717319488525, "global_step": 152189, "epoch": 3623} {"train_loss": -6.870244026184082, "global_step": 152190, "epoch": 3623} {"train_loss": -6.818487167358398, "global_step": 152191, "epoch": 3623} {"train_loss": -6.722753524780273, "global_step": 152192, "epoch": 3623} {"train_loss": -6.816161155700684, "global_step": 152193, "epoch": 3623} {"train_loss": -6.7519330978393555, "global_step": 152194, "epoch": 3623} {"train_loss": -6.821657180786133, "global_step": 152195, "epoch": 3623} {"train_loss": -6.828424453735352, "global_step": 152196, "epoch": 3623} {"train_loss": -6.770685195922852, "global_step": 152197, "epoch": 3623} {"train_loss": -6.80267333984375, "global_step": 152198, "epoch": 3623} {"train_loss": -6.7969865798950195, "global_step": 152199, "epoch": 3623} {"train_loss": -6.814393997192383, "global_step": 152200, "epoch": 3623} {"train_loss": -6.8750810623168945, "global_step": 152201, "epoch": 3623} {"train_loss": -6.786172866821289, "global_step": 152202, "epoch": 3623} {"train_loss": -6.8563995361328125, "global_step": 152203, "epoch": 3623} {"train_loss": -6.905921936035156, "global_step": 152204, "epoch": 3623} {"train_loss": -6.844328880310059, "global_step": 152205, "epoch": 3623} {"train_loss": -6.784902095794678, "global_step": 152206, "epoch": 3623} {"train_loss": -6.789407275971913, "global_step": 152207, "epoch": 3623, "val_loss": 68502.109375} {"train_loss": -6.842759132385254, "global_step": 152208, "epoch": 3624} {"train_loss": -6.911438941955566, "global_step": 152209, "epoch": 3624} {"train_loss": -6.859933376312256, "global_step": 152210, "epoch": 3624} {"train_loss": -6.831498146057129, "global_step": 152211, "epoch": 3624} {"train_loss": -6.734070301055908, "global_step": 152212, "epoch": 3624} {"train_loss": -6.811814785003662, "global_step": 152213, "epoch": 3624} {"train_loss": -7.025504112243652, "global_step": 152214, "epoch": 3624} {"train_loss": -6.864248275756836, "global_step": 152215, "epoch": 3624} {"train_loss": -6.825422286987305, "global_step": 152216, "epoch": 3624} {"train_loss": -6.8398237228393555, "global_step": 152217, "epoch": 3624} {"train_loss": -6.808762550354004, "global_step": 152218, "epoch": 3624} {"train_loss": -6.719754219055176, "global_step": 152219, "epoch": 3624} {"train_loss": -6.720081806182861, "global_step": 152220, "epoch": 3624} {"train_loss": -6.8970818519592285, "global_step": 152221, "epoch": 3624} {"train_loss": -6.717644691467285, "global_step": 152222, "epoch": 3624} {"train_loss": -6.739790916442871, "global_step": 152223, "epoch": 3624} {"train_loss": -6.816563606262207, "global_step": 152224, "epoch": 3624} {"train_loss": -6.608206272125244, "global_step": 152225, "epoch": 3624} {"train_loss": -6.908870697021484, "global_step": 152226, "epoch": 3624} {"train_loss": -6.847719192504883, "global_step": 152227, "epoch": 3624} {"train_loss": -6.693946361541748, "global_step": 152228, "epoch": 3624} {"train_loss": -6.831748962402344, "global_step": 152229, "epoch": 3624} {"train_loss": -6.828418254852295, "global_step": 152230, "epoch": 3624} {"train_loss": -6.792253494262695, "global_step": 152231, "epoch": 3624} {"train_loss": -6.727694511413574, "global_step": 152232, "epoch": 3624} {"train_loss": -6.927271366119385, "global_step": 152233, "epoch": 3624} {"train_loss": -6.726080417633057, "global_step": 152234, "epoch": 3624} {"train_loss": -6.862987995147705, "global_step": 152235, "epoch": 3624} {"train_loss": -6.866618633270264, "global_step": 152236, "epoch": 3624} {"train_loss": -6.804093360900879, "global_step": 152237, "epoch": 3624} {"train_loss": -6.850329399108887, "global_step": 152238, "epoch": 3624} {"train_loss": -6.948761940002441, "global_step": 152239, "epoch": 3624} {"train_loss": -6.826664924621582, "global_step": 152240, "epoch": 3624} {"train_loss": -6.740204811096191, "global_step": 152241, "epoch": 3624} {"train_loss": -6.792402267456055, "global_step": 152242, "epoch": 3624} {"train_loss": -6.84589958190918, "global_step": 152243, "epoch": 3624} {"train_loss": -6.806455612182617, "global_step": 152244, "epoch": 3624} {"train_loss": -6.7501935958862305, "global_step": 152245, "epoch": 3624} {"train_loss": -6.7863450050354, "global_step": 152246, "epoch": 3624} {"train_loss": -6.9173712730407715, "global_step": 152247, "epoch": 3624} {"train_loss": -6.874002933502197, "global_step": 152248, "epoch": 3624} {"train_loss": -6.816042718433199, "global_step": 152249, "epoch": 3624, "val_loss": 68305.46875} {"train_loss": -6.993906497955322, "global_step": 152250, "epoch": 3625} {"train_loss": -6.819262504577637, "global_step": 152251, "epoch": 3625} {"train_loss": -6.796167373657227, "global_step": 152252, "epoch": 3625} {"train_loss": -6.923801422119141, "global_step": 152253, "epoch": 3625} {"train_loss": -6.875337600708008, "global_step": 152254, "epoch": 3625} {"train_loss": -6.866042137145996, "global_step": 152255, "epoch": 3625} {"train_loss": -6.892547130584717, "global_step": 152256, "epoch": 3625} {"train_loss": -6.829641342163086, "global_step": 152257, "epoch": 3625} {"train_loss": -6.935057640075684, "global_step": 152258, "epoch": 3625} {"train_loss": -6.875188827514648, "global_step": 152259, "epoch": 3625} {"train_loss": -6.917142868041992, "global_step": 152260, "epoch": 3625} {"train_loss": -6.812647819519043, "global_step": 152261, "epoch": 3625} {"train_loss": -6.802206516265869, "global_step": 152262, "epoch": 3625} {"train_loss": -6.869453430175781, "global_step": 152263, "epoch": 3625} {"train_loss": -6.907896041870117, "global_step": 152264, "epoch": 3625} {"train_loss": -6.811222076416016, "global_step": 152265, "epoch": 3625} {"train_loss": -6.8471221923828125, "global_step": 152266, "epoch": 3625} {"train_loss": -6.828604698181152, "global_step": 152267, "epoch": 3625} {"train_loss": -6.890012741088867, "global_step": 152268, "epoch": 3625} {"train_loss": -6.783005237579346, "global_step": 152269, "epoch": 3625} {"train_loss": -6.873977184295654, "global_step": 152270, "epoch": 3625} {"train_loss": -6.889963150024414, "global_step": 152271, "epoch": 3625} {"train_loss": -6.758990287780762, "global_step": 152272, "epoch": 3625} {"train_loss": -6.900568962097168, "global_step": 152273, "epoch": 3625} {"train_loss": -6.896605491638184, "global_step": 152274, "epoch": 3625} {"train_loss": -6.671965599060059, "global_step": 152275, "epoch": 3625} {"train_loss": -6.768812656402588, "global_step": 152276, "epoch": 3625} {"train_loss": -6.82595157623291, "global_step": 152277, "epoch": 3625} {"train_loss": -6.7193193435668945, "global_step": 152278, "epoch": 3625} {"train_loss": -6.907171726226807, "global_step": 152279, "epoch": 3625} {"train_loss": -6.747809410095215, "global_step": 152280, "epoch": 3625} {"train_loss": -6.79868221282959, "global_step": 152281, "epoch": 3625} {"train_loss": -6.790056228637695, "global_step": 152282, "epoch": 3625} {"train_loss": -6.873546600341797, "global_step": 152283, "epoch": 3625} {"train_loss": -6.671319007873535, "global_step": 152284, "epoch": 3625} {"train_loss": -6.9299397468566895, "global_step": 152285, "epoch": 3625} {"train_loss": -6.775570869445801, "global_step": 152286, "epoch": 3625} {"train_loss": -6.803438663482666, "global_step": 152287, "epoch": 3625} {"train_loss": -6.819404602050781, "global_step": 152288, "epoch": 3625} {"train_loss": -6.809488773345947, "global_step": 152289, "epoch": 3625} {"train_loss": -6.8193230628967285, "global_step": 152290, "epoch": 3625} {"train_loss": -6.834932270504179, "global_step": 152291, "epoch": 3625, "val_loss": 68556.453125} {"train_loss": -6.699126720428467, "global_step": 152292, "epoch": 3626} {"train_loss": -6.897486686706543, "global_step": 152293, "epoch": 3626} {"train_loss": -6.832339286804199, "global_step": 152294, "epoch": 3626} {"train_loss": -6.835870742797852, "global_step": 152295, "epoch": 3626} {"train_loss": -6.818007946014404, "global_step": 152296, "epoch": 3626} {"train_loss": -6.663768768310547, "global_step": 152297, "epoch": 3626} {"train_loss": -6.831790924072266, "global_step": 152298, "epoch": 3626} {"train_loss": -6.872771263122559, "global_step": 152299, "epoch": 3626} {"train_loss": -6.8554792404174805, "global_step": 152300, "epoch": 3626} {"train_loss": -6.743032932281494, "global_step": 152301, "epoch": 3626} {"train_loss": -6.750433921813965, "global_step": 152302, "epoch": 3626} {"train_loss": -6.872040748596191, "global_step": 152303, "epoch": 3626} {"train_loss": -6.815912246704102, "global_step": 152304, "epoch": 3626} {"train_loss": -6.786351203918457, "global_step": 152305, "epoch": 3626} {"train_loss": -6.776647567749023, "global_step": 152306, "epoch": 3626} {"train_loss": -6.770925045013428, "global_step": 152307, "epoch": 3626} {"train_loss": -6.804055213928223, "global_step": 152308, "epoch": 3626} {"train_loss": -6.816180229187012, "global_step": 152309, "epoch": 3626} {"train_loss": -6.8110857009887695, "global_step": 152310, "epoch": 3626} {"train_loss": -6.861716270446777, "global_step": 152311, "epoch": 3626} {"train_loss": -6.886968612670898, "global_step": 152312, "epoch": 3626} {"train_loss": -6.825440406799316, "global_step": 152313, "epoch": 3626} {"train_loss": -6.792842864990234, "global_step": 152314, "epoch": 3626} {"train_loss": -6.860746383666992, "global_step": 152315, "epoch": 3626} {"train_loss": -6.76617431640625, "global_step": 152316, "epoch": 3626} {"train_loss": -6.888235569000244, "global_step": 152317, "epoch": 3626} {"train_loss": -6.858869552612305, "global_step": 152318, "epoch": 3626} {"train_loss": -6.9247026443481445, "global_step": 152319, "epoch": 3626} {"train_loss": -6.9446563720703125, "global_step": 152320, "epoch": 3626} {"train_loss": -6.896285533905029, "global_step": 152321, "epoch": 3626} {"train_loss": -6.927898406982422, "global_step": 152322, "epoch": 3626} {"train_loss": -6.824061393737793, "global_step": 152323, "epoch": 3626} {"train_loss": -6.802996635437012, "global_step": 152324, "epoch": 3626} {"train_loss": -6.846386909484863, "global_step": 152325, "epoch": 3626} {"train_loss": -6.906254768371582, "global_step": 152326, "epoch": 3626} {"train_loss": -6.918039321899414, "global_step": 152327, "epoch": 3626} {"train_loss": -6.835819244384766, "global_step": 152328, "epoch": 3626} {"train_loss": -6.850877285003662, "global_step": 152329, "epoch": 3626} {"train_loss": -6.80328369140625, "global_step": 152330, "epoch": 3626} {"train_loss": -6.858382225036621, "global_step": 152331, "epoch": 3626} {"train_loss": -6.649930477142334, "global_step": 152332, "epoch": 3626} {"train_loss": -6.827545608792986, "global_step": 152333, "epoch": 3626, "val_loss": 68428.4453125} {"train_loss": -6.8239874839782715, "global_step": 152334, "epoch": 3627} {"train_loss": -6.732431411743164, "global_step": 152335, "epoch": 3627} {"train_loss": -6.841996192932129, "global_step": 152336, "epoch": 3627} {"train_loss": -6.950010299682617, "global_step": 152337, "epoch": 3627} {"train_loss": -6.847533702850342, "global_step": 152338, "epoch": 3627} {"train_loss": -6.793731689453125, "global_step": 152339, "epoch": 3627} {"train_loss": -6.912235736846924, "global_step": 152340, "epoch": 3627} {"train_loss": -6.745246887207031, "global_step": 152341, "epoch": 3627} {"train_loss": -6.886008262634277, "global_step": 152342, "epoch": 3627} {"train_loss": -6.867909908294678, "global_step": 152343, "epoch": 3627} {"train_loss": -6.849364280700684, "global_step": 152344, "epoch": 3627} {"train_loss": -6.941834449768066, "global_step": 152345, "epoch": 3627} {"train_loss": -6.946344375610352, "global_step": 152346, "epoch": 3627} {"train_loss": -6.824755668640137, "global_step": 152347, "epoch": 3627} {"train_loss": -6.7696428298950195, "global_step": 152348, "epoch": 3627} {"train_loss": -6.850406169891357, "global_step": 152349, "epoch": 3627} {"train_loss": -6.8488945960998535, "global_step": 152350, "epoch": 3627} {"train_loss": -6.880228042602539, "global_step": 152351, "epoch": 3627} {"train_loss": -6.756469249725342, "global_step": 152352, "epoch": 3627} {"train_loss": -6.777973175048828, "global_step": 152353, "epoch": 3627} {"train_loss": -6.756292343139648, "global_step": 152354, "epoch": 3627} {"train_loss": -6.927703857421875, "global_step": 152355, "epoch": 3627} {"train_loss": -6.850092887878418, "global_step": 152356, "epoch": 3627} {"train_loss": -6.79874324798584, "global_step": 152357, "epoch": 3627} {"train_loss": -6.823299884796143, "global_step": 152358, "epoch": 3627} {"train_loss": -6.828197956085205, "global_step": 152359, "epoch": 3627} {"train_loss": -6.8496623039245605, "global_step": 152360, "epoch": 3627} {"train_loss": -6.797295093536377, "global_step": 152361, "epoch": 3627} {"train_loss": -6.868838310241699, "global_step": 152362, "epoch": 3627} {"train_loss": -6.817894458770752, "global_step": 152363, "epoch": 3627} {"train_loss": -6.87210750579834, "global_step": 152364, "epoch": 3627} {"train_loss": -6.768866062164307, "global_step": 152365, "epoch": 3627} {"train_loss": -6.815680503845215, "global_step": 152366, "epoch": 3627} {"train_loss": -6.796602725982666, "global_step": 152367, "epoch": 3627} {"train_loss": -6.917705535888672, "global_step": 152368, "epoch": 3627} {"train_loss": -6.821056365966797, "global_step": 152369, "epoch": 3627} {"train_loss": -6.794097423553467, "global_step": 152370, "epoch": 3627} {"train_loss": -6.915682315826416, "global_step": 152371, "epoch": 3627} {"train_loss": -6.815896511077881, "global_step": 152372, "epoch": 3627} {"train_loss": -6.805567741394043, "global_step": 152373, "epoch": 3627} {"train_loss": -6.876066207885742, "global_step": 152374, "epoch": 3627} {"train_loss": -6.835845788319905, "global_step": 152375, "epoch": 3627, "val_loss": 68666.0859375} {"train_loss": -6.807318687438965, "global_step": 152376, "epoch": 3628} {"train_loss": -6.756901741027832, "global_step": 152377, "epoch": 3628} {"train_loss": -6.8975419998168945, "global_step": 152378, "epoch": 3628} {"train_loss": -6.809100151062012, "global_step": 152379, "epoch": 3628} {"train_loss": -6.915807723999023, "global_step": 152380, "epoch": 3628} {"train_loss": -6.793268203735352, "global_step": 152381, "epoch": 3628} {"train_loss": -6.689487457275391, "global_step": 152382, "epoch": 3628} {"train_loss": -6.732504844665527, "global_step": 152383, "epoch": 3628} {"train_loss": -6.827348709106445, "global_step": 152384, "epoch": 3628} {"train_loss": -6.752481460571289, "global_step": 152385, "epoch": 3628} {"train_loss": -6.734243392944336, "global_step": 152386, "epoch": 3628} {"train_loss": -6.6586198806762695, "global_step": 152387, "epoch": 3628} {"train_loss": -6.787909507751465, "global_step": 152388, "epoch": 3628} {"train_loss": -6.919602394104004, "global_step": 152389, "epoch": 3628} {"train_loss": -6.638757705688477, "global_step": 152390, "epoch": 3628} {"train_loss": -6.589191436767578, "global_step": 152391, "epoch": 3628} {"train_loss": -6.770246505737305, "global_step": 152392, "epoch": 3628} {"train_loss": -6.736761569976807, "global_step": 152393, "epoch": 3628} {"train_loss": -6.827842712402344, "global_step": 152394, "epoch": 3628} {"train_loss": -6.658233642578125, "global_step": 152395, "epoch": 3628} {"train_loss": -6.797948837280273, "global_step": 152396, "epoch": 3628} {"train_loss": -6.809642791748047, "global_step": 152397, "epoch": 3628} {"train_loss": -6.722233772277832, "global_step": 152398, "epoch": 3628} {"train_loss": -6.6879425048828125, "global_step": 152399, "epoch": 3628} {"train_loss": -6.867021560668945, "global_step": 152400, "epoch": 3628} {"train_loss": -6.718232154846191, "global_step": 152401, "epoch": 3628} {"train_loss": -6.872969627380371, "global_step": 152402, "epoch": 3628} {"train_loss": -6.887092113494873, "global_step": 152403, "epoch": 3628} {"train_loss": -6.788181781768799, "global_step": 152404, "epoch": 3628} {"train_loss": -6.740004539489746, "global_step": 152405, "epoch": 3628} {"train_loss": -6.804677486419678, "global_step": 152406, "epoch": 3628} {"train_loss": -6.765949249267578, "global_step": 152407, "epoch": 3628} {"train_loss": -6.819036483764648, "global_step": 152408, "epoch": 3628} {"train_loss": -6.84928035736084, "global_step": 152409, "epoch": 3628} {"train_loss": -6.765476226806641, "global_step": 152410, "epoch": 3628} {"train_loss": -6.814812660217285, "global_step": 152411, "epoch": 3628} {"train_loss": -6.812929153442383, "global_step": 152412, "epoch": 3628} {"train_loss": -6.867419719696045, "global_step": 152413, "epoch": 3628} {"train_loss": -6.854935646057129, "global_step": 152414, "epoch": 3628} {"train_loss": -6.758489608764648, "global_step": 152415, "epoch": 3628} {"train_loss": -6.733219623565674, "global_step": 152416, "epoch": 3628} {"train_loss": -6.784602460407076, "global_step": 152417, "epoch": 3628, "val_loss": 68458.5546875} {"train_loss": -6.718110084533691, "global_step": 152418, "epoch": 3629} {"train_loss": -6.830594539642334, "global_step": 152419, "epoch": 3629} {"train_loss": -6.982958793640137, "global_step": 152420, "epoch": 3629} {"train_loss": -6.798681735992432, "global_step": 152421, "epoch": 3629} {"train_loss": -6.67601203918457, "global_step": 152422, "epoch": 3629} {"train_loss": -6.891136646270752, "global_step": 152423, "epoch": 3629} {"train_loss": -6.899136066436768, "global_step": 152424, "epoch": 3629} {"train_loss": -6.79298734664917, "global_step": 152425, "epoch": 3629} {"train_loss": -6.774425506591797, "global_step": 152426, "epoch": 3629} {"train_loss": -6.838372230529785, "global_step": 152427, "epoch": 3629} {"train_loss": -6.789691925048828, "global_step": 152428, "epoch": 3629} {"train_loss": -6.8225417137146, "global_step": 152429, "epoch": 3629} {"train_loss": -6.882541179656982, "global_step": 152430, "epoch": 3629} {"train_loss": -6.8314619064331055, "global_step": 152431, "epoch": 3629} {"train_loss": -6.862007141113281, "global_step": 152432, "epoch": 3629} {"train_loss": -6.877338886260986, "global_step": 152433, "epoch": 3629} {"train_loss": -6.76884651184082, "global_step": 152434, "epoch": 3629} {"train_loss": -6.886592864990234, "global_step": 152435, "epoch": 3629} {"train_loss": -6.845953941345215, "global_step": 152436, "epoch": 3629} {"train_loss": -6.770078659057617, "global_step": 152437, "epoch": 3629} {"train_loss": -6.853307723999023, "global_step": 152438, "epoch": 3629} {"train_loss": -6.910367965698242, "global_step": 152439, "epoch": 3629} {"train_loss": -6.823789596557617, "global_step": 152440, "epoch": 3629} {"train_loss": -6.7852783203125, "global_step": 152441, "epoch": 3629} {"train_loss": -6.739418983459473, "global_step": 152442, "epoch": 3629} {"train_loss": -6.74098014831543, "global_step": 152443, "epoch": 3629} {"train_loss": -6.836857795715332, "global_step": 152444, "epoch": 3629} {"train_loss": -6.8411712646484375, "global_step": 152445, "epoch": 3629} {"train_loss": -6.814197540283203, "global_step": 152446, "epoch": 3629} {"train_loss": -6.881921768188477, "global_step": 152447, "epoch": 3629} {"train_loss": -6.861092567443848, "global_step": 152448, "epoch": 3629} {"train_loss": -6.87832498550415, "global_step": 152449, "epoch": 3629} {"train_loss": -6.784297943115234, "global_step": 152450, "epoch": 3629} {"train_loss": -6.862496852874756, "global_step": 152451, "epoch": 3629} {"train_loss": -6.851741790771484, "global_step": 152452, "epoch": 3629} {"train_loss": -6.808836936950684, "global_step": 152453, "epoch": 3629} {"train_loss": -6.898439407348633, "global_step": 152454, "epoch": 3629} {"train_loss": -6.926730155944824, "global_step": 152455, "epoch": 3629} {"train_loss": -6.926973342895508, "global_step": 152456, "epoch": 3629} {"train_loss": -6.891294479370117, "global_step": 152457, "epoch": 3629} {"train_loss": -6.933656215667725, "global_step": 152458, "epoch": 3629} {"train_loss": -6.839387394133068, "global_step": 152459, "epoch": 3629, "val_loss": 68597.234375} {"train_loss": -6.771347522735596, "global_step": 152460, "epoch": 3630} {"train_loss": -6.892758369445801, "global_step": 152461, "epoch": 3630} {"train_loss": -6.894183158874512, "global_step": 152462, "epoch": 3630} {"train_loss": -6.838100433349609, "global_step": 152463, "epoch": 3630} {"train_loss": -6.881464004516602, "global_step": 152464, "epoch": 3630} {"train_loss": -6.8227739334106445, "global_step": 152465, "epoch": 3630} {"train_loss": -6.839552879333496, "global_step": 152466, "epoch": 3630} {"train_loss": -6.784102439880371, "global_step": 152467, "epoch": 3630} {"train_loss": -6.884642124176025, "global_step": 152468, "epoch": 3630} {"train_loss": -6.821969985961914, "global_step": 152469, "epoch": 3630} {"train_loss": -6.961635112762451, "global_step": 152470, "epoch": 3630} {"train_loss": -6.900580406188965, "global_step": 152471, "epoch": 3630} {"train_loss": -6.861459732055664, "global_step": 152472, "epoch": 3630} {"train_loss": -6.82071590423584, "global_step": 152473, "epoch": 3630} {"train_loss": -6.852304458618164, "global_step": 152474, "epoch": 3630} {"train_loss": -6.9022650718688965, "global_step": 152475, "epoch": 3630} {"train_loss": -6.853381156921387, "global_step": 152476, "epoch": 3630} {"train_loss": -6.908536434173584, "global_step": 152477, "epoch": 3630} {"train_loss": -6.963408470153809, "global_step": 152478, "epoch": 3630} {"train_loss": -6.882468223571777, "global_step": 152479, "epoch": 3630} {"train_loss": -6.7540435791015625, "global_step": 152480, "epoch": 3630} {"train_loss": -6.880667686462402, "global_step": 152481, "epoch": 3630} {"train_loss": -6.8186445236206055, "global_step": 152482, "epoch": 3630} {"train_loss": -6.855801105499268, "global_step": 152483, "epoch": 3630} {"train_loss": -6.833812236785889, "global_step": 152484, "epoch": 3630} {"train_loss": -6.893197059631348, "global_step": 152485, "epoch": 3630} {"train_loss": -6.848814964294434, "global_step": 152486, "epoch": 3630} {"train_loss": -6.9461588859558105, "global_step": 152487, "epoch": 3630} {"train_loss": -6.855834007263184, "global_step": 152488, "epoch": 3630} {"train_loss": -6.931062698364258, "global_step": 152489, "epoch": 3630} {"train_loss": -6.889987945556641, "global_step": 152490, "epoch": 3630} {"train_loss": -6.875057220458984, "global_step": 152491, "epoch": 3630} {"train_loss": -6.8290557861328125, "global_step": 152492, "epoch": 3630} {"train_loss": -6.865597724914551, "global_step": 152493, "epoch": 3630} {"train_loss": -6.9367451667785645, "global_step": 152494, "epoch": 3630} {"train_loss": -6.932424068450928, "global_step": 152495, "epoch": 3630} {"train_loss": -6.908324241638184, "global_step": 152496, "epoch": 3630} {"train_loss": -6.913667678833008, "global_step": 152497, "epoch": 3630} {"train_loss": -6.899844169616699, "global_step": 152498, "epoch": 3630} {"train_loss": -6.755169868469238, "global_step": 152499, "epoch": 3630} {"train_loss": -6.735842704772949, "global_step": 152500, "epoch": 3630} {"train_loss": -6.8670070852552145, "global_step": 152501, "epoch": 3630, "val_loss": 68496.2109375} {"train_loss": -6.778124809265137, "global_step": 152502, "epoch": 3631} {"train_loss": -6.810908317565918, "global_step": 152503, "epoch": 3631} {"train_loss": -6.829748153686523, "global_step": 152504, "epoch": 3631} {"train_loss": -6.870505332946777, "global_step": 152505, "epoch": 3631} {"train_loss": -6.906949996948242, "global_step": 152506, "epoch": 3631} {"train_loss": -6.994247913360596, "global_step": 152507, "epoch": 3631} {"train_loss": -6.711120128631592, "global_step": 152508, "epoch": 3631} {"train_loss": -6.843971252441406, "global_step": 152509, "epoch": 3631} {"train_loss": -6.867124557495117, "global_step": 152510, "epoch": 3631} {"train_loss": -6.970942497253418, "global_step": 152511, "epoch": 3631} {"train_loss": -6.852538585662842, "global_step": 152512, "epoch": 3631} {"train_loss": -6.937094688415527, "global_step": 152513, "epoch": 3631} {"train_loss": -6.882488250732422, "global_step": 152514, "epoch": 3631} {"train_loss": -6.841488838195801, "global_step": 152515, "epoch": 3631} {"train_loss": -6.831306457519531, "global_step": 152516, "epoch": 3631} {"train_loss": -6.925767421722412, "global_step": 152517, "epoch": 3631} {"train_loss": -6.823328971862793, "global_step": 152518, "epoch": 3631} {"train_loss": -6.819056510925293, "global_step": 152519, "epoch": 3631} {"train_loss": -6.920581817626953, "global_step": 152520, "epoch": 3631} {"train_loss": -6.78665828704834, "global_step": 152521, "epoch": 3631} {"train_loss": -6.864233493804932, "global_step": 152522, "epoch": 3631} {"train_loss": -6.650339603424072, "global_step": 152523, "epoch": 3631} {"train_loss": -6.604506492614746, "global_step": 152524, "epoch": 3631} {"train_loss": -6.7637505531311035, "global_step": 152525, "epoch": 3631} {"train_loss": -6.707535743713379, "global_step": 152526, "epoch": 3631} {"train_loss": -6.738033771514893, "global_step": 152527, "epoch": 3631} {"train_loss": -6.789525985717773, "global_step": 152528, "epoch": 3631} {"train_loss": -6.666871547698975, "global_step": 152529, "epoch": 3631} {"train_loss": -6.8381571769714355, "global_step": 152530, "epoch": 3631} {"train_loss": -6.8141937255859375, "global_step": 152531, "epoch": 3631} {"train_loss": -6.837949275970459, "global_step": 152532, "epoch": 3631} {"train_loss": -6.73582649230957, "global_step": 152533, "epoch": 3631} {"train_loss": -6.907866477966309, "global_step": 152534, "epoch": 3631} {"train_loss": -6.880919456481934, "global_step": 152535, "epoch": 3631} {"train_loss": -6.73582649230957, "global_step": 152536, "epoch": 3631} {"train_loss": -6.822193145751953, "global_step": 152537, "epoch": 3631} {"train_loss": -6.870632171630859, "global_step": 152538, "epoch": 3631} {"train_loss": -6.801489353179932, "global_step": 152539, "epoch": 3631} {"train_loss": -6.756019592285156, "global_step": 152540, "epoch": 3631} {"train_loss": -6.7457075119018555, "global_step": 152541, "epoch": 3631} {"train_loss": -6.886425971984863, "global_step": 152542, "epoch": 3631} {"train_loss": -6.819640307199387, "global_step": 152543, "epoch": 3631, "val_loss": 68521.8125} {"train_loss": -6.8640031814575195, "global_step": 152544, "epoch": 3632} {"train_loss": -6.85496711730957, "global_step": 152545, "epoch": 3632} {"train_loss": -6.776392459869385, "global_step": 152546, "epoch": 3632} {"train_loss": -6.822309494018555, "global_step": 152547, "epoch": 3632} {"train_loss": -6.869095802307129, "global_step": 152548, "epoch": 3632} {"train_loss": -6.701870918273926, "global_step": 152549, "epoch": 3632} {"train_loss": -6.724864959716797, "global_step": 152550, "epoch": 3632} {"train_loss": -6.771292209625244, "global_step": 152551, "epoch": 3632} {"train_loss": -6.823308944702148, "global_step": 152552, "epoch": 3632} {"train_loss": -6.977009296417236, "global_step": 152553, "epoch": 3632} {"train_loss": -6.882641315460205, "global_step": 152554, "epoch": 3632} {"train_loss": -6.7801666259765625, "global_step": 152555, "epoch": 3632} {"train_loss": -6.885249137878418, "global_step": 152556, "epoch": 3632} {"train_loss": -6.904095649719238, "global_step": 152557, "epoch": 3632} {"train_loss": -6.973090171813965, "global_step": 152558, "epoch": 3632} {"train_loss": -6.724740982055664, "global_step": 152559, "epoch": 3632} {"train_loss": -6.800088882446289, "global_step": 152560, "epoch": 3632} {"train_loss": -6.79709529876709, "global_step": 152561, "epoch": 3632} {"train_loss": -6.778460502624512, "global_step": 152562, "epoch": 3632} {"train_loss": -6.879376411437988, "global_step": 152563, "epoch": 3632} {"train_loss": -6.793334484100342, "global_step": 152564, "epoch": 3632} {"train_loss": -6.7691545486450195, "global_step": 152565, "epoch": 3632} {"train_loss": -6.8624773025512695, "global_step": 152566, "epoch": 3632} {"train_loss": -6.77984619140625, "global_step": 152567, "epoch": 3632} {"train_loss": -6.767334938049316, "global_step": 152568, "epoch": 3632} {"train_loss": -6.732298851013184, "global_step": 152569, "epoch": 3632} {"train_loss": -6.789833068847656, "global_step": 152570, "epoch": 3632} {"train_loss": -6.748400688171387, "global_step": 152571, "epoch": 3632} {"train_loss": -6.74719762802124, "global_step": 152572, "epoch": 3632} {"train_loss": -6.876992225646973, "global_step": 152573, "epoch": 3632} {"train_loss": -6.86628532409668, "global_step": 152574, "epoch": 3632} {"train_loss": -6.672521591186523, "global_step": 152575, "epoch": 3632} {"train_loss": -6.725368499755859, "global_step": 152576, "epoch": 3632} {"train_loss": -6.765124797821045, "global_step": 152577, "epoch": 3632} {"train_loss": -6.775608062744141, "global_step": 152578, "epoch": 3632} {"train_loss": -6.695402145385742, "global_step": 152579, "epoch": 3632} {"train_loss": -6.780331134796143, "global_step": 152580, "epoch": 3632} {"train_loss": -6.722687721252441, "global_step": 152581, "epoch": 3632} {"train_loss": -6.6516008377075195, "global_step": 152582, "epoch": 3632} {"train_loss": -6.72745418548584, "global_step": 152583, "epoch": 3632} {"train_loss": -6.8063507080078125, "global_step": 152584, "epoch": 3632} {"train_loss": -6.795453366779146, "global_step": 152585, "epoch": 3632, "val_loss": 68395.6484375} {"train_loss": -6.74397087097168, "global_step": 152586, "epoch": 3633} {"train_loss": -6.771925926208496, "global_step": 152587, "epoch": 3633} {"train_loss": -6.724149703979492, "global_step": 152588, "epoch": 3633} {"train_loss": -6.858281135559082, "global_step": 152589, "epoch": 3633} {"train_loss": -6.749407768249512, "global_step": 152590, "epoch": 3633} {"train_loss": -6.818142890930176, "global_step": 152591, "epoch": 3633} {"train_loss": -6.742458343505859, "global_step": 152592, "epoch": 3633} {"train_loss": -6.786728858947754, "global_step": 152593, "epoch": 3633} {"train_loss": -6.841858863830566, "global_step": 152594, "epoch": 3633} {"train_loss": -6.734246253967285, "global_step": 152595, "epoch": 3633} {"train_loss": -6.7588043212890625, "global_step": 152596, "epoch": 3633} {"train_loss": -6.638726711273193, "global_step": 152597, "epoch": 3633} {"train_loss": -6.890225410461426, "global_step": 152598, "epoch": 3633} {"train_loss": -6.751306056976318, "global_step": 152599, "epoch": 3633} {"train_loss": -6.774003028869629, "global_step": 152600, "epoch": 3633} {"train_loss": -6.732688903808594, "global_step": 152601, "epoch": 3633} {"train_loss": -6.712437629699707, "global_step": 152602, "epoch": 3633} {"train_loss": -6.856747627258301, "global_step": 152603, "epoch": 3633} {"train_loss": -6.807106018066406, "global_step": 152604, "epoch": 3633} {"train_loss": -6.894357204437256, "global_step": 152605, "epoch": 3633} {"train_loss": -6.703817367553711, "global_step": 152606, "epoch": 3633} {"train_loss": -6.787906646728516, "global_step": 152607, "epoch": 3633} {"train_loss": -6.6461896896362305, "global_step": 152608, "epoch": 3633} {"train_loss": -6.858819007873535, "global_step": 152609, "epoch": 3633} {"train_loss": -6.844860076904297, "global_step": 152610, "epoch": 3633} {"train_loss": -6.856539726257324, "global_step": 152611, "epoch": 3633} {"train_loss": -6.785011291503906, "global_step": 152612, "epoch": 3633} {"train_loss": -6.751036167144775, "global_step": 152613, "epoch": 3633} {"train_loss": -6.92825174331665, "global_step": 152614, "epoch": 3633} {"train_loss": -6.750793933868408, "global_step": 152615, "epoch": 3633} {"train_loss": -6.856926918029785, "global_step": 152616, "epoch": 3633} {"train_loss": -6.899718761444092, "global_step": 152617, "epoch": 3633} {"train_loss": -6.7377848625183105, "global_step": 152618, "epoch": 3633} {"train_loss": -6.827194690704346, "global_step": 152619, "epoch": 3633} {"train_loss": -6.787721633911133, "global_step": 152620, "epoch": 3633} {"train_loss": -6.936934471130371, "global_step": 152621, "epoch": 3633} {"train_loss": -6.76881217956543, "global_step": 152622, "epoch": 3633} {"train_loss": -6.834465026855469, "global_step": 152623, "epoch": 3633} {"train_loss": -6.851123809814453, "global_step": 152624, "epoch": 3633} {"train_loss": -6.899713516235352, "global_step": 152625, "epoch": 3633} {"train_loss": -6.858270645141602, "global_step": 152626, "epoch": 3633} {"train_loss": -6.801516078767323, "global_step": 152627, "epoch": 3633, "val_loss": 68401.546875} {"train_loss": -6.826025009155273, "global_step": 152628, "epoch": 3634} {"train_loss": -6.831682205200195, "global_step": 152629, "epoch": 3634} {"train_loss": -6.839984893798828, "global_step": 152630, "epoch": 3634} {"train_loss": -6.755805015563965, "global_step": 152631, "epoch": 3634} {"train_loss": -6.778565406799316, "global_step": 152632, "epoch": 3634} {"train_loss": -6.869828224182129, "global_step": 152633, "epoch": 3634} {"train_loss": -6.760831356048584, "global_step": 152634, "epoch": 3634} {"train_loss": -6.8640899658203125, "global_step": 152635, "epoch": 3634} {"train_loss": -6.882782936096191, "global_step": 152636, "epoch": 3634} {"train_loss": -6.884713172912598, "global_step": 152637, "epoch": 3634} {"train_loss": -6.874308109283447, "global_step": 152638, "epoch": 3634} {"train_loss": -6.85980224609375, "global_step": 152639, "epoch": 3634} {"train_loss": -6.883040428161621, "global_step": 152640, "epoch": 3634} {"train_loss": -6.865688323974609, "global_step": 152641, "epoch": 3634} {"train_loss": -6.823978424072266, "global_step": 152642, "epoch": 3634} {"train_loss": -6.84906530380249, "global_step": 152643, "epoch": 3634} {"train_loss": -6.892239093780518, "global_step": 152644, "epoch": 3634} {"train_loss": -6.893830299377441, "global_step": 152645, "epoch": 3634} {"train_loss": -6.798316955566406, "global_step": 152646, "epoch": 3634} {"train_loss": -6.754273414611816, "global_step": 152647, "epoch": 3634} {"train_loss": -6.858709812164307, "global_step": 152648, "epoch": 3634} {"train_loss": -6.906899929046631, "global_step": 152649, "epoch": 3634} {"train_loss": -6.9405927658081055, "global_step": 152650, "epoch": 3634} {"train_loss": -6.838960647583008, "global_step": 152651, "epoch": 3634} {"train_loss": -6.79819393157959, "global_step": 152652, "epoch": 3634} {"train_loss": -6.879243850708008, "global_step": 152653, "epoch": 3634} {"train_loss": -6.736184597015381, "global_step": 152654, "epoch": 3634} {"train_loss": -6.828853607177734, "global_step": 152655, "epoch": 3634} {"train_loss": -6.843421936035156, "global_step": 152656, "epoch": 3634} {"train_loss": -6.837738990783691, "global_step": 152657, "epoch": 3634} {"train_loss": -6.861262321472168, "global_step": 152658, "epoch": 3634} {"train_loss": -6.879998207092285, "global_step": 152659, "epoch": 3634} {"train_loss": -6.8575592041015625, "global_step": 152660, "epoch": 3634} {"train_loss": -6.885712623596191, "global_step": 152661, "epoch": 3634} {"train_loss": -6.866222381591797, "global_step": 152662, "epoch": 3634} {"train_loss": -6.835024356842041, "global_step": 152663, "epoch": 3634} {"train_loss": -6.895388126373291, "global_step": 152664, "epoch": 3634} {"train_loss": -6.767960548400879, "global_step": 152665, "epoch": 3634} {"train_loss": -6.854629993438721, "global_step": 152666, "epoch": 3634} {"train_loss": -6.989438533782959, "global_step": 152667, "epoch": 3634} {"train_loss": -6.82537317276001, "global_step": 152668, "epoch": 3634} {"train_loss": -6.8509017285846525, "global_step": 152669, "epoch": 3634, "val_loss": 68561.765625} {"train_loss": -6.833235740661621, "global_step": 152670, "epoch": 3635} {"train_loss": -6.852038383483887, "global_step": 152671, "epoch": 3635} {"train_loss": -6.990175247192383, "global_step": 152672, "epoch": 3635} {"train_loss": -6.9378509521484375, "global_step": 152673, "epoch": 3635} {"train_loss": -6.897927284240723, "global_step": 152674, "epoch": 3635} {"train_loss": -6.846102714538574, "global_step": 152675, "epoch": 3635} {"train_loss": -6.757562637329102, "global_step": 152676, "epoch": 3635} {"train_loss": -6.773822784423828, "global_step": 152677, "epoch": 3635} {"train_loss": -6.748224258422852, "global_step": 152678, "epoch": 3635} {"train_loss": -6.8968706130981445, "global_step": 152679, "epoch": 3635} {"train_loss": -6.679070472717285, "global_step": 152680, "epoch": 3635} {"train_loss": -6.880327224731445, "global_step": 152681, "epoch": 3635} {"train_loss": -6.886045932769775, "global_step": 152682, "epoch": 3635} {"train_loss": -6.951650142669678, "global_step": 152683, "epoch": 3635} {"train_loss": -6.865323066711426, "global_step": 152684, "epoch": 3635} {"train_loss": -6.792318344116211, "global_step": 152685, "epoch": 3635} {"train_loss": -6.845054626464844, "global_step": 152686, "epoch": 3635} {"train_loss": -6.8509345054626465, "global_step": 152687, "epoch": 3635} {"train_loss": -6.7408447265625, "global_step": 152688, "epoch": 3635} {"train_loss": -6.815859317779541, "global_step": 152689, "epoch": 3635} {"train_loss": -6.849039077758789, "global_step": 152690, "epoch": 3635} {"train_loss": -6.868648529052734, "global_step": 152691, "epoch": 3635} {"train_loss": -6.811440467834473, "global_step": 152692, "epoch": 3635} {"train_loss": -6.900500297546387, "global_step": 152693, "epoch": 3635} {"train_loss": -6.908601760864258, "global_step": 152694, "epoch": 3635} {"train_loss": -6.745718002319336, "global_step": 152695, "epoch": 3635} {"train_loss": -6.850868225097656, "global_step": 152696, "epoch": 3635} {"train_loss": -6.741449356079102, "global_step": 152697, "epoch": 3635} {"train_loss": -6.638152122497559, "global_step": 152698, "epoch": 3635} {"train_loss": -6.795971393585205, "global_step": 152699, "epoch": 3635} {"train_loss": -6.806702613830566, "global_step": 152700, "epoch": 3635} {"train_loss": -6.842959403991699, "global_step": 152701, "epoch": 3635} {"train_loss": -6.72206974029541, "global_step": 152702, "epoch": 3635} {"train_loss": -6.8415632247924805, "global_step": 152703, "epoch": 3635} {"train_loss": -6.864168643951416, "global_step": 152704, "epoch": 3635} {"train_loss": -6.777935028076172, "global_step": 152705, "epoch": 3635} {"train_loss": -6.862697601318359, "global_step": 152706, "epoch": 3635} {"train_loss": -6.916463375091553, "global_step": 152707, "epoch": 3635} {"train_loss": -6.873023986816406, "global_step": 152708, "epoch": 3635} {"train_loss": -6.901652812957764, "global_step": 152709, "epoch": 3635} {"train_loss": -6.915030002593994, "global_step": 152710, "epoch": 3635} {"train_loss": -6.834715559369042, "global_step": 152711, "epoch": 3635, "val_loss": 68541.140625} {"train_loss": -6.859360694885254, "global_step": 152712, "epoch": 3636} {"train_loss": -6.8396077156066895, "global_step": 152713, "epoch": 3636} {"train_loss": -6.848121643066406, "global_step": 152714, "epoch": 3636} {"train_loss": -6.921826362609863, "global_step": 152715, "epoch": 3636} {"train_loss": -6.831697940826416, "global_step": 152716, "epoch": 3636} {"train_loss": -6.79249382019043, "global_step": 152717, "epoch": 3636} {"train_loss": -6.823370933532715, "global_step": 152718, "epoch": 3636} {"train_loss": -6.84865140914917, "global_step": 152719, "epoch": 3636} {"train_loss": -6.864295959472656, "global_step": 152720, "epoch": 3636} {"train_loss": -6.890509128570557, "global_step": 152721, "epoch": 3636} {"train_loss": -6.979867935180664, "global_step": 152722, "epoch": 3636} {"train_loss": -6.894682884216309, "global_step": 152723, "epoch": 3636} {"train_loss": -6.89030122756958, "global_step": 152724, "epoch": 3636} {"train_loss": -6.768689155578613, "global_step": 152725, "epoch": 3636} {"train_loss": -6.918069839477539, "global_step": 152726, "epoch": 3636} {"train_loss": -6.767066955566406, "global_step": 152727, "epoch": 3636} {"train_loss": -6.88919734954834, "global_step": 152728, "epoch": 3636} {"train_loss": -6.99476432800293, "global_step": 152729, "epoch": 3636} {"train_loss": -6.891959190368652, "global_step": 152730, "epoch": 3636} {"train_loss": -6.8410563468933105, "global_step": 152731, "epoch": 3636} {"train_loss": -6.911712169647217, "global_step": 152732, "epoch": 3636} {"train_loss": -6.807642936706543, "global_step": 152733, "epoch": 3636} {"train_loss": -6.872251033782959, "global_step": 152734, "epoch": 3636} {"train_loss": -6.858034133911133, "global_step": 152735, "epoch": 3636} {"train_loss": -6.821163177490234, "global_step": 152736, "epoch": 3636} {"train_loss": -6.930302619934082, "global_step": 152737, "epoch": 3636} {"train_loss": -6.799309730529785, "global_step": 152738, "epoch": 3636} {"train_loss": -6.749937057495117, "global_step": 152739, "epoch": 3636} {"train_loss": -6.865104675292969, "global_step": 152740, "epoch": 3636} {"train_loss": -6.817985534667969, "global_step": 152741, "epoch": 3636} {"train_loss": -6.665932655334473, "global_step": 152742, "epoch": 3636} {"train_loss": -6.798826217651367, "global_step": 152743, "epoch": 3636} {"train_loss": -6.808544158935547, "global_step": 152744, "epoch": 3636} {"train_loss": -6.9178266525268555, "global_step": 152745, "epoch": 3636} {"train_loss": -6.727845668792725, "global_step": 152746, "epoch": 3636} {"train_loss": -6.720180511474609, "global_step": 152747, "epoch": 3636} {"train_loss": -6.837589740753174, "global_step": 152748, "epoch": 3636} {"train_loss": -6.853918075561523, "global_step": 152749, "epoch": 3636} {"train_loss": -6.820374011993408, "global_step": 152750, "epoch": 3636} {"train_loss": -6.910252571105957, "global_step": 152751, "epoch": 3636} {"train_loss": -6.78436803817749, "global_step": 152752, "epoch": 3636} {"train_loss": -6.842356318519229, "global_step": 152753, "epoch": 3636, "val_loss": 68540.6484375} {"train_loss": -6.736889839172363, "global_step": 152754, "epoch": 3637} {"train_loss": -6.699810028076172, "global_step": 152755, "epoch": 3637} {"train_loss": -6.743155002593994, "global_step": 152756, "epoch": 3637} {"train_loss": -6.726751327514648, "global_step": 152757, "epoch": 3637} {"train_loss": -6.799356460571289, "global_step": 152758, "epoch": 3637} {"train_loss": -6.889863014221191, "global_step": 152759, "epoch": 3637} {"train_loss": -6.812256813049316, "global_step": 152760, "epoch": 3637} {"train_loss": -6.884156227111816, "global_step": 152761, "epoch": 3637} {"train_loss": -6.790062427520752, "global_step": 152762, "epoch": 3637} {"train_loss": -6.8613810539245605, "global_step": 152763, "epoch": 3637} {"train_loss": -6.850750923156738, "global_step": 152764, "epoch": 3637} {"train_loss": -6.860266208648682, "global_step": 152765, "epoch": 3637} {"train_loss": -6.878278732299805, "global_step": 152766, "epoch": 3637} {"train_loss": -6.856925010681152, "global_step": 152767, "epoch": 3637} {"train_loss": -6.836616516113281, "global_step": 152768, "epoch": 3637} {"train_loss": -6.7924275398254395, "global_step": 152769, "epoch": 3637} {"train_loss": -6.843136787414551, "global_step": 152770, "epoch": 3637} {"train_loss": -6.837123870849609, "global_step": 152771, "epoch": 3637} {"train_loss": -6.751379013061523, "global_step": 152772, "epoch": 3637} {"train_loss": -6.7251667976379395, "global_step": 152773, "epoch": 3637} {"train_loss": -6.769415855407715, "global_step": 152774, "epoch": 3637} {"train_loss": -6.922104358673096, "global_step": 152775, "epoch": 3637} {"train_loss": -6.860200881958008, "global_step": 152776, "epoch": 3637} {"train_loss": -6.782415390014648, "global_step": 152777, "epoch": 3637} {"train_loss": -6.704233169555664, "global_step": 152778, "epoch": 3637} {"train_loss": -6.661591529846191, "global_step": 152779, "epoch": 3637} {"train_loss": -6.7695512771606445, "global_step": 152780, "epoch": 3637} {"train_loss": -6.759430885314941, "global_step": 152781, "epoch": 3637} {"train_loss": -6.609194755554199, "global_step": 152782, "epoch": 3637} {"train_loss": -6.864055156707764, "global_step": 152783, "epoch": 3637} {"train_loss": -6.668148517608643, "global_step": 152784, "epoch": 3637} {"train_loss": -6.724798202514648, "global_step": 152785, "epoch": 3637} {"train_loss": -6.810469627380371, "global_step": 152786, "epoch": 3637} {"train_loss": -6.618053913116455, "global_step": 152787, "epoch": 3637} {"train_loss": -6.780247688293457, "global_step": 152788, "epoch": 3637} {"train_loss": -6.619551658630371, "global_step": 152789, "epoch": 3637} {"train_loss": -6.8571624755859375, "global_step": 152790, "epoch": 3637} {"train_loss": -6.726888656616211, "global_step": 152791, "epoch": 3637} {"train_loss": -6.822873115539551, "global_step": 152792, "epoch": 3637} {"train_loss": -6.805326461791992, "global_step": 152793, "epoch": 3637} {"train_loss": -6.724831581115723, "global_step": 152794, "epoch": 3637} {"train_loss": -6.778439067658924, "global_step": 152795, "epoch": 3637, "val_loss": 68541.46875} {"train_loss": -6.767398357391357, "global_step": 152796, "epoch": 3638} {"train_loss": -6.890473365783691, "global_step": 152797, "epoch": 3638} {"train_loss": -6.689902305603027, "global_step": 152798, "epoch": 3638} {"train_loss": -6.918306827545166, "global_step": 152799, "epoch": 3638} {"train_loss": -6.82218599319458, "global_step": 152800, "epoch": 3638} {"train_loss": -6.846860885620117, "global_step": 152801, "epoch": 3638} {"train_loss": -6.835555076599121, "global_step": 152802, "epoch": 3638} {"train_loss": -6.835130214691162, "global_step": 152803, "epoch": 3638} {"train_loss": -6.807766914367676, "global_step": 152804, "epoch": 3638} {"train_loss": -6.72734260559082, "global_step": 152805, "epoch": 3638} {"train_loss": -6.857277870178223, "global_step": 152806, "epoch": 3638} {"train_loss": -6.782032012939453, "global_step": 152807, "epoch": 3638} {"train_loss": -6.907207012176514, "global_step": 152808, "epoch": 3638} {"train_loss": -6.86075496673584, "global_step": 152809, "epoch": 3638} {"train_loss": -6.852766990661621, "global_step": 152810, "epoch": 3638} {"train_loss": -6.82243537902832, "global_step": 152811, "epoch": 3638} {"train_loss": -6.866584300994873, "global_step": 152812, "epoch": 3638} {"train_loss": -6.851349830627441, "global_step": 152813, "epoch": 3638} {"train_loss": -6.891628742218018, "global_step": 152814, "epoch": 3638} {"train_loss": -6.85559606552124, "global_step": 152815, "epoch": 3638} {"train_loss": -6.835268020629883, "global_step": 152816, "epoch": 3638} {"train_loss": -6.736753463745117, "global_step": 152817, "epoch": 3638} {"train_loss": -6.79203462600708, "global_step": 152818, "epoch": 3638} {"train_loss": -6.869428634643555, "global_step": 152819, "epoch": 3638} {"train_loss": -6.80888557434082, "global_step": 152820, "epoch": 3638} {"train_loss": -6.9328460693359375, "global_step": 152821, "epoch": 3638} {"train_loss": -6.799445152282715, "global_step": 152822, "epoch": 3638} {"train_loss": -6.8944292068481445, "global_step": 152823, "epoch": 3638} {"train_loss": -7.002922058105469, "global_step": 152824, "epoch": 3638} {"train_loss": -6.898587226867676, "global_step": 152825, "epoch": 3638} {"train_loss": -6.947390556335449, "global_step": 152826, "epoch": 3638} {"train_loss": -6.875463485717773, "global_step": 152827, "epoch": 3638} {"train_loss": -6.85759162902832, "global_step": 152828, "epoch": 3638} {"train_loss": -6.903671741485596, "global_step": 152829, "epoch": 3638} {"train_loss": -6.908927917480469, "global_step": 152830, "epoch": 3638} {"train_loss": -6.825389862060547, "global_step": 152831, "epoch": 3638} {"train_loss": -6.803715705871582, "global_step": 152832, "epoch": 3638} {"train_loss": -7.01712703704834, "global_step": 152833, "epoch": 3638} {"train_loss": -6.869898796081543, "global_step": 152834, "epoch": 3638} {"train_loss": -6.948083400726318, "global_step": 152835, "epoch": 3638} {"train_loss": -6.926630973815918, "global_step": 152836, "epoch": 3638} {"train_loss": -6.8581759589059015, "global_step": 152837, "epoch": 3638, "val_loss": 68358.8125} {"train_loss": -6.858389854431152, "global_step": 152838, "epoch": 3639} {"train_loss": -6.899777889251709, "global_step": 152839, "epoch": 3639} {"train_loss": -6.954520225524902, "global_step": 152840, "epoch": 3639} {"train_loss": -6.882390975952148, "global_step": 152841, "epoch": 3639} {"train_loss": -6.929131507873535, "global_step": 152842, "epoch": 3639} {"train_loss": -7.010629177093506, "global_step": 152843, "epoch": 3639} {"train_loss": -6.901135444641113, "global_step": 152844, "epoch": 3639} {"train_loss": -6.844123840332031, "global_step": 152845, "epoch": 3639} {"train_loss": -6.866328239440918, "global_step": 152846, "epoch": 3639} {"train_loss": -6.88628625869751, "global_step": 152847, "epoch": 3639} {"train_loss": -6.866697311401367, "global_step": 152848, "epoch": 3639} {"train_loss": -6.874207973480225, "global_step": 152849, "epoch": 3639} {"train_loss": -6.858333587646484, "global_step": 152850, "epoch": 3639} {"train_loss": -6.947113513946533, "global_step": 152851, "epoch": 3639} {"train_loss": -6.875938415527344, "global_step": 152852, "epoch": 3639} {"train_loss": -6.898852348327637, "global_step": 152853, "epoch": 3639} {"train_loss": -6.850086688995361, "global_step": 152854, "epoch": 3639} {"train_loss": -6.906478404998779, "global_step": 152855, "epoch": 3639} {"train_loss": -6.791606903076172, "global_step": 152856, "epoch": 3639} {"train_loss": -6.682541847229004, "global_step": 152857, "epoch": 3639} {"train_loss": -6.8668365478515625, "global_step": 152858, "epoch": 3639} {"train_loss": -6.8381667137146, "global_step": 152859, "epoch": 3639} {"train_loss": -6.899643898010254, "global_step": 152860, "epoch": 3639} {"train_loss": -6.956199645996094, "global_step": 152861, "epoch": 3639} {"train_loss": -6.887242317199707, "global_step": 152862, "epoch": 3639} {"train_loss": -6.885119438171387, "global_step": 152863, "epoch": 3639} {"train_loss": -6.763646125793457, "global_step": 152864, "epoch": 3639} {"train_loss": -6.955929756164551, "global_step": 152865, "epoch": 3639} {"train_loss": -6.6823344230651855, "global_step": 152866, "epoch": 3639} {"train_loss": -6.694864273071289, "global_step": 152867, "epoch": 3639} {"train_loss": -6.869050025939941, "global_step": 152868, "epoch": 3639} {"train_loss": -6.880819797515869, "global_step": 152869, "epoch": 3639} {"train_loss": -6.724546432495117, "global_step": 152870, "epoch": 3639} {"train_loss": -6.8208136558532715, "global_step": 152871, "epoch": 3639} {"train_loss": -6.610649585723877, "global_step": 152872, "epoch": 3639} {"train_loss": -6.822858810424805, "global_step": 152873, "epoch": 3639} {"train_loss": -6.633089065551758, "global_step": 152874, "epoch": 3639} {"train_loss": -6.7925567626953125, "global_step": 152875, "epoch": 3639} {"train_loss": -6.744351863861084, "global_step": 152876, "epoch": 3639} {"train_loss": -6.7598185539245605, "global_step": 152877, "epoch": 3639} {"train_loss": -6.76435661315918, "global_step": 152878, "epoch": 3639} {"train_loss": -6.837296837852115, "global_step": 152879, "epoch": 3639, "val_loss": 68553.7265625} {"train_loss": -6.83081579208374, "global_step": 152880, "epoch": 3640} {"train_loss": -6.797970294952393, "global_step": 152881, "epoch": 3640} {"train_loss": -6.865204811096191, "global_step": 152882, "epoch": 3640} {"train_loss": -6.874520301818848, "global_step": 152883, "epoch": 3640} {"train_loss": -6.902616500854492, "global_step": 152884, "epoch": 3640} {"train_loss": -6.803674697875977, "global_step": 152885, "epoch": 3640} {"train_loss": -6.800801753997803, "global_step": 152886, "epoch": 3640} {"train_loss": -6.838245391845703, "global_step": 152887, "epoch": 3640} {"train_loss": -6.781212329864502, "global_step": 152888, "epoch": 3640} {"train_loss": -6.833347320556641, "global_step": 152889, "epoch": 3640} {"train_loss": -6.726020812988281, "global_step": 152890, "epoch": 3640} {"train_loss": -6.889194488525391, "global_step": 152891, "epoch": 3640} {"train_loss": -6.852053165435791, "global_step": 152892, "epoch": 3640} {"train_loss": -6.820346355438232, "global_step": 152893, "epoch": 3640} {"train_loss": -6.837121963500977, "global_step": 152894, "epoch": 3640} {"train_loss": -6.924794673919678, "global_step": 152895, "epoch": 3640} {"train_loss": -6.9250617027282715, "global_step": 152896, "epoch": 3640} {"train_loss": -6.899330139160156, "global_step": 152897, "epoch": 3640} {"train_loss": -6.854592323303223, "global_step": 152898, "epoch": 3640} {"train_loss": -6.823229789733887, "global_step": 152899, "epoch": 3640} {"train_loss": -6.904222011566162, "global_step": 152900, "epoch": 3640} {"train_loss": -6.837243556976318, "global_step": 152901, "epoch": 3640} {"train_loss": -6.79969596862793, "global_step": 152902, "epoch": 3640} {"train_loss": -6.7984819412231445, "global_step": 152903, "epoch": 3640} {"train_loss": -6.7507123947143555, "global_step": 152904, "epoch": 3640} {"train_loss": -6.71539831161499, "global_step": 152905, "epoch": 3640} {"train_loss": -6.820874214172363, "global_step": 152906, "epoch": 3640} {"train_loss": -6.797407150268555, "global_step": 152907, "epoch": 3640} {"train_loss": -6.795764446258545, "global_step": 152908, "epoch": 3640} {"train_loss": -6.715898513793945, "global_step": 152909, "epoch": 3640} {"train_loss": -6.828838348388672, "global_step": 152910, "epoch": 3640} {"train_loss": -6.756927490234375, "global_step": 152911, "epoch": 3640} {"train_loss": -6.806792736053467, "global_step": 152912, "epoch": 3640} {"train_loss": -6.826520919799805, "global_step": 152913, "epoch": 3640} {"train_loss": -6.788851737976074, "global_step": 152914, "epoch": 3640} {"train_loss": -6.8331074714660645, "global_step": 152915, "epoch": 3640} {"train_loss": -6.884974479675293, "global_step": 152916, "epoch": 3640} {"train_loss": -6.733548164367676, "global_step": 152917, "epoch": 3640} {"train_loss": -6.714590549468994, "global_step": 152918, "epoch": 3640} {"train_loss": -6.818523406982422, "global_step": 152919, "epoch": 3640} {"train_loss": -6.851655006408691, "global_step": 152920, "epoch": 3640} {"train_loss": -6.821232545943487, "global_step": 152921, "epoch": 3640, "val_loss": 68424.5390625} {"train_loss": -6.830809593200684, "global_step": 152922, "epoch": 3641} {"train_loss": -6.778800964355469, "global_step": 152923, "epoch": 3641} {"train_loss": -6.828848838806152, "global_step": 152924, "epoch": 3641} {"train_loss": -6.79658317565918, "global_step": 152925, "epoch": 3641} {"train_loss": -6.820018768310547, "global_step": 152926, "epoch": 3641} {"train_loss": -6.793787956237793, "global_step": 152927, "epoch": 3641} {"train_loss": -6.664037227630615, "global_step": 152928, "epoch": 3641} {"train_loss": -6.793234348297119, "global_step": 152929, "epoch": 3641} {"train_loss": -6.8370866775512695, "global_step": 152930, "epoch": 3641} {"train_loss": -6.865688323974609, "global_step": 152931, "epoch": 3641} {"train_loss": -6.812417984008789, "global_step": 152932, "epoch": 3641} {"train_loss": -6.793025016784668, "global_step": 152933, "epoch": 3641} {"train_loss": -6.958701133728027, "global_step": 152934, "epoch": 3641} {"train_loss": -6.820868968963623, "global_step": 152935, "epoch": 3641} {"train_loss": -6.861721992492676, "global_step": 152936, "epoch": 3641} {"train_loss": -6.7260236740112305, "global_step": 152937, "epoch": 3641} {"train_loss": -6.831247329711914, "global_step": 152938, "epoch": 3641} {"train_loss": -6.900095462799072, "global_step": 152939, "epoch": 3641} {"train_loss": -6.84190559387207, "global_step": 152940, "epoch": 3641} {"train_loss": -6.814125061035156, "global_step": 152941, "epoch": 3641} {"train_loss": -6.822861671447754, "global_step": 152942, "epoch": 3641} {"train_loss": -6.8000593185424805, "global_step": 152943, "epoch": 3641} {"train_loss": -6.739555358886719, "global_step": 152944, "epoch": 3641} {"train_loss": -6.718756675720215, "global_step": 152945, "epoch": 3641} {"train_loss": -6.814729690551758, "global_step": 152946, "epoch": 3641} {"train_loss": -6.813203811645508, "global_step": 152947, "epoch": 3641} {"train_loss": -6.789464950561523, "global_step": 152948, "epoch": 3641} {"train_loss": -6.932826995849609, "global_step": 152949, "epoch": 3641} {"train_loss": -6.8372650146484375, "global_step": 152950, "epoch": 3641} {"train_loss": -7.020817279815674, "global_step": 152951, "epoch": 3641} {"train_loss": -6.814420700073242, "global_step": 152952, "epoch": 3641} {"train_loss": -6.785965919494629, "global_step": 152953, "epoch": 3641} {"train_loss": -6.934401512145996, "global_step": 152954, "epoch": 3641} {"train_loss": -6.830786228179932, "global_step": 152955, "epoch": 3641} {"train_loss": -6.849740505218506, "global_step": 152956, "epoch": 3641} {"train_loss": -6.854434013366699, "global_step": 152957, "epoch": 3641} {"train_loss": -6.89943790435791, "global_step": 152958, "epoch": 3641} {"train_loss": -6.886709213256836, "global_step": 152959, "epoch": 3641} {"train_loss": -6.976907253265381, "global_step": 152960, "epoch": 3641} {"train_loss": -6.825394630432129, "global_step": 152961, "epoch": 3641} {"train_loss": -6.888233184814453, "global_step": 152962, "epoch": 3641} {"train_loss": -6.835472833542597, "global_step": 152963, "epoch": 3641, "val_loss": 68462.2734375} {"train_loss": -6.981375694274902, "global_step": 152964, "epoch": 3642} {"train_loss": -6.856678009033203, "global_step": 152965, "epoch": 3642} {"train_loss": -6.884740352630615, "global_step": 152966, "epoch": 3642} {"train_loss": -6.881706237792969, "global_step": 152967, "epoch": 3642} {"train_loss": -6.880285263061523, "global_step": 152968, "epoch": 3642} {"train_loss": -6.910452842712402, "global_step": 152969, "epoch": 3642} {"train_loss": -6.943517684936523, "global_step": 152970, "epoch": 3642} {"train_loss": -6.890542984008789, "global_step": 152971, "epoch": 3642} {"train_loss": -6.923834323883057, "global_step": 152972, "epoch": 3642} {"train_loss": -6.918497085571289, "global_step": 152973, "epoch": 3642} {"train_loss": -6.940359115600586, "global_step": 152974, "epoch": 3642} {"train_loss": -6.9186930656433105, "global_step": 152975, "epoch": 3642} {"train_loss": -6.928740501403809, "global_step": 152976, "epoch": 3642} {"train_loss": -6.910440921783447, "global_step": 152977, "epoch": 3642} {"train_loss": -6.84324836730957, "global_step": 152978, "epoch": 3642} {"train_loss": -6.917812347412109, "global_step": 152979, "epoch": 3642} {"train_loss": -6.821374893188477, "global_step": 152980, "epoch": 3642} {"train_loss": -6.885189056396484, "global_step": 152981, "epoch": 3642} {"train_loss": -6.8526201248168945, "global_step": 152982, "epoch": 3642} {"train_loss": -6.928688049316406, "global_step": 152983, "epoch": 3642} {"train_loss": -6.853494644165039, "global_step": 152984, "epoch": 3642} {"train_loss": -6.910676956176758, "global_step": 152985, "epoch": 3642} {"train_loss": -6.924948692321777, "global_step": 152986, "epoch": 3642} {"train_loss": -6.786369323730469, "global_step": 152987, "epoch": 3642} {"train_loss": -7.007081031799316, "global_step": 152988, "epoch": 3642} {"train_loss": -6.864214897155762, "global_step": 152989, "epoch": 3642} {"train_loss": -6.897457122802734, "global_step": 152990, "epoch": 3642} {"train_loss": -6.859940052032471, "global_step": 152991, "epoch": 3642} {"train_loss": -6.7951459884643555, "global_step": 152992, "epoch": 3642} {"train_loss": -6.795198917388916, "global_step": 152993, "epoch": 3642} {"train_loss": -6.9443254470825195, "global_step": 152994, "epoch": 3642} {"train_loss": -6.904857635498047, "global_step": 152995, "epoch": 3642} {"train_loss": -6.838702201843262, "global_step": 152996, "epoch": 3642} {"train_loss": -6.8458967208862305, "global_step": 152997, "epoch": 3642} {"train_loss": -6.810939788818359, "global_step": 152998, "epoch": 3642} {"train_loss": -6.821516036987305, "global_step": 152999, "epoch": 3642} {"train_loss": -6.8828558921813965, "global_step": 153000, "epoch": 3642} {"train_loss": -6.889016151428223, "global_step": 153001, "epoch": 3642} {"train_loss": -6.776191234588623, "global_step": 153002, "epoch": 3642} {"train_loss": -6.798773765563965, "global_step": 153003, "epoch": 3642} {"train_loss": -6.788106918334961, "global_step": 153004, "epoch": 3642} {"train_loss": -6.875503233500889, "global_step": 153005, "epoch": 3642, "val_loss": 68742.4921875} {"train_loss": -6.769534111022949, "global_step": 153006, "epoch": 3643} {"train_loss": -6.816362380981445, "global_step": 153007, "epoch": 3643} {"train_loss": -6.7767252922058105, "global_step": 153008, "epoch": 3643} {"train_loss": -6.810319423675537, "global_step": 153009, "epoch": 3643} {"train_loss": -6.771686553955078, "global_step": 153010, "epoch": 3643} {"train_loss": -6.789889335632324, "global_step": 153011, "epoch": 3643} {"train_loss": -6.833464622497559, "global_step": 153012, "epoch": 3643} {"train_loss": -6.819155693054199, "global_step": 153013, "epoch": 3643} {"train_loss": -6.845792770385742, "global_step": 153014, "epoch": 3643} {"train_loss": -6.880506992340088, "global_step": 153015, "epoch": 3643} {"train_loss": -6.822991847991943, "global_step": 153016, "epoch": 3643} {"train_loss": -6.83721923828125, "global_step": 153017, "epoch": 3643} {"train_loss": -6.7666239738464355, "global_step": 153018, "epoch": 3643} {"train_loss": -6.8696722984313965, "global_step": 153019, "epoch": 3643} {"train_loss": -6.760732650756836, "global_step": 153020, "epoch": 3643} {"train_loss": -6.791888236999512, "global_step": 153021, "epoch": 3643} {"train_loss": -6.910605430603027, "global_step": 153022, "epoch": 3643} {"train_loss": -6.773427486419678, "global_step": 153023, "epoch": 3643} {"train_loss": -6.9386396408081055, "global_step": 153024, "epoch": 3643} {"train_loss": -6.861990928649902, "global_step": 153025, "epoch": 3643} {"train_loss": -6.834632873535156, "global_step": 153026, "epoch": 3643} {"train_loss": -6.823976993560791, "global_step": 153027, "epoch": 3643} {"train_loss": -6.802076816558838, "global_step": 153028, "epoch": 3643} {"train_loss": -6.909085273742676, "global_step": 153029, "epoch": 3643} {"train_loss": -6.822715759277344, "global_step": 153030, "epoch": 3643} {"train_loss": -6.832955360412598, "global_step": 153031, "epoch": 3643} {"train_loss": -6.846658706665039, "global_step": 153032, "epoch": 3643} {"train_loss": -6.897019386291504, "global_step": 153033, "epoch": 3643} {"train_loss": -6.898681640625, "global_step": 153034, "epoch": 3643} {"train_loss": -6.825638771057129, "global_step": 153035, "epoch": 3643} {"train_loss": -6.89209508895874, "global_step": 153036, "epoch": 3643} {"train_loss": -6.836897850036621, "global_step": 153037, "epoch": 3643} {"train_loss": -6.788141250610352, "global_step": 153038, "epoch": 3643} {"train_loss": -6.767427444458008, "global_step": 153039, "epoch": 3643} {"train_loss": -6.871786117553711, "global_step": 153040, "epoch": 3643} {"train_loss": -6.879602432250977, "global_step": 153041, "epoch": 3643} {"train_loss": -6.762225151062012, "global_step": 153042, "epoch": 3643} {"train_loss": -6.749944686889648, "global_step": 153043, "epoch": 3643} {"train_loss": -6.929007530212402, "global_step": 153044, "epoch": 3643} {"train_loss": -6.849103927612305, "global_step": 153045, "epoch": 3643} {"train_loss": -6.7519731521606445, "global_step": 153046, "epoch": 3643} {"train_loss": -6.83158818880717, "global_step": 153047, "epoch": 3643, "val_loss": 68533.6953125} {"train_loss": -6.815177917480469, "global_step": 153048, "epoch": 3644} {"train_loss": -6.859381198883057, "global_step": 153049, "epoch": 3644} {"train_loss": -6.949309349060059, "global_step": 153050, "epoch": 3644} {"train_loss": -6.831089019775391, "global_step": 153051, "epoch": 3644} {"train_loss": -6.942143440246582, "global_step": 153052, "epoch": 3644} {"train_loss": -6.798175811767578, "global_step": 153053, "epoch": 3644} {"train_loss": -6.909398555755615, "global_step": 153054, "epoch": 3644} {"train_loss": -6.903637886047363, "global_step": 153055, "epoch": 3644} {"train_loss": -7.004502296447754, "global_step": 153056, "epoch": 3644} {"train_loss": -6.841153144836426, "global_step": 153057, "epoch": 3644} {"train_loss": -6.785191059112549, "global_step": 153058, "epoch": 3644} {"train_loss": -6.851855278015137, "global_step": 153059, "epoch": 3644} {"train_loss": -6.830411911010742, "global_step": 153060, "epoch": 3644} {"train_loss": -6.919063091278076, "global_step": 153061, "epoch": 3644} {"train_loss": -6.784104824066162, "global_step": 153062, "epoch": 3644} {"train_loss": -6.833014965057373, "global_step": 153063, "epoch": 3644} {"train_loss": -6.805423259735107, "global_step": 153064, "epoch": 3644} {"train_loss": -6.806506633758545, "global_step": 153065, "epoch": 3644} {"train_loss": -6.897413730621338, "global_step": 153066, "epoch": 3644} {"train_loss": -6.841625690460205, "global_step": 153067, "epoch": 3644} {"train_loss": -6.912341117858887, "global_step": 153068, "epoch": 3644} {"train_loss": -6.817193031311035, "global_step": 153069, "epoch": 3644} {"train_loss": -6.881817817687988, "global_step": 153070, "epoch": 3644} {"train_loss": -6.799187660217285, "global_step": 153071, "epoch": 3644} {"train_loss": -6.817819595336914, "global_step": 153072, "epoch": 3644} {"train_loss": -6.908324241638184, "global_step": 153073, "epoch": 3644} {"train_loss": -6.832979202270508, "global_step": 153074, "epoch": 3644} {"train_loss": -6.919358253479004, "global_step": 153075, "epoch": 3644} {"train_loss": -6.794778823852539, "global_step": 153076, "epoch": 3644} {"train_loss": -6.8286333084106445, "global_step": 153077, "epoch": 3644} {"train_loss": -6.8703765869140625, "global_step": 153078, "epoch": 3644} {"train_loss": -6.789236068725586, "global_step": 153079, "epoch": 3644} {"train_loss": -6.812206745147705, "global_step": 153080, "epoch": 3644} {"train_loss": -6.8123674392700195, "global_step": 153081, "epoch": 3644} {"train_loss": -6.91400671005249, "global_step": 153082, "epoch": 3644} {"train_loss": -6.83257532119751, "global_step": 153083, "epoch": 3644} {"train_loss": -6.624871253967285, "global_step": 153084, "epoch": 3644} {"train_loss": -6.812690734863281, "global_step": 153085, "epoch": 3644} {"train_loss": -6.809591293334961, "global_step": 153086, "epoch": 3644} {"train_loss": -6.674258708953857, "global_step": 153087, "epoch": 3644} {"train_loss": -6.711791038513184, "global_step": 153088, "epoch": 3644} {"train_loss": -6.837427184695289, "global_step": 153089, "epoch": 3644, "val_loss": 68537.5625} {"train_loss": -6.688775062561035, "global_step": 153090, "epoch": 3645} {"train_loss": -6.792126655578613, "global_step": 153091, "epoch": 3645} {"train_loss": -6.854500770568848, "global_step": 153092, "epoch": 3645} {"train_loss": -6.744919776916504, "global_step": 153093, "epoch": 3645} {"train_loss": -6.7381086349487305, "global_step": 153094, "epoch": 3645} {"train_loss": -6.783951759338379, "global_step": 153095, "epoch": 3645} {"train_loss": -6.717607498168945, "global_step": 153096, "epoch": 3645} {"train_loss": -6.8226752281188965, "global_step": 153097, "epoch": 3645} {"train_loss": -6.844081878662109, "global_step": 153098, "epoch": 3645} {"train_loss": -6.755970001220703, "global_step": 153099, "epoch": 3645} {"train_loss": -6.7934184074401855, "global_step": 153100, "epoch": 3645} {"train_loss": -6.812150955200195, "global_step": 153101, "epoch": 3645} {"train_loss": -6.8575849533081055, "global_step": 153102, "epoch": 3645} {"train_loss": -6.864941120147705, "global_step": 153103, "epoch": 3645} {"train_loss": -6.879794120788574, "global_step": 153104, "epoch": 3645} {"train_loss": -6.766001224517822, "global_step": 153105, "epoch": 3645} {"train_loss": -6.903090476989746, "global_step": 153106, "epoch": 3645} {"train_loss": -6.905147552490234, "global_step": 153107, "epoch": 3645} {"train_loss": -6.873111724853516, "global_step": 153108, "epoch": 3645} {"train_loss": -6.773227691650391, "global_step": 153109, "epoch": 3645} {"train_loss": -6.8404412269592285, "global_step": 153110, "epoch": 3645} {"train_loss": -6.8793134689331055, "global_step": 153111, "epoch": 3645} {"train_loss": -6.964868545532227, "global_step": 153112, "epoch": 3645} {"train_loss": -6.831709861755371, "global_step": 153113, "epoch": 3645} {"train_loss": -6.874644756317139, "global_step": 153114, "epoch": 3645} {"train_loss": -6.9097394943237305, "global_step": 153115, "epoch": 3645} {"train_loss": -6.897238254547119, "global_step": 153116, "epoch": 3645} {"train_loss": -6.8551411628723145, "global_step": 153117, "epoch": 3645} {"train_loss": -6.957176208496094, "global_step": 153118, "epoch": 3645} {"train_loss": -6.9736528396606445, "global_step": 153119, "epoch": 3645} {"train_loss": -6.847572326660156, "global_step": 153120, "epoch": 3645} {"train_loss": -6.901617527008057, "global_step": 153121, "epoch": 3645} {"train_loss": -6.896146297454834, "global_step": 153122, "epoch": 3645} {"train_loss": -6.831036567687988, "global_step": 153123, "epoch": 3645} {"train_loss": -6.817378997802734, "global_step": 153124, "epoch": 3645} {"train_loss": -6.859040260314941, "global_step": 153125, "epoch": 3645} {"train_loss": -6.943978786468506, "global_step": 153126, "epoch": 3645} {"train_loss": -6.891643524169922, "global_step": 153127, "epoch": 3645} {"train_loss": -6.83065128326416, "global_step": 153128, "epoch": 3645} {"train_loss": -6.7057390213012695, "global_step": 153129, "epoch": 3645} {"train_loss": -6.733005523681641, "global_step": 153130, "epoch": 3645} {"train_loss": -6.839665174484253, "global_step": 153131, "epoch": 3645, "val_loss": 68500.6015625} {"train_loss": -6.804033279418945, "global_step": 153132, "epoch": 3646} {"train_loss": -6.892979621887207, "global_step": 153133, "epoch": 3646} {"train_loss": -6.685210227966309, "global_step": 153134, "epoch": 3646} {"train_loss": -6.945815086364746, "global_step": 153135, "epoch": 3646} {"train_loss": -6.718282699584961, "global_step": 153136, "epoch": 3646} {"train_loss": -6.680575847625732, "global_step": 153137, "epoch": 3646} {"train_loss": -6.7437896728515625, "global_step": 153138, "epoch": 3646} {"train_loss": -6.693577766418457, "global_step": 153139, "epoch": 3646} {"train_loss": -6.801694869995117, "global_step": 153140, "epoch": 3646} {"train_loss": -6.559507369995117, "global_step": 153141, "epoch": 3646} {"train_loss": -6.7399678230285645, "global_step": 153142, "epoch": 3646} {"train_loss": -6.573694705963135, "global_step": 153143, "epoch": 3646} {"train_loss": -6.684412956237793, "global_step": 153144, "epoch": 3646} {"train_loss": -6.752785682678223, "global_step": 153145, "epoch": 3646} {"train_loss": -6.7831950187683105, "global_step": 153146, "epoch": 3646} {"train_loss": -6.771001815795898, "global_step": 153147, "epoch": 3646} {"train_loss": -6.672816276550293, "global_step": 153148, "epoch": 3646} {"train_loss": -6.753042221069336, "global_step": 153149, "epoch": 3646} {"train_loss": -6.829159736633301, "global_step": 153150, "epoch": 3646} {"train_loss": -6.849851131439209, "global_step": 153151, "epoch": 3646} {"train_loss": -6.833278656005859, "global_step": 153152, "epoch": 3646} {"train_loss": -6.735639572143555, "global_step": 153153, "epoch": 3646} {"train_loss": -6.814341068267822, "global_step": 153154, "epoch": 3646} {"train_loss": -6.882329940795898, "global_step": 153155, "epoch": 3646} {"train_loss": -6.703052043914795, "global_step": 153156, "epoch": 3646} {"train_loss": -6.817138671875, "global_step": 153157, "epoch": 3646} {"train_loss": -6.739248275756836, "global_step": 153158, "epoch": 3646} {"train_loss": -6.8173017501831055, "global_step": 153159, "epoch": 3646} {"train_loss": -6.852260112762451, "global_step": 153160, "epoch": 3646} {"train_loss": -6.6749162673950195, "global_step": 153161, "epoch": 3646} {"train_loss": -6.749429702758789, "global_step": 153162, "epoch": 3646} {"train_loss": -6.741302490234375, "global_step": 153163, "epoch": 3646} {"train_loss": -6.768524646759033, "global_step": 153164, "epoch": 3646} {"train_loss": -6.810178279876709, "global_step": 153165, "epoch": 3646} {"train_loss": -6.8159894943237305, "global_step": 153166, "epoch": 3646} {"train_loss": -6.764464378356934, "global_step": 153167, "epoch": 3646} {"train_loss": -6.846651554107666, "global_step": 153168, "epoch": 3646} {"train_loss": -6.693737506866455, "global_step": 153169, "epoch": 3646} {"train_loss": -6.79987096786499, "global_step": 153170, "epoch": 3646} {"train_loss": -6.844174385070801, "global_step": 153171, "epoch": 3646} {"train_loss": -6.689647197723389, "global_step": 153172, "epoch": 3646} {"train_loss": -6.764052436465309, "global_step": 153173, "epoch": 3646, "val_loss": 68420.234375} {"train_loss": -6.675987243652344, "global_step": 153174, "epoch": 3647} {"train_loss": -6.851596355438232, "global_step": 153175, "epoch": 3647} {"train_loss": -6.78377628326416, "global_step": 153176, "epoch": 3647} {"train_loss": -6.82559061050415, "global_step": 153177, "epoch": 3647} {"train_loss": -6.89674186706543, "global_step": 153178, "epoch": 3647} {"train_loss": -6.6696014404296875, "global_step": 153179, "epoch": 3647} {"train_loss": -6.9664998054504395, "global_step": 153180, "epoch": 3647} {"train_loss": -6.795777797698975, "global_step": 153181, "epoch": 3647} {"train_loss": -6.720969200134277, "global_step": 153182, "epoch": 3647} {"train_loss": -6.877225875854492, "global_step": 153183, "epoch": 3647} {"train_loss": -6.841927528381348, "global_step": 153184, "epoch": 3647} {"train_loss": -6.857624053955078, "global_step": 153185, "epoch": 3647} {"train_loss": -6.767292022705078, "global_step": 153186, "epoch": 3647} {"train_loss": -6.777963638305664, "global_step": 153187, "epoch": 3647} {"train_loss": -6.846763610839844, "global_step": 153188, "epoch": 3647} {"train_loss": -6.795845031738281, "global_step": 153189, "epoch": 3647} {"train_loss": -6.905069351196289, "global_step": 153190, "epoch": 3647} {"train_loss": -6.77946662902832, "global_step": 153191, "epoch": 3647} {"train_loss": -6.772683143615723, "global_step": 153192, "epoch": 3647} {"train_loss": -6.779884338378906, "global_step": 153193, "epoch": 3647} {"train_loss": -6.8502912521362305, "global_step": 153194, "epoch": 3647} {"train_loss": -6.8395256996154785, "global_step": 153195, "epoch": 3647} {"train_loss": -6.694366931915283, "global_step": 153196, "epoch": 3647} {"train_loss": -6.847373008728027, "global_step": 153197, "epoch": 3647} {"train_loss": -6.749561309814453, "global_step": 153198, "epoch": 3647} {"train_loss": -6.752741813659668, "global_step": 153199, "epoch": 3647} {"train_loss": -6.8993024826049805, "global_step": 153200, "epoch": 3647} {"train_loss": -6.745193958282471, "global_step": 153201, "epoch": 3647} {"train_loss": -6.875423431396484, "global_step": 153202, "epoch": 3647} {"train_loss": -6.733610153198242, "global_step": 153203, "epoch": 3647} {"train_loss": -6.774003028869629, "global_step": 153204, "epoch": 3647} {"train_loss": -6.904273986816406, "global_step": 153205, "epoch": 3647} {"train_loss": -6.91262149810791, "global_step": 153206, "epoch": 3647} {"train_loss": -6.72312068939209, "global_step": 153207, "epoch": 3647} {"train_loss": -6.790077209472656, "global_step": 153208, "epoch": 3647} {"train_loss": -6.885190963745117, "global_step": 153209, "epoch": 3647} {"train_loss": -6.849300384521484, "global_step": 153210, "epoch": 3647} {"train_loss": -6.812230110168457, "global_step": 153211, "epoch": 3647} {"train_loss": -6.7519941329956055, "global_step": 153212, "epoch": 3647} {"train_loss": -6.827157497406006, "global_step": 153213, "epoch": 3647} {"train_loss": -6.786088466644287, "global_step": 153214, "epoch": 3647} {"train_loss": -6.810905638195219, "global_step": 153215, "epoch": 3647, "val_loss": 68576.3359375} {"train_loss": -6.834780693054199, "global_step": 153216, "epoch": 3648} {"train_loss": -6.713667392730713, "global_step": 153217, "epoch": 3648} {"train_loss": -6.881804466247559, "global_step": 153218, "epoch": 3648} {"train_loss": -6.907784461975098, "global_step": 153219, "epoch": 3648} {"train_loss": -6.85677433013916, "global_step": 153220, "epoch": 3648} {"train_loss": -6.833442687988281, "global_step": 153221, "epoch": 3648} {"train_loss": -6.897751808166504, "global_step": 153222, "epoch": 3648} {"train_loss": -6.899135589599609, "global_step": 153223, "epoch": 3648} {"train_loss": -6.80629825592041, "global_step": 153224, "epoch": 3648} {"train_loss": -6.891505241394043, "global_step": 153225, "epoch": 3648} {"train_loss": -6.719727516174316, "global_step": 153226, "epoch": 3648} {"train_loss": -6.802769184112549, "global_step": 153227, "epoch": 3648} {"train_loss": -6.890795707702637, "global_step": 153228, "epoch": 3648} {"train_loss": -6.862980842590332, "global_step": 153229, "epoch": 3648} {"train_loss": -6.9420952796936035, "global_step": 153230, "epoch": 3648} {"train_loss": -6.8907318115234375, "global_step": 153231, "epoch": 3648} {"train_loss": -6.808540344238281, "global_step": 153232, "epoch": 3648} {"train_loss": -6.877314567565918, "global_step": 153233, "epoch": 3648} {"train_loss": -6.929993152618408, "global_step": 153234, "epoch": 3648} {"train_loss": -6.844470977783203, "global_step": 153235, "epoch": 3648} {"train_loss": -6.9123311042785645, "global_step": 153236, "epoch": 3648} {"train_loss": -6.827473163604736, "global_step": 153237, "epoch": 3648} {"train_loss": -6.891020774841309, "global_step": 153238, "epoch": 3648} {"train_loss": -6.903406143188477, "global_step": 153239, "epoch": 3648} {"train_loss": -6.882192611694336, "global_step": 153240, "epoch": 3648} {"train_loss": -6.881290435791016, "global_step": 153241, "epoch": 3648} {"train_loss": -6.990443229675293, "global_step": 153242, "epoch": 3648} {"train_loss": -6.7969970703125, "global_step": 153243, "epoch": 3648} {"train_loss": -6.853788375854492, "global_step": 153244, "epoch": 3648} {"train_loss": -6.883214950561523, "global_step": 153245, "epoch": 3648} {"train_loss": -6.808548450469971, "global_step": 153246, "epoch": 3648} {"train_loss": -6.883502006530762, "global_step": 153247, "epoch": 3648} {"train_loss": -6.809638977050781, "global_step": 153248, "epoch": 3648} {"train_loss": -6.882867336273193, "global_step": 153249, "epoch": 3648} {"train_loss": -6.863274574279785, "global_step": 153250, "epoch": 3648} {"train_loss": -6.909675121307373, "global_step": 153251, "epoch": 3648} {"train_loss": -6.855240821838379, "global_step": 153252, "epoch": 3648} {"train_loss": -6.839946269989014, "global_step": 153253, "epoch": 3648} {"train_loss": -6.901508331298828, "global_step": 153254, "epoch": 3648} {"train_loss": -6.835499286651611, "global_step": 153255, "epoch": 3648} {"train_loss": -6.820948600769043, "global_step": 153256, "epoch": 3648} {"train_loss": -6.862098148890904, "global_step": 153257, "epoch": 3648, "val_loss": 68419.125} {"train_loss": -6.879986763000488, "global_step": 153258, "epoch": 3649} {"train_loss": -6.974891185760498, "global_step": 153259, "epoch": 3649} {"train_loss": -6.825407981872559, "global_step": 153260, "epoch": 3649} {"train_loss": -7.031089782714844, "global_step": 153261, "epoch": 3649} {"train_loss": -6.873232841491699, "global_step": 153262, "epoch": 3649} {"train_loss": -6.954024791717529, "global_step": 153263, "epoch": 3649} {"train_loss": -6.785056114196777, "global_step": 153264, "epoch": 3649} {"train_loss": -6.833485126495361, "global_step": 153265, "epoch": 3649} {"train_loss": -6.9347381591796875, "global_step": 153266, "epoch": 3649} {"train_loss": -6.8335771560668945, "global_step": 153267, "epoch": 3649} {"train_loss": -6.948718547821045, "global_step": 153268, "epoch": 3649} {"train_loss": -6.869622230529785, "global_step": 153269, "epoch": 3649} {"train_loss": -6.91278076171875, "global_step": 153270, "epoch": 3649} {"train_loss": -6.7684502601623535, "global_step": 153271, "epoch": 3649} {"train_loss": -6.785375118255615, "global_step": 153272, "epoch": 3649} {"train_loss": -6.876494884490967, "global_step": 153273, "epoch": 3649} {"train_loss": -6.729543685913086, "global_step": 153274, "epoch": 3649} {"train_loss": -6.779831886291504, "global_step": 153275, "epoch": 3649} {"train_loss": -6.8587188720703125, "global_step": 153276, "epoch": 3649} {"train_loss": -6.756566047668457, "global_step": 153277, "epoch": 3649} {"train_loss": -6.820369720458984, "global_step": 153278, "epoch": 3649} {"train_loss": -6.755770683288574, "global_step": 153279, "epoch": 3649} {"train_loss": -6.7626566886901855, "global_step": 153280, "epoch": 3649} {"train_loss": -6.86788272857666, "global_step": 153281, "epoch": 3649} {"train_loss": -6.869182586669922, "global_step": 153282, "epoch": 3649} {"train_loss": -6.749256610870361, "global_step": 153283, "epoch": 3649} {"train_loss": -6.77070426940918, "global_step": 153284, "epoch": 3649} {"train_loss": -6.841133117675781, "global_step": 153285, "epoch": 3649} {"train_loss": -6.711671829223633, "global_step": 153286, "epoch": 3649} {"train_loss": -6.793881893157959, "global_step": 153287, "epoch": 3649} {"train_loss": -6.755810737609863, "global_step": 153288, "epoch": 3649} {"train_loss": -6.836400985717773, "global_step": 153289, "epoch": 3649} {"train_loss": -6.698295593261719, "global_step": 153290, "epoch": 3649} {"train_loss": -6.901573181152344, "global_step": 153291, "epoch": 3649} {"train_loss": -6.783871650695801, "global_step": 153292, "epoch": 3649} {"train_loss": -6.7734270095825195, "global_step": 153293, "epoch": 3649} {"train_loss": -6.880771636962891, "global_step": 153294, "epoch": 3649} {"train_loss": -6.797998905181885, "global_step": 153295, "epoch": 3649} {"train_loss": -6.738864421844482, "global_step": 153296, "epoch": 3649} {"train_loss": -6.825842380523682, "global_step": 153297, "epoch": 3649} {"train_loss": -6.66656494140625, "global_step": 153298, "epoch": 3649} {"train_loss": -6.823405651819138, "global_step": 153299, "epoch": 3649, "val_loss": 68611.0859375} {"train_loss": -6.892988204956055, "global_step": 153300, "epoch": 3650} {"train_loss": -6.812048435211182, "global_step": 153301, "epoch": 3650} {"train_loss": -6.7825422286987305, "global_step": 153302, "epoch": 3650} {"train_loss": -6.92602014541626, "global_step": 153303, "epoch": 3650} {"train_loss": -6.711354732513428, "global_step": 153304, "epoch": 3650} {"train_loss": -6.82463264465332, "global_step": 153305, "epoch": 3650} {"train_loss": -6.731471061706543, "global_step": 153306, "epoch": 3650} {"train_loss": -6.818020820617676, "global_step": 153307, "epoch": 3650} {"train_loss": -6.665717124938965, "global_step": 153308, "epoch": 3650} {"train_loss": -6.633016586303711, "global_step": 153309, "epoch": 3650} {"train_loss": -6.76713752746582, "global_step": 153310, "epoch": 3650} {"train_loss": -6.6309895515441895, "global_step": 153311, "epoch": 3650} {"train_loss": -6.84865665435791, "global_step": 153312, "epoch": 3650} {"train_loss": -6.7207350730896, "global_step": 153313, "epoch": 3650} {"train_loss": -6.782054424285889, "global_step": 153314, "epoch": 3650} {"train_loss": -6.713550567626953, "global_step": 153315, "epoch": 3650} {"train_loss": -6.690679550170898, "global_step": 153316, "epoch": 3650} {"train_loss": -6.75852632522583, "global_step": 153317, "epoch": 3650} {"train_loss": -6.7415971755981445, "global_step": 153318, "epoch": 3650} {"train_loss": -6.769659042358398, "global_step": 153319, "epoch": 3650} {"train_loss": -6.79642391204834, "global_step": 153320, "epoch": 3650} {"train_loss": -6.773374557495117, "global_step": 153321, "epoch": 3650} {"train_loss": -6.784965515136719, "global_step": 153322, "epoch": 3650} {"train_loss": -6.92690372467041, "global_step": 153323, "epoch": 3650} {"train_loss": -6.804698944091797, "global_step": 153324, "epoch": 3650} {"train_loss": -6.949609756469727, "global_step": 153325, "epoch": 3650} {"train_loss": -6.796509742736816, "global_step": 153326, "epoch": 3650} {"train_loss": -6.821384429931641, "global_step": 153327, "epoch": 3650} {"train_loss": -6.809195518493652, "global_step": 153328, "epoch": 3650} {"train_loss": -6.835812568664551, "global_step": 153329, "epoch": 3650} {"train_loss": -6.942683219909668, "global_step": 153330, "epoch": 3650} {"train_loss": -6.813896179199219, "global_step": 153331, "epoch": 3650} {"train_loss": -6.913981914520264, "global_step": 153332, "epoch": 3650} {"train_loss": -6.805830955505371, "global_step": 153333, "epoch": 3650} {"train_loss": -6.785795211791992, "global_step": 153334, "epoch": 3650} {"train_loss": -6.799574851989746, "global_step": 153335, "epoch": 3650} {"train_loss": -6.971976280212402, "global_step": 153336, "epoch": 3650} {"train_loss": -6.926682949066162, "global_step": 153337, "epoch": 3650} {"train_loss": -6.869410514831543, "global_step": 153338, "epoch": 3650} {"train_loss": -6.884563446044922, "global_step": 153339, "epoch": 3650} {"train_loss": -6.971349716186523, "global_step": 153340, "epoch": 3650} {"train_loss": -6.811829453422909, "global_step": 153341, "epoch": 3650, "train/sim_max_reward_0": 0.5300315332605345, "train/sim_max_reward_1": 0.7591259247006624, "train/sim_max_reward_2": 0.5763866038372801, "train/sim_max_reward_3": 0.11482614845580846, "train/sim_max_reward_4": 0.43754640428432495, "train/sim_max_reward_5": 0.9185308464156379, "test/sim_max_reward_4400000": 0.9377645758861384, "test/sim_max_reward_4400001": 0.3695218295543696, "test/sim_max_reward_4400002": 0.22436892039477177, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9413104802061338, "test/sim_max_reward_4400006": 0.5783609207726219, "test/sim_max_reward_4400007": 0.8927215561300744, "test/sim_max_reward_4400008": 0.311974221247865, "test/sim_max_reward_4400009": 0.6883169817222714, "test/sim_max_reward_4400010": 0.22111231992230287, "test/sim_max_reward_4400011": 0.2388074794036202, "test/sim_max_reward_4400012": 0.9417400257809363, "test/sim_max_reward_4400013": 0.9318799380705917, "test/sim_max_reward_4400014": 0.1725739804915727, "test/sim_max_reward_4400015": 0.09322800052189835, "test/sim_max_reward_4400016": 0.30586746871005216, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.22636888932646418, "test/sim_max_reward_4400019": 0.01890276672410311, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.2018167246509427, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9944306447087151, "test/sim_max_reward_4400025": 0.2838138174863081, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.001620569075239818, "test/sim_max_reward_4400028": 0.8904013605197025, "test/sim_max_reward_4400029": 0.04310798655853964, "test/sim_max_reward_4400030": 0.9446203329476254, "test/sim_max_reward_4400031": 0.9577869935648531, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9900053020967596, "test/sim_max_reward_4400034": 0.8835275796065525, "test/sim_max_reward_4400035": 0.9850899504644018, "test/sim_max_reward_4400036": 0.4808745028459281, "test/sim_max_reward_4400037": 0.9767589721902091, "test/sim_max_reward_4400038": 0.9757931303747747, "test/sim_max_reward_4400039": 0.9057359950112974, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9150653723017876, "test/sim_max_reward_4400042": 0.6125887617732901, "test/sim_max_reward_4400043": 0.9682190638274376, "test/sim_max_reward_4400044": 0.8413194359616082, "test/sim_max_reward_4400045": 0.9658623425400604, "test/sim_max_reward_4400046": 0.4048495192812417, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.9610128941361624, "test/sim_max_reward_4400049": 0.9803657469195405, "train/mean_score": 0.5560745768257079, "test/mean_score": 0.5546543436816532, "val_loss": 68416.7578125} {"train_loss": -6.858838081359863, "global_step": 153342, "epoch": 3651} {"train_loss": -6.885556221008301, "global_step": 153343, "epoch": 3651} {"train_loss": -6.853866100311279, "global_step": 153344, "epoch": 3651} {"train_loss": -6.883785247802734, "global_step": 153345, "epoch": 3651} {"train_loss": -6.863299369812012, "global_step": 153346, "epoch": 3651} {"train_loss": -6.903833389282227, "global_step": 153347, "epoch": 3651} {"train_loss": -6.787107944488525, "global_step": 153348, "epoch": 3651} {"train_loss": -6.966784477233887, "global_step": 153349, "epoch": 3651} {"train_loss": -6.792926788330078, "global_step": 153350, "epoch": 3651} {"train_loss": -6.950579643249512, "global_step": 153351, "epoch": 3651} {"train_loss": -6.849781036376953, "global_step": 153352, "epoch": 3651} {"train_loss": -6.894186973571777, "global_step": 153353, "epoch": 3651} {"train_loss": -6.823329925537109, "global_step": 153354, "epoch": 3651} {"train_loss": -6.749768257141113, "global_step": 153355, "epoch": 3651} {"train_loss": -6.673774719238281, "global_step": 153356, "epoch": 3651} {"train_loss": -6.848987579345703, "global_step": 153357, "epoch": 3651} {"train_loss": -6.847930431365967, "global_step": 153358, "epoch": 3651} {"train_loss": -6.901796817779541, "global_step": 153359, "epoch": 3651} {"train_loss": -6.845077037811279, "global_step": 153360, "epoch": 3651} {"train_loss": -6.807468414306641, "global_step": 153361, "epoch": 3651} {"train_loss": -6.775819778442383, "global_step": 153362, "epoch": 3651} {"train_loss": -6.820703029632568, "global_step": 153363, "epoch": 3651} {"train_loss": -6.801531791687012, "global_step": 153364, "epoch": 3651} {"train_loss": -6.859532833099365, "global_step": 153365, "epoch": 3651} {"train_loss": -6.892574787139893, "global_step": 153366, "epoch": 3651} {"train_loss": -6.7881646156311035, "global_step": 153367, "epoch": 3651} {"train_loss": -6.909967422485352, "global_step": 153368, "epoch": 3651} {"train_loss": -6.717985153198242, "global_step": 153369, "epoch": 3651} {"train_loss": -6.836209297180176, "global_step": 153370, "epoch": 3651} {"train_loss": -6.952103614807129, "global_step": 153371, "epoch": 3651} {"train_loss": -6.858725547790527, "global_step": 153372, "epoch": 3651} {"train_loss": -6.925662040710449, "global_step": 153373, "epoch": 3651} {"train_loss": -6.747684955596924, "global_step": 153374, "epoch": 3651} {"train_loss": -6.799321174621582, "global_step": 153375, "epoch": 3651} {"train_loss": -6.7740678787231445, "global_step": 153376, "epoch": 3651} {"train_loss": -6.839260578155518, "global_step": 153377, "epoch": 3651} {"train_loss": -6.919551849365234, "global_step": 153378, "epoch": 3651} {"train_loss": -6.856345176696777, "global_step": 153379, "epoch": 3651} {"train_loss": -6.797765254974365, "global_step": 153380, "epoch": 3651} {"train_loss": -6.79293155670166, "global_step": 153381, "epoch": 3651} {"train_loss": -6.751882553100586, "global_step": 153382, "epoch": 3651} {"train_loss": -6.839493161156064, "global_step": 153383, "epoch": 3651, "val_loss": 68542.3828125} {"train_loss": -6.866734027862549, "global_step": 153384, "epoch": 3652} {"train_loss": -6.774812698364258, "global_step": 153385, "epoch": 3652} {"train_loss": -6.896974086761475, "global_step": 153386, "epoch": 3652} {"train_loss": -6.878321647644043, "global_step": 153387, "epoch": 3652} {"train_loss": -6.777395248413086, "global_step": 153388, "epoch": 3652} {"train_loss": -6.855876922607422, "global_step": 153389, "epoch": 3652} {"train_loss": -6.898922920227051, "global_step": 153390, "epoch": 3652} {"train_loss": -6.8240251541137695, "global_step": 153391, "epoch": 3652} {"train_loss": -6.804678916931152, "global_step": 153392, "epoch": 3652} {"train_loss": -6.806509017944336, "global_step": 153393, "epoch": 3652} {"train_loss": -6.788884162902832, "global_step": 153394, "epoch": 3652} {"train_loss": -6.815648078918457, "global_step": 153395, "epoch": 3652} {"train_loss": -6.817034721374512, "global_step": 153396, "epoch": 3652} {"train_loss": -6.767358779907227, "global_step": 153397, "epoch": 3652} {"train_loss": -6.790444850921631, "global_step": 153398, "epoch": 3652} {"train_loss": -6.782515525817871, "global_step": 153399, "epoch": 3652} {"train_loss": -6.89010763168335, "global_step": 153400, "epoch": 3652} {"train_loss": -6.749300479888916, "global_step": 153401, "epoch": 3652} {"train_loss": -6.811718463897705, "global_step": 153402, "epoch": 3652} {"train_loss": -6.884572505950928, "global_step": 153403, "epoch": 3652} {"train_loss": -6.760892868041992, "global_step": 153404, "epoch": 3652} {"train_loss": -6.814858913421631, "global_step": 153405, "epoch": 3652} {"train_loss": -6.83392333984375, "global_step": 153406, "epoch": 3652} {"train_loss": -6.7967529296875, "global_step": 153407, "epoch": 3652} {"train_loss": -6.894936561584473, "global_step": 153408, "epoch": 3652} {"train_loss": -6.762044429779053, "global_step": 153409, "epoch": 3652} {"train_loss": -6.823298454284668, "global_step": 153410, "epoch": 3652} {"train_loss": -6.934755325317383, "global_step": 153411, "epoch": 3652} {"train_loss": -6.921572685241699, "global_step": 153412, "epoch": 3652} {"train_loss": -6.862388610839844, "global_step": 153413, "epoch": 3652} {"train_loss": -6.786233901977539, "global_step": 153414, "epoch": 3652} {"train_loss": -6.855499267578125, "global_step": 153415, "epoch": 3652} {"train_loss": -6.872804641723633, "global_step": 153416, "epoch": 3652} {"train_loss": -6.7595906257629395, "global_step": 153417, "epoch": 3652} {"train_loss": -6.833321571350098, "global_step": 153418, "epoch": 3652} {"train_loss": -6.891119956970215, "global_step": 153419, "epoch": 3652} {"train_loss": -6.859458923339844, "global_step": 153420, "epoch": 3652} {"train_loss": -6.884090423583984, "global_step": 153421, "epoch": 3652} {"train_loss": -6.928031921386719, "global_step": 153422, "epoch": 3652} {"train_loss": -6.986510753631592, "global_step": 153423, "epoch": 3652} {"train_loss": -6.920533180236816, "global_step": 153424, "epoch": 3652} {"train_loss": -6.840314842405773, "global_step": 153425, "epoch": 3652, "val_loss": 68395.3515625} {"train_loss": -6.93131685256958, "global_step": 153426, "epoch": 3653} {"train_loss": -6.919753551483154, "global_step": 153427, "epoch": 3653} {"train_loss": -6.8716583251953125, "global_step": 153428, "epoch": 3653} {"train_loss": -7.024416446685791, "global_step": 153429, "epoch": 3653} {"train_loss": -6.978632926940918, "global_step": 153430, "epoch": 3653} {"train_loss": -6.941669940948486, "global_step": 153431, "epoch": 3653} {"train_loss": -6.832657814025879, "global_step": 153432, "epoch": 3653} {"train_loss": -6.8918681144714355, "global_step": 153433, "epoch": 3653} {"train_loss": -6.951807975769043, "global_step": 153434, "epoch": 3653} {"train_loss": -6.893838405609131, "global_step": 153435, "epoch": 3653} {"train_loss": -6.8456950187683105, "global_step": 153436, "epoch": 3653} {"train_loss": -6.827263832092285, "global_step": 153437, "epoch": 3653} {"train_loss": -6.753968715667725, "global_step": 153438, "epoch": 3653} {"train_loss": -6.876887321472168, "global_step": 153439, "epoch": 3653} {"train_loss": -6.847187042236328, "global_step": 153440, "epoch": 3653} {"train_loss": -6.816063404083252, "global_step": 153441, "epoch": 3653} {"train_loss": -6.838926315307617, "global_step": 153442, "epoch": 3653} {"train_loss": -6.795221328735352, "global_step": 153443, "epoch": 3653} {"train_loss": -6.886455535888672, "global_step": 153444, "epoch": 3653} {"train_loss": -6.892794609069824, "global_step": 153445, "epoch": 3653} {"train_loss": -7.005614280700684, "global_step": 153446, "epoch": 3653} {"train_loss": -6.810354232788086, "global_step": 153447, "epoch": 3653} {"train_loss": -6.8284430503845215, "global_step": 153448, "epoch": 3653} {"train_loss": -6.862512588500977, "global_step": 153449, "epoch": 3653} {"train_loss": -6.8403120040893555, "global_step": 153450, "epoch": 3653} {"train_loss": -6.903314590454102, "global_step": 153451, "epoch": 3653} {"train_loss": -6.8521833419799805, "global_step": 153452, "epoch": 3653} {"train_loss": -6.916038513183594, "global_step": 153453, "epoch": 3653} {"train_loss": -6.887754440307617, "global_step": 153454, "epoch": 3653} {"train_loss": -6.922748565673828, "global_step": 153455, "epoch": 3653} {"train_loss": -6.879578590393066, "global_step": 153456, "epoch": 3653} {"train_loss": -6.811068534851074, "global_step": 153457, "epoch": 3653} {"train_loss": -6.888657569885254, "global_step": 153458, "epoch": 3653} {"train_loss": -6.877353668212891, "global_step": 153459, "epoch": 3653} {"train_loss": -6.838934421539307, "global_step": 153460, "epoch": 3653} {"train_loss": -6.844544410705566, "global_step": 153461, "epoch": 3653} {"train_loss": -6.823737621307373, "global_step": 153462, "epoch": 3653} {"train_loss": -6.9556121826171875, "global_step": 153463, "epoch": 3653} {"train_loss": -6.918752670288086, "global_step": 153464, "epoch": 3653} {"train_loss": -6.866670608520508, "global_step": 153465, "epoch": 3653} {"train_loss": -6.814986228942871, "global_step": 153466, "epoch": 3653} {"train_loss": -6.877513613019671, "global_step": 153467, "epoch": 3653, "val_loss": 68564.71875} {"train_loss": -6.924531936645508, "global_step": 153468, "epoch": 3654} {"train_loss": -6.932201385498047, "global_step": 153469, "epoch": 3654} {"train_loss": -6.887279510498047, "global_step": 153470, "epoch": 3654} {"train_loss": -6.958316802978516, "global_step": 153471, "epoch": 3654} {"train_loss": -6.977293014526367, "global_step": 153472, "epoch": 3654} {"train_loss": -6.711073875427246, "global_step": 153473, "epoch": 3654} {"train_loss": -6.962982654571533, "global_step": 153474, "epoch": 3654} {"train_loss": -6.912578582763672, "global_step": 153475, "epoch": 3654} {"train_loss": -6.873281478881836, "global_step": 153476, "epoch": 3654} {"train_loss": -6.7678632736206055, "global_step": 153477, "epoch": 3654} {"train_loss": -6.934491157531738, "global_step": 153478, "epoch": 3654} {"train_loss": -6.96359920501709, "global_step": 153479, "epoch": 3654} {"train_loss": -6.919221878051758, "global_step": 153480, "epoch": 3654} {"train_loss": -6.750896453857422, "global_step": 153481, "epoch": 3654} {"train_loss": -6.860102653503418, "global_step": 153482, "epoch": 3654} {"train_loss": -6.743588447570801, "global_step": 153483, "epoch": 3654} {"train_loss": -6.900818824768066, "global_step": 153484, "epoch": 3654} {"train_loss": -6.770848274230957, "global_step": 153485, "epoch": 3654} {"train_loss": -6.757698059082031, "global_step": 153486, "epoch": 3654} {"train_loss": -6.777560234069824, "global_step": 153487, "epoch": 3654} {"train_loss": -6.843554973602295, "global_step": 153488, "epoch": 3654} {"train_loss": -6.678445816040039, "global_step": 153489, "epoch": 3654} {"train_loss": -6.779282093048096, "global_step": 153490, "epoch": 3654} {"train_loss": -6.855334758758545, "global_step": 153491, "epoch": 3654} {"train_loss": -6.694466590881348, "global_step": 153492, "epoch": 3654} {"train_loss": -6.785782814025879, "global_step": 153493, "epoch": 3654} {"train_loss": -6.809062957763672, "global_step": 153494, "epoch": 3654} {"train_loss": -6.905261993408203, "global_step": 153495, "epoch": 3654} {"train_loss": -6.929533958435059, "global_step": 153496, "epoch": 3654} {"train_loss": -6.956046104431152, "global_step": 153497, "epoch": 3654} {"train_loss": -6.8887038230896, "global_step": 153498, "epoch": 3654} {"train_loss": -6.761129379272461, "global_step": 153499, "epoch": 3654} {"train_loss": -6.812726974487305, "global_step": 153500, "epoch": 3654} {"train_loss": -6.7693963050842285, "global_step": 153501, "epoch": 3654} {"train_loss": -6.885104179382324, "global_step": 153502, "epoch": 3654} {"train_loss": -6.774312496185303, "global_step": 153503, "epoch": 3654} {"train_loss": -6.75942850112915, "global_step": 153504, "epoch": 3654} {"train_loss": -6.861994743347168, "global_step": 153505, "epoch": 3654} {"train_loss": -6.815206527709961, "global_step": 153506, "epoch": 3654} {"train_loss": -6.910089015960693, "global_step": 153507, "epoch": 3654} {"train_loss": -6.804477214813232, "global_step": 153508, "epoch": 3654} {"train_loss": -6.842966931206839, "global_step": 153509, "epoch": 3654, "val_loss": 68585.8515625} {"train_loss": -6.782937526702881, "global_step": 153510, "epoch": 3655} {"train_loss": -6.867908954620361, "global_step": 153511, "epoch": 3655} {"train_loss": -6.813628196716309, "global_step": 153512, "epoch": 3655} {"train_loss": -6.816485404968262, "global_step": 153513, "epoch": 3655} {"train_loss": -6.850699424743652, "global_step": 153514, "epoch": 3655} {"train_loss": -6.91609525680542, "global_step": 153515, "epoch": 3655} {"train_loss": -6.898235321044922, "global_step": 153516, "epoch": 3655} {"train_loss": -6.916417121887207, "global_step": 153517, "epoch": 3655} {"train_loss": -6.833967208862305, "global_step": 153518, "epoch": 3655} {"train_loss": -6.816434860229492, "global_step": 153519, "epoch": 3655} {"train_loss": -6.901088237762451, "global_step": 153520, "epoch": 3655} {"train_loss": -6.893986701965332, "global_step": 153521, "epoch": 3655} {"train_loss": -6.790796756744385, "global_step": 153522, "epoch": 3655} {"train_loss": -6.829154014587402, "global_step": 153523, "epoch": 3655} {"train_loss": -6.860663890838623, "global_step": 153524, "epoch": 3655} {"train_loss": -6.799359321594238, "global_step": 153525, "epoch": 3655} {"train_loss": -6.674509048461914, "global_step": 153526, "epoch": 3655} {"train_loss": -6.872458457946777, "global_step": 153527, "epoch": 3655} {"train_loss": -6.806199550628662, "global_step": 153528, "epoch": 3655} {"train_loss": -6.792961120605469, "global_step": 153529, "epoch": 3655} {"train_loss": -6.803514003753662, "global_step": 153530, "epoch": 3655} {"train_loss": -6.776041030883789, "global_step": 153531, "epoch": 3655} {"train_loss": -6.748355388641357, "global_step": 153532, "epoch": 3655} {"train_loss": -6.84929084777832, "global_step": 153533, "epoch": 3655} {"train_loss": -6.714939594268799, "global_step": 153534, "epoch": 3655} {"train_loss": -6.728481769561768, "global_step": 153535, "epoch": 3655} {"train_loss": -6.587362289428711, "global_step": 153536, "epoch": 3655} {"train_loss": -6.876689910888672, "global_step": 153537, "epoch": 3655} {"train_loss": -6.616359233856201, "global_step": 153538, "epoch": 3655} {"train_loss": -6.730501174926758, "global_step": 153539, "epoch": 3655} {"train_loss": -6.76851749420166, "global_step": 153540, "epoch": 3655} {"train_loss": -6.595698356628418, "global_step": 153541, "epoch": 3655} {"train_loss": -6.837407112121582, "global_step": 153542, "epoch": 3655} {"train_loss": -6.637964248657227, "global_step": 153543, "epoch": 3655} {"train_loss": -6.713954448699951, "global_step": 153544, "epoch": 3655} {"train_loss": -6.866662979125977, "global_step": 153545, "epoch": 3655} {"train_loss": -6.584257125854492, "global_step": 153546, "epoch": 3655} {"train_loss": -6.856520652770996, "global_step": 153547, "epoch": 3655} {"train_loss": -6.674606800079346, "global_step": 153548, "epoch": 3655} {"train_loss": -6.750646114349365, "global_step": 153549, "epoch": 3655} {"train_loss": -6.713860511779785, "global_step": 153550, "epoch": 3655} {"train_loss": -6.784938505717686, "global_step": 153551, "epoch": 3655, "val_loss": 68402.4453125} {"train_loss": -6.700815677642822, "global_step": 153552, "epoch": 3656} {"train_loss": -6.8459014892578125, "global_step": 153553, "epoch": 3656} {"train_loss": -6.77080774307251, "global_step": 153554, "epoch": 3656} {"train_loss": -6.755990028381348, "global_step": 153555, "epoch": 3656} {"train_loss": -6.8642096519470215, "global_step": 153556, "epoch": 3656} {"train_loss": -6.758012294769287, "global_step": 153557, "epoch": 3656} {"train_loss": -6.684962272644043, "global_step": 153558, "epoch": 3656} {"train_loss": -6.725746154785156, "global_step": 153559, "epoch": 3656} {"train_loss": -6.79837703704834, "global_step": 153560, "epoch": 3656} {"train_loss": -6.770996570587158, "global_step": 153561, "epoch": 3656} {"train_loss": -6.816283226013184, "global_step": 153562, "epoch": 3656} {"train_loss": -6.795393943786621, "global_step": 153563, "epoch": 3656} {"train_loss": -6.826352596282959, "global_step": 153564, "epoch": 3656} {"train_loss": -6.72054386138916, "global_step": 153565, "epoch": 3656} {"train_loss": -6.850506782531738, "global_step": 153566, "epoch": 3656} {"train_loss": -6.847326278686523, "global_step": 153567, "epoch": 3656} {"train_loss": -6.723690509796143, "global_step": 153568, "epoch": 3656} {"train_loss": -6.831639766693115, "global_step": 153569, "epoch": 3656} {"train_loss": -6.781306743621826, "global_step": 153570, "epoch": 3656} {"train_loss": -6.865940570831299, "global_step": 153571, "epoch": 3656} {"train_loss": -6.718982696533203, "global_step": 153572, "epoch": 3656} {"train_loss": -6.855826377868652, "global_step": 153573, "epoch": 3656} {"train_loss": -6.824855327606201, "global_step": 153574, "epoch": 3656} {"train_loss": -6.839700698852539, "global_step": 153575, "epoch": 3656} {"train_loss": -6.86361026763916, "global_step": 153576, "epoch": 3656} {"train_loss": -6.81015682220459, "global_step": 153577, "epoch": 3656} {"train_loss": -6.896036148071289, "global_step": 153578, "epoch": 3656} {"train_loss": -6.771015167236328, "global_step": 153579, "epoch": 3656} {"train_loss": -6.812857151031494, "global_step": 153580, "epoch": 3656} {"train_loss": -6.736536979675293, "global_step": 153581, "epoch": 3656} {"train_loss": -6.811385154724121, "global_step": 153582, "epoch": 3656} {"train_loss": -6.7694501876831055, "global_step": 153583, "epoch": 3656} {"train_loss": -6.81198787689209, "global_step": 153584, "epoch": 3656} {"train_loss": -6.965892791748047, "global_step": 153585, "epoch": 3656} {"train_loss": -6.824434757232666, "global_step": 153586, "epoch": 3656} {"train_loss": -6.800853729248047, "global_step": 153587, "epoch": 3656} {"train_loss": -6.905122756958008, "global_step": 153588, "epoch": 3656} {"train_loss": -6.840010166168213, "global_step": 153589, "epoch": 3656} {"train_loss": -6.849933624267578, "global_step": 153590, "epoch": 3656} {"train_loss": -6.887956619262695, "global_step": 153591, "epoch": 3656} {"train_loss": -6.807905673980713, "global_step": 153592, "epoch": 3656} {"train_loss": -6.808729625883556, "global_step": 153593, "epoch": 3656, "val_loss": 68409.8125} {"train_loss": -6.854084014892578, "global_step": 153594, "epoch": 3657} {"train_loss": -6.931506156921387, "global_step": 153595, "epoch": 3657} {"train_loss": -6.841035842895508, "global_step": 153596, "epoch": 3657} {"train_loss": -6.698920249938965, "global_step": 153597, "epoch": 3657} {"train_loss": -6.94438362121582, "global_step": 153598, "epoch": 3657} {"train_loss": -6.8782758712768555, "global_step": 153599, "epoch": 3657} {"train_loss": -6.733271598815918, "global_step": 153600, "epoch": 3657} {"train_loss": -6.942519187927246, "global_step": 153601, "epoch": 3657} {"train_loss": -6.832468032836914, "global_step": 153602, "epoch": 3657} {"train_loss": -6.774620532989502, "global_step": 153603, "epoch": 3657} {"train_loss": -6.772595405578613, "global_step": 153604, "epoch": 3657} {"train_loss": -6.829865455627441, "global_step": 153605, "epoch": 3657} {"train_loss": -6.85489559173584, "global_step": 153606, "epoch": 3657} {"train_loss": -6.884208679199219, "global_step": 153607, "epoch": 3657} {"train_loss": -6.811942100524902, "global_step": 153608, "epoch": 3657} {"train_loss": -6.9043192863464355, "global_step": 153609, "epoch": 3657} {"train_loss": -6.87647819519043, "global_step": 153610, "epoch": 3657} {"train_loss": -6.815906047821045, "global_step": 153611, "epoch": 3657} {"train_loss": -6.8486409187316895, "global_step": 153612, "epoch": 3657} {"train_loss": -6.829195022583008, "global_step": 153613, "epoch": 3657} {"train_loss": -6.866469383239746, "global_step": 153614, "epoch": 3657} {"train_loss": -6.8378448486328125, "global_step": 153615, "epoch": 3657} {"train_loss": -6.938924789428711, "global_step": 153616, "epoch": 3657} {"train_loss": -6.915848731994629, "global_step": 153617, "epoch": 3657} {"train_loss": -6.807901382446289, "global_step": 153618, "epoch": 3657} {"train_loss": -6.913309574127197, "global_step": 153619, "epoch": 3657} {"train_loss": -6.889466285705566, "global_step": 153620, "epoch": 3657} {"train_loss": -6.895092964172363, "global_step": 153621, "epoch": 3657} {"train_loss": -6.953662872314453, "global_step": 153622, "epoch": 3657} {"train_loss": -6.968814849853516, "global_step": 153623, "epoch": 3657} {"train_loss": -6.825652599334717, "global_step": 153624, "epoch": 3657} {"train_loss": -6.982486724853516, "global_step": 153625, "epoch": 3657} {"train_loss": -6.82320499420166, "global_step": 153626, "epoch": 3657} {"train_loss": -6.923944473266602, "global_step": 153627, "epoch": 3657} {"train_loss": -6.912421703338623, "global_step": 153628, "epoch": 3657} {"train_loss": -6.918867111206055, "global_step": 153629, "epoch": 3657} {"train_loss": -6.882325172424316, "global_step": 153630, "epoch": 3657} {"train_loss": -6.883031368255615, "global_step": 153631, "epoch": 3657} {"train_loss": -6.7863311767578125, "global_step": 153632, "epoch": 3657} {"train_loss": -6.8266801834106445, "global_step": 153633, "epoch": 3657} {"train_loss": -6.87745475769043, "global_step": 153634, "epoch": 3657} {"train_loss": -6.8612627528962635, "global_step": 153635, "epoch": 3657, "val_loss": 68350.640625} {"train_loss": -6.7776947021484375, "global_step": 153636, "epoch": 3658} {"train_loss": -6.782822132110596, "global_step": 153637, "epoch": 3658} {"train_loss": -6.792458534240723, "global_step": 153638, "epoch": 3658} {"train_loss": -6.9495344161987305, "global_step": 153639, "epoch": 3658} {"train_loss": -6.802117347717285, "global_step": 153640, "epoch": 3658} {"train_loss": -6.763800621032715, "global_step": 153641, "epoch": 3658} {"train_loss": -6.826780319213867, "global_step": 153642, "epoch": 3658} {"train_loss": -6.813189506530762, "global_step": 153643, "epoch": 3658} {"train_loss": -6.852601528167725, "global_step": 153644, "epoch": 3658} {"train_loss": -6.873858451843262, "global_step": 153645, "epoch": 3658} {"train_loss": -6.767229080200195, "global_step": 153646, "epoch": 3658} {"train_loss": -6.852372169494629, "global_step": 153647, "epoch": 3658} {"train_loss": -6.806012153625488, "global_step": 153648, "epoch": 3658} {"train_loss": -6.8277740478515625, "global_step": 153649, "epoch": 3658} {"train_loss": -6.8425726890563965, "global_step": 153650, "epoch": 3658} {"train_loss": -6.71934175491333, "global_step": 153651, "epoch": 3658} {"train_loss": -6.901599407196045, "global_step": 153652, "epoch": 3658} {"train_loss": -6.7954559326171875, "global_step": 153653, "epoch": 3658} {"train_loss": -6.722202301025391, "global_step": 153654, "epoch": 3658} {"train_loss": -6.86916446685791, "global_step": 153655, "epoch": 3658} {"train_loss": -6.765571594238281, "global_step": 153656, "epoch": 3658} {"train_loss": -6.89605188369751, "global_step": 153657, "epoch": 3658} {"train_loss": -6.6780548095703125, "global_step": 153658, "epoch": 3658} {"train_loss": -6.844761848449707, "global_step": 153659, "epoch": 3658} {"train_loss": -6.778801918029785, "global_step": 153660, "epoch": 3658} {"train_loss": -6.826810836791992, "global_step": 153661, "epoch": 3658} {"train_loss": -6.8171234130859375, "global_step": 153662, "epoch": 3658} {"train_loss": -6.8782243728637695, "global_step": 153663, "epoch": 3658} {"train_loss": -6.750316619873047, "global_step": 153664, "epoch": 3658} {"train_loss": -6.863595962524414, "global_step": 153665, "epoch": 3658} {"train_loss": -6.764880180358887, "global_step": 153666, "epoch": 3658} {"train_loss": -6.747828483581543, "global_step": 153667, "epoch": 3658} {"train_loss": -6.926105499267578, "global_step": 153668, "epoch": 3658} {"train_loss": -6.814324378967285, "global_step": 153669, "epoch": 3658} {"train_loss": -6.929023265838623, "global_step": 153670, "epoch": 3658} {"train_loss": -6.800793170928955, "global_step": 153671, "epoch": 3658} {"train_loss": -6.86318302154541, "global_step": 153672, "epoch": 3658} {"train_loss": -6.780928134918213, "global_step": 153673, "epoch": 3658} {"train_loss": -6.928592681884766, "global_step": 153674, "epoch": 3658} {"train_loss": -6.757256984710693, "global_step": 153675, "epoch": 3658} {"train_loss": -6.8824615478515625, "global_step": 153676, "epoch": 3658} {"train_loss": -6.820934420540219, "global_step": 153677, "epoch": 3658, "val_loss": 68680.65625} {"train_loss": -6.745680809020996, "global_step": 153678, "epoch": 3659} {"train_loss": -6.849552154541016, "global_step": 153679, "epoch": 3659} {"train_loss": -6.844445705413818, "global_step": 153680, "epoch": 3659} {"train_loss": -6.8334479331970215, "global_step": 153681, "epoch": 3659} {"train_loss": -6.800662994384766, "global_step": 153682, "epoch": 3659} {"train_loss": -6.686075687408447, "global_step": 153683, "epoch": 3659} {"train_loss": -6.839228630065918, "global_step": 153684, "epoch": 3659} {"train_loss": -6.793910026550293, "global_step": 153685, "epoch": 3659} {"train_loss": -6.7351861000061035, "global_step": 153686, "epoch": 3659} {"train_loss": -6.8112053871154785, "global_step": 153687, "epoch": 3659} {"train_loss": -6.771917819976807, "global_step": 153688, "epoch": 3659} {"train_loss": -6.883062362670898, "global_step": 153689, "epoch": 3659} {"train_loss": -6.679076194763184, "global_step": 153690, "epoch": 3659} {"train_loss": -6.878803253173828, "global_step": 153691, "epoch": 3659} {"train_loss": -6.751315116882324, "global_step": 153692, "epoch": 3659} {"train_loss": -6.824549198150635, "global_step": 153693, "epoch": 3659} {"train_loss": -6.874863147735596, "global_step": 153694, "epoch": 3659} {"train_loss": -6.864692211151123, "global_step": 153695, "epoch": 3659} {"train_loss": -6.918813705444336, "global_step": 153696, "epoch": 3659} {"train_loss": -6.836566925048828, "global_step": 153697, "epoch": 3659} {"train_loss": -6.921115398406982, "global_step": 153698, "epoch": 3659} {"train_loss": -6.685098171234131, "global_step": 153699, "epoch": 3659} {"train_loss": -6.803762435913086, "global_step": 153700, "epoch": 3659} {"train_loss": -6.848658084869385, "global_step": 153701, "epoch": 3659} {"train_loss": -6.922978401184082, "global_step": 153702, "epoch": 3659} {"train_loss": -6.867151737213135, "global_step": 153703, "epoch": 3659} {"train_loss": -6.880852222442627, "global_step": 153704, "epoch": 3659} {"train_loss": -6.796934604644775, "global_step": 153705, "epoch": 3659} {"train_loss": -6.8299241065979, "global_step": 153706, "epoch": 3659} {"train_loss": -6.918988227844238, "global_step": 153707, "epoch": 3659} {"train_loss": -6.851420879364014, "global_step": 153708, "epoch": 3659} {"train_loss": -6.741540431976318, "global_step": 153709, "epoch": 3659} {"train_loss": -6.885519027709961, "global_step": 153710, "epoch": 3659} {"train_loss": -6.757254600524902, "global_step": 153711, "epoch": 3659} {"train_loss": -6.737314701080322, "global_step": 153712, "epoch": 3659} {"train_loss": -6.788413047790527, "global_step": 153713, "epoch": 3659} {"train_loss": -6.743612289428711, "global_step": 153714, "epoch": 3659} {"train_loss": -6.753170967102051, "global_step": 153715, "epoch": 3659} {"train_loss": -6.779747009277344, "global_step": 153716, "epoch": 3659} {"train_loss": -6.862178325653076, "global_step": 153717, "epoch": 3659} {"train_loss": -6.7664384841918945, "global_step": 153718, "epoch": 3659} {"train_loss": -6.813575176965623, "global_step": 153719, "epoch": 3659, "val_loss": 68693.984375} {"train_loss": -6.682950973510742, "global_step": 153720, "epoch": 3660} {"train_loss": -6.6285881996154785, "global_step": 153721, "epoch": 3660} {"train_loss": -6.738153457641602, "global_step": 153722, "epoch": 3660} {"train_loss": -6.920294284820557, "global_step": 153723, "epoch": 3660} {"train_loss": -6.78264045715332, "global_step": 153724, "epoch": 3660} {"train_loss": -6.754977226257324, "global_step": 153725, "epoch": 3660} {"train_loss": -6.785489082336426, "global_step": 153726, "epoch": 3660} {"train_loss": -6.754433631896973, "global_step": 153727, "epoch": 3660} {"train_loss": -6.986944675445557, "global_step": 153728, "epoch": 3660} {"train_loss": -6.734010219573975, "global_step": 153729, "epoch": 3660} {"train_loss": -6.918095111846924, "global_step": 153730, "epoch": 3660} {"train_loss": -6.87016487121582, "global_step": 153731, "epoch": 3660} {"train_loss": -6.806455135345459, "global_step": 153732, "epoch": 3660} {"train_loss": -6.8862175941467285, "global_step": 153733, "epoch": 3660} {"train_loss": -6.694353103637695, "global_step": 153734, "epoch": 3660} {"train_loss": -6.8938374519348145, "global_step": 153735, "epoch": 3660} {"train_loss": -6.865355491638184, "global_step": 153736, "epoch": 3660} {"train_loss": -6.842982292175293, "global_step": 153737, "epoch": 3660} {"train_loss": -6.696057319641113, "global_step": 153738, "epoch": 3660} {"train_loss": -6.8465189933776855, "global_step": 153739, "epoch": 3660} {"train_loss": -6.921939373016357, "global_step": 153740, "epoch": 3660} {"train_loss": -6.9521870613098145, "global_step": 153741, "epoch": 3660} {"train_loss": -6.784233093261719, "global_step": 153742, "epoch": 3660} {"train_loss": -7.010998725891113, "global_step": 153743, "epoch": 3660} {"train_loss": -6.884027481079102, "global_step": 153744, "epoch": 3660} {"train_loss": -6.8163604736328125, "global_step": 153745, "epoch": 3660} {"train_loss": -6.810420989990234, "global_step": 153746, "epoch": 3660} {"train_loss": -6.90243673324585, "global_step": 153747, "epoch": 3660} {"train_loss": -6.866756916046143, "global_step": 153748, "epoch": 3660} {"train_loss": -6.809457778930664, "global_step": 153749, "epoch": 3660} {"train_loss": -6.824300765991211, "global_step": 153750, "epoch": 3660} {"train_loss": -6.748389720916748, "global_step": 153751, "epoch": 3660} {"train_loss": -6.986322402954102, "global_step": 153752, "epoch": 3660} {"train_loss": -6.922041893005371, "global_step": 153753, "epoch": 3660} {"train_loss": -6.859228134155273, "global_step": 153754, "epoch": 3660} {"train_loss": -6.9302215576171875, "global_step": 153755, "epoch": 3660} {"train_loss": -6.879426002502441, "global_step": 153756, "epoch": 3660} {"train_loss": -6.859994888305664, "global_step": 153757, "epoch": 3660} {"train_loss": -6.724257469177246, "global_step": 153758, "epoch": 3660} {"train_loss": -6.868701934814453, "global_step": 153759, "epoch": 3660} {"train_loss": -6.877227783203125, "global_step": 153760, "epoch": 3660} {"train_loss": -6.836499236878895, "global_step": 153761, "epoch": 3660, "val_loss": 68603.0546875} {"train_loss": -6.978801727294922, "global_step": 153762, "epoch": 3661} {"train_loss": -6.8441290855407715, "global_step": 153763, "epoch": 3661} {"train_loss": -6.877500534057617, "global_step": 153764, "epoch": 3661} {"train_loss": -6.94532585144043, "global_step": 153765, "epoch": 3661} {"train_loss": -6.874642372131348, "global_step": 153766, "epoch": 3661} {"train_loss": -6.899409770965576, "global_step": 153767, "epoch": 3661} {"train_loss": -6.9527788162231445, "global_step": 153768, "epoch": 3661} {"train_loss": -6.822104454040527, "global_step": 153769, "epoch": 3661} {"train_loss": -6.807804107666016, "global_step": 153770, "epoch": 3661} {"train_loss": -6.8912153244018555, "global_step": 153771, "epoch": 3661} {"train_loss": -6.748991966247559, "global_step": 153772, "epoch": 3661} {"train_loss": -6.804786682128906, "global_step": 153773, "epoch": 3661} {"train_loss": -6.9054365158081055, "global_step": 153774, "epoch": 3661} {"train_loss": -6.870674133300781, "global_step": 153775, "epoch": 3661} {"train_loss": -6.851578712463379, "global_step": 153776, "epoch": 3661} {"train_loss": -6.793454170227051, "global_step": 153777, "epoch": 3661} {"train_loss": -6.831488132476807, "global_step": 153778, "epoch": 3661} {"train_loss": -6.843017578125, "global_step": 153779, "epoch": 3661} {"train_loss": -6.804956912994385, "global_step": 153780, "epoch": 3661} {"train_loss": -6.792132377624512, "global_step": 153781, "epoch": 3661} {"train_loss": -6.8560333251953125, "global_step": 153782, "epoch": 3661} {"train_loss": -6.778738021850586, "global_step": 153783, "epoch": 3661} {"train_loss": -6.745996475219727, "global_step": 153784, "epoch": 3661} {"train_loss": -6.791585922241211, "global_step": 153785, "epoch": 3661} {"train_loss": -6.742110252380371, "global_step": 153786, "epoch": 3661} {"train_loss": -6.6864519119262695, "global_step": 153787, "epoch": 3661} {"train_loss": -6.83226203918457, "global_step": 153788, "epoch": 3661} {"train_loss": -6.747036933898926, "global_step": 153789, "epoch": 3661} {"train_loss": -6.704526424407959, "global_step": 153790, "epoch": 3661} {"train_loss": -6.810343265533447, "global_step": 153791, "epoch": 3661} {"train_loss": -6.707874298095703, "global_step": 153792, "epoch": 3661} {"train_loss": -6.711564064025879, "global_step": 153793, "epoch": 3661} {"train_loss": -6.779214859008789, "global_step": 153794, "epoch": 3661} {"train_loss": -6.7664947509765625, "global_step": 153795, "epoch": 3661} {"train_loss": -6.8734235763549805, "global_step": 153796, "epoch": 3661} {"train_loss": -6.6695876121521, "global_step": 153797, "epoch": 3661} {"train_loss": -6.786408424377441, "global_step": 153798, "epoch": 3661} {"train_loss": -6.778385639190674, "global_step": 153799, "epoch": 3661} {"train_loss": -6.691812515258789, "global_step": 153800, "epoch": 3661} {"train_loss": -6.912284851074219, "global_step": 153801, "epoch": 3661} {"train_loss": -6.730038642883301, "global_step": 153802, "epoch": 3661} {"train_loss": -6.809619540259952, "global_step": 153803, "epoch": 3661, "val_loss": 68395.5078125} {"train_loss": -6.890289306640625, "global_step": 153804, "epoch": 3662} {"train_loss": -6.778360843658447, "global_step": 153805, "epoch": 3662} {"train_loss": -6.785126686096191, "global_step": 153806, "epoch": 3662} {"train_loss": -6.924319267272949, "global_step": 153807, "epoch": 3662} {"train_loss": -6.795899391174316, "global_step": 153808, "epoch": 3662} {"train_loss": -6.873513221740723, "global_step": 153809, "epoch": 3662} {"train_loss": -6.731910705566406, "global_step": 153810, "epoch": 3662} {"train_loss": -6.6951985359191895, "global_step": 153811, "epoch": 3662} {"train_loss": -6.894662380218506, "global_step": 153812, "epoch": 3662} {"train_loss": -6.851806640625, "global_step": 153813, "epoch": 3662} {"train_loss": -6.890674591064453, "global_step": 153814, "epoch": 3662} {"train_loss": -6.803104877471924, "global_step": 153815, "epoch": 3662} {"train_loss": -6.837936878204346, "global_step": 153816, "epoch": 3662} {"train_loss": -6.844471454620361, "global_step": 153817, "epoch": 3662} {"train_loss": -6.858824729919434, "global_step": 153818, "epoch": 3662} {"train_loss": -6.786550521850586, "global_step": 153819, "epoch": 3662} {"train_loss": -7.02427864074707, "global_step": 153820, "epoch": 3662} {"train_loss": -6.759350299835205, "global_step": 153821, "epoch": 3662} {"train_loss": -6.863422393798828, "global_step": 153822, "epoch": 3662} {"train_loss": -6.930433750152588, "global_step": 153823, "epoch": 3662} {"train_loss": -6.921358585357666, "global_step": 153824, "epoch": 3662} {"train_loss": -6.894216060638428, "global_step": 153825, "epoch": 3662} {"train_loss": -6.866355895996094, "global_step": 153826, "epoch": 3662} {"train_loss": -6.950793266296387, "global_step": 153827, "epoch": 3662} {"train_loss": -6.7929582595825195, "global_step": 153828, "epoch": 3662} {"train_loss": -6.818740367889404, "global_step": 153829, "epoch": 3662} {"train_loss": -6.815106391906738, "global_step": 153830, "epoch": 3662} {"train_loss": -6.7522478103637695, "global_step": 153831, "epoch": 3662} {"train_loss": -6.828784942626953, "global_step": 153832, "epoch": 3662} {"train_loss": -6.902120590209961, "global_step": 153833, "epoch": 3662} {"train_loss": -6.742112159729004, "global_step": 153834, "epoch": 3662} {"train_loss": -6.797896385192871, "global_step": 153835, "epoch": 3662} {"train_loss": -6.791085243225098, "global_step": 153836, "epoch": 3662} {"train_loss": -6.837924957275391, "global_step": 153837, "epoch": 3662} {"train_loss": -6.8158063888549805, "global_step": 153838, "epoch": 3662} {"train_loss": -6.720200061798096, "global_step": 153839, "epoch": 3662} {"train_loss": -6.880524635314941, "global_step": 153840, "epoch": 3662} {"train_loss": -6.758202075958252, "global_step": 153841, "epoch": 3662} {"train_loss": -6.687075614929199, "global_step": 153842, "epoch": 3662} {"train_loss": -6.718008995056152, "global_step": 153843, "epoch": 3662} {"train_loss": -6.870104789733887, "global_step": 153844, "epoch": 3662} {"train_loss": -6.8274364698500865, "global_step": 153845, "epoch": 3662, "val_loss": 68432.421875} {"train_loss": -6.808626651763916, "global_step": 153846, "epoch": 3663} {"train_loss": -6.8758649826049805, "global_step": 153847, "epoch": 3663} {"train_loss": -6.8368144035339355, "global_step": 153848, "epoch": 3663} {"train_loss": -6.698247909545898, "global_step": 153849, "epoch": 3663} {"train_loss": -6.891631126403809, "global_step": 153850, "epoch": 3663} {"train_loss": -6.873585224151611, "global_step": 153851, "epoch": 3663} {"train_loss": -6.759023189544678, "global_step": 153852, "epoch": 3663} {"train_loss": -6.910467624664307, "global_step": 153853, "epoch": 3663} {"train_loss": -6.800024032592773, "global_step": 153854, "epoch": 3663} {"train_loss": -6.889010429382324, "global_step": 153855, "epoch": 3663} {"train_loss": -6.86818265914917, "global_step": 153856, "epoch": 3663} {"train_loss": -6.7263898849487305, "global_step": 153857, "epoch": 3663} {"train_loss": -6.884457588195801, "global_step": 153858, "epoch": 3663} {"train_loss": -6.6971564292907715, "global_step": 153859, "epoch": 3663} {"train_loss": -6.8295698165893555, "global_step": 153860, "epoch": 3663} {"train_loss": -6.817032814025879, "global_step": 153861, "epoch": 3663} {"train_loss": -6.698065757751465, "global_step": 153862, "epoch": 3663} {"train_loss": -6.646116256713867, "global_step": 153863, "epoch": 3663} {"train_loss": -6.794363975524902, "global_step": 153864, "epoch": 3663} {"train_loss": -6.716860771179199, "global_step": 153865, "epoch": 3663} {"train_loss": -6.841610908508301, "global_step": 153866, "epoch": 3663} {"train_loss": -6.767246246337891, "global_step": 153867, "epoch": 3663} {"train_loss": -6.568687438964844, "global_step": 153868, "epoch": 3663} {"train_loss": -6.805727958679199, "global_step": 153869, "epoch": 3663} {"train_loss": -6.589825630187988, "global_step": 153870, "epoch": 3663} {"train_loss": -6.722467422485352, "global_step": 153871, "epoch": 3663} {"train_loss": -6.744206428527832, "global_step": 153872, "epoch": 3663} {"train_loss": -6.600641250610352, "global_step": 153873, "epoch": 3663} {"train_loss": -6.682483673095703, "global_step": 153874, "epoch": 3663} {"train_loss": -6.707670211791992, "global_step": 153875, "epoch": 3663} {"train_loss": -6.837752342224121, "global_step": 153876, "epoch": 3663} {"train_loss": -6.6618571281433105, "global_step": 153877, "epoch": 3663} {"train_loss": -6.665002822875977, "global_step": 153878, "epoch": 3663} {"train_loss": -6.875014305114746, "global_step": 153879, "epoch": 3663} {"train_loss": -6.803843021392822, "global_step": 153880, "epoch": 3663} {"train_loss": -6.767393589019775, "global_step": 153881, "epoch": 3663} {"train_loss": -6.7992472648620605, "global_step": 153882, "epoch": 3663} {"train_loss": -6.86458158493042, "global_step": 153883, "epoch": 3663} {"train_loss": -6.71553897857666, "global_step": 153884, "epoch": 3663} {"train_loss": -6.805026054382324, "global_step": 153885, "epoch": 3663} {"train_loss": -6.721724510192871, "global_step": 153886, "epoch": 3663} {"train_loss": -6.770788374401274, "global_step": 153887, "epoch": 3663, "val_loss": 68502.96875} {"train_loss": -6.945058822631836, "global_step": 153888, "epoch": 3664} {"train_loss": -6.798600196838379, "global_step": 153889, "epoch": 3664} {"train_loss": -6.847623825073242, "global_step": 153890, "epoch": 3664} {"train_loss": -6.763880729675293, "global_step": 153891, "epoch": 3664} {"train_loss": -6.762571334838867, "global_step": 153892, "epoch": 3664} {"train_loss": -6.903865337371826, "global_step": 153893, "epoch": 3664} {"train_loss": -6.811348915100098, "global_step": 153894, "epoch": 3664} {"train_loss": -6.868011474609375, "global_step": 153895, "epoch": 3664} {"train_loss": -6.73332405090332, "global_step": 153896, "epoch": 3664} {"train_loss": -6.808632850646973, "global_step": 153897, "epoch": 3664} {"train_loss": -6.717818737030029, "global_step": 153898, "epoch": 3664} {"train_loss": -6.840029716491699, "global_step": 153899, "epoch": 3664} {"train_loss": -6.8057966232299805, "global_step": 153900, "epoch": 3664} {"train_loss": -6.918082237243652, "global_step": 153901, "epoch": 3664} {"train_loss": -6.79028844833374, "global_step": 153902, "epoch": 3664} {"train_loss": -6.913599014282227, "global_step": 153903, "epoch": 3664} {"train_loss": -6.67003870010376, "global_step": 153904, "epoch": 3664} {"train_loss": -6.845222473144531, "global_step": 153905, "epoch": 3664} {"train_loss": -6.823963165283203, "global_step": 153906, "epoch": 3664} {"train_loss": -6.788461685180664, "global_step": 153907, "epoch": 3664} {"train_loss": -6.687809944152832, "global_step": 153908, "epoch": 3664} {"train_loss": -6.804698944091797, "global_step": 153909, "epoch": 3664} {"train_loss": -6.787248611450195, "global_step": 153910, "epoch": 3664} {"train_loss": -6.794070243835449, "global_step": 153911, "epoch": 3664} {"train_loss": -6.775812149047852, "global_step": 153912, "epoch": 3664} {"train_loss": -6.90512752532959, "global_step": 153913, "epoch": 3664} {"train_loss": -6.788581848144531, "global_step": 153914, "epoch": 3664} {"train_loss": -6.76639461517334, "global_step": 153915, "epoch": 3664} {"train_loss": -6.731433868408203, "global_step": 153916, "epoch": 3664} {"train_loss": -6.793271064758301, "global_step": 153917, "epoch": 3664} {"train_loss": -6.778643608093262, "global_step": 153918, "epoch": 3664} {"train_loss": -6.807732105255127, "global_step": 153919, "epoch": 3664} {"train_loss": -6.804941177368164, "global_step": 153920, "epoch": 3664} {"train_loss": -6.86049747467041, "global_step": 153921, "epoch": 3664} {"train_loss": -6.737894535064697, "global_step": 153922, "epoch": 3664} {"train_loss": -6.863102912902832, "global_step": 153923, "epoch": 3664} {"train_loss": -6.908686637878418, "global_step": 153924, "epoch": 3664} {"train_loss": -6.838954448699951, "global_step": 153925, "epoch": 3664} {"train_loss": -6.820367336273193, "global_step": 153926, "epoch": 3664} {"train_loss": -6.812484264373779, "global_step": 153927, "epoch": 3664} {"train_loss": -6.799271583557129, "global_step": 153928, "epoch": 3664} {"train_loss": -6.812565610522316, "global_step": 153929, "epoch": 3664, "val_loss": 68564.125} {"train_loss": -6.753754615783691, "global_step": 153930, "epoch": 3665} {"train_loss": -6.778672218322754, "global_step": 153931, "epoch": 3665} {"train_loss": -6.8686628341674805, "global_step": 153932, "epoch": 3665} {"train_loss": -6.848207473754883, "global_step": 153933, "epoch": 3665} {"train_loss": -6.89927339553833, "global_step": 153934, "epoch": 3665} {"train_loss": -6.806755065917969, "global_step": 153935, "epoch": 3665} {"train_loss": -6.783979892730713, "global_step": 153936, "epoch": 3665} {"train_loss": -6.877342224121094, "global_step": 153937, "epoch": 3665} {"train_loss": -6.908644676208496, "global_step": 153938, "epoch": 3665} {"train_loss": -6.785897731781006, "global_step": 153939, "epoch": 3665} {"train_loss": -6.844698905944824, "global_step": 153940, "epoch": 3665} {"train_loss": -6.838929653167725, "global_step": 153941, "epoch": 3665} {"train_loss": -6.917309761047363, "global_step": 153942, "epoch": 3665} {"train_loss": -6.8334550857543945, "global_step": 153943, "epoch": 3665} {"train_loss": -6.869441032409668, "global_step": 153944, "epoch": 3665} {"train_loss": -6.861666679382324, "global_step": 153945, "epoch": 3665} {"train_loss": -6.824455261230469, "global_step": 153946, "epoch": 3665} {"train_loss": -6.827915191650391, "global_step": 153947, "epoch": 3665} {"train_loss": -6.8905181884765625, "global_step": 153948, "epoch": 3665} {"train_loss": -6.924346923828125, "global_step": 153949, "epoch": 3665} {"train_loss": -6.901673316955566, "global_step": 153950, "epoch": 3665} {"train_loss": -6.936473846435547, "global_step": 153951, "epoch": 3665} {"train_loss": -6.971930503845215, "global_step": 153952, "epoch": 3665} {"train_loss": -6.820553302764893, "global_step": 153953, "epoch": 3665} {"train_loss": -6.864692687988281, "global_step": 153954, "epoch": 3665} {"train_loss": -6.927632808685303, "global_step": 153955, "epoch": 3665} {"train_loss": -6.903346538543701, "global_step": 153956, "epoch": 3665} {"train_loss": -6.956183433532715, "global_step": 153957, "epoch": 3665} {"train_loss": -6.888422966003418, "global_step": 153958, "epoch": 3665} {"train_loss": -6.82781982421875, "global_step": 153959, "epoch": 3665} {"train_loss": -6.877869129180908, "global_step": 153960, "epoch": 3665} {"train_loss": -6.918032646179199, "global_step": 153961, "epoch": 3665} {"train_loss": -6.7846903800964355, "global_step": 153962, "epoch": 3665} {"train_loss": -6.84124755859375, "global_step": 153963, "epoch": 3665} {"train_loss": -6.928495407104492, "global_step": 153964, "epoch": 3665} {"train_loss": -6.805912971496582, "global_step": 153965, "epoch": 3665} {"train_loss": -6.77630615234375, "global_step": 153966, "epoch": 3665} {"train_loss": -6.834842681884766, "global_step": 153967, "epoch": 3665} {"train_loss": -6.8620076179504395, "global_step": 153968, "epoch": 3665} {"train_loss": -6.84234619140625, "global_step": 153969, "epoch": 3665} {"train_loss": -6.83506965637207, "global_step": 153970, "epoch": 3665} {"train_loss": -6.860355377197266, "global_step": 153971, "epoch": 3665, "val_loss": 68656.921875} {"train_loss": -6.9165120124816895, "global_step": 153972, "epoch": 3666} {"train_loss": -6.91538143157959, "global_step": 153973, "epoch": 3666} {"train_loss": -6.922560691833496, "global_step": 153974, "epoch": 3666} {"train_loss": -6.862211227416992, "global_step": 153975, "epoch": 3666} {"train_loss": -6.854328155517578, "global_step": 153976, "epoch": 3666} {"train_loss": -6.95829963684082, "global_step": 153977, "epoch": 3666} {"train_loss": -6.893096923828125, "global_step": 153978, "epoch": 3666} {"train_loss": -6.852168083190918, "global_step": 153979, "epoch": 3666} {"train_loss": -6.912817001342773, "global_step": 153980, "epoch": 3666} {"train_loss": -6.925731182098389, "global_step": 153981, "epoch": 3666} {"train_loss": -6.854940414428711, "global_step": 153982, "epoch": 3666} {"train_loss": -6.882590293884277, "global_step": 153983, "epoch": 3666} {"train_loss": -6.768930912017822, "global_step": 153984, "epoch": 3666} {"train_loss": -7.088798999786377, "global_step": 153985, "epoch": 3666} {"train_loss": -6.9250288009643555, "global_step": 153986, "epoch": 3666} {"train_loss": -6.871669292449951, "global_step": 153987, "epoch": 3666} {"train_loss": -6.872514724731445, "global_step": 153988, "epoch": 3666} {"train_loss": -6.9853410720825195, "global_step": 153989, "epoch": 3666} {"train_loss": -6.902865409851074, "global_step": 153990, "epoch": 3666} {"train_loss": -6.790794372558594, "global_step": 153991, "epoch": 3666} {"train_loss": -6.873979568481445, "global_step": 153992, "epoch": 3666} {"train_loss": -6.843150615692139, "global_step": 153993, "epoch": 3666} {"train_loss": -6.8718109130859375, "global_step": 153994, "epoch": 3666} {"train_loss": -6.945651054382324, "global_step": 153995, "epoch": 3666} {"train_loss": -6.837363243103027, "global_step": 153996, "epoch": 3666} {"train_loss": -6.884583950042725, "global_step": 153997, "epoch": 3666} {"train_loss": -6.882271766662598, "global_step": 153998, "epoch": 3666} {"train_loss": -6.814140319824219, "global_step": 153999, "epoch": 3666} {"train_loss": -7.010223388671875, "global_step": 154000, "epoch": 3666} {"train_loss": -6.774899959564209, "global_step": 154001, "epoch": 3666} {"train_loss": -6.833580493927002, "global_step": 154002, "epoch": 3666} {"train_loss": -6.909067630767822, "global_step": 154003, "epoch": 3666} {"train_loss": -6.8846845626831055, "global_step": 154004, "epoch": 3666} {"train_loss": -6.827667236328125, "global_step": 154005, "epoch": 3666} {"train_loss": -6.909322738647461, "global_step": 154006, "epoch": 3666} {"train_loss": -6.820708274841309, "global_step": 154007, "epoch": 3666} {"train_loss": -7.001698970794678, "global_step": 154008, "epoch": 3666} {"train_loss": -6.849635124206543, "global_step": 154009, "epoch": 3666} {"train_loss": -6.921178340911865, "global_step": 154010, "epoch": 3666} {"train_loss": -6.8420844078063965, "global_step": 154011, "epoch": 3666} {"train_loss": -6.9049177169799805, "global_step": 154012, "epoch": 3666} {"train_loss": -6.884188606625512, "global_step": 154013, "epoch": 3666, "val_loss": 68564.859375} {"train_loss": -6.854617118835449, "global_step": 154014, "epoch": 3667} {"train_loss": -6.881222724914551, "global_step": 154015, "epoch": 3667} {"train_loss": -6.828691005706787, "global_step": 154016, "epoch": 3667} {"train_loss": -6.855576515197754, "global_step": 154017, "epoch": 3667} {"train_loss": -6.85669469833374, "global_step": 154018, "epoch": 3667} {"train_loss": -6.769967079162598, "global_step": 154019, "epoch": 3667} {"train_loss": -6.835285663604736, "global_step": 154020, "epoch": 3667} {"train_loss": -6.857458591461182, "global_step": 154021, "epoch": 3667} {"train_loss": -6.822680950164795, "global_step": 154022, "epoch": 3667} {"train_loss": -6.915778160095215, "global_step": 154023, "epoch": 3667} {"train_loss": -6.891589164733887, "global_step": 154024, "epoch": 3667} {"train_loss": -6.681304454803467, "global_step": 154025, "epoch": 3667} {"train_loss": -6.825570106506348, "global_step": 154026, "epoch": 3667} {"train_loss": -6.953047275543213, "global_step": 154027, "epoch": 3667} {"train_loss": -6.742283821105957, "global_step": 154028, "epoch": 3667} {"train_loss": -6.894538879394531, "global_step": 154029, "epoch": 3667} {"train_loss": -6.820298194885254, "global_step": 154030, "epoch": 3667} {"train_loss": -6.800256729125977, "global_step": 154031, "epoch": 3667} {"train_loss": -6.748148441314697, "global_step": 154032, "epoch": 3667} {"train_loss": -6.840508460998535, "global_step": 154033, "epoch": 3667} {"train_loss": -6.855472564697266, "global_step": 154034, "epoch": 3667} {"train_loss": -6.7934675216674805, "global_step": 154035, "epoch": 3667} {"train_loss": -6.843297958374023, "global_step": 154036, "epoch": 3667} {"train_loss": -6.736611366271973, "global_step": 154037, "epoch": 3667} {"train_loss": -6.763317584991455, "global_step": 154038, "epoch": 3667} {"train_loss": -6.816468238830566, "global_step": 154039, "epoch": 3667} {"train_loss": -6.871685981750488, "global_step": 154040, "epoch": 3667} {"train_loss": -6.828268051147461, "global_step": 154041, "epoch": 3667} {"train_loss": -6.951122283935547, "global_step": 154042, "epoch": 3667} {"train_loss": -6.878195762634277, "global_step": 154043, "epoch": 3667} {"train_loss": -6.8573198318481445, "global_step": 154044, "epoch": 3667} {"train_loss": -6.821527481079102, "global_step": 154045, "epoch": 3667} {"train_loss": -6.930697917938232, "global_step": 154046, "epoch": 3667} {"train_loss": -6.7932963371276855, "global_step": 154047, "epoch": 3667} {"train_loss": -6.907115936279297, "global_step": 154048, "epoch": 3667} {"train_loss": -6.768429279327393, "global_step": 154049, "epoch": 3667} {"train_loss": -6.91697359085083, "global_step": 154050, "epoch": 3667} {"train_loss": -6.865545272827148, "global_step": 154051, "epoch": 3667} {"train_loss": -6.893215179443359, "global_step": 154052, "epoch": 3667} {"train_loss": -6.822056770324707, "global_step": 154053, "epoch": 3667} {"train_loss": -6.831202983856201, "global_step": 154054, "epoch": 3667} {"train_loss": -6.839407307761056, "global_step": 154055, "epoch": 3667, "val_loss": 68491.6953125} {"train_loss": -6.781349182128906, "global_step": 154056, "epoch": 3668} {"train_loss": -6.847723484039307, "global_step": 154057, "epoch": 3668} {"train_loss": -6.879724502563477, "global_step": 154058, "epoch": 3668} {"train_loss": -6.895359039306641, "global_step": 154059, "epoch": 3668} {"train_loss": -6.806375503540039, "global_step": 154060, "epoch": 3668} {"train_loss": -6.855469703674316, "global_step": 154061, "epoch": 3668} {"train_loss": -6.875054359436035, "global_step": 154062, "epoch": 3668} {"train_loss": -6.882891654968262, "global_step": 154063, "epoch": 3668} {"train_loss": -6.965458869934082, "global_step": 154064, "epoch": 3668} {"train_loss": -6.7990827560424805, "global_step": 154065, "epoch": 3668} {"train_loss": -6.862135887145996, "global_step": 154066, "epoch": 3668} {"train_loss": -6.8036956787109375, "global_step": 154067, "epoch": 3668} {"train_loss": -6.913087844848633, "global_step": 154068, "epoch": 3668} {"train_loss": -6.876758098602295, "global_step": 154069, "epoch": 3668} {"train_loss": -6.991476058959961, "global_step": 154070, "epoch": 3668} {"train_loss": -6.7802534103393555, "global_step": 154071, "epoch": 3668} {"train_loss": -7.035390853881836, "global_step": 154072, "epoch": 3668} {"train_loss": -6.976104736328125, "global_step": 154073, "epoch": 3668} {"train_loss": -6.914461135864258, "global_step": 154074, "epoch": 3668} {"train_loss": -6.915346145629883, "global_step": 154075, "epoch": 3668} {"train_loss": -6.937666416168213, "global_step": 154076, "epoch": 3668} {"train_loss": -6.882681846618652, "global_step": 154077, "epoch": 3668} {"train_loss": -6.8950324058532715, "global_step": 154078, "epoch": 3668} {"train_loss": -6.913207054138184, "global_step": 154079, "epoch": 3668} {"train_loss": -6.865224838256836, "global_step": 154080, "epoch": 3668} {"train_loss": -6.821868896484375, "global_step": 154081, "epoch": 3668} {"train_loss": -6.925475120544434, "global_step": 154082, "epoch": 3668} {"train_loss": -6.805593490600586, "global_step": 154083, "epoch": 3668} {"train_loss": -6.912698268890381, "global_step": 154084, "epoch": 3668} {"train_loss": -6.862234115600586, "global_step": 154085, "epoch": 3668} {"train_loss": -6.7648091316223145, "global_step": 154086, "epoch": 3668} {"train_loss": -6.846304893493652, "global_step": 154087, "epoch": 3668} {"train_loss": -6.697886943817139, "global_step": 154088, "epoch": 3668} {"train_loss": -6.773863792419434, "global_step": 154089, "epoch": 3668} {"train_loss": -6.821445941925049, "global_step": 154090, "epoch": 3668} {"train_loss": -6.6809844970703125, "global_step": 154091, "epoch": 3668} {"train_loss": -6.780672550201416, "global_step": 154092, "epoch": 3668} {"train_loss": -6.741695404052734, "global_step": 154093, "epoch": 3668} {"train_loss": -6.8278679847717285, "global_step": 154094, "epoch": 3668} {"train_loss": -6.66323709487915, "global_step": 154095, "epoch": 3668} {"train_loss": -6.85073184967041, "global_step": 154096, "epoch": 3668} {"train_loss": -6.847061577297392, "global_step": 154097, "epoch": 3668, "val_loss": 68674.1328125} {"train_loss": -6.738956451416016, "global_step": 154098, "epoch": 3669} {"train_loss": -6.782552719116211, "global_step": 154099, "epoch": 3669} {"train_loss": -6.73311710357666, "global_step": 154100, "epoch": 3669} {"train_loss": -6.819602012634277, "global_step": 154101, "epoch": 3669} {"train_loss": -6.790222644805908, "global_step": 154102, "epoch": 3669} {"train_loss": -6.736461639404297, "global_step": 154103, "epoch": 3669} {"train_loss": -6.862062454223633, "global_step": 154104, "epoch": 3669} {"train_loss": -6.800084114074707, "global_step": 154105, "epoch": 3669} {"train_loss": -6.788899898529053, "global_step": 154106, "epoch": 3669} {"train_loss": -6.8466691970825195, "global_step": 154107, "epoch": 3669} {"train_loss": -6.769656181335449, "global_step": 154108, "epoch": 3669} {"train_loss": -6.8401408195495605, "global_step": 154109, "epoch": 3669} {"train_loss": -6.886656284332275, "global_step": 154110, "epoch": 3669} {"train_loss": -6.798487663269043, "global_step": 154111, "epoch": 3669} {"train_loss": -6.770658016204834, "global_step": 154112, "epoch": 3669} {"train_loss": -6.819815635681152, "global_step": 154113, "epoch": 3669} {"train_loss": -6.951885223388672, "global_step": 154114, "epoch": 3669} {"train_loss": -6.744623184204102, "global_step": 154115, "epoch": 3669} {"train_loss": -6.774060249328613, "global_step": 154116, "epoch": 3669} {"train_loss": -6.886258125305176, "global_step": 154117, "epoch": 3669} {"train_loss": -6.854726791381836, "global_step": 154118, "epoch": 3669} {"train_loss": -6.750330924987793, "global_step": 154119, "epoch": 3669} {"train_loss": -6.882494926452637, "global_step": 154120, "epoch": 3669} {"train_loss": -6.803218841552734, "global_step": 154121, "epoch": 3669} {"train_loss": -6.806674957275391, "global_step": 154122, "epoch": 3669} {"train_loss": -6.843847751617432, "global_step": 154123, "epoch": 3669} {"train_loss": -6.782157897949219, "global_step": 154124, "epoch": 3669} {"train_loss": -6.866089820861816, "global_step": 154125, "epoch": 3669} {"train_loss": -6.732977867126465, "global_step": 154126, "epoch": 3669} {"train_loss": -6.785257816314697, "global_step": 154127, "epoch": 3669} {"train_loss": -6.981751441955566, "global_step": 154128, "epoch": 3669} {"train_loss": -7.0231757164001465, "global_step": 154129, "epoch": 3669} {"train_loss": -6.710195541381836, "global_step": 154130, "epoch": 3669} {"train_loss": -6.955477237701416, "global_step": 154131, "epoch": 3669} {"train_loss": -6.947484016418457, "global_step": 154132, "epoch": 3669} {"train_loss": -6.870802879333496, "global_step": 154133, "epoch": 3669} {"train_loss": -6.915335655212402, "global_step": 154134, "epoch": 3669} {"train_loss": -6.757562637329102, "global_step": 154135, "epoch": 3669} {"train_loss": -6.915321350097656, "global_step": 154136, "epoch": 3669} {"train_loss": -6.826632499694824, "global_step": 154137, "epoch": 3669} {"train_loss": -6.847204208374023, "global_step": 154138, "epoch": 3669} {"train_loss": -6.832574322110131, "global_step": 154139, "epoch": 3669, "val_loss": 68485.5390625} {"train_loss": -6.959746360778809, "global_step": 154140, "epoch": 3670} {"train_loss": -6.923972129821777, "global_step": 154141, "epoch": 3670} {"train_loss": -6.875557899475098, "global_step": 154142, "epoch": 3670} {"train_loss": -6.844710350036621, "global_step": 154143, "epoch": 3670} {"train_loss": -6.952681541442871, "global_step": 154144, "epoch": 3670} {"train_loss": -6.720993518829346, "global_step": 154145, "epoch": 3670} {"train_loss": -6.808261871337891, "global_step": 154146, "epoch": 3670} {"train_loss": -6.815388202667236, "global_step": 154147, "epoch": 3670} {"train_loss": -6.757842063903809, "global_step": 154148, "epoch": 3670} {"train_loss": -6.902113437652588, "global_step": 154149, "epoch": 3670} {"train_loss": -6.823392868041992, "global_step": 154150, "epoch": 3670} {"train_loss": -6.8736138343811035, "global_step": 154151, "epoch": 3670} {"train_loss": -6.955449104309082, "global_step": 154152, "epoch": 3670} {"train_loss": -6.936982154846191, "global_step": 154153, "epoch": 3670} {"train_loss": -6.898877143859863, "global_step": 154154, "epoch": 3670} {"train_loss": -6.829108715057373, "global_step": 154155, "epoch": 3670} {"train_loss": -6.879598617553711, "global_step": 154156, "epoch": 3670} {"train_loss": -6.898975372314453, "global_step": 154157, "epoch": 3670} {"train_loss": -6.966793537139893, "global_step": 154158, "epoch": 3670} {"train_loss": -6.879899501800537, "global_step": 154159, "epoch": 3670} {"train_loss": -6.8048601150512695, "global_step": 154160, "epoch": 3670} {"train_loss": -6.872292995452881, "global_step": 154161, "epoch": 3670} {"train_loss": -7.001589775085449, "global_step": 154162, "epoch": 3670} {"train_loss": -6.875235557556152, "global_step": 154163, "epoch": 3670} {"train_loss": -6.868799209594727, "global_step": 154164, "epoch": 3670} {"train_loss": -7.041886329650879, "global_step": 154165, "epoch": 3670} {"train_loss": -6.856346130371094, "global_step": 154166, "epoch": 3670} {"train_loss": -6.8923726081848145, "global_step": 154167, "epoch": 3670} {"train_loss": -6.90963077545166, "global_step": 154168, "epoch": 3670} {"train_loss": -6.974414348602295, "global_step": 154169, "epoch": 3670} {"train_loss": -6.941064357757568, "global_step": 154170, "epoch": 3670} {"train_loss": -7.005579948425293, "global_step": 154171, "epoch": 3670} {"train_loss": -6.977692127227783, "global_step": 154172, "epoch": 3670} {"train_loss": -6.897741794586182, "global_step": 154173, "epoch": 3670} {"train_loss": -6.895434856414795, "global_step": 154174, "epoch": 3670} {"train_loss": -6.917996406555176, "global_step": 154175, "epoch": 3670} {"train_loss": -6.881741523742676, "global_step": 154176, "epoch": 3670} {"train_loss": -6.9053955078125, "global_step": 154177, "epoch": 3670} {"train_loss": -6.96447229385376, "global_step": 154178, "epoch": 3670} {"train_loss": -6.864574909210205, "global_step": 154179, "epoch": 3670} {"train_loss": -6.929498195648193, "global_step": 154180, "epoch": 3670} {"train_loss": -6.9000763438996815, "global_step": 154181, "epoch": 3670, "val_loss": 68352.1875} {"train_loss": -6.842329978942871, "global_step": 154182, "epoch": 3671} {"train_loss": -6.912932395935059, "global_step": 154183, "epoch": 3671} {"train_loss": -6.965712070465088, "global_step": 154184, "epoch": 3671} {"train_loss": -7.0369977951049805, "global_step": 154185, "epoch": 3671} {"train_loss": -6.886240005493164, "global_step": 154186, "epoch": 3671} {"train_loss": -7.039038181304932, "global_step": 154187, "epoch": 3671} {"train_loss": -6.919193744659424, "global_step": 154188, "epoch": 3671} {"train_loss": -6.957757949829102, "global_step": 154189, "epoch": 3671} {"train_loss": -7.011618614196777, "global_step": 154190, "epoch": 3671} {"train_loss": -6.835573673248291, "global_step": 154191, "epoch": 3671} {"train_loss": -6.917497634887695, "global_step": 154192, "epoch": 3671} {"train_loss": -6.920734882354736, "global_step": 154193, "epoch": 3671} {"train_loss": -6.924814224243164, "global_step": 154194, "epoch": 3671} {"train_loss": -6.833446502685547, "global_step": 154195, "epoch": 3671} {"train_loss": -6.939670562744141, "global_step": 154196, "epoch": 3671} {"train_loss": -6.833146095275879, "global_step": 154197, "epoch": 3671} {"train_loss": -6.780461311340332, "global_step": 154198, "epoch": 3671} {"train_loss": -6.917078018188477, "global_step": 154199, "epoch": 3671} {"train_loss": -6.8265204429626465, "global_step": 154200, "epoch": 3671} {"train_loss": -6.855213165283203, "global_step": 154201, "epoch": 3671} {"train_loss": -6.86544942855835, "global_step": 154202, "epoch": 3671} {"train_loss": -6.899909496307373, "global_step": 154203, "epoch": 3671} {"train_loss": -6.784771919250488, "global_step": 154204, "epoch": 3671} {"train_loss": -6.820391654968262, "global_step": 154205, "epoch": 3671} {"train_loss": -6.706849098205566, "global_step": 154206, "epoch": 3671} {"train_loss": -6.858336925506592, "global_step": 154207, "epoch": 3671} {"train_loss": -6.821732997894287, "global_step": 154208, "epoch": 3671} {"train_loss": -6.924686431884766, "global_step": 154209, "epoch": 3671} {"train_loss": -6.848509788513184, "global_step": 154210, "epoch": 3671} {"train_loss": -6.938655376434326, "global_step": 154211, "epoch": 3671} {"train_loss": -6.658147811889648, "global_step": 154212, "epoch": 3671} {"train_loss": -6.917558193206787, "global_step": 154213, "epoch": 3671} {"train_loss": -6.906841278076172, "global_step": 154214, "epoch": 3671} {"train_loss": -6.784661293029785, "global_step": 154215, "epoch": 3671} {"train_loss": -6.7569580078125, "global_step": 154216, "epoch": 3671} {"train_loss": -6.752688407897949, "global_step": 154217, "epoch": 3671} {"train_loss": -6.80446720123291, "global_step": 154218, "epoch": 3671} {"train_loss": -6.77459716796875, "global_step": 154219, "epoch": 3671} {"train_loss": -6.8045454025268555, "global_step": 154220, "epoch": 3671} {"train_loss": -6.883178234100342, "global_step": 154221, "epoch": 3671} {"train_loss": -6.733260154724121, "global_step": 154222, "epoch": 3671} {"train_loss": -6.864139159520467, "global_step": 154223, "epoch": 3671, "val_loss": 68740.0} {"train_loss": -6.770484447479248, "global_step": 154224, "epoch": 3672} {"train_loss": -6.803821563720703, "global_step": 154225, "epoch": 3672} {"train_loss": -6.9258809089660645, "global_step": 154226, "epoch": 3672} {"train_loss": -6.815791130065918, "global_step": 154227, "epoch": 3672} {"train_loss": -6.839434623718262, "global_step": 154228, "epoch": 3672} {"train_loss": -6.833464622497559, "global_step": 154229, "epoch": 3672} {"train_loss": -6.909124851226807, "global_step": 154230, "epoch": 3672} {"train_loss": -6.987881660461426, "global_step": 154231, "epoch": 3672} {"train_loss": -6.854942321777344, "global_step": 154232, "epoch": 3672} {"train_loss": -6.8492021560668945, "global_step": 154233, "epoch": 3672} {"train_loss": -6.8375244140625, "global_step": 154234, "epoch": 3672} {"train_loss": -6.910841464996338, "global_step": 154235, "epoch": 3672} {"train_loss": -6.849498271942139, "global_step": 154236, "epoch": 3672} {"train_loss": -6.799764156341553, "global_step": 154237, "epoch": 3672} {"train_loss": -6.870908260345459, "global_step": 154238, "epoch": 3672} {"train_loss": -6.9077372550964355, "global_step": 154239, "epoch": 3672} {"train_loss": -6.889297962188721, "global_step": 154240, "epoch": 3672} {"train_loss": -6.796564102172852, "global_step": 154241, "epoch": 3672} {"train_loss": -6.83691930770874, "global_step": 154242, "epoch": 3672} {"train_loss": -6.978460788726807, "global_step": 154243, "epoch": 3672} {"train_loss": -6.899836540222168, "global_step": 154244, "epoch": 3672} {"train_loss": -6.768237113952637, "global_step": 154245, "epoch": 3672} {"train_loss": -6.833256244659424, "global_step": 154246, "epoch": 3672} {"train_loss": -6.748076438903809, "global_step": 154247, "epoch": 3672} {"train_loss": -6.777253150939941, "global_step": 154248, "epoch": 3672} {"train_loss": -6.739971160888672, "global_step": 154249, "epoch": 3672} {"train_loss": -6.526655673980713, "global_step": 154250, "epoch": 3672} {"train_loss": -6.776723861694336, "global_step": 154251, "epoch": 3672} {"train_loss": -6.688992500305176, "global_step": 154252, "epoch": 3672} {"train_loss": -6.688136100769043, "global_step": 154253, "epoch": 3672} {"train_loss": -6.756551742553711, "global_step": 154254, "epoch": 3672} {"train_loss": -6.473441123962402, "global_step": 154255, "epoch": 3672} {"train_loss": -6.760067939758301, "global_step": 154256, "epoch": 3672} {"train_loss": -6.301878929138184, "global_step": 154257, "epoch": 3672} {"train_loss": -6.852687358856201, "global_step": 154258, "epoch": 3672} {"train_loss": -6.592179298400879, "global_step": 154259, "epoch": 3672} {"train_loss": -6.656097888946533, "global_step": 154260, "epoch": 3672} {"train_loss": -6.735074996948242, "global_step": 154261, "epoch": 3672} {"train_loss": -6.803982734680176, "global_step": 154262, "epoch": 3672} {"train_loss": -6.660362243652344, "global_step": 154263, "epoch": 3672} {"train_loss": -6.705885410308838, "global_step": 154264, "epoch": 3672} {"train_loss": -6.779019151415143, "global_step": 154265, "epoch": 3672, "val_loss": 68574.3984375} {"train_loss": -6.730463981628418, "global_step": 154266, "epoch": 3673} {"train_loss": -6.660239219665527, "global_step": 154267, "epoch": 3673} {"train_loss": -6.6482253074646, "global_step": 154268, "epoch": 3673} {"train_loss": -6.744763374328613, "global_step": 154269, "epoch": 3673} {"train_loss": -6.728219509124756, "global_step": 154270, "epoch": 3673} {"train_loss": -6.812783241271973, "global_step": 154271, "epoch": 3673} {"train_loss": -6.7643561363220215, "global_step": 154272, "epoch": 3673} {"train_loss": -6.807611465454102, "global_step": 154273, "epoch": 3673} {"train_loss": -6.820198059082031, "global_step": 154274, "epoch": 3673} {"train_loss": -6.762248992919922, "global_step": 154275, "epoch": 3673} {"train_loss": -6.815920829772949, "global_step": 154276, "epoch": 3673} {"train_loss": -6.798436164855957, "global_step": 154277, "epoch": 3673} {"train_loss": -6.795488357543945, "global_step": 154278, "epoch": 3673} {"train_loss": -6.7903971672058105, "global_step": 154279, "epoch": 3673} {"train_loss": -6.820898532867432, "global_step": 154280, "epoch": 3673} {"train_loss": -6.896511077880859, "global_step": 154281, "epoch": 3673} {"train_loss": -6.755642414093018, "global_step": 154282, "epoch": 3673} {"train_loss": -6.8830366134643555, "global_step": 154283, "epoch": 3673} {"train_loss": -6.775955677032471, "global_step": 154284, "epoch": 3673} {"train_loss": -6.850809097290039, "global_step": 154285, "epoch": 3673} {"train_loss": -6.923420429229736, "global_step": 154286, "epoch": 3673} {"train_loss": -6.900845527648926, "global_step": 154287, "epoch": 3673} {"train_loss": -6.88283109664917, "global_step": 154288, "epoch": 3673} {"train_loss": -6.819226264953613, "global_step": 154289, "epoch": 3673} {"train_loss": -6.8261613845825195, "global_step": 154290, "epoch": 3673} {"train_loss": -6.859361171722412, "global_step": 154291, "epoch": 3673} {"train_loss": -6.993597507476807, "global_step": 154292, "epoch": 3673} {"train_loss": -6.951386451721191, "global_step": 154293, "epoch": 3673} {"train_loss": -6.855076789855957, "global_step": 154294, "epoch": 3673} {"train_loss": -6.8245415687561035, "global_step": 154295, "epoch": 3673} {"train_loss": -6.862606048583984, "global_step": 154296, "epoch": 3673} {"train_loss": -6.847724437713623, "global_step": 154297, "epoch": 3673} {"train_loss": -6.808022499084473, "global_step": 154298, "epoch": 3673} {"train_loss": -6.8954973220825195, "global_step": 154299, "epoch": 3673} {"train_loss": -6.9498701095581055, "global_step": 154300, "epoch": 3673} {"train_loss": -6.854052543640137, "global_step": 154301, "epoch": 3673} {"train_loss": -6.863980293273926, "global_step": 154302, "epoch": 3673} {"train_loss": -6.85801362991333, "global_step": 154303, "epoch": 3673} {"train_loss": -6.953155994415283, "global_step": 154304, "epoch": 3673} {"train_loss": -6.832646369934082, "global_step": 154305, "epoch": 3673} {"train_loss": -6.835474014282227, "global_step": 154306, "epoch": 3673} {"train_loss": -6.83137709753854, "global_step": 154307, "epoch": 3673, "val_loss": 68586.9453125} {"train_loss": -6.828982353210449, "global_step": 154308, "epoch": 3674} {"train_loss": -6.928221702575684, "global_step": 154309, "epoch": 3674} {"train_loss": -6.923395156860352, "global_step": 154310, "epoch": 3674} {"train_loss": -6.811032772064209, "global_step": 154311, "epoch": 3674} {"train_loss": -6.956908226013184, "global_step": 154312, "epoch": 3674} {"train_loss": -6.891397953033447, "global_step": 154313, "epoch": 3674} {"train_loss": -6.858183860778809, "global_step": 154314, "epoch": 3674} {"train_loss": -6.921233177185059, "global_step": 154315, "epoch": 3674} {"train_loss": -6.825907230377197, "global_step": 154316, "epoch": 3674} {"train_loss": -6.935527801513672, "global_step": 154317, "epoch": 3674} {"train_loss": -6.979274749755859, "global_step": 154318, "epoch": 3674} {"train_loss": -6.893157958984375, "global_step": 154319, "epoch": 3674} {"train_loss": -6.945694923400879, "global_step": 154320, "epoch": 3674} {"train_loss": -6.8235650062561035, "global_step": 154321, "epoch": 3674} {"train_loss": -6.793458461761475, "global_step": 154322, "epoch": 3674} {"train_loss": -6.934207916259766, "global_step": 154323, "epoch": 3674} {"train_loss": -6.787397861480713, "global_step": 154324, "epoch": 3674} {"train_loss": -6.629398345947266, "global_step": 154325, "epoch": 3674} {"train_loss": -6.785031318664551, "global_step": 154326, "epoch": 3674} {"train_loss": -6.996935844421387, "global_step": 154327, "epoch": 3674} {"train_loss": -6.811553001403809, "global_step": 154328, "epoch": 3674} {"train_loss": -6.881431579589844, "global_step": 154329, "epoch": 3674} {"train_loss": -6.730510711669922, "global_step": 154330, "epoch": 3674} {"train_loss": -6.780069828033447, "global_step": 154331, "epoch": 3674} {"train_loss": -6.8732404708862305, "global_step": 154332, "epoch": 3674} {"train_loss": -6.938564300537109, "global_step": 154333, "epoch": 3674} {"train_loss": -6.9148335456848145, "global_step": 154334, "epoch": 3674} {"train_loss": -6.828124523162842, "global_step": 154335, "epoch": 3674} {"train_loss": -6.845171928405762, "global_step": 154336, "epoch": 3674} {"train_loss": -6.917541027069092, "global_step": 154337, "epoch": 3674} {"train_loss": -6.881251811981201, "global_step": 154338, "epoch": 3674} {"train_loss": -6.759511947631836, "global_step": 154339, "epoch": 3674} {"train_loss": -6.753800392150879, "global_step": 154340, "epoch": 3674} {"train_loss": -6.851625442504883, "global_step": 154341, "epoch": 3674} {"train_loss": -6.8432536125183105, "global_step": 154342, "epoch": 3674} {"train_loss": -6.967792510986328, "global_step": 154343, "epoch": 3674} {"train_loss": -6.833230972290039, "global_step": 154344, "epoch": 3674} {"train_loss": -6.780434608459473, "global_step": 154345, "epoch": 3674} {"train_loss": -6.894128799438477, "global_step": 154346, "epoch": 3674} {"train_loss": -6.8969221115112305, "global_step": 154347, "epoch": 3674} {"train_loss": -6.85731315612793, "global_step": 154348, "epoch": 3674} {"train_loss": -6.856029010954357, "global_step": 154349, "epoch": 3674, "val_loss": 68419.1328125} {"train_loss": -6.973494052886963, "global_step": 154350, "epoch": 3675} {"train_loss": -6.973770618438721, "global_step": 154351, "epoch": 3675} {"train_loss": -6.890729904174805, "global_step": 154352, "epoch": 3675} {"train_loss": -6.828432083129883, "global_step": 154353, "epoch": 3675} {"train_loss": -6.79112434387207, "global_step": 154354, "epoch": 3675} {"train_loss": -6.878830432891846, "global_step": 154355, "epoch": 3675} {"train_loss": -6.7851972579956055, "global_step": 154356, "epoch": 3675} {"train_loss": -6.926576614379883, "global_step": 154357, "epoch": 3675} {"train_loss": -6.863092422485352, "global_step": 154358, "epoch": 3675} {"train_loss": -6.843189239501953, "global_step": 154359, "epoch": 3675} {"train_loss": -6.874537467956543, "global_step": 154360, "epoch": 3675} {"train_loss": -6.875216484069824, "global_step": 154361, "epoch": 3675} {"train_loss": -6.885838508605957, "global_step": 154362, "epoch": 3675} {"train_loss": -6.862330436706543, "global_step": 154363, "epoch": 3675} {"train_loss": -6.820659637451172, "global_step": 154364, "epoch": 3675} {"train_loss": -6.924361705780029, "global_step": 154365, "epoch": 3675} {"train_loss": -6.911191463470459, "global_step": 154366, "epoch": 3675} {"train_loss": -6.884354591369629, "global_step": 154367, "epoch": 3675} {"train_loss": -6.91037654876709, "global_step": 154368, "epoch": 3675} {"train_loss": -6.7781782150268555, "global_step": 154369, "epoch": 3675} {"train_loss": -6.894780158996582, "global_step": 154370, "epoch": 3675} {"train_loss": -6.85391902923584, "global_step": 154371, "epoch": 3675} {"train_loss": -6.779684066772461, "global_step": 154372, "epoch": 3675} {"train_loss": -6.8683648109436035, "global_step": 154373, "epoch": 3675} {"train_loss": -6.726648330688477, "global_step": 154374, "epoch": 3675} {"train_loss": -6.734724521636963, "global_step": 154375, "epoch": 3675} {"train_loss": -6.814490795135498, "global_step": 154376, "epoch": 3675} {"train_loss": -6.51348876953125, "global_step": 154377, "epoch": 3675} {"train_loss": -6.570036888122559, "global_step": 154378, "epoch": 3675} {"train_loss": -6.627283573150635, "global_step": 154379, "epoch": 3675} {"train_loss": -6.7002434730529785, "global_step": 154380, "epoch": 3675} {"train_loss": -6.755830764770508, "global_step": 154381, "epoch": 3675} {"train_loss": -6.557145118713379, "global_step": 154382, "epoch": 3675} {"train_loss": -6.802777290344238, "global_step": 154383, "epoch": 3675} {"train_loss": -6.547076225280762, "global_step": 154384, "epoch": 3675} {"train_loss": -6.747475624084473, "global_step": 154385, "epoch": 3675} {"train_loss": -6.700568199157715, "global_step": 154386, "epoch": 3675} {"train_loss": -6.5258893966674805, "global_step": 154387, "epoch": 3675} {"train_loss": -6.628714561462402, "global_step": 154388, "epoch": 3675} {"train_loss": -6.678171634674072, "global_step": 154389, "epoch": 3675} {"train_loss": -6.728025436401367, "global_step": 154390, "epoch": 3675} {"train_loss": -6.782965682801747, "global_step": 154391, "epoch": 3675, "val_loss": 68713.78125} {"train_loss": -6.748388290405273, "global_step": 154392, "epoch": 3676} {"train_loss": -6.748684406280518, "global_step": 154393, "epoch": 3676} {"train_loss": -6.81998348236084, "global_step": 154394, "epoch": 3676} {"train_loss": -6.642670631408691, "global_step": 154395, "epoch": 3676} {"train_loss": -6.779515266418457, "global_step": 154396, "epoch": 3676} {"train_loss": -6.762733459472656, "global_step": 154397, "epoch": 3676} {"train_loss": -6.818121433258057, "global_step": 154398, "epoch": 3676} {"train_loss": -6.781248092651367, "global_step": 154399, "epoch": 3676} {"train_loss": -6.823186874389648, "global_step": 154400, "epoch": 3676} {"train_loss": -6.897719383239746, "global_step": 154401, "epoch": 3676} {"train_loss": -6.895412921905518, "global_step": 154402, "epoch": 3676} {"train_loss": -6.870461940765381, "global_step": 154403, "epoch": 3676} {"train_loss": -6.812463283538818, "global_step": 154404, "epoch": 3676} {"train_loss": -6.941249847412109, "global_step": 154405, "epoch": 3676} {"train_loss": -6.827247619628906, "global_step": 154406, "epoch": 3676} {"train_loss": -6.788521766662598, "global_step": 154407, "epoch": 3676} {"train_loss": -6.865908622741699, "global_step": 154408, "epoch": 3676} {"train_loss": -6.869349956512451, "global_step": 154409, "epoch": 3676} {"train_loss": -6.814873695373535, "global_step": 154410, "epoch": 3676} {"train_loss": -6.878842830657959, "global_step": 154411, "epoch": 3676} {"train_loss": -6.7789082527160645, "global_step": 154412, "epoch": 3676} {"train_loss": -6.870773792266846, "global_step": 154413, "epoch": 3676} {"train_loss": -6.890386581420898, "global_step": 154414, "epoch": 3676} {"train_loss": -6.913296222686768, "global_step": 154415, "epoch": 3676} {"train_loss": -6.7319254875183105, "global_step": 154416, "epoch": 3676} {"train_loss": -6.838618278503418, "global_step": 154417, "epoch": 3676} {"train_loss": -6.845006942749023, "global_step": 154418, "epoch": 3676} {"train_loss": -7.018579959869385, "global_step": 154419, "epoch": 3676} {"train_loss": -6.896508693695068, "global_step": 154420, "epoch": 3676} {"train_loss": -6.893354415893555, "global_step": 154421, "epoch": 3676} {"train_loss": -6.855463981628418, "global_step": 154422, "epoch": 3676} {"train_loss": -6.832377910614014, "global_step": 154423, "epoch": 3676} {"train_loss": -6.716246604919434, "global_step": 154424, "epoch": 3676} {"train_loss": -6.8615593910217285, "global_step": 154425, "epoch": 3676} {"train_loss": -6.798516273498535, "global_step": 154426, "epoch": 3676} {"train_loss": -6.860189914703369, "global_step": 154427, "epoch": 3676} {"train_loss": -6.761388778686523, "global_step": 154428, "epoch": 3676} {"train_loss": -6.819411754608154, "global_step": 154429, "epoch": 3676} {"train_loss": -6.813514709472656, "global_step": 154430, "epoch": 3676} {"train_loss": -6.844146251678467, "global_step": 154431, "epoch": 3676} {"train_loss": -6.896661758422852, "global_step": 154432, "epoch": 3676} {"train_loss": -6.835068316686721, "global_step": 154433, "epoch": 3676, "val_loss": 68504.515625} {"train_loss": -6.858007431030273, "global_step": 154434, "epoch": 3677} {"train_loss": -6.910286903381348, "global_step": 154435, "epoch": 3677} {"train_loss": -6.89368200302124, "global_step": 154436, "epoch": 3677} {"train_loss": -6.984563827514648, "global_step": 154437, "epoch": 3677} {"train_loss": -6.870339393615723, "global_step": 154438, "epoch": 3677} {"train_loss": -6.826144218444824, "global_step": 154439, "epoch": 3677} {"train_loss": -6.682372570037842, "global_step": 154440, "epoch": 3677} {"train_loss": -6.762945652008057, "global_step": 154441, "epoch": 3677} {"train_loss": -6.793351650238037, "global_step": 154442, "epoch": 3677} {"train_loss": -6.752750396728516, "global_step": 154443, "epoch": 3677} {"train_loss": -6.965173244476318, "global_step": 154444, "epoch": 3677} {"train_loss": -6.757560729980469, "global_step": 154445, "epoch": 3677} {"train_loss": -6.85493278503418, "global_step": 154446, "epoch": 3677} {"train_loss": -6.784865856170654, "global_step": 154447, "epoch": 3677} {"train_loss": -6.731043338775635, "global_step": 154448, "epoch": 3677} {"train_loss": -6.796640396118164, "global_step": 154449, "epoch": 3677} {"train_loss": -6.91918420791626, "global_step": 154450, "epoch": 3677} {"train_loss": -6.740467071533203, "global_step": 154451, "epoch": 3677} {"train_loss": -6.781427383422852, "global_step": 154452, "epoch": 3677} {"train_loss": -6.8050737380981445, "global_step": 154453, "epoch": 3677} {"train_loss": -6.818009376525879, "global_step": 154454, "epoch": 3677} {"train_loss": -6.7549028396606445, "global_step": 154455, "epoch": 3677} {"train_loss": -6.822149276733398, "global_step": 154456, "epoch": 3677} {"train_loss": -6.83262825012207, "global_step": 154457, "epoch": 3677} {"train_loss": -6.753931999206543, "global_step": 154458, "epoch": 3677} {"train_loss": -6.848689556121826, "global_step": 154459, "epoch": 3677} {"train_loss": -6.856500148773193, "global_step": 154460, "epoch": 3677} {"train_loss": -6.775635719299316, "global_step": 154461, "epoch": 3677} {"train_loss": -6.840022087097168, "global_step": 154462, "epoch": 3677} {"train_loss": -6.8730974197387695, "global_step": 154463, "epoch": 3677} {"train_loss": -6.911844730377197, "global_step": 154464, "epoch": 3677} {"train_loss": -6.797163009643555, "global_step": 154465, "epoch": 3677} {"train_loss": -6.929466247558594, "global_step": 154466, "epoch": 3677} {"train_loss": -6.777482032775879, "global_step": 154467, "epoch": 3677} {"train_loss": -6.787073135375977, "global_step": 154468, "epoch": 3677} {"train_loss": -6.826137065887451, "global_step": 154469, "epoch": 3677} {"train_loss": -6.812376022338867, "global_step": 154470, "epoch": 3677} {"train_loss": -6.6765971183776855, "global_step": 154471, "epoch": 3677} {"train_loss": -6.872320652008057, "global_step": 154472, "epoch": 3677} {"train_loss": -6.817419052124023, "global_step": 154473, "epoch": 3677} {"train_loss": -6.7262115478515625, "global_step": 154474, "epoch": 3677} {"train_loss": -6.819071190697806, "global_step": 154475, "epoch": 3677, "val_loss": 68510.2890625} {"train_loss": -6.747376441955566, "global_step": 154476, "epoch": 3678} {"train_loss": -6.813720703125, "global_step": 154477, "epoch": 3678} {"train_loss": -6.9365644454956055, "global_step": 154478, "epoch": 3678} {"train_loss": -6.708820819854736, "global_step": 154479, "epoch": 3678} {"train_loss": -6.763727188110352, "global_step": 154480, "epoch": 3678} {"train_loss": -6.91471004486084, "global_step": 154481, "epoch": 3678} {"train_loss": -6.770976543426514, "global_step": 154482, "epoch": 3678} {"train_loss": -6.907805442810059, "global_step": 154483, "epoch": 3678} {"train_loss": -6.706743240356445, "global_step": 154484, "epoch": 3678} {"train_loss": -6.707014083862305, "global_step": 154485, "epoch": 3678} {"train_loss": -6.789504051208496, "global_step": 154486, "epoch": 3678} {"train_loss": -6.6506028175354, "global_step": 154487, "epoch": 3678} {"train_loss": -6.838118553161621, "global_step": 154488, "epoch": 3678} {"train_loss": -6.844973564147949, "global_step": 154489, "epoch": 3678} {"train_loss": -6.880067825317383, "global_step": 154490, "epoch": 3678} {"train_loss": -6.811960220336914, "global_step": 154491, "epoch": 3678} {"train_loss": -6.784360885620117, "global_step": 154492, "epoch": 3678} {"train_loss": -6.862735748291016, "global_step": 154493, "epoch": 3678} {"train_loss": -6.738825798034668, "global_step": 154494, "epoch": 3678} {"train_loss": -6.776168346405029, "global_step": 154495, "epoch": 3678} {"train_loss": -6.649863243103027, "global_step": 154496, "epoch": 3678} {"train_loss": -6.757887840270996, "global_step": 154497, "epoch": 3678} {"train_loss": -6.907862663269043, "global_step": 154498, "epoch": 3678} {"train_loss": -6.860849857330322, "global_step": 154499, "epoch": 3678} {"train_loss": -6.7793660163879395, "global_step": 154500, "epoch": 3678} {"train_loss": -6.878579616546631, "global_step": 154501, "epoch": 3678} {"train_loss": -6.837183952331543, "global_step": 154502, "epoch": 3678} {"train_loss": -6.8692402839660645, "global_step": 154503, "epoch": 3678} {"train_loss": -6.837412357330322, "global_step": 154504, "epoch": 3678} {"train_loss": -6.923906326293945, "global_step": 154505, "epoch": 3678} {"train_loss": -6.708260536193848, "global_step": 154506, "epoch": 3678} {"train_loss": -6.956730365753174, "global_step": 154507, "epoch": 3678} {"train_loss": -6.8847784996032715, "global_step": 154508, "epoch": 3678} {"train_loss": -6.862849712371826, "global_step": 154509, "epoch": 3678} {"train_loss": -6.919411659240723, "global_step": 154510, "epoch": 3678} {"train_loss": -6.9079155921936035, "global_step": 154511, "epoch": 3678} {"train_loss": -6.867847919464111, "global_step": 154512, "epoch": 3678} {"train_loss": -6.856043338775635, "global_step": 154513, "epoch": 3678} {"train_loss": -6.858137130737305, "global_step": 154514, "epoch": 3678} {"train_loss": -7.007246971130371, "global_step": 154515, "epoch": 3678} {"train_loss": -6.864964008331299, "global_step": 154516, "epoch": 3678} {"train_loss": -6.826994396391369, "global_step": 154517, "epoch": 3678, "val_loss": 68608.921875} {"train_loss": -6.8677897453308105, "global_step": 154518, "epoch": 3679} {"train_loss": -6.7331624031066895, "global_step": 154519, "epoch": 3679} {"train_loss": -6.900918960571289, "global_step": 154520, "epoch": 3679} {"train_loss": -6.784363746643066, "global_step": 154521, "epoch": 3679} {"train_loss": -6.822851181030273, "global_step": 154522, "epoch": 3679} {"train_loss": -6.859025955200195, "global_step": 154523, "epoch": 3679} {"train_loss": -6.888649940490723, "global_step": 154524, "epoch": 3679} {"train_loss": -6.861483097076416, "global_step": 154525, "epoch": 3679} {"train_loss": -6.852303504943848, "global_step": 154526, "epoch": 3679} {"train_loss": -6.8448166847229, "global_step": 154527, "epoch": 3679} {"train_loss": -6.799561023712158, "global_step": 154528, "epoch": 3679} {"train_loss": -6.95780086517334, "global_step": 154529, "epoch": 3679} {"train_loss": -6.8306121826171875, "global_step": 154530, "epoch": 3679} {"train_loss": -6.970587730407715, "global_step": 154531, "epoch": 3679} {"train_loss": -7.018225193023682, "global_step": 154532, "epoch": 3679} {"train_loss": -6.9981160163879395, "global_step": 154533, "epoch": 3679} {"train_loss": -6.966695785522461, "global_step": 154534, "epoch": 3679} {"train_loss": -6.9478888511657715, "global_step": 154535, "epoch": 3679} {"train_loss": -6.959762096405029, "global_step": 154536, "epoch": 3679} {"train_loss": -6.85324764251709, "global_step": 154537, "epoch": 3679} {"train_loss": -6.886161804199219, "global_step": 154538, "epoch": 3679} {"train_loss": -6.856226444244385, "global_step": 154539, "epoch": 3679} {"train_loss": -6.867049217224121, "global_step": 154540, "epoch": 3679} {"train_loss": -6.79780387878418, "global_step": 154541, "epoch": 3679} {"train_loss": -6.9104743003845215, "global_step": 154542, "epoch": 3679} {"train_loss": -6.874220371246338, "global_step": 154543, "epoch": 3679} {"train_loss": -6.857546329498291, "global_step": 154544, "epoch": 3679} {"train_loss": -6.964311599731445, "global_step": 154545, "epoch": 3679} {"train_loss": -6.893613815307617, "global_step": 154546, "epoch": 3679} {"train_loss": -6.857478141784668, "global_step": 154547, "epoch": 3679} {"train_loss": -6.898769378662109, "global_step": 154548, "epoch": 3679} {"train_loss": -6.777652740478516, "global_step": 154549, "epoch": 3679} {"train_loss": -6.8313398361206055, "global_step": 154550, "epoch": 3679} {"train_loss": -6.879024982452393, "global_step": 154551, "epoch": 3679} {"train_loss": -6.844048023223877, "global_step": 154552, "epoch": 3679} {"train_loss": -6.831478118896484, "global_step": 154553, "epoch": 3679} {"train_loss": -6.700039863586426, "global_step": 154554, "epoch": 3679} {"train_loss": -6.813240051269531, "global_step": 154555, "epoch": 3679} {"train_loss": -6.850592136383057, "global_step": 154556, "epoch": 3679} {"train_loss": -6.864105224609375, "global_step": 154557, "epoch": 3679} {"train_loss": -6.911664962768555, "global_step": 154558, "epoch": 3679} {"train_loss": -6.871452547255016, "global_step": 154559, "epoch": 3679, "val_loss": 68440.265625} {"train_loss": -6.858540058135986, "global_step": 154560, "epoch": 3680} {"train_loss": -6.979635238647461, "global_step": 154561, "epoch": 3680} {"train_loss": -6.867959022521973, "global_step": 154562, "epoch": 3680} {"train_loss": -6.809372901916504, "global_step": 154563, "epoch": 3680} {"train_loss": -6.876411437988281, "global_step": 154564, "epoch": 3680} {"train_loss": -6.8302106857299805, "global_step": 154565, "epoch": 3680} {"train_loss": -6.922390937805176, "global_step": 154566, "epoch": 3680} {"train_loss": -6.947447776794434, "global_step": 154567, "epoch": 3680} {"train_loss": -6.801893711090088, "global_step": 154568, "epoch": 3680} {"train_loss": -6.852911949157715, "global_step": 154569, "epoch": 3680} {"train_loss": -6.761775970458984, "global_step": 154570, "epoch": 3680} {"train_loss": -6.902939796447754, "global_step": 154571, "epoch": 3680} {"train_loss": -6.826403617858887, "global_step": 154572, "epoch": 3680} {"train_loss": -6.917156219482422, "global_step": 154573, "epoch": 3680} {"train_loss": -6.851520538330078, "global_step": 154574, "epoch": 3680} {"train_loss": -6.769463539123535, "global_step": 154575, "epoch": 3680} {"train_loss": -6.797377586364746, "global_step": 154576, "epoch": 3680} {"train_loss": -6.802094459533691, "global_step": 154577, "epoch": 3680} {"train_loss": -6.857687473297119, "global_step": 154578, "epoch": 3680} {"train_loss": -6.902186393737793, "global_step": 154579, "epoch": 3680} {"train_loss": -6.953192710876465, "global_step": 154580, "epoch": 3680} {"train_loss": -6.8913774490356445, "global_step": 154581, "epoch": 3680} {"train_loss": -6.872062683105469, "global_step": 154582, "epoch": 3680} {"train_loss": -6.964332580566406, "global_step": 154583, "epoch": 3680} {"train_loss": -6.835234642028809, "global_step": 154584, "epoch": 3680} {"train_loss": -6.913191795349121, "global_step": 154585, "epoch": 3680} {"train_loss": -6.962089538574219, "global_step": 154586, "epoch": 3680} {"train_loss": -6.820019721984863, "global_step": 154587, "epoch": 3680} {"train_loss": -6.9097394943237305, "global_step": 154588, "epoch": 3680} {"train_loss": -6.878959655761719, "global_step": 154589, "epoch": 3680} {"train_loss": -6.9353437423706055, "global_step": 154590, "epoch": 3680} {"train_loss": -7.00654935836792, "global_step": 154591, "epoch": 3680} {"train_loss": -6.9535746574401855, "global_step": 154592, "epoch": 3680} {"train_loss": -6.820918083190918, "global_step": 154593, "epoch": 3680} {"train_loss": -6.957764625549316, "global_step": 154594, "epoch": 3680} {"train_loss": -6.939294338226318, "global_step": 154595, "epoch": 3680} {"train_loss": -6.904789924621582, "global_step": 154596, "epoch": 3680} {"train_loss": -6.937697887420654, "global_step": 154597, "epoch": 3680} {"train_loss": -6.886959075927734, "global_step": 154598, "epoch": 3680} {"train_loss": -6.904183387756348, "global_step": 154599, "epoch": 3680} {"train_loss": -6.947609901428223, "global_step": 154600, "epoch": 3680} {"train_loss": -6.884218738192604, "global_step": 154601, "epoch": 3680, "val_loss": 68366.3125} {"train_loss": -6.843173027038574, "global_step": 154602, "epoch": 3681} {"train_loss": -6.853020191192627, "global_step": 154603, "epoch": 3681} {"train_loss": -6.947502136230469, "global_step": 154604, "epoch": 3681} {"train_loss": -6.951530456542969, "global_step": 154605, "epoch": 3681} {"train_loss": -6.844860076904297, "global_step": 154606, "epoch": 3681} {"train_loss": -6.820829391479492, "global_step": 154607, "epoch": 3681} {"train_loss": -6.873371124267578, "global_step": 154608, "epoch": 3681} {"train_loss": -6.861991882324219, "global_step": 154609, "epoch": 3681} {"train_loss": -7.058697700500488, "global_step": 154610, "epoch": 3681} {"train_loss": -6.8335652351379395, "global_step": 154611, "epoch": 3681} {"train_loss": -6.898316383361816, "global_step": 154612, "epoch": 3681} {"train_loss": -6.893455505371094, "global_step": 154613, "epoch": 3681} {"train_loss": -6.959793567657471, "global_step": 154614, "epoch": 3681} {"train_loss": -6.908829212188721, "global_step": 154615, "epoch": 3681} {"train_loss": -6.970754623413086, "global_step": 154616, "epoch": 3681} {"train_loss": -6.936013221740723, "global_step": 154617, "epoch": 3681} {"train_loss": -6.931156158447266, "global_step": 154618, "epoch": 3681} {"train_loss": -6.869540691375732, "global_step": 154619, "epoch": 3681} {"train_loss": -6.916135787963867, "global_step": 154620, "epoch": 3681} {"train_loss": -6.815855503082275, "global_step": 154621, "epoch": 3681} {"train_loss": -6.848493576049805, "global_step": 154622, "epoch": 3681} {"train_loss": -6.837057113647461, "global_step": 154623, "epoch": 3681} {"train_loss": -6.956106185913086, "global_step": 154624, "epoch": 3681} {"train_loss": -6.869822025299072, "global_step": 154625, "epoch": 3681} {"train_loss": -6.874121189117432, "global_step": 154626, "epoch": 3681} {"train_loss": -6.811639785766602, "global_step": 154627, "epoch": 3681} {"train_loss": -6.787347793579102, "global_step": 154628, "epoch": 3681} {"train_loss": -6.872489929199219, "global_step": 154629, "epoch": 3681} {"train_loss": -6.78857421875, "global_step": 154630, "epoch": 3681} {"train_loss": -6.785743713378906, "global_step": 154631, "epoch": 3681} {"train_loss": -6.880665302276611, "global_step": 154632, "epoch": 3681} {"train_loss": -6.734841346740723, "global_step": 154633, "epoch": 3681} {"train_loss": -6.8160600662231445, "global_step": 154634, "epoch": 3681} {"train_loss": -6.751563549041748, "global_step": 154635, "epoch": 3681} {"train_loss": -6.911470413208008, "global_step": 154636, "epoch": 3681} {"train_loss": -6.878264904022217, "global_step": 154637, "epoch": 3681} {"train_loss": -6.860013961791992, "global_step": 154638, "epoch": 3681} {"train_loss": -6.874449729919434, "global_step": 154639, "epoch": 3681} {"train_loss": -6.82722806930542, "global_step": 154640, "epoch": 3681} {"train_loss": -6.9162211418151855, "global_step": 154641, "epoch": 3681} {"train_loss": -6.946589469909668, "global_step": 154642, "epoch": 3681} {"train_loss": -6.870991184597924, "global_step": 154643, "epoch": 3681, "val_loss": 68405.78125} {"train_loss": -6.888638973236084, "global_step": 154644, "epoch": 3682} {"train_loss": -6.802855968475342, "global_step": 154645, "epoch": 3682} {"train_loss": -6.952176094055176, "global_step": 154646, "epoch": 3682} {"train_loss": -6.941624641418457, "global_step": 154647, "epoch": 3682} {"train_loss": -6.791843891143799, "global_step": 154648, "epoch": 3682} {"train_loss": -6.963123798370361, "global_step": 154649, "epoch": 3682} {"train_loss": -6.913103103637695, "global_step": 154650, "epoch": 3682} {"train_loss": -6.985547065734863, "global_step": 154651, "epoch": 3682} {"train_loss": -6.816615104675293, "global_step": 154652, "epoch": 3682} {"train_loss": -6.819369316101074, "global_step": 154653, "epoch": 3682} {"train_loss": -6.902135848999023, "global_step": 154654, "epoch": 3682} {"train_loss": -6.78819465637207, "global_step": 154655, "epoch": 3682} {"train_loss": -6.856217384338379, "global_step": 154656, "epoch": 3682} {"train_loss": -6.870306968688965, "global_step": 154657, "epoch": 3682} {"train_loss": -6.863861083984375, "global_step": 154658, "epoch": 3682} {"train_loss": -7.081722259521484, "global_step": 154659, "epoch": 3682} {"train_loss": -6.852936744689941, "global_step": 154660, "epoch": 3682} {"train_loss": -6.960537433624268, "global_step": 154661, "epoch": 3682} {"train_loss": -6.931400299072266, "global_step": 154662, "epoch": 3682} {"train_loss": -6.765387058258057, "global_step": 154663, "epoch": 3682} {"train_loss": -6.90792179107666, "global_step": 154664, "epoch": 3682} {"train_loss": -6.847853660583496, "global_step": 154665, "epoch": 3682} {"train_loss": -6.766944885253906, "global_step": 154666, "epoch": 3682} {"train_loss": -6.900580406188965, "global_step": 154667, "epoch": 3682} {"train_loss": -6.7751030921936035, "global_step": 154668, "epoch": 3682} {"train_loss": -6.776916027069092, "global_step": 154669, "epoch": 3682} {"train_loss": -6.759355545043945, "global_step": 154670, "epoch": 3682} {"train_loss": -6.799314022064209, "global_step": 154671, "epoch": 3682} {"train_loss": -6.860220909118652, "global_step": 154672, "epoch": 3682} {"train_loss": -6.917886257171631, "global_step": 154673, "epoch": 3682} {"train_loss": -6.712736129760742, "global_step": 154674, "epoch": 3682} {"train_loss": -6.78387451171875, "global_step": 154675, "epoch": 3682} {"train_loss": -6.902040481567383, "global_step": 154676, "epoch": 3682} {"train_loss": -6.703316688537598, "global_step": 154677, "epoch": 3682} {"train_loss": -6.807245254516602, "global_step": 154678, "epoch": 3682} {"train_loss": -6.864828109741211, "global_step": 154679, "epoch": 3682} {"train_loss": -6.8063859939575195, "global_step": 154680, "epoch": 3682} {"train_loss": -6.893940448760986, "global_step": 154681, "epoch": 3682} {"train_loss": -6.838537693023682, "global_step": 154682, "epoch": 3682} {"train_loss": -6.758749008178711, "global_step": 154683, "epoch": 3682} {"train_loss": -6.874204635620117, "global_step": 154684, "epoch": 3682} {"train_loss": -6.856761114937918, "global_step": 154685, "epoch": 3682, "val_loss": 68605.390625} {"train_loss": -6.885868549346924, "global_step": 154686, "epoch": 3683} {"train_loss": -6.8523335456848145, "global_step": 154687, "epoch": 3683} {"train_loss": -6.894101142883301, "global_step": 154688, "epoch": 3683} {"train_loss": -6.819868087768555, "global_step": 154689, "epoch": 3683} {"train_loss": -6.8340911865234375, "global_step": 154690, "epoch": 3683} {"train_loss": -6.826026439666748, "global_step": 154691, "epoch": 3683} {"train_loss": -6.713131904602051, "global_step": 154692, "epoch": 3683} {"train_loss": -6.9218316078186035, "global_step": 154693, "epoch": 3683} {"train_loss": -6.892184257507324, "global_step": 154694, "epoch": 3683} {"train_loss": -6.885340690612793, "global_step": 154695, "epoch": 3683} {"train_loss": -6.776412010192871, "global_step": 154696, "epoch": 3683} {"train_loss": -6.741463661193848, "global_step": 154697, "epoch": 3683} {"train_loss": -6.712008476257324, "global_step": 154698, "epoch": 3683} {"train_loss": -6.662487983703613, "global_step": 154699, "epoch": 3683} {"train_loss": -6.7428765296936035, "global_step": 154700, "epoch": 3683} {"train_loss": -6.764212131500244, "global_step": 154701, "epoch": 3683} {"train_loss": -6.73508358001709, "global_step": 154702, "epoch": 3683} {"train_loss": -6.671719551086426, "global_step": 154703, "epoch": 3683} {"train_loss": -6.843418121337891, "global_step": 154704, "epoch": 3683} {"train_loss": -6.753740310668945, "global_step": 154705, "epoch": 3683} {"train_loss": -6.775863170623779, "global_step": 154706, "epoch": 3683} {"train_loss": -6.829245567321777, "global_step": 154707, "epoch": 3683} {"train_loss": -6.818950653076172, "global_step": 154708, "epoch": 3683} {"train_loss": -6.96798038482666, "global_step": 154709, "epoch": 3683} {"train_loss": -6.652692794799805, "global_step": 154710, "epoch": 3683} {"train_loss": -6.799775123596191, "global_step": 154711, "epoch": 3683} {"train_loss": -6.9050445556640625, "global_step": 154712, "epoch": 3683} {"train_loss": -6.737363338470459, "global_step": 154713, "epoch": 3683} {"train_loss": -6.704769134521484, "global_step": 154714, "epoch": 3683} {"train_loss": -6.722959518432617, "global_step": 154715, "epoch": 3683} {"train_loss": -6.918887615203857, "global_step": 154716, "epoch": 3683} {"train_loss": -6.867199897766113, "global_step": 154717, "epoch": 3683} {"train_loss": -6.8673858642578125, "global_step": 154718, "epoch": 3683} {"train_loss": -6.839421272277832, "global_step": 154719, "epoch": 3683} {"train_loss": -6.839925765991211, "global_step": 154720, "epoch": 3683} {"train_loss": -6.856866359710693, "global_step": 154721, "epoch": 3683} {"train_loss": -6.835219383239746, "global_step": 154722, "epoch": 3683} {"train_loss": -6.9476141929626465, "global_step": 154723, "epoch": 3683} {"train_loss": -7.029308795928955, "global_step": 154724, "epoch": 3683} {"train_loss": -6.865725040435791, "global_step": 154725, "epoch": 3683} {"train_loss": -6.950834274291992, "global_step": 154726, "epoch": 3683} {"train_loss": -6.823634317943028, "global_step": 154727, "epoch": 3683, "val_loss": 68461.78125} {"train_loss": -6.8779144287109375, "global_step": 154728, "epoch": 3684} {"train_loss": -6.839313507080078, "global_step": 154729, "epoch": 3684} {"train_loss": -6.798336029052734, "global_step": 154730, "epoch": 3684} {"train_loss": -6.974693775177002, "global_step": 154731, "epoch": 3684} {"train_loss": -6.789813995361328, "global_step": 154732, "epoch": 3684} {"train_loss": -6.780155181884766, "global_step": 154733, "epoch": 3684} {"train_loss": -6.893409729003906, "global_step": 154734, "epoch": 3684} {"train_loss": -6.857209205627441, "global_step": 154735, "epoch": 3684} {"train_loss": -6.846409797668457, "global_step": 154736, "epoch": 3684} {"train_loss": -6.899885177612305, "global_step": 154737, "epoch": 3684} {"train_loss": -6.962310314178467, "global_step": 154738, "epoch": 3684} {"train_loss": -6.9140849113464355, "global_step": 154739, "epoch": 3684} {"train_loss": -6.995433807373047, "global_step": 154740, "epoch": 3684} {"train_loss": -6.946270942687988, "global_step": 154741, "epoch": 3684} {"train_loss": -6.80141544342041, "global_step": 154742, "epoch": 3684} {"train_loss": -6.856006145477295, "global_step": 154743, "epoch": 3684} {"train_loss": -6.994783401489258, "global_step": 154744, "epoch": 3684} {"train_loss": -6.790740966796875, "global_step": 154745, "epoch": 3684} {"train_loss": -6.914846897125244, "global_step": 154746, "epoch": 3684} {"train_loss": -6.9225969314575195, "global_step": 154747, "epoch": 3684} {"train_loss": -7.007500648498535, "global_step": 154748, "epoch": 3684} {"train_loss": -6.850316524505615, "global_step": 154749, "epoch": 3684} {"train_loss": -6.927554130554199, "global_step": 154750, "epoch": 3684} {"train_loss": -6.906798362731934, "global_step": 154751, "epoch": 3684} {"train_loss": -6.89462423324585, "global_step": 154752, "epoch": 3684} {"train_loss": -6.901480674743652, "global_step": 154753, "epoch": 3684} {"train_loss": -6.942235946655273, "global_step": 154754, "epoch": 3684} {"train_loss": -6.924884796142578, "global_step": 154755, "epoch": 3684} {"train_loss": -6.981795787811279, "global_step": 154756, "epoch": 3684} {"train_loss": -6.855587959289551, "global_step": 154757, "epoch": 3684} {"train_loss": -6.940142631530762, "global_step": 154758, "epoch": 3684} {"train_loss": -6.886293411254883, "global_step": 154759, "epoch": 3684} {"train_loss": -6.813714027404785, "global_step": 154760, "epoch": 3684} {"train_loss": -6.809231281280518, "global_step": 154761, "epoch": 3684} {"train_loss": -6.954768180847168, "global_step": 154762, "epoch": 3684} {"train_loss": -6.898872375488281, "global_step": 154763, "epoch": 3684} {"train_loss": -6.83141565322876, "global_step": 154764, "epoch": 3684} {"train_loss": -6.956360816955566, "global_step": 154765, "epoch": 3684} {"train_loss": -6.8530192375183105, "global_step": 154766, "epoch": 3684} {"train_loss": -6.850767135620117, "global_step": 154767, "epoch": 3684} {"train_loss": -6.872302055358887, "global_step": 154768, "epoch": 3684} {"train_loss": -6.886861812500727, "global_step": 154769, "epoch": 3684, "val_loss": 68570.6171875} {"train_loss": -6.850801467895508, "global_step": 154770, "epoch": 3685} {"train_loss": -6.760839462280273, "global_step": 154771, "epoch": 3685} {"train_loss": -6.904269218444824, "global_step": 154772, "epoch": 3685} {"train_loss": -6.915760517120361, "global_step": 154773, "epoch": 3685} {"train_loss": -6.846475601196289, "global_step": 154774, "epoch": 3685} {"train_loss": -6.815313339233398, "global_step": 154775, "epoch": 3685} {"train_loss": -6.872832298278809, "global_step": 154776, "epoch": 3685} {"train_loss": -6.745362281799316, "global_step": 154777, "epoch": 3685} {"train_loss": -6.962224006652832, "global_step": 154778, "epoch": 3685} {"train_loss": -6.801533222198486, "global_step": 154779, "epoch": 3685} {"train_loss": -6.807372570037842, "global_step": 154780, "epoch": 3685} {"train_loss": -6.87713623046875, "global_step": 154781, "epoch": 3685} {"train_loss": -6.895020484924316, "global_step": 154782, "epoch": 3685} {"train_loss": -6.971758842468262, "global_step": 154783, "epoch": 3685} {"train_loss": -6.779595851898193, "global_step": 154784, "epoch": 3685} {"train_loss": -6.760751724243164, "global_step": 154785, "epoch": 3685} {"train_loss": -6.917646408081055, "global_step": 154786, "epoch": 3685} {"train_loss": -6.872797966003418, "global_step": 154787, "epoch": 3685} {"train_loss": -6.8668012619018555, "global_step": 154788, "epoch": 3685} {"train_loss": -6.887633323669434, "global_step": 154789, "epoch": 3685} {"train_loss": -6.856957912445068, "global_step": 154790, "epoch": 3685} {"train_loss": -6.882201194763184, "global_step": 154791, "epoch": 3685} {"train_loss": -6.839526176452637, "global_step": 154792, "epoch": 3685} {"train_loss": -6.849050045013428, "global_step": 154793, "epoch": 3685} {"train_loss": -6.86472225189209, "global_step": 154794, "epoch": 3685} {"train_loss": -6.9027099609375, "global_step": 154795, "epoch": 3685} {"train_loss": -6.758673191070557, "global_step": 154796, "epoch": 3685} {"train_loss": -6.839776515960693, "global_step": 154797, "epoch": 3685} {"train_loss": -6.809510707855225, "global_step": 154798, "epoch": 3685} {"train_loss": -6.890456199645996, "global_step": 154799, "epoch": 3685} {"train_loss": -6.872511863708496, "global_step": 154800, "epoch": 3685} {"train_loss": -6.931210994720459, "global_step": 154801, "epoch": 3685} {"train_loss": -6.777002334594727, "global_step": 154802, "epoch": 3685} {"train_loss": -6.8534064292907715, "global_step": 154803, "epoch": 3685} {"train_loss": -6.8832221031188965, "global_step": 154804, "epoch": 3685} {"train_loss": -6.975934982299805, "global_step": 154805, "epoch": 3685} {"train_loss": -6.768452167510986, "global_step": 154806, "epoch": 3685} {"train_loss": -6.828005790710449, "global_step": 154807, "epoch": 3685} {"train_loss": -6.89302396774292, "global_step": 154808, "epoch": 3685} {"train_loss": -6.900184631347656, "global_step": 154809, "epoch": 3685} {"train_loss": -6.6915411949157715, "global_step": 154810, "epoch": 3685} {"train_loss": -6.852628412700835, "global_step": 154811, "epoch": 3685, "val_loss": 68450.2734375} {"train_loss": -6.819431304931641, "global_step": 154812, "epoch": 3686} {"train_loss": -7.017115592956543, "global_step": 154813, "epoch": 3686} {"train_loss": -6.870561599731445, "global_step": 154814, "epoch": 3686} {"train_loss": -6.810634613037109, "global_step": 154815, "epoch": 3686} {"train_loss": -6.787067413330078, "global_step": 154816, "epoch": 3686} {"train_loss": -6.821884632110596, "global_step": 154817, "epoch": 3686} {"train_loss": -6.814741134643555, "global_step": 154818, "epoch": 3686} {"train_loss": -6.814619541168213, "global_step": 154819, "epoch": 3686} {"train_loss": -6.882158279418945, "global_step": 154820, "epoch": 3686} {"train_loss": -6.792691707611084, "global_step": 154821, "epoch": 3686} {"train_loss": -6.832391262054443, "global_step": 154822, "epoch": 3686} {"train_loss": -6.864285469055176, "global_step": 154823, "epoch": 3686} {"train_loss": -6.814566612243652, "global_step": 154824, "epoch": 3686} {"train_loss": -6.756939888000488, "global_step": 154825, "epoch": 3686} {"train_loss": -6.840090751647949, "global_step": 154826, "epoch": 3686} {"train_loss": -6.771653175354004, "global_step": 154827, "epoch": 3686} {"train_loss": -7.000225067138672, "global_step": 154828, "epoch": 3686} {"train_loss": -6.848239898681641, "global_step": 154829, "epoch": 3686} {"train_loss": -6.885709762573242, "global_step": 154830, "epoch": 3686} {"train_loss": -6.804726600646973, "global_step": 154831, "epoch": 3686} {"train_loss": -6.8123698234558105, "global_step": 154832, "epoch": 3686} {"train_loss": -6.884482383728027, "global_step": 154833, "epoch": 3686} {"train_loss": -6.82561731338501, "global_step": 154834, "epoch": 3686} {"train_loss": -6.866107940673828, "global_step": 154835, "epoch": 3686} {"train_loss": -6.921689987182617, "global_step": 154836, "epoch": 3686} {"train_loss": -6.8914947509765625, "global_step": 154837, "epoch": 3686} {"train_loss": -6.770841598510742, "global_step": 154838, "epoch": 3686} {"train_loss": -6.824251174926758, "global_step": 154839, "epoch": 3686} {"train_loss": -6.839086055755615, "global_step": 154840, "epoch": 3686} {"train_loss": -6.912306308746338, "global_step": 154841, "epoch": 3686} {"train_loss": -6.898996353149414, "global_step": 154842, "epoch": 3686} {"train_loss": -6.883810043334961, "global_step": 154843, "epoch": 3686} {"train_loss": -6.911192893981934, "global_step": 154844, "epoch": 3686} {"train_loss": -6.831212997436523, "global_step": 154845, "epoch": 3686} {"train_loss": -6.821463584899902, "global_step": 154846, "epoch": 3686} {"train_loss": -6.808642387390137, "global_step": 154847, "epoch": 3686} {"train_loss": -6.906187057495117, "global_step": 154848, "epoch": 3686} {"train_loss": -6.827107906341553, "global_step": 154849, "epoch": 3686} {"train_loss": -6.915533065795898, "global_step": 154850, "epoch": 3686} {"train_loss": -6.803220748901367, "global_step": 154851, "epoch": 3686} {"train_loss": -6.867482662200928, "global_step": 154852, "epoch": 3686} {"train_loss": -6.8494007133302235, "global_step": 154853, "epoch": 3686, "val_loss": 68421.3203125} {"train_loss": -6.886276721954346, "global_step": 154854, "epoch": 3687} {"train_loss": -6.8200531005859375, "global_step": 154855, "epoch": 3687} {"train_loss": -6.874306678771973, "global_step": 154856, "epoch": 3687} {"train_loss": -6.890346527099609, "global_step": 154857, "epoch": 3687} {"train_loss": -6.8679656982421875, "global_step": 154858, "epoch": 3687} {"train_loss": -6.937384605407715, "global_step": 154859, "epoch": 3687} {"train_loss": -6.832440376281738, "global_step": 154860, "epoch": 3687} {"train_loss": -6.869015216827393, "global_step": 154861, "epoch": 3687} {"train_loss": -6.897570610046387, "global_step": 154862, "epoch": 3687} {"train_loss": -6.786667346954346, "global_step": 154863, "epoch": 3687} {"train_loss": -6.903934478759766, "global_step": 154864, "epoch": 3687} {"train_loss": -6.890862464904785, "global_step": 154865, "epoch": 3687} {"train_loss": -6.867144584655762, "global_step": 154866, "epoch": 3687} {"train_loss": -6.822598934173584, "global_step": 154867, "epoch": 3687} {"train_loss": -6.824526786804199, "global_step": 154868, "epoch": 3687} {"train_loss": -6.796760559082031, "global_step": 154869, "epoch": 3687} {"train_loss": -6.869980812072754, "global_step": 154870, "epoch": 3687} {"train_loss": -6.846931457519531, "global_step": 154871, "epoch": 3687} {"train_loss": -6.7937331199646, "global_step": 154872, "epoch": 3687} {"train_loss": -6.729737281799316, "global_step": 154873, "epoch": 3687} {"train_loss": -6.80661678314209, "global_step": 154874, "epoch": 3687} {"train_loss": -6.660312175750732, "global_step": 154875, "epoch": 3687} {"train_loss": -6.754822731018066, "global_step": 154876, "epoch": 3687} {"train_loss": -6.791268825531006, "global_step": 154877, "epoch": 3687} {"train_loss": -6.783452987670898, "global_step": 154878, "epoch": 3687} {"train_loss": -6.72050666809082, "global_step": 154879, "epoch": 3687} {"train_loss": -6.789006233215332, "global_step": 154880, "epoch": 3687} {"train_loss": -6.769447326660156, "global_step": 154881, "epoch": 3687} {"train_loss": -6.653990745544434, "global_step": 154882, "epoch": 3687} {"train_loss": -6.853621006011963, "global_step": 154883, "epoch": 3687} {"train_loss": -6.564022064208984, "global_step": 154884, "epoch": 3687} {"train_loss": -6.7859697341918945, "global_step": 154885, "epoch": 3687} {"train_loss": -6.753383636474609, "global_step": 154886, "epoch": 3687} {"train_loss": -6.664184093475342, "global_step": 154887, "epoch": 3687} {"train_loss": -6.7983880043029785, "global_step": 154888, "epoch": 3687} {"train_loss": -6.692776203155518, "global_step": 154889, "epoch": 3687} {"train_loss": -6.785595417022705, "global_step": 154890, "epoch": 3687} {"train_loss": -6.755209922790527, "global_step": 154891, "epoch": 3687} {"train_loss": -6.732048988342285, "global_step": 154892, "epoch": 3687} {"train_loss": -6.67720365524292, "global_step": 154893, "epoch": 3687} {"train_loss": -6.837459564208984, "global_step": 154894, "epoch": 3687} {"train_loss": -6.795424552190871, "global_step": 154895, "epoch": 3687, "val_loss": 68339.8671875} {"train_loss": -6.692676544189453, "global_step": 154896, "epoch": 3688} {"train_loss": -6.901673316955566, "global_step": 154897, "epoch": 3688} {"train_loss": -6.849786281585693, "global_step": 154898, "epoch": 3688} {"train_loss": -6.822844505310059, "global_step": 154899, "epoch": 3688} {"train_loss": -6.780622482299805, "global_step": 154900, "epoch": 3688} {"train_loss": -6.872497081756592, "global_step": 154901, "epoch": 3688} {"train_loss": -6.728122234344482, "global_step": 154902, "epoch": 3688} {"train_loss": -6.833125114440918, "global_step": 154903, "epoch": 3688} {"train_loss": -6.876220703125, "global_step": 154904, "epoch": 3688} {"train_loss": -6.7972869873046875, "global_step": 154905, "epoch": 3688} {"train_loss": -6.884085178375244, "global_step": 154906, "epoch": 3688} {"train_loss": -6.748958110809326, "global_step": 154907, "epoch": 3688} {"train_loss": -6.68189811706543, "global_step": 154908, "epoch": 3688} {"train_loss": -6.724417686462402, "global_step": 154909, "epoch": 3688} {"train_loss": -6.746201515197754, "global_step": 154910, "epoch": 3688} {"train_loss": -6.837430000305176, "global_step": 154911, "epoch": 3688} {"train_loss": -6.7931904792785645, "global_step": 154912, "epoch": 3688} {"train_loss": -6.782820224761963, "global_step": 154913, "epoch": 3688} {"train_loss": -6.690938472747803, "global_step": 154914, "epoch": 3688} {"train_loss": -6.875690460205078, "global_step": 154915, "epoch": 3688} {"train_loss": -6.803243637084961, "global_step": 154916, "epoch": 3688} {"train_loss": -6.7059478759765625, "global_step": 154917, "epoch": 3688} {"train_loss": -6.932103157043457, "global_step": 154918, "epoch": 3688} {"train_loss": -6.729830741882324, "global_step": 154919, "epoch": 3688} {"train_loss": -6.882914066314697, "global_step": 154920, "epoch": 3688} {"train_loss": -6.740825653076172, "global_step": 154921, "epoch": 3688} {"train_loss": -6.818258285522461, "global_step": 154922, "epoch": 3688} {"train_loss": -6.899178504943848, "global_step": 154923, "epoch": 3688} {"train_loss": -6.714329719543457, "global_step": 154924, "epoch": 3688} {"train_loss": -6.849941253662109, "global_step": 154925, "epoch": 3688} {"train_loss": -6.843625545501709, "global_step": 154926, "epoch": 3688} {"train_loss": -6.77571964263916, "global_step": 154927, "epoch": 3688} {"train_loss": -6.7998199462890625, "global_step": 154928, "epoch": 3688} {"train_loss": -6.87587833404541, "global_step": 154929, "epoch": 3688} {"train_loss": -6.848280429840088, "global_step": 154930, "epoch": 3688} {"train_loss": -6.820863246917725, "global_step": 154931, "epoch": 3688} {"train_loss": -6.72011661529541, "global_step": 154932, "epoch": 3688} {"train_loss": -6.810083389282227, "global_step": 154933, "epoch": 3688} {"train_loss": -6.826593399047852, "global_step": 154934, "epoch": 3688} {"train_loss": -6.8012495040893555, "global_step": 154935, "epoch": 3688} {"train_loss": -6.8973588943481445, "global_step": 154936, "epoch": 3688} {"train_loss": -6.805160091036842, "global_step": 154937, "epoch": 3688, "val_loss": 68538.7578125} {"train_loss": -6.781437397003174, "global_step": 154938, "epoch": 3689} {"train_loss": -6.847097396850586, "global_step": 154939, "epoch": 3689} {"train_loss": -6.708746433258057, "global_step": 154940, "epoch": 3689} {"train_loss": -6.900084018707275, "global_step": 154941, "epoch": 3689} {"train_loss": -6.766088485717773, "global_step": 154942, "epoch": 3689} {"train_loss": -6.874637126922607, "global_step": 154943, "epoch": 3689} {"train_loss": -6.787042140960693, "global_step": 154944, "epoch": 3689} {"train_loss": -6.798820495605469, "global_step": 154945, "epoch": 3689} {"train_loss": -6.819507598876953, "global_step": 154946, "epoch": 3689} {"train_loss": -6.8345537185668945, "global_step": 154947, "epoch": 3689} {"train_loss": -6.712904453277588, "global_step": 154948, "epoch": 3689} {"train_loss": -6.906129360198975, "global_step": 154949, "epoch": 3689} {"train_loss": -6.702120780944824, "global_step": 154950, "epoch": 3689} {"train_loss": -6.904326915740967, "global_step": 154951, "epoch": 3689} {"train_loss": -6.852627277374268, "global_step": 154952, "epoch": 3689} {"train_loss": -6.917135238647461, "global_step": 154953, "epoch": 3689} {"train_loss": -6.939967155456543, "global_step": 154954, "epoch": 3689} {"train_loss": -6.87879753112793, "global_step": 154955, "epoch": 3689} {"train_loss": -6.867501735687256, "global_step": 154956, "epoch": 3689} {"train_loss": -6.798300743103027, "global_step": 154957, "epoch": 3689} {"train_loss": -6.8494744300842285, "global_step": 154958, "epoch": 3689} {"train_loss": -6.752553462982178, "global_step": 154959, "epoch": 3689} {"train_loss": -6.783873558044434, "global_step": 154960, "epoch": 3689} {"train_loss": -6.705347061157227, "global_step": 154961, "epoch": 3689} {"train_loss": -6.914034843444824, "global_step": 154962, "epoch": 3689} {"train_loss": -6.773536682128906, "global_step": 154963, "epoch": 3689} {"train_loss": -6.835575580596924, "global_step": 154964, "epoch": 3689} {"train_loss": -6.818360328674316, "global_step": 154965, "epoch": 3689} {"train_loss": -6.815906047821045, "global_step": 154966, "epoch": 3689} {"train_loss": -6.892855644226074, "global_step": 154967, "epoch": 3689} {"train_loss": -6.848088264465332, "global_step": 154968, "epoch": 3689} {"train_loss": -6.840156555175781, "global_step": 154969, "epoch": 3689} {"train_loss": -6.743699550628662, "global_step": 154970, "epoch": 3689} {"train_loss": -6.890694618225098, "global_step": 154971, "epoch": 3689} {"train_loss": -6.780248641967773, "global_step": 154972, "epoch": 3689} {"train_loss": -6.86624813079834, "global_step": 154973, "epoch": 3689} {"train_loss": -6.835158348083496, "global_step": 154974, "epoch": 3689} {"train_loss": -6.838578701019287, "global_step": 154975, "epoch": 3689} {"train_loss": -6.884195327758789, "global_step": 154976, "epoch": 3689} {"train_loss": -6.776614189147949, "global_step": 154977, "epoch": 3689} {"train_loss": -6.9531354904174805, "global_step": 154978, "epoch": 3689} {"train_loss": -6.829632236844017, "global_step": 154979, "epoch": 3689, "val_loss": 68297.859375} {"train_loss": -6.84804105758667, "global_step": 154980, "epoch": 3690} {"train_loss": -6.851956367492676, "global_step": 154981, "epoch": 3690} {"train_loss": -6.943934440612793, "global_step": 154982, "epoch": 3690} {"train_loss": -6.8846635818481445, "global_step": 154983, "epoch": 3690} {"train_loss": -6.968723297119141, "global_step": 154984, "epoch": 3690} {"train_loss": -6.810656547546387, "global_step": 154985, "epoch": 3690} {"train_loss": -6.896083354949951, "global_step": 154986, "epoch": 3690} {"train_loss": -6.796877861022949, "global_step": 154987, "epoch": 3690} {"train_loss": -6.816986083984375, "global_step": 154988, "epoch": 3690} {"train_loss": -6.884800434112549, "global_step": 154989, "epoch": 3690} {"train_loss": -6.925209999084473, "global_step": 154990, "epoch": 3690} {"train_loss": -6.905487060546875, "global_step": 154991, "epoch": 3690} {"train_loss": -6.841076850891113, "global_step": 154992, "epoch": 3690} {"train_loss": -6.943305969238281, "global_step": 154993, "epoch": 3690} {"train_loss": -6.852903842926025, "global_step": 154994, "epoch": 3690} {"train_loss": -6.831783294677734, "global_step": 154995, "epoch": 3690} {"train_loss": -6.839412689208984, "global_step": 154996, "epoch": 3690} {"train_loss": -6.933221817016602, "global_step": 154997, "epoch": 3690} {"train_loss": -6.8803181648254395, "global_step": 154998, "epoch": 3690} {"train_loss": -6.928964138031006, "global_step": 154999, "epoch": 3690} {"train_loss": -6.933444976806641, "global_step": 155000, "epoch": 3690} {"train_loss": -6.910561561584473, "global_step": 155001, "epoch": 3690} {"train_loss": -6.76397180557251, "global_step": 155002, "epoch": 3690} {"train_loss": -6.898542404174805, "global_step": 155003, "epoch": 3690} {"train_loss": -6.839016437530518, "global_step": 155004, "epoch": 3690} {"train_loss": -6.832910537719727, "global_step": 155005, "epoch": 3690} {"train_loss": -6.802706718444824, "global_step": 155006, "epoch": 3690} {"train_loss": -6.902415752410889, "global_step": 155007, "epoch": 3690} {"train_loss": -6.7781662940979, "global_step": 155008, "epoch": 3690} {"train_loss": -6.8302483558654785, "global_step": 155009, "epoch": 3690} {"train_loss": -6.900934219360352, "global_step": 155010, "epoch": 3690} {"train_loss": -6.842695236206055, "global_step": 155011, "epoch": 3690} {"train_loss": -6.854406356811523, "global_step": 155012, "epoch": 3690} {"train_loss": -6.8025641441345215, "global_step": 155013, "epoch": 3690} {"train_loss": -6.881537914276123, "global_step": 155014, "epoch": 3690} {"train_loss": -6.863409042358398, "global_step": 155015, "epoch": 3690} {"train_loss": -6.7862348556518555, "global_step": 155016, "epoch": 3690} {"train_loss": -6.825791358947754, "global_step": 155017, "epoch": 3690} {"train_loss": -6.970107078552246, "global_step": 155018, "epoch": 3690} {"train_loss": -6.799442768096924, "global_step": 155019, "epoch": 3690} {"train_loss": -6.8960490226745605, "global_step": 155020, "epoch": 3690} {"train_loss": -6.864740780421665, "global_step": 155021, "epoch": 3690, "val_loss": 68500.34375} {"train_loss": -6.755669593811035, "global_step": 155022, "epoch": 3691} {"train_loss": -6.908998012542725, "global_step": 155023, "epoch": 3691} {"train_loss": -6.870990753173828, "global_step": 155024, "epoch": 3691} {"train_loss": -6.880173683166504, "global_step": 155025, "epoch": 3691} {"train_loss": -6.9330315589904785, "global_step": 155026, "epoch": 3691} {"train_loss": -6.904560089111328, "global_step": 155027, "epoch": 3691} {"train_loss": -7.014420509338379, "global_step": 155028, "epoch": 3691} {"train_loss": -6.823381423950195, "global_step": 155029, "epoch": 3691} {"train_loss": -6.859909534454346, "global_step": 155030, "epoch": 3691} {"train_loss": -6.882020950317383, "global_step": 155031, "epoch": 3691} {"train_loss": -6.845117568969727, "global_step": 155032, "epoch": 3691} {"train_loss": -6.852241516113281, "global_step": 155033, "epoch": 3691} {"train_loss": -6.893167495727539, "global_step": 155034, "epoch": 3691} {"train_loss": -6.857785224914551, "global_step": 155035, "epoch": 3691} {"train_loss": -6.8650617599487305, "global_step": 155036, "epoch": 3691} {"train_loss": -6.854710102081299, "global_step": 155037, "epoch": 3691} {"train_loss": -6.945196151733398, "global_step": 155038, "epoch": 3691} {"train_loss": -6.871118545532227, "global_step": 155039, "epoch": 3691} {"train_loss": -6.792924880981445, "global_step": 155040, "epoch": 3691} {"train_loss": -6.814644813537598, "global_step": 155041, "epoch": 3691} {"train_loss": -6.81323766708374, "global_step": 155042, "epoch": 3691} {"train_loss": -6.8266215324401855, "global_step": 155043, "epoch": 3691} {"train_loss": -6.797190189361572, "global_step": 155044, "epoch": 3691} {"train_loss": -6.862097263336182, "global_step": 155045, "epoch": 3691} {"train_loss": -6.813414096832275, "global_step": 155046, "epoch": 3691} {"train_loss": -6.837436676025391, "global_step": 155047, "epoch": 3691} {"train_loss": -6.8556976318359375, "global_step": 155048, "epoch": 3691} {"train_loss": -6.867467880249023, "global_step": 155049, "epoch": 3691} {"train_loss": -6.86713981628418, "global_step": 155050, "epoch": 3691} {"train_loss": -6.909573554992676, "global_step": 155051, "epoch": 3691} {"train_loss": -6.800189018249512, "global_step": 155052, "epoch": 3691} {"train_loss": -6.835395336151123, "global_step": 155053, "epoch": 3691} {"train_loss": -6.854341983795166, "global_step": 155054, "epoch": 3691} {"train_loss": -6.921351432800293, "global_step": 155055, "epoch": 3691} {"train_loss": -6.785571098327637, "global_step": 155056, "epoch": 3691} {"train_loss": -6.657549858093262, "global_step": 155057, "epoch": 3691} {"train_loss": -6.8457136154174805, "global_step": 155058, "epoch": 3691} {"train_loss": -6.763481140136719, "global_step": 155059, "epoch": 3691} {"train_loss": -6.708784103393555, "global_step": 155060, "epoch": 3691} {"train_loss": -6.875368118286133, "global_step": 155061, "epoch": 3691} {"train_loss": -6.749361038208008, "global_step": 155062, "epoch": 3691} {"train_loss": -6.844094060716175, "global_step": 155063, "epoch": 3691, "val_loss": 68614.4140625} {"train_loss": -6.726219177246094, "global_step": 155064, "epoch": 3692} {"train_loss": -6.7518630027771, "global_step": 155065, "epoch": 3692} {"train_loss": -6.77524471282959, "global_step": 155066, "epoch": 3692} {"train_loss": -6.797070503234863, "global_step": 155067, "epoch": 3692} {"train_loss": -6.791286468505859, "global_step": 155068, "epoch": 3692} {"train_loss": -6.694211959838867, "global_step": 155069, "epoch": 3692} {"train_loss": -6.89333963394165, "global_step": 155070, "epoch": 3692} {"train_loss": -6.779413223266602, "global_step": 155071, "epoch": 3692} {"train_loss": -6.817817687988281, "global_step": 155072, "epoch": 3692} {"train_loss": -6.812949180603027, "global_step": 155073, "epoch": 3692} {"train_loss": -6.767168045043945, "global_step": 155074, "epoch": 3692} {"train_loss": -6.868535041809082, "global_step": 155075, "epoch": 3692} {"train_loss": -6.765737056732178, "global_step": 155076, "epoch": 3692} {"train_loss": -6.7666521072387695, "global_step": 155077, "epoch": 3692} {"train_loss": -6.85524845123291, "global_step": 155078, "epoch": 3692} {"train_loss": -6.677048683166504, "global_step": 155079, "epoch": 3692} {"train_loss": -6.765724182128906, "global_step": 155080, "epoch": 3692} {"train_loss": -6.793763637542725, "global_step": 155081, "epoch": 3692} {"train_loss": -6.761989593505859, "global_step": 155082, "epoch": 3692} {"train_loss": -6.83448600769043, "global_step": 155083, "epoch": 3692} {"train_loss": -6.790726661682129, "global_step": 155084, "epoch": 3692} {"train_loss": -6.880046367645264, "global_step": 155085, "epoch": 3692} {"train_loss": -6.897153854370117, "global_step": 155086, "epoch": 3692} {"train_loss": -6.830888748168945, "global_step": 155087, "epoch": 3692} {"train_loss": -6.8986053466796875, "global_step": 155088, "epoch": 3692} {"train_loss": -6.8146257400512695, "global_step": 155089, "epoch": 3692} {"train_loss": -6.894492149353027, "global_step": 155090, "epoch": 3692} {"train_loss": -6.8722429275512695, "global_step": 155091, "epoch": 3692} {"train_loss": -6.811200141906738, "global_step": 155092, "epoch": 3692} {"train_loss": -6.906302452087402, "global_step": 155093, "epoch": 3692} {"train_loss": -6.779366493225098, "global_step": 155094, "epoch": 3692} {"train_loss": -6.915591716766357, "global_step": 155095, "epoch": 3692} {"train_loss": -6.938619613647461, "global_step": 155096, "epoch": 3692} {"train_loss": -6.926019668579102, "global_step": 155097, "epoch": 3692} {"train_loss": -6.851261615753174, "global_step": 155098, "epoch": 3692} {"train_loss": -6.921334743499756, "global_step": 155099, "epoch": 3692} {"train_loss": -6.980230331420898, "global_step": 155100, "epoch": 3692} {"train_loss": -6.850555896759033, "global_step": 155101, "epoch": 3692} {"train_loss": -6.933567047119141, "global_step": 155102, "epoch": 3692} {"train_loss": -6.904147148132324, "global_step": 155103, "epoch": 3692} {"train_loss": -6.942198753356934, "global_step": 155104, "epoch": 3692} {"train_loss": -6.836056675229754, "global_step": 155105, "epoch": 3692, "val_loss": 68389.46875} {"train_loss": -6.9208760261535645, "global_step": 155106, "epoch": 3693} {"train_loss": -6.899358749389648, "global_step": 155107, "epoch": 3693} {"train_loss": -6.885531425476074, "global_step": 155108, "epoch": 3693} {"train_loss": -6.853443145751953, "global_step": 155109, "epoch": 3693} {"train_loss": -6.835241794586182, "global_step": 155110, "epoch": 3693} {"train_loss": -6.931447505950928, "global_step": 155111, "epoch": 3693} {"train_loss": -7.019641876220703, "global_step": 155112, "epoch": 3693} {"train_loss": -7.02724027633667, "global_step": 155113, "epoch": 3693} {"train_loss": -6.873222351074219, "global_step": 155114, "epoch": 3693} {"train_loss": -6.859292984008789, "global_step": 155115, "epoch": 3693} {"train_loss": -6.9816694259643555, "global_step": 155116, "epoch": 3693} {"train_loss": -6.84669303894043, "global_step": 155117, "epoch": 3693} {"train_loss": -6.773524284362793, "global_step": 155118, "epoch": 3693} {"train_loss": -6.804075241088867, "global_step": 155119, "epoch": 3693} {"train_loss": -6.773488998413086, "global_step": 155120, "epoch": 3693} {"train_loss": -6.785599708557129, "global_step": 155121, "epoch": 3693} {"train_loss": -6.879082679748535, "global_step": 155122, "epoch": 3693} {"train_loss": -6.749309539794922, "global_step": 155123, "epoch": 3693} {"train_loss": -6.888446807861328, "global_step": 155124, "epoch": 3693} {"train_loss": -6.795651435852051, "global_step": 155125, "epoch": 3693} {"train_loss": -6.83635950088501, "global_step": 155126, "epoch": 3693} {"train_loss": -6.991632461547852, "global_step": 155127, "epoch": 3693} {"train_loss": -6.732755184173584, "global_step": 155128, "epoch": 3693} {"train_loss": -6.929387092590332, "global_step": 155129, "epoch": 3693} {"train_loss": -6.804967880249023, "global_step": 155130, "epoch": 3693} {"train_loss": -6.861835479736328, "global_step": 155131, "epoch": 3693} {"train_loss": -6.989378452301025, "global_step": 155132, "epoch": 3693} {"train_loss": -6.864727020263672, "global_step": 155133, "epoch": 3693} {"train_loss": -6.852258682250977, "global_step": 155134, "epoch": 3693} {"train_loss": -6.835161209106445, "global_step": 155135, "epoch": 3693} {"train_loss": -6.7737555503845215, "global_step": 155136, "epoch": 3693} {"train_loss": -6.927682876586914, "global_step": 155137, "epoch": 3693} {"train_loss": -6.901349067687988, "global_step": 155138, "epoch": 3693} {"train_loss": -6.91558313369751, "global_step": 155139, "epoch": 3693} {"train_loss": -6.86761474609375, "global_step": 155140, "epoch": 3693} {"train_loss": -6.8795599937438965, "global_step": 155141, "epoch": 3693} {"train_loss": -6.847093105316162, "global_step": 155142, "epoch": 3693} {"train_loss": -6.848049163818359, "global_step": 155143, "epoch": 3693} {"train_loss": -6.8848185539245605, "global_step": 155144, "epoch": 3693} {"train_loss": -6.942636966705322, "global_step": 155145, "epoch": 3693} {"train_loss": -7.009883880615234, "global_step": 155146, "epoch": 3693} {"train_loss": -6.876987230210077, "global_step": 155147, "epoch": 3693, "val_loss": 68496.28125} {"train_loss": -6.923033714294434, "global_step": 155148, "epoch": 3694} {"train_loss": -6.787156581878662, "global_step": 155149, "epoch": 3694} {"train_loss": -6.954384803771973, "global_step": 155150, "epoch": 3694} {"train_loss": -6.885941505432129, "global_step": 155151, "epoch": 3694} {"train_loss": -6.858593463897705, "global_step": 155152, "epoch": 3694} {"train_loss": -6.8310089111328125, "global_step": 155153, "epoch": 3694} {"train_loss": -6.81992244720459, "global_step": 155154, "epoch": 3694} {"train_loss": -6.907084941864014, "global_step": 155155, "epoch": 3694} {"train_loss": -6.853729724884033, "global_step": 155156, "epoch": 3694} {"train_loss": -6.933404922485352, "global_step": 155157, "epoch": 3694} {"train_loss": -6.844476699829102, "global_step": 155158, "epoch": 3694} {"train_loss": -6.830724239349365, "global_step": 155159, "epoch": 3694} {"train_loss": -6.898136138916016, "global_step": 155160, "epoch": 3694} {"train_loss": -6.750298976898193, "global_step": 155161, "epoch": 3694} {"train_loss": -6.910984039306641, "global_step": 155162, "epoch": 3694} {"train_loss": -6.9223175048828125, "global_step": 155163, "epoch": 3694} {"train_loss": -6.748288154602051, "global_step": 155164, "epoch": 3694} {"train_loss": -6.700418472290039, "global_step": 155165, "epoch": 3694} {"train_loss": -6.8166093826293945, "global_step": 155166, "epoch": 3694} {"train_loss": -6.868526458740234, "global_step": 155167, "epoch": 3694} {"train_loss": -6.757417678833008, "global_step": 155168, "epoch": 3694} {"train_loss": -6.9669294357299805, "global_step": 155169, "epoch": 3694} {"train_loss": -6.952588081359863, "global_step": 155170, "epoch": 3694} {"train_loss": -6.9109416007995605, "global_step": 155171, "epoch": 3694} {"train_loss": -6.889564037322998, "global_step": 155172, "epoch": 3694} {"train_loss": -6.924328804016113, "global_step": 155173, "epoch": 3694} {"train_loss": -6.8115105628967285, "global_step": 155174, "epoch": 3694} {"train_loss": -6.853062629699707, "global_step": 155175, "epoch": 3694} {"train_loss": -6.836419105529785, "global_step": 155176, "epoch": 3694} {"train_loss": -6.939763069152832, "global_step": 155177, "epoch": 3694} {"train_loss": -6.754711151123047, "global_step": 155178, "epoch": 3694} {"train_loss": -6.9027228355407715, "global_step": 155179, "epoch": 3694} {"train_loss": -6.8013410568237305, "global_step": 155180, "epoch": 3694} {"train_loss": -6.841018199920654, "global_step": 155181, "epoch": 3694} {"train_loss": -6.95088005065918, "global_step": 155182, "epoch": 3694} {"train_loss": -6.860511302947998, "global_step": 155183, "epoch": 3694} {"train_loss": -6.841076850891113, "global_step": 155184, "epoch": 3694} {"train_loss": -6.850710868835449, "global_step": 155185, "epoch": 3694} {"train_loss": -6.791234016418457, "global_step": 155186, "epoch": 3694} {"train_loss": -7.001979827880859, "global_step": 155187, "epoch": 3694} {"train_loss": -6.845015525817871, "global_step": 155188, "epoch": 3694} {"train_loss": -6.864785728000459, "global_step": 155189, "epoch": 3694, "val_loss": 68563.8125} {"train_loss": -6.915110111236572, "global_step": 155190, "epoch": 3695} {"train_loss": -6.913477897644043, "global_step": 155191, "epoch": 3695} {"train_loss": -6.86140251159668, "global_step": 155192, "epoch": 3695} {"train_loss": -6.785730361938477, "global_step": 155193, "epoch": 3695} {"train_loss": -6.818827152252197, "global_step": 155194, "epoch": 3695} {"train_loss": -6.850111484527588, "global_step": 155195, "epoch": 3695} {"train_loss": -6.767115592956543, "global_step": 155196, "epoch": 3695} {"train_loss": -6.836369037628174, "global_step": 155197, "epoch": 3695} {"train_loss": -6.828361988067627, "global_step": 155198, "epoch": 3695} {"train_loss": -6.70331335067749, "global_step": 155199, "epoch": 3695} {"train_loss": -6.974514961242676, "global_step": 155200, "epoch": 3695} {"train_loss": -6.879758358001709, "global_step": 155201, "epoch": 3695} {"train_loss": -6.926617622375488, "global_step": 155202, "epoch": 3695} {"train_loss": -6.821311950683594, "global_step": 155203, "epoch": 3695} {"train_loss": -6.824432373046875, "global_step": 155204, "epoch": 3695} {"train_loss": -6.8839569091796875, "global_step": 155205, "epoch": 3695} {"train_loss": -6.866584777832031, "global_step": 155206, "epoch": 3695} {"train_loss": -6.877871990203857, "global_step": 155207, "epoch": 3695} {"train_loss": -6.884187698364258, "global_step": 155208, "epoch": 3695} {"train_loss": -6.7240471839904785, "global_step": 155209, "epoch": 3695} {"train_loss": -6.849539756774902, "global_step": 155210, "epoch": 3695} {"train_loss": -6.819530487060547, "global_step": 155211, "epoch": 3695} {"train_loss": -6.797298431396484, "global_step": 155212, "epoch": 3695} {"train_loss": -6.845539569854736, "global_step": 155213, "epoch": 3695} {"train_loss": -6.784666061401367, "global_step": 155214, "epoch": 3695} {"train_loss": -6.801289081573486, "global_step": 155215, "epoch": 3695} {"train_loss": -6.807720184326172, "global_step": 155216, "epoch": 3695} {"train_loss": -6.744162559509277, "global_step": 155217, "epoch": 3695} {"train_loss": -6.607229232788086, "global_step": 155218, "epoch": 3695} {"train_loss": -6.8319292068481445, "global_step": 155219, "epoch": 3695} {"train_loss": -6.706336498260498, "global_step": 155220, "epoch": 3695} {"train_loss": -6.77957010269165, "global_step": 155221, "epoch": 3695} {"train_loss": -6.755278587341309, "global_step": 155222, "epoch": 3695} {"train_loss": -6.724992752075195, "global_step": 155223, "epoch": 3695} {"train_loss": -6.939313888549805, "global_step": 155224, "epoch": 3695} {"train_loss": -6.817500114440918, "global_step": 155225, "epoch": 3695} {"train_loss": -6.78118896484375, "global_step": 155226, "epoch": 3695} {"train_loss": -6.769373416900635, "global_step": 155227, "epoch": 3695} {"train_loss": -6.750494480133057, "global_step": 155228, "epoch": 3695} {"train_loss": -6.765194416046143, "global_step": 155229, "epoch": 3695} {"train_loss": -6.740670680999756, "global_step": 155230, "epoch": 3695} {"train_loss": -6.81295649210612, "global_step": 155231, "epoch": 3695, "val_loss": 68388.3515625} {"train_loss": -6.674851894378662, "global_step": 155232, "epoch": 3696} {"train_loss": -6.858574867248535, "global_step": 155233, "epoch": 3696} {"train_loss": -6.794346332550049, "global_step": 155234, "epoch": 3696} {"train_loss": -6.763547420501709, "global_step": 155235, "epoch": 3696} {"train_loss": -6.895693778991699, "global_step": 155236, "epoch": 3696} {"train_loss": -6.929181098937988, "global_step": 155237, "epoch": 3696} {"train_loss": -6.750920295715332, "global_step": 155238, "epoch": 3696} {"train_loss": -6.8880696296691895, "global_step": 155239, "epoch": 3696} {"train_loss": -6.914401054382324, "global_step": 155240, "epoch": 3696} {"train_loss": -6.982900619506836, "global_step": 155241, "epoch": 3696} {"train_loss": -6.971091270446777, "global_step": 155242, "epoch": 3696} {"train_loss": -6.886133670806885, "global_step": 155243, "epoch": 3696} {"train_loss": -6.888980865478516, "global_step": 155244, "epoch": 3696} {"train_loss": -6.867661952972412, "global_step": 155245, "epoch": 3696} {"train_loss": -6.990560054779053, "global_step": 155246, "epoch": 3696} {"train_loss": -6.824511528015137, "global_step": 155247, "epoch": 3696} {"train_loss": -6.892030239105225, "global_step": 155248, "epoch": 3696} {"train_loss": -6.901154041290283, "global_step": 155249, "epoch": 3696} {"train_loss": -6.851925849914551, "global_step": 155250, "epoch": 3696} {"train_loss": -6.973949432373047, "global_step": 155251, "epoch": 3696} {"train_loss": -6.931490421295166, "global_step": 155252, "epoch": 3696} {"train_loss": -6.917390823364258, "global_step": 155253, "epoch": 3696} {"train_loss": -6.849160671234131, "global_step": 155254, "epoch": 3696} {"train_loss": -6.906291961669922, "global_step": 155255, "epoch": 3696} {"train_loss": -6.908731460571289, "global_step": 155256, "epoch": 3696} {"train_loss": -6.888972759246826, "global_step": 155257, "epoch": 3696} {"train_loss": -6.8757123947143555, "global_step": 155258, "epoch": 3696} {"train_loss": -6.863241195678711, "global_step": 155259, "epoch": 3696} {"train_loss": -7.011009216308594, "global_step": 155260, "epoch": 3696} {"train_loss": -6.904392242431641, "global_step": 155261, "epoch": 3696} {"train_loss": -6.859302520751953, "global_step": 155262, "epoch": 3696} {"train_loss": -6.86855411529541, "global_step": 155263, "epoch": 3696} {"train_loss": -6.898033142089844, "global_step": 155264, "epoch": 3696} {"train_loss": -6.962360382080078, "global_step": 155265, "epoch": 3696} {"train_loss": -6.917086601257324, "global_step": 155266, "epoch": 3696} {"train_loss": -6.859310150146484, "global_step": 155267, "epoch": 3696} {"train_loss": -6.894372463226318, "global_step": 155268, "epoch": 3696} {"train_loss": -6.913511276245117, "global_step": 155269, "epoch": 3696} {"train_loss": -6.8933587074279785, "global_step": 155270, "epoch": 3696} {"train_loss": -6.752900123596191, "global_step": 155271, "epoch": 3696} {"train_loss": -6.878269195556641, "global_step": 155272, "epoch": 3696} {"train_loss": -6.88393809681847, "global_step": 155273, "epoch": 3696, "val_loss": 68491.8203125} {"train_loss": -6.891002655029297, "global_step": 155274, "epoch": 3697} {"train_loss": -6.837111473083496, "global_step": 155275, "epoch": 3697} {"train_loss": -6.807165145874023, "global_step": 155276, "epoch": 3697} {"train_loss": -6.838372230529785, "global_step": 155277, "epoch": 3697} {"train_loss": -6.976381301879883, "global_step": 155278, "epoch": 3697} {"train_loss": -6.953299522399902, "global_step": 155279, "epoch": 3697} {"train_loss": -6.800323486328125, "global_step": 155280, "epoch": 3697} {"train_loss": -6.932944297790527, "global_step": 155281, "epoch": 3697} {"train_loss": -6.918116569519043, "global_step": 155282, "epoch": 3697} {"train_loss": -6.834167957305908, "global_step": 155283, "epoch": 3697} {"train_loss": -6.924323081970215, "global_step": 155284, "epoch": 3697} {"train_loss": -6.817380905151367, "global_step": 155285, "epoch": 3697} {"train_loss": -6.86843204498291, "global_step": 155286, "epoch": 3697} {"train_loss": -6.797117233276367, "global_step": 155287, "epoch": 3697} {"train_loss": -6.91267728805542, "global_step": 155288, "epoch": 3697} {"train_loss": -7.010077476501465, "global_step": 155289, "epoch": 3697} {"train_loss": -6.845088005065918, "global_step": 155290, "epoch": 3697} {"train_loss": -6.768396854400635, "global_step": 155291, "epoch": 3697} {"train_loss": -6.844488620758057, "global_step": 155292, "epoch": 3697} {"train_loss": -6.8460564613342285, "global_step": 155293, "epoch": 3697} {"train_loss": -6.809230804443359, "global_step": 155294, "epoch": 3697} {"train_loss": -6.848268508911133, "global_step": 155295, "epoch": 3697} {"train_loss": -6.834298133850098, "global_step": 155296, "epoch": 3697} {"train_loss": -6.732807159423828, "global_step": 155297, "epoch": 3697} {"train_loss": -6.7856550216674805, "global_step": 155298, "epoch": 3697} {"train_loss": -6.753435134887695, "global_step": 155299, "epoch": 3697} {"train_loss": -6.747750759124756, "global_step": 155300, "epoch": 3697} {"train_loss": -6.835390090942383, "global_step": 155301, "epoch": 3697} {"train_loss": -6.79802131652832, "global_step": 155302, "epoch": 3697} {"train_loss": -6.820777893066406, "global_step": 155303, "epoch": 3697} {"train_loss": -6.880113124847412, "global_step": 155304, "epoch": 3697} {"train_loss": -6.746840476989746, "global_step": 155305, "epoch": 3697} {"train_loss": -6.876815319061279, "global_step": 155306, "epoch": 3697} {"train_loss": -6.810141563415527, "global_step": 155307, "epoch": 3697} {"train_loss": -6.768568515777588, "global_step": 155308, "epoch": 3697} {"train_loss": -6.7040863037109375, "global_step": 155309, "epoch": 3697} {"train_loss": -6.810922622680664, "global_step": 155310, "epoch": 3697} {"train_loss": -6.777126312255859, "global_step": 155311, "epoch": 3697} {"train_loss": -6.853010177612305, "global_step": 155312, "epoch": 3697} {"train_loss": -6.857675552368164, "global_step": 155313, "epoch": 3697} {"train_loss": -6.821313858032227, "global_step": 155314, "epoch": 3697} {"train_loss": -6.836507445289975, "global_step": 155315, "epoch": 3697, "val_loss": 68544.046875} {"train_loss": -6.842803478240967, "global_step": 155316, "epoch": 3698} {"train_loss": -6.828691482543945, "global_step": 155317, "epoch": 3698} {"train_loss": -6.898143768310547, "global_step": 155318, "epoch": 3698} {"train_loss": -6.8528900146484375, "global_step": 155319, "epoch": 3698} {"train_loss": -6.859755992889404, "global_step": 155320, "epoch": 3698} {"train_loss": -6.888319969177246, "global_step": 155321, "epoch": 3698} {"train_loss": -6.833365440368652, "global_step": 155322, "epoch": 3698} {"train_loss": -6.828170299530029, "global_step": 155323, "epoch": 3698} {"train_loss": -6.841702938079834, "global_step": 155324, "epoch": 3698} {"train_loss": -6.851991653442383, "global_step": 155325, "epoch": 3698} {"train_loss": -6.806441307067871, "global_step": 155326, "epoch": 3698} {"train_loss": -6.813992977142334, "global_step": 155327, "epoch": 3698} {"train_loss": -6.7957763671875, "global_step": 155328, "epoch": 3698} {"train_loss": -6.814453601837158, "global_step": 155329, "epoch": 3698} {"train_loss": -6.89921236038208, "global_step": 155330, "epoch": 3698} {"train_loss": -6.780799388885498, "global_step": 155331, "epoch": 3698} {"train_loss": -6.842255592346191, "global_step": 155332, "epoch": 3698} {"train_loss": -6.882046222686768, "global_step": 155333, "epoch": 3698} {"train_loss": -6.871071815490723, "global_step": 155334, "epoch": 3698} {"train_loss": -6.790162086486816, "global_step": 155335, "epoch": 3698} {"train_loss": -6.737368106842041, "global_step": 155336, "epoch": 3698} {"train_loss": -6.894688606262207, "global_step": 155337, "epoch": 3698} {"train_loss": -6.840878486633301, "global_step": 155338, "epoch": 3698} {"train_loss": -6.875452995300293, "global_step": 155339, "epoch": 3698} {"train_loss": -6.822980880737305, "global_step": 155340, "epoch": 3698} {"train_loss": -6.738133907318115, "global_step": 155341, "epoch": 3698} {"train_loss": -6.878270149230957, "global_step": 155342, "epoch": 3698} {"train_loss": -6.799276351928711, "global_step": 155343, "epoch": 3698} {"train_loss": -6.91715145111084, "global_step": 155344, "epoch": 3698} {"train_loss": -6.870070457458496, "global_step": 155345, "epoch": 3698} {"train_loss": -6.941274166107178, "global_step": 155346, "epoch": 3698} {"train_loss": -6.727020263671875, "global_step": 155347, "epoch": 3698} {"train_loss": -6.835777282714844, "global_step": 155348, "epoch": 3698} {"train_loss": -6.86527156829834, "global_step": 155349, "epoch": 3698} {"train_loss": -6.944820880889893, "global_step": 155350, "epoch": 3698} {"train_loss": -6.764289855957031, "global_step": 155351, "epoch": 3698} {"train_loss": -6.791135787963867, "global_step": 155352, "epoch": 3698} {"train_loss": -6.87113094329834, "global_step": 155353, "epoch": 3698} {"train_loss": -6.786407947540283, "global_step": 155354, "epoch": 3698} {"train_loss": -6.780482769012451, "global_step": 155355, "epoch": 3698} {"train_loss": -6.7733964920043945, "global_step": 155356, "epoch": 3698} {"train_loss": -6.835990065620059, "global_step": 155357, "epoch": 3698, "val_loss": 68604.2265625} {"train_loss": -6.885647773742676, "global_step": 155358, "epoch": 3699} {"train_loss": -6.911179065704346, "global_step": 155359, "epoch": 3699} {"train_loss": -6.896918773651123, "global_step": 155360, "epoch": 3699} {"train_loss": -6.962660789489746, "global_step": 155361, "epoch": 3699} {"train_loss": -6.979526042938232, "global_step": 155362, "epoch": 3699} {"train_loss": -6.939945220947266, "global_step": 155363, "epoch": 3699} {"train_loss": -6.9041290283203125, "global_step": 155364, "epoch": 3699} {"train_loss": -6.891030311584473, "global_step": 155365, "epoch": 3699} {"train_loss": -6.797307968139648, "global_step": 155366, "epoch": 3699} {"train_loss": -6.933138847351074, "global_step": 155367, "epoch": 3699} {"train_loss": -6.8596038818359375, "global_step": 155368, "epoch": 3699} {"train_loss": -6.931324005126953, "global_step": 155369, "epoch": 3699} {"train_loss": -6.9817657470703125, "global_step": 155370, "epoch": 3699} {"train_loss": -6.827104091644287, "global_step": 155371, "epoch": 3699} {"train_loss": -6.862868309020996, "global_step": 155372, "epoch": 3699} {"train_loss": -6.949039459228516, "global_step": 155373, "epoch": 3699} {"train_loss": -6.726003646850586, "global_step": 155374, "epoch": 3699} {"train_loss": -6.8682451248168945, "global_step": 155375, "epoch": 3699} {"train_loss": -6.87374210357666, "global_step": 155376, "epoch": 3699} {"train_loss": -6.88753604888916, "global_step": 155377, "epoch": 3699} {"train_loss": -6.774172782897949, "global_step": 155378, "epoch": 3699} {"train_loss": -6.937702655792236, "global_step": 155379, "epoch": 3699} {"train_loss": -6.780158996582031, "global_step": 155380, "epoch": 3699} {"train_loss": -6.763179302215576, "global_step": 155381, "epoch": 3699} {"train_loss": -6.890529155731201, "global_step": 155382, "epoch": 3699} {"train_loss": -6.729543209075928, "global_step": 155383, "epoch": 3699} {"train_loss": -6.833904266357422, "global_step": 155384, "epoch": 3699} {"train_loss": -6.885042190551758, "global_step": 155385, "epoch": 3699} {"train_loss": -6.876577377319336, "global_step": 155386, "epoch": 3699} {"train_loss": -6.850319862365723, "global_step": 155387, "epoch": 3699} {"train_loss": -6.906231880187988, "global_step": 155388, "epoch": 3699} {"train_loss": -6.8924150466918945, "global_step": 155389, "epoch": 3699} {"train_loss": -6.9111762046813965, "global_step": 155390, "epoch": 3699} {"train_loss": -6.85628604888916, "global_step": 155391, "epoch": 3699} {"train_loss": -6.931867599487305, "global_step": 155392, "epoch": 3699} {"train_loss": -6.811738967895508, "global_step": 155393, "epoch": 3699} {"train_loss": -6.883744239807129, "global_step": 155394, "epoch": 3699} {"train_loss": -6.8871660232543945, "global_step": 155395, "epoch": 3699} {"train_loss": -6.791869163513184, "global_step": 155396, "epoch": 3699} {"train_loss": -6.826590538024902, "global_step": 155397, "epoch": 3699} {"train_loss": -6.780282020568848, "global_step": 155398, "epoch": 3699} {"train_loss": -6.869500353222802, "global_step": 155399, "epoch": 3699, "val_loss": 68477.25} {"train_loss": -6.909900665283203, "global_step": 155400, "epoch": 3700} {"train_loss": -6.902128219604492, "global_step": 155401, "epoch": 3700} {"train_loss": -6.695898532867432, "global_step": 155402, "epoch": 3700} {"train_loss": -6.856544017791748, "global_step": 155403, "epoch": 3700} {"train_loss": -6.808382511138916, "global_step": 155404, "epoch": 3700} {"train_loss": -6.802482604980469, "global_step": 155405, "epoch": 3700} {"train_loss": -6.8602094650268555, "global_step": 155406, "epoch": 3700} {"train_loss": -6.948418617248535, "global_step": 155407, "epoch": 3700} {"train_loss": -6.941591262817383, "global_step": 155408, "epoch": 3700} {"train_loss": -6.927989482879639, "global_step": 155409, "epoch": 3700} {"train_loss": -6.6860857009887695, "global_step": 155410, "epoch": 3700} {"train_loss": -6.8972272872924805, "global_step": 155411, "epoch": 3700} {"train_loss": -6.860480308532715, "global_step": 155412, "epoch": 3700} {"train_loss": -6.745228290557861, "global_step": 155413, "epoch": 3700} {"train_loss": -6.852400779724121, "global_step": 155414, "epoch": 3700} {"train_loss": -6.780664443969727, "global_step": 155415, "epoch": 3700} {"train_loss": -6.730380058288574, "global_step": 155416, "epoch": 3700} {"train_loss": -6.810056686401367, "global_step": 155417, "epoch": 3700} {"train_loss": -6.7147650718688965, "global_step": 155418, "epoch": 3700} {"train_loss": -6.729835510253906, "global_step": 155419, "epoch": 3700} {"train_loss": -6.677911758422852, "global_step": 155420, "epoch": 3700} {"train_loss": -6.757741928100586, "global_step": 155421, "epoch": 3700} {"train_loss": -6.804527282714844, "global_step": 155422, "epoch": 3700} {"train_loss": -6.8154520988464355, "global_step": 155423, "epoch": 3700} {"train_loss": -6.861891746520996, "global_step": 155424, "epoch": 3700} {"train_loss": -6.8385820388793945, "global_step": 155425, "epoch": 3700} {"train_loss": -6.800798416137695, "global_step": 155426, "epoch": 3700} {"train_loss": -6.831271171569824, "global_step": 155427, "epoch": 3700} {"train_loss": -6.821035385131836, "global_step": 155428, "epoch": 3700} {"train_loss": -6.6917595863342285, "global_step": 155429, "epoch": 3700} {"train_loss": -6.81562614440918, "global_step": 155430, "epoch": 3700} {"train_loss": -6.7813920974731445, "global_step": 155431, "epoch": 3700} {"train_loss": -6.760802268981934, "global_step": 155432, "epoch": 3700} {"train_loss": -6.758430480957031, "global_step": 155433, "epoch": 3700} {"train_loss": -6.812295913696289, "global_step": 155434, "epoch": 3700} {"train_loss": -6.918942451477051, "global_step": 155435, "epoch": 3700} {"train_loss": -6.939075946807861, "global_step": 155436, "epoch": 3700} {"train_loss": -6.730449676513672, "global_step": 155437, "epoch": 3700} {"train_loss": -6.888108253479004, "global_step": 155438, "epoch": 3700} {"train_loss": -6.908440113067627, "global_step": 155439, "epoch": 3700} {"train_loss": -6.854241847991943, "global_step": 155440, "epoch": 3700} {"train_loss": -6.818679468972342, "global_step": 155441, "epoch": 3700, "train/sim_max_reward_0": 0.24313917395633752, "train/sim_max_reward_1": 0.9905988906144819, "train/sim_max_reward_2": 0.639896448997963, "train/sim_max_reward_3": 0.7610797460961312, "train/sim_max_reward_4": 0.9649224482023717, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.2765293669000729, "test/sim_max_reward_4400001": 0.9230831590262097, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.7321513885436004, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9139526380231893, "test/sim_max_reward_4400006": 0.9600165383422999, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9096274656365674, "test/sim_max_reward_4400010": 0.1943105413406458, "test/sim_max_reward_4400011": 0.21456391761504787, "test/sim_max_reward_4400012": 0.8316900918570777, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.4400084475233564, "test/sim_max_reward_4400015": 0.04674139228937862, "test/sim_max_reward_4400016": 0.22972247867063447, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24841167750579193, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.26537326123294314, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.9904023302512038, "test/sim_max_reward_4400025": 0.2540019315899775, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.023751812147953816, "test/sim_max_reward_4400028": 0.5869974112517277, "test/sim_max_reward_4400029": 0.7545513945323866, "test/sim_max_reward_4400030": 0.9496606335671376, "test/sim_max_reward_4400031": 0.997084805201717, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.792459768029293, "test/sim_max_reward_4400034": 0.981049277684796, "test/sim_max_reward_4400035": 0.8202186217830704, "test/sim_max_reward_4400036": 0.3365159901939442, "test/sim_max_reward_4400037": 0.9631947408840499, "test/sim_max_reward_4400038": 0.9352266103435541, "test/sim_max_reward_4400039": 0.7706784332614249, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9651165385000992, "test/sim_max_reward_4400042": 0.8858800647173656, "test/sim_max_reward_4400043": 0.941854733981719, "test/sim_max_reward_4400044": 0.9518318973796418, "test/sim_max_reward_4400045": 0.9962423807021551, "test/sim_max_reward_4400046": 0.39239299771245484, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.5869960640811617, "test/sim_max_reward_4400049": 0.8952160740908814, "train/mean_score": 0.7666061179778808, "test/mean_score": 0.5745522210506134, "val_loss": 68371.875} {"train_loss": -6.886117458343506, "global_step": 155442, "epoch": 3701} {"train_loss": -6.824034690856934, "global_step": 155443, "epoch": 3701} {"train_loss": -6.808818340301514, "global_step": 155444, "epoch": 3701} {"train_loss": -6.8545050621032715, "global_step": 155445, "epoch": 3701} {"train_loss": -6.8205485343933105, "global_step": 155446, "epoch": 3701} {"train_loss": -6.942220687866211, "global_step": 155447, "epoch": 3701} {"train_loss": -6.7490715980529785, "global_step": 155448, "epoch": 3701} {"train_loss": -6.901279926300049, "global_step": 155449, "epoch": 3701} {"train_loss": -6.7788286209106445, "global_step": 155450, "epoch": 3701} {"train_loss": -6.925556182861328, "global_step": 155451, "epoch": 3701} {"train_loss": -6.838686943054199, "global_step": 155452, "epoch": 3701} {"train_loss": -6.7725019454956055, "global_step": 155453, "epoch": 3701} {"train_loss": -6.893030166625977, "global_step": 155454, "epoch": 3701} {"train_loss": -7.003063201904297, "global_step": 155455, "epoch": 3701} {"train_loss": -6.773638725280762, "global_step": 155456, "epoch": 3701} {"train_loss": -6.701700210571289, "global_step": 155457, "epoch": 3701} {"train_loss": -6.872191429138184, "global_step": 155458, "epoch": 3701} {"train_loss": -6.815252304077148, "global_step": 155459, "epoch": 3701} {"train_loss": -6.785466194152832, "global_step": 155460, "epoch": 3701} {"train_loss": -6.775687217712402, "global_step": 155461, "epoch": 3701} {"train_loss": -6.866284370422363, "global_step": 155462, "epoch": 3701} {"train_loss": -6.876016139984131, "global_step": 155463, "epoch": 3701} {"train_loss": -6.804736614227295, "global_step": 155464, "epoch": 3701} {"train_loss": -6.777961730957031, "global_step": 155465, "epoch": 3701} {"train_loss": -6.810460090637207, "global_step": 155466, "epoch": 3701} {"train_loss": -6.828496932983398, "global_step": 155467, "epoch": 3701} {"train_loss": -6.954541206359863, "global_step": 155468, "epoch": 3701} {"train_loss": -6.873037338256836, "global_step": 155469, "epoch": 3701} {"train_loss": -6.931623458862305, "global_step": 155470, "epoch": 3701} {"train_loss": -6.918496131896973, "global_step": 155471, "epoch": 3701} {"train_loss": -6.856019973754883, "global_step": 155472, "epoch": 3701} {"train_loss": -6.949514389038086, "global_step": 155473, "epoch": 3701} {"train_loss": -6.967514514923096, "global_step": 155474, "epoch": 3701} {"train_loss": -6.941561698913574, "global_step": 155475, "epoch": 3701} {"train_loss": -6.879854202270508, "global_step": 155476, "epoch": 3701} {"train_loss": -6.89558219909668, "global_step": 155477, "epoch": 3701} {"train_loss": -6.828305721282959, "global_step": 155478, "epoch": 3701} {"train_loss": -6.924739837646484, "global_step": 155479, "epoch": 3701} {"train_loss": -6.954364776611328, "global_step": 155480, "epoch": 3701} {"train_loss": -6.95291805267334, "global_step": 155481, "epoch": 3701} {"train_loss": -6.9250640869140625, "global_step": 155482, "epoch": 3701} {"train_loss": -6.865654003052485, "global_step": 155483, "epoch": 3701, "val_loss": 68592.359375} {"train_loss": -6.768563270568848, "global_step": 155484, "epoch": 3702} {"train_loss": -6.837677001953125, "global_step": 155485, "epoch": 3702} {"train_loss": -6.899527072906494, "global_step": 155486, "epoch": 3702} {"train_loss": -6.898115158081055, "global_step": 155487, "epoch": 3702} {"train_loss": -6.869238376617432, "global_step": 155488, "epoch": 3702} {"train_loss": -6.836919784545898, "global_step": 155489, "epoch": 3702} {"train_loss": -6.903171062469482, "global_step": 155490, "epoch": 3702} {"train_loss": -6.864335060119629, "global_step": 155491, "epoch": 3702} {"train_loss": -6.857590675354004, "global_step": 155492, "epoch": 3702} {"train_loss": -6.804844379425049, "global_step": 155493, "epoch": 3702} {"train_loss": -6.828134059906006, "global_step": 155494, "epoch": 3702} {"train_loss": -7.015980243682861, "global_step": 155495, "epoch": 3702} {"train_loss": -6.958776473999023, "global_step": 155496, "epoch": 3702} {"train_loss": -6.879606246948242, "global_step": 155497, "epoch": 3702} {"train_loss": -6.832118034362793, "global_step": 155498, "epoch": 3702} {"train_loss": -7.002069473266602, "global_step": 155499, "epoch": 3702} {"train_loss": -6.9069719314575195, "global_step": 155500, "epoch": 3702} {"train_loss": -6.897112846374512, "global_step": 155501, "epoch": 3702} {"train_loss": -6.891685485839844, "global_step": 155502, "epoch": 3702} {"train_loss": -6.881856918334961, "global_step": 155503, "epoch": 3702} {"train_loss": -6.8784260749816895, "global_step": 155504, "epoch": 3702} {"train_loss": -6.90322208404541, "global_step": 155505, "epoch": 3702} {"train_loss": -6.868213653564453, "global_step": 155506, "epoch": 3702} {"train_loss": -6.831319808959961, "global_step": 155507, "epoch": 3702} {"train_loss": -7.03523063659668, "global_step": 155508, "epoch": 3702} {"train_loss": -6.881833076477051, "global_step": 155509, "epoch": 3702} {"train_loss": -6.877021312713623, "global_step": 155510, "epoch": 3702} {"train_loss": -6.943362712860107, "global_step": 155511, "epoch": 3702} {"train_loss": -6.829628944396973, "global_step": 155512, "epoch": 3702} {"train_loss": -6.9000701904296875, "global_step": 155513, "epoch": 3702} {"train_loss": -6.9330644607543945, "global_step": 155514, "epoch": 3702} {"train_loss": -6.9509806632995605, "global_step": 155515, "epoch": 3702} {"train_loss": -6.8835554122924805, "global_step": 155516, "epoch": 3702} {"train_loss": -6.907988548278809, "global_step": 155517, "epoch": 3702} {"train_loss": -6.938840866088867, "global_step": 155518, "epoch": 3702} {"train_loss": -6.794239044189453, "global_step": 155519, "epoch": 3702} {"train_loss": -6.874575614929199, "global_step": 155520, "epoch": 3702} {"train_loss": -6.899487495422363, "global_step": 155521, "epoch": 3702} {"train_loss": -6.886107921600342, "global_step": 155522, "epoch": 3702} {"train_loss": -6.857933044433594, "global_step": 155523, "epoch": 3702} {"train_loss": -6.777619361877441, "global_step": 155524, "epoch": 3702} {"train_loss": -6.884894552684965, "global_step": 155525, "epoch": 3702, "val_loss": 68651.8671875} {"train_loss": -6.88722038269043, "global_step": 155526, "epoch": 3703} {"train_loss": -6.890351295471191, "global_step": 155527, "epoch": 3703} {"train_loss": -6.915340900421143, "global_step": 155528, "epoch": 3703} {"train_loss": -6.821861267089844, "global_step": 155529, "epoch": 3703} {"train_loss": -6.853537559509277, "global_step": 155530, "epoch": 3703} {"train_loss": -6.954309463500977, "global_step": 155531, "epoch": 3703} {"train_loss": -6.944937705993652, "global_step": 155532, "epoch": 3703} {"train_loss": -6.849518775939941, "global_step": 155533, "epoch": 3703} {"train_loss": -6.904247283935547, "global_step": 155534, "epoch": 3703} {"train_loss": -6.803269386291504, "global_step": 155535, "epoch": 3703} {"train_loss": -6.951198101043701, "global_step": 155536, "epoch": 3703} {"train_loss": -6.9192681312561035, "global_step": 155537, "epoch": 3703} {"train_loss": -6.770597457885742, "global_step": 155538, "epoch": 3703} {"train_loss": -6.9006547927856445, "global_step": 155539, "epoch": 3703} {"train_loss": -7.065428256988525, "global_step": 155540, "epoch": 3703} {"train_loss": -6.906710147857666, "global_step": 155541, "epoch": 3703} {"train_loss": -6.90286922454834, "global_step": 155542, "epoch": 3703} {"train_loss": -6.767828941345215, "global_step": 155543, "epoch": 3703} {"train_loss": -6.79920768737793, "global_step": 155544, "epoch": 3703} {"train_loss": -6.86361026763916, "global_step": 155545, "epoch": 3703} {"train_loss": -6.906801700592041, "global_step": 155546, "epoch": 3703} {"train_loss": -6.868436336517334, "global_step": 155547, "epoch": 3703} {"train_loss": -6.853081703186035, "global_step": 155548, "epoch": 3703} {"train_loss": -6.833892822265625, "global_step": 155549, "epoch": 3703} {"train_loss": -6.761578559875488, "global_step": 155550, "epoch": 3703} {"train_loss": -6.898886680603027, "global_step": 155551, "epoch": 3703} {"train_loss": -6.834328651428223, "global_step": 155552, "epoch": 3703} {"train_loss": -6.713679313659668, "global_step": 155553, "epoch": 3703} {"train_loss": -6.84868049621582, "global_step": 155554, "epoch": 3703} {"train_loss": -6.720291614532471, "global_step": 155555, "epoch": 3703} {"train_loss": -6.777870178222656, "global_step": 155556, "epoch": 3703} {"train_loss": -6.909689903259277, "global_step": 155557, "epoch": 3703} {"train_loss": -6.851032257080078, "global_step": 155558, "epoch": 3703} {"train_loss": -6.740579605102539, "global_step": 155559, "epoch": 3703} {"train_loss": -6.80043888092041, "global_step": 155560, "epoch": 3703} {"train_loss": -6.8542094230651855, "global_step": 155561, "epoch": 3703} {"train_loss": -6.869225978851318, "global_step": 155562, "epoch": 3703} {"train_loss": -6.765357971191406, "global_step": 155563, "epoch": 3703} {"train_loss": -6.925175666809082, "global_step": 155564, "epoch": 3703} {"train_loss": -6.803037643432617, "global_step": 155565, "epoch": 3703} {"train_loss": -6.856162071228027, "global_step": 155566, "epoch": 3703} {"train_loss": -6.855826264335995, "global_step": 155567, "epoch": 3703, "val_loss": 68363.125} {"train_loss": -6.895249843597412, "global_step": 155568, "epoch": 3704} {"train_loss": -6.7673563957214355, "global_step": 155569, "epoch": 3704} {"train_loss": -6.74560546875, "global_step": 155570, "epoch": 3704} {"train_loss": -6.838113307952881, "global_step": 155571, "epoch": 3704} {"train_loss": -6.917358875274658, "global_step": 155572, "epoch": 3704} {"train_loss": -6.940042495727539, "global_step": 155573, "epoch": 3704} {"train_loss": -6.907473564147949, "global_step": 155574, "epoch": 3704} {"train_loss": -6.906595230102539, "global_step": 155575, "epoch": 3704} {"train_loss": -6.794523239135742, "global_step": 155576, "epoch": 3704} {"train_loss": -6.873955726623535, "global_step": 155577, "epoch": 3704} {"train_loss": -6.8151397705078125, "global_step": 155578, "epoch": 3704} {"train_loss": -6.878477573394775, "global_step": 155579, "epoch": 3704} {"train_loss": -6.965285778045654, "global_step": 155580, "epoch": 3704} {"train_loss": -6.741485595703125, "global_step": 155581, "epoch": 3704} {"train_loss": -6.783010482788086, "global_step": 155582, "epoch": 3704} {"train_loss": -6.897383213043213, "global_step": 155583, "epoch": 3704} {"train_loss": -6.831676483154297, "global_step": 155584, "epoch": 3704} {"train_loss": -6.887750625610352, "global_step": 155585, "epoch": 3704} {"train_loss": -6.8044915199279785, "global_step": 155586, "epoch": 3704} {"train_loss": -6.8707733154296875, "global_step": 155587, "epoch": 3704} {"train_loss": -6.819333076477051, "global_step": 155588, "epoch": 3704} {"train_loss": -6.876090049743652, "global_step": 155589, "epoch": 3704} {"train_loss": -6.855191230773926, "global_step": 155590, "epoch": 3704} {"train_loss": -6.835894584655762, "global_step": 155591, "epoch": 3704} {"train_loss": -6.921469688415527, "global_step": 155592, "epoch": 3704} {"train_loss": -6.832712173461914, "global_step": 155593, "epoch": 3704} {"train_loss": -6.795271873474121, "global_step": 155594, "epoch": 3704} {"train_loss": -6.83650541305542, "global_step": 155595, "epoch": 3704} {"train_loss": -6.87506628036499, "global_step": 155596, "epoch": 3704} {"train_loss": -6.980362892150879, "global_step": 155597, "epoch": 3704} {"train_loss": -6.825987339019775, "global_step": 155598, "epoch": 3704} {"train_loss": -6.885709762573242, "global_step": 155599, "epoch": 3704} {"train_loss": -6.92214822769165, "global_step": 155600, "epoch": 3704} {"train_loss": -6.931240081787109, "global_step": 155601, "epoch": 3704} {"train_loss": -6.861952781677246, "global_step": 155602, "epoch": 3704} {"train_loss": -6.84382438659668, "global_step": 155603, "epoch": 3704} {"train_loss": -6.857424736022949, "global_step": 155604, "epoch": 3704} {"train_loss": -6.856342315673828, "global_step": 155605, "epoch": 3704} {"train_loss": -6.90831184387207, "global_step": 155606, "epoch": 3704} {"train_loss": -6.903520584106445, "global_step": 155607, "epoch": 3704} {"train_loss": -6.865233421325684, "global_step": 155608, "epoch": 3704} {"train_loss": -6.86251213437035, "global_step": 155609, "epoch": 3704, "val_loss": 68440.1953125} {"train_loss": -6.719259262084961, "global_step": 155610, "epoch": 3705} {"train_loss": -6.790355682373047, "global_step": 155611, "epoch": 3705} {"train_loss": -6.879217147827148, "global_step": 155612, "epoch": 3705} {"train_loss": -6.776140213012695, "global_step": 155613, "epoch": 3705} {"train_loss": -6.802426338195801, "global_step": 155614, "epoch": 3705} {"train_loss": -6.901102542877197, "global_step": 155615, "epoch": 3705} {"train_loss": -6.829354286193848, "global_step": 155616, "epoch": 3705} {"train_loss": -6.857176780700684, "global_step": 155617, "epoch": 3705} {"train_loss": -6.737215042114258, "global_step": 155618, "epoch": 3705} {"train_loss": -6.806268215179443, "global_step": 155619, "epoch": 3705} {"train_loss": -6.80996036529541, "global_step": 155620, "epoch": 3705} {"train_loss": -6.783174514770508, "global_step": 155621, "epoch": 3705} {"train_loss": -6.906053066253662, "global_step": 155622, "epoch": 3705} {"train_loss": -6.8221354484558105, "global_step": 155623, "epoch": 3705} {"train_loss": -6.8127031326293945, "global_step": 155624, "epoch": 3705} {"train_loss": -6.773054122924805, "global_step": 155625, "epoch": 3705} {"train_loss": -6.787057876586914, "global_step": 155626, "epoch": 3705} {"train_loss": -6.799549102783203, "global_step": 155627, "epoch": 3705} {"train_loss": -6.819662570953369, "global_step": 155628, "epoch": 3705} {"train_loss": -6.855861186981201, "global_step": 155629, "epoch": 3705} {"train_loss": -6.751938819885254, "global_step": 155630, "epoch": 3705} {"train_loss": -6.76857852935791, "global_step": 155631, "epoch": 3705} {"train_loss": -6.7924394607543945, "global_step": 155632, "epoch": 3705} {"train_loss": -6.693263053894043, "global_step": 155633, "epoch": 3705} {"train_loss": -6.7824859619140625, "global_step": 155634, "epoch": 3705} {"train_loss": -6.826183319091797, "global_step": 155635, "epoch": 3705} {"train_loss": -6.649831295013428, "global_step": 155636, "epoch": 3705} {"train_loss": -6.748147010803223, "global_step": 155637, "epoch": 3705} {"train_loss": -6.632102012634277, "global_step": 155638, "epoch": 3705} {"train_loss": -6.8784027099609375, "global_step": 155639, "epoch": 3705} {"train_loss": -6.903442859649658, "global_step": 155640, "epoch": 3705} {"train_loss": -6.9756879806518555, "global_step": 155641, "epoch": 3705} {"train_loss": -6.637155532836914, "global_step": 155642, "epoch": 3705} {"train_loss": -6.72597074508667, "global_step": 155643, "epoch": 3705} {"train_loss": -6.718172073364258, "global_step": 155644, "epoch": 3705} {"train_loss": -6.728411674499512, "global_step": 155645, "epoch": 3705} {"train_loss": -6.736885070800781, "global_step": 155646, "epoch": 3705} {"train_loss": -6.767292022705078, "global_step": 155647, "epoch": 3705} {"train_loss": -6.826948642730713, "global_step": 155648, "epoch": 3705} {"train_loss": -6.696071147918701, "global_step": 155649, "epoch": 3705} {"train_loss": -6.791014671325684, "global_step": 155650, "epoch": 3705} {"train_loss": -6.789586044493175, "global_step": 155651, "epoch": 3705, "val_loss": 68446.421875} {"train_loss": -6.813741683959961, "global_step": 155652, "epoch": 3706} {"train_loss": -6.9326171875, "global_step": 155653, "epoch": 3706} {"train_loss": -6.816077709197998, "global_step": 155654, "epoch": 3706} {"train_loss": -6.911096572875977, "global_step": 155655, "epoch": 3706} {"train_loss": -6.892181396484375, "global_step": 155656, "epoch": 3706} {"train_loss": -6.85981559753418, "global_step": 155657, "epoch": 3706} {"train_loss": -6.873301982879639, "global_step": 155658, "epoch": 3706} {"train_loss": -6.870441913604736, "global_step": 155659, "epoch": 3706} {"train_loss": -6.89304256439209, "global_step": 155660, "epoch": 3706} {"train_loss": -6.92148494720459, "global_step": 155661, "epoch": 3706} {"train_loss": -6.7696852684021, "global_step": 155662, "epoch": 3706} {"train_loss": -6.933292388916016, "global_step": 155663, "epoch": 3706} {"train_loss": -6.92488956451416, "global_step": 155664, "epoch": 3706} {"train_loss": -6.878389358520508, "global_step": 155665, "epoch": 3706} {"train_loss": -6.8181657791137695, "global_step": 155666, "epoch": 3706} {"train_loss": -6.847085952758789, "global_step": 155667, "epoch": 3706} {"train_loss": -6.877964973449707, "global_step": 155668, "epoch": 3706} {"train_loss": -6.877631187438965, "global_step": 155669, "epoch": 3706} {"train_loss": -6.9316020011901855, "global_step": 155670, "epoch": 3706} {"train_loss": -6.713202476501465, "global_step": 155671, "epoch": 3706} {"train_loss": -6.704777717590332, "global_step": 155672, "epoch": 3706} {"train_loss": -6.845864772796631, "global_step": 155673, "epoch": 3706} {"train_loss": -6.885515213012695, "global_step": 155674, "epoch": 3706} {"train_loss": -6.715701103210449, "global_step": 155675, "epoch": 3706} {"train_loss": -6.821295261383057, "global_step": 155676, "epoch": 3706} {"train_loss": -6.681126594543457, "global_step": 155677, "epoch": 3706} {"train_loss": -6.784478187561035, "global_step": 155678, "epoch": 3706} {"train_loss": -6.823665618896484, "global_step": 155679, "epoch": 3706} {"train_loss": -6.82621431350708, "global_step": 155680, "epoch": 3706} {"train_loss": -6.875664710998535, "global_step": 155681, "epoch": 3706} {"train_loss": -6.706170082092285, "global_step": 155682, "epoch": 3706} {"train_loss": -6.849064826965332, "global_step": 155683, "epoch": 3706} {"train_loss": -6.890280246734619, "global_step": 155684, "epoch": 3706} {"train_loss": -6.74232292175293, "global_step": 155685, "epoch": 3706} {"train_loss": -6.865830898284912, "global_step": 155686, "epoch": 3706} {"train_loss": -6.970162868499756, "global_step": 155687, "epoch": 3706} {"train_loss": -6.9375410079956055, "global_step": 155688, "epoch": 3706} {"train_loss": -6.862885475158691, "global_step": 155689, "epoch": 3706} {"train_loss": -6.875367641448975, "global_step": 155690, "epoch": 3706} {"train_loss": -6.841510772705078, "global_step": 155691, "epoch": 3706} {"train_loss": -6.765384197235107, "global_step": 155692, "epoch": 3706} {"train_loss": -6.8441877365112305, "global_step": 155693, "epoch": 3706, "val_loss": 68633.7109375} {"train_loss": -6.869966506958008, "global_step": 155694, "epoch": 3707} {"train_loss": -6.880800247192383, "global_step": 155695, "epoch": 3707} {"train_loss": -6.853765487670898, "global_step": 155696, "epoch": 3707} {"train_loss": -6.900993347167969, "global_step": 155697, "epoch": 3707} {"train_loss": -6.858814716339111, "global_step": 155698, "epoch": 3707} {"train_loss": -6.917859077453613, "global_step": 155699, "epoch": 3707} {"train_loss": -6.7950968742370605, "global_step": 155700, "epoch": 3707} {"train_loss": -6.8632612228393555, "global_step": 155701, "epoch": 3707} {"train_loss": -6.867465972900391, "global_step": 155702, "epoch": 3707} {"train_loss": -6.764091491699219, "global_step": 155703, "epoch": 3707} {"train_loss": -6.7448039054870605, "global_step": 155704, "epoch": 3707} {"train_loss": -6.849242687225342, "global_step": 155705, "epoch": 3707} {"train_loss": -6.910236358642578, "global_step": 155706, "epoch": 3707} {"train_loss": -6.862156867980957, "global_step": 155707, "epoch": 3707} {"train_loss": -6.777893543243408, "global_step": 155708, "epoch": 3707} {"train_loss": -6.779438018798828, "global_step": 155709, "epoch": 3707} {"train_loss": -6.764808654785156, "global_step": 155710, "epoch": 3707} {"train_loss": -6.772900581359863, "global_step": 155711, "epoch": 3707} {"train_loss": -6.939069747924805, "global_step": 155712, "epoch": 3707} {"train_loss": -6.828948020935059, "global_step": 155713, "epoch": 3707} {"train_loss": -6.839329719543457, "global_step": 155714, "epoch": 3707} {"train_loss": -6.8212127685546875, "global_step": 155715, "epoch": 3707} {"train_loss": -6.653376579284668, "global_step": 155716, "epoch": 3707} {"train_loss": -6.856891632080078, "global_step": 155717, "epoch": 3707} {"train_loss": -6.799783229827881, "global_step": 155718, "epoch": 3707} {"train_loss": -6.787880897521973, "global_step": 155719, "epoch": 3707} {"train_loss": -6.913745880126953, "global_step": 155720, "epoch": 3707} {"train_loss": -6.768582344055176, "global_step": 155721, "epoch": 3707} {"train_loss": -6.756429195404053, "global_step": 155722, "epoch": 3707} {"train_loss": -6.761868476867676, "global_step": 155723, "epoch": 3707} {"train_loss": -6.881610870361328, "global_step": 155724, "epoch": 3707} {"train_loss": -6.915738582611084, "global_step": 155725, "epoch": 3707} {"train_loss": -6.830324172973633, "global_step": 155726, "epoch": 3707} {"train_loss": -6.780959129333496, "global_step": 155727, "epoch": 3707} {"train_loss": -6.766931533813477, "global_step": 155728, "epoch": 3707} {"train_loss": -6.794325828552246, "global_step": 155729, "epoch": 3707} {"train_loss": -6.708707809448242, "global_step": 155730, "epoch": 3707} {"train_loss": -6.9008588790893555, "global_step": 155731, "epoch": 3707} {"train_loss": -6.7901105880737305, "global_step": 155732, "epoch": 3707} {"train_loss": -6.814436435699463, "global_step": 155733, "epoch": 3707} {"train_loss": -6.753547191619873, "global_step": 155734, "epoch": 3707} {"train_loss": -6.819427512940907, "global_step": 155735, "epoch": 3707, "val_loss": 68609.484375} {"train_loss": -6.906454563140869, "global_step": 155736, "epoch": 3708} {"train_loss": -6.82759952545166, "global_step": 155737, "epoch": 3708} {"train_loss": -6.741804122924805, "global_step": 155738, "epoch": 3708} {"train_loss": -6.917430877685547, "global_step": 155739, "epoch": 3708} {"train_loss": -6.880566120147705, "global_step": 155740, "epoch": 3708} {"train_loss": -6.757979393005371, "global_step": 155741, "epoch": 3708} {"train_loss": -6.923771858215332, "global_step": 155742, "epoch": 3708} {"train_loss": -6.8497538566589355, "global_step": 155743, "epoch": 3708} {"train_loss": -6.810634613037109, "global_step": 155744, "epoch": 3708} {"train_loss": -6.789802551269531, "global_step": 155745, "epoch": 3708} {"train_loss": -6.836071968078613, "global_step": 155746, "epoch": 3708} {"train_loss": -6.826778888702393, "global_step": 155747, "epoch": 3708} {"train_loss": -6.818954944610596, "global_step": 155748, "epoch": 3708} {"train_loss": -6.803545951843262, "global_step": 155749, "epoch": 3708} {"train_loss": -6.890607833862305, "global_step": 155750, "epoch": 3708} {"train_loss": -6.763664245605469, "global_step": 155751, "epoch": 3708} {"train_loss": -6.847960472106934, "global_step": 155752, "epoch": 3708} {"train_loss": -6.892409324645996, "global_step": 155753, "epoch": 3708} {"train_loss": -6.827980041503906, "global_step": 155754, "epoch": 3708} {"train_loss": -6.780509948730469, "global_step": 155755, "epoch": 3708} {"train_loss": -6.822463512420654, "global_step": 155756, "epoch": 3708} {"train_loss": -6.808536529541016, "global_step": 155757, "epoch": 3708} {"train_loss": -7.00219202041626, "global_step": 155758, "epoch": 3708} {"train_loss": -6.82890510559082, "global_step": 155759, "epoch": 3708} {"train_loss": -6.843186378479004, "global_step": 155760, "epoch": 3708} {"train_loss": -6.700392723083496, "global_step": 155761, "epoch": 3708} {"train_loss": -6.796173095703125, "global_step": 155762, "epoch": 3708} {"train_loss": -6.880043983459473, "global_step": 155763, "epoch": 3708} {"train_loss": -6.8852643966674805, "global_step": 155764, "epoch": 3708} {"train_loss": -6.969598770141602, "global_step": 155765, "epoch": 3708} {"train_loss": -6.866584300994873, "global_step": 155766, "epoch": 3708} {"train_loss": -6.995543956756592, "global_step": 155767, "epoch": 3708} {"train_loss": -6.8625078201293945, "global_step": 155768, "epoch": 3708} {"train_loss": -6.918177604675293, "global_step": 155769, "epoch": 3708} {"train_loss": -6.897380828857422, "global_step": 155770, "epoch": 3708} {"train_loss": -6.791245460510254, "global_step": 155771, "epoch": 3708} {"train_loss": -6.846733093261719, "global_step": 155772, "epoch": 3708} {"train_loss": -6.9145097732543945, "global_step": 155773, "epoch": 3708} {"train_loss": -6.78306245803833, "global_step": 155774, "epoch": 3708} {"train_loss": -6.942624092102051, "global_step": 155775, "epoch": 3708} {"train_loss": -6.9346818923950195, "global_step": 155776, "epoch": 3708} {"train_loss": -6.855761596134731, "global_step": 155777, "epoch": 3708, "val_loss": 68593.421875} {"train_loss": -6.927655220031738, "global_step": 155778, "epoch": 3709} {"train_loss": -6.937076568603516, "global_step": 155779, "epoch": 3709} {"train_loss": -6.973480224609375, "global_step": 155780, "epoch": 3709} {"train_loss": -6.9422149658203125, "global_step": 155781, "epoch": 3709} {"train_loss": -6.897934913635254, "global_step": 155782, "epoch": 3709} {"train_loss": -6.835074424743652, "global_step": 155783, "epoch": 3709} {"train_loss": -6.90657901763916, "global_step": 155784, "epoch": 3709} {"train_loss": -6.872515678405762, "global_step": 155785, "epoch": 3709} {"train_loss": -6.973238468170166, "global_step": 155786, "epoch": 3709} {"train_loss": -6.887648105621338, "global_step": 155787, "epoch": 3709} {"train_loss": -6.846546173095703, "global_step": 155788, "epoch": 3709} {"train_loss": -6.90785026550293, "global_step": 155789, "epoch": 3709} {"train_loss": -6.789447784423828, "global_step": 155790, "epoch": 3709} {"train_loss": -6.9431962966918945, "global_step": 155791, "epoch": 3709} {"train_loss": -6.828750133514404, "global_step": 155792, "epoch": 3709} {"train_loss": -6.911160469055176, "global_step": 155793, "epoch": 3709} {"train_loss": -6.911645889282227, "global_step": 155794, "epoch": 3709} {"train_loss": -6.890630722045898, "global_step": 155795, "epoch": 3709} {"train_loss": -6.904552459716797, "global_step": 155796, "epoch": 3709} {"train_loss": -6.825860023498535, "global_step": 155797, "epoch": 3709} {"train_loss": -6.689302444458008, "global_step": 155798, "epoch": 3709} {"train_loss": -6.8844194412231445, "global_step": 155799, "epoch": 3709} {"train_loss": -6.898399353027344, "global_step": 155800, "epoch": 3709} {"train_loss": -6.725380897521973, "global_step": 155801, "epoch": 3709} {"train_loss": -6.955540180206299, "global_step": 155802, "epoch": 3709} {"train_loss": -6.803692817687988, "global_step": 155803, "epoch": 3709} {"train_loss": -6.668076515197754, "global_step": 155804, "epoch": 3709} {"train_loss": -6.903543472290039, "global_step": 155805, "epoch": 3709} {"train_loss": -6.882946491241455, "global_step": 155806, "epoch": 3709} {"train_loss": -6.858785152435303, "global_step": 155807, "epoch": 3709} {"train_loss": -6.903931617736816, "global_step": 155808, "epoch": 3709} {"train_loss": -6.634860038757324, "global_step": 155809, "epoch": 3709} {"train_loss": -6.948137283325195, "global_step": 155810, "epoch": 3709} {"train_loss": -6.877658843994141, "global_step": 155811, "epoch": 3709} {"train_loss": -6.935539245605469, "global_step": 155812, "epoch": 3709} {"train_loss": -6.803400039672852, "global_step": 155813, "epoch": 3709} {"train_loss": -6.8340020179748535, "global_step": 155814, "epoch": 3709} {"train_loss": -6.940634727478027, "global_step": 155815, "epoch": 3709} {"train_loss": -6.8865532875061035, "global_step": 155816, "epoch": 3709} {"train_loss": -6.872372150421143, "global_step": 155817, "epoch": 3709} {"train_loss": -6.792985916137695, "global_step": 155818, "epoch": 3709} {"train_loss": -6.865798813956125, "global_step": 155819, "epoch": 3709, "val_loss": 68597.3359375} {"train_loss": -6.810708999633789, "global_step": 155820, "epoch": 3710} {"train_loss": -6.945179462432861, "global_step": 155821, "epoch": 3710} {"train_loss": -6.771470546722412, "global_step": 155822, "epoch": 3710} {"train_loss": -6.7647013664245605, "global_step": 155823, "epoch": 3710} {"train_loss": -6.774015426635742, "global_step": 155824, "epoch": 3710} {"train_loss": -6.950746536254883, "global_step": 155825, "epoch": 3710} {"train_loss": -6.765073776245117, "global_step": 155826, "epoch": 3710} {"train_loss": -6.906852722167969, "global_step": 155827, "epoch": 3710} {"train_loss": -6.9275102615356445, "global_step": 155828, "epoch": 3710} {"train_loss": -6.840480804443359, "global_step": 155829, "epoch": 3710} {"train_loss": -6.772982597351074, "global_step": 155830, "epoch": 3710} {"train_loss": -6.841106414794922, "global_step": 155831, "epoch": 3710} {"train_loss": -6.954463005065918, "global_step": 155832, "epoch": 3710} {"train_loss": -6.944793224334717, "global_step": 155833, "epoch": 3710} {"train_loss": -6.8002519607543945, "global_step": 155834, "epoch": 3710} {"train_loss": -6.9743733406066895, "global_step": 155835, "epoch": 3710} {"train_loss": -6.75313663482666, "global_step": 155836, "epoch": 3710} {"train_loss": -6.770990371704102, "global_step": 155837, "epoch": 3710} {"train_loss": -6.9113359451293945, "global_step": 155838, "epoch": 3710} {"train_loss": -6.8247575759887695, "global_step": 155839, "epoch": 3710} {"train_loss": -6.877577304840088, "global_step": 155840, "epoch": 3710} {"train_loss": -6.832080841064453, "global_step": 155841, "epoch": 3710} {"train_loss": -6.935535430908203, "global_step": 155842, "epoch": 3710} {"train_loss": -7.000630855560303, "global_step": 155843, "epoch": 3710} {"train_loss": -6.927197456359863, "global_step": 155844, "epoch": 3710} {"train_loss": -6.831029415130615, "global_step": 155845, "epoch": 3710} {"train_loss": -6.907889366149902, "global_step": 155846, "epoch": 3710} {"train_loss": -6.889082431793213, "global_step": 155847, "epoch": 3710} {"train_loss": -6.944027423858643, "global_step": 155848, "epoch": 3710} {"train_loss": -6.882629871368408, "global_step": 155849, "epoch": 3710} {"train_loss": -6.8736371994018555, "global_step": 155850, "epoch": 3710} {"train_loss": -6.997673034667969, "global_step": 155851, "epoch": 3710} {"train_loss": -6.8625688552856445, "global_step": 155852, "epoch": 3710} {"train_loss": -6.932880401611328, "global_step": 155853, "epoch": 3710} {"train_loss": -6.828044891357422, "global_step": 155854, "epoch": 3710} {"train_loss": -6.875776767730713, "global_step": 155855, "epoch": 3710} {"train_loss": -6.977905750274658, "global_step": 155856, "epoch": 3710} {"train_loss": -6.830951690673828, "global_step": 155857, "epoch": 3710} {"train_loss": -6.904294490814209, "global_step": 155858, "epoch": 3710} {"train_loss": -6.953068256378174, "global_step": 155859, "epoch": 3710} {"train_loss": -6.801230430603027, "global_step": 155860, "epoch": 3710} {"train_loss": -6.877771150498163, "global_step": 155861, "epoch": 3710, "val_loss": 68504.1875} {"train_loss": -6.850141525268555, "global_step": 155862, "epoch": 3711} {"train_loss": -6.927433967590332, "global_step": 155863, "epoch": 3711} {"train_loss": -6.965747833251953, "global_step": 155864, "epoch": 3711} {"train_loss": -6.885727882385254, "global_step": 155865, "epoch": 3711} {"train_loss": -6.840142250061035, "global_step": 155866, "epoch": 3711} {"train_loss": -6.874479293823242, "global_step": 155867, "epoch": 3711} {"train_loss": -6.9445905685424805, "global_step": 155868, "epoch": 3711} {"train_loss": -6.875668525695801, "global_step": 155869, "epoch": 3711} {"train_loss": -6.844010353088379, "global_step": 155870, "epoch": 3711} {"train_loss": -6.873619079589844, "global_step": 155871, "epoch": 3711} {"train_loss": -6.924760818481445, "global_step": 155872, "epoch": 3711} {"train_loss": -6.801048278808594, "global_step": 155873, "epoch": 3711} {"train_loss": -6.92411994934082, "global_step": 155874, "epoch": 3711} {"train_loss": -6.890820503234863, "global_step": 155875, "epoch": 3711} {"train_loss": -6.802802085876465, "global_step": 155876, "epoch": 3711} {"train_loss": -6.848455429077148, "global_step": 155877, "epoch": 3711} {"train_loss": -6.9241437911987305, "global_step": 155878, "epoch": 3711} {"train_loss": -6.772103309631348, "global_step": 155879, "epoch": 3711} {"train_loss": -6.847805023193359, "global_step": 155880, "epoch": 3711} {"train_loss": -6.767383098602295, "global_step": 155881, "epoch": 3711} {"train_loss": -6.69303035736084, "global_step": 155882, "epoch": 3711} {"train_loss": -6.774806976318359, "global_step": 155883, "epoch": 3711} {"train_loss": -6.817474365234375, "global_step": 155884, "epoch": 3711} {"train_loss": -6.821722984313965, "global_step": 155885, "epoch": 3711} {"train_loss": -6.755305767059326, "global_step": 155886, "epoch": 3711} {"train_loss": -6.956737518310547, "global_step": 155887, "epoch": 3711} {"train_loss": -6.889063835144043, "global_step": 155888, "epoch": 3711} {"train_loss": -6.763213157653809, "global_step": 155889, "epoch": 3711} {"train_loss": -6.828619956970215, "global_step": 155890, "epoch": 3711} {"train_loss": -6.675278663635254, "global_step": 155891, "epoch": 3711} {"train_loss": -6.728305816650391, "global_step": 155892, "epoch": 3711} {"train_loss": -6.699108600616455, "global_step": 155893, "epoch": 3711} {"train_loss": -6.695134162902832, "global_step": 155894, "epoch": 3711} {"train_loss": -6.736171722412109, "global_step": 155895, "epoch": 3711} {"train_loss": -6.647772789001465, "global_step": 155896, "epoch": 3711} {"train_loss": -6.859591960906982, "global_step": 155897, "epoch": 3711} {"train_loss": -6.614965438842773, "global_step": 155898, "epoch": 3711} {"train_loss": -6.897272109985352, "global_step": 155899, "epoch": 3711} {"train_loss": -6.630499362945557, "global_step": 155900, "epoch": 3711} {"train_loss": -6.8476409912109375, "global_step": 155901, "epoch": 3711} {"train_loss": -6.720312595367432, "global_step": 155902, "epoch": 3711} {"train_loss": -6.8136503128778365, "global_step": 155903, "epoch": 3711, "val_loss": 68602.9375} {"train_loss": -6.766327857971191, "global_step": 155904, "epoch": 3712} {"train_loss": -6.824244499206543, "global_step": 155905, "epoch": 3712} {"train_loss": -6.706199645996094, "global_step": 155906, "epoch": 3712} {"train_loss": -6.775294303894043, "global_step": 155907, "epoch": 3712} {"train_loss": -6.8007941246032715, "global_step": 155908, "epoch": 3712} {"train_loss": -6.811122417449951, "global_step": 155909, "epoch": 3712} {"train_loss": -6.804938793182373, "global_step": 155910, "epoch": 3712} {"train_loss": -6.78267765045166, "global_step": 155911, "epoch": 3712} {"train_loss": -6.9166436195373535, "global_step": 155912, "epoch": 3712} {"train_loss": -6.948999404907227, "global_step": 155913, "epoch": 3712} {"train_loss": -6.871983528137207, "global_step": 155914, "epoch": 3712} {"train_loss": -6.820574760437012, "global_step": 155915, "epoch": 3712} {"train_loss": -6.927496910095215, "global_step": 155916, "epoch": 3712} {"train_loss": -6.882336616516113, "global_step": 155917, "epoch": 3712} {"train_loss": -6.944341659545898, "global_step": 155918, "epoch": 3712} {"train_loss": -6.868462085723877, "global_step": 155919, "epoch": 3712} {"train_loss": -6.850725173950195, "global_step": 155920, "epoch": 3712} {"train_loss": -6.929196357727051, "global_step": 155921, "epoch": 3712} {"train_loss": -7.022042274475098, "global_step": 155922, "epoch": 3712} {"train_loss": -6.955956935882568, "global_step": 155923, "epoch": 3712} {"train_loss": -6.94283390045166, "global_step": 155924, "epoch": 3712} {"train_loss": -7.052770614624023, "global_step": 155925, "epoch": 3712} {"train_loss": -6.944178104400635, "global_step": 155926, "epoch": 3712} {"train_loss": -6.935651779174805, "global_step": 155927, "epoch": 3712} {"train_loss": -6.915677070617676, "global_step": 155928, "epoch": 3712} {"train_loss": -6.87013578414917, "global_step": 155929, "epoch": 3712} {"train_loss": -6.932408332824707, "global_step": 155930, "epoch": 3712} {"train_loss": -6.948486328125, "global_step": 155931, "epoch": 3712} {"train_loss": -6.880704879760742, "global_step": 155932, "epoch": 3712} {"train_loss": -6.886466026306152, "global_step": 155933, "epoch": 3712} {"train_loss": -6.94166374206543, "global_step": 155934, "epoch": 3712} {"train_loss": -6.8117828369140625, "global_step": 155935, "epoch": 3712} {"train_loss": -6.82785177230835, "global_step": 155936, "epoch": 3712} {"train_loss": -6.9591803550720215, "global_step": 155937, "epoch": 3712} {"train_loss": -6.945498466491699, "global_step": 155938, "epoch": 3712} {"train_loss": -6.921977519989014, "global_step": 155939, "epoch": 3712} {"train_loss": -6.816418647766113, "global_step": 155940, "epoch": 3712} {"train_loss": -6.8160400390625, "global_step": 155941, "epoch": 3712} {"train_loss": -6.884847640991211, "global_step": 155942, "epoch": 3712} {"train_loss": -6.870588302612305, "global_step": 155943, "epoch": 3712} {"train_loss": -6.868264198303223, "global_step": 155944, "epoch": 3712} {"train_loss": -6.883392719995408, "global_step": 155945, "epoch": 3712, "val_loss": 68418.296875} {"train_loss": -6.884181976318359, "global_step": 155946, "epoch": 3713} {"train_loss": -6.874853134155273, "global_step": 155947, "epoch": 3713} {"train_loss": -6.981819152832031, "global_step": 155948, "epoch": 3713} {"train_loss": -6.9010467529296875, "global_step": 155949, "epoch": 3713} {"train_loss": -6.914071559906006, "global_step": 155950, "epoch": 3713} {"train_loss": -6.83079719543457, "global_step": 155951, "epoch": 3713} {"train_loss": -6.9257612228393555, "global_step": 155952, "epoch": 3713} {"train_loss": -6.894782543182373, "global_step": 155953, "epoch": 3713} {"train_loss": -6.854780197143555, "global_step": 155954, "epoch": 3713} {"train_loss": -6.904061794281006, "global_step": 155955, "epoch": 3713} {"train_loss": -6.921186447143555, "global_step": 155956, "epoch": 3713} {"train_loss": -6.977733612060547, "global_step": 155957, "epoch": 3713} {"train_loss": -6.891861915588379, "global_step": 155958, "epoch": 3713} {"train_loss": -6.829265117645264, "global_step": 155959, "epoch": 3713} {"train_loss": -6.719319820404053, "global_step": 155960, "epoch": 3713} {"train_loss": -6.8717498779296875, "global_step": 155961, "epoch": 3713} {"train_loss": -6.8444085121154785, "global_step": 155962, "epoch": 3713} {"train_loss": -6.706796169281006, "global_step": 155963, "epoch": 3713} {"train_loss": -6.823147773742676, "global_step": 155964, "epoch": 3713} {"train_loss": -6.745761871337891, "global_step": 155965, "epoch": 3713} {"train_loss": -6.824995994567871, "global_step": 155966, "epoch": 3713} {"train_loss": -6.929563522338867, "global_step": 155967, "epoch": 3713} {"train_loss": -6.7735514640808105, "global_step": 155968, "epoch": 3713} {"train_loss": -6.698019981384277, "global_step": 155969, "epoch": 3713} {"train_loss": -6.739733695983887, "global_step": 155970, "epoch": 3713} {"train_loss": -6.549227714538574, "global_step": 155971, "epoch": 3713} {"train_loss": -6.838599681854248, "global_step": 155972, "epoch": 3713} {"train_loss": -6.820250034332275, "global_step": 155973, "epoch": 3713} {"train_loss": -6.830857753753662, "global_step": 155974, "epoch": 3713} {"train_loss": -6.597599983215332, "global_step": 155975, "epoch": 3713} {"train_loss": -6.754563331604004, "global_step": 155976, "epoch": 3713} {"train_loss": -6.63391637802124, "global_step": 155977, "epoch": 3713} {"train_loss": -6.723504543304443, "global_step": 155978, "epoch": 3713} {"train_loss": -6.756776332855225, "global_step": 155979, "epoch": 3713} {"train_loss": -6.967643737792969, "global_step": 155980, "epoch": 3713} {"train_loss": -6.72995662689209, "global_step": 155981, "epoch": 3713} {"train_loss": -6.873304843902588, "global_step": 155982, "epoch": 3713} {"train_loss": -6.802194595336914, "global_step": 155983, "epoch": 3713} {"train_loss": -6.799404144287109, "global_step": 155984, "epoch": 3713} {"train_loss": -6.8230085372924805, "global_step": 155985, "epoch": 3713} {"train_loss": -6.88494873046875, "global_step": 155986, "epoch": 3713} {"train_loss": -6.819595984050205, "global_step": 155987, "epoch": 3713, "val_loss": 68397.640625} {"train_loss": -6.847480297088623, "global_step": 155988, "epoch": 3714} {"train_loss": -6.817564010620117, "global_step": 155989, "epoch": 3714} {"train_loss": -6.863399028778076, "global_step": 155990, "epoch": 3714} {"train_loss": -6.947511672973633, "global_step": 155991, "epoch": 3714} {"train_loss": -6.784878730773926, "global_step": 155992, "epoch": 3714} {"train_loss": -6.886484146118164, "global_step": 155993, "epoch": 3714} {"train_loss": -6.881054878234863, "global_step": 155994, "epoch": 3714} {"train_loss": -6.868218898773193, "global_step": 155995, "epoch": 3714} {"train_loss": -7.00314998626709, "global_step": 155996, "epoch": 3714} {"train_loss": -6.925747394561768, "global_step": 155997, "epoch": 3714} {"train_loss": -6.9703216552734375, "global_step": 155998, "epoch": 3714} {"train_loss": -6.852781295776367, "global_step": 155999, "epoch": 3714} {"train_loss": -6.9067254066467285, "global_step": 156000, "epoch": 3714} {"train_loss": -6.8174214363098145, "global_step": 156001, "epoch": 3714} {"train_loss": -6.921191215515137, "global_step": 156002, "epoch": 3714} {"train_loss": -6.892437934875488, "global_step": 156003, "epoch": 3714} {"train_loss": -6.813716888427734, "global_step": 156004, "epoch": 3714} {"train_loss": -6.884722709655762, "global_step": 156005, "epoch": 3714} {"train_loss": -6.803177356719971, "global_step": 156006, "epoch": 3714} {"train_loss": -6.790970802307129, "global_step": 156007, "epoch": 3714} {"train_loss": -6.888582706451416, "global_step": 156008, "epoch": 3714} {"train_loss": -6.919988632202148, "global_step": 156009, "epoch": 3714} {"train_loss": -6.820569038391113, "global_step": 156010, "epoch": 3714} {"train_loss": -6.888840198516846, "global_step": 156011, "epoch": 3714} {"train_loss": -6.869848251342773, "global_step": 156012, "epoch": 3714} {"train_loss": -6.852542877197266, "global_step": 156013, "epoch": 3714} {"train_loss": -6.896228790283203, "global_step": 156014, "epoch": 3714} {"train_loss": -6.924847602844238, "global_step": 156015, "epoch": 3714} {"train_loss": -6.976335525512695, "global_step": 156016, "epoch": 3714} {"train_loss": -6.795828819274902, "global_step": 156017, "epoch": 3714} {"train_loss": -6.980584144592285, "global_step": 156018, "epoch": 3714} {"train_loss": -7.001257419586182, "global_step": 156019, "epoch": 3714} {"train_loss": -6.8361406326293945, "global_step": 156020, "epoch": 3714} {"train_loss": -6.954384803771973, "global_step": 156021, "epoch": 3714} {"train_loss": -6.796860694885254, "global_step": 156022, "epoch": 3714} {"train_loss": -6.909365653991699, "global_step": 156023, "epoch": 3714} {"train_loss": -6.882647514343262, "global_step": 156024, "epoch": 3714} {"train_loss": -6.9411492347717285, "global_step": 156025, "epoch": 3714} {"train_loss": -6.933998107910156, "global_step": 156026, "epoch": 3714} {"train_loss": -6.967593193054199, "global_step": 156027, "epoch": 3714} {"train_loss": -6.9277424812316895, "global_step": 156028, "epoch": 3714} {"train_loss": -6.888989028476534, "global_step": 156029, "epoch": 3714, "val_loss": 68440.8984375} {"train_loss": -6.907064914703369, "global_step": 156030, "epoch": 3715} {"train_loss": -6.871114730834961, "global_step": 156031, "epoch": 3715} {"train_loss": -6.961777210235596, "global_step": 156032, "epoch": 3715} {"train_loss": -6.78719425201416, "global_step": 156033, "epoch": 3715} {"train_loss": -6.990372180938721, "global_step": 156034, "epoch": 3715} {"train_loss": -6.827221870422363, "global_step": 156035, "epoch": 3715} {"train_loss": -6.970828056335449, "global_step": 156036, "epoch": 3715} {"train_loss": -6.939958095550537, "global_step": 156037, "epoch": 3715} {"train_loss": -6.827075004577637, "global_step": 156038, "epoch": 3715} {"train_loss": -6.980573654174805, "global_step": 156039, "epoch": 3715} {"train_loss": -6.966291427612305, "global_step": 156040, "epoch": 3715} {"train_loss": -6.804135322570801, "global_step": 156041, "epoch": 3715} {"train_loss": -6.933658123016357, "global_step": 156042, "epoch": 3715} {"train_loss": -6.822159767150879, "global_step": 156043, "epoch": 3715} {"train_loss": -6.919345855712891, "global_step": 156044, "epoch": 3715} {"train_loss": -6.760024070739746, "global_step": 156045, "epoch": 3715} {"train_loss": -6.753848075866699, "global_step": 156046, "epoch": 3715} {"train_loss": -6.814678192138672, "global_step": 156047, "epoch": 3715} {"train_loss": -6.6915130615234375, "global_step": 156048, "epoch": 3715} {"train_loss": -6.680731773376465, "global_step": 156049, "epoch": 3715} {"train_loss": -6.915249347686768, "global_step": 156050, "epoch": 3715} {"train_loss": -6.7932939529418945, "global_step": 156051, "epoch": 3715} {"train_loss": -6.827732086181641, "global_step": 156052, "epoch": 3715} {"train_loss": -6.808563232421875, "global_step": 156053, "epoch": 3715} {"train_loss": -6.795083522796631, "global_step": 156054, "epoch": 3715} {"train_loss": -6.910823822021484, "global_step": 156055, "epoch": 3715} {"train_loss": -6.910282135009766, "global_step": 156056, "epoch": 3715} {"train_loss": -6.712884902954102, "global_step": 156057, "epoch": 3715} {"train_loss": -6.789589881896973, "global_step": 156058, "epoch": 3715} {"train_loss": -6.741361618041992, "global_step": 156059, "epoch": 3715} {"train_loss": -6.844367027282715, "global_step": 156060, "epoch": 3715} {"train_loss": -6.744734287261963, "global_step": 156061, "epoch": 3715} {"train_loss": -6.711981773376465, "global_step": 156062, "epoch": 3715} {"train_loss": -6.9333648681640625, "global_step": 156063, "epoch": 3715} {"train_loss": -6.619267463684082, "global_step": 156064, "epoch": 3715} {"train_loss": -6.874858379364014, "global_step": 156065, "epoch": 3715} {"train_loss": -6.848443031311035, "global_step": 156066, "epoch": 3715} {"train_loss": -6.842889308929443, "global_step": 156067, "epoch": 3715} {"train_loss": -6.828494071960449, "global_step": 156068, "epoch": 3715} {"train_loss": -6.668454170227051, "global_step": 156069, "epoch": 3715} {"train_loss": -6.791342258453369, "global_step": 156070, "epoch": 3715} {"train_loss": -6.831036817459833, "global_step": 156071, "epoch": 3715, "val_loss": 68568.3671875} {"train_loss": -6.751104354858398, "global_step": 156072, "epoch": 3716} {"train_loss": -6.675866603851318, "global_step": 156073, "epoch": 3716} {"train_loss": -6.750617027282715, "global_step": 156074, "epoch": 3716} {"train_loss": -6.750180244445801, "global_step": 156075, "epoch": 3716} {"train_loss": -6.640826225280762, "global_step": 156076, "epoch": 3716} {"train_loss": -6.861446380615234, "global_step": 156077, "epoch": 3716} {"train_loss": -6.741385459899902, "global_step": 156078, "epoch": 3716} {"train_loss": -6.841176509857178, "global_step": 156079, "epoch": 3716} {"train_loss": -6.815235614776611, "global_step": 156080, "epoch": 3716} {"train_loss": -6.6857500076293945, "global_step": 156081, "epoch": 3716} {"train_loss": -6.761316776275635, "global_step": 156082, "epoch": 3716} {"train_loss": -6.615975379943848, "global_step": 156083, "epoch": 3716} {"train_loss": -6.7610883712768555, "global_step": 156084, "epoch": 3716} {"train_loss": -6.664657115936279, "global_step": 156085, "epoch": 3716} {"train_loss": -6.706382751464844, "global_step": 156086, "epoch": 3716} {"train_loss": -6.846512794494629, "global_step": 156087, "epoch": 3716} {"train_loss": -6.722284317016602, "global_step": 156088, "epoch": 3716} {"train_loss": -6.77001953125, "global_step": 156089, "epoch": 3716} {"train_loss": -6.8248090744018555, "global_step": 156090, "epoch": 3716} {"train_loss": -6.759711265563965, "global_step": 156091, "epoch": 3716} {"train_loss": -6.6607279777526855, "global_step": 156092, "epoch": 3716} {"train_loss": -6.829127311706543, "global_step": 156093, "epoch": 3716} {"train_loss": -6.755634307861328, "global_step": 156094, "epoch": 3716} {"train_loss": -6.809020519256592, "global_step": 156095, "epoch": 3716} {"train_loss": -6.815418720245361, "global_step": 156096, "epoch": 3716} {"train_loss": -6.799955368041992, "global_step": 156097, "epoch": 3716} {"train_loss": -6.893930435180664, "global_step": 156098, "epoch": 3716} {"train_loss": -6.7980427742004395, "global_step": 156099, "epoch": 3716} {"train_loss": -6.79036808013916, "global_step": 156100, "epoch": 3716} {"train_loss": -6.938368320465088, "global_step": 156101, "epoch": 3716} {"train_loss": -6.808127403259277, "global_step": 156102, "epoch": 3716} {"train_loss": -6.860493183135986, "global_step": 156103, "epoch": 3716} {"train_loss": -6.88311767578125, "global_step": 156104, "epoch": 3716} {"train_loss": -6.854936599731445, "global_step": 156105, "epoch": 3716} {"train_loss": -6.755873680114746, "global_step": 156106, "epoch": 3716} {"train_loss": -6.970524311065674, "global_step": 156107, "epoch": 3716} {"train_loss": -6.823605537414551, "global_step": 156108, "epoch": 3716} {"train_loss": -6.875338554382324, "global_step": 156109, "epoch": 3716} {"train_loss": -6.937404155731201, "global_step": 156110, "epoch": 3716} {"train_loss": -7.0118842124938965, "global_step": 156111, "epoch": 3716} {"train_loss": -6.864406585693359, "global_step": 156112, "epoch": 3716} {"train_loss": -6.798937377475557, "global_step": 156113, "epoch": 3716, "val_loss": 68568.265625} {"train_loss": -6.796356201171875, "global_step": 156114, "epoch": 3717} {"train_loss": -6.90120792388916, "global_step": 156115, "epoch": 3717} {"train_loss": -6.819249153137207, "global_step": 156116, "epoch": 3717} {"train_loss": -6.923013687133789, "global_step": 156117, "epoch": 3717} {"train_loss": -6.974195957183838, "global_step": 156118, "epoch": 3717} {"train_loss": -6.872565269470215, "global_step": 156119, "epoch": 3717} {"train_loss": -6.935723781585693, "global_step": 156120, "epoch": 3717} {"train_loss": -6.793789863586426, "global_step": 156121, "epoch": 3717} {"train_loss": -6.690520286560059, "global_step": 156122, "epoch": 3717} {"train_loss": -6.909843444824219, "global_step": 156123, "epoch": 3717} {"train_loss": -6.797477722167969, "global_step": 156124, "epoch": 3717} {"train_loss": -6.8686957359313965, "global_step": 156125, "epoch": 3717} {"train_loss": -6.914691925048828, "global_step": 156126, "epoch": 3717} {"train_loss": -6.80919075012207, "global_step": 156127, "epoch": 3717} {"train_loss": -6.899271011352539, "global_step": 156128, "epoch": 3717} {"train_loss": -6.852791786193848, "global_step": 156129, "epoch": 3717} {"train_loss": -6.7708330154418945, "global_step": 156130, "epoch": 3717} {"train_loss": -6.97405481338501, "global_step": 156131, "epoch": 3717} {"train_loss": -6.7818450927734375, "global_step": 156132, "epoch": 3717} {"train_loss": -6.703622817993164, "global_step": 156133, "epoch": 3717} {"train_loss": -6.854828357696533, "global_step": 156134, "epoch": 3717} {"train_loss": -6.760702133178711, "global_step": 156135, "epoch": 3717} {"train_loss": -6.845283508300781, "global_step": 156136, "epoch": 3717} {"train_loss": -6.7881388664245605, "global_step": 156137, "epoch": 3717} {"train_loss": -6.838276386260986, "global_step": 156138, "epoch": 3717} {"train_loss": -6.751599311828613, "global_step": 156139, "epoch": 3717} {"train_loss": -6.762808799743652, "global_step": 156140, "epoch": 3717} {"train_loss": -6.764349937438965, "global_step": 156141, "epoch": 3717} {"train_loss": -6.854952812194824, "global_step": 156142, "epoch": 3717} {"train_loss": -6.88793420791626, "global_step": 156143, "epoch": 3717} {"train_loss": -6.882846832275391, "global_step": 156144, "epoch": 3717} {"train_loss": -6.841256618499756, "global_step": 156145, "epoch": 3717} {"train_loss": -6.831001281738281, "global_step": 156146, "epoch": 3717} {"train_loss": -6.853271961212158, "global_step": 156147, "epoch": 3717} {"train_loss": -6.8652262687683105, "global_step": 156148, "epoch": 3717} {"train_loss": -6.7938103675842285, "global_step": 156149, "epoch": 3717} {"train_loss": -6.759840488433838, "global_step": 156150, "epoch": 3717} {"train_loss": -6.825319290161133, "global_step": 156151, "epoch": 3717} {"train_loss": -6.761086463928223, "global_step": 156152, "epoch": 3717} {"train_loss": -6.825448513031006, "global_step": 156153, "epoch": 3717} {"train_loss": -6.844668388366699, "global_step": 156154, "epoch": 3717} {"train_loss": -6.8329866500127885, "global_step": 156155, "epoch": 3717, "val_loss": 68487.4375} {"train_loss": -6.935822486877441, "global_step": 156156, "epoch": 3718} {"train_loss": -6.909478664398193, "global_step": 156157, "epoch": 3718} {"train_loss": -6.858254432678223, "global_step": 156158, "epoch": 3718} {"train_loss": -6.860583305358887, "global_step": 156159, "epoch": 3718} {"train_loss": -6.763798236846924, "global_step": 156160, "epoch": 3718} {"train_loss": -6.853754043579102, "global_step": 156161, "epoch": 3718} {"train_loss": -6.882312774658203, "global_step": 156162, "epoch": 3718} {"train_loss": -6.867171287536621, "global_step": 156163, "epoch": 3718} {"train_loss": -6.7746477127075195, "global_step": 156164, "epoch": 3718} {"train_loss": -6.8678669929504395, "global_step": 156165, "epoch": 3718} {"train_loss": -6.91433048248291, "global_step": 156166, "epoch": 3718} {"train_loss": -6.8496246337890625, "global_step": 156167, "epoch": 3718} {"train_loss": -6.678667068481445, "global_step": 156168, "epoch": 3718} {"train_loss": -6.938048362731934, "global_step": 156169, "epoch": 3718} {"train_loss": -6.925100326538086, "global_step": 156170, "epoch": 3718} {"train_loss": -6.8810625076293945, "global_step": 156171, "epoch": 3718} {"train_loss": -6.861312389373779, "global_step": 156172, "epoch": 3718} {"train_loss": -6.77106237411499, "global_step": 156173, "epoch": 3718} {"train_loss": -6.851968288421631, "global_step": 156174, "epoch": 3718} {"train_loss": -6.797513961791992, "global_step": 156175, "epoch": 3718} {"train_loss": -6.881227493286133, "global_step": 156176, "epoch": 3718} {"train_loss": -6.8767852783203125, "global_step": 156177, "epoch": 3718} {"train_loss": -6.943845272064209, "global_step": 156178, "epoch": 3718} {"train_loss": -6.984811782836914, "global_step": 156179, "epoch": 3718} {"train_loss": -7.006686687469482, "global_step": 156180, "epoch": 3718} {"train_loss": -6.935084342956543, "global_step": 156181, "epoch": 3718} {"train_loss": -6.881811141967773, "global_step": 156182, "epoch": 3718} {"train_loss": -6.94137716293335, "global_step": 156183, "epoch": 3718} {"train_loss": -6.912712574005127, "global_step": 156184, "epoch": 3718} {"train_loss": -6.785650253295898, "global_step": 156185, "epoch": 3718} {"train_loss": -6.9548516273498535, "global_step": 156186, "epoch": 3718} {"train_loss": -6.9481353759765625, "global_step": 156187, "epoch": 3718} {"train_loss": -6.953660488128662, "global_step": 156188, "epoch": 3718} {"train_loss": -6.861146450042725, "global_step": 156189, "epoch": 3718} {"train_loss": -6.873798847198486, "global_step": 156190, "epoch": 3718} {"train_loss": -6.843877792358398, "global_step": 156191, "epoch": 3718} {"train_loss": -6.8417487144470215, "global_step": 156192, "epoch": 3718} {"train_loss": -6.854231834411621, "global_step": 156193, "epoch": 3718} {"train_loss": -6.895002365112305, "global_step": 156194, "epoch": 3718} {"train_loss": -6.874851226806641, "global_step": 156195, "epoch": 3718} {"train_loss": -6.891237735748291, "global_step": 156196, "epoch": 3718} {"train_loss": -6.878937914257958, "global_step": 156197, "epoch": 3718, "val_loss": 68567.4453125} {"train_loss": -6.863770484924316, "global_step": 156198, "epoch": 3719} {"train_loss": -6.858932971954346, "global_step": 156199, "epoch": 3719} {"train_loss": -6.8407816886901855, "global_step": 156200, "epoch": 3719} {"train_loss": -6.817095756530762, "global_step": 156201, "epoch": 3719} {"train_loss": -6.8139190673828125, "global_step": 156202, "epoch": 3719} {"train_loss": -6.696285247802734, "global_step": 156203, "epoch": 3719} {"train_loss": -6.935873031616211, "global_step": 156204, "epoch": 3719} {"train_loss": -6.979109287261963, "global_step": 156205, "epoch": 3719} {"train_loss": -6.79292631149292, "global_step": 156206, "epoch": 3719} {"train_loss": -6.908156394958496, "global_step": 156207, "epoch": 3719} {"train_loss": -6.751981735229492, "global_step": 156208, "epoch": 3719} {"train_loss": -6.983729362487793, "global_step": 156209, "epoch": 3719} {"train_loss": -6.880398273468018, "global_step": 156210, "epoch": 3719} {"train_loss": -6.866758346557617, "global_step": 156211, "epoch": 3719} {"train_loss": -6.801724433898926, "global_step": 156212, "epoch": 3719} {"train_loss": -6.9266486167907715, "global_step": 156213, "epoch": 3719} {"train_loss": -6.9626383781433105, "global_step": 156214, "epoch": 3719} {"train_loss": -6.964982986450195, "global_step": 156215, "epoch": 3719} {"train_loss": -6.872259140014648, "global_step": 156216, "epoch": 3719} {"train_loss": -6.8983259201049805, "global_step": 156217, "epoch": 3719} {"train_loss": -7.057636260986328, "global_step": 156218, "epoch": 3719} {"train_loss": -6.827374458312988, "global_step": 156219, "epoch": 3719} {"train_loss": -6.958930969238281, "global_step": 156220, "epoch": 3719} {"train_loss": -6.887864112854004, "global_step": 156221, "epoch": 3719} {"train_loss": -6.818063259124756, "global_step": 156222, "epoch": 3719} {"train_loss": -6.852957725524902, "global_step": 156223, "epoch": 3719} {"train_loss": -6.874792098999023, "global_step": 156224, "epoch": 3719} {"train_loss": -6.822348594665527, "global_step": 156225, "epoch": 3719} {"train_loss": -6.874077796936035, "global_step": 156226, "epoch": 3719} {"train_loss": -7.058749198913574, "global_step": 156227, "epoch": 3719} {"train_loss": -6.9232892990112305, "global_step": 156228, "epoch": 3719} {"train_loss": -6.8622565269470215, "global_step": 156229, "epoch": 3719} {"train_loss": -6.808223724365234, "global_step": 156230, "epoch": 3719} {"train_loss": -6.841831207275391, "global_step": 156231, "epoch": 3719} {"train_loss": -6.860913276672363, "global_step": 156232, "epoch": 3719} {"train_loss": -6.878162384033203, "global_step": 156233, "epoch": 3719} {"train_loss": -6.866583824157715, "global_step": 156234, "epoch": 3719} {"train_loss": -6.868659973144531, "global_step": 156235, "epoch": 3719} {"train_loss": -6.884248733520508, "global_step": 156236, "epoch": 3719} {"train_loss": -6.887439250946045, "global_step": 156237, "epoch": 3719} {"train_loss": -6.802472114562988, "global_step": 156238, "epoch": 3719} {"train_loss": -6.873186679113479, "global_step": 156239, "epoch": 3719, "val_loss": 68751.109375} {"train_loss": -6.670053482055664, "global_step": 156240, "epoch": 3720} {"train_loss": -6.785911560058594, "global_step": 156241, "epoch": 3720} {"train_loss": -6.7087202072143555, "global_step": 156242, "epoch": 3720} {"train_loss": -6.895662784576416, "global_step": 156243, "epoch": 3720} {"train_loss": -6.857354164123535, "global_step": 156244, "epoch": 3720} {"train_loss": -6.8565521240234375, "global_step": 156245, "epoch": 3720} {"train_loss": -6.8264055252075195, "global_step": 156246, "epoch": 3720} {"train_loss": -6.918607234954834, "global_step": 156247, "epoch": 3720} {"train_loss": -6.847853660583496, "global_step": 156248, "epoch": 3720} {"train_loss": -6.848939895629883, "global_step": 156249, "epoch": 3720} {"train_loss": -6.909928321838379, "global_step": 156250, "epoch": 3720} {"train_loss": -6.8424577713012695, "global_step": 156251, "epoch": 3720} {"train_loss": -6.9535369873046875, "global_step": 156252, "epoch": 3720} {"train_loss": -6.84877347946167, "global_step": 156253, "epoch": 3720} {"train_loss": -6.699282646179199, "global_step": 156254, "epoch": 3720} {"train_loss": -6.744872570037842, "global_step": 156255, "epoch": 3720} {"train_loss": -6.874843597412109, "global_step": 156256, "epoch": 3720} {"train_loss": -6.926697254180908, "global_step": 156257, "epoch": 3720} {"train_loss": -6.70842981338501, "global_step": 156258, "epoch": 3720} {"train_loss": -6.864354133605957, "global_step": 156259, "epoch": 3720} {"train_loss": -6.922456741333008, "global_step": 156260, "epoch": 3720} {"train_loss": -6.77192497253418, "global_step": 156261, "epoch": 3720} {"train_loss": -6.736512660980225, "global_step": 156262, "epoch": 3720} {"train_loss": -6.899291515350342, "global_step": 156263, "epoch": 3720} {"train_loss": -6.770066261291504, "global_step": 156264, "epoch": 3720} {"train_loss": -6.799960136413574, "global_step": 156265, "epoch": 3720} {"train_loss": -6.829173564910889, "global_step": 156266, "epoch": 3720} {"train_loss": -6.8201470375061035, "global_step": 156267, "epoch": 3720} {"train_loss": -6.787367820739746, "global_step": 156268, "epoch": 3720} {"train_loss": -6.754315376281738, "global_step": 156269, "epoch": 3720} {"train_loss": -6.8159613609313965, "global_step": 156270, "epoch": 3720} {"train_loss": -6.730123519897461, "global_step": 156271, "epoch": 3720} {"train_loss": -6.76666259765625, "global_step": 156272, "epoch": 3720} {"train_loss": -6.902937889099121, "global_step": 156273, "epoch": 3720} {"train_loss": -6.818445682525635, "global_step": 156274, "epoch": 3720} {"train_loss": -6.819063186645508, "global_step": 156275, "epoch": 3720} {"train_loss": -6.786347389221191, "global_step": 156276, "epoch": 3720} {"train_loss": -6.909672260284424, "global_step": 156277, "epoch": 3720} {"train_loss": -6.822455406188965, "global_step": 156278, "epoch": 3720} {"train_loss": -6.826286315917969, "global_step": 156279, "epoch": 3720} {"train_loss": -6.78336238861084, "global_step": 156280, "epoch": 3720} {"train_loss": -6.823638416471935, "global_step": 156281, "epoch": 3720, "val_loss": 68595.34375} {"train_loss": -6.950472354888916, "global_step": 156282, "epoch": 3721} {"train_loss": -6.924174785614014, "global_step": 156283, "epoch": 3721} {"train_loss": -6.816998481750488, "global_step": 156284, "epoch": 3721} {"train_loss": -6.889758586883545, "global_step": 156285, "epoch": 3721} {"train_loss": -6.659797191619873, "global_step": 156286, "epoch": 3721} {"train_loss": -6.87699031829834, "global_step": 156287, "epoch": 3721} {"train_loss": -6.705703258514404, "global_step": 156288, "epoch": 3721} {"train_loss": -6.877683639526367, "global_step": 156289, "epoch": 3721} {"train_loss": -6.782004356384277, "global_step": 156290, "epoch": 3721} {"train_loss": -6.928161144256592, "global_step": 156291, "epoch": 3721} {"train_loss": -6.8576555252075195, "global_step": 156292, "epoch": 3721} {"train_loss": -6.813484191894531, "global_step": 156293, "epoch": 3721} {"train_loss": -6.7107977867126465, "global_step": 156294, "epoch": 3721} {"train_loss": -6.8570942878723145, "global_step": 156295, "epoch": 3721} {"train_loss": -6.672023773193359, "global_step": 156296, "epoch": 3721} {"train_loss": -6.698916435241699, "global_step": 156297, "epoch": 3721} {"train_loss": -6.8631978034973145, "global_step": 156298, "epoch": 3721} {"train_loss": -6.794217109680176, "global_step": 156299, "epoch": 3721} {"train_loss": -6.839364051818848, "global_step": 156300, "epoch": 3721} {"train_loss": -6.9714202880859375, "global_step": 156301, "epoch": 3721} {"train_loss": -6.710324287414551, "global_step": 156302, "epoch": 3721} {"train_loss": -6.862483978271484, "global_step": 156303, "epoch": 3721} {"train_loss": -6.7403244972229, "global_step": 156304, "epoch": 3721} {"train_loss": -6.7749128341674805, "global_step": 156305, "epoch": 3721} {"train_loss": -6.9214959144592285, "global_step": 156306, "epoch": 3721} {"train_loss": -6.734386444091797, "global_step": 156307, "epoch": 3721} {"train_loss": -6.913073539733887, "global_step": 156308, "epoch": 3721} {"train_loss": -6.933697700500488, "global_step": 156309, "epoch": 3721} {"train_loss": -6.833783149719238, "global_step": 156310, "epoch": 3721} {"train_loss": -6.870542526245117, "global_step": 156311, "epoch": 3721} {"train_loss": -6.885429382324219, "global_step": 156312, "epoch": 3721} {"train_loss": -6.784285068511963, "global_step": 156313, "epoch": 3721} {"train_loss": -6.8016180992126465, "global_step": 156314, "epoch": 3721} {"train_loss": -6.923903465270996, "global_step": 156315, "epoch": 3721} {"train_loss": -6.796389579772949, "global_step": 156316, "epoch": 3721} {"train_loss": -6.773245811462402, "global_step": 156317, "epoch": 3721} {"train_loss": -6.794390678405762, "global_step": 156318, "epoch": 3721} {"train_loss": -6.8423919677734375, "global_step": 156319, "epoch": 3721} {"train_loss": -6.966699600219727, "global_step": 156320, "epoch": 3721} {"train_loss": -6.758033752441406, "global_step": 156321, "epoch": 3721} {"train_loss": -6.93809175491333, "global_step": 156322, "epoch": 3721} {"train_loss": -6.83240845089867, "global_step": 156323, "epoch": 3721, "val_loss": 68455.046875} {"train_loss": -6.855462074279785, "global_step": 156324, "epoch": 3722} {"train_loss": -6.995109558105469, "global_step": 156325, "epoch": 3722} {"train_loss": -6.978973388671875, "global_step": 156326, "epoch": 3722} {"train_loss": -6.847731590270996, "global_step": 156327, "epoch": 3722} {"train_loss": -6.966053009033203, "global_step": 156328, "epoch": 3722} {"train_loss": -6.95377254486084, "global_step": 156329, "epoch": 3722} {"train_loss": -6.877913475036621, "global_step": 156330, "epoch": 3722} {"train_loss": -6.906660556793213, "global_step": 156331, "epoch": 3722} {"train_loss": -6.921160697937012, "global_step": 156332, "epoch": 3722} {"train_loss": -6.885430335998535, "global_step": 156333, "epoch": 3722} {"train_loss": -6.848928451538086, "global_step": 156334, "epoch": 3722} {"train_loss": -6.951391220092773, "global_step": 156335, "epoch": 3722} {"train_loss": -6.842769622802734, "global_step": 156336, "epoch": 3722} {"train_loss": -6.908355236053467, "global_step": 156337, "epoch": 3722} {"train_loss": -6.919392108917236, "global_step": 156338, "epoch": 3722} {"train_loss": -6.821883678436279, "global_step": 156339, "epoch": 3722} {"train_loss": -6.776248931884766, "global_step": 156340, "epoch": 3722} {"train_loss": -6.855323791503906, "global_step": 156341, "epoch": 3722} {"train_loss": -6.835988998413086, "global_step": 156342, "epoch": 3722} {"train_loss": -6.900522232055664, "global_step": 156343, "epoch": 3722} {"train_loss": -6.891170024871826, "global_step": 156344, "epoch": 3722} {"train_loss": -6.889528751373291, "global_step": 156345, "epoch": 3722} {"train_loss": -6.886368751525879, "global_step": 156346, "epoch": 3722} {"train_loss": -6.865140914916992, "global_step": 156347, "epoch": 3722} {"train_loss": -6.826299667358398, "global_step": 156348, "epoch": 3722} {"train_loss": -6.782071113586426, "global_step": 156349, "epoch": 3722} {"train_loss": -6.901665687561035, "global_step": 156350, "epoch": 3722} {"train_loss": -6.795775413513184, "global_step": 156351, "epoch": 3722} {"train_loss": -6.864864826202393, "global_step": 156352, "epoch": 3722} {"train_loss": -6.835119247436523, "global_step": 156353, "epoch": 3722} {"train_loss": -6.787482738494873, "global_step": 156354, "epoch": 3722} {"train_loss": -6.82169246673584, "global_step": 156355, "epoch": 3722} {"train_loss": -6.698724746704102, "global_step": 156356, "epoch": 3722} {"train_loss": -6.89735746383667, "global_step": 156357, "epoch": 3722} {"train_loss": -6.898135185241699, "global_step": 156358, "epoch": 3722} {"train_loss": -6.791666030883789, "global_step": 156359, "epoch": 3722} {"train_loss": -6.824021816253662, "global_step": 156360, "epoch": 3722} {"train_loss": -6.879306793212891, "global_step": 156361, "epoch": 3722} {"train_loss": -6.849010467529297, "global_step": 156362, "epoch": 3722} {"train_loss": -6.951777458190918, "global_step": 156363, "epoch": 3722} {"train_loss": -6.812756061553955, "global_step": 156364, "epoch": 3722} {"train_loss": -6.86700237364996, "global_step": 156365, "epoch": 3722, "val_loss": 68594.4921875} {"train_loss": -6.808455944061279, "global_step": 156366, "epoch": 3723} {"train_loss": -6.965673923492432, "global_step": 156367, "epoch": 3723} {"train_loss": -6.842310905456543, "global_step": 156368, "epoch": 3723} {"train_loss": -6.866603374481201, "global_step": 156369, "epoch": 3723} {"train_loss": -6.926390647888184, "global_step": 156370, "epoch": 3723} {"train_loss": -6.905877590179443, "global_step": 156371, "epoch": 3723} {"train_loss": -6.905493259429932, "global_step": 156372, "epoch": 3723} {"train_loss": -6.894186496734619, "global_step": 156373, "epoch": 3723} {"train_loss": -6.905472755432129, "global_step": 156374, "epoch": 3723} {"train_loss": -6.812719821929932, "global_step": 156375, "epoch": 3723} {"train_loss": -6.931446075439453, "global_step": 156376, "epoch": 3723} {"train_loss": -6.943101406097412, "global_step": 156377, "epoch": 3723} {"train_loss": -6.80190372467041, "global_step": 156378, "epoch": 3723} {"train_loss": -6.885812759399414, "global_step": 156379, "epoch": 3723} {"train_loss": -6.922113418579102, "global_step": 156380, "epoch": 3723} {"train_loss": -6.894448757171631, "global_step": 156381, "epoch": 3723} {"train_loss": -6.98582649230957, "global_step": 156382, "epoch": 3723} {"train_loss": -6.844718933105469, "global_step": 156383, "epoch": 3723} {"train_loss": -6.983006954193115, "global_step": 156384, "epoch": 3723} {"train_loss": -6.821574687957764, "global_step": 156385, "epoch": 3723} {"train_loss": -6.912530899047852, "global_step": 156386, "epoch": 3723} {"train_loss": -6.850165367126465, "global_step": 156387, "epoch": 3723} {"train_loss": -6.906847953796387, "global_step": 156388, "epoch": 3723} {"train_loss": -6.799045562744141, "global_step": 156389, "epoch": 3723} {"train_loss": -6.753252983093262, "global_step": 156390, "epoch": 3723} {"train_loss": -6.826423168182373, "global_step": 156391, "epoch": 3723} {"train_loss": -6.782962799072266, "global_step": 156392, "epoch": 3723} {"train_loss": -6.770712852478027, "global_step": 156393, "epoch": 3723} {"train_loss": -6.850725173950195, "global_step": 156394, "epoch": 3723} {"train_loss": -6.828411102294922, "global_step": 156395, "epoch": 3723} {"train_loss": -6.794145584106445, "global_step": 156396, "epoch": 3723} {"train_loss": -6.731874942779541, "global_step": 156397, "epoch": 3723} {"train_loss": -6.728917121887207, "global_step": 156398, "epoch": 3723} {"train_loss": -6.778890609741211, "global_step": 156399, "epoch": 3723} {"train_loss": -6.78184175491333, "global_step": 156400, "epoch": 3723} {"train_loss": -6.667997360229492, "global_step": 156401, "epoch": 3723} {"train_loss": -6.8881354331970215, "global_step": 156402, "epoch": 3723} {"train_loss": -6.741887092590332, "global_step": 156403, "epoch": 3723} {"train_loss": -6.79831600189209, "global_step": 156404, "epoch": 3723} {"train_loss": -6.770445823669434, "global_step": 156405, "epoch": 3723} {"train_loss": -6.700771808624268, "global_step": 156406, "epoch": 3723} {"train_loss": -6.839885700316656, "global_step": 156407, "epoch": 3723, "val_loss": 68788.6015625} {"train_loss": -6.80800199508667, "global_step": 156408, "epoch": 3724} {"train_loss": -6.762058258056641, "global_step": 156409, "epoch": 3724} {"train_loss": -6.648135185241699, "global_step": 156410, "epoch": 3724} {"train_loss": -6.667210102081299, "global_step": 156411, "epoch": 3724} {"train_loss": -6.8432159423828125, "global_step": 156412, "epoch": 3724} {"train_loss": -6.746100902557373, "global_step": 156413, "epoch": 3724} {"train_loss": -6.764705657958984, "global_step": 156414, "epoch": 3724} {"train_loss": -6.882368087768555, "global_step": 156415, "epoch": 3724} {"train_loss": -6.686542987823486, "global_step": 156416, "epoch": 3724} {"train_loss": -6.831549644470215, "global_step": 156417, "epoch": 3724} {"train_loss": -6.854039192199707, "global_step": 156418, "epoch": 3724} {"train_loss": -6.82097053527832, "global_step": 156419, "epoch": 3724} {"train_loss": -6.890570640563965, "global_step": 156420, "epoch": 3724} {"train_loss": -6.716248989105225, "global_step": 156421, "epoch": 3724} {"train_loss": -6.8625898361206055, "global_step": 156422, "epoch": 3724} {"train_loss": -6.88653039932251, "global_step": 156423, "epoch": 3724} {"train_loss": -6.800019264221191, "global_step": 156424, "epoch": 3724} {"train_loss": -6.892156600952148, "global_step": 156425, "epoch": 3724} {"train_loss": -6.934678077697754, "global_step": 156426, "epoch": 3724} {"train_loss": -6.859339237213135, "global_step": 156427, "epoch": 3724} {"train_loss": -6.967452049255371, "global_step": 156428, "epoch": 3724} {"train_loss": -6.91956901550293, "global_step": 156429, "epoch": 3724} {"train_loss": -6.822850227355957, "global_step": 156430, "epoch": 3724} {"train_loss": -6.937020778656006, "global_step": 156431, "epoch": 3724} {"train_loss": -6.904592037200928, "global_step": 156432, "epoch": 3724} {"train_loss": -6.998595714569092, "global_step": 156433, "epoch": 3724} {"train_loss": -6.8771281242370605, "global_step": 156434, "epoch": 3724} {"train_loss": -6.828424453735352, "global_step": 156435, "epoch": 3724} {"train_loss": -6.895374298095703, "global_step": 156436, "epoch": 3724} {"train_loss": -6.943398475646973, "global_step": 156437, "epoch": 3724} {"train_loss": -6.97963285446167, "global_step": 156438, "epoch": 3724} {"train_loss": -6.944626331329346, "global_step": 156439, "epoch": 3724} {"train_loss": -6.935423851013184, "global_step": 156440, "epoch": 3724} {"train_loss": -6.887441635131836, "global_step": 156441, "epoch": 3724} {"train_loss": -6.896883010864258, "global_step": 156442, "epoch": 3724} {"train_loss": -6.807552337646484, "global_step": 156443, "epoch": 3724} {"train_loss": -6.91145133972168, "global_step": 156444, "epoch": 3724} {"train_loss": -6.814629554748535, "global_step": 156445, "epoch": 3724} {"train_loss": -6.800479888916016, "global_step": 156446, "epoch": 3724} {"train_loss": -6.971746444702148, "global_step": 156447, "epoch": 3724} {"train_loss": -6.804716110229492, "global_step": 156448, "epoch": 3724} {"train_loss": -6.852999312537057, "global_step": 156449, "epoch": 3724, "val_loss": 68521.1640625} {"train_loss": -6.93880033493042, "global_step": 156450, "epoch": 3725} {"train_loss": -6.77773380279541, "global_step": 156451, "epoch": 3725} {"train_loss": -6.899304389953613, "global_step": 156452, "epoch": 3725} {"train_loss": -6.796581268310547, "global_step": 156453, "epoch": 3725} {"train_loss": -6.747296333312988, "global_step": 156454, "epoch": 3725} {"train_loss": -6.750457763671875, "global_step": 156455, "epoch": 3725} {"train_loss": -6.839935302734375, "global_step": 156456, "epoch": 3725} {"train_loss": -6.8358869552612305, "global_step": 156457, "epoch": 3725} {"train_loss": -6.770999908447266, "global_step": 156458, "epoch": 3725} {"train_loss": -6.888546943664551, "global_step": 156459, "epoch": 3725} {"train_loss": -6.91202449798584, "global_step": 156460, "epoch": 3725} {"train_loss": -6.861242294311523, "global_step": 156461, "epoch": 3725} {"train_loss": -6.88743782043457, "global_step": 156462, "epoch": 3725} {"train_loss": -6.83501672744751, "global_step": 156463, "epoch": 3725} {"train_loss": -6.80342960357666, "global_step": 156464, "epoch": 3725} {"train_loss": -6.839616298675537, "global_step": 156465, "epoch": 3725} {"train_loss": -6.7932281494140625, "global_step": 156466, "epoch": 3725} {"train_loss": -6.863736152648926, "global_step": 156467, "epoch": 3725} {"train_loss": -6.829422473907471, "global_step": 156468, "epoch": 3725} {"train_loss": -6.924369812011719, "global_step": 156469, "epoch": 3725} {"train_loss": -6.878735065460205, "global_step": 156470, "epoch": 3725} {"train_loss": -6.918292999267578, "global_step": 156471, "epoch": 3725} {"train_loss": -6.798676490783691, "global_step": 156472, "epoch": 3725} {"train_loss": -6.8803300857543945, "global_step": 156473, "epoch": 3725} {"train_loss": -6.900825500488281, "global_step": 156474, "epoch": 3725} {"train_loss": -6.877735614776611, "global_step": 156475, "epoch": 3725} {"train_loss": -6.851062297821045, "global_step": 156476, "epoch": 3725} {"train_loss": -6.948931694030762, "global_step": 156477, "epoch": 3725} {"train_loss": -6.711947441101074, "global_step": 156478, "epoch": 3725} {"train_loss": -6.844989776611328, "global_step": 156479, "epoch": 3725} {"train_loss": -6.8616204261779785, "global_step": 156480, "epoch": 3725} {"train_loss": -6.7243194580078125, "global_step": 156481, "epoch": 3725} {"train_loss": -6.719274520874023, "global_step": 156482, "epoch": 3725} {"train_loss": -6.82090950012207, "global_step": 156483, "epoch": 3725} {"train_loss": -6.76839542388916, "global_step": 156484, "epoch": 3725} {"train_loss": -6.873618125915527, "global_step": 156485, "epoch": 3725} {"train_loss": -6.847917556762695, "global_step": 156486, "epoch": 3725} {"train_loss": -6.659717559814453, "global_step": 156487, "epoch": 3725} {"train_loss": -6.789856910705566, "global_step": 156488, "epoch": 3725} {"train_loss": -6.82997989654541, "global_step": 156489, "epoch": 3725} {"train_loss": -6.769205570220947, "global_step": 156490, "epoch": 3725} {"train_loss": -6.8309487501780195, "global_step": 156491, "epoch": 3725, "val_loss": 68753.265625} {"train_loss": -6.854103088378906, "global_step": 156492, "epoch": 3726} {"train_loss": -6.830325126647949, "global_step": 156493, "epoch": 3726} {"train_loss": -6.925082206726074, "global_step": 156494, "epoch": 3726} {"train_loss": -6.691667556762695, "global_step": 156495, "epoch": 3726} {"train_loss": -6.882384300231934, "global_step": 156496, "epoch": 3726} {"train_loss": -6.891213417053223, "global_step": 156497, "epoch": 3726} {"train_loss": -6.80937385559082, "global_step": 156498, "epoch": 3726} {"train_loss": -6.876445770263672, "global_step": 156499, "epoch": 3726} {"train_loss": -6.779412746429443, "global_step": 156500, "epoch": 3726} {"train_loss": -6.920751571655273, "global_step": 156501, "epoch": 3726} {"train_loss": -6.882899284362793, "global_step": 156502, "epoch": 3726} {"train_loss": -6.829801559448242, "global_step": 156503, "epoch": 3726} {"train_loss": -6.971769332885742, "global_step": 156504, "epoch": 3726} {"train_loss": -6.805472373962402, "global_step": 156505, "epoch": 3726} {"train_loss": -6.7750349044799805, "global_step": 156506, "epoch": 3726} {"train_loss": -6.7829694747924805, "global_step": 156507, "epoch": 3726} {"train_loss": -6.867984771728516, "global_step": 156508, "epoch": 3726} {"train_loss": -6.831459045410156, "global_step": 156509, "epoch": 3726} {"train_loss": -6.825674533843994, "global_step": 156510, "epoch": 3726} {"train_loss": -6.925685882568359, "global_step": 156511, "epoch": 3726} {"train_loss": -6.892116546630859, "global_step": 156512, "epoch": 3726} {"train_loss": -6.961837291717529, "global_step": 156513, "epoch": 3726} {"train_loss": -6.821145057678223, "global_step": 156514, "epoch": 3726} {"train_loss": -6.902135372161865, "global_step": 156515, "epoch": 3726} {"train_loss": -6.802961349487305, "global_step": 156516, "epoch": 3726} {"train_loss": -6.826413154602051, "global_step": 156517, "epoch": 3726} {"train_loss": -6.897610664367676, "global_step": 156518, "epoch": 3726} {"train_loss": -6.797198295593262, "global_step": 156519, "epoch": 3726} {"train_loss": -6.959297180175781, "global_step": 156520, "epoch": 3726} {"train_loss": -6.839949607849121, "global_step": 156521, "epoch": 3726} {"train_loss": -6.873028755187988, "global_step": 156522, "epoch": 3726} {"train_loss": -6.767333030700684, "global_step": 156523, "epoch": 3726} {"train_loss": -6.824388027191162, "global_step": 156524, "epoch": 3726} {"train_loss": -6.912992477416992, "global_step": 156525, "epoch": 3726} {"train_loss": -6.8206024169921875, "global_step": 156526, "epoch": 3726} {"train_loss": -6.876893520355225, "global_step": 156527, "epoch": 3726} {"train_loss": -6.800731658935547, "global_step": 156528, "epoch": 3726} {"train_loss": -6.825619220733643, "global_step": 156529, "epoch": 3726} {"train_loss": -6.818621635437012, "global_step": 156530, "epoch": 3726} {"train_loss": -6.782304763793945, "global_step": 156531, "epoch": 3726} {"train_loss": -6.894915580749512, "global_step": 156532, "epoch": 3726} {"train_loss": -6.851694867724464, "global_step": 156533, "epoch": 3726, "val_loss": 68502.84375} {"train_loss": -6.827889442443848, "global_step": 156534, "epoch": 3727} {"train_loss": -6.986503601074219, "global_step": 156535, "epoch": 3727} {"train_loss": -6.917783737182617, "global_step": 156536, "epoch": 3727} {"train_loss": -6.886639595031738, "global_step": 156537, "epoch": 3727} {"train_loss": -7.059595108032227, "global_step": 156538, "epoch": 3727} {"train_loss": -6.873099327087402, "global_step": 156539, "epoch": 3727} {"train_loss": -6.944083213806152, "global_step": 156540, "epoch": 3727} {"train_loss": -6.825225830078125, "global_step": 156541, "epoch": 3727} {"train_loss": -6.800251007080078, "global_step": 156542, "epoch": 3727} {"train_loss": -6.694979190826416, "global_step": 156543, "epoch": 3727} {"train_loss": -6.883829116821289, "global_step": 156544, "epoch": 3727} {"train_loss": -6.7166361808776855, "global_step": 156545, "epoch": 3727} {"train_loss": -6.898319721221924, "global_step": 156546, "epoch": 3727} {"train_loss": -6.750240325927734, "global_step": 156547, "epoch": 3727} {"train_loss": -6.8070549964904785, "global_step": 156548, "epoch": 3727} {"train_loss": -6.918607711791992, "global_step": 156549, "epoch": 3727} {"train_loss": -6.755934715270996, "global_step": 156550, "epoch": 3727} {"train_loss": -6.780710697174072, "global_step": 156551, "epoch": 3727} {"train_loss": -6.819431781768799, "global_step": 156552, "epoch": 3727} {"train_loss": -6.9122161865234375, "global_step": 156553, "epoch": 3727} {"train_loss": -6.756042003631592, "global_step": 156554, "epoch": 3727} {"train_loss": -6.850434303283691, "global_step": 156555, "epoch": 3727} {"train_loss": -6.852688312530518, "global_step": 156556, "epoch": 3727} {"train_loss": -6.833746433258057, "global_step": 156557, "epoch": 3727} {"train_loss": -6.749092102050781, "global_step": 156558, "epoch": 3727} {"train_loss": -6.987561225891113, "global_step": 156559, "epoch": 3727} {"train_loss": -6.861030578613281, "global_step": 156560, "epoch": 3727} {"train_loss": -6.833968639373779, "global_step": 156561, "epoch": 3727} {"train_loss": -6.869651794433594, "global_step": 156562, "epoch": 3727} {"train_loss": -6.855257987976074, "global_step": 156563, "epoch": 3727} {"train_loss": -6.881373405456543, "global_step": 156564, "epoch": 3727} {"train_loss": -6.871659278869629, "global_step": 156565, "epoch": 3727} {"train_loss": -6.912137031555176, "global_step": 156566, "epoch": 3727} {"train_loss": -6.94975471496582, "global_step": 156567, "epoch": 3727} {"train_loss": -6.941562652587891, "global_step": 156568, "epoch": 3727} {"train_loss": -6.9167914390563965, "global_step": 156569, "epoch": 3727} {"train_loss": -6.945497512817383, "global_step": 156570, "epoch": 3727} {"train_loss": -6.825626373291016, "global_step": 156571, "epoch": 3727} {"train_loss": -6.7544097900390625, "global_step": 156572, "epoch": 3727} {"train_loss": -6.942171096801758, "global_step": 156573, "epoch": 3727} {"train_loss": -6.833291530609131, "global_step": 156574, "epoch": 3727} {"train_loss": -6.862025306338356, "global_step": 156575, "epoch": 3727, "val_loss": 68482.4375} {"train_loss": -6.82990837097168, "global_step": 156576, "epoch": 3728} {"train_loss": -6.980669021606445, "global_step": 156577, "epoch": 3728} {"train_loss": -6.988819599151611, "global_step": 156578, "epoch": 3728} {"train_loss": -6.940147876739502, "global_step": 156579, "epoch": 3728} {"train_loss": -6.848944664001465, "global_step": 156580, "epoch": 3728} {"train_loss": -6.766453742980957, "global_step": 156581, "epoch": 3728} {"train_loss": -6.853752136230469, "global_step": 156582, "epoch": 3728} {"train_loss": -6.961982250213623, "global_step": 156583, "epoch": 3728} {"train_loss": -6.877661228179932, "global_step": 156584, "epoch": 3728} {"train_loss": -7.014824867248535, "global_step": 156585, "epoch": 3728} {"train_loss": -6.979625701904297, "global_step": 156586, "epoch": 3728} {"train_loss": -6.856414794921875, "global_step": 156587, "epoch": 3728} {"train_loss": -6.886322975158691, "global_step": 156588, "epoch": 3728} {"train_loss": -7.024587631225586, "global_step": 156589, "epoch": 3728} {"train_loss": -6.963146209716797, "global_step": 156590, "epoch": 3728} {"train_loss": -6.8739728927612305, "global_step": 156591, "epoch": 3728} {"train_loss": -6.927159786224365, "global_step": 156592, "epoch": 3728} {"train_loss": -6.8795881271362305, "global_step": 156593, "epoch": 3728} {"train_loss": -6.973523139953613, "global_step": 156594, "epoch": 3728} {"train_loss": -6.962089538574219, "global_step": 156595, "epoch": 3728} {"train_loss": -6.903446197509766, "global_step": 156596, "epoch": 3728} {"train_loss": -6.9480881690979, "global_step": 156597, "epoch": 3728} {"train_loss": -6.946807861328125, "global_step": 156598, "epoch": 3728} {"train_loss": -6.922260284423828, "global_step": 156599, "epoch": 3728} {"train_loss": -6.920844078063965, "global_step": 156600, "epoch": 3728} {"train_loss": -6.852083206176758, "global_step": 156601, "epoch": 3728} {"train_loss": -6.809847354888916, "global_step": 156602, "epoch": 3728} {"train_loss": -6.954568862915039, "global_step": 156603, "epoch": 3728} {"train_loss": -6.8486151695251465, "global_step": 156604, "epoch": 3728} {"train_loss": -6.80399227142334, "global_step": 156605, "epoch": 3728} {"train_loss": -6.7616119384765625, "global_step": 156606, "epoch": 3728} {"train_loss": -6.942551136016846, "global_step": 156607, "epoch": 3728} {"train_loss": -6.9257707595825195, "global_step": 156608, "epoch": 3728} {"train_loss": -6.896386623382568, "global_step": 156609, "epoch": 3728} {"train_loss": -6.851835250854492, "global_step": 156610, "epoch": 3728} {"train_loss": -6.836657524108887, "global_step": 156611, "epoch": 3728} {"train_loss": -6.954873561859131, "global_step": 156612, "epoch": 3728} {"train_loss": -6.848950386047363, "global_step": 156613, "epoch": 3728} {"train_loss": -6.963912487030029, "global_step": 156614, "epoch": 3728} {"train_loss": -6.873337745666504, "global_step": 156615, "epoch": 3728} {"train_loss": -6.790706634521484, "global_step": 156616, "epoch": 3728} {"train_loss": -6.900775205521357, "global_step": 156617, "epoch": 3728, "val_loss": 68547.125} {"train_loss": -6.8568525314331055, "global_step": 156618, "epoch": 3729} {"train_loss": -6.779645919799805, "global_step": 156619, "epoch": 3729} {"train_loss": -6.8442840576171875, "global_step": 156620, "epoch": 3729} {"train_loss": -6.90462589263916, "global_step": 156621, "epoch": 3729} {"train_loss": -6.8559489250183105, "global_step": 156622, "epoch": 3729} {"train_loss": -6.934926986694336, "global_step": 156623, "epoch": 3729} {"train_loss": -6.868518352508545, "global_step": 156624, "epoch": 3729} {"train_loss": -6.815062046051025, "global_step": 156625, "epoch": 3729} {"train_loss": -6.824936866760254, "global_step": 156626, "epoch": 3729} {"train_loss": -6.900547504425049, "global_step": 156627, "epoch": 3729} {"train_loss": -6.772518157958984, "global_step": 156628, "epoch": 3729} {"train_loss": -6.905957221984863, "global_step": 156629, "epoch": 3729} {"train_loss": -6.969448089599609, "global_step": 156630, "epoch": 3729} {"train_loss": -6.856605529785156, "global_step": 156631, "epoch": 3729} {"train_loss": -6.799274444580078, "global_step": 156632, "epoch": 3729} {"train_loss": -6.857985973358154, "global_step": 156633, "epoch": 3729} {"train_loss": -6.94610595703125, "global_step": 156634, "epoch": 3729} {"train_loss": -6.841802597045898, "global_step": 156635, "epoch": 3729} {"train_loss": -6.9568352699279785, "global_step": 156636, "epoch": 3729} {"train_loss": -6.92107629776001, "global_step": 156637, "epoch": 3729} {"train_loss": -6.896219253540039, "global_step": 156638, "epoch": 3729} {"train_loss": -6.972332954406738, "global_step": 156639, "epoch": 3729} {"train_loss": -6.878933429718018, "global_step": 156640, "epoch": 3729} {"train_loss": -6.882289886474609, "global_step": 156641, "epoch": 3729} {"train_loss": -6.849045276641846, "global_step": 156642, "epoch": 3729} {"train_loss": -6.79213809967041, "global_step": 156643, "epoch": 3729} {"train_loss": -6.921050548553467, "global_step": 156644, "epoch": 3729} {"train_loss": -6.889799118041992, "global_step": 156645, "epoch": 3729} {"train_loss": -6.8560404777526855, "global_step": 156646, "epoch": 3729} {"train_loss": -7.017841339111328, "global_step": 156647, "epoch": 3729} {"train_loss": -6.945529937744141, "global_step": 156648, "epoch": 3729} {"train_loss": -6.895350456237793, "global_step": 156649, "epoch": 3729} {"train_loss": -6.860347270965576, "global_step": 156650, "epoch": 3729} {"train_loss": -6.932055473327637, "global_step": 156651, "epoch": 3729} {"train_loss": -6.921260833740234, "global_step": 156652, "epoch": 3729} {"train_loss": -6.851796627044678, "global_step": 156653, "epoch": 3729} {"train_loss": -6.939048767089844, "global_step": 156654, "epoch": 3729} {"train_loss": -6.861870765686035, "global_step": 156655, "epoch": 3729} {"train_loss": -6.842020034790039, "global_step": 156656, "epoch": 3729} {"train_loss": -6.830764293670654, "global_step": 156657, "epoch": 3729} {"train_loss": -6.807625770568848, "global_step": 156658, "epoch": 3729} {"train_loss": -6.876263289224534, "global_step": 156659, "epoch": 3729, "val_loss": 68551.65625} {"train_loss": -6.933082103729248, "global_step": 156660, "epoch": 3730} {"train_loss": -6.835720062255859, "global_step": 156661, "epoch": 3730} {"train_loss": -6.958015441894531, "global_step": 156662, "epoch": 3730} {"train_loss": -6.945223808288574, "global_step": 156663, "epoch": 3730} {"train_loss": -6.9677300453186035, "global_step": 156664, "epoch": 3730} {"train_loss": -6.945133209228516, "global_step": 156665, "epoch": 3730} {"train_loss": -6.894166469573975, "global_step": 156666, "epoch": 3730} {"train_loss": -6.958931922912598, "global_step": 156667, "epoch": 3730} {"train_loss": -6.754963397979736, "global_step": 156668, "epoch": 3730} {"train_loss": -6.865363597869873, "global_step": 156669, "epoch": 3730} {"train_loss": -6.870765209197998, "global_step": 156670, "epoch": 3730} {"train_loss": -6.969155311584473, "global_step": 156671, "epoch": 3730} {"train_loss": -6.808469772338867, "global_step": 156672, "epoch": 3730} {"train_loss": -6.797882080078125, "global_step": 156673, "epoch": 3730} {"train_loss": -6.898261547088623, "global_step": 156674, "epoch": 3730} {"train_loss": -7.008047103881836, "global_step": 156675, "epoch": 3730} {"train_loss": -6.871182441711426, "global_step": 156676, "epoch": 3730} {"train_loss": -6.843404293060303, "global_step": 156677, "epoch": 3730} {"train_loss": -6.822684288024902, "global_step": 156678, "epoch": 3730} {"train_loss": -6.696688652038574, "global_step": 156679, "epoch": 3730} {"train_loss": -6.883530139923096, "global_step": 156680, "epoch": 3730} {"train_loss": -6.736118316650391, "global_step": 156681, "epoch": 3730} {"train_loss": -6.907925605773926, "global_step": 156682, "epoch": 3730} {"train_loss": -6.868592262268066, "global_step": 156683, "epoch": 3730} {"train_loss": -6.841228485107422, "global_step": 156684, "epoch": 3730} {"train_loss": -6.876199245452881, "global_step": 156685, "epoch": 3730} {"train_loss": -6.839951515197754, "global_step": 156686, "epoch": 3730} {"train_loss": -6.616612434387207, "global_step": 156687, "epoch": 3730} {"train_loss": -6.9259138107299805, "global_step": 156688, "epoch": 3730} {"train_loss": -6.694855213165283, "global_step": 156689, "epoch": 3730} {"train_loss": -6.919255256652832, "global_step": 156690, "epoch": 3730} {"train_loss": -6.891475677490234, "global_step": 156691, "epoch": 3730} {"train_loss": -6.839175224304199, "global_step": 156692, "epoch": 3730} {"train_loss": -6.830775260925293, "global_step": 156693, "epoch": 3730} {"train_loss": -6.829990386962891, "global_step": 156694, "epoch": 3730} {"train_loss": -6.9111647605896, "global_step": 156695, "epoch": 3730} {"train_loss": -6.915403366088867, "global_step": 156696, "epoch": 3730} {"train_loss": -6.671244144439697, "global_step": 156697, "epoch": 3730} {"train_loss": -6.775026321411133, "global_step": 156698, "epoch": 3730} {"train_loss": -6.893449306488037, "global_step": 156699, "epoch": 3730} {"train_loss": -6.889686584472656, "global_step": 156700, "epoch": 3730} {"train_loss": -6.86029349054609, "global_step": 156701, "epoch": 3730, "val_loss": 68548.3984375} {"train_loss": -6.921119689941406, "global_step": 156702, "epoch": 3731} {"train_loss": -6.783713340759277, "global_step": 156703, "epoch": 3731} {"train_loss": -6.8566412925720215, "global_step": 156704, "epoch": 3731} {"train_loss": -6.856716156005859, "global_step": 156705, "epoch": 3731} {"train_loss": -6.9925642013549805, "global_step": 156706, "epoch": 3731} {"train_loss": -6.877668380737305, "global_step": 156707, "epoch": 3731} {"train_loss": -6.864292144775391, "global_step": 156708, "epoch": 3731} {"train_loss": -6.798709869384766, "global_step": 156709, "epoch": 3731} {"train_loss": -6.874549388885498, "global_step": 156710, "epoch": 3731} {"train_loss": -6.925141334533691, "global_step": 156711, "epoch": 3731} {"train_loss": -6.7641401290893555, "global_step": 156712, "epoch": 3731} {"train_loss": -6.922038555145264, "global_step": 156713, "epoch": 3731} {"train_loss": -6.893011093139648, "global_step": 156714, "epoch": 3731} {"train_loss": -6.870513916015625, "global_step": 156715, "epoch": 3731} {"train_loss": -6.822195053100586, "global_step": 156716, "epoch": 3731} {"train_loss": -6.813721656799316, "global_step": 156717, "epoch": 3731} {"train_loss": -6.915714740753174, "global_step": 156718, "epoch": 3731} {"train_loss": -6.817654609680176, "global_step": 156719, "epoch": 3731} {"train_loss": -6.913818836212158, "global_step": 156720, "epoch": 3731} {"train_loss": -6.904320240020752, "global_step": 156721, "epoch": 3731} {"train_loss": -6.949214458465576, "global_step": 156722, "epoch": 3731} {"train_loss": -6.843941688537598, "global_step": 156723, "epoch": 3731} {"train_loss": -6.900867462158203, "global_step": 156724, "epoch": 3731} {"train_loss": -6.90493106842041, "global_step": 156725, "epoch": 3731} {"train_loss": -6.829533576965332, "global_step": 156726, "epoch": 3731} {"train_loss": -6.800865173339844, "global_step": 156727, "epoch": 3731} {"train_loss": -6.924544334411621, "global_step": 156728, "epoch": 3731} {"train_loss": -7.036457061767578, "global_step": 156729, "epoch": 3731} {"train_loss": -6.909276962280273, "global_step": 156730, "epoch": 3731} {"train_loss": -6.849837303161621, "global_step": 156731, "epoch": 3731} {"train_loss": -6.97511625289917, "global_step": 156732, "epoch": 3731} {"train_loss": -6.762214660644531, "global_step": 156733, "epoch": 3731} {"train_loss": -6.813479900360107, "global_step": 156734, "epoch": 3731} {"train_loss": -6.8910017013549805, "global_step": 156735, "epoch": 3731} {"train_loss": -6.774542808532715, "global_step": 156736, "epoch": 3731} {"train_loss": -6.861612319946289, "global_step": 156737, "epoch": 3731} {"train_loss": -6.86065149307251, "global_step": 156738, "epoch": 3731} {"train_loss": -6.748241424560547, "global_step": 156739, "epoch": 3731} {"train_loss": -6.757300853729248, "global_step": 156740, "epoch": 3731} {"train_loss": -6.833343982696533, "global_step": 156741, "epoch": 3731} {"train_loss": -6.994168758392334, "global_step": 156742, "epoch": 3731} {"train_loss": -6.862554209572928, "global_step": 156743, "epoch": 3731, "val_loss": 68577.84375} {"train_loss": -6.689770698547363, "global_step": 156744, "epoch": 3732} {"train_loss": -6.6925506591796875, "global_step": 156745, "epoch": 3732} {"train_loss": -6.768320083618164, "global_step": 156746, "epoch": 3732} {"train_loss": -6.802595615386963, "global_step": 156747, "epoch": 3732} {"train_loss": -6.602720737457275, "global_step": 156748, "epoch": 3732} {"train_loss": -6.742457389831543, "global_step": 156749, "epoch": 3732} {"train_loss": -6.875210285186768, "global_step": 156750, "epoch": 3732} {"train_loss": -6.863038063049316, "global_step": 156751, "epoch": 3732} {"train_loss": -6.825113296508789, "global_step": 156752, "epoch": 3732} {"train_loss": -6.786468982696533, "global_step": 156753, "epoch": 3732} {"train_loss": -6.913896560668945, "global_step": 156754, "epoch": 3732} {"train_loss": -6.730974197387695, "global_step": 156755, "epoch": 3732} {"train_loss": -6.869997978210449, "global_step": 156756, "epoch": 3732} {"train_loss": -6.7635955810546875, "global_step": 156757, "epoch": 3732} {"train_loss": -6.750441074371338, "global_step": 156758, "epoch": 3732} {"train_loss": -6.817338466644287, "global_step": 156759, "epoch": 3732} {"train_loss": -6.922094821929932, "global_step": 156760, "epoch": 3732} {"train_loss": -6.879544734954834, "global_step": 156761, "epoch": 3732} {"train_loss": -6.861688137054443, "global_step": 156762, "epoch": 3732} {"train_loss": -6.827330112457275, "global_step": 156763, "epoch": 3732} {"train_loss": -6.910858631134033, "global_step": 156764, "epoch": 3732} {"train_loss": -6.753255844116211, "global_step": 156765, "epoch": 3732} {"train_loss": -6.90858268737793, "global_step": 156766, "epoch": 3732} {"train_loss": -6.917438507080078, "global_step": 156767, "epoch": 3732} {"train_loss": -6.8218183517456055, "global_step": 156768, "epoch": 3732} {"train_loss": -6.942260265350342, "global_step": 156769, "epoch": 3732} {"train_loss": -6.8341064453125, "global_step": 156770, "epoch": 3732} {"train_loss": -6.8231964111328125, "global_step": 156771, "epoch": 3732} {"train_loss": -7.058173179626465, "global_step": 156772, "epoch": 3732} {"train_loss": -6.830379009246826, "global_step": 156773, "epoch": 3732} {"train_loss": -6.954106330871582, "global_step": 156774, "epoch": 3732} {"train_loss": -6.930047988891602, "global_step": 156775, "epoch": 3732} {"train_loss": -6.962265968322754, "global_step": 156776, "epoch": 3732} {"train_loss": -6.822527885437012, "global_step": 156777, "epoch": 3732} {"train_loss": -6.930814266204834, "global_step": 156778, "epoch": 3732} {"train_loss": -6.812896728515625, "global_step": 156779, "epoch": 3732} {"train_loss": -6.6983537673950195, "global_step": 156780, "epoch": 3732} {"train_loss": -6.883369445800781, "global_step": 156781, "epoch": 3732} {"train_loss": -6.82356595993042, "global_step": 156782, "epoch": 3732} {"train_loss": -6.707006454467773, "global_step": 156783, "epoch": 3732} {"train_loss": -6.881618499755859, "global_step": 156784, "epoch": 3732} {"train_loss": -6.832590659459432, "global_step": 156785, "epoch": 3732, "val_loss": 68516.1640625} {"train_loss": -6.772983074188232, "global_step": 156786, "epoch": 3733} {"train_loss": -6.777052402496338, "global_step": 156787, "epoch": 3733} {"train_loss": -6.618664741516113, "global_step": 156788, "epoch": 3733} {"train_loss": -6.734651565551758, "global_step": 156789, "epoch": 3733} {"train_loss": -6.797844886779785, "global_step": 156790, "epoch": 3733} {"train_loss": -6.766432762145996, "global_step": 156791, "epoch": 3733} {"train_loss": -6.893716335296631, "global_step": 156792, "epoch": 3733} {"train_loss": -6.764588356018066, "global_step": 156793, "epoch": 3733} {"train_loss": -6.789493560791016, "global_step": 156794, "epoch": 3733} {"train_loss": -6.869349479675293, "global_step": 156795, "epoch": 3733} {"train_loss": -6.772538661956787, "global_step": 156796, "epoch": 3733} {"train_loss": -6.763017654418945, "global_step": 156797, "epoch": 3733} {"train_loss": -6.89668083190918, "global_step": 156798, "epoch": 3733} {"train_loss": -6.941205024719238, "global_step": 156799, "epoch": 3733} {"train_loss": -6.851088523864746, "global_step": 156800, "epoch": 3733} {"train_loss": -6.958610534667969, "global_step": 156801, "epoch": 3733} {"train_loss": -6.876832008361816, "global_step": 156802, "epoch": 3733} {"train_loss": -6.919329643249512, "global_step": 156803, "epoch": 3733} {"train_loss": -6.939911365509033, "global_step": 156804, "epoch": 3733} {"train_loss": -6.842063903808594, "global_step": 156805, "epoch": 3733} {"train_loss": -6.632630348205566, "global_step": 156806, "epoch": 3733} {"train_loss": -6.916251182556152, "global_step": 156807, "epoch": 3733} {"train_loss": -6.882837295532227, "global_step": 156808, "epoch": 3733} {"train_loss": -6.823397159576416, "global_step": 156809, "epoch": 3733} {"train_loss": -6.940618515014648, "global_step": 156810, "epoch": 3733} {"train_loss": -6.783304214477539, "global_step": 156811, "epoch": 3733} {"train_loss": -6.846368789672852, "global_step": 156812, "epoch": 3733} {"train_loss": -6.799873352050781, "global_step": 156813, "epoch": 3733} {"train_loss": -6.880706310272217, "global_step": 156814, "epoch": 3733} {"train_loss": -6.820723533630371, "global_step": 156815, "epoch": 3733} {"train_loss": -6.855602741241455, "global_step": 156816, "epoch": 3733} {"train_loss": -6.918918132781982, "global_step": 156817, "epoch": 3733} {"train_loss": -6.886173248291016, "global_step": 156818, "epoch": 3733} {"train_loss": -6.890813827514648, "global_step": 156819, "epoch": 3733} {"train_loss": -6.827970027923584, "global_step": 156820, "epoch": 3733} {"train_loss": -6.94488000869751, "global_step": 156821, "epoch": 3733} {"train_loss": -6.7772088050842285, "global_step": 156822, "epoch": 3733} {"train_loss": -6.845529556274414, "global_step": 156823, "epoch": 3733} {"train_loss": -6.829468727111816, "global_step": 156824, "epoch": 3733} {"train_loss": -6.735886573791504, "global_step": 156825, "epoch": 3733} {"train_loss": -6.935310363769531, "global_step": 156826, "epoch": 3733} {"train_loss": -6.841386681511288, "global_step": 156827, "epoch": 3733, "val_loss": 68609.4375} {"train_loss": -6.837068557739258, "global_step": 156828, "epoch": 3734} {"train_loss": -6.993574142456055, "global_step": 156829, "epoch": 3734} {"train_loss": -6.901663780212402, "global_step": 156830, "epoch": 3734} {"train_loss": -6.892461776733398, "global_step": 156831, "epoch": 3734} {"train_loss": -6.829326629638672, "global_step": 156832, "epoch": 3734} {"train_loss": -6.820199966430664, "global_step": 156833, "epoch": 3734} {"train_loss": -6.840994358062744, "global_step": 156834, "epoch": 3734} {"train_loss": -6.85623025894165, "global_step": 156835, "epoch": 3734} {"train_loss": -6.842754364013672, "global_step": 156836, "epoch": 3734} {"train_loss": -6.823315620422363, "global_step": 156837, "epoch": 3734} {"train_loss": -6.964277267456055, "global_step": 156838, "epoch": 3734} {"train_loss": -6.870214462280273, "global_step": 156839, "epoch": 3734} {"train_loss": -6.843050003051758, "global_step": 156840, "epoch": 3734} {"train_loss": -6.925941467285156, "global_step": 156841, "epoch": 3734} {"train_loss": -6.815746784210205, "global_step": 156842, "epoch": 3734} {"train_loss": -6.936821460723877, "global_step": 156843, "epoch": 3734} {"train_loss": -6.834296226501465, "global_step": 156844, "epoch": 3734} {"train_loss": -6.8459672927856445, "global_step": 156845, "epoch": 3734} {"train_loss": -6.713863372802734, "global_step": 156846, "epoch": 3734} {"train_loss": -6.849123954772949, "global_step": 156847, "epoch": 3734} {"train_loss": -6.803648948669434, "global_step": 156848, "epoch": 3734} {"train_loss": -6.99232292175293, "global_step": 156849, "epoch": 3734} {"train_loss": -6.944859504699707, "global_step": 156850, "epoch": 3734} {"train_loss": -6.912407398223877, "global_step": 156851, "epoch": 3734} {"train_loss": -6.903217315673828, "global_step": 156852, "epoch": 3734} {"train_loss": -6.965388298034668, "global_step": 156853, "epoch": 3734} {"train_loss": -6.709389686584473, "global_step": 156854, "epoch": 3734} {"train_loss": -6.861761093139648, "global_step": 156855, "epoch": 3734} {"train_loss": -6.864014625549316, "global_step": 156856, "epoch": 3734} {"train_loss": -6.849065780639648, "global_step": 156857, "epoch": 3734} {"train_loss": -6.911828517913818, "global_step": 156858, "epoch": 3734} {"train_loss": -6.745017051696777, "global_step": 156859, "epoch": 3734} {"train_loss": -6.849671840667725, "global_step": 156860, "epoch": 3734} {"train_loss": -7.007153034210205, "global_step": 156861, "epoch": 3734} {"train_loss": -6.881231307983398, "global_step": 156862, "epoch": 3734} {"train_loss": -6.7926130294799805, "global_step": 156863, "epoch": 3734} {"train_loss": -6.824749946594238, "global_step": 156864, "epoch": 3734} {"train_loss": -6.820248126983643, "global_step": 156865, "epoch": 3734} {"train_loss": -6.756898880004883, "global_step": 156866, "epoch": 3734} {"train_loss": -6.874644756317139, "global_step": 156867, "epoch": 3734} {"train_loss": -6.892621994018555, "global_step": 156868, "epoch": 3734} {"train_loss": -6.866420132773263, "global_step": 156869, "epoch": 3734, "val_loss": 68544.8046875} {"train_loss": -6.765167236328125, "global_step": 156870, "epoch": 3735} {"train_loss": -6.905274391174316, "global_step": 156871, "epoch": 3735} {"train_loss": -6.759829521179199, "global_step": 156872, "epoch": 3735} {"train_loss": -6.789271831512451, "global_step": 156873, "epoch": 3735} {"train_loss": -6.798299312591553, "global_step": 156874, "epoch": 3735} {"train_loss": -6.8233513832092285, "global_step": 156875, "epoch": 3735} {"train_loss": -6.837162017822266, "global_step": 156876, "epoch": 3735} {"train_loss": -6.847173690795898, "global_step": 156877, "epoch": 3735} {"train_loss": -6.829357147216797, "global_step": 156878, "epoch": 3735} {"train_loss": -6.734575271606445, "global_step": 156879, "epoch": 3735} {"train_loss": -6.911818504333496, "global_step": 156880, "epoch": 3735} {"train_loss": -6.751996994018555, "global_step": 156881, "epoch": 3735} {"train_loss": -6.859626770019531, "global_step": 156882, "epoch": 3735} {"train_loss": -6.835122108459473, "global_step": 156883, "epoch": 3735} {"train_loss": -6.843597888946533, "global_step": 156884, "epoch": 3735} {"train_loss": -6.868391513824463, "global_step": 156885, "epoch": 3735} {"train_loss": -6.853461265563965, "global_step": 156886, "epoch": 3735} {"train_loss": -6.814999103546143, "global_step": 156887, "epoch": 3735} {"train_loss": -6.847600936889648, "global_step": 156888, "epoch": 3735} {"train_loss": -6.708307266235352, "global_step": 156889, "epoch": 3735} {"train_loss": -6.839489936828613, "global_step": 156890, "epoch": 3735} {"train_loss": -6.923165321350098, "global_step": 156891, "epoch": 3735} {"train_loss": -6.897154808044434, "global_step": 156892, "epoch": 3735} {"train_loss": -6.86669921875, "global_step": 156893, "epoch": 3735} {"train_loss": -6.8984270095825195, "global_step": 156894, "epoch": 3735} {"train_loss": -6.909544944763184, "global_step": 156895, "epoch": 3735} {"train_loss": -6.9568986892700195, "global_step": 156896, "epoch": 3735} {"train_loss": -6.901528358459473, "global_step": 156897, "epoch": 3735} {"train_loss": -6.934647560119629, "global_step": 156898, "epoch": 3735} {"train_loss": -6.813821315765381, "global_step": 156899, "epoch": 3735} {"train_loss": -6.978426933288574, "global_step": 156900, "epoch": 3735} {"train_loss": -6.977509021759033, "global_step": 156901, "epoch": 3735} {"train_loss": -6.975912094116211, "global_step": 156902, "epoch": 3735} {"train_loss": -6.920010566711426, "global_step": 156903, "epoch": 3735} {"train_loss": -6.8218865394592285, "global_step": 156904, "epoch": 3735} {"train_loss": -6.802701950073242, "global_step": 156905, "epoch": 3735} {"train_loss": -6.9344587326049805, "global_step": 156906, "epoch": 3735} {"train_loss": -6.9406208992004395, "global_step": 156907, "epoch": 3735} {"train_loss": -6.8104567527771, "global_step": 156908, "epoch": 3735} {"train_loss": -6.8879594802856445, "global_step": 156909, "epoch": 3735} {"train_loss": -6.814015865325928, "global_step": 156910, "epoch": 3735} {"train_loss": -6.8571256796518965, "global_step": 156911, "epoch": 3735, "val_loss": 68586.9375} {"train_loss": -6.997618198394775, "global_step": 156912, "epoch": 3736} {"train_loss": -6.877280235290527, "global_step": 156913, "epoch": 3736} {"train_loss": -6.874298095703125, "global_step": 156914, "epoch": 3736} {"train_loss": -6.806666374206543, "global_step": 156915, "epoch": 3736} {"train_loss": -6.788010120391846, "global_step": 156916, "epoch": 3736} {"train_loss": -6.9069061279296875, "global_step": 156917, "epoch": 3736} {"train_loss": -6.863981246948242, "global_step": 156918, "epoch": 3736} {"train_loss": -7.0551581382751465, "global_step": 156919, "epoch": 3736} {"train_loss": -6.818700790405273, "global_step": 156920, "epoch": 3736} {"train_loss": -6.992403030395508, "global_step": 156921, "epoch": 3736} {"train_loss": -6.901142597198486, "global_step": 156922, "epoch": 3736} {"train_loss": -6.8859710693359375, "global_step": 156923, "epoch": 3736} {"train_loss": -6.84562873840332, "global_step": 156924, "epoch": 3736} {"train_loss": -6.848538875579834, "global_step": 156925, "epoch": 3736} {"train_loss": -6.888009548187256, "global_step": 156926, "epoch": 3736} {"train_loss": -6.774813652038574, "global_step": 156927, "epoch": 3736} {"train_loss": -6.8534417152404785, "global_step": 156928, "epoch": 3736} {"train_loss": -6.753993511199951, "global_step": 156929, "epoch": 3736} {"train_loss": -6.991344928741455, "global_step": 156930, "epoch": 3736} {"train_loss": -6.92210578918457, "global_step": 156931, "epoch": 3736} {"train_loss": -6.844787120819092, "global_step": 156932, "epoch": 3736} {"train_loss": -6.982799530029297, "global_step": 156933, "epoch": 3736} {"train_loss": -6.84968376159668, "global_step": 156934, "epoch": 3736} {"train_loss": -6.801818370819092, "global_step": 156935, "epoch": 3736} {"train_loss": -6.925930023193359, "global_step": 156936, "epoch": 3736} {"train_loss": -6.931551933288574, "global_step": 156937, "epoch": 3736} {"train_loss": -6.7706451416015625, "global_step": 156938, "epoch": 3736} {"train_loss": -7.024952411651611, "global_step": 156939, "epoch": 3736} {"train_loss": -6.854922294616699, "global_step": 156940, "epoch": 3736} {"train_loss": -6.828967571258545, "global_step": 156941, "epoch": 3736} {"train_loss": -6.905819416046143, "global_step": 156942, "epoch": 3736} {"train_loss": -6.832027435302734, "global_step": 156943, "epoch": 3736} {"train_loss": -6.9778852462768555, "global_step": 156944, "epoch": 3736} {"train_loss": -6.936877250671387, "global_step": 156945, "epoch": 3736} {"train_loss": -6.938563346862793, "global_step": 156946, "epoch": 3736} {"train_loss": -6.8165082931518555, "global_step": 156947, "epoch": 3736} {"train_loss": -6.912435531616211, "global_step": 156948, "epoch": 3736} {"train_loss": -6.8550004959106445, "global_step": 156949, "epoch": 3736} {"train_loss": -6.976040840148926, "global_step": 156950, "epoch": 3736} {"train_loss": -6.841827869415283, "global_step": 156951, "epoch": 3736} {"train_loss": -6.80333948135376, "global_step": 156952, "epoch": 3736} {"train_loss": -6.8846794083004905, "global_step": 156953, "epoch": 3736, "val_loss": 68630.109375} {"train_loss": -6.808562278747559, "global_step": 156954, "epoch": 3737} {"train_loss": -6.903474807739258, "global_step": 156955, "epoch": 3737} {"train_loss": -6.708317279815674, "global_step": 156956, "epoch": 3737} {"train_loss": -6.775313854217529, "global_step": 156957, "epoch": 3737} {"train_loss": -6.800563812255859, "global_step": 156958, "epoch": 3737} {"train_loss": -6.970530033111572, "global_step": 156959, "epoch": 3737} {"train_loss": -6.720576286315918, "global_step": 156960, "epoch": 3737} {"train_loss": -6.73927116394043, "global_step": 156961, "epoch": 3737} {"train_loss": -6.794172286987305, "global_step": 156962, "epoch": 3737} {"train_loss": -6.854891777038574, "global_step": 156963, "epoch": 3737} {"train_loss": -6.8253583908081055, "global_step": 156964, "epoch": 3737} {"train_loss": -6.805034637451172, "global_step": 156965, "epoch": 3737} {"train_loss": -6.735713481903076, "global_step": 156966, "epoch": 3737} {"train_loss": -6.6681694984436035, "global_step": 156967, "epoch": 3737} {"train_loss": -6.7784528732299805, "global_step": 156968, "epoch": 3737} {"train_loss": -6.850286483764648, "global_step": 156969, "epoch": 3737} {"train_loss": -6.753331661224365, "global_step": 156970, "epoch": 3737} {"train_loss": -6.89866828918457, "global_step": 156971, "epoch": 3737} {"train_loss": -6.834918022155762, "global_step": 156972, "epoch": 3737} {"train_loss": -6.73592472076416, "global_step": 156973, "epoch": 3737} {"train_loss": -6.859409332275391, "global_step": 156974, "epoch": 3737} {"train_loss": -6.909404754638672, "global_step": 156975, "epoch": 3737} {"train_loss": -6.759104251861572, "global_step": 156976, "epoch": 3737} {"train_loss": -6.8763747215271, "global_step": 156977, "epoch": 3737} {"train_loss": -6.784857749938965, "global_step": 156978, "epoch": 3737} {"train_loss": -6.813924312591553, "global_step": 156979, "epoch": 3737} {"train_loss": -6.9045000076293945, "global_step": 156980, "epoch": 3737} {"train_loss": -6.90275239944458, "global_step": 156981, "epoch": 3737} {"train_loss": -6.856863975524902, "global_step": 156982, "epoch": 3737} {"train_loss": -6.8240814208984375, "global_step": 156983, "epoch": 3737} {"train_loss": -6.95255708694458, "global_step": 156984, "epoch": 3737} {"train_loss": -6.938666820526123, "global_step": 156985, "epoch": 3737} {"train_loss": -6.876794815063477, "global_step": 156986, "epoch": 3737} {"train_loss": -6.911050796508789, "global_step": 156987, "epoch": 3737} {"train_loss": -6.845592975616455, "global_step": 156988, "epoch": 3737} {"train_loss": -6.932249069213867, "global_step": 156989, "epoch": 3737} {"train_loss": -6.939411163330078, "global_step": 156990, "epoch": 3737} {"train_loss": -7.029685020446777, "global_step": 156991, "epoch": 3737} {"train_loss": -6.8758440017700195, "global_step": 156992, "epoch": 3737} {"train_loss": -6.873586177825928, "global_step": 156993, "epoch": 3737} {"train_loss": -6.927644729614258, "global_step": 156994, "epoch": 3737} {"train_loss": -6.846999054863339, "global_step": 156995, "epoch": 3737, "val_loss": 68529.1015625} {"train_loss": -7.011063098907471, "global_step": 156996, "epoch": 3738} {"train_loss": -6.797306537628174, "global_step": 156997, "epoch": 3738} {"train_loss": -6.872734069824219, "global_step": 156998, "epoch": 3738} {"train_loss": -6.807136535644531, "global_step": 156999, "epoch": 3738} {"train_loss": -6.93149471282959, "global_step": 157000, "epoch": 3738} {"train_loss": -6.926583766937256, "global_step": 157001, "epoch": 3738} {"train_loss": -6.908890724182129, "global_step": 157002, "epoch": 3738} {"train_loss": -6.983867168426514, "global_step": 157003, "epoch": 3738} {"train_loss": -6.871176242828369, "global_step": 157004, "epoch": 3738} {"train_loss": -6.993343353271484, "global_step": 157005, "epoch": 3738} {"train_loss": -6.910928249359131, "global_step": 157006, "epoch": 3738} {"train_loss": -6.913017272949219, "global_step": 157007, "epoch": 3738} {"train_loss": -6.918045997619629, "global_step": 157008, "epoch": 3738} {"train_loss": -6.885190963745117, "global_step": 157009, "epoch": 3738} {"train_loss": -6.952583312988281, "global_step": 157010, "epoch": 3738} {"train_loss": -6.7796549797058105, "global_step": 157011, "epoch": 3738} {"train_loss": -6.826860427856445, "global_step": 157012, "epoch": 3738} {"train_loss": -6.89068078994751, "global_step": 157013, "epoch": 3738} {"train_loss": -6.868036270141602, "global_step": 157014, "epoch": 3738} {"train_loss": -6.869431972503662, "global_step": 157015, "epoch": 3738} {"train_loss": -6.90158224105835, "global_step": 157016, "epoch": 3738} {"train_loss": -6.914575099945068, "global_step": 157017, "epoch": 3738} {"train_loss": -6.874883651733398, "global_step": 157018, "epoch": 3738} {"train_loss": -6.93157434463501, "global_step": 157019, "epoch": 3738} {"train_loss": -6.893548488616943, "global_step": 157020, "epoch": 3738} {"train_loss": -6.839566230773926, "global_step": 157021, "epoch": 3738} {"train_loss": -6.944897174835205, "global_step": 157022, "epoch": 3738} {"train_loss": -6.917088508605957, "global_step": 157023, "epoch": 3738} {"train_loss": -6.9505438804626465, "global_step": 157024, "epoch": 3738} {"train_loss": -6.927144527435303, "global_step": 157025, "epoch": 3738} {"train_loss": -6.863564491271973, "global_step": 157026, "epoch": 3738} {"train_loss": -6.983951091766357, "global_step": 157027, "epoch": 3738} {"train_loss": -6.9237213134765625, "global_step": 157028, "epoch": 3738} {"train_loss": -6.895621299743652, "global_step": 157029, "epoch": 3738} {"train_loss": -7.009658336639404, "global_step": 157030, "epoch": 3738} {"train_loss": -6.787674427032471, "global_step": 157031, "epoch": 3738} {"train_loss": -6.844900131225586, "global_step": 157032, "epoch": 3738} {"train_loss": -6.923954010009766, "global_step": 157033, "epoch": 3738} {"train_loss": -6.826667785644531, "global_step": 157034, "epoch": 3738} {"train_loss": -6.743285179138184, "global_step": 157035, "epoch": 3738} {"train_loss": -6.846780776977539, "global_step": 157036, "epoch": 3738} {"train_loss": -6.891836427506947, "global_step": 157037, "epoch": 3738, "val_loss": 68549.234375} {"train_loss": -6.851718902587891, "global_step": 157038, "epoch": 3739} {"train_loss": -7.005825996398926, "global_step": 157039, "epoch": 3739} {"train_loss": -6.832354545593262, "global_step": 157040, "epoch": 3739} {"train_loss": -6.780582427978516, "global_step": 157041, "epoch": 3739} {"train_loss": -6.732657432556152, "global_step": 157042, "epoch": 3739} {"train_loss": -6.774005889892578, "global_step": 157043, "epoch": 3739} {"train_loss": -6.762670516967773, "global_step": 157044, "epoch": 3739} {"train_loss": -6.8753275871276855, "global_step": 157045, "epoch": 3739} {"train_loss": -6.869194984436035, "global_step": 157046, "epoch": 3739} {"train_loss": -6.787878036499023, "global_step": 157047, "epoch": 3739} {"train_loss": -6.764097213745117, "global_step": 157048, "epoch": 3739} {"train_loss": -6.905145168304443, "global_step": 157049, "epoch": 3739} {"train_loss": -6.887970924377441, "global_step": 157050, "epoch": 3739} {"train_loss": -6.730767250061035, "global_step": 157051, "epoch": 3739} {"train_loss": -6.875947952270508, "global_step": 157052, "epoch": 3739} {"train_loss": -6.928498268127441, "global_step": 157053, "epoch": 3739} {"train_loss": -6.839564800262451, "global_step": 157054, "epoch": 3739} {"train_loss": -6.812681198120117, "global_step": 157055, "epoch": 3739} {"train_loss": -6.7205681800842285, "global_step": 157056, "epoch": 3739} {"train_loss": -6.765226364135742, "global_step": 157057, "epoch": 3739} {"train_loss": -6.847935676574707, "global_step": 157058, "epoch": 3739} {"train_loss": -6.746075630187988, "global_step": 157059, "epoch": 3739} {"train_loss": -6.884746551513672, "global_step": 157060, "epoch": 3739} {"train_loss": -6.8903374671936035, "global_step": 157061, "epoch": 3739} {"train_loss": -6.806052207946777, "global_step": 157062, "epoch": 3739} {"train_loss": -6.967098236083984, "global_step": 157063, "epoch": 3739} {"train_loss": -6.717086315155029, "global_step": 157064, "epoch": 3739} {"train_loss": -6.827594757080078, "global_step": 157065, "epoch": 3739} {"train_loss": -6.782419204711914, "global_step": 157066, "epoch": 3739} {"train_loss": -6.691169738769531, "global_step": 157067, "epoch": 3739} {"train_loss": -6.816417217254639, "global_step": 157068, "epoch": 3739} {"train_loss": -6.69965934753418, "global_step": 157069, "epoch": 3739} {"train_loss": -6.750221252441406, "global_step": 157070, "epoch": 3739} {"train_loss": -6.784087181091309, "global_step": 157071, "epoch": 3739} {"train_loss": -6.703866958618164, "global_step": 157072, "epoch": 3739} {"train_loss": -6.830643177032471, "global_step": 157073, "epoch": 3739} {"train_loss": -6.6841888427734375, "global_step": 157074, "epoch": 3739} {"train_loss": -6.718695640563965, "global_step": 157075, "epoch": 3739} {"train_loss": -6.726624965667725, "global_step": 157076, "epoch": 3739} {"train_loss": -6.704560279846191, "global_step": 157077, "epoch": 3739} {"train_loss": -6.710384368896484, "global_step": 157078, "epoch": 3739} {"train_loss": -6.7982089178902765, "global_step": 157079, "epoch": 3739, "val_loss": 68676.75} {"train_loss": -6.691654205322266, "global_step": 157080, "epoch": 3740} {"train_loss": -6.7184600830078125, "global_step": 157081, "epoch": 3740} {"train_loss": -6.671054363250732, "global_step": 157082, "epoch": 3740} {"train_loss": -6.79896354675293, "global_step": 157083, "epoch": 3740} {"train_loss": -6.797010898590088, "global_step": 157084, "epoch": 3740} {"train_loss": -6.785035133361816, "global_step": 157085, "epoch": 3740} {"train_loss": -6.568431377410889, "global_step": 157086, "epoch": 3740} {"train_loss": -6.835294246673584, "global_step": 157087, "epoch": 3740} {"train_loss": -6.751189708709717, "global_step": 157088, "epoch": 3740} {"train_loss": -6.80188512802124, "global_step": 157089, "epoch": 3740} {"train_loss": -6.754332065582275, "global_step": 157090, "epoch": 3740} {"train_loss": -6.747544288635254, "global_step": 157091, "epoch": 3740} {"train_loss": -6.821134567260742, "global_step": 157092, "epoch": 3740} {"train_loss": -6.825162887573242, "global_step": 157093, "epoch": 3740} {"train_loss": -6.853322982788086, "global_step": 157094, "epoch": 3740} {"train_loss": -6.855588436126709, "global_step": 157095, "epoch": 3740} {"train_loss": -6.796457290649414, "global_step": 157096, "epoch": 3740} {"train_loss": -6.9406585693359375, "global_step": 157097, "epoch": 3740} {"train_loss": -6.746810436248779, "global_step": 157098, "epoch": 3740} {"train_loss": -6.818826675415039, "global_step": 157099, "epoch": 3740} {"train_loss": -7.0652852058410645, "global_step": 157100, "epoch": 3740} {"train_loss": -6.870750427246094, "global_step": 157101, "epoch": 3740} {"train_loss": -6.74350643157959, "global_step": 157102, "epoch": 3740} {"train_loss": -6.789124011993408, "global_step": 157103, "epoch": 3740} {"train_loss": -6.891592025756836, "global_step": 157104, "epoch": 3740} {"train_loss": -6.755487442016602, "global_step": 157105, "epoch": 3740} {"train_loss": -7.00223970413208, "global_step": 157106, "epoch": 3740} {"train_loss": -6.896458625793457, "global_step": 157107, "epoch": 3740} {"train_loss": -6.925322532653809, "global_step": 157108, "epoch": 3740} {"train_loss": -6.921215057373047, "global_step": 157109, "epoch": 3740} {"train_loss": -6.846388816833496, "global_step": 157110, "epoch": 3740} {"train_loss": -6.847469329833984, "global_step": 157111, "epoch": 3740} {"train_loss": -6.8614983558654785, "global_step": 157112, "epoch": 3740} {"train_loss": -6.898242950439453, "global_step": 157113, "epoch": 3740} {"train_loss": -6.958088397979736, "global_step": 157114, "epoch": 3740} {"train_loss": -6.8079986572265625, "global_step": 157115, "epoch": 3740} {"train_loss": -6.931837558746338, "global_step": 157116, "epoch": 3740} {"train_loss": -6.836828708648682, "global_step": 157117, "epoch": 3740} {"train_loss": -6.990859031677246, "global_step": 157118, "epoch": 3740} {"train_loss": -6.862791061401367, "global_step": 157119, "epoch": 3740} {"train_loss": -6.774996280670166, "global_step": 157120, "epoch": 3740} {"train_loss": -6.830270029249645, "global_step": 157121, "epoch": 3740, "val_loss": 68481.390625} {"train_loss": -6.829960823059082, "global_step": 157122, "epoch": 3741} {"train_loss": -6.844941139221191, "global_step": 157123, "epoch": 3741} {"train_loss": -6.955082893371582, "global_step": 157124, "epoch": 3741} {"train_loss": -6.943833351135254, "global_step": 157125, "epoch": 3741} {"train_loss": -6.924012184143066, "global_step": 157126, "epoch": 3741} {"train_loss": -6.9693684577941895, "global_step": 157127, "epoch": 3741} {"train_loss": -6.7835588455200195, "global_step": 157128, "epoch": 3741} {"train_loss": -6.823204040527344, "global_step": 157129, "epoch": 3741} {"train_loss": -6.902405261993408, "global_step": 157130, "epoch": 3741} {"train_loss": -6.773418426513672, "global_step": 157131, "epoch": 3741} {"train_loss": -6.928437232971191, "global_step": 157132, "epoch": 3741} {"train_loss": -6.869668960571289, "global_step": 157133, "epoch": 3741} {"train_loss": -6.888942718505859, "global_step": 157134, "epoch": 3741} {"train_loss": -6.913192272186279, "global_step": 157135, "epoch": 3741} {"train_loss": -6.797418594360352, "global_step": 157136, "epoch": 3741} {"train_loss": -6.994094371795654, "global_step": 157137, "epoch": 3741} {"train_loss": -6.818150520324707, "global_step": 157138, "epoch": 3741} {"train_loss": -6.933238506317139, "global_step": 157139, "epoch": 3741} {"train_loss": -6.814450263977051, "global_step": 157140, "epoch": 3741} {"train_loss": -6.871012210845947, "global_step": 157141, "epoch": 3741} {"train_loss": -6.9733991622924805, "global_step": 157142, "epoch": 3741} {"train_loss": -6.851009845733643, "global_step": 157143, "epoch": 3741} {"train_loss": -6.8687944412231445, "global_step": 157144, "epoch": 3741} {"train_loss": -6.867643356323242, "global_step": 157145, "epoch": 3741} {"train_loss": -6.8103928565979, "global_step": 157146, "epoch": 3741} {"train_loss": -6.853361129760742, "global_step": 157147, "epoch": 3741} {"train_loss": -6.88651180267334, "global_step": 157148, "epoch": 3741} {"train_loss": -6.87651252746582, "global_step": 157149, "epoch": 3741} {"train_loss": -6.956740379333496, "global_step": 157150, "epoch": 3741} {"train_loss": -6.884914398193359, "global_step": 157151, "epoch": 3741} {"train_loss": -6.78762149810791, "global_step": 157152, "epoch": 3741} {"train_loss": -6.756524085998535, "global_step": 157153, "epoch": 3741} {"train_loss": -6.790265083312988, "global_step": 157154, "epoch": 3741} {"train_loss": -6.926176071166992, "global_step": 157155, "epoch": 3741} {"train_loss": -6.994416236877441, "global_step": 157156, "epoch": 3741} {"train_loss": -6.921619892120361, "global_step": 157157, "epoch": 3741} {"train_loss": -6.8492584228515625, "global_step": 157158, "epoch": 3741} {"train_loss": -6.896385192871094, "global_step": 157159, "epoch": 3741} {"train_loss": -6.868776321411133, "global_step": 157160, "epoch": 3741} {"train_loss": -6.884699821472168, "global_step": 157161, "epoch": 3741} {"train_loss": -6.916254997253418, "global_step": 157162, "epoch": 3741} {"train_loss": -6.8782012122018, "global_step": 157163, "epoch": 3741, "val_loss": 68676.171875} {"train_loss": -6.857055187225342, "global_step": 157164, "epoch": 3742} {"train_loss": -6.929165840148926, "global_step": 157165, "epoch": 3742} {"train_loss": -6.816377639770508, "global_step": 157166, "epoch": 3742} {"train_loss": -6.873895645141602, "global_step": 157167, "epoch": 3742} {"train_loss": -6.962983131408691, "global_step": 157168, "epoch": 3742} {"train_loss": -6.786385536193848, "global_step": 157169, "epoch": 3742} {"train_loss": -6.874519348144531, "global_step": 157170, "epoch": 3742} {"train_loss": -6.827566623687744, "global_step": 157171, "epoch": 3742} {"train_loss": -6.712255954742432, "global_step": 157172, "epoch": 3742} {"train_loss": -6.813338279724121, "global_step": 157173, "epoch": 3742} {"train_loss": -6.725044250488281, "global_step": 157174, "epoch": 3742} {"train_loss": -6.753100872039795, "global_step": 157175, "epoch": 3742} {"train_loss": -6.6670427322387695, "global_step": 157176, "epoch": 3742} {"train_loss": -6.8040313720703125, "global_step": 157177, "epoch": 3742} {"train_loss": -6.786073684692383, "global_step": 157178, "epoch": 3742} {"train_loss": -6.790420055389404, "global_step": 157179, "epoch": 3742} {"train_loss": -6.815639495849609, "global_step": 157180, "epoch": 3742} {"train_loss": -6.717414855957031, "global_step": 157181, "epoch": 3742} {"train_loss": -6.90952205657959, "global_step": 157182, "epoch": 3742} {"train_loss": -6.89100980758667, "global_step": 157183, "epoch": 3742} {"train_loss": -6.722979545593262, "global_step": 157184, "epoch": 3742} {"train_loss": -6.766185760498047, "global_step": 157185, "epoch": 3742} {"train_loss": -6.709347724914551, "global_step": 157186, "epoch": 3742} {"train_loss": -6.929332733154297, "global_step": 157187, "epoch": 3742} {"train_loss": -6.906050682067871, "global_step": 157188, "epoch": 3742} {"train_loss": -6.830260276794434, "global_step": 157189, "epoch": 3742} {"train_loss": -6.796186447143555, "global_step": 157190, "epoch": 3742} {"train_loss": -6.725170135498047, "global_step": 157191, "epoch": 3742} {"train_loss": -6.835124969482422, "global_step": 157192, "epoch": 3742} {"train_loss": -6.797671794891357, "global_step": 157193, "epoch": 3742} {"train_loss": -6.815834999084473, "global_step": 157194, "epoch": 3742} {"train_loss": -6.7111921310424805, "global_step": 157195, "epoch": 3742} {"train_loss": -6.770501613616943, "global_step": 157196, "epoch": 3742} {"train_loss": -6.844135761260986, "global_step": 157197, "epoch": 3742} {"train_loss": -6.789770126342773, "global_step": 157198, "epoch": 3742} {"train_loss": -6.844607353210449, "global_step": 157199, "epoch": 3742} {"train_loss": -6.961212158203125, "global_step": 157200, "epoch": 3742} {"train_loss": -6.948225975036621, "global_step": 157201, "epoch": 3742} {"train_loss": -6.897324562072754, "global_step": 157202, "epoch": 3742} {"train_loss": -6.793737888336182, "global_step": 157203, "epoch": 3742} {"train_loss": -6.928071975708008, "global_step": 157204, "epoch": 3742} {"train_loss": -6.823186794916789, "global_step": 157205, "epoch": 3742, "val_loss": 68486.0859375} {"train_loss": -6.877110958099365, "global_step": 157206, "epoch": 3743} {"train_loss": -6.970163345336914, "global_step": 157207, "epoch": 3743} {"train_loss": -6.869472503662109, "global_step": 157208, "epoch": 3743} {"train_loss": -6.940969944000244, "global_step": 157209, "epoch": 3743} {"train_loss": -6.870196342468262, "global_step": 157210, "epoch": 3743} {"train_loss": -6.881032466888428, "global_step": 157211, "epoch": 3743} {"train_loss": -6.952683448791504, "global_step": 157212, "epoch": 3743} {"train_loss": -6.945609092712402, "global_step": 157213, "epoch": 3743} {"train_loss": -6.9030070304870605, "global_step": 157214, "epoch": 3743} {"train_loss": -6.9183349609375, "global_step": 157215, "epoch": 3743} {"train_loss": -6.829347610473633, "global_step": 157216, "epoch": 3743} {"train_loss": -6.86094856262207, "global_step": 157217, "epoch": 3743} {"train_loss": -6.910675048828125, "global_step": 157218, "epoch": 3743} {"train_loss": -6.962904930114746, "global_step": 157219, "epoch": 3743} {"train_loss": -6.900309085845947, "global_step": 157220, "epoch": 3743} {"train_loss": -6.961666107177734, "global_step": 157221, "epoch": 3743} {"train_loss": -6.947408199310303, "global_step": 157222, "epoch": 3743} {"train_loss": -6.85806941986084, "global_step": 157223, "epoch": 3743} {"train_loss": -6.888772010803223, "global_step": 157224, "epoch": 3743} {"train_loss": -6.875670909881592, "global_step": 157225, "epoch": 3743} {"train_loss": -6.873992443084717, "global_step": 157226, "epoch": 3743} {"train_loss": -6.996210098266602, "global_step": 157227, "epoch": 3743} {"train_loss": -6.729416370391846, "global_step": 157228, "epoch": 3743} {"train_loss": -6.937784194946289, "global_step": 157229, "epoch": 3743} {"train_loss": -6.901394844055176, "global_step": 157230, "epoch": 3743} {"train_loss": -6.849544525146484, "global_step": 157231, "epoch": 3743} {"train_loss": -6.8578033447265625, "global_step": 157232, "epoch": 3743} {"train_loss": -6.931267738342285, "global_step": 157233, "epoch": 3743} {"train_loss": -6.860126495361328, "global_step": 157234, "epoch": 3743} {"train_loss": -6.877471446990967, "global_step": 157235, "epoch": 3743} {"train_loss": -6.891872406005859, "global_step": 157236, "epoch": 3743} {"train_loss": -6.832194805145264, "global_step": 157237, "epoch": 3743} {"train_loss": -6.722803115844727, "global_step": 157238, "epoch": 3743} {"train_loss": -7.005285263061523, "global_step": 157239, "epoch": 3743} {"train_loss": -6.833145618438721, "global_step": 157240, "epoch": 3743} {"train_loss": -6.8453803062438965, "global_step": 157241, "epoch": 3743} {"train_loss": -6.854544639587402, "global_step": 157242, "epoch": 3743} {"train_loss": -6.91591215133667, "global_step": 157243, "epoch": 3743} {"train_loss": -6.826578140258789, "global_step": 157244, "epoch": 3743} {"train_loss": -6.774589538574219, "global_step": 157245, "epoch": 3743} {"train_loss": -6.955456733703613, "global_step": 157246, "epoch": 3743} {"train_loss": -6.888085615067255, "global_step": 157247, "epoch": 3743, "val_loss": 68752.3046875} {"train_loss": -6.947324752807617, "global_step": 157248, "epoch": 3744} {"train_loss": -6.8689985275268555, "global_step": 157249, "epoch": 3744} {"train_loss": -6.762609004974365, "global_step": 157250, "epoch": 3744} {"train_loss": -6.865135192871094, "global_step": 157251, "epoch": 3744} {"train_loss": -6.78762674331665, "global_step": 157252, "epoch": 3744} {"train_loss": -6.925362586975098, "global_step": 157253, "epoch": 3744} {"train_loss": -6.851161956787109, "global_step": 157254, "epoch": 3744} {"train_loss": -6.964398384094238, "global_step": 157255, "epoch": 3744} {"train_loss": -6.846660137176514, "global_step": 157256, "epoch": 3744} {"train_loss": -6.976011276245117, "global_step": 157257, "epoch": 3744} {"train_loss": -6.924576759338379, "global_step": 157258, "epoch": 3744} {"train_loss": -6.873900890350342, "global_step": 157259, "epoch": 3744} {"train_loss": -6.978671073913574, "global_step": 157260, "epoch": 3744} {"train_loss": -6.817771911621094, "global_step": 157261, "epoch": 3744} {"train_loss": -6.9110612869262695, "global_step": 157262, "epoch": 3744} {"train_loss": -6.8703293800354, "global_step": 157263, "epoch": 3744} {"train_loss": -6.917208671569824, "global_step": 157264, "epoch": 3744} {"train_loss": -6.8498640060424805, "global_step": 157265, "epoch": 3744} {"train_loss": -6.929847240447998, "global_step": 157266, "epoch": 3744} {"train_loss": -6.963144302368164, "global_step": 157267, "epoch": 3744} {"train_loss": -6.953634738922119, "global_step": 157268, "epoch": 3744} {"train_loss": -6.941963195800781, "global_step": 157269, "epoch": 3744} {"train_loss": -6.917990207672119, "global_step": 157270, "epoch": 3744} {"train_loss": -6.862506866455078, "global_step": 157271, "epoch": 3744} {"train_loss": -6.793944358825684, "global_step": 157272, "epoch": 3744} {"train_loss": -6.956075668334961, "global_step": 157273, "epoch": 3744} {"train_loss": -6.952236175537109, "global_step": 157274, "epoch": 3744} {"train_loss": -6.816354274749756, "global_step": 157275, "epoch": 3744} {"train_loss": -6.702712059020996, "global_step": 157276, "epoch": 3744} {"train_loss": -6.916374206542969, "global_step": 157277, "epoch": 3744} {"train_loss": -6.877016067504883, "global_step": 157278, "epoch": 3744} {"train_loss": -6.924160003662109, "global_step": 157279, "epoch": 3744} {"train_loss": -6.972503662109375, "global_step": 157280, "epoch": 3744} {"train_loss": -6.837288856506348, "global_step": 157281, "epoch": 3744} {"train_loss": -6.827601432800293, "global_step": 157282, "epoch": 3744} {"train_loss": -6.85089111328125, "global_step": 157283, "epoch": 3744} {"train_loss": -6.93511962890625, "global_step": 157284, "epoch": 3744} {"train_loss": -6.768150329589844, "global_step": 157285, "epoch": 3744} {"train_loss": -6.832242012023926, "global_step": 157286, "epoch": 3744} {"train_loss": -6.903943061828613, "global_step": 157287, "epoch": 3744} {"train_loss": -6.886322021484375, "global_step": 157288, "epoch": 3744} {"train_loss": -6.882953961690267, "global_step": 157289, "epoch": 3744, "val_loss": 68334.2890625} {"train_loss": -6.9466872215271, "global_step": 157290, "epoch": 3745} {"train_loss": -6.863372325897217, "global_step": 157291, "epoch": 3745} {"train_loss": -6.762048244476318, "global_step": 157292, "epoch": 3745} {"train_loss": -6.809079170227051, "global_step": 157293, "epoch": 3745} {"train_loss": -6.860106945037842, "global_step": 157294, "epoch": 3745} {"train_loss": -6.882174491882324, "global_step": 157295, "epoch": 3745} {"train_loss": -6.930438995361328, "global_step": 157296, "epoch": 3745} {"train_loss": -6.717229843139648, "global_step": 157297, "epoch": 3745} {"train_loss": -6.924835205078125, "global_step": 157298, "epoch": 3745} {"train_loss": -6.8856120109558105, "global_step": 157299, "epoch": 3745} {"train_loss": -6.886679649353027, "global_step": 157300, "epoch": 3745} {"train_loss": -6.8470001220703125, "global_step": 157301, "epoch": 3745} {"train_loss": -6.798413276672363, "global_step": 157302, "epoch": 3745} {"train_loss": -6.927478313446045, "global_step": 157303, "epoch": 3745} {"train_loss": -6.842241287231445, "global_step": 157304, "epoch": 3745} {"train_loss": -6.811840534210205, "global_step": 157305, "epoch": 3745} {"train_loss": -6.853511810302734, "global_step": 157306, "epoch": 3745} {"train_loss": -6.7693915367126465, "global_step": 157307, "epoch": 3745} {"train_loss": -6.7771782875061035, "global_step": 157308, "epoch": 3745} {"train_loss": -6.80538272857666, "global_step": 157309, "epoch": 3745} {"train_loss": -6.870670318603516, "global_step": 157310, "epoch": 3745} {"train_loss": -6.937587261199951, "global_step": 157311, "epoch": 3745} {"train_loss": -6.844414710998535, "global_step": 157312, "epoch": 3745} {"train_loss": -6.766103267669678, "global_step": 157313, "epoch": 3745} {"train_loss": -6.861319541931152, "global_step": 157314, "epoch": 3745} {"train_loss": -6.860998153686523, "global_step": 157315, "epoch": 3745} {"train_loss": -6.784643173217773, "global_step": 157316, "epoch": 3745} {"train_loss": -6.842644691467285, "global_step": 157317, "epoch": 3745} {"train_loss": -6.757376194000244, "global_step": 157318, "epoch": 3745} {"train_loss": -6.7868242263793945, "global_step": 157319, "epoch": 3745} {"train_loss": -6.829157829284668, "global_step": 157320, "epoch": 3745} {"train_loss": -6.726484775543213, "global_step": 157321, "epoch": 3745} {"train_loss": -6.969704627990723, "global_step": 157322, "epoch": 3745} {"train_loss": -6.833540916442871, "global_step": 157323, "epoch": 3745} {"train_loss": -6.801322937011719, "global_step": 157324, "epoch": 3745} {"train_loss": -6.826693058013916, "global_step": 157325, "epoch": 3745} {"train_loss": -6.944758415222168, "global_step": 157326, "epoch": 3745} {"train_loss": -6.775864124298096, "global_step": 157327, "epoch": 3745} {"train_loss": -6.935155391693115, "global_step": 157328, "epoch": 3745} {"train_loss": -6.946540832519531, "global_step": 157329, "epoch": 3745} {"train_loss": -6.854598522186279, "global_step": 157330, "epoch": 3745} {"train_loss": -6.8447621549878805, "global_step": 157331, "epoch": 3745, "val_loss": 68634.6796875} {"train_loss": -6.834573745727539, "global_step": 157332, "epoch": 3746} {"train_loss": -6.913166522979736, "global_step": 157333, "epoch": 3746} {"train_loss": -6.827171802520752, "global_step": 157334, "epoch": 3746} {"train_loss": -6.834521770477295, "global_step": 157335, "epoch": 3746} {"train_loss": -6.892735481262207, "global_step": 157336, "epoch": 3746} {"train_loss": -6.855812072753906, "global_step": 157337, "epoch": 3746} {"train_loss": -6.90298318862915, "global_step": 157338, "epoch": 3746} {"train_loss": -6.803642272949219, "global_step": 157339, "epoch": 3746} {"train_loss": -6.903506278991699, "global_step": 157340, "epoch": 3746} {"train_loss": -6.896777153015137, "global_step": 157341, "epoch": 3746} {"train_loss": -6.944031715393066, "global_step": 157342, "epoch": 3746} {"train_loss": -6.932473182678223, "global_step": 157343, "epoch": 3746} {"train_loss": -6.900054931640625, "global_step": 157344, "epoch": 3746} {"train_loss": -6.953551292419434, "global_step": 157345, "epoch": 3746} {"train_loss": -6.823087215423584, "global_step": 157346, "epoch": 3746} {"train_loss": -6.953635215759277, "global_step": 157347, "epoch": 3746} {"train_loss": -6.914979934692383, "global_step": 157348, "epoch": 3746} {"train_loss": -6.863331317901611, "global_step": 157349, "epoch": 3746} {"train_loss": -6.836724758148193, "global_step": 157350, "epoch": 3746} {"train_loss": -6.786492347717285, "global_step": 157351, "epoch": 3746} {"train_loss": -6.9793243408203125, "global_step": 157352, "epoch": 3746} {"train_loss": -6.875829696655273, "global_step": 157353, "epoch": 3746} {"train_loss": -6.904557228088379, "global_step": 157354, "epoch": 3746} {"train_loss": -6.961578369140625, "global_step": 157355, "epoch": 3746} {"train_loss": -6.9053263664245605, "global_step": 157356, "epoch": 3746} {"train_loss": -6.874788284301758, "global_step": 157357, "epoch": 3746} {"train_loss": -6.904157638549805, "global_step": 157358, "epoch": 3746} {"train_loss": -6.795561790466309, "global_step": 157359, "epoch": 3746} {"train_loss": -6.868718147277832, "global_step": 157360, "epoch": 3746} {"train_loss": -6.85188627243042, "global_step": 157361, "epoch": 3746} {"train_loss": -6.741173267364502, "global_step": 157362, "epoch": 3746} {"train_loss": -6.843838214874268, "global_step": 157363, "epoch": 3746} {"train_loss": -6.829760551452637, "global_step": 157364, "epoch": 3746} {"train_loss": -7.0239949226379395, "global_step": 157365, "epoch": 3746} {"train_loss": -6.832435607910156, "global_step": 157366, "epoch": 3746} {"train_loss": -6.731405258178711, "global_step": 157367, "epoch": 3746} {"train_loss": -6.961153030395508, "global_step": 157368, "epoch": 3746} {"train_loss": -6.943957328796387, "global_step": 157369, "epoch": 3746} {"train_loss": -6.845090866088867, "global_step": 157370, "epoch": 3746} {"train_loss": -6.955121040344238, "global_step": 157371, "epoch": 3746} {"train_loss": -6.914122581481934, "global_step": 157372, "epoch": 3746} {"train_loss": -6.883715833936419, "global_step": 157373, "epoch": 3746, "val_loss": 68542.53125} {"train_loss": -6.910408020019531, "global_step": 157374, "epoch": 3747} {"train_loss": -6.965031623840332, "global_step": 157375, "epoch": 3747} {"train_loss": -6.778505325317383, "global_step": 157376, "epoch": 3747} {"train_loss": -6.895713806152344, "global_step": 157377, "epoch": 3747} {"train_loss": -6.982882499694824, "global_step": 157378, "epoch": 3747} {"train_loss": -6.905364513397217, "global_step": 157379, "epoch": 3747} {"train_loss": -6.906521797180176, "global_step": 157380, "epoch": 3747} {"train_loss": -6.836594581604004, "global_step": 157381, "epoch": 3747} {"train_loss": -6.839929580688477, "global_step": 157382, "epoch": 3747} {"train_loss": -6.796236038208008, "global_step": 157383, "epoch": 3747} {"train_loss": -6.812792778015137, "global_step": 157384, "epoch": 3747} {"train_loss": -6.982686996459961, "global_step": 157385, "epoch": 3747} {"train_loss": -6.898806095123291, "global_step": 157386, "epoch": 3747} {"train_loss": -7.024990081787109, "global_step": 157387, "epoch": 3747} {"train_loss": -6.872886657714844, "global_step": 157388, "epoch": 3747} {"train_loss": -6.828208923339844, "global_step": 157389, "epoch": 3747} {"train_loss": -6.89987850189209, "global_step": 157390, "epoch": 3747} {"train_loss": -6.93695068359375, "global_step": 157391, "epoch": 3747} {"train_loss": -6.739788055419922, "global_step": 157392, "epoch": 3747} {"train_loss": -7.0266523361206055, "global_step": 157393, "epoch": 3747} {"train_loss": -6.944378852844238, "global_step": 157394, "epoch": 3747} {"train_loss": -6.665333271026611, "global_step": 157395, "epoch": 3747} {"train_loss": -6.8568878173828125, "global_step": 157396, "epoch": 3747} {"train_loss": -6.9910993576049805, "global_step": 157397, "epoch": 3747} {"train_loss": -6.775300979614258, "global_step": 157398, "epoch": 3747} {"train_loss": -6.862470626831055, "global_step": 157399, "epoch": 3747} {"train_loss": -6.913212776184082, "global_step": 157400, "epoch": 3747} {"train_loss": -6.801859378814697, "global_step": 157401, "epoch": 3747} {"train_loss": -6.875408172607422, "global_step": 157402, "epoch": 3747} {"train_loss": -6.863058567047119, "global_step": 157403, "epoch": 3747} {"train_loss": -6.797019958496094, "global_step": 157404, "epoch": 3747} {"train_loss": -6.853935241699219, "global_step": 157405, "epoch": 3747} {"train_loss": -6.920442581176758, "global_step": 157406, "epoch": 3747} {"train_loss": -6.807430267333984, "global_step": 157407, "epoch": 3747} {"train_loss": -6.871975898742676, "global_step": 157408, "epoch": 3747} {"train_loss": -6.578512668609619, "global_step": 157409, "epoch": 3747} {"train_loss": -6.897323131561279, "global_step": 157410, "epoch": 3747} {"train_loss": -6.67464017868042, "global_step": 157411, "epoch": 3747} {"train_loss": -6.729818820953369, "global_step": 157412, "epoch": 3747} {"train_loss": -6.739816665649414, "global_step": 157413, "epoch": 3747} {"train_loss": -6.578387260437012, "global_step": 157414, "epoch": 3747} {"train_loss": -6.846423569179716, "global_step": 157415, "epoch": 3747, "val_loss": 68770.234375} {"train_loss": -6.632943153381348, "global_step": 157416, "epoch": 3748} {"train_loss": -6.856350898742676, "global_step": 157417, "epoch": 3748} {"train_loss": -6.678152084350586, "global_step": 157418, "epoch": 3748} {"train_loss": -6.801583290100098, "global_step": 157419, "epoch": 3748} {"train_loss": -6.7220659255981445, "global_step": 157420, "epoch": 3748} {"train_loss": -6.669562339782715, "global_step": 157421, "epoch": 3748} {"train_loss": -6.711503982543945, "global_step": 157422, "epoch": 3748} {"train_loss": -6.7320237159729, "global_step": 157423, "epoch": 3748} {"train_loss": -6.8321638107299805, "global_step": 157424, "epoch": 3748} {"train_loss": -6.823244094848633, "global_step": 157425, "epoch": 3748} {"train_loss": -6.794379711151123, "global_step": 157426, "epoch": 3748} {"train_loss": -6.889913558959961, "global_step": 157427, "epoch": 3748} {"train_loss": -6.867811679840088, "global_step": 157428, "epoch": 3748} {"train_loss": -6.820456504821777, "global_step": 157429, "epoch": 3748} {"train_loss": -6.795502662658691, "global_step": 157430, "epoch": 3748} {"train_loss": -6.8466973304748535, "global_step": 157431, "epoch": 3748} {"train_loss": -6.867232322692871, "global_step": 157432, "epoch": 3748} {"train_loss": -6.841618061065674, "global_step": 157433, "epoch": 3748} {"train_loss": -6.939905166625977, "global_step": 157434, "epoch": 3748} {"train_loss": -6.703713417053223, "global_step": 157435, "epoch": 3748} {"train_loss": -6.884339332580566, "global_step": 157436, "epoch": 3748} {"train_loss": -6.916189670562744, "global_step": 157437, "epoch": 3748} {"train_loss": -6.786269187927246, "global_step": 157438, "epoch": 3748} {"train_loss": -6.844075679779053, "global_step": 157439, "epoch": 3748} {"train_loss": -6.849398612976074, "global_step": 157440, "epoch": 3748} {"train_loss": -6.908941745758057, "global_step": 157441, "epoch": 3748} {"train_loss": -6.893818378448486, "global_step": 157442, "epoch": 3748} {"train_loss": -6.783815860748291, "global_step": 157443, "epoch": 3748} {"train_loss": -6.905604839324951, "global_step": 157444, "epoch": 3748} {"train_loss": -7.093202590942383, "global_step": 157445, "epoch": 3748} {"train_loss": -6.816167831420898, "global_step": 157446, "epoch": 3748} {"train_loss": -6.874899864196777, "global_step": 157447, "epoch": 3748} {"train_loss": -6.882798194885254, "global_step": 157448, "epoch": 3748} {"train_loss": -6.9305500984191895, "global_step": 157449, "epoch": 3748} {"train_loss": -6.938178062438965, "global_step": 157450, "epoch": 3748} {"train_loss": -7.088924407958984, "global_step": 157451, "epoch": 3748} {"train_loss": -6.9589362144470215, "global_step": 157452, "epoch": 3748} {"train_loss": -6.913589954376221, "global_step": 157453, "epoch": 3748} {"train_loss": -7.058308124542236, "global_step": 157454, "epoch": 3748} {"train_loss": -6.913968086242676, "global_step": 157455, "epoch": 3748} {"train_loss": -6.9020586013793945, "global_step": 157456, "epoch": 3748} {"train_loss": -6.854633581070673, "global_step": 157457, "epoch": 3748, "val_loss": 68478.8046875} {"train_loss": -7.043763160705566, "global_step": 157458, "epoch": 3749} {"train_loss": -6.923886299133301, "global_step": 157459, "epoch": 3749} {"train_loss": -6.881547927856445, "global_step": 157460, "epoch": 3749} {"train_loss": -6.930580139160156, "global_step": 157461, "epoch": 3749} {"train_loss": -6.866639137268066, "global_step": 157462, "epoch": 3749} {"train_loss": -6.955063819885254, "global_step": 157463, "epoch": 3749} {"train_loss": -6.9011712074279785, "global_step": 157464, "epoch": 3749} {"train_loss": -6.946045398712158, "global_step": 157465, "epoch": 3749} {"train_loss": -7.025010108947754, "global_step": 157466, "epoch": 3749} {"train_loss": -6.934303283691406, "global_step": 157467, "epoch": 3749} {"train_loss": -6.918001651763916, "global_step": 157468, "epoch": 3749} {"train_loss": -6.842512607574463, "global_step": 157469, "epoch": 3749} {"train_loss": -7.0484819412231445, "global_step": 157470, "epoch": 3749} {"train_loss": -6.934331893920898, "global_step": 157471, "epoch": 3749} {"train_loss": -6.835491180419922, "global_step": 157472, "epoch": 3749} {"train_loss": -6.89394474029541, "global_step": 157473, "epoch": 3749} {"train_loss": -6.9744038581848145, "global_step": 157474, "epoch": 3749} {"train_loss": -6.932960510253906, "global_step": 157475, "epoch": 3749} {"train_loss": -6.765701770782471, "global_step": 157476, "epoch": 3749} {"train_loss": -6.955214500427246, "global_step": 157477, "epoch": 3749} {"train_loss": -6.894657135009766, "global_step": 157478, "epoch": 3749} {"train_loss": -6.911154747009277, "global_step": 157479, "epoch": 3749} {"train_loss": -6.851222991943359, "global_step": 157480, "epoch": 3749} {"train_loss": -6.884055137634277, "global_step": 157481, "epoch": 3749} {"train_loss": -6.911485195159912, "global_step": 157482, "epoch": 3749} {"train_loss": -6.879092216491699, "global_step": 157483, "epoch": 3749} {"train_loss": -6.871593952178955, "global_step": 157484, "epoch": 3749} {"train_loss": -6.746777057647705, "global_step": 157485, "epoch": 3749} {"train_loss": -6.881425857543945, "global_step": 157486, "epoch": 3749} {"train_loss": -6.797351837158203, "global_step": 157487, "epoch": 3749} {"train_loss": -6.886528491973877, "global_step": 157488, "epoch": 3749} {"train_loss": -6.827991962432861, "global_step": 157489, "epoch": 3749} {"train_loss": -6.938279628753662, "global_step": 157490, "epoch": 3749} {"train_loss": -6.906503677368164, "global_step": 157491, "epoch": 3749} {"train_loss": -6.84566593170166, "global_step": 157492, "epoch": 3749} {"train_loss": -6.800661563873291, "global_step": 157493, "epoch": 3749} {"train_loss": -6.805548667907715, "global_step": 157494, "epoch": 3749} {"train_loss": -6.829418182373047, "global_step": 157495, "epoch": 3749} {"train_loss": -6.835896015167236, "global_step": 157496, "epoch": 3749} {"train_loss": -6.902047157287598, "global_step": 157497, "epoch": 3749} {"train_loss": -6.817587852478027, "global_step": 157498, "epoch": 3749} {"train_loss": -6.885445935385568, "global_step": 157499, "epoch": 3749, "val_loss": 68643.484375} {"train_loss": -6.949810028076172, "global_step": 157500, "epoch": 3750} {"train_loss": -6.888339042663574, "global_step": 157501, "epoch": 3750} {"train_loss": -6.7981486320495605, "global_step": 157502, "epoch": 3750} {"train_loss": -6.817509651184082, "global_step": 157503, "epoch": 3750} {"train_loss": -6.780263900756836, "global_step": 157504, "epoch": 3750} {"train_loss": -6.893119812011719, "global_step": 157505, "epoch": 3750} {"train_loss": -6.892494201660156, "global_step": 157506, "epoch": 3750} {"train_loss": -6.701955795288086, "global_step": 157507, "epoch": 3750} {"train_loss": -6.8200483322143555, "global_step": 157508, "epoch": 3750} {"train_loss": -6.835605621337891, "global_step": 157509, "epoch": 3750} {"train_loss": -6.909817695617676, "global_step": 157510, "epoch": 3750} {"train_loss": -6.987130641937256, "global_step": 157511, "epoch": 3750} {"train_loss": -6.8588361740112305, "global_step": 157512, "epoch": 3750} {"train_loss": -6.881200790405273, "global_step": 157513, "epoch": 3750} {"train_loss": -6.914589881896973, "global_step": 157514, "epoch": 3750} {"train_loss": -6.877920150756836, "global_step": 157515, "epoch": 3750} {"train_loss": -6.911269187927246, "global_step": 157516, "epoch": 3750} {"train_loss": -6.739342212677002, "global_step": 157517, "epoch": 3750} {"train_loss": -6.900142669677734, "global_step": 157518, "epoch": 3750} {"train_loss": -6.851840972900391, "global_step": 157519, "epoch": 3750} {"train_loss": -6.776248931884766, "global_step": 157520, "epoch": 3750} {"train_loss": -6.854351043701172, "global_step": 157521, "epoch": 3750} {"train_loss": -6.917614459991455, "global_step": 157522, "epoch": 3750} {"train_loss": -6.825440406799316, "global_step": 157523, "epoch": 3750} {"train_loss": -6.852402210235596, "global_step": 157524, "epoch": 3750} {"train_loss": -6.9603986740112305, "global_step": 157525, "epoch": 3750} {"train_loss": -6.933529853820801, "global_step": 157526, "epoch": 3750} {"train_loss": -6.975673198699951, "global_step": 157527, "epoch": 3750} {"train_loss": -6.858705520629883, "global_step": 157528, "epoch": 3750} {"train_loss": -6.8984832763671875, "global_step": 157529, "epoch": 3750} {"train_loss": -6.879975318908691, "global_step": 157530, "epoch": 3750} {"train_loss": -6.759088516235352, "global_step": 157531, "epoch": 3750} {"train_loss": -6.873722553253174, "global_step": 157532, "epoch": 3750} {"train_loss": -6.960038661956787, "global_step": 157533, "epoch": 3750} {"train_loss": -6.838863849639893, "global_step": 157534, "epoch": 3750} {"train_loss": -6.870964527130127, "global_step": 157535, "epoch": 3750} {"train_loss": -6.9769978523254395, "global_step": 157536, "epoch": 3750} {"train_loss": -6.77417516708374, "global_step": 157537, "epoch": 3750} {"train_loss": -6.933804035186768, "global_step": 157538, "epoch": 3750} {"train_loss": -6.812868118286133, "global_step": 157539, "epoch": 3750} {"train_loss": -6.83740234375, "global_step": 157540, "epoch": 3750} {"train_loss": -6.868191060565767, "global_step": 157541, "epoch": 3750, "train/sim_max_reward_0": 0.21590223085184082, "train/sim_max_reward_1": 0.9851855657124748, "train/sim_max_reward_2": 0.7725217244533126, "train/sim_max_reward_3": 0.7253991801770164, "train/sim_max_reward_4": 0.407996381368649, "train/sim_max_reward_5": 0.9033240456479908, "test/sim_max_reward_4400000": 0.15573472354107104, "test/sim_max_reward_4400001": 0.4377118185316913, "test/sim_max_reward_4400002": 0.29474880343382903, "test/sim_max_reward_4400003": 0.9774151816405651, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.4021761610523471, "test/sim_max_reward_4400006": 0.18784054671645165, "test/sim_max_reward_4400007": 0.932590022339957, "test/sim_max_reward_4400008": 0.29820835731578416, "test/sim_max_reward_4400009": 0.8185525731225008, "test/sim_max_reward_4400010": 0.25810201905464636, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9735538819906742, "test/sim_max_reward_4400013": 0.9552233764831518, "test/sim_max_reward_4400014": 0.9544238745519823, "test/sim_max_reward_4400015": 0.051554220488333295, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.23293271033104598, "test/sim_max_reward_4400019": 0.622864269738474, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.36776425879621627, "test/sim_max_reward_4400022": 0.30168045377979336, "test/sim_max_reward_4400023": 0.8912851347056984, "test/sim_max_reward_4400024": 0.867139903255295, "test/sim_max_reward_4400025": 0.261726344069384, "test/sim_max_reward_4400026": 0.7234635622350859, "test/sim_max_reward_4400027": 0.002296095239057295, "test/sim_max_reward_4400028": 0.4528445242260667, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.8912481421421431, "test/sim_max_reward_4400031": 0.9868450090052422, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.995695649642964, "test/sim_max_reward_4400034": 0.9734465298960244, "test/sim_max_reward_4400035": 0.6916867419383717, "test/sim_max_reward_4400036": 0.40534452002616705, "test/sim_max_reward_4400037": 0.9760682591761424, "test/sim_max_reward_4400038": 0.8810121911543951, "test/sim_max_reward_4400039": 0.8615614090989583, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9874990822587557, "test/sim_max_reward_4400042": 0.9645745787209054, "test/sim_max_reward_4400043": 0.9787337780681304, "test/sim_max_reward_4400044": 0.9305798645045673, "test/sim_max_reward_4400045": 0.9751871467042428, "test/sim_max_reward_4400046": 0.9917988606536755, "test/sim_max_reward_4400047": 0.965886189783508, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8637018240499141, "train/mean_score": 0.6683881880352142, "test/mean_score": 0.5597363079768081, "val_loss": 68535.7578125} {"train_loss": -6.7791337966918945, "global_step": 157542, "epoch": 3751} {"train_loss": -6.94696044921875, "global_step": 157543, "epoch": 3751} {"train_loss": -6.872159957885742, "global_step": 157544, "epoch": 3751} {"train_loss": -6.931035995483398, "global_step": 157545, "epoch": 3751} {"train_loss": -6.8527984619140625, "global_step": 157546, "epoch": 3751} {"train_loss": -6.798508167266846, "global_step": 157547, "epoch": 3751} {"train_loss": -6.907797813415527, "global_step": 157548, "epoch": 3751} {"train_loss": -6.775351524353027, "global_step": 157549, "epoch": 3751} {"train_loss": -6.9641242027282715, "global_step": 157550, "epoch": 3751} {"train_loss": -6.859173774719238, "global_step": 157551, "epoch": 3751} {"train_loss": -6.922138690948486, "global_step": 157552, "epoch": 3751} {"train_loss": -6.861687660217285, "global_step": 157553, "epoch": 3751} {"train_loss": -6.96785831451416, "global_step": 157554, "epoch": 3751} {"train_loss": -6.946162700653076, "global_step": 157555, "epoch": 3751} {"train_loss": -6.88687801361084, "global_step": 157556, "epoch": 3751} {"train_loss": -6.836541175842285, "global_step": 157557, "epoch": 3751} {"train_loss": -6.859021186828613, "global_step": 157558, "epoch": 3751} {"train_loss": -6.863377571105957, "global_step": 157559, "epoch": 3751} {"train_loss": -6.992315769195557, "global_step": 157560, "epoch": 3751} {"train_loss": -6.793784141540527, "global_step": 157561, "epoch": 3751} {"train_loss": -6.832196235656738, "global_step": 157562, "epoch": 3751} {"train_loss": -6.879012107849121, "global_step": 157563, "epoch": 3751} {"train_loss": -6.744367599487305, "global_step": 157564, "epoch": 3751} {"train_loss": -6.755937099456787, "global_step": 157565, "epoch": 3751} {"train_loss": -6.868759632110596, "global_step": 157566, "epoch": 3751} {"train_loss": -6.817103385925293, "global_step": 157567, "epoch": 3751} {"train_loss": -6.7835469245910645, "global_step": 157568, "epoch": 3751} {"train_loss": -6.733421325683594, "global_step": 157569, "epoch": 3751} {"train_loss": -6.929993629455566, "global_step": 157570, "epoch": 3751} {"train_loss": -6.713312149047852, "global_step": 157571, "epoch": 3751} {"train_loss": -6.774386882781982, "global_step": 157572, "epoch": 3751} {"train_loss": -6.9024739265441895, "global_step": 157573, "epoch": 3751} {"train_loss": -6.713878631591797, "global_step": 157574, "epoch": 3751} {"train_loss": -6.795594692230225, "global_step": 157575, "epoch": 3751} {"train_loss": -6.750164031982422, "global_step": 157576, "epoch": 3751} {"train_loss": -6.821952819824219, "global_step": 157577, "epoch": 3751} {"train_loss": -6.792667388916016, "global_step": 157578, "epoch": 3751} {"train_loss": -6.780636787414551, "global_step": 157579, "epoch": 3751} {"train_loss": -6.985918998718262, "global_step": 157580, "epoch": 3751} {"train_loss": -6.863596439361572, "global_step": 157581, "epoch": 3751} {"train_loss": -6.780969142913818, "global_step": 157582, "epoch": 3751} {"train_loss": -6.844499701545352, "global_step": 157583, "epoch": 3751, "val_loss": 68612.4609375} {"train_loss": -6.983943939208984, "global_step": 157584, "epoch": 3752} {"train_loss": -6.871851444244385, "global_step": 157585, "epoch": 3752} {"train_loss": -6.846906661987305, "global_step": 157586, "epoch": 3752} {"train_loss": -6.795851230621338, "global_step": 157587, "epoch": 3752} {"train_loss": -6.948708534240723, "global_step": 157588, "epoch": 3752} {"train_loss": -6.796759128570557, "global_step": 157589, "epoch": 3752} {"train_loss": -6.820481300354004, "global_step": 157590, "epoch": 3752} {"train_loss": -6.929600715637207, "global_step": 157591, "epoch": 3752} {"train_loss": -6.963222503662109, "global_step": 157592, "epoch": 3752} {"train_loss": -6.775109767913818, "global_step": 157593, "epoch": 3752} {"train_loss": -6.942233085632324, "global_step": 157594, "epoch": 3752} {"train_loss": -6.894288539886475, "global_step": 157595, "epoch": 3752} {"train_loss": -6.833568096160889, "global_step": 157596, "epoch": 3752} {"train_loss": -6.91696834564209, "global_step": 157597, "epoch": 3752} {"train_loss": -6.8463029861450195, "global_step": 157598, "epoch": 3752} {"train_loss": -6.801349639892578, "global_step": 157599, "epoch": 3752} {"train_loss": -6.8482561111450195, "global_step": 157600, "epoch": 3752} {"train_loss": -6.828399181365967, "global_step": 157601, "epoch": 3752} {"train_loss": -6.79067850112915, "global_step": 157602, "epoch": 3752} {"train_loss": -6.940370082855225, "global_step": 157603, "epoch": 3752} {"train_loss": -6.784715175628662, "global_step": 157604, "epoch": 3752} {"train_loss": -6.948820114135742, "global_step": 157605, "epoch": 3752} {"train_loss": -6.826250076293945, "global_step": 157606, "epoch": 3752} {"train_loss": -6.970832824707031, "global_step": 157607, "epoch": 3752} {"train_loss": -6.950713157653809, "global_step": 157608, "epoch": 3752} {"train_loss": -6.7991790771484375, "global_step": 157609, "epoch": 3752} {"train_loss": -6.923525810241699, "global_step": 157610, "epoch": 3752} {"train_loss": -6.848233222961426, "global_step": 157611, "epoch": 3752} {"train_loss": -6.961061477661133, "global_step": 157612, "epoch": 3752} {"train_loss": -6.737417697906494, "global_step": 157613, "epoch": 3752} {"train_loss": -6.834269046783447, "global_step": 157614, "epoch": 3752} {"train_loss": -6.892694473266602, "global_step": 157615, "epoch": 3752} {"train_loss": -6.874427318572998, "global_step": 157616, "epoch": 3752} {"train_loss": -6.963562965393066, "global_step": 157617, "epoch": 3752} {"train_loss": -6.851585388183594, "global_step": 157618, "epoch": 3752} {"train_loss": -6.871335029602051, "global_step": 157619, "epoch": 3752} {"train_loss": -7.035430431365967, "global_step": 157620, "epoch": 3752} {"train_loss": -6.920838356018066, "global_step": 157621, "epoch": 3752} {"train_loss": -6.851465225219727, "global_step": 157622, "epoch": 3752} {"train_loss": -6.9543046951293945, "global_step": 157623, "epoch": 3752} {"train_loss": -6.991950511932373, "global_step": 157624, "epoch": 3752} {"train_loss": -6.882015534809658, "global_step": 157625, "epoch": 3752, "val_loss": 68760.03125} {"train_loss": -6.79725456237793, "global_step": 157626, "epoch": 3753} {"train_loss": -6.980007648468018, "global_step": 157627, "epoch": 3753} {"train_loss": -6.965237617492676, "global_step": 157628, "epoch": 3753} {"train_loss": -6.771059036254883, "global_step": 157629, "epoch": 3753} {"train_loss": -6.938782215118408, "global_step": 157630, "epoch": 3753} {"train_loss": -6.783930778503418, "global_step": 157631, "epoch": 3753} {"train_loss": -6.969387054443359, "global_step": 157632, "epoch": 3753} {"train_loss": -6.86897087097168, "global_step": 157633, "epoch": 3753} {"train_loss": -6.999156951904297, "global_step": 157634, "epoch": 3753} {"train_loss": -6.916604042053223, "global_step": 157635, "epoch": 3753} {"train_loss": -6.792202949523926, "global_step": 157636, "epoch": 3753} {"train_loss": -6.852242469787598, "global_step": 157637, "epoch": 3753} {"train_loss": -6.748141288757324, "global_step": 157638, "epoch": 3753} {"train_loss": -6.738409519195557, "global_step": 157639, "epoch": 3753} {"train_loss": -6.821682929992676, "global_step": 157640, "epoch": 3753} {"train_loss": -6.85343074798584, "global_step": 157641, "epoch": 3753} {"train_loss": -6.783860683441162, "global_step": 157642, "epoch": 3753} {"train_loss": -6.8703765869140625, "global_step": 157643, "epoch": 3753} {"train_loss": -6.8756561279296875, "global_step": 157644, "epoch": 3753} {"train_loss": -6.848972797393799, "global_step": 157645, "epoch": 3753} {"train_loss": -6.852733135223389, "global_step": 157646, "epoch": 3753} {"train_loss": -6.831027984619141, "global_step": 157647, "epoch": 3753} {"train_loss": -6.854043960571289, "global_step": 157648, "epoch": 3753} {"train_loss": -6.966475486755371, "global_step": 157649, "epoch": 3753} {"train_loss": -6.915999412536621, "global_step": 157650, "epoch": 3753} {"train_loss": -6.800909042358398, "global_step": 157651, "epoch": 3753} {"train_loss": -6.831855773925781, "global_step": 157652, "epoch": 3753} {"train_loss": -6.91162109375, "global_step": 157653, "epoch": 3753} {"train_loss": -6.831254959106445, "global_step": 157654, "epoch": 3753} {"train_loss": -6.841708660125732, "global_step": 157655, "epoch": 3753} {"train_loss": -6.858065605163574, "global_step": 157656, "epoch": 3753} {"train_loss": -6.867927074432373, "global_step": 157657, "epoch": 3753} {"train_loss": -6.852086067199707, "global_step": 157658, "epoch": 3753} {"train_loss": -6.852828502655029, "global_step": 157659, "epoch": 3753} {"train_loss": -6.912787914276123, "global_step": 157660, "epoch": 3753} {"train_loss": -6.805915832519531, "global_step": 157661, "epoch": 3753} {"train_loss": -6.9615478515625, "global_step": 157662, "epoch": 3753} {"train_loss": -6.927314758300781, "global_step": 157663, "epoch": 3753} {"train_loss": -6.992901802062988, "global_step": 157664, "epoch": 3753} {"train_loss": -6.9422760009765625, "global_step": 157665, "epoch": 3753} {"train_loss": -6.89887809753418, "global_step": 157666, "epoch": 3753} {"train_loss": -6.8713071800413585, "global_step": 157667, "epoch": 3753, "val_loss": 68539.921875} {"train_loss": -6.979753494262695, "global_step": 157668, "epoch": 3754} {"train_loss": -6.903151512145996, "global_step": 157669, "epoch": 3754} {"train_loss": -6.936688423156738, "global_step": 157670, "epoch": 3754} {"train_loss": -6.880719184875488, "global_step": 157671, "epoch": 3754} {"train_loss": -6.976317405700684, "global_step": 157672, "epoch": 3754} {"train_loss": -6.8931050300598145, "global_step": 157673, "epoch": 3754} {"train_loss": -6.955087184906006, "global_step": 157674, "epoch": 3754} {"train_loss": -6.8898210525512695, "global_step": 157675, "epoch": 3754} {"train_loss": -6.941934585571289, "global_step": 157676, "epoch": 3754} {"train_loss": -6.85432243347168, "global_step": 157677, "epoch": 3754} {"train_loss": -6.990954399108887, "global_step": 157678, "epoch": 3754} {"train_loss": -6.861350059509277, "global_step": 157679, "epoch": 3754} {"train_loss": -6.890534400939941, "global_step": 157680, "epoch": 3754} {"train_loss": -6.744224548339844, "global_step": 157681, "epoch": 3754} {"train_loss": -6.919707775115967, "global_step": 157682, "epoch": 3754} {"train_loss": -6.927418231964111, "global_step": 157683, "epoch": 3754} {"train_loss": -6.774141788482666, "global_step": 157684, "epoch": 3754} {"train_loss": -6.838414192199707, "global_step": 157685, "epoch": 3754} {"train_loss": -6.838346004486084, "global_step": 157686, "epoch": 3754} {"train_loss": -6.708906173706055, "global_step": 157687, "epoch": 3754} {"train_loss": -6.8497772216796875, "global_step": 157688, "epoch": 3754} {"train_loss": -6.885079383850098, "global_step": 157689, "epoch": 3754} {"train_loss": -6.695928573608398, "global_step": 157690, "epoch": 3754} {"train_loss": -6.925075054168701, "global_step": 157691, "epoch": 3754} {"train_loss": -6.888765335083008, "global_step": 157692, "epoch": 3754} {"train_loss": -6.817214012145996, "global_step": 157693, "epoch": 3754} {"train_loss": -6.888162136077881, "global_step": 157694, "epoch": 3754} {"train_loss": -6.865426540374756, "global_step": 157695, "epoch": 3754} {"train_loss": -6.94926643371582, "global_step": 157696, "epoch": 3754} {"train_loss": -6.965083122253418, "global_step": 157697, "epoch": 3754} {"train_loss": -6.901019096374512, "global_step": 157698, "epoch": 3754} {"train_loss": -6.9235992431640625, "global_step": 157699, "epoch": 3754} {"train_loss": -6.8419189453125, "global_step": 157700, "epoch": 3754} {"train_loss": -6.900204658508301, "global_step": 157701, "epoch": 3754} {"train_loss": -6.862900733947754, "global_step": 157702, "epoch": 3754} {"train_loss": -6.886857032775879, "global_step": 157703, "epoch": 3754} {"train_loss": -6.972495079040527, "global_step": 157704, "epoch": 3754} {"train_loss": -6.914657115936279, "global_step": 157705, "epoch": 3754} {"train_loss": -6.87666130065918, "global_step": 157706, "epoch": 3754} {"train_loss": -6.93946647644043, "global_step": 157707, "epoch": 3754} {"train_loss": -6.9119977951049805, "global_step": 157708, "epoch": 3754} {"train_loss": -6.889877307982672, "global_step": 157709, "epoch": 3754, "val_loss": 68469.71875} {"train_loss": -6.943075180053711, "global_step": 157710, "epoch": 3755} {"train_loss": -6.895913124084473, "global_step": 157711, "epoch": 3755} {"train_loss": -7.058653831481934, "global_step": 157712, "epoch": 3755} {"train_loss": -6.8759870529174805, "global_step": 157713, "epoch": 3755} {"train_loss": -6.916808128356934, "global_step": 157714, "epoch": 3755} {"train_loss": -6.894792556762695, "global_step": 157715, "epoch": 3755} {"train_loss": -6.915881633758545, "global_step": 157716, "epoch": 3755} {"train_loss": -7.041662216186523, "global_step": 157717, "epoch": 3755} {"train_loss": -6.926433563232422, "global_step": 157718, "epoch": 3755} {"train_loss": -6.870424270629883, "global_step": 157719, "epoch": 3755} {"train_loss": -6.933219909667969, "global_step": 157720, "epoch": 3755} {"train_loss": -6.9487810134887695, "global_step": 157721, "epoch": 3755} {"train_loss": -6.9494218826293945, "global_step": 157722, "epoch": 3755} {"train_loss": -6.985254287719727, "global_step": 157723, "epoch": 3755} {"train_loss": -6.859663963317871, "global_step": 157724, "epoch": 3755} {"train_loss": -6.90572452545166, "global_step": 157725, "epoch": 3755} {"train_loss": -6.933835029602051, "global_step": 157726, "epoch": 3755} {"train_loss": -6.834188938140869, "global_step": 157727, "epoch": 3755} {"train_loss": -6.876011848449707, "global_step": 157728, "epoch": 3755} {"train_loss": -6.917914390563965, "global_step": 157729, "epoch": 3755} {"train_loss": -6.805909156799316, "global_step": 157730, "epoch": 3755} {"train_loss": -6.917210102081299, "global_step": 157731, "epoch": 3755} {"train_loss": -6.789407730102539, "global_step": 157732, "epoch": 3755} {"train_loss": -6.72990083694458, "global_step": 157733, "epoch": 3755} {"train_loss": -6.788446426391602, "global_step": 157734, "epoch": 3755} {"train_loss": -6.864670753479004, "global_step": 157735, "epoch": 3755} {"train_loss": -6.902228355407715, "global_step": 157736, "epoch": 3755} {"train_loss": -6.8542890548706055, "global_step": 157737, "epoch": 3755} {"train_loss": -6.927364349365234, "global_step": 157738, "epoch": 3755} {"train_loss": -6.8683037757873535, "global_step": 157739, "epoch": 3755} {"train_loss": -6.861490249633789, "global_step": 157740, "epoch": 3755} {"train_loss": -6.969918251037598, "global_step": 157741, "epoch": 3755} {"train_loss": -6.85028076171875, "global_step": 157742, "epoch": 3755} {"train_loss": -6.821938991546631, "global_step": 157743, "epoch": 3755} {"train_loss": -6.911395072937012, "global_step": 157744, "epoch": 3755} {"train_loss": -6.873041152954102, "global_step": 157745, "epoch": 3755} {"train_loss": -6.637880325317383, "global_step": 157746, "epoch": 3755} {"train_loss": -6.744062423706055, "global_step": 157747, "epoch": 3755} {"train_loss": -6.884500980377197, "global_step": 157748, "epoch": 3755} {"train_loss": -6.73679256439209, "global_step": 157749, "epoch": 3755} {"train_loss": -6.885281562805176, "global_step": 157750, "epoch": 3755} {"train_loss": -6.877171028228033, "global_step": 157751, "epoch": 3755, "val_loss": 68719.484375} {"train_loss": -6.761979579925537, "global_step": 157752, "epoch": 3756} {"train_loss": -6.799555778503418, "global_step": 157753, "epoch": 3756} {"train_loss": -6.596528053283691, "global_step": 157754, "epoch": 3756} {"train_loss": -6.924975395202637, "global_step": 157755, "epoch": 3756} {"train_loss": -6.888794898986816, "global_step": 157756, "epoch": 3756} {"train_loss": -6.669269561767578, "global_step": 157757, "epoch": 3756} {"train_loss": -6.838286399841309, "global_step": 157758, "epoch": 3756} {"train_loss": -6.6234636306762695, "global_step": 157759, "epoch": 3756} {"train_loss": -6.811140060424805, "global_step": 157760, "epoch": 3756} {"train_loss": -6.738765716552734, "global_step": 157761, "epoch": 3756} {"train_loss": -6.827942371368408, "global_step": 157762, "epoch": 3756} {"train_loss": -6.735295295715332, "global_step": 157763, "epoch": 3756} {"train_loss": -6.822251319885254, "global_step": 157764, "epoch": 3756} {"train_loss": -6.8306779861450195, "global_step": 157765, "epoch": 3756} {"train_loss": -6.872574329376221, "global_step": 157766, "epoch": 3756} {"train_loss": -6.871919631958008, "global_step": 157767, "epoch": 3756} {"train_loss": -6.951705455780029, "global_step": 157768, "epoch": 3756} {"train_loss": -6.9333953857421875, "global_step": 157769, "epoch": 3756} {"train_loss": -6.869116306304932, "global_step": 157770, "epoch": 3756} {"train_loss": -6.887945652008057, "global_step": 157771, "epoch": 3756} {"train_loss": -6.93485164642334, "global_step": 157772, "epoch": 3756} {"train_loss": -6.970096588134766, "global_step": 157773, "epoch": 3756} {"train_loss": -6.932271957397461, "global_step": 157774, "epoch": 3756} {"train_loss": -6.862305641174316, "global_step": 157775, "epoch": 3756} {"train_loss": -6.922732830047607, "global_step": 157776, "epoch": 3756} {"train_loss": -6.814538955688477, "global_step": 157777, "epoch": 3756} {"train_loss": -6.8526811599731445, "global_step": 157778, "epoch": 3756} {"train_loss": -6.826360702514648, "global_step": 157779, "epoch": 3756} {"train_loss": -6.923131465911865, "global_step": 157780, "epoch": 3756} {"train_loss": -6.982009410858154, "global_step": 157781, "epoch": 3756} {"train_loss": -6.748258113861084, "global_step": 157782, "epoch": 3756} {"train_loss": -6.939586639404297, "global_step": 157783, "epoch": 3756} {"train_loss": -6.832232475280762, "global_step": 157784, "epoch": 3756} {"train_loss": -6.851312160491943, "global_step": 157785, "epoch": 3756} {"train_loss": -6.941192626953125, "global_step": 157786, "epoch": 3756} {"train_loss": -6.927623748779297, "global_step": 157787, "epoch": 3756} {"train_loss": -6.908356666564941, "global_step": 157788, "epoch": 3756} {"train_loss": -6.881556987762451, "global_step": 157789, "epoch": 3756} {"train_loss": -6.886553764343262, "global_step": 157790, "epoch": 3756} {"train_loss": -6.900278091430664, "global_step": 157791, "epoch": 3756} {"train_loss": -6.927268028259277, "global_step": 157792, "epoch": 3756} {"train_loss": -6.85732220468067, "global_step": 157793, "epoch": 3756, "val_loss": 68589.9609375} {"train_loss": -6.775838851928711, "global_step": 157794, "epoch": 3757} {"train_loss": -6.967155933380127, "global_step": 157795, "epoch": 3757} {"train_loss": -6.990781784057617, "global_step": 157796, "epoch": 3757} {"train_loss": -6.832633018493652, "global_step": 157797, "epoch": 3757} {"train_loss": -6.894967555999756, "global_step": 157798, "epoch": 3757} {"train_loss": -6.944625377655029, "global_step": 157799, "epoch": 3757} {"train_loss": -6.947292804718018, "global_step": 157800, "epoch": 3757} {"train_loss": -6.8695831298828125, "global_step": 157801, "epoch": 3757} {"train_loss": -6.955977439880371, "global_step": 157802, "epoch": 3757} {"train_loss": -6.912652492523193, "global_step": 157803, "epoch": 3757} {"train_loss": -6.945950508117676, "global_step": 157804, "epoch": 3757} {"train_loss": -6.870479106903076, "global_step": 157805, "epoch": 3757} {"train_loss": -6.9048991203308105, "global_step": 157806, "epoch": 3757} {"train_loss": -6.904318809509277, "global_step": 157807, "epoch": 3757} {"train_loss": -6.952888011932373, "global_step": 157808, "epoch": 3757} {"train_loss": -7.058588027954102, "global_step": 157809, "epoch": 3757} {"train_loss": -6.887432098388672, "global_step": 157810, "epoch": 3757} {"train_loss": -6.939776420593262, "global_step": 157811, "epoch": 3757} {"train_loss": -6.868826389312744, "global_step": 157812, "epoch": 3757} {"train_loss": -6.90512752532959, "global_step": 157813, "epoch": 3757} {"train_loss": -7.004594802856445, "global_step": 157814, "epoch": 3757} {"train_loss": -6.826003074645996, "global_step": 157815, "epoch": 3757} {"train_loss": -6.893044471740723, "global_step": 157816, "epoch": 3757} {"train_loss": -6.829280376434326, "global_step": 157817, "epoch": 3757} {"train_loss": -6.685685634613037, "global_step": 157818, "epoch": 3757} {"train_loss": -6.906212329864502, "global_step": 157819, "epoch": 3757} {"train_loss": -6.931417465209961, "global_step": 157820, "epoch": 3757} {"train_loss": -6.705338478088379, "global_step": 157821, "epoch": 3757} {"train_loss": -6.85099983215332, "global_step": 157822, "epoch": 3757} {"train_loss": -6.777041435241699, "global_step": 157823, "epoch": 3757} {"train_loss": -6.761418342590332, "global_step": 157824, "epoch": 3757} {"train_loss": -6.761399745941162, "global_step": 157825, "epoch": 3757} {"train_loss": -6.659479141235352, "global_step": 157826, "epoch": 3757} {"train_loss": -6.851142883300781, "global_step": 157827, "epoch": 3757} {"train_loss": -6.662097454071045, "global_step": 157828, "epoch": 3757} {"train_loss": -6.9163498878479, "global_step": 157829, "epoch": 3757} {"train_loss": -6.873857021331787, "global_step": 157830, "epoch": 3757} {"train_loss": -6.840496063232422, "global_step": 157831, "epoch": 3757} {"train_loss": -6.746776580810547, "global_step": 157832, "epoch": 3757} {"train_loss": -6.71634578704834, "global_step": 157833, "epoch": 3757} {"train_loss": -6.8314619064331055, "global_step": 157834, "epoch": 3757} {"train_loss": -6.8595988636925105, "global_step": 157835, "epoch": 3757, "val_loss": 68724.359375} {"train_loss": -6.740394115447998, "global_step": 157836, "epoch": 3758} {"train_loss": -6.88526725769043, "global_step": 157837, "epoch": 3758} {"train_loss": -6.786366939544678, "global_step": 157838, "epoch": 3758} {"train_loss": -6.845890522003174, "global_step": 157839, "epoch": 3758} {"train_loss": -6.889078140258789, "global_step": 157840, "epoch": 3758} {"train_loss": -6.897161960601807, "global_step": 157841, "epoch": 3758} {"train_loss": -6.893182754516602, "global_step": 157842, "epoch": 3758} {"train_loss": -6.855266094207764, "global_step": 157843, "epoch": 3758} {"train_loss": -6.840859889984131, "global_step": 157844, "epoch": 3758} {"train_loss": -6.823160171508789, "global_step": 157845, "epoch": 3758} {"train_loss": -6.928725242614746, "global_step": 157846, "epoch": 3758} {"train_loss": -6.907291889190674, "global_step": 157847, "epoch": 3758} {"train_loss": -6.891925811767578, "global_step": 157848, "epoch": 3758} {"train_loss": -6.898676872253418, "global_step": 157849, "epoch": 3758} {"train_loss": -6.895774841308594, "global_step": 157850, "epoch": 3758} {"train_loss": -6.903006076812744, "global_step": 157851, "epoch": 3758} {"train_loss": -6.988144874572754, "global_step": 157852, "epoch": 3758} {"train_loss": -6.860473155975342, "global_step": 157853, "epoch": 3758} {"train_loss": -6.878446102142334, "global_step": 157854, "epoch": 3758} {"train_loss": -6.903225898742676, "global_step": 157855, "epoch": 3758} {"train_loss": -6.857855796813965, "global_step": 157856, "epoch": 3758} {"train_loss": -6.92625617980957, "global_step": 157857, "epoch": 3758} {"train_loss": -6.8309526443481445, "global_step": 157858, "epoch": 3758} {"train_loss": -6.779604911804199, "global_step": 157859, "epoch": 3758} {"train_loss": -6.937967300415039, "global_step": 157860, "epoch": 3758} {"train_loss": -6.865619659423828, "global_step": 157861, "epoch": 3758} {"train_loss": -6.8905229568481445, "global_step": 157862, "epoch": 3758} {"train_loss": -6.955938339233398, "global_step": 157863, "epoch": 3758} {"train_loss": -6.7104902267456055, "global_step": 157864, "epoch": 3758} {"train_loss": -6.955042839050293, "global_step": 157865, "epoch": 3758} {"train_loss": -6.879523277282715, "global_step": 157866, "epoch": 3758} {"train_loss": -6.849324703216553, "global_step": 157867, "epoch": 3758} {"train_loss": -6.853024005889893, "global_step": 157868, "epoch": 3758} {"train_loss": -6.863724708557129, "global_step": 157869, "epoch": 3758} {"train_loss": -6.861868858337402, "global_step": 157870, "epoch": 3758} {"train_loss": -6.793184280395508, "global_step": 157871, "epoch": 3758} {"train_loss": -6.876993179321289, "global_step": 157872, "epoch": 3758} {"train_loss": -6.893490314483643, "global_step": 157873, "epoch": 3758} {"train_loss": -6.9178595542907715, "global_step": 157874, "epoch": 3758} {"train_loss": -6.933930397033691, "global_step": 157875, "epoch": 3758} {"train_loss": -6.891214847564697, "global_step": 157876, "epoch": 3758} {"train_loss": -6.874358790261405, "global_step": 157877, "epoch": 3758, "val_loss": 68467.3515625} {"train_loss": -6.754837512969971, "global_step": 157878, "epoch": 3759} {"train_loss": -6.916451454162598, "global_step": 157879, "epoch": 3759} {"train_loss": -6.939583778381348, "global_step": 157880, "epoch": 3759} {"train_loss": -6.781452178955078, "global_step": 157881, "epoch": 3759} {"train_loss": -6.854638576507568, "global_step": 157882, "epoch": 3759} {"train_loss": -6.8589935302734375, "global_step": 157883, "epoch": 3759} {"train_loss": -6.8658366203308105, "global_step": 157884, "epoch": 3759} {"train_loss": -6.835243225097656, "global_step": 157885, "epoch": 3759} {"train_loss": -6.906704425811768, "global_step": 157886, "epoch": 3759} {"train_loss": -6.979195594787598, "global_step": 157887, "epoch": 3759} {"train_loss": -6.946255683898926, "global_step": 157888, "epoch": 3759} {"train_loss": -7.061256408691406, "global_step": 157889, "epoch": 3759} {"train_loss": -6.834617614746094, "global_step": 157890, "epoch": 3759} {"train_loss": -6.884493827819824, "global_step": 157891, "epoch": 3759} {"train_loss": -6.897733211517334, "global_step": 157892, "epoch": 3759} {"train_loss": -6.990440368652344, "global_step": 157893, "epoch": 3759} {"train_loss": -6.929381847381592, "global_step": 157894, "epoch": 3759} {"train_loss": -6.8660430908203125, "global_step": 157895, "epoch": 3759} {"train_loss": -6.9574809074401855, "global_step": 157896, "epoch": 3759} {"train_loss": -6.985263824462891, "global_step": 157897, "epoch": 3759} {"train_loss": -6.96989107131958, "global_step": 157898, "epoch": 3759} {"train_loss": -6.93756628036499, "global_step": 157899, "epoch": 3759} {"train_loss": -6.937238693237305, "global_step": 157900, "epoch": 3759} {"train_loss": -6.966477394104004, "global_step": 157901, "epoch": 3759} {"train_loss": -7.009200096130371, "global_step": 157902, "epoch": 3759} {"train_loss": -7.003790855407715, "global_step": 157903, "epoch": 3759} {"train_loss": -6.884714603424072, "global_step": 157904, "epoch": 3759} {"train_loss": -6.87794303894043, "global_step": 157905, "epoch": 3759} {"train_loss": -6.9432573318481445, "global_step": 157906, "epoch": 3759} {"train_loss": -7.062115669250488, "global_step": 157907, "epoch": 3759} {"train_loss": -6.871530532836914, "global_step": 157908, "epoch": 3759} {"train_loss": -6.876513481140137, "global_step": 157909, "epoch": 3759} {"train_loss": -6.916012763977051, "global_step": 157910, "epoch": 3759} {"train_loss": -6.8143815994262695, "global_step": 157911, "epoch": 3759} {"train_loss": -6.904819011688232, "global_step": 157912, "epoch": 3759} {"train_loss": -6.863605499267578, "global_step": 157913, "epoch": 3759} {"train_loss": -6.945860862731934, "global_step": 157914, "epoch": 3759} {"train_loss": -6.9200005531311035, "global_step": 157915, "epoch": 3759} {"train_loss": -6.858443260192871, "global_step": 157916, "epoch": 3759} {"train_loss": -6.92843770980835, "global_step": 157917, "epoch": 3759} {"train_loss": -6.828874588012695, "global_step": 157918, "epoch": 3759} {"train_loss": -6.909132991518293, "global_step": 157919, "epoch": 3759, "val_loss": 68617.0625} {"train_loss": -6.873793601989746, "global_step": 157920, "epoch": 3760} {"train_loss": -6.9127326011657715, "global_step": 157921, "epoch": 3760} {"train_loss": -6.911472797393799, "global_step": 157922, "epoch": 3760} {"train_loss": -6.954214572906494, "global_step": 157923, "epoch": 3760} {"train_loss": -6.9109601974487305, "global_step": 157924, "epoch": 3760} {"train_loss": -6.907382011413574, "global_step": 157925, "epoch": 3760} {"train_loss": -6.950030326843262, "global_step": 157926, "epoch": 3760} {"train_loss": -6.830799102783203, "global_step": 157927, "epoch": 3760} {"train_loss": -7.022582054138184, "global_step": 157928, "epoch": 3760} {"train_loss": -6.836410999298096, "global_step": 157929, "epoch": 3760} {"train_loss": -6.940413951873779, "global_step": 157930, "epoch": 3760} {"train_loss": -6.712635040283203, "global_step": 157931, "epoch": 3760} {"train_loss": -6.915592670440674, "global_step": 157932, "epoch": 3760} {"train_loss": -7.025508880615234, "global_step": 157933, "epoch": 3760} {"train_loss": -6.935618877410889, "global_step": 157934, "epoch": 3760} {"train_loss": -6.835051536560059, "global_step": 157935, "epoch": 3760} {"train_loss": -6.9893293380737305, "global_step": 157936, "epoch": 3760} {"train_loss": -6.812849998474121, "global_step": 157937, "epoch": 3760} {"train_loss": -6.8518548011779785, "global_step": 157938, "epoch": 3760} {"train_loss": -6.924920082092285, "global_step": 157939, "epoch": 3760} {"train_loss": -6.83046817779541, "global_step": 157940, "epoch": 3760} {"train_loss": -6.890989780426025, "global_step": 157941, "epoch": 3760} {"train_loss": -6.862849712371826, "global_step": 157942, "epoch": 3760} {"train_loss": -6.9204559326171875, "global_step": 157943, "epoch": 3760} {"train_loss": -6.824156761169434, "global_step": 157944, "epoch": 3760} {"train_loss": -6.8967509269714355, "global_step": 157945, "epoch": 3760} {"train_loss": -6.822310447692871, "global_step": 157946, "epoch": 3760} {"train_loss": -6.746232986450195, "global_step": 157947, "epoch": 3760} {"train_loss": -6.931819915771484, "global_step": 157948, "epoch": 3760} {"train_loss": -6.947122097015381, "global_step": 157949, "epoch": 3760} {"train_loss": -6.831068992614746, "global_step": 157950, "epoch": 3760} {"train_loss": -6.861017227172852, "global_step": 157951, "epoch": 3760} {"train_loss": -6.847498893737793, "global_step": 157952, "epoch": 3760} {"train_loss": -6.738100051879883, "global_step": 157953, "epoch": 3760} {"train_loss": -6.8186140060424805, "global_step": 157954, "epoch": 3760} {"train_loss": -6.87277889251709, "global_step": 157955, "epoch": 3760} {"train_loss": -6.781217098236084, "global_step": 157956, "epoch": 3760} {"train_loss": -6.888514518737793, "global_step": 157957, "epoch": 3760} {"train_loss": -6.775099754333496, "global_step": 157958, "epoch": 3760} {"train_loss": -6.886753082275391, "global_step": 157959, "epoch": 3760} {"train_loss": -6.8434576988220215, "global_step": 157960, "epoch": 3760} {"train_loss": -6.8742729028066, "global_step": 157961, "epoch": 3760, "val_loss": 68697.6484375} {"train_loss": -6.884515285491943, "global_step": 157962, "epoch": 3761} {"train_loss": -6.7956461906433105, "global_step": 157963, "epoch": 3761} {"train_loss": -6.921873092651367, "global_step": 157964, "epoch": 3761} {"train_loss": -6.930535793304443, "global_step": 157965, "epoch": 3761} {"train_loss": -6.910687446594238, "global_step": 157966, "epoch": 3761} {"train_loss": -6.814429759979248, "global_step": 157967, "epoch": 3761} {"train_loss": -6.939942359924316, "global_step": 157968, "epoch": 3761} {"train_loss": -6.850354194641113, "global_step": 157969, "epoch": 3761} {"train_loss": -6.824734687805176, "global_step": 157970, "epoch": 3761} {"train_loss": -6.902463912963867, "global_step": 157971, "epoch": 3761} {"train_loss": -6.938586235046387, "global_step": 157972, "epoch": 3761} {"train_loss": -6.765616416931152, "global_step": 157973, "epoch": 3761} {"train_loss": -6.868807792663574, "global_step": 157974, "epoch": 3761} {"train_loss": -6.852717399597168, "global_step": 157975, "epoch": 3761} {"train_loss": -6.814370632171631, "global_step": 157976, "epoch": 3761} {"train_loss": -6.905925750732422, "global_step": 157977, "epoch": 3761} {"train_loss": -6.883617401123047, "global_step": 157978, "epoch": 3761} {"train_loss": -6.887594223022461, "global_step": 157979, "epoch": 3761} {"train_loss": -6.90925407409668, "global_step": 157980, "epoch": 3761} {"train_loss": -6.912021636962891, "global_step": 157981, "epoch": 3761} {"train_loss": -6.952419757843018, "global_step": 157982, "epoch": 3761} {"train_loss": -6.847405433654785, "global_step": 157983, "epoch": 3761} {"train_loss": -6.898059844970703, "global_step": 157984, "epoch": 3761} {"train_loss": -6.940607070922852, "global_step": 157985, "epoch": 3761} {"train_loss": -6.753647804260254, "global_step": 157986, "epoch": 3761} {"train_loss": -6.901608467102051, "global_step": 157987, "epoch": 3761} {"train_loss": -6.834019660949707, "global_step": 157988, "epoch": 3761} {"train_loss": -6.884676933288574, "global_step": 157989, "epoch": 3761} {"train_loss": -6.829346656799316, "global_step": 157990, "epoch": 3761} {"train_loss": -6.926105499267578, "global_step": 157991, "epoch": 3761} {"train_loss": -6.872952461242676, "global_step": 157992, "epoch": 3761} {"train_loss": -7.019352912902832, "global_step": 157993, "epoch": 3761} {"train_loss": -6.874330520629883, "global_step": 157994, "epoch": 3761} {"train_loss": -6.9295196533203125, "global_step": 157995, "epoch": 3761} {"train_loss": -6.978298187255859, "global_step": 157996, "epoch": 3761} {"train_loss": -6.887474536895752, "global_step": 157997, "epoch": 3761} {"train_loss": -6.803174018859863, "global_step": 157998, "epoch": 3761} {"train_loss": -6.886194705963135, "global_step": 157999, "epoch": 3761} {"train_loss": -6.826066970825195, "global_step": 158000, "epoch": 3761} {"train_loss": -6.866430282592773, "global_step": 158001, "epoch": 3761} {"train_loss": -6.856529712677002, "global_step": 158002, "epoch": 3761} {"train_loss": -6.879883698054722, "global_step": 158003, "epoch": 3761, "val_loss": 68689.2578125} {"train_loss": -6.904586315155029, "global_step": 158004, "epoch": 3762} {"train_loss": -6.946181774139404, "global_step": 158005, "epoch": 3762} {"train_loss": -6.77341890335083, "global_step": 158006, "epoch": 3762} {"train_loss": -6.945040702819824, "global_step": 158007, "epoch": 3762} {"train_loss": -7.017434597015381, "global_step": 158008, "epoch": 3762} {"train_loss": -6.952093124389648, "global_step": 158009, "epoch": 3762} {"train_loss": -6.750605583190918, "global_step": 158010, "epoch": 3762} {"train_loss": -6.926147937774658, "global_step": 158011, "epoch": 3762} {"train_loss": -6.8397369384765625, "global_step": 158012, "epoch": 3762} {"train_loss": -6.87254524230957, "global_step": 158013, "epoch": 3762} {"train_loss": -6.863503456115723, "global_step": 158014, "epoch": 3762} {"train_loss": -6.909049987792969, "global_step": 158015, "epoch": 3762} {"train_loss": -6.898852348327637, "global_step": 158016, "epoch": 3762} {"train_loss": -6.928507328033447, "global_step": 158017, "epoch": 3762} {"train_loss": -6.809852600097656, "global_step": 158018, "epoch": 3762} {"train_loss": -6.863151550292969, "global_step": 158019, "epoch": 3762} {"train_loss": -6.759613990783691, "global_step": 158020, "epoch": 3762} {"train_loss": -6.809764862060547, "global_step": 158021, "epoch": 3762} {"train_loss": -6.989038467407227, "global_step": 158022, "epoch": 3762} {"train_loss": -6.785159587860107, "global_step": 158023, "epoch": 3762} {"train_loss": -6.834695816040039, "global_step": 158024, "epoch": 3762} {"train_loss": -6.863855838775635, "global_step": 158025, "epoch": 3762} {"train_loss": -6.78544807434082, "global_step": 158026, "epoch": 3762} {"train_loss": -6.825697898864746, "global_step": 158027, "epoch": 3762} {"train_loss": -6.869443893432617, "global_step": 158028, "epoch": 3762} {"train_loss": -6.851805686950684, "global_step": 158029, "epoch": 3762} {"train_loss": -6.8232598304748535, "global_step": 158030, "epoch": 3762} {"train_loss": -6.897940635681152, "global_step": 158031, "epoch": 3762} {"train_loss": -6.839517593383789, "global_step": 158032, "epoch": 3762} {"train_loss": -6.966773986816406, "global_step": 158033, "epoch": 3762} {"train_loss": -6.873291015625, "global_step": 158034, "epoch": 3762} {"train_loss": -6.924072265625, "global_step": 158035, "epoch": 3762} {"train_loss": -6.981450080871582, "global_step": 158036, "epoch": 3762} {"train_loss": -6.845036506652832, "global_step": 158037, "epoch": 3762} {"train_loss": -6.820651054382324, "global_step": 158038, "epoch": 3762} {"train_loss": -6.922272205352783, "global_step": 158039, "epoch": 3762} {"train_loss": -7.08763313293457, "global_step": 158040, "epoch": 3762} {"train_loss": -6.788553237915039, "global_step": 158041, "epoch": 3762} {"train_loss": -6.836143493652344, "global_step": 158042, "epoch": 3762} {"train_loss": -6.924236297607422, "global_step": 158043, "epoch": 3762} {"train_loss": -6.677012920379639, "global_step": 158044, "epoch": 3762} {"train_loss": -6.87058374995277, "global_step": 158045, "epoch": 3762, "val_loss": 68429.96875} {"train_loss": -6.858201026916504, "global_step": 158046, "epoch": 3763} {"train_loss": -6.928433418273926, "global_step": 158047, "epoch": 3763} {"train_loss": -6.835850715637207, "global_step": 158048, "epoch": 3763} {"train_loss": -6.91424036026001, "global_step": 158049, "epoch": 3763} {"train_loss": -7.011747360229492, "global_step": 158050, "epoch": 3763} {"train_loss": -6.835041046142578, "global_step": 158051, "epoch": 3763} {"train_loss": -7.009032249450684, "global_step": 158052, "epoch": 3763} {"train_loss": -6.790913105010986, "global_step": 158053, "epoch": 3763} {"train_loss": -6.853759765625, "global_step": 158054, "epoch": 3763} {"train_loss": -6.877225875854492, "global_step": 158055, "epoch": 3763} {"train_loss": -6.711464881896973, "global_step": 158056, "epoch": 3763} {"train_loss": -6.951878070831299, "global_step": 158057, "epoch": 3763} {"train_loss": -6.872200012207031, "global_step": 158058, "epoch": 3763} {"train_loss": -6.8045334815979, "global_step": 158059, "epoch": 3763} {"train_loss": -6.994320392608643, "global_step": 158060, "epoch": 3763} {"train_loss": -6.851640224456787, "global_step": 158061, "epoch": 3763} {"train_loss": -6.923085689544678, "global_step": 158062, "epoch": 3763} {"train_loss": -6.97252893447876, "global_step": 158063, "epoch": 3763} {"train_loss": -6.931365966796875, "global_step": 158064, "epoch": 3763} {"train_loss": -6.926257610321045, "global_step": 158065, "epoch": 3763} {"train_loss": -6.9074482917785645, "global_step": 158066, "epoch": 3763} {"train_loss": -6.81284236907959, "global_step": 158067, "epoch": 3763} {"train_loss": -6.9489545822143555, "global_step": 158068, "epoch": 3763} {"train_loss": -6.886017322540283, "global_step": 158069, "epoch": 3763} {"train_loss": -6.9128241539001465, "global_step": 158070, "epoch": 3763} {"train_loss": -6.911748886108398, "global_step": 158071, "epoch": 3763} {"train_loss": -6.976849555969238, "global_step": 158072, "epoch": 3763} {"train_loss": -6.84577751159668, "global_step": 158073, "epoch": 3763} {"train_loss": -6.824005126953125, "global_step": 158074, "epoch": 3763} {"train_loss": -6.880399227142334, "global_step": 158075, "epoch": 3763} {"train_loss": -6.930812835693359, "global_step": 158076, "epoch": 3763} {"train_loss": -6.9454240798950195, "global_step": 158077, "epoch": 3763} {"train_loss": -6.905185699462891, "global_step": 158078, "epoch": 3763} {"train_loss": -6.768139839172363, "global_step": 158079, "epoch": 3763} {"train_loss": -6.7766432762146, "global_step": 158080, "epoch": 3763} {"train_loss": -6.802523612976074, "global_step": 158081, "epoch": 3763} {"train_loss": -6.897891044616699, "global_step": 158082, "epoch": 3763} {"train_loss": -6.7795586585998535, "global_step": 158083, "epoch": 3763} {"train_loss": -6.844935417175293, "global_step": 158084, "epoch": 3763} {"train_loss": -6.909167289733887, "global_step": 158085, "epoch": 3763} {"train_loss": -6.848813056945801, "global_step": 158086, "epoch": 3763} {"train_loss": -6.880161875770206, "global_step": 158087, "epoch": 3763, "val_loss": 68392.5078125} {"train_loss": -6.8103532791137695, "global_step": 158088, "epoch": 3764} {"train_loss": -6.902973175048828, "global_step": 158089, "epoch": 3764} {"train_loss": -6.765649795532227, "global_step": 158090, "epoch": 3764} {"train_loss": -6.915915489196777, "global_step": 158091, "epoch": 3764} {"train_loss": -7.054980754852295, "global_step": 158092, "epoch": 3764} {"train_loss": -6.866264343261719, "global_step": 158093, "epoch": 3764} {"train_loss": -6.919221878051758, "global_step": 158094, "epoch": 3764} {"train_loss": -6.901311874389648, "global_step": 158095, "epoch": 3764} {"train_loss": -6.8928070068359375, "global_step": 158096, "epoch": 3764} {"train_loss": -6.831790924072266, "global_step": 158097, "epoch": 3764} {"train_loss": -6.77048397064209, "global_step": 158098, "epoch": 3764} {"train_loss": -6.897820949554443, "global_step": 158099, "epoch": 3764} {"train_loss": -6.955913543701172, "global_step": 158100, "epoch": 3764} {"train_loss": -6.889216899871826, "global_step": 158101, "epoch": 3764} {"train_loss": -6.965747833251953, "global_step": 158102, "epoch": 3764} {"train_loss": -6.998673439025879, "global_step": 158103, "epoch": 3764} {"train_loss": -6.933664321899414, "global_step": 158104, "epoch": 3764} {"train_loss": -6.828736305236816, "global_step": 158105, "epoch": 3764} {"train_loss": -6.974359512329102, "global_step": 158106, "epoch": 3764} {"train_loss": -6.903131484985352, "global_step": 158107, "epoch": 3764} {"train_loss": -6.904338836669922, "global_step": 158108, "epoch": 3764} {"train_loss": -6.9301018714904785, "global_step": 158109, "epoch": 3764} {"train_loss": -6.9167561531066895, "global_step": 158110, "epoch": 3764} {"train_loss": -6.895170211791992, "global_step": 158111, "epoch": 3764} {"train_loss": -6.90369987487793, "global_step": 158112, "epoch": 3764} {"train_loss": -7.001951694488525, "global_step": 158113, "epoch": 3764} {"train_loss": -6.930064678192139, "global_step": 158114, "epoch": 3764} {"train_loss": -6.830358982086182, "global_step": 158115, "epoch": 3764} {"train_loss": -6.960088729858398, "global_step": 158116, "epoch": 3764} {"train_loss": -6.880069732666016, "global_step": 158117, "epoch": 3764} {"train_loss": -6.856743335723877, "global_step": 158118, "epoch": 3764} {"train_loss": -6.821961402893066, "global_step": 158119, "epoch": 3764} {"train_loss": -6.8523359298706055, "global_step": 158120, "epoch": 3764} {"train_loss": -6.838224411010742, "global_step": 158121, "epoch": 3764} {"train_loss": -6.8910722732543945, "global_step": 158122, "epoch": 3764} {"train_loss": -6.7750349044799805, "global_step": 158123, "epoch": 3764} {"train_loss": -6.88925313949585, "global_step": 158124, "epoch": 3764} {"train_loss": -6.790497779846191, "global_step": 158125, "epoch": 3764} {"train_loss": -6.680018424987793, "global_step": 158126, "epoch": 3764} {"train_loss": -6.793204307556152, "global_step": 158127, "epoch": 3764} {"train_loss": -6.910220623016357, "global_step": 158128, "epoch": 3764} {"train_loss": -6.881824731826782, "global_step": 158129, "epoch": 3764, "val_loss": 68756.03125} {"train_loss": -6.80927848815918, "global_step": 158130, "epoch": 3765} {"train_loss": -6.999996185302734, "global_step": 158131, "epoch": 3765} {"train_loss": -6.819069862365723, "global_step": 158132, "epoch": 3765} {"train_loss": -6.730674743652344, "global_step": 158133, "epoch": 3765} {"train_loss": -6.926879405975342, "global_step": 158134, "epoch": 3765} {"train_loss": -6.910945415496826, "global_step": 158135, "epoch": 3765} {"train_loss": -6.780736923217773, "global_step": 158136, "epoch": 3765} {"train_loss": -6.95449686050415, "global_step": 158137, "epoch": 3765} {"train_loss": -6.751115322113037, "global_step": 158138, "epoch": 3765} {"train_loss": -6.890073299407959, "global_step": 158139, "epoch": 3765} {"train_loss": -6.818548202514648, "global_step": 158140, "epoch": 3765} {"train_loss": -6.922801971435547, "global_step": 158141, "epoch": 3765} {"train_loss": -6.919623851776123, "global_step": 158142, "epoch": 3765} {"train_loss": -6.913311004638672, "global_step": 158143, "epoch": 3765} {"train_loss": -6.894083023071289, "global_step": 158144, "epoch": 3765} {"train_loss": -6.980591773986816, "global_step": 158145, "epoch": 3765} {"train_loss": -6.954225540161133, "global_step": 158146, "epoch": 3765} {"train_loss": -6.825860977172852, "global_step": 158147, "epoch": 3765} {"train_loss": -6.924604415893555, "global_step": 158148, "epoch": 3765} {"train_loss": -6.961312294006348, "global_step": 158149, "epoch": 3765} {"train_loss": -6.922511100769043, "global_step": 158150, "epoch": 3765} {"train_loss": -6.836485385894775, "global_step": 158151, "epoch": 3765} {"train_loss": -6.944784164428711, "global_step": 158152, "epoch": 3765} {"train_loss": -6.833987236022949, "global_step": 158153, "epoch": 3765} {"train_loss": -6.812869548797607, "global_step": 158154, "epoch": 3765} {"train_loss": -6.83622932434082, "global_step": 158155, "epoch": 3765} {"train_loss": -6.961216926574707, "global_step": 158156, "epoch": 3765} {"train_loss": -6.817438125610352, "global_step": 158157, "epoch": 3765} {"train_loss": -6.854842185974121, "global_step": 158158, "epoch": 3765} {"train_loss": -6.916416168212891, "global_step": 158159, "epoch": 3765} {"train_loss": -6.911169528961182, "global_step": 158160, "epoch": 3765} {"train_loss": -6.901390552520752, "global_step": 158161, "epoch": 3765} {"train_loss": -6.75874662399292, "global_step": 158162, "epoch": 3765} {"train_loss": -6.897547721862793, "global_step": 158163, "epoch": 3765} {"train_loss": -6.912124156951904, "global_step": 158164, "epoch": 3765} {"train_loss": -6.834524631500244, "global_step": 158165, "epoch": 3765} {"train_loss": -6.708658218383789, "global_step": 158166, "epoch": 3765} {"train_loss": -6.904143333435059, "global_step": 158167, "epoch": 3765} {"train_loss": -6.888956069946289, "global_step": 158168, "epoch": 3765} {"train_loss": -6.87785530090332, "global_step": 158169, "epoch": 3765} {"train_loss": -6.882315635681152, "global_step": 158170, "epoch": 3765} {"train_loss": -6.8739181359608965, "global_step": 158171, "epoch": 3765, "val_loss": 68715.21875} {"train_loss": -6.822988986968994, "global_step": 158172, "epoch": 3766} {"train_loss": -6.97342586517334, "global_step": 158173, "epoch": 3766} {"train_loss": -6.9436845779418945, "global_step": 158174, "epoch": 3766} {"train_loss": -6.770877838134766, "global_step": 158175, "epoch": 3766} {"train_loss": -6.869948387145996, "global_step": 158176, "epoch": 3766} {"train_loss": -6.867423057556152, "global_step": 158177, "epoch": 3766} {"train_loss": -6.893919944763184, "global_step": 158178, "epoch": 3766} {"train_loss": -6.824934005737305, "global_step": 158179, "epoch": 3766} {"train_loss": -6.798184394836426, "global_step": 158180, "epoch": 3766} {"train_loss": -6.8350324630737305, "global_step": 158181, "epoch": 3766} {"train_loss": -6.700114727020264, "global_step": 158182, "epoch": 3766} {"train_loss": -6.912747383117676, "global_step": 158183, "epoch": 3766} {"train_loss": -6.847264289855957, "global_step": 158184, "epoch": 3766} {"train_loss": -6.83270263671875, "global_step": 158185, "epoch": 3766} {"train_loss": -6.914422512054443, "global_step": 158186, "epoch": 3766} {"train_loss": -6.815281867980957, "global_step": 158187, "epoch": 3766} {"train_loss": -6.736128330230713, "global_step": 158188, "epoch": 3766} {"train_loss": -6.840057373046875, "global_step": 158189, "epoch": 3766} {"train_loss": -6.6742143630981445, "global_step": 158190, "epoch": 3766} {"train_loss": -6.658670425415039, "global_step": 158191, "epoch": 3766} {"train_loss": -6.7375335693359375, "global_step": 158192, "epoch": 3766} {"train_loss": -6.85792875289917, "global_step": 158193, "epoch": 3766} {"train_loss": -6.869101047515869, "global_step": 158194, "epoch": 3766} {"train_loss": -6.734362602233887, "global_step": 158195, "epoch": 3766} {"train_loss": -6.990370750427246, "global_step": 158196, "epoch": 3766} {"train_loss": -6.869724750518799, "global_step": 158197, "epoch": 3766} {"train_loss": -6.853507995605469, "global_step": 158198, "epoch": 3766} {"train_loss": -6.878759384155273, "global_step": 158199, "epoch": 3766} {"train_loss": -6.839910507202148, "global_step": 158200, "epoch": 3766} {"train_loss": -6.952349662780762, "global_step": 158201, "epoch": 3766} {"train_loss": -6.882325172424316, "global_step": 158202, "epoch": 3766} {"train_loss": -6.808626174926758, "global_step": 158203, "epoch": 3766} {"train_loss": -7.045348644256592, "global_step": 158204, "epoch": 3766} {"train_loss": -6.875137805938721, "global_step": 158205, "epoch": 3766} {"train_loss": -7.002457618713379, "global_step": 158206, "epoch": 3766} {"train_loss": -7.008224010467529, "global_step": 158207, "epoch": 3766} {"train_loss": -6.919367790222168, "global_step": 158208, "epoch": 3766} {"train_loss": -6.96876335144043, "global_step": 158209, "epoch": 3766} {"train_loss": -6.9217987060546875, "global_step": 158210, "epoch": 3766} {"train_loss": -6.782521724700928, "global_step": 158211, "epoch": 3766} {"train_loss": -6.871172904968262, "global_step": 158212, "epoch": 3766} {"train_loss": -6.859354223523821, "global_step": 158213, "epoch": 3766, "val_loss": 68710.8359375} {"train_loss": -6.679706573486328, "global_step": 158214, "epoch": 3767} {"train_loss": -6.869936943054199, "global_step": 158215, "epoch": 3767} {"train_loss": -6.890890598297119, "global_step": 158216, "epoch": 3767} {"train_loss": -6.806401252746582, "global_step": 158217, "epoch": 3767} {"train_loss": -7.071124076843262, "global_step": 158218, "epoch": 3767} {"train_loss": -6.853418350219727, "global_step": 158219, "epoch": 3767} {"train_loss": -6.887009143829346, "global_step": 158220, "epoch": 3767} {"train_loss": -6.945509433746338, "global_step": 158221, "epoch": 3767} {"train_loss": -6.905135154724121, "global_step": 158222, "epoch": 3767} {"train_loss": -6.908868789672852, "global_step": 158223, "epoch": 3767} {"train_loss": -6.935451507568359, "global_step": 158224, "epoch": 3767} {"train_loss": -6.809686660766602, "global_step": 158225, "epoch": 3767} {"train_loss": -6.870838165283203, "global_step": 158226, "epoch": 3767} {"train_loss": -6.816715240478516, "global_step": 158227, "epoch": 3767} {"train_loss": -6.872933387756348, "global_step": 158228, "epoch": 3767} {"train_loss": -6.954046249389648, "global_step": 158229, "epoch": 3767} {"train_loss": -6.9048566818237305, "global_step": 158230, "epoch": 3767} {"train_loss": -6.848527908325195, "global_step": 158231, "epoch": 3767} {"train_loss": -6.919034004211426, "global_step": 158232, "epoch": 3767} {"train_loss": -6.83338737487793, "global_step": 158233, "epoch": 3767} {"train_loss": -6.9405107498168945, "global_step": 158234, "epoch": 3767} {"train_loss": -7.008388519287109, "global_step": 158235, "epoch": 3767} {"train_loss": -6.889928340911865, "global_step": 158236, "epoch": 3767} {"train_loss": -6.987703800201416, "global_step": 158237, "epoch": 3767} {"train_loss": -6.9508056640625, "global_step": 158238, "epoch": 3767} {"train_loss": -6.884999752044678, "global_step": 158239, "epoch": 3767} {"train_loss": -6.981888294219971, "global_step": 158240, "epoch": 3767} {"train_loss": -6.96691370010376, "global_step": 158241, "epoch": 3767} {"train_loss": -6.834798812866211, "global_step": 158242, "epoch": 3767} {"train_loss": -7.036469459533691, "global_step": 158243, "epoch": 3767} {"train_loss": -6.941878795623779, "global_step": 158244, "epoch": 3767} {"train_loss": -6.7978010177612305, "global_step": 158245, "epoch": 3767} {"train_loss": -6.8282928466796875, "global_step": 158246, "epoch": 3767} {"train_loss": -6.911335468292236, "global_step": 158247, "epoch": 3767} {"train_loss": -6.957644462585449, "global_step": 158248, "epoch": 3767} {"train_loss": -6.87281608581543, "global_step": 158249, "epoch": 3767} {"train_loss": -6.8010101318359375, "global_step": 158250, "epoch": 3767} {"train_loss": -6.8801469802856445, "global_step": 158251, "epoch": 3767} {"train_loss": -6.819417953491211, "global_step": 158252, "epoch": 3767} {"train_loss": -6.8736701011657715, "global_step": 158253, "epoch": 3767} {"train_loss": -6.7661848068237305, "global_step": 158254, "epoch": 3767} {"train_loss": -6.8863739513215565, "global_step": 158255, "epoch": 3767, "val_loss": 68603.0390625} {"train_loss": -7.007410049438477, "global_step": 158256, "epoch": 3768} {"train_loss": -6.86574649810791, "global_step": 158257, "epoch": 3768} {"train_loss": -6.856995105743408, "global_step": 158258, "epoch": 3768} {"train_loss": -6.921685218811035, "global_step": 158259, "epoch": 3768} {"train_loss": -6.878041744232178, "global_step": 158260, "epoch": 3768} {"train_loss": -6.796087265014648, "global_step": 158261, "epoch": 3768} {"train_loss": -6.90037727355957, "global_step": 158262, "epoch": 3768} {"train_loss": -6.813899993896484, "global_step": 158263, "epoch": 3768} {"train_loss": -6.8304643630981445, "global_step": 158264, "epoch": 3768} {"train_loss": -6.925106048583984, "global_step": 158265, "epoch": 3768} {"train_loss": -6.905416488647461, "global_step": 158266, "epoch": 3768} {"train_loss": -6.844354152679443, "global_step": 158267, "epoch": 3768} {"train_loss": -6.916586875915527, "global_step": 158268, "epoch": 3768} {"train_loss": -6.80036735534668, "global_step": 158269, "epoch": 3768} {"train_loss": -6.7850236892700195, "global_step": 158270, "epoch": 3768} {"train_loss": -6.892635345458984, "global_step": 158271, "epoch": 3768} {"train_loss": -6.729035377502441, "global_step": 158272, "epoch": 3768} {"train_loss": -6.955459117889404, "global_step": 158273, "epoch": 3768} {"train_loss": -6.667881965637207, "global_step": 158274, "epoch": 3768} {"train_loss": -6.881901741027832, "global_step": 158275, "epoch": 3768} {"train_loss": -6.817885875701904, "global_step": 158276, "epoch": 3768} {"train_loss": -6.882569789886475, "global_step": 158277, "epoch": 3768} {"train_loss": -6.938163757324219, "global_step": 158278, "epoch": 3768} {"train_loss": -6.765003204345703, "global_step": 158279, "epoch": 3768} {"train_loss": -6.8323774337768555, "global_step": 158280, "epoch": 3768} {"train_loss": -6.923986434936523, "global_step": 158281, "epoch": 3768} {"train_loss": -6.873589515686035, "global_step": 158282, "epoch": 3768} {"train_loss": -6.890837669372559, "global_step": 158283, "epoch": 3768} {"train_loss": -6.976815223693848, "global_step": 158284, "epoch": 3768} {"train_loss": -6.888972282409668, "global_step": 158285, "epoch": 3768} {"train_loss": -6.899484157562256, "global_step": 158286, "epoch": 3768} {"train_loss": -6.8231916427612305, "global_step": 158287, "epoch": 3768} {"train_loss": -6.83586311340332, "global_step": 158288, "epoch": 3768} {"train_loss": -6.759652137756348, "global_step": 158289, "epoch": 3768} {"train_loss": -6.841307640075684, "global_step": 158290, "epoch": 3768} {"train_loss": -6.870439529418945, "global_step": 158291, "epoch": 3768} {"train_loss": -6.836206436157227, "global_step": 158292, "epoch": 3768} {"train_loss": -6.933548927307129, "global_step": 158293, "epoch": 3768} {"train_loss": -6.846464157104492, "global_step": 158294, "epoch": 3768} {"train_loss": -6.966141700744629, "global_step": 158295, "epoch": 3768} {"train_loss": -6.916977405548096, "global_step": 158296, "epoch": 3768} {"train_loss": -6.864593176614671, "global_step": 158297, "epoch": 3768, "val_loss": 68370.109375} {"train_loss": -6.984969139099121, "global_step": 158298, "epoch": 3769} {"train_loss": -6.933704376220703, "global_step": 158299, "epoch": 3769} {"train_loss": -6.975915908813477, "global_step": 158300, "epoch": 3769} {"train_loss": -6.8838887214660645, "global_step": 158301, "epoch": 3769} {"train_loss": -6.781126022338867, "global_step": 158302, "epoch": 3769} {"train_loss": -6.815547943115234, "global_step": 158303, "epoch": 3769} {"train_loss": -6.733329772949219, "global_step": 158304, "epoch": 3769} {"train_loss": -6.814871788024902, "global_step": 158305, "epoch": 3769} {"train_loss": -6.819149017333984, "global_step": 158306, "epoch": 3769} {"train_loss": -6.626977920532227, "global_step": 158307, "epoch": 3769} {"train_loss": -6.838069915771484, "global_step": 158308, "epoch": 3769} {"train_loss": -6.722015857696533, "global_step": 158309, "epoch": 3769} {"train_loss": -6.90257453918457, "global_step": 158310, "epoch": 3769} {"train_loss": -6.817807197570801, "global_step": 158311, "epoch": 3769} {"train_loss": -6.721379280090332, "global_step": 158312, "epoch": 3769} {"train_loss": -6.731834411621094, "global_step": 158313, "epoch": 3769} {"train_loss": -6.733818054199219, "global_step": 158314, "epoch": 3769} {"train_loss": -6.8079915046691895, "global_step": 158315, "epoch": 3769} {"train_loss": -6.866411209106445, "global_step": 158316, "epoch": 3769} {"train_loss": -6.82775354385376, "global_step": 158317, "epoch": 3769} {"train_loss": -6.733648300170898, "global_step": 158318, "epoch": 3769} {"train_loss": -6.728009223937988, "global_step": 158319, "epoch": 3769} {"train_loss": -6.7987470626831055, "global_step": 158320, "epoch": 3769} {"train_loss": -6.789420127868652, "global_step": 158321, "epoch": 3769} {"train_loss": -6.723695755004883, "global_step": 158322, "epoch": 3769} {"train_loss": -6.809913635253906, "global_step": 158323, "epoch": 3769} {"train_loss": -6.748601913452148, "global_step": 158324, "epoch": 3769} {"train_loss": -7.007630348205566, "global_step": 158325, "epoch": 3769} {"train_loss": -6.787222862243652, "global_step": 158326, "epoch": 3769} {"train_loss": -6.733546257019043, "global_step": 158327, "epoch": 3769} {"train_loss": -6.825443267822266, "global_step": 158328, "epoch": 3769} {"train_loss": -6.8544745445251465, "global_step": 158329, "epoch": 3769} {"train_loss": -6.854837894439697, "global_step": 158330, "epoch": 3769} {"train_loss": -6.882229328155518, "global_step": 158331, "epoch": 3769} {"train_loss": -6.758183479309082, "global_step": 158332, "epoch": 3769} {"train_loss": -6.791682243347168, "global_step": 158333, "epoch": 3769} {"train_loss": -6.925328254699707, "global_step": 158334, "epoch": 3769} {"train_loss": -6.7629241943359375, "global_step": 158335, "epoch": 3769} {"train_loss": -6.809946060180664, "global_step": 158336, "epoch": 3769} {"train_loss": -6.906398773193359, "global_step": 158337, "epoch": 3769} {"train_loss": -6.862742900848389, "global_step": 158338, "epoch": 3769} {"train_loss": -6.815556548890614, "global_step": 158339, "epoch": 3769, "val_loss": 68484.0625} {"train_loss": -6.896450996398926, "global_step": 158340, "epoch": 3770} {"train_loss": -6.968825340270996, "global_step": 158341, "epoch": 3770} {"train_loss": -6.930628776550293, "global_step": 158342, "epoch": 3770} {"train_loss": -6.820157051086426, "global_step": 158343, "epoch": 3770} {"train_loss": -7.0241570472717285, "global_step": 158344, "epoch": 3770} {"train_loss": -6.990726947784424, "global_step": 158345, "epoch": 3770} {"train_loss": -6.882335662841797, "global_step": 158346, "epoch": 3770} {"train_loss": -6.948155403137207, "global_step": 158347, "epoch": 3770} {"train_loss": -6.862215995788574, "global_step": 158348, "epoch": 3770} {"train_loss": -6.910076141357422, "global_step": 158349, "epoch": 3770} {"train_loss": -6.827376365661621, "global_step": 158350, "epoch": 3770} {"train_loss": -6.918328285217285, "global_step": 158351, "epoch": 3770} {"train_loss": -6.961230278015137, "global_step": 158352, "epoch": 3770} {"train_loss": -6.906886100769043, "global_step": 158353, "epoch": 3770} {"train_loss": -6.797787189483643, "global_step": 158354, "epoch": 3770} {"train_loss": -6.932553768157959, "global_step": 158355, "epoch": 3770} {"train_loss": -6.876224517822266, "global_step": 158356, "epoch": 3770} {"train_loss": -6.7616682052612305, "global_step": 158357, "epoch": 3770} {"train_loss": -7.013162612915039, "global_step": 158358, "epoch": 3770} {"train_loss": -6.921480178833008, "global_step": 158359, "epoch": 3770} {"train_loss": -6.721511363983154, "global_step": 158360, "epoch": 3770} {"train_loss": -6.8313164710998535, "global_step": 158361, "epoch": 3770} {"train_loss": -6.814510822296143, "global_step": 158362, "epoch": 3770} {"train_loss": -6.934469699859619, "global_step": 158363, "epoch": 3770} {"train_loss": -6.947391510009766, "global_step": 158364, "epoch": 3770} {"train_loss": -6.777352809906006, "global_step": 158365, "epoch": 3770} {"train_loss": -6.8661017417907715, "global_step": 158366, "epoch": 3770} {"train_loss": -6.834636688232422, "global_step": 158367, "epoch": 3770} {"train_loss": -6.856498718261719, "global_step": 158368, "epoch": 3770} {"train_loss": -6.901796817779541, "global_step": 158369, "epoch": 3770} {"train_loss": -6.813769340515137, "global_step": 158370, "epoch": 3770} {"train_loss": -6.887944221496582, "global_step": 158371, "epoch": 3770} {"train_loss": -6.957119941711426, "global_step": 158372, "epoch": 3770} {"train_loss": -6.76740837097168, "global_step": 158373, "epoch": 3770} {"train_loss": -6.935337066650391, "global_step": 158374, "epoch": 3770} {"train_loss": -6.841721534729004, "global_step": 158375, "epoch": 3770} {"train_loss": -6.817752838134766, "global_step": 158376, "epoch": 3770} {"train_loss": -6.83383321762085, "global_step": 158377, "epoch": 3770} {"train_loss": -6.880027770996094, "global_step": 158378, "epoch": 3770} {"train_loss": -6.930051326751709, "global_step": 158379, "epoch": 3770} {"train_loss": -6.8376359939575195, "global_step": 158380, "epoch": 3770} {"train_loss": -6.882936795552571, "global_step": 158381, "epoch": 3770, "val_loss": 68602.1328125} {"train_loss": -6.872377872467041, "global_step": 158382, "epoch": 3771} {"train_loss": -6.881426811218262, "global_step": 158383, "epoch": 3771} {"train_loss": -6.900908470153809, "global_step": 158384, "epoch": 3771} {"train_loss": -6.863269805908203, "global_step": 158385, "epoch": 3771} {"train_loss": -6.882395267486572, "global_step": 158386, "epoch": 3771} {"train_loss": -6.879988193511963, "global_step": 158387, "epoch": 3771} {"train_loss": -6.858994483947754, "global_step": 158388, "epoch": 3771} {"train_loss": -6.937117576599121, "global_step": 158389, "epoch": 3771} {"train_loss": -6.914494514465332, "global_step": 158390, "epoch": 3771} {"train_loss": -6.8852715492248535, "global_step": 158391, "epoch": 3771} {"train_loss": -6.787054538726807, "global_step": 158392, "epoch": 3771} {"train_loss": -6.8260416984558105, "global_step": 158393, "epoch": 3771} {"train_loss": -6.876082420349121, "global_step": 158394, "epoch": 3771} {"train_loss": -6.802050590515137, "global_step": 158395, "epoch": 3771} {"train_loss": -6.854631423950195, "global_step": 158396, "epoch": 3771} {"train_loss": -6.702373027801514, "global_step": 158397, "epoch": 3771} {"train_loss": -6.924037933349609, "global_step": 158398, "epoch": 3771} {"train_loss": -6.769247055053711, "global_step": 158399, "epoch": 3771} {"train_loss": -6.886803150177002, "global_step": 158400, "epoch": 3771} {"train_loss": -6.877317428588867, "global_step": 158401, "epoch": 3771} {"train_loss": -6.885551452636719, "global_step": 158402, "epoch": 3771} {"train_loss": -6.898354530334473, "global_step": 158403, "epoch": 3771} {"train_loss": -6.909353256225586, "global_step": 158404, "epoch": 3771} {"train_loss": -6.744301795959473, "global_step": 158405, "epoch": 3771} {"train_loss": -6.796021461486816, "global_step": 158406, "epoch": 3771} {"train_loss": -6.74759578704834, "global_step": 158407, "epoch": 3771} {"train_loss": -6.759488105773926, "global_step": 158408, "epoch": 3771} {"train_loss": -6.909303188323975, "global_step": 158409, "epoch": 3771} {"train_loss": -6.883037567138672, "global_step": 158410, "epoch": 3771} {"train_loss": -6.816880226135254, "global_step": 158411, "epoch": 3771} {"train_loss": -6.834322929382324, "global_step": 158412, "epoch": 3771} {"train_loss": -6.888027191162109, "global_step": 158413, "epoch": 3771} {"train_loss": -6.994222640991211, "global_step": 158414, "epoch": 3771} {"train_loss": -6.750107765197754, "global_step": 158415, "epoch": 3771} {"train_loss": -6.795413017272949, "global_step": 158416, "epoch": 3771} {"train_loss": -6.950003623962402, "global_step": 158417, "epoch": 3771} {"train_loss": -6.836705684661865, "global_step": 158418, "epoch": 3771} {"train_loss": -6.915816307067871, "global_step": 158419, "epoch": 3771} {"train_loss": -6.816817283630371, "global_step": 158420, "epoch": 3771} {"train_loss": -6.802156925201416, "global_step": 158421, "epoch": 3771} {"train_loss": -6.978416442871094, "global_step": 158422, "epoch": 3771} {"train_loss": -6.858680123374576, "global_step": 158423, "epoch": 3771, "val_loss": 68415.7890625} {"train_loss": -6.901144981384277, "global_step": 158424, "epoch": 3772} {"train_loss": -6.970796585083008, "global_step": 158425, "epoch": 3772} {"train_loss": -6.694908142089844, "global_step": 158426, "epoch": 3772} {"train_loss": -6.775195121765137, "global_step": 158427, "epoch": 3772} {"train_loss": -6.914633750915527, "global_step": 158428, "epoch": 3772} {"train_loss": -6.814489364624023, "global_step": 158429, "epoch": 3772} {"train_loss": -6.751741409301758, "global_step": 158430, "epoch": 3772} {"train_loss": -6.789644241333008, "global_step": 158431, "epoch": 3772} {"train_loss": -6.902841567993164, "global_step": 158432, "epoch": 3772} {"train_loss": -6.829313278198242, "global_step": 158433, "epoch": 3772} {"train_loss": -6.933688163757324, "global_step": 158434, "epoch": 3772} {"train_loss": -6.781471252441406, "global_step": 158435, "epoch": 3772} {"train_loss": -6.863893508911133, "global_step": 158436, "epoch": 3772} {"train_loss": -6.9682722091674805, "global_step": 158437, "epoch": 3772} {"train_loss": -6.748514175415039, "global_step": 158438, "epoch": 3772} {"train_loss": -6.775101661682129, "global_step": 158439, "epoch": 3772} {"train_loss": -6.843050956726074, "global_step": 158440, "epoch": 3772} {"train_loss": -6.824439525604248, "global_step": 158441, "epoch": 3772} {"train_loss": -6.833284378051758, "global_step": 158442, "epoch": 3772} {"train_loss": -6.923852920532227, "global_step": 158443, "epoch": 3772} {"train_loss": -6.8123064041137695, "global_step": 158444, "epoch": 3772} {"train_loss": -7.0148115158081055, "global_step": 158445, "epoch": 3772} {"train_loss": -6.964136123657227, "global_step": 158446, "epoch": 3772} {"train_loss": -6.940542221069336, "global_step": 158447, "epoch": 3772} {"train_loss": -6.882748603820801, "global_step": 158448, "epoch": 3772} {"train_loss": -6.95726203918457, "global_step": 158449, "epoch": 3772} {"train_loss": -6.758604049682617, "global_step": 158450, "epoch": 3772} {"train_loss": -6.927574634552002, "global_step": 158451, "epoch": 3772} {"train_loss": -6.9847259521484375, "global_step": 158452, "epoch": 3772} {"train_loss": -6.995265483856201, "global_step": 158453, "epoch": 3772} {"train_loss": -6.982305526733398, "global_step": 158454, "epoch": 3772} {"train_loss": -6.911135673522949, "global_step": 158455, "epoch": 3772} {"train_loss": -6.85761833190918, "global_step": 158456, "epoch": 3772} {"train_loss": -6.967555999755859, "global_step": 158457, "epoch": 3772} {"train_loss": -6.897525787353516, "global_step": 158458, "epoch": 3772} {"train_loss": -6.717564582824707, "global_step": 158459, "epoch": 3772} {"train_loss": -6.857110977172852, "global_step": 158460, "epoch": 3772} {"train_loss": -6.848063945770264, "global_step": 158461, "epoch": 3772} {"train_loss": -6.890725135803223, "global_step": 158462, "epoch": 3772} {"train_loss": -6.926831245422363, "global_step": 158463, "epoch": 3772} {"train_loss": -6.934207916259766, "global_step": 158464, "epoch": 3772} {"train_loss": -6.8760750861394975, "global_step": 158465, "epoch": 3772, "val_loss": 68631.1171875} {"train_loss": -6.8296685218811035, "global_step": 158466, "epoch": 3773} {"train_loss": -6.9352545738220215, "global_step": 158467, "epoch": 3773} {"train_loss": -6.933143138885498, "global_step": 158468, "epoch": 3773} {"train_loss": -6.852902889251709, "global_step": 158469, "epoch": 3773} {"train_loss": -6.93864631652832, "global_step": 158470, "epoch": 3773} {"train_loss": -6.905383110046387, "global_step": 158471, "epoch": 3773} {"train_loss": -6.9805006980896, "global_step": 158472, "epoch": 3773} {"train_loss": -6.9698944091796875, "global_step": 158473, "epoch": 3773} {"train_loss": -6.9964752197265625, "global_step": 158474, "epoch": 3773} {"train_loss": -6.879754066467285, "global_step": 158475, "epoch": 3773} {"train_loss": -6.920147895812988, "global_step": 158476, "epoch": 3773} {"train_loss": -6.952154159545898, "global_step": 158477, "epoch": 3773} {"train_loss": -6.935198783874512, "global_step": 158478, "epoch": 3773} {"train_loss": -7.035589218139648, "global_step": 158479, "epoch": 3773} {"train_loss": -6.911435127258301, "global_step": 158480, "epoch": 3773} {"train_loss": -7.059910774230957, "global_step": 158481, "epoch": 3773} {"train_loss": -6.960111618041992, "global_step": 158482, "epoch": 3773} {"train_loss": -6.993185997009277, "global_step": 158483, "epoch": 3773} {"train_loss": -7.0037665367126465, "global_step": 158484, "epoch": 3773} {"train_loss": -6.896917819976807, "global_step": 158485, "epoch": 3773} {"train_loss": -7.01704216003418, "global_step": 158486, "epoch": 3773} {"train_loss": -7.015212059020996, "global_step": 158487, "epoch": 3773} {"train_loss": -6.898937225341797, "global_step": 158488, "epoch": 3773} {"train_loss": -6.978147983551025, "global_step": 158489, "epoch": 3773} {"train_loss": -6.929040431976318, "global_step": 158490, "epoch": 3773} {"train_loss": -7.030296325683594, "global_step": 158491, "epoch": 3773} {"train_loss": -6.934947967529297, "global_step": 158492, "epoch": 3773} {"train_loss": -6.895773887634277, "global_step": 158493, "epoch": 3773} {"train_loss": -6.951406955718994, "global_step": 158494, "epoch": 3773} {"train_loss": -6.96645450592041, "global_step": 158495, "epoch": 3773} {"train_loss": -6.913899898529053, "global_step": 158496, "epoch": 3773} {"train_loss": -6.8663330078125, "global_step": 158497, "epoch": 3773} {"train_loss": -6.945949554443359, "global_step": 158498, "epoch": 3773} {"train_loss": -6.934155464172363, "global_step": 158499, "epoch": 3773} {"train_loss": -6.955931663513184, "global_step": 158500, "epoch": 3773} {"train_loss": -6.96300745010376, "global_step": 158501, "epoch": 3773} {"train_loss": -6.950041770935059, "global_step": 158502, "epoch": 3773} {"train_loss": -6.878675937652588, "global_step": 158503, "epoch": 3773} {"train_loss": -6.914653301239014, "global_step": 158504, "epoch": 3773} {"train_loss": -6.914145469665527, "global_step": 158505, "epoch": 3773} {"train_loss": -7.011541366577148, "global_step": 158506, "epoch": 3773} {"train_loss": -6.9459380649385, "global_step": 158507, "epoch": 3773, "val_loss": 68429.359375} {"train_loss": -6.879197597503662, "global_step": 158508, "epoch": 3774} {"train_loss": -6.898589134216309, "global_step": 158509, "epoch": 3774} {"train_loss": -6.997275352478027, "global_step": 158510, "epoch": 3774} {"train_loss": -6.8279709815979, "global_step": 158511, "epoch": 3774} {"train_loss": -7.027578830718994, "global_step": 158512, "epoch": 3774} {"train_loss": -6.879183769226074, "global_step": 158513, "epoch": 3774} {"train_loss": -6.901884078979492, "global_step": 158514, "epoch": 3774} {"train_loss": -6.910130500793457, "global_step": 158515, "epoch": 3774} {"train_loss": -6.912178039550781, "global_step": 158516, "epoch": 3774} {"train_loss": -6.918048858642578, "global_step": 158517, "epoch": 3774} {"train_loss": -6.973656177520752, "global_step": 158518, "epoch": 3774} {"train_loss": -6.954299449920654, "global_step": 158519, "epoch": 3774} {"train_loss": -6.9449920654296875, "global_step": 158520, "epoch": 3774} {"train_loss": -6.928122520446777, "global_step": 158521, "epoch": 3774} {"train_loss": -6.923699378967285, "global_step": 158522, "epoch": 3774} {"train_loss": -6.804463863372803, "global_step": 158523, "epoch": 3774} {"train_loss": -6.915070533752441, "global_step": 158524, "epoch": 3774} {"train_loss": -6.922325134277344, "global_step": 158525, "epoch": 3774} {"train_loss": -6.956758975982666, "global_step": 158526, "epoch": 3774} {"train_loss": -7.044692039489746, "global_step": 158527, "epoch": 3774} {"train_loss": -6.987765312194824, "global_step": 158528, "epoch": 3774} {"train_loss": -6.942373752593994, "global_step": 158529, "epoch": 3774} {"train_loss": -6.923229217529297, "global_step": 158530, "epoch": 3774} {"train_loss": -6.886385917663574, "global_step": 158531, "epoch": 3774} {"train_loss": -6.9371819496154785, "global_step": 158532, "epoch": 3774} {"train_loss": -6.880547523498535, "global_step": 158533, "epoch": 3774} {"train_loss": -6.987353801727295, "global_step": 158534, "epoch": 3774} {"train_loss": -6.8989105224609375, "global_step": 158535, "epoch": 3774} {"train_loss": -6.931652069091797, "global_step": 158536, "epoch": 3774} {"train_loss": -6.907427787780762, "global_step": 158537, "epoch": 3774} {"train_loss": -6.883570194244385, "global_step": 158538, "epoch": 3774} {"train_loss": -6.97652530670166, "global_step": 158539, "epoch": 3774} {"train_loss": -6.978662967681885, "global_step": 158540, "epoch": 3774} {"train_loss": -6.973562240600586, "global_step": 158541, "epoch": 3774} {"train_loss": -6.877927780151367, "global_step": 158542, "epoch": 3774} {"train_loss": -6.964047908782959, "global_step": 158543, "epoch": 3774} {"train_loss": -6.837524890899658, "global_step": 158544, "epoch": 3774} {"train_loss": -6.835172653198242, "global_step": 158545, "epoch": 3774} {"train_loss": -6.9728851318359375, "global_step": 158546, "epoch": 3774} {"train_loss": -7.004477500915527, "global_step": 158547, "epoch": 3774} {"train_loss": -6.881615161895752, "global_step": 158548, "epoch": 3774} {"train_loss": -6.919343664532616, "global_step": 158549, "epoch": 3774, "val_loss": 68727.171875} {"train_loss": -6.837646484375, "global_step": 158550, "epoch": 3775} {"train_loss": -6.854328155517578, "global_step": 158551, "epoch": 3775} {"train_loss": -6.976008415222168, "global_step": 158552, "epoch": 3775} {"train_loss": -6.92137336730957, "global_step": 158553, "epoch": 3775} {"train_loss": -6.989198207855225, "global_step": 158554, "epoch": 3775} {"train_loss": -6.921339988708496, "global_step": 158555, "epoch": 3775} {"train_loss": -7.004404067993164, "global_step": 158556, "epoch": 3775} {"train_loss": -6.818650245666504, "global_step": 158557, "epoch": 3775} {"train_loss": -6.874358177185059, "global_step": 158558, "epoch": 3775} {"train_loss": -6.920800685882568, "global_step": 158559, "epoch": 3775} {"train_loss": -6.79434871673584, "global_step": 158560, "epoch": 3775} {"train_loss": -6.939057350158691, "global_step": 158561, "epoch": 3775} {"train_loss": -6.9282402992248535, "global_step": 158562, "epoch": 3775} {"train_loss": -6.608198642730713, "global_step": 158563, "epoch": 3775} {"train_loss": -6.770195960998535, "global_step": 158564, "epoch": 3775} {"train_loss": -6.856064319610596, "global_step": 158565, "epoch": 3775} {"train_loss": -6.8945512771606445, "global_step": 158566, "epoch": 3775} {"train_loss": -6.887856483459473, "global_step": 158567, "epoch": 3775} {"train_loss": -6.8680644035339355, "global_step": 158568, "epoch": 3775} {"train_loss": -6.826905727386475, "global_step": 158569, "epoch": 3775} {"train_loss": -6.978740215301514, "global_step": 158570, "epoch": 3775} {"train_loss": -6.878875732421875, "global_step": 158571, "epoch": 3775} {"train_loss": -7.041015625, "global_step": 158572, "epoch": 3775} {"train_loss": -6.970746040344238, "global_step": 158573, "epoch": 3775} {"train_loss": -6.880403995513916, "global_step": 158574, "epoch": 3775} {"train_loss": -6.878188133239746, "global_step": 158575, "epoch": 3775} {"train_loss": -6.937765121459961, "global_step": 158576, "epoch": 3775} {"train_loss": -6.809588432312012, "global_step": 158577, "epoch": 3775} {"train_loss": -6.870031833648682, "global_step": 158578, "epoch": 3775} {"train_loss": -6.797739028930664, "global_step": 158579, "epoch": 3775} {"train_loss": -6.827889442443848, "global_step": 158580, "epoch": 3775} {"train_loss": -6.923849105834961, "global_step": 158581, "epoch": 3775} {"train_loss": -6.8538689613342285, "global_step": 158582, "epoch": 3775} {"train_loss": -6.904767990112305, "global_step": 158583, "epoch": 3775} {"train_loss": -6.8387041091918945, "global_step": 158584, "epoch": 3775} {"train_loss": -6.823044776916504, "global_step": 158585, "epoch": 3775} {"train_loss": -6.876153945922852, "global_step": 158586, "epoch": 3775} {"train_loss": -6.787581443786621, "global_step": 158587, "epoch": 3775} {"train_loss": -6.842129707336426, "global_step": 158588, "epoch": 3775} {"train_loss": -6.887740612030029, "global_step": 158589, "epoch": 3775} {"train_loss": -6.812856197357178, "global_step": 158590, "epoch": 3775} {"train_loss": -6.877790065038772, "global_step": 158591, "epoch": 3775, "val_loss": 68263.3046875} {"train_loss": -6.891160011291504, "global_step": 158592, "epoch": 3776} {"train_loss": -6.887768745422363, "global_step": 158593, "epoch": 3776} {"train_loss": -6.86844539642334, "global_step": 158594, "epoch": 3776} {"train_loss": -6.929254531860352, "global_step": 158595, "epoch": 3776} {"train_loss": -6.975491046905518, "global_step": 158596, "epoch": 3776} {"train_loss": -6.802473068237305, "global_step": 158597, "epoch": 3776} {"train_loss": -6.888741493225098, "global_step": 158598, "epoch": 3776} {"train_loss": -6.87716007232666, "global_step": 158599, "epoch": 3776} {"train_loss": -6.839840412139893, "global_step": 158600, "epoch": 3776} {"train_loss": -7.0249457359313965, "global_step": 158601, "epoch": 3776} {"train_loss": -6.849771499633789, "global_step": 158602, "epoch": 3776} {"train_loss": -7.001858234405518, "global_step": 158603, "epoch": 3776} {"train_loss": -6.846879482269287, "global_step": 158604, "epoch": 3776} {"train_loss": -6.7786455154418945, "global_step": 158605, "epoch": 3776} {"train_loss": -6.926663875579834, "global_step": 158606, "epoch": 3776} {"train_loss": -6.873890399932861, "global_step": 158607, "epoch": 3776} {"train_loss": -6.729113578796387, "global_step": 158608, "epoch": 3776} {"train_loss": -6.935447692871094, "global_step": 158609, "epoch": 3776} {"train_loss": -6.838963031768799, "global_step": 158610, "epoch": 3776} {"train_loss": -6.799282550811768, "global_step": 158611, "epoch": 3776} {"train_loss": -6.847223281860352, "global_step": 158612, "epoch": 3776} {"train_loss": -6.806619167327881, "global_step": 158613, "epoch": 3776} {"train_loss": -6.921962738037109, "global_step": 158614, "epoch": 3776} {"train_loss": -6.860825061798096, "global_step": 158615, "epoch": 3776} {"train_loss": -6.860337734222412, "global_step": 158616, "epoch": 3776} {"train_loss": -6.921292781829834, "global_step": 158617, "epoch": 3776} {"train_loss": -7.011239528656006, "global_step": 158618, "epoch": 3776} {"train_loss": -6.931734085083008, "global_step": 158619, "epoch": 3776} {"train_loss": -6.981893539428711, "global_step": 158620, "epoch": 3776} {"train_loss": -6.921501159667969, "global_step": 158621, "epoch": 3776} {"train_loss": -6.874139785766602, "global_step": 158622, "epoch": 3776} {"train_loss": -6.844400882720947, "global_step": 158623, "epoch": 3776} {"train_loss": -6.884951591491699, "global_step": 158624, "epoch": 3776} {"train_loss": -6.994108200073242, "global_step": 158625, "epoch": 3776} {"train_loss": -6.883227348327637, "global_step": 158626, "epoch": 3776} {"train_loss": -6.87360954284668, "global_step": 158627, "epoch": 3776} {"train_loss": -6.801026821136475, "global_step": 158628, "epoch": 3776} {"train_loss": -6.9193806648254395, "global_step": 158629, "epoch": 3776} {"train_loss": -6.848121643066406, "global_step": 158630, "epoch": 3776} {"train_loss": -6.869507789611816, "global_step": 158631, "epoch": 3776} {"train_loss": -6.931448459625244, "global_step": 158632, "epoch": 3776} {"train_loss": -6.885815665835426, "global_step": 158633, "epoch": 3776, "val_loss": 68468.6953125} {"train_loss": -7.108432769775391, "global_step": 158634, "epoch": 3777} {"train_loss": -6.903141021728516, "global_step": 158635, "epoch": 3777} {"train_loss": -6.99733829498291, "global_step": 158636, "epoch": 3777} {"train_loss": -6.936466217041016, "global_step": 158637, "epoch": 3777} {"train_loss": -6.994179725646973, "global_step": 158638, "epoch": 3777} {"train_loss": -6.938992500305176, "global_step": 158639, "epoch": 3777} {"train_loss": -6.9288177490234375, "global_step": 158640, "epoch": 3777} {"train_loss": -6.876777648925781, "global_step": 158641, "epoch": 3777} {"train_loss": -6.7356390953063965, "global_step": 158642, "epoch": 3777} {"train_loss": -6.880829334259033, "global_step": 158643, "epoch": 3777} {"train_loss": -6.813955783843994, "global_step": 158644, "epoch": 3777} {"train_loss": -6.810379505157471, "global_step": 158645, "epoch": 3777} {"train_loss": -6.792309284210205, "global_step": 158646, "epoch": 3777} {"train_loss": -6.756028175354004, "global_step": 158647, "epoch": 3777} {"train_loss": -6.879998207092285, "global_step": 158648, "epoch": 3777} {"train_loss": -6.723719596862793, "global_step": 158649, "epoch": 3777} {"train_loss": -6.878546714782715, "global_step": 158650, "epoch": 3777} {"train_loss": -6.730439186096191, "global_step": 158651, "epoch": 3777} {"train_loss": -6.8215837478637695, "global_step": 158652, "epoch": 3777} {"train_loss": -6.912896633148193, "global_step": 158653, "epoch": 3777} {"train_loss": -6.881897926330566, "global_step": 158654, "epoch": 3777} {"train_loss": -6.875249862670898, "global_step": 158655, "epoch": 3777} {"train_loss": -6.817874431610107, "global_step": 158656, "epoch": 3777} {"train_loss": -6.83980131149292, "global_step": 158657, "epoch": 3777} {"train_loss": -6.811017990112305, "global_step": 158658, "epoch": 3777} {"train_loss": -6.922944068908691, "global_step": 158659, "epoch": 3777} {"train_loss": -6.818317413330078, "global_step": 158660, "epoch": 3777} {"train_loss": -6.830993175506592, "global_step": 158661, "epoch": 3777} {"train_loss": -6.898458957672119, "global_step": 158662, "epoch": 3777} {"train_loss": -6.890754699707031, "global_step": 158663, "epoch": 3777} {"train_loss": -6.817629337310791, "global_step": 158664, "epoch": 3777} {"train_loss": -6.955587863922119, "global_step": 158665, "epoch": 3777} {"train_loss": -6.821964263916016, "global_step": 158666, "epoch": 3777} {"train_loss": -6.873851776123047, "global_step": 158667, "epoch": 3777} {"train_loss": -6.899752616882324, "global_step": 158668, "epoch": 3777} {"train_loss": -6.846831321716309, "global_step": 158669, "epoch": 3777} {"train_loss": -6.908596038818359, "global_step": 158670, "epoch": 3777} {"train_loss": -6.919146537780762, "global_step": 158671, "epoch": 3777} {"train_loss": -6.778055667877197, "global_step": 158672, "epoch": 3777} {"train_loss": -6.753856182098389, "global_step": 158673, "epoch": 3777} {"train_loss": -6.956904411315918, "global_step": 158674, "epoch": 3777} {"train_loss": -6.865692184084938, "global_step": 158675, "epoch": 3777, "val_loss": 68694.921875} {"train_loss": -6.868502140045166, "global_step": 158676, "epoch": 3778} {"train_loss": -6.80494499206543, "global_step": 158677, "epoch": 3778} {"train_loss": -6.829127788543701, "global_step": 158678, "epoch": 3778} {"train_loss": -6.94401741027832, "global_step": 158679, "epoch": 3778} {"train_loss": -6.923482894897461, "global_step": 158680, "epoch": 3778} {"train_loss": -6.8675432205200195, "global_step": 158681, "epoch": 3778} {"train_loss": -6.883583068847656, "global_step": 158682, "epoch": 3778} {"train_loss": -6.7970428466796875, "global_step": 158683, "epoch": 3778} {"train_loss": -6.809050559997559, "global_step": 158684, "epoch": 3778} {"train_loss": -6.904463291168213, "global_step": 158685, "epoch": 3778} {"train_loss": -6.754184722900391, "global_step": 158686, "epoch": 3778} {"train_loss": -6.689761638641357, "global_step": 158687, "epoch": 3778} {"train_loss": -6.8303680419921875, "global_step": 158688, "epoch": 3778} {"train_loss": -6.682222843170166, "global_step": 158689, "epoch": 3778} {"train_loss": -6.816739559173584, "global_step": 158690, "epoch": 3778} {"train_loss": -6.788911819458008, "global_step": 158691, "epoch": 3778} {"train_loss": -6.751443862915039, "global_step": 158692, "epoch": 3778} {"train_loss": -6.93297004699707, "global_step": 158693, "epoch": 3778} {"train_loss": -6.739985466003418, "global_step": 158694, "epoch": 3778} {"train_loss": -6.780701637268066, "global_step": 158695, "epoch": 3778} {"train_loss": -6.680815696716309, "global_step": 158696, "epoch": 3778} {"train_loss": -6.762101650238037, "global_step": 158697, "epoch": 3778} {"train_loss": -6.760902404785156, "global_step": 158698, "epoch": 3778} {"train_loss": -6.671412467956543, "global_step": 158699, "epoch": 3778} {"train_loss": -6.69007682800293, "global_step": 158700, "epoch": 3778} {"train_loss": -6.728908538818359, "global_step": 158701, "epoch": 3778} {"train_loss": -6.8805437088012695, "global_step": 158702, "epoch": 3778} {"train_loss": -6.762303352355957, "global_step": 158703, "epoch": 3778} {"train_loss": -6.72203254699707, "global_step": 158704, "epoch": 3778} {"train_loss": -6.681666851043701, "global_step": 158705, "epoch": 3778} {"train_loss": -6.8523993492126465, "global_step": 158706, "epoch": 3778} {"train_loss": -6.756286144256592, "global_step": 158707, "epoch": 3778} {"train_loss": -6.870425701141357, "global_step": 158708, "epoch": 3778} {"train_loss": -6.891928672790527, "global_step": 158709, "epoch": 3778} {"train_loss": -6.859489440917969, "global_step": 158710, "epoch": 3778} {"train_loss": -6.768176078796387, "global_step": 158711, "epoch": 3778} {"train_loss": -6.853849411010742, "global_step": 158712, "epoch": 3778} {"train_loss": -6.833564758300781, "global_step": 158713, "epoch": 3778} {"train_loss": -6.787154674530029, "global_step": 158714, "epoch": 3778} {"train_loss": -6.881487846374512, "global_step": 158715, "epoch": 3778} {"train_loss": -6.866365432739258, "global_step": 158716, "epoch": 3778} {"train_loss": -6.807352792649042, "global_step": 158717, "epoch": 3778, "val_loss": 68389.4453125} {"train_loss": -7.057408332824707, "global_step": 158718, "epoch": 3779} {"train_loss": -7.00462532043457, "global_step": 158719, "epoch": 3779} {"train_loss": -6.958758354187012, "global_step": 158720, "epoch": 3779} {"train_loss": -6.921687126159668, "global_step": 158721, "epoch": 3779} {"train_loss": -6.873203277587891, "global_step": 158722, "epoch": 3779} {"train_loss": -6.92050313949585, "global_step": 158723, "epoch": 3779} {"train_loss": -7.0435261726379395, "global_step": 158724, "epoch": 3779} {"train_loss": -6.915682792663574, "global_step": 158725, "epoch": 3779} {"train_loss": -6.972489356994629, "global_step": 158726, "epoch": 3779} {"train_loss": -6.967721462249756, "global_step": 158727, "epoch": 3779} {"train_loss": -6.909184455871582, "global_step": 158728, "epoch": 3779} {"train_loss": -7.008518695831299, "global_step": 158729, "epoch": 3779} {"train_loss": -6.985767364501953, "global_step": 158730, "epoch": 3779} {"train_loss": -7.003013610839844, "global_step": 158731, "epoch": 3779} {"train_loss": -6.909617900848389, "global_step": 158732, "epoch": 3779} {"train_loss": -6.826006889343262, "global_step": 158733, "epoch": 3779} {"train_loss": -6.836761474609375, "global_step": 158734, "epoch": 3779} {"train_loss": -7.023849010467529, "global_step": 158735, "epoch": 3779} {"train_loss": -6.926482200622559, "global_step": 158736, "epoch": 3779} {"train_loss": -6.834474086761475, "global_step": 158737, "epoch": 3779} {"train_loss": -6.904960632324219, "global_step": 158738, "epoch": 3779} {"train_loss": -6.8941450119018555, "global_step": 158739, "epoch": 3779} {"train_loss": -6.939062118530273, "global_step": 158740, "epoch": 3779} {"train_loss": -6.8650970458984375, "global_step": 158741, "epoch": 3779} {"train_loss": -6.863071441650391, "global_step": 158742, "epoch": 3779} {"train_loss": -6.894071578979492, "global_step": 158743, "epoch": 3779} {"train_loss": -6.839052677154541, "global_step": 158744, "epoch": 3779} {"train_loss": -6.81639289855957, "global_step": 158745, "epoch": 3779} {"train_loss": -6.906798362731934, "global_step": 158746, "epoch": 3779} {"train_loss": -6.826713562011719, "global_step": 158747, "epoch": 3779} {"train_loss": -6.8896636962890625, "global_step": 158748, "epoch": 3779} {"train_loss": -6.896035194396973, "global_step": 158749, "epoch": 3779} {"train_loss": -7.015467643737793, "global_step": 158750, "epoch": 3779} {"train_loss": -6.868405342102051, "global_step": 158751, "epoch": 3779} {"train_loss": -6.8662214279174805, "global_step": 158752, "epoch": 3779} {"train_loss": -6.800482749938965, "global_step": 158753, "epoch": 3779} {"train_loss": -6.817919731140137, "global_step": 158754, "epoch": 3779} {"train_loss": -6.693351745605469, "global_step": 158755, "epoch": 3779} {"train_loss": -6.886900424957275, "global_step": 158756, "epoch": 3779} {"train_loss": -6.787976264953613, "global_step": 158757, "epoch": 3779} {"train_loss": -6.93064022064209, "global_step": 158758, "epoch": 3779} {"train_loss": -6.904525427591233, "global_step": 158759, "epoch": 3779, "val_loss": 68495.6171875} {"train_loss": -6.944103240966797, "global_step": 158760, "epoch": 3780} {"train_loss": -6.856339931488037, "global_step": 158761, "epoch": 3780} {"train_loss": -6.932889461517334, "global_step": 158762, "epoch": 3780} {"train_loss": -6.8473920822143555, "global_step": 158763, "epoch": 3780} {"train_loss": -6.910992622375488, "global_step": 158764, "epoch": 3780} {"train_loss": -6.984523773193359, "global_step": 158765, "epoch": 3780} {"train_loss": -6.917662620544434, "global_step": 158766, "epoch": 3780} {"train_loss": -6.922701835632324, "global_step": 158767, "epoch": 3780} {"train_loss": -6.899404525756836, "global_step": 158768, "epoch": 3780} {"train_loss": -6.931836128234863, "global_step": 158769, "epoch": 3780} {"train_loss": -6.837983131408691, "global_step": 158770, "epoch": 3780} {"train_loss": -6.860538482666016, "global_step": 158771, "epoch": 3780} {"train_loss": -6.828236103057861, "global_step": 158772, "epoch": 3780} {"train_loss": -6.8213090896606445, "global_step": 158773, "epoch": 3780} {"train_loss": -6.872856140136719, "global_step": 158774, "epoch": 3780} {"train_loss": -6.929149627685547, "global_step": 158775, "epoch": 3780} {"train_loss": -6.891042709350586, "global_step": 158776, "epoch": 3780} {"train_loss": -6.959155082702637, "global_step": 158777, "epoch": 3780} {"train_loss": -6.90854549407959, "global_step": 158778, "epoch": 3780} {"train_loss": -6.985932350158691, "global_step": 158779, "epoch": 3780} {"train_loss": -6.875087261199951, "global_step": 158780, "epoch": 3780} {"train_loss": -7.0002336502075195, "global_step": 158781, "epoch": 3780} {"train_loss": -7.011410713195801, "global_step": 158782, "epoch": 3780} {"train_loss": -6.8648881912231445, "global_step": 158783, "epoch": 3780} {"train_loss": -6.9451093673706055, "global_step": 158784, "epoch": 3780} {"train_loss": -6.96054744720459, "global_step": 158785, "epoch": 3780} {"train_loss": -6.9008283615112305, "global_step": 158786, "epoch": 3780} {"train_loss": -6.8523335456848145, "global_step": 158787, "epoch": 3780} {"train_loss": -6.806328773498535, "global_step": 158788, "epoch": 3780} {"train_loss": -6.944532871246338, "global_step": 158789, "epoch": 3780} {"train_loss": -6.886436462402344, "global_step": 158790, "epoch": 3780} {"train_loss": -6.884217262268066, "global_step": 158791, "epoch": 3780} {"train_loss": -6.97316837310791, "global_step": 158792, "epoch": 3780} {"train_loss": -6.985196113586426, "global_step": 158793, "epoch": 3780} {"train_loss": -6.873378753662109, "global_step": 158794, "epoch": 3780} {"train_loss": -6.973711013793945, "global_step": 158795, "epoch": 3780} {"train_loss": -6.860837936401367, "global_step": 158796, "epoch": 3780} {"train_loss": -6.847270965576172, "global_step": 158797, "epoch": 3780} {"train_loss": -6.854593753814697, "global_step": 158798, "epoch": 3780} {"train_loss": -6.963726043701172, "global_step": 158799, "epoch": 3780} {"train_loss": -6.902360439300537, "global_step": 158800, "epoch": 3780} {"train_loss": -6.9075681027911955, "global_step": 158801, "epoch": 3780, "val_loss": 68504.1796875} {"train_loss": -6.931723594665527, "global_step": 158802, "epoch": 3781} {"train_loss": -6.922694206237793, "global_step": 158803, "epoch": 3781} {"train_loss": -6.915676116943359, "global_step": 158804, "epoch": 3781} {"train_loss": -6.879883766174316, "global_step": 158805, "epoch": 3781} {"train_loss": -6.87309455871582, "global_step": 158806, "epoch": 3781} {"train_loss": -7.057065963745117, "global_step": 158807, "epoch": 3781} {"train_loss": -6.847200393676758, "global_step": 158808, "epoch": 3781} {"train_loss": -6.759050369262695, "global_step": 158809, "epoch": 3781} {"train_loss": -6.872504234313965, "global_step": 158810, "epoch": 3781} {"train_loss": -6.758279800415039, "global_step": 158811, "epoch": 3781} {"train_loss": -6.780266761779785, "global_step": 158812, "epoch": 3781} {"train_loss": -6.835668563842773, "global_step": 158813, "epoch": 3781} {"train_loss": -6.776237487792969, "global_step": 158814, "epoch": 3781} {"train_loss": -6.859674453735352, "global_step": 158815, "epoch": 3781} {"train_loss": -6.850427627563477, "global_step": 158816, "epoch": 3781} {"train_loss": -6.697779655456543, "global_step": 158817, "epoch": 3781} {"train_loss": -6.7195611000061035, "global_step": 158818, "epoch": 3781} {"train_loss": -6.7634758949279785, "global_step": 158819, "epoch": 3781} {"train_loss": -6.736382007598877, "global_step": 158820, "epoch": 3781} {"train_loss": -6.78244686126709, "global_step": 158821, "epoch": 3781} {"train_loss": -6.740557670593262, "global_step": 158822, "epoch": 3781} {"train_loss": -6.776950359344482, "global_step": 158823, "epoch": 3781} {"train_loss": -6.805852890014648, "global_step": 158824, "epoch": 3781} {"train_loss": -6.833986282348633, "global_step": 158825, "epoch": 3781} {"train_loss": -6.783468246459961, "global_step": 158826, "epoch": 3781} {"train_loss": -6.899181365966797, "global_step": 158827, "epoch": 3781} {"train_loss": -6.928046226501465, "global_step": 158828, "epoch": 3781} {"train_loss": -6.816164970397949, "global_step": 158829, "epoch": 3781} {"train_loss": -6.74302339553833, "global_step": 158830, "epoch": 3781} {"train_loss": -6.8798627853393555, "global_step": 158831, "epoch": 3781} {"train_loss": -6.926030158996582, "global_step": 158832, "epoch": 3781} {"train_loss": -6.773605823516846, "global_step": 158833, "epoch": 3781} {"train_loss": -6.869388580322266, "global_step": 158834, "epoch": 3781} {"train_loss": -6.957670211791992, "global_step": 158835, "epoch": 3781} {"train_loss": -6.863916873931885, "global_step": 158836, "epoch": 3781} {"train_loss": -6.977597236633301, "global_step": 158837, "epoch": 3781} {"train_loss": -6.814574718475342, "global_step": 158838, "epoch": 3781} {"train_loss": -6.762697219848633, "global_step": 158839, "epoch": 3781} {"train_loss": -6.889106273651123, "global_step": 158840, "epoch": 3781} {"train_loss": -6.939303398132324, "global_step": 158841, "epoch": 3781} {"train_loss": -6.830474853515625, "global_step": 158842, "epoch": 3781} {"train_loss": -6.8425037406739735, "global_step": 158843, "epoch": 3781, "val_loss": 68542.6328125} {"train_loss": -7.03895378112793, "global_step": 158844, "epoch": 3782} {"train_loss": -6.931984901428223, "global_step": 158845, "epoch": 3782} {"train_loss": -6.839505195617676, "global_step": 158846, "epoch": 3782} {"train_loss": -6.852896690368652, "global_step": 158847, "epoch": 3782} {"train_loss": -6.857309341430664, "global_step": 158848, "epoch": 3782} {"train_loss": -6.966270446777344, "global_step": 158849, "epoch": 3782} {"train_loss": -7.018259048461914, "global_step": 158850, "epoch": 3782} {"train_loss": -6.93498420715332, "global_step": 158851, "epoch": 3782} {"train_loss": -7.036909103393555, "global_step": 158852, "epoch": 3782} {"train_loss": -7.043956756591797, "global_step": 158853, "epoch": 3782} {"train_loss": -6.85623836517334, "global_step": 158854, "epoch": 3782} {"train_loss": -6.845832824707031, "global_step": 158855, "epoch": 3782} {"train_loss": -6.915866851806641, "global_step": 158856, "epoch": 3782} {"train_loss": -6.969559669494629, "global_step": 158857, "epoch": 3782} {"train_loss": -6.860267162322998, "global_step": 158858, "epoch": 3782} {"train_loss": -6.90783166885376, "global_step": 158859, "epoch": 3782} {"train_loss": -6.785575866699219, "global_step": 158860, "epoch": 3782} {"train_loss": -6.963476657867432, "global_step": 158861, "epoch": 3782} {"train_loss": -6.9797868728637695, "global_step": 158862, "epoch": 3782} {"train_loss": -6.858577251434326, "global_step": 158863, "epoch": 3782} {"train_loss": -6.85658073425293, "global_step": 158864, "epoch": 3782} {"train_loss": -6.868955612182617, "global_step": 158865, "epoch": 3782} {"train_loss": -6.86378288269043, "global_step": 158866, "epoch": 3782} {"train_loss": -6.77336311340332, "global_step": 158867, "epoch": 3782} {"train_loss": -6.871799945831299, "global_step": 158868, "epoch": 3782} {"train_loss": -6.8507080078125, "global_step": 158869, "epoch": 3782} {"train_loss": -6.843994140625, "global_step": 158870, "epoch": 3782} {"train_loss": -6.852407932281494, "global_step": 158871, "epoch": 3782} {"train_loss": -6.8072190284729, "global_step": 158872, "epoch": 3782} {"train_loss": -6.825864315032959, "global_step": 158873, "epoch": 3782} {"train_loss": -6.899369239807129, "global_step": 158874, "epoch": 3782} {"train_loss": -6.90977144241333, "global_step": 158875, "epoch": 3782} {"train_loss": -6.880653381347656, "global_step": 158876, "epoch": 3782} {"train_loss": -6.8746795654296875, "global_step": 158877, "epoch": 3782} {"train_loss": -6.8281707763671875, "global_step": 158878, "epoch": 3782} {"train_loss": -6.936598777770996, "global_step": 158879, "epoch": 3782} {"train_loss": -6.828061103820801, "global_step": 158880, "epoch": 3782} {"train_loss": -6.935952186584473, "global_step": 158881, "epoch": 3782} {"train_loss": -6.894235610961914, "global_step": 158882, "epoch": 3782} {"train_loss": -6.8497700691223145, "global_step": 158883, "epoch": 3782} {"train_loss": -6.7902679443359375, "global_step": 158884, "epoch": 3782} {"train_loss": -6.889366229375203, "global_step": 158885, "epoch": 3782, "val_loss": 68648.7109375} {"train_loss": -6.979292869567871, "global_step": 158886, "epoch": 3783} {"train_loss": -6.9615678787231445, "global_step": 158887, "epoch": 3783} {"train_loss": -6.8547210693359375, "global_step": 158888, "epoch": 3783} {"train_loss": -6.935576438903809, "global_step": 158889, "epoch": 3783} {"train_loss": -6.88610315322876, "global_step": 158890, "epoch": 3783} {"train_loss": -6.7753095626831055, "global_step": 158891, "epoch": 3783} {"train_loss": -6.883770942687988, "global_step": 158892, "epoch": 3783} {"train_loss": -6.82459020614624, "global_step": 158893, "epoch": 3783} {"train_loss": -6.936488151550293, "global_step": 158894, "epoch": 3783} {"train_loss": -6.805613994598389, "global_step": 158895, "epoch": 3783} {"train_loss": -6.853873252868652, "global_step": 158896, "epoch": 3783} {"train_loss": -6.8366804122924805, "global_step": 158897, "epoch": 3783} {"train_loss": -6.849886417388916, "global_step": 158898, "epoch": 3783} {"train_loss": -6.9423627853393555, "global_step": 158899, "epoch": 3783} {"train_loss": -6.764520645141602, "global_step": 158900, "epoch": 3783} {"train_loss": -6.877259254455566, "global_step": 158901, "epoch": 3783} {"train_loss": -6.985109329223633, "global_step": 158902, "epoch": 3783} {"train_loss": -6.816540241241455, "global_step": 158903, "epoch": 3783} {"train_loss": -6.973245143890381, "global_step": 158904, "epoch": 3783} {"train_loss": -6.816065788269043, "global_step": 158905, "epoch": 3783} {"train_loss": -6.786399841308594, "global_step": 158906, "epoch": 3783} {"train_loss": -6.895410537719727, "global_step": 158907, "epoch": 3783} {"train_loss": -6.865286350250244, "global_step": 158908, "epoch": 3783} {"train_loss": -6.918347358703613, "global_step": 158909, "epoch": 3783} {"train_loss": -6.791917324066162, "global_step": 158910, "epoch": 3783} {"train_loss": -6.819923400878906, "global_step": 158911, "epoch": 3783} {"train_loss": -6.862986087799072, "global_step": 158912, "epoch": 3783} {"train_loss": -6.853081703186035, "global_step": 158913, "epoch": 3783} {"train_loss": -6.927873611450195, "global_step": 158914, "epoch": 3783} {"train_loss": -6.945075035095215, "global_step": 158915, "epoch": 3783} {"train_loss": -6.945288181304932, "global_step": 158916, "epoch": 3783} {"train_loss": -6.946638107299805, "global_step": 158917, "epoch": 3783} {"train_loss": -6.873893737792969, "global_step": 158918, "epoch": 3783} {"train_loss": -6.8817362785339355, "global_step": 158919, "epoch": 3783} {"train_loss": -6.917169570922852, "global_step": 158920, "epoch": 3783} {"train_loss": -6.830705642700195, "global_step": 158921, "epoch": 3783} {"train_loss": -6.889120101928711, "global_step": 158922, "epoch": 3783} {"train_loss": -6.754622459411621, "global_step": 158923, "epoch": 3783} {"train_loss": -6.734024524688721, "global_step": 158924, "epoch": 3783} {"train_loss": -6.904993534088135, "global_step": 158925, "epoch": 3783} {"train_loss": -6.903121471405029, "global_step": 158926, "epoch": 3783} {"train_loss": -6.871437084107172, "global_step": 158927, "epoch": 3783, "val_loss": 68613.7578125} {"train_loss": -6.865833282470703, "global_step": 158928, "epoch": 3784} {"train_loss": -6.842161655426025, "global_step": 158929, "epoch": 3784} {"train_loss": -6.838827133178711, "global_step": 158930, "epoch": 3784} {"train_loss": -6.829931735992432, "global_step": 158931, "epoch": 3784} {"train_loss": -6.892145156860352, "global_step": 158932, "epoch": 3784} {"train_loss": -6.910843849182129, "global_step": 158933, "epoch": 3784} {"train_loss": -6.8293914794921875, "global_step": 158934, "epoch": 3784} {"train_loss": -6.866986274719238, "global_step": 158935, "epoch": 3784} {"train_loss": -6.888426780700684, "global_step": 158936, "epoch": 3784} {"train_loss": -6.946791648864746, "global_step": 158937, "epoch": 3784} {"train_loss": -6.853360176086426, "global_step": 158938, "epoch": 3784} {"train_loss": -6.969870567321777, "global_step": 158939, "epoch": 3784} {"train_loss": -6.89009428024292, "global_step": 158940, "epoch": 3784} {"train_loss": -6.85813045501709, "global_step": 158941, "epoch": 3784} {"train_loss": -6.921205043792725, "global_step": 158942, "epoch": 3784} {"train_loss": -6.925586700439453, "global_step": 158943, "epoch": 3784} {"train_loss": -6.885992050170898, "global_step": 158944, "epoch": 3784} {"train_loss": -6.854605674743652, "global_step": 158945, "epoch": 3784} {"train_loss": -6.812561988830566, "global_step": 158946, "epoch": 3784} {"train_loss": -6.818051338195801, "global_step": 158947, "epoch": 3784} {"train_loss": -6.721940517425537, "global_step": 158948, "epoch": 3784} {"train_loss": -6.8304033279418945, "global_step": 158949, "epoch": 3784} {"train_loss": -6.5944037437438965, "global_step": 158950, "epoch": 3784} {"train_loss": -6.806648254394531, "global_step": 158951, "epoch": 3784} {"train_loss": -6.946605682373047, "global_step": 158952, "epoch": 3784} {"train_loss": -6.805102348327637, "global_step": 158953, "epoch": 3784} {"train_loss": -6.979396820068359, "global_step": 158954, "epoch": 3784} {"train_loss": -6.76759147644043, "global_step": 158955, "epoch": 3784} {"train_loss": -6.871603965759277, "global_step": 158956, "epoch": 3784} {"train_loss": -6.77977180480957, "global_step": 158957, "epoch": 3784} {"train_loss": -6.815387725830078, "global_step": 158958, "epoch": 3784} {"train_loss": -6.8000078201293945, "global_step": 158959, "epoch": 3784} {"train_loss": -6.866198539733887, "global_step": 158960, "epoch": 3784} {"train_loss": -6.837237358093262, "global_step": 158961, "epoch": 3784} {"train_loss": -6.861133098602295, "global_step": 158962, "epoch": 3784} {"train_loss": -6.899169445037842, "global_step": 158963, "epoch": 3784} {"train_loss": -6.913495063781738, "global_step": 158964, "epoch": 3784} {"train_loss": -6.945094585418701, "global_step": 158965, "epoch": 3784} {"train_loss": -6.895949363708496, "global_step": 158966, "epoch": 3784} {"train_loss": -6.835522174835205, "global_step": 158967, "epoch": 3784} {"train_loss": -6.8642401695251465, "global_step": 158968, "epoch": 3784} {"train_loss": -6.858695870354062, "global_step": 158969, "epoch": 3784, "val_loss": 68641.125} {"train_loss": -6.880853652954102, "global_step": 158970, "epoch": 3785} {"train_loss": -6.9113969802856445, "global_step": 158971, "epoch": 3785} {"train_loss": -6.847855567932129, "global_step": 158972, "epoch": 3785} {"train_loss": -6.990151405334473, "global_step": 158973, "epoch": 3785} {"train_loss": -6.871212005615234, "global_step": 158974, "epoch": 3785} {"train_loss": -6.984105110168457, "global_step": 158975, "epoch": 3785} {"train_loss": -6.863183975219727, "global_step": 158976, "epoch": 3785} {"train_loss": -6.978399276733398, "global_step": 158977, "epoch": 3785} {"train_loss": -6.912666320800781, "global_step": 158978, "epoch": 3785} {"train_loss": -6.965588569641113, "global_step": 158979, "epoch": 3785} {"train_loss": -6.840429306030273, "global_step": 158980, "epoch": 3785} {"train_loss": -6.8969244956970215, "global_step": 158981, "epoch": 3785} {"train_loss": -6.881133079528809, "global_step": 158982, "epoch": 3785} {"train_loss": -6.828104496002197, "global_step": 158983, "epoch": 3785} {"train_loss": -6.893429756164551, "global_step": 158984, "epoch": 3785} {"train_loss": -6.97101354598999, "global_step": 158985, "epoch": 3785} {"train_loss": -6.8515424728393555, "global_step": 158986, "epoch": 3785} {"train_loss": -6.953407287597656, "global_step": 158987, "epoch": 3785} {"train_loss": -6.9135966300964355, "global_step": 158988, "epoch": 3785} {"train_loss": -6.763284683227539, "global_step": 158989, "epoch": 3785} {"train_loss": -7.037242412567139, "global_step": 158990, "epoch": 3785} {"train_loss": -6.953587532043457, "global_step": 158991, "epoch": 3785} {"train_loss": -6.792937278747559, "global_step": 158992, "epoch": 3785} {"train_loss": -6.965435981750488, "global_step": 158993, "epoch": 3785} {"train_loss": -6.8241143226623535, "global_step": 158994, "epoch": 3785} {"train_loss": -6.88724946975708, "global_step": 158995, "epoch": 3785} {"train_loss": -7.025485992431641, "global_step": 158996, "epoch": 3785} {"train_loss": -6.93173885345459, "global_step": 158997, "epoch": 3785} {"train_loss": -6.877689361572266, "global_step": 158998, "epoch": 3785} {"train_loss": -6.939391136169434, "global_step": 158999, "epoch": 3785} {"train_loss": -6.9297776222229, "global_step": 159000, "epoch": 3785} {"train_loss": -6.883652687072754, "global_step": 159001, "epoch": 3785} {"train_loss": -7.0234293937683105, "global_step": 159002, "epoch": 3785} {"train_loss": -6.792106628417969, "global_step": 159003, "epoch": 3785} {"train_loss": -6.956954479217529, "global_step": 159004, "epoch": 3785} {"train_loss": -6.8993964195251465, "global_step": 159005, "epoch": 3785} {"train_loss": -6.790099143981934, "global_step": 159006, "epoch": 3785} {"train_loss": -6.923442363739014, "global_step": 159007, "epoch": 3785} {"train_loss": -6.912880897521973, "global_step": 159008, "epoch": 3785} {"train_loss": -6.926105499267578, "global_step": 159009, "epoch": 3785} {"train_loss": -6.832470417022705, "global_step": 159010, "epoch": 3785} {"train_loss": -6.9015064012436635, "global_step": 159011, "epoch": 3785, "val_loss": 68469.6875} {"train_loss": -6.885509490966797, "global_step": 159012, "epoch": 3786} {"train_loss": -6.854277610778809, "global_step": 159013, "epoch": 3786} {"train_loss": -6.6999053955078125, "global_step": 159014, "epoch": 3786} {"train_loss": -6.795751571655273, "global_step": 159015, "epoch": 3786} {"train_loss": -6.805074691772461, "global_step": 159016, "epoch": 3786} {"train_loss": -6.73061466217041, "global_step": 159017, "epoch": 3786} {"train_loss": -6.9463701248168945, "global_step": 159018, "epoch": 3786} {"train_loss": -6.832551956176758, "global_step": 159019, "epoch": 3786} {"train_loss": -6.904019832611084, "global_step": 159020, "epoch": 3786} {"train_loss": -6.80306339263916, "global_step": 159021, "epoch": 3786} {"train_loss": -6.824092388153076, "global_step": 159022, "epoch": 3786} {"train_loss": -6.8997650146484375, "global_step": 159023, "epoch": 3786} {"train_loss": -6.810606956481934, "global_step": 159024, "epoch": 3786} {"train_loss": -6.932948112487793, "global_step": 159025, "epoch": 3786} {"train_loss": -6.9038190841674805, "global_step": 159026, "epoch": 3786} {"train_loss": -6.877040386199951, "global_step": 159027, "epoch": 3786} {"train_loss": -6.864077091217041, "global_step": 159028, "epoch": 3786} {"train_loss": -6.826295852661133, "global_step": 159029, "epoch": 3786} {"train_loss": -6.89913272857666, "global_step": 159030, "epoch": 3786} {"train_loss": -6.792416095733643, "global_step": 159031, "epoch": 3786} {"train_loss": -6.87689208984375, "global_step": 159032, "epoch": 3786} {"train_loss": -6.914011001586914, "global_step": 159033, "epoch": 3786} {"train_loss": -6.784475326538086, "global_step": 159034, "epoch": 3786} {"train_loss": -6.8713059425354, "global_step": 159035, "epoch": 3786} {"train_loss": -6.858912944793701, "global_step": 159036, "epoch": 3786} {"train_loss": -6.908043384552002, "global_step": 159037, "epoch": 3786} {"train_loss": -6.880356311798096, "global_step": 159038, "epoch": 3786} {"train_loss": -6.872508525848389, "global_step": 159039, "epoch": 3786} {"train_loss": -6.865479469299316, "global_step": 159040, "epoch": 3786} {"train_loss": -6.874032020568848, "global_step": 159041, "epoch": 3786} {"train_loss": -6.901616096496582, "global_step": 159042, "epoch": 3786} {"train_loss": -6.890437126159668, "global_step": 159043, "epoch": 3786} {"train_loss": -6.922627925872803, "global_step": 159044, "epoch": 3786} {"train_loss": -6.900579452514648, "global_step": 159045, "epoch": 3786} {"train_loss": -6.996691703796387, "global_step": 159046, "epoch": 3786} {"train_loss": -6.860771656036377, "global_step": 159047, "epoch": 3786} {"train_loss": -6.955091953277588, "global_step": 159048, "epoch": 3786} {"train_loss": -6.883282661437988, "global_step": 159049, "epoch": 3786} {"train_loss": -6.884005546569824, "global_step": 159050, "epoch": 3786} {"train_loss": -6.884232521057129, "global_step": 159051, "epoch": 3786} {"train_loss": -7.023054122924805, "global_step": 159052, "epoch": 3786} {"train_loss": -6.870819727579753, "global_step": 159053, "epoch": 3786, "val_loss": 68724.1640625} {"train_loss": -6.8716936111450195, "global_step": 159054, "epoch": 3787} {"train_loss": -6.900045394897461, "global_step": 159055, "epoch": 3787} {"train_loss": -6.961672306060791, "global_step": 159056, "epoch": 3787} {"train_loss": -6.984445571899414, "global_step": 159057, "epoch": 3787} {"train_loss": -6.91566276550293, "global_step": 159058, "epoch": 3787} {"train_loss": -6.906230926513672, "global_step": 159059, "epoch": 3787} {"train_loss": -6.917318344116211, "global_step": 159060, "epoch": 3787} {"train_loss": -6.820182800292969, "global_step": 159061, "epoch": 3787} {"train_loss": -6.904748916625977, "global_step": 159062, "epoch": 3787} {"train_loss": -6.96165657043457, "global_step": 159063, "epoch": 3787} {"train_loss": -6.787869930267334, "global_step": 159064, "epoch": 3787} {"train_loss": -6.880085468292236, "global_step": 159065, "epoch": 3787} {"train_loss": -6.886357307434082, "global_step": 159066, "epoch": 3787} {"train_loss": -6.793220520019531, "global_step": 159067, "epoch": 3787} {"train_loss": -6.821906089782715, "global_step": 159068, "epoch": 3787} {"train_loss": -6.866642951965332, "global_step": 159069, "epoch": 3787} {"train_loss": -6.861147880554199, "global_step": 159070, "epoch": 3787} {"train_loss": -6.818657875061035, "global_step": 159071, "epoch": 3787} {"train_loss": -6.991560935974121, "global_step": 159072, "epoch": 3787} {"train_loss": -6.846504211425781, "global_step": 159073, "epoch": 3787} {"train_loss": -6.991743087768555, "global_step": 159074, "epoch": 3787} {"train_loss": -6.94526481628418, "global_step": 159075, "epoch": 3787} {"train_loss": -6.9723381996154785, "global_step": 159076, "epoch": 3787} {"train_loss": -6.993293762207031, "global_step": 159077, "epoch": 3787} {"train_loss": -6.930140018463135, "global_step": 159078, "epoch": 3787} {"train_loss": -7.025677680969238, "global_step": 159079, "epoch": 3787} {"train_loss": -7.022179126739502, "global_step": 159080, "epoch": 3787} {"train_loss": -6.901932716369629, "global_step": 159081, "epoch": 3787} {"train_loss": -7.003025054931641, "global_step": 159082, "epoch": 3787} {"train_loss": -6.964041709899902, "global_step": 159083, "epoch": 3787} {"train_loss": -6.873101234436035, "global_step": 159084, "epoch": 3787} {"train_loss": -6.74880838394165, "global_step": 159085, "epoch": 3787} {"train_loss": -6.9085693359375, "global_step": 159086, "epoch": 3787} {"train_loss": -6.963648796081543, "global_step": 159087, "epoch": 3787} {"train_loss": -6.886037826538086, "global_step": 159088, "epoch": 3787} {"train_loss": -6.989368438720703, "global_step": 159089, "epoch": 3787} {"train_loss": -6.951406478881836, "global_step": 159090, "epoch": 3787} {"train_loss": -6.981791019439697, "global_step": 159091, "epoch": 3787} {"train_loss": -6.981462478637695, "global_step": 159092, "epoch": 3787} {"train_loss": -6.885605812072754, "global_step": 159093, "epoch": 3787} {"train_loss": -6.982222557067871, "global_step": 159094, "epoch": 3787} {"train_loss": -6.914772578648159, "global_step": 159095, "epoch": 3787, "val_loss": 68581.6640625} {"train_loss": -7.037567615509033, "global_step": 159096, "epoch": 3788} {"train_loss": -6.944521427154541, "global_step": 159097, "epoch": 3788} {"train_loss": -6.773510932922363, "global_step": 159098, "epoch": 3788} {"train_loss": -6.881165027618408, "global_step": 159099, "epoch": 3788} {"train_loss": -6.956265926361084, "global_step": 159100, "epoch": 3788} {"train_loss": -6.785167694091797, "global_step": 159101, "epoch": 3788} {"train_loss": -6.77968692779541, "global_step": 159102, "epoch": 3788} {"train_loss": -6.850142002105713, "global_step": 159103, "epoch": 3788} {"train_loss": -6.873940467834473, "global_step": 159104, "epoch": 3788} {"train_loss": -6.851548194885254, "global_step": 159105, "epoch": 3788} {"train_loss": -6.800048351287842, "global_step": 159106, "epoch": 3788} {"train_loss": -6.843649864196777, "global_step": 159107, "epoch": 3788} {"train_loss": -6.876242160797119, "global_step": 159108, "epoch": 3788} {"train_loss": -6.898120403289795, "global_step": 159109, "epoch": 3788} {"train_loss": -6.884352207183838, "global_step": 159110, "epoch": 3788} {"train_loss": -6.90669059753418, "global_step": 159111, "epoch": 3788} {"train_loss": -6.934321403503418, "global_step": 159112, "epoch": 3788} {"train_loss": -6.759367942810059, "global_step": 159113, "epoch": 3788} {"train_loss": -6.930041313171387, "global_step": 159114, "epoch": 3788} {"train_loss": -6.9954094886779785, "global_step": 159115, "epoch": 3788} {"train_loss": -6.897011756896973, "global_step": 159116, "epoch": 3788} {"train_loss": -6.866962432861328, "global_step": 159117, "epoch": 3788} {"train_loss": -6.804920196533203, "global_step": 159118, "epoch": 3788} {"train_loss": -6.789009094238281, "global_step": 159119, "epoch": 3788} {"train_loss": -6.906103134155273, "global_step": 159120, "epoch": 3788} {"train_loss": -6.800685882568359, "global_step": 159121, "epoch": 3788} {"train_loss": -6.783388137817383, "global_step": 159122, "epoch": 3788} {"train_loss": -6.9432806968688965, "global_step": 159123, "epoch": 3788} {"train_loss": -6.831377029418945, "global_step": 159124, "epoch": 3788} {"train_loss": -6.882190704345703, "global_step": 159125, "epoch": 3788} {"train_loss": -6.832313537597656, "global_step": 159126, "epoch": 3788} {"train_loss": -6.783483028411865, "global_step": 159127, "epoch": 3788} {"train_loss": -6.972731590270996, "global_step": 159128, "epoch": 3788} {"train_loss": -6.89069938659668, "global_step": 159129, "epoch": 3788} {"train_loss": -6.982055187225342, "global_step": 159130, "epoch": 3788} {"train_loss": -6.839236736297607, "global_step": 159131, "epoch": 3788} {"train_loss": -6.977773189544678, "global_step": 159132, "epoch": 3788} {"train_loss": -6.924068927764893, "global_step": 159133, "epoch": 3788} {"train_loss": -6.891033172607422, "global_step": 159134, "epoch": 3788} {"train_loss": -6.938136100769043, "global_step": 159135, "epoch": 3788} {"train_loss": -6.809629440307617, "global_step": 159136, "epoch": 3788} {"train_loss": -6.874627919424148, "global_step": 159137, "epoch": 3788, "val_loss": 68661.6875} {"train_loss": -6.751727104187012, "global_step": 159138, "epoch": 3789} {"train_loss": -6.839961051940918, "global_step": 159139, "epoch": 3789} {"train_loss": -6.935843467712402, "global_step": 159140, "epoch": 3789} {"train_loss": -6.869998931884766, "global_step": 159141, "epoch": 3789} {"train_loss": -6.818728446960449, "global_step": 159142, "epoch": 3789} {"train_loss": -6.873802661895752, "global_step": 159143, "epoch": 3789} {"train_loss": -6.896691799163818, "global_step": 159144, "epoch": 3789} {"train_loss": -7.002623558044434, "global_step": 159145, "epoch": 3789} {"train_loss": -6.943600177764893, "global_step": 159146, "epoch": 3789} {"train_loss": -6.783987998962402, "global_step": 159147, "epoch": 3789} {"train_loss": -6.918066024780273, "global_step": 159148, "epoch": 3789} {"train_loss": -7.000583648681641, "global_step": 159149, "epoch": 3789} {"train_loss": -6.772592067718506, "global_step": 159150, "epoch": 3789} {"train_loss": -6.812478542327881, "global_step": 159151, "epoch": 3789} {"train_loss": -6.687008857727051, "global_step": 159152, "epoch": 3789} {"train_loss": -6.8213396072387695, "global_step": 159153, "epoch": 3789} {"train_loss": -6.966057777404785, "global_step": 159154, "epoch": 3789} {"train_loss": -6.9629034996032715, "global_step": 159155, "epoch": 3789} {"train_loss": -7.005124092102051, "global_step": 159156, "epoch": 3789} {"train_loss": -6.888926029205322, "global_step": 159157, "epoch": 3789} {"train_loss": -6.89900016784668, "global_step": 159158, "epoch": 3789} {"train_loss": -7.005179405212402, "global_step": 159159, "epoch": 3789} {"train_loss": -6.788210868835449, "global_step": 159160, "epoch": 3789} {"train_loss": -6.946977615356445, "global_step": 159161, "epoch": 3789} {"train_loss": -6.822225570678711, "global_step": 159162, "epoch": 3789} {"train_loss": -6.927844047546387, "global_step": 159163, "epoch": 3789} {"train_loss": -6.819293975830078, "global_step": 159164, "epoch": 3789} {"train_loss": -6.889480113983154, "global_step": 159165, "epoch": 3789} {"train_loss": -6.768490791320801, "global_step": 159166, "epoch": 3789} {"train_loss": -6.941262245178223, "global_step": 159167, "epoch": 3789} {"train_loss": -6.845070838928223, "global_step": 159168, "epoch": 3789} {"train_loss": -6.800079822540283, "global_step": 159169, "epoch": 3789} {"train_loss": -6.743805885314941, "global_step": 159170, "epoch": 3789} {"train_loss": -6.9437761306762695, "global_step": 159171, "epoch": 3789} {"train_loss": -6.780673980712891, "global_step": 159172, "epoch": 3789} {"train_loss": -6.897970676422119, "global_step": 159173, "epoch": 3789} {"train_loss": -6.812310695648193, "global_step": 159174, "epoch": 3789} {"train_loss": -6.683595657348633, "global_step": 159175, "epoch": 3789} {"train_loss": -6.877747535705566, "global_step": 159176, "epoch": 3789} {"train_loss": -6.776698112487793, "global_step": 159177, "epoch": 3789} {"train_loss": -6.916074752807617, "global_step": 159178, "epoch": 3789} {"train_loss": -6.863790455318632, "global_step": 159179, "epoch": 3789, "val_loss": 68524.125} {"train_loss": -6.969764232635498, "global_step": 159180, "epoch": 3790} {"train_loss": -6.786243438720703, "global_step": 159181, "epoch": 3790} {"train_loss": -6.935945510864258, "global_step": 159182, "epoch": 3790} {"train_loss": -7.0174970626831055, "global_step": 159183, "epoch": 3790} {"train_loss": -6.890859603881836, "global_step": 159184, "epoch": 3790} {"train_loss": -6.959668159484863, "global_step": 159185, "epoch": 3790} {"train_loss": -6.866938591003418, "global_step": 159186, "epoch": 3790} {"train_loss": -6.958008766174316, "global_step": 159187, "epoch": 3790} {"train_loss": -6.921719551086426, "global_step": 159188, "epoch": 3790} {"train_loss": -6.9316205978393555, "global_step": 159189, "epoch": 3790} {"train_loss": -6.973563194274902, "global_step": 159190, "epoch": 3790} {"train_loss": -6.940312385559082, "global_step": 159191, "epoch": 3790} {"train_loss": -6.935513019561768, "global_step": 159192, "epoch": 3790} {"train_loss": -6.964376449584961, "global_step": 159193, "epoch": 3790} {"train_loss": -7.031403541564941, "global_step": 159194, "epoch": 3790} {"train_loss": -6.999412536621094, "global_step": 159195, "epoch": 3790} {"train_loss": -7.038507461547852, "global_step": 159196, "epoch": 3790} {"train_loss": -6.937248706817627, "global_step": 159197, "epoch": 3790} {"train_loss": -6.912126541137695, "global_step": 159198, "epoch": 3790} {"train_loss": -7.000030994415283, "global_step": 159199, "epoch": 3790} {"train_loss": -7.02933931350708, "global_step": 159200, "epoch": 3790} {"train_loss": -6.978994369506836, "global_step": 159201, "epoch": 3790} {"train_loss": -6.978639125823975, "global_step": 159202, "epoch": 3790} {"train_loss": -6.839289665222168, "global_step": 159203, "epoch": 3790} {"train_loss": -6.947439193725586, "global_step": 159204, "epoch": 3790} {"train_loss": -6.902555465698242, "global_step": 159205, "epoch": 3790} {"train_loss": -6.962327003479004, "global_step": 159206, "epoch": 3790} {"train_loss": -6.942258834838867, "global_step": 159207, "epoch": 3790} {"train_loss": -6.838404655456543, "global_step": 159208, "epoch": 3790} {"train_loss": -6.914947509765625, "global_step": 159209, "epoch": 3790} {"train_loss": -6.760148525238037, "global_step": 159210, "epoch": 3790} {"train_loss": -6.867952823638916, "global_step": 159211, "epoch": 3790} {"train_loss": -6.8001708984375, "global_step": 159212, "epoch": 3790} {"train_loss": -6.87156343460083, "global_step": 159213, "epoch": 3790} {"train_loss": -7.041565895080566, "global_step": 159214, "epoch": 3790} {"train_loss": -6.756412506103516, "global_step": 159215, "epoch": 3790} {"train_loss": -6.930187702178955, "global_step": 159216, "epoch": 3790} {"train_loss": -6.859945297241211, "global_step": 159217, "epoch": 3790} {"train_loss": -6.8822221755981445, "global_step": 159218, "epoch": 3790} {"train_loss": -6.931928634643555, "global_step": 159219, "epoch": 3790} {"train_loss": -6.83290433883667, "global_step": 159220, "epoch": 3790} {"train_loss": -6.9212737537565685, "global_step": 159221, "epoch": 3790, "val_loss": 68479.8359375} {"train_loss": -6.92449426651001, "global_step": 159222, "epoch": 3791} {"train_loss": -6.883437633514404, "global_step": 159223, "epoch": 3791} {"train_loss": -6.858841896057129, "global_step": 159224, "epoch": 3791} {"train_loss": -6.945507526397705, "global_step": 159225, "epoch": 3791} {"train_loss": -6.895841121673584, "global_step": 159226, "epoch": 3791} {"train_loss": -6.870149612426758, "global_step": 159227, "epoch": 3791} {"train_loss": -6.943562984466553, "global_step": 159228, "epoch": 3791} {"train_loss": -6.756471633911133, "global_step": 159229, "epoch": 3791} {"train_loss": -6.796026229858398, "global_step": 159230, "epoch": 3791} {"train_loss": -6.851953506469727, "global_step": 159231, "epoch": 3791} {"train_loss": -6.724842548370361, "global_step": 159232, "epoch": 3791} {"train_loss": -6.906162738800049, "global_step": 159233, "epoch": 3791} {"train_loss": -6.864524841308594, "global_step": 159234, "epoch": 3791} {"train_loss": -6.862239837646484, "global_step": 159235, "epoch": 3791} {"train_loss": -6.8808417320251465, "global_step": 159236, "epoch": 3791} {"train_loss": -6.907220840454102, "global_step": 159237, "epoch": 3791} {"train_loss": -6.810731887817383, "global_step": 159238, "epoch": 3791} {"train_loss": -6.935391426086426, "global_step": 159239, "epoch": 3791} {"train_loss": -6.846975326538086, "global_step": 159240, "epoch": 3791} {"train_loss": -6.87759256362915, "global_step": 159241, "epoch": 3791} {"train_loss": -6.909082412719727, "global_step": 159242, "epoch": 3791} {"train_loss": -6.869706630706787, "global_step": 159243, "epoch": 3791} {"train_loss": -6.781379222869873, "global_step": 159244, "epoch": 3791} {"train_loss": -6.83258056640625, "global_step": 159245, "epoch": 3791} {"train_loss": -6.824163913726807, "global_step": 159246, "epoch": 3791} {"train_loss": -6.7401275634765625, "global_step": 159247, "epoch": 3791} {"train_loss": -6.854135990142822, "global_step": 159248, "epoch": 3791} {"train_loss": -6.597173690795898, "global_step": 159249, "epoch": 3791} {"train_loss": -6.7931227684021, "global_step": 159250, "epoch": 3791} {"train_loss": -6.940656661987305, "global_step": 159251, "epoch": 3791} {"train_loss": -6.7345685958862305, "global_step": 159252, "epoch": 3791} {"train_loss": -6.836816787719727, "global_step": 159253, "epoch": 3791} {"train_loss": -6.80805778503418, "global_step": 159254, "epoch": 3791} {"train_loss": -6.7798027992248535, "global_step": 159255, "epoch": 3791} {"train_loss": -6.691922187805176, "global_step": 159256, "epoch": 3791} {"train_loss": -6.819421768188477, "global_step": 159257, "epoch": 3791} {"train_loss": -6.841925621032715, "global_step": 159258, "epoch": 3791} {"train_loss": -6.726609230041504, "global_step": 159259, "epoch": 3791} {"train_loss": -6.763077735900879, "global_step": 159260, "epoch": 3791} {"train_loss": -6.784306049346924, "global_step": 159261, "epoch": 3791} {"train_loss": -6.845734119415283, "global_step": 159262, "epoch": 3791} {"train_loss": -6.831649916512625, "global_step": 159263, "epoch": 3791, "val_loss": 68562.8984375} {"train_loss": -6.8796234130859375, "global_step": 159264, "epoch": 3792} {"train_loss": -6.837759971618652, "global_step": 159265, "epoch": 3792} {"train_loss": -6.782329559326172, "global_step": 159266, "epoch": 3792} {"train_loss": -6.950064182281494, "global_step": 159267, "epoch": 3792} {"train_loss": -6.845305919647217, "global_step": 159268, "epoch": 3792} {"train_loss": -7.001346588134766, "global_step": 159269, "epoch": 3792} {"train_loss": -6.890625, "global_step": 159270, "epoch": 3792} {"train_loss": -6.911438941955566, "global_step": 159271, "epoch": 3792} {"train_loss": -6.912827491760254, "global_step": 159272, "epoch": 3792} {"train_loss": -6.900778293609619, "global_step": 159273, "epoch": 3792} {"train_loss": -6.9533538818359375, "global_step": 159274, "epoch": 3792} {"train_loss": -6.7758026123046875, "global_step": 159275, "epoch": 3792} {"train_loss": -6.920598030090332, "global_step": 159276, "epoch": 3792} {"train_loss": -6.719839572906494, "global_step": 159277, "epoch": 3792} {"train_loss": -6.9456787109375, "global_step": 159278, "epoch": 3792} {"train_loss": -6.876246929168701, "global_step": 159279, "epoch": 3792} {"train_loss": -6.9385504722595215, "global_step": 159280, "epoch": 3792} {"train_loss": -6.8844218254089355, "global_step": 159281, "epoch": 3792} {"train_loss": -6.8017683029174805, "global_step": 159282, "epoch": 3792} {"train_loss": -7.034421443939209, "global_step": 159283, "epoch": 3792} {"train_loss": -6.8677167892456055, "global_step": 159284, "epoch": 3792} {"train_loss": -6.773404121398926, "global_step": 159285, "epoch": 3792} {"train_loss": -6.8676605224609375, "global_step": 159286, "epoch": 3792} {"train_loss": -6.905442714691162, "global_step": 159287, "epoch": 3792} {"train_loss": -6.868802547454834, "global_step": 159288, "epoch": 3792} {"train_loss": -6.771795272827148, "global_step": 159289, "epoch": 3792} {"train_loss": -6.8949294090271, "global_step": 159290, "epoch": 3792} {"train_loss": -7.028213024139404, "global_step": 159291, "epoch": 3792} {"train_loss": -6.905341625213623, "global_step": 159292, "epoch": 3792} {"train_loss": -6.896924018859863, "global_step": 159293, "epoch": 3792} {"train_loss": -6.92338228225708, "global_step": 159294, "epoch": 3792} {"train_loss": -6.915458679199219, "global_step": 159295, "epoch": 3792} {"train_loss": -6.890585899353027, "global_step": 159296, "epoch": 3792} {"train_loss": -6.9784650802612305, "global_step": 159297, "epoch": 3792} {"train_loss": -6.939878940582275, "global_step": 159298, "epoch": 3792} {"train_loss": -6.837831497192383, "global_step": 159299, "epoch": 3792} {"train_loss": -6.948657989501953, "global_step": 159300, "epoch": 3792} {"train_loss": -6.970959663391113, "global_step": 159301, "epoch": 3792} {"train_loss": -6.849337577819824, "global_step": 159302, "epoch": 3792} {"train_loss": -6.941550254821777, "global_step": 159303, "epoch": 3792} {"train_loss": -6.927357196807861, "global_step": 159304, "epoch": 3792} {"train_loss": -6.897028094246274, "global_step": 159305, "epoch": 3792, "val_loss": 68573.3828125} {"train_loss": -6.9164910316467285, "global_step": 159306, "epoch": 3793} {"train_loss": -6.867666244506836, "global_step": 159307, "epoch": 3793} {"train_loss": -6.9772796630859375, "global_step": 159308, "epoch": 3793} {"train_loss": -6.910845756530762, "global_step": 159309, "epoch": 3793} {"train_loss": -7.040467262268066, "global_step": 159310, "epoch": 3793} {"train_loss": -6.903595447540283, "global_step": 159311, "epoch": 3793} {"train_loss": -6.977433681488037, "global_step": 159312, "epoch": 3793} {"train_loss": -6.93550968170166, "global_step": 159313, "epoch": 3793} {"train_loss": -6.882634162902832, "global_step": 159314, "epoch": 3793} {"train_loss": -6.972562789916992, "global_step": 159315, "epoch": 3793} {"train_loss": -6.922206401824951, "global_step": 159316, "epoch": 3793} {"train_loss": -6.898259162902832, "global_step": 159317, "epoch": 3793} {"train_loss": -6.73515510559082, "global_step": 159318, "epoch": 3793} {"train_loss": -6.853999614715576, "global_step": 159319, "epoch": 3793} {"train_loss": -6.847198009490967, "global_step": 159320, "epoch": 3793} {"train_loss": -6.869962215423584, "global_step": 159321, "epoch": 3793} {"train_loss": -6.937436580657959, "global_step": 159322, "epoch": 3793} {"train_loss": -6.884275913238525, "global_step": 159323, "epoch": 3793} {"train_loss": -6.86604118347168, "global_step": 159324, "epoch": 3793} {"train_loss": -6.808338642120361, "global_step": 159325, "epoch": 3793} {"train_loss": -6.937661647796631, "global_step": 159326, "epoch": 3793} {"train_loss": -6.770885944366455, "global_step": 159327, "epoch": 3793} {"train_loss": -6.862700462341309, "global_step": 159328, "epoch": 3793} {"train_loss": -6.96901273727417, "global_step": 159329, "epoch": 3793} {"train_loss": -6.873802185058594, "global_step": 159330, "epoch": 3793} {"train_loss": -6.901185035705566, "global_step": 159331, "epoch": 3793} {"train_loss": -6.912769317626953, "global_step": 159332, "epoch": 3793} {"train_loss": -6.9170660972595215, "global_step": 159333, "epoch": 3793} {"train_loss": -6.893594264984131, "global_step": 159334, "epoch": 3793} {"train_loss": -6.882978439331055, "global_step": 159335, "epoch": 3793} {"train_loss": -6.967545032501221, "global_step": 159336, "epoch": 3793} {"train_loss": -6.941076278686523, "global_step": 159337, "epoch": 3793} {"train_loss": -6.985836982727051, "global_step": 159338, "epoch": 3793} {"train_loss": -6.816959381103516, "global_step": 159339, "epoch": 3793} {"train_loss": -6.854931831359863, "global_step": 159340, "epoch": 3793} {"train_loss": -6.889540672302246, "global_step": 159341, "epoch": 3793} {"train_loss": -6.961135387420654, "global_step": 159342, "epoch": 3793} {"train_loss": -6.840145111083984, "global_step": 159343, "epoch": 3793} {"train_loss": -6.946824073791504, "global_step": 159344, "epoch": 3793} {"train_loss": -6.911632537841797, "global_step": 159345, "epoch": 3793} {"train_loss": -6.893973350524902, "global_step": 159346, "epoch": 3793} {"train_loss": -6.900902384803409, "global_step": 159347, "epoch": 3793, "val_loss": 68486.75} {"train_loss": -6.9807820320129395, "global_step": 159348, "epoch": 3794} {"train_loss": -7.0017781257629395, "global_step": 159349, "epoch": 3794} {"train_loss": -6.891945838928223, "global_step": 159350, "epoch": 3794} {"train_loss": -6.86181116104126, "global_step": 159351, "epoch": 3794} {"train_loss": -7.041791915893555, "global_step": 159352, "epoch": 3794} {"train_loss": -6.860588073730469, "global_step": 159353, "epoch": 3794} {"train_loss": -6.821436882019043, "global_step": 159354, "epoch": 3794} {"train_loss": -6.854581832885742, "global_step": 159355, "epoch": 3794} {"train_loss": -6.957494735717773, "global_step": 159356, "epoch": 3794} {"train_loss": -6.959820747375488, "global_step": 159357, "epoch": 3794} {"train_loss": -6.880310535430908, "global_step": 159358, "epoch": 3794} {"train_loss": -7.070155143737793, "global_step": 159359, "epoch": 3794} {"train_loss": -6.902993202209473, "global_step": 159360, "epoch": 3794} {"train_loss": -6.934992790222168, "global_step": 159361, "epoch": 3794} {"train_loss": -6.837186813354492, "global_step": 159362, "epoch": 3794} {"train_loss": -6.929574489593506, "global_step": 159363, "epoch": 3794} {"train_loss": -6.879027366638184, "global_step": 159364, "epoch": 3794} {"train_loss": -6.8754167556762695, "global_step": 159365, "epoch": 3794} {"train_loss": -7.021125793457031, "global_step": 159366, "epoch": 3794} {"train_loss": -6.885316848754883, "global_step": 159367, "epoch": 3794} {"train_loss": -6.852212905883789, "global_step": 159368, "epoch": 3794} {"train_loss": -6.811004638671875, "global_step": 159369, "epoch": 3794} {"train_loss": -6.978114128112793, "global_step": 159370, "epoch": 3794} {"train_loss": -6.803409576416016, "global_step": 159371, "epoch": 3794} {"train_loss": -6.947993278503418, "global_step": 159372, "epoch": 3794} {"train_loss": -6.788921356201172, "global_step": 159373, "epoch": 3794} {"train_loss": -6.74446439743042, "global_step": 159374, "epoch": 3794} {"train_loss": -6.785342693328857, "global_step": 159375, "epoch": 3794} {"train_loss": -6.885593414306641, "global_step": 159376, "epoch": 3794} {"train_loss": -6.89199686050415, "global_step": 159377, "epoch": 3794} {"train_loss": -6.88908576965332, "global_step": 159378, "epoch": 3794} {"train_loss": -6.809678077697754, "global_step": 159379, "epoch": 3794} {"train_loss": -6.924099922180176, "global_step": 159380, "epoch": 3794} {"train_loss": -6.892251014709473, "global_step": 159381, "epoch": 3794} {"train_loss": -6.831334590911865, "global_step": 159382, "epoch": 3794} {"train_loss": -6.837924957275391, "global_step": 159383, "epoch": 3794} {"train_loss": -6.673027038574219, "global_step": 159384, "epoch": 3794} {"train_loss": -6.802207946777344, "global_step": 159385, "epoch": 3794} {"train_loss": -6.83064603805542, "global_step": 159386, "epoch": 3794} {"train_loss": -6.694519519805908, "global_step": 159387, "epoch": 3794} {"train_loss": -6.80972957611084, "global_step": 159388, "epoch": 3794} {"train_loss": -6.871064492634365, "global_step": 159389, "epoch": 3794, "val_loss": 68695.7421875} {"train_loss": -6.776376247406006, "global_step": 159390, "epoch": 3795} {"train_loss": -6.645719051361084, "global_step": 159391, "epoch": 3795} {"train_loss": -6.855582237243652, "global_step": 159392, "epoch": 3795} {"train_loss": -6.570673942565918, "global_step": 159393, "epoch": 3795} {"train_loss": -6.753073692321777, "global_step": 159394, "epoch": 3795} {"train_loss": -6.808042526245117, "global_step": 159395, "epoch": 3795} {"train_loss": -6.892236709594727, "global_step": 159396, "epoch": 3795} {"train_loss": -6.741513252258301, "global_step": 159397, "epoch": 3795} {"train_loss": -6.82578182220459, "global_step": 159398, "epoch": 3795} {"train_loss": -6.848191738128662, "global_step": 159399, "epoch": 3795} {"train_loss": -6.787671089172363, "global_step": 159400, "epoch": 3795} {"train_loss": -6.862820625305176, "global_step": 159401, "epoch": 3795} {"train_loss": -6.8348236083984375, "global_step": 159402, "epoch": 3795} {"train_loss": -6.864287853240967, "global_step": 159403, "epoch": 3795} {"train_loss": -6.749902248382568, "global_step": 159404, "epoch": 3795} {"train_loss": -6.971424102783203, "global_step": 159405, "epoch": 3795} {"train_loss": -6.709867477416992, "global_step": 159406, "epoch": 3795} {"train_loss": -6.906491279602051, "global_step": 159407, "epoch": 3795} {"train_loss": -6.766884803771973, "global_step": 159408, "epoch": 3795} {"train_loss": -7.0340256690979, "global_step": 159409, "epoch": 3795} {"train_loss": -6.846608638763428, "global_step": 159410, "epoch": 3795} {"train_loss": -6.8406219482421875, "global_step": 159411, "epoch": 3795} {"train_loss": -6.762337684631348, "global_step": 159412, "epoch": 3795} {"train_loss": -6.84987735748291, "global_step": 159413, "epoch": 3795} {"train_loss": -6.897982597351074, "global_step": 159414, "epoch": 3795} {"train_loss": -6.837521553039551, "global_step": 159415, "epoch": 3795} {"train_loss": -6.874416351318359, "global_step": 159416, "epoch": 3795} {"train_loss": -6.847941875457764, "global_step": 159417, "epoch": 3795} {"train_loss": -6.766568660736084, "global_step": 159418, "epoch": 3795} {"train_loss": -6.826458930969238, "global_step": 159419, "epoch": 3795} {"train_loss": -6.624325752258301, "global_step": 159420, "epoch": 3795} {"train_loss": -6.8684234619140625, "global_step": 159421, "epoch": 3795} {"train_loss": -6.811766624450684, "global_step": 159422, "epoch": 3795} {"train_loss": -6.856839179992676, "global_step": 159423, "epoch": 3795} {"train_loss": -6.830609321594238, "global_step": 159424, "epoch": 3795} {"train_loss": -6.803267478942871, "global_step": 159425, "epoch": 3795} {"train_loss": -6.782796382904053, "global_step": 159426, "epoch": 3795} {"train_loss": -6.90323543548584, "global_step": 159427, "epoch": 3795} {"train_loss": -6.871408462524414, "global_step": 159428, "epoch": 3795} {"train_loss": -6.869021415710449, "global_step": 159429, "epoch": 3795} {"train_loss": -6.847414016723633, "global_step": 159430, "epoch": 3795} {"train_loss": -6.818755013602121, "global_step": 159431, "epoch": 3795, "val_loss": 68649.140625} {"train_loss": -6.791532516479492, "global_step": 159432, "epoch": 3796} {"train_loss": -6.796256065368652, "global_step": 159433, "epoch": 3796} {"train_loss": -6.796124458312988, "global_step": 159434, "epoch": 3796} {"train_loss": -6.780313491821289, "global_step": 159435, "epoch": 3796} {"train_loss": -6.838140487670898, "global_step": 159436, "epoch": 3796} {"train_loss": -6.910725116729736, "global_step": 159437, "epoch": 3796} {"train_loss": -6.778555870056152, "global_step": 159438, "epoch": 3796} {"train_loss": -6.964791774749756, "global_step": 159439, "epoch": 3796} {"train_loss": -6.76807975769043, "global_step": 159440, "epoch": 3796} {"train_loss": -6.832435131072998, "global_step": 159441, "epoch": 3796} {"train_loss": -6.875974178314209, "global_step": 159442, "epoch": 3796} {"train_loss": -6.9903974533081055, "global_step": 159443, "epoch": 3796} {"train_loss": -6.801724433898926, "global_step": 159444, "epoch": 3796} {"train_loss": -6.94257926940918, "global_step": 159445, "epoch": 3796} {"train_loss": -6.832603454589844, "global_step": 159446, "epoch": 3796} {"train_loss": -6.949082374572754, "global_step": 159447, "epoch": 3796} {"train_loss": -6.907814025878906, "global_step": 159448, "epoch": 3796} {"train_loss": -6.755486488342285, "global_step": 159449, "epoch": 3796} {"train_loss": -6.9423041343688965, "global_step": 159450, "epoch": 3796} {"train_loss": -6.865264892578125, "global_step": 159451, "epoch": 3796} {"train_loss": -6.824932098388672, "global_step": 159452, "epoch": 3796} {"train_loss": -7.044177055358887, "global_step": 159453, "epoch": 3796} {"train_loss": -6.900045394897461, "global_step": 159454, "epoch": 3796} {"train_loss": -6.90670108795166, "global_step": 159455, "epoch": 3796} {"train_loss": -7.006308078765869, "global_step": 159456, "epoch": 3796} {"train_loss": -6.8819899559021, "global_step": 159457, "epoch": 3796} {"train_loss": -7.023687839508057, "global_step": 159458, "epoch": 3796} {"train_loss": -6.787443161010742, "global_step": 159459, "epoch": 3796} {"train_loss": -6.808106899261475, "global_step": 159460, "epoch": 3796} {"train_loss": -6.940925598144531, "global_step": 159461, "epoch": 3796} {"train_loss": -6.9764299392700195, "global_step": 159462, "epoch": 3796} {"train_loss": -6.940752983093262, "global_step": 159463, "epoch": 3796} {"train_loss": -6.833820819854736, "global_step": 159464, "epoch": 3796} {"train_loss": -6.894648551940918, "global_step": 159465, "epoch": 3796} {"train_loss": -6.893134117126465, "global_step": 159466, "epoch": 3796} {"train_loss": -6.864323616027832, "global_step": 159467, "epoch": 3796} {"train_loss": -7.083229064941406, "global_step": 159468, "epoch": 3796} {"train_loss": -7.05609130859375, "global_step": 159469, "epoch": 3796} {"train_loss": -6.868878364562988, "global_step": 159470, "epoch": 3796} {"train_loss": -6.975187301635742, "global_step": 159471, "epoch": 3796} {"train_loss": -6.865993022918701, "global_step": 159472, "epoch": 3796} {"train_loss": -6.890747399557204, "global_step": 159473, "epoch": 3796, "val_loss": 68571.4453125} {"train_loss": -6.942630767822266, "global_step": 159474, "epoch": 3797} {"train_loss": -6.942773818969727, "global_step": 159475, "epoch": 3797} {"train_loss": -6.878685474395752, "global_step": 159476, "epoch": 3797} {"train_loss": -6.90076208114624, "global_step": 159477, "epoch": 3797} {"train_loss": -6.812420845031738, "global_step": 159478, "epoch": 3797} {"train_loss": -6.908535003662109, "global_step": 159479, "epoch": 3797} {"train_loss": -6.83689022064209, "global_step": 159480, "epoch": 3797} {"train_loss": -6.928967475891113, "global_step": 159481, "epoch": 3797} {"train_loss": -7.000075340270996, "global_step": 159482, "epoch": 3797} {"train_loss": -6.905182838439941, "global_step": 159483, "epoch": 3797} {"train_loss": -6.918907165527344, "global_step": 159484, "epoch": 3797} {"train_loss": -6.837283134460449, "global_step": 159485, "epoch": 3797} {"train_loss": -6.801347732543945, "global_step": 159486, "epoch": 3797} {"train_loss": -6.770455360412598, "global_step": 159487, "epoch": 3797} {"train_loss": -6.762205123901367, "global_step": 159488, "epoch": 3797} {"train_loss": -6.975162506103516, "global_step": 159489, "epoch": 3797} {"train_loss": -6.90666389465332, "global_step": 159490, "epoch": 3797} {"train_loss": -6.910426616668701, "global_step": 159491, "epoch": 3797} {"train_loss": -6.8237457275390625, "global_step": 159492, "epoch": 3797} {"train_loss": -6.827091693878174, "global_step": 159493, "epoch": 3797} {"train_loss": -6.962245941162109, "global_step": 159494, "epoch": 3797} {"train_loss": -6.893537521362305, "global_step": 159495, "epoch": 3797} {"train_loss": -6.940977096557617, "global_step": 159496, "epoch": 3797} {"train_loss": -6.836671829223633, "global_step": 159497, "epoch": 3797} {"train_loss": -6.875069618225098, "global_step": 159498, "epoch": 3797} {"train_loss": -6.953920364379883, "global_step": 159499, "epoch": 3797} {"train_loss": -6.77569580078125, "global_step": 159500, "epoch": 3797} {"train_loss": -6.830059051513672, "global_step": 159501, "epoch": 3797} {"train_loss": -6.836109638214111, "global_step": 159502, "epoch": 3797} {"train_loss": -6.880292892456055, "global_step": 159503, "epoch": 3797} {"train_loss": -6.868441581726074, "global_step": 159504, "epoch": 3797} {"train_loss": -6.945728302001953, "global_step": 159505, "epoch": 3797} {"train_loss": -6.851443290710449, "global_step": 159506, "epoch": 3797} {"train_loss": -6.881912708282471, "global_step": 159507, "epoch": 3797} {"train_loss": -6.930681228637695, "global_step": 159508, "epoch": 3797} {"train_loss": -6.966410160064697, "global_step": 159509, "epoch": 3797} {"train_loss": -6.847179412841797, "global_step": 159510, "epoch": 3797} {"train_loss": -6.90501594543457, "global_step": 159511, "epoch": 3797} {"train_loss": -6.902464866638184, "global_step": 159512, "epoch": 3797} {"train_loss": -6.950998783111572, "global_step": 159513, "epoch": 3797} {"train_loss": -6.856377124786377, "global_step": 159514, "epoch": 3797} {"train_loss": -6.8831231480553035, "global_step": 159515, "epoch": 3797, "val_loss": 68534.34375} {"train_loss": -6.839625835418701, "global_step": 159516, "epoch": 3798} {"train_loss": -6.836990833282471, "global_step": 159517, "epoch": 3798} {"train_loss": -6.899163246154785, "global_step": 159518, "epoch": 3798} {"train_loss": -6.974821090698242, "global_step": 159519, "epoch": 3798} {"train_loss": -6.897866725921631, "global_step": 159520, "epoch": 3798} {"train_loss": -6.939326286315918, "global_step": 159521, "epoch": 3798} {"train_loss": -6.908372402191162, "global_step": 159522, "epoch": 3798} {"train_loss": -6.9623517990112305, "global_step": 159523, "epoch": 3798} {"train_loss": -6.917575836181641, "global_step": 159524, "epoch": 3798} {"train_loss": -6.805639266967773, "global_step": 159525, "epoch": 3798} {"train_loss": -6.870553970336914, "global_step": 159526, "epoch": 3798} {"train_loss": -6.982161045074463, "global_step": 159527, "epoch": 3798} {"train_loss": -6.87051248550415, "global_step": 159528, "epoch": 3798} {"train_loss": -6.966705322265625, "global_step": 159529, "epoch": 3798} {"train_loss": -6.935194969177246, "global_step": 159530, "epoch": 3798} {"train_loss": -6.826059341430664, "global_step": 159531, "epoch": 3798} {"train_loss": -6.973071098327637, "global_step": 159532, "epoch": 3798} {"train_loss": -6.791995525360107, "global_step": 159533, "epoch": 3798} {"train_loss": -6.898255348205566, "global_step": 159534, "epoch": 3798} {"train_loss": -6.829705238342285, "global_step": 159535, "epoch": 3798} {"train_loss": -6.832622528076172, "global_step": 159536, "epoch": 3798} {"train_loss": -6.7911200523376465, "global_step": 159537, "epoch": 3798} {"train_loss": -6.794371604919434, "global_step": 159538, "epoch": 3798} {"train_loss": -6.980588912963867, "global_step": 159539, "epoch": 3798} {"train_loss": -6.904245853424072, "global_step": 159540, "epoch": 3798} {"train_loss": -6.78570556640625, "global_step": 159541, "epoch": 3798} {"train_loss": -6.984158515930176, "global_step": 159542, "epoch": 3798} {"train_loss": -6.76060676574707, "global_step": 159543, "epoch": 3798} {"train_loss": -6.950075149536133, "global_step": 159544, "epoch": 3798} {"train_loss": -6.7385430335998535, "global_step": 159545, "epoch": 3798} {"train_loss": -6.862431526184082, "global_step": 159546, "epoch": 3798} {"train_loss": -6.880377769470215, "global_step": 159547, "epoch": 3798} {"train_loss": -6.87349271774292, "global_step": 159548, "epoch": 3798} {"train_loss": -6.926421642303467, "global_step": 159549, "epoch": 3798} {"train_loss": -6.831024169921875, "global_step": 159550, "epoch": 3798} {"train_loss": -6.926726818084717, "global_step": 159551, "epoch": 3798} {"train_loss": -6.870171070098877, "global_step": 159552, "epoch": 3798} {"train_loss": -6.934640884399414, "global_step": 159553, "epoch": 3798} {"train_loss": -6.995762348175049, "global_step": 159554, "epoch": 3798} {"train_loss": -6.908315181732178, "global_step": 159555, "epoch": 3798} {"train_loss": -6.953840732574463, "global_step": 159556, "epoch": 3798} {"train_loss": -6.888132731119792, "global_step": 159557, "epoch": 3798, "val_loss": 68429.28125} {"train_loss": -6.882269382476807, "global_step": 159558, "epoch": 3799} {"train_loss": -6.8528900146484375, "global_step": 159559, "epoch": 3799} {"train_loss": -6.9955525398254395, "global_step": 159560, "epoch": 3799} {"train_loss": -6.893432140350342, "global_step": 159561, "epoch": 3799} {"train_loss": -6.958270072937012, "global_step": 159562, "epoch": 3799} {"train_loss": -6.89548397064209, "global_step": 159563, "epoch": 3799} {"train_loss": -6.938326835632324, "global_step": 159564, "epoch": 3799} {"train_loss": -6.889589786529541, "global_step": 159565, "epoch": 3799} {"train_loss": -6.986519813537598, "global_step": 159566, "epoch": 3799} {"train_loss": -6.888850212097168, "global_step": 159567, "epoch": 3799} {"train_loss": -6.882882118225098, "global_step": 159568, "epoch": 3799} {"train_loss": -6.996918678283691, "global_step": 159569, "epoch": 3799} {"train_loss": -6.95292854309082, "global_step": 159570, "epoch": 3799} {"train_loss": -6.932890892028809, "global_step": 159571, "epoch": 3799} {"train_loss": -6.858717918395996, "global_step": 159572, "epoch": 3799} {"train_loss": -6.880402565002441, "global_step": 159573, "epoch": 3799} {"train_loss": -6.925452709197998, "global_step": 159574, "epoch": 3799} {"train_loss": -6.958566665649414, "global_step": 159575, "epoch": 3799} {"train_loss": -6.951558589935303, "global_step": 159576, "epoch": 3799} {"train_loss": -6.983454704284668, "global_step": 159577, "epoch": 3799} {"train_loss": -6.945835590362549, "global_step": 159578, "epoch": 3799} {"train_loss": -6.940445423126221, "global_step": 159579, "epoch": 3799} {"train_loss": -6.885392665863037, "global_step": 159580, "epoch": 3799} {"train_loss": -6.921882629394531, "global_step": 159581, "epoch": 3799} {"train_loss": -6.978754997253418, "global_step": 159582, "epoch": 3799} {"train_loss": -6.991438865661621, "global_step": 159583, "epoch": 3799} {"train_loss": -7.018049240112305, "global_step": 159584, "epoch": 3799} {"train_loss": -6.911559581756592, "global_step": 159585, "epoch": 3799} {"train_loss": -6.92975378036499, "global_step": 159586, "epoch": 3799} {"train_loss": -7.002905368804932, "global_step": 159587, "epoch": 3799} {"train_loss": -6.946228981018066, "global_step": 159588, "epoch": 3799} {"train_loss": -6.822014808654785, "global_step": 159589, "epoch": 3799} {"train_loss": -6.893161296844482, "global_step": 159590, "epoch": 3799} {"train_loss": -6.875653266906738, "global_step": 159591, "epoch": 3799} {"train_loss": -6.9359540939331055, "global_step": 159592, "epoch": 3799} {"train_loss": -6.8377180099487305, "global_step": 159593, "epoch": 3799} {"train_loss": -6.819378852844238, "global_step": 159594, "epoch": 3799} {"train_loss": -6.95155143737793, "global_step": 159595, "epoch": 3799} {"train_loss": -6.838642120361328, "global_step": 159596, "epoch": 3799} {"train_loss": -6.940724849700928, "global_step": 159597, "epoch": 3799} {"train_loss": -6.8923187255859375, "global_step": 159598, "epoch": 3799} {"train_loss": -6.919782752082462, "global_step": 159599, "epoch": 3799, "val_loss": 68643.921875} {"train_loss": -7.019899845123291, "global_step": 159600, "epoch": 3800} {"train_loss": -6.859792709350586, "global_step": 159601, "epoch": 3800} {"train_loss": -6.872519016265869, "global_step": 159602, "epoch": 3800} {"train_loss": -6.814867973327637, "global_step": 159603, "epoch": 3800} {"train_loss": -6.8888325691223145, "global_step": 159604, "epoch": 3800} {"train_loss": -6.793410301208496, "global_step": 159605, "epoch": 3800} {"train_loss": -6.800350189208984, "global_step": 159606, "epoch": 3800} {"train_loss": -6.917715072631836, "global_step": 159607, "epoch": 3800} {"train_loss": -6.773439407348633, "global_step": 159608, "epoch": 3800} {"train_loss": -6.8690290451049805, "global_step": 159609, "epoch": 3800} {"train_loss": -6.850502967834473, "global_step": 159610, "epoch": 3800} {"train_loss": -6.878363609313965, "global_step": 159611, "epoch": 3800} {"train_loss": -6.904655456542969, "global_step": 159612, "epoch": 3800} {"train_loss": -6.820212364196777, "global_step": 159613, "epoch": 3800} {"train_loss": -6.899235725402832, "global_step": 159614, "epoch": 3800} {"train_loss": -6.731315612792969, "global_step": 159615, "epoch": 3800} {"train_loss": -6.915378570556641, "global_step": 159616, "epoch": 3800} {"train_loss": -6.986533164978027, "global_step": 159617, "epoch": 3800} {"train_loss": -6.949666976928711, "global_step": 159618, "epoch": 3800} {"train_loss": -6.796842098236084, "global_step": 159619, "epoch": 3800} {"train_loss": -6.7783098220825195, "global_step": 159620, "epoch": 3800} {"train_loss": -6.825232982635498, "global_step": 159621, "epoch": 3800} {"train_loss": -6.925321578979492, "global_step": 159622, "epoch": 3800} {"train_loss": -7.068965911865234, "global_step": 159623, "epoch": 3800} {"train_loss": -6.8359055519104, "global_step": 159624, "epoch": 3800} {"train_loss": -6.910571098327637, "global_step": 159625, "epoch": 3800} {"train_loss": -6.844240188598633, "global_step": 159626, "epoch": 3800} {"train_loss": -6.77828311920166, "global_step": 159627, "epoch": 3800} {"train_loss": -6.98179817199707, "global_step": 159628, "epoch": 3800} {"train_loss": -7.01239013671875, "global_step": 159629, "epoch": 3800} {"train_loss": -6.968001365661621, "global_step": 159630, "epoch": 3800} {"train_loss": -7.006353378295898, "global_step": 159631, "epoch": 3800} {"train_loss": -6.980676651000977, "global_step": 159632, "epoch": 3800} {"train_loss": -6.889819145202637, "global_step": 159633, "epoch": 3800} {"train_loss": -6.947175025939941, "global_step": 159634, "epoch": 3800} {"train_loss": -6.963355541229248, "global_step": 159635, "epoch": 3800} {"train_loss": -7.011752128601074, "global_step": 159636, "epoch": 3800} {"train_loss": -6.815980911254883, "global_step": 159637, "epoch": 3800} {"train_loss": -7.0281982421875, "global_step": 159638, "epoch": 3800} {"train_loss": -7.013121604919434, "global_step": 159639, "epoch": 3800} {"train_loss": -6.908711910247803, "global_step": 159640, "epoch": 3800} {"train_loss": -6.899045671735491, "global_step": 159641, "epoch": 3800, "train/sim_max_reward_0": 0.2236067280158624, "train/sim_max_reward_1": 0.9707245017961373, "train/sim_max_reward_2": 0.35144843805989623, "train/sim_max_reward_3": 0.12932443938792001, "train/sim_max_reward_4": 0.9738663722755758, "train/sim_max_reward_5": 0.9072772208850604, "test/sim_max_reward_4400000": 0.9013853947659063, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.9394841361146321, "test/sim_max_reward_4400003": 0.9519317638176502, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9663663556234887, "test/sim_max_reward_4400006": 0.9813098380818462, "test/sim_max_reward_4400007": 0.9409513568944299, "test/sim_max_reward_4400008": 0.2997362813652982, "test/sim_max_reward_4400009": 0.8569287854399228, "test/sim_max_reward_4400010": 0.19230957373813837, "test/sim_max_reward_4400011": 0.24916368764863236, "test/sim_max_reward_4400012": 0.9334572657234605, "test/sim_max_reward_4400013": 0.9963333789403195, "test/sim_max_reward_4400014": 0.8299312326841036, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.1609148450027336, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.25143428095224957, "test/sim_max_reward_4400019": 0.3572976448910281, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9619432219567362, "test/sim_max_reward_4400023": 0.9719974594241265, "test/sim_max_reward_4400024": 0.9209538967740147, "test/sim_max_reward_4400025": 0.2638045353419337, "test/sim_max_reward_4400026": 0.820944773363127, "test/sim_max_reward_4400027": 0.023159308084104834, "test/sim_max_reward_4400028": 0.812331344158441, "test/sim_max_reward_4400029": 0.4398900000016837, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9539132405770036, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8304857855457403, "test/sim_max_reward_4400034": 0.9936610898793644, "test/sim_max_reward_4400035": 0.3955781887891834, "test/sim_max_reward_4400036": 0.33418488841901406, "test/sim_max_reward_4400037": 0.9300658372196403, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9825033572117985, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.815247563117031, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9300140120967756, "test/sim_max_reward_4400045": 0.9926701904697011, "test/sim_max_reward_4400046": 0.6748257373556956, "test/sim_max_reward_4400047": 0.9559664454100777, "test/sim_max_reward_4400048": 0.8968350929522375, "test/sim_max_reward_4400049": 0.982064581965966, "train/mean_score": 0.5927079500700754, "test/mean_score": 0.6633041240434226, "val_loss": 68535.4453125} {"train_loss": -7.030055522918701, "global_step": 159642, "epoch": 3801} {"train_loss": -7.03626012802124, "global_step": 159643, "epoch": 3801} {"train_loss": -7.070291519165039, "global_step": 159644, "epoch": 3801} {"train_loss": -6.902553081512451, "global_step": 159645, "epoch": 3801} {"train_loss": -6.936338424682617, "global_step": 159646, "epoch": 3801} {"train_loss": -6.960143089294434, "global_step": 159647, "epoch": 3801} {"train_loss": -6.846738815307617, "global_step": 159648, "epoch": 3801} {"train_loss": -7.082956790924072, "global_step": 159649, "epoch": 3801} {"train_loss": -7.004354476928711, "global_step": 159650, "epoch": 3801} {"train_loss": -6.958540916442871, "global_step": 159651, "epoch": 3801} {"train_loss": -6.918384075164795, "global_step": 159652, "epoch": 3801} {"train_loss": -6.962218284606934, "global_step": 159653, "epoch": 3801} {"train_loss": -6.99461555480957, "global_step": 159654, "epoch": 3801} {"train_loss": -7.129343509674072, "global_step": 159655, "epoch": 3801} {"train_loss": -6.931188583374023, "global_step": 159656, "epoch": 3801} {"train_loss": -6.956179618835449, "global_step": 159657, "epoch": 3801} {"train_loss": -6.990169048309326, "global_step": 159658, "epoch": 3801} {"train_loss": -6.892893314361572, "global_step": 159659, "epoch": 3801} {"train_loss": -6.8716278076171875, "global_step": 159660, "epoch": 3801} {"train_loss": -6.992191314697266, "global_step": 159661, "epoch": 3801} {"train_loss": -6.950012683868408, "global_step": 159662, "epoch": 3801} {"train_loss": -6.9307451248168945, "global_step": 159663, "epoch": 3801} {"train_loss": -6.881983757019043, "global_step": 159664, "epoch": 3801} {"train_loss": -6.809109687805176, "global_step": 159665, "epoch": 3801} {"train_loss": -6.945047855377197, "global_step": 159666, "epoch": 3801} {"train_loss": -6.853048324584961, "global_step": 159667, "epoch": 3801} {"train_loss": -6.842959880828857, "global_step": 159668, "epoch": 3801} {"train_loss": -6.829367637634277, "global_step": 159669, "epoch": 3801} {"train_loss": -6.886883735656738, "global_step": 159670, "epoch": 3801} {"train_loss": -6.869632720947266, "global_step": 159671, "epoch": 3801} {"train_loss": -6.902439117431641, "global_step": 159672, "epoch": 3801} {"train_loss": -6.650142669677734, "global_step": 159673, "epoch": 3801} {"train_loss": -6.889892101287842, "global_step": 159674, "epoch": 3801} {"train_loss": -6.805089950561523, "global_step": 159675, "epoch": 3801} {"train_loss": -6.651466369628906, "global_step": 159676, "epoch": 3801} {"train_loss": -6.810671806335449, "global_step": 159677, "epoch": 3801} {"train_loss": -6.783084869384766, "global_step": 159678, "epoch": 3801} {"train_loss": -6.753912925720215, "global_step": 159679, "epoch": 3801} {"train_loss": -6.83117151260376, "global_step": 159680, "epoch": 3801} {"train_loss": -6.787997722625732, "global_step": 159681, "epoch": 3801} {"train_loss": -6.92593240737915, "global_step": 159682, "epoch": 3801} {"train_loss": -6.8999705995832175, "global_step": 159683, "epoch": 3801, "val_loss": 68537.6171875} {"train_loss": -6.853676795959473, "global_step": 159684, "epoch": 3802} {"train_loss": -6.842494964599609, "global_step": 159685, "epoch": 3802} {"train_loss": -6.968014717102051, "global_step": 159686, "epoch": 3802} {"train_loss": -6.948786735534668, "global_step": 159687, "epoch": 3802} {"train_loss": -6.850640773773193, "global_step": 159688, "epoch": 3802} {"train_loss": -6.94725227355957, "global_step": 159689, "epoch": 3802} {"train_loss": -6.891305923461914, "global_step": 159690, "epoch": 3802} {"train_loss": -6.687073707580566, "global_step": 159691, "epoch": 3802} {"train_loss": -6.915648460388184, "global_step": 159692, "epoch": 3802} {"train_loss": -6.692502975463867, "global_step": 159693, "epoch": 3802} {"train_loss": -6.775190353393555, "global_step": 159694, "epoch": 3802} {"train_loss": -6.87318229675293, "global_step": 159695, "epoch": 3802} {"train_loss": -6.825291156768799, "global_step": 159696, "epoch": 3802} {"train_loss": -6.758105278015137, "global_step": 159697, "epoch": 3802} {"train_loss": -6.819600582122803, "global_step": 159698, "epoch": 3802} {"train_loss": -6.750903129577637, "global_step": 159699, "epoch": 3802} {"train_loss": -7.040212631225586, "global_step": 159700, "epoch": 3802} {"train_loss": -6.754275321960449, "global_step": 159701, "epoch": 3802} {"train_loss": -6.93009090423584, "global_step": 159702, "epoch": 3802} {"train_loss": -6.9535369873046875, "global_step": 159703, "epoch": 3802} {"train_loss": -6.83797550201416, "global_step": 159704, "epoch": 3802} {"train_loss": -6.962277889251709, "global_step": 159705, "epoch": 3802} {"train_loss": -6.923794269561768, "global_step": 159706, "epoch": 3802} {"train_loss": -6.805222511291504, "global_step": 159707, "epoch": 3802} {"train_loss": -6.891535758972168, "global_step": 159708, "epoch": 3802} {"train_loss": -6.746119976043701, "global_step": 159709, "epoch": 3802} {"train_loss": -6.829507827758789, "global_step": 159710, "epoch": 3802} {"train_loss": -6.938578128814697, "global_step": 159711, "epoch": 3802} {"train_loss": -6.829184532165527, "global_step": 159712, "epoch": 3802} {"train_loss": -6.917588233947754, "global_step": 159713, "epoch": 3802} {"train_loss": -6.830024242401123, "global_step": 159714, "epoch": 3802} {"train_loss": -6.757681846618652, "global_step": 159715, "epoch": 3802} {"train_loss": -6.8338823318481445, "global_step": 159716, "epoch": 3802} {"train_loss": -6.940698623657227, "global_step": 159717, "epoch": 3802} {"train_loss": -6.879570960998535, "global_step": 159718, "epoch": 3802} {"train_loss": -6.852913856506348, "global_step": 159719, "epoch": 3802} {"train_loss": -6.871250629425049, "global_step": 159720, "epoch": 3802} {"train_loss": -6.744712829589844, "global_step": 159721, "epoch": 3802} {"train_loss": -6.891523838043213, "global_step": 159722, "epoch": 3802} {"train_loss": -6.892583847045898, "global_step": 159723, "epoch": 3802} {"train_loss": -6.953540802001953, "global_step": 159724, "epoch": 3802} {"train_loss": -6.861468076705933, "global_step": 159725, "epoch": 3802, "val_loss": 68434.984375} {"train_loss": -6.802279472351074, "global_step": 159726, "epoch": 3803} {"train_loss": -6.827548503875732, "global_step": 159727, "epoch": 3803} {"train_loss": -6.89164400100708, "global_step": 159728, "epoch": 3803} {"train_loss": -6.945796966552734, "global_step": 159729, "epoch": 3803} {"train_loss": -6.9168620109558105, "global_step": 159730, "epoch": 3803} {"train_loss": -6.918052673339844, "global_step": 159731, "epoch": 3803} {"train_loss": -6.89475154876709, "global_step": 159732, "epoch": 3803} {"train_loss": -6.915251731872559, "global_step": 159733, "epoch": 3803} {"train_loss": -6.912902355194092, "global_step": 159734, "epoch": 3803} {"train_loss": -6.961734771728516, "global_step": 159735, "epoch": 3803} {"train_loss": -6.860832214355469, "global_step": 159736, "epoch": 3803} {"train_loss": -7.020643711090088, "global_step": 159737, "epoch": 3803} {"train_loss": -6.979652404785156, "global_step": 159738, "epoch": 3803} {"train_loss": -6.983919143676758, "global_step": 159739, "epoch": 3803} {"train_loss": -6.981292247772217, "global_step": 159740, "epoch": 3803} {"train_loss": -6.973119735717773, "global_step": 159741, "epoch": 3803} {"train_loss": -6.801997184753418, "global_step": 159742, "epoch": 3803} {"train_loss": -6.93469762802124, "global_step": 159743, "epoch": 3803} {"train_loss": -6.935532569885254, "global_step": 159744, "epoch": 3803} {"train_loss": -6.8148956298828125, "global_step": 159745, "epoch": 3803} {"train_loss": -6.902556419372559, "global_step": 159746, "epoch": 3803} {"train_loss": -6.929830074310303, "global_step": 159747, "epoch": 3803} {"train_loss": -6.887772083282471, "global_step": 159748, "epoch": 3803} {"train_loss": -6.815960884094238, "global_step": 159749, "epoch": 3803} {"train_loss": -6.843595504760742, "global_step": 159750, "epoch": 3803} {"train_loss": -6.843423843383789, "global_step": 159751, "epoch": 3803} {"train_loss": -6.882669448852539, "global_step": 159752, "epoch": 3803} {"train_loss": -6.919660568237305, "global_step": 159753, "epoch": 3803} {"train_loss": -6.8804121017456055, "global_step": 159754, "epoch": 3803} {"train_loss": -6.879525184631348, "global_step": 159755, "epoch": 3803} {"train_loss": -6.956302165985107, "global_step": 159756, "epoch": 3803} {"train_loss": -6.904790878295898, "global_step": 159757, "epoch": 3803} {"train_loss": -6.931862831115723, "global_step": 159758, "epoch": 3803} {"train_loss": -6.902795791625977, "global_step": 159759, "epoch": 3803} {"train_loss": -6.889495849609375, "global_step": 159760, "epoch": 3803} {"train_loss": -6.936591148376465, "global_step": 159761, "epoch": 3803} {"train_loss": -6.740487575531006, "global_step": 159762, "epoch": 3803} {"train_loss": -6.890837669372559, "global_step": 159763, "epoch": 3803} {"train_loss": -6.793709754943848, "global_step": 159764, "epoch": 3803} {"train_loss": -6.942130088806152, "global_step": 159765, "epoch": 3803} {"train_loss": -6.87961483001709, "global_step": 159766, "epoch": 3803} {"train_loss": -6.89852355775379, "global_step": 159767, "epoch": 3803, "val_loss": 68724.40625} {"train_loss": -6.881962776184082, "global_step": 159768, "epoch": 3804} {"train_loss": -6.864311218261719, "global_step": 159769, "epoch": 3804} {"train_loss": -6.857481956481934, "global_step": 159770, "epoch": 3804} {"train_loss": -6.729272365570068, "global_step": 159771, "epoch": 3804} {"train_loss": -6.902872562408447, "global_step": 159772, "epoch": 3804} {"train_loss": -6.800820350646973, "global_step": 159773, "epoch": 3804} {"train_loss": -6.88105583190918, "global_step": 159774, "epoch": 3804} {"train_loss": -6.921494483947754, "global_step": 159775, "epoch": 3804} {"train_loss": -6.9442548751831055, "global_step": 159776, "epoch": 3804} {"train_loss": -6.844110488891602, "global_step": 159777, "epoch": 3804} {"train_loss": -6.819893836975098, "global_step": 159778, "epoch": 3804} {"train_loss": -7.000767230987549, "global_step": 159779, "epoch": 3804} {"train_loss": -6.870837211608887, "global_step": 159780, "epoch": 3804} {"train_loss": -7.000557899475098, "global_step": 159781, "epoch": 3804} {"train_loss": -6.878397464752197, "global_step": 159782, "epoch": 3804} {"train_loss": -6.891115188598633, "global_step": 159783, "epoch": 3804} {"train_loss": -6.812032222747803, "global_step": 159784, "epoch": 3804} {"train_loss": -6.94956111907959, "global_step": 159785, "epoch": 3804} {"train_loss": -6.859437465667725, "global_step": 159786, "epoch": 3804} {"train_loss": -6.897777557373047, "global_step": 159787, "epoch": 3804} {"train_loss": -6.685673236846924, "global_step": 159788, "epoch": 3804} {"train_loss": -6.782932281494141, "global_step": 159789, "epoch": 3804} {"train_loss": -6.841991424560547, "global_step": 159790, "epoch": 3804} {"train_loss": -6.862771034240723, "global_step": 159791, "epoch": 3804} {"train_loss": -6.844465255737305, "global_step": 159792, "epoch": 3804} {"train_loss": -6.831484317779541, "global_step": 159793, "epoch": 3804} {"train_loss": -7.026606559753418, "global_step": 159794, "epoch": 3804} {"train_loss": -6.874235153198242, "global_step": 159795, "epoch": 3804} {"train_loss": -6.82264518737793, "global_step": 159796, "epoch": 3804} {"train_loss": -6.784460067749023, "global_step": 159797, "epoch": 3804} {"train_loss": -6.743690490722656, "global_step": 159798, "epoch": 3804} {"train_loss": -6.952674865722656, "global_step": 159799, "epoch": 3804} {"train_loss": -6.871830940246582, "global_step": 159800, "epoch": 3804} {"train_loss": -6.791126251220703, "global_step": 159801, "epoch": 3804} {"train_loss": -6.943026542663574, "global_step": 159802, "epoch": 3804} {"train_loss": -6.812142372131348, "global_step": 159803, "epoch": 3804} {"train_loss": -6.797066688537598, "global_step": 159804, "epoch": 3804} {"train_loss": -6.997068405151367, "global_step": 159805, "epoch": 3804} {"train_loss": -6.906903266906738, "global_step": 159806, "epoch": 3804} {"train_loss": -6.883542060852051, "global_step": 159807, "epoch": 3804} {"train_loss": -6.801448822021484, "global_step": 159808, "epoch": 3804} {"train_loss": -6.8653885296412875, "global_step": 159809, "epoch": 3804, "val_loss": 68779.6015625} {"train_loss": -6.905522346496582, "global_step": 159810, "epoch": 3805} {"train_loss": -6.845858097076416, "global_step": 159811, "epoch": 3805} {"train_loss": -6.855334281921387, "global_step": 159812, "epoch": 3805} {"train_loss": -6.864184856414795, "global_step": 159813, "epoch": 3805} {"train_loss": -6.755643367767334, "global_step": 159814, "epoch": 3805} {"train_loss": -6.904618740081787, "global_step": 159815, "epoch": 3805} {"train_loss": -6.950640678405762, "global_step": 159816, "epoch": 3805} {"train_loss": -6.796525955200195, "global_step": 159817, "epoch": 3805} {"train_loss": -6.953707695007324, "global_step": 159818, "epoch": 3805} {"train_loss": -6.987882614135742, "global_step": 159819, "epoch": 3805} {"train_loss": -6.952488422393799, "global_step": 159820, "epoch": 3805} {"train_loss": -6.946369171142578, "global_step": 159821, "epoch": 3805} {"train_loss": -6.891374588012695, "global_step": 159822, "epoch": 3805} {"train_loss": -6.936553478240967, "global_step": 159823, "epoch": 3805} {"train_loss": -6.931613922119141, "global_step": 159824, "epoch": 3805} {"train_loss": -6.992859363555908, "global_step": 159825, "epoch": 3805} {"train_loss": -7.000397682189941, "global_step": 159826, "epoch": 3805} {"train_loss": -6.903494834899902, "global_step": 159827, "epoch": 3805} {"train_loss": -7.030230522155762, "global_step": 159828, "epoch": 3805} {"train_loss": -6.933618545532227, "global_step": 159829, "epoch": 3805} {"train_loss": -6.901561737060547, "global_step": 159830, "epoch": 3805} {"train_loss": -7.052535057067871, "global_step": 159831, "epoch": 3805} {"train_loss": -6.836617469787598, "global_step": 159832, "epoch": 3805} {"train_loss": -6.747336387634277, "global_step": 159833, "epoch": 3805} {"train_loss": -6.846607208251953, "global_step": 159834, "epoch": 3805} {"train_loss": -6.855928421020508, "global_step": 159835, "epoch": 3805} {"train_loss": -6.924358367919922, "global_step": 159836, "epoch": 3805} {"train_loss": -6.819204330444336, "global_step": 159837, "epoch": 3805} {"train_loss": -6.994927406311035, "global_step": 159838, "epoch": 3805} {"train_loss": -6.872215270996094, "global_step": 159839, "epoch": 3805} {"train_loss": -6.804111480712891, "global_step": 159840, "epoch": 3805} {"train_loss": -6.858558177947998, "global_step": 159841, "epoch": 3805} {"train_loss": -6.776712417602539, "global_step": 159842, "epoch": 3805} {"train_loss": -6.878734588623047, "global_step": 159843, "epoch": 3805} {"train_loss": -6.982050895690918, "global_step": 159844, "epoch": 3805} {"train_loss": -6.824654579162598, "global_step": 159845, "epoch": 3805} {"train_loss": -6.9153032302856445, "global_step": 159846, "epoch": 3805} {"train_loss": -6.916036605834961, "global_step": 159847, "epoch": 3805} {"train_loss": -6.85474157333374, "global_step": 159848, "epoch": 3805} {"train_loss": -6.887922286987305, "global_step": 159849, "epoch": 3805} {"train_loss": -6.802204132080078, "global_step": 159850, "epoch": 3805} {"train_loss": -6.896090235028948, "global_step": 159851, "epoch": 3805, "val_loss": 68475.3125} {"train_loss": -6.981777667999268, "global_step": 159852, "epoch": 3806} {"train_loss": -6.913931369781494, "global_step": 159853, "epoch": 3806} {"train_loss": -6.927621841430664, "global_step": 159854, "epoch": 3806} {"train_loss": -6.8851728439331055, "global_step": 159855, "epoch": 3806} {"train_loss": -6.864952564239502, "global_step": 159856, "epoch": 3806} {"train_loss": -6.875218868255615, "global_step": 159857, "epoch": 3806} {"train_loss": -6.768645286560059, "global_step": 159858, "epoch": 3806} {"train_loss": -6.939566135406494, "global_step": 159859, "epoch": 3806} {"train_loss": -6.8870463371276855, "global_step": 159860, "epoch": 3806} {"train_loss": -7.016698360443115, "global_step": 159861, "epoch": 3806} {"train_loss": -6.824962139129639, "global_step": 159862, "epoch": 3806} {"train_loss": -6.987270832061768, "global_step": 159863, "epoch": 3806} {"train_loss": -6.9317498207092285, "global_step": 159864, "epoch": 3806} {"train_loss": -6.840516090393066, "global_step": 159865, "epoch": 3806} {"train_loss": -6.8099517822265625, "global_step": 159866, "epoch": 3806} {"train_loss": -6.927423477172852, "global_step": 159867, "epoch": 3806} {"train_loss": -6.977246284484863, "global_step": 159868, "epoch": 3806} {"train_loss": -6.870265483856201, "global_step": 159869, "epoch": 3806} {"train_loss": -6.952424049377441, "global_step": 159870, "epoch": 3806} {"train_loss": -6.752679347991943, "global_step": 159871, "epoch": 3806} {"train_loss": -6.892417907714844, "global_step": 159872, "epoch": 3806} {"train_loss": -6.820470809936523, "global_step": 159873, "epoch": 3806} {"train_loss": -6.856058597564697, "global_step": 159874, "epoch": 3806} {"train_loss": -6.718618869781494, "global_step": 159875, "epoch": 3806} {"train_loss": -6.96488618850708, "global_step": 159876, "epoch": 3806} {"train_loss": -6.9732513427734375, "global_step": 159877, "epoch": 3806} {"train_loss": -6.891791343688965, "global_step": 159878, "epoch": 3806} {"train_loss": -6.933139324188232, "global_step": 159879, "epoch": 3806} {"train_loss": -6.829223155975342, "global_step": 159880, "epoch": 3806} {"train_loss": -7.103172302246094, "global_step": 159881, "epoch": 3806} {"train_loss": -6.845601558685303, "global_step": 159882, "epoch": 3806} {"train_loss": -6.9330291748046875, "global_step": 159883, "epoch": 3806} {"train_loss": -6.831223964691162, "global_step": 159884, "epoch": 3806} {"train_loss": -6.870216369628906, "global_step": 159885, "epoch": 3806} {"train_loss": -6.8955559730529785, "global_step": 159886, "epoch": 3806} {"train_loss": -6.93022346496582, "global_step": 159887, "epoch": 3806} {"train_loss": -6.790815830230713, "global_step": 159888, "epoch": 3806} {"train_loss": -6.910360336303711, "global_step": 159889, "epoch": 3806} {"train_loss": -6.906435489654541, "global_step": 159890, "epoch": 3806} {"train_loss": -6.94140625, "global_step": 159891, "epoch": 3806} {"train_loss": -6.838808059692383, "global_step": 159892, "epoch": 3806} {"train_loss": -6.892817088535854, "global_step": 159893, "epoch": 3806, "val_loss": 68491.6875} {"train_loss": -6.859945774078369, "global_step": 159894, "epoch": 3807} {"train_loss": -6.953665733337402, "global_step": 159895, "epoch": 3807} {"train_loss": -6.948868751525879, "global_step": 159896, "epoch": 3807} {"train_loss": -6.982505798339844, "global_step": 159897, "epoch": 3807} {"train_loss": -6.838937759399414, "global_step": 159898, "epoch": 3807} {"train_loss": -6.949151039123535, "global_step": 159899, "epoch": 3807} {"train_loss": -6.998189926147461, "global_step": 159900, "epoch": 3807} {"train_loss": -6.901318550109863, "global_step": 159901, "epoch": 3807} {"train_loss": -7.017900466918945, "global_step": 159902, "epoch": 3807} {"train_loss": -6.984132766723633, "global_step": 159903, "epoch": 3807} {"train_loss": -6.918813705444336, "global_step": 159904, "epoch": 3807} {"train_loss": -6.9284257888793945, "global_step": 159905, "epoch": 3807} {"train_loss": -6.848084449768066, "global_step": 159906, "epoch": 3807} {"train_loss": -6.935364723205566, "global_step": 159907, "epoch": 3807} {"train_loss": -6.959725856781006, "global_step": 159908, "epoch": 3807} {"train_loss": -6.88640022277832, "global_step": 159909, "epoch": 3807} {"train_loss": -6.997895240783691, "global_step": 159910, "epoch": 3807} {"train_loss": -6.9196062088012695, "global_step": 159911, "epoch": 3807} {"train_loss": -6.809309005737305, "global_step": 159912, "epoch": 3807} {"train_loss": -6.878247261047363, "global_step": 159913, "epoch": 3807} {"train_loss": -6.980039596557617, "global_step": 159914, "epoch": 3807} {"train_loss": -6.8580451011657715, "global_step": 159915, "epoch": 3807} {"train_loss": -6.917818069458008, "global_step": 159916, "epoch": 3807} {"train_loss": -6.823980331420898, "global_step": 159917, "epoch": 3807} {"train_loss": -6.795742034912109, "global_step": 159918, "epoch": 3807} {"train_loss": -6.846399307250977, "global_step": 159919, "epoch": 3807} {"train_loss": -6.898670196533203, "global_step": 159920, "epoch": 3807} {"train_loss": -6.856235027313232, "global_step": 159921, "epoch": 3807} {"train_loss": -6.819524765014648, "global_step": 159922, "epoch": 3807} {"train_loss": -6.78361701965332, "global_step": 159923, "epoch": 3807} {"train_loss": -6.750162601470947, "global_step": 159924, "epoch": 3807} {"train_loss": -6.950011730194092, "global_step": 159925, "epoch": 3807} {"train_loss": -6.79189395904541, "global_step": 159926, "epoch": 3807} {"train_loss": -6.718270301818848, "global_step": 159927, "epoch": 3807} {"train_loss": -6.940011501312256, "global_step": 159928, "epoch": 3807} {"train_loss": -6.740001678466797, "global_step": 159929, "epoch": 3807} {"train_loss": -6.863949298858643, "global_step": 159930, "epoch": 3807} {"train_loss": -6.735813140869141, "global_step": 159931, "epoch": 3807} {"train_loss": -6.882840156555176, "global_step": 159932, "epoch": 3807} {"train_loss": -6.963708877563477, "global_step": 159933, "epoch": 3807} {"train_loss": -6.8487548828125, "global_step": 159934, "epoch": 3807} {"train_loss": -6.889569941021147, "global_step": 159935, "epoch": 3807, "val_loss": 68520.28125} {"train_loss": -6.9370622634887695, "global_step": 159936, "epoch": 3808} {"train_loss": -6.952875137329102, "global_step": 159937, "epoch": 3808} {"train_loss": -7.02859354019165, "global_step": 159938, "epoch": 3808} {"train_loss": -6.900907516479492, "global_step": 159939, "epoch": 3808} {"train_loss": -6.815711975097656, "global_step": 159940, "epoch": 3808} {"train_loss": -6.859354496002197, "global_step": 159941, "epoch": 3808} {"train_loss": -6.815593719482422, "global_step": 159942, "epoch": 3808} {"train_loss": -6.965526580810547, "global_step": 159943, "epoch": 3808} {"train_loss": -6.93297004699707, "global_step": 159944, "epoch": 3808} {"train_loss": -6.837803363800049, "global_step": 159945, "epoch": 3808} {"train_loss": -6.856932640075684, "global_step": 159946, "epoch": 3808} {"train_loss": -6.952008247375488, "global_step": 159947, "epoch": 3808} {"train_loss": -6.933257102966309, "global_step": 159948, "epoch": 3808} {"train_loss": -6.91207218170166, "global_step": 159949, "epoch": 3808} {"train_loss": -6.852203369140625, "global_step": 159950, "epoch": 3808} {"train_loss": -7.004549980163574, "global_step": 159951, "epoch": 3808} {"train_loss": -6.94922399520874, "global_step": 159952, "epoch": 3808} {"train_loss": -6.875853538513184, "global_step": 159953, "epoch": 3808} {"train_loss": -6.954373836517334, "global_step": 159954, "epoch": 3808} {"train_loss": -6.850472927093506, "global_step": 159955, "epoch": 3808} {"train_loss": -6.929722785949707, "global_step": 159956, "epoch": 3808} {"train_loss": -6.912384033203125, "global_step": 159957, "epoch": 3808} {"train_loss": -6.977496147155762, "global_step": 159958, "epoch": 3808} {"train_loss": -6.951416492462158, "global_step": 159959, "epoch": 3808} {"train_loss": -6.949416637420654, "global_step": 159960, "epoch": 3808} {"train_loss": -7.022465705871582, "global_step": 159961, "epoch": 3808} {"train_loss": -6.888591289520264, "global_step": 159962, "epoch": 3808} {"train_loss": -6.979909896850586, "global_step": 159963, "epoch": 3808} {"train_loss": -6.997583866119385, "global_step": 159964, "epoch": 3808} {"train_loss": -6.962981700897217, "global_step": 159965, "epoch": 3808} {"train_loss": -6.99104118347168, "global_step": 159966, "epoch": 3808} {"train_loss": -6.896327018737793, "global_step": 159967, "epoch": 3808} {"train_loss": -6.97157096862793, "global_step": 159968, "epoch": 3808} {"train_loss": -6.86803674697876, "global_step": 159969, "epoch": 3808} {"train_loss": -6.97947883605957, "global_step": 159970, "epoch": 3808} {"train_loss": -6.911709308624268, "global_step": 159971, "epoch": 3808} {"train_loss": -6.955832004547119, "global_step": 159972, "epoch": 3808} {"train_loss": -6.9208831787109375, "global_step": 159973, "epoch": 3808} {"train_loss": -6.90377950668335, "global_step": 159974, "epoch": 3808} {"train_loss": -6.875448226928711, "global_step": 159975, "epoch": 3808} {"train_loss": -6.931324481964111, "global_step": 159976, "epoch": 3808} {"train_loss": -6.927497375579107, "global_step": 159977, "epoch": 3808, "val_loss": 68650.5} {"train_loss": -6.996521472930908, "global_step": 159978, "epoch": 3809} {"train_loss": -6.858635902404785, "global_step": 159979, "epoch": 3809} {"train_loss": -6.939882278442383, "global_step": 159980, "epoch": 3809} {"train_loss": -6.936052322387695, "global_step": 159981, "epoch": 3809} {"train_loss": -6.8690900802612305, "global_step": 159982, "epoch": 3809} {"train_loss": -6.949237823486328, "global_step": 159983, "epoch": 3809} {"train_loss": -6.940061569213867, "global_step": 159984, "epoch": 3809} {"train_loss": -6.938690662384033, "global_step": 159985, "epoch": 3809} {"train_loss": -7.03938102722168, "global_step": 159986, "epoch": 3809} {"train_loss": -6.8926286697387695, "global_step": 159987, "epoch": 3809} {"train_loss": -7.020236015319824, "global_step": 159988, "epoch": 3809} {"train_loss": -7.018456935882568, "global_step": 159989, "epoch": 3809} {"train_loss": -6.843409538269043, "global_step": 159990, "epoch": 3809} {"train_loss": -6.90078592300415, "global_step": 159991, "epoch": 3809} {"train_loss": -7.0175628662109375, "global_step": 159992, "epoch": 3809} {"train_loss": -6.899014472961426, "global_step": 159993, "epoch": 3809} {"train_loss": -6.993513107299805, "global_step": 159994, "epoch": 3809} {"train_loss": -6.934812068939209, "global_step": 159995, "epoch": 3809} {"train_loss": -6.926912307739258, "global_step": 159996, "epoch": 3809} {"train_loss": -6.921598434448242, "global_step": 159997, "epoch": 3809} {"train_loss": -6.956680774688721, "global_step": 159998, "epoch": 3809} {"train_loss": -6.8924384117126465, "global_step": 159999, "epoch": 3809} {"train_loss": -6.961324691772461, "global_step": 160000, "epoch": 3809} {"train_loss": -6.939001560211182, "global_step": 160001, "epoch": 3809} {"train_loss": -7.07222843170166, "global_step": 160002, "epoch": 3809} {"train_loss": -6.992687702178955, "global_step": 160003, "epoch": 3809} {"train_loss": -6.95587158203125, "global_step": 160004, "epoch": 3809} {"train_loss": -7.039973258972168, "global_step": 160005, "epoch": 3809} {"train_loss": -6.809425354003906, "global_step": 160006, "epoch": 3809} {"train_loss": -6.954380035400391, "global_step": 160007, "epoch": 3809} {"train_loss": -7.032436370849609, "global_step": 160008, "epoch": 3809} {"train_loss": -6.950420379638672, "global_step": 160009, "epoch": 3809} {"train_loss": -6.945784568786621, "global_step": 160010, "epoch": 3809} {"train_loss": -6.990167617797852, "global_step": 160011, "epoch": 3809} {"train_loss": -6.896970272064209, "global_step": 160012, "epoch": 3809} {"train_loss": -6.7813897132873535, "global_step": 160013, "epoch": 3809} {"train_loss": -6.9000630378723145, "global_step": 160014, "epoch": 3809} {"train_loss": -6.9479756355285645, "global_step": 160015, "epoch": 3809} {"train_loss": -6.88191032409668, "global_step": 160016, "epoch": 3809} {"train_loss": -6.927906513214111, "global_step": 160017, "epoch": 3809} {"train_loss": -6.913388252258301, "global_step": 160018, "epoch": 3809} {"train_loss": -6.939491090320406, "global_step": 160019, "epoch": 3809, "val_loss": 68596.671875} {"train_loss": -6.92338752746582, "global_step": 160020, "epoch": 3810} {"train_loss": -6.853482246398926, "global_step": 160021, "epoch": 3810} {"train_loss": -6.79371976852417, "global_step": 160022, "epoch": 3810} {"train_loss": -6.834102153778076, "global_step": 160023, "epoch": 3810} {"train_loss": -6.901176452636719, "global_step": 160024, "epoch": 3810} {"train_loss": -6.951295852661133, "global_step": 160025, "epoch": 3810} {"train_loss": -6.911036491394043, "global_step": 160026, "epoch": 3810} {"train_loss": -6.818249702453613, "global_step": 160027, "epoch": 3810} {"train_loss": -6.7472429275512695, "global_step": 160028, "epoch": 3810} {"train_loss": -6.828554153442383, "global_step": 160029, "epoch": 3810} {"train_loss": -6.889512538909912, "global_step": 160030, "epoch": 3810} {"train_loss": -6.8569769859313965, "global_step": 160031, "epoch": 3810} {"train_loss": -7.0183210372924805, "global_step": 160032, "epoch": 3810} {"train_loss": -6.933828353881836, "global_step": 160033, "epoch": 3810} {"train_loss": -6.9700469970703125, "global_step": 160034, "epoch": 3810} {"train_loss": -6.972869873046875, "global_step": 160035, "epoch": 3810} {"train_loss": -6.98581600189209, "global_step": 160036, "epoch": 3810} {"train_loss": -6.911769866943359, "global_step": 160037, "epoch": 3810} {"train_loss": -6.902390956878662, "global_step": 160038, "epoch": 3810} {"train_loss": -6.86635684967041, "global_step": 160039, "epoch": 3810} {"train_loss": -6.8367085456848145, "global_step": 160040, "epoch": 3810} {"train_loss": -6.866430759429932, "global_step": 160041, "epoch": 3810} {"train_loss": -6.822973251342773, "global_step": 160042, "epoch": 3810} {"train_loss": -6.940934658050537, "global_step": 160043, "epoch": 3810} {"train_loss": -6.885054111480713, "global_step": 160044, "epoch": 3810} {"train_loss": -6.751104354858398, "global_step": 160045, "epoch": 3810} {"train_loss": -6.698111534118652, "global_step": 160046, "epoch": 3810} {"train_loss": -6.927306652069092, "global_step": 160047, "epoch": 3810} {"train_loss": -6.796177387237549, "global_step": 160048, "epoch": 3810} {"train_loss": -6.745648384094238, "global_step": 160049, "epoch": 3810} {"train_loss": -6.914019584655762, "global_step": 160050, "epoch": 3810} {"train_loss": -6.841997146606445, "global_step": 160051, "epoch": 3810} {"train_loss": -6.7356133460998535, "global_step": 160052, "epoch": 3810} {"train_loss": -6.927501201629639, "global_step": 160053, "epoch": 3810} {"train_loss": -6.838709831237793, "global_step": 160054, "epoch": 3810} {"train_loss": -6.967178821563721, "global_step": 160055, "epoch": 3810} {"train_loss": -6.836065292358398, "global_step": 160056, "epoch": 3810} {"train_loss": -6.888858795166016, "global_step": 160057, "epoch": 3810} {"train_loss": -6.891425132751465, "global_step": 160058, "epoch": 3810} {"train_loss": -6.938227653503418, "global_step": 160059, "epoch": 3810} {"train_loss": -6.857730865478516, "global_step": 160060, "epoch": 3810} {"train_loss": -6.872554120563326, "global_step": 160061, "epoch": 3810, "val_loss": 68443.140625} {"train_loss": -6.9349775314331055, "global_step": 160062, "epoch": 3811} {"train_loss": -6.8010358810424805, "global_step": 160063, "epoch": 3811} {"train_loss": -6.815609931945801, "global_step": 160064, "epoch": 3811} {"train_loss": -6.897226810455322, "global_step": 160065, "epoch": 3811} {"train_loss": -6.916320323944092, "global_step": 160066, "epoch": 3811} {"train_loss": -6.872720718383789, "global_step": 160067, "epoch": 3811} {"train_loss": -6.982889175415039, "global_step": 160068, "epoch": 3811} {"train_loss": -6.818581581115723, "global_step": 160069, "epoch": 3811} {"train_loss": -6.8388471603393555, "global_step": 160070, "epoch": 3811} {"train_loss": -6.859217166900635, "global_step": 160071, "epoch": 3811} {"train_loss": -6.877563953399658, "global_step": 160072, "epoch": 3811} {"train_loss": -6.851225852966309, "global_step": 160073, "epoch": 3811} {"train_loss": -6.817777156829834, "global_step": 160074, "epoch": 3811} {"train_loss": -6.854430198669434, "global_step": 160075, "epoch": 3811} {"train_loss": -6.820597171783447, "global_step": 160076, "epoch": 3811} {"train_loss": -6.961501121520996, "global_step": 160077, "epoch": 3811} {"train_loss": -6.878390312194824, "global_step": 160078, "epoch": 3811} {"train_loss": -6.876185894012451, "global_step": 160079, "epoch": 3811} {"train_loss": -6.94692325592041, "global_step": 160080, "epoch": 3811} {"train_loss": -6.973220348358154, "global_step": 160081, "epoch": 3811} {"train_loss": -6.991598606109619, "global_step": 160082, "epoch": 3811} {"train_loss": -6.970210075378418, "global_step": 160083, "epoch": 3811} {"train_loss": -6.981820106506348, "global_step": 160084, "epoch": 3811} {"train_loss": -7.063166618347168, "global_step": 160085, "epoch": 3811} {"train_loss": -6.975985050201416, "global_step": 160086, "epoch": 3811} {"train_loss": -7.0457658767700195, "global_step": 160087, "epoch": 3811} {"train_loss": -6.916680335998535, "global_step": 160088, "epoch": 3811} {"train_loss": -6.86177921295166, "global_step": 160089, "epoch": 3811} {"train_loss": -6.929100513458252, "global_step": 160090, "epoch": 3811} {"train_loss": -6.89417839050293, "global_step": 160091, "epoch": 3811} {"train_loss": -6.921383380889893, "global_step": 160092, "epoch": 3811} {"train_loss": -6.959739685058594, "global_step": 160093, "epoch": 3811} {"train_loss": -6.851558685302734, "global_step": 160094, "epoch": 3811} {"train_loss": -6.897818088531494, "global_step": 160095, "epoch": 3811} {"train_loss": -6.952450752258301, "global_step": 160096, "epoch": 3811} {"train_loss": -7.000513076782227, "global_step": 160097, "epoch": 3811} {"train_loss": -6.851596832275391, "global_step": 160098, "epoch": 3811} {"train_loss": -6.997689723968506, "global_step": 160099, "epoch": 3811} {"train_loss": -6.719386100769043, "global_step": 160100, "epoch": 3811} {"train_loss": -6.9924774169921875, "global_step": 160101, "epoch": 3811} {"train_loss": -6.89796257019043, "global_step": 160102, "epoch": 3811} {"train_loss": -6.910862332298642, "global_step": 160103, "epoch": 3811, "val_loss": 68437.390625} {"train_loss": -6.8670244216918945, "global_step": 160104, "epoch": 3812} {"train_loss": -6.801031589508057, "global_step": 160105, "epoch": 3812} {"train_loss": -6.893703460693359, "global_step": 160106, "epoch": 3812} {"train_loss": -6.811252117156982, "global_step": 160107, "epoch": 3812} {"train_loss": -6.749268531799316, "global_step": 160108, "epoch": 3812} {"train_loss": -6.971404075622559, "global_step": 160109, "epoch": 3812} {"train_loss": -6.837685585021973, "global_step": 160110, "epoch": 3812} {"train_loss": -6.753507614135742, "global_step": 160111, "epoch": 3812} {"train_loss": -6.836325645446777, "global_step": 160112, "epoch": 3812} {"train_loss": -6.837276935577393, "global_step": 160113, "epoch": 3812} {"train_loss": -6.83697509765625, "global_step": 160114, "epoch": 3812} {"train_loss": -6.924288749694824, "global_step": 160115, "epoch": 3812} {"train_loss": -6.707059860229492, "global_step": 160116, "epoch": 3812} {"train_loss": -6.870722770690918, "global_step": 160117, "epoch": 3812} {"train_loss": -6.972455024719238, "global_step": 160118, "epoch": 3812} {"train_loss": -6.774205684661865, "global_step": 160119, "epoch": 3812} {"train_loss": -6.8076982498168945, "global_step": 160120, "epoch": 3812} {"train_loss": -6.8481597900390625, "global_step": 160121, "epoch": 3812} {"train_loss": -6.886815547943115, "global_step": 160122, "epoch": 3812} {"train_loss": -6.987964153289795, "global_step": 160123, "epoch": 3812} {"train_loss": -6.877047538757324, "global_step": 160124, "epoch": 3812} {"train_loss": -6.853282928466797, "global_step": 160125, "epoch": 3812} {"train_loss": -6.840215682983398, "global_step": 160126, "epoch": 3812} {"train_loss": -6.9263129234313965, "global_step": 160127, "epoch": 3812} {"train_loss": -6.9323625564575195, "global_step": 160128, "epoch": 3812} {"train_loss": -6.989392280578613, "global_step": 160129, "epoch": 3812} {"train_loss": -6.849579811096191, "global_step": 160130, "epoch": 3812} {"train_loss": -6.836570739746094, "global_step": 160131, "epoch": 3812} {"train_loss": -6.90578031539917, "global_step": 160132, "epoch": 3812} {"train_loss": -6.834878444671631, "global_step": 160133, "epoch": 3812} {"train_loss": -6.994807243347168, "global_step": 160134, "epoch": 3812} {"train_loss": -6.915119171142578, "global_step": 160135, "epoch": 3812} {"train_loss": -6.902723789215088, "global_step": 160136, "epoch": 3812} {"train_loss": -6.953425407409668, "global_step": 160137, "epoch": 3812} {"train_loss": -6.836375713348389, "global_step": 160138, "epoch": 3812} {"train_loss": -7.047379016876221, "global_step": 160139, "epoch": 3812} {"train_loss": -6.949068069458008, "global_step": 160140, "epoch": 3812} {"train_loss": -6.77626895904541, "global_step": 160141, "epoch": 3812} {"train_loss": -6.898194313049316, "global_step": 160142, "epoch": 3812} {"train_loss": -6.7661638259887695, "global_step": 160143, "epoch": 3812} {"train_loss": -6.851157188415527, "global_step": 160144, "epoch": 3812} {"train_loss": -6.869940337680635, "global_step": 160145, "epoch": 3812, "val_loss": 68656.2578125} {"train_loss": -6.801623344421387, "global_step": 160146, "epoch": 3813} {"train_loss": -6.768138885498047, "global_step": 160147, "epoch": 3813} {"train_loss": -6.796693801879883, "global_step": 160148, "epoch": 3813} {"train_loss": -6.730958938598633, "global_step": 160149, "epoch": 3813} {"train_loss": -6.862586975097656, "global_step": 160150, "epoch": 3813} {"train_loss": -6.786197662353516, "global_step": 160151, "epoch": 3813} {"train_loss": -7.010074615478516, "global_step": 160152, "epoch": 3813} {"train_loss": -6.807062149047852, "global_step": 160153, "epoch": 3813} {"train_loss": -6.735832214355469, "global_step": 160154, "epoch": 3813} {"train_loss": -6.856907844543457, "global_step": 160155, "epoch": 3813} {"train_loss": -6.815794944763184, "global_step": 160156, "epoch": 3813} {"train_loss": -6.85607385635376, "global_step": 160157, "epoch": 3813} {"train_loss": -6.851462364196777, "global_step": 160158, "epoch": 3813} {"train_loss": -6.898342132568359, "global_step": 160159, "epoch": 3813} {"train_loss": -6.826724529266357, "global_step": 160160, "epoch": 3813} {"train_loss": -6.881269454956055, "global_step": 160161, "epoch": 3813} {"train_loss": -6.887041091918945, "global_step": 160162, "epoch": 3813} {"train_loss": -6.887451648712158, "global_step": 160163, "epoch": 3813} {"train_loss": -6.8630194664001465, "global_step": 160164, "epoch": 3813} {"train_loss": -6.804845809936523, "global_step": 160165, "epoch": 3813} {"train_loss": -6.850394248962402, "global_step": 160166, "epoch": 3813} {"train_loss": -6.872051239013672, "global_step": 160167, "epoch": 3813} {"train_loss": -6.858278274536133, "global_step": 160168, "epoch": 3813} {"train_loss": -6.864046096801758, "global_step": 160169, "epoch": 3813} {"train_loss": -6.854283809661865, "global_step": 160170, "epoch": 3813} {"train_loss": -6.827733039855957, "global_step": 160171, "epoch": 3813} {"train_loss": -6.956757545471191, "global_step": 160172, "epoch": 3813} {"train_loss": -6.680230140686035, "global_step": 160173, "epoch": 3813} {"train_loss": -6.911535263061523, "global_step": 160174, "epoch": 3813} {"train_loss": -6.756381988525391, "global_step": 160175, "epoch": 3813} {"train_loss": -6.885242462158203, "global_step": 160176, "epoch": 3813} {"train_loss": -6.939168930053711, "global_step": 160177, "epoch": 3813} {"train_loss": -6.788372993469238, "global_step": 160178, "epoch": 3813} {"train_loss": -6.813541412353516, "global_step": 160179, "epoch": 3813} {"train_loss": -6.87744665145874, "global_step": 160180, "epoch": 3813} {"train_loss": -6.925725936889648, "global_step": 160181, "epoch": 3813} {"train_loss": -6.9178242683410645, "global_step": 160182, "epoch": 3813} {"train_loss": -6.8866119384765625, "global_step": 160183, "epoch": 3813} {"train_loss": -6.985136032104492, "global_step": 160184, "epoch": 3813} {"train_loss": -7.0063066482543945, "global_step": 160185, "epoch": 3813} {"train_loss": -6.933082103729248, "global_step": 160186, "epoch": 3813} {"train_loss": -6.856854802086239, "global_step": 160187, "epoch": 3813, "val_loss": 68614.953125} {"train_loss": -6.93546199798584, "global_step": 160188, "epoch": 3814} {"train_loss": -6.953651428222656, "global_step": 160189, "epoch": 3814} {"train_loss": -6.8939080238342285, "global_step": 160190, "epoch": 3814} {"train_loss": -6.925856590270996, "global_step": 160191, "epoch": 3814} {"train_loss": -6.919798851013184, "global_step": 160192, "epoch": 3814} {"train_loss": -7.0102739334106445, "global_step": 160193, "epoch": 3814} {"train_loss": -6.961374282836914, "global_step": 160194, "epoch": 3814} {"train_loss": -6.879644393920898, "global_step": 160195, "epoch": 3814} {"train_loss": -7.078126907348633, "global_step": 160196, "epoch": 3814} {"train_loss": -6.9304399490356445, "global_step": 160197, "epoch": 3814} {"train_loss": -6.972438812255859, "global_step": 160198, "epoch": 3814} {"train_loss": -6.9572553634643555, "global_step": 160199, "epoch": 3814} {"train_loss": -6.9953107833862305, "global_step": 160200, "epoch": 3814} {"train_loss": -6.895075798034668, "global_step": 160201, "epoch": 3814} {"train_loss": -6.968839645385742, "global_step": 160202, "epoch": 3814} {"train_loss": -6.943978309631348, "global_step": 160203, "epoch": 3814} {"train_loss": -6.841136932373047, "global_step": 160204, "epoch": 3814} {"train_loss": -6.831710338592529, "global_step": 160205, "epoch": 3814} {"train_loss": -6.8925886154174805, "global_step": 160206, "epoch": 3814} {"train_loss": -6.83306360244751, "global_step": 160207, "epoch": 3814} {"train_loss": -6.853703498840332, "global_step": 160208, "epoch": 3814} {"train_loss": -6.968132019042969, "global_step": 160209, "epoch": 3814} {"train_loss": -6.877964019775391, "global_step": 160210, "epoch": 3814} {"train_loss": -6.942137241363525, "global_step": 160211, "epoch": 3814} {"train_loss": -6.891977310180664, "global_step": 160212, "epoch": 3814} {"train_loss": -6.869740962982178, "global_step": 160213, "epoch": 3814} {"train_loss": -6.926246643066406, "global_step": 160214, "epoch": 3814} {"train_loss": -6.954507827758789, "global_step": 160215, "epoch": 3814} {"train_loss": -6.889729976654053, "global_step": 160216, "epoch": 3814} {"train_loss": -6.947363376617432, "global_step": 160217, "epoch": 3814} {"train_loss": -7.053142547607422, "global_step": 160218, "epoch": 3814} {"train_loss": -6.956967353820801, "global_step": 160219, "epoch": 3814} {"train_loss": -7.027595520019531, "global_step": 160220, "epoch": 3814} {"train_loss": -7.016397953033447, "global_step": 160221, "epoch": 3814} {"train_loss": -6.894857406616211, "global_step": 160222, "epoch": 3814} {"train_loss": -7.036322593688965, "global_step": 160223, "epoch": 3814} {"train_loss": -6.820880889892578, "global_step": 160224, "epoch": 3814} {"train_loss": -6.930053234100342, "global_step": 160225, "epoch": 3814} {"train_loss": -6.826527118682861, "global_step": 160226, "epoch": 3814} {"train_loss": -6.95590877532959, "global_step": 160227, "epoch": 3814} {"train_loss": -6.90764856338501, "global_step": 160228, "epoch": 3814} {"train_loss": -6.929172470456078, "global_step": 160229, "epoch": 3814, "val_loss": 68579.1796875} {"train_loss": -6.974281311035156, "global_step": 160230, "epoch": 3815} {"train_loss": -6.913481712341309, "global_step": 160231, "epoch": 3815} {"train_loss": -6.89074182510376, "global_step": 160232, "epoch": 3815} {"train_loss": -6.771256446838379, "global_step": 160233, "epoch": 3815} {"train_loss": -6.828563690185547, "global_step": 160234, "epoch": 3815} {"train_loss": -6.909585952758789, "global_step": 160235, "epoch": 3815} {"train_loss": -6.918644905090332, "global_step": 160236, "epoch": 3815} {"train_loss": -6.832894325256348, "global_step": 160237, "epoch": 3815} {"train_loss": -6.907257080078125, "global_step": 160238, "epoch": 3815} {"train_loss": -6.890286445617676, "global_step": 160239, "epoch": 3815} {"train_loss": -6.918400764465332, "global_step": 160240, "epoch": 3815} {"train_loss": -6.815835475921631, "global_step": 160241, "epoch": 3815} {"train_loss": -6.869425296783447, "global_step": 160242, "epoch": 3815} {"train_loss": -6.857727527618408, "global_step": 160243, "epoch": 3815} {"train_loss": -6.787768840789795, "global_step": 160244, "epoch": 3815} {"train_loss": -6.843586444854736, "global_step": 160245, "epoch": 3815} {"train_loss": -6.907535552978516, "global_step": 160246, "epoch": 3815} {"train_loss": -6.846717834472656, "global_step": 160247, "epoch": 3815} {"train_loss": -6.875452518463135, "global_step": 160248, "epoch": 3815} {"train_loss": -6.852684497833252, "global_step": 160249, "epoch": 3815} {"train_loss": -6.916952133178711, "global_step": 160250, "epoch": 3815} {"train_loss": -6.840237617492676, "global_step": 160251, "epoch": 3815} {"train_loss": -6.760385513305664, "global_step": 160252, "epoch": 3815} {"train_loss": -6.938569068908691, "global_step": 160253, "epoch": 3815} {"train_loss": -6.786419868469238, "global_step": 160254, "epoch": 3815} {"train_loss": -6.854705810546875, "global_step": 160255, "epoch": 3815} {"train_loss": -6.930927276611328, "global_step": 160256, "epoch": 3815} {"train_loss": -6.881710529327393, "global_step": 160257, "epoch": 3815} {"train_loss": -7.0024261474609375, "global_step": 160258, "epoch": 3815} {"train_loss": -6.933171272277832, "global_step": 160259, "epoch": 3815} {"train_loss": -6.93408727645874, "global_step": 160260, "epoch": 3815} {"train_loss": -6.968739986419678, "global_step": 160261, "epoch": 3815} {"train_loss": -6.904218673706055, "global_step": 160262, "epoch": 3815} {"train_loss": -6.822463035583496, "global_step": 160263, "epoch": 3815} {"train_loss": -6.921988487243652, "global_step": 160264, "epoch": 3815} {"train_loss": -6.842531204223633, "global_step": 160265, "epoch": 3815} {"train_loss": -6.870375633239746, "global_step": 160266, "epoch": 3815} {"train_loss": -6.866812229156494, "global_step": 160267, "epoch": 3815} {"train_loss": -6.892352104187012, "global_step": 160268, "epoch": 3815} {"train_loss": -6.834225654602051, "global_step": 160269, "epoch": 3815} {"train_loss": -6.8816962242126465, "global_step": 160270, "epoch": 3815} {"train_loss": -6.882058688572475, "global_step": 160271, "epoch": 3815, "val_loss": 68736.1484375} {"train_loss": -6.975964546203613, "global_step": 160272, "epoch": 3816} {"train_loss": -6.880537986755371, "global_step": 160273, "epoch": 3816} {"train_loss": -6.980314254760742, "global_step": 160274, "epoch": 3816} {"train_loss": -6.93890380859375, "global_step": 160275, "epoch": 3816} {"train_loss": -6.830789566040039, "global_step": 160276, "epoch": 3816} {"train_loss": -6.900432109832764, "global_step": 160277, "epoch": 3816} {"train_loss": -6.840122222900391, "global_step": 160278, "epoch": 3816} {"train_loss": -6.811520576477051, "global_step": 160279, "epoch": 3816} {"train_loss": -6.973459720611572, "global_step": 160280, "epoch": 3816} {"train_loss": -6.877737045288086, "global_step": 160281, "epoch": 3816} {"train_loss": -6.89794921875, "global_step": 160282, "epoch": 3816} {"train_loss": -6.953037261962891, "global_step": 160283, "epoch": 3816} {"train_loss": -6.8249311447143555, "global_step": 160284, "epoch": 3816} {"train_loss": -6.776535987854004, "global_step": 160285, "epoch": 3816} {"train_loss": -6.811294078826904, "global_step": 160286, "epoch": 3816} {"train_loss": -6.900814056396484, "global_step": 160287, "epoch": 3816} {"train_loss": -6.896008491516113, "global_step": 160288, "epoch": 3816} {"train_loss": -6.880131721496582, "global_step": 160289, "epoch": 3816} {"train_loss": -6.8336358070373535, "global_step": 160290, "epoch": 3816} {"train_loss": -6.997450828552246, "global_step": 160291, "epoch": 3816} {"train_loss": -6.781317710876465, "global_step": 160292, "epoch": 3816} {"train_loss": -6.806422710418701, "global_step": 160293, "epoch": 3816} {"train_loss": -6.966702938079834, "global_step": 160294, "epoch": 3816} {"train_loss": -7.017745494842529, "global_step": 160295, "epoch": 3816} {"train_loss": -6.954344749450684, "global_step": 160296, "epoch": 3816} {"train_loss": -6.793203353881836, "global_step": 160297, "epoch": 3816} {"train_loss": -6.966740608215332, "global_step": 160298, "epoch": 3816} {"train_loss": -6.836544036865234, "global_step": 160299, "epoch": 3816} {"train_loss": -6.835638999938965, "global_step": 160300, "epoch": 3816} {"train_loss": -6.82069206237793, "global_step": 160301, "epoch": 3816} {"train_loss": -6.913731575012207, "global_step": 160302, "epoch": 3816} {"train_loss": -6.83404541015625, "global_step": 160303, "epoch": 3816} {"train_loss": -6.820399761199951, "global_step": 160304, "epoch": 3816} {"train_loss": -6.879515647888184, "global_step": 160305, "epoch": 3816} {"train_loss": -6.872115135192871, "global_step": 160306, "epoch": 3816} {"train_loss": -6.812225341796875, "global_step": 160307, "epoch": 3816} {"train_loss": -6.947099685668945, "global_step": 160308, "epoch": 3816} {"train_loss": -6.785933494567871, "global_step": 160309, "epoch": 3816} {"train_loss": -6.914337158203125, "global_step": 160310, "epoch": 3816} {"train_loss": -6.862835884094238, "global_step": 160311, "epoch": 3816} {"train_loss": -6.989291191101074, "global_step": 160312, "epoch": 3816} {"train_loss": -6.882532982599168, "global_step": 160313, "epoch": 3816, "val_loss": 68456.2578125} {"train_loss": -6.906318187713623, "global_step": 160314, "epoch": 3817} {"train_loss": -6.926816940307617, "global_step": 160315, "epoch": 3817} {"train_loss": -7.011783599853516, "global_step": 160316, "epoch": 3817} {"train_loss": -6.873309135437012, "global_step": 160317, "epoch": 3817} {"train_loss": -6.875792503356934, "global_step": 160318, "epoch": 3817} {"train_loss": -6.854253768920898, "global_step": 160319, "epoch": 3817} {"train_loss": -6.847438335418701, "global_step": 160320, "epoch": 3817} {"train_loss": -6.9665422439575195, "global_step": 160321, "epoch": 3817} {"train_loss": -6.868449687957764, "global_step": 160322, "epoch": 3817} {"train_loss": -6.877130508422852, "global_step": 160323, "epoch": 3817} {"train_loss": -6.903971195220947, "global_step": 160324, "epoch": 3817} {"train_loss": -7.1069231033325195, "global_step": 160325, "epoch": 3817} {"train_loss": -6.911799430847168, "global_step": 160326, "epoch": 3817} {"train_loss": -6.874231338500977, "global_step": 160327, "epoch": 3817} {"train_loss": -6.873808860778809, "global_step": 160328, "epoch": 3817} {"train_loss": -6.887491226196289, "global_step": 160329, "epoch": 3817} {"train_loss": -6.8896331787109375, "global_step": 160330, "epoch": 3817} {"train_loss": -6.835651397705078, "global_step": 160331, "epoch": 3817} {"train_loss": -6.871567726135254, "global_step": 160332, "epoch": 3817} {"train_loss": -6.951136589050293, "global_step": 160333, "epoch": 3817} {"train_loss": -6.918373107910156, "global_step": 160334, "epoch": 3817} {"train_loss": -6.87644100189209, "global_step": 160335, "epoch": 3817} {"train_loss": -6.930715560913086, "global_step": 160336, "epoch": 3817} {"train_loss": -7.011957168579102, "global_step": 160337, "epoch": 3817} {"train_loss": -7.004369735717773, "global_step": 160338, "epoch": 3817} {"train_loss": -6.991921424865723, "global_step": 160339, "epoch": 3817} {"train_loss": -6.762821197509766, "global_step": 160340, "epoch": 3817} {"train_loss": -7.011229991912842, "global_step": 160341, "epoch": 3817} {"train_loss": -7.032978057861328, "global_step": 160342, "epoch": 3817} {"train_loss": -6.888275146484375, "global_step": 160343, "epoch": 3817} {"train_loss": -6.928636074066162, "global_step": 160344, "epoch": 3817} {"train_loss": -6.906830787658691, "global_step": 160345, "epoch": 3817} {"train_loss": -6.838064193725586, "global_step": 160346, "epoch": 3817} {"train_loss": -7.044218063354492, "global_step": 160347, "epoch": 3817} {"train_loss": -6.954293251037598, "global_step": 160348, "epoch": 3817} {"train_loss": -6.930599212646484, "global_step": 160349, "epoch": 3817} {"train_loss": -6.916151523590088, "global_step": 160350, "epoch": 3817} {"train_loss": -6.896515846252441, "global_step": 160351, "epoch": 3817} {"train_loss": -7.039310455322266, "global_step": 160352, "epoch": 3817} {"train_loss": -6.930485725402832, "global_step": 160353, "epoch": 3817} {"train_loss": -6.838139533996582, "global_step": 160354, "epoch": 3817} {"train_loss": -6.919972431092035, "global_step": 160355, "epoch": 3817, "val_loss": 68658.921875} {"train_loss": -6.972621917724609, "global_step": 160356, "epoch": 3818} {"train_loss": -6.954100608825684, "global_step": 160357, "epoch": 3818} {"train_loss": -6.996437072753906, "global_step": 160358, "epoch": 3818} {"train_loss": -6.966676712036133, "global_step": 160359, "epoch": 3818} {"train_loss": -6.946883678436279, "global_step": 160360, "epoch": 3818} {"train_loss": -6.775529861450195, "global_step": 160361, "epoch": 3818} {"train_loss": -6.888815879821777, "global_step": 160362, "epoch": 3818} {"train_loss": -6.910161018371582, "global_step": 160363, "epoch": 3818} {"train_loss": -6.966992378234863, "global_step": 160364, "epoch": 3818} {"train_loss": -6.8613810539245605, "global_step": 160365, "epoch": 3818} {"train_loss": -6.836255073547363, "global_step": 160366, "epoch": 3818} {"train_loss": -6.958405494689941, "global_step": 160367, "epoch": 3818} {"train_loss": -6.824680805206299, "global_step": 160368, "epoch": 3818} {"train_loss": -6.826395034790039, "global_step": 160369, "epoch": 3818} {"train_loss": -6.943477630615234, "global_step": 160370, "epoch": 3818} {"train_loss": -6.862792015075684, "global_step": 160371, "epoch": 3818} {"train_loss": -6.8500776290893555, "global_step": 160372, "epoch": 3818} {"train_loss": -6.869250297546387, "global_step": 160373, "epoch": 3818} {"train_loss": -6.881455421447754, "global_step": 160374, "epoch": 3818} {"train_loss": -6.8461222648620605, "global_step": 160375, "epoch": 3818} {"train_loss": -6.7303056716918945, "global_step": 160376, "epoch": 3818} {"train_loss": -6.918131351470947, "global_step": 160377, "epoch": 3818} {"train_loss": -6.822641849517822, "global_step": 160378, "epoch": 3818} {"train_loss": -6.8326945304870605, "global_step": 160379, "epoch": 3818} {"train_loss": -6.819815158843994, "global_step": 160380, "epoch": 3818} {"train_loss": -6.824191093444824, "global_step": 160381, "epoch": 3818} {"train_loss": -7.007554054260254, "global_step": 160382, "epoch": 3818} {"train_loss": -6.923068046569824, "global_step": 160383, "epoch": 3818} {"train_loss": -6.884215354919434, "global_step": 160384, "epoch": 3818} {"train_loss": -6.8648529052734375, "global_step": 160385, "epoch": 3818} {"train_loss": -6.8403215408325195, "global_step": 160386, "epoch": 3818} {"train_loss": -6.728020668029785, "global_step": 160387, "epoch": 3818} {"train_loss": -6.888781547546387, "global_step": 160388, "epoch": 3818} {"train_loss": -6.755485534667969, "global_step": 160389, "epoch": 3818} {"train_loss": -6.699199676513672, "global_step": 160390, "epoch": 3818} {"train_loss": -6.839975833892822, "global_step": 160391, "epoch": 3818} {"train_loss": -6.6878767013549805, "global_step": 160392, "epoch": 3818} {"train_loss": -7.006955146789551, "global_step": 160393, "epoch": 3818} {"train_loss": -6.814770698547363, "global_step": 160394, "epoch": 3818} {"train_loss": -6.821281433105469, "global_step": 160395, "epoch": 3818} {"train_loss": -6.889294624328613, "global_step": 160396, "epoch": 3818} {"train_loss": -6.8683978489467075, "global_step": 160397, "epoch": 3818, "val_loss": 68757.109375} {"train_loss": -6.845242500305176, "global_step": 160398, "epoch": 3819} {"train_loss": -6.850705623626709, "global_step": 160399, "epoch": 3819} {"train_loss": -7.009210586547852, "global_step": 160400, "epoch": 3819} {"train_loss": -6.842796325683594, "global_step": 160401, "epoch": 3819} {"train_loss": -6.886699199676514, "global_step": 160402, "epoch": 3819} {"train_loss": -6.89654541015625, "global_step": 160403, "epoch": 3819} {"train_loss": -6.9097394943237305, "global_step": 160404, "epoch": 3819} {"train_loss": -6.8590898513793945, "global_step": 160405, "epoch": 3819} {"train_loss": -6.8484296798706055, "global_step": 160406, "epoch": 3819} {"train_loss": -6.934701919555664, "global_step": 160407, "epoch": 3819} {"train_loss": -6.923853874206543, "global_step": 160408, "epoch": 3819} {"train_loss": -6.815220832824707, "global_step": 160409, "epoch": 3819} {"train_loss": -6.892210483551025, "global_step": 160410, "epoch": 3819} {"train_loss": -6.78426456451416, "global_step": 160411, "epoch": 3819} {"train_loss": -6.858456611633301, "global_step": 160412, "epoch": 3819} {"train_loss": -6.9120941162109375, "global_step": 160413, "epoch": 3819} {"train_loss": -6.8899455070495605, "global_step": 160414, "epoch": 3819} {"train_loss": -6.876139163970947, "global_step": 160415, "epoch": 3819} {"train_loss": -7.017154216766357, "global_step": 160416, "epoch": 3819} {"train_loss": -6.870394706726074, "global_step": 160417, "epoch": 3819} {"train_loss": -6.780331611633301, "global_step": 160418, "epoch": 3819} {"train_loss": -7.002520561218262, "global_step": 160419, "epoch": 3819} {"train_loss": -6.94741153717041, "global_step": 160420, "epoch": 3819} {"train_loss": -6.903379440307617, "global_step": 160421, "epoch": 3819} {"train_loss": -6.808134078979492, "global_step": 160422, "epoch": 3819} {"train_loss": -6.82427453994751, "global_step": 160423, "epoch": 3819} {"train_loss": -6.971453666687012, "global_step": 160424, "epoch": 3819} {"train_loss": -6.840885162353516, "global_step": 160425, "epoch": 3819} {"train_loss": -6.813262939453125, "global_step": 160426, "epoch": 3819} {"train_loss": -6.996020317077637, "global_step": 160427, "epoch": 3819} {"train_loss": -6.84172248840332, "global_step": 160428, "epoch": 3819} {"train_loss": -6.838686943054199, "global_step": 160429, "epoch": 3819} {"train_loss": -6.853830337524414, "global_step": 160430, "epoch": 3819} {"train_loss": -6.862321853637695, "global_step": 160431, "epoch": 3819} {"train_loss": -6.846728324890137, "global_step": 160432, "epoch": 3819} {"train_loss": -6.905117988586426, "global_step": 160433, "epoch": 3819} {"train_loss": -6.839837074279785, "global_step": 160434, "epoch": 3819} {"train_loss": -6.870504379272461, "global_step": 160435, "epoch": 3819} {"train_loss": -6.830634593963623, "global_step": 160436, "epoch": 3819} {"train_loss": -6.96623420715332, "global_step": 160437, "epoch": 3819} {"train_loss": -6.851271152496338, "global_step": 160438, "epoch": 3819} {"train_loss": -6.880030927203951, "global_step": 160439, "epoch": 3819, "val_loss": 68795.03125} {"train_loss": -6.902802467346191, "global_step": 160440, "epoch": 3820} {"train_loss": -6.816328525543213, "global_step": 160441, "epoch": 3820} {"train_loss": -6.941142559051514, "global_step": 160442, "epoch": 3820} {"train_loss": -6.832057952880859, "global_step": 160443, "epoch": 3820} {"train_loss": -6.946816444396973, "global_step": 160444, "epoch": 3820} {"train_loss": -6.8341827392578125, "global_step": 160445, "epoch": 3820} {"train_loss": -6.805479049682617, "global_step": 160446, "epoch": 3820} {"train_loss": -6.768515586853027, "global_step": 160447, "epoch": 3820} {"train_loss": -6.888099670410156, "global_step": 160448, "epoch": 3820} {"train_loss": -6.816867351531982, "global_step": 160449, "epoch": 3820} {"train_loss": -6.820762634277344, "global_step": 160450, "epoch": 3820} {"train_loss": -6.9300079345703125, "global_step": 160451, "epoch": 3820} {"train_loss": -6.821123123168945, "global_step": 160452, "epoch": 3820} {"train_loss": -6.842073917388916, "global_step": 160453, "epoch": 3820} {"train_loss": -6.879855155944824, "global_step": 160454, "epoch": 3820} {"train_loss": -6.907088279724121, "global_step": 160455, "epoch": 3820} {"train_loss": -6.877366065979004, "global_step": 160456, "epoch": 3820} {"train_loss": -6.925836086273193, "global_step": 160457, "epoch": 3820} {"train_loss": -6.962836742401123, "global_step": 160458, "epoch": 3820} {"train_loss": -6.8515424728393555, "global_step": 160459, "epoch": 3820} {"train_loss": -6.974935531616211, "global_step": 160460, "epoch": 3820} {"train_loss": -7.032025337219238, "global_step": 160461, "epoch": 3820} {"train_loss": -6.9733476638793945, "global_step": 160462, "epoch": 3820} {"train_loss": -7.089226722717285, "global_step": 160463, "epoch": 3820} {"train_loss": -6.828815937042236, "global_step": 160464, "epoch": 3820} {"train_loss": -6.869675636291504, "global_step": 160465, "epoch": 3820} {"train_loss": -6.898564338684082, "global_step": 160466, "epoch": 3820} {"train_loss": -6.916337490081787, "global_step": 160467, "epoch": 3820} {"train_loss": -7.024513244628906, "global_step": 160468, "epoch": 3820} {"train_loss": -7.01971435546875, "global_step": 160469, "epoch": 3820} {"train_loss": -6.998416900634766, "global_step": 160470, "epoch": 3820} {"train_loss": -7.004796981811523, "global_step": 160471, "epoch": 3820} {"train_loss": -6.93479061126709, "global_step": 160472, "epoch": 3820} {"train_loss": -6.859395503997803, "global_step": 160473, "epoch": 3820} {"train_loss": -6.872594833374023, "global_step": 160474, "epoch": 3820} {"train_loss": -6.839447975158691, "global_step": 160475, "epoch": 3820} {"train_loss": -6.939085006713867, "global_step": 160476, "epoch": 3820} {"train_loss": -6.888304710388184, "global_step": 160477, "epoch": 3820} {"train_loss": -6.895450592041016, "global_step": 160478, "epoch": 3820} {"train_loss": -6.859370231628418, "global_step": 160479, "epoch": 3820} {"train_loss": -6.997844696044922, "global_step": 160480, "epoch": 3820} {"train_loss": -6.903584400812785, "global_step": 160481, "epoch": 3820, "val_loss": 68410.1875} {"train_loss": -7.031938552856445, "global_step": 160482, "epoch": 3821} {"train_loss": -6.948791027069092, "global_step": 160483, "epoch": 3821} {"train_loss": -6.892825603485107, "global_step": 160484, "epoch": 3821} {"train_loss": -6.963975429534912, "global_step": 160485, "epoch": 3821} {"train_loss": -6.894050121307373, "global_step": 160486, "epoch": 3821} {"train_loss": -6.959820747375488, "global_step": 160487, "epoch": 3821} {"train_loss": -6.930200576782227, "global_step": 160488, "epoch": 3821} {"train_loss": -6.866489410400391, "global_step": 160489, "epoch": 3821} {"train_loss": -6.832919120788574, "global_step": 160490, "epoch": 3821} {"train_loss": -6.957747459411621, "global_step": 160491, "epoch": 3821} {"train_loss": -6.908468246459961, "global_step": 160492, "epoch": 3821} {"train_loss": -7.015372276306152, "global_step": 160493, "epoch": 3821} {"train_loss": -6.954797744750977, "global_step": 160494, "epoch": 3821} {"train_loss": -6.931231498718262, "global_step": 160495, "epoch": 3821} {"train_loss": -6.935978889465332, "global_step": 160496, "epoch": 3821} {"train_loss": -6.90732479095459, "global_step": 160497, "epoch": 3821} {"train_loss": -6.832540512084961, "global_step": 160498, "epoch": 3821} {"train_loss": -6.881525039672852, "global_step": 160499, "epoch": 3821} {"train_loss": -6.983086585998535, "global_step": 160500, "epoch": 3821} {"train_loss": -6.8607869148254395, "global_step": 160501, "epoch": 3821} {"train_loss": -6.80117654800415, "global_step": 160502, "epoch": 3821} {"train_loss": -6.924112796783447, "global_step": 160503, "epoch": 3821} {"train_loss": -6.914194583892822, "global_step": 160504, "epoch": 3821} {"train_loss": -6.964813232421875, "global_step": 160505, "epoch": 3821} {"train_loss": -6.951418399810791, "global_step": 160506, "epoch": 3821} {"train_loss": -6.872938632965088, "global_step": 160507, "epoch": 3821} {"train_loss": -6.935542106628418, "global_step": 160508, "epoch": 3821} {"train_loss": -6.974155426025391, "global_step": 160509, "epoch": 3821} {"train_loss": -6.820867538452148, "global_step": 160510, "epoch": 3821} {"train_loss": -6.851056098937988, "global_step": 160511, "epoch": 3821} {"train_loss": -6.986281394958496, "global_step": 160512, "epoch": 3821} {"train_loss": -6.805855751037598, "global_step": 160513, "epoch": 3821} {"train_loss": -6.880956172943115, "global_step": 160514, "epoch": 3821} {"train_loss": -6.9247026443481445, "global_step": 160515, "epoch": 3821} {"train_loss": -6.911038875579834, "global_step": 160516, "epoch": 3821} {"train_loss": -6.852882385253906, "global_step": 160517, "epoch": 3821} {"train_loss": -6.710501194000244, "global_step": 160518, "epoch": 3821} {"train_loss": -6.8345794677734375, "global_step": 160519, "epoch": 3821} {"train_loss": -6.771200180053711, "global_step": 160520, "epoch": 3821} {"train_loss": -6.8784918785095215, "global_step": 160521, "epoch": 3821} {"train_loss": -6.869441986083984, "global_step": 160522, "epoch": 3821} {"train_loss": -6.901124590919132, "global_step": 160523, "epoch": 3821, "val_loss": 68588.578125} {"train_loss": -6.913623809814453, "global_step": 160524, "epoch": 3822} {"train_loss": -6.991938591003418, "global_step": 160525, "epoch": 3822} {"train_loss": -6.804340839385986, "global_step": 160526, "epoch": 3822} {"train_loss": -6.963080883026123, "global_step": 160527, "epoch": 3822} {"train_loss": -6.9587225914001465, "global_step": 160528, "epoch": 3822} {"train_loss": -6.876768589019775, "global_step": 160529, "epoch": 3822} {"train_loss": -6.953672409057617, "global_step": 160530, "epoch": 3822} {"train_loss": -6.902759552001953, "global_step": 160531, "epoch": 3822} {"train_loss": -6.912123680114746, "global_step": 160532, "epoch": 3822} {"train_loss": -6.932893753051758, "global_step": 160533, "epoch": 3822} {"train_loss": -6.876142501831055, "global_step": 160534, "epoch": 3822} {"train_loss": -6.803945541381836, "global_step": 160535, "epoch": 3822} {"train_loss": -6.9169769287109375, "global_step": 160536, "epoch": 3822} {"train_loss": -6.958205223083496, "global_step": 160537, "epoch": 3822} {"train_loss": -6.903877258300781, "global_step": 160538, "epoch": 3822} {"train_loss": -6.875688076019287, "global_step": 160539, "epoch": 3822} {"train_loss": -6.897699356079102, "global_step": 160540, "epoch": 3822} {"train_loss": -7.090835094451904, "global_step": 160541, "epoch": 3822} {"train_loss": -7.0567731857299805, "global_step": 160542, "epoch": 3822} {"train_loss": -6.944305419921875, "global_step": 160543, "epoch": 3822} {"train_loss": -6.951887130737305, "global_step": 160544, "epoch": 3822} {"train_loss": -6.889100551605225, "global_step": 160545, "epoch": 3822} {"train_loss": -6.866326332092285, "global_step": 160546, "epoch": 3822} {"train_loss": -6.892795085906982, "global_step": 160547, "epoch": 3822} {"train_loss": -6.892828464508057, "global_step": 160548, "epoch": 3822} {"train_loss": -7.014841079711914, "global_step": 160549, "epoch": 3822} {"train_loss": -6.814781188964844, "global_step": 160550, "epoch": 3822} {"train_loss": -6.9314866065979, "global_step": 160551, "epoch": 3822} {"train_loss": -7.066893577575684, "global_step": 160552, "epoch": 3822} {"train_loss": -6.91146993637085, "global_step": 160553, "epoch": 3822} {"train_loss": -6.97853422164917, "global_step": 160554, "epoch": 3822} {"train_loss": -6.860343933105469, "global_step": 160555, "epoch": 3822} {"train_loss": -6.916469097137451, "global_step": 160556, "epoch": 3822} {"train_loss": -6.93701171875, "global_step": 160557, "epoch": 3822} {"train_loss": -6.903095245361328, "global_step": 160558, "epoch": 3822} {"train_loss": -6.91463041305542, "global_step": 160559, "epoch": 3822} {"train_loss": -6.940077781677246, "global_step": 160560, "epoch": 3822} {"train_loss": -6.929617881774902, "global_step": 160561, "epoch": 3822} {"train_loss": -6.897726058959961, "global_step": 160562, "epoch": 3822} {"train_loss": -6.837771415710449, "global_step": 160563, "epoch": 3822} {"train_loss": -7.033431053161621, "global_step": 160564, "epoch": 3822} {"train_loss": -6.922609476816087, "global_step": 160565, "epoch": 3822, "val_loss": 68784.953125} {"train_loss": -6.925854206085205, "global_step": 160566, "epoch": 3823} {"train_loss": -6.994378089904785, "global_step": 160567, "epoch": 3823} {"train_loss": -6.880921363830566, "global_step": 160568, "epoch": 3823} {"train_loss": -6.834309101104736, "global_step": 160569, "epoch": 3823} {"train_loss": -6.879610538482666, "global_step": 160570, "epoch": 3823} {"train_loss": -6.8278326988220215, "global_step": 160571, "epoch": 3823} {"train_loss": -6.908674716949463, "global_step": 160572, "epoch": 3823} {"train_loss": -6.952264785766602, "global_step": 160573, "epoch": 3823} {"train_loss": -6.863417625427246, "global_step": 160574, "epoch": 3823} {"train_loss": -6.854253768920898, "global_step": 160575, "epoch": 3823} {"train_loss": -6.952669620513916, "global_step": 160576, "epoch": 3823} {"train_loss": -6.970949172973633, "global_step": 160577, "epoch": 3823} {"train_loss": -6.8777313232421875, "global_step": 160578, "epoch": 3823} {"train_loss": -6.931166172027588, "global_step": 160579, "epoch": 3823} {"train_loss": -6.924763202667236, "global_step": 160580, "epoch": 3823} {"train_loss": -6.9333648681640625, "global_step": 160581, "epoch": 3823} {"train_loss": -6.910204887390137, "global_step": 160582, "epoch": 3823} {"train_loss": -6.881817817687988, "global_step": 160583, "epoch": 3823} {"train_loss": -6.940812110900879, "global_step": 160584, "epoch": 3823} {"train_loss": -6.852931499481201, "global_step": 160585, "epoch": 3823} {"train_loss": -6.896188735961914, "global_step": 160586, "epoch": 3823} {"train_loss": -6.973142147064209, "global_step": 160587, "epoch": 3823} {"train_loss": -6.976644039154053, "global_step": 160588, "epoch": 3823} {"train_loss": -7.064617156982422, "global_step": 160589, "epoch": 3823} {"train_loss": -6.9663472175598145, "global_step": 160590, "epoch": 3823} {"train_loss": -6.948794364929199, "global_step": 160591, "epoch": 3823} {"train_loss": -6.834488391876221, "global_step": 160592, "epoch": 3823} {"train_loss": -6.918169021606445, "global_step": 160593, "epoch": 3823} {"train_loss": -6.827974319458008, "global_step": 160594, "epoch": 3823} {"train_loss": -6.907156944274902, "global_step": 160595, "epoch": 3823} {"train_loss": -6.878522872924805, "global_step": 160596, "epoch": 3823} {"train_loss": -6.823058128356934, "global_step": 160597, "epoch": 3823} {"train_loss": -6.914111137390137, "global_step": 160598, "epoch": 3823} {"train_loss": -6.758103847503662, "global_step": 160599, "epoch": 3823} {"train_loss": -6.765517711639404, "global_step": 160600, "epoch": 3823} {"train_loss": -6.871441841125488, "global_step": 160601, "epoch": 3823} {"train_loss": -6.69892692565918, "global_step": 160602, "epoch": 3823} {"train_loss": -6.767085075378418, "global_step": 160603, "epoch": 3823} {"train_loss": -6.919747829437256, "global_step": 160604, "epoch": 3823} {"train_loss": -6.775043964385986, "global_step": 160605, "epoch": 3823} {"train_loss": -6.858229637145996, "global_step": 160606, "epoch": 3823} {"train_loss": -6.890243166968936, "global_step": 160607, "epoch": 3823, "val_loss": 68804.7734375} {"train_loss": -6.778143882751465, "global_step": 160608, "epoch": 3824} {"train_loss": -6.862539291381836, "global_step": 160609, "epoch": 3824} {"train_loss": -6.785861968994141, "global_step": 160610, "epoch": 3824} {"train_loss": -6.851809978485107, "global_step": 160611, "epoch": 3824} {"train_loss": -6.754417419433594, "global_step": 160612, "epoch": 3824} {"train_loss": -6.748689651489258, "global_step": 160613, "epoch": 3824} {"train_loss": -6.751446723937988, "global_step": 160614, "epoch": 3824} {"train_loss": -6.867580413818359, "global_step": 160615, "epoch": 3824} {"train_loss": -6.829133033752441, "global_step": 160616, "epoch": 3824} {"train_loss": -6.982348442077637, "global_step": 160617, "epoch": 3824} {"train_loss": -6.881801128387451, "global_step": 160618, "epoch": 3824} {"train_loss": -6.808807373046875, "global_step": 160619, "epoch": 3824} {"train_loss": -6.787294387817383, "global_step": 160620, "epoch": 3824} {"train_loss": -6.826739311218262, "global_step": 160621, "epoch": 3824} {"train_loss": -6.945285320281982, "global_step": 160622, "epoch": 3824} {"train_loss": -6.895486831665039, "global_step": 160623, "epoch": 3824} {"train_loss": -6.909741401672363, "global_step": 160624, "epoch": 3824} {"train_loss": -6.883999824523926, "global_step": 160625, "epoch": 3824} {"train_loss": -6.793590068817139, "global_step": 160626, "epoch": 3824} {"train_loss": -6.930541038513184, "global_step": 160627, "epoch": 3824} {"train_loss": -6.973737716674805, "global_step": 160628, "epoch": 3824} {"train_loss": -6.837944030761719, "global_step": 160629, "epoch": 3824} {"train_loss": -6.833453178405762, "global_step": 160630, "epoch": 3824} {"train_loss": -7.0525970458984375, "global_step": 160631, "epoch": 3824} {"train_loss": -6.8358049392700195, "global_step": 160632, "epoch": 3824} {"train_loss": -6.904764652252197, "global_step": 160633, "epoch": 3824} {"train_loss": -6.840174674987793, "global_step": 160634, "epoch": 3824} {"train_loss": -6.870463848114014, "global_step": 160635, "epoch": 3824} {"train_loss": -6.785959243774414, "global_step": 160636, "epoch": 3824} {"train_loss": -6.883490562438965, "global_step": 160637, "epoch": 3824} {"train_loss": -6.90352201461792, "global_step": 160638, "epoch": 3824} {"train_loss": -6.7519989013671875, "global_step": 160639, "epoch": 3824} {"train_loss": -6.823030471801758, "global_step": 160640, "epoch": 3824} {"train_loss": -6.930728912353516, "global_step": 160641, "epoch": 3824} {"train_loss": -6.908315181732178, "global_step": 160642, "epoch": 3824} {"train_loss": -6.883260250091553, "global_step": 160643, "epoch": 3824} {"train_loss": -6.866034984588623, "global_step": 160644, "epoch": 3824} {"train_loss": -6.893404960632324, "global_step": 160645, "epoch": 3824} {"train_loss": -6.890997409820557, "global_step": 160646, "epoch": 3824} {"train_loss": -6.795896530151367, "global_step": 160647, "epoch": 3824} {"train_loss": -6.948278427124023, "global_step": 160648, "epoch": 3824} {"train_loss": -6.861910899480184, "global_step": 160649, "epoch": 3824, "val_loss": 68595.1640625} {"train_loss": -6.929352283477783, "global_step": 160650, "epoch": 3825} {"train_loss": -7.0059685707092285, "global_step": 160651, "epoch": 3825} {"train_loss": -7.010926246643066, "global_step": 160652, "epoch": 3825} {"train_loss": -6.9332685470581055, "global_step": 160653, "epoch": 3825} {"train_loss": -7.019474983215332, "global_step": 160654, "epoch": 3825} {"train_loss": -6.91847038269043, "global_step": 160655, "epoch": 3825} {"train_loss": -6.8655171394348145, "global_step": 160656, "epoch": 3825} {"train_loss": -6.823808193206787, "global_step": 160657, "epoch": 3825} {"train_loss": -6.88333797454834, "global_step": 160658, "epoch": 3825} {"train_loss": -6.952252388000488, "global_step": 160659, "epoch": 3825} {"train_loss": -6.805671691894531, "global_step": 160660, "epoch": 3825} {"train_loss": -6.854792594909668, "global_step": 160661, "epoch": 3825} {"train_loss": -6.819909572601318, "global_step": 160662, "epoch": 3825} {"train_loss": -6.827678203582764, "global_step": 160663, "epoch": 3825} {"train_loss": -6.812849998474121, "global_step": 160664, "epoch": 3825} {"train_loss": -6.99600887298584, "global_step": 160665, "epoch": 3825} {"train_loss": -6.863606929779053, "global_step": 160666, "epoch": 3825} {"train_loss": -6.892943859100342, "global_step": 160667, "epoch": 3825} {"train_loss": -6.88687801361084, "global_step": 160668, "epoch": 3825} {"train_loss": -6.778411865234375, "global_step": 160669, "epoch": 3825} {"train_loss": -6.934784889221191, "global_step": 160670, "epoch": 3825} {"train_loss": -6.808967590332031, "global_step": 160671, "epoch": 3825} {"train_loss": -6.773731708526611, "global_step": 160672, "epoch": 3825} {"train_loss": -6.89708948135376, "global_step": 160673, "epoch": 3825} {"train_loss": -6.812161922454834, "global_step": 160674, "epoch": 3825} {"train_loss": -6.795034408569336, "global_step": 160675, "epoch": 3825} {"train_loss": -6.94183349609375, "global_step": 160676, "epoch": 3825} {"train_loss": -6.762373924255371, "global_step": 160677, "epoch": 3825} {"train_loss": -6.92277717590332, "global_step": 160678, "epoch": 3825} {"train_loss": -6.878779411315918, "global_step": 160679, "epoch": 3825} {"train_loss": -6.89010763168335, "global_step": 160680, "epoch": 3825} {"train_loss": -7.034509181976318, "global_step": 160681, "epoch": 3825} {"train_loss": -6.893980026245117, "global_step": 160682, "epoch": 3825} {"train_loss": -6.950449466705322, "global_step": 160683, "epoch": 3825} {"train_loss": -7.014238357543945, "global_step": 160684, "epoch": 3825} {"train_loss": -6.886773109436035, "global_step": 160685, "epoch": 3825} {"train_loss": -6.874911308288574, "global_step": 160686, "epoch": 3825} {"train_loss": -6.964858055114746, "global_step": 160687, "epoch": 3825} {"train_loss": -6.948256969451904, "global_step": 160688, "epoch": 3825} {"train_loss": -7.055655479431152, "global_step": 160689, "epoch": 3825} {"train_loss": -6.981045246124268, "global_step": 160690, "epoch": 3825} {"train_loss": -6.901900813693092, "global_step": 160691, "epoch": 3825, "val_loss": 68604.078125} {"train_loss": -6.877024173736572, "global_step": 160692, "epoch": 3826} {"train_loss": -6.938024997711182, "global_step": 160693, "epoch": 3826} {"train_loss": -6.841934680938721, "global_step": 160694, "epoch": 3826} {"train_loss": -6.938214302062988, "global_step": 160695, "epoch": 3826} {"train_loss": -6.940421104431152, "global_step": 160696, "epoch": 3826} {"train_loss": -7.003159046173096, "global_step": 160697, "epoch": 3826} {"train_loss": -6.9975385665893555, "global_step": 160698, "epoch": 3826} {"train_loss": -6.899344444274902, "global_step": 160699, "epoch": 3826} {"train_loss": -6.92129373550415, "global_step": 160700, "epoch": 3826} {"train_loss": -6.936089515686035, "global_step": 160701, "epoch": 3826} {"train_loss": -7.09368896484375, "global_step": 160702, "epoch": 3826} {"train_loss": -6.932298183441162, "global_step": 160703, "epoch": 3826} {"train_loss": -6.973884105682373, "global_step": 160704, "epoch": 3826} {"train_loss": -6.927170753479004, "global_step": 160705, "epoch": 3826} {"train_loss": -6.984559059143066, "global_step": 160706, "epoch": 3826} {"train_loss": -6.97414493560791, "global_step": 160707, "epoch": 3826} {"train_loss": -6.817639350891113, "global_step": 160708, "epoch": 3826} {"train_loss": -6.992645263671875, "global_step": 160709, "epoch": 3826} {"train_loss": -6.892233848571777, "global_step": 160710, "epoch": 3826} {"train_loss": -6.91949462890625, "global_step": 160711, "epoch": 3826} {"train_loss": -6.832850933074951, "global_step": 160712, "epoch": 3826} {"train_loss": -6.929622650146484, "global_step": 160713, "epoch": 3826} {"train_loss": -6.818050384521484, "global_step": 160714, "epoch": 3826} {"train_loss": -6.825381278991699, "global_step": 160715, "epoch": 3826} {"train_loss": -6.832768440246582, "global_step": 160716, "epoch": 3826} {"train_loss": -6.881317138671875, "global_step": 160717, "epoch": 3826} {"train_loss": -6.822951316833496, "global_step": 160718, "epoch": 3826} {"train_loss": -6.983503341674805, "global_step": 160719, "epoch": 3826} {"train_loss": -6.865835666656494, "global_step": 160720, "epoch": 3826} {"train_loss": -6.846621513366699, "global_step": 160721, "epoch": 3826} {"train_loss": -6.836546421051025, "global_step": 160722, "epoch": 3826} {"train_loss": -6.852720737457275, "global_step": 160723, "epoch": 3826} {"train_loss": -6.711944580078125, "global_step": 160724, "epoch": 3826} {"train_loss": -6.792695999145508, "global_step": 160725, "epoch": 3826} {"train_loss": -6.91154670715332, "global_step": 160726, "epoch": 3826} {"train_loss": -6.653279781341553, "global_step": 160727, "epoch": 3826} {"train_loss": -6.830153465270996, "global_step": 160728, "epoch": 3826} {"train_loss": -6.620668411254883, "global_step": 160729, "epoch": 3826} {"train_loss": -6.823628902435303, "global_step": 160730, "epoch": 3826} {"train_loss": -6.714151382446289, "global_step": 160731, "epoch": 3826} {"train_loss": -6.751233100891113, "global_step": 160732, "epoch": 3826} {"train_loss": -6.871711186000279, "global_step": 160733, "epoch": 3826, "val_loss": 68985.4453125} {"train_loss": -6.769231796264648, "global_step": 160734, "epoch": 3827} {"train_loss": -6.749359130859375, "global_step": 160735, "epoch": 3827} {"train_loss": -6.807035446166992, "global_step": 160736, "epoch": 3827} {"train_loss": -6.733119010925293, "global_step": 160737, "epoch": 3827} {"train_loss": -6.917488098144531, "global_step": 160738, "epoch": 3827} {"train_loss": -6.792720317840576, "global_step": 160739, "epoch": 3827} {"train_loss": -6.885611534118652, "global_step": 160740, "epoch": 3827} {"train_loss": -6.974562168121338, "global_step": 160741, "epoch": 3827} {"train_loss": -6.712503433227539, "global_step": 160742, "epoch": 3827} {"train_loss": -6.877946376800537, "global_step": 160743, "epoch": 3827} {"train_loss": -6.805914402008057, "global_step": 160744, "epoch": 3827} {"train_loss": -6.796789646148682, "global_step": 160745, "epoch": 3827} {"train_loss": -6.806708812713623, "global_step": 160746, "epoch": 3827} {"train_loss": -6.767920017242432, "global_step": 160747, "epoch": 3827} {"train_loss": -6.893054962158203, "global_step": 160748, "epoch": 3827} {"train_loss": -6.806807518005371, "global_step": 160749, "epoch": 3827} {"train_loss": -6.899859428405762, "global_step": 160750, "epoch": 3827} {"train_loss": -6.936773300170898, "global_step": 160751, "epoch": 3827} {"train_loss": -6.865556716918945, "global_step": 160752, "epoch": 3827} {"train_loss": -6.920143127441406, "global_step": 160753, "epoch": 3827} {"train_loss": -6.881165504455566, "global_step": 160754, "epoch": 3827} {"train_loss": -6.873601913452148, "global_step": 160755, "epoch": 3827} {"train_loss": -6.887718677520752, "global_step": 160756, "epoch": 3827} {"train_loss": -7.052355766296387, "global_step": 160757, "epoch": 3827} {"train_loss": -6.891989707946777, "global_step": 160758, "epoch": 3827} {"train_loss": -6.849210262298584, "global_step": 160759, "epoch": 3827} {"train_loss": -6.826107501983643, "global_step": 160760, "epoch": 3827} {"train_loss": -7.041355609893799, "global_step": 160761, "epoch": 3827} {"train_loss": -6.970518112182617, "global_step": 160762, "epoch": 3827} {"train_loss": -6.9254045486450195, "global_step": 160763, "epoch": 3827} {"train_loss": -6.853874206542969, "global_step": 160764, "epoch": 3827} {"train_loss": -6.969336986541748, "global_step": 160765, "epoch": 3827} {"train_loss": -6.917938232421875, "global_step": 160766, "epoch": 3827} {"train_loss": -6.799911975860596, "global_step": 160767, "epoch": 3827} {"train_loss": -6.916742324829102, "global_step": 160768, "epoch": 3827} {"train_loss": -6.9504523277282715, "global_step": 160769, "epoch": 3827} {"train_loss": -6.897415637969971, "global_step": 160770, "epoch": 3827} {"train_loss": -6.989121913909912, "global_step": 160771, "epoch": 3827} {"train_loss": -6.853981018066406, "global_step": 160772, "epoch": 3827} {"train_loss": -6.873421669006348, "global_step": 160773, "epoch": 3827} {"train_loss": -6.865225315093994, "global_step": 160774, "epoch": 3827} {"train_loss": -6.874564693087623, "global_step": 160775, "epoch": 3827, "val_loss": 68439.828125} {"train_loss": -6.843618392944336, "global_step": 160776, "epoch": 3828} {"train_loss": -6.92244815826416, "global_step": 160777, "epoch": 3828} {"train_loss": -6.990960597991943, "global_step": 160778, "epoch": 3828} {"train_loss": -6.840710163116455, "global_step": 160779, "epoch": 3828} {"train_loss": -7.004400253295898, "global_step": 160780, "epoch": 3828} {"train_loss": -6.864812850952148, "global_step": 160781, "epoch": 3828} {"train_loss": -6.89080810546875, "global_step": 160782, "epoch": 3828} {"train_loss": -6.860742568969727, "global_step": 160783, "epoch": 3828} {"train_loss": -6.954141616821289, "global_step": 160784, "epoch": 3828} {"train_loss": -6.83837366104126, "global_step": 160785, "epoch": 3828} {"train_loss": -6.796426296234131, "global_step": 160786, "epoch": 3828} {"train_loss": -6.853157043457031, "global_step": 160787, "epoch": 3828} {"train_loss": -6.841034889221191, "global_step": 160788, "epoch": 3828} {"train_loss": -6.879342079162598, "global_step": 160789, "epoch": 3828} {"train_loss": -6.903146743774414, "global_step": 160790, "epoch": 3828} {"train_loss": -6.900504112243652, "global_step": 160791, "epoch": 3828} {"train_loss": -6.918073654174805, "global_step": 160792, "epoch": 3828} {"train_loss": -6.85800838470459, "global_step": 160793, "epoch": 3828} {"train_loss": -6.805312156677246, "global_step": 160794, "epoch": 3828} {"train_loss": -6.778431415557861, "global_step": 160795, "epoch": 3828} {"train_loss": -6.8405280113220215, "global_step": 160796, "epoch": 3828} {"train_loss": -6.930905818939209, "global_step": 160797, "epoch": 3828} {"train_loss": -6.836332321166992, "global_step": 160798, "epoch": 3828} {"train_loss": -6.832513332366943, "global_step": 160799, "epoch": 3828} {"train_loss": -6.7859954833984375, "global_step": 160800, "epoch": 3828} {"train_loss": -6.933691024780273, "global_step": 160801, "epoch": 3828} {"train_loss": -6.861311435699463, "global_step": 160802, "epoch": 3828} {"train_loss": -6.837089538574219, "global_step": 160803, "epoch": 3828} {"train_loss": -6.757564544677734, "global_step": 160804, "epoch": 3828} {"train_loss": -6.905506610870361, "global_step": 160805, "epoch": 3828} {"train_loss": -6.889753341674805, "global_step": 160806, "epoch": 3828} {"train_loss": -6.963744640350342, "global_step": 160807, "epoch": 3828} {"train_loss": -6.976397514343262, "global_step": 160808, "epoch": 3828} {"train_loss": -7.060235977172852, "global_step": 160809, "epoch": 3828} {"train_loss": -6.9218220710754395, "global_step": 160810, "epoch": 3828} {"train_loss": -6.908474445343018, "global_step": 160811, "epoch": 3828} {"train_loss": -6.97877836227417, "global_step": 160812, "epoch": 3828} {"train_loss": -6.934678077697754, "global_step": 160813, "epoch": 3828} {"train_loss": -6.870428085327148, "global_step": 160814, "epoch": 3828} {"train_loss": -6.9460039138793945, "global_step": 160815, "epoch": 3828} {"train_loss": -7.035493850708008, "global_step": 160816, "epoch": 3828} {"train_loss": -6.894966397966657, "global_step": 160817, "epoch": 3828, "val_loss": 68603.78125} {"train_loss": -6.998904228210449, "global_step": 160818, "epoch": 3829} {"train_loss": -6.997838020324707, "global_step": 160819, "epoch": 3829} {"train_loss": -6.965667724609375, "global_step": 160820, "epoch": 3829} {"train_loss": -7.090193748474121, "global_step": 160821, "epoch": 3829} {"train_loss": -6.94982385635376, "global_step": 160822, "epoch": 3829} {"train_loss": -6.920926570892334, "global_step": 160823, "epoch": 3829} {"train_loss": -7.035141944885254, "global_step": 160824, "epoch": 3829} {"train_loss": -6.8821868896484375, "global_step": 160825, "epoch": 3829} {"train_loss": -6.9378180503845215, "global_step": 160826, "epoch": 3829} {"train_loss": -6.80839729309082, "global_step": 160827, "epoch": 3829} {"train_loss": -6.873988151550293, "global_step": 160828, "epoch": 3829} {"train_loss": -6.802350997924805, "global_step": 160829, "epoch": 3829} {"train_loss": -7.035937786102295, "global_step": 160830, "epoch": 3829} {"train_loss": -6.92315149307251, "global_step": 160831, "epoch": 3829} {"train_loss": -6.980010032653809, "global_step": 160832, "epoch": 3829} {"train_loss": -6.995966911315918, "global_step": 160833, "epoch": 3829} {"train_loss": -6.864676475524902, "global_step": 160834, "epoch": 3829} {"train_loss": -6.9478535652160645, "global_step": 160835, "epoch": 3829} {"train_loss": -6.925050735473633, "global_step": 160836, "epoch": 3829} {"train_loss": -6.9550862312316895, "global_step": 160837, "epoch": 3829} {"train_loss": -7.0253119468688965, "global_step": 160838, "epoch": 3829} {"train_loss": -6.832755088806152, "global_step": 160839, "epoch": 3829} {"train_loss": -6.886927604675293, "global_step": 160840, "epoch": 3829} {"train_loss": -6.859528541564941, "global_step": 160841, "epoch": 3829} {"train_loss": -6.910160064697266, "global_step": 160842, "epoch": 3829} {"train_loss": -6.7964067459106445, "global_step": 160843, "epoch": 3829} {"train_loss": -6.893586158752441, "global_step": 160844, "epoch": 3829} {"train_loss": -6.97822904586792, "global_step": 160845, "epoch": 3829} {"train_loss": -6.946319580078125, "global_step": 160846, "epoch": 3829} {"train_loss": -6.972641468048096, "global_step": 160847, "epoch": 3829} {"train_loss": -7.037993431091309, "global_step": 160848, "epoch": 3829} {"train_loss": -6.8749098777771, "global_step": 160849, "epoch": 3829} {"train_loss": -6.841978073120117, "global_step": 160850, "epoch": 3829} {"train_loss": -6.910640716552734, "global_step": 160851, "epoch": 3829} {"train_loss": -6.912854194641113, "global_step": 160852, "epoch": 3829} {"train_loss": -6.955618858337402, "global_step": 160853, "epoch": 3829} {"train_loss": -6.986005783081055, "global_step": 160854, "epoch": 3829} {"train_loss": -6.909445762634277, "global_step": 160855, "epoch": 3829} {"train_loss": -6.884169578552246, "global_step": 160856, "epoch": 3829} {"train_loss": -6.90962553024292, "global_step": 160857, "epoch": 3829} {"train_loss": -6.827365875244141, "global_step": 160858, "epoch": 3829} {"train_loss": -6.9290458134242465, "global_step": 160859, "epoch": 3829, "val_loss": 68561.28125} {"train_loss": -7.004205703735352, "global_step": 160860, "epoch": 3830} {"train_loss": -6.861572265625, "global_step": 160861, "epoch": 3830} {"train_loss": -6.918434143066406, "global_step": 160862, "epoch": 3830} {"train_loss": -6.848779201507568, "global_step": 160863, "epoch": 3830} {"train_loss": -6.805747032165527, "global_step": 160864, "epoch": 3830} {"train_loss": -6.824719429016113, "global_step": 160865, "epoch": 3830} {"train_loss": -6.976426124572754, "global_step": 160866, "epoch": 3830} {"train_loss": -6.887885093688965, "global_step": 160867, "epoch": 3830} {"train_loss": -6.896525859832764, "global_step": 160868, "epoch": 3830} {"train_loss": -6.879779815673828, "global_step": 160869, "epoch": 3830} {"train_loss": -7.040534973144531, "global_step": 160870, "epoch": 3830} {"train_loss": -6.898777008056641, "global_step": 160871, "epoch": 3830} {"train_loss": -6.9000444412231445, "global_step": 160872, "epoch": 3830} {"train_loss": -6.853277683258057, "global_step": 160873, "epoch": 3830} {"train_loss": -6.970627784729004, "global_step": 160874, "epoch": 3830} {"train_loss": -6.838151931762695, "global_step": 160875, "epoch": 3830} {"train_loss": -6.8007001876831055, "global_step": 160876, "epoch": 3830} {"train_loss": -6.81919527053833, "global_step": 160877, "epoch": 3830} {"train_loss": -6.963600158691406, "global_step": 160878, "epoch": 3830} {"train_loss": -6.808635711669922, "global_step": 160879, "epoch": 3830} {"train_loss": -6.896097183227539, "global_step": 160880, "epoch": 3830} {"train_loss": -6.9070844650268555, "global_step": 160881, "epoch": 3830} {"train_loss": -6.722402095794678, "global_step": 160882, "epoch": 3830} {"train_loss": -6.849271297454834, "global_step": 160883, "epoch": 3830} {"train_loss": -6.921702861785889, "global_step": 160884, "epoch": 3830} {"train_loss": -6.832935333251953, "global_step": 160885, "epoch": 3830} {"train_loss": -6.84650993347168, "global_step": 160886, "epoch": 3830} {"train_loss": -6.928932189941406, "global_step": 160887, "epoch": 3830} {"train_loss": -6.84726095199585, "global_step": 160888, "epoch": 3830} {"train_loss": -6.807888984680176, "global_step": 160889, "epoch": 3830} {"train_loss": -6.888242244720459, "global_step": 160890, "epoch": 3830} {"train_loss": -6.894512176513672, "global_step": 160891, "epoch": 3830} {"train_loss": -6.916921615600586, "global_step": 160892, "epoch": 3830} {"train_loss": -7.0596184730529785, "global_step": 160893, "epoch": 3830} {"train_loss": -6.892361164093018, "global_step": 160894, "epoch": 3830} {"train_loss": -6.915288925170898, "global_step": 160895, "epoch": 3830} {"train_loss": -6.987856864929199, "global_step": 160896, "epoch": 3830} {"train_loss": -6.858395576477051, "global_step": 160897, "epoch": 3830} {"train_loss": -6.978704452514648, "global_step": 160898, "epoch": 3830} {"train_loss": -7.027632713317871, "global_step": 160899, "epoch": 3830} {"train_loss": -6.922861576080322, "global_step": 160900, "epoch": 3830} {"train_loss": -6.893618833451044, "global_step": 160901, "epoch": 3830, "val_loss": 68622.3359375} {"train_loss": -6.956959247589111, "global_step": 160902, "epoch": 3831} {"train_loss": -6.826107978820801, "global_step": 160903, "epoch": 3831} {"train_loss": -6.829054355621338, "global_step": 160904, "epoch": 3831} {"train_loss": -6.953019618988037, "global_step": 160905, "epoch": 3831} {"train_loss": -6.936254501342773, "global_step": 160906, "epoch": 3831} {"train_loss": -6.934624195098877, "global_step": 160907, "epoch": 3831} {"train_loss": -6.803841590881348, "global_step": 160908, "epoch": 3831} {"train_loss": -6.929545879364014, "global_step": 160909, "epoch": 3831} {"train_loss": -6.900595664978027, "global_step": 160910, "epoch": 3831} {"train_loss": -6.900753021240234, "global_step": 160911, "epoch": 3831} {"train_loss": -6.827751159667969, "global_step": 160912, "epoch": 3831} {"train_loss": -6.791324615478516, "global_step": 160913, "epoch": 3831} {"train_loss": -6.7367143630981445, "global_step": 160914, "epoch": 3831} {"train_loss": -6.939398765563965, "global_step": 160915, "epoch": 3831} {"train_loss": -6.986181259155273, "global_step": 160916, "epoch": 3831} {"train_loss": -6.806069374084473, "global_step": 160917, "epoch": 3831} {"train_loss": -6.874757289886475, "global_step": 160918, "epoch": 3831} {"train_loss": -6.721100330352783, "global_step": 160919, "epoch": 3831} {"train_loss": -6.803492546081543, "global_step": 160920, "epoch": 3831} {"train_loss": -6.829394340515137, "global_step": 160921, "epoch": 3831} {"train_loss": -6.808386325836182, "global_step": 160922, "epoch": 3831} {"train_loss": -6.918675899505615, "global_step": 160923, "epoch": 3831} {"train_loss": -6.908347129821777, "global_step": 160924, "epoch": 3831} {"train_loss": -6.742475986480713, "global_step": 160925, "epoch": 3831} {"train_loss": -6.8132781982421875, "global_step": 160926, "epoch": 3831} {"train_loss": -6.906607627868652, "global_step": 160927, "epoch": 3831} {"train_loss": -6.866639137268066, "global_step": 160928, "epoch": 3831} {"train_loss": -6.992506504058838, "global_step": 160929, "epoch": 3831} {"train_loss": -6.9858317375183105, "global_step": 160930, "epoch": 3831} {"train_loss": -6.956695556640625, "global_step": 160931, "epoch": 3831} {"train_loss": -6.993504047393799, "global_step": 160932, "epoch": 3831} {"train_loss": -6.958935260772705, "global_step": 160933, "epoch": 3831} {"train_loss": -6.962984085083008, "global_step": 160934, "epoch": 3831} {"train_loss": -6.903892517089844, "global_step": 160935, "epoch": 3831} {"train_loss": -6.9207940101623535, "global_step": 160936, "epoch": 3831} {"train_loss": -6.91383171081543, "global_step": 160937, "epoch": 3831} {"train_loss": -6.8996357917785645, "global_step": 160938, "epoch": 3831} {"train_loss": -6.983037948608398, "global_step": 160939, "epoch": 3831} {"train_loss": -6.885319709777832, "global_step": 160940, "epoch": 3831} {"train_loss": -6.953544616699219, "global_step": 160941, "epoch": 3831} {"train_loss": -7.002015113830566, "global_step": 160942, "epoch": 3831} {"train_loss": -6.8916053885505315, "global_step": 160943, "epoch": 3831, "val_loss": 68595.2578125} {"train_loss": -6.972020149230957, "global_step": 160944, "epoch": 3832} {"train_loss": -7.057500839233398, "global_step": 160945, "epoch": 3832} {"train_loss": -6.867517471313477, "global_step": 160946, "epoch": 3832} {"train_loss": -6.7765984535217285, "global_step": 160947, "epoch": 3832} {"train_loss": -6.853633880615234, "global_step": 160948, "epoch": 3832} {"train_loss": -7.023543357849121, "global_step": 160949, "epoch": 3832} {"train_loss": -7.005880832672119, "global_step": 160950, "epoch": 3832} {"train_loss": -6.831430435180664, "global_step": 160951, "epoch": 3832} {"train_loss": -6.943434715270996, "global_step": 160952, "epoch": 3832} {"train_loss": -6.804264068603516, "global_step": 160953, "epoch": 3832} {"train_loss": -7.024084091186523, "global_step": 160954, "epoch": 3832} {"train_loss": -6.906719207763672, "global_step": 160955, "epoch": 3832} {"train_loss": -6.964402675628662, "global_step": 160956, "epoch": 3832} {"train_loss": -6.81141996383667, "global_step": 160957, "epoch": 3832} {"train_loss": -6.852761745452881, "global_step": 160958, "epoch": 3832} {"train_loss": -7.000319957733154, "global_step": 160959, "epoch": 3832} {"train_loss": -7.016369342803955, "global_step": 160960, "epoch": 3832} {"train_loss": -6.914999008178711, "global_step": 160961, "epoch": 3832} {"train_loss": -6.999388694763184, "global_step": 160962, "epoch": 3832} {"train_loss": -6.910852432250977, "global_step": 160963, "epoch": 3832} {"train_loss": -6.942476272583008, "global_step": 160964, "epoch": 3832} {"train_loss": -6.857741355895996, "global_step": 160965, "epoch": 3832} {"train_loss": -6.979610443115234, "global_step": 160966, "epoch": 3832} {"train_loss": -6.840891361236572, "global_step": 160967, "epoch": 3832} {"train_loss": -6.929698467254639, "global_step": 160968, "epoch": 3832} {"train_loss": -6.901181697845459, "global_step": 160969, "epoch": 3832} {"train_loss": -7.03954553604126, "global_step": 160970, "epoch": 3832} {"train_loss": -6.998291015625, "global_step": 160971, "epoch": 3832} {"train_loss": -6.913016319274902, "global_step": 160972, "epoch": 3832} {"train_loss": -6.947384834289551, "global_step": 160973, "epoch": 3832} {"train_loss": -6.932901382446289, "global_step": 160974, "epoch": 3832} {"train_loss": -6.955144882202148, "global_step": 160975, "epoch": 3832} {"train_loss": -6.993827819824219, "global_step": 160976, "epoch": 3832} {"train_loss": -7.050902843475342, "global_step": 160977, "epoch": 3832} {"train_loss": -6.909189701080322, "global_step": 160978, "epoch": 3832} {"train_loss": -7.015684127807617, "global_step": 160979, "epoch": 3832} {"train_loss": -6.914970397949219, "global_step": 160980, "epoch": 3832} {"train_loss": -6.832642555236816, "global_step": 160981, "epoch": 3832} {"train_loss": -6.952361106872559, "global_step": 160982, "epoch": 3832} {"train_loss": -6.902872085571289, "global_step": 160983, "epoch": 3832} {"train_loss": -6.814178466796875, "global_step": 160984, "epoch": 3832} {"train_loss": -6.928923254921322, "global_step": 160985, "epoch": 3832, "val_loss": 68607.625} {"train_loss": -6.7878899574279785, "global_step": 160986, "epoch": 3833} {"train_loss": -6.923603057861328, "global_step": 160987, "epoch": 3833} {"train_loss": -6.9326348304748535, "global_step": 160988, "epoch": 3833} {"train_loss": -6.901361465454102, "global_step": 160989, "epoch": 3833} {"train_loss": -6.994294166564941, "global_step": 160990, "epoch": 3833} {"train_loss": -6.917659759521484, "global_step": 160991, "epoch": 3833} {"train_loss": -6.887211799621582, "global_step": 160992, "epoch": 3833} {"train_loss": -6.871992111206055, "global_step": 160993, "epoch": 3833} {"train_loss": -6.968404769897461, "global_step": 160994, "epoch": 3833} {"train_loss": -6.959551811218262, "global_step": 160995, "epoch": 3833} {"train_loss": -6.843789100646973, "global_step": 160996, "epoch": 3833} {"train_loss": -6.856488227844238, "global_step": 160997, "epoch": 3833} {"train_loss": -6.858935356140137, "global_step": 160998, "epoch": 3833} {"train_loss": -6.829227924346924, "global_step": 160999, "epoch": 3833} {"train_loss": -6.899365425109863, "global_step": 161000, "epoch": 3833} {"train_loss": -6.8483734130859375, "global_step": 161001, "epoch": 3833} {"train_loss": -6.905610084533691, "global_step": 161002, "epoch": 3833} {"train_loss": -6.994504451751709, "global_step": 161003, "epoch": 3833} {"train_loss": -6.730488300323486, "global_step": 161004, "epoch": 3833} {"train_loss": -6.887353897094727, "global_step": 161005, "epoch": 3833} {"train_loss": -6.935233116149902, "global_step": 161006, "epoch": 3833} {"train_loss": -6.77885627746582, "global_step": 161007, "epoch": 3833} {"train_loss": -6.878429412841797, "global_step": 161008, "epoch": 3833} {"train_loss": -6.8147077560424805, "global_step": 161009, "epoch": 3833} {"train_loss": -6.868232250213623, "global_step": 161010, "epoch": 3833} {"train_loss": -6.873101234436035, "global_step": 161011, "epoch": 3833} {"train_loss": -6.947819232940674, "global_step": 161012, "epoch": 3833} {"train_loss": -6.880982398986816, "global_step": 161013, "epoch": 3833} {"train_loss": -6.831780910491943, "global_step": 161014, "epoch": 3833} {"train_loss": -6.806358337402344, "global_step": 161015, "epoch": 3833} {"train_loss": -6.88374662399292, "global_step": 161016, "epoch": 3833} {"train_loss": -6.864574432373047, "global_step": 161017, "epoch": 3833} {"train_loss": -6.978813171386719, "global_step": 161018, "epoch": 3833} {"train_loss": -6.906778812408447, "global_step": 161019, "epoch": 3833} {"train_loss": -6.734193801879883, "global_step": 161020, "epoch": 3833} {"train_loss": -6.838456630706787, "global_step": 161021, "epoch": 3833} {"train_loss": -6.86054801940918, "global_step": 161022, "epoch": 3833} {"train_loss": -6.775447368621826, "global_step": 161023, "epoch": 3833} {"train_loss": -6.833430767059326, "global_step": 161024, "epoch": 3833} {"train_loss": -6.831876754760742, "global_step": 161025, "epoch": 3833} {"train_loss": -6.943131446838379, "global_step": 161026, "epoch": 3833} {"train_loss": -6.876341638110933, "global_step": 161027, "epoch": 3833, "val_loss": 68399.140625} {"train_loss": -6.883867263793945, "global_step": 161028, "epoch": 3834} {"train_loss": -6.940352439880371, "global_step": 161029, "epoch": 3834} {"train_loss": -6.9215497970581055, "global_step": 161030, "epoch": 3834} {"train_loss": -6.865322113037109, "global_step": 161031, "epoch": 3834} {"train_loss": -6.887648582458496, "global_step": 161032, "epoch": 3834} {"train_loss": -6.893324375152588, "global_step": 161033, "epoch": 3834} {"train_loss": -6.850936412811279, "global_step": 161034, "epoch": 3834} {"train_loss": -6.948888778686523, "global_step": 161035, "epoch": 3834} {"train_loss": -6.89708137512207, "global_step": 161036, "epoch": 3834} {"train_loss": -7.011625289916992, "global_step": 161037, "epoch": 3834} {"train_loss": -6.913080215454102, "global_step": 161038, "epoch": 3834} {"train_loss": -6.865819931030273, "global_step": 161039, "epoch": 3834} {"train_loss": -6.983652114868164, "global_step": 161040, "epoch": 3834} {"train_loss": -6.880469799041748, "global_step": 161041, "epoch": 3834} {"train_loss": -6.746772289276123, "global_step": 161042, "epoch": 3834} {"train_loss": -6.849725723266602, "global_step": 161043, "epoch": 3834} {"train_loss": -6.884119033813477, "global_step": 161044, "epoch": 3834} {"train_loss": -6.923077583312988, "global_step": 161045, "epoch": 3834} {"train_loss": -6.904389381408691, "global_step": 161046, "epoch": 3834} {"train_loss": -6.905475616455078, "global_step": 161047, "epoch": 3834} {"train_loss": -6.754240036010742, "global_step": 161048, "epoch": 3834} {"train_loss": -6.890961647033691, "global_step": 161049, "epoch": 3834} {"train_loss": -6.844273567199707, "global_step": 161050, "epoch": 3834} {"train_loss": -6.945704460144043, "global_step": 161051, "epoch": 3834} {"train_loss": -6.840807914733887, "global_step": 161052, "epoch": 3834} {"train_loss": -6.833071231842041, "global_step": 161053, "epoch": 3834} {"train_loss": -6.789299488067627, "global_step": 161054, "epoch": 3834} {"train_loss": -6.839280128479004, "global_step": 161055, "epoch": 3834} {"train_loss": -6.892335891723633, "global_step": 161056, "epoch": 3834} {"train_loss": -6.812028884887695, "global_step": 161057, "epoch": 3834} {"train_loss": -6.884157657623291, "global_step": 161058, "epoch": 3834} {"train_loss": -6.884061336517334, "global_step": 161059, "epoch": 3834} {"train_loss": -6.8707990646362305, "global_step": 161060, "epoch": 3834} {"train_loss": -6.853117942810059, "global_step": 161061, "epoch": 3834} {"train_loss": -6.705537796020508, "global_step": 161062, "epoch": 3834} {"train_loss": -6.812139987945557, "global_step": 161063, "epoch": 3834} {"train_loss": -6.809415340423584, "global_step": 161064, "epoch": 3834} {"train_loss": -6.849693298339844, "global_step": 161065, "epoch": 3834} {"train_loss": -6.854395866394043, "global_step": 161066, "epoch": 3834} {"train_loss": -6.822700023651123, "global_step": 161067, "epoch": 3834} {"train_loss": -6.882687568664551, "global_step": 161068, "epoch": 3834} {"train_loss": -6.867841436749413, "global_step": 161069, "epoch": 3834, "val_loss": 68964.734375} {"train_loss": -6.743132591247559, "global_step": 161070, "epoch": 3835} {"train_loss": -6.858755588531494, "global_step": 161071, "epoch": 3835} {"train_loss": -6.699559211730957, "global_step": 161072, "epoch": 3835} {"train_loss": -6.7991943359375, "global_step": 161073, "epoch": 3835} {"train_loss": -6.772340774536133, "global_step": 161074, "epoch": 3835} {"train_loss": -6.751618385314941, "global_step": 161075, "epoch": 3835} {"train_loss": -6.837967395782471, "global_step": 161076, "epoch": 3835} {"train_loss": -6.825949668884277, "global_step": 161077, "epoch": 3835} {"train_loss": -6.934436798095703, "global_step": 161078, "epoch": 3835} {"train_loss": -6.834039688110352, "global_step": 161079, "epoch": 3835} {"train_loss": -6.773565292358398, "global_step": 161080, "epoch": 3835} {"train_loss": -6.812895774841309, "global_step": 161081, "epoch": 3835} {"train_loss": -6.8100666999816895, "global_step": 161082, "epoch": 3835} {"train_loss": -6.850228309631348, "global_step": 161083, "epoch": 3835} {"train_loss": -6.785616874694824, "global_step": 161084, "epoch": 3835} {"train_loss": -6.901678562164307, "global_step": 161085, "epoch": 3835} {"train_loss": -6.827980995178223, "global_step": 161086, "epoch": 3835} {"train_loss": -6.8743181228637695, "global_step": 161087, "epoch": 3835} {"train_loss": -6.802846908569336, "global_step": 161088, "epoch": 3835} {"train_loss": -6.845813751220703, "global_step": 161089, "epoch": 3835} {"train_loss": -6.882352828979492, "global_step": 161090, "epoch": 3835} {"train_loss": -6.8712849617004395, "global_step": 161091, "epoch": 3835} {"train_loss": -6.989048004150391, "global_step": 161092, "epoch": 3835} {"train_loss": -6.9566802978515625, "global_step": 161093, "epoch": 3835} {"train_loss": -6.965985298156738, "global_step": 161094, "epoch": 3835} {"train_loss": -6.976090431213379, "global_step": 161095, "epoch": 3835} {"train_loss": -6.886665344238281, "global_step": 161096, "epoch": 3835} {"train_loss": -6.952116012573242, "global_step": 161097, "epoch": 3835} {"train_loss": -6.923801422119141, "global_step": 161098, "epoch": 3835} {"train_loss": -6.908468246459961, "global_step": 161099, "epoch": 3835} {"train_loss": -6.840761184692383, "global_step": 161100, "epoch": 3835} {"train_loss": -6.8977155685424805, "global_step": 161101, "epoch": 3835} {"train_loss": -6.9905877113342285, "global_step": 161102, "epoch": 3835} {"train_loss": -6.875267505645752, "global_step": 161103, "epoch": 3835} {"train_loss": -6.972240447998047, "global_step": 161104, "epoch": 3835} {"train_loss": -6.940954208374023, "global_step": 161105, "epoch": 3835} {"train_loss": -6.921030044555664, "global_step": 161106, "epoch": 3835} {"train_loss": -6.978232383728027, "global_step": 161107, "epoch": 3835} {"train_loss": -6.815700531005859, "global_step": 161108, "epoch": 3835} {"train_loss": -6.993875026702881, "global_step": 161109, "epoch": 3835} {"train_loss": -6.863254070281982, "global_step": 161110, "epoch": 3835} {"train_loss": -6.87161492166065, "global_step": 161111, "epoch": 3835, "val_loss": 68541.7265625} {"train_loss": -6.920194625854492, "global_step": 161112, "epoch": 3836} {"train_loss": -6.906582832336426, "global_step": 161113, "epoch": 3836} {"train_loss": -6.900477886199951, "global_step": 161114, "epoch": 3836} {"train_loss": -6.9713335037231445, "global_step": 161115, "epoch": 3836} {"train_loss": -6.9342193603515625, "global_step": 161116, "epoch": 3836} {"train_loss": -6.851093769073486, "global_step": 161117, "epoch": 3836} {"train_loss": -6.889894485473633, "global_step": 161118, "epoch": 3836} {"train_loss": -6.85682487487793, "global_step": 161119, "epoch": 3836} {"train_loss": -6.919517517089844, "global_step": 161120, "epoch": 3836} {"train_loss": -6.8689374923706055, "global_step": 161121, "epoch": 3836} {"train_loss": -6.938979625701904, "global_step": 161122, "epoch": 3836} {"train_loss": -7.046403408050537, "global_step": 161123, "epoch": 3836} {"train_loss": -6.977622985839844, "global_step": 161124, "epoch": 3836} {"train_loss": -6.802440166473389, "global_step": 161125, "epoch": 3836} {"train_loss": -6.971711158752441, "global_step": 161126, "epoch": 3836} {"train_loss": -6.979070663452148, "global_step": 161127, "epoch": 3836} {"train_loss": -7.0297980308532715, "global_step": 161128, "epoch": 3836} {"train_loss": -6.890349388122559, "global_step": 161129, "epoch": 3836} {"train_loss": -7.0337443351745605, "global_step": 161130, "epoch": 3836} {"train_loss": -6.7396559715271, "global_step": 161131, "epoch": 3836} {"train_loss": -6.985681056976318, "global_step": 161132, "epoch": 3836} {"train_loss": -7.007796764373779, "global_step": 161133, "epoch": 3836} {"train_loss": -6.820374488830566, "global_step": 161134, "epoch": 3836} {"train_loss": -7.050320625305176, "global_step": 161135, "epoch": 3836} {"train_loss": -6.8514814376831055, "global_step": 161136, "epoch": 3836} {"train_loss": -6.96132230758667, "global_step": 161137, "epoch": 3836} {"train_loss": -6.990924835205078, "global_step": 161138, "epoch": 3836} {"train_loss": -6.891613960266113, "global_step": 161139, "epoch": 3836} {"train_loss": -6.965670585632324, "global_step": 161140, "epoch": 3836} {"train_loss": -6.832773685455322, "global_step": 161141, "epoch": 3836} {"train_loss": -6.940132141113281, "global_step": 161142, "epoch": 3836} {"train_loss": -6.864843845367432, "global_step": 161143, "epoch": 3836} {"train_loss": -6.871922969818115, "global_step": 161144, "epoch": 3836} {"train_loss": -6.959210395812988, "global_step": 161145, "epoch": 3836} {"train_loss": -6.877294540405273, "global_step": 161146, "epoch": 3836} {"train_loss": -6.879779815673828, "global_step": 161147, "epoch": 3836} {"train_loss": -6.971402168273926, "global_step": 161148, "epoch": 3836} {"train_loss": -6.848974227905273, "global_step": 161149, "epoch": 3836} {"train_loss": -6.970734596252441, "global_step": 161150, "epoch": 3836} {"train_loss": -6.990096569061279, "global_step": 161151, "epoch": 3836} {"train_loss": -6.875868320465088, "global_step": 161152, "epoch": 3836} {"train_loss": -6.922248079663231, "global_step": 161153, "epoch": 3836, "val_loss": 68549.0859375} {"train_loss": -6.941424369812012, "global_step": 161154, "epoch": 3837} {"train_loss": -6.900085926055908, "global_step": 161155, "epoch": 3837} {"train_loss": -6.879765510559082, "global_step": 161156, "epoch": 3837} {"train_loss": -6.865045547485352, "global_step": 161157, "epoch": 3837} {"train_loss": -6.994504928588867, "global_step": 161158, "epoch": 3837} {"train_loss": -6.976768970489502, "global_step": 161159, "epoch": 3837} {"train_loss": -7.079028129577637, "global_step": 161160, "epoch": 3837} {"train_loss": -6.886338233947754, "global_step": 161161, "epoch": 3837} {"train_loss": -6.826789855957031, "global_step": 161162, "epoch": 3837} {"train_loss": -7.008641242980957, "global_step": 161163, "epoch": 3837} {"train_loss": -6.976136207580566, "global_step": 161164, "epoch": 3837} {"train_loss": -7.043689250946045, "global_step": 161165, "epoch": 3837} {"train_loss": -6.9029741287231445, "global_step": 161166, "epoch": 3837} {"train_loss": -6.9755730628967285, "global_step": 161167, "epoch": 3837} {"train_loss": -6.975192070007324, "global_step": 161168, "epoch": 3837} {"train_loss": -6.891386032104492, "global_step": 161169, "epoch": 3837} {"train_loss": -6.941256523132324, "global_step": 161170, "epoch": 3837} {"train_loss": -6.949283599853516, "global_step": 161171, "epoch": 3837} {"train_loss": -6.763580322265625, "global_step": 161172, "epoch": 3837} {"train_loss": -6.917054653167725, "global_step": 161173, "epoch": 3837} {"train_loss": -6.968133926391602, "global_step": 161174, "epoch": 3837} {"train_loss": -6.763646125793457, "global_step": 161175, "epoch": 3837} {"train_loss": -7.0505690574646, "global_step": 161176, "epoch": 3837} {"train_loss": -6.963131904602051, "global_step": 161177, "epoch": 3837} {"train_loss": -6.850261688232422, "global_step": 161178, "epoch": 3837} {"train_loss": -6.922289848327637, "global_step": 161179, "epoch": 3837} {"train_loss": -6.853041648864746, "global_step": 161180, "epoch": 3837} {"train_loss": -6.92941427230835, "global_step": 161181, "epoch": 3837} {"train_loss": -6.829425811767578, "global_step": 161182, "epoch": 3837} {"train_loss": -6.925139427185059, "global_step": 161183, "epoch": 3837} {"train_loss": -6.829336643218994, "global_step": 161184, "epoch": 3837} {"train_loss": -6.830890655517578, "global_step": 161185, "epoch": 3837} {"train_loss": -6.894436836242676, "global_step": 161186, "epoch": 3837} {"train_loss": -6.836555480957031, "global_step": 161187, "epoch": 3837} {"train_loss": -6.905505657196045, "global_step": 161188, "epoch": 3837} {"train_loss": -6.986941814422607, "global_step": 161189, "epoch": 3837} {"train_loss": -6.928384304046631, "global_step": 161190, "epoch": 3837} {"train_loss": -6.9718241691589355, "global_step": 161191, "epoch": 3837} {"train_loss": -6.9371442794799805, "global_step": 161192, "epoch": 3837} {"train_loss": -6.754568099975586, "global_step": 161193, "epoch": 3837} {"train_loss": -6.989438533782959, "global_step": 161194, "epoch": 3837} {"train_loss": -6.918110813413348, "global_step": 161195, "epoch": 3837, "val_loss": 68465.640625} {"train_loss": -6.848733425140381, "global_step": 161196, "epoch": 3838} {"train_loss": -6.875579357147217, "global_step": 161197, "epoch": 3838} {"train_loss": -6.741936683654785, "global_step": 161198, "epoch": 3838} {"train_loss": -6.944659233093262, "global_step": 161199, "epoch": 3838} {"train_loss": -6.911177635192871, "global_step": 161200, "epoch": 3838} {"train_loss": -6.921282768249512, "global_step": 161201, "epoch": 3838} {"train_loss": -6.781850814819336, "global_step": 161202, "epoch": 3838} {"train_loss": -6.882065773010254, "global_step": 161203, "epoch": 3838} {"train_loss": -6.921405792236328, "global_step": 161204, "epoch": 3838} {"train_loss": -6.845210075378418, "global_step": 161205, "epoch": 3838} {"train_loss": -7.018196105957031, "global_step": 161206, "epoch": 3838} {"train_loss": -6.895144462585449, "global_step": 161207, "epoch": 3838} {"train_loss": -6.8365631103515625, "global_step": 161208, "epoch": 3838} {"train_loss": -6.86398983001709, "global_step": 161209, "epoch": 3838} {"train_loss": -6.8887481689453125, "global_step": 161210, "epoch": 3838} {"train_loss": -6.8871049880981445, "global_step": 161211, "epoch": 3838} {"train_loss": -6.830723762512207, "global_step": 161212, "epoch": 3838} {"train_loss": -6.903264045715332, "global_step": 161213, "epoch": 3838} {"train_loss": -6.950579643249512, "global_step": 161214, "epoch": 3838} {"train_loss": -6.869470596313477, "global_step": 161215, "epoch": 3838} {"train_loss": -6.870377063751221, "global_step": 161216, "epoch": 3838} {"train_loss": -6.7651238441467285, "global_step": 161217, "epoch": 3838} {"train_loss": -6.853089332580566, "global_step": 161218, "epoch": 3838} {"train_loss": -6.8625311851501465, "global_step": 161219, "epoch": 3838} {"train_loss": -6.739511966705322, "global_step": 161220, "epoch": 3838} {"train_loss": -6.855373382568359, "global_step": 161221, "epoch": 3838} {"train_loss": -6.936498641967773, "global_step": 161222, "epoch": 3838} {"train_loss": -6.931921005249023, "global_step": 161223, "epoch": 3838} {"train_loss": -6.876167297363281, "global_step": 161224, "epoch": 3838} {"train_loss": -6.866340160369873, "global_step": 161225, "epoch": 3838} {"train_loss": -6.8473052978515625, "global_step": 161226, "epoch": 3838} {"train_loss": -6.935510635375977, "global_step": 161227, "epoch": 3838} {"train_loss": -6.939765453338623, "global_step": 161228, "epoch": 3838} {"train_loss": -6.880006790161133, "global_step": 161229, "epoch": 3838} {"train_loss": -6.68391752243042, "global_step": 161230, "epoch": 3838} {"train_loss": -6.894639015197754, "global_step": 161231, "epoch": 3838} {"train_loss": -6.905776023864746, "global_step": 161232, "epoch": 3838} {"train_loss": -6.889072418212891, "global_step": 161233, "epoch": 3838} {"train_loss": -6.881120204925537, "global_step": 161234, "epoch": 3838} {"train_loss": -6.872723579406738, "global_step": 161235, "epoch": 3838} {"train_loss": -6.914742946624756, "global_step": 161236, "epoch": 3838} {"train_loss": -6.87501395316351, "global_step": 161237, "epoch": 3838, "val_loss": 68558.0625} {"train_loss": -6.868635177612305, "global_step": 161238, "epoch": 3839} {"train_loss": -6.959378242492676, "global_step": 161239, "epoch": 3839} {"train_loss": -6.862738609313965, "global_step": 161240, "epoch": 3839} {"train_loss": -7.000148773193359, "global_step": 161241, "epoch": 3839} {"train_loss": -6.915382385253906, "global_step": 161242, "epoch": 3839} {"train_loss": -6.899109840393066, "global_step": 161243, "epoch": 3839} {"train_loss": -6.867984294891357, "global_step": 161244, "epoch": 3839} {"train_loss": -6.918378829956055, "global_step": 161245, "epoch": 3839} {"train_loss": -6.904531955718994, "global_step": 161246, "epoch": 3839} {"train_loss": -6.824721336364746, "global_step": 161247, "epoch": 3839} {"train_loss": -6.89109992980957, "global_step": 161248, "epoch": 3839} {"train_loss": -6.940943717956543, "global_step": 161249, "epoch": 3839} {"train_loss": -6.901226997375488, "global_step": 161250, "epoch": 3839} {"train_loss": -6.949742317199707, "global_step": 161251, "epoch": 3839} {"train_loss": -6.908751487731934, "global_step": 161252, "epoch": 3839} {"train_loss": -6.8367695808410645, "global_step": 161253, "epoch": 3839} {"train_loss": -6.842329978942871, "global_step": 161254, "epoch": 3839} {"train_loss": -6.907951354980469, "global_step": 161255, "epoch": 3839} {"train_loss": -6.949181079864502, "global_step": 161256, "epoch": 3839} {"train_loss": -6.880686283111572, "global_step": 161257, "epoch": 3839} {"train_loss": -6.96377420425415, "global_step": 161258, "epoch": 3839} {"train_loss": -7.012240409851074, "global_step": 161259, "epoch": 3839} {"train_loss": -6.934709548950195, "global_step": 161260, "epoch": 3839} {"train_loss": -6.925869464874268, "global_step": 161261, "epoch": 3839} {"train_loss": -6.9640793800354, "global_step": 161262, "epoch": 3839} {"train_loss": -7.041688919067383, "global_step": 161263, "epoch": 3839} {"train_loss": -6.858623504638672, "global_step": 161264, "epoch": 3839} {"train_loss": -6.92352819442749, "global_step": 161265, "epoch": 3839} {"train_loss": -6.974854469299316, "global_step": 161266, "epoch": 3839} {"train_loss": -6.860004425048828, "global_step": 161267, "epoch": 3839} {"train_loss": -6.931819915771484, "global_step": 161268, "epoch": 3839} {"train_loss": -6.919227600097656, "global_step": 161269, "epoch": 3839} {"train_loss": -6.973964691162109, "global_step": 161270, "epoch": 3839} {"train_loss": -7.078217506408691, "global_step": 161271, "epoch": 3839} {"train_loss": -7.065357208251953, "global_step": 161272, "epoch": 3839} {"train_loss": -6.924452781677246, "global_step": 161273, "epoch": 3839} {"train_loss": -6.919830322265625, "global_step": 161274, "epoch": 3839} {"train_loss": -6.777207374572754, "global_step": 161275, "epoch": 3839} {"train_loss": -6.9163970947265625, "global_step": 161276, "epoch": 3839} {"train_loss": -6.968805313110352, "global_step": 161277, "epoch": 3839} {"train_loss": -6.867897987365723, "global_step": 161278, "epoch": 3839} {"train_loss": -6.924421753202166, "global_step": 161279, "epoch": 3839, "val_loss": 68462.234375} {"train_loss": -7.019996643066406, "global_step": 161280, "epoch": 3840} {"train_loss": -6.972541809082031, "global_step": 161281, "epoch": 3840} {"train_loss": -6.889915466308594, "global_step": 161282, "epoch": 3840} {"train_loss": -7.010848522186279, "global_step": 161283, "epoch": 3840} {"train_loss": -7.016835689544678, "global_step": 161284, "epoch": 3840} {"train_loss": -6.935527801513672, "global_step": 161285, "epoch": 3840} {"train_loss": -6.9783124923706055, "global_step": 161286, "epoch": 3840} {"train_loss": -6.980640411376953, "global_step": 161287, "epoch": 3840} {"train_loss": -6.843357086181641, "global_step": 161288, "epoch": 3840} {"train_loss": -6.892290115356445, "global_step": 161289, "epoch": 3840} {"train_loss": -6.947238922119141, "global_step": 161290, "epoch": 3840} {"train_loss": -6.996221542358398, "global_step": 161291, "epoch": 3840} {"train_loss": -6.984806060791016, "global_step": 161292, "epoch": 3840} {"train_loss": -6.970639705657959, "global_step": 161293, "epoch": 3840} {"train_loss": -6.905266284942627, "global_step": 161294, "epoch": 3840} {"train_loss": -6.91585636138916, "global_step": 161295, "epoch": 3840} {"train_loss": -6.80511999130249, "global_step": 161296, "epoch": 3840} {"train_loss": -6.944586753845215, "global_step": 161297, "epoch": 3840} {"train_loss": -7.0618157386779785, "global_step": 161298, "epoch": 3840} {"train_loss": -6.842920303344727, "global_step": 161299, "epoch": 3840} {"train_loss": -6.9437665939331055, "global_step": 161300, "epoch": 3840} {"train_loss": -6.968595504760742, "global_step": 161301, "epoch": 3840} {"train_loss": -6.840394973754883, "global_step": 161302, "epoch": 3840} {"train_loss": -6.921910285949707, "global_step": 161303, "epoch": 3840} {"train_loss": -6.903364181518555, "global_step": 161304, "epoch": 3840} {"train_loss": -6.9226861000061035, "global_step": 161305, "epoch": 3840} {"train_loss": -6.818848609924316, "global_step": 161306, "epoch": 3840} {"train_loss": -6.931939601898193, "global_step": 161307, "epoch": 3840} {"train_loss": -6.989230155944824, "global_step": 161308, "epoch": 3840} {"train_loss": -6.79679012298584, "global_step": 161309, "epoch": 3840} {"train_loss": -6.967353820800781, "global_step": 161310, "epoch": 3840} {"train_loss": -6.905089378356934, "global_step": 161311, "epoch": 3840} {"train_loss": -6.9282636642456055, "global_step": 161312, "epoch": 3840} {"train_loss": -7.0341291427612305, "global_step": 161313, "epoch": 3840} {"train_loss": -6.892726898193359, "global_step": 161314, "epoch": 3840} {"train_loss": -6.875496864318848, "global_step": 161315, "epoch": 3840} {"train_loss": -6.839092254638672, "global_step": 161316, "epoch": 3840} {"train_loss": -6.883307456970215, "global_step": 161317, "epoch": 3840} {"train_loss": -6.880999565124512, "global_step": 161318, "epoch": 3840} {"train_loss": -6.845810890197754, "global_step": 161319, "epoch": 3840} {"train_loss": -6.7537641525268555, "global_step": 161320, "epoch": 3840} {"train_loss": -6.919404029846191, "global_step": 161321, "epoch": 3840, "val_loss": 68731.9921875} {"train_loss": -6.891831398010254, "global_step": 161322, "epoch": 3841} {"train_loss": -6.949273109436035, "global_step": 161323, "epoch": 3841} {"train_loss": -6.891432285308838, "global_step": 161324, "epoch": 3841} {"train_loss": -6.965396881103516, "global_step": 161325, "epoch": 3841} {"train_loss": -6.880680084228516, "global_step": 161326, "epoch": 3841} {"train_loss": -6.9596357345581055, "global_step": 161327, "epoch": 3841} {"train_loss": -6.8760294914245605, "global_step": 161328, "epoch": 3841} {"train_loss": -7.028997898101807, "global_step": 161329, "epoch": 3841} {"train_loss": -7.101873874664307, "global_step": 161330, "epoch": 3841} {"train_loss": -6.849920749664307, "global_step": 161331, "epoch": 3841} {"train_loss": -6.8976569175720215, "global_step": 161332, "epoch": 3841} {"train_loss": -6.957420349121094, "global_step": 161333, "epoch": 3841} {"train_loss": -6.851307392120361, "global_step": 161334, "epoch": 3841} {"train_loss": -6.9701128005981445, "global_step": 161335, "epoch": 3841} {"train_loss": -6.973941802978516, "global_step": 161336, "epoch": 3841} {"train_loss": -6.922518730163574, "global_step": 161337, "epoch": 3841} {"train_loss": -7.001362323760986, "global_step": 161338, "epoch": 3841} {"train_loss": -6.935920715332031, "global_step": 161339, "epoch": 3841} {"train_loss": -6.943214416503906, "global_step": 161340, "epoch": 3841} {"train_loss": -7.023414134979248, "global_step": 161341, "epoch": 3841} {"train_loss": -6.924790382385254, "global_step": 161342, "epoch": 3841} {"train_loss": -6.893181324005127, "global_step": 161343, "epoch": 3841} {"train_loss": -6.859776020050049, "global_step": 161344, "epoch": 3841} {"train_loss": -6.686529636383057, "global_step": 161345, "epoch": 3841} {"train_loss": -6.973600387573242, "global_step": 161346, "epoch": 3841} {"train_loss": -6.994228363037109, "global_step": 161347, "epoch": 3841} {"train_loss": -6.813729286193848, "global_step": 161348, "epoch": 3841} {"train_loss": -6.888708114624023, "global_step": 161349, "epoch": 3841} {"train_loss": -6.838845252990723, "global_step": 161350, "epoch": 3841} {"train_loss": -6.818115711212158, "global_step": 161351, "epoch": 3841} {"train_loss": -6.936781883239746, "global_step": 161352, "epoch": 3841} {"train_loss": -6.937373638153076, "global_step": 161353, "epoch": 3841} {"train_loss": -6.882129192352295, "global_step": 161354, "epoch": 3841} {"train_loss": -6.772327423095703, "global_step": 161355, "epoch": 3841} {"train_loss": -6.8167033195495605, "global_step": 161356, "epoch": 3841} {"train_loss": -6.899196624755859, "global_step": 161357, "epoch": 3841} {"train_loss": -6.732581615447998, "global_step": 161358, "epoch": 3841} {"train_loss": -7.055006980895996, "global_step": 161359, "epoch": 3841} {"train_loss": -6.812456130981445, "global_step": 161360, "epoch": 3841} {"train_loss": -6.806550025939941, "global_step": 161361, "epoch": 3841} {"train_loss": -6.866209983825684, "global_step": 161362, "epoch": 3841} {"train_loss": -6.90129398164295, "global_step": 161363, "epoch": 3841, "val_loss": 68388.28125} {"train_loss": -6.851531982421875, "global_step": 161364, "epoch": 3842} {"train_loss": -6.764924049377441, "global_step": 161365, "epoch": 3842} {"train_loss": -6.785131931304932, "global_step": 161366, "epoch": 3842} {"train_loss": -6.859025955200195, "global_step": 161367, "epoch": 3842} {"train_loss": -6.657686233520508, "global_step": 161368, "epoch": 3842} {"train_loss": -6.879700660705566, "global_step": 161369, "epoch": 3842} {"train_loss": -6.824387550354004, "global_step": 161370, "epoch": 3842} {"train_loss": -6.817111015319824, "global_step": 161371, "epoch": 3842} {"train_loss": -6.825945854187012, "global_step": 161372, "epoch": 3842} {"train_loss": -6.733098983764648, "global_step": 161373, "epoch": 3842} {"train_loss": -6.684338092803955, "global_step": 161374, "epoch": 3842} {"train_loss": -6.914210796356201, "global_step": 161375, "epoch": 3842} {"train_loss": -6.782165050506592, "global_step": 161376, "epoch": 3842} {"train_loss": -6.7272629737854, "global_step": 161377, "epoch": 3842} {"train_loss": -6.768892288208008, "global_step": 161378, "epoch": 3842} {"train_loss": -6.84470272064209, "global_step": 161379, "epoch": 3842} {"train_loss": -6.884275436401367, "global_step": 161380, "epoch": 3842} {"train_loss": -6.890955924987793, "global_step": 161381, "epoch": 3842} {"train_loss": -6.890036106109619, "global_step": 161382, "epoch": 3842} {"train_loss": -6.776681900024414, "global_step": 161383, "epoch": 3842} {"train_loss": -6.896615028381348, "global_step": 161384, "epoch": 3842} {"train_loss": -6.809332370758057, "global_step": 161385, "epoch": 3842} {"train_loss": -6.887306213378906, "global_step": 161386, "epoch": 3842} {"train_loss": -6.906227111816406, "global_step": 161387, "epoch": 3842} {"train_loss": -6.920209884643555, "global_step": 161388, "epoch": 3842} {"train_loss": -6.878862380981445, "global_step": 161389, "epoch": 3842} {"train_loss": -6.885505199432373, "global_step": 161390, "epoch": 3842} {"train_loss": -6.8394012451171875, "global_step": 161391, "epoch": 3842} {"train_loss": -7.0448198318481445, "global_step": 161392, "epoch": 3842} {"train_loss": -6.882054805755615, "global_step": 161393, "epoch": 3842} {"train_loss": -6.908023834228516, "global_step": 161394, "epoch": 3842} {"train_loss": -6.864780902862549, "global_step": 161395, "epoch": 3842} {"train_loss": -6.850221633911133, "global_step": 161396, "epoch": 3842} {"train_loss": -6.912273406982422, "global_step": 161397, "epoch": 3842} {"train_loss": -6.954132080078125, "global_step": 161398, "epoch": 3842} {"train_loss": -6.921574115753174, "global_step": 161399, "epoch": 3842} {"train_loss": -6.99796724319458, "global_step": 161400, "epoch": 3842} {"train_loss": -6.848688125610352, "global_step": 161401, "epoch": 3842} {"train_loss": -6.891471862792969, "global_step": 161402, "epoch": 3842} {"train_loss": -6.9470438957214355, "global_step": 161403, "epoch": 3842} {"train_loss": -6.979029178619385, "global_step": 161404, "epoch": 3842} {"train_loss": -6.858788626534598, "global_step": 161405, "epoch": 3842, "val_loss": 68672.3359375} {"train_loss": -6.9427618980407715, "global_step": 161406, "epoch": 3843} {"train_loss": -6.981048583984375, "global_step": 161407, "epoch": 3843} {"train_loss": -6.823594093322754, "global_step": 161408, "epoch": 3843} {"train_loss": -6.845255374908447, "global_step": 161409, "epoch": 3843} {"train_loss": -6.970376014709473, "global_step": 161410, "epoch": 3843} {"train_loss": -6.848015308380127, "global_step": 161411, "epoch": 3843} {"train_loss": -6.951832294464111, "global_step": 161412, "epoch": 3843} {"train_loss": -6.868921756744385, "global_step": 161413, "epoch": 3843} {"train_loss": -6.837615013122559, "global_step": 161414, "epoch": 3843} {"train_loss": -6.955025672912598, "global_step": 161415, "epoch": 3843} {"train_loss": -6.793034076690674, "global_step": 161416, "epoch": 3843} {"train_loss": -6.844539165496826, "global_step": 161417, "epoch": 3843} {"train_loss": -6.764066696166992, "global_step": 161418, "epoch": 3843} {"train_loss": -6.792866230010986, "global_step": 161419, "epoch": 3843} {"train_loss": -6.816133499145508, "global_step": 161420, "epoch": 3843} {"train_loss": -6.893098831176758, "global_step": 161421, "epoch": 3843} {"train_loss": -6.781910419464111, "global_step": 161422, "epoch": 3843} {"train_loss": -6.921359062194824, "global_step": 161423, "epoch": 3843} {"train_loss": -6.924882411956787, "global_step": 161424, "epoch": 3843} {"train_loss": -6.96079158782959, "global_step": 161425, "epoch": 3843} {"train_loss": -6.85255765914917, "global_step": 161426, "epoch": 3843} {"train_loss": -6.836533546447754, "global_step": 161427, "epoch": 3843} {"train_loss": -6.875545501708984, "global_step": 161428, "epoch": 3843} {"train_loss": -6.8676862716674805, "global_step": 161429, "epoch": 3843} {"train_loss": -6.923223495483398, "global_step": 161430, "epoch": 3843} {"train_loss": -6.94069766998291, "global_step": 161431, "epoch": 3843} {"train_loss": -6.884417533874512, "global_step": 161432, "epoch": 3843} {"train_loss": -6.8412628173828125, "global_step": 161433, "epoch": 3843} {"train_loss": -6.866758823394775, "global_step": 161434, "epoch": 3843} {"train_loss": -6.782975196838379, "global_step": 161435, "epoch": 3843} {"train_loss": -7.0673933029174805, "global_step": 161436, "epoch": 3843} {"train_loss": -6.938792705535889, "global_step": 161437, "epoch": 3843} {"train_loss": -6.861630439758301, "global_step": 161438, "epoch": 3843} {"train_loss": -6.857294082641602, "global_step": 161439, "epoch": 3843} {"train_loss": -7.040185928344727, "global_step": 161440, "epoch": 3843} {"train_loss": -6.919717788696289, "global_step": 161441, "epoch": 3843} {"train_loss": -6.959782600402832, "global_step": 161442, "epoch": 3843} {"train_loss": -6.796270370483398, "global_step": 161443, "epoch": 3843} {"train_loss": -6.922991752624512, "global_step": 161444, "epoch": 3843} {"train_loss": -6.966655731201172, "global_step": 161445, "epoch": 3843} {"train_loss": -7.033766746520996, "global_step": 161446, "epoch": 3843} {"train_loss": -6.8925889900752475, "global_step": 161447, "epoch": 3843, "val_loss": 68465.3984375} {"train_loss": -6.861514091491699, "global_step": 161448, "epoch": 3844} {"train_loss": -6.940582275390625, "global_step": 161449, "epoch": 3844} {"train_loss": -7.033322334289551, "global_step": 161450, "epoch": 3844} {"train_loss": -6.919153213500977, "global_step": 161451, "epoch": 3844} {"train_loss": -6.951358795166016, "global_step": 161452, "epoch": 3844} {"train_loss": -7.081887722015381, "global_step": 161453, "epoch": 3844} {"train_loss": -6.981134414672852, "global_step": 161454, "epoch": 3844} {"train_loss": -6.984199523925781, "global_step": 161455, "epoch": 3844} {"train_loss": -7.005808353424072, "global_step": 161456, "epoch": 3844} {"train_loss": -6.969636917114258, "global_step": 161457, "epoch": 3844} {"train_loss": -6.910921573638916, "global_step": 161458, "epoch": 3844} {"train_loss": -6.963596343994141, "global_step": 161459, "epoch": 3844} {"train_loss": -6.949450969696045, "global_step": 161460, "epoch": 3844} {"train_loss": -6.965869903564453, "global_step": 161461, "epoch": 3844} {"train_loss": -6.930231094360352, "global_step": 161462, "epoch": 3844} {"train_loss": -6.945710182189941, "global_step": 161463, "epoch": 3844} {"train_loss": -6.985867977142334, "global_step": 161464, "epoch": 3844} {"train_loss": -6.864922523498535, "global_step": 161465, "epoch": 3844} {"train_loss": -7.0369954109191895, "global_step": 161466, "epoch": 3844} {"train_loss": -7.109260559082031, "global_step": 161467, "epoch": 3844} {"train_loss": -7.042322158813477, "global_step": 161468, "epoch": 3844} {"train_loss": -6.967369556427002, "global_step": 161469, "epoch": 3844} {"train_loss": -7.093334197998047, "global_step": 161470, "epoch": 3844} {"train_loss": -6.912355422973633, "global_step": 161471, "epoch": 3844} {"train_loss": -6.945841312408447, "global_step": 161472, "epoch": 3844} {"train_loss": -6.951385974884033, "global_step": 161473, "epoch": 3844} {"train_loss": -6.879334926605225, "global_step": 161474, "epoch": 3844} {"train_loss": -6.991555213928223, "global_step": 161475, "epoch": 3844} {"train_loss": -6.933828830718994, "global_step": 161476, "epoch": 3844} {"train_loss": -6.961935043334961, "global_step": 161477, "epoch": 3844} {"train_loss": -6.876012802124023, "global_step": 161478, "epoch": 3844} {"train_loss": -6.9245710372924805, "global_step": 161479, "epoch": 3844} {"train_loss": -6.898153305053711, "global_step": 161480, "epoch": 3844} {"train_loss": -6.867099761962891, "global_step": 161481, "epoch": 3844} {"train_loss": -6.983867168426514, "global_step": 161482, "epoch": 3844} {"train_loss": -6.940204620361328, "global_step": 161483, "epoch": 3844} {"train_loss": -6.968746662139893, "global_step": 161484, "epoch": 3844} {"train_loss": -6.97938346862793, "global_step": 161485, "epoch": 3844} {"train_loss": -6.921204566955566, "global_step": 161486, "epoch": 3844} {"train_loss": -6.980839729309082, "global_step": 161487, "epoch": 3844} {"train_loss": -7.008979797363281, "global_step": 161488, "epoch": 3844} {"train_loss": -6.958556833721342, "global_step": 161489, "epoch": 3844, "val_loss": 68767.0546875} {"train_loss": -6.856598854064941, "global_step": 161490, "epoch": 3845} {"train_loss": -6.880495071411133, "global_step": 161491, "epoch": 3845} {"train_loss": -6.9190354347229, "global_step": 161492, "epoch": 3845} {"train_loss": -6.85174560546875, "global_step": 161493, "epoch": 3845} {"train_loss": -6.781343936920166, "global_step": 161494, "epoch": 3845} {"train_loss": -6.917872428894043, "global_step": 161495, "epoch": 3845} {"train_loss": -6.938943386077881, "global_step": 161496, "epoch": 3845} {"train_loss": -6.853875637054443, "global_step": 161497, "epoch": 3845} {"train_loss": -6.788610458374023, "global_step": 161498, "epoch": 3845} {"train_loss": -6.925777912139893, "global_step": 161499, "epoch": 3845} {"train_loss": -6.8056230545043945, "global_step": 161500, "epoch": 3845} {"train_loss": -6.795560359954834, "global_step": 161501, "epoch": 3845} {"train_loss": -6.86617374420166, "global_step": 161502, "epoch": 3845} {"train_loss": -6.889056205749512, "global_step": 161503, "epoch": 3845} {"train_loss": -6.898480415344238, "global_step": 161504, "epoch": 3845} {"train_loss": -6.982048511505127, "global_step": 161505, "epoch": 3845} {"train_loss": -6.9520463943481445, "global_step": 161506, "epoch": 3845} {"train_loss": -6.792471885681152, "global_step": 161507, "epoch": 3845} {"train_loss": -6.915736198425293, "global_step": 161508, "epoch": 3845} {"train_loss": -6.846801280975342, "global_step": 161509, "epoch": 3845} {"train_loss": -6.80988883972168, "global_step": 161510, "epoch": 3845} {"train_loss": -6.954653263092041, "global_step": 161511, "epoch": 3845} {"train_loss": -6.950460433959961, "global_step": 161512, "epoch": 3845} {"train_loss": -6.86124849319458, "global_step": 161513, "epoch": 3845} {"train_loss": -6.908416748046875, "global_step": 161514, "epoch": 3845} {"train_loss": -6.869568824768066, "global_step": 161515, "epoch": 3845} {"train_loss": -7.006596565246582, "global_step": 161516, "epoch": 3845} {"train_loss": -6.915562629699707, "global_step": 161517, "epoch": 3845} {"train_loss": -7.021475315093994, "global_step": 161518, "epoch": 3845} {"train_loss": -6.9658403396606445, "global_step": 161519, "epoch": 3845} {"train_loss": -6.917566776275635, "global_step": 161520, "epoch": 3845} {"train_loss": -7.0470476150512695, "global_step": 161521, "epoch": 3845} {"train_loss": -6.875337600708008, "global_step": 161522, "epoch": 3845} {"train_loss": -7.026963233947754, "global_step": 161523, "epoch": 3845} {"train_loss": -6.906833648681641, "global_step": 161524, "epoch": 3845} {"train_loss": -6.768448829650879, "global_step": 161525, "epoch": 3845} {"train_loss": -6.932692050933838, "global_step": 161526, "epoch": 3845} {"train_loss": -6.99714469909668, "global_step": 161527, "epoch": 3845} {"train_loss": -6.905206680297852, "global_step": 161528, "epoch": 3845} {"train_loss": -6.8676533699035645, "global_step": 161529, "epoch": 3845} {"train_loss": -6.951270580291748, "global_step": 161530, "epoch": 3845} {"train_loss": -6.900703929719471, "global_step": 161531, "epoch": 3845, "val_loss": 68477.4375} {"train_loss": -6.941558837890625, "global_step": 161532, "epoch": 3846} {"train_loss": -6.8460917472839355, "global_step": 161533, "epoch": 3846} {"train_loss": -6.810033798217773, "global_step": 161534, "epoch": 3846} {"train_loss": -6.961709976196289, "global_step": 161535, "epoch": 3846} {"train_loss": -7.028798580169678, "global_step": 161536, "epoch": 3846} {"train_loss": -6.814839839935303, "global_step": 161537, "epoch": 3846} {"train_loss": -7.032253742218018, "global_step": 161538, "epoch": 3846} {"train_loss": -6.851161956787109, "global_step": 161539, "epoch": 3846} {"train_loss": -6.818630695343018, "global_step": 161540, "epoch": 3846} {"train_loss": -6.85709285736084, "global_step": 161541, "epoch": 3846} {"train_loss": -6.88309383392334, "global_step": 161542, "epoch": 3846} {"train_loss": -6.83533239364624, "global_step": 161543, "epoch": 3846} {"train_loss": -7.02974796295166, "global_step": 161544, "epoch": 3846} {"train_loss": -6.828764915466309, "global_step": 161545, "epoch": 3846} {"train_loss": -6.849845886230469, "global_step": 161546, "epoch": 3846} {"train_loss": -6.896565914154053, "global_step": 161547, "epoch": 3846} {"train_loss": -6.822927474975586, "global_step": 161548, "epoch": 3846} {"train_loss": -6.792207717895508, "global_step": 161549, "epoch": 3846} {"train_loss": -6.899812698364258, "global_step": 161550, "epoch": 3846} {"train_loss": -6.802109718322754, "global_step": 161551, "epoch": 3846} {"train_loss": -6.765054702758789, "global_step": 161552, "epoch": 3846} {"train_loss": -6.813701629638672, "global_step": 161553, "epoch": 3846} {"train_loss": -6.891119003295898, "global_step": 161554, "epoch": 3846} {"train_loss": -6.945764541625977, "global_step": 161555, "epoch": 3846} {"train_loss": -6.915535926818848, "global_step": 161556, "epoch": 3846} {"train_loss": -6.823428153991699, "global_step": 161557, "epoch": 3846} {"train_loss": -6.986981391906738, "global_step": 161558, "epoch": 3846} {"train_loss": -6.773176193237305, "global_step": 161559, "epoch": 3846} {"train_loss": -6.934926986694336, "global_step": 161560, "epoch": 3846} {"train_loss": -6.956354141235352, "global_step": 161561, "epoch": 3846} {"train_loss": -6.8394293785095215, "global_step": 161562, "epoch": 3846} {"train_loss": -7.00314998626709, "global_step": 161563, "epoch": 3846} {"train_loss": -6.987982749938965, "global_step": 161564, "epoch": 3846} {"train_loss": -6.85249137878418, "global_step": 161565, "epoch": 3846} {"train_loss": -6.985552787780762, "global_step": 161566, "epoch": 3846} {"train_loss": -6.82603645324707, "global_step": 161567, "epoch": 3846} {"train_loss": -6.961128234863281, "global_step": 161568, "epoch": 3846} {"train_loss": -6.795863151550293, "global_step": 161569, "epoch": 3846} {"train_loss": -7.0455427169799805, "global_step": 161570, "epoch": 3846} {"train_loss": -6.961399078369141, "global_step": 161571, "epoch": 3846} {"train_loss": -6.869135856628418, "global_step": 161572, "epoch": 3846} {"train_loss": -6.889111598332723, "global_step": 161573, "epoch": 3846, "val_loss": 68459.5625} {"train_loss": -6.930289268493652, "global_step": 161574, "epoch": 3847} {"train_loss": -6.991945743560791, "global_step": 161575, "epoch": 3847} {"train_loss": -6.8549699783325195, "global_step": 161576, "epoch": 3847} {"train_loss": -6.944117546081543, "global_step": 161577, "epoch": 3847} {"train_loss": -6.923490524291992, "global_step": 161578, "epoch": 3847} {"train_loss": -6.923376083374023, "global_step": 161579, "epoch": 3847} {"train_loss": -6.758991718292236, "global_step": 161580, "epoch": 3847} {"train_loss": -6.863530158996582, "global_step": 161581, "epoch": 3847} {"train_loss": -7.026796340942383, "global_step": 161582, "epoch": 3847} {"train_loss": -6.732138633728027, "global_step": 161583, "epoch": 3847} {"train_loss": -6.9221320152282715, "global_step": 161584, "epoch": 3847} {"train_loss": -6.957427024841309, "global_step": 161585, "epoch": 3847} {"train_loss": -6.979524612426758, "global_step": 161586, "epoch": 3847} {"train_loss": -6.909846305847168, "global_step": 161587, "epoch": 3847} {"train_loss": -6.896936416625977, "global_step": 161588, "epoch": 3847} {"train_loss": -6.941784381866455, "global_step": 161589, "epoch": 3847} {"train_loss": -6.9278483390808105, "global_step": 161590, "epoch": 3847} {"train_loss": -6.9097137451171875, "global_step": 161591, "epoch": 3847} {"train_loss": -6.984265327453613, "global_step": 161592, "epoch": 3847} {"train_loss": -6.9529852867126465, "global_step": 161593, "epoch": 3847} {"train_loss": -6.983665466308594, "global_step": 161594, "epoch": 3847} {"train_loss": -7.008563995361328, "global_step": 161595, "epoch": 3847} {"train_loss": -7.02206563949585, "global_step": 161596, "epoch": 3847} {"train_loss": -6.979704856872559, "global_step": 161597, "epoch": 3847} {"train_loss": -6.926679611206055, "global_step": 161598, "epoch": 3847} {"train_loss": -7.0044660568237305, "global_step": 161599, "epoch": 3847} {"train_loss": -7.0329413414001465, "global_step": 161600, "epoch": 3847} {"train_loss": -6.918766021728516, "global_step": 161601, "epoch": 3847} {"train_loss": -6.980321407318115, "global_step": 161602, "epoch": 3847} {"train_loss": -6.975831985473633, "global_step": 161603, "epoch": 3847} {"train_loss": -6.856894493103027, "global_step": 161604, "epoch": 3847} {"train_loss": -6.991228103637695, "global_step": 161605, "epoch": 3847} {"train_loss": -6.899301052093506, "global_step": 161606, "epoch": 3847} {"train_loss": -6.92324161529541, "global_step": 161607, "epoch": 3847} {"train_loss": -6.877266883850098, "global_step": 161608, "epoch": 3847} {"train_loss": -6.961843490600586, "global_step": 161609, "epoch": 3847} {"train_loss": -6.98923397064209, "global_step": 161610, "epoch": 3847} {"train_loss": -6.882794380187988, "global_step": 161611, "epoch": 3847} {"train_loss": -6.757602691650391, "global_step": 161612, "epoch": 3847} {"train_loss": -7.020820617675781, "global_step": 161613, "epoch": 3847} {"train_loss": -6.814976692199707, "global_step": 161614, "epoch": 3847} {"train_loss": -6.9261489822751, "global_step": 161615, "epoch": 3847, "val_loss": 68445.53125} {"train_loss": -6.904517650604248, "global_step": 161616, "epoch": 3848} {"train_loss": -6.919166564941406, "global_step": 161617, "epoch": 3848} {"train_loss": -6.864925384521484, "global_step": 161618, "epoch": 3848} {"train_loss": -6.875087738037109, "global_step": 161619, "epoch": 3848} {"train_loss": -6.775576591491699, "global_step": 161620, "epoch": 3848} {"train_loss": -6.9187703132629395, "global_step": 161621, "epoch": 3848} {"train_loss": -6.936887264251709, "global_step": 161622, "epoch": 3848} {"train_loss": -6.8564558029174805, "global_step": 161623, "epoch": 3848} {"train_loss": -6.800898551940918, "global_step": 161624, "epoch": 3848} {"train_loss": -6.96353816986084, "global_step": 161625, "epoch": 3848} {"train_loss": -6.823434829711914, "global_step": 161626, "epoch": 3848} {"train_loss": -6.897553443908691, "global_step": 161627, "epoch": 3848} {"train_loss": -6.86522102355957, "global_step": 161628, "epoch": 3848} {"train_loss": -6.937748908996582, "global_step": 161629, "epoch": 3848} {"train_loss": -7.0191264152526855, "global_step": 161630, "epoch": 3848} {"train_loss": -6.817361354827881, "global_step": 161631, "epoch": 3848} {"train_loss": -6.959705829620361, "global_step": 161632, "epoch": 3848} {"train_loss": -7.002085208892822, "global_step": 161633, "epoch": 3848} {"train_loss": -6.807040691375732, "global_step": 161634, "epoch": 3848} {"train_loss": -7.065108299255371, "global_step": 161635, "epoch": 3848} {"train_loss": -6.87385892868042, "global_step": 161636, "epoch": 3848} {"train_loss": -6.812315940856934, "global_step": 161637, "epoch": 3848} {"train_loss": -6.780113220214844, "global_step": 161638, "epoch": 3848} {"train_loss": -6.8861799240112305, "global_step": 161639, "epoch": 3848} {"train_loss": -6.8790082931518555, "global_step": 161640, "epoch": 3848} {"train_loss": -6.859375, "global_step": 161641, "epoch": 3848} {"train_loss": -7.022464752197266, "global_step": 161642, "epoch": 3848} {"train_loss": -6.873762130737305, "global_step": 161643, "epoch": 3848} {"train_loss": -6.9941582679748535, "global_step": 161644, "epoch": 3848} {"train_loss": -6.908751487731934, "global_step": 161645, "epoch": 3848} {"train_loss": -6.849446773529053, "global_step": 161646, "epoch": 3848} {"train_loss": -6.92011022567749, "global_step": 161647, "epoch": 3848} {"train_loss": -6.933209419250488, "global_step": 161648, "epoch": 3848} {"train_loss": -6.892437934875488, "global_step": 161649, "epoch": 3848} {"train_loss": -6.843784332275391, "global_step": 161650, "epoch": 3848} {"train_loss": -7.05152702331543, "global_step": 161651, "epoch": 3848} {"train_loss": -7.000328063964844, "global_step": 161652, "epoch": 3848} {"train_loss": -6.848369598388672, "global_step": 161653, "epoch": 3848} {"train_loss": -6.9556427001953125, "global_step": 161654, "epoch": 3848} {"train_loss": -6.911837577819824, "global_step": 161655, "epoch": 3848} {"train_loss": -6.958752632141113, "global_step": 161656, "epoch": 3848} {"train_loss": -6.9055024328685946, "global_step": 161657, "epoch": 3848, "val_loss": 68619.078125} {"train_loss": -6.967057228088379, "global_step": 161658, "epoch": 3849} {"train_loss": -6.9112701416015625, "global_step": 161659, "epoch": 3849} {"train_loss": -6.912267684936523, "global_step": 161660, "epoch": 3849} {"train_loss": -6.945522308349609, "global_step": 161661, "epoch": 3849} {"train_loss": -6.961807727813721, "global_step": 161662, "epoch": 3849} {"train_loss": -6.940666198730469, "global_step": 161663, "epoch": 3849} {"train_loss": -7.031379222869873, "global_step": 161664, "epoch": 3849} {"train_loss": -6.990481376647949, "global_step": 161665, "epoch": 3849} {"train_loss": -6.863150119781494, "global_step": 161666, "epoch": 3849} {"train_loss": -6.926901340484619, "global_step": 161667, "epoch": 3849} {"train_loss": -7.000423908233643, "global_step": 161668, "epoch": 3849} {"train_loss": -6.958012580871582, "global_step": 161669, "epoch": 3849} {"train_loss": -6.975917816162109, "global_step": 161670, "epoch": 3849} {"train_loss": -6.982837677001953, "global_step": 161671, "epoch": 3849} {"train_loss": -6.900041580200195, "global_step": 161672, "epoch": 3849} {"train_loss": -6.9615278244018555, "global_step": 161673, "epoch": 3849} {"train_loss": -6.973541736602783, "global_step": 161674, "epoch": 3849} {"train_loss": -7.0029449462890625, "global_step": 161675, "epoch": 3849} {"train_loss": -6.974581718444824, "global_step": 161676, "epoch": 3849} {"train_loss": -6.987760543823242, "global_step": 161677, "epoch": 3849} {"train_loss": -6.950218677520752, "global_step": 161678, "epoch": 3849} {"train_loss": -6.958822250366211, "global_step": 161679, "epoch": 3849} {"train_loss": -6.939217567443848, "global_step": 161680, "epoch": 3849} {"train_loss": -6.941417694091797, "global_step": 161681, "epoch": 3849} {"train_loss": -6.968189239501953, "global_step": 161682, "epoch": 3849} {"train_loss": -6.759490966796875, "global_step": 161683, "epoch": 3849} {"train_loss": -6.834597587585449, "global_step": 161684, "epoch": 3849} {"train_loss": -6.907537460327148, "global_step": 161685, "epoch": 3849} {"train_loss": -6.895325660705566, "global_step": 161686, "epoch": 3849} {"train_loss": -6.922497272491455, "global_step": 161687, "epoch": 3849} {"train_loss": -6.959088325500488, "global_step": 161688, "epoch": 3849} {"train_loss": -6.981205463409424, "global_step": 161689, "epoch": 3849} {"train_loss": -6.9451189041137695, "global_step": 161690, "epoch": 3849} {"train_loss": -6.928197860717773, "global_step": 161691, "epoch": 3849} {"train_loss": -6.855735778808594, "global_step": 161692, "epoch": 3849} {"train_loss": -7.033082962036133, "global_step": 161693, "epoch": 3849} {"train_loss": -6.924848556518555, "global_step": 161694, "epoch": 3849} {"train_loss": -6.86058235168457, "global_step": 161695, "epoch": 3849} {"train_loss": -6.9894890785217285, "global_step": 161696, "epoch": 3849} {"train_loss": -6.916263103485107, "global_step": 161697, "epoch": 3849} {"train_loss": -7.004685878753662, "global_step": 161698, "epoch": 3849} {"train_loss": -6.941731396175566, "global_step": 161699, "epoch": 3849, "val_loss": 68521.171875} {"train_loss": -7.009067058563232, "global_step": 161700, "epoch": 3850} {"train_loss": -7.003671646118164, "global_step": 161701, "epoch": 3850} {"train_loss": -6.923442840576172, "global_step": 161702, "epoch": 3850} {"train_loss": -6.9631500244140625, "global_step": 161703, "epoch": 3850} {"train_loss": -6.866515159606934, "global_step": 161704, "epoch": 3850} {"train_loss": -6.9480438232421875, "global_step": 161705, "epoch": 3850} {"train_loss": -6.900524139404297, "global_step": 161706, "epoch": 3850} {"train_loss": -6.88238525390625, "global_step": 161707, "epoch": 3850} {"train_loss": -6.991817951202393, "global_step": 161708, "epoch": 3850} {"train_loss": -6.872866630554199, "global_step": 161709, "epoch": 3850} {"train_loss": -6.865929126739502, "global_step": 161710, "epoch": 3850} {"train_loss": -7.020537376403809, "global_step": 161711, "epoch": 3850} {"train_loss": -6.978480339050293, "global_step": 161712, "epoch": 3850} {"train_loss": -6.868345260620117, "global_step": 161713, "epoch": 3850} {"train_loss": -6.857512474060059, "global_step": 161714, "epoch": 3850} {"train_loss": -6.874186992645264, "global_step": 161715, "epoch": 3850} {"train_loss": -6.840330123901367, "global_step": 161716, "epoch": 3850} {"train_loss": -6.926337242126465, "global_step": 161717, "epoch": 3850} {"train_loss": -6.79927921295166, "global_step": 161718, "epoch": 3850} {"train_loss": -6.846038818359375, "global_step": 161719, "epoch": 3850} {"train_loss": -6.874150276184082, "global_step": 161720, "epoch": 3850} {"train_loss": -6.8632354736328125, "global_step": 161721, "epoch": 3850} {"train_loss": -6.987836837768555, "global_step": 161722, "epoch": 3850} {"train_loss": -6.924154281616211, "global_step": 161723, "epoch": 3850} {"train_loss": -6.717308044433594, "global_step": 161724, "epoch": 3850} {"train_loss": -6.916902542114258, "global_step": 161725, "epoch": 3850} {"train_loss": -6.964577674865723, "global_step": 161726, "epoch": 3850} {"train_loss": -6.938755989074707, "global_step": 161727, "epoch": 3850} {"train_loss": -6.933376312255859, "global_step": 161728, "epoch": 3850} {"train_loss": -6.995643615722656, "global_step": 161729, "epoch": 3850} {"train_loss": -6.952986717224121, "global_step": 161730, "epoch": 3850} {"train_loss": -6.948794364929199, "global_step": 161731, "epoch": 3850} {"train_loss": -6.772239685058594, "global_step": 161732, "epoch": 3850} {"train_loss": -6.844493865966797, "global_step": 161733, "epoch": 3850} {"train_loss": -6.94618558883667, "global_step": 161734, "epoch": 3850} {"train_loss": -7.039397239685059, "global_step": 161735, "epoch": 3850} {"train_loss": -6.924752235412598, "global_step": 161736, "epoch": 3850} {"train_loss": -6.928330898284912, "global_step": 161737, "epoch": 3850} {"train_loss": -6.912042617797852, "global_step": 161738, "epoch": 3850} {"train_loss": -6.974727630615234, "global_step": 161739, "epoch": 3850} {"train_loss": -7.0415167808532715, "global_step": 161740, "epoch": 3850} {"train_loss": -6.916574716567993, "global_step": 161741, "epoch": 3850, "train/sim_max_reward_0": 0.2424862967785142, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.7720483467295046, "train/sim_max_reward_3": 0.3892273425043404, "train/sim_max_reward_4": 0.9944076381099881, "train/sim_max_reward_5": 0.9586475392381328, "test/sim_max_reward_4400000": 0.8948613308946444, "test/sim_max_reward_4400001": 0.33969236806755504, "test/sim_max_reward_4400002": 0.9048486345043492, "test/sim_max_reward_4400003": 0.8792666302300798, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.6234330505976721, "test/sim_max_reward_4400006": 0.9609242277412192, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.31190210944653723, "test/sim_max_reward_4400009": 0.9827949908162352, "test/sim_max_reward_4400010": 0.9135214754231986, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9896684016590644, "test/sim_max_reward_4400013": 0.839012184146386, "test/sim_max_reward_4400014": 0.8924403819201242, "test/sim_max_reward_4400015": 0.4973029812950595, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24747535161204529, "test/sim_max_reward_4400019": 0.00019749179870471169, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9100775102973034, "test/sim_max_reward_4400023": 0.8153141494968811, "test/sim_max_reward_4400024": 0.9678287502227121, "test/sim_max_reward_4400025": 0.2648668475902712, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.006890238613499369, "test/sim_max_reward_4400028": 0.8294608343100323, "test/sim_max_reward_4400029": 0.8423679831333225, "test/sim_max_reward_4400030": 0.9205084593539696, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.545616861024375, "test/sim_max_reward_4400034": 0.8494289254940435, "test/sim_max_reward_4400035": 0.8605099291673731, "test/sim_max_reward_4400036": 0.5398837273709872, "test/sim_max_reward_4400037": 0.9845601997023493, "test/sim_max_reward_4400038": 0.8853651858650552, "test/sim_max_reward_4400039": 0.9687880667378806, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8591264119545904, "test/sim_max_reward_4400042": 0.5148403947742806, "test/sim_max_reward_4400043": 0.920216973820165, "test/sim_max_reward_4400044": 0.7013752759861277, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.9804385208028878, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.9665546141868981, "train/mean_score": 0.7261361938934133, "test/mean_score": 0.5991511290117755, "val_loss": 68566.4453125} {"train_loss": -6.9762444496154785, "global_step": 161742, "epoch": 3851} {"train_loss": -6.990167617797852, "global_step": 161743, "epoch": 3851} {"train_loss": -6.969188213348389, "global_step": 161744, "epoch": 3851} {"train_loss": -6.973335266113281, "global_step": 161745, "epoch": 3851} {"train_loss": -6.914534568786621, "global_step": 161746, "epoch": 3851} {"train_loss": -6.886504650115967, "global_step": 161747, "epoch": 3851} {"train_loss": -6.8886260986328125, "global_step": 161748, "epoch": 3851} {"train_loss": -7.115243911743164, "global_step": 161749, "epoch": 3851} {"train_loss": -6.983224868774414, "global_step": 161750, "epoch": 3851} {"train_loss": -6.907940864562988, "global_step": 161751, "epoch": 3851} {"train_loss": -6.906810760498047, "global_step": 161752, "epoch": 3851} {"train_loss": -6.995649337768555, "global_step": 161753, "epoch": 3851} {"train_loss": -6.924848556518555, "global_step": 161754, "epoch": 3851} {"train_loss": -6.948644638061523, "global_step": 161755, "epoch": 3851} {"train_loss": -6.932358741760254, "global_step": 161756, "epoch": 3851} {"train_loss": -6.853710651397705, "global_step": 161757, "epoch": 3851} {"train_loss": -6.969878196716309, "global_step": 161758, "epoch": 3851} {"train_loss": -6.955313205718994, "global_step": 161759, "epoch": 3851} {"train_loss": -6.984758377075195, "global_step": 161760, "epoch": 3851} {"train_loss": -6.8572998046875, "global_step": 161761, "epoch": 3851} {"train_loss": -6.989558696746826, "global_step": 161762, "epoch": 3851} {"train_loss": -6.813503742218018, "global_step": 161763, "epoch": 3851} {"train_loss": -6.894030570983887, "global_step": 161764, "epoch": 3851} {"train_loss": -6.8753862380981445, "global_step": 161765, "epoch": 3851} {"train_loss": -6.83077335357666, "global_step": 161766, "epoch": 3851} {"train_loss": -6.918269157409668, "global_step": 161767, "epoch": 3851} {"train_loss": -6.917829513549805, "global_step": 161768, "epoch": 3851} {"train_loss": -6.8160271644592285, "global_step": 161769, "epoch": 3851} {"train_loss": -6.842381477355957, "global_step": 161770, "epoch": 3851} {"train_loss": -6.903823375701904, "global_step": 161771, "epoch": 3851} {"train_loss": -6.9045562744140625, "global_step": 161772, "epoch": 3851} {"train_loss": -6.93889045715332, "global_step": 161773, "epoch": 3851} {"train_loss": -6.957501411437988, "global_step": 161774, "epoch": 3851} {"train_loss": -6.886929035186768, "global_step": 161775, "epoch": 3851} {"train_loss": -6.925877094268799, "global_step": 161776, "epoch": 3851} {"train_loss": -6.996297836303711, "global_step": 161777, "epoch": 3851} {"train_loss": -6.88179874420166, "global_step": 161778, "epoch": 3851} {"train_loss": -6.804356575012207, "global_step": 161779, "epoch": 3851} {"train_loss": -6.8442840576171875, "global_step": 161780, "epoch": 3851} {"train_loss": -6.8165483474731445, "global_step": 161781, "epoch": 3851} {"train_loss": -6.870648384094238, "global_step": 161782, "epoch": 3851} {"train_loss": -6.915502650397165, "global_step": 161783, "epoch": 3851, "val_loss": 68704.640625} {"train_loss": -6.803441047668457, "global_step": 161784, "epoch": 3852} {"train_loss": -6.937469005584717, "global_step": 161785, "epoch": 3852} {"train_loss": -6.959071159362793, "global_step": 161786, "epoch": 3852} {"train_loss": -6.912507057189941, "global_step": 161787, "epoch": 3852} {"train_loss": -6.936395168304443, "global_step": 161788, "epoch": 3852} {"train_loss": -6.841472625732422, "global_step": 161789, "epoch": 3852} {"train_loss": -6.930400848388672, "global_step": 161790, "epoch": 3852} {"train_loss": -6.840630054473877, "global_step": 161791, "epoch": 3852} {"train_loss": -6.901761531829834, "global_step": 161792, "epoch": 3852} {"train_loss": -6.837493896484375, "global_step": 161793, "epoch": 3852} {"train_loss": -7.017393112182617, "global_step": 161794, "epoch": 3852} {"train_loss": -6.965567111968994, "global_step": 161795, "epoch": 3852} {"train_loss": -6.7720208168029785, "global_step": 161796, "epoch": 3852} {"train_loss": -6.835992336273193, "global_step": 161797, "epoch": 3852} {"train_loss": -6.860011100769043, "global_step": 161798, "epoch": 3852} {"train_loss": -6.885376930236816, "global_step": 161799, "epoch": 3852} {"train_loss": -6.910789966583252, "global_step": 161800, "epoch": 3852} {"train_loss": -7.01865291595459, "global_step": 161801, "epoch": 3852} {"train_loss": -6.935135841369629, "global_step": 161802, "epoch": 3852} {"train_loss": -6.847050666809082, "global_step": 161803, "epoch": 3852} {"train_loss": -6.907297134399414, "global_step": 161804, "epoch": 3852} {"train_loss": -6.978113174438477, "global_step": 161805, "epoch": 3852} {"train_loss": -6.816577911376953, "global_step": 161806, "epoch": 3852} {"train_loss": -6.904643535614014, "global_step": 161807, "epoch": 3852} {"train_loss": -6.8431925773620605, "global_step": 161808, "epoch": 3852} {"train_loss": -6.876847743988037, "global_step": 161809, "epoch": 3852} {"train_loss": -6.917903423309326, "global_step": 161810, "epoch": 3852} {"train_loss": -6.893723487854004, "global_step": 161811, "epoch": 3852} {"train_loss": -6.916672706604004, "global_step": 161812, "epoch": 3852} {"train_loss": -6.989248275756836, "global_step": 161813, "epoch": 3852} {"train_loss": -6.993335247039795, "global_step": 161814, "epoch": 3852} {"train_loss": -6.888790130615234, "global_step": 161815, "epoch": 3852} {"train_loss": -6.879281997680664, "global_step": 161816, "epoch": 3852} {"train_loss": -6.934542655944824, "global_step": 161817, "epoch": 3852} {"train_loss": -6.981616973876953, "global_step": 161818, "epoch": 3852} {"train_loss": -7.059983730316162, "global_step": 161819, "epoch": 3852} {"train_loss": -6.938052654266357, "global_step": 161820, "epoch": 3852} {"train_loss": -6.807311534881592, "global_step": 161821, "epoch": 3852} {"train_loss": -7.016332149505615, "global_step": 161822, "epoch": 3852} {"train_loss": -6.947088241577148, "global_step": 161823, "epoch": 3852} {"train_loss": -6.8127007484436035, "global_step": 161824, "epoch": 3852} {"train_loss": -6.907536007109142, "global_step": 161825, "epoch": 3852, "val_loss": 68376.609375} {"train_loss": -6.937347412109375, "global_step": 161826, "epoch": 3853} {"train_loss": -6.837306022644043, "global_step": 161827, "epoch": 3853} {"train_loss": -6.916841506958008, "global_step": 161828, "epoch": 3853} {"train_loss": -6.999079704284668, "global_step": 161829, "epoch": 3853} {"train_loss": -7.024567604064941, "global_step": 161830, "epoch": 3853} {"train_loss": -6.964118957519531, "global_step": 161831, "epoch": 3853} {"train_loss": -6.949466705322266, "global_step": 161832, "epoch": 3853} {"train_loss": -6.903652667999268, "global_step": 161833, "epoch": 3853} {"train_loss": -6.849762916564941, "global_step": 161834, "epoch": 3853} {"train_loss": -6.874667167663574, "global_step": 161835, "epoch": 3853} {"train_loss": -6.826434135437012, "global_step": 161836, "epoch": 3853} {"train_loss": -6.941385269165039, "global_step": 161837, "epoch": 3853} {"train_loss": -6.820232391357422, "global_step": 161838, "epoch": 3853} {"train_loss": -6.763640403747559, "global_step": 161839, "epoch": 3853} {"train_loss": -7.036767959594727, "global_step": 161840, "epoch": 3853} {"train_loss": -6.970792770385742, "global_step": 161841, "epoch": 3853} {"train_loss": -6.820556640625, "global_step": 161842, "epoch": 3853} {"train_loss": -6.89469051361084, "global_step": 161843, "epoch": 3853} {"train_loss": -6.915290832519531, "global_step": 161844, "epoch": 3853} {"train_loss": -6.826241493225098, "global_step": 161845, "epoch": 3853} {"train_loss": -6.908069133758545, "global_step": 161846, "epoch": 3853} {"train_loss": -6.895502090454102, "global_step": 161847, "epoch": 3853} {"train_loss": -6.857151985168457, "global_step": 161848, "epoch": 3853} {"train_loss": -6.956864833831787, "global_step": 161849, "epoch": 3853} {"train_loss": -6.873405933380127, "global_step": 161850, "epoch": 3853} {"train_loss": -6.903828144073486, "global_step": 161851, "epoch": 3853} {"train_loss": -7.002692222595215, "global_step": 161852, "epoch": 3853} {"train_loss": -6.868247032165527, "global_step": 161853, "epoch": 3853} {"train_loss": -6.772505760192871, "global_step": 161854, "epoch": 3853} {"train_loss": -6.8753814697265625, "global_step": 161855, "epoch": 3853} {"train_loss": -6.83936882019043, "global_step": 161856, "epoch": 3853} {"train_loss": -6.773219108581543, "global_step": 161857, "epoch": 3853} {"train_loss": -6.889002323150635, "global_step": 161858, "epoch": 3853} {"train_loss": -6.800163269042969, "global_step": 161859, "epoch": 3853} {"train_loss": -6.848272323608398, "global_step": 161860, "epoch": 3853} {"train_loss": -6.91827917098999, "global_step": 161861, "epoch": 3853} {"train_loss": -6.869659423828125, "global_step": 161862, "epoch": 3853} {"train_loss": -6.81771183013916, "global_step": 161863, "epoch": 3853} {"train_loss": -6.880409240722656, "global_step": 161864, "epoch": 3853} {"train_loss": -6.946146011352539, "global_step": 161865, "epoch": 3853} {"train_loss": -6.844967842102051, "global_step": 161866, "epoch": 3853} {"train_loss": -6.886143843332927, "global_step": 161867, "epoch": 3853, "val_loss": 68385.9140625} {"train_loss": -6.881435871124268, "global_step": 161868, "epoch": 3854} {"train_loss": -6.927224159240723, "global_step": 161869, "epoch": 3854} {"train_loss": -6.889670372009277, "global_step": 161870, "epoch": 3854} {"train_loss": -6.9281415939331055, "global_step": 161871, "epoch": 3854} {"train_loss": -6.903948783874512, "global_step": 161872, "epoch": 3854} {"train_loss": -6.882573127746582, "global_step": 161873, "epoch": 3854} {"train_loss": -6.836801528930664, "global_step": 161874, "epoch": 3854} {"train_loss": -6.853869438171387, "global_step": 161875, "epoch": 3854} {"train_loss": -6.913532257080078, "global_step": 161876, "epoch": 3854} {"train_loss": -6.939945220947266, "global_step": 161877, "epoch": 3854} {"train_loss": -6.9370198249816895, "global_step": 161878, "epoch": 3854} {"train_loss": -6.862698078155518, "global_step": 161879, "epoch": 3854} {"train_loss": -6.9423322677612305, "global_step": 161880, "epoch": 3854} {"train_loss": -6.6637983322143555, "global_step": 161881, "epoch": 3854} {"train_loss": -6.94340705871582, "global_step": 161882, "epoch": 3854} {"train_loss": -6.8446221351623535, "global_step": 161883, "epoch": 3854} {"train_loss": -6.727234840393066, "global_step": 161884, "epoch": 3854} {"train_loss": -6.821100234985352, "global_step": 161885, "epoch": 3854} {"train_loss": -6.8717041015625, "global_step": 161886, "epoch": 3854} {"train_loss": -6.9604339599609375, "global_step": 161887, "epoch": 3854} {"train_loss": -6.775908946990967, "global_step": 161888, "epoch": 3854} {"train_loss": -6.822116851806641, "global_step": 161889, "epoch": 3854} {"train_loss": -6.830007553100586, "global_step": 161890, "epoch": 3854} {"train_loss": -6.806863307952881, "global_step": 161891, "epoch": 3854} {"train_loss": -6.858033180236816, "global_step": 161892, "epoch": 3854} {"train_loss": -6.8996171951293945, "global_step": 161893, "epoch": 3854} {"train_loss": -6.77225923538208, "global_step": 161894, "epoch": 3854} {"train_loss": -6.851866722106934, "global_step": 161895, "epoch": 3854} {"train_loss": -6.886636257171631, "global_step": 161896, "epoch": 3854} {"train_loss": -6.841073513031006, "global_step": 161897, "epoch": 3854} {"train_loss": -6.909924507141113, "global_step": 161898, "epoch": 3854} {"train_loss": -6.7602691650390625, "global_step": 161899, "epoch": 3854} {"train_loss": -6.766592025756836, "global_step": 161900, "epoch": 3854} {"train_loss": -6.758386135101318, "global_step": 161901, "epoch": 3854} {"train_loss": -6.878291606903076, "global_step": 161902, "epoch": 3854} {"train_loss": -6.877414703369141, "global_step": 161903, "epoch": 3854} {"train_loss": -7.009099960327148, "global_step": 161904, "epoch": 3854} {"train_loss": -6.775910377502441, "global_step": 161905, "epoch": 3854} {"train_loss": -6.927704811096191, "global_step": 161906, "epoch": 3854} {"train_loss": -6.848726749420166, "global_step": 161907, "epoch": 3854} {"train_loss": -6.940639019012451, "global_step": 161908, "epoch": 3854} {"train_loss": -6.8637060551416305, "global_step": 161909, "epoch": 3854, "val_loss": 68661.5390625} {"train_loss": -6.845672607421875, "global_step": 161910, "epoch": 3855} {"train_loss": -7.033023834228516, "global_step": 161911, "epoch": 3855} {"train_loss": -6.930140495300293, "global_step": 161912, "epoch": 3855} {"train_loss": -6.940008640289307, "global_step": 161913, "epoch": 3855} {"train_loss": -6.8763532638549805, "global_step": 161914, "epoch": 3855} {"train_loss": -6.862498760223389, "global_step": 161915, "epoch": 3855} {"train_loss": -6.895633697509766, "global_step": 161916, "epoch": 3855} {"train_loss": -6.9694108963012695, "global_step": 161917, "epoch": 3855} {"train_loss": -6.983222961425781, "global_step": 161918, "epoch": 3855} {"train_loss": -6.831364154815674, "global_step": 161919, "epoch": 3855} {"train_loss": -6.92266845703125, "global_step": 161920, "epoch": 3855} {"train_loss": -6.906625747680664, "global_step": 161921, "epoch": 3855} {"train_loss": -6.946508407592773, "global_step": 161922, "epoch": 3855} {"train_loss": -6.8593549728393555, "global_step": 161923, "epoch": 3855} {"train_loss": -6.956385612487793, "global_step": 161924, "epoch": 3855} {"train_loss": -7.02069091796875, "global_step": 161925, "epoch": 3855} {"train_loss": -7.050215721130371, "global_step": 161926, "epoch": 3855} {"train_loss": -6.834881782531738, "global_step": 161927, "epoch": 3855} {"train_loss": -6.93018913269043, "global_step": 161928, "epoch": 3855} {"train_loss": -6.892485618591309, "global_step": 161929, "epoch": 3855} {"train_loss": -6.955849647521973, "global_step": 161930, "epoch": 3855} {"train_loss": -6.913814544677734, "global_step": 161931, "epoch": 3855} {"train_loss": -6.9050726890563965, "global_step": 161932, "epoch": 3855} {"train_loss": -6.893969535827637, "global_step": 161933, "epoch": 3855} {"train_loss": -7.000916957855225, "global_step": 161934, "epoch": 3855} {"train_loss": -6.988439559936523, "global_step": 161935, "epoch": 3855} {"train_loss": -7.067116737365723, "global_step": 161936, "epoch": 3855} {"train_loss": -6.959840774536133, "global_step": 161937, "epoch": 3855} {"train_loss": -6.874205112457275, "global_step": 161938, "epoch": 3855} {"train_loss": -7.03407096862793, "global_step": 161939, "epoch": 3855} {"train_loss": -6.890872955322266, "global_step": 161940, "epoch": 3855} {"train_loss": -6.990239143371582, "global_step": 161941, "epoch": 3855} {"train_loss": -6.980717658996582, "global_step": 161942, "epoch": 3855} {"train_loss": -6.971244812011719, "global_step": 161943, "epoch": 3855} {"train_loss": -6.906008720397949, "global_step": 161944, "epoch": 3855} {"train_loss": -7.054690361022949, "global_step": 161945, "epoch": 3855} {"train_loss": -6.883942604064941, "global_step": 161946, "epoch": 3855} {"train_loss": -6.892719268798828, "global_step": 161947, "epoch": 3855} {"train_loss": -6.868515968322754, "global_step": 161948, "epoch": 3855} {"train_loss": -6.938539981842041, "global_step": 161949, "epoch": 3855} {"train_loss": -6.995119094848633, "global_step": 161950, "epoch": 3855} {"train_loss": -6.935362055188134, "global_step": 161951, "epoch": 3855, "val_loss": 68809.4921875} {"train_loss": -6.897067546844482, "global_step": 161952, "epoch": 3856} {"train_loss": -6.90023136138916, "global_step": 161953, "epoch": 3856} {"train_loss": -6.851014137268066, "global_step": 161954, "epoch": 3856} {"train_loss": -7.025765419006348, "global_step": 161955, "epoch": 3856} {"train_loss": -6.9691901206970215, "global_step": 161956, "epoch": 3856} {"train_loss": -6.906037330627441, "global_step": 161957, "epoch": 3856} {"train_loss": -6.9347920417785645, "global_step": 161958, "epoch": 3856} {"train_loss": -6.834987163543701, "global_step": 161959, "epoch": 3856} {"train_loss": -6.902644157409668, "global_step": 161960, "epoch": 3856} {"train_loss": -7.036048889160156, "global_step": 161961, "epoch": 3856} {"train_loss": -6.816098213195801, "global_step": 161962, "epoch": 3856} {"train_loss": -6.954633712768555, "global_step": 161963, "epoch": 3856} {"train_loss": -6.966872215270996, "global_step": 161964, "epoch": 3856} {"train_loss": -6.835731029510498, "global_step": 161965, "epoch": 3856} {"train_loss": -6.874177932739258, "global_step": 161966, "epoch": 3856} {"train_loss": -6.827207565307617, "global_step": 161967, "epoch": 3856} {"train_loss": -6.829875946044922, "global_step": 161968, "epoch": 3856} {"train_loss": -6.752924919128418, "global_step": 161969, "epoch": 3856} {"train_loss": -6.850759506225586, "global_step": 161970, "epoch": 3856} {"train_loss": -6.674333572387695, "global_step": 161971, "epoch": 3856} {"train_loss": -6.872564315795898, "global_step": 161972, "epoch": 3856} {"train_loss": -6.74818229675293, "global_step": 161973, "epoch": 3856} {"train_loss": -6.82070255279541, "global_step": 161974, "epoch": 3856} {"train_loss": -6.69352912902832, "global_step": 161975, "epoch": 3856} {"train_loss": -6.690690994262695, "global_step": 161976, "epoch": 3856} {"train_loss": -6.679614543914795, "global_step": 161977, "epoch": 3856} {"train_loss": -6.816277503967285, "global_step": 161978, "epoch": 3856} {"train_loss": -6.671368598937988, "global_step": 161979, "epoch": 3856} {"train_loss": -6.6651434898376465, "global_step": 161980, "epoch": 3856} {"train_loss": -6.755627155303955, "global_step": 161981, "epoch": 3856} {"train_loss": -6.789765357971191, "global_step": 161982, "epoch": 3856} {"train_loss": -6.685206413269043, "global_step": 161983, "epoch": 3856} {"train_loss": -6.843894004821777, "global_step": 161984, "epoch": 3856} {"train_loss": -6.756106376647949, "global_step": 161985, "epoch": 3856} {"train_loss": -6.7863664627075195, "global_step": 161986, "epoch": 3856} {"train_loss": -6.772373199462891, "global_step": 161987, "epoch": 3856} {"train_loss": -6.800175666809082, "global_step": 161988, "epoch": 3856} {"train_loss": -6.775796890258789, "global_step": 161989, "epoch": 3856} {"train_loss": -6.748384475708008, "global_step": 161990, "epoch": 3856} {"train_loss": -6.790994644165039, "global_step": 161991, "epoch": 3856} {"train_loss": -6.84720516204834, "global_step": 161992, "epoch": 3856} {"train_loss": -6.820835465476627, "global_step": 161993, "epoch": 3856, "val_loss": 68615.3359375} {"train_loss": -6.756035804748535, "global_step": 161994, "epoch": 3857} {"train_loss": -6.748327255249023, "global_step": 161995, "epoch": 3857} {"train_loss": -6.951407432556152, "global_step": 161996, "epoch": 3857} {"train_loss": -6.881331443786621, "global_step": 161997, "epoch": 3857} {"train_loss": -6.827880859375, "global_step": 161998, "epoch": 3857} {"train_loss": -6.866601943969727, "global_step": 161999, "epoch": 3857} {"train_loss": -7.070500373840332, "global_step": 162000, "epoch": 3857} {"train_loss": -6.897372245788574, "global_step": 162001, "epoch": 3857} {"train_loss": -6.932822227478027, "global_step": 162002, "epoch": 3857} {"train_loss": -6.776462554931641, "global_step": 162003, "epoch": 3857} {"train_loss": -6.630616664886475, "global_step": 162004, "epoch": 3857} {"train_loss": -7.011773109436035, "global_step": 162005, "epoch": 3857} {"train_loss": -6.768045902252197, "global_step": 162006, "epoch": 3857} {"train_loss": -6.787794589996338, "global_step": 162007, "epoch": 3857} {"train_loss": -6.924398899078369, "global_step": 162008, "epoch": 3857} {"train_loss": -6.755276679992676, "global_step": 162009, "epoch": 3857} {"train_loss": -6.89970588684082, "global_step": 162010, "epoch": 3857} {"train_loss": -6.748312473297119, "global_step": 162011, "epoch": 3857} {"train_loss": -6.7720537185668945, "global_step": 162012, "epoch": 3857} {"train_loss": -6.966718673706055, "global_step": 162013, "epoch": 3857} {"train_loss": -6.7962846755981445, "global_step": 162014, "epoch": 3857} {"train_loss": -6.85983943939209, "global_step": 162015, "epoch": 3857} {"train_loss": -6.939963340759277, "global_step": 162016, "epoch": 3857} {"train_loss": -6.778701305389404, "global_step": 162017, "epoch": 3857} {"train_loss": -6.752926826477051, "global_step": 162018, "epoch": 3857} {"train_loss": -6.671979904174805, "global_step": 162019, "epoch": 3857} {"train_loss": -6.870439052581787, "global_step": 162020, "epoch": 3857} {"train_loss": -6.638287544250488, "global_step": 162021, "epoch": 3857} {"train_loss": -6.79282283782959, "global_step": 162022, "epoch": 3857} {"train_loss": -6.772589683532715, "global_step": 162023, "epoch": 3857} {"train_loss": -6.729056358337402, "global_step": 162024, "epoch": 3857} {"train_loss": -6.808932304382324, "global_step": 162025, "epoch": 3857} {"train_loss": -6.756990432739258, "global_step": 162026, "epoch": 3857} {"train_loss": -6.889187335968018, "global_step": 162027, "epoch": 3857} {"train_loss": -6.691761016845703, "global_step": 162028, "epoch": 3857} {"train_loss": -6.747517108917236, "global_step": 162029, "epoch": 3857} {"train_loss": -6.774383544921875, "global_step": 162030, "epoch": 3857} {"train_loss": -6.787883758544922, "global_step": 162031, "epoch": 3857} {"train_loss": -6.781167030334473, "global_step": 162032, "epoch": 3857} {"train_loss": -6.795238018035889, "global_step": 162033, "epoch": 3857} {"train_loss": -6.877676963806152, "global_step": 162034, "epoch": 3857} {"train_loss": -6.820801564625332, "global_step": 162035, "epoch": 3857, "val_loss": 68730.53125} {"train_loss": -6.848783493041992, "global_step": 162036, "epoch": 3858} {"train_loss": -6.889876365661621, "global_step": 162037, "epoch": 3858} {"train_loss": -6.919979095458984, "global_step": 162038, "epoch": 3858} {"train_loss": -7.005752086639404, "global_step": 162039, "epoch": 3858} {"train_loss": -6.92576789855957, "global_step": 162040, "epoch": 3858} {"train_loss": -6.887033462524414, "global_step": 162041, "epoch": 3858} {"train_loss": -6.87204647064209, "global_step": 162042, "epoch": 3858} {"train_loss": -6.845311164855957, "global_step": 162043, "epoch": 3858} {"train_loss": -6.914540767669678, "global_step": 162044, "epoch": 3858} {"train_loss": -6.966614723205566, "global_step": 162045, "epoch": 3858} {"train_loss": -6.901593208312988, "global_step": 162046, "epoch": 3858} {"train_loss": -6.917584419250488, "global_step": 162047, "epoch": 3858} {"train_loss": -6.874303340911865, "global_step": 162048, "epoch": 3858} {"train_loss": -6.926398277282715, "global_step": 162049, "epoch": 3858} {"train_loss": -6.889099597930908, "global_step": 162050, "epoch": 3858} {"train_loss": -6.8819899559021, "global_step": 162051, "epoch": 3858} {"train_loss": -6.904767036437988, "global_step": 162052, "epoch": 3858} {"train_loss": -6.735506057739258, "global_step": 162053, "epoch": 3858} {"train_loss": -6.863783359527588, "global_step": 162054, "epoch": 3858} {"train_loss": -6.756067752838135, "global_step": 162055, "epoch": 3858} {"train_loss": -6.813732624053955, "global_step": 162056, "epoch": 3858} {"train_loss": -6.902895450592041, "global_step": 162057, "epoch": 3858} {"train_loss": -6.9205827713012695, "global_step": 162058, "epoch": 3858} {"train_loss": -6.951026916503906, "global_step": 162059, "epoch": 3858} {"train_loss": -6.931070327758789, "global_step": 162060, "epoch": 3858} {"train_loss": -6.9192214012146, "global_step": 162061, "epoch": 3858} {"train_loss": -6.93519926071167, "global_step": 162062, "epoch": 3858} {"train_loss": -7.0029754638671875, "global_step": 162063, "epoch": 3858} {"train_loss": -6.906957626342773, "global_step": 162064, "epoch": 3858} {"train_loss": -6.979640960693359, "global_step": 162065, "epoch": 3858} {"train_loss": -7.0362324714660645, "global_step": 162066, "epoch": 3858} {"train_loss": -6.917208194732666, "global_step": 162067, "epoch": 3858} {"train_loss": -6.889252662658691, "global_step": 162068, "epoch": 3858} {"train_loss": -6.809387683868408, "global_step": 162069, "epoch": 3858} {"train_loss": -6.917995452880859, "global_step": 162070, "epoch": 3858} {"train_loss": -6.9523820877075195, "global_step": 162071, "epoch": 3858} {"train_loss": -6.919387340545654, "global_step": 162072, "epoch": 3858} {"train_loss": -6.96306037902832, "global_step": 162073, "epoch": 3858} {"train_loss": -6.964037895202637, "global_step": 162074, "epoch": 3858} {"train_loss": -6.98179292678833, "global_step": 162075, "epoch": 3858} {"train_loss": -6.941527843475342, "global_step": 162076, "epoch": 3858} {"train_loss": -6.90919245992388, "global_step": 162077, "epoch": 3858, "val_loss": 68643.015625} {"train_loss": -6.889540672302246, "global_step": 162078, "epoch": 3859} {"train_loss": -6.967110633850098, "global_step": 162079, "epoch": 3859} {"train_loss": -7.087744235992432, "global_step": 162080, "epoch": 3859} {"train_loss": -7.014598369598389, "global_step": 162081, "epoch": 3859} {"train_loss": -6.871781349182129, "global_step": 162082, "epoch": 3859} {"train_loss": -7.0095415115356445, "global_step": 162083, "epoch": 3859} {"train_loss": -6.8907246589660645, "global_step": 162084, "epoch": 3859} {"train_loss": -6.851291656494141, "global_step": 162085, "epoch": 3859} {"train_loss": -6.950202941894531, "global_step": 162086, "epoch": 3859} {"train_loss": -6.992125511169434, "global_step": 162087, "epoch": 3859} {"train_loss": -6.827835559844971, "global_step": 162088, "epoch": 3859} {"train_loss": -7.0103607177734375, "global_step": 162089, "epoch": 3859} {"train_loss": -7.013051986694336, "global_step": 162090, "epoch": 3859} {"train_loss": -6.848280429840088, "global_step": 162091, "epoch": 3859} {"train_loss": -7.025215148925781, "global_step": 162092, "epoch": 3859} {"train_loss": -6.896912574768066, "global_step": 162093, "epoch": 3859} {"train_loss": -6.880303382873535, "global_step": 162094, "epoch": 3859} {"train_loss": -6.895127773284912, "global_step": 162095, "epoch": 3859} {"train_loss": -6.909961700439453, "global_step": 162096, "epoch": 3859} {"train_loss": -6.963037014007568, "global_step": 162097, "epoch": 3859} {"train_loss": -6.909346580505371, "global_step": 162098, "epoch": 3859} {"train_loss": -6.908557415008545, "global_step": 162099, "epoch": 3859} {"train_loss": -6.918245792388916, "global_step": 162100, "epoch": 3859} {"train_loss": -6.964984893798828, "global_step": 162101, "epoch": 3859} {"train_loss": -6.885058879852295, "global_step": 162102, "epoch": 3859} {"train_loss": -6.9378252029418945, "global_step": 162103, "epoch": 3859} {"train_loss": -6.995519638061523, "global_step": 162104, "epoch": 3859} {"train_loss": -6.864678382873535, "global_step": 162105, "epoch": 3859} {"train_loss": -6.889710426330566, "global_step": 162106, "epoch": 3859} {"train_loss": -6.8480119705200195, "global_step": 162107, "epoch": 3859} {"train_loss": -6.909270763397217, "global_step": 162108, "epoch": 3859} {"train_loss": -7.0303497314453125, "global_step": 162109, "epoch": 3859} {"train_loss": -6.884335041046143, "global_step": 162110, "epoch": 3859} {"train_loss": -6.995473384857178, "global_step": 162111, "epoch": 3859} {"train_loss": -6.859777450561523, "global_step": 162112, "epoch": 3859} {"train_loss": -6.859212398529053, "global_step": 162113, "epoch": 3859} {"train_loss": -6.866110801696777, "global_step": 162114, "epoch": 3859} {"train_loss": -6.793927192687988, "global_step": 162115, "epoch": 3859} {"train_loss": -6.914634704589844, "global_step": 162116, "epoch": 3859} {"train_loss": -6.8434553146362305, "global_step": 162117, "epoch": 3859} {"train_loss": -6.826726913452148, "global_step": 162118, "epoch": 3859} {"train_loss": -6.917598065875826, "global_step": 162119, "epoch": 3859, "val_loss": 68717.53125} {"train_loss": -6.90598201751709, "global_step": 162120, "epoch": 3860} {"train_loss": -6.87274694442749, "global_step": 162121, "epoch": 3860} {"train_loss": -6.844020843505859, "global_step": 162122, "epoch": 3860} {"train_loss": -6.808779239654541, "global_step": 162123, "epoch": 3860} {"train_loss": -6.9077653884887695, "global_step": 162124, "epoch": 3860} {"train_loss": -6.7480244636535645, "global_step": 162125, "epoch": 3860} {"train_loss": -6.9905195236206055, "global_step": 162126, "epoch": 3860} {"train_loss": -6.985485553741455, "global_step": 162127, "epoch": 3860} {"train_loss": -6.739410400390625, "global_step": 162128, "epoch": 3860} {"train_loss": -6.874344825744629, "global_step": 162129, "epoch": 3860} {"train_loss": -6.836540222167969, "global_step": 162130, "epoch": 3860} {"train_loss": -6.8050923347473145, "global_step": 162131, "epoch": 3860} {"train_loss": -6.832392692565918, "global_step": 162132, "epoch": 3860} {"train_loss": -6.8029255867004395, "global_step": 162133, "epoch": 3860} {"train_loss": -6.859187126159668, "global_step": 162134, "epoch": 3860} {"train_loss": -6.928520202636719, "global_step": 162135, "epoch": 3860} {"train_loss": -6.852256774902344, "global_step": 162136, "epoch": 3860} {"train_loss": -6.711424827575684, "global_step": 162137, "epoch": 3860} {"train_loss": -6.885622978210449, "global_step": 162138, "epoch": 3860} {"train_loss": -6.787772178649902, "global_step": 162139, "epoch": 3860} {"train_loss": -6.771303176879883, "global_step": 162140, "epoch": 3860} {"train_loss": -6.870972156524658, "global_step": 162141, "epoch": 3860} {"train_loss": -6.798059463500977, "global_step": 162142, "epoch": 3860} {"train_loss": -6.930558204650879, "global_step": 162143, "epoch": 3860} {"train_loss": -6.9425811767578125, "global_step": 162144, "epoch": 3860} {"train_loss": -6.846221446990967, "global_step": 162145, "epoch": 3860} {"train_loss": -6.9048967361450195, "global_step": 162146, "epoch": 3860} {"train_loss": -6.785149574279785, "global_step": 162147, "epoch": 3860} {"train_loss": -6.965738296508789, "global_step": 162148, "epoch": 3860} {"train_loss": -6.9117889404296875, "global_step": 162149, "epoch": 3860} {"train_loss": -6.897341728210449, "global_step": 162150, "epoch": 3860} {"train_loss": -6.968986511230469, "global_step": 162151, "epoch": 3860} {"train_loss": -6.969085693359375, "global_step": 162152, "epoch": 3860} {"train_loss": -6.868551254272461, "global_step": 162153, "epoch": 3860} {"train_loss": -6.916347503662109, "global_step": 162154, "epoch": 3860} {"train_loss": -6.855501174926758, "global_step": 162155, "epoch": 3860} {"train_loss": -6.927617073059082, "global_step": 162156, "epoch": 3860} {"train_loss": -6.820637226104736, "global_step": 162157, "epoch": 3860} {"train_loss": -6.7998456954956055, "global_step": 162158, "epoch": 3860} {"train_loss": -6.930545806884766, "global_step": 162159, "epoch": 3860} {"train_loss": -6.911595344543457, "global_step": 162160, "epoch": 3860} {"train_loss": -6.869635570616949, "global_step": 162161, "epoch": 3860, "val_loss": 68535.15625} {"train_loss": -6.84019136428833, "global_step": 162162, "epoch": 3861} {"train_loss": -6.825399875640869, "global_step": 162163, "epoch": 3861} {"train_loss": -6.9733123779296875, "global_step": 162164, "epoch": 3861} {"train_loss": -6.8720831871032715, "global_step": 162165, "epoch": 3861} {"train_loss": -6.960082054138184, "global_step": 162166, "epoch": 3861} {"train_loss": -6.910179138183594, "global_step": 162167, "epoch": 3861} {"train_loss": -6.874918460845947, "global_step": 162168, "epoch": 3861} {"train_loss": -6.866368293762207, "global_step": 162169, "epoch": 3861} {"train_loss": -6.919454574584961, "global_step": 162170, "epoch": 3861} {"train_loss": -6.816551685333252, "global_step": 162171, "epoch": 3861} {"train_loss": -6.828383445739746, "global_step": 162172, "epoch": 3861} {"train_loss": -6.8737077713012695, "global_step": 162173, "epoch": 3861} {"train_loss": -6.806492805480957, "global_step": 162174, "epoch": 3861} {"train_loss": -6.914484977722168, "global_step": 162175, "epoch": 3861} {"train_loss": -6.847057342529297, "global_step": 162176, "epoch": 3861} {"train_loss": -6.948525428771973, "global_step": 162177, "epoch": 3861} {"train_loss": -6.870031833648682, "global_step": 162178, "epoch": 3861} {"train_loss": -6.907496452331543, "global_step": 162179, "epoch": 3861} {"train_loss": -6.961024284362793, "global_step": 162180, "epoch": 3861} {"train_loss": -6.874161243438721, "global_step": 162181, "epoch": 3861} {"train_loss": -6.979529857635498, "global_step": 162182, "epoch": 3861} {"train_loss": -6.93389892578125, "global_step": 162183, "epoch": 3861} {"train_loss": -6.918867111206055, "global_step": 162184, "epoch": 3861} {"train_loss": -6.91980504989624, "global_step": 162185, "epoch": 3861} {"train_loss": -6.8446221351623535, "global_step": 162186, "epoch": 3861} {"train_loss": -6.877486228942871, "global_step": 162187, "epoch": 3861} {"train_loss": -6.936375141143799, "global_step": 162188, "epoch": 3861} {"train_loss": -6.779243469238281, "global_step": 162189, "epoch": 3861} {"train_loss": -6.812399864196777, "global_step": 162190, "epoch": 3861} {"train_loss": -6.881555557250977, "global_step": 162191, "epoch": 3861} {"train_loss": -6.945284366607666, "global_step": 162192, "epoch": 3861} {"train_loss": -6.86949348449707, "global_step": 162193, "epoch": 3861} {"train_loss": -6.978017330169678, "global_step": 162194, "epoch": 3861} {"train_loss": -6.933794021606445, "global_step": 162195, "epoch": 3861} {"train_loss": -6.919064521789551, "global_step": 162196, "epoch": 3861} {"train_loss": -6.908070087432861, "global_step": 162197, "epoch": 3861} {"train_loss": -6.854121208190918, "global_step": 162198, "epoch": 3861} {"train_loss": -6.923501968383789, "global_step": 162199, "epoch": 3861} {"train_loss": -6.908695697784424, "global_step": 162200, "epoch": 3861} {"train_loss": -6.765206336975098, "global_step": 162201, "epoch": 3861} {"train_loss": -6.967504978179932, "global_step": 162202, "epoch": 3861} {"train_loss": -6.887991053717477, "global_step": 162203, "epoch": 3861, "val_loss": 68682.0078125} {"train_loss": -6.98779821395874, "global_step": 162204, "epoch": 3862} {"train_loss": -6.859179496765137, "global_step": 162205, "epoch": 3862} {"train_loss": -6.9688215255737305, "global_step": 162206, "epoch": 3862} {"train_loss": -6.960689544677734, "global_step": 162207, "epoch": 3862} {"train_loss": -6.888875484466553, "global_step": 162208, "epoch": 3862} {"train_loss": -6.860456466674805, "global_step": 162209, "epoch": 3862} {"train_loss": -6.871788024902344, "global_step": 162210, "epoch": 3862} {"train_loss": -6.996767520904541, "global_step": 162211, "epoch": 3862} {"train_loss": -6.930423736572266, "global_step": 162212, "epoch": 3862} {"train_loss": -6.826476097106934, "global_step": 162213, "epoch": 3862} {"train_loss": -6.963659763336182, "global_step": 162214, "epoch": 3862} {"train_loss": -6.9978814125061035, "global_step": 162215, "epoch": 3862} {"train_loss": -6.88505744934082, "global_step": 162216, "epoch": 3862} {"train_loss": -6.89879035949707, "global_step": 162217, "epoch": 3862} {"train_loss": -6.991556167602539, "global_step": 162218, "epoch": 3862} {"train_loss": -6.94975471496582, "global_step": 162219, "epoch": 3862} {"train_loss": -6.924497604370117, "global_step": 162220, "epoch": 3862} {"train_loss": -6.904923915863037, "global_step": 162221, "epoch": 3862} {"train_loss": -6.880169868469238, "global_step": 162222, "epoch": 3862} {"train_loss": -6.913058280944824, "global_step": 162223, "epoch": 3862} {"train_loss": -6.899704456329346, "global_step": 162224, "epoch": 3862} {"train_loss": -6.8811845779418945, "global_step": 162225, "epoch": 3862} {"train_loss": -7.030284881591797, "global_step": 162226, "epoch": 3862} {"train_loss": -6.965175628662109, "global_step": 162227, "epoch": 3862} {"train_loss": -6.960421562194824, "global_step": 162228, "epoch": 3862} {"train_loss": -7.027827739715576, "global_step": 162229, "epoch": 3862} {"train_loss": -6.952844619750977, "global_step": 162230, "epoch": 3862} {"train_loss": -6.911959648132324, "global_step": 162231, "epoch": 3862} {"train_loss": -6.966602325439453, "global_step": 162232, "epoch": 3862} {"train_loss": -7.161585807800293, "global_step": 162233, "epoch": 3862} {"train_loss": -7.028128623962402, "global_step": 162234, "epoch": 3862} {"train_loss": -6.922796249389648, "global_step": 162235, "epoch": 3862} {"train_loss": -6.947495460510254, "global_step": 162236, "epoch": 3862} {"train_loss": -6.892704486846924, "global_step": 162237, "epoch": 3862} {"train_loss": -6.91734504699707, "global_step": 162238, "epoch": 3862} {"train_loss": -6.991716384887695, "global_step": 162239, "epoch": 3862} {"train_loss": -6.816615581512451, "global_step": 162240, "epoch": 3862} {"train_loss": -6.81107234954834, "global_step": 162241, "epoch": 3862} {"train_loss": -6.845611095428467, "global_step": 162242, "epoch": 3862} {"train_loss": -6.8851776123046875, "global_step": 162243, "epoch": 3862} {"train_loss": -6.910069942474365, "global_step": 162244, "epoch": 3862} {"train_loss": -6.929599307832264, "global_step": 162245, "epoch": 3862, "val_loss": 68485.2109375} {"train_loss": -6.883213043212891, "global_step": 162246, "epoch": 3863} {"train_loss": -6.972631454467773, "global_step": 162247, "epoch": 3863} {"train_loss": -6.916436195373535, "global_step": 162248, "epoch": 3863} {"train_loss": -6.9531450271606445, "global_step": 162249, "epoch": 3863} {"train_loss": -6.97274112701416, "global_step": 162250, "epoch": 3863} {"train_loss": -7.010397434234619, "global_step": 162251, "epoch": 3863} {"train_loss": -6.860803127288818, "global_step": 162252, "epoch": 3863} {"train_loss": -7.027918815612793, "global_step": 162253, "epoch": 3863} {"train_loss": -6.851701736450195, "global_step": 162254, "epoch": 3863} {"train_loss": -6.913182258605957, "global_step": 162255, "epoch": 3863} {"train_loss": -6.919363975524902, "global_step": 162256, "epoch": 3863} {"train_loss": -6.855245113372803, "global_step": 162257, "epoch": 3863} {"train_loss": -6.95250129699707, "global_step": 162258, "epoch": 3863} {"train_loss": -6.945291042327881, "global_step": 162259, "epoch": 3863} {"train_loss": -6.905731201171875, "global_step": 162260, "epoch": 3863} {"train_loss": -6.914119720458984, "global_step": 162261, "epoch": 3863} {"train_loss": -6.953515529632568, "global_step": 162262, "epoch": 3863} {"train_loss": -6.980072975158691, "global_step": 162263, "epoch": 3863} {"train_loss": -6.967431545257568, "global_step": 162264, "epoch": 3863} {"train_loss": -6.916001319885254, "global_step": 162265, "epoch": 3863} {"train_loss": -7.012999534606934, "global_step": 162266, "epoch": 3863} {"train_loss": -6.836372375488281, "global_step": 162267, "epoch": 3863} {"train_loss": -6.838934898376465, "global_step": 162268, "epoch": 3863} {"train_loss": -6.9801812171936035, "global_step": 162269, "epoch": 3863} {"train_loss": -6.895113945007324, "global_step": 162270, "epoch": 3863} {"train_loss": -6.907910346984863, "global_step": 162271, "epoch": 3863} {"train_loss": -6.947247505187988, "global_step": 162272, "epoch": 3863} {"train_loss": -6.984421730041504, "global_step": 162273, "epoch": 3863} {"train_loss": -7.025123119354248, "global_step": 162274, "epoch": 3863} {"train_loss": -6.920253276824951, "global_step": 162275, "epoch": 3863} {"train_loss": -6.930868148803711, "global_step": 162276, "epoch": 3863} {"train_loss": -6.890920639038086, "global_step": 162277, "epoch": 3863} {"train_loss": -6.843832969665527, "global_step": 162278, "epoch": 3863} {"train_loss": -6.8321075439453125, "global_step": 162279, "epoch": 3863} {"train_loss": -6.975393295288086, "global_step": 162280, "epoch": 3863} {"train_loss": -7.02299690246582, "global_step": 162281, "epoch": 3863} {"train_loss": -6.830756664276123, "global_step": 162282, "epoch": 3863} {"train_loss": -6.806122779846191, "global_step": 162283, "epoch": 3863} {"train_loss": -7.010916709899902, "global_step": 162284, "epoch": 3863} {"train_loss": -6.9345197677612305, "global_step": 162285, "epoch": 3863} {"train_loss": -6.8137712478637695, "global_step": 162286, "epoch": 3863} {"train_loss": -6.9266010239010765, "global_step": 162287, "epoch": 3863, "val_loss": 68549.3515625} {"train_loss": -6.817248344421387, "global_step": 162288, "epoch": 3864} {"train_loss": -7.058856010437012, "global_step": 162289, "epoch": 3864} {"train_loss": -6.93095064163208, "global_step": 162290, "epoch": 3864} {"train_loss": -6.972468376159668, "global_step": 162291, "epoch": 3864} {"train_loss": -6.885830879211426, "global_step": 162292, "epoch": 3864} {"train_loss": -6.821122646331787, "global_step": 162293, "epoch": 3864} {"train_loss": -6.972803115844727, "global_step": 162294, "epoch": 3864} {"train_loss": -6.818479537963867, "global_step": 162295, "epoch": 3864} {"train_loss": -6.761083602905273, "global_step": 162296, "epoch": 3864} {"train_loss": -6.869828224182129, "global_step": 162297, "epoch": 3864} {"train_loss": -6.884637355804443, "global_step": 162298, "epoch": 3864} {"train_loss": -6.867877006530762, "global_step": 162299, "epoch": 3864} {"train_loss": -6.9637370109558105, "global_step": 162300, "epoch": 3864} {"train_loss": -6.864838123321533, "global_step": 162301, "epoch": 3864} {"train_loss": -6.9230241775512695, "global_step": 162302, "epoch": 3864} {"train_loss": -6.93769645690918, "global_step": 162303, "epoch": 3864} {"train_loss": -6.908658504486084, "global_step": 162304, "epoch": 3864} {"train_loss": -6.995429039001465, "global_step": 162305, "epoch": 3864} {"train_loss": -6.809858322143555, "global_step": 162306, "epoch": 3864} {"train_loss": -6.890089511871338, "global_step": 162307, "epoch": 3864} {"train_loss": -6.994192600250244, "global_step": 162308, "epoch": 3864} {"train_loss": -6.963906288146973, "global_step": 162309, "epoch": 3864} {"train_loss": -6.9243245124816895, "global_step": 162310, "epoch": 3864} {"train_loss": -6.805356025695801, "global_step": 162311, "epoch": 3864} {"train_loss": -6.921204566955566, "global_step": 162312, "epoch": 3864} {"train_loss": -6.92503547668457, "global_step": 162313, "epoch": 3864} {"train_loss": -6.9204182624816895, "global_step": 162314, "epoch": 3864} {"train_loss": -6.920693397521973, "global_step": 162315, "epoch": 3864} {"train_loss": -7.002773284912109, "global_step": 162316, "epoch": 3864} {"train_loss": -6.918548583984375, "global_step": 162317, "epoch": 3864} {"train_loss": -6.914698600769043, "global_step": 162318, "epoch": 3864} {"train_loss": -6.882289886474609, "global_step": 162319, "epoch": 3864} {"train_loss": -6.902663707733154, "global_step": 162320, "epoch": 3864} {"train_loss": -6.948230743408203, "global_step": 162321, "epoch": 3864} {"train_loss": -6.873222351074219, "global_step": 162322, "epoch": 3864} {"train_loss": -6.943058967590332, "global_step": 162323, "epoch": 3864} {"train_loss": -6.936773300170898, "global_step": 162324, "epoch": 3864} {"train_loss": -6.896713733673096, "global_step": 162325, "epoch": 3864} {"train_loss": -6.850979804992676, "global_step": 162326, "epoch": 3864} {"train_loss": -6.92302942276001, "global_step": 162327, "epoch": 3864} {"train_loss": -6.799312591552734, "global_step": 162328, "epoch": 3864} {"train_loss": -6.904465289342971, "global_step": 162329, "epoch": 3864, "val_loss": 68706.8984375} {"train_loss": -6.7448410987854, "global_step": 162330, "epoch": 3865} {"train_loss": -6.984009742736816, "global_step": 162331, "epoch": 3865} {"train_loss": -6.809460639953613, "global_step": 162332, "epoch": 3865} {"train_loss": -6.8641252517700195, "global_step": 162333, "epoch": 3865} {"train_loss": -6.902071475982666, "global_step": 162334, "epoch": 3865} {"train_loss": -6.858985900878906, "global_step": 162335, "epoch": 3865} {"train_loss": -6.939083576202393, "global_step": 162336, "epoch": 3865} {"train_loss": -6.8389105796813965, "global_step": 162337, "epoch": 3865} {"train_loss": -6.882781028747559, "global_step": 162338, "epoch": 3865} {"train_loss": -6.85157585144043, "global_step": 162339, "epoch": 3865} {"train_loss": -6.844649314880371, "global_step": 162340, "epoch": 3865} {"train_loss": -6.9227294921875, "global_step": 162341, "epoch": 3865} {"train_loss": -6.96372127532959, "global_step": 162342, "epoch": 3865} {"train_loss": -6.965088844299316, "global_step": 162343, "epoch": 3865} {"train_loss": -6.956452369689941, "global_step": 162344, "epoch": 3865} {"train_loss": -7.030830383300781, "global_step": 162345, "epoch": 3865} {"train_loss": -6.96529483795166, "global_step": 162346, "epoch": 3865} {"train_loss": -6.944460868835449, "global_step": 162347, "epoch": 3865} {"train_loss": -6.927152633666992, "global_step": 162348, "epoch": 3865} {"train_loss": -6.944019317626953, "global_step": 162349, "epoch": 3865} {"train_loss": -6.966370582580566, "global_step": 162350, "epoch": 3865} {"train_loss": -6.929973602294922, "global_step": 162351, "epoch": 3865} {"train_loss": -7.077872276306152, "global_step": 162352, "epoch": 3865} {"train_loss": -6.91627311706543, "global_step": 162353, "epoch": 3865} {"train_loss": -7.024733543395996, "global_step": 162354, "epoch": 3865} {"train_loss": -7.0271100997924805, "global_step": 162355, "epoch": 3865} {"train_loss": -7.0094709396362305, "global_step": 162356, "epoch": 3865} {"train_loss": -6.946148872375488, "global_step": 162357, "epoch": 3865} {"train_loss": -7.01158332824707, "global_step": 162358, "epoch": 3865} {"train_loss": -7.05632209777832, "global_step": 162359, "epoch": 3865} {"train_loss": -6.888938903808594, "global_step": 162360, "epoch": 3865} {"train_loss": -6.97582483291626, "global_step": 162361, "epoch": 3865} {"train_loss": -6.987827777862549, "global_step": 162362, "epoch": 3865} {"train_loss": -6.959325313568115, "global_step": 162363, "epoch": 3865} {"train_loss": -6.923220157623291, "global_step": 162364, "epoch": 3865} {"train_loss": -6.999625205993652, "global_step": 162365, "epoch": 3865} {"train_loss": -6.99349308013916, "global_step": 162366, "epoch": 3865} {"train_loss": -6.898262977600098, "global_step": 162367, "epoch": 3865} {"train_loss": -6.989002227783203, "global_step": 162368, "epoch": 3865} {"train_loss": -6.99739933013916, "global_step": 162369, "epoch": 3865} {"train_loss": -6.949962615966797, "global_step": 162370, "epoch": 3865} {"train_loss": -6.944006533849807, "global_step": 162371, "epoch": 3865, "val_loss": 68573.8125} {"train_loss": -7.018924713134766, "global_step": 162372, "epoch": 3866} {"train_loss": -6.934910297393799, "global_step": 162373, "epoch": 3866} {"train_loss": -6.9316725730896, "global_step": 162374, "epoch": 3866} {"train_loss": -6.716489315032959, "global_step": 162375, "epoch": 3866} {"train_loss": -7.0350871086120605, "global_step": 162376, "epoch": 3866} {"train_loss": -6.874110221862793, "global_step": 162377, "epoch": 3866} {"train_loss": -6.879678726196289, "global_step": 162378, "epoch": 3866} {"train_loss": -6.910823822021484, "global_step": 162379, "epoch": 3866} {"train_loss": -6.98698091506958, "global_step": 162380, "epoch": 3866} {"train_loss": -6.986509323120117, "global_step": 162381, "epoch": 3866} {"train_loss": -6.960134029388428, "global_step": 162382, "epoch": 3866} {"train_loss": -6.885775089263916, "global_step": 162383, "epoch": 3866} {"train_loss": -6.723657608032227, "global_step": 162384, "epoch": 3866} {"train_loss": -6.774491310119629, "global_step": 162385, "epoch": 3866} {"train_loss": -6.784698009490967, "global_step": 162386, "epoch": 3866} {"train_loss": -6.930505752563477, "global_step": 162387, "epoch": 3866} {"train_loss": -6.849736213684082, "global_step": 162388, "epoch": 3866} {"train_loss": -6.660361289978027, "global_step": 162389, "epoch": 3866} {"train_loss": -6.868966102600098, "global_step": 162390, "epoch": 3866} {"train_loss": -6.908756256103516, "global_step": 162391, "epoch": 3866} {"train_loss": -6.803691864013672, "global_step": 162392, "epoch": 3866} {"train_loss": -6.790260314941406, "global_step": 162393, "epoch": 3866} {"train_loss": -6.886754989624023, "global_step": 162394, "epoch": 3866} {"train_loss": -6.789490699768066, "global_step": 162395, "epoch": 3866} {"train_loss": -6.795812129974365, "global_step": 162396, "epoch": 3866} {"train_loss": -6.816105365753174, "global_step": 162397, "epoch": 3866} {"train_loss": -6.774574279785156, "global_step": 162398, "epoch": 3866} {"train_loss": -6.853427410125732, "global_step": 162399, "epoch": 3866} {"train_loss": -6.82415771484375, "global_step": 162400, "epoch": 3866} {"train_loss": -6.847278594970703, "global_step": 162401, "epoch": 3866} {"train_loss": -6.889754295349121, "global_step": 162402, "epoch": 3866} {"train_loss": -6.930089950561523, "global_step": 162403, "epoch": 3866} {"train_loss": -6.922604560852051, "global_step": 162404, "epoch": 3866} {"train_loss": -6.75313663482666, "global_step": 162405, "epoch": 3866} {"train_loss": -6.8785295486450195, "global_step": 162406, "epoch": 3866} {"train_loss": -6.890292167663574, "global_step": 162407, "epoch": 3866} {"train_loss": -6.794891357421875, "global_step": 162408, "epoch": 3866} {"train_loss": -6.8833208084106445, "global_step": 162409, "epoch": 3866} {"train_loss": -6.8811140060424805, "global_step": 162410, "epoch": 3866} {"train_loss": -6.957157611846924, "global_step": 162411, "epoch": 3866} {"train_loss": -6.73108434677124, "global_step": 162412, "epoch": 3866} {"train_loss": -6.863062427157447, "global_step": 162413, "epoch": 3866, "val_loss": 68504.4375} {"train_loss": -6.882506370544434, "global_step": 162414, "epoch": 3867} {"train_loss": -6.768249034881592, "global_step": 162415, "epoch": 3867} {"train_loss": -6.875080585479736, "global_step": 162416, "epoch": 3867} {"train_loss": -6.7166547775268555, "global_step": 162417, "epoch": 3867} {"train_loss": -6.950412273406982, "global_step": 162418, "epoch": 3867} {"train_loss": -6.780293941497803, "global_step": 162419, "epoch": 3867} {"train_loss": -6.883950233459473, "global_step": 162420, "epoch": 3867} {"train_loss": -6.839757919311523, "global_step": 162421, "epoch": 3867} {"train_loss": -6.941108703613281, "global_step": 162422, "epoch": 3867} {"train_loss": -6.837521076202393, "global_step": 162423, "epoch": 3867} {"train_loss": -6.861269474029541, "global_step": 162424, "epoch": 3867} {"train_loss": -6.977837562561035, "global_step": 162425, "epoch": 3867} {"train_loss": -6.824605941772461, "global_step": 162426, "epoch": 3867} {"train_loss": -6.910870552062988, "global_step": 162427, "epoch": 3867} {"train_loss": -6.8104119300842285, "global_step": 162428, "epoch": 3867} {"train_loss": -6.929272651672363, "global_step": 162429, "epoch": 3867} {"train_loss": -6.8801469802856445, "global_step": 162430, "epoch": 3867} {"train_loss": -6.852540493011475, "global_step": 162431, "epoch": 3867} {"train_loss": -6.931392669677734, "global_step": 162432, "epoch": 3867} {"train_loss": -6.928005218505859, "global_step": 162433, "epoch": 3867} {"train_loss": -6.883121967315674, "global_step": 162434, "epoch": 3867} {"train_loss": -6.845100402832031, "global_step": 162435, "epoch": 3867} {"train_loss": -6.913127899169922, "global_step": 162436, "epoch": 3867} {"train_loss": -6.923630237579346, "global_step": 162437, "epoch": 3867} {"train_loss": -6.923519134521484, "global_step": 162438, "epoch": 3867} {"train_loss": -6.943793296813965, "global_step": 162439, "epoch": 3867} {"train_loss": -6.872849464416504, "global_step": 162440, "epoch": 3867} {"train_loss": -6.892157554626465, "global_step": 162441, "epoch": 3867} {"train_loss": -7.003786087036133, "global_step": 162442, "epoch": 3867} {"train_loss": -7.007660388946533, "global_step": 162443, "epoch": 3867} {"train_loss": -6.896273136138916, "global_step": 162444, "epoch": 3867} {"train_loss": -6.868379592895508, "global_step": 162445, "epoch": 3867} {"train_loss": -6.807175636291504, "global_step": 162446, "epoch": 3867} {"train_loss": -6.986793518066406, "global_step": 162447, "epoch": 3867} {"train_loss": -6.8901872634887695, "global_step": 162448, "epoch": 3867} {"train_loss": -6.9193315505981445, "global_step": 162449, "epoch": 3867} {"train_loss": -7.008121490478516, "global_step": 162450, "epoch": 3867} {"train_loss": -6.874706268310547, "global_step": 162451, "epoch": 3867} {"train_loss": -6.913150787353516, "global_step": 162452, "epoch": 3867} {"train_loss": -6.865121364593506, "global_step": 162453, "epoch": 3867} {"train_loss": -6.872787952423096, "global_step": 162454, "epoch": 3867} {"train_loss": -6.887706450053623, "global_step": 162455, "epoch": 3867, "val_loss": 68714.3984375} {"train_loss": -6.783747673034668, "global_step": 162456, "epoch": 3868} {"train_loss": -7.060317516326904, "global_step": 162457, "epoch": 3868} {"train_loss": -6.780231952667236, "global_step": 162458, "epoch": 3868} {"train_loss": -6.901378631591797, "global_step": 162459, "epoch": 3868} {"train_loss": -6.974252223968506, "global_step": 162460, "epoch": 3868} {"train_loss": -6.746737480163574, "global_step": 162461, "epoch": 3868} {"train_loss": -6.846258163452148, "global_step": 162462, "epoch": 3868} {"train_loss": -6.786064147949219, "global_step": 162463, "epoch": 3868} {"train_loss": -6.9474029541015625, "global_step": 162464, "epoch": 3868} {"train_loss": -6.793073654174805, "global_step": 162465, "epoch": 3868} {"train_loss": -6.940884590148926, "global_step": 162466, "epoch": 3868} {"train_loss": -6.992097854614258, "global_step": 162467, "epoch": 3868} {"train_loss": -6.860912322998047, "global_step": 162468, "epoch": 3868} {"train_loss": -6.975872993469238, "global_step": 162469, "epoch": 3868} {"train_loss": -6.81842041015625, "global_step": 162470, "epoch": 3868} {"train_loss": -6.94547176361084, "global_step": 162471, "epoch": 3868} {"train_loss": -7.000985145568848, "global_step": 162472, "epoch": 3868} {"train_loss": -6.903027057647705, "global_step": 162473, "epoch": 3868} {"train_loss": -6.926446914672852, "global_step": 162474, "epoch": 3868} {"train_loss": -6.956306457519531, "global_step": 162475, "epoch": 3868} {"train_loss": -6.954668045043945, "global_step": 162476, "epoch": 3868} {"train_loss": -6.953317642211914, "global_step": 162477, "epoch": 3868} {"train_loss": -6.945003509521484, "global_step": 162478, "epoch": 3868} {"train_loss": -6.969937324523926, "global_step": 162479, "epoch": 3868} {"train_loss": -7.087370872497559, "global_step": 162480, "epoch": 3868} {"train_loss": -6.943557262420654, "global_step": 162481, "epoch": 3868} {"train_loss": -6.935500621795654, "global_step": 162482, "epoch": 3868} {"train_loss": -6.880862712860107, "global_step": 162483, "epoch": 3868} {"train_loss": -6.90120792388916, "global_step": 162484, "epoch": 3868} {"train_loss": -6.893075942993164, "global_step": 162485, "epoch": 3868} {"train_loss": -6.856326103210449, "global_step": 162486, "epoch": 3868} {"train_loss": -6.969294548034668, "global_step": 162487, "epoch": 3868} {"train_loss": -7.019672393798828, "global_step": 162488, "epoch": 3868} {"train_loss": -6.958382606506348, "global_step": 162489, "epoch": 3868} {"train_loss": -6.969588279724121, "global_step": 162490, "epoch": 3868} {"train_loss": -6.952550888061523, "global_step": 162491, "epoch": 3868} {"train_loss": -6.909770965576172, "global_step": 162492, "epoch": 3868} {"train_loss": -6.942553520202637, "global_step": 162493, "epoch": 3868} {"train_loss": -6.94671630859375, "global_step": 162494, "epoch": 3868} {"train_loss": -6.880171775817871, "global_step": 162495, "epoch": 3868} {"train_loss": -6.879825592041016, "global_step": 162496, "epoch": 3868} {"train_loss": -6.922013793672834, "global_step": 162497, "epoch": 3868, "val_loss": 68567.1328125} {"train_loss": -6.980315208435059, "global_step": 162498, "epoch": 3869} {"train_loss": -6.940144062042236, "global_step": 162499, "epoch": 3869} {"train_loss": -6.985743999481201, "global_step": 162500, "epoch": 3869} {"train_loss": -7.046446800231934, "global_step": 162501, "epoch": 3869} {"train_loss": -6.918388366699219, "global_step": 162502, "epoch": 3869} {"train_loss": -6.891329765319824, "global_step": 162503, "epoch": 3869} {"train_loss": -7.010653972625732, "global_step": 162504, "epoch": 3869} {"train_loss": -7.000473976135254, "global_step": 162505, "epoch": 3869} {"train_loss": -6.969965934753418, "global_step": 162506, "epoch": 3869} {"train_loss": -7.034544467926025, "global_step": 162507, "epoch": 3869} {"train_loss": -7.041392803192139, "global_step": 162508, "epoch": 3869} {"train_loss": -6.973146438598633, "global_step": 162509, "epoch": 3869} {"train_loss": -7.028256416320801, "global_step": 162510, "epoch": 3869} {"train_loss": -7.06160831451416, "global_step": 162511, "epoch": 3869} {"train_loss": -6.938094615936279, "global_step": 162512, "epoch": 3869} {"train_loss": -7.036283493041992, "global_step": 162513, "epoch": 3869} {"train_loss": -7.016353607177734, "global_step": 162514, "epoch": 3869} {"train_loss": -6.940604209899902, "global_step": 162515, "epoch": 3869} {"train_loss": -6.9847798347473145, "global_step": 162516, "epoch": 3869} {"train_loss": -6.880695819854736, "global_step": 162517, "epoch": 3869} {"train_loss": -6.874513626098633, "global_step": 162518, "epoch": 3869} {"train_loss": -6.973775863647461, "global_step": 162519, "epoch": 3869} {"train_loss": -6.8963751792907715, "global_step": 162520, "epoch": 3869} {"train_loss": -6.838953971862793, "global_step": 162521, "epoch": 3869} {"train_loss": -6.949994087219238, "global_step": 162522, "epoch": 3869} {"train_loss": -6.889161109924316, "global_step": 162523, "epoch": 3869} {"train_loss": -6.862491607666016, "global_step": 162524, "epoch": 3869} {"train_loss": -6.994769096374512, "global_step": 162525, "epoch": 3869} {"train_loss": -6.938985347747803, "global_step": 162526, "epoch": 3869} {"train_loss": -6.878392219543457, "global_step": 162527, "epoch": 3869} {"train_loss": -6.8122992515563965, "global_step": 162528, "epoch": 3869} {"train_loss": -6.898040294647217, "global_step": 162529, "epoch": 3869} {"train_loss": -6.913115978240967, "global_step": 162530, "epoch": 3869} {"train_loss": -6.816877841949463, "global_step": 162531, "epoch": 3869} {"train_loss": -6.931410789489746, "global_step": 162532, "epoch": 3869} {"train_loss": -6.733189105987549, "global_step": 162533, "epoch": 3869} {"train_loss": -6.810022354125977, "global_step": 162534, "epoch": 3869} {"train_loss": -6.969463348388672, "global_step": 162535, "epoch": 3869} {"train_loss": -6.8905816078186035, "global_step": 162536, "epoch": 3869} {"train_loss": -6.866304397583008, "global_step": 162537, "epoch": 3869} {"train_loss": -6.750369071960449, "global_step": 162538, "epoch": 3869} {"train_loss": -6.93147071202596, "global_step": 162539, "epoch": 3869, "val_loss": 68809.6875} {"train_loss": -6.741588592529297, "global_step": 162540, "epoch": 3870} {"train_loss": -6.928645133972168, "global_step": 162541, "epoch": 3870} {"train_loss": -6.840786457061768, "global_step": 162542, "epoch": 3870} {"train_loss": -6.795033931732178, "global_step": 162543, "epoch": 3870} {"train_loss": -6.757317543029785, "global_step": 162544, "epoch": 3870} {"train_loss": -6.775835037231445, "global_step": 162545, "epoch": 3870} {"train_loss": -6.891901016235352, "global_step": 162546, "epoch": 3870} {"train_loss": -6.858022689819336, "global_step": 162547, "epoch": 3870} {"train_loss": -6.9733781814575195, "global_step": 162548, "epoch": 3870} {"train_loss": -6.9628424644470215, "global_step": 162549, "epoch": 3870} {"train_loss": -7.004607677459717, "global_step": 162550, "epoch": 3870} {"train_loss": -6.941352844238281, "global_step": 162551, "epoch": 3870} {"train_loss": -6.842478275299072, "global_step": 162552, "epoch": 3870} {"train_loss": -6.9431586265563965, "global_step": 162553, "epoch": 3870} {"train_loss": -6.947800159454346, "global_step": 162554, "epoch": 3870} {"train_loss": -6.966911315917969, "global_step": 162555, "epoch": 3870} {"train_loss": -6.913538932800293, "global_step": 162556, "epoch": 3870} {"train_loss": -6.8607707023620605, "global_step": 162557, "epoch": 3870} {"train_loss": -6.846675872802734, "global_step": 162558, "epoch": 3870} {"train_loss": -6.934889793395996, "global_step": 162559, "epoch": 3870} {"train_loss": -6.913082122802734, "global_step": 162560, "epoch": 3870} {"train_loss": -6.911731719970703, "global_step": 162561, "epoch": 3870} {"train_loss": -6.85599422454834, "global_step": 162562, "epoch": 3870} {"train_loss": -6.844863414764404, "global_step": 162563, "epoch": 3870} {"train_loss": -6.921415328979492, "global_step": 162564, "epoch": 3870} {"train_loss": -6.868166923522949, "global_step": 162565, "epoch": 3870} {"train_loss": -6.94188117980957, "global_step": 162566, "epoch": 3870} {"train_loss": -6.989263534545898, "global_step": 162567, "epoch": 3870} {"train_loss": -6.903353691101074, "global_step": 162568, "epoch": 3870} {"train_loss": -6.863701820373535, "global_step": 162569, "epoch": 3870} {"train_loss": -6.8469743728637695, "global_step": 162570, "epoch": 3870} {"train_loss": -6.964404582977295, "global_step": 162571, "epoch": 3870} {"train_loss": -6.950065612792969, "global_step": 162572, "epoch": 3870} {"train_loss": -6.845767021179199, "global_step": 162573, "epoch": 3870} {"train_loss": -7.038001537322998, "global_step": 162574, "epoch": 3870} {"train_loss": -6.952319145202637, "global_step": 162575, "epoch": 3870} {"train_loss": -6.927944183349609, "global_step": 162576, "epoch": 3870} {"train_loss": -6.880087375640869, "global_step": 162577, "epoch": 3870} {"train_loss": -6.8788957595825195, "global_step": 162578, "epoch": 3870} {"train_loss": -6.945875644683838, "global_step": 162579, "epoch": 3870} {"train_loss": -6.82166862487793, "global_step": 162580, "epoch": 3870} {"train_loss": -6.900946503593808, "global_step": 162581, "epoch": 3870, "val_loss": 68506.46875} {"train_loss": -6.962912082672119, "global_step": 162582, "epoch": 3871} {"train_loss": -6.944505214691162, "global_step": 162583, "epoch": 3871} {"train_loss": -6.912230491638184, "global_step": 162584, "epoch": 3871} {"train_loss": -6.929275035858154, "global_step": 162585, "epoch": 3871} {"train_loss": -7.019132614135742, "global_step": 162586, "epoch": 3871} {"train_loss": -7.023697853088379, "global_step": 162587, "epoch": 3871} {"train_loss": -7.11652135848999, "global_step": 162588, "epoch": 3871} {"train_loss": -7.021064758300781, "global_step": 162589, "epoch": 3871} {"train_loss": -7.041326522827148, "global_step": 162590, "epoch": 3871} {"train_loss": -6.972234725952148, "global_step": 162591, "epoch": 3871} {"train_loss": -7.030850410461426, "global_step": 162592, "epoch": 3871} {"train_loss": -6.9309844970703125, "global_step": 162593, "epoch": 3871} {"train_loss": -6.937520980834961, "global_step": 162594, "epoch": 3871} {"train_loss": -6.911574363708496, "global_step": 162595, "epoch": 3871} {"train_loss": -6.946157455444336, "global_step": 162596, "epoch": 3871} {"train_loss": -7.103546142578125, "global_step": 162597, "epoch": 3871} {"train_loss": -6.962095737457275, "global_step": 162598, "epoch": 3871} {"train_loss": -6.993432998657227, "global_step": 162599, "epoch": 3871} {"train_loss": -6.944596767425537, "global_step": 162600, "epoch": 3871} {"train_loss": -6.987202167510986, "global_step": 162601, "epoch": 3871} {"train_loss": -6.943065166473389, "global_step": 162602, "epoch": 3871} {"train_loss": -6.9912519454956055, "global_step": 162603, "epoch": 3871} {"train_loss": -6.930718421936035, "global_step": 162604, "epoch": 3871} {"train_loss": -6.968626976013184, "global_step": 162605, "epoch": 3871} {"train_loss": -6.979102611541748, "global_step": 162606, "epoch": 3871} {"train_loss": -6.78287410736084, "global_step": 162607, "epoch": 3871} {"train_loss": -6.769984722137451, "global_step": 162608, "epoch": 3871} {"train_loss": -6.908186912536621, "global_step": 162609, "epoch": 3871} {"train_loss": -6.915170669555664, "global_step": 162610, "epoch": 3871} {"train_loss": -6.809568405151367, "global_step": 162611, "epoch": 3871} {"train_loss": -6.774249076843262, "global_step": 162612, "epoch": 3871} {"train_loss": -6.86199951171875, "global_step": 162613, "epoch": 3871} {"train_loss": -6.752647399902344, "global_step": 162614, "epoch": 3871} {"train_loss": -6.911386489868164, "global_step": 162615, "epoch": 3871} {"train_loss": -6.778168201446533, "global_step": 162616, "epoch": 3871} {"train_loss": -6.815085411071777, "global_step": 162617, "epoch": 3871} {"train_loss": -6.871381759643555, "global_step": 162618, "epoch": 3871} {"train_loss": -6.779833793640137, "global_step": 162619, "epoch": 3871} {"train_loss": -6.89406681060791, "global_step": 162620, "epoch": 3871} {"train_loss": -6.823599338531494, "global_step": 162621, "epoch": 3871} {"train_loss": -6.7682342529296875, "global_step": 162622, "epoch": 3871} {"train_loss": -6.916529553277152, "global_step": 162623, "epoch": 3871, "val_loss": 68716.0859375} {"train_loss": -6.8098835945129395, "global_step": 162624, "epoch": 3872} {"train_loss": -6.854484558105469, "global_step": 162625, "epoch": 3872} {"train_loss": -6.888152599334717, "global_step": 162626, "epoch": 3872} {"train_loss": -6.952906608581543, "global_step": 162627, "epoch": 3872} {"train_loss": -6.983936786651611, "global_step": 162628, "epoch": 3872} {"train_loss": -6.872065544128418, "global_step": 162629, "epoch": 3872} {"train_loss": -6.821825981140137, "global_step": 162630, "epoch": 3872} {"train_loss": -6.901166915893555, "global_step": 162631, "epoch": 3872} {"train_loss": -6.796358585357666, "global_step": 162632, "epoch": 3872} {"train_loss": -6.869544982910156, "global_step": 162633, "epoch": 3872} {"train_loss": -7.007128715515137, "global_step": 162634, "epoch": 3872} {"train_loss": -6.785429954528809, "global_step": 162635, "epoch": 3872} {"train_loss": -6.898723602294922, "global_step": 162636, "epoch": 3872} {"train_loss": -6.915916442871094, "global_step": 162637, "epoch": 3872} {"train_loss": -6.94150447845459, "global_step": 162638, "epoch": 3872} {"train_loss": -6.96341609954834, "global_step": 162639, "epoch": 3872} {"train_loss": -6.924105167388916, "global_step": 162640, "epoch": 3872} {"train_loss": -6.975688934326172, "global_step": 162641, "epoch": 3872} {"train_loss": -6.941493034362793, "global_step": 162642, "epoch": 3872} {"train_loss": -6.91560697555542, "global_step": 162643, "epoch": 3872} {"train_loss": -6.978752136230469, "global_step": 162644, "epoch": 3872} {"train_loss": -6.978538990020752, "global_step": 162645, "epoch": 3872} {"train_loss": -6.861663818359375, "global_step": 162646, "epoch": 3872} {"train_loss": -6.984158515930176, "global_step": 162647, "epoch": 3872} {"train_loss": -6.782604217529297, "global_step": 162648, "epoch": 3872} {"train_loss": -6.894141674041748, "global_step": 162649, "epoch": 3872} {"train_loss": -6.890146255493164, "global_step": 162650, "epoch": 3872} {"train_loss": -6.825847625732422, "global_step": 162651, "epoch": 3872} {"train_loss": -6.884734153747559, "global_step": 162652, "epoch": 3872} {"train_loss": -7.046454429626465, "global_step": 162653, "epoch": 3872} {"train_loss": -6.933698654174805, "global_step": 162654, "epoch": 3872} {"train_loss": -6.798684120178223, "global_step": 162655, "epoch": 3872} {"train_loss": -6.973079681396484, "global_step": 162656, "epoch": 3872} {"train_loss": -6.8127264976501465, "global_step": 162657, "epoch": 3872} {"train_loss": -6.927699565887451, "global_step": 162658, "epoch": 3872} {"train_loss": -6.973171234130859, "global_step": 162659, "epoch": 3872} {"train_loss": -6.947531223297119, "global_step": 162660, "epoch": 3872} {"train_loss": -6.892918586730957, "global_step": 162661, "epoch": 3872} {"train_loss": -6.910303115844727, "global_step": 162662, "epoch": 3872} {"train_loss": -7.031373023986816, "global_step": 162663, "epoch": 3872} {"train_loss": -6.899354934692383, "global_step": 162664, "epoch": 3872} {"train_loss": -6.90927943729219, "global_step": 162665, "epoch": 3872, "val_loss": 68602.3125} {"train_loss": -6.953110694885254, "global_step": 162666, "epoch": 3873} {"train_loss": -6.863552093505859, "global_step": 162667, "epoch": 3873} {"train_loss": -6.876592636108398, "global_step": 162668, "epoch": 3873} {"train_loss": -7.020191192626953, "global_step": 162669, "epoch": 3873} {"train_loss": -6.956284523010254, "global_step": 162670, "epoch": 3873} {"train_loss": -6.949810981750488, "global_step": 162671, "epoch": 3873} {"train_loss": -6.923459529876709, "global_step": 162672, "epoch": 3873} {"train_loss": -7.0051445960998535, "global_step": 162673, "epoch": 3873} {"train_loss": -6.943267345428467, "global_step": 162674, "epoch": 3873} {"train_loss": -6.839226245880127, "global_step": 162675, "epoch": 3873} {"train_loss": -6.965291500091553, "global_step": 162676, "epoch": 3873} {"train_loss": -6.913383960723877, "global_step": 162677, "epoch": 3873} {"train_loss": -6.851006507873535, "global_step": 162678, "epoch": 3873} {"train_loss": -6.904620170593262, "global_step": 162679, "epoch": 3873} {"train_loss": -7.004814624786377, "global_step": 162680, "epoch": 3873} {"train_loss": -6.914008140563965, "global_step": 162681, "epoch": 3873} {"train_loss": -6.875663757324219, "global_step": 162682, "epoch": 3873} {"train_loss": -6.916779041290283, "global_step": 162683, "epoch": 3873} {"train_loss": -6.92589807510376, "global_step": 162684, "epoch": 3873} {"train_loss": -6.912317276000977, "global_step": 162685, "epoch": 3873} {"train_loss": -6.879411220550537, "global_step": 162686, "epoch": 3873} {"train_loss": -6.852280139923096, "global_step": 162687, "epoch": 3873} {"train_loss": -6.955835819244385, "global_step": 162688, "epoch": 3873} {"train_loss": -6.875973701477051, "global_step": 162689, "epoch": 3873} {"train_loss": -6.887887001037598, "global_step": 162690, "epoch": 3873} {"train_loss": -7.003769874572754, "global_step": 162691, "epoch": 3873} {"train_loss": -6.993542671203613, "global_step": 162692, "epoch": 3873} {"train_loss": -6.884084701538086, "global_step": 162693, "epoch": 3873} {"train_loss": -6.987163543701172, "global_step": 162694, "epoch": 3873} {"train_loss": -6.839067459106445, "global_step": 162695, "epoch": 3873} {"train_loss": -7.064963340759277, "global_step": 162696, "epoch": 3873} {"train_loss": -6.943819046020508, "global_step": 162697, "epoch": 3873} {"train_loss": -7.003906726837158, "global_step": 162698, "epoch": 3873} {"train_loss": -7.06279182434082, "global_step": 162699, "epoch": 3873} {"train_loss": -7.0438995361328125, "global_step": 162700, "epoch": 3873} {"train_loss": -6.836416244506836, "global_step": 162701, "epoch": 3873} {"train_loss": -6.938899040222168, "global_step": 162702, "epoch": 3873} {"train_loss": -6.99458122253418, "global_step": 162703, "epoch": 3873} {"train_loss": -6.971889972686768, "global_step": 162704, "epoch": 3873} {"train_loss": -6.967187881469727, "global_step": 162705, "epoch": 3873} {"train_loss": -6.893682479858398, "global_step": 162706, "epoch": 3873} {"train_loss": -6.938003698984782, "global_step": 162707, "epoch": 3873, "val_loss": 68396.265625} {"train_loss": -6.875255584716797, "global_step": 162708, "epoch": 3874} {"train_loss": -6.94439172744751, "global_step": 162709, "epoch": 3874} {"train_loss": -6.964013576507568, "global_step": 162710, "epoch": 3874} {"train_loss": -7.015144348144531, "global_step": 162711, "epoch": 3874} {"train_loss": -7.018803596496582, "global_step": 162712, "epoch": 3874} {"train_loss": -7.037933826446533, "global_step": 162713, "epoch": 3874} {"train_loss": -6.981945991516113, "global_step": 162714, "epoch": 3874} {"train_loss": -6.966914653778076, "global_step": 162715, "epoch": 3874} {"train_loss": -6.99055290222168, "global_step": 162716, "epoch": 3874} {"train_loss": -6.855487823486328, "global_step": 162717, "epoch": 3874} {"train_loss": -6.865081787109375, "global_step": 162718, "epoch": 3874} {"train_loss": -7.02494478225708, "global_step": 162719, "epoch": 3874} {"train_loss": -6.8822784423828125, "global_step": 162720, "epoch": 3874} {"train_loss": -6.900567054748535, "global_step": 162721, "epoch": 3874} {"train_loss": -6.942905426025391, "global_step": 162722, "epoch": 3874} {"train_loss": -6.938082695007324, "global_step": 162723, "epoch": 3874} {"train_loss": -6.898387908935547, "global_step": 162724, "epoch": 3874} {"train_loss": -6.925950050354004, "global_step": 162725, "epoch": 3874} {"train_loss": -6.971558094024658, "global_step": 162726, "epoch": 3874} {"train_loss": -6.949341773986816, "global_step": 162727, "epoch": 3874} {"train_loss": -6.959310531616211, "global_step": 162728, "epoch": 3874} {"train_loss": -6.855990886688232, "global_step": 162729, "epoch": 3874} {"train_loss": -6.814469814300537, "global_step": 162730, "epoch": 3874} {"train_loss": -6.888658046722412, "global_step": 162731, "epoch": 3874} {"train_loss": -6.870338439941406, "global_step": 162732, "epoch": 3874} {"train_loss": -6.968688488006592, "global_step": 162733, "epoch": 3874} {"train_loss": -6.808202743530273, "global_step": 162734, "epoch": 3874} {"train_loss": -6.74103307723999, "global_step": 162735, "epoch": 3874} {"train_loss": -6.808005332946777, "global_step": 162736, "epoch": 3874} {"train_loss": -6.898660659790039, "global_step": 162737, "epoch": 3874} {"train_loss": -6.751381874084473, "global_step": 162738, "epoch": 3874} {"train_loss": -6.9759840965271, "global_step": 162739, "epoch": 3874} {"train_loss": -6.939427852630615, "global_step": 162740, "epoch": 3874} {"train_loss": -6.855444431304932, "global_step": 162741, "epoch": 3874} {"train_loss": -6.907425880432129, "global_step": 162742, "epoch": 3874} {"train_loss": -6.892881393432617, "global_step": 162743, "epoch": 3874} {"train_loss": -6.827415466308594, "global_step": 162744, "epoch": 3874} {"train_loss": -6.927074432373047, "global_step": 162745, "epoch": 3874} {"train_loss": -6.905903339385986, "global_step": 162746, "epoch": 3874} {"train_loss": -6.872783660888672, "global_step": 162747, "epoch": 3874} {"train_loss": -6.9248857498168945, "global_step": 162748, "epoch": 3874} {"train_loss": -6.9113005456470304, "global_step": 162749, "epoch": 3874, "val_loss": 68524.015625} {"train_loss": -6.939910411834717, "global_step": 162750, "epoch": 3875} {"train_loss": -6.849880695343018, "global_step": 162751, "epoch": 3875} {"train_loss": -7.016849517822266, "global_step": 162752, "epoch": 3875} {"train_loss": -6.743948459625244, "global_step": 162753, "epoch": 3875} {"train_loss": -6.789813041687012, "global_step": 162754, "epoch": 3875} {"train_loss": -6.801814079284668, "global_step": 162755, "epoch": 3875} {"train_loss": -6.669109344482422, "global_step": 162756, "epoch": 3875} {"train_loss": -6.813161849975586, "global_step": 162757, "epoch": 3875} {"train_loss": -6.8242902755737305, "global_step": 162758, "epoch": 3875} {"train_loss": -6.772010803222656, "global_step": 162759, "epoch": 3875} {"train_loss": -6.893854141235352, "global_step": 162760, "epoch": 3875} {"train_loss": -6.883702754974365, "global_step": 162761, "epoch": 3875} {"train_loss": -6.8409271240234375, "global_step": 162762, "epoch": 3875} {"train_loss": -6.870208263397217, "global_step": 162763, "epoch": 3875} {"train_loss": -6.8135199546813965, "global_step": 162764, "epoch": 3875} {"train_loss": -6.782427787780762, "global_step": 162765, "epoch": 3875} {"train_loss": -6.912044525146484, "global_step": 162766, "epoch": 3875} {"train_loss": -6.985959053039551, "global_step": 162767, "epoch": 3875} {"train_loss": -6.8609843254089355, "global_step": 162768, "epoch": 3875} {"train_loss": -6.9129533767700195, "global_step": 162769, "epoch": 3875} {"train_loss": -6.779365539550781, "global_step": 162770, "epoch": 3875} {"train_loss": -6.840980052947998, "global_step": 162771, "epoch": 3875} {"train_loss": -6.839969635009766, "global_step": 162772, "epoch": 3875} {"train_loss": -6.881673812866211, "global_step": 162773, "epoch": 3875} {"train_loss": -6.920812129974365, "global_step": 162774, "epoch": 3875} {"train_loss": -6.832034587860107, "global_step": 162775, "epoch": 3875} {"train_loss": -6.972967147827148, "global_step": 162776, "epoch": 3875} {"train_loss": -6.877500534057617, "global_step": 162777, "epoch": 3875} {"train_loss": -6.905946731567383, "global_step": 162778, "epoch": 3875} {"train_loss": -6.9119720458984375, "global_step": 162779, "epoch": 3875} {"train_loss": -6.839190483093262, "global_step": 162780, "epoch": 3875} {"train_loss": -6.741339683532715, "global_step": 162781, "epoch": 3875} {"train_loss": -6.928731918334961, "global_step": 162782, "epoch": 3875} {"train_loss": -6.861934185028076, "global_step": 162783, "epoch": 3875} {"train_loss": -6.888964653015137, "global_step": 162784, "epoch": 3875} {"train_loss": -6.779693603515625, "global_step": 162785, "epoch": 3875} {"train_loss": -6.877607345581055, "global_step": 162786, "epoch": 3875} {"train_loss": -6.789414405822754, "global_step": 162787, "epoch": 3875} {"train_loss": -6.765584468841553, "global_step": 162788, "epoch": 3875} {"train_loss": -6.954423904418945, "global_step": 162789, "epoch": 3875} {"train_loss": -6.81362247467041, "global_step": 162790, "epoch": 3875} {"train_loss": -6.85047155334836, "global_step": 162791, "epoch": 3875, "val_loss": 68473.09375} {"train_loss": -6.844852447509766, "global_step": 162792, "epoch": 3876} {"train_loss": -7.017413139343262, "global_step": 162793, "epoch": 3876} {"train_loss": -7.019309043884277, "global_step": 162794, "epoch": 3876} {"train_loss": -6.832146644592285, "global_step": 162795, "epoch": 3876} {"train_loss": -6.965864181518555, "global_step": 162796, "epoch": 3876} {"train_loss": -6.844726085662842, "global_step": 162797, "epoch": 3876} {"train_loss": -6.985525131225586, "global_step": 162798, "epoch": 3876} {"train_loss": -6.92181396484375, "global_step": 162799, "epoch": 3876} {"train_loss": -6.884949684143066, "global_step": 162800, "epoch": 3876} {"train_loss": -6.9484543800354, "global_step": 162801, "epoch": 3876} {"train_loss": -7.026358604431152, "global_step": 162802, "epoch": 3876} {"train_loss": -6.968962669372559, "global_step": 162803, "epoch": 3876} {"train_loss": -7.005793571472168, "global_step": 162804, "epoch": 3876} {"train_loss": -6.937503337860107, "global_step": 162805, "epoch": 3876} {"train_loss": -6.999073028564453, "global_step": 162806, "epoch": 3876} {"train_loss": -7.005206108093262, "global_step": 162807, "epoch": 3876} {"train_loss": -7.037728786468506, "global_step": 162808, "epoch": 3876} {"train_loss": -6.986676216125488, "global_step": 162809, "epoch": 3876} {"train_loss": -6.986769676208496, "global_step": 162810, "epoch": 3876} {"train_loss": -6.97825813293457, "global_step": 162811, "epoch": 3876} {"train_loss": -6.9651899337768555, "global_step": 162812, "epoch": 3876} {"train_loss": -7.014222145080566, "global_step": 162813, "epoch": 3876} {"train_loss": -6.988554000854492, "global_step": 162814, "epoch": 3876} {"train_loss": -6.92685604095459, "global_step": 162815, "epoch": 3876} {"train_loss": -7.086762428283691, "global_step": 162816, "epoch": 3876} {"train_loss": -6.914624214172363, "global_step": 162817, "epoch": 3876} {"train_loss": -6.929258346557617, "global_step": 162818, "epoch": 3876} {"train_loss": -6.896728515625, "global_step": 162819, "epoch": 3876} {"train_loss": -6.944457054138184, "global_step": 162820, "epoch": 3876} {"train_loss": -6.99716329574585, "global_step": 162821, "epoch": 3876} {"train_loss": -6.835837364196777, "global_step": 162822, "epoch": 3876} {"train_loss": -6.905056953430176, "global_step": 162823, "epoch": 3876} {"train_loss": -6.885496139526367, "global_step": 162824, "epoch": 3876} {"train_loss": -6.852360725402832, "global_step": 162825, "epoch": 3876} {"train_loss": -6.927865028381348, "global_step": 162826, "epoch": 3876} {"train_loss": -6.896709442138672, "global_step": 162827, "epoch": 3876} {"train_loss": -6.829824924468994, "global_step": 162828, "epoch": 3876} {"train_loss": -6.944021224975586, "global_step": 162829, "epoch": 3876} {"train_loss": -6.980019569396973, "global_step": 162830, "epoch": 3876} {"train_loss": -6.871046543121338, "global_step": 162831, "epoch": 3876} {"train_loss": -6.957742214202881, "global_step": 162832, "epoch": 3876} {"train_loss": -6.94495609828404, "global_step": 162833, "epoch": 3876, "val_loss": 68559.0078125} {"train_loss": -6.826520919799805, "global_step": 162834, "epoch": 3877} {"train_loss": -6.983484268188477, "global_step": 162835, "epoch": 3877} {"train_loss": -6.935434341430664, "global_step": 162836, "epoch": 3877} {"train_loss": -7.011009216308594, "global_step": 162837, "epoch": 3877} {"train_loss": -7.010334491729736, "global_step": 162838, "epoch": 3877} {"train_loss": -7.022403717041016, "global_step": 162839, "epoch": 3877} {"train_loss": -6.94313383102417, "global_step": 162840, "epoch": 3877} {"train_loss": -6.905786991119385, "global_step": 162841, "epoch": 3877} {"train_loss": -6.920814514160156, "global_step": 162842, "epoch": 3877} {"train_loss": -6.984286785125732, "global_step": 162843, "epoch": 3877} {"train_loss": -6.983532905578613, "global_step": 162844, "epoch": 3877} {"train_loss": -6.810699462890625, "global_step": 162845, "epoch": 3877} {"train_loss": -6.954253673553467, "global_step": 162846, "epoch": 3877} {"train_loss": -6.905173301696777, "global_step": 162847, "epoch": 3877} {"train_loss": -6.874626159667969, "global_step": 162848, "epoch": 3877} {"train_loss": -6.959729194641113, "global_step": 162849, "epoch": 3877} {"train_loss": -6.888703346252441, "global_step": 162850, "epoch": 3877} {"train_loss": -6.902577877044678, "global_step": 162851, "epoch": 3877} {"train_loss": -6.902515888214111, "global_step": 162852, "epoch": 3877} {"train_loss": -7.000459671020508, "global_step": 162853, "epoch": 3877} {"train_loss": -6.8914384841918945, "global_step": 162854, "epoch": 3877} {"train_loss": -6.9166131019592285, "global_step": 162855, "epoch": 3877} {"train_loss": -6.848200798034668, "global_step": 162856, "epoch": 3877} {"train_loss": -6.969379425048828, "global_step": 162857, "epoch": 3877} {"train_loss": -6.878809928894043, "global_step": 162858, "epoch": 3877} {"train_loss": -6.951211929321289, "global_step": 162859, "epoch": 3877} {"train_loss": -6.855591773986816, "global_step": 162860, "epoch": 3877} {"train_loss": -6.957033634185791, "global_step": 162861, "epoch": 3877} {"train_loss": -6.896312236785889, "global_step": 162862, "epoch": 3877} {"train_loss": -6.7868757247924805, "global_step": 162863, "epoch": 3877} {"train_loss": -7.056217670440674, "global_step": 162864, "epoch": 3877} {"train_loss": -6.8512139320373535, "global_step": 162865, "epoch": 3877} {"train_loss": -6.912783622741699, "global_step": 162866, "epoch": 3877} {"train_loss": -6.911191463470459, "global_step": 162867, "epoch": 3877} {"train_loss": -6.747874736785889, "global_step": 162868, "epoch": 3877} {"train_loss": -6.811730861663818, "global_step": 162869, "epoch": 3877} {"train_loss": -7.020098686218262, "global_step": 162870, "epoch": 3877} {"train_loss": -6.872708320617676, "global_step": 162871, "epoch": 3877} {"train_loss": -6.947940826416016, "global_step": 162872, "epoch": 3877} {"train_loss": -6.759390830993652, "global_step": 162873, "epoch": 3877} {"train_loss": -6.816568374633789, "global_step": 162874, "epoch": 3877} {"train_loss": -6.9126174336387995, "global_step": 162875, "epoch": 3877, "val_loss": 68495.96875} {"train_loss": -6.8337860107421875, "global_step": 162876, "epoch": 3878} {"train_loss": -6.907431602478027, "global_step": 162877, "epoch": 3878} {"train_loss": -6.996755599975586, "global_step": 162878, "epoch": 3878} {"train_loss": -6.75502872467041, "global_step": 162879, "epoch": 3878} {"train_loss": -6.8118391036987305, "global_step": 162880, "epoch": 3878} {"train_loss": -6.934714317321777, "global_step": 162881, "epoch": 3878} {"train_loss": -6.823077201843262, "global_step": 162882, "epoch": 3878} {"train_loss": -6.9783735275268555, "global_step": 162883, "epoch": 3878} {"train_loss": -6.805737018585205, "global_step": 162884, "epoch": 3878} {"train_loss": -6.8989362716674805, "global_step": 162885, "epoch": 3878} {"train_loss": -6.830666542053223, "global_step": 162886, "epoch": 3878} {"train_loss": -6.947317123413086, "global_step": 162887, "epoch": 3878} {"train_loss": -6.856790542602539, "global_step": 162888, "epoch": 3878} {"train_loss": -6.8713178634643555, "global_step": 162889, "epoch": 3878} {"train_loss": -6.9755940437316895, "global_step": 162890, "epoch": 3878} {"train_loss": -6.926178455352783, "global_step": 162891, "epoch": 3878} {"train_loss": -6.951188087463379, "global_step": 162892, "epoch": 3878} {"train_loss": -7.026337623596191, "global_step": 162893, "epoch": 3878} {"train_loss": -6.890715599060059, "global_step": 162894, "epoch": 3878} {"train_loss": -6.917823791503906, "global_step": 162895, "epoch": 3878} {"train_loss": -6.834282875061035, "global_step": 162896, "epoch": 3878} {"train_loss": -6.98961067199707, "global_step": 162897, "epoch": 3878} {"train_loss": -6.963153839111328, "global_step": 162898, "epoch": 3878} {"train_loss": -7.007060527801514, "global_step": 162899, "epoch": 3878} {"train_loss": -7.036343574523926, "global_step": 162900, "epoch": 3878} {"train_loss": -7.078806400299072, "global_step": 162901, "epoch": 3878} {"train_loss": -7.003110885620117, "global_step": 162902, "epoch": 3878} {"train_loss": -6.952320098876953, "global_step": 162903, "epoch": 3878} {"train_loss": -6.94425630569458, "global_step": 162904, "epoch": 3878} {"train_loss": -7.058282852172852, "global_step": 162905, "epoch": 3878} {"train_loss": -7.003558158874512, "global_step": 162906, "epoch": 3878} {"train_loss": -6.949149131774902, "global_step": 162907, "epoch": 3878} {"train_loss": -7.01792049407959, "global_step": 162908, "epoch": 3878} {"train_loss": -6.965760231018066, "global_step": 162909, "epoch": 3878} {"train_loss": -6.990937232971191, "global_step": 162910, "epoch": 3878} {"train_loss": -6.937221527099609, "global_step": 162911, "epoch": 3878} {"train_loss": -6.822579383850098, "global_step": 162912, "epoch": 3878} {"train_loss": -6.949374198913574, "global_step": 162913, "epoch": 3878} {"train_loss": -6.89748477935791, "global_step": 162914, "epoch": 3878} {"train_loss": -6.968808174133301, "global_step": 162915, "epoch": 3878} {"train_loss": -6.886885166168213, "global_step": 162916, "epoch": 3878} {"train_loss": -6.934794982274373, "global_step": 162917, "epoch": 3878, "val_loss": 68453.296875} {"train_loss": -7.0179290771484375, "global_step": 162918, "epoch": 3879} {"train_loss": -7.006749153137207, "global_step": 162919, "epoch": 3879} {"train_loss": -7.068723678588867, "global_step": 162920, "epoch": 3879} {"train_loss": -7.077796936035156, "global_step": 162921, "epoch": 3879} {"train_loss": -6.90580940246582, "global_step": 162922, "epoch": 3879} {"train_loss": -6.878803253173828, "global_step": 162923, "epoch": 3879} {"train_loss": -6.946598052978516, "global_step": 162924, "epoch": 3879} {"train_loss": -6.845617771148682, "global_step": 162925, "epoch": 3879} {"train_loss": -7.050848007202148, "global_step": 162926, "epoch": 3879} {"train_loss": -6.911214828491211, "global_step": 162927, "epoch": 3879} {"train_loss": -6.925196647644043, "global_step": 162928, "epoch": 3879} {"train_loss": -6.80253791809082, "global_step": 162929, "epoch": 3879} {"train_loss": -6.951692581176758, "global_step": 162930, "epoch": 3879} {"train_loss": -6.836881637573242, "global_step": 162931, "epoch": 3879} {"train_loss": -6.766596794128418, "global_step": 162932, "epoch": 3879} {"train_loss": -6.986249923706055, "global_step": 162933, "epoch": 3879} {"train_loss": -7.043148040771484, "global_step": 162934, "epoch": 3879} {"train_loss": -6.880202293395996, "global_step": 162935, "epoch": 3879} {"train_loss": -6.9129557609558105, "global_step": 162936, "epoch": 3879} {"train_loss": -6.981171131134033, "global_step": 162937, "epoch": 3879} {"train_loss": -6.8495965003967285, "global_step": 162938, "epoch": 3879} {"train_loss": -6.9963860511779785, "global_step": 162939, "epoch": 3879} {"train_loss": -6.924173831939697, "global_step": 162940, "epoch": 3879} {"train_loss": -6.912344932556152, "global_step": 162941, "epoch": 3879} {"train_loss": -6.907930374145508, "global_step": 162942, "epoch": 3879} {"train_loss": -6.824889183044434, "global_step": 162943, "epoch": 3879} {"train_loss": -6.882628440856934, "global_step": 162944, "epoch": 3879} {"train_loss": -6.837043762207031, "global_step": 162945, "epoch": 3879} {"train_loss": -6.855706214904785, "global_step": 162946, "epoch": 3879} {"train_loss": -6.896185874938965, "global_step": 162947, "epoch": 3879} {"train_loss": -6.814094543457031, "global_step": 162948, "epoch": 3879} {"train_loss": -6.852722644805908, "global_step": 162949, "epoch": 3879} {"train_loss": -6.962080001831055, "global_step": 162950, "epoch": 3879} {"train_loss": -6.931282043457031, "global_step": 162951, "epoch": 3879} {"train_loss": -6.933765411376953, "global_step": 162952, "epoch": 3879} {"train_loss": -6.866279602050781, "global_step": 162953, "epoch": 3879} {"train_loss": -6.940887451171875, "global_step": 162954, "epoch": 3879} {"train_loss": -6.864907264709473, "global_step": 162955, "epoch": 3879} {"train_loss": -6.778932094573975, "global_step": 162956, "epoch": 3879} {"train_loss": -6.845968723297119, "global_step": 162957, "epoch": 3879} {"train_loss": -6.899506092071533, "global_step": 162958, "epoch": 3879} {"train_loss": -6.910839534941173, "global_step": 162959, "epoch": 3879, "val_loss": 68605.1640625} {"train_loss": -6.944266319274902, "global_step": 162960, "epoch": 3880} {"train_loss": -6.878063678741455, "global_step": 162961, "epoch": 3880} {"train_loss": -6.97005033493042, "global_step": 162962, "epoch": 3880} {"train_loss": -6.981021881103516, "global_step": 162963, "epoch": 3880} {"train_loss": -6.793586730957031, "global_step": 162964, "epoch": 3880} {"train_loss": -6.910713195800781, "global_step": 162965, "epoch": 3880} {"train_loss": -6.983757019042969, "global_step": 162966, "epoch": 3880} {"train_loss": -6.913463115692139, "global_step": 162967, "epoch": 3880} {"train_loss": -6.98727560043335, "global_step": 162968, "epoch": 3880} {"train_loss": -6.9280266761779785, "global_step": 162969, "epoch": 3880} {"train_loss": -6.881723880767822, "global_step": 162970, "epoch": 3880} {"train_loss": -7.087435722351074, "global_step": 162971, "epoch": 3880} {"train_loss": -6.9376325607299805, "global_step": 162972, "epoch": 3880} {"train_loss": -6.8411126136779785, "global_step": 162973, "epoch": 3880} {"train_loss": -6.939171314239502, "global_step": 162974, "epoch": 3880} {"train_loss": -6.956901550292969, "global_step": 162975, "epoch": 3880} {"train_loss": -6.946485996246338, "global_step": 162976, "epoch": 3880} {"train_loss": -6.961037635803223, "global_step": 162977, "epoch": 3880} {"train_loss": -6.905210494995117, "global_step": 162978, "epoch": 3880} {"train_loss": -6.906356334686279, "global_step": 162979, "epoch": 3880} {"train_loss": -6.839658737182617, "global_step": 162980, "epoch": 3880} {"train_loss": -7.047866344451904, "global_step": 162981, "epoch": 3880} {"train_loss": -6.896018028259277, "global_step": 162982, "epoch": 3880} {"train_loss": -6.961093902587891, "global_step": 162983, "epoch": 3880} {"train_loss": -6.98560905456543, "global_step": 162984, "epoch": 3880} {"train_loss": -6.991763114929199, "global_step": 162985, "epoch": 3880} {"train_loss": -6.894322395324707, "global_step": 162986, "epoch": 3880} {"train_loss": -6.9866461753845215, "global_step": 162987, "epoch": 3880} {"train_loss": -6.922163963317871, "global_step": 162988, "epoch": 3880} {"train_loss": -6.8232421875, "global_step": 162989, "epoch": 3880} {"train_loss": -6.961791038513184, "global_step": 162990, "epoch": 3880} {"train_loss": -6.927735805511475, "global_step": 162991, "epoch": 3880} {"train_loss": -6.838252067565918, "global_step": 162992, "epoch": 3880} {"train_loss": -6.9746856689453125, "global_step": 162993, "epoch": 3880} {"train_loss": -6.932985305786133, "global_step": 162994, "epoch": 3880} {"train_loss": -6.922151565551758, "global_step": 162995, "epoch": 3880} {"train_loss": -6.939291000366211, "global_step": 162996, "epoch": 3880} {"train_loss": -7.051199913024902, "global_step": 162997, "epoch": 3880} {"train_loss": -6.981183052062988, "global_step": 162998, "epoch": 3880} {"train_loss": -7.047626972198486, "global_step": 162999, "epoch": 3880} {"train_loss": -7.03959321975708, "global_step": 163000, "epoch": 3880} {"train_loss": -6.942172095889137, "global_step": 163001, "epoch": 3880, "val_loss": 68474.0546875} {"train_loss": -7.016362190246582, "global_step": 163002, "epoch": 3881} {"train_loss": -6.849123001098633, "global_step": 163003, "epoch": 3881} {"train_loss": -6.823343753814697, "global_step": 163004, "epoch": 3881} {"train_loss": -6.9261627197265625, "global_step": 163005, "epoch": 3881} {"train_loss": -6.883962631225586, "global_step": 163006, "epoch": 3881} {"train_loss": -7.008730888366699, "global_step": 163007, "epoch": 3881} {"train_loss": -7.058529376983643, "global_step": 163008, "epoch": 3881} {"train_loss": -6.927397727966309, "global_step": 163009, "epoch": 3881} {"train_loss": -6.861998558044434, "global_step": 163010, "epoch": 3881} {"train_loss": -6.737880229949951, "global_step": 163011, "epoch": 3881} {"train_loss": -6.955548286437988, "global_step": 163012, "epoch": 3881} {"train_loss": -6.863227844238281, "global_step": 163013, "epoch": 3881} {"train_loss": -6.843733787536621, "global_step": 163014, "epoch": 3881} {"train_loss": -6.93552303314209, "global_step": 163015, "epoch": 3881} {"train_loss": -6.919361591339111, "global_step": 163016, "epoch": 3881} {"train_loss": -6.963748931884766, "global_step": 163017, "epoch": 3881} {"train_loss": -6.8882951736450195, "global_step": 163018, "epoch": 3881} {"train_loss": -6.935189247131348, "global_step": 163019, "epoch": 3881} {"train_loss": -6.8764777183532715, "global_step": 163020, "epoch": 3881} {"train_loss": -6.795033931732178, "global_step": 163021, "epoch": 3881} {"train_loss": -6.884908676147461, "global_step": 163022, "epoch": 3881} {"train_loss": -6.903872013092041, "global_step": 163023, "epoch": 3881} {"train_loss": -6.888677597045898, "global_step": 163024, "epoch": 3881} {"train_loss": -6.808774948120117, "global_step": 163025, "epoch": 3881} {"train_loss": -6.913431644439697, "global_step": 163026, "epoch": 3881} {"train_loss": -6.886205673217773, "global_step": 163027, "epoch": 3881} {"train_loss": -6.8860883712768555, "global_step": 163028, "epoch": 3881} {"train_loss": -6.86500358581543, "global_step": 163029, "epoch": 3881} {"train_loss": -6.939358711242676, "global_step": 163030, "epoch": 3881} {"train_loss": -6.929623603820801, "global_step": 163031, "epoch": 3881} {"train_loss": -6.925844669342041, "global_step": 163032, "epoch": 3881} {"train_loss": -6.871653079986572, "global_step": 163033, "epoch": 3881} {"train_loss": -6.881594181060791, "global_step": 163034, "epoch": 3881} {"train_loss": -6.879389762878418, "global_step": 163035, "epoch": 3881} {"train_loss": -6.8163909912109375, "global_step": 163036, "epoch": 3881} {"train_loss": -6.968870639801025, "global_step": 163037, "epoch": 3881} {"train_loss": -6.893655776977539, "global_step": 163038, "epoch": 3881} {"train_loss": -6.907018661499023, "global_step": 163039, "epoch": 3881} {"train_loss": -7.076124668121338, "global_step": 163040, "epoch": 3881} {"train_loss": -6.931372165679932, "global_step": 163041, "epoch": 3881} {"train_loss": -6.944769859313965, "global_step": 163042, "epoch": 3881} {"train_loss": -6.905514705748785, "global_step": 163043, "epoch": 3881, "val_loss": 68667.015625} {"train_loss": -6.877868175506592, "global_step": 163044, "epoch": 3882} {"train_loss": -6.999459743499756, "global_step": 163045, "epoch": 3882} {"train_loss": -6.853930473327637, "global_step": 163046, "epoch": 3882} {"train_loss": -6.886308193206787, "global_step": 163047, "epoch": 3882} {"train_loss": -6.835928916931152, "global_step": 163048, "epoch": 3882} {"train_loss": -6.979334831237793, "global_step": 163049, "epoch": 3882} {"train_loss": -6.889981746673584, "global_step": 163050, "epoch": 3882} {"train_loss": -6.911070823669434, "global_step": 163051, "epoch": 3882} {"train_loss": -6.826668739318848, "global_step": 163052, "epoch": 3882} {"train_loss": -6.940793514251709, "global_step": 163053, "epoch": 3882} {"train_loss": -6.721769332885742, "global_step": 163054, "epoch": 3882} {"train_loss": -6.874014854431152, "global_step": 163055, "epoch": 3882} {"train_loss": -6.8210344314575195, "global_step": 163056, "epoch": 3882} {"train_loss": -6.959364891052246, "global_step": 163057, "epoch": 3882} {"train_loss": -6.951837539672852, "global_step": 163058, "epoch": 3882} {"train_loss": -6.86065673828125, "global_step": 163059, "epoch": 3882} {"train_loss": -6.992301940917969, "global_step": 163060, "epoch": 3882} {"train_loss": -6.93886661529541, "global_step": 163061, "epoch": 3882} {"train_loss": -6.980330467224121, "global_step": 163062, "epoch": 3882} {"train_loss": -6.970015048980713, "global_step": 163063, "epoch": 3882} {"train_loss": -6.913186550140381, "global_step": 163064, "epoch": 3882} {"train_loss": -7.064444541931152, "global_step": 163065, "epoch": 3882} {"train_loss": -6.860241413116455, "global_step": 163066, "epoch": 3882} {"train_loss": -6.9998955726623535, "global_step": 163067, "epoch": 3882} {"train_loss": -6.99545955657959, "global_step": 163068, "epoch": 3882} {"train_loss": -6.969934463500977, "global_step": 163069, "epoch": 3882} {"train_loss": -6.954094409942627, "global_step": 163070, "epoch": 3882} {"train_loss": -7.10952091217041, "global_step": 163071, "epoch": 3882} {"train_loss": -7.061324119567871, "global_step": 163072, "epoch": 3882} {"train_loss": -7.01335334777832, "global_step": 163073, "epoch": 3882} {"train_loss": -7.0016188621521, "global_step": 163074, "epoch": 3882} {"train_loss": -7.1017889976501465, "global_step": 163075, "epoch": 3882} {"train_loss": -6.947709560394287, "global_step": 163076, "epoch": 3882} {"train_loss": -7.003521919250488, "global_step": 163077, "epoch": 3882} {"train_loss": -6.99339485168457, "global_step": 163078, "epoch": 3882} {"train_loss": -7.011504173278809, "global_step": 163079, "epoch": 3882} {"train_loss": -7.006628036499023, "global_step": 163080, "epoch": 3882} {"train_loss": -6.9662370681762695, "global_step": 163081, "epoch": 3882} {"train_loss": -6.981751441955566, "global_step": 163082, "epoch": 3882} {"train_loss": -7.006963729858398, "global_step": 163083, "epoch": 3882} {"train_loss": -6.938185691833496, "global_step": 163084, "epoch": 3882} {"train_loss": -6.951520374843052, "global_step": 163085, "epoch": 3882, "val_loss": 68517.0390625} {"train_loss": -7.067000389099121, "global_step": 163086, "epoch": 3883} {"train_loss": -7.083979606628418, "global_step": 163087, "epoch": 3883} {"train_loss": -6.893460273742676, "global_step": 163088, "epoch": 3883} {"train_loss": -6.905518531799316, "global_step": 163089, "epoch": 3883} {"train_loss": -7.134555816650391, "global_step": 163090, "epoch": 3883} {"train_loss": -7.091118812561035, "global_step": 163091, "epoch": 3883} {"train_loss": -6.970422267913818, "global_step": 163092, "epoch": 3883} {"train_loss": -7.036283016204834, "global_step": 163093, "epoch": 3883} {"train_loss": -6.988154411315918, "global_step": 163094, "epoch": 3883} {"train_loss": -7.067508220672607, "global_step": 163095, "epoch": 3883} {"train_loss": -6.9849348068237305, "global_step": 163096, "epoch": 3883} {"train_loss": -6.884998798370361, "global_step": 163097, "epoch": 3883} {"train_loss": -6.910735607147217, "global_step": 163098, "epoch": 3883} {"train_loss": -6.95257568359375, "global_step": 163099, "epoch": 3883} {"train_loss": -7.0045061111450195, "global_step": 163100, "epoch": 3883} {"train_loss": -6.861851692199707, "global_step": 163101, "epoch": 3883} {"train_loss": -6.844128608703613, "global_step": 163102, "epoch": 3883} {"train_loss": -6.995250225067139, "global_step": 163103, "epoch": 3883} {"train_loss": -6.973683834075928, "global_step": 163104, "epoch": 3883} {"train_loss": -6.789654731750488, "global_step": 163105, "epoch": 3883} {"train_loss": -6.978553295135498, "global_step": 163106, "epoch": 3883} {"train_loss": -6.870233535766602, "global_step": 163107, "epoch": 3883} {"train_loss": -6.894493103027344, "global_step": 163108, "epoch": 3883} {"train_loss": -6.9296956062316895, "global_step": 163109, "epoch": 3883} {"train_loss": -6.909446716308594, "global_step": 163110, "epoch": 3883} {"train_loss": -6.937913417816162, "global_step": 163111, "epoch": 3883} {"train_loss": -6.969246864318848, "global_step": 163112, "epoch": 3883} {"train_loss": -6.946924209594727, "global_step": 163113, "epoch": 3883} {"train_loss": -7.078014373779297, "global_step": 163114, "epoch": 3883} {"train_loss": -6.973625183105469, "global_step": 163115, "epoch": 3883} {"train_loss": -7.004472732543945, "global_step": 163116, "epoch": 3883} {"train_loss": -7.015837669372559, "global_step": 163117, "epoch": 3883} {"train_loss": -7.009624481201172, "global_step": 163118, "epoch": 3883} {"train_loss": -6.956000328063965, "global_step": 163119, "epoch": 3883} {"train_loss": -6.958893299102783, "global_step": 163120, "epoch": 3883} {"train_loss": -7.02285099029541, "global_step": 163121, "epoch": 3883} {"train_loss": -6.932879447937012, "global_step": 163122, "epoch": 3883} {"train_loss": -6.895620346069336, "global_step": 163123, "epoch": 3883} {"train_loss": -6.921241760253906, "global_step": 163124, "epoch": 3883} {"train_loss": -6.959010124206543, "global_step": 163125, "epoch": 3883} {"train_loss": -6.984377861022949, "global_step": 163126, "epoch": 3883} {"train_loss": -6.965617940539405, "global_step": 163127, "epoch": 3883, "val_loss": 68634.5546875} {"train_loss": -6.984185695648193, "global_step": 163128, "epoch": 3884} {"train_loss": -6.814123153686523, "global_step": 163129, "epoch": 3884} {"train_loss": -6.965662002563477, "global_step": 163130, "epoch": 3884} {"train_loss": -6.930178642272949, "global_step": 163131, "epoch": 3884} {"train_loss": -6.846339225769043, "global_step": 163132, "epoch": 3884} {"train_loss": -6.993823051452637, "global_step": 163133, "epoch": 3884} {"train_loss": -6.986695289611816, "global_step": 163134, "epoch": 3884} {"train_loss": -7.035000324249268, "global_step": 163135, "epoch": 3884} {"train_loss": -6.988869667053223, "global_step": 163136, "epoch": 3884} {"train_loss": -6.843730926513672, "global_step": 163137, "epoch": 3884} {"train_loss": -6.952300548553467, "global_step": 163138, "epoch": 3884} {"train_loss": -6.927087783813477, "global_step": 163139, "epoch": 3884} {"train_loss": -6.888485908508301, "global_step": 163140, "epoch": 3884} {"train_loss": -6.927669525146484, "global_step": 163141, "epoch": 3884} {"train_loss": -6.984564781188965, "global_step": 163142, "epoch": 3884} {"train_loss": -7.003701210021973, "global_step": 163143, "epoch": 3884} {"train_loss": -6.902429103851318, "global_step": 163144, "epoch": 3884} {"train_loss": -6.854561805725098, "global_step": 163145, "epoch": 3884} {"train_loss": -6.878782749176025, "global_step": 163146, "epoch": 3884} {"train_loss": -6.85722017288208, "global_step": 163147, "epoch": 3884} {"train_loss": -7.043647289276123, "global_step": 163148, "epoch": 3884} {"train_loss": -7.020280838012695, "global_step": 163149, "epoch": 3884} {"train_loss": -6.912417411804199, "global_step": 163150, "epoch": 3884} {"train_loss": -6.87983512878418, "global_step": 163151, "epoch": 3884} {"train_loss": -6.980017185211182, "global_step": 163152, "epoch": 3884} {"train_loss": -7.006271839141846, "global_step": 163153, "epoch": 3884} {"train_loss": -6.923582077026367, "global_step": 163154, "epoch": 3884} {"train_loss": -6.948056221008301, "global_step": 163155, "epoch": 3884} {"train_loss": -6.992615699768066, "global_step": 163156, "epoch": 3884} {"train_loss": -6.947301864624023, "global_step": 163157, "epoch": 3884} {"train_loss": -6.981792449951172, "global_step": 163158, "epoch": 3884} {"train_loss": -6.991183757781982, "global_step": 163159, "epoch": 3884} {"train_loss": -6.7872796058654785, "global_step": 163160, "epoch": 3884} {"train_loss": -6.872520446777344, "global_step": 163161, "epoch": 3884} {"train_loss": -6.853085517883301, "global_step": 163162, "epoch": 3884} {"train_loss": -6.941763401031494, "global_step": 163163, "epoch": 3884} {"train_loss": -6.837291717529297, "global_step": 163164, "epoch": 3884} {"train_loss": -6.869027137756348, "global_step": 163165, "epoch": 3884} {"train_loss": -6.917707443237305, "global_step": 163166, "epoch": 3884} {"train_loss": -6.957042694091797, "global_step": 163167, "epoch": 3884} {"train_loss": -7.027993679046631, "global_step": 163168, "epoch": 3884} {"train_loss": -6.932585080464681, "global_step": 163169, "epoch": 3884, "val_loss": 68494.5078125} {"train_loss": -7.017749309539795, "global_step": 163170, "epoch": 3885} {"train_loss": -6.9183430671691895, "global_step": 163171, "epoch": 3885} {"train_loss": -6.900907516479492, "global_step": 163172, "epoch": 3885} {"train_loss": -7.062061309814453, "global_step": 163173, "epoch": 3885} {"train_loss": -6.928544521331787, "global_step": 163174, "epoch": 3885} {"train_loss": -6.913331031799316, "global_step": 163175, "epoch": 3885} {"train_loss": -6.98650598526001, "global_step": 163176, "epoch": 3885} {"train_loss": -6.888339042663574, "global_step": 163177, "epoch": 3885} {"train_loss": -7.0277252197265625, "global_step": 163178, "epoch": 3885} {"train_loss": -7.015318393707275, "global_step": 163179, "epoch": 3885} {"train_loss": -6.892512321472168, "global_step": 163180, "epoch": 3885} {"train_loss": -6.992631435394287, "global_step": 163181, "epoch": 3885} {"train_loss": -6.993961334228516, "global_step": 163182, "epoch": 3885} {"train_loss": -6.991659164428711, "global_step": 163183, "epoch": 3885} {"train_loss": -6.94480037689209, "global_step": 163184, "epoch": 3885} {"train_loss": -6.859794616699219, "global_step": 163185, "epoch": 3885} {"train_loss": -6.82981014251709, "global_step": 163186, "epoch": 3885} {"train_loss": -6.94465446472168, "global_step": 163187, "epoch": 3885} {"train_loss": -6.921659469604492, "global_step": 163188, "epoch": 3885} {"train_loss": -6.9620490074157715, "global_step": 163189, "epoch": 3885} {"train_loss": -6.998048782348633, "global_step": 163190, "epoch": 3885} {"train_loss": -6.7771806716918945, "global_step": 163191, "epoch": 3885} {"train_loss": -6.859432220458984, "global_step": 163192, "epoch": 3885} {"train_loss": -6.938844203948975, "global_step": 163193, "epoch": 3885} {"train_loss": -6.980121612548828, "global_step": 163194, "epoch": 3885} {"train_loss": -6.839738368988037, "global_step": 163195, "epoch": 3885} {"train_loss": -6.9829816818237305, "global_step": 163196, "epoch": 3885} {"train_loss": -6.8242998123168945, "global_step": 163197, "epoch": 3885} {"train_loss": -6.8427042961120605, "global_step": 163198, "epoch": 3885} {"train_loss": -6.867055892944336, "global_step": 163199, "epoch": 3885} {"train_loss": -6.862811088562012, "global_step": 163200, "epoch": 3885} {"train_loss": -6.765833854675293, "global_step": 163201, "epoch": 3885} {"train_loss": -6.926693916320801, "global_step": 163202, "epoch": 3885} {"train_loss": -6.90153694152832, "global_step": 163203, "epoch": 3885} {"train_loss": -6.813026428222656, "global_step": 163204, "epoch": 3885} {"train_loss": -6.839938163757324, "global_step": 163205, "epoch": 3885} {"train_loss": -6.929924964904785, "global_step": 163206, "epoch": 3885} {"train_loss": -6.967357635498047, "global_step": 163207, "epoch": 3885} {"train_loss": -6.8921732902526855, "global_step": 163208, "epoch": 3885} {"train_loss": -6.81044864654541, "global_step": 163209, "epoch": 3885} {"train_loss": -6.84549617767334, "global_step": 163210, "epoch": 3885} {"train_loss": -6.911781333741688, "global_step": 163211, "epoch": 3885, "val_loss": 68666.84375} {"train_loss": -6.919405937194824, "global_step": 163212, "epoch": 3886} {"train_loss": -6.9232282638549805, "global_step": 163213, "epoch": 3886} {"train_loss": -6.933542251586914, "global_step": 163214, "epoch": 3886} {"train_loss": -6.909988880157471, "global_step": 163215, "epoch": 3886} {"train_loss": -6.8601179122924805, "global_step": 163216, "epoch": 3886} {"train_loss": -6.889842987060547, "global_step": 163217, "epoch": 3886} {"train_loss": -6.942569255828857, "global_step": 163218, "epoch": 3886} {"train_loss": -6.852436065673828, "global_step": 163219, "epoch": 3886} {"train_loss": -6.9237470626831055, "global_step": 163220, "epoch": 3886} {"train_loss": -6.887642860412598, "global_step": 163221, "epoch": 3886} {"train_loss": -6.932739734649658, "global_step": 163222, "epoch": 3886} {"train_loss": -6.957798004150391, "global_step": 163223, "epoch": 3886} {"train_loss": -6.947599411010742, "global_step": 163224, "epoch": 3886} {"train_loss": -6.998954772949219, "global_step": 163225, "epoch": 3886} {"train_loss": -6.890612602233887, "global_step": 163226, "epoch": 3886} {"train_loss": -6.868580341339111, "global_step": 163227, "epoch": 3886} {"train_loss": -6.95905065536499, "global_step": 163228, "epoch": 3886} {"train_loss": -6.968897819519043, "global_step": 163229, "epoch": 3886} {"train_loss": -6.922741413116455, "global_step": 163230, "epoch": 3886} {"train_loss": -6.970623970031738, "global_step": 163231, "epoch": 3886} {"train_loss": -6.9642486572265625, "global_step": 163232, "epoch": 3886} {"train_loss": -6.874534606933594, "global_step": 163233, "epoch": 3886} {"train_loss": -6.882633209228516, "global_step": 163234, "epoch": 3886} {"train_loss": -6.9855241775512695, "global_step": 163235, "epoch": 3886} {"train_loss": -6.988144397735596, "global_step": 163236, "epoch": 3886} {"train_loss": -6.906224250793457, "global_step": 163237, "epoch": 3886} {"train_loss": -6.9669880867004395, "global_step": 163238, "epoch": 3886} {"train_loss": -6.950407981872559, "global_step": 163239, "epoch": 3886} {"train_loss": -7.0473175048828125, "global_step": 163240, "epoch": 3886} {"train_loss": -6.867822647094727, "global_step": 163241, "epoch": 3886} {"train_loss": -7.068646430969238, "global_step": 163242, "epoch": 3886} {"train_loss": -6.972526550292969, "global_step": 163243, "epoch": 3886} {"train_loss": -6.793493747711182, "global_step": 163244, "epoch": 3886} {"train_loss": -6.958089828491211, "global_step": 163245, "epoch": 3886} {"train_loss": -6.942970275878906, "global_step": 163246, "epoch": 3886} {"train_loss": -6.8768815994262695, "global_step": 163247, "epoch": 3886} {"train_loss": -6.976475238800049, "global_step": 163248, "epoch": 3886} {"train_loss": -6.973858833312988, "global_step": 163249, "epoch": 3886} {"train_loss": -6.917938232421875, "global_step": 163250, "epoch": 3886} {"train_loss": -6.813783168792725, "global_step": 163251, "epoch": 3886} {"train_loss": -7.026198387145996, "global_step": 163252, "epoch": 3886} {"train_loss": -6.928099121366229, "global_step": 163253, "epoch": 3886, "val_loss": 68766.328125} {"train_loss": -6.9635210037231445, "global_step": 163254, "epoch": 3887} {"train_loss": -6.9114885330200195, "global_step": 163255, "epoch": 3887} {"train_loss": -6.969067096710205, "global_step": 163256, "epoch": 3887} {"train_loss": -6.8602752685546875, "global_step": 163257, "epoch": 3887} {"train_loss": -6.918121814727783, "global_step": 163258, "epoch": 3887} {"train_loss": -6.8793487548828125, "global_step": 163259, "epoch": 3887} {"train_loss": -7.023036956787109, "global_step": 163260, "epoch": 3887} {"train_loss": -6.9075422286987305, "global_step": 163261, "epoch": 3887} {"train_loss": -6.9264044761657715, "global_step": 163262, "epoch": 3887} {"train_loss": -6.816390037536621, "global_step": 163263, "epoch": 3887} {"train_loss": -6.910760879516602, "global_step": 163264, "epoch": 3887} {"train_loss": -6.945454120635986, "global_step": 163265, "epoch": 3887} {"train_loss": -6.908919334411621, "global_step": 163266, "epoch": 3887} {"train_loss": -6.953713417053223, "global_step": 163267, "epoch": 3887} {"train_loss": -6.938726902008057, "global_step": 163268, "epoch": 3887} {"train_loss": -7.02609395980835, "global_step": 163269, "epoch": 3887} {"train_loss": -6.901073455810547, "global_step": 163270, "epoch": 3887} {"train_loss": -6.97487735748291, "global_step": 163271, "epoch": 3887} {"train_loss": -6.944298267364502, "global_step": 163272, "epoch": 3887} {"train_loss": -6.90336799621582, "global_step": 163273, "epoch": 3887} {"train_loss": -6.913566589355469, "global_step": 163274, "epoch": 3887} {"train_loss": -6.854684352874756, "global_step": 163275, "epoch": 3887} {"train_loss": -6.916304588317871, "global_step": 163276, "epoch": 3887} {"train_loss": -6.9056525230407715, "global_step": 163277, "epoch": 3887} {"train_loss": -6.902066230773926, "global_step": 163278, "epoch": 3887} {"train_loss": -6.885422706604004, "global_step": 163279, "epoch": 3887} {"train_loss": -6.922181129455566, "global_step": 163280, "epoch": 3887} {"train_loss": -6.909523963928223, "global_step": 163281, "epoch": 3887} {"train_loss": -6.90275764465332, "global_step": 163282, "epoch": 3887} {"train_loss": -6.9522199630737305, "global_step": 163283, "epoch": 3887} {"train_loss": -6.982552528381348, "global_step": 163284, "epoch": 3887} {"train_loss": -7.001449108123779, "global_step": 163285, "epoch": 3887} {"train_loss": -6.883286476135254, "global_step": 163286, "epoch": 3887} {"train_loss": -6.857132911682129, "global_step": 163287, "epoch": 3887} {"train_loss": -6.91179084777832, "global_step": 163288, "epoch": 3887} {"train_loss": -7.013697624206543, "global_step": 163289, "epoch": 3887} {"train_loss": -6.745959758758545, "global_step": 163290, "epoch": 3887} {"train_loss": -7.022749900817871, "global_step": 163291, "epoch": 3887} {"train_loss": -6.941584587097168, "global_step": 163292, "epoch": 3887} {"train_loss": -6.920074939727783, "global_step": 163293, "epoch": 3887} {"train_loss": -7.039995193481445, "global_step": 163294, "epoch": 3887} {"train_loss": -6.924881004151844, "global_step": 163295, "epoch": 3887, "val_loss": 68660.5625} {"train_loss": -6.934150218963623, "global_step": 163296, "epoch": 3888} {"train_loss": -6.849580764770508, "global_step": 163297, "epoch": 3888} {"train_loss": -6.942782402038574, "global_step": 163298, "epoch": 3888} {"train_loss": -7.030196189880371, "global_step": 163299, "epoch": 3888} {"train_loss": -6.935662269592285, "global_step": 163300, "epoch": 3888} {"train_loss": -6.958582878112793, "global_step": 163301, "epoch": 3888} {"train_loss": -6.899481296539307, "global_step": 163302, "epoch": 3888} {"train_loss": -6.765670299530029, "global_step": 163303, "epoch": 3888} {"train_loss": -6.9879350662231445, "global_step": 163304, "epoch": 3888} {"train_loss": -6.900309085845947, "global_step": 163305, "epoch": 3888} {"train_loss": -6.970851898193359, "global_step": 163306, "epoch": 3888} {"train_loss": -6.892454624176025, "global_step": 163307, "epoch": 3888} {"train_loss": -6.770483016967773, "global_step": 163308, "epoch": 3888} {"train_loss": -6.972983360290527, "global_step": 163309, "epoch": 3888} {"train_loss": -6.878165245056152, "global_step": 163310, "epoch": 3888} {"train_loss": -6.897454261779785, "global_step": 163311, "epoch": 3888} {"train_loss": -6.995352745056152, "global_step": 163312, "epoch": 3888} {"train_loss": -6.918622970581055, "global_step": 163313, "epoch": 3888} {"train_loss": -6.909992218017578, "global_step": 163314, "epoch": 3888} {"train_loss": -7.002439498901367, "global_step": 163315, "epoch": 3888} {"train_loss": -6.979498863220215, "global_step": 163316, "epoch": 3888} {"train_loss": -6.945155143737793, "global_step": 163317, "epoch": 3888} {"train_loss": -6.868314743041992, "global_step": 163318, "epoch": 3888} {"train_loss": -6.853416442871094, "global_step": 163319, "epoch": 3888} {"train_loss": -7.009894847869873, "global_step": 163320, "epoch": 3888} {"train_loss": -6.966631889343262, "global_step": 163321, "epoch": 3888} {"train_loss": -6.902674674987793, "global_step": 163322, "epoch": 3888} {"train_loss": -6.930102825164795, "global_step": 163323, "epoch": 3888} {"train_loss": -7.035281658172607, "global_step": 163324, "epoch": 3888} {"train_loss": -6.979470729827881, "global_step": 163325, "epoch": 3888} {"train_loss": -6.994832992553711, "global_step": 163326, "epoch": 3888} {"train_loss": -6.9193572998046875, "global_step": 163327, "epoch": 3888} {"train_loss": -6.839025497436523, "global_step": 163328, "epoch": 3888} {"train_loss": -7.030854225158691, "global_step": 163329, "epoch": 3888} {"train_loss": -6.949662208557129, "global_step": 163330, "epoch": 3888} {"train_loss": -6.860636234283447, "global_step": 163331, "epoch": 3888} {"train_loss": -6.849531173706055, "global_step": 163332, "epoch": 3888} {"train_loss": -6.903639793395996, "global_step": 163333, "epoch": 3888} {"train_loss": -6.9420366287231445, "global_step": 163334, "epoch": 3888} {"train_loss": -6.90431022644043, "global_step": 163335, "epoch": 3888} {"train_loss": -7.0619683265686035, "global_step": 163336, "epoch": 3888} {"train_loss": -6.931186710085187, "global_step": 163337, "epoch": 3888, "val_loss": 68585.1796875} {"train_loss": -7.052948951721191, "global_step": 163338, "epoch": 3889} {"train_loss": -7.001917839050293, "global_step": 163339, "epoch": 3889} {"train_loss": -6.9772491455078125, "global_step": 163340, "epoch": 3889} {"train_loss": -6.947909355163574, "global_step": 163341, "epoch": 3889} {"train_loss": -7.035604476928711, "global_step": 163342, "epoch": 3889} {"train_loss": -6.96561336517334, "global_step": 163343, "epoch": 3889} {"train_loss": -6.979884147644043, "global_step": 163344, "epoch": 3889} {"train_loss": -6.938339710235596, "global_step": 163345, "epoch": 3889} {"train_loss": -7.017678260803223, "global_step": 163346, "epoch": 3889} {"train_loss": -6.977635860443115, "global_step": 163347, "epoch": 3889} {"train_loss": -6.953025817871094, "global_step": 163348, "epoch": 3889} {"train_loss": -6.909209728240967, "global_step": 163349, "epoch": 3889} {"train_loss": -7.012924671173096, "global_step": 163350, "epoch": 3889} {"train_loss": -6.931366920471191, "global_step": 163351, "epoch": 3889} {"train_loss": -6.940469741821289, "global_step": 163352, "epoch": 3889} {"train_loss": -6.929913520812988, "global_step": 163353, "epoch": 3889} {"train_loss": -6.902245998382568, "global_step": 163354, "epoch": 3889} {"train_loss": -6.789720058441162, "global_step": 163355, "epoch": 3889} {"train_loss": -7.007769584655762, "global_step": 163356, "epoch": 3889} {"train_loss": -7.013801574707031, "global_step": 163357, "epoch": 3889} {"train_loss": -7.030287265777588, "global_step": 163358, "epoch": 3889} {"train_loss": -6.8543219566345215, "global_step": 163359, "epoch": 3889} {"train_loss": -6.900446891784668, "global_step": 163360, "epoch": 3889} {"train_loss": -6.960634231567383, "global_step": 163361, "epoch": 3889} {"train_loss": -6.864863872528076, "global_step": 163362, "epoch": 3889} {"train_loss": -6.902083396911621, "global_step": 163363, "epoch": 3889} {"train_loss": -6.926674842834473, "global_step": 163364, "epoch": 3889} {"train_loss": -7.033134460449219, "global_step": 163365, "epoch": 3889} {"train_loss": -6.761904716491699, "global_step": 163366, "epoch": 3889} {"train_loss": -6.827724456787109, "global_step": 163367, "epoch": 3889} {"train_loss": -6.930637359619141, "global_step": 163368, "epoch": 3889} {"train_loss": -6.910243988037109, "global_step": 163369, "epoch": 3889} {"train_loss": -6.893165588378906, "global_step": 163370, "epoch": 3889} {"train_loss": -6.893387794494629, "global_step": 163371, "epoch": 3889} {"train_loss": -6.843801498413086, "global_step": 163372, "epoch": 3889} {"train_loss": -6.8385772705078125, "global_step": 163373, "epoch": 3889} {"train_loss": -6.9451751708984375, "global_step": 163374, "epoch": 3889} {"train_loss": -6.7262349128723145, "global_step": 163375, "epoch": 3889} {"train_loss": -6.920554161071777, "global_step": 163376, "epoch": 3889} {"train_loss": -6.919806480407715, "global_step": 163377, "epoch": 3889} {"train_loss": -6.765876770019531, "global_step": 163378, "epoch": 3889} {"train_loss": -6.926813840866089, "global_step": 163379, "epoch": 3889, "val_loss": 68669.859375} {"train_loss": -6.761508941650391, "global_step": 163380, "epoch": 3890} {"train_loss": -6.999979496002197, "global_step": 163381, "epoch": 3890} {"train_loss": -6.881911754608154, "global_step": 163382, "epoch": 3890} {"train_loss": -6.946249961853027, "global_step": 163383, "epoch": 3890} {"train_loss": -7.014530181884766, "global_step": 163384, "epoch": 3890} {"train_loss": -6.789244651794434, "global_step": 163385, "epoch": 3890} {"train_loss": -6.801942348480225, "global_step": 163386, "epoch": 3890} {"train_loss": -6.765655994415283, "global_step": 163387, "epoch": 3890} {"train_loss": -6.701712608337402, "global_step": 163388, "epoch": 3890} {"train_loss": -6.865266799926758, "global_step": 163389, "epoch": 3890} {"train_loss": -6.734957695007324, "global_step": 163390, "epoch": 3890} {"train_loss": -6.791969299316406, "global_step": 163391, "epoch": 3890} {"train_loss": -6.7375688552856445, "global_step": 163392, "epoch": 3890} {"train_loss": -6.819045543670654, "global_step": 163393, "epoch": 3890} {"train_loss": -6.942010879516602, "global_step": 163394, "epoch": 3890} {"train_loss": -6.85634708404541, "global_step": 163395, "epoch": 3890} {"train_loss": -6.882289886474609, "global_step": 163396, "epoch": 3890} {"train_loss": -6.871676921844482, "global_step": 163397, "epoch": 3890} {"train_loss": -6.887204170227051, "global_step": 163398, "epoch": 3890} {"train_loss": -6.780369758605957, "global_step": 163399, "epoch": 3890} {"train_loss": -6.870448589324951, "global_step": 163400, "epoch": 3890} {"train_loss": -6.8988423347473145, "global_step": 163401, "epoch": 3890} {"train_loss": -6.891293048858643, "global_step": 163402, "epoch": 3890} {"train_loss": -6.847724914550781, "global_step": 163403, "epoch": 3890} {"train_loss": -6.9051079750061035, "global_step": 163404, "epoch": 3890} {"train_loss": -7.009999752044678, "global_step": 163405, "epoch": 3890} {"train_loss": -6.891578674316406, "global_step": 163406, "epoch": 3890} {"train_loss": -6.969313144683838, "global_step": 163407, "epoch": 3890} {"train_loss": -6.922331809997559, "global_step": 163408, "epoch": 3890} {"train_loss": -6.820679664611816, "global_step": 163409, "epoch": 3890} {"train_loss": -6.9546332359313965, "global_step": 163410, "epoch": 3890} {"train_loss": -6.821595668792725, "global_step": 163411, "epoch": 3890} {"train_loss": -6.938101291656494, "global_step": 163412, "epoch": 3890} {"train_loss": -6.8235931396484375, "global_step": 163413, "epoch": 3890} {"train_loss": -6.928726673126221, "global_step": 163414, "epoch": 3890} {"train_loss": -6.937643527984619, "global_step": 163415, "epoch": 3890} {"train_loss": -6.938909530639648, "global_step": 163416, "epoch": 3890} {"train_loss": -6.89171028137207, "global_step": 163417, "epoch": 3890} {"train_loss": -6.870367050170898, "global_step": 163418, "epoch": 3890} {"train_loss": -6.835949897766113, "global_step": 163419, "epoch": 3890} {"train_loss": -6.960304260253906, "global_step": 163420, "epoch": 3890} {"train_loss": -6.873799812226069, "global_step": 163421, "epoch": 3890, "val_loss": 68553.265625} {"train_loss": -6.983571529388428, "global_step": 163422, "epoch": 3891} {"train_loss": -6.941298484802246, "global_step": 163423, "epoch": 3891} {"train_loss": -6.939698219299316, "global_step": 163424, "epoch": 3891} {"train_loss": -6.945188522338867, "global_step": 163425, "epoch": 3891} {"train_loss": -6.916804313659668, "global_step": 163426, "epoch": 3891} {"train_loss": -6.953804969787598, "global_step": 163427, "epoch": 3891} {"train_loss": -6.992480278015137, "global_step": 163428, "epoch": 3891} {"train_loss": -6.944173812866211, "global_step": 163429, "epoch": 3891} {"train_loss": -6.948103904724121, "global_step": 163430, "epoch": 3891} {"train_loss": -6.923624038696289, "global_step": 163431, "epoch": 3891} {"train_loss": -7.0510993003845215, "global_step": 163432, "epoch": 3891} {"train_loss": -6.916755199432373, "global_step": 163433, "epoch": 3891} {"train_loss": -6.97398567199707, "global_step": 163434, "epoch": 3891} {"train_loss": -7.016829490661621, "global_step": 163435, "epoch": 3891} {"train_loss": -6.841967582702637, "global_step": 163436, "epoch": 3891} {"train_loss": -6.83979606628418, "global_step": 163437, "epoch": 3891} {"train_loss": -6.9766411781311035, "global_step": 163438, "epoch": 3891} {"train_loss": -7.021838665008545, "global_step": 163439, "epoch": 3891} {"train_loss": -6.931970596313477, "global_step": 163440, "epoch": 3891} {"train_loss": -6.853109359741211, "global_step": 163441, "epoch": 3891} {"train_loss": -6.989081382751465, "global_step": 163442, "epoch": 3891} {"train_loss": -6.961871147155762, "global_step": 163443, "epoch": 3891} {"train_loss": -6.8828840255737305, "global_step": 163444, "epoch": 3891} {"train_loss": -6.972314357757568, "global_step": 163445, "epoch": 3891} {"train_loss": -6.920299053192139, "global_step": 163446, "epoch": 3891} {"train_loss": -6.976222038269043, "global_step": 163447, "epoch": 3891} {"train_loss": -7.043819427490234, "global_step": 163448, "epoch": 3891} {"train_loss": -6.8804240226745605, "global_step": 163449, "epoch": 3891} {"train_loss": -7.032199859619141, "global_step": 163450, "epoch": 3891} {"train_loss": -6.991833686828613, "global_step": 163451, "epoch": 3891} {"train_loss": -6.889937400817871, "global_step": 163452, "epoch": 3891} {"train_loss": -6.985451698303223, "global_step": 163453, "epoch": 3891} {"train_loss": -7.0625691413879395, "global_step": 163454, "epoch": 3891} {"train_loss": -6.863494873046875, "global_step": 163455, "epoch": 3891} {"train_loss": -6.942584991455078, "global_step": 163456, "epoch": 3891} {"train_loss": -6.90306282043457, "global_step": 163457, "epoch": 3891} {"train_loss": -7.012436866760254, "global_step": 163458, "epoch": 3891} {"train_loss": -7.0306878089904785, "global_step": 163459, "epoch": 3891} {"train_loss": -6.98497200012207, "global_step": 163460, "epoch": 3891} {"train_loss": -6.9868316650390625, "global_step": 163461, "epoch": 3891} {"train_loss": -6.972607612609863, "global_step": 163462, "epoch": 3891} {"train_loss": -6.9563091823032925, "global_step": 163463, "epoch": 3891, "val_loss": 68533.953125} {"train_loss": -6.94676399230957, "global_step": 163464, "epoch": 3892} {"train_loss": -6.8213348388671875, "global_step": 163465, "epoch": 3892} {"train_loss": -6.878283500671387, "global_step": 163466, "epoch": 3892} {"train_loss": -6.982044219970703, "global_step": 163467, "epoch": 3892} {"train_loss": -6.844404697418213, "global_step": 163468, "epoch": 3892} {"train_loss": -7.054783344268799, "global_step": 163469, "epoch": 3892} {"train_loss": -6.955338478088379, "global_step": 163470, "epoch": 3892} {"train_loss": -6.893465518951416, "global_step": 163471, "epoch": 3892} {"train_loss": -6.96799373626709, "global_step": 163472, "epoch": 3892} {"train_loss": -6.928954124450684, "global_step": 163473, "epoch": 3892} {"train_loss": -7.057073593139648, "global_step": 163474, "epoch": 3892} {"train_loss": -6.9283037185668945, "global_step": 163475, "epoch": 3892} {"train_loss": -6.8863725662231445, "global_step": 163476, "epoch": 3892} {"train_loss": -7.035679817199707, "global_step": 163477, "epoch": 3892} {"train_loss": -6.900067329406738, "global_step": 163478, "epoch": 3892} {"train_loss": -7.001300811767578, "global_step": 163479, "epoch": 3892} {"train_loss": -7.022050857543945, "global_step": 163480, "epoch": 3892} {"train_loss": -6.934906482696533, "global_step": 163481, "epoch": 3892} {"train_loss": -6.837203502655029, "global_step": 163482, "epoch": 3892} {"train_loss": -6.939727783203125, "global_step": 163483, "epoch": 3892} {"train_loss": -6.87898588180542, "global_step": 163484, "epoch": 3892} {"train_loss": -6.7824530601501465, "global_step": 163485, "epoch": 3892} {"train_loss": -6.904283046722412, "global_step": 163486, "epoch": 3892} {"train_loss": -6.925436973571777, "global_step": 163487, "epoch": 3892} {"train_loss": -6.9955644607543945, "global_step": 163488, "epoch": 3892} {"train_loss": -7.014916896820068, "global_step": 163489, "epoch": 3892} {"train_loss": -6.876199722290039, "global_step": 163490, "epoch": 3892} {"train_loss": -7.053403854370117, "global_step": 163491, "epoch": 3892} {"train_loss": -6.936695575714111, "global_step": 163492, "epoch": 3892} {"train_loss": -6.789020538330078, "global_step": 163493, "epoch": 3892} {"train_loss": -6.940049171447754, "global_step": 163494, "epoch": 3892} {"train_loss": -6.821308135986328, "global_step": 163495, "epoch": 3892} {"train_loss": -6.931467056274414, "global_step": 163496, "epoch": 3892} {"train_loss": -6.949172019958496, "global_step": 163497, "epoch": 3892} {"train_loss": -6.860078811645508, "global_step": 163498, "epoch": 3892} {"train_loss": -6.8237457275390625, "global_step": 163499, "epoch": 3892} {"train_loss": -6.893990516662598, "global_step": 163500, "epoch": 3892} {"train_loss": -6.929671764373779, "global_step": 163501, "epoch": 3892} {"train_loss": -6.737939834594727, "global_step": 163502, "epoch": 3892} {"train_loss": -6.919386386871338, "global_step": 163503, "epoch": 3892} {"train_loss": -6.80300760269165, "global_step": 163504, "epoch": 3892} {"train_loss": -6.909881716682797, "global_step": 163505, "epoch": 3892, "val_loss": 68633.4453125} {"train_loss": -6.831707000732422, "global_step": 163506, "epoch": 3893} {"train_loss": -6.7190446853637695, "global_step": 163507, "epoch": 3893} {"train_loss": -6.940176010131836, "global_step": 163508, "epoch": 3893} {"train_loss": -6.75068473815918, "global_step": 163509, "epoch": 3893} {"train_loss": -6.858298301696777, "global_step": 163510, "epoch": 3893} {"train_loss": -6.9006829261779785, "global_step": 163511, "epoch": 3893} {"train_loss": -6.909280776977539, "global_step": 163512, "epoch": 3893} {"train_loss": -6.952036380767822, "global_step": 163513, "epoch": 3893} {"train_loss": -6.891332149505615, "global_step": 163514, "epoch": 3893} {"train_loss": -6.871714115142822, "global_step": 163515, "epoch": 3893} {"train_loss": -6.865912914276123, "global_step": 163516, "epoch": 3893} {"train_loss": -6.865987777709961, "global_step": 163517, "epoch": 3893} {"train_loss": -6.845582008361816, "global_step": 163518, "epoch": 3893} {"train_loss": -6.851907253265381, "global_step": 163519, "epoch": 3893} {"train_loss": -6.909971237182617, "global_step": 163520, "epoch": 3893} {"train_loss": -6.817573547363281, "global_step": 163521, "epoch": 3893} {"train_loss": -6.976386070251465, "global_step": 163522, "epoch": 3893} {"train_loss": -6.783059120178223, "global_step": 163523, "epoch": 3893} {"train_loss": -6.898613452911377, "global_step": 163524, "epoch": 3893} {"train_loss": -6.952004432678223, "global_step": 163525, "epoch": 3893} {"train_loss": -6.882191181182861, "global_step": 163526, "epoch": 3893} {"train_loss": -6.84712028503418, "global_step": 163527, "epoch": 3893} {"train_loss": -6.868780136108398, "global_step": 163528, "epoch": 3893} {"train_loss": -6.862521171569824, "global_step": 163529, "epoch": 3893} {"train_loss": -6.956162452697754, "global_step": 163530, "epoch": 3893} {"train_loss": -6.961409091949463, "global_step": 163531, "epoch": 3893} {"train_loss": -6.8371734619140625, "global_step": 163532, "epoch": 3893} {"train_loss": -6.811160564422607, "global_step": 163533, "epoch": 3893} {"train_loss": -6.924383163452148, "global_step": 163534, "epoch": 3893} {"train_loss": -6.7962541580200195, "global_step": 163535, "epoch": 3893} {"train_loss": -6.803156852722168, "global_step": 163536, "epoch": 3893} {"train_loss": -6.948042392730713, "global_step": 163537, "epoch": 3893} {"train_loss": -6.912675857543945, "global_step": 163538, "epoch": 3893} {"train_loss": -6.873440265655518, "global_step": 163539, "epoch": 3893} {"train_loss": -7.033919334411621, "global_step": 163540, "epoch": 3893} {"train_loss": -6.935075759887695, "global_step": 163541, "epoch": 3893} {"train_loss": -6.999218940734863, "global_step": 163542, "epoch": 3893} {"train_loss": -6.920921325683594, "global_step": 163543, "epoch": 3893} {"train_loss": -7.0200629234313965, "global_step": 163544, "epoch": 3893} {"train_loss": -6.862757682800293, "global_step": 163545, "epoch": 3893} {"train_loss": -6.956400394439697, "global_step": 163546, "epoch": 3893} {"train_loss": -6.886454116730463, "global_step": 163547, "epoch": 3893, "val_loss": 68366.328125} {"train_loss": -6.972558975219727, "global_step": 163548, "epoch": 3894} {"train_loss": -6.902435302734375, "global_step": 163549, "epoch": 3894} {"train_loss": -6.919604778289795, "global_step": 163550, "epoch": 3894} {"train_loss": -6.954724311828613, "global_step": 163551, "epoch": 3894} {"train_loss": -6.931610107421875, "global_step": 163552, "epoch": 3894} {"train_loss": -6.953898906707764, "global_step": 163553, "epoch": 3894} {"train_loss": -6.982867240905762, "global_step": 163554, "epoch": 3894} {"train_loss": -6.891214847564697, "global_step": 163555, "epoch": 3894} {"train_loss": -6.919662952423096, "global_step": 163556, "epoch": 3894} {"train_loss": -6.9849700927734375, "global_step": 163557, "epoch": 3894} {"train_loss": -6.847159385681152, "global_step": 163558, "epoch": 3894} {"train_loss": -6.890384674072266, "global_step": 163559, "epoch": 3894} {"train_loss": -7.029973030090332, "global_step": 163560, "epoch": 3894} {"train_loss": -6.923638343811035, "global_step": 163561, "epoch": 3894} {"train_loss": -6.899823188781738, "global_step": 163562, "epoch": 3894} {"train_loss": -6.86771821975708, "global_step": 163563, "epoch": 3894} {"train_loss": -6.975305557250977, "global_step": 163564, "epoch": 3894} {"train_loss": -6.934218406677246, "global_step": 163565, "epoch": 3894} {"train_loss": -6.857621669769287, "global_step": 163566, "epoch": 3894} {"train_loss": -6.990852355957031, "global_step": 163567, "epoch": 3894} {"train_loss": -6.887516498565674, "global_step": 163568, "epoch": 3894} {"train_loss": -7.002726078033447, "global_step": 163569, "epoch": 3894} {"train_loss": -6.854413986206055, "global_step": 163570, "epoch": 3894} {"train_loss": -6.959405899047852, "global_step": 163571, "epoch": 3894} {"train_loss": -7.017819404602051, "global_step": 163572, "epoch": 3894} {"train_loss": -6.993648529052734, "global_step": 163573, "epoch": 3894} {"train_loss": -6.926419258117676, "global_step": 163574, "epoch": 3894} {"train_loss": -7.007678985595703, "global_step": 163575, "epoch": 3894} {"train_loss": -6.940914154052734, "global_step": 163576, "epoch": 3894} {"train_loss": -6.89232063293457, "global_step": 163577, "epoch": 3894} {"train_loss": -7.022272109985352, "global_step": 163578, "epoch": 3894} {"train_loss": -6.917734146118164, "global_step": 163579, "epoch": 3894} {"train_loss": -7.025781154632568, "global_step": 163580, "epoch": 3894} {"train_loss": -7.035528182983398, "global_step": 163581, "epoch": 3894} {"train_loss": -6.947458267211914, "global_step": 163582, "epoch": 3894} {"train_loss": -7.010227680206299, "global_step": 163583, "epoch": 3894} {"train_loss": -6.943601131439209, "global_step": 163584, "epoch": 3894} {"train_loss": -6.879406929016113, "global_step": 163585, "epoch": 3894} {"train_loss": -6.784031867980957, "global_step": 163586, "epoch": 3894} {"train_loss": -6.9883246421813965, "global_step": 163587, "epoch": 3894} {"train_loss": -6.894570827484131, "global_step": 163588, "epoch": 3894} {"train_loss": -6.940965936297462, "global_step": 163589, "epoch": 3894, "val_loss": 68584.5859375} {"train_loss": -6.861813068389893, "global_step": 163590, "epoch": 3895} {"train_loss": -6.858996391296387, "global_step": 163591, "epoch": 3895} {"train_loss": -6.9682698249816895, "global_step": 163592, "epoch": 3895} {"train_loss": -6.930391311645508, "global_step": 163593, "epoch": 3895} {"train_loss": -6.786502838134766, "global_step": 163594, "epoch": 3895} {"train_loss": -6.948451995849609, "global_step": 163595, "epoch": 3895} {"train_loss": -6.896285057067871, "global_step": 163596, "epoch": 3895} {"train_loss": -7.0077409744262695, "global_step": 163597, "epoch": 3895} {"train_loss": -6.9711408615112305, "global_step": 163598, "epoch": 3895} {"train_loss": -6.874957084655762, "global_step": 163599, "epoch": 3895} {"train_loss": -6.985400199890137, "global_step": 163600, "epoch": 3895} {"train_loss": -6.929317474365234, "global_step": 163601, "epoch": 3895} {"train_loss": -6.998843193054199, "global_step": 163602, "epoch": 3895} {"train_loss": -6.95366096496582, "global_step": 163603, "epoch": 3895} {"train_loss": -6.893492221832275, "global_step": 163604, "epoch": 3895} {"train_loss": -6.991301536560059, "global_step": 163605, "epoch": 3895} {"train_loss": -7.067191123962402, "global_step": 163606, "epoch": 3895} {"train_loss": -7.006806373596191, "global_step": 163607, "epoch": 3895} {"train_loss": -7.0177717208862305, "global_step": 163608, "epoch": 3895} {"train_loss": -6.913533687591553, "global_step": 163609, "epoch": 3895} {"train_loss": -6.962125778198242, "global_step": 163610, "epoch": 3895} {"train_loss": -7.015321731567383, "global_step": 163611, "epoch": 3895} {"train_loss": -7.009515762329102, "global_step": 163612, "epoch": 3895} {"train_loss": -7.020336151123047, "global_step": 163613, "epoch": 3895} {"train_loss": -6.937989234924316, "global_step": 163614, "epoch": 3895} {"train_loss": -6.974799156188965, "global_step": 163615, "epoch": 3895} {"train_loss": -6.932681560516357, "global_step": 163616, "epoch": 3895} {"train_loss": -6.9562225341796875, "global_step": 163617, "epoch": 3895} {"train_loss": -6.9304351806640625, "global_step": 163618, "epoch": 3895} {"train_loss": -7.0469160079956055, "global_step": 163619, "epoch": 3895} {"train_loss": -6.988030433654785, "global_step": 163620, "epoch": 3895} {"train_loss": -6.872214317321777, "global_step": 163621, "epoch": 3895} {"train_loss": -7.015989303588867, "global_step": 163622, "epoch": 3895} {"train_loss": -6.788418769836426, "global_step": 163623, "epoch": 3895} {"train_loss": -6.992053031921387, "global_step": 163624, "epoch": 3895} {"train_loss": -6.933629035949707, "global_step": 163625, "epoch": 3895} {"train_loss": -6.922452926635742, "global_step": 163626, "epoch": 3895} {"train_loss": -7.008937835693359, "global_step": 163627, "epoch": 3895} {"train_loss": -6.905285835266113, "global_step": 163628, "epoch": 3895} {"train_loss": -6.823232650756836, "global_step": 163629, "epoch": 3895} {"train_loss": -7.033337593078613, "global_step": 163630, "epoch": 3895} {"train_loss": -6.946847177687145, "global_step": 163631, "epoch": 3895, "val_loss": 68372.78125} {"train_loss": -6.939159393310547, "global_step": 163632, "epoch": 3896} {"train_loss": -6.881621360778809, "global_step": 163633, "epoch": 3896} {"train_loss": -6.984490394592285, "global_step": 163634, "epoch": 3896} {"train_loss": -6.993824481964111, "global_step": 163635, "epoch": 3896} {"train_loss": -6.945914268493652, "global_step": 163636, "epoch": 3896} {"train_loss": -7.019801139831543, "global_step": 163637, "epoch": 3896} {"train_loss": -7.024994373321533, "global_step": 163638, "epoch": 3896} {"train_loss": -6.994108200073242, "global_step": 163639, "epoch": 3896} {"train_loss": -6.9896559715271, "global_step": 163640, "epoch": 3896} {"train_loss": -6.917943000793457, "global_step": 163641, "epoch": 3896} {"train_loss": -6.8205976486206055, "global_step": 163642, "epoch": 3896} {"train_loss": -6.997762203216553, "global_step": 163643, "epoch": 3896} {"train_loss": -6.968535900115967, "global_step": 163644, "epoch": 3896} {"train_loss": -6.992314338684082, "global_step": 163645, "epoch": 3896} {"train_loss": -6.894274711608887, "global_step": 163646, "epoch": 3896} {"train_loss": -6.944319248199463, "global_step": 163647, "epoch": 3896} {"train_loss": -6.969419479370117, "global_step": 163648, "epoch": 3896} {"train_loss": -7.047065258026123, "global_step": 163649, "epoch": 3896} {"train_loss": -7.035092830657959, "global_step": 163650, "epoch": 3896} {"train_loss": -6.9397172927856445, "global_step": 163651, "epoch": 3896} {"train_loss": -6.875949382781982, "global_step": 163652, "epoch": 3896} {"train_loss": -7.0124831199646, "global_step": 163653, "epoch": 3896} {"train_loss": -7.068593978881836, "global_step": 163654, "epoch": 3896} {"train_loss": -7.009521484375, "global_step": 163655, "epoch": 3896} {"train_loss": -7.027841567993164, "global_step": 163656, "epoch": 3896} {"train_loss": -6.949652194976807, "global_step": 163657, "epoch": 3896} {"train_loss": -6.968160152435303, "global_step": 163658, "epoch": 3896} {"train_loss": -7.042695999145508, "global_step": 163659, "epoch": 3896} {"train_loss": -7.007863521575928, "global_step": 163660, "epoch": 3896} {"train_loss": -7.024216651916504, "global_step": 163661, "epoch": 3896} {"train_loss": -7.054176330566406, "global_step": 163662, "epoch": 3896} {"train_loss": -6.956809043884277, "global_step": 163663, "epoch": 3896} {"train_loss": -6.973274230957031, "global_step": 163664, "epoch": 3896} {"train_loss": -6.875587463378906, "global_step": 163665, "epoch": 3896} {"train_loss": -6.9380106925964355, "global_step": 163666, "epoch": 3896} {"train_loss": -6.958416938781738, "global_step": 163667, "epoch": 3896} {"train_loss": -7.0136590003967285, "global_step": 163668, "epoch": 3896} {"train_loss": -6.854421615600586, "global_step": 163669, "epoch": 3896} {"train_loss": -6.981457233428955, "global_step": 163670, "epoch": 3896} {"train_loss": -6.919591903686523, "global_step": 163671, "epoch": 3896} {"train_loss": -6.785213470458984, "global_step": 163672, "epoch": 3896} {"train_loss": -6.966098592394874, "global_step": 163673, "epoch": 3896, "val_loss": 68502.46875} {"train_loss": -6.870091438293457, "global_step": 163674, "epoch": 3897} {"train_loss": -6.807409286499023, "global_step": 163675, "epoch": 3897} {"train_loss": -6.821890830993652, "global_step": 163676, "epoch": 3897} {"train_loss": -6.934211254119873, "global_step": 163677, "epoch": 3897} {"train_loss": -6.783061504364014, "global_step": 163678, "epoch": 3897} {"train_loss": -6.643708229064941, "global_step": 163679, "epoch": 3897} {"train_loss": -6.802342891693115, "global_step": 163680, "epoch": 3897} {"train_loss": -6.811382293701172, "global_step": 163681, "epoch": 3897} {"train_loss": -6.808927536010742, "global_step": 163682, "epoch": 3897} {"train_loss": -6.830931663513184, "global_step": 163683, "epoch": 3897} {"train_loss": -6.855443000793457, "global_step": 163684, "epoch": 3897} {"train_loss": -6.920742034912109, "global_step": 163685, "epoch": 3897} {"train_loss": -6.623538970947266, "global_step": 163686, "epoch": 3897} {"train_loss": -6.90748929977417, "global_step": 163687, "epoch": 3897} {"train_loss": -6.642729759216309, "global_step": 163688, "epoch": 3897} {"train_loss": -6.810895919799805, "global_step": 163689, "epoch": 3897} {"train_loss": -6.739604949951172, "global_step": 163690, "epoch": 3897} {"train_loss": -6.741981506347656, "global_step": 163691, "epoch": 3897} {"train_loss": -6.827419281005859, "global_step": 163692, "epoch": 3897} {"train_loss": -6.782391548156738, "global_step": 163693, "epoch": 3897} {"train_loss": -6.85464334487915, "global_step": 163694, "epoch": 3897} {"train_loss": -6.797959804534912, "global_step": 163695, "epoch": 3897} {"train_loss": -6.905909538269043, "global_step": 163696, "epoch": 3897} {"train_loss": -6.896371841430664, "global_step": 163697, "epoch": 3897} {"train_loss": -6.880718231201172, "global_step": 163698, "epoch": 3897} {"train_loss": -6.7498884201049805, "global_step": 163699, "epoch": 3897} {"train_loss": -6.974501609802246, "global_step": 163700, "epoch": 3897} {"train_loss": -6.8162641525268555, "global_step": 163701, "epoch": 3897} {"train_loss": -6.792770862579346, "global_step": 163702, "epoch": 3897} {"train_loss": -6.757454872131348, "global_step": 163703, "epoch": 3897} {"train_loss": -6.944262504577637, "global_step": 163704, "epoch": 3897} {"train_loss": -6.873116493225098, "global_step": 163705, "epoch": 3897} {"train_loss": -6.938289165496826, "global_step": 163706, "epoch": 3897} {"train_loss": -6.893680095672607, "global_step": 163707, "epoch": 3897} {"train_loss": -6.8454790115356445, "global_step": 163708, "epoch": 3897} {"train_loss": -7.045681953430176, "global_step": 163709, "epoch": 3897} {"train_loss": -6.884542465209961, "global_step": 163710, "epoch": 3897} {"train_loss": -6.851936340332031, "global_step": 163711, "epoch": 3897} {"train_loss": -7.013827323913574, "global_step": 163712, "epoch": 3897} {"train_loss": -6.838247299194336, "global_step": 163713, "epoch": 3897} {"train_loss": -6.921022891998291, "global_step": 163714, "epoch": 3897} {"train_loss": -6.840226638884771, "global_step": 163715, "epoch": 3897, "val_loss": 68405.6796875} {"train_loss": -6.8867292404174805, "global_step": 163716, "epoch": 3898} {"train_loss": -6.980936527252197, "global_step": 163717, "epoch": 3898} {"train_loss": -6.906037330627441, "global_step": 163718, "epoch": 3898} {"train_loss": -6.945245265960693, "global_step": 163719, "epoch": 3898} {"train_loss": -6.953707695007324, "global_step": 163720, "epoch": 3898} {"train_loss": -6.904269218444824, "global_step": 163721, "epoch": 3898} {"train_loss": -6.84815788269043, "global_step": 163722, "epoch": 3898} {"train_loss": -6.984311103820801, "global_step": 163723, "epoch": 3898} {"train_loss": -6.918449401855469, "global_step": 163724, "epoch": 3898} {"train_loss": -6.958618640899658, "global_step": 163725, "epoch": 3898} {"train_loss": -6.96193790435791, "global_step": 163726, "epoch": 3898} {"train_loss": -6.956648826599121, "global_step": 163727, "epoch": 3898} {"train_loss": -6.985705852508545, "global_step": 163728, "epoch": 3898} {"train_loss": -6.92398738861084, "global_step": 163729, "epoch": 3898} {"train_loss": -7.011528491973877, "global_step": 163730, "epoch": 3898} {"train_loss": -6.978189468383789, "global_step": 163731, "epoch": 3898} {"train_loss": -6.873103618621826, "global_step": 163732, "epoch": 3898} {"train_loss": -6.879377365112305, "global_step": 163733, "epoch": 3898} {"train_loss": -6.999113082885742, "global_step": 163734, "epoch": 3898} {"train_loss": -6.898776054382324, "global_step": 163735, "epoch": 3898} {"train_loss": -7.0459394454956055, "global_step": 163736, "epoch": 3898} {"train_loss": -7.000364303588867, "global_step": 163737, "epoch": 3898} {"train_loss": -7.021032333374023, "global_step": 163738, "epoch": 3898} {"train_loss": -6.967502117156982, "global_step": 163739, "epoch": 3898} {"train_loss": -6.943928241729736, "global_step": 163740, "epoch": 3898} {"train_loss": -6.947463512420654, "global_step": 163741, "epoch": 3898} {"train_loss": -6.983489513397217, "global_step": 163742, "epoch": 3898} {"train_loss": -7.040118217468262, "global_step": 163743, "epoch": 3898} {"train_loss": -6.993349075317383, "global_step": 163744, "epoch": 3898} {"train_loss": -7.000123977661133, "global_step": 163745, "epoch": 3898} {"train_loss": -7.016092300415039, "global_step": 163746, "epoch": 3898} {"train_loss": -7.109248638153076, "global_step": 163747, "epoch": 3898} {"train_loss": -6.963312149047852, "global_step": 163748, "epoch": 3898} {"train_loss": -6.983309745788574, "global_step": 163749, "epoch": 3898} {"train_loss": -6.863874435424805, "global_step": 163750, "epoch": 3898} {"train_loss": -6.962197780609131, "global_step": 163751, "epoch": 3898} {"train_loss": -6.89481258392334, "global_step": 163752, "epoch": 3898} {"train_loss": -6.865200519561768, "global_step": 163753, "epoch": 3898} {"train_loss": -7.04759407043457, "global_step": 163754, "epoch": 3898} {"train_loss": -7.022480487823486, "global_step": 163755, "epoch": 3898} {"train_loss": -6.913476943969727, "global_step": 163756, "epoch": 3898} {"train_loss": -6.958820218131656, "global_step": 163757, "epoch": 3898, "val_loss": 68520.0859375} {"train_loss": -6.937677383422852, "global_step": 163758, "epoch": 3899} {"train_loss": -6.871193885803223, "global_step": 163759, "epoch": 3899} {"train_loss": -6.9715681076049805, "global_step": 163760, "epoch": 3899} {"train_loss": -6.875213623046875, "global_step": 163761, "epoch": 3899} {"train_loss": -7.053654670715332, "global_step": 163762, "epoch": 3899} {"train_loss": -6.87479305267334, "global_step": 163763, "epoch": 3899} {"train_loss": -6.820042610168457, "global_step": 163764, "epoch": 3899} {"train_loss": -6.898793697357178, "global_step": 163765, "epoch": 3899} {"train_loss": -6.799283981323242, "global_step": 163766, "epoch": 3899} {"train_loss": -6.839348793029785, "global_step": 163767, "epoch": 3899} {"train_loss": -6.985215663909912, "global_step": 163768, "epoch": 3899} {"train_loss": -6.8463544845581055, "global_step": 163769, "epoch": 3899} {"train_loss": -6.7760162353515625, "global_step": 163770, "epoch": 3899} {"train_loss": -6.837095737457275, "global_step": 163771, "epoch": 3899} {"train_loss": -6.881043910980225, "global_step": 163772, "epoch": 3899} {"train_loss": -6.993997573852539, "global_step": 163773, "epoch": 3899} {"train_loss": -6.92606258392334, "global_step": 163774, "epoch": 3899} {"train_loss": -6.912388801574707, "global_step": 163775, "epoch": 3899} {"train_loss": -6.859052658081055, "global_step": 163776, "epoch": 3899} {"train_loss": -6.980996131896973, "global_step": 163777, "epoch": 3899} {"train_loss": -6.965790271759033, "global_step": 163778, "epoch": 3899} {"train_loss": -6.868878364562988, "global_step": 163779, "epoch": 3899} {"train_loss": -6.897792816162109, "global_step": 163780, "epoch": 3899} {"train_loss": -6.9483819007873535, "global_step": 163781, "epoch": 3899} {"train_loss": -6.85150146484375, "global_step": 163782, "epoch": 3899} {"train_loss": -6.94863748550415, "global_step": 163783, "epoch": 3899} {"train_loss": -6.831235408782959, "global_step": 163784, "epoch": 3899} {"train_loss": -6.927774429321289, "global_step": 163785, "epoch": 3899} {"train_loss": -6.902521133422852, "global_step": 163786, "epoch": 3899} {"train_loss": -6.8787665367126465, "global_step": 163787, "epoch": 3899} {"train_loss": -6.980719566345215, "global_step": 163788, "epoch": 3899} {"train_loss": -6.8786163330078125, "global_step": 163789, "epoch": 3899} {"train_loss": -6.948969841003418, "global_step": 163790, "epoch": 3899} {"train_loss": -6.829625129699707, "global_step": 163791, "epoch": 3899} {"train_loss": -6.906261920928955, "global_step": 163792, "epoch": 3899} {"train_loss": -6.968287467956543, "global_step": 163793, "epoch": 3899} {"train_loss": -6.809243202209473, "global_step": 163794, "epoch": 3899} {"train_loss": -6.911639213562012, "global_step": 163795, "epoch": 3899} {"train_loss": -6.687786102294922, "global_step": 163796, "epoch": 3899} {"train_loss": -6.888104438781738, "global_step": 163797, "epoch": 3899} {"train_loss": -6.835997104644775, "global_step": 163798, "epoch": 3899} {"train_loss": -6.890997705005464, "global_step": 163799, "epoch": 3899, "val_loss": 68601.8359375} {"train_loss": -6.905555725097656, "global_step": 163800, "epoch": 3900} {"train_loss": -6.932285785675049, "global_step": 163801, "epoch": 3900} {"train_loss": -6.995296955108643, "global_step": 163802, "epoch": 3900} {"train_loss": -6.828667640686035, "global_step": 163803, "epoch": 3900} {"train_loss": -6.839962005615234, "global_step": 163804, "epoch": 3900} {"train_loss": -6.795299530029297, "global_step": 163805, "epoch": 3900} {"train_loss": -6.918396949768066, "global_step": 163806, "epoch": 3900} {"train_loss": -6.946521759033203, "global_step": 163807, "epoch": 3900} {"train_loss": -6.882221221923828, "global_step": 163808, "epoch": 3900} {"train_loss": -6.978528022766113, "global_step": 163809, "epoch": 3900} {"train_loss": -6.896133899688721, "global_step": 163810, "epoch": 3900} {"train_loss": -6.904956817626953, "global_step": 163811, "epoch": 3900} {"train_loss": -6.920583248138428, "global_step": 163812, "epoch": 3900} {"train_loss": -6.959403038024902, "global_step": 163813, "epoch": 3900} {"train_loss": -6.855198860168457, "global_step": 163814, "epoch": 3900} {"train_loss": -6.88189697265625, "global_step": 163815, "epoch": 3900} {"train_loss": -6.813872337341309, "global_step": 163816, "epoch": 3900} {"train_loss": -6.939439296722412, "global_step": 163817, "epoch": 3900} {"train_loss": -6.931338787078857, "global_step": 163818, "epoch": 3900} {"train_loss": -6.946020126342773, "global_step": 163819, "epoch": 3900} {"train_loss": -6.871276378631592, "global_step": 163820, "epoch": 3900} {"train_loss": -6.837474822998047, "global_step": 163821, "epoch": 3900} {"train_loss": -6.962823867797852, "global_step": 163822, "epoch": 3900} {"train_loss": -6.8418474197387695, "global_step": 163823, "epoch": 3900} {"train_loss": -6.94891357421875, "global_step": 163824, "epoch": 3900} {"train_loss": -6.960505485534668, "global_step": 163825, "epoch": 3900} {"train_loss": -6.945652961730957, "global_step": 163826, "epoch": 3900} {"train_loss": -6.873945713043213, "global_step": 163827, "epoch": 3900} {"train_loss": -6.901289939880371, "global_step": 163828, "epoch": 3900} {"train_loss": -6.9297003746032715, "global_step": 163829, "epoch": 3900} {"train_loss": -6.9220685958862305, "global_step": 163830, "epoch": 3900} {"train_loss": -6.858471393585205, "global_step": 163831, "epoch": 3900} {"train_loss": -6.935787200927734, "global_step": 163832, "epoch": 3900} {"train_loss": -6.9248247146606445, "global_step": 163833, "epoch": 3900} {"train_loss": -6.907471656799316, "global_step": 163834, "epoch": 3900} {"train_loss": -6.889281272888184, "global_step": 163835, "epoch": 3900} {"train_loss": -6.901615142822266, "global_step": 163836, "epoch": 3900} {"train_loss": -7.000730991363525, "global_step": 163837, "epoch": 3900} {"train_loss": -6.944361686706543, "global_step": 163838, "epoch": 3900} {"train_loss": -6.872673034667969, "global_step": 163839, "epoch": 3900} {"train_loss": -6.812981605529785, "global_step": 163840, "epoch": 3900} {"train_loss": -6.904143526440575, "global_step": 163841, "epoch": 3900, "train/sim_max_reward_0": 0.2131269472356992, "train/sim_max_reward_1": 0.9302015381998079, "train/sim_max_reward_2": 0.5998900041674902, "train/sim_max_reward_3": 0.13138629916844038, "train/sim_max_reward_4": 0.38576353770283417, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.2735609217140039, "test/sim_max_reward_4400001": 0.4105593103140002, "test/sim_max_reward_4400002": 0.9497224007722553, "test/sim_max_reward_4400003": 0.9600990167086086, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9730011131631944, "test/sim_max_reward_4400006": 0.905783321491592, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.3001883234102108, "test/sim_max_reward_4400009": 0.744359233474038, "test/sim_max_reward_4400010": 0.3228273451305008, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9205049790857578, "test/sim_max_reward_4400013": 0.36567821862956024, "test/sim_max_reward_4400014": 0.9938567477905067, "test/sim_max_reward_4400015": 0.05372440661672362, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.26602451805645255, "test/sim_max_reward_4400019": 0.8955515101464745, "test/sim_max_reward_4400020": 0.9671938209136063, "test/sim_max_reward_4400021": 0.8773380448074155, "test/sim_max_reward_4400022": 0.2974591878881145, "test/sim_max_reward_4400023": 0.9800988621457679, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2605415453106675, "test/sim_max_reward_4400026": 0.8377988614053026, "test/sim_max_reward_4400027": 0.03219608061698624, "test/sim_max_reward_4400028": 0.7743123239735661, "test/sim_max_reward_4400029": 0.7729377172276767, "test/sim_max_reward_4400030": 0.9807683892536865, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9324180799891002, "test/sim_max_reward_4400034": 0.9061513833222552, "test/sim_max_reward_4400035": 0.9551569907659628, "test/sim_max_reward_4400036": 0.3746721797926219, "test/sim_max_reward_4400037": 0.9240135658887816, "test/sim_max_reward_4400038": 0.9405377712401216, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9838063028286956, "test/sim_max_reward_4400042": 0.8743813611396651, "test/sim_max_reward_4400043": 0.9051777606075502, "test/sim_max_reward_4400044": 0.9785226578154466, "test/sim_max_reward_4400045": 0.9930836655918615, "test/sim_max_reward_4400046": 0.8741269888332127, "test/sim_max_reward_4400047": 0.8557979490112136, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.4088921809727432, "test/mean_score": 0.6273579309463945, "val_loss": 68503.2578125} {"train_loss": -6.933225631713867, "global_step": 163842, "epoch": 3901} {"train_loss": -6.895403861999512, "global_step": 163843, "epoch": 3901} {"train_loss": -6.915345668792725, "global_step": 163844, "epoch": 3901} {"train_loss": -6.868109703063965, "global_step": 163845, "epoch": 3901} {"train_loss": -6.8902201652526855, "global_step": 163846, "epoch": 3901} {"train_loss": -6.853604316711426, "global_step": 163847, "epoch": 3901} {"train_loss": -6.870763301849365, "global_step": 163848, "epoch": 3901} {"train_loss": -6.887396812438965, "global_step": 163849, "epoch": 3901} {"train_loss": -6.940923690795898, "global_step": 163850, "epoch": 3901} {"train_loss": -7.0453081130981445, "global_step": 163851, "epoch": 3901} {"train_loss": -6.810826778411865, "global_step": 163852, "epoch": 3901} {"train_loss": -6.85668420791626, "global_step": 163853, "epoch": 3901} {"train_loss": -7.001812934875488, "global_step": 163854, "epoch": 3901} {"train_loss": -6.772762298583984, "global_step": 163855, "epoch": 3901} {"train_loss": -6.942543029785156, "global_step": 163856, "epoch": 3901} {"train_loss": -6.920781135559082, "global_step": 163857, "epoch": 3901} {"train_loss": -6.838718414306641, "global_step": 163858, "epoch": 3901} {"train_loss": -7.029592037200928, "global_step": 163859, "epoch": 3901} {"train_loss": -6.895451068878174, "global_step": 163860, "epoch": 3901} {"train_loss": -6.945306777954102, "global_step": 163861, "epoch": 3901} {"train_loss": -6.959169387817383, "global_step": 163862, "epoch": 3901} {"train_loss": -6.928279399871826, "global_step": 163863, "epoch": 3901} {"train_loss": -6.986599922180176, "global_step": 163864, "epoch": 3901} {"train_loss": -6.953899383544922, "global_step": 163865, "epoch": 3901} {"train_loss": -6.986489295959473, "global_step": 163866, "epoch": 3901} {"train_loss": -7.0367207527160645, "global_step": 163867, "epoch": 3901} {"train_loss": -6.991308689117432, "global_step": 163868, "epoch": 3901} {"train_loss": -6.9674272537231445, "global_step": 163869, "epoch": 3901} {"train_loss": -6.922872543334961, "global_step": 163870, "epoch": 3901} {"train_loss": -6.983613014221191, "global_step": 163871, "epoch": 3901} {"train_loss": -6.945826530456543, "global_step": 163872, "epoch": 3901} {"train_loss": -6.927696228027344, "global_step": 163873, "epoch": 3901} {"train_loss": -6.92470645904541, "global_step": 163874, "epoch": 3901} {"train_loss": -6.923293590545654, "global_step": 163875, "epoch": 3901} {"train_loss": -6.9622578620910645, "global_step": 163876, "epoch": 3901} {"train_loss": -6.987095832824707, "global_step": 163877, "epoch": 3901} {"train_loss": -6.886101722717285, "global_step": 163878, "epoch": 3901} {"train_loss": -6.91734504699707, "global_step": 163879, "epoch": 3901} {"train_loss": -6.936888694763184, "global_step": 163880, "epoch": 3901} {"train_loss": -6.888092041015625, "global_step": 163881, "epoch": 3901} {"train_loss": -6.917938232421875, "global_step": 163882, "epoch": 3901} {"train_loss": -6.926724445252192, "global_step": 163883, "epoch": 3901, "val_loss": 68552.96875} {"train_loss": -6.834559917449951, "global_step": 163884, "epoch": 3902} {"train_loss": -6.849416732788086, "global_step": 163885, "epoch": 3902} {"train_loss": -6.886782169342041, "global_step": 163886, "epoch": 3902} {"train_loss": -6.835755348205566, "global_step": 163887, "epoch": 3902} {"train_loss": -6.862480163574219, "global_step": 163888, "epoch": 3902} {"train_loss": -6.941440582275391, "global_step": 163889, "epoch": 3902} {"train_loss": -6.949193000793457, "global_step": 163890, "epoch": 3902} {"train_loss": -6.924887657165527, "global_step": 163891, "epoch": 3902} {"train_loss": -6.917604446411133, "global_step": 163892, "epoch": 3902} {"train_loss": -6.875300407409668, "global_step": 163893, "epoch": 3902} {"train_loss": -6.947352409362793, "global_step": 163894, "epoch": 3902} {"train_loss": -6.897649765014648, "global_step": 163895, "epoch": 3902} {"train_loss": -6.810993194580078, "global_step": 163896, "epoch": 3902} {"train_loss": -6.89255428314209, "global_step": 163897, "epoch": 3902} {"train_loss": -6.878002643585205, "global_step": 163898, "epoch": 3902} {"train_loss": -6.832033157348633, "global_step": 163899, "epoch": 3902} {"train_loss": -6.905750274658203, "global_step": 163900, "epoch": 3902} {"train_loss": -6.956156253814697, "global_step": 163901, "epoch": 3902} {"train_loss": -6.885776519775391, "global_step": 163902, "epoch": 3902} {"train_loss": -6.993602275848389, "global_step": 163903, "epoch": 3902} {"train_loss": -6.997006416320801, "global_step": 163904, "epoch": 3902} {"train_loss": -6.797251224517822, "global_step": 163905, "epoch": 3902} {"train_loss": -6.913426399230957, "global_step": 163906, "epoch": 3902} {"train_loss": -6.9262285232543945, "global_step": 163907, "epoch": 3902} {"train_loss": -6.8930840492248535, "global_step": 163908, "epoch": 3902} {"train_loss": -7.016434669494629, "global_step": 163909, "epoch": 3902} {"train_loss": -6.899709701538086, "global_step": 163910, "epoch": 3902} {"train_loss": -6.80426025390625, "global_step": 163911, "epoch": 3902} {"train_loss": -7.053755283355713, "global_step": 163912, "epoch": 3902} {"train_loss": -6.9048919677734375, "global_step": 163913, "epoch": 3902} {"train_loss": -6.735640525817871, "global_step": 163914, "epoch": 3902} {"train_loss": -6.961025714874268, "global_step": 163915, "epoch": 3902} {"train_loss": -6.957083702087402, "global_step": 163916, "epoch": 3902} {"train_loss": -7.071878433227539, "global_step": 163917, "epoch": 3902} {"train_loss": -6.994889736175537, "global_step": 163918, "epoch": 3902} {"train_loss": -6.990544319152832, "global_step": 163919, "epoch": 3902} {"train_loss": -6.934908390045166, "global_step": 163920, "epoch": 3902} {"train_loss": -6.878421783447266, "global_step": 163921, "epoch": 3902} {"train_loss": -6.90504264831543, "global_step": 163922, "epoch": 3902} {"train_loss": -6.7421770095825195, "global_step": 163923, "epoch": 3902} {"train_loss": -6.9468607902526855, "global_step": 163924, "epoch": 3902} {"train_loss": -6.907513096219017, "global_step": 163925, "epoch": 3902, "val_loss": 68369.0625} {"train_loss": -6.798727989196777, "global_step": 163926, "epoch": 3903} {"train_loss": -7.068833827972412, "global_step": 163927, "epoch": 3903} {"train_loss": -6.957941055297852, "global_step": 163928, "epoch": 3903} {"train_loss": -6.748233318328857, "global_step": 163929, "epoch": 3903} {"train_loss": -6.884475231170654, "global_step": 163930, "epoch": 3903} {"train_loss": -6.993455410003662, "global_step": 163931, "epoch": 3903} {"train_loss": -6.886305809020996, "global_step": 163932, "epoch": 3903} {"train_loss": -6.925456523895264, "global_step": 163933, "epoch": 3903} {"train_loss": -6.926792144775391, "global_step": 163934, "epoch": 3903} {"train_loss": -6.9903411865234375, "global_step": 163935, "epoch": 3903} {"train_loss": -6.908920764923096, "global_step": 163936, "epoch": 3903} {"train_loss": -6.940665245056152, "global_step": 163937, "epoch": 3903} {"train_loss": -6.900596618652344, "global_step": 163938, "epoch": 3903} {"train_loss": -6.849893569946289, "global_step": 163939, "epoch": 3903} {"train_loss": -6.905187606811523, "global_step": 163940, "epoch": 3903} {"train_loss": -6.824538230895996, "global_step": 163941, "epoch": 3903} {"train_loss": -6.907711505889893, "global_step": 163942, "epoch": 3903} {"train_loss": -6.944133281707764, "global_step": 163943, "epoch": 3903} {"train_loss": -6.966676235198975, "global_step": 163944, "epoch": 3903} {"train_loss": -6.82679557800293, "global_step": 163945, "epoch": 3903} {"train_loss": -6.8492631912231445, "global_step": 163946, "epoch": 3903} {"train_loss": -6.852357864379883, "global_step": 163947, "epoch": 3903} {"train_loss": -6.941064834594727, "global_step": 163948, "epoch": 3903} {"train_loss": -6.921965599060059, "global_step": 163949, "epoch": 3903} {"train_loss": -6.882417678833008, "global_step": 163950, "epoch": 3903} {"train_loss": -6.950407028198242, "global_step": 163951, "epoch": 3903} {"train_loss": -6.9303975105285645, "global_step": 163952, "epoch": 3903} {"train_loss": -6.9545722007751465, "global_step": 163953, "epoch": 3903} {"train_loss": -6.8643059730529785, "global_step": 163954, "epoch": 3903} {"train_loss": -6.884206771850586, "global_step": 163955, "epoch": 3903} {"train_loss": -6.886326789855957, "global_step": 163956, "epoch": 3903} {"train_loss": -6.975310325622559, "global_step": 163957, "epoch": 3903} {"train_loss": -6.933276653289795, "global_step": 163958, "epoch": 3903} {"train_loss": -6.945761680603027, "global_step": 163959, "epoch": 3903} {"train_loss": -6.951834201812744, "global_step": 163960, "epoch": 3903} {"train_loss": -6.9829421043396, "global_step": 163961, "epoch": 3903} {"train_loss": -6.9033637046813965, "global_step": 163962, "epoch": 3903} {"train_loss": -6.941077709197998, "global_step": 163963, "epoch": 3903} {"train_loss": -6.884810447692871, "global_step": 163964, "epoch": 3903} {"train_loss": -6.890862464904785, "global_step": 163965, "epoch": 3903} {"train_loss": -6.848207473754883, "global_step": 163966, "epoch": 3903} {"train_loss": -6.910732076281593, "global_step": 163967, "epoch": 3903, "val_loss": 68498.734375} {"train_loss": -6.863901615142822, "global_step": 163968, "epoch": 3904} {"train_loss": -6.921735763549805, "global_step": 163969, "epoch": 3904} {"train_loss": -6.907560348510742, "global_step": 163970, "epoch": 3904} {"train_loss": -6.9964599609375, "global_step": 163971, "epoch": 3904} {"train_loss": -6.988132476806641, "global_step": 163972, "epoch": 3904} {"train_loss": -6.890688896179199, "global_step": 163973, "epoch": 3904} {"train_loss": -6.864371299743652, "global_step": 163974, "epoch": 3904} {"train_loss": -6.964767932891846, "global_step": 163975, "epoch": 3904} {"train_loss": -6.920953750610352, "global_step": 163976, "epoch": 3904} {"train_loss": -7.017486572265625, "global_step": 163977, "epoch": 3904} {"train_loss": -6.89785099029541, "global_step": 163978, "epoch": 3904} {"train_loss": -6.957276344299316, "global_step": 163979, "epoch": 3904} {"train_loss": -6.978107452392578, "global_step": 163980, "epoch": 3904} {"train_loss": -6.998185634613037, "global_step": 163981, "epoch": 3904} {"train_loss": -6.974973201751709, "global_step": 163982, "epoch": 3904} {"train_loss": -6.881382942199707, "global_step": 163983, "epoch": 3904} {"train_loss": -6.943744659423828, "global_step": 163984, "epoch": 3904} {"train_loss": -6.871123313903809, "global_step": 163985, "epoch": 3904} {"train_loss": -6.995255470275879, "global_step": 163986, "epoch": 3904} {"train_loss": -7.035970211029053, "global_step": 163987, "epoch": 3904} {"train_loss": -6.849510192871094, "global_step": 163988, "epoch": 3904} {"train_loss": -6.979852676391602, "global_step": 163989, "epoch": 3904} {"train_loss": -6.927740097045898, "global_step": 163990, "epoch": 3904} {"train_loss": -6.872363090515137, "global_step": 163991, "epoch": 3904} {"train_loss": -6.797675609588623, "global_step": 163992, "epoch": 3904} {"train_loss": -6.9232988357543945, "global_step": 163993, "epoch": 3904} {"train_loss": -6.998891353607178, "global_step": 163994, "epoch": 3904} {"train_loss": -6.850606918334961, "global_step": 163995, "epoch": 3904} {"train_loss": -6.886430740356445, "global_step": 163996, "epoch": 3904} {"train_loss": -6.871653079986572, "global_step": 163997, "epoch": 3904} {"train_loss": -6.739771842956543, "global_step": 163998, "epoch": 3904} {"train_loss": -6.8086934089660645, "global_step": 163999, "epoch": 3904} {"train_loss": -6.805291175842285, "global_step": 164000, "epoch": 3904} {"train_loss": -6.893855094909668, "global_step": 164001, "epoch": 3904} {"train_loss": -6.853171348571777, "global_step": 164002, "epoch": 3904} {"train_loss": -6.810378074645996, "global_step": 164003, "epoch": 3904} {"train_loss": -6.665544509887695, "global_step": 164004, "epoch": 3904} {"train_loss": -6.67341947555542, "global_step": 164005, "epoch": 3904} {"train_loss": -6.84195613861084, "global_step": 164006, "epoch": 3904} {"train_loss": -6.6811041831970215, "global_step": 164007, "epoch": 3904} {"train_loss": -6.895528793334961, "global_step": 164008, "epoch": 3904} {"train_loss": -6.881570850099836, "global_step": 164009, "epoch": 3904, "val_loss": 68580.6640625} {"train_loss": -6.76423454284668, "global_step": 164010, "epoch": 3905} {"train_loss": -6.701240062713623, "global_step": 164011, "epoch": 3905} {"train_loss": -6.74207878112793, "global_step": 164012, "epoch": 3905} {"train_loss": -6.797405242919922, "global_step": 164013, "epoch": 3905} {"train_loss": -6.724074363708496, "global_step": 164014, "epoch": 3905} {"train_loss": -6.808224678039551, "global_step": 164015, "epoch": 3905} {"train_loss": -6.5877203941345215, "global_step": 164016, "epoch": 3905} {"train_loss": -6.784977912902832, "global_step": 164017, "epoch": 3905} {"train_loss": -6.697985649108887, "global_step": 164018, "epoch": 3905} {"train_loss": -6.787559986114502, "global_step": 164019, "epoch": 3905} {"train_loss": -6.678542137145996, "global_step": 164020, "epoch": 3905} {"train_loss": -6.772484302520752, "global_step": 164021, "epoch": 3905} {"train_loss": -6.735023498535156, "global_step": 164022, "epoch": 3905} {"train_loss": -6.790499687194824, "global_step": 164023, "epoch": 3905} {"train_loss": -6.874907970428467, "global_step": 164024, "epoch": 3905} {"train_loss": -6.605254650115967, "global_step": 164025, "epoch": 3905} {"train_loss": -6.766861438751221, "global_step": 164026, "epoch": 3905} {"train_loss": -6.808931827545166, "global_step": 164027, "epoch": 3905} {"train_loss": -6.861089706420898, "global_step": 164028, "epoch": 3905} {"train_loss": -6.710037708282471, "global_step": 164029, "epoch": 3905} {"train_loss": -6.834750652313232, "global_step": 164030, "epoch": 3905} {"train_loss": -6.86544132232666, "global_step": 164031, "epoch": 3905} {"train_loss": -6.889057159423828, "global_step": 164032, "epoch": 3905} {"train_loss": -6.896401405334473, "global_step": 164033, "epoch": 3905} {"train_loss": -6.803186416625977, "global_step": 164034, "epoch": 3905} {"train_loss": -6.933391094207764, "global_step": 164035, "epoch": 3905} {"train_loss": -6.938762187957764, "global_step": 164036, "epoch": 3905} {"train_loss": -6.960864067077637, "global_step": 164037, "epoch": 3905} {"train_loss": -6.806354522705078, "global_step": 164038, "epoch": 3905} {"train_loss": -6.893646240234375, "global_step": 164039, "epoch": 3905} {"train_loss": -6.833618640899658, "global_step": 164040, "epoch": 3905} {"train_loss": -6.9167680740356445, "global_step": 164041, "epoch": 3905} {"train_loss": -6.890186309814453, "global_step": 164042, "epoch": 3905} {"train_loss": -7.053229331970215, "global_step": 164043, "epoch": 3905} {"train_loss": -6.82432746887207, "global_step": 164044, "epoch": 3905} {"train_loss": -7.00230598449707, "global_step": 164045, "epoch": 3905} {"train_loss": -6.917834758758545, "global_step": 164046, "epoch": 3905} {"train_loss": -6.88591194152832, "global_step": 164047, "epoch": 3905} {"train_loss": -6.877694129943848, "global_step": 164048, "epoch": 3905} {"train_loss": -6.926731109619141, "global_step": 164049, "epoch": 3905} {"train_loss": -7.045036792755127, "global_step": 164050, "epoch": 3905} {"train_loss": -6.832879486538115, "global_step": 164051, "epoch": 3905, "val_loss": 68500.6953125} {"train_loss": -6.944371700286865, "global_step": 164052, "epoch": 3906} {"train_loss": -6.968020439147949, "global_step": 164053, "epoch": 3906} {"train_loss": -6.895919322967529, "global_step": 164054, "epoch": 3906} {"train_loss": -6.947176456451416, "global_step": 164055, "epoch": 3906} {"train_loss": -6.9962005615234375, "global_step": 164056, "epoch": 3906} {"train_loss": -6.96180534362793, "global_step": 164057, "epoch": 3906} {"train_loss": -6.777415752410889, "global_step": 164058, "epoch": 3906} {"train_loss": -6.999762535095215, "global_step": 164059, "epoch": 3906} {"train_loss": -6.958921432495117, "global_step": 164060, "epoch": 3906} {"train_loss": -6.89533805847168, "global_step": 164061, "epoch": 3906} {"train_loss": -6.962339401245117, "global_step": 164062, "epoch": 3906} {"train_loss": -6.879157543182373, "global_step": 164063, "epoch": 3906} {"train_loss": -6.805441856384277, "global_step": 164064, "epoch": 3906} {"train_loss": -7.0389885902404785, "global_step": 164065, "epoch": 3906} {"train_loss": -7.025985240936279, "global_step": 164066, "epoch": 3906} {"train_loss": -6.956025123596191, "global_step": 164067, "epoch": 3906} {"train_loss": -6.900552749633789, "global_step": 164068, "epoch": 3906} {"train_loss": -7.023252964019775, "global_step": 164069, "epoch": 3906} {"train_loss": -6.9592604637146, "global_step": 164070, "epoch": 3906} {"train_loss": -6.969594955444336, "global_step": 164071, "epoch": 3906} {"train_loss": -7.0080976486206055, "global_step": 164072, "epoch": 3906} {"train_loss": -6.916255950927734, "global_step": 164073, "epoch": 3906} {"train_loss": -7.076436519622803, "global_step": 164074, "epoch": 3906} {"train_loss": -6.94495153427124, "global_step": 164075, "epoch": 3906} {"train_loss": -7.029208183288574, "global_step": 164076, "epoch": 3906} {"train_loss": -6.9566521644592285, "global_step": 164077, "epoch": 3906} {"train_loss": -7.013864517211914, "global_step": 164078, "epoch": 3906} {"train_loss": -7.036864757537842, "global_step": 164079, "epoch": 3906} {"train_loss": -6.93351936340332, "global_step": 164080, "epoch": 3906} {"train_loss": -6.976391792297363, "global_step": 164081, "epoch": 3906} {"train_loss": -7.140730381011963, "global_step": 164082, "epoch": 3906} {"train_loss": -7.00058650970459, "global_step": 164083, "epoch": 3906} {"train_loss": -6.914761543273926, "global_step": 164084, "epoch": 3906} {"train_loss": -7.01793909072876, "global_step": 164085, "epoch": 3906} {"train_loss": -7.002103328704834, "global_step": 164086, "epoch": 3906} {"train_loss": -7.073638916015625, "global_step": 164087, "epoch": 3906} {"train_loss": -7.016180992126465, "global_step": 164088, "epoch": 3906} {"train_loss": -6.944025039672852, "global_step": 164089, "epoch": 3906} {"train_loss": -7.036036968231201, "global_step": 164090, "epoch": 3906} {"train_loss": -7.012523651123047, "global_step": 164091, "epoch": 3906} {"train_loss": -6.965091705322266, "global_step": 164092, "epoch": 3906} {"train_loss": -6.971339804785592, "global_step": 164093, "epoch": 3906, "val_loss": 68452.1640625} {"train_loss": -7.102535247802734, "global_step": 164094, "epoch": 3907} {"train_loss": -6.945459365844727, "global_step": 164095, "epoch": 3907} {"train_loss": -6.996915817260742, "global_step": 164096, "epoch": 3907} {"train_loss": -6.894926071166992, "global_step": 164097, "epoch": 3907} {"train_loss": -7.026923179626465, "global_step": 164098, "epoch": 3907} {"train_loss": -6.922633647918701, "global_step": 164099, "epoch": 3907} {"train_loss": -6.901785850524902, "global_step": 164100, "epoch": 3907} {"train_loss": -6.922060012817383, "global_step": 164101, "epoch": 3907} {"train_loss": -6.966883182525635, "global_step": 164102, "epoch": 3907} {"train_loss": -6.926244735717773, "global_step": 164103, "epoch": 3907} {"train_loss": -6.817971229553223, "global_step": 164104, "epoch": 3907} {"train_loss": -6.954184532165527, "global_step": 164105, "epoch": 3907} {"train_loss": -6.9557647705078125, "global_step": 164106, "epoch": 3907} {"train_loss": -6.747509002685547, "global_step": 164107, "epoch": 3907} {"train_loss": -7.019101142883301, "global_step": 164108, "epoch": 3907} {"train_loss": -6.926124572753906, "global_step": 164109, "epoch": 3907} {"train_loss": -6.9256110191345215, "global_step": 164110, "epoch": 3907} {"train_loss": -6.889703750610352, "global_step": 164111, "epoch": 3907} {"train_loss": -6.86957311630249, "global_step": 164112, "epoch": 3907} {"train_loss": -6.987292766571045, "global_step": 164113, "epoch": 3907} {"train_loss": -7.000905990600586, "global_step": 164114, "epoch": 3907} {"train_loss": -6.960359573364258, "global_step": 164115, "epoch": 3907} {"train_loss": -6.986118316650391, "global_step": 164116, "epoch": 3907} {"train_loss": -6.925293922424316, "global_step": 164117, "epoch": 3907} {"train_loss": -6.965991973876953, "global_step": 164118, "epoch": 3907} {"train_loss": -6.919759750366211, "global_step": 164119, "epoch": 3907} {"train_loss": -6.975081443786621, "global_step": 164120, "epoch": 3907} {"train_loss": -7.060400009155273, "global_step": 164121, "epoch": 3907} {"train_loss": -6.9948320388793945, "global_step": 164122, "epoch": 3907} {"train_loss": -6.9100494384765625, "global_step": 164123, "epoch": 3907} {"train_loss": -6.933309078216553, "global_step": 164124, "epoch": 3907} {"train_loss": -6.823148727416992, "global_step": 164125, "epoch": 3907} {"train_loss": -6.932764053344727, "global_step": 164126, "epoch": 3907} {"train_loss": -7.054469108581543, "global_step": 164127, "epoch": 3907} {"train_loss": -6.883642673492432, "global_step": 164128, "epoch": 3907} {"train_loss": -6.844357967376709, "global_step": 164129, "epoch": 3907} {"train_loss": -7.0039286613464355, "global_step": 164130, "epoch": 3907} {"train_loss": -6.927515506744385, "global_step": 164131, "epoch": 3907} {"train_loss": -6.89597225189209, "global_step": 164132, "epoch": 3907} {"train_loss": -6.916984558105469, "global_step": 164133, "epoch": 3907} {"train_loss": -6.884693145751953, "global_step": 164134, "epoch": 3907} {"train_loss": -6.936770473207746, "global_step": 164135, "epoch": 3907, "val_loss": 68601.21875} {"train_loss": -6.899805068969727, "global_step": 164136, "epoch": 3908} {"train_loss": -6.725958824157715, "global_step": 164137, "epoch": 3908} {"train_loss": -6.916945457458496, "global_step": 164138, "epoch": 3908} {"train_loss": -6.980388641357422, "global_step": 164139, "epoch": 3908} {"train_loss": -6.949994087219238, "global_step": 164140, "epoch": 3908} {"train_loss": -6.7557573318481445, "global_step": 164141, "epoch": 3908} {"train_loss": -6.76141357421875, "global_step": 164142, "epoch": 3908} {"train_loss": -6.838099479675293, "global_step": 164143, "epoch": 3908} {"train_loss": -6.912430763244629, "global_step": 164144, "epoch": 3908} {"train_loss": -6.8210272789001465, "global_step": 164145, "epoch": 3908} {"train_loss": -6.8987603187561035, "global_step": 164146, "epoch": 3908} {"train_loss": -6.9049201011657715, "global_step": 164147, "epoch": 3908} {"train_loss": -6.824804306030273, "global_step": 164148, "epoch": 3908} {"train_loss": -7.02938175201416, "global_step": 164149, "epoch": 3908} {"train_loss": -6.934162616729736, "global_step": 164150, "epoch": 3908} {"train_loss": -6.892082691192627, "global_step": 164151, "epoch": 3908} {"train_loss": -6.976016998291016, "global_step": 164152, "epoch": 3908} {"train_loss": -6.892555236816406, "global_step": 164153, "epoch": 3908} {"train_loss": -6.853961944580078, "global_step": 164154, "epoch": 3908} {"train_loss": -6.985561370849609, "global_step": 164155, "epoch": 3908} {"train_loss": -6.799376964569092, "global_step": 164156, "epoch": 3908} {"train_loss": -6.953581809997559, "global_step": 164157, "epoch": 3908} {"train_loss": -6.9432477951049805, "global_step": 164158, "epoch": 3908} {"train_loss": -6.757781028747559, "global_step": 164159, "epoch": 3908} {"train_loss": -6.9594621658325195, "global_step": 164160, "epoch": 3908} {"train_loss": -6.754817008972168, "global_step": 164161, "epoch": 3908} {"train_loss": -6.880244255065918, "global_step": 164162, "epoch": 3908} {"train_loss": -6.88630485534668, "global_step": 164163, "epoch": 3908} {"train_loss": -6.866085529327393, "global_step": 164164, "epoch": 3908} {"train_loss": -7.023340225219727, "global_step": 164165, "epoch": 3908} {"train_loss": -6.855189323425293, "global_step": 164166, "epoch": 3908} {"train_loss": -6.920834541320801, "global_step": 164167, "epoch": 3908} {"train_loss": -6.812051773071289, "global_step": 164168, "epoch": 3908} {"train_loss": -6.944601058959961, "global_step": 164169, "epoch": 3908} {"train_loss": -6.897834300994873, "global_step": 164170, "epoch": 3908} {"train_loss": -6.855695724487305, "global_step": 164171, "epoch": 3908} {"train_loss": -6.957494735717773, "global_step": 164172, "epoch": 3908} {"train_loss": -6.891313076019287, "global_step": 164173, "epoch": 3908} {"train_loss": -7.000112056732178, "global_step": 164174, "epoch": 3908} {"train_loss": -6.863645553588867, "global_step": 164175, "epoch": 3908} {"train_loss": -6.98226261138916, "global_step": 164176, "epoch": 3908} {"train_loss": -6.8919861770811535, "global_step": 164177, "epoch": 3908, "val_loss": 68594.1328125} {"train_loss": -6.946782112121582, "global_step": 164178, "epoch": 3909} {"train_loss": -7.047597885131836, "global_step": 164179, "epoch": 3909} {"train_loss": -6.8811936378479, "global_step": 164180, "epoch": 3909} {"train_loss": -7.067841053009033, "global_step": 164181, "epoch": 3909} {"train_loss": -6.890261650085449, "global_step": 164182, "epoch": 3909} {"train_loss": -6.926830291748047, "global_step": 164183, "epoch": 3909} {"train_loss": -6.963082313537598, "global_step": 164184, "epoch": 3909} {"train_loss": -6.957982063293457, "global_step": 164185, "epoch": 3909} {"train_loss": -6.900501728057861, "global_step": 164186, "epoch": 3909} {"train_loss": -6.94449520111084, "global_step": 164187, "epoch": 3909} {"train_loss": -6.898250579833984, "global_step": 164188, "epoch": 3909} {"train_loss": -6.939522743225098, "global_step": 164189, "epoch": 3909} {"train_loss": -6.909748077392578, "global_step": 164190, "epoch": 3909} {"train_loss": -6.861222267150879, "global_step": 164191, "epoch": 3909} {"train_loss": -6.923127174377441, "global_step": 164192, "epoch": 3909} {"train_loss": -6.896178245544434, "global_step": 164193, "epoch": 3909} {"train_loss": -6.876799583435059, "global_step": 164194, "epoch": 3909} {"train_loss": -6.885519981384277, "global_step": 164195, "epoch": 3909} {"train_loss": -6.856389999389648, "global_step": 164196, "epoch": 3909} {"train_loss": -6.905303478240967, "global_step": 164197, "epoch": 3909} {"train_loss": -6.847255706787109, "global_step": 164198, "epoch": 3909} {"train_loss": -6.859426498413086, "global_step": 164199, "epoch": 3909} {"train_loss": -6.903336048126221, "global_step": 164200, "epoch": 3909} {"train_loss": -6.9895853996276855, "global_step": 164201, "epoch": 3909} {"train_loss": -6.928302764892578, "global_step": 164202, "epoch": 3909} {"train_loss": -6.991650104522705, "global_step": 164203, "epoch": 3909} {"train_loss": -6.954435348510742, "global_step": 164204, "epoch": 3909} {"train_loss": -7.062319278717041, "global_step": 164205, "epoch": 3909} {"train_loss": -6.97062873840332, "global_step": 164206, "epoch": 3909} {"train_loss": -7.0473527908325195, "global_step": 164207, "epoch": 3909} {"train_loss": -7.002969264984131, "global_step": 164208, "epoch": 3909} {"train_loss": -7.013590335845947, "global_step": 164209, "epoch": 3909} {"train_loss": -6.893795013427734, "global_step": 164210, "epoch": 3909} {"train_loss": -7.08951473236084, "global_step": 164211, "epoch": 3909} {"train_loss": -6.972596645355225, "global_step": 164212, "epoch": 3909} {"train_loss": -6.925868034362793, "global_step": 164213, "epoch": 3909} {"train_loss": -6.954051971435547, "global_step": 164214, "epoch": 3909} {"train_loss": -6.920345306396484, "global_step": 164215, "epoch": 3909} {"train_loss": -7.041599273681641, "global_step": 164216, "epoch": 3909} {"train_loss": -7.077546119689941, "global_step": 164217, "epoch": 3909} {"train_loss": -6.830741882324219, "global_step": 164218, "epoch": 3909} {"train_loss": -6.947473571414039, "global_step": 164219, "epoch": 3909, "val_loss": 68607.7890625} {"train_loss": -6.985965251922607, "global_step": 164220, "epoch": 3910} {"train_loss": -7.006978511810303, "global_step": 164221, "epoch": 3910} {"train_loss": -6.955006122589111, "global_step": 164222, "epoch": 3910} {"train_loss": -6.968583106994629, "global_step": 164223, "epoch": 3910} {"train_loss": -6.986200332641602, "global_step": 164224, "epoch": 3910} {"train_loss": -6.9437947273254395, "global_step": 164225, "epoch": 3910} {"train_loss": -7.017604827880859, "global_step": 164226, "epoch": 3910} {"train_loss": -6.980541229248047, "global_step": 164227, "epoch": 3910} {"train_loss": -6.9513468742370605, "global_step": 164228, "epoch": 3910} {"train_loss": -6.970751762390137, "global_step": 164229, "epoch": 3910} {"train_loss": -6.856683731079102, "global_step": 164230, "epoch": 3910} {"train_loss": -6.908501148223877, "global_step": 164231, "epoch": 3910} {"train_loss": -6.796987533569336, "global_step": 164232, "epoch": 3910} {"train_loss": -6.958324432373047, "global_step": 164233, "epoch": 3910} {"train_loss": -7.047107696533203, "global_step": 164234, "epoch": 3910} {"train_loss": -6.98714542388916, "global_step": 164235, "epoch": 3910} {"train_loss": -6.810988426208496, "global_step": 164236, "epoch": 3910} {"train_loss": -6.843203544616699, "global_step": 164237, "epoch": 3910} {"train_loss": -6.84203577041626, "global_step": 164238, "epoch": 3910} {"train_loss": -6.8512492179870605, "global_step": 164239, "epoch": 3910} {"train_loss": -6.899719715118408, "global_step": 164240, "epoch": 3910} {"train_loss": -6.699514389038086, "global_step": 164241, "epoch": 3910} {"train_loss": -7.017585754394531, "global_step": 164242, "epoch": 3910} {"train_loss": -6.925455093383789, "global_step": 164243, "epoch": 3910} {"train_loss": -6.950489521026611, "global_step": 164244, "epoch": 3910} {"train_loss": -6.9225921630859375, "global_step": 164245, "epoch": 3910} {"train_loss": -6.870869159698486, "global_step": 164246, "epoch": 3910} {"train_loss": -7.008036136627197, "global_step": 164247, "epoch": 3910} {"train_loss": -6.914773464202881, "global_step": 164248, "epoch": 3910} {"train_loss": -6.87111234664917, "global_step": 164249, "epoch": 3910} {"train_loss": -6.910759925842285, "global_step": 164250, "epoch": 3910} {"train_loss": -6.836564064025879, "global_step": 164251, "epoch": 3910} {"train_loss": -6.9264960289001465, "global_step": 164252, "epoch": 3910} {"train_loss": -6.888105392456055, "global_step": 164253, "epoch": 3910} {"train_loss": -6.881898880004883, "global_step": 164254, "epoch": 3910} {"train_loss": -6.96419620513916, "global_step": 164255, "epoch": 3910} {"train_loss": -6.884530067443848, "global_step": 164256, "epoch": 3910} {"train_loss": -6.835931301116943, "global_step": 164257, "epoch": 3910} {"train_loss": -6.981115818023682, "global_step": 164258, "epoch": 3910} {"train_loss": -6.953138828277588, "global_step": 164259, "epoch": 3910} {"train_loss": -6.940995216369629, "global_step": 164260, "epoch": 3910} {"train_loss": -6.921902963093349, "global_step": 164261, "epoch": 3910, "val_loss": 68499.6015625} {"train_loss": -6.897479057312012, "global_step": 164262, "epoch": 3911} {"train_loss": -6.971217155456543, "global_step": 164263, "epoch": 3911} {"train_loss": -6.885749816894531, "global_step": 164264, "epoch": 3911} {"train_loss": -7.006158828735352, "global_step": 164265, "epoch": 3911} {"train_loss": -7.032507419586182, "global_step": 164266, "epoch": 3911} {"train_loss": -6.9014997482299805, "global_step": 164267, "epoch": 3911} {"train_loss": -6.998485565185547, "global_step": 164268, "epoch": 3911} {"train_loss": -7.052684783935547, "global_step": 164269, "epoch": 3911} {"train_loss": -6.891805648803711, "global_step": 164270, "epoch": 3911} {"train_loss": -6.837002754211426, "global_step": 164271, "epoch": 3911} {"train_loss": -6.897222518920898, "global_step": 164272, "epoch": 3911} {"train_loss": -6.9530253410339355, "global_step": 164273, "epoch": 3911} {"train_loss": -6.9313063621521, "global_step": 164274, "epoch": 3911} {"train_loss": -6.892987251281738, "global_step": 164275, "epoch": 3911} {"train_loss": -6.873762130737305, "global_step": 164276, "epoch": 3911} {"train_loss": -6.881899833679199, "global_step": 164277, "epoch": 3911} {"train_loss": -6.895794868469238, "global_step": 164278, "epoch": 3911} {"train_loss": -6.934093475341797, "global_step": 164279, "epoch": 3911} {"train_loss": -6.879800796508789, "global_step": 164280, "epoch": 3911} {"train_loss": -6.7702131271362305, "global_step": 164281, "epoch": 3911} {"train_loss": -6.955192565917969, "global_step": 164282, "epoch": 3911} {"train_loss": -6.86863374710083, "global_step": 164283, "epoch": 3911} {"train_loss": -6.884827136993408, "global_step": 164284, "epoch": 3911} {"train_loss": -6.95560359954834, "global_step": 164285, "epoch": 3911} {"train_loss": -6.80494499206543, "global_step": 164286, "epoch": 3911} {"train_loss": -6.880176544189453, "global_step": 164287, "epoch": 3911} {"train_loss": -6.773316860198975, "global_step": 164288, "epoch": 3911} {"train_loss": -6.891478538513184, "global_step": 164289, "epoch": 3911} {"train_loss": -6.902778625488281, "global_step": 164290, "epoch": 3911} {"train_loss": -6.89223575592041, "global_step": 164291, "epoch": 3911} {"train_loss": -6.933528423309326, "global_step": 164292, "epoch": 3911} {"train_loss": -6.767902851104736, "global_step": 164293, "epoch": 3911} {"train_loss": -6.845864772796631, "global_step": 164294, "epoch": 3911} {"train_loss": -6.850087642669678, "global_step": 164295, "epoch": 3911} {"train_loss": -6.945273399353027, "global_step": 164296, "epoch": 3911} {"train_loss": -6.966089248657227, "global_step": 164297, "epoch": 3911} {"train_loss": -6.914610862731934, "global_step": 164298, "epoch": 3911} {"train_loss": -6.9231767654418945, "global_step": 164299, "epoch": 3911} {"train_loss": -6.927338600158691, "global_step": 164300, "epoch": 3911} {"train_loss": -6.836651802062988, "global_step": 164301, "epoch": 3911} {"train_loss": -6.916508674621582, "global_step": 164302, "epoch": 3911} {"train_loss": -6.902236461639404, "global_step": 164303, "epoch": 3911, "val_loss": 68571.0546875} {"train_loss": -6.938921928405762, "global_step": 164304, "epoch": 3912} {"train_loss": -7.005315780639648, "global_step": 164305, "epoch": 3912} {"train_loss": -6.877531051635742, "global_step": 164306, "epoch": 3912} {"train_loss": -6.958855628967285, "global_step": 164307, "epoch": 3912} {"train_loss": -6.7707977294921875, "global_step": 164308, "epoch": 3912} {"train_loss": -6.934079170227051, "global_step": 164309, "epoch": 3912} {"train_loss": -6.921631813049316, "global_step": 164310, "epoch": 3912} {"train_loss": -6.909817695617676, "global_step": 164311, "epoch": 3912} {"train_loss": -6.9720563888549805, "global_step": 164312, "epoch": 3912} {"train_loss": -6.84061861038208, "global_step": 164313, "epoch": 3912} {"train_loss": -6.907748222351074, "global_step": 164314, "epoch": 3912} {"train_loss": -6.900144577026367, "global_step": 164315, "epoch": 3912} {"train_loss": -6.8369951248168945, "global_step": 164316, "epoch": 3912} {"train_loss": -6.955592155456543, "global_step": 164317, "epoch": 3912} {"train_loss": -6.881787300109863, "global_step": 164318, "epoch": 3912} {"train_loss": -6.991159439086914, "global_step": 164319, "epoch": 3912} {"train_loss": -6.9632887840271, "global_step": 164320, "epoch": 3912} {"train_loss": -6.935242176055908, "global_step": 164321, "epoch": 3912} {"train_loss": -6.899353981018066, "global_step": 164322, "epoch": 3912} {"train_loss": -6.905592918395996, "global_step": 164323, "epoch": 3912} {"train_loss": -6.986104965209961, "global_step": 164324, "epoch": 3912} {"train_loss": -6.969448089599609, "global_step": 164325, "epoch": 3912} {"train_loss": -6.733168601989746, "global_step": 164326, "epoch": 3912} {"train_loss": -6.987861633300781, "global_step": 164327, "epoch": 3912} {"train_loss": -6.945376396179199, "global_step": 164328, "epoch": 3912} {"train_loss": -6.9525017738342285, "global_step": 164329, "epoch": 3912} {"train_loss": -7.026556491851807, "global_step": 164330, "epoch": 3912} {"train_loss": -6.892899513244629, "global_step": 164331, "epoch": 3912} {"train_loss": -6.988728046417236, "global_step": 164332, "epoch": 3912} {"train_loss": -7.064871311187744, "global_step": 164333, "epoch": 3912} {"train_loss": -6.932678699493408, "global_step": 164334, "epoch": 3912} {"train_loss": -7.020999908447266, "global_step": 164335, "epoch": 3912} {"train_loss": -6.9539995193481445, "global_step": 164336, "epoch": 3912} {"train_loss": -6.917217254638672, "global_step": 164337, "epoch": 3912} {"train_loss": -6.833396911621094, "global_step": 164338, "epoch": 3912} {"train_loss": -6.9233856201171875, "global_step": 164339, "epoch": 3912} {"train_loss": -6.917780876159668, "global_step": 164340, "epoch": 3912} {"train_loss": -6.966087818145752, "global_step": 164341, "epoch": 3912} {"train_loss": -6.981420040130615, "global_step": 164342, "epoch": 3912} {"train_loss": -6.999115943908691, "global_step": 164343, "epoch": 3912} {"train_loss": -7.0210089683532715, "global_step": 164344, "epoch": 3912} {"train_loss": -6.935058673222859, "global_step": 164345, "epoch": 3912, "val_loss": 68608.2421875} {"train_loss": -6.926677703857422, "global_step": 164346, "epoch": 3913} {"train_loss": -7.075445175170898, "global_step": 164347, "epoch": 3913} {"train_loss": -6.902420520782471, "global_step": 164348, "epoch": 3913} {"train_loss": -6.848754405975342, "global_step": 164349, "epoch": 3913} {"train_loss": -6.964666366577148, "global_step": 164350, "epoch": 3913} {"train_loss": -6.9415364265441895, "global_step": 164351, "epoch": 3913} {"train_loss": -7.043332099914551, "global_step": 164352, "epoch": 3913} {"train_loss": -6.963589191436768, "global_step": 164353, "epoch": 3913} {"train_loss": -6.978896617889404, "global_step": 164354, "epoch": 3913} {"train_loss": -6.982760429382324, "global_step": 164355, "epoch": 3913} {"train_loss": -6.9815263748168945, "global_step": 164356, "epoch": 3913} {"train_loss": -6.864894390106201, "global_step": 164357, "epoch": 3913} {"train_loss": -6.819332599639893, "global_step": 164358, "epoch": 3913} {"train_loss": -6.861255168914795, "global_step": 164359, "epoch": 3913} {"train_loss": -7.027264595031738, "global_step": 164360, "epoch": 3913} {"train_loss": -6.9746880531311035, "global_step": 164361, "epoch": 3913} {"train_loss": -6.927253246307373, "global_step": 164362, "epoch": 3913} {"train_loss": -6.949719429016113, "global_step": 164363, "epoch": 3913} {"train_loss": -6.962406158447266, "global_step": 164364, "epoch": 3913} {"train_loss": -6.977686405181885, "global_step": 164365, "epoch": 3913} {"train_loss": -6.8422322273254395, "global_step": 164366, "epoch": 3913} {"train_loss": -6.920322418212891, "global_step": 164367, "epoch": 3913} {"train_loss": -6.99109411239624, "global_step": 164368, "epoch": 3913} {"train_loss": -6.946857452392578, "global_step": 164369, "epoch": 3913} {"train_loss": -6.852597236633301, "global_step": 164370, "epoch": 3913} {"train_loss": -6.938017845153809, "global_step": 164371, "epoch": 3913} {"train_loss": -6.893177032470703, "global_step": 164372, "epoch": 3913} {"train_loss": -6.917638778686523, "global_step": 164373, "epoch": 3913} {"train_loss": -6.924409866333008, "global_step": 164374, "epoch": 3913} {"train_loss": -6.979104995727539, "global_step": 164375, "epoch": 3913} {"train_loss": -6.875655174255371, "global_step": 164376, "epoch": 3913} {"train_loss": -6.924566745758057, "global_step": 164377, "epoch": 3913} {"train_loss": -6.905331611633301, "global_step": 164378, "epoch": 3913} {"train_loss": -6.917850494384766, "global_step": 164379, "epoch": 3913} {"train_loss": -6.959552764892578, "global_step": 164380, "epoch": 3913} {"train_loss": -6.86685037612915, "global_step": 164381, "epoch": 3913} {"train_loss": -6.945159912109375, "global_step": 164382, "epoch": 3913} {"train_loss": -6.991151809692383, "global_step": 164383, "epoch": 3913} {"train_loss": -6.980307579040527, "global_step": 164384, "epoch": 3913} {"train_loss": -6.926280975341797, "global_step": 164385, "epoch": 3913} {"train_loss": -6.954130172729492, "global_step": 164386, "epoch": 3913} {"train_loss": -6.937381494612921, "global_step": 164387, "epoch": 3913, "val_loss": 68490.96875} {"train_loss": -6.8713836669921875, "global_step": 164388, "epoch": 3914} {"train_loss": -6.835334777832031, "global_step": 164389, "epoch": 3914} {"train_loss": -7.088956356048584, "global_step": 164390, "epoch": 3914} {"train_loss": -6.998757362365723, "global_step": 164391, "epoch": 3914} {"train_loss": -6.884437084197998, "global_step": 164392, "epoch": 3914} {"train_loss": -6.891592502593994, "global_step": 164393, "epoch": 3914} {"train_loss": -6.9314775466918945, "global_step": 164394, "epoch": 3914} {"train_loss": -6.8634538650512695, "global_step": 164395, "epoch": 3914} {"train_loss": -6.911291122436523, "global_step": 164396, "epoch": 3914} {"train_loss": -6.87660026550293, "global_step": 164397, "epoch": 3914} {"train_loss": -6.885318756103516, "global_step": 164398, "epoch": 3914} {"train_loss": -6.947322845458984, "global_step": 164399, "epoch": 3914} {"train_loss": -6.867045879364014, "global_step": 164400, "epoch": 3914} {"train_loss": -7.001972675323486, "global_step": 164401, "epoch": 3914} {"train_loss": -6.894660472869873, "global_step": 164402, "epoch": 3914} {"train_loss": -6.90186882019043, "global_step": 164403, "epoch": 3914} {"train_loss": -7.000882625579834, "global_step": 164404, "epoch": 3914} {"train_loss": -6.772773742675781, "global_step": 164405, "epoch": 3914} {"train_loss": -6.980221748352051, "global_step": 164406, "epoch": 3914} {"train_loss": -6.962652683258057, "global_step": 164407, "epoch": 3914} {"train_loss": -6.936365127563477, "global_step": 164408, "epoch": 3914} {"train_loss": -6.872788906097412, "global_step": 164409, "epoch": 3914} {"train_loss": -6.997986793518066, "global_step": 164410, "epoch": 3914} {"train_loss": -6.947918891906738, "global_step": 164411, "epoch": 3914} {"train_loss": -6.929340362548828, "global_step": 164412, "epoch": 3914} {"train_loss": -6.980927467346191, "global_step": 164413, "epoch": 3914} {"train_loss": -6.85547399520874, "global_step": 164414, "epoch": 3914} {"train_loss": -6.9174699783325195, "global_step": 164415, "epoch": 3914} {"train_loss": -7.062898635864258, "global_step": 164416, "epoch": 3914} {"train_loss": -6.907037734985352, "global_step": 164417, "epoch": 3914} {"train_loss": -6.966118812561035, "global_step": 164418, "epoch": 3914} {"train_loss": -7.008462429046631, "global_step": 164419, "epoch": 3914} {"train_loss": -6.961053848266602, "global_step": 164420, "epoch": 3914} {"train_loss": -7.027502059936523, "global_step": 164421, "epoch": 3914} {"train_loss": -7.093669891357422, "global_step": 164422, "epoch": 3914} {"train_loss": -6.969155311584473, "global_step": 164423, "epoch": 3914} {"train_loss": -7.030460834503174, "global_step": 164424, "epoch": 3914} {"train_loss": -7.007153511047363, "global_step": 164425, "epoch": 3914} {"train_loss": -6.937961578369141, "global_step": 164426, "epoch": 3914} {"train_loss": -6.96435546875, "global_step": 164427, "epoch": 3914} {"train_loss": -7.011986255645752, "global_step": 164428, "epoch": 3914} {"train_loss": -6.94775702839806, "global_step": 164429, "epoch": 3914, "val_loss": 68746.6328125} {"train_loss": -6.9173126220703125, "global_step": 164430, "epoch": 3915} {"train_loss": -6.903314590454102, "global_step": 164431, "epoch": 3915} {"train_loss": -7.037271976470947, "global_step": 164432, "epoch": 3915} {"train_loss": -6.897250175476074, "global_step": 164433, "epoch": 3915} {"train_loss": -7.004090785980225, "global_step": 164434, "epoch": 3915} {"train_loss": -6.881422519683838, "global_step": 164435, "epoch": 3915} {"train_loss": -6.938782691955566, "global_step": 164436, "epoch": 3915} {"train_loss": -6.888071537017822, "global_step": 164437, "epoch": 3915} {"train_loss": -6.9827680587768555, "global_step": 164438, "epoch": 3915} {"train_loss": -7.017636299133301, "global_step": 164439, "epoch": 3915} {"train_loss": -6.992608070373535, "global_step": 164440, "epoch": 3915} {"train_loss": -6.8364715576171875, "global_step": 164441, "epoch": 3915} {"train_loss": -6.981719970703125, "global_step": 164442, "epoch": 3915} {"train_loss": -7.0818634033203125, "global_step": 164443, "epoch": 3915} {"train_loss": -6.866508483886719, "global_step": 164444, "epoch": 3915} {"train_loss": -7.079001426696777, "global_step": 164445, "epoch": 3915} {"train_loss": -7.080718994140625, "global_step": 164446, "epoch": 3915} {"train_loss": -7.012814521789551, "global_step": 164447, "epoch": 3915} {"train_loss": -6.891637325286865, "global_step": 164448, "epoch": 3915} {"train_loss": -7.0814948081970215, "global_step": 164449, "epoch": 3915} {"train_loss": -6.977818012237549, "global_step": 164450, "epoch": 3915} {"train_loss": -7.01241397857666, "global_step": 164451, "epoch": 3915} {"train_loss": -6.959858417510986, "global_step": 164452, "epoch": 3915} {"train_loss": -7.109499931335449, "global_step": 164453, "epoch": 3915} {"train_loss": -6.930833339691162, "global_step": 164454, "epoch": 3915} {"train_loss": -7.05600643157959, "global_step": 164455, "epoch": 3915} {"train_loss": -7.004276275634766, "global_step": 164456, "epoch": 3915} {"train_loss": -6.94091796875, "global_step": 164457, "epoch": 3915} {"train_loss": -7.005565166473389, "global_step": 164458, "epoch": 3915} {"train_loss": -6.978119850158691, "global_step": 164459, "epoch": 3915} {"train_loss": -6.9352874755859375, "global_step": 164460, "epoch": 3915} {"train_loss": -7.009878635406494, "global_step": 164461, "epoch": 3915} {"train_loss": -7.028047561645508, "global_step": 164462, "epoch": 3915} {"train_loss": -7.032931327819824, "global_step": 164463, "epoch": 3915} {"train_loss": -6.99896764755249, "global_step": 164464, "epoch": 3915} {"train_loss": -7.013765335083008, "global_step": 164465, "epoch": 3915} {"train_loss": -6.980955123901367, "global_step": 164466, "epoch": 3915} {"train_loss": -7.017882347106934, "global_step": 164467, "epoch": 3915} {"train_loss": -7.013496398925781, "global_step": 164468, "epoch": 3915} {"train_loss": -6.950793266296387, "global_step": 164469, "epoch": 3915} {"train_loss": -7.024508476257324, "global_step": 164470, "epoch": 3915} {"train_loss": -6.984106949397495, "global_step": 164471, "epoch": 3915, "val_loss": 68563.9140625} {"train_loss": -6.99434757232666, "global_step": 164472, "epoch": 3916} {"train_loss": -7.0045576095581055, "global_step": 164473, "epoch": 3916} {"train_loss": -6.909765243530273, "global_step": 164474, "epoch": 3916} {"train_loss": -7.11672306060791, "global_step": 164475, "epoch": 3916} {"train_loss": -6.923117637634277, "global_step": 164476, "epoch": 3916} {"train_loss": -6.96016788482666, "global_step": 164477, "epoch": 3916} {"train_loss": -6.963994979858398, "global_step": 164478, "epoch": 3916} {"train_loss": -7.00931978225708, "global_step": 164479, "epoch": 3916} {"train_loss": -6.965883255004883, "global_step": 164480, "epoch": 3916} {"train_loss": -6.939379692077637, "global_step": 164481, "epoch": 3916} {"train_loss": -6.848225116729736, "global_step": 164482, "epoch": 3916} {"train_loss": -6.897892475128174, "global_step": 164483, "epoch": 3916} {"train_loss": -6.919695854187012, "global_step": 164484, "epoch": 3916} {"train_loss": -7.0109100341796875, "global_step": 164485, "epoch": 3916} {"train_loss": -6.949028015136719, "global_step": 164486, "epoch": 3916} {"train_loss": -6.91234016418457, "global_step": 164487, "epoch": 3916} {"train_loss": -6.901922225952148, "global_step": 164488, "epoch": 3916} {"train_loss": -7.00542688369751, "global_step": 164489, "epoch": 3916} {"train_loss": -6.9795145988464355, "global_step": 164490, "epoch": 3916} {"train_loss": -6.893280029296875, "global_step": 164491, "epoch": 3916} {"train_loss": -6.918974876403809, "global_step": 164492, "epoch": 3916} {"train_loss": -6.959820747375488, "global_step": 164493, "epoch": 3916} {"train_loss": -6.856861114501953, "global_step": 164494, "epoch": 3916} {"train_loss": -6.903398513793945, "global_step": 164495, "epoch": 3916} {"train_loss": -6.868886470794678, "global_step": 164496, "epoch": 3916} {"train_loss": -7.0569305419921875, "global_step": 164497, "epoch": 3916} {"train_loss": -6.9124579429626465, "global_step": 164498, "epoch": 3916} {"train_loss": -6.865723609924316, "global_step": 164499, "epoch": 3916} {"train_loss": -6.851992607116699, "global_step": 164500, "epoch": 3916} {"train_loss": -7.011722564697266, "global_step": 164501, "epoch": 3916} {"train_loss": -6.882090091705322, "global_step": 164502, "epoch": 3916} {"train_loss": -6.803467750549316, "global_step": 164503, "epoch": 3916} {"train_loss": -6.992513656616211, "global_step": 164504, "epoch": 3916} {"train_loss": -6.925510883331299, "global_step": 164505, "epoch": 3916} {"train_loss": -6.936410427093506, "global_step": 164506, "epoch": 3916} {"train_loss": -6.932606220245361, "global_step": 164507, "epoch": 3916} {"train_loss": -6.922854900360107, "global_step": 164508, "epoch": 3916} {"train_loss": -6.987911224365234, "global_step": 164509, "epoch": 3916} {"train_loss": -6.976245880126953, "global_step": 164510, "epoch": 3916} {"train_loss": -6.952096939086914, "global_step": 164511, "epoch": 3916} {"train_loss": -7.038837432861328, "global_step": 164512, "epoch": 3916} {"train_loss": -6.944006113778977, "global_step": 164513, "epoch": 3916, "val_loss": 68587.1484375} {"train_loss": -6.976766586303711, "global_step": 164514, "epoch": 3917} {"train_loss": -6.95649528503418, "global_step": 164515, "epoch": 3917} {"train_loss": -7.015872478485107, "global_step": 164516, "epoch": 3917} {"train_loss": -6.867773056030273, "global_step": 164517, "epoch": 3917} {"train_loss": -6.821898460388184, "global_step": 164518, "epoch": 3917} {"train_loss": -6.923336029052734, "global_step": 164519, "epoch": 3917} {"train_loss": -6.940343856811523, "global_step": 164520, "epoch": 3917} {"train_loss": -6.887901782989502, "global_step": 164521, "epoch": 3917} {"train_loss": -6.992314338684082, "global_step": 164522, "epoch": 3917} {"train_loss": -6.865838527679443, "global_step": 164523, "epoch": 3917} {"train_loss": -6.998992919921875, "global_step": 164524, "epoch": 3917} {"train_loss": -7.026933670043945, "global_step": 164525, "epoch": 3917} {"train_loss": -6.931619644165039, "global_step": 164526, "epoch": 3917} {"train_loss": -6.874483108520508, "global_step": 164527, "epoch": 3917} {"train_loss": -6.99643611907959, "global_step": 164528, "epoch": 3917} {"train_loss": -6.8876848220825195, "global_step": 164529, "epoch": 3917} {"train_loss": -6.935839653015137, "global_step": 164530, "epoch": 3917} {"train_loss": -6.918452262878418, "global_step": 164531, "epoch": 3917} {"train_loss": -6.906736373901367, "global_step": 164532, "epoch": 3917} {"train_loss": -6.828531265258789, "global_step": 164533, "epoch": 3917} {"train_loss": -6.890937805175781, "global_step": 164534, "epoch": 3917} {"train_loss": -7.0002031326293945, "global_step": 164535, "epoch": 3917} {"train_loss": -6.974206924438477, "global_step": 164536, "epoch": 3917} {"train_loss": -7.000996112823486, "global_step": 164537, "epoch": 3917} {"train_loss": -6.881644248962402, "global_step": 164538, "epoch": 3917} {"train_loss": -6.899986267089844, "global_step": 164539, "epoch": 3917} {"train_loss": -6.802155494689941, "global_step": 164540, "epoch": 3917} {"train_loss": -6.965533256530762, "global_step": 164541, "epoch": 3917} {"train_loss": -6.988025665283203, "global_step": 164542, "epoch": 3917} {"train_loss": -6.910542011260986, "global_step": 164543, "epoch": 3917} {"train_loss": -6.939428329467773, "global_step": 164544, "epoch": 3917} {"train_loss": -6.8176679611206055, "global_step": 164545, "epoch": 3917} {"train_loss": -6.878203392028809, "global_step": 164546, "epoch": 3917} {"train_loss": -6.934117794036865, "global_step": 164547, "epoch": 3917} {"train_loss": -7.036128997802734, "global_step": 164548, "epoch": 3917} {"train_loss": -6.965109825134277, "global_step": 164549, "epoch": 3917} {"train_loss": -6.957242965698242, "global_step": 164550, "epoch": 3917} {"train_loss": -6.812661170959473, "global_step": 164551, "epoch": 3917} {"train_loss": -6.840753555297852, "global_step": 164552, "epoch": 3917} {"train_loss": -6.874625205993652, "global_step": 164553, "epoch": 3917} {"train_loss": -6.959768772125244, "global_step": 164554, "epoch": 3917} {"train_loss": -6.924215657370431, "global_step": 164555, "epoch": 3917, "val_loss": 68534.6796875} {"train_loss": -6.906559944152832, "global_step": 164556, "epoch": 3918} {"train_loss": -6.959808826446533, "global_step": 164557, "epoch": 3918} {"train_loss": -7.012569427490234, "global_step": 164558, "epoch": 3918} {"train_loss": -6.944098949432373, "global_step": 164559, "epoch": 3918} {"train_loss": -6.996429443359375, "global_step": 164560, "epoch": 3918} {"train_loss": -6.982535362243652, "global_step": 164561, "epoch": 3918} {"train_loss": -6.93403434753418, "global_step": 164562, "epoch": 3918} {"train_loss": -6.955048084259033, "global_step": 164563, "epoch": 3918} {"train_loss": -6.93959903717041, "global_step": 164564, "epoch": 3918} {"train_loss": -6.904668807983398, "global_step": 164565, "epoch": 3918} {"train_loss": -6.882157325744629, "global_step": 164566, "epoch": 3918} {"train_loss": -6.84635066986084, "global_step": 164567, "epoch": 3918} {"train_loss": -6.991453170776367, "global_step": 164568, "epoch": 3918} {"train_loss": -7.048248291015625, "global_step": 164569, "epoch": 3918} {"train_loss": -7.094484806060791, "global_step": 164570, "epoch": 3918} {"train_loss": -6.94578218460083, "global_step": 164571, "epoch": 3918} {"train_loss": -7.093749523162842, "global_step": 164572, "epoch": 3918} {"train_loss": -7.063164234161377, "global_step": 164573, "epoch": 3918} {"train_loss": -7.02042293548584, "global_step": 164574, "epoch": 3918} {"train_loss": -6.942899703979492, "global_step": 164575, "epoch": 3918} {"train_loss": -7.029000759124756, "global_step": 164576, "epoch": 3918} {"train_loss": -6.9439897537231445, "global_step": 164577, "epoch": 3918} {"train_loss": -7.012452602386475, "global_step": 164578, "epoch": 3918} {"train_loss": -6.856832504272461, "global_step": 164579, "epoch": 3918} {"train_loss": -6.947978973388672, "global_step": 164580, "epoch": 3918} {"train_loss": -6.878515720367432, "global_step": 164581, "epoch": 3918} {"train_loss": -6.831526756286621, "global_step": 164582, "epoch": 3918} {"train_loss": -6.996605396270752, "global_step": 164583, "epoch": 3918} {"train_loss": -6.840856552124023, "global_step": 164584, "epoch": 3918} {"train_loss": -6.730979919433594, "global_step": 164585, "epoch": 3918} {"train_loss": -6.863253593444824, "global_step": 164586, "epoch": 3918} {"train_loss": -6.797542095184326, "global_step": 164587, "epoch": 3918} {"train_loss": -6.950373649597168, "global_step": 164588, "epoch": 3918} {"train_loss": -6.950490951538086, "global_step": 164589, "epoch": 3918} {"train_loss": -6.812083721160889, "global_step": 164590, "epoch": 3918} {"train_loss": -6.843937873840332, "global_step": 164591, "epoch": 3918} {"train_loss": -6.716070175170898, "global_step": 164592, "epoch": 3918} {"train_loss": -6.901669502258301, "global_step": 164593, "epoch": 3918} {"train_loss": -6.84613561630249, "global_step": 164594, "epoch": 3918} {"train_loss": -7.02151346206665, "global_step": 164595, "epoch": 3918} {"train_loss": -6.793885707855225, "global_step": 164596, "epoch": 3918} {"train_loss": -6.926798604783558, "global_step": 164597, "epoch": 3918, "val_loss": 68689.5234375} {"train_loss": -6.948664665222168, "global_step": 164598, "epoch": 3919} {"train_loss": -6.776525497436523, "global_step": 164599, "epoch": 3919} {"train_loss": -6.935855388641357, "global_step": 164600, "epoch": 3919} {"train_loss": -6.852215766906738, "global_step": 164601, "epoch": 3919} {"train_loss": -6.975123405456543, "global_step": 164602, "epoch": 3919} {"train_loss": -6.928920745849609, "global_step": 164603, "epoch": 3919} {"train_loss": -7.0075201988220215, "global_step": 164604, "epoch": 3919} {"train_loss": -6.918335914611816, "global_step": 164605, "epoch": 3919} {"train_loss": -6.8218994140625, "global_step": 164606, "epoch": 3919} {"train_loss": -6.920815944671631, "global_step": 164607, "epoch": 3919} {"train_loss": -6.833433151245117, "global_step": 164608, "epoch": 3919} {"train_loss": -7.013506889343262, "global_step": 164609, "epoch": 3919} {"train_loss": -6.897064208984375, "global_step": 164610, "epoch": 3919} {"train_loss": -6.974421501159668, "global_step": 164611, "epoch": 3919} {"train_loss": -6.956437110900879, "global_step": 164612, "epoch": 3919} {"train_loss": -6.986665725708008, "global_step": 164613, "epoch": 3919} {"train_loss": -6.930815696716309, "global_step": 164614, "epoch": 3919} {"train_loss": -6.908917427062988, "global_step": 164615, "epoch": 3919} {"train_loss": -6.970783233642578, "global_step": 164616, "epoch": 3919} {"train_loss": -7.027921676635742, "global_step": 164617, "epoch": 3919} {"train_loss": -6.9970550537109375, "global_step": 164618, "epoch": 3919} {"train_loss": -6.853722095489502, "global_step": 164619, "epoch": 3919} {"train_loss": -6.980932235717773, "global_step": 164620, "epoch": 3919} {"train_loss": -6.913210868835449, "global_step": 164621, "epoch": 3919} {"train_loss": -6.845355033874512, "global_step": 164622, "epoch": 3919} {"train_loss": -6.938981533050537, "global_step": 164623, "epoch": 3919} {"train_loss": -6.943281173706055, "global_step": 164624, "epoch": 3919} {"train_loss": -6.980499267578125, "global_step": 164625, "epoch": 3919} {"train_loss": -6.894333362579346, "global_step": 164626, "epoch": 3919} {"train_loss": -6.942017555236816, "global_step": 164627, "epoch": 3919} {"train_loss": -6.822517395019531, "global_step": 164628, "epoch": 3919} {"train_loss": -6.937398910522461, "global_step": 164629, "epoch": 3919} {"train_loss": -6.892187118530273, "global_step": 164630, "epoch": 3919} {"train_loss": -6.811567783355713, "global_step": 164631, "epoch": 3919} {"train_loss": -6.923629283905029, "global_step": 164632, "epoch": 3919} {"train_loss": -6.964987754821777, "global_step": 164633, "epoch": 3919} {"train_loss": -6.996302604675293, "global_step": 164634, "epoch": 3919} {"train_loss": -6.914205551147461, "global_step": 164635, "epoch": 3919} {"train_loss": -6.955034255981445, "global_step": 164636, "epoch": 3919} {"train_loss": -6.958822250366211, "global_step": 164637, "epoch": 3919} {"train_loss": -6.942541122436523, "global_step": 164638, "epoch": 3919} {"train_loss": -6.926452761604672, "global_step": 164639, "epoch": 3919, "val_loss": 68681.9765625} {"train_loss": -6.92228889465332, "global_step": 164640, "epoch": 3920} {"train_loss": -6.965340614318848, "global_step": 164641, "epoch": 3920} {"train_loss": -6.905848026275635, "global_step": 164642, "epoch": 3920} {"train_loss": -6.970044136047363, "global_step": 164643, "epoch": 3920} {"train_loss": -6.936418533325195, "global_step": 164644, "epoch": 3920} {"train_loss": -7.0742011070251465, "global_step": 164645, "epoch": 3920} {"train_loss": -6.815757751464844, "global_step": 164646, "epoch": 3920} {"train_loss": -6.964991569519043, "global_step": 164647, "epoch": 3920} {"train_loss": -6.803727149963379, "global_step": 164648, "epoch": 3920} {"train_loss": -6.896783828735352, "global_step": 164649, "epoch": 3920} {"train_loss": -6.923799991607666, "global_step": 164650, "epoch": 3920} {"train_loss": -6.959015369415283, "global_step": 164651, "epoch": 3920} {"train_loss": -7.01729154586792, "global_step": 164652, "epoch": 3920} {"train_loss": -7.036677360534668, "global_step": 164653, "epoch": 3920} {"train_loss": -6.932479381561279, "global_step": 164654, "epoch": 3920} {"train_loss": -6.936078071594238, "global_step": 164655, "epoch": 3920} {"train_loss": -6.7760443687438965, "global_step": 164656, "epoch": 3920} {"train_loss": -6.857146739959717, "global_step": 164657, "epoch": 3920} {"train_loss": -6.953166961669922, "global_step": 164658, "epoch": 3920} {"train_loss": -6.964927673339844, "global_step": 164659, "epoch": 3920} {"train_loss": -6.899299144744873, "global_step": 164660, "epoch": 3920} {"train_loss": -7.00483512878418, "global_step": 164661, "epoch": 3920} {"train_loss": -6.936624526977539, "global_step": 164662, "epoch": 3920} {"train_loss": -6.938189506530762, "global_step": 164663, "epoch": 3920} {"train_loss": -6.923028945922852, "global_step": 164664, "epoch": 3920} {"train_loss": -6.913887023925781, "global_step": 164665, "epoch": 3920} {"train_loss": -7.003149032592773, "global_step": 164666, "epoch": 3920} {"train_loss": -6.880093574523926, "global_step": 164667, "epoch": 3920} {"train_loss": -6.8172383308410645, "global_step": 164668, "epoch": 3920} {"train_loss": -6.911523818969727, "global_step": 164669, "epoch": 3920} {"train_loss": -6.835742950439453, "global_step": 164670, "epoch": 3920} {"train_loss": -6.892484188079834, "global_step": 164671, "epoch": 3920} {"train_loss": -6.948541641235352, "global_step": 164672, "epoch": 3920} {"train_loss": -6.807250022888184, "global_step": 164673, "epoch": 3920} {"train_loss": -6.945487976074219, "global_step": 164674, "epoch": 3920} {"train_loss": -6.842258930206299, "global_step": 164675, "epoch": 3920} {"train_loss": -6.846022605895996, "global_step": 164676, "epoch": 3920} {"train_loss": -6.8943281173706055, "global_step": 164677, "epoch": 3920} {"train_loss": -6.877439498901367, "global_step": 164678, "epoch": 3920} {"train_loss": -6.88159704208374, "global_step": 164679, "epoch": 3920} {"train_loss": -6.849061965942383, "global_step": 164680, "epoch": 3920} {"train_loss": -6.911158266521635, "global_step": 164681, "epoch": 3920, "val_loss": 68478.765625} {"train_loss": -6.956334590911865, "global_step": 164682, "epoch": 3921} {"train_loss": -6.895852088928223, "global_step": 164683, "epoch": 3921} {"train_loss": -6.8905558586120605, "global_step": 164684, "epoch": 3921} {"train_loss": -6.872842788696289, "global_step": 164685, "epoch": 3921} {"train_loss": -6.832248687744141, "global_step": 164686, "epoch": 3921} {"train_loss": -6.954073905944824, "global_step": 164687, "epoch": 3921} {"train_loss": -6.936092376708984, "global_step": 164688, "epoch": 3921} {"train_loss": -6.8937835693359375, "global_step": 164689, "epoch": 3921} {"train_loss": -6.779018878936768, "global_step": 164690, "epoch": 3921} {"train_loss": -6.952825546264648, "global_step": 164691, "epoch": 3921} {"train_loss": -6.892298698425293, "global_step": 164692, "epoch": 3921} {"train_loss": -6.952715873718262, "global_step": 164693, "epoch": 3921} {"train_loss": -6.904892921447754, "global_step": 164694, "epoch": 3921} {"train_loss": -6.93617057800293, "global_step": 164695, "epoch": 3921} {"train_loss": -6.996915340423584, "global_step": 164696, "epoch": 3921} {"train_loss": -6.926575183868408, "global_step": 164697, "epoch": 3921} {"train_loss": -6.957401275634766, "global_step": 164698, "epoch": 3921} {"train_loss": -7.016566753387451, "global_step": 164699, "epoch": 3921} {"train_loss": -6.854066848754883, "global_step": 164700, "epoch": 3921} {"train_loss": -7.000357151031494, "global_step": 164701, "epoch": 3921} {"train_loss": -6.903927326202393, "global_step": 164702, "epoch": 3921} {"train_loss": -6.976152420043945, "global_step": 164703, "epoch": 3921} {"train_loss": -7.017789363861084, "global_step": 164704, "epoch": 3921} {"train_loss": -7.079307556152344, "global_step": 164705, "epoch": 3921} {"train_loss": -6.968849182128906, "global_step": 164706, "epoch": 3921} {"train_loss": -7.108440399169922, "global_step": 164707, "epoch": 3921} {"train_loss": -6.98567533493042, "global_step": 164708, "epoch": 3921} {"train_loss": -6.947698593139648, "global_step": 164709, "epoch": 3921} {"train_loss": -6.93946647644043, "global_step": 164710, "epoch": 3921} {"train_loss": -6.946197509765625, "global_step": 164711, "epoch": 3921} {"train_loss": -6.920973300933838, "global_step": 164712, "epoch": 3921} {"train_loss": -7.054510116577148, "global_step": 164713, "epoch": 3921} {"train_loss": -6.978633403778076, "global_step": 164714, "epoch": 3921} {"train_loss": -7.032436370849609, "global_step": 164715, "epoch": 3921} {"train_loss": -6.916776180267334, "global_step": 164716, "epoch": 3921} {"train_loss": -6.9608235359191895, "global_step": 164717, "epoch": 3921} {"train_loss": -6.839914321899414, "global_step": 164718, "epoch": 3921} {"train_loss": -6.862316131591797, "global_step": 164719, "epoch": 3921} {"train_loss": -6.920803070068359, "global_step": 164720, "epoch": 3921} {"train_loss": -6.982666015625, "global_step": 164721, "epoch": 3921} {"train_loss": -6.932799339294434, "global_step": 164722, "epoch": 3921} {"train_loss": -6.946759621302287, "global_step": 164723, "epoch": 3921, "val_loss": 68652.1875} {"train_loss": -7.059415340423584, "global_step": 164724, "epoch": 3922} {"train_loss": -6.991934776306152, "global_step": 164725, "epoch": 3922} {"train_loss": -6.94588565826416, "global_step": 164726, "epoch": 3922} {"train_loss": -7.006856441497803, "global_step": 164727, "epoch": 3922} {"train_loss": -6.896862983703613, "global_step": 164728, "epoch": 3922} {"train_loss": -6.965024948120117, "global_step": 164729, "epoch": 3922} {"train_loss": -6.971543312072754, "global_step": 164730, "epoch": 3922} {"train_loss": -6.8259429931640625, "global_step": 164731, "epoch": 3922} {"train_loss": -6.989604949951172, "global_step": 164732, "epoch": 3922} {"train_loss": -6.9581499099731445, "global_step": 164733, "epoch": 3922} {"train_loss": -6.967526912689209, "global_step": 164734, "epoch": 3922} {"train_loss": -6.99647331237793, "global_step": 164735, "epoch": 3922} {"train_loss": -6.70432186126709, "global_step": 164736, "epoch": 3922} {"train_loss": -7.0425848960876465, "global_step": 164737, "epoch": 3922} {"train_loss": -6.873873710632324, "global_step": 164738, "epoch": 3922} {"train_loss": -6.927428245544434, "global_step": 164739, "epoch": 3922} {"train_loss": -6.930835247039795, "global_step": 164740, "epoch": 3922} {"train_loss": -6.735083103179932, "global_step": 164741, "epoch": 3922} {"train_loss": -6.913944244384766, "global_step": 164742, "epoch": 3922} {"train_loss": -6.849180221557617, "global_step": 164743, "epoch": 3922} {"train_loss": -7.01123046875, "global_step": 164744, "epoch": 3922} {"train_loss": -6.915528774261475, "global_step": 164745, "epoch": 3922} {"train_loss": -6.804316997528076, "global_step": 164746, "epoch": 3922} {"train_loss": -6.891761779785156, "global_step": 164747, "epoch": 3922} {"train_loss": -6.890537261962891, "global_step": 164748, "epoch": 3922} {"train_loss": -6.9114508628845215, "global_step": 164749, "epoch": 3922} {"train_loss": -6.868684768676758, "global_step": 164750, "epoch": 3922} {"train_loss": -6.8459601402282715, "global_step": 164751, "epoch": 3922} {"train_loss": -6.955853462219238, "global_step": 164752, "epoch": 3922} {"train_loss": -6.91801643371582, "global_step": 164753, "epoch": 3922} {"train_loss": -6.914505958557129, "global_step": 164754, "epoch": 3922} {"train_loss": -6.919694900512695, "global_step": 164755, "epoch": 3922} {"train_loss": -6.822601318359375, "global_step": 164756, "epoch": 3922} {"train_loss": -6.9491400718688965, "global_step": 164757, "epoch": 3922} {"train_loss": -6.935897350311279, "global_step": 164758, "epoch": 3922} {"train_loss": -6.902880668640137, "global_step": 164759, "epoch": 3922} {"train_loss": -6.926790237426758, "global_step": 164760, "epoch": 3922} {"train_loss": -6.993851661682129, "global_step": 164761, "epoch": 3922} {"train_loss": -6.9827775955200195, "global_step": 164762, "epoch": 3922} {"train_loss": -6.9603376388549805, "global_step": 164763, "epoch": 3922} {"train_loss": -6.9274797439575195, "global_step": 164764, "epoch": 3922} {"train_loss": -6.922653141475859, "global_step": 164765, "epoch": 3922, "val_loss": 68498.296875} {"train_loss": -6.979416847229004, "global_step": 164766, "epoch": 3923} {"train_loss": -6.892271041870117, "global_step": 164767, "epoch": 3923} {"train_loss": -6.934731483459473, "global_step": 164768, "epoch": 3923} {"train_loss": -6.979897975921631, "global_step": 164769, "epoch": 3923} {"train_loss": -7.052778244018555, "global_step": 164770, "epoch": 3923} {"train_loss": -7.050885200500488, "global_step": 164771, "epoch": 3923} {"train_loss": -6.940382957458496, "global_step": 164772, "epoch": 3923} {"train_loss": -7.0443010330200195, "global_step": 164773, "epoch": 3923} {"train_loss": -6.958420753479004, "global_step": 164774, "epoch": 3923} {"train_loss": -7.049380302429199, "global_step": 164775, "epoch": 3923} {"train_loss": -6.956119537353516, "global_step": 164776, "epoch": 3923} {"train_loss": -6.938117980957031, "global_step": 164777, "epoch": 3923} {"train_loss": -7.0953216552734375, "global_step": 164778, "epoch": 3923} {"train_loss": -6.916767120361328, "global_step": 164779, "epoch": 3923} {"train_loss": -6.9451584815979, "global_step": 164780, "epoch": 3923} {"train_loss": -6.978304862976074, "global_step": 164781, "epoch": 3923} {"train_loss": -6.97679328918457, "global_step": 164782, "epoch": 3923} {"train_loss": -6.975606918334961, "global_step": 164783, "epoch": 3923} {"train_loss": -7.044201850891113, "global_step": 164784, "epoch": 3923} {"train_loss": -7.016054153442383, "global_step": 164785, "epoch": 3923} {"train_loss": -7.0224151611328125, "global_step": 164786, "epoch": 3923} {"train_loss": -7.002152919769287, "global_step": 164787, "epoch": 3923} {"train_loss": -6.9298224449157715, "global_step": 164788, "epoch": 3923} {"train_loss": -7.012042999267578, "global_step": 164789, "epoch": 3923} {"train_loss": -7.012752056121826, "global_step": 164790, "epoch": 3923} {"train_loss": -7.006473541259766, "global_step": 164791, "epoch": 3923} {"train_loss": -6.943675518035889, "global_step": 164792, "epoch": 3923} {"train_loss": -7.0305399894714355, "global_step": 164793, "epoch": 3923} {"train_loss": -6.971534252166748, "global_step": 164794, "epoch": 3923} {"train_loss": -6.996253490447998, "global_step": 164795, "epoch": 3923} {"train_loss": -7.0538554191589355, "global_step": 164796, "epoch": 3923} {"train_loss": -6.95929479598999, "global_step": 164797, "epoch": 3923} {"train_loss": -7.011378288269043, "global_step": 164798, "epoch": 3923} {"train_loss": -6.963950157165527, "global_step": 164799, "epoch": 3923} {"train_loss": -7.1382155418396, "global_step": 164800, "epoch": 3923} {"train_loss": -6.913574695587158, "global_step": 164801, "epoch": 3923} {"train_loss": -7.006092071533203, "global_step": 164802, "epoch": 3923} {"train_loss": -7.097713947296143, "global_step": 164803, "epoch": 3923} {"train_loss": -7.017309188842773, "global_step": 164804, "epoch": 3923} {"train_loss": -7.127202987670898, "global_step": 164805, "epoch": 3923} {"train_loss": -7.17093563079834, "global_step": 164806, "epoch": 3923} {"train_loss": -7.002457266762143, "global_step": 164807, "epoch": 3923, "val_loss": 68514.2890625} {"train_loss": -6.939434051513672, "global_step": 164808, "epoch": 3924} {"train_loss": -7.089812278747559, "global_step": 164809, "epoch": 3924} {"train_loss": -6.906694412231445, "global_step": 164810, "epoch": 3924} {"train_loss": -7.097151756286621, "global_step": 164811, "epoch": 3924} {"train_loss": -6.978558540344238, "global_step": 164812, "epoch": 3924} {"train_loss": -7.014932155609131, "global_step": 164813, "epoch": 3924} {"train_loss": -6.96555233001709, "global_step": 164814, "epoch": 3924} {"train_loss": -7.002480506896973, "global_step": 164815, "epoch": 3924} {"train_loss": -7.024196147918701, "global_step": 164816, "epoch": 3924} {"train_loss": -6.855568885803223, "global_step": 164817, "epoch": 3924} {"train_loss": -6.881954193115234, "global_step": 164818, "epoch": 3924} {"train_loss": -7.062711238861084, "global_step": 164819, "epoch": 3924} {"train_loss": -6.79203462600708, "global_step": 164820, "epoch": 3924} {"train_loss": -6.984321594238281, "global_step": 164821, "epoch": 3924} {"train_loss": -6.989806175231934, "global_step": 164822, "epoch": 3924} {"train_loss": -6.952519416809082, "global_step": 164823, "epoch": 3924} {"train_loss": -6.979497909545898, "global_step": 164824, "epoch": 3924} {"train_loss": -6.8824357986450195, "global_step": 164825, "epoch": 3924} {"train_loss": -6.842888832092285, "global_step": 164826, "epoch": 3924} {"train_loss": -6.834733963012695, "global_step": 164827, "epoch": 3924} {"train_loss": -6.8677263259887695, "global_step": 164828, "epoch": 3924} {"train_loss": -6.981868267059326, "global_step": 164829, "epoch": 3924} {"train_loss": -6.971375465393066, "global_step": 164830, "epoch": 3924} {"train_loss": -6.992850303649902, "global_step": 164831, "epoch": 3924} {"train_loss": -7.0609869956970215, "global_step": 164832, "epoch": 3924} {"train_loss": -6.885745048522949, "global_step": 164833, "epoch": 3924} {"train_loss": -6.9336957931518555, "global_step": 164834, "epoch": 3924} {"train_loss": -6.973647117614746, "global_step": 164835, "epoch": 3924} {"train_loss": -6.908686637878418, "global_step": 164836, "epoch": 3924} {"train_loss": -6.886025428771973, "global_step": 164837, "epoch": 3924} {"train_loss": -7.009801864624023, "global_step": 164838, "epoch": 3924} {"train_loss": -6.933415412902832, "global_step": 164839, "epoch": 3924} {"train_loss": -7.025068283081055, "global_step": 164840, "epoch": 3924} {"train_loss": -6.858630180358887, "global_step": 164841, "epoch": 3924} {"train_loss": -6.904778957366943, "global_step": 164842, "epoch": 3924} {"train_loss": -6.895930290222168, "global_step": 164843, "epoch": 3924} {"train_loss": -6.966691017150879, "global_step": 164844, "epoch": 3924} {"train_loss": -6.873220920562744, "global_step": 164845, "epoch": 3924} {"train_loss": -6.914280891418457, "global_step": 164846, "epoch": 3924} {"train_loss": -6.88043737411499, "global_step": 164847, "epoch": 3924} {"train_loss": -6.951650619506836, "global_step": 164848, "epoch": 3924} {"train_loss": -6.944284416380382, "global_step": 164849, "epoch": 3924, "val_loss": 68474.7421875} {"train_loss": -6.969097137451172, "global_step": 164850, "epoch": 3925} {"train_loss": -6.9436750411987305, "global_step": 164851, "epoch": 3925} {"train_loss": -6.8845953941345215, "global_step": 164852, "epoch": 3925} {"train_loss": -6.8957929611206055, "global_step": 164853, "epoch": 3925} {"train_loss": -6.977237701416016, "global_step": 164854, "epoch": 3925} {"train_loss": -6.857149600982666, "global_step": 164855, "epoch": 3925} {"train_loss": -6.877639293670654, "global_step": 164856, "epoch": 3925} {"train_loss": -7.0048136711120605, "global_step": 164857, "epoch": 3925} {"train_loss": -6.914666175842285, "global_step": 164858, "epoch": 3925} {"train_loss": -6.734721660614014, "global_step": 164859, "epoch": 3925} {"train_loss": -6.976737976074219, "global_step": 164860, "epoch": 3925} {"train_loss": -6.823966026306152, "global_step": 164861, "epoch": 3925} {"train_loss": -6.967061996459961, "global_step": 164862, "epoch": 3925} {"train_loss": -6.869052886962891, "global_step": 164863, "epoch": 3925} {"train_loss": -6.84270715713501, "global_step": 164864, "epoch": 3925} {"train_loss": -7.012326717376709, "global_step": 164865, "epoch": 3925} {"train_loss": -6.881895065307617, "global_step": 164866, "epoch": 3925} {"train_loss": -6.823836803436279, "global_step": 164867, "epoch": 3925} {"train_loss": -6.751677513122559, "global_step": 164868, "epoch": 3925} {"train_loss": -6.854036331176758, "global_step": 164869, "epoch": 3925} {"train_loss": -6.814765930175781, "global_step": 164870, "epoch": 3925} {"train_loss": -6.769363880157471, "global_step": 164871, "epoch": 3925} {"train_loss": -6.835360050201416, "global_step": 164872, "epoch": 3925} {"train_loss": -6.784720420837402, "global_step": 164873, "epoch": 3925} {"train_loss": -6.687061309814453, "global_step": 164874, "epoch": 3925} {"train_loss": -6.763991355895996, "global_step": 164875, "epoch": 3925} {"train_loss": -6.51452112197876, "global_step": 164876, "epoch": 3925} {"train_loss": -6.856436729431152, "global_step": 164877, "epoch": 3925} {"train_loss": -6.627176284790039, "global_step": 164878, "epoch": 3925} {"train_loss": -6.732748985290527, "global_step": 164879, "epoch": 3925} {"train_loss": -6.723405838012695, "global_step": 164880, "epoch": 3925} {"train_loss": -6.577815055847168, "global_step": 164881, "epoch": 3925} {"train_loss": -6.826493263244629, "global_step": 164882, "epoch": 3925} {"train_loss": -6.687816143035889, "global_step": 164883, "epoch": 3925} {"train_loss": -6.838744163513184, "global_step": 164884, "epoch": 3925} {"train_loss": -6.78959846496582, "global_step": 164885, "epoch": 3925} {"train_loss": -6.853926658630371, "global_step": 164886, "epoch": 3925} {"train_loss": -6.694899559020996, "global_step": 164887, "epoch": 3925} {"train_loss": -6.793863773345947, "global_step": 164888, "epoch": 3925} {"train_loss": -6.7982869148254395, "global_step": 164889, "epoch": 3925} {"train_loss": -6.8633623123168945, "global_step": 164890, "epoch": 3925} {"train_loss": -6.820641687938145, "global_step": 164891, "epoch": 3925, "val_loss": 68525.140625} {"train_loss": -6.783331871032715, "global_step": 164892, "epoch": 3926} {"train_loss": -6.850142478942871, "global_step": 164893, "epoch": 3926} {"train_loss": -6.920008659362793, "global_step": 164894, "epoch": 3926} {"train_loss": -6.913106918334961, "global_step": 164895, "epoch": 3926} {"train_loss": -6.929688453674316, "global_step": 164896, "epoch": 3926} {"train_loss": -6.9246134757995605, "global_step": 164897, "epoch": 3926} {"train_loss": -7.013760566711426, "global_step": 164898, "epoch": 3926} {"train_loss": -6.887561798095703, "global_step": 164899, "epoch": 3926} {"train_loss": -6.88310432434082, "global_step": 164900, "epoch": 3926} {"train_loss": -6.7687225341796875, "global_step": 164901, "epoch": 3926} {"train_loss": -6.784998893737793, "global_step": 164902, "epoch": 3926} {"train_loss": -6.918276309967041, "global_step": 164903, "epoch": 3926} {"train_loss": -6.972796440124512, "global_step": 164904, "epoch": 3926} {"train_loss": -6.9000043869018555, "global_step": 164905, "epoch": 3926} {"train_loss": -6.938218116760254, "global_step": 164906, "epoch": 3926} {"train_loss": -6.958395957946777, "global_step": 164907, "epoch": 3926} {"train_loss": -6.980390548706055, "global_step": 164908, "epoch": 3926} {"train_loss": -6.956367492675781, "global_step": 164909, "epoch": 3926} {"train_loss": -6.904042720794678, "global_step": 164910, "epoch": 3926} {"train_loss": -6.995922565460205, "global_step": 164911, "epoch": 3926} {"train_loss": -6.896261692047119, "global_step": 164912, "epoch": 3926} {"train_loss": -7.02816915512085, "global_step": 164913, "epoch": 3926} {"train_loss": -6.946816444396973, "global_step": 164914, "epoch": 3926} {"train_loss": -6.957229137420654, "global_step": 164915, "epoch": 3926} {"train_loss": -6.972830772399902, "global_step": 164916, "epoch": 3926} {"train_loss": -6.987671852111816, "global_step": 164917, "epoch": 3926} {"train_loss": -6.953131675720215, "global_step": 164918, "epoch": 3926} {"train_loss": -6.934239387512207, "global_step": 164919, "epoch": 3926} {"train_loss": -6.911714553833008, "global_step": 164920, "epoch": 3926} {"train_loss": -7.013265609741211, "global_step": 164921, "epoch": 3926} {"train_loss": -6.924734592437744, "global_step": 164922, "epoch": 3926} {"train_loss": -7.017666816711426, "global_step": 164923, "epoch": 3926} {"train_loss": -6.9453959465026855, "global_step": 164924, "epoch": 3926} {"train_loss": -6.902033805847168, "global_step": 164925, "epoch": 3926} {"train_loss": -6.987351417541504, "global_step": 164926, "epoch": 3926} {"train_loss": -6.820940017700195, "global_step": 164927, "epoch": 3926} {"train_loss": -6.920764923095703, "global_step": 164928, "epoch": 3926} {"train_loss": -7.044195652008057, "global_step": 164929, "epoch": 3926} {"train_loss": -6.882519245147705, "global_step": 164930, "epoch": 3926} {"train_loss": -6.842816352844238, "global_step": 164931, "epoch": 3926} {"train_loss": -6.820221900939941, "global_step": 164932, "epoch": 3926} {"train_loss": -6.921940258571079, "global_step": 164933, "epoch": 3926, "val_loss": 68684.953125} {"train_loss": -6.926085472106934, "global_step": 164934, "epoch": 3927} {"train_loss": -6.845512390136719, "global_step": 164935, "epoch": 3927} {"train_loss": -7.072807312011719, "global_step": 164936, "epoch": 3927} {"train_loss": -6.851082801818848, "global_step": 164937, "epoch": 3927} {"train_loss": -6.868592739105225, "global_step": 164938, "epoch": 3927} {"train_loss": -6.902894020080566, "global_step": 164939, "epoch": 3927} {"train_loss": -6.9654388427734375, "global_step": 164940, "epoch": 3927} {"train_loss": -7.061324596405029, "global_step": 164941, "epoch": 3927} {"train_loss": -6.897072792053223, "global_step": 164942, "epoch": 3927} {"train_loss": -6.878609657287598, "global_step": 164943, "epoch": 3927} {"train_loss": -7.12615966796875, "global_step": 164944, "epoch": 3927} {"train_loss": -6.958871841430664, "global_step": 164945, "epoch": 3927} {"train_loss": -6.925705432891846, "global_step": 164946, "epoch": 3927} {"train_loss": -6.815378189086914, "global_step": 164947, "epoch": 3927} {"train_loss": -6.874324321746826, "global_step": 164948, "epoch": 3927} {"train_loss": -6.919344902038574, "global_step": 164949, "epoch": 3927} {"train_loss": -6.992259502410889, "global_step": 164950, "epoch": 3927} {"train_loss": -6.98280143737793, "global_step": 164951, "epoch": 3927} {"train_loss": -6.956551551818848, "global_step": 164952, "epoch": 3927} {"train_loss": -7.016674995422363, "global_step": 164953, "epoch": 3927} {"train_loss": -7.0194878578186035, "global_step": 164954, "epoch": 3927} {"train_loss": -6.886390686035156, "global_step": 164955, "epoch": 3927} {"train_loss": -7.0028533935546875, "global_step": 164956, "epoch": 3927} {"train_loss": -6.943878173828125, "global_step": 164957, "epoch": 3927} {"train_loss": -6.884084701538086, "global_step": 164958, "epoch": 3927} {"train_loss": -7.017927169799805, "global_step": 164959, "epoch": 3927} {"train_loss": -6.981407165527344, "global_step": 164960, "epoch": 3927} {"train_loss": -6.9668121337890625, "global_step": 164961, "epoch": 3927} {"train_loss": -7.013089179992676, "global_step": 164962, "epoch": 3927} {"train_loss": -6.889741897583008, "global_step": 164963, "epoch": 3927} {"train_loss": -6.967446327209473, "global_step": 164964, "epoch": 3927} {"train_loss": -6.964629650115967, "global_step": 164965, "epoch": 3927} {"train_loss": -6.903009414672852, "global_step": 164966, "epoch": 3927} {"train_loss": -6.93393087387085, "global_step": 164967, "epoch": 3927} {"train_loss": -7.074267387390137, "global_step": 164968, "epoch": 3927} {"train_loss": -7.020637035369873, "global_step": 164969, "epoch": 3927} {"train_loss": -7.0752458572387695, "global_step": 164970, "epoch": 3927} {"train_loss": -6.923776149749756, "global_step": 164971, "epoch": 3927} {"train_loss": -6.949241638183594, "global_step": 164972, "epoch": 3927} {"train_loss": -6.961343288421631, "global_step": 164973, "epoch": 3927} {"train_loss": -6.802838325500488, "global_step": 164974, "epoch": 3927} {"train_loss": -6.952059041886103, "global_step": 164975, "epoch": 3927, "val_loss": 68445.4140625} {"train_loss": -6.844745635986328, "global_step": 164976, "epoch": 3928} {"train_loss": -6.870952606201172, "global_step": 164977, "epoch": 3928} {"train_loss": -6.941582202911377, "global_step": 164978, "epoch": 3928} {"train_loss": -7.121046543121338, "global_step": 164979, "epoch": 3928} {"train_loss": -6.899945259094238, "global_step": 164980, "epoch": 3928} {"train_loss": -6.915569305419922, "global_step": 164981, "epoch": 3928} {"train_loss": -6.954367637634277, "global_step": 164982, "epoch": 3928} {"train_loss": -6.958067893981934, "global_step": 164983, "epoch": 3928} {"train_loss": -6.95934534072876, "global_step": 164984, "epoch": 3928} {"train_loss": -6.907535552978516, "global_step": 164985, "epoch": 3928} {"train_loss": -6.89776611328125, "global_step": 164986, "epoch": 3928} {"train_loss": -6.968874454498291, "global_step": 164987, "epoch": 3928} {"train_loss": -7.008495330810547, "global_step": 164988, "epoch": 3928} {"train_loss": -6.81674337387085, "global_step": 164989, "epoch": 3928} {"train_loss": -7.056704521179199, "global_step": 164990, "epoch": 3928} {"train_loss": -6.9647955894470215, "global_step": 164991, "epoch": 3928} {"train_loss": -6.971652984619141, "global_step": 164992, "epoch": 3928} {"train_loss": -7.07512092590332, "global_step": 164993, "epoch": 3928} {"train_loss": -6.850844383239746, "global_step": 164994, "epoch": 3928} {"train_loss": -6.937360763549805, "global_step": 164995, "epoch": 3928} {"train_loss": -6.919437408447266, "global_step": 164996, "epoch": 3928} {"train_loss": -6.947072982788086, "global_step": 164997, "epoch": 3928} {"train_loss": -6.870301246643066, "global_step": 164998, "epoch": 3928} {"train_loss": -6.858428955078125, "global_step": 164999, "epoch": 3928} {"train_loss": -6.842761993408203, "global_step": 165000, "epoch": 3928} {"train_loss": -6.740436553955078, "global_step": 165001, "epoch": 3928} {"train_loss": -6.8233537673950195, "global_step": 165002, "epoch": 3928} {"train_loss": -6.835518836975098, "global_step": 165003, "epoch": 3928} {"train_loss": -6.934637069702148, "global_step": 165004, "epoch": 3928} {"train_loss": -6.935911178588867, "global_step": 165005, "epoch": 3928} {"train_loss": -6.925220966339111, "global_step": 165006, "epoch": 3928} {"train_loss": -7.0268707275390625, "global_step": 165007, "epoch": 3928} {"train_loss": -6.759390354156494, "global_step": 165008, "epoch": 3928} {"train_loss": -6.969926834106445, "global_step": 165009, "epoch": 3928} {"train_loss": -6.930169582366943, "global_step": 165010, "epoch": 3928} {"train_loss": -6.828656196594238, "global_step": 165011, "epoch": 3928} {"train_loss": -7.018472194671631, "global_step": 165012, "epoch": 3928} {"train_loss": -6.853654861450195, "global_step": 165013, "epoch": 3928} {"train_loss": -6.886144638061523, "global_step": 165014, "epoch": 3928} {"train_loss": -6.795869827270508, "global_step": 165015, "epoch": 3928} {"train_loss": -6.882640361785889, "global_step": 165016, "epoch": 3928} {"train_loss": -6.915039505277361, "global_step": 165017, "epoch": 3928, "val_loss": 68772.5078125} {"train_loss": -6.9606523513793945, "global_step": 165018, "epoch": 3929} {"train_loss": -6.986014366149902, "global_step": 165019, "epoch": 3929} {"train_loss": -6.9259796142578125, "global_step": 165020, "epoch": 3929} {"train_loss": -6.862766265869141, "global_step": 165021, "epoch": 3929} {"train_loss": -6.793580532073975, "global_step": 165022, "epoch": 3929} {"train_loss": -7.05265998840332, "global_step": 165023, "epoch": 3929} {"train_loss": -6.968881607055664, "global_step": 165024, "epoch": 3929} {"train_loss": -6.998023509979248, "global_step": 165025, "epoch": 3929} {"train_loss": -6.987546920776367, "global_step": 165026, "epoch": 3929} {"train_loss": -6.954014778137207, "global_step": 165027, "epoch": 3929} {"train_loss": -6.956451416015625, "global_step": 165028, "epoch": 3929} {"train_loss": -6.992398262023926, "global_step": 165029, "epoch": 3929} {"train_loss": -6.946829319000244, "global_step": 165030, "epoch": 3929} {"train_loss": -7.061450004577637, "global_step": 165031, "epoch": 3929} {"train_loss": -7.050995826721191, "global_step": 165032, "epoch": 3929} {"train_loss": -7.049332618713379, "global_step": 165033, "epoch": 3929} {"train_loss": -6.926002502441406, "global_step": 165034, "epoch": 3929} {"train_loss": -7.083062648773193, "global_step": 165035, "epoch": 3929} {"train_loss": -6.958024978637695, "global_step": 165036, "epoch": 3929} {"train_loss": -7.105119705200195, "global_step": 165037, "epoch": 3929} {"train_loss": -7.019523620605469, "global_step": 165038, "epoch": 3929} {"train_loss": -6.930332183837891, "global_step": 165039, "epoch": 3929} {"train_loss": -6.950411796569824, "global_step": 165040, "epoch": 3929} {"train_loss": -6.949316024780273, "global_step": 165041, "epoch": 3929} {"train_loss": -6.917673110961914, "global_step": 165042, "epoch": 3929} {"train_loss": -6.963569164276123, "global_step": 165043, "epoch": 3929} {"train_loss": -6.940043926239014, "global_step": 165044, "epoch": 3929} {"train_loss": -6.945071220397949, "global_step": 165045, "epoch": 3929} {"train_loss": -7.068450927734375, "global_step": 165046, "epoch": 3929} {"train_loss": -6.897909641265869, "global_step": 165047, "epoch": 3929} {"train_loss": -7.008801460266113, "global_step": 165048, "epoch": 3929} {"train_loss": -7.018616199493408, "global_step": 165049, "epoch": 3929} {"train_loss": -6.922416687011719, "global_step": 165050, "epoch": 3929} {"train_loss": -6.936583995819092, "global_step": 165051, "epoch": 3929} {"train_loss": -7.005813121795654, "global_step": 165052, "epoch": 3929} {"train_loss": -7.0629563331604, "global_step": 165053, "epoch": 3929} {"train_loss": -6.889565944671631, "global_step": 165054, "epoch": 3929} {"train_loss": -6.968506813049316, "global_step": 165055, "epoch": 3929} {"train_loss": -7.114279747009277, "global_step": 165056, "epoch": 3929} {"train_loss": -6.990758895874023, "global_step": 165057, "epoch": 3929} {"train_loss": -6.968299865722656, "global_step": 165058, "epoch": 3929} {"train_loss": -6.979148444675264, "global_step": 165059, "epoch": 3929, "val_loss": 68595.2890625} {"train_loss": -6.801159858703613, "global_step": 165060, "epoch": 3930} {"train_loss": -6.916362762451172, "global_step": 165061, "epoch": 3930} {"train_loss": -6.92911434173584, "global_step": 165062, "epoch": 3930} {"train_loss": -6.951035499572754, "global_step": 165063, "epoch": 3930} {"train_loss": -6.685126781463623, "global_step": 165064, "epoch": 3930} {"train_loss": -6.8262505531311035, "global_step": 165065, "epoch": 3930} {"train_loss": -6.8087158203125, "global_step": 165066, "epoch": 3930} {"train_loss": -6.752985000610352, "global_step": 165067, "epoch": 3930} {"train_loss": -6.730993270874023, "global_step": 165068, "epoch": 3930} {"train_loss": -6.669289588928223, "global_step": 165069, "epoch": 3930} {"train_loss": -7.000723838806152, "global_step": 165070, "epoch": 3930} {"train_loss": -6.85989236831665, "global_step": 165071, "epoch": 3930} {"train_loss": -6.744353771209717, "global_step": 165072, "epoch": 3930} {"train_loss": -6.898025035858154, "global_step": 165073, "epoch": 3930} {"train_loss": -6.807254314422607, "global_step": 165074, "epoch": 3930} {"train_loss": -6.979879379272461, "global_step": 165075, "epoch": 3930} {"train_loss": -6.839450836181641, "global_step": 165076, "epoch": 3930} {"train_loss": -6.747561931610107, "global_step": 165077, "epoch": 3930} {"train_loss": -6.840123653411865, "global_step": 165078, "epoch": 3930} {"train_loss": -6.8374714851379395, "global_step": 165079, "epoch": 3930} {"train_loss": -6.8856658935546875, "global_step": 165080, "epoch": 3930} {"train_loss": -6.898049354553223, "global_step": 165081, "epoch": 3930} {"train_loss": -6.7328386306762695, "global_step": 165082, "epoch": 3930} {"train_loss": -6.843454360961914, "global_step": 165083, "epoch": 3930} {"train_loss": -6.783447742462158, "global_step": 165084, "epoch": 3930} {"train_loss": -6.823633193969727, "global_step": 165085, "epoch": 3930} {"train_loss": -6.688114166259766, "global_step": 165086, "epoch": 3930} {"train_loss": -6.876073837280273, "global_step": 165087, "epoch": 3930} {"train_loss": -6.874213218688965, "global_step": 165088, "epoch": 3930} {"train_loss": -6.861983299255371, "global_step": 165089, "epoch": 3930} {"train_loss": -6.801033973693848, "global_step": 165090, "epoch": 3930} {"train_loss": -6.776201248168945, "global_step": 165091, "epoch": 3930} {"train_loss": -6.901230812072754, "global_step": 165092, "epoch": 3930} {"train_loss": -6.925723075866699, "global_step": 165093, "epoch": 3930} {"train_loss": -6.884099960327148, "global_step": 165094, "epoch": 3930} {"train_loss": -6.805935382843018, "global_step": 165095, "epoch": 3930} {"train_loss": -6.887286186218262, "global_step": 165096, "epoch": 3930} {"train_loss": -6.853445053100586, "global_step": 165097, "epoch": 3930} {"train_loss": -6.842227935791016, "global_step": 165098, "epoch": 3930} {"train_loss": -6.887190818786621, "global_step": 165099, "epoch": 3930} {"train_loss": -6.835944175720215, "global_step": 165100, "epoch": 3930} {"train_loss": -6.837702671686809, "global_step": 165101, "epoch": 3930, "val_loss": 68769.4921875} {"train_loss": -6.735228538513184, "global_step": 165102, "epoch": 3931} {"train_loss": -6.864561080932617, "global_step": 165103, "epoch": 3931} {"train_loss": -6.855548858642578, "global_step": 165104, "epoch": 3931} {"train_loss": -6.795934677124023, "global_step": 165105, "epoch": 3931} {"train_loss": -6.931941986083984, "global_step": 165106, "epoch": 3931} {"train_loss": -6.803549766540527, "global_step": 165107, "epoch": 3931} {"train_loss": -6.985845565795898, "global_step": 165108, "epoch": 3931} {"train_loss": -6.880216598510742, "global_step": 165109, "epoch": 3931} {"train_loss": -6.866677284240723, "global_step": 165110, "epoch": 3931} {"train_loss": -7.018434524536133, "global_step": 165111, "epoch": 3931} {"train_loss": -6.827785968780518, "global_step": 165112, "epoch": 3931} {"train_loss": -6.783093452453613, "global_step": 165113, "epoch": 3931} {"train_loss": -6.880913734436035, "global_step": 165114, "epoch": 3931} {"train_loss": -7.017368316650391, "global_step": 165115, "epoch": 3931} {"train_loss": -7.0351057052612305, "global_step": 165116, "epoch": 3931} {"train_loss": -6.998465061187744, "global_step": 165117, "epoch": 3931} {"train_loss": -6.937869071960449, "global_step": 165118, "epoch": 3931} {"train_loss": -6.925577163696289, "global_step": 165119, "epoch": 3931} {"train_loss": -6.883878707885742, "global_step": 165120, "epoch": 3931} {"train_loss": -6.955140113830566, "global_step": 165121, "epoch": 3931} {"train_loss": -6.9582414627075195, "global_step": 165122, "epoch": 3931} {"train_loss": -6.9690046310424805, "global_step": 165123, "epoch": 3931} {"train_loss": -6.9183349609375, "global_step": 165124, "epoch": 3931} {"train_loss": -7.0641770362854, "global_step": 165125, "epoch": 3931} {"train_loss": -6.8746232986450195, "global_step": 165126, "epoch": 3931} {"train_loss": -6.990928649902344, "global_step": 165127, "epoch": 3931} {"train_loss": -6.9739179611206055, "global_step": 165128, "epoch": 3931} {"train_loss": -6.92136287689209, "global_step": 165129, "epoch": 3931} {"train_loss": -7.02984619140625, "global_step": 165130, "epoch": 3931} {"train_loss": -7.001587867736816, "global_step": 165131, "epoch": 3931} {"train_loss": -6.961756706237793, "global_step": 165132, "epoch": 3931} {"train_loss": -7.010875701904297, "global_step": 165133, "epoch": 3931} {"train_loss": -7.045062065124512, "global_step": 165134, "epoch": 3931} {"train_loss": -6.956899642944336, "global_step": 165135, "epoch": 3931} {"train_loss": -6.952027320861816, "global_step": 165136, "epoch": 3931} {"train_loss": -7.0280561447143555, "global_step": 165137, "epoch": 3931} {"train_loss": -7.037751197814941, "global_step": 165138, "epoch": 3931} {"train_loss": -6.951818466186523, "global_step": 165139, "epoch": 3931} {"train_loss": -7.037888526916504, "global_step": 165140, "epoch": 3931} {"train_loss": -7.0715436935424805, "global_step": 165141, "epoch": 3931} {"train_loss": -6.901854991912842, "global_step": 165142, "epoch": 3931} {"train_loss": -6.943293707711356, "global_step": 165143, "epoch": 3931, "val_loss": 68490.453125} {"train_loss": -6.934359550476074, "global_step": 165144, "epoch": 3932} {"train_loss": -7.004168510437012, "global_step": 165145, "epoch": 3932} {"train_loss": -6.9299774169921875, "global_step": 165146, "epoch": 3932} {"train_loss": -6.9482831954956055, "global_step": 165147, "epoch": 3932} {"train_loss": -7.041940689086914, "global_step": 165148, "epoch": 3932} {"train_loss": -7.044719696044922, "global_step": 165149, "epoch": 3932} {"train_loss": -7.041250705718994, "global_step": 165150, "epoch": 3932} {"train_loss": -7.081300735473633, "global_step": 165151, "epoch": 3932} {"train_loss": -6.888036251068115, "global_step": 165152, "epoch": 3932} {"train_loss": -6.958405017852783, "global_step": 165153, "epoch": 3932} {"train_loss": -6.949161529541016, "global_step": 165154, "epoch": 3932} {"train_loss": -7.041219711303711, "global_step": 165155, "epoch": 3932} {"train_loss": -6.9474568367004395, "global_step": 165156, "epoch": 3932} {"train_loss": -6.930561065673828, "global_step": 165157, "epoch": 3932} {"train_loss": -6.9825825691223145, "global_step": 165158, "epoch": 3932} {"train_loss": -6.926483154296875, "global_step": 165159, "epoch": 3932} {"train_loss": -6.912563323974609, "global_step": 165160, "epoch": 3932} {"train_loss": -6.741827011108398, "global_step": 165161, "epoch": 3932} {"train_loss": -6.929259300231934, "global_step": 165162, "epoch": 3932} {"train_loss": -6.8793792724609375, "global_step": 165163, "epoch": 3932} {"train_loss": -6.839122772216797, "global_step": 165164, "epoch": 3932} {"train_loss": -6.999127388000488, "global_step": 165165, "epoch": 3932} {"train_loss": -6.943126678466797, "global_step": 165166, "epoch": 3932} {"train_loss": -6.690495491027832, "global_step": 165167, "epoch": 3932} {"train_loss": -6.913311004638672, "global_step": 165168, "epoch": 3932} {"train_loss": -6.8074421882629395, "global_step": 165169, "epoch": 3932} {"train_loss": -6.823482990264893, "global_step": 165170, "epoch": 3932} {"train_loss": -6.914541721343994, "global_step": 165171, "epoch": 3932} {"train_loss": -6.781865119934082, "global_step": 165172, "epoch": 3932} {"train_loss": -7.056246757507324, "global_step": 165173, "epoch": 3932} {"train_loss": -6.940502643585205, "global_step": 165174, "epoch": 3932} {"train_loss": -6.955117225646973, "global_step": 165175, "epoch": 3932} {"train_loss": -7.0365705490112305, "global_step": 165176, "epoch": 3932} {"train_loss": -6.834268569946289, "global_step": 165177, "epoch": 3932} {"train_loss": -6.892505645751953, "global_step": 165178, "epoch": 3932} {"train_loss": -6.82966423034668, "global_step": 165179, "epoch": 3932} {"train_loss": -6.827198028564453, "global_step": 165180, "epoch": 3932} {"train_loss": -6.920022010803223, "global_step": 165181, "epoch": 3932} {"train_loss": -6.810333251953125, "global_step": 165182, "epoch": 3932} {"train_loss": -6.972234725952148, "global_step": 165183, "epoch": 3932} {"train_loss": -6.944840431213379, "global_step": 165184, "epoch": 3932} {"train_loss": -6.922855354490734, "global_step": 165185, "epoch": 3932, "val_loss": 68726.1796875} {"train_loss": -6.96221399307251, "global_step": 165186, "epoch": 3933} {"train_loss": -6.790770053863525, "global_step": 165187, "epoch": 3933} {"train_loss": -6.905061721801758, "global_step": 165188, "epoch": 3933} {"train_loss": -6.88858699798584, "global_step": 165189, "epoch": 3933} {"train_loss": -6.890374660491943, "global_step": 165190, "epoch": 3933} {"train_loss": -7.01956033706665, "global_step": 165191, "epoch": 3933} {"train_loss": -6.867006301879883, "global_step": 165192, "epoch": 3933} {"train_loss": -6.953237533569336, "global_step": 165193, "epoch": 3933} {"train_loss": -6.765578269958496, "global_step": 165194, "epoch": 3933} {"train_loss": -6.958354473114014, "global_step": 165195, "epoch": 3933} {"train_loss": -6.922283172607422, "global_step": 165196, "epoch": 3933} {"train_loss": -6.9330244064331055, "global_step": 165197, "epoch": 3933} {"train_loss": -6.9180684089660645, "global_step": 165198, "epoch": 3933} {"train_loss": -7.021697044372559, "global_step": 165199, "epoch": 3933} {"train_loss": -6.9538984298706055, "global_step": 165200, "epoch": 3933} {"train_loss": -6.925748825073242, "global_step": 165201, "epoch": 3933} {"train_loss": -6.934081077575684, "global_step": 165202, "epoch": 3933} {"train_loss": -6.856562614440918, "global_step": 165203, "epoch": 3933} {"train_loss": -6.869075298309326, "global_step": 165204, "epoch": 3933} {"train_loss": -6.962817192077637, "global_step": 165205, "epoch": 3933} {"train_loss": -6.9090681076049805, "global_step": 165206, "epoch": 3933} {"train_loss": -6.954550266265869, "global_step": 165207, "epoch": 3933} {"train_loss": -7.016207695007324, "global_step": 165208, "epoch": 3933} {"train_loss": -7.051693916320801, "global_step": 165209, "epoch": 3933} {"train_loss": -6.938519477844238, "global_step": 165210, "epoch": 3933} {"train_loss": -6.928627014160156, "global_step": 165211, "epoch": 3933} {"train_loss": -7.105679988861084, "global_step": 165212, "epoch": 3933} {"train_loss": -7.002075672149658, "global_step": 165213, "epoch": 3933} {"train_loss": -6.999757289886475, "global_step": 165214, "epoch": 3933} {"train_loss": -6.94029426574707, "global_step": 165215, "epoch": 3933} {"train_loss": -7.046684265136719, "global_step": 165216, "epoch": 3933} {"train_loss": -7.021673202514648, "global_step": 165217, "epoch": 3933} {"train_loss": -6.963742256164551, "global_step": 165218, "epoch": 3933} {"train_loss": -7.032533168792725, "global_step": 165219, "epoch": 3933} {"train_loss": -6.902468681335449, "global_step": 165220, "epoch": 3933} {"train_loss": -6.894282341003418, "global_step": 165221, "epoch": 3933} {"train_loss": -6.997082710266113, "global_step": 165222, "epoch": 3933} {"train_loss": -6.959225654602051, "global_step": 165223, "epoch": 3933} {"train_loss": -6.920042991638184, "global_step": 165224, "epoch": 3933} {"train_loss": -6.983265399932861, "global_step": 165225, "epoch": 3933} {"train_loss": -7.095665454864502, "global_step": 165226, "epoch": 3933} {"train_loss": -6.951201790855045, "global_step": 165227, "epoch": 3933, "val_loss": 68547.0078125} {"train_loss": -7.037073135375977, "global_step": 165228, "epoch": 3934} {"train_loss": -6.970418930053711, "global_step": 165229, "epoch": 3934} {"train_loss": -6.9302263259887695, "global_step": 165230, "epoch": 3934} {"train_loss": -6.955121994018555, "global_step": 165231, "epoch": 3934} {"train_loss": -6.9597930908203125, "global_step": 165232, "epoch": 3934} {"train_loss": -6.912021636962891, "global_step": 165233, "epoch": 3934} {"train_loss": -7.010165214538574, "global_step": 165234, "epoch": 3934} {"train_loss": -6.888841152191162, "global_step": 165235, "epoch": 3934} {"train_loss": -6.913886070251465, "global_step": 165236, "epoch": 3934} {"train_loss": -6.828795433044434, "global_step": 165237, "epoch": 3934} {"train_loss": -6.937860488891602, "global_step": 165238, "epoch": 3934} {"train_loss": -6.947611331939697, "global_step": 165239, "epoch": 3934} {"train_loss": -6.895517349243164, "global_step": 165240, "epoch": 3934} {"train_loss": -7.023076057434082, "global_step": 165241, "epoch": 3934} {"train_loss": -6.8447489738464355, "global_step": 165242, "epoch": 3934} {"train_loss": -6.838541030883789, "global_step": 165243, "epoch": 3934} {"train_loss": -6.933503150939941, "global_step": 165244, "epoch": 3934} {"train_loss": -7.061677932739258, "global_step": 165245, "epoch": 3934} {"train_loss": -7.04620361328125, "global_step": 165246, "epoch": 3934} {"train_loss": -6.930981636047363, "global_step": 165247, "epoch": 3934} {"train_loss": -6.912566184997559, "global_step": 165248, "epoch": 3934} {"train_loss": -6.868596076965332, "global_step": 165249, "epoch": 3934} {"train_loss": -6.840668201446533, "global_step": 165250, "epoch": 3934} {"train_loss": -6.978719711303711, "global_step": 165251, "epoch": 3934} {"train_loss": -6.769655227661133, "global_step": 165252, "epoch": 3934} {"train_loss": -6.893069267272949, "global_step": 165253, "epoch": 3934} {"train_loss": -6.962453842163086, "global_step": 165254, "epoch": 3934} {"train_loss": -6.905242443084717, "global_step": 165255, "epoch": 3934} {"train_loss": -6.913745403289795, "global_step": 165256, "epoch": 3934} {"train_loss": -6.962453842163086, "global_step": 165257, "epoch": 3934} {"train_loss": -6.9368743896484375, "global_step": 165258, "epoch": 3934} {"train_loss": -6.969976425170898, "global_step": 165259, "epoch": 3934} {"train_loss": -6.967569828033447, "global_step": 165260, "epoch": 3934} {"train_loss": -6.950031280517578, "global_step": 165261, "epoch": 3934} {"train_loss": -6.916778564453125, "global_step": 165262, "epoch": 3934} {"train_loss": -6.967389106750488, "global_step": 165263, "epoch": 3934} {"train_loss": -6.950189590454102, "global_step": 165264, "epoch": 3934} {"train_loss": -6.919200897216797, "global_step": 165265, "epoch": 3934} {"train_loss": -7.027750015258789, "global_step": 165266, "epoch": 3934} {"train_loss": -7.0262017250061035, "global_step": 165267, "epoch": 3934} {"train_loss": -6.7810444831848145, "global_step": 165268, "epoch": 3934} {"train_loss": -6.935066631862095, "global_step": 165269, "epoch": 3934, "val_loss": 68373.0859375} {"train_loss": -6.977394104003906, "global_step": 165270, "epoch": 3935} {"train_loss": -6.91096305847168, "global_step": 165271, "epoch": 3935} {"train_loss": -7.076329708099365, "global_step": 165272, "epoch": 3935} {"train_loss": -6.959907531738281, "global_step": 165273, "epoch": 3935} {"train_loss": -6.945790767669678, "global_step": 165274, "epoch": 3935} {"train_loss": -7.01611328125, "global_step": 165275, "epoch": 3935} {"train_loss": -7.0063371658325195, "global_step": 165276, "epoch": 3935} {"train_loss": -6.986824989318848, "global_step": 165277, "epoch": 3935} {"train_loss": -7.06649112701416, "global_step": 165278, "epoch": 3935} {"train_loss": -7.0901031494140625, "global_step": 165279, "epoch": 3935} {"train_loss": -7.086318492889404, "global_step": 165280, "epoch": 3935} {"train_loss": -6.953201770782471, "global_step": 165281, "epoch": 3935} {"train_loss": -6.979615211486816, "global_step": 165282, "epoch": 3935} {"train_loss": -6.86601448059082, "global_step": 165283, "epoch": 3935} {"train_loss": -6.895167350769043, "global_step": 165284, "epoch": 3935} {"train_loss": -6.906732559204102, "global_step": 165285, "epoch": 3935} {"train_loss": -6.819232940673828, "global_step": 165286, "epoch": 3935} {"train_loss": -6.938624382019043, "global_step": 165287, "epoch": 3935} {"train_loss": -6.939903259277344, "global_step": 165288, "epoch": 3935} {"train_loss": -6.845795154571533, "global_step": 165289, "epoch": 3935} {"train_loss": -6.877793788909912, "global_step": 165290, "epoch": 3935} {"train_loss": -6.911800384521484, "global_step": 165291, "epoch": 3935} {"train_loss": -6.783215522766113, "global_step": 165292, "epoch": 3935} {"train_loss": -6.807576656341553, "global_step": 165293, "epoch": 3935} {"train_loss": -6.987277984619141, "global_step": 165294, "epoch": 3935} {"train_loss": -6.902556419372559, "global_step": 165295, "epoch": 3935} {"train_loss": -6.875150680541992, "global_step": 165296, "epoch": 3935} {"train_loss": -6.932955265045166, "global_step": 165297, "epoch": 3935} {"train_loss": -6.759311676025391, "global_step": 165298, "epoch": 3935} {"train_loss": -6.735261917114258, "global_step": 165299, "epoch": 3935} {"train_loss": -6.862283706665039, "global_step": 165300, "epoch": 3935} {"train_loss": -6.84086275100708, "global_step": 165301, "epoch": 3935} {"train_loss": -6.892085075378418, "global_step": 165302, "epoch": 3935} {"train_loss": -6.763359069824219, "global_step": 165303, "epoch": 3935} {"train_loss": -6.777988433837891, "global_step": 165304, "epoch": 3935} {"train_loss": -6.714926242828369, "global_step": 165305, "epoch": 3935} {"train_loss": -6.806741714477539, "global_step": 165306, "epoch": 3935} {"train_loss": -6.828579902648926, "global_step": 165307, "epoch": 3935} {"train_loss": -6.714328765869141, "global_step": 165308, "epoch": 3935} {"train_loss": -6.850760459899902, "global_step": 165309, "epoch": 3935} {"train_loss": -6.680396556854248, "global_step": 165310, "epoch": 3935} {"train_loss": -6.889069148472378, "global_step": 165311, "epoch": 3935, "val_loss": 68780.640625} {"train_loss": -6.717587471008301, "global_step": 165312, "epoch": 3936} {"train_loss": -6.917417526245117, "global_step": 165313, "epoch": 3936} {"train_loss": -6.824017524719238, "global_step": 165314, "epoch": 3936} {"train_loss": -6.989242076873779, "global_step": 165315, "epoch": 3936} {"train_loss": -6.865657806396484, "global_step": 165316, "epoch": 3936} {"train_loss": -7.012839317321777, "global_step": 165317, "epoch": 3936} {"train_loss": -6.868381500244141, "global_step": 165318, "epoch": 3936} {"train_loss": -7.002789497375488, "global_step": 165319, "epoch": 3936} {"train_loss": -6.9086737632751465, "global_step": 165320, "epoch": 3936} {"train_loss": -6.840756416320801, "global_step": 165321, "epoch": 3936} {"train_loss": -6.924149990081787, "global_step": 165322, "epoch": 3936} {"train_loss": -6.922740459442139, "global_step": 165323, "epoch": 3936} {"train_loss": -6.898131370544434, "global_step": 165324, "epoch": 3936} {"train_loss": -7.044210433959961, "global_step": 165325, "epoch": 3936} {"train_loss": -6.84532356262207, "global_step": 165326, "epoch": 3936} {"train_loss": -7.063065528869629, "global_step": 165327, "epoch": 3936} {"train_loss": -6.932713985443115, "global_step": 165328, "epoch": 3936} {"train_loss": -6.949109077453613, "global_step": 165329, "epoch": 3936} {"train_loss": -6.98098611831665, "global_step": 165330, "epoch": 3936} {"train_loss": -6.993801593780518, "global_step": 165331, "epoch": 3936} {"train_loss": -6.856470108032227, "global_step": 165332, "epoch": 3936} {"train_loss": -6.763936519622803, "global_step": 165333, "epoch": 3936} {"train_loss": -6.980388641357422, "global_step": 165334, "epoch": 3936} {"train_loss": -6.871199607849121, "global_step": 165335, "epoch": 3936} {"train_loss": -6.9412407875061035, "global_step": 165336, "epoch": 3936} {"train_loss": -6.930322647094727, "global_step": 165337, "epoch": 3936} {"train_loss": -6.908708095550537, "global_step": 165338, "epoch": 3936} {"train_loss": -6.944314479827881, "global_step": 165339, "epoch": 3936} {"train_loss": -7.005354881286621, "global_step": 165340, "epoch": 3936} {"train_loss": -6.997097969055176, "global_step": 165341, "epoch": 3936} {"train_loss": -6.957969665527344, "global_step": 165342, "epoch": 3936} {"train_loss": -7.001194000244141, "global_step": 165343, "epoch": 3936} {"train_loss": -7.110139846801758, "global_step": 165344, "epoch": 3936} {"train_loss": -6.954565525054932, "global_step": 165345, "epoch": 3936} {"train_loss": -7.0087199211120605, "global_step": 165346, "epoch": 3936} {"train_loss": -6.910464286804199, "global_step": 165347, "epoch": 3936} {"train_loss": -6.935272216796875, "global_step": 165348, "epoch": 3936} {"train_loss": -6.995161533355713, "global_step": 165349, "epoch": 3936} {"train_loss": -7.142739772796631, "global_step": 165350, "epoch": 3936} {"train_loss": -6.888369560241699, "global_step": 165351, "epoch": 3936} {"train_loss": -7.123915195465088, "global_step": 165352, "epoch": 3936} {"train_loss": -6.947198935917446, "global_step": 165353, "epoch": 3936, "val_loss": 68468.0078125} {"train_loss": -7.071017265319824, "global_step": 165354, "epoch": 3937} {"train_loss": -7.123569965362549, "global_step": 165355, "epoch": 3937} {"train_loss": -6.952843189239502, "global_step": 165356, "epoch": 3937} {"train_loss": -6.901510238647461, "global_step": 165357, "epoch": 3937} {"train_loss": -6.947575569152832, "global_step": 165358, "epoch": 3937} {"train_loss": -7.071069240570068, "global_step": 165359, "epoch": 3937} {"train_loss": -6.965385437011719, "global_step": 165360, "epoch": 3937} {"train_loss": -7.100546836853027, "global_step": 165361, "epoch": 3937} {"train_loss": -7.0384979248046875, "global_step": 165362, "epoch": 3937} {"train_loss": -7.128780364990234, "global_step": 165363, "epoch": 3937} {"train_loss": -7.121577739715576, "global_step": 165364, "epoch": 3937} {"train_loss": -7.0121259689331055, "global_step": 165365, "epoch": 3937} {"train_loss": -7.034526348114014, "global_step": 165366, "epoch": 3937} {"train_loss": -7.04547643661499, "global_step": 165367, "epoch": 3937} {"train_loss": -6.992013931274414, "global_step": 165368, "epoch": 3937} {"train_loss": -6.882807731628418, "global_step": 165369, "epoch": 3937} {"train_loss": -7.03518009185791, "global_step": 165370, "epoch": 3937} {"train_loss": -7.015562057495117, "global_step": 165371, "epoch": 3937} {"train_loss": -6.850724220275879, "global_step": 165372, "epoch": 3937} {"train_loss": -6.9991912841796875, "global_step": 165373, "epoch": 3937} {"train_loss": -6.994123458862305, "global_step": 165374, "epoch": 3937} {"train_loss": -6.793117523193359, "global_step": 165375, "epoch": 3937} {"train_loss": -7.042010307312012, "global_step": 165376, "epoch": 3937} {"train_loss": -6.986933708190918, "global_step": 165377, "epoch": 3937} {"train_loss": -6.832839488983154, "global_step": 165378, "epoch": 3937} {"train_loss": -6.98221492767334, "global_step": 165379, "epoch": 3937} {"train_loss": -6.864443302154541, "global_step": 165380, "epoch": 3937} {"train_loss": -6.987445831298828, "global_step": 165381, "epoch": 3937} {"train_loss": -6.931375980377197, "global_step": 165382, "epoch": 3937} {"train_loss": -6.873268127441406, "global_step": 165383, "epoch": 3937} {"train_loss": -7.106086254119873, "global_step": 165384, "epoch": 3937} {"train_loss": -6.980373859405518, "global_step": 165385, "epoch": 3937} {"train_loss": -7.064002990722656, "global_step": 165386, "epoch": 3937} {"train_loss": -6.926265239715576, "global_step": 165387, "epoch": 3937} {"train_loss": -6.970474720001221, "global_step": 165388, "epoch": 3937} {"train_loss": -6.9463701248168945, "global_step": 165389, "epoch": 3937} {"train_loss": -6.9436540603637695, "global_step": 165390, "epoch": 3937} {"train_loss": -7.020650863647461, "global_step": 165391, "epoch": 3937} {"train_loss": -7.034836769104004, "global_step": 165392, "epoch": 3937} {"train_loss": -7.0057454109191895, "global_step": 165393, "epoch": 3937} {"train_loss": -7.0538249015808105, "global_step": 165394, "epoch": 3937} {"train_loss": -6.988766919998896, "global_step": 165395, "epoch": 3937, "val_loss": 68497.984375} {"train_loss": -7.054740905761719, "global_step": 165396, "epoch": 3938} {"train_loss": -6.928763389587402, "global_step": 165397, "epoch": 3938} {"train_loss": -6.898073673248291, "global_step": 165398, "epoch": 3938} {"train_loss": -6.9428205490112305, "global_step": 165399, "epoch": 3938} {"train_loss": -6.994107246398926, "global_step": 165400, "epoch": 3938} {"train_loss": -6.953751087188721, "global_step": 165401, "epoch": 3938} {"train_loss": -6.856013774871826, "global_step": 165402, "epoch": 3938} {"train_loss": -7.005553245544434, "global_step": 165403, "epoch": 3938} {"train_loss": -6.760764122009277, "global_step": 165404, "epoch": 3938} {"train_loss": -6.794764518737793, "global_step": 165405, "epoch": 3938} {"train_loss": -7.004947662353516, "global_step": 165406, "epoch": 3938} {"train_loss": -6.656605243682861, "global_step": 165407, "epoch": 3938} {"train_loss": -6.901856422424316, "global_step": 165408, "epoch": 3938} {"train_loss": -6.649326324462891, "global_step": 165409, "epoch": 3938} {"train_loss": -6.732664108276367, "global_step": 165410, "epoch": 3938} {"train_loss": -6.922286033630371, "global_step": 165411, "epoch": 3938} {"train_loss": -6.733009338378906, "global_step": 165412, "epoch": 3938} {"train_loss": -6.869250297546387, "global_step": 165413, "epoch": 3938} {"train_loss": -6.688197612762451, "global_step": 165414, "epoch": 3938} {"train_loss": -6.966475009918213, "global_step": 165415, "epoch": 3938} {"train_loss": -6.686997413635254, "global_step": 165416, "epoch": 3938} {"train_loss": -6.8885064125061035, "global_step": 165417, "epoch": 3938} {"train_loss": -6.8508429527282715, "global_step": 165418, "epoch": 3938} {"train_loss": -6.844640731811523, "global_step": 165419, "epoch": 3938} {"train_loss": -6.83745002746582, "global_step": 165420, "epoch": 3938} {"train_loss": -6.671169757843018, "global_step": 165421, "epoch": 3938} {"train_loss": -6.977272987365723, "global_step": 165422, "epoch": 3938} {"train_loss": -6.688236236572266, "global_step": 165423, "epoch": 3938} {"train_loss": -6.773451805114746, "global_step": 165424, "epoch": 3938} {"train_loss": -6.788647651672363, "global_step": 165425, "epoch": 3938} {"train_loss": -6.941103935241699, "global_step": 165426, "epoch": 3938} {"train_loss": -6.954209327697754, "global_step": 165427, "epoch": 3938} {"train_loss": -6.890032768249512, "global_step": 165428, "epoch": 3938} {"train_loss": -6.89125919342041, "global_step": 165429, "epoch": 3938} {"train_loss": -6.963174343109131, "global_step": 165430, "epoch": 3938} {"train_loss": -6.819238662719727, "global_step": 165431, "epoch": 3938} {"train_loss": -6.945117950439453, "global_step": 165432, "epoch": 3938} {"train_loss": -6.967518329620361, "global_step": 165433, "epoch": 3938} {"train_loss": -6.975790977478027, "global_step": 165434, "epoch": 3938} {"train_loss": -6.960676670074463, "global_step": 165435, "epoch": 3938} {"train_loss": -7.015941143035889, "global_step": 165436, "epoch": 3938} {"train_loss": -6.871944268544515, "global_step": 165437, "epoch": 3938, "val_loss": 68503.515625} {"train_loss": -6.968565464019775, "global_step": 165438, "epoch": 3939} {"train_loss": -7.0543599128723145, "global_step": 165439, "epoch": 3939} {"train_loss": -7.038179397583008, "global_step": 165440, "epoch": 3939} {"train_loss": -6.9094343185424805, "global_step": 165441, "epoch": 3939} {"train_loss": -7.037872314453125, "global_step": 165442, "epoch": 3939} {"train_loss": -6.923628807067871, "global_step": 165443, "epoch": 3939} {"train_loss": -7.010916709899902, "global_step": 165444, "epoch": 3939} {"train_loss": -6.965821266174316, "global_step": 165445, "epoch": 3939} {"train_loss": -7.009695053100586, "global_step": 165446, "epoch": 3939} {"train_loss": -7.001992702484131, "global_step": 165447, "epoch": 3939} {"train_loss": -6.986457824707031, "global_step": 165448, "epoch": 3939} {"train_loss": -7.010886192321777, "global_step": 165449, "epoch": 3939} {"train_loss": -7.0209431648254395, "global_step": 165450, "epoch": 3939} {"train_loss": -6.935736656188965, "global_step": 165451, "epoch": 3939} {"train_loss": -7.001247882843018, "global_step": 165452, "epoch": 3939} {"train_loss": -7.003479957580566, "global_step": 165453, "epoch": 3939} {"train_loss": -6.964322090148926, "global_step": 165454, "epoch": 3939} {"train_loss": -6.836110591888428, "global_step": 165455, "epoch": 3939} {"train_loss": -6.962159633636475, "global_step": 165456, "epoch": 3939} {"train_loss": -7.02308988571167, "global_step": 165457, "epoch": 3939} {"train_loss": -7.05328369140625, "global_step": 165458, "epoch": 3939} {"train_loss": -6.936542510986328, "global_step": 165459, "epoch": 3939} {"train_loss": -6.9641289710998535, "global_step": 165460, "epoch": 3939} {"train_loss": -6.961589813232422, "global_step": 165461, "epoch": 3939} {"train_loss": -6.9290242195129395, "global_step": 165462, "epoch": 3939} {"train_loss": -6.98029899597168, "global_step": 165463, "epoch": 3939} {"train_loss": -6.9985551834106445, "global_step": 165464, "epoch": 3939} {"train_loss": -6.92191219329834, "global_step": 165465, "epoch": 3939} {"train_loss": -6.927949905395508, "global_step": 165466, "epoch": 3939} {"train_loss": -7.064743995666504, "global_step": 165467, "epoch": 3939} {"train_loss": -6.9125471115112305, "global_step": 165468, "epoch": 3939} {"train_loss": -6.917435646057129, "global_step": 165469, "epoch": 3939} {"train_loss": -6.950617790222168, "global_step": 165470, "epoch": 3939} {"train_loss": -6.951076984405518, "global_step": 165471, "epoch": 3939} {"train_loss": -6.79135799407959, "global_step": 165472, "epoch": 3939} {"train_loss": -7.092169284820557, "global_step": 165473, "epoch": 3939} {"train_loss": -6.884756088256836, "global_step": 165474, "epoch": 3939} {"train_loss": -6.814775466918945, "global_step": 165475, "epoch": 3939} {"train_loss": -6.965720176696777, "global_step": 165476, "epoch": 3939} {"train_loss": -6.794590473175049, "global_step": 165477, "epoch": 3939} {"train_loss": -6.773407936096191, "global_step": 165478, "epoch": 3939} {"train_loss": -6.956843410219465, "global_step": 165479, "epoch": 3939, "val_loss": 68647.6875} {"train_loss": -6.82529354095459, "global_step": 165480, "epoch": 3940} {"train_loss": -6.781527042388916, "global_step": 165481, "epoch": 3940} {"train_loss": -6.821834087371826, "global_step": 165482, "epoch": 3940} {"train_loss": -6.740705490112305, "global_step": 165483, "epoch": 3940} {"train_loss": -6.808221340179443, "global_step": 165484, "epoch": 3940} {"train_loss": -6.848184585571289, "global_step": 165485, "epoch": 3940} {"train_loss": -6.883162021636963, "global_step": 165486, "epoch": 3940} {"train_loss": -6.772672653198242, "global_step": 165487, "epoch": 3940} {"train_loss": -6.8300886154174805, "global_step": 165488, "epoch": 3940} {"train_loss": -6.957440376281738, "global_step": 165489, "epoch": 3940} {"train_loss": -6.962033271789551, "global_step": 165490, "epoch": 3940} {"train_loss": -6.954857349395752, "global_step": 165491, "epoch": 3940} {"train_loss": -6.897052764892578, "global_step": 165492, "epoch": 3940} {"train_loss": -6.824827194213867, "global_step": 165493, "epoch": 3940} {"train_loss": -7.051409721374512, "global_step": 165494, "epoch": 3940} {"train_loss": -6.9795355796813965, "global_step": 165495, "epoch": 3940} {"train_loss": -7.088357448577881, "global_step": 165496, "epoch": 3940} {"train_loss": -6.923927307128906, "global_step": 165497, "epoch": 3940} {"train_loss": -6.83451509475708, "global_step": 165498, "epoch": 3940} {"train_loss": -6.945422172546387, "global_step": 165499, "epoch": 3940} {"train_loss": -6.935832977294922, "global_step": 165500, "epoch": 3940} {"train_loss": -6.9155449867248535, "global_step": 165501, "epoch": 3940} {"train_loss": -6.8872199058532715, "global_step": 165502, "epoch": 3940} {"train_loss": -6.765537261962891, "global_step": 165503, "epoch": 3940} {"train_loss": -6.919630527496338, "global_step": 165504, "epoch": 3940} {"train_loss": -6.940638542175293, "global_step": 165505, "epoch": 3940} {"train_loss": -6.784093856811523, "global_step": 165506, "epoch": 3940} {"train_loss": -6.761012077331543, "global_step": 165507, "epoch": 3940} {"train_loss": -6.797121047973633, "global_step": 165508, "epoch": 3940} {"train_loss": -6.79791784286499, "global_step": 165509, "epoch": 3940} {"train_loss": -6.798157215118408, "global_step": 165510, "epoch": 3940} {"train_loss": -6.9541497230529785, "global_step": 165511, "epoch": 3940} {"train_loss": -6.843405246734619, "global_step": 165512, "epoch": 3940} {"train_loss": -7.012777328491211, "global_step": 165513, "epoch": 3940} {"train_loss": -6.85827112197876, "global_step": 165514, "epoch": 3940} {"train_loss": -6.812570571899414, "global_step": 165515, "epoch": 3940} {"train_loss": -6.884035110473633, "global_step": 165516, "epoch": 3940} {"train_loss": -6.793715953826904, "global_step": 165517, "epoch": 3940} {"train_loss": -6.977105140686035, "global_step": 165518, "epoch": 3940} {"train_loss": -6.838691711425781, "global_step": 165519, "epoch": 3940} {"train_loss": -6.843903541564941, "global_step": 165520, "epoch": 3940} {"train_loss": -6.873610189982823, "global_step": 165521, "epoch": 3940, "val_loss": 68720.109375} {"train_loss": -6.775902271270752, "global_step": 165522, "epoch": 3941} {"train_loss": -6.798666954040527, "global_step": 165523, "epoch": 3941} {"train_loss": -6.7701640129089355, "global_step": 165524, "epoch": 3941} {"train_loss": -6.788095474243164, "global_step": 165525, "epoch": 3941} {"train_loss": -6.875143051147461, "global_step": 165526, "epoch": 3941} {"train_loss": -6.8372297286987305, "global_step": 165527, "epoch": 3941} {"train_loss": -6.9247727394104, "global_step": 165528, "epoch": 3941} {"train_loss": -6.961344242095947, "global_step": 165529, "epoch": 3941} {"train_loss": -6.99700927734375, "global_step": 165530, "epoch": 3941} {"train_loss": -6.838315963745117, "global_step": 165531, "epoch": 3941} {"train_loss": -6.949037551879883, "global_step": 165532, "epoch": 3941} {"train_loss": -6.902552127838135, "global_step": 165533, "epoch": 3941} {"train_loss": -6.918543815612793, "global_step": 165534, "epoch": 3941} {"train_loss": -6.930119514465332, "global_step": 165535, "epoch": 3941} {"train_loss": -6.918516159057617, "global_step": 165536, "epoch": 3941} {"train_loss": -6.970677375793457, "global_step": 165537, "epoch": 3941} {"train_loss": -6.979527473449707, "global_step": 165538, "epoch": 3941} {"train_loss": -6.94088888168335, "global_step": 165539, "epoch": 3941} {"train_loss": -6.890372276306152, "global_step": 165540, "epoch": 3941} {"train_loss": -7.048300743103027, "global_step": 165541, "epoch": 3941} {"train_loss": -7.022452354431152, "global_step": 165542, "epoch": 3941} {"train_loss": -7.005834102630615, "global_step": 165543, "epoch": 3941} {"train_loss": -6.821319580078125, "global_step": 165544, "epoch": 3941} {"train_loss": -6.873096942901611, "global_step": 165545, "epoch": 3941} {"train_loss": -6.847095489501953, "global_step": 165546, "epoch": 3941} {"train_loss": -6.951284408569336, "global_step": 165547, "epoch": 3941} {"train_loss": -7.038360118865967, "global_step": 165548, "epoch": 3941} {"train_loss": -6.967483997344971, "global_step": 165549, "epoch": 3941} {"train_loss": -7.0812201499938965, "global_step": 165550, "epoch": 3941} {"train_loss": -6.879049301147461, "global_step": 165551, "epoch": 3941} {"train_loss": -6.940279006958008, "global_step": 165552, "epoch": 3941} {"train_loss": -6.992234230041504, "global_step": 165553, "epoch": 3941} {"train_loss": -7.032957077026367, "global_step": 165554, "epoch": 3941} {"train_loss": -7.010776996612549, "global_step": 165555, "epoch": 3941} {"train_loss": -6.938510894775391, "global_step": 165556, "epoch": 3941} {"train_loss": -7.018917083740234, "global_step": 165557, "epoch": 3941} {"train_loss": -6.993635177612305, "global_step": 165558, "epoch": 3941} {"train_loss": -6.937270164489746, "global_step": 165559, "epoch": 3941} {"train_loss": -6.995593070983887, "global_step": 165560, "epoch": 3941} {"train_loss": -7.074186325073242, "global_step": 165561, "epoch": 3941} {"train_loss": -6.9640398025512695, "global_step": 165562, "epoch": 3941} {"train_loss": -6.938486280895415, "global_step": 165563, "epoch": 3941, "val_loss": 68553.28125} {"train_loss": -7.023822784423828, "global_step": 165564, "epoch": 3942} {"train_loss": -6.930876731872559, "global_step": 165565, "epoch": 3942} {"train_loss": -6.995846748352051, "global_step": 165566, "epoch": 3942} {"train_loss": -6.941763877868652, "global_step": 165567, "epoch": 3942} {"train_loss": -7.058773040771484, "global_step": 165568, "epoch": 3942} {"train_loss": -6.963547706604004, "global_step": 165569, "epoch": 3942} {"train_loss": -6.940678119659424, "global_step": 165570, "epoch": 3942} {"train_loss": -7.052631855010986, "global_step": 165571, "epoch": 3942} {"train_loss": -6.980759620666504, "global_step": 165572, "epoch": 3942} {"train_loss": -6.96214485168457, "global_step": 165573, "epoch": 3942} {"train_loss": -6.944528579711914, "global_step": 165574, "epoch": 3942} {"train_loss": -6.982474327087402, "global_step": 165575, "epoch": 3942} {"train_loss": -6.898098468780518, "global_step": 165576, "epoch": 3942} {"train_loss": -6.972525596618652, "global_step": 165577, "epoch": 3942} {"train_loss": -6.999009609222412, "global_step": 165578, "epoch": 3942} {"train_loss": -7.058772087097168, "global_step": 165579, "epoch": 3942} {"train_loss": -6.977660655975342, "global_step": 165580, "epoch": 3942} {"train_loss": -6.910376071929932, "global_step": 165581, "epoch": 3942} {"train_loss": -6.970200538635254, "global_step": 165582, "epoch": 3942} {"train_loss": -6.814226150512695, "global_step": 165583, "epoch": 3942} {"train_loss": -6.922910213470459, "global_step": 165584, "epoch": 3942} {"train_loss": -6.916665077209473, "global_step": 165585, "epoch": 3942} {"train_loss": -7.0065412521362305, "global_step": 165586, "epoch": 3942} {"train_loss": -6.86800479888916, "global_step": 165587, "epoch": 3942} {"train_loss": -6.87789249420166, "global_step": 165588, "epoch": 3942} {"train_loss": -6.879388332366943, "global_step": 165589, "epoch": 3942} {"train_loss": -6.895846366882324, "global_step": 165590, "epoch": 3942} {"train_loss": -6.949371337890625, "global_step": 165591, "epoch": 3942} {"train_loss": -6.96436882019043, "global_step": 165592, "epoch": 3942} {"train_loss": -6.9161481857299805, "global_step": 165593, "epoch": 3942} {"train_loss": -6.905816078186035, "global_step": 165594, "epoch": 3942} {"train_loss": -6.973691940307617, "global_step": 165595, "epoch": 3942} {"train_loss": -6.943363189697266, "global_step": 165596, "epoch": 3942} {"train_loss": -6.961169719696045, "global_step": 165597, "epoch": 3942} {"train_loss": -6.9915547370910645, "global_step": 165598, "epoch": 3942} {"train_loss": -6.934370517730713, "global_step": 165599, "epoch": 3942} {"train_loss": -6.910739898681641, "global_step": 165600, "epoch": 3942} {"train_loss": -6.995665550231934, "global_step": 165601, "epoch": 3942} {"train_loss": -6.897176265716553, "global_step": 165602, "epoch": 3942} {"train_loss": -6.943913459777832, "global_step": 165603, "epoch": 3942} {"train_loss": -6.9979166984558105, "global_step": 165604, "epoch": 3942} {"train_loss": -6.952769574664888, "global_step": 165605, "epoch": 3942, "val_loss": 68630.9140625} {"train_loss": -7.045770645141602, "global_step": 165606, "epoch": 3943} {"train_loss": -6.919493675231934, "global_step": 165607, "epoch": 3943} {"train_loss": -6.9467620849609375, "global_step": 165608, "epoch": 3943} {"train_loss": -7.044467926025391, "global_step": 165609, "epoch": 3943} {"train_loss": -6.972010612487793, "global_step": 165610, "epoch": 3943} {"train_loss": -7.027732849121094, "global_step": 165611, "epoch": 3943} {"train_loss": -7.002387523651123, "global_step": 165612, "epoch": 3943} {"train_loss": -7.027364730834961, "global_step": 165613, "epoch": 3943} {"train_loss": -7.08280611038208, "global_step": 165614, "epoch": 3943} {"train_loss": -6.903180122375488, "global_step": 165615, "epoch": 3943} {"train_loss": -6.983247756958008, "global_step": 165616, "epoch": 3943} {"train_loss": -6.974405765533447, "global_step": 165617, "epoch": 3943} {"train_loss": -6.9748005867004395, "global_step": 165618, "epoch": 3943} {"train_loss": -6.865408897399902, "global_step": 165619, "epoch": 3943} {"train_loss": -7.026350975036621, "global_step": 165620, "epoch": 3943} {"train_loss": -7.056196689605713, "global_step": 165621, "epoch": 3943} {"train_loss": -7.043128967285156, "global_step": 165622, "epoch": 3943} {"train_loss": -6.964837074279785, "global_step": 165623, "epoch": 3943} {"train_loss": -7.055616855621338, "global_step": 165624, "epoch": 3943} {"train_loss": -6.924127578735352, "global_step": 165625, "epoch": 3943} {"train_loss": -7.052247047424316, "global_step": 165626, "epoch": 3943} {"train_loss": -7.023985862731934, "global_step": 165627, "epoch": 3943} {"train_loss": -6.949553489685059, "global_step": 165628, "epoch": 3943} {"train_loss": -7.063609600067139, "global_step": 165629, "epoch": 3943} {"train_loss": -7.071284294128418, "global_step": 165630, "epoch": 3943} {"train_loss": -6.952110290527344, "global_step": 165631, "epoch": 3943} {"train_loss": -6.926469802856445, "global_step": 165632, "epoch": 3943} {"train_loss": -6.963314056396484, "global_step": 165633, "epoch": 3943} {"train_loss": -7.067649841308594, "global_step": 165634, "epoch": 3943} {"train_loss": -6.90872859954834, "global_step": 165635, "epoch": 3943} {"train_loss": -7.027876853942871, "global_step": 165636, "epoch": 3943} {"train_loss": -7.053950309753418, "global_step": 165637, "epoch": 3943} {"train_loss": -7.008353233337402, "global_step": 165638, "epoch": 3943} {"train_loss": -7.00747537612915, "global_step": 165639, "epoch": 3943} {"train_loss": -6.967644691467285, "global_step": 165640, "epoch": 3943} {"train_loss": -6.8403167724609375, "global_step": 165641, "epoch": 3943} {"train_loss": -7.1210246086120605, "global_step": 165642, "epoch": 3943} {"train_loss": -7.0394086837768555, "global_step": 165643, "epoch": 3943} {"train_loss": -7.014520645141602, "global_step": 165644, "epoch": 3943} {"train_loss": -6.970965385437012, "global_step": 165645, "epoch": 3943} {"train_loss": -6.963481903076172, "global_step": 165646, "epoch": 3943} {"train_loss": -6.996012369791667, "global_step": 165647, "epoch": 3943, "val_loss": 68535.828125} {"train_loss": -7.031692981719971, "global_step": 165648, "epoch": 3944} {"train_loss": -7.028008937835693, "global_step": 165649, "epoch": 3944} {"train_loss": -6.958016872406006, "global_step": 165650, "epoch": 3944} {"train_loss": -6.896942138671875, "global_step": 165651, "epoch": 3944} {"train_loss": -6.940041542053223, "global_step": 165652, "epoch": 3944} {"train_loss": -6.981108665466309, "global_step": 165653, "epoch": 3944} {"train_loss": -7.066053867340088, "global_step": 165654, "epoch": 3944} {"train_loss": -6.943519592285156, "global_step": 165655, "epoch": 3944} {"train_loss": -7.083883285522461, "global_step": 165656, "epoch": 3944} {"train_loss": -7.0137939453125, "global_step": 165657, "epoch": 3944} {"train_loss": -6.9837751388549805, "global_step": 165658, "epoch": 3944} {"train_loss": -6.98783540725708, "global_step": 165659, "epoch": 3944} {"train_loss": -7.01708984375, "global_step": 165660, "epoch": 3944} {"train_loss": -7.073737144470215, "global_step": 165661, "epoch": 3944} {"train_loss": -7.139294624328613, "global_step": 165662, "epoch": 3944} {"train_loss": -6.79545259475708, "global_step": 165663, "epoch": 3944} {"train_loss": -6.865534782409668, "global_step": 165664, "epoch": 3944} {"train_loss": -6.933141708374023, "global_step": 165665, "epoch": 3944} {"train_loss": -6.86424446105957, "global_step": 165666, "epoch": 3944} {"train_loss": -6.788159370422363, "global_step": 165667, "epoch": 3944} {"train_loss": -7.025211334228516, "global_step": 165668, "epoch": 3944} {"train_loss": -6.867832183837891, "global_step": 165669, "epoch": 3944} {"train_loss": -6.969451904296875, "global_step": 165670, "epoch": 3944} {"train_loss": -6.870532035827637, "global_step": 165671, "epoch": 3944} {"train_loss": -7.054171562194824, "global_step": 165672, "epoch": 3944} {"train_loss": -6.84908390045166, "global_step": 165673, "epoch": 3944} {"train_loss": -6.970154762268066, "global_step": 165674, "epoch": 3944} {"train_loss": -7.001901149749756, "global_step": 165675, "epoch": 3944} {"train_loss": -6.934545516967773, "global_step": 165676, "epoch": 3944} {"train_loss": -6.8925957679748535, "global_step": 165677, "epoch": 3944} {"train_loss": -6.977423667907715, "global_step": 165678, "epoch": 3944} {"train_loss": -6.972110271453857, "global_step": 165679, "epoch": 3944} {"train_loss": -6.822917938232422, "global_step": 165680, "epoch": 3944} {"train_loss": -6.9008636474609375, "global_step": 165681, "epoch": 3944} {"train_loss": -6.937310218811035, "global_step": 165682, "epoch": 3944} {"train_loss": -6.694140434265137, "global_step": 165683, "epoch": 3944} {"train_loss": -6.997014999389648, "global_step": 165684, "epoch": 3944} {"train_loss": -6.9382710456848145, "global_step": 165685, "epoch": 3944} {"train_loss": -6.848206043243408, "global_step": 165686, "epoch": 3944} {"train_loss": -6.998595237731934, "global_step": 165687, "epoch": 3944} {"train_loss": -6.892761707305908, "global_step": 165688, "epoch": 3944} {"train_loss": -6.944190104802449, "global_step": 165689, "epoch": 3944, "val_loss": 68553.359375} {"train_loss": -6.887755393981934, "global_step": 165690, "epoch": 3945} {"train_loss": -6.854762554168701, "global_step": 165691, "epoch": 3945} {"train_loss": -6.756330966949463, "global_step": 165692, "epoch": 3945} {"train_loss": -6.904331207275391, "global_step": 165693, "epoch": 3945} {"train_loss": -6.767426490783691, "global_step": 165694, "epoch": 3945} {"train_loss": -6.914438247680664, "global_step": 165695, "epoch": 3945} {"train_loss": -6.79931640625, "global_step": 165696, "epoch": 3945} {"train_loss": -6.871457099914551, "global_step": 165697, "epoch": 3945} {"train_loss": -6.9088311195373535, "global_step": 165698, "epoch": 3945} {"train_loss": -6.955620765686035, "global_step": 165699, "epoch": 3945} {"train_loss": -6.980189323425293, "global_step": 165700, "epoch": 3945} {"train_loss": -6.996270179748535, "global_step": 165701, "epoch": 3945} {"train_loss": -7.003520965576172, "global_step": 165702, "epoch": 3945} {"train_loss": -6.884767532348633, "global_step": 165703, "epoch": 3945} {"train_loss": -6.825440406799316, "global_step": 165704, "epoch": 3945} {"train_loss": -6.804277420043945, "global_step": 165705, "epoch": 3945} {"train_loss": -6.987190246582031, "global_step": 165706, "epoch": 3945} {"train_loss": -6.984784126281738, "global_step": 165707, "epoch": 3945} {"train_loss": -6.94881534576416, "global_step": 165708, "epoch": 3945} {"train_loss": -6.980260372161865, "global_step": 165709, "epoch": 3945} {"train_loss": -6.842327117919922, "global_step": 165710, "epoch": 3945} {"train_loss": -7.056635856628418, "global_step": 165711, "epoch": 3945} {"train_loss": -6.844117164611816, "global_step": 165712, "epoch": 3945} {"train_loss": -6.890292167663574, "global_step": 165713, "epoch": 3945} {"train_loss": -6.828246116638184, "global_step": 165714, "epoch": 3945} {"train_loss": -6.964434623718262, "global_step": 165715, "epoch": 3945} {"train_loss": -6.90611457824707, "global_step": 165716, "epoch": 3945} {"train_loss": -6.838934421539307, "global_step": 165717, "epoch": 3945} {"train_loss": -6.9250407218933105, "global_step": 165718, "epoch": 3945} {"train_loss": -6.938503265380859, "global_step": 165719, "epoch": 3945} {"train_loss": -7.024196624755859, "global_step": 165720, "epoch": 3945} {"train_loss": -6.906374931335449, "global_step": 165721, "epoch": 3945} {"train_loss": -6.963410377502441, "global_step": 165722, "epoch": 3945} {"train_loss": -7.014300346374512, "global_step": 165723, "epoch": 3945} {"train_loss": -7.016652584075928, "global_step": 165724, "epoch": 3945} {"train_loss": -6.929753303527832, "global_step": 165725, "epoch": 3945} {"train_loss": -6.9543561935424805, "global_step": 165726, "epoch": 3945} {"train_loss": -7.012186050415039, "global_step": 165727, "epoch": 3945} {"train_loss": -6.925947189331055, "global_step": 165728, "epoch": 3945} {"train_loss": -7.0510029792785645, "global_step": 165729, "epoch": 3945} {"train_loss": -6.939019203186035, "global_step": 165730, "epoch": 3945} {"train_loss": -6.923440286091396, "global_step": 165731, "epoch": 3945, "val_loss": 68572.6484375} {"train_loss": -6.9735870361328125, "global_step": 165732, "epoch": 3946} {"train_loss": -7.017172813415527, "global_step": 165733, "epoch": 3946} {"train_loss": -6.957419395446777, "global_step": 165734, "epoch": 3946} {"train_loss": -7.013195514678955, "global_step": 165735, "epoch": 3946} {"train_loss": -7.092254638671875, "global_step": 165736, "epoch": 3946} {"train_loss": -7.11159610748291, "global_step": 165737, "epoch": 3946} {"train_loss": -6.999199390411377, "global_step": 165738, "epoch": 3946} {"train_loss": -6.942256450653076, "global_step": 165739, "epoch": 3946} {"train_loss": -7.0293097496032715, "global_step": 165740, "epoch": 3946} {"train_loss": -7.007363319396973, "global_step": 165741, "epoch": 3946} {"train_loss": -7.018314361572266, "global_step": 165742, "epoch": 3946} {"train_loss": -6.999179840087891, "global_step": 165743, "epoch": 3946} {"train_loss": -7.041134357452393, "global_step": 165744, "epoch": 3946} {"train_loss": -6.932674407958984, "global_step": 165745, "epoch": 3946} {"train_loss": -6.931581974029541, "global_step": 165746, "epoch": 3946} {"train_loss": -6.913403511047363, "global_step": 165747, "epoch": 3946} {"train_loss": -7.074016571044922, "global_step": 165748, "epoch": 3946} {"train_loss": -7.0228424072265625, "global_step": 165749, "epoch": 3946} {"train_loss": -7.028993606567383, "global_step": 165750, "epoch": 3946} {"train_loss": -7.0520477294921875, "global_step": 165751, "epoch": 3946} {"train_loss": -7.01597785949707, "global_step": 165752, "epoch": 3946} {"train_loss": -7.003606796264648, "global_step": 165753, "epoch": 3946} {"train_loss": -6.926427364349365, "global_step": 165754, "epoch": 3946} {"train_loss": -6.928372383117676, "global_step": 165755, "epoch": 3946} {"train_loss": -7.030621528625488, "global_step": 165756, "epoch": 3946} {"train_loss": -6.827800750732422, "global_step": 165757, "epoch": 3946} {"train_loss": -7.0443267822265625, "global_step": 165758, "epoch": 3946} {"train_loss": -7.01522970199585, "global_step": 165759, "epoch": 3946} {"train_loss": -7.063516616821289, "global_step": 165760, "epoch": 3946} {"train_loss": -7.067529678344727, "global_step": 165761, "epoch": 3946} {"train_loss": -6.964458465576172, "global_step": 165762, "epoch": 3946} {"train_loss": -6.907245635986328, "global_step": 165763, "epoch": 3946} {"train_loss": -7.0264668464660645, "global_step": 165764, "epoch": 3946} {"train_loss": -6.97935676574707, "global_step": 165765, "epoch": 3946} {"train_loss": -7.002803802490234, "global_step": 165766, "epoch": 3946} {"train_loss": -6.835609436035156, "global_step": 165767, "epoch": 3946} {"train_loss": -7.00508975982666, "global_step": 165768, "epoch": 3946} {"train_loss": -6.860072612762451, "global_step": 165769, "epoch": 3946} {"train_loss": -7.075007438659668, "global_step": 165770, "epoch": 3946} {"train_loss": -7.069134712219238, "global_step": 165771, "epoch": 3946} {"train_loss": -7.030848503112793, "global_step": 165772, "epoch": 3946} {"train_loss": -6.992127804529099, "global_step": 165773, "epoch": 3946, "val_loss": 68538.6875} {"train_loss": -7.0423688888549805, "global_step": 165774, "epoch": 3947} {"train_loss": -6.863980293273926, "global_step": 165775, "epoch": 3947} {"train_loss": -6.993904113769531, "global_step": 165776, "epoch": 3947} {"train_loss": -6.919758319854736, "global_step": 165777, "epoch": 3947} {"train_loss": -6.964304447174072, "global_step": 165778, "epoch": 3947} {"train_loss": -7.1227264404296875, "global_step": 165779, "epoch": 3947} {"train_loss": -6.997195243835449, "global_step": 165780, "epoch": 3947} {"train_loss": -6.995573043823242, "global_step": 165781, "epoch": 3947} {"train_loss": -6.932121753692627, "global_step": 165782, "epoch": 3947} {"train_loss": -6.989726543426514, "global_step": 165783, "epoch": 3947} {"train_loss": -6.923992156982422, "global_step": 165784, "epoch": 3947} {"train_loss": -7.020465850830078, "global_step": 165785, "epoch": 3947} {"train_loss": -6.993809700012207, "global_step": 165786, "epoch": 3947} {"train_loss": -7.041568756103516, "global_step": 165787, "epoch": 3947} {"train_loss": -6.993626594543457, "global_step": 165788, "epoch": 3947} {"train_loss": -6.963653564453125, "global_step": 165789, "epoch": 3947} {"train_loss": -7.049735069274902, "global_step": 165790, "epoch": 3947} {"train_loss": -6.978867530822754, "global_step": 165791, "epoch": 3947} {"train_loss": -6.988635063171387, "global_step": 165792, "epoch": 3947} {"train_loss": -6.969566345214844, "global_step": 165793, "epoch": 3947} {"train_loss": -6.973491668701172, "global_step": 165794, "epoch": 3947} {"train_loss": -6.892341613769531, "global_step": 165795, "epoch": 3947} {"train_loss": -6.9006500244140625, "global_step": 165796, "epoch": 3947} {"train_loss": -6.87408447265625, "global_step": 165797, "epoch": 3947} {"train_loss": -7.047117233276367, "global_step": 165798, "epoch": 3947} {"train_loss": -6.767401695251465, "global_step": 165799, "epoch": 3947} {"train_loss": -6.859945774078369, "global_step": 165800, "epoch": 3947} {"train_loss": -6.948938369750977, "global_step": 165801, "epoch": 3947} {"train_loss": -6.886918544769287, "global_step": 165802, "epoch": 3947} {"train_loss": -7.027301788330078, "global_step": 165803, "epoch": 3947} {"train_loss": -6.865942001342773, "global_step": 165804, "epoch": 3947} {"train_loss": -6.971797943115234, "global_step": 165805, "epoch": 3947} {"train_loss": -6.862849712371826, "global_step": 165806, "epoch": 3947} {"train_loss": -6.915600776672363, "global_step": 165807, "epoch": 3947} {"train_loss": -6.961097717285156, "global_step": 165808, "epoch": 3947} {"train_loss": -6.801858425140381, "global_step": 165809, "epoch": 3947} {"train_loss": -6.959897041320801, "global_step": 165810, "epoch": 3947} {"train_loss": -6.997547149658203, "global_step": 165811, "epoch": 3947} {"train_loss": -6.910026550292969, "global_step": 165812, "epoch": 3947} {"train_loss": -6.8459272384643555, "global_step": 165813, "epoch": 3947} {"train_loss": -6.878757476806641, "global_step": 165814, "epoch": 3947} {"train_loss": -6.948885304587228, "global_step": 165815, "epoch": 3947, "val_loss": 68770.34375} {"train_loss": -6.864612579345703, "global_step": 165816, "epoch": 3948} {"train_loss": -6.790637969970703, "global_step": 165817, "epoch": 3948} {"train_loss": -6.730945110321045, "global_step": 165818, "epoch": 3948} {"train_loss": -6.905557155609131, "global_step": 165819, "epoch": 3948} {"train_loss": -6.653548240661621, "global_step": 165820, "epoch": 3948} {"train_loss": -6.901390075683594, "global_step": 165821, "epoch": 3948} {"train_loss": -6.908029556274414, "global_step": 165822, "epoch": 3948} {"train_loss": -6.703915119171143, "global_step": 165823, "epoch": 3948} {"train_loss": -6.790602207183838, "global_step": 165824, "epoch": 3948} {"train_loss": -6.738863945007324, "global_step": 165825, "epoch": 3948} {"train_loss": -6.818202018737793, "global_step": 165826, "epoch": 3948} {"train_loss": -6.846342086791992, "global_step": 165827, "epoch": 3948} {"train_loss": -6.837705135345459, "global_step": 165828, "epoch": 3948} {"train_loss": -6.545499801635742, "global_step": 165829, "epoch": 3948} {"train_loss": -6.744292736053467, "global_step": 165830, "epoch": 3948} {"train_loss": -6.628062725067139, "global_step": 165831, "epoch": 3948} {"train_loss": -6.878098487854004, "global_step": 165832, "epoch": 3948} {"train_loss": -6.660834312438965, "global_step": 165833, "epoch": 3948} {"train_loss": -6.806637287139893, "global_step": 165834, "epoch": 3948} {"train_loss": -6.750607490539551, "global_step": 165835, "epoch": 3948} {"train_loss": -6.759407043457031, "global_step": 165836, "epoch": 3948} {"train_loss": -6.717510223388672, "global_step": 165837, "epoch": 3948} {"train_loss": -6.726330280303955, "global_step": 165838, "epoch": 3948} {"train_loss": -6.954585552215576, "global_step": 165839, "epoch": 3948} {"train_loss": -6.710737228393555, "global_step": 165840, "epoch": 3948} {"train_loss": -6.923365592956543, "global_step": 165841, "epoch": 3948} {"train_loss": -6.900330543518066, "global_step": 165842, "epoch": 3948} {"train_loss": -6.839484214782715, "global_step": 165843, "epoch": 3948} {"train_loss": -6.946660041809082, "global_step": 165844, "epoch": 3948} {"train_loss": -6.866059303283691, "global_step": 165845, "epoch": 3948} {"train_loss": -6.785243034362793, "global_step": 165846, "epoch": 3948} {"train_loss": -6.920017242431641, "global_step": 165847, "epoch": 3948} {"train_loss": -6.828149318695068, "global_step": 165848, "epoch": 3948} {"train_loss": -6.832427024841309, "global_step": 165849, "epoch": 3948} {"train_loss": -6.910859107971191, "global_step": 165850, "epoch": 3948} {"train_loss": -6.866448879241943, "global_step": 165851, "epoch": 3948} {"train_loss": -6.915169715881348, "global_step": 165852, "epoch": 3948} {"train_loss": -6.92897891998291, "global_step": 165853, "epoch": 3948} {"train_loss": -6.900801658630371, "global_step": 165854, "epoch": 3948} {"train_loss": -6.817061424255371, "global_step": 165855, "epoch": 3948} {"train_loss": -6.930293083190918, "global_step": 165856, "epoch": 3948} {"train_loss": -6.819055772963024, "global_step": 165857, "epoch": 3948, "val_loss": 68751.9375} {"train_loss": -7.051511287689209, "global_step": 165858, "epoch": 3949} {"train_loss": -6.914073467254639, "global_step": 165859, "epoch": 3949} {"train_loss": -6.890434265136719, "global_step": 165860, "epoch": 3949} {"train_loss": -7.031092643737793, "global_step": 165861, "epoch": 3949} {"train_loss": -6.952634334564209, "global_step": 165862, "epoch": 3949} {"train_loss": -7.0059123039245605, "global_step": 165863, "epoch": 3949} {"train_loss": -6.965828895568848, "global_step": 165864, "epoch": 3949} {"train_loss": -6.882375717163086, "global_step": 165865, "epoch": 3949} {"train_loss": -7.004152297973633, "global_step": 165866, "epoch": 3949} {"train_loss": -7.009703159332275, "global_step": 165867, "epoch": 3949} {"train_loss": -6.977815628051758, "global_step": 165868, "epoch": 3949} {"train_loss": -7.02614164352417, "global_step": 165869, "epoch": 3949} {"train_loss": -6.959391117095947, "global_step": 165870, "epoch": 3949} {"train_loss": -6.793394088745117, "global_step": 165871, "epoch": 3949} {"train_loss": -6.891206741333008, "global_step": 165872, "epoch": 3949} {"train_loss": -6.960364818572998, "global_step": 165873, "epoch": 3949} {"train_loss": -6.847019195556641, "global_step": 165874, "epoch": 3949} {"train_loss": -6.9314703941345215, "global_step": 165875, "epoch": 3949} {"train_loss": -6.926718235015869, "global_step": 165876, "epoch": 3949} {"train_loss": -6.6939287185668945, "global_step": 165877, "epoch": 3949} {"train_loss": -6.813238143920898, "global_step": 165878, "epoch": 3949} {"train_loss": -6.812325477600098, "global_step": 165879, "epoch": 3949} {"train_loss": -6.880446434020996, "global_step": 165880, "epoch": 3949} {"train_loss": -6.800308704376221, "global_step": 165881, "epoch": 3949} {"train_loss": -6.671788215637207, "global_step": 165882, "epoch": 3949} {"train_loss": -6.805870056152344, "global_step": 165883, "epoch": 3949} {"train_loss": -6.8543596267700195, "global_step": 165884, "epoch": 3949} {"train_loss": -6.845589637756348, "global_step": 165885, "epoch": 3949} {"train_loss": -6.884653091430664, "global_step": 165886, "epoch": 3949} {"train_loss": -6.764476299285889, "global_step": 165887, "epoch": 3949} {"train_loss": -6.883059978485107, "global_step": 165888, "epoch": 3949} {"train_loss": -6.811922073364258, "global_step": 165889, "epoch": 3949} {"train_loss": -6.9302520751953125, "global_step": 165890, "epoch": 3949} {"train_loss": -6.784318923950195, "global_step": 165891, "epoch": 3949} {"train_loss": -6.880124568939209, "global_step": 165892, "epoch": 3949} {"train_loss": -6.929242134094238, "global_step": 165893, "epoch": 3949} {"train_loss": -6.982112407684326, "global_step": 165894, "epoch": 3949} {"train_loss": -6.884411811828613, "global_step": 165895, "epoch": 3949} {"train_loss": -6.8746819496154785, "global_step": 165896, "epoch": 3949} {"train_loss": -6.9595746994018555, "global_step": 165897, "epoch": 3949} {"train_loss": -6.737405776977539, "global_step": 165898, "epoch": 3949} {"train_loss": -6.88909710021246, "global_step": 165899, "epoch": 3949, "val_loss": 68600.796875} {"train_loss": -6.825998306274414, "global_step": 165900, "epoch": 3950} {"train_loss": -7.032710075378418, "global_step": 165901, "epoch": 3950} {"train_loss": -6.946076393127441, "global_step": 165902, "epoch": 3950} {"train_loss": -7.092153549194336, "global_step": 165903, "epoch": 3950} {"train_loss": -7.014348983764648, "global_step": 165904, "epoch": 3950} {"train_loss": -6.992824554443359, "global_step": 165905, "epoch": 3950} {"train_loss": -6.967085838317871, "global_step": 165906, "epoch": 3950} {"train_loss": -6.946342945098877, "global_step": 165907, "epoch": 3950} {"train_loss": -6.9840989112854, "global_step": 165908, "epoch": 3950} {"train_loss": -6.933133125305176, "global_step": 165909, "epoch": 3950} {"train_loss": -7.101056098937988, "global_step": 165910, "epoch": 3950} {"train_loss": -6.883952617645264, "global_step": 165911, "epoch": 3950} {"train_loss": -7.013505935668945, "global_step": 165912, "epoch": 3950} {"train_loss": -7.052319526672363, "global_step": 165913, "epoch": 3950} {"train_loss": -6.981296539306641, "global_step": 165914, "epoch": 3950} {"train_loss": -6.914309978485107, "global_step": 165915, "epoch": 3950} {"train_loss": -7.10800838470459, "global_step": 165916, "epoch": 3950} {"train_loss": -6.9185991287231445, "global_step": 165917, "epoch": 3950} {"train_loss": -6.917291641235352, "global_step": 165918, "epoch": 3950} {"train_loss": -6.9077372550964355, "global_step": 165919, "epoch": 3950} {"train_loss": -7.020421504974365, "global_step": 165920, "epoch": 3950} {"train_loss": -7.175314426422119, "global_step": 165921, "epoch": 3950} {"train_loss": -7.048097610473633, "global_step": 165922, "epoch": 3950} {"train_loss": -7.015613079071045, "global_step": 165923, "epoch": 3950} {"train_loss": -7.134939670562744, "global_step": 165924, "epoch": 3950} {"train_loss": -6.896117687225342, "global_step": 165925, "epoch": 3950} {"train_loss": -7.077082633972168, "global_step": 165926, "epoch": 3950} {"train_loss": -7.011931419372559, "global_step": 165927, "epoch": 3950} {"train_loss": -7.0620012283325195, "global_step": 165928, "epoch": 3950} {"train_loss": -7.0830078125, "global_step": 165929, "epoch": 3950} {"train_loss": -6.989846229553223, "global_step": 165930, "epoch": 3950} {"train_loss": -6.929311275482178, "global_step": 165931, "epoch": 3950} {"train_loss": -7.009823322296143, "global_step": 165932, "epoch": 3950} {"train_loss": -6.97209358215332, "global_step": 165933, "epoch": 3950} {"train_loss": -6.888122081756592, "global_step": 165934, "epoch": 3950} {"train_loss": -6.970308303833008, "global_step": 165935, "epoch": 3950} {"train_loss": -6.931486129760742, "global_step": 165936, "epoch": 3950} {"train_loss": -6.943561553955078, "global_step": 165937, "epoch": 3950} {"train_loss": -6.992973327636719, "global_step": 165938, "epoch": 3950} {"train_loss": -6.926473140716553, "global_step": 165939, "epoch": 3950} {"train_loss": -6.759639739990234, "global_step": 165940, "epoch": 3950} {"train_loss": -6.984678563617525, "global_step": 165941, "epoch": 3950, "train/sim_max_reward_0": 0.21978675095987055, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.5840045496265155, "train/sim_max_reward_3": 0.1206359393814214, "train/sim_max_reward_4": 0.4270305592586691, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.4054104325737677, "test/sim_max_reward_4400001": 0.2518293711979045, "test/sim_max_reward_4400002": 0.8634038695102668, "test/sim_max_reward_4400003": 0.8072110899576083, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.6279750875608034, "test/sim_max_reward_4400006": 0.9747215697049681, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30066997773209814, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.20784743948127601, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9726690988403546, "test/sim_max_reward_4400013": 0.9648273068478892, "test/sim_max_reward_4400014": 0.9823032720396396, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2793717968736196, "test/sim_max_reward_4400019": 0.031538163055415847, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.5355672293970872, "test/sim_max_reward_4400023": 0.9262631608663425, "test/sim_max_reward_4400024": 0.9822405072006147, "test/sim_max_reward_4400025": 0.26705597358207517, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0022247063633639365, "test/sim_max_reward_4400028": 0.5177210678210176, "test/sim_max_reward_4400029": 0.5088295253146696, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9990711193625106, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9178475483965899, "test/sim_max_reward_4400034": 0.8846166231750989, "test/sim_max_reward_4400035": 0.9851522615353168, "test/sim_max_reward_4400036": 0.4147857297798836, "test/sim_max_reward_4400037": 0.8624227595834475, "test/sim_max_reward_4400038": 0.9929795828922156, "test/sim_max_reward_4400039": 0.965138929324673, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.996986795121937, "test/sim_max_reward_4400042": 0.5057746944113929, "test/sim_max_reward_4400043": 0.9293826977408084, "test/sim_max_reward_4400044": 0.7214052230205605, "test/sim_max_reward_4400045": 0.960843308910705, "test/sim_max_reward_4400046": 0.9424358062603223, "test/sim_max_reward_4400047": 0.9919085882894126, "test/sim_max_reward_4400048": 0.9256348779540885, "test/sim_max_reward_4400049": 0.7957837830307812, "train/mean_score": 0.4240737597647773, "test/mean_score": 0.5949609191048285, "val_loss": 68716.015625} {"train_loss": -7.003430366516113, "global_step": 165942, "epoch": 3951} {"train_loss": -6.862277984619141, "global_step": 165943, "epoch": 3951} {"train_loss": -6.939016819000244, "global_step": 165944, "epoch": 3951} {"train_loss": -6.875134468078613, "global_step": 165945, "epoch": 3951} {"train_loss": -7.012606620788574, "global_step": 165946, "epoch": 3951} {"train_loss": -6.978114604949951, "global_step": 165947, "epoch": 3951} {"train_loss": -6.986593723297119, "global_step": 165948, "epoch": 3951} {"train_loss": -7.014772415161133, "global_step": 165949, "epoch": 3951} {"train_loss": -6.8969268798828125, "global_step": 165950, "epoch": 3951} {"train_loss": -6.920764446258545, "global_step": 165951, "epoch": 3951} {"train_loss": -7.009401798248291, "global_step": 165952, "epoch": 3951} {"train_loss": -7.0066423416137695, "global_step": 165953, "epoch": 3951} {"train_loss": -6.924371719360352, "global_step": 165954, "epoch": 3951} {"train_loss": -6.970727443695068, "global_step": 165955, "epoch": 3951} {"train_loss": -6.988223075866699, "global_step": 165956, "epoch": 3951} {"train_loss": -6.988620281219482, "global_step": 165957, "epoch": 3951} {"train_loss": -7.027714729309082, "global_step": 165958, "epoch": 3951} {"train_loss": -7.042553901672363, "global_step": 165959, "epoch": 3951} {"train_loss": -6.96122932434082, "global_step": 165960, "epoch": 3951} {"train_loss": -6.8609209060668945, "global_step": 165961, "epoch": 3951} {"train_loss": -6.885128021240234, "global_step": 165962, "epoch": 3951} {"train_loss": -6.953978538513184, "global_step": 165963, "epoch": 3951} {"train_loss": -7.027385711669922, "global_step": 165964, "epoch": 3951} {"train_loss": -7.018568515777588, "global_step": 165965, "epoch": 3951} {"train_loss": -7.094979286193848, "global_step": 165966, "epoch": 3951} {"train_loss": -6.964491844177246, "global_step": 165967, "epoch": 3951} {"train_loss": -6.8677473068237305, "global_step": 165968, "epoch": 3951} {"train_loss": -6.917684555053711, "global_step": 165969, "epoch": 3951} {"train_loss": -6.897781848907471, "global_step": 165970, "epoch": 3951} {"train_loss": -7.011564254760742, "global_step": 165971, "epoch": 3951} {"train_loss": -6.980142116546631, "global_step": 165972, "epoch": 3951} {"train_loss": -6.930257320404053, "global_step": 165973, "epoch": 3951} {"train_loss": -6.903156757354736, "global_step": 165974, "epoch": 3951} {"train_loss": -6.985121726989746, "global_step": 165975, "epoch": 3951} {"train_loss": -6.871098041534424, "global_step": 165976, "epoch": 3951} {"train_loss": -6.926468372344971, "global_step": 165977, "epoch": 3951} {"train_loss": -7.003195762634277, "global_step": 165978, "epoch": 3951} {"train_loss": -6.9601030349731445, "global_step": 165979, "epoch": 3951} {"train_loss": -7.030316352844238, "global_step": 165980, "epoch": 3951} {"train_loss": -6.9481611251831055, "global_step": 165981, "epoch": 3951} {"train_loss": -6.953373432159424, "global_step": 165982, "epoch": 3951} {"train_loss": -6.960731324695406, "global_step": 165983, "epoch": 3951, "val_loss": 68529.125} {"train_loss": -6.956470489501953, "global_step": 165984, "epoch": 3952} {"train_loss": -6.983935832977295, "global_step": 165985, "epoch": 3952} {"train_loss": -7.017849922180176, "global_step": 165986, "epoch": 3952} {"train_loss": -6.9194135665893555, "global_step": 165987, "epoch": 3952} {"train_loss": -6.955497741699219, "global_step": 165988, "epoch": 3952} {"train_loss": -6.9594316482543945, "global_step": 165989, "epoch": 3952} {"train_loss": -6.916759490966797, "global_step": 165990, "epoch": 3952} {"train_loss": -6.957056999206543, "global_step": 165991, "epoch": 3952} {"train_loss": -7.003049373626709, "global_step": 165992, "epoch": 3952} {"train_loss": -6.964690208435059, "global_step": 165993, "epoch": 3952} {"train_loss": -6.963522911071777, "global_step": 165994, "epoch": 3952} {"train_loss": -6.966301918029785, "global_step": 165995, "epoch": 3952} {"train_loss": -6.99433708190918, "global_step": 165996, "epoch": 3952} {"train_loss": -6.901155471801758, "global_step": 165997, "epoch": 3952} {"train_loss": -6.922280788421631, "global_step": 165998, "epoch": 3952} {"train_loss": -6.8037309646606445, "global_step": 165999, "epoch": 3952} {"train_loss": -6.984789848327637, "global_step": 166000, "epoch": 3952} {"train_loss": -6.894679069519043, "global_step": 166001, "epoch": 3952} {"train_loss": -6.864469528198242, "global_step": 166002, "epoch": 3952} {"train_loss": -6.983591079711914, "global_step": 166003, "epoch": 3952} {"train_loss": -6.916769027709961, "global_step": 166004, "epoch": 3952} {"train_loss": -6.993626117706299, "global_step": 166005, "epoch": 3952} {"train_loss": -7.060851097106934, "global_step": 166006, "epoch": 3952} {"train_loss": -6.876276016235352, "global_step": 166007, "epoch": 3952} {"train_loss": -6.9174652099609375, "global_step": 166008, "epoch": 3952} {"train_loss": -7.001492977142334, "global_step": 166009, "epoch": 3952} {"train_loss": -6.9302978515625, "global_step": 166010, "epoch": 3952} {"train_loss": -7.0920257568359375, "global_step": 166011, "epoch": 3952} {"train_loss": -6.932707786560059, "global_step": 166012, "epoch": 3952} {"train_loss": -6.997393608093262, "global_step": 166013, "epoch": 3952} {"train_loss": -6.8644514083862305, "global_step": 166014, "epoch": 3952} {"train_loss": -6.881908893585205, "global_step": 166015, "epoch": 3952} {"train_loss": -6.900537490844727, "global_step": 166016, "epoch": 3952} {"train_loss": -6.937046527862549, "global_step": 166017, "epoch": 3952} {"train_loss": -6.903424263000488, "global_step": 166018, "epoch": 3952} {"train_loss": -6.871718406677246, "global_step": 166019, "epoch": 3952} {"train_loss": -6.844130516052246, "global_step": 166020, "epoch": 3952} {"train_loss": -6.927570819854736, "global_step": 166021, "epoch": 3952} {"train_loss": -6.869197845458984, "global_step": 166022, "epoch": 3952} {"train_loss": -6.995359420776367, "global_step": 166023, "epoch": 3952} {"train_loss": -6.867397308349609, "global_step": 166024, "epoch": 3952} {"train_loss": -6.936753579548427, "global_step": 166025, "epoch": 3952, "val_loss": 68721.6640625} {"train_loss": -7.042764663696289, "global_step": 166026, "epoch": 3953} {"train_loss": -6.963954925537109, "global_step": 166027, "epoch": 3953} {"train_loss": -7.005282878875732, "global_step": 166028, "epoch": 3953} {"train_loss": -7.008848190307617, "global_step": 166029, "epoch": 3953} {"train_loss": -6.960280418395996, "global_step": 166030, "epoch": 3953} {"train_loss": -6.9852399826049805, "global_step": 166031, "epoch": 3953} {"train_loss": -7.0133771896362305, "global_step": 166032, "epoch": 3953} {"train_loss": -6.8465166091918945, "global_step": 166033, "epoch": 3953} {"train_loss": -6.9676618576049805, "global_step": 166034, "epoch": 3953} {"train_loss": -6.806116104125977, "global_step": 166035, "epoch": 3953} {"train_loss": -6.90207576751709, "global_step": 166036, "epoch": 3953} {"train_loss": -6.946369647979736, "global_step": 166037, "epoch": 3953} {"train_loss": -6.9869184494018555, "global_step": 166038, "epoch": 3953} {"train_loss": -6.792998313903809, "global_step": 166039, "epoch": 3953} {"train_loss": -6.921527862548828, "global_step": 166040, "epoch": 3953} {"train_loss": -6.8216938972473145, "global_step": 166041, "epoch": 3953} {"train_loss": -7.0051703453063965, "global_step": 166042, "epoch": 3953} {"train_loss": -6.870226860046387, "global_step": 166043, "epoch": 3953} {"train_loss": -6.877918243408203, "global_step": 166044, "epoch": 3953} {"train_loss": -7.060292720794678, "global_step": 166045, "epoch": 3953} {"train_loss": -6.8949761390686035, "global_step": 166046, "epoch": 3953} {"train_loss": -6.975659370422363, "global_step": 166047, "epoch": 3953} {"train_loss": -6.927855968475342, "global_step": 166048, "epoch": 3953} {"train_loss": -6.9126691818237305, "global_step": 166049, "epoch": 3953} {"train_loss": -7.043107986450195, "global_step": 166050, "epoch": 3953} {"train_loss": -6.92636775970459, "global_step": 166051, "epoch": 3953} {"train_loss": -6.925393104553223, "global_step": 166052, "epoch": 3953} {"train_loss": -6.958475112915039, "global_step": 166053, "epoch": 3953} {"train_loss": -7.025461196899414, "global_step": 166054, "epoch": 3953} {"train_loss": -6.95898962020874, "global_step": 166055, "epoch": 3953} {"train_loss": -7.0314507484436035, "global_step": 166056, "epoch": 3953} {"train_loss": -7.009825706481934, "global_step": 166057, "epoch": 3953} {"train_loss": -6.972583770751953, "global_step": 166058, "epoch": 3953} {"train_loss": -7.0285234451293945, "global_step": 166059, "epoch": 3953} {"train_loss": -7.005890846252441, "global_step": 166060, "epoch": 3953} {"train_loss": -7.0461506843566895, "global_step": 166061, "epoch": 3953} {"train_loss": -6.9890456199646, "global_step": 166062, "epoch": 3953} {"train_loss": -7.014904499053955, "global_step": 166063, "epoch": 3953} {"train_loss": -6.959099769592285, "global_step": 166064, "epoch": 3953} {"train_loss": -7.065908432006836, "global_step": 166065, "epoch": 3953} {"train_loss": -7.125490665435791, "global_step": 166066, "epoch": 3953} {"train_loss": -6.962430953979492, "global_step": 166067, "epoch": 3953, "val_loss": 68446.0} {"train_loss": -6.813536643981934, "global_step": 166068, "epoch": 3954} {"train_loss": -6.951209545135498, "global_step": 166069, "epoch": 3954} {"train_loss": -6.954043388366699, "global_step": 166070, "epoch": 3954} {"train_loss": -6.901444435119629, "global_step": 166071, "epoch": 3954} {"train_loss": -7.005322456359863, "global_step": 166072, "epoch": 3954} {"train_loss": -6.864974021911621, "global_step": 166073, "epoch": 3954} {"train_loss": -6.893387794494629, "global_step": 166074, "epoch": 3954} {"train_loss": -6.9643235206604, "global_step": 166075, "epoch": 3954} {"train_loss": -6.738186836242676, "global_step": 166076, "epoch": 3954} {"train_loss": -6.87396240234375, "global_step": 166077, "epoch": 3954} {"train_loss": -7.013740539550781, "global_step": 166078, "epoch": 3954} {"train_loss": -6.816540241241455, "global_step": 166079, "epoch": 3954} {"train_loss": -6.92734432220459, "global_step": 166080, "epoch": 3954} {"train_loss": -6.839883804321289, "global_step": 166081, "epoch": 3954} {"train_loss": -6.733247756958008, "global_step": 166082, "epoch": 3954} {"train_loss": -6.891866683959961, "global_step": 166083, "epoch": 3954} {"train_loss": -6.858194828033447, "global_step": 166084, "epoch": 3954} {"train_loss": -6.963436603546143, "global_step": 166085, "epoch": 3954} {"train_loss": -6.910213947296143, "global_step": 166086, "epoch": 3954} {"train_loss": -6.949547290802002, "global_step": 166087, "epoch": 3954} {"train_loss": -6.933736324310303, "global_step": 166088, "epoch": 3954} {"train_loss": -6.8722920417785645, "global_step": 166089, "epoch": 3954} {"train_loss": -7.009710788726807, "global_step": 166090, "epoch": 3954} {"train_loss": -7.068603038787842, "global_step": 166091, "epoch": 3954} {"train_loss": -7.01120662689209, "global_step": 166092, "epoch": 3954} {"train_loss": -6.959867477416992, "global_step": 166093, "epoch": 3954} {"train_loss": -7.03413200378418, "global_step": 166094, "epoch": 3954} {"train_loss": -6.868474960327148, "global_step": 166095, "epoch": 3954} {"train_loss": -7.000668048858643, "global_step": 166096, "epoch": 3954} {"train_loss": -6.914248466491699, "global_step": 166097, "epoch": 3954} {"train_loss": -6.965435981750488, "global_step": 166098, "epoch": 3954} {"train_loss": -6.929689407348633, "global_step": 166099, "epoch": 3954} {"train_loss": -6.929262161254883, "global_step": 166100, "epoch": 3954} {"train_loss": -7.008683204650879, "global_step": 166101, "epoch": 3954} {"train_loss": -6.930834770202637, "global_step": 166102, "epoch": 3954} {"train_loss": -6.936882972717285, "global_step": 166103, "epoch": 3954} {"train_loss": -6.986821174621582, "global_step": 166104, "epoch": 3954} {"train_loss": -6.932516574859619, "global_step": 166105, "epoch": 3954} {"train_loss": -6.851164817810059, "global_step": 166106, "epoch": 3954} {"train_loss": -6.954134464263916, "global_step": 166107, "epoch": 3954} {"train_loss": -6.951508522033691, "global_step": 166108, "epoch": 3954} {"train_loss": -6.924774805704753, "global_step": 166109, "epoch": 3954, "val_loss": 68670.546875} {"train_loss": -6.93902587890625, "global_step": 166110, "epoch": 3955} {"train_loss": -6.9849066734313965, "global_step": 166111, "epoch": 3955} {"train_loss": -7.008456230163574, "global_step": 166112, "epoch": 3955} {"train_loss": -6.860142707824707, "global_step": 166113, "epoch": 3955} {"train_loss": -7.053118705749512, "global_step": 166114, "epoch": 3955} {"train_loss": -6.915352821350098, "global_step": 166115, "epoch": 3955} {"train_loss": -6.9834136962890625, "global_step": 166116, "epoch": 3955} {"train_loss": -7.00737190246582, "global_step": 166117, "epoch": 3955} {"train_loss": -6.836243152618408, "global_step": 166118, "epoch": 3955} {"train_loss": -6.904658317565918, "global_step": 166119, "epoch": 3955} {"train_loss": -7.007213115692139, "global_step": 166120, "epoch": 3955} {"train_loss": -6.93004035949707, "global_step": 166121, "epoch": 3955} {"train_loss": -6.973222732543945, "global_step": 166122, "epoch": 3955} {"train_loss": -6.986414909362793, "global_step": 166123, "epoch": 3955} {"train_loss": -6.939708232879639, "global_step": 166124, "epoch": 3955} {"train_loss": -6.893730640411377, "global_step": 166125, "epoch": 3955} {"train_loss": -6.879034996032715, "global_step": 166126, "epoch": 3955} {"train_loss": -6.946834564208984, "global_step": 166127, "epoch": 3955} {"train_loss": -7.052386283874512, "global_step": 166128, "epoch": 3955} {"train_loss": -7.002559661865234, "global_step": 166129, "epoch": 3955} {"train_loss": -7.068619251251221, "global_step": 166130, "epoch": 3955} {"train_loss": -7.0093536376953125, "global_step": 166131, "epoch": 3955} {"train_loss": -6.943685054779053, "global_step": 166132, "epoch": 3955} {"train_loss": -6.9709272384643555, "global_step": 166133, "epoch": 3955} {"train_loss": -6.930156707763672, "global_step": 166134, "epoch": 3955} {"train_loss": -6.9877848625183105, "global_step": 166135, "epoch": 3955} {"train_loss": -7.040942192077637, "global_step": 166136, "epoch": 3955} {"train_loss": -7.059598922729492, "global_step": 166137, "epoch": 3955} {"train_loss": -6.996251583099365, "global_step": 166138, "epoch": 3955} {"train_loss": -6.990371227264404, "global_step": 166139, "epoch": 3955} {"train_loss": -6.9805684089660645, "global_step": 166140, "epoch": 3955} {"train_loss": -6.994070053100586, "global_step": 166141, "epoch": 3955} {"train_loss": -7.04902458190918, "global_step": 166142, "epoch": 3955} {"train_loss": -6.881403923034668, "global_step": 166143, "epoch": 3955} {"train_loss": -6.878769397735596, "global_step": 166144, "epoch": 3955} {"train_loss": -6.961183547973633, "global_step": 166145, "epoch": 3955} {"train_loss": -7.031438827514648, "global_step": 166146, "epoch": 3955} {"train_loss": -6.871189117431641, "global_step": 166147, "epoch": 3955} {"train_loss": -6.888588905334473, "global_step": 166148, "epoch": 3955} {"train_loss": -7.046369552612305, "global_step": 166149, "epoch": 3955} {"train_loss": -6.917141914367676, "global_step": 166150, "epoch": 3955} {"train_loss": -6.963676725115095, "global_step": 166151, "epoch": 3955, "val_loss": 68624.875} {"train_loss": -6.9339752197265625, "global_step": 166152, "epoch": 3956} {"train_loss": -6.883928298950195, "global_step": 166153, "epoch": 3956} {"train_loss": -6.951525688171387, "global_step": 166154, "epoch": 3956} {"train_loss": -6.943121910095215, "global_step": 166155, "epoch": 3956} {"train_loss": -6.865874767303467, "global_step": 166156, "epoch": 3956} {"train_loss": -6.982487678527832, "global_step": 166157, "epoch": 3956} {"train_loss": -6.922338485717773, "global_step": 166158, "epoch": 3956} {"train_loss": -6.88170051574707, "global_step": 166159, "epoch": 3956} {"train_loss": -6.909318447113037, "global_step": 166160, "epoch": 3956} {"train_loss": -6.9925336837768555, "global_step": 166161, "epoch": 3956} {"train_loss": -6.828631401062012, "global_step": 166162, "epoch": 3956} {"train_loss": -7.001321315765381, "global_step": 166163, "epoch": 3956} {"train_loss": -6.957312107086182, "global_step": 166164, "epoch": 3956} {"train_loss": -6.960080146789551, "global_step": 166165, "epoch": 3956} {"train_loss": -6.9708685874938965, "global_step": 166166, "epoch": 3956} {"train_loss": -6.95028018951416, "global_step": 166167, "epoch": 3956} {"train_loss": -6.86591911315918, "global_step": 166168, "epoch": 3956} {"train_loss": -6.940255165100098, "global_step": 166169, "epoch": 3956} {"train_loss": -6.928688049316406, "global_step": 166170, "epoch": 3956} {"train_loss": -6.954832553863525, "global_step": 166171, "epoch": 3956} {"train_loss": -6.960515975952148, "global_step": 166172, "epoch": 3956} {"train_loss": -6.906396865844727, "global_step": 166173, "epoch": 3956} {"train_loss": -7.023256301879883, "global_step": 166174, "epoch": 3956} {"train_loss": -6.889381408691406, "global_step": 166175, "epoch": 3956} {"train_loss": -7.024432182312012, "global_step": 166176, "epoch": 3956} {"train_loss": -6.912740707397461, "global_step": 166177, "epoch": 3956} {"train_loss": -7.092927932739258, "global_step": 166178, "epoch": 3956} {"train_loss": -6.944267749786377, "global_step": 166179, "epoch": 3956} {"train_loss": -7.056012153625488, "global_step": 166180, "epoch": 3956} {"train_loss": -7.006927490234375, "global_step": 166181, "epoch": 3956} {"train_loss": -7.054804801940918, "global_step": 166182, "epoch": 3956} {"train_loss": -6.957319736480713, "global_step": 166183, "epoch": 3956} {"train_loss": -6.972232818603516, "global_step": 166184, "epoch": 3956} {"train_loss": -6.972960948944092, "global_step": 166185, "epoch": 3956} {"train_loss": -6.998812675476074, "global_step": 166186, "epoch": 3956} {"train_loss": -6.966683864593506, "global_step": 166187, "epoch": 3956} {"train_loss": -6.936513900756836, "global_step": 166188, "epoch": 3956} {"train_loss": -7.014379501342773, "global_step": 166189, "epoch": 3956} {"train_loss": -6.990144729614258, "global_step": 166190, "epoch": 3956} {"train_loss": -6.779909133911133, "global_step": 166191, "epoch": 3956} {"train_loss": -6.993164539337158, "global_step": 166192, "epoch": 3956} {"train_loss": -6.950942005429949, "global_step": 166193, "epoch": 3956, "val_loss": 68568.9921875} {"train_loss": -6.920873641967773, "global_step": 166194, "epoch": 3957} {"train_loss": -6.866365909576416, "global_step": 166195, "epoch": 3957} {"train_loss": -6.924654006958008, "global_step": 166196, "epoch": 3957} {"train_loss": -6.8650312423706055, "global_step": 166197, "epoch": 3957} {"train_loss": -6.8325700759887695, "global_step": 166198, "epoch": 3957} {"train_loss": -6.860086441040039, "global_step": 166199, "epoch": 3957} {"train_loss": -6.863889217376709, "global_step": 166200, "epoch": 3957} {"train_loss": -6.899899482727051, "global_step": 166201, "epoch": 3957} {"train_loss": -6.881934642791748, "global_step": 166202, "epoch": 3957} {"train_loss": -6.870147705078125, "global_step": 166203, "epoch": 3957} {"train_loss": -6.88347864151001, "global_step": 166204, "epoch": 3957} {"train_loss": -6.961099624633789, "global_step": 166205, "epoch": 3957} {"train_loss": -6.890716552734375, "global_step": 166206, "epoch": 3957} {"train_loss": -7.015876293182373, "global_step": 166207, "epoch": 3957} {"train_loss": -6.896986961364746, "global_step": 166208, "epoch": 3957} {"train_loss": -7.017147064208984, "global_step": 166209, "epoch": 3957} {"train_loss": -6.984743118286133, "global_step": 166210, "epoch": 3957} {"train_loss": -6.952269554138184, "global_step": 166211, "epoch": 3957} {"train_loss": -6.945172309875488, "global_step": 166212, "epoch": 3957} {"train_loss": -6.943563938140869, "global_step": 166213, "epoch": 3957} {"train_loss": -7.042418956756592, "global_step": 166214, "epoch": 3957} {"train_loss": -6.96352481842041, "global_step": 166215, "epoch": 3957} {"train_loss": -6.967582702636719, "global_step": 166216, "epoch": 3957} {"train_loss": -7.000827789306641, "global_step": 166217, "epoch": 3957} {"train_loss": -7.044570446014404, "global_step": 166218, "epoch": 3957} {"train_loss": -7.010883331298828, "global_step": 166219, "epoch": 3957} {"train_loss": -6.978837966918945, "global_step": 166220, "epoch": 3957} {"train_loss": -6.798103332519531, "global_step": 166221, "epoch": 3957} {"train_loss": -7.0336198806762695, "global_step": 166222, "epoch": 3957} {"train_loss": -6.947599411010742, "global_step": 166223, "epoch": 3957} {"train_loss": -6.939547538757324, "global_step": 166224, "epoch": 3957} {"train_loss": -6.990726470947266, "global_step": 166225, "epoch": 3957} {"train_loss": -6.967217922210693, "global_step": 166226, "epoch": 3957} {"train_loss": -6.921108245849609, "global_step": 166227, "epoch": 3957} {"train_loss": -6.91346549987793, "global_step": 166228, "epoch": 3957} {"train_loss": -6.963595867156982, "global_step": 166229, "epoch": 3957} {"train_loss": -7.058559417724609, "global_step": 166230, "epoch": 3957} {"train_loss": -6.878801345825195, "global_step": 166231, "epoch": 3957} {"train_loss": -6.957918167114258, "global_step": 166232, "epoch": 3957} {"train_loss": -7.088252067565918, "global_step": 166233, "epoch": 3957} {"train_loss": -6.914579391479492, "global_step": 166234, "epoch": 3957} {"train_loss": -6.945156846727643, "global_step": 166235, "epoch": 3957, "val_loss": 68378.171875} {"train_loss": -6.913801193237305, "global_step": 166236, "epoch": 3958} {"train_loss": -6.892177581787109, "global_step": 166237, "epoch": 3958} {"train_loss": -6.985795974731445, "global_step": 166238, "epoch": 3958} {"train_loss": -6.887526035308838, "global_step": 166239, "epoch": 3958} {"train_loss": -6.971467971801758, "global_step": 166240, "epoch": 3958} {"train_loss": -6.954920768737793, "global_step": 166241, "epoch": 3958} {"train_loss": -6.958503723144531, "global_step": 166242, "epoch": 3958} {"train_loss": -6.973913669586182, "global_step": 166243, "epoch": 3958} {"train_loss": -6.868141174316406, "global_step": 166244, "epoch": 3958} {"train_loss": -6.88695764541626, "global_step": 166245, "epoch": 3958} {"train_loss": -6.948420524597168, "global_step": 166246, "epoch": 3958} {"train_loss": -6.837915897369385, "global_step": 166247, "epoch": 3958} {"train_loss": -6.922611713409424, "global_step": 166248, "epoch": 3958} {"train_loss": -6.905967712402344, "global_step": 166249, "epoch": 3958} {"train_loss": -6.795093536376953, "global_step": 166250, "epoch": 3958} {"train_loss": -6.828192234039307, "global_step": 166251, "epoch": 3958} {"train_loss": -6.8677778244018555, "global_step": 166252, "epoch": 3958} {"train_loss": -6.824395179748535, "global_step": 166253, "epoch": 3958} {"train_loss": -6.803746700286865, "global_step": 166254, "epoch": 3958} {"train_loss": -6.916844367980957, "global_step": 166255, "epoch": 3958} {"train_loss": -6.9510650634765625, "global_step": 166256, "epoch": 3958} {"train_loss": -6.874000549316406, "global_step": 166257, "epoch": 3958} {"train_loss": -6.764508247375488, "global_step": 166258, "epoch": 3958} {"train_loss": -6.963590145111084, "global_step": 166259, "epoch": 3958} {"train_loss": -6.8060712814331055, "global_step": 166260, "epoch": 3958} {"train_loss": -6.837569236755371, "global_step": 166261, "epoch": 3958} {"train_loss": -6.855706214904785, "global_step": 166262, "epoch": 3958} {"train_loss": -6.93239164352417, "global_step": 166263, "epoch": 3958} {"train_loss": -6.930280685424805, "global_step": 166264, "epoch": 3958} {"train_loss": -6.935061931610107, "global_step": 166265, "epoch": 3958} {"train_loss": -6.995279312133789, "global_step": 166266, "epoch": 3958} {"train_loss": -7.000805377960205, "global_step": 166267, "epoch": 3958} {"train_loss": -6.996068000793457, "global_step": 166268, "epoch": 3958} {"train_loss": -6.9528727531433105, "global_step": 166269, "epoch": 3958} {"train_loss": -6.968781471252441, "global_step": 166270, "epoch": 3958} {"train_loss": -7.000154495239258, "global_step": 166271, "epoch": 3958} {"train_loss": -6.954560279846191, "global_step": 166272, "epoch": 3958} {"train_loss": -7.041324615478516, "global_step": 166273, "epoch": 3958} {"train_loss": -6.873178958892822, "global_step": 166274, "epoch": 3958} {"train_loss": -6.852835655212402, "global_step": 166275, "epoch": 3958} {"train_loss": -6.958549499511719, "global_step": 166276, "epoch": 3958} {"train_loss": -6.909692628043039, "global_step": 166277, "epoch": 3958, "val_loss": 68386.921875} {"train_loss": -6.928493022918701, "global_step": 166278, "epoch": 3959} {"train_loss": -6.8813347816467285, "global_step": 166279, "epoch": 3959} {"train_loss": -6.979958534240723, "global_step": 166280, "epoch": 3959} {"train_loss": -6.904487609863281, "global_step": 166281, "epoch": 3959} {"train_loss": -6.813223361968994, "global_step": 166282, "epoch": 3959} {"train_loss": -7.026156425476074, "global_step": 166283, "epoch": 3959} {"train_loss": -6.965415954589844, "global_step": 166284, "epoch": 3959} {"train_loss": -6.95836067199707, "global_step": 166285, "epoch": 3959} {"train_loss": -6.941069602966309, "global_step": 166286, "epoch": 3959} {"train_loss": -6.957965850830078, "global_step": 166287, "epoch": 3959} {"train_loss": -7.040021896362305, "global_step": 166288, "epoch": 3959} {"train_loss": -6.947476863861084, "global_step": 166289, "epoch": 3959} {"train_loss": -7.066905975341797, "global_step": 166290, "epoch": 3959} {"train_loss": -6.947263240814209, "global_step": 166291, "epoch": 3959} {"train_loss": -6.963484764099121, "global_step": 166292, "epoch": 3959} {"train_loss": -6.912425994873047, "global_step": 166293, "epoch": 3959} {"train_loss": -6.913364887237549, "global_step": 166294, "epoch": 3959} {"train_loss": -6.966289043426514, "global_step": 166295, "epoch": 3959} {"train_loss": -6.995909690856934, "global_step": 166296, "epoch": 3959} {"train_loss": -6.886333465576172, "global_step": 166297, "epoch": 3959} {"train_loss": -6.938565731048584, "global_step": 166298, "epoch": 3959} {"train_loss": -6.961232662200928, "global_step": 166299, "epoch": 3959} {"train_loss": -6.999345779418945, "global_step": 166300, "epoch": 3959} {"train_loss": -6.981259346008301, "global_step": 166301, "epoch": 3959} {"train_loss": -6.920867443084717, "global_step": 166302, "epoch": 3959} {"train_loss": -6.9531049728393555, "global_step": 166303, "epoch": 3959} {"train_loss": -6.960270881652832, "global_step": 166304, "epoch": 3959} {"train_loss": -6.890774726867676, "global_step": 166305, "epoch": 3959} {"train_loss": -6.967865943908691, "global_step": 166306, "epoch": 3959} {"train_loss": -6.953999996185303, "global_step": 166307, "epoch": 3959} {"train_loss": -6.981862545013428, "global_step": 166308, "epoch": 3959} {"train_loss": -6.992892265319824, "global_step": 166309, "epoch": 3959} {"train_loss": -6.979119777679443, "global_step": 166310, "epoch": 3959} {"train_loss": -7.00627326965332, "global_step": 166311, "epoch": 3959} {"train_loss": -6.9445013999938965, "global_step": 166312, "epoch": 3959} {"train_loss": -6.990525722503662, "global_step": 166313, "epoch": 3959} {"train_loss": -6.968228340148926, "global_step": 166314, "epoch": 3959} {"train_loss": -7.038551330566406, "global_step": 166315, "epoch": 3959} {"train_loss": -7.018019676208496, "global_step": 166316, "epoch": 3959} {"train_loss": -6.982961177825928, "global_step": 166317, "epoch": 3959} {"train_loss": -6.9445905685424805, "global_step": 166318, "epoch": 3959} {"train_loss": -6.9603858561742875, "global_step": 166319, "epoch": 3959, "val_loss": 68556.78125} {"train_loss": -6.904460906982422, "global_step": 166320, "epoch": 3960} {"train_loss": -6.8596720695495605, "global_step": 166321, "epoch": 3960} {"train_loss": -6.963658809661865, "global_step": 166322, "epoch": 3960} {"train_loss": -7.029585838317871, "global_step": 166323, "epoch": 3960} {"train_loss": -6.9779486656188965, "global_step": 166324, "epoch": 3960} {"train_loss": -6.9472808837890625, "global_step": 166325, "epoch": 3960} {"train_loss": -7.100128650665283, "global_step": 166326, "epoch": 3960} {"train_loss": -6.993851184844971, "global_step": 166327, "epoch": 3960} {"train_loss": -6.958237648010254, "global_step": 166328, "epoch": 3960} {"train_loss": -6.820436477661133, "global_step": 166329, "epoch": 3960} {"train_loss": -6.874123573303223, "global_step": 166330, "epoch": 3960} {"train_loss": -6.913767337799072, "global_step": 166331, "epoch": 3960} {"train_loss": -6.855825901031494, "global_step": 166332, "epoch": 3960} {"train_loss": -6.895939826965332, "global_step": 166333, "epoch": 3960} {"train_loss": -6.879472732543945, "global_step": 166334, "epoch": 3960} {"train_loss": -6.83048152923584, "global_step": 166335, "epoch": 3960} {"train_loss": -7.010883331298828, "global_step": 166336, "epoch": 3960} {"train_loss": -6.884062767028809, "global_step": 166337, "epoch": 3960} {"train_loss": -6.978831768035889, "global_step": 166338, "epoch": 3960} {"train_loss": -7.076352119445801, "global_step": 166339, "epoch": 3960} {"train_loss": -6.888901233673096, "global_step": 166340, "epoch": 3960} {"train_loss": -6.999845504760742, "global_step": 166341, "epoch": 3960} {"train_loss": -6.814693450927734, "global_step": 166342, "epoch": 3960} {"train_loss": -6.803471088409424, "global_step": 166343, "epoch": 3960} {"train_loss": -7.000700950622559, "global_step": 166344, "epoch": 3960} {"train_loss": -6.99506950378418, "global_step": 166345, "epoch": 3960} {"train_loss": -7.0275163650512695, "global_step": 166346, "epoch": 3960} {"train_loss": -6.8835320472717285, "global_step": 166347, "epoch": 3960} {"train_loss": -7.022991180419922, "global_step": 166348, "epoch": 3960} {"train_loss": -6.975451469421387, "global_step": 166349, "epoch": 3960} {"train_loss": -7.029114723205566, "global_step": 166350, "epoch": 3960} {"train_loss": -6.978238105773926, "global_step": 166351, "epoch": 3960} {"train_loss": -6.8797712326049805, "global_step": 166352, "epoch": 3960} {"train_loss": -7.022525787353516, "global_step": 166353, "epoch": 3960} {"train_loss": -6.954561710357666, "global_step": 166354, "epoch": 3960} {"train_loss": -6.926288604736328, "global_step": 166355, "epoch": 3960} {"train_loss": -6.842613697052002, "global_step": 166356, "epoch": 3960} {"train_loss": -6.885024070739746, "global_step": 166357, "epoch": 3960} {"train_loss": -6.863027095794678, "global_step": 166358, "epoch": 3960} {"train_loss": -6.883166313171387, "global_step": 166359, "epoch": 3960} {"train_loss": -6.965376853942871, "global_step": 166360, "epoch": 3960} {"train_loss": -6.937469857079642, "global_step": 166361, "epoch": 3960, "val_loss": 68505.1796875} {"train_loss": -6.92536735534668, "global_step": 166362, "epoch": 3961} {"train_loss": -7.056704521179199, "global_step": 166363, "epoch": 3961} {"train_loss": -6.8749823570251465, "global_step": 166364, "epoch": 3961} {"train_loss": -6.892250061035156, "global_step": 166365, "epoch": 3961} {"train_loss": -6.993661880493164, "global_step": 166366, "epoch": 3961} {"train_loss": -7.009365558624268, "global_step": 166367, "epoch": 3961} {"train_loss": -6.964441776275635, "global_step": 166368, "epoch": 3961} {"train_loss": -6.926214218139648, "global_step": 166369, "epoch": 3961} {"train_loss": -6.929037094116211, "global_step": 166370, "epoch": 3961} {"train_loss": -6.883382797241211, "global_step": 166371, "epoch": 3961} {"train_loss": -6.947553634643555, "global_step": 166372, "epoch": 3961} {"train_loss": -6.963828086853027, "global_step": 166373, "epoch": 3961} {"train_loss": -6.904305934906006, "global_step": 166374, "epoch": 3961} {"train_loss": -6.970387935638428, "global_step": 166375, "epoch": 3961} {"train_loss": -6.952258586883545, "global_step": 166376, "epoch": 3961} {"train_loss": -6.9360222816467285, "global_step": 166377, "epoch": 3961} {"train_loss": -6.881608963012695, "global_step": 166378, "epoch": 3961} {"train_loss": -6.932605743408203, "global_step": 166379, "epoch": 3961} {"train_loss": -6.799221515655518, "global_step": 166380, "epoch": 3961} {"train_loss": -6.945319175720215, "global_step": 166381, "epoch": 3961} {"train_loss": -6.9328155517578125, "global_step": 166382, "epoch": 3961} {"train_loss": -6.829455375671387, "global_step": 166383, "epoch": 3961} {"train_loss": -6.8448896408081055, "global_step": 166384, "epoch": 3961} {"train_loss": -6.971606254577637, "global_step": 166385, "epoch": 3961} {"train_loss": -6.976700305938721, "global_step": 166386, "epoch": 3961} {"train_loss": -7.005305767059326, "global_step": 166387, "epoch": 3961} {"train_loss": -6.799521446228027, "global_step": 166388, "epoch": 3961} {"train_loss": -6.914494514465332, "global_step": 166389, "epoch": 3961} {"train_loss": -7.00990629196167, "global_step": 166390, "epoch": 3961} {"train_loss": -6.927416801452637, "global_step": 166391, "epoch": 3961} {"train_loss": -6.934811592102051, "global_step": 166392, "epoch": 3961} {"train_loss": -6.842164993286133, "global_step": 166393, "epoch": 3961} {"train_loss": -6.9073615074157715, "global_step": 166394, "epoch": 3961} {"train_loss": -7.087953567504883, "global_step": 166395, "epoch": 3961} {"train_loss": -6.96720027923584, "global_step": 166396, "epoch": 3961} {"train_loss": -6.918243885040283, "global_step": 166397, "epoch": 3961} {"train_loss": -6.953890800476074, "global_step": 166398, "epoch": 3961} {"train_loss": -6.86114501953125, "global_step": 166399, "epoch": 3961} {"train_loss": -6.989258766174316, "global_step": 166400, "epoch": 3961} {"train_loss": -6.82090950012207, "global_step": 166401, "epoch": 3961} {"train_loss": -6.941709995269775, "global_step": 166402, "epoch": 3961} {"train_loss": -6.928399687721615, "global_step": 166403, "epoch": 3961, "val_loss": 68571.515625} {"train_loss": -6.8942766189575195, "global_step": 166404, "epoch": 3962} {"train_loss": -6.799505233764648, "global_step": 166405, "epoch": 3962} {"train_loss": -6.981861114501953, "global_step": 166406, "epoch": 3962} {"train_loss": -6.9347639083862305, "global_step": 166407, "epoch": 3962} {"train_loss": -6.872507095336914, "global_step": 166408, "epoch": 3962} {"train_loss": -6.999385833740234, "global_step": 166409, "epoch": 3962} {"train_loss": -6.813933372497559, "global_step": 166410, "epoch": 3962} {"train_loss": -6.947501182556152, "global_step": 166411, "epoch": 3962} {"train_loss": -6.962174415588379, "global_step": 166412, "epoch": 3962} {"train_loss": -6.819774627685547, "global_step": 166413, "epoch": 3962} {"train_loss": -6.992216110229492, "global_step": 166414, "epoch": 3962} {"train_loss": -6.878767013549805, "global_step": 166415, "epoch": 3962} {"train_loss": -6.6360039710998535, "global_step": 166416, "epoch": 3962} {"train_loss": -6.8920183181762695, "global_step": 166417, "epoch": 3962} {"train_loss": -6.791218280792236, "global_step": 166418, "epoch": 3962} {"train_loss": -6.973771572113037, "global_step": 166419, "epoch": 3962} {"train_loss": -6.925201892852783, "global_step": 166420, "epoch": 3962} {"train_loss": -6.813066482543945, "global_step": 166421, "epoch": 3962} {"train_loss": -6.8833441734313965, "global_step": 166422, "epoch": 3962} {"train_loss": -6.846341133117676, "global_step": 166423, "epoch": 3962} {"train_loss": -6.8000593185424805, "global_step": 166424, "epoch": 3962} {"train_loss": -6.974153995513916, "global_step": 166425, "epoch": 3962} {"train_loss": -6.950583457946777, "global_step": 166426, "epoch": 3962} {"train_loss": -6.9136834144592285, "global_step": 166427, "epoch": 3962} {"train_loss": -6.936450958251953, "global_step": 166428, "epoch": 3962} {"train_loss": -6.911949157714844, "global_step": 166429, "epoch": 3962} {"train_loss": -7.014887809753418, "global_step": 166430, "epoch": 3962} {"train_loss": -6.846902847290039, "global_step": 166431, "epoch": 3962} {"train_loss": -6.897909164428711, "global_step": 166432, "epoch": 3962} {"train_loss": -6.947145462036133, "global_step": 166433, "epoch": 3962} {"train_loss": -7.012533664703369, "global_step": 166434, "epoch": 3962} {"train_loss": -6.987408638000488, "global_step": 166435, "epoch": 3962} {"train_loss": -6.941957473754883, "global_step": 166436, "epoch": 3962} {"train_loss": -6.94051456451416, "global_step": 166437, "epoch": 3962} {"train_loss": -6.930426597595215, "global_step": 166438, "epoch": 3962} {"train_loss": -6.943953514099121, "global_step": 166439, "epoch": 3962} {"train_loss": -6.855391979217529, "global_step": 166440, "epoch": 3962} {"train_loss": -6.976715087890625, "global_step": 166441, "epoch": 3962} {"train_loss": -6.972694396972656, "global_step": 166442, "epoch": 3962} {"train_loss": -7.00695276260376, "global_step": 166443, "epoch": 3962} {"train_loss": -6.81743860244751, "global_step": 166444, "epoch": 3962} {"train_loss": -6.908988112495059, "global_step": 166445, "epoch": 3962, "val_loss": 68529.640625} {"train_loss": -6.899528503417969, "global_step": 166446, "epoch": 3963} {"train_loss": -6.930337905883789, "global_step": 166447, "epoch": 3963} {"train_loss": -6.901782035827637, "global_step": 166448, "epoch": 3963} {"train_loss": -6.845100402832031, "global_step": 166449, "epoch": 3963} {"train_loss": -6.916627407073975, "global_step": 166450, "epoch": 3963} {"train_loss": -7.02687931060791, "global_step": 166451, "epoch": 3963} {"train_loss": -7.01031494140625, "global_step": 166452, "epoch": 3963} {"train_loss": -6.919228553771973, "global_step": 166453, "epoch": 3963} {"train_loss": -6.935659408569336, "global_step": 166454, "epoch": 3963} {"train_loss": -7.042993545532227, "global_step": 166455, "epoch": 3963} {"train_loss": -7.0495758056640625, "global_step": 166456, "epoch": 3963} {"train_loss": -7.068985939025879, "global_step": 166457, "epoch": 3963} {"train_loss": -7.0743279457092285, "global_step": 166458, "epoch": 3963} {"train_loss": -7.0142364501953125, "global_step": 166459, "epoch": 3963} {"train_loss": -6.882495403289795, "global_step": 166460, "epoch": 3963} {"train_loss": -6.888519287109375, "global_step": 166461, "epoch": 3963} {"train_loss": -6.945719242095947, "global_step": 166462, "epoch": 3963} {"train_loss": -6.856184482574463, "global_step": 166463, "epoch": 3963} {"train_loss": -7.030585765838623, "global_step": 166464, "epoch": 3963} {"train_loss": -7.003190994262695, "global_step": 166465, "epoch": 3963} {"train_loss": -7.060563087463379, "global_step": 166466, "epoch": 3963} {"train_loss": -6.994237899780273, "global_step": 166467, "epoch": 3963} {"train_loss": -7.0165205001831055, "global_step": 166468, "epoch": 3963} {"train_loss": -6.960186004638672, "global_step": 166469, "epoch": 3963} {"train_loss": -6.94932746887207, "global_step": 166470, "epoch": 3963} {"train_loss": -6.9936652183532715, "global_step": 166471, "epoch": 3963} {"train_loss": -6.9366774559021, "global_step": 166472, "epoch": 3963} {"train_loss": -6.9298481941223145, "global_step": 166473, "epoch": 3963} {"train_loss": -6.908348560333252, "global_step": 166474, "epoch": 3963} {"train_loss": -6.993805885314941, "global_step": 166475, "epoch": 3963} {"train_loss": -7.0649590492248535, "global_step": 166476, "epoch": 3963} {"train_loss": -6.873264312744141, "global_step": 166477, "epoch": 3963} {"train_loss": -6.988736152648926, "global_step": 166478, "epoch": 3963} {"train_loss": -7.116519927978516, "global_step": 166479, "epoch": 3963} {"train_loss": -6.923784255981445, "global_step": 166480, "epoch": 3963} {"train_loss": -7.032454967498779, "global_step": 166481, "epoch": 3963} {"train_loss": -6.957414627075195, "global_step": 166482, "epoch": 3963} {"train_loss": -7.016140937805176, "global_step": 166483, "epoch": 3963} {"train_loss": -7.003676414489746, "global_step": 166484, "epoch": 3963} {"train_loss": -7.024686813354492, "global_step": 166485, "epoch": 3963} {"train_loss": -6.865817546844482, "global_step": 166486, "epoch": 3963} {"train_loss": -6.972068003245762, "global_step": 166487, "epoch": 3963, "val_loss": 68373.9609375} {"train_loss": -6.927611351013184, "global_step": 166488, "epoch": 3964} {"train_loss": -6.915980339050293, "global_step": 166489, "epoch": 3964} {"train_loss": -6.97035026550293, "global_step": 166490, "epoch": 3964} {"train_loss": -6.894207954406738, "global_step": 166491, "epoch": 3964} {"train_loss": -6.801124095916748, "global_step": 166492, "epoch": 3964} {"train_loss": -6.870324611663818, "global_step": 166493, "epoch": 3964} {"train_loss": -6.986364364624023, "global_step": 166494, "epoch": 3964} {"train_loss": -6.89557409286499, "global_step": 166495, "epoch": 3964} {"train_loss": -6.915807247161865, "global_step": 166496, "epoch": 3964} {"train_loss": -6.9025983810424805, "global_step": 166497, "epoch": 3964} {"train_loss": -6.975873947143555, "global_step": 166498, "epoch": 3964} {"train_loss": -6.997155666351318, "global_step": 166499, "epoch": 3964} {"train_loss": -6.987226486206055, "global_step": 166500, "epoch": 3964} {"train_loss": -6.942214012145996, "global_step": 166501, "epoch": 3964} {"train_loss": -6.9188151359558105, "global_step": 166502, "epoch": 3964} {"train_loss": -6.831113815307617, "global_step": 166503, "epoch": 3964} {"train_loss": -6.925989151000977, "global_step": 166504, "epoch": 3964} {"train_loss": -6.943438529968262, "global_step": 166505, "epoch": 3964} {"train_loss": -6.9776811599731445, "global_step": 166506, "epoch": 3964} {"train_loss": -6.835648536682129, "global_step": 166507, "epoch": 3964} {"train_loss": -7.094653129577637, "global_step": 166508, "epoch": 3964} {"train_loss": -6.868691444396973, "global_step": 166509, "epoch": 3964} {"train_loss": -6.866332054138184, "global_step": 166510, "epoch": 3964} {"train_loss": -6.840995788574219, "global_step": 166511, "epoch": 3964} {"train_loss": -6.874045372009277, "global_step": 166512, "epoch": 3964} {"train_loss": -7.102153778076172, "global_step": 166513, "epoch": 3964} {"train_loss": -6.9259843826293945, "global_step": 166514, "epoch": 3964} {"train_loss": -7.008547306060791, "global_step": 166515, "epoch": 3964} {"train_loss": -6.93211555480957, "global_step": 166516, "epoch": 3964} {"train_loss": -6.908535003662109, "global_step": 166517, "epoch": 3964} {"train_loss": -6.854937553405762, "global_step": 166518, "epoch": 3964} {"train_loss": -6.959033012390137, "global_step": 166519, "epoch": 3964} {"train_loss": -6.980930328369141, "global_step": 166520, "epoch": 3964} {"train_loss": -6.8923020362854, "global_step": 166521, "epoch": 3964} {"train_loss": -6.92927360534668, "global_step": 166522, "epoch": 3964} {"train_loss": -6.996956825256348, "global_step": 166523, "epoch": 3964} {"train_loss": -6.9382805824279785, "global_step": 166524, "epoch": 3964} {"train_loss": -6.8993659019470215, "global_step": 166525, "epoch": 3964} {"train_loss": -6.993985652923584, "global_step": 166526, "epoch": 3964} {"train_loss": -6.7621355056762695, "global_step": 166527, "epoch": 3964} {"train_loss": -6.908805847167969, "global_step": 166528, "epoch": 3964} {"train_loss": -6.927051112765358, "global_step": 166529, "epoch": 3964, "val_loss": 68718.078125} {"train_loss": -7.057889461517334, "global_step": 166530, "epoch": 3965} {"train_loss": -7.126421928405762, "global_step": 166531, "epoch": 3965} {"train_loss": -6.968831539154053, "global_step": 166532, "epoch": 3965} {"train_loss": -6.985907554626465, "global_step": 166533, "epoch": 3965} {"train_loss": -6.941118240356445, "global_step": 166534, "epoch": 3965} {"train_loss": -7.148107528686523, "global_step": 166535, "epoch": 3965} {"train_loss": -7.055290222167969, "global_step": 166536, "epoch": 3965} {"train_loss": -6.995212078094482, "global_step": 166537, "epoch": 3965} {"train_loss": -6.944308280944824, "global_step": 166538, "epoch": 3965} {"train_loss": -7.010552406311035, "global_step": 166539, "epoch": 3965} {"train_loss": -7.0920281410217285, "global_step": 166540, "epoch": 3965} {"train_loss": -6.985532760620117, "global_step": 166541, "epoch": 3965} {"train_loss": -6.957436561584473, "global_step": 166542, "epoch": 3965} {"train_loss": -7.011103630065918, "global_step": 166543, "epoch": 3965} {"train_loss": -6.866459846496582, "global_step": 166544, "epoch": 3965} {"train_loss": -7.023580551147461, "global_step": 166545, "epoch": 3965} {"train_loss": -7.055359840393066, "global_step": 166546, "epoch": 3965} {"train_loss": -6.907915115356445, "global_step": 166547, "epoch": 3965} {"train_loss": -6.886879920959473, "global_step": 166548, "epoch": 3965} {"train_loss": -6.980103492736816, "global_step": 166549, "epoch": 3965} {"train_loss": -6.793983459472656, "global_step": 166550, "epoch": 3965} {"train_loss": -6.931468963623047, "global_step": 166551, "epoch": 3965} {"train_loss": -7.005588531494141, "global_step": 166552, "epoch": 3965} {"train_loss": -6.915546894073486, "global_step": 166553, "epoch": 3965} {"train_loss": -6.904058456420898, "global_step": 166554, "epoch": 3965} {"train_loss": -7.051412582397461, "global_step": 166555, "epoch": 3965} {"train_loss": -6.833529472351074, "global_step": 166556, "epoch": 3965} {"train_loss": -7.046914577484131, "global_step": 166557, "epoch": 3965} {"train_loss": -6.883394718170166, "global_step": 166558, "epoch": 3965} {"train_loss": -6.783164978027344, "global_step": 166559, "epoch": 3965} {"train_loss": -6.906606674194336, "global_step": 166560, "epoch": 3965} {"train_loss": -6.766566753387451, "global_step": 166561, "epoch": 3965} {"train_loss": -6.892592430114746, "global_step": 166562, "epoch": 3965} {"train_loss": -6.798405647277832, "global_step": 166563, "epoch": 3965} {"train_loss": -6.898194789886475, "global_step": 166564, "epoch": 3965} {"train_loss": -6.948719024658203, "global_step": 166565, "epoch": 3965} {"train_loss": -6.6751227378845215, "global_step": 166566, "epoch": 3965} {"train_loss": -6.8915886878967285, "global_step": 166567, "epoch": 3965} {"train_loss": -6.728199481964111, "global_step": 166568, "epoch": 3965} {"train_loss": -6.7971649169921875, "global_step": 166569, "epoch": 3965} {"train_loss": -6.98988151550293, "global_step": 166570, "epoch": 3965} {"train_loss": -6.935139633360363, "global_step": 166571, "epoch": 3965, "val_loss": 68394.546875} {"train_loss": -6.866162300109863, "global_step": 166572, "epoch": 3966} {"train_loss": -6.936167240142822, "global_step": 166573, "epoch": 3966} {"train_loss": -6.89119815826416, "global_step": 166574, "epoch": 3966} {"train_loss": -6.888670921325684, "global_step": 166575, "epoch": 3966} {"train_loss": -6.870107650756836, "global_step": 166576, "epoch": 3966} {"train_loss": -7.062236785888672, "global_step": 166577, "epoch": 3966} {"train_loss": -6.905722618103027, "global_step": 166578, "epoch": 3966} {"train_loss": -6.992233753204346, "global_step": 166579, "epoch": 3966} {"train_loss": -6.8744215965271, "global_step": 166580, "epoch": 3966} {"train_loss": -6.835239887237549, "global_step": 166581, "epoch": 3966} {"train_loss": -6.947989463806152, "global_step": 166582, "epoch": 3966} {"train_loss": -6.850632190704346, "global_step": 166583, "epoch": 3966} {"train_loss": -6.889216423034668, "global_step": 166584, "epoch": 3966} {"train_loss": -7.013092041015625, "global_step": 166585, "epoch": 3966} {"train_loss": -6.968730926513672, "global_step": 166586, "epoch": 3966} {"train_loss": -6.9435200691223145, "global_step": 166587, "epoch": 3966} {"train_loss": -6.948516845703125, "global_step": 166588, "epoch": 3966} {"train_loss": -6.870553493499756, "global_step": 166589, "epoch": 3966} {"train_loss": -7.120731353759766, "global_step": 166590, "epoch": 3966} {"train_loss": -7.002589225769043, "global_step": 166591, "epoch": 3966} {"train_loss": -6.955540657043457, "global_step": 166592, "epoch": 3966} {"train_loss": -6.962313652038574, "global_step": 166593, "epoch": 3966} {"train_loss": -7.057624340057373, "global_step": 166594, "epoch": 3966} {"train_loss": -6.961979866027832, "global_step": 166595, "epoch": 3966} {"train_loss": -6.876069068908691, "global_step": 166596, "epoch": 3966} {"train_loss": -6.991306781768799, "global_step": 166597, "epoch": 3966} {"train_loss": -6.892083644866943, "global_step": 166598, "epoch": 3966} {"train_loss": -6.844836235046387, "global_step": 166599, "epoch": 3966} {"train_loss": -6.999410629272461, "global_step": 166600, "epoch": 3966} {"train_loss": -6.8523712158203125, "global_step": 166601, "epoch": 3966} {"train_loss": -6.930284023284912, "global_step": 166602, "epoch": 3966} {"train_loss": -6.885847091674805, "global_step": 166603, "epoch": 3966} {"train_loss": -6.962120056152344, "global_step": 166604, "epoch": 3966} {"train_loss": -6.934142112731934, "global_step": 166605, "epoch": 3966} {"train_loss": -7.103569984436035, "global_step": 166606, "epoch": 3966} {"train_loss": -7.017802715301514, "global_step": 166607, "epoch": 3966} {"train_loss": -7.009693622589111, "global_step": 166608, "epoch": 3966} {"train_loss": -6.843616962432861, "global_step": 166609, "epoch": 3966} {"train_loss": -6.851022243499756, "global_step": 166610, "epoch": 3966} {"train_loss": -7.057581901550293, "global_step": 166611, "epoch": 3966} {"train_loss": -6.9579572677612305, "global_step": 166612, "epoch": 3966} {"train_loss": -6.947580099105835, "global_step": 166613, "epoch": 3966, "val_loss": 68553.0546875} {"train_loss": -6.962501525878906, "global_step": 166614, "epoch": 3967} {"train_loss": -6.984651565551758, "global_step": 166615, "epoch": 3967} {"train_loss": -7.075653076171875, "global_step": 166616, "epoch": 3967} {"train_loss": -6.875213146209717, "global_step": 166617, "epoch": 3967} {"train_loss": -7.054488182067871, "global_step": 166618, "epoch": 3967} {"train_loss": -6.956676006317139, "global_step": 166619, "epoch": 3967} {"train_loss": -6.913045883178711, "global_step": 166620, "epoch": 3967} {"train_loss": -7.028885841369629, "global_step": 166621, "epoch": 3967} {"train_loss": -7.042819499969482, "global_step": 166622, "epoch": 3967} {"train_loss": -6.911986351013184, "global_step": 166623, "epoch": 3967} {"train_loss": -6.977485656738281, "global_step": 166624, "epoch": 3967} {"train_loss": -6.958489418029785, "global_step": 166625, "epoch": 3967} {"train_loss": -6.932351112365723, "global_step": 166626, "epoch": 3967} {"train_loss": -6.837676525115967, "global_step": 166627, "epoch": 3967} {"train_loss": -6.997150421142578, "global_step": 166628, "epoch": 3967} {"train_loss": -6.808070659637451, "global_step": 166629, "epoch": 3967} {"train_loss": -6.847557067871094, "global_step": 166630, "epoch": 3967} {"train_loss": -6.945773124694824, "global_step": 166631, "epoch": 3967} {"train_loss": -6.859632968902588, "global_step": 166632, "epoch": 3967} {"train_loss": -7.011796951293945, "global_step": 166633, "epoch": 3967} {"train_loss": -6.86097526550293, "global_step": 166634, "epoch": 3967} {"train_loss": -6.88975715637207, "global_step": 166635, "epoch": 3967} {"train_loss": -6.975698471069336, "global_step": 166636, "epoch": 3967} {"train_loss": -6.8985161781311035, "global_step": 166637, "epoch": 3967} {"train_loss": -7.010879993438721, "global_step": 166638, "epoch": 3967} {"train_loss": -6.904473781585693, "global_step": 166639, "epoch": 3967} {"train_loss": -6.966151237487793, "global_step": 166640, "epoch": 3967} {"train_loss": -7.025524616241455, "global_step": 166641, "epoch": 3967} {"train_loss": -7.032841205596924, "global_step": 166642, "epoch": 3967} {"train_loss": -6.998358249664307, "global_step": 166643, "epoch": 3967} {"train_loss": -7.030464172363281, "global_step": 166644, "epoch": 3967} {"train_loss": -6.926817893981934, "global_step": 166645, "epoch": 3967} {"train_loss": -7.074728965759277, "global_step": 166646, "epoch": 3967} {"train_loss": -6.931535720825195, "global_step": 166647, "epoch": 3967} {"train_loss": -6.976907730102539, "global_step": 166648, "epoch": 3967} {"train_loss": -6.9022979736328125, "global_step": 166649, "epoch": 3967} {"train_loss": -6.874294757843018, "global_step": 166650, "epoch": 3967} {"train_loss": -6.912536144256592, "global_step": 166651, "epoch": 3967} {"train_loss": -7.024261951446533, "global_step": 166652, "epoch": 3967} {"train_loss": -7.021738529205322, "global_step": 166653, "epoch": 3967} {"train_loss": -6.927189826965332, "global_step": 166654, "epoch": 3967} {"train_loss": -6.953370854968116, "global_step": 166655, "epoch": 3967, "val_loss": 68493.3046875} {"train_loss": -6.945395469665527, "global_step": 166656, "epoch": 3968} {"train_loss": -7.054202079772949, "global_step": 166657, "epoch": 3968} {"train_loss": -6.930052757263184, "global_step": 166658, "epoch": 3968} {"train_loss": -6.87181282043457, "global_step": 166659, "epoch": 3968} {"train_loss": -6.960186958312988, "global_step": 166660, "epoch": 3968} {"train_loss": -6.826077461242676, "global_step": 166661, "epoch": 3968} {"train_loss": -6.986184120178223, "global_step": 166662, "epoch": 3968} {"train_loss": -7.004729270935059, "global_step": 166663, "epoch": 3968} {"train_loss": -6.929601192474365, "global_step": 166664, "epoch": 3968} {"train_loss": -6.994551658630371, "global_step": 166665, "epoch": 3968} {"train_loss": -6.979437828063965, "global_step": 166666, "epoch": 3968} {"train_loss": -6.879124641418457, "global_step": 166667, "epoch": 3968} {"train_loss": -6.956493854522705, "global_step": 166668, "epoch": 3968} {"train_loss": -6.948338985443115, "global_step": 166669, "epoch": 3968} {"train_loss": -6.867476940155029, "global_step": 166670, "epoch": 3968} {"train_loss": -7.02504301071167, "global_step": 166671, "epoch": 3968} {"train_loss": -6.964954376220703, "global_step": 166672, "epoch": 3968} {"train_loss": -6.998512268066406, "global_step": 166673, "epoch": 3968} {"train_loss": -6.912886142730713, "global_step": 166674, "epoch": 3968} {"train_loss": -6.938714027404785, "global_step": 166675, "epoch": 3968} {"train_loss": -6.98729944229126, "global_step": 166676, "epoch": 3968} {"train_loss": -7.023115158081055, "global_step": 166677, "epoch": 3968} {"train_loss": -7.007329940795898, "global_step": 166678, "epoch": 3968} {"train_loss": -6.956284999847412, "global_step": 166679, "epoch": 3968} {"train_loss": -6.892580032348633, "global_step": 166680, "epoch": 3968} {"train_loss": -6.953055381774902, "global_step": 166681, "epoch": 3968} {"train_loss": -6.995769500732422, "global_step": 166682, "epoch": 3968} {"train_loss": -7.0360870361328125, "global_step": 166683, "epoch": 3968} {"train_loss": -6.990527153015137, "global_step": 166684, "epoch": 3968} {"train_loss": -6.989426612854004, "global_step": 166685, "epoch": 3968} {"train_loss": -6.920198440551758, "global_step": 166686, "epoch": 3968} {"train_loss": -6.909298896789551, "global_step": 166687, "epoch": 3968} {"train_loss": -7.04102897644043, "global_step": 166688, "epoch": 3968} {"train_loss": -7.055214881896973, "global_step": 166689, "epoch": 3968} {"train_loss": -6.96469259262085, "global_step": 166690, "epoch": 3968} {"train_loss": -7.174098014831543, "global_step": 166691, "epoch": 3968} {"train_loss": -7.0014214515686035, "global_step": 166692, "epoch": 3968} {"train_loss": -6.934271812438965, "global_step": 166693, "epoch": 3968} {"train_loss": -6.986417770385742, "global_step": 166694, "epoch": 3968} {"train_loss": -6.9490461349487305, "global_step": 166695, "epoch": 3968} {"train_loss": -6.8742570877075195, "global_step": 166696, "epoch": 3968} {"train_loss": -6.966032346089681, "global_step": 166697, "epoch": 3968, "val_loss": 68605.234375} {"train_loss": -7.068136692047119, "global_step": 166698, "epoch": 3969} {"train_loss": -6.922016143798828, "global_step": 166699, "epoch": 3969} {"train_loss": -6.997199535369873, "global_step": 166700, "epoch": 3969} {"train_loss": -6.963214874267578, "global_step": 166701, "epoch": 3969} {"train_loss": -7.0196146965026855, "global_step": 166702, "epoch": 3969} {"train_loss": -6.909425735473633, "global_step": 166703, "epoch": 3969} {"train_loss": -6.99828577041626, "global_step": 166704, "epoch": 3969} {"train_loss": -6.958261013031006, "global_step": 166705, "epoch": 3969} {"train_loss": -7.13405704498291, "global_step": 166706, "epoch": 3969} {"train_loss": -7.104189872741699, "global_step": 166707, "epoch": 3969} {"train_loss": -6.984378814697266, "global_step": 166708, "epoch": 3969} {"train_loss": -7.023425579071045, "global_step": 166709, "epoch": 3969} {"train_loss": -7.1579060554504395, "global_step": 166710, "epoch": 3969} {"train_loss": -7.0512189865112305, "global_step": 166711, "epoch": 3969} {"train_loss": -6.993196487426758, "global_step": 166712, "epoch": 3969} {"train_loss": -7.068927764892578, "global_step": 166713, "epoch": 3969} {"train_loss": -6.955960273742676, "global_step": 166714, "epoch": 3969} {"train_loss": -6.925783157348633, "global_step": 166715, "epoch": 3969} {"train_loss": -6.98605489730835, "global_step": 166716, "epoch": 3969} {"train_loss": -7.072788238525391, "global_step": 166717, "epoch": 3969} {"train_loss": -6.971621990203857, "global_step": 166718, "epoch": 3969} {"train_loss": -6.91054105758667, "global_step": 166719, "epoch": 3969} {"train_loss": -7.002803802490234, "global_step": 166720, "epoch": 3969} {"train_loss": -7.03656005859375, "global_step": 166721, "epoch": 3969} {"train_loss": -6.980712413787842, "global_step": 166722, "epoch": 3969} {"train_loss": -6.7863969802856445, "global_step": 166723, "epoch": 3969} {"train_loss": -7.044201850891113, "global_step": 166724, "epoch": 3969} {"train_loss": -6.8352532386779785, "global_step": 166725, "epoch": 3969} {"train_loss": -6.908637523651123, "global_step": 166726, "epoch": 3969} {"train_loss": -6.885437965393066, "global_step": 166727, "epoch": 3969} {"train_loss": -6.984061241149902, "global_step": 166728, "epoch": 3969} {"train_loss": -6.966820240020752, "global_step": 166729, "epoch": 3969} {"train_loss": -6.940637588500977, "global_step": 166730, "epoch": 3969} {"train_loss": -6.983205318450928, "global_step": 166731, "epoch": 3969} {"train_loss": -7.059595108032227, "global_step": 166732, "epoch": 3969} {"train_loss": -7.010621070861816, "global_step": 166733, "epoch": 3969} {"train_loss": -6.918709754943848, "global_step": 166734, "epoch": 3969} {"train_loss": -7.049769401550293, "global_step": 166735, "epoch": 3969} {"train_loss": -6.981171607971191, "global_step": 166736, "epoch": 3969} {"train_loss": -7.076529502868652, "global_step": 166737, "epoch": 3969} {"train_loss": -6.964751720428467, "global_step": 166738, "epoch": 3969} {"train_loss": -6.99137586639041, "global_step": 166739, "epoch": 3969, "val_loss": 68585.234375} {"train_loss": -7.001075267791748, "global_step": 166740, "epoch": 3970} {"train_loss": -6.951998710632324, "global_step": 166741, "epoch": 3970} {"train_loss": -6.971357345581055, "global_step": 166742, "epoch": 3970} {"train_loss": -7.022129058837891, "global_step": 166743, "epoch": 3970} {"train_loss": -7.076992034912109, "global_step": 166744, "epoch": 3970} {"train_loss": -6.917910575866699, "global_step": 166745, "epoch": 3970} {"train_loss": -6.96306848526001, "global_step": 166746, "epoch": 3970} {"train_loss": -6.882123947143555, "global_step": 166747, "epoch": 3970} {"train_loss": -6.887399196624756, "global_step": 166748, "epoch": 3970} {"train_loss": -6.925806045532227, "global_step": 166749, "epoch": 3970} {"train_loss": -6.926067352294922, "global_step": 166750, "epoch": 3970} {"train_loss": -6.9170989990234375, "global_step": 166751, "epoch": 3970} {"train_loss": -7.0114898681640625, "global_step": 166752, "epoch": 3970} {"train_loss": -6.874967098236084, "global_step": 166753, "epoch": 3970} {"train_loss": -6.950577735900879, "global_step": 166754, "epoch": 3970} {"train_loss": -6.877117156982422, "global_step": 166755, "epoch": 3970} {"train_loss": -6.858310222625732, "global_step": 166756, "epoch": 3970} {"train_loss": -7.02937126159668, "global_step": 166757, "epoch": 3970} {"train_loss": -6.903685569763184, "global_step": 166758, "epoch": 3970} {"train_loss": -6.969445705413818, "global_step": 166759, "epoch": 3970} {"train_loss": -7.065361499786377, "global_step": 166760, "epoch": 3970} {"train_loss": -7.009524345397949, "global_step": 166761, "epoch": 3970} {"train_loss": -7.023791313171387, "global_step": 166762, "epoch": 3970} {"train_loss": -6.9630231857299805, "global_step": 166763, "epoch": 3970} {"train_loss": -7.076569557189941, "global_step": 166764, "epoch": 3970} {"train_loss": -7.135349750518799, "global_step": 166765, "epoch": 3970} {"train_loss": -6.941720008850098, "global_step": 166766, "epoch": 3970} {"train_loss": -6.917322158813477, "global_step": 166767, "epoch": 3970} {"train_loss": -6.860274791717529, "global_step": 166768, "epoch": 3970} {"train_loss": -6.955042839050293, "global_step": 166769, "epoch": 3970} {"train_loss": -6.846723556518555, "global_step": 166770, "epoch": 3970} {"train_loss": -6.577940940856934, "global_step": 166771, "epoch": 3970} {"train_loss": -7.018366813659668, "global_step": 166772, "epoch": 3970} {"train_loss": -6.859291076660156, "global_step": 166773, "epoch": 3970} {"train_loss": -6.932109832763672, "global_step": 166774, "epoch": 3970} {"train_loss": -6.958076000213623, "global_step": 166775, "epoch": 3970} {"train_loss": -6.822776794433594, "global_step": 166776, "epoch": 3970} {"train_loss": -6.921712875366211, "global_step": 166777, "epoch": 3970} {"train_loss": -6.713283538818359, "global_step": 166778, "epoch": 3970} {"train_loss": -6.925417900085449, "global_step": 166779, "epoch": 3970} {"train_loss": -6.857363224029541, "global_step": 166780, "epoch": 3970} {"train_loss": -6.9341237885611395, "global_step": 166781, "epoch": 3970, "val_loss": 68538.3984375} {"train_loss": -7.005069255828857, "global_step": 166782, "epoch": 3971} {"train_loss": -6.897618293762207, "global_step": 166783, "epoch": 3971} {"train_loss": -7.0039472579956055, "global_step": 166784, "epoch": 3971} {"train_loss": -6.910129547119141, "global_step": 166785, "epoch": 3971} {"train_loss": -6.940042018890381, "global_step": 166786, "epoch": 3971} {"train_loss": -6.873849391937256, "global_step": 166787, "epoch": 3971} {"train_loss": -7.009956359863281, "global_step": 166788, "epoch": 3971} {"train_loss": -6.989261627197266, "global_step": 166789, "epoch": 3971} {"train_loss": -6.947570323944092, "global_step": 166790, "epoch": 3971} {"train_loss": -6.874472141265869, "global_step": 166791, "epoch": 3971} {"train_loss": -6.904139518737793, "global_step": 166792, "epoch": 3971} {"train_loss": -6.994279384613037, "global_step": 166793, "epoch": 3971} {"train_loss": -6.916660785675049, "global_step": 166794, "epoch": 3971} {"train_loss": -6.915030479431152, "global_step": 166795, "epoch": 3971} {"train_loss": -6.953237533569336, "global_step": 166796, "epoch": 3971} {"train_loss": -7.074537754058838, "global_step": 166797, "epoch": 3971} {"train_loss": -6.965773105621338, "global_step": 166798, "epoch": 3971} {"train_loss": -6.992547512054443, "global_step": 166799, "epoch": 3971} {"train_loss": -7.132986068725586, "global_step": 166800, "epoch": 3971} {"train_loss": -7.078914165496826, "global_step": 166801, "epoch": 3971} {"train_loss": -7.031858921051025, "global_step": 166802, "epoch": 3971} {"train_loss": -6.999837875366211, "global_step": 166803, "epoch": 3971} {"train_loss": -7.020016670227051, "global_step": 166804, "epoch": 3971} {"train_loss": -7.029345989227295, "global_step": 166805, "epoch": 3971} {"train_loss": -7.079333782196045, "global_step": 166806, "epoch": 3971} {"train_loss": -7.055087089538574, "global_step": 166807, "epoch": 3971} {"train_loss": -7.058962821960449, "global_step": 166808, "epoch": 3971} {"train_loss": -6.893449783325195, "global_step": 166809, "epoch": 3971} {"train_loss": -7.039685249328613, "global_step": 166810, "epoch": 3971} {"train_loss": -7.014739036560059, "global_step": 166811, "epoch": 3971} {"train_loss": -6.977090358734131, "global_step": 166812, "epoch": 3971} {"train_loss": -7.019474983215332, "global_step": 166813, "epoch": 3971} {"train_loss": -7.053800106048584, "global_step": 166814, "epoch": 3971} {"train_loss": -6.9061689376831055, "global_step": 166815, "epoch": 3971} {"train_loss": -6.848259925842285, "global_step": 166816, "epoch": 3971} {"train_loss": -6.9405131340026855, "global_step": 166817, "epoch": 3971} {"train_loss": -6.9742512702941895, "global_step": 166818, "epoch": 3971} {"train_loss": -6.856993675231934, "global_step": 166819, "epoch": 3971} {"train_loss": -7.027152061462402, "global_step": 166820, "epoch": 3971} {"train_loss": -6.918543815612793, "global_step": 166821, "epoch": 3971} {"train_loss": -6.914302825927734, "global_step": 166822, "epoch": 3971} {"train_loss": -6.976916063399542, "global_step": 166823, "epoch": 3971, "val_loss": 68590.8515625} {"train_loss": -7.051468849182129, "global_step": 166824, "epoch": 3972} {"train_loss": -6.981969833374023, "global_step": 166825, "epoch": 3972} {"train_loss": -6.92723274230957, "global_step": 166826, "epoch": 3972} {"train_loss": -7.039821624755859, "global_step": 166827, "epoch": 3972} {"train_loss": -6.877655029296875, "global_step": 166828, "epoch": 3972} {"train_loss": -6.933566093444824, "global_step": 166829, "epoch": 3972} {"train_loss": -6.9400434494018555, "global_step": 166830, "epoch": 3972} {"train_loss": -6.900389671325684, "global_step": 166831, "epoch": 3972} {"train_loss": -6.978744983673096, "global_step": 166832, "epoch": 3972} {"train_loss": -6.987488269805908, "global_step": 166833, "epoch": 3972} {"train_loss": -6.909003734588623, "global_step": 166834, "epoch": 3972} {"train_loss": -6.9251909255981445, "global_step": 166835, "epoch": 3972} {"train_loss": -6.9857964515686035, "global_step": 166836, "epoch": 3972} {"train_loss": -6.945342063903809, "global_step": 166837, "epoch": 3972} {"train_loss": -6.840927600860596, "global_step": 166838, "epoch": 3972} {"train_loss": -7.033492088317871, "global_step": 166839, "epoch": 3972} {"train_loss": -6.894758224487305, "global_step": 166840, "epoch": 3972} {"train_loss": -7.014195442199707, "global_step": 166841, "epoch": 3972} {"train_loss": -6.94088077545166, "global_step": 166842, "epoch": 3972} {"train_loss": -6.915292263031006, "global_step": 166843, "epoch": 3972} {"train_loss": -7.022366523742676, "global_step": 166844, "epoch": 3972} {"train_loss": -6.936580181121826, "global_step": 166845, "epoch": 3972} {"train_loss": -6.971833229064941, "global_step": 166846, "epoch": 3972} {"train_loss": -6.918774127960205, "global_step": 166847, "epoch": 3972} {"train_loss": -6.972826957702637, "global_step": 166848, "epoch": 3972} {"train_loss": -7.059486389160156, "global_step": 166849, "epoch": 3972} {"train_loss": -6.949586868286133, "global_step": 166850, "epoch": 3972} {"train_loss": -6.982314109802246, "global_step": 166851, "epoch": 3972} {"train_loss": -7.023393630981445, "global_step": 166852, "epoch": 3972} {"train_loss": -6.9041900634765625, "global_step": 166853, "epoch": 3972} {"train_loss": -6.935484886169434, "global_step": 166854, "epoch": 3972} {"train_loss": -6.884300231933594, "global_step": 166855, "epoch": 3972} {"train_loss": -6.9832353591918945, "global_step": 166856, "epoch": 3972} {"train_loss": -7.030331611633301, "global_step": 166857, "epoch": 3972} {"train_loss": -6.832945346832275, "global_step": 166858, "epoch": 3972} {"train_loss": -7.014183044433594, "global_step": 166859, "epoch": 3972} {"train_loss": -7.133913516998291, "global_step": 166860, "epoch": 3972} {"train_loss": -7.033328056335449, "global_step": 166861, "epoch": 3972} {"train_loss": -7.029994010925293, "global_step": 166862, "epoch": 3972} {"train_loss": -6.9833269119262695, "global_step": 166863, "epoch": 3972} {"train_loss": -6.99169921875, "global_step": 166864, "epoch": 3972} {"train_loss": -6.967979056494577, "global_step": 166865, "epoch": 3972, "val_loss": 68561.625} {"train_loss": -6.932352066040039, "global_step": 166866, "epoch": 3973} {"train_loss": -6.957016944885254, "global_step": 166867, "epoch": 3973} {"train_loss": -7.0342912673950195, "global_step": 166868, "epoch": 3973} {"train_loss": -7.0080671310424805, "global_step": 166869, "epoch": 3973} {"train_loss": -6.972373008728027, "global_step": 166870, "epoch": 3973} {"train_loss": -6.9868974685668945, "global_step": 166871, "epoch": 3973} {"train_loss": -7.022315979003906, "global_step": 166872, "epoch": 3973} {"train_loss": -6.976043701171875, "global_step": 166873, "epoch": 3973} {"train_loss": -7.024172782897949, "global_step": 166874, "epoch": 3973} {"train_loss": -6.9544782638549805, "global_step": 166875, "epoch": 3973} {"train_loss": -7.009891510009766, "global_step": 166876, "epoch": 3973} {"train_loss": -6.989214897155762, "global_step": 166877, "epoch": 3973} {"train_loss": -6.94283390045166, "global_step": 166878, "epoch": 3973} {"train_loss": -7.016048431396484, "global_step": 166879, "epoch": 3973} {"train_loss": -7.018990516662598, "global_step": 166880, "epoch": 3973} {"train_loss": -7.0601606369018555, "global_step": 166881, "epoch": 3973} {"train_loss": -7.021243095397949, "global_step": 166882, "epoch": 3973} {"train_loss": -6.942755699157715, "global_step": 166883, "epoch": 3973} {"train_loss": -6.97072696685791, "global_step": 166884, "epoch": 3973} {"train_loss": -6.995306968688965, "global_step": 166885, "epoch": 3973} {"train_loss": -7.089627742767334, "global_step": 166886, "epoch": 3973} {"train_loss": -6.981931686401367, "global_step": 166887, "epoch": 3973} {"train_loss": -7.109031677246094, "global_step": 166888, "epoch": 3973} {"train_loss": -7.025495529174805, "global_step": 166889, "epoch": 3973} {"train_loss": -7.023818016052246, "global_step": 166890, "epoch": 3973} {"train_loss": -7.075754165649414, "global_step": 166891, "epoch": 3973} {"train_loss": -7.122942924499512, "global_step": 166892, "epoch": 3973} {"train_loss": -7.014245510101318, "global_step": 166893, "epoch": 3973} {"train_loss": -6.951290130615234, "global_step": 166894, "epoch": 3973} {"train_loss": -6.858654022216797, "global_step": 166895, "epoch": 3973} {"train_loss": -6.99009895324707, "global_step": 166896, "epoch": 3973} {"train_loss": -6.88416862487793, "global_step": 166897, "epoch": 3973} {"train_loss": -6.935132026672363, "global_step": 166898, "epoch": 3973} {"train_loss": -6.953705787658691, "global_step": 166899, "epoch": 3973} {"train_loss": -7.0065765380859375, "global_step": 166900, "epoch": 3973} {"train_loss": -6.8477630615234375, "global_step": 166901, "epoch": 3973} {"train_loss": -6.913835048675537, "global_step": 166902, "epoch": 3973} {"train_loss": -7.0027923583984375, "global_step": 166903, "epoch": 3973} {"train_loss": -6.746804714202881, "global_step": 166904, "epoch": 3973} {"train_loss": -6.930320739746094, "global_step": 166905, "epoch": 3973} {"train_loss": -6.7407732009887695, "global_step": 166906, "epoch": 3973} {"train_loss": -6.973946071806408, "global_step": 166907, "epoch": 3973, "val_loss": 68850.375} {"train_loss": -6.855006694793701, "global_step": 166908, "epoch": 3974} {"train_loss": -6.832786560058594, "global_step": 166909, "epoch": 3974} {"train_loss": -6.88289737701416, "global_step": 166910, "epoch": 3974} {"train_loss": -6.8683905601501465, "global_step": 166911, "epoch": 3974} {"train_loss": -6.865591049194336, "global_step": 166912, "epoch": 3974} {"train_loss": -6.823180198669434, "global_step": 166913, "epoch": 3974} {"train_loss": -6.863051414489746, "global_step": 166914, "epoch": 3974} {"train_loss": -6.9383745193481445, "global_step": 166915, "epoch": 3974} {"train_loss": -6.919179916381836, "global_step": 166916, "epoch": 3974} {"train_loss": -6.906529426574707, "global_step": 166917, "epoch": 3974} {"train_loss": -6.799307823181152, "global_step": 166918, "epoch": 3974} {"train_loss": -6.992493629455566, "global_step": 166919, "epoch": 3974} {"train_loss": -6.979557991027832, "global_step": 166920, "epoch": 3974} {"train_loss": -6.932323932647705, "global_step": 166921, "epoch": 3974} {"train_loss": -6.9405622482299805, "global_step": 166922, "epoch": 3974} {"train_loss": -6.861071586608887, "global_step": 166923, "epoch": 3974} {"train_loss": -6.971599102020264, "global_step": 166924, "epoch": 3974} {"train_loss": -6.965905666351318, "global_step": 166925, "epoch": 3974} {"train_loss": -6.90859842300415, "global_step": 166926, "epoch": 3974} {"train_loss": -7.080751895904541, "global_step": 166927, "epoch": 3974} {"train_loss": -6.939347267150879, "global_step": 166928, "epoch": 3974} {"train_loss": -6.9575653076171875, "global_step": 166929, "epoch": 3974} {"train_loss": -6.982390880584717, "global_step": 166930, "epoch": 3974} {"train_loss": -7.1038947105407715, "global_step": 166931, "epoch": 3974} {"train_loss": -6.900269985198975, "global_step": 166932, "epoch": 3974} {"train_loss": -6.911312580108643, "global_step": 166933, "epoch": 3974} {"train_loss": -6.9800286293029785, "global_step": 166934, "epoch": 3974} {"train_loss": -6.888876914978027, "global_step": 166935, "epoch": 3974} {"train_loss": -6.918365955352783, "global_step": 166936, "epoch": 3974} {"train_loss": -6.933320045471191, "global_step": 166937, "epoch": 3974} {"train_loss": -6.850152015686035, "global_step": 166938, "epoch": 3974} {"train_loss": -6.960012912750244, "global_step": 166939, "epoch": 3974} {"train_loss": -6.958388805389404, "global_step": 166940, "epoch": 3974} {"train_loss": -6.969415664672852, "global_step": 166941, "epoch": 3974} {"train_loss": -7.086483955383301, "global_step": 166942, "epoch": 3974} {"train_loss": -6.883617401123047, "global_step": 166943, "epoch": 3974} {"train_loss": -6.89128303527832, "global_step": 166944, "epoch": 3974} {"train_loss": -6.984771728515625, "global_step": 166945, "epoch": 3974} {"train_loss": -7.016406059265137, "global_step": 166946, "epoch": 3974} {"train_loss": -6.999377727508545, "global_step": 166947, "epoch": 3974} {"train_loss": -6.838580131530762, "global_step": 166948, "epoch": 3974} {"train_loss": -6.933261712392171, "global_step": 166949, "epoch": 3974, "val_loss": 68615.9921875} {"train_loss": -6.93424654006958, "global_step": 166950, "epoch": 3975} {"train_loss": -7.0250468254089355, "global_step": 166951, "epoch": 3975} {"train_loss": -6.91899299621582, "global_step": 166952, "epoch": 3975} {"train_loss": -6.917646884918213, "global_step": 166953, "epoch": 3975} {"train_loss": -7.007055282592773, "global_step": 166954, "epoch": 3975} {"train_loss": -6.9325714111328125, "global_step": 166955, "epoch": 3975} {"train_loss": -6.888537406921387, "global_step": 166956, "epoch": 3975} {"train_loss": -6.81418514251709, "global_step": 166957, "epoch": 3975} {"train_loss": -6.837910175323486, "global_step": 166958, "epoch": 3975} {"train_loss": -6.937363624572754, "global_step": 166959, "epoch": 3975} {"train_loss": -6.883963584899902, "global_step": 166960, "epoch": 3975} {"train_loss": -6.843194007873535, "global_step": 166961, "epoch": 3975} {"train_loss": -7.012296676635742, "global_step": 166962, "epoch": 3975} {"train_loss": -6.949917793273926, "global_step": 166963, "epoch": 3975} {"train_loss": -6.787095069885254, "global_step": 166964, "epoch": 3975} {"train_loss": -6.922176361083984, "global_step": 166965, "epoch": 3975} {"train_loss": -6.8032073974609375, "global_step": 166966, "epoch": 3975} {"train_loss": -6.812893867492676, "global_step": 166967, "epoch": 3975} {"train_loss": -6.878776550292969, "global_step": 166968, "epoch": 3975} {"train_loss": -6.877084732055664, "global_step": 166969, "epoch": 3975} {"train_loss": -6.913485050201416, "global_step": 166970, "epoch": 3975} {"train_loss": -6.7903032302856445, "global_step": 166971, "epoch": 3975} {"train_loss": -6.839169979095459, "global_step": 166972, "epoch": 3975} {"train_loss": -6.849800109863281, "global_step": 166973, "epoch": 3975} {"train_loss": -6.868052959442139, "global_step": 166974, "epoch": 3975} {"train_loss": -7.017999649047852, "global_step": 166975, "epoch": 3975} {"train_loss": -6.798455715179443, "global_step": 166976, "epoch": 3975} {"train_loss": -7.0018181800842285, "global_step": 166977, "epoch": 3975} {"train_loss": -6.912437438964844, "global_step": 166978, "epoch": 3975} {"train_loss": -6.8908491134643555, "global_step": 166979, "epoch": 3975} {"train_loss": -6.851568222045898, "global_step": 166980, "epoch": 3975} {"train_loss": -6.895427703857422, "global_step": 166981, "epoch": 3975} {"train_loss": -6.81864070892334, "global_step": 166982, "epoch": 3975} {"train_loss": -6.977484703063965, "global_step": 166983, "epoch": 3975} {"train_loss": -6.882426738739014, "global_step": 166984, "epoch": 3975} {"train_loss": -7.01291561126709, "global_step": 166985, "epoch": 3975} {"train_loss": -6.889480113983154, "global_step": 166986, "epoch": 3975} {"train_loss": -6.920426845550537, "global_step": 166987, "epoch": 3975} {"train_loss": -6.9326372146606445, "global_step": 166988, "epoch": 3975} {"train_loss": -6.984840393066406, "global_step": 166989, "epoch": 3975} {"train_loss": -7.014447212219238, "global_step": 166990, "epoch": 3975} {"train_loss": -6.904284216108776, "global_step": 166991, "epoch": 3975, "val_loss": 68513.6328125} {"train_loss": -7.032327651977539, "global_step": 166992, "epoch": 3976} {"train_loss": -6.903998374938965, "global_step": 166993, "epoch": 3976} {"train_loss": -6.925885200500488, "global_step": 166994, "epoch": 3976} {"train_loss": -6.968608856201172, "global_step": 166995, "epoch": 3976} {"train_loss": -7.050412178039551, "global_step": 166996, "epoch": 3976} {"train_loss": -6.871870040893555, "global_step": 166997, "epoch": 3976} {"train_loss": -7.059671878814697, "global_step": 166998, "epoch": 3976} {"train_loss": -6.962754249572754, "global_step": 166999, "epoch": 3976} {"train_loss": -6.974211692810059, "global_step": 167000, "epoch": 3976} {"train_loss": -7.0005717277526855, "global_step": 167001, "epoch": 3976} {"train_loss": -6.861656188964844, "global_step": 167002, "epoch": 3976} {"train_loss": -7.031808853149414, "global_step": 167003, "epoch": 3976} {"train_loss": -6.9719743728637695, "global_step": 167004, "epoch": 3976} {"train_loss": -6.974510192871094, "global_step": 167005, "epoch": 3976} {"train_loss": -6.975394248962402, "global_step": 167006, "epoch": 3976} {"train_loss": -7.041914939880371, "global_step": 167007, "epoch": 3976} {"train_loss": -6.928169250488281, "global_step": 167008, "epoch": 3976} {"train_loss": -6.9861297607421875, "global_step": 167009, "epoch": 3976} {"train_loss": -6.990257263183594, "global_step": 167010, "epoch": 3976} {"train_loss": -7.023067474365234, "global_step": 167011, "epoch": 3976} {"train_loss": -6.899515628814697, "global_step": 167012, "epoch": 3976} {"train_loss": -7.1160664558410645, "global_step": 167013, "epoch": 3976} {"train_loss": -6.9327545166015625, "global_step": 167014, "epoch": 3976} {"train_loss": -6.934486389160156, "global_step": 167015, "epoch": 3976} {"train_loss": -7.06179141998291, "global_step": 167016, "epoch": 3976} {"train_loss": -6.967942237854004, "global_step": 167017, "epoch": 3976} {"train_loss": -6.952510833740234, "global_step": 167018, "epoch": 3976} {"train_loss": -6.886796951293945, "global_step": 167019, "epoch": 3976} {"train_loss": -6.908352375030518, "global_step": 167020, "epoch": 3976} {"train_loss": -6.929318428039551, "global_step": 167021, "epoch": 3976} {"train_loss": -7.068156719207764, "global_step": 167022, "epoch": 3976} {"train_loss": -7.02197265625, "global_step": 167023, "epoch": 3976} {"train_loss": -7.088892459869385, "global_step": 167024, "epoch": 3976} {"train_loss": -7.017494201660156, "global_step": 167025, "epoch": 3976} {"train_loss": -7.0030198097229, "global_step": 167026, "epoch": 3976} {"train_loss": -7.055517196655273, "global_step": 167027, "epoch": 3976} {"train_loss": -7.028153896331787, "global_step": 167028, "epoch": 3976} {"train_loss": -7.044991493225098, "global_step": 167029, "epoch": 3976} {"train_loss": -6.881438255310059, "global_step": 167030, "epoch": 3976} {"train_loss": -6.915532112121582, "global_step": 167031, "epoch": 3976} {"train_loss": -6.979160785675049, "global_step": 167032, "epoch": 3976} {"train_loss": -6.980445419039045, "global_step": 167033, "epoch": 3976, "val_loss": 68625.03125} {"train_loss": -7.042549133300781, "global_step": 167034, "epoch": 3977} {"train_loss": -6.9285783767700195, "global_step": 167035, "epoch": 3977} {"train_loss": -6.791736602783203, "global_step": 167036, "epoch": 3977} {"train_loss": -6.97415018081665, "global_step": 167037, "epoch": 3977} {"train_loss": -6.991056442260742, "global_step": 167038, "epoch": 3977} {"train_loss": -6.95652961730957, "global_step": 167039, "epoch": 3977} {"train_loss": -6.890573024749756, "global_step": 167040, "epoch": 3977} {"train_loss": -6.897957801818848, "global_step": 167041, "epoch": 3977} {"train_loss": -7.085762023925781, "global_step": 167042, "epoch": 3977} {"train_loss": -7.044322967529297, "global_step": 167043, "epoch": 3977} {"train_loss": -6.956557750701904, "global_step": 167044, "epoch": 3977} {"train_loss": -6.979146957397461, "global_step": 167045, "epoch": 3977} {"train_loss": -6.921380996704102, "global_step": 167046, "epoch": 3977} {"train_loss": -7.010830879211426, "global_step": 167047, "epoch": 3977} {"train_loss": -7.010624885559082, "global_step": 167048, "epoch": 3977} {"train_loss": -6.920356273651123, "global_step": 167049, "epoch": 3977} {"train_loss": -6.883077621459961, "global_step": 167050, "epoch": 3977} {"train_loss": -7.003901481628418, "global_step": 167051, "epoch": 3977} {"train_loss": -6.938790321350098, "global_step": 167052, "epoch": 3977} {"train_loss": -7.006207466125488, "global_step": 167053, "epoch": 3977} {"train_loss": -7.073303699493408, "global_step": 167054, "epoch": 3977} {"train_loss": -7.039308547973633, "global_step": 167055, "epoch": 3977} {"train_loss": -6.907917022705078, "global_step": 167056, "epoch": 3977} {"train_loss": -6.9661970138549805, "global_step": 167057, "epoch": 3977} {"train_loss": -6.996538162231445, "global_step": 167058, "epoch": 3977} {"train_loss": -7.122579574584961, "global_step": 167059, "epoch": 3977} {"train_loss": -6.934042930603027, "global_step": 167060, "epoch": 3977} {"train_loss": -6.9487409591674805, "global_step": 167061, "epoch": 3977} {"train_loss": -7.087663650512695, "global_step": 167062, "epoch": 3977} {"train_loss": -7.042852401733398, "global_step": 167063, "epoch": 3977} {"train_loss": -7.039773941040039, "global_step": 167064, "epoch": 3977} {"train_loss": -6.826272964477539, "global_step": 167065, "epoch": 3977} {"train_loss": -7.04029655456543, "global_step": 167066, "epoch": 3977} {"train_loss": -6.975732326507568, "global_step": 167067, "epoch": 3977} {"train_loss": -6.8900957107543945, "global_step": 167068, "epoch": 3977} {"train_loss": -6.8928985595703125, "global_step": 167069, "epoch": 3977} {"train_loss": -6.8577985763549805, "global_step": 167070, "epoch": 3977} {"train_loss": -6.961520671844482, "global_step": 167071, "epoch": 3977} {"train_loss": -6.970680236816406, "global_step": 167072, "epoch": 3977} {"train_loss": -6.884747505187988, "global_step": 167073, "epoch": 3977} {"train_loss": -6.929141044616699, "global_step": 167074, "epoch": 3977} {"train_loss": -6.965106316975185, "global_step": 167075, "epoch": 3977, "val_loss": 68532.2109375} {"train_loss": -6.952126502990723, "global_step": 167076, "epoch": 3978} {"train_loss": -6.893853187561035, "global_step": 167077, "epoch": 3978} {"train_loss": -6.902117729187012, "global_step": 167078, "epoch": 3978} {"train_loss": -6.870983123779297, "global_step": 167079, "epoch": 3978} {"train_loss": -6.965967178344727, "global_step": 167080, "epoch": 3978} {"train_loss": -6.954842567443848, "global_step": 167081, "epoch": 3978} {"train_loss": -6.831603527069092, "global_step": 167082, "epoch": 3978} {"train_loss": -6.982893943786621, "global_step": 167083, "epoch": 3978} {"train_loss": -6.965958595275879, "global_step": 167084, "epoch": 3978} {"train_loss": -6.979811668395996, "global_step": 167085, "epoch": 3978} {"train_loss": -6.855079650878906, "global_step": 167086, "epoch": 3978} {"train_loss": -6.994967937469482, "global_step": 167087, "epoch": 3978} {"train_loss": -6.875143527984619, "global_step": 167088, "epoch": 3978} {"train_loss": -6.9407854080200195, "global_step": 167089, "epoch": 3978} {"train_loss": -7.024507522583008, "global_step": 167090, "epoch": 3978} {"train_loss": -6.853385925292969, "global_step": 167091, "epoch": 3978} {"train_loss": -7.066919803619385, "global_step": 167092, "epoch": 3978} {"train_loss": -6.931142807006836, "global_step": 167093, "epoch": 3978} {"train_loss": -7.034103870391846, "global_step": 167094, "epoch": 3978} {"train_loss": -7.007074356079102, "global_step": 167095, "epoch": 3978} {"train_loss": -6.97930908203125, "global_step": 167096, "epoch": 3978} {"train_loss": -6.8562750816345215, "global_step": 167097, "epoch": 3978} {"train_loss": -7.036184310913086, "global_step": 167098, "epoch": 3978} {"train_loss": -7.026510238647461, "global_step": 167099, "epoch": 3978} {"train_loss": -6.9492878913879395, "global_step": 167100, "epoch": 3978} {"train_loss": -7.074166297912598, "global_step": 167101, "epoch": 3978} {"train_loss": -6.982521057128906, "global_step": 167102, "epoch": 3978} {"train_loss": -6.933427810668945, "global_step": 167103, "epoch": 3978} {"train_loss": -7.078884601593018, "global_step": 167104, "epoch": 3978} {"train_loss": -7.069556713104248, "global_step": 167105, "epoch": 3978} {"train_loss": -6.892117500305176, "global_step": 167106, "epoch": 3978} {"train_loss": -6.957569122314453, "global_step": 167107, "epoch": 3978} {"train_loss": -6.944441795349121, "global_step": 167108, "epoch": 3978} {"train_loss": -7.025365829467773, "global_step": 167109, "epoch": 3978} {"train_loss": -6.922945976257324, "global_step": 167110, "epoch": 3978} {"train_loss": -6.993311882019043, "global_step": 167111, "epoch": 3978} {"train_loss": -6.958584785461426, "global_step": 167112, "epoch": 3978} {"train_loss": -6.89840030670166, "global_step": 167113, "epoch": 3978} {"train_loss": -6.902476787567139, "global_step": 167114, "epoch": 3978} {"train_loss": -6.850676536560059, "global_step": 167115, "epoch": 3978} {"train_loss": -6.793492317199707, "global_step": 167116, "epoch": 3978} {"train_loss": -6.950178872971308, "global_step": 167117, "epoch": 3978, "val_loss": 68583.5546875} {"train_loss": -6.937833309173584, "global_step": 167118, "epoch": 3979} {"train_loss": -6.933521270751953, "global_step": 167119, "epoch": 3979} {"train_loss": -6.902578830718994, "global_step": 167120, "epoch": 3979} {"train_loss": -6.7700090408325195, "global_step": 167121, "epoch": 3979} {"train_loss": -6.822448253631592, "global_step": 167122, "epoch": 3979} {"train_loss": -6.871157646179199, "global_step": 167123, "epoch": 3979} {"train_loss": -6.926454067230225, "global_step": 167124, "epoch": 3979} {"train_loss": -6.8435492515563965, "global_step": 167125, "epoch": 3979} {"train_loss": -6.797372817993164, "global_step": 167126, "epoch": 3979} {"train_loss": -6.868490219116211, "global_step": 167127, "epoch": 3979} {"train_loss": -6.935318946838379, "global_step": 167128, "epoch": 3979} {"train_loss": -6.852849960327148, "global_step": 167129, "epoch": 3979} {"train_loss": -6.87513542175293, "global_step": 167130, "epoch": 3979} {"train_loss": -6.917242050170898, "global_step": 167131, "epoch": 3979} {"train_loss": -6.763681411743164, "global_step": 167132, "epoch": 3979} {"train_loss": -7.049034118652344, "global_step": 167133, "epoch": 3979} {"train_loss": -6.731421947479248, "global_step": 167134, "epoch": 3979} {"train_loss": -6.927628040313721, "global_step": 167135, "epoch": 3979} {"train_loss": -6.806622505187988, "global_step": 167136, "epoch": 3979} {"train_loss": -6.931970596313477, "global_step": 167137, "epoch": 3979} {"train_loss": -6.951048374176025, "global_step": 167138, "epoch": 3979} {"train_loss": -6.969150543212891, "global_step": 167139, "epoch": 3979} {"train_loss": -6.932097911834717, "global_step": 167140, "epoch": 3979} {"train_loss": -6.953959941864014, "global_step": 167141, "epoch": 3979} {"train_loss": -6.728756427764893, "global_step": 167142, "epoch": 3979} {"train_loss": -6.9465227127075195, "global_step": 167143, "epoch": 3979} {"train_loss": -6.938982963562012, "global_step": 167144, "epoch": 3979} {"train_loss": -6.781848907470703, "global_step": 167145, "epoch": 3979} {"train_loss": -6.9721221923828125, "global_step": 167146, "epoch": 3979} {"train_loss": -6.913066864013672, "global_step": 167147, "epoch": 3979} {"train_loss": -6.840148448944092, "global_step": 167148, "epoch": 3979} {"train_loss": -7.004083633422852, "global_step": 167149, "epoch": 3979} {"train_loss": -6.911072731018066, "global_step": 167150, "epoch": 3979} {"train_loss": -6.923041820526123, "global_step": 167151, "epoch": 3979} {"train_loss": -6.977670669555664, "global_step": 167152, "epoch": 3979} {"train_loss": -6.9403886795043945, "global_step": 167153, "epoch": 3979} {"train_loss": -6.983730792999268, "global_step": 167154, "epoch": 3979} {"train_loss": -6.944453239440918, "global_step": 167155, "epoch": 3979} {"train_loss": -6.973762512207031, "global_step": 167156, "epoch": 3979} {"train_loss": -6.997424125671387, "global_step": 167157, "epoch": 3979} {"train_loss": -6.907242774963379, "global_step": 167158, "epoch": 3979} {"train_loss": -6.900794596899123, "global_step": 167159, "epoch": 3979, "val_loss": 68498.8984375} {"train_loss": -6.978520393371582, "global_step": 167160, "epoch": 3980} {"train_loss": -6.908547878265381, "global_step": 167161, "epoch": 3980} {"train_loss": -6.972160339355469, "global_step": 167162, "epoch": 3980} {"train_loss": -6.960957050323486, "global_step": 167163, "epoch": 3980} {"train_loss": -6.909352779388428, "global_step": 167164, "epoch": 3980} {"train_loss": -6.9704179763793945, "global_step": 167165, "epoch": 3980} {"train_loss": -6.986358642578125, "global_step": 167166, "epoch": 3980} {"train_loss": -6.906549453735352, "global_step": 167167, "epoch": 3980} {"train_loss": -6.835209846496582, "global_step": 167168, "epoch": 3980} {"train_loss": -7.0110883712768555, "global_step": 167169, "epoch": 3980} {"train_loss": -7.029125690460205, "global_step": 167170, "epoch": 3980} {"train_loss": -6.912193775177002, "global_step": 167171, "epoch": 3980} {"train_loss": -6.958568572998047, "global_step": 167172, "epoch": 3980} {"train_loss": -7.00958251953125, "global_step": 167173, "epoch": 3980} {"train_loss": -6.979863166809082, "global_step": 167174, "epoch": 3980} {"train_loss": -7.074967384338379, "global_step": 167175, "epoch": 3980} {"train_loss": -6.975719451904297, "global_step": 167176, "epoch": 3980} {"train_loss": -6.987674236297607, "global_step": 167177, "epoch": 3980} {"train_loss": -7.084709167480469, "global_step": 167178, "epoch": 3980} {"train_loss": -7.081583023071289, "global_step": 167179, "epoch": 3980} {"train_loss": -7.068077087402344, "global_step": 167180, "epoch": 3980} {"train_loss": -6.986422061920166, "global_step": 167181, "epoch": 3980} {"train_loss": -6.998055458068848, "global_step": 167182, "epoch": 3980} {"train_loss": -7.0320515632629395, "global_step": 167183, "epoch": 3980} {"train_loss": -6.925432205200195, "global_step": 167184, "epoch": 3980} {"train_loss": -7.033634185791016, "global_step": 167185, "epoch": 3980} {"train_loss": -6.963439464569092, "global_step": 167186, "epoch": 3980} {"train_loss": -6.994300842285156, "global_step": 167187, "epoch": 3980} {"train_loss": -6.944525241851807, "global_step": 167188, "epoch": 3980} {"train_loss": -7.043327331542969, "global_step": 167189, "epoch": 3980} {"train_loss": -6.894355297088623, "global_step": 167190, "epoch": 3980} {"train_loss": -6.982232570648193, "global_step": 167191, "epoch": 3980} {"train_loss": -7.008912086486816, "global_step": 167192, "epoch": 3980} {"train_loss": -6.930649757385254, "global_step": 167193, "epoch": 3980} {"train_loss": -6.995582580566406, "global_step": 167194, "epoch": 3980} {"train_loss": -7.094058513641357, "global_step": 167195, "epoch": 3980} {"train_loss": -7.043057441711426, "global_step": 167196, "epoch": 3980} {"train_loss": -6.957472801208496, "global_step": 167197, "epoch": 3980} {"train_loss": -7.026557922363281, "global_step": 167198, "epoch": 3980} {"train_loss": -6.934736251831055, "global_step": 167199, "epoch": 3980} {"train_loss": -6.948763847351074, "global_step": 167200, "epoch": 3980} {"train_loss": -6.983057146980649, "global_step": 167201, "epoch": 3980, "val_loss": 68507.1015625} {"train_loss": -6.884458065032959, "global_step": 167202, "epoch": 3981} {"train_loss": -6.912830352783203, "global_step": 167203, "epoch": 3981} {"train_loss": -6.9786176681518555, "global_step": 167204, "epoch": 3981} {"train_loss": -6.938882350921631, "global_step": 167205, "epoch": 3981} {"train_loss": -7.026789665222168, "global_step": 167206, "epoch": 3981} {"train_loss": -6.987235069274902, "global_step": 167207, "epoch": 3981} {"train_loss": -7.010125160217285, "global_step": 167208, "epoch": 3981} {"train_loss": -7.068806171417236, "global_step": 167209, "epoch": 3981} {"train_loss": -7.075865268707275, "global_step": 167210, "epoch": 3981} {"train_loss": -7.050454139709473, "global_step": 167211, "epoch": 3981} {"train_loss": -7.006892204284668, "global_step": 167212, "epoch": 3981} {"train_loss": -6.912691116333008, "global_step": 167213, "epoch": 3981} {"train_loss": -7.010649681091309, "global_step": 167214, "epoch": 3981} {"train_loss": -7.0244269371032715, "global_step": 167215, "epoch": 3981} {"train_loss": -6.954529285430908, "global_step": 167216, "epoch": 3981} {"train_loss": -6.917617321014404, "global_step": 167217, "epoch": 3981} {"train_loss": -6.8712053298950195, "global_step": 167218, "epoch": 3981} {"train_loss": -6.865597724914551, "global_step": 167219, "epoch": 3981} {"train_loss": -7.079026222229004, "global_step": 167220, "epoch": 3981} {"train_loss": -6.9136762619018555, "global_step": 167221, "epoch": 3981} {"train_loss": -6.96933126449585, "global_step": 167222, "epoch": 3981} {"train_loss": -7.056791305541992, "global_step": 167223, "epoch": 3981} {"train_loss": -6.985679626464844, "global_step": 167224, "epoch": 3981} {"train_loss": -7.139713764190674, "global_step": 167225, "epoch": 3981} {"train_loss": -6.942905426025391, "global_step": 167226, "epoch": 3981} {"train_loss": -6.925209999084473, "global_step": 167227, "epoch": 3981} {"train_loss": -7.0326032638549805, "global_step": 167228, "epoch": 3981} {"train_loss": -6.943539619445801, "global_step": 167229, "epoch": 3981} {"train_loss": -6.982591152191162, "global_step": 167230, "epoch": 3981} {"train_loss": -6.829801559448242, "global_step": 167231, "epoch": 3981} {"train_loss": -6.921257972717285, "global_step": 167232, "epoch": 3981} {"train_loss": -7.024511337280273, "global_step": 167233, "epoch": 3981} {"train_loss": -7.063076019287109, "global_step": 167234, "epoch": 3981} {"train_loss": -7.012962341308594, "global_step": 167235, "epoch": 3981} {"train_loss": -6.971640586853027, "global_step": 167236, "epoch": 3981} {"train_loss": -6.929619312286377, "global_step": 167237, "epoch": 3981} {"train_loss": -7.076886177062988, "global_step": 167238, "epoch": 3981} {"train_loss": -7.051155090332031, "global_step": 167239, "epoch": 3981} {"train_loss": -7.089108943939209, "global_step": 167240, "epoch": 3981} {"train_loss": -7.1287007331848145, "global_step": 167241, "epoch": 3981} {"train_loss": -6.974377632141113, "global_step": 167242, "epoch": 3981} {"train_loss": -6.990491798945835, "global_step": 167243, "epoch": 3981, "val_loss": 68619.3359375} {"train_loss": -6.9726715087890625, "global_step": 167244, "epoch": 3982} {"train_loss": -6.935203552246094, "global_step": 167245, "epoch": 3982} {"train_loss": -7.069523811340332, "global_step": 167246, "epoch": 3982} {"train_loss": -7.026031494140625, "global_step": 167247, "epoch": 3982} {"train_loss": -6.985090255737305, "global_step": 167248, "epoch": 3982} {"train_loss": -6.99615478515625, "global_step": 167249, "epoch": 3982} {"train_loss": -6.9206929206848145, "global_step": 167250, "epoch": 3982} {"train_loss": -6.9012556076049805, "global_step": 167251, "epoch": 3982} {"train_loss": -7.0046515464782715, "global_step": 167252, "epoch": 3982} {"train_loss": -6.934218406677246, "global_step": 167253, "epoch": 3982} {"train_loss": -6.983161926269531, "global_step": 167254, "epoch": 3982} {"train_loss": -7.07919979095459, "global_step": 167255, "epoch": 3982} {"train_loss": -6.847987174987793, "global_step": 167256, "epoch": 3982} {"train_loss": -6.982745170593262, "global_step": 167257, "epoch": 3982} {"train_loss": -6.869929313659668, "global_step": 167258, "epoch": 3982} {"train_loss": -6.958461761474609, "global_step": 167259, "epoch": 3982} {"train_loss": -6.843454360961914, "global_step": 167260, "epoch": 3982} {"train_loss": -6.920315265655518, "global_step": 167261, "epoch": 3982} {"train_loss": -7.013236999511719, "global_step": 167262, "epoch": 3982} {"train_loss": -6.880079746246338, "global_step": 167263, "epoch": 3982} {"train_loss": -6.939054489135742, "global_step": 167264, "epoch": 3982} {"train_loss": -6.980395317077637, "global_step": 167265, "epoch": 3982} {"train_loss": -7.058480262756348, "global_step": 167266, "epoch": 3982} {"train_loss": -6.957758903503418, "global_step": 167267, "epoch": 3982} {"train_loss": -6.964980602264404, "global_step": 167268, "epoch": 3982} {"train_loss": -6.9140143394470215, "global_step": 167269, "epoch": 3982} {"train_loss": -7.0167036056518555, "global_step": 167270, "epoch": 3982} {"train_loss": -6.931983470916748, "global_step": 167271, "epoch": 3982} {"train_loss": -6.968357086181641, "global_step": 167272, "epoch": 3982} {"train_loss": -7.018338680267334, "global_step": 167273, "epoch": 3982} {"train_loss": -7.012224197387695, "global_step": 167274, "epoch": 3982} {"train_loss": -6.982234001159668, "global_step": 167275, "epoch": 3982} {"train_loss": -6.957009792327881, "global_step": 167276, "epoch": 3982} {"train_loss": -6.8914475440979, "global_step": 167277, "epoch": 3982} {"train_loss": -7.050763130187988, "global_step": 167278, "epoch": 3982} {"train_loss": -6.9359660148620605, "global_step": 167279, "epoch": 3982} {"train_loss": -7.020391941070557, "global_step": 167280, "epoch": 3982} {"train_loss": -6.996767997741699, "global_step": 167281, "epoch": 3982} {"train_loss": -7.02352237701416, "global_step": 167282, "epoch": 3982} {"train_loss": -6.941083908081055, "global_step": 167283, "epoch": 3982} {"train_loss": -6.943723678588867, "global_step": 167284, "epoch": 3982} {"train_loss": -6.966015316191173, "global_step": 167285, "epoch": 3982, "val_loss": 68764.1484375} {"train_loss": -7.009139060974121, "global_step": 167286, "epoch": 3983} {"train_loss": -6.935911178588867, "global_step": 167287, "epoch": 3983} {"train_loss": -6.93975830078125, "global_step": 167288, "epoch": 3983} {"train_loss": -6.923525810241699, "global_step": 167289, "epoch": 3983} {"train_loss": -6.9110565185546875, "global_step": 167290, "epoch": 3983} {"train_loss": -6.984118461608887, "global_step": 167291, "epoch": 3983} {"train_loss": -6.936723709106445, "global_step": 167292, "epoch": 3983} {"train_loss": -6.921945571899414, "global_step": 167293, "epoch": 3983} {"train_loss": -6.896834850311279, "global_step": 167294, "epoch": 3983} {"train_loss": -6.820730209350586, "global_step": 167295, "epoch": 3983} {"train_loss": -6.778126239776611, "global_step": 167296, "epoch": 3983} {"train_loss": -6.852004528045654, "global_step": 167297, "epoch": 3983} {"train_loss": -6.82688570022583, "global_step": 167298, "epoch": 3983} {"train_loss": -6.982049465179443, "global_step": 167299, "epoch": 3983} {"train_loss": -6.760148525238037, "global_step": 167300, "epoch": 3983} {"train_loss": -6.776135444641113, "global_step": 167301, "epoch": 3983} {"train_loss": -6.896081447601318, "global_step": 167302, "epoch": 3983} {"train_loss": -6.855363845825195, "global_step": 167303, "epoch": 3983} {"train_loss": -6.753992557525635, "global_step": 167304, "epoch": 3983} {"train_loss": -6.791831970214844, "global_step": 167305, "epoch": 3983} {"train_loss": -6.870852470397949, "global_step": 167306, "epoch": 3983} {"train_loss": -6.831718444824219, "global_step": 167307, "epoch": 3983} {"train_loss": -6.699516296386719, "global_step": 167308, "epoch": 3983} {"train_loss": -6.849875450134277, "global_step": 167309, "epoch": 3983} {"train_loss": -6.822430610656738, "global_step": 167310, "epoch": 3983} {"train_loss": -6.750548362731934, "global_step": 167311, "epoch": 3983} {"train_loss": -6.863917350769043, "global_step": 167312, "epoch": 3983} {"train_loss": -6.748081207275391, "global_step": 167313, "epoch": 3983} {"train_loss": -6.824025630950928, "global_step": 167314, "epoch": 3983} {"train_loss": -6.8463850021362305, "global_step": 167315, "epoch": 3983} {"train_loss": -6.861517906188965, "global_step": 167316, "epoch": 3983} {"train_loss": -6.8893280029296875, "global_step": 167317, "epoch": 3983} {"train_loss": -6.850841999053955, "global_step": 167318, "epoch": 3983} {"train_loss": -6.879349231719971, "global_step": 167319, "epoch": 3983} {"train_loss": -6.724438667297363, "global_step": 167320, "epoch": 3983} {"train_loss": -6.757920265197754, "global_step": 167321, "epoch": 3983} {"train_loss": -6.8852386474609375, "global_step": 167322, "epoch": 3983} {"train_loss": -6.978806495666504, "global_step": 167323, "epoch": 3983} {"train_loss": -6.87984561920166, "global_step": 167324, "epoch": 3983} {"train_loss": -6.855604648590088, "global_step": 167325, "epoch": 3983} {"train_loss": -6.833554267883301, "global_step": 167326, "epoch": 3983} {"train_loss": -6.854863745825631, "global_step": 167327, "epoch": 3983, "val_loss": 68816.3125} {"train_loss": -6.691554069519043, "global_step": 167328, "epoch": 3984} {"train_loss": -6.888193130493164, "global_step": 167329, "epoch": 3984} {"train_loss": -6.7701921463012695, "global_step": 167330, "epoch": 3984} {"train_loss": -6.861427307128906, "global_step": 167331, "epoch": 3984} {"train_loss": -6.974404335021973, "global_step": 167332, "epoch": 3984} {"train_loss": -6.893575668334961, "global_step": 167333, "epoch": 3984} {"train_loss": -6.787917137145996, "global_step": 167334, "epoch": 3984} {"train_loss": -6.859960556030273, "global_step": 167335, "epoch": 3984} {"train_loss": -6.914252281188965, "global_step": 167336, "epoch": 3984} {"train_loss": -6.831760883331299, "global_step": 167337, "epoch": 3984} {"train_loss": -6.934079170227051, "global_step": 167338, "epoch": 3984} {"train_loss": -6.768904209136963, "global_step": 167339, "epoch": 3984} {"train_loss": -6.975371360778809, "global_step": 167340, "epoch": 3984} {"train_loss": -6.942020416259766, "global_step": 167341, "epoch": 3984} {"train_loss": -6.827336311340332, "global_step": 167342, "epoch": 3984} {"train_loss": -6.994170665740967, "global_step": 167343, "epoch": 3984} {"train_loss": -6.829429626464844, "global_step": 167344, "epoch": 3984} {"train_loss": -6.956801414489746, "global_step": 167345, "epoch": 3984} {"train_loss": -6.984789848327637, "global_step": 167346, "epoch": 3984} {"train_loss": -6.939694404602051, "global_step": 167347, "epoch": 3984} {"train_loss": -6.9037275314331055, "global_step": 167348, "epoch": 3984} {"train_loss": -6.882768154144287, "global_step": 167349, "epoch": 3984} {"train_loss": -6.965587139129639, "global_step": 167350, "epoch": 3984} {"train_loss": -6.914356231689453, "global_step": 167351, "epoch": 3984} {"train_loss": -7.051420211791992, "global_step": 167352, "epoch": 3984} {"train_loss": -6.873708248138428, "global_step": 167353, "epoch": 3984} {"train_loss": -6.951549530029297, "global_step": 167354, "epoch": 3984} {"train_loss": -6.8299055099487305, "global_step": 167355, "epoch": 3984} {"train_loss": -6.934666633605957, "global_step": 167356, "epoch": 3984} {"train_loss": -7.01943302154541, "global_step": 167357, "epoch": 3984} {"train_loss": -6.946722030639648, "global_step": 167358, "epoch": 3984} {"train_loss": -6.954588890075684, "global_step": 167359, "epoch": 3984} {"train_loss": -7.104198455810547, "global_step": 167360, "epoch": 3984} {"train_loss": -7.04132080078125, "global_step": 167361, "epoch": 3984} {"train_loss": -7.012780666351318, "global_step": 167362, "epoch": 3984} {"train_loss": -7.00040340423584, "global_step": 167363, "epoch": 3984} {"train_loss": -6.946641445159912, "global_step": 167364, "epoch": 3984} {"train_loss": -7.050201416015625, "global_step": 167365, "epoch": 3984} {"train_loss": -7.006997585296631, "global_step": 167366, "epoch": 3984} {"train_loss": -7.017127990722656, "global_step": 167367, "epoch": 3984} {"train_loss": -6.906414985656738, "global_step": 167368, "epoch": 3984} {"train_loss": -6.927559091931298, "global_step": 167369, "epoch": 3984, "val_loss": 68549.1953125} {"train_loss": -6.955998420715332, "global_step": 167370, "epoch": 3985} {"train_loss": -6.955514430999756, "global_step": 167371, "epoch": 3985} {"train_loss": -6.956689834594727, "global_step": 167372, "epoch": 3985} {"train_loss": -6.894081115722656, "global_step": 167373, "epoch": 3985} {"train_loss": -7.107608795166016, "global_step": 167374, "epoch": 3985} {"train_loss": -6.944862365722656, "global_step": 167375, "epoch": 3985} {"train_loss": -6.862581253051758, "global_step": 167376, "epoch": 3985} {"train_loss": -7.086441993713379, "global_step": 167377, "epoch": 3985} {"train_loss": -7.022012710571289, "global_step": 167378, "epoch": 3985} {"train_loss": -7.030300140380859, "global_step": 167379, "epoch": 3985} {"train_loss": -6.995319366455078, "global_step": 167380, "epoch": 3985} {"train_loss": -7.003365516662598, "global_step": 167381, "epoch": 3985} {"train_loss": -7.000043869018555, "global_step": 167382, "epoch": 3985} {"train_loss": -6.959583759307861, "global_step": 167383, "epoch": 3985} {"train_loss": -6.882591247558594, "global_step": 167384, "epoch": 3985} {"train_loss": -7.02197265625, "global_step": 167385, "epoch": 3985} {"train_loss": -6.964467525482178, "global_step": 167386, "epoch": 3985} {"train_loss": -7.065968990325928, "global_step": 167387, "epoch": 3985} {"train_loss": -7.021533012390137, "global_step": 167388, "epoch": 3985} {"train_loss": -6.971319675445557, "global_step": 167389, "epoch": 3985} {"train_loss": -7.01812744140625, "global_step": 167390, "epoch": 3985} {"train_loss": -6.934588432312012, "global_step": 167391, "epoch": 3985} {"train_loss": -6.994638919830322, "global_step": 167392, "epoch": 3985} {"train_loss": -6.92952823638916, "global_step": 167393, "epoch": 3985} {"train_loss": -6.98087215423584, "global_step": 167394, "epoch": 3985} {"train_loss": -6.8998589515686035, "global_step": 167395, "epoch": 3985} {"train_loss": -7.045164585113525, "global_step": 167396, "epoch": 3985} {"train_loss": -6.891056537628174, "global_step": 167397, "epoch": 3985} {"train_loss": -6.846348762512207, "global_step": 167398, "epoch": 3985} {"train_loss": -6.961026668548584, "global_step": 167399, "epoch": 3985} {"train_loss": -6.918467044830322, "global_step": 167400, "epoch": 3985} {"train_loss": -6.8632941246032715, "global_step": 167401, "epoch": 3985} {"train_loss": -6.881270408630371, "global_step": 167402, "epoch": 3985} {"train_loss": -6.866050720214844, "global_step": 167403, "epoch": 3985} {"train_loss": -6.856698989868164, "global_step": 167404, "epoch": 3985} {"train_loss": -6.9479522705078125, "global_step": 167405, "epoch": 3985} {"train_loss": -6.748795509338379, "global_step": 167406, "epoch": 3985} {"train_loss": -6.9827375411987305, "global_step": 167407, "epoch": 3985} {"train_loss": -6.955023288726807, "global_step": 167408, "epoch": 3985} {"train_loss": -6.768152236938477, "global_step": 167409, "epoch": 3985} {"train_loss": -6.830451011657715, "global_step": 167410, "epoch": 3985} {"train_loss": -6.944834289096651, "global_step": 167411, "epoch": 3985, "val_loss": 68677.671875} {"train_loss": -6.8047099113464355, "global_step": 167412, "epoch": 3986} {"train_loss": -6.944128513336182, "global_step": 167413, "epoch": 3986} {"train_loss": -6.970108985900879, "global_step": 167414, "epoch": 3986} {"train_loss": -6.9394659996032715, "global_step": 167415, "epoch": 3986} {"train_loss": -6.905117034912109, "global_step": 167416, "epoch": 3986} {"train_loss": -6.875997066497803, "global_step": 167417, "epoch": 3986} {"train_loss": -6.905844688415527, "global_step": 167418, "epoch": 3986} {"train_loss": -7.074248313903809, "global_step": 167419, "epoch": 3986} {"train_loss": -6.904163360595703, "global_step": 167420, "epoch": 3986} {"train_loss": -6.9853315353393555, "global_step": 167421, "epoch": 3986} {"train_loss": -6.971651554107666, "global_step": 167422, "epoch": 3986} {"train_loss": -6.957376480102539, "global_step": 167423, "epoch": 3986} {"train_loss": -6.984923362731934, "global_step": 167424, "epoch": 3986} {"train_loss": -7.040534496307373, "global_step": 167425, "epoch": 3986} {"train_loss": -6.972223281860352, "global_step": 167426, "epoch": 3986} {"train_loss": -7.133060932159424, "global_step": 167427, "epoch": 3986} {"train_loss": -7.079401016235352, "global_step": 167428, "epoch": 3986} {"train_loss": -7.031883239746094, "global_step": 167429, "epoch": 3986} {"train_loss": -6.912659168243408, "global_step": 167430, "epoch": 3986} {"train_loss": -7.046796798706055, "global_step": 167431, "epoch": 3986} {"train_loss": -6.944101333618164, "global_step": 167432, "epoch": 3986} {"train_loss": -7.0399675369262695, "global_step": 167433, "epoch": 3986} {"train_loss": -6.949632167816162, "global_step": 167434, "epoch": 3986} {"train_loss": -6.914574146270752, "global_step": 167435, "epoch": 3986} {"train_loss": -7.023963928222656, "global_step": 167436, "epoch": 3986} {"train_loss": -6.992581844329834, "global_step": 167437, "epoch": 3986} {"train_loss": -7.014697551727295, "global_step": 167438, "epoch": 3986} {"train_loss": -7.1168413162231445, "global_step": 167439, "epoch": 3986} {"train_loss": -6.996960639953613, "global_step": 167440, "epoch": 3986} {"train_loss": -7.0791168212890625, "global_step": 167441, "epoch": 3986} {"train_loss": -7.004670143127441, "global_step": 167442, "epoch": 3986} {"train_loss": -7.04170560836792, "global_step": 167443, "epoch": 3986} {"train_loss": -7.046660423278809, "global_step": 167444, "epoch": 3986} {"train_loss": -7.018682479858398, "global_step": 167445, "epoch": 3986} {"train_loss": -6.923252105712891, "global_step": 167446, "epoch": 3986} {"train_loss": -6.959941387176514, "global_step": 167447, "epoch": 3986} {"train_loss": -6.971468925476074, "global_step": 167448, "epoch": 3986} {"train_loss": -6.979006767272949, "global_step": 167449, "epoch": 3986} {"train_loss": -6.933368682861328, "global_step": 167450, "epoch": 3986} {"train_loss": -7.132343769073486, "global_step": 167451, "epoch": 3986} {"train_loss": -7.042603969573975, "global_step": 167452, "epoch": 3986} {"train_loss": -6.990327664784023, "global_step": 167453, "epoch": 3986, "val_loss": 68551.3984375} {"train_loss": -6.980103969573975, "global_step": 167454, "epoch": 3987} {"train_loss": -7.033697128295898, "global_step": 167455, "epoch": 3987} {"train_loss": -6.948949813842773, "global_step": 167456, "epoch": 3987} {"train_loss": -6.966629505157471, "global_step": 167457, "epoch": 3987} {"train_loss": -7.1063032150268555, "global_step": 167458, "epoch": 3987} {"train_loss": -6.9573211669921875, "global_step": 167459, "epoch": 3987} {"train_loss": -6.913002014160156, "global_step": 167460, "epoch": 3987} {"train_loss": -7.043457984924316, "global_step": 167461, "epoch": 3987} {"train_loss": -6.9060564041137695, "global_step": 167462, "epoch": 3987} {"train_loss": -7.033411979675293, "global_step": 167463, "epoch": 3987} {"train_loss": -7.026860237121582, "global_step": 167464, "epoch": 3987} {"train_loss": -7.078927516937256, "global_step": 167465, "epoch": 3987} {"train_loss": -6.9493584632873535, "global_step": 167466, "epoch": 3987} {"train_loss": -7.023829460144043, "global_step": 167467, "epoch": 3987} {"train_loss": -6.933645725250244, "global_step": 167468, "epoch": 3987} {"train_loss": -7.030879497528076, "global_step": 167469, "epoch": 3987} {"train_loss": -7.091671943664551, "global_step": 167470, "epoch": 3987} {"train_loss": -7.03329610824585, "global_step": 167471, "epoch": 3987} {"train_loss": -6.965677261352539, "global_step": 167472, "epoch": 3987} {"train_loss": -7.0040812492370605, "global_step": 167473, "epoch": 3987} {"train_loss": -6.900842666625977, "global_step": 167474, "epoch": 3987} {"train_loss": -6.904400825500488, "global_step": 167475, "epoch": 3987} {"train_loss": -6.913349151611328, "global_step": 167476, "epoch": 3987} {"train_loss": -6.96286678314209, "global_step": 167477, "epoch": 3987} {"train_loss": -6.881049633026123, "global_step": 167478, "epoch": 3987} {"train_loss": -6.872254371643066, "global_step": 167479, "epoch": 3987} {"train_loss": -6.899985313415527, "global_step": 167480, "epoch": 3987} {"train_loss": -6.865787506103516, "global_step": 167481, "epoch": 3987} {"train_loss": -6.955624580383301, "global_step": 167482, "epoch": 3987} {"train_loss": -6.940674781799316, "global_step": 167483, "epoch": 3987} {"train_loss": -6.820370674133301, "global_step": 167484, "epoch": 3987} {"train_loss": -6.82654333114624, "global_step": 167485, "epoch": 3987} {"train_loss": -6.995669364929199, "global_step": 167486, "epoch": 3987} {"train_loss": -6.851305961608887, "global_step": 167487, "epoch": 3987} {"train_loss": -6.9288330078125, "global_step": 167488, "epoch": 3987} {"train_loss": -6.869106292724609, "global_step": 167489, "epoch": 3987} {"train_loss": -6.838746070861816, "global_step": 167490, "epoch": 3987} {"train_loss": -6.9606614112854, "global_step": 167491, "epoch": 3987} {"train_loss": -6.895790100097656, "global_step": 167492, "epoch": 3987} {"train_loss": -6.9227399826049805, "global_step": 167493, "epoch": 3987} {"train_loss": -6.82189416885376, "global_step": 167494, "epoch": 3987} {"train_loss": -6.949262721197946, "global_step": 167495, "epoch": 3987, "val_loss": 68737.6640625} {"train_loss": -6.883200168609619, "global_step": 167496, "epoch": 3988} {"train_loss": -7.024196624755859, "global_step": 167497, "epoch": 3988} {"train_loss": -6.914823055267334, "global_step": 167498, "epoch": 3988} {"train_loss": -6.975520610809326, "global_step": 167499, "epoch": 3988} {"train_loss": -7.0042572021484375, "global_step": 167500, "epoch": 3988} {"train_loss": -6.960849761962891, "global_step": 167501, "epoch": 3988} {"train_loss": -7.015682697296143, "global_step": 167502, "epoch": 3988} {"train_loss": -6.796568393707275, "global_step": 167503, "epoch": 3988} {"train_loss": -7.066309928894043, "global_step": 167504, "epoch": 3988} {"train_loss": -6.8776936531066895, "global_step": 167505, "epoch": 3988} {"train_loss": -6.9875335693359375, "global_step": 167506, "epoch": 3988} {"train_loss": -7.009047508239746, "global_step": 167507, "epoch": 3988} {"train_loss": -6.996131896972656, "global_step": 167508, "epoch": 3988} {"train_loss": -7.041482448577881, "global_step": 167509, "epoch": 3988} {"train_loss": -6.948144912719727, "global_step": 167510, "epoch": 3988} {"train_loss": -6.817443370819092, "global_step": 167511, "epoch": 3988} {"train_loss": -6.979824066162109, "global_step": 167512, "epoch": 3988} {"train_loss": -6.977458953857422, "global_step": 167513, "epoch": 3988} {"train_loss": -6.942669868469238, "global_step": 167514, "epoch": 3988} {"train_loss": -6.9735870361328125, "global_step": 167515, "epoch": 3988} {"train_loss": -7.053792953491211, "global_step": 167516, "epoch": 3988} {"train_loss": -6.758954048156738, "global_step": 167517, "epoch": 3988} {"train_loss": -6.912888050079346, "global_step": 167518, "epoch": 3988} {"train_loss": -7.019824028015137, "global_step": 167519, "epoch": 3988} {"train_loss": -7.018514633178711, "global_step": 167520, "epoch": 3988} {"train_loss": -6.963094711303711, "global_step": 167521, "epoch": 3988} {"train_loss": -6.918455123901367, "global_step": 167522, "epoch": 3988} {"train_loss": -6.922024250030518, "global_step": 167523, "epoch": 3988} {"train_loss": -7.006735801696777, "global_step": 167524, "epoch": 3988} {"train_loss": -6.861962795257568, "global_step": 167525, "epoch": 3988} {"train_loss": -6.875790596008301, "global_step": 167526, "epoch": 3988} {"train_loss": -7.002485275268555, "global_step": 167527, "epoch": 3988} {"train_loss": -6.909929275512695, "global_step": 167528, "epoch": 3988} {"train_loss": -6.954761028289795, "global_step": 167529, "epoch": 3988} {"train_loss": -6.978105068206787, "global_step": 167530, "epoch": 3988} {"train_loss": -6.939976692199707, "global_step": 167531, "epoch": 3988} {"train_loss": -7.018669605255127, "global_step": 167532, "epoch": 3988} {"train_loss": -6.989138126373291, "global_step": 167533, "epoch": 3988} {"train_loss": -6.786211013793945, "global_step": 167534, "epoch": 3988} {"train_loss": -6.910244464874268, "global_step": 167535, "epoch": 3988} {"train_loss": -6.949021339416504, "global_step": 167536, "epoch": 3988} {"train_loss": -6.948788506644113, "global_step": 167537, "epoch": 3988, "val_loss": 68703.3046875} {"train_loss": -6.868524551391602, "global_step": 167538, "epoch": 3989} {"train_loss": -6.856523513793945, "global_step": 167539, "epoch": 3989} {"train_loss": -6.962782859802246, "global_step": 167540, "epoch": 3989} {"train_loss": -6.881174087524414, "global_step": 167541, "epoch": 3989} {"train_loss": -6.8978352546691895, "global_step": 167542, "epoch": 3989} {"train_loss": -6.875144004821777, "global_step": 167543, "epoch": 3989} {"train_loss": -6.821975231170654, "global_step": 167544, "epoch": 3989} {"train_loss": -6.893557071685791, "global_step": 167545, "epoch": 3989} {"train_loss": -6.821615695953369, "global_step": 167546, "epoch": 3989} {"train_loss": -6.9008708000183105, "global_step": 167547, "epoch": 3989} {"train_loss": -6.903739929199219, "global_step": 167548, "epoch": 3989} {"train_loss": -6.999115467071533, "global_step": 167549, "epoch": 3989} {"train_loss": -6.833374500274658, "global_step": 167550, "epoch": 3989} {"train_loss": -6.884783744812012, "global_step": 167551, "epoch": 3989} {"train_loss": -6.952693939208984, "global_step": 167552, "epoch": 3989} {"train_loss": -6.78297233581543, "global_step": 167553, "epoch": 3989} {"train_loss": -6.8213114738464355, "global_step": 167554, "epoch": 3989} {"train_loss": -6.853281497955322, "global_step": 167555, "epoch": 3989} {"train_loss": -6.823099136352539, "global_step": 167556, "epoch": 3989} {"train_loss": -6.871009826660156, "global_step": 167557, "epoch": 3989} {"train_loss": -6.861115455627441, "global_step": 167558, "epoch": 3989} {"train_loss": -6.902679443359375, "global_step": 167559, "epoch": 3989} {"train_loss": -6.9028401374816895, "global_step": 167560, "epoch": 3989} {"train_loss": -6.913191795349121, "global_step": 167561, "epoch": 3989} {"train_loss": -6.950275421142578, "global_step": 167562, "epoch": 3989} {"train_loss": -6.883599758148193, "global_step": 167563, "epoch": 3989} {"train_loss": -6.993983745574951, "global_step": 167564, "epoch": 3989} {"train_loss": -6.916841506958008, "global_step": 167565, "epoch": 3989} {"train_loss": -7.048491477966309, "global_step": 167566, "epoch": 3989} {"train_loss": -6.925562858581543, "global_step": 167567, "epoch": 3989} {"train_loss": -6.9101691246032715, "global_step": 167568, "epoch": 3989} {"train_loss": -6.875487327575684, "global_step": 167569, "epoch": 3989} {"train_loss": -6.948607921600342, "global_step": 167570, "epoch": 3989} {"train_loss": -6.925437927246094, "global_step": 167571, "epoch": 3989} {"train_loss": -6.921420097351074, "global_step": 167572, "epoch": 3989} {"train_loss": -6.867221832275391, "global_step": 167573, "epoch": 3989} {"train_loss": -6.934223175048828, "global_step": 167574, "epoch": 3989} {"train_loss": -6.8923540115356445, "global_step": 167575, "epoch": 3989} {"train_loss": -6.948929786682129, "global_step": 167576, "epoch": 3989} {"train_loss": -7.011009693145752, "global_step": 167577, "epoch": 3989} {"train_loss": -6.88724422454834, "global_step": 167578, "epoch": 3989} {"train_loss": -6.900781960714431, "global_step": 167579, "epoch": 3989, "val_loss": 68550.9921875} {"train_loss": -7.0206618309021, "global_step": 167580, "epoch": 3990} {"train_loss": -6.964323997497559, "global_step": 167581, "epoch": 3990} {"train_loss": -7.010784149169922, "global_step": 167582, "epoch": 3990} {"train_loss": -6.977895736694336, "global_step": 167583, "epoch": 3990} {"train_loss": -7.0142822265625, "global_step": 167584, "epoch": 3990} {"train_loss": -6.94568395614624, "global_step": 167585, "epoch": 3990} {"train_loss": -6.921182632446289, "global_step": 167586, "epoch": 3990} {"train_loss": -6.985332489013672, "global_step": 167587, "epoch": 3990} {"train_loss": -6.982742786407471, "global_step": 167588, "epoch": 3990} {"train_loss": -6.9868316650390625, "global_step": 167589, "epoch": 3990} {"train_loss": -6.830873966217041, "global_step": 167590, "epoch": 3990} {"train_loss": -6.993118762969971, "global_step": 167591, "epoch": 3990} {"train_loss": -6.991552352905273, "global_step": 167592, "epoch": 3990} {"train_loss": -7.0355329513549805, "global_step": 167593, "epoch": 3990} {"train_loss": -6.97277307510376, "global_step": 167594, "epoch": 3990} {"train_loss": -6.850247859954834, "global_step": 167595, "epoch": 3990} {"train_loss": -7.0000505447387695, "global_step": 167596, "epoch": 3990} {"train_loss": -6.864350318908691, "global_step": 167597, "epoch": 3990} {"train_loss": -7.041438102722168, "global_step": 167598, "epoch": 3990} {"train_loss": -6.797243118286133, "global_step": 167599, "epoch": 3990} {"train_loss": -6.941946029663086, "global_step": 167600, "epoch": 3990} {"train_loss": -6.921191215515137, "global_step": 167601, "epoch": 3990} {"train_loss": -6.955292224884033, "global_step": 167602, "epoch": 3990} {"train_loss": -7.011836051940918, "global_step": 167603, "epoch": 3990} {"train_loss": -7.007762432098389, "global_step": 167604, "epoch": 3990} {"train_loss": -6.970615386962891, "global_step": 167605, "epoch": 3990} {"train_loss": -7.044585227966309, "global_step": 167606, "epoch": 3990} {"train_loss": -6.921730041503906, "global_step": 167607, "epoch": 3990} {"train_loss": -7.014932632446289, "global_step": 167608, "epoch": 3990} {"train_loss": -6.983346939086914, "global_step": 167609, "epoch": 3990} {"train_loss": -6.936431884765625, "global_step": 167610, "epoch": 3990} {"train_loss": -6.9304375648498535, "global_step": 167611, "epoch": 3990} {"train_loss": -6.842683792114258, "global_step": 167612, "epoch": 3990} {"train_loss": -7.015511512756348, "global_step": 167613, "epoch": 3990} {"train_loss": -7.0432000160217285, "global_step": 167614, "epoch": 3990} {"train_loss": -6.961564540863037, "global_step": 167615, "epoch": 3990} {"train_loss": -6.876040458679199, "global_step": 167616, "epoch": 3990} {"train_loss": -6.994851112365723, "global_step": 167617, "epoch": 3990} {"train_loss": -7.033041000366211, "global_step": 167618, "epoch": 3990} {"train_loss": -6.984723091125488, "global_step": 167619, "epoch": 3990} {"train_loss": -6.96183443069458, "global_step": 167620, "epoch": 3990} {"train_loss": -6.961990776516142, "global_step": 167621, "epoch": 3990, "val_loss": 68394.3359375} {"train_loss": -6.941577434539795, "global_step": 167622, "epoch": 3991} {"train_loss": -6.956712245941162, "global_step": 167623, "epoch": 3991} {"train_loss": -6.871513366699219, "global_step": 167624, "epoch": 3991} {"train_loss": -6.906803607940674, "global_step": 167625, "epoch": 3991} {"train_loss": -6.891299247741699, "global_step": 167626, "epoch": 3991} {"train_loss": -6.863476276397705, "global_step": 167627, "epoch": 3991} {"train_loss": -6.932339191436768, "global_step": 167628, "epoch": 3991} {"train_loss": -6.870752811431885, "global_step": 167629, "epoch": 3991} {"train_loss": -6.780033111572266, "global_step": 167630, "epoch": 3991} {"train_loss": -6.967042922973633, "global_step": 167631, "epoch": 3991} {"train_loss": -6.895791053771973, "global_step": 167632, "epoch": 3991} {"train_loss": -6.919203281402588, "global_step": 167633, "epoch": 3991} {"train_loss": -6.925520896911621, "global_step": 167634, "epoch": 3991} {"train_loss": -6.898815155029297, "global_step": 167635, "epoch": 3991} {"train_loss": -7.005579948425293, "global_step": 167636, "epoch": 3991} {"train_loss": -7.043947219848633, "global_step": 167637, "epoch": 3991} {"train_loss": -6.979585647583008, "global_step": 167638, "epoch": 3991} {"train_loss": -7.07535457611084, "global_step": 167639, "epoch": 3991} {"train_loss": -7.036903381347656, "global_step": 167640, "epoch": 3991} {"train_loss": -7.075979232788086, "global_step": 167641, "epoch": 3991} {"train_loss": -7.057737350463867, "global_step": 167642, "epoch": 3991} {"train_loss": -7.005666732788086, "global_step": 167643, "epoch": 3991} {"train_loss": -6.906609058380127, "global_step": 167644, "epoch": 3991} {"train_loss": -7.028997421264648, "global_step": 167645, "epoch": 3991} {"train_loss": -7.034739017486572, "global_step": 167646, "epoch": 3991} {"train_loss": -7.029452323913574, "global_step": 167647, "epoch": 3991} {"train_loss": -7.022513389587402, "global_step": 167648, "epoch": 3991} {"train_loss": -7.016064643859863, "global_step": 167649, "epoch": 3991} {"train_loss": -7.103382110595703, "global_step": 167650, "epoch": 3991} {"train_loss": -6.962697982788086, "global_step": 167651, "epoch": 3991} {"train_loss": -7.0031843185424805, "global_step": 167652, "epoch": 3991} {"train_loss": -6.981355667114258, "global_step": 167653, "epoch": 3991} {"train_loss": -6.933905124664307, "global_step": 167654, "epoch": 3991} {"train_loss": -7.13694429397583, "global_step": 167655, "epoch": 3991} {"train_loss": -6.992743492126465, "global_step": 167656, "epoch": 3991} {"train_loss": -7.029534339904785, "global_step": 167657, "epoch": 3991} {"train_loss": -7.071715831756592, "global_step": 167658, "epoch": 3991} {"train_loss": -6.975045204162598, "global_step": 167659, "epoch": 3991} {"train_loss": -6.985415458679199, "global_step": 167660, "epoch": 3991} {"train_loss": -7.195039749145508, "global_step": 167661, "epoch": 3991} {"train_loss": -7.039149284362793, "global_step": 167662, "epoch": 3991} {"train_loss": -6.984261728468395, "global_step": 167663, "epoch": 3991, "val_loss": 68457.1484375} {"train_loss": -7.093631744384766, "global_step": 167664, "epoch": 3992} {"train_loss": -7.012375354766846, "global_step": 167665, "epoch": 3992} {"train_loss": -6.955782890319824, "global_step": 167666, "epoch": 3992} {"train_loss": -6.925429344177246, "global_step": 167667, "epoch": 3992} {"train_loss": -6.948648452758789, "global_step": 167668, "epoch": 3992} {"train_loss": -6.952847957611084, "global_step": 167669, "epoch": 3992} {"train_loss": -6.94093132019043, "global_step": 167670, "epoch": 3992} {"train_loss": -6.913641929626465, "global_step": 167671, "epoch": 3992} {"train_loss": -6.944280624389648, "global_step": 167672, "epoch": 3992} {"train_loss": -7.006209373474121, "global_step": 167673, "epoch": 3992} {"train_loss": -6.938799858093262, "global_step": 167674, "epoch": 3992} {"train_loss": -7.032700538635254, "global_step": 167675, "epoch": 3992} {"train_loss": -6.952617645263672, "global_step": 167676, "epoch": 3992} {"train_loss": -6.962673187255859, "global_step": 167677, "epoch": 3992} {"train_loss": -6.923435211181641, "global_step": 167678, "epoch": 3992} {"train_loss": -6.929653167724609, "global_step": 167679, "epoch": 3992} {"train_loss": -6.987237930297852, "global_step": 167680, "epoch": 3992} {"train_loss": -7.014625072479248, "global_step": 167681, "epoch": 3992} {"train_loss": -6.975204944610596, "global_step": 167682, "epoch": 3992} {"train_loss": -6.947118759155273, "global_step": 167683, "epoch": 3992} {"train_loss": -6.861356735229492, "global_step": 167684, "epoch": 3992} {"train_loss": -6.825333595275879, "global_step": 167685, "epoch": 3992} {"train_loss": -6.86055850982666, "global_step": 167686, "epoch": 3992} {"train_loss": -6.972380638122559, "global_step": 167687, "epoch": 3992} {"train_loss": -6.9291558265686035, "global_step": 167688, "epoch": 3992} {"train_loss": -6.879322528839111, "global_step": 167689, "epoch": 3992} {"train_loss": -6.9446563720703125, "global_step": 167690, "epoch": 3992} {"train_loss": -6.963360786437988, "global_step": 167691, "epoch": 3992} {"train_loss": -6.8862504959106445, "global_step": 167692, "epoch": 3992} {"train_loss": -6.861565589904785, "global_step": 167693, "epoch": 3992} {"train_loss": -6.972599506378174, "global_step": 167694, "epoch": 3992} {"train_loss": -6.927562713623047, "global_step": 167695, "epoch": 3992} {"train_loss": -6.944258689880371, "global_step": 167696, "epoch": 3992} {"train_loss": -6.977323055267334, "global_step": 167697, "epoch": 3992} {"train_loss": -6.954558372497559, "global_step": 167698, "epoch": 3992} {"train_loss": -6.844969749450684, "global_step": 167699, "epoch": 3992} {"train_loss": -6.994855880737305, "global_step": 167700, "epoch": 3992} {"train_loss": -6.997819900512695, "global_step": 167701, "epoch": 3992} {"train_loss": -6.915946960449219, "global_step": 167702, "epoch": 3992} {"train_loss": -6.987680435180664, "global_step": 167703, "epoch": 3992} {"train_loss": -6.8942790031433105, "global_step": 167704, "epoch": 3992} {"train_loss": -6.947362581888835, "global_step": 167705, "epoch": 3992, "val_loss": 68558.6875} {"train_loss": -6.998207092285156, "global_step": 167706, "epoch": 3993} {"train_loss": -6.954854965209961, "global_step": 167707, "epoch": 3993} {"train_loss": -6.928250312805176, "global_step": 167708, "epoch": 3993} {"train_loss": -6.970495700836182, "global_step": 167709, "epoch": 3993} {"train_loss": -7.0000457763671875, "global_step": 167710, "epoch": 3993} {"train_loss": -7.019847869873047, "global_step": 167711, "epoch": 3993} {"train_loss": -7.097916603088379, "global_step": 167712, "epoch": 3993} {"train_loss": -6.967123985290527, "global_step": 167713, "epoch": 3993} {"train_loss": -7.036484718322754, "global_step": 167714, "epoch": 3993} {"train_loss": -7.049851417541504, "global_step": 167715, "epoch": 3993} {"train_loss": -6.951289176940918, "global_step": 167716, "epoch": 3993} {"train_loss": -7.0158233642578125, "global_step": 167717, "epoch": 3993} {"train_loss": -6.952620029449463, "global_step": 167718, "epoch": 3993} {"train_loss": -6.932432174682617, "global_step": 167719, "epoch": 3993} {"train_loss": -6.896050453186035, "global_step": 167720, "epoch": 3993} {"train_loss": -7.100595474243164, "global_step": 167721, "epoch": 3993} {"train_loss": -7.0439300537109375, "global_step": 167722, "epoch": 3993} {"train_loss": -6.940562725067139, "global_step": 167723, "epoch": 3993} {"train_loss": -7.003494739532471, "global_step": 167724, "epoch": 3993} {"train_loss": -7.011879920959473, "global_step": 167725, "epoch": 3993} {"train_loss": -7.0187530517578125, "global_step": 167726, "epoch": 3993} {"train_loss": -6.969057083129883, "global_step": 167727, "epoch": 3993} {"train_loss": -7.008860111236572, "global_step": 167728, "epoch": 3993} {"train_loss": -6.943009376525879, "global_step": 167729, "epoch": 3993} {"train_loss": -6.8964409828186035, "global_step": 167730, "epoch": 3993} {"train_loss": -6.921210289001465, "global_step": 167731, "epoch": 3993} {"train_loss": -6.90312385559082, "global_step": 167732, "epoch": 3993} {"train_loss": -6.947930335998535, "global_step": 167733, "epoch": 3993} {"train_loss": -6.926889419555664, "global_step": 167734, "epoch": 3993} {"train_loss": -7.09609842300415, "global_step": 167735, "epoch": 3993} {"train_loss": -7.033740997314453, "global_step": 167736, "epoch": 3993} {"train_loss": -6.824151992797852, "global_step": 167737, "epoch": 3993} {"train_loss": -6.944282054901123, "global_step": 167738, "epoch": 3993} {"train_loss": -6.936598300933838, "global_step": 167739, "epoch": 3993} {"train_loss": -6.874266624450684, "global_step": 167740, "epoch": 3993} {"train_loss": -6.833775043487549, "global_step": 167741, "epoch": 3993} {"train_loss": -6.981538772583008, "global_step": 167742, "epoch": 3993} {"train_loss": -6.8820600509643555, "global_step": 167743, "epoch": 3993} {"train_loss": -6.926887512207031, "global_step": 167744, "epoch": 3993} {"train_loss": -6.86641263961792, "global_step": 167745, "epoch": 3993} {"train_loss": -6.869260787963867, "global_step": 167746, "epoch": 3993} {"train_loss": -6.962283157166981, "global_step": 167747, "epoch": 3993, "val_loss": 68573.53125} {"train_loss": -6.866694927215576, "global_step": 167748, "epoch": 3994} {"train_loss": -6.997262477874756, "global_step": 167749, "epoch": 3994} {"train_loss": -6.985494136810303, "global_step": 167750, "epoch": 3994} {"train_loss": -6.94547176361084, "global_step": 167751, "epoch": 3994} {"train_loss": -6.997447967529297, "global_step": 167752, "epoch": 3994} {"train_loss": -6.811847686767578, "global_step": 167753, "epoch": 3994} {"train_loss": -6.903387546539307, "global_step": 167754, "epoch": 3994} {"train_loss": -6.908477783203125, "global_step": 167755, "epoch": 3994} {"train_loss": -6.942766189575195, "global_step": 167756, "epoch": 3994} {"train_loss": -6.885208606719971, "global_step": 167757, "epoch": 3994} {"train_loss": -6.969542980194092, "global_step": 167758, "epoch": 3994} {"train_loss": -7.017083168029785, "global_step": 167759, "epoch": 3994} {"train_loss": -6.948310375213623, "global_step": 167760, "epoch": 3994} {"train_loss": -6.995874881744385, "global_step": 167761, "epoch": 3994} {"train_loss": -6.899603366851807, "global_step": 167762, "epoch": 3994} {"train_loss": -7.048959732055664, "global_step": 167763, "epoch": 3994} {"train_loss": -6.9530348777771, "global_step": 167764, "epoch": 3994} {"train_loss": -7.081727981567383, "global_step": 167765, "epoch": 3994} {"train_loss": -6.976699352264404, "global_step": 167766, "epoch": 3994} {"train_loss": -6.888427734375, "global_step": 167767, "epoch": 3994} {"train_loss": -6.999490261077881, "global_step": 167768, "epoch": 3994} {"train_loss": -6.9867963790893555, "global_step": 167769, "epoch": 3994} {"train_loss": -6.9479475021362305, "global_step": 167770, "epoch": 3994} {"train_loss": -7.045169353485107, "global_step": 167771, "epoch": 3994} {"train_loss": -6.942389965057373, "global_step": 167772, "epoch": 3994} {"train_loss": -6.891024589538574, "global_step": 167773, "epoch": 3994} {"train_loss": -7.010156631469727, "global_step": 167774, "epoch": 3994} {"train_loss": -6.9123334884643555, "global_step": 167775, "epoch": 3994} {"train_loss": -6.837693214416504, "global_step": 167776, "epoch": 3994} {"train_loss": -7.010776996612549, "global_step": 167777, "epoch": 3994} {"train_loss": -7.065676689147949, "global_step": 167778, "epoch": 3994} {"train_loss": -6.976651668548584, "global_step": 167779, "epoch": 3994} {"train_loss": -7.020920276641846, "global_step": 167780, "epoch": 3994} {"train_loss": -7.025190353393555, "global_step": 167781, "epoch": 3994} {"train_loss": -6.842864990234375, "global_step": 167782, "epoch": 3994} {"train_loss": -6.96809196472168, "global_step": 167783, "epoch": 3994} {"train_loss": -6.823479175567627, "global_step": 167784, "epoch": 3994} {"train_loss": -6.864221572875977, "global_step": 167785, "epoch": 3994} {"train_loss": -7.054780006408691, "global_step": 167786, "epoch": 3994} {"train_loss": -6.7914628982543945, "global_step": 167787, "epoch": 3994} {"train_loss": -6.890550136566162, "global_step": 167788, "epoch": 3994} {"train_loss": -6.948900461196899, "global_step": 167789, "epoch": 3994, "val_loss": 68810.7734375} {"train_loss": -6.799748420715332, "global_step": 167790, "epoch": 3995} {"train_loss": -6.828019618988037, "global_step": 167791, "epoch": 3995} {"train_loss": -6.864754676818848, "global_step": 167792, "epoch": 3995} {"train_loss": -6.925045013427734, "global_step": 167793, "epoch": 3995} {"train_loss": -6.975378036499023, "global_step": 167794, "epoch": 3995} {"train_loss": -6.774980545043945, "global_step": 167795, "epoch": 3995} {"train_loss": -6.984635353088379, "global_step": 167796, "epoch": 3995} {"train_loss": -6.996539115905762, "global_step": 167797, "epoch": 3995} {"train_loss": -6.973470211029053, "global_step": 167798, "epoch": 3995} {"train_loss": -6.752924919128418, "global_step": 167799, "epoch": 3995} {"train_loss": -6.843339443206787, "global_step": 167800, "epoch": 3995} {"train_loss": -6.823204040527344, "global_step": 167801, "epoch": 3995} {"train_loss": -6.949817657470703, "global_step": 167802, "epoch": 3995} {"train_loss": -6.914279937744141, "global_step": 167803, "epoch": 3995} {"train_loss": -7.018966197967529, "global_step": 167804, "epoch": 3995} {"train_loss": -6.915846824645996, "global_step": 167805, "epoch": 3995} {"train_loss": -6.9242353439331055, "global_step": 167806, "epoch": 3995} {"train_loss": -6.9792070388793945, "global_step": 167807, "epoch": 3995} {"train_loss": -6.97091007232666, "global_step": 167808, "epoch": 3995} {"train_loss": -6.922663688659668, "global_step": 167809, "epoch": 3995} {"train_loss": -6.904993534088135, "global_step": 167810, "epoch": 3995} {"train_loss": -6.964484691619873, "global_step": 167811, "epoch": 3995} {"train_loss": -6.925443649291992, "global_step": 167812, "epoch": 3995} {"train_loss": -6.9145002365112305, "global_step": 167813, "epoch": 3995} {"train_loss": -7.04500150680542, "global_step": 167814, "epoch": 3995} {"train_loss": -6.931253433227539, "global_step": 167815, "epoch": 3995} {"train_loss": -6.966165542602539, "global_step": 167816, "epoch": 3995} {"train_loss": -6.862773895263672, "global_step": 167817, "epoch": 3995} {"train_loss": -7.006270408630371, "global_step": 167818, "epoch": 3995} {"train_loss": -7.06236457824707, "global_step": 167819, "epoch": 3995} {"train_loss": -6.881659507751465, "global_step": 167820, "epoch": 3995} {"train_loss": -6.954082489013672, "global_step": 167821, "epoch": 3995} {"train_loss": -6.928562164306641, "global_step": 167822, "epoch": 3995} {"train_loss": -7.038223743438721, "global_step": 167823, "epoch": 3995} {"train_loss": -6.950495719909668, "global_step": 167824, "epoch": 3995} {"train_loss": -6.8996968269348145, "global_step": 167825, "epoch": 3995} {"train_loss": -6.9756293296813965, "global_step": 167826, "epoch": 3995} {"train_loss": -7.064092636108398, "global_step": 167827, "epoch": 3995} {"train_loss": -6.9741010665893555, "global_step": 167828, "epoch": 3995} {"train_loss": -7.030996322631836, "global_step": 167829, "epoch": 3995} {"train_loss": -7.151005744934082, "global_step": 167830, "epoch": 3995} {"train_loss": -6.940310614449637, "global_step": 167831, "epoch": 3995, "val_loss": 68663.3671875} {"train_loss": -7.082671642303467, "global_step": 167832, "epoch": 3996} {"train_loss": -7.029036045074463, "global_step": 167833, "epoch": 3996} {"train_loss": -7.0482587814331055, "global_step": 167834, "epoch": 3996} {"train_loss": -6.985211372375488, "global_step": 167835, "epoch": 3996} {"train_loss": -6.962543964385986, "global_step": 167836, "epoch": 3996} {"train_loss": -6.982302665710449, "global_step": 167837, "epoch": 3996} {"train_loss": -7.031983375549316, "global_step": 167838, "epoch": 3996} {"train_loss": -7.003302097320557, "global_step": 167839, "epoch": 3996} {"train_loss": -6.95965576171875, "global_step": 167840, "epoch": 3996} {"train_loss": -7.04494571685791, "global_step": 167841, "epoch": 3996} {"train_loss": -7.02726936340332, "global_step": 167842, "epoch": 3996} {"train_loss": -6.959941864013672, "global_step": 167843, "epoch": 3996} {"train_loss": -7.012970924377441, "global_step": 167844, "epoch": 3996} {"train_loss": -7.029040336608887, "global_step": 167845, "epoch": 3996} {"train_loss": -6.968156337738037, "global_step": 167846, "epoch": 3996} {"train_loss": -7.0137529373168945, "global_step": 167847, "epoch": 3996} {"train_loss": -7.029043197631836, "global_step": 167848, "epoch": 3996} {"train_loss": -7.033598899841309, "global_step": 167849, "epoch": 3996} {"train_loss": -6.996705055236816, "global_step": 167850, "epoch": 3996} {"train_loss": -6.969721794128418, "global_step": 167851, "epoch": 3996} {"train_loss": -7.0577497482299805, "global_step": 167852, "epoch": 3996} {"train_loss": -6.990129470825195, "global_step": 167853, "epoch": 3996} {"train_loss": -7.049727439880371, "global_step": 167854, "epoch": 3996} {"train_loss": -7.0918731689453125, "global_step": 167855, "epoch": 3996} {"train_loss": -7.094494819641113, "global_step": 167856, "epoch": 3996} {"train_loss": -7.031380653381348, "global_step": 167857, "epoch": 3996} {"train_loss": -6.98868465423584, "global_step": 167858, "epoch": 3996} {"train_loss": -7.061620712280273, "global_step": 167859, "epoch": 3996} {"train_loss": -7.056704044342041, "global_step": 167860, "epoch": 3996} {"train_loss": -6.897653579711914, "global_step": 167861, "epoch": 3996} {"train_loss": -6.871291160583496, "global_step": 167862, "epoch": 3996} {"train_loss": -7.017967224121094, "global_step": 167863, "epoch": 3996} {"train_loss": -7.002440452575684, "global_step": 167864, "epoch": 3996} {"train_loss": -6.910163402557373, "global_step": 167865, "epoch": 3996} {"train_loss": -6.8789777755737305, "global_step": 167866, "epoch": 3996} {"train_loss": -7.023423671722412, "global_step": 167867, "epoch": 3996} {"train_loss": -6.976649284362793, "global_step": 167868, "epoch": 3996} {"train_loss": -7.016280174255371, "global_step": 167869, "epoch": 3996} {"train_loss": -6.855457305908203, "global_step": 167870, "epoch": 3996} {"train_loss": -6.992470741271973, "global_step": 167871, "epoch": 3996} {"train_loss": -6.957515716552734, "global_step": 167872, "epoch": 3996} {"train_loss": -7.003201303027925, "global_step": 167873, "epoch": 3996, "val_loss": 68571.671875} {"train_loss": -6.913871765136719, "global_step": 167874, "epoch": 3997} {"train_loss": -6.966512680053711, "global_step": 167875, "epoch": 3997} {"train_loss": -6.910008430480957, "global_step": 167876, "epoch": 3997} {"train_loss": -6.8661603927612305, "global_step": 167877, "epoch": 3997} {"train_loss": -6.9176530838012695, "global_step": 167878, "epoch": 3997} {"train_loss": -7.05670690536499, "global_step": 167879, "epoch": 3997} {"train_loss": -6.9676971435546875, "global_step": 167880, "epoch": 3997} {"train_loss": -6.9768781661987305, "global_step": 167881, "epoch": 3997} {"train_loss": -6.995941162109375, "global_step": 167882, "epoch": 3997} {"train_loss": -6.931982040405273, "global_step": 167883, "epoch": 3997} {"train_loss": -6.982081413269043, "global_step": 167884, "epoch": 3997} {"train_loss": -6.926389694213867, "global_step": 167885, "epoch": 3997} {"train_loss": -6.866969108581543, "global_step": 167886, "epoch": 3997} {"train_loss": -7.0528154373168945, "global_step": 167887, "epoch": 3997} {"train_loss": -6.787388801574707, "global_step": 167888, "epoch": 3997} {"train_loss": -6.842837333679199, "global_step": 167889, "epoch": 3997} {"train_loss": -6.987298965454102, "global_step": 167890, "epoch": 3997} {"train_loss": -6.959546089172363, "global_step": 167891, "epoch": 3997} {"train_loss": -6.982507705688477, "global_step": 167892, "epoch": 3997} {"train_loss": -6.932860374450684, "global_step": 167893, "epoch": 3997} {"train_loss": -7.001306056976318, "global_step": 167894, "epoch": 3997} {"train_loss": -7.070009231567383, "global_step": 167895, "epoch": 3997} {"train_loss": -7.006660461425781, "global_step": 167896, "epoch": 3997} {"train_loss": -6.871038436889648, "global_step": 167897, "epoch": 3997} {"train_loss": -6.986879348754883, "global_step": 167898, "epoch": 3997} {"train_loss": -6.9184064865112305, "global_step": 167899, "epoch": 3997} {"train_loss": -6.773990154266357, "global_step": 167900, "epoch": 3997} {"train_loss": -6.986274719238281, "global_step": 167901, "epoch": 3997} {"train_loss": -6.750865936279297, "global_step": 167902, "epoch": 3997} {"train_loss": -6.892448902130127, "global_step": 167903, "epoch": 3997} {"train_loss": -6.91472864151001, "global_step": 167904, "epoch": 3997} {"train_loss": -6.9126434326171875, "global_step": 167905, "epoch": 3997} {"train_loss": -6.819513320922852, "global_step": 167906, "epoch": 3997} {"train_loss": -6.799806118011475, "global_step": 167907, "epoch": 3997} {"train_loss": -6.867857933044434, "global_step": 167908, "epoch": 3997} {"train_loss": -6.754376411437988, "global_step": 167909, "epoch": 3997} {"train_loss": -6.832783222198486, "global_step": 167910, "epoch": 3997} {"train_loss": -6.869237899780273, "global_step": 167911, "epoch": 3997} {"train_loss": -6.773191928863525, "global_step": 167912, "epoch": 3997} {"train_loss": -6.900568962097168, "global_step": 167913, "epoch": 3997} {"train_loss": -6.892322540283203, "global_step": 167914, "epoch": 3997} {"train_loss": -6.912432772772653, "global_step": 167915, "epoch": 3997, "val_loss": 68590.8515625} {"train_loss": -6.919586181640625, "global_step": 167916, "epoch": 3998} {"train_loss": -6.855545997619629, "global_step": 167917, "epoch": 3998} {"train_loss": -6.884079933166504, "global_step": 167918, "epoch": 3998} {"train_loss": -6.882617950439453, "global_step": 167919, "epoch": 3998} {"train_loss": -6.986534118652344, "global_step": 167920, "epoch": 3998} {"train_loss": -6.940387725830078, "global_step": 167921, "epoch": 3998} {"train_loss": -6.946455001831055, "global_step": 167922, "epoch": 3998} {"train_loss": -7.0826263427734375, "global_step": 167923, "epoch": 3998} {"train_loss": -6.994223594665527, "global_step": 167924, "epoch": 3998} {"train_loss": -7.029741287231445, "global_step": 167925, "epoch": 3998} {"train_loss": -6.877150535583496, "global_step": 167926, "epoch": 3998} {"train_loss": -7.064873695373535, "global_step": 167927, "epoch": 3998} {"train_loss": -6.972170829772949, "global_step": 167928, "epoch": 3998} {"train_loss": -7.073363780975342, "global_step": 167929, "epoch": 3998} {"train_loss": -6.930981159210205, "global_step": 167930, "epoch": 3998} {"train_loss": -6.991141319274902, "global_step": 167931, "epoch": 3998} {"train_loss": -7.073833465576172, "global_step": 167932, "epoch": 3998} {"train_loss": -6.945934295654297, "global_step": 167933, "epoch": 3998} {"train_loss": -7.0721540451049805, "global_step": 167934, "epoch": 3998} {"train_loss": -6.998496055603027, "global_step": 167935, "epoch": 3998} {"train_loss": -7.037904262542725, "global_step": 167936, "epoch": 3998} {"train_loss": -7.033304214477539, "global_step": 167937, "epoch": 3998} {"train_loss": -7.079187393188477, "global_step": 167938, "epoch": 3998} {"train_loss": -7.007101058959961, "global_step": 167939, "epoch": 3998} {"train_loss": -7.054044723510742, "global_step": 167940, "epoch": 3998} {"train_loss": -6.964885711669922, "global_step": 167941, "epoch": 3998} {"train_loss": -7.087222099304199, "global_step": 167942, "epoch": 3998} {"train_loss": -7.094334125518799, "global_step": 167943, "epoch": 3998} {"train_loss": -6.977349281311035, "global_step": 167944, "epoch": 3998} {"train_loss": -6.923271179199219, "global_step": 167945, "epoch": 3998} {"train_loss": -7.005817890167236, "global_step": 167946, "epoch": 3998} {"train_loss": -7.059659957885742, "global_step": 167947, "epoch": 3998} {"train_loss": -7.042534351348877, "global_step": 167948, "epoch": 3998} {"train_loss": -7.025620460510254, "global_step": 167949, "epoch": 3998} {"train_loss": -7.070146560668945, "global_step": 167950, "epoch": 3998} {"train_loss": -7.042670726776123, "global_step": 167951, "epoch": 3998} {"train_loss": -7.042557239532471, "global_step": 167952, "epoch": 3998} {"train_loss": -7.00459098815918, "global_step": 167953, "epoch": 3998} {"train_loss": -7.134820461273193, "global_step": 167954, "epoch": 3998} {"train_loss": -7.037146091461182, "global_step": 167955, "epoch": 3998} {"train_loss": -6.957144260406494, "global_step": 167956, "epoch": 3998} {"train_loss": -7.006617750440325, "global_step": 167957, "epoch": 3998, "val_loss": 68466.828125} {"train_loss": -7.020204544067383, "global_step": 167958, "epoch": 3999} {"train_loss": -6.957910060882568, "global_step": 167959, "epoch": 3999} {"train_loss": -6.992462158203125, "global_step": 167960, "epoch": 3999} {"train_loss": -7.077468395233154, "global_step": 167961, "epoch": 3999} {"train_loss": -6.858672618865967, "global_step": 167962, "epoch": 3999} {"train_loss": -6.924832344055176, "global_step": 167963, "epoch": 3999} {"train_loss": -6.952889442443848, "global_step": 167964, "epoch": 3999} {"train_loss": -6.933072090148926, "global_step": 167965, "epoch": 3999} {"train_loss": -7.061904430389404, "global_step": 167966, "epoch": 3999} {"train_loss": -6.973897933959961, "global_step": 167967, "epoch": 3999} {"train_loss": -6.917201995849609, "global_step": 167968, "epoch": 3999} {"train_loss": -7.007228851318359, "global_step": 167969, "epoch": 3999} {"train_loss": -7.018964767456055, "global_step": 167970, "epoch": 3999} {"train_loss": -6.931763648986816, "global_step": 167971, "epoch": 3999} {"train_loss": -6.9810686111450195, "global_step": 167972, "epoch": 3999} {"train_loss": -6.982630252838135, "global_step": 167973, "epoch": 3999} {"train_loss": -6.963131904602051, "global_step": 167974, "epoch": 3999} {"train_loss": -6.948563575744629, "global_step": 167975, "epoch": 3999} {"train_loss": -6.9615678787231445, "global_step": 167976, "epoch": 3999} {"train_loss": -6.927121162414551, "global_step": 167977, "epoch": 3999} {"train_loss": -7.005125999450684, "global_step": 167978, "epoch": 3999} {"train_loss": -6.921869277954102, "global_step": 167979, "epoch": 3999} {"train_loss": -7.000761985778809, "global_step": 167980, "epoch": 3999} {"train_loss": -6.988950729370117, "global_step": 167981, "epoch": 3999} {"train_loss": -6.937003135681152, "global_step": 167982, "epoch": 3999} {"train_loss": -6.7820515632629395, "global_step": 167983, "epoch": 3999} {"train_loss": -7.015917778015137, "global_step": 167984, "epoch": 3999} {"train_loss": -6.881804466247559, "global_step": 167985, "epoch": 3999} {"train_loss": -6.976430892944336, "global_step": 167986, "epoch": 3999} {"train_loss": -7.026473045349121, "global_step": 167987, "epoch": 3999} {"train_loss": -7.067417621612549, "global_step": 167988, "epoch": 3999} {"train_loss": -6.967370986938477, "global_step": 167989, "epoch": 3999} {"train_loss": -6.899103164672852, "global_step": 167990, "epoch": 3999} {"train_loss": -7.086150169372559, "global_step": 167991, "epoch": 3999} {"train_loss": -6.987579345703125, "global_step": 167992, "epoch": 3999} {"train_loss": -7.071767807006836, "global_step": 167993, "epoch": 3999} {"train_loss": -6.9592437744140625, "global_step": 167994, "epoch": 3999} {"train_loss": -6.9040069580078125, "global_step": 167995, "epoch": 3999} {"train_loss": -6.921895980834961, "global_step": 167996, "epoch": 3999} {"train_loss": -6.9197611808776855, "global_step": 167997, "epoch": 3999} {"train_loss": -7.0096635818481445, "global_step": 167998, "epoch": 3999} {"train_loss": -6.965404022307623, "global_step": 167999, "epoch": 3999, "val_loss": 68389.4453125} {"train_loss": -6.975114822387695, "global_step": 168000, "epoch": 4000} {"train_loss": -7.058966159820557, "global_step": 168001, "epoch": 4000} {"train_loss": -6.94127082824707, "global_step": 168002, "epoch": 4000} {"train_loss": -6.981600761413574, "global_step": 168003, "epoch": 4000} {"train_loss": -6.960064888000488, "global_step": 168004, "epoch": 4000} {"train_loss": -7.031223297119141, "global_step": 168005, "epoch": 4000} {"train_loss": -6.9143452644348145, "global_step": 168006, "epoch": 4000} {"train_loss": -7.035085678100586, "global_step": 168007, "epoch": 4000} {"train_loss": -6.9615936279296875, "global_step": 168008, "epoch": 4000} {"train_loss": -7.059316158294678, "global_step": 168009, "epoch": 4000} {"train_loss": -7.091597080230713, "global_step": 168010, "epoch": 4000} {"train_loss": -6.983139991760254, "global_step": 168011, "epoch": 4000} {"train_loss": -6.993376731872559, "global_step": 168012, "epoch": 4000} {"train_loss": -6.9989471435546875, "global_step": 168013, "epoch": 4000} {"train_loss": -6.91874361038208, "global_step": 168014, "epoch": 4000} {"train_loss": -6.934401988983154, "global_step": 168015, "epoch": 4000} {"train_loss": -6.912242412567139, "global_step": 168016, "epoch": 4000} {"train_loss": -6.847062110900879, "global_step": 168017, "epoch": 4000} {"train_loss": -6.92278528213501, "global_step": 168018, "epoch": 4000} {"train_loss": -6.8654632568359375, "global_step": 168019, "epoch": 4000} {"train_loss": -6.9735212326049805, "global_step": 168020, "epoch": 4000} {"train_loss": -6.947601318359375, "global_step": 168021, "epoch": 4000} {"train_loss": -6.646553039550781, "global_step": 168022, "epoch": 4000} {"train_loss": -6.9131317138671875, "global_step": 168023, "epoch": 4000} {"train_loss": -6.934222221374512, "global_step": 168024, "epoch": 4000} {"train_loss": -6.709969520568848, "global_step": 168025, "epoch": 4000} {"train_loss": -6.899506568908691, "global_step": 168026, "epoch": 4000} {"train_loss": -6.604809761047363, "global_step": 168027, "epoch": 4000} {"train_loss": -6.830098628997803, "global_step": 168028, "epoch": 4000} {"train_loss": -6.792661666870117, "global_step": 168029, "epoch": 4000} {"train_loss": -6.660754203796387, "global_step": 168030, "epoch": 4000} {"train_loss": -6.805284023284912, "global_step": 168031, "epoch": 4000} {"train_loss": -6.789772033691406, "global_step": 168032, "epoch": 4000} {"train_loss": -6.980670928955078, "global_step": 168033, "epoch": 4000} {"train_loss": -6.839570045471191, "global_step": 168034, "epoch": 4000} {"train_loss": -6.858545780181885, "global_step": 168035, "epoch": 4000} {"train_loss": -6.865561008453369, "global_step": 168036, "epoch": 4000} {"train_loss": -6.823524475097656, "global_step": 168037, "epoch": 4000} {"train_loss": -6.867797374725342, "global_step": 168038, "epoch": 4000} {"train_loss": -6.840536594390869, "global_step": 168039, "epoch": 4000} {"train_loss": -6.877874374389648, "global_step": 168040, "epoch": 4000} {"train_loss": -6.900665181023734, "global_step": 168041, "epoch": 4000, "train/sim_max_reward_0": 0.26861135830945143, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.5811714427101285, "train/sim_max_reward_3": 0.11614640656721789, "train/sim_max_reward_4": 0.8412587335051472, "train/sim_max_reward_5": 0.9832691973994225, "test/sim_max_reward_4400000": 0.9393570339107207, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.05990749945319828, "test/sim_max_reward_4400003": 0.6473125777939847, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9284875657198218, "test/sim_max_reward_4400006": 0.9607228672406137, "test/sim_max_reward_4400007": 0.9207766177911035, "test/sim_max_reward_4400008": 0.2975066542371646, "test/sim_max_reward_4400009": 0.918847322124367, "test/sim_max_reward_4400010": 0.26117655128929657, "test/sim_max_reward_4400011": 0.2745045856892323, "test/sim_max_reward_4400012": 0.9733497302447731, "test/sim_max_reward_4400013": 0.9726847778748036, "test/sim_max_reward_4400014": 0.3208724958195586, "test/sim_max_reward_4400015": 0.038116638784886706, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2326418107789415, "test/sim_max_reward_4400019": 0.9790972305559121, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9244182600519488, "test/sim_max_reward_4400023": 0.035124291605656395, "test/sim_max_reward_4400024": 0.9837565534593192, "test/sim_max_reward_4400025": 0.26532848974949574, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.03592728212547191, "test/sim_max_reward_4400028": 0.8795416698114257, "test/sim_max_reward_4400029": 0.548435742620463, "test/sim_max_reward_4400030": 0.9966294152547002, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9745729416586112, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.7148761545286898, "test/sim_max_reward_4400036": 0.659839151176619, "test/sim_max_reward_4400037": 0.9636826787254102, "test/sim_max_reward_4400038": 0.9931054903118683, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9860395094982854, "test/sim_max_reward_4400042": 0.907547175050021, "test/sim_max_reward_4400043": 0.9615625503799912, "test/sim_max_reward_4400044": 0.8950635389523816, "test/sim_max_reward_4400045": 0.901940510380873, "test/sim_max_reward_4400046": 0.42171551416914604, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.8660675339435052, "test/sim_max_reward_4400049": 0.9082556973558366, "train/mean_score": 0.631742856415228, "test/mean_score": 0.6204404388098399, "val_loss": 68529.7421875} {"train_loss": -6.936349868774414, "global_step": 168042, "epoch": 4001} {"train_loss": -6.984724998474121, "global_step": 168043, "epoch": 4001} {"train_loss": -6.86669921875, "global_step": 168044, "epoch": 4001} {"train_loss": -7.012018203735352, "global_step": 168045, "epoch": 4001} {"train_loss": -6.964024543762207, "global_step": 168046, "epoch": 4001} {"train_loss": -6.958227157592773, "global_step": 168047, "epoch": 4001} {"train_loss": -6.998513698577881, "global_step": 168048, "epoch": 4001} {"train_loss": -6.873867988586426, "global_step": 168049, "epoch": 4001} {"train_loss": -6.871171474456787, "global_step": 168050, "epoch": 4001} {"train_loss": -6.790042400360107, "global_step": 168051, "epoch": 4001} {"train_loss": -7.029745101928711, "global_step": 168052, "epoch": 4001} {"train_loss": -6.941363334655762, "global_step": 168053, "epoch": 4001} {"train_loss": -7.032376766204834, "global_step": 168054, "epoch": 4001} {"train_loss": -7.019705295562744, "global_step": 168055, "epoch": 4001} {"train_loss": -7.013650417327881, "global_step": 168056, "epoch": 4001} {"train_loss": -7.060257911682129, "global_step": 168057, "epoch": 4001} {"train_loss": -7.019327163696289, "global_step": 168058, "epoch": 4001} {"train_loss": -6.969716548919678, "global_step": 168059, "epoch": 4001} {"train_loss": -6.945643424987793, "global_step": 168060, "epoch": 4001} {"train_loss": -6.927835464477539, "global_step": 168061, "epoch": 4001} {"train_loss": -6.947142601013184, "global_step": 168062, "epoch": 4001} {"train_loss": -7.00698709487915, "global_step": 168063, "epoch": 4001} {"train_loss": -6.951724529266357, "global_step": 168064, "epoch": 4001} {"train_loss": -6.9425153732299805, "global_step": 168065, "epoch": 4001} {"train_loss": -7.115261077880859, "global_step": 168066, "epoch": 4001} {"train_loss": -6.989256381988525, "global_step": 168067, "epoch": 4001} {"train_loss": -6.902041912078857, "global_step": 168068, "epoch": 4001} {"train_loss": -6.9960432052612305, "global_step": 168069, "epoch": 4001} {"train_loss": -7.09836483001709, "global_step": 168070, "epoch": 4001} {"train_loss": -6.999085426330566, "global_step": 168071, "epoch": 4001} {"train_loss": -6.999869346618652, "global_step": 168072, "epoch": 4001} {"train_loss": -7.120396614074707, "global_step": 168073, "epoch": 4001} {"train_loss": -7.05289363861084, "global_step": 168074, "epoch": 4001} {"train_loss": -6.963634967803955, "global_step": 168075, "epoch": 4001} {"train_loss": -7.025703430175781, "global_step": 168076, "epoch": 4001} {"train_loss": -7.0331597328186035, "global_step": 168077, "epoch": 4001} {"train_loss": -6.942865371704102, "global_step": 168078, "epoch": 4001} {"train_loss": -6.941544532775879, "global_step": 168079, "epoch": 4001} {"train_loss": -7.05954647064209, "global_step": 168080, "epoch": 4001} {"train_loss": -6.967105865478516, "global_step": 168081, "epoch": 4001} {"train_loss": -7.031691551208496, "global_step": 168082, "epoch": 4001} {"train_loss": -6.984680357433501, "global_step": 168083, "epoch": 4001, "val_loss": 68414.828125} {"train_loss": -7.0790486335754395, "global_step": 168084, "epoch": 4002} {"train_loss": -6.864539623260498, "global_step": 168085, "epoch": 4002} {"train_loss": -7.088370323181152, "global_step": 168086, "epoch": 4002} {"train_loss": -7.026291847229004, "global_step": 168087, "epoch": 4002} {"train_loss": -7.022233486175537, "global_step": 168088, "epoch": 4002} {"train_loss": -6.955269813537598, "global_step": 168089, "epoch": 4002} {"train_loss": -6.778662204742432, "global_step": 168090, "epoch": 4002} {"train_loss": -6.89698600769043, "global_step": 168091, "epoch": 4002} {"train_loss": -6.86107873916626, "global_step": 168092, "epoch": 4002} {"train_loss": -6.842347145080566, "global_step": 168093, "epoch": 4002} {"train_loss": -6.921331405639648, "global_step": 168094, "epoch": 4002} {"train_loss": -6.76921272277832, "global_step": 168095, "epoch": 4002} {"train_loss": -6.75250244140625, "global_step": 168096, "epoch": 4002} {"train_loss": -6.810455799102783, "global_step": 168097, "epoch": 4002} {"train_loss": -6.830244541168213, "global_step": 168098, "epoch": 4002} {"train_loss": -6.911113739013672, "global_step": 168099, "epoch": 4002} {"train_loss": -6.860124111175537, "global_step": 168100, "epoch": 4002} {"train_loss": -6.883144855499268, "global_step": 168101, "epoch": 4002} {"train_loss": -6.90988302230835, "global_step": 168102, "epoch": 4002} {"train_loss": -6.946241855621338, "global_step": 168103, "epoch": 4002} {"train_loss": -6.913370132446289, "global_step": 168104, "epoch": 4002} {"train_loss": -6.8930206298828125, "global_step": 168105, "epoch": 4002} {"train_loss": -6.910947322845459, "global_step": 168106, "epoch": 4002} {"train_loss": -6.907869338989258, "global_step": 168107, "epoch": 4002} {"train_loss": -6.884243011474609, "global_step": 168108, "epoch": 4002} {"train_loss": -6.820795059204102, "global_step": 168109, "epoch": 4002} {"train_loss": -6.953770637512207, "global_step": 168110, "epoch": 4002} {"train_loss": -6.993393898010254, "global_step": 168111, "epoch": 4002} {"train_loss": -6.838648796081543, "global_step": 168112, "epoch": 4002} {"train_loss": -6.83181095123291, "global_step": 168113, "epoch": 4002} {"train_loss": -6.975790500640869, "global_step": 168114, "epoch": 4002} {"train_loss": -7.063000679016113, "global_step": 168115, "epoch": 4002} {"train_loss": -6.900046348571777, "global_step": 168116, "epoch": 4002} {"train_loss": -6.968649387359619, "global_step": 168117, "epoch": 4002} {"train_loss": -6.7998175621032715, "global_step": 168118, "epoch": 4002} {"train_loss": -6.960724353790283, "global_step": 168119, "epoch": 4002} {"train_loss": -6.976713180541992, "global_step": 168120, "epoch": 4002} {"train_loss": -6.9628143310546875, "global_step": 168121, "epoch": 4002} {"train_loss": -7.015292167663574, "global_step": 168122, "epoch": 4002} {"train_loss": -6.9264326095581055, "global_step": 168123, "epoch": 4002} {"train_loss": -7.055068016052246, "global_step": 168124, "epoch": 4002} {"train_loss": -6.918325617199852, "global_step": 168125, "epoch": 4002, "val_loss": 68648.96875} {"train_loss": -7.0700483322143555, "global_step": 168126, "epoch": 4003} {"train_loss": -6.934294700622559, "global_step": 168127, "epoch": 4003} {"train_loss": -6.920174598693848, "global_step": 168128, "epoch": 4003} {"train_loss": -6.958240985870361, "global_step": 168129, "epoch": 4003} {"train_loss": -6.915071964263916, "global_step": 168130, "epoch": 4003} {"train_loss": -7.032159805297852, "global_step": 168131, "epoch": 4003} {"train_loss": -6.969390869140625, "global_step": 168132, "epoch": 4003} {"train_loss": -6.962703227996826, "global_step": 168133, "epoch": 4003} {"train_loss": -7.010319709777832, "global_step": 168134, "epoch": 4003} {"train_loss": -6.894789695739746, "global_step": 168135, "epoch": 4003} {"train_loss": -6.933027267456055, "global_step": 168136, "epoch": 4003} {"train_loss": -7.002412796020508, "global_step": 168137, "epoch": 4003} {"train_loss": -6.958525657653809, "global_step": 168138, "epoch": 4003} {"train_loss": -6.929186820983887, "global_step": 168139, "epoch": 4003} {"train_loss": -6.920124530792236, "global_step": 168140, "epoch": 4003} {"train_loss": -6.963134765625, "global_step": 168141, "epoch": 4003} {"train_loss": -7.013401985168457, "global_step": 168142, "epoch": 4003} {"train_loss": -7.011317253112793, "global_step": 168143, "epoch": 4003} {"train_loss": -6.892788887023926, "global_step": 168144, "epoch": 4003} {"train_loss": -6.932178497314453, "global_step": 168145, "epoch": 4003} {"train_loss": -7.057634353637695, "global_step": 168146, "epoch": 4003} {"train_loss": -6.991146564483643, "global_step": 168147, "epoch": 4003} {"train_loss": -6.865725517272949, "global_step": 168148, "epoch": 4003} {"train_loss": -6.9857988357543945, "global_step": 168149, "epoch": 4003} {"train_loss": -6.936100959777832, "global_step": 168150, "epoch": 4003} {"train_loss": -6.8939642906188965, "global_step": 168151, "epoch": 4003} {"train_loss": -6.924505233764648, "global_step": 168152, "epoch": 4003} {"train_loss": -6.9861345291137695, "global_step": 168153, "epoch": 4003} {"train_loss": -6.8856401443481445, "global_step": 168154, "epoch": 4003} {"train_loss": -6.983867645263672, "global_step": 168155, "epoch": 4003} {"train_loss": -6.999152183532715, "global_step": 168156, "epoch": 4003} {"train_loss": -7.069095611572266, "global_step": 168157, "epoch": 4003} {"train_loss": -7.005740165710449, "global_step": 168158, "epoch": 4003} {"train_loss": -6.955843925476074, "global_step": 168159, "epoch": 4003} {"train_loss": -6.944809913635254, "global_step": 168160, "epoch": 4003} {"train_loss": -6.987695217132568, "global_step": 168161, "epoch": 4003} {"train_loss": -6.963170051574707, "global_step": 168162, "epoch": 4003} {"train_loss": -6.916735649108887, "global_step": 168163, "epoch": 4003} {"train_loss": -6.898119926452637, "global_step": 168164, "epoch": 4003} {"train_loss": -6.988402366638184, "global_step": 168165, "epoch": 4003} {"train_loss": -6.826653480529785, "global_step": 168166, "epoch": 4003} {"train_loss": -6.9569892429170155, "global_step": 168167, "epoch": 4003, "val_loss": 68537.390625} {"train_loss": -6.92447566986084, "global_step": 168168, "epoch": 4004} {"train_loss": -6.911402702331543, "global_step": 168169, "epoch": 4004} {"train_loss": -6.988365650177002, "global_step": 168170, "epoch": 4004} {"train_loss": -7.0043439865112305, "global_step": 168171, "epoch": 4004} {"train_loss": -6.802016735076904, "global_step": 168172, "epoch": 4004} {"train_loss": -6.963255405426025, "global_step": 168173, "epoch": 4004} {"train_loss": -6.759418487548828, "global_step": 168174, "epoch": 4004} {"train_loss": -6.937725067138672, "global_step": 168175, "epoch": 4004} {"train_loss": -6.9228081703186035, "global_step": 168176, "epoch": 4004} {"train_loss": -6.721453666687012, "global_step": 168177, "epoch": 4004} {"train_loss": -7.066740036010742, "global_step": 168178, "epoch": 4004} {"train_loss": -6.921107769012451, "global_step": 168179, "epoch": 4004} {"train_loss": -6.861275672912598, "global_step": 168180, "epoch": 4004} {"train_loss": -6.827853202819824, "global_step": 168181, "epoch": 4004} {"train_loss": -6.775834083557129, "global_step": 168182, "epoch": 4004} {"train_loss": -6.762136459350586, "global_step": 168183, "epoch": 4004} {"train_loss": -6.795269966125488, "global_step": 168184, "epoch": 4004} {"train_loss": -6.8758649826049805, "global_step": 168185, "epoch": 4004} {"train_loss": -6.634546279907227, "global_step": 168186, "epoch": 4004} {"train_loss": -6.9122185707092285, "global_step": 168187, "epoch": 4004} {"train_loss": -6.806842803955078, "global_step": 168188, "epoch": 4004} {"train_loss": -6.9021196365356445, "global_step": 168189, "epoch": 4004} {"train_loss": -6.823151588439941, "global_step": 168190, "epoch": 4004} {"train_loss": -6.81439733505249, "global_step": 168191, "epoch": 4004} {"train_loss": -6.800055027008057, "global_step": 168192, "epoch": 4004} {"train_loss": -6.885382652282715, "global_step": 168193, "epoch": 4004} {"train_loss": -6.812901020050049, "global_step": 168194, "epoch": 4004} {"train_loss": -6.7655181884765625, "global_step": 168195, "epoch": 4004} {"train_loss": -6.829684257507324, "global_step": 168196, "epoch": 4004} {"train_loss": -6.873441696166992, "global_step": 168197, "epoch": 4004} {"train_loss": -6.915424346923828, "global_step": 168198, "epoch": 4004} {"train_loss": -7.042999267578125, "global_step": 168199, "epoch": 4004} {"train_loss": -6.964887619018555, "global_step": 168200, "epoch": 4004} {"train_loss": -6.796022415161133, "global_step": 168201, "epoch": 4004} {"train_loss": -6.878732681274414, "global_step": 168202, "epoch": 4004} {"train_loss": -6.834115028381348, "global_step": 168203, "epoch": 4004} {"train_loss": -6.990396499633789, "global_step": 168204, "epoch": 4004} {"train_loss": -6.869834899902344, "global_step": 168205, "epoch": 4004} {"train_loss": -6.970135688781738, "global_step": 168206, "epoch": 4004} {"train_loss": -7.055752754211426, "global_step": 168207, "epoch": 4004} {"train_loss": -6.915035247802734, "global_step": 168208, "epoch": 4004} {"train_loss": -6.877847637448992, "global_step": 168209, "epoch": 4004, "val_loss": 68463.109375} {"train_loss": -6.9287824630737305, "global_step": 168210, "epoch": 4005} {"train_loss": -6.923338890075684, "global_step": 168211, "epoch": 4005} {"train_loss": -6.948996543884277, "global_step": 168212, "epoch": 4005} {"train_loss": -6.929070472717285, "global_step": 168213, "epoch": 4005} {"train_loss": -7.018339157104492, "global_step": 168214, "epoch": 4005} {"train_loss": -7.0694074630737305, "global_step": 168215, "epoch": 4005} {"train_loss": -6.97985315322876, "global_step": 168216, "epoch": 4005} {"train_loss": -7.089211940765381, "global_step": 168217, "epoch": 4005} {"train_loss": -6.898775100708008, "global_step": 168218, "epoch": 4005} {"train_loss": -6.998631477355957, "global_step": 168219, "epoch": 4005} {"train_loss": -7.022482872009277, "global_step": 168220, "epoch": 4005} {"train_loss": -6.950868606567383, "global_step": 168221, "epoch": 4005} {"train_loss": -7.0366411209106445, "global_step": 168222, "epoch": 4005} {"train_loss": -6.963863372802734, "global_step": 168223, "epoch": 4005} {"train_loss": -7.0692644119262695, "global_step": 168224, "epoch": 4005} {"train_loss": -6.976989269256592, "global_step": 168225, "epoch": 4005} {"train_loss": -7.017441272735596, "global_step": 168226, "epoch": 4005} {"train_loss": -6.9572272300720215, "global_step": 168227, "epoch": 4005} {"train_loss": -6.935633659362793, "global_step": 168228, "epoch": 4005} {"train_loss": -7.016711235046387, "global_step": 168229, "epoch": 4005} {"train_loss": -7.11301326751709, "global_step": 168230, "epoch": 4005} {"train_loss": -7.042295932769775, "global_step": 168231, "epoch": 4005} {"train_loss": -7.007687568664551, "global_step": 168232, "epoch": 4005} {"train_loss": -6.999732971191406, "global_step": 168233, "epoch": 4005} {"train_loss": -6.940220832824707, "global_step": 168234, "epoch": 4005} {"train_loss": -6.904505729675293, "global_step": 168235, "epoch": 4005} {"train_loss": -6.9001874923706055, "global_step": 168236, "epoch": 4005} {"train_loss": -7.050422668457031, "global_step": 168237, "epoch": 4005} {"train_loss": -6.972131729125977, "global_step": 168238, "epoch": 4005} {"train_loss": -7.1038498878479, "global_step": 168239, "epoch": 4005} {"train_loss": -7.149296760559082, "global_step": 168240, "epoch": 4005} {"train_loss": -6.85474967956543, "global_step": 168241, "epoch": 4005} {"train_loss": -7.011751174926758, "global_step": 168242, "epoch": 4005} {"train_loss": -6.866293907165527, "global_step": 168243, "epoch": 4005} {"train_loss": -6.899833679199219, "global_step": 168244, "epoch": 4005} {"train_loss": -6.977118015289307, "global_step": 168245, "epoch": 4005} {"train_loss": -7.012083053588867, "global_step": 168246, "epoch": 4005} {"train_loss": -7.033799171447754, "global_step": 168247, "epoch": 4005} {"train_loss": -6.992352485656738, "global_step": 168248, "epoch": 4005} {"train_loss": -6.938290119171143, "global_step": 168249, "epoch": 4005} {"train_loss": -7.025200843811035, "global_step": 168250, "epoch": 4005} {"train_loss": -6.98561185882205, "global_step": 168251, "epoch": 4005, "val_loss": 68393.8359375} {"train_loss": -7.087220191955566, "global_step": 168252, "epoch": 4006} {"train_loss": -6.977518081665039, "global_step": 168253, "epoch": 4006} {"train_loss": -6.904262065887451, "global_step": 168254, "epoch": 4006} {"train_loss": -6.882119178771973, "global_step": 168255, "epoch": 4006} {"train_loss": -6.959786415100098, "global_step": 168256, "epoch": 4006} {"train_loss": -7.04228401184082, "global_step": 168257, "epoch": 4006} {"train_loss": -7.007524013519287, "global_step": 168258, "epoch": 4006} {"train_loss": -6.952709197998047, "global_step": 168259, "epoch": 4006} {"train_loss": -6.948245525360107, "global_step": 168260, "epoch": 4006} {"train_loss": -7.017275333404541, "global_step": 168261, "epoch": 4006} {"train_loss": -6.953372001647949, "global_step": 168262, "epoch": 4006} {"train_loss": -6.953436374664307, "global_step": 168263, "epoch": 4006} {"train_loss": -6.972836494445801, "global_step": 168264, "epoch": 4006} {"train_loss": -6.983766555786133, "global_step": 168265, "epoch": 4006} {"train_loss": -6.966705322265625, "global_step": 168266, "epoch": 4006} {"train_loss": -6.920294761657715, "global_step": 168267, "epoch": 4006} {"train_loss": -6.928598403930664, "global_step": 168268, "epoch": 4006} {"train_loss": -6.949345588684082, "global_step": 168269, "epoch": 4006} {"train_loss": -6.8673481941223145, "global_step": 168270, "epoch": 4006} {"train_loss": -6.975149154663086, "global_step": 168271, "epoch": 4006} {"train_loss": -6.934364318847656, "global_step": 168272, "epoch": 4006} {"train_loss": -6.926231384277344, "global_step": 168273, "epoch": 4006} {"train_loss": -6.895718097686768, "global_step": 168274, "epoch": 4006} {"train_loss": -6.943002223968506, "global_step": 168275, "epoch": 4006} {"train_loss": -6.981464385986328, "global_step": 168276, "epoch": 4006} {"train_loss": -6.981558799743652, "global_step": 168277, "epoch": 4006} {"train_loss": -6.940700531005859, "global_step": 168278, "epoch": 4006} {"train_loss": -6.8488616943359375, "global_step": 168279, "epoch": 4006} {"train_loss": -7.005522727966309, "global_step": 168280, "epoch": 4006} {"train_loss": -6.966562271118164, "global_step": 168281, "epoch": 4006} {"train_loss": -6.895740985870361, "global_step": 168282, "epoch": 4006} {"train_loss": -6.995070457458496, "global_step": 168283, "epoch": 4006} {"train_loss": -6.980443000793457, "global_step": 168284, "epoch": 4006} {"train_loss": -6.8445048332214355, "global_step": 168285, "epoch": 4006} {"train_loss": -6.959126949310303, "global_step": 168286, "epoch": 4006} {"train_loss": -6.990571975708008, "global_step": 168287, "epoch": 4006} {"train_loss": -7.014429092407227, "global_step": 168288, "epoch": 4006} {"train_loss": -6.953639984130859, "global_step": 168289, "epoch": 4006} {"train_loss": -6.90538215637207, "global_step": 168290, "epoch": 4006} {"train_loss": -6.892443656921387, "global_step": 168291, "epoch": 4006} {"train_loss": -7.138575553894043, "global_step": 168292, "epoch": 4006} {"train_loss": -6.95655962399074, "global_step": 168293, "epoch": 4006, "val_loss": 68614.3125} {"train_loss": -6.960165500640869, "global_step": 168294, "epoch": 4007} {"train_loss": -6.94413948059082, "global_step": 168295, "epoch": 4007} {"train_loss": -6.923369407653809, "global_step": 168296, "epoch": 4007} {"train_loss": -6.963167190551758, "global_step": 168297, "epoch": 4007} {"train_loss": -7.0325727462768555, "global_step": 168298, "epoch": 4007} {"train_loss": -6.903829574584961, "global_step": 168299, "epoch": 4007} {"train_loss": -7.068398475646973, "global_step": 168300, "epoch": 4007} {"train_loss": -7.010979652404785, "global_step": 168301, "epoch": 4007} {"train_loss": -6.975240707397461, "global_step": 168302, "epoch": 4007} {"train_loss": -7.10723352432251, "global_step": 168303, "epoch": 4007} {"train_loss": -7.037032604217529, "global_step": 168304, "epoch": 4007} {"train_loss": -6.968292236328125, "global_step": 168305, "epoch": 4007} {"train_loss": -7.049193382263184, "global_step": 168306, "epoch": 4007} {"train_loss": -7.06675386428833, "global_step": 168307, "epoch": 4007} {"train_loss": -7.003764629364014, "global_step": 168308, "epoch": 4007} {"train_loss": -6.987086296081543, "global_step": 168309, "epoch": 4007} {"train_loss": -6.869894981384277, "global_step": 168310, "epoch": 4007} {"train_loss": -6.990591526031494, "global_step": 168311, "epoch": 4007} {"train_loss": -6.936907768249512, "global_step": 168312, "epoch": 4007} {"train_loss": -6.853857517242432, "global_step": 168313, "epoch": 4007} {"train_loss": -6.948751449584961, "global_step": 168314, "epoch": 4007} {"train_loss": -7.038427829742432, "global_step": 168315, "epoch": 4007} {"train_loss": -6.879149913787842, "global_step": 168316, "epoch": 4007} {"train_loss": -7.009909629821777, "global_step": 168317, "epoch": 4007} {"train_loss": -6.796839714050293, "global_step": 168318, "epoch": 4007} {"train_loss": -6.981720924377441, "global_step": 168319, "epoch": 4007} {"train_loss": -7.0506181716918945, "global_step": 168320, "epoch": 4007} {"train_loss": -6.9407854080200195, "global_step": 168321, "epoch": 4007} {"train_loss": -6.963848114013672, "global_step": 168322, "epoch": 4007} {"train_loss": -6.9085693359375, "global_step": 168323, "epoch": 4007} {"train_loss": -6.900498390197754, "global_step": 168324, "epoch": 4007} {"train_loss": -7.034268856048584, "global_step": 168325, "epoch": 4007} {"train_loss": -6.94870662689209, "global_step": 168326, "epoch": 4007} {"train_loss": -7.073798179626465, "global_step": 168327, "epoch": 4007} {"train_loss": -6.9247517585754395, "global_step": 168328, "epoch": 4007} {"train_loss": -6.984112739562988, "global_step": 168329, "epoch": 4007} {"train_loss": -7.034303188323975, "global_step": 168330, "epoch": 4007} {"train_loss": -7.107997894287109, "global_step": 168331, "epoch": 4007} {"train_loss": -7.023180961608887, "global_step": 168332, "epoch": 4007} {"train_loss": -6.990978717803955, "global_step": 168333, "epoch": 4007} {"train_loss": -7.0189104080200195, "global_step": 168334, "epoch": 4007} {"train_loss": -6.981784411839077, "global_step": 168335, "epoch": 4007, "val_loss": 68572.0234375} {"train_loss": -7.079694747924805, "global_step": 168336, "epoch": 4008} {"train_loss": -6.997797012329102, "global_step": 168337, "epoch": 4008} {"train_loss": -6.993188858032227, "global_step": 168338, "epoch": 4008} {"train_loss": -7.025564670562744, "global_step": 168339, "epoch": 4008} {"train_loss": -6.956366062164307, "global_step": 168340, "epoch": 4008} {"train_loss": -7.017954349517822, "global_step": 168341, "epoch": 4008} {"train_loss": -6.9752278327941895, "global_step": 168342, "epoch": 4008} {"train_loss": -6.997444152832031, "global_step": 168343, "epoch": 4008} {"train_loss": -6.986912727355957, "global_step": 168344, "epoch": 4008} {"train_loss": -6.851717948913574, "global_step": 168345, "epoch": 4008} {"train_loss": -6.876241207122803, "global_step": 168346, "epoch": 4008} {"train_loss": -6.96440315246582, "global_step": 168347, "epoch": 4008} {"train_loss": -6.972606182098389, "global_step": 168348, "epoch": 4008} {"train_loss": -7.062891006469727, "global_step": 168349, "epoch": 4008} {"train_loss": -7.009885311126709, "global_step": 168350, "epoch": 4008} {"train_loss": -7.142920970916748, "global_step": 168351, "epoch": 4008} {"train_loss": -6.9542083740234375, "global_step": 168352, "epoch": 4008} {"train_loss": -6.999942779541016, "global_step": 168353, "epoch": 4008} {"train_loss": -6.845392227172852, "global_step": 168354, "epoch": 4008} {"train_loss": -6.942530155181885, "global_step": 168355, "epoch": 4008} {"train_loss": -6.971322059631348, "global_step": 168356, "epoch": 4008} {"train_loss": -6.978948593139648, "global_step": 168357, "epoch": 4008} {"train_loss": -6.961190223693848, "global_step": 168358, "epoch": 4008} {"train_loss": -6.845540523529053, "global_step": 168359, "epoch": 4008} {"train_loss": -6.8463544845581055, "global_step": 168360, "epoch": 4008} {"train_loss": -6.866883277893066, "global_step": 168361, "epoch": 4008} {"train_loss": -6.849118232727051, "global_step": 168362, "epoch": 4008} {"train_loss": -6.980563163757324, "global_step": 168363, "epoch": 4008} {"train_loss": -6.873516082763672, "global_step": 168364, "epoch": 4008} {"train_loss": -6.8530778884887695, "global_step": 168365, "epoch": 4008} {"train_loss": -6.836124420166016, "global_step": 168366, "epoch": 4008} {"train_loss": -6.9411091804504395, "global_step": 168367, "epoch": 4008} {"train_loss": -6.924245834350586, "global_step": 168368, "epoch": 4008} {"train_loss": -6.993288040161133, "global_step": 168369, "epoch": 4008} {"train_loss": -6.972356796264648, "global_step": 168370, "epoch": 4008} {"train_loss": -6.903331279754639, "global_step": 168371, "epoch": 4008} {"train_loss": -6.865767478942871, "global_step": 168372, "epoch": 4008} {"train_loss": -6.816212177276611, "global_step": 168373, "epoch": 4008} {"train_loss": -6.802435874938965, "global_step": 168374, "epoch": 4008} {"train_loss": -6.730772972106934, "global_step": 168375, "epoch": 4008} {"train_loss": -6.823271751403809, "global_step": 168376, "epoch": 4008} {"train_loss": -6.932802381969633, "global_step": 168377, "epoch": 4008, "val_loss": 68576.0625} {"train_loss": -6.842248439788818, "global_step": 168378, "epoch": 4009} {"train_loss": -6.799647331237793, "global_step": 168379, "epoch": 4009} {"train_loss": -7.001043319702148, "global_step": 168380, "epoch": 4009} {"train_loss": -6.825862884521484, "global_step": 168381, "epoch": 4009} {"train_loss": -6.798489570617676, "global_step": 168382, "epoch": 4009} {"train_loss": -6.776923179626465, "global_step": 168383, "epoch": 4009} {"train_loss": -6.802350044250488, "global_step": 168384, "epoch": 4009} {"train_loss": -6.978649616241455, "global_step": 168385, "epoch": 4009} {"train_loss": -6.794010162353516, "global_step": 168386, "epoch": 4009} {"train_loss": -6.850214958190918, "global_step": 168387, "epoch": 4009} {"train_loss": -6.901344299316406, "global_step": 168388, "epoch": 4009} {"train_loss": -6.779755592346191, "global_step": 168389, "epoch": 4009} {"train_loss": -6.743814468383789, "global_step": 168390, "epoch": 4009} {"train_loss": -6.853570938110352, "global_step": 168391, "epoch": 4009} {"train_loss": -6.781928062438965, "global_step": 168392, "epoch": 4009} {"train_loss": -6.8850603103637695, "global_step": 168393, "epoch": 4009} {"train_loss": -6.901902198791504, "global_step": 168394, "epoch": 4009} {"train_loss": -6.808156490325928, "global_step": 168395, "epoch": 4009} {"train_loss": -6.869580268859863, "global_step": 168396, "epoch": 4009} {"train_loss": -6.90217924118042, "global_step": 168397, "epoch": 4009} {"train_loss": -6.91848087310791, "global_step": 168398, "epoch": 4009} {"train_loss": -7.011829853057861, "global_step": 168399, "epoch": 4009} {"train_loss": -6.982571125030518, "global_step": 168400, "epoch": 4009} {"train_loss": -6.988575458526611, "global_step": 168401, "epoch": 4009} {"train_loss": -6.972498893737793, "global_step": 168402, "epoch": 4009} {"train_loss": -6.949118614196777, "global_step": 168403, "epoch": 4009} {"train_loss": -6.963043212890625, "global_step": 168404, "epoch": 4009} {"train_loss": -6.999651908874512, "global_step": 168405, "epoch": 4009} {"train_loss": -6.999468803405762, "global_step": 168406, "epoch": 4009} {"train_loss": -6.934142112731934, "global_step": 168407, "epoch": 4009} {"train_loss": -6.961629867553711, "global_step": 168408, "epoch": 4009} {"train_loss": -6.985781192779541, "global_step": 168409, "epoch": 4009} {"train_loss": -6.861660957336426, "global_step": 168410, "epoch": 4009} {"train_loss": -6.886752128601074, "global_step": 168411, "epoch": 4009} {"train_loss": -6.91703462600708, "global_step": 168412, "epoch": 4009} {"train_loss": -6.973237037658691, "global_step": 168413, "epoch": 4009} {"train_loss": -7.054313659667969, "global_step": 168414, "epoch": 4009} {"train_loss": -6.884171485900879, "global_step": 168415, "epoch": 4009} {"train_loss": -6.971368789672852, "global_step": 168416, "epoch": 4009} {"train_loss": -7.011814594268799, "global_step": 168417, "epoch": 4009} {"train_loss": -7.046416759490967, "global_step": 168418, "epoch": 4009} {"train_loss": -6.906428234917777, "global_step": 168419, "epoch": 4009, "val_loss": 68457.6640625} {"train_loss": -6.885378360748291, "global_step": 168420, "epoch": 4010} {"train_loss": -6.815364360809326, "global_step": 168421, "epoch": 4010} {"train_loss": -6.737760543823242, "global_step": 168422, "epoch": 4010} {"train_loss": -6.852458953857422, "global_step": 168423, "epoch": 4010} {"train_loss": -6.8987579345703125, "global_step": 168424, "epoch": 4010} {"train_loss": -6.9795241355896, "global_step": 168425, "epoch": 4010} {"train_loss": -6.921416282653809, "global_step": 168426, "epoch": 4010} {"train_loss": -6.818839073181152, "global_step": 168427, "epoch": 4010} {"train_loss": -6.908771514892578, "global_step": 168428, "epoch": 4010} {"train_loss": -6.780962944030762, "global_step": 168429, "epoch": 4010} {"train_loss": -6.871315002441406, "global_step": 168430, "epoch": 4010} {"train_loss": -6.734375, "global_step": 168431, "epoch": 4010} {"train_loss": -6.890260696411133, "global_step": 168432, "epoch": 4010} {"train_loss": -6.750685214996338, "global_step": 168433, "epoch": 4010} {"train_loss": -6.940353870391846, "global_step": 168434, "epoch": 4010} {"train_loss": -6.896636962890625, "global_step": 168435, "epoch": 4010} {"train_loss": -6.7769975662231445, "global_step": 168436, "epoch": 4010} {"train_loss": -7.035663604736328, "global_step": 168437, "epoch": 4010} {"train_loss": -6.901689052581787, "global_step": 168438, "epoch": 4010} {"train_loss": -6.833676338195801, "global_step": 168439, "epoch": 4010} {"train_loss": -6.95106315612793, "global_step": 168440, "epoch": 4010} {"train_loss": -6.956687927246094, "global_step": 168441, "epoch": 4010} {"train_loss": -6.900079727172852, "global_step": 168442, "epoch": 4010} {"train_loss": -6.956493377685547, "global_step": 168443, "epoch": 4010} {"train_loss": -6.988851547241211, "global_step": 168444, "epoch": 4010} {"train_loss": -6.854393005371094, "global_step": 168445, "epoch": 4010} {"train_loss": -6.8209004402160645, "global_step": 168446, "epoch": 4010} {"train_loss": -6.932862758636475, "global_step": 168447, "epoch": 4010} {"train_loss": -6.790155410766602, "global_step": 168448, "epoch": 4010} {"train_loss": -6.906913757324219, "global_step": 168449, "epoch": 4010} {"train_loss": -6.8361663818359375, "global_step": 168450, "epoch": 4010} {"train_loss": -6.945844650268555, "global_step": 168451, "epoch": 4010} {"train_loss": -6.873299598693848, "global_step": 168452, "epoch": 4010} {"train_loss": -6.92622184753418, "global_step": 168453, "epoch": 4010} {"train_loss": -6.96051549911499, "global_step": 168454, "epoch": 4010} {"train_loss": -7.011940956115723, "global_step": 168455, "epoch": 4010} {"train_loss": -6.95555305480957, "global_step": 168456, "epoch": 4010} {"train_loss": -6.887417316436768, "global_step": 168457, "epoch": 4010} {"train_loss": -6.944239616394043, "global_step": 168458, "epoch": 4010} {"train_loss": -6.9534149169921875, "global_step": 168459, "epoch": 4010} {"train_loss": -7.0525617599487305, "global_step": 168460, "epoch": 4010} {"train_loss": -6.894701435452416, "global_step": 168461, "epoch": 4010, "val_loss": 68488.359375} {"train_loss": -7.095528602600098, "global_step": 168462, "epoch": 4011} {"train_loss": -6.965252876281738, "global_step": 168463, "epoch": 4011} {"train_loss": -6.95982551574707, "global_step": 168464, "epoch": 4011} {"train_loss": -6.986024856567383, "global_step": 168465, "epoch": 4011} {"train_loss": -6.995205402374268, "global_step": 168466, "epoch": 4011} {"train_loss": -6.951315879821777, "global_step": 168467, "epoch": 4011} {"train_loss": -7.008934020996094, "global_step": 168468, "epoch": 4011} {"train_loss": -7.04287576675415, "global_step": 168469, "epoch": 4011} {"train_loss": -7.087853908538818, "global_step": 168470, "epoch": 4011} {"train_loss": -6.912496566772461, "global_step": 168471, "epoch": 4011} {"train_loss": -7.071174621582031, "global_step": 168472, "epoch": 4011} {"train_loss": -7.046778678894043, "global_step": 168473, "epoch": 4011} {"train_loss": -7.025269985198975, "global_step": 168474, "epoch": 4011} {"train_loss": -6.913153648376465, "global_step": 168475, "epoch": 4011} {"train_loss": -6.983226776123047, "global_step": 168476, "epoch": 4011} {"train_loss": -7.097757339477539, "global_step": 168477, "epoch": 4011} {"train_loss": -6.921263217926025, "global_step": 168478, "epoch": 4011} {"train_loss": -7.0281662940979, "global_step": 168479, "epoch": 4011} {"train_loss": -6.963431358337402, "global_step": 168480, "epoch": 4011} {"train_loss": -6.905915260314941, "global_step": 168481, "epoch": 4011} {"train_loss": -6.954021453857422, "global_step": 168482, "epoch": 4011} {"train_loss": -6.970876693725586, "global_step": 168483, "epoch": 4011} {"train_loss": -7.018520355224609, "global_step": 168484, "epoch": 4011} {"train_loss": -6.923840522766113, "global_step": 168485, "epoch": 4011} {"train_loss": -6.995429515838623, "global_step": 168486, "epoch": 4011} {"train_loss": -6.940998077392578, "global_step": 168487, "epoch": 4011} {"train_loss": -7.025019645690918, "global_step": 168488, "epoch": 4011} {"train_loss": -6.983906269073486, "global_step": 168489, "epoch": 4011} {"train_loss": -7.014378070831299, "global_step": 168490, "epoch": 4011} {"train_loss": -7.058318614959717, "global_step": 168491, "epoch": 4011} {"train_loss": -6.944802284240723, "global_step": 168492, "epoch": 4011} {"train_loss": -7.003410816192627, "global_step": 168493, "epoch": 4011} {"train_loss": -6.967693328857422, "global_step": 168494, "epoch": 4011} {"train_loss": -7.011532306671143, "global_step": 168495, "epoch": 4011} {"train_loss": -7.009538650512695, "global_step": 168496, "epoch": 4011} {"train_loss": -6.912376403808594, "global_step": 168497, "epoch": 4011} {"train_loss": -7.038370132446289, "global_step": 168498, "epoch": 4011} {"train_loss": -6.936752796173096, "global_step": 168499, "epoch": 4011} {"train_loss": -6.872475624084473, "global_step": 168500, "epoch": 4011} {"train_loss": -7.046481132507324, "global_step": 168501, "epoch": 4011} {"train_loss": -7.005232334136963, "global_step": 168502, "epoch": 4011} {"train_loss": -6.990530309222994, "global_step": 168503, "epoch": 4011, "val_loss": 68611.828125} {"train_loss": -6.981809616088867, "global_step": 168504, "epoch": 4012} {"train_loss": -6.976668357849121, "global_step": 168505, "epoch": 4012} {"train_loss": -7.024984836578369, "global_step": 168506, "epoch": 4012} {"train_loss": -6.923642635345459, "global_step": 168507, "epoch": 4012} {"train_loss": -7.051470756530762, "global_step": 168508, "epoch": 4012} {"train_loss": -7.112844944000244, "global_step": 168509, "epoch": 4012} {"train_loss": -7.0225830078125, "global_step": 168510, "epoch": 4012} {"train_loss": -7.020754814147949, "global_step": 168511, "epoch": 4012} {"train_loss": -6.96552848815918, "global_step": 168512, "epoch": 4012} {"train_loss": -7.018256664276123, "global_step": 168513, "epoch": 4012} {"train_loss": -6.9453582763671875, "global_step": 168514, "epoch": 4012} {"train_loss": -7.041860580444336, "global_step": 168515, "epoch": 4012} {"train_loss": -6.896443843841553, "global_step": 168516, "epoch": 4012} {"train_loss": -6.999545097351074, "global_step": 168517, "epoch": 4012} {"train_loss": -6.999298095703125, "global_step": 168518, "epoch": 4012} {"train_loss": -6.938465595245361, "global_step": 168519, "epoch": 4012} {"train_loss": -6.99654483795166, "global_step": 168520, "epoch": 4012} {"train_loss": -7.0657548904418945, "global_step": 168521, "epoch": 4012} {"train_loss": -6.890323162078857, "global_step": 168522, "epoch": 4012} {"train_loss": -6.975261688232422, "global_step": 168523, "epoch": 4012} {"train_loss": -7.0067291259765625, "global_step": 168524, "epoch": 4012} {"train_loss": -7.079456806182861, "global_step": 168525, "epoch": 4012} {"train_loss": -6.941860675811768, "global_step": 168526, "epoch": 4012} {"train_loss": -6.903863430023193, "global_step": 168527, "epoch": 4012} {"train_loss": -7.048521518707275, "global_step": 168528, "epoch": 4012} {"train_loss": -6.828499794006348, "global_step": 168529, "epoch": 4012} {"train_loss": -6.934519290924072, "global_step": 168530, "epoch": 4012} {"train_loss": -6.912137985229492, "global_step": 168531, "epoch": 4012} {"train_loss": -6.9963459968566895, "global_step": 168532, "epoch": 4012} {"train_loss": -6.923483371734619, "global_step": 168533, "epoch": 4012} {"train_loss": -6.92943811416626, "global_step": 168534, "epoch": 4012} {"train_loss": -6.956293106079102, "global_step": 168535, "epoch": 4012} {"train_loss": -7.059747219085693, "global_step": 168536, "epoch": 4012} {"train_loss": -6.970973968505859, "global_step": 168537, "epoch": 4012} {"train_loss": -6.967695236206055, "global_step": 168538, "epoch": 4012} {"train_loss": -6.8775129318237305, "global_step": 168539, "epoch": 4012} {"train_loss": -6.984762668609619, "global_step": 168540, "epoch": 4012} {"train_loss": -6.894661903381348, "global_step": 168541, "epoch": 4012} {"train_loss": -6.98794412612915, "global_step": 168542, "epoch": 4012} {"train_loss": -6.935685634613037, "global_step": 168543, "epoch": 4012} {"train_loss": -7.034912586212158, "global_step": 168544, "epoch": 4012} {"train_loss": -6.975771461214338, "global_step": 168545, "epoch": 4012, "val_loss": 68527.6875} {"train_loss": -6.902519226074219, "global_step": 168546, "epoch": 4013} {"train_loss": -6.951186180114746, "global_step": 168547, "epoch": 4013} {"train_loss": -6.931129455566406, "global_step": 168548, "epoch": 4013} {"train_loss": -6.886898994445801, "global_step": 168549, "epoch": 4013} {"train_loss": -6.991583824157715, "global_step": 168550, "epoch": 4013} {"train_loss": -6.989528656005859, "global_step": 168551, "epoch": 4013} {"train_loss": -6.924922466278076, "global_step": 168552, "epoch": 4013} {"train_loss": -7.057624816894531, "global_step": 168553, "epoch": 4013} {"train_loss": -7.01626443862915, "global_step": 168554, "epoch": 4013} {"train_loss": -6.976626396179199, "global_step": 168555, "epoch": 4013} {"train_loss": -7.127384662628174, "global_step": 168556, "epoch": 4013} {"train_loss": -6.976470470428467, "global_step": 168557, "epoch": 4013} {"train_loss": -6.982055187225342, "global_step": 168558, "epoch": 4013} {"train_loss": -7.067235946655273, "global_step": 168559, "epoch": 4013} {"train_loss": -7.0130791664123535, "global_step": 168560, "epoch": 4013} {"train_loss": -7.080709457397461, "global_step": 168561, "epoch": 4013} {"train_loss": -7.155553817749023, "global_step": 168562, "epoch": 4013} {"train_loss": -6.979677677154541, "global_step": 168563, "epoch": 4013} {"train_loss": -6.94001579284668, "global_step": 168564, "epoch": 4013} {"train_loss": -6.899116516113281, "global_step": 168565, "epoch": 4013} {"train_loss": -6.840897083282471, "global_step": 168566, "epoch": 4013} {"train_loss": -7.0309271812438965, "global_step": 168567, "epoch": 4013} {"train_loss": -6.914403915405273, "global_step": 168568, "epoch": 4013} {"train_loss": -6.930753707885742, "global_step": 168569, "epoch": 4013} {"train_loss": -7.006703853607178, "global_step": 168570, "epoch": 4013} {"train_loss": -7.036276340484619, "global_step": 168571, "epoch": 4013} {"train_loss": -7.066023349761963, "global_step": 168572, "epoch": 4013} {"train_loss": -7.029163360595703, "global_step": 168573, "epoch": 4013} {"train_loss": -7.024589538574219, "global_step": 168574, "epoch": 4013} {"train_loss": -7.021134853363037, "global_step": 168575, "epoch": 4013} {"train_loss": -7.176098823547363, "global_step": 168576, "epoch": 4013} {"train_loss": -7.007050037384033, "global_step": 168577, "epoch": 4013} {"train_loss": -7.046759605407715, "global_step": 168578, "epoch": 4013} {"train_loss": -6.8892292976379395, "global_step": 168579, "epoch": 4013} {"train_loss": -6.947126388549805, "global_step": 168580, "epoch": 4013} {"train_loss": -6.938392639160156, "global_step": 168581, "epoch": 4013} {"train_loss": -6.9000163078308105, "global_step": 168582, "epoch": 4013} {"train_loss": -6.8871002197265625, "global_step": 168583, "epoch": 4013} {"train_loss": -6.978402137756348, "global_step": 168584, "epoch": 4013} {"train_loss": -6.919450283050537, "global_step": 168585, "epoch": 4013} {"train_loss": -6.824488162994385, "global_step": 168586, "epoch": 4013} {"train_loss": -6.980743113018217, "global_step": 168587, "epoch": 4013, "val_loss": 68834.3515625} {"train_loss": -6.814642906188965, "global_step": 168588, "epoch": 4014} {"train_loss": -6.9090189933776855, "global_step": 168589, "epoch": 4014} {"train_loss": -7.015776634216309, "global_step": 168590, "epoch": 4014} {"train_loss": -6.8962907791137695, "global_step": 168591, "epoch": 4014} {"train_loss": -6.9291839599609375, "global_step": 168592, "epoch": 4014} {"train_loss": -6.931807041168213, "global_step": 168593, "epoch": 4014} {"train_loss": -6.968808174133301, "global_step": 168594, "epoch": 4014} {"train_loss": -6.84727668762207, "global_step": 168595, "epoch": 4014} {"train_loss": -6.783061981201172, "global_step": 168596, "epoch": 4014} {"train_loss": -6.945501804351807, "global_step": 168597, "epoch": 4014} {"train_loss": -6.828264236450195, "global_step": 168598, "epoch": 4014} {"train_loss": -7.0153656005859375, "global_step": 168599, "epoch": 4014} {"train_loss": -6.778557777404785, "global_step": 168600, "epoch": 4014} {"train_loss": -6.944990158081055, "global_step": 168601, "epoch": 4014} {"train_loss": -6.972759246826172, "global_step": 168602, "epoch": 4014} {"train_loss": -6.893608093261719, "global_step": 168603, "epoch": 4014} {"train_loss": -7.007077217102051, "global_step": 168604, "epoch": 4014} {"train_loss": -6.926538467407227, "global_step": 168605, "epoch": 4014} {"train_loss": -7.072297096252441, "global_step": 168606, "epoch": 4014} {"train_loss": -6.910782337188721, "global_step": 168607, "epoch": 4014} {"train_loss": -6.941388130187988, "global_step": 168608, "epoch": 4014} {"train_loss": -6.928266525268555, "global_step": 168609, "epoch": 4014} {"train_loss": -6.855888843536377, "global_step": 168610, "epoch": 4014} {"train_loss": -6.9777421951293945, "global_step": 168611, "epoch": 4014} {"train_loss": -6.9423675537109375, "global_step": 168612, "epoch": 4014} {"train_loss": -6.926664352416992, "global_step": 168613, "epoch": 4014} {"train_loss": -6.960982799530029, "global_step": 168614, "epoch": 4014} {"train_loss": -7.082526683807373, "global_step": 168615, "epoch": 4014} {"train_loss": -6.877140045166016, "global_step": 168616, "epoch": 4014} {"train_loss": -6.941248893737793, "global_step": 168617, "epoch": 4014} {"train_loss": -7.030912399291992, "global_step": 168618, "epoch": 4014} {"train_loss": -6.929922103881836, "global_step": 168619, "epoch": 4014} {"train_loss": -6.88637113571167, "global_step": 168620, "epoch": 4014} {"train_loss": -6.984312057495117, "global_step": 168621, "epoch": 4014} {"train_loss": -6.991156101226807, "global_step": 168622, "epoch": 4014} {"train_loss": -6.994365692138672, "global_step": 168623, "epoch": 4014} {"train_loss": -6.991644859313965, "global_step": 168624, "epoch": 4014} {"train_loss": -6.946396827697754, "global_step": 168625, "epoch": 4014} {"train_loss": -6.974933624267578, "global_step": 168626, "epoch": 4014} {"train_loss": -6.954536437988281, "global_step": 168627, "epoch": 4014} {"train_loss": -6.953794002532959, "global_step": 168628, "epoch": 4014} {"train_loss": -6.939082940419515, "global_step": 168629, "epoch": 4014, "val_loss": 68517.0703125} {"train_loss": -7.009405136108398, "global_step": 168630, "epoch": 4015} {"train_loss": -6.979057312011719, "global_step": 168631, "epoch": 4015} {"train_loss": -7.102251052856445, "global_step": 168632, "epoch": 4015} {"train_loss": -7.064218521118164, "global_step": 168633, "epoch": 4015} {"train_loss": -6.987799644470215, "global_step": 168634, "epoch": 4015} {"train_loss": -7.081020355224609, "global_step": 168635, "epoch": 4015} {"train_loss": -6.9847002029418945, "global_step": 168636, "epoch": 4015} {"train_loss": -6.991986274719238, "global_step": 168637, "epoch": 4015} {"train_loss": -7.056855201721191, "global_step": 168638, "epoch": 4015} {"train_loss": -7.018601417541504, "global_step": 168639, "epoch": 4015} {"train_loss": -7.056594371795654, "global_step": 168640, "epoch": 4015} {"train_loss": -7.055354118347168, "global_step": 168641, "epoch": 4015} {"train_loss": -6.977964401245117, "global_step": 168642, "epoch": 4015} {"train_loss": -6.921211242675781, "global_step": 168643, "epoch": 4015} {"train_loss": -6.898861885070801, "global_step": 168644, "epoch": 4015} {"train_loss": -7.0569562911987305, "global_step": 168645, "epoch": 4015} {"train_loss": -7.061311721801758, "global_step": 168646, "epoch": 4015} {"train_loss": -6.966145038604736, "global_step": 168647, "epoch": 4015} {"train_loss": -6.967323303222656, "global_step": 168648, "epoch": 4015} {"train_loss": -7.08241081237793, "global_step": 168649, "epoch": 4015} {"train_loss": -7.082331657409668, "global_step": 168650, "epoch": 4015} {"train_loss": -6.9705376625061035, "global_step": 168651, "epoch": 4015} {"train_loss": -6.946949481964111, "global_step": 168652, "epoch": 4015} {"train_loss": -6.997150421142578, "global_step": 168653, "epoch": 4015} {"train_loss": -7.112343788146973, "global_step": 168654, "epoch": 4015} {"train_loss": -7.0305495262146, "global_step": 168655, "epoch": 4015} {"train_loss": -7.045965671539307, "global_step": 168656, "epoch": 4015} {"train_loss": -7.009366989135742, "global_step": 168657, "epoch": 4015} {"train_loss": -6.977933406829834, "global_step": 168658, "epoch": 4015} {"train_loss": -6.993602275848389, "global_step": 168659, "epoch": 4015} {"train_loss": -6.945886135101318, "global_step": 168660, "epoch": 4015} {"train_loss": -6.9525322914123535, "global_step": 168661, "epoch": 4015} {"train_loss": -6.909446716308594, "global_step": 168662, "epoch": 4015} {"train_loss": -6.945174217224121, "global_step": 168663, "epoch": 4015} {"train_loss": -6.9865875244140625, "global_step": 168664, "epoch": 4015} {"train_loss": -6.965967178344727, "global_step": 168665, "epoch": 4015} {"train_loss": -6.976086616516113, "global_step": 168666, "epoch": 4015} {"train_loss": -6.898609638214111, "global_step": 168667, "epoch": 4015} {"train_loss": -6.906620025634766, "global_step": 168668, "epoch": 4015} {"train_loss": -6.960416793823242, "global_step": 168669, "epoch": 4015} {"train_loss": -6.82249641418457, "global_step": 168670, "epoch": 4015} {"train_loss": -6.994653985613868, "global_step": 168671, "epoch": 4015, "val_loss": 68623.1015625} {"train_loss": -7.0368146896362305, "global_step": 168672, "epoch": 4016} {"train_loss": -6.9655914306640625, "global_step": 168673, "epoch": 4016} {"train_loss": -6.948488712310791, "global_step": 168674, "epoch": 4016} {"train_loss": -7.076058387756348, "global_step": 168675, "epoch": 4016} {"train_loss": -6.926797389984131, "global_step": 168676, "epoch": 4016} {"train_loss": -6.875899791717529, "global_step": 168677, "epoch": 4016} {"train_loss": -6.9515275955200195, "global_step": 168678, "epoch": 4016} {"train_loss": -7.017807483673096, "global_step": 168679, "epoch": 4016} {"train_loss": -7.0625410079956055, "global_step": 168680, "epoch": 4016} {"train_loss": -7.050236701965332, "global_step": 168681, "epoch": 4016} {"train_loss": -6.987295150756836, "global_step": 168682, "epoch": 4016} {"train_loss": -6.979530334472656, "global_step": 168683, "epoch": 4016} {"train_loss": -6.956153869628906, "global_step": 168684, "epoch": 4016} {"train_loss": -6.944612979888916, "global_step": 168685, "epoch": 4016} {"train_loss": -6.99343204498291, "global_step": 168686, "epoch": 4016} {"train_loss": -7.112870693206787, "global_step": 168687, "epoch": 4016} {"train_loss": -6.9955949783325195, "global_step": 168688, "epoch": 4016} {"train_loss": -7.045793056488037, "global_step": 168689, "epoch": 4016} {"train_loss": -7.0020432472229, "global_step": 168690, "epoch": 4016} {"train_loss": -6.965328216552734, "global_step": 168691, "epoch": 4016} {"train_loss": -7.143770694732666, "global_step": 168692, "epoch": 4016} {"train_loss": -6.993062973022461, "global_step": 168693, "epoch": 4016} {"train_loss": -7.063998222351074, "global_step": 168694, "epoch": 4016} {"train_loss": -6.99320650100708, "global_step": 168695, "epoch": 4016} {"train_loss": -6.9885711669921875, "global_step": 168696, "epoch": 4016} {"train_loss": -7.030795097351074, "global_step": 168697, "epoch": 4016} {"train_loss": -6.976452827453613, "global_step": 168698, "epoch": 4016} {"train_loss": -6.944368839263916, "global_step": 168699, "epoch": 4016} {"train_loss": -6.850292205810547, "global_step": 168700, "epoch": 4016} {"train_loss": -7.0226240158081055, "global_step": 168701, "epoch": 4016} {"train_loss": -6.9037766456604, "global_step": 168702, "epoch": 4016} {"train_loss": -7.09971809387207, "global_step": 168703, "epoch": 4016} {"train_loss": -6.938429832458496, "global_step": 168704, "epoch": 4016} {"train_loss": -7.055271148681641, "global_step": 168705, "epoch": 4016} {"train_loss": -7.042612075805664, "global_step": 168706, "epoch": 4016} {"train_loss": -6.972291946411133, "global_step": 168707, "epoch": 4016} {"train_loss": -7.035780429840088, "global_step": 168708, "epoch": 4016} {"train_loss": -7.0058183670043945, "global_step": 168709, "epoch": 4016} {"train_loss": -7.057610034942627, "global_step": 168710, "epoch": 4016} {"train_loss": -6.955889701843262, "global_step": 168711, "epoch": 4016} {"train_loss": -7.02480411529541, "global_step": 168712, "epoch": 4016} {"train_loss": -6.999599593026297, "global_step": 168713, "epoch": 4016, "val_loss": 68387.46875} {"train_loss": -6.948146343231201, "global_step": 168714, "epoch": 4017} {"train_loss": -6.981848239898682, "global_step": 168715, "epoch": 4017} {"train_loss": -6.8267059326171875, "global_step": 168716, "epoch": 4017} {"train_loss": -6.921351432800293, "global_step": 168717, "epoch": 4017} {"train_loss": -7.067580223083496, "global_step": 168718, "epoch": 4017} {"train_loss": -6.932548999786377, "global_step": 168719, "epoch": 4017} {"train_loss": -7.042021751403809, "global_step": 168720, "epoch": 4017} {"train_loss": -6.945898532867432, "global_step": 168721, "epoch": 4017} {"train_loss": -6.904872894287109, "global_step": 168722, "epoch": 4017} {"train_loss": -7.101254940032959, "global_step": 168723, "epoch": 4017} {"train_loss": -7.023838996887207, "global_step": 168724, "epoch": 4017} {"train_loss": -7.013774394989014, "global_step": 168725, "epoch": 4017} {"train_loss": -7.08894157409668, "global_step": 168726, "epoch": 4017} {"train_loss": -7.07081413269043, "global_step": 168727, "epoch": 4017} {"train_loss": -7.046135902404785, "global_step": 168728, "epoch": 4017} {"train_loss": -7.018739223480225, "global_step": 168729, "epoch": 4017} {"train_loss": -7.0324177742004395, "global_step": 168730, "epoch": 4017} {"train_loss": -7.046819686889648, "global_step": 168731, "epoch": 4017} {"train_loss": -6.922381401062012, "global_step": 168732, "epoch": 4017} {"train_loss": -7.069646835327148, "global_step": 168733, "epoch": 4017} {"train_loss": -6.974186897277832, "global_step": 168734, "epoch": 4017} {"train_loss": -7.056562423706055, "global_step": 168735, "epoch": 4017} {"train_loss": -6.9993181228637695, "global_step": 168736, "epoch": 4017} {"train_loss": -6.980976104736328, "global_step": 168737, "epoch": 4017} {"train_loss": -6.9649786949157715, "global_step": 168738, "epoch": 4017} {"train_loss": -6.986166477203369, "global_step": 168739, "epoch": 4017} {"train_loss": -7.014281272888184, "global_step": 168740, "epoch": 4017} {"train_loss": -7.0068769454956055, "global_step": 168741, "epoch": 4017} {"train_loss": -7.1171746253967285, "global_step": 168742, "epoch": 4017} {"train_loss": -7.091773509979248, "global_step": 168743, "epoch": 4017} {"train_loss": -6.9460859298706055, "global_step": 168744, "epoch": 4017} {"train_loss": -7.018864154815674, "global_step": 168745, "epoch": 4017} {"train_loss": -6.895147323608398, "global_step": 168746, "epoch": 4017} {"train_loss": -7.057470321655273, "global_step": 168747, "epoch": 4017} {"train_loss": -6.970643997192383, "global_step": 168748, "epoch": 4017} {"train_loss": -7.012640476226807, "global_step": 168749, "epoch": 4017} {"train_loss": -6.994952201843262, "global_step": 168750, "epoch": 4017} {"train_loss": -6.977077007293701, "global_step": 168751, "epoch": 4017} {"train_loss": -6.9375715255737305, "global_step": 168752, "epoch": 4017} {"train_loss": -7.051479339599609, "global_step": 168753, "epoch": 4017} {"train_loss": -6.938650131225586, "global_step": 168754, "epoch": 4017} {"train_loss": -7.000017688387916, "global_step": 168755, "epoch": 4017, "val_loss": 68559.7578125} {"train_loss": -7.0733747482299805, "global_step": 168756, "epoch": 4018} {"train_loss": -6.935864448547363, "global_step": 168757, "epoch": 4018} {"train_loss": -6.89337158203125, "global_step": 168758, "epoch": 4018} {"train_loss": -7.007137298583984, "global_step": 168759, "epoch": 4018} {"train_loss": -6.982269763946533, "global_step": 168760, "epoch": 4018} {"train_loss": -7.09999418258667, "global_step": 168761, "epoch": 4018} {"train_loss": -7.003314971923828, "global_step": 168762, "epoch": 4018} {"train_loss": -6.989381790161133, "global_step": 168763, "epoch": 4018} {"train_loss": -7.02045202255249, "global_step": 168764, "epoch": 4018} {"train_loss": -6.946606636047363, "global_step": 168765, "epoch": 4018} {"train_loss": -6.852887153625488, "global_step": 168766, "epoch": 4018} {"train_loss": -7.036725997924805, "global_step": 168767, "epoch": 4018} {"train_loss": -7.146459579467773, "global_step": 168768, "epoch": 4018} {"train_loss": -7.065147876739502, "global_step": 168769, "epoch": 4018} {"train_loss": -7.061628341674805, "global_step": 168770, "epoch": 4018} {"train_loss": -6.959890842437744, "global_step": 168771, "epoch": 4018} {"train_loss": -7.0672383308410645, "global_step": 168772, "epoch": 4018} {"train_loss": -7.162099838256836, "global_step": 168773, "epoch": 4018} {"train_loss": -7.065302848815918, "global_step": 168774, "epoch": 4018} {"train_loss": -7.057033538818359, "global_step": 168775, "epoch": 4018} {"train_loss": -7.010564804077148, "global_step": 168776, "epoch": 4018} {"train_loss": -7.028964996337891, "global_step": 168777, "epoch": 4018} {"train_loss": -7.068650245666504, "global_step": 168778, "epoch": 4018} {"train_loss": -7.010116100311279, "global_step": 168779, "epoch": 4018} {"train_loss": -6.9871721267700195, "global_step": 168780, "epoch": 4018} {"train_loss": -7.117602348327637, "global_step": 168781, "epoch": 4018} {"train_loss": -7.080766677856445, "global_step": 168782, "epoch": 4018} {"train_loss": -7.125256061553955, "global_step": 168783, "epoch": 4018} {"train_loss": -7.097034454345703, "global_step": 168784, "epoch": 4018} {"train_loss": -6.960898399353027, "global_step": 168785, "epoch": 4018} {"train_loss": -6.864622116088867, "global_step": 168786, "epoch": 4018} {"train_loss": -7.044108867645264, "global_step": 168787, "epoch": 4018} {"train_loss": -7.119308948516846, "global_step": 168788, "epoch": 4018} {"train_loss": -7.042834281921387, "global_step": 168789, "epoch": 4018} {"train_loss": -7.000972270965576, "global_step": 168790, "epoch": 4018} {"train_loss": -6.964773178100586, "global_step": 168791, "epoch": 4018} {"train_loss": -6.85683536529541, "global_step": 168792, "epoch": 4018} {"train_loss": -7.046079635620117, "global_step": 168793, "epoch": 4018} {"train_loss": -6.977267265319824, "global_step": 168794, "epoch": 4018} {"train_loss": -6.988517761230469, "global_step": 168795, "epoch": 4018} {"train_loss": -7.060787200927734, "global_step": 168796, "epoch": 4018} {"train_loss": -7.019877218064808, "global_step": 168797, "epoch": 4018, "val_loss": 68530.734375} {"train_loss": -7.125699996948242, "global_step": 168798, "epoch": 4019} {"train_loss": -6.972647666931152, "global_step": 168799, "epoch": 4019} {"train_loss": -7.011957168579102, "global_step": 168800, "epoch": 4019} {"train_loss": -6.9192705154418945, "global_step": 168801, "epoch": 4019} {"train_loss": -7.177827835083008, "global_step": 168802, "epoch": 4019} {"train_loss": -7.025657653808594, "global_step": 168803, "epoch": 4019} {"train_loss": -6.989974021911621, "global_step": 168804, "epoch": 4019} {"train_loss": -7.056903839111328, "global_step": 168805, "epoch": 4019} {"train_loss": -6.997504711151123, "global_step": 168806, "epoch": 4019} {"train_loss": -6.986227512359619, "global_step": 168807, "epoch": 4019} {"train_loss": -7.065805912017822, "global_step": 168808, "epoch": 4019} {"train_loss": -6.894261837005615, "global_step": 168809, "epoch": 4019} {"train_loss": -6.987089157104492, "global_step": 168810, "epoch": 4019} {"train_loss": -6.965663909912109, "global_step": 168811, "epoch": 4019} {"train_loss": -6.931391716003418, "global_step": 168812, "epoch": 4019} {"train_loss": -6.867206573486328, "global_step": 168813, "epoch": 4019} {"train_loss": -7.081476211547852, "global_step": 168814, "epoch": 4019} {"train_loss": -6.971194744110107, "global_step": 168815, "epoch": 4019} {"train_loss": -6.977097988128662, "global_step": 168816, "epoch": 4019} {"train_loss": -7.058162689208984, "global_step": 168817, "epoch": 4019} {"train_loss": -6.973137855529785, "global_step": 168818, "epoch": 4019} {"train_loss": -6.896130561828613, "global_step": 168819, "epoch": 4019} {"train_loss": -7.006909370422363, "global_step": 168820, "epoch": 4019} {"train_loss": -6.984144687652588, "global_step": 168821, "epoch": 4019} {"train_loss": -6.972807884216309, "global_step": 168822, "epoch": 4019} {"train_loss": -6.937922954559326, "global_step": 168823, "epoch": 4019} {"train_loss": -6.920723915100098, "global_step": 168824, "epoch": 4019} {"train_loss": -6.977775573730469, "global_step": 168825, "epoch": 4019} {"train_loss": -7.005958557128906, "global_step": 168826, "epoch": 4019} {"train_loss": -6.991894245147705, "global_step": 168827, "epoch": 4019} {"train_loss": -6.938150405883789, "global_step": 168828, "epoch": 4019} {"train_loss": -6.994655609130859, "global_step": 168829, "epoch": 4019} {"train_loss": -6.856113433837891, "global_step": 168830, "epoch": 4019} {"train_loss": -6.982977867126465, "global_step": 168831, "epoch": 4019} {"train_loss": -6.978664875030518, "global_step": 168832, "epoch": 4019} {"train_loss": -6.878159999847412, "global_step": 168833, "epoch": 4019} {"train_loss": -6.946196556091309, "global_step": 168834, "epoch": 4019} {"train_loss": -7.017652988433838, "global_step": 168835, "epoch": 4019} {"train_loss": -6.92835807800293, "global_step": 168836, "epoch": 4019} {"train_loss": -6.874916076660156, "global_step": 168837, "epoch": 4019} {"train_loss": -6.990043640136719, "global_step": 168838, "epoch": 4019} {"train_loss": -6.979474578584943, "global_step": 168839, "epoch": 4019, "val_loss": 68745.515625} {"train_loss": -6.936218738555908, "global_step": 168840, "epoch": 4020} {"train_loss": -6.952803611755371, "global_step": 168841, "epoch": 4020} {"train_loss": -6.962541580200195, "global_step": 168842, "epoch": 4020} {"train_loss": -7.013958930969238, "global_step": 168843, "epoch": 4020} {"train_loss": -7.013121128082275, "global_step": 168844, "epoch": 4020} {"train_loss": -6.999001502990723, "global_step": 168845, "epoch": 4020} {"train_loss": -6.898699760437012, "global_step": 168846, "epoch": 4020} {"train_loss": -7.009727478027344, "global_step": 168847, "epoch": 4020} {"train_loss": -6.9681243896484375, "global_step": 168848, "epoch": 4020} {"train_loss": -7.008327960968018, "global_step": 168849, "epoch": 4020} {"train_loss": -7.0564470291137695, "global_step": 168850, "epoch": 4020} {"train_loss": -6.969690322875977, "global_step": 168851, "epoch": 4020} {"train_loss": -6.9124321937561035, "global_step": 168852, "epoch": 4020} {"train_loss": -6.933753967285156, "global_step": 168853, "epoch": 4020} {"train_loss": -7.071479797363281, "global_step": 168854, "epoch": 4020} {"train_loss": -6.876988887786865, "global_step": 168855, "epoch": 4020} {"train_loss": -7.1001129150390625, "global_step": 168856, "epoch": 4020} {"train_loss": -6.972324371337891, "global_step": 168857, "epoch": 4020} {"train_loss": -6.982037544250488, "global_step": 168858, "epoch": 4020} {"train_loss": -7.019351005554199, "global_step": 168859, "epoch": 4020} {"train_loss": -6.851728439331055, "global_step": 168860, "epoch": 4020} {"train_loss": -6.979592323303223, "global_step": 168861, "epoch": 4020} {"train_loss": -6.994953155517578, "global_step": 168862, "epoch": 4020} {"train_loss": -7.016273498535156, "global_step": 168863, "epoch": 4020} {"train_loss": -6.722468376159668, "global_step": 168864, "epoch": 4020} {"train_loss": -6.923984527587891, "global_step": 168865, "epoch": 4020} {"train_loss": -6.935329914093018, "global_step": 168866, "epoch": 4020} {"train_loss": -6.814151763916016, "global_step": 168867, "epoch": 4020} {"train_loss": -6.791595458984375, "global_step": 168868, "epoch": 4020} {"train_loss": -6.724347114562988, "global_step": 168869, "epoch": 4020} {"train_loss": -6.768332004547119, "global_step": 168870, "epoch": 4020} {"train_loss": -6.757749557495117, "global_step": 168871, "epoch": 4020} {"train_loss": -6.765125751495361, "global_step": 168872, "epoch": 4020} {"train_loss": -6.842735290527344, "global_step": 168873, "epoch": 4020} {"train_loss": -6.701552391052246, "global_step": 168874, "epoch": 4020} {"train_loss": -6.810819625854492, "global_step": 168875, "epoch": 4020} {"train_loss": -6.781924247741699, "global_step": 168876, "epoch": 4020} {"train_loss": -6.905814170837402, "global_step": 168877, "epoch": 4020} {"train_loss": -6.747928619384766, "global_step": 168878, "epoch": 4020} {"train_loss": -6.676714897155762, "global_step": 168879, "epoch": 4020} {"train_loss": -6.8527655601501465, "global_step": 168880, "epoch": 4020} {"train_loss": -6.9067832969483876, "global_step": 168881, "epoch": 4020, "val_loss": 68623.890625} {"train_loss": -6.964077949523926, "global_step": 168882, "epoch": 4021} {"train_loss": -6.783071041107178, "global_step": 168883, "epoch": 4021} {"train_loss": -6.766594886779785, "global_step": 168884, "epoch": 4021} {"train_loss": -6.947190284729004, "global_step": 168885, "epoch": 4021} {"train_loss": -6.828987121582031, "global_step": 168886, "epoch": 4021} {"train_loss": -6.992203712463379, "global_step": 168887, "epoch": 4021} {"train_loss": -6.938596725463867, "global_step": 168888, "epoch": 4021} {"train_loss": -7.032017707824707, "global_step": 168889, "epoch": 4021} {"train_loss": -6.987905025482178, "global_step": 168890, "epoch": 4021} {"train_loss": -6.962578773498535, "global_step": 168891, "epoch": 4021} {"train_loss": -6.898407936096191, "global_step": 168892, "epoch": 4021} {"train_loss": -6.967704772949219, "global_step": 168893, "epoch": 4021} {"train_loss": -7.030688285827637, "global_step": 168894, "epoch": 4021} {"train_loss": -6.912511825561523, "global_step": 168895, "epoch": 4021} {"train_loss": -6.890203475952148, "global_step": 168896, "epoch": 4021} {"train_loss": -6.92039680480957, "global_step": 168897, "epoch": 4021} {"train_loss": -6.928752422332764, "global_step": 168898, "epoch": 4021} {"train_loss": -6.9692511558532715, "global_step": 168899, "epoch": 4021} {"train_loss": -6.850897789001465, "global_step": 168900, "epoch": 4021} {"train_loss": -7.008749485015869, "global_step": 168901, "epoch": 4021} {"train_loss": -7.038083076477051, "global_step": 168902, "epoch": 4021} {"train_loss": -7.0038604736328125, "global_step": 168903, "epoch": 4021} {"train_loss": -7.0419464111328125, "global_step": 168904, "epoch": 4021} {"train_loss": -6.8907904624938965, "global_step": 168905, "epoch": 4021} {"train_loss": -6.949245452880859, "global_step": 168906, "epoch": 4021} {"train_loss": -7.100976943969727, "global_step": 168907, "epoch": 4021} {"train_loss": -7.073325157165527, "global_step": 168908, "epoch": 4021} {"train_loss": -7.092268943786621, "global_step": 168909, "epoch": 4021} {"train_loss": -6.987884998321533, "global_step": 168910, "epoch": 4021} {"train_loss": -6.9653143882751465, "global_step": 168911, "epoch": 4021} {"train_loss": -7.128704071044922, "global_step": 168912, "epoch": 4021} {"train_loss": -6.924496650695801, "global_step": 168913, "epoch": 4021} {"train_loss": -7.075118541717529, "global_step": 168914, "epoch": 4021} {"train_loss": -6.964646816253662, "global_step": 168915, "epoch": 4021} {"train_loss": -6.880059242248535, "global_step": 168916, "epoch": 4021} {"train_loss": -6.912707328796387, "global_step": 168917, "epoch": 4021} {"train_loss": -6.877068519592285, "global_step": 168918, "epoch": 4021} {"train_loss": -6.959114074707031, "global_step": 168919, "epoch": 4021} {"train_loss": -6.959134101867676, "global_step": 168920, "epoch": 4021} {"train_loss": -7.0474162101745605, "global_step": 168921, "epoch": 4021} {"train_loss": -7.054821968078613, "global_step": 168922, "epoch": 4021} {"train_loss": -6.964727912630353, "global_step": 168923, "epoch": 4021, "val_loss": 68557.9140625} {"train_loss": -7.024009704589844, "global_step": 168924, "epoch": 4022} {"train_loss": -7.051089286804199, "global_step": 168925, "epoch": 4022} {"train_loss": -6.910318374633789, "global_step": 168926, "epoch": 4022} {"train_loss": -7.03879976272583, "global_step": 168927, "epoch": 4022} {"train_loss": -6.945043087005615, "global_step": 168928, "epoch": 4022} {"train_loss": -7.017414093017578, "global_step": 168929, "epoch": 4022} {"train_loss": -6.798852443695068, "global_step": 168930, "epoch": 4022} {"train_loss": -6.86240291595459, "global_step": 168931, "epoch": 4022} {"train_loss": -7.015131950378418, "global_step": 168932, "epoch": 4022} {"train_loss": -6.8945207595825195, "global_step": 168933, "epoch": 4022} {"train_loss": -6.891217231750488, "global_step": 168934, "epoch": 4022} {"train_loss": -6.956042289733887, "global_step": 168935, "epoch": 4022} {"train_loss": -6.983275890350342, "global_step": 168936, "epoch": 4022} {"train_loss": -7.048150062561035, "global_step": 168937, "epoch": 4022} {"train_loss": -7.023116588592529, "global_step": 168938, "epoch": 4022} {"train_loss": -6.953907489776611, "global_step": 168939, "epoch": 4022} {"train_loss": -6.94391393661499, "global_step": 168940, "epoch": 4022} {"train_loss": -6.954751014709473, "global_step": 168941, "epoch": 4022} {"train_loss": -6.892760276794434, "global_step": 168942, "epoch": 4022} {"train_loss": -6.920048236846924, "global_step": 168943, "epoch": 4022} {"train_loss": -7.035869598388672, "global_step": 168944, "epoch": 4022} {"train_loss": -7.013132095336914, "global_step": 168945, "epoch": 4022} {"train_loss": -7.002939224243164, "global_step": 168946, "epoch": 4022} {"train_loss": -7.008583068847656, "global_step": 168947, "epoch": 4022} {"train_loss": -7.082423210144043, "global_step": 168948, "epoch": 4022} {"train_loss": -6.970109939575195, "global_step": 168949, "epoch": 4022} {"train_loss": -7.0022478103637695, "global_step": 168950, "epoch": 4022} {"train_loss": -7.005851745605469, "global_step": 168951, "epoch": 4022} {"train_loss": -6.975719451904297, "global_step": 168952, "epoch": 4022} {"train_loss": -6.9354376792907715, "global_step": 168953, "epoch": 4022} {"train_loss": -7.043155670166016, "global_step": 168954, "epoch": 4022} {"train_loss": -7.019103050231934, "global_step": 168955, "epoch": 4022} {"train_loss": -6.948392868041992, "global_step": 168956, "epoch": 4022} {"train_loss": -6.974225997924805, "global_step": 168957, "epoch": 4022} {"train_loss": -7.023426532745361, "global_step": 168958, "epoch": 4022} {"train_loss": -7.063511848449707, "global_step": 168959, "epoch": 4022} {"train_loss": -6.979407787322998, "global_step": 168960, "epoch": 4022} {"train_loss": -7.048424243927002, "global_step": 168961, "epoch": 4022} {"train_loss": -7.000828266143799, "global_step": 168962, "epoch": 4022} {"train_loss": -6.974223613739014, "global_step": 168963, "epoch": 4022} {"train_loss": -7.030370712280273, "global_step": 168964, "epoch": 4022} {"train_loss": -6.982232956659226, "global_step": 168965, "epoch": 4022, "val_loss": 68763.9375} {"train_loss": -6.997481346130371, "global_step": 168966, "epoch": 4023} {"train_loss": -6.943422317504883, "global_step": 168967, "epoch": 4023} {"train_loss": -7.04327392578125, "global_step": 168968, "epoch": 4023} {"train_loss": -6.944495677947998, "global_step": 168969, "epoch": 4023} {"train_loss": -7.019512176513672, "global_step": 168970, "epoch": 4023} {"train_loss": -7.094324111938477, "global_step": 168971, "epoch": 4023} {"train_loss": -7.01705265045166, "global_step": 168972, "epoch": 4023} {"train_loss": -7.083907127380371, "global_step": 168973, "epoch": 4023} {"train_loss": -7.013172149658203, "global_step": 168974, "epoch": 4023} {"train_loss": -6.967331409454346, "global_step": 168975, "epoch": 4023} {"train_loss": -6.978885173797607, "global_step": 168976, "epoch": 4023} {"train_loss": -6.984151840209961, "global_step": 168977, "epoch": 4023} {"train_loss": -7.0204267501831055, "global_step": 168978, "epoch": 4023} {"train_loss": -7.017305850982666, "global_step": 168979, "epoch": 4023} {"train_loss": -6.96893310546875, "global_step": 168980, "epoch": 4023} {"train_loss": -6.825717926025391, "global_step": 168981, "epoch": 4023} {"train_loss": -7.01949405670166, "global_step": 168982, "epoch": 4023} {"train_loss": -6.881960868835449, "global_step": 168983, "epoch": 4023} {"train_loss": -6.829112529754639, "global_step": 168984, "epoch": 4023} {"train_loss": -6.845880031585693, "global_step": 168985, "epoch": 4023} {"train_loss": -6.913191318511963, "global_step": 168986, "epoch": 4023} {"train_loss": -7.004796028137207, "global_step": 168987, "epoch": 4023} {"train_loss": -6.764225482940674, "global_step": 168988, "epoch": 4023} {"train_loss": -6.910309791564941, "global_step": 168989, "epoch": 4023} {"train_loss": -7.04677677154541, "global_step": 168990, "epoch": 4023} {"train_loss": -6.933784484863281, "global_step": 168991, "epoch": 4023} {"train_loss": -7.016922950744629, "global_step": 168992, "epoch": 4023} {"train_loss": -6.9419331550598145, "global_step": 168993, "epoch": 4023} {"train_loss": -7.005399227142334, "global_step": 168994, "epoch": 4023} {"train_loss": -6.840631484985352, "global_step": 168995, "epoch": 4023} {"train_loss": -6.961508274078369, "global_step": 168996, "epoch": 4023} {"train_loss": -6.898299217224121, "global_step": 168997, "epoch": 4023} {"train_loss": -6.893552780151367, "global_step": 168998, "epoch": 4023} {"train_loss": -6.9581403732299805, "global_step": 168999, "epoch": 4023} {"train_loss": -7.0524444580078125, "global_step": 169000, "epoch": 4023} {"train_loss": -7.0106425285339355, "global_step": 169001, "epoch": 4023} {"train_loss": -7.115204811096191, "global_step": 169002, "epoch": 4023} {"train_loss": -6.96641731262207, "global_step": 169003, "epoch": 4023} {"train_loss": -7.022159576416016, "global_step": 169004, "epoch": 4023} {"train_loss": -6.952765464782715, "global_step": 169005, "epoch": 4023} {"train_loss": -7.044344425201416, "global_step": 169006, "epoch": 4023} {"train_loss": -6.967875707717169, "global_step": 169007, "epoch": 4023, "val_loss": 68745.125} {"train_loss": -6.9384660720825195, "global_step": 169008, "epoch": 4024} {"train_loss": -6.999441146850586, "global_step": 169009, "epoch": 4024} {"train_loss": -6.858912467956543, "global_step": 169010, "epoch": 4024} {"train_loss": -6.937437057495117, "global_step": 169011, "epoch": 4024} {"train_loss": -6.962120056152344, "global_step": 169012, "epoch": 4024} {"train_loss": -6.838894844055176, "global_step": 169013, "epoch": 4024} {"train_loss": -6.911892890930176, "global_step": 169014, "epoch": 4024} {"train_loss": -6.765323162078857, "global_step": 169015, "epoch": 4024} {"train_loss": -6.819462776184082, "global_step": 169016, "epoch": 4024} {"train_loss": -6.894015312194824, "global_step": 169017, "epoch": 4024} {"train_loss": -6.90648889541626, "global_step": 169018, "epoch": 4024} {"train_loss": -7.041769504547119, "global_step": 169019, "epoch": 4024} {"train_loss": -6.913032531738281, "global_step": 169020, "epoch": 4024} {"train_loss": -6.948262691497803, "global_step": 169021, "epoch": 4024} {"train_loss": -7.008638381958008, "global_step": 169022, "epoch": 4024} {"train_loss": -6.878424167633057, "global_step": 169023, "epoch": 4024} {"train_loss": -7.003012657165527, "global_step": 169024, "epoch": 4024} {"train_loss": -6.907323837280273, "global_step": 169025, "epoch": 4024} {"train_loss": -6.902009963989258, "global_step": 169026, "epoch": 4024} {"train_loss": -6.960426330566406, "global_step": 169027, "epoch": 4024} {"train_loss": -6.986928939819336, "global_step": 169028, "epoch": 4024} {"train_loss": -7.018623352050781, "global_step": 169029, "epoch": 4024} {"train_loss": -6.848048210144043, "global_step": 169030, "epoch": 4024} {"train_loss": -6.954315662384033, "global_step": 169031, "epoch": 4024} {"train_loss": -6.988547325134277, "global_step": 169032, "epoch": 4024} {"train_loss": -6.956564903259277, "global_step": 169033, "epoch": 4024} {"train_loss": -7.097102642059326, "global_step": 169034, "epoch": 4024} {"train_loss": -6.993472576141357, "global_step": 169035, "epoch": 4024} {"train_loss": -6.788133144378662, "global_step": 169036, "epoch": 4024} {"train_loss": -6.896568775177002, "global_step": 169037, "epoch": 4024} {"train_loss": -6.923901557922363, "global_step": 169038, "epoch": 4024} {"train_loss": -6.808876991271973, "global_step": 169039, "epoch": 4024} {"train_loss": -6.973045349121094, "global_step": 169040, "epoch": 4024} {"train_loss": -7.005243301391602, "global_step": 169041, "epoch": 4024} {"train_loss": -6.850279808044434, "global_step": 169042, "epoch": 4024} {"train_loss": -6.946911811828613, "global_step": 169043, "epoch": 4024} {"train_loss": -6.925438404083252, "global_step": 169044, "epoch": 4024} {"train_loss": -6.909343719482422, "global_step": 169045, "epoch": 4024} {"train_loss": -6.947423458099365, "global_step": 169046, "epoch": 4024} {"train_loss": -6.842267036437988, "global_step": 169047, "epoch": 4024} {"train_loss": -6.850184440612793, "global_step": 169048, "epoch": 4024} {"train_loss": -6.925968488057454, "global_step": 169049, "epoch": 4024, "val_loss": 68848.375} {"train_loss": -6.986121654510498, "global_step": 169050, "epoch": 4025} {"train_loss": -6.909954071044922, "global_step": 169051, "epoch": 4025} {"train_loss": -6.966912269592285, "global_step": 169052, "epoch": 4025} {"train_loss": -6.930468559265137, "global_step": 169053, "epoch": 4025} {"train_loss": -6.9668803215026855, "global_step": 169054, "epoch": 4025} {"train_loss": -6.993630409240723, "global_step": 169055, "epoch": 4025} {"train_loss": -6.982624053955078, "global_step": 169056, "epoch": 4025} {"train_loss": -6.829542636871338, "global_step": 169057, "epoch": 4025} {"train_loss": -6.9044904708862305, "global_step": 169058, "epoch": 4025} {"train_loss": -6.907555103302002, "global_step": 169059, "epoch": 4025} {"train_loss": -7.053133964538574, "global_step": 169060, "epoch": 4025} {"train_loss": -6.902796745300293, "global_step": 169061, "epoch": 4025} {"train_loss": -6.8272480964660645, "global_step": 169062, "epoch": 4025} {"train_loss": -6.9089202880859375, "global_step": 169063, "epoch": 4025} {"train_loss": -6.696835517883301, "global_step": 169064, "epoch": 4025} {"train_loss": -6.932353973388672, "global_step": 169065, "epoch": 4025} {"train_loss": -6.72450590133667, "global_step": 169066, "epoch": 4025} {"train_loss": -6.981152057647705, "global_step": 169067, "epoch": 4025} {"train_loss": -6.884101867675781, "global_step": 169068, "epoch": 4025} {"train_loss": -6.732035160064697, "global_step": 169069, "epoch": 4025} {"train_loss": -6.97364616394043, "global_step": 169070, "epoch": 4025} {"train_loss": -6.708221435546875, "global_step": 169071, "epoch": 4025} {"train_loss": -6.930968284606934, "global_step": 169072, "epoch": 4025} {"train_loss": -6.790049076080322, "global_step": 169073, "epoch": 4025} {"train_loss": -6.830690860748291, "global_step": 169074, "epoch": 4025} {"train_loss": -6.699524879455566, "global_step": 169075, "epoch": 4025} {"train_loss": -6.849748611450195, "global_step": 169076, "epoch": 4025} {"train_loss": -6.739973545074463, "global_step": 169077, "epoch": 4025} {"train_loss": -6.943874835968018, "global_step": 169078, "epoch": 4025} {"train_loss": -6.944575309753418, "global_step": 169079, "epoch": 4025} {"train_loss": -6.8334550857543945, "global_step": 169080, "epoch": 4025} {"train_loss": -6.869663238525391, "global_step": 169081, "epoch": 4025} {"train_loss": -6.945256233215332, "global_step": 169082, "epoch": 4025} {"train_loss": -6.7536163330078125, "global_step": 169083, "epoch": 4025} {"train_loss": -6.87950325012207, "global_step": 169084, "epoch": 4025} {"train_loss": -7.019908905029297, "global_step": 169085, "epoch": 4025} {"train_loss": -6.716244697570801, "global_step": 169086, "epoch": 4025} {"train_loss": -6.838765621185303, "global_step": 169087, "epoch": 4025} {"train_loss": -6.919953346252441, "global_step": 169088, "epoch": 4025} {"train_loss": -6.8756890296936035, "global_step": 169089, "epoch": 4025} {"train_loss": -7.039182662963867, "global_step": 169090, "epoch": 4025} {"train_loss": -6.879722935812814, "global_step": 169091, "epoch": 4025, "val_loss": 68612.2265625} {"train_loss": -6.803554534912109, "global_step": 169092, "epoch": 4026} {"train_loss": -6.994045257568359, "global_step": 169093, "epoch": 4026} {"train_loss": -6.98612117767334, "global_step": 169094, "epoch": 4026} {"train_loss": -6.878502368927002, "global_step": 169095, "epoch": 4026} {"train_loss": -7.076932907104492, "global_step": 169096, "epoch": 4026} {"train_loss": -7.0295515060424805, "global_step": 169097, "epoch": 4026} {"train_loss": -7.009528636932373, "global_step": 169098, "epoch": 4026} {"train_loss": -6.856027126312256, "global_step": 169099, "epoch": 4026} {"train_loss": -6.942884922027588, "global_step": 169100, "epoch": 4026} {"train_loss": -6.997584342956543, "global_step": 169101, "epoch": 4026} {"train_loss": -6.966570854187012, "global_step": 169102, "epoch": 4026} {"train_loss": -6.950850486755371, "global_step": 169103, "epoch": 4026} {"train_loss": -7.033092021942139, "global_step": 169104, "epoch": 4026} {"train_loss": -7.06446647644043, "global_step": 169105, "epoch": 4026} {"train_loss": -6.9789509773254395, "global_step": 169106, "epoch": 4026} {"train_loss": -7.044674873352051, "global_step": 169107, "epoch": 4026} {"train_loss": -7.009798049926758, "global_step": 169108, "epoch": 4026} {"train_loss": -7.048851013183594, "global_step": 169109, "epoch": 4026} {"train_loss": -6.916423797607422, "global_step": 169110, "epoch": 4026} {"train_loss": -6.89382791519165, "global_step": 169111, "epoch": 4026} {"train_loss": -6.973453998565674, "global_step": 169112, "epoch": 4026} {"train_loss": -6.960850715637207, "global_step": 169113, "epoch": 4026} {"train_loss": -6.970059394836426, "global_step": 169114, "epoch": 4026} {"train_loss": -7.119780540466309, "global_step": 169115, "epoch": 4026} {"train_loss": -6.8778605461120605, "global_step": 169116, "epoch": 4026} {"train_loss": -6.930424690246582, "global_step": 169117, "epoch": 4026} {"train_loss": -6.938392639160156, "global_step": 169118, "epoch": 4026} {"train_loss": -6.977104663848877, "global_step": 169119, "epoch": 4026} {"train_loss": -7.005379676818848, "global_step": 169120, "epoch": 4026} {"train_loss": -7.027155876159668, "global_step": 169121, "epoch": 4026} {"train_loss": -6.923450469970703, "global_step": 169122, "epoch": 4026} {"train_loss": -6.994616985321045, "global_step": 169123, "epoch": 4026} {"train_loss": -7.079079627990723, "global_step": 169124, "epoch": 4026} {"train_loss": -6.910071849822998, "global_step": 169125, "epoch": 4026} {"train_loss": -6.960420608520508, "global_step": 169126, "epoch": 4026} {"train_loss": -7.057906150817871, "global_step": 169127, "epoch": 4026} {"train_loss": -6.954442024230957, "global_step": 169128, "epoch": 4026} {"train_loss": -7.051837921142578, "global_step": 169129, "epoch": 4026} {"train_loss": -6.966920375823975, "global_step": 169130, "epoch": 4026} {"train_loss": -7.071051120758057, "global_step": 169131, "epoch": 4026} {"train_loss": -6.864629745483398, "global_step": 169132, "epoch": 4026} {"train_loss": -6.974505912689936, "global_step": 169133, "epoch": 4026, "val_loss": 68657.71875} {"train_loss": -6.899030685424805, "global_step": 169134, "epoch": 4027} {"train_loss": -7.0058722496032715, "global_step": 169135, "epoch": 4027} {"train_loss": -6.967878341674805, "global_step": 169136, "epoch": 4027} {"train_loss": -6.920199394226074, "global_step": 169137, "epoch": 4027} {"train_loss": -6.8821916580200195, "global_step": 169138, "epoch": 4027} {"train_loss": -6.952485084533691, "global_step": 169139, "epoch": 4027} {"train_loss": -7.04022741317749, "global_step": 169140, "epoch": 4027} {"train_loss": -6.975632667541504, "global_step": 169141, "epoch": 4027} {"train_loss": -6.935763359069824, "global_step": 169142, "epoch": 4027} {"train_loss": -6.94034481048584, "global_step": 169143, "epoch": 4027} {"train_loss": -6.932591438293457, "global_step": 169144, "epoch": 4027} {"train_loss": -7.042425155639648, "global_step": 169145, "epoch": 4027} {"train_loss": -6.907423973083496, "global_step": 169146, "epoch": 4027} {"train_loss": -7.048494338989258, "global_step": 169147, "epoch": 4027} {"train_loss": -6.964786529541016, "global_step": 169148, "epoch": 4027} {"train_loss": -7.055013179779053, "global_step": 169149, "epoch": 4027} {"train_loss": -7.006573677062988, "global_step": 169150, "epoch": 4027} {"train_loss": -6.966769695281982, "global_step": 169151, "epoch": 4027} {"train_loss": -7.001328468322754, "global_step": 169152, "epoch": 4027} {"train_loss": -6.98890495300293, "global_step": 169153, "epoch": 4027} {"train_loss": -7.036001682281494, "global_step": 169154, "epoch": 4027} {"train_loss": -6.971940994262695, "global_step": 169155, "epoch": 4027} {"train_loss": -7.054502487182617, "global_step": 169156, "epoch": 4027} {"train_loss": -7.04415225982666, "global_step": 169157, "epoch": 4027} {"train_loss": -7.0319366455078125, "global_step": 169158, "epoch": 4027} {"train_loss": -7.049117088317871, "global_step": 169159, "epoch": 4027} {"train_loss": -7.023492336273193, "global_step": 169160, "epoch": 4027} {"train_loss": -6.973912715911865, "global_step": 169161, "epoch": 4027} {"train_loss": -7.026434898376465, "global_step": 169162, "epoch": 4027} {"train_loss": -7.007870674133301, "global_step": 169163, "epoch": 4027} {"train_loss": -6.952001094818115, "global_step": 169164, "epoch": 4027} {"train_loss": -6.975991249084473, "global_step": 169165, "epoch": 4027} {"train_loss": -6.943814277648926, "global_step": 169166, "epoch": 4027} {"train_loss": -7.005561828613281, "global_step": 169167, "epoch": 4027} {"train_loss": -6.984124660491943, "global_step": 169168, "epoch": 4027} {"train_loss": -6.956246852874756, "global_step": 169169, "epoch": 4027} {"train_loss": -7.106161117553711, "global_step": 169170, "epoch": 4027} {"train_loss": -7.0706257820129395, "global_step": 169171, "epoch": 4027} {"train_loss": -6.889490604400635, "global_step": 169172, "epoch": 4027} {"train_loss": -7.029781341552734, "global_step": 169173, "epoch": 4027} {"train_loss": -7.0791497230529785, "global_step": 169174, "epoch": 4027} {"train_loss": -6.994340431122553, "global_step": 169175, "epoch": 4027, "val_loss": 68342.1953125} {"train_loss": -6.966734886169434, "global_step": 169176, "epoch": 4028} {"train_loss": -6.943617820739746, "global_step": 169177, "epoch": 4028} {"train_loss": -6.945785045623779, "global_step": 169178, "epoch": 4028} {"train_loss": -7.0350141525268555, "global_step": 169179, "epoch": 4028} {"train_loss": -7.111781120300293, "global_step": 169180, "epoch": 4028} {"train_loss": -7.0071001052856445, "global_step": 169181, "epoch": 4028} {"train_loss": -6.942722320556641, "global_step": 169182, "epoch": 4028} {"train_loss": -7.0324578285217285, "global_step": 169183, "epoch": 4028} {"train_loss": -7.03983211517334, "global_step": 169184, "epoch": 4028} {"train_loss": -7.135845184326172, "global_step": 169185, "epoch": 4028} {"train_loss": -7.116119861602783, "global_step": 169186, "epoch": 4028} {"train_loss": -7.079215049743652, "global_step": 169187, "epoch": 4028} {"train_loss": -6.953332424163818, "global_step": 169188, "epoch": 4028} {"train_loss": -6.953908920288086, "global_step": 169189, "epoch": 4028} {"train_loss": -7.040263652801514, "global_step": 169190, "epoch": 4028} {"train_loss": -6.924879550933838, "global_step": 169191, "epoch": 4028} {"train_loss": -6.968639373779297, "global_step": 169192, "epoch": 4028} {"train_loss": -7.009461402893066, "global_step": 169193, "epoch": 4028} {"train_loss": -7.052909851074219, "global_step": 169194, "epoch": 4028} {"train_loss": -6.910353660583496, "global_step": 169195, "epoch": 4028} {"train_loss": -6.986432075500488, "global_step": 169196, "epoch": 4028} {"train_loss": -7.055630683898926, "global_step": 169197, "epoch": 4028} {"train_loss": -7.0609235763549805, "global_step": 169198, "epoch": 4028} {"train_loss": -6.849810600280762, "global_step": 169199, "epoch": 4028} {"train_loss": -7.069947719573975, "global_step": 169200, "epoch": 4028} {"train_loss": -7.052231788635254, "global_step": 169201, "epoch": 4028} {"train_loss": -7.135463237762451, "global_step": 169202, "epoch": 4028} {"train_loss": -7.066791534423828, "global_step": 169203, "epoch": 4028} {"train_loss": -7.027021408081055, "global_step": 169204, "epoch": 4028} {"train_loss": -7.041650772094727, "global_step": 169205, "epoch": 4028} {"train_loss": -6.9716033935546875, "global_step": 169206, "epoch": 4028} {"train_loss": -6.966353893280029, "global_step": 169207, "epoch": 4028} {"train_loss": -7.0138630867004395, "global_step": 169208, "epoch": 4028} {"train_loss": -6.9965949058532715, "global_step": 169209, "epoch": 4028} {"train_loss": -6.918398380279541, "global_step": 169210, "epoch": 4028} {"train_loss": -6.938121795654297, "global_step": 169211, "epoch": 4028} {"train_loss": -7.016543865203857, "global_step": 169212, "epoch": 4028} {"train_loss": -6.997641086578369, "global_step": 169213, "epoch": 4028} {"train_loss": -7.052918910980225, "global_step": 169214, "epoch": 4028} {"train_loss": -6.972661972045898, "global_step": 169215, "epoch": 4028} {"train_loss": -7.103330612182617, "global_step": 169216, "epoch": 4028} {"train_loss": -7.010189238048735, "global_step": 169217, "epoch": 4028, "val_loss": 68586.546875} {"train_loss": -6.947919845581055, "global_step": 169218, "epoch": 4029} {"train_loss": -6.851431846618652, "global_step": 169219, "epoch": 4029} {"train_loss": -7.046422958374023, "global_step": 169220, "epoch": 4029} {"train_loss": -6.938889503479004, "global_step": 169221, "epoch": 4029} {"train_loss": -6.971294403076172, "global_step": 169222, "epoch": 4029} {"train_loss": -6.981161117553711, "global_step": 169223, "epoch": 4029} {"train_loss": -6.899042129516602, "global_step": 169224, "epoch": 4029} {"train_loss": -6.992376804351807, "global_step": 169225, "epoch": 4029} {"train_loss": -7.059459686279297, "global_step": 169226, "epoch": 4029} {"train_loss": -6.845534324645996, "global_step": 169227, "epoch": 4029} {"train_loss": -6.946609973907471, "global_step": 169228, "epoch": 4029} {"train_loss": -6.946394920349121, "global_step": 169229, "epoch": 4029} {"train_loss": -6.833637237548828, "global_step": 169230, "epoch": 4029} {"train_loss": -7.048495292663574, "global_step": 169231, "epoch": 4029} {"train_loss": -6.959992408752441, "global_step": 169232, "epoch": 4029} {"train_loss": -7.096874713897705, "global_step": 169233, "epoch": 4029} {"train_loss": -6.852090835571289, "global_step": 169234, "epoch": 4029} {"train_loss": -6.927821159362793, "global_step": 169235, "epoch": 4029} {"train_loss": -6.946770668029785, "global_step": 169236, "epoch": 4029} {"train_loss": -6.8962788581848145, "global_step": 169237, "epoch": 4029} {"train_loss": -6.968381881713867, "global_step": 169238, "epoch": 4029} {"train_loss": -6.86746883392334, "global_step": 169239, "epoch": 4029} {"train_loss": -6.827897071838379, "global_step": 169240, "epoch": 4029} {"train_loss": -6.992490768432617, "global_step": 169241, "epoch": 4029} {"train_loss": -6.91400146484375, "global_step": 169242, "epoch": 4029} {"train_loss": -6.887789726257324, "global_step": 169243, "epoch": 4029} {"train_loss": -6.83857536315918, "global_step": 169244, "epoch": 4029} {"train_loss": -6.931920051574707, "global_step": 169245, "epoch": 4029} {"train_loss": -7.049862384796143, "global_step": 169246, "epoch": 4029} {"train_loss": -6.868695259094238, "global_step": 169247, "epoch": 4029} {"train_loss": -6.947284698486328, "global_step": 169248, "epoch": 4029} {"train_loss": -6.891676902770996, "global_step": 169249, "epoch": 4029} {"train_loss": -6.912421703338623, "global_step": 169250, "epoch": 4029} {"train_loss": -6.983301639556885, "global_step": 169251, "epoch": 4029} {"train_loss": -7.022096157073975, "global_step": 169252, "epoch": 4029} {"train_loss": -6.95084810256958, "global_step": 169253, "epoch": 4029} {"train_loss": -6.900429725646973, "global_step": 169254, "epoch": 4029} {"train_loss": -6.908897399902344, "global_step": 169255, "epoch": 4029} {"train_loss": -6.960823059082031, "global_step": 169256, "epoch": 4029} {"train_loss": -6.767610549926758, "global_step": 169257, "epoch": 4029} {"train_loss": -7.045919418334961, "global_step": 169258, "epoch": 4029} {"train_loss": -6.936154853729975, "global_step": 169259, "epoch": 4029, "val_loss": 68574.46875} {"train_loss": -6.903499603271484, "global_step": 169260, "epoch": 4030} {"train_loss": -6.854528427124023, "global_step": 169261, "epoch": 4030} {"train_loss": -6.84248685836792, "global_step": 169262, "epoch": 4030} {"train_loss": -6.968012809753418, "global_step": 169263, "epoch": 4030} {"train_loss": -6.965781211853027, "global_step": 169264, "epoch": 4030} {"train_loss": -6.913199424743652, "global_step": 169265, "epoch": 4030} {"train_loss": -6.940665245056152, "global_step": 169266, "epoch": 4030} {"train_loss": -6.97541618347168, "global_step": 169267, "epoch": 4030} {"train_loss": -6.953248977661133, "global_step": 169268, "epoch": 4030} {"train_loss": -6.962845802307129, "global_step": 169269, "epoch": 4030} {"train_loss": -6.910971641540527, "global_step": 169270, "epoch": 4030} {"train_loss": -6.943620681762695, "global_step": 169271, "epoch": 4030} {"train_loss": -6.784646987915039, "global_step": 169272, "epoch": 4030} {"train_loss": -6.987870693206787, "global_step": 169273, "epoch": 4030} {"train_loss": -6.819026947021484, "global_step": 169274, "epoch": 4030} {"train_loss": -6.9824934005737305, "global_step": 169275, "epoch": 4030} {"train_loss": -6.887516021728516, "global_step": 169276, "epoch": 4030} {"train_loss": -6.944382190704346, "global_step": 169277, "epoch": 4030} {"train_loss": -6.919000625610352, "global_step": 169278, "epoch": 4030} {"train_loss": -6.816956996917725, "global_step": 169279, "epoch": 4030} {"train_loss": -6.982049465179443, "global_step": 169280, "epoch": 4030} {"train_loss": -6.853354454040527, "global_step": 169281, "epoch": 4030} {"train_loss": -6.881361484527588, "global_step": 169282, "epoch": 4030} {"train_loss": -6.973567008972168, "global_step": 169283, "epoch": 4030} {"train_loss": -6.8794426918029785, "global_step": 169284, "epoch": 4030} {"train_loss": -6.938692569732666, "global_step": 169285, "epoch": 4030} {"train_loss": -6.900278091430664, "global_step": 169286, "epoch": 4030} {"train_loss": -6.940786838531494, "global_step": 169287, "epoch": 4030} {"train_loss": -6.965646266937256, "global_step": 169288, "epoch": 4030} {"train_loss": -7.007031440734863, "global_step": 169289, "epoch": 4030} {"train_loss": -6.955127716064453, "global_step": 169290, "epoch": 4030} {"train_loss": -6.966572284698486, "global_step": 169291, "epoch": 4030} {"train_loss": -6.892061233520508, "global_step": 169292, "epoch": 4030} {"train_loss": -7.015502452850342, "global_step": 169293, "epoch": 4030} {"train_loss": -6.841954231262207, "global_step": 169294, "epoch": 4030} {"train_loss": -6.895068645477295, "global_step": 169295, "epoch": 4030} {"train_loss": -6.997836112976074, "global_step": 169296, "epoch": 4030} {"train_loss": -6.949363708496094, "global_step": 169297, "epoch": 4030} {"train_loss": -7.002874374389648, "global_step": 169298, "epoch": 4030} {"train_loss": -7.014893531799316, "global_step": 169299, "epoch": 4030} {"train_loss": -6.974847793579102, "global_step": 169300, "epoch": 4030} {"train_loss": -6.930998734065464, "global_step": 169301, "epoch": 4030, "val_loss": 68474.0078125} {"train_loss": -6.948348045349121, "global_step": 169302, "epoch": 4031} {"train_loss": -7.0159831047058105, "global_step": 169303, "epoch": 4031} {"train_loss": -6.936190605163574, "global_step": 169304, "epoch": 4031} {"train_loss": -6.998632907867432, "global_step": 169305, "epoch": 4031} {"train_loss": -6.923517227172852, "global_step": 169306, "epoch": 4031} {"train_loss": -7.012374401092529, "global_step": 169307, "epoch": 4031} {"train_loss": -6.950515270233154, "global_step": 169308, "epoch": 4031} {"train_loss": -6.943439483642578, "global_step": 169309, "epoch": 4031} {"train_loss": -7.093297481536865, "global_step": 169310, "epoch": 4031} {"train_loss": -6.943166732788086, "global_step": 169311, "epoch": 4031} {"train_loss": -7.045433044433594, "global_step": 169312, "epoch": 4031} {"train_loss": -6.955674648284912, "global_step": 169313, "epoch": 4031} {"train_loss": -6.99433708190918, "global_step": 169314, "epoch": 4031} {"train_loss": -7.041134834289551, "global_step": 169315, "epoch": 4031} {"train_loss": -6.98239803314209, "global_step": 169316, "epoch": 4031} {"train_loss": -6.980031490325928, "global_step": 169317, "epoch": 4031} {"train_loss": -7.0766448974609375, "global_step": 169318, "epoch": 4031} {"train_loss": -7.074932098388672, "global_step": 169319, "epoch": 4031} {"train_loss": -7.031172275543213, "global_step": 169320, "epoch": 4031} {"train_loss": -6.9003095626831055, "global_step": 169321, "epoch": 4031} {"train_loss": -7.033106803894043, "global_step": 169322, "epoch": 4031} {"train_loss": -6.876428604125977, "global_step": 169323, "epoch": 4031} {"train_loss": -7.0376667976379395, "global_step": 169324, "epoch": 4031} {"train_loss": -7.071275234222412, "global_step": 169325, "epoch": 4031} {"train_loss": -7.0478620529174805, "global_step": 169326, "epoch": 4031} {"train_loss": -7.125370502471924, "global_step": 169327, "epoch": 4031} {"train_loss": -6.958382606506348, "global_step": 169328, "epoch": 4031} {"train_loss": -6.847197532653809, "global_step": 169329, "epoch": 4031} {"train_loss": -6.988245964050293, "global_step": 169330, "epoch": 4031} {"train_loss": -7.1393632888793945, "global_step": 169331, "epoch": 4031} {"train_loss": -7.043697357177734, "global_step": 169332, "epoch": 4031} {"train_loss": -7.074617862701416, "global_step": 169333, "epoch": 4031} {"train_loss": -7.113414764404297, "global_step": 169334, "epoch": 4031} {"train_loss": -7.116653919219971, "global_step": 169335, "epoch": 4031} {"train_loss": -7.005323886871338, "global_step": 169336, "epoch": 4031} {"train_loss": -7.038145065307617, "global_step": 169337, "epoch": 4031} {"train_loss": -7.055164813995361, "global_step": 169338, "epoch": 4031} {"train_loss": -7.118572235107422, "global_step": 169339, "epoch": 4031} {"train_loss": -6.96095085144043, "global_step": 169340, "epoch": 4031} {"train_loss": -7.042914390563965, "global_step": 169341, "epoch": 4031} {"train_loss": -6.989470481872559, "global_step": 169342, "epoch": 4031} {"train_loss": -7.014172860554287, "global_step": 169343, "epoch": 4031, "val_loss": 68450.3125} {"train_loss": -7.07958984375, "global_step": 169344, "epoch": 4032} {"train_loss": -7.171435356140137, "global_step": 169345, "epoch": 4032} {"train_loss": -7.011450290679932, "global_step": 169346, "epoch": 4032} {"train_loss": -6.972075462341309, "global_step": 169347, "epoch": 4032} {"train_loss": -7.15889835357666, "global_step": 169348, "epoch": 4032} {"train_loss": -7.19590950012207, "global_step": 169349, "epoch": 4032} {"train_loss": -7.011730194091797, "global_step": 169350, "epoch": 4032} {"train_loss": -7.027104377746582, "global_step": 169351, "epoch": 4032} {"train_loss": -7.0070366859436035, "global_step": 169352, "epoch": 4032} {"train_loss": -6.96036434173584, "global_step": 169353, "epoch": 4032} {"train_loss": -6.9591569900512695, "global_step": 169354, "epoch": 4032} {"train_loss": -6.981250762939453, "global_step": 169355, "epoch": 4032} {"train_loss": -6.804685592651367, "global_step": 169356, "epoch": 4032} {"train_loss": -7.080697059631348, "global_step": 169357, "epoch": 4032} {"train_loss": -6.833646774291992, "global_step": 169358, "epoch": 4032} {"train_loss": -7.001659393310547, "global_step": 169359, "epoch": 4032} {"train_loss": -7.009256839752197, "global_step": 169360, "epoch": 4032} {"train_loss": -6.842192649841309, "global_step": 169361, "epoch": 4032} {"train_loss": -7.027353286743164, "global_step": 169362, "epoch": 4032} {"train_loss": -6.994726181030273, "global_step": 169363, "epoch": 4032} {"train_loss": -7.008814811706543, "global_step": 169364, "epoch": 4032} {"train_loss": -6.9289937019348145, "global_step": 169365, "epoch": 4032} {"train_loss": -6.846510410308838, "global_step": 169366, "epoch": 4032} {"train_loss": -6.893179893493652, "global_step": 169367, "epoch": 4032} {"train_loss": -6.9936394691467285, "global_step": 169368, "epoch": 4032} {"train_loss": -7.004864692687988, "global_step": 169369, "epoch": 4032} {"train_loss": -6.819726943969727, "global_step": 169370, "epoch": 4032} {"train_loss": -6.949108123779297, "global_step": 169371, "epoch": 4032} {"train_loss": -6.9073028564453125, "global_step": 169372, "epoch": 4032} {"train_loss": -6.881136894226074, "global_step": 169373, "epoch": 4032} {"train_loss": -6.93319845199585, "global_step": 169374, "epoch": 4032} {"train_loss": -6.800766944885254, "global_step": 169375, "epoch": 4032} {"train_loss": -6.799818992614746, "global_step": 169376, "epoch": 4032} {"train_loss": -6.920122146606445, "global_step": 169377, "epoch": 4032} {"train_loss": -6.988386154174805, "global_step": 169378, "epoch": 4032} {"train_loss": -7.0602922439575195, "global_step": 169379, "epoch": 4032} {"train_loss": -6.897406578063965, "global_step": 169380, "epoch": 4032} {"train_loss": -6.961804389953613, "global_step": 169381, "epoch": 4032} {"train_loss": -6.931848526000977, "global_step": 169382, "epoch": 4032} {"train_loss": -6.9802093505859375, "global_step": 169383, "epoch": 4032} {"train_loss": -6.976046562194824, "global_step": 169384, "epoch": 4032} {"train_loss": -6.968802849451701, "global_step": 169385, "epoch": 4032, "val_loss": 68603.5234375} {"train_loss": -7.114712715148926, "global_step": 169386, "epoch": 4033} {"train_loss": -6.991815567016602, "global_step": 169387, "epoch": 4033} {"train_loss": -7.038036823272705, "global_step": 169388, "epoch": 4033} {"train_loss": -6.918396949768066, "global_step": 169389, "epoch": 4033} {"train_loss": -7.031164169311523, "global_step": 169390, "epoch": 4033} {"train_loss": -7.011047840118408, "global_step": 169391, "epoch": 4033} {"train_loss": -6.968210697174072, "global_step": 169392, "epoch": 4033} {"train_loss": -7.096081256866455, "global_step": 169393, "epoch": 4033} {"train_loss": -6.997052192687988, "global_step": 169394, "epoch": 4033} {"train_loss": -7.05400276184082, "global_step": 169395, "epoch": 4033} {"train_loss": -7.034385681152344, "global_step": 169396, "epoch": 4033} {"train_loss": -6.999300479888916, "global_step": 169397, "epoch": 4033} {"train_loss": -7.094384670257568, "global_step": 169398, "epoch": 4033} {"train_loss": -7.076348304748535, "global_step": 169399, "epoch": 4033} {"train_loss": -6.991621017456055, "global_step": 169400, "epoch": 4033} {"train_loss": -6.983470916748047, "global_step": 169401, "epoch": 4033} {"train_loss": -7.115180015563965, "global_step": 169402, "epoch": 4033} {"train_loss": -6.9526567459106445, "global_step": 169403, "epoch": 4033} {"train_loss": -7.1024017333984375, "global_step": 169404, "epoch": 4033} {"train_loss": -6.928467273712158, "global_step": 169405, "epoch": 4033} {"train_loss": -7.034085750579834, "global_step": 169406, "epoch": 4033} {"train_loss": -7.041660308837891, "global_step": 169407, "epoch": 4033} {"train_loss": -7.095330238342285, "global_step": 169408, "epoch": 4033} {"train_loss": -6.9514946937561035, "global_step": 169409, "epoch": 4033} {"train_loss": -7.040691375732422, "global_step": 169410, "epoch": 4033} {"train_loss": -7.051511287689209, "global_step": 169411, "epoch": 4033} {"train_loss": -6.907584190368652, "global_step": 169412, "epoch": 4033} {"train_loss": -7.082108497619629, "global_step": 169413, "epoch": 4033} {"train_loss": -6.980857849121094, "global_step": 169414, "epoch": 4033} {"train_loss": -6.98091983795166, "global_step": 169415, "epoch": 4033} {"train_loss": -7.000324249267578, "global_step": 169416, "epoch": 4033} {"train_loss": -6.834397315979004, "global_step": 169417, "epoch": 4033} {"train_loss": -6.973947525024414, "global_step": 169418, "epoch": 4033} {"train_loss": -6.997274398803711, "global_step": 169419, "epoch": 4033} {"train_loss": -7.034189701080322, "global_step": 169420, "epoch": 4033} {"train_loss": -6.972712516784668, "global_step": 169421, "epoch": 4033} {"train_loss": -7.038520812988281, "global_step": 169422, "epoch": 4033} {"train_loss": -7.045623302459717, "global_step": 169423, "epoch": 4033} {"train_loss": -6.920305252075195, "global_step": 169424, "epoch": 4033} {"train_loss": -7.068953990936279, "global_step": 169425, "epoch": 4033} {"train_loss": -7.0155029296875, "global_step": 169426, "epoch": 4033} {"train_loss": -7.012713352839152, "global_step": 169427, "epoch": 4033, "val_loss": 68449.859375} {"train_loss": -7.03525972366333, "global_step": 169428, "epoch": 4034} {"train_loss": -7.113265037536621, "global_step": 169429, "epoch": 4034} {"train_loss": -6.992181777954102, "global_step": 169430, "epoch": 4034} {"train_loss": -7.017706394195557, "global_step": 169431, "epoch": 4034} {"train_loss": -6.964468002319336, "global_step": 169432, "epoch": 4034} {"train_loss": -6.985879898071289, "global_step": 169433, "epoch": 4034} {"train_loss": -6.998313903808594, "global_step": 169434, "epoch": 4034} {"train_loss": -7.067971706390381, "global_step": 169435, "epoch": 4034} {"train_loss": -7.0914201736450195, "global_step": 169436, "epoch": 4034} {"train_loss": -6.964652061462402, "global_step": 169437, "epoch": 4034} {"train_loss": -7.010592937469482, "global_step": 169438, "epoch": 4034} {"train_loss": -6.873200416564941, "global_step": 169439, "epoch": 4034} {"train_loss": -7.030891418457031, "global_step": 169440, "epoch": 4034} {"train_loss": -6.922855377197266, "global_step": 169441, "epoch": 4034} {"train_loss": -7.0579633712768555, "global_step": 169442, "epoch": 4034} {"train_loss": -6.965641975402832, "global_step": 169443, "epoch": 4034} {"train_loss": -6.894407749176025, "global_step": 169444, "epoch": 4034} {"train_loss": -6.942593097686768, "global_step": 169445, "epoch": 4034} {"train_loss": -7.004721641540527, "global_step": 169446, "epoch": 4034} {"train_loss": -6.955142974853516, "global_step": 169447, "epoch": 4034} {"train_loss": -6.972801208496094, "global_step": 169448, "epoch": 4034} {"train_loss": -6.8824310302734375, "global_step": 169449, "epoch": 4034} {"train_loss": -6.784677028656006, "global_step": 169450, "epoch": 4034} {"train_loss": -6.94115686416626, "global_step": 169451, "epoch": 4034} {"train_loss": -6.92694616317749, "global_step": 169452, "epoch": 4034} {"train_loss": -6.804006576538086, "global_step": 169453, "epoch": 4034} {"train_loss": -6.8570556640625, "global_step": 169454, "epoch": 4034} {"train_loss": -6.897824287414551, "global_step": 169455, "epoch": 4034} {"train_loss": -6.94227409362793, "global_step": 169456, "epoch": 4034} {"train_loss": -7.00960636138916, "global_step": 169457, "epoch": 4034} {"train_loss": -7.008648872375488, "global_step": 169458, "epoch": 4034} {"train_loss": -6.973329544067383, "global_step": 169459, "epoch": 4034} {"train_loss": -6.965899467468262, "global_step": 169460, "epoch": 4034} {"train_loss": -7.0350446701049805, "global_step": 169461, "epoch": 4034} {"train_loss": -6.888736724853516, "global_step": 169462, "epoch": 4034} {"train_loss": -6.910440444946289, "global_step": 169463, "epoch": 4034} {"train_loss": -7.001104354858398, "global_step": 169464, "epoch": 4034} {"train_loss": -6.992014408111572, "global_step": 169465, "epoch": 4034} {"train_loss": -6.964788436889648, "global_step": 169466, "epoch": 4034} {"train_loss": -6.8810858726501465, "global_step": 169467, "epoch": 4034} {"train_loss": -7.001375675201416, "global_step": 169468, "epoch": 4034} {"train_loss": -6.964085942222958, "global_step": 169469, "epoch": 4034, "val_loss": 68575.484375} {"train_loss": -7.061917304992676, "global_step": 169470, "epoch": 4035} {"train_loss": -7.017124176025391, "global_step": 169471, "epoch": 4035} {"train_loss": -7.1053996086120605, "global_step": 169472, "epoch": 4035} {"train_loss": -6.997413158416748, "global_step": 169473, "epoch": 4035} {"train_loss": -6.9071478843688965, "global_step": 169474, "epoch": 4035} {"train_loss": -7.105257034301758, "global_step": 169475, "epoch": 4035} {"train_loss": -6.992697715759277, "global_step": 169476, "epoch": 4035} {"train_loss": -6.984395980834961, "global_step": 169477, "epoch": 4035} {"train_loss": -6.91117000579834, "global_step": 169478, "epoch": 4035} {"train_loss": -7.038909912109375, "global_step": 169479, "epoch": 4035} {"train_loss": -7.0168938636779785, "global_step": 169480, "epoch": 4035} {"train_loss": -6.89882755279541, "global_step": 169481, "epoch": 4035} {"train_loss": -6.96389102935791, "global_step": 169482, "epoch": 4035} {"train_loss": -6.975110054016113, "global_step": 169483, "epoch": 4035} {"train_loss": -7.073968410491943, "global_step": 169484, "epoch": 4035} {"train_loss": -7.059976577758789, "global_step": 169485, "epoch": 4035} {"train_loss": -6.931285858154297, "global_step": 169486, "epoch": 4035} {"train_loss": -6.949596881866455, "global_step": 169487, "epoch": 4035} {"train_loss": -7.033220291137695, "global_step": 169488, "epoch": 4035} {"train_loss": -7.053905963897705, "global_step": 169489, "epoch": 4035} {"train_loss": -6.906976699829102, "global_step": 169490, "epoch": 4035} {"train_loss": -7.021729469299316, "global_step": 169491, "epoch": 4035} {"train_loss": -6.939711570739746, "global_step": 169492, "epoch": 4035} {"train_loss": -6.9694013595581055, "global_step": 169493, "epoch": 4035} {"train_loss": -6.943373680114746, "global_step": 169494, "epoch": 4035} {"train_loss": -6.853476047515869, "global_step": 169495, "epoch": 4035} {"train_loss": -6.966805458068848, "global_step": 169496, "epoch": 4035} {"train_loss": -7.003723621368408, "global_step": 169497, "epoch": 4035} {"train_loss": -6.9284443855285645, "global_step": 169498, "epoch": 4035} {"train_loss": -7.009775161743164, "global_step": 169499, "epoch": 4035} {"train_loss": -6.842023849487305, "global_step": 169500, "epoch": 4035} {"train_loss": -6.969337463378906, "global_step": 169501, "epoch": 4035} {"train_loss": -6.899293899536133, "global_step": 169502, "epoch": 4035} {"train_loss": -6.943657875061035, "global_step": 169503, "epoch": 4035} {"train_loss": -6.967850685119629, "global_step": 169504, "epoch": 4035} {"train_loss": -6.94896125793457, "global_step": 169505, "epoch": 4035} {"train_loss": -6.9983439445495605, "global_step": 169506, "epoch": 4035} {"train_loss": -6.964335918426514, "global_step": 169507, "epoch": 4035} {"train_loss": -6.9839701652526855, "global_step": 169508, "epoch": 4035} {"train_loss": -6.9679484367370605, "global_step": 169509, "epoch": 4035} {"train_loss": -7.070391654968262, "global_step": 169510, "epoch": 4035} {"train_loss": -6.980060089202154, "global_step": 169511, "epoch": 4035, "val_loss": 68665.3046875} {"train_loss": -7.012184143066406, "global_step": 169512, "epoch": 4036} {"train_loss": -7.053906440734863, "global_step": 169513, "epoch": 4036} {"train_loss": -6.9904093742370605, "global_step": 169514, "epoch": 4036} {"train_loss": -6.988090515136719, "global_step": 169515, "epoch": 4036} {"train_loss": -7.04981803894043, "global_step": 169516, "epoch": 4036} {"train_loss": -6.9859137535095215, "global_step": 169517, "epoch": 4036} {"train_loss": -7.056384086608887, "global_step": 169518, "epoch": 4036} {"train_loss": -6.933549880981445, "global_step": 169519, "epoch": 4036} {"train_loss": -7.062248229980469, "global_step": 169520, "epoch": 4036} {"train_loss": -7.002004623413086, "global_step": 169521, "epoch": 4036} {"train_loss": -7.11116886138916, "global_step": 169522, "epoch": 4036} {"train_loss": -6.999844551086426, "global_step": 169523, "epoch": 4036} {"train_loss": -7.082780838012695, "global_step": 169524, "epoch": 4036} {"train_loss": -6.967353820800781, "global_step": 169525, "epoch": 4036} {"train_loss": -7.015881538391113, "global_step": 169526, "epoch": 4036} {"train_loss": -7.047633171081543, "global_step": 169527, "epoch": 4036} {"train_loss": -7.032810211181641, "global_step": 169528, "epoch": 4036} {"train_loss": -7.038956165313721, "global_step": 169529, "epoch": 4036} {"train_loss": -7.037059307098389, "global_step": 169530, "epoch": 4036} {"train_loss": -6.996288776397705, "global_step": 169531, "epoch": 4036} {"train_loss": -6.817810535430908, "global_step": 169532, "epoch": 4036} {"train_loss": -6.9015116691589355, "global_step": 169533, "epoch": 4036} {"train_loss": -7.060821533203125, "global_step": 169534, "epoch": 4036} {"train_loss": -6.818796634674072, "global_step": 169535, "epoch": 4036} {"train_loss": -6.9757280349731445, "global_step": 169536, "epoch": 4036} {"train_loss": -6.839057922363281, "global_step": 169537, "epoch": 4036} {"train_loss": -6.902085304260254, "global_step": 169538, "epoch": 4036} {"train_loss": -6.980537414550781, "global_step": 169539, "epoch": 4036} {"train_loss": -6.8099870681762695, "global_step": 169540, "epoch": 4036} {"train_loss": -6.970707893371582, "global_step": 169541, "epoch": 4036} {"train_loss": -6.986131191253662, "global_step": 169542, "epoch": 4036} {"train_loss": -6.907606601715088, "global_step": 169543, "epoch": 4036} {"train_loss": -7.027095794677734, "global_step": 169544, "epoch": 4036} {"train_loss": -6.957751750946045, "global_step": 169545, "epoch": 4036} {"train_loss": -6.949038028717041, "global_step": 169546, "epoch": 4036} {"train_loss": -6.899169921875, "global_step": 169547, "epoch": 4036} {"train_loss": -6.956286430358887, "global_step": 169548, "epoch": 4036} {"train_loss": -7.021039009094238, "global_step": 169549, "epoch": 4036} {"train_loss": -6.911257743835449, "global_step": 169550, "epoch": 4036} {"train_loss": -6.9764533042907715, "global_step": 169551, "epoch": 4036} {"train_loss": -6.952734470367432, "global_step": 169552, "epoch": 4036} {"train_loss": -6.9766934258597235, "global_step": 169553, "epoch": 4036, "val_loss": 68523.3046875} {"train_loss": -6.980152606964111, "global_step": 169554, "epoch": 4037} {"train_loss": -6.949439525604248, "global_step": 169555, "epoch": 4037} {"train_loss": -6.904450416564941, "global_step": 169556, "epoch": 4037} {"train_loss": -6.9464921951293945, "global_step": 169557, "epoch": 4037} {"train_loss": -6.973358631134033, "global_step": 169558, "epoch": 4037} {"train_loss": -6.843825340270996, "global_step": 169559, "epoch": 4037} {"train_loss": -6.821966171264648, "global_step": 169560, "epoch": 4037} {"train_loss": -6.941812992095947, "global_step": 169561, "epoch": 4037} {"train_loss": -6.866700649261475, "global_step": 169562, "epoch": 4037} {"train_loss": -6.997650623321533, "global_step": 169563, "epoch": 4037} {"train_loss": -6.976484298706055, "global_step": 169564, "epoch": 4037} {"train_loss": -6.830711364746094, "global_step": 169565, "epoch": 4037} {"train_loss": -6.932570934295654, "global_step": 169566, "epoch": 4037} {"train_loss": -6.828768730163574, "global_step": 169567, "epoch": 4037} {"train_loss": -6.933687210083008, "global_step": 169568, "epoch": 4037} {"train_loss": -6.951377868652344, "global_step": 169569, "epoch": 4037} {"train_loss": -6.92454195022583, "global_step": 169570, "epoch": 4037} {"train_loss": -6.9256672859191895, "global_step": 169571, "epoch": 4037} {"train_loss": -6.86484956741333, "global_step": 169572, "epoch": 4037} {"train_loss": -6.996744632720947, "global_step": 169573, "epoch": 4037} {"train_loss": -7.052699565887451, "global_step": 169574, "epoch": 4037} {"train_loss": -6.827258586883545, "global_step": 169575, "epoch": 4037} {"train_loss": -6.992681980133057, "global_step": 169576, "epoch": 4037} {"train_loss": -6.906583309173584, "global_step": 169577, "epoch": 4037} {"train_loss": -6.957184791564941, "global_step": 169578, "epoch": 4037} {"train_loss": -6.99795389175415, "global_step": 169579, "epoch": 4037} {"train_loss": -6.917742729187012, "global_step": 169580, "epoch": 4037} {"train_loss": -6.997509002685547, "global_step": 169581, "epoch": 4037} {"train_loss": -6.9207329750061035, "global_step": 169582, "epoch": 4037} {"train_loss": -7.047224044799805, "global_step": 169583, "epoch": 4037} {"train_loss": -7.024312973022461, "global_step": 169584, "epoch": 4037} {"train_loss": -6.896861553192139, "global_step": 169585, "epoch": 4037} {"train_loss": -7.032517433166504, "global_step": 169586, "epoch": 4037} {"train_loss": -6.947054862976074, "global_step": 169587, "epoch": 4037} {"train_loss": -6.998814582824707, "global_step": 169588, "epoch": 4037} {"train_loss": -7.066361427307129, "global_step": 169589, "epoch": 4037} {"train_loss": -6.932661056518555, "global_step": 169590, "epoch": 4037} {"train_loss": -6.953310012817383, "global_step": 169591, "epoch": 4037} {"train_loss": -6.940023899078369, "global_step": 169592, "epoch": 4037} {"train_loss": -6.944643020629883, "global_step": 169593, "epoch": 4037} {"train_loss": -6.959259986877441, "global_step": 169594, "epoch": 4037} {"train_loss": -6.9420080071403865, "global_step": 169595, "epoch": 4037, "val_loss": 68706.90625} {"train_loss": -6.939243316650391, "global_step": 169596, "epoch": 4038} {"train_loss": -6.976255416870117, "global_step": 169597, "epoch": 4038} {"train_loss": -6.965071678161621, "global_step": 169598, "epoch": 4038} {"train_loss": -6.846046447753906, "global_step": 169599, "epoch": 4038} {"train_loss": -7.066727638244629, "global_step": 169600, "epoch": 4038} {"train_loss": -6.940889358520508, "global_step": 169601, "epoch": 4038} {"train_loss": -7.004328727722168, "global_step": 169602, "epoch": 4038} {"train_loss": -7.0108442306518555, "global_step": 169603, "epoch": 4038} {"train_loss": -6.989736557006836, "global_step": 169604, "epoch": 4038} {"train_loss": -7.041947364807129, "global_step": 169605, "epoch": 4038} {"train_loss": -6.863232612609863, "global_step": 169606, "epoch": 4038} {"train_loss": -7.052549839019775, "global_step": 169607, "epoch": 4038} {"train_loss": -6.95631217956543, "global_step": 169608, "epoch": 4038} {"train_loss": -6.790951728820801, "global_step": 169609, "epoch": 4038} {"train_loss": -6.980319976806641, "global_step": 169610, "epoch": 4038} {"train_loss": -6.935426235198975, "global_step": 169611, "epoch": 4038} {"train_loss": -6.986422061920166, "global_step": 169612, "epoch": 4038} {"train_loss": -6.965453147888184, "global_step": 169613, "epoch": 4038} {"train_loss": -6.953520774841309, "global_step": 169614, "epoch": 4038} {"train_loss": -6.902655601501465, "global_step": 169615, "epoch": 4038} {"train_loss": -7.022255897521973, "global_step": 169616, "epoch": 4038} {"train_loss": -6.980148792266846, "global_step": 169617, "epoch": 4038} {"train_loss": -6.952427387237549, "global_step": 169618, "epoch": 4038} {"train_loss": -6.905668258666992, "global_step": 169619, "epoch": 4038} {"train_loss": -6.999992847442627, "global_step": 169620, "epoch": 4038} {"train_loss": -7.068882465362549, "global_step": 169621, "epoch": 4038} {"train_loss": -7.082736015319824, "global_step": 169622, "epoch": 4038} {"train_loss": -6.916901588439941, "global_step": 169623, "epoch": 4038} {"train_loss": -7.030922889709473, "global_step": 169624, "epoch": 4038} {"train_loss": -6.974465370178223, "global_step": 169625, "epoch": 4038} {"train_loss": -6.906919479370117, "global_step": 169626, "epoch": 4038} {"train_loss": -7.020926475524902, "global_step": 169627, "epoch": 4038} {"train_loss": -6.985325813293457, "global_step": 169628, "epoch": 4038} {"train_loss": -6.869744777679443, "global_step": 169629, "epoch": 4038} {"train_loss": -7.038812160491943, "global_step": 169630, "epoch": 4038} {"train_loss": -6.823879718780518, "global_step": 169631, "epoch": 4038} {"train_loss": -6.786285400390625, "global_step": 169632, "epoch": 4038} {"train_loss": -6.9522480964660645, "global_step": 169633, "epoch": 4038} {"train_loss": -6.894899368286133, "global_step": 169634, "epoch": 4038} {"train_loss": -6.880257606506348, "global_step": 169635, "epoch": 4038} {"train_loss": -6.914510726928711, "global_step": 169636, "epoch": 4038} {"train_loss": -6.956959633600144, "global_step": 169637, "epoch": 4038, "val_loss": 68693.90625} {"train_loss": -6.924449920654297, "global_step": 169638, "epoch": 4039} {"train_loss": -7.04406213760376, "global_step": 169639, "epoch": 4039} {"train_loss": -6.94004487991333, "global_step": 169640, "epoch": 4039} {"train_loss": -6.9538373947143555, "global_step": 169641, "epoch": 4039} {"train_loss": -6.9795050621032715, "global_step": 169642, "epoch": 4039} {"train_loss": -6.980980396270752, "global_step": 169643, "epoch": 4039} {"train_loss": -7.014271259307861, "global_step": 169644, "epoch": 4039} {"train_loss": -6.999446868896484, "global_step": 169645, "epoch": 4039} {"train_loss": -6.878026008605957, "global_step": 169646, "epoch": 4039} {"train_loss": -7.040635108947754, "global_step": 169647, "epoch": 4039} {"train_loss": -7.041608810424805, "global_step": 169648, "epoch": 4039} {"train_loss": -6.913327217102051, "global_step": 169649, "epoch": 4039} {"train_loss": -7.039036273956299, "global_step": 169650, "epoch": 4039} {"train_loss": -7.029019355773926, "global_step": 169651, "epoch": 4039} {"train_loss": -7.006528854370117, "global_step": 169652, "epoch": 4039} {"train_loss": -6.938960075378418, "global_step": 169653, "epoch": 4039} {"train_loss": -6.8693037033081055, "global_step": 169654, "epoch": 4039} {"train_loss": -7.0418806076049805, "global_step": 169655, "epoch": 4039} {"train_loss": -7.019132137298584, "global_step": 169656, "epoch": 4039} {"train_loss": -6.9331841468811035, "global_step": 169657, "epoch": 4039} {"train_loss": -6.9771504402160645, "global_step": 169658, "epoch": 4039} {"train_loss": -6.961232662200928, "global_step": 169659, "epoch": 4039} {"train_loss": -7.00131893157959, "global_step": 169660, "epoch": 4039} {"train_loss": -6.9531989097595215, "global_step": 169661, "epoch": 4039} {"train_loss": -6.991236209869385, "global_step": 169662, "epoch": 4039} {"train_loss": -6.935187339782715, "global_step": 169663, "epoch": 4039} {"train_loss": -6.936892032623291, "global_step": 169664, "epoch": 4039} {"train_loss": -6.950340747833252, "global_step": 169665, "epoch": 4039} {"train_loss": -7.017205238342285, "global_step": 169666, "epoch": 4039} {"train_loss": -6.966672420501709, "global_step": 169667, "epoch": 4039} {"train_loss": -7.005794525146484, "global_step": 169668, "epoch": 4039} {"train_loss": -6.959200859069824, "global_step": 169669, "epoch": 4039} {"train_loss": -6.912707328796387, "global_step": 169670, "epoch": 4039} {"train_loss": -6.831248760223389, "global_step": 169671, "epoch": 4039} {"train_loss": -7.031699180603027, "global_step": 169672, "epoch": 4039} {"train_loss": -6.9489264488220215, "global_step": 169673, "epoch": 4039} {"train_loss": -7.01667594909668, "global_step": 169674, "epoch": 4039} {"train_loss": -6.886349678039551, "global_step": 169675, "epoch": 4039} {"train_loss": -7.038180351257324, "global_step": 169676, "epoch": 4039} {"train_loss": -6.9741668701171875, "global_step": 169677, "epoch": 4039} {"train_loss": -6.825476169586182, "global_step": 169678, "epoch": 4039} {"train_loss": -6.9680990264529274, "global_step": 169679, "epoch": 4039, "val_loss": 68597.578125} {"train_loss": -7.00782585144043, "global_step": 169680, "epoch": 4040} {"train_loss": -6.936723709106445, "global_step": 169681, "epoch": 4040} {"train_loss": -6.863358974456787, "global_step": 169682, "epoch": 4040} {"train_loss": -7.041858673095703, "global_step": 169683, "epoch": 4040} {"train_loss": -6.941027641296387, "global_step": 169684, "epoch": 4040} {"train_loss": -6.994189739227295, "global_step": 169685, "epoch": 4040} {"train_loss": -7.0246124267578125, "global_step": 169686, "epoch": 4040} {"train_loss": -7.066703796386719, "global_step": 169687, "epoch": 4040} {"train_loss": -6.987735748291016, "global_step": 169688, "epoch": 4040} {"train_loss": -7.062509536743164, "global_step": 169689, "epoch": 4040} {"train_loss": -7.0298895835876465, "global_step": 169690, "epoch": 4040} {"train_loss": -6.976659774780273, "global_step": 169691, "epoch": 4040} {"train_loss": -6.9748334884643555, "global_step": 169692, "epoch": 4040} {"train_loss": -7.036409378051758, "global_step": 169693, "epoch": 4040} {"train_loss": -6.987467288970947, "global_step": 169694, "epoch": 4040} {"train_loss": -7.070372581481934, "global_step": 169695, "epoch": 4040} {"train_loss": -6.982649803161621, "global_step": 169696, "epoch": 4040} {"train_loss": -6.909448623657227, "global_step": 169697, "epoch": 4040} {"train_loss": -6.992175579071045, "global_step": 169698, "epoch": 4040} {"train_loss": -6.999875068664551, "global_step": 169699, "epoch": 4040} {"train_loss": -7.081856727600098, "global_step": 169700, "epoch": 4040} {"train_loss": -6.9739837646484375, "global_step": 169701, "epoch": 4040} {"train_loss": -7.044095993041992, "global_step": 169702, "epoch": 4040} {"train_loss": -7.130100250244141, "global_step": 169703, "epoch": 4040} {"train_loss": -7.106473922729492, "global_step": 169704, "epoch": 4040} {"train_loss": -7.135087966918945, "global_step": 169705, "epoch": 4040} {"train_loss": -7.080771446228027, "global_step": 169706, "epoch": 4040} {"train_loss": -7.113293170928955, "global_step": 169707, "epoch": 4040} {"train_loss": -7.061759948730469, "global_step": 169708, "epoch": 4040} {"train_loss": -7.033139228820801, "global_step": 169709, "epoch": 4040} {"train_loss": -7.110515594482422, "global_step": 169710, "epoch": 4040} {"train_loss": -7.09857177734375, "global_step": 169711, "epoch": 4040} {"train_loss": -7.010847091674805, "global_step": 169712, "epoch": 4040} {"train_loss": -6.941349506378174, "global_step": 169713, "epoch": 4040} {"train_loss": -6.968766212463379, "global_step": 169714, "epoch": 4040} {"train_loss": -7.065365791320801, "global_step": 169715, "epoch": 4040} {"train_loss": -6.932663917541504, "global_step": 169716, "epoch": 4040} {"train_loss": -7.030361652374268, "global_step": 169717, "epoch": 4040} {"train_loss": -6.984531402587891, "global_step": 169718, "epoch": 4040} {"train_loss": -6.938868999481201, "global_step": 169719, "epoch": 4040} {"train_loss": -6.968704700469971, "global_step": 169720, "epoch": 4040} {"train_loss": -7.018884556634085, "global_step": 169721, "epoch": 4040, "val_loss": 68645.2890625} {"train_loss": -6.982381343841553, "global_step": 169722, "epoch": 4041} {"train_loss": -6.96267032623291, "global_step": 169723, "epoch": 4041} {"train_loss": -6.9179229736328125, "global_step": 169724, "epoch": 4041} {"train_loss": -6.990516185760498, "global_step": 169725, "epoch": 4041} {"train_loss": -6.897618770599365, "global_step": 169726, "epoch": 4041} {"train_loss": -7.003886699676514, "global_step": 169727, "epoch": 4041} {"train_loss": -6.905117034912109, "global_step": 169728, "epoch": 4041} {"train_loss": -6.883400917053223, "global_step": 169729, "epoch": 4041} {"train_loss": -6.91495943069458, "global_step": 169730, "epoch": 4041} {"train_loss": -6.897830486297607, "global_step": 169731, "epoch": 4041} {"train_loss": -6.831185817718506, "global_step": 169732, "epoch": 4041} {"train_loss": -6.709911346435547, "global_step": 169733, "epoch": 4041} {"train_loss": -6.827877044677734, "global_step": 169734, "epoch": 4041} {"train_loss": -6.941028594970703, "global_step": 169735, "epoch": 4041} {"train_loss": -6.883939266204834, "global_step": 169736, "epoch": 4041} {"train_loss": -6.884622573852539, "global_step": 169737, "epoch": 4041} {"train_loss": -6.935162544250488, "global_step": 169738, "epoch": 4041} {"train_loss": -6.795934677124023, "global_step": 169739, "epoch": 4041} {"train_loss": -6.821673393249512, "global_step": 169740, "epoch": 4041} {"train_loss": -6.864038467407227, "global_step": 169741, "epoch": 4041} {"train_loss": -6.944770812988281, "global_step": 169742, "epoch": 4041} {"train_loss": -6.62275505065918, "global_step": 169743, "epoch": 4041} {"train_loss": -7.029740333557129, "global_step": 169744, "epoch": 4041} {"train_loss": -6.825118541717529, "global_step": 169745, "epoch": 4041} {"train_loss": -6.940859794616699, "global_step": 169746, "epoch": 4041} {"train_loss": -6.826038837432861, "global_step": 169747, "epoch": 4041} {"train_loss": -6.898470878601074, "global_step": 169748, "epoch": 4041} {"train_loss": -6.944304466247559, "global_step": 169749, "epoch": 4041} {"train_loss": -6.940402030944824, "global_step": 169750, "epoch": 4041} {"train_loss": -6.963991165161133, "global_step": 169751, "epoch": 4041} {"train_loss": -6.943115711212158, "global_step": 169752, "epoch": 4041} {"train_loss": -6.934953212738037, "global_step": 169753, "epoch": 4041} {"train_loss": -6.836453437805176, "global_step": 169754, "epoch": 4041} {"train_loss": -7.016567230224609, "global_step": 169755, "epoch": 4041} {"train_loss": -6.946278095245361, "global_step": 169756, "epoch": 4041} {"train_loss": -6.937225341796875, "global_step": 169757, "epoch": 4041} {"train_loss": -6.903295516967773, "global_step": 169758, "epoch": 4041} {"train_loss": -6.925640106201172, "global_step": 169759, "epoch": 4041} {"train_loss": -6.972711563110352, "global_step": 169760, "epoch": 4041} {"train_loss": -6.986822605133057, "global_step": 169761, "epoch": 4041} {"train_loss": -7.00532341003418, "global_step": 169762, "epoch": 4041} {"train_loss": -6.9084489686148505, "global_step": 169763, "epoch": 4041, "val_loss": 68565.28125} {"train_loss": -6.9927520751953125, "global_step": 169764, "epoch": 4042} {"train_loss": -6.932241916656494, "global_step": 169765, "epoch": 4042} {"train_loss": -7.03055477142334, "global_step": 169766, "epoch": 4042} {"train_loss": -7.114839553833008, "global_step": 169767, "epoch": 4042} {"train_loss": -6.9475178718566895, "global_step": 169768, "epoch": 4042} {"train_loss": -6.956093788146973, "global_step": 169769, "epoch": 4042} {"train_loss": -7.036984443664551, "global_step": 169770, "epoch": 4042} {"train_loss": -6.920436382293701, "global_step": 169771, "epoch": 4042} {"train_loss": -6.990075588226318, "global_step": 169772, "epoch": 4042} {"train_loss": -7.100472450256348, "global_step": 169773, "epoch": 4042} {"train_loss": -7.005644798278809, "global_step": 169774, "epoch": 4042} {"train_loss": -6.995481967926025, "global_step": 169775, "epoch": 4042} {"train_loss": -7.005557060241699, "global_step": 169776, "epoch": 4042} {"train_loss": -7.0978474617004395, "global_step": 169777, "epoch": 4042} {"train_loss": -6.960953235626221, "global_step": 169778, "epoch": 4042} {"train_loss": -7.089205741882324, "global_step": 169779, "epoch": 4042} {"train_loss": -6.929349899291992, "global_step": 169780, "epoch": 4042} {"train_loss": -6.961986541748047, "global_step": 169781, "epoch": 4042} {"train_loss": -7.184199333190918, "global_step": 169782, "epoch": 4042} {"train_loss": -6.98630428314209, "global_step": 169783, "epoch": 4042} {"train_loss": -7.0265655517578125, "global_step": 169784, "epoch": 4042} {"train_loss": -7.030526638031006, "global_step": 169785, "epoch": 4042} {"train_loss": -6.956780433654785, "global_step": 169786, "epoch": 4042} {"train_loss": -6.998632431030273, "global_step": 169787, "epoch": 4042} {"train_loss": -6.883884429931641, "global_step": 169788, "epoch": 4042} {"train_loss": -7.020481109619141, "global_step": 169789, "epoch": 4042} {"train_loss": -6.996340274810791, "global_step": 169790, "epoch": 4042} {"train_loss": -6.940914154052734, "global_step": 169791, "epoch": 4042} {"train_loss": -6.955267429351807, "global_step": 169792, "epoch": 4042} {"train_loss": -7.061859607696533, "global_step": 169793, "epoch": 4042} {"train_loss": -7.07697057723999, "global_step": 169794, "epoch": 4042} {"train_loss": -7.081909656524658, "global_step": 169795, "epoch": 4042} {"train_loss": -6.997380256652832, "global_step": 169796, "epoch": 4042} {"train_loss": -6.961943626403809, "global_step": 169797, "epoch": 4042} {"train_loss": -6.9595537185668945, "global_step": 169798, "epoch": 4042} {"train_loss": -7.099781036376953, "global_step": 169799, "epoch": 4042} {"train_loss": -7.123288631439209, "global_step": 169800, "epoch": 4042} {"train_loss": -6.881741523742676, "global_step": 169801, "epoch": 4042} {"train_loss": -7.068982124328613, "global_step": 169802, "epoch": 4042} {"train_loss": -7.032630443572998, "global_step": 169803, "epoch": 4042} {"train_loss": -6.9209771156311035, "global_step": 169804, "epoch": 4042} {"train_loss": -7.0074489911397295, "global_step": 169805, "epoch": 4042, "val_loss": 68579.6953125} {"train_loss": -7.076938152313232, "global_step": 169806, "epoch": 4043} {"train_loss": -7.010197639465332, "global_step": 169807, "epoch": 4043} {"train_loss": -7.002172946929932, "global_step": 169808, "epoch": 4043} {"train_loss": -7.087751388549805, "global_step": 169809, "epoch": 4043} {"train_loss": -7.096759796142578, "global_step": 169810, "epoch": 4043} {"train_loss": -6.9942522048950195, "global_step": 169811, "epoch": 4043} {"train_loss": -7.143994331359863, "global_step": 169812, "epoch": 4043} {"train_loss": -7.045118808746338, "global_step": 169813, "epoch": 4043} {"train_loss": -6.895623207092285, "global_step": 169814, "epoch": 4043} {"train_loss": -7.004817962646484, "global_step": 169815, "epoch": 4043} {"train_loss": -7.132562160491943, "global_step": 169816, "epoch": 4043} {"train_loss": -7.056988716125488, "global_step": 169817, "epoch": 4043} {"train_loss": -7.140818119049072, "global_step": 169818, "epoch": 4043} {"train_loss": -6.935934543609619, "global_step": 169819, "epoch": 4043} {"train_loss": -6.970588684082031, "global_step": 169820, "epoch": 4043} {"train_loss": -7.13593053817749, "global_step": 169821, "epoch": 4043} {"train_loss": -7.0085649490356445, "global_step": 169822, "epoch": 4043} {"train_loss": -6.87471866607666, "global_step": 169823, "epoch": 4043} {"train_loss": -6.993589878082275, "global_step": 169824, "epoch": 4043} {"train_loss": -7.015798091888428, "global_step": 169825, "epoch": 4043} {"train_loss": -7.024096488952637, "global_step": 169826, "epoch": 4043} {"train_loss": -6.971771240234375, "global_step": 169827, "epoch": 4043} {"train_loss": -7.089099884033203, "global_step": 169828, "epoch": 4043} {"train_loss": -7.026425361633301, "global_step": 169829, "epoch": 4043} {"train_loss": -7.106374740600586, "global_step": 169830, "epoch": 4043} {"train_loss": -7.06036376953125, "global_step": 169831, "epoch": 4043} {"train_loss": -6.985265254974365, "global_step": 169832, "epoch": 4043} {"train_loss": -7.016404628753662, "global_step": 169833, "epoch": 4043} {"train_loss": -6.996404647827148, "global_step": 169834, "epoch": 4043} {"train_loss": -6.90902042388916, "global_step": 169835, "epoch": 4043} {"train_loss": -6.920755863189697, "global_step": 169836, "epoch": 4043} {"train_loss": -6.972023010253906, "global_step": 169837, "epoch": 4043} {"train_loss": -7.050131320953369, "global_step": 169838, "epoch": 4043} {"train_loss": -6.869941711425781, "global_step": 169839, "epoch": 4043} {"train_loss": -6.953397750854492, "global_step": 169840, "epoch": 4043} {"train_loss": -6.866466045379639, "global_step": 169841, "epoch": 4043} {"train_loss": -6.903381824493408, "global_step": 169842, "epoch": 4043} {"train_loss": -6.907032489776611, "global_step": 169843, "epoch": 4043} {"train_loss": -6.887840270996094, "global_step": 169844, "epoch": 4043} {"train_loss": -6.93371057510376, "global_step": 169845, "epoch": 4043} {"train_loss": -6.899205684661865, "global_step": 169846, "epoch": 4043} {"train_loss": -6.994917699268886, "global_step": 169847, "epoch": 4043, "val_loss": 68755.640625} {"train_loss": -7.013381481170654, "global_step": 169848, "epoch": 4044} {"train_loss": -6.907620429992676, "global_step": 169849, "epoch": 4044} {"train_loss": -6.881905555725098, "global_step": 169850, "epoch": 4044} {"train_loss": -7.014747619628906, "global_step": 169851, "epoch": 4044} {"train_loss": -6.82411527633667, "global_step": 169852, "epoch": 4044} {"train_loss": -6.9386444091796875, "global_step": 169853, "epoch": 4044} {"train_loss": -6.941019058227539, "global_step": 169854, "epoch": 4044} {"train_loss": -6.871040344238281, "global_step": 169855, "epoch": 4044} {"train_loss": -6.9993791580200195, "global_step": 169856, "epoch": 4044} {"train_loss": -7.034838676452637, "global_step": 169857, "epoch": 4044} {"train_loss": -6.9014482498168945, "global_step": 169858, "epoch": 4044} {"train_loss": -7.00307035446167, "global_step": 169859, "epoch": 4044} {"train_loss": -6.973225116729736, "global_step": 169860, "epoch": 4044} {"train_loss": -6.821092128753662, "global_step": 169861, "epoch": 4044} {"train_loss": -6.905200958251953, "global_step": 169862, "epoch": 4044} {"train_loss": -6.800569534301758, "global_step": 169863, "epoch": 4044} {"train_loss": -6.990591526031494, "global_step": 169864, "epoch": 4044} {"train_loss": -6.915030479431152, "global_step": 169865, "epoch": 4044} {"train_loss": -6.9121479988098145, "global_step": 169866, "epoch": 4044} {"train_loss": -7.023921489715576, "global_step": 169867, "epoch": 4044} {"train_loss": -7.015800476074219, "global_step": 169868, "epoch": 4044} {"train_loss": -6.951014041900635, "global_step": 169869, "epoch": 4044} {"train_loss": -7.048086643218994, "global_step": 169870, "epoch": 4044} {"train_loss": -7.039615631103516, "global_step": 169871, "epoch": 4044} {"train_loss": -6.974167346954346, "global_step": 169872, "epoch": 4044} {"train_loss": -6.924399375915527, "global_step": 169873, "epoch": 4044} {"train_loss": -7.03067684173584, "global_step": 169874, "epoch": 4044} {"train_loss": -6.981894493103027, "global_step": 169875, "epoch": 4044} {"train_loss": -6.9560227394104, "global_step": 169876, "epoch": 4044} {"train_loss": -6.945358753204346, "global_step": 169877, "epoch": 4044} {"train_loss": -7.0453901290893555, "global_step": 169878, "epoch": 4044} {"train_loss": -7.018256187438965, "global_step": 169879, "epoch": 4044} {"train_loss": -6.994266033172607, "global_step": 169880, "epoch": 4044} {"train_loss": -7.133430004119873, "global_step": 169881, "epoch": 4044} {"train_loss": -6.950886249542236, "global_step": 169882, "epoch": 4044} {"train_loss": -6.9711503982543945, "global_step": 169883, "epoch": 4044} {"train_loss": -7.04135799407959, "global_step": 169884, "epoch": 4044} {"train_loss": -6.846372604370117, "global_step": 169885, "epoch": 4044} {"train_loss": -7.007088661193848, "global_step": 169886, "epoch": 4044} {"train_loss": -6.968860149383545, "global_step": 169887, "epoch": 4044} {"train_loss": -6.88165283203125, "global_step": 169888, "epoch": 4044} {"train_loss": -6.960310958680653, "global_step": 169889, "epoch": 4044, "val_loss": 68651.828125} {"train_loss": -6.861197471618652, "global_step": 169890, "epoch": 4045} {"train_loss": -7.045038223266602, "global_step": 169891, "epoch": 4045} {"train_loss": -7.043288230895996, "global_step": 169892, "epoch": 4045} {"train_loss": -7.017848968505859, "global_step": 169893, "epoch": 4045} {"train_loss": -6.9773054122924805, "global_step": 169894, "epoch": 4045} {"train_loss": -6.842502593994141, "global_step": 169895, "epoch": 4045} {"train_loss": -6.996891975402832, "global_step": 169896, "epoch": 4045} {"train_loss": -6.964644908905029, "global_step": 169897, "epoch": 4045} {"train_loss": -6.938328742980957, "global_step": 169898, "epoch": 4045} {"train_loss": -6.985819339752197, "global_step": 169899, "epoch": 4045} {"train_loss": -6.946935653686523, "global_step": 169900, "epoch": 4045} {"train_loss": -6.993763446807861, "global_step": 169901, "epoch": 4045} {"train_loss": -6.95705509185791, "global_step": 169902, "epoch": 4045} {"train_loss": -6.969897747039795, "global_step": 169903, "epoch": 4045} {"train_loss": -6.93400764465332, "global_step": 169904, "epoch": 4045} {"train_loss": -6.838456630706787, "global_step": 169905, "epoch": 4045} {"train_loss": -7.015022277832031, "global_step": 169906, "epoch": 4045} {"train_loss": -6.88554048538208, "global_step": 169907, "epoch": 4045} {"train_loss": -7.008113861083984, "global_step": 169908, "epoch": 4045} {"train_loss": -6.965387344360352, "global_step": 169909, "epoch": 4045} {"train_loss": -6.851158618927002, "global_step": 169910, "epoch": 4045} {"train_loss": -6.944464683532715, "global_step": 169911, "epoch": 4045} {"train_loss": -6.953145980834961, "global_step": 169912, "epoch": 4045} {"train_loss": -6.889769077301025, "global_step": 169913, "epoch": 4045} {"train_loss": -6.987541198730469, "global_step": 169914, "epoch": 4045} {"train_loss": -6.951822280883789, "global_step": 169915, "epoch": 4045} {"train_loss": -6.890125274658203, "global_step": 169916, "epoch": 4045} {"train_loss": -6.953636169433594, "global_step": 169917, "epoch": 4045} {"train_loss": -6.931769847869873, "global_step": 169918, "epoch": 4045} {"train_loss": -7.078533172607422, "global_step": 169919, "epoch": 4045} {"train_loss": -7.073249816894531, "global_step": 169920, "epoch": 4045} {"train_loss": -6.932295799255371, "global_step": 169921, "epoch": 4045} {"train_loss": -6.879006385803223, "global_step": 169922, "epoch": 4045} {"train_loss": -6.919310569763184, "global_step": 169923, "epoch": 4045} {"train_loss": -6.96850061416626, "global_step": 169924, "epoch": 4045} {"train_loss": -7.010309219360352, "global_step": 169925, "epoch": 4045} {"train_loss": -7.057005882263184, "global_step": 169926, "epoch": 4045} {"train_loss": -6.950291156768799, "global_step": 169927, "epoch": 4045} {"train_loss": -6.8949198722839355, "global_step": 169928, "epoch": 4045} {"train_loss": -6.936253070831299, "global_step": 169929, "epoch": 4045} {"train_loss": -6.948730945587158, "global_step": 169930, "epoch": 4045} {"train_loss": -6.95621581304641, "global_step": 169931, "epoch": 4045, "val_loss": 68519.3125} {"train_loss": -6.945096015930176, "global_step": 169932, "epoch": 4046} {"train_loss": -6.882665634155273, "global_step": 169933, "epoch": 4046} {"train_loss": -6.80421257019043, "global_step": 169934, "epoch": 4046} {"train_loss": -6.90645694732666, "global_step": 169935, "epoch": 4046} {"train_loss": -7.0354156494140625, "global_step": 169936, "epoch": 4046} {"train_loss": -7.0852203369140625, "global_step": 169937, "epoch": 4046} {"train_loss": -6.872923851013184, "global_step": 169938, "epoch": 4046} {"train_loss": -6.991025924682617, "global_step": 169939, "epoch": 4046} {"train_loss": -6.988333702087402, "global_step": 169940, "epoch": 4046} {"train_loss": -6.972593784332275, "global_step": 169941, "epoch": 4046} {"train_loss": -6.967974662780762, "global_step": 169942, "epoch": 4046} {"train_loss": -6.92706823348999, "global_step": 169943, "epoch": 4046} {"train_loss": -6.969237327575684, "global_step": 169944, "epoch": 4046} {"train_loss": -6.9696245193481445, "global_step": 169945, "epoch": 4046} {"train_loss": -7.023685455322266, "global_step": 169946, "epoch": 4046} {"train_loss": -6.990347385406494, "global_step": 169947, "epoch": 4046} {"train_loss": -6.941583633422852, "global_step": 169948, "epoch": 4046} {"train_loss": -6.965116500854492, "global_step": 169949, "epoch": 4046} {"train_loss": -6.898097038269043, "global_step": 169950, "epoch": 4046} {"train_loss": -6.990291595458984, "global_step": 169951, "epoch": 4046} {"train_loss": -6.953253746032715, "global_step": 169952, "epoch": 4046} {"train_loss": -6.928579330444336, "global_step": 169953, "epoch": 4046} {"train_loss": -6.984650611877441, "global_step": 169954, "epoch": 4046} {"train_loss": -6.842198371887207, "global_step": 169955, "epoch": 4046} {"train_loss": -6.86050271987915, "global_step": 169956, "epoch": 4046} {"train_loss": -7.049655914306641, "global_step": 169957, "epoch": 4046} {"train_loss": -6.92676305770874, "global_step": 169958, "epoch": 4046} {"train_loss": -7.080380439758301, "global_step": 169959, "epoch": 4046} {"train_loss": -6.954361915588379, "global_step": 169960, "epoch": 4046} {"train_loss": -6.928989410400391, "global_step": 169961, "epoch": 4046} {"train_loss": -7.084295272827148, "global_step": 169962, "epoch": 4046} {"train_loss": -6.922265529632568, "global_step": 169963, "epoch": 4046} {"train_loss": -6.948981761932373, "global_step": 169964, "epoch": 4046} {"train_loss": -6.933682918548584, "global_step": 169965, "epoch": 4046} {"train_loss": -6.986349582672119, "global_step": 169966, "epoch": 4046} {"train_loss": -6.916842460632324, "global_step": 169967, "epoch": 4046} {"train_loss": -6.873266220092773, "global_step": 169968, "epoch": 4046} {"train_loss": -7.0845842361450195, "global_step": 169969, "epoch": 4046} {"train_loss": -6.932492256164551, "global_step": 169970, "epoch": 4046} {"train_loss": -6.9928364753723145, "global_step": 169971, "epoch": 4046} {"train_loss": -7.050863265991211, "global_step": 169972, "epoch": 4046} {"train_loss": -6.959975026902699, "global_step": 169973, "epoch": 4046, "val_loss": 68560.5078125} {"train_loss": -6.972845554351807, "global_step": 169974, "epoch": 4047} {"train_loss": -6.953845024108887, "global_step": 169975, "epoch": 4047} {"train_loss": -7.056581497192383, "global_step": 169976, "epoch": 4047} {"train_loss": -7.008921146392822, "global_step": 169977, "epoch": 4047} {"train_loss": -6.90996789932251, "global_step": 169978, "epoch": 4047} {"train_loss": -6.963637351989746, "global_step": 169979, "epoch": 4047} {"train_loss": -6.8856282234191895, "global_step": 169980, "epoch": 4047} {"train_loss": -6.942389488220215, "global_step": 169981, "epoch": 4047} {"train_loss": -7.012184143066406, "global_step": 169982, "epoch": 4047} {"train_loss": -6.979633331298828, "global_step": 169983, "epoch": 4047} {"train_loss": -6.917119026184082, "global_step": 169984, "epoch": 4047} {"train_loss": -7.026641368865967, "global_step": 169985, "epoch": 4047} {"train_loss": -6.943817138671875, "global_step": 169986, "epoch": 4047} {"train_loss": -6.931093215942383, "global_step": 169987, "epoch": 4047} {"train_loss": -6.946262359619141, "global_step": 169988, "epoch": 4047} {"train_loss": -6.933542728424072, "global_step": 169989, "epoch": 4047} {"train_loss": -7.153442859649658, "global_step": 169990, "epoch": 4047} {"train_loss": -7.010697364807129, "global_step": 169991, "epoch": 4047} {"train_loss": -6.997920036315918, "global_step": 169992, "epoch": 4047} {"train_loss": -6.909048080444336, "global_step": 169993, "epoch": 4047} {"train_loss": -6.882142066955566, "global_step": 169994, "epoch": 4047} {"train_loss": -7.062859535217285, "global_step": 169995, "epoch": 4047} {"train_loss": -6.957279205322266, "global_step": 169996, "epoch": 4047} {"train_loss": -7.153531074523926, "global_step": 169997, "epoch": 4047} {"train_loss": -7.045637130737305, "global_step": 169998, "epoch": 4047} {"train_loss": -6.999828338623047, "global_step": 169999, "epoch": 4047} {"train_loss": -6.965816020965576, "global_step": 170000, "epoch": 4047} {"train_loss": -6.992075443267822, "global_step": 170001, "epoch": 4047} {"train_loss": -6.988581657409668, "global_step": 170002, "epoch": 4047} {"train_loss": -6.961423873901367, "global_step": 170003, "epoch": 4047} {"train_loss": -6.969236373901367, "global_step": 170004, "epoch": 4047} {"train_loss": -6.9892120361328125, "global_step": 170005, "epoch": 4047} {"train_loss": -7.024927616119385, "global_step": 170006, "epoch": 4047} {"train_loss": -7.0217742919921875, "global_step": 170007, "epoch": 4047} {"train_loss": -7.067107200622559, "global_step": 170008, "epoch": 4047} {"train_loss": -7.050990104675293, "global_step": 170009, "epoch": 4047} {"train_loss": -6.951206684112549, "global_step": 170010, "epoch": 4047} {"train_loss": -7.062335014343262, "global_step": 170011, "epoch": 4047} {"train_loss": -6.890239238739014, "global_step": 170012, "epoch": 4047} {"train_loss": -7.008677005767822, "global_step": 170013, "epoch": 4047} {"train_loss": -7.024639129638672, "global_step": 170014, "epoch": 4047} {"train_loss": -6.988113505499704, "global_step": 170015, "epoch": 4047, "val_loss": 68568.9609375} {"train_loss": -7.114440441131592, "global_step": 170016, "epoch": 4048} {"train_loss": -7.180393218994141, "global_step": 170017, "epoch": 4048} {"train_loss": -6.937800407409668, "global_step": 170018, "epoch": 4048} {"train_loss": -6.952204704284668, "global_step": 170019, "epoch": 4048} {"train_loss": -7.088949203491211, "global_step": 170020, "epoch": 4048} {"train_loss": -6.927363872528076, "global_step": 170021, "epoch": 4048} {"train_loss": -6.888040542602539, "global_step": 170022, "epoch": 4048} {"train_loss": -7.113187313079834, "global_step": 170023, "epoch": 4048} {"train_loss": -6.958014011383057, "global_step": 170024, "epoch": 4048} {"train_loss": -7.019804954528809, "global_step": 170025, "epoch": 4048} {"train_loss": -6.921377182006836, "global_step": 170026, "epoch": 4048} {"train_loss": -7.028995513916016, "global_step": 170027, "epoch": 4048} {"train_loss": -7.079056739807129, "global_step": 170028, "epoch": 4048} {"train_loss": -6.927030563354492, "global_step": 170029, "epoch": 4048} {"train_loss": -6.950571537017822, "global_step": 170030, "epoch": 4048} {"train_loss": -6.976375579833984, "global_step": 170031, "epoch": 4048} {"train_loss": -7.0130157470703125, "global_step": 170032, "epoch": 4048} {"train_loss": -7.008464813232422, "global_step": 170033, "epoch": 4048} {"train_loss": -7.012310028076172, "global_step": 170034, "epoch": 4048} {"train_loss": -6.986001968383789, "global_step": 170035, "epoch": 4048} {"train_loss": -6.9649739265441895, "global_step": 170036, "epoch": 4048} {"train_loss": -6.869649887084961, "global_step": 170037, "epoch": 4048} {"train_loss": -7.0763630867004395, "global_step": 170038, "epoch": 4048} {"train_loss": -6.814416885375977, "global_step": 170039, "epoch": 4048} {"train_loss": -6.9911932945251465, "global_step": 170040, "epoch": 4048} {"train_loss": -7.142511367797852, "global_step": 170041, "epoch": 4048} {"train_loss": -6.904361724853516, "global_step": 170042, "epoch": 4048} {"train_loss": -6.979108810424805, "global_step": 170043, "epoch": 4048} {"train_loss": -6.903623580932617, "global_step": 170044, "epoch": 4048} {"train_loss": -6.853934288024902, "global_step": 170045, "epoch": 4048} {"train_loss": -6.901389122009277, "global_step": 170046, "epoch": 4048} {"train_loss": -6.928893089294434, "global_step": 170047, "epoch": 4048} {"train_loss": -7.02752685546875, "global_step": 170048, "epoch": 4048} {"train_loss": -6.9363861083984375, "global_step": 170049, "epoch": 4048} {"train_loss": -6.936779022216797, "global_step": 170050, "epoch": 4048} {"train_loss": -6.929906845092773, "global_step": 170051, "epoch": 4048} {"train_loss": -6.955108642578125, "global_step": 170052, "epoch": 4048} {"train_loss": -6.963511943817139, "global_step": 170053, "epoch": 4048} {"train_loss": -6.969928741455078, "global_step": 170054, "epoch": 4048} {"train_loss": -6.99361515045166, "global_step": 170055, "epoch": 4048} {"train_loss": -6.859959602355957, "global_step": 170056, "epoch": 4048} {"train_loss": -6.974660192217145, "global_step": 170057, "epoch": 4048, "val_loss": 68486.703125} {"train_loss": -6.923226356506348, "global_step": 170058, "epoch": 4049} {"train_loss": -6.98630952835083, "global_step": 170059, "epoch": 4049} {"train_loss": -6.958144187927246, "global_step": 170060, "epoch": 4049} {"train_loss": -6.9404449462890625, "global_step": 170061, "epoch": 4049} {"train_loss": -6.995790481567383, "global_step": 170062, "epoch": 4049} {"train_loss": -6.9693684577941895, "global_step": 170063, "epoch": 4049} {"train_loss": -6.905505180358887, "global_step": 170064, "epoch": 4049} {"train_loss": -6.9042816162109375, "global_step": 170065, "epoch": 4049} {"train_loss": -6.909335613250732, "global_step": 170066, "epoch": 4049} {"train_loss": -6.878685474395752, "global_step": 170067, "epoch": 4049} {"train_loss": -6.865166664123535, "global_step": 170068, "epoch": 4049} {"train_loss": -6.870495796203613, "global_step": 170069, "epoch": 4049} {"train_loss": -6.940324783325195, "global_step": 170070, "epoch": 4049} {"train_loss": -6.9290032386779785, "global_step": 170071, "epoch": 4049} {"train_loss": -6.962094306945801, "global_step": 170072, "epoch": 4049} {"train_loss": -6.917138576507568, "global_step": 170073, "epoch": 4049} {"train_loss": -6.902838230133057, "global_step": 170074, "epoch": 4049} {"train_loss": -6.936585903167725, "global_step": 170075, "epoch": 4049} {"train_loss": -6.926429748535156, "global_step": 170076, "epoch": 4049} {"train_loss": -6.870840072631836, "global_step": 170077, "epoch": 4049} {"train_loss": -6.871884346008301, "global_step": 170078, "epoch": 4049} {"train_loss": -6.9479899406433105, "global_step": 170079, "epoch": 4049} {"train_loss": -6.938137531280518, "global_step": 170080, "epoch": 4049} {"train_loss": -6.956443786621094, "global_step": 170081, "epoch": 4049} {"train_loss": -6.913793563842773, "global_step": 170082, "epoch": 4049} {"train_loss": -6.9007978439331055, "global_step": 170083, "epoch": 4049} {"train_loss": -7.001630783081055, "global_step": 170084, "epoch": 4049} {"train_loss": -6.893130302429199, "global_step": 170085, "epoch": 4049} {"train_loss": -6.94662618637085, "global_step": 170086, "epoch": 4049} {"train_loss": -6.925514221191406, "global_step": 170087, "epoch": 4049} {"train_loss": -6.984396457672119, "global_step": 170088, "epoch": 4049} {"train_loss": -6.92020320892334, "global_step": 170089, "epoch": 4049} {"train_loss": -7.086883068084717, "global_step": 170090, "epoch": 4049} {"train_loss": -6.958592414855957, "global_step": 170091, "epoch": 4049} {"train_loss": -7.075891494750977, "global_step": 170092, "epoch": 4049} {"train_loss": -6.833477973937988, "global_step": 170093, "epoch": 4049} {"train_loss": -6.958313941955566, "global_step": 170094, "epoch": 4049} {"train_loss": -6.89909029006958, "global_step": 170095, "epoch": 4049} {"train_loss": -6.873448371887207, "global_step": 170096, "epoch": 4049} {"train_loss": -6.942886829376221, "global_step": 170097, "epoch": 4049} {"train_loss": -6.937546253204346, "global_step": 170098, "epoch": 4049} {"train_loss": -6.9345143636067705, "global_step": 170099, "epoch": 4049, "val_loss": 68507.5078125} {"train_loss": -7.036924362182617, "global_step": 170100, "epoch": 4050} {"train_loss": -6.910227298736572, "global_step": 170101, "epoch": 4050} {"train_loss": -6.949429512023926, "global_step": 170102, "epoch": 4050} {"train_loss": -6.970643043518066, "global_step": 170103, "epoch": 4050} {"train_loss": -6.9405717849731445, "global_step": 170104, "epoch": 4050} {"train_loss": -6.924075126647949, "global_step": 170105, "epoch": 4050} {"train_loss": -7.008420944213867, "global_step": 170106, "epoch": 4050} {"train_loss": -7.049245357513428, "global_step": 170107, "epoch": 4050} {"train_loss": -7.035592079162598, "global_step": 170108, "epoch": 4050} {"train_loss": -7.085011959075928, "global_step": 170109, "epoch": 4050} {"train_loss": -7.062028884887695, "global_step": 170110, "epoch": 4050} {"train_loss": -6.988092422485352, "global_step": 170111, "epoch": 4050} {"train_loss": -7.044522285461426, "global_step": 170112, "epoch": 4050} {"train_loss": -6.981986045837402, "global_step": 170113, "epoch": 4050} {"train_loss": -6.854763507843018, "global_step": 170114, "epoch": 4050} {"train_loss": -6.920169830322266, "global_step": 170115, "epoch": 4050} {"train_loss": -6.861795425415039, "global_step": 170116, "epoch": 4050} {"train_loss": -6.887148857116699, "global_step": 170117, "epoch": 4050} {"train_loss": -6.849637985229492, "global_step": 170118, "epoch": 4050} {"train_loss": -6.903898239135742, "global_step": 170119, "epoch": 4050} {"train_loss": -6.923713684082031, "global_step": 170120, "epoch": 4050} {"train_loss": -6.887752532958984, "global_step": 170121, "epoch": 4050} {"train_loss": -6.894864082336426, "global_step": 170122, "epoch": 4050} {"train_loss": -6.914419174194336, "global_step": 170123, "epoch": 4050} {"train_loss": -6.909646987915039, "global_step": 170124, "epoch": 4050} {"train_loss": -6.859062194824219, "global_step": 170125, "epoch": 4050} {"train_loss": -6.998458385467529, "global_step": 170126, "epoch": 4050} {"train_loss": -6.941442966461182, "global_step": 170127, "epoch": 4050} {"train_loss": -7.003789901733398, "global_step": 170128, "epoch": 4050} {"train_loss": -7.016369819641113, "global_step": 170129, "epoch": 4050} {"train_loss": -6.952182769775391, "global_step": 170130, "epoch": 4050} {"train_loss": -6.914608001708984, "global_step": 170131, "epoch": 4050} {"train_loss": -6.997746467590332, "global_step": 170132, "epoch": 4050} {"train_loss": -7.094331741333008, "global_step": 170133, "epoch": 4050} {"train_loss": -7.011590480804443, "global_step": 170134, "epoch": 4050} {"train_loss": -6.9767961502075195, "global_step": 170135, "epoch": 4050} {"train_loss": -6.963679313659668, "global_step": 170136, "epoch": 4050} {"train_loss": -6.94270133972168, "global_step": 170137, "epoch": 4050} {"train_loss": -6.864952564239502, "global_step": 170138, "epoch": 4050} {"train_loss": -7.112731456756592, "global_step": 170139, "epoch": 4050} {"train_loss": -6.934277534484863, "global_step": 170140, "epoch": 4050} {"train_loss": -6.957518395923433, "global_step": 170141, "epoch": 4050, "train/sim_max_reward_0": 0.24138418999469413, "train/sim_max_reward_1": 0.8694105394382533, "train/sim_max_reward_2": 0.30018047207275017, "train/sim_max_reward_3": 0.12999731407457213, "train/sim_max_reward_4": 0.8806732663660432, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.2953581264972689, "test/sim_max_reward_4400001": 0.9015681950641323, "test/sim_max_reward_4400002": 0.9667745297650341, "test/sim_max_reward_4400003": 0.7694470911760928, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.9163145736870887, "test/sim_max_reward_4400007": 0.9537715423108682, "test/sim_max_reward_4400008": 0.2990367774647636, "test/sim_max_reward_4400009": 0.913909181657779, "test/sim_max_reward_4400010": 0.9064081731525696, "test/sim_max_reward_4400011": 0.19247938066457937, "test/sim_max_reward_4400012": 0.9472391914045889, "test/sim_max_reward_4400013": 0.4610240684398586, "test/sim_max_reward_4400014": 0.39880737912394854, "test/sim_max_reward_4400015": 0.5137610749077736, "test/sim_max_reward_4400016": 0.07337284483162061, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2296728812876292, "test/sim_max_reward_4400019": 1.1285628466733966e-05, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8898627137746519, "test/sim_max_reward_4400023": 0.9842060608370424, "test/sim_max_reward_4400024": 0.4972416472961124, "test/sim_max_reward_4400025": 0.2683966602553908, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0, "test/sim_max_reward_4400028": 0.5545500605998412, "test/sim_max_reward_4400029": 0.04598896605278306, "test/sim_max_reward_4400030": 0.9725608476694558, "test/sim_max_reward_4400031": 0.9962649771878784, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8915382714000423, "test/sim_max_reward_4400034": 0.8970723693706141, "test/sim_max_reward_4400035": 0.48351531444497536, "test/sim_max_reward_4400036": 0.9422448894851777, "test/sim_max_reward_4400037": 0.9000656155153653, "test/sim_max_reward_4400038": 0.39867859076438816, "test/sim_max_reward_4400039": 0.9613318108915709, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9258545222707617, "test/sim_max_reward_4400042": 0.8968584776826221, "test/sim_max_reward_4400043": 0.8796354605339464, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9598977863243741, "test/sim_max_reward_4400046": 0.6867190591629991, "test/sim_max_reward_4400047": 0.9072590088480774, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.926380456472238, "train/mean_score": 0.5702742969910521, "test/mean_score": 0.5815661938855654, "val_loss": 68482.328125} {"train_loss": -7.133314609527588, "global_step": 170142, "epoch": 4051} {"train_loss": -6.98518180847168, "global_step": 170143, "epoch": 4051} {"train_loss": -7.062431335449219, "global_step": 170144, "epoch": 4051} {"train_loss": -7.105684757232666, "global_step": 170145, "epoch": 4051} {"train_loss": -7.031723499298096, "global_step": 170146, "epoch": 4051} {"train_loss": -7.016202449798584, "global_step": 170147, "epoch": 4051} {"train_loss": -6.980422496795654, "global_step": 170148, "epoch": 4051} {"train_loss": -6.996186256408691, "global_step": 170149, "epoch": 4051} {"train_loss": -6.996374130249023, "global_step": 170150, "epoch": 4051} {"train_loss": -7.072299003601074, "global_step": 170151, "epoch": 4051} {"train_loss": -6.971559524536133, "global_step": 170152, "epoch": 4051} {"train_loss": -6.933393478393555, "global_step": 170153, "epoch": 4051} {"train_loss": -6.889662265777588, "global_step": 170154, "epoch": 4051} {"train_loss": -6.8886823654174805, "global_step": 170155, "epoch": 4051} {"train_loss": -7.0269389152526855, "global_step": 170156, "epoch": 4051} {"train_loss": -6.919353485107422, "global_step": 170157, "epoch": 4051} {"train_loss": -6.921024799346924, "global_step": 170158, "epoch": 4051} {"train_loss": -7.065244674682617, "global_step": 170159, "epoch": 4051} {"train_loss": -7.0006422996521, "global_step": 170160, "epoch": 4051} {"train_loss": -7.0989990234375, "global_step": 170161, "epoch": 4051} {"train_loss": -7.008059501647949, "global_step": 170162, "epoch": 4051} {"train_loss": -6.943126678466797, "global_step": 170163, "epoch": 4051} {"train_loss": -6.946681976318359, "global_step": 170164, "epoch": 4051} {"train_loss": -6.912923812866211, "global_step": 170165, "epoch": 4051} {"train_loss": -6.928661823272705, "global_step": 170166, "epoch": 4051} {"train_loss": -7.0184831619262695, "global_step": 170167, "epoch": 4051} {"train_loss": -7.044733047485352, "global_step": 170168, "epoch": 4051} {"train_loss": -6.939309120178223, "global_step": 170169, "epoch": 4051} {"train_loss": -7.028331279754639, "global_step": 170170, "epoch": 4051} {"train_loss": -6.906657695770264, "global_step": 170171, "epoch": 4051} {"train_loss": -7.045933246612549, "global_step": 170172, "epoch": 4051} {"train_loss": -7.070102691650391, "global_step": 170173, "epoch": 4051} {"train_loss": -6.991204738616943, "global_step": 170174, "epoch": 4051} {"train_loss": -6.898744583129883, "global_step": 170175, "epoch": 4051} {"train_loss": -7.062447547912598, "global_step": 170176, "epoch": 4051} {"train_loss": -7.018485069274902, "global_step": 170177, "epoch": 4051} {"train_loss": -7.049243927001953, "global_step": 170178, "epoch": 4051} {"train_loss": -6.938542366027832, "global_step": 170179, "epoch": 4051} {"train_loss": -6.981249809265137, "global_step": 170180, "epoch": 4051} {"train_loss": -7.006711959838867, "global_step": 170181, "epoch": 4051} {"train_loss": -6.939509391784668, "global_step": 170182, "epoch": 4051} {"train_loss": -6.992779811223348, "global_step": 170183, "epoch": 4051, "val_loss": 68775.328125} {"train_loss": -7.020034313201904, "global_step": 170184, "epoch": 4052} {"train_loss": -6.934325695037842, "global_step": 170185, "epoch": 4052} {"train_loss": -7.060527801513672, "global_step": 170186, "epoch": 4052} {"train_loss": -7.130840301513672, "global_step": 170187, "epoch": 4052} {"train_loss": -6.881830215454102, "global_step": 170188, "epoch": 4052} {"train_loss": -7.097909927368164, "global_step": 170189, "epoch": 4052} {"train_loss": -7.122738838195801, "global_step": 170190, "epoch": 4052} {"train_loss": -6.924403190612793, "global_step": 170191, "epoch": 4052} {"train_loss": -7.001753807067871, "global_step": 170192, "epoch": 4052} {"train_loss": -6.942855358123779, "global_step": 170193, "epoch": 4052} {"train_loss": -6.903351783752441, "global_step": 170194, "epoch": 4052} {"train_loss": -7.0608415603637695, "global_step": 170195, "epoch": 4052} {"train_loss": -7.073540687561035, "global_step": 170196, "epoch": 4052} {"train_loss": -7.0797858238220215, "global_step": 170197, "epoch": 4052} {"train_loss": -6.996784210205078, "global_step": 170198, "epoch": 4052} {"train_loss": -6.926974296569824, "global_step": 170199, "epoch": 4052} {"train_loss": -6.976681709289551, "global_step": 170200, "epoch": 4052} {"train_loss": -7.072698593139648, "global_step": 170201, "epoch": 4052} {"train_loss": -6.9119462966918945, "global_step": 170202, "epoch": 4052} {"train_loss": -6.974201202392578, "global_step": 170203, "epoch": 4052} {"train_loss": -6.9924163818359375, "global_step": 170204, "epoch": 4052} {"train_loss": -6.985218524932861, "global_step": 170205, "epoch": 4052} {"train_loss": -6.9892706871032715, "global_step": 170206, "epoch": 4052} {"train_loss": -6.946683883666992, "global_step": 170207, "epoch": 4052} {"train_loss": -7.054800033569336, "global_step": 170208, "epoch": 4052} {"train_loss": -6.996281623840332, "global_step": 170209, "epoch": 4052} {"train_loss": -7.027787208557129, "global_step": 170210, "epoch": 4052} {"train_loss": -6.980632781982422, "global_step": 170211, "epoch": 4052} {"train_loss": -6.868192195892334, "global_step": 170212, "epoch": 4052} {"train_loss": -6.878582000732422, "global_step": 170213, "epoch": 4052} {"train_loss": -6.956857681274414, "global_step": 170214, "epoch": 4052} {"train_loss": -6.986138343811035, "global_step": 170215, "epoch": 4052} {"train_loss": -7.020938873291016, "global_step": 170216, "epoch": 4052} {"train_loss": -6.894136428833008, "global_step": 170217, "epoch": 4052} {"train_loss": -6.940913200378418, "global_step": 170218, "epoch": 4052} {"train_loss": -7.062627792358398, "global_step": 170219, "epoch": 4052} {"train_loss": -6.854732513427734, "global_step": 170220, "epoch": 4052} {"train_loss": -6.9640374183654785, "global_step": 170221, "epoch": 4052} {"train_loss": -7.052562713623047, "global_step": 170222, "epoch": 4052} {"train_loss": -6.8465800285339355, "global_step": 170223, "epoch": 4052} {"train_loss": -6.933609962463379, "global_step": 170224, "epoch": 4052} {"train_loss": -6.980607430140178, "global_step": 170225, "epoch": 4052, "val_loss": 68581.015625} {"train_loss": -6.989531993865967, "global_step": 170226, "epoch": 4053} {"train_loss": -6.885006904602051, "global_step": 170227, "epoch": 4053} {"train_loss": -6.841135025024414, "global_step": 170228, "epoch": 4053} {"train_loss": -6.998432159423828, "global_step": 170229, "epoch": 4053} {"train_loss": -6.828922748565674, "global_step": 170230, "epoch": 4053} {"train_loss": -6.902334213256836, "global_step": 170231, "epoch": 4053} {"train_loss": -6.986658096313477, "global_step": 170232, "epoch": 4053} {"train_loss": -6.875979423522949, "global_step": 170233, "epoch": 4053} {"train_loss": -6.99018669128418, "global_step": 170234, "epoch": 4053} {"train_loss": -6.8676605224609375, "global_step": 170235, "epoch": 4053} {"train_loss": -6.881625175476074, "global_step": 170236, "epoch": 4053} {"train_loss": -6.915449142456055, "global_step": 170237, "epoch": 4053} {"train_loss": -6.853538513183594, "global_step": 170238, "epoch": 4053} {"train_loss": -6.88299036026001, "global_step": 170239, "epoch": 4053} {"train_loss": -6.872480392456055, "global_step": 170240, "epoch": 4053} {"train_loss": -6.864513874053955, "global_step": 170241, "epoch": 4053} {"train_loss": -6.959980010986328, "global_step": 170242, "epoch": 4053} {"train_loss": -7.077948570251465, "global_step": 170243, "epoch": 4053} {"train_loss": -6.811962127685547, "global_step": 170244, "epoch": 4053} {"train_loss": -6.903597831726074, "global_step": 170245, "epoch": 4053} {"train_loss": -6.8769025802612305, "global_step": 170246, "epoch": 4053} {"train_loss": -6.962235450744629, "global_step": 170247, "epoch": 4053} {"train_loss": -6.830985069274902, "global_step": 170248, "epoch": 4053} {"train_loss": -6.870450019836426, "global_step": 170249, "epoch": 4053} {"train_loss": -6.938333511352539, "global_step": 170250, "epoch": 4053} {"train_loss": -6.972839832305908, "global_step": 170251, "epoch": 4053} {"train_loss": -6.852170944213867, "global_step": 170252, "epoch": 4053} {"train_loss": -6.944999694824219, "global_step": 170253, "epoch": 4053} {"train_loss": -6.938901901245117, "global_step": 170254, "epoch": 4053} {"train_loss": -6.870007514953613, "global_step": 170255, "epoch": 4053} {"train_loss": -6.875794410705566, "global_step": 170256, "epoch": 4053} {"train_loss": -6.983802318572998, "global_step": 170257, "epoch": 4053} {"train_loss": -6.953889846801758, "global_step": 170258, "epoch": 4053} {"train_loss": -6.921257019042969, "global_step": 170259, "epoch": 4053} {"train_loss": -6.923761367797852, "global_step": 170260, "epoch": 4053} {"train_loss": -7.038725852966309, "global_step": 170261, "epoch": 4053} {"train_loss": -7.05178689956665, "global_step": 170262, "epoch": 4053} {"train_loss": -6.974179267883301, "global_step": 170263, "epoch": 4053} {"train_loss": -7.000381946563721, "global_step": 170264, "epoch": 4053} {"train_loss": -6.999922752380371, "global_step": 170265, "epoch": 4053} {"train_loss": -7.105531215667725, "global_step": 170266, "epoch": 4053} {"train_loss": -6.93138693627857, "global_step": 170267, "epoch": 4053, "val_loss": 68601.9609375} {"train_loss": -7.014681816101074, "global_step": 170268, "epoch": 4054} {"train_loss": -6.987146377563477, "global_step": 170269, "epoch": 4054} {"train_loss": -6.991818904876709, "global_step": 170270, "epoch": 4054} {"train_loss": -6.976999282836914, "global_step": 170271, "epoch": 4054} {"train_loss": -7.013424873352051, "global_step": 170272, "epoch": 4054} {"train_loss": -6.987298011779785, "global_step": 170273, "epoch": 4054} {"train_loss": -7.005918502807617, "global_step": 170274, "epoch": 4054} {"train_loss": -7.02078104019165, "global_step": 170275, "epoch": 4054} {"train_loss": -7.0221099853515625, "global_step": 170276, "epoch": 4054} {"train_loss": -7.043453216552734, "global_step": 170277, "epoch": 4054} {"train_loss": -6.930537223815918, "global_step": 170278, "epoch": 4054} {"train_loss": -6.927577495574951, "global_step": 170279, "epoch": 4054} {"train_loss": -6.906744003295898, "global_step": 170280, "epoch": 4054} {"train_loss": -6.948369979858398, "global_step": 170281, "epoch": 4054} {"train_loss": -7.088967323303223, "global_step": 170282, "epoch": 4054} {"train_loss": -6.885270118713379, "global_step": 170283, "epoch": 4054} {"train_loss": -7.085141181945801, "global_step": 170284, "epoch": 4054} {"train_loss": -6.947205543518066, "global_step": 170285, "epoch": 4054} {"train_loss": -6.921773910522461, "global_step": 170286, "epoch": 4054} {"train_loss": -7.052160263061523, "global_step": 170287, "epoch": 4054} {"train_loss": -7.050556659698486, "global_step": 170288, "epoch": 4054} {"train_loss": -6.951555252075195, "global_step": 170289, "epoch": 4054} {"train_loss": -6.96489143371582, "global_step": 170290, "epoch": 4054} {"train_loss": -6.978092670440674, "global_step": 170291, "epoch": 4054} {"train_loss": -7.010828495025635, "global_step": 170292, "epoch": 4054} {"train_loss": -7.013920783996582, "global_step": 170293, "epoch": 4054} {"train_loss": -7.039324760437012, "global_step": 170294, "epoch": 4054} {"train_loss": -7.110031604766846, "global_step": 170295, "epoch": 4054} {"train_loss": -6.988628387451172, "global_step": 170296, "epoch": 4054} {"train_loss": -6.931623458862305, "global_step": 170297, "epoch": 4054} {"train_loss": -7.0234527587890625, "global_step": 170298, "epoch": 4054} {"train_loss": -7.02495813369751, "global_step": 170299, "epoch": 4054} {"train_loss": -7.008439064025879, "global_step": 170300, "epoch": 4054} {"train_loss": -7.087032794952393, "global_step": 170301, "epoch": 4054} {"train_loss": -7.033384323120117, "global_step": 170302, "epoch": 4054} {"train_loss": -6.881059169769287, "global_step": 170303, "epoch": 4054} {"train_loss": -7.051386833190918, "global_step": 170304, "epoch": 4054} {"train_loss": -7.081871032714844, "global_step": 170305, "epoch": 4054} {"train_loss": -6.962874412536621, "global_step": 170306, "epoch": 4054} {"train_loss": -7.034921646118164, "global_step": 170307, "epoch": 4054} {"train_loss": -6.936936855316162, "global_step": 170308, "epoch": 4054} {"train_loss": -6.997566847574143, "global_step": 170309, "epoch": 4054, "val_loss": 68710.7578125} {"train_loss": -7.057089805603027, "global_step": 170310, "epoch": 4055} {"train_loss": -7.028072357177734, "global_step": 170311, "epoch": 4055} {"train_loss": -6.937593460083008, "global_step": 170312, "epoch": 4055} {"train_loss": -6.997980117797852, "global_step": 170313, "epoch": 4055} {"train_loss": -6.92365837097168, "global_step": 170314, "epoch": 4055} {"train_loss": -7.017200946807861, "global_step": 170315, "epoch": 4055} {"train_loss": -7.012857437133789, "global_step": 170316, "epoch": 4055} {"train_loss": -6.992983818054199, "global_step": 170317, "epoch": 4055} {"train_loss": -7.115318775177002, "global_step": 170318, "epoch": 4055} {"train_loss": -7.048051357269287, "global_step": 170319, "epoch": 4055} {"train_loss": -7.0753912925720215, "global_step": 170320, "epoch": 4055} {"train_loss": -6.870995044708252, "global_step": 170321, "epoch": 4055} {"train_loss": -7.1254072189331055, "global_step": 170322, "epoch": 4055} {"train_loss": -6.952263832092285, "global_step": 170323, "epoch": 4055} {"train_loss": -6.976515769958496, "global_step": 170324, "epoch": 4055} {"train_loss": -7.030054569244385, "global_step": 170325, "epoch": 4055} {"train_loss": -7.038688659667969, "global_step": 170326, "epoch": 4055} {"train_loss": -7.011870384216309, "global_step": 170327, "epoch": 4055} {"train_loss": -7.126934051513672, "global_step": 170328, "epoch": 4055} {"train_loss": -7.117741584777832, "global_step": 170329, "epoch": 4055} {"train_loss": -7.076151371002197, "global_step": 170330, "epoch": 4055} {"train_loss": -7.0336480140686035, "global_step": 170331, "epoch": 4055} {"train_loss": -7.160520553588867, "global_step": 170332, "epoch": 4055} {"train_loss": -7.001473426818848, "global_step": 170333, "epoch": 4055} {"train_loss": -6.934277534484863, "global_step": 170334, "epoch": 4055} {"train_loss": -6.994106292724609, "global_step": 170335, "epoch": 4055} {"train_loss": -7.044795989990234, "global_step": 170336, "epoch": 4055} {"train_loss": -6.890314102172852, "global_step": 170337, "epoch": 4055} {"train_loss": -7.0367960929870605, "global_step": 170338, "epoch": 4055} {"train_loss": -6.877379894256592, "global_step": 170339, "epoch": 4055} {"train_loss": -7.083864212036133, "global_step": 170340, "epoch": 4055} {"train_loss": -6.996670722961426, "global_step": 170341, "epoch": 4055} {"train_loss": -7.024959087371826, "global_step": 170342, "epoch": 4055} {"train_loss": -6.99370002746582, "global_step": 170343, "epoch": 4055} {"train_loss": -6.964120864868164, "global_step": 170344, "epoch": 4055} {"train_loss": -6.973964691162109, "global_step": 170345, "epoch": 4055} {"train_loss": -7.021754264831543, "global_step": 170346, "epoch": 4055} {"train_loss": -6.964600563049316, "global_step": 170347, "epoch": 4055} {"train_loss": -6.9429931640625, "global_step": 170348, "epoch": 4055} {"train_loss": -6.997304916381836, "global_step": 170349, "epoch": 4055} {"train_loss": -6.949619293212891, "global_step": 170350, "epoch": 4055} {"train_loss": -7.01014122508821, "global_step": 170351, "epoch": 4055, "val_loss": 68628.859375} {"train_loss": -7.037640571594238, "global_step": 170352, "epoch": 4056} {"train_loss": -7.026348114013672, "global_step": 170353, "epoch": 4056} {"train_loss": -7.051857948303223, "global_step": 170354, "epoch": 4056} {"train_loss": -6.933109283447266, "global_step": 170355, "epoch": 4056} {"train_loss": -6.992580413818359, "global_step": 170356, "epoch": 4056} {"train_loss": -6.886692047119141, "global_step": 170357, "epoch": 4056} {"train_loss": -6.9327497482299805, "global_step": 170358, "epoch": 4056} {"train_loss": -6.8046040534973145, "global_step": 170359, "epoch": 4056} {"train_loss": -6.984281063079834, "global_step": 170360, "epoch": 4056} {"train_loss": -6.8931779861450195, "global_step": 170361, "epoch": 4056} {"train_loss": -7.042771816253662, "global_step": 170362, "epoch": 4056} {"train_loss": -6.9901957511901855, "global_step": 170363, "epoch": 4056} {"train_loss": -6.897220611572266, "global_step": 170364, "epoch": 4056} {"train_loss": -7.08238410949707, "global_step": 170365, "epoch": 4056} {"train_loss": -6.965999603271484, "global_step": 170366, "epoch": 4056} {"train_loss": -6.985427379608154, "global_step": 170367, "epoch": 4056} {"train_loss": -6.790952682495117, "global_step": 170368, "epoch": 4056} {"train_loss": -6.9623823165893555, "global_step": 170369, "epoch": 4056} {"train_loss": -6.981201171875, "global_step": 170370, "epoch": 4056} {"train_loss": -6.992295742034912, "global_step": 170371, "epoch": 4056} {"train_loss": -6.9907989501953125, "global_step": 170372, "epoch": 4056} {"train_loss": -6.946291923522949, "global_step": 170373, "epoch": 4056} {"train_loss": -6.85540771484375, "global_step": 170374, "epoch": 4056} {"train_loss": -6.957137584686279, "global_step": 170375, "epoch": 4056} {"train_loss": -6.841993808746338, "global_step": 170376, "epoch": 4056} {"train_loss": -7.000838279724121, "global_step": 170377, "epoch": 4056} {"train_loss": -7.029945373535156, "global_step": 170378, "epoch": 4056} {"train_loss": -6.974073886871338, "global_step": 170379, "epoch": 4056} {"train_loss": -6.969086647033691, "global_step": 170380, "epoch": 4056} {"train_loss": -6.9586076736450195, "global_step": 170381, "epoch": 4056} {"train_loss": -6.864686965942383, "global_step": 170382, "epoch": 4056} {"train_loss": -6.987598419189453, "global_step": 170383, "epoch": 4056} {"train_loss": -7.034728050231934, "global_step": 170384, "epoch": 4056} {"train_loss": -7.008838653564453, "global_step": 170385, "epoch": 4056} {"train_loss": -6.999206066131592, "global_step": 170386, "epoch": 4056} {"train_loss": -7.092398643493652, "global_step": 170387, "epoch": 4056} {"train_loss": -6.9606451988220215, "global_step": 170388, "epoch": 4056} {"train_loss": -6.944504737854004, "global_step": 170389, "epoch": 4056} {"train_loss": -6.912954330444336, "global_step": 170390, "epoch": 4056} {"train_loss": -7.111037254333496, "global_step": 170391, "epoch": 4056} {"train_loss": -7.046977996826172, "global_step": 170392, "epoch": 4056} {"train_loss": -6.96918435323806, "global_step": 170393, "epoch": 4056, "val_loss": 68661.0859375} {"train_loss": -7.0092973709106445, "global_step": 170394, "epoch": 4057} {"train_loss": -6.977497100830078, "global_step": 170395, "epoch": 4057} {"train_loss": -6.9850335121154785, "global_step": 170396, "epoch": 4057} {"train_loss": -6.999334335327148, "global_step": 170397, "epoch": 4057} {"train_loss": -6.958184719085693, "global_step": 170398, "epoch": 4057} {"train_loss": -6.932882308959961, "global_step": 170399, "epoch": 4057} {"train_loss": -6.935451984405518, "global_step": 170400, "epoch": 4057} {"train_loss": -6.724381446838379, "global_step": 170401, "epoch": 4057} {"train_loss": -6.973720550537109, "global_step": 170402, "epoch": 4057} {"train_loss": -7.023282051086426, "global_step": 170403, "epoch": 4057} {"train_loss": -6.901966094970703, "global_step": 170404, "epoch": 4057} {"train_loss": -6.905875205993652, "global_step": 170405, "epoch": 4057} {"train_loss": -7.055595874786377, "global_step": 170406, "epoch": 4057} {"train_loss": -6.95396614074707, "global_step": 170407, "epoch": 4057} {"train_loss": -6.939302921295166, "global_step": 170408, "epoch": 4057} {"train_loss": -6.921504974365234, "global_step": 170409, "epoch": 4057} {"train_loss": -6.925935745239258, "global_step": 170410, "epoch": 4057} {"train_loss": -6.998389720916748, "global_step": 170411, "epoch": 4057} {"train_loss": -6.860527515411377, "global_step": 170412, "epoch": 4057} {"train_loss": -6.990009307861328, "global_step": 170413, "epoch": 4057} {"train_loss": -6.9311137199401855, "global_step": 170414, "epoch": 4057} {"train_loss": -6.820518493652344, "global_step": 170415, "epoch": 4057} {"train_loss": -6.977585792541504, "global_step": 170416, "epoch": 4057} {"train_loss": -6.852900981903076, "global_step": 170417, "epoch": 4057} {"train_loss": -6.853818893432617, "global_step": 170418, "epoch": 4057} {"train_loss": -6.848094940185547, "global_step": 170419, "epoch": 4057} {"train_loss": -6.832876682281494, "global_step": 170420, "epoch": 4057} {"train_loss": -6.963448524475098, "global_step": 170421, "epoch": 4057} {"train_loss": -6.688638687133789, "global_step": 170422, "epoch": 4057} {"train_loss": -6.846761703491211, "global_step": 170423, "epoch": 4057} {"train_loss": -6.986738681793213, "global_step": 170424, "epoch": 4057} {"train_loss": -6.873323440551758, "global_step": 170425, "epoch": 4057} {"train_loss": -6.913224220275879, "global_step": 170426, "epoch": 4057} {"train_loss": -6.927302837371826, "global_step": 170427, "epoch": 4057} {"train_loss": -6.940927028656006, "global_step": 170428, "epoch": 4057} {"train_loss": -6.90709924697876, "global_step": 170429, "epoch": 4057} {"train_loss": -6.8829803466796875, "global_step": 170430, "epoch": 4057} {"train_loss": -6.984281539916992, "global_step": 170431, "epoch": 4057} {"train_loss": -6.6979241371154785, "global_step": 170432, "epoch": 4057} {"train_loss": -6.860965728759766, "global_step": 170433, "epoch": 4057} {"train_loss": -6.895402908325195, "global_step": 170434, "epoch": 4057} {"train_loss": -6.913854826064337, "global_step": 170435, "epoch": 4057, "val_loss": 68941.8671875} {"train_loss": -6.774428367614746, "global_step": 170436, "epoch": 4058} {"train_loss": -6.872631072998047, "global_step": 170437, "epoch": 4058} {"train_loss": -6.75691032409668, "global_step": 170438, "epoch": 4058} {"train_loss": -6.937093734741211, "global_step": 170439, "epoch": 4058} {"train_loss": -6.954291820526123, "global_step": 170440, "epoch": 4058} {"train_loss": -6.949037551879883, "global_step": 170441, "epoch": 4058} {"train_loss": -6.972317218780518, "global_step": 170442, "epoch": 4058} {"train_loss": -6.924042701721191, "global_step": 170443, "epoch": 4058} {"train_loss": -6.975582122802734, "global_step": 170444, "epoch": 4058} {"train_loss": -6.839087963104248, "global_step": 170445, "epoch": 4058} {"train_loss": -6.922547340393066, "global_step": 170446, "epoch": 4058} {"train_loss": -6.975817680358887, "global_step": 170447, "epoch": 4058} {"train_loss": -6.9750752449035645, "global_step": 170448, "epoch": 4058} {"train_loss": -6.952559471130371, "global_step": 170449, "epoch": 4058} {"train_loss": -6.958691596984863, "global_step": 170450, "epoch": 4058} {"train_loss": -6.924670219421387, "global_step": 170451, "epoch": 4058} {"train_loss": -6.888636589050293, "global_step": 170452, "epoch": 4058} {"train_loss": -7.005640029907227, "global_step": 170453, "epoch": 4058} {"train_loss": -7.002411842346191, "global_step": 170454, "epoch": 4058} {"train_loss": -7.024262428283691, "global_step": 170455, "epoch": 4058} {"train_loss": -6.865839004516602, "global_step": 170456, "epoch": 4058} {"train_loss": -7.01057243347168, "global_step": 170457, "epoch": 4058} {"train_loss": -6.905728340148926, "global_step": 170458, "epoch": 4058} {"train_loss": -6.99490213394165, "global_step": 170459, "epoch": 4058} {"train_loss": -6.929802894592285, "global_step": 170460, "epoch": 4058} {"train_loss": -7.01416015625, "global_step": 170461, "epoch": 4058} {"train_loss": -7.008249282836914, "global_step": 170462, "epoch": 4058} {"train_loss": -7.029626846313477, "global_step": 170463, "epoch": 4058} {"train_loss": -7.021230220794678, "global_step": 170464, "epoch": 4058} {"train_loss": -6.801817893981934, "global_step": 170465, "epoch": 4058} {"train_loss": -6.965222358703613, "global_step": 170466, "epoch": 4058} {"train_loss": -6.948555946350098, "global_step": 170467, "epoch": 4058} {"train_loss": -6.840810775756836, "global_step": 170468, "epoch": 4058} {"train_loss": -7.10476016998291, "global_step": 170469, "epoch": 4058} {"train_loss": -6.920352935791016, "global_step": 170470, "epoch": 4058} {"train_loss": -7.054670333862305, "global_step": 170471, "epoch": 4058} {"train_loss": -6.952771186828613, "global_step": 170472, "epoch": 4058} {"train_loss": -7.102283477783203, "global_step": 170473, "epoch": 4058} {"train_loss": -7.115196704864502, "global_step": 170474, "epoch": 4058} {"train_loss": -7.070735454559326, "global_step": 170475, "epoch": 4058} {"train_loss": -7.001631736755371, "global_step": 170476, "epoch": 4058} {"train_loss": -6.958508241744268, "global_step": 170477, "epoch": 4058, "val_loss": 68589.5625} {"train_loss": -7.084402084350586, "global_step": 170478, "epoch": 4059} {"train_loss": -7.035815238952637, "global_step": 170479, "epoch": 4059} {"train_loss": -7.116024494171143, "global_step": 170480, "epoch": 4059} {"train_loss": -7.031429290771484, "global_step": 170481, "epoch": 4059} {"train_loss": -7.0392255783081055, "global_step": 170482, "epoch": 4059} {"train_loss": -6.8958001136779785, "global_step": 170483, "epoch": 4059} {"train_loss": -7.024155616760254, "global_step": 170484, "epoch": 4059} {"train_loss": -6.898727893829346, "global_step": 170485, "epoch": 4059} {"train_loss": -7.061176776885986, "global_step": 170486, "epoch": 4059} {"train_loss": -6.9567718505859375, "global_step": 170487, "epoch": 4059} {"train_loss": -6.977762222290039, "global_step": 170488, "epoch": 4059} {"train_loss": -7.0100202560424805, "global_step": 170489, "epoch": 4059} {"train_loss": -6.944275856018066, "global_step": 170490, "epoch": 4059} {"train_loss": -6.873747825622559, "global_step": 170491, "epoch": 4059} {"train_loss": -7.0286335945129395, "global_step": 170492, "epoch": 4059} {"train_loss": -6.933215141296387, "global_step": 170493, "epoch": 4059} {"train_loss": -7.01949405670166, "global_step": 170494, "epoch": 4059} {"train_loss": -7.077548980712891, "global_step": 170495, "epoch": 4059} {"train_loss": -6.946839332580566, "global_step": 170496, "epoch": 4059} {"train_loss": -7.077108383178711, "global_step": 170497, "epoch": 4059} {"train_loss": -6.952677249908447, "global_step": 170498, "epoch": 4059} {"train_loss": -6.960548400878906, "global_step": 170499, "epoch": 4059} {"train_loss": -7.000363826751709, "global_step": 170500, "epoch": 4059} {"train_loss": -6.960855484008789, "global_step": 170501, "epoch": 4059} {"train_loss": -6.954565048217773, "global_step": 170502, "epoch": 4059} {"train_loss": -7.036259651184082, "global_step": 170503, "epoch": 4059} {"train_loss": -7.039035797119141, "global_step": 170504, "epoch": 4059} {"train_loss": -6.890633583068848, "global_step": 170505, "epoch": 4059} {"train_loss": -7.01699161529541, "global_step": 170506, "epoch": 4059} {"train_loss": -7.085827827453613, "global_step": 170507, "epoch": 4059} {"train_loss": -7.025564193725586, "global_step": 170508, "epoch": 4059} {"train_loss": -7.006258010864258, "global_step": 170509, "epoch": 4059} {"train_loss": -6.943596363067627, "global_step": 170510, "epoch": 4059} {"train_loss": -7.0338263511657715, "global_step": 170511, "epoch": 4059} {"train_loss": -6.956947326660156, "global_step": 170512, "epoch": 4059} {"train_loss": -6.96023416519165, "global_step": 170513, "epoch": 4059} {"train_loss": -6.930441856384277, "global_step": 170514, "epoch": 4059} {"train_loss": -6.972131252288818, "global_step": 170515, "epoch": 4059} {"train_loss": -6.967612266540527, "global_step": 170516, "epoch": 4059} {"train_loss": -6.898707389831543, "global_step": 170517, "epoch": 4059} {"train_loss": -6.928037643432617, "global_step": 170518, "epoch": 4059} {"train_loss": -6.990029914038522, "global_step": 170519, "epoch": 4059, "val_loss": 68695.078125} {"train_loss": -6.9548020362854, "global_step": 170520, "epoch": 4060} {"train_loss": -7.000390529632568, "global_step": 170521, "epoch": 4060} {"train_loss": -7.057496070861816, "global_step": 170522, "epoch": 4060} {"train_loss": -6.983305931091309, "global_step": 170523, "epoch": 4060} {"train_loss": -6.98972225189209, "global_step": 170524, "epoch": 4060} {"train_loss": -6.906632423400879, "global_step": 170525, "epoch": 4060} {"train_loss": -7.02097225189209, "global_step": 170526, "epoch": 4060} {"train_loss": -6.9903764724731445, "global_step": 170527, "epoch": 4060} {"train_loss": -6.979545593261719, "global_step": 170528, "epoch": 4060} {"train_loss": -7.008721351623535, "global_step": 170529, "epoch": 4060} {"train_loss": -7.03476619720459, "global_step": 170530, "epoch": 4060} {"train_loss": -7.074502468109131, "global_step": 170531, "epoch": 4060} {"train_loss": -6.920360565185547, "global_step": 170532, "epoch": 4060} {"train_loss": -7.113207817077637, "global_step": 170533, "epoch": 4060} {"train_loss": -7.044584274291992, "global_step": 170534, "epoch": 4060} {"train_loss": -6.990601539611816, "global_step": 170535, "epoch": 4060} {"train_loss": -6.990758419036865, "global_step": 170536, "epoch": 4060} {"train_loss": -6.958178520202637, "global_step": 170537, "epoch": 4060} {"train_loss": -6.904400825500488, "global_step": 170538, "epoch": 4060} {"train_loss": -7.085360527038574, "global_step": 170539, "epoch": 4060} {"train_loss": -6.9269866943359375, "global_step": 170540, "epoch": 4060} {"train_loss": -7.094628810882568, "global_step": 170541, "epoch": 4060} {"train_loss": -6.993988990783691, "global_step": 170542, "epoch": 4060} {"train_loss": -6.995551109313965, "global_step": 170543, "epoch": 4060} {"train_loss": -6.934918403625488, "global_step": 170544, "epoch": 4060} {"train_loss": -6.81447696685791, "global_step": 170545, "epoch": 4060} {"train_loss": -6.91080379486084, "global_step": 170546, "epoch": 4060} {"train_loss": -6.870552062988281, "global_step": 170547, "epoch": 4060} {"train_loss": -6.904024600982666, "global_step": 170548, "epoch": 4060} {"train_loss": -6.833021640777588, "global_step": 170549, "epoch": 4060} {"train_loss": -6.9749274253845215, "global_step": 170550, "epoch": 4060} {"train_loss": -6.877162933349609, "global_step": 170551, "epoch": 4060} {"train_loss": -6.861400604248047, "global_step": 170552, "epoch": 4060} {"train_loss": -6.9444403648376465, "global_step": 170553, "epoch": 4060} {"train_loss": -6.85957145690918, "global_step": 170554, "epoch": 4060} {"train_loss": -6.902176856994629, "global_step": 170555, "epoch": 4060} {"train_loss": -6.960478782653809, "global_step": 170556, "epoch": 4060} {"train_loss": -6.913363456726074, "global_step": 170557, "epoch": 4060} {"train_loss": -6.963396072387695, "global_step": 170558, "epoch": 4060} {"train_loss": -6.999034881591797, "global_step": 170559, "epoch": 4060} {"train_loss": -6.959996223449707, "global_step": 170560, "epoch": 4060} {"train_loss": -6.961761190777733, "global_step": 170561, "epoch": 4060, "val_loss": 68530.359375} {"train_loss": -7.035192966461182, "global_step": 170562, "epoch": 4061} {"train_loss": -7.106873512268066, "global_step": 170563, "epoch": 4061} {"train_loss": -7.005492210388184, "global_step": 170564, "epoch": 4061} {"train_loss": -6.977582931518555, "global_step": 170565, "epoch": 4061} {"train_loss": -6.930093288421631, "global_step": 170566, "epoch": 4061} {"train_loss": -7.063270568847656, "global_step": 170567, "epoch": 4061} {"train_loss": -7.107121467590332, "global_step": 170568, "epoch": 4061} {"train_loss": -7.096948623657227, "global_step": 170569, "epoch": 4061} {"train_loss": -7.019518852233887, "global_step": 170570, "epoch": 4061} {"train_loss": -7.089258193969727, "global_step": 170571, "epoch": 4061} {"train_loss": -7.0356125831604, "global_step": 170572, "epoch": 4061} {"train_loss": -6.944568634033203, "global_step": 170573, "epoch": 4061} {"train_loss": -7.0634660720825195, "global_step": 170574, "epoch": 4061} {"train_loss": -7.082394599914551, "global_step": 170575, "epoch": 4061} {"train_loss": -6.929232120513916, "global_step": 170576, "epoch": 4061} {"train_loss": -7.047913551330566, "global_step": 170577, "epoch": 4061} {"train_loss": -7.020336627960205, "global_step": 170578, "epoch": 4061} {"train_loss": -6.979323863983154, "global_step": 170579, "epoch": 4061} {"train_loss": -6.994068145751953, "global_step": 170580, "epoch": 4061} {"train_loss": -7.051359176635742, "global_step": 170581, "epoch": 4061} {"train_loss": -7.0554423332214355, "global_step": 170582, "epoch": 4061} {"train_loss": -6.969633102416992, "global_step": 170583, "epoch": 4061} {"train_loss": -7.078035831451416, "global_step": 170584, "epoch": 4061} {"train_loss": -7.077733039855957, "global_step": 170585, "epoch": 4061} {"train_loss": -6.972585678100586, "global_step": 170586, "epoch": 4061} {"train_loss": -7.1517534255981445, "global_step": 170587, "epoch": 4061} {"train_loss": -7.01376485824585, "global_step": 170588, "epoch": 4061} {"train_loss": -6.996068954467773, "global_step": 170589, "epoch": 4061} {"train_loss": -6.9844865798950195, "global_step": 170590, "epoch": 4061} {"train_loss": -7.016396522521973, "global_step": 170591, "epoch": 4061} {"train_loss": -7.020757675170898, "global_step": 170592, "epoch": 4061} {"train_loss": -7.047794342041016, "global_step": 170593, "epoch": 4061} {"train_loss": -7.10626745223999, "global_step": 170594, "epoch": 4061} {"train_loss": -7.027071475982666, "global_step": 170595, "epoch": 4061} {"train_loss": -6.858809471130371, "global_step": 170596, "epoch": 4061} {"train_loss": -6.989618301391602, "global_step": 170597, "epoch": 4061} {"train_loss": -6.845244407653809, "global_step": 170598, "epoch": 4061} {"train_loss": -6.808669567108154, "global_step": 170599, "epoch": 4061} {"train_loss": -7.020403861999512, "global_step": 170600, "epoch": 4061} {"train_loss": -6.888984680175781, "global_step": 170601, "epoch": 4061} {"train_loss": -6.989920616149902, "global_step": 170602, "epoch": 4061} {"train_loss": -7.009813865025838, "global_step": 170603, "epoch": 4061, "val_loss": 68842.40625} {"train_loss": -7.004796981811523, "global_step": 170604, "epoch": 4062} {"train_loss": -6.935986518859863, "global_step": 170605, "epoch": 4062} {"train_loss": -6.940517425537109, "global_step": 170606, "epoch": 4062} {"train_loss": -6.852270126342773, "global_step": 170607, "epoch": 4062} {"train_loss": -7.094732284545898, "global_step": 170608, "epoch": 4062} {"train_loss": -7.079138278961182, "global_step": 170609, "epoch": 4062} {"train_loss": -6.968139171600342, "global_step": 170610, "epoch": 4062} {"train_loss": -6.951513290405273, "global_step": 170611, "epoch": 4062} {"train_loss": -7.018911838531494, "global_step": 170612, "epoch": 4062} {"train_loss": -6.847997665405273, "global_step": 170613, "epoch": 4062} {"train_loss": -7.12276554107666, "global_step": 170614, "epoch": 4062} {"train_loss": -6.980861186981201, "global_step": 170615, "epoch": 4062} {"train_loss": -6.8112993240356445, "global_step": 170616, "epoch": 4062} {"train_loss": -6.991143703460693, "global_step": 170617, "epoch": 4062} {"train_loss": -6.79958438873291, "global_step": 170618, "epoch": 4062} {"train_loss": -6.905758380889893, "global_step": 170619, "epoch": 4062} {"train_loss": -6.830419540405273, "global_step": 170620, "epoch": 4062} {"train_loss": -6.826530456542969, "global_step": 170621, "epoch": 4062} {"train_loss": -6.97446346282959, "global_step": 170622, "epoch": 4062} {"train_loss": -6.785432815551758, "global_step": 170623, "epoch": 4062} {"train_loss": -6.865412712097168, "global_step": 170624, "epoch": 4062} {"train_loss": -6.974266052246094, "global_step": 170625, "epoch": 4062} {"train_loss": -6.911731719970703, "global_step": 170626, "epoch": 4062} {"train_loss": -6.956432342529297, "global_step": 170627, "epoch": 4062} {"train_loss": -6.846484184265137, "global_step": 170628, "epoch": 4062} {"train_loss": -6.874380111694336, "global_step": 170629, "epoch": 4062} {"train_loss": -7.0337815284729, "global_step": 170630, "epoch": 4062} {"train_loss": -6.827313423156738, "global_step": 170631, "epoch": 4062} {"train_loss": -7.053896903991699, "global_step": 170632, "epoch": 4062} {"train_loss": -6.949251174926758, "global_step": 170633, "epoch": 4062} {"train_loss": -6.909974098205566, "global_step": 170634, "epoch": 4062} {"train_loss": -7.015673637390137, "global_step": 170635, "epoch": 4062} {"train_loss": -7.023653507232666, "global_step": 170636, "epoch": 4062} {"train_loss": -6.939383029937744, "global_step": 170637, "epoch": 4062} {"train_loss": -6.990083694458008, "global_step": 170638, "epoch": 4062} {"train_loss": -6.945204734802246, "global_step": 170639, "epoch": 4062} {"train_loss": -7.010660648345947, "global_step": 170640, "epoch": 4062} {"train_loss": -7.0501885414123535, "global_step": 170641, "epoch": 4062} {"train_loss": -6.895631790161133, "global_step": 170642, "epoch": 4062} {"train_loss": -7.096627712249756, "global_step": 170643, "epoch": 4062} {"train_loss": -6.993852615356445, "global_step": 170644, "epoch": 4062} {"train_loss": -6.950329735165551, "global_step": 170645, "epoch": 4062, "val_loss": 68494.984375} {"train_loss": -7.0546488761901855, "global_step": 170646, "epoch": 4063} {"train_loss": -7.061102867126465, "global_step": 170647, "epoch": 4063} {"train_loss": -6.95543909072876, "global_step": 170648, "epoch": 4063} {"train_loss": -7.02510929107666, "global_step": 170649, "epoch": 4063} {"train_loss": -7.186659812927246, "global_step": 170650, "epoch": 4063} {"train_loss": -6.850497722625732, "global_step": 170651, "epoch": 4063} {"train_loss": -6.972768783569336, "global_step": 170652, "epoch": 4063} {"train_loss": -6.993276596069336, "global_step": 170653, "epoch": 4063} {"train_loss": -6.99098014831543, "global_step": 170654, "epoch": 4063} {"train_loss": -6.907757759094238, "global_step": 170655, "epoch": 4063} {"train_loss": -6.910577774047852, "global_step": 170656, "epoch": 4063} {"train_loss": -7.018675804138184, "global_step": 170657, "epoch": 4063} {"train_loss": -6.827542304992676, "global_step": 170658, "epoch": 4063} {"train_loss": -6.8645524978637695, "global_step": 170659, "epoch": 4063} {"train_loss": -6.993476867675781, "global_step": 170660, "epoch": 4063} {"train_loss": -6.893148422241211, "global_step": 170661, "epoch": 4063} {"train_loss": -7.02783203125, "global_step": 170662, "epoch": 4063} {"train_loss": -7.105810165405273, "global_step": 170663, "epoch": 4063} {"train_loss": -6.848399639129639, "global_step": 170664, "epoch": 4063} {"train_loss": -7.030896186828613, "global_step": 170665, "epoch": 4063} {"train_loss": -6.907890319824219, "global_step": 170666, "epoch": 4063} {"train_loss": -6.962705612182617, "global_step": 170667, "epoch": 4063} {"train_loss": -6.939064979553223, "global_step": 170668, "epoch": 4063} {"train_loss": -6.881180763244629, "global_step": 170669, "epoch": 4063} {"train_loss": -7.027896404266357, "global_step": 170670, "epoch": 4063} {"train_loss": -6.904167652130127, "global_step": 170671, "epoch": 4063} {"train_loss": -6.907358169555664, "global_step": 170672, "epoch": 4063} {"train_loss": -6.890821933746338, "global_step": 170673, "epoch": 4063} {"train_loss": -6.986020088195801, "global_step": 170674, "epoch": 4063} {"train_loss": -6.987916946411133, "global_step": 170675, "epoch": 4063} {"train_loss": -6.894736289978027, "global_step": 170676, "epoch": 4063} {"train_loss": -6.896768569946289, "global_step": 170677, "epoch": 4063} {"train_loss": -6.767280578613281, "global_step": 170678, "epoch": 4063} {"train_loss": -6.913765907287598, "global_step": 170679, "epoch": 4063} {"train_loss": -6.928119659423828, "global_step": 170680, "epoch": 4063} {"train_loss": -7.004786491394043, "global_step": 170681, "epoch": 4063} {"train_loss": -6.923679351806641, "global_step": 170682, "epoch": 4063} {"train_loss": -6.876585006713867, "global_step": 170683, "epoch": 4063} {"train_loss": -6.9913330078125, "global_step": 170684, "epoch": 4063} {"train_loss": -6.891427993774414, "global_step": 170685, "epoch": 4063} {"train_loss": -6.928906440734863, "global_step": 170686, "epoch": 4063} {"train_loss": -6.9488940352485296, "global_step": 170687, "epoch": 4063, "val_loss": 68370.9921875} {"train_loss": -6.984962463378906, "global_step": 170688, "epoch": 4064} {"train_loss": -6.88566780090332, "global_step": 170689, "epoch": 4064} {"train_loss": -7.075563430786133, "global_step": 170690, "epoch": 4064} {"train_loss": -6.973809242248535, "global_step": 170691, "epoch": 4064} {"train_loss": -6.974957466125488, "global_step": 170692, "epoch": 4064} {"train_loss": -7.054505348205566, "global_step": 170693, "epoch": 4064} {"train_loss": -6.947876453399658, "global_step": 170694, "epoch": 4064} {"train_loss": -7.014960289001465, "global_step": 170695, "epoch": 4064} {"train_loss": -6.990025997161865, "global_step": 170696, "epoch": 4064} {"train_loss": -7.000612735748291, "global_step": 170697, "epoch": 4064} {"train_loss": -6.98427152633667, "global_step": 170698, "epoch": 4064} {"train_loss": -7.070801734924316, "global_step": 170699, "epoch": 4064} {"train_loss": -7.043745994567871, "global_step": 170700, "epoch": 4064} {"train_loss": -7.048696517944336, "global_step": 170701, "epoch": 4064} {"train_loss": -6.975255966186523, "global_step": 170702, "epoch": 4064} {"train_loss": -6.994808197021484, "global_step": 170703, "epoch": 4064} {"train_loss": -6.933239936828613, "global_step": 170704, "epoch": 4064} {"train_loss": -7.007138252258301, "global_step": 170705, "epoch": 4064} {"train_loss": -6.951608657836914, "global_step": 170706, "epoch": 4064} {"train_loss": -6.953473091125488, "global_step": 170707, "epoch": 4064} {"train_loss": -7.0479278564453125, "global_step": 170708, "epoch": 4064} {"train_loss": -6.912867546081543, "global_step": 170709, "epoch": 4064} {"train_loss": -6.965513229370117, "global_step": 170710, "epoch": 4064} {"train_loss": -7.02645206451416, "global_step": 170711, "epoch": 4064} {"train_loss": -6.973340034484863, "global_step": 170712, "epoch": 4064} {"train_loss": -7.061393737792969, "global_step": 170713, "epoch": 4064} {"train_loss": -6.93436336517334, "global_step": 170714, "epoch": 4064} {"train_loss": -6.988747596740723, "global_step": 170715, "epoch": 4064} {"train_loss": -7.014552593231201, "global_step": 170716, "epoch": 4064} {"train_loss": -6.872928619384766, "global_step": 170717, "epoch": 4064} {"train_loss": -6.890551567077637, "global_step": 170718, "epoch": 4064} {"train_loss": -6.807366847991943, "global_step": 170719, "epoch": 4064} {"train_loss": -6.865279674530029, "global_step": 170720, "epoch": 4064} {"train_loss": -6.854440689086914, "global_step": 170721, "epoch": 4064} {"train_loss": -6.92656946182251, "global_step": 170722, "epoch": 4064} {"train_loss": -6.881508827209473, "global_step": 170723, "epoch": 4064} {"train_loss": -6.876768112182617, "global_step": 170724, "epoch": 4064} {"train_loss": -6.908052444458008, "global_step": 170725, "epoch": 4064} {"train_loss": -6.850909233093262, "global_step": 170726, "epoch": 4064} {"train_loss": -6.979912281036377, "global_step": 170727, "epoch": 4064} {"train_loss": -6.996251106262207, "global_step": 170728, "epoch": 4064} {"train_loss": -6.961965526853289, "global_step": 170729, "epoch": 4064, "val_loss": 68516.5078125} {"train_loss": -6.825976371765137, "global_step": 170730, "epoch": 4065} {"train_loss": -6.855085372924805, "global_step": 170731, "epoch": 4065} {"train_loss": -6.939253807067871, "global_step": 170732, "epoch": 4065} {"train_loss": -6.956903457641602, "global_step": 170733, "epoch": 4065} {"train_loss": -6.896727085113525, "global_step": 170734, "epoch": 4065} {"train_loss": -7.041412353515625, "global_step": 170735, "epoch": 4065} {"train_loss": -7.03482723236084, "global_step": 170736, "epoch": 4065} {"train_loss": -7.003114223480225, "global_step": 170737, "epoch": 4065} {"train_loss": -7.049375057220459, "global_step": 170738, "epoch": 4065} {"train_loss": -6.953847885131836, "global_step": 170739, "epoch": 4065} {"train_loss": -6.9798994064331055, "global_step": 170740, "epoch": 4065} {"train_loss": -6.984321594238281, "global_step": 170741, "epoch": 4065} {"train_loss": -6.9429240226745605, "global_step": 170742, "epoch": 4065} {"train_loss": -6.970725059509277, "global_step": 170743, "epoch": 4065} {"train_loss": -6.98756217956543, "global_step": 170744, "epoch": 4065} {"train_loss": -7.0917067527771, "global_step": 170745, "epoch": 4065} {"train_loss": -6.918087959289551, "global_step": 170746, "epoch": 4065} {"train_loss": -6.982967376708984, "global_step": 170747, "epoch": 4065} {"train_loss": -7.071345806121826, "global_step": 170748, "epoch": 4065} {"train_loss": -7.061647415161133, "global_step": 170749, "epoch": 4065} {"train_loss": -7.072933197021484, "global_step": 170750, "epoch": 4065} {"train_loss": -7.135208606719971, "global_step": 170751, "epoch": 4065} {"train_loss": -7.069878101348877, "global_step": 170752, "epoch": 4065} {"train_loss": -7.027050971984863, "global_step": 170753, "epoch": 4065} {"train_loss": -7.1245293617248535, "global_step": 170754, "epoch": 4065} {"train_loss": -7.1383771896362305, "global_step": 170755, "epoch": 4065} {"train_loss": -6.957212448120117, "global_step": 170756, "epoch": 4065} {"train_loss": -7.0720624923706055, "global_step": 170757, "epoch": 4065} {"train_loss": -7.014349937438965, "global_step": 170758, "epoch": 4065} {"train_loss": -7.000491142272949, "global_step": 170759, "epoch": 4065} {"train_loss": -6.995757102966309, "global_step": 170760, "epoch": 4065} {"train_loss": -7.033487319946289, "global_step": 170761, "epoch": 4065} {"train_loss": -6.953690528869629, "global_step": 170762, "epoch": 4065} {"train_loss": -7.071322441101074, "global_step": 170763, "epoch": 4065} {"train_loss": -6.930174827575684, "global_step": 170764, "epoch": 4065} {"train_loss": -7.006685256958008, "global_step": 170765, "epoch": 4065} {"train_loss": -7.063671112060547, "global_step": 170766, "epoch": 4065} {"train_loss": -6.991212368011475, "global_step": 170767, "epoch": 4065} {"train_loss": -6.924663543701172, "global_step": 170768, "epoch": 4065} {"train_loss": -7.067921161651611, "global_step": 170769, "epoch": 4065} {"train_loss": -6.910006523132324, "global_step": 170770, "epoch": 4065} {"train_loss": -7.001350312005906, "global_step": 170771, "epoch": 4065, "val_loss": 68728.8359375} {"train_loss": -6.924297332763672, "global_step": 170772, "epoch": 4066} {"train_loss": -6.827341079711914, "global_step": 170773, "epoch": 4066} {"train_loss": -6.935522556304932, "global_step": 170774, "epoch": 4066} {"train_loss": -7.081876754760742, "global_step": 170775, "epoch": 4066} {"train_loss": -6.980846405029297, "global_step": 170776, "epoch": 4066} {"train_loss": -6.87071418762207, "global_step": 170777, "epoch": 4066} {"train_loss": -6.9748430252075195, "global_step": 170778, "epoch": 4066} {"train_loss": -6.980368614196777, "global_step": 170779, "epoch": 4066} {"train_loss": -7.104823112487793, "global_step": 170780, "epoch": 4066} {"train_loss": -7.018172264099121, "global_step": 170781, "epoch": 4066} {"train_loss": -6.992486953735352, "global_step": 170782, "epoch": 4066} {"train_loss": -6.875330924987793, "global_step": 170783, "epoch": 4066} {"train_loss": -6.9883222579956055, "global_step": 170784, "epoch": 4066} {"train_loss": -6.913395404815674, "global_step": 170785, "epoch": 4066} {"train_loss": -6.9317779541015625, "global_step": 170786, "epoch": 4066} {"train_loss": -6.960661888122559, "global_step": 170787, "epoch": 4066} {"train_loss": -6.9459662437438965, "global_step": 170788, "epoch": 4066} {"train_loss": -6.977568626403809, "global_step": 170789, "epoch": 4066} {"train_loss": -6.9010162353515625, "global_step": 170790, "epoch": 4066} {"train_loss": -6.888230800628662, "global_step": 170791, "epoch": 4066} {"train_loss": -6.90060567855835, "global_step": 170792, "epoch": 4066} {"train_loss": -7.051718235015869, "global_step": 170793, "epoch": 4066} {"train_loss": -6.880715370178223, "global_step": 170794, "epoch": 4066} {"train_loss": -6.893526077270508, "global_step": 170795, "epoch": 4066} {"train_loss": -7.000837802886963, "global_step": 170796, "epoch": 4066} {"train_loss": -6.850551128387451, "global_step": 170797, "epoch": 4066} {"train_loss": -6.928833961486816, "global_step": 170798, "epoch": 4066} {"train_loss": -6.944400787353516, "global_step": 170799, "epoch": 4066} {"train_loss": -6.920971870422363, "global_step": 170800, "epoch": 4066} {"train_loss": -6.942493915557861, "global_step": 170801, "epoch": 4066} {"train_loss": -6.944588661193848, "global_step": 170802, "epoch": 4066} {"train_loss": -6.797213077545166, "global_step": 170803, "epoch": 4066} {"train_loss": -7.052097320556641, "global_step": 170804, "epoch": 4066} {"train_loss": -6.878818035125732, "global_step": 170805, "epoch": 4066} {"train_loss": -7.049624919891357, "global_step": 170806, "epoch": 4066} {"train_loss": -6.983274459838867, "global_step": 170807, "epoch": 4066} {"train_loss": -6.898787498474121, "global_step": 170808, "epoch": 4066} {"train_loss": -7.073121070861816, "global_step": 170809, "epoch": 4066} {"train_loss": -6.99186372756958, "global_step": 170810, "epoch": 4066} {"train_loss": -6.966550827026367, "global_step": 170811, "epoch": 4066} {"train_loss": -7.022700309753418, "global_step": 170812, "epoch": 4066} {"train_loss": -6.954352299372355, "global_step": 170813, "epoch": 4066, "val_loss": 68765.7421875} {"train_loss": -6.962789535522461, "global_step": 170814, "epoch": 4067} {"train_loss": -7.030904769897461, "global_step": 170815, "epoch": 4067} {"train_loss": -6.9623870849609375, "global_step": 170816, "epoch": 4067} {"train_loss": -7.039034843444824, "global_step": 170817, "epoch": 4067} {"train_loss": -7.022677421569824, "global_step": 170818, "epoch": 4067} {"train_loss": -6.986334323883057, "global_step": 170819, "epoch": 4067} {"train_loss": -7.011507034301758, "global_step": 170820, "epoch": 4067} {"train_loss": -7.066893577575684, "global_step": 170821, "epoch": 4067} {"train_loss": -6.994226932525635, "global_step": 170822, "epoch": 4067} {"train_loss": -7.068127632141113, "global_step": 170823, "epoch": 4067} {"train_loss": -7.02955436706543, "global_step": 170824, "epoch": 4067} {"train_loss": -6.980134010314941, "global_step": 170825, "epoch": 4067} {"train_loss": -7.041526794433594, "global_step": 170826, "epoch": 4067} {"train_loss": -6.954074859619141, "global_step": 170827, "epoch": 4067} {"train_loss": -7.063421249389648, "global_step": 170828, "epoch": 4067} {"train_loss": -7.034534454345703, "global_step": 170829, "epoch": 4067} {"train_loss": -7.0155487060546875, "global_step": 170830, "epoch": 4067} {"train_loss": -6.981575012207031, "global_step": 170831, "epoch": 4067} {"train_loss": -6.9944987297058105, "global_step": 170832, "epoch": 4067} {"train_loss": -7.1064982414245605, "global_step": 170833, "epoch": 4067} {"train_loss": -7.01740026473999, "global_step": 170834, "epoch": 4067} {"train_loss": -7.063601970672607, "global_step": 170835, "epoch": 4067} {"train_loss": -7.031332015991211, "global_step": 170836, "epoch": 4067} {"train_loss": -7.020692825317383, "global_step": 170837, "epoch": 4067} {"train_loss": -6.9281487464904785, "global_step": 170838, "epoch": 4067} {"train_loss": -6.938425540924072, "global_step": 170839, "epoch": 4067} {"train_loss": -7.050718307495117, "global_step": 170840, "epoch": 4067} {"train_loss": -6.9932708740234375, "global_step": 170841, "epoch": 4067} {"train_loss": -7.039440155029297, "global_step": 170842, "epoch": 4067} {"train_loss": -7.027036190032959, "global_step": 170843, "epoch": 4067} {"train_loss": -7.012292385101318, "global_step": 170844, "epoch": 4067} {"train_loss": -7.04071044921875, "global_step": 170845, "epoch": 4067} {"train_loss": -7.050684928894043, "global_step": 170846, "epoch": 4067} {"train_loss": -6.988349914550781, "global_step": 170847, "epoch": 4067} {"train_loss": -7.016879081726074, "global_step": 170848, "epoch": 4067} {"train_loss": -7.009726047515869, "global_step": 170849, "epoch": 4067} {"train_loss": -7.031139850616455, "global_step": 170850, "epoch": 4067} {"train_loss": -7.003173351287842, "global_step": 170851, "epoch": 4067} {"train_loss": -7.0719099044799805, "global_step": 170852, "epoch": 4067} {"train_loss": -7.061769962310791, "global_step": 170853, "epoch": 4067} {"train_loss": -7.009166717529297, "global_step": 170854, "epoch": 4067} {"train_loss": -7.0197603816077825, "global_step": 170855, "epoch": 4067, "val_loss": 68514.515625} {"train_loss": -7.114401817321777, "global_step": 170856, "epoch": 4068} {"train_loss": -7.031825065612793, "global_step": 170857, "epoch": 4068} {"train_loss": -7.028545379638672, "global_step": 170858, "epoch": 4068} {"train_loss": -6.987822532653809, "global_step": 170859, "epoch": 4068} {"train_loss": -6.987570285797119, "global_step": 170860, "epoch": 4068} {"train_loss": -7.000518798828125, "global_step": 170861, "epoch": 4068} {"train_loss": -7.017709732055664, "global_step": 170862, "epoch": 4068} {"train_loss": -6.987572193145752, "global_step": 170863, "epoch": 4068} {"train_loss": -6.989568710327148, "global_step": 170864, "epoch": 4068} {"train_loss": -7.049503326416016, "global_step": 170865, "epoch": 4068} {"train_loss": -6.998318672180176, "global_step": 170866, "epoch": 4068} {"train_loss": -7.020779609680176, "global_step": 170867, "epoch": 4068} {"train_loss": -7.090386867523193, "global_step": 170868, "epoch": 4068} {"train_loss": -7.058366775512695, "global_step": 170869, "epoch": 4068} {"train_loss": -6.88007926940918, "global_step": 170870, "epoch": 4068} {"train_loss": -6.917431831359863, "global_step": 170871, "epoch": 4068} {"train_loss": -7.117993354797363, "global_step": 170872, "epoch": 4068} {"train_loss": -7.041076183319092, "global_step": 170873, "epoch": 4068} {"train_loss": -7.009706497192383, "global_step": 170874, "epoch": 4068} {"train_loss": -7.001601696014404, "global_step": 170875, "epoch": 4068} {"train_loss": -7.065081596374512, "global_step": 170876, "epoch": 4068} {"train_loss": -7.03270149230957, "global_step": 170877, "epoch": 4068} {"train_loss": -7.103249549865723, "global_step": 170878, "epoch": 4068} {"train_loss": -7.172463417053223, "global_step": 170879, "epoch": 4068} {"train_loss": -7.075726509094238, "global_step": 170880, "epoch": 4068} {"train_loss": -7.056033134460449, "global_step": 170881, "epoch": 4068} {"train_loss": -6.964517593383789, "global_step": 170882, "epoch": 4068} {"train_loss": -7.014339447021484, "global_step": 170883, "epoch": 4068} {"train_loss": -7.000955581665039, "global_step": 170884, "epoch": 4068} {"train_loss": -7.080857753753662, "global_step": 170885, "epoch": 4068} {"train_loss": -7.01723575592041, "global_step": 170886, "epoch": 4068} {"train_loss": -6.906345844268799, "global_step": 170887, "epoch": 4068} {"train_loss": -6.965789794921875, "global_step": 170888, "epoch": 4068} {"train_loss": -7.018522262573242, "global_step": 170889, "epoch": 4068} {"train_loss": -7.016483306884766, "global_step": 170890, "epoch": 4068} {"train_loss": -6.951024055480957, "global_step": 170891, "epoch": 4068} {"train_loss": -7.034787654876709, "global_step": 170892, "epoch": 4068} {"train_loss": -7.080349445343018, "global_step": 170893, "epoch": 4068} {"train_loss": -7.09929084777832, "global_step": 170894, "epoch": 4068} {"train_loss": -7.049903392791748, "global_step": 170895, "epoch": 4068} {"train_loss": -7.073883056640625, "global_step": 170896, "epoch": 4068} {"train_loss": -7.026221400215512, "global_step": 170897, "epoch": 4068, "val_loss": 68556.390625} {"train_loss": -7.103360176086426, "global_step": 170898, "epoch": 4069} {"train_loss": -7.071127414703369, "global_step": 170899, "epoch": 4069} {"train_loss": -6.994141578674316, "global_step": 170900, "epoch": 4069} {"train_loss": -7.028308868408203, "global_step": 170901, "epoch": 4069} {"train_loss": -6.945958137512207, "global_step": 170902, "epoch": 4069} {"train_loss": -6.928243637084961, "global_step": 170903, "epoch": 4069} {"train_loss": -7.057943344116211, "global_step": 170904, "epoch": 4069} {"train_loss": -6.937335014343262, "global_step": 170905, "epoch": 4069} {"train_loss": -7.0182905197143555, "global_step": 170906, "epoch": 4069} {"train_loss": -7.131106376647949, "global_step": 170907, "epoch": 4069} {"train_loss": -6.8750081062316895, "global_step": 170908, "epoch": 4069} {"train_loss": -7.014648914337158, "global_step": 170909, "epoch": 4069} {"train_loss": -7.070262908935547, "global_step": 170910, "epoch": 4069} {"train_loss": -6.981708526611328, "global_step": 170911, "epoch": 4069} {"train_loss": -7.0399370193481445, "global_step": 170912, "epoch": 4069} {"train_loss": -6.9793314933776855, "global_step": 170913, "epoch": 4069} {"train_loss": -7.013506889343262, "global_step": 170914, "epoch": 4069} {"train_loss": -6.994573593139648, "global_step": 170915, "epoch": 4069} {"train_loss": -6.869756698608398, "global_step": 170916, "epoch": 4069} {"train_loss": -7.064725875854492, "global_step": 170917, "epoch": 4069} {"train_loss": -6.9542412757873535, "global_step": 170918, "epoch": 4069} {"train_loss": -6.9537672996521, "global_step": 170919, "epoch": 4069} {"train_loss": -7.031177520751953, "global_step": 170920, "epoch": 4069} {"train_loss": -6.808666706085205, "global_step": 170921, "epoch": 4069} {"train_loss": -7.000946044921875, "global_step": 170922, "epoch": 4069} {"train_loss": -6.791133880615234, "global_step": 170923, "epoch": 4069} {"train_loss": -6.903964996337891, "global_step": 170924, "epoch": 4069} {"train_loss": -6.831657886505127, "global_step": 170925, "epoch": 4069} {"train_loss": -6.864419460296631, "global_step": 170926, "epoch": 4069} {"train_loss": -6.898852348327637, "global_step": 170927, "epoch": 4069} {"train_loss": -6.902461051940918, "global_step": 170928, "epoch": 4069} {"train_loss": -6.8892927169799805, "global_step": 170929, "epoch": 4069} {"train_loss": -6.963627338409424, "global_step": 170930, "epoch": 4069} {"train_loss": -6.938168525695801, "global_step": 170931, "epoch": 4069} {"train_loss": -6.8769025802612305, "global_step": 170932, "epoch": 4069} {"train_loss": -6.8552141189575195, "global_step": 170933, "epoch": 4069} {"train_loss": -6.896480083465576, "global_step": 170934, "epoch": 4069} {"train_loss": -6.991673469543457, "global_step": 170935, "epoch": 4069} {"train_loss": -6.9243364334106445, "global_step": 170936, "epoch": 4069} {"train_loss": -6.923903465270996, "global_step": 170937, "epoch": 4069} {"train_loss": -6.995566368103027, "global_step": 170938, "epoch": 4069} {"train_loss": -6.960128682000296, "global_step": 170939, "epoch": 4069, "val_loss": 68796.9609375} {"train_loss": -6.891878604888916, "global_step": 170940, "epoch": 4070} {"train_loss": -7.00130033493042, "global_step": 170941, "epoch": 4070} {"train_loss": -7.057570457458496, "global_step": 170942, "epoch": 4070} {"train_loss": -6.968466281890869, "global_step": 170943, "epoch": 4070} {"train_loss": -6.930314064025879, "global_step": 170944, "epoch": 4070} {"train_loss": -6.889504432678223, "global_step": 170945, "epoch": 4070} {"train_loss": -7.012099742889404, "global_step": 170946, "epoch": 4070} {"train_loss": -6.989755153656006, "global_step": 170947, "epoch": 4070} {"train_loss": -7.022718906402588, "global_step": 170948, "epoch": 4070} {"train_loss": -7.04032039642334, "global_step": 170949, "epoch": 4070} {"train_loss": -7.0355072021484375, "global_step": 170950, "epoch": 4070} {"train_loss": -6.982863426208496, "global_step": 170951, "epoch": 4070} {"train_loss": -7.054329872131348, "global_step": 170952, "epoch": 4070} {"train_loss": -6.987545013427734, "global_step": 170953, "epoch": 4070} {"train_loss": -6.946544647216797, "global_step": 170954, "epoch": 4070} {"train_loss": -6.886941432952881, "global_step": 170955, "epoch": 4070} {"train_loss": -7.017114639282227, "global_step": 170956, "epoch": 4070} {"train_loss": -6.9478936195373535, "global_step": 170957, "epoch": 4070} {"train_loss": -6.907222270965576, "global_step": 170958, "epoch": 4070} {"train_loss": -6.9658918380737305, "global_step": 170959, "epoch": 4070} {"train_loss": -7.074214935302734, "global_step": 170960, "epoch": 4070} {"train_loss": -6.946592330932617, "global_step": 170961, "epoch": 4070} {"train_loss": -6.927136421203613, "global_step": 170962, "epoch": 4070} {"train_loss": -7.099884986877441, "global_step": 170963, "epoch": 4070} {"train_loss": -6.936497688293457, "global_step": 170964, "epoch": 4070} {"train_loss": -6.900557994842529, "global_step": 170965, "epoch": 4070} {"train_loss": -6.981534957885742, "global_step": 170966, "epoch": 4070} {"train_loss": -6.94862174987793, "global_step": 170967, "epoch": 4070} {"train_loss": -6.826627254486084, "global_step": 170968, "epoch": 4070} {"train_loss": -6.9522576332092285, "global_step": 170969, "epoch": 4070} {"train_loss": -7.109148025512695, "global_step": 170970, "epoch": 4070} {"train_loss": -6.933193206787109, "global_step": 170971, "epoch": 4070} {"train_loss": -7.042790412902832, "global_step": 170972, "epoch": 4070} {"train_loss": -7.1149702072143555, "global_step": 170973, "epoch": 4070} {"train_loss": -6.915487289428711, "global_step": 170974, "epoch": 4070} {"train_loss": -7.0996599197387695, "global_step": 170975, "epoch": 4070} {"train_loss": -7.04773473739624, "global_step": 170976, "epoch": 4070} {"train_loss": -7.086219787597656, "global_step": 170977, "epoch": 4070} {"train_loss": -7.035084247589111, "global_step": 170978, "epoch": 4070} {"train_loss": -7.065973281860352, "global_step": 170979, "epoch": 4070} {"train_loss": -7.0207414627075195, "global_step": 170980, "epoch": 4070} {"train_loss": -6.995629276548113, "global_step": 170981, "epoch": 4070, "val_loss": 68615.9140625} {"train_loss": -7.065914154052734, "global_step": 170982, "epoch": 4071} {"train_loss": -7.033670902252197, "global_step": 170983, "epoch": 4071} {"train_loss": -7.054080009460449, "global_step": 170984, "epoch": 4071} {"train_loss": -7.000577449798584, "global_step": 170985, "epoch": 4071} {"train_loss": -6.961745738983154, "global_step": 170986, "epoch": 4071} {"train_loss": -6.983675003051758, "global_step": 170987, "epoch": 4071} {"train_loss": -7.04129695892334, "global_step": 170988, "epoch": 4071} {"train_loss": -7.00706672668457, "global_step": 170989, "epoch": 4071} {"train_loss": -6.933553695678711, "global_step": 170990, "epoch": 4071} {"train_loss": -6.918207168579102, "global_step": 170991, "epoch": 4071} {"train_loss": -6.914867401123047, "global_step": 170992, "epoch": 4071} {"train_loss": -6.933743000030518, "global_step": 170993, "epoch": 4071} {"train_loss": -6.986151695251465, "global_step": 170994, "epoch": 4071} {"train_loss": -6.833281517028809, "global_step": 170995, "epoch": 4071} {"train_loss": -6.882464408874512, "global_step": 170996, "epoch": 4071} {"train_loss": -6.926431655883789, "global_step": 170997, "epoch": 4071} {"train_loss": -6.952759742736816, "global_step": 170998, "epoch": 4071} {"train_loss": -6.87950325012207, "global_step": 170999, "epoch": 4071} {"train_loss": -6.8915863037109375, "global_step": 171000, "epoch": 4071} {"train_loss": -6.84762716293335, "global_step": 171001, "epoch": 4071} {"train_loss": -6.979790687561035, "global_step": 171002, "epoch": 4071} {"train_loss": -6.958136558532715, "global_step": 171003, "epoch": 4071} {"train_loss": -6.8917436599731445, "global_step": 171004, "epoch": 4071} {"train_loss": -7.003560543060303, "global_step": 171005, "epoch": 4071} {"train_loss": -6.905702590942383, "global_step": 171006, "epoch": 4071} {"train_loss": -7.05943489074707, "global_step": 171007, "epoch": 4071} {"train_loss": -6.827508449554443, "global_step": 171008, "epoch": 4071} {"train_loss": -7.071074962615967, "global_step": 171009, "epoch": 4071} {"train_loss": -6.980526447296143, "global_step": 171010, "epoch": 4071} {"train_loss": -6.906537055969238, "global_step": 171011, "epoch": 4071} {"train_loss": -7.047538757324219, "global_step": 171012, "epoch": 4071} {"train_loss": -6.9832916259765625, "global_step": 171013, "epoch": 4071} {"train_loss": -6.854827880859375, "global_step": 171014, "epoch": 4071} {"train_loss": -6.990728378295898, "global_step": 171015, "epoch": 4071} {"train_loss": -6.776359558105469, "global_step": 171016, "epoch": 4071} {"train_loss": -6.847218036651611, "global_step": 171017, "epoch": 4071} {"train_loss": -6.930858612060547, "global_step": 171018, "epoch": 4071} {"train_loss": -6.689543724060059, "global_step": 171019, "epoch": 4071} {"train_loss": -6.897249221801758, "global_step": 171020, "epoch": 4071} {"train_loss": -6.9575347900390625, "global_step": 171021, "epoch": 4071} {"train_loss": -6.927327632904053, "global_step": 171022, "epoch": 4071} {"train_loss": -6.940857864561535, "global_step": 171023, "epoch": 4071, "val_loss": 68598.5546875} {"train_loss": -6.904200077056885, "global_step": 171024, "epoch": 4072} {"train_loss": -7.1107378005981445, "global_step": 171025, "epoch": 4072} {"train_loss": -6.987364768981934, "global_step": 171026, "epoch": 4072} {"train_loss": -7.12197732925415, "global_step": 171027, "epoch": 4072} {"train_loss": -7.038910865783691, "global_step": 171028, "epoch": 4072} {"train_loss": -6.924912452697754, "global_step": 171029, "epoch": 4072} {"train_loss": -7.081916332244873, "global_step": 171030, "epoch": 4072} {"train_loss": -6.867346286773682, "global_step": 171031, "epoch": 4072} {"train_loss": -7.018637657165527, "global_step": 171032, "epoch": 4072} {"train_loss": -6.9052510261535645, "global_step": 171033, "epoch": 4072} {"train_loss": -7.024768829345703, "global_step": 171034, "epoch": 4072} {"train_loss": -6.995108127593994, "global_step": 171035, "epoch": 4072} {"train_loss": -6.956984996795654, "global_step": 171036, "epoch": 4072} {"train_loss": -7.022730827331543, "global_step": 171037, "epoch": 4072} {"train_loss": -6.9923176765441895, "global_step": 171038, "epoch": 4072} {"train_loss": -7.085079669952393, "global_step": 171039, "epoch": 4072} {"train_loss": -6.950709342956543, "global_step": 171040, "epoch": 4072} {"train_loss": -7.069390773773193, "global_step": 171041, "epoch": 4072} {"train_loss": -6.968408107757568, "global_step": 171042, "epoch": 4072} {"train_loss": -6.93931770324707, "global_step": 171043, "epoch": 4072} {"train_loss": -7.100220680236816, "global_step": 171044, "epoch": 4072} {"train_loss": -6.889947891235352, "global_step": 171045, "epoch": 4072} {"train_loss": -6.962364196777344, "global_step": 171046, "epoch": 4072} {"train_loss": -6.95736837387085, "global_step": 171047, "epoch": 4072} {"train_loss": -6.898928165435791, "global_step": 171048, "epoch": 4072} {"train_loss": -6.9306464195251465, "global_step": 171049, "epoch": 4072} {"train_loss": -6.937185287475586, "global_step": 171050, "epoch": 4072} {"train_loss": -7.000788688659668, "global_step": 171051, "epoch": 4072} {"train_loss": -6.849244594573975, "global_step": 171052, "epoch": 4072} {"train_loss": -6.887559413909912, "global_step": 171053, "epoch": 4072} {"train_loss": -7.175849914550781, "global_step": 171054, "epoch": 4072} {"train_loss": -6.812711715698242, "global_step": 171055, "epoch": 4072} {"train_loss": -6.882368564605713, "global_step": 171056, "epoch": 4072} {"train_loss": -7.030942440032959, "global_step": 171057, "epoch": 4072} {"train_loss": -6.860492706298828, "global_step": 171058, "epoch": 4072} {"train_loss": -6.95927619934082, "global_step": 171059, "epoch": 4072} {"train_loss": -6.979502201080322, "global_step": 171060, "epoch": 4072} {"train_loss": -7.004815101623535, "global_step": 171061, "epoch": 4072} {"train_loss": -7.053342819213867, "global_step": 171062, "epoch": 4072} {"train_loss": -6.973341464996338, "global_step": 171063, "epoch": 4072} {"train_loss": -7.058811187744141, "global_step": 171064, "epoch": 4072} {"train_loss": -6.977495454606556, "global_step": 171065, "epoch": 4072, "val_loss": 68482.546875} {"train_loss": -6.854521751403809, "global_step": 171066, "epoch": 4073} {"train_loss": -7.031257629394531, "global_step": 171067, "epoch": 4073} {"train_loss": -7.017942428588867, "global_step": 171068, "epoch": 4073} {"train_loss": -7.039665222167969, "global_step": 171069, "epoch": 4073} {"train_loss": -7.001047134399414, "global_step": 171070, "epoch": 4073} {"train_loss": -6.963181972503662, "global_step": 171071, "epoch": 4073} {"train_loss": -7.130313873291016, "global_step": 171072, "epoch": 4073} {"train_loss": -7.056200981140137, "global_step": 171073, "epoch": 4073} {"train_loss": -7.052525520324707, "global_step": 171074, "epoch": 4073} {"train_loss": -7.0288777351379395, "global_step": 171075, "epoch": 4073} {"train_loss": -7.032344818115234, "global_step": 171076, "epoch": 4073} {"train_loss": -7.064260959625244, "global_step": 171077, "epoch": 4073} {"train_loss": -6.910358905792236, "global_step": 171078, "epoch": 4073} {"train_loss": -6.959445953369141, "global_step": 171079, "epoch": 4073} {"train_loss": -6.982668876647949, "global_step": 171080, "epoch": 4073} {"train_loss": -7.032604217529297, "global_step": 171081, "epoch": 4073} {"train_loss": -6.927887916564941, "global_step": 171082, "epoch": 4073} {"train_loss": -7.110965251922607, "global_step": 171083, "epoch": 4073} {"train_loss": -7.072186470031738, "global_step": 171084, "epoch": 4073} {"train_loss": -7.082467079162598, "global_step": 171085, "epoch": 4073} {"train_loss": -7.071238994598389, "global_step": 171086, "epoch": 4073} {"train_loss": -7.1087799072265625, "global_step": 171087, "epoch": 4073} {"train_loss": -6.939918518066406, "global_step": 171088, "epoch": 4073} {"train_loss": -7.039685249328613, "global_step": 171089, "epoch": 4073} {"train_loss": -6.89834451675415, "global_step": 171090, "epoch": 4073} {"train_loss": -6.945002555847168, "global_step": 171091, "epoch": 4073} {"train_loss": -6.948976516723633, "global_step": 171092, "epoch": 4073} {"train_loss": -6.9106125831604, "global_step": 171093, "epoch": 4073} {"train_loss": -6.8662285804748535, "global_step": 171094, "epoch": 4073} {"train_loss": -7.088090896606445, "global_step": 171095, "epoch": 4073} {"train_loss": -6.956369876861572, "global_step": 171096, "epoch": 4073} {"train_loss": -7.028879642486572, "global_step": 171097, "epoch": 4073} {"train_loss": -7.033418655395508, "global_step": 171098, "epoch": 4073} {"train_loss": -6.980097770690918, "global_step": 171099, "epoch": 4073} {"train_loss": -7.069327354431152, "global_step": 171100, "epoch": 4073} {"train_loss": -6.897506237030029, "global_step": 171101, "epoch": 4073} {"train_loss": -7.136739730834961, "global_step": 171102, "epoch": 4073} {"train_loss": -7.100194454193115, "global_step": 171103, "epoch": 4073} {"train_loss": -7.001716613769531, "global_step": 171104, "epoch": 4073} {"train_loss": -7.106024742126465, "global_step": 171105, "epoch": 4073} {"train_loss": -6.986863136291504, "global_step": 171106, "epoch": 4073} {"train_loss": -7.0110832963671, "global_step": 171107, "epoch": 4073, "val_loss": 68529.953125} {"train_loss": -6.988667011260986, "global_step": 171108, "epoch": 4074} {"train_loss": -7.059816360473633, "global_step": 171109, "epoch": 4074} {"train_loss": -7.062760353088379, "global_step": 171110, "epoch": 4074} {"train_loss": -7.022061824798584, "global_step": 171111, "epoch": 4074} {"train_loss": -6.943317413330078, "global_step": 171112, "epoch": 4074} {"train_loss": -7.078289031982422, "global_step": 171113, "epoch": 4074} {"train_loss": -7.015775680541992, "global_step": 171114, "epoch": 4074} {"train_loss": -7.052455902099609, "global_step": 171115, "epoch": 4074} {"train_loss": -6.767152786254883, "global_step": 171116, "epoch": 4074} {"train_loss": -6.835641860961914, "global_step": 171117, "epoch": 4074} {"train_loss": -6.933166027069092, "global_step": 171118, "epoch": 4074} {"train_loss": -6.851497650146484, "global_step": 171119, "epoch": 4074} {"train_loss": -6.9447855949401855, "global_step": 171120, "epoch": 4074} {"train_loss": -6.978342056274414, "global_step": 171121, "epoch": 4074} {"train_loss": -7.018821716308594, "global_step": 171122, "epoch": 4074} {"train_loss": -6.889299392700195, "global_step": 171123, "epoch": 4074} {"train_loss": -6.949142932891846, "global_step": 171124, "epoch": 4074} {"train_loss": -7.01933479309082, "global_step": 171125, "epoch": 4074} {"train_loss": -6.949528694152832, "global_step": 171126, "epoch": 4074} {"train_loss": -6.976537704467773, "global_step": 171127, "epoch": 4074} {"train_loss": -6.932047367095947, "global_step": 171128, "epoch": 4074} {"train_loss": -6.904475688934326, "global_step": 171129, "epoch": 4074} {"train_loss": -6.954951763153076, "global_step": 171130, "epoch": 4074} {"train_loss": -6.818510055541992, "global_step": 171131, "epoch": 4074} {"train_loss": -6.939385890960693, "global_step": 171132, "epoch": 4074} {"train_loss": -6.782208442687988, "global_step": 171133, "epoch": 4074} {"train_loss": -6.862076759338379, "global_step": 171134, "epoch": 4074} {"train_loss": -6.977797508239746, "global_step": 171135, "epoch": 4074} {"train_loss": -6.871517181396484, "global_step": 171136, "epoch": 4074} {"train_loss": -6.897482872009277, "global_step": 171137, "epoch": 4074} {"train_loss": -6.84346342086792, "global_step": 171138, "epoch": 4074} {"train_loss": -6.906721591949463, "global_step": 171139, "epoch": 4074} {"train_loss": -6.741372585296631, "global_step": 171140, "epoch": 4074} {"train_loss": -6.9854841232299805, "global_step": 171141, "epoch": 4074} {"train_loss": -6.733347415924072, "global_step": 171142, "epoch": 4074} {"train_loss": -6.819850921630859, "global_step": 171143, "epoch": 4074} {"train_loss": -6.994490623474121, "global_step": 171144, "epoch": 4074} {"train_loss": -6.893863201141357, "global_step": 171145, "epoch": 4074} {"train_loss": -6.9767608642578125, "global_step": 171146, "epoch": 4074} {"train_loss": -6.9183244705200195, "global_step": 171147, "epoch": 4074} {"train_loss": -6.959934234619141, "global_step": 171148, "epoch": 4074} {"train_loss": -6.926534823008946, "global_step": 171149, "epoch": 4074, "val_loss": 68567.953125} {"train_loss": -7.0106401443481445, "global_step": 171150, "epoch": 4075} {"train_loss": -6.948336601257324, "global_step": 171151, "epoch": 4075} {"train_loss": -6.95874547958374, "global_step": 171152, "epoch": 4075} {"train_loss": -6.973397254943848, "global_step": 171153, "epoch": 4075} {"train_loss": -6.940668106079102, "global_step": 171154, "epoch": 4075} {"train_loss": -7.021548271179199, "global_step": 171155, "epoch": 4075} {"train_loss": -7.036988258361816, "global_step": 171156, "epoch": 4075} {"train_loss": -7.090484619140625, "global_step": 171157, "epoch": 4075} {"train_loss": -6.981498718261719, "global_step": 171158, "epoch": 4075} {"train_loss": -6.988840103149414, "global_step": 171159, "epoch": 4075} {"train_loss": -6.9727888107299805, "global_step": 171160, "epoch": 4075} {"train_loss": -7.065296173095703, "global_step": 171161, "epoch": 4075} {"train_loss": -7.012108325958252, "global_step": 171162, "epoch": 4075} {"train_loss": -7.109055995941162, "global_step": 171163, "epoch": 4075} {"train_loss": -7.1137285232543945, "global_step": 171164, "epoch": 4075} {"train_loss": -6.980160713195801, "global_step": 171165, "epoch": 4075} {"train_loss": -7.09171199798584, "global_step": 171166, "epoch": 4075} {"train_loss": -7.075834274291992, "global_step": 171167, "epoch": 4075} {"train_loss": -7.021649360656738, "global_step": 171168, "epoch": 4075} {"train_loss": -7.007226943969727, "global_step": 171169, "epoch": 4075} {"train_loss": -7.056244850158691, "global_step": 171170, "epoch": 4075} {"train_loss": -7.164037704467773, "global_step": 171171, "epoch": 4075} {"train_loss": -7.045900344848633, "global_step": 171172, "epoch": 4075} {"train_loss": -7.1177215576171875, "global_step": 171173, "epoch": 4075} {"train_loss": -7.034729480743408, "global_step": 171174, "epoch": 4075} {"train_loss": -6.888143062591553, "global_step": 171175, "epoch": 4075} {"train_loss": -6.976430892944336, "global_step": 171176, "epoch": 4075} {"train_loss": -7.069389820098877, "global_step": 171177, "epoch": 4075} {"train_loss": -7.045927047729492, "global_step": 171178, "epoch": 4075} {"train_loss": -7.020263671875, "global_step": 171179, "epoch": 4075} {"train_loss": -7.049643516540527, "global_step": 171180, "epoch": 4075} {"train_loss": -7.059454441070557, "global_step": 171181, "epoch": 4075} {"train_loss": -7.077077865600586, "global_step": 171182, "epoch": 4075} {"train_loss": -6.967255592346191, "global_step": 171183, "epoch": 4075} {"train_loss": -7.082196235656738, "global_step": 171184, "epoch": 4075} {"train_loss": -7.056785583496094, "global_step": 171185, "epoch": 4075} {"train_loss": -7.123939514160156, "global_step": 171186, "epoch": 4075} {"train_loss": -7.098024368286133, "global_step": 171187, "epoch": 4075} {"train_loss": -7.004373073577881, "global_step": 171188, "epoch": 4075} {"train_loss": -7.104345798492432, "global_step": 171189, "epoch": 4075} {"train_loss": -7.044891357421875, "global_step": 171190, "epoch": 4075} {"train_loss": -7.037647996629987, "global_step": 171191, "epoch": 4075, "val_loss": 68529.0546875} {"train_loss": -7.027102947235107, "global_step": 171192, "epoch": 4076} {"train_loss": -6.927540302276611, "global_step": 171193, "epoch": 4076} {"train_loss": -7.082003116607666, "global_step": 171194, "epoch": 4076} {"train_loss": -6.9785919189453125, "global_step": 171195, "epoch": 4076} {"train_loss": -7.085163116455078, "global_step": 171196, "epoch": 4076} {"train_loss": -6.913222789764404, "global_step": 171197, "epoch": 4076} {"train_loss": -7.052558422088623, "global_step": 171198, "epoch": 4076} {"train_loss": -6.973666191101074, "global_step": 171199, "epoch": 4076} {"train_loss": -7.038668632507324, "global_step": 171200, "epoch": 4076} {"train_loss": -6.990625381469727, "global_step": 171201, "epoch": 4076} {"train_loss": -6.998412132263184, "global_step": 171202, "epoch": 4076} {"train_loss": -6.990406036376953, "global_step": 171203, "epoch": 4076} {"train_loss": -7.1103363037109375, "global_step": 171204, "epoch": 4076} {"train_loss": -6.928391456604004, "global_step": 171205, "epoch": 4076} {"train_loss": -7.035320281982422, "global_step": 171206, "epoch": 4076} {"train_loss": -6.918694972991943, "global_step": 171207, "epoch": 4076} {"train_loss": -6.98929500579834, "global_step": 171208, "epoch": 4076} {"train_loss": -6.994060516357422, "global_step": 171209, "epoch": 4076} {"train_loss": -7.028012752532959, "global_step": 171210, "epoch": 4076} {"train_loss": -7.064903259277344, "global_step": 171211, "epoch": 4076} {"train_loss": -6.947945594787598, "global_step": 171212, "epoch": 4076} {"train_loss": -6.934462547302246, "global_step": 171213, "epoch": 4076} {"train_loss": -6.998376846313477, "global_step": 171214, "epoch": 4076} {"train_loss": -7.060489654541016, "global_step": 171215, "epoch": 4076} {"train_loss": -6.9878315925598145, "global_step": 171216, "epoch": 4076} {"train_loss": -6.929474353790283, "global_step": 171217, "epoch": 4076} {"train_loss": -7.022548198699951, "global_step": 171218, "epoch": 4076} {"train_loss": -7.018649101257324, "global_step": 171219, "epoch": 4076} {"train_loss": -6.936549186706543, "global_step": 171220, "epoch": 4076} {"train_loss": -7.0418219566345215, "global_step": 171221, "epoch": 4076} {"train_loss": -7.0419416427612305, "global_step": 171222, "epoch": 4076} {"train_loss": -7.034085750579834, "global_step": 171223, "epoch": 4076} {"train_loss": -7.168767929077148, "global_step": 171224, "epoch": 4076} {"train_loss": -6.937817573547363, "global_step": 171225, "epoch": 4076} {"train_loss": -7.097843647003174, "global_step": 171226, "epoch": 4076} {"train_loss": -7.102639675140381, "global_step": 171227, "epoch": 4076} {"train_loss": -7.1634674072265625, "global_step": 171228, "epoch": 4076} {"train_loss": -6.949627876281738, "global_step": 171229, "epoch": 4076} {"train_loss": -7.02730655670166, "global_step": 171230, "epoch": 4076} {"train_loss": -7.136423110961914, "global_step": 171231, "epoch": 4076} {"train_loss": -7.059325218200684, "global_step": 171232, "epoch": 4076} {"train_loss": -7.018032948176066, "global_step": 171233, "epoch": 4076, "val_loss": 68449.6484375} {"train_loss": -7.140407562255859, "global_step": 171234, "epoch": 4077} {"train_loss": -7.089288711547852, "global_step": 171235, "epoch": 4077} {"train_loss": -6.8895087242126465, "global_step": 171236, "epoch": 4077} {"train_loss": -6.9287590980529785, "global_step": 171237, "epoch": 4077} {"train_loss": -7.091937065124512, "global_step": 171238, "epoch": 4077} {"train_loss": -7.0325517654418945, "global_step": 171239, "epoch": 4077} {"train_loss": -6.850872039794922, "global_step": 171240, "epoch": 4077} {"train_loss": -6.959355354309082, "global_step": 171241, "epoch": 4077} {"train_loss": -6.954285621643066, "global_step": 171242, "epoch": 4077} {"train_loss": -6.841559886932373, "global_step": 171243, "epoch": 4077} {"train_loss": -6.798686981201172, "global_step": 171244, "epoch": 4077} {"train_loss": -6.956597805023193, "global_step": 171245, "epoch": 4077} {"train_loss": -6.811422348022461, "global_step": 171246, "epoch": 4077} {"train_loss": -6.884960174560547, "global_step": 171247, "epoch": 4077} {"train_loss": -6.989924430847168, "global_step": 171248, "epoch": 4077} {"train_loss": -6.987196922302246, "global_step": 171249, "epoch": 4077} {"train_loss": -7.024316787719727, "global_step": 171250, "epoch": 4077} {"train_loss": -6.940306663513184, "global_step": 171251, "epoch": 4077} {"train_loss": -6.957845211029053, "global_step": 171252, "epoch": 4077} {"train_loss": -6.936984539031982, "global_step": 171253, "epoch": 4077} {"train_loss": -6.939810276031494, "global_step": 171254, "epoch": 4077} {"train_loss": -6.919026851654053, "global_step": 171255, "epoch": 4077} {"train_loss": -6.989386558532715, "global_step": 171256, "epoch": 4077} {"train_loss": -7.01513147354126, "global_step": 171257, "epoch": 4077} {"train_loss": -6.944761276245117, "global_step": 171258, "epoch": 4077} {"train_loss": -6.847694396972656, "global_step": 171259, "epoch": 4077} {"train_loss": -7.054390907287598, "global_step": 171260, "epoch": 4077} {"train_loss": -6.834990978240967, "global_step": 171261, "epoch": 4077} {"train_loss": -6.886195182800293, "global_step": 171262, "epoch": 4077} {"train_loss": -6.890787601470947, "global_step": 171263, "epoch": 4077} {"train_loss": -6.913384437561035, "global_step": 171264, "epoch": 4077} {"train_loss": -6.870490074157715, "global_step": 171265, "epoch": 4077} {"train_loss": -6.828944206237793, "global_step": 171266, "epoch": 4077} {"train_loss": -6.95015811920166, "global_step": 171267, "epoch": 4077} {"train_loss": -6.845448970794678, "global_step": 171268, "epoch": 4077} {"train_loss": -6.856084823608398, "global_step": 171269, "epoch": 4077} {"train_loss": -6.950740814208984, "global_step": 171270, "epoch": 4077} {"train_loss": -6.793900966644287, "global_step": 171271, "epoch": 4077} {"train_loss": -7.0038886070251465, "global_step": 171272, "epoch": 4077} {"train_loss": -6.990041255950928, "global_step": 171273, "epoch": 4077} {"train_loss": -6.938122272491455, "global_step": 171274, "epoch": 4077} {"train_loss": -6.934899579911005, "global_step": 171275, "epoch": 4077, "val_loss": 68586.140625} {"train_loss": -6.936548709869385, "global_step": 171276, "epoch": 4078} {"train_loss": -6.9766645431518555, "global_step": 171277, "epoch": 4078} {"train_loss": -7.036555290222168, "global_step": 171278, "epoch": 4078} {"train_loss": -7.052395820617676, "global_step": 171279, "epoch": 4078} {"train_loss": -6.97354793548584, "global_step": 171280, "epoch": 4078} {"train_loss": -7.009947776794434, "global_step": 171281, "epoch": 4078} {"train_loss": -6.946314811706543, "global_step": 171282, "epoch": 4078} {"train_loss": -6.971321105957031, "global_step": 171283, "epoch": 4078} {"train_loss": -6.994510650634766, "global_step": 171284, "epoch": 4078} {"train_loss": -6.970434665679932, "global_step": 171285, "epoch": 4078} {"train_loss": -7.036205291748047, "global_step": 171286, "epoch": 4078} {"train_loss": -6.89847993850708, "global_step": 171287, "epoch": 4078} {"train_loss": -6.9563398361206055, "global_step": 171288, "epoch": 4078} {"train_loss": -7.045536041259766, "global_step": 171289, "epoch": 4078} {"train_loss": -7.102858543395996, "global_step": 171290, "epoch": 4078} {"train_loss": -7.056600570678711, "global_step": 171291, "epoch": 4078} {"train_loss": -7.046716690063477, "global_step": 171292, "epoch": 4078} {"train_loss": -7.078325271606445, "global_step": 171293, "epoch": 4078} {"train_loss": -7.144777774810791, "global_step": 171294, "epoch": 4078} {"train_loss": -7.127930164337158, "global_step": 171295, "epoch": 4078} {"train_loss": -7.049323558807373, "global_step": 171296, "epoch": 4078} {"train_loss": -6.989874839782715, "global_step": 171297, "epoch": 4078} {"train_loss": -7.154989242553711, "global_step": 171298, "epoch": 4078} {"train_loss": -7.166341781616211, "global_step": 171299, "epoch": 4078} {"train_loss": -7.061586380004883, "global_step": 171300, "epoch": 4078} {"train_loss": -7.104157447814941, "global_step": 171301, "epoch": 4078} {"train_loss": -7.117276668548584, "global_step": 171302, "epoch": 4078} {"train_loss": -7.214594841003418, "global_step": 171303, "epoch": 4078} {"train_loss": -7.111234664916992, "global_step": 171304, "epoch": 4078} {"train_loss": -6.975589275360107, "global_step": 171305, "epoch": 4078} {"train_loss": -7.079392433166504, "global_step": 171306, "epoch": 4078} {"train_loss": -7.076929092407227, "global_step": 171307, "epoch": 4078} {"train_loss": -7.008591175079346, "global_step": 171308, "epoch": 4078} {"train_loss": -7.099783897399902, "global_step": 171309, "epoch": 4078} {"train_loss": -7.183732986450195, "global_step": 171310, "epoch": 4078} {"train_loss": -7.087924003601074, "global_step": 171311, "epoch": 4078} {"train_loss": -7.183950424194336, "global_step": 171312, "epoch": 4078} {"train_loss": -6.988815784454346, "global_step": 171313, "epoch": 4078} {"train_loss": -7.023416519165039, "global_step": 171314, "epoch": 4078} {"train_loss": -6.99083137512207, "global_step": 171315, "epoch": 4078} {"train_loss": -7.157498359680176, "global_step": 171316, "epoch": 4078} {"train_loss": -7.053360655194237, "global_step": 171317, "epoch": 4078, "val_loss": 68604.9609375} {"train_loss": -7.129066467285156, "global_step": 171318, "epoch": 4079} {"train_loss": -7.076885223388672, "global_step": 171319, "epoch": 4079} {"train_loss": -7.036681175231934, "global_step": 171320, "epoch": 4079} {"train_loss": -7.163908004760742, "global_step": 171321, "epoch": 4079} {"train_loss": -7.015410423278809, "global_step": 171322, "epoch": 4079} {"train_loss": -7.105091094970703, "global_step": 171323, "epoch": 4079} {"train_loss": -7.094237327575684, "global_step": 171324, "epoch": 4079} {"train_loss": -7.054633140563965, "global_step": 171325, "epoch": 4079} {"train_loss": -7.059296607971191, "global_step": 171326, "epoch": 4079} {"train_loss": -7.028958797454834, "global_step": 171327, "epoch": 4079} {"train_loss": -7.049927234649658, "global_step": 171328, "epoch": 4079} {"train_loss": -6.975503921508789, "global_step": 171329, "epoch": 4079} {"train_loss": -6.994434356689453, "global_step": 171330, "epoch": 4079} {"train_loss": -7.081901550292969, "global_step": 171331, "epoch": 4079} {"train_loss": -7.002618789672852, "global_step": 171332, "epoch": 4079} {"train_loss": -6.902388572692871, "global_step": 171333, "epoch": 4079} {"train_loss": -6.86216402053833, "global_step": 171334, "epoch": 4079} {"train_loss": -7.144161224365234, "global_step": 171335, "epoch": 4079} {"train_loss": -6.944605827331543, "global_step": 171336, "epoch": 4079} {"train_loss": -6.891814708709717, "global_step": 171337, "epoch": 4079} {"train_loss": -6.984216690063477, "global_step": 171338, "epoch": 4079} {"train_loss": -6.850638389587402, "global_step": 171339, "epoch": 4079} {"train_loss": -7.012491226196289, "global_step": 171340, "epoch": 4079} {"train_loss": -6.9425482749938965, "global_step": 171341, "epoch": 4079} {"train_loss": -6.82720422744751, "global_step": 171342, "epoch": 4079} {"train_loss": -6.937613487243652, "global_step": 171343, "epoch": 4079} {"train_loss": -6.8524627685546875, "global_step": 171344, "epoch": 4079} {"train_loss": -6.766033172607422, "global_step": 171345, "epoch": 4079} {"train_loss": -6.895905494689941, "global_step": 171346, "epoch": 4079} {"train_loss": -6.88275671005249, "global_step": 171347, "epoch": 4079} {"train_loss": -6.869503021240234, "global_step": 171348, "epoch": 4079} {"train_loss": -6.945396900177002, "global_step": 171349, "epoch": 4079} {"train_loss": -6.904883861541748, "global_step": 171350, "epoch": 4079} {"train_loss": -6.8884196281433105, "global_step": 171351, "epoch": 4079} {"train_loss": -6.901263236999512, "global_step": 171352, "epoch": 4079} {"train_loss": -6.878511428833008, "global_step": 171353, "epoch": 4079} {"train_loss": -6.913427352905273, "global_step": 171354, "epoch": 4079} {"train_loss": -6.8443098068237305, "global_step": 171355, "epoch": 4079} {"train_loss": -6.843931198120117, "global_step": 171356, "epoch": 4079} {"train_loss": -6.8747406005859375, "global_step": 171357, "epoch": 4079} {"train_loss": -6.904007911682129, "global_step": 171358, "epoch": 4079} {"train_loss": -6.955923114504133, "global_step": 171359, "epoch": 4079, "val_loss": 68580.625} {"train_loss": -7.057693004608154, "global_step": 171360, "epoch": 4080} {"train_loss": -6.931639671325684, "global_step": 171361, "epoch": 4080} {"train_loss": -7.0214033126831055, "global_step": 171362, "epoch": 4080} {"train_loss": -6.993974208831787, "global_step": 171363, "epoch": 4080} {"train_loss": -6.819791316986084, "global_step": 171364, "epoch": 4080} {"train_loss": -6.975804805755615, "global_step": 171365, "epoch": 4080} {"train_loss": -7.023833274841309, "global_step": 171366, "epoch": 4080} {"train_loss": -6.863424777984619, "global_step": 171367, "epoch": 4080} {"train_loss": -6.8892974853515625, "global_step": 171368, "epoch": 4080} {"train_loss": -7.06294059753418, "global_step": 171369, "epoch": 4080} {"train_loss": -7.000489234924316, "global_step": 171370, "epoch": 4080} {"train_loss": -6.964283466339111, "global_step": 171371, "epoch": 4080} {"train_loss": -7.018826007843018, "global_step": 171372, "epoch": 4080} {"train_loss": -6.929584980010986, "global_step": 171373, "epoch": 4080} {"train_loss": -7.07600212097168, "global_step": 171374, "epoch": 4080} {"train_loss": -6.917728424072266, "global_step": 171375, "epoch": 4080} {"train_loss": -7.0818867683410645, "global_step": 171376, "epoch": 4080} {"train_loss": -7.033464431762695, "global_step": 171377, "epoch": 4080} {"train_loss": -6.937233924865723, "global_step": 171378, "epoch": 4080} {"train_loss": -6.886499881744385, "global_step": 171379, "epoch": 4080} {"train_loss": -7.037752628326416, "global_step": 171380, "epoch": 4080} {"train_loss": -6.969404220581055, "global_step": 171381, "epoch": 4080} {"train_loss": -7.096576690673828, "global_step": 171382, "epoch": 4080} {"train_loss": -7.0432891845703125, "global_step": 171383, "epoch": 4080} {"train_loss": -7.06308650970459, "global_step": 171384, "epoch": 4080} {"train_loss": -7.0363545417785645, "global_step": 171385, "epoch": 4080} {"train_loss": -6.925385475158691, "global_step": 171386, "epoch": 4080} {"train_loss": -6.999682903289795, "global_step": 171387, "epoch": 4080} {"train_loss": -6.980891227722168, "global_step": 171388, "epoch": 4080} {"train_loss": -6.953315734863281, "global_step": 171389, "epoch": 4080} {"train_loss": -7.079884052276611, "global_step": 171390, "epoch": 4080} {"train_loss": -7.002356052398682, "global_step": 171391, "epoch": 4080} {"train_loss": -7.074502944946289, "global_step": 171392, "epoch": 4080} {"train_loss": -7.07680082321167, "global_step": 171393, "epoch": 4080} {"train_loss": -7.043811321258545, "global_step": 171394, "epoch": 4080} {"train_loss": -7.084633827209473, "global_step": 171395, "epoch": 4080} {"train_loss": -7.140981674194336, "global_step": 171396, "epoch": 4080} {"train_loss": -7.02943754196167, "global_step": 171397, "epoch": 4080} {"train_loss": -7.034404277801514, "global_step": 171398, "epoch": 4080} {"train_loss": -7.043603420257568, "global_step": 171399, "epoch": 4080} {"train_loss": -6.995626926422119, "global_step": 171400, "epoch": 4080} {"train_loss": -7.005093347458613, "global_step": 171401, "epoch": 4080, "val_loss": 68584.0546875} {"train_loss": -6.937363147735596, "global_step": 171402, "epoch": 4081} {"train_loss": -6.869267463684082, "global_step": 171403, "epoch": 4081} {"train_loss": -6.927127838134766, "global_step": 171404, "epoch": 4081} {"train_loss": -7.00054931640625, "global_step": 171405, "epoch": 4081} {"train_loss": -6.968801021575928, "global_step": 171406, "epoch": 4081} {"train_loss": -6.889785289764404, "global_step": 171407, "epoch": 4081} {"train_loss": -6.954002857208252, "global_step": 171408, "epoch": 4081} {"train_loss": -7.003525733947754, "global_step": 171409, "epoch": 4081} {"train_loss": -6.9486494064331055, "global_step": 171410, "epoch": 4081} {"train_loss": -6.765220642089844, "global_step": 171411, "epoch": 4081} {"train_loss": -7.0939788818359375, "global_step": 171412, "epoch": 4081} {"train_loss": -7.085855960845947, "global_step": 171413, "epoch": 4081} {"train_loss": -7.031253337860107, "global_step": 171414, "epoch": 4081} {"train_loss": -6.9620256423950195, "global_step": 171415, "epoch": 4081} {"train_loss": -7.052072525024414, "global_step": 171416, "epoch": 4081} {"train_loss": -6.993293285369873, "global_step": 171417, "epoch": 4081} {"train_loss": -6.976191997528076, "global_step": 171418, "epoch": 4081} {"train_loss": -7.030892372131348, "global_step": 171419, "epoch": 4081} {"train_loss": -6.93400764465332, "global_step": 171420, "epoch": 4081} {"train_loss": -6.986965179443359, "global_step": 171421, "epoch": 4081} {"train_loss": -7.054091453552246, "global_step": 171422, "epoch": 4081} {"train_loss": -6.967108249664307, "global_step": 171423, "epoch": 4081} {"train_loss": -6.984189987182617, "global_step": 171424, "epoch": 4081} {"train_loss": -6.963214874267578, "global_step": 171425, "epoch": 4081} {"train_loss": -6.95790958404541, "global_step": 171426, "epoch": 4081} {"train_loss": -7.050324440002441, "global_step": 171427, "epoch": 4081} {"train_loss": -6.894778251647949, "global_step": 171428, "epoch": 4081} {"train_loss": -6.881535530090332, "global_step": 171429, "epoch": 4081} {"train_loss": -6.994009017944336, "global_step": 171430, "epoch": 4081} {"train_loss": -6.798098087310791, "global_step": 171431, "epoch": 4081} {"train_loss": -6.934086799621582, "global_step": 171432, "epoch": 4081} {"train_loss": -6.861659049987793, "global_step": 171433, "epoch": 4081} {"train_loss": -6.898921489715576, "global_step": 171434, "epoch": 4081} {"train_loss": -6.912317276000977, "global_step": 171435, "epoch": 4081} {"train_loss": -6.921456336975098, "global_step": 171436, "epoch": 4081} {"train_loss": -7.031887531280518, "global_step": 171437, "epoch": 4081} {"train_loss": -6.968239784240723, "global_step": 171438, "epoch": 4081} {"train_loss": -6.918344020843506, "global_step": 171439, "epoch": 4081} {"train_loss": -6.946707725524902, "global_step": 171440, "epoch": 4081} {"train_loss": -6.857395172119141, "global_step": 171441, "epoch": 4081} {"train_loss": -6.900460720062256, "global_step": 171442, "epoch": 4081} {"train_loss": -6.955024208341326, "global_step": 171443, "epoch": 4081, "val_loss": 68578.3046875} {"train_loss": -7.032590866088867, "global_step": 171444, "epoch": 4082} {"train_loss": -7.026801109313965, "global_step": 171445, "epoch": 4082} {"train_loss": -7.024643898010254, "global_step": 171446, "epoch": 4082} {"train_loss": -6.9857354164123535, "global_step": 171447, "epoch": 4082} {"train_loss": -7.117550373077393, "global_step": 171448, "epoch": 4082} {"train_loss": -7.069578170776367, "global_step": 171449, "epoch": 4082} {"train_loss": -6.939067840576172, "global_step": 171450, "epoch": 4082} {"train_loss": -7.036147117614746, "global_step": 171451, "epoch": 4082} {"train_loss": -7.105149745941162, "global_step": 171452, "epoch": 4082} {"train_loss": -7.0828447341918945, "global_step": 171453, "epoch": 4082} {"train_loss": -7.089015960693359, "global_step": 171454, "epoch": 4082} {"train_loss": -7.042267799377441, "global_step": 171455, "epoch": 4082} {"train_loss": -6.921807289123535, "global_step": 171456, "epoch": 4082} {"train_loss": -6.930872917175293, "global_step": 171457, "epoch": 4082} {"train_loss": -7.087794303894043, "global_step": 171458, "epoch": 4082} {"train_loss": -6.900282382965088, "global_step": 171459, "epoch": 4082} {"train_loss": -7.148082733154297, "global_step": 171460, "epoch": 4082} {"train_loss": -7.025370121002197, "global_step": 171461, "epoch": 4082} {"train_loss": -7.129395484924316, "global_step": 171462, "epoch": 4082} {"train_loss": -6.992841720581055, "global_step": 171463, "epoch": 4082} {"train_loss": -7.102640628814697, "global_step": 171464, "epoch": 4082} {"train_loss": -7.093733310699463, "global_step": 171465, "epoch": 4082} {"train_loss": -6.939043998718262, "global_step": 171466, "epoch": 4082} {"train_loss": -7.078221321105957, "global_step": 171467, "epoch": 4082} {"train_loss": -6.97590970993042, "global_step": 171468, "epoch": 4082} {"train_loss": -6.900171279907227, "global_step": 171469, "epoch": 4082} {"train_loss": -6.982207775115967, "global_step": 171470, "epoch": 4082} {"train_loss": -7.035404205322266, "global_step": 171471, "epoch": 4082} {"train_loss": -6.968289852142334, "global_step": 171472, "epoch": 4082} {"train_loss": -6.988905429840088, "global_step": 171473, "epoch": 4082} {"train_loss": -6.9594926834106445, "global_step": 171474, "epoch": 4082} {"train_loss": -6.9850969314575195, "global_step": 171475, "epoch": 4082} {"train_loss": -6.935478210449219, "global_step": 171476, "epoch": 4082} {"train_loss": -7.118046760559082, "global_step": 171477, "epoch": 4082} {"train_loss": -6.893409729003906, "global_step": 171478, "epoch": 4082} {"train_loss": -6.939380645751953, "global_step": 171479, "epoch": 4082} {"train_loss": -6.876995086669922, "global_step": 171480, "epoch": 4082} {"train_loss": -6.908170700073242, "global_step": 171481, "epoch": 4082} {"train_loss": -7.037163257598877, "global_step": 171482, "epoch": 4082} {"train_loss": -6.94963264465332, "global_step": 171483, "epoch": 4082} {"train_loss": -6.854554176330566, "global_step": 171484, "epoch": 4082} {"train_loss": -7.0065324533553355, "global_step": 171485, "epoch": 4082, "val_loss": 68644.28125} {"train_loss": -6.9991455078125, "global_step": 171486, "epoch": 4083} {"train_loss": -7.07610559463501, "global_step": 171487, "epoch": 4083} {"train_loss": -6.952338218688965, "global_step": 171488, "epoch": 4083} {"train_loss": -6.9366350173950195, "global_step": 171489, "epoch": 4083} {"train_loss": -7.001884937286377, "global_step": 171490, "epoch": 4083} {"train_loss": -7.022018909454346, "global_step": 171491, "epoch": 4083} {"train_loss": -7.099554538726807, "global_step": 171492, "epoch": 4083} {"train_loss": -7.051670074462891, "global_step": 171493, "epoch": 4083} {"train_loss": -7.075986385345459, "global_step": 171494, "epoch": 4083} {"train_loss": -7.102394104003906, "global_step": 171495, "epoch": 4083} {"train_loss": -6.9171905517578125, "global_step": 171496, "epoch": 4083} {"train_loss": -6.978547096252441, "global_step": 171497, "epoch": 4083} {"train_loss": -6.999698638916016, "global_step": 171498, "epoch": 4083} {"train_loss": -7.0676960945129395, "global_step": 171499, "epoch": 4083} {"train_loss": -6.981935024261475, "global_step": 171500, "epoch": 4083} {"train_loss": -6.986856460571289, "global_step": 171501, "epoch": 4083} {"train_loss": -6.894834518432617, "global_step": 171502, "epoch": 4083} {"train_loss": -7.0489501953125, "global_step": 171503, "epoch": 4083} {"train_loss": -7.023157119750977, "global_step": 171504, "epoch": 4083} {"train_loss": -6.994240760803223, "global_step": 171505, "epoch": 4083} {"train_loss": -7.119742393493652, "global_step": 171506, "epoch": 4083} {"train_loss": -7.088040828704834, "global_step": 171507, "epoch": 4083} {"train_loss": -6.965913772583008, "global_step": 171508, "epoch": 4083} {"train_loss": -7.098580360412598, "global_step": 171509, "epoch": 4083} {"train_loss": -6.9716925621032715, "global_step": 171510, "epoch": 4083} {"train_loss": -7.1542863845825195, "global_step": 171511, "epoch": 4083} {"train_loss": -7.095908164978027, "global_step": 171512, "epoch": 4083} {"train_loss": -6.733824729919434, "global_step": 171513, "epoch": 4083} {"train_loss": -7.059469699859619, "global_step": 171514, "epoch": 4083} {"train_loss": -6.885356903076172, "global_step": 171515, "epoch": 4083} {"train_loss": -6.908622741699219, "global_step": 171516, "epoch": 4083} {"train_loss": -7.060665130615234, "global_step": 171517, "epoch": 4083} {"train_loss": -6.975927829742432, "global_step": 171518, "epoch": 4083} {"train_loss": -6.819296836853027, "global_step": 171519, "epoch": 4083} {"train_loss": -6.991994857788086, "global_step": 171520, "epoch": 4083} {"train_loss": -6.725950241088867, "global_step": 171521, "epoch": 4083} {"train_loss": -7.04518985748291, "global_step": 171522, "epoch": 4083} {"train_loss": -6.865865707397461, "global_step": 171523, "epoch": 4083} {"train_loss": -6.930037498474121, "global_step": 171524, "epoch": 4083} {"train_loss": -6.95958137512207, "global_step": 171525, "epoch": 4083} {"train_loss": -6.994562149047852, "global_step": 171526, "epoch": 4083} {"train_loss": -6.991019827978952, "global_step": 171527, "epoch": 4083, "val_loss": 68565.546875} {"train_loss": -6.889279842376709, "global_step": 171528, "epoch": 4084} {"train_loss": -6.8321332931518555, "global_step": 171529, "epoch": 4084} {"train_loss": -6.985555648803711, "global_step": 171530, "epoch": 4084} {"train_loss": -6.834655284881592, "global_step": 171531, "epoch": 4084} {"train_loss": -7.0404157638549805, "global_step": 171532, "epoch": 4084} {"train_loss": -6.848111629486084, "global_step": 171533, "epoch": 4084} {"train_loss": -6.826141834259033, "global_step": 171534, "epoch": 4084} {"train_loss": -7.033688545227051, "global_step": 171535, "epoch": 4084} {"train_loss": -6.964484214782715, "global_step": 171536, "epoch": 4084} {"train_loss": -7.008879661560059, "global_step": 171537, "epoch": 4084} {"train_loss": -6.932726860046387, "global_step": 171538, "epoch": 4084} {"train_loss": -6.940646171569824, "global_step": 171539, "epoch": 4084} {"train_loss": -6.834012031555176, "global_step": 171540, "epoch": 4084} {"train_loss": -6.935818672180176, "global_step": 171541, "epoch": 4084} {"train_loss": -6.7186479568481445, "global_step": 171542, "epoch": 4084} {"train_loss": -6.891116142272949, "global_step": 171543, "epoch": 4084} {"train_loss": -6.845658779144287, "global_step": 171544, "epoch": 4084} {"train_loss": -6.990095138549805, "global_step": 171545, "epoch": 4084} {"train_loss": -6.949229717254639, "global_step": 171546, "epoch": 4084} {"train_loss": -6.922825813293457, "global_step": 171547, "epoch": 4084} {"train_loss": -6.955780982971191, "global_step": 171548, "epoch": 4084} {"train_loss": -6.884535312652588, "global_step": 171549, "epoch": 4084} {"train_loss": -7.021673202514648, "global_step": 171550, "epoch": 4084} {"train_loss": -7.0133819580078125, "global_step": 171551, "epoch": 4084} {"train_loss": -7.069400787353516, "global_step": 171552, "epoch": 4084} {"train_loss": -6.857143402099609, "global_step": 171553, "epoch": 4084} {"train_loss": -7.105118751525879, "global_step": 171554, "epoch": 4084} {"train_loss": -6.8702192306518555, "global_step": 171555, "epoch": 4084} {"train_loss": -6.971953392028809, "global_step": 171556, "epoch": 4084} {"train_loss": -7.047410011291504, "global_step": 171557, "epoch": 4084} {"train_loss": -6.967331886291504, "global_step": 171558, "epoch": 4084} {"train_loss": -6.866238117218018, "global_step": 171559, "epoch": 4084} {"train_loss": -6.979504108428955, "global_step": 171560, "epoch": 4084} {"train_loss": -7.007924556732178, "global_step": 171561, "epoch": 4084} {"train_loss": -6.88087272644043, "global_step": 171562, "epoch": 4084} {"train_loss": -7.012035846710205, "global_step": 171563, "epoch": 4084} {"train_loss": -7.038269519805908, "global_step": 171564, "epoch": 4084} {"train_loss": -7.027198791503906, "global_step": 171565, "epoch": 4084} {"train_loss": -7.03851318359375, "global_step": 171566, "epoch": 4084} {"train_loss": -6.994030475616455, "global_step": 171567, "epoch": 4084} {"train_loss": -7.058261394500732, "global_step": 171568, "epoch": 4084} {"train_loss": -6.948289133253551, "global_step": 171569, "epoch": 4084, "val_loss": 68492.5859375} {"train_loss": -6.968632698059082, "global_step": 171570, "epoch": 4085} {"train_loss": -6.966291427612305, "global_step": 171571, "epoch": 4085} {"train_loss": -6.96340274810791, "global_step": 171572, "epoch": 4085} {"train_loss": -6.965152740478516, "global_step": 171573, "epoch": 4085} {"train_loss": -6.943519592285156, "global_step": 171574, "epoch": 4085} {"train_loss": -6.9707489013671875, "global_step": 171575, "epoch": 4085} {"train_loss": -7.084208011627197, "global_step": 171576, "epoch": 4085} {"train_loss": -6.896255970001221, "global_step": 171577, "epoch": 4085} {"train_loss": -6.984502792358398, "global_step": 171578, "epoch": 4085} {"train_loss": -6.9158101081848145, "global_step": 171579, "epoch": 4085} {"train_loss": -7.066095352172852, "global_step": 171580, "epoch": 4085} {"train_loss": -6.934238910675049, "global_step": 171581, "epoch": 4085} {"train_loss": -6.928681373596191, "global_step": 171582, "epoch": 4085} {"train_loss": -7.045788764953613, "global_step": 171583, "epoch": 4085} {"train_loss": -7.049873352050781, "global_step": 171584, "epoch": 4085} {"train_loss": -6.916470050811768, "global_step": 171585, "epoch": 4085} {"train_loss": -7.05659294128418, "global_step": 171586, "epoch": 4085} {"train_loss": -6.969358444213867, "global_step": 171587, "epoch": 4085} {"train_loss": -6.864928245544434, "global_step": 171588, "epoch": 4085} {"train_loss": -7.085052490234375, "global_step": 171589, "epoch": 4085} {"train_loss": -7.027724742889404, "global_step": 171590, "epoch": 4085} {"train_loss": -6.917329788208008, "global_step": 171591, "epoch": 4085} {"train_loss": -6.992229461669922, "global_step": 171592, "epoch": 4085} {"train_loss": -6.87251091003418, "global_step": 171593, "epoch": 4085} {"train_loss": -6.989904403686523, "global_step": 171594, "epoch": 4085} {"train_loss": -7.133995532989502, "global_step": 171595, "epoch": 4085} {"train_loss": -7.014593124389648, "global_step": 171596, "epoch": 4085} {"train_loss": -7.038955211639404, "global_step": 171597, "epoch": 4085} {"train_loss": -6.957006454467773, "global_step": 171598, "epoch": 4085} {"train_loss": -6.901599407196045, "global_step": 171599, "epoch": 4085} {"train_loss": -7.0115203857421875, "global_step": 171600, "epoch": 4085} {"train_loss": -6.944629669189453, "global_step": 171601, "epoch": 4085} {"train_loss": -7.075615882873535, "global_step": 171602, "epoch": 4085} {"train_loss": -7.120656490325928, "global_step": 171603, "epoch": 4085} {"train_loss": -7.048104286193848, "global_step": 171604, "epoch": 4085} {"train_loss": -6.978753089904785, "global_step": 171605, "epoch": 4085} {"train_loss": -7.0470781326293945, "global_step": 171606, "epoch": 4085} {"train_loss": -7.13060998916626, "global_step": 171607, "epoch": 4085} {"train_loss": -7.059606075286865, "global_step": 171608, "epoch": 4085} {"train_loss": -7.128078460693359, "global_step": 171609, "epoch": 4085} {"train_loss": -7.036064147949219, "global_step": 171610, "epoch": 4085} {"train_loss": -6.999357371103196, "global_step": 171611, "epoch": 4085, "val_loss": 68691.7109375} {"train_loss": -7.081721305847168, "global_step": 171612, "epoch": 4086} {"train_loss": -7.045371055603027, "global_step": 171613, "epoch": 4086} {"train_loss": -7.119055271148682, "global_step": 171614, "epoch": 4086} {"train_loss": -7.195670127868652, "global_step": 171615, "epoch": 4086} {"train_loss": -7.032654762268066, "global_step": 171616, "epoch": 4086} {"train_loss": -7.004982948303223, "global_step": 171617, "epoch": 4086} {"train_loss": -7.003078460693359, "global_step": 171618, "epoch": 4086} {"train_loss": -6.949185371398926, "global_step": 171619, "epoch": 4086} {"train_loss": -6.950765609741211, "global_step": 171620, "epoch": 4086} {"train_loss": -6.991222381591797, "global_step": 171621, "epoch": 4086} {"train_loss": -7.018387794494629, "global_step": 171622, "epoch": 4086} {"train_loss": -7.0829620361328125, "global_step": 171623, "epoch": 4086} {"train_loss": -6.936823844909668, "global_step": 171624, "epoch": 4086} {"train_loss": -7.093646049499512, "global_step": 171625, "epoch": 4086} {"train_loss": -7.0050201416015625, "global_step": 171626, "epoch": 4086} {"train_loss": -7.047452926635742, "global_step": 171627, "epoch": 4086} {"train_loss": -7.095517158508301, "global_step": 171628, "epoch": 4086} {"train_loss": -7.0126800537109375, "global_step": 171629, "epoch": 4086} {"train_loss": -7.119288444519043, "global_step": 171630, "epoch": 4086} {"train_loss": -7.0078349113464355, "global_step": 171631, "epoch": 4086} {"train_loss": -7.061873435974121, "global_step": 171632, "epoch": 4086} {"train_loss": -6.999398231506348, "global_step": 171633, "epoch": 4086} {"train_loss": -6.983772277832031, "global_step": 171634, "epoch": 4086} {"train_loss": -6.989261627197266, "global_step": 171635, "epoch": 4086} {"train_loss": -7.022521018981934, "global_step": 171636, "epoch": 4086} {"train_loss": -7.064093112945557, "global_step": 171637, "epoch": 4086} {"train_loss": -7.0805535316467285, "global_step": 171638, "epoch": 4086} {"train_loss": -7.037110805511475, "global_step": 171639, "epoch": 4086} {"train_loss": -7.008059501647949, "global_step": 171640, "epoch": 4086} {"train_loss": -7.022152900695801, "global_step": 171641, "epoch": 4086} {"train_loss": -7.034961223602295, "global_step": 171642, "epoch": 4086} {"train_loss": -7.039301872253418, "global_step": 171643, "epoch": 4086} {"train_loss": -7.0455732345581055, "global_step": 171644, "epoch": 4086} {"train_loss": -7.1239824295043945, "global_step": 171645, "epoch": 4086} {"train_loss": -7.095454216003418, "global_step": 171646, "epoch": 4086} {"train_loss": -6.900959491729736, "global_step": 171647, "epoch": 4086} {"train_loss": -6.9684834480285645, "global_step": 171648, "epoch": 4086} {"train_loss": -7.06865930557251, "global_step": 171649, "epoch": 4086} {"train_loss": -7.0094757080078125, "global_step": 171650, "epoch": 4086} {"train_loss": -6.954361438751221, "global_step": 171651, "epoch": 4086} {"train_loss": -7.012060165405273, "global_step": 171652, "epoch": 4086} {"train_loss": -7.0296843733106344, "global_step": 171653, "epoch": 4086, "val_loss": 68419.78125} {"train_loss": -6.978323459625244, "global_step": 171654, "epoch": 4087} {"train_loss": -7.118844985961914, "global_step": 171655, "epoch": 4087} {"train_loss": -7.042452335357666, "global_step": 171656, "epoch": 4087} {"train_loss": -6.873388290405273, "global_step": 171657, "epoch": 4087} {"train_loss": -7.090121269226074, "global_step": 171658, "epoch": 4087} {"train_loss": -6.996875762939453, "global_step": 171659, "epoch": 4087} {"train_loss": -7.00262975692749, "global_step": 171660, "epoch": 4087} {"train_loss": -7.039056777954102, "global_step": 171661, "epoch": 4087} {"train_loss": -7.077517986297607, "global_step": 171662, "epoch": 4087} {"train_loss": -7.02027702331543, "global_step": 171663, "epoch": 4087} {"train_loss": -7.035452842712402, "global_step": 171664, "epoch": 4087} {"train_loss": -7.075740814208984, "global_step": 171665, "epoch": 4087} {"train_loss": -7.049986362457275, "global_step": 171666, "epoch": 4087} {"train_loss": -6.98488712310791, "global_step": 171667, "epoch": 4087} {"train_loss": -7.057534217834473, "global_step": 171668, "epoch": 4087} {"train_loss": -6.957696914672852, "global_step": 171669, "epoch": 4087} {"train_loss": -7.01390266418457, "global_step": 171670, "epoch": 4087} {"train_loss": -6.979426860809326, "global_step": 171671, "epoch": 4087} {"train_loss": -6.92133903503418, "global_step": 171672, "epoch": 4087} {"train_loss": -7.031798362731934, "global_step": 171673, "epoch": 4087} {"train_loss": -7.027562141418457, "global_step": 171674, "epoch": 4087} {"train_loss": -7.0273942947387695, "global_step": 171675, "epoch": 4087} {"train_loss": -7.059243679046631, "global_step": 171676, "epoch": 4087} {"train_loss": -7.001026630401611, "global_step": 171677, "epoch": 4087} {"train_loss": -6.98525333404541, "global_step": 171678, "epoch": 4087} {"train_loss": -6.94617223739624, "global_step": 171679, "epoch": 4087} {"train_loss": -6.978672027587891, "global_step": 171680, "epoch": 4087} {"train_loss": -6.807880401611328, "global_step": 171681, "epoch": 4087} {"train_loss": -7.027756214141846, "global_step": 171682, "epoch": 4087} {"train_loss": -6.885860919952393, "global_step": 171683, "epoch": 4087} {"train_loss": -7.094611167907715, "global_step": 171684, "epoch": 4087} {"train_loss": -6.959066867828369, "global_step": 171685, "epoch": 4087} {"train_loss": -6.952366828918457, "global_step": 171686, "epoch": 4087} {"train_loss": -6.992137908935547, "global_step": 171687, "epoch": 4087} {"train_loss": -7.051766395568848, "global_step": 171688, "epoch": 4087} {"train_loss": -6.998416900634766, "global_step": 171689, "epoch": 4087} {"train_loss": -7.016119956970215, "global_step": 171690, "epoch": 4087} {"train_loss": -7.060981750488281, "global_step": 171691, "epoch": 4087} {"train_loss": -7.001140117645264, "global_step": 171692, "epoch": 4087} {"train_loss": -6.974210262298584, "global_step": 171693, "epoch": 4087} {"train_loss": -7.001428604125977, "global_step": 171694, "epoch": 4087} {"train_loss": -7.004217999322074, "global_step": 171695, "epoch": 4087, "val_loss": 68487.265625} {"train_loss": -6.919170379638672, "global_step": 171696, "epoch": 4088} {"train_loss": -7.003026008605957, "global_step": 171697, "epoch": 4088} {"train_loss": -7.047567367553711, "global_step": 171698, "epoch": 4088} {"train_loss": -7.036889553070068, "global_step": 171699, "epoch": 4088} {"train_loss": -7.02589225769043, "global_step": 171700, "epoch": 4088} {"train_loss": -7.066493988037109, "global_step": 171701, "epoch": 4088} {"train_loss": -7.05109977722168, "global_step": 171702, "epoch": 4088} {"train_loss": -6.870720863342285, "global_step": 171703, "epoch": 4088} {"train_loss": -7.0388712882995605, "global_step": 171704, "epoch": 4088} {"train_loss": -6.957986831665039, "global_step": 171705, "epoch": 4088} {"train_loss": -6.89561653137207, "global_step": 171706, "epoch": 4088} {"train_loss": -7.006646156311035, "global_step": 171707, "epoch": 4088} {"train_loss": -7.00466775894165, "global_step": 171708, "epoch": 4088} {"train_loss": -6.977181434631348, "global_step": 171709, "epoch": 4088} {"train_loss": -7.0158233642578125, "global_step": 171710, "epoch": 4088} {"train_loss": -6.968101501464844, "global_step": 171711, "epoch": 4088} {"train_loss": -6.980316162109375, "global_step": 171712, "epoch": 4088} {"train_loss": -6.894291877746582, "global_step": 171713, "epoch": 4088} {"train_loss": -6.999174118041992, "global_step": 171714, "epoch": 4088} {"train_loss": -7.0929155349731445, "global_step": 171715, "epoch": 4088} {"train_loss": -6.999895095825195, "global_step": 171716, "epoch": 4088} {"train_loss": -6.981180191040039, "global_step": 171717, "epoch": 4088} {"train_loss": -6.944132328033447, "global_step": 171718, "epoch": 4088} {"train_loss": -6.944546699523926, "global_step": 171719, "epoch": 4088} {"train_loss": -7.059355735778809, "global_step": 171720, "epoch": 4088} {"train_loss": -7.020185470581055, "global_step": 171721, "epoch": 4088} {"train_loss": -7.090601921081543, "global_step": 171722, "epoch": 4088} {"train_loss": -7.011054039001465, "global_step": 171723, "epoch": 4088} {"train_loss": -7.0408406257629395, "global_step": 171724, "epoch": 4088} {"train_loss": -7.026078224182129, "global_step": 171725, "epoch": 4088} {"train_loss": -7.046849727630615, "global_step": 171726, "epoch": 4088} {"train_loss": -7.110208034515381, "global_step": 171727, "epoch": 4088} {"train_loss": -7.081715106964111, "global_step": 171728, "epoch": 4088} {"train_loss": -7.091320991516113, "global_step": 171729, "epoch": 4088} {"train_loss": -7.012549877166748, "global_step": 171730, "epoch": 4088} {"train_loss": -7.030139923095703, "global_step": 171731, "epoch": 4088} {"train_loss": -7.03080940246582, "global_step": 171732, "epoch": 4088} {"train_loss": -7.112370491027832, "global_step": 171733, "epoch": 4088} {"train_loss": -6.957818984985352, "global_step": 171734, "epoch": 4088} {"train_loss": -7.01561164855957, "global_step": 171735, "epoch": 4088} {"train_loss": -6.947665214538574, "global_step": 171736, "epoch": 4088} {"train_loss": -7.0096767743428545, "global_step": 171737, "epoch": 4088, "val_loss": 68669.3203125} {"train_loss": -6.974631309509277, "global_step": 171738, "epoch": 4089} {"train_loss": -6.939082145690918, "global_step": 171739, "epoch": 4089} {"train_loss": -6.980483055114746, "global_step": 171740, "epoch": 4089} {"train_loss": -7.069242477416992, "global_step": 171741, "epoch": 4089} {"train_loss": -7.0761003494262695, "global_step": 171742, "epoch": 4089} {"train_loss": -6.950221061706543, "global_step": 171743, "epoch": 4089} {"train_loss": -6.971867084503174, "global_step": 171744, "epoch": 4089} {"train_loss": -6.957914352416992, "global_step": 171745, "epoch": 4089} {"train_loss": -6.869910717010498, "global_step": 171746, "epoch": 4089} {"train_loss": -6.85015344619751, "global_step": 171747, "epoch": 4089} {"train_loss": -7.024921894073486, "global_step": 171748, "epoch": 4089} {"train_loss": -6.915820598602295, "global_step": 171749, "epoch": 4089} {"train_loss": -6.834021091461182, "global_step": 171750, "epoch": 4089} {"train_loss": -6.920612335205078, "global_step": 171751, "epoch": 4089} {"train_loss": -6.788420677185059, "global_step": 171752, "epoch": 4089} {"train_loss": -7.013927459716797, "global_step": 171753, "epoch": 4089} {"train_loss": -6.864342212677002, "global_step": 171754, "epoch": 4089} {"train_loss": -6.877927303314209, "global_step": 171755, "epoch": 4089} {"train_loss": -6.952120780944824, "global_step": 171756, "epoch": 4089} {"train_loss": -6.785514831542969, "global_step": 171757, "epoch": 4089} {"train_loss": -6.890692710876465, "global_step": 171758, "epoch": 4089} {"train_loss": -6.762238502502441, "global_step": 171759, "epoch": 4089} {"train_loss": -6.826011657714844, "global_step": 171760, "epoch": 4089} {"train_loss": -6.579048156738281, "global_step": 171761, "epoch": 4089} {"train_loss": -6.812026023864746, "global_step": 171762, "epoch": 4089} {"train_loss": -6.814215183258057, "global_step": 171763, "epoch": 4089} {"train_loss": -6.878668785095215, "global_step": 171764, "epoch": 4089} {"train_loss": -6.668115615844727, "global_step": 171765, "epoch": 4089} {"train_loss": -6.821598529815674, "global_step": 171766, "epoch": 4089} {"train_loss": -6.7303056716918945, "global_step": 171767, "epoch": 4089} {"train_loss": -6.939513206481934, "global_step": 171768, "epoch": 4089} {"train_loss": -6.813684463500977, "global_step": 171769, "epoch": 4089} {"train_loss": -6.8308024406433105, "global_step": 171770, "epoch": 4089} {"train_loss": -6.749363899230957, "global_step": 171771, "epoch": 4089} {"train_loss": -6.818436145782471, "global_step": 171772, "epoch": 4089} {"train_loss": -6.938864707946777, "global_step": 171773, "epoch": 4089} {"train_loss": -6.845025062561035, "global_step": 171774, "epoch": 4089} {"train_loss": -7.028311252593994, "global_step": 171775, "epoch": 4089} {"train_loss": -6.789775848388672, "global_step": 171776, "epoch": 4089} {"train_loss": -6.999558448791504, "global_step": 171777, "epoch": 4089} {"train_loss": -6.954021453857422, "global_step": 171778, "epoch": 4089} {"train_loss": -6.88369844073341, "global_step": 171779, "epoch": 4089, "val_loss": 68636.0390625} {"train_loss": -6.888293266296387, "global_step": 171780, "epoch": 4090} {"train_loss": -7.016602993011475, "global_step": 171781, "epoch": 4090} {"train_loss": -6.847349166870117, "global_step": 171782, "epoch": 4090} {"train_loss": -6.9773783683776855, "global_step": 171783, "epoch": 4090} {"train_loss": -6.806703090667725, "global_step": 171784, "epoch": 4090} {"train_loss": -6.98191499710083, "global_step": 171785, "epoch": 4090} {"train_loss": -6.856147289276123, "global_step": 171786, "epoch": 4090} {"train_loss": -6.9698686599731445, "global_step": 171787, "epoch": 4090} {"train_loss": -6.977147102355957, "global_step": 171788, "epoch": 4090} {"train_loss": -7.06264591217041, "global_step": 171789, "epoch": 4090} {"train_loss": -7.031494617462158, "global_step": 171790, "epoch": 4090} {"train_loss": -7.018994331359863, "global_step": 171791, "epoch": 4090} {"train_loss": -6.972209930419922, "global_step": 171792, "epoch": 4090} {"train_loss": -6.820197582244873, "global_step": 171793, "epoch": 4090} {"train_loss": -7.078313827514648, "global_step": 171794, "epoch": 4090} {"train_loss": -6.851213455200195, "global_step": 171795, "epoch": 4090} {"train_loss": -6.9550886154174805, "global_step": 171796, "epoch": 4090} {"train_loss": -7.095008850097656, "global_step": 171797, "epoch": 4090} {"train_loss": -7.023099899291992, "global_step": 171798, "epoch": 4090} {"train_loss": -6.945608139038086, "global_step": 171799, "epoch": 4090} {"train_loss": -7.110352516174316, "global_step": 171800, "epoch": 4090} {"train_loss": -7.011387825012207, "global_step": 171801, "epoch": 4090} {"train_loss": -7.068170547485352, "global_step": 171802, "epoch": 4090} {"train_loss": -6.920805931091309, "global_step": 171803, "epoch": 4090} {"train_loss": -7.089276313781738, "global_step": 171804, "epoch": 4090} {"train_loss": -7.006021499633789, "global_step": 171805, "epoch": 4090} {"train_loss": -6.955524444580078, "global_step": 171806, "epoch": 4090} {"train_loss": -7.167625904083252, "global_step": 171807, "epoch": 4090} {"train_loss": -6.952478408813477, "global_step": 171808, "epoch": 4090} {"train_loss": -6.996452331542969, "global_step": 171809, "epoch": 4090} {"train_loss": -7.079919338226318, "global_step": 171810, "epoch": 4090} {"train_loss": -7.001516342163086, "global_step": 171811, "epoch": 4090} {"train_loss": -7.075885772705078, "global_step": 171812, "epoch": 4090} {"train_loss": -6.986163139343262, "global_step": 171813, "epoch": 4090} {"train_loss": -7.084240913391113, "global_step": 171814, "epoch": 4090} {"train_loss": -7.180586814880371, "global_step": 171815, "epoch": 4090} {"train_loss": -7.068111896514893, "global_step": 171816, "epoch": 4090} {"train_loss": -6.998387336730957, "global_step": 171817, "epoch": 4090} {"train_loss": -7.046026229858398, "global_step": 171818, "epoch": 4090} {"train_loss": -7.016057014465332, "global_step": 171819, "epoch": 4090} {"train_loss": -6.981242656707764, "global_step": 171820, "epoch": 4090} {"train_loss": -7.00318455696106, "global_step": 171821, "epoch": 4090, "val_loss": 68563.78125} {"train_loss": -7.090930938720703, "global_step": 171822, "epoch": 4091} {"train_loss": -6.975818157196045, "global_step": 171823, "epoch": 4091} {"train_loss": -7.106167793273926, "global_step": 171824, "epoch": 4091} {"train_loss": -7.02960729598999, "global_step": 171825, "epoch": 4091} {"train_loss": -7.065480709075928, "global_step": 171826, "epoch": 4091} {"train_loss": -7.052016258239746, "global_step": 171827, "epoch": 4091} {"train_loss": -7.0388383865356445, "global_step": 171828, "epoch": 4091} {"train_loss": -7.122560501098633, "global_step": 171829, "epoch": 4091} {"train_loss": -7.009259223937988, "global_step": 171830, "epoch": 4091} {"train_loss": -7.062074184417725, "global_step": 171831, "epoch": 4091} {"train_loss": -7.027846813201904, "global_step": 171832, "epoch": 4091} {"train_loss": -6.97537899017334, "global_step": 171833, "epoch": 4091} {"train_loss": -7.002920150756836, "global_step": 171834, "epoch": 4091} {"train_loss": -6.980316162109375, "global_step": 171835, "epoch": 4091} {"train_loss": -7.014896392822266, "global_step": 171836, "epoch": 4091} {"train_loss": -6.965597152709961, "global_step": 171837, "epoch": 4091} {"train_loss": -7.049059867858887, "global_step": 171838, "epoch": 4091} {"train_loss": -7.0370893478393555, "global_step": 171839, "epoch": 4091} {"train_loss": -7.03009033203125, "global_step": 171840, "epoch": 4091} {"train_loss": -7.005782604217529, "global_step": 171841, "epoch": 4091} {"train_loss": -7.024091720581055, "global_step": 171842, "epoch": 4091} {"train_loss": -7.081808090209961, "global_step": 171843, "epoch": 4091} {"train_loss": -7.066246509552002, "global_step": 171844, "epoch": 4091} {"train_loss": -6.981967449188232, "global_step": 171845, "epoch": 4091} {"train_loss": -7.036783695220947, "global_step": 171846, "epoch": 4091} {"train_loss": -7.056738376617432, "global_step": 171847, "epoch": 4091} {"train_loss": -6.9726972579956055, "global_step": 171848, "epoch": 4091} {"train_loss": -6.994326591491699, "global_step": 171849, "epoch": 4091} {"train_loss": -7.191755294799805, "global_step": 171850, "epoch": 4091} {"train_loss": -6.936465263366699, "global_step": 171851, "epoch": 4091} {"train_loss": -6.9139885902404785, "global_step": 171852, "epoch": 4091} {"train_loss": -7.0630388259887695, "global_step": 171853, "epoch": 4091} {"train_loss": -7.134799480438232, "global_step": 171854, "epoch": 4091} {"train_loss": -6.922244071960449, "global_step": 171855, "epoch": 4091} {"train_loss": -7.004568099975586, "global_step": 171856, "epoch": 4091} {"train_loss": -7.017374515533447, "global_step": 171857, "epoch": 4091} {"train_loss": -7.018800735473633, "global_step": 171858, "epoch": 4091} {"train_loss": -6.96880578994751, "global_step": 171859, "epoch": 4091} {"train_loss": -6.890170097351074, "global_step": 171860, "epoch": 4091} {"train_loss": -7.014509201049805, "global_step": 171861, "epoch": 4091} {"train_loss": -6.8993239402771, "global_step": 171862, "epoch": 4091} {"train_loss": -7.019524426687331, "global_step": 171863, "epoch": 4091, "val_loss": 68536.0703125} {"train_loss": -6.995713233947754, "global_step": 171864, "epoch": 4092} {"train_loss": -6.925471782684326, "global_step": 171865, "epoch": 4092} {"train_loss": -7.017239570617676, "global_step": 171866, "epoch": 4092} {"train_loss": -6.985625267028809, "global_step": 171867, "epoch": 4092} {"train_loss": -6.955072402954102, "global_step": 171868, "epoch": 4092} {"train_loss": -7.083517074584961, "global_step": 171869, "epoch": 4092} {"train_loss": -6.918964385986328, "global_step": 171870, "epoch": 4092} {"train_loss": -7.038883209228516, "global_step": 171871, "epoch": 4092} {"train_loss": -6.952120780944824, "global_step": 171872, "epoch": 4092} {"train_loss": -7.064431190490723, "global_step": 171873, "epoch": 4092} {"train_loss": -7.044308185577393, "global_step": 171874, "epoch": 4092} {"train_loss": -7.017284393310547, "global_step": 171875, "epoch": 4092} {"train_loss": -7.077536106109619, "global_step": 171876, "epoch": 4092} {"train_loss": -6.935340404510498, "global_step": 171877, "epoch": 4092} {"train_loss": -6.994198799133301, "global_step": 171878, "epoch": 4092} {"train_loss": -7.024791717529297, "global_step": 171879, "epoch": 4092} {"train_loss": -6.99739933013916, "global_step": 171880, "epoch": 4092} {"train_loss": -6.995360374450684, "global_step": 171881, "epoch": 4092} {"train_loss": -7.032578468322754, "global_step": 171882, "epoch": 4092} {"train_loss": -7.016839027404785, "global_step": 171883, "epoch": 4092} {"train_loss": -7.050711154937744, "global_step": 171884, "epoch": 4092} {"train_loss": -7.0196404457092285, "global_step": 171885, "epoch": 4092} {"train_loss": -6.92319393157959, "global_step": 171886, "epoch": 4092} {"train_loss": -6.981043338775635, "global_step": 171887, "epoch": 4092} {"train_loss": -6.956628322601318, "global_step": 171888, "epoch": 4092} {"train_loss": -7.066614151000977, "global_step": 171889, "epoch": 4092} {"train_loss": -7.042315483093262, "global_step": 171890, "epoch": 4092} {"train_loss": -7.008599758148193, "global_step": 171891, "epoch": 4092} {"train_loss": -7.0039215087890625, "global_step": 171892, "epoch": 4092} {"train_loss": -7.015381813049316, "global_step": 171893, "epoch": 4092} {"train_loss": -7.037081718444824, "global_step": 171894, "epoch": 4092} {"train_loss": -6.874215126037598, "global_step": 171895, "epoch": 4092} {"train_loss": -7.172093391418457, "global_step": 171896, "epoch": 4092} {"train_loss": -7.1115546226501465, "global_step": 171897, "epoch": 4092} {"train_loss": -6.990289688110352, "global_step": 171898, "epoch": 4092} {"train_loss": -7.004702091217041, "global_step": 171899, "epoch": 4092} {"train_loss": -7.040194034576416, "global_step": 171900, "epoch": 4092} {"train_loss": -6.964895248413086, "global_step": 171901, "epoch": 4092} {"train_loss": -7.152632713317871, "global_step": 171902, "epoch": 4092} {"train_loss": -6.95195198059082, "global_step": 171903, "epoch": 4092} {"train_loss": -6.945101737976074, "global_step": 171904, "epoch": 4092} {"train_loss": -7.007606642586844, "global_step": 171905, "epoch": 4092, "val_loss": 68538.5859375} {"train_loss": -6.950870990753174, "global_step": 171906, "epoch": 4093} {"train_loss": -6.860689163208008, "global_step": 171907, "epoch": 4093} {"train_loss": -6.787898063659668, "global_step": 171908, "epoch": 4093} {"train_loss": -7.0200605392456055, "global_step": 171909, "epoch": 4093} {"train_loss": -6.975187301635742, "global_step": 171910, "epoch": 4093} {"train_loss": -6.882341384887695, "global_step": 171911, "epoch": 4093} {"train_loss": -7.02290153503418, "global_step": 171912, "epoch": 4093} {"train_loss": -7.013623237609863, "global_step": 171913, "epoch": 4093} {"train_loss": -6.951006889343262, "global_step": 171914, "epoch": 4093} {"train_loss": -6.987077713012695, "global_step": 171915, "epoch": 4093} {"train_loss": -7.004303932189941, "global_step": 171916, "epoch": 4093} {"train_loss": -7.037442684173584, "global_step": 171917, "epoch": 4093} {"train_loss": -6.902469635009766, "global_step": 171918, "epoch": 4093} {"train_loss": -6.959339141845703, "global_step": 171919, "epoch": 4093} {"train_loss": -6.880046844482422, "global_step": 171920, "epoch": 4093} {"train_loss": -6.903564453125, "global_step": 171921, "epoch": 4093} {"train_loss": -6.845370292663574, "global_step": 171922, "epoch": 4093} {"train_loss": -6.842141151428223, "global_step": 171923, "epoch": 4093} {"train_loss": -6.79940938949585, "global_step": 171924, "epoch": 4093} {"train_loss": -6.9890031814575195, "global_step": 171925, "epoch": 4093} {"train_loss": -6.930390357971191, "global_step": 171926, "epoch": 4093} {"train_loss": -6.8479204177856445, "global_step": 171927, "epoch": 4093} {"train_loss": -6.944265365600586, "global_step": 171928, "epoch": 4093} {"train_loss": -6.971475601196289, "global_step": 171929, "epoch": 4093} {"train_loss": -6.963893413543701, "global_step": 171930, "epoch": 4093} {"train_loss": -6.823596000671387, "global_step": 171931, "epoch": 4093} {"train_loss": -6.966202735900879, "global_step": 171932, "epoch": 4093} {"train_loss": -6.796783447265625, "global_step": 171933, "epoch": 4093} {"train_loss": -6.915470123291016, "global_step": 171934, "epoch": 4093} {"train_loss": -6.996838092803955, "global_step": 171935, "epoch": 4093} {"train_loss": -6.8914031982421875, "global_step": 171936, "epoch": 4093} {"train_loss": -7.096170902252197, "global_step": 171937, "epoch": 4093} {"train_loss": -6.967178821563721, "global_step": 171938, "epoch": 4093} {"train_loss": -7.018293380737305, "global_step": 171939, "epoch": 4093} {"train_loss": -6.814327239990234, "global_step": 171940, "epoch": 4093} {"train_loss": -7.00529670715332, "global_step": 171941, "epoch": 4093} {"train_loss": -7.011409282684326, "global_step": 171942, "epoch": 4093} {"train_loss": -7.1002726554870605, "global_step": 171943, "epoch": 4093} {"train_loss": -7.067895889282227, "global_step": 171944, "epoch": 4093} {"train_loss": -7.1061553955078125, "global_step": 171945, "epoch": 4093} {"train_loss": -6.978071212768555, "global_step": 171946, "epoch": 4093} {"train_loss": -6.947105907258534, "global_step": 171947, "epoch": 4093, "val_loss": 68676.359375} {"train_loss": -7.0268778800964355, "global_step": 171948, "epoch": 4094} {"train_loss": -7.053428649902344, "global_step": 171949, "epoch": 4094} {"train_loss": -7.113146781921387, "global_step": 171950, "epoch": 4094} {"train_loss": -7.044535160064697, "global_step": 171951, "epoch": 4094} {"train_loss": -7.053318023681641, "global_step": 171952, "epoch": 4094} {"train_loss": -7.103870391845703, "global_step": 171953, "epoch": 4094} {"train_loss": -7.132955074310303, "global_step": 171954, "epoch": 4094} {"train_loss": -7.044859886169434, "global_step": 171955, "epoch": 4094} {"train_loss": -7.065666198730469, "global_step": 171956, "epoch": 4094} {"train_loss": -7.105539321899414, "global_step": 171957, "epoch": 4094} {"train_loss": -7.0863237380981445, "global_step": 171958, "epoch": 4094} {"train_loss": -7.096495151519775, "global_step": 171959, "epoch": 4094} {"train_loss": -7.093384742736816, "global_step": 171960, "epoch": 4094} {"train_loss": -7.074801921844482, "global_step": 171961, "epoch": 4094} {"train_loss": -7.0080437660217285, "global_step": 171962, "epoch": 4094} {"train_loss": -6.984966278076172, "global_step": 171963, "epoch": 4094} {"train_loss": -7.133312225341797, "global_step": 171964, "epoch": 4094} {"train_loss": -6.915849685668945, "global_step": 171965, "epoch": 4094} {"train_loss": -7.069933891296387, "global_step": 171966, "epoch": 4094} {"train_loss": -7.002466201782227, "global_step": 171967, "epoch": 4094} {"train_loss": -7.055670738220215, "global_step": 171968, "epoch": 4094} {"train_loss": -7.029562950134277, "global_step": 171969, "epoch": 4094} {"train_loss": -6.995725154876709, "global_step": 171970, "epoch": 4094} {"train_loss": -7.034952640533447, "global_step": 171971, "epoch": 4094} {"train_loss": -7.088143348693848, "global_step": 171972, "epoch": 4094} {"train_loss": -7.065544605255127, "global_step": 171973, "epoch": 4094} {"train_loss": -6.849910736083984, "global_step": 171974, "epoch": 4094} {"train_loss": -7.004464626312256, "global_step": 171975, "epoch": 4094} {"train_loss": -7.062607288360596, "global_step": 171976, "epoch": 4094} {"train_loss": -7.034278869628906, "global_step": 171977, "epoch": 4094} {"train_loss": -7.009193420410156, "global_step": 171978, "epoch": 4094} {"train_loss": -7.003841400146484, "global_step": 171979, "epoch": 4094} {"train_loss": -7.066801071166992, "global_step": 171980, "epoch": 4094} {"train_loss": -7.0332350730896, "global_step": 171981, "epoch": 4094} {"train_loss": -7.0635271072387695, "global_step": 171982, "epoch": 4094} {"train_loss": -7.069688320159912, "global_step": 171983, "epoch": 4094} {"train_loss": -7.053747177124023, "global_step": 171984, "epoch": 4094} {"train_loss": -7.102720260620117, "global_step": 171985, "epoch": 4094} {"train_loss": -7.238385200500488, "global_step": 171986, "epoch": 4094} {"train_loss": -7.043572425842285, "global_step": 171987, "epoch": 4094} {"train_loss": -7.138391971588135, "global_step": 171988, "epoch": 4094} {"train_loss": -7.055947996321178, "global_step": 171989, "epoch": 4094, "val_loss": 68599.7265625} {"train_loss": -7.155652046203613, "global_step": 171990, "epoch": 4095} {"train_loss": -7.005943298339844, "global_step": 171991, "epoch": 4095} {"train_loss": -7.149666786193848, "global_step": 171992, "epoch": 4095} {"train_loss": -7.06928825378418, "global_step": 171993, "epoch": 4095} {"train_loss": -7.089197158813477, "global_step": 171994, "epoch": 4095} {"train_loss": -7.067657947540283, "global_step": 171995, "epoch": 4095} {"train_loss": -7.115607261657715, "global_step": 171996, "epoch": 4095} {"train_loss": -7.036313533782959, "global_step": 171997, "epoch": 4095} {"train_loss": -7.101144790649414, "global_step": 171998, "epoch": 4095} {"train_loss": -7.020349502563477, "global_step": 171999, "epoch": 4095} {"train_loss": -7.098901271820068, "global_step": 172000, "epoch": 4095} {"train_loss": -7.014074802398682, "global_step": 172001, "epoch": 4095} {"train_loss": -7.134548187255859, "global_step": 172002, "epoch": 4095} {"train_loss": -7.055185317993164, "global_step": 172003, "epoch": 4095} {"train_loss": -6.930075645446777, "global_step": 172004, "epoch": 4095} {"train_loss": -7.087879180908203, "global_step": 172005, "epoch": 4095} {"train_loss": -7.054019451141357, "global_step": 172006, "epoch": 4095} {"train_loss": -7.091047286987305, "global_step": 172007, "epoch": 4095} {"train_loss": -6.9803924560546875, "global_step": 172008, "epoch": 4095} {"train_loss": -7.030152797698975, "global_step": 172009, "epoch": 4095} {"train_loss": -6.994571685791016, "global_step": 172010, "epoch": 4095} {"train_loss": -6.939622402191162, "global_step": 172011, "epoch": 4095} {"train_loss": -6.999020576477051, "global_step": 172012, "epoch": 4095} {"train_loss": -7.04035758972168, "global_step": 172013, "epoch": 4095} {"train_loss": -6.9791646003723145, "global_step": 172014, "epoch": 4095} {"train_loss": -7.067709922790527, "global_step": 172015, "epoch": 4095} {"train_loss": -7.022330284118652, "global_step": 172016, "epoch": 4095} {"train_loss": -6.834571838378906, "global_step": 172017, "epoch": 4095} {"train_loss": -6.922958850860596, "global_step": 172018, "epoch": 4095} {"train_loss": -6.987326622009277, "global_step": 172019, "epoch": 4095} {"train_loss": -6.93670654296875, "global_step": 172020, "epoch": 4095} {"train_loss": -7.045727729797363, "global_step": 172021, "epoch": 4095} {"train_loss": -6.985064506530762, "global_step": 172022, "epoch": 4095} {"train_loss": -6.986794948577881, "global_step": 172023, "epoch": 4095} {"train_loss": -6.978021144866943, "global_step": 172024, "epoch": 4095} {"train_loss": -7.054218292236328, "global_step": 172025, "epoch": 4095} {"train_loss": -6.908153057098389, "global_step": 172026, "epoch": 4095} {"train_loss": -7.007512092590332, "global_step": 172027, "epoch": 4095} {"train_loss": -7.023868560791016, "global_step": 172028, "epoch": 4095} {"train_loss": -7.007092475891113, "global_step": 172029, "epoch": 4095} {"train_loss": -6.860959053039551, "global_step": 172030, "epoch": 4095} {"train_loss": -7.019929499853225, "global_step": 172031, "epoch": 4095, "val_loss": 68589.3828125} {"train_loss": -6.9849748611450195, "global_step": 172032, "epoch": 4096} {"train_loss": -6.877009391784668, "global_step": 172033, "epoch": 4096} {"train_loss": -6.751152515411377, "global_step": 172034, "epoch": 4096} {"train_loss": -6.964285850524902, "global_step": 172035, "epoch": 4096} {"train_loss": -6.92817497253418, "global_step": 172036, "epoch": 4096} {"train_loss": -6.851925849914551, "global_step": 172037, "epoch": 4096} {"train_loss": -6.931107521057129, "global_step": 172038, "epoch": 4096} {"train_loss": -6.8195390701293945, "global_step": 172039, "epoch": 4096} {"train_loss": -7.020180702209473, "global_step": 172040, "epoch": 4096} {"train_loss": -6.962210178375244, "global_step": 172041, "epoch": 4096} {"train_loss": -6.915342807769775, "global_step": 172042, "epoch": 4096} {"train_loss": -7.019187927246094, "global_step": 172043, "epoch": 4096} {"train_loss": -6.981320381164551, "global_step": 172044, "epoch": 4096} {"train_loss": -6.937882423400879, "global_step": 172045, "epoch": 4096} {"train_loss": -6.876668930053711, "global_step": 172046, "epoch": 4096} {"train_loss": -7.025481700897217, "global_step": 172047, "epoch": 4096} {"train_loss": -6.967718124389648, "global_step": 172048, "epoch": 4096} {"train_loss": -7.006533622741699, "global_step": 172049, "epoch": 4096} {"train_loss": -6.988144874572754, "global_step": 172050, "epoch": 4096} {"train_loss": -7.0344133377075195, "global_step": 172051, "epoch": 4096} {"train_loss": -7.004636287689209, "global_step": 172052, "epoch": 4096} {"train_loss": -7.016180992126465, "global_step": 172053, "epoch": 4096} {"train_loss": -7.096811294555664, "global_step": 172054, "epoch": 4096} {"train_loss": -6.843008518218994, "global_step": 172055, "epoch": 4096} {"train_loss": -6.946412086486816, "global_step": 172056, "epoch": 4096} {"train_loss": -6.833860397338867, "global_step": 172057, "epoch": 4096} {"train_loss": -6.998385429382324, "global_step": 172058, "epoch": 4096} {"train_loss": -7.077649116516113, "global_step": 172059, "epoch": 4096} {"train_loss": -6.9795684814453125, "global_step": 172060, "epoch": 4096} {"train_loss": -7.114401817321777, "global_step": 172061, "epoch": 4096} {"train_loss": -6.908370018005371, "global_step": 172062, "epoch": 4096} {"train_loss": -6.924721717834473, "global_step": 172063, "epoch": 4096} {"train_loss": -7.001295566558838, "global_step": 172064, "epoch": 4096} {"train_loss": -6.968143463134766, "global_step": 172065, "epoch": 4096} {"train_loss": -7.091455459594727, "global_step": 172066, "epoch": 4096} {"train_loss": -7.022506237030029, "global_step": 172067, "epoch": 4096} {"train_loss": -7.002830505371094, "global_step": 172068, "epoch": 4096} {"train_loss": -7.045321464538574, "global_step": 172069, "epoch": 4096} {"train_loss": -6.942322254180908, "global_step": 172070, "epoch": 4096} {"train_loss": -7.066265106201172, "global_step": 172071, "epoch": 4096} {"train_loss": -7.002644062042236, "global_step": 172072, "epoch": 4096} {"train_loss": -6.968884013947987, "global_step": 172073, "epoch": 4096, "val_loss": 68649.9140625} {"train_loss": -6.999528884887695, "global_step": 172074, "epoch": 4097} {"train_loss": -6.941002368927002, "global_step": 172075, "epoch": 4097} {"train_loss": -7.108123302459717, "global_step": 172076, "epoch": 4097} {"train_loss": -7.01472806930542, "global_step": 172077, "epoch": 4097} {"train_loss": -7.049691677093506, "global_step": 172078, "epoch": 4097} {"train_loss": -7.028895378112793, "global_step": 172079, "epoch": 4097} {"train_loss": -7.050791263580322, "global_step": 172080, "epoch": 4097} {"train_loss": -7.175260543823242, "global_step": 172081, "epoch": 4097} {"train_loss": -7.044833183288574, "global_step": 172082, "epoch": 4097} {"train_loss": -7.073373794555664, "global_step": 172083, "epoch": 4097} {"train_loss": -7.054837226867676, "global_step": 172084, "epoch": 4097} {"train_loss": -7.026668548583984, "global_step": 172085, "epoch": 4097} {"train_loss": -6.962581634521484, "global_step": 172086, "epoch": 4097} {"train_loss": -7.098675727844238, "global_step": 172087, "epoch": 4097} {"train_loss": -7.013601779937744, "global_step": 172088, "epoch": 4097} {"train_loss": -6.977591037750244, "global_step": 172089, "epoch": 4097} {"train_loss": -6.9808149337768555, "global_step": 172090, "epoch": 4097} {"train_loss": -7.0243682861328125, "global_step": 172091, "epoch": 4097} {"train_loss": -6.921419620513916, "global_step": 172092, "epoch": 4097} {"train_loss": -7.125296592712402, "global_step": 172093, "epoch": 4097} {"train_loss": -7.031520843505859, "global_step": 172094, "epoch": 4097} {"train_loss": -7.064958572387695, "global_step": 172095, "epoch": 4097} {"train_loss": -7.062091827392578, "global_step": 172096, "epoch": 4097} {"train_loss": -7.04176664352417, "global_step": 172097, "epoch": 4097} {"train_loss": -6.919989585876465, "global_step": 172098, "epoch": 4097} {"train_loss": -7.012565612792969, "global_step": 172099, "epoch": 4097} {"train_loss": -7.029829978942871, "global_step": 172100, "epoch": 4097} {"train_loss": -7.017427921295166, "global_step": 172101, "epoch": 4097} {"train_loss": -6.91583776473999, "global_step": 172102, "epoch": 4097} {"train_loss": -6.9486799240112305, "global_step": 172103, "epoch": 4097} {"train_loss": -6.827723503112793, "global_step": 172104, "epoch": 4097} {"train_loss": -6.98314094543457, "global_step": 172105, "epoch": 4097} {"train_loss": -6.856454849243164, "global_step": 172106, "epoch": 4097} {"train_loss": -6.877974987030029, "global_step": 172107, "epoch": 4097} {"train_loss": -7.00941801071167, "global_step": 172108, "epoch": 4097} {"train_loss": -6.789831161499023, "global_step": 172109, "epoch": 4097} {"train_loss": -7.051652431488037, "global_step": 172110, "epoch": 4097} {"train_loss": -6.804862976074219, "global_step": 172111, "epoch": 4097} {"train_loss": -6.930968284606934, "global_step": 172112, "epoch": 4097} {"train_loss": -6.90138053894043, "global_step": 172113, "epoch": 4097} {"train_loss": -6.944481372833252, "global_step": 172114, "epoch": 4097} {"train_loss": -6.989275171643212, "global_step": 172115, "epoch": 4097, "val_loss": 68667.578125} {"train_loss": -6.8511962890625, "global_step": 172116, "epoch": 4098} {"train_loss": -6.89223575592041, "global_step": 172117, "epoch": 4098} {"train_loss": -6.8521575927734375, "global_step": 172118, "epoch": 4098} {"train_loss": -6.89059591293335, "global_step": 172119, "epoch": 4098} {"train_loss": -6.854086399078369, "global_step": 172120, "epoch": 4098} {"train_loss": -6.904082775115967, "global_step": 172121, "epoch": 4098} {"train_loss": -6.9621901512146, "global_step": 172122, "epoch": 4098} {"train_loss": -6.795550346374512, "global_step": 172123, "epoch": 4098} {"train_loss": -6.76645565032959, "global_step": 172124, "epoch": 4098} {"train_loss": -6.857624053955078, "global_step": 172125, "epoch": 4098} {"train_loss": -6.754373550415039, "global_step": 172126, "epoch": 4098} {"train_loss": -6.788750171661377, "global_step": 172127, "epoch": 4098} {"train_loss": -6.831303596496582, "global_step": 172128, "epoch": 4098} {"train_loss": -6.670180797576904, "global_step": 172129, "epoch": 4098} {"train_loss": -6.893647193908691, "global_step": 172130, "epoch": 4098} {"train_loss": -6.881593704223633, "global_step": 172131, "epoch": 4098} {"train_loss": -6.8610520362854, "global_step": 172132, "epoch": 4098} {"train_loss": -6.891447067260742, "global_step": 172133, "epoch": 4098} {"train_loss": -6.851999282836914, "global_step": 172134, "epoch": 4098} {"train_loss": -6.896284580230713, "global_step": 172135, "epoch": 4098} {"train_loss": -6.935685157775879, "global_step": 172136, "epoch": 4098} {"train_loss": -6.972803115844727, "global_step": 172137, "epoch": 4098} {"train_loss": -6.938745975494385, "global_step": 172138, "epoch": 4098} {"train_loss": -6.881187915802002, "global_step": 172139, "epoch": 4098} {"train_loss": -6.944185256958008, "global_step": 172140, "epoch": 4098} {"train_loss": -6.981457710266113, "global_step": 172141, "epoch": 4098} {"train_loss": -6.920759201049805, "global_step": 172142, "epoch": 4098} {"train_loss": -6.938261985778809, "global_step": 172143, "epoch": 4098} {"train_loss": -6.929606914520264, "global_step": 172144, "epoch": 4098} {"train_loss": -7.002700328826904, "global_step": 172145, "epoch": 4098} {"train_loss": -7.042497158050537, "global_step": 172146, "epoch": 4098} {"train_loss": -6.9103922843933105, "global_step": 172147, "epoch": 4098} {"train_loss": -7.093584060668945, "global_step": 172148, "epoch": 4098} {"train_loss": -6.991339683532715, "global_step": 172149, "epoch": 4098} {"train_loss": -6.971347332000732, "global_step": 172150, "epoch": 4098} {"train_loss": -6.973635673522949, "global_step": 172151, "epoch": 4098} {"train_loss": -7.008028030395508, "global_step": 172152, "epoch": 4098} {"train_loss": -7.064417362213135, "global_step": 172153, "epoch": 4098} {"train_loss": -7.0370612144470215, "global_step": 172154, "epoch": 4098} {"train_loss": -7.055612564086914, "global_step": 172155, "epoch": 4098} {"train_loss": -7.111838340759277, "global_step": 172156, "epoch": 4098} {"train_loss": -6.922327030272711, "global_step": 172157, "epoch": 4098, "val_loss": 68475.03125} {"train_loss": -7.065582275390625, "global_step": 172158, "epoch": 4099} {"train_loss": -7.081073760986328, "global_step": 172159, "epoch": 4099} {"train_loss": -7.013571739196777, "global_step": 172160, "epoch": 4099} {"train_loss": -7.036459922790527, "global_step": 172161, "epoch": 4099} {"train_loss": -7.113925457000732, "global_step": 172162, "epoch": 4099} {"train_loss": -7.046863555908203, "global_step": 172163, "epoch": 4099} {"train_loss": -7.061470031738281, "global_step": 172164, "epoch": 4099} {"train_loss": -6.968747138977051, "global_step": 172165, "epoch": 4099} {"train_loss": -7.075511932373047, "global_step": 172166, "epoch": 4099} {"train_loss": -7.0728912353515625, "global_step": 172167, "epoch": 4099} {"train_loss": -7.021512031555176, "global_step": 172168, "epoch": 4099} {"train_loss": -7.064991474151611, "global_step": 172169, "epoch": 4099} {"train_loss": -6.9957051277160645, "global_step": 172170, "epoch": 4099} {"train_loss": -7.125179767608643, "global_step": 172171, "epoch": 4099} {"train_loss": -7.017479419708252, "global_step": 172172, "epoch": 4099} {"train_loss": -6.964506149291992, "global_step": 172173, "epoch": 4099} {"train_loss": -7.013566970825195, "global_step": 172174, "epoch": 4099} {"train_loss": -6.946072578430176, "global_step": 172175, "epoch": 4099} {"train_loss": -7.023612976074219, "global_step": 172176, "epoch": 4099} {"train_loss": -6.958995819091797, "global_step": 172177, "epoch": 4099} {"train_loss": -6.947563648223877, "global_step": 172178, "epoch": 4099} {"train_loss": -7.061447620391846, "global_step": 172179, "epoch": 4099} {"train_loss": -6.963147163391113, "global_step": 172180, "epoch": 4099} {"train_loss": -6.979452133178711, "global_step": 172181, "epoch": 4099} {"train_loss": -7.122014999389648, "global_step": 172182, "epoch": 4099} {"train_loss": -6.985634803771973, "global_step": 172183, "epoch": 4099} {"train_loss": -6.857537746429443, "global_step": 172184, "epoch": 4099} {"train_loss": -7.098238468170166, "global_step": 172185, "epoch": 4099} {"train_loss": -7.015726566314697, "global_step": 172186, "epoch": 4099} {"train_loss": -6.9173383712768555, "global_step": 172187, "epoch": 4099} {"train_loss": -7.015547275543213, "global_step": 172188, "epoch": 4099} {"train_loss": -6.842809677124023, "global_step": 172189, "epoch": 4099} {"train_loss": -6.92978572845459, "global_step": 172190, "epoch": 4099} {"train_loss": -7.090522766113281, "global_step": 172191, "epoch": 4099} {"train_loss": -7.136407375335693, "global_step": 172192, "epoch": 4099} {"train_loss": -7.088947296142578, "global_step": 172193, "epoch": 4099} {"train_loss": -7.018289566040039, "global_step": 172194, "epoch": 4099} {"train_loss": -7.020565032958984, "global_step": 172195, "epoch": 4099} {"train_loss": -7.0044331550598145, "global_step": 172196, "epoch": 4099} {"train_loss": -7.087430953979492, "global_step": 172197, "epoch": 4099} {"train_loss": -7.038486957550049, "global_step": 172198, "epoch": 4099} {"train_loss": -7.019445135479882, "global_step": 172199, "epoch": 4099, "val_loss": 68664.796875} {"train_loss": -7.023594856262207, "global_step": 172200, "epoch": 4100} {"train_loss": -7.075435161590576, "global_step": 172201, "epoch": 4100} {"train_loss": -7.036637783050537, "global_step": 172202, "epoch": 4100} {"train_loss": -6.995734691619873, "global_step": 172203, "epoch": 4100} {"train_loss": -7.048678398132324, "global_step": 172204, "epoch": 4100} {"train_loss": -6.909519672393799, "global_step": 172205, "epoch": 4100} {"train_loss": -6.931314945220947, "global_step": 172206, "epoch": 4100} {"train_loss": -7.059206008911133, "global_step": 172207, "epoch": 4100} {"train_loss": -7.054722785949707, "global_step": 172208, "epoch": 4100} {"train_loss": -6.992181777954102, "global_step": 172209, "epoch": 4100} {"train_loss": -6.985301971435547, "global_step": 172210, "epoch": 4100} {"train_loss": -7.043080806732178, "global_step": 172211, "epoch": 4100} {"train_loss": -7.021368980407715, "global_step": 172212, "epoch": 4100} {"train_loss": -7.0268964767456055, "global_step": 172213, "epoch": 4100} {"train_loss": -6.955147743225098, "global_step": 172214, "epoch": 4100} {"train_loss": -7.0117387771606445, "global_step": 172215, "epoch": 4100} {"train_loss": -7.021637439727783, "global_step": 172216, "epoch": 4100} {"train_loss": -6.976196765899658, "global_step": 172217, "epoch": 4100} {"train_loss": -7.051556587219238, "global_step": 172218, "epoch": 4100} {"train_loss": -7.0667877197265625, "global_step": 172219, "epoch": 4100} {"train_loss": -6.943503379821777, "global_step": 172220, "epoch": 4100} {"train_loss": -7.036646842956543, "global_step": 172221, "epoch": 4100} {"train_loss": -6.985595703125, "global_step": 172222, "epoch": 4100} {"train_loss": -7.0990095138549805, "global_step": 172223, "epoch": 4100} {"train_loss": -7.086162567138672, "global_step": 172224, "epoch": 4100} {"train_loss": -7.090031623840332, "global_step": 172225, "epoch": 4100} {"train_loss": -7.115031719207764, "global_step": 172226, "epoch": 4100} {"train_loss": -7.075150489807129, "global_step": 172227, "epoch": 4100} {"train_loss": -7.067052841186523, "global_step": 172228, "epoch": 4100} {"train_loss": -7.107658386230469, "global_step": 172229, "epoch": 4100} {"train_loss": -7.067563056945801, "global_step": 172230, "epoch": 4100} {"train_loss": -7.08474063873291, "global_step": 172231, "epoch": 4100} {"train_loss": -7.147040367126465, "global_step": 172232, "epoch": 4100} {"train_loss": -7.059084415435791, "global_step": 172233, "epoch": 4100} {"train_loss": -7.045829772949219, "global_step": 172234, "epoch": 4100} {"train_loss": -6.965217590332031, "global_step": 172235, "epoch": 4100} {"train_loss": -7.076098442077637, "global_step": 172236, "epoch": 4100} {"train_loss": -6.88657808303833, "global_step": 172237, "epoch": 4100} {"train_loss": -6.854922294616699, "global_step": 172238, "epoch": 4100} {"train_loss": -7.019410133361816, "global_step": 172239, "epoch": 4100} {"train_loss": -7.037372589111328, "global_step": 172240, "epoch": 4100} {"train_loss": -7.0252997534615655, "global_step": 172241, "epoch": 4100, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.9870195376344258, "train/sim_max_reward_2": 0.9653119034944031, "train/sim_max_reward_3": 0.9422861945034176, "train/sim_max_reward_4": 0.915280622130339, "train/sim_max_reward_5": 0.4457682189548524, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.22889561084719837, "test/sim_max_reward_4400002": 0.9523213615260657, "test/sim_max_reward_4400003": 0.8465923370869175, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.965721128744884, "test/sim_max_reward_4400006": 0.2674633074636113, "test/sim_max_reward_4400007": 0.9495328760080773, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9260572138255585, "test/sim_max_reward_4400010": 0.9495077063996888, "test/sim_max_reward_4400011": 0.1559689870066942, "test/sim_max_reward_4400012": 0.972312149903957, "test/sim_max_reward_4400013": 0.8836459301001793, "test/sim_max_reward_4400014": 0.6754610088127978, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.09544660478522743, "test/sim_max_reward_4400017": 0.9675572493401308, "test/sim_max_reward_4400018": 0.31534069712198626, "test/sim_max_reward_4400019": 0.8979340496430193, "test/sim_max_reward_4400020": 0.9724209273806442, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9889170065258066, "test/sim_max_reward_4400023": 0.15341068810859368, "test/sim_max_reward_4400024": 0.5499156766358637, "test/sim_max_reward_4400025": 0.26627169817780055, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.011172541114991745, "test/sim_max_reward_4400028": 0.8542093146038275, "test/sim_max_reward_4400029": 0.49247708593476464, "test/sim_max_reward_4400030": 0.9921137301587181, "test/sim_max_reward_4400031": 0.9620643087554516, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9435463845145832, "test/sim_max_reward_4400034": 0.9812972116027984, "test/sim_max_reward_4400035": 0.39329564499528136, "test/sim_max_reward_4400036": 0.995312742777116, "test/sim_max_reward_4400037": 0.9507572908768536, "test/sim_max_reward_4400038": 0.9760914079208161, "test/sim_max_reward_4400039": 0.9236792368859568, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.8849163802495238, "test/sim_max_reward_4400043": 0.9774871121119272, "test/sim_max_reward_4400044": 0.8717731266825092, "test/sim_max_reward_4400045": 0.8637695884242577, "test/sim_max_reward_4400046": 0.9535825541769981, "test/sim_max_reward_4400047": 0.9842306656913654, "test/sim_max_reward_4400048": 0.9979980565401756, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.740993995553915, "test/mean_score": 0.6752072469998487, "val_loss": 68651.734375} {"train_loss": -6.887970924377441, "global_step": 172242, "epoch": 4101} {"train_loss": -7.0518598556518555, "global_step": 172243, "epoch": 4101} {"train_loss": -6.9247918128967285, "global_step": 172244, "epoch": 4101} {"train_loss": -6.955770015716553, "global_step": 172245, "epoch": 4101} {"train_loss": -7.074306488037109, "global_step": 172246, "epoch": 4101} {"train_loss": -6.870565414428711, "global_step": 172247, "epoch": 4101} {"train_loss": -6.926593780517578, "global_step": 172248, "epoch": 4101} {"train_loss": -6.98388671875, "global_step": 172249, "epoch": 4101} {"train_loss": -6.732725620269775, "global_step": 172250, "epoch": 4101} {"train_loss": -7.019956111907959, "global_step": 172251, "epoch": 4101} {"train_loss": -6.931634902954102, "global_step": 172252, "epoch": 4101} {"train_loss": -6.833669662475586, "global_step": 172253, "epoch": 4101} {"train_loss": -6.927623748779297, "global_step": 172254, "epoch": 4101} {"train_loss": -6.831003665924072, "global_step": 172255, "epoch": 4101} {"train_loss": -7.100647449493408, "global_step": 172256, "epoch": 4101} {"train_loss": -6.8342061042785645, "global_step": 172257, "epoch": 4101} {"train_loss": -6.948020935058594, "global_step": 172258, "epoch": 4101} {"train_loss": -6.871456146240234, "global_step": 172259, "epoch": 4101} {"train_loss": -7.008090972900391, "global_step": 172260, "epoch": 4101} {"train_loss": -7.018914222717285, "global_step": 172261, "epoch": 4101} {"train_loss": -7.1147003173828125, "global_step": 172262, "epoch": 4101} {"train_loss": -6.968094348907471, "global_step": 172263, "epoch": 4101} {"train_loss": -7.038994789123535, "global_step": 172264, "epoch": 4101} {"train_loss": -6.953729152679443, "global_step": 172265, "epoch": 4101} {"train_loss": -7.0652031898498535, "global_step": 172266, "epoch": 4101} {"train_loss": -7.022862434387207, "global_step": 172267, "epoch": 4101} {"train_loss": -7.078662395477295, "global_step": 172268, "epoch": 4101} {"train_loss": -7.014174461364746, "global_step": 172269, "epoch": 4101} {"train_loss": -6.8642425537109375, "global_step": 172270, "epoch": 4101} {"train_loss": -7.022911548614502, "global_step": 172271, "epoch": 4101} {"train_loss": -6.982694625854492, "global_step": 172272, "epoch": 4101} {"train_loss": -6.926814556121826, "global_step": 172273, "epoch": 4101} {"train_loss": -7.062167167663574, "global_step": 172274, "epoch": 4101} {"train_loss": -7.014383316040039, "global_step": 172275, "epoch": 4101} {"train_loss": -6.999709129333496, "global_step": 172276, "epoch": 4101} {"train_loss": -7.0102314949035645, "global_step": 172277, "epoch": 4101} {"train_loss": -6.960004806518555, "global_step": 172278, "epoch": 4101} {"train_loss": -7.0964460372924805, "global_step": 172279, "epoch": 4101} {"train_loss": -7.077043533325195, "global_step": 172280, "epoch": 4101} {"train_loss": -7.0711774826049805, "global_step": 172281, "epoch": 4101} {"train_loss": -7.102219581604004, "global_step": 172282, "epoch": 4101} {"train_loss": -6.978541987282889, "global_step": 172283, "epoch": 4101, "val_loss": 68559.0625} {"train_loss": -7.1216020584106445, "global_step": 172284, "epoch": 4102} {"train_loss": -6.921134948730469, "global_step": 172285, "epoch": 4102} {"train_loss": -7.084287643432617, "global_step": 172286, "epoch": 4102} {"train_loss": -6.981972694396973, "global_step": 172287, "epoch": 4102} {"train_loss": -6.999518394470215, "global_step": 172288, "epoch": 4102} {"train_loss": -7.023714065551758, "global_step": 172289, "epoch": 4102} {"train_loss": -6.973675727844238, "global_step": 172290, "epoch": 4102} {"train_loss": -6.958465099334717, "global_step": 172291, "epoch": 4102} {"train_loss": -7.074366569519043, "global_step": 172292, "epoch": 4102} {"train_loss": -7.056336402893066, "global_step": 172293, "epoch": 4102} {"train_loss": -7.102970600128174, "global_step": 172294, "epoch": 4102} {"train_loss": -7.126323699951172, "global_step": 172295, "epoch": 4102} {"train_loss": -7.047527313232422, "global_step": 172296, "epoch": 4102} {"train_loss": -7.015031337738037, "global_step": 172297, "epoch": 4102} {"train_loss": -6.937150001525879, "global_step": 172298, "epoch": 4102} {"train_loss": -7.0545148849487305, "global_step": 172299, "epoch": 4102} {"train_loss": -6.9668965339660645, "global_step": 172300, "epoch": 4102} {"train_loss": -7.000863552093506, "global_step": 172301, "epoch": 4102} {"train_loss": -7.101946830749512, "global_step": 172302, "epoch": 4102} {"train_loss": -6.994059085845947, "global_step": 172303, "epoch": 4102} {"train_loss": -6.939083099365234, "global_step": 172304, "epoch": 4102} {"train_loss": -6.915522575378418, "global_step": 172305, "epoch": 4102} {"train_loss": -6.812975883483887, "global_step": 172306, "epoch": 4102} {"train_loss": -6.928464889526367, "global_step": 172307, "epoch": 4102} {"train_loss": -6.9276123046875, "global_step": 172308, "epoch": 4102} {"train_loss": -6.907430648803711, "global_step": 172309, "epoch": 4102} {"train_loss": -6.9129204750061035, "global_step": 172310, "epoch": 4102} {"train_loss": -6.874326705932617, "global_step": 172311, "epoch": 4102} {"train_loss": -6.888025283813477, "global_step": 172312, "epoch": 4102} {"train_loss": -6.844971179962158, "global_step": 172313, "epoch": 4102} {"train_loss": -6.935174465179443, "global_step": 172314, "epoch": 4102} {"train_loss": -6.895839691162109, "global_step": 172315, "epoch": 4102} {"train_loss": -6.914990425109863, "global_step": 172316, "epoch": 4102} {"train_loss": -6.971434593200684, "global_step": 172317, "epoch": 4102} {"train_loss": -6.8811798095703125, "global_step": 172318, "epoch": 4102} {"train_loss": -7.005885601043701, "global_step": 172319, "epoch": 4102} {"train_loss": -6.939682960510254, "global_step": 172320, "epoch": 4102} {"train_loss": -7.034019470214844, "global_step": 172321, "epoch": 4102} {"train_loss": -6.895504951477051, "global_step": 172322, "epoch": 4102} {"train_loss": -7.083913803100586, "global_step": 172323, "epoch": 4102} {"train_loss": -6.933785438537598, "global_step": 172324, "epoch": 4102} {"train_loss": -6.975498222169422, "global_step": 172325, "epoch": 4102, "val_loss": 68539.984375} {"train_loss": -6.955339431762695, "global_step": 172326, "epoch": 4103} {"train_loss": -6.954769134521484, "global_step": 172327, "epoch": 4103} {"train_loss": -7.030709743499756, "global_step": 172328, "epoch": 4103} {"train_loss": -6.883545875549316, "global_step": 172329, "epoch": 4103} {"train_loss": -6.960174083709717, "global_step": 172330, "epoch": 4103} {"train_loss": -7.001787185668945, "global_step": 172331, "epoch": 4103} {"train_loss": -7.122757911682129, "global_step": 172332, "epoch": 4103} {"train_loss": -6.973672389984131, "global_step": 172333, "epoch": 4103} {"train_loss": -6.991943359375, "global_step": 172334, "epoch": 4103} {"train_loss": -6.896114349365234, "global_step": 172335, "epoch": 4103} {"train_loss": -7.052593231201172, "global_step": 172336, "epoch": 4103} {"train_loss": -7.05803108215332, "global_step": 172337, "epoch": 4103} {"train_loss": -7.069332122802734, "global_step": 172338, "epoch": 4103} {"train_loss": -6.990451812744141, "global_step": 172339, "epoch": 4103} {"train_loss": -7.048125267028809, "global_step": 172340, "epoch": 4103} {"train_loss": -6.954507827758789, "global_step": 172341, "epoch": 4103} {"train_loss": -6.963568210601807, "global_step": 172342, "epoch": 4103} {"train_loss": -6.960856914520264, "global_step": 172343, "epoch": 4103} {"train_loss": -7.009744644165039, "global_step": 172344, "epoch": 4103} {"train_loss": -6.914935111999512, "global_step": 172345, "epoch": 4103} {"train_loss": -7.020467281341553, "global_step": 172346, "epoch": 4103} {"train_loss": -6.943803787231445, "global_step": 172347, "epoch": 4103} {"train_loss": -6.955801010131836, "global_step": 172348, "epoch": 4103} {"train_loss": -6.96522331237793, "global_step": 172349, "epoch": 4103} {"train_loss": -6.954792499542236, "global_step": 172350, "epoch": 4103} {"train_loss": -6.991191864013672, "global_step": 172351, "epoch": 4103} {"train_loss": -7.0218610763549805, "global_step": 172352, "epoch": 4103} {"train_loss": -7.005795478820801, "global_step": 172353, "epoch": 4103} {"train_loss": -6.943343162536621, "global_step": 172354, "epoch": 4103} {"train_loss": -6.908287525177002, "global_step": 172355, "epoch": 4103} {"train_loss": -7.009877681732178, "global_step": 172356, "epoch": 4103} {"train_loss": -7.034717559814453, "global_step": 172357, "epoch": 4103} {"train_loss": -7.072553634643555, "global_step": 172358, "epoch": 4103} {"train_loss": -7.020778656005859, "global_step": 172359, "epoch": 4103} {"train_loss": -7.00968074798584, "global_step": 172360, "epoch": 4103} {"train_loss": -7.116994857788086, "global_step": 172361, "epoch": 4103} {"train_loss": -6.9309492111206055, "global_step": 172362, "epoch": 4103} {"train_loss": -6.999065399169922, "global_step": 172363, "epoch": 4103} {"train_loss": -7.01614236831665, "global_step": 172364, "epoch": 4103} {"train_loss": -6.885558605194092, "global_step": 172365, "epoch": 4103} {"train_loss": -7.114049911499023, "global_step": 172366, "epoch": 4103} {"train_loss": -6.99348319144476, "global_step": 172367, "epoch": 4103, "val_loss": 68524.5625} {"train_loss": -7.0873541831970215, "global_step": 172368, "epoch": 4104} {"train_loss": -7.074103355407715, "global_step": 172369, "epoch": 4104} {"train_loss": -7.073117256164551, "global_step": 172370, "epoch": 4104} {"train_loss": -7.058548927307129, "global_step": 172371, "epoch": 4104} {"train_loss": -6.97603702545166, "global_step": 172372, "epoch": 4104} {"train_loss": -7.020122528076172, "global_step": 172373, "epoch": 4104} {"train_loss": -7.1337504386901855, "global_step": 172374, "epoch": 4104} {"train_loss": -7.046502113342285, "global_step": 172375, "epoch": 4104} {"train_loss": -7.056363105773926, "global_step": 172376, "epoch": 4104} {"train_loss": -7.059854507446289, "global_step": 172377, "epoch": 4104} {"train_loss": -6.919253349304199, "global_step": 172378, "epoch": 4104} {"train_loss": -6.921338081359863, "global_step": 172379, "epoch": 4104} {"train_loss": -7.0208587646484375, "global_step": 172380, "epoch": 4104} {"train_loss": -7.0658111572265625, "global_step": 172381, "epoch": 4104} {"train_loss": -7.037339687347412, "global_step": 172382, "epoch": 4104} {"train_loss": -6.939937591552734, "global_step": 172383, "epoch": 4104} {"train_loss": -7.037960052490234, "global_step": 172384, "epoch": 4104} {"train_loss": -6.920599937438965, "global_step": 172385, "epoch": 4104} {"train_loss": -7.042761325836182, "global_step": 172386, "epoch": 4104} {"train_loss": -6.908889293670654, "global_step": 172387, "epoch": 4104} {"train_loss": -7.141912460327148, "global_step": 172388, "epoch": 4104} {"train_loss": -7.122476577758789, "global_step": 172389, "epoch": 4104} {"train_loss": -7.083347797393799, "global_step": 172390, "epoch": 4104} {"train_loss": -6.990976810455322, "global_step": 172391, "epoch": 4104} {"train_loss": -6.89149808883667, "global_step": 172392, "epoch": 4104} {"train_loss": -6.9416093826293945, "global_step": 172393, "epoch": 4104} {"train_loss": -7.002857208251953, "global_step": 172394, "epoch": 4104} {"train_loss": -6.983047962188721, "global_step": 172395, "epoch": 4104} {"train_loss": -6.896215438842773, "global_step": 172396, "epoch": 4104} {"train_loss": -6.898943901062012, "global_step": 172397, "epoch": 4104} {"train_loss": -7.040205955505371, "global_step": 172398, "epoch": 4104} {"train_loss": -7.059240341186523, "global_step": 172399, "epoch": 4104} {"train_loss": -6.904052734375, "global_step": 172400, "epoch": 4104} {"train_loss": -7.021726131439209, "global_step": 172401, "epoch": 4104} {"train_loss": -6.994133949279785, "global_step": 172402, "epoch": 4104} {"train_loss": -6.912545204162598, "global_step": 172403, "epoch": 4104} {"train_loss": -7.012810707092285, "global_step": 172404, "epoch": 4104} {"train_loss": -7.049306392669678, "global_step": 172405, "epoch": 4104} {"train_loss": -6.851615905761719, "global_step": 172406, "epoch": 4104} {"train_loss": -7.041444778442383, "global_step": 172407, "epoch": 4104} {"train_loss": -6.954935073852539, "global_step": 172408, "epoch": 4104} {"train_loss": -7.005480130513509, "global_step": 172409, "epoch": 4104, "val_loss": 68512.796875} {"train_loss": -6.982612133026123, "global_step": 172410, "epoch": 4105} {"train_loss": -6.904016494750977, "global_step": 172411, "epoch": 4105} {"train_loss": -7.012035369873047, "global_step": 172412, "epoch": 4105} {"train_loss": -6.927709579467773, "global_step": 172413, "epoch": 4105} {"train_loss": -6.903685569763184, "global_step": 172414, "epoch": 4105} {"train_loss": -7.00148868560791, "global_step": 172415, "epoch": 4105} {"train_loss": -7.034946441650391, "global_step": 172416, "epoch": 4105} {"train_loss": -6.953786849975586, "global_step": 172417, "epoch": 4105} {"train_loss": -7.011686325073242, "global_step": 172418, "epoch": 4105} {"train_loss": -7.094470024108887, "global_step": 172419, "epoch": 4105} {"train_loss": -6.911745548248291, "global_step": 172420, "epoch": 4105} {"train_loss": -7.020755290985107, "global_step": 172421, "epoch": 4105} {"train_loss": -7.035022735595703, "global_step": 172422, "epoch": 4105} {"train_loss": -7.0088324546813965, "global_step": 172423, "epoch": 4105} {"train_loss": -7.010449409484863, "global_step": 172424, "epoch": 4105} {"train_loss": -7.0619659423828125, "global_step": 172425, "epoch": 4105} {"train_loss": -6.959677696228027, "global_step": 172426, "epoch": 4105} {"train_loss": -6.893243312835693, "global_step": 172427, "epoch": 4105} {"train_loss": -6.876380920410156, "global_step": 172428, "epoch": 4105} {"train_loss": -7.0197906494140625, "global_step": 172429, "epoch": 4105} {"train_loss": -6.846836566925049, "global_step": 172430, "epoch": 4105} {"train_loss": -6.959662437438965, "global_step": 172431, "epoch": 4105} {"train_loss": -6.939061641693115, "global_step": 172432, "epoch": 4105} {"train_loss": -6.964230537414551, "global_step": 172433, "epoch": 4105} {"train_loss": -6.95742130279541, "global_step": 172434, "epoch": 4105} {"train_loss": -7.064913749694824, "global_step": 172435, "epoch": 4105} {"train_loss": -7.003416061401367, "global_step": 172436, "epoch": 4105} {"train_loss": -7.012330055236816, "global_step": 172437, "epoch": 4105} {"train_loss": -7.027865409851074, "global_step": 172438, "epoch": 4105} {"train_loss": -6.881889343261719, "global_step": 172439, "epoch": 4105} {"train_loss": -6.966803550720215, "global_step": 172440, "epoch": 4105} {"train_loss": -7.154512405395508, "global_step": 172441, "epoch": 4105} {"train_loss": -6.882336616516113, "global_step": 172442, "epoch": 4105} {"train_loss": -6.944272994995117, "global_step": 172443, "epoch": 4105} {"train_loss": -7.0439910888671875, "global_step": 172444, "epoch": 4105} {"train_loss": -6.827371120452881, "global_step": 172445, "epoch": 4105} {"train_loss": -6.930056571960449, "global_step": 172446, "epoch": 4105} {"train_loss": -7.057696342468262, "global_step": 172447, "epoch": 4105} {"train_loss": -6.88649320602417, "global_step": 172448, "epoch": 4105} {"train_loss": -6.983868598937988, "global_step": 172449, "epoch": 4105} {"train_loss": -6.867891788482666, "global_step": 172450, "epoch": 4105} {"train_loss": -6.970540568942115, "global_step": 172451, "epoch": 4105, "val_loss": 68667.3046875} {"train_loss": -7.016427993774414, "global_step": 172452, "epoch": 4106} {"train_loss": -6.8720245361328125, "global_step": 172453, "epoch": 4106} {"train_loss": -7.0401811599731445, "global_step": 172454, "epoch": 4106} {"train_loss": -6.88270378112793, "global_step": 172455, "epoch": 4106} {"train_loss": -6.816852569580078, "global_step": 172456, "epoch": 4106} {"train_loss": -7.109238624572754, "global_step": 172457, "epoch": 4106} {"train_loss": -6.9215850830078125, "global_step": 172458, "epoch": 4106} {"train_loss": -7.0644378662109375, "global_step": 172459, "epoch": 4106} {"train_loss": -6.978585720062256, "global_step": 172460, "epoch": 4106} {"train_loss": -7.0050787925720215, "global_step": 172461, "epoch": 4106} {"train_loss": -6.987920761108398, "global_step": 172462, "epoch": 4106} {"train_loss": -6.921828269958496, "global_step": 172463, "epoch": 4106} {"train_loss": -6.966095924377441, "global_step": 172464, "epoch": 4106} {"train_loss": -7.0461297035217285, "global_step": 172465, "epoch": 4106} {"train_loss": -6.905129909515381, "global_step": 172466, "epoch": 4106} {"train_loss": -7.032816410064697, "global_step": 172467, "epoch": 4106} {"train_loss": -6.934050559997559, "global_step": 172468, "epoch": 4106} {"train_loss": -6.97158145904541, "global_step": 172469, "epoch": 4106} {"train_loss": -6.9092559814453125, "global_step": 172470, "epoch": 4106} {"train_loss": -7.082831382751465, "global_step": 172471, "epoch": 4106} {"train_loss": -7.07900857925415, "global_step": 172472, "epoch": 4106} {"train_loss": -6.965373992919922, "global_step": 172473, "epoch": 4106} {"train_loss": -7.047032356262207, "global_step": 172474, "epoch": 4106} {"train_loss": -7.14832878112793, "global_step": 172475, "epoch": 4106} {"train_loss": -7.003161430358887, "global_step": 172476, "epoch": 4106} {"train_loss": -7.048740386962891, "global_step": 172477, "epoch": 4106} {"train_loss": -6.978167533874512, "global_step": 172478, "epoch": 4106} {"train_loss": -7.0045318603515625, "global_step": 172479, "epoch": 4106} {"train_loss": -7.0201029777526855, "global_step": 172480, "epoch": 4106} {"train_loss": -7.081966400146484, "global_step": 172481, "epoch": 4106} {"train_loss": -6.972562313079834, "global_step": 172482, "epoch": 4106} {"train_loss": -7.035390853881836, "global_step": 172483, "epoch": 4106} {"train_loss": -7.029934883117676, "global_step": 172484, "epoch": 4106} {"train_loss": -7.077990531921387, "global_step": 172485, "epoch": 4106} {"train_loss": -7.009578227996826, "global_step": 172486, "epoch": 4106} {"train_loss": -7.087018013000488, "global_step": 172487, "epoch": 4106} {"train_loss": -7.041562080383301, "global_step": 172488, "epoch": 4106} {"train_loss": -7.086248397827148, "global_step": 172489, "epoch": 4106} {"train_loss": -6.929680824279785, "global_step": 172490, "epoch": 4106} {"train_loss": -7.007920265197754, "global_step": 172491, "epoch": 4106} {"train_loss": -7.080201148986816, "global_step": 172492, "epoch": 4106} {"train_loss": -7.006874322891235, "global_step": 172493, "epoch": 4106, "val_loss": 68595.1875} {"train_loss": -7.1091413497924805, "global_step": 172494, "epoch": 4107} {"train_loss": -7.058143138885498, "global_step": 172495, "epoch": 4107} {"train_loss": -6.989221572875977, "global_step": 172496, "epoch": 4107} {"train_loss": -7.006811141967773, "global_step": 172497, "epoch": 4107} {"train_loss": -7.049022674560547, "global_step": 172498, "epoch": 4107} {"train_loss": -7.079507827758789, "global_step": 172499, "epoch": 4107} {"train_loss": -7.141113758087158, "global_step": 172500, "epoch": 4107} {"train_loss": -7.161182403564453, "global_step": 172501, "epoch": 4107} {"train_loss": -6.9932637214660645, "global_step": 172502, "epoch": 4107} {"train_loss": -7.07684326171875, "global_step": 172503, "epoch": 4107} {"train_loss": -6.916889190673828, "global_step": 172504, "epoch": 4107} {"train_loss": -7.010333061218262, "global_step": 172505, "epoch": 4107} {"train_loss": -7.09958553314209, "global_step": 172506, "epoch": 4107} {"train_loss": -6.960173606872559, "global_step": 172507, "epoch": 4107} {"train_loss": -7.023480415344238, "global_step": 172508, "epoch": 4107} {"train_loss": -6.9709320068359375, "global_step": 172509, "epoch": 4107} {"train_loss": -6.944281578063965, "global_step": 172510, "epoch": 4107} {"train_loss": -7.066251754760742, "global_step": 172511, "epoch": 4107} {"train_loss": -7.066920280456543, "global_step": 172512, "epoch": 4107} {"train_loss": -7.013250350952148, "global_step": 172513, "epoch": 4107} {"train_loss": -7.003275394439697, "global_step": 172514, "epoch": 4107} {"train_loss": -7.008567810058594, "global_step": 172515, "epoch": 4107} {"train_loss": -7.000446319580078, "global_step": 172516, "epoch": 4107} {"train_loss": -7.019301414489746, "global_step": 172517, "epoch": 4107} {"train_loss": -6.973599433898926, "global_step": 172518, "epoch": 4107} {"train_loss": -7.003787040710449, "global_step": 172519, "epoch": 4107} {"train_loss": -6.993803024291992, "global_step": 172520, "epoch": 4107} {"train_loss": -6.83684778213501, "global_step": 172521, "epoch": 4107} {"train_loss": -7.015511989593506, "global_step": 172522, "epoch": 4107} {"train_loss": -6.917272567749023, "global_step": 172523, "epoch": 4107} {"train_loss": -6.912890911102295, "global_step": 172524, "epoch": 4107} {"train_loss": -6.953001976013184, "global_step": 172525, "epoch": 4107} {"train_loss": -6.826543807983398, "global_step": 172526, "epoch": 4107} {"train_loss": -6.979240417480469, "global_step": 172527, "epoch": 4107} {"train_loss": -6.9833760261535645, "global_step": 172528, "epoch": 4107} {"train_loss": -6.945082187652588, "global_step": 172529, "epoch": 4107} {"train_loss": -7.014124870300293, "global_step": 172530, "epoch": 4107} {"train_loss": -6.9143571853637695, "global_step": 172531, "epoch": 4107} {"train_loss": -7.029731273651123, "global_step": 172532, "epoch": 4107} {"train_loss": -7.046204090118408, "global_step": 172533, "epoch": 4107} {"train_loss": -7.027645111083984, "global_step": 172534, "epoch": 4107} {"train_loss": -7.005805095036824, "global_step": 172535, "epoch": 4107, "val_loss": 68803.3359375} {"train_loss": -6.946516990661621, "global_step": 172536, "epoch": 4108} {"train_loss": -7.037891387939453, "global_step": 172537, "epoch": 4108} {"train_loss": -6.866296291351318, "global_step": 172538, "epoch": 4108} {"train_loss": -6.999243259429932, "global_step": 172539, "epoch": 4108} {"train_loss": -7.015914440155029, "global_step": 172540, "epoch": 4108} {"train_loss": -6.951466083526611, "global_step": 172541, "epoch": 4108} {"train_loss": -7.03717041015625, "global_step": 172542, "epoch": 4108} {"train_loss": -7.058236122131348, "global_step": 172543, "epoch": 4108} {"train_loss": -6.990998268127441, "global_step": 172544, "epoch": 4108} {"train_loss": -7.0167036056518555, "global_step": 172545, "epoch": 4108} {"train_loss": -6.965312957763672, "global_step": 172546, "epoch": 4108} {"train_loss": -7.085671901702881, "global_step": 172547, "epoch": 4108} {"train_loss": -6.924125671386719, "global_step": 172548, "epoch": 4108} {"train_loss": -7.067901134490967, "global_step": 172549, "epoch": 4108} {"train_loss": -7.021663188934326, "global_step": 172550, "epoch": 4108} {"train_loss": -6.976003646850586, "global_step": 172551, "epoch": 4108} {"train_loss": -7.130128860473633, "global_step": 172552, "epoch": 4108} {"train_loss": -7.0490193367004395, "global_step": 172553, "epoch": 4108} {"train_loss": -6.973151206970215, "global_step": 172554, "epoch": 4108} {"train_loss": -7.046184062957764, "global_step": 172555, "epoch": 4108} {"train_loss": -6.96922492980957, "global_step": 172556, "epoch": 4108} {"train_loss": -6.863145351409912, "global_step": 172557, "epoch": 4108} {"train_loss": -6.938909530639648, "global_step": 172558, "epoch": 4108} {"train_loss": -7.064019680023193, "global_step": 172559, "epoch": 4108} {"train_loss": -6.877955436706543, "global_step": 172560, "epoch": 4108} {"train_loss": -6.873140335083008, "global_step": 172561, "epoch": 4108} {"train_loss": -6.974742889404297, "global_step": 172562, "epoch": 4108} {"train_loss": -6.931134223937988, "global_step": 172563, "epoch": 4108} {"train_loss": -6.874792098999023, "global_step": 172564, "epoch": 4108} {"train_loss": -6.918623924255371, "global_step": 172565, "epoch": 4108} {"train_loss": -7.018126487731934, "global_step": 172566, "epoch": 4108} {"train_loss": -7.109112739562988, "global_step": 172567, "epoch": 4108} {"train_loss": -7.036116600036621, "global_step": 172568, "epoch": 4108} {"train_loss": -6.87606143951416, "global_step": 172569, "epoch": 4108} {"train_loss": -6.896847724914551, "global_step": 172570, "epoch": 4108} {"train_loss": -6.892936706542969, "global_step": 172571, "epoch": 4108} {"train_loss": -7.024702072143555, "global_step": 172572, "epoch": 4108} {"train_loss": -7.062914848327637, "global_step": 172573, "epoch": 4108} {"train_loss": -7.0058112144470215, "global_step": 172574, "epoch": 4108} {"train_loss": -6.990904808044434, "global_step": 172575, "epoch": 4108} {"train_loss": -7.079473972320557, "global_step": 172576, "epoch": 4108} {"train_loss": -6.988682349522908, "global_step": 172577, "epoch": 4108, "val_loss": 68795.9375} {"train_loss": -7.009459972381592, "global_step": 172578, "epoch": 4109} {"train_loss": -7.101518630981445, "global_step": 172579, "epoch": 4109} {"train_loss": -7.0351715087890625, "global_step": 172580, "epoch": 4109} {"train_loss": -7.181125640869141, "global_step": 172581, "epoch": 4109} {"train_loss": -6.983137130737305, "global_step": 172582, "epoch": 4109} {"train_loss": -7.054487228393555, "global_step": 172583, "epoch": 4109} {"train_loss": -7.15118408203125, "global_step": 172584, "epoch": 4109} {"train_loss": -7.096649646759033, "global_step": 172585, "epoch": 4109} {"train_loss": -6.979506492614746, "global_step": 172586, "epoch": 4109} {"train_loss": -7.065630912780762, "global_step": 172587, "epoch": 4109} {"train_loss": -7.03432559967041, "global_step": 172588, "epoch": 4109} {"train_loss": -7.036582946777344, "global_step": 172589, "epoch": 4109} {"train_loss": -7.098086833953857, "global_step": 172590, "epoch": 4109} {"train_loss": -7.058056354522705, "global_step": 172591, "epoch": 4109} {"train_loss": -7.073575019836426, "global_step": 172592, "epoch": 4109} {"train_loss": -6.860896110534668, "global_step": 172593, "epoch": 4109} {"train_loss": -7.1159586906433105, "global_step": 172594, "epoch": 4109} {"train_loss": -7.061787128448486, "global_step": 172595, "epoch": 4109} {"train_loss": -6.978710174560547, "global_step": 172596, "epoch": 4109} {"train_loss": -6.938963413238525, "global_step": 172597, "epoch": 4109} {"train_loss": -6.924394607543945, "global_step": 172598, "epoch": 4109} {"train_loss": -7.100632667541504, "global_step": 172599, "epoch": 4109} {"train_loss": -6.957911491394043, "global_step": 172600, "epoch": 4109} {"train_loss": -7.051933765411377, "global_step": 172601, "epoch": 4109} {"train_loss": -7.039061069488525, "global_step": 172602, "epoch": 4109} {"train_loss": -6.930553913116455, "global_step": 172603, "epoch": 4109} {"train_loss": -6.987815856933594, "global_step": 172604, "epoch": 4109} {"train_loss": -7.0681867599487305, "global_step": 172605, "epoch": 4109} {"train_loss": -6.919412612915039, "global_step": 172606, "epoch": 4109} {"train_loss": -6.958365440368652, "global_step": 172607, "epoch": 4109} {"train_loss": -7.031980991363525, "global_step": 172608, "epoch": 4109} {"train_loss": -6.905487060546875, "global_step": 172609, "epoch": 4109} {"train_loss": -6.992445945739746, "global_step": 172610, "epoch": 4109} {"train_loss": -6.904201030731201, "global_step": 172611, "epoch": 4109} {"train_loss": -6.795407295227051, "global_step": 172612, "epoch": 4109} {"train_loss": -7.0506744384765625, "global_step": 172613, "epoch": 4109} {"train_loss": -6.930081367492676, "global_step": 172614, "epoch": 4109} {"train_loss": -7.01572322845459, "global_step": 172615, "epoch": 4109} {"train_loss": -6.907801628112793, "global_step": 172616, "epoch": 4109} {"train_loss": -6.869884490966797, "global_step": 172617, "epoch": 4109} {"train_loss": -6.96408748626709, "global_step": 172618, "epoch": 4109} {"train_loss": -7.002919026783535, "global_step": 172619, "epoch": 4109, "val_loss": 68480.71875} {"train_loss": -6.914991855621338, "global_step": 172620, "epoch": 4110} {"train_loss": -6.815710067749023, "global_step": 172621, "epoch": 4110} {"train_loss": -6.934652328491211, "global_step": 172622, "epoch": 4110} {"train_loss": -6.892234802246094, "global_step": 172623, "epoch": 4110} {"train_loss": -7.001838684082031, "global_step": 172624, "epoch": 4110} {"train_loss": -6.941484451293945, "global_step": 172625, "epoch": 4110} {"train_loss": -6.939932823181152, "global_step": 172626, "epoch": 4110} {"train_loss": -6.9336957931518555, "global_step": 172627, "epoch": 4110} {"train_loss": -7.0737175941467285, "global_step": 172628, "epoch": 4110} {"train_loss": -7.044825553894043, "global_step": 172629, "epoch": 4110} {"train_loss": -6.96367883682251, "global_step": 172630, "epoch": 4110} {"train_loss": -6.963891983032227, "global_step": 172631, "epoch": 4110} {"train_loss": -6.971005916595459, "global_step": 172632, "epoch": 4110} {"train_loss": -6.9978227615356445, "global_step": 172633, "epoch": 4110} {"train_loss": -7.056746482849121, "global_step": 172634, "epoch": 4110} {"train_loss": -6.919522285461426, "global_step": 172635, "epoch": 4110} {"train_loss": -6.98045539855957, "global_step": 172636, "epoch": 4110} {"train_loss": -6.97074031829834, "global_step": 172637, "epoch": 4110} {"train_loss": -6.913509845733643, "global_step": 172638, "epoch": 4110} {"train_loss": -6.977627754211426, "global_step": 172639, "epoch": 4110} {"train_loss": -7.04442024230957, "global_step": 172640, "epoch": 4110} {"train_loss": -6.940524101257324, "global_step": 172641, "epoch": 4110} {"train_loss": -6.958232879638672, "global_step": 172642, "epoch": 4110} {"train_loss": -6.979398250579834, "global_step": 172643, "epoch": 4110} {"train_loss": -6.974004745483398, "global_step": 172644, "epoch": 4110} {"train_loss": -7.109757423400879, "global_step": 172645, "epoch": 4110} {"train_loss": -6.967929840087891, "global_step": 172646, "epoch": 4110} {"train_loss": -7.147547721862793, "global_step": 172647, "epoch": 4110} {"train_loss": -7.0191450119018555, "global_step": 172648, "epoch": 4110} {"train_loss": -7.054955959320068, "global_step": 172649, "epoch": 4110} {"train_loss": -6.976065635681152, "global_step": 172650, "epoch": 4110} {"train_loss": -6.98345947265625, "global_step": 172651, "epoch": 4110} {"train_loss": -7.0948381423950195, "global_step": 172652, "epoch": 4110} {"train_loss": -7.022961616516113, "global_step": 172653, "epoch": 4110} {"train_loss": -7.019162178039551, "global_step": 172654, "epoch": 4110} {"train_loss": -7.025498390197754, "global_step": 172655, "epoch": 4110} {"train_loss": -7.186614990234375, "global_step": 172656, "epoch": 4110} {"train_loss": -6.99971342086792, "global_step": 172657, "epoch": 4110} {"train_loss": -6.944438457489014, "global_step": 172658, "epoch": 4110} {"train_loss": -7.115150451660156, "global_step": 172659, "epoch": 4110} {"train_loss": -6.979147911071777, "global_step": 172660, "epoch": 4110} {"train_loss": -6.996342307045346, "global_step": 172661, "epoch": 4110, "val_loss": 68476.9609375} {"train_loss": -7.108053207397461, "global_step": 172662, "epoch": 4111} {"train_loss": -7.009805202484131, "global_step": 172663, "epoch": 4111} {"train_loss": -7.168728828430176, "global_step": 172664, "epoch": 4111} {"train_loss": -7.128683090209961, "global_step": 172665, "epoch": 4111} {"train_loss": -7.110055446624756, "global_step": 172666, "epoch": 4111} {"train_loss": -7.173372268676758, "global_step": 172667, "epoch": 4111} {"train_loss": -7.001603603363037, "global_step": 172668, "epoch": 4111} {"train_loss": -7.085386276245117, "global_step": 172669, "epoch": 4111} {"train_loss": -7.087557315826416, "global_step": 172670, "epoch": 4111} {"train_loss": -7.028381824493408, "global_step": 172671, "epoch": 4111} {"train_loss": -7.155045509338379, "global_step": 172672, "epoch": 4111} {"train_loss": -7.046638488769531, "global_step": 172673, "epoch": 4111} {"train_loss": -7.11397123336792, "global_step": 172674, "epoch": 4111} {"train_loss": -7.064911842346191, "global_step": 172675, "epoch": 4111} {"train_loss": -7.119802951812744, "global_step": 172676, "epoch": 4111} {"train_loss": -7.060625076293945, "global_step": 172677, "epoch": 4111} {"train_loss": -7.14642333984375, "global_step": 172678, "epoch": 4111} {"train_loss": -6.974671363830566, "global_step": 172679, "epoch": 4111} {"train_loss": -7.097800254821777, "global_step": 172680, "epoch": 4111} {"train_loss": -6.963526248931885, "global_step": 172681, "epoch": 4111} {"train_loss": -7.030580520629883, "global_step": 172682, "epoch": 4111} {"train_loss": -7.018741607666016, "global_step": 172683, "epoch": 4111} {"train_loss": -7.051710605621338, "global_step": 172684, "epoch": 4111} {"train_loss": -7.074939727783203, "global_step": 172685, "epoch": 4111} {"train_loss": -6.999027252197266, "global_step": 172686, "epoch": 4111} {"train_loss": -7.075017929077148, "global_step": 172687, "epoch": 4111} {"train_loss": -7.161170959472656, "global_step": 172688, "epoch": 4111} {"train_loss": -7.026722431182861, "global_step": 172689, "epoch": 4111} {"train_loss": -7.12736701965332, "global_step": 172690, "epoch": 4111} {"train_loss": -7.063541889190674, "global_step": 172691, "epoch": 4111} {"train_loss": -7.101808071136475, "global_step": 172692, "epoch": 4111} {"train_loss": -7.162158966064453, "global_step": 172693, "epoch": 4111} {"train_loss": -7.072004795074463, "global_step": 172694, "epoch": 4111} {"train_loss": -7.0979228019714355, "global_step": 172695, "epoch": 4111} {"train_loss": -7.107729911804199, "global_step": 172696, "epoch": 4111} {"train_loss": -7.108710765838623, "global_step": 172697, "epoch": 4111} {"train_loss": -6.950048923492432, "global_step": 172698, "epoch": 4111} {"train_loss": -6.942418098449707, "global_step": 172699, "epoch": 4111} {"train_loss": -7.042479038238525, "global_step": 172700, "epoch": 4111} {"train_loss": -6.992252349853516, "global_step": 172701, "epoch": 4111} {"train_loss": -6.995878219604492, "global_step": 172702, "epoch": 4111} {"train_loss": -7.062511137553623, "global_step": 172703, "epoch": 4111, "val_loss": 68666.1875} {"train_loss": -6.999949932098389, "global_step": 172704, "epoch": 4112} {"train_loss": -7.079980373382568, "global_step": 172705, "epoch": 4112} {"train_loss": -7.019269943237305, "global_step": 172706, "epoch": 4112} {"train_loss": -7.085843086242676, "global_step": 172707, "epoch": 4112} {"train_loss": -6.899941921234131, "global_step": 172708, "epoch": 4112} {"train_loss": -6.9158172607421875, "global_step": 172709, "epoch": 4112} {"train_loss": -6.974363327026367, "global_step": 172710, "epoch": 4112} {"train_loss": -7.0590033531188965, "global_step": 172711, "epoch": 4112} {"train_loss": -6.87283992767334, "global_step": 172712, "epoch": 4112} {"train_loss": -6.995963096618652, "global_step": 172713, "epoch": 4112} {"train_loss": -7.023584842681885, "global_step": 172714, "epoch": 4112} {"train_loss": -6.891910076141357, "global_step": 172715, "epoch": 4112} {"train_loss": -7.067904472351074, "global_step": 172716, "epoch": 4112} {"train_loss": -6.8924150466918945, "global_step": 172717, "epoch": 4112} {"train_loss": -6.8095855712890625, "global_step": 172718, "epoch": 4112} {"train_loss": -6.993655204772949, "global_step": 172719, "epoch": 4112} {"train_loss": -6.807761192321777, "global_step": 172720, "epoch": 4112} {"train_loss": -6.910829544067383, "global_step": 172721, "epoch": 4112} {"train_loss": -6.926512718200684, "global_step": 172722, "epoch": 4112} {"train_loss": -6.846292495727539, "global_step": 172723, "epoch": 4112} {"train_loss": -6.910204887390137, "global_step": 172724, "epoch": 4112} {"train_loss": -6.986023902893066, "global_step": 172725, "epoch": 4112} {"train_loss": -6.945505142211914, "global_step": 172726, "epoch": 4112} {"train_loss": -7.018771648406982, "global_step": 172727, "epoch": 4112} {"train_loss": -6.960147380828857, "global_step": 172728, "epoch": 4112} {"train_loss": -6.900787830352783, "global_step": 172729, "epoch": 4112} {"train_loss": -7.021261215209961, "global_step": 172730, "epoch": 4112} {"train_loss": -6.838382720947266, "global_step": 172731, "epoch": 4112} {"train_loss": -6.958917617797852, "global_step": 172732, "epoch": 4112} {"train_loss": -6.976281642913818, "global_step": 172733, "epoch": 4112} {"train_loss": -6.878769397735596, "global_step": 172734, "epoch": 4112} {"train_loss": -6.978505611419678, "global_step": 172735, "epoch": 4112} {"train_loss": -6.8786773681640625, "global_step": 172736, "epoch": 4112} {"train_loss": -6.939747333526611, "global_step": 172737, "epoch": 4112} {"train_loss": -6.84804630279541, "global_step": 172738, "epoch": 4112} {"train_loss": -6.756467819213867, "global_step": 172739, "epoch": 4112} {"train_loss": -6.934815406799316, "global_step": 172740, "epoch": 4112} {"train_loss": -6.793946266174316, "global_step": 172741, "epoch": 4112} {"train_loss": -6.6959357261657715, "global_step": 172742, "epoch": 4112} {"train_loss": -6.734458923339844, "global_step": 172743, "epoch": 4112} {"train_loss": -6.674500942230225, "global_step": 172744, "epoch": 4112} {"train_loss": -6.916585763295491, "global_step": 172745, "epoch": 4112, "val_loss": 68481.53125} {"train_loss": -6.955902099609375, "global_step": 172746, "epoch": 4113} {"train_loss": -6.713349342346191, "global_step": 172747, "epoch": 4113} {"train_loss": -6.945586204528809, "global_step": 172748, "epoch": 4113} {"train_loss": -6.889505863189697, "global_step": 172749, "epoch": 4113} {"train_loss": -6.878060340881348, "global_step": 172750, "epoch": 4113} {"train_loss": -6.818358898162842, "global_step": 172751, "epoch": 4113} {"train_loss": -6.842423439025879, "global_step": 172752, "epoch": 4113} {"train_loss": -6.771137237548828, "global_step": 172753, "epoch": 4113} {"train_loss": -6.704409122467041, "global_step": 172754, "epoch": 4113} {"train_loss": -6.884528160095215, "global_step": 172755, "epoch": 4113} {"train_loss": -6.968657493591309, "global_step": 172756, "epoch": 4113} {"train_loss": -6.893363952636719, "global_step": 172757, "epoch": 4113} {"train_loss": -6.915968894958496, "global_step": 172758, "epoch": 4113} {"train_loss": -6.841708660125732, "global_step": 172759, "epoch": 4113} {"train_loss": -6.922228813171387, "global_step": 172760, "epoch": 4113} {"train_loss": -6.913147926330566, "global_step": 172761, "epoch": 4113} {"train_loss": -6.841588020324707, "global_step": 172762, "epoch": 4113} {"train_loss": -6.830746650695801, "global_step": 172763, "epoch": 4113} {"train_loss": -6.88990592956543, "global_step": 172764, "epoch": 4113} {"train_loss": -6.964370250701904, "global_step": 172765, "epoch": 4113} {"train_loss": -6.860506057739258, "global_step": 172766, "epoch": 4113} {"train_loss": -7.043690204620361, "global_step": 172767, "epoch": 4113} {"train_loss": -6.892848014831543, "global_step": 172768, "epoch": 4113} {"train_loss": -6.821512699127197, "global_step": 172769, "epoch": 4113} {"train_loss": -6.868241310119629, "global_step": 172770, "epoch": 4113} {"train_loss": -6.9559006690979, "global_step": 172771, "epoch": 4113} {"train_loss": -6.893049716949463, "global_step": 172772, "epoch": 4113} {"train_loss": -6.983310699462891, "global_step": 172773, "epoch": 4113} {"train_loss": -6.827592849731445, "global_step": 172774, "epoch": 4113} {"train_loss": -6.976190567016602, "global_step": 172775, "epoch": 4113} {"train_loss": -6.911174297332764, "global_step": 172776, "epoch": 4113} {"train_loss": -6.955148696899414, "global_step": 172777, "epoch": 4113} {"train_loss": -6.872332572937012, "global_step": 172778, "epoch": 4113} {"train_loss": -6.769305229187012, "global_step": 172779, "epoch": 4113} {"train_loss": -6.915850639343262, "global_step": 172780, "epoch": 4113} {"train_loss": -6.87838077545166, "global_step": 172781, "epoch": 4113} {"train_loss": -6.91484260559082, "global_step": 172782, "epoch": 4113} {"train_loss": -6.981083869934082, "global_step": 172783, "epoch": 4113} {"train_loss": -6.9692182540893555, "global_step": 172784, "epoch": 4113} {"train_loss": -6.786857604980469, "global_step": 172785, "epoch": 4113} {"train_loss": -7.0628767013549805, "global_step": 172786, "epoch": 4113} {"train_loss": -6.8912013825916105, "global_step": 172787, "epoch": 4113, "val_loss": 68641.3515625} {"train_loss": -6.924769401550293, "global_step": 172788, "epoch": 4114} {"train_loss": -6.996260166168213, "global_step": 172789, "epoch": 4114} {"train_loss": -6.936357021331787, "global_step": 172790, "epoch": 4114} {"train_loss": -7.042486667633057, "global_step": 172791, "epoch": 4114} {"train_loss": -7.043082237243652, "global_step": 172792, "epoch": 4114} {"train_loss": -7.0231099128723145, "global_step": 172793, "epoch": 4114} {"train_loss": -7.0184478759765625, "global_step": 172794, "epoch": 4114} {"train_loss": -7.066336631774902, "global_step": 172795, "epoch": 4114} {"train_loss": -6.951709747314453, "global_step": 172796, "epoch": 4114} {"train_loss": -6.928643226623535, "global_step": 172797, "epoch": 4114} {"train_loss": -7.109952926635742, "global_step": 172798, "epoch": 4114} {"train_loss": -6.951637268066406, "global_step": 172799, "epoch": 4114} {"train_loss": -6.9498701095581055, "global_step": 172800, "epoch": 4114} {"train_loss": -6.7833452224731445, "global_step": 172801, "epoch": 4114} {"train_loss": -7.128671646118164, "global_step": 172802, "epoch": 4114} {"train_loss": -6.960145950317383, "global_step": 172803, "epoch": 4114} {"train_loss": -7.047035217285156, "global_step": 172804, "epoch": 4114} {"train_loss": -6.895203590393066, "global_step": 172805, "epoch": 4114} {"train_loss": -6.914349555969238, "global_step": 172806, "epoch": 4114} {"train_loss": -7.018399715423584, "global_step": 172807, "epoch": 4114} {"train_loss": -6.933067798614502, "global_step": 172808, "epoch": 4114} {"train_loss": -6.914079666137695, "global_step": 172809, "epoch": 4114} {"train_loss": -6.929645538330078, "global_step": 172810, "epoch": 4114} {"train_loss": -6.939629554748535, "global_step": 172811, "epoch": 4114} {"train_loss": -6.919467926025391, "global_step": 172812, "epoch": 4114} {"train_loss": -6.988239765167236, "global_step": 172813, "epoch": 4114} {"train_loss": -7.040181636810303, "global_step": 172814, "epoch": 4114} {"train_loss": -6.946501731872559, "global_step": 172815, "epoch": 4114} {"train_loss": -6.9556427001953125, "global_step": 172816, "epoch": 4114} {"train_loss": -6.932191848754883, "global_step": 172817, "epoch": 4114} {"train_loss": -7.089626312255859, "global_step": 172818, "epoch": 4114} {"train_loss": -7.065230369567871, "global_step": 172819, "epoch": 4114} {"train_loss": -6.942095756530762, "global_step": 172820, "epoch": 4114} {"train_loss": -6.96779203414917, "global_step": 172821, "epoch": 4114} {"train_loss": -6.957629203796387, "global_step": 172822, "epoch": 4114} {"train_loss": -6.979422569274902, "global_step": 172823, "epoch": 4114} {"train_loss": -6.98868465423584, "global_step": 172824, "epoch": 4114} {"train_loss": -6.963671684265137, "global_step": 172825, "epoch": 4114} {"train_loss": -6.928232669830322, "global_step": 172826, "epoch": 4114} {"train_loss": -7.0114641189575195, "global_step": 172827, "epoch": 4114} {"train_loss": -6.9436116218566895, "global_step": 172828, "epoch": 4114} {"train_loss": -6.9718177772703624, "global_step": 172829, "epoch": 4114, "val_loss": 68586.3125} {"train_loss": -6.898963451385498, "global_step": 172830, "epoch": 4115} {"train_loss": -6.942904472351074, "global_step": 172831, "epoch": 4115} {"train_loss": -7.074456214904785, "global_step": 172832, "epoch": 4115} {"train_loss": -6.989433288574219, "global_step": 172833, "epoch": 4115} {"train_loss": -6.927196979522705, "global_step": 172834, "epoch": 4115} {"train_loss": -6.937536239624023, "global_step": 172835, "epoch": 4115} {"train_loss": -6.938348770141602, "global_step": 172836, "epoch": 4115} {"train_loss": -7.018698692321777, "global_step": 172837, "epoch": 4115} {"train_loss": -6.990280628204346, "global_step": 172838, "epoch": 4115} {"train_loss": -7.072867393493652, "global_step": 172839, "epoch": 4115} {"train_loss": -7.055256366729736, "global_step": 172840, "epoch": 4115} {"train_loss": -7.005146503448486, "global_step": 172841, "epoch": 4115} {"train_loss": -7.084439754486084, "global_step": 172842, "epoch": 4115} {"train_loss": -6.99350118637085, "global_step": 172843, "epoch": 4115} {"train_loss": -6.960148334503174, "global_step": 172844, "epoch": 4115} {"train_loss": -6.99998140335083, "global_step": 172845, "epoch": 4115} {"train_loss": -6.875041961669922, "global_step": 172846, "epoch": 4115} {"train_loss": -7.059272766113281, "global_step": 172847, "epoch": 4115} {"train_loss": -7.0705037117004395, "global_step": 172848, "epoch": 4115} {"train_loss": -6.930703163146973, "global_step": 172849, "epoch": 4115} {"train_loss": -7.108321189880371, "global_step": 172850, "epoch": 4115} {"train_loss": -7.0879106521606445, "global_step": 172851, "epoch": 4115} {"train_loss": -6.9787983894348145, "global_step": 172852, "epoch": 4115} {"train_loss": -7.043700695037842, "global_step": 172853, "epoch": 4115} {"train_loss": -6.905885696411133, "global_step": 172854, "epoch": 4115} {"train_loss": -7.134888172149658, "global_step": 172855, "epoch": 4115} {"train_loss": -7.004038333892822, "global_step": 172856, "epoch": 4115} {"train_loss": -7.086607933044434, "global_step": 172857, "epoch": 4115} {"train_loss": -6.986652374267578, "global_step": 172858, "epoch": 4115} {"train_loss": -7.051905632019043, "global_step": 172859, "epoch": 4115} {"train_loss": -7.0174455642700195, "global_step": 172860, "epoch": 4115} {"train_loss": -7.051048755645752, "global_step": 172861, "epoch": 4115} {"train_loss": -6.959836959838867, "global_step": 172862, "epoch": 4115} {"train_loss": -6.91520881652832, "global_step": 172863, "epoch": 4115} {"train_loss": -6.931227684020996, "global_step": 172864, "epoch": 4115} {"train_loss": -7.069005012512207, "global_step": 172865, "epoch": 4115} {"train_loss": -7.05837345123291, "global_step": 172866, "epoch": 4115} {"train_loss": -7.040105819702148, "global_step": 172867, "epoch": 4115} {"train_loss": -7.034917831420898, "global_step": 172868, "epoch": 4115} {"train_loss": -7.126278400421143, "global_step": 172869, "epoch": 4115} {"train_loss": -6.855310440063477, "global_step": 172870, "epoch": 4115} {"train_loss": -7.005563349950881, "global_step": 172871, "epoch": 4115, "val_loss": 68566.4921875} {"train_loss": -6.978696346282959, "global_step": 172872, "epoch": 4116} {"train_loss": -6.946789264678955, "global_step": 172873, "epoch": 4116} {"train_loss": -7.061074733734131, "global_step": 172874, "epoch": 4116} {"train_loss": -7.029092311859131, "global_step": 172875, "epoch": 4116} {"train_loss": -7.009499549865723, "global_step": 172876, "epoch": 4116} {"train_loss": -7.018986701965332, "global_step": 172877, "epoch": 4116} {"train_loss": -7.031749725341797, "global_step": 172878, "epoch": 4116} {"train_loss": -7.028367519378662, "global_step": 172879, "epoch": 4116} {"train_loss": -7.0604472160339355, "global_step": 172880, "epoch": 4116} {"train_loss": -7.022774696350098, "global_step": 172881, "epoch": 4116} {"train_loss": -7.030794620513916, "global_step": 172882, "epoch": 4116} {"train_loss": -7.0328264236450195, "global_step": 172883, "epoch": 4116} {"train_loss": -6.967416763305664, "global_step": 172884, "epoch": 4116} {"train_loss": -6.967069149017334, "global_step": 172885, "epoch": 4116} {"train_loss": -7.056835174560547, "global_step": 172886, "epoch": 4116} {"train_loss": -6.966732025146484, "global_step": 172887, "epoch": 4116} {"train_loss": -6.906435966491699, "global_step": 172888, "epoch": 4116} {"train_loss": -7.011971473693848, "global_step": 172889, "epoch": 4116} {"train_loss": -7.118160247802734, "global_step": 172890, "epoch": 4116} {"train_loss": -7.147974967956543, "global_step": 172891, "epoch": 4116} {"train_loss": -6.961259841918945, "global_step": 172892, "epoch": 4116} {"train_loss": -7.058563232421875, "global_step": 172893, "epoch": 4116} {"train_loss": -7.004202842712402, "global_step": 172894, "epoch": 4116} {"train_loss": -7.003608703613281, "global_step": 172895, "epoch": 4116} {"train_loss": -7.067658424377441, "global_step": 172896, "epoch": 4116} {"train_loss": -6.986088275909424, "global_step": 172897, "epoch": 4116} {"train_loss": -7.008903503417969, "global_step": 172898, "epoch": 4116} {"train_loss": -6.942337989807129, "global_step": 172899, "epoch": 4116} {"train_loss": -7.026693344116211, "global_step": 172900, "epoch": 4116} {"train_loss": -7.04793643951416, "global_step": 172901, "epoch": 4116} {"train_loss": -6.973563194274902, "global_step": 172902, "epoch": 4116} {"train_loss": -6.999569892883301, "global_step": 172903, "epoch": 4116} {"train_loss": -6.947562217712402, "global_step": 172904, "epoch": 4116} {"train_loss": -6.789188385009766, "global_step": 172905, "epoch": 4116} {"train_loss": -6.885236740112305, "global_step": 172906, "epoch": 4116} {"train_loss": -7.101719856262207, "global_step": 172907, "epoch": 4116} {"train_loss": -6.989855766296387, "global_step": 172908, "epoch": 4116} {"train_loss": -6.906928539276123, "global_step": 172909, "epoch": 4116} {"train_loss": -6.935311317443848, "global_step": 172910, "epoch": 4116} {"train_loss": -7.068044662475586, "global_step": 172911, "epoch": 4116} {"train_loss": -6.973419189453125, "global_step": 172912, "epoch": 4116} {"train_loss": -7.00369507925851, "global_step": 172913, "epoch": 4116, "val_loss": 68709.1640625} {"train_loss": -6.9904584884643555, "global_step": 172914, "epoch": 4117} {"train_loss": -6.977518081665039, "global_step": 172915, "epoch": 4117} {"train_loss": -6.944910049438477, "global_step": 172916, "epoch": 4117} {"train_loss": -7.005867004394531, "global_step": 172917, "epoch": 4117} {"train_loss": -7.005013465881348, "global_step": 172918, "epoch": 4117} {"train_loss": -7.049412727355957, "global_step": 172919, "epoch": 4117} {"train_loss": -6.917585372924805, "global_step": 172920, "epoch": 4117} {"train_loss": -7.025930404663086, "global_step": 172921, "epoch": 4117} {"train_loss": -6.998147487640381, "global_step": 172922, "epoch": 4117} {"train_loss": -6.889623641967773, "global_step": 172923, "epoch": 4117} {"train_loss": -7.013256072998047, "global_step": 172924, "epoch": 4117} {"train_loss": -6.8894195556640625, "global_step": 172925, "epoch": 4117} {"train_loss": -7.023872375488281, "global_step": 172926, "epoch": 4117} {"train_loss": -6.91002082824707, "global_step": 172927, "epoch": 4117} {"train_loss": -7.076706409454346, "global_step": 172928, "epoch": 4117} {"train_loss": -6.990350246429443, "global_step": 172929, "epoch": 4117} {"train_loss": -7.035761833190918, "global_step": 172930, "epoch": 4117} {"train_loss": -7.101863861083984, "global_step": 172931, "epoch": 4117} {"train_loss": -6.980204105377197, "global_step": 172932, "epoch": 4117} {"train_loss": -7.001604080200195, "global_step": 172933, "epoch": 4117} {"train_loss": -6.948127746582031, "global_step": 172934, "epoch": 4117} {"train_loss": -7.084659099578857, "global_step": 172935, "epoch": 4117} {"train_loss": -7.066372871398926, "global_step": 172936, "epoch": 4117} {"train_loss": -7.112349510192871, "global_step": 172937, "epoch": 4117} {"train_loss": -7.115945816040039, "global_step": 172938, "epoch": 4117} {"train_loss": -7.013772487640381, "global_step": 172939, "epoch": 4117} {"train_loss": -7.006497383117676, "global_step": 172940, "epoch": 4117} {"train_loss": -7.113741874694824, "global_step": 172941, "epoch": 4117} {"train_loss": -6.955482482910156, "global_step": 172942, "epoch": 4117} {"train_loss": -7.058572769165039, "global_step": 172943, "epoch": 4117} {"train_loss": -7.121685981750488, "global_step": 172944, "epoch": 4117} {"train_loss": -6.976489543914795, "global_step": 172945, "epoch": 4117} {"train_loss": -7.044857978820801, "global_step": 172946, "epoch": 4117} {"train_loss": -7.094466686248779, "global_step": 172947, "epoch": 4117} {"train_loss": -7.123379707336426, "global_step": 172948, "epoch": 4117} {"train_loss": -7.018988132476807, "global_step": 172949, "epoch": 4117} {"train_loss": -7.129244804382324, "global_step": 172950, "epoch": 4117} {"train_loss": -7.069899559020996, "global_step": 172951, "epoch": 4117} {"train_loss": -6.925085067749023, "global_step": 172952, "epoch": 4117} {"train_loss": -6.916163444519043, "global_step": 172953, "epoch": 4117} {"train_loss": -7.115542888641357, "global_step": 172954, "epoch": 4117} {"train_loss": -7.018484615144276, "global_step": 172955, "epoch": 4117, "val_loss": 68477.0390625} {"train_loss": -6.894864559173584, "global_step": 172956, "epoch": 4118} {"train_loss": -6.939846992492676, "global_step": 172957, "epoch": 4118} {"train_loss": -7.017470359802246, "global_step": 172958, "epoch": 4118} {"train_loss": -6.936232566833496, "global_step": 172959, "epoch": 4118} {"train_loss": -7.005680561065674, "global_step": 172960, "epoch": 4118} {"train_loss": -6.869684219360352, "global_step": 172961, "epoch": 4118} {"train_loss": -7.044678688049316, "global_step": 172962, "epoch": 4118} {"train_loss": -6.873295307159424, "global_step": 172963, "epoch": 4118} {"train_loss": -6.9844183921813965, "global_step": 172964, "epoch": 4118} {"train_loss": -6.898466110229492, "global_step": 172965, "epoch": 4118} {"train_loss": -6.933097839355469, "global_step": 172966, "epoch": 4118} {"train_loss": -7.048982620239258, "global_step": 172967, "epoch": 4118} {"train_loss": -6.891717910766602, "global_step": 172968, "epoch": 4118} {"train_loss": -7.06883430480957, "global_step": 172969, "epoch": 4118} {"train_loss": -6.904970169067383, "global_step": 172970, "epoch": 4118} {"train_loss": -6.954994201660156, "global_step": 172971, "epoch": 4118} {"train_loss": -7.033628463745117, "global_step": 172972, "epoch": 4118} {"train_loss": -7.024188995361328, "global_step": 172973, "epoch": 4118} {"train_loss": -6.910586357116699, "global_step": 172974, "epoch": 4118} {"train_loss": -7.085741996765137, "global_step": 172975, "epoch": 4118} {"train_loss": -7.077464580535889, "global_step": 172976, "epoch": 4118} {"train_loss": -6.972868919372559, "global_step": 172977, "epoch": 4118} {"train_loss": -7.005851745605469, "global_step": 172978, "epoch": 4118} {"train_loss": -7.1335129737854, "global_step": 172979, "epoch": 4118} {"train_loss": -6.9953107833862305, "global_step": 172980, "epoch": 4118} {"train_loss": -6.918817520141602, "global_step": 172981, "epoch": 4118} {"train_loss": -7.011706829071045, "global_step": 172982, "epoch": 4118} {"train_loss": -7.085561752319336, "global_step": 172983, "epoch": 4118} {"train_loss": -6.954835891723633, "global_step": 172984, "epoch": 4118} {"train_loss": -6.915742874145508, "global_step": 172985, "epoch": 4118} {"train_loss": -6.998039245605469, "global_step": 172986, "epoch": 4118} {"train_loss": -7.096404075622559, "global_step": 172987, "epoch": 4118} {"train_loss": -6.878118515014648, "global_step": 172988, "epoch": 4118} {"train_loss": -6.967067718505859, "global_step": 172989, "epoch": 4118} {"train_loss": -7.026253700256348, "global_step": 172990, "epoch": 4118} {"train_loss": -7.016182899475098, "global_step": 172991, "epoch": 4118} {"train_loss": -6.920483589172363, "global_step": 172992, "epoch": 4118} {"train_loss": -6.874930381774902, "global_step": 172993, "epoch": 4118} {"train_loss": -7.0151872634887695, "global_step": 172994, "epoch": 4118} {"train_loss": -7.014456748962402, "global_step": 172995, "epoch": 4118} {"train_loss": -6.989394664764404, "global_step": 172996, "epoch": 4118} {"train_loss": -6.98225542477199, "global_step": 172997, "epoch": 4118, "val_loss": 68375.140625} {"train_loss": -7.084869861602783, "global_step": 172998, "epoch": 4119} {"train_loss": -7.047472953796387, "global_step": 172999, "epoch": 4119} {"train_loss": -7.084469795227051, "global_step": 173000, "epoch": 4119} {"train_loss": -7.11884069442749, "global_step": 173001, "epoch": 4119} {"train_loss": -7.095949172973633, "global_step": 173002, "epoch": 4119} {"train_loss": -7.114532470703125, "global_step": 173003, "epoch": 4119} {"train_loss": -7.105862617492676, "global_step": 173004, "epoch": 4119} {"train_loss": -7.116750717163086, "global_step": 173005, "epoch": 4119} {"train_loss": -6.968340873718262, "global_step": 173006, "epoch": 4119} {"train_loss": -6.9897613525390625, "global_step": 173007, "epoch": 4119} {"train_loss": -7.0012922286987305, "global_step": 173008, "epoch": 4119} {"train_loss": -6.985803127288818, "global_step": 173009, "epoch": 4119} {"train_loss": -6.968194961547852, "global_step": 173010, "epoch": 4119} {"train_loss": -7.068078517913818, "global_step": 173011, "epoch": 4119} {"train_loss": -6.953704833984375, "global_step": 173012, "epoch": 4119} {"train_loss": -7.1166229248046875, "global_step": 173013, "epoch": 4119} {"train_loss": -6.992345809936523, "global_step": 173014, "epoch": 4119} {"train_loss": -6.840517044067383, "global_step": 173015, "epoch": 4119} {"train_loss": -7.01043701171875, "global_step": 173016, "epoch": 4119} {"train_loss": -6.899628639221191, "global_step": 173017, "epoch": 4119} {"train_loss": -6.841961860656738, "global_step": 173018, "epoch": 4119} {"train_loss": -7.029146194458008, "global_step": 173019, "epoch": 4119} {"train_loss": -6.914346218109131, "global_step": 173020, "epoch": 4119} {"train_loss": -7.057456016540527, "global_step": 173021, "epoch": 4119} {"train_loss": -7.043251037597656, "global_step": 173022, "epoch": 4119} {"train_loss": -6.964746475219727, "global_step": 173023, "epoch": 4119} {"train_loss": -7.058831214904785, "global_step": 173024, "epoch": 4119} {"train_loss": -6.915836334228516, "global_step": 173025, "epoch": 4119} {"train_loss": -6.959445953369141, "global_step": 173026, "epoch": 4119} {"train_loss": -7.022303581237793, "global_step": 173027, "epoch": 4119} {"train_loss": -6.917707443237305, "global_step": 173028, "epoch": 4119} {"train_loss": -6.960102081298828, "global_step": 173029, "epoch": 4119} {"train_loss": -7.025673866271973, "global_step": 173030, "epoch": 4119} {"train_loss": -6.948768615722656, "global_step": 173031, "epoch": 4119} {"train_loss": -6.941098690032959, "global_step": 173032, "epoch": 4119} {"train_loss": -6.971201419830322, "global_step": 173033, "epoch": 4119} {"train_loss": -6.834661483764648, "global_step": 173034, "epoch": 4119} {"train_loss": -7.107815265655518, "global_step": 173035, "epoch": 4119} {"train_loss": -7.065653324127197, "global_step": 173036, "epoch": 4119} {"train_loss": -6.9485979080200195, "global_step": 173037, "epoch": 4119} {"train_loss": -7.006211280822754, "global_step": 173038, "epoch": 4119} {"train_loss": -7.002012184688023, "global_step": 173039, "epoch": 4119, "val_loss": 68604.4453125} {"train_loss": -6.9263386726379395, "global_step": 173040, "epoch": 4120} {"train_loss": -6.994696140289307, "global_step": 173041, "epoch": 4120} {"train_loss": -6.943935394287109, "global_step": 173042, "epoch": 4120} {"train_loss": -6.999527931213379, "global_step": 173043, "epoch": 4120} {"train_loss": -6.967317581176758, "global_step": 173044, "epoch": 4120} {"train_loss": -7.046413421630859, "global_step": 173045, "epoch": 4120} {"train_loss": -6.904528617858887, "global_step": 173046, "epoch": 4120} {"train_loss": -6.907188892364502, "global_step": 173047, "epoch": 4120} {"train_loss": -6.943910121917725, "global_step": 173048, "epoch": 4120} {"train_loss": -7.024439334869385, "global_step": 173049, "epoch": 4120} {"train_loss": -6.920832633972168, "global_step": 173050, "epoch": 4120} {"train_loss": -6.925174713134766, "global_step": 173051, "epoch": 4120} {"train_loss": -6.885554313659668, "global_step": 173052, "epoch": 4120} {"train_loss": -6.91373348236084, "global_step": 173053, "epoch": 4120} {"train_loss": -7.040083885192871, "global_step": 173054, "epoch": 4120} {"train_loss": -6.800755500793457, "global_step": 173055, "epoch": 4120} {"train_loss": -7.082803249359131, "global_step": 173056, "epoch": 4120} {"train_loss": -7.065931797027588, "global_step": 173057, "epoch": 4120} {"train_loss": -6.907395362854004, "global_step": 173058, "epoch": 4120} {"train_loss": -7.004010200500488, "global_step": 173059, "epoch": 4120} {"train_loss": -6.809737205505371, "global_step": 173060, "epoch": 4120} {"train_loss": -7.000128746032715, "global_step": 173061, "epoch": 4120} {"train_loss": -6.961190700531006, "global_step": 173062, "epoch": 4120} {"train_loss": -6.958433151245117, "global_step": 173063, "epoch": 4120} {"train_loss": -6.993232250213623, "global_step": 173064, "epoch": 4120} {"train_loss": -6.998709678649902, "global_step": 173065, "epoch": 4120} {"train_loss": -7.052659034729004, "global_step": 173066, "epoch": 4120} {"train_loss": -6.925806999206543, "global_step": 173067, "epoch": 4120} {"train_loss": -6.949263572692871, "global_step": 173068, "epoch": 4120} {"train_loss": -7.057401657104492, "global_step": 173069, "epoch": 4120} {"train_loss": -7.0330047607421875, "global_step": 173070, "epoch": 4120} {"train_loss": -6.965842247009277, "global_step": 173071, "epoch": 4120} {"train_loss": -6.964293003082275, "global_step": 173072, "epoch": 4120} {"train_loss": -6.910314559936523, "global_step": 173073, "epoch": 4120} {"train_loss": -6.985823631286621, "global_step": 173074, "epoch": 4120} {"train_loss": -6.996304988861084, "global_step": 173075, "epoch": 4120} {"train_loss": -6.9241485595703125, "global_step": 173076, "epoch": 4120} {"train_loss": -7.037611961364746, "global_step": 173077, "epoch": 4120} {"train_loss": -7.004883766174316, "global_step": 173078, "epoch": 4120} {"train_loss": -7.0970892906188965, "global_step": 173079, "epoch": 4120} {"train_loss": -7.000204086303711, "global_step": 173080, "epoch": 4120} {"train_loss": -6.973259959902082, "global_step": 173081, "epoch": 4120, "val_loss": 68449.515625} {"train_loss": -7.011487007141113, "global_step": 173082, "epoch": 4121} {"train_loss": -7.085766792297363, "global_step": 173083, "epoch": 4121} {"train_loss": -6.819997787475586, "global_step": 173084, "epoch": 4121} {"train_loss": -7.01415491104126, "global_step": 173085, "epoch": 4121} {"train_loss": -7.005563735961914, "global_step": 173086, "epoch": 4121} {"train_loss": -7.009859085083008, "global_step": 173087, "epoch": 4121} {"train_loss": -7.009442329406738, "global_step": 173088, "epoch": 4121} {"train_loss": -7.0656232833862305, "global_step": 173089, "epoch": 4121} {"train_loss": -7.011617660522461, "global_step": 173090, "epoch": 4121} {"train_loss": -7.020485877990723, "global_step": 173091, "epoch": 4121} {"train_loss": -7.032015800476074, "global_step": 173092, "epoch": 4121} {"train_loss": -6.963210582733154, "global_step": 173093, "epoch": 4121} {"train_loss": -6.939436912536621, "global_step": 173094, "epoch": 4121} {"train_loss": -7.091856956481934, "global_step": 173095, "epoch": 4121} {"train_loss": -7.091045379638672, "global_step": 173096, "epoch": 4121} {"train_loss": -6.915311336517334, "global_step": 173097, "epoch": 4121} {"train_loss": -7.051487922668457, "global_step": 173098, "epoch": 4121} {"train_loss": -7.119925498962402, "global_step": 173099, "epoch": 4121} {"train_loss": -6.969457626342773, "global_step": 173100, "epoch": 4121} {"train_loss": -7.05938720703125, "global_step": 173101, "epoch": 4121} {"train_loss": -7.078850746154785, "global_step": 173102, "epoch": 4121} {"train_loss": -7.206613063812256, "global_step": 173103, "epoch": 4121} {"train_loss": -7.062132835388184, "global_step": 173104, "epoch": 4121} {"train_loss": -7.071162223815918, "global_step": 173105, "epoch": 4121} {"train_loss": -7.077428817749023, "global_step": 173106, "epoch": 4121} {"train_loss": -7.00309419631958, "global_step": 173107, "epoch": 4121} {"train_loss": -7.044062614440918, "global_step": 173108, "epoch": 4121} {"train_loss": -6.910683631896973, "global_step": 173109, "epoch": 4121} {"train_loss": -7.010592460632324, "global_step": 173110, "epoch": 4121} {"train_loss": -7.069416046142578, "global_step": 173111, "epoch": 4121} {"train_loss": -6.958281517028809, "global_step": 173112, "epoch": 4121} {"train_loss": -6.987941741943359, "global_step": 173113, "epoch": 4121} {"train_loss": -7.042341232299805, "global_step": 173114, "epoch": 4121} {"train_loss": -6.936563014984131, "global_step": 173115, "epoch": 4121} {"train_loss": -7.026006698608398, "global_step": 173116, "epoch": 4121} {"train_loss": -7.137431621551514, "global_step": 173117, "epoch": 4121} {"train_loss": -7.001420497894287, "global_step": 173118, "epoch": 4121} {"train_loss": -7.012503147125244, "global_step": 173119, "epoch": 4121} {"train_loss": -7.056485176086426, "global_step": 173120, "epoch": 4121} {"train_loss": -7.00508451461792, "global_step": 173121, "epoch": 4121} {"train_loss": -6.993404865264893, "global_step": 173122, "epoch": 4121} {"train_loss": -7.025654747372582, "global_step": 173123, "epoch": 4121, "val_loss": 68544.734375} {"train_loss": -7.092494487762451, "global_step": 173124, "epoch": 4122} {"train_loss": -7.092871189117432, "global_step": 173125, "epoch": 4122} {"train_loss": -7.013710975646973, "global_step": 173126, "epoch": 4122} {"train_loss": -7.0707011222839355, "global_step": 173127, "epoch": 4122} {"train_loss": -7.0107927322387695, "global_step": 173128, "epoch": 4122} {"train_loss": -7.17762565612793, "global_step": 173129, "epoch": 4122} {"train_loss": -7.037158012390137, "global_step": 173130, "epoch": 4122} {"train_loss": -7.114306449890137, "global_step": 173131, "epoch": 4122} {"train_loss": -7.044710159301758, "global_step": 173132, "epoch": 4122} {"train_loss": -7.135236740112305, "global_step": 173133, "epoch": 4122} {"train_loss": -7.031589984893799, "global_step": 173134, "epoch": 4122} {"train_loss": -7.016944885253906, "global_step": 173135, "epoch": 4122} {"train_loss": -7.140063285827637, "global_step": 173136, "epoch": 4122} {"train_loss": -7.112112522125244, "global_step": 173137, "epoch": 4122} {"train_loss": -7.114683151245117, "global_step": 173138, "epoch": 4122} {"train_loss": -7.111011028289795, "global_step": 173139, "epoch": 4122} {"train_loss": -7.056698799133301, "global_step": 173140, "epoch": 4122} {"train_loss": -7.03563928604126, "global_step": 173141, "epoch": 4122} {"train_loss": -7.077548027038574, "global_step": 173142, "epoch": 4122} {"train_loss": -7.109516143798828, "global_step": 173143, "epoch": 4122} {"train_loss": -6.937073707580566, "global_step": 173144, "epoch": 4122} {"train_loss": -7.012205123901367, "global_step": 173145, "epoch": 4122} {"train_loss": -7.120654106140137, "global_step": 173146, "epoch": 4122} {"train_loss": -7.106664657592773, "global_step": 173147, "epoch": 4122} {"train_loss": -7.0646562576293945, "global_step": 173148, "epoch": 4122} {"train_loss": -6.950094223022461, "global_step": 173149, "epoch": 4122} {"train_loss": -7.0958757400512695, "global_step": 173150, "epoch": 4122} {"train_loss": -7.08625602722168, "global_step": 173151, "epoch": 4122} {"train_loss": -7.025112152099609, "global_step": 173152, "epoch": 4122} {"train_loss": -7.145110607147217, "global_step": 173153, "epoch": 4122} {"train_loss": -6.975562572479248, "global_step": 173154, "epoch": 4122} {"train_loss": -7.117510795593262, "global_step": 173155, "epoch": 4122} {"train_loss": -7.042710304260254, "global_step": 173156, "epoch": 4122} {"train_loss": -6.915022850036621, "global_step": 173157, "epoch": 4122} {"train_loss": -7.060635566711426, "global_step": 173158, "epoch": 4122} {"train_loss": -7.042852401733398, "global_step": 173159, "epoch": 4122} {"train_loss": -6.984947204589844, "global_step": 173160, "epoch": 4122} {"train_loss": -6.994316101074219, "global_step": 173161, "epoch": 4122} {"train_loss": -6.994617462158203, "global_step": 173162, "epoch": 4122} {"train_loss": -7.0487799644470215, "global_step": 173163, "epoch": 4122} {"train_loss": -6.944539546966553, "global_step": 173164, "epoch": 4122} {"train_loss": -7.054659241721744, "global_step": 173165, "epoch": 4122, "val_loss": 68645.6796875} {"train_loss": -7.036181449890137, "global_step": 173166, "epoch": 4123} {"train_loss": -7.137362003326416, "global_step": 173167, "epoch": 4123} {"train_loss": -6.950050354003906, "global_step": 173168, "epoch": 4123} {"train_loss": -7.037964820861816, "global_step": 173169, "epoch": 4123} {"train_loss": -6.957337379455566, "global_step": 173170, "epoch": 4123} {"train_loss": -7.033871173858643, "global_step": 173171, "epoch": 4123} {"train_loss": -7.130836486816406, "global_step": 173172, "epoch": 4123} {"train_loss": -6.885574817657471, "global_step": 173173, "epoch": 4123} {"train_loss": -7.02012825012207, "global_step": 173174, "epoch": 4123} {"train_loss": -6.865203857421875, "global_step": 173175, "epoch": 4123} {"train_loss": -6.948655605316162, "global_step": 173176, "epoch": 4123} {"train_loss": -7.031650543212891, "global_step": 173177, "epoch": 4123} {"train_loss": -7.019065856933594, "global_step": 173178, "epoch": 4123} {"train_loss": -7.043344020843506, "global_step": 173179, "epoch": 4123} {"train_loss": -6.875345230102539, "global_step": 173180, "epoch": 4123} {"train_loss": -7.040076732635498, "global_step": 173181, "epoch": 4123} {"train_loss": -6.984752655029297, "global_step": 173182, "epoch": 4123} {"train_loss": -6.963893890380859, "global_step": 173183, "epoch": 4123} {"train_loss": -7.008314609527588, "global_step": 173184, "epoch": 4123} {"train_loss": -6.976789951324463, "global_step": 173185, "epoch": 4123} {"train_loss": -7.0720906257629395, "global_step": 173186, "epoch": 4123} {"train_loss": -6.986233711242676, "global_step": 173187, "epoch": 4123} {"train_loss": -6.947092056274414, "global_step": 173188, "epoch": 4123} {"train_loss": -6.9250640869140625, "global_step": 173189, "epoch": 4123} {"train_loss": -6.993537902832031, "global_step": 173190, "epoch": 4123} {"train_loss": -6.907271385192871, "global_step": 173191, "epoch": 4123} {"train_loss": -6.831878185272217, "global_step": 173192, "epoch": 4123} {"train_loss": -6.988527297973633, "global_step": 173193, "epoch": 4123} {"train_loss": -7.091143608093262, "global_step": 173194, "epoch": 4123} {"train_loss": -7.065159797668457, "global_step": 173195, "epoch": 4123} {"train_loss": -6.911620140075684, "global_step": 173196, "epoch": 4123} {"train_loss": -6.9962873458862305, "global_step": 173197, "epoch": 4123} {"train_loss": -7.002778053283691, "global_step": 173198, "epoch": 4123} {"train_loss": -6.992698669433594, "global_step": 173199, "epoch": 4123} {"train_loss": -7.013739109039307, "global_step": 173200, "epoch": 4123} {"train_loss": -7.033997535705566, "global_step": 173201, "epoch": 4123} {"train_loss": -7.014700889587402, "global_step": 173202, "epoch": 4123} {"train_loss": -7.06781005859375, "global_step": 173203, "epoch": 4123} {"train_loss": -7.10295295715332, "global_step": 173204, "epoch": 4123} {"train_loss": -7.053894519805908, "global_step": 173205, "epoch": 4123} {"train_loss": -7.101922035217285, "global_step": 173206, "epoch": 4123} {"train_loss": -7.000473885309129, "global_step": 173207, "epoch": 4123, "val_loss": 68465.0234375} {"train_loss": -7.043990135192871, "global_step": 173208, "epoch": 4124} {"train_loss": -7.046133995056152, "global_step": 173209, "epoch": 4124} {"train_loss": -7.025609493255615, "global_step": 173210, "epoch": 4124} {"train_loss": -6.967719554901123, "global_step": 173211, "epoch": 4124} {"train_loss": -7.103416442871094, "global_step": 173212, "epoch": 4124} {"train_loss": -6.947146415710449, "global_step": 173213, "epoch": 4124} {"train_loss": -7.07299280166626, "global_step": 173214, "epoch": 4124} {"train_loss": -7.120194435119629, "global_step": 173215, "epoch": 4124} {"train_loss": -6.952406883239746, "global_step": 173216, "epoch": 4124} {"train_loss": -7.076350688934326, "global_step": 173217, "epoch": 4124} {"train_loss": -6.946286678314209, "global_step": 173218, "epoch": 4124} {"train_loss": -6.965663909912109, "global_step": 173219, "epoch": 4124} {"train_loss": -6.895990371704102, "global_step": 173220, "epoch": 4124} {"train_loss": -6.98166561126709, "global_step": 173221, "epoch": 4124} {"train_loss": -6.954345703125, "global_step": 173222, "epoch": 4124} {"train_loss": -6.982422351837158, "global_step": 173223, "epoch": 4124} {"train_loss": -6.875998497009277, "global_step": 173224, "epoch": 4124} {"train_loss": -7.004728317260742, "global_step": 173225, "epoch": 4124} {"train_loss": -7.063957691192627, "global_step": 173226, "epoch": 4124} {"train_loss": -7.086921691894531, "global_step": 173227, "epoch": 4124} {"train_loss": -7.038933753967285, "global_step": 173228, "epoch": 4124} {"train_loss": -7.144983291625977, "global_step": 173229, "epoch": 4124} {"train_loss": -6.96237850189209, "global_step": 173230, "epoch": 4124} {"train_loss": -6.983151435852051, "global_step": 173231, "epoch": 4124} {"train_loss": -6.987537384033203, "global_step": 173232, "epoch": 4124} {"train_loss": -7.062048435211182, "global_step": 173233, "epoch": 4124} {"train_loss": -6.946266174316406, "global_step": 173234, "epoch": 4124} {"train_loss": -6.913463115692139, "global_step": 173235, "epoch": 4124} {"train_loss": -7.165356636047363, "global_step": 173236, "epoch": 4124} {"train_loss": -7.0239033699035645, "global_step": 173237, "epoch": 4124} {"train_loss": -7.047745704650879, "global_step": 173238, "epoch": 4124} {"train_loss": -7.031951427459717, "global_step": 173239, "epoch": 4124} {"train_loss": -6.989953994750977, "global_step": 173240, "epoch": 4124} {"train_loss": -7.136454105377197, "global_step": 173241, "epoch": 4124} {"train_loss": -7.038552284240723, "global_step": 173242, "epoch": 4124} {"train_loss": -7.025507926940918, "global_step": 173243, "epoch": 4124} {"train_loss": -7.119372367858887, "global_step": 173244, "epoch": 4124} {"train_loss": -7.035784721374512, "global_step": 173245, "epoch": 4124} {"train_loss": -7.030426979064941, "global_step": 173246, "epoch": 4124} {"train_loss": -7.0366291999816895, "global_step": 173247, "epoch": 4124} {"train_loss": -6.9146904945373535, "global_step": 173248, "epoch": 4124} {"train_loss": -7.018505209968204, "global_step": 173249, "epoch": 4124, "val_loss": 68605.6640625} {"train_loss": -7.037642478942871, "global_step": 173250, "epoch": 4125} {"train_loss": -7.023708343505859, "global_step": 173251, "epoch": 4125} {"train_loss": -7.150631904602051, "global_step": 173252, "epoch": 4125} {"train_loss": -7.051093101501465, "global_step": 173253, "epoch": 4125} {"train_loss": -7.047964096069336, "global_step": 173254, "epoch": 4125} {"train_loss": -7.091734409332275, "global_step": 173255, "epoch": 4125} {"train_loss": -7.037240982055664, "global_step": 173256, "epoch": 4125} {"train_loss": -7.073764801025391, "global_step": 173257, "epoch": 4125} {"train_loss": -7.062060356140137, "global_step": 173258, "epoch": 4125} {"train_loss": -6.962900161743164, "global_step": 173259, "epoch": 4125} {"train_loss": -6.971487998962402, "global_step": 173260, "epoch": 4125} {"train_loss": -7.001526355743408, "global_step": 173261, "epoch": 4125} {"train_loss": -7.011682510375977, "global_step": 173262, "epoch": 4125} {"train_loss": -7.050684928894043, "global_step": 173263, "epoch": 4125} {"train_loss": -7.120348930358887, "global_step": 173264, "epoch": 4125} {"train_loss": -7.040426254272461, "global_step": 173265, "epoch": 4125} {"train_loss": -7.0784125328063965, "global_step": 173266, "epoch": 4125} {"train_loss": -7.098832607269287, "global_step": 173267, "epoch": 4125} {"train_loss": -7.085456848144531, "global_step": 173268, "epoch": 4125} {"train_loss": -7.005566596984863, "global_step": 173269, "epoch": 4125} {"train_loss": -6.97735595703125, "global_step": 173270, "epoch": 4125} {"train_loss": -7.134705543518066, "global_step": 173271, "epoch": 4125} {"train_loss": -7.022943019866943, "global_step": 173272, "epoch": 4125} {"train_loss": -7.011185646057129, "global_step": 173273, "epoch": 4125} {"train_loss": -7.154104232788086, "global_step": 173274, "epoch": 4125} {"train_loss": -7.033164024353027, "global_step": 173275, "epoch": 4125} {"train_loss": -7.084874629974365, "global_step": 173276, "epoch": 4125} {"train_loss": -7.067502498626709, "global_step": 173277, "epoch": 4125} {"train_loss": -7.065127372741699, "global_step": 173278, "epoch": 4125} {"train_loss": -6.995656490325928, "global_step": 173279, "epoch": 4125} {"train_loss": -6.8719587326049805, "global_step": 173280, "epoch": 4125} {"train_loss": -7.0033087730407715, "global_step": 173281, "epoch": 4125} {"train_loss": -6.818429946899414, "global_step": 173282, "epoch": 4125} {"train_loss": -6.899727821350098, "global_step": 173283, "epoch": 4125} {"train_loss": -6.9414448738098145, "global_step": 173284, "epoch": 4125} {"train_loss": -6.7983927726745605, "global_step": 173285, "epoch": 4125} {"train_loss": -6.995290756225586, "global_step": 173286, "epoch": 4125} {"train_loss": -6.924867630004883, "global_step": 173287, "epoch": 4125} {"train_loss": -6.937705993652344, "global_step": 173288, "epoch": 4125} {"train_loss": -6.849118232727051, "global_step": 173289, "epoch": 4125} {"train_loss": -6.985865592956543, "global_step": 173290, "epoch": 4125} {"train_loss": -7.010875679197765, "global_step": 173291, "epoch": 4125, "val_loss": 68518.6015625} {"train_loss": -6.872805595397949, "global_step": 173292, "epoch": 4126} {"train_loss": -7.06749153137207, "global_step": 173293, "epoch": 4126} {"train_loss": -7.032073020935059, "global_step": 173294, "epoch": 4126} {"train_loss": -6.9360833168029785, "global_step": 173295, "epoch": 4126} {"train_loss": -6.9935407638549805, "global_step": 173296, "epoch": 4126} {"train_loss": -6.982855796813965, "global_step": 173297, "epoch": 4126} {"train_loss": -7.060006141662598, "global_step": 173298, "epoch": 4126} {"train_loss": -6.9459943771362305, "global_step": 173299, "epoch": 4126} {"train_loss": -7.043545722961426, "global_step": 173300, "epoch": 4126} {"train_loss": -7.078910827636719, "global_step": 173301, "epoch": 4126} {"train_loss": -6.976325035095215, "global_step": 173302, "epoch": 4126} {"train_loss": -6.891674995422363, "global_step": 173303, "epoch": 4126} {"train_loss": -7.031026840209961, "global_step": 173304, "epoch": 4126} {"train_loss": -7.046968460083008, "global_step": 173305, "epoch": 4126} {"train_loss": -6.945488929748535, "global_step": 173306, "epoch": 4126} {"train_loss": -6.9602837562561035, "global_step": 173307, "epoch": 4126} {"train_loss": -6.99283504486084, "global_step": 173308, "epoch": 4126} {"train_loss": -7.002761363983154, "global_step": 173309, "epoch": 4126} {"train_loss": -7.105107307434082, "global_step": 173310, "epoch": 4126} {"train_loss": -6.979536533355713, "global_step": 173311, "epoch": 4126} {"train_loss": -7.004530906677246, "global_step": 173312, "epoch": 4126} {"train_loss": -7.030545234680176, "global_step": 173313, "epoch": 4126} {"train_loss": -7.056146621704102, "global_step": 173314, "epoch": 4126} {"train_loss": -7.046706199645996, "global_step": 173315, "epoch": 4126} {"train_loss": -6.958698272705078, "global_step": 173316, "epoch": 4126} {"train_loss": -7.093968391418457, "global_step": 173317, "epoch": 4126} {"train_loss": -6.964920520782471, "global_step": 173318, "epoch": 4126} {"train_loss": -6.98328971862793, "global_step": 173319, "epoch": 4126} {"train_loss": -6.949592113494873, "global_step": 173320, "epoch": 4126} {"train_loss": -6.961925506591797, "global_step": 173321, "epoch": 4126} {"train_loss": -7.011214256286621, "global_step": 173322, "epoch": 4126} {"train_loss": -6.957004070281982, "global_step": 173323, "epoch": 4126} {"train_loss": -6.958914756774902, "global_step": 173324, "epoch": 4126} {"train_loss": -6.989442825317383, "global_step": 173325, "epoch": 4126} {"train_loss": -6.9982147216796875, "global_step": 173326, "epoch": 4126} {"train_loss": -7.016060829162598, "global_step": 173327, "epoch": 4126} {"train_loss": -7.04910945892334, "global_step": 173328, "epoch": 4126} {"train_loss": -7.040624618530273, "global_step": 173329, "epoch": 4126} {"train_loss": -7.0269622802734375, "global_step": 173330, "epoch": 4126} {"train_loss": -6.936863422393799, "global_step": 173331, "epoch": 4126} {"train_loss": -7.066710472106934, "global_step": 173332, "epoch": 4126} {"train_loss": -6.9989006859915595, "global_step": 173333, "epoch": 4126, "val_loss": 68721.484375} {"train_loss": -6.995681285858154, "global_step": 173334, "epoch": 4127} {"train_loss": -6.964460849761963, "global_step": 173335, "epoch": 4127} {"train_loss": -7.043985843658447, "global_step": 173336, "epoch": 4127} {"train_loss": -7.025607109069824, "global_step": 173337, "epoch": 4127} {"train_loss": -6.996249675750732, "global_step": 173338, "epoch": 4127} {"train_loss": -6.950167179107666, "global_step": 173339, "epoch": 4127} {"train_loss": -7.037863254547119, "global_step": 173340, "epoch": 4127} {"train_loss": -6.995528697967529, "global_step": 173341, "epoch": 4127} {"train_loss": -6.870236396789551, "global_step": 173342, "epoch": 4127} {"train_loss": -6.9368085861206055, "global_step": 173343, "epoch": 4127} {"train_loss": -7.033487319946289, "global_step": 173344, "epoch": 4127} {"train_loss": -6.873350143432617, "global_step": 173345, "epoch": 4127} {"train_loss": -6.884504318237305, "global_step": 173346, "epoch": 4127} {"train_loss": -6.94171142578125, "global_step": 173347, "epoch": 4127} {"train_loss": -7.041132926940918, "global_step": 173348, "epoch": 4127} {"train_loss": -6.816171169281006, "global_step": 173349, "epoch": 4127} {"train_loss": -6.930501461029053, "global_step": 173350, "epoch": 4127} {"train_loss": -7.097366809844971, "global_step": 173351, "epoch": 4127} {"train_loss": -6.8918046951293945, "global_step": 173352, "epoch": 4127} {"train_loss": -6.930652618408203, "global_step": 173353, "epoch": 4127} {"train_loss": -7.02803373336792, "global_step": 173354, "epoch": 4127} {"train_loss": -6.965536594390869, "global_step": 173355, "epoch": 4127} {"train_loss": -6.913763999938965, "global_step": 173356, "epoch": 4127} {"train_loss": -7.016959190368652, "global_step": 173357, "epoch": 4127} {"train_loss": -6.857867240905762, "global_step": 173358, "epoch": 4127} {"train_loss": -6.942678928375244, "global_step": 173359, "epoch": 4127} {"train_loss": -6.997217178344727, "global_step": 173360, "epoch": 4127} {"train_loss": -6.903750419616699, "global_step": 173361, "epoch": 4127} {"train_loss": -6.939692497253418, "global_step": 173362, "epoch": 4127} {"train_loss": -6.963268280029297, "global_step": 173363, "epoch": 4127} {"train_loss": -7.034216403961182, "global_step": 173364, "epoch": 4127} {"train_loss": -7.078799724578857, "global_step": 173365, "epoch": 4127} {"train_loss": -6.929720878601074, "global_step": 173366, "epoch": 4127} {"train_loss": -6.9158854484558105, "global_step": 173367, "epoch": 4127} {"train_loss": -6.996131896972656, "global_step": 173368, "epoch": 4127} {"train_loss": -6.946218490600586, "global_step": 173369, "epoch": 4127} {"train_loss": -7.072176933288574, "global_step": 173370, "epoch": 4127} {"train_loss": -6.842329978942871, "global_step": 173371, "epoch": 4127} {"train_loss": -7.090517997741699, "global_step": 173372, "epoch": 4127} {"train_loss": -6.930484294891357, "global_step": 173373, "epoch": 4127} {"train_loss": -6.926029682159424, "global_step": 173374, "epoch": 4127} {"train_loss": -6.963571389516194, "global_step": 173375, "epoch": 4127, "val_loss": 68599.28125} {"train_loss": -6.9405436515808105, "global_step": 173376, "epoch": 4128} {"train_loss": -7.053327560424805, "global_step": 173377, "epoch": 4128} {"train_loss": -6.9907755851745605, "global_step": 173378, "epoch": 4128} {"train_loss": -6.989773273468018, "global_step": 173379, "epoch": 4128} {"train_loss": -6.9143967628479, "global_step": 173380, "epoch": 4128} {"train_loss": -6.804174900054932, "global_step": 173381, "epoch": 4128} {"train_loss": -6.969780445098877, "global_step": 173382, "epoch": 4128} {"train_loss": -6.910905361175537, "global_step": 173383, "epoch": 4128} {"train_loss": -6.8646697998046875, "global_step": 173384, "epoch": 4128} {"train_loss": -6.949435234069824, "global_step": 173385, "epoch": 4128} {"train_loss": -7.070280075073242, "global_step": 173386, "epoch": 4128} {"train_loss": -7.003405570983887, "global_step": 173387, "epoch": 4128} {"train_loss": -7.002714157104492, "global_step": 173388, "epoch": 4128} {"train_loss": -7.130538463592529, "global_step": 173389, "epoch": 4128} {"train_loss": -7.143781661987305, "global_step": 173390, "epoch": 4128} {"train_loss": -7.070071220397949, "global_step": 173391, "epoch": 4128} {"train_loss": -6.9834699630737305, "global_step": 173392, "epoch": 4128} {"train_loss": -7.010570526123047, "global_step": 173393, "epoch": 4128} {"train_loss": -7.075311660766602, "global_step": 173394, "epoch": 4128} {"train_loss": -7.054376602172852, "global_step": 173395, "epoch": 4128} {"train_loss": -7.001995086669922, "global_step": 173396, "epoch": 4128} {"train_loss": -7.017871856689453, "global_step": 173397, "epoch": 4128} {"train_loss": -7.104361534118652, "global_step": 173398, "epoch": 4128} {"train_loss": -7.050915718078613, "global_step": 173399, "epoch": 4128} {"train_loss": -6.997705459594727, "global_step": 173400, "epoch": 4128} {"train_loss": -7.022324562072754, "global_step": 173401, "epoch": 4128} {"train_loss": -6.98214054107666, "global_step": 173402, "epoch": 4128} {"train_loss": -7.163474082946777, "global_step": 173403, "epoch": 4128} {"train_loss": -7.176987171173096, "global_step": 173404, "epoch": 4128} {"train_loss": -6.996171951293945, "global_step": 173405, "epoch": 4128} {"train_loss": -7.071269512176514, "global_step": 173406, "epoch": 4128} {"train_loss": -6.8944172859191895, "global_step": 173407, "epoch": 4128} {"train_loss": -7.026317596435547, "global_step": 173408, "epoch": 4128} {"train_loss": -7.126474857330322, "global_step": 173409, "epoch": 4128} {"train_loss": -7.066932678222656, "global_step": 173410, "epoch": 4128} {"train_loss": -7.073269844055176, "global_step": 173411, "epoch": 4128} {"train_loss": -6.978842735290527, "global_step": 173412, "epoch": 4128} {"train_loss": -7.0613813400268555, "global_step": 173413, "epoch": 4128} {"train_loss": -6.933130264282227, "global_step": 173414, "epoch": 4128} {"train_loss": -7.068846702575684, "global_step": 173415, "epoch": 4128} {"train_loss": -7.113467693328857, "global_step": 173416, "epoch": 4128} {"train_loss": -7.020747139340355, "global_step": 173417, "epoch": 4128, "val_loss": 68594.34375} {"train_loss": -7.085103988647461, "global_step": 173418, "epoch": 4129} {"train_loss": -7.078285217285156, "global_step": 173419, "epoch": 4129} {"train_loss": -6.915521144866943, "global_step": 173420, "epoch": 4129} {"train_loss": -7.091365337371826, "global_step": 173421, "epoch": 4129} {"train_loss": -7.084795951843262, "global_step": 173422, "epoch": 4129} {"train_loss": -6.987274646759033, "global_step": 173423, "epoch": 4129} {"train_loss": -7.021895885467529, "global_step": 173424, "epoch": 4129} {"train_loss": -7.092491149902344, "global_step": 173425, "epoch": 4129} {"train_loss": -6.99268913269043, "global_step": 173426, "epoch": 4129} {"train_loss": -7.042835712432861, "global_step": 173427, "epoch": 4129} {"train_loss": -7.039188385009766, "global_step": 173428, "epoch": 4129} {"train_loss": -7.075249671936035, "global_step": 173429, "epoch": 4129} {"train_loss": -7.059179782867432, "global_step": 173430, "epoch": 4129} {"train_loss": -6.9975385665893555, "global_step": 173431, "epoch": 4129} {"train_loss": -7.145599365234375, "global_step": 173432, "epoch": 4129} {"train_loss": -7.058086395263672, "global_step": 173433, "epoch": 4129} {"train_loss": -7.054111957550049, "global_step": 173434, "epoch": 4129} {"train_loss": -7.048272132873535, "global_step": 173435, "epoch": 4129} {"train_loss": -7.086705207824707, "global_step": 173436, "epoch": 4129} {"train_loss": -7.019000053405762, "global_step": 173437, "epoch": 4129} {"train_loss": -6.950436592102051, "global_step": 173438, "epoch": 4129} {"train_loss": -7.103119850158691, "global_step": 173439, "epoch": 4129} {"train_loss": -6.982427597045898, "global_step": 173440, "epoch": 4129} {"train_loss": -7.0858917236328125, "global_step": 173441, "epoch": 4129} {"train_loss": -7.107681751251221, "global_step": 173442, "epoch": 4129} {"train_loss": -7.108412742614746, "global_step": 173443, "epoch": 4129} {"train_loss": -7.111889362335205, "global_step": 173444, "epoch": 4129} {"train_loss": -7.0953755378723145, "global_step": 173445, "epoch": 4129} {"train_loss": -7.078264236450195, "global_step": 173446, "epoch": 4129} {"train_loss": -7.134279251098633, "global_step": 173447, "epoch": 4129} {"train_loss": -7.075621604919434, "global_step": 173448, "epoch": 4129} {"train_loss": -7.0680389404296875, "global_step": 173449, "epoch": 4129} {"train_loss": -7.049476623535156, "global_step": 173450, "epoch": 4129} {"train_loss": -7.06744384765625, "global_step": 173451, "epoch": 4129} {"train_loss": -7.09286642074585, "global_step": 173452, "epoch": 4129} {"train_loss": -7.120391845703125, "global_step": 173453, "epoch": 4129} {"train_loss": -7.060359954833984, "global_step": 173454, "epoch": 4129} {"train_loss": -7.048234939575195, "global_step": 173455, "epoch": 4129} {"train_loss": -7.02130126953125, "global_step": 173456, "epoch": 4129} {"train_loss": -7.043785095214844, "global_step": 173457, "epoch": 4129} {"train_loss": -7.077153205871582, "global_step": 173458, "epoch": 4129} {"train_loss": -7.0534148670378185, "global_step": 173459, "epoch": 4129, "val_loss": 68744.5} {"train_loss": -6.840003967285156, "global_step": 173460, "epoch": 4130} {"train_loss": -7.0513715744018555, "global_step": 173461, "epoch": 4130} {"train_loss": -6.999068260192871, "global_step": 173462, "epoch": 4130} {"train_loss": -7.000284194946289, "global_step": 173463, "epoch": 4130} {"train_loss": -7.030621528625488, "global_step": 173464, "epoch": 4130} {"train_loss": -7.056329727172852, "global_step": 173465, "epoch": 4130} {"train_loss": -7.067019462585449, "global_step": 173466, "epoch": 4130} {"train_loss": -7.057600021362305, "global_step": 173467, "epoch": 4130} {"train_loss": -6.95705509185791, "global_step": 173468, "epoch": 4130} {"train_loss": -7.033494472503662, "global_step": 173469, "epoch": 4130} {"train_loss": -6.993947982788086, "global_step": 173470, "epoch": 4130} {"train_loss": -7.022911071777344, "global_step": 173471, "epoch": 4130} {"train_loss": -7.043641567230225, "global_step": 173472, "epoch": 4130} {"train_loss": -7.074117183685303, "global_step": 173473, "epoch": 4130} {"train_loss": -6.976670265197754, "global_step": 173474, "epoch": 4130} {"train_loss": -7.0800251960754395, "global_step": 173475, "epoch": 4130} {"train_loss": -7.051247596740723, "global_step": 173476, "epoch": 4130} {"train_loss": -6.99156379699707, "global_step": 173477, "epoch": 4130} {"train_loss": -7.146093368530273, "global_step": 173478, "epoch": 4130} {"train_loss": -7.104726314544678, "global_step": 173479, "epoch": 4130} {"train_loss": -7.184870719909668, "global_step": 173480, "epoch": 4130} {"train_loss": -7.070683002471924, "global_step": 173481, "epoch": 4130} {"train_loss": -6.953807830810547, "global_step": 173482, "epoch": 4130} {"train_loss": -7.0192742347717285, "global_step": 173483, "epoch": 4130} {"train_loss": -7.095205307006836, "global_step": 173484, "epoch": 4130} {"train_loss": -7.008784770965576, "global_step": 173485, "epoch": 4130} {"train_loss": -6.921206474304199, "global_step": 173486, "epoch": 4130} {"train_loss": -6.942152500152588, "global_step": 173487, "epoch": 4130} {"train_loss": -7.002992630004883, "global_step": 173488, "epoch": 4130} {"train_loss": -6.973134517669678, "global_step": 173489, "epoch": 4130} {"train_loss": -6.9857282638549805, "global_step": 173490, "epoch": 4130} {"train_loss": -7.022844314575195, "global_step": 173491, "epoch": 4130} {"train_loss": -7.0820465087890625, "global_step": 173492, "epoch": 4130} {"train_loss": -6.97550106048584, "global_step": 173493, "epoch": 4130} {"train_loss": -6.965222358703613, "global_step": 173494, "epoch": 4130} {"train_loss": -7.025467395782471, "global_step": 173495, "epoch": 4130} {"train_loss": -7.065798759460449, "global_step": 173496, "epoch": 4130} {"train_loss": -6.912445068359375, "global_step": 173497, "epoch": 4130} {"train_loss": -7.024905204772949, "global_step": 173498, "epoch": 4130} {"train_loss": -6.989765644073486, "global_step": 173499, "epoch": 4130} {"train_loss": -6.897572994232178, "global_step": 173500, "epoch": 4130} {"train_loss": -7.015047572907948, "global_step": 173501, "epoch": 4130, "val_loss": 68762.515625} {"train_loss": -6.940719127655029, "global_step": 173502, "epoch": 4131} {"train_loss": -7.0256547927856445, "global_step": 173503, "epoch": 4131} {"train_loss": -6.903613090515137, "global_step": 173504, "epoch": 4131} {"train_loss": -6.9015045166015625, "global_step": 173505, "epoch": 4131} {"train_loss": -6.97880744934082, "global_step": 173506, "epoch": 4131} {"train_loss": -6.8971076011657715, "global_step": 173507, "epoch": 4131} {"train_loss": -6.851075172424316, "global_step": 173508, "epoch": 4131} {"train_loss": -6.865199089050293, "global_step": 173509, "epoch": 4131} {"train_loss": -6.816834449768066, "global_step": 173510, "epoch": 4131} {"train_loss": -7.051583290100098, "global_step": 173511, "epoch": 4131} {"train_loss": -6.800329208374023, "global_step": 173512, "epoch": 4131} {"train_loss": -7.004176139831543, "global_step": 173513, "epoch": 4131} {"train_loss": -6.8629255294799805, "global_step": 173514, "epoch": 4131} {"train_loss": -6.899482250213623, "global_step": 173515, "epoch": 4131} {"train_loss": -6.898747444152832, "global_step": 173516, "epoch": 4131} {"train_loss": -6.986977577209473, "global_step": 173517, "epoch": 4131} {"train_loss": -7.0065131187438965, "global_step": 173518, "epoch": 4131} {"train_loss": -6.967970848083496, "global_step": 173519, "epoch": 4131} {"train_loss": -6.908384323120117, "global_step": 173520, "epoch": 4131} {"train_loss": -6.975893497467041, "global_step": 173521, "epoch": 4131} {"train_loss": -6.994085311889648, "global_step": 173522, "epoch": 4131} {"train_loss": -7.011714935302734, "global_step": 173523, "epoch": 4131} {"train_loss": -6.951373100280762, "global_step": 173524, "epoch": 4131} {"train_loss": -6.935205936431885, "global_step": 173525, "epoch": 4131} {"train_loss": -6.985749244689941, "global_step": 173526, "epoch": 4131} {"train_loss": -6.9602155685424805, "global_step": 173527, "epoch": 4131} {"train_loss": -7.051922798156738, "global_step": 173528, "epoch": 4131} {"train_loss": -7.090495586395264, "global_step": 173529, "epoch": 4131} {"train_loss": -6.989262580871582, "global_step": 173530, "epoch": 4131} {"train_loss": -7.068214416503906, "global_step": 173531, "epoch": 4131} {"train_loss": -7.013383865356445, "global_step": 173532, "epoch": 4131} {"train_loss": -7.077415943145752, "global_step": 173533, "epoch": 4131} {"train_loss": -7.024525165557861, "global_step": 173534, "epoch": 4131} {"train_loss": -7.073199272155762, "global_step": 173535, "epoch": 4131} {"train_loss": -6.970744609832764, "global_step": 173536, "epoch": 4131} {"train_loss": -7.016307830810547, "global_step": 173537, "epoch": 4131} {"train_loss": -6.963747978210449, "global_step": 173538, "epoch": 4131} {"train_loss": -7.086544513702393, "global_step": 173539, "epoch": 4131} {"train_loss": -7.029082298278809, "global_step": 173540, "epoch": 4131} {"train_loss": -7.021210193634033, "global_step": 173541, "epoch": 4131} {"train_loss": -7.122433185577393, "global_step": 173542, "epoch": 4131} {"train_loss": -6.976054066703433, "global_step": 173543, "epoch": 4131, "val_loss": 68594.5390625} {"train_loss": -6.964529991149902, "global_step": 173544, "epoch": 4132} {"train_loss": -7.099836349487305, "global_step": 173545, "epoch": 4132} {"train_loss": -7.0539751052856445, "global_step": 173546, "epoch": 4132} {"train_loss": -7.109409809112549, "global_step": 173547, "epoch": 4132} {"train_loss": -7.019445419311523, "global_step": 173548, "epoch": 4132} {"train_loss": -6.97402286529541, "global_step": 173549, "epoch": 4132} {"train_loss": -6.91948938369751, "global_step": 173550, "epoch": 4132} {"train_loss": -7.057518005371094, "global_step": 173551, "epoch": 4132} {"train_loss": -7.026382923126221, "global_step": 173552, "epoch": 4132} {"train_loss": -6.960046291351318, "global_step": 173553, "epoch": 4132} {"train_loss": -7.043315410614014, "global_step": 173554, "epoch": 4132} {"train_loss": -7.013546943664551, "global_step": 173555, "epoch": 4132} {"train_loss": -6.982786178588867, "global_step": 173556, "epoch": 4132} {"train_loss": -6.988399982452393, "global_step": 173557, "epoch": 4132} {"train_loss": -7.024449825286865, "global_step": 173558, "epoch": 4132} {"train_loss": -6.925012588500977, "global_step": 173559, "epoch": 4132} {"train_loss": -7.079401016235352, "global_step": 173560, "epoch": 4132} {"train_loss": -6.993610382080078, "global_step": 173561, "epoch": 4132} {"train_loss": -7.018974304199219, "global_step": 173562, "epoch": 4132} {"train_loss": -7.018108367919922, "global_step": 173563, "epoch": 4132} {"train_loss": -7.141922950744629, "global_step": 173564, "epoch": 4132} {"train_loss": -7.061418056488037, "global_step": 173565, "epoch": 4132} {"train_loss": -7.008845806121826, "global_step": 173566, "epoch": 4132} {"train_loss": -7.079824447631836, "global_step": 173567, "epoch": 4132} {"train_loss": -6.986094951629639, "global_step": 173568, "epoch": 4132} {"train_loss": -7.143726348876953, "global_step": 173569, "epoch": 4132} {"train_loss": -7.050134658813477, "global_step": 173570, "epoch": 4132} {"train_loss": -7.058846950531006, "global_step": 173571, "epoch": 4132} {"train_loss": -7.049923896789551, "global_step": 173572, "epoch": 4132} {"train_loss": -7.070827484130859, "global_step": 173573, "epoch": 4132} {"train_loss": -6.9744343757629395, "global_step": 173574, "epoch": 4132} {"train_loss": -6.952181816101074, "global_step": 173575, "epoch": 4132} {"train_loss": -7.102578639984131, "global_step": 173576, "epoch": 4132} {"train_loss": -7.0288987159729, "global_step": 173577, "epoch": 4132} {"train_loss": -7.129386901855469, "global_step": 173578, "epoch": 4132} {"train_loss": -6.997350692749023, "global_step": 173579, "epoch": 4132} {"train_loss": -6.995383262634277, "global_step": 173580, "epoch": 4132} {"train_loss": -7.021151542663574, "global_step": 173581, "epoch": 4132} {"train_loss": -6.985487937927246, "global_step": 173582, "epoch": 4132} {"train_loss": -7.070328235626221, "global_step": 173583, "epoch": 4132} {"train_loss": -7.07406759262085, "global_step": 173584, "epoch": 4132} {"train_loss": -7.0330080304827005, "global_step": 173585, "epoch": 4132, "val_loss": 68675.296875} {"train_loss": -7.153730392456055, "global_step": 173586, "epoch": 4133} {"train_loss": -7.091126441955566, "global_step": 173587, "epoch": 4133} {"train_loss": -7.137681484222412, "global_step": 173588, "epoch": 4133} {"train_loss": -7.086139678955078, "global_step": 173589, "epoch": 4133} {"train_loss": -6.831148147583008, "global_step": 173590, "epoch": 4133} {"train_loss": -7.040247917175293, "global_step": 173591, "epoch": 4133} {"train_loss": -6.923505783081055, "global_step": 173592, "epoch": 4133} {"train_loss": -6.7941083908081055, "global_step": 173593, "epoch": 4133} {"train_loss": -6.852086067199707, "global_step": 173594, "epoch": 4133} {"train_loss": -6.940248966217041, "global_step": 173595, "epoch": 4133} {"train_loss": -6.880642890930176, "global_step": 173596, "epoch": 4133} {"train_loss": -6.950020790100098, "global_step": 173597, "epoch": 4133} {"train_loss": -6.958188056945801, "global_step": 173598, "epoch": 4133} {"train_loss": -7.006213188171387, "global_step": 173599, "epoch": 4133} {"train_loss": -6.996191024780273, "global_step": 173600, "epoch": 4133} {"train_loss": -6.9901041984558105, "global_step": 173601, "epoch": 4133} {"train_loss": -7.021954536437988, "global_step": 173602, "epoch": 4133} {"train_loss": -7.0380682945251465, "global_step": 173603, "epoch": 4133} {"train_loss": -6.937090873718262, "global_step": 173604, "epoch": 4133} {"train_loss": -6.959131717681885, "global_step": 173605, "epoch": 4133} {"train_loss": -6.915131092071533, "global_step": 173606, "epoch": 4133} {"train_loss": -6.831914901733398, "global_step": 173607, "epoch": 4133} {"train_loss": -7.0175862312316895, "global_step": 173608, "epoch": 4133} {"train_loss": -6.9563212394714355, "global_step": 173609, "epoch": 4133} {"train_loss": -6.961490631103516, "global_step": 173610, "epoch": 4133} {"train_loss": -6.89277458190918, "global_step": 173611, "epoch": 4133} {"train_loss": -7.082433700561523, "global_step": 173612, "epoch": 4133} {"train_loss": -6.826320648193359, "global_step": 173613, "epoch": 4133} {"train_loss": -6.9416937828063965, "global_step": 173614, "epoch": 4133} {"train_loss": -7.013506889343262, "global_step": 173615, "epoch": 4133} {"train_loss": -6.971050262451172, "global_step": 173616, "epoch": 4133} {"train_loss": -6.984708309173584, "global_step": 173617, "epoch": 4133} {"train_loss": -7.056138515472412, "global_step": 173618, "epoch": 4133} {"train_loss": -7.000840663909912, "global_step": 173619, "epoch": 4133} {"train_loss": -7.018701553344727, "global_step": 173620, "epoch": 4133} {"train_loss": -7.0908355712890625, "global_step": 173621, "epoch": 4133} {"train_loss": -6.966203689575195, "global_step": 173622, "epoch": 4133} {"train_loss": -7.013240814208984, "global_step": 173623, "epoch": 4133} {"train_loss": -7.016714096069336, "global_step": 173624, "epoch": 4133} {"train_loss": -6.856569766998291, "global_step": 173625, "epoch": 4133} {"train_loss": -6.9016618728637695, "global_step": 173626, "epoch": 4133} {"train_loss": -6.971632355735416, "global_step": 173627, "epoch": 4133, "val_loss": 68757.5} {"train_loss": -6.868436813354492, "global_step": 173628, "epoch": 4134} {"train_loss": -6.99954891204834, "global_step": 173629, "epoch": 4134} {"train_loss": -6.975544452667236, "global_step": 173630, "epoch": 4134} {"train_loss": -6.982928276062012, "global_step": 173631, "epoch": 4134} {"train_loss": -7.1631622314453125, "global_step": 173632, "epoch": 4134} {"train_loss": -6.942942142486572, "global_step": 173633, "epoch": 4134} {"train_loss": -6.966409683227539, "global_step": 173634, "epoch": 4134} {"train_loss": -7.0241899490356445, "global_step": 173635, "epoch": 4134} {"train_loss": -6.942021369934082, "global_step": 173636, "epoch": 4134} {"train_loss": -6.98497200012207, "global_step": 173637, "epoch": 4134} {"train_loss": -6.955101013183594, "global_step": 173638, "epoch": 4134} {"train_loss": -7.014042854309082, "global_step": 173639, "epoch": 4134} {"train_loss": -6.9967756271362305, "global_step": 173640, "epoch": 4134} {"train_loss": -7.080121994018555, "global_step": 173641, "epoch": 4134} {"train_loss": -6.943280220031738, "global_step": 173642, "epoch": 4134} {"train_loss": -7.028016090393066, "global_step": 173643, "epoch": 4134} {"train_loss": -6.935203552246094, "global_step": 173644, "epoch": 4134} {"train_loss": -6.9663801193237305, "global_step": 173645, "epoch": 4134} {"train_loss": -7.035749435424805, "global_step": 173646, "epoch": 4134} {"train_loss": -6.935800075531006, "global_step": 173647, "epoch": 4134} {"train_loss": -6.94816780090332, "global_step": 173648, "epoch": 4134} {"train_loss": -7.165178298950195, "global_step": 173649, "epoch": 4134} {"train_loss": -6.906550407409668, "global_step": 173650, "epoch": 4134} {"train_loss": -6.981489181518555, "global_step": 173651, "epoch": 4134} {"train_loss": -7.002017498016357, "global_step": 173652, "epoch": 4134} {"train_loss": -7.047168731689453, "global_step": 173653, "epoch": 4134} {"train_loss": -7.153862953186035, "global_step": 173654, "epoch": 4134} {"train_loss": -7.013233184814453, "global_step": 173655, "epoch": 4134} {"train_loss": -6.931253910064697, "global_step": 173656, "epoch": 4134} {"train_loss": -7.0834760665893555, "global_step": 173657, "epoch": 4134} {"train_loss": -7.0490570068359375, "global_step": 173658, "epoch": 4134} {"train_loss": -6.91580867767334, "global_step": 173659, "epoch": 4134} {"train_loss": -7.079089641571045, "global_step": 173660, "epoch": 4134} {"train_loss": -7.095730781555176, "global_step": 173661, "epoch": 4134} {"train_loss": -7.033663749694824, "global_step": 173662, "epoch": 4134} {"train_loss": -7.068960189819336, "global_step": 173663, "epoch": 4134} {"train_loss": -7.039869785308838, "global_step": 173664, "epoch": 4134} {"train_loss": -7.080855846405029, "global_step": 173665, "epoch": 4134} {"train_loss": -7.084059715270996, "global_step": 173666, "epoch": 4134} {"train_loss": -7.084395408630371, "global_step": 173667, "epoch": 4134} {"train_loss": -7.077517032623291, "global_step": 173668, "epoch": 4134} {"train_loss": -7.015375863938105, "global_step": 173669, "epoch": 4134, "val_loss": 68877.3046875} {"train_loss": -6.883366584777832, "global_step": 173670, "epoch": 4135} {"train_loss": -7.019214630126953, "global_step": 173671, "epoch": 4135} {"train_loss": -6.948129653930664, "global_step": 173672, "epoch": 4135} {"train_loss": -6.939591407775879, "global_step": 173673, "epoch": 4135} {"train_loss": -6.978644371032715, "global_step": 173674, "epoch": 4135} {"train_loss": -6.929922103881836, "global_step": 173675, "epoch": 4135} {"train_loss": -6.984281063079834, "global_step": 173676, "epoch": 4135} {"train_loss": -7.035617828369141, "global_step": 173677, "epoch": 4135} {"train_loss": -6.913551330566406, "global_step": 173678, "epoch": 4135} {"train_loss": -6.95692253112793, "global_step": 173679, "epoch": 4135} {"train_loss": -6.959531784057617, "global_step": 173680, "epoch": 4135} {"train_loss": -6.982872486114502, "global_step": 173681, "epoch": 4135} {"train_loss": -7.077432632446289, "global_step": 173682, "epoch": 4135} {"train_loss": -7.071115016937256, "global_step": 173683, "epoch": 4135} {"train_loss": -7.034263610839844, "global_step": 173684, "epoch": 4135} {"train_loss": -7.070615291595459, "global_step": 173685, "epoch": 4135} {"train_loss": -7.087313652038574, "global_step": 173686, "epoch": 4135} {"train_loss": -7.084471702575684, "global_step": 173687, "epoch": 4135} {"train_loss": -6.994370937347412, "global_step": 173688, "epoch": 4135} {"train_loss": -7.043966770172119, "global_step": 173689, "epoch": 4135} {"train_loss": -7.080081939697266, "global_step": 173690, "epoch": 4135} {"train_loss": -7.052195072174072, "global_step": 173691, "epoch": 4135} {"train_loss": -7.0940961837768555, "global_step": 173692, "epoch": 4135} {"train_loss": -7.081033706665039, "global_step": 173693, "epoch": 4135} {"train_loss": -7.105570316314697, "global_step": 173694, "epoch": 4135} {"train_loss": -7.123396873474121, "global_step": 173695, "epoch": 4135} {"train_loss": -7.181622505187988, "global_step": 173696, "epoch": 4135} {"train_loss": -7.023710250854492, "global_step": 173697, "epoch": 4135} {"train_loss": -7.034014701843262, "global_step": 173698, "epoch": 4135} {"train_loss": -7.004081726074219, "global_step": 173699, "epoch": 4135} {"train_loss": -6.935337066650391, "global_step": 173700, "epoch": 4135} {"train_loss": -6.989749431610107, "global_step": 173701, "epoch": 4135} {"train_loss": -7.043911933898926, "global_step": 173702, "epoch": 4135} {"train_loss": -7.070318698883057, "global_step": 173703, "epoch": 4135} {"train_loss": -6.9256591796875, "global_step": 173704, "epoch": 4135} {"train_loss": -7.043733596801758, "global_step": 173705, "epoch": 4135} {"train_loss": -7.023297309875488, "global_step": 173706, "epoch": 4135} {"train_loss": -6.89975643157959, "global_step": 173707, "epoch": 4135} {"train_loss": -6.727851867675781, "global_step": 173708, "epoch": 4135} {"train_loss": -6.9686737060546875, "global_step": 173709, "epoch": 4135} {"train_loss": -6.920787811279297, "global_step": 173710, "epoch": 4135} {"train_loss": -7.0066555341084795, "global_step": 173711, "epoch": 4135, "val_loss": 68654.625} {"train_loss": -6.906305313110352, "global_step": 173712, "epoch": 4136} {"train_loss": -7.071325302124023, "global_step": 173713, "epoch": 4136} {"train_loss": -6.910728454589844, "global_step": 173714, "epoch": 4136} {"train_loss": -6.965500831604004, "global_step": 173715, "epoch": 4136} {"train_loss": -6.979606628417969, "global_step": 173716, "epoch": 4136} {"train_loss": -7.03193998336792, "global_step": 173717, "epoch": 4136} {"train_loss": -7.048872947692871, "global_step": 173718, "epoch": 4136} {"train_loss": -6.952701568603516, "global_step": 173719, "epoch": 4136} {"train_loss": -7.060015678405762, "global_step": 173720, "epoch": 4136} {"train_loss": -7.008124351501465, "global_step": 173721, "epoch": 4136} {"train_loss": -6.920328140258789, "global_step": 173722, "epoch": 4136} {"train_loss": -6.933325290679932, "global_step": 173723, "epoch": 4136} {"train_loss": -6.957637310028076, "global_step": 173724, "epoch": 4136} {"train_loss": -7.0218048095703125, "global_step": 173725, "epoch": 4136} {"train_loss": -7.00208854675293, "global_step": 173726, "epoch": 4136} {"train_loss": -7.003963470458984, "global_step": 173727, "epoch": 4136} {"train_loss": -6.979463577270508, "global_step": 173728, "epoch": 4136} {"train_loss": -7.035825729370117, "global_step": 173729, "epoch": 4136} {"train_loss": -7.045826435089111, "global_step": 173730, "epoch": 4136} {"train_loss": -7.033395290374756, "global_step": 173731, "epoch": 4136} {"train_loss": -6.936792373657227, "global_step": 173732, "epoch": 4136} {"train_loss": -7.088561058044434, "global_step": 173733, "epoch": 4136} {"train_loss": -7.0538811683654785, "global_step": 173734, "epoch": 4136} {"train_loss": -7.026797294616699, "global_step": 173735, "epoch": 4136} {"train_loss": -6.998744964599609, "global_step": 173736, "epoch": 4136} {"train_loss": -7.018311500549316, "global_step": 173737, "epoch": 4136} {"train_loss": -7.037834167480469, "global_step": 173738, "epoch": 4136} {"train_loss": -7.027496337890625, "global_step": 173739, "epoch": 4136} {"train_loss": -7.0304975509643555, "global_step": 173740, "epoch": 4136} {"train_loss": -7.108392715454102, "global_step": 173741, "epoch": 4136} {"train_loss": -7.032220840454102, "global_step": 173742, "epoch": 4136} {"train_loss": -6.918410778045654, "global_step": 173743, "epoch": 4136} {"train_loss": -7.114943027496338, "global_step": 173744, "epoch": 4136} {"train_loss": -6.948819637298584, "global_step": 173745, "epoch": 4136} {"train_loss": -7.06576681137085, "global_step": 173746, "epoch": 4136} {"train_loss": -7.147264003753662, "global_step": 173747, "epoch": 4136} {"train_loss": -7.0352678298950195, "global_step": 173748, "epoch": 4136} {"train_loss": -6.980592250823975, "global_step": 173749, "epoch": 4136} {"train_loss": -7.00325345993042, "global_step": 173750, "epoch": 4136} {"train_loss": -7.035604953765869, "global_step": 173751, "epoch": 4136} {"train_loss": -6.996512413024902, "global_step": 173752, "epoch": 4136} {"train_loss": -7.0144700776963, "global_step": 173753, "epoch": 4136, "val_loss": 68587.4453125} {"train_loss": -7.034660339355469, "global_step": 173754, "epoch": 4137} {"train_loss": -7.007192611694336, "global_step": 173755, "epoch": 4137} {"train_loss": -6.985078811645508, "global_step": 173756, "epoch": 4137} {"train_loss": -6.925800800323486, "global_step": 173757, "epoch": 4137} {"train_loss": -7.003710746765137, "global_step": 173758, "epoch": 4137} {"train_loss": -6.832672119140625, "global_step": 173759, "epoch": 4137} {"train_loss": -6.980979919433594, "global_step": 173760, "epoch": 4137} {"train_loss": -6.856376647949219, "global_step": 173761, "epoch": 4137} {"train_loss": -6.83270788192749, "global_step": 173762, "epoch": 4137} {"train_loss": -6.907844543457031, "global_step": 173763, "epoch": 4137} {"train_loss": -6.842447757720947, "global_step": 173764, "epoch": 4137} {"train_loss": -6.957708358764648, "global_step": 173765, "epoch": 4137} {"train_loss": -6.953246116638184, "global_step": 173766, "epoch": 4137} {"train_loss": -6.918755054473877, "global_step": 173767, "epoch": 4137} {"train_loss": -7.016848087310791, "global_step": 173768, "epoch": 4137} {"train_loss": -6.946198463439941, "global_step": 173769, "epoch": 4137} {"train_loss": -7.100139617919922, "global_step": 173770, "epoch": 4137} {"train_loss": -6.99990177154541, "global_step": 173771, "epoch": 4137} {"train_loss": -6.991605758666992, "global_step": 173772, "epoch": 4137} {"train_loss": -7.095972061157227, "global_step": 173773, "epoch": 4137} {"train_loss": -7.091299057006836, "global_step": 173774, "epoch": 4137} {"train_loss": -7.0367655754089355, "global_step": 173775, "epoch": 4137} {"train_loss": -6.986571788787842, "global_step": 173776, "epoch": 4137} {"train_loss": -7.045742034912109, "global_step": 173777, "epoch": 4137} {"train_loss": -7.060138702392578, "global_step": 173778, "epoch": 4137} {"train_loss": -7.0528154373168945, "global_step": 173779, "epoch": 4137} {"train_loss": -6.958296298980713, "global_step": 173780, "epoch": 4137} {"train_loss": -7.1655755043029785, "global_step": 173781, "epoch": 4137} {"train_loss": -6.984286308288574, "global_step": 173782, "epoch": 4137} {"train_loss": -7.061620712280273, "global_step": 173783, "epoch": 4137} {"train_loss": -6.941001892089844, "global_step": 173784, "epoch": 4137} {"train_loss": -7.0414838790893555, "global_step": 173785, "epoch": 4137} {"train_loss": -6.987838268280029, "global_step": 173786, "epoch": 4137} {"train_loss": -6.997398853302002, "global_step": 173787, "epoch": 4137} {"train_loss": -7.012233257293701, "global_step": 173788, "epoch": 4137} {"train_loss": -7.0388617515563965, "global_step": 173789, "epoch": 4137} {"train_loss": -7.061154842376709, "global_step": 173790, "epoch": 4137} {"train_loss": -7.088135242462158, "global_step": 173791, "epoch": 4137} {"train_loss": -7.156280517578125, "global_step": 173792, "epoch": 4137} {"train_loss": -6.922469615936279, "global_step": 173793, "epoch": 4137} {"train_loss": -7.074131011962891, "global_step": 173794, "epoch": 4137} {"train_loss": -7.000102474575951, "global_step": 173795, "epoch": 4137, "val_loss": 68509.9375} {"train_loss": -7.0318756103515625, "global_step": 173796, "epoch": 4138} {"train_loss": -6.975502967834473, "global_step": 173797, "epoch": 4138} {"train_loss": -7.001225471496582, "global_step": 173798, "epoch": 4138} {"train_loss": -7.05647087097168, "global_step": 173799, "epoch": 4138} {"train_loss": -7.150737285614014, "global_step": 173800, "epoch": 4138} {"train_loss": -6.913064479827881, "global_step": 173801, "epoch": 4138} {"train_loss": -6.996428966522217, "global_step": 173802, "epoch": 4138} {"train_loss": -7.087191104888916, "global_step": 173803, "epoch": 4138} {"train_loss": -6.988572597503662, "global_step": 173804, "epoch": 4138} {"train_loss": -7.03143310546875, "global_step": 173805, "epoch": 4138} {"train_loss": -7.034435272216797, "global_step": 173806, "epoch": 4138} {"train_loss": -6.979526519775391, "global_step": 173807, "epoch": 4138} {"train_loss": -7.095187187194824, "global_step": 173808, "epoch": 4138} {"train_loss": -7.040394306182861, "global_step": 173809, "epoch": 4138} {"train_loss": -7.100846767425537, "global_step": 173810, "epoch": 4138} {"train_loss": -6.85108757019043, "global_step": 173811, "epoch": 4138} {"train_loss": -7.094372749328613, "global_step": 173812, "epoch": 4138} {"train_loss": -7.0947184562683105, "global_step": 173813, "epoch": 4138} {"train_loss": -7.000654220581055, "global_step": 173814, "epoch": 4138} {"train_loss": -7.059471130371094, "global_step": 173815, "epoch": 4138} {"train_loss": -7.0313520431518555, "global_step": 173816, "epoch": 4138} {"train_loss": -7.013769149780273, "global_step": 173817, "epoch": 4138} {"train_loss": -7.094243049621582, "global_step": 173818, "epoch": 4138} {"train_loss": -7.092130661010742, "global_step": 173819, "epoch": 4138} {"train_loss": -7.094307899475098, "global_step": 173820, "epoch": 4138} {"train_loss": -7.056015968322754, "global_step": 173821, "epoch": 4138} {"train_loss": -7.102248191833496, "global_step": 173822, "epoch": 4138} {"train_loss": -7.062631607055664, "global_step": 173823, "epoch": 4138} {"train_loss": -7.144478797912598, "global_step": 173824, "epoch": 4138} {"train_loss": -7.146566390991211, "global_step": 173825, "epoch": 4138} {"train_loss": -7.1491899490356445, "global_step": 173826, "epoch": 4138} {"train_loss": -7.010312080383301, "global_step": 173827, "epoch": 4138} {"train_loss": -7.086511135101318, "global_step": 173828, "epoch": 4138} {"train_loss": -7.07686710357666, "global_step": 173829, "epoch": 4138} {"train_loss": -7.013724327087402, "global_step": 173830, "epoch": 4138} {"train_loss": -7.056373596191406, "global_step": 173831, "epoch": 4138} {"train_loss": -7.129913806915283, "global_step": 173832, "epoch": 4138} {"train_loss": -7.102152347564697, "global_step": 173833, "epoch": 4138} {"train_loss": -7.1158342361450195, "global_step": 173834, "epoch": 4138} {"train_loss": -7.008573532104492, "global_step": 173835, "epoch": 4138} {"train_loss": -7.071404933929443, "global_step": 173836, "epoch": 4138} {"train_loss": -7.055625801994687, "global_step": 173837, "epoch": 4138, "val_loss": 68731.7421875} {"train_loss": -6.997152328491211, "global_step": 173838, "epoch": 4139} {"train_loss": -7.0745391845703125, "global_step": 173839, "epoch": 4139} {"train_loss": -7.147310256958008, "global_step": 173840, "epoch": 4139} {"train_loss": -7.10162353515625, "global_step": 173841, "epoch": 4139} {"train_loss": -7.066287517547607, "global_step": 173842, "epoch": 4139} {"train_loss": -7.209298610687256, "global_step": 173843, "epoch": 4139} {"train_loss": -7.164874076843262, "global_step": 173844, "epoch": 4139} {"train_loss": -7.061631679534912, "global_step": 173845, "epoch": 4139} {"train_loss": -7.153656959533691, "global_step": 173846, "epoch": 4139} {"train_loss": -6.9724297523498535, "global_step": 173847, "epoch": 4139} {"train_loss": -6.989190101623535, "global_step": 173848, "epoch": 4139} {"train_loss": -7.000241279602051, "global_step": 173849, "epoch": 4139} {"train_loss": -7.119355201721191, "global_step": 173850, "epoch": 4139} {"train_loss": -7.077059745788574, "global_step": 173851, "epoch": 4139} {"train_loss": -7.111684322357178, "global_step": 173852, "epoch": 4139} {"train_loss": -7.198735237121582, "global_step": 173853, "epoch": 4139} {"train_loss": -7.080391883850098, "global_step": 173854, "epoch": 4139} {"train_loss": -6.917793273925781, "global_step": 173855, "epoch": 4139} {"train_loss": -7.063704490661621, "global_step": 173856, "epoch": 4139} {"train_loss": -7.075469493865967, "global_step": 173857, "epoch": 4139} {"train_loss": -7.13604736328125, "global_step": 173858, "epoch": 4139} {"train_loss": -6.907608985900879, "global_step": 173859, "epoch": 4139} {"train_loss": -7.047134876251221, "global_step": 173860, "epoch": 4139} {"train_loss": -7.002582550048828, "global_step": 173861, "epoch": 4139} {"train_loss": -6.974818229675293, "global_step": 173862, "epoch": 4139} {"train_loss": -7.057596206665039, "global_step": 173863, "epoch": 4139} {"train_loss": -7.029514312744141, "global_step": 173864, "epoch": 4139} {"train_loss": -7.098694324493408, "global_step": 173865, "epoch": 4139} {"train_loss": -6.9761433601379395, "global_step": 173866, "epoch": 4139} {"train_loss": -6.986260414123535, "global_step": 173867, "epoch": 4139} {"train_loss": -7.106329917907715, "global_step": 173868, "epoch": 4139} {"train_loss": -7.169908046722412, "global_step": 173869, "epoch": 4139} {"train_loss": -7.023839950561523, "global_step": 173870, "epoch": 4139} {"train_loss": -7.000804424285889, "global_step": 173871, "epoch": 4139} {"train_loss": -6.990718841552734, "global_step": 173872, "epoch": 4139} {"train_loss": -6.970295429229736, "global_step": 173873, "epoch": 4139} {"train_loss": -6.921623229980469, "global_step": 173874, "epoch": 4139} {"train_loss": -7.0841450691223145, "global_step": 173875, "epoch": 4139} {"train_loss": -6.837884902954102, "global_step": 173876, "epoch": 4139} {"train_loss": -6.861747741699219, "global_step": 173877, "epoch": 4139} {"train_loss": -7.043708801269531, "global_step": 173878, "epoch": 4139} {"train_loss": -7.042676812126523, "global_step": 173879, "epoch": 4139, "val_loss": 68556.90625} {"train_loss": -6.882485389709473, "global_step": 173880, "epoch": 4140} {"train_loss": -6.952749252319336, "global_step": 173881, "epoch": 4140} {"train_loss": -6.643113136291504, "global_step": 173882, "epoch": 4140} {"train_loss": -6.944302082061768, "global_step": 173883, "epoch": 4140} {"train_loss": -6.954269886016846, "global_step": 173884, "epoch": 4140} {"train_loss": -6.822920322418213, "global_step": 173885, "epoch": 4140} {"train_loss": -6.950672626495361, "global_step": 173886, "epoch": 4140} {"train_loss": -6.7354536056518555, "global_step": 173887, "epoch": 4140} {"train_loss": -6.880388259887695, "global_step": 173888, "epoch": 4140} {"train_loss": -6.95321798324585, "global_step": 173889, "epoch": 4140} {"train_loss": -6.830684185028076, "global_step": 173890, "epoch": 4140} {"train_loss": -6.784211158752441, "global_step": 173891, "epoch": 4140} {"train_loss": -6.804294586181641, "global_step": 173892, "epoch": 4140} {"train_loss": -6.811757564544678, "global_step": 173893, "epoch": 4140} {"train_loss": -6.890056133270264, "global_step": 173894, "epoch": 4140} {"train_loss": -6.889671325683594, "global_step": 173895, "epoch": 4140} {"train_loss": -6.944874286651611, "global_step": 173896, "epoch": 4140} {"train_loss": -6.780007839202881, "global_step": 173897, "epoch": 4140} {"train_loss": -6.919473171234131, "global_step": 173898, "epoch": 4140} {"train_loss": -6.8979597091674805, "global_step": 173899, "epoch": 4140} {"train_loss": -6.89557409286499, "global_step": 173900, "epoch": 4140} {"train_loss": -6.943603515625, "global_step": 173901, "epoch": 4140} {"train_loss": -6.934335708618164, "global_step": 173902, "epoch": 4140} {"train_loss": -6.980661869049072, "global_step": 173903, "epoch": 4140} {"train_loss": -6.9708380699157715, "global_step": 173904, "epoch": 4140} {"train_loss": -7.063578128814697, "global_step": 173905, "epoch": 4140} {"train_loss": -6.898441791534424, "global_step": 173906, "epoch": 4140} {"train_loss": -6.949042320251465, "global_step": 173907, "epoch": 4140} {"train_loss": -6.960991382598877, "global_step": 173908, "epoch": 4140} {"train_loss": -6.922744274139404, "global_step": 173909, "epoch": 4140} {"train_loss": -7.039519786834717, "global_step": 173910, "epoch": 4140} {"train_loss": -7.057336807250977, "global_step": 173911, "epoch": 4140} {"train_loss": -6.937593460083008, "global_step": 173912, "epoch": 4140} {"train_loss": -7.015242576599121, "global_step": 173913, "epoch": 4140} {"train_loss": -7.004587173461914, "global_step": 173914, "epoch": 4140} {"train_loss": -6.940851211547852, "global_step": 173915, "epoch": 4140} {"train_loss": -6.992444038391113, "global_step": 173916, "epoch": 4140} {"train_loss": -6.799881935119629, "global_step": 173917, "epoch": 4140} {"train_loss": -7.127580642700195, "global_step": 173918, "epoch": 4140} {"train_loss": -6.934004783630371, "global_step": 173919, "epoch": 4140} {"train_loss": -6.963719367980957, "global_step": 173920, "epoch": 4140} {"train_loss": -6.922351439793904, "global_step": 173921, "epoch": 4140, "val_loss": 68582.03125} {"train_loss": -6.993670463562012, "global_step": 173922, "epoch": 4141} {"train_loss": -7.012909889221191, "global_step": 173923, "epoch": 4141} {"train_loss": -6.96195125579834, "global_step": 173924, "epoch": 4141} {"train_loss": -7.029404163360596, "global_step": 173925, "epoch": 4141} {"train_loss": -7.018610000610352, "global_step": 173926, "epoch": 4141} {"train_loss": -6.983405590057373, "global_step": 173927, "epoch": 4141} {"train_loss": -7.001407623291016, "global_step": 173928, "epoch": 4141} {"train_loss": -7.034015655517578, "global_step": 173929, "epoch": 4141} {"train_loss": -7.025506019592285, "global_step": 173930, "epoch": 4141} {"train_loss": -7.0287017822265625, "global_step": 173931, "epoch": 4141} {"train_loss": -7.158655166625977, "global_step": 173932, "epoch": 4141} {"train_loss": -7.050591468811035, "global_step": 173933, "epoch": 4141} {"train_loss": -7.100207805633545, "global_step": 173934, "epoch": 4141} {"train_loss": -6.910567760467529, "global_step": 173935, "epoch": 4141} {"train_loss": -6.969493865966797, "global_step": 173936, "epoch": 4141} {"train_loss": -7.1146087646484375, "global_step": 173937, "epoch": 4141} {"train_loss": -6.9332380294799805, "global_step": 173938, "epoch": 4141} {"train_loss": -7.108784198760986, "global_step": 173939, "epoch": 4141} {"train_loss": -7.032140254974365, "global_step": 173940, "epoch": 4141} {"train_loss": -7.029234886169434, "global_step": 173941, "epoch": 4141} {"train_loss": -7.13808536529541, "global_step": 173942, "epoch": 4141} {"train_loss": -6.953019618988037, "global_step": 173943, "epoch": 4141} {"train_loss": -7.132842063903809, "global_step": 173944, "epoch": 4141} {"train_loss": -7.019002437591553, "global_step": 173945, "epoch": 4141} {"train_loss": -7.029545307159424, "global_step": 173946, "epoch": 4141} {"train_loss": -7.110713958740234, "global_step": 173947, "epoch": 4141} {"train_loss": -7.174864768981934, "global_step": 173948, "epoch": 4141} {"train_loss": -7.057034492492676, "global_step": 173949, "epoch": 4141} {"train_loss": -7.053197860717773, "global_step": 173950, "epoch": 4141} {"train_loss": -7.114116668701172, "global_step": 173951, "epoch": 4141} {"train_loss": -7.0536322593688965, "global_step": 173952, "epoch": 4141} {"train_loss": -7.130524635314941, "global_step": 173953, "epoch": 4141} {"train_loss": -7.011261940002441, "global_step": 173954, "epoch": 4141} {"train_loss": -7.158286094665527, "global_step": 173955, "epoch": 4141} {"train_loss": -7.131650924682617, "global_step": 173956, "epoch": 4141} {"train_loss": -7.066831588745117, "global_step": 173957, "epoch": 4141} {"train_loss": -7.05862283706665, "global_step": 173958, "epoch": 4141} {"train_loss": -7.03587532043457, "global_step": 173959, "epoch": 4141} {"train_loss": -7.0736470222473145, "global_step": 173960, "epoch": 4141} {"train_loss": -7.103374481201172, "global_step": 173961, "epoch": 4141} {"train_loss": -7.042429447174072, "global_step": 173962, "epoch": 4141} {"train_loss": -7.052279915128436, "global_step": 173963, "epoch": 4141, "val_loss": 68748.296875} {"train_loss": -6.982394218444824, "global_step": 173964, "epoch": 4142} {"train_loss": -7.028319835662842, "global_step": 173965, "epoch": 4142} {"train_loss": -7.006706237792969, "global_step": 173966, "epoch": 4142} {"train_loss": -7.065680503845215, "global_step": 173967, "epoch": 4142} {"train_loss": -6.890693664550781, "global_step": 173968, "epoch": 4142} {"train_loss": -6.953472137451172, "global_step": 173969, "epoch": 4142} {"train_loss": -6.997433185577393, "global_step": 173970, "epoch": 4142} {"train_loss": -7.111408233642578, "global_step": 173971, "epoch": 4142} {"train_loss": -7.024168968200684, "global_step": 173972, "epoch": 4142} {"train_loss": -7.108122825622559, "global_step": 173973, "epoch": 4142} {"train_loss": -7.08773136138916, "global_step": 173974, "epoch": 4142} {"train_loss": -7.032556533813477, "global_step": 173975, "epoch": 4142} {"train_loss": -7.019883155822754, "global_step": 173976, "epoch": 4142} {"train_loss": -7.058106422424316, "global_step": 173977, "epoch": 4142} {"train_loss": -7.095027923583984, "global_step": 173978, "epoch": 4142} {"train_loss": -7.020868301391602, "global_step": 173979, "epoch": 4142} {"train_loss": -7.0995049476623535, "global_step": 173980, "epoch": 4142} {"train_loss": -6.980956077575684, "global_step": 173981, "epoch": 4142} {"train_loss": -7.084929943084717, "global_step": 173982, "epoch": 4142} {"train_loss": -7.116525173187256, "global_step": 173983, "epoch": 4142} {"train_loss": -7.025612831115723, "global_step": 173984, "epoch": 4142} {"train_loss": -7.016894817352295, "global_step": 173985, "epoch": 4142} {"train_loss": -6.93858003616333, "global_step": 173986, "epoch": 4142} {"train_loss": -6.993719577789307, "global_step": 173987, "epoch": 4142} {"train_loss": -7.0179901123046875, "global_step": 173988, "epoch": 4142} {"train_loss": -6.9819817543029785, "global_step": 173989, "epoch": 4142} {"train_loss": -7.013411521911621, "global_step": 173990, "epoch": 4142} {"train_loss": -7.0666351318359375, "global_step": 173991, "epoch": 4142} {"train_loss": -7.007625579833984, "global_step": 173992, "epoch": 4142} {"train_loss": -6.889214515686035, "global_step": 173993, "epoch": 4142} {"train_loss": -6.859653472900391, "global_step": 173994, "epoch": 4142} {"train_loss": -7.005692481994629, "global_step": 173995, "epoch": 4142} {"train_loss": -6.840166091918945, "global_step": 173996, "epoch": 4142} {"train_loss": -6.9081878662109375, "global_step": 173997, "epoch": 4142} {"train_loss": -6.993949890136719, "global_step": 173998, "epoch": 4142} {"train_loss": -7.0103960037231445, "global_step": 173999, "epoch": 4142} {"train_loss": -6.9946136474609375, "global_step": 174000, "epoch": 4142} {"train_loss": -7.028751850128174, "global_step": 174001, "epoch": 4142} {"train_loss": -7.026005744934082, "global_step": 174002, "epoch": 4142} {"train_loss": -7.069822311401367, "global_step": 174003, "epoch": 4142} {"train_loss": -7.068751335144043, "global_step": 174004, "epoch": 4142} {"train_loss": -7.011580853235154, "global_step": 174005, "epoch": 4142, "val_loss": 68473.03125} {"train_loss": -7.050053119659424, "global_step": 174006, "epoch": 4143} {"train_loss": -7.0832014083862305, "global_step": 174007, "epoch": 4143} {"train_loss": -7.028657913208008, "global_step": 174008, "epoch": 4143} {"train_loss": -7.052565097808838, "global_step": 174009, "epoch": 4143} {"train_loss": -6.984811782836914, "global_step": 174010, "epoch": 4143} {"train_loss": -7.046002388000488, "global_step": 174011, "epoch": 4143} {"train_loss": -6.935283184051514, "global_step": 174012, "epoch": 4143} {"train_loss": -7.099411964416504, "global_step": 174013, "epoch": 4143} {"train_loss": -6.981837749481201, "global_step": 174014, "epoch": 4143} {"train_loss": -6.859804153442383, "global_step": 174015, "epoch": 4143} {"train_loss": -6.988648414611816, "global_step": 174016, "epoch": 4143} {"train_loss": -7.121817588806152, "global_step": 174017, "epoch": 4143} {"train_loss": -6.925304412841797, "global_step": 174018, "epoch": 4143} {"train_loss": -7.002254486083984, "global_step": 174019, "epoch": 4143} {"train_loss": -7.037742614746094, "global_step": 174020, "epoch": 4143} {"train_loss": -7.0308146476745605, "global_step": 174021, "epoch": 4143} {"train_loss": -7.062382221221924, "global_step": 174022, "epoch": 4143} {"train_loss": -7.002260208129883, "global_step": 174023, "epoch": 4143} {"train_loss": -6.971183776855469, "global_step": 174024, "epoch": 4143} {"train_loss": -7.002461910247803, "global_step": 174025, "epoch": 4143} {"train_loss": -6.91538143157959, "global_step": 174026, "epoch": 4143} {"train_loss": -7.053197383880615, "global_step": 174027, "epoch": 4143} {"train_loss": -6.974803447723389, "global_step": 174028, "epoch": 4143} {"train_loss": -7.134816646575928, "global_step": 174029, "epoch": 4143} {"train_loss": -7.083332061767578, "global_step": 174030, "epoch": 4143} {"train_loss": -7.172684669494629, "global_step": 174031, "epoch": 4143} {"train_loss": -6.995590686798096, "global_step": 174032, "epoch": 4143} {"train_loss": -6.9859113693237305, "global_step": 174033, "epoch": 4143} {"train_loss": -7.147570610046387, "global_step": 174034, "epoch": 4143} {"train_loss": -7.050820350646973, "global_step": 174035, "epoch": 4143} {"train_loss": -6.995120525360107, "global_step": 174036, "epoch": 4143} {"train_loss": -7.026728630065918, "global_step": 174037, "epoch": 4143} {"train_loss": -6.979831695556641, "global_step": 174038, "epoch": 4143} {"train_loss": -7.071748733520508, "global_step": 174039, "epoch": 4143} {"train_loss": -6.943108558654785, "global_step": 174040, "epoch": 4143} {"train_loss": -7.11147403717041, "global_step": 174041, "epoch": 4143} {"train_loss": -7.011953830718994, "global_step": 174042, "epoch": 4143} {"train_loss": -7.115617752075195, "global_step": 174043, "epoch": 4143} {"train_loss": -7.1043829917907715, "global_step": 174044, "epoch": 4143} {"train_loss": -7.117664337158203, "global_step": 174045, "epoch": 4143} {"train_loss": -6.966033458709717, "global_step": 174046, "epoch": 4143} {"train_loss": -7.033587137858073, "global_step": 174047, "epoch": 4143, "val_loss": 68447.7890625} {"train_loss": -7.0740461349487305, "global_step": 174048, "epoch": 4144} {"train_loss": -7.078845977783203, "global_step": 174049, "epoch": 4144} {"train_loss": -7.018147945404053, "global_step": 174050, "epoch": 4144} {"train_loss": -7.059999465942383, "global_step": 174051, "epoch": 4144} {"train_loss": -7.166478157043457, "global_step": 174052, "epoch": 4144} {"train_loss": -7.091374397277832, "global_step": 174053, "epoch": 4144} {"train_loss": -7.12281608581543, "global_step": 174054, "epoch": 4144} {"train_loss": -7.009753227233887, "global_step": 174055, "epoch": 4144} {"train_loss": -7.178733825683594, "global_step": 174056, "epoch": 4144} {"train_loss": -7.064925193786621, "global_step": 174057, "epoch": 4144} {"train_loss": -7.143199920654297, "global_step": 174058, "epoch": 4144} {"train_loss": -7.0296831130981445, "global_step": 174059, "epoch": 4144} {"train_loss": -7.100751876831055, "global_step": 174060, "epoch": 4144} {"train_loss": -7.1404337882995605, "global_step": 174061, "epoch": 4144} {"train_loss": -7.062299728393555, "global_step": 174062, "epoch": 4144} {"train_loss": -7.156937599182129, "global_step": 174063, "epoch": 4144} {"train_loss": -7.06380558013916, "global_step": 174064, "epoch": 4144} {"train_loss": -7.080179214477539, "global_step": 174065, "epoch": 4144} {"train_loss": -7.04727840423584, "global_step": 174066, "epoch": 4144} {"train_loss": -7.063659191131592, "global_step": 174067, "epoch": 4144} {"train_loss": -7.075895309448242, "global_step": 174068, "epoch": 4144} {"train_loss": -7.077242851257324, "global_step": 174069, "epoch": 4144} {"train_loss": -7.055058479309082, "global_step": 174070, "epoch": 4144} {"train_loss": -7.068697929382324, "global_step": 174071, "epoch": 4144} {"train_loss": -7.118181228637695, "global_step": 174072, "epoch": 4144} {"train_loss": -6.982083320617676, "global_step": 174073, "epoch": 4144} {"train_loss": -6.98527193069458, "global_step": 174074, "epoch": 4144} {"train_loss": -6.911545753479004, "global_step": 174075, "epoch": 4144} {"train_loss": -6.905179977416992, "global_step": 174076, "epoch": 4144} {"train_loss": -6.980521202087402, "global_step": 174077, "epoch": 4144} {"train_loss": -7.061380386352539, "global_step": 174078, "epoch": 4144} {"train_loss": -7.00445556640625, "global_step": 174079, "epoch": 4144} {"train_loss": -7.071073532104492, "global_step": 174080, "epoch": 4144} {"train_loss": -7.003027439117432, "global_step": 174081, "epoch": 4144} {"train_loss": -7.023144245147705, "global_step": 174082, "epoch": 4144} {"train_loss": -6.987566947937012, "global_step": 174083, "epoch": 4144} {"train_loss": -7.009767532348633, "global_step": 174084, "epoch": 4144} {"train_loss": -7.0149006843566895, "global_step": 174085, "epoch": 4144} {"train_loss": -7.162125110626221, "global_step": 174086, "epoch": 4144} {"train_loss": -7.111163139343262, "global_step": 174087, "epoch": 4144} {"train_loss": -7.041137218475342, "global_step": 174088, "epoch": 4144} {"train_loss": -7.057171821594238, "global_step": 174089, "epoch": 4144, "val_loss": 68622.3046875} {"train_loss": -7.04790735244751, "global_step": 174090, "epoch": 4145} {"train_loss": -7.10227108001709, "global_step": 174091, "epoch": 4145} {"train_loss": -6.963771820068359, "global_step": 174092, "epoch": 4145} {"train_loss": -7.0258331298828125, "global_step": 174093, "epoch": 4145} {"train_loss": -7.10154390335083, "global_step": 174094, "epoch": 4145} {"train_loss": -6.9766950607299805, "global_step": 174095, "epoch": 4145} {"train_loss": -7.06158971786499, "global_step": 174096, "epoch": 4145} {"train_loss": -6.971004962921143, "global_step": 174097, "epoch": 4145} {"train_loss": -6.876175403594971, "global_step": 174098, "epoch": 4145} {"train_loss": -7.050690174102783, "global_step": 174099, "epoch": 4145} {"train_loss": -7.051438331604004, "global_step": 174100, "epoch": 4145} {"train_loss": -6.9119367599487305, "global_step": 174101, "epoch": 4145} {"train_loss": -6.897621154785156, "global_step": 174102, "epoch": 4145} {"train_loss": -6.923540115356445, "global_step": 174103, "epoch": 4145} {"train_loss": -6.943502902984619, "global_step": 174104, "epoch": 4145} {"train_loss": -6.93178653717041, "global_step": 174105, "epoch": 4145} {"train_loss": -6.89176607131958, "global_step": 174106, "epoch": 4145} {"train_loss": -7.0072150230407715, "global_step": 174107, "epoch": 4145} {"train_loss": -7.0711259841918945, "global_step": 174108, "epoch": 4145} {"train_loss": -6.895380020141602, "global_step": 174109, "epoch": 4145} {"train_loss": -7.075607776641846, "global_step": 174110, "epoch": 4145} {"train_loss": -7.013051509857178, "global_step": 174111, "epoch": 4145} {"train_loss": -6.983628273010254, "global_step": 174112, "epoch": 4145} {"train_loss": -6.988230228424072, "global_step": 174113, "epoch": 4145} {"train_loss": -7.090148448944092, "global_step": 174114, "epoch": 4145} {"train_loss": -6.928529739379883, "global_step": 174115, "epoch": 4145} {"train_loss": -7.060467720031738, "global_step": 174116, "epoch": 4145} {"train_loss": -7.052915573120117, "global_step": 174117, "epoch": 4145} {"train_loss": -7.076754570007324, "global_step": 174118, "epoch": 4145} {"train_loss": -7.059136390686035, "global_step": 174119, "epoch": 4145} {"train_loss": -7.049125671386719, "global_step": 174120, "epoch": 4145} {"train_loss": -7.0107269287109375, "global_step": 174121, "epoch": 4145} {"train_loss": -6.99130392074585, "global_step": 174122, "epoch": 4145} {"train_loss": -7.036409378051758, "global_step": 174123, "epoch": 4145} {"train_loss": -6.924563884735107, "global_step": 174124, "epoch": 4145} {"train_loss": -7.000309944152832, "global_step": 174125, "epoch": 4145} {"train_loss": -7.03199577331543, "global_step": 174126, "epoch": 4145} {"train_loss": -7.026485443115234, "global_step": 174127, "epoch": 4145} {"train_loss": -7.018829822540283, "global_step": 174128, "epoch": 4145} {"train_loss": -6.996376037597656, "global_step": 174129, "epoch": 4145} {"train_loss": -6.9686479568481445, "global_step": 174130, "epoch": 4145} {"train_loss": -7.002504575820196, "global_step": 174131, "epoch": 4145, "val_loss": 68586.796875} {"train_loss": -6.983907222747803, "global_step": 174132, "epoch": 4146} {"train_loss": -6.906405448913574, "global_step": 174133, "epoch": 4146} {"train_loss": -7.0311150550842285, "global_step": 174134, "epoch": 4146} {"train_loss": -6.944653511047363, "global_step": 174135, "epoch": 4146} {"train_loss": -7.052724361419678, "global_step": 174136, "epoch": 4146} {"train_loss": -7.199822425842285, "global_step": 174137, "epoch": 4146} {"train_loss": -7.048994064331055, "global_step": 174138, "epoch": 4146} {"train_loss": -7.040718078613281, "global_step": 174139, "epoch": 4146} {"train_loss": -7.061938285827637, "global_step": 174140, "epoch": 4146} {"train_loss": -7.112671852111816, "global_step": 174141, "epoch": 4146} {"train_loss": -6.997774124145508, "global_step": 174142, "epoch": 4146} {"train_loss": -7.048900127410889, "global_step": 174143, "epoch": 4146} {"train_loss": -7.0421905517578125, "global_step": 174144, "epoch": 4146} {"train_loss": -7.0444512367248535, "global_step": 174145, "epoch": 4146} {"train_loss": -6.901485443115234, "global_step": 174146, "epoch": 4146} {"train_loss": -7.03480863571167, "global_step": 174147, "epoch": 4146} {"train_loss": -6.885043144226074, "global_step": 174148, "epoch": 4146} {"train_loss": -6.888379096984863, "global_step": 174149, "epoch": 4146} {"train_loss": -7.037718772888184, "global_step": 174150, "epoch": 4146} {"train_loss": -6.92536735534668, "global_step": 174151, "epoch": 4146} {"train_loss": -6.973092555999756, "global_step": 174152, "epoch": 4146} {"train_loss": -7.031408309936523, "global_step": 174153, "epoch": 4146} {"train_loss": -6.781113624572754, "global_step": 174154, "epoch": 4146} {"train_loss": -6.898904800415039, "global_step": 174155, "epoch": 4146} {"train_loss": -6.951353549957275, "global_step": 174156, "epoch": 4146} {"train_loss": -7.053565502166748, "global_step": 174157, "epoch": 4146} {"train_loss": -6.976376533508301, "global_step": 174158, "epoch": 4146} {"train_loss": -6.854773998260498, "global_step": 174159, "epoch": 4146} {"train_loss": -7.007926940917969, "global_step": 174160, "epoch": 4146} {"train_loss": -6.937228202819824, "global_step": 174161, "epoch": 4146} {"train_loss": -6.910574436187744, "global_step": 174162, "epoch": 4146} {"train_loss": -7.007997035980225, "global_step": 174163, "epoch": 4146} {"train_loss": -7.0221357345581055, "global_step": 174164, "epoch": 4146} {"train_loss": -6.966831207275391, "global_step": 174165, "epoch": 4146} {"train_loss": -6.834595680236816, "global_step": 174166, "epoch": 4146} {"train_loss": -6.804853916168213, "global_step": 174167, "epoch": 4146} {"train_loss": -6.895443439483643, "global_step": 174168, "epoch": 4146} {"train_loss": -6.89262056350708, "global_step": 174169, "epoch": 4146} {"train_loss": -6.8343658447265625, "global_step": 174170, "epoch": 4146} {"train_loss": -6.920164108276367, "global_step": 174171, "epoch": 4146} {"train_loss": -6.900204658508301, "global_step": 174172, "epoch": 4146} {"train_loss": -6.966669775190807, "global_step": 174173, "epoch": 4146, "val_loss": 68776.4921875} {"train_loss": -6.854145526885986, "global_step": 174174, "epoch": 4147} {"train_loss": -6.998876094818115, "global_step": 174175, "epoch": 4147} {"train_loss": -7.005079746246338, "global_step": 174176, "epoch": 4147} {"train_loss": -7.003758907318115, "global_step": 174177, "epoch": 4147} {"train_loss": -6.877444267272949, "global_step": 174178, "epoch": 4147} {"train_loss": -6.878223419189453, "global_step": 174179, "epoch": 4147} {"train_loss": -7.04590368270874, "global_step": 174180, "epoch": 4147} {"train_loss": -6.949366092681885, "global_step": 174181, "epoch": 4147} {"train_loss": -7.031820297241211, "global_step": 174182, "epoch": 4147} {"train_loss": -6.9398698806762695, "global_step": 174183, "epoch": 4147} {"train_loss": -6.956010341644287, "global_step": 174184, "epoch": 4147} {"train_loss": -7.038177013397217, "global_step": 174185, "epoch": 4147} {"train_loss": -7.034698009490967, "global_step": 174186, "epoch": 4147} {"train_loss": -6.936258792877197, "global_step": 174187, "epoch": 4147} {"train_loss": -6.961014270782471, "global_step": 174188, "epoch": 4147} {"train_loss": -7.117677688598633, "global_step": 174189, "epoch": 4147} {"train_loss": -7.082022666931152, "global_step": 174190, "epoch": 4147} {"train_loss": -6.994790077209473, "global_step": 174191, "epoch": 4147} {"train_loss": -7.071605682373047, "global_step": 174192, "epoch": 4147} {"train_loss": -6.9770355224609375, "global_step": 174193, "epoch": 4147} {"train_loss": -7.047263145446777, "global_step": 174194, "epoch": 4147} {"train_loss": -6.938320159912109, "global_step": 174195, "epoch": 4147} {"train_loss": -6.974863529205322, "global_step": 174196, "epoch": 4147} {"train_loss": -6.919225215911865, "global_step": 174197, "epoch": 4147} {"train_loss": -6.930513858795166, "global_step": 174198, "epoch": 4147} {"train_loss": -6.901788234710693, "global_step": 174199, "epoch": 4147} {"train_loss": -7.045927047729492, "global_step": 174200, "epoch": 4147} {"train_loss": -6.928923606872559, "global_step": 174201, "epoch": 4147} {"train_loss": -7.088661193847656, "global_step": 174202, "epoch": 4147} {"train_loss": -7.023630619049072, "global_step": 174203, "epoch": 4147} {"train_loss": -6.973387718200684, "global_step": 174204, "epoch": 4147} {"train_loss": -7.070124626159668, "global_step": 174205, "epoch": 4147} {"train_loss": -7.120499610900879, "global_step": 174206, "epoch": 4147} {"train_loss": -6.986721992492676, "global_step": 174207, "epoch": 4147} {"train_loss": -7.061214447021484, "global_step": 174208, "epoch": 4147} {"train_loss": -6.950001239776611, "global_step": 174209, "epoch": 4147} {"train_loss": -7.077281951904297, "global_step": 174210, "epoch": 4147} {"train_loss": -7.0450239181518555, "global_step": 174211, "epoch": 4147} {"train_loss": -7.05610990524292, "global_step": 174212, "epoch": 4147} {"train_loss": -7.019460201263428, "global_step": 174213, "epoch": 4147} {"train_loss": -7.01308536529541, "global_step": 174214, "epoch": 4147} {"train_loss": -7.000478437968662, "global_step": 174215, "epoch": 4147, "val_loss": 68772.359375} {"train_loss": -7.149634838104248, "global_step": 174216, "epoch": 4148} {"train_loss": -7.122498989105225, "global_step": 174217, "epoch": 4148} {"train_loss": -7.057651519775391, "global_step": 174218, "epoch": 4148} {"train_loss": -7.093129634857178, "global_step": 174219, "epoch": 4148} {"train_loss": -7.1815595626831055, "global_step": 174220, "epoch": 4148} {"train_loss": -7.025622367858887, "global_step": 174221, "epoch": 4148} {"train_loss": -7.103233337402344, "global_step": 174222, "epoch": 4148} {"train_loss": -6.880471229553223, "global_step": 174223, "epoch": 4148} {"train_loss": -6.923078536987305, "global_step": 174224, "epoch": 4148} {"train_loss": -7.15938663482666, "global_step": 174225, "epoch": 4148} {"train_loss": -6.995944023132324, "global_step": 174226, "epoch": 4148} {"train_loss": -6.919219970703125, "global_step": 174227, "epoch": 4148} {"train_loss": -7.23375129699707, "global_step": 174228, "epoch": 4148} {"train_loss": -7.033051013946533, "global_step": 174229, "epoch": 4148} {"train_loss": -7.113926887512207, "global_step": 174230, "epoch": 4148} {"train_loss": -7.008298873901367, "global_step": 174231, "epoch": 4148} {"train_loss": -7.048341274261475, "global_step": 174232, "epoch": 4148} {"train_loss": -7.0081682205200195, "global_step": 174233, "epoch": 4148} {"train_loss": -7.086775779724121, "global_step": 174234, "epoch": 4148} {"train_loss": -6.998736381530762, "global_step": 174235, "epoch": 4148} {"train_loss": -6.879397392272949, "global_step": 174236, "epoch": 4148} {"train_loss": -7.1119279861450195, "global_step": 174237, "epoch": 4148} {"train_loss": -6.9626007080078125, "global_step": 174238, "epoch": 4148} {"train_loss": -6.869657516479492, "global_step": 174239, "epoch": 4148} {"train_loss": -7.006411552429199, "global_step": 174240, "epoch": 4148} {"train_loss": -6.844573020935059, "global_step": 174241, "epoch": 4148} {"train_loss": -6.989469528198242, "global_step": 174242, "epoch": 4148} {"train_loss": -6.896551132202148, "global_step": 174243, "epoch": 4148} {"train_loss": -6.886485576629639, "global_step": 174244, "epoch": 4148} {"train_loss": -6.98345947265625, "global_step": 174245, "epoch": 4148} {"train_loss": -6.945267677307129, "global_step": 174246, "epoch": 4148} {"train_loss": -6.961745738983154, "global_step": 174247, "epoch": 4148} {"train_loss": -6.957718372344971, "global_step": 174248, "epoch": 4148} {"train_loss": -7.011355400085449, "global_step": 174249, "epoch": 4148} {"train_loss": -6.838050842285156, "global_step": 174250, "epoch": 4148} {"train_loss": -7.057201385498047, "global_step": 174251, "epoch": 4148} {"train_loss": -6.867778301239014, "global_step": 174252, "epoch": 4148} {"train_loss": -6.7469658851623535, "global_step": 174253, "epoch": 4148} {"train_loss": -6.948955535888672, "global_step": 174254, "epoch": 4148} {"train_loss": -6.968196392059326, "global_step": 174255, "epoch": 4148} {"train_loss": -7.007547378540039, "global_step": 174256, "epoch": 4148} {"train_loss": -6.998141402289981, "global_step": 174257, "epoch": 4148, "val_loss": 68452.4375} {"train_loss": -6.942831039428711, "global_step": 174258, "epoch": 4149} {"train_loss": -6.839122295379639, "global_step": 174259, "epoch": 4149} {"train_loss": -7.094546318054199, "global_step": 174260, "epoch": 4149} {"train_loss": -6.892085552215576, "global_step": 174261, "epoch": 4149} {"train_loss": -6.950984954833984, "global_step": 174262, "epoch": 4149} {"train_loss": -6.90418815612793, "global_step": 174263, "epoch": 4149} {"train_loss": -6.997622489929199, "global_step": 174264, "epoch": 4149} {"train_loss": -6.932926654815674, "global_step": 174265, "epoch": 4149} {"train_loss": -6.884316921234131, "global_step": 174266, "epoch": 4149} {"train_loss": -6.9462571144104, "global_step": 174267, "epoch": 4149} {"train_loss": -6.9668731689453125, "global_step": 174268, "epoch": 4149} {"train_loss": -6.914477348327637, "global_step": 174269, "epoch": 4149} {"train_loss": -6.960637092590332, "global_step": 174270, "epoch": 4149} {"train_loss": -6.958371162414551, "global_step": 174271, "epoch": 4149} {"train_loss": -7.033760070800781, "global_step": 174272, "epoch": 4149} {"train_loss": -6.953686714172363, "global_step": 174273, "epoch": 4149} {"train_loss": -7.030013084411621, "global_step": 174274, "epoch": 4149} {"train_loss": -6.972707748413086, "global_step": 174275, "epoch": 4149} {"train_loss": -7.004391193389893, "global_step": 174276, "epoch": 4149} {"train_loss": -7.031874656677246, "global_step": 174277, "epoch": 4149} {"train_loss": -7.030715465545654, "global_step": 174278, "epoch": 4149} {"train_loss": -6.908803939819336, "global_step": 174279, "epoch": 4149} {"train_loss": -6.993206977844238, "global_step": 174280, "epoch": 4149} {"train_loss": -7.052561283111572, "global_step": 174281, "epoch": 4149} {"train_loss": -6.938292503356934, "global_step": 174282, "epoch": 4149} {"train_loss": -6.969965934753418, "global_step": 174283, "epoch": 4149} {"train_loss": -7.000510215759277, "global_step": 174284, "epoch": 4149} {"train_loss": -6.846031188964844, "global_step": 174285, "epoch": 4149} {"train_loss": -6.9899373054504395, "global_step": 174286, "epoch": 4149} {"train_loss": -6.8241119384765625, "global_step": 174287, "epoch": 4149} {"train_loss": -6.8472137451171875, "global_step": 174288, "epoch": 4149} {"train_loss": -6.876640319824219, "global_step": 174289, "epoch": 4149} {"train_loss": -6.75809383392334, "global_step": 174290, "epoch": 4149} {"train_loss": -6.923699378967285, "global_step": 174291, "epoch": 4149} {"train_loss": -6.9471516609191895, "global_step": 174292, "epoch": 4149} {"train_loss": -6.939037322998047, "global_step": 174293, "epoch": 4149} {"train_loss": -6.88763427734375, "global_step": 174294, "epoch": 4149} {"train_loss": -6.888836860656738, "global_step": 174295, "epoch": 4149} {"train_loss": -6.9026689529418945, "global_step": 174296, "epoch": 4149} {"train_loss": -6.952540397644043, "global_step": 174297, "epoch": 4149} {"train_loss": -6.734324932098389, "global_step": 174298, "epoch": 4149} {"train_loss": -6.936963978267851, "global_step": 174299, "epoch": 4149, "val_loss": 68876.4140625} {"train_loss": -6.872143745422363, "global_step": 174300, "epoch": 4150} {"train_loss": -6.969662666320801, "global_step": 174301, "epoch": 4150} {"train_loss": -6.795281410217285, "global_step": 174302, "epoch": 4150} {"train_loss": -6.952461242675781, "global_step": 174303, "epoch": 4150} {"train_loss": -6.861724853515625, "global_step": 174304, "epoch": 4150} {"train_loss": -6.9138875007629395, "global_step": 174305, "epoch": 4150} {"train_loss": -6.983379364013672, "global_step": 174306, "epoch": 4150} {"train_loss": -6.9250054359436035, "global_step": 174307, "epoch": 4150} {"train_loss": -7.0353264808654785, "global_step": 174308, "epoch": 4150} {"train_loss": -7.043926239013672, "global_step": 174309, "epoch": 4150} {"train_loss": -6.940311908721924, "global_step": 174310, "epoch": 4150} {"train_loss": -6.927285671234131, "global_step": 174311, "epoch": 4150} {"train_loss": -6.984981536865234, "global_step": 174312, "epoch": 4150} {"train_loss": -7.031803131103516, "global_step": 174313, "epoch": 4150} {"train_loss": -7.026913642883301, "global_step": 174314, "epoch": 4150} {"train_loss": -6.972907543182373, "global_step": 174315, "epoch": 4150} {"train_loss": -6.93699836730957, "global_step": 174316, "epoch": 4150} {"train_loss": -7.000581741333008, "global_step": 174317, "epoch": 4150} {"train_loss": -6.939848899841309, "global_step": 174318, "epoch": 4150} {"train_loss": -6.9544677734375, "global_step": 174319, "epoch": 4150} {"train_loss": -6.962578773498535, "global_step": 174320, "epoch": 4150} {"train_loss": -6.9514007568359375, "global_step": 174321, "epoch": 4150} {"train_loss": -6.911938190460205, "global_step": 174322, "epoch": 4150} {"train_loss": -7.1398115158081055, "global_step": 174323, "epoch": 4150} {"train_loss": -7.026071548461914, "global_step": 174324, "epoch": 4150} {"train_loss": -6.9092698097229, "global_step": 174325, "epoch": 4150} {"train_loss": -7.061280250549316, "global_step": 174326, "epoch": 4150} {"train_loss": -7.053802013397217, "global_step": 174327, "epoch": 4150} {"train_loss": -6.95697021484375, "global_step": 174328, "epoch": 4150} {"train_loss": -7.122343063354492, "global_step": 174329, "epoch": 4150} {"train_loss": -6.932283401489258, "global_step": 174330, "epoch": 4150} {"train_loss": -6.916294097900391, "global_step": 174331, "epoch": 4150} {"train_loss": -7.007204055786133, "global_step": 174332, "epoch": 4150} {"train_loss": -7.030174732208252, "global_step": 174333, "epoch": 4150} {"train_loss": -7.0957746505737305, "global_step": 174334, "epoch": 4150} {"train_loss": -6.922369956970215, "global_step": 174335, "epoch": 4150} {"train_loss": -7.058548450469971, "global_step": 174336, "epoch": 4150} {"train_loss": -7.022660255432129, "global_step": 174337, "epoch": 4150} {"train_loss": -6.959555625915527, "global_step": 174338, "epoch": 4150} {"train_loss": -6.951530456542969, "global_step": 174339, "epoch": 4150} {"train_loss": -7.042027473449707, "global_step": 174340, "epoch": 4150} {"train_loss": -6.979869036447434, "global_step": 174341, "epoch": 4150, "train/sim_max_reward_0": 0.39381593149478705, "train/sim_max_reward_1": 0.9621348151854929, "train/sim_max_reward_2": 0.9902407074122587, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.35225519407375805, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.1524143263740682, "test/sim_max_reward_4400001": 0.2532290339140256, "test/sim_max_reward_4400002": 0.9040658504811084, "test/sim_max_reward_4400003": 0.9777724680699182, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.980559165885449, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.8826273156606318, "test/sim_max_reward_4400008": 0.3066326023304844, "test/sim_max_reward_4400009": 0.8852689630271324, "test/sim_max_reward_4400010": 0.9390262332328939, "test/sim_max_reward_4400011": 0.07516846122527346, "test/sim_max_reward_4400012": 0.9956535928508459, "test/sim_max_reward_4400013": 0.9256263105748417, "test/sim_max_reward_4400014": 0.9524994682682655, "test/sim_max_reward_4400015": 0.8089207373239982, "test/sim_max_reward_4400016": 0.14201010652144724, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2992566678761314, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.22786352513691868, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.27172372167293296, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.010495465562321874, "test/sim_max_reward_4400028": 0.5106573656160024, "test/sim_max_reward_4400029": 0.33476820025938625, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9670292153017556, "test/sim_max_reward_4400034": 0.9385840583485819, "test/sim_max_reward_4400035": 0.4303046244976488, "test/sim_max_reward_4400036": 0.3573546790657209, "test/sim_max_reward_4400037": 0.9628840278226045, "test/sim_max_reward_4400038": 0.9395796072110846, "test/sim_max_reward_4400039": 0.9824706891580922, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9698860784411166, "test/sim_max_reward_4400044": 0.8894103129029561, "test/sim_max_reward_4400045": 0.9660447577526814, "test/sim_max_reward_4400046": 0.3749281553016436, "test/sim_max_reward_4400047": 0.973302353648945, "test/sim_max_reward_4400048": 0.9855688490868331, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.6485719012547474, "test/mean_score": 0.6009405449276791, "val_loss": 68744.6953125} {"train_loss": -7.037781715393066, "global_step": 174342, "epoch": 4151} {"train_loss": -7.125932693481445, "global_step": 174343, "epoch": 4151} {"train_loss": -7.0068278312683105, "global_step": 174344, "epoch": 4151} {"train_loss": -6.99805212020874, "global_step": 174345, "epoch": 4151} {"train_loss": -7.051355361938477, "global_step": 174346, "epoch": 4151} {"train_loss": -7.029442310333252, "global_step": 174347, "epoch": 4151} {"train_loss": -7.065860748291016, "global_step": 174348, "epoch": 4151} {"train_loss": -7.062245845794678, "global_step": 174349, "epoch": 4151} {"train_loss": -7.061590194702148, "global_step": 174350, "epoch": 4151} {"train_loss": -7.026400566101074, "global_step": 174351, "epoch": 4151} {"train_loss": -7.04689884185791, "global_step": 174352, "epoch": 4151} {"train_loss": -7.105913162231445, "global_step": 174353, "epoch": 4151} {"train_loss": -7.0026421546936035, "global_step": 174354, "epoch": 4151} {"train_loss": -7.011292934417725, "global_step": 174355, "epoch": 4151} {"train_loss": -6.874726295471191, "global_step": 174356, "epoch": 4151} {"train_loss": -7.051717281341553, "global_step": 174357, "epoch": 4151} {"train_loss": -7.019867420196533, "global_step": 174358, "epoch": 4151} {"train_loss": -6.985886096954346, "global_step": 174359, "epoch": 4151} {"train_loss": -7.062592029571533, "global_step": 174360, "epoch": 4151} {"train_loss": -7.051006317138672, "global_step": 174361, "epoch": 4151} {"train_loss": -7.078248023986816, "global_step": 174362, "epoch": 4151} {"train_loss": -7.086010456085205, "global_step": 174363, "epoch": 4151} {"train_loss": -7.052521705627441, "global_step": 174364, "epoch": 4151} {"train_loss": -7.020083427429199, "global_step": 174365, "epoch": 4151} {"train_loss": -6.995607852935791, "global_step": 174366, "epoch": 4151} {"train_loss": -6.994899749755859, "global_step": 174367, "epoch": 4151} {"train_loss": -6.997940540313721, "global_step": 174368, "epoch": 4151} {"train_loss": -6.8827338218688965, "global_step": 174369, "epoch": 4151} {"train_loss": -7.070287704467773, "global_step": 174370, "epoch": 4151} {"train_loss": -7.052413463592529, "global_step": 174371, "epoch": 4151} {"train_loss": -7.037935733795166, "global_step": 174372, "epoch": 4151} {"train_loss": -7.089514255523682, "global_step": 174373, "epoch": 4151} {"train_loss": -6.990357398986816, "global_step": 174374, "epoch": 4151} {"train_loss": -7.067540168762207, "global_step": 174375, "epoch": 4151} {"train_loss": -6.93251895904541, "global_step": 174376, "epoch": 4151} {"train_loss": -7.020596504211426, "global_step": 174377, "epoch": 4151} {"train_loss": -7.143538475036621, "global_step": 174378, "epoch": 4151} {"train_loss": -6.843416213989258, "global_step": 174379, "epoch": 4151} {"train_loss": -6.981012344360352, "global_step": 174380, "epoch": 4151} {"train_loss": -7.013659954071045, "global_step": 174381, "epoch": 4151} {"train_loss": -6.977889060974121, "global_step": 174382, "epoch": 4151} {"train_loss": -7.0283712432498024, "global_step": 174383, "epoch": 4151, "val_loss": 68825.6953125} {"train_loss": -6.984550476074219, "global_step": 174384, "epoch": 4152} {"train_loss": -6.8762736320495605, "global_step": 174385, "epoch": 4152} {"train_loss": -6.9942827224731445, "global_step": 174386, "epoch": 4152} {"train_loss": -7.040230751037598, "global_step": 174387, "epoch": 4152} {"train_loss": -7.051292419433594, "global_step": 174388, "epoch": 4152} {"train_loss": -7.022608757019043, "global_step": 174389, "epoch": 4152} {"train_loss": -6.998416900634766, "global_step": 174390, "epoch": 4152} {"train_loss": -7.109829425811768, "global_step": 174391, "epoch": 4152} {"train_loss": -6.974081516265869, "global_step": 174392, "epoch": 4152} {"train_loss": -6.997451305389404, "global_step": 174393, "epoch": 4152} {"train_loss": -7.051422119140625, "global_step": 174394, "epoch": 4152} {"train_loss": -7.145428657531738, "global_step": 174395, "epoch": 4152} {"train_loss": -7.043210029602051, "global_step": 174396, "epoch": 4152} {"train_loss": -7.058391571044922, "global_step": 174397, "epoch": 4152} {"train_loss": -6.997679233551025, "global_step": 174398, "epoch": 4152} {"train_loss": -7.090710639953613, "global_step": 174399, "epoch": 4152} {"train_loss": -7.000669479370117, "global_step": 174400, "epoch": 4152} {"train_loss": -7.024592399597168, "global_step": 174401, "epoch": 4152} {"train_loss": -7.013546943664551, "global_step": 174402, "epoch": 4152} {"train_loss": -6.952564239501953, "global_step": 174403, "epoch": 4152} {"train_loss": -7.0894975662231445, "global_step": 174404, "epoch": 4152} {"train_loss": -7.005617618560791, "global_step": 174405, "epoch": 4152} {"train_loss": -7.047301292419434, "global_step": 174406, "epoch": 4152} {"train_loss": -7.084753513336182, "global_step": 174407, "epoch": 4152} {"train_loss": -7.13787841796875, "global_step": 174408, "epoch": 4152} {"train_loss": -6.946596622467041, "global_step": 174409, "epoch": 4152} {"train_loss": -7.070464611053467, "global_step": 174410, "epoch": 4152} {"train_loss": -6.966281414031982, "global_step": 174411, "epoch": 4152} {"train_loss": -6.900771141052246, "global_step": 174412, "epoch": 4152} {"train_loss": -7.005720138549805, "global_step": 174413, "epoch": 4152} {"train_loss": -7.0189409255981445, "global_step": 174414, "epoch": 4152} {"train_loss": -7.019796848297119, "global_step": 174415, "epoch": 4152} {"train_loss": -6.935818672180176, "global_step": 174416, "epoch": 4152} {"train_loss": -6.989589214324951, "global_step": 174417, "epoch": 4152} {"train_loss": -6.903650283813477, "global_step": 174418, "epoch": 4152} {"train_loss": -7.045675277709961, "global_step": 174419, "epoch": 4152} {"train_loss": -7.023499488830566, "global_step": 174420, "epoch": 4152} {"train_loss": -6.95243501663208, "global_step": 174421, "epoch": 4152} {"train_loss": -6.927173614501953, "global_step": 174422, "epoch": 4152} {"train_loss": -7.056722640991211, "global_step": 174423, "epoch": 4152} {"train_loss": -6.82611608505249, "global_step": 174424, "epoch": 4152} {"train_loss": -7.010424875077748, "global_step": 174425, "epoch": 4152, "val_loss": 68654.078125} {"train_loss": -7.087457656860352, "global_step": 174426, "epoch": 4153} {"train_loss": -6.960253715515137, "global_step": 174427, "epoch": 4153} {"train_loss": -7.08035945892334, "global_step": 174428, "epoch": 4153} {"train_loss": -7.0396623611450195, "global_step": 174429, "epoch": 4153} {"train_loss": -6.930135250091553, "global_step": 174430, "epoch": 4153} {"train_loss": -7.021920680999756, "global_step": 174431, "epoch": 4153} {"train_loss": -7.1075439453125, "global_step": 174432, "epoch": 4153} {"train_loss": -7.00672721862793, "global_step": 174433, "epoch": 4153} {"train_loss": -7.0957512855529785, "global_step": 174434, "epoch": 4153} {"train_loss": -7.078913688659668, "global_step": 174435, "epoch": 4153} {"train_loss": -7.0611982345581055, "global_step": 174436, "epoch": 4153} {"train_loss": -7.044683456420898, "global_step": 174437, "epoch": 4153} {"train_loss": -7.009471893310547, "global_step": 174438, "epoch": 4153} {"train_loss": -7.121762275695801, "global_step": 174439, "epoch": 4153} {"train_loss": -7.051547050476074, "global_step": 174440, "epoch": 4153} {"train_loss": -7.1782612800598145, "global_step": 174441, "epoch": 4153} {"train_loss": -7.078893184661865, "global_step": 174442, "epoch": 4153} {"train_loss": -7.044729232788086, "global_step": 174443, "epoch": 4153} {"train_loss": -7.210188865661621, "global_step": 174444, "epoch": 4153} {"train_loss": -7.185378074645996, "global_step": 174445, "epoch": 4153} {"train_loss": -7.045047283172607, "global_step": 174446, "epoch": 4153} {"train_loss": -7.116159439086914, "global_step": 174447, "epoch": 4153} {"train_loss": -7.097232818603516, "global_step": 174448, "epoch": 4153} {"train_loss": -6.998934268951416, "global_step": 174449, "epoch": 4153} {"train_loss": -7.060608863830566, "global_step": 174450, "epoch": 4153} {"train_loss": -6.921099662780762, "global_step": 174451, "epoch": 4153} {"train_loss": -6.942787170410156, "global_step": 174452, "epoch": 4153} {"train_loss": -6.966363906860352, "global_step": 174453, "epoch": 4153} {"train_loss": -6.985476493835449, "global_step": 174454, "epoch": 4153} {"train_loss": -7.062219619750977, "global_step": 174455, "epoch": 4153} {"train_loss": -6.924440383911133, "global_step": 174456, "epoch": 4153} {"train_loss": -7.046552658081055, "global_step": 174457, "epoch": 4153} {"train_loss": -7.048655986785889, "global_step": 174458, "epoch": 4153} {"train_loss": -6.789709568023682, "global_step": 174459, "epoch": 4153} {"train_loss": -6.917416572570801, "global_step": 174460, "epoch": 4153} {"train_loss": -6.991493225097656, "global_step": 174461, "epoch": 4153} {"train_loss": -6.8672871589660645, "global_step": 174462, "epoch": 4153} {"train_loss": -7.025217056274414, "global_step": 174463, "epoch": 4153} {"train_loss": -6.953283309936523, "global_step": 174464, "epoch": 4153} {"train_loss": -6.829098701477051, "global_step": 174465, "epoch": 4153} {"train_loss": -6.926671504974365, "global_step": 174466, "epoch": 4153} {"train_loss": -7.019896995453608, "global_step": 174467, "epoch": 4153, "val_loss": 68581.6953125} {"train_loss": -7.063214302062988, "global_step": 174468, "epoch": 4154} {"train_loss": -6.940005302429199, "global_step": 174469, "epoch": 4154} {"train_loss": -7.110891342163086, "global_step": 174470, "epoch": 4154} {"train_loss": -7.060493469238281, "global_step": 174471, "epoch": 4154} {"train_loss": -6.982810974121094, "global_step": 174472, "epoch": 4154} {"train_loss": -7.0051350593566895, "global_step": 174473, "epoch": 4154} {"train_loss": -6.958761215209961, "global_step": 174474, "epoch": 4154} {"train_loss": -6.919490814208984, "global_step": 174475, "epoch": 4154} {"train_loss": -7.07224178314209, "global_step": 174476, "epoch": 4154} {"train_loss": -6.920262813568115, "global_step": 174477, "epoch": 4154} {"train_loss": -7.074944496154785, "global_step": 174478, "epoch": 4154} {"train_loss": -7.007721900939941, "global_step": 174479, "epoch": 4154} {"train_loss": -6.962429523468018, "global_step": 174480, "epoch": 4154} {"train_loss": -6.906572341918945, "global_step": 174481, "epoch": 4154} {"train_loss": -6.932650566101074, "global_step": 174482, "epoch": 4154} {"train_loss": -6.823709487915039, "global_step": 174483, "epoch": 4154} {"train_loss": -6.941219329833984, "global_step": 174484, "epoch": 4154} {"train_loss": -7.004101753234863, "global_step": 174485, "epoch": 4154} {"train_loss": -6.950263977050781, "global_step": 174486, "epoch": 4154} {"train_loss": -7.006446361541748, "global_step": 174487, "epoch": 4154} {"train_loss": -6.861205577850342, "global_step": 174488, "epoch": 4154} {"train_loss": -6.835033416748047, "global_step": 174489, "epoch": 4154} {"train_loss": -6.919323921203613, "global_step": 174490, "epoch": 4154} {"train_loss": -6.912381172180176, "global_step": 174491, "epoch": 4154} {"train_loss": -6.956358432769775, "global_step": 174492, "epoch": 4154} {"train_loss": -7.037468910217285, "global_step": 174493, "epoch": 4154} {"train_loss": -6.908762454986572, "global_step": 174494, "epoch": 4154} {"train_loss": -7.006292343139648, "global_step": 174495, "epoch": 4154} {"train_loss": -6.963367462158203, "global_step": 174496, "epoch": 4154} {"train_loss": -7.072735786437988, "global_step": 174497, "epoch": 4154} {"train_loss": -7.056545257568359, "global_step": 174498, "epoch": 4154} {"train_loss": -7.071544647216797, "global_step": 174499, "epoch": 4154} {"train_loss": -7.077352523803711, "global_step": 174500, "epoch": 4154} {"train_loss": -7.031235694885254, "global_step": 174501, "epoch": 4154} {"train_loss": -7.074202537536621, "global_step": 174502, "epoch": 4154} {"train_loss": -7.01584529876709, "global_step": 174503, "epoch": 4154} {"train_loss": -7.0136308670043945, "global_step": 174504, "epoch": 4154} {"train_loss": -7.028528213500977, "global_step": 174505, "epoch": 4154} {"train_loss": -6.992959022521973, "global_step": 174506, "epoch": 4154} {"train_loss": -7.048321723937988, "global_step": 174507, "epoch": 4154} {"train_loss": -7.110955715179443, "global_step": 174508, "epoch": 4154} {"train_loss": -6.992902131307693, "global_step": 174509, "epoch": 4154, "val_loss": 68461.734375} {"train_loss": -7.105804443359375, "global_step": 174510, "epoch": 4155} {"train_loss": -7.050420761108398, "global_step": 174511, "epoch": 4155} {"train_loss": -7.126352787017822, "global_step": 174512, "epoch": 4155} {"train_loss": -7.14774227142334, "global_step": 174513, "epoch": 4155} {"train_loss": -7.184576034545898, "global_step": 174514, "epoch": 4155} {"train_loss": -7.013906478881836, "global_step": 174515, "epoch": 4155} {"train_loss": -7.166891098022461, "global_step": 174516, "epoch": 4155} {"train_loss": -6.999241828918457, "global_step": 174517, "epoch": 4155} {"train_loss": -7.1870198249816895, "global_step": 174518, "epoch": 4155} {"train_loss": -6.996275901794434, "global_step": 174519, "epoch": 4155} {"train_loss": -7.172201156616211, "global_step": 174520, "epoch": 4155} {"train_loss": -7.004975318908691, "global_step": 174521, "epoch": 4155} {"train_loss": -7.122491836547852, "global_step": 174522, "epoch": 4155} {"train_loss": -7.070475101470947, "global_step": 174523, "epoch": 4155} {"train_loss": -7.138554573059082, "global_step": 174524, "epoch": 4155} {"train_loss": -7.085100173950195, "global_step": 174525, "epoch": 4155} {"train_loss": -6.997841835021973, "global_step": 174526, "epoch": 4155} {"train_loss": -6.980888843536377, "global_step": 174527, "epoch": 4155} {"train_loss": -6.981823921203613, "global_step": 174528, "epoch": 4155} {"train_loss": -6.954564094543457, "global_step": 174529, "epoch": 4155} {"train_loss": -6.955260276794434, "global_step": 174530, "epoch": 4155} {"train_loss": -6.955807685852051, "global_step": 174531, "epoch": 4155} {"train_loss": -7.038975715637207, "global_step": 174532, "epoch": 4155} {"train_loss": -7.033512115478516, "global_step": 174533, "epoch": 4155} {"train_loss": -7.019147872924805, "global_step": 174534, "epoch": 4155} {"train_loss": -6.812460899353027, "global_step": 174535, "epoch": 4155} {"train_loss": -7.0549774169921875, "global_step": 174536, "epoch": 4155} {"train_loss": -7.053699493408203, "global_step": 174537, "epoch": 4155} {"train_loss": -6.990993499755859, "global_step": 174538, "epoch": 4155} {"train_loss": -7.105299949645996, "global_step": 174539, "epoch": 4155} {"train_loss": -7.0095672607421875, "global_step": 174540, "epoch": 4155} {"train_loss": -7.018075942993164, "global_step": 174541, "epoch": 4155} {"train_loss": -7.055535793304443, "global_step": 174542, "epoch": 4155} {"train_loss": -6.992356300354004, "global_step": 174543, "epoch": 4155} {"train_loss": -7.063270568847656, "global_step": 174544, "epoch": 4155} {"train_loss": -7.064347267150879, "global_step": 174545, "epoch": 4155} {"train_loss": -7.170576572418213, "global_step": 174546, "epoch": 4155} {"train_loss": -7.150151252746582, "global_step": 174547, "epoch": 4155} {"train_loss": -7.053701400756836, "global_step": 174548, "epoch": 4155} {"train_loss": -7.14381217956543, "global_step": 174549, "epoch": 4155} {"train_loss": -7.128652572631836, "global_step": 174550, "epoch": 4155} {"train_loss": -7.05691073054359, "global_step": 174551, "epoch": 4155, "val_loss": 68591.28125} {"train_loss": -7.1423749923706055, "global_step": 174552, "epoch": 4156} {"train_loss": -7.104233741760254, "global_step": 174553, "epoch": 4156} {"train_loss": -7.112484455108643, "global_step": 174554, "epoch": 4156} {"train_loss": -7.093225479125977, "global_step": 174555, "epoch": 4156} {"train_loss": -7.093493938446045, "global_step": 174556, "epoch": 4156} {"train_loss": -7.062081336975098, "global_step": 174557, "epoch": 4156} {"train_loss": -7.07490348815918, "global_step": 174558, "epoch": 4156} {"train_loss": -7.028337001800537, "global_step": 174559, "epoch": 4156} {"train_loss": -7.044983386993408, "global_step": 174560, "epoch": 4156} {"train_loss": -6.955048084259033, "global_step": 174561, "epoch": 4156} {"train_loss": -7.173081398010254, "global_step": 174562, "epoch": 4156} {"train_loss": -7.080122947692871, "global_step": 174563, "epoch": 4156} {"train_loss": -7.024385929107666, "global_step": 174564, "epoch": 4156} {"train_loss": -6.9672441482543945, "global_step": 174565, "epoch": 4156} {"train_loss": -6.990206718444824, "global_step": 174566, "epoch": 4156} {"train_loss": -7.043671607971191, "global_step": 174567, "epoch": 4156} {"train_loss": -7.138415336608887, "global_step": 174568, "epoch": 4156} {"train_loss": -7.044454574584961, "global_step": 174569, "epoch": 4156} {"train_loss": -7.090238571166992, "global_step": 174570, "epoch": 4156} {"train_loss": -7.008295059204102, "global_step": 174571, "epoch": 4156} {"train_loss": -7.15709924697876, "global_step": 174572, "epoch": 4156} {"train_loss": -7.057651519775391, "global_step": 174573, "epoch": 4156} {"train_loss": -7.001556873321533, "global_step": 174574, "epoch": 4156} {"train_loss": -6.937713146209717, "global_step": 174575, "epoch": 4156} {"train_loss": -6.989679336547852, "global_step": 174576, "epoch": 4156} {"train_loss": -6.8832550048828125, "global_step": 174577, "epoch": 4156} {"train_loss": -6.949008464813232, "global_step": 174578, "epoch": 4156} {"train_loss": -7.0709428787231445, "global_step": 174579, "epoch": 4156} {"train_loss": -6.821403503417969, "global_step": 174580, "epoch": 4156} {"train_loss": -7.004715919494629, "global_step": 174581, "epoch": 4156} {"train_loss": -6.91140604019165, "global_step": 174582, "epoch": 4156} {"train_loss": -7.0033488273620605, "global_step": 174583, "epoch": 4156} {"train_loss": -6.96215295791626, "global_step": 174584, "epoch": 4156} {"train_loss": -6.849658966064453, "global_step": 174585, "epoch": 4156} {"train_loss": -7.011044979095459, "global_step": 174586, "epoch": 4156} {"train_loss": -6.958750247955322, "global_step": 174587, "epoch": 4156} {"train_loss": -6.870030403137207, "global_step": 174588, "epoch": 4156} {"train_loss": -6.894543647766113, "global_step": 174589, "epoch": 4156} {"train_loss": -6.987906455993652, "global_step": 174590, "epoch": 4156} {"train_loss": -6.8958611488342285, "global_step": 174591, "epoch": 4156} {"train_loss": -6.99150276184082, "global_step": 174592, "epoch": 4156} {"train_loss": -7.0112100555783226, "global_step": 174593, "epoch": 4156, "val_loss": 68734.2109375} {"train_loss": -6.985957145690918, "global_step": 174594, "epoch": 4157} {"train_loss": -6.856869220733643, "global_step": 174595, "epoch": 4157} {"train_loss": -6.968560695648193, "global_step": 174596, "epoch": 4157} {"train_loss": -7.096030235290527, "global_step": 174597, "epoch": 4157} {"train_loss": -6.94994592666626, "global_step": 174598, "epoch": 4157} {"train_loss": -6.968406677246094, "global_step": 174599, "epoch": 4157} {"train_loss": -6.9444732666015625, "global_step": 174600, "epoch": 4157} {"train_loss": -6.941616058349609, "global_step": 174601, "epoch": 4157} {"train_loss": -6.989346504211426, "global_step": 174602, "epoch": 4157} {"train_loss": -6.928180694580078, "global_step": 174603, "epoch": 4157} {"train_loss": -7.1222825050354, "global_step": 174604, "epoch": 4157} {"train_loss": -6.944758415222168, "global_step": 174605, "epoch": 4157} {"train_loss": -6.944869518280029, "global_step": 174606, "epoch": 4157} {"train_loss": -7.055331230163574, "global_step": 174607, "epoch": 4157} {"train_loss": -6.951798439025879, "global_step": 174608, "epoch": 4157} {"train_loss": -7.032492637634277, "global_step": 174609, "epoch": 4157} {"train_loss": -7.032559394836426, "global_step": 174610, "epoch": 4157} {"train_loss": -6.932485580444336, "global_step": 174611, "epoch": 4157} {"train_loss": -7.072426795959473, "global_step": 174612, "epoch": 4157} {"train_loss": -7.063358306884766, "global_step": 174613, "epoch": 4157} {"train_loss": -7.003651142120361, "global_step": 174614, "epoch": 4157} {"train_loss": -7.100082874298096, "global_step": 174615, "epoch": 4157} {"train_loss": -7.091677665710449, "global_step": 174616, "epoch": 4157} {"train_loss": -7.051606178283691, "global_step": 174617, "epoch": 4157} {"train_loss": -7.141849517822266, "global_step": 174618, "epoch": 4157} {"train_loss": -7.01782751083374, "global_step": 174619, "epoch": 4157} {"train_loss": -7.028414726257324, "global_step": 174620, "epoch": 4157} {"train_loss": -6.976231098175049, "global_step": 174621, "epoch": 4157} {"train_loss": -7.064508438110352, "global_step": 174622, "epoch": 4157} {"train_loss": -7.128898620605469, "global_step": 174623, "epoch": 4157} {"train_loss": -7.0928635597229, "global_step": 174624, "epoch": 4157} {"train_loss": -7.1281585693359375, "global_step": 174625, "epoch": 4157} {"train_loss": -6.964865684509277, "global_step": 174626, "epoch": 4157} {"train_loss": -6.977755546569824, "global_step": 174627, "epoch": 4157} {"train_loss": -7.039745330810547, "global_step": 174628, "epoch": 4157} {"train_loss": -7.0061140060424805, "global_step": 174629, "epoch": 4157} {"train_loss": -7.117417812347412, "global_step": 174630, "epoch": 4157} {"train_loss": -7.026494979858398, "global_step": 174631, "epoch": 4157} {"train_loss": -7.066900253295898, "global_step": 174632, "epoch": 4157} {"train_loss": -7.008996963500977, "global_step": 174633, "epoch": 4157} {"train_loss": -6.873673915863037, "global_step": 174634, "epoch": 4157} {"train_loss": -7.017640000297909, "global_step": 174635, "epoch": 4157, "val_loss": 68734.1875} {"train_loss": -6.914876937866211, "global_step": 174636, "epoch": 4158} {"train_loss": -7.04817008972168, "global_step": 174637, "epoch": 4158} {"train_loss": -6.792143821716309, "global_step": 174638, "epoch": 4158} {"train_loss": -6.870338439941406, "global_step": 174639, "epoch": 4158} {"train_loss": -6.991182804107666, "global_step": 174640, "epoch": 4158} {"train_loss": -6.965127944946289, "global_step": 174641, "epoch": 4158} {"train_loss": -6.996615886688232, "global_step": 174642, "epoch": 4158} {"train_loss": -6.913727760314941, "global_step": 174643, "epoch": 4158} {"train_loss": -6.98328971862793, "global_step": 174644, "epoch": 4158} {"train_loss": -6.9614973068237305, "global_step": 174645, "epoch": 4158} {"train_loss": -7.045971393585205, "global_step": 174646, "epoch": 4158} {"train_loss": -6.899007797241211, "global_step": 174647, "epoch": 4158} {"train_loss": -7.027924537658691, "global_step": 174648, "epoch": 4158} {"train_loss": -6.919803619384766, "global_step": 174649, "epoch": 4158} {"train_loss": -7.0720319747924805, "global_step": 174650, "epoch": 4158} {"train_loss": -7.08643102645874, "global_step": 174651, "epoch": 4158} {"train_loss": -6.932518005371094, "global_step": 174652, "epoch": 4158} {"train_loss": -6.958373069763184, "global_step": 174653, "epoch": 4158} {"train_loss": -7.0110578536987305, "global_step": 174654, "epoch": 4158} {"train_loss": -6.953308582305908, "global_step": 174655, "epoch": 4158} {"train_loss": -6.989328384399414, "global_step": 174656, "epoch": 4158} {"train_loss": -6.860476493835449, "global_step": 174657, "epoch": 4158} {"train_loss": -6.945352554321289, "global_step": 174658, "epoch": 4158} {"train_loss": -7.133846282958984, "global_step": 174659, "epoch": 4158} {"train_loss": -6.900789260864258, "global_step": 174660, "epoch": 4158} {"train_loss": -6.995292663574219, "global_step": 174661, "epoch": 4158} {"train_loss": -7.0113115310668945, "global_step": 174662, "epoch": 4158} {"train_loss": -7.0809736251831055, "global_step": 174663, "epoch": 4158} {"train_loss": -7.101894378662109, "global_step": 174664, "epoch": 4158} {"train_loss": -6.9619221687316895, "global_step": 174665, "epoch": 4158} {"train_loss": -7.089297771453857, "global_step": 174666, "epoch": 4158} {"train_loss": -7.085768222808838, "global_step": 174667, "epoch": 4158} {"train_loss": -7.084256172180176, "global_step": 174668, "epoch": 4158} {"train_loss": -6.9915313720703125, "global_step": 174669, "epoch": 4158} {"train_loss": -7.066379547119141, "global_step": 174670, "epoch": 4158} {"train_loss": -7.046098709106445, "global_step": 174671, "epoch": 4158} {"train_loss": -7.037971496582031, "global_step": 174672, "epoch": 4158} {"train_loss": -7.08317232131958, "global_step": 174673, "epoch": 4158} {"train_loss": -7.1497015953063965, "global_step": 174674, "epoch": 4158} {"train_loss": -7.0830078125, "global_step": 174675, "epoch": 4158} {"train_loss": -7.054757118225098, "global_step": 174676, "epoch": 4158} {"train_loss": -7.003452085313343, "global_step": 174677, "epoch": 4158, "val_loss": 68619.9375} {"train_loss": -7.0425543785095215, "global_step": 174678, "epoch": 4159} {"train_loss": -7.087175369262695, "global_step": 174679, "epoch": 4159} {"train_loss": -6.9579877853393555, "global_step": 174680, "epoch": 4159} {"train_loss": -7.065258026123047, "global_step": 174681, "epoch": 4159} {"train_loss": -7.02288818359375, "global_step": 174682, "epoch": 4159} {"train_loss": -7.026405334472656, "global_step": 174683, "epoch": 4159} {"train_loss": -7.003070831298828, "global_step": 174684, "epoch": 4159} {"train_loss": -7.096245765686035, "global_step": 174685, "epoch": 4159} {"train_loss": -7.12038516998291, "global_step": 174686, "epoch": 4159} {"train_loss": -7.117217063903809, "global_step": 174687, "epoch": 4159} {"train_loss": -7.108191967010498, "global_step": 174688, "epoch": 4159} {"train_loss": -7.067859172821045, "global_step": 174689, "epoch": 4159} {"train_loss": -7.014581680297852, "global_step": 174690, "epoch": 4159} {"train_loss": -7.227063179016113, "global_step": 174691, "epoch": 4159} {"train_loss": -7.031345367431641, "global_step": 174692, "epoch": 4159} {"train_loss": -7.106462478637695, "global_step": 174693, "epoch": 4159} {"train_loss": -7.010483741760254, "global_step": 174694, "epoch": 4159} {"train_loss": -7.003188133239746, "global_step": 174695, "epoch": 4159} {"train_loss": -7.100152492523193, "global_step": 174696, "epoch": 4159} {"train_loss": -7.003927707672119, "global_step": 174697, "epoch": 4159} {"train_loss": -6.9726715087890625, "global_step": 174698, "epoch": 4159} {"train_loss": -7.1470136642456055, "global_step": 174699, "epoch": 4159} {"train_loss": -6.984007835388184, "global_step": 174700, "epoch": 4159} {"train_loss": -7.033388137817383, "global_step": 174701, "epoch": 4159} {"train_loss": -7.025964736938477, "global_step": 174702, "epoch": 4159} {"train_loss": -7.120502471923828, "global_step": 174703, "epoch": 4159} {"train_loss": -7.054383277893066, "global_step": 174704, "epoch": 4159} {"train_loss": -7.071820259094238, "global_step": 174705, "epoch": 4159} {"train_loss": -7.120706558227539, "global_step": 174706, "epoch": 4159} {"train_loss": -7.136818885803223, "global_step": 174707, "epoch": 4159} {"train_loss": -7.058547019958496, "global_step": 174708, "epoch": 4159} {"train_loss": -7.019474029541016, "global_step": 174709, "epoch": 4159} {"train_loss": -7.010275363922119, "global_step": 174710, "epoch": 4159} {"train_loss": -6.969592094421387, "global_step": 174711, "epoch": 4159} {"train_loss": -7.070608139038086, "global_step": 174712, "epoch": 4159} {"train_loss": -6.9963555335998535, "global_step": 174713, "epoch": 4159} {"train_loss": -7.06803035736084, "global_step": 174714, "epoch": 4159} {"train_loss": -6.951353549957275, "global_step": 174715, "epoch": 4159} {"train_loss": -7.0062255859375, "global_step": 174716, "epoch": 4159} {"train_loss": -7.080391883850098, "global_step": 174717, "epoch": 4159} {"train_loss": -7.119722366333008, "global_step": 174718, "epoch": 4159} {"train_loss": -7.056017966497512, "global_step": 174719, "epoch": 4159, "val_loss": 68676.390625} {"train_loss": -7.1100239753723145, "global_step": 174720, "epoch": 4160} {"train_loss": -7.006690502166748, "global_step": 174721, "epoch": 4160} {"train_loss": -7.013010501861572, "global_step": 174722, "epoch": 4160} {"train_loss": -7.036611080169678, "global_step": 174723, "epoch": 4160} {"train_loss": -7.017422676086426, "global_step": 174724, "epoch": 4160} {"train_loss": -6.9839630126953125, "global_step": 174725, "epoch": 4160} {"train_loss": -7.085053443908691, "global_step": 174726, "epoch": 4160} {"train_loss": -7.032382965087891, "global_step": 174727, "epoch": 4160} {"train_loss": -6.896431922912598, "global_step": 174728, "epoch": 4160} {"train_loss": -7.078118801116943, "global_step": 174729, "epoch": 4160} {"train_loss": -7.028278350830078, "global_step": 174730, "epoch": 4160} {"train_loss": -7.012550354003906, "global_step": 174731, "epoch": 4160} {"train_loss": -7.075394630432129, "global_step": 174732, "epoch": 4160} {"train_loss": -7.063953876495361, "global_step": 174733, "epoch": 4160} {"train_loss": -7.030791282653809, "global_step": 174734, "epoch": 4160} {"train_loss": -6.977750778198242, "global_step": 174735, "epoch": 4160} {"train_loss": -7.005458354949951, "global_step": 174736, "epoch": 4160} {"train_loss": -7.008559226989746, "global_step": 174737, "epoch": 4160} {"train_loss": -7.186861991882324, "global_step": 174738, "epoch": 4160} {"train_loss": -6.972876071929932, "global_step": 174739, "epoch": 4160} {"train_loss": -6.977729797363281, "global_step": 174740, "epoch": 4160} {"train_loss": -7.051235675811768, "global_step": 174741, "epoch": 4160} {"train_loss": -6.963744163513184, "global_step": 174742, "epoch": 4160} {"train_loss": -6.972525596618652, "global_step": 174743, "epoch": 4160} {"train_loss": -7.045866966247559, "global_step": 174744, "epoch": 4160} {"train_loss": -7.009417533874512, "global_step": 174745, "epoch": 4160} {"train_loss": -7.054920673370361, "global_step": 174746, "epoch": 4160} {"train_loss": -7.026928901672363, "global_step": 174747, "epoch": 4160} {"train_loss": -6.963644027709961, "global_step": 174748, "epoch": 4160} {"train_loss": -6.945950984954834, "global_step": 174749, "epoch": 4160} {"train_loss": -6.997762680053711, "global_step": 174750, "epoch": 4160} {"train_loss": -6.900444030761719, "global_step": 174751, "epoch": 4160} {"train_loss": -6.878787517547607, "global_step": 174752, "epoch": 4160} {"train_loss": -6.9590606689453125, "global_step": 174753, "epoch": 4160} {"train_loss": -6.975408554077148, "global_step": 174754, "epoch": 4160} {"train_loss": -6.872069358825684, "global_step": 174755, "epoch": 4160} {"train_loss": -6.983560562133789, "global_step": 174756, "epoch": 4160} {"train_loss": -7.122624397277832, "global_step": 174757, "epoch": 4160} {"train_loss": -7.01010799407959, "global_step": 174758, "epoch": 4160} {"train_loss": -7.117911338806152, "global_step": 174759, "epoch": 4160} {"train_loss": -7.081351280212402, "global_step": 174760, "epoch": 4160} {"train_loss": -7.012174708502633, "global_step": 174761, "epoch": 4160, "val_loss": 68831.078125} {"train_loss": -7.040263652801514, "global_step": 174762, "epoch": 4161} {"train_loss": -6.931418418884277, "global_step": 174763, "epoch": 4161} {"train_loss": -6.934110641479492, "global_step": 174764, "epoch": 4161} {"train_loss": -6.974037170410156, "global_step": 174765, "epoch": 4161} {"train_loss": -6.959453582763672, "global_step": 174766, "epoch": 4161} {"train_loss": -7.054686069488525, "global_step": 174767, "epoch": 4161} {"train_loss": -7.08259391784668, "global_step": 174768, "epoch": 4161} {"train_loss": -6.918508529663086, "global_step": 174769, "epoch": 4161} {"train_loss": -6.965687274932861, "global_step": 174770, "epoch": 4161} {"train_loss": -7.033291816711426, "global_step": 174771, "epoch": 4161} {"train_loss": -7.057424068450928, "global_step": 174772, "epoch": 4161} {"train_loss": -7.0790605545043945, "global_step": 174773, "epoch": 4161} {"train_loss": -7.042913436889648, "global_step": 174774, "epoch": 4161} {"train_loss": -7.106788158416748, "global_step": 174775, "epoch": 4161} {"train_loss": -7.049726486206055, "global_step": 174776, "epoch": 4161} {"train_loss": -7.010764122009277, "global_step": 174777, "epoch": 4161} {"train_loss": -7.192713260650635, "global_step": 174778, "epoch": 4161} {"train_loss": -7.064283847808838, "global_step": 174779, "epoch": 4161} {"train_loss": -7.0963850021362305, "global_step": 174780, "epoch": 4161} {"train_loss": -7.122108459472656, "global_step": 174781, "epoch": 4161} {"train_loss": -7.06467342376709, "global_step": 174782, "epoch": 4161} {"train_loss": -7.083654403686523, "global_step": 174783, "epoch": 4161} {"train_loss": -7.069327354431152, "global_step": 174784, "epoch": 4161} {"train_loss": -7.106300354003906, "global_step": 174785, "epoch": 4161} {"train_loss": -7.009300231933594, "global_step": 174786, "epoch": 4161} {"train_loss": -7.0399675369262695, "global_step": 174787, "epoch": 4161} {"train_loss": -7.027129173278809, "global_step": 174788, "epoch": 4161} {"train_loss": -6.978697776794434, "global_step": 174789, "epoch": 4161} {"train_loss": -7.127927780151367, "global_step": 174790, "epoch": 4161} {"train_loss": -7.086509704589844, "global_step": 174791, "epoch": 4161} {"train_loss": -7.001330375671387, "global_step": 174792, "epoch": 4161} {"train_loss": -6.95029354095459, "global_step": 174793, "epoch": 4161} {"train_loss": -7.11216402053833, "global_step": 174794, "epoch": 4161} {"train_loss": -6.950743198394775, "global_step": 174795, "epoch": 4161} {"train_loss": -7.012544631958008, "global_step": 174796, "epoch": 4161} {"train_loss": -6.877505779266357, "global_step": 174797, "epoch": 4161} {"train_loss": -7.052688121795654, "global_step": 174798, "epoch": 4161} {"train_loss": -6.858825206756592, "global_step": 174799, "epoch": 4161} {"train_loss": -6.775022506713867, "global_step": 174800, "epoch": 4161} {"train_loss": -7.022650718688965, "global_step": 174801, "epoch": 4161} {"train_loss": -6.878542900085449, "global_step": 174802, "epoch": 4161} {"train_loss": -7.019147850218273, "global_step": 174803, "epoch": 4161, "val_loss": 68743.359375} {"train_loss": -7.014368057250977, "global_step": 174804, "epoch": 4162} {"train_loss": -6.886484146118164, "global_step": 174805, "epoch": 4162} {"train_loss": -6.879327774047852, "global_step": 174806, "epoch": 4162} {"train_loss": -6.923285484313965, "global_step": 174807, "epoch": 4162} {"train_loss": -6.918292045593262, "global_step": 174808, "epoch": 4162} {"train_loss": -6.840386390686035, "global_step": 174809, "epoch": 4162} {"train_loss": -6.945679664611816, "global_step": 174810, "epoch": 4162} {"train_loss": -6.9547953605651855, "global_step": 174811, "epoch": 4162} {"train_loss": -6.949090957641602, "global_step": 174812, "epoch": 4162} {"train_loss": -6.980360507965088, "global_step": 174813, "epoch": 4162} {"train_loss": -6.903422832489014, "global_step": 174814, "epoch": 4162} {"train_loss": -6.951233863830566, "global_step": 174815, "epoch": 4162} {"train_loss": -6.863445281982422, "global_step": 174816, "epoch": 4162} {"train_loss": -6.8874101638793945, "global_step": 174817, "epoch": 4162} {"train_loss": -7.057857036590576, "global_step": 174818, "epoch": 4162} {"train_loss": -6.938686370849609, "global_step": 174819, "epoch": 4162} {"train_loss": -7.041938781738281, "global_step": 174820, "epoch": 4162} {"train_loss": -7.0007476806640625, "global_step": 174821, "epoch": 4162} {"train_loss": -7.014881610870361, "global_step": 174822, "epoch": 4162} {"train_loss": -7.003274440765381, "global_step": 174823, "epoch": 4162} {"train_loss": -6.938390254974365, "global_step": 174824, "epoch": 4162} {"train_loss": -6.900788307189941, "global_step": 174825, "epoch": 4162} {"train_loss": -6.899859428405762, "global_step": 174826, "epoch": 4162} {"train_loss": -6.9804463386535645, "global_step": 174827, "epoch": 4162} {"train_loss": -7.06928825378418, "global_step": 174828, "epoch": 4162} {"train_loss": -6.986858367919922, "global_step": 174829, "epoch": 4162} {"train_loss": -7.007423400878906, "global_step": 174830, "epoch": 4162} {"train_loss": -6.999605178833008, "global_step": 174831, "epoch": 4162} {"train_loss": -7.0836873054504395, "global_step": 174832, "epoch": 4162} {"train_loss": -6.940065383911133, "global_step": 174833, "epoch": 4162} {"train_loss": -7.073345184326172, "global_step": 174834, "epoch": 4162} {"train_loss": -7.018275737762451, "global_step": 174835, "epoch": 4162} {"train_loss": -7.092175006866455, "global_step": 174836, "epoch": 4162} {"train_loss": -7.018677711486816, "global_step": 174837, "epoch": 4162} {"train_loss": -6.956431865692139, "global_step": 174838, "epoch": 4162} {"train_loss": -7.06389856338501, "global_step": 174839, "epoch": 4162} {"train_loss": -7.0450334548950195, "global_step": 174840, "epoch": 4162} {"train_loss": -7.158451557159424, "global_step": 174841, "epoch": 4162} {"train_loss": -7.111851215362549, "global_step": 174842, "epoch": 4162} {"train_loss": -7.044548988342285, "global_step": 174843, "epoch": 4162} {"train_loss": -7.066834449768066, "global_step": 174844, "epoch": 4162} {"train_loss": -6.988269658315749, "global_step": 174845, "epoch": 4162, "val_loss": 68504.0234375} {"train_loss": -7.04632043838501, "global_step": 174846, "epoch": 4163} {"train_loss": -7.075399398803711, "global_step": 174847, "epoch": 4163} {"train_loss": -7.1192474365234375, "global_step": 174848, "epoch": 4163} {"train_loss": -7.133942604064941, "global_step": 174849, "epoch": 4163} {"train_loss": -7.072649955749512, "global_step": 174850, "epoch": 4163} {"train_loss": -7.007519245147705, "global_step": 174851, "epoch": 4163} {"train_loss": -7.121391296386719, "global_step": 174852, "epoch": 4163} {"train_loss": -7.042006492614746, "global_step": 174853, "epoch": 4163} {"train_loss": -7.113178253173828, "global_step": 174854, "epoch": 4163} {"train_loss": -6.967453956604004, "global_step": 174855, "epoch": 4163} {"train_loss": -7.092155933380127, "global_step": 174856, "epoch": 4163} {"train_loss": -7.025927543640137, "global_step": 174857, "epoch": 4163} {"train_loss": -6.908137321472168, "global_step": 174858, "epoch": 4163} {"train_loss": -7.065550804138184, "global_step": 174859, "epoch": 4163} {"train_loss": -7.050953388214111, "global_step": 174860, "epoch": 4163} {"train_loss": -7.060285568237305, "global_step": 174861, "epoch": 4163} {"train_loss": -7.097819805145264, "global_step": 174862, "epoch": 4163} {"train_loss": -6.981803894042969, "global_step": 174863, "epoch": 4163} {"train_loss": -7.019340515136719, "global_step": 174864, "epoch": 4163} {"train_loss": -7.108710289001465, "global_step": 174865, "epoch": 4163} {"train_loss": -7.128181457519531, "global_step": 174866, "epoch": 4163} {"train_loss": -7.137696266174316, "global_step": 174867, "epoch": 4163} {"train_loss": -6.930150032043457, "global_step": 174868, "epoch": 4163} {"train_loss": -7.106609344482422, "global_step": 174869, "epoch": 4163} {"train_loss": -7.030150413513184, "global_step": 174870, "epoch": 4163} {"train_loss": -7.084867477416992, "global_step": 174871, "epoch": 4163} {"train_loss": -7.072314262390137, "global_step": 174872, "epoch": 4163} {"train_loss": -7.06664514541626, "global_step": 174873, "epoch": 4163} {"train_loss": -6.933655261993408, "global_step": 174874, "epoch": 4163} {"train_loss": -7.199741840362549, "global_step": 174875, "epoch": 4163} {"train_loss": -7.098546028137207, "global_step": 174876, "epoch": 4163} {"train_loss": -7.053723335266113, "global_step": 174877, "epoch": 4163} {"train_loss": -6.898836135864258, "global_step": 174878, "epoch": 4163} {"train_loss": -6.995797157287598, "global_step": 174879, "epoch": 4163} {"train_loss": -6.976706504821777, "global_step": 174880, "epoch": 4163} {"train_loss": -7.08894157409668, "global_step": 174881, "epoch": 4163} {"train_loss": -7.070476531982422, "global_step": 174882, "epoch": 4163} {"train_loss": -7.003792762756348, "global_step": 174883, "epoch": 4163} {"train_loss": -7.006833076477051, "global_step": 174884, "epoch": 4163} {"train_loss": -6.958835601806641, "global_step": 174885, "epoch": 4163} {"train_loss": -7.012995719909668, "global_step": 174886, "epoch": 4163} {"train_loss": -7.0450477713630315, "global_step": 174887, "epoch": 4163, "val_loss": 68486.9140625} {"train_loss": -6.870083332061768, "global_step": 174888, "epoch": 4164} {"train_loss": -6.986766815185547, "global_step": 174889, "epoch": 4164} {"train_loss": -6.95422887802124, "global_step": 174890, "epoch": 4164} {"train_loss": -6.8623046875, "global_step": 174891, "epoch": 4164} {"train_loss": -7.088644027709961, "global_step": 174892, "epoch": 4164} {"train_loss": -6.956453323364258, "global_step": 174893, "epoch": 4164} {"train_loss": -6.949614524841309, "global_step": 174894, "epoch": 4164} {"train_loss": -6.920014381408691, "global_step": 174895, "epoch": 4164} {"train_loss": -6.826420783996582, "global_step": 174896, "epoch": 4164} {"train_loss": -6.949805736541748, "global_step": 174897, "epoch": 4164} {"train_loss": -6.959083557128906, "global_step": 174898, "epoch": 4164} {"train_loss": -6.920074462890625, "global_step": 174899, "epoch": 4164} {"train_loss": -6.967058181762695, "global_step": 174900, "epoch": 4164} {"train_loss": -7.030236721038818, "global_step": 174901, "epoch": 4164} {"train_loss": -6.837690353393555, "global_step": 174902, "epoch": 4164} {"train_loss": -6.923750877380371, "global_step": 174903, "epoch": 4164} {"train_loss": -6.998539447784424, "global_step": 174904, "epoch": 4164} {"train_loss": -6.903889179229736, "global_step": 174905, "epoch": 4164} {"train_loss": -6.921397686004639, "global_step": 174906, "epoch": 4164} {"train_loss": -7.001558780670166, "global_step": 174907, "epoch": 4164} {"train_loss": -7.040038585662842, "global_step": 174908, "epoch": 4164} {"train_loss": -7.0055975914001465, "global_step": 174909, "epoch": 4164} {"train_loss": -6.981208801269531, "global_step": 174910, "epoch": 4164} {"train_loss": -6.974553108215332, "global_step": 174911, "epoch": 4164} {"train_loss": -7.11659574508667, "global_step": 174912, "epoch": 4164} {"train_loss": -6.9843573570251465, "global_step": 174913, "epoch": 4164} {"train_loss": -6.97855806350708, "global_step": 174914, "epoch": 4164} {"train_loss": -7.018328666687012, "global_step": 174915, "epoch": 4164} {"train_loss": -7.069037437438965, "global_step": 174916, "epoch": 4164} {"train_loss": -7.037456035614014, "global_step": 174917, "epoch": 4164} {"train_loss": -7.009132385253906, "global_step": 174918, "epoch": 4164} {"train_loss": -7.021040439605713, "global_step": 174919, "epoch": 4164} {"train_loss": -7.05759334564209, "global_step": 174920, "epoch": 4164} {"train_loss": -7.100447177886963, "global_step": 174921, "epoch": 4164} {"train_loss": -7.095954895019531, "global_step": 174922, "epoch": 4164} {"train_loss": -6.93324613571167, "global_step": 174923, "epoch": 4164} {"train_loss": -7.035004138946533, "global_step": 174924, "epoch": 4164} {"train_loss": -7.173309326171875, "global_step": 174925, "epoch": 4164} {"train_loss": -7.050062656402588, "global_step": 174926, "epoch": 4164} {"train_loss": -6.917515754699707, "global_step": 174927, "epoch": 4164} {"train_loss": -6.974764823913574, "global_step": 174928, "epoch": 4164} {"train_loss": -6.986575796490624, "global_step": 174929, "epoch": 4164, "val_loss": 68745.1953125} {"train_loss": -7.052840232849121, "global_step": 174930, "epoch": 4165} {"train_loss": -6.998713493347168, "global_step": 174931, "epoch": 4165} {"train_loss": -7.067729949951172, "global_step": 174932, "epoch": 4165} {"train_loss": -7.064802169799805, "global_step": 174933, "epoch": 4165} {"train_loss": -7.046496391296387, "global_step": 174934, "epoch": 4165} {"train_loss": -7.041007995605469, "global_step": 174935, "epoch": 4165} {"train_loss": -7.132926940917969, "global_step": 174936, "epoch": 4165} {"train_loss": -7.059350490570068, "global_step": 174937, "epoch": 4165} {"train_loss": -7.097469329833984, "global_step": 174938, "epoch": 4165} {"train_loss": -7.04262113571167, "global_step": 174939, "epoch": 4165} {"train_loss": -7.105008125305176, "global_step": 174940, "epoch": 4165} {"train_loss": -7.087120532989502, "global_step": 174941, "epoch": 4165} {"train_loss": -7.012985706329346, "global_step": 174942, "epoch": 4165} {"train_loss": -6.888636589050293, "global_step": 174943, "epoch": 4165} {"train_loss": -6.934633255004883, "global_step": 174944, "epoch": 4165} {"train_loss": -6.98463773727417, "global_step": 174945, "epoch": 4165} {"train_loss": -7.1598005294799805, "global_step": 174946, "epoch": 4165} {"train_loss": -6.991028785705566, "global_step": 174947, "epoch": 4165} {"train_loss": -6.9992475509643555, "global_step": 174948, "epoch": 4165} {"train_loss": -7.095541954040527, "global_step": 174949, "epoch": 4165} {"train_loss": -6.959282875061035, "global_step": 174950, "epoch": 4165} {"train_loss": -7.071953773498535, "global_step": 174951, "epoch": 4165} {"train_loss": -6.9365153312683105, "global_step": 174952, "epoch": 4165} {"train_loss": -6.987972259521484, "global_step": 174953, "epoch": 4165} {"train_loss": -6.987784385681152, "global_step": 174954, "epoch": 4165} {"train_loss": -6.9409403800964355, "global_step": 174955, "epoch": 4165} {"train_loss": -7.041604995727539, "global_step": 174956, "epoch": 4165} {"train_loss": -6.836794376373291, "global_step": 174957, "epoch": 4165} {"train_loss": -7.067750930786133, "global_step": 174958, "epoch": 4165} {"train_loss": -6.943424224853516, "global_step": 174959, "epoch": 4165} {"train_loss": -7.075645446777344, "global_step": 174960, "epoch": 4165} {"train_loss": -7.060766696929932, "global_step": 174961, "epoch": 4165} {"train_loss": -6.932735443115234, "global_step": 174962, "epoch": 4165} {"train_loss": -6.996092796325684, "global_step": 174963, "epoch": 4165} {"train_loss": -6.869521141052246, "global_step": 174964, "epoch": 4165} {"train_loss": -6.842418193817139, "global_step": 174965, "epoch": 4165} {"train_loss": -6.965577125549316, "global_step": 174966, "epoch": 4165} {"train_loss": -6.842958450317383, "global_step": 174967, "epoch": 4165} {"train_loss": -6.944606781005859, "global_step": 174968, "epoch": 4165} {"train_loss": -6.92828369140625, "global_step": 174969, "epoch": 4165} {"train_loss": -6.927477836608887, "global_step": 174970, "epoch": 4165} {"train_loss": -6.996960923785255, "global_step": 174971, "epoch": 4165, "val_loss": 68463.4453125} {"train_loss": -6.907874584197998, "global_step": 174972, "epoch": 4166} {"train_loss": -6.987174987792969, "global_step": 174973, "epoch": 4166} {"train_loss": -6.8755645751953125, "global_step": 174974, "epoch": 4166} {"train_loss": -6.949351787567139, "global_step": 174975, "epoch": 4166} {"train_loss": -6.877659797668457, "global_step": 174976, "epoch": 4166} {"train_loss": -6.968115329742432, "global_step": 174977, "epoch": 4166} {"train_loss": -6.946646690368652, "global_step": 174978, "epoch": 4166} {"train_loss": -6.970846652984619, "global_step": 174979, "epoch": 4166} {"train_loss": -6.900808334350586, "global_step": 174980, "epoch": 4166} {"train_loss": -6.93772029876709, "global_step": 174981, "epoch": 4166} {"train_loss": -6.982077598571777, "global_step": 174982, "epoch": 4166} {"train_loss": -6.950387954711914, "global_step": 174983, "epoch": 4166} {"train_loss": -7.101049423217773, "global_step": 174984, "epoch": 4166} {"train_loss": -6.857494354248047, "global_step": 174985, "epoch": 4166} {"train_loss": -6.943514823913574, "global_step": 174986, "epoch": 4166} {"train_loss": -7.091169357299805, "global_step": 174987, "epoch": 4166} {"train_loss": -7.018721580505371, "global_step": 174988, "epoch": 4166} {"train_loss": -7.02747917175293, "global_step": 174989, "epoch": 4166} {"train_loss": -7.030412673950195, "global_step": 174990, "epoch": 4166} {"train_loss": -6.958806991577148, "global_step": 174991, "epoch": 4166} {"train_loss": -7.027226448059082, "global_step": 174992, "epoch": 4166} {"train_loss": -6.987069129943848, "global_step": 174993, "epoch": 4166} {"train_loss": -7.022764205932617, "global_step": 174994, "epoch": 4166} {"train_loss": -7.0507612228393555, "global_step": 174995, "epoch": 4166} {"train_loss": -6.914654731750488, "global_step": 174996, "epoch": 4166} {"train_loss": -6.995324611663818, "global_step": 174997, "epoch": 4166} {"train_loss": -7.075594902038574, "global_step": 174998, "epoch": 4166} {"train_loss": -7.111786842346191, "global_step": 174999, "epoch": 4166} {"train_loss": -7.012895584106445, "global_step": 175000, "epoch": 4166} {"train_loss": -7.034173965454102, "global_step": 175001, "epoch": 4166} {"train_loss": -7.025275707244873, "global_step": 175002, "epoch": 4166} {"train_loss": -7.048858642578125, "global_step": 175003, "epoch": 4166} {"train_loss": -7.074267387390137, "global_step": 175004, "epoch": 4166} {"train_loss": -7.059704780578613, "global_step": 175005, "epoch": 4166} {"train_loss": -7.063100814819336, "global_step": 175006, "epoch": 4166} {"train_loss": -7.088376998901367, "global_step": 175007, "epoch": 4166} {"train_loss": -7.10327672958374, "global_step": 175008, "epoch": 4166} {"train_loss": -6.968570709228516, "global_step": 175009, "epoch": 4166} {"train_loss": -7.148582458496094, "global_step": 175010, "epoch": 4166} {"train_loss": -7.051275253295898, "global_step": 175011, "epoch": 4166} {"train_loss": -6.931548595428467, "global_step": 175012, "epoch": 4166} {"train_loss": -7.004429045177641, "global_step": 175013, "epoch": 4166, "val_loss": 68614.7265625} {"train_loss": -7.004266738891602, "global_step": 175014, "epoch": 4167} {"train_loss": -6.943504810333252, "global_step": 175015, "epoch": 4167} {"train_loss": -7.006373405456543, "global_step": 175016, "epoch": 4167} {"train_loss": -7.037398338317871, "global_step": 175017, "epoch": 4167} {"train_loss": -6.863690376281738, "global_step": 175018, "epoch": 4167} {"train_loss": -7.029145240783691, "global_step": 175019, "epoch": 4167} {"train_loss": -6.985164642333984, "global_step": 175020, "epoch": 4167} {"train_loss": -6.886267185211182, "global_step": 175021, "epoch": 4167} {"train_loss": -7.022734642028809, "global_step": 175022, "epoch": 4167} {"train_loss": -7.0344648361206055, "global_step": 175023, "epoch": 4167} {"train_loss": -7.007725715637207, "global_step": 175024, "epoch": 4167} {"train_loss": -7.026973247528076, "global_step": 175025, "epoch": 4167} {"train_loss": -6.954184055328369, "global_step": 175026, "epoch": 4167} {"train_loss": -6.968780994415283, "global_step": 175027, "epoch": 4167} {"train_loss": -6.93446159362793, "global_step": 175028, "epoch": 4167} {"train_loss": -7.0118408203125, "global_step": 175029, "epoch": 4167} {"train_loss": -7.091019153594971, "global_step": 175030, "epoch": 4167} {"train_loss": -7.069746494293213, "global_step": 175031, "epoch": 4167} {"train_loss": -6.816501617431641, "global_step": 175032, "epoch": 4167} {"train_loss": -6.967607498168945, "global_step": 175033, "epoch": 4167} {"train_loss": -7.015019416809082, "global_step": 175034, "epoch": 4167} {"train_loss": -6.97314977645874, "global_step": 175035, "epoch": 4167} {"train_loss": -7.006171226501465, "global_step": 175036, "epoch": 4167} {"train_loss": -7.0877532958984375, "global_step": 175037, "epoch": 4167} {"train_loss": -6.796727180480957, "global_step": 175038, "epoch": 4167} {"train_loss": -6.996298313140869, "global_step": 175039, "epoch": 4167} {"train_loss": -7.015089988708496, "global_step": 175040, "epoch": 4167} {"train_loss": -7.036557197570801, "global_step": 175041, "epoch": 4167} {"train_loss": -7.097198963165283, "global_step": 175042, "epoch": 4167} {"train_loss": -6.853270053863525, "global_step": 175043, "epoch": 4167} {"train_loss": -6.9972381591796875, "global_step": 175044, "epoch": 4167} {"train_loss": -7.007237911224365, "global_step": 175045, "epoch": 4167} {"train_loss": -7.072563171386719, "global_step": 175046, "epoch": 4167} {"train_loss": -7.001877307891846, "global_step": 175047, "epoch": 4167} {"train_loss": -6.941547393798828, "global_step": 175048, "epoch": 4167} {"train_loss": -6.9856672286987305, "global_step": 175049, "epoch": 4167} {"train_loss": -7.1288533210754395, "global_step": 175050, "epoch": 4167} {"train_loss": -6.993233680725098, "global_step": 175051, "epoch": 4167} {"train_loss": -7.070688724517822, "global_step": 175052, "epoch": 4167} {"train_loss": -7.0701704025268555, "global_step": 175053, "epoch": 4167} {"train_loss": -7.0522141456604, "global_step": 175054, "epoch": 4167} {"train_loss": -6.995869534356253, "global_step": 175055, "epoch": 4167, "val_loss": 68538.375} {"train_loss": -7.102532386779785, "global_step": 175056, "epoch": 4168} {"train_loss": -6.953420639038086, "global_step": 175057, "epoch": 4168} {"train_loss": -6.975207805633545, "global_step": 175058, "epoch": 4168} {"train_loss": -7.06422758102417, "global_step": 175059, "epoch": 4168} {"train_loss": -6.958432197570801, "global_step": 175060, "epoch": 4168} {"train_loss": -7.026796340942383, "global_step": 175061, "epoch": 4168} {"train_loss": -7.15134334564209, "global_step": 175062, "epoch": 4168} {"train_loss": -6.981571197509766, "global_step": 175063, "epoch": 4168} {"train_loss": -7.000139236450195, "global_step": 175064, "epoch": 4168} {"train_loss": -7.083153247833252, "global_step": 175065, "epoch": 4168} {"train_loss": -7.059899806976318, "global_step": 175066, "epoch": 4168} {"train_loss": -7.0836591720581055, "global_step": 175067, "epoch": 4168} {"train_loss": -7.0629143714904785, "global_step": 175068, "epoch": 4168} {"train_loss": -7.143199920654297, "global_step": 175069, "epoch": 4168} {"train_loss": -6.977694511413574, "global_step": 175070, "epoch": 4168} {"train_loss": -7.0523457527160645, "global_step": 175071, "epoch": 4168} {"train_loss": -7.037393093109131, "global_step": 175072, "epoch": 4168} {"train_loss": -6.967957496643066, "global_step": 175073, "epoch": 4168} {"train_loss": -7.037199974060059, "global_step": 175074, "epoch": 4168} {"train_loss": -6.942997932434082, "global_step": 175075, "epoch": 4168} {"train_loss": -7.094942092895508, "global_step": 175076, "epoch": 4168} {"train_loss": -7.07736873626709, "global_step": 175077, "epoch": 4168} {"train_loss": -7.070958614349365, "global_step": 175078, "epoch": 4168} {"train_loss": -7.0572662353515625, "global_step": 175079, "epoch": 4168} {"train_loss": -7.216635227203369, "global_step": 175080, "epoch": 4168} {"train_loss": -7.147822856903076, "global_step": 175081, "epoch": 4168} {"train_loss": -7.086509704589844, "global_step": 175082, "epoch": 4168} {"train_loss": -7.180466651916504, "global_step": 175083, "epoch": 4168} {"train_loss": -7.013571262359619, "global_step": 175084, "epoch": 4168} {"train_loss": -6.967374801635742, "global_step": 175085, "epoch": 4168} {"train_loss": -6.962862968444824, "global_step": 175086, "epoch": 4168} {"train_loss": -6.829319477081299, "global_step": 175087, "epoch": 4168} {"train_loss": -6.865326404571533, "global_step": 175088, "epoch": 4168} {"train_loss": -7.018943786621094, "global_step": 175089, "epoch": 4168} {"train_loss": -6.8490495681762695, "global_step": 175090, "epoch": 4168} {"train_loss": -6.96999454498291, "global_step": 175091, "epoch": 4168} {"train_loss": -7.047818660736084, "global_step": 175092, "epoch": 4168} {"train_loss": -6.736108303070068, "global_step": 175093, "epoch": 4168} {"train_loss": -6.947778701782227, "global_step": 175094, "epoch": 4168} {"train_loss": -6.941859245300293, "global_step": 175095, "epoch": 4168} {"train_loss": -6.825743675231934, "global_step": 175096, "epoch": 4168} {"train_loss": -7.01493485768636, "global_step": 175097, "epoch": 4168, "val_loss": 68810.2421875} {"train_loss": -6.880474090576172, "global_step": 175098, "epoch": 4169} {"train_loss": -7.0171308517456055, "global_step": 175099, "epoch": 4169} {"train_loss": -7.000649452209473, "global_step": 175100, "epoch": 4169} {"train_loss": -6.904112815856934, "global_step": 175101, "epoch": 4169} {"train_loss": -6.947713375091553, "global_step": 175102, "epoch": 4169} {"train_loss": -6.9586992263793945, "global_step": 175103, "epoch": 4169} {"train_loss": -6.918322563171387, "global_step": 175104, "epoch": 4169} {"train_loss": -6.985997676849365, "global_step": 175105, "epoch": 4169} {"train_loss": -6.9366559982299805, "global_step": 175106, "epoch": 4169} {"train_loss": -6.921337127685547, "global_step": 175107, "epoch": 4169} {"train_loss": -6.99454402923584, "global_step": 175108, "epoch": 4169} {"train_loss": -6.961277484893799, "global_step": 175109, "epoch": 4169} {"train_loss": -7.097170352935791, "global_step": 175110, "epoch": 4169} {"train_loss": -6.998703479766846, "global_step": 175111, "epoch": 4169} {"train_loss": -7.050806045532227, "global_step": 175112, "epoch": 4169} {"train_loss": -7.062237739562988, "global_step": 175113, "epoch": 4169} {"train_loss": -6.963107109069824, "global_step": 175114, "epoch": 4169} {"train_loss": -7.024332523345947, "global_step": 175115, "epoch": 4169} {"train_loss": -7.090198516845703, "global_step": 175116, "epoch": 4169} {"train_loss": -7.022192478179932, "global_step": 175117, "epoch": 4169} {"train_loss": -7.072587966918945, "global_step": 175118, "epoch": 4169} {"train_loss": -7.086023807525635, "global_step": 175119, "epoch": 4169} {"train_loss": -7.172131538391113, "global_step": 175120, "epoch": 4169} {"train_loss": -6.980111122131348, "global_step": 175121, "epoch": 4169} {"train_loss": -7.062538146972656, "global_step": 175122, "epoch": 4169} {"train_loss": -7.0546770095825195, "global_step": 175123, "epoch": 4169} {"train_loss": -7.1396870613098145, "global_step": 175124, "epoch": 4169} {"train_loss": -7.093742370605469, "global_step": 175125, "epoch": 4169} {"train_loss": -7.094752311706543, "global_step": 175126, "epoch": 4169} {"train_loss": -7.073557376861572, "global_step": 175127, "epoch": 4169} {"train_loss": -7.203063488006592, "global_step": 175128, "epoch": 4169} {"train_loss": -7.158698081970215, "global_step": 175129, "epoch": 4169} {"train_loss": -7.038115501403809, "global_step": 175130, "epoch": 4169} {"train_loss": -7.101002216339111, "global_step": 175131, "epoch": 4169} {"train_loss": -7.0547051429748535, "global_step": 175132, "epoch": 4169} {"train_loss": -7.007950782775879, "global_step": 175133, "epoch": 4169} {"train_loss": -7.003424644470215, "global_step": 175134, "epoch": 4169} {"train_loss": -7.061402797698975, "global_step": 175135, "epoch": 4169} {"train_loss": -6.966294288635254, "global_step": 175136, "epoch": 4169} {"train_loss": -7.033947944641113, "global_step": 175137, "epoch": 4169} {"train_loss": -7.103559970855713, "global_step": 175138, "epoch": 4169} {"train_loss": -7.032107966286795, "global_step": 175139, "epoch": 4169, "val_loss": 68697.3125} {"train_loss": -6.99755859375, "global_step": 175140, "epoch": 4170} {"train_loss": -6.999688148498535, "global_step": 175141, "epoch": 4170} {"train_loss": -7.09657096862793, "global_step": 175142, "epoch": 4170} {"train_loss": -7.153799533843994, "global_step": 175143, "epoch": 4170} {"train_loss": -6.957844257354736, "global_step": 175144, "epoch": 4170} {"train_loss": -7.011264801025391, "global_step": 175145, "epoch": 4170} {"train_loss": -6.956178665161133, "global_step": 175146, "epoch": 4170} {"train_loss": -7.038940906524658, "global_step": 175147, "epoch": 4170} {"train_loss": -7.0991363525390625, "global_step": 175148, "epoch": 4170} {"train_loss": -6.986782073974609, "global_step": 175149, "epoch": 4170} {"train_loss": -7.058089256286621, "global_step": 175150, "epoch": 4170} {"train_loss": -7.104857444763184, "global_step": 175151, "epoch": 4170} {"train_loss": -6.996151924133301, "global_step": 175152, "epoch": 4170} {"train_loss": -7.031773567199707, "global_step": 175153, "epoch": 4170} {"train_loss": -7.064817905426025, "global_step": 175154, "epoch": 4170} {"train_loss": -7.131261825561523, "global_step": 175155, "epoch": 4170} {"train_loss": -7.103724479675293, "global_step": 175156, "epoch": 4170} {"train_loss": -7.067073345184326, "global_step": 175157, "epoch": 4170} {"train_loss": -7.132584571838379, "global_step": 175158, "epoch": 4170} {"train_loss": -7.058981895446777, "global_step": 175159, "epoch": 4170} {"train_loss": -7.140003204345703, "global_step": 175160, "epoch": 4170} {"train_loss": -7.084121227264404, "global_step": 175161, "epoch": 4170} {"train_loss": -7.116207122802734, "global_step": 175162, "epoch": 4170} {"train_loss": -7.154393672943115, "global_step": 175163, "epoch": 4170} {"train_loss": -7.120405673980713, "global_step": 175164, "epoch": 4170} {"train_loss": -7.165888786315918, "global_step": 175165, "epoch": 4170} {"train_loss": -7.031557083129883, "global_step": 175166, "epoch": 4170} {"train_loss": -7.068734169006348, "global_step": 175167, "epoch": 4170} {"train_loss": -7.014176845550537, "global_step": 175168, "epoch": 4170} {"train_loss": -7.016383647918701, "global_step": 175169, "epoch": 4170} {"train_loss": -7.055719375610352, "global_step": 175170, "epoch": 4170} {"train_loss": -7.026080131530762, "global_step": 175171, "epoch": 4170} {"train_loss": -7.103697299957275, "global_step": 175172, "epoch": 4170} {"train_loss": -6.953132629394531, "global_step": 175173, "epoch": 4170} {"train_loss": -6.995540618896484, "global_step": 175174, "epoch": 4170} {"train_loss": -7.040212154388428, "global_step": 175175, "epoch": 4170} {"train_loss": -7.081884860992432, "global_step": 175176, "epoch": 4170} {"train_loss": -6.964295864105225, "global_step": 175177, "epoch": 4170} {"train_loss": -7.016488075256348, "global_step": 175178, "epoch": 4170} {"train_loss": -6.962697505950928, "global_step": 175179, "epoch": 4170} {"train_loss": -6.927557945251465, "global_step": 175180, "epoch": 4170} {"train_loss": -7.046812318620228, "global_step": 175181, "epoch": 4170, "val_loss": 68478.265625} {"train_loss": -7.035521030426025, "global_step": 175182, "epoch": 4171} {"train_loss": -7.0079874992370605, "global_step": 175183, "epoch": 4171} {"train_loss": -6.983527183532715, "global_step": 175184, "epoch": 4171} {"train_loss": -7.021339416503906, "global_step": 175185, "epoch": 4171} {"train_loss": -6.965033531188965, "global_step": 175186, "epoch": 4171} {"train_loss": -6.9101643562316895, "global_step": 175187, "epoch": 4171} {"train_loss": -7.125326156616211, "global_step": 175188, "epoch": 4171} {"train_loss": -7.015105247497559, "global_step": 175189, "epoch": 4171} {"train_loss": -6.906561374664307, "global_step": 175190, "epoch": 4171} {"train_loss": -7.089547157287598, "global_step": 175191, "epoch": 4171} {"train_loss": -6.748610496520996, "global_step": 175192, "epoch": 4171} {"train_loss": -6.92325496673584, "global_step": 175193, "epoch": 4171} {"train_loss": -6.887027740478516, "global_step": 175194, "epoch": 4171} {"train_loss": -6.843416690826416, "global_step": 175195, "epoch": 4171} {"train_loss": -6.976083755493164, "global_step": 175196, "epoch": 4171} {"train_loss": -6.788769721984863, "global_step": 175197, "epoch": 4171} {"train_loss": -6.845817565917969, "global_step": 175198, "epoch": 4171} {"train_loss": -6.794215202331543, "global_step": 175199, "epoch": 4171} {"train_loss": -6.768340587615967, "global_step": 175200, "epoch": 4171} {"train_loss": -6.940918922424316, "global_step": 175201, "epoch": 4171} {"train_loss": -6.96304988861084, "global_step": 175202, "epoch": 4171} {"train_loss": -7.004249572753906, "global_step": 175203, "epoch": 4171} {"train_loss": -7.041993618011475, "global_step": 175204, "epoch": 4171} {"train_loss": -6.930534362792969, "global_step": 175205, "epoch": 4171} {"train_loss": -6.907204627990723, "global_step": 175206, "epoch": 4171} {"train_loss": -7.035219192504883, "global_step": 175207, "epoch": 4171} {"train_loss": -6.994704246520996, "global_step": 175208, "epoch": 4171} {"train_loss": -7.051612377166748, "global_step": 175209, "epoch": 4171} {"train_loss": -7.0635857582092285, "global_step": 175210, "epoch": 4171} {"train_loss": -7.020210266113281, "global_step": 175211, "epoch": 4171} {"train_loss": -6.911388874053955, "global_step": 175212, "epoch": 4171} {"train_loss": -7.015296936035156, "global_step": 175213, "epoch": 4171} {"train_loss": -6.922037124633789, "global_step": 175214, "epoch": 4171} {"train_loss": -6.983819961547852, "global_step": 175215, "epoch": 4171} {"train_loss": -7.071998596191406, "global_step": 175216, "epoch": 4171} {"train_loss": -6.978182315826416, "global_step": 175217, "epoch": 4171} {"train_loss": -7.010356426239014, "global_step": 175218, "epoch": 4171} {"train_loss": -7.001590728759766, "global_step": 175219, "epoch": 4171} {"train_loss": -6.876373291015625, "global_step": 175220, "epoch": 4171} {"train_loss": -6.99832820892334, "global_step": 175221, "epoch": 4171} {"train_loss": -6.932578086853027, "global_step": 175222, "epoch": 4171} {"train_loss": -6.956704991204398, "global_step": 175223, "epoch": 4171, "val_loss": 68570.8671875} {"train_loss": -7.067747116088867, "global_step": 175224, "epoch": 4172} {"train_loss": -7.025094985961914, "global_step": 175225, "epoch": 4172} {"train_loss": -6.95347785949707, "global_step": 175226, "epoch": 4172} {"train_loss": -7.088016510009766, "global_step": 175227, "epoch": 4172} {"train_loss": -7.015979766845703, "global_step": 175228, "epoch": 4172} {"train_loss": -7.018986225128174, "global_step": 175229, "epoch": 4172} {"train_loss": -7.01304817199707, "global_step": 175230, "epoch": 4172} {"train_loss": -7.074090003967285, "global_step": 175231, "epoch": 4172} {"train_loss": -7.0862226486206055, "global_step": 175232, "epoch": 4172} {"train_loss": -6.94251823425293, "global_step": 175233, "epoch": 4172} {"train_loss": -7.042284965515137, "global_step": 175234, "epoch": 4172} {"train_loss": -7.0618085861206055, "global_step": 175235, "epoch": 4172} {"train_loss": -7.001781463623047, "global_step": 175236, "epoch": 4172} {"train_loss": -6.933297157287598, "global_step": 175237, "epoch": 4172} {"train_loss": -7.033881664276123, "global_step": 175238, "epoch": 4172} {"train_loss": -7.005107879638672, "global_step": 175239, "epoch": 4172} {"train_loss": -7.090517997741699, "global_step": 175240, "epoch": 4172} {"train_loss": -7.094185829162598, "global_step": 175241, "epoch": 4172} {"train_loss": -6.952899932861328, "global_step": 175242, "epoch": 4172} {"train_loss": -7.108858108520508, "global_step": 175243, "epoch": 4172} {"train_loss": -6.988270282745361, "global_step": 175244, "epoch": 4172} {"train_loss": -7.0470781326293945, "global_step": 175245, "epoch": 4172} {"train_loss": -7.057863235473633, "global_step": 175246, "epoch": 4172} {"train_loss": -6.96616268157959, "global_step": 175247, "epoch": 4172} {"train_loss": -6.978253364562988, "global_step": 175248, "epoch": 4172} {"train_loss": -6.996508598327637, "global_step": 175249, "epoch": 4172} {"train_loss": -7.016753673553467, "global_step": 175250, "epoch": 4172} {"train_loss": -6.981740474700928, "global_step": 175251, "epoch": 4172} {"train_loss": -7.012331962585449, "global_step": 175252, "epoch": 4172} {"train_loss": -7.128935813903809, "global_step": 175253, "epoch": 4172} {"train_loss": -6.941771507263184, "global_step": 175254, "epoch": 4172} {"train_loss": -6.9248151779174805, "global_step": 175255, "epoch": 4172} {"train_loss": -7.034182548522949, "global_step": 175256, "epoch": 4172} {"train_loss": -6.980768203735352, "global_step": 175257, "epoch": 4172} {"train_loss": -7.052192211151123, "global_step": 175258, "epoch": 4172} {"train_loss": -7.049960136413574, "global_step": 175259, "epoch": 4172} {"train_loss": -6.9929890632629395, "global_step": 175260, "epoch": 4172} {"train_loss": -6.937958240509033, "global_step": 175261, "epoch": 4172} {"train_loss": -6.916398525238037, "global_step": 175262, "epoch": 4172} {"train_loss": -6.8593597412109375, "global_step": 175263, "epoch": 4172} {"train_loss": -6.95832633972168, "global_step": 175264, "epoch": 4172} {"train_loss": -7.012804848807199, "global_step": 175265, "epoch": 4172, "val_loss": 68717.65625} {"train_loss": -6.977439880371094, "global_step": 175266, "epoch": 4173} {"train_loss": -6.91937255859375, "global_step": 175267, "epoch": 4173} {"train_loss": -7.097344398498535, "global_step": 175268, "epoch": 4173} {"train_loss": -6.875351905822754, "global_step": 175269, "epoch": 4173} {"train_loss": -6.963932991027832, "global_step": 175270, "epoch": 4173} {"train_loss": -6.8901472091674805, "global_step": 175271, "epoch": 4173} {"train_loss": -6.954334735870361, "global_step": 175272, "epoch": 4173} {"train_loss": -6.899867057800293, "global_step": 175273, "epoch": 4173} {"train_loss": -6.901724815368652, "global_step": 175274, "epoch": 4173} {"train_loss": -6.948110580444336, "global_step": 175275, "epoch": 4173} {"train_loss": -6.914939880371094, "global_step": 175276, "epoch": 4173} {"train_loss": -6.978529930114746, "global_step": 175277, "epoch": 4173} {"train_loss": -6.898377418518066, "global_step": 175278, "epoch": 4173} {"train_loss": -6.778408527374268, "global_step": 175279, "epoch": 4173} {"train_loss": -7.015129089355469, "global_step": 175280, "epoch": 4173} {"train_loss": -6.896450042724609, "global_step": 175281, "epoch": 4173} {"train_loss": -6.890205383300781, "global_step": 175282, "epoch": 4173} {"train_loss": -6.904017448425293, "global_step": 175283, "epoch": 4173} {"train_loss": -6.859694004058838, "global_step": 175284, "epoch": 4173} {"train_loss": -6.920042514801025, "global_step": 175285, "epoch": 4173} {"train_loss": -7.006852149963379, "global_step": 175286, "epoch": 4173} {"train_loss": -6.856326103210449, "global_step": 175287, "epoch": 4173} {"train_loss": -7.040096282958984, "global_step": 175288, "epoch": 4173} {"train_loss": -6.914130210876465, "global_step": 175289, "epoch": 4173} {"train_loss": -6.905647277832031, "global_step": 175290, "epoch": 4173} {"train_loss": -7.056917667388916, "global_step": 175291, "epoch": 4173} {"train_loss": -7.143014907836914, "global_step": 175292, "epoch": 4173} {"train_loss": -6.996468544006348, "global_step": 175293, "epoch": 4173} {"train_loss": -6.967870712280273, "global_step": 175294, "epoch": 4173} {"train_loss": -7.022009372711182, "global_step": 175295, "epoch": 4173} {"train_loss": -6.9665374755859375, "global_step": 175296, "epoch": 4173} {"train_loss": -7.07930850982666, "global_step": 175297, "epoch": 4173} {"train_loss": -7.066439628601074, "global_step": 175298, "epoch": 4173} {"train_loss": -6.974980354309082, "global_step": 175299, "epoch": 4173} {"train_loss": -7.0264739990234375, "global_step": 175300, "epoch": 4173} {"train_loss": -6.918251037597656, "global_step": 175301, "epoch": 4173} {"train_loss": -6.918631076812744, "global_step": 175302, "epoch": 4173} {"train_loss": -7.133406162261963, "global_step": 175303, "epoch": 4173} {"train_loss": -7.135678768157959, "global_step": 175304, "epoch": 4173} {"train_loss": -7.006204605102539, "global_step": 175305, "epoch": 4173} {"train_loss": -6.900305271148682, "global_step": 175306, "epoch": 4173} {"train_loss": -6.962627637953985, "global_step": 175307, "epoch": 4173, "val_loss": 68603.4453125} {"train_loss": -7.1196608543396, "global_step": 175308, "epoch": 4174} {"train_loss": -6.913679122924805, "global_step": 175309, "epoch": 4174} {"train_loss": -6.957480430603027, "global_step": 175310, "epoch": 4174} {"train_loss": -7.061570167541504, "global_step": 175311, "epoch": 4174} {"train_loss": -7.04619026184082, "global_step": 175312, "epoch": 4174} {"train_loss": -7.0230865478515625, "global_step": 175313, "epoch": 4174} {"train_loss": -6.906373500823975, "global_step": 175314, "epoch": 4174} {"train_loss": -7.076210021972656, "global_step": 175315, "epoch": 4174} {"train_loss": -7.072481155395508, "global_step": 175316, "epoch": 4174} {"train_loss": -6.954568862915039, "global_step": 175317, "epoch": 4174} {"train_loss": -7.032238483428955, "global_step": 175318, "epoch": 4174} {"train_loss": -7.139937877655029, "global_step": 175319, "epoch": 4174} {"train_loss": -7.008705139160156, "global_step": 175320, "epoch": 4174} {"train_loss": -7.1131720542907715, "global_step": 175321, "epoch": 4174} {"train_loss": -7.027379989624023, "global_step": 175322, "epoch": 4174} {"train_loss": -6.951221466064453, "global_step": 175323, "epoch": 4174} {"train_loss": -7.025040626525879, "global_step": 175324, "epoch": 4174} {"train_loss": -7.084759712219238, "global_step": 175325, "epoch": 4174} {"train_loss": -7.003696918487549, "global_step": 175326, "epoch": 4174} {"train_loss": -7.065156936645508, "global_step": 175327, "epoch": 4174} {"train_loss": -7.068985462188721, "global_step": 175328, "epoch": 4174} {"train_loss": -7.136305332183838, "global_step": 175329, "epoch": 4174} {"train_loss": -7.018237113952637, "global_step": 175330, "epoch": 4174} {"train_loss": -7.049330711364746, "global_step": 175331, "epoch": 4174} {"train_loss": -7.035096168518066, "global_step": 175332, "epoch": 4174} {"train_loss": -6.864025115966797, "global_step": 175333, "epoch": 4174} {"train_loss": -6.951064109802246, "global_step": 175334, "epoch": 4174} {"train_loss": -6.772932529449463, "global_step": 175335, "epoch": 4174} {"train_loss": -7.076077461242676, "global_step": 175336, "epoch": 4174} {"train_loss": -7.0364532470703125, "global_step": 175337, "epoch": 4174} {"train_loss": -7.054862022399902, "global_step": 175338, "epoch": 4174} {"train_loss": -6.980366230010986, "global_step": 175339, "epoch": 4174} {"train_loss": -6.9286699295043945, "global_step": 175340, "epoch": 4174} {"train_loss": -7.109014511108398, "global_step": 175341, "epoch": 4174} {"train_loss": -7.120520114898682, "global_step": 175342, "epoch": 4174} {"train_loss": -6.935144424438477, "global_step": 175343, "epoch": 4174} {"train_loss": -7.005008697509766, "global_step": 175344, "epoch": 4174} {"train_loss": -6.969785213470459, "global_step": 175345, "epoch": 4174} {"train_loss": -7.091250419616699, "global_step": 175346, "epoch": 4174} {"train_loss": -7.030176162719727, "global_step": 175347, "epoch": 4174} {"train_loss": -7.03375244140625, "global_step": 175348, "epoch": 4174} {"train_loss": -7.022338833127703, "global_step": 175349, "epoch": 4174, "val_loss": 68665.0625} {"train_loss": -7.100415229797363, "global_step": 175350, "epoch": 4175} {"train_loss": -7.075865268707275, "global_step": 175351, "epoch": 4175} {"train_loss": -7.076830863952637, "global_step": 175352, "epoch": 4175} {"train_loss": -7.073984146118164, "global_step": 175353, "epoch": 4175} {"train_loss": -7.12702751159668, "global_step": 175354, "epoch": 4175} {"train_loss": -7.0316081047058105, "global_step": 175355, "epoch": 4175} {"train_loss": -7.038560390472412, "global_step": 175356, "epoch": 4175} {"train_loss": -6.909760475158691, "global_step": 175357, "epoch": 4175} {"train_loss": -7.039604187011719, "global_step": 175358, "epoch": 4175} {"train_loss": -6.9818572998046875, "global_step": 175359, "epoch": 4175} {"train_loss": -7.021100044250488, "global_step": 175360, "epoch": 4175} {"train_loss": -7.037271499633789, "global_step": 175361, "epoch": 4175} {"train_loss": -7.066896915435791, "global_step": 175362, "epoch": 4175} {"train_loss": -6.975742340087891, "global_step": 175363, "epoch": 4175} {"train_loss": -6.9886322021484375, "global_step": 175364, "epoch": 4175} {"train_loss": -7.06533145904541, "global_step": 175365, "epoch": 4175} {"train_loss": -6.980774879455566, "global_step": 175366, "epoch": 4175} {"train_loss": -6.973456859588623, "global_step": 175367, "epoch": 4175} {"train_loss": -7.005404472351074, "global_step": 175368, "epoch": 4175} {"train_loss": -6.999942779541016, "global_step": 175369, "epoch": 4175} {"train_loss": -7.011962413787842, "global_step": 175370, "epoch": 4175} {"train_loss": -6.979207992553711, "global_step": 175371, "epoch": 4175} {"train_loss": -7.1260271072387695, "global_step": 175372, "epoch": 4175} {"train_loss": -7.014030456542969, "global_step": 175373, "epoch": 4175} {"train_loss": -7.026598930358887, "global_step": 175374, "epoch": 4175} {"train_loss": -7.126182556152344, "global_step": 175375, "epoch": 4175} {"train_loss": -7.1237874031066895, "global_step": 175376, "epoch": 4175} {"train_loss": -7.039763450622559, "global_step": 175377, "epoch": 4175} {"train_loss": -7.009902000427246, "global_step": 175378, "epoch": 4175} {"train_loss": -7.011289596557617, "global_step": 175379, "epoch": 4175} {"train_loss": -7.183095455169678, "global_step": 175380, "epoch": 4175} {"train_loss": -6.898932933807373, "global_step": 175381, "epoch": 4175} {"train_loss": -6.98519229888916, "global_step": 175382, "epoch": 4175} {"train_loss": -7.048016548156738, "global_step": 175383, "epoch": 4175} {"train_loss": -6.918655872344971, "global_step": 175384, "epoch": 4175} {"train_loss": -6.957704544067383, "global_step": 175385, "epoch": 4175} {"train_loss": -6.982296943664551, "global_step": 175386, "epoch": 4175} {"train_loss": -7.026522636413574, "global_step": 175387, "epoch": 4175} {"train_loss": -6.986961364746094, "global_step": 175388, "epoch": 4175} {"train_loss": -6.926505088806152, "global_step": 175389, "epoch": 4175} {"train_loss": -6.975898742675781, "global_step": 175390, "epoch": 4175} {"train_loss": -7.022692623592558, "global_step": 175391, "epoch": 4175, "val_loss": 68718.46875} {"train_loss": -7.038208484649658, "global_step": 175392, "epoch": 4176} {"train_loss": -6.979161262512207, "global_step": 175393, "epoch": 4176} {"train_loss": -7.00830602645874, "global_step": 175394, "epoch": 4176} {"train_loss": -6.9685492515563965, "global_step": 175395, "epoch": 4176} {"train_loss": -7.019955635070801, "global_step": 175396, "epoch": 4176} {"train_loss": -6.989288330078125, "global_step": 175397, "epoch": 4176} {"train_loss": -7.052722930908203, "global_step": 175398, "epoch": 4176} {"train_loss": -7.000966548919678, "global_step": 175399, "epoch": 4176} {"train_loss": -7.058824062347412, "global_step": 175400, "epoch": 4176} {"train_loss": -6.945544242858887, "global_step": 175401, "epoch": 4176} {"train_loss": -7.031798839569092, "global_step": 175402, "epoch": 4176} {"train_loss": -6.954281806945801, "global_step": 175403, "epoch": 4176} {"train_loss": -7.056275367736816, "global_step": 175404, "epoch": 4176} {"train_loss": -6.924317836761475, "global_step": 175405, "epoch": 4176} {"train_loss": -7.010995864868164, "global_step": 175406, "epoch": 4176} {"train_loss": -7.0612006187438965, "global_step": 175407, "epoch": 4176} {"train_loss": -6.955996513366699, "global_step": 175408, "epoch": 4176} {"train_loss": -7.119794845581055, "global_step": 175409, "epoch": 4176} {"train_loss": -7.1187944412231445, "global_step": 175410, "epoch": 4176} {"train_loss": -6.998327255249023, "global_step": 175411, "epoch": 4176} {"train_loss": -7.092694282531738, "global_step": 175412, "epoch": 4176} {"train_loss": -6.998600006103516, "global_step": 175413, "epoch": 4176} {"train_loss": -7.084216117858887, "global_step": 175414, "epoch": 4176} {"train_loss": -7.010530471801758, "global_step": 175415, "epoch": 4176} {"train_loss": -7.023940563201904, "global_step": 175416, "epoch": 4176} {"train_loss": -7.099092483520508, "global_step": 175417, "epoch": 4176} {"train_loss": -7.162092208862305, "global_step": 175418, "epoch": 4176} {"train_loss": -7.025869369506836, "global_step": 175419, "epoch": 4176} {"train_loss": -7.074694633483887, "global_step": 175420, "epoch": 4176} {"train_loss": -7.064234733581543, "global_step": 175421, "epoch": 4176} {"train_loss": -7.05601167678833, "global_step": 175422, "epoch": 4176} {"train_loss": -7.106324672698975, "global_step": 175423, "epoch": 4176} {"train_loss": -7.040936470031738, "global_step": 175424, "epoch": 4176} {"train_loss": -7.03420877456665, "global_step": 175425, "epoch": 4176} {"train_loss": -7.061875343322754, "global_step": 175426, "epoch": 4176} {"train_loss": -6.909003257751465, "global_step": 175427, "epoch": 4176} {"train_loss": -7.033160209655762, "global_step": 175428, "epoch": 4176} {"train_loss": -7.043000221252441, "global_step": 175429, "epoch": 4176} {"train_loss": -6.887523651123047, "global_step": 175430, "epoch": 4176} {"train_loss": -7.1175947189331055, "global_step": 175431, "epoch": 4176} {"train_loss": -7.016119956970215, "global_step": 175432, "epoch": 4176} {"train_loss": -7.028323287055606, "global_step": 175433, "epoch": 4176, "val_loss": 68920.4140625} {"train_loss": -7.010801315307617, "global_step": 175434, "epoch": 4177} {"train_loss": -6.930929183959961, "global_step": 175435, "epoch": 4177} {"train_loss": -7.027856826782227, "global_step": 175436, "epoch": 4177} {"train_loss": -6.946843147277832, "global_step": 175437, "epoch": 4177} {"train_loss": -7.015110015869141, "global_step": 175438, "epoch": 4177} {"train_loss": -7.0379958152771, "global_step": 175439, "epoch": 4177} {"train_loss": -6.920913219451904, "global_step": 175440, "epoch": 4177} {"train_loss": -7.052670001983643, "global_step": 175441, "epoch": 4177} {"train_loss": -6.885506629943848, "global_step": 175442, "epoch": 4177} {"train_loss": -7.056920051574707, "global_step": 175443, "epoch": 4177} {"train_loss": -6.955896854400635, "global_step": 175444, "epoch": 4177} {"train_loss": -7.064889907836914, "global_step": 175445, "epoch": 4177} {"train_loss": -7.04056453704834, "global_step": 175446, "epoch": 4177} {"train_loss": -6.980855941772461, "global_step": 175447, "epoch": 4177} {"train_loss": -6.959558486938477, "global_step": 175448, "epoch": 4177} {"train_loss": -7.011298656463623, "global_step": 175449, "epoch": 4177} {"train_loss": -7.006496429443359, "global_step": 175450, "epoch": 4177} {"train_loss": -7.031784534454346, "global_step": 175451, "epoch": 4177} {"train_loss": -6.971773147583008, "global_step": 175452, "epoch": 4177} {"train_loss": -6.870329856872559, "global_step": 175453, "epoch": 4177} {"train_loss": -7.011649131774902, "global_step": 175454, "epoch": 4177} {"train_loss": -7.015505790710449, "global_step": 175455, "epoch": 4177} {"train_loss": -7.014466285705566, "global_step": 175456, "epoch": 4177} {"train_loss": -7.008306503295898, "global_step": 175457, "epoch": 4177} {"train_loss": -7.035778045654297, "global_step": 175458, "epoch": 4177} {"train_loss": -6.999449729919434, "global_step": 175459, "epoch": 4177} {"train_loss": -6.98536491394043, "global_step": 175460, "epoch": 4177} {"train_loss": -7.117040634155273, "global_step": 175461, "epoch": 4177} {"train_loss": -7.117693901062012, "global_step": 175462, "epoch": 4177} {"train_loss": -7.01761531829834, "global_step": 175463, "epoch": 4177} {"train_loss": -7.088065147399902, "global_step": 175464, "epoch": 4177} {"train_loss": -7.06058931350708, "global_step": 175465, "epoch": 4177} {"train_loss": -7.044460296630859, "global_step": 175466, "epoch": 4177} {"train_loss": -7.154360771179199, "global_step": 175467, "epoch": 4177} {"train_loss": -7.038651943206787, "global_step": 175468, "epoch": 4177} {"train_loss": -7.126658916473389, "global_step": 175469, "epoch": 4177} {"train_loss": -7.094235897064209, "global_step": 175470, "epoch": 4177} {"train_loss": -6.965371131896973, "global_step": 175471, "epoch": 4177} {"train_loss": -7.08190393447876, "global_step": 175472, "epoch": 4177} {"train_loss": -7.050803184509277, "global_step": 175473, "epoch": 4177} {"train_loss": -7.064734935760498, "global_step": 175474, "epoch": 4177} {"train_loss": -7.023956696192424, "global_step": 175475, "epoch": 4177, "val_loss": 68450.1328125} {"train_loss": -7.031261444091797, "global_step": 175476, "epoch": 4178} {"train_loss": -6.969873428344727, "global_step": 175477, "epoch": 4178} {"train_loss": -7.230961799621582, "global_step": 175478, "epoch": 4178} {"train_loss": -7.073461532592773, "global_step": 175479, "epoch": 4178} {"train_loss": -7.10955286026001, "global_step": 175480, "epoch": 4178} {"train_loss": -6.967726707458496, "global_step": 175481, "epoch": 4178} {"train_loss": -7.053833961486816, "global_step": 175482, "epoch": 4178} {"train_loss": -7.063070297241211, "global_step": 175483, "epoch": 4178} {"train_loss": -7.105239391326904, "global_step": 175484, "epoch": 4178} {"train_loss": -6.968406677246094, "global_step": 175485, "epoch": 4178} {"train_loss": -6.9659857749938965, "global_step": 175486, "epoch": 4178} {"train_loss": -7.046058654785156, "global_step": 175487, "epoch": 4178} {"train_loss": -6.945533752441406, "global_step": 175488, "epoch": 4178} {"train_loss": -6.976509094238281, "global_step": 175489, "epoch": 4178} {"train_loss": -7.020225524902344, "global_step": 175490, "epoch": 4178} {"train_loss": -7.020119667053223, "global_step": 175491, "epoch": 4178} {"train_loss": -7.033597946166992, "global_step": 175492, "epoch": 4178} {"train_loss": -6.937419891357422, "global_step": 175493, "epoch": 4178} {"train_loss": -6.967209339141846, "global_step": 175494, "epoch": 4178} {"train_loss": -7.053939342498779, "global_step": 175495, "epoch": 4178} {"train_loss": -6.900883197784424, "global_step": 175496, "epoch": 4178} {"train_loss": -6.967657566070557, "global_step": 175497, "epoch": 4178} {"train_loss": -6.920907497406006, "global_step": 175498, "epoch": 4178} {"train_loss": -6.9872965812683105, "global_step": 175499, "epoch": 4178} {"train_loss": -6.938990116119385, "global_step": 175500, "epoch": 4178} {"train_loss": -6.856331825256348, "global_step": 175501, "epoch": 4178} {"train_loss": -7.002384185791016, "global_step": 175502, "epoch": 4178} {"train_loss": -6.889245986938477, "global_step": 175503, "epoch": 4178} {"train_loss": -6.952223300933838, "global_step": 175504, "epoch": 4178} {"train_loss": -7.018632411956787, "global_step": 175505, "epoch": 4178} {"train_loss": -6.824770450592041, "global_step": 175506, "epoch": 4178} {"train_loss": -7.040410041809082, "global_step": 175507, "epoch": 4178} {"train_loss": -7.055469512939453, "global_step": 175508, "epoch": 4178} {"train_loss": -6.97725772857666, "global_step": 175509, "epoch": 4178} {"train_loss": -6.948420524597168, "global_step": 175510, "epoch": 4178} {"train_loss": -6.969639778137207, "global_step": 175511, "epoch": 4178} {"train_loss": -6.91733980178833, "global_step": 175512, "epoch": 4178} {"train_loss": -6.940325736999512, "global_step": 175513, "epoch": 4178} {"train_loss": -6.962337493896484, "global_step": 175514, "epoch": 4178} {"train_loss": -7.0462164878845215, "global_step": 175515, "epoch": 4178} {"train_loss": -6.986751556396484, "global_step": 175516, "epoch": 4178} {"train_loss": -6.9915875026157925, "global_step": 175517, "epoch": 4178, "val_loss": 68685.4296875} {"train_loss": -7.1271514892578125, "global_step": 175518, "epoch": 4179} {"train_loss": -7.009979248046875, "global_step": 175519, "epoch": 4179} {"train_loss": -6.985048294067383, "global_step": 175520, "epoch": 4179} {"train_loss": -6.903413772583008, "global_step": 175521, "epoch": 4179} {"train_loss": -7.074007034301758, "global_step": 175522, "epoch": 4179} {"train_loss": -6.777120113372803, "global_step": 175523, "epoch": 4179} {"train_loss": -6.85093879699707, "global_step": 175524, "epoch": 4179} {"train_loss": -7.054873466491699, "global_step": 175525, "epoch": 4179} {"train_loss": -6.8898773193359375, "global_step": 175526, "epoch": 4179} {"train_loss": -6.898778915405273, "global_step": 175527, "epoch": 4179} {"train_loss": -6.907391548156738, "global_step": 175528, "epoch": 4179} {"train_loss": -7.059718132019043, "global_step": 175529, "epoch": 4179} {"train_loss": -7.099601745605469, "global_step": 175530, "epoch": 4179} {"train_loss": -7.013023376464844, "global_step": 175531, "epoch": 4179} {"train_loss": -6.923460960388184, "global_step": 175532, "epoch": 4179} {"train_loss": -6.987604141235352, "global_step": 175533, "epoch": 4179} {"train_loss": -7.009975910186768, "global_step": 175534, "epoch": 4179} {"train_loss": -7.093435287475586, "global_step": 175535, "epoch": 4179} {"train_loss": -6.936055660247803, "global_step": 175536, "epoch": 4179} {"train_loss": -6.969817161560059, "global_step": 175537, "epoch": 4179} {"train_loss": -6.985463619232178, "global_step": 175538, "epoch": 4179} {"train_loss": -6.965455055236816, "global_step": 175539, "epoch": 4179} {"train_loss": -6.886265754699707, "global_step": 175540, "epoch": 4179} {"train_loss": -7.016850471496582, "global_step": 175541, "epoch": 4179} {"train_loss": -6.992868423461914, "global_step": 175542, "epoch": 4179} {"train_loss": -6.959179401397705, "global_step": 175543, "epoch": 4179} {"train_loss": -7.071776390075684, "global_step": 175544, "epoch": 4179} {"train_loss": -6.977178573608398, "global_step": 175545, "epoch": 4179} {"train_loss": -7.083256721496582, "global_step": 175546, "epoch": 4179} {"train_loss": -7.022192001342773, "global_step": 175547, "epoch": 4179} {"train_loss": -7.01833438873291, "global_step": 175548, "epoch": 4179} {"train_loss": -7.086235046386719, "global_step": 175549, "epoch": 4179} {"train_loss": -6.990291118621826, "global_step": 175550, "epoch": 4179} {"train_loss": -7.177956581115723, "global_step": 175551, "epoch": 4179} {"train_loss": -7.159592628479004, "global_step": 175552, "epoch": 4179} {"train_loss": -6.871665954589844, "global_step": 175553, "epoch": 4179} {"train_loss": -6.983663558959961, "global_step": 175554, "epoch": 4179} {"train_loss": -7.0526275634765625, "global_step": 175555, "epoch": 4179} {"train_loss": -6.920659065246582, "global_step": 175556, "epoch": 4179} {"train_loss": -7.1049299240112305, "global_step": 175557, "epoch": 4179} {"train_loss": -6.836004257202148, "global_step": 175558, "epoch": 4179} {"train_loss": -6.993413505100069, "global_step": 175559, "epoch": 4179, "val_loss": 68542.1640625} {"train_loss": -6.946564674377441, "global_step": 175560, "epoch": 4180} {"train_loss": -6.941789627075195, "global_step": 175561, "epoch": 4180} {"train_loss": -7.065529823303223, "global_step": 175562, "epoch": 4180} {"train_loss": -6.822249889373779, "global_step": 175563, "epoch": 4180} {"train_loss": -7.024281978607178, "global_step": 175564, "epoch": 4180} {"train_loss": -6.969905376434326, "global_step": 175565, "epoch": 4180} {"train_loss": -7.123663902282715, "global_step": 175566, "epoch": 4180} {"train_loss": -6.8622236251831055, "global_step": 175567, "epoch": 4180} {"train_loss": -7.011544227600098, "global_step": 175568, "epoch": 4180} {"train_loss": -7.070860862731934, "global_step": 175569, "epoch": 4180} {"train_loss": -7.037393569946289, "global_step": 175570, "epoch": 4180} {"train_loss": -7.106752395629883, "global_step": 175571, "epoch": 4180} {"train_loss": -6.989156246185303, "global_step": 175572, "epoch": 4180} {"train_loss": -6.946776866912842, "global_step": 175573, "epoch": 4180} {"train_loss": -6.979171276092529, "global_step": 175574, "epoch": 4180} {"train_loss": -7.024424076080322, "global_step": 175575, "epoch": 4180} {"train_loss": -6.967333793640137, "global_step": 175576, "epoch": 4180} {"train_loss": -7.079311370849609, "global_step": 175577, "epoch": 4180} {"train_loss": -6.893092632293701, "global_step": 175578, "epoch": 4180} {"train_loss": -6.949602127075195, "global_step": 175579, "epoch": 4180} {"train_loss": -6.959070205688477, "global_step": 175580, "epoch": 4180} {"train_loss": -6.940716743469238, "global_step": 175581, "epoch": 4180} {"train_loss": -6.901692867279053, "global_step": 175582, "epoch": 4180} {"train_loss": -6.949218273162842, "global_step": 175583, "epoch": 4180} {"train_loss": -6.889888286590576, "global_step": 175584, "epoch": 4180} {"train_loss": -7.159781455993652, "global_step": 175585, "epoch": 4180} {"train_loss": -6.906031608581543, "global_step": 175586, "epoch": 4180} {"train_loss": -6.992088317871094, "global_step": 175587, "epoch": 4180} {"train_loss": -6.82088565826416, "global_step": 175588, "epoch": 4180} {"train_loss": -6.991604804992676, "global_step": 175589, "epoch": 4180} {"train_loss": -6.927801132202148, "global_step": 175590, "epoch": 4180} {"train_loss": -6.913468360900879, "global_step": 175591, "epoch": 4180} {"train_loss": -6.884977340698242, "global_step": 175592, "epoch": 4180} {"train_loss": -6.949985504150391, "global_step": 175593, "epoch": 4180} {"train_loss": -7.0135884284973145, "global_step": 175594, "epoch": 4180} {"train_loss": -6.9317755699157715, "global_step": 175595, "epoch": 4180} {"train_loss": -6.9468793869018555, "global_step": 175596, "epoch": 4180} {"train_loss": -6.806425094604492, "global_step": 175597, "epoch": 4180} {"train_loss": -6.943426132202148, "global_step": 175598, "epoch": 4180} {"train_loss": -6.88637638092041, "global_step": 175599, "epoch": 4180} {"train_loss": -7.004364013671875, "global_step": 175600, "epoch": 4180} {"train_loss": -6.965872537522089, "global_step": 175601, "epoch": 4180, "val_loss": 68665.09375} {"train_loss": -7.039482116699219, "global_step": 175602, "epoch": 4181} {"train_loss": -6.852431297302246, "global_step": 175603, "epoch": 4181} {"train_loss": -6.908331871032715, "global_step": 175604, "epoch": 4181} {"train_loss": -6.894376754760742, "global_step": 175605, "epoch": 4181} {"train_loss": -6.9497785568237305, "global_step": 175606, "epoch": 4181} {"train_loss": -6.926840305328369, "global_step": 175607, "epoch": 4181} {"train_loss": -6.912324905395508, "global_step": 175608, "epoch": 4181} {"train_loss": -7.035884857177734, "global_step": 175609, "epoch": 4181} {"train_loss": -6.804089546203613, "global_step": 175610, "epoch": 4181} {"train_loss": -6.97402286529541, "global_step": 175611, "epoch": 4181} {"train_loss": -7.027454376220703, "global_step": 175612, "epoch": 4181} {"train_loss": -6.975293159484863, "global_step": 175613, "epoch": 4181} {"train_loss": -6.90673828125, "global_step": 175614, "epoch": 4181} {"train_loss": -6.957427501678467, "global_step": 175615, "epoch": 4181} {"train_loss": -6.906805038452148, "global_step": 175616, "epoch": 4181} {"train_loss": -6.962721347808838, "global_step": 175617, "epoch": 4181} {"train_loss": -6.9994306564331055, "global_step": 175618, "epoch": 4181} {"train_loss": -7.033565044403076, "global_step": 175619, "epoch": 4181} {"train_loss": -6.97987699508667, "global_step": 175620, "epoch": 4181} {"train_loss": -7.060767650604248, "global_step": 175621, "epoch": 4181} {"train_loss": -7.022084712982178, "global_step": 175622, "epoch": 4181} {"train_loss": -7.037711143493652, "global_step": 175623, "epoch": 4181} {"train_loss": -6.991613388061523, "global_step": 175624, "epoch": 4181} {"train_loss": -6.976644515991211, "global_step": 175625, "epoch": 4181} {"train_loss": -7.095508575439453, "global_step": 175626, "epoch": 4181} {"train_loss": -6.97925329208374, "global_step": 175627, "epoch": 4181} {"train_loss": -6.971900939941406, "global_step": 175628, "epoch": 4181} {"train_loss": -7.017571449279785, "global_step": 175629, "epoch": 4181} {"train_loss": -7.006857872009277, "global_step": 175630, "epoch": 4181} {"train_loss": -7.08438777923584, "global_step": 175631, "epoch": 4181} {"train_loss": -7.037688255310059, "global_step": 175632, "epoch": 4181} {"train_loss": -7.058938026428223, "global_step": 175633, "epoch": 4181} {"train_loss": -7.062170028686523, "global_step": 175634, "epoch": 4181} {"train_loss": -6.828150749206543, "global_step": 175635, "epoch": 4181} {"train_loss": -7.0397257804870605, "global_step": 175636, "epoch": 4181} {"train_loss": -6.979089736938477, "global_step": 175637, "epoch": 4181} {"train_loss": -6.9101738929748535, "global_step": 175638, "epoch": 4181} {"train_loss": -6.9540252685546875, "global_step": 175639, "epoch": 4181} {"train_loss": -6.965797424316406, "global_step": 175640, "epoch": 4181} {"train_loss": -7.010678291320801, "global_step": 175641, "epoch": 4181} {"train_loss": -6.922558784484863, "global_step": 175642, "epoch": 4181} {"train_loss": -6.977420727411906, "global_step": 175643, "epoch": 4181, "val_loss": 68728.6171875} {"train_loss": -6.970194339752197, "global_step": 175644, "epoch": 4182} {"train_loss": -6.999943733215332, "global_step": 175645, "epoch": 4182} {"train_loss": -6.9786553382873535, "global_step": 175646, "epoch": 4182} {"train_loss": -6.936919212341309, "global_step": 175647, "epoch": 4182} {"train_loss": -6.9698004722595215, "global_step": 175648, "epoch": 4182} {"train_loss": -6.932523250579834, "global_step": 175649, "epoch": 4182} {"train_loss": -6.9714250564575195, "global_step": 175650, "epoch": 4182} {"train_loss": -6.8469390869140625, "global_step": 175651, "epoch": 4182} {"train_loss": -6.847160339355469, "global_step": 175652, "epoch": 4182} {"train_loss": -6.950868606567383, "global_step": 175653, "epoch": 4182} {"train_loss": -6.930096626281738, "global_step": 175654, "epoch": 4182} {"train_loss": -6.938228607177734, "global_step": 175655, "epoch": 4182} {"train_loss": -6.905664443969727, "global_step": 175656, "epoch": 4182} {"train_loss": -7.005280494689941, "global_step": 175657, "epoch": 4182} {"train_loss": -6.9159464836120605, "global_step": 175658, "epoch": 4182} {"train_loss": -7.069658279418945, "global_step": 175659, "epoch": 4182} {"train_loss": -7.0199432373046875, "global_step": 175660, "epoch": 4182} {"train_loss": -7.045472145080566, "global_step": 175661, "epoch": 4182} {"train_loss": -6.957952499389648, "global_step": 175662, "epoch": 4182} {"train_loss": -6.988566875457764, "global_step": 175663, "epoch": 4182} {"train_loss": -6.909256935119629, "global_step": 175664, "epoch": 4182} {"train_loss": -7.0411882400512695, "global_step": 175665, "epoch": 4182} {"train_loss": -7.000326156616211, "global_step": 175666, "epoch": 4182} {"train_loss": -7.00455904006958, "global_step": 175667, "epoch": 4182} {"train_loss": -7.054894924163818, "global_step": 175668, "epoch": 4182} {"train_loss": -6.948148727416992, "global_step": 175669, "epoch": 4182} {"train_loss": -7.112239837646484, "global_step": 175670, "epoch": 4182} {"train_loss": -7.142626762390137, "global_step": 175671, "epoch": 4182} {"train_loss": -7.0200042724609375, "global_step": 175672, "epoch": 4182} {"train_loss": -6.9927520751953125, "global_step": 175673, "epoch": 4182} {"train_loss": -7.0556111335754395, "global_step": 175674, "epoch": 4182} {"train_loss": -7.064881324768066, "global_step": 175675, "epoch": 4182} {"train_loss": -7.016017436981201, "global_step": 175676, "epoch": 4182} {"train_loss": -7.075268745422363, "global_step": 175677, "epoch": 4182} {"train_loss": -7.106826305389404, "global_step": 175678, "epoch": 4182} {"train_loss": -6.962316513061523, "global_step": 175679, "epoch": 4182} {"train_loss": -7.100725173950195, "global_step": 175680, "epoch": 4182} {"train_loss": -7.113389015197754, "global_step": 175681, "epoch": 4182} {"train_loss": -7.084247589111328, "global_step": 175682, "epoch": 4182} {"train_loss": -7.117447853088379, "global_step": 175683, "epoch": 4182} {"train_loss": -7.074069023132324, "global_step": 175684, "epoch": 4182} {"train_loss": -7.005905378432501, "global_step": 175685, "epoch": 4182, "val_loss": 68679.75} {"train_loss": -6.970556259155273, "global_step": 175686, "epoch": 4183} {"train_loss": -7.0473856925964355, "global_step": 175687, "epoch": 4183} {"train_loss": -7.08455753326416, "global_step": 175688, "epoch": 4183} {"train_loss": -7.0062479972839355, "global_step": 175689, "epoch": 4183} {"train_loss": -7.129280090332031, "global_step": 175690, "epoch": 4183} {"train_loss": -7.104819297790527, "global_step": 175691, "epoch": 4183} {"train_loss": -6.98406982421875, "global_step": 175692, "epoch": 4183} {"train_loss": -6.997139930725098, "global_step": 175693, "epoch": 4183} {"train_loss": -7.108009338378906, "global_step": 175694, "epoch": 4183} {"train_loss": -7.173842430114746, "global_step": 175695, "epoch": 4183} {"train_loss": -7.065755844116211, "global_step": 175696, "epoch": 4183} {"train_loss": -7.126350402832031, "global_step": 175697, "epoch": 4183} {"train_loss": -7.060970783233643, "global_step": 175698, "epoch": 4183} {"train_loss": -7.151599884033203, "global_step": 175699, "epoch": 4183} {"train_loss": -7.044711112976074, "global_step": 175700, "epoch": 4183} {"train_loss": -7.059213161468506, "global_step": 175701, "epoch": 4183} {"train_loss": -7.069281578063965, "global_step": 175702, "epoch": 4183} {"train_loss": -6.9985809326171875, "global_step": 175703, "epoch": 4183} {"train_loss": -7.093657493591309, "global_step": 175704, "epoch": 4183} {"train_loss": -7.030013561248779, "global_step": 175705, "epoch": 4183} {"train_loss": -7.178086280822754, "global_step": 175706, "epoch": 4183} {"train_loss": -7.051304817199707, "global_step": 175707, "epoch": 4183} {"train_loss": -7.106122970581055, "global_step": 175708, "epoch": 4183} {"train_loss": -7.097421646118164, "global_step": 175709, "epoch": 4183} {"train_loss": -7.088217258453369, "global_step": 175710, "epoch": 4183} {"train_loss": -6.996998310089111, "global_step": 175711, "epoch": 4183} {"train_loss": -7.144134521484375, "global_step": 175712, "epoch": 4183} {"train_loss": -7.080874443054199, "global_step": 175713, "epoch": 4183} {"train_loss": -6.945169448852539, "global_step": 175714, "epoch": 4183} {"train_loss": -7.171213626861572, "global_step": 175715, "epoch": 4183} {"train_loss": -7.146084785461426, "global_step": 175716, "epoch": 4183} {"train_loss": -7.003103256225586, "global_step": 175717, "epoch": 4183} {"train_loss": -6.943752765655518, "global_step": 175718, "epoch": 4183} {"train_loss": -7.1355719566345215, "global_step": 175719, "epoch": 4183} {"train_loss": -7.014558792114258, "global_step": 175720, "epoch": 4183} {"train_loss": -7.06249475479126, "global_step": 175721, "epoch": 4183} {"train_loss": -6.987846374511719, "global_step": 175722, "epoch": 4183} {"train_loss": -6.936282157897949, "global_step": 175723, "epoch": 4183} {"train_loss": -7.070304870605469, "global_step": 175724, "epoch": 4183} {"train_loss": -6.953322410583496, "global_step": 175725, "epoch": 4183} {"train_loss": -6.89927339553833, "global_step": 175726, "epoch": 4183} {"train_loss": -7.053694248199463, "global_step": 175727, "epoch": 4183, "val_loss": 68759.4921875} {"train_loss": -7.064379692077637, "global_step": 175728, "epoch": 4184} {"train_loss": -6.922511100769043, "global_step": 175729, "epoch": 4184} {"train_loss": -7.043523788452148, "global_step": 175730, "epoch": 4184} {"train_loss": -7.0378594398498535, "global_step": 175731, "epoch": 4184} {"train_loss": -6.938770294189453, "global_step": 175732, "epoch": 4184} {"train_loss": -6.9236249923706055, "global_step": 175733, "epoch": 4184} {"train_loss": -6.854060173034668, "global_step": 175734, "epoch": 4184} {"train_loss": -6.937661170959473, "global_step": 175735, "epoch": 4184} {"train_loss": -6.989446640014648, "global_step": 175736, "epoch": 4184} {"train_loss": -6.957385540008545, "global_step": 175737, "epoch": 4184} {"train_loss": -6.9774346351623535, "global_step": 175738, "epoch": 4184} {"train_loss": -6.931793689727783, "global_step": 175739, "epoch": 4184} {"train_loss": -6.998330116271973, "global_step": 175740, "epoch": 4184} {"train_loss": -6.781963348388672, "global_step": 175741, "epoch": 4184} {"train_loss": -7.007325649261475, "global_step": 175742, "epoch": 4184} {"train_loss": -6.856813430786133, "global_step": 175743, "epoch": 4184} {"train_loss": -6.973196029663086, "global_step": 175744, "epoch": 4184} {"train_loss": -6.975622177124023, "global_step": 175745, "epoch": 4184} {"train_loss": -6.909825325012207, "global_step": 175746, "epoch": 4184} {"train_loss": -7.006528854370117, "global_step": 175747, "epoch": 4184} {"train_loss": -6.838287830352783, "global_step": 175748, "epoch": 4184} {"train_loss": -6.961546897888184, "global_step": 175749, "epoch": 4184} {"train_loss": -6.845398902893066, "global_step": 175750, "epoch": 4184} {"train_loss": -6.951056957244873, "global_step": 175751, "epoch": 4184} {"train_loss": -7.00424861907959, "global_step": 175752, "epoch": 4184} {"train_loss": -6.926853179931641, "global_step": 175753, "epoch": 4184} {"train_loss": -6.8339643478393555, "global_step": 175754, "epoch": 4184} {"train_loss": -6.935006141662598, "global_step": 175755, "epoch": 4184} {"train_loss": -7.0277814865112305, "global_step": 175756, "epoch": 4184} {"train_loss": -6.896765232086182, "global_step": 175757, "epoch": 4184} {"train_loss": -6.9319376945495605, "global_step": 175758, "epoch": 4184} {"train_loss": -6.9398674964904785, "global_step": 175759, "epoch": 4184} {"train_loss": -6.8697967529296875, "global_step": 175760, "epoch": 4184} {"train_loss": -6.953912734985352, "global_step": 175761, "epoch": 4184} {"train_loss": -6.909991264343262, "global_step": 175762, "epoch": 4184} {"train_loss": -6.9984540939331055, "global_step": 175763, "epoch": 4184} {"train_loss": -7.0636091232299805, "global_step": 175764, "epoch": 4184} {"train_loss": -7.061912536621094, "global_step": 175765, "epoch": 4184} {"train_loss": -6.888203144073486, "global_step": 175766, "epoch": 4184} {"train_loss": -7.113404750823975, "global_step": 175767, "epoch": 4184} {"train_loss": -7.0656418800354, "global_step": 175768, "epoch": 4184} {"train_loss": -6.956818126496815, "global_step": 175769, "epoch": 4184, "val_loss": 68603.2109375} {"train_loss": -6.962321758270264, "global_step": 175770, "epoch": 4185} {"train_loss": -7.09495735168457, "global_step": 175771, "epoch": 4185} {"train_loss": -7.001923561096191, "global_step": 175772, "epoch": 4185} {"train_loss": -6.9980645179748535, "global_step": 175773, "epoch": 4185} {"train_loss": -7.028281211853027, "global_step": 175774, "epoch": 4185} {"train_loss": -6.996067047119141, "global_step": 175775, "epoch": 4185} {"train_loss": -6.973011016845703, "global_step": 175776, "epoch": 4185} {"train_loss": -7.0694780349731445, "global_step": 175777, "epoch": 4185} {"train_loss": -7.105124473571777, "global_step": 175778, "epoch": 4185} {"train_loss": -7.005887985229492, "global_step": 175779, "epoch": 4185} {"train_loss": -7.009922981262207, "global_step": 175780, "epoch": 4185} {"train_loss": -7.10576868057251, "global_step": 175781, "epoch": 4185} {"train_loss": -7.063967704772949, "global_step": 175782, "epoch": 4185} {"train_loss": -7.1139044761657715, "global_step": 175783, "epoch": 4185} {"train_loss": -7.04796028137207, "global_step": 175784, "epoch": 4185} {"train_loss": -7.149631500244141, "global_step": 175785, "epoch": 4185} {"train_loss": -6.991166114807129, "global_step": 175786, "epoch": 4185} {"train_loss": -7.113293647766113, "global_step": 175787, "epoch": 4185} {"train_loss": -6.983717918395996, "global_step": 175788, "epoch": 4185} {"train_loss": -7.10407018661499, "global_step": 175789, "epoch": 4185} {"train_loss": -7.017976760864258, "global_step": 175790, "epoch": 4185} {"train_loss": -7.062709331512451, "global_step": 175791, "epoch": 4185} {"train_loss": -7.185522556304932, "global_step": 175792, "epoch": 4185} {"train_loss": -7.040627956390381, "global_step": 175793, "epoch": 4185} {"train_loss": -7.015167236328125, "global_step": 175794, "epoch": 4185} {"train_loss": -7.1440558433532715, "global_step": 175795, "epoch": 4185} {"train_loss": -7.061220169067383, "global_step": 175796, "epoch": 4185} {"train_loss": -7.120227813720703, "global_step": 175797, "epoch": 4185} {"train_loss": -7.113473415374756, "global_step": 175798, "epoch": 4185} {"train_loss": -6.992338180541992, "global_step": 175799, "epoch": 4185} {"train_loss": -7.129435062408447, "global_step": 175800, "epoch": 4185} {"train_loss": -7.064010143280029, "global_step": 175801, "epoch": 4185} {"train_loss": -7.074665069580078, "global_step": 175802, "epoch": 4185} {"train_loss": -7.058676719665527, "global_step": 175803, "epoch": 4185} {"train_loss": -7.011622428894043, "global_step": 175804, "epoch": 4185} {"train_loss": -7.086688995361328, "global_step": 175805, "epoch": 4185} {"train_loss": -6.951321601867676, "global_step": 175806, "epoch": 4185} {"train_loss": -7.141895294189453, "global_step": 175807, "epoch": 4185} {"train_loss": -7.026537895202637, "global_step": 175808, "epoch": 4185} {"train_loss": -6.999977111816406, "global_step": 175809, "epoch": 4185} {"train_loss": -7.222558498382568, "global_step": 175810, "epoch": 4185} {"train_loss": -7.061474584397816, "global_step": 175811, "epoch": 4185, "val_loss": 68628.6328125} {"train_loss": -6.931436061859131, "global_step": 175812, "epoch": 4186} {"train_loss": -7.029211521148682, "global_step": 175813, "epoch": 4186} {"train_loss": -7.104495525360107, "global_step": 175814, "epoch": 4186} {"train_loss": -7.102628707885742, "global_step": 175815, "epoch": 4186} {"train_loss": -6.961261749267578, "global_step": 175816, "epoch": 4186} {"train_loss": -7.103643894195557, "global_step": 175817, "epoch": 4186} {"train_loss": -7.0904693603515625, "global_step": 175818, "epoch": 4186} {"train_loss": -7.006340980529785, "global_step": 175819, "epoch": 4186} {"train_loss": -7.013118267059326, "global_step": 175820, "epoch": 4186} {"train_loss": -7.150096893310547, "global_step": 175821, "epoch": 4186} {"train_loss": -7.041301727294922, "global_step": 175822, "epoch": 4186} {"train_loss": -7.005362033843994, "global_step": 175823, "epoch": 4186} {"train_loss": -7.011569499969482, "global_step": 175824, "epoch": 4186} {"train_loss": -7.001278877258301, "global_step": 175825, "epoch": 4186} {"train_loss": -7.054022789001465, "global_step": 175826, "epoch": 4186} {"train_loss": -7.049888610839844, "global_step": 175827, "epoch": 4186} {"train_loss": -6.921911716461182, "global_step": 175828, "epoch": 4186} {"train_loss": -6.935580730438232, "global_step": 175829, "epoch": 4186} {"train_loss": -7.029644012451172, "global_step": 175830, "epoch": 4186} {"train_loss": -6.958074569702148, "global_step": 175831, "epoch": 4186} {"train_loss": -7.052382946014404, "global_step": 175832, "epoch": 4186} {"train_loss": -7.168088912963867, "global_step": 175833, "epoch": 4186} {"train_loss": -6.925755500793457, "global_step": 175834, "epoch": 4186} {"train_loss": -7.04661750793457, "global_step": 175835, "epoch": 4186} {"train_loss": -7.0114665031433105, "global_step": 175836, "epoch": 4186} {"train_loss": -6.983192443847656, "global_step": 175837, "epoch": 4186} {"train_loss": -7.073020935058594, "global_step": 175838, "epoch": 4186} {"train_loss": -7.026826858520508, "global_step": 175839, "epoch": 4186} {"train_loss": -6.996809959411621, "global_step": 175840, "epoch": 4186} {"train_loss": -7.121527671813965, "global_step": 175841, "epoch": 4186} {"train_loss": -7.162426948547363, "global_step": 175842, "epoch": 4186} {"train_loss": -7.133390426635742, "global_step": 175843, "epoch": 4186} {"train_loss": -7.061275005340576, "global_step": 175844, "epoch": 4186} {"train_loss": -7.0484819412231445, "global_step": 175845, "epoch": 4186} {"train_loss": -7.02335262298584, "global_step": 175846, "epoch": 4186} {"train_loss": -7.076387405395508, "global_step": 175847, "epoch": 4186} {"train_loss": -7.04091215133667, "global_step": 175848, "epoch": 4186} {"train_loss": -7.015895843505859, "global_step": 175849, "epoch": 4186} {"train_loss": -7.041254043579102, "global_step": 175850, "epoch": 4186} {"train_loss": -6.913340091705322, "global_step": 175851, "epoch": 4186} {"train_loss": -7.050008296966553, "global_step": 175852, "epoch": 4186} {"train_loss": -7.0356450989132835, "global_step": 175853, "epoch": 4186, "val_loss": 68533.7578125} {"train_loss": -7.028517723083496, "global_step": 175854, "epoch": 4187} {"train_loss": -6.9241132736206055, "global_step": 175855, "epoch": 4187} {"train_loss": -7.0131378173828125, "global_step": 175856, "epoch": 4187} {"train_loss": -7.059145927429199, "global_step": 175857, "epoch": 4187} {"train_loss": -7.03531551361084, "global_step": 175858, "epoch": 4187} {"train_loss": -7.127312183380127, "global_step": 175859, "epoch": 4187} {"train_loss": -7.046816825866699, "global_step": 175860, "epoch": 4187} {"train_loss": -6.961907863616943, "global_step": 175861, "epoch": 4187} {"train_loss": -6.98262882232666, "global_step": 175862, "epoch": 4187} {"train_loss": -6.9935760498046875, "global_step": 175863, "epoch": 4187} {"train_loss": -7.0640082359313965, "global_step": 175864, "epoch": 4187} {"train_loss": -7.016225814819336, "global_step": 175865, "epoch": 4187} {"train_loss": -7.05772066116333, "global_step": 175866, "epoch": 4187} {"train_loss": -7.057809352874756, "global_step": 175867, "epoch": 4187} {"train_loss": -7.066323280334473, "global_step": 175868, "epoch": 4187} {"train_loss": -7.053432941436768, "global_step": 175869, "epoch": 4187} {"train_loss": -7.1536383628845215, "global_step": 175870, "epoch": 4187} {"train_loss": -7.143300533294678, "global_step": 175871, "epoch": 4187} {"train_loss": -7.12653923034668, "global_step": 175872, "epoch": 4187} {"train_loss": -7.128986835479736, "global_step": 175873, "epoch": 4187} {"train_loss": -7.052536964416504, "global_step": 175874, "epoch": 4187} {"train_loss": -7.134100914001465, "global_step": 175875, "epoch": 4187} {"train_loss": -7.05039644241333, "global_step": 175876, "epoch": 4187} {"train_loss": -7.062983512878418, "global_step": 175877, "epoch": 4187} {"train_loss": -7.079296112060547, "global_step": 175878, "epoch": 4187} {"train_loss": -7.061694145202637, "global_step": 175879, "epoch": 4187} {"train_loss": -7.028738498687744, "global_step": 175880, "epoch": 4187} {"train_loss": -6.9933342933654785, "global_step": 175881, "epoch": 4187} {"train_loss": -7.030848026275635, "global_step": 175882, "epoch": 4187} {"train_loss": -7.043109893798828, "global_step": 175883, "epoch": 4187} {"train_loss": -7.150389671325684, "global_step": 175884, "epoch": 4187} {"train_loss": -7.0808329582214355, "global_step": 175885, "epoch": 4187} {"train_loss": -7.069676399230957, "global_step": 175886, "epoch": 4187} {"train_loss": -7.038778781890869, "global_step": 175887, "epoch": 4187} {"train_loss": -6.909785270690918, "global_step": 175888, "epoch": 4187} {"train_loss": -6.967386245727539, "global_step": 175889, "epoch": 4187} {"train_loss": -7.220139980316162, "global_step": 175890, "epoch": 4187} {"train_loss": -6.937221527099609, "global_step": 175891, "epoch": 4187} {"train_loss": -6.896934986114502, "global_step": 175892, "epoch": 4187} {"train_loss": -7.150702476501465, "global_step": 175893, "epoch": 4187} {"train_loss": -7.109012126922607, "global_step": 175894, "epoch": 4187} {"train_loss": -7.05084186508542, "global_step": 175895, "epoch": 4187, "val_loss": 68790.9921875} {"train_loss": -7.178178787231445, "global_step": 175896, "epoch": 4188} {"train_loss": -7.023418426513672, "global_step": 175897, "epoch": 4188} {"train_loss": -7.011967182159424, "global_step": 175898, "epoch": 4188} {"train_loss": -7.029904365539551, "global_step": 175899, "epoch": 4188} {"train_loss": -7.15211296081543, "global_step": 175900, "epoch": 4188} {"train_loss": -6.959580421447754, "global_step": 175901, "epoch": 4188} {"train_loss": -7.046321392059326, "global_step": 175902, "epoch": 4188} {"train_loss": -7.089125633239746, "global_step": 175903, "epoch": 4188} {"train_loss": -7.142657279968262, "global_step": 175904, "epoch": 4188} {"train_loss": -6.964654922485352, "global_step": 175905, "epoch": 4188} {"train_loss": -7.121294021606445, "global_step": 175906, "epoch": 4188} {"train_loss": -7.053414821624756, "global_step": 175907, "epoch": 4188} {"train_loss": -6.971554756164551, "global_step": 175908, "epoch": 4188} {"train_loss": -6.983240604400635, "global_step": 175909, "epoch": 4188} {"train_loss": -6.988628387451172, "global_step": 175910, "epoch": 4188} {"train_loss": -7.03415584564209, "global_step": 175911, "epoch": 4188} {"train_loss": -7.027602195739746, "global_step": 175912, "epoch": 4188} {"train_loss": -7.137754440307617, "global_step": 175913, "epoch": 4188} {"train_loss": -7.074236869812012, "global_step": 175914, "epoch": 4188} {"train_loss": -7.152861595153809, "global_step": 175915, "epoch": 4188} {"train_loss": -7.03536319732666, "global_step": 175916, "epoch": 4188} {"train_loss": -7.03254508972168, "global_step": 175917, "epoch": 4188} {"train_loss": -7.065849304199219, "global_step": 175918, "epoch": 4188} {"train_loss": -7.009408950805664, "global_step": 175919, "epoch": 4188} {"train_loss": -7.0771803855896, "global_step": 175920, "epoch": 4188} {"train_loss": -7.164970397949219, "global_step": 175921, "epoch": 4188} {"train_loss": -7.00614070892334, "global_step": 175922, "epoch": 4188} {"train_loss": -6.954591274261475, "global_step": 175923, "epoch": 4188} {"train_loss": -6.9404473304748535, "global_step": 175924, "epoch": 4188} {"train_loss": -6.9996256828308105, "global_step": 175925, "epoch": 4188} {"train_loss": -7.0450897216796875, "global_step": 175926, "epoch": 4188} {"train_loss": -7.020847320556641, "global_step": 175927, "epoch": 4188} {"train_loss": -6.93778133392334, "global_step": 175928, "epoch": 4188} {"train_loss": -7.022811412811279, "global_step": 175929, "epoch": 4188} {"train_loss": -7.153303623199463, "global_step": 175930, "epoch": 4188} {"train_loss": -6.964977264404297, "global_step": 175931, "epoch": 4188} {"train_loss": -7.058040618896484, "global_step": 175932, "epoch": 4188} {"train_loss": -7.124582290649414, "global_step": 175933, "epoch": 4188} {"train_loss": -6.969493865966797, "global_step": 175934, "epoch": 4188} {"train_loss": -6.9798455238342285, "global_step": 175935, "epoch": 4188} {"train_loss": -6.982859134674072, "global_step": 175936, "epoch": 4188} {"train_loss": -7.041196164630708, "global_step": 175937, "epoch": 4188, "val_loss": 68733.359375} {"train_loss": -7.127552032470703, "global_step": 175938, "epoch": 4189} {"train_loss": -6.985437393188477, "global_step": 175939, "epoch": 4189} {"train_loss": -7.026461601257324, "global_step": 175940, "epoch": 4189} {"train_loss": -7.011897087097168, "global_step": 175941, "epoch": 4189} {"train_loss": -6.976635932922363, "global_step": 175942, "epoch": 4189} {"train_loss": -6.958277702331543, "global_step": 175943, "epoch": 4189} {"train_loss": -7.0494160652160645, "global_step": 175944, "epoch": 4189} {"train_loss": -7.032087326049805, "global_step": 175945, "epoch": 4189} {"train_loss": -7.00904655456543, "global_step": 175946, "epoch": 4189} {"train_loss": -7.010443687438965, "global_step": 175947, "epoch": 4189} {"train_loss": -7.074985027313232, "global_step": 175948, "epoch": 4189} {"train_loss": -7.000502109527588, "global_step": 175949, "epoch": 4189} {"train_loss": -6.905106544494629, "global_step": 175950, "epoch": 4189} {"train_loss": -6.960012435913086, "global_step": 175951, "epoch": 4189} {"train_loss": -7.056718826293945, "global_step": 175952, "epoch": 4189} {"train_loss": -7.054289817810059, "global_step": 175953, "epoch": 4189} {"train_loss": -7.054174423217773, "global_step": 175954, "epoch": 4189} {"train_loss": -6.94154167175293, "global_step": 175955, "epoch": 4189} {"train_loss": -7.059272766113281, "global_step": 175956, "epoch": 4189} {"train_loss": -7.016796112060547, "global_step": 175957, "epoch": 4189} {"train_loss": -7.100889682769775, "global_step": 175958, "epoch": 4189} {"train_loss": -7.050162315368652, "global_step": 175959, "epoch": 4189} {"train_loss": -6.998401641845703, "global_step": 175960, "epoch": 4189} {"train_loss": -7.067208766937256, "global_step": 175961, "epoch": 4189} {"train_loss": -7.072562217712402, "global_step": 175962, "epoch": 4189} {"train_loss": -6.835951805114746, "global_step": 175963, "epoch": 4189} {"train_loss": -6.88081693649292, "global_step": 175964, "epoch": 4189} {"train_loss": -7.045017242431641, "global_step": 175965, "epoch": 4189} {"train_loss": -6.954980373382568, "global_step": 175966, "epoch": 4189} {"train_loss": -6.970127105712891, "global_step": 175967, "epoch": 4189} {"train_loss": -6.938925266265869, "global_step": 175968, "epoch": 4189} {"train_loss": -6.9788641929626465, "global_step": 175969, "epoch": 4189} {"train_loss": -7.000081539154053, "global_step": 175970, "epoch": 4189} {"train_loss": -7.033499717712402, "global_step": 175971, "epoch": 4189} {"train_loss": -6.933781147003174, "global_step": 175972, "epoch": 4189} {"train_loss": -7.039556980133057, "global_step": 175973, "epoch": 4189} {"train_loss": -6.976776123046875, "global_step": 175974, "epoch": 4189} {"train_loss": -7.075826644897461, "global_step": 175975, "epoch": 4189} {"train_loss": -6.842367172241211, "global_step": 175976, "epoch": 4189} {"train_loss": -7.059981346130371, "global_step": 175977, "epoch": 4189} {"train_loss": -6.938991546630859, "global_step": 175978, "epoch": 4189} {"train_loss": -7.002717370078678, "global_step": 175979, "epoch": 4189, "val_loss": 68700.6328125} {"train_loss": -6.979849815368652, "global_step": 175980, "epoch": 4190} {"train_loss": -7.104389190673828, "global_step": 175981, "epoch": 4190} {"train_loss": -7.111049175262451, "global_step": 175982, "epoch": 4190} {"train_loss": -7.009556293487549, "global_step": 175983, "epoch": 4190} {"train_loss": -7.052454948425293, "global_step": 175984, "epoch": 4190} {"train_loss": -6.986394882202148, "global_step": 175985, "epoch": 4190} {"train_loss": -7.090827941894531, "global_step": 175986, "epoch": 4190} {"train_loss": -7.029921531677246, "global_step": 175987, "epoch": 4190} {"train_loss": -6.964937210083008, "global_step": 175988, "epoch": 4190} {"train_loss": -6.978590965270996, "global_step": 175989, "epoch": 4190} {"train_loss": -7.126564025878906, "global_step": 175990, "epoch": 4190} {"train_loss": -6.969954013824463, "global_step": 175991, "epoch": 4190} {"train_loss": -7.083540916442871, "global_step": 175992, "epoch": 4190} {"train_loss": -6.985591888427734, "global_step": 175993, "epoch": 4190} {"train_loss": -7.0604448318481445, "global_step": 175994, "epoch": 4190} {"train_loss": -7.1518874168396, "global_step": 175995, "epoch": 4190} {"train_loss": -7.143817901611328, "global_step": 175996, "epoch": 4190} {"train_loss": -7.092817306518555, "global_step": 175997, "epoch": 4190} {"train_loss": -7.074249267578125, "global_step": 175998, "epoch": 4190} {"train_loss": -7.0649495124816895, "global_step": 175999, "epoch": 4190} {"train_loss": -7.044131278991699, "global_step": 176000, "epoch": 4190} {"train_loss": -7.026996612548828, "global_step": 176001, "epoch": 4190} {"train_loss": -7.0393242835998535, "global_step": 176002, "epoch": 4190} {"train_loss": -7.027378082275391, "global_step": 176003, "epoch": 4190} {"train_loss": -7.073592185974121, "global_step": 176004, "epoch": 4190} {"train_loss": -6.937464714050293, "global_step": 176005, "epoch": 4190} {"train_loss": -6.967474937438965, "global_step": 176006, "epoch": 4190} {"train_loss": -7.043977737426758, "global_step": 176007, "epoch": 4190} {"train_loss": -6.9537553787231445, "global_step": 176008, "epoch": 4190} {"train_loss": -7.025189399719238, "global_step": 176009, "epoch": 4190} {"train_loss": -7.017833709716797, "global_step": 176010, "epoch": 4190} {"train_loss": -6.970385551452637, "global_step": 176011, "epoch": 4190} {"train_loss": -6.942080497741699, "global_step": 176012, "epoch": 4190} {"train_loss": -7.008113384246826, "global_step": 176013, "epoch": 4190} {"train_loss": -6.848964691162109, "global_step": 176014, "epoch": 4190} {"train_loss": -6.98640251159668, "global_step": 176015, "epoch": 4190} {"train_loss": -6.968541145324707, "global_step": 176016, "epoch": 4190} {"train_loss": -7.023738861083984, "global_step": 176017, "epoch": 4190} {"train_loss": -6.955718040466309, "global_step": 176018, "epoch": 4190} {"train_loss": -7.0670013427734375, "global_step": 176019, "epoch": 4190} {"train_loss": -6.950849533081055, "global_step": 176020, "epoch": 4190} {"train_loss": -7.02201737676348, "global_step": 176021, "epoch": 4190, "val_loss": 68664.9921875} {"train_loss": -7.0089335441589355, "global_step": 176022, "epoch": 4191} {"train_loss": -6.911396026611328, "global_step": 176023, "epoch": 4191} {"train_loss": -6.986394882202148, "global_step": 176024, "epoch": 4191} {"train_loss": -6.993046760559082, "global_step": 176025, "epoch": 4191} {"train_loss": -7.123470306396484, "global_step": 176026, "epoch": 4191} {"train_loss": -7.063350677490234, "global_step": 176027, "epoch": 4191} {"train_loss": -6.888206481933594, "global_step": 176028, "epoch": 4191} {"train_loss": -6.897493362426758, "global_step": 176029, "epoch": 4191} {"train_loss": -7.032191276550293, "global_step": 176030, "epoch": 4191} {"train_loss": -7.011686325073242, "global_step": 176031, "epoch": 4191} {"train_loss": -6.997598648071289, "global_step": 176032, "epoch": 4191} {"train_loss": -7.1767072677612305, "global_step": 176033, "epoch": 4191} {"train_loss": -6.933732032775879, "global_step": 176034, "epoch": 4191} {"train_loss": -7.075142860412598, "global_step": 176035, "epoch": 4191} {"train_loss": -7.091535568237305, "global_step": 176036, "epoch": 4191} {"train_loss": -6.98233699798584, "global_step": 176037, "epoch": 4191} {"train_loss": -7.08845329284668, "global_step": 176038, "epoch": 4191} {"train_loss": -6.953375816345215, "global_step": 176039, "epoch": 4191} {"train_loss": -6.890739440917969, "global_step": 176040, "epoch": 4191} {"train_loss": -7.049776077270508, "global_step": 176041, "epoch": 4191} {"train_loss": -7.095776557922363, "global_step": 176042, "epoch": 4191} {"train_loss": -7.084362983703613, "global_step": 176043, "epoch": 4191} {"train_loss": -7.079150199890137, "global_step": 176044, "epoch": 4191} {"train_loss": -7.014995098114014, "global_step": 176045, "epoch": 4191} {"train_loss": -7.1071062088012695, "global_step": 176046, "epoch": 4191} {"train_loss": -7.137116432189941, "global_step": 176047, "epoch": 4191} {"train_loss": -7.051363945007324, "global_step": 176048, "epoch": 4191} {"train_loss": -7.164403915405273, "global_step": 176049, "epoch": 4191} {"train_loss": -7.027751445770264, "global_step": 176050, "epoch": 4191} {"train_loss": -6.956905364990234, "global_step": 176051, "epoch": 4191} {"train_loss": -7.188753604888916, "global_step": 176052, "epoch": 4191} {"train_loss": -7.1019182205200195, "global_step": 176053, "epoch": 4191} {"train_loss": -7.117165565490723, "global_step": 176054, "epoch": 4191} {"train_loss": -7.155160903930664, "global_step": 176055, "epoch": 4191} {"train_loss": -7.225590705871582, "global_step": 176056, "epoch": 4191} {"train_loss": -7.033514022827148, "global_step": 176057, "epoch": 4191} {"train_loss": -7.111950397491455, "global_step": 176058, "epoch": 4191} {"train_loss": -7.088560581207275, "global_step": 176059, "epoch": 4191} {"train_loss": -7.125458717346191, "global_step": 176060, "epoch": 4191} {"train_loss": -7.079300880432129, "global_step": 176061, "epoch": 4191} {"train_loss": -7.0306501388549805, "global_step": 176062, "epoch": 4191} {"train_loss": -7.05613062495277, "global_step": 176063, "epoch": 4191, "val_loss": 68725.0234375} {"train_loss": -7.091496467590332, "global_step": 176064, "epoch": 4192} {"train_loss": -7.122840881347656, "global_step": 176065, "epoch": 4192} {"train_loss": -7.172238826751709, "global_step": 176066, "epoch": 4192} {"train_loss": -7.064316749572754, "global_step": 176067, "epoch": 4192} {"train_loss": -7.092041969299316, "global_step": 176068, "epoch": 4192} {"train_loss": -7.0854620933532715, "global_step": 176069, "epoch": 4192} {"train_loss": -7.110930442810059, "global_step": 176070, "epoch": 4192} {"train_loss": -7.161642074584961, "global_step": 176071, "epoch": 4192} {"train_loss": -7.099035263061523, "global_step": 176072, "epoch": 4192} {"train_loss": -7.106094837188721, "global_step": 176073, "epoch": 4192} {"train_loss": -6.951262474060059, "global_step": 176074, "epoch": 4192} {"train_loss": -7.107503414154053, "global_step": 176075, "epoch": 4192} {"train_loss": -6.9913716316223145, "global_step": 176076, "epoch": 4192} {"train_loss": -7.121367454528809, "global_step": 176077, "epoch": 4192} {"train_loss": -7.106542587280273, "global_step": 176078, "epoch": 4192} {"train_loss": -6.868137836456299, "global_step": 176079, "epoch": 4192} {"train_loss": -6.920937538146973, "global_step": 176080, "epoch": 4192} {"train_loss": -6.927425384521484, "global_step": 176081, "epoch": 4192} {"train_loss": -7.076862335205078, "global_step": 176082, "epoch": 4192} {"train_loss": -7.143923759460449, "global_step": 176083, "epoch": 4192} {"train_loss": -7.052056312561035, "global_step": 176084, "epoch": 4192} {"train_loss": -7.08375883102417, "global_step": 176085, "epoch": 4192} {"train_loss": -7.057326793670654, "global_step": 176086, "epoch": 4192} {"train_loss": -6.924685478210449, "global_step": 176087, "epoch": 4192} {"train_loss": -7.037567138671875, "global_step": 176088, "epoch": 4192} {"train_loss": -7.014759063720703, "global_step": 176089, "epoch": 4192} {"train_loss": -7.077646255493164, "global_step": 176090, "epoch": 4192} {"train_loss": -7.132916450500488, "global_step": 176091, "epoch": 4192} {"train_loss": -7.070126533508301, "global_step": 176092, "epoch": 4192} {"train_loss": -7.111164093017578, "global_step": 176093, "epoch": 4192} {"train_loss": -7.100082874298096, "global_step": 176094, "epoch": 4192} {"train_loss": -6.9845123291015625, "global_step": 176095, "epoch": 4192} {"train_loss": -7.069830417633057, "global_step": 176096, "epoch": 4192} {"train_loss": -7.055058002471924, "global_step": 176097, "epoch": 4192} {"train_loss": -7.017359256744385, "global_step": 176098, "epoch": 4192} {"train_loss": -7.035651206970215, "global_step": 176099, "epoch": 4192} {"train_loss": -7.130288600921631, "global_step": 176100, "epoch": 4192} {"train_loss": -6.979753017425537, "global_step": 176101, "epoch": 4192} {"train_loss": -6.956186294555664, "global_step": 176102, "epoch": 4192} {"train_loss": -7.048378944396973, "global_step": 176103, "epoch": 4192} {"train_loss": -6.7505645751953125, "global_step": 176104, "epoch": 4192} {"train_loss": -7.046611297698248, "global_step": 176105, "epoch": 4192, "val_loss": 68713.640625} {"train_loss": -6.9468231201171875, "global_step": 176106, "epoch": 4193} {"train_loss": -6.755226135253906, "global_step": 176107, "epoch": 4193} {"train_loss": -7.10008430480957, "global_step": 176108, "epoch": 4193} {"train_loss": -6.748748302459717, "global_step": 176109, "epoch": 4193} {"train_loss": -7.150051116943359, "global_step": 176110, "epoch": 4193} {"train_loss": -6.973555564880371, "global_step": 176111, "epoch": 4193} {"train_loss": -6.816874027252197, "global_step": 176112, "epoch": 4193} {"train_loss": -6.827767372131348, "global_step": 176113, "epoch": 4193} {"train_loss": -6.830068588256836, "global_step": 176114, "epoch": 4193} {"train_loss": -7.027770519256592, "global_step": 176115, "epoch": 4193} {"train_loss": -6.9900336265563965, "global_step": 176116, "epoch": 4193} {"train_loss": -6.972347736358643, "global_step": 176117, "epoch": 4193} {"train_loss": -6.866665363311768, "global_step": 176118, "epoch": 4193} {"train_loss": -7.011343955993652, "global_step": 176119, "epoch": 4193} {"train_loss": -7.064069747924805, "global_step": 176120, "epoch": 4193} {"train_loss": -6.925677299499512, "global_step": 176121, "epoch": 4193} {"train_loss": -6.978687763214111, "global_step": 176122, "epoch": 4193} {"train_loss": -7.00325870513916, "global_step": 176123, "epoch": 4193} {"train_loss": -6.96182918548584, "global_step": 176124, "epoch": 4193} {"train_loss": -7.089869499206543, "global_step": 176125, "epoch": 4193} {"train_loss": -7.183030605316162, "global_step": 176126, "epoch": 4193} {"train_loss": -7.025665283203125, "global_step": 176127, "epoch": 4193} {"train_loss": -7.109206199645996, "global_step": 176128, "epoch": 4193} {"train_loss": -7.031274795532227, "global_step": 176129, "epoch": 4193} {"train_loss": -7.069034099578857, "global_step": 176130, "epoch": 4193} {"train_loss": -7.056673049926758, "global_step": 176131, "epoch": 4193} {"train_loss": -7.19912052154541, "global_step": 176132, "epoch": 4193} {"train_loss": -7.070094108581543, "global_step": 176133, "epoch": 4193} {"train_loss": -7.090473175048828, "global_step": 176134, "epoch": 4193} {"train_loss": -7.157915115356445, "global_step": 176135, "epoch": 4193} {"train_loss": -7.038208961486816, "global_step": 176136, "epoch": 4193} {"train_loss": -6.9748759269714355, "global_step": 176137, "epoch": 4193} {"train_loss": -7.037652969360352, "global_step": 176138, "epoch": 4193} {"train_loss": -7.077425956726074, "global_step": 176139, "epoch": 4193} {"train_loss": -7.1228179931640625, "global_step": 176140, "epoch": 4193} {"train_loss": -7.103776931762695, "global_step": 176141, "epoch": 4193} {"train_loss": -7.13115119934082, "global_step": 176142, "epoch": 4193} {"train_loss": -7.1263041496276855, "global_step": 176143, "epoch": 4193} {"train_loss": -7.082993507385254, "global_step": 176144, "epoch": 4193} {"train_loss": -7.053339004516602, "global_step": 176145, "epoch": 4193} {"train_loss": -7.128023147583008, "global_step": 176146, "epoch": 4193} {"train_loss": -7.019811641602289, "global_step": 176147, "epoch": 4193, "val_loss": 68612.4140625} {"train_loss": -7.107035160064697, "global_step": 176148, "epoch": 4194} {"train_loss": -7.083312034606934, "global_step": 176149, "epoch": 4194} {"train_loss": -6.8627238273620605, "global_step": 176150, "epoch": 4194} {"train_loss": -6.949244976043701, "global_step": 176151, "epoch": 4194} {"train_loss": -6.994864463806152, "global_step": 176152, "epoch": 4194} {"train_loss": -6.978473663330078, "global_step": 176153, "epoch": 4194} {"train_loss": -6.9632768630981445, "global_step": 176154, "epoch": 4194} {"train_loss": -6.789611339569092, "global_step": 176155, "epoch": 4194} {"train_loss": -7.017197608947754, "global_step": 176156, "epoch": 4194} {"train_loss": -7.163481712341309, "global_step": 176157, "epoch": 4194} {"train_loss": -6.915684223175049, "global_step": 176158, "epoch": 4194} {"train_loss": -6.980551719665527, "global_step": 176159, "epoch": 4194} {"train_loss": -6.935806751251221, "global_step": 176160, "epoch": 4194} {"train_loss": -7.0670695304870605, "global_step": 176161, "epoch": 4194} {"train_loss": -7.0661725997924805, "global_step": 176162, "epoch": 4194} {"train_loss": -6.979625225067139, "global_step": 176163, "epoch": 4194} {"train_loss": -7.090802192687988, "global_step": 176164, "epoch": 4194} {"train_loss": -6.978863716125488, "global_step": 176165, "epoch": 4194} {"train_loss": -6.937398910522461, "global_step": 176166, "epoch": 4194} {"train_loss": -7.059391975402832, "global_step": 176167, "epoch": 4194} {"train_loss": -6.912249565124512, "global_step": 176168, "epoch": 4194} {"train_loss": -7.14326286315918, "global_step": 176169, "epoch": 4194} {"train_loss": -6.994582176208496, "global_step": 176170, "epoch": 4194} {"train_loss": -6.985877990722656, "global_step": 176171, "epoch": 4194} {"train_loss": -6.867791175842285, "global_step": 176172, "epoch": 4194} {"train_loss": -6.901325225830078, "global_step": 176173, "epoch": 4194} {"train_loss": -7.088790416717529, "global_step": 176174, "epoch": 4194} {"train_loss": -6.979310035705566, "global_step": 176175, "epoch": 4194} {"train_loss": -7.022949695587158, "global_step": 176176, "epoch": 4194} {"train_loss": -6.893202781677246, "global_step": 176177, "epoch": 4194} {"train_loss": -6.997613430023193, "global_step": 176178, "epoch": 4194} {"train_loss": -7.02896785736084, "global_step": 176179, "epoch": 4194} {"train_loss": -7.020602226257324, "global_step": 176180, "epoch": 4194} {"train_loss": -6.9289093017578125, "global_step": 176181, "epoch": 4194} {"train_loss": -6.974289417266846, "global_step": 176182, "epoch": 4194} {"train_loss": -6.807367324829102, "global_step": 176183, "epoch": 4194} {"train_loss": -7.025513648986816, "global_step": 176184, "epoch": 4194} {"train_loss": -6.9615278244018555, "global_step": 176185, "epoch": 4194} {"train_loss": -6.921657562255859, "global_step": 176186, "epoch": 4194} {"train_loss": -6.91041374206543, "global_step": 176187, "epoch": 4194} {"train_loss": -6.897820472717285, "global_step": 176188, "epoch": 4194} {"train_loss": -6.979084673381987, "global_step": 176189, "epoch": 4194, "val_loss": 68729.4609375} {"train_loss": -6.944545745849609, "global_step": 176190, "epoch": 4195} {"train_loss": -6.98538875579834, "global_step": 176191, "epoch": 4195} {"train_loss": -6.9253621101379395, "global_step": 176192, "epoch": 4195} {"train_loss": -6.943461894989014, "global_step": 176193, "epoch": 4195} {"train_loss": -6.957500457763672, "global_step": 176194, "epoch": 4195} {"train_loss": -6.928856372833252, "global_step": 176195, "epoch": 4195} {"train_loss": -7.008330345153809, "global_step": 176196, "epoch": 4195} {"train_loss": -7.047755241394043, "global_step": 176197, "epoch": 4195} {"train_loss": -6.995538711547852, "global_step": 176198, "epoch": 4195} {"train_loss": -7.010437488555908, "global_step": 176199, "epoch": 4195} {"train_loss": -7.022366523742676, "global_step": 176200, "epoch": 4195} {"train_loss": -7.134077548980713, "global_step": 176201, "epoch": 4195} {"train_loss": -7.046351432800293, "global_step": 176202, "epoch": 4195} {"train_loss": -6.986296653747559, "global_step": 176203, "epoch": 4195} {"train_loss": -7.059484481811523, "global_step": 176204, "epoch": 4195} {"train_loss": -6.971640110015869, "global_step": 176205, "epoch": 4195} {"train_loss": -7.051942348480225, "global_step": 176206, "epoch": 4195} {"train_loss": -7.005956649780273, "global_step": 176207, "epoch": 4195} {"train_loss": -7.03084659576416, "global_step": 176208, "epoch": 4195} {"train_loss": -7.073958873748779, "global_step": 176209, "epoch": 4195} {"train_loss": -7.201824188232422, "global_step": 176210, "epoch": 4195} {"train_loss": -7.0474443435668945, "global_step": 176211, "epoch": 4195} {"train_loss": -7.147708415985107, "global_step": 176212, "epoch": 4195} {"train_loss": -7.031404972076416, "global_step": 176213, "epoch": 4195} {"train_loss": -7.040853500366211, "global_step": 176214, "epoch": 4195} {"train_loss": -7.120091915130615, "global_step": 176215, "epoch": 4195} {"train_loss": -7.067845344543457, "global_step": 176216, "epoch": 4195} {"train_loss": -7.056209087371826, "global_step": 176217, "epoch": 4195} {"train_loss": -7.0834736824035645, "global_step": 176218, "epoch": 4195} {"train_loss": -7.110253810882568, "global_step": 176219, "epoch": 4195} {"train_loss": -7.092098712921143, "global_step": 176220, "epoch": 4195} {"train_loss": -7.0889081954956055, "global_step": 176221, "epoch": 4195} {"train_loss": -6.96817684173584, "global_step": 176222, "epoch": 4195} {"train_loss": -7.121829986572266, "global_step": 176223, "epoch": 4195} {"train_loss": -7.071627616882324, "global_step": 176224, "epoch": 4195} {"train_loss": -7.1005072593688965, "global_step": 176225, "epoch": 4195} {"train_loss": -7.036174774169922, "global_step": 176226, "epoch": 4195} {"train_loss": -6.955275535583496, "global_step": 176227, "epoch": 4195} {"train_loss": -7.079819679260254, "global_step": 176228, "epoch": 4195} {"train_loss": -7.059004783630371, "global_step": 176229, "epoch": 4195} {"train_loss": -7.116346836090088, "global_step": 176230, "epoch": 4195} {"train_loss": -7.043576297305879, "global_step": 176231, "epoch": 4195, "val_loss": 68696.6640625} {"train_loss": -7.001585960388184, "global_step": 176232, "epoch": 4196} {"train_loss": -6.93000602722168, "global_step": 176233, "epoch": 4196} {"train_loss": -7.131189346313477, "global_step": 176234, "epoch": 4196} {"train_loss": -7.0584001541137695, "global_step": 176235, "epoch": 4196} {"train_loss": -7.048468589782715, "global_step": 176236, "epoch": 4196} {"train_loss": -6.958235740661621, "global_step": 176237, "epoch": 4196} {"train_loss": -7.023495674133301, "global_step": 176238, "epoch": 4196} {"train_loss": -6.971953392028809, "global_step": 176239, "epoch": 4196} {"train_loss": -6.939223289489746, "global_step": 176240, "epoch": 4196} {"train_loss": -7.018080234527588, "global_step": 176241, "epoch": 4196} {"train_loss": -7.03650426864624, "global_step": 176242, "epoch": 4196} {"train_loss": -7.0668134689331055, "global_step": 176243, "epoch": 4196} {"train_loss": -7.029442310333252, "global_step": 176244, "epoch": 4196} {"train_loss": -6.996895790100098, "global_step": 176245, "epoch": 4196} {"train_loss": -7.099520683288574, "global_step": 176246, "epoch": 4196} {"train_loss": -7.011397361755371, "global_step": 176247, "epoch": 4196} {"train_loss": -7.020624160766602, "global_step": 176248, "epoch": 4196} {"train_loss": -7.004382610321045, "global_step": 176249, "epoch": 4196} {"train_loss": -7.03529167175293, "global_step": 176250, "epoch": 4196} {"train_loss": -7.005247116088867, "global_step": 176251, "epoch": 4196} {"train_loss": -6.987179279327393, "global_step": 176252, "epoch": 4196} {"train_loss": -7.128773212432861, "global_step": 176253, "epoch": 4196} {"train_loss": -7.004573822021484, "global_step": 176254, "epoch": 4196} {"train_loss": -6.949151039123535, "global_step": 176255, "epoch": 4196} {"train_loss": -7.093750953674316, "global_step": 176256, "epoch": 4196} {"train_loss": -7.026966571807861, "global_step": 176257, "epoch": 4196} {"train_loss": -7.08814811706543, "global_step": 176258, "epoch": 4196} {"train_loss": -7.11842679977417, "global_step": 176259, "epoch": 4196} {"train_loss": -7.096197605133057, "global_step": 176260, "epoch": 4196} {"train_loss": -7.137706756591797, "global_step": 176261, "epoch": 4196} {"train_loss": -7.02165412902832, "global_step": 176262, "epoch": 4196} {"train_loss": -7.201596736907959, "global_step": 176263, "epoch": 4196} {"train_loss": -7.06053352355957, "global_step": 176264, "epoch": 4196} {"train_loss": -7.170798301696777, "global_step": 176265, "epoch": 4196} {"train_loss": -7.064224720001221, "global_step": 176266, "epoch": 4196} {"train_loss": -7.120891094207764, "global_step": 176267, "epoch": 4196} {"train_loss": -7.102653503417969, "global_step": 176268, "epoch": 4196} {"train_loss": -7.056032180786133, "global_step": 176269, "epoch": 4196} {"train_loss": -7.023850440979004, "global_step": 176270, "epoch": 4196} {"train_loss": -6.962273597717285, "global_step": 176271, "epoch": 4196} {"train_loss": -7.085592269897461, "global_step": 176272, "epoch": 4196} {"train_loss": -7.047361373901367, "global_step": 176273, "epoch": 4196, "val_loss": 68672.2734375} {"train_loss": -7.067326545715332, "global_step": 176274, "epoch": 4197} {"train_loss": -7.056342601776123, "global_step": 176275, "epoch": 4197} {"train_loss": -7.146204948425293, "global_step": 176276, "epoch": 4197} {"train_loss": -7.096520900726318, "global_step": 176277, "epoch": 4197} {"train_loss": -7.05487060546875, "global_step": 176278, "epoch": 4197} {"train_loss": -7.081368446350098, "global_step": 176279, "epoch": 4197} {"train_loss": -6.980513095855713, "global_step": 176280, "epoch": 4197} {"train_loss": -6.998879909515381, "global_step": 176281, "epoch": 4197} {"train_loss": -6.926013946533203, "global_step": 176282, "epoch": 4197} {"train_loss": -7.054864883422852, "global_step": 176283, "epoch": 4197} {"train_loss": -7.074165344238281, "global_step": 176284, "epoch": 4197} {"train_loss": -7.044980049133301, "global_step": 176285, "epoch": 4197} {"train_loss": -6.703499794006348, "global_step": 176286, "epoch": 4197} {"train_loss": -7.011363983154297, "global_step": 176287, "epoch": 4197} {"train_loss": -6.940025329589844, "global_step": 176288, "epoch": 4197} {"train_loss": -7.001425266265869, "global_step": 176289, "epoch": 4197} {"train_loss": -7.080076694488525, "global_step": 176290, "epoch": 4197} {"train_loss": -6.926220893859863, "global_step": 176291, "epoch": 4197} {"train_loss": -7.006223201751709, "global_step": 176292, "epoch": 4197} {"train_loss": -6.979392051696777, "global_step": 176293, "epoch": 4197} {"train_loss": -6.916587829589844, "global_step": 176294, "epoch": 4197} {"train_loss": -7.080831050872803, "global_step": 176295, "epoch": 4197} {"train_loss": -6.880720138549805, "global_step": 176296, "epoch": 4197} {"train_loss": -7.020092964172363, "global_step": 176297, "epoch": 4197} {"train_loss": -6.99073600769043, "global_step": 176298, "epoch": 4197} {"train_loss": -6.957098960876465, "global_step": 176299, "epoch": 4197} {"train_loss": -6.9972052574157715, "global_step": 176300, "epoch": 4197} {"train_loss": -6.956214904785156, "global_step": 176301, "epoch": 4197} {"train_loss": -7.012163162231445, "global_step": 176302, "epoch": 4197} {"train_loss": -6.876733779907227, "global_step": 176303, "epoch": 4197} {"train_loss": -7.078603267669678, "global_step": 176304, "epoch": 4197} {"train_loss": -7.069248676300049, "global_step": 176305, "epoch": 4197} {"train_loss": -6.973891735076904, "global_step": 176306, "epoch": 4197} {"train_loss": -7.058646202087402, "global_step": 176307, "epoch": 4197} {"train_loss": -7.073025703430176, "global_step": 176308, "epoch": 4197} {"train_loss": -7.069575786590576, "global_step": 176309, "epoch": 4197} {"train_loss": -6.954785346984863, "global_step": 176310, "epoch": 4197} {"train_loss": -7.008986473083496, "global_step": 176311, "epoch": 4197} {"train_loss": -7.07602596282959, "global_step": 176312, "epoch": 4197} {"train_loss": -6.999055862426758, "global_step": 176313, "epoch": 4197} {"train_loss": -7.094646453857422, "global_step": 176314, "epoch": 4197} {"train_loss": -7.012154352097284, "global_step": 176315, "epoch": 4197, "val_loss": 68752.859375} {"train_loss": -7.024585723876953, "global_step": 176316, "epoch": 4198} {"train_loss": -7.073239803314209, "global_step": 176317, "epoch": 4198} {"train_loss": -7.105087757110596, "global_step": 176318, "epoch": 4198} {"train_loss": -7.137607574462891, "global_step": 176319, "epoch": 4198} {"train_loss": -7.17715311050415, "global_step": 176320, "epoch": 4198} {"train_loss": -7.077110290527344, "global_step": 176321, "epoch": 4198} {"train_loss": -7.074566841125488, "global_step": 176322, "epoch": 4198} {"train_loss": -6.931093215942383, "global_step": 176323, "epoch": 4198} {"train_loss": -7.103008270263672, "global_step": 176324, "epoch": 4198} {"train_loss": -7.031435012817383, "global_step": 176325, "epoch": 4198} {"train_loss": -7.079016208648682, "global_step": 176326, "epoch": 4198} {"train_loss": -6.9978766441345215, "global_step": 176327, "epoch": 4198} {"train_loss": -7.061285972595215, "global_step": 176328, "epoch": 4198} {"train_loss": -7.040954113006592, "global_step": 176329, "epoch": 4198} {"train_loss": -7.130338668823242, "global_step": 176330, "epoch": 4198} {"train_loss": -6.996192932128906, "global_step": 176331, "epoch": 4198} {"train_loss": -7.052133560180664, "global_step": 176332, "epoch": 4198} {"train_loss": -7.087732791900635, "global_step": 176333, "epoch": 4198} {"train_loss": -7.133487701416016, "global_step": 176334, "epoch": 4198} {"train_loss": -6.996842384338379, "global_step": 176335, "epoch": 4198} {"train_loss": -7.14853048324585, "global_step": 176336, "epoch": 4198} {"train_loss": -7.037889003753662, "global_step": 176337, "epoch": 4198} {"train_loss": -7.056032180786133, "global_step": 176338, "epoch": 4198} {"train_loss": -7.06462287902832, "global_step": 176339, "epoch": 4198} {"train_loss": -7.061459541320801, "global_step": 176340, "epoch": 4198} {"train_loss": -7.091530799865723, "global_step": 176341, "epoch": 4198} {"train_loss": -7.064914703369141, "global_step": 176342, "epoch": 4198} {"train_loss": -7.032585144042969, "global_step": 176343, "epoch": 4198} {"train_loss": -6.982794761657715, "global_step": 176344, "epoch": 4198} {"train_loss": -6.887155532836914, "global_step": 176345, "epoch": 4198} {"train_loss": -7.081170082092285, "global_step": 176346, "epoch": 4198} {"train_loss": -7.027449131011963, "global_step": 176347, "epoch": 4198} {"train_loss": -6.912795066833496, "global_step": 176348, "epoch": 4198} {"train_loss": -6.945773124694824, "global_step": 176349, "epoch": 4198} {"train_loss": -7.161699295043945, "global_step": 176350, "epoch": 4198} {"train_loss": -7.018338203430176, "global_step": 176351, "epoch": 4198} {"train_loss": -7.13477897644043, "global_step": 176352, "epoch": 4198} {"train_loss": -6.913418769836426, "global_step": 176353, "epoch": 4198} {"train_loss": -6.940976619720459, "global_step": 176354, "epoch": 4198} {"train_loss": -7.064099311828613, "global_step": 176355, "epoch": 4198} {"train_loss": -6.93958044052124, "global_step": 176356, "epoch": 4198} {"train_loss": -7.044242734000797, "global_step": 176357, "epoch": 4198, "val_loss": 68633.3984375} {"train_loss": -6.844871997833252, "global_step": 176358, "epoch": 4199} {"train_loss": -6.864101409912109, "global_step": 176359, "epoch": 4199} {"train_loss": -6.966020107269287, "global_step": 176360, "epoch": 4199} {"train_loss": -6.903711795806885, "global_step": 176361, "epoch": 4199} {"train_loss": -6.921836853027344, "global_step": 176362, "epoch": 4199} {"train_loss": -7.008246421813965, "global_step": 176363, "epoch": 4199} {"train_loss": -6.970356464385986, "global_step": 176364, "epoch": 4199} {"train_loss": -7.0162553787231445, "global_step": 176365, "epoch": 4199} {"train_loss": -7.0882568359375, "global_step": 176366, "epoch": 4199} {"train_loss": -6.910040855407715, "global_step": 176367, "epoch": 4199} {"train_loss": -7.038506507873535, "global_step": 176368, "epoch": 4199} {"train_loss": -7.040482997894287, "global_step": 176369, "epoch": 4199} {"train_loss": -6.931044578552246, "global_step": 176370, "epoch": 4199} {"train_loss": -7.002774238586426, "global_step": 176371, "epoch": 4199} {"train_loss": -7.043501853942871, "global_step": 176372, "epoch": 4199} {"train_loss": -7.105316162109375, "global_step": 176373, "epoch": 4199} {"train_loss": -6.976988792419434, "global_step": 176374, "epoch": 4199} {"train_loss": -7.059563636779785, "global_step": 176375, "epoch": 4199} {"train_loss": -7.021380424499512, "global_step": 176376, "epoch": 4199} {"train_loss": -6.967840194702148, "global_step": 176377, "epoch": 4199} {"train_loss": -6.956851959228516, "global_step": 176378, "epoch": 4199} {"train_loss": -7.00745964050293, "global_step": 176379, "epoch": 4199} {"train_loss": -7.060784339904785, "global_step": 176380, "epoch": 4199} {"train_loss": -6.996622085571289, "global_step": 176381, "epoch": 4199} {"train_loss": -7.117828845977783, "global_step": 176382, "epoch": 4199} {"train_loss": -6.996234893798828, "global_step": 176383, "epoch": 4199} {"train_loss": -6.953833103179932, "global_step": 176384, "epoch": 4199} {"train_loss": -7.0322394371032715, "global_step": 176385, "epoch": 4199} {"train_loss": -6.9590935707092285, "global_step": 176386, "epoch": 4199} {"train_loss": -6.920217037200928, "global_step": 176387, "epoch": 4199} {"train_loss": -7.11054801940918, "global_step": 176388, "epoch": 4199} {"train_loss": -6.828117370605469, "global_step": 176389, "epoch": 4199} {"train_loss": -7.063060760498047, "global_step": 176390, "epoch": 4199} {"train_loss": -7.014482498168945, "global_step": 176391, "epoch": 4199} {"train_loss": -6.951751708984375, "global_step": 176392, "epoch": 4199} {"train_loss": -7.060337543487549, "global_step": 176393, "epoch": 4199} {"train_loss": -6.929018020629883, "global_step": 176394, "epoch": 4199} {"train_loss": -7.005273342132568, "global_step": 176395, "epoch": 4199} {"train_loss": -6.981147766113281, "global_step": 176396, "epoch": 4199} {"train_loss": -7.070332050323486, "global_step": 176397, "epoch": 4199} {"train_loss": -7.112798690795898, "global_step": 176398, "epoch": 4199} {"train_loss": -6.995495637257894, "global_step": 176399, "epoch": 4199, "val_loss": 68701.78125} {"train_loss": -7.117007255554199, "global_step": 176400, "epoch": 4200} {"train_loss": -7.042081832885742, "global_step": 176401, "epoch": 4200} {"train_loss": -7.161619663238525, "global_step": 176402, "epoch": 4200} {"train_loss": -7.050299167633057, "global_step": 176403, "epoch": 4200} {"train_loss": -6.992678165435791, "global_step": 176404, "epoch": 4200} {"train_loss": -7.06417989730835, "global_step": 176405, "epoch": 4200} {"train_loss": -6.996546745300293, "global_step": 176406, "epoch": 4200} {"train_loss": -7.150049686431885, "global_step": 176407, "epoch": 4200} {"train_loss": -7.06298828125, "global_step": 176408, "epoch": 4200} {"train_loss": -7.121107578277588, "global_step": 176409, "epoch": 4200} {"train_loss": -7.120234966278076, "global_step": 176410, "epoch": 4200} {"train_loss": -7.121333122253418, "global_step": 176411, "epoch": 4200} {"train_loss": -7.042043685913086, "global_step": 176412, "epoch": 4200} {"train_loss": -7.135885238647461, "global_step": 176413, "epoch": 4200} {"train_loss": -7.013469696044922, "global_step": 176414, "epoch": 4200} {"train_loss": -7.093618869781494, "global_step": 176415, "epoch": 4200} {"train_loss": -6.880305767059326, "global_step": 176416, "epoch": 4200} {"train_loss": -7.215898036956787, "global_step": 176417, "epoch": 4200} {"train_loss": -6.932354927062988, "global_step": 176418, "epoch": 4200} {"train_loss": -6.9813232421875, "global_step": 176419, "epoch": 4200} {"train_loss": -7.051858901977539, "global_step": 176420, "epoch": 4200} {"train_loss": -7.196260929107666, "global_step": 176421, "epoch": 4200} {"train_loss": -6.881165981292725, "global_step": 176422, "epoch": 4200} {"train_loss": -7.127259254455566, "global_step": 176423, "epoch": 4200} {"train_loss": -6.9199538230896, "global_step": 176424, "epoch": 4200} {"train_loss": -6.9662089347839355, "global_step": 176425, "epoch": 4200} {"train_loss": -7.015097618103027, "global_step": 176426, "epoch": 4200} {"train_loss": -6.82156229019165, "global_step": 176427, "epoch": 4200} {"train_loss": -7.076033592224121, "global_step": 176428, "epoch": 4200} {"train_loss": -6.998513221740723, "global_step": 176429, "epoch": 4200} {"train_loss": -6.978737831115723, "global_step": 176430, "epoch": 4200} {"train_loss": -6.9377875328063965, "global_step": 176431, "epoch": 4200} {"train_loss": -6.851164817810059, "global_step": 176432, "epoch": 4200} {"train_loss": -7.023941516876221, "global_step": 176433, "epoch": 4200} {"train_loss": -6.912902355194092, "global_step": 176434, "epoch": 4200} {"train_loss": -6.899847984313965, "global_step": 176435, "epoch": 4200} {"train_loss": -7.002276420593262, "global_step": 176436, "epoch": 4200} {"train_loss": -6.925091743469238, "global_step": 176437, "epoch": 4200} {"train_loss": -7.042226314544678, "global_step": 176438, "epoch": 4200} {"train_loss": -6.879245758056641, "global_step": 176439, "epoch": 4200} {"train_loss": -6.987551689147949, "global_step": 176440, "epoch": 4200} {"train_loss": -7.0210666088830855, "global_step": 176441, "epoch": 4200, "train/sim_max_reward_0": 0.252290877808957, "train/sim_max_reward_1": 0.8864745979612317, "train/sim_max_reward_2": 0.9414409334467633, "train/sim_max_reward_3": 0.13686665421409583, "train/sim_max_reward_4": 0.42184506979757025, "train/sim_max_reward_5": 0.8529305011410209, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.22797230257153925, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.9732396446057963, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.8618782869463031, "test/sim_max_reward_4400006": 0.9831378057695084, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.31707166407477044, "test/sim_max_reward_4400009": 0.834371774321995, "test/sim_max_reward_4400010": 0.20962673336352944, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9927237599086504, "test/sim_max_reward_4400013": 0.7206052024305516, "test/sim_max_reward_4400014": 0.9196463066885734, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.12594145356173736, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2855589629392791, "test/sim_max_reward_4400019": 0.41806251901222774, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.26242323693916375, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.44532095907737496, "test/sim_max_reward_4400025": 0.26413639032763836, "test/sim_max_reward_4400026": 0.01098838282657675, "test/sim_max_reward_4400027": 0.02441227690256701, "test/sim_max_reward_4400028": 0.465363124317903, "test/sim_max_reward_4400029": 0.9758432659930839, "test/sim_max_reward_4400030": 0.7801461922321958, "test/sim_max_reward_4400031": 0.9623460918667466, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 0.823407599217507, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.7236610025829234, "test/sim_max_reward_4400037": 0.8534384240730872, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9771503664483077, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.740212652128262, "test/sim_max_reward_4400042": 0.7981306767539551, "test/sim_max_reward_4400043": 0.7674993158036175, "test/sim_max_reward_4400044": 0.8773047764193712, "test/sim_max_reward_4400045": 0.9522375456890952, "test/sim_max_reward_4400046": 0.94784907018983, "test/sim_max_reward_4400047": 0.8354786789347501, "test/sim_max_reward_4400048": 0.9348586365749973, "test/sim_max_reward_4400049": 0.9205087535139285, "train/mean_score": 0.5819747723949399, "test/mean_score": 0.5951749763107649, "val_loss": 68772.09375} {"train_loss": -6.875587463378906, "global_step": 176442, "epoch": 4201} {"train_loss": -7.022451400756836, "global_step": 176443, "epoch": 4201} {"train_loss": -6.981090545654297, "global_step": 176444, "epoch": 4201} {"train_loss": -6.827574729919434, "global_step": 176445, "epoch": 4201} {"train_loss": -6.950238227844238, "global_step": 176446, "epoch": 4201} {"train_loss": -6.821889877319336, "global_step": 176447, "epoch": 4201} {"train_loss": -6.846468448638916, "global_step": 176448, "epoch": 4201} {"train_loss": -6.7345805168151855, "global_step": 176449, "epoch": 4201} {"train_loss": -7.005403995513916, "global_step": 176450, "epoch": 4201} {"train_loss": -6.802421569824219, "global_step": 176451, "epoch": 4201} {"train_loss": -7.028958797454834, "global_step": 176452, "epoch": 4201} {"train_loss": -6.918540000915527, "global_step": 176453, "epoch": 4201} {"train_loss": -7.048222064971924, "global_step": 176454, "epoch": 4201} {"train_loss": -6.930092811584473, "global_step": 176455, "epoch": 4201} {"train_loss": -6.938488483428955, "global_step": 176456, "epoch": 4201} {"train_loss": -6.915764808654785, "global_step": 176457, "epoch": 4201} {"train_loss": -6.959235668182373, "global_step": 176458, "epoch": 4201} {"train_loss": -7.02430534362793, "global_step": 176459, "epoch": 4201} {"train_loss": -7.0198893547058105, "global_step": 176460, "epoch": 4201} {"train_loss": -6.986355781555176, "global_step": 176461, "epoch": 4201} {"train_loss": -6.933429718017578, "global_step": 176462, "epoch": 4201} {"train_loss": -6.997450828552246, "global_step": 176463, "epoch": 4201} {"train_loss": -6.891656875610352, "global_step": 176464, "epoch": 4201} {"train_loss": -7.108299732208252, "global_step": 176465, "epoch": 4201} {"train_loss": -7.003129005432129, "global_step": 176466, "epoch": 4201} {"train_loss": -6.926687240600586, "global_step": 176467, "epoch": 4201} {"train_loss": -7.00479793548584, "global_step": 176468, "epoch": 4201} {"train_loss": -6.92121696472168, "global_step": 176469, "epoch": 4201} {"train_loss": -6.9029035568237305, "global_step": 176470, "epoch": 4201} {"train_loss": -7.031278133392334, "global_step": 176471, "epoch": 4201} {"train_loss": -6.93425178527832, "global_step": 176472, "epoch": 4201} {"train_loss": -7.049309253692627, "global_step": 176473, "epoch": 4201} {"train_loss": -6.987331390380859, "global_step": 176474, "epoch": 4201} {"train_loss": -6.891354084014893, "global_step": 176475, "epoch": 4201} {"train_loss": -6.99022912979126, "global_step": 176476, "epoch": 4201} {"train_loss": -7.019242286682129, "global_step": 176477, "epoch": 4201} {"train_loss": -7.019752502441406, "global_step": 176478, "epoch": 4201} {"train_loss": -7.039498329162598, "global_step": 176479, "epoch": 4201} {"train_loss": -7.056037425994873, "global_step": 176480, "epoch": 4201} {"train_loss": -6.967584133148193, "global_step": 176481, "epoch": 4201} {"train_loss": -7.032463073730469, "global_step": 176482, "epoch": 4201} {"train_loss": -6.96161489259629, "global_step": 176483, "epoch": 4201, "val_loss": 68865.609375} {"train_loss": -6.9775614738464355, "global_step": 176484, "epoch": 4202} {"train_loss": -7.1780219078063965, "global_step": 176485, "epoch": 4202} {"train_loss": -7.016421318054199, "global_step": 176486, "epoch": 4202} {"train_loss": -7.0872626304626465, "global_step": 176487, "epoch": 4202} {"train_loss": -7.113039970397949, "global_step": 176488, "epoch": 4202} {"train_loss": -6.979409217834473, "global_step": 176489, "epoch": 4202} {"train_loss": -7.097350120544434, "global_step": 176490, "epoch": 4202} {"train_loss": -6.927342414855957, "global_step": 176491, "epoch": 4202} {"train_loss": -7.093315124511719, "global_step": 176492, "epoch": 4202} {"train_loss": -6.981134414672852, "global_step": 176493, "epoch": 4202} {"train_loss": -7.005151271820068, "global_step": 176494, "epoch": 4202} {"train_loss": -6.953865051269531, "global_step": 176495, "epoch": 4202} {"train_loss": -7.109181880950928, "global_step": 176496, "epoch": 4202} {"train_loss": -7.080949783325195, "global_step": 176497, "epoch": 4202} {"train_loss": -7.064401626586914, "global_step": 176498, "epoch": 4202} {"train_loss": -7.037981986999512, "global_step": 176499, "epoch": 4202} {"train_loss": -6.9440598487854, "global_step": 176500, "epoch": 4202} {"train_loss": -7.033512115478516, "global_step": 176501, "epoch": 4202} {"train_loss": -6.9984450340271, "global_step": 176502, "epoch": 4202} {"train_loss": -7.102207183837891, "global_step": 176503, "epoch": 4202} {"train_loss": -7.091443061828613, "global_step": 176504, "epoch": 4202} {"train_loss": -7.037128448486328, "global_step": 176505, "epoch": 4202} {"train_loss": -7.180911064147949, "global_step": 176506, "epoch": 4202} {"train_loss": -7.004641532897949, "global_step": 176507, "epoch": 4202} {"train_loss": -7.073205947875977, "global_step": 176508, "epoch": 4202} {"train_loss": -7.039698600769043, "global_step": 176509, "epoch": 4202} {"train_loss": -7.05122184753418, "global_step": 176510, "epoch": 4202} {"train_loss": -7.189619541168213, "global_step": 176511, "epoch": 4202} {"train_loss": -7.130293846130371, "global_step": 176512, "epoch": 4202} {"train_loss": -7.142982482910156, "global_step": 176513, "epoch": 4202} {"train_loss": -7.094327926635742, "global_step": 176514, "epoch": 4202} {"train_loss": -7.127543926239014, "global_step": 176515, "epoch": 4202} {"train_loss": -7.034914493560791, "global_step": 176516, "epoch": 4202} {"train_loss": -7.093655586242676, "global_step": 176517, "epoch": 4202} {"train_loss": -7.108407974243164, "global_step": 176518, "epoch": 4202} {"train_loss": -7.121428489685059, "global_step": 176519, "epoch": 4202} {"train_loss": -7.033144474029541, "global_step": 176520, "epoch": 4202} {"train_loss": -6.968201160430908, "global_step": 176521, "epoch": 4202} {"train_loss": -7.083220481872559, "global_step": 176522, "epoch": 4202} {"train_loss": -7.092317581176758, "global_step": 176523, "epoch": 4202} {"train_loss": -7.022038459777832, "global_step": 176524, "epoch": 4202} {"train_loss": -7.06155184337071, "global_step": 176525, "epoch": 4202, "val_loss": 68700.8828125} {"train_loss": -7.012709617614746, "global_step": 176526, "epoch": 4203} {"train_loss": -7.073880195617676, "global_step": 176527, "epoch": 4203} {"train_loss": -7.029540061950684, "global_step": 176528, "epoch": 4203} {"train_loss": -7.075128555297852, "global_step": 176529, "epoch": 4203} {"train_loss": -7.049854278564453, "global_step": 176530, "epoch": 4203} {"train_loss": -7.002946853637695, "global_step": 176531, "epoch": 4203} {"train_loss": -6.972602844238281, "global_step": 176532, "epoch": 4203} {"train_loss": -7.0849385261535645, "global_step": 176533, "epoch": 4203} {"train_loss": -7.08095121383667, "global_step": 176534, "epoch": 4203} {"train_loss": -7.067523956298828, "global_step": 176535, "epoch": 4203} {"train_loss": -7.104012489318848, "global_step": 176536, "epoch": 4203} {"train_loss": -7.05020809173584, "global_step": 176537, "epoch": 4203} {"train_loss": -7.078083038330078, "global_step": 176538, "epoch": 4203} {"train_loss": -7.183191299438477, "global_step": 176539, "epoch": 4203} {"train_loss": -7.05655574798584, "global_step": 176540, "epoch": 4203} {"train_loss": -7.072099208831787, "global_step": 176541, "epoch": 4203} {"train_loss": -7.139091968536377, "global_step": 176542, "epoch": 4203} {"train_loss": -7.0325422286987305, "global_step": 176543, "epoch": 4203} {"train_loss": -7.118341445922852, "global_step": 176544, "epoch": 4203} {"train_loss": -7.128984451293945, "global_step": 176545, "epoch": 4203} {"train_loss": -7.119539260864258, "global_step": 176546, "epoch": 4203} {"train_loss": -7.036040306091309, "global_step": 176547, "epoch": 4203} {"train_loss": -7.035462379455566, "global_step": 176548, "epoch": 4203} {"train_loss": -6.9608283042907715, "global_step": 176549, "epoch": 4203} {"train_loss": -7.197480201721191, "global_step": 176550, "epoch": 4203} {"train_loss": -6.945225715637207, "global_step": 176551, "epoch": 4203} {"train_loss": -6.980363845825195, "global_step": 176552, "epoch": 4203} {"train_loss": -6.946559906005859, "global_step": 176553, "epoch": 4203} {"train_loss": -7.0585618019104, "global_step": 176554, "epoch": 4203} {"train_loss": -6.932401180267334, "global_step": 176555, "epoch": 4203} {"train_loss": -6.942915439605713, "global_step": 176556, "epoch": 4203} {"train_loss": -7.0143914222717285, "global_step": 176557, "epoch": 4203} {"train_loss": -7.058026313781738, "global_step": 176558, "epoch": 4203} {"train_loss": -6.849175453186035, "global_step": 176559, "epoch": 4203} {"train_loss": -7.061978340148926, "global_step": 176560, "epoch": 4203} {"train_loss": -6.956793308258057, "global_step": 176561, "epoch": 4203} {"train_loss": -7.051690101623535, "global_step": 176562, "epoch": 4203} {"train_loss": -7.149888038635254, "global_step": 176563, "epoch": 4203} {"train_loss": -7.124902248382568, "global_step": 176564, "epoch": 4203} {"train_loss": -6.978826522827148, "global_step": 176565, "epoch": 4203} {"train_loss": -7.059262275695801, "global_step": 176566, "epoch": 4203} {"train_loss": -7.042906704403105, "global_step": 176567, "epoch": 4203, "val_loss": 68887.8046875} {"train_loss": -6.9219441413879395, "global_step": 176568, "epoch": 4204} {"train_loss": -7.065885543823242, "global_step": 176569, "epoch": 4204} {"train_loss": -7.064198017120361, "global_step": 176570, "epoch": 4204} {"train_loss": -7.007913589477539, "global_step": 176571, "epoch": 4204} {"train_loss": -7.09598445892334, "global_step": 176572, "epoch": 4204} {"train_loss": -7.04020881652832, "global_step": 176573, "epoch": 4204} {"train_loss": -6.995844841003418, "global_step": 176574, "epoch": 4204} {"train_loss": -6.985834121704102, "global_step": 176575, "epoch": 4204} {"train_loss": -7.039519786834717, "global_step": 176576, "epoch": 4204} {"train_loss": -6.964825630187988, "global_step": 176577, "epoch": 4204} {"train_loss": -7.012401580810547, "global_step": 176578, "epoch": 4204} {"train_loss": -7.129196643829346, "global_step": 176579, "epoch": 4204} {"train_loss": -6.959753513336182, "global_step": 176580, "epoch": 4204} {"train_loss": -6.961443901062012, "global_step": 176581, "epoch": 4204} {"train_loss": -6.983345985412598, "global_step": 176582, "epoch": 4204} {"train_loss": -6.9340691566467285, "global_step": 176583, "epoch": 4204} {"train_loss": -6.935595989227295, "global_step": 176584, "epoch": 4204} {"train_loss": -6.960968971252441, "global_step": 176585, "epoch": 4204} {"train_loss": -6.844009876251221, "global_step": 176586, "epoch": 4204} {"train_loss": -6.959681510925293, "global_step": 176587, "epoch": 4204} {"train_loss": -6.922815322875977, "global_step": 176588, "epoch": 4204} {"train_loss": -6.953502655029297, "global_step": 176589, "epoch": 4204} {"train_loss": -7.022712707519531, "global_step": 176590, "epoch": 4204} {"train_loss": -6.980463027954102, "global_step": 176591, "epoch": 4204} {"train_loss": -6.9804558753967285, "global_step": 176592, "epoch": 4204} {"train_loss": -7.003063201904297, "global_step": 176593, "epoch": 4204} {"train_loss": -6.996977806091309, "global_step": 176594, "epoch": 4204} {"train_loss": -6.9624528884887695, "global_step": 176595, "epoch": 4204} {"train_loss": -7.102194309234619, "global_step": 176596, "epoch": 4204} {"train_loss": -7.005643844604492, "global_step": 176597, "epoch": 4204} {"train_loss": -7.022913455963135, "global_step": 176598, "epoch": 4204} {"train_loss": -7.115207195281982, "global_step": 176599, "epoch": 4204} {"train_loss": -6.974061012268066, "global_step": 176600, "epoch": 4204} {"train_loss": -7.038935661315918, "global_step": 176601, "epoch": 4204} {"train_loss": -7.031269550323486, "global_step": 176602, "epoch": 4204} {"train_loss": -6.974515438079834, "global_step": 176603, "epoch": 4204} {"train_loss": -7.070080280303955, "global_step": 176604, "epoch": 4204} {"train_loss": -7.079102516174316, "global_step": 176605, "epoch": 4204} {"train_loss": -7.10235595703125, "global_step": 176606, "epoch": 4204} {"train_loss": -7.15798807144165, "global_step": 176607, "epoch": 4204} {"train_loss": -6.996946334838867, "global_step": 176608, "epoch": 4204} {"train_loss": -7.010167712257022, "global_step": 176609, "epoch": 4204, "val_loss": 68619.78125} {"train_loss": -7.151717185974121, "global_step": 176610, "epoch": 4205} {"train_loss": -7.0373454093933105, "global_step": 176611, "epoch": 4205} {"train_loss": -6.982405185699463, "global_step": 176612, "epoch": 4205} {"train_loss": -6.995175838470459, "global_step": 176613, "epoch": 4205} {"train_loss": -7.007088661193848, "global_step": 176614, "epoch": 4205} {"train_loss": -6.97120475769043, "global_step": 176615, "epoch": 4205} {"train_loss": -6.966917514801025, "global_step": 176616, "epoch": 4205} {"train_loss": -6.872204780578613, "global_step": 176617, "epoch": 4205} {"train_loss": -6.995848655700684, "global_step": 176618, "epoch": 4205} {"train_loss": -7.019010543823242, "global_step": 176619, "epoch": 4205} {"train_loss": -6.9795637130737305, "global_step": 176620, "epoch": 4205} {"train_loss": -7.035887718200684, "global_step": 176621, "epoch": 4205} {"train_loss": -7.022860527038574, "global_step": 176622, "epoch": 4205} {"train_loss": -7.031512260437012, "global_step": 176623, "epoch": 4205} {"train_loss": -7.016090393066406, "global_step": 176624, "epoch": 4205} {"train_loss": -7.034200668334961, "global_step": 176625, "epoch": 4205} {"train_loss": -6.943974494934082, "global_step": 176626, "epoch": 4205} {"train_loss": -7.1524553298950195, "global_step": 176627, "epoch": 4205} {"train_loss": -7.0635786056518555, "global_step": 176628, "epoch": 4205} {"train_loss": -7.035888671875, "global_step": 176629, "epoch": 4205} {"train_loss": -7.036108016967773, "global_step": 176630, "epoch": 4205} {"train_loss": -6.95981502532959, "global_step": 176631, "epoch": 4205} {"train_loss": -6.968483924865723, "global_step": 176632, "epoch": 4205} {"train_loss": -7.108615875244141, "global_step": 176633, "epoch": 4205} {"train_loss": -6.995168685913086, "global_step": 176634, "epoch": 4205} {"train_loss": -7.100629806518555, "global_step": 176635, "epoch": 4205} {"train_loss": -7.073410987854004, "global_step": 176636, "epoch": 4205} {"train_loss": -7.0246968269348145, "global_step": 176637, "epoch": 4205} {"train_loss": -6.994379997253418, "global_step": 176638, "epoch": 4205} {"train_loss": -6.98359489440918, "global_step": 176639, "epoch": 4205} {"train_loss": -6.994624137878418, "global_step": 176640, "epoch": 4205} {"train_loss": -7.0591278076171875, "global_step": 176641, "epoch": 4205} {"train_loss": -6.989711761474609, "global_step": 176642, "epoch": 4205} {"train_loss": -7.0629425048828125, "global_step": 176643, "epoch": 4205} {"train_loss": -7.053603172302246, "global_step": 176644, "epoch": 4205} {"train_loss": -7.129558563232422, "global_step": 176645, "epoch": 4205} {"train_loss": -7.091754913330078, "global_step": 176646, "epoch": 4205} {"train_loss": -7.008054733276367, "global_step": 176647, "epoch": 4205} {"train_loss": -7.096938133239746, "global_step": 176648, "epoch": 4205} {"train_loss": -6.957441329956055, "global_step": 176649, "epoch": 4205} {"train_loss": -7.005260467529297, "global_step": 176650, "epoch": 4205} {"train_loss": -7.026809885388329, "global_step": 176651, "epoch": 4205, "val_loss": 68491.3125} {"train_loss": -7.070070743560791, "global_step": 176652, "epoch": 4206} {"train_loss": -7.0316362380981445, "global_step": 176653, "epoch": 4206} {"train_loss": -7.057305335998535, "global_step": 176654, "epoch": 4206} {"train_loss": -7.112898349761963, "global_step": 176655, "epoch": 4206} {"train_loss": -7.0541486740112305, "global_step": 176656, "epoch": 4206} {"train_loss": -7.0510382652282715, "global_step": 176657, "epoch": 4206} {"train_loss": -7.049248218536377, "global_step": 176658, "epoch": 4206} {"train_loss": -6.972696304321289, "global_step": 176659, "epoch": 4206} {"train_loss": -7.027448654174805, "global_step": 176660, "epoch": 4206} {"train_loss": -7.084493160247803, "global_step": 176661, "epoch": 4206} {"train_loss": -7.064678192138672, "global_step": 176662, "epoch": 4206} {"train_loss": -7.016902446746826, "global_step": 176663, "epoch": 4206} {"train_loss": -6.978304386138916, "global_step": 176664, "epoch": 4206} {"train_loss": -6.927885055541992, "global_step": 176665, "epoch": 4206} {"train_loss": -6.953423500061035, "global_step": 176666, "epoch": 4206} {"train_loss": -7.045741081237793, "global_step": 176667, "epoch": 4206} {"train_loss": -7.047846794128418, "global_step": 176668, "epoch": 4206} {"train_loss": -7.013958930969238, "global_step": 176669, "epoch": 4206} {"train_loss": -7.010176181793213, "global_step": 176670, "epoch": 4206} {"train_loss": -7.05194091796875, "global_step": 176671, "epoch": 4206} {"train_loss": -7.122382164001465, "global_step": 176672, "epoch": 4206} {"train_loss": -6.955843925476074, "global_step": 176673, "epoch": 4206} {"train_loss": -7.03546142578125, "global_step": 176674, "epoch": 4206} {"train_loss": -6.989945411682129, "global_step": 176675, "epoch": 4206} {"train_loss": -7.081876754760742, "global_step": 176676, "epoch": 4206} {"train_loss": -7.010705947875977, "global_step": 176677, "epoch": 4206} {"train_loss": -7.115971088409424, "global_step": 176678, "epoch": 4206} {"train_loss": -7.063699722290039, "global_step": 176679, "epoch": 4206} {"train_loss": -7.0571746826171875, "global_step": 176680, "epoch": 4206} {"train_loss": -7.014836311340332, "global_step": 176681, "epoch": 4206} {"train_loss": -6.836216926574707, "global_step": 176682, "epoch": 4206} {"train_loss": -6.952375888824463, "global_step": 176683, "epoch": 4206} {"train_loss": -6.9462103843688965, "global_step": 176684, "epoch": 4206} {"train_loss": -6.893743991851807, "global_step": 176685, "epoch": 4206} {"train_loss": -6.994897842407227, "global_step": 176686, "epoch": 4206} {"train_loss": -6.949873924255371, "global_step": 176687, "epoch": 4206} {"train_loss": -7.050140380859375, "global_step": 176688, "epoch": 4206} {"train_loss": -6.97906494140625, "global_step": 176689, "epoch": 4206} {"train_loss": -6.873476505279541, "global_step": 176690, "epoch": 4206} {"train_loss": -7.0261359214782715, "global_step": 176691, "epoch": 4206} {"train_loss": -6.913673400878906, "global_step": 176692, "epoch": 4206} {"train_loss": -7.00914952868507, "global_step": 176693, "epoch": 4206, "val_loss": 68724.1328125} {"train_loss": -6.97723388671875, "global_step": 176694, "epoch": 4207} {"train_loss": -6.931183815002441, "global_step": 176695, "epoch": 4207} {"train_loss": -6.949522018432617, "global_step": 176696, "epoch": 4207} {"train_loss": -7.1657609939575195, "global_step": 176697, "epoch": 4207} {"train_loss": -7.03516960144043, "global_step": 176698, "epoch": 4207} {"train_loss": -7.026604652404785, "global_step": 176699, "epoch": 4207} {"train_loss": -7.07686710357666, "global_step": 176700, "epoch": 4207} {"train_loss": -6.8397417068481445, "global_step": 176701, "epoch": 4207} {"train_loss": -7.106658458709717, "global_step": 176702, "epoch": 4207} {"train_loss": -6.974850177764893, "global_step": 176703, "epoch": 4207} {"train_loss": -7.079341888427734, "global_step": 176704, "epoch": 4207} {"train_loss": -6.998478412628174, "global_step": 176705, "epoch": 4207} {"train_loss": -7.080204010009766, "global_step": 176706, "epoch": 4207} {"train_loss": -6.892612457275391, "global_step": 176707, "epoch": 4207} {"train_loss": -6.874013900756836, "global_step": 176708, "epoch": 4207} {"train_loss": -7.031075954437256, "global_step": 176709, "epoch": 4207} {"train_loss": -6.950414657592773, "global_step": 176710, "epoch": 4207} {"train_loss": -7.099780082702637, "global_step": 176711, "epoch": 4207} {"train_loss": -6.939009189605713, "global_step": 176712, "epoch": 4207} {"train_loss": -7.0017852783203125, "global_step": 176713, "epoch": 4207} {"train_loss": -7.017040252685547, "global_step": 176714, "epoch": 4207} {"train_loss": -7.068638801574707, "global_step": 176715, "epoch": 4207} {"train_loss": -6.978280544281006, "global_step": 176716, "epoch": 4207} {"train_loss": -6.958930015563965, "global_step": 176717, "epoch": 4207} {"train_loss": -7.097908973693848, "global_step": 176718, "epoch": 4207} {"train_loss": -7.010188102722168, "global_step": 176719, "epoch": 4207} {"train_loss": -7.125190734863281, "global_step": 176720, "epoch": 4207} {"train_loss": -7.069701194763184, "global_step": 176721, "epoch": 4207} {"train_loss": -6.980122089385986, "global_step": 176722, "epoch": 4207} {"train_loss": -7.031730651855469, "global_step": 176723, "epoch": 4207} {"train_loss": -7.0538740158081055, "global_step": 176724, "epoch": 4207} {"train_loss": -7.049468040466309, "global_step": 176725, "epoch": 4207} {"train_loss": -6.991885185241699, "global_step": 176726, "epoch": 4207} {"train_loss": -6.975417137145996, "global_step": 176727, "epoch": 4207} {"train_loss": -7.028064727783203, "global_step": 176728, "epoch": 4207} {"train_loss": -7.015814781188965, "global_step": 176729, "epoch": 4207} {"train_loss": -7.004446983337402, "global_step": 176730, "epoch": 4207} {"train_loss": -6.966838359832764, "global_step": 176731, "epoch": 4207} {"train_loss": -7.037256240844727, "global_step": 176732, "epoch": 4207} {"train_loss": -7.000331878662109, "global_step": 176733, "epoch": 4207} {"train_loss": -7.058272361755371, "global_step": 176734, "epoch": 4207} {"train_loss": -7.013698884419033, "global_step": 176735, "epoch": 4207, "val_loss": 68787.2578125} {"train_loss": -7.042619705200195, "global_step": 176736, "epoch": 4208} {"train_loss": -7.179087162017822, "global_step": 176737, "epoch": 4208} {"train_loss": -7.067108631134033, "global_step": 176738, "epoch": 4208} {"train_loss": -7.1670355796813965, "global_step": 176739, "epoch": 4208} {"train_loss": -7.040195465087891, "global_step": 176740, "epoch": 4208} {"train_loss": -7.093696117401123, "global_step": 176741, "epoch": 4208} {"train_loss": -6.998006343841553, "global_step": 176742, "epoch": 4208} {"train_loss": -7.087935447692871, "global_step": 176743, "epoch": 4208} {"train_loss": -6.956022262573242, "global_step": 176744, "epoch": 4208} {"train_loss": -7.055946350097656, "global_step": 176745, "epoch": 4208} {"train_loss": -7.028428077697754, "global_step": 176746, "epoch": 4208} {"train_loss": -7.015685081481934, "global_step": 176747, "epoch": 4208} {"train_loss": -7.097578048706055, "global_step": 176748, "epoch": 4208} {"train_loss": -7.110780239105225, "global_step": 176749, "epoch": 4208} {"train_loss": -7.044964790344238, "global_step": 176750, "epoch": 4208} {"train_loss": -7.059410095214844, "global_step": 176751, "epoch": 4208} {"train_loss": -7.0818257331848145, "global_step": 176752, "epoch": 4208} {"train_loss": -7.038825988769531, "global_step": 176753, "epoch": 4208} {"train_loss": -6.966605186462402, "global_step": 176754, "epoch": 4208} {"train_loss": -7.100918769836426, "global_step": 176755, "epoch": 4208} {"train_loss": -6.92559289932251, "global_step": 176756, "epoch": 4208} {"train_loss": -6.934280872344971, "global_step": 176757, "epoch": 4208} {"train_loss": -7.054074287414551, "global_step": 176758, "epoch": 4208} {"train_loss": -7.111001968383789, "global_step": 176759, "epoch": 4208} {"train_loss": -7.060185432434082, "global_step": 176760, "epoch": 4208} {"train_loss": -7.102669715881348, "global_step": 176761, "epoch": 4208} {"train_loss": -7.111536026000977, "global_step": 176762, "epoch": 4208} {"train_loss": -7.098546028137207, "global_step": 176763, "epoch": 4208} {"train_loss": -7.185785293579102, "global_step": 176764, "epoch": 4208} {"train_loss": -7.047167778015137, "global_step": 176765, "epoch": 4208} {"train_loss": -6.974206447601318, "global_step": 176766, "epoch": 4208} {"train_loss": -7.092395782470703, "global_step": 176767, "epoch": 4208} {"train_loss": -7.129727363586426, "global_step": 176768, "epoch": 4208} {"train_loss": -7.191583156585693, "global_step": 176769, "epoch": 4208} {"train_loss": -7.027251243591309, "global_step": 176770, "epoch": 4208} {"train_loss": -7.0599541664123535, "global_step": 176771, "epoch": 4208} {"train_loss": -7.017793655395508, "global_step": 176772, "epoch": 4208} {"train_loss": -7.105669975280762, "global_step": 176773, "epoch": 4208} {"train_loss": -7.041155815124512, "global_step": 176774, "epoch": 4208} {"train_loss": -6.95943021774292, "global_step": 176775, "epoch": 4208} {"train_loss": -7.013444900512695, "global_step": 176776, "epoch": 4208} {"train_loss": -7.058728149959019, "global_step": 176777, "epoch": 4208, "val_loss": 68908.125} {"train_loss": -7.048433303833008, "global_step": 176778, "epoch": 4209} {"train_loss": -7.1063432693481445, "global_step": 176779, "epoch": 4209} {"train_loss": -6.925013542175293, "global_step": 176780, "epoch": 4209} {"train_loss": -7.014034271240234, "global_step": 176781, "epoch": 4209} {"train_loss": -7.032049655914307, "global_step": 176782, "epoch": 4209} {"train_loss": -7.022950649261475, "global_step": 176783, "epoch": 4209} {"train_loss": -6.985128402709961, "global_step": 176784, "epoch": 4209} {"train_loss": -6.927883148193359, "global_step": 176785, "epoch": 4209} {"train_loss": -7.13353157043457, "global_step": 176786, "epoch": 4209} {"train_loss": -6.840306282043457, "global_step": 176787, "epoch": 4209} {"train_loss": -7.051753044128418, "global_step": 176788, "epoch": 4209} {"train_loss": -7.064244270324707, "global_step": 176789, "epoch": 4209} {"train_loss": -6.8261213302612305, "global_step": 176790, "epoch": 4209} {"train_loss": -6.9706926345825195, "global_step": 176791, "epoch": 4209} {"train_loss": -6.735964775085449, "global_step": 176792, "epoch": 4209} {"train_loss": -7.011178970336914, "global_step": 176793, "epoch": 4209} {"train_loss": -6.9612932205200195, "global_step": 176794, "epoch": 4209} {"train_loss": -6.966784954071045, "global_step": 176795, "epoch": 4209} {"train_loss": -7.138599395751953, "global_step": 176796, "epoch": 4209} {"train_loss": -6.875741958618164, "global_step": 176797, "epoch": 4209} {"train_loss": -6.986982345581055, "global_step": 176798, "epoch": 4209} {"train_loss": -7.028145790100098, "global_step": 176799, "epoch": 4209} {"train_loss": -7.056958198547363, "global_step": 176800, "epoch": 4209} {"train_loss": -7.049896717071533, "global_step": 176801, "epoch": 4209} {"train_loss": -7.120802879333496, "global_step": 176802, "epoch": 4209} {"train_loss": -7.09434700012207, "global_step": 176803, "epoch": 4209} {"train_loss": -7.072864532470703, "global_step": 176804, "epoch": 4209} {"train_loss": -7.026276588439941, "global_step": 176805, "epoch": 4209} {"train_loss": -7.119617938995361, "global_step": 176806, "epoch": 4209} {"train_loss": -7.10725212097168, "global_step": 176807, "epoch": 4209} {"train_loss": -7.070590019226074, "global_step": 176808, "epoch": 4209} {"train_loss": -7.044602394104004, "global_step": 176809, "epoch": 4209} {"train_loss": -6.982024192810059, "global_step": 176810, "epoch": 4209} {"train_loss": -7.097384452819824, "global_step": 176811, "epoch": 4209} {"train_loss": -7.0075273513793945, "global_step": 176812, "epoch": 4209} {"train_loss": -7.097160339355469, "global_step": 176813, "epoch": 4209} {"train_loss": -7.0965118408203125, "global_step": 176814, "epoch": 4209} {"train_loss": -7.100912570953369, "global_step": 176815, "epoch": 4209} {"train_loss": -6.968714714050293, "global_step": 176816, "epoch": 4209} {"train_loss": -7.147624969482422, "global_step": 176817, "epoch": 4209} {"train_loss": -6.985218048095703, "global_step": 176818, "epoch": 4209} {"train_loss": -7.020307359241304, "global_step": 176819, "epoch": 4209, "val_loss": 68555.1015625} {"train_loss": -7.008679389953613, "global_step": 176820, "epoch": 4210} {"train_loss": -7.032886981964111, "global_step": 176821, "epoch": 4210} {"train_loss": -6.963294982910156, "global_step": 176822, "epoch": 4210} {"train_loss": -7.082739353179932, "global_step": 176823, "epoch": 4210} {"train_loss": -7.019850730895996, "global_step": 176824, "epoch": 4210} {"train_loss": -7.115316390991211, "global_step": 176825, "epoch": 4210} {"train_loss": -6.999799728393555, "global_step": 176826, "epoch": 4210} {"train_loss": -7.111918926239014, "global_step": 176827, "epoch": 4210} {"train_loss": -7.162832260131836, "global_step": 176828, "epoch": 4210} {"train_loss": -7.111217498779297, "global_step": 176829, "epoch": 4210} {"train_loss": -7.0594964027404785, "global_step": 176830, "epoch": 4210} {"train_loss": -7.087101459503174, "global_step": 176831, "epoch": 4210} {"train_loss": -7.205639839172363, "global_step": 176832, "epoch": 4210} {"train_loss": -6.905279636383057, "global_step": 176833, "epoch": 4210} {"train_loss": -7.034204483032227, "global_step": 176834, "epoch": 4210} {"train_loss": -7.067204475402832, "global_step": 176835, "epoch": 4210} {"train_loss": -7.1146697998046875, "global_step": 176836, "epoch": 4210} {"train_loss": -7.192059516906738, "global_step": 176837, "epoch": 4210} {"train_loss": -7.092326641082764, "global_step": 176838, "epoch": 4210} {"train_loss": -7.060486793518066, "global_step": 176839, "epoch": 4210} {"train_loss": -7.081980228424072, "global_step": 176840, "epoch": 4210} {"train_loss": -7.1120500564575195, "global_step": 176841, "epoch": 4210} {"train_loss": -7.111031532287598, "global_step": 176842, "epoch": 4210} {"train_loss": -7.022622108459473, "global_step": 176843, "epoch": 4210} {"train_loss": -7.0984930992126465, "global_step": 176844, "epoch": 4210} {"train_loss": -7.08480167388916, "global_step": 176845, "epoch": 4210} {"train_loss": -7.005061626434326, "global_step": 176846, "epoch": 4210} {"train_loss": -6.977453231811523, "global_step": 176847, "epoch": 4210} {"train_loss": -7.139554023742676, "global_step": 176848, "epoch": 4210} {"train_loss": -7.041832447052002, "global_step": 176849, "epoch": 4210} {"train_loss": -6.898433685302734, "global_step": 176850, "epoch": 4210} {"train_loss": -7.004053115844727, "global_step": 176851, "epoch": 4210} {"train_loss": -6.984938144683838, "global_step": 176852, "epoch": 4210} {"train_loss": -6.926092147827148, "global_step": 176853, "epoch": 4210} {"train_loss": -7.1743879318237305, "global_step": 176854, "epoch": 4210} {"train_loss": -7.046481609344482, "global_step": 176855, "epoch": 4210} {"train_loss": -6.969168663024902, "global_step": 176856, "epoch": 4210} {"train_loss": -7.158086776733398, "global_step": 176857, "epoch": 4210} {"train_loss": -6.965522766113281, "global_step": 176858, "epoch": 4210} {"train_loss": -7.1068339347839355, "global_step": 176859, "epoch": 4210} {"train_loss": -7.035243511199951, "global_step": 176860, "epoch": 4210} {"train_loss": -7.057399522690546, "global_step": 176861, "epoch": 4210, "val_loss": 68662.921875} {"train_loss": -7.019501209259033, "global_step": 176862, "epoch": 4211} {"train_loss": -6.923948287963867, "global_step": 176863, "epoch": 4211} {"train_loss": -7.089848518371582, "global_step": 176864, "epoch": 4211} {"train_loss": -7.025358200073242, "global_step": 176865, "epoch": 4211} {"train_loss": -6.9555768966674805, "global_step": 176866, "epoch": 4211} {"train_loss": -7.07950496673584, "global_step": 176867, "epoch": 4211} {"train_loss": -6.9467058181762695, "global_step": 176868, "epoch": 4211} {"train_loss": -7.119312763214111, "global_step": 176869, "epoch": 4211} {"train_loss": -7.051559925079346, "global_step": 176870, "epoch": 4211} {"train_loss": -7.014257431030273, "global_step": 176871, "epoch": 4211} {"train_loss": -7.1917195320129395, "global_step": 176872, "epoch": 4211} {"train_loss": -7.038783073425293, "global_step": 176873, "epoch": 4211} {"train_loss": -6.981653690338135, "global_step": 176874, "epoch": 4211} {"train_loss": -7.026364803314209, "global_step": 176875, "epoch": 4211} {"train_loss": -7.0576171875, "global_step": 176876, "epoch": 4211} {"train_loss": -7.076435089111328, "global_step": 176877, "epoch": 4211} {"train_loss": -6.900306701660156, "global_step": 176878, "epoch": 4211} {"train_loss": -6.851739883422852, "global_step": 176879, "epoch": 4211} {"train_loss": -6.989326000213623, "global_step": 176880, "epoch": 4211} {"train_loss": -6.858250617980957, "global_step": 176881, "epoch": 4211} {"train_loss": -6.953375339508057, "global_step": 176882, "epoch": 4211} {"train_loss": -7.082304000854492, "global_step": 176883, "epoch": 4211} {"train_loss": -6.978500843048096, "global_step": 176884, "epoch": 4211} {"train_loss": -6.859779357910156, "global_step": 176885, "epoch": 4211} {"train_loss": -6.955181121826172, "global_step": 176886, "epoch": 4211} {"train_loss": -6.985608100891113, "global_step": 176887, "epoch": 4211} {"train_loss": -7.02976131439209, "global_step": 176888, "epoch": 4211} {"train_loss": -6.832886695861816, "global_step": 176889, "epoch": 4211} {"train_loss": -7.124241828918457, "global_step": 176890, "epoch": 4211} {"train_loss": -6.858175277709961, "global_step": 176891, "epoch": 4211} {"train_loss": -6.9595136642456055, "global_step": 176892, "epoch": 4211} {"train_loss": -7.024065017700195, "global_step": 176893, "epoch": 4211} {"train_loss": -6.929691791534424, "global_step": 176894, "epoch": 4211} {"train_loss": -7.017055511474609, "global_step": 176895, "epoch": 4211} {"train_loss": -7.053334712982178, "global_step": 176896, "epoch": 4211} {"train_loss": -6.9740095138549805, "global_step": 176897, "epoch": 4211} {"train_loss": -7.005636692047119, "global_step": 176898, "epoch": 4211} {"train_loss": -6.974201202392578, "global_step": 176899, "epoch": 4211} {"train_loss": -6.895438194274902, "global_step": 176900, "epoch": 4211} {"train_loss": -7.097751617431641, "global_step": 176901, "epoch": 4211} {"train_loss": -6.906508922576904, "global_step": 176902, "epoch": 4211} {"train_loss": -6.995151485715594, "global_step": 176903, "epoch": 4211, "val_loss": 68711.390625} {"train_loss": -6.969024658203125, "global_step": 176904, "epoch": 4212} {"train_loss": -7.021632194519043, "global_step": 176905, "epoch": 4212} {"train_loss": -7.1935906410217285, "global_step": 176906, "epoch": 4212} {"train_loss": -6.992584705352783, "global_step": 176907, "epoch": 4212} {"train_loss": -7.054819583892822, "global_step": 176908, "epoch": 4212} {"train_loss": -7.021113395690918, "global_step": 176909, "epoch": 4212} {"train_loss": -6.960352897644043, "global_step": 176910, "epoch": 4212} {"train_loss": -7.09263801574707, "global_step": 176911, "epoch": 4212} {"train_loss": -7.129108428955078, "global_step": 176912, "epoch": 4212} {"train_loss": -7.042666435241699, "global_step": 176913, "epoch": 4212} {"train_loss": -7.115894317626953, "global_step": 176914, "epoch": 4212} {"train_loss": -7.045881271362305, "global_step": 176915, "epoch": 4212} {"train_loss": -7.1094865798950195, "global_step": 176916, "epoch": 4212} {"train_loss": -6.983894348144531, "global_step": 176917, "epoch": 4212} {"train_loss": -7.0310163497924805, "global_step": 176918, "epoch": 4212} {"train_loss": -7.160538673400879, "global_step": 176919, "epoch": 4212} {"train_loss": -7.126873970031738, "global_step": 176920, "epoch": 4212} {"train_loss": -7.155031204223633, "global_step": 176921, "epoch": 4212} {"train_loss": -7.096321105957031, "global_step": 176922, "epoch": 4212} {"train_loss": -7.061844348907471, "global_step": 176923, "epoch": 4212} {"train_loss": -7.117664337158203, "global_step": 176924, "epoch": 4212} {"train_loss": -7.038972854614258, "global_step": 176925, "epoch": 4212} {"train_loss": -7.005415916442871, "global_step": 176926, "epoch": 4212} {"train_loss": -6.983358383178711, "global_step": 176927, "epoch": 4212} {"train_loss": -7.050164699554443, "global_step": 176928, "epoch": 4212} {"train_loss": -7.002167224884033, "global_step": 176929, "epoch": 4212} {"train_loss": -7.078338146209717, "global_step": 176930, "epoch": 4212} {"train_loss": -6.937704086303711, "global_step": 176931, "epoch": 4212} {"train_loss": -7.049083709716797, "global_step": 176932, "epoch": 4212} {"train_loss": -7.031142234802246, "global_step": 176933, "epoch": 4212} {"train_loss": -7.0635905265808105, "global_step": 176934, "epoch": 4212} {"train_loss": -7.022927761077881, "global_step": 176935, "epoch": 4212} {"train_loss": -6.999386310577393, "global_step": 176936, "epoch": 4212} {"train_loss": -6.992789268493652, "global_step": 176937, "epoch": 4212} {"train_loss": -6.926652908325195, "global_step": 176938, "epoch": 4212} {"train_loss": -7.0804033279418945, "global_step": 176939, "epoch": 4212} {"train_loss": -7.065611362457275, "global_step": 176940, "epoch": 4212} {"train_loss": -7.092364311218262, "global_step": 176941, "epoch": 4212} {"train_loss": -6.987660884857178, "global_step": 176942, "epoch": 4212} {"train_loss": -7.119133472442627, "global_step": 176943, "epoch": 4212} {"train_loss": -7.019749164581299, "global_step": 176944, "epoch": 4212} {"train_loss": -7.048720212209792, "global_step": 176945, "epoch": 4212, "val_loss": 68498.765625} {"train_loss": -7.1074371337890625, "global_step": 176946, "epoch": 4213} {"train_loss": -7.04428243637085, "global_step": 176947, "epoch": 4213} {"train_loss": -6.970490455627441, "global_step": 176948, "epoch": 4213} {"train_loss": -7.059473991394043, "global_step": 176949, "epoch": 4213} {"train_loss": -7.075187683105469, "global_step": 176950, "epoch": 4213} {"train_loss": -6.983788013458252, "global_step": 176951, "epoch": 4213} {"train_loss": -7.090821266174316, "global_step": 176952, "epoch": 4213} {"train_loss": -7.062222480773926, "global_step": 176953, "epoch": 4213} {"train_loss": -7.02265739440918, "global_step": 176954, "epoch": 4213} {"train_loss": -7.036836624145508, "global_step": 176955, "epoch": 4213} {"train_loss": -7.059560775756836, "global_step": 176956, "epoch": 4213} {"train_loss": -7.041133880615234, "global_step": 176957, "epoch": 4213} {"train_loss": -6.984465599060059, "global_step": 176958, "epoch": 4213} {"train_loss": -7.038013458251953, "global_step": 176959, "epoch": 4213} {"train_loss": -7.071421146392822, "global_step": 176960, "epoch": 4213} {"train_loss": -7.057021141052246, "global_step": 176961, "epoch": 4213} {"train_loss": -7.081854820251465, "global_step": 176962, "epoch": 4213} {"train_loss": -7.162569999694824, "global_step": 176963, "epoch": 4213} {"train_loss": -6.930536270141602, "global_step": 176964, "epoch": 4213} {"train_loss": -6.97175931930542, "global_step": 176965, "epoch": 4213} {"train_loss": -7.136711120605469, "global_step": 176966, "epoch": 4213} {"train_loss": -7.0099310874938965, "global_step": 176967, "epoch": 4213} {"train_loss": -6.9062604904174805, "global_step": 176968, "epoch": 4213} {"train_loss": -7.008902072906494, "global_step": 176969, "epoch": 4213} {"train_loss": -7.075871467590332, "global_step": 176970, "epoch": 4213} {"train_loss": -7.113962650299072, "global_step": 176971, "epoch": 4213} {"train_loss": -6.970951080322266, "global_step": 176972, "epoch": 4213} {"train_loss": -6.962622165679932, "global_step": 176973, "epoch": 4213} {"train_loss": -7.0237298011779785, "global_step": 176974, "epoch": 4213} {"train_loss": -6.988330841064453, "global_step": 176975, "epoch": 4213} {"train_loss": -7.122943878173828, "global_step": 176976, "epoch": 4213} {"train_loss": -7.118254661560059, "global_step": 176977, "epoch": 4213} {"train_loss": -7.14038610458374, "global_step": 176978, "epoch": 4213} {"train_loss": -7.06717586517334, "global_step": 176979, "epoch": 4213} {"train_loss": -7.099353790283203, "global_step": 176980, "epoch": 4213} {"train_loss": -7.109244346618652, "global_step": 176981, "epoch": 4213} {"train_loss": -7.142768383026123, "global_step": 176982, "epoch": 4213} {"train_loss": -7.047758102416992, "global_step": 176983, "epoch": 4213} {"train_loss": -7.065888404846191, "global_step": 176984, "epoch": 4213} {"train_loss": -7.13134765625, "global_step": 176985, "epoch": 4213} {"train_loss": -7.085086822509766, "global_step": 176986, "epoch": 4213} {"train_loss": -7.055604480561756, "global_step": 176987, "epoch": 4213, "val_loss": 68708.6953125} {"train_loss": -7.056881904602051, "global_step": 176988, "epoch": 4214} {"train_loss": -7.04153299331665, "global_step": 176989, "epoch": 4214} {"train_loss": -7.079306602478027, "global_step": 176990, "epoch": 4214} {"train_loss": -7.064942359924316, "global_step": 176991, "epoch": 4214} {"train_loss": -7.080906867980957, "global_step": 176992, "epoch": 4214} {"train_loss": -7.08980655670166, "global_step": 176993, "epoch": 4214} {"train_loss": -7.0897040367126465, "global_step": 176994, "epoch": 4214} {"train_loss": -7.145404815673828, "global_step": 176995, "epoch": 4214} {"train_loss": -7.146519660949707, "global_step": 176996, "epoch": 4214} {"train_loss": -7.059774398803711, "global_step": 176997, "epoch": 4214} {"train_loss": -7.158909320831299, "global_step": 176998, "epoch": 4214} {"train_loss": -7.129039764404297, "global_step": 176999, "epoch": 4214} {"train_loss": -7.1516571044921875, "global_step": 177000, "epoch": 4214} {"train_loss": -7.102849960327148, "global_step": 177001, "epoch": 4214} {"train_loss": -6.997179985046387, "global_step": 177002, "epoch": 4214} {"train_loss": -7.059362888336182, "global_step": 177003, "epoch": 4214} {"train_loss": -7.069423675537109, "global_step": 177004, "epoch": 4214} {"train_loss": -7.004852294921875, "global_step": 177005, "epoch": 4214} {"train_loss": -7.0477142333984375, "global_step": 177006, "epoch": 4214} {"train_loss": -7.043414115905762, "global_step": 177007, "epoch": 4214} {"train_loss": -7.059165000915527, "global_step": 177008, "epoch": 4214} {"train_loss": -7.147143840789795, "global_step": 177009, "epoch": 4214} {"train_loss": -7.11666202545166, "global_step": 177010, "epoch": 4214} {"train_loss": -6.958741188049316, "global_step": 177011, "epoch": 4214} {"train_loss": -7.066036224365234, "global_step": 177012, "epoch": 4214} {"train_loss": -7.0879364013671875, "global_step": 177013, "epoch": 4214} {"train_loss": -7.1302900314331055, "global_step": 177014, "epoch": 4214} {"train_loss": -7.041645050048828, "global_step": 177015, "epoch": 4214} {"train_loss": -7.1260294914245605, "global_step": 177016, "epoch": 4214} {"train_loss": -7.020336627960205, "global_step": 177017, "epoch": 4214} {"train_loss": -6.990497589111328, "global_step": 177018, "epoch": 4214} {"train_loss": -7.173104763031006, "global_step": 177019, "epoch": 4214} {"train_loss": -6.997275352478027, "global_step": 177020, "epoch": 4214} {"train_loss": -7.026333332061768, "global_step": 177021, "epoch": 4214} {"train_loss": -7.058809280395508, "global_step": 177022, "epoch": 4214} {"train_loss": -7.07531213760376, "global_step": 177023, "epoch": 4214} {"train_loss": -6.953176021575928, "global_step": 177024, "epoch": 4214} {"train_loss": -7.030747413635254, "global_step": 177025, "epoch": 4214} {"train_loss": -7.0127668380737305, "global_step": 177026, "epoch": 4214} {"train_loss": -6.886279106140137, "global_step": 177027, "epoch": 4214} {"train_loss": -7.0095109939575195, "global_step": 177028, "epoch": 4214} {"train_loss": -7.062486421494257, "global_step": 177029, "epoch": 4214, "val_loss": 68631.234375} {"train_loss": -6.969544410705566, "global_step": 177030, "epoch": 4215} {"train_loss": -6.913188934326172, "global_step": 177031, "epoch": 4215} {"train_loss": -6.911118984222412, "global_step": 177032, "epoch": 4215} {"train_loss": -6.9620771408081055, "global_step": 177033, "epoch": 4215} {"train_loss": -6.892685890197754, "global_step": 177034, "epoch": 4215} {"train_loss": -6.9947614669799805, "global_step": 177035, "epoch": 4215} {"train_loss": -7.032922744750977, "global_step": 177036, "epoch": 4215} {"train_loss": -6.91989278793335, "global_step": 177037, "epoch": 4215} {"train_loss": -6.962698459625244, "global_step": 177038, "epoch": 4215} {"train_loss": -7.249680519104004, "global_step": 177039, "epoch": 4215} {"train_loss": -6.9889326095581055, "global_step": 177040, "epoch": 4215} {"train_loss": -7.018797874450684, "global_step": 177041, "epoch": 4215} {"train_loss": -7.107517719268799, "global_step": 177042, "epoch": 4215} {"train_loss": -6.8877339363098145, "global_step": 177043, "epoch": 4215} {"train_loss": -7.025189399719238, "global_step": 177044, "epoch": 4215} {"train_loss": -6.908239364624023, "global_step": 177045, "epoch": 4215} {"train_loss": -6.962950706481934, "global_step": 177046, "epoch": 4215} {"train_loss": -6.969540119171143, "global_step": 177047, "epoch": 4215} {"train_loss": -6.820321083068848, "global_step": 177048, "epoch": 4215} {"train_loss": -6.985057830810547, "global_step": 177049, "epoch": 4215} {"train_loss": -6.943136215209961, "global_step": 177050, "epoch": 4215} {"train_loss": -6.955541133880615, "global_step": 177051, "epoch": 4215} {"train_loss": -6.91911506652832, "global_step": 177052, "epoch": 4215} {"train_loss": -6.934781551361084, "global_step": 177053, "epoch": 4215} {"train_loss": -6.960563659667969, "global_step": 177054, "epoch": 4215} {"train_loss": -7.079922676086426, "global_step": 177055, "epoch": 4215} {"train_loss": -6.936990737915039, "global_step": 177056, "epoch": 4215} {"train_loss": -6.968573093414307, "global_step": 177057, "epoch": 4215} {"train_loss": -7.0043768882751465, "global_step": 177058, "epoch": 4215} {"train_loss": -7.042999267578125, "global_step": 177059, "epoch": 4215} {"train_loss": -7.123628616333008, "global_step": 177060, "epoch": 4215} {"train_loss": -6.991536617279053, "global_step": 177061, "epoch": 4215} {"train_loss": -7.000154495239258, "global_step": 177062, "epoch": 4215} {"train_loss": -7.056018829345703, "global_step": 177063, "epoch": 4215} {"train_loss": -7.019818305969238, "global_step": 177064, "epoch": 4215} {"train_loss": -7.017313003540039, "global_step": 177065, "epoch": 4215} {"train_loss": -7.070431709289551, "global_step": 177066, "epoch": 4215} {"train_loss": -6.981332302093506, "global_step": 177067, "epoch": 4215} {"train_loss": -7.02708625793457, "global_step": 177068, "epoch": 4215} {"train_loss": -7.032357692718506, "global_step": 177069, "epoch": 4215} {"train_loss": -6.897385120391846, "global_step": 177070, "epoch": 4215} {"train_loss": -6.988254217874436, "global_step": 177071, "epoch": 4215, "val_loss": 68762.3671875} {"train_loss": -7.018409729003906, "global_step": 177072, "epoch": 4216} {"train_loss": -7.085848331451416, "global_step": 177073, "epoch": 4216} {"train_loss": -7.071583271026611, "global_step": 177074, "epoch": 4216} {"train_loss": -6.969182014465332, "global_step": 177075, "epoch": 4216} {"train_loss": -6.9703049659729, "global_step": 177076, "epoch": 4216} {"train_loss": -7.122781753540039, "global_step": 177077, "epoch": 4216} {"train_loss": -7.1232500076293945, "global_step": 177078, "epoch": 4216} {"train_loss": -6.9769206047058105, "global_step": 177079, "epoch": 4216} {"train_loss": -6.99665641784668, "global_step": 177080, "epoch": 4216} {"train_loss": -6.98356819152832, "global_step": 177081, "epoch": 4216} {"train_loss": -7.017086029052734, "global_step": 177082, "epoch": 4216} {"train_loss": -6.999920845031738, "global_step": 177083, "epoch": 4216} {"train_loss": -7.086668014526367, "global_step": 177084, "epoch": 4216} {"train_loss": -7.02894926071167, "global_step": 177085, "epoch": 4216} {"train_loss": -7.06496524810791, "global_step": 177086, "epoch": 4216} {"train_loss": -7.0329694747924805, "global_step": 177087, "epoch": 4216} {"train_loss": -7.06663703918457, "global_step": 177088, "epoch": 4216} {"train_loss": -7.055164813995361, "global_step": 177089, "epoch": 4216} {"train_loss": -7.065401077270508, "global_step": 177090, "epoch": 4216} {"train_loss": -7.065146446228027, "global_step": 177091, "epoch": 4216} {"train_loss": -7.018780708312988, "global_step": 177092, "epoch": 4216} {"train_loss": -7.123199462890625, "global_step": 177093, "epoch": 4216} {"train_loss": -7.017899990081787, "global_step": 177094, "epoch": 4216} {"train_loss": -7.0718913078308105, "global_step": 177095, "epoch": 4216} {"train_loss": -7.054654121398926, "global_step": 177096, "epoch": 4216} {"train_loss": -7.1594038009643555, "global_step": 177097, "epoch": 4216} {"train_loss": -7.129931449890137, "global_step": 177098, "epoch": 4216} {"train_loss": -7.106046676635742, "global_step": 177099, "epoch": 4216} {"train_loss": -6.97319221496582, "global_step": 177100, "epoch": 4216} {"train_loss": -7.061697483062744, "global_step": 177101, "epoch": 4216} {"train_loss": -7.027148246765137, "global_step": 177102, "epoch": 4216} {"train_loss": -6.9623122215271, "global_step": 177103, "epoch": 4216} {"train_loss": -6.987782955169678, "global_step": 177104, "epoch": 4216} {"train_loss": -7.054829120635986, "global_step": 177105, "epoch": 4216} {"train_loss": -7.15103816986084, "global_step": 177106, "epoch": 4216} {"train_loss": -6.94915246963501, "global_step": 177107, "epoch": 4216} {"train_loss": -6.915454864501953, "global_step": 177108, "epoch": 4216} {"train_loss": -7.088457107543945, "global_step": 177109, "epoch": 4216} {"train_loss": -6.817184925079346, "global_step": 177110, "epoch": 4216} {"train_loss": -6.954828262329102, "global_step": 177111, "epoch": 4216} {"train_loss": -7.091732978820801, "global_step": 177112, "epoch": 4216} {"train_loss": -7.03503832362947, "global_step": 177113, "epoch": 4216, "val_loss": 68694.3359375} {"train_loss": -7.016026496887207, "global_step": 177114, "epoch": 4217} {"train_loss": -6.890512466430664, "global_step": 177115, "epoch": 4217} {"train_loss": -7.037133693695068, "global_step": 177116, "epoch": 4217} {"train_loss": -6.907641410827637, "global_step": 177117, "epoch": 4217} {"train_loss": -7.00656795501709, "global_step": 177118, "epoch": 4217} {"train_loss": -6.951570510864258, "global_step": 177119, "epoch": 4217} {"train_loss": -6.9667253494262695, "global_step": 177120, "epoch": 4217} {"train_loss": -7.011958122253418, "global_step": 177121, "epoch": 4217} {"train_loss": -6.970127582550049, "global_step": 177122, "epoch": 4217} {"train_loss": -6.973282814025879, "global_step": 177123, "epoch": 4217} {"train_loss": -7.098240375518799, "global_step": 177124, "epoch": 4217} {"train_loss": -6.951354503631592, "global_step": 177125, "epoch": 4217} {"train_loss": -7.166354179382324, "global_step": 177126, "epoch": 4217} {"train_loss": -6.932593822479248, "global_step": 177127, "epoch": 4217} {"train_loss": -7.100497722625732, "global_step": 177128, "epoch": 4217} {"train_loss": -6.993358135223389, "global_step": 177129, "epoch": 4217} {"train_loss": -6.956151962280273, "global_step": 177130, "epoch": 4217} {"train_loss": -6.996456146240234, "global_step": 177131, "epoch": 4217} {"train_loss": -7.092467784881592, "global_step": 177132, "epoch": 4217} {"train_loss": -7.041597366333008, "global_step": 177133, "epoch": 4217} {"train_loss": -7.026956558227539, "global_step": 177134, "epoch": 4217} {"train_loss": -6.961818695068359, "global_step": 177135, "epoch": 4217} {"train_loss": -7.013456344604492, "global_step": 177136, "epoch": 4217} {"train_loss": -7.085414886474609, "global_step": 177137, "epoch": 4217} {"train_loss": -6.933329105377197, "global_step": 177138, "epoch": 4217} {"train_loss": -6.877994537353516, "global_step": 177139, "epoch": 4217} {"train_loss": -6.941954612731934, "global_step": 177140, "epoch": 4217} {"train_loss": -6.967220783233643, "global_step": 177141, "epoch": 4217} {"train_loss": -6.994892120361328, "global_step": 177142, "epoch": 4217} {"train_loss": -7.111234664916992, "global_step": 177143, "epoch": 4217} {"train_loss": -7.165977478027344, "global_step": 177144, "epoch": 4217} {"train_loss": -7.025208473205566, "global_step": 177145, "epoch": 4217} {"train_loss": -7.1090989112854, "global_step": 177146, "epoch": 4217} {"train_loss": -7.11817741394043, "global_step": 177147, "epoch": 4217} {"train_loss": -6.928559303283691, "global_step": 177148, "epoch": 4217} {"train_loss": -7.116199493408203, "global_step": 177149, "epoch": 4217} {"train_loss": -7.059017658233643, "global_step": 177150, "epoch": 4217} {"train_loss": -7.042929649353027, "global_step": 177151, "epoch": 4217} {"train_loss": -7.030755043029785, "global_step": 177152, "epoch": 4217} {"train_loss": -7.131793022155762, "global_step": 177153, "epoch": 4217} {"train_loss": -7.152327537536621, "global_step": 177154, "epoch": 4217} {"train_loss": -7.0225652285984586, "global_step": 177155, "epoch": 4217, "val_loss": 68629.984375} {"train_loss": -7.161266326904297, "global_step": 177156, "epoch": 4218} {"train_loss": -7.013998508453369, "global_step": 177157, "epoch": 4218} {"train_loss": -6.92625093460083, "global_step": 177158, "epoch": 4218} {"train_loss": -7.067568302154541, "global_step": 177159, "epoch": 4218} {"train_loss": -7.0780181884765625, "global_step": 177160, "epoch": 4218} {"train_loss": -7.001595497131348, "global_step": 177161, "epoch": 4218} {"train_loss": -6.988761901855469, "global_step": 177162, "epoch": 4218} {"train_loss": -7.215290069580078, "global_step": 177163, "epoch": 4218} {"train_loss": -7.118300914764404, "global_step": 177164, "epoch": 4218} {"train_loss": -7.077534198760986, "global_step": 177165, "epoch": 4218} {"train_loss": -7.09710693359375, "global_step": 177166, "epoch": 4218} {"train_loss": -7.003507137298584, "global_step": 177167, "epoch": 4218} {"train_loss": -7.17266845703125, "global_step": 177168, "epoch": 4218} {"train_loss": -6.995433807373047, "global_step": 177169, "epoch": 4218} {"train_loss": -6.9636335372924805, "global_step": 177170, "epoch": 4218} {"train_loss": -7.080985069274902, "global_step": 177171, "epoch": 4218} {"train_loss": -7.033804893493652, "global_step": 177172, "epoch": 4218} {"train_loss": -6.883790969848633, "global_step": 177173, "epoch": 4218} {"train_loss": -7.115747451782227, "global_step": 177174, "epoch": 4218} {"train_loss": -6.92031192779541, "global_step": 177175, "epoch": 4218} {"train_loss": -7.0573320388793945, "global_step": 177176, "epoch": 4218} {"train_loss": -7.055028438568115, "global_step": 177177, "epoch": 4218} {"train_loss": -7.067510604858398, "global_step": 177178, "epoch": 4218} {"train_loss": -7.092792510986328, "global_step": 177179, "epoch": 4218} {"train_loss": -7.029324054718018, "global_step": 177180, "epoch": 4218} {"train_loss": -7.157452583312988, "global_step": 177181, "epoch": 4218} {"train_loss": -7.119029521942139, "global_step": 177182, "epoch": 4218} {"train_loss": -7.172239303588867, "global_step": 177183, "epoch": 4218} {"train_loss": -7.052321434020996, "global_step": 177184, "epoch": 4218} {"train_loss": -7.049961090087891, "global_step": 177185, "epoch": 4218} {"train_loss": -7.028602600097656, "global_step": 177186, "epoch": 4218} {"train_loss": -7.080064296722412, "global_step": 177187, "epoch": 4218} {"train_loss": -7.021328449249268, "global_step": 177188, "epoch": 4218} {"train_loss": -6.992790222167969, "global_step": 177189, "epoch": 4218} {"train_loss": -7.178728103637695, "global_step": 177190, "epoch": 4218} {"train_loss": -7.056665897369385, "global_step": 177191, "epoch": 4218} {"train_loss": -7.028881072998047, "global_step": 177192, "epoch": 4218} {"train_loss": -7.01297664642334, "global_step": 177193, "epoch": 4218} {"train_loss": -6.9934401512146, "global_step": 177194, "epoch": 4218} {"train_loss": -7.000481605529785, "global_step": 177195, "epoch": 4218} {"train_loss": -7.186245918273926, "global_step": 177196, "epoch": 4218} {"train_loss": -7.057690972373599, "global_step": 177197, "epoch": 4218, "val_loss": 68844.984375} {"train_loss": -7.07908296585083, "global_step": 177198, "epoch": 4219} {"train_loss": -7.132620334625244, "global_step": 177199, "epoch": 4219} {"train_loss": -6.952338218688965, "global_step": 177200, "epoch": 4219} {"train_loss": -7.016584396362305, "global_step": 177201, "epoch": 4219} {"train_loss": -7.075717926025391, "global_step": 177202, "epoch": 4219} {"train_loss": -6.762970447540283, "global_step": 177203, "epoch": 4219} {"train_loss": -6.938180446624756, "global_step": 177204, "epoch": 4219} {"train_loss": -6.989004135131836, "global_step": 177205, "epoch": 4219} {"train_loss": -6.899375915527344, "global_step": 177206, "epoch": 4219} {"train_loss": -7.070318698883057, "global_step": 177207, "epoch": 4219} {"train_loss": -6.908051013946533, "global_step": 177208, "epoch": 4219} {"train_loss": -6.985988140106201, "global_step": 177209, "epoch": 4219} {"train_loss": -6.837868690490723, "global_step": 177210, "epoch": 4219} {"train_loss": -6.992695331573486, "global_step": 177211, "epoch": 4219} {"train_loss": -6.944601535797119, "global_step": 177212, "epoch": 4219} {"train_loss": -6.993813514709473, "global_step": 177213, "epoch": 4219} {"train_loss": -7.030141353607178, "global_step": 177214, "epoch": 4219} {"train_loss": -7.0678606033325195, "global_step": 177215, "epoch": 4219} {"train_loss": -6.959588050842285, "global_step": 177216, "epoch": 4219} {"train_loss": -6.986103534698486, "global_step": 177217, "epoch": 4219} {"train_loss": -6.955134391784668, "global_step": 177218, "epoch": 4219} {"train_loss": -6.982113838195801, "global_step": 177219, "epoch": 4219} {"train_loss": -7.002551078796387, "global_step": 177220, "epoch": 4219} {"train_loss": -7.037072658538818, "global_step": 177221, "epoch": 4219} {"train_loss": -7.107439041137695, "global_step": 177222, "epoch": 4219} {"train_loss": -6.8842244148254395, "global_step": 177223, "epoch": 4219} {"train_loss": -7.0383734703063965, "global_step": 177224, "epoch": 4219} {"train_loss": -6.9801740646362305, "global_step": 177225, "epoch": 4219} {"train_loss": -7.070571422576904, "global_step": 177226, "epoch": 4219} {"train_loss": -6.917757987976074, "global_step": 177227, "epoch": 4219} {"train_loss": -6.95152473449707, "global_step": 177228, "epoch": 4219} {"train_loss": -7.021856307983398, "global_step": 177229, "epoch": 4219} {"train_loss": -7.011480331420898, "global_step": 177230, "epoch": 4219} {"train_loss": -7.056997299194336, "global_step": 177231, "epoch": 4219} {"train_loss": -6.945063591003418, "global_step": 177232, "epoch": 4219} {"train_loss": -7.030505180358887, "global_step": 177233, "epoch": 4219} {"train_loss": -6.953474521636963, "global_step": 177234, "epoch": 4219} {"train_loss": -6.983949661254883, "global_step": 177235, "epoch": 4219} {"train_loss": -7.0985002517700195, "global_step": 177236, "epoch": 4219} {"train_loss": -7.047903060913086, "global_step": 177237, "epoch": 4219} {"train_loss": -7.008749961853027, "global_step": 177238, "epoch": 4219} {"train_loss": -6.995235851832798, "global_step": 177239, "epoch": 4219, "val_loss": 68602.6953125} {"train_loss": -6.961813926696777, "global_step": 177240, "epoch": 4220} {"train_loss": -6.999182224273682, "global_step": 177241, "epoch": 4220} {"train_loss": -6.981133937835693, "global_step": 177242, "epoch": 4220} {"train_loss": -6.963133335113525, "global_step": 177243, "epoch": 4220} {"train_loss": -7.02725887298584, "global_step": 177244, "epoch": 4220} {"train_loss": -7.171085357666016, "global_step": 177245, "epoch": 4220} {"train_loss": -6.960475444793701, "global_step": 177246, "epoch": 4220} {"train_loss": -7.015793800354004, "global_step": 177247, "epoch": 4220} {"train_loss": -7.023553848266602, "global_step": 177248, "epoch": 4220} {"train_loss": -7.058236122131348, "global_step": 177249, "epoch": 4220} {"train_loss": -7.064257621765137, "global_step": 177250, "epoch": 4220} {"train_loss": -7.074695110321045, "global_step": 177251, "epoch": 4220} {"train_loss": -7.1617631912231445, "global_step": 177252, "epoch": 4220} {"train_loss": -7.059624671936035, "global_step": 177253, "epoch": 4220} {"train_loss": -7.0782694816589355, "global_step": 177254, "epoch": 4220} {"train_loss": -7.0374040603637695, "global_step": 177255, "epoch": 4220} {"train_loss": -7.0882344245910645, "global_step": 177256, "epoch": 4220} {"train_loss": -7.066561698913574, "global_step": 177257, "epoch": 4220} {"train_loss": -7.09055233001709, "global_step": 177258, "epoch": 4220} {"train_loss": -7.020931243896484, "global_step": 177259, "epoch": 4220} {"train_loss": -6.960026741027832, "global_step": 177260, "epoch": 4220} {"train_loss": -7.1087727546691895, "global_step": 177261, "epoch": 4220} {"train_loss": -6.970726490020752, "global_step": 177262, "epoch": 4220} {"train_loss": -7.011845588684082, "global_step": 177263, "epoch": 4220} {"train_loss": -7.032096862792969, "global_step": 177264, "epoch": 4220} {"train_loss": -6.924912452697754, "global_step": 177265, "epoch": 4220} {"train_loss": -7.043790817260742, "global_step": 177266, "epoch": 4220} {"train_loss": -7.0675249099731445, "global_step": 177267, "epoch": 4220} {"train_loss": -6.891355991363525, "global_step": 177268, "epoch": 4220} {"train_loss": -7.126674652099609, "global_step": 177269, "epoch": 4220} {"train_loss": -6.822396278381348, "global_step": 177270, "epoch": 4220} {"train_loss": -7.1028947830200195, "global_step": 177271, "epoch": 4220} {"train_loss": -6.846585273742676, "global_step": 177272, "epoch": 4220} {"train_loss": -6.949816703796387, "global_step": 177273, "epoch": 4220} {"train_loss": -6.861947059631348, "global_step": 177274, "epoch": 4220} {"train_loss": -6.974205493927002, "global_step": 177275, "epoch": 4220} {"train_loss": -6.902028560638428, "global_step": 177276, "epoch": 4220} {"train_loss": -6.924137115478516, "global_step": 177277, "epoch": 4220} {"train_loss": -6.986693382263184, "global_step": 177278, "epoch": 4220} {"train_loss": -6.9021453857421875, "global_step": 177279, "epoch": 4220} {"train_loss": -6.926764965057373, "global_step": 177280, "epoch": 4220} {"train_loss": -7.002969355810256, "global_step": 177281, "epoch": 4220, "val_loss": 68695.484375} {"train_loss": -6.88253116607666, "global_step": 177282, "epoch": 4221} {"train_loss": -7.038431167602539, "global_step": 177283, "epoch": 4221} {"train_loss": -6.864603519439697, "global_step": 177284, "epoch": 4221} {"train_loss": -7.06841516494751, "global_step": 177285, "epoch": 4221} {"train_loss": -7.030304431915283, "global_step": 177286, "epoch": 4221} {"train_loss": -7.017470836639404, "global_step": 177287, "epoch": 4221} {"train_loss": -7.130914688110352, "global_step": 177288, "epoch": 4221} {"train_loss": -6.9482526779174805, "global_step": 177289, "epoch": 4221} {"train_loss": -6.942685127258301, "global_step": 177290, "epoch": 4221} {"train_loss": -7.015582084655762, "global_step": 177291, "epoch": 4221} {"train_loss": -7.0124969482421875, "global_step": 177292, "epoch": 4221} {"train_loss": -7.042159080505371, "global_step": 177293, "epoch": 4221} {"train_loss": -6.915919303894043, "global_step": 177294, "epoch": 4221} {"train_loss": -7.077273845672607, "global_step": 177295, "epoch": 4221} {"train_loss": -7.038508415222168, "global_step": 177296, "epoch": 4221} {"train_loss": -6.992679595947266, "global_step": 177297, "epoch": 4221} {"train_loss": -7.051846504211426, "global_step": 177298, "epoch": 4221} {"train_loss": -7.035732269287109, "global_step": 177299, "epoch": 4221} {"train_loss": -7.039183616638184, "global_step": 177300, "epoch": 4221} {"train_loss": -7.154783725738525, "global_step": 177301, "epoch": 4221} {"train_loss": -7.0500359535217285, "global_step": 177302, "epoch": 4221} {"train_loss": -7.149867057800293, "global_step": 177303, "epoch": 4221} {"train_loss": -7.081843376159668, "global_step": 177304, "epoch": 4221} {"train_loss": -7.179134368896484, "global_step": 177305, "epoch": 4221} {"train_loss": -7.0805463790893555, "global_step": 177306, "epoch": 4221} {"train_loss": -7.071260452270508, "global_step": 177307, "epoch": 4221} {"train_loss": -7.12783145904541, "global_step": 177308, "epoch": 4221} {"train_loss": -7.070803642272949, "global_step": 177309, "epoch": 4221} {"train_loss": -7.156739711761475, "global_step": 177310, "epoch": 4221} {"train_loss": -7.0494256019592285, "global_step": 177311, "epoch": 4221} {"train_loss": -7.113715648651123, "global_step": 177312, "epoch": 4221} {"train_loss": -7.123222351074219, "global_step": 177313, "epoch": 4221} {"train_loss": -7.070775032043457, "global_step": 177314, "epoch": 4221} {"train_loss": -7.094757080078125, "global_step": 177315, "epoch": 4221} {"train_loss": -7.0406293869018555, "global_step": 177316, "epoch": 4221} {"train_loss": -7.077508449554443, "global_step": 177317, "epoch": 4221} {"train_loss": -6.949185371398926, "global_step": 177318, "epoch": 4221} {"train_loss": -7.047107696533203, "global_step": 177319, "epoch": 4221} {"train_loss": -7.125096797943115, "global_step": 177320, "epoch": 4221} {"train_loss": -7.094811916351318, "global_step": 177321, "epoch": 4221} {"train_loss": -7.070653915405273, "global_step": 177322, "epoch": 4221} {"train_loss": -7.051491521653675, "global_step": 177323, "epoch": 4221, "val_loss": 68619.5078125} {"train_loss": -7.156322479248047, "global_step": 177324, "epoch": 4222} {"train_loss": -6.998773097991943, "global_step": 177325, "epoch": 4222} {"train_loss": -7.045546531677246, "global_step": 177326, "epoch": 4222} {"train_loss": -7.093750953674316, "global_step": 177327, "epoch": 4222} {"train_loss": -7.153153419494629, "global_step": 177328, "epoch": 4222} {"train_loss": -7.0947265625, "global_step": 177329, "epoch": 4222} {"train_loss": -7.063778877258301, "global_step": 177330, "epoch": 4222} {"train_loss": -7.074042320251465, "global_step": 177331, "epoch": 4222} {"train_loss": -7.135756492614746, "global_step": 177332, "epoch": 4222} {"train_loss": -7.092379093170166, "global_step": 177333, "epoch": 4222} {"train_loss": -7.104078769683838, "global_step": 177334, "epoch": 4222} {"train_loss": -7.114575386047363, "global_step": 177335, "epoch": 4222} {"train_loss": -7.163213729858398, "global_step": 177336, "epoch": 4222} {"train_loss": -7.17085075378418, "global_step": 177337, "epoch": 4222} {"train_loss": -7.133689880371094, "global_step": 177338, "epoch": 4222} {"train_loss": -7.080280780792236, "global_step": 177339, "epoch": 4222} {"train_loss": -7.030922889709473, "global_step": 177340, "epoch": 4222} {"train_loss": -7.087887763977051, "global_step": 177341, "epoch": 4222} {"train_loss": -7.040979385375977, "global_step": 177342, "epoch": 4222} {"train_loss": -6.996419429779053, "global_step": 177343, "epoch": 4222} {"train_loss": -7.0455522537231445, "global_step": 177344, "epoch": 4222} {"train_loss": -7.100213527679443, "global_step": 177345, "epoch": 4222} {"train_loss": -7.03583288192749, "global_step": 177346, "epoch": 4222} {"train_loss": -7.064220428466797, "global_step": 177347, "epoch": 4222} {"train_loss": -7.061820983886719, "global_step": 177348, "epoch": 4222} {"train_loss": -7.046502590179443, "global_step": 177349, "epoch": 4222} {"train_loss": -6.971559047698975, "global_step": 177350, "epoch": 4222} {"train_loss": -6.993434906005859, "global_step": 177351, "epoch": 4222} {"train_loss": -6.958873748779297, "global_step": 177352, "epoch": 4222} {"train_loss": -6.9217095375061035, "global_step": 177353, "epoch": 4222} {"train_loss": -7.001949787139893, "global_step": 177354, "epoch": 4222} {"train_loss": -7.071399211883545, "global_step": 177355, "epoch": 4222} {"train_loss": -7.050276756286621, "global_step": 177356, "epoch": 4222} {"train_loss": -6.969891548156738, "global_step": 177357, "epoch": 4222} {"train_loss": -7.010806560516357, "global_step": 177358, "epoch": 4222} {"train_loss": -6.996590614318848, "global_step": 177359, "epoch": 4222} {"train_loss": -7.1680521965026855, "global_step": 177360, "epoch": 4222} {"train_loss": -7.086243629455566, "global_step": 177361, "epoch": 4222} {"train_loss": -7.089208602905273, "global_step": 177362, "epoch": 4222} {"train_loss": -6.999942779541016, "global_step": 177363, "epoch": 4222} {"train_loss": -7.025622367858887, "global_step": 177364, "epoch": 4222} {"train_loss": -7.057688940139044, "global_step": 177365, "epoch": 4222, "val_loss": 68766.0859375} {"train_loss": -7.154048442840576, "global_step": 177366, "epoch": 4223} {"train_loss": -6.985652923583984, "global_step": 177367, "epoch": 4223} {"train_loss": -7.129669189453125, "global_step": 177368, "epoch": 4223} {"train_loss": -7.0857086181640625, "global_step": 177369, "epoch": 4223} {"train_loss": -6.981532096862793, "global_step": 177370, "epoch": 4223} {"train_loss": -7.194368362426758, "global_step": 177371, "epoch": 4223} {"train_loss": -7.176906585693359, "global_step": 177372, "epoch": 4223} {"train_loss": -7.132152557373047, "global_step": 177373, "epoch": 4223} {"train_loss": -7.060988426208496, "global_step": 177374, "epoch": 4223} {"train_loss": -7.095944404602051, "global_step": 177375, "epoch": 4223} {"train_loss": -7.056794166564941, "global_step": 177376, "epoch": 4223} {"train_loss": -7.16423225402832, "global_step": 177377, "epoch": 4223} {"train_loss": -7.005495548248291, "global_step": 177378, "epoch": 4223} {"train_loss": -7.15580940246582, "global_step": 177379, "epoch": 4223} {"train_loss": -7.06659460067749, "global_step": 177380, "epoch": 4223} {"train_loss": -6.9538493156433105, "global_step": 177381, "epoch": 4223} {"train_loss": -7.083934307098389, "global_step": 177382, "epoch": 4223} {"train_loss": -7.052034378051758, "global_step": 177383, "epoch": 4223} {"train_loss": -7.129979133605957, "global_step": 177384, "epoch": 4223} {"train_loss": -7.066133499145508, "global_step": 177385, "epoch": 4223} {"train_loss": -6.934863567352295, "global_step": 177386, "epoch": 4223} {"train_loss": -7.067987442016602, "global_step": 177387, "epoch": 4223} {"train_loss": -7.102341651916504, "global_step": 177388, "epoch": 4223} {"train_loss": -7.056177616119385, "global_step": 177389, "epoch": 4223} {"train_loss": -7.024423599243164, "global_step": 177390, "epoch": 4223} {"train_loss": -7.146421432495117, "global_step": 177391, "epoch": 4223} {"train_loss": -7.086626052856445, "global_step": 177392, "epoch": 4223} {"train_loss": -6.952548027038574, "global_step": 177393, "epoch": 4223} {"train_loss": -7.023441314697266, "global_step": 177394, "epoch": 4223} {"train_loss": -6.961156845092773, "global_step": 177395, "epoch": 4223} {"train_loss": -6.975049018859863, "global_step": 177396, "epoch": 4223} {"train_loss": -7.038818836212158, "global_step": 177397, "epoch": 4223} {"train_loss": -7.089496612548828, "global_step": 177398, "epoch": 4223} {"train_loss": -6.974517345428467, "global_step": 177399, "epoch": 4223} {"train_loss": -7.094564437866211, "global_step": 177400, "epoch": 4223} {"train_loss": -7.093033313751221, "global_step": 177401, "epoch": 4223} {"train_loss": -7.001497268676758, "global_step": 177402, "epoch": 4223} {"train_loss": -7.144450664520264, "global_step": 177403, "epoch": 4223} {"train_loss": -7.003698348999023, "global_step": 177404, "epoch": 4223} {"train_loss": -7.00681734085083, "global_step": 177405, "epoch": 4223} {"train_loss": -7.200324058532715, "global_step": 177406, "epoch": 4223} {"train_loss": -7.066088608333042, "global_step": 177407, "epoch": 4223, "val_loss": 68584.2109375} {"train_loss": -7.030301094055176, "global_step": 177408, "epoch": 4224} {"train_loss": -7.09705924987793, "global_step": 177409, "epoch": 4224} {"train_loss": -7.1719207763671875, "global_step": 177410, "epoch": 4224} {"train_loss": -7.009941101074219, "global_step": 177411, "epoch": 4224} {"train_loss": -7.07189416885376, "global_step": 177412, "epoch": 4224} {"train_loss": -7.057463645935059, "global_step": 177413, "epoch": 4224} {"train_loss": -7.041936874389648, "global_step": 177414, "epoch": 4224} {"train_loss": -7.03726863861084, "global_step": 177415, "epoch": 4224} {"train_loss": -7.1107940673828125, "global_step": 177416, "epoch": 4224} {"train_loss": -6.930624961853027, "global_step": 177417, "epoch": 4224} {"train_loss": -7.104147911071777, "global_step": 177418, "epoch": 4224} {"train_loss": -7.099310398101807, "global_step": 177419, "epoch": 4224} {"train_loss": -7.2172088623046875, "global_step": 177420, "epoch": 4224} {"train_loss": -7.098653793334961, "global_step": 177421, "epoch": 4224} {"train_loss": -7.055542469024658, "global_step": 177422, "epoch": 4224} {"train_loss": -7.113377094268799, "global_step": 177423, "epoch": 4224} {"train_loss": -6.974163055419922, "global_step": 177424, "epoch": 4224} {"train_loss": -7.1460700035095215, "global_step": 177425, "epoch": 4224} {"train_loss": -7.035310745239258, "global_step": 177426, "epoch": 4224} {"train_loss": -6.944366455078125, "global_step": 177427, "epoch": 4224} {"train_loss": -7.028002738952637, "global_step": 177428, "epoch": 4224} {"train_loss": -7.0940446853637695, "global_step": 177429, "epoch": 4224} {"train_loss": -7.017049789428711, "global_step": 177430, "epoch": 4224} {"train_loss": -7.083552360534668, "global_step": 177431, "epoch": 4224} {"train_loss": -7.019571304321289, "global_step": 177432, "epoch": 4224} {"train_loss": -7.141915321350098, "global_step": 177433, "epoch": 4224} {"train_loss": -7.084245681762695, "global_step": 177434, "epoch": 4224} {"train_loss": -7.027119159698486, "global_step": 177435, "epoch": 4224} {"train_loss": -7.095033645629883, "global_step": 177436, "epoch": 4224} {"train_loss": -7.078247547149658, "global_step": 177437, "epoch": 4224} {"train_loss": -7.116448402404785, "global_step": 177438, "epoch": 4224} {"train_loss": -6.999297142028809, "global_step": 177439, "epoch": 4224} {"train_loss": -7.16339111328125, "global_step": 177440, "epoch": 4224} {"train_loss": -7.062677383422852, "global_step": 177441, "epoch": 4224} {"train_loss": -7.144002914428711, "global_step": 177442, "epoch": 4224} {"train_loss": -7.157290458679199, "global_step": 177443, "epoch": 4224} {"train_loss": -7.096671104431152, "global_step": 177444, "epoch": 4224} {"train_loss": -7.130527496337891, "global_step": 177445, "epoch": 4224} {"train_loss": -7.036728382110596, "global_step": 177446, "epoch": 4224} {"train_loss": -7.111367225646973, "global_step": 177447, "epoch": 4224} {"train_loss": -7.093365669250488, "global_step": 177448, "epoch": 4224} {"train_loss": -7.077117658796764, "global_step": 177449, "epoch": 4224, "val_loss": 68612.9453125} {"train_loss": -7.124765396118164, "global_step": 177450, "epoch": 4225} {"train_loss": -7.0854902267456055, "global_step": 177451, "epoch": 4225} {"train_loss": -7.110774040222168, "global_step": 177452, "epoch": 4225} {"train_loss": -7.090860366821289, "global_step": 177453, "epoch": 4225} {"train_loss": -7.1082329750061035, "global_step": 177454, "epoch": 4225} {"train_loss": -6.998917579650879, "global_step": 177455, "epoch": 4225} {"train_loss": -7.024297714233398, "global_step": 177456, "epoch": 4225} {"train_loss": -6.967166900634766, "global_step": 177457, "epoch": 4225} {"train_loss": -7.049966812133789, "global_step": 177458, "epoch": 4225} {"train_loss": -6.9822893142700195, "global_step": 177459, "epoch": 4225} {"train_loss": -7.107590675354004, "global_step": 177460, "epoch": 4225} {"train_loss": -6.904954433441162, "global_step": 177461, "epoch": 4225} {"train_loss": -7.000721454620361, "global_step": 177462, "epoch": 4225} {"train_loss": -6.994624137878418, "global_step": 177463, "epoch": 4225} {"train_loss": -6.978908061981201, "global_step": 177464, "epoch": 4225} {"train_loss": -7.156152725219727, "global_step": 177465, "epoch": 4225} {"train_loss": -6.976675987243652, "global_step": 177466, "epoch": 4225} {"train_loss": -6.999978065490723, "global_step": 177467, "epoch": 4225} {"train_loss": -6.9583516120910645, "global_step": 177468, "epoch": 4225} {"train_loss": -7.093262672424316, "global_step": 177469, "epoch": 4225} {"train_loss": -6.877501010894775, "global_step": 177470, "epoch": 4225} {"train_loss": -6.9989399909973145, "global_step": 177471, "epoch": 4225} {"train_loss": -7.054141044616699, "global_step": 177472, "epoch": 4225} {"train_loss": -6.959939479827881, "global_step": 177473, "epoch": 4225} {"train_loss": -6.926169395446777, "global_step": 177474, "epoch": 4225} {"train_loss": -6.98182487487793, "global_step": 177475, "epoch": 4225} {"train_loss": -7.017207145690918, "global_step": 177476, "epoch": 4225} {"train_loss": -6.9944257736206055, "global_step": 177477, "epoch": 4225} {"train_loss": -6.991131782531738, "global_step": 177478, "epoch": 4225} {"train_loss": -6.9413275718688965, "global_step": 177479, "epoch": 4225} {"train_loss": -6.85155725479126, "global_step": 177480, "epoch": 4225} {"train_loss": -6.994473934173584, "global_step": 177481, "epoch": 4225} {"train_loss": -6.964983940124512, "global_step": 177482, "epoch": 4225} {"train_loss": -7.01872444152832, "global_step": 177483, "epoch": 4225} {"train_loss": -7.024170398712158, "global_step": 177484, "epoch": 4225} {"train_loss": -6.867162227630615, "global_step": 177485, "epoch": 4225} {"train_loss": -6.96290397644043, "global_step": 177486, "epoch": 4225} {"train_loss": -7.072688102722168, "global_step": 177487, "epoch": 4225} {"train_loss": -7.015424728393555, "global_step": 177488, "epoch": 4225} {"train_loss": -6.983940124511719, "global_step": 177489, "epoch": 4225} {"train_loss": -7.028316974639893, "global_step": 177490, "epoch": 4225} {"train_loss": -7.004762218112037, "global_step": 177491, "epoch": 4225, "val_loss": 68928.2109375} {"train_loss": -7.007956504821777, "global_step": 177492, "epoch": 4226} {"train_loss": -7.035803318023682, "global_step": 177493, "epoch": 4226} {"train_loss": -7.134116172790527, "global_step": 177494, "epoch": 4226} {"train_loss": -7.0119757652282715, "global_step": 177495, "epoch": 4226} {"train_loss": -7.102241039276123, "global_step": 177496, "epoch": 4226} {"train_loss": -6.978634834289551, "global_step": 177497, "epoch": 4226} {"train_loss": -6.959220886230469, "global_step": 177498, "epoch": 4226} {"train_loss": -7.068046569824219, "global_step": 177499, "epoch": 4226} {"train_loss": -7.057323455810547, "global_step": 177500, "epoch": 4226} {"train_loss": -7.065506458282471, "global_step": 177501, "epoch": 4226} {"train_loss": -7.18857479095459, "global_step": 177502, "epoch": 4226} {"train_loss": -7.1165008544921875, "global_step": 177503, "epoch": 4226} {"train_loss": -7.105569839477539, "global_step": 177504, "epoch": 4226} {"train_loss": -7.190749168395996, "global_step": 177505, "epoch": 4226} {"train_loss": -6.971430778503418, "global_step": 177506, "epoch": 4226} {"train_loss": -7.054555416107178, "global_step": 177507, "epoch": 4226} {"train_loss": -7.012424468994141, "global_step": 177508, "epoch": 4226} {"train_loss": -7.16823673248291, "global_step": 177509, "epoch": 4226} {"train_loss": -6.956635475158691, "global_step": 177510, "epoch": 4226} {"train_loss": -7.001644134521484, "global_step": 177511, "epoch": 4226} {"train_loss": -7.045226097106934, "global_step": 177512, "epoch": 4226} {"train_loss": -7.065059185028076, "global_step": 177513, "epoch": 4226} {"train_loss": -7.055844306945801, "global_step": 177514, "epoch": 4226} {"train_loss": -6.989856719970703, "global_step": 177515, "epoch": 4226} {"train_loss": -7.012250900268555, "global_step": 177516, "epoch": 4226} {"train_loss": -6.991180896759033, "global_step": 177517, "epoch": 4226} {"train_loss": -7.023255348205566, "global_step": 177518, "epoch": 4226} {"train_loss": -7.007996082305908, "global_step": 177519, "epoch": 4226} {"train_loss": -7.033453941345215, "global_step": 177520, "epoch": 4226} {"train_loss": -7.233697414398193, "global_step": 177521, "epoch": 4226} {"train_loss": -7.060535907745361, "global_step": 177522, "epoch": 4226} {"train_loss": -7.0681610107421875, "global_step": 177523, "epoch": 4226} {"train_loss": -7.071203231811523, "global_step": 177524, "epoch": 4226} {"train_loss": -7.105756759643555, "global_step": 177525, "epoch": 4226} {"train_loss": -7.0271196365356445, "global_step": 177526, "epoch": 4226} {"train_loss": -7.17176628112793, "global_step": 177527, "epoch": 4226} {"train_loss": -7.154973983764648, "global_step": 177528, "epoch": 4226} {"train_loss": -7.1109619140625, "global_step": 177529, "epoch": 4226} {"train_loss": -7.089663982391357, "global_step": 177530, "epoch": 4226} {"train_loss": -7.071598529815674, "global_step": 177531, "epoch": 4226} {"train_loss": -7.103207111358643, "global_step": 177532, "epoch": 4226} {"train_loss": -7.0645413512275335, "global_step": 177533, "epoch": 4226, "val_loss": 68888.0859375} {"train_loss": -7.083510398864746, "global_step": 177534, "epoch": 4227} {"train_loss": -7.052762508392334, "global_step": 177535, "epoch": 4227} {"train_loss": -7.112738609313965, "global_step": 177536, "epoch": 4227} {"train_loss": -7.058104515075684, "global_step": 177537, "epoch": 4227} {"train_loss": -7.094798564910889, "global_step": 177538, "epoch": 4227} {"train_loss": -7.126821517944336, "global_step": 177539, "epoch": 4227} {"train_loss": -6.993580341339111, "global_step": 177540, "epoch": 4227} {"train_loss": -7.095911979675293, "global_step": 177541, "epoch": 4227} {"train_loss": -7.03427791595459, "global_step": 177542, "epoch": 4227} {"train_loss": -7.070112228393555, "global_step": 177543, "epoch": 4227} {"train_loss": -7.066734790802002, "global_step": 177544, "epoch": 4227} {"train_loss": -6.965715408325195, "global_step": 177545, "epoch": 4227} {"train_loss": -7.05849552154541, "global_step": 177546, "epoch": 4227} {"train_loss": -7.079277992248535, "global_step": 177547, "epoch": 4227} {"train_loss": -7.146422863006592, "global_step": 177548, "epoch": 4227} {"train_loss": -7.14265775680542, "global_step": 177549, "epoch": 4227} {"train_loss": -7.023013591766357, "global_step": 177550, "epoch": 4227} {"train_loss": -6.9949951171875, "global_step": 177551, "epoch": 4227} {"train_loss": -7.018241882324219, "global_step": 177552, "epoch": 4227} {"train_loss": -6.877992630004883, "global_step": 177553, "epoch": 4227} {"train_loss": -7.0266313552856445, "global_step": 177554, "epoch": 4227} {"train_loss": -7.07247257232666, "global_step": 177555, "epoch": 4227} {"train_loss": -6.9080634117126465, "global_step": 177556, "epoch": 4227} {"train_loss": -7.217581748962402, "global_step": 177557, "epoch": 4227} {"train_loss": -6.921145439147949, "global_step": 177558, "epoch": 4227} {"train_loss": -7.143720626831055, "global_step": 177559, "epoch": 4227} {"train_loss": -7.013455390930176, "global_step": 177560, "epoch": 4227} {"train_loss": -6.947170734405518, "global_step": 177561, "epoch": 4227} {"train_loss": -7.050106048583984, "global_step": 177562, "epoch": 4227} {"train_loss": -6.972146987915039, "global_step": 177563, "epoch": 4227} {"train_loss": -6.980719566345215, "global_step": 177564, "epoch": 4227} {"train_loss": -6.934083938598633, "global_step": 177565, "epoch": 4227} {"train_loss": -7.025446891784668, "global_step": 177566, "epoch": 4227} {"train_loss": -7.096948623657227, "global_step": 177567, "epoch": 4227} {"train_loss": -6.994563579559326, "global_step": 177568, "epoch": 4227} {"train_loss": -7.040626049041748, "global_step": 177569, "epoch": 4227} {"train_loss": -6.899779796600342, "global_step": 177570, "epoch": 4227} {"train_loss": -7.029335021972656, "global_step": 177571, "epoch": 4227} {"train_loss": -6.978787899017334, "global_step": 177572, "epoch": 4227} {"train_loss": -6.874245643615723, "global_step": 177573, "epoch": 4227} {"train_loss": -6.889798164367676, "global_step": 177574, "epoch": 4227} {"train_loss": -7.024304526192801, "global_step": 177575, "epoch": 4227, "val_loss": 68725.0390625} {"train_loss": -7.051239013671875, "global_step": 177576, "epoch": 4228} {"train_loss": -6.919339179992676, "global_step": 177577, "epoch": 4228} {"train_loss": -6.985378265380859, "global_step": 177578, "epoch": 4228} {"train_loss": -7.057704925537109, "global_step": 177579, "epoch": 4228} {"train_loss": -6.854515075683594, "global_step": 177580, "epoch": 4228} {"train_loss": -6.906612873077393, "global_step": 177581, "epoch": 4228} {"train_loss": -6.923994064331055, "global_step": 177582, "epoch": 4228} {"train_loss": -6.9532694816589355, "global_step": 177583, "epoch": 4228} {"train_loss": -6.89005708694458, "global_step": 177584, "epoch": 4228} {"train_loss": -7.040288925170898, "global_step": 177585, "epoch": 4228} {"train_loss": -6.8579301834106445, "global_step": 177586, "epoch": 4228} {"train_loss": -6.910920143127441, "global_step": 177587, "epoch": 4228} {"train_loss": -6.844876289367676, "global_step": 177588, "epoch": 4228} {"train_loss": -7.0446696281433105, "global_step": 177589, "epoch": 4228} {"train_loss": -6.989674091339111, "global_step": 177590, "epoch": 4228} {"train_loss": -6.991947174072266, "global_step": 177591, "epoch": 4228} {"train_loss": -6.90434455871582, "global_step": 177592, "epoch": 4228} {"train_loss": -6.921628475189209, "global_step": 177593, "epoch": 4228} {"train_loss": -6.8521552085876465, "global_step": 177594, "epoch": 4228} {"train_loss": -6.973069667816162, "global_step": 177595, "epoch": 4228} {"train_loss": -6.879683494567871, "global_step": 177596, "epoch": 4228} {"train_loss": -6.904713153839111, "global_step": 177597, "epoch": 4228} {"train_loss": -6.986739635467529, "global_step": 177598, "epoch": 4228} {"train_loss": -6.959197521209717, "global_step": 177599, "epoch": 4228} {"train_loss": -7.0030012130737305, "global_step": 177600, "epoch": 4228} {"train_loss": -7.102273941040039, "global_step": 177601, "epoch": 4228} {"train_loss": -6.992584228515625, "global_step": 177602, "epoch": 4228} {"train_loss": -7.0048956871032715, "global_step": 177603, "epoch": 4228} {"train_loss": -7.044643402099609, "global_step": 177604, "epoch": 4228} {"train_loss": -6.944283485412598, "global_step": 177605, "epoch": 4228} {"train_loss": -7.086636543273926, "global_step": 177606, "epoch": 4228} {"train_loss": -6.96604585647583, "global_step": 177607, "epoch": 4228} {"train_loss": -6.989147186279297, "global_step": 177608, "epoch": 4228} {"train_loss": -7.027826309204102, "global_step": 177609, "epoch": 4228} {"train_loss": -6.96297550201416, "global_step": 177610, "epoch": 4228} {"train_loss": -6.912721633911133, "global_step": 177611, "epoch": 4228} {"train_loss": -7.105025768280029, "global_step": 177612, "epoch": 4228} {"train_loss": -6.924071311950684, "global_step": 177613, "epoch": 4228} {"train_loss": -7.00956392288208, "global_step": 177614, "epoch": 4228} {"train_loss": -6.9748616218566895, "global_step": 177615, "epoch": 4228} {"train_loss": -6.921602725982666, "global_step": 177616, "epoch": 4228} {"train_loss": -6.967099643888927, "global_step": 177617, "epoch": 4228, "val_loss": 68798.78125} {"train_loss": -7.0775227546691895, "global_step": 177618, "epoch": 4229} {"train_loss": -6.966213226318359, "global_step": 177619, "epoch": 4229} {"train_loss": -7.04672908782959, "global_step": 177620, "epoch": 4229} {"train_loss": -6.9599761962890625, "global_step": 177621, "epoch": 4229} {"train_loss": -7.113614559173584, "global_step": 177622, "epoch": 4229} {"train_loss": -7.059047698974609, "global_step": 177623, "epoch": 4229} {"train_loss": -7.003969192504883, "global_step": 177624, "epoch": 4229} {"train_loss": -6.929687976837158, "global_step": 177625, "epoch": 4229} {"train_loss": -7.089612007141113, "global_step": 177626, "epoch": 4229} {"train_loss": -7.037958145141602, "global_step": 177627, "epoch": 4229} {"train_loss": -7.055013179779053, "global_step": 177628, "epoch": 4229} {"train_loss": -6.981794357299805, "global_step": 177629, "epoch": 4229} {"train_loss": -6.959290504455566, "global_step": 177630, "epoch": 4229} {"train_loss": -7.148170471191406, "global_step": 177631, "epoch": 4229} {"train_loss": -7.033298969268799, "global_step": 177632, "epoch": 4229} {"train_loss": -7.102989196777344, "global_step": 177633, "epoch": 4229} {"train_loss": -7.016458988189697, "global_step": 177634, "epoch": 4229} {"train_loss": -7.064875602722168, "global_step": 177635, "epoch": 4229} {"train_loss": -7.0768632888793945, "global_step": 177636, "epoch": 4229} {"train_loss": -7.023552894592285, "global_step": 177637, "epoch": 4229} {"train_loss": -7.075153827667236, "global_step": 177638, "epoch": 4229} {"train_loss": -7.028605937957764, "global_step": 177639, "epoch": 4229} {"train_loss": -7.129204750061035, "global_step": 177640, "epoch": 4229} {"train_loss": -7.027289390563965, "global_step": 177641, "epoch": 4229} {"train_loss": -7.043391227722168, "global_step": 177642, "epoch": 4229} {"train_loss": -7.144360065460205, "global_step": 177643, "epoch": 4229} {"train_loss": -7.063185214996338, "global_step": 177644, "epoch": 4229} {"train_loss": -7.011624336242676, "global_step": 177645, "epoch": 4229} {"train_loss": -7.068089485168457, "global_step": 177646, "epoch": 4229} {"train_loss": -7.208974838256836, "global_step": 177647, "epoch": 4229} {"train_loss": -7.005967140197754, "global_step": 177648, "epoch": 4229} {"train_loss": -7.053896903991699, "global_step": 177649, "epoch": 4229} {"train_loss": -7.082034111022949, "global_step": 177650, "epoch": 4229} {"train_loss": -7.120368003845215, "global_step": 177651, "epoch": 4229} {"train_loss": -6.9782395362854, "global_step": 177652, "epoch": 4229} {"train_loss": -7.078010559082031, "global_step": 177653, "epoch": 4229} {"train_loss": -7.133401870727539, "global_step": 177654, "epoch": 4229} {"train_loss": -7.080539703369141, "global_step": 177655, "epoch": 4229} {"train_loss": -7.041234016418457, "global_step": 177656, "epoch": 4229} {"train_loss": -6.948060989379883, "global_step": 177657, "epoch": 4229} {"train_loss": -7.104257106781006, "global_step": 177658, "epoch": 4229} {"train_loss": -7.054667745317731, "global_step": 177659, "epoch": 4229, "val_loss": 68787.375} {"train_loss": -7.148798942565918, "global_step": 177660, "epoch": 4230} {"train_loss": -7.141299247741699, "global_step": 177661, "epoch": 4230} {"train_loss": -7.1062116622924805, "global_step": 177662, "epoch": 4230} {"train_loss": -7.097524642944336, "global_step": 177663, "epoch": 4230} {"train_loss": -7.034204483032227, "global_step": 177664, "epoch": 4230} {"train_loss": -7.0381951332092285, "global_step": 177665, "epoch": 4230} {"train_loss": -7.086592674255371, "global_step": 177666, "epoch": 4230} {"train_loss": -7.075419902801514, "global_step": 177667, "epoch": 4230} {"train_loss": -6.985687255859375, "global_step": 177668, "epoch": 4230} {"train_loss": -7.037215232849121, "global_step": 177669, "epoch": 4230} {"train_loss": -6.866503715515137, "global_step": 177670, "epoch": 4230} {"train_loss": -7.12407922744751, "global_step": 177671, "epoch": 4230} {"train_loss": -7.196282386779785, "global_step": 177672, "epoch": 4230} {"train_loss": -7.040743350982666, "global_step": 177673, "epoch": 4230} {"train_loss": -7.001476287841797, "global_step": 177674, "epoch": 4230} {"train_loss": -6.960252285003662, "global_step": 177675, "epoch": 4230} {"train_loss": -7.075936317443848, "global_step": 177676, "epoch": 4230} {"train_loss": -6.96544075012207, "global_step": 177677, "epoch": 4230} {"train_loss": -7.0506792068481445, "global_step": 177678, "epoch": 4230} {"train_loss": -7.058572769165039, "global_step": 177679, "epoch": 4230} {"train_loss": -6.927173137664795, "global_step": 177680, "epoch": 4230} {"train_loss": -7.110177040100098, "global_step": 177681, "epoch": 4230} {"train_loss": -7.063258171081543, "global_step": 177682, "epoch": 4230} {"train_loss": -7.05949068069458, "global_step": 177683, "epoch": 4230} {"train_loss": -7.062559127807617, "global_step": 177684, "epoch": 4230} {"train_loss": -6.948581695556641, "global_step": 177685, "epoch": 4230} {"train_loss": -7.093020439147949, "global_step": 177686, "epoch": 4230} {"train_loss": -7.0878705978393555, "global_step": 177687, "epoch": 4230} {"train_loss": -6.97819709777832, "global_step": 177688, "epoch": 4230} {"train_loss": -6.951089859008789, "global_step": 177689, "epoch": 4230} {"train_loss": -7.027290344238281, "global_step": 177690, "epoch": 4230} {"train_loss": -7.061359405517578, "global_step": 177691, "epoch": 4230} {"train_loss": -6.9959259033203125, "global_step": 177692, "epoch": 4230} {"train_loss": -7.052491188049316, "global_step": 177693, "epoch": 4230} {"train_loss": -7.032670974731445, "global_step": 177694, "epoch": 4230} {"train_loss": -6.9834136962890625, "global_step": 177695, "epoch": 4230} {"train_loss": -7.032097339630127, "global_step": 177696, "epoch": 4230} {"train_loss": -7.041566848754883, "global_step": 177697, "epoch": 4230} {"train_loss": -7.0508527755737305, "global_step": 177698, "epoch": 4230} {"train_loss": -7.14221715927124, "global_step": 177699, "epoch": 4230} {"train_loss": -7.01543664932251, "global_step": 177700, "epoch": 4230} {"train_loss": -7.043903260003953, "global_step": 177701, "epoch": 4230, "val_loss": 68481.203125} {"train_loss": -7.164849281311035, "global_step": 177702, "epoch": 4231} {"train_loss": -7.141626834869385, "global_step": 177703, "epoch": 4231} {"train_loss": -7.040441989898682, "global_step": 177704, "epoch": 4231} {"train_loss": -7.0349531173706055, "global_step": 177705, "epoch": 4231} {"train_loss": -7.0591607093811035, "global_step": 177706, "epoch": 4231} {"train_loss": -7.171792507171631, "global_step": 177707, "epoch": 4231} {"train_loss": -7.064816474914551, "global_step": 177708, "epoch": 4231} {"train_loss": -7.0831756591796875, "global_step": 177709, "epoch": 4231} {"train_loss": -7.1231207847595215, "global_step": 177710, "epoch": 4231} {"train_loss": -7.062828063964844, "global_step": 177711, "epoch": 4231} {"train_loss": -6.977054119110107, "global_step": 177712, "epoch": 4231} {"train_loss": -7.054605960845947, "global_step": 177713, "epoch": 4231} {"train_loss": -7.0651350021362305, "global_step": 177714, "epoch": 4231} {"train_loss": -7.033838272094727, "global_step": 177715, "epoch": 4231} {"train_loss": -7.031868934631348, "global_step": 177716, "epoch": 4231} {"train_loss": -7.079968452453613, "global_step": 177717, "epoch": 4231} {"train_loss": -7.0085296630859375, "global_step": 177718, "epoch": 4231} {"train_loss": -7.133432388305664, "global_step": 177719, "epoch": 4231} {"train_loss": -7.083359718322754, "global_step": 177720, "epoch": 4231} {"train_loss": -7.066271781921387, "global_step": 177721, "epoch": 4231} {"train_loss": -7.038493633270264, "global_step": 177722, "epoch": 4231} {"train_loss": -7.001506805419922, "global_step": 177723, "epoch": 4231} {"train_loss": -7.087837219238281, "global_step": 177724, "epoch": 4231} {"train_loss": -6.918972969055176, "global_step": 177725, "epoch": 4231} {"train_loss": -7.078828811645508, "global_step": 177726, "epoch": 4231} {"train_loss": -7.039099216461182, "global_step": 177727, "epoch": 4231} {"train_loss": -7.016271591186523, "global_step": 177728, "epoch": 4231} {"train_loss": -7.12120246887207, "global_step": 177729, "epoch": 4231} {"train_loss": -6.97021484375, "global_step": 177730, "epoch": 4231} {"train_loss": -6.973219871520996, "global_step": 177731, "epoch": 4231} {"train_loss": -6.94566535949707, "global_step": 177732, "epoch": 4231} {"train_loss": -6.993988990783691, "global_step": 177733, "epoch": 4231} {"train_loss": -7.005273342132568, "global_step": 177734, "epoch": 4231} {"train_loss": -6.888636589050293, "global_step": 177735, "epoch": 4231} {"train_loss": -6.911957740783691, "global_step": 177736, "epoch": 4231} {"train_loss": -6.957237243652344, "global_step": 177737, "epoch": 4231} {"train_loss": -6.872754096984863, "global_step": 177738, "epoch": 4231} {"train_loss": -6.951333999633789, "global_step": 177739, "epoch": 4231} {"train_loss": -6.973141193389893, "global_step": 177740, "epoch": 4231} {"train_loss": -6.920575141906738, "global_step": 177741, "epoch": 4231} {"train_loss": -6.992778778076172, "global_step": 177742, "epoch": 4231} {"train_loss": -7.022368147259667, "global_step": 177743, "epoch": 4231, "val_loss": 68752.3046875} {"train_loss": -7.113474369049072, "global_step": 177744, "epoch": 4232} {"train_loss": -6.952123641967773, "global_step": 177745, "epoch": 4232} {"train_loss": -6.978782653808594, "global_step": 177746, "epoch": 4232} {"train_loss": -6.971706390380859, "global_step": 177747, "epoch": 4232} {"train_loss": -6.999017715454102, "global_step": 177748, "epoch": 4232} {"train_loss": -6.8682780265808105, "global_step": 177749, "epoch": 4232} {"train_loss": -7.105026721954346, "global_step": 177750, "epoch": 4232} {"train_loss": -6.951153755187988, "global_step": 177751, "epoch": 4232} {"train_loss": -6.918628692626953, "global_step": 177752, "epoch": 4232} {"train_loss": -6.990584373474121, "global_step": 177753, "epoch": 4232} {"train_loss": -7.021719932556152, "global_step": 177754, "epoch": 4232} {"train_loss": -7.078535079956055, "global_step": 177755, "epoch": 4232} {"train_loss": -7.066778182983398, "global_step": 177756, "epoch": 4232} {"train_loss": -7.040193557739258, "global_step": 177757, "epoch": 4232} {"train_loss": -7.026705741882324, "global_step": 177758, "epoch": 4232} {"train_loss": -7.048666477203369, "global_step": 177759, "epoch": 4232} {"train_loss": -7.009964942932129, "global_step": 177760, "epoch": 4232} {"train_loss": -7.005617618560791, "global_step": 177761, "epoch": 4232} {"train_loss": -7.095649719238281, "global_step": 177762, "epoch": 4232} {"train_loss": -7.022536277770996, "global_step": 177763, "epoch": 4232} {"train_loss": -7.1426591873168945, "global_step": 177764, "epoch": 4232} {"train_loss": -6.9697089195251465, "global_step": 177765, "epoch": 4232} {"train_loss": -7.095700263977051, "global_step": 177766, "epoch": 4232} {"train_loss": -6.987338542938232, "global_step": 177767, "epoch": 4232} {"train_loss": -6.8950629234313965, "global_step": 177768, "epoch": 4232} {"train_loss": -7.111686706542969, "global_step": 177769, "epoch": 4232} {"train_loss": -7.065197944641113, "global_step": 177770, "epoch": 4232} {"train_loss": -7.013431549072266, "global_step": 177771, "epoch": 4232} {"train_loss": -6.931942462921143, "global_step": 177772, "epoch": 4232} {"train_loss": -6.981640815734863, "global_step": 177773, "epoch": 4232} {"train_loss": -7.000958442687988, "global_step": 177774, "epoch": 4232} {"train_loss": -7.017966270446777, "global_step": 177775, "epoch": 4232} {"train_loss": -7.090372085571289, "global_step": 177776, "epoch": 4232} {"train_loss": -7.088863372802734, "global_step": 177777, "epoch": 4232} {"train_loss": -7.068234443664551, "global_step": 177778, "epoch": 4232} {"train_loss": -7.097109794616699, "global_step": 177779, "epoch": 4232} {"train_loss": -7.053470611572266, "global_step": 177780, "epoch": 4232} {"train_loss": -7.151857852935791, "global_step": 177781, "epoch": 4232} {"train_loss": -7.053410530090332, "global_step": 177782, "epoch": 4232} {"train_loss": -7.101701736450195, "global_step": 177783, "epoch": 4232} {"train_loss": -7.077118873596191, "global_step": 177784, "epoch": 4232} {"train_loss": -7.03219545455206, "global_step": 177785, "epoch": 4232, "val_loss": 68744.9609375} {"train_loss": -7.117393970489502, "global_step": 177786, "epoch": 4233} {"train_loss": -7.069220066070557, "global_step": 177787, "epoch": 4233} {"train_loss": -7.065614700317383, "global_step": 177788, "epoch": 4233} {"train_loss": -7.002205848693848, "global_step": 177789, "epoch": 4233} {"train_loss": -7.157406806945801, "global_step": 177790, "epoch": 4233} {"train_loss": -7.109476089477539, "global_step": 177791, "epoch": 4233} {"train_loss": -7.187531471252441, "global_step": 177792, "epoch": 4233} {"train_loss": -7.08553409576416, "global_step": 177793, "epoch": 4233} {"train_loss": -7.109010219573975, "global_step": 177794, "epoch": 4233} {"train_loss": -7.136282920837402, "global_step": 177795, "epoch": 4233} {"train_loss": -7.051229953765869, "global_step": 177796, "epoch": 4233} {"train_loss": -7.04094934463501, "global_step": 177797, "epoch": 4233} {"train_loss": -7.063543796539307, "global_step": 177798, "epoch": 4233} {"train_loss": -7.150111198425293, "global_step": 177799, "epoch": 4233} {"train_loss": -6.998042583465576, "global_step": 177800, "epoch": 4233} {"train_loss": -7.034682750701904, "global_step": 177801, "epoch": 4233} {"train_loss": -7.1057515144348145, "global_step": 177802, "epoch": 4233} {"train_loss": -7.142541885375977, "global_step": 177803, "epoch": 4233} {"train_loss": -7.041186809539795, "global_step": 177804, "epoch": 4233} {"train_loss": -7.074077129364014, "global_step": 177805, "epoch": 4233} {"train_loss": -7.104575157165527, "global_step": 177806, "epoch": 4233} {"train_loss": -7.041512966156006, "global_step": 177807, "epoch": 4233} {"train_loss": -7.170973777770996, "global_step": 177808, "epoch": 4233} {"train_loss": -7.089076042175293, "global_step": 177809, "epoch": 4233} {"train_loss": -7.048274040222168, "global_step": 177810, "epoch": 4233} {"train_loss": -6.955389499664307, "global_step": 177811, "epoch": 4233} {"train_loss": -7.0499067306518555, "global_step": 177812, "epoch": 4233} {"train_loss": -6.994110107421875, "global_step": 177813, "epoch": 4233} {"train_loss": -7.052806854248047, "global_step": 177814, "epoch": 4233} {"train_loss": -6.988766193389893, "global_step": 177815, "epoch": 4233} {"train_loss": -7.078433036804199, "global_step": 177816, "epoch": 4233} {"train_loss": -7.035913467407227, "global_step": 177817, "epoch": 4233} {"train_loss": -7.064260005950928, "global_step": 177818, "epoch": 4233} {"train_loss": -7.107248306274414, "global_step": 177819, "epoch": 4233} {"train_loss": -7.031078338623047, "global_step": 177820, "epoch": 4233} {"train_loss": -6.979331016540527, "global_step": 177821, "epoch": 4233} {"train_loss": -7.044021129608154, "global_step": 177822, "epoch": 4233} {"train_loss": -7.043517112731934, "global_step": 177823, "epoch": 4233} {"train_loss": -7.095072269439697, "global_step": 177824, "epoch": 4233} {"train_loss": -7.204353332519531, "global_step": 177825, "epoch": 4233} {"train_loss": -6.991054534912109, "global_step": 177826, "epoch": 4233} {"train_loss": -7.0687098276047475, "global_step": 177827, "epoch": 4233, "val_loss": 68803.90625} {"train_loss": -7.092510223388672, "global_step": 177828, "epoch": 4234} {"train_loss": -7.052201271057129, "global_step": 177829, "epoch": 4234} {"train_loss": -7.091616630554199, "global_step": 177830, "epoch": 4234} {"train_loss": -7.043985366821289, "global_step": 177831, "epoch": 4234} {"train_loss": -7.091961860656738, "global_step": 177832, "epoch": 4234} {"train_loss": -7.217676639556885, "global_step": 177833, "epoch": 4234} {"train_loss": -7.021055698394775, "global_step": 177834, "epoch": 4234} {"train_loss": -6.830149173736572, "global_step": 177835, "epoch": 4234} {"train_loss": -6.987582206726074, "global_step": 177836, "epoch": 4234} {"train_loss": -6.988428115844727, "global_step": 177837, "epoch": 4234} {"train_loss": -6.972596168518066, "global_step": 177838, "epoch": 4234} {"train_loss": -7.004441261291504, "global_step": 177839, "epoch": 4234} {"train_loss": -6.945412635803223, "global_step": 177840, "epoch": 4234} {"train_loss": -6.91770076751709, "global_step": 177841, "epoch": 4234} {"train_loss": -6.9313812255859375, "global_step": 177842, "epoch": 4234} {"train_loss": -6.910195350646973, "global_step": 177843, "epoch": 4234} {"train_loss": -7.063438415527344, "global_step": 177844, "epoch": 4234} {"train_loss": -6.861291885375977, "global_step": 177845, "epoch": 4234} {"train_loss": -7.082952499389648, "global_step": 177846, "epoch": 4234} {"train_loss": -6.866825103759766, "global_step": 177847, "epoch": 4234} {"train_loss": -6.959957122802734, "global_step": 177848, "epoch": 4234} {"train_loss": -6.926083564758301, "global_step": 177849, "epoch": 4234} {"train_loss": -6.890307426452637, "global_step": 177850, "epoch": 4234} {"train_loss": -6.936249256134033, "global_step": 177851, "epoch": 4234} {"train_loss": -6.836524963378906, "global_step": 177852, "epoch": 4234} {"train_loss": -6.9149394035339355, "global_step": 177853, "epoch": 4234} {"train_loss": -6.93414831161499, "global_step": 177854, "epoch": 4234} {"train_loss": -7.039268970489502, "global_step": 177855, "epoch": 4234} {"train_loss": -6.912725925445557, "global_step": 177856, "epoch": 4234} {"train_loss": -6.941947937011719, "global_step": 177857, "epoch": 4234} {"train_loss": -6.96852970123291, "global_step": 177858, "epoch": 4234} {"train_loss": -6.8870038986206055, "global_step": 177859, "epoch": 4234} {"train_loss": -6.996964454650879, "global_step": 177860, "epoch": 4234} {"train_loss": -6.962775707244873, "global_step": 177861, "epoch": 4234} {"train_loss": -7.022582530975342, "global_step": 177862, "epoch": 4234} {"train_loss": -7.022793292999268, "global_step": 177863, "epoch": 4234} {"train_loss": -7.029705047607422, "global_step": 177864, "epoch": 4234} {"train_loss": -7.055724143981934, "global_step": 177865, "epoch": 4234} {"train_loss": -7.002985954284668, "global_step": 177866, "epoch": 4234} {"train_loss": -6.981733798980713, "global_step": 177867, "epoch": 4234} {"train_loss": -7.018835067749023, "global_step": 177868, "epoch": 4234} {"train_loss": -6.981141385577974, "global_step": 177869, "epoch": 4234, "val_loss": 68758.0859375} {"train_loss": -7.056473731994629, "global_step": 177870, "epoch": 4235} {"train_loss": -7.031705856323242, "global_step": 177871, "epoch": 4235} {"train_loss": -6.952686786651611, "global_step": 177872, "epoch": 4235} {"train_loss": -7.022162437438965, "global_step": 177873, "epoch": 4235} {"train_loss": -7.035397052764893, "global_step": 177874, "epoch": 4235} {"train_loss": -7.08597469329834, "global_step": 177875, "epoch": 4235} {"train_loss": -7.036833763122559, "global_step": 177876, "epoch": 4235} {"train_loss": -7.020129680633545, "global_step": 177877, "epoch": 4235} {"train_loss": -7.060080528259277, "global_step": 177878, "epoch": 4235} {"train_loss": -7.0734453201293945, "global_step": 177879, "epoch": 4235} {"train_loss": -7.002459526062012, "global_step": 177880, "epoch": 4235} {"train_loss": -7.138849258422852, "global_step": 177881, "epoch": 4235} {"train_loss": -7.022124290466309, "global_step": 177882, "epoch": 4235} {"train_loss": -7.054075717926025, "global_step": 177883, "epoch": 4235} {"train_loss": -7.23582649230957, "global_step": 177884, "epoch": 4235} {"train_loss": -6.982686996459961, "global_step": 177885, "epoch": 4235} {"train_loss": -6.971646308898926, "global_step": 177886, "epoch": 4235} {"train_loss": -7.166583061218262, "global_step": 177887, "epoch": 4235} {"train_loss": -6.895749092102051, "global_step": 177888, "epoch": 4235} {"train_loss": -7.085290908813477, "global_step": 177889, "epoch": 4235} {"train_loss": -6.960725784301758, "global_step": 177890, "epoch": 4235} {"train_loss": -7.249034881591797, "global_step": 177891, "epoch": 4235} {"train_loss": -7.045680046081543, "global_step": 177892, "epoch": 4235} {"train_loss": -7.076136589050293, "global_step": 177893, "epoch": 4235} {"train_loss": -7.173025608062744, "global_step": 177894, "epoch": 4235} {"train_loss": -7.005346298217773, "global_step": 177895, "epoch": 4235} {"train_loss": -7.082457542419434, "global_step": 177896, "epoch": 4235} {"train_loss": -7.126495361328125, "global_step": 177897, "epoch": 4235} {"train_loss": -7.0277509689331055, "global_step": 177898, "epoch": 4235} {"train_loss": -7.096994400024414, "global_step": 177899, "epoch": 4235} {"train_loss": -7.151917457580566, "global_step": 177900, "epoch": 4235} {"train_loss": -7.032182693481445, "global_step": 177901, "epoch": 4235} {"train_loss": -7.037914276123047, "global_step": 177902, "epoch": 4235} {"train_loss": -6.986815929412842, "global_step": 177903, "epoch": 4235} {"train_loss": -7.0394086837768555, "global_step": 177904, "epoch": 4235} {"train_loss": -7.029154300689697, "global_step": 177905, "epoch": 4235} {"train_loss": -7.085447311401367, "global_step": 177906, "epoch": 4235} {"train_loss": -6.909196853637695, "global_step": 177907, "epoch": 4235} {"train_loss": -7.005198955535889, "global_step": 177908, "epoch": 4235} {"train_loss": -7.025248050689697, "global_step": 177909, "epoch": 4235} {"train_loss": -6.955953121185303, "global_step": 177910, "epoch": 4235} {"train_loss": -7.04990047500247, "global_step": 177911, "epoch": 4235, "val_loss": 68605.09375} {"train_loss": -7.02318000793457, "global_step": 177912, "epoch": 4236} {"train_loss": -7.006617546081543, "global_step": 177913, "epoch": 4236} {"train_loss": -6.862941741943359, "global_step": 177914, "epoch": 4236} {"train_loss": -7.043881893157959, "global_step": 177915, "epoch": 4236} {"train_loss": -7.033050060272217, "global_step": 177916, "epoch": 4236} {"train_loss": -7.009176254272461, "global_step": 177917, "epoch": 4236} {"train_loss": -7.106450080871582, "global_step": 177918, "epoch": 4236} {"train_loss": -6.961647033691406, "global_step": 177919, "epoch": 4236} {"train_loss": -7.092931747436523, "global_step": 177920, "epoch": 4236} {"train_loss": -7.077020645141602, "global_step": 177921, "epoch": 4236} {"train_loss": -6.99212121963501, "global_step": 177922, "epoch": 4236} {"train_loss": -7.068484306335449, "global_step": 177923, "epoch": 4236} {"train_loss": -7.062829971313477, "global_step": 177924, "epoch": 4236} {"train_loss": -7.16850471496582, "global_step": 177925, "epoch": 4236} {"train_loss": -7.03947114944458, "global_step": 177926, "epoch": 4236} {"train_loss": -7.010892868041992, "global_step": 177927, "epoch": 4236} {"train_loss": -7.055420875549316, "global_step": 177928, "epoch": 4236} {"train_loss": -7.062844276428223, "global_step": 177929, "epoch": 4236} {"train_loss": -7.192692279815674, "global_step": 177930, "epoch": 4236} {"train_loss": -7.136828422546387, "global_step": 177931, "epoch": 4236} {"train_loss": -6.890937805175781, "global_step": 177932, "epoch": 4236} {"train_loss": -6.901144027709961, "global_step": 177933, "epoch": 4236} {"train_loss": -7.073726654052734, "global_step": 177934, "epoch": 4236} {"train_loss": -6.925743103027344, "global_step": 177935, "epoch": 4236} {"train_loss": -6.89518404006958, "global_step": 177936, "epoch": 4236} {"train_loss": -6.933589458465576, "global_step": 177937, "epoch": 4236} {"train_loss": -6.9332709312438965, "global_step": 177938, "epoch": 4236} {"train_loss": -7.032365798950195, "global_step": 177939, "epoch": 4236} {"train_loss": -6.981029987335205, "global_step": 177940, "epoch": 4236} {"train_loss": -6.967865943908691, "global_step": 177941, "epoch": 4236} {"train_loss": -6.7927470207214355, "global_step": 177942, "epoch": 4236} {"train_loss": -6.990918159484863, "global_step": 177943, "epoch": 4236} {"train_loss": -6.906800270080566, "global_step": 177944, "epoch": 4236} {"train_loss": -6.916875839233398, "global_step": 177945, "epoch": 4236} {"train_loss": -7.042107105255127, "global_step": 177946, "epoch": 4236} {"train_loss": -7.0132060050964355, "global_step": 177947, "epoch": 4236} {"train_loss": -6.9036102294921875, "global_step": 177948, "epoch": 4236} {"train_loss": -7.04849910736084, "global_step": 177949, "epoch": 4236} {"train_loss": -7.054786682128906, "global_step": 177950, "epoch": 4236} {"train_loss": -7.104239463806152, "global_step": 177951, "epoch": 4236} {"train_loss": -7.025943279266357, "global_step": 177952, "epoch": 4236} {"train_loss": -7.009277752467564, "global_step": 177953, "epoch": 4236, "val_loss": 68810.6953125} {"train_loss": -7.0300445556640625, "global_step": 177954, "epoch": 4237} {"train_loss": -7.094756126403809, "global_step": 177955, "epoch": 4237} {"train_loss": -7.157527446746826, "global_step": 177956, "epoch": 4237} {"train_loss": -7.092097282409668, "global_step": 177957, "epoch": 4237} {"train_loss": -7.0572052001953125, "global_step": 177958, "epoch": 4237} {"train_loss": -7.02134895324707, "global_step": 177959, "epoch": 4237} {"train_loss": -7.045434951782227, "global_step": 177960, "epoch": 4237} {"train_loss": -6.989465236663818, "global_step": 177961, "epoch": 4237} {"train_loss": -7.006689071655273, "global_step": 177962, "epoch": 4237} {"train_loss": -7.016207695007324, "global_step": 177963, "epoch": 4237} {"train_loss": -6.7691521644592285, "global_step": 177964, "epoch": 4237} {"train_loss": -7.136932373046875, "global_step": 177965, "epoch": 4237} {"train_loss": -6.997668743133545, "global_step": 177966, "epoch": 4237} {"train_loss": -7.098015785217285, "global_step": 177967, "epoch": 4237} {"train_loss": -7.1114959716796875, "global_step": 177968, "epoch": 4237} {"train_loss": -7.037898540496826, "global_step": 177969, "epoch": 4237} {"train_loss": -7.071369171142578, "global_step": 177970, "epoch": 4237} {"train_loss": -6.942586898803711, "global_step": 177971, "epoch": 4237} {"train_loss": -7.18191385269165, "global_step": 177972, "epoch": 4237} {"train_loss": -6.948093891143799, "global_step": 177973, "epoch": 4237} {"train_loss": -6.99080753326416, "global_step": 177974, "epoch": 4237} {"train_loss": -6.969822883605957, "global_step": 177975, "epoch": 4237} {"train_loss": -6.855408191680908, "global_step": 177976, "epoch": 4237} {"train_loss": -7.039468765258789, "global_step": 177977, "epoch": 4237} {"train_loss": -6.928304195404053, "global_step": 177978, "epoch": 4237} {"train_loss": -7.054421424865723, "global_step": 177979, "epoch": 4237} {"train_loss": -6.9278483390808105, "global_step": 177980, "epoch": 4237} {"train_loss": -7.038310527801514, "global_step": 177981, "epoch": 4237} {"train_loss": -6.971567153930664, "global_step": 177982, "epoch": 4237} {"train_loss": -6.952001571655273, "global_step": 177983, "epoch": 4237} {"train_loss": -7.089416980743408, "global_step": 177984, "epoch": 4237} {"train_loss": -6.935220718383789, "global_step": 177985, "epoch": 4237} {"train_loss": -7.112128257751465, "global_step": 177986, "epoch": 4237} {"train_loss": -7.0386834144592285, "global_step": 177987, "epoch": 4237} {"train_loss": -7.038601875305176, "global_step": 177988, "epoch": 4237} {"train_loss": -6.977468013763428, "global_step": 177989, "epoch": 4237} {"train_loss": -6.948697090148926, "global_step": 177990, "epoch": 4237} {"train_loss": -7.000016212463379, "global_step": 177991, "epoch": 4237} {"train_loss": -6.934676647186279, "global_step": 177992, "epoch": 4237} {"train_loss": -6.970981597900391, "global_step": 177993, "epoch": 4237} {"train_loss": -7.039426803588867, "global_step": 177994, "epoch": 4237} {"train_loss": -7.013873713357108, "global_step": 177995, "epoch": 4237, "val_loss": 68703.90625} {"train_loss": -7.161311149597168, "global_step": 177996, "epoch": 4238} {"train_loss": -7.049327850341797, "global_step": 177997, "epoch": 4238} {"train_loss": -6.933435440063477, "global_step": 177998, "epoch": 4238} {"train_loss": -7.0865654945373535, "global_step": 177999, "epoch": 4238} {"train_loss": -7.124894142150879, "global_step": 178000, "epoch": 4238} {"train_loss": -7.018212795257568, "global_step": 178001, "epoch": 4238} {"train_loss": -7.059174537658691, "global_step": 178002, "epoch": 4238} {"train_loss": -7.043981552124023, "global_step": 178003, "epoch": 4238} {"train_loss": -7.029822826385498, "global_step": 178004, "epoch": 4238} {"train_loss": -7.03187370300293, "global_step": 178005, "epoch": 4238} {"train_loss": -7.008760929107666, "global_step": 178006, "epoch": 4238} {"train_loss": -7.109570503234863, "global_step": 178007, "epoch": 4238} {"train_loss": -7.098196983337402, "global_step": 178008, "epoch": 4238} {"train_loss": -7.112464904785156, "global_step": 178009, "epoch": 4238} {"train_loss": -7.174472808837891, "global_step": 178010, "epoch": 4238} {"train_loss": -7.017616271972656, "global_step": 178011, "epoch": 4238} {"train_loss": -7.08891487121582, "global_step": 178012, "epoch": 4238} {"train_loss": -7.139471054077148, "global_step": 178013, "epoch": 4238} {"train_loss": -7.0895795822143555, "global_step": 178014, "epoch": 4238} {"train_loss": -7.103240966796875, "global_step": 178015, "epoch": 4238} {"train_loss": -7.085592746734619, "global_step": 178016, "epoch": 4238} {"train_loss": -7.082914352416992, "global_step": 178017, "epoch": 4238} {"train_loss": -7.099159240722656, "global_step": 178018, "epoch": 4238} {"train_loss": -6.974078178405762, "global_step": 178019, "epoch": 4238} {"train_loss": -7.015950679779053, "global_step": 178020, "epoch": 4238} {"train_loss": -6.999728679656982, "global_step": 178021, "epoch": 4238} {"train_loss": -6.876732349395752, "global_step": 178022, "epoch": 4238} {"train_loss": -7.080765724182129, "global_step": 178023, "epoch": 4238} {"train_loss": -7.035129547119141, "global_step": 178024, "epoch": 4238} {"train_loss": -7.05259895324707, "global_step": 178025, "epoch": 4238} {"train_loss": -6.96953010559082, "global_step": 178026, "epoch": 4238} {"train_loss": -7.06698751449585, "global_step": 178027, "epoch": 4238} {"train_loss": -7.017684459686279, "global_step": 178028, "epoch": 4238} {"train_loss": -7.052666664123535, "global_step": 178029, "epoch": 4238} {"train_loss": -7.2017059326171875, "global_step": 178030, "epoch": 4238} {"train_loss": -6.936441898345947, "global_step": 178031, "epoch": 4238} {"train_loss": -7.0498456954956055, "global_step": 178032, "epoch": 4238} {"train_loss": -7.059941291809082, "global_step": 178033, "epoch": 4238} {"train_loss": -6.963450908660889, "global_step": 178034, "epoch": 4238} {"train_loss": -7.101496696472168, "global_step": 178035, "epoch": 4238} {"train_loss": -7.009400367736816, "global_step": 178036, "epoch": 4238} {"train_loss": -7.0511883326939175, "global_step": 178037, "epoch": 4238, "val_loss": 68604.5546875} {"train_loss": -7.10572624206543, "global_step": 178038, "epoch": 4239} {"train_loss": -7.0261993408203125, "global_step": 178039, "epoch": 4239} {"train_loss": -7.090939044952393, "global_step": 178040, "epoch": 4239} {"train_loss": -7.020650386810303, "global_step": 178041, "epoch": 4239} {"train_loss": -6.92230224609375, "global_step": 178042, "epoch": 4239} {"train_loss": -6.991916656494141, "global_step": 178043, "epoch": 4239} {"train_loss": -7.039421558380127, "global_step": 178044, "epoch": 4239} {"train_loss": -7.013071060180664, "global_step": 178045, "epoch": 4239} {"train_loss": -7.125115394592285, "global_step": 178046, "epoch": 4239} {"train_loss": -6.959765434265137, "global_step": 178047, "epoch": 4239} {"train_loss": -6.997384071350098, "global_step": 178048, "epoch": 4239} {"train_loss": -7.078174591064453, "global_step": 178049, "epoch": 4239} {"train_loss": -6.964087009429932, "global_step": 178050, "epoch": 4239} {"train_loss": -7.007360935211182, "global_step": 178051, "epoch": 4239} {"train_loss": -6.993407249450684, "global_step": 178052, "epoch": 4239} {"train_loss": -7.048976421356201, "global_step": 178053, "epoch": 4239} {"train_loss": -6.9261322021484375, "global_step": 178054, "epoch": 4239} {"train_loss": -7.1206955909729, "global_step": 178055, "epoch": 4239} {"train_loss": -7.037651538848877, "global_step": 178056, "epoch": 4239} {"train_loss": -7.056535720825195, "global_step": 178057, "epoch": 4239} {"train_loss": -7.11704158782959, "global_step": 178058, "epoch": 4239} {"train_loss": -6.978914260864258, "global_step": 178059, "epoch": 4239} {"train_loss": -6.985042095184326, "global_step": 178060, "epoch": 4239} {"train_loss": -7.0013203620910645, "global_step": 178061, "epoch": 4239} {"train_loss": -7.020707130432129, "global_step": 178062, "epoch": 4239} {"train_loss": -7.145267486572266, "global_step": 178063, "epoch": 4239} {"train_loss": -7.08924674987793, "global_step": 178064, "epoch": 4239} {"train_loss": -6.911309242248535, "global_step": 178065, "epoch": 4239} {"train_loss": -7.07134485244751, "global_step": 178066, "epoch": 4239} {"train_loss": -7.026433944702148, "global_step": 178067, "epoch": 4239} {"train_loss": -6.931153297424316, "global_step": 178068, "epoch": 4239} {"train_loss": -7.138047218322754, "global_step": 178069, "epoch": 4239} {"train_loss": -7.076260566711426, "global_step": 178070, "epoch": 4239} {"train_loss": -7.131278038024902, "global_step": 178071, "epoch": 4239} {"train_loss": -7.133746147155762, "global_step": 178072, "epoch": 4239} {"train_loss": -7.060558319091797, "global_step": 178073, "epoch": 4239} {"train_loss": -7.1382222175598145, "global_step": 178074, "epoch": 4239} {"train_loss": -7.080841064453125, "global_step": 178075, "epoch": 4239} {"train_loss": -7.117288112640381, "global_step": 178076, "epoch": 4239} {"train_loss": -7.040899753570557, "global_step": 178077, "epoch": 4239} {"train_loss": -7.074342727661133, "global_step": 178078, "epoch": 4239} {"train_loss": -7.045009828749157, "global_step": 178079, "epoch": 4239, "val_loss": 68781.9375} {"train_loss": -7.0456929206848145, "global_step": 178080, "epoch": 4240} {"train_loss": -7.185196876525879, "global_step": 178081, "epoch": 4240} {"train_loss": -7.017425537109375, "global_step": 178082, "epoch": 4240} {"train_loss": -6.977656364440918, "global_step": 178083, "epoch": 4240} {"train_loss": -7.0662055015563965, "global_step": 178084, "epoch": 4240} {"train_loss": -7.210546493530273, "global_step": 178085, "epoch": 4240} {"train_loss": -6.991379737854004, "global_step": 178086, "epoch": 4240} {"train_loss": -6.958912372589111, "global_step": 178087, "epoch": 4240} {"train_loss": -7.1533002853393555, "global_step": 178088, "epoch": 4240} {"train_loss": -7.107850551605225, "global_step": 178089, "epoch": 4240} {"train_loss": -7.168008327484131, "global_step": 178090, "epoch": 4240} {"train_loss": -6.956937789916992, "global_step": 178091, "epoch": 4240} {"train_loss": -7.0120344161987305, "global_step": 178092, "epoch": 4240} {"train_loss": -7.108004570007324, "global_step": 178093, "epoch": 4240} {"train_loss": -7.031196594238281, "global_step": 178094, "epoch": 4240} {"train_loss": -7.046196937561035, "global_step": 178095, "epoch": 4240} {"train_loss": -7.139453887939453, "global_step": 178096, "epoch": 4240} {"train_loss": -7.105777263641357, "global_step": 178097, "epoch": 4240} {"train_loss": -7.068093299865723, "global_step": 178098, "epoch": 4240} {"train_loss": -7.118100166320801, "global_step": 178099, "epoch": 4240} {"train_loss": -6.964276313781738, "global_step": 178100, "epoch": 4240} {"train_loss": -7.047098636627197, "global_step": 178101, "epoch": 4240} {"train_loss": -7.027678966522217, "global_step": 178102, "epoch": 4240} {"train_loss": -7.10329532623291, "global_step": 178103, "epoch": 4240} {"train_loss": -7.097766876220703, "global_step": 178104, "epoch": 4240} {"train_loss": -7.035325050354004, "global_step": 178105, "epoch": 4240} {"train_loss": -7.090364933013916, "global_step": 178106, "epoch": 4240} {"train_loss": -6.98531436920166, "global_step": 178107, "epoch": 4240} {"train_loss": -7.062664985656738, "global_step": 178108, "epoch": 4240} {"train_loss": -7.023041248321533, "global_step": 178109, "epoch": 4240} {"train_loss": -6.8731231689453125, "global_step": 178110, "epoch": 4240} {"train_loss": -7.075985908508301, "global_step": 178111, "epoch": 4240} {"train_loss": -7.0414347648620605, "global_step": 178112, "epoch": 4240} {"train_loss": -7.078107833862305, "global_step": 178113, "epoch": 4240} {"train_loss": -6.922057151794434, "global_step": 178114, "epoch": 4240} {"train_loss": -7.0069732666015625, "global_step": 178115, "epoch": 4240} {"train_loss": -7.099576950073242, "global_step": 178116, "epoch": 4240} {"train_loss": -7.0335373878479, "global_step": 178117, "epoch": 4240} {"train_loss": -7.04750919342041, "global_step": 178118, "epoch": 4240} {"train_loss": -6.89316987991333, "global_step": 178119, "epoch": 4240} {"train_loss": -7.050163745880127, "global_step": 178120, "epoch": 4240} {"train_loss": -7.049348944709415, "global_step": 178121, "epoch": 4240, "val_loss": 68670.8984375} {"train_loss": -7.055255889892578, "global_step": 178122, "epoch": 4241} {"train_loss": -7.019286155700684, "global_step": 178123, "epoch": 4241} {"train_loss": -7.012914657592773, "global_step": 178124, "epoch": 4241} {"train_loss": -7.010898113250732, "global_step": 178125, "epoch": 4241} {"train_loss": -7.108562469482422, "global_step": 178126, "epoch": 4241} {"train_loss": -7.119219779968262, "global_step": 178127, "epoch": 4241} {"train_loss": -7.021137714385986, "global_step": 178128, "epoch": 4241} {"train_loss": -7.129749774932861, "global_step": 178129, "epoch": 4241} {"train_loss": -7.077178955078125, "global_step": 178130, "epoch": 4241} {"train_loss": -6.908461570739746, "global_step": 178131, "epoch": 4241} {"train_loss": -7.029668807983398, "global_step": 178132, "epoch": 4241} {"train_loss": -6.995270729064941, "global_step": 178133, "epoch": 4241} {"train_loss": -7.017459392547607, "global_step": 178134, "epoch": 4241} {"train_loss": -6.934076309204102, "global_step": 178135, "epoch": 4241} {"train_loss": -7.070204257965088, "global_step": 178136, "epoch": 4241} {"train_loss": -7.0445170402526855, "global_step": 178137, "epoch": 4241} {"train_loss": -6.948836326599121, "global_step": 178138, "epoch": 4241} {"train_loss": -7.0669708251953125, "global_step": 178139, "epoch": 4241} {"train_loss": -6.984701156616211, "global_step": 178140, "epoch": 4241} {"train_loss": -6.9992499351501465, "global_step": 178141, "epoch": 4241} {"train_loss": -7.045527458190918, "global_step": 178142, "epoch": 4241} {"train_loss": -7.092551231384277, "global_step": 178143, "epoch": 4241} {"train_loss": -7.181171894073486, "global_step": 178144, "epoch": 4241} {"train_loss": -7.190138816833496, "global_step": 178145, "epoch": 4241} {"train_loss": -6.978332996368408, "global_step": 178146, "epoch": 4241} {"train_loss": -7.053591251373291, "global_step": 178147, "epoch": 4241} {"train_loss": -6.956323623657227, "global_step": 178148, "epoch": 4241} {"train_loss": -7.204107761383057, "global_step": 178149, "epoch": 4241} {"train_loss": -6.986682415008545, "global_step": 178150, "epoch": 4241} {"train_loss": -7.199304103851318, "global_step": 178151, "epoch": 4241} {"train_loss": -7.061160087585449, "global_step": 178152, "epoch": 4241} {"train_loss": -7.036701679229736, "global_step": 178153, "epoch": 4241} {"train_loss": -7.061379432678223, "global_step": 178154, "epoch": 4241} {"train_loss": -7.046401023864746, "global_step": 178155, "epoch": 4241} {"train_loss": -7.098263263702393, "global_step": 178156, "epoch": 4241} {"train_loss": -7.112262725830078, "global_step": 178157, "epoch": 4241} {"train_loss": -7.063104152679443, "global_step": 178158, "epoch": 4241} {"train_loss": -7.1466803550720215, "global_step": 178159, "epoch": 4241} {"train_loss": -7.056687831878662, "global_step": 178160, "epoch": 4241} {"train_loss": -7.160724639892578, "global_step": 178161, "epoch": 4241} {"train_loss": -7.129533290863037, "global_step": 178162, "epoch": 4241} {"train_loss": -7.05477465902056, "global_step": 178163, "epoch": 4241, "val_loss": 68845.4140625} {"train_loss": -7.15184211730957, "global_step": 178164, "epoch": 4242} {"train_loss": -7.107817649841309, "global_step": 178165, "epoch": 4242} {"train_loss": -7.007049083709717, "global_step": 178166, "epoch": 4242} {"train_loss": -7.008815765380859, "global_step": 178167, "epoch": 4242} {"train_loss": -7.068015098571777, "global_step": 178168, "epoch": 4242} {"train_loss": -7.085953235626221, "global_step": 178169, "epoch": 4242} {"train_loss": -7.006264686584473, "global_step": 178170, "epoch": 4242} {"train_loss": -7.059196949005127, "global_step": 178171, "epoch": 4242} {"train_loss": -7.083259105682373, "global_step": 178172, "epoch": 4242} {"train_loss": -7.1410040855407715, "global_step": 178173, "epoch": 4242} {"train_loss": -7.033634662628174, "global_step": 178174, "epoch": 4242} {"train_loss": -7.124791145324707, "global_step": 178175, "epoch": 4242} {"train_loss": -7.165635108947754, "global_step": 178176, "epoch": 4242} {"train_loss": -7.045721054077148, "global_step": 178177, "epoch": 4242} {"train_loss": -7.058650016784668, "global_step": 178178, "epoch": 4242} {"train_loss": -6.974297046661377, "global_step": 178179, "epoch": 4242} {"train_loss": -6.850870132446289, "global_step": 178180, "epoch": 4242} {"train_loss": -7.130763530731201, "global_step": 178181, "epoch": 4242} {"train_loss": -7.044719696044922, "global_step": 178182, "epoch": 4242} {"train_loss": -6.986767768859863, "global_step": 178183, "epoch": 4242} {"train_loss": -7.123628616333008, "global_step": 178184, "epoch": 4242} {"train_loss": -7.014249801635742, "global_step": 178185, "epoch": 4242} {"train_loss": -7.06298828125, "global_step": 178186, "epoch": 4242} {"train_loss": -7.091582298278809, "global_step": 178187, "epoch": 4242} {"train_loss": -7.000672340393066, "global_step": 178188, "epoch": 4242} {"train_loss": -7.09738826751709, "global_step": 178189, "epoch": 4242} {"train_loss": -7.035261631011963, "global_step": 178190, "epoch": 4242} {"train_loss": -7.076726913452148, "global_step": 178191, "epoch": 4242} {"train_loss": -7.174149513244629, "global_step": 178192, "epoch": 4242} {"train_loss": -7.186368465423584, "global_step": 178193, "epoch": 4242} {"train_loss": -7.138463973999023, "global_step": 178194, "epoch": 4242} {"train_loss": -7.06208610534668, "global_step": 178195, "epoch": 4242} {"train_loss": -7.104396343231201, "global_step": 178196, "epoch": 4242} {"train_loss": -7.094479560852051, "global_step": 178197, "epoch": 4242} {"train_loss": -7.080999374389648, "global_step": 178198, "epoch": 4242} {"train_loss": -7.103590965270996, "global_step": 178199, "epoch": 4242} {"train_loss": -7.057284832000732, "global_step": 178200, "epoch": 4242} {"train_loss": -7.067108154296875, "global_step": 178201, "epoch": 4242} {"train_loss": -7.11381721496582, "global_step": 178202, "epoch": 4242} {"train_loss": -7.058767318725586, "global_step": 178203, "epoch": 4242} {"train_loss": -7.077116012573242, "global_step": 178204, "epoch": 4242} {"train_loss": -7.072947388603573, "global_step": 178205, "epoch": 4242, "val_loss": 68490.8046875} {"train_loss": -7.104382514953613, "global_step": 178206, "epoch": 4243} {"train_loss": -7.099338531494141, "global_step": 178207, "epoch": 4243} {"train_loss": -7.122394561767578, "global_step": 178208, "epoch": 4243} {"train_loss": -7.057080268859863, "global_step": 178209, "epoch": 4243} {"train_loss": -7.024783134460449, "global_step": 178210, "epoch": 4243} {"train_loss": -7.098736763000488, "global_step": 178211, "epoch": 4243} {"train_loss": -6.936154365539551, "global_step": 178212, "epoch": 4243} {"train_loss": -6.967660903930664, "global_step": 178213, "epoch": 4243} {"train_loss": -7.052315711975098, "global_step": 178214, "epoch": 4243} {"train_loss": -7.041945457458496, "global_step": 178215, "epoch": 4243} {"train_loss": -7.076176643371582, "global_step": 178216, "epoch": 4243} {"train_loss": -7.078874588012695, "global_step": 178217, "epoch": 4243} {"train_loss": -7.068986892700195, "global_step": 178218, "epoch": 4243} {"train_loss": -7.090693950653076, "global_step": 178219, "epoch": 4243} {"train_loss": -7.110580921173096, "global_step": 178220, "epoch": 4243} {"train_loss": -7.107392311096191, "global_step": 178221, "epoch": 4243} {"train_loss": -6.963602066040039, "global_step": 178222, "epoch": 4243} {"train_loss": -7.085053443908691, "global_step": 178223, "epoch": 4243} {"train_loss": -6.9961748123168945, "global_step": 178224, "epoch": 4243} {"train_loss": -7.107359886169434, "global_step": 178225, "epoch": 4243} {"train_loss": -7.043619155883789, "global_step": 178226, "epoch": 4243} {"train_loss": -7.102794647216797, "global_step": 178227, "epoch": 4243} {"train_loss": -6.957714080810547, "global_step": 178228, "epoch": 4243} {"train_loss": -7.027413845062256, "global_step": 178229, "epoch": 4243} {"train_loss": -7.130562782287598, "global_step": 178230, "epoch": 4243} {"train_loss": -7.095284938812256, "global_step": 178231, "epoch": 4243} {"train_loss": -7.141478538513184, "global_step": 178232, "epoch": 4243} {"train_loss": -7.179502010345459, "global_step": 178233, "epoch": 4243} {"train_loss": -7.065010070800781, "global_step": 178234, "epoch": 4243} {"train_loss": -6.994593143463135, "global_step": 178235, "epoch": 4243} {"train_loss": -6.937653541564941, "global_step": 178236, "epoch": 4243} {"train_loss": -7.060784339904785, "global_step": 178237, "epoch": 4243} {"train_loss": -7.058207988739014, "global_step": 178238, "epoch": 4243} {"train_loss": -7.050336837768555, "global_step": 178239, "epoch": 4243} {"train_loss": -7.046409606933594, "global_step": 178240, "epoch": 4243} {"train_loss": -7.018206596374512, "global_step": 178241, "epoch": 4243} {"train_loss": -6.895454406738281, "global_step": 178242, "epoch": 4243} {"train_loss": -7.129199028015137, "global_step": 178243, "epoch": 4243} {"train_loss": -7.055182456970215, "global_step": 178244, "epoch": 4243} {"train_loss": -6.864501953125, "global_step": 178245, "epoch": 4243} {"train_loss": -7.045607089996338, "global_step": 178246, "epoch": 4243} {"train_loss": -7.051035892395746, "global_step": 178247, "epoch": 4243, "val_loss": 68721.4453125} {"train_loss": -7.049044609069824, "global_step": 178248, "epoch": 4244} {"train_loss": -7.196535110473633, "global_step": 178249, "epoch": 4244} {"train_loss": -6.960249900817871, "global_step": 178250, "epoch": 4244} {"train_loss": -7.028194427490234, "global_step": 178251, "epoch": 4244} {"train_loss": -7.075709342956543, "global_step": 178252, "epoch": 4244} {"train_loss": -6.940916538238525, "global_step": 178253, "epoch": 4244} {"train_loss": -6.969977855682373, "global_step": 178254, "epoch": 4244} {"train_loss": -7.0275163650512695, "global_step": 178255, "epoch": 4244} {"train_loss": -6.944552898406982, "global_step": 178256, "epoch": 4244} {"train_loss": -6.91705846786499, "global_step": 178257, "epoch": 4244} {"train_loss": -7.033205986022949, "global_step": 178258, "epoch": 4244} {"train_loss": -7.058905601501465, "global_step": 178259, "epoch": 4244} {"train_loss": -6.8973283767700195, "global_step": 178260, "epoch": 4244} {"train_loss": -7.051006317138672, "global_step": 178261, "epoch": 4244} {"train_loss": -6.965027809143066, "global_step": 178262, "epoch": 4244} {"train_loss": -7.044524192810059, "global_step": 178263, "epoch": 4244} {"train_loss": -7.015325546264648, "global_step": 178264, "epoch": 4244} {"train_loss": -7.110208988189697, "global_step": 178265, "epoch": 4244} {"train_loss": -7.03040885925293, "global_step": 178266, "epoch": 4244} {"train_loss": -7.051468372344971, "global_step": 178267, "epoch": 4244} {"train_loss": -7.004610061645508, "global_step": 178268, "epoch": 4244} {"train_loss": -7.020866394042969, "global_step": 178269, "epoch": 4244} {"train_loss": -6.993927478790283, "global_step": 178270, "epoch": 4244} {"train_loss": -7.212808609008789, "global_step": 178271, "epoch": 4244} {"train_loss": -7.127861976623535, "global_step": 178272, "epoch": 4244} {"train_loss": -7.108304500579834, "global_step": 178273, "epoch": 4244} {"train_loss": -7.10884952545166, "global_step": 178274, "epoch": 4244} {"train_loss": -7.106666564941406, "global_step": 178275, "epoch": 4244} {"train_loss": -7.108659744262695, "global_step": 178276, "epoch": 4244} {"train_loss": -7.098088264465332, "global_step": 178277, "epoch": 4244} {"train_loss": -7.102495193481445, "global_step": 178278, "epoch": 4244} {"train_loss": -7.100978851318359, "global_step": 178279, "epoch": 4244} {"train_loss": -7.167730331420898, "global_step": 178280, "epoch": 4244} {"train_loss": -7.034425735473633, "global_step": 178281, "epoch": 4244} {"train_loss": -7.163297653198242, "global_step": 178282, "epoch": 4244} {"train_loss": -6.919615745544434, "global_step": 178283, "epoch": 4244} {"train_loss": -7.14749813079834, "global_step": 178284, "epoch": 4244} {"train_loss": -7.00544548034668, "global_step": 178285, "epoch": 4244} {"train_loss": -7.0053205490112305, "global_step": 178286, "epoch": 4244} {"train_loss": -7.215826511383057, "global_step": 178287, "epoch": 4244} {"train_loss": -7.040589332580566, "global_step": 178288, "epoch": 4244} {"train_loss": -7.05132474218096, "global_step": 178289, "epoch": 4244, "val_loss": 68488.8125} {"train_loss": -6.998132705688477, "global_step": 178290, "epoch": 4245} {"train_loss": -6.898268699645996, "global_step": 178291, "epoch": 4245} {"train_loss": -6.956681251525879, "global_step": 178292, "epoch": 4245} {"train_loss": -6.872028350830078, "global_step": 178293, "epoch": 4245} {"train_loss": -6.9942240715026855, "global_step": 178294, "epoch": 4245} {"train_loss": -6.9685893058776855, "global_step": 178295, "epoch": 4245} {"train_loss": -7.025407791137695, "global_step": 178296, "epoch": 4245} {"train_loss": -7.119648456573486, "global_step": 178297, "epoch": 4245} {"train_loss": -7.025913715362549, "global_step": 178298, "epoch": 4245} {"train_loss": -7.171205520629883, "global_step": 178299, "epoch": 4245} {"train_loss": -6.928528785705566, "global_step": 178300, "epoch": 4245} {"train_loss": -7.087380409240723, "global_step": 178301, "epoch": 4245} {"train_loss": -7.093822002410889, "global_step": 178302, "epoch": 4245} {"train_loss": -7.11903190612793, "global_step": 178303, "epoch": 4245} {"train_loss": -7.067990779876709, "global_step": 178304, "epoch": 4245} {"train_loss": -7.015143394470215, "global_step": 178305, "epoch": 4245} {"train_loss": -7.0126872062683105, "global_step": 178306, "epoch": 4245} {"train_loss": -7.1128644943237305, "global_step": 178307, "epoch": 4245} {"train_loss": -7.080962657928467, "global_step": 178308, "epoch": 4245} {"train_loss": -7.076946258544922, "global_step": 178309, "epoch": 4245} {"train_loss": -6.958423614501953, "global_step": 178310, "epoch": 4245} {"train_loss": -7.006398677825928, "global_step": 178311, "epoch": 4245} {"train_loss": -6.986781597137451, "global_step": 178312, "epoch": 4245} {"train_loss": -6.939952850341797, "global_step": 178313, "epoch": 4245} {"train_loss": -6.996283531188965, "global_step": 178314, "epoch": 4245} {"train_loss": -6.991724014282227, "global_step": 178315, "epoch": 4245} {"train_loss": -7.047241687774658, "global_step": 178316, "epoch": 4245} {"train_loss": -7.05349063873291, "global_step": 178317, "epoch": 4245} {"train_loss": -6.911396026611328, "global_step": 178318, "epoch": 4245} {"train_loss": -6.929775238037109, "global_step": 178319, "epoch": 4245} {"train_loss": -6.9422760009765625, "global_step": 178320, "epoch": 4245} {"train_loss": -6.906269073486328, "global_step": 178321, "epoch": 4245} {"train_loss": -7.052676200866699, "global_step": 178322, "epoch": 4245} {"train_loss": -6.995796203613281, "global_step": 178323, "epoch": 4245} {"train_loss": -7.067707061767578, "global_step": 178324, "epoch": 4245} {"train_loss": -7.044589042663574, "global_step": 178325, "epoch": 4245} {"train_loss": -6.8829755783081055, "global_step": 178326, "epoch": 4245} {"train_loss": -6.966324806213379, "global_step": 178327, "epoch": 4245} {"train_loss": -6.978963375091553, "global_step": 178328, "epoch": 4245} {"train_loss": -6.829482078552246, "global_step": 178329, "epoch": 4245} {"train_loss": -7.143779277801514, "global_step": 178330, "epoch": 4245} {"train_loss": -7.0052143051510765, "global_step": 178331, "epoch": 4245, "val_loss": 68643.7734375} {"train_loss": -7.044095993041992, "global_step": 178332, "epoch": 4246} {"train_loss": -7.149288654327393, "global_step": 178333, "epoch": 4246} {"train_loss": -6.9249467849731445, "global_step": 178334, "epoch": 4246} {"train_loss": -7.062262535095215, "global_step": 178335, "epoch": 4246} {"train_loss": -7.04337739944458, "global_step": 178336, "epoch": 4246} {"train_loss": -7.060115337371826, "global_step": 178337, "epoch": 4246} {"train_loss": -7.091083526611328, "global_step": 178338, "epoch": 4246} {"train_loss": -7.032533645629883, "global_step": 178339, "epoch": 4246} {"train_loss": -7.045241355895996, "global_step": 178340, "epoch": 4246} {"train_loss": -7.082983016967773, "global_step": 178341, "epoch": 4246} {"train_loss": -7.027459144592285, "global_step": 178342, "epoch": 4246} {"train_loss": -7.034735202789307, "global_step": 178343, "epoch": 4246} {"train_loss": -7.060035705566406, "global_step": 178344, "epoch": 4246} {"train_loss": -7.025280952453613, "global_step": 178345, "epoch": 4246} {"train_loss": -7.136209487915039, "global_step": 178346, "epoch": 4246} {"train_loss": -7.15802001953125, "global_step": 178347, "epoch": 4246} {"train_loss": -7.165593147277832, "global_step": 178348, "epoch": 4246} {"train_loss": -7.131477355957031, "global_step": 178349, "epoch": 4246} {"train_loss": -7.115939617156982, "global_step": 178350, "epoch": 4246} {"train_loss": -7.016975402832031, "global_step": 178351, "epoch": 4246} {"train_loss": -7.156458854675293, "global_step": 178352, "epoch": 4246} {"train_loss": -7.073907852172852, "global_step": 178353, "epoch": 4246} {"train_loss": -6.987206935882568, "global_step": 178354, "epoch": 4246} {"train_loss": -7.092654705047607, "global_step": 178355, "epoch": 4246} {"train_loss": -7.192654132843018, "global_step": 178356, "epoch": 4246} {"train_loss": -7.136598587036133, "global_step": 178357, "epoch": 4246} {"train_loss": -7.10958194732666, "global_step": 178358, "epoch": 4246} {"train_loss": -7.127915859222412, "global_step": 178359, "epoch": 4246} {"train_loss": -6.947573661804199, "global_step": 178360, "epoch": 4246} {"train_loss": -7.118720054626465, "global_step": 178361, "epoch": 4246} {"train_loss": -7.069443702697754, "global_step": 178362, "epoch": 4246} {"train_loss": -7.098733901977539, "global_step": 178363, "epoch": 4246} {"train_loss": -7.1062703132629395, "global_step": 178364, "epoch": 4246} {"train_loss": -7.16438627243042, "global_step": 178365, "epoch": 4246} {"train_loss": -7.0665764808654785, "global_step": 178366, "epoch": 4246} {"train_loss": -7.057015419006348, "global_step": 178367, "epoch": 4246} {"train_loss": -7.087000846862793, "global_step": 178368, "epoch": 4246} {"train_loss": -7.082005500793457, "global_step": 178369, "epoch": 4246} {"train_loss": -7.0033278465271, "global_step": 178370, "epoch": 4246} {"train_loss": -7.128558158874512, "global_step": 178371, "epoch": 4246} {"train_loss": -7.050151824951172, "global_step": 178372, "epoch": 4246} {"train_loss": -7.0816517898014615, "global_step": 178373, "epoch": 4246, "val_loss": 68877.8984375} {"train_loss": -7.050743103027344, "global_step": 178374, "epoch": 4247} {"train_loss": -7.068373680114746, "global_step": 178375, "epoch": 4247} {"train_loss": -7.100830078125, "global_step": 178376, "epoch": 4247} {"train_loss": -7.143927574157715, "global_step": 178377, "epoch": 4247} {"train_loss": -6.951342582702637, "global_step": 178378, "epoch": 4247} {"train_loss": -7.04511022567749, "global_step": 178379, "epoch": 4247} {"train_loss": -7.076957702636719, "global_step": 178380, "epoch": 4247} {"train_loss": -6.940839767456055, "global_step": 178381, "epoch": 4247} {"train_loss": -7.140704154968262, "global_step": 178382, "epoch": 4247} {"train_loss": -7.023192882537842, "global_step": 178383, "epoch": 4247} {"train_loss": -7.051154136657715, "global_step": 178384, "epoch": 4247} {"train_loss": -6.998300552368164, "global_step": 178385, "epoch": 4247} {"train_loss": -7.094141006469727, "global_step": 178386, "epoch": 4247} {"train_loss": -7.023666858673096, "global_step": 178387, "epoch": 4247} {"train_loss": -7.073556423187256, "global_step": 178388, "epoch": 4247} {"train_loss": -7.15591287612915, "global_step": 178389, "epoch": 4247} {"train_loss": -7.065541744232178, "global_step": 178390, "epoch": 4247} {"train_loss": -7.0793352127075195, "global_step": 178391, "epoch": 4247} {"train_loss": -7.077322006225586, "global_step": 178392, "epoch": 4247} {"train_loss": -7.018471717834473, "global_step": 178393, "epoch": 4247} {"train_loss": -7.056623458862305, "global_step": 178394, "epoch": 4247} {"train_loss": -7.100134372711182, "global_step": 178395, "epoch": 4247} {"train_loss": -6.951700210571289, "global_step": 178396, "epoch": 4247} {"train_loss": -7.0265607833862305, "global_step": 178397, "epoch": 4247} {"train_loss": -7.047853469848633, "global_step": 178398, "epoch": 4247} {"train_loss": -6.95395565032959, "global_step": 178399, "epoch": 4247} {"train_loss": -7.090750694274902, "global_step": 178400, "epoch": 4247} {"train_loss": -7.204052925109863, "global_step": 178401, "epoch": 4247} {"train_loss": -6.914936542510986, "global_step": 178402, "epoch": 4247} {"train_loss": -7.164455413818359, "global_step": 178403, "epoch": 4247} {"train_loss": -7.168726444244385, "global_step": 178404, "epoch": 4247} {"train_loss": -6.870168209075928, "global_step": 178405, "epoch": 4247} {"train_loss": -7.063379287719727, "global_step": 178406, "epoch": 4247} {"train_loss": -7.026830196380615, "global_step": 178407, "epoch": 4247} {"train_loss": -7.1859540939331055, "global_step": 178408, "epoch": 4247} {"train_loss": -6.970280170440674, "global_step": 178409, "epoch": 4247} {"train_loss": -7.0360212326049805, "global_step": 178410, "epoch": 4247} {"train_loss": -7.056429862976074, "global_step": 178411, "epoch": 4247} {"train_loss": -7.048361301422119, "global_step": 178412, "epoch": 4247} {"train_loss": -7.127805709838867, "global_step": 178413, "epoch": 4247} {"train_loss": -6.958067893981934, "global_step": 178414, "epoch": 4247} {"train_loss": -7.051890668414888, "global_step": 178415, "epoch": 4247, "val_loss": 68660.5625} {"train_loss": -7.175586700439453, "global_step": 178416, "epoch": 4248} {"train_loss": -6.993525505065918, "global_step": 178417, "epoch": 4248} {"train_loss": -7.059788703918457, "global_step": 178418, "epoch": 4248} {"train_loss": -7.0999436378479, "global_step": 178419, "epoch": 4248} {"train_loss": -7.044367790222168, "global_step": 178420, "epoch": 4248} {"train_loss": -7.093941688537598, "global_step": 178421, "epoch": 4248} {"train_loss": -6.993030548095703, "global_step": 178422, "epoch": 4248} {"train_loss": -7.056209564208984, "global_step": 178423, "epoch": 4248} {"train_loss": -7.019384384155273, "global_step": 178424, "epoch": 4248} {"train_loss": -6.956386089324951, "global_step": 178425, "epoch": 4248} {"train_loss": -6.9257049560546875, "global_step": 178426, "epoch": 4248} {"train_loss": -6.9411516189575195, "global_step": 178427, "epoch": 4248} {"train_loss": -6.94454288482666, "global_step": 178428, "epoch": 4248} {"train_loss": -7.057000637054443, "global_step": 178429, "epoch": 4248} {"train_loss": -6.974717140197754, "global_step": 178430, "epoch": 4248} {"train_loss": -6.968775749206543, "global_step": 178431, "epoch": 4248} {"train_loss": -6.7668681144714355, "global_step": 178432, "epoch": 4248} {"train_loss": -6.87552547454834, "global_step": 178433, "epoch": 4248} {"train_loss": -6.986226558685303, "global_step": 178434, "epoch": 4248} {"train_loss": -6.856246471405029, "global_step": 178435, "epoch": 4248} {"train_loss": -7.043277740478516, "global_step": 178436, "epoch": 4248} {"train_loss": -6.859450817108154, "global_step": 178437, "epoch": 4248} {"train_loss": -6.902113914489746, "global_step": 178438, "epoch": 4248} {"train_loss": -6.8821258544921875, "global_step": 178439, "epoch": 4248} {"train_loss": -7.036118507385254, "global_step": 178440, "epoch": 4248} {"train_loss": -6.836273670196533, "global_step": 178441, "epoch": 4248} {"train_loss": -7.007757186889648, "global_step": 178442, "epoch": 4248} {"train_loss": -6.980161666870117, "global_step": 178443, "epoch": 4248} {"train_loss": -7.038744926452637, "global_step": 178444, "epoch": 4248} {"train_loss": -6.968179702758789, "global_step": 178445, "epoch": 4248} {"train_loss": -6.979176998138428, "global_step": 178446, "epoch": 4248} {"train_loss": -6.942837715148926, "global_step": 178447, "epoch": 4248} {"train_loss": -7.132702827453613, "global_step": 178448, "epoch": 4248} {"train_loss": -7.043920993804932, "global_step": 178449, "epoch": 4248} {"train_loss": -6.912685394287109, "global_step": 178450, "epoch": 4248} {"train_loss": -7.069125175476074, "global_step": 178451, "epoch": 4248} {"train_loss": -7.060982704162598, "global_step": 178452, "epoch": 4248} {"train_loss": -7.072312355041504, "global_step": 178453, "epoch": 4248} {"train_loss": -6.95558500289917, "global_step": 178454, "epoch": 4248} {"train_loss": -7.049187660217285, "global_step": 178455, "epoch": 4248} {"train_loss": -7.035170555114746, "global_step": 178456, "epoch": 4248} {"train_loss": -6.99199238277617, "global_step": 178457, "epoch": 4248, "val_loss": 68604.0625} {"train_loss": -7.117867946624756, "global_step": 178458, "epoch": 4249} {"train_loss": -7.119509696960449, "global_step": 178459, "epoch": 4249} {"train_loss": -7.153390407562256, "global_step": 178460, "epoch": 4249} {"train_loss": -7.043096542358398, "global_step": 178461, "epoch": 4249} {"train_loss": -7.0363359451293945, "global_step": 178462, "epoch": 4249} {"train_loss": -7.025426864624023, "global_step": 178463, "epoch": 4249} {"train_loss": -7.035275459289551, "global_step": 178464, "epoch": 4249} {"train_loss": -7.137076377868652, "global_step": 178465, "epoch": 4249} {"train_loss": -7.18454647064209, "global_step": 178466, "epoch": 4249} {"train_loss": -7.063326358795166, "global_step": 178467, "epoch": 4249} {"train_loss": -7.092783451080322, "global_step": 178468, "epoch": 4249} {"train_loss": -7.054065704345703, "global_step": 178469, "epoch": 4249} {"train_loss": -7.110281944274902, "global_step": 178470, "epoch": 4249} {"train_loss": -7.040647983551025, "global_step": 178471, "epoch": 4249} {"train_loss": -7.0905609130859375, "global_step": 178472, "epoch": 4249} {"train_loss": -7.072063446044922, "global_step": 178473, "epoch": 4249} {"train_loss": -7.081723213195801, "global_step": 178474, "epoch": 4249} {"train_loss": -7.121054172515869, "global_step": 178475, "epoch": 4249} {"train_loss": -6.999912261962891, "global_step": 178476, "epoch": 4249} {"train_loss": -7.051004409790039, "global_step": 178477, "epoch": 4249} {"train_loss": -7.037245750427246, "global_step": 178478, "epoch": 4249} {"train_loss": -7.1449127197265625, "global_step": 178479, "epoch": 4249} {"train_loss": -7.1138505935668945, "global_step": 178480, "epoch": 4249} {"train_loss": -7.03826379776001, "global_step": 178481, "epoch": 4249} {"train_loss": -7.01237154006958, "global_step": 178482, "epoch": 4249} {"train_loss": -7.103579998016357, "global_step": 178483, "epoch": 4249} {"train_loss": -7.038128852844238, "global_step": 178484, "epoch": 4249} {"train_loss": -7.14091157913208, "global_step": 178485, "epoch": 4249} {"train_loss": -6.971250534057617, "global_step": 178486, "epoch": 4249} {"train_loss": -7.114712238311768, "global_step": 178487, "epoch": 4249} {"train_loss": -7.1045122146606445, "global_step": 178488, "epoch": 4249} {"train_loss": -7.13365364074707, "global_step": 178489, "epoch": 4249} {"train_loss": -7.046027660369873, "global_step": 178490, "epoch": 4249} {"train_loss": -7.120396614074707, "global_step": 178491, "epoch": 4249} {"train_loss": -7.098418712615967, "global_step": 178492, "epoch": 4249} {"train_loss": -7.0654754638671875, "global_step": 178493, "epoch": 4249} {"train_loss": -7.100872039794922, "global_step": 178494, "epoch": 4249} {"train_loss": -7.091998100280762, "global_step": 178495, "epoch": 4249} {"train_loss": -7.118587970733643, "global_step": 178496, "epoch": 4249} {"train_loss": -7.15785026550293, "global_step": 178497, "epoch": 4249} {"train_loss": -7.0633745193481445, "global_step": 178498, "epoch": 4249} {"train_loss": -7.083685012090774, "global_step": 178499, "epoch": 4249, "val_loss": 68580.421875} {"train_loss": -7.033116340637207, "global_step": 178500, "epoch": 4250} {"train_loss": -7.028594017028809, "global_step": 178501, "epoch": 4250} {"train_loss": -7.069714069366455, "global_step": 178502, "epoch": 4250} {"train_loss": -7.128901481628418, "global_step": 178503, "epoch": 4250} {"train_loss": -7.02395486831665, "global_step": 178504, "epoch": 4250} {"train_loss": -7.121051788330078, "global_step": 178505, "epoch": 4250} {"train_loss": -7.049882888793945, "global_step": 178506, "epoch": 4250} {"train_loss": -6.999875068664551, "global_step": 178507, "epoch": 4250} {"train_loss": -7.099605560302734, "global_step": 178508, "epoch": 4250} {"train_loss": -6.950776100158691, "global_step": 178509, "epoch": 4250} {"train_loss": -6.9952073097229, "global_step": 178510, "epoch": 4250} {"train_loss": -7.071796417236328, "global_step": 178511, "epoch": 4250} {"train_loss": -7.085732460021973, "global_step": 178512, "epoch": 4250} {"train_loss": -7.0570244789123535, "global_step": 178513, "epoch": 4250} {"train_loss": -6.944748878479004, "global_step": 178514, "epoch": 4250} {"train_loss": -7.091495513916016, "global_step": 178515, "epoch": 4250} {"train_loss": -7.0320210456848145, "global_step": 178516, "epoch": 4250} {"train_loss": -6.985261917114258, "global_step": 178517, "epoch": 4250} {"train_loss": -6.984013080596924, "global_step": 178518, "epoch": 4250} {"train_loss": -7.113533973693848, "global_step": 178519, "epoch": 4250} {"train_loss": -6.9319844245910645, "global_step": 178520, "epoch": 4250} {"train_loss": -6.977297306060791, "global_step": 178521, "epoch": 4250} {"train_loss": -7.074896812438965, "global_step": 178522, "epoch": 4250} {"train_loss": -7.014045715332031, "global_step": 178523, "epoch": 4250} {"train_loss": -6.8843607902526855, "global_step": 178524, "epoch": 4250} {"train_loss": -6.991094589233398, "global_step": 178525, "epoch": 4250} {"train_loss": -6.89049768447876, "global_step": 178526, "epoch": 4250} {"train_loss": -6.973844528198242, "global_step": 178527, "epoch": 4250} {"train_loss": -7.008271217346191, "global_step": 178528, "epoch": 4250} {"train_loss": -7.042957305908203, "global_step": 178529, "epoch": 4250} {"train_loss": -6.950887680053711, "global_step": 178530, "epoch": 4250} {"train_loss": -7.097867965698242, "global_step": 178531, "epoch": 4250} {"train_loss": -7.10736083984375, "global_step": 178532, "epoch": 4250} {"train_loss": -7.001009941101074, "global_step": 178533, "epoch": 4250} {"train_loss": -7.029084205627441, "global_step": 178534, "epoch": 4250} {"train_loss": -7.069234371185303, "global_step": 178535, "epoch": 4250} {"train_loss": -7.000800609588623, "global_step": 178536, "epoch": 4250} {"train_loss": -7.0380706787109375, "global_step": 178537, "epoch": 4250} {"train_loss": -7.103084564208984, "global_step": 178538, "epoch": 4250} {"train_loss": -7.049186706542969, "global_step": 178539, "epoch": 4250} {"train_loss": -6.990067481994629, "global_step": 178540, "epoch": 4250} {"train_loss": -7.028453838257563, "global_step": 178541, "epoch": 4250, "train/sim_max_reward_0": 0.2525291619138071, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.9992329000513279, "train/sim_max_reward_3": 0.13692890584258594, "train/sim_max_reward_4": 0.9596922370238619, "train/sim_max_reward_5": 0.19566450822028209, "test/sim_max_reward_4400000": 0.21462163306982748, "test/sim_max_reward_4400001": 0.20800873379157697, "test/sim_max_reward_4400002": 0.9341563214283227, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.2850629441588417, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30908660691948664, "test/sim_max_reward_4400009": 0.8934903852373617, "test/sim_max_reward_4400010": 0.1918401800825645, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.924691468234026, "test/sim_max_reward_4400013": 0.4028326434026052, "test/sim_max_reward_4400014": 0.5771321923202419, "test/sim_max_reward_4400015": 0.9828045361405925, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.6674822829429953, "test/sim_max_reward_4400018": 0.5050303653607802, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.1183288790007132, "test/sim_max_reward_4400023": 0.9695764725043393, "test/sim_max_reward_4400024": 0.9452729644764876, "test/sim_max_reward_4400025": 0.2692211521610712, "test/sim_max_reward_4400026": 0.6783605605624949, "test/sim_max_reward_4400027": 0.026917207954135287, "test/sim_max_reward_4400028": 0.9815970438316713, "test/sim_max_reward_4400029": 0.9747726118129807, "test/sim_max_reward_4400030": 0.9327941736508006, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9370893984305878, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.4707961746102434, "test/sim_max_reward_4400036": 0.557017444875265, "test/sim_max_reward_4400037": 0.8544827468591294, "test/sim_max_reward_4400038": 0.9433453469844824, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9624497263737963, "test/sim_max_reward_4400044": 0.9913232499861279, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8411198824067309, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.9762184867094622, "train/mean_score": 0.5906746188419775, "test/mean_score": 0.6214623759362128, "val_loss": 68569.4453125} {"train_loss": -7.072235107421875, "global_step": 178542, "epoch": 4251} {"train_loss": -7.190308094024658, "global_step": 178543, "epoch": 4251} {"train_loss": -7.132842063903809, "global_step": 178544, "epoch": 4251} {"train_loss": -7.06066370010376, "global_step": 178545, "epoch": 4251} {"train_loss": -7.121310234069824, "global_step": 178546, "epoch": 4251} {"train_loss": -7.002969264984131, "global_step": 178547, "epoch": 4251} {"train_loss": -7.067375659942627, "global_step": 178548, "epoch": 4251} {"train_loss": -7.021067142486572, "global_step": 178549, "epoch": 4251} {"train_loss": -7.137136459350586, "global_step": 178550, "epoch": 4251} {"train_loss": -7.035028457641602, "global_step": 178551, "epoch": 4251} {"train_loss": -7.022443771362305, "global_step": 178552, "epoch": 4251} {"train_loss": -7.13359260559082, "global_step": 178553, "epoch": 4251} {"train_loss": -7.08256721496582, "global_step": 178554, "epoch": 4251} {"train_loss": -7.099950790405273, "global_step": 178555, "epoch": 4251} {"train_loss": -7.002266883850098, "global_step": 178556, "epoch": 4251} {"train_loss": -7.173887729644775, "global_step": 178557, "epoch": 4251} {"train_loss": -7.021434307098389, "global_step": 178558, "epoch": 4251} {"train_loss": -6.945218086242676, "global_step": 178559, "epoch": 4251} {"train_loss": -6.889062881469727, "global_step": 178560, "epoch": 4251} {"train_loss": -6.9533772468566895, "global_step": 178561, "epoch": 4251} {"train_loss": -7.152614593505859, "global_step": 178562, "epoch": 4251} {"train_loss": -7.025793075561523, "global_step": 178563, "epoch": 4251} {"train_loss": -7.076531410217285, "global_step": 178564, "epoch": 4251} {"train_loss": -7.02015495300293, "global_step": 178565, "epoch": 4251} {"train_loss": -7.097577095031738, "global_step": 178566, "epoch": 4251} {"train_loss": -7.026009559631348, "global_step": 178567, "epoch": 4251} {"train_loss": -6.984029293060303, "global_step": 178568, "epoch": 4251} {"train_loss": -7.070995330810547, "global_step": 178569, "epoch": 4251} {"train_loss": -6.977065563201904, "global_step": 178570, "epoch": 4251} {"train_loss": -7.073940277099609, "global_step": 178571, "epoch": 4251} {"train_loss": -7.0856757164001465, "global_step": 178572, "epoch": 4251} {"train_loss": -7.030074596405029, "global_step": 178573, "epoch": 4251} {"train_loss": -7.0921220779418945, "global_step": 178574, "epoch": 4251} {"train_loss": -7.024095058441162, "global_step": 178575, "epoch": 4251} {"train_loss": -7.059479236602783, "global_step": 178576, "epoch": 4251} {"train_loss": -7.093358993530273, "global_step": 178577, "epoch": 4251} {"train_loss": -7.053956985473633, "global_step": 178578, "epoch": 4251} {"train_loss": -7.056614875793457, "global_step": 178579, "epoch": 4251} {"train_loss": -6.971195220947266, "global_step": 178580, "epoch": 4251} {"train_loss": -7.036862373352051, "global_step": 178581, "epoch": 4251} {"train_loss": -7.0413103103637695, "global_step": 178582, "epoch": 4251} {"train_loss": -7.053655919574556, "global_step": 178583, "epoch": 4251, "val_loss": 68782.5078125} {"train_loss": -6.995140075683594, "global_step": 178584, "epoch": 4252} {"train_loss": -7.069803714752197, "global_step": 178585, "epoch": 4252} {"train_loss": -6.949123859405518, "global_step": 178586, "epoch": 4252} {"train_loss": -7.166571617126465, "global_step": 178587, "epoch": 4252} {"train_loss": -6.967558860778809, "global_step": 178588, "epoch": 4252} {"train_loss": -6.977912902832031, "global_step": 178589, "epoch": 4252} {"train_loss": -7.178701877593994, "global_step": 178590, "epoch": 4252} {"train_loss": -7.010656356811523, "global_step": 178591, "epoch": 4252} {"train_loss": -7.067483901977539, "global_step": 178592, "epoch": 4252} {"train_loss": -7.204671382904053, "global_step": 178593, "epoch": 4252} {"train_loss": -7.120086193084717, "global_step": 178594, "epoch": 4252} {"train_loss": -7.215234756469727, "global_step": 178595, "epoch": 4252} {"train_loss": -7.227148056030273, "global_step": 178596, "epoch": 4252} {"train_loss": -7.069729328155518, "global_step": 178597, "epoch": 4252} {"train_loss": -7.1654558181762695, "global_step": 178598, "epoch": 4252} {"train_loss": -7.101478099822998, "global_step": 178599, "epoch": 4252} {"train_loss": -6.974924564361572, "global_step": 178600, "epoch": 4252} {"train_loss": -7.091419696807861, "global_step": 178601, "epoch": 4252} {"train_loss": -7.067339897155762, "global_step": 178602, "epoch": 4252} {"train_loss": -7.043262481689453, "global_step": 178603, "epoch": 4252} {"train_loss": -7.233725547790527, "global_step": 178604, "epoch": 4252} {"train_loss": -7.079402923583984, "global_step": 178605, "epoch": 4252} {"train_loss": -7.107150554656982, "global_step": 178606, "epoch": 4252} {"train_loss": -7.078815460205078, "global_step": 178607, "epoch": 4252} {"train_loss": -7.055387496948242, "global_step": 178608, "epoch": 4252} {"train_loss": -7.135647773742676, "global_step": 178609, "epoch": 4252} {"train_loss": -7.149363994598389, "global_step": 178610, "epoch": 4252} {"train_loss": -7.055440902709961, "global_step": 178611, "epoch": 4252} {"train_loss": -7.111412048339844, "global_step": 178612, "epoch": 4252} {"train_loss": -7.136053085327148, "global_step": 178613, "epoch": 4252} {"train_loss": -7.035621643066406, "global_step": 178614, "epoch": 4252} {"train_loss": -7.11046028137207, "global_step": 178615, "epoch": 4252} {"train_loss": -6.978577613830566, "global_step": 178616, "epoch": 4252} {"train_loss": -7.106579303741455, "global_step": 178617, "epoch": 4252} {"train_loss": -6.9996113777160645, "global_step": 178618, "epoch": 4252} {"train_loss": -7.091244220733643, "global_step": 178619, "epoch": 4252} {"train_loss": -7.015600204467773, "global_step": 178620, "epoch": 4252} {"train_loss": -7.0260725021362305, "global_step": 178621, "epoch": 4252} {"train_loss": -7.132227897644043, "global_step": 178622, "epoch": 4252} {"train_loss": -6.962536811828613, "global_step": 178623, "epoch": 4252} {"train_loss": -7.005484104156494, "global_step": 178624, "epoch": 4252} {"train_loss": -7.078971567608061, "global_step": 178625, "epoch": 4252, "val_loss": 68847.484375} {"train_loss": -6.898175239562988, "global_step": 178626, "epoch": 4253} {"train_loss": -6.9084625244140625, "global_step": 178627, "epoch": 4253} {"train_loss": -6.91502046585083, "global_step": 178628, "epoch": 4253} {"train_loss": -7.100653648376465, "global_step": 178629, "epoch": 4253} {"train_loss": -6.848389148712158, "global_step": 178630, "epoch": 4253} {"train_loss": -6.886312007904053, "global_step": 178631, "epoch": 4253} {"train_loss": -6.910906791687012, "global_step": 178632, "epoch": 4253} {"train_loss": -6.934313774108887, "global_step": 178633, "epoch": 4253} {"train_loss": -6.935778617858887, "global_step": 178634, "epoch": 4253} {"train_loss": -6.945528984069824, "global_step": 178635, "epoch": 4253} {"train_loss": -6.773393630981445, "global_step": 178636, "epoch": 4253} {"train_loss": -6.973097324371338, "global_step": 178637, "epoch": 4253} {"train_loss": -6.783370018005371, "global_step": 178638, "epoch": 4253} {"train_loss": -7.111084938049316, "global_step": 178639, "epoch": 4253} {"train_loss": -6.847255229949951, "global_step": 178640, "epoch": 4253} {"train_loss": -6.962651252746582, "global_step": 178641, "epoch": 4253} {"train_loss": -6.957200527191162, "global_step": 178642, "epoch": 4253} {"train_loss": -6.861435890197754, "global_step": 178643, "epoch": 4253} {"train_loss": -7.004843711853027, "global_step": 178644, "epoch": 4253} {"train_loss": -7.081876754760742, "global_step": 178645, "epoch": 4253} {"train_loss": -6.917008876800537, "global_step": 178646, "epoch": 4253} {"train_loss": -7.1054158210754395, "global_step": 178647, "epoch": 4253} {"train_loss": -7.012613296508789, "global_step": 178648, "epoch": 4253} {"train_loss": -6.986181259155273, "global_step": 178649, "epoch": 4253} {"train_loss": -7.0786638259887695, "global_step": 178650, "epoch": 4253} {"train_loss": -6.987215995788574, "global_step": 178651, "epoch": 4253} {"train_loss": -7.081720352172852, "global_step": 178652, "epoch": 4253} {"train_loss": -7.005059242248535, "global_step": 178653, "epoch": 4253} {"train_loss": -6.994714736938477, "global_step": 178654, "epoch": 4253} {"train_loss": -7.086702346801758, "global_step": 178655, "epoch": 4253} {"train_loss": -7.059553146362305, "global_step": 178656, "epoch": 4253} {"train_loss": -7.090678691864014, "global_step": 178657, "epoch": 4253} {"train_loss": -7.067729949951172, "global_step": 178658, "epoch": 4253} {"train_loss": -6.994576454162598, "global_step": 178659, "epoch": 4253} {"train_loss": -7.045139312744141, "global_step": 178660, "epoch": 4253} {"train_loss": -7.032052040100098, "global_step": 178661, "epoch": 4253} {"train_loss": -7.065460681915283, "global_step": 178662, "epoch": 4253} {"train_loss": -7.12844181060791, "global_step": 178663, "epoch": 4253} {"train_loss": -7.160701751708984, "global_step": 178664, "epoch": 4253} {"train_loss": -7.215035438537598, "global_step": 178665, "epoch": 4253} {"train_loss": -7.060520172119141, "global_step": 178666, "epoch": 4253} {"train_loss": -6.994521776835124, "global_step": 178667, "epoch": 4253, "val_loss": 68894.4765625} {"train_loss": -6.970132827758789, "global_step": 178668, "epoch": 4254} {"train_loss": -7.0633649826049805, "global_step": 178669, "epoch": 4254} {"train_loss": -7.144322395324707, "global_step": 178670, "epoch": 4254} {"train_loss": -7.022198677062988, "global_step": 178671, "epoch": 4254} {"train_loss": -7.1187005043029785, "global_step": 178672, "epoch": 4254} {"train_loss": -7.094568252563477, "global_step": 178673, "epoch": 4254} {"train_loss": -7.055588722229004, "global_step": 178674, "epoch": 4254} {"train_loss": -7.106846809387207, "global_step": 178675, "epoch": 4254} {"train_loss": -7.059601306915283, "global_step": 178676, "epoch": 4254} {"train_loss": -6.962223052978516, "global_step": 178677, "epoch": 4254} {"train_loss": -7.124184608459473, "global_step": 178678, "epoch": 4254} {"train_loss": -7.075087547302246, "global_step": 178679, "epoch": 4254} {"train_loss": -6.994678974151611, "global_step": 178680, "epoch": 4254} {"train_loss": -7.069126605987549, "global_step": 178681, "epoch": 4254} {"train_loss": -7.117439270019531, "global_step": 178682, "epoch": 4254} {"train_loss": -7.079686164855957, "global_step": 178683, "epoch": 4254} {"train_loss": -7.064108848571777, "global_step": 178684, "epoch": 4254} {"train_loss": -7.065589427947998, "global_step": 178685, "epoch": 4254} {"train_loss": -6.985719680786133, "global_step": 178686, "epoch": 4254} {"train_loss": -7.143227577209473, "global_step": 178687, "epoch": 4254} {"train_loss": -7.201568126678467, "global_step": 178688, "epoch": 4254} {"train_loss": -6.96234655380249, "global_step": 178689, "epoch": 4254} {"train_loss": -7.094738006591797, "global_step": 178690, "epoch": 4254} {"train_loss": -6.993172645568848, "global_step": 178691, "epoch": 4254} {"train_loss": -6.973208427429199, "global_step": 178692, "epoch": 4254} {"train_loss": -7.084772109985352, "global_step": 178693, "epoch": 4254} {"train_loss": -7.099549293518066, "global_step": 178694, "epoch": 4254} {"train_loss": -6.985454559326172, "global_step": 178695, "epoch": 4254} {"train_loss": -7.043886184692383, "global_step": 178696, "epoch": 4254} {"train_loss": -7.141845703125, "global_step": 178697, "epoch": 4254} {"train_loss": -7.112642288208008, "global_step": 178698, "epoch": 4254} {"train_loss": -7.128009796142578, "global_step": 178699, "epoch": 4254} {"train_loss": -7.044969081878662, "global_step": 178700, "epoch": 4254} {"train_loss": -7.080373287200928, "global_step": 178701, "epoch": 4254} {"train_loss": -7.121188163757324, "global_step": 178702, "epoch": 4254} {"train_loss": -6.93306827545166, "global_step": 178703, "epoch": 4254} {"train_loss": -7.0718278884887695, "global_step": 178704, "epoch": 4254} {"train_loss": -7.209440231323242, "global_step": 178705, "epoch": 4254} {"train_loss": -7.072721004486084, "global_step": 178706, "epoch": 4254} {"train_loss": -6.952309608459473, "global_step": 178707, "epoch": 4254} {"train_loss": -7.067623138427734, "global_step": 178708, "epoch": 4254} {"train_loss": -7.063660474050613, "global_step": 178709, "epoch": 4254, "val_loss": 68784.6171875} {"train_loss": -7.0031867027282715, "global_step": 178710, "epoch": 4255} {"train_loss": -7.115589618682861, "global_step": 178711, "epoch": 4255} {"train_loss": -7.085962295532227, "global_step": 178712, "epoch": 4255} {"train_loss": -7.12623929977417, "global_step": 178713, "epoch": 4255} {"train_loss": -7.0080461502075195, "global_step": 178714, "epoch": 4255} {"train_loss": -7.130407810211182, "global_step": 178715, "epoch": 4255} {"train_loss": -7.094871520996094, "global_step": 178716, "epoch": 4255} {"train_loss": -7.150748252868652, "global_step": 178717, "epoch": 4255} {"train_loss": -7.010739326477051, "global_step": 178718, "epoch": 4255} {"train_loss": -7.102494239807129, "global_step": 178719, "epoch": 4255} {"train_loss": -6.982710838317871, "global_step": 178720, "epoch": 4255} {"train_loss": -7.089692115783691, "global_step": 178721, "epoch": 4255} {"train_loss": -7.140127182006836, "global_step": 178722, "epoch": 4255} {"train_loss": -7.039466381072998, "global_step": 178723, "epoch": 4255} {"train_loss": -7.134042739868164, "global_step": 178724, "epoch": 4255} {"train_loss": -7.178084373474121, "global_step": 178725, "epoch": 4255} {"train_loss": -7.062304496765137, "global_step": 178726, "epoch": 4255} {"train_loss": -7.079479217529297, "global_step": 178727, "epoch": 4255} {"train_loss": -7.161904335021973, "global_step": 178728, "epoch": 4255} {"train_loss": -7.139107704162598, "global_step": 178729, "epoch": 4255} {"train_loss": -7.033322334289551, "global_step": 178730, "epoch": 4255} {"train_loss": -6.992563247680664, "global_step": 178731, "epoch": 4255} {"train_loss": -7.104963302612305, "global_step": 178732, "epoch": 4255} {"train_loss": -7.08323860168457, "global_step": 178733, "epoch": 4255} {"train_loss": -7.093740940093994, "global_step": 178734, "epoch": 4255} {"train_loss": -7.0062456130981445, "global_step": 178735, "epoch": 4255} {"train_loss": -7.130122184753418, "global_step": 178736, "epoch": 4255} {"train_loss": -7.128929138183594, "global_step": 178737, "epoch": 4255} {"train_loss": -7.1331024169921875, "global_step": 178738, "epoch": 4255} {"train_loss": -7.031161785125732, "global_step": 178739, "epoch": 4255} {"train_loss": -7.056066036224365, "global_step": 178740, "epoch": 4255} {"train_loss": -6.985871315002441, "global_step": 178741, "epoch": 4255} {"train_loss": -7.102090835571289, "global_step": 178742, "epoch": 4255} {"train_loss": -6.993521213531494, "global_step": 178743, "epoch": 4255} {"train_loss": -7.269256591796875, "global_step": 178744, "epoch": 4255} {"train_loss": -7.114316463470459, "global_step": 178745, "epoch": 4255} {"train_loss": -7.074154853820801, "global_step": 178746, "epoch": 4255} {"train_loss": -7.047260284423828, "global_step": 178747, "epoch": 4255} {"train_loss": -7.067072868347168, "global_step": 178748, "epoch": 4255} {"train_loss": -6.999555587768555, "global_step": 178749, "epoch": 4255} {"train_loss": -7.05695104598999, "global_step": 178750, "epoch": 4255} {"train_loss": -7.0807954129718595, "global_step": 178751, "epoch": 4255, "val_loss": 68650.5390625} {"train_loss": -6.928469657897949, "global_step": 178752, "epoch": 4256} {"train_loss": -7.012799263000488, "global_step": 178753, "epoch": 4256} {"train_loss": -7.184027671813965, "global_step": 178754, "epoch": 4256} {"train_loss": -6.98790979385376, "global_step": 178755, "epoch": 4256} {"train_loss": -6.976126670837402, "global_step": 178756, "epoch": 4256} {"train_loss": -7.17457914352417, "global_step": 178757, "epoch": 4256} {"train_loss": -6.904611587524414, "global_step": 178758, "epoch": 4256} {"train_loss": -7.010270118713379, "global_step": 178759, "epoch": 4256} {"train_loss": -7.123262405395508, "global_step": 178760, "epoch": 4256} {"train_loss": -6.973900318145752, "global_step": 178761, "epoch": 4256} {"train_loss": -7.013986587524414, "global_step": 178762, "epoch": 4256} {"train_loss": -7.091160297393799, "global_step": 178763, "epoch": 4256} {"train_loss": -7.095350742340088, "global_step": 178764, "epoch": 4256} {"train_loss": -7.09671688079834, "global_step": 178765, "epoch": 4256} {"train_loss": -7.112137317657471, "global_step": 178766, "epoch": 4256} {"train_loss": -6.978841781616211, "global_step": 178767, "epoch": 4256} {"train_loss": -7.069024085998535, "global_step": 178768, "epoch": 4256} {"train_loss": -7.1001739501953125, "global_step": 178769, "epoch": 4256} {"train_loss": -7.091373920440674, "global_step": 178770, "epoch": 4256} {"train_loss": -7.030289649963379, "global_step": 178771, "epoch": 4256} {"train_loss": -7.044040679931641, "global_step": 178772, "epoch": 4256} {"train_loss": -7.050580978393555, "global_step": 178773, "epoch": 4256} {"train_loss": -7.091263771057129, "global_step": 178774, "epoch": 4256} {"train_loss": -7.099094867706299, "global_step": 178775, "epoch": 4256} {"train_loss": -7.117286682128906, "global_step": 178776, "epoch": 4256} {"train_loss": -7.166836261749268, "global_step": 178777, "epoch": 4256} {"train_loss": -7.135976314544678, "global_step": 178778, "epoch": 4256} {"train_loss": -7.134600639343262, "global_step": 178779, "epoch": 4256} {"train_loss": -7.004514694213867, "global_step": 178780, "epoch": 4256} {"train_loss": -7.013017654418945, "global_step": 178781, "epoch": 4256} {"train_loss": -7.02156925201416, "global_step": 178782, "epoch": 4256} {"train_loss": -7.1482343673706055, "global_step": 178783, "epoch": 4256} {"train_loss": -7.069123268127441, "global_step": 178784, "epoch": 4256} {"train_loss": -7.024909973144531, "global_step": 178785, "epoch": 4256} {"train_loss": -7.101234436035156, "global_step": 178786, "epoch": 4256} {"train_loss": -7.059138298034668, "global_step": 178787, "epoch": 4256} {"train_loss": -7.062132835388184, "global_step": 178788, "epoch": 4256} {"train_loss": -7.079964637756348, "global_step": 178789, "epoch": 4256} {"train_loss": -6.889082908630371, "global_step": 178790, "epoch": 4256} {"train_loss": -7.116009712219238, "global_step": 178791, "epoch": 4256} {"train_loss": -7.051287651062012, "global_step": 178792, "epoch": 4256} {"train_loss": -7.059059404191517, "global_step": 178793, "epoch": 4256, "val_loss": 68689.015625} {"train_loss": -7.103161334991455, "global_step": 178794, "epoch": 4257} {"train_loss": -7.0086669921875, "global_step": 178795, "epoch": 4257} {"train_loss": -7.1563944816589355, "global_step": 178796, "epoch": 4257} {"train_loss": -7.06342887878418, "global_step": 178797, "epoch": 4257} {"train_loss": -6.976754665374756, "global_step": 178798, "epoch": 4257} {"train_loss": -7.0287885665893555, "global_step": 178799, "epoch": 4257} {"train_loss": -7.07967472076416, "global_step": 178800, "epoch": 4257} {"train_loss": -7.040248870849609, "global_step": 178801, "epoch": 4257} {"train_loss": -7.061333656311035, "global_step": 178802, "epoch": 4257} {"train_loss": -7.069317817687988, "global_step": 178803, "epoch": 4257} {"train_loss": -7.114834785461426, "global_step": 178804, "epoch": 4257} {"train_loss": -6.996732234954834, "global_step": 178805, "epoch": 4257} {"train_loss": -6.994373798370361, "global_step": 178806, "epoch": 4257} {"train_loss": -7.093555450439453, "global_step": 178807, "epoch": 4257} {"train_loss": -7.021794319152832, "global_step": 178808, "epoch": 4257} {"train_loss": -6.931039810180664, "global_step": 178809, "epoch": 4257} {"train_loss": -7.138745307922363, "global_step": 178810, "epoch": 4257} {"train_loss": -7.034948348999023, "global_step": 178811, "epoch": 4257} {"train_loss": -7.0952043533325195, "global_step": 178812, "epoch": 4257} {"train_loss": -7.147932052612305, "global_step": 178813, "epoch": 4257} {"train_loss": -7.0575852394104, "global_step": 178814, "epoch": 4257} {"train_loss": -7.0290846824646, "global_step": 178815, "epoch": 4257} {"train_loss": -7.052539348602295, "global_step": 178816, "epoch": 4257} {"train_loss": -7.119897842407227, "global_step": 178817, "epoch": 4257} {"train_loss": -7.003229141235352, "global_step": 178818, "epoch": 4257} {"train_loss": -7.029574394226074, "global_step": 178819, "epoch": 4257} {"train_loss": -7.099576473236084, "global_step": 178820, "epoch": 4257} {"train_loss": -6.946969985961914, "global_step": 178821, "epoch": 4257} {"train_loss": -7.031878471374512, "global_step": 178822, "epoch": 4257} {"train_loss": -7.008810997009277, "global_step": 178823, "epoch": 4257} {"train_loss": -7.116972923278809, "global_step": 178824, "epoch": 4257} {"train_loss": -7.009866714477539, "global_step": 178825, "epoch": 4257} {"train_loss": -7.059266090393066, "global_step": 178826, "epoch": 4257} {"train_loss": -6.9907989501953125, "global_step": 178827, "epoch": 4257} {"train_loss": -7.085603713989258, "global_step": 178828, "epoch": 4257} {"train_loss": -7.1342363357543945, "global_step": 178829, "epoch": 4257} {"train_loss": -6.941798210144043, "global_step": 178830, "epoch": 4257} {"train_loss": -7.107949256896973, "global_step": 178831, "epoch": 4257} {"train_loss": -6.940377235412598, "global_step": 178832, "epoch": 4257} {"train_loss": -7.032740592956543, "global_step": 178833, "epoch": 4257} {"train_loss": -7.0198140144348145, "global_step": 178834, "epoch": 4257} {"train_loss": -7.046011845270793, "global_step": 178835, "epoch": 4257, "val_loss": 68745.53125} {"train_loss": -7.060234546661377, "global_step": 178836, "epoch": 4258} {"train_loss": -6.910027503967285, "global_step": 178837, "epoch": 4258} {"train_loss": -7.038835048675537, "global_step": 178838, "epoch": 4258} {"train_loss": -6.868319511413574, "global_step": 178839, "epoch": 4258} {"train_loss": -6.971958160400391, "global_step": 178840, "epoch": 4258} {"train_loss": -7.037968158721924, "global_step": 178841, "epoch": 4258} {"train_loss": -7.039983749389648, "global_step": 178842, "epoch": 4258} {"train_loss": -7.006944179534912, "global_step": 178843, "epoch": 4258} {"train_loss": -6.959845066070557, "global_step": 178844, "epoch": 4258} {"train_loss": -7.074723243713379, "global_step": 178845, "epoch": 4258} {"train_loss": -6.85502290725708, "global_step": 178846, "epoch": 4258} {"train_loss": -7.027312278747559, "global_step": 178847, "epoch": 4258} {"train_loss": -7.0231242179870605, "global_step": 178848, "epoch": 4258} {"train_loss": -6.90550422668457, "global_step": 178849, "epoch": 4258} {"train_loss": -6.950469970703125, "global_step": 178850, "epoch": 4258} {"train_loss": -7.050012588500977, "global_step": 178851, "epoch": 4258} {"train_loss": -6.831064701080322, "global_step": 178852, "epoch": 4258} {"train_loss": -6.920186996459961, "global_step": 178853, "epoch": 4258} {"train_loss": -6.840564727783203, "global_step": 178854, "epoch": 4258} {"train_loss": -7.00533390045166, "global_step": 178855, "epoch": 4258} {"train_loss": -6.980761528015137, "global_step": 178856, "epoch": 4258} {"train_loss": -6.997335910797119, "global_step": 178857, "epoch": 4258} {"train_loss": -6.9168548583984375, "global_step": 178858, "epoch": 4258} {"train_loss": -7.029298782348633, "global_step": 178859, "epoch": 4258} {"train_loss": -6.984405040740967, "global_step": 178860, "epoch": 4258} {"train_loss": -6.9244537353515625, "global_step": 178861, "epoch": 4258} {"train_loss": -7.092609405517578, "global_step": 178862, "epoch": 4258} {"train_loss": -6.95920467376709, "global_step": 178863, "epoch": 4258} {"train_loss": -6.998608589172363, "global_step": 178864, "epoch": 4258} {"train_loss": -7.004373073577881, "global_step": 178865, "epoch": 4258} {"train_loss": -6.991528034210205, "global_step": 178866, "epoch": 4258} {"train_loss": -6.92818546295166, "global_step": 178867, "epoch": 4258} {"train_loss": -7.0154643058776855, "global_step": 178868, "epoch": 4258} {"train_loss": -6.898207664489746, "global_step": 178869, "epoch": 4258} {"train_loss": -6.9325690269470215, "global_step": 178870, "epoch": 4258} {"train_loss": -6.98309850692749, "global_step": 178871, "epoch": 4258} {"train_loss": -6.949684143066406, "global_step": 178872, "epoch": 4258} {"train_loss": -7.071538925170898, "global_step": 178873, "epoch": 4258} {"train_loss": -6.977723121643066, "global_step": 178874, "epoch": 4258} {"train_loss": -7.052682399749756, "global_step": 178875, "epoch": 4258} {"train_loss": -7.075135707855225, "global_step": 178876, "epoch": 4258} {"train_loss": -6.98173147156125, "global_step": 178877, "epoch": 4258, "val_loss": 68518.7734375} {"train_loss": -7.037615776062012, "global_step": 178878, "epoch": 4259} {"train_loss": -7.122636795043945, "global_step": 178879, "epoch": 4259} {"train_loss": -7.028957843780518, "global_step": 178880, "epoch": 4259} {"train_loss": -7.088473796844482, "global_step": 178881, "epoch": 4259} {"train_loss": -6.926445960998535, "global_step": 178882, "epoch": 4259} {"train_loss": -6.983647346496582, "global_step": 178883, "epoch": 4259} {"train_loss": -7.181765079498291, "global_step": 178884, "epoch": 4259} {"train_loss": -7.088846206665039, "global_step": 178885, "epoch": 4259} {"train_loss": -6.956233978271484, "global_step": 178886, "epoch": 4259} {"train_loss": -7.072080612182617, "global_step": 178887, "epoch": 4259} {"train_loss": -6.889277935028076, "global_step": 178888, "epoch": 4259} {"train_loss": -7.054199695587158, "global_step": 178889, "epoch": 4259} {"train_loss": -7.059614181518555, "global_step": 178890, "epoch": 4259} {"train_loss": -7.058645248413086, "global_step": 178891, "epoch": 4259} {"train_loss": -7.081883430480957, "global_step": 178892, "epoch": 4259} {"train_loss": -6.996169090270996, "global_step": 178893, "epoch": 4259} {"train_loss": -6.8750152587890625, "global_step": 178894, "epoch": 4259} {"train_loss": -6.928372859954834, "global_step": 178895, "epoch": 4259} {"train_loss": -7.075854778289795, "global_step": 178896, "epoch": 4259} {"train_loss": -6.986838340759277, "global_step": 178897, "epoch": 4259} {"train_loss": -6.95913028717041, "global_step": 178898, "epoch": 4259} {"train_loss": -6.977843284606934, "global_step": 178899, "epoch": 4259} {"train_loss": -6.933628082275391, "global_step": 178900, "epoch": 4259} {"train_loss": -6.927548885345459, "global_step": 178901, "epoch": 4259} {"train_loss": -6.8936004638671875, "global_step": 178902, "epoch": 4259} {"train_loss": -6.882314682006836, "global_step": 178903, "epoch": 4259} {"train_loss": -6.983172416687012, "global_step": 178904, "epoch": 4259} {"train_loss": -7.086006164550781, "global_step": 178905, "epoch": 4259} {"train_loss": -6.9136552810668945, "global_step": 178906, "epoch": 4259} {"train_loss": -6.9031500816345215, "global_step": 178907, "epoch": 4259} {"train_loss": -6.8627238273620605, "global_step": 178908, "epoch": 4259} {"train_loss": -7.040999889373779, "global_step": 178909, "epoch": 4259} {"train_loss": -6.898460388183594, "global_step": 178910, "epoch": 4259} {"train_loss": -7.033421516418457, "global_step": 178911, "epoch": 4259} {"train_loss": -6.7988057136535645, "global_step": 178912, "epoch": 4259} {"train_loss": -7.007047653198242, "global_step": 178913, "epoch": 4259} {"train_loss": -7.030082702636719, "global_step": 178914, "epoch": 4259} {"train_loss": -6.964053630828857, "global_step": 178915, "epoch": 4259} {"train_loss": -6.93743896484375, "global_step": 178916, "epoch": 4259} {"train_loss": -6.976000785827637, "global_step": 178917, "epoch": 4259} {"train_loss": -6.93403434753418, "global_step": 178918, "epoch": 4259} {"train_loss": -6.98598177092416, "global_step": 178919, "epoch": 4259, "val_loss": 68768.5625} {"train_loss": -7.021757125854492, "global_step": 178920, "epoch": 4260} {"train_loss": -6.858608245849609, "global_step": 178921, "epoch": 4260} {"train_loss": -7.008392333984375, "global_step": 178922, "epoch": 4260} {"train_loss": -7.149268627166748, "global_step": 178923, "epoch": 4260} {"train_loss": -6.915331840515137, "global_step": 178924, "epoch": 4260} {"train_loss": -7.064312934875488, "global_step": 178925, "epoch": 4260} {"train_loss": -7.047043323516846, "global_step": 178926, "epoch": 4260} {"train_loss": -7.146279335021973, "global_step": 178927, "epoch": 4260} {"train_loss": -7.112756729125977, "global_step": 178928, "epoch": 4260} {"train_loss": -6.999091148376465, "global_step": 178929, "epoch": 4260} {"train_loss": -7.085832118988037, "global_step": 178930, "epoch": 4260} {"train_loss": -7.0229620933532715, "global_step": 178931, "epoch": 4260} {"train_loss": -6.951865196228027, "global_step": 178932, "epoch": 4260} {"train_loss": -7.120500087738037, "global_step": 178933, "epoch": 4260} {"train_loss": -7.065834999084473, "global_step": 178934, "epoch": 4260} {"train_loss": -7.0911359786987305, "global_step": 178935, "epoch": 4260} {"train_loss": -7.08935546875, "global_step": 178936, "epoch": 4260} {"train_loss": -7.21683406829834, "global_step": 178937, "epoch": 4260} {"train_loss": -6.9936723709106445, "global_step": 178938, "epoch": 4260} {"train_loss": -7.021493434906006, "global_step": 178939, "epoch": 4260} {"train_loss": -7.0631184577941895, "global_step": 178940, "epoch": 4260} {"train_loss": -7.067861557006836, "global_step": 178941, "epoch": 4260} {"train_loss": -7.040102481842041, "global_step": 178942, "epoch": 4260} {"train_loss": -7.050248146057129, "global_step": 178943, "epoch": 4260} {"train_loss": -7.081642150878906, "global_step": 178944, "epoch": 4260} {"train_loss": -7.038484573364258, "global_step": 178945, "epoch": 4260} {"train_loss": -7.134391784667969, "global_step": 178946, "epoch": 4260} {"train_loss": -7.050609588623047, "global_step": 178947, "epoch": 4260} {"train_loss": -7.148863315582275, "global_step": 178948, "epoch": 4260} {"train_loss": -7.129887580871582, "global_step": 178949, "epoch": 4260} {"train_loss": -7.056256294250488, "global_step": 178950, "epoch": 4260} {"train_loss": -7.135563850402832, "global_step": 178951, "epoch": 4260} {"train_loss": -7.129507541656494, "global_step": 178952, "epoch": 4260} {"train_loss": -7.198457717895508, "global_step": 178953, "epoch": 4260} {"train_loss": -7.155027389526367, "global_step": 178954, "epoch": 4260} {"train_loss": -7.04625129699707, "global_step": 178955, "epoch": 4260} {"train_loss": -7.0368523597717285, "global_step": 178956, "epoch": 4260} {"train_loss": -7.12092924118042, "global_step": 178957, "epoch": 4260} {"train_loss": -7.018064975738525, "global_step": 178958, "epoch": 4260} {"train_loss": -7.014880180358887, "global_step": 178959, "epoch": 4260} {"train_loss": -7.064728736877441, "global_step": 178960, "epoch": 4260} {"train_loss": -7.064604418618338, "global_step": 178961, "epoch": 4260, "val_loss": 68620.6015625} {"train_loss": -7.006230354309082, "global_step": 178962, "epoch": 4261} {"train_loss": -6.9886393547058105, "global_step": 178963, "epoch": 4261} {"train_loss": -7.034837245941162, "global_step": 178964, "epoch": 4261} {"train_loss": -7.054721832275391, "global_step": 178965, "epoch": 4261} {"train_loss": -6.9818010330200195, "global_step": 178966, "epoch": 4261} {"train_loss": -7.158753871917725, "global_step": 178967, "epoch": 4261} {"train_loss": -7.142606258392334, "global_step": 178968, "epoch": 4261} {"train_loss": -7.0608415603637695, "global_step": 178969, "epoch": 4261} {"train_loss": -7.242093086242676, "global_step": 178970, "epoch": 4261} {"train_loss": -7.103582382202148, "global_step": 178971, "epoch": 4261} {"train_loss": -7.119041442871094, "global_step": 178972, "epoch": 4261} {"train_loss": -7.057440757751465, "global_step": 178973, "epoch": 4261} {"train_loss": -7.010210037231445, "global_step": 178974, "epoch": 4261} {"train_loss": -7.192895412445068, "global_step": 178975, "epoch": 4261} {"train_loss": -7.081093788146973, "global_step": 178976, "epoch": 4261} {"train_loss": -7.018655300140381, "global_step": 178977, "epoch": 4261} {"train_loss": -7.10081672668457, "global_step": 178978, "epoch": 4261} {"train_loss": -7.131007671356201, "global_step": 178979, "epoch": 4261} {"train_loss": -7.094192981719971, "global_step": 178980, "epoch": 4261} {"train_loss": -6.981473922729492, "global_step": 178981, "epoch": 4261} {"train_loss": -7.078389644622803, "global_step": 178982, "epoch": 4261} {"train_loss": -6.84480094909668, "global_step": 178983, "epoch": 4261} {"train_loss": -6.949468612670898, "global_step": 178984, "epoch": 4261} {"train_loss": -7.108143329620361, "global_step": 178985, "epoch": 4261} {"train_loss": -6.949070453643799, "global_step": 178986, "epoch": 4261} {"train_loss": -7.050865173339844, "global_step": 178987, "epoch": 4261} {"train_loss": -7.065561294555664, "global_step": 178988, "epoch": 4261} {"train_loss": -6.95245361328125, "global_step": 178989, "epoch": 4261} {"train_loss": -7.025640487670898, "global_step": 178990, "epoch": 4261} {"train_loss": -7.179121971130371, "global_step": 178991, "epoch": 4261} {"train_loss": -7.044968128204346, "global_step": 178992, "epoch": 4261} {"train_loss": -7.102275848388672, "global_step": 178993, "epoch": 4261} {"train_loss": -6.993480682373047, "global_step": 178994, "epoch": 4261} {"train_loss": -7.089215278625488, "global_step": 178995, "epoch": 4261} {"train_loss": -7.076199054718018, "global_step": 178996, "epoch": 4261} {"train_loss": -6.965695858001709, "global_step": 178997, "epoch": 4261} {"train_loss": -7.068470478057861, "global_step": 178998, "epoch": 4261} {"train_loss": -6.898427486419678, "global_step": 178999, "epoch": 4261} {"train_loss": -7.101357936859131, "global_step": 179000, "epoch": 4261} {"train_loss": -7.084449768066406, "global_step": 179001, "epoch": 4261} {"train_loss": -7.047575950622559, "global_step": 179002, "epoch": 4261} {"train_loss": -7.053740240278698, "global_step": 179003, "epoch": 4261, "val_loss": 68703.0546875} {"train_loss": -7.145249843597412, "global_step": 179004, "epoch": 4262} {"train_loss": -7.100658893585205, "global_step": 179005, "epoch": 4262} {"train_loss": -7.031709671020508, "global_step": 179006, "epoch": 4262} {"train_loss": -7.101312637329102, "global_step": 179007, "epoch": 4262} {"train_loss": -6.930939674377441, "global_step": 179008, "epoch": 4262} {"train_loss": -7.159485816955566, "global_step": 179009, "epoch": 4262} {"train_loss": -7.067490577697754, "global_step": 179010, "epoch": 4262} {"train_loss": -7.0559258460998535, "global_step": 179011, "epoch": 4262} {"train_loss": -7.105961799621582, "global_step": 179012, "epoch": 4262} {"train_loss": -7.086519241333008, "global_step": 179013, "epoch": 4262} {"train_loss": -7.196669578552246, "global_step": 179014, "epoch": 4262} {"train_loss": -7.103851318359375, "global_step": 179015, "epoch": 4262} {"train_loss": -7.215349197387695, "global_step": 179016, "epoch": 4262} {"train_loss": -7.007683753967285, "global_step": 179017, "epoch": 4262} {"train_loss": -7.0887770652771, "global_step": 179018, "epoch": 4262} {"train_loss": -7.056296348571777, "global_step": 179019, "epoch": 4262} {"train_loss": -6.985581874847412, "global_step": 179020, "epoch": 4262} {"train_loss": -7.049199104309082, "global_step": 179021, "epoch": 4262} {"train_loss": -7.0518293380737305, "global_step": 179022, "epoch": 4262} {"train_loss": -6.996342182159424, "global_step": 179023, "epoch": 4262} {"train_loss": -6.997581481933594, "global_step": 179024, "epoch": 4262} {"train_loss": -7.03099250793457, "global_step": 179025, "epoch": 4262} {"train_loss": -7.147896766662598, "global_step": 179026, "epoch": 4262} {"train_loss": -7.06581449508667, "global_step": 179027, "epoch": 4262} {"train_loss": -7.114275932312012, "global_step": 179028, "epoch": 4262} {"train_loss": -7.033642768859863, "global_step": 179029, "epoch": 4262} {"train_loss": -7.087278842926025, "global_step": 179030, "epoch": 4262} {"train_loss": -7.204537391662598, "global_step": 179031, "epoch": 4262} {"train_loss": -7.026178359985352, "global_step": 179032, "epoch": 4262} {"train_loss": -7.141149520874023, "global_step": 179033, "epoch": 4262} {"train_loss": -7.035613059997559, "global_step": 179034, "epoch": 4262} {"train_loss": -7.123398303985596, "global_step": 179035, "epoch": 4262} {"train_loss": -7.035024642944336, "global_step": 179036, "epoch": 4262} {"train_loss": -7.124087333679199, "global_step": 179037, "epoch": 4262} {"train_loss": -7.123852729797363, "global_step": 179038, "epoch": 4262} {"train_loss": -7.0925703048706055, "global_step": 179039, "epoch": 4262} {"train_loss": -7.051910877227783, "global_step": 179040, "epoch": 4262} {"train_loss": -7.039790153503418, "global_step": 179041, "epoch": 4262} {"train_loss": -7.114960670471191, "global_step": 179042, "epoch": 4262} {"train_loss": -7.046402454376221, "global_step": 179043, "epoch": 4262} {"train_loss": -7.10784912109375, "global_step": 179044, "epoch": 4262} {"train_loss": -7.081322976521084, "global_step": 179045, "epoch": 4262, "val_loss": 68815.7109375} {"train_loss": -7.057126045227051, "global_step": 179046, "epoch": 4263} {"train_loss": -7.1017560958862305, "global_step": 179047, "epoch": 4263} {"train_loss": -7.0385422706604, "global_step": 179048, "epoch": 4263} {"train_loss": -7.087072849273682, "global_step": 179049, "epoch": 4263} {"train_loss": -7.107185363769531, "global_step": 179050, "epoch": 4263} {"train_loss": -7.209079265594482, "global_step": 179051, "epoch": 4263} {"train_loss": -7.207204341888428, "global_step": 179052, "epoch": 4263} {"train_loss": -7.141136646270752, "global_step": 179053, "epoch": 4263} {"train_loss": -7.1073408126831055, "global_step": 179054, "epoch": 4263} {"train_loss": -7.065738677978516, "global_step": 179055, "epoch": 4263} {"train_loss": -7.159381866455078, "global_step": 179056, "epoch": 4263} {"train_loss": -7.154176235198975, "global_step": 179057, "epoch": 4263} {"train_loss": -7.0366668701171875, "global_step": 179058, "epoch": 4263} {"train_loss": -7.167291164398193, "global_step": 179059, "epoch": 4263} {"train_loss": -7.228296756744385, "global_step": 179060, "epoch": 4263} {"train_loss": -7.12345027923584, "global_step": 179061, "epoch": 4263} {"train_loss": -7.057610034942627, "global_step": 179062, "epoch": 4263} {"train_loss": -7.034608364105225, "global_step": 179063, "epoch": 4263} {"train_loss": -7.189003944396973, "global_step": 179064, "epoch": 4263} {"train_loss": -7.092813491821289, "global_step": 179065, "epoch": 4263} {"train_loss": -6.966299533843994, "global_step": 179066, "epoch": 4263} {"train_loss": -7.058550834655762, "global_step": 179067, "epoch": 4263} {"train_loss": -7.03671407699585, "global_step": 179068, "epoch": 4263} {"train_loss": -7.169347763061523, "global_step": 179069, "epoch": 4263} {"train_loss": -7.082655906677246, "global_step": 179070, "epoch": 4263} {"train_loss": -7.006047248840332, "global_step": 179071, "epoch": 4263} {"train_loss": -7.1430206298828125, "global_step": 179072, "epoch": 4263} {"train_loss": -7.068290710449219, "global_step": 179073, "epoch": 4263} {"train_loss": -7.093105316162109, "global_step": 179074, "epoch": 4263} {"train_loss": -7.047682285308838, "global_step": 179075, "epoch": 4263} {"train_loss": -7.100258827209473, "global_step": 179076, "epoch": 4263} {"train_loss": -6.913290977478027, "global_step": 179077, "epoch": 4263} {"train_loss": -7.029608726501465, "global_step": 179078, "epoch": 4263} {"train_loss": -7.079863548278809, "global_step": 179079, "epoch": 4263} {"train_loss": -6.982446193695068, "global_step": 179080, "epoch": 4263} {"train_loss": -7.074897766113281, "global_step": 179081, "epoch": 4263} {"train_loss": -7.061934471130371, "global_step": 179082, "epoch": 4263} {"train_loss": -7.123901844024658, "global_step": 179083, "epoch": 4263} {"train_loss": -7.0955810546875, "global_step": 179084, "epoch": 4263} {"train_loss": -7.049861907958984, "global_step": 179085, "epoch": 4263} {"train_loss": -7.1603875160217285, "global_step": 179086, "epoch": 4263} {"train_loss": -7.091772249766758, "global_step": 179087, "epoch": 4263, "val_loss": 68651.890625} {"train_loss": -7.218791484832764, "global_step": 179088, "epoch": 4264} {"train_loss": -7.069642543792725, "global_step": 179089, "epoch": 4264} {"train_loss": -7.051278114318848, "global_step": 179090, "epoch": 4264} {"train_loss": -7.011936664581299, "global_step": 179091, "epoch": 4264} {"train_loss": -7.188922882080078, "global_step": 179092, "epoch": 4264} {"train_loss": -7.049283027648926, "global_step": 179093, "epoch": 4264} {"train_loss": -7.022243499755859, "global_step": 179094, "epoch": 4264} {"train_loss": -7.041985511779785, "global_step": 179095, "epoch": 4264} {"train_loss": -7.105779647827148, "global_step": 179096, "epoch": 4264} {"train_loss": -7.0370259284973145, "global_step": 179097, "epoch": 4264} {"train_loss": -7.031723976135254, "global_step": 179098, "epoch": 4264} {"train_loss": -7.0737433433532715, "global_step": 179099, "epoch": 4264} {"train_loss": -7.108075141906738, "global_step": 179100, "epoch": 4264} {"train_loss": -7.0843186378479, "global_step": 179101, "epoch": 4264} {"train_loss": -7.110253810882568, "global_step": 179102, "epoch": 4264} {"train_loss": -7.003625869750977, "global_step": 179103, "epoch": 4264} {"train_loss": -7.095411777496338, "global_step": 179104, "epoch": 4264} {"train_loss": -7.0808610916137695, "global_step": 179105, "epoch": 4264} {"train_loss": -7.091413974761963, "global_step": 179106, "epoch": 4264} {"train_loss": -7.158410549163818, "global_step": 179107, "epoch": 4264} {"train_loss": -7.066104888916016, "global_step": 179108, "epoch": 4264} {"train_loss": -6.9326934814453125, "global_step": 179109, "epoch": 4264} {"train_loss": -7.043033599853516, "global_step": 179110, "epoch": 4264} {"train_loss": -7.0188093185424805, "global_step": 179111, "epoch": 4264} {"train_loss": -6.991661071777344, "global_step": 179112, "epoch": 4264} {"train_loss": -7.144612789154053, "global_step": 179113, "epoch": 4264} {"train_loss": -7.109562873840332, "global_step": 179114, "epoch": 4264} {"train_loss": -7.07973575592041, "global_step": 179115, "epoch": 4264} {"train_loss": -7.189773082733154, "global_step": 179116, "epoch": 4264} {"train_loss": -6.980399131774902, "global_step": 179117, "epoch": 4264} {"train_loss": -7.096657752990723, "global_step": 179118, "epoch": 4264} {"train_loss": -7.017725944519043, "global_step": 179119, "epoch": 4264} {"train_loss": -6.9220075607299805, "global_step": 179120, "epoch": 4264} {"train_loss": -6.947142601013184, "global_step": 179121, "epoch": 4264} {"train_loss": -7.05238151550293, "global_step": 179122, "epoch": 4264} {"train_loss": -7.0238847732543945, "global_step": 179123, "epoch": 4264} {"train_loss": -6.87166690826416, "global_step": 179124, "epoch": 4264} {"train_loss": -6.930819511413574, "global_step": 179125, "epoch": 4264} {"train_loss": -7.096391677856445, "global_step": 179126, "epoch": 4264} {"train_loss": -6.97927713394165, "global_step": 179127, "epoch": 4264} {"train_loss": -7.127161026000977, "global_step": 179128, "epoch": 4264} {"train_loss": -7.056345723924183, "global_step": 179129, "epoch": 4264, "val_loss": 68978.984375} {"train_loss": -6.949618339538574, "global_step": 179130, "epoch": 4265} {"train_loss": -7.0583391189575195, "global_step": 179131, "epoch": 4265} {"train_loss": -7.164728164672852, "global_step": 179132, "epoch": 4265} {"train_loss": -7.028273105621338, "global_step": 179133, "epoch": 4265} {"train_loss": -7.033237457275391, "global_step": 179134, "epoch": 4265} {"train_loss": -6.992145538330078, "global_step": 179135, "epoch": 4265} {"train_loss": -7.0123291015625, "global_step": 179136, "epoch": 4265} {"train_loss": -7.033831596374512, "global_step": 179137, "epoch": 4265} {"train_loss": -7.096527099609375, "global_step": 179138, "epoch": 4265} {"train_loss": -7.003420352935791, "global_step": 179139, "epoch": 4265} {"train_loss": -7.049333095550537, "global_step": 179140, "epoch": 4265} {"train_loss": -7.16864538192749, "global_step": 179141, "epoch": 4265} {"train_loss": -7.033717155456543, "global_step": 179142, "epoch": 4265} {"train_loss": -7.10115909576416, "global_step": 179143, "epoch": 4265} {"train_loss": -6.998269081115723, "global_step": 179144, "epoch": 4265} {"train_loss": -7.087028503417969, "global_step": 179145, "epoch": 4265} {"train_loss": -7.086055755615234, "global_step": 179146, "epoch": 4265} {"train_loss": -6.984680652618408, "global_step": 179147, "epoch": 4265} {"train_loss": -7.148648738861084, "global_step": 179148, "epoch": 4265} {"train_loss": -7.101907730102539, "global_step": 179149, "epoch": 4265} {"train_loss": -7.108320236206055, "global_step": 179150, "epoch": 4265} {"train_loss": -7.034482955932617, "global_step": 179151, "epoch": 4265} {"train_loss": -7.073703765869141, "global_step": 179152, "epoch": 4265} {"train_loss": -7.09678316116333, "global_step": 179153, "epoch": 4265} {"train_loss": -7.118337631225586, "global_step": 179154, "epoch": 4265} {"train_loss": -7.149144649505615, "global_step": 179155, "epoch": 4265} {"train_loss": -7.0484395027160645, "global_step": 179156, "epoch": 4265} {"train_loss": -7.026342391967773, "global_step": 179157, "epoch": 4265} {"train_loss": -7.125236988067627, "global_step": 179158, "epoch": 4265} {"train_loss": -7.107375621795654, "global_step": 179159, "epoch": 4265} {"train_loss": -6.941157341003418, "global_step": 179160, "epoch": 4265} {"train_loss": -7.113279342651367, "global_step": 179161, "epoch": 4265} {"train_loss": -7.039743900299072, "global_step": 179162, "epoch": 4265} {"train_loss": -7.053320407867432, "global_step": 179163, "epoch": 4265} {"train_loss": -7.146098613739014, "global_step": 179164, "epoch": 4265} {"train_loss": -7.183967590332031, "global_step": 179165, "epoch": 4265} {"train_loss": -7.064441680908203, "global_step": 179166, "epoch": 4265} {"train_loss": -7.070890426635742, "global_step": 179167, "epoch": 4265} {"train_loss": -7.048678874969482, "global_step": 179168, "epoch": 4265} {"train_loss": -7.094585418701172, "global_step": 179169, "epoch": 4265} {"train_loss": -7.038450241088867, "global_step": 179170, "epoch": 4265} {"train_loss": -7.071569238390241, "global_step": 179171, "epoch": 4265, "val_loss": 68689.1015625} {"train_loss": -7.059787750244141, "global_step": 179172, "epoch": 4266} {"train_loss": -7.128615379333496, "global_step": 179173, "epoch": 4266} {"train_loss": -7.006127834320068, "global_step": 179174, "epoch": 4266} {"train_loss": -7.062105178833008, "global_step": 179175, "epoch": 4266} {"train_loss": -7.039331436157227, "global_step": 179176, "epoch": 4266} {"train_loss": -7.225330352783203, "global_step": 179177, "epoch": 4266} {"train_loss": -7.024957656860352, "global_step": 179178, "epoch": 4266} {"train_loss": -7.166477203369141, "global_step": 179179, "epoch": 4266} {"train_loss": -6.996951580047607, "global_step": 179180, "epoch": 4266} {"train_loss": -7.075267791748047, "global_step": 179181, "epoch": 4266} {"train_loss": -7.117364406585693, "global_step": 179182, "epoch": 4266} {"train_loss": -7.056039333343506, "global_step": 179183, "epoch": 4266} {"train_loss": -7.017807483673096, "global_step": 179184, "epoch": 4266} {"train_loss": -7.086795806884766, "global_step": 179185, "epoch": 4266} {"train_loss": -7.169781684875488, "global_step": 179186, "epoch": 4266} {"train_loss": -7.006667137145996, "global_step": 179187, "epoch": 4266} {"train_loss": -7.003801345825195, "global_step": 179188, "epoch": 4266} {"train_loss": -7.143078804016113, "global_step": 179189, "epoch": 4266} {"train_loss": -6.902137756347656, "global_step": 179190, "epoch": 4266} {"train_loss": -6.952771186828613, "global_step": 179191, "epoch": 4266} {"train_loss": -6.982753276824951, "global_step": 179192, "epoch": 4266} {"train_loss": -7.067038536071777, "global_step": 179193, "epoch": 4266} {"train_loss": -6.967817783355713, "global_step": 179194, "epoch": 4266} {"train_loss": -6.967896461486816, "global_step": 179195, "epoch": 4266} {"train_loss": -7.050509929656982, "global_step": 179196, "epoch": 4266} {"train_loss": -6.948815822601318, "global_step": 179197, "epoch": 4266} {"train_loss": -7.002775192260742, "global_step": 179198, "epoch": 4266} {"train_loss": -6.971287250518799, "global_step": 179199, "epoch": 4266} {"train_loss": -6.913843631744385, "global_step": 179200, "epoch": 4266} {"train_loss": -7.097918510437012, "global_step": 179201, "epoch": 4266} {"train_loss": -7.063302993774414, "global_step": 179202, "epoch": 4266} {"train_loss": -6.9455060958862305, "global_step": 179203, "epoch": 4266} {"train_loss": -7.031459331512451, "global_step": 179204, "epoch": 4266} {"train_loss": -6.997736930847168, "global_step": 179205, "epoch": 4266} {"train_loss": -6.9983134269714355, "global_step": 179206, "epoch": 4266} {"train_loss": -7.095602989196777, "global_step": 179207, "epoch": 4266} {"train_loss": -7.02912712097168, "global_step": 179208, "epoch": 4266} {"train_loss": -7.006223678588867, "global_step": 179209, "epoch": 4266} {"train_loss": -7.104197978973389, "global_step": 179210, "epoch": 4266} {"train_loss": -7.1633405685424805, "global_step": 179211, "epoch": 4266} {"train_loss": -7.010181427001953, "global_step": 179212, "epoch": 4266} {"train_loss": -7.040195328848703, "global_step": 179213, "epoch": 4266, "val_loss": 68919.578125} {"train_loss": -6.961836814880371, "global_step": 179214, "epoch": 4267} {"train_loss": -6.889034271240234, "global_step": 179215, "epoch": 4267} {"train_loss": -7.12812614440918, "global_step": 179216, "epoch": 4267} {"train_loss": -6.974839687347412, "global_step": 179217, "epoch": 4267} {"train_loss": -6.952936172485352, "global_step": 179218, "epoch": 4267} {"train_loss": -7.011861801147461, "global_step": 179219, "epoch": 4267} {"train_loss": -7.036934852600098, "global_step": 179220, "epoch": 4267} {"train_loss": -7.057098388671875, "global_step": 179221, "epoch": 4267} {"train_loss": -6.904892921447754, "global_step": 179222, "epoch": 4267} {"train_loss": -6.960245609283447, "global_step": 179223, "epoch": 4267} {"train_loss": -6.868485450744629, "global_step": 179224, "epoch": 4267} {"train_loss": -6.9799394607543945, "global_step": 179225, "epoch": 4267} {"train_loss": -6.985870361328125, "global_step": 179226, "epoch": 4267} {"train_loss": -7.018056869506836, "global_step": 179227, "epoch": 4267} {"train_loss": -7.072759628295898, "global_step": 179228, "epoch": 4267} {"train_loss": -6.938612461090088, "global_step": 179229, "epoch": 4267} {"train_loss": -6.992969512939453, "global_step": 179230, "epoch": 4267} {"train_loss": -7.060403823852539, "global_step": 179231, "epoch": 4267} {"train_loss": -6.920539379119873, "global_step": 179232, "epoch": 4267} {"train_loss": -6.963016510009766, "global_step": 179233, "epoch": 4267} {"train_loss": -6.937259674072266, "global_step": 179234, "epoch": 4267} {"train_loss": -7.031257629394531, "global_step": 179235, "epoch": 4267} {"train_loss": -6.951180458068848, "global_step": 179236, "epoch": 4267} {"train_loss": -7.091989517211914, "global_step": 179237, "epoch": 4267} {"train_loss": -7.008145809173584, "global_step": 179238, "epoch": 4267} {"train_loss": -6.9486470222473145, "global_step": 179239, "epoch": 4267} {"train_loss": -6.9419074058532715, "global_step": 179240, "epoch": 4267} {"train_loss": -7.040740013122559, "global_step": 179241, "epoch": 4267} {"train_loss": -7.065286636352539, "global_step": 179242, "epoch": 4267} {"train_loss": -6.9842658042907715, "global_step": 179243, "epoch": 4267} {"train_loss": -7.142096519470215, "global_step": 179244, "epoch": 4267} {"train_loss": -7.087801933288574, "global_step": 179245, "epoch": 4267} {"train_loss": -7.0949506759643555, "global_step": 179246, "epoch": 4267} {"train_loss": -7.087206840515137, "global_step": 179247, "epoch": 4267} {"train_loss": -7.0429205894470215, "global_step": 179248, "epoch": 4267} {"train_loss": -7.0970458984375, "global_step": 179249, "epoch": 4267} {"train_loss": -7.091611862182617, "global_step": 179250, "epoch": 4267} {"train_loss": -7.11651611328125, "global_step": 179251, "epoch": 4267} {"train_loss": -7.140951156616211, "global_step": 179252, "epoch": 4267} {"train_loss": -7.1371684074401855, "global_step": 179253, "epoch": 4267} {"train_loss": -7.128927230834961, "global_step": 179254, "epoch": 4267} {"train_loss": -7.019523177828107, "global_step": 179255, "epoch": 4267, "val_loss": 68599.375} {"train_loss": -7.145967483520508, "global_step": 179256, "epoch": 4268} {"train_loss": -7.109163761138916, "global_step": 179257, "epoch": 4268} {"train_loss": -6.955108642578125, "global_step": 179258, "epoch": 4268} {"train_loss": -7.079562187194824, "global_step": 179259, "epoch": 4268} {"train_loss": -7.0968427658081055, "global_step": 179260, "epoch": 4268} {"train_loss": -7.02547025680542, "global_step": 179261, "epoch": 4268} {"train_loss": -7.034451484680176, "global_step": 179262, "epoch": 4268} {"train_loss": -7.160155296325684, "global_step": 179263, "epoch": 4268} {"train_loss": -7.026477813720703, "global_step": 179264, "epoch": 4268} {"train_loss": -7.144866466522217, "global_step": 179265, "epoch": 4268} {"train_loss": -7.026000022888184, "global_step": 179266, "epoch": 4268} {"train_loss": -7.082452774047852, "global_step": 179267, "epoch": 4268} {"train_loss": -7.078207969665527, "global_step": 179268, "epoch": 4268} {"train_loss": -7.025025844573975, "global_step": 179269, "epoch": 4268} {"train_loss": -7.0368757247924805, "global_step": 179270, "epoch": 4268} {"train_loss": -6.989607810974121, "global_step": 179271, "epoch": 4268} {"train_loss": -7.039056301116943, "global_step": 179272, "epoch": 4268} {"train_loss": -7.068028926849365, "global_step": 179273, "epoch": 4268} {"train_loss": -7.048994064331055, "global_step": 179274, "epoch": 4268} {"train_loss": -6.952828407287598, "global_step": 179275, "epoch": 4268} {"train_loss": -7.062502861022949, "global_step": 179276, "epoch": 4268} {"train_loss": -7.100566864013672, "global_step": 179277, "epoch": 4268} {"train_loss": -7.0002641677856445, "global_step": 179278, "epoch": 4268} {"train_loss": -7.086436748504639, "global_step": 179279, "epoch": 4268} {"train_loss": -7.1092939376831055, "global_step": 179280, "epoch": 4268} {"train_loss": -7.063417434692383, "global_step": 179281, "epoch": 4268} {"train_loss": -7.148796558380127, "global_step": 179282, "epoch": 4268} {"train_loss": -7.062918663024902, "global_step": 179283, "epoch": 4268} {"train_loss": -6.905850410461426, "global_step": 179284, "epoch": 4268} {"train_loss": -7.111274242401123, "global_step": 179285, "epoch": 4268} {"train_loss": -7.045124053955078, "global_step": 179286, "epoch": 4268} {"train_loss": -7.118993282318115, "global_step": 179287, "epoch": 4268} {"train_loss": -7.039606094360352, "global_step": 179288, "epoch": 4268} {"train_loss": -7.034319877624512, "global_step": 179289, "epoch": 4268} {"train_loss": -6.973213195800781, "global_step": 179290, "epoch": 4268} {"train_loss": -6.853242874145508, "global_step": 179291, "epoch": 4268} {"train_loss": -7.001222610473633, "global_step": 179292, "epoch": 4268} {"train_loss": -6.758545875549316, "global_step": 179293, "epoch": 4268} {"train_loss": -7.0160136222839355, "global_step": 179294, "epoch": 4268} {"train_loss": -6.909193992614746, "global_step": 179295, "epoch": 4268} {"train_loss": -6.864272117614746, "global_step": 179296, "epoch": 4268} {"train_loss": -7.03705570811317, "global_step": 179297, "epoch": 4268, "val_loss": 68830.90625} {"train_loss": -6.89892578125, "global_step": 179298, "epoch": 4269} {"train_loss": -6.853891372680664, "global_step": 179299, "epoch": 4269} {"train_loss": -7.087477684020996, "global_step": 179300, "epoch": 4269} {"train_loss": -6.897054195404053, "global_step": 179301, "epoch": 4269} {"train_loss": -7.06949520111084, "global_step": 179302, "epoch": 4269} {"train_loss": -6.790627956390381, "global_step": 179303, "epoch": 4269} {"train_loss": -6.969959259033203, "global_step": 179304, "epoch": 4269} {"train_loss": -6.945237159729004, "global_step": 179305, "epoch": 4269} {"train_loss": -6.984200954437256, "global_step": 179306, "epoch": 4269} {"train_loss": -6.966653823852539, "global_step": 179307, "epoch": 4269} {"train_loss": -7.06857967376709, "global_step": 179308, "epoch": 4269} {"train_loss": -6.938692092895508, "global_step": 179309, "epoch": 4269} {"train_loss": -6.968931198120117, "global_step": 179310, "epoch": 4269} {"train_loss": -6.985892295837402, "global_step": 179311, "epoch": 4269} {"train_loss": -6.935823440551758, "global_step": 179312, "epoch": 4269} {"train_loss": -7.105704307556152, "global_step": 179313, "epoch": 4269} {"train_loss": -7.028407096862793, "global_step": 179314, "epoch": 4269} {"train_loss": -7.084259986877441, "global_step": 179315, "epoch": 4269} {"train_loss": -7.019815921783447, "global_step": 179316, "epoch": 4269} {"train_loss": -6.978638172149658, "global_step": 179317, "epoch": 4269} {"train_loss": -6.972033500671387, "global_step": 179318, "epoch": 4269} {"train_loss": -7.0061235427856445, "global_step": 179319, "epoch": 4269} {"train_loss": -7.089637756347656, "global_step": 179320, "epoch": 4269} {"train_loss": -6.994028091430664, "global_step": 179321, "epoch": 4269} {"train_loss": -7.00994348526001, "global_step": 179322, "epoch": 4269} {"train_loss": -7.013829231262207, "global_step": 179323, "epoch": 4269} {"train_loss": -6.974687099456787, "global_step": 179324, "epoch": 4269} {"train_loss": -7.099560260772705, "global_step": 179325, "epoch": 4269} {"train_loss": -7.17669677734375, "global_step": 179326, "epoch": 4269} {"train_loss": -7.161632537841797, "global_step": 179327, "epoch": 4269} {"train_loss": -7.00334358215332, "global_step": 179328, "epoch": 4269} {"train_loss": -7.196268081665039, "global_step": 179329, "epoch": 4269} {"train_loss": -7.045243263244629, "global_step": 179330, "epoch": 4269} {"train_loss": -7.100550651550293, "global_step": 179331, "epoch": 4269} {"train_loss": -7.128915309906006, "global_step": 179332, "epoch": 4269} {"train_loss": -7.202248573303223, "global_step": 179333, "epoch": 4269} {"train_loss": -7.064986705780029, "global_step": 179334, "epoch": 4269} {"train_loss": -7.121224880218506, "global_step": 179335, "epoch": 4269} {"train_loss": -7.108835220336914, "global_step": 179336, "epoch": 4269} {"train_loss": -7.099130630493164, "global_step": 179337, "epoch": 4269} {"train_loss": -7.065229892730713, "global_step": 179338, "epoch": 4269} {"train_loss": -7.032044456118629, "global_step": 179339, "epoch": 4269, "val_loss": 68790.9453125} {"train_loss": -7.220459938049316, "global_step": 179340, "epoch": 4270} {"train_loss": -7.178960800170898, "global_step": 179341, "epoch": 4270} {"train_loss": -7.2438459396362305, "global_step": 179342, "epoch": 4270} {"train_loss": -7.131311416625977, "global_step": 179343, "epoch": 4270} {"train_loss": -7.150885105133057, "global_step": 179344, "epoch": 4270} {"train_loss": -7.262457847595215, "global_step": 179345, "epoch": 4270} {"train_loss": -7.1725969314575195, "global_step": 179346, "epoch": 4270} {"train_loss": -7.158517837524414, "global_step": 179347, "epoch": 4270} {"train_loss": -7.152059078216553, "global_step": 179348, "epoch": 4270} {"train_loss": -7.2188615798950195, "global_step": 179349, "epoch": 4270} {"train_loss": -7.0854339599609375, "global_step": 179350, "epoch": 4270} {"train_loss": -7.034337043762207, "global_step": 179351, "epoch": 4270} {"train_loss": -7.096420764923096, "global_step": 179352, "epoch": 4270} {"train_loss": -7.018019676208496, "global_step": 179353, "epoch": 4270} {"train_loss": -7.116499900817871, "global_step": 179354, "epoch": 4270} {"train_loss": -6.9941582679748535, "global_step": 179355, "epoch": 4270} {"train_loss": -6.956469535827637, "global_step": 179356, "epoch": 4270} {"train_loss": -6.959791660308838, "global_step": 179357, "epoch": 4270} {"train_loss": -7.0221757888793945, "global_step": 179358, "epoch": 4270} {"train_loss": -6.979675769805908, "global_step": 179359, "epoch": 4270} {"train_loss": -6.956546783447266, "global_step": 179360, "epoch": 4270} {"train_loss": -7.044403076171875, "global_step": 179361, "epoch": 4270} {"train_loss": -7.008482456207275, "global_step": 179362, "epoch": 4270} {"train_loss": -6.785711288452148, "global_step": 179363, "epoch": 4270} {"train_loss": -6.847012996673584, "global_step": 179364, "epoch": 4270} {"train_loss": -6.953121185302734, "global_step": 179365, "epoch": 4270} {"train_loss": -7.052002906799316, "global_step": 179366, "epoch": 4270} {"train_loss": -7.00911808013916, "global_step": 179367, "epoch": 4270} {"train_loss": -7.0254902839660645, "global_step": 179368, "epoch": 4270} {"train_loss": -7.059477806091309, "global_step": 179369, "epoch": 4270} {"train_loss": -6.962986946105957, "global_step": 179370, "epoch": 4270} {"train_loss": -6.94003963470459, "global_step": 179371, "epoch": 4270} {"train_loss": -6.913844108581543, "global_step": 179372, "epoch": 4270} {"train_loss": -6.923476219177246, "global_step": 179373, "epoch": 4270} {"train_loss": -7.004816055297852, "global_step": 179374, "epoch": 4270} {"train_loss": -7.061411380767822, "global_step": 179375, "epoch": 4270} {"train_loss": -6.873810291290283, "global_step": 179376, "epoch": 4270} {"train_loss": -6.954722881317139, "global_step": 179377, "epoch": 4270} {"train_loss": -6.940746307373047, "global_step": 179378, "epoch": 4270} {"train_loss": -6.988352298736572, "global_step": 179379, "epoch": 4270} {"train_loss": -7.011493682861328, "global_step": 179380, "epoch": 4270} {"train_loss": -7.0307738326844715, "global_step": 179381, "epoch": 4270, "val_loss": 68811.2109375} {"train_loss": -7.11056661605835, "global_step": 179382, "epoch": 4271} {"train_loss": -7.009549617767334, "global_step": 179383, "epoch": 4271} {"train_loss": -7.041342258453369, "global_step": 179384, "epoch": 4271} {"train_loss": -6.983166694641113, "global_step": 179385, "epoch": 4271} {"train_loss": -7.090893745422363, "global_step": 179386, "epoch": 4271} {"train_loss": -7.037344932556152, "global_step": 179387, "epoch": 4271} {"train_loss": -6.981770038604736, "global_step": 179388, "epoch": 4271} {"train_loss": -6.976462364196777, "global_step": 179389, "epoch": 4271} {"train_loss": -7.051387310028076, "global_step": 179390, "epoch": 4271} {"train_loss": -7.0084309577941895, "global_step": 179391, "epoch": 4271} {"train_loss": -7.028477668762207, "global_step": 179392, "epoch": 4271} {"train_loss": -7.000083923339844, "global_step": 179393, "epoch": 4271} {"train_loss": -7.11728572845459, "global_step": 179394, "epoch": 4271} {"train_loss": -7.012167930603027, "global_step": 179395, "epoch": 4271} {"train_loss": -7.065252780914307, "global_step": 179396, "epoch": 4271} {"train_loss": -7.102205276489258, "global_step": 179397, "epoch": 4271} {"train_loss": -7.146309852600098, "global_step": 179398, "epoch": 4271} {"train_loss": -7.066585540771484, "global_step": 179399, "epoch": 4271} {"train_loss": -7.031923770904541, "global_step": 179400, "epoch": 4271} {"train_loss": -6.918676376342773, "global_step": 179401, "epoch": 4271} {"train_loss": -6.9855523109436035, "global_step": 179402, "epoch": 4271} {"train_loss": -7.121132850646973, "global_step": 179403, "epoch": 4271} {"train_loss": -7.053953170776367, "global_step": 179404, "epoch": 4271} {"train_loss": -7.118965148925781, "global_step": 179405, "epoch": 4271} {"train_loss": -7.163020610809326, "global_step": 179406, "epoch": 4271} {"train_loss": -7.129639625549316, "global_step": 179407, "epoch": 4271} {"train_loss": -7.059062480926514, "global_step": 179408, "epoch": 4271} {"train_loss": -7.124478340148926, "global_step": 179409, "epoch": 4271} {"train_loss": -7.0664753913879395, "global_step": 179410, "epoch": 4271} {"train_loss": -7.069660663604736, "global_step": 179411, "epoch": 4271} {"train_loss": -7.088224411010742, "global_step": 179412, "epoch": 4271} {"train_loss": -7.0825676918029785, "global_step": 179413, "epoch": 4271} {"train_loss": -7.203969955444336, "global_step": 179414, "epoch": 4271} {"train_loss": -7.0376129150390625, "global_step": 179415, "epoch": 4271} {"train_loss": -7.039429187774658, "global_step": 179416, "epoch": 4271} {"train_loss": -7.165663242340088, "global_step": 179417, "epoch": 4271} {"train_loss": -7.053077697753906, "global_step": 179418, "epoch": 4271} {"train_loss": -7.081181526184082, "global_step": 179419, "epoch": 4271} {"train_loss": -7.033095359802246, "global_step": 179420, "epoch": 4271} {"train_loss": -7.143527984619141, "global_step": 179421, "epoch": 4271} {"train_loss": -7.130584716796875, "global_step": 179422, "epoch": 4271} {"train_loss": -7.070688383919852, "global_step": 179423, "epoch": 4271, "val_loss": 68747.6953125} {"train_loss": -7.093344688415527, "global_step": 179424, "epoch": 4272} {"train_loss": -7.140688896179199, "global_step": 179425, "epoch": 4272} {"train_loss": -7.212778091430664, "global_step": 179426, "epoch": 4272} {"train_loss": -7.103631973266602, "global_step": 179427, "epoch": 4272} {"train_loss": -7.069710731506348, "global_step": 179428, "epoch": 4272} {"train_loss": -7.06596565246582, "global_step": 179429, "epoch": 4272} {"train_loss": -7.0863447189331055, "global_step": 179430, "epoch": 4272} {"train_loss": -7.156987190246582, "global_step": 179431, "epoch": 4272} {"train_loss": -7.152021408081055, "global_step": 179432, "epoch": 4272} {"train_loss": -7.104366779327393, "global_step": 179433, "epoch": 4272} {"train_loss": -7.091416358947754, "global_step": 179434, "epoch": 4272} {"train_loss": -7.149985313415527, "global_step": 179435, "epoch": 4272} {"train_loss": -7.006234645843506, "global_step": 179436, "epoch": 4272} {"train_loss": -6.946422576904297, "global_step": 179437, "epoch": 4272} {"train_loss": -7.047351837158203, "global_step": 179438, "epoch": 4272} {"train_loss": -7.022319793701172, "global_step": 179439, "epoch": 4272} {"train_loss": -7.017046928405762, "global_step": 179440, "epoch": 4272} {"train_loss": -7.085268020629883, "global_step": 179441, "epoch": 4272} {"train_loss": -6.97126579284668, "global_step": 179442, "epoch": 4272} {"train_loss": -7.140343189239502, "global_step": 179443, "epoch": 4272} {"train_loss": -7.0775041580200195, "global_step": 179444, "epoch": 4272} {"train_loss": -7.037988662719727, "global_step": 179445, "epoch": 4272} {"train_loss": -7.017319679260254, "global_step": 179446, "epoch": 4272} {"train_loss": -7.1647868156433105, "global_step": 179447, "epoch": 4272} {"train_loss": -7.047950744628906, "global_step": 179448, "epoch": 4272} {"train_loss": -7.126532554626465, "global_step": 179449, "epoch": 4272} {"train_loss": -7.053133010864258, "global_step": 179450, "epoch": 4272} {"train_loss": -7.052741050720215, "global_step": 179451, "epoch": 4272} {"train_loss": -7.029167652130127, "global_step": 179452, "epoch": 4272} {"train_loss": -7.110846996307373, "global_step": 179453, "epoch": 4272} {"train_loss": -7.025739669799805, "global_step": 179454, "epoch": 4272} {"train_loss": -7.14251708984375, "global_step": 179455, "epoch": 4272} {"train_loss": -7.0382771492004395, "global_step": 179456, "epoch": 4272} {"train_loss": -7.088802337646484, "global_step": 179457, "epoch": 4272} {"train_loss": -7.066583633422852, "global_step": 179458, "epoch": 4272} {"train_loss": -7.109991073608398, "global_step": 179459, "epoch": 4272} {"train_loss": -7.1709303855896, "global_step": 179460, "epoch": 4272} {"train_loss": -7.0579729080200195, "global_step": 179461, "epoch": 4272} {"train_loss": -7.032221794128418, "global_step": 179462, "epoch": 4272} {"train_loss": -7.042230606079102, "global_step": 179463, "epoch": 4272} {"train_loss": -7.026392459869385, "global_step": 179464, "epoch": 4272} {"train_loss": -7.078476406279064, "global_step": 179465, "epoch": 4272, "val_loss": 69061.28125} {"train_loss": -7.069422721862793, "global_step": 179466, "epoch": 4273} {"train_loss": -7.079921722412109, "global_step": 179467, "epoch": 4273} {"train_loss": -6.8902435302734375, "global_step": 179468, "epoch": 4273} {"train_loss": -7.08220100402832, "global_step": 179469, "epoch": 4273} {"train_loss": -7.06834077835083, "global_step": 179470, "epoch": 4273} {"train_loss": -6.956686019897461, "global_step": 179471, "epoch": 4273} {"train_loss": -7.102048397064209, "global_step": 179472, "epoch": 4273} {"train_loss": -7.056850433349609, "global_step": 179473, "epoch": 4273} {"train_loss": -7.11073637008667, "global_step": 179474, "epoch": 4273} {"train_loss": -7.02757453918457, "global_step": 179475, "epoch": 4273} {"train_loss": -7.007151126861572, "global_step": 179476, "epoch": 4273} {"train_loss": -7.087420463562012, "global_step": 179477, "epoch": 4273} {"train_loss": -7.04189920425415, "global_step": 179478, "epoch": 4273} {"train_loss": -7.200777530670166, "global_step": 179479, "epoch": 4273} {"train_loss": -6.944031715393066, "global_step": 179480, "epoch": 4273} {"train_loss": -7.107563018798828, "global_step": 179481, "epoch": 4273} {"train_loss": -7.167320251464844, "global_step": 179482, "epoch": 4273} {"train_loss": -7.090954780578613, "global_step": 179483, "epoch": 4273} {"train_loss": -6.9781670570373535, "global_step": 179484, "epoch": 4273} {"train_loss": -6.982689380645752, "global_step": 179485, "epoch": 4273} {"train_loss": -7.08306360244751, "global_step": 179486, "epoch": 4273} {"train_loss": -7.032949924468994, "global_step": 179487, "epoch": 4273} {"train_loss": -7.059677600860596, "global_step": 179488, "epoch": 4273} {"train_loss": -6.977709770202637, "global_step": 179489, "epoch": 4273} {"train_loss": -7.046208381652832, "global_step": 179490, "epoch": 4273} {"train_loss": -7.069329261779785, "global_step": 179491, "epoch": 4273} {"train_loss": -7.044564247131348, "global_step": 179492, "epoch": 4273} {"train_loss": -7.074858665466309, "global_step": 179493, "epoch": 4273} {"train_loss": -6.992311477661133, "global_step": 179494, "epoch": 4273} {"train_loss": -7.11102819442749, "global_step": 179495, "epoch": 4273} {"train_loss": -6.965542316436768, "global_step": 179496, "epoch": 4273} {"train_loss": -7.0530548095703125, "global_step": 179497, "epoch": 4273} {"train_loss": -7.058010578155518, "global_step": 179498, "epoch": 4273} {"train_loss": -6.971924781799316, "global_step": 179499, "epoch": 4273} {"train_loss": -7.058838844299316, "global_step": 179500, "epoch": 4273} {"train_loss": -6.835897445678711, "global_step": 179501, "epoch": 4273} {"train_loss": -7.1331787109375, "global_step": 179502, "epoch": 4273} {"train_loss": -7.067143440246582, "global_step": 179503, "epoch": 4273} {"train_loss": -7.044403076171875, "global_step": 179504, "epoch": 4273} {"train_loss": -7.1056671142578125, "global_step": 179505, "epoch": 4273} {"train_loss": -6.986565113067627, "global_step": 179506, "epoch": 4273} {"train_loss": -7.044498375483921, "global_step": 179507, "epoch": 4273, "val_loss": 68868.8203125} {"train_loss": -6.942585468292236, "global_step": 179508, "epoch": 4274} {"train_loss": -6.956111907958984, "global_step": 179509, "epoch": 4274} {"train_loss": -6.991300582885742, "global_step": 179510, "epoch": 4274} {"train_loss": -6.985851287841797, "global_step": 179511, "epoch": 4274} {"train_loss": -7.107578277587891, "global_step": 179512, "epoch": 4274} {"train_loss": -6.9975080490112305, "global_step": 179513, "epoch": 4274} {"train_loss": -7.095672607421875, "global_step": 179514, "epoch": 4274} {"train_loss": -7.149051666259766, "global_step": 179515, "epoch": 4274} {"train_loss": -7.0955424308776855, "global_step": 179516, "epoch": 4274} {"train_loss": -7.165899276733398, "global_step": 179517, "epoch": 4274} {"train_loss": -7.0634236335754395, "global_step": 179518, "epoch": 4274} {"train_loss": -7.021902084350586, "global_step": 179519, "epoch": 4274} {"train_loss": -7.1334638595581055, "global_step": 179520, "epoch": 4274} {"train_loss": -7.062012672424316, "global_step": 179521, "epoch": 4274} {"train_loss": -7.048023700714111, "global_step": 179522, "epoch": 4274} {"train_loss": -7.044980049133301, "global_step": 179523, "epoch": 4274} {"train_loss": -6.903573036193848, "global_step": 179524, "epoch": 4274} {"train_loss": -7.038336277008057, "global_step": 179525, "epoch": 4274} {"train_loss": -7.018394947052002, "global_step": 179526, "epoch": 4274} {"train_loss": -6.828456878662109, "global_step": 179527, "epoch": 4274} {"train_loss": -6.900913715362549, "global_step": 179528, "epoch": 4274} {"train_loss": -6.977530479431152, "global_step": 179529, "epoch": 4274} {"train_loss": -6.940770626068115, "global_step": 179530, "epoch": 4274} {"train_loss": -7.0431013107299805, "global_step": 179531, "epoch": 4274} {"train_loss": -6.903256416320801, "global_step": 179532, "epoch": 4274} {"train_loss": -7.03160285949707, "global_step": 179533, "epoch": 4274} {"train_loss": -7.000726699829102, "global_step": 179534, "epoch": 4274} {"train_loss": -6.999407768249512, "global_step": 179535, "epoch": 4274} {"train_loss": -7.12837028503418, "global_step": 179536, "epoch": 4274} {"train_loss": -7.018587112426758, "global_step": 179537, "epoch": 4274} {"train_loss": -6.973138332366943, "global_step": 179538, "epoch": 4274} {"train_loss": -7.027530193328857, "global_step": 179539, "epoch": 4274} {"train_loss": -7.096537113189697, "global_step": 179540, "epoch": 4274} {"train_loss": -6.989855766296387, "global_step": 179541, "epoch": 4274} {"train_loss": -7.042879104614258, "global_step": 179542, "epoch": 4274} {"train_loss": -7.056267738342285, "global_step": 179543, "epoch": 4274} {"train_loss": -7.076621055603027, "global_step": 179544, "epoch": 4274} {"train_loss": -7.094738483428955, "global_step": 179545, "epoch": 4274} {"train_loss": -7.018430233001709, "global_step": 179546, "epoch": 4274} {"train_loss": -7.012167930603027, "global_step": 179547, "epoch": 4274} {"train_loss": -7.06047248840332, "global_step": 179548, "epoch": 4274} {"train_loss": -7.025720880145118, "global_step": 179549, "epoch": 4274, "val_loss": 68594.640625} {"train_loss": -7.0613908767700195, "global_step": 179550, "epoch": 4275} {"train_loss": -7.006712913513184, "global_step": 179551, "epoch": 4275} {"train_loss": -7.012790679931641, "global_step": 179552, "epoch": 4275} {"train_loss": -7.022849082946777, "global_step": 179553, "epoch": 4275} {"train_loss": -7.011192321777344, "global_step": 179554, "epoch": 4275} {"train_loss": -7.11244010925293, "global_step": 179555, "epoch": 4275} {"train_loss": -6.96272087097168, "global_step": 179556, "epoch": 4275} {"train_loss": -7.157499313354492, "global_step": 179557, "epoch": 4275} {"train_loss": -7.118205547332764, "global_step": 179558, "epoch": 4275} {"train_loss": -7.067238807678223, "global_step": 179559, "epoch": 4275} {"train_loss": -7.163366317749023, "global_step": 179560, "epoch": 4275} {"train_loss": -7.046934127807617, "global_step": 179561, "epoch": 4275} {"train_loss": -7.0234293937683105, "global_step": 179562, "epoch": 4275} {"train_loss": -7.100220680236816, "global_step": 179563, "epoch": 4275} {"train_loss": -6.984816551208496, "global_step": 179564, "epoch": 4275} {"train_loss": -7.062239646911621, "global_step": 179565, "epoch": 4275} {"train_loss": -7.184452056884766, "global_step": 179566, "epoch": 4275} {"train_loss": -7.053065299987793, "global_step": 179567, "epoch": 4275} {"train_loss": -7.200572967529297, "global_step": 179568, "epoch": 4275} {"train_loss": -7.044294834136963, "global_step": 179569, "epoch": 4275} {"train_loss": -7.205680847167969, "global_step": 179570, "epoch": 4275} {"train_loss": -7.067278861999512, "global_step": 179571, "epoch": 4275} {"train_loss": -7.029214859008789, "global_step": 179572, "epoch": 4275} {"train_loss": -7.093285083770752, "global_step": 179573, "epoch": 4275} {"train_loss": -7.119417190551758, "global_step": 179574, "epoch": 4275} {"train_loss": -6.988056659698486, "global_step": 179575, "epoch": 4275} {"train_loss": -7.083737850189209, "global_step": 179576, "epoch": 4275} {"train_loss": -7.14401912689209, "global_step": 179577, "epoch": 4275} {"train_loss": -7.060062408447266, "global_step": 179578, "epoch": 4275} {"train_loss": -6.960867881774902, "global_step": 179579, "epoch": 4275} {"train_loss": -7.031451225280762, "global_step": 179580, "epoch": 4275} {"train_loss": -7.086468696594238, "global_step": 179581, "epoch": 4275} {"train_loss": -7.100468635559082, "global_step": 179582, "epoch": 4275} {"train_loss": -7.020358562469482, "global_step": 179583, "epoch": 4275} {"train_loss": -7.138765335083008, "global_step": 179584, "epoch": 4275} {"train_loss": -7.128777980804443, "global_step": 179585, "epoch": 4275} {"train_loss": -6.983310222625732, "global_step": 179586, "epoch": 4275} {"train_loss": -6.966850280761719, "global_step": 179587, "epoch": 4275} {"train_loss": -7.037097930908203, "global_step": 179588, "epoch": 4275} {"train_loss": -6.999289512634277, "global_step": 179589, "epoch": 4275} {"train_loss": -6.9314284324646, "global_step": 179590, "epoch": 4275} {"train_loss": -7.060981852667672, "global_step": 179591, "epoch": 4275, "val_loss": 68710.4296875} {"train_loss": -6.980598449707031, "global_step": 179592, "epoch": 4276} {"train_loss": -7.1439995765686035, "global_step": 179593, "epoch": 4276} {"train_loss": -7.047253608703613, "global_step": 179594, "epoch": 4276} {"train_loss": -7.025954246520996, "global_step": 179595, "epoch": 4276} {"train_loss": -7.176342487335205, "global_step": 179596, "epoch": 4276} {"train_loss": -6.971346855163574, "global_step": 179597, "epoch": 4276} {"train_loss": -7.065975189208984, "global_step": 179598, "epoch": 4276} {"train_loss": -6.988151550292969, "global_step": 179599, "epoch": 4276} {"train_loss": -7.012609481811523, "global_step": 179600, "epoch": 4276} {"train_loss": -7.065668106079102, "global_step": 179601, "epoch": 4276} {"train_loss": -6.950881004333496, "global_step": 179602, "epoch": 4276} {"train_loss": -7.064525604248047, "global_step": 179603, "epoch": 4276} {"train_loss": -7.108093738555908, "global_step": 179604, "epoch": 4276} {"train_loss": -7.15519380569458, "global_step": 179605, "epoch": 4276} {"train_loss": -6.99180793762207, "global_step": 179606, "epoch": 4276} {"train_loss": -7.051985263824463, "global_step": 179607, "epoch": 4276} {"train_loss": -7.085478782653809, "global_step": 179608, "epoch": 4276} {"train_loss": -7.003602981567383, "global_step": 179609, "epoch": 4276} {"train_loss": -7.103689670562744, "global_step": 179610, "epoch": 4276} {"train_loss": -7.020569801330566, "global_step": 179611, "epoch": 4276} {"train_loss": -7.114813804626465, "global_step": 179612, "epoch": 4276} {"train_loss": -6.9926042556762695, "global_step": 179613, "epoch": 4276} {"train_loss": -6.923773288726807, "global_step": 179614, "epoch": 4276} {"train_loss": -7.076132297515869, "global_step": 179615, "epoch": 4276} {"train_loss": -7.089491844177246, "global_step": 179616, "epoch": 4276} {"train_loss": -7.050734043121338, "global_step": 179617, "epoch": 4276} {"train_loss": -7.079572677612305, "global_step": 179618, "epoch": 4276} {"train_loss": -7.0616888999938965, "global_step": 179619, "epoch": 4276} {"train_loss": -7.012495040893555, "global_step": 179620, "epoch": 4276} {"train_loss": -7.209034442901611, "global_step": 179621, "epoch": 4276} {"train_loss": -7.205451011657715, "global_step": 179622, "epoch": 4276} {"train_loss": -7.1616644859313965, "global_step": 179623, "epoch": 4276} {"train_loss": -7.1298723220825195, "global_step": 179624, "epoch": 4276} {"train_loss": -7.116137504577637, "global_step": 179625, "epoch": 4276} {"train_loss": -7.026487827301025, "global_step": 179626, "epoch": 4276} {"train_loss": -6.913516044616699, "global_step": 179627, "epoch": 4276} {"train_loss": -6.970254421234131, "global_step": 179628, "epoch": 4276} {"train_loss": -7.105059623718262, "global_step": 179629, "epoch": 4276} {"train_loss": -7.000884056091309, "global_step": 179630, "epoch": 4276} {"train_loss": -6.9503655433654785, "global_step": 179631, "epoch": 4276} {"train_loss": -7.091287136077881, "global_step": 179632, "epoch": 4276} {"train_loss": -7.057462453842163, "global_step": 179633, "epoch": 4276, "val_loss": 68739.8828125} {"train_loss": -6.908513069152832, "global_step": 179634, "epoch": 4277} {"train_loss": -6.957459926605225, "global_step": 179635, "epoch": 4277} {"train_loss": -7.1708269119262695, "global_step": 179636, "epoch": 4277} {"train_loss": -6.9446587562561035, "global_step": 179637, "epoch": 4277} {"train_loss": -6.870987892150879, "global_step": 179638, "epoch": 4277} {"train_loss": -7.062856674194336, "global_step": 179639, "epoch": 4277} {"train_loss": -7.0984907150268555, "global_step": 179640, "epoch": 4277} {"train_loss": -7.005825996398926, "global_step": 179641, "epoch": 4277} {"train_loss": -7.132088661193848, "global_step": 179642, "epoch": 4277} {"train_loss": -6.956240653991699, "global_step": 179643, "epoch": 4277} {"train_loss": -6.887293338775635, "global_step": 179644, "epoch": 4277} {"train_loss": -6.978062629699707, "global_step": 179645, "epoch": 4277} {"train_loss": -6.958313941955566, "global_step": 179646, "epoch": 4277} {"train_loss": -6.957367420196533, "global_step": 179647, "epoch": 4277} {"train_loss": -7.023914337158203, "global_step": 179648, "epoch": 4277} {"train_loss": -6.964733123779297, "global_step": 179649, "epoch": 4277} {"train_loss": -7.099407196044922, "global_step": 179650, "epoch": 4277} {"train_loss": -7.074090003967285, "global_step": 179651, "epoch": 4277} {"train_loss": -7.0238471031188965, "global_step": 179652, "epoch": 4277} {"train_loss": -7.09164571762085, "global_step": 179653, "epoch": 4277} {"train_loss": -7.009993553161621, "global_step": 179654, "epoch": 4277} {"train_loss": -6.982666492462158, "global_step": 179655, "epoch": 4277} {"train_loss": -7.141626358032227, "global_step": 179656, "epoch": 4277} {"train_loss": -7.097139835357666, "global_step": 179657, "epoch": 4277} {"train_loss": -7.139735698699951, "global_step": 179658, "epoch": 4277} {"train_loss": -7.002915382385254, "global_step": 179659, "epoch": 4277} {"train_loss": -7.042342185974121, "global_step": 179660, "epoch": 4277} {"train_loss": -7.090230941772461, "global_step": 179661, "epoch": 4277} {"train_loss": -6.985963821411133, "global_step": 179662, "epoch": 4277} {"train_loss": -7.163873672485352, "global_step": 179663, "epoch": 4277} {"train_loss": -7.103928089141846, "global_step": 179664, "epoch": 4277} {"train_loss": -7.023287296295166, "global_step": 179665, "epoch": 4277} {"train_loss": -7.062358856201172, "global_step": 179666, "epoch": 4277} {"train_loss": -7.100975036621094, "global_step": 179667, "epoch": 4277} {"train_loss": -6.958046913146973, "global_step": 179668, "epoch": 4277} {"train_loss": -7.030508041381836, "global_step": 179669, "epoch": 4277} {"train_loss": -7.077646732330322, "global_step": 179670, "epoch": 4277} {"train_loss": -7.122236251831055, "global_step": 179671, "epoch": 4277} {"train_loss": -7.161064147949219, "global_step": 179672, "epoch": 4277} {"train_loss": -7.028495788574219, "global_step": 179673, "epoch": 4277} {"train_loss": -7.064250946044922, "global_step": 179674, "epoch": 4277} {"train_loss": -7.03728217170352, "global_step": 179675, "epoch": 4277, "val_loss": 68638.8984375} {"train_loss": -7.133430480957031, "global_step": 179676, "epoch": 4278} {"train_loss": -7.132094383239746, "global_step": 179677, "epoch": 4278} {"train_loss": -7.011176109313965, "global_step": 179678, "epoch": 4278} {"train_loss": -7.070281982421875, "global_step": 179679, "epoch": 4278} {"train_loss": -7.193733215332031, "global_step": 179680, "epoch": 4278} {"train_loss": -7.064226150512695, "global_step": 179681, "epoch": 4278} {"train_loss": -7.055907249450684, "global_step": 179682, "epoch": 4278} {"train_loss": -7.110567092895508, "global_step": 179683, "epoch": 4278} {"train_loss": -6.9853057861328125, "global_step": 179684, "epoch": 4278} {"train_loss": -7.11366605758667, "global_step": 179685, "epoch": 4278} {"train_loss": -7.020450592041016, "global_step": 179686, "epoch": 4278} {"train_loss": -7.038965225219727, "global_step": 179687, "epoch": 4278} {"train_loss": -7.0448150634765625, "global_step": 179688, "epoch": 4278} {"train_loss": -7.224565505981445, "global_step": 179689, "epoch": 4278} {"train_loss": -7.157137870788574, "global_step": 179690, "epoch": 4278} {"train_loss": -7.0800042152404785, "global_step": 179691, "epoch": 4278} {"train_loss": -6.974043846130371, "global_step": 179692, "epoch": 4278} {"train_loss": -7.082345008850098, "global_step": 179693, "epoch": 4278} {"train_loss": -7.229870796203613, "global_step": 179694, "epoch": 4278} {"train_loss": -7.101444244384766, "global_step": 179695, "epoch": 4278} {"train_loss": -7.118601322174072, "global_step": 179696, "epoch": 4278} {"train_loss": -7.129490852355957, "global_step": 179697, "epoch": 4278} {"train_loss": -7.1259379386901855, "global_step": 179698, "epoch": 4278} {"train_loss": -7.2083587646484375, "global_step": 179699, "epoch": 4278} {"train_loss": -7.061480522155762, "global_step": 179700, "epoch": 4278} {"train_loss": -7.262976169586182, "global_step": 179701, "epoch": 4278} {"train_loss": -7.084981918334961, "global_step": 179702, "epoch": 4278} {"train_loss": -7.029060363769531, "global_step": 179703, "epoch": 4278} {"train_loss": -7.081297397613525, "global_step": 179704, "epoch": 4278} {"train_loss": -7.164283752441406, "global_step": 179705, "epoch": 4278} {"train_loss": -7.049304962158203, "global_step": 179706, "epoch": 4278} {"train_loss": -6.89603853225708, "global_step": 179707, "epoch": 4278} {"train_loss": -6.921954154968262, "global_step": 179708, "epoch": 4278} {"train_loss": -6.861756324768066, "global_step": 179709, "epoch": 4278} {"train_loss": -7.129565238952637, "global_step": 179710, "epoch": 4278} {"train_loss": -6.947714805603027, "global_step": 179711, "epoch": 4278} {"train_loss": -6.969308853149414, "global_step": 179712, "epoch": 4278} {"train_loss": -7.066830635070801, "global_step": 179713, "epoch": 4278} {"train_loss": -6.982485294342041, "global_step": 179714, "epoch": 4278} {"train_loss": -7.10172176361084, "global_step": 179715, "epoch": 4278} {"train_loss": -6.886601448059082, "global_step": 179716, "epoch": 4278} {"train_loss": -7.06858552069891, "global_step": 179717, "epoch": 4278, "val_loss": 68835.6328125} {"train_loss": -6.982220649719238, "global_step": 179718, "epoch": 4279} {"train_loss": -6.895617485046387, "global_step": 179719, "epoch": 4279} {"train_loss": -7.067867279052734, "global_step": 179720, "epoch": 4279} {"train_loss": -6.942574501037598, "global_step": 179721, "epoch": 4279} {"train_loss": -7.015739440917969, "global_step": 179722, "epoch": 4279} {"train_loss": -7.049790382385254, "global_step": 179723, "epoch": 4279} {"train_loss": -7.008264064788818, "global_step": 179724, "epoch": 4279} {"train_loss": -6.976988792419434, "global_step": 179725, "epoch": 4279} {"train_loss": -7.0633649826049805, "global_step": 179726, "epoch": 4279} {"train_loss": -7.074010848999023, "global_step": 179727, "epoch": 4279} {"train_loss": -7.056110382080078, "global_step": 179728, "epoch": 4279} {"train_loss": -7.009542942047119, "global_step": 179729, "epoch": 4279} {"train_loss": -7.0924177169799805, "global_step": 179730, "epoch": 4279} {"train_loss": -7.052553176879883, "global_step": 179731, "epoch": 4279} {"train_loss": -6.976871013641357, "global_step": 179732, "epoch": 4279} {"train_loss": -7.116861343383789, "global_step": 179733, "epoch": 4279} {"train_loss": -7.038827896118164, "global_step": 179734, "epoch": 4279} {"train_loss": -7.192989349365234, "global_step": 179735, "epoch": 4279} {"train_loss": -7.098908424377441, "global_step": 179736, "epoch": 4279} {"train_loss": -7.106220245361328, "global_step": 179737, "epoch": 4279} {"train_loss": -7.046635627746582, "global_step": 179738, "epoch": 4279} {"train_loss": -7.1286516189575195, "global_step": 179739, "epoch": 4279} {"train_loss": -7.111948013305664, "global_step": 179740, "epoch": 4279} {"train_loss": -7.150460720062256, "global_step": 179741, "epoch": 4279} {"train_loss": -7.040157318115234, "global_step": 179742, "epoch": 4279} {"train_loss": -7.095356464385986, "global_step": 179743, "epoch": 4279} {"train_loss": -7.200177192687988, "global_step": 179744, "epoch": 4279} {"train_loss": -7.027672290802002, "global_step": 179745, "epoch": 4279} {"train_loss": -7.101746559143066, "global_step": 179746, "epoch": 4279} {"train_loss": -7.21142053604126, "global_step": 179747, "epoch": 4279} {"train_loss": -7.006958961486816, "global_step": 179748, "epoch": 4279} {"train_loss": -7.156496047973633, "global_step": 179749, "epoch": 4279} {"train_loss": -7.043791770935059, "global_step": 179750, "epoch": 4279} {"train_loss": -7.031569480895996, "global_step": 179751, "epoch": 4279} {"train_loss": -7.092818737030029, "global_step": 179752, "epoch": 4279} {"train_loss": -6.987142086029053, "global_step": 179753, "epoch": 4279} {"train_loss": -7.010307312011719, "global_step": 179754, "epoch": 4279} {"train_loss": -7.117660045623779, "global_step": 179755, "epoch": 4279} {"train_loss": -6.991484642028809, "global_step": 179756, "epoch": 4279} {"train_loss": -7.125998497009277, "global_step": 179757, "epoch": 4279} {"train_loss": -7.088809967041016, "global_step": 179758, "epoch": 4279} {"train_loss": -7.061265400477818, "global_step": 179759, "epoch": 4279, "val_loss": 68941.546875} {"train_loss": -7.082000255584717, "global_step": 179760, "epoch": 4280} {"train_loss": -7.118669509887695, "global_step": 179761, "epoch": 4280} {"train_loss": -7.093095779418945, "global_step": 179762, "epoch": 4280} {"train_loss": -7.122193336486816, "global_step": 179763, "epoch": 4280} {"train_loss": -7.073769569396973, "global_step": 179764, "epoch": 4280} {"train_loss": -7.0825090408325195, "global_step": 179765, "epoch": 4280} {"train_loss": -6.991143226623535, "global_step": 179766, "epoch": 4280} {"train_loss": -7.0278520584106445, "global_step": 179767, "epoch": 4280} {"train_loss": -7.040205955505371, "global_step": 179768, "epoch": 4280} {"train_loss": -7.046498775482178, "global_step": 179769, "epoch": 4280} {"train_loss": -7.123781204223633, "global_step": 179770, "epoch": 4280} {"train_loss": -7.081892013549805, "global_step": 179771, "epoch": 4280} {"train_loss": -7.13381290435791, "global_step": 179772, "epoch": 4280} {"train_loss": -7.131083965301514, "global_step": 179773, "epoch": 4280} {"train_loss": -7.149524211883545, "global_step": 179774, "epoch": 4280} {"train_loss": -7.087388515472412, "global_step": 179775, "epoch": 4280} {"train_loss": -7.113898277282715, "global_step": 179776, "epoch": 4280} {"train_loss": -7.09371280670166, "global_step": 179777, "epoch": 4280} {"train_loss": -6.969324111938477, "global_step": 179778, "epoch": 4280} {"train_loss": -6.9744038581848145, "global_step": 179779, "epoch": 4280} {"train_loss": -7.079570770263672, "global_step": 179780, "epoch": 4280} {"train_loss": -7.147968292236328, "global_step": 179781, "epoch": 4280} {"train_loss": -6.999283313751221, "global_step": 179782, "epoch": 4280} {"train_loss": -7.034531593322754, "global_step": 179783, "epoch": 4280} {"train_loss": -7.0953240394592285, "global_step": 179784, "epoch": 4280} {"train_loss": -7.061918258666992, "global_step": 179785, "epoch": 4280} {"train_loss": -7.182009696960449, "global_step": 179786, "epoch": 4280} {"train_loss": -7.079254150390625, "global_step": 179787, "epoch": 4280} {"train_loss": -7.231487274169922, "global_step": 179788, "epoch": 4280} {"train_loss": -7.14138650894165, "global_step": 179789, "epoch": 4280} {"train_loss": -7.117425918579102, "global_step": 179790, "epoch": 4280} {"train_loss": -7.146315097808838, "global_step": 179791, "epoch": 4280} {"train_loss": -7.075909614562988, "global_step": 179792, "epoch": 4280} {"train_loss": -7.127834320068359, "global_step": 179793, "epoch": 4280} {"train_loss": -7.220856666564941, "global_step": 179794, "epoch": 4280} {"train_loss": -7.0477070808410645, "global_step": 179795, "epoch": 4280} {"train_loss": -7.146014213562012, "global_step": 179796, "epoch": 4280} {"train_loss": -6.9949798583984375, "global_step": 179797, "epoch": 4280} {"train_loss": -6.9791154861450195, "global_step": 179798, "epoch": 4280} {"train_loss": -7.074407577514648, "global_step": 179799, "epoch": 4280} {"train_loss": -7.08432674407959, "global_step": 179800, "epoch": 4280} {"train_loss": -7.084914638882592, "global_step": 179801, "epoch": 4280, "val_loss": 68589.78125} {"train_loss": -7.084171772003174, "global_step": 179802, "epoch": 4281} {"train_loss": -7.074831962585449, "global_step": 179803, "epoch": 4281} {"train_loss": -7.071582794189453, "global_step": 179804, "epoch": 4281} {"train_loss": -7.078816890716553, "global_step": 179805, "epoch": 4281} {"train_loss": -7.025361061096191, "global_step": 179806, "epoch": 4281} {"train_loss": -6.956081390380859, "global_step": 179807, "epoch": 4281} {"train_loss": -6.945034980773926, "global_step": 179808, "epoch": 4281} {"train_loss": -7.055575370788574, "global_step": 179809, "epoch": 4281} {"train_loss": -6.910996437072754, "global_step": 179810, "epoch": 4281} {"train_loss": -6.980662822723389, "global_step": 179811, "epoch": 4281} {"train_loss": -6.920952796936035, "global_step": 179812, "epoch": 4281} {"train_loss": -7.037954807281494, "global_step": 179813, "epoch": 4281} {"train_loss": -6.982553005218506, "global_step": 179814, "epoch": 4281} {"train_loss": -6.984500885009766, "global_step": 179815, "epoch": 4281} {"train_loss": -7.130786895751953, "global_step": 179816, "epoch": 4281} {"train_loss": -6.948489189147949, "global_step": 179817, "epoch": 4281} {"train_loss": -7.030002593994141, "global_step": 179818, "epoch": 4281} {"train_loss": -7.048723220825195, "global_step": 179819, "epoch": 4281} {"train_loss": -7.154953956604004, "global_step": 179820, "epoch": 4281} {"train_loss": -6.919920921325684, "global_step": 179821, "epoch": 4281} {"train_loss": -6.947491645812988, "global_step": 179822, "epoch": 4281} {"train_loss": -7.005922794342041, "global_step": 179823, "epoch": 4281} {"train_loss": -6.970508098602295, "global_step": 179824, "epoch": 4281} {"train_loss": -6.964877128601074, "global_step": 179825, "epoch": 4281} {"train_loss": -6.972881317138672, "global_step": 179826, "epoch": 4281} {"train_loss": -6.974394798278809, "global_step": 179827, "epoch": 4281} {"train_loss": -6.9289937019348145, "global_step": 179828, "epoch": 4281} {"train_loss": -7.0609540939331055, "global_step": 179829, "epoch": 4281} {"train_loss": -6.961935520172119, "global_step": 179830, "epoch": 4281} {"train_loss": -7.0580735206604, "global_step": 179831, "epoch": 4281} {"train_loss": -7.016869068145752, "global_step": 179832, "epoch": 4281} {"train_loss": -6.97943115234375, "global_step": 179833, "epoch": 4281} {"train_loss": -7.005468368530273, "global_step": 179834, "epoch": 4281} {"train_loss": -7.0036492347717285, "global_step": 179835, "epoch": 4281} {"train_loss": -7.048915863037109, "global_step": 179836, "epoch": 4281} {"train_loss": -6.993708610534668, "global_step": 179837, "epoch": 4281} {"train_loss": -7.108611106872559, "global_step": 179838, "epoch": 4281} {"train_loss": -7.077101230621338, "global_step": 179839, "epoch": 4281} {"train_loss": -7.047418594360352, "global_step": 179840, "epoch": 4281} {"train_loss": -7.04286527633667, "global_step": 179841, "epoch": 4281} {"train_loss": -6.9933881759643555, "global_step": 179842, "epoch": 4281} {"train_loss": -7.014180864606585, "global_step": 179843, "epoch": 4281, "val_loss": 68731.0546875} {"train_loss": -7.006499767303467, "global_step": 179844, "epoch": 4282} {"train_loss": -6.949855327606201, "global_step": 179845, "epoch": 4282} {"train_loss": -7.065729141235352, "global_step": 179846, "epoch": 4282} {"train_loss": -7.127755641937256, "global_step": 179847, "epoch": 4282} {"train_loss": -7.10014533996582, "global_step": 179848, "epoch": 4282} {"train_loss": -6.925149440765381, "global_step": 179849, "epoch": 4282} {"train_loss": -7.031279563903809, "global_step": 179850, "epoch": 4282} {"train_loss": -7.08393669128418, "global_step": 179851, "epoch": 4282} {"train_loss": -7.078161239624023, "global_step": 179852, "epoch": 4282} {"train_loss": -7.001531600952148, "global_step": 179853, "epoch": 4282} {"train_loss": -6.996881484985352, "global_step": 179854, "epoch": 4282} {"train_loss": -7.068216323852539, "global_step": 179855, "epoch": 4282} {"train_loss": -7.0050435066223145, "global_step": 179856, "epoch": 4282} {"train_loss": -7.020226001739502, "global_step": 179857, "epoch": 4282} {"train_loss": -7.073557376861572, "global_step": 179858, "epoch": 4282} {"train_loss": -7.103872776031494, "global_step": 179859, "epoch": 4282} {"train_loss": -7.058051109313965, "global_step": 179860, "epoch": 4282} {"train_loss": -7.036769390106201, "global_step": 179861, "epoch": 4282} {"train_loss": -7.08837890625, "global_step": 179862, "epoch": 4282} {"train_loss": -7.146926403045654, "global_step": 179863, "epoch": 4282} {"train_loss": -6.998456001281738, "global_step": 179864, "epoch": 4282} {"train_loss": -7.10322904586792, "global_step": 179865, "epoch": 4282} {"train_loss": -7.164865970611572, "global_step": 179866, "epoch": 4282} {"train_loss": -7.102363109588623, "global_step": 179867, "epoch": 4282} {"train_loss": -7.026251316070557, "global_step": 179868, "epoch": 4282} {"train_loss": -7.154423236846924, "global_step": 179869, "epoch": 4282} {"train_loss": -7.096210479736328, "global_step": 179870, "epoch": 4282} {"train_loss": -7.130385398864746, "global_step": 179871, "epoch": 4282} {"train_loss": -7.059803009033203, "global_step": 179872, "epoch": 4282} {"train_loss": -7.186091423034668, "global_step": 179873, "epoch": 4282} {"train_loss": -7.015379905700684, "global_step": 179874, "epoch": 4282} {"train_loss": -7.133746147155762, "global_step": 179875, "epoch": 4282} {"train_loss": -7.089463233947754, "global_step": 179876, "epoch": 4282} {"train_loss": -7.175215721130371, "global_step": 179877, "epoch": 4282} {"train_loss": -7.140105247497559, "global_step": 179878, "epoch": 4282} {"train_loss": -7.061062812805176, "global_step": 179879, "epoch": 4282} {"train_loss": -7.201382637023926, "global_step": 179880, "epoch": 4282} {"train_loss": -7.114750862121582, "global_step": 179881, "epoch": 4282} {"train_loss": -7.128415107727051, "global_step": 179882, "epoch": 4282} {"train_loss": -7.066619873046875, "global_step": 179883, "epoch": 4282} {"train_loss": -7.132080078125, "global_step": 179884, "epoch": 4282} {"train_loss": -7.081787779217675, "global_step": 179885, "epoch": 4282, "val_loss": 68884.0546875} {"train_loss": -7.119499683380127, "global_step": 179886, "epoch": 4283} {"train_loss": -7.043078422546387, "global_step": 179887, "epoch": 4283} {"train_loss": -7.077019691467285, "global_step": 179888, "epoch": 4283} {"train_loss": -7.047741413116455, "global_step": 179889, "epoch": 4283} {"train_loss": -7.006292343139648, "global_step": 179890, "epoch": 4283} {"train_loss": -6.977347373962402, "global_step": 179891, "epoch": 4283} {"train_loss": -7.071862697601318, "global_step": 179892, "epoch": 4283} {"train_loss": -7.061113357543945, "global_step": 179893, "epoch": 4283} {"train_loss": -7.114139556884766, "global_step": 179894, "epoch": 4283} {"train_loss": -7.05911922454834, "global_step": 179895, "epoch": 4283} {"train_loss": -7.0933051109313965, "global_step": 179896, "epoch": 4283} {"train_loss": -7.079868316650391, "global_step": 179897, "epoch": 4283} {"train_loss": -7.143287181854248, "global_step": 179898, "epoch": 4283} {"train_loss": -7.147186279296875, "global_step": 179899, "epoch": 4283} {"train_loss": -7.096050262451172, "global_step": 179900, "epoch": 4283} {"train_loss": -7.063407897949219, "global_step": 179901, "epoch": 4283} {"train_loss": -6.971663475036621, "global_step": 179902, "epoch": 4283} {"train_loss": -7.123420715332031, "global_step": 179903, "epoch": 4283} {"train_loss": -7.123271465301514, "global_step": 179904, "epoch": 4283} {"train_loss": -6.9859466552734375, "global_step": 179905, "epoch": 4283} {"train_loss": -7.0678606033325195, "global_step": 179906, "epoch": 4283} {"train_loss": -7.035674571990967, "global_step": 179907, "epoch": 4283} {"train_loss": -7.033237457275391, "global_step": 179908, "epoch": 4283} {"train_loss": -7.032403945922852, "global_step": 179909, "epoch": 4283} {"train_loss": -7.080813407897949, "global_step": 179910, "epoch": 4283} {"train_loss": -6.985937118530273, "global_step": 179911, "epoch": 4283} {"train_loss": -7.100196838378906, "global_step": 179912, "epoch": 4283} {"train_loss": -6.871319770812988, "global_step": 179913, "epoch": 4283} {"train_loss": -6.953775405883789, "global_step": 179914, "epoch": 4283} {"train_loss": -7.03532075881958, "global_step": 179915, "epoch": 4283} {"train_loss": -7.012447357177734, "global_step": 179916, "epoch": 4283} {"train_loss": -7.0066680908203125, "global_step": 179917, "epoch": 4283} {"train_loss": -6.979865550994873, "global_step": 179918, "epoch": 4283} {"train_loss": -6.799314498901367, "global_step": 179919, "epoch": 4283} {"train_loss": -7.059315204620361, "global_step": 179920, "epoch": 4283} {"train_loss": -6.905824661254883, "global_step": 179921, "epoch": 4283} {"train_loss": -6.936190605163574, "global_step": 179922, "epoch": 4283} {"train_loss": -6.937580108642578, "global_step": 179923, "epoch": 4283} {"train_loss": -7.064598560333252, "global_step": 179924, "epoch": 4283} {"train_loss": -6.992677688598633, "global_step": 179925, "epoch": 4283} {"train_loss": -6.998757362365723, "global_step": 179926, "epoch": 4283} {"train_loss": -7.031577791486468, "global_step": 179927, "epoch": 4283, "val_loss": 68673.484375} {"train_loss": -7.005814552307129, "global_step": 179928, "epoch": 4284} {"train_loss": -6.943154811859131, "global_step": 179929, "epoch": 4284} {"train_loss": -6.9551682472229, "global_step": 179930, "epoch": 4284} {"train_loss": -7.077358245849609, "global_step": 179931, "epoch": 4284} {"train_loss": -6.887733459472656, "global_step": 179932, "epoch": 4284} {"train_loss": -7.006488800048828, "global_step": 179933, "epoch": 4284} {"train_loss": -6.950450420379639, "global_step": 179934, "epoch": 4284} {"train_loss": -7.069433689117432, "global_step": 179935, "epoch": 4284} {"train_loss": -7.004692077636719, "global_step": 179936, "epoch": 4284} {"train_loss": -7.004307746887207, "global_step": 179937, "epoch": 4284} {"train_loss": -6.9502854347229, "global_step": 179938, "epoch": 4284} {"train_loss": -6.950077056884766, "global_step": 179939, "epoch": 4284} {"train_loss": -7.085628986358643, "global_step": 179940, "epoch": 4284} {"train_loss": -7.040722846984863, "global_step": 179941, "epoch": 4284} {"train_loss": -7.112405300140381, "global_step": 179942, "epoch": 4284} {"train_loss": -7.005406379699707, "global_step": 179943, "epoch": 4284} {"train_loss": -7.05836296081543, "global_step": 179944, "epoch": 4284} {"train_loss": -7.074099063873291, "global_step": 179945, "epoch": 4284} {"train_loss": -7.07867956161499, "global_step": 179946, "epoch": 4284} {"train_loss": -7.099344253540039, "global_step": 179947, "epoch": 4284} {"train_loss": -7.127813339233398, "global_step": 179948, "epoch": 4284} {"train_loss": -7.1699628829956055, "global_step": 179949, "epoch": 4284} {"train_loss": -7.079240798950195, "global_step": 179950, "epoch": 4284} {"train_loss": -7.001091957092285, "global_step": 179951, "epoch": 4284} {"train_loss": -7.075958728790283, "global_step": 179952, "epoch": 4284} {"train_loss": -7.104104995727539, "global_step": 179953, "epoch": 4284} {"train_loss": -7.152666091918945, "global_step": 179954, "epoch": 4284} {"train_loss": -7.065493583679199, "global_step": 179955, "epoch": 4284} {"train_loss": -7.197792053222656, "global_step": 179956, "epoch": 4284} {"train_loss": -7.011736869812012, "global_step": 179957, "epoch": 4284} {"train_loss": -7.070977210998535, "global_step": 179958, "epoch": 4284} {"train_loss": -7.078503131866455, "global_step": 179959, "epoch": 4284} {"train_loss": -6.952445983886719, "global_step": 179960, "epoch": 4284} {"train_loss": -7.012932777404785, "global_step": 179961, "epoch": 4284} {"train_loss": -7.060712814331055, "global_step": 179962, "epoch": 4284} {"train_loss": -7.042993068695068, "global_step": 179963, "epoch": 4284} {"train_loss": -6.970015525817871, "global_step": 179964, "epoch": 4284} {"train_loss": -6.94178581237793, "global_step": 179965, "epoch": 4284} {"train_loss": -7.017415523529053, "global_step": 179966, "epoch": 4284} {"train_loss": -6.934074878692627, "global_step": 179967, "epoch": 4284} {"train_loss": -7.0717878341674805, "global_step": 179968, "epoch": 4284} {"train_loss": -7.0373481795901345, "global_step": 179969, "epoch": 4284, "val_loss": 68653.5234375} {"train_loss": -7.047595500946045, "global_step": 179970, "epoch": 4285} {"train_loss": -6.9996657371521, "global_step": 179971, "epoch": 4285} {"train_loss": -7.002614974975586, "global_step": 179972, "epoch": 4285} {"train_loss": -7.005020618438721, "global_step": 179973, "epoch": 4285} {"train_loss": -7.078807830810547, "global_step": 179974, "epoch": 4285} {"train_loss": -7.236163139343262, "global_step": 179975, "epoch": 4285} {"train_loss": -7.209777355194092, "global_step": 179976, "epoch": 4285} {"train_loss": -7.12354850769043, "global_step": 179977, "epoch": 4285} {"train_loss": -7.121750831604004, "global_step": 179978, "epoch": 4285} {"train_loss": -7.182014465332031, "global_step": 179979, "epoch": 4285} {"train_loss": -7.1710710525512695, "global_step": 179980, "epoch": 4285} {"train_loss": -7.10512638092041, "global_step": 179981, "epoch": 4285} {"train_loss": -7.046602725982666, "global_step": 179982, "epoch": 4285} {"train_loss": -7.1214704513549805, "global_step": 179983, "epoch": 4285} {"train_loss": -7.164078712463379, "global_step": 179984, "epoch": 4285} {"train_loss": -7.135507106781006, "global_step": 179985, "epoch": 4285} {"train_loss": -7.097883701324463, "global_step": 179986, "epoch": 4285} {"train_loss": -7.17875337600708, "global_step": 179987, "epoch": 4285} {"train_loss": -6.9622602462768555, "global_step": 179988, "epoch": 4285} {"train_loss": -7.148407459259033, "global_step": 179989, "epoch": 4285} {"train_loss": -7.29537296295166, "global_step": 179990, "epoch": 4285} {"train_loss": -7.0890302658081055, "global_step": 179991, "epoch": 4285} {"train_loss": -7.061868667602539, "global_step": 179992, "epoch": 4285} {"train_loss": -7.138136386871338, "global_step": 179993, "epoch": 4285} {"train_loss": -7.115594863891602, "global_step": 179994, "epoch": 4285} {"train_loss": -7.074957847595215, "global_step": 179995, "epoch": 4285} {"train_loss": -7.104258060455322, "global_step": 179996, "epoch": 4285} {"train_loss": -7.014535903930664, "global_step": 179997, "epoch": 4285} {"train_loss": -6.981901168823242, "global_step": 179998, "epoch": 4285} {"train_loss": -7.147419452667236, "global_step": 179999, "epoch": 4285} {"train_loss": -7.067743301391602, "global_step": 180000, "epoch": 4285} {"train_loss": -6.987746238708496, "global_step": 180001, "epoch": 4285} {"train_loss": -7.019442558288574, "global_step": 180002, "epoch": 4285} {"train_loss": -7.068617820739746, "global_step": 180003, "epoch": 4285} {"train_loss": -6.973989486694336, "global_step": 180004, "epoch": 4285} {"train_loss": -7.120700359344482, "global_step": 180005, "epoch": 4285} {"train_loss": -7.006667137145996, "global_step": 180006, "epoch": 4285} {"train_loss": -7.029574394226074, "global_step": 180007, "epoch": 4285} {"train_loss": -7.146181106567383, "global_step": 180008, "epoch": 4285} {"train_loss": -7.078147888183594, "global_step": 180009, "epoch": 4285} {"train_loss": -6.9570698738098145, "global_step": 180010, "epoch": 4285} {"train_loss": -7.08641098794483, "global_step": 180011, "epoch": 4285, "val_loss": 68716.9453125} {"train_loss": -6.9529829025268555, "global_step": 180012, "epoch": 4286} {"train_loss": -7.148383617401123, "global_step": 180013, "epoch": 4286} {"train_loss": -7.0561628341674805, "global_step": 180014, "epoch": 4286} {"train_loss": -6.970808982849121, "global_step": 180015, "epoch": 4286} {"train_loss": -7.148324012756348, "global_step": 180016, "epoch": 4286} {"train_loss": -6.966040134429932, "global_step": 180017, "epoch": 4286} {"train_loss": -7.182158470153809, "global_step": 180018, "epoch": 4286} {"train_loss": -7.1021294593811035, "global_step": 180019, "epoch": 4286} {"train_loss": -7.18105411529541, "global_step": 180020, "epoch": 4286} {"train_loss": -7.228426933288574, "global_step": 180021, "epoch": 4286} {"train_loss": -7.226809501647949, "global_step": 180022, "epoch": 4286} {"train_loss": -7.110387802124023, "global_step": 180023, "epoch": 4286} {"train_loss": -7.117006778717041, "global_step": 180024, "epoch": 4286} {"train_loss": -7.061563014984131, "global_step": 180025, "epoch": 4286} {"train_loss": -7.1092448234558105, "global_step": 180026, "epoch": 4286} {"train_loss": -7.160253047943115, "global_step": 180027, "epoch": 4286} {"train_loss": -7.111696243286133, "global_step": 180028, "epoch": 4286} {"train_loss": -7.067190647125244, "global_step": 180029, "epoch": 4286} {"train_loss": -7.142736911773682, "global_step": 180030, "epoch": 4286} {"train_loss": -7.052063465118408, "global_step": 180031, "epoch": 4286} {"train_loss": -7.196898460388184, "global_step": 180032, "epoch": 4286} {"train_loss": -7.075813293457031, "global_step": 180033, "epoch": 4286} {"train_loss": -7.135061264038086, "global_step": 180034, "epoch": 4286} {"train_loss": -7.01279354095459, "global_step": 180035, "epoch": 4286} {"train_loss": -6.992786407470703, "global_step": 180036, "epoch": 4286} {"train_loss": -7.047798156738281, "global_step": 180037, "epoch": 4286} {"train_loss": -6.957517623901367, "global_step": 180038, "epoch": 4286} {"train_loss": -7.008970737457275, "global_step": 180039, "epoch": 4286} {"train_loss": -6.717432975769043, "global_step": 180040, "epoch": 4286} {"train_loss": -6.909152030944824, "global_step": 180041, "epoch": 4286} {"train_loss": -7.056212902069092, "global_step": 180042, "epoch": 4286} {"train_loss": -6.999917507171631, "global_step": 180043, "epoch": 4286} {"train_loss": -7.072572231292725, "global_step": 180044, "epoch": 4286} {"train_loss": -7.007815361022949, "global_step": 180045, "epoch": 4286} {"train_loss": -6.935864448547363, "global_step": 180046, "epoch": 4286} {"train_loss": -7.003523826599121, "global_step": 180047, "epoch": 4286} {"train_loss": -6.9442667961120605, "global_step": 180048, "epoch": 4286} {"train_loss": -6.921136856079102, "global_step": 180049, "epoch": 4286} {"train_loss": -6.983096599578857, "global_step": 180050, "epoch": 4286} {"train_loss": -6.9337663650512695, "global_step": 180051, "epoch": 4286} {"train_loss": -6.946451187133789, "global_step": 180052, "epoch": 4286} {"train_loss": -7.047850779124668, "global_step": 180053, "epoch": 4286, "val_loss": 68743.03125} {"train_loss": -7.044195175170898, "global_step": 180054, "epoch": 4287} {"train_loss": -6.97435188293457, "global_step": 180055, "epoch": 4287} {"train_loss": -6.93837833404541, "global_step": 180056, "epoch": 4287} {"train_loss": -7.181846618652344, "global_step": 180057, "epoch": 4287} {"train_loss": -6.9107513427734375, "global_step": 180058, "epoch": 4287} {"train_loss": -7.108724594116211, "global_step": 180059, "epoch": 4287} {"train_loss": -6.983004570007324, "global_step": 180060, "epoch": 4287} {"train_loss": -7.100019454956055, "global_step": 180061, "epoch": 4287} {"train_loss": -7.105528831481934, "global_step": 180062, "epoch": 4287} {"train_loss": -6.97740364074707, "global_step": 180063, "epoch": 4287} {"train_loss": -7.017545700073242, "global_step": 180064, "epoch": 4287} {"train_loss": -7.025757789611816, "global_step": 180065, "epoch": 4287} {"train_loss": -7.052644729614258, "global_step": 180066, "epoch": 4287} {"train_loss": -7.152151107788086, "global_step": 180067, "epoch": 4287} {"train_loss": -7.07646369934082, "global_step": 180068, "epoch": 4287} {"train_loss": -7.085094451904297, "global_step": 180069, "epoch": 4287} {"train_loss": -7.061199188232422, "global_step": 180070, "epoch": 4287} {"train_loss": -7.126679420471191, "global_step": 180071, "epoch": 4287} {"train_loss": -7.034487247467041, "global_step": 180072, "epoch": 4287} {"train_loss": -7.037764549255371, "global_step": 180073, "epoch": 4287} {"train_loss": -7.216594219207764, "global_step": 180074, "epoch": 4287} {"train_loss": -7.06710958480835, "global_step": 180075, "epoch": 4287} {"train_loss": -7.067236423492432, "global_step": 180076, "epoch": 4287} {"train_loss": -7.055263519287109, "global_step": 180077, "epoch": 4287} {"train_loss": -7.187152862548828, "global_step": 180078, "epoch": 4287} {"train_loss": -7.22226619720459, "global_step": 180079, "epoch": 4287} {"train_loss": -7.07180118560791, "global_step": 180080, "epoch": 4287} {"train_loss": -7.066104888916016, "global_step": 180081, "epoch": 4287} {"train_loss": -7.0558929443359375, "global_step": 180082, "epoch": 4287} {"train_loss": -7.126984119415283, "global_step": 180083, "epoch": 4287} {"train_loss": -6.937503814697266, "global_step": 180084, "epoch": 4287} {"train_loss": -7.130249977111816, "global_step": 180085, "epoch": 4287} {"train_loss": -7.071203708648682, "global_step": 180086, "epoch": 4287} {"train_loss": -7.0491814613342285, "global_step": 180087, "epoch": 4287} {"train_loss": -6.994749069213867, "global_step": 180088, "epoch": 4287} {"train_loss": -7.0882487297058105, "global_step": 180089, "epoch": 4287} {"train_loss": -7.1364054679870605, "global_step": 180090, "epoch": 4287} {"train_loss": -7.123781681060791, "global_step": 180091, "epoch": 4287} {"train_loss": -7.020837783813477, "global_step": 180092, "epoch": 4287} {"train_loss": -7.104609489440918, "global_step": 180093, "epoch": 4287} {"train_loss": -7.044666290283203, "global_step": 180094, "epoch": 4287} {"train_loss": -7.0719131742204935, "global_step": 180095, "epoch": 4287, "val_loss": 68838.609375} {"train_loss": -6.890139579772949, "global_step": 180096, "epoch": 4288} {"train_loss": -7.020784378051758, "global_step": 180097, "epoch": 4288} {"train_loss": -7.087130069732666, "global_step": 180098, "epoch": 4288} {"train_loss": -7.094429969787598, "global_step": 180099, "epoch": 4288} {"train_loss": -7.161898136138916, "global_step": 180100, "epoch": 4288} {"train_loss": -6.938096523284912, "global_step": 180101, "epoch": 4288} {"train_loss": -6.987771511077881, "global_step": 180102, "epoch": 4288} {"train_loss": -6.952566146850586, "global_step": 180103, "epoch": 4288} {"train_loss": -6.974581241607666, "global_step": 180104, "epoch": 4288} {"train_loss": -6.929103374481201, "global_step": 180105, "epoch": 4288} {"train_loss": -7.00518798828125, "global_step": 180106, "epoch": 4288} {"train_loss": -6.950668811798096, "global_step": 180107, "epoch": 4288} {"train_loss": -6.959507942199707, "global_step": 180108, "epoch": 4288} {"train_loss": -7.017451763153076, "global_step": 180109, "epoch": 4288} {"train_loss": -7.078216552734375, "global_step": 180110, "epoch": 4288} {"train_loss": -7.057129859924316, "global_step": 180111, "epoch": 4288} {"train_loss": -6.936707973480225, "global_step": 180112, "epoch": 4288} {"train_loss": -7.049485683441162, "global_step": 180113, "epoch": 4288} {"train_loss": -7.051076412200928, "global_step": 180114, "epoch": 4288} {"train_loss": -7.010102272033691, "global_step": 180115, "epoch": 4288} {"train_loss": -7.075772762298584, "global_step": 180116, "epoch": 4288} {"train_loss": -6.9024763107299805, "global_step": 180117, "epoch": 4288} {"train_loss": -7.045112609863281, "global_step": 180118, "epoch": 4288} {"train_loss": -7.083334922790527, "global_step": 180119, "epoch": 4288} {"train_loss": -6.915858268737793, "global_step": 180120, "epoch": 4288} {"train_loss": -6.976455211639404, "global_step": 180121, "epoch": 4288} {"train_loss": -6.878580093383789, "global_step": 180122, "epoch": 4288} {"train_loss": -6.94487190246582, "global_step": 180123, "epoch": 4288} {"train_loss": -7.052465915679932, "global_step": 180124, "epoch": 4288} {"train_loss": -6.97502326965332, "global_step": 180125, "epoch": 4288} {"train_loss": -6.933381080627441, "global_step": 180126, "epoch": 4288} {"train_loss": -6.897299766540527, "global_step": 180127, "epoch": 4288} {"train_loss": -6.953825950622559, "global_step": 180128, "epoch": 4288} {"train_loss": -6.954668045043945, "global_step": 180129, "epoch": 4288} {"train_loss": -7.041009902954102, "global_step": 180130, "epoch": 4288} {"train_loss": -6.9308624267578125, "global_step": 180131, "epoch": 4288} {"train_loss": -6.951885223388672, "global_step": 180132, "epoch": 4288} {"train_loss": -6.907964706420898, "global_step": 180133, "epoch": 4288} {"train_loss": -7.073032379150391, "global_step": 180134, "epoch": 4288} {"train_loss": -7.008296012878418, "global_step": 180135, "epoch": 4288} {"train_loss": -7.059974670410156, "global_step": 180136, "epoch": 4288} {"train_loss": -6.994329543340774, "global_step": 180137, "epoch": 4288, "val_loss": 68910.1015625} {"train_loss": -6.991890907287598, "global_step": 180138, "epoch": 4289} {"train_loss": -6.951709747314453, "global_step": 180139, "epoch": 4289} {"train_loss": -7.079922676086426, "global_step": 180140, "epoch": 4289} {"train_loss": -7.006159782409668, "global_step": 180141, "epoch": 4289} {"train_loss": -6.989873886108398, "global_step": 180142, "epoch": 4289} {"train_loss": -7.184975624084473, "global_step": 180143, "epoch": 4289} {"train_loss": -7.027554512023926, "global_step": 180144, "epoch": 4289} {"train_loss": -7.020573139190674, "global_step": 180145, "epoch": 4289} {"train_loss": -7.1673479080200195, "global_step": 180146, "epoch": 4289} {"train_loss": -7.012743949890137, "global_step": 180147, "epoch": 4289} {"train_loss": -7.004634380340576, "global_step": 180148, "epoch": 4289} {"train_loss": -7.052163124084473, "global_step": 180149, "epoch": 4289} {"train_loss": -7.06199312210083, "global_step": 180150, "epoch": 4289} {"train_loss": -7.052305221557617, "global_step": 180151, "epoch": 4289} {"train_loss": -7.087640762329102, "global_step": 180152, "epoch": 4289} {"train_loss": -7.087879657745361, "global_step": 180153, "epoch": 4289} {"train_loss": -7.195283889770508, "global_step": 180154, "epoch": 4289} {"train_loss": -7.0866289138793945, "global_step": 180155, "epoch": 4289} {"train_loss": -7.163315773010254, "global_step": 180156, "epoch": 4289} {"train_loss": -7.06294059753418, "global_step": 180157, "epoch": 4289} {"train_loss": -7.210928440093994, "global_step": 180158, "epoch": 4289} {"train_loss": -7.1255645751953125, "global_step": 180159, "epoch": 4289} {"train_loss": -7.0809502601623535, "global_step": 180160, "epoch": 4289} {"train_loss": -7.127167701721191, "global_step": 180161, "epoch": 4289} {"train_loss": -6.985201835632324, "global_step": 180162, "epoch": 4289} {"train_loss": -7.022146224975586, "global_step": 180163, "epoch": 4289} {"train_loss": -7.13819694519043, "global_step": 180164, "epoch": 4289} {"train_loss": -7.027165412902832, "global_step": 180165, "epoch": 4289} {"train_loss": -7.0280609130859375, "global_step": 180166, "epoch": 4289} {"train_loss": -7.070995807647705, "global_step": 180167, "epoch": 4289} {"train_loss": -7.039032936096191, "global_step": 180168, "epoch": 4289} {"train_loss": -7.154023170471191, "global_step": 180169, "epoch": 4289} {"train_loss": -7.132232666015625, "global_step": 180170, "epoch": 4289} {"train_loss": -7.149320125579834, "global_step": 180171, "epoch": 4289} {"train_loss": -7.0492634773254395, "global_step": 180172, "epoch": 4289} {"train_loss": -7.089998245239258, "global_step": 180173, "epoch": 4289} {"train_loss": -7.068840503692627, "global_step": 180174, "epoch": 4289} {"train_loss": -7.196202278137207, "global_step": 180175, "epoch": 4289} {"train_loss": -7.1456098556518555, "global_step": 180176, "epoch": 4289} {"train_loss": -7.081902503967285, "global_step": 180177, "epoch": 4289} {"train_loss": -7.232893943786621, "global_step": 180178, "epoch": 4289} {"train_loss": -7.085871866771153, "global_step": 180179, "epoch": 4289, "val_loss": 68731.671875} {"train_loss": -7.209451675415039, "global_step": 180180, "epoch": 4290} {"train_loss": -7.118607521057129, "global_step": 180181, "epoch": 4290} {"train_loss": -6.998908996582031, "global_step": 180182, "epoch": 4290} {"train_loss": -6.9742326736450195, "global_step": 180183, "epoch": 4290} {"train_loss": -7.104369640350342, "global_step": 180184, "epoch": 4290} {"train_loss": -6.974820137023926, "global_step": 180185, "epoch": 4290} {"train_loss": -7.0741472244262695, "global_step": 180186, "epoch": 4290} {"train_loss": -7.069436073303223, "global_step": 180187, "epoch": 4290} {"train_loss": -7.052845001220703, "global_step": 180188, "epoch": 4290} {"train_loss": -7.127860069274902, "global_step": 180189, "epoch": 4290} {"train_loss": -7.093070030212402, "global_step": 180190, "epoch": 4290} {"train_loss": -7.005889892578125, "global_step": 180191, "epoch": 4290} {"train_loss": -7.108391761779785, "global_step": 180192, "epoch": 4290} {"train_loss": -7.165890216827393, "global_step": 180193, "epoch": 4290} {"train_loss": -7.058498382568359, "global_step": 180194, "epoch": 4290} {"train_loss": -7.059412002563477, "global_step": 180195, "epoch": 4290} {"train_loss": -7.1131720542907715, "global_step": 180196, "epoch": 4290} {"train_loss": -6.964632511138916, "global_step": 180197, "epoch": 4290} {"train_loss": -7.011837005615234, "global_step": 180198, "epoch": 4290} {"train_loss": -7.012935638427734, "global_step": 180199, "epoch": 4290} {"train_loss": -7.093706130981445, "global_step": 180200, "epoch": 4290} {"train_loss": -7.1093034744262695, "global_step": 180201, "epoch": 4290} {"train_loss": -7.069196701049805, "global_step": 180202, "epoch": 4290} {"train_loss": -7.127920627593994, "global_step": 180203, "epoch": 4290} {"train_loss": -7.066298484802246, "global_step": 180204, "epoch": 4290} {"train_loss": -7.1105499267578125, "global_step": 180205, "epoch": 4290} {"train_loss": -7.036625385284424, "global_step": 180206, "epoch": 4290} {"train_loss": -7.2235541343688965, "global_step": 180207, "epoch": 4290} {"train_loss": -7.0916876792907715, "global_step": 180208, "epoch": 4290} {"train_loss": -6.861031532287598, "global_step": 180209, "epoch": 4290} {"train_loss": -7.152613639831543, "global_step": 180210, "epoch": 4290} {"train_loss": -6.90739107131958, "global_step": 180211, "epoch": 4290} {"train_loss": -7.094747066497803, "global_step": 180212, "epoch": 4290} {"train_loss": -7.065310955047607, "global_step": 180213, "epoch": 4290} {"train_loss": -7.046058654785156, "global_step": 180214, "epoch": 4290} {"train_loss": -7.042049407958984, "global_step": 180215, "epoch": 4290} {"train_loss": -7.035577774047852, "global_step": 180216, "epoch": 4290} {"train_loss": -7.060055255889893, "global_step": 180217, "epoch": 4290} {"train_loss": -7.051931858062744, "global_step": 180218, "epoch": 4290} {"train_loss": -7.1107072830200195, "global_step": 180219, "epoch": 4290} {"train_loss": -7.145666599273682, "global_step": 180220, "epoch": 4290} {"train_loss": -7.070138170605614, "global_step": 180221, "epoch": 4290, "val_loss": 68625.03125} {"train_loss": -7.047321319580078, "global_step": 180222, "epoch": 4291} {"train_loss": -7.03548002243042, "global_step": 180223, "epoch": 4291} {"train_loss": -7.162901878356934, "global_step": 180224, "epoch": 4291} {"train_loss": -7.10225772857666, "global_step": 180225, "epoch": 4291} {"train_loss": -6.9851975440979, "global_step": 180226, "epoch": 4291} {"train_loss": -6.98190450668335, "global_step": 180227, "epoch": 4291} {"train_loss": -7.076010704040527, "global_step": 180228, "epoch": 4291} {"train_loss": -7.104071617126465, "global_step": 180229, "epoch": 4291} {"train_loss": -7.007452011108398, "global_step": 180230, "epoch": 4291} {"train_loss": -7.0507354736328125, "global_step": 180231, "epoch": 4291} {"train_loss": -7.00776481628418, "global_step": 180232, "epoch": 4291} {"train_loss": -7.090539932250977, "global_step": 180233, "epoch": 4291} {"train_loss": -7.065155506134033, "global_step": 180234, "epoch": 4291} {"train_loss": -7.124838352203369, "global_step": 180235, "epoch": 4291} {"train_loss": -7.04347038269043, "global_step": 180236, "epoch": 4291} {"train_loss": -7.013775825500488, "global_step": 180237, "epoch": 4291} {"train_loss": -6.907574653625488, "global_step": 180238, "epoch": 4291} {"train_loss": -7.070470333099365, "global_step": 180239, "epoch": 4291} {"train_loss": -6.993305206298828, "global_step": 180240, "epoch": 4291} {"train_loss": -6.966670989990234, "global_step": 180241, "epoch": 4291} {"train_loss": -7.126191139221191, "global_step": 180242, "epoch": 4291} {"train_loss": -6.910297870635986, "global_step": 180243, "epoch": 4291} {"train_loss": -6.9875030517578125, "global_step": 180244, "epoch": 4291} {"train_loss": -7.036679267883301, "global_step": 180245, "epoch": 4291} {"train_loss": -6.920157432556152, "global_step": 180246, "epoch": 4291} {"train_loss": -6.988969802856445, "global_step": 180247, "epoch": 4291} {"train_loss": -7.001226425170898, "global_step": 180248, "epoch": 4291} {"train_loss": -7.077328681945801, "global_step": 180249, "epoch": 4291} {"train_loss": -7.095792293548584, "global_step": 180250, "epoch": 4291} {"train_loss": -6.89028263092041, "global_step": 180251, "epoch": 4291} {"train_loss": -6.977103233337402, "global_step": 180252, "epoch": 4291} {"train_loss": -6.985716819763184, "global_step": 180253, "epoch": 4291} {"train_loss": -7.0746636390686035, "global_step": 180254, "epoch": 4291} {"train_loss": -6.971072196960449, "global_step": 180255, "epoch": 4291} {"train_loss": -7.096347808837891, "global_step": 180256, "epoch": 4291} {"train_loss": -6.94641637802124, "global_step": 180257, "epoch": 4291} {"train_loss": -7.010659217834473, "global_step": 180258, "epoch": 4291} {"train_loss": -7.068918228149414, "global_step": 180259, "epoch": 4291} {"train_loss": -7.024696350097656, "global_step": 180260, "epoch": 4291} {"train_loss": -7.117440223693848, "global_step": 180261, "epoch": 4291} {"train_loss": -7.07419490814209, "global_step": 180262, "epoch": 4291} {"train_loss": -7.030844711122059, "global_step": 180263, "epoch": 4291, "val_loss": 68657.9140625} {"train_loss": -7.124424457550049, "global_step": 180264, "epoch": 4292} {"train_loss": -7.125688076019287, "global_step": 180265, "epoch": 4292} {"train_loss": -7.058116436004639, "global_step": 180266, "epoch": 4292} {"train_loss": -7.101072311401367, "global_step": 180267, "epoch": 4292} {"train_loss": -6.993278503417969, "global_step": 180268, "epoch": 4292} {"train_loss": -7.1429901123046875, "global_step": 180269, "epoch": 4292} {"train_loss": -7.084033966064453, "global_step": 180270, "epoch": 4292} {"train_loss": -7.18154239654541, "global_step": 180271, "epoch": 4292} {"train_loss": -7.1801862716674805, "global_step": 180272, "epoch": 4292} {"train_loss": -6.946008682250977, "global_step": 180273, "epoch": 4292} {"train_loss": -7.1960039138793945, "global_step": 180274, "epoch": 4292} {"train_loss": -6.996559143066406, "global_step": 180275, "epoch": 4292} {"train_loss": -6.986696720123291, "global_step": 180276, "epoch": 4292} {"train_loss": -7.026427745819092, "global_step": 180277, "epoch": 4292} {"train_loss": -6.963195323944092, "global_step": 180278, "epoch": 4292} {"train_loss": -7.165792465209961, "global_step": 180279, "epoch": 4292} {"train_loss": -7.052577972412109, "global_step": 180280, "epoch": 4292} {"train_loss": -7.28580379486084, "global_step": 180281, "epoch": 4292} {"train_loss": -7.061235427856445, "global_step": 180282, "epoch": 4292} {"train_loss": -7.062591075897217, "global_step": 180283, "epoch": 4292} {"train_loss": -7.068360328674316, "global_step": 180284, "epoch": 4292} {"train_loss": -7.080469131469727, "global_step": 180285, "epoch": 4292} {"train_loss": -7.046494483947754, "global_step": 180286, "epoch": 4292} {"train_loss": -7.099113464355469, "global_step": 180287, "epoch": 4292} {"train_loss": -6.987364768981934, "global_step": 180288, "epoch": 4292} {"train_loss": -7.117914199829102, "global_step": 180289, "epoch": 4292} {"train_loss": -6.992671012878418, "global_step": 180290, "epoch": 4292} {"train_loss": -7.180602073669434, "global_step": 180291, "epoch": 4292} {"train_loss": -6.9935150146484375, "global_step": 180292, "epoch": 4292} {"train_loss": -7.039592742919922, "global_step": 180293, "epoch": 4292} {"train_loss": -7.010438919067383, "global_step": 180294, "epoch": 4292} {"train_loss": -6.9638895988464355, "global_step": 180295, "epoch": 4292} {"train_loss": -7.010585308074951, "global_step": 180296, "epoch": 4292} {"train_loss": -6.861457824707031, "global_step": 180297, "epoch": 4292} {"train_loss": -7.029871940612793, "global_step": 180298, "epoch": 4292} {"train_loss": -6.978840351104736, "global_step": 180299, "epoch": 4292} {"train_loss": -7.116878032684326, "global_step": 180300, "epoch": 4292} {"train_loss": -6.996121406555176, "global_step": 180301, "epoch": 4292} {"train_loss": -6.9704060554504395, "global_step": 180302, "epoch": 4292} {"train_loss": -7.119688987731934, "global_step": 180303, "epoch": 4292} {"train_loss": -6.892159461975098, "global_step": 180304, "epoch": 4292} {"train_loss": -7.058125722975958, "global_step": 180305, "epoch": 4292, "val_loss": 68865.5703125} {"train_loss": -6.950118541717529, "global_step": 180306, "epoch": 4293} {"train_loss": -7.025646686553955, "global_step": 180307, "epoch": 4293} {"train_loss": -6.921910285949707, "global_step": 180308, "epoch": 4293} {"train_loss": -6.983887672424316, "global_step": 180309, "epoch": 4293} {"train_loss": -6.851579666137695, "global_step": 180310, "epoch": 4293} {"train_loss": -6.969053268432617, "global_step": 180311, "epoch": 4293} {"train_loss": -7.01122522354126, "global_step": 180312, "epoch": 4293} {"train_loss": -6.944384574890137, "global_step": 180313, "epoch": 4293} {"train_loss": -6.962560653686523, "global_step": 180314, "epoch": 4293} {"train_loss": -7.097903251647949, "global_step": 180315, "epoch": 4293} {"train_loss": -6.973679542541504, "global_step": 180316, "epoch": 4293} {"train_loss": -7.1510009765625, "global_step": 180317, "epoch": 4293} {"train_loss": -7.032771110534668, "global_step": 180318, "epoch": 4293} {"train_loss": -7.082211494445801, "global_step": 180319, "epoch": 4293} {"train_loss": -7.153073310852051, "global_step": 180320, "epoch": 4293} {"train_loss": -6.9756622314453125, "global_step": 180321, "epoch": 4293} {"train_loss": -7.126779556274414, "global_step": 180322, "epoch": 4293} {"train_loss": -6.936274528503418, "global_step": 180323, "epoch": 4293} {"train_loss": -7.092013835906982, "global_step": 180324, "epoch": 4293} {"train_loss": -7.020324230194092, "global_step": 180325, "epoch": 4293} {"train_loss": -6.997020244598389, "global_step": 180326, "epoch": 4293} {"train_loss": -7.111065864562988, "global_step": 180327, "epoch": 4293} {"train_loss": -7.079333305358887, "global_step": 180328, "epoch": 4293} {"train_loss": -7.061898231506348, "global_step": 180329, "epoch": 4293} {"train_loss": -6.968070983886719, "global_step": 180330, "epoch": 4293} {"train_loss": -7.105195045471191, "global_step": 180331, "epoch": 4293} {"train_loss": -7.279554843902588, "global_step": 180332, "epoch": 4293} {"train_loss": -7.102304458618164, "global_step": 180333, "epoch": 4293} {"train_loss": -7.1386613845825195, "global_step": 180334, "epoch": 4293} {"train_loss": -7.126403331756592, "global_step": 180335, "epoch": 4293} {"train_loss": -7.18707275390625, "global_step": 180336, "epoch": 4293} {"train_loss": -7.021523475646973, "global_step": 180337, "epoch": 4293} {"train_loss": -7.078313827514648, "global_step": 180338, "epoch": 4293} {"train_loss": -7.181273460388184, "global_step": 180339, "epoch": 4293} {"train_loss": -6.988581657409668, "global_step": 180340, "epoch": 4293} {"train_loss": -7.05064582824707, "global_step": 180341, "epoch": 4293} {"train_loss": -7.12529182434082, "global_step": 180342, "epoch": 4293} {"train_loss": -7.050778388977051, "global_step": 180343, "epoch": 4293} {"train_loss": -7.054244041442871, "global_step": 180344, "epoch": 4293} {"train_loss": -6.899148941040039, "global_step": 180345, "epoch": 4293} {"train_loss": -7.0261383056640625, "global_step": 180346, "epoch": 4293} {"train_loss": -7.047374384743827, "global_step": 180347, "epoch": 4293, "val_loss": 69046.5859375} {"train_loss": -6.912642955780029, "global_step": 180348, "epoch": 4294} {"train_loss": -7.098514556884766, "global_step": 180349, "epoch": 4294} {"train_loss": -7.132905960083008, "global_step": 180350, "epoch": 4294} {"train_loss": -7.12171745300293, "global_step": 180351, "epoch": 4294} {"train_loss": -6.958637237548828, "global_step": 180352, "epoch": 4294} {"train_loss": -6.9419660568237305, "global_step": 180353, "epoch": 4294} {"train_loss": -7.004978656768799, "global_step": 180354, "epoch": 4294} {"train_loss": -7.047179222106934, "global_step": 180355, "epoch": 4294} {"train_loss": -7.111034393310547, "global_step": 180356, "epoch": 4294} {"train_loss": -7.045078277587891, "global_step": 180357, "epoch": 4294} {"train_loss": -7.1060099601745605, "global_step": 180358, "epoch": 4294} {"train_loss": -7.10678768157959, "global_step": 180359, "epoch": 4294} {"train_loss": -7.111614227294922, "global_step": 180360, "epoch": 4294} {"train_loss": -7.007739067077637, "global_step": 180361, "epoch": 4294} {"train_loss": -6.950540542602539, "global_step": 180362, "epoch": 4294} {"train_loss": -7.238009452819824, "global_step": 180363, "epoch": 4294} {"train_loss": -7.052828311920166, "global_step": 180364, "epoch": 4294} {"train_loss": -7.078020095825195, "global_step": 180365, "epoch": 4294} {"train_loss": -7.092649936676025, "global_step": 180366, "epoch": 4294} {"train_loss": -7.104389190673828, "global_step": 180367, "epoch": 4294} {"train_loss": -7.014963626861572, "global_step": 180368, "epoch": 4294} {"train_loss": -7.140436172485352, "global_step": 180369, "epoch": 4294} {"train_loss": -7.077582359313965, "global_step": 180370, "epoch": 4294} {"train_loss": -7.0866899490356445, "global_step": 180371, "epoch": 4294} {"train_loss": -7.1092705726623535, "global_step": 180372, "epoch": 4294} {"train_loss": -7.2012434005737305, "global_step": 180373, "epoch": 4294} {"train_loss": -6.966763496398926, "global_step": 180374, "epoch": 4294} {"train_loss": -7.057180404663086, "global_step": 180375, "epoch": 4294} {"train_loss": -7.186128616333008, "global_step": 180376, "epoch": 4294} {"train_loss": -7.111041069030762, "global_step": 180377, "epoch": 4294} {"train_loss": -7.124588966369629, "global_step": 180378, "epoch": 4294} {"train_loss": -7.063043594360352, "global_step": 180379, "epoch": 4294} {"train_loss": -7.167877674102783, "global_step": 180380, "epoch": 4294} {"train_loss": -7.036038398742676, "global_step": 180381, "epoch": 4294} {"train_loss": -7.115885257720947, "global_step": 180382, "epoch": 4294} {"train_loss": -6.994437217712402, "global_step": 180383, "epoch": 4294} {"train_loss": -7.059314727783203, "global_step": 180384, "epoch": 4294} {"train_loss": -7.177481651306152, "global_step": 180385, "epoch": 4294} {"train_loss": -7.138260841369629, "global_step": 180386, "epoch": 4294} {"train_loss": -7.025876522064209, "global_step": 180387, "epoch": 4294} {"train_loss": -7.065916061401367, "global_step": 180388, "epoch": 4294} {"train_loss": -7.079462233043852, "global_step": 180389, "epoch": 4294, "val_loss": 68935.71875} {"train_loss": -7.125361442565918, "global_step": 180390, "epoch": 4295} {"train_loss": -7.111112594604492, "global_step": 180391, "epoch": 4295} {"train_loss": -7.13712215423584, "global_step": 180392, "epoch": 4295} {"train_loss": -7.13176965713501, "global_step": 180393, "epoch": 4295} {"train_loss": -7.097064018249512, "global_step": 180394, "epoch": 4295} {"train_loss": -7.113578796386719, "global_step": 180395, "epoch": 4295} {"train_loss": -7.214775562286377, "global_step": 180396, "epoch": 4295} {"train_loss": -7.160215854644775, "global_step": 180397, "epoch": 4295} {"train_loss": -7.032753944396973, "global_step": 180398, "epoch": 4295} {"train_loss": -7.195581436157227, "global_step": 180399, "epoch": 4295} {"train_loss": -7.153698921203613, "global_step": 180400, "epoch": 4295} {"train_loss": -7.018268585205078, "global_step": 180401, "epoch": 4295} {"train_loss": -7.085781574249268, "global_step": 180402, "epoch": 4295} {"train_loss": -7.038771152496338, "global_step": 180403, "epoch": 4295} {"train_loss": -7.2504353523254395, "global_step": 180404, "epoch": 4295} {"train_loss": -7.142490863800049, "global_step": 180405, "epoch": 4295} {"train_loss": -7.051853179931641, "global_step": 180406, "epoch": 4295} {"train_loss": -7.034347057342529, "global_step": 180407, "epoch": 4295} {"train_loss": -7.292255401611328, "global_step": 180408, "epoch": 4295} {"train_loss": -7.0649824142456055, "global_step": 180409, "epoch": 4295} {"train_loss": -7.026326656341553, "global_step": 180410, "epoch": 4295} {"train_loss": -7.113859176635742, "global_step": 180411, "epoch": 4295} {"train_loss": -7.209050178527832, "global_step": 180412, "epoch": 4295} {"train_loss": -7.103055000305176, "global_step": 180413, "epoch": 4295} {"train_loss": -7.078544616699219, "global_step": 180414, "epoch": 4295} {"train_loss": -7.185296535491943, "global_step": 180415, "epoch": 4295} {"train_loss": -7.103771686553955, "global_step": 180416, "epoch": 4295} {"train_loss": -7.143560409545898, "global_step": 180417, "epoch": 4295} {"train_loss": -7.086877822875977, "global_step": 180418, "epoch": 4295} {"train_loss": -7.109821319580078, "global_step": 180419, "epoch": 4295} {"train_loss": -7.118069648742676, "global_step": 180420, "epoch": 4295} {"train_loss": -7.182239055633545, "global_step": 180421, "epoch": 4295} {"train_loss": -7.220516204833984, "global_step": 180422, "epoch": 4295} {"train_loss": -7.088140487670898, "global_step": 180423, "epoch": 4295} {"train_loss": -7.133350849151611, "global_step": 180424, "epoch": 4295} {"train_loss": -6.95847225189209, "global_step": 180425, "epoch": 4295} {"train_loss": -6.982181549072266, "global_step": 180426, "epoch": 4295} {"train_loss": -7.202430248260498, "global_step": 180427, "epoch": 4295} {"train_loss": -7.007421493530273, "global_step": 180428, "epoch": 4295} {"train_loss": -7.070533275604248, "global_step": 180429, "epoch": 4295} {"train_loss": -7.101688385009766, "global_step": 180430, "epoch": 4295} {"train_loss": -7.116464717047555, "global_step": 180431, "epoch": 4295, "val_loss": 68754.375} {"train_loss": -6.94703483581543, "global_step": 180432, "epoch": 4296} {"train_loss": -7.22229528427124, "global_step": 180433, "epoch": 4296} {"train_loss": -7.106212615966797, "global_step": 180434, "epoch": 4296} {"train_loss": -7.048900604248047, "global_step": 180435, "epoch": 4296} {"train_loss": -7.153061866760254, "global_step": 180436, "epoch": 4296} {"train_loss": -7.136597633361816, "global_step": 180437, "epoch": 4296} {"train_loss": -7.147541522979736, "global_step": 180438, "epoch": 4296} {"train_loss": -7.113946914672852, "global_step": 180439, "epoch": 4296} {"train_loss": -7.116838455200195, "global_step": 180440, "epoch": 4296} {"train_loss": -7.073271751403809, "global_step": 180441, "epoch": 4296} {"train_loss": -7.03912353515625, "global_step": 180442, "epoch": 4296} {"train_loss": -7.036900520324707, "global_step": 180443, "epoch": 4296} {"train_loss": -7.030451774597168, "global_step": 180444, "epoch": 4296} {"train_loss": -7.094542026519775, "global_step": 180445, "epoch": 4296} {"train_loss": -7.038667678833008, "global_step": 180446, "epoch": 4296} {"train_loss": -7.081478595733643, "global_step": 180447, "epoch": 4296} {"train_loss": -7.103560447692871, "global_step": 180448, "epoch": 4296} {"train_loss": -6.9584641456604, "global_step": 180449, "epoch": 4296} {"train_loss": -7.0879716873168945, "global_step": 180450, "epoch": 4296} {"train_loss": -7.1432318687438965, "global_step": 180451, "epoch": 4296} {"train_loss": -7.017564296722412, "global_step": 180452, "epoch": 4296} {"train_loss": -7.027047157287598, "global_step": 180453, "epoch": 4296} {"train_loss": -7.079793930053711, "global_step": 180454, "epoch": 4296} {"train_loss": -7.162110328674316, "global_step": 180455, "epoch": 4296} {"train_loss": -7.018684387207031, "global_step": 180456, "epoch": 4296} {"train_loss": -6.969836711883545, "global_step": 180457, "epoch": 4296} {"train_loss": -6.939792633056641, "global_step": 180458, "epoch": 4296} {"train_loss": -6.9899725914001465, "global_step": 180459, "epoch": 4296} {"train_loss": -6.951310157775879, "global_step": 180460, "epoch": 4296} {"train_loss": -6.9793500900268555, "global_step": 180461, "epoch": 4296} {"train_loss": -7.09345006942749, "global_step": 180462, "epoch": 4296} {"train_loss": -6.9753193855285645, "global_step": 180463, "epoch": 4296} {"train_loss": -6.997341156005859, "global_step": 180464, "epoch": 4296} {"train_loss": -6.994225025177002, "global_step": 180465, "epoch": 4296} {"train_loss": -7.1358160972595215, "global_step": 180466, "epoch": 4296} {"train_loss": -7.085546493530273, "global_step": 180467, "epoch": 4296} {"train_loss": -6.89292049407959, "global_step": 180468, "epoch": 4296} {"train_loss": -7.155872344970703, "global_step": 180469, "epoch": 4296} {"train_loss": -6.94883394241333, "global_step": 180470, "epoch": 4296} {"train_loss": -7.002802848815918, "global_step": 180471, "epoch": 4296} {"train_loss": -7.016808032989502, "global_step": 180472, "epoch": 4296} {"train_loss": -7.049688940956479, "global_step": 180473, "epoch": 4296, "val_loss": 68906.421875} {"train_loss": -7.166347026824951, "global_step": 180474, "epoch": 4297} {"train_loss": -6.934331893920898, "global_step": 180475, "epoch": 4297} {"train_loss": -7.119565010070801, "global_step": 180476, "epoch": 4297} {"train_loss": -7.071694850921631, "global_step": 180477, "epoch": 4297} {"train_loss": -7.031007766723633, "global_step": 180478, "epoch": 4297} {"train_loss": -7.165333271026611, "global_step": 180479, "epoch": 4297} {"train_loss": -7.023968696594238, "global_step": 180480, "epoch": 4297} {"train_loss": -7.026246070861816, "global_step": 180481, "epoch": 4297} {"train_loss": -7.11407470703125, "global_step": 180482, "epoch": 4297} {"train_loss": -7.050397872924805, "global_step": 180483, "epoch": 4297} {"train_loss": -6.987027168273926, "global_step": 180484, "epoch": 4297} {"train_loss": -7.1310224533081055, "global_step": 180485, "epoch": 4297} {"train_loss": -7.071932792663574, "global_step": 180486, "epoch": 4297} {"train_loss": -7.1514129638671875, "global_step": 180487, "epoch": 4297} {"train_loss": -7.105358123779297, "global_step": 180488, "epoch": 4297} {"train_loss": -7.05059814453125, "global_step": 180489, "epoch": 4297} {"train_loss": -7.106071949005127, "global_step": 180490, "epoch": 4297} {"train_loss": -7.095013618469238, "global_step": 180491, "epoch": 4297} {"train_loss": -7.004469394683838, "global_step": 180492, "epoch": 4297} {"train_loss": -7.02546501159668, "global_step": 180493, "epoch": 4297} {"train_loss": -7.157365798950195, "global_step": 180494, "epoch": 4297} {"train_loss": -7.008518218994141, "global_step": 180495, "epoch": 4297} {"train_loss": -7.067363262176514, "global_step": 180496, "epoch": 4297} {"train_loss": -7.076178550720215, "global_step": 180497, "epoch": 4297} {"train_loss": -7.063648223876953, "global_step": 180498, "epoch": 4297} {"train_loss": -7.1144819259643555, "global_step": 180499, "epoch": 4297} {"train_loss": -7.034218788146973, "global_step": 180500, "epoch": 4297} {"train_loss": -7.116804122924805, "global_step": 180501, "epoch": 4297} {"train_loss": -6.974507808685303, "global_step": 180502, "epoch": 4297} {"train_loss": -7.102974891662598, "global_step": 180503, "epoch": 4297} {"train_loss": -7.120614051818848, "global_step": 180504, "epoch": 4297} {"train_loss": -7.081290245056152, "global_step": 180505, "epoch": 4297} {"train_loss": -7.000238418579102, "global_step": 180506, "epoch": 4297} {"train_loss": -7.029038429260254, "global_step": 180507, "epoch": 4297} {"train_loss": -6.940519332885742, "global_step": 180508, "epoch": 4297} {"train_loss": -6.924391269683838, "global_step": 180509, "epoch": 4297} {"train_loss": -7.059700012207031, "global_step": 180510, "epoch": 4297} {"train_loss": -7.0845746994018555, "global_step": 180511, "epoch": 4297} {"train_loss": -6.86922025680542, "global_step": 180512, "epoch": 4297} {"train_loss": -6.936680793762207, "global_step": 180513, "epoch": 4297} {"train_loss": -6.8920207023620605, "global_step": 180514, "epoch": 4297} {"train_loss": -7.050657669703166, "global_step": 180515, "epoch": 4297, "val_loss": 69128.1171875} {"train_loss": -6.915567398071289, "global_step": 180516, "epoch": 4298} {"train_loss": -6.982775688171387, "global_step": 180517, "epoch": 4298} {"train_loss": -7.05057430267334, "global_step": 180518, "epoch": 4298} {"train_loss": -6.99394416809082, "global_step": 180519, "epoch": 4298} {"train_loss": -6.900935649871826, "global_step": 180520, "epoch": 4298} {"train_loss": -6.94137716293335, "global_step": 180521, "epoch": 4298} {"train_loss": -6.994317054748535, "global_step": 180522, "epoch": 4298} {"train_loss": -7.114452362060547, "global_step": 180523, "epoch": 4298} {"train_loss": -7.053140163421631, "global_step": 180524, "epoch": 4298} {"train_loss": -6.972909927368164, "global_step": 180525, "epoch": 4298} {"train_loss": -7.019607067108154, "global_step": 180526, "epoch": 4298} {"train_loss": -7.180229187011719, "global_step": 180527, "epoch": 4298} {"train_loss": -7.0690460205078125, "global_step": 180528, "epoch": 4298} {"train_loss": -7.0395989418029785, "global_step": 180529, "epoch": 4298} {"train_loss": -7.11965274810791, "global_step": 180530, "epoch": 4298} {"train_loss": -7.12114143371582, "global_step": 180531, "epoch": 4298} {"train_loss": -7.140480041503906, "global_step": 180532, "epoch": 4298} {"train_loss": -7.166338920593262, "global_step": 180533, "epoch": 4298} {"train_loss": -7.082552909851074, "global_step": 180534, "epoch": 4298} {"train_loss": -7.124137878417969, "global_step": 180535, "epoch": 4298} {"train_loss": -7.174414157867432, "global_step": 180536, "epoch": 4298} {"train_loss": -7.086634635925293, "global_step": 180537, "epoch": 4298} {"train_loss": -7.134158134460449, "global_step": 180538, "epoch": 4298} {"train_loss": -7.124944686889648, "global_step": 180539, "epoch": 4298} {"train_loss": -7.182011127471924, "global_step": 180540, "epoch": 4298} {"train_loss": -7.066763877868652, "global_step": 180541, "epoch": 4298} {"train_loss": -7.230229377746582, "global_step": 180542, "epoch": 4298} {"train_loss": -7.142470836639404, "global_step": 180543, "epoch": 4298} {"train_loss": -7.2673234939575195, "global_step": 180544, "epoch": 4298} {"train_loss": -7.155994415283203, "global_step": 180545, "epoch": 4298} {"train_loss": -7.1224212646484375, "global_step": 180546, "epoch": 4298} {"train_loss": -7.069271087646484, "global_step": 180547, "epoch": 4298} {"train_loss": -7.149503707885742, "global_step": 180548, "epoch": 4298} {"train_loss": -7.162655353546143, "global_step": 180549, "epoch": 4298} {"train_loss": -7.171971797943115, "global_step": 180550, "epoch": 4298} {"train_loss": -7.10579252243042, "global_step": 180551, "epoch": 4298} {"train_loss": -7.278460502624512, "global_step": 180552, "epoch": 4298} {"train_loss": -7.122543811798096, "global_step": 180553, "epoch": 4298} {"train_loss": -7.101655960083008, "global_step": 180554, "epoch": 4298} {"train_loss": -7.065040111541748, "global_step": 180555, "epoch": 4298} {"train_loss": -7.0756049156188965, "global_step": 180556, "epoch": 4298} {"train_loss": -7.096483491715931, "global_step": 180557, "epoch": 4298, "val_loss": 68707.34375} {"train_loss": -7.031525611877441, "global_step": 180558, "epoch": 4299} {"train_loss": -7.162623882293701, "global_step": 180559, "epoch": 4299} {"train_loss": -6.954801559448242, "global_step": 180560, "epoch": 4299} {"train_loss": -6.794854640960693, "global_step": 180561, "epoch": 4299} {"train_loss": -6.986292362213135, "global_step": 180562, "epoch": 4299} {"train_loss": -6.996709823608398, "global_step": 180563, "epoch": 4299} {"train_loss": -6.861021041870117, "global_step": 180564, "epoch": 4299} {"train_loss": -6.9963250160217285, "global_step": 180565, "epoch": 4299} {"train_loss": -7.145883560180664, "global_step": 180566, "epoch": 4299} {"train_loss": -7.0617876052856445, "global_step": 180567, "epoch": 4299} {"train_loss": -6.9798078536987305, "global_step": 180568, "epoch": 4299} {"train_loss": -7.0038275718688965, "global_step": 180569, "epoch": 4299} {"train_loss": -7.008567810058594, "global_step": 180570, "epoch": 4299} {"train_loss": -7.058002471923828, "global_step": 180571, "epoch": 4299} {"train_loss": -7.169485092163086, "global_step": 180572, "epoch": 4299} {"train_loss": -7.002702713012695, "global_step": 180573, "epoch": 4299} {"train_loss": -7.146603584289551, "global_step": 180574, "epoch": 4299} {"train_loss": -7.073576927185059, "global_step": 180575, "epoch": 4299} {"train_loss": -7.0953826904296875, "global_step": 180576, "epoch": 4299} {"train_loss": -6.974003314971924, "global_step": 180577, "epoch": 4299} {"train_loss": -7.086093425750732, "global_step": 180578, "epoch": 4299} {"train_loss": -7.057355880737305, "global_step": 180579, "epoch": 4299} {"train_loss": -7.031960487365723, "global_step": 180580, "epoch": 4299} {"train_loss": -7.107837677001953, "global_step": 180581, "epoch": 4299} {"train_loss": -7.058082103729248, "global_step": 180582, "epoch": 4299} {"train_loss": -7.060807228088379, "global_step": 180583, "epoch": 4299} {"train_loss": -7.125533103942871, "global_step": 180584, "epoch": 4299} {"train_loss": -6.991334438323975, "global_step": 180585, "epoch": 4299} {"train_loss": -6.946656227111816, "global_step": 180586, "epoch": 4299} {"train_loss": -7.03969669342041, "global_step": 180587, "epoch": 4299} {"train_loss": -7.12517786026001, "global_step": 180588, "epoch": 4299} {"train_loss": -6.930953025817871, "global_step": 180589, "epoch": 4299} {"train_loss": -6.961297988891602, "global_step": 180590, "epoch": 4299} {"train_loss": -7.135883331298828, "global_step": 180591, "epoch": 4299} {"train_loss": -7.098203659057617, "global_step": 180592, "epoch": 4299} {"train_loss": -7.210109710693359, "global_step": 180593, "epoch": 4299} {"train_loss": -7.258429527282715, "global_step": 180594, "epoch": 4299} {"train_loss": -6.943503379821777, "global_step": 180595, "epoch": 4299} {"train_loss": -7.121662139892578, "global_step": 180596, "epoch": 4299} {"train_loss": -7.111515522003174, "global_step": 180597, "epoch": 4299} {"train_loss": -7.004169464111328, "global_step": 180598, "epoch": 4299} {"train_loss": -7.0478330339704245, "global_step": 180599, "epoch": 4299, "val_loss": 68596.8125} {"train_loss": -7.194268226623535, "global_step": 180600, "epoch": 4300} {"train_loss": -7.144225120544434, "global_step": 180601, "epoch": 4300} {"train_loss": -7.094754219055176, "global_step": 180602, "epoch": 4300} {"train_loss": -7.132209777832031, "global_step": 180603, "epoch": 4300} {"train_loss": -7.067063808441162, "global_step": 180604, "epoch": 4300} {"train_loss": -7.044806003570557, "global_step": 180605, "epoch": 4300} {"train_loss": -7.127230644226074, "global_step": 180606, "epoch": 4300} {"train_loss": -7.182147026062012, "global_step": 180607, "epoch": 4300} {"train_loss": -7.183615684509277, "global_step": 180608, "epoch": 4300} {"train_loss": -7.008558750152588, "global_step": 180609, "epoch": 4300} {"train_loss": -7.161019802093506, "global_step": 180610, "epoch": 4300} {"train_loss": -7.047966003417969, "global_step": 180611, "epoch": 4300} {"train_loss": -6.978228569030762, "global_step": 180612, "epoch": 4300} {"train_loss": -7.137537002563477, "global_step": 180613, "epoch": 4300} {"train_loss": -7.085184097290039, "global_step": 180614, "epoch": 4300} {"train_loss": -7.018197536468506, "global_step": 180615, "epoch": 4300} {"train_loss": -7.027757167816162, "global_step": 180616, "epoch": 4300} {"train_loss": -7.107392311096191, "global_step": 180617, "epoch": 4300} {"train_loss": -6.986489772796631, "global_step": 180618, "epoch": 4300} {"train_loss": -7.103401184082031, "global_step": 180619, "epoch": 4300} {"train_loss": -7.106285095214844, "global_step": 180620, "epoch": 4300} {"train_loss": -7.040314197540283, "global_step": 180621, "epoch": 4300} {"train_loss": -7.077553749084473, "global_step": 180622, "epoch": 4300} {"train_loss": -7.124275207519531, "global_step": 180623, "epoch": 4300} {"train_loss": -6.924374580383301, "global_step": 180624, "epoch": 4300} {"train_loss": -7.118786811828613, "global_step": 180625, "epoch": 4300} {"train_loss": -6.9183783531188965, "global_step": 180626, "epoch": 4300} {"train_loss": -7.005119323730469, "global_step": 180627, "epoch": 4300} {"train_loss": -7.1107258796691895, "global_step": 180628, "epoch": 4300} {"train_loss": -7.021786212921143, "global_step": 180629, "epoch": 4300} {"train_loss": -7.112098217010498, "global_step": 180630, "epoch": 4300} {"train_loss": -7.083303928375244, "global_step": 180631, "epoch": 4300} {"train_loss": -7.038508892059326, "global_step": 180632, "epoch": 4300} {"train_loss": -7.168889045715332, "global_step": 180633, "epoch": 4300} {"train_loss": -7.0385284423828125, "global_step": 180634, "epoch": 4300} {"train_loss": -7.139520168304443, "global_step": 180635, "epoch": 4300} {"train_loss": -7.093513488769531, "global_step": 180636, "epoch": 4300} {"train_loss": -7.010601043701172, "global_step": 180637, "epoch": 4300} {"train_loss": -6.994009017944336, "global_step": 180638, "epoch": 4300} {"train_loss": -7.073177337646484, "global_step": 180639, "epoch": 4300} {"train_loss": -7.063715934753418, "global_step": 180640, "epoch": 4300} {"train_loss": -7.07592324983506, "global_step": 180641, "epoch": 4300, "train/sim_max_reward_0": 0.4092656193999948, "train/sim_max_reward_1": 0.46704908206765045, "train/sim_max_reward_2": 0.7196889678988153, "train/sim_max_reward_3": 0.9557218836257335, "train/sim_max_reward_4": 0.8676071609376053, "train/sim_max_reward_5": 0.9803503275423464, "test/sim_max_reward_4400000": 0.3326332469849207, "test/sim_max_reward_4400001": 0.21732429253113184, "test/sim_max_reward_4400002": 0.3349158740364964, "test/sim_max_reward_4400003": 0.861868011248749, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9545665707303005, "test/sim_max_reward_4400006": 0.9838616590289693, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.32599770048065113, "test/sim_max_reward_4400009": 0.6836466354624777, "test/sim_max_reward_4400010": 0.8191208803519033, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9116637332700551, "test/sim_max_reward_4400013": 0.9681549005298256, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.001086165109605489, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.25538680029918326, "test/sim_max_reward_4400019": 0.9052289733302521, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.28303471553394927, "test/sim_max_reward_4400023": 0.46077713070814275, "test/sim_max_reward_4400024": 0.35260372831622827, "test/sim_max_reward_4400025": 0.2678915486468959, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.02927939844273033, "test/sim_max_reward_4400028": 0.8301839228730968, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.9624172881666689, "test/sim_max_reward_4400031": 0.9820188964636366, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9113358863805937, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9528616566334431, "test/sim_max_reward_4400036": 0.4050554766036013, "test/sim_max_reward_4400037": 0.9846802556024193, "test/sim_max_reward_4400038": 0.19793949687490892, "test/sim_max_reward_4400039": 0.8843217972374765, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.9677850232976172, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.7164504818568669, "test/sim_max_reward_4400045": 0.9713253242554962, "test/sim_max_reward_4400046": 0.9741169097992287, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.7926631290841416, "test/sim_max_reward_4400049": 0.903201487739852, "train/mean_score": 0.7332805069120244, "test/mean_score": 0.5786318795688483, "val_loss": 68698.359375} {"train_loss": -7.080791473388672, "global_step": 180642, "epoch": 4301} {"train_loss": -7.080106735229492, "global_step": 180643, "epoch": 4301} {"train_loss": -7.124197006225586, "global_step": 180644, "epoch": 4301} {"train_loss": -7.1798601150512695, "global_step": 180645, "epoch": 4301} {"train_loss": -7.110711097717285, "global_step": 180646, "epoch": 4301} {"train_loss": -7.121352672576904, "global_step": 180647, "epoch": 4301} {"train_loss": -7.056059837341309, "global_step": 180648, "epoch": 4301} {"train_loss": -7.0352864265441895, "global_step": 180649, "epoch": 4301} {"train_loss": -7.18244743347168, "global_step": 180650, "epoch": 4301} {"train_loss": -7.139460563659668, "global_step": 180651, "epoch": 4301} {"train_loss": -7.159867763519287, "global_step": 180652, "epoch": 4301} {"train_loss": -7.069506645202637, "global_step": 180653, "epoch": 4301} {"train_loss": -6.994868278503418, "global_step": 180654, "epoch": 4301} {"train_loss": -6.955124855041504, "global_step": 180655, "epoch": 4301} {"train_loss": -7.146415710449219, "global_step": 180656, "epoch": 4301} {"train_loss": -7.168780326843262, "global_step": 180657, "epoch": 4301} {"train_loss": -7.091864585876465, "global_step": 180658, "epoch": 4301} {"train_loss": -7.063925266265869, "global_step": 180659, "epoch": 4301} {"train_loss": -7.070676803588867, "global_step": 180660, "epoch": 4301} {"train_loss": -7.157492637634277, "global_step": 180661, "epoch": 4301} {"train_loss": -7.054954528808594, "global_step": 180662, "epoch": 4301} {"train_loss": -7.200738906860352, "global_step": 180663, "epoch": 4301} {"train_loss": -7.19991397857666, "global_step": 180664, "epoch": 4301} {"train_loss": -7.097172260284424, "global_step": 180665, "epoch": 4301} {"train_loss": -7.100974082946777, "global_step": 180666, "epoch": 4301} {"train_loss": -7.087973594665527, "global_step": 180667, "epoch": 4301} {"train_loss": -7.0393853187561035, "global_step": 180668, "epoch": 4301} {"train_loss": -7.0514936447143555, "global_step": 180669, "epoch": 4301} {"train_loss": -7.062004089355469, "global_step": 180670, "epoch": 4301} {"train_loss": -7.177434921264648, "global_step": 180671, "epoch": 4301} {"train_loss": -7.0825395584106445, "global_step": 180672, "epoch": 4301} {"train_loss": -7.062768936157227, "global_step": 180673, "epoch": 4301} {"train_loss": -7.071675777435303, "global_step": 180674, "epoch": 4301} {"train_loss": -7.145770072937012, "global_step": 180675, "epoch": 4301} {"train_loss": -7.096811294555664, "global_step": 180676, "epoch": 4301} {"train_loss": -6.9814863204956055, "global_step": 180677, "epoch": 4301} {"train_loss": -7.060085296630859, "global_step": 180678, "epoch": 4301} {"train_loss": -7.081212520599365, "global_step": 180679, "epoch": 4301} {"train_loss": -7.019665718078613, "global_step": 180680, "epoch": 4301} {"train_loss": -7.14259147644043, "global_step": 180681, "epoch": 4301} {"train_loss": -7.0061445236206055, "global_step": 180682, "epoch": 4301} {"train_loss": -7.09444945199149, "global_step": 180683, "epoch": 4301, "val_loss": 68835.9375} {"train_loss": -7.081639289855957, "global_step": 180684, "epoch": 4302} {"train_loss": -6.99173641204834, "global_step": 180685, "epoch": 4302} {"train_loss": -7.179420471191406, "global_step": 180686, "epoch": 4302} {"train_loss": -7.139054775238037, "global_step": 180687, "epoch": 4302} {"train_loss": -7.056713104248047, "global_step": 180688, "epoch": 4302} {"train_loss": -6.973954677581787, "global_step": 180689, "epoch": 4302} {"train_loss": -7.043922424316406, "global_step": 180690, "epoch": 4302} {"train_loss": -6.988265037536621, "global_step": 180691, "epoch": 4302} {"train_loss": -7.059499263763428, "global_step": 180692, "epoch": 4302} {"train_loss": -7.065982341766357, "global_step": 180693, "epoch": 4302} {"train_loss": -6.913542747497559, "global_step": 180694, "epoch": 4302} {"train_loss": -7.005823135375977, "global_step": 180695, "epoch": 4302} {"train_loss": -6.991427421569824, "global_step": 180696, "epoch": 4302} {"train_loss": -6.970664024353027, "global_step": 180697, "epoch": 4302} {"train_loss": -6.977182388305664, "global_step": 180698, "epoch": 4302} {"train_loss": -6.888025283813477, "global_step": 180699, "epoch": 4302} {"train_loss": -7.0406813621521, "global_step": 180700, "epoch": 4302} {"train_loss": -6.873432159423828, "global_step": 180701, "epoch": 4302} {"train_loss": -6.916996002197266, "global_step": 180702, "epoch": 4302} {"train_loss": -6.909375190734863, "global_step": 180703, "epoch": 4302} {"train_loss": -6.871864318847656, "global_step": 180704, "epoch": 4302} {"train_loss": -7.080940246582031, "global_step": 180705, "epoch": 4302} {"train_loss": -6.914432525634766, "global_step": 180706, "epoch": 4302} {"train_loss": -6.921939849853516, "global_step": 180707, "epoch": 4302} {"train_loss": -6.8902788162231445, "global_step": 180708, "epoch": 4302} {"train_loss": -7.016984939575195, "global_step": 180709, "epoch": 4302} {"train_loss": -6.950569152832031, "global_step": 180710, "epoch": 4302} {"train_loss": -6.95025634765625, "global_step": 180711, "epoch": 4302} {"train_loss": -6.961789131164551, "global_step": 180712, "epoch": 4302} {"train_loss": -6.896031379699707, "global_step": 180713, "epoch": 4302} {"train_loss": -6.9515581130981445, "global_step": 180714, "epoch": 4302} {"train_loss": -6.957139015197754, "global_step": 180715, "epoch": 4302} {"train_loss": -6.954532146453857, "global_step": 180716, "epoch": 4302} {"train_loss": -7.001864433288574, "global_step": 180717, "epoch": 4302} {"train_loss": -7.008931636810303, "global_step": 180718, "epoch": 4302} {"train_loss": -7.04681396484375, "global_step": 180719, "epoch": 4302} {"train_loss": -7.1252665519714355, "global_step": 180720, "epoch": 4302} {"train_loss": -7.078523635864258, "global_step": 180721, "epoch": 4302} {"train_loss": -7.132582187652588, "global_step": 180722, "epoch": 4302} {"train_loss": -7.0236921310424805, "global_step": 180723, "epoch": 4302} {"train_loss": -7.093020915985107, "global_step": 180724, "epoch": 4302} {"train_loss": -7.000492402485439, "global_step": 180725, "epoch": 4302, "val_loss": 68701.859375} {"train_loss": -7.05937385559082, "global_step": 180726, "epoch": 4303} {"train_loss": -7.083746433258057, "global_step": 180727, "epoch": 4303} {"train_loss": -7.145962715148926, "global_step": 180728, "epoch": 4303} {"train_loss": -7.080241680145264, "global_step": 180729, "epoch": 4303} {"train_loss": -7.147851943969727, "global_step": 180730, "epoch": 4303} {"train_loss": -7.116943836212158, "global_step": 180731, "epoch": 4303} {"train_loss": -7.0649213790893555, "global_step": 180732, "epoch": 4303} {"train_loss": -7.175599098205566, "global_step": 180733, "epoch": 4303} {"train_loss": -7.109530925750732, "global_step": 180734, "epoch": 4303} {"train_loss": -7.108468055725098, "global_step": 180735, "epoch": 4303} {"train_loss": -7.041023254394531, "global_step": 180736, "epoch": 4303} {"train_loss": -7.069805145263672, "global_step": 180737, "epoch": 4303} {"train_loss": -7.1142072677612305, "global_step": 180738, "epoch": 4303} {"train_loss": -7.104060649871826, "global_step": 180739, "epoch": 4303} {"train_loss": -7.080288887023926, "global_step": 180740, "epoch": 4303} {"train_loss": -7.132262229919434, "global_step": 180741, "epoch": 4303} {"train_loss": -7.112100124359131, "global_step": 180742, "epoch": 4303} {"train_loss": -7.129096984863281, "global_step": 180743, "epoch": 4303} {"train_loss": -7.149205207824707, "global_step": 180744, "epoch": 4303} {"train_loss": -7.134612560272217, "global_step": 180745, "epoch": 4303} {"train_loss": -7.034448146820068, "global_step": 180746, "epoch": 4303} {"train_loss": -7.076204299926758, "global_step": 180747, "epoch": 4303} {"train_loss": -7.18064546585083, "global_step": 180748, "epoch": 4303} {"train_loss": -7.126974582672119, "global_step": 180749, "epoch": 4303} {"train_loss": -7.212536334991455, "global_step": 180750, "epoch": 4303} {"train_loss": -6.98505973815918, "global_step": 180751, "epoch": 4303} {"train_loss": -7.2597198486328125, "global_step": 180752, "epoch": 4303} {"train_loss": -7.068931579589844, "global_step": 180753, "epoch": 4303} {"train_loss": -7.119828224182129, "global_step": 180754, "epoch": 4303} {"train_loss": -7.058767318725586, "global_step": 180755, "epoch": 4303} {"train_loss": -7.103775978088379, "global_step": 180756, "epoch": 4303} {"train_loss": -7.06229305267334, "global_step": 180757, "epoch": 4303} {"train_loss": -7.130590915679932, "global_step": 180758, "epoch": 4303} {"train_loss": -7.070372581481934, "global_step": 180759, "epoch": 4303} {"train_loss": -7.033934593200684, "global_step": 180760, "epoch": 4303} {"train_loss": -7.186598777770996, "global_step": 180761, "epoch": 4303} {"train_loss": -7.097533226013184, "global_step": 180762, "epoch": 4303} {"train_loss": -7.072064399719238, "global_step": 180763, "epoch": 4303} {"train_loss": -7.204662799835205, "global_step": 180764, "epoch": 4303} {"train_loss": -7.076369285583496, "global_step": 180765, "epoch": 4303} {"train_loss": -7.063591480255127, "global_step": 180766, "epoch": 4303} {"train_loss": -7.1033298288072855, "global_step": 180767, "epoch": 4303, "val_loss": 68627.96875} {"train_loss": -7.144583702087402, "global_step": 180768, "epoch": 4304} {"train_loss": -7.052702903747559, "global_step": 180769, "epoch": 4304} {"train_loss": -7.052618026733398, "global_step": 180770, "epoch": 4304} {"train_loss": -7.065837860107422, "global_step": 180771, "epoch": 4304} {"train_loss": -7.111401081085205, "global_step": 180772, "epoch": 4304} {"train_loss": -7.091267108917236, "global_step": 180773, "epoch": 4304} {"train_loss": -6.886523723602295, "global_step": 180774, "epoch": 4304} {"train_loss": -7.068844318389893, "global_step": 180775, "epoch": 4304} {"train_loss": -7.061522483825684, "global_step": 180776, "epoch": 4304} {"train_loss": -7.040719032287598, "global_step": 180777, "epoch": 4304} {"train_loss": -6.968904972076416, "global_step": 180778, "epoch": 4304} {"train_loss": -7.007227897644043, "global_step": 180779, "epoch": 4304} {"train_loss": -7.028804779052734, "global_step": 180780, "epoch": 4304} {"train_loss": -6.937384605407715, "global_step": 180781, "epoch": 4304} {"train_loss": -7.1037211418151855, "global_step": 180782, "epoch": 4304} {"train_loss": -7.123810768127441, "global_step": 180783, "epoch": 4304} {"train_loss": -7.004847526550293, "global_step": 180784, "epoch": 4304} {"train_loss": -7.099187850952148, "global_step": 180785, "epoch": 4304} {"train_loss": -6.928718566894531, "global_step": 180786, "epoch": 4304} {"train_loss": -7.048758029937744, "global_step": 180787, "epoch": 4304} {"train_loss": -7.073282241821289, "global_step": 180788, "epoch": 4304} {"train_loss": -7.089376449584961, "global_step": 180789, "epoch": 4304} {"train_loss": -7.078875541687012, "global_step": 180790, "epoch": 4304} {"train_loss": -7.0392560958862305, "global_step": 180791, "epoch": 4304} {"train_loss": -7.1813812255859375, "global_step": 180792, "epoch": 4304} {"train_loss": -7.065223693847656, "global_step": 180793, "epoch": 4304} {"train_loss": -7.036229133605957, "global_step": 180794, "epoch": 4304} {"train_loss": -7.035218238830566, "global_step": 180795, "epoch": 4304} {"train_loss": -7.064619064331055, "global_step": 180796, "epoch": 4304} {"train_loss": -7.065263271331787, "global_step": 180797, "epoch": 4304} {"train_loss": -7.003576755523682, "global_step": 180798, "epoch": 4304} {"train_loss": -7.143535137176514, "global_step": 180799, "epoch": 4304} {"train_loss": -7.079623222351074, "global_step": 180800, "epoch": 4304} {"train_loss": -7.055510520935059, "global_step": 180801, "epoch": 4304} {"train_loss": -7.064739227294922, "global_step": 180802, "epoch": 4304} {"train_loss": -6.9611077308654785, "global_step": 180803, "epoch": 4304} {"train_loss": -7.0364532470703125, "global_step": 180804, "epoch": 4304} {"train_loss": -7.0140061378479, "global_step": 180805, "epoch": 4304} {"train_loss": -7.0220537185668945, "global_step": 180806, "epoch": 4304} {"train_loss": -7.053006172180176, "global_step": 180807, "epoch": 4304} {"train_loss": -7.026632308959961, "global_step": 180808, "epoch": 4304} {"train_loss": -7.047435453959873, "global_step": 180809, "epoch": 4304, "val_loss": 68900.3046875} {"train_loss": -6.847688674926758, "global_step": 180810, "epoch": 4305} {"train_loss": -7.029426574707031, "global_step": 180811, "epoch": 4305} {"train_loss": -6.796516418457031, "global_step": 180812, "epoch": 4305} {"train_loss": -7.106711387634277, "global_step": 180813, "epoch": 4305} {"train_loss": -6.970972537994385, "global_step": 180814, "epoch": 4305} {"train_loss": -6.90945291519165, "global_step": 180815, "epoch": 4305} {"train_loss": -7.0868635177612305, "global_step": 180816, "epoch": 4305} {"train_loss": -7.007447242736816, "global_step": 180817, "epoch": 4305} {"train_loss": -7.004974365234375, "global_step": 180818, "epoch": 4305} {"train_loss": -7.124958038330078, "global_step": 180819, "epoch": 4305} {"train_loss": -6.919233322143555, "global_step": 180820, "epoch": 4305} {"train_loss": -7.1595659255981445, "global_step": 180821, "epoch": 4305} {"train_loss": -6.943335056304932, "global_step": 180822, "epoch": 4305} {"train_loss": -7.008174896240234, "global_step": 180823, "epoch": 4305} {"train_loss": -7.0527496337890625, "global_step": 180824, "epoch": 4305} {"train_loss": -7.063265800476074, "global_step": 180825, "epoch": 4305} {"train_loss": -7.054291725158691, "global_step": 180826, "epoch": 4305} {"train_loss": -6.94567346572876, "global_step": 180827, "epoch": 4305} {"train_loss": -6.962406635284424, "global_step": 180828, "epoch": 4305} {"train_loss": -7.086495399475098, "global_step": 180829, "epoch": 4305} {"train_loss": -7.019428253173828, "global_step": 180830, "epoch": 4305} {"train_loss": -6.9513773918151855, "global_step": 180831, "epoch": 4305} {"train_loss": -7.054358005523682, "global_step": 180832, "epoch": 4305} {"train_loss": -7.063899993896484, "global_step": 180833, "epoch": 4305} {"train_loss": -7.1437153816223145, "global_step": 180834, "epoch": 4305} {"train_loss": -7.038861274719238, "global_step": 180835, "epoch": 4305} {"train_loss": -7.110443115234375, "global_step": 180836, "epoch": 4305} {"train_loss": -6.9661359786987305, "global_step": 180837, "epoch": 4305} {"train_loss": -6.983529090881348, "global_step": 180838, "epoch": 4305} {"train_loss": -7.028727054595947, "global_step": 180839, "epoch": 4305} {"train_loss": -7.042747497558594, "global_step": 180840, "epoch": 4305} {"train_loss": -7.080366134643555, "global_step": 180841, "epoch": 4305} {"train_loss": -7.155426025390625, "global_step": 180842, "epoch": 4305} {"train_loss": -7.1161603927612305, "global_step": 180843, "epoch": 4305} {"train_loss": -7.067035675048828, "global_step": 180844, "epoch": 4305} {"train_loss": -7.053107261657715, "global_step": 180845, "epoch": 4305} {"train_loss": -7.114667892456055, "global_step": 180846, "epoch": 4305} {"train_loss": -6.957420349121094, "global_step": 180847, "epoch": 4305} {"train_loss": -7.0592851638793945, "global_step": 180848, "epoch": 4305} {"train_loss": -7.069360733032227, "global_step": 180849, "epoch": 4305} {"train_loss": -7.0566325187683105, "global_step": 180850, "epoch": 4305} {"train_loss": -7.029551449276152, "global_step": 180851, "epoch": 4305, "val_loss": 68750.359375} {"train_loss": -7.003506660461426, "global_step": 180852, "epoch": 4306} {"train_loss": -6.989716529846191, "global_step": 180853, "epoch": 4306} {"train_loss": -7.016170501708984, "global_step": 180854, "epoch": 4306} {"train_loss": -7.020705699920654, "global_step": 180855, "epoch": 4306} {"train_loss": -7.123842239379883, "global_step": 180856, "epoch": 4306} {"train_loss": -7.110996246337891, "global_step": 180857, "epoch": 4306} {"train_loss": -7.084606170654297, "global_step": 180858, "epoch": 4306} {"train_loss": -7.019235134124756, "global_step": 180859, "epoch": 4306} {"train_loss": -7.046464920043945, "global_step": 180860, "epoch": 4306} {"train_loss": -7.051760673522949, "global_step": 180861, "epoch": 4306} {"train_loss": -7.163663864135742, "global_step": 180862, "epoch": 4306} {"train_loss": -7.08846378326416, "global_step": 180863, "epoch": 4306} {"train_loss": -7.107531547546387, "global_step": 180864, "epoch": 4306} {"train_loss": -7.108465194702148, "global_step": 180865, "epoch": 4306} {"train_loss": -7.109978675842285, "global_step": 180866, "epoch": 4306} {"train_loss": -7.156772613525391, "global_step": 180867, "epoch": 4306} {"train_loss": -7.1472015380859375, "global_step": 180868, "epoch": 4306} {"train_loss": -7.0438127517700195, "global_step": 180869, "epoch": 4306} {"train_loss": -7.087560653686523, "global_step": 180870, "epoch": 4306} {"train_loss": -7.086859703063965, "global_step": 180871, "epoch": 4306} {"train_loss": -7.035943984985352, "global_step": 180872, "epoch": 4306} {"train_loss": -7.076050758361816, "global_step": 180873, "epoch": 4306} {"train_loss": -7.117496490478516, "global_step": 180874, "epoch": 4306} {"train_loss": -7.020853042602539, "global_step": 180875, "epoch": 4306} {"train_loss": -7.083674430847168, "global_step": 180876, "epoch": 4306} {"train_loss": -7.244155406951904, "global_step": 180877, "epoch": 4306} {"train_loss": -7.049314498901367, "global_step": 180878, "epoch": 4306} {"train_loss": -7.123575687408447, "global_step": 180879, "epoch": 4306} {"train_loss": -7.006552696228027, "global_step": 180880, "epoch": 4306} {"train_loss": -7.144916534423828, "global_step": 180881, "epoch": 4306} {"train_loss": -7.182533264160156, "global_step": 180882, "epoch": 4306} {"train_loss": -6.980123043060303, "global_step": 180883, "epoch": 4306} {"train_loss": -7.041498184204102, "global_step": 180884, "epoch": 4306} {"train_loss": -6.960892200469971, "global_step": 180885, "epoch": 4306} {"train_loss": -7.071283340454102, "global_step": 180886, "epoch": 4306} {"train_loss": -7.0940351486206055, "global_step": 180887, "epoch": 4306} {"train_loss": -7.045078754425049, "global_step": 180888, "epoch": 4306} {"train_loss": -7.1629228591918945, "global_step": 180889, "epoch": 4306} {"train_loss": -7.0582122802734375, "global_step": 180890, "epoch": 4306} {"train_loss": -7.215298175811768, "global_step": 180891, "epoch": 4306} {"train_loss": -7.057425022125244, "global_step": 180892, "epoch": 4306} {"train_loss": -7.080063059216454, "global_step": 180893, "epoch": 4306, "val_loss": 68808.171875} {"train_loss": -7.034544467926025, "global_step": 180894, "epoch": 4307} {"train_loss": -7.082024574279785, "global_step": 180895, "epoch": 4307} {"train_loss": -7.046391010284424, "global_step": 180896, "epoch": 4307} {"train_loss": -7.100906848907471, "global_step": 180897, "epoch": 4307} {"train_loss": -6.9850616455078125, "global_step": 180898, "epoch": 4307} {"train_loss": -7.020902156829834, "global_step": 180899, "epoch": 4307} {"train_loss": -7.0348992347717285, "global_step": 180900, "epoch": 4307} {"train_loss": -6.9236907958984375, "global_step": 180901, "epoch": 4307} {"train_loss": -6.912434101104736, "global_step": 180902, "epoch": 4307} {"train_loss": -7.032907962799072, "global_step": 180903, "epoch": 4307} {"train_loss": -6.732882499694824, "global_step": 180904, "epoch": 4307} {"train_loss": -6.965561389923096, "global_step": 180905, "epoch": 4307} {"train_loss": -6.791473865509033, "global_step": 180906, "epoch": 4307} {"train_loss": -6.823110580444336, "global_step": 180907, "epoch": 4307} {"train_loss": -7.007877349853516, "global_step": 180908, "epoch": 4307} {"train_loss": -6.9068450927734375, "global_step": 180909, "epoch": 4307} {"train_loss": -6.974998474121094, "global_step": 180910, "epoch": 4307} {"train_loss": -6.836607933044434, "global_step": 180911, "epoch": 4307} {"train_loss": -6.876706123352051, "global_step": 180912, "epoch": 4307} {"train_loss": -6.84515905380249, "global_step": 180913, "epoch": 4307} {"train_loss": -6.8214240074157715, "global_step": 180914, "epoch": 4307} {"train_loss": -6.891064167022705, "global_step": 180915, "epoch": 4307} {"train_loss": -6.922035217285156, "global_step": 180916, "epoch": 4307} {"train_loss": -6.910852432250977, "global_step": 180917, "epoch": 4307} {"train_loss": -6.935511112213135, "global_step": 180918, "epoch": 4307} {"train_loss": -6.845776557922363, "global_step": 180919, "epoch": 4307} {"train_loss": -6.90450382232666, "global_step": 180920, "epoch": 4307} {"train_loss": -6.9719038009643555, "global_step": 180921, "epoch": 4307} {"train_loss": -6.912431716918945, "global_step": 180922, "epoch": 4307} {"train_loss": -6.931177616119385, "global_step": 180923, "epoch": 4307} {"train_loss": -6.939968585968018, "global_step": 180924, "epoch": 4307} {"train_loss": -6.990583419799805, "global_step": 180925, "epoch": 4307} {"train_loss": -6.99940299987793, "global_step": 180926, "epoch": 4307} {"train_loss": -6.9810404777526855, "global_step": 180927, "epoch": 4307} {"train_loss": -7.109545707702637, "global_step": 180928, "epoch": 4307} {"train_loss": -7.04797887802124, "global_step": 180929, "epoch": 4307} {"train_loss": -6.986015319824219, "global_step": 180930, "epoch": 4307} {"train_loss": -6.937026023864746, "global_step": 180931, "epoch": 4307} {"train_loss": -7.000009536743164, "global_step": 180932, "epoch": 4307} {"train_loss": -6.9467453956604, "global_step": 180933, "epoch": 4307} {"train_loss": -7.010563850402832, "global_step": 180934, "epoch": 4307} {"train_loss": -6.949868520100911, "global_step": 180935, "epoch": 4307, "val_loss": 68849.9375} {"train_loss": -6.963713645935059, "global_step": 180936, "epoch": 4308} {"train_loss": -7.106184005737305, "global_step": 180937, "epoch": 4308} {"train_loss": -7.113771438598633, "global_step": 180938, "epoch": 4308} {"train_loss": -7.059260368347168, "global_step": 180939, "epoch": 4308} {"train_loss": -6.990151405334473, "global_step": 180940, "epoch": 4308} {"train_loss": -7.02156925201416, "global_step": 180941, "epoch": 4308} {"train_loss": -6.983547210693359, "global_step": 180942, "epoch": 4308} {"train_loss": -7.105108737945557, "global_step": 180943, "epoch": 4308} {"train_loss": -7.105440139770508, "global_step": 180944, "epoch": 4308} {"train_loss": -7.088886737823486, "global_step": 180945, "epoch": 4308} {"train_loss": -7.064291000366211, "global_step": 180946, "epoch": 4308} {"train_loss": -6.95229434967041, "global_step": 180947, "epoch": 4308} {"train_loss": -7.059816837310791, "global_step": 180948, "epoch": 4308} {"train_loss": -7.098337650299072, "global_step": 180949, "epoch": 4308} {"train_loss": -7.0064592361450195, "global_step": 180950, "epoch": 4308} {"train_loss": -7.070903778076172, "global_step": 180951, "epoch": 4308} {"train_loss": -7.053018569946289, "global_step": 180952, "epoch": 4308} {"train_loss": -7.068777084350586, "global_step": 180953, "epoch": 4308} {"train_loss": -7.098297119140625, "global_step": 180954, "epoch": 4308} {"train_loss": -7.214606761932373, "global_step": 180955, "epoch": 4308} {"train_loss": -7.0988969802856445, "global_step": 180956, "epoch": 4308} {"train_loss": -7.030054569244385, "global_step": 180957, "epoch": 4308} {"train_loss": -7.099921226501465, "global_step": 180958, "epoch": 4308} {"train_loss": -7.0541276931762695, "global_step": 180959, "epoch": 4308} {"train_loss": -7.016042232513428, "global_step": 180960, "epoch": 4308} {"train_loss": -7.078454971313477, "global_step": 180961, "epoch": 4308} {"train_loss": -7.183678150177002, "global_step": 180962, "epoch": 4308} {"train_loss": -6.922293663024902, "global_step": 180963, "epoch": 4308} {"train_loss": -7.073960304260254, "global_step": 180964, "epoch": 4308} {"train_loss": -7.077655792236328, "global_step": 180965, "epoch": 4308} {"train_loss": -6.935951232910156, "global_step": 180966, "epoch": 4308} {"train_loss": -7.058388710021973, "global_step": 180967, "epoch": 4308} {"train_loss": -6.9322309494018555, "global_step": 180968, "epoch": 4308} {"train_loss": -7.050510406494141, "global_step": 180969, "epoch": 4308} {"train_loss": -7.089250564575195, "global_step": 180970, "epoch": 4308} {"train_loss": -7.061764240264893, "global_step": 180971, "epoch": 4308} {"train_loss": -7.04494047164917, "global_step": 180972, "epoch": 4308} {"train_loss": -6.989433288574219, "global_step": 180973, "epoch": 4308} {"train_loss": -7.060629367828369, "global_step": 180974, "epoch": 4308} {"train_loss": -7.058030605316162, "global_step": 180975, "epoch": 4308} {"train_loss": -6.892326354980469, "global_step": 180976, "epoch": 4308} {"train_loss": -7.050438029425485, "global_step": 180977, "epoch": 4308, "val_loss": 68700.890625} {"train_loss": -7.002323150634766, "global_step": 180978, "epoch": 4309} {"train_loss": -7.138545036315918, "global_step": 180979, "epoch": 4309} {"train_loss": -7.020005226135254, "global_step": 180980, "epoch": 4309} {"train_loss": -7.010127067565918, "global_step": 180981, "epoch": 4309} {"train_loss": -7.035493850708008, "global_step": 180982, "epoch": 4309} {"train_loss": -7.018301486968994, "global_step": 180983, "epoch": 4309} {"train_loss": -7.020476341247559, "global_step": 180984, "epoch": 4309} {"train_loss": -7.056065559387207, "global_step": 180985, "epoch": 4309} {"train_loss": -7.170408248901367, "global_step": 180986, "epoch": 4309} {"train_loss": -6.948953628540039, "global_step": 180987, "epoch": 4309} {"train_loss": -7.060062408447266, "global_step": 180988, "epoch": 4309} {"train_loss": -7.014230728149414, "global_step": 180989, "epoch": 4309} {"train_loss": -7.0329484939575195, "global_step": 180990, "epoch": 4309} {"train_loss": -7.203108787536621, "global_step": 180991, "epoch": 4309} {"train_loss": -7.0480756759643555, "global_step": 180992, "epoch": 4309} {"train_loss": -7.048281669616699, "global_step": 180993, "epoch": 4309} {"train_loss": -7.149448871612549, "global_step": 180994, "epoch": 4309} {"train_loss": -7.004266738891602, "global_step": 180995, "epoch": 4309} {"train_loss": -7.116431713104248, "global_step": 180996, "epoch": 4309} {"train_loss": -7.0985589027404785, "global_step": 180997, "epoch": 4309} {"train_loss": -7.16213321685791, "global_step": 180998, "epoch": 4309} {"train_loss": -6.990813255310059, "global_step": 180999, "epoch": 4309} {"train_loss": -7.0457916259765625, "global_step": 181000, "epoch": 4309} {"train_loss": -7.098669528961182, "global_step": 181001, "epoch": 4309} {"train_loss": -7.088468551635742, "global_step": 181002, "epoch": 4309} {"train_loss": -7.095602989196777, "global_step": 181003, "epoch": 4309} {"train_loss": -7.046897888183594, "global_step": 181004, "epoch": 4309} {"train_loss": -7.143033981323242, "global_step": 181005, "epoch": 4309} {"train_loss": -7.072383880615234, "global_step": 181006, "epoch": 4309} {"train_loss": -7.08445930480957, "global_step": 181007, "epoch": 4309} {"train_loss": -7.251040935516357, "global_step": 181008, "epoch": 4309} {"train_loss": -7.164730072021484, "global_step": 181009, "epoch": 4309} {"train_loss": -7.058757305145264, "global_step": 181010, "epoch": 4309} {"train_loss": -7.115353107452393, "global_step": 181011, "epoch": 4309} {"train_loss": -7.135171890258789, "global_step": 181012, "epoch": 4309} {"train_loss": -7.150110244750977, "global_step": 181013, "epoch": 4309} {"train_loss": -7.07816219329834, "global_step": 181014, "epoch": 4309} {"train_loss": -7.0201311111450195, "global_step": 181015, "epoch": 4309} {"train_loss": -7.126350402832031, "global_step": 181016, "epoch": 4309} {"train_loss": -7.126252174377441, "global_step": 181017, "epoch": 4309} {"train_loss": -7.046714782714844, "global_step": 181018, "epoch": 4309} {"train_loss": -7.0809816519419355, "global_step": 181019, "epoch": 4309, "val_loss": 68809.5390625} {"train_loss": -7.114065170288086, "global_step": 181020, "epoch": 4310} {"train_loss": -7.143326282501221, "global_step": 181021, "epoch": 4310} {"train_loss": -6.963782787322998, "global_step": 181022, "epoch": 4310} {"train_loss": -7.105119705200195, "global_step": 181023, "epoch": 4310} {"train_loss": -6.921919822692871, "global_step": 181024, "epoch": 4310} {"train_loss": -7.129634857177734, "global_step": 181025, "epoch": 4310} {"train_loss": -7.223535537719727, "global_step": 181026, "epoch": 4310} {"train_loss": -7.002591133117676, "global_step": 181027, "epoch": 4310} {"train_loss": -7.153144836425781, "global_step": 181028, "epoch": 4310} {"train_loss": -7.123332977294922, "global_step": 181029, "epoch": 4310} {"train_loss": -7.100793838500977, "global_step": 181030, "epoch": 4310} {"train_loss": -7.073030471801758, "global_step": 181031, "epoch": 4310} {"train_loss": -7.134821891784668, "global_step": 181032, "epoch": 4310} {"train_loss": -7.143527984619141, "global_step": 181033, "epoch": 4310} {"train_loss": -7.035815238952637, "global_step": 181034, "epoch": 4310} {"train_loss": -7.049711227416992, "global_step": 181035, "epoch": 4310} {"train_loss": -7.062950134277344, "global_step": 181036, "epoch": 4310} {"train_loss": -6.958459854125977, "global_step": 181037, "epoch": 4310} {"train_loss": -7.2128095626831055, "global_step": 181038, "epoch": 4310} {"train_loss": -6.995447158813477, "global_step": 181039, "epoch": 4310} {"train_loss": -7.101234436035156, "global_step": 181040, "epoch": 4310} {"train_loss": -7.093674659729004, "global_step": 181041, "epoch": 4310} {"train_loss": -7.041163444519043, "global_step": 181042, "epoch": 4310} {"train_loss": -7.092883110046387, "global_step": 181043, "epoch": 4310} {"train_loss": -6.9158034324646, "global_step": 181044, "epoch": 4310} {"train_loss": -7.084634304046631, "global_step": 181045, "epoch": 4310} {"train_loss": -6.993566989898682, "global_step": 181046, "epoch": 4310} {"train_loss": -7.029651641845703, "global_step": 181047, "epoch": 4310} {"train_loss": -7.1050848960876465, "global_step": 181048, "epoch": 4310} {"train_loss": -6.868021011352539, "global_step": 181049, "epoch": 4310} {"train_loss": -7.029755592346191, "global_step": 181050, "epoch": 4310} {"train_loss": -6.938930988311768, "global_step": 181051, "epoch": 4310} {"train_loss": -7.006945610046387, "global_step": 181052, "epoch": 4310} {"train_loss": -6.975011825561523, "global_step": 181053, "epoch": 4310} {"train_loss": -6.859539985656738, "global_step": 181054, "epoch": 4310} {"train_loss": -7.033487319946289, "global_step": 181055, "epoch": 4310} {"train_loss": -6.863154411315918, "global_step": 181056, "epoch": 4310} {"train_loss": -6.9211859703063965, "global_step": 181057, "epoch": 4310} {"train_loss": -7.0002946853637695, "global_step": 181058, "epoch": 4310} {"train_loss": -7.0055928230285645, "global_step": 181059, "epoch": 4310} {"train_loss": -7.068234920501709, "global_step": 181060, "epoch": 4310} {"train_loss": -7.0394536427089145, "global_step": 181061, "epoch": 4310, "val_loss": 68682.5546875} {"train_loss": -7.01383638381958, "global_step": 181062, "epoch": 4311} {"train_loss": -7.080841064453125, "global_step": 181063, "epoch": 4311} {"train_loss": -6.990119457244873, "global_step": 181064, "epoch": 4311} {"train_loss": -7.14781379699707, "global_step": 181065, "epoch": 4311} {"train_loss": -6.982608795166016, "global_step": 181066, "epoch": 4311} {"train_loss": -6.946383476257324, "global_step": 181067, "epoch": 4311} {"train_loss": -6.9921875, "global_step": 181068, "epoch": 4311} {"train_loss": -7.22348165512085, "global_step": 181069, "epoch": 4311} {"train_loss": -7.086742401123047, "global_step": 181070, "epoch": 4311} {"train_loss": -7.031067848205566, "global_step": 181071, "epoch": 4311} {"train_loss": -7.045135974884033, "global_step": 181072, "epoch": 4311} {"train_loss": -7.156305313110352, "global_step": 181073, "epoch": 4311} {"train_loss": -6.955904960632324, "global_step": 181074, "epoch": 4311} {"train_loss": -6.895087242126465, "global_step": 181075, "epoch": 4311} {"train_loss": -6.921417236328125, "global_step": 181076, "epoch": 4311} {"train_loss": -7.032853126525879, "global_step": 181077, "epoch": 4311} {"train_loss": -6.943828582763672, "global_step": 181078, "epoch": 4311} {"train_loss": -7.078801155090332, "global_step": 181079, "epoch": 4311} {"train_loss": -6.978109359741211, "global_step": 181080, "epoch": 4311} {"train_loss": -7.022536277770996, "global_step": 181081, "epoch": 4311} {"train_loss": -7.03101921081543, "global_step": 181082, "epoch": 4311} {"train_loss": -7.067723274230957, "global_step": 181083, "epoch": 4311} {"train_loss": -7.086942195892334, "global_step": 181084, "epoch": 4311} {"train_loss": -6.993647575378418, "global_step": 181085, "epoch": 4311} {"train_loss": -6.96640682220459, "global_step": 181086, "epoch": 4311} {"train_loss": -7.013338088989258, "global_step": 181087, "epoch": 4311} {"train_loss": -7.087082862854004, "global_step": 181088, "epoch": 4311} {"train_loss": -7.10698127746582, "global_step": 181089, "epoch": 4311} {"train_loss": -7.052962303161621, "global_step": 181090, "epoch": 4311} {"train_loss": -7.047579288482666, "global_step": 181091, "epoch": 4311} {"train_loss": -6.96154260635376, "global_step": 181092, "epoch": 4311} {"train_loss": -7.08811092376709, "global_step": 181093, "epoch": 4311} {"train_loss": -7.021149635314941, "global_step": 181094, "epoch": 4311} {"train_loss": -7.070559501647949, "global_step": 181095, "epoch": 4311} {"train_loss": -7.151479721069336, "global_step": 181096, "epoch": 4311} {"train_loss": -7.082898139953613, "global_step": 181097, "epoch": 4311} {"train_loss": -7.000226974487305, "global_step": 181098, "epoch": 4311} {"train_loss": -7.044561862945557, "global_step": 181099, "epoch": 4311} {"train_loss": -7.0330400466918945, "global_step": 181100, "epoch": 4311} {"train_loss": -7.067874908447266, "global_step": 181101, "epoch": 4311} {"train_loss": -7.1253275871276855, "global_step": 181102, "epoch": 4311} {"train_loss": -7.038675535292852, "global_step": 181103, "epoch": 4311, "val_loss": 68647.5859375} {"train_loss": -7.148236274719238, "global_step": 181104, "epoch": 4312} {"train_loss": -7.062320709228516, "global_step": 181105, "epoch": 4312} {"train_loss": -6.824206829071045, "global_step": 181106, "epoch": 4312} {"train_loss": -6.925638675689697, "global_step": 181107, "epoch": 4312} {"train_loss": -7.118073463439941, "global_step": 181108, "epoch": 4312} {"train_loss": -7.034900188446045, "global_step": 181109, "epoch": 4312} {"train_loss": -7.072488307952881, "global_step": 181110, "epoch": 4312} {"train_loss": -7.086592674255371, "global_step": 181111, "epoch": 4312} {"train_loss": -6.965405464172363, "global_step": 181112, "epoch": 4312} {"train_loss": -7.088482856750488, "global_step": 181113, "epoch": 4312} {"train_loss": -7.076226234436035, "global_step": 181114, "epoch": 4312} {"train_loss": -7.09151029586792, "global_step": 181115, "epoch": 4312} {"train_loss": -7.16746187210083, "global_step": 181116, "epoch": 4312} {"train_loss": -7.005690574645996, "global_step": 181117, "epoch": 4312} {"train_loss": -7.04707145690918, "global_step": 181118, "epoch": 4312} {"train_loss": -7.1546831130981445, "global_step": 181119, "epoch": 4312} {"train_loss": -7.065062522888184, "global_step": 181120, "epoch": 4312} {"train_loss": -7.161335468292236, "global_step": 181121, "epoch": 4312} {"train_loss": -7.137629985809326, "global_step": 181122, "epoch": 4312} {"train_loss": -7.1519365310668945, "global_step": 181123, "epoch": 4312} {"train_loss": -7.08503532409668, "global_step": 181124, "epoch": 4312} {"train_loss": -7.175978660583496, "global_step": 181125, "epoch": 4312} {"train_loss": -7.038018703460693, "global_step": 181126, "epoch": 4312} {"train_loss": -7.160135746002197, "global_step": 181127, "epoch": 4312} {"train_loss": -7.054190635681152, "global_step": 181128, "epoch": 4312} {"train_loss": -7.105511665344238, "global_step": 181129, "epoch": 4312} {"train_loss": -7.115993499755859, "global_step": 181130, "epoch": 4312} {"train_loss": -6.970709323883057, "global_step": 181131, "epoch": 4312} {"train_loss": -6.970391750335693, "global_step": 181132, "epoch": 4312} {"train_loss": -7.038975715637207, "global_step": 181133, "epoch": 4312} {"train_loss": -7.02952766418457, "global_step": 181134, "epoch": 4312} {"train_loss": -7.221024990081787, "global_step": 181135, "epoch": 4312} {"train_loss": -7.040535926818848, "global_step": 181136, "epoch": 4312} {"train_loss": -7.178062915802002, "global_step": 181137, "epoch": 4312} {"train_loss": -7.143314838409424, "global_step": 181138, "epoch": 4312} {"train_loss": -7.091785430908203, "global_step": 181139, "epoch": 4312} {"train_loss": -7.105685234069824, "global_step": 181140, "epoch": 4312} {"train_loss": -7.068043231964111, "global_step": 181141, "epoch": 4312} {"train_loss": -7.106598854064941, "global_step": 181142, "epoch": 4312} {"train_loss": -7.0115861892700195, "global_step": 181143, "epoch": 4312} {"train_loss": -7.162820816040039, "global_step": 181144, "epoch": 4312} {"train_loss": -7.079060770216442, "global_step": 181145, "epoch": 4312, "val_loss": 68717.40625} {"train_loss": -7.216213226318359, "global_step": 181146, "epoch": 4313} {"train_loss": -7.062671661376953, "global_step": 181147, "epoch": 4313} {"train_loss": -7.152857780456543, "global_step": 181148, "epoch": 4313} {"train_loss": -7.096428871154785, "global_step": 181149, "epoch": 4313} {"train_loss": -6.988443374633789, "global_step": 181150, "epoch": 4313} {"train_loss": -7.143558979034424, "global_step": 181151, "epoch": 4313} {"train_loss": -7.0219597816467285, "global_step": 181152, "epoch": 4313} {"train_loss": -7.134387016296387, "global_step": 181153, "epoch": 4313} {"train_loss": -7.097070693969727, "global_step": 181154, "epoch": 4313} {"train_loss": -6.969376564025879, "global_step": 181155, "epoch": 4313} {"train_loss": -6.975815773010254, "global_step": 181156, "epoch": 4313} {"train_loss": -6.996904373168945, "global_step": 181157, "epoch": 4313} {"train_loss": -7.059735298156738, "global_step": 181158, "epoch": 4313} {"train_loss": -7.095274925231934, "global_step": 181159, "epoch": 4313} {"train_loss": -7.0332746505737305, "global_step": 181160, "epoch": 4313} {"train_loss": -7.09445858001709, "global_step": 181161, "epoch": 4313} {"train_loss": -7.055811882019043, "global_step": 181162, "epoch": 4313} {"train_loss": -7.013949394226074, "global_step": 181163, "epoch": 4313} {"train_loss": -7.068680763244629, "global_step": 181164, "epoch": 4313} {"train_loss": -7.148608207702637, "global_step": 181165, "epoch": 4313} {"train_loss": -7.061651229858398, "global_step": 181166, "epoch": 4313} {"train_loss": -7.119072437286377, "global_step": 181167, "epoch": 4313} {"train_loss": -7.047730445861816, "global_step": 181168, "epoch": 4313} {"train_loss": -6.987238883972168, "global_step": 181169, "epoch": 4313} {"train_loss": -7.1136088371276855, "global_step": 181170, "epoch": 4313} {"train_loss": -7.018394947052002, "global_step": 181171, "epoch": 4313} {"train_loss": -7.109612464904785, "global_step": 181172, "epoch": 4313} {"train_loss": -7.053860664367676, "global_step": 181173, "epoch": 4313} {"train_loss": -7.1071367263793945, "global_step": 181174, "epoch": 4313} {"train_loss": -7.1156158447265625, "global_step": 181175, "epoch": 4313} {"train_loss": -7.087996482849121, "global_step": 181176, "epoch": 4313} {"train_loss": -7.105271339416504, "global_step": 181177, "epoch": 4313} {"train_loss": -7.170172214508057, "global_step": 181178, "epoch": 4313} {"train_loss": -7.066534042358398, "global_step": 181179, "epoch": 4313} {"train_loss": -7.123546123504639, "global_step": 181180, "epoch": 4313} {"train_loss": -7.06004524230957, "global_step": 181181, "epoch": 4313} {"train_loss": -7.12858772277832, "global_step": 181182, "epoch": 4313} {"train_loss": -7.139588356018066, "global_step": 181183, "epoch": 4313} {"train_loss": -7.161966323852539, "global_step": 181184, "epoch": 4313} {"train_loss": -7.055998802185059, "global_step": 181185, "epoch": 4313} {"train_loss": -7.106898307800293, "global_step": 181186, "epoch": 4313} {"train_loss": -7.080154396238781, "global_step": 181187, "epoch": 4313, "val_loss": 68940.09375} {"train_loss": -7.166326999664307, "global_step": 181188, "epoch": 4314} {"train_loss": -7.158894062042236, "global_step": 181189, "epoch": 4314} {"train_loss": -7.001669883728027, "global_step": 181190, "epoch": 4314} {"train_loss": -7.163474082946777, "global_step": 181191, "epoch": 4314} {"train_loss": -7.029503345489502, "global_step": 181192, "epoch": 4314} {"train_loss": -7.096538543701172, "global_step": 181193, "epoch": 4314} {"train_loss": -7.134499549865723, "global_step": 181194, "epoch": 4314} {"train_loss": -7.057061195373535, "global_step": 181195, "epoch": 4314} {"train_loss": -7.128629684448242, "global_step": 181196, "epoch": 4314} {"train_loss": -6.955772399902344, "global_step": 181197, "epoch": 4314} {"train_loss": -7.164996147155762, "global_step": 181198, "epoch": 4314} {"train_loss": -6.956882953643799, "global_step": 181199, "epoch": 4314} {"train_loss": -7.136656761169434, "global_step": 181200, "epoch": 4314} {"train_loss": -7.004268169403076, "global_step": 181201, "epoch": 4314} {"train_loss": -7.077166557312012, "global_step": 181202, "epoch": 4314} {"train_loss": -7.06453800201416, "global_step": 181203, "epoch": 4314} {"train_loss": -6.970119953155518, "global_step": 181204, "epoch": 4314} {"train_loss": -7.128575325012207, "global_step": 181205, "epoch": 4314} {"train_loss": -7.044890403747559, "global_step": 181206, "epoch": 4314} {"train_loss": -7.116514682769775, "global_step": 181207, "epoch": 4314} {"train_loss": -7.025057792663574, "global_step": 181208, "epoch": 4314} {"train_loss": -7.083219528198242, "global_step": 181209, "epoch": 4314} {"train_loss": -7.176301002502441, "global_step": 181210, "epoch": 4314} {"train_loss": -7.0747785568237305, "global_step": 181211, "epoch": 4314} {"train_loss": -6.979272842407227, "global_step": 181212, "epoch": 4314} {"train_loss": -7.169507026672363, "global_step": 181213, "epoch": 4314} {"train_loss": -7.094180107116699, "global_step": 181214, "epoch": 4314} {"train_loss": -7.022915840148926, "global_step": 181215, "epoch": 4314} {"train_loss": -7.16290283203125, "global_step": 181216, "epoch": 4314} {"train_loss": -7.068361282348633, "global_step": 181217, "epoch": 4314} {"train_loss": -6.915770530700684, "global_step": 181218, "epoch": 4314} {"train_loss": -7.126622200012207, "global_step": 181219, "epoch": 4314} {"train_loss": -7.068076133728027, "global_step": 181220, "epoch": 4314} {"train_loss": -6.995223045349121, "global_step": 181221, "epoch": 4314} {"train_loss": -7.096619606018066, "global_step": 181222, "epoch": 4314} {"train_loss": -7.024904727935791, "global_step": 181223, "epoch": 4314} {"train_loss": -7.060590744018555, "global_step": 181224, "epoch": 4314} {"train_loss": -7.154147148132324, "global_step": 181225, "epoch": 4314} {"train_loss": -7.059659957885742, "global_step": 181226, "epoch": 4314} {"train_loss": -6.975953102111816, "global_step": 181227, "epoch": 4314} {"train_loss": -7.078878879547119, "global_step": 181228, "epoch": 4314} {"train_loss": -7.070196696690151, "global_step": 181229, "epoch": 4314, "val_loss": 68836.0625} {"train_loss": -7.010472297668457, "global_step": 181230, "epoch": 4315} {"train_loss": -7.024500846862793, "global_step": 181231, "epoch": 4315} {"train_loss": -7.16904354095459, "global_step": 181232, "epoch": 4315} {"train_loss": -7.008794784545898, "global_step": 181233, "epoch": 4315} {"train_loss": -7.08658504486084, "global_step": 181234, "epoch": 4315} {"train_loss": -7.092012405395508, "global_step": 181235, "epoch": 4315} {"train_loss": -7.1202287673950195, "global_step": 181236, "epoch": 4315} {"train_loss": -6.994973659515381, "global_step": 181237, "epoch": 4315} {"train_loss": -6.890301704406738, "global_step": 181238, "epoch": 4315} {"train_loss": -6.936592102050781, "global_step": 181239, "epoch": 4315} {"train_loss": -7.079958915710449, "global_step": 181240, "epoch": 4315} {"train_loss": -7.071022987365723, "global_step": 181241, "epoch": 4315} {"train_loss": -6.915858745574951, "global_step": 181242, "epoch": 4315} {"train_loss": -7.0792388916015625, "global_step": 181243, "epoch": 4315} {"train_loss": -7.03590202331543, "global_step": 181244, "epoch": 4315} {"train_loss": -7.149640083312988, "global_step": 181245, "epoch": 4315} {"train_loss": -7.107330322265625, "global_step": 181246, "epoch": 4315} {"train_loss": -7.038024425506592, "global_step": 181247, "epoch": 4315} {"train_loss": -7.1721038818359375, "global_step": 181248, "epoch": 4315} {"train_loss": -7.088428497314453, "global_step": 181249, "epoch": 4315} {"train_loss": -7.051275253295898, "global_step": 181250, "epoch": 4315} {"train_loss": -7.003063678741455, "global_step": 181251, "epoch": 4315} {"train_loss": -7.083103179931641, "global_step": 181252, "epoch": 4315} {"train_loss": -6.948357582092285, "global_step": 181253, "epoch": 4315} {"train_loss": -7.028898239135742, "global_step": 181254, "epoch": 4315} {"train_loss": -7.027559280395508, "global_step": 181255, "epoch": 4315} {"train_loss": -7.018611431121826, "global_step": 181256, "epoch": 4315} {"train_loss": -7.062917709350586, "global_step": 181257, "epoch": 4315} {"train_loss": -7.180328369140625, "global_step": 181258, "epoch": 4315} {"train_loss": -7.073652267456055, "global_step": 181259, "epoch": 4315} {"train_loss": -7.091082572937012, "global_step": 181260, "epoch": 4315} {"train_loss": -7.127015113830566, "global_step": 181261, "epoch": 4315} {"train_loss": -7.028646469116211, "global_step": 181262, "epoch": 4315} {"train_loss": -7.04831075668335, "global_step": 181263, "epoch": 4315} {"train_loss": -6.962689399719238, "global_step": 181264, "epoch": 4315} {"train_loss": -7.042425155639648, "global_step": 181265, "epoch": 4315} {"train_loss": -6.982110977172852, "global_step": 181266, "epoch": 4315} {"train_loss": -7.0601911544799805, "global_step": 181267, "epoch": 4315} {"train_loss": -7.030324935913086, "global_step": 181268, "epoch": 4315} {"train_loss": -6.982291221618652, "global_step": 181269, "epoch": 4315} {"train_loss": -7.01052188873291, "global_step": 181270, "epoch": 4315} {"train_loss": -7.046470426377796, "global_step": 181271, "epoch": 4315, "val_loss": 68949.109375} {"train_loss": -6.992588043212891, "global_step": 181272, "epoch": 4316} {"train_loss": -7.023050308227539, "global_step": 181273, "epoch": 4316} {"train_loss": -7.025927543640137, "global_step": 181274, "epoch": 4316} {"train_loss": -7.000675678253174, "global_step": 181275, "epoch": 4316} {"train_loss": -6.999201774597168, "global_step": 181276, "epoch": 4316} {"train_loss": -7.104821681976318, "global_step": 181277, "epoch": 4316} {"train_loss": -7.0031561851501465, "global_step": 181278, "epoch": 4316} {"train_loss": -7.014873504638672, "global_step": 181279, "epoch": 4316} {"train_loss": -7.042581558227539, "global_step": 181280, "epoch": 4316} {"train_loss": -7.046606540679932, "global_step": 181281, "epoch": 4316} {"train_loss": -6.979571342468262, "global_step": 181282, "epoch": 4316} {"train_loss": -7.0990400314331055, "global_step": 181283, "epoch": 4316} {"train_loss": -7.059237003326416, "global_step": 181284, "epoch": 4316} {"train_loss": -6.982412338256836, "global_step": 181285, "epoch": 4316} {"train_loss": -7.045424461364746, "global_step": 181286, "epoch": 4316} {"train_loss": -6.966605186462402, "global_step": 181287, "epoch": 4316} {"train_loss": -6.9744181632995605, "global_step": 181288, "epoch": 4316} {"train_loss": -7.043872833251953, "global_step": 181289, "epoch": 4316} {"train_loss": -6.987351417541504, "global_step": 181290, "epoch": 4316} {"train_loss": -6.895397186279297, "global_step": 181291, "epoch": 4316} {"train_loss": -7.067627906799316, "global_step": 181292, "epoch": 4316} {"train_loss": -6.901013374328613, "global_step": 181293, "epoch": 4316} {"train_loss": -7.067000865936279, "global_step": 181294, "epoch": 4316} {"train_loss": -7.1321024894714355, "global_step": 181295, "epoch": 4316} {"train_loss": -7.058860778808594, "global_step": 181296, "epoch": 4316} {"train_loss": -6.986246109008789, "global_step": 181297, "epoch": 4316} {"train_loss": -7.074746131896973, "global_step": 181298, "epoch": 4316} {"train_loss": -7.126375675201416, "global_step": 181299, "epoch": 4316} {"train_loss": -6.90330696105957, "global_step": 181300, "epoch": 4316} {"train_loss": -7.061160564422607, "global_step": 181301, "epoch": 4316} {"train_loss": -7.094972610473633, "global_step": 181302, "epoch": 4316} {"train_loss": -7.087597846984863, "global_step": 181303, "epoch": 4316} {"train_loss": -6.998857498168945, "global_step": 181304, "epoch": 4316} {"train_loss": -7.100072383880615, "global_step": 181305, "epoch": 4316} {"train_loss": -6.894796848297119, "global_step": 181306, "epoch": 4316} {"train_loss": -7.0013298988342285, "global_step": 181307, "epoch": 4316} {"train_loss": -7.190566062927246, "global_step": 181308, "epoch": 4316} {"train_loss": -6.972034931182861, "global_step": 181309, "epoch": 4316} {"train_loss": -7.016177654266357, "global_step": 181310, "epoch": 4316} {"train_loss": -7.001124382019043, "global_step": 181311, "epoch": 4316} {"train_loss": -7.027334213256836, "global_step": 181312, "epoch": 4316} {"train_loss": -7.026706366311936, "global_step": 181313, "epoch": 4316, "val_loss": 68889.4609375} {"train_loss": -7.098273277282715, "global_step": 181314, "epoch": 4317} {"train_loss": -7.069708824157715, "global_step": 181315, "epoch": 4317} {"train_loss": -6.967408180236816, "global_step": 181316, "epoch": 4317} {"train_loss": -7.149980068206787, "global_step": 181317, "epoch": 4317} {"train_loss": -7.059161186218262, "global_step": 181318, "epoch": 4317} {"train_loss": -7.035096645355225, "global_step": 181319, "epoch": 4317} {"train_loss": -7.202595233917236, "global_step": 181320, "epoch": 4317} {"train_loss": -7.055546283721924, "global_step": 181321, "epoch": 4317} {"train_loss": -7.066561222076416, "global_step": 181322, "epoch": 4317} {"train_loss": -7.136862277984619, "global_step": 181323, "epoch": 4317} {"train_loss": -7.109528541564941, "global_step": 181324, "epoch": 4317} {"train_loss": -7.077193260192871, "global_step": 181325, "epoch": 4317} {"train_loss": -7.2146430015563965, "global_step": 181326, "epoch": 4317} {"train_loss": -7.077497482299805, "global_step": 181327, "epoch": 4317} {"train_loss": -7.164581298828125, "global_step": 181328, "epoch": 4317} {"train_loss": -7.119268417358398, "global_step": 181329, "epoch": 4317} {"train_loss": -7.007226943969727, "global_step": 181330, "epoch": 4317} {"train_loss": -7.177831172943115, "global_step": 181331, "epoch": 4317} {"train_loss": -7.147936820983887, "global_step": 181332, "epoch": 4317} {"train_loss": -7.223570346832275, "global_step": 181333, "epoch": 4317} {"train_loss": -7.245655059814453, "global_step": 181334, "epoch": 4317} {"train_loss": -7.058128833770752, "global_step": 181335, "epoch": 4317} {"train_loss": -7.118123531341553, "global_step": 181336, "epoch": 4317} {"train_loss": -7.123239517211914, "global_step": 181337, "epoch": 4317} {"train_loss": -7.125308036804199, "global_step": 181338, "epoch": 4317} {"train_loss": -7.117059707641602, "global_step": 181339, "epoch": 4317} {"train_loss": -7.176837921142578, "global_step": 181340, "epoch": 4317} {"train_loss": -7.115989685058594, "global_step": 181341, "epoch": 4317} {"train_loss": -7.168600559234619, "global_step": 181342, "epoch": 4317} {"train_loss": -7.13176155090332, "global_step": 181343, "epoch": 4317} {"train_loss": -7.109956741333008, "global_step": 181344, "epoch": 4317} {"train_loss": -7.12193489074707, "global_step": 181345, "epoch": 4317} {"train_loss": -7.209437370300293, "global_step": 181346, "epoch": 4317} {"train_loss": -7.13994026184082, "global_step": 181347, "epoch": 4317} {"train_loss": -7.138995170593262, "global_step": 181348, "epoch": 4317} {"train_loss": -7.175053596496582, "global_step": 181349, "epoch": 4317} {"train_loss": -7.137295722961426, "global_step": 181350, "epoch": 4317} {"train_loss": -7.107611656188965, "global_step": 181351, "epoch": 4317} {"train_loss": -7.033937931060791, "global_step": 181352, "epoch": 4317} {"train_loss": -7.11832332611084, "global_step": 181353, "epoch": 4317} {"train_loss": -7.056073188781738, "global_step": 181354, "epoch": 4317} {"train_loss": -7.122238170532953, "global_step": 181355, "epoch": 4317, "val_loss": 68758.03125} {"train_loss": -7.1867523193359375, "global_step": 181356, "epoch": 4318} {"train_loss": -7.08191442489624, "global_step": 181357, "epoch": 4318} {"train_loss": -7.162336349487305, "global_step": 181358, "epoch": 4318} {"train_loss": -7.139791488647461, "global_step": 181359, "epoch": 4318} {"train_loss": -7.098455429077148, "global_step": 181360, "epoch": 4318} {"train_loss": -7.105475902557373, "global_step": 181361, "epoch": 4318} {"train_loss": -7.200976371765137, "global_step": 181362, "epoch": 4318} {"train_loss": -7.098028659820557, "global_step": 181363, "epoch": 4318} {"train_loss": -7.136905193328857, "global_step": 181364, "epoch": 4318} {"train_loss": -7.103377342224121, "global_step": 181365, "epoch": 4318} {"train_loss": -7.167055606842041, "global_step": 181366, "epoch": 4318} {"train_loss": -6.963375568389893, "global_step": 181367, "epoch": 4318} {"train_loss": -6.945405006408691, "global_step": 181368, "epoch": 4318} {"train_loss": -7.111352920532227, "global_step": 181369, "epoch": 4318} {"train_loss": -7.013725757598877, "global_step": 181370, "epoch": 4318} {"train_loss": -7.003664970397949, "global_step": 181371, "epoch": 4318} {"train_loss": -7.147112846374512, "global_step": 181372, "epoch": 4318} {"train_loss": -7.127486705780029, "global_step": 181373, "epoch": 4318} {"train_loss": -6.900129318237305, "global_step": 181374, "epoch": 4318} {"train_loss": -7.169546127319336, "global_step": 181375, "epoch": 4318} {"train_loss": -6.954595565795898, "global_step": 181376, "epoch": 4318} {"train_loss": -6.846238136291504, "global_step": 181377, "epoch": 4318} {"train_loss": -7.008644104003906, "global_step": 181378, "epoch": 4318} {"train_loss": -6.888558387756348, "global_step": 181379, "epoch": 4318} {"train_loss": -6.957077503204346, "global_step": 181380, "epoch": 4318} {"train_loss": -7.0869855880737305, "global_step": 181381, "epoch": 4318} {"train_loss": -6.916946887969971, "global_step": 181382, "epoch": 4318} {"train_loss": -7.057408332824707, "global_step": 181383, "epoch": 4318} {"train_loss": -7.0283331871032715, "global_step": 181384, "epoch": 4318} {"train_loss": -7.128875732421875, "global_step": 181385, "epoch": 4318} {"train_loss": -6.995306015014648, "global_step": 181386, "epoch": 4318} {"train_loss": -7.018075466156006, "global_step": 181387, "epoch": 4318} {"train_loss": -7.076316833496094, "global_step": 181388, "epoch": 4318} {"train_loss": -7.079285621643066, "global_step": 181389, "epoch": 4318} {"train_loss": -7.09876012802124, "global_step": 181390, "epoch": 4318} {"train_loss": -6.967302322387695, "global_step": 181391, "epoch": 4318} {"train_loss": -7.104413986206055, "global_step": 181392, "epoch": 4318} {"train_loss": -6.881869316101074, "global_step": 181393, "epoch": 4318} {"train_loss": -7.075067520141602, "global_step": 181394, "epoch": 4318} {"train_loss": -7.056413173675537, "global_step": 181395, "epoch": 4318} {"train_loss": -6.96397590637207, "global_step": 181396, "epoch": 4318} {"train_loss": -7.051717156455631, "global_step": 181397, "epoch": 4318, "val_loss": 68886.734375} {"train_loss": -7.140763282775879, "global_step": 181398, "epoch": 4319} {"train_loss": -6.933635711669922, "global_step": 181399, "epoch": 4319} {"train_loss": -7.120428085327148, "global_step": 181400, "epoch": 4319} {"train_loss": -7.066621780395508, "global_step": 181401, "epoch": 4319} {"train_loss": -7.019478797912598, "global_step": 181402, "epoch": 4319} {"train_loss": -7.133334636688232, "global_step": 181403, "epoch": 4319} {"train_loss": -7.192785263061523, "global_step": 181404, "epoch": 4319} {"train_loss": -7.118100643157959, "global_step": 181405, "epoch": 4319} {"train_loss": -6.991520881652832, "global_step": 181406, "epoch": 4319} {"train_loss": -7.135065078735352, "global_step": 181407, "epoch": 4319} {"train_loss": -6.95384407043457, "global_step": 181408, "epoch": 4319} {"train_loss": -7.04152250289917, "global_step": 181409, "epoch": 4319} {"train_loss": -7.161172866821289, "global_step": 181410, "epoch": 4319} {"train_loss": -7.092325210571289, "global_step": 181411, "epoch": 4319} {"train_loss": -7.121494293212891, "global_step": 181412, "epoch": 4319} {"train_loss": -7.124301910400391, "global_step": 181413, "epoch": 4319} {"train_loss": -7.0612897872924805, "global_step": 181414, "epoch": 4319} {"train_loss": -6.967956066131592, "global_step": 181415, "epoch": 4319} {"train_loss": -7.0933732986450195, "global_step": 181416, "epoch": 4319} {"train_loss": -7.0658464431762695, "global_step": 181417, "epoch": 4319} {"train_loss": -6.961499214172363, "global_step": 181418, "epoch": 4319} {"train_loss": -7.001758575439453, "global_step": 181419, "epoch": 4319} {"train_loss": -6.9964213371276855, "global_step": 181420, "epoch": 4319} {"train_loss": -7.130462646484375, "global_step": 181421, "epoch": 4319} {"train_loss": -7.00912618637085, "global_step": 181422, "epoch": 4319} {"train_loss": -7.002652645111084, "global_step": 181423, "epoch": 4319} {"train_loss": -6.992256164550781, "global_step": 181424, "epoch": 4319} {"train_loss": -7.079327583312988, "global_step": 181425, "epoch": 4319} {"train_loss": -6.92225456237793, "global_step": 181426, "epoch": 4319} {"train_loss": -7.025368690490723, "global_step": 181427, "epoch": 4319} {"train_loss": -7.034985065460205, "global_step": 181428, "epoch": 4319} {"train_loss": -7.151844024658203, "global_step": 181429, "epoch": 4319} {"train_loss": -7.086204528808594, "global_step": 181430, "epoch": 4319} {"train_loss": -7.053010940551758, "global_step": 181431, "epoch": 4319} {"train_loss": -7.03035831451416, "global_step": 181432, "epoch": 4319} {"train_loss": -7.062984466552734, "global_step": 181433, "epoch": 4319} {"train_loss": -7.083539009094238, "global_step": 181434, "epoch": 4319} {"train_loss": -7.0571770668029785, "global_step": 181435, "epoch": 4319} {"train_loss": -7.002261638641357, "global_step": 181436, "epoch": 4319} {"train_loss": -7.115029335021973, "global_step": 181437, "epoch": 4319} {"train_loss": -7.041543960571289, "global_step": 181438, "epoch": 4319} {"train_loss": -7.056388559795561, "global_step": 181439, "epoch": 4319, "val_loss": 68602.0078125} {"train_loss": -6.990207672119141, "global_step": 181440, "epoch": 4320} {"train_loss": -7.000284194946289, "global_step": 181441, "epoch": 4320} {"train_loss": -7.09393310546875, "global_step": 181442, "epoch": 4320} {"train_loss": -7.030620098114014, "global_step": 181443, "epoch": 4320} {"train_loss": -7.052544116973877, "global_step": 181444, "epoch": 4320} {"train_loss": -7.083406925201416, "global_step": 181445, "epoch": 4320} {"train_loss": -7.017719745635986, "global_step": 181446, "epoch": 4320} {"train_loss": -7.097393035888672, "global_step": 181447, "epoch": 4320} {"train_loss": -7.111269950866699, "global_step": 181448, "epoch": 4320} {"train_loss": -7.082066059112549, "global_step": 181449, "epoch": 4320} {"train_loss": -7.045846462249756, "global_step": 181450, "epoch": 4320} {"train_loss": -7.061068534851074, "global_step": 181451, "epoch": 4320} {"train_loss": -7.10697603225708, "global_step": 181452, "epoch": 4320} {"train_loss": -7.051392078399658, "global_step": 181453, "epoch": 4320} {"train_loss": -7.036738395690918, "global_step": 181454, "epoch": 4320} {"train_loss": -7.021920204162598, "global_step": 181455, "epoch": 4320} {"train_loss": -7.099963665008545, "global_step": 181456, "epoch": 4320} {"train_loss": -7.048799991607666, "global_step": 181457, "epoch": 4320} {"train_loss": -7.0343427658081055, "global_step": 181458, "epoch": 4320} {"train_loss": -7.126371383666992, "global_step": 181459, "epoch": 4320} {"train_loss": -7.086174964904785, "global_step": 181460, "epoch": 4320} {"train_loss": -7.128233909606934, "global_step": 181461, "epoch": 4320} {"train_loss": -7.082649230957031, "global_step": 181462, "epoch": 4320} {"train_loss": -7.149637222290039, "global_step": 181463, "epoch": 4320} {"train_loss": -7.134980201721191, "global_step": 181464, "epoch": 4320} {"train_loss": -7.21549129486084, "global_step": 181465, "epoch": 4320} {"train_loss": -6.960402011871338, "global_step": 181466, "epoch": 4320} {"train_loss": -7.089207649230957, "global_step": 181467, "epoch": 4320} {"train_loss": -7.166388511657715, "global_step": 181468, "epoch": 4320} {"train_loss": -7.217935562133789, "global_step": 181469, "epoch": 4320} {"train_loss": -7.169618129730225, "global_step": 181470, "epoch": 4320} {"train_loss": -7.1729841232299805, "global_step": 181471, "epoch": 4320} {"train_loss": -7.108409881591797, "global_step": 181472, "epoch": 4320} {"train_loss": -7.1416192054748535, "global_step": 181473, "epoch": 4320} {"train_loss": -7.00621223449707, "global_step": 181474, "epoch": 4320} {"train_loss": -7.1673784255981445, "global_step": 181475, "epoch": 4320} {"train_loss": -7.143671989440918, "global_step": 181476, "epoch": 4320} {"train_loss": -7.011553764343262, "global_step": 181477, "epoch": 4320} {"train_loss": -7.211734771728516, "global_step": 181478, "epoch": 4320} {"train_loss": -7.107189178466797, "global_step": 181479, "epoch": 4320} {"train_loss": -7.1683735847473145, "global_step": 181480, "epoch": 4320} {"train_loss": -7.093679042089553, "global_step": 181481, "epoch": 4320, "val_loss": 68577.71875} {"train_loss": -7.135869026184082, "global_step": 181482, "epoch": 4321} {"train_loss": -7.224480152130127, "global_step": 181483, "epoch": 4321} {"train_loss": -7.074095249176025, "global_step": 181484, "epoch": 4321} {"train_loss": -7.202918529510498, "global_step": 181485, "epoch": 4321} {"train_loss": -7.122707843780518, "global_step": 181486, "epoch": 4321} {"train_loss": -7.142244815826416, "global_step": 181487, "epoch": 4321} {"train_loss": -7.209401607513428, "global_step": 181488, "epoch": 4321} {"train_loss": -7.071172714233398, "global_step": 181489, "epoch": 4321} {"train_loss": -7.226390838623047, "global_step": 181490, "epoch": 4321} {"train_loss": -7.17317008972168, "global_step": 181491, "epoch": 4321} {"train_loss": -7.084038257598877, "global_step": 181492, "epoch": 4321} {"train_loss": -7.1402482986450195, "global_step": 181493, "epoch": 4321} {"train_loss": -7.129426956176758, "global_step": 181494, "epoch": 4321} {"train_loss": -7.080626487731934, "global_step": 181495, "epoch": 4321} {"train_loss": -7.17571496963501, "global_step": 181496, "epoch": 4321} {"train_loss": -7.160493850708008, "global_step": 181497, "epoch": 4321} {"train_loss": -7.056859016418457, "global_step": 181498, "epoch": 4321} {"train_loss": -7.135517597198486, "global_step": 181499, "epoch": 4321} {"train_loss": -7.067103385925293, "global_step": 181500, "epoch": 4321} {"train_loss": -7.108186721801758, "global_step": 181501, "epoch": 4321} {"train_loss": -7.147980690002441, "global_step": 181502, "epoch": 4321} {"train_loss": -7.0509562492370605, "global_step": 181503, "epoch": 4321} {"train_loss": -7.106048107147217, "global_step": 181504, "epoch": 4321} {"train_loss": -7.121608257293701, "global_step": 181505, "epoch": 4321} {"train_loss": -7.12095832824707, "global_step": 181506, "epoch": 4321} {"train_loss": -7.071352005004883, "global_step": 181507, "epoch": 4321} {"train_loss": -7.096221923828125, "global_step": 181508, "epoch": 4321} {"train_loss": -7.030300140380859, "global_step": 181509, "epoch": 4321} {"train_loss": -7.056098461151123, "global_step": 181510, "epoch": 4321} {"train_loss": -7.02706241607666, "global_step": 181511, "epoch": 4321} {"train_loss": -7.145956039428711, "global_step": 181512, "epoch": 4321} {"train_loss": -7.098006248474121, "global_step": 181513, "epoch": 4321} {"train_loss": -7.030954360961914, "global_step": 181514, "epoch": 4321} {"train_loss": -7.066911697387695, "global_step": 181515, "epoch": 4321} {"train_loss": -7.084460258483887, "global_step": 181516, "epoch": 4321} {"train_loss": -7.066716194152832, "global_step": 181517, "epoch": 4321} {"train_loss": -6.991585731506348, "global_step": 181518, "epoch": 4321} {"train_loss": -7.011318683624268, "global_step": 181519, "epoch": 4321} {"train_loss": -7.009403705596924, "global_step": 181520, "epoch": 4321} {"train_loss": -7.015559196472168, "global_step": 181521, "epoch": 4321} {"train_loss": -7.162302494049072, "global_step": 181522, "epoch": 4321} {"train_loss": -7.102836756479173, "global_step": 181523, "epoch": 4321, "val_loss": 68696.890625} {"train_loss": -7.124152183532715, "global_step": 181524, "epoch": 4322} {"train_loss": -6.9912543296813965, "global_step": 181525, "epoch": 4322} {"train_loss": -7.105618476867676, "global_step": 181526, "epoch": 4322} {"train_loss": -7.147650718688965, "global_step": 181527, "epoch": 4322} {"train_loss": -6.963311195373535, "global_step": 181528, "epoch": 4322} {"train_loss": -6.967756271362305, "global_step": 181529, "epoch": 4322} {"train_loss": -6.989040374755859, "global_step": 181530, "epoch": 4322} {"train_loss": -7.076519012451172, "global_step": 181531, "epoch": 4322} {"train_loss": -6.956048965454102, "global_step": 181532, "epoch": 4322} {"train_loss": -7.073036193847656, "global_step": 181533, "epoch": 4322} {"train_loss": -7.002089500427246, "global_step": 181534, "epoch": 4322} {"train_loss": -7.105030059814453, "global_step": 181535, "epoch": 4322} {"train_loss": -7.078521251678467, "global_step": 181536, "epoch": 4322} {"train_loss": -7.1283860206604, "global_step": 181537, "epoch": 4322} {"train_loss": -7.03757905960083, "global_step": 181538, "epoch": 4322} {"train_loss": -7.052078723907471, "global_step": 181539, "epoch": 4322} {"train_loss": -7.0635881423950195, "global_step": 181540, "epoch": 4322} {"train_loss": -7.079990386962891, "global_step": 181541, "epoch": 4322} {"train_loss": -7.043570518493652, "global_step": 181542, "epoch": 4322} {"train_loss": -7.075056076049805, "global_step": 181543, "epoch": 4322} {"train_loss": -7.064637184143066, "global_step": 181544, "epoch": 4322} {"train_loss": -7.171813011169434, "global_step": 181545, "epoch": 4322} {"train_loss": -7.010991096496582, "global_step": 181546, "epoch": 4322} {"train_loss": -7.039084434509277, "global_step": 181547, "epoch": 4322} {"train_loss": -7.0956220626831055, "global_step": 181548, "epoch": 4322} {"train_loss": -6.968719482421875, "global_step": 181549, "epoch": 4322} {"train_loss": -7.07425594329834, "global_step": 181550, "epoch": 4322} {"train_loss": -7.058391571044922, "global_step": 181551, "epoch": 4322} {"train_loss": -7.14509391784668, "global_step": 181552, "epoch": 4322} {"train_loss": -7.050288200378418, "global_step": 181553, "epoch": 4322} {"train_loss": -6.997864723205566, "global_step": 181554, "epoch": 4322} {"train_loss": -7.1279168128967285, "global_step": 181555, "epoch": 4322} {"train_loss": -7.018696308135986, "global_step": 181556, "epoch": 4322} {"train_loss": -7.0555572509765625, "global_step": 181557, "epoch": 4322} {"train_loss": -6.882646560668945, "global_step": 181558, "epoch": 4322} {"train_loss": -7.049623012542725, "global_step": 181559, "epoch": 4322} {"train_loss": -6.9809064865112305, "global_step": 181560, "epoch": 4322} {"train_loss": -7.10231876373291, "global_step": 181561, "epoch": 4322} {"train_loss": -6.9240498542785645, "global_step": 181562, "epoch": 4322} {"train_loss": -7.020503997802734, "global_step": 181563, "epoch": 4322} {"train_loss": -7.014487266540527, "global_step": 181564, "epoch": 4322} {"train_loss": -7.044989199865432, "global_step": 181565, "epoch": 4322, "val_loss": 68892.6484375} {"train_loss": -7.039728164672852, "global_step": 181566, "epoch": 4323} {"train_loss": -6.942781448364258, "global_step": 181567, "epoch": 4323} {"train_loss": -7.010129451751709, "global_step": 181568, "epoch": 4323} {"train_loss": -6.96694278717041, "global_step": 181569, "epoch": 4323} {"train_loss": -7.143902778625488, "global_step": 181570, "epoch": 4323} {"train_loss": -7.083605766296387, "global_step": 181571, "epoch": 4323} {"train_loss": -6.99125337600708, "global_step": 181572, "epoch": 4323} {"train_loss": -6.975545406341553, "global_step": 181573, "epoch": 4323} {"train_loss": -6.95121955871582, "global_step": 181574, "epoch": 4323} {"train_loss": -7.078958988189697, "global_step": 181575, "epoch": 4323} {"train_loss": -6.99353551864624, "global_step": 181576, "epoch": 4323} {"train_loss": -7.081806182861328, "global_step": 181577, "epoch": 4323} {"train_loss": -7.062342643737793, "global_step": 181578, "epoch": 4323} {"train_loss": -7.113607406616211, "global_step": 181579, "epoch": 4323} {"train_loss": -7.054227828979492, "global_step": 181580, "epoch": 4323} {"train_loss": -6.9710187911987305, "global_step": 181581, "epoch": 4323} {"train_loss": -7.021559715270996, "global_step": 181582, "epoch": 4323} {"train_loss": -7.095376014709473, "global_step": 181583, "epoch": 4323} {"train_loss": -7.1102190017700195, "global_step": 181584, "epoch": 4323} {"train_loss": -6.950075149536133, "global_step": 181585, "epoch": 4323} {"train_loss": -7.051197528839111, "global_step": 181586, "epoch": 4323} {"train_loss": -7.138335227966309, "global_step": 181587, "epoch": 4323} {"train_loss": -7.009653568267822, "global_step": 181588, "epoch": 4323} {"train_loss": -6.9508771896362305, "global_step": 181589, "epoch": 4323} {"train_loss": -6.978811740875244, "global_step": 181590, "epoch": 4323} {"train_loss": -7.001431465148926, "global_step": 181591, "epoch": 4323} {"train_loss": -7.057744979858398, "global_step": 181592, "epoch": 4323} {"train_loss": -7.025992393493652, "global_step": 181593, "epoch": 4323} {"train_loss": -6.90308952331543, "global_step": 181594, "epoch": 4323} {"train_loss": -6.787755966186523, "global_step": 181595, "epoch": 4323} {"train_loss": -7.094884872436523, "global_step": 181596, "epoch": 4323} {"train_loss": -6.842931747436523, "global_step": 181597, "epoch": 4323} {"train_loss": -6.807961940765381, "global_step": 181598, "epoch": 4323} {"train_loss": -7.015381336212158, "global_step": 181599, "epoch": 4323} {"train_loss": -6.800481796264648, "global_step": 181600, "epoch": 4323} {"train_loss": -6.800366401672363, "global_step": 181601, "epoch": 4323} {"train_loss": -6.969210624694824, "global_step": 181602, "epoch": 4323} {"train_loss": -6.839239120483398, "global_step": 181603, "epoch": 4323} {"train_loss": -6.946898460388184, "global_step": 181604, "epoch": 4323} {"train_loss": -6.68257999420166, "global_step": 181605, "epoch": 4323} {"train_loss": -6.933414936065674, "global_step": 181606, "epoch": 4323} {"train_loss": -6.980527696155367, "global_step": 181607, "epoch": 4323, "val_loss": 68661.1640625} {"train_loss": -6.975882053375244, "global_step": 181608, "epoch": 4324} {"train_loss": -6.831476211547852, "global_step": 181609, "epoch": 4324} {"train_loss": -7.018449306488037, "global_step": 181610, "epoch": 4324} {"train_loss": -6.968482971191406, "global_step": 181611, "epoch": 4324} {"train_loss": -6.944799423217773, "global_step": 181612, "epoch": 4324} {"train_loss": -6.929116249084473, "global_step": 181613, "epoch": 4324} {"train_loss": -6.975170135498047, "global_step": 181614, "epoch": 4324} {"train_loss": -6.8139424324035645, "global_step": 181615, "epoch": 4324} {"train_loss": -7.0159759521484375, "global_step": 181616, "epoch": 4324} {"train_loss": -6.88450813293457, "global_step": 181617, "epoch": 4324} {"train_loss": -7.003569602966309, "global_step": 181618, "epoch": 4324} {"train_loss": -7.0364227294921875, "global_step": 181619, "epoch": 4324} {"train_loss": -6.952071189880371, "global_step": 181620, "epoch": 4324} {"train_loss": -6.904301643371582, "global_step": 181621, "epoch": 4324} {"train_loss": -7.08597469329834, "global_step": 181622, "epoch": 4324} {"train_loss": -7.0728302001953125, "global_step": 181623, "epoch": 4324} {"train_loss": -7.158843517303467, "global_step": 181624, "epoch": 4324} {"train_loss": -6.9864397048950195, "global_step": 181625, "epoch": 4324} {"train_loss": -7.046396255493164, "global_step": 181626, "epoch": 4324} {"train_loss": -7.044472694396973, "global_step": 181627, "epoch": 4324} {"train_loss": -7.048583984375, "global_step": 181628, "epoch": 4324} {"train_loss": -7.102297306060791, "global_step": 181629, "epoch": 4324} {"train_loss": -7.033166885375977, "global_step": 181630, "epoch": 4324} {"train_loss": -7.107517719268799, "global_step": 181631, "epoch": 4324} {"train_loss": -7.06199836730957, "global_step": 181632, "epoch": 4324} {"train_loss": -7.122452735900879, "global_step": 181633, "epoch": 4324} {"train_loss": -7.07800817489624, "global_step": 181634, "epoch": 4324} {"train_loss": -7.207232475280762, "global_step": 181635, "epoch": 4324} {"train_loss": -7.171483993530273, "global_step": 181636, "epoch": 4324} {"train_loss": -7.219037055969238, "global_step": 181637, "epoch": 4324} {"train_loss": -7.140659332275391, "global_step": 181638, "epoch": 4324} {"train_loss": -7.194275856018066, "global_step": 181639, "epoch": 4324} {"train_loss": -7.153825759887695, "global_step": 181640, "epoch": 4324} {"train_loss": -7.0582356452941895, "global_step": 181641, "epoch": 4324} {"train_loss": -7.146858215332031, "global_step": 181642, "epoch": 4324} {"train_loss": -7.160433769226074, "global_step": 181643, "epoch": 4324} {"train_loss": -7.142457962036133, "global_step": 181644, "epoch": 4324} {"train_loss": -7.062013626098633, "global_step": 181645, "epoch": 4324} {"train_loss": -7.118741035461426, "global_step": 181646, "epoch": 4324} {"train_loss": -7.092844009399414, "global_step": 181647, "epoch": 4324} {"train_loss": -7.110372066497803, "global_step": 181648, "epoch": 4324} {"train_loss": -7.057482356116886, "global_step": 181649, "epoch": 4324, "val_loss": 68737.71875} {"train_loss": -7.159397125244141, "global_step": 181650, "epoch": 4325} {"train_loss": -7.097935676574707, "global_step": 181651, "epoch": 4325} {"train_loss": -7.164822101593018, "global_step": 181652, "epoch": 4325} {"train_loss": -7.173386096954346, "global_step": 181653, "epoch": 4325} {"train_loss": -7.126953125, "global_step": 181654, "epoch": 4325} {"train_loss": -7.143317222595215, "global_step": 181655, "epoch": 4325} {"train_loss": -7.0568952560424805, "global_step": 181656, "epoch": 4325} {"train_loss": -7.130378246307373, "global_step": 181657, "epoch": 4325} {"train_loss": -6.97633171081543, "global_step": 181658, "epoch": 4325} {"train_loss": -7.227656364440918, "global_step": 181659, "epoch": 4325} {"train_loss": -7.227875232696533, "global_step": 181660, "epoch": 4325} {"train_loss": -7.1800150871276855, "global_step": 181661, "epoch": 4325} {"train_loss": -7.158394813537598, "global_step": 181662, "epoch": 4325} {"train_loss": -7.142733097076416, "global_step": 181663, "epoch": 4325} {"train_loss": -7.163771629333496, "global_step": 181664, "epoch": 4325} {"train_loss": -7.094653129577637, "global_step": 181665, "epoch": 4325} {"train_loss": -7.1410322189331055, "global_step": 181666, "epoch": 4325} {"train_loss": -7.075099468231201, "global_step": 181667, "epoch": 4325} {"train_loss": -6.978689193725586, "global_step": 181668, "epoch": 4325} {"train_loss": -7.1587677001953125, "global_step": 181669, "epoch": 4325} {"train_loss": -7.132794380187988, "global_step": 181670, "epoch": 4325} {"train_loss": -7.055453300476074, "global_step": 181671, "epoch": 4325} {"train_loss": -6.996588230133057, "global_step": 181672, "epoch": 4325} {"train_loss": -7.199843406677246, "global_step": 181673, "epoch": 4325} {"train_loss": -7.095772743225098, "global_step": 181674, "epoch": 4325} {"train_loss": -7.086418151855469, "global_step": 181675, "epoch": 4325} {"train_loss": -7.043046951293945, "global_step": 181676, "epoch": 4325} {"train_loss": -7.041431427001953, "global_step": 181677, "epoch": 4325} {"train_loss": -6.993772983551025, "global_step": 181678, "epoch": 4325} {"train_loss": -7.14885139465332, "global_step": 181679, "epoch": 4325} {"train_loss": -7.046839237213135, "global_step": 181680, "epoch": 4325} {"train_loss": -7.022495269775391, "global_step": 181681, "epoch": 4325} {"train_loss": -7.124330520629883, "global_step": 181682, "epoch": 4325} {"train_loss": -7.1214599609375, "global_step": 181683, "epoch": 4325} {"train_loss": -7.1668701171875, "global_step": 181684, "epoch": 4325} {"train_loss": -7.054370880126953, "global_step": 181685, "epoch": 4325} {"train_loss": -7.025322914123535, "global_step": 181686, "epoch": 4325} {"train_loss": -7.010036468505859, "global_step": 181687, "epoch": 4325} {"train_loss": -7.172299385070801, "global_step": 181688, "epoch": 4325} {"train_loss": -7.052250385284424, "global_step": 181689, "epoch": 4325} {"train_loss": -7.088192462921143, "global_step": 181690, "epoch": 4325} {"train_loss": -7.103246859141758, "global_step": 181691, "epoch": 4325, "val_loss": 68755.9453125} {"train_loss": -7.048509120941162, "global_step": 181692, "epoch": 4326} {"train_loss": -7.013112545013428, "global_step": 181693, "epoch": 4326} {"train_loss": -7.153971195220947, "global_step": 181694, "epoch": 4326} {"train_loss": -7.127987861633301, "global_step": 181695, "epoch": 4326} {"train_loss": -6.965799331665039, "global_step": 181696, "epoch": 4326} {"train_loss": -7.082211494445801, "global_step": 181697, "epoch": 4326} {"train_loss": -7.019467353820801, "global_step": 181698, "epoch": 4326} {"train_loss": -7.060043811798096, "global_step": 181699, "epoch": 4326} {"train_loss": -7.031795024871826, "global_step": 181700, "epoch": 4326} {"train_loss": -7.069890975952148, "global_step": 181701, "epoch": 4326} {"train_loss": -6.992089748382568, "global_step": 181702, "epoch": 4326} {"train_loss": -7.008178234100342, "global_step": 181703, "epoch": 4326} {"train_loss": -6.9982476234436035, "global_step": 181704, "epoch": 4326} {"train_loss": -7.00923490524292, "global_step": 181705, "epoch": 4326} {"train_loss": -7.14589786529541, "global_step": 181706, "epoch": 4326} {"train_loss": -7.088780403137207, "global_step": 181707, "epoch": 4326} {"train_loss": -7.142984390258789, "global_step": 181708, "epoch": 4326} {"train_loss": -7.011861801147461, "global_step": 181709, "epoch": 4326} {"train_loss": -7.128323078155518, "global_step": 181710, "epoch": 4326} {"train_loss": -7.044145584106445, "global_step": 181711, "epoch": 4326} {"train_loss": -6.9990386962890625, "global_step": 181712, "epoch": 4326} {"train_loss": -7.0427680015563965, "global_step": 181713, "epoch": 4326} {"train_loss": -7.001382827758789, "global_step": 181714, "epoch": 4326} {"train_loss": -7.197622299194336, "global_step": 181715, "epoch": 4326} {"train_loss": -7.143226623535156, "global_step": 181716, "epoch": 4326} {"train_loss": -7.09345817565918, "global_step": 181717, "epoch": 4326} {"train_loss": -7.1108808517456055, "global_step": 181718, "epoch": 4326} {"train_loss": -6.924855709075928, "global_step": 181719, "epoch": 4326} {"train_loss": -7.203897953033447, "global_step": 181720, "epoch": 4326} {"train_loss": -7.049848556518555, "global_step": 181721, "epoch": 4326} {"train_loss": -7.0144195556640625, "global_step": 181722, "epoch": 4326} {"train_loss": -7.029675483703613, "global_step": 181723, "epoch": 4326} {"train_loss": -7.0805559158325195, "global_step": 181724, "epoch": 4326} {"train_loss": -7.1280317306518555, "global_step": 181725, "epoch": 4326} {"train_loss": -7.1121416091918945, "global_step": 181726, "epoch": 4326} {"train_loss": -7.203871726989746, "global_step": 181727, "epoch": 4326} {"train_loss": -7.149248123168945, "global_step": 181728, "epoch": 4326} {"train_loss": -7.066009521484375, "global_step": 181729, "epoch": 4326} {"train_loss": -7.079408645629883, "global_step": 181730, "epoch": 4326} {"train_loss": -7.010615348815918, "global_step": 181731, "epoch": 4326} {"train_loss": -7.1460161209106445, "global_step": 181732, "epoch": 4326} {"train_loss": -7.070545480364845, "global_step": 181733, "epoch": 4326, "val_loss": 68725.71875} {"train_loss": -7.134248733520508, "global_step": 181734, "epoch": 4327} {"train_loss": -7.195169925689697, "global_step": 181735, "epoch": 4327} {"train_loss": -6.993781089782715, "global_step": 181736, "epoch": 4327} {"train_loss": -7.1618547439575195, "global_step": 181737, "epoch": 4327} {"train_loss": -7.176515102386475, "global_step": 181738, "epoch": 4327} {"train_loss": -7.1427321434021, "global_step": 181739, "epoch": 4327} {"train_loss": -7.09434700012207, "global_step": 181740, "epoch": 4327} {"train_loss": -7.212489128112793, "global_step": 181741, "epoch": 4327} {"train_loss": -7.094629764556885, "global_step": 181742, "epoch": 4327} {"train_loss": -7.12164306640625, "global_step": 181743, "epoch": 4327} {"train_loss": -7.140361309051514, "global_step": 181744, "epoch": 4327} {"train_loss": -7.157754898071289, "global_step": 181745, "epoch": 4327} {"train_loss": -7.053893089294434, "global_step": 181746, "epoch": 4327} {"train_loss": -7.086838722229004, "global_step": 181747, "epoch": 4327} {"train_loss": -7.005824089050293, "global_step": 181748, "epoch": 4327} {"train_loss": -6.919144630432129, "global_step": 181749, "epoch": 4327} {"train_loss": -7.022090911865234, "global_step": 181750, "epoch": 4327} {"train_loss": -7.068332195281982, "global_step": 181751, "epoch": 4327} {"train_loss": -6.881766319274902, "global_step": 181752, "epoch": 4327} {"train_loss": -6.918064117431641, "global_step": 181753, "epoch": 4327} {"train_loss": -7.125843048095703, "global_step": 181754, "epoch": 4327} {"train_loss": -7.047858238220215, "global_step": 181755, "epoch": 4327} {"train_loss": -7.150428295135498, "global_step": 181756, "epoch": 4327} {"train_loss": -7.008899688720703, "global_step": 181757, "epoch": 4327} {"train_loss": -6.960042953491211, "global_step": 181758, "epoch": 4327} {"train_loss": -7.097762107849121, "global_step": 181759, "epoch": 4327} {"train_loss": -6.954975128173828, "global_step": 181760, "epoch": 4327} {"train_loss": -6.941859245300293, "global_step": 181761, "epoch": 4327} {"train_loss": -7.042239189147949, "global_step": 181762, "epoch": 4327} {"train_loss": -7.082055568695068, "global_step": 181763, "epoch": 4327} {"train_loss": -7.045980453491211, "global_step": 181764, "epoch": 4327} {"train_loss": -6.888500213623047, "global_step": 181765, "epoch": 4327} {"train_loss": -7.015491962432861, "global_step": 181766, "epoch": 4327} {"train_loss": -7.066736698150635, "global_step": 181767, "epoch": 4327} {"train_loss": -6.873861312866211, "global_step": 181768, "epoch": 4327} {"train_loss": -7.099214553833008, "global_step": 181769, "epoch": 4327} {"train_loss": -6.939348220825195, "global_step": 181770, "epoch": 4327} {"train_loss": -7.093788146972656, "global_step": 181771, "epoch": 4327} {"train_loss": -6.942966461181641, "global_step": 181772, "epoch": 4327} {"train_loss": -7.0830159187316895, "global_step": 181773, "epoch": 4327} {"train_loss": -7.00054407119751, "global_step": 181774, "epoch": 4327} {"train_loss": -7.047990571884882, "global_step": 181775, "epoch": 4327, "val_loss": 68893.3359375} {"train_loss": -7.072638511657715, "global_step": 181776, "epoch": 4328} {"train_loss": -7.0024871826171875, "global_step": 181777, "epoch": 4328} {"train_loss": -6.98884916305542, "global_step": 181778, "epoch": 4328} {"train_loss": -7.050896167755127, "global_step": 181779, "epoch": 4328} {"train_loss": -6.951488018035889, "global_step": 181780, "epoch": 4328} {"train_loss": -6.874135971069336, "global_step": 181781, "epoch": 4328} {"train_loss": -7.029219627380371, "global_step": 181782, "epoch": 4328} {"train_loss": -6.885174751281738, "global_step": 181783, "epoch": 4328} {"train_loss": -7.029537200927734, "global_step": 181784, "epoch": 4328} {"train_loss": -6.977815628051758, "global_step": 181785, "epoch": 4328} {"train_loss": -7.013145923614502, "global_step": 181786, "epoch": 4328} {"train_loss": -7.0095906257629395, "global_step": 181787, "epoch": 4328} {"train_loss": -6.945402145385742, "global_step": 181788, "epoch": 4328} {"train_loss": -7.015430450439453, "global_step": 181789, "epoch": 4328} {"train_loss": -7.034080982208252, "global_step": 181790, "epoch": 4328} {"train_loss": -6.890486717224121, "global_step": 181791, "epoch": 4328} {"train_loss": -6.992347717285156, "global_step": 181792, "epoch": 4328} {"train_loss": -6.964107513427734, "global_step": 181793, "epoch": 4328} {"train_loss": -7.0834174156188965, "global_step": 181794, "epoch": 4328} {"train_loss": -6.999476909637451, "global_step": 181795, "epoch": 4328} {"train_loss": -6.9995269775390625, "global_step": 181796, "epoch": 4328} {"train_loss": -7.06046199798584, "global_step": 181797, "epoch": 4328} {"train_loss": -7.129794597625732, "global_step": 181798, "epoch": 4328} {"train_loss": -7.0668463706970215, "global_step": 181799, "epoch": 4328} {"train_loss": -7.05088996887207, "global_step": 181800, "epoch": 4328} {"train_loss": -7.05241060256958, "global_step": 181801, "epoch": 4328} {"train_loss": -7.10562801361084, "global_step": 181802, "epoch": 4328} {"train_loss": -6.965242385864258, "global_step": 181803, "epoch": 4328} {"train_loss": -7.116935729980469, "global_step": 181804, "epoch": 4328} {"train_loss": -7.0692644119262695, "global_step": 181805, "epoch": 4328} {"train_loss": -7.1627397537231445, "global_step": 181806, "epoch": 4328} {"train_loss": -6.990159034729004, "global_step": 181807, "epoch": 4328} {"train_loss": -7.150454998016357, "global_step": 181808, "epoch": 4328} {"train_loss": -7.082630157470703, "global_step": 181809, "epoch": 4328} {"train_loss": -7.01316499710083, "global_step": 181810, "epoch": 4328} {"train_loss": -7.117800712585449, "global_step": 181811, "epoch": 4328} {"train_loss": -7.035318851470947, "global_step": 181812, "epoch": 4328} {"train_loss": -7.080798149108887, "global_step": 181813, "epoch": 4328} {"train_loss": -7.13535213470459, "global_step": 181814, "epoch": 4328} {"train_loss": -7.140519142150879, "global_step": 181815, "epoch": 4328} {"train_loss": -7.066307067871094, "global_step": 181816, "epoch": 4328} {"train_loss": -7.036695014862787, "global_step": 181817, "epoch": 4328, "val_loss": 68686.578125} {"train_loss": -7.129692554473877, "global_step": 181818, "epoch": 4329} {"train_loss": -7.162919998168945, "global_step": 181819, "epoch": 4329} {"train_loss": -7.150726318359375, "global_step": 181820, "epoch": 4329} {"train_loss": -7.148188591003418, "global_step": 181821, "epoch": 4329} {"train_loss": -7.196430683135986, "global_step": 181822, "epoch": 4329} {"train_loss": -7.071557998657227, "global_step": 181823, "epoch": 4329} {"train_loss": -7.21772575378418, "global_step": 181824, "epoch": 4329} {"train_loss": -7.120758056640625, "global_step": 181825, "epoch": 4329} {"train_loss": -7.1883673667907715, "global_step": 181826, "epoch": 4329} {"train_loss": -7.114046096801758, "global_step": 181827, "epoch": 4329} {"train_loss": -7.073162078857422, "global_step": 181828, "epoch": 4329} {"train_loss": -7.080811500549316, "global_step": 181829, "epoch": 4329} {"train_loss": -7.105555534362793, "global_step": 181830, "epoch": 4329} {"train_loss": -7.213335990905762, "global_step": 181831, "epoch": 4329} {"train_loss": -7.106775283813477, "global_step": 181832, "epoch": 4329} {"train_loss": -7.03352165222168, "global_step": 181833, "epoch": 4329} {"train_loss": -7.112026691436768, "global_step": 181834, "epoch": 4329} {"train_loss": -7.040658473968506, "global_step": 181835, "epoch": 4329} {"train_loss": -7.1374969482421875, "global_step": 181836, "epoch": 4329} {"train_loss": -7.188993453979492, "global_step": 181837, "epoch": 4329} {"train_loss": -7.06955623626709, "global_step": 181838, "epoch": 4329} {"train_loss": -7.093669891357422, "global_step": 181839, "epoch": 4329} {"train_loss": -7.039871692657471, "global_step": 181840, "epoch": 4329} {"train_loss": -7.0851030349731445, "global_step": 181841, "epoch": 4329} {"train_loss": -7.180774211883545, "global_step": 181842, "epoch": 4329} {"train_loss": -7.060969829559326, "global_step": 181843, "epoch": 4329} {"train_loss": -7.088406562805176, "global_step": 181844, "epoch": 4329} {"train_loss": -7.15655517578125, "global_step": 181845, "epoch": 4329} {"train_loss": -7.087924957275391, "global_step": 181846, "epoch": 4329} {"train_loss": -7.113785743713379, "global_step": 181847, "epoch": 4329} {"train_loss": -7.016561508178711, "global_step": 181848, "epoch": 4329} {"train_loss": -7.12413215637207, "global_step": 181849, "epoch": 4329} {"train_loss": -7.048031806945801, "global_step": 181850, "epoch": 4329} {"train_loss": -6.8512372970581055, "global_step": 181851, "epoch": 4329} {"train_loss": -7.098505020141602, "global_step": 181852, "epoch": 4329} {"train_loss": -7.027965545654297, "global_step": 181853, "epoch": 4329} {"train_loss": -7.060111045837402, "global_step": 181854, "epoch": 4329} {"train_loss": -7.035346031188965, "global_step": 181855, "epoch": 4329} {"train_loss": -7.1451616287231445, "global_step": 181856, "epoch": 4329} {"train_loss": -7.030035018920898, "global_step": 181857, "epoch": 4329} {"train_loss": -7.08013916015625, "global_step": 181858, "epoch": 4329} {"train_loss": -7.101905221030826, "global_step": 181859, "epoch": 4329, "val_loss": 68742.375} {"train_loss": -7.259528160095215, "global_step": 181860, "epoch": 4330} {"train_loss": -7.070082664489746, "global_step": 181861, "epoch": 4330} {"train_loss": -7.1494855880737305, "global_step": 181862, "epoch": 4330} {"train_loss": -7.083438873291016, "global_step": 181863, "epoch": 4330} {"train_loss": -7.023169994354248, "global_step": 181864, "epoch": 4330} {"train_loss": -7.106714248657227, "global_step": 181865, "epoch": 4330} {"train_loss": -7.103116035461426, "global_step": 181866, "epoch": 4330} {"train_loss": -7.047746658325195, "global_step": 181867, "epoch": 4330} {"train_loss": -7.090115070343018, "global_step": 181868, "epoch": 4330} {"train_loss": -7.151870250701904, "global_step": 181869, "epoch": 4330} {"train_loss": -7.181316375732422, "global_step": 181870, "epoch": 4330} {"train_loss": -7.127560138702393, "global_step": 181871, "epoch": 4330} {"train_loss": -7.173098564147949, "global_step": 181872, "epoch": 4330} {"train_loss": -7.195232391357422, "global_step": 181873, "epoch": 4330} {"train_loss": -7.181623458862305, "global_step": 181874, "epoch": 4330} {"train_loss": -7.05122709274292, "global_step": 181875, "epoch": 4330} {"train_loss": -7.172428607940674, "global_step": 181876, "epoch": 4330} {"train_loss": -7.107935905456543, "global_step": 181877, "epoch": 4330} {"train_loss": -7.11981725692749, "global_step": 181878, "epoch": 4330} {"train_loss": -7.306827545166016, "global_step": 181879, "epoch": 4330} {"train_loss": -7.143490791320801, "global_step": 181880, "epoch": 4330} {"train_loss": -7.175941467285156, "global_step": 181881, "epoch": 4330} {"train_loss": -7.072674751281738, "global_step": 181882, "epoch": 4330} {"train_loss": -7.105672836303711, "global_step": 181883, "epoch": 4330} {"train_loss": -7.134002208709717, "global_step": 181884, "epoch": 4330} {"train_loss": -7.091760635375977, "global_step": 181885, "epoch": 4330} {"train_loss": -7.054714202880859, "global_step": 181886, "epoch": 4330} {"train_loss": -7.02916955947876, "global_step": 181887, "epoch": 4330} {"train_loss": -7.160287857055664, "global_step": 181888, "epoch": 4330} {"train_loss": -7.16114616394043, "global_step": 181889, "epoch": 4330} {"train_loss": -7.015469074249268, "global_step": 181890, "epoch": 4330} {"train_loss": -7.108676910400391, "global_step": 181891, "epoch": 4330} {"train_loss": -7.161498546600342, "global_step": 181892, "epoch": 4330} {"train_loss": -6.94976806640625, "global_step": 181893, "epoch": 4330} {"train_loss": -7.105867385864258, "global_step": 181894, "epoch": 4330} {"train_loss": -6.967627048492432, "global_step": 181895, "epoch": 4330} {"train_loss": -6.987132549285889, "global_step": 181896, "epoch": 4330} {"train_loss": -6.940258979797363, "global_step": 181897, "epoch": 4330} {"train_loss": -6.954596042633057, "global_step": 181898, "epoch": 4330} {"train_loss": -7.05885124206543, "global_step": 181899, "epoch": 4330} {"train_loss": -7.098268508911133, "global_step": 181900, "epoch": 4330} {"train_loss": -7.101287410372779, "global_step": 181901, "epoch": 4330, "val_loss": 68775.1015625} {"train_loss": -6.930380821228027, "global_step": 181902, "epoch": 4331} {"train_loss": -7.123535633087158, "global_step": 181903, "epoch": 4331} {"train_loss": -7.028934955596924, "global_step": 181904, "epoch": 4331} {"train_loss": -7.055018424987793, "global_step": 181905, "epoch": 4331} {"train_loss": -7.002357006072998, "global_step": 181906, "epoch": 4331} {"train_loss": -7.065075397491455, "global_step": 181907, "epoch": 4331} {"train_loss": -7.155325889587402, "global_step": 181908, "epoch": 4331} {"train_loss": -7.137845039367676, "global_step": 181909, "epoch": 4331} {"train_loss": -7.016860008239746, "global_step": 181910, "epoch": 4331} {"train_loss": -6.937704086303711, "global_step": 181911, "epoch": 4331} {"train_loss": -7.1347246170043945, "global_step": 181912, "epoch": 4331} {"train_loss": -7.0819172859191895, "global_step": 181913, "epoch": 4331} {"train_loss": -7.0630950927734375, "global_step": 181914, "epoch": 4331} {"train_loss": -7.128426551818848, "global_step": 181915, "epoch": 4331} {"train_loss": -6.98252010345459, "global_step": 181916, "epoch": 4331} {"train_loss": -7.221181869506836, "global_step": 181917, "epoch": 4331} {"train_loss": -7.096623420715332, "global_step": 181918, "epoch": 4331} {"train_loss": -7.114628791809082, "global_step": 181919, "epoch": 4331} {"train_loss": -7.112054824829102, "global_step": 181920, "epoch": 4331} {"train_loss": -7.156959533691406, "global_step": 181921, "epoch": 4331} {"train_loss": -7.094435691833496, "global_step": 181922, "epoch": 4331} {"train_loss": -7.050045967102051, "global_step": 181923, "epoch": 4331} {"train_loss": -7.102205276489258, "global_step": 181924, "epoch": 4331} {"train_loss": -7.028800964355469, "global_step": 181925, "epoch": 4331} {"train_loss": -7.015767574310303, "global_step": 181926, "epoch": 4331} {"train_loss": -7.209007263183594, "global_step": 181927, "epoch": 4331} {"train_loss": -7.076048851013184, "global_step": 181928, "epoch": 4331} {"train_loss": -7.06638240814209, "global_step": 181929, "epoch": 4331} {"train_loss": -7.174253463745117, "global_step": 181930, "epoch": 4331} {"train_loss": -7.162941932678223, "global_step": 181931, "epoch": 4331} {"train_loss": -7.1048479080200195, "global_step": 181932, "epoch": 4331} {"train_loss": -7.087067604064941, "global_step": 181933, "epoch": 4331} {"train_loss": -7.077641010284424, "global_step": 181934, "epoch": 4331} {"train_loss": -7.044830322265625, "global_step": 181935, "epoch": 4331} {"train_loss": -7.03902530670166, "global_step": 181936, "epoch": 4331} {"train_loss": -7.197181701660156, "global_step": 181937, "epoch": 4331} {"train_loss": -7.05851936340332, "global_step": 181938, "epoch": 4331} {"train_loss": -7.08441162109375, "global_step": 181939, "epoch": 4331} {"train_loss": -7.094625949859619, "global_step": 181940, "epoch": 4331} {"train_loss": -7.145908355712891, "global_step": 181941, "epoch": 4331} {"train_loss": -7.063223838806152, "global_step": 181942, "epoch": 4331} {"train_loss": -7.084189676103138, "global_step": 181943, "epoch": 4331, "val_loss": 68789.9609375} {"train_loss": -7.107685089111328, "global_step": 181944, "epoch": 4332} {"train_loss": -7.134213447570801, "global_step": 181945, "epoch": 4332} {"train_loss": -7.153158664703369, "global_step": 181946, "epoch": 4332} {"train_loss": -7.12932825088501, "global_step": 181947, "epoch": 4332} {"train_loss": -6.9964070320129395, "global_step": 181948, "epoch": 4332} {"train_loss": -7.1106767654418945, "global_step": 181949, "epoch": 4332} {"train_loss": -7.168036460876465, "global_step": 181950, "epoch": 4332} {"train_loss": -7.143026351928711, "global_step": 181951, "epoch": 4332} {"train_loss": -7.208926200866699, "global_step": 181952, "epoch": 4332} {"train_loss": -7.06522798538208, "global_step": 181953, "epoch": 4332} {"train_loss": -7.180874347686768, "global_step": 181954, "epoch": 4332} {"train_loss": -7.1733198165893555, "global_step": 181955, "epoch": 4332} {"train_loss": -7.145755767822266, "global_step": 181956, "epoch": 4332} {"train_loss": -7.128297328948975, "global_step": 181957, "epoch": 4332} {"train_loss": -7.1255645751953125, "global_step": 181958, "epoch": 4332} {"train_loss": -7.039168357849121, "global_step": 181959, "epoch": 4332} {"train_loss": -7.060059547424316, "global_step": 181960, "epoch": 4332} {"train_loss": -7.056880950927734, "global_step": 181961, "epoch": 4332} {"train_loss": -7.160830497741699, "global_step": 181962, "epoch": 4332} {"train_loss": -6.957535743713379, "global_step": 181963, "epoch": 4332} {"train_loss": -7.0786943435668945, "global_step": 181964, "epoch": 4332} {"train_loss": -7.134614944458008, "global_step": 181965, "epoch": 4332} {"train_loss": -7.014372825622559, "global_step": 181966, "epoch": 4332} {"train_loss": -7.150671005249023, "global_step": 181967, "epoch": 4332} {"train_loss": -7.146359443664551, "global_step": 181968, "epoch": 4332} {"train_loss": -7.0422210693359375, "global_step": 181969, "epoch": 4332} {"train_loss": -7.215627670288086, "global_step": 181970, "epoch": 4332} {"train_loss": -7.206210136413574, "global_step": 181971, "epoch": 4332} {"train_loss": -7.043914794921875, "global_step": 181972, "epoch": 4332} {"train_loss": -7.089454650878906, "global_step": 181973, "epoch": 4332} {"train_loss": -7.090176582336426, "global_step": 181974, "epoch": 4332} {"train_loss": -7.079228401184082, "global_step": 181975, "epoch": 4332} {"train_loss": -7.063494682312012, "global_step": 181976, "epoch": 4332} {"train_loss": -7.106747627258301, "global_step": 181977, "epoch": 4332} {"train_loss": -7.104887962341309, "global_step": 181978, "epoch": 4332} {"train_loss": -7.033824920654297, "global_step": 181979, "epoch": 4332} {"train_loss": -7.00273323059082, "global_step": 181980, "epoch": 4332} {"train_loss": -7.18034553527832, "global_step": 181981, "epoch": 4332} {"train_loss": -7.023133277893066, "global_step": 181982, "epoch": 4332} {"train_loss": -7.056520938873291, "global_step": 181983, "epoch": 4332} {"train_loss": -6.903237819671631, "global_step": 181984, "epoch": 4332} {"train_loss": -7.097320352281843, "global_step": 181985, "epoch": 4332, "val_loss": 68901.4609375} {"train_loss": -6.991066932678223, "global_step": 181986, "epoch": 4333} {"train_loss": -7.000873565673828, "global_step": 181987, "epoch": 4333} {"train_loss": -7.09935188293457, "global_step": 181988, "epoch": 4333} {"train_loss": -7.112043380737305, "global_step": 181989, "epoch": 4333} {"train_loss": -7.144311904907227, "global_step": 181990, "epoch": 4333} {"train_loss": -7.01368522644043, "global_step": 181991, "epoch": 4333} {"train_loss": -6.991488456726074, "global_step": 181992, "epoch": 4333} {"train_loss": -7.1661601066589355, "global_step": 181993, "epoch": 4333} {"train_loss": -6.966149806976318, "global_step": 181994, "epoch": 4333} {"train_loss": -6.975743293762207, "global_step": 181995, "epoch": 4333} {"train_loss": -7.050745964050293, "global_step": 181996, "epoch": 4333} {"train_loss": -7.086092472076416, "global_step": 181997, "epoch": 4333} {"train_loss": -7.130279541015625, "global_step": 181998, "epoch": 4333} {"train_loss": -7.167709827423096, "global_step": 181999, "epoch": 4333} {"train_loss": -6.956507205963135, "global_step": 182000, "epoch": 4333} {"train_loss": -7.043332099914551, "global_step": 182001, "epoch": 4333} {"train_loss": -6.993775844573975, "global_step": 182002, "epoch": 4333} {"train_loss": -7.023767471313477, "global_step": 182003, "epoch": 4333} {"train_loss": -7.096158027648926, "global_step": 182004, "epoch": 4333} {"train_loss": -7.041515350341797, "global_step": 182005, "epoch": 4333} {"train_loss": -7.047807693481445, "global_step": 182006, "epoch": 4333} {"train_loss": -7.141510009765625, "global_step": 182007, "epoch": 4333} {"train_loss": -7.101529598236084, "global_step": 182008, "epoch": 4333} {"train_loss": -7.028293132781982, "global_step": 182009, "epoch": 4333} {"train_loss": -7.188864231109619, "global_step": 182010, "epoch": 4333} {"train_loss": -7.0746870040893555, "global_step": 182011, "epoch": 4333} {"train_loss": -7.085803031921387, "global_step": 182012, "epoch": 4333} {"train_loss": -7.059632778167725, "global_step": 182013, "epoch": 4333} {"train_loss": -7.027422904968262, "global_step": 182014, "epoch": 4333} {"train_loss": -7.087252616882324, "global_step": 182015, "epoch": 4333} {"train_loss": -7.163676738739014, "global_step": 182016, "epoch": 4333} {"train_loss": -7.123310089111328, "global_step": 182017, "epoch": 4333} {"train_loss": -7.110874176025391, "global_step": 182018, "epoch": 4333} {"train_loss": -7.068707466125488, "global_step": 182019, "epoch": 4333} {"train_loss": -7.092780113220215, "global_step": 182020, "epoch": 4333} {"train_loss": -7.058990001678467, "global_step": 182021, "epoch": 4333} {"train_loss": -7.104169845581055, "global_step": 182022, "epoch": 4333} {"train_loss": -7.044783115386963, "global_step": 182023, "epoch": 4333} {"train_loss": -7.156804084777832, "global_step": 182024, "epoch": 4333} {"train_loss": -7.054165840148926, "global_step": 182025, "epoch": 4333} {"train_loss": -7.146059513092041, "global_step": 182026, "epoch": 4333} {"train_loss": -7.074484075818743, "global_step": 182027, "epoch": 4333, "val_loss": 68707.0390625} {"train_loss": -7.128766059875488, "global_step": 182028, "epoch": 4334} {"train_loss": -7.0557684898376465, "global_step": 182029, "epoch": 4334} {"train_loss": -7.077778339385986, "global_step": 182030, "epoch": 4334} {"train_loss": -7.067121982574463, "global_step": 182031, "epoch": 4334} {"train_loss": -7.1593217849731445, "global_step": 182032, "epoch": 4334} {"train_loss": -7.014778137207031, "global_step": 182033, "epoch": 4334} {"train_loss": -7.133626461029053, "global_step": 182034, "epoch": 4334} {"train_loss": -7.153332710266113, "global_step": 182035, "epoch": 4334} {"train_loss": -6.931447505950928, "global_step": 182036, "epoch": 4334} {"train_loss": -6.9952802658081055, "global_step": 182037, "epoch": 4334} {"train_loss": -6.99027156829834, "global_step": 182038, "epoch": 4334} {"train_loss": -6.892326354980469, "global_step": 182039, "epoch": 4334} {"train_loss": -7.020400047302246, "global_step": 182040, "epoch": 4334} {"train_loss": -7.042093276977539, "global_step": 182041, "epoch": 4334} {"train_loss": -7.052267551422119, "global_step": 182042, "epoch": 4334} {"train_loss": -6.910795211791992, "global_step": 182043, "epoch": 4334} {"train_loss": -7.0175251960754395, "global_step": 182044, "epoch": 4334} {"train_loss": -6.882285118103027, "global_step": 182045, "epoch": 4334} {"train_loss": -6.749129295349121, "global_step": 182046, "epoch": 4334} {"train_loss": -7.125389099121094, "global_step": 182047, "epoch": 4334} {"train_loss": -7.012163162231445, "global_step": 182048, "epoch": 4334} {"train_loss": -6.912102222442627, "global_step": 182049, "epoch": 4334} {"train_loss": -7.030158519744873, "global_step": 182050, "epoch": 4334} {"train_loss": -6.878593444824219, "global_step": 182051, "epoch": 4334} {"train_loss": -7.045473575592041, "global_step": 182052, "epoch": 4334} {"train_loss": -6.97258186340332, "global_step": 182053, "epoch": 4334} {"train_loss": -7.007295608520508, "global_step": 182054, "epoch": 4334} {"train_loss": -7.128477096557617, "global_step": 182055, "epoch": 4334} {"train_loss": -7.111118793487549, "global_step": 182056, "epoch": 4334} {"train_loss": -7.096981048583984, "global_step": 182057, "epoch": 4334} {"train_loss": -7.138042449951172, "global_step": 182058, "epoch": 4334} {"train_loss": -7.127657890319824, "global_step": 182059, "epoch": 4334} {"train_loss": -7.094346046447754, "global_step": 182060, "epoch": 4334} {"train_loss": -7.023377418518066, "global_step": 182061, "epoch": 4334} {"train_loss": -7.123901844024658, "global_step": 182062, "epoch": 4334} {"train_loss": -7.023406982421875, "global_step": 182063, "epoch": 4334} {"train_loss": -7.045696258544922, "global_step": 182064, "epoch": 4334} {"train_loss": -7.081673622131348, "global_step": 182065, "epoch": 4334} {"train_loss": -7.16456413269043, "global_step": 182066, "epoch": 4334} {"train_loss": -7.062211036682129, "global_step": 182067, "epoch": 4334} {"train_loss": -7.009171485900879, "global_step": 182068, "epoch": 4334} {"train_loss": -7.039635783150082, "global_step": 182069, "epoch": 4334, "val_loss": 68782.046875} {"train_loss": -7.02425479888916, "global_step": 182070, "epoch": 4335} {"train_loss": -7.136745929718018, "global_step": 182071, "epoch": 4335} {"train_loss": -7.164393424987793, "global_step": 182072, "epoch": 4335} {"train_loss": -7.123359680175781, "global_step": 182073, "epoch": 4335} {"train_loss": -7.113385200500488, "global_step": 182074, "epoch": 4335} {"train_loss": -7.189032554626465, "global_step": 182075, "epoch": 4335} {"train_loss": -7.1860198974609375, "global_step": 182076, "epoch": 4335} {"train_loss": -7.035118579864502, "global_step": 182077, "epoch": 4335} {"train_loss": -7.130382537841797, "global_step": 182078, "epoch": 4335} {"train_loss": -7.064362049102783, "global_step": 182079, "epoch": 4335} {"train_loss": -7.123189926147461, "global_step": 182080, "epoch": 4335} {"train_loss": -7.158136367797852, "global_step": 182081, "epoch": 4335} {"train_loss": -7.067877769470215, "global_step": 182082, "epoch": 4335} {"train_loss": -7.054805755615234, "global_step": 182083, "epoch": 4335} {"train_loss": -7.076913356781006, "global_step": 182084, "epoch": 4335} {"train_loss": -6.964738845825195, "global_step": 182085, "epoch": 4335} {"train_loss": -6.915170669555664, "global_step": 182086, "epoch": 4335} {"train_loss": -7.136841297149658, "global_step": 182087, "epoch": 4335} {"train_loss": -7.055973052978516, "global_step": 182088, "epoch": 4335} {"train_loss": -6.985429763793945, "global_step": 182089, "epoch": 4335} {"train_loss": -6.968441963195801, "global_step": 182090, "epoch": 4335} {"train_loss": -7.0102972984313965, "global_step": 182091, "epoch": 4335} {"train_loss": -6.981572151184082, "global_step": 182092, "epoch": 4335} {"train_loss": -7.050607204437256, "global_step": 182093, "epoch": 4335} {"train_loss": -7.024101257324219, "global_step": 182094, "epoch": 4335} {"train_loss": -7.042845726013184, "global_step": 182095, "epoch": 4335} {"train_loss": -7.003901481628418, "global_step": 182096, "epoch": 4335} {"train_loss": -6.992844581604004, "global_step": 182097, "epoch": 4335} {"train_loss": -6.921174049377441, "global_step": 182098, "epoch": 4335} {"train_loss": -6.893223285675049, "global_step": 182099, "epoch": 4335} {"train_loss": -7.0936737060546875, "global_step": 182100, "epoch": 4335} {"train_loss": -7.018930435180664, "global_step": 182101, "epoch": 4335} {"train_loss": -7.103442192077637, "global_step": 182102, "epoch": 4335} {"train_loss": -7.147789001464844, "global_step": 182103, "epoch": 4335} {"train_loss": -7.051670074462891, "global_step": 182104, "epoch": 4335} {"train_loss": -7.135212421417236, "global_step": 182105, "epoch": 4335} {"train_loss": -7.113410949707031, "global_step": 182106, "epoch": 4335} {"train_loss": -7.174483299255371, "global_step": 182107, "epoch": 4335} {"train_loss": -7.125800132751465, "global_step": 182108, "epoch": 4335} {"train_loss": -7.1306939125061035, "global_step": 182109, "epoch": 4335} {"train_loss": -7.0456767082214355, "global_step": 182110, "epoch": 4335} {"train_loss": -7.06936038108099, "global_step": 182111, "epoch": 4335, "val_loss": 68706.671875} {"train_loss": -7.004725933074951, "global_step": 182112, "epoch": 4336} {"train_loss": -6.97560977935791, "global_step": 182113, "epoch": 4336} {"train_loss": -7.001230239868164, "global_step": 182114, "epoch": 4336} {"train_loss": -7.199257850646973, "global_step": 182115, "epoch": 4336} {"train_loss": -7.0923943519592285, "global_step": 182116, "epoch": 4336} {"train_loss": -7.081411361694336, "global_step": 182117, "epoch": 4336} {"train_loss": -7.138721466064453, "global_step": 182118, "epoch": 4336} {"train_loss": -7.017739295959473, "global_step": 182119, "epoch": 4336} {"train_loss": -7.210471153259277, "global_step": 182120, "epoch": 4336} {"train_loss": -7.060276985168457, "global_step": 182121, "epoch": 4336} {"train_loss": -6.999444007873535, "global_step": 182122, "epoch": 4336} {"train_loss": -7.15908145904541, "global_step": 182123, "epoch": 4336} {"train_loss": -7.108381748199463, "global_step": 182124, "epoch": 4336} {"train_loss": -7.093768119812012, "global_step": 182125, "epoch": 4336} {"train_loss": -7.128093719482422, "global_step": 182126, "epoch": 4336} {"train_loss": -7.097683906555176, "global_step": 182127, "epoch": 4336} {"train_loss": -7.130778789520264, "global_step": 182128, "epoch": 4336} {"train_loss": -7.072554111480713, "global_step": 182129, "epoch": 4336} {"train_loss": -7.159687042236328, "global_step": 182130, "epoch": 4336} {"train_loss": -7.097480773925781, "global_step": 182131, "epoch": 4336} {"train_loss": -7.077020168304443, "global_step": 182132, "epoch": 4336} {"train_loss": -7.164216041564941, "global_step": 182133, "epoch": 4336} {"train_loss": -7.101398468017578, "global_step": 182134, "epoch": 4336} {"train_loss": -7.249833583831787, "global_step": 182135, "epoch": 4336} {"train_loss": -6.996072769165039, "global_step": 182136, "epoch": 4336} {"train_loss": -7.081114292144775, "global_step": 182137, "epoch": 4336} {"train_loss": -7.064733505249023, "global_step": 182138, "epoch": 4336} {"train_loss": -7.171449184417725, "global_step": 182139, "epoch": 4336} {"train_loss": -7.110863208770752, "global_step": 182140, "epoch": 4336} {"train_loss": -7.11200475692749, "global_step": 182141, "epoch": 4336} {"train_loss": -7.179136276245117, "global_step": 182142, "epoch": 4336} {"train_loss": -6.973502159118652, "global_step": 182143, "epoch": 4336} {"train_loss": -7.124875068664551, "global_step": 182144, "epoch": 4336} {"train_loss": -7.102105617523193, "global_step": 182145, "epoch": 4336} {"train_loss": -7.085268974304199, "global_step": 182146, "epoch": 4336} {"train_loss": -7.147572040557861, "global_step": 182147, "epoch": 4336} {"train_loss": -7.085925579071045, "global_step": 182148, "epoch": 4336} {"train_loss": -7.200952529907227, "global_step": 182149, "epoch": 4336} {"train_loss": -7.150135517120361, "global_step": 182150, "epoch": 4336} {"train_loss": -7.148838043212891, "global_step": 182151, "epoch": 4336} {"train_loss": -7.037877082824707, "global_step": 182152, "epoch": 4336} {"train_loss": -7.101818799972534, "global_step": 182153, "epoch": 4336, "val_loss": 68662.375} {"train_loss": -7.057088851928711, "global_step": 182154, "epoch": 4337} {"train_loss": -7.1431379318237305, "global_step": 182155, "epoch": 4337} {"train_loss": -7.121341705322266, "global_step": 182156, "epoch": 4337} {"train_loss": -7.089007377624512, "global_step": 182157, "epoch": 4337} {"train_loss": -7.137078285217285, "global_step": 182158, "epoch": 4337} {"train_loss": -7.139491081237793, "global_step": 182159, "epoch": 4337} {"train_loss": -7.176030158996582, "global_step": 182160, "epoch": 4337} {"train_loss": -7.08843994140625, "global_step": 182161, "epoch": 4337} {"train_loss": -7.200599670410156, "global_step": 182162, "epoch": 4337} {"train_loss": -7.1085309982299805, "global_step": 182163, "epoch": 4337} {"train_loss": -7.079442024230957, "global_step": 182164, "epoch": 4337} {"train_loss": -6.997843265533447, "global_step": 182165, "epoch": 4337} {"train_loss": -7.135206699371338, "global_step": 182166, "epoch": 4337} {"train_loss": -7.056023597717285, "global_step": 182167, "epoch": 4337} {"train_loss": -7.1273040771484375, "global_step": 182168, "epoch": 4337} {"train_loss": -7.109589576721191, "global_step": 182169, "epoch": 4337} {"train_loss": -7.08859920501709, "global_step": 182170, "epoch": 4337} {"train_loss": -7.102608680725098, "global_step": 182171, "epoch": 4337} {"train_loss": -7.186850547790527, "global_step": 182172, "epoch": 4337} {"train_loss": -7.0812578201293945, "global_step": 182173, "epoch": 4337} {"train_loss": -7.126023769378662, "global_step": 182174, "epoch": 4337} {"train_loss": -7.1214189529418945, "global_step": 182175, "epoch": 4337} {"train_loss": -7.1377692222595215, "global_step": 182176, "epoch": 4337} {"train_loss": -7.04589319229126, "global_step": 182177, "epoch": 4337} {"train_loss": -7.163810729980469, "global_step": 182178, "epoch": 4337} {"train_loss": -7.117696762084961, "global_step": 182179, "epoch": 4337} {"train_loss": -7.1450419425964355, "global_step": 182180, "epoch": 4337} {"train_loss": -7.085973262786865, "global_step": 182181, "epoch": 4337} {"train_loss": -7.167588233947754, "global_step": 182182, "epoch": 4337} {"train_loss": -7.07708215713501, "global_step": 182183, "epoch": 4337} {"train_loss": -7.119433403015137, "global_step": 182184, "epoch": 4337} {"train_loss": -7.0993876457214355, "global_step": 182185, "epoch": 4337} {"train_loss": -6.935459136962891, "global_step": 182186, "epoch": 4337} {"train_loss": -7.172989845275879, "global_step": 182187, "epoch": 4337} {"train_loss": -6.986921310424805, "global_step": 182188, "epoch": 4337} {"train_loss": -7.0500383377075195, "global_step": 182189, "epoch": 4337} {"train_loss": -7.220532417297363, "global_step": 182190, "epoch": 4337} {"train_loss": -7.011317253112793, "global_step": 182191, "epoch": 4337} {"train_loss": -7.070040702819824, "global_step": 182192, "epoch": 4337} {"train_loss": -7.169589042663574, "global_step": 182193, "epoch": 4337} {"train_loss": -7.0952959060668945, "global_step": 182194, "epoch": 4337} {"train_loss": -7.103771084830875, "global_step": 182195, "epoch": 4337, "val_loss": 68935.2265625} {"train_loss": -7.152573585510254, "global_step": 182196, "epoch": 4338} {"train_loss": -6.932615280151367, "global_step": 182197, "epoch": 4338} {"train_loss": -6.985166549682617, "global_step": 182198, "epoch": 4338} {"train_loss": -6.955687522888184, "global_step": 182199, "epoch": 4338} {"train_loss": -7.019306182861328, "global_step": 182200, "epoch": 4338} {"train_loss": -7.183996200561523, "global_step": 182201, "epoch": 4338} {"train_loss": -7.049923896789551, "global_step": 182202, "epoch": 4338} {"train_loss": -7.17025899887085, "global_step": 182203, "epoch": 4338} {"train_loss": -7.056929588317871, "global_step": 182204, "epoch": 4338} {"train_loss": -7.044820785522461, "global_step": 182205, "epoch": 4338} {"train_loss": -7.192948818206787, "global_step": 182206, "epoch": 4338} {"train_loss": -7.097916126251221, "global_step": 182207, "epoch": 4338} {"train_loss": -7.090462684631348, "global_step": 182208, "epoch": 4338} {"train_loss": -7.1157026290893555, "global_step": 182209, "epoch": 4338} {"train_loss": -7.106212615966797, "global_step": 182210, "epoch": 4338} {"train_loss": -7.198031425476074, "global_step": 182211, "epoch": 4338} {"train_loss": -6.997249126434326, "global_step": 182212, "epoch": 4338} {"train_loss": -7.042938232421875, "global_step": 182213, "epoch": 4338} {"train_loss": -7.140318870544434, "global_step": 182214, "epoch": 4338} {"train_loss": -7.113435745239258, "global_step": 182215, "epoch": 4338} {"train_loss": -6.99985408782959, "global_step": 182216, "epoch": 4338} {"train_loss": -7.014487266540527, "global_step": 182217, "epoch": 4338} {"train_loss": -7.038583755493164, "global_step": 182218, "epoch": 4338} {"train_loss": -6.993605613708496, "global_step": 182219, "epoch": 4338} {"train_loss": -6.986332893371582, "global_step": 182220, "epoch": 4338} {"train_loss": -7.1376237869262695, "global_step": 182221, "epoch": 4338} {"train_loss": -7.000735759735107, "global_step": 182222, "epoch": 4338} {"train_loss": -6.972774505615234, "global_step": 182223, "epoch": 4338} {"train_loss": -7.105413436889648, "global_step": 182224, "epoch": 4338} {"train_loss": -6.9623212814331055, "global_step": 182225, "epoch": 4338} {"train_loss": -6.9359235763549805, "global_step": 182226, "epoch": 4338} {"train_loss": -6.977044105529785, "global_step": 182227, "epoch": 4338} {"train_loss": -7.023130893707275, "global_step": 182228, "epoch": 4338} {"train_loss": -7.019234657287598, "global_step": 182229, "epoch": 4338} {"train_loss": -6.949651718139648, "global_step": 182230, "epoch": 4338} {"train_loss": -7.032008171081543, "global_step": 182231, "epoch": 4338} {"train_loss": -7.096386909484863, "global_step": 182232, "epoch": 4338} {"train_loss": -7.062017917633057, "global_step": 182233, "epoch": 4338} {"train_loss": -7.1486287117004395, "global_step": 182234, "epoch": 4338} {"train_loss": -7.005366325378418, "global_step": 182235, "epoch": 4338} {"train_loss": -7.023008346557617, "global_step": 182236, "epoch": 4338} {"train_loss": -7.053395838964553, "global_step": 182237, "epoch": 4338, "val_loss": 68837.5546875} {"train_loss": -6.997611999511719, "global_step": 182238, "epoch": 4339} {"train_loss": -6.994838714599609, "global_step": 182239, "epoch": 4339} {"train_loss": -7.060553550720215, "global_step": 182240, "epoch": 4339} {"train_loss": -7.027105808258057, "global_step": 182241, "epoch": 4339} {"train_loss": -7.035362243652344, "global_step": 182242, "epoch": 4339} {"train_loss": -7.022536277770996, "global_step": 182243, "epoch": 4339} {"train_loss": -6.926715850830078, "global_step": 182244, "epoch": 4339} {"train_loss": -7.022217750549316, "global_step": 182245, "epoch": 4339} {"train_loss": -7.081795692443848, "global_step": 182246, "epoch": 4339} {"train_loss": -7.064517974853516, "global_step": 182247, "epoch": 4339} {"train_loss": -7.107606887817383, "global_step": 182248, "epoch": 4339} {"train_loss": -6.945487022399902, "global_step": 182249, "epoch": 4339} {"train_loss": -6.83925724029541, "global_step": 182250, "epoch": 4339} {"train_loss": -7.115339756011963, "global_step": 182251, "epoch": 4339} {"train_loss": -7.034459114074707, "global_step": 182252, "epoch": 4339} {"train_loss": -7.149651527404785, "global_step": 182253, "epoch": 4339} {"train_loss": -7.111807823181152, "global_step": 182254, "epoch": 4339} {"train_loss": -7.1816558837890625, "global_step": 182255, "epoch": 4339} {"train_loss": -7.141372203826904, "global_step": 182256, "epoch": 4339} {"train_loss": -7.089788436889648, "global_step": 182257, "epoch": 4339} {"train_loss": -7.155102729797363, "global_step": 182258, "epoch": 4339} {"train_loss": -7.100430011749268, "global_step": 182259, "epoch": 4339} {"train_loss": -7.032016754150391, "global_step": 182260, "epoch": 4339} {"train_loss": -7.1327104568481445, "global_step": 182261, "epoch": 4339} {"train_loss": -7.117074966430664, "global_step": 182262, "epoch": 4339} {"train_loss": -6.979978561401367, "global_step": 182263, "epoch": 4339} {"train_loss": -7.14456844329834, "global_step": 182264, "epoch": 4339} {"train_loss": -7.255438804626465, "global_step": 182265, "epoch": 4339} {"train_loss": -7.233986854553223, "global_step": 182266, "epoch": 4339} {"train_loss": -6.974285125732422, "global_step": 182267, "epoch": 4339} {"train_loss": -7.141441822052002, "global_step": 182268, "epoch": 4339} {"train_loss": -7.100104331970215, "global_step": 182269, "epoch": 4339} {"train_loss": -6.934312343597412, "global_step": 182270, "epoch": 4339} {"train_loss": -7.0422539710998535, "global_step": 182271, "epoch": 4339} {"train_loss": -7.08447265625, "global_step": 182272, "epoch": 4339} {"train_loss": -7.018737316131592, "global_step": 182273, "epoch": 4339} {"train_loss": -7.020040988922119, "global_step": 182274, "epoch": 4339} {"train_loss": -7.033753395080566, "global_step": 182275, "epoch": 4339} {"train_loss": -7.152279853820801, "global_step": 182276, "epoch": 4339} {"train_loss": -6.982444763183594, "global_step": 182277, "epoch": 4339} {"train_loss": -7.0445709228515625, "global_step": 182278, "epoch": 4339} {"train_loss": -7.065710147221883, "global_step": 182279, "epoch": 4339, "val_loss": 68888.609375} {"train_loss": -7.131508827209473, "global_step": 182280, "epoch": 4340} {"train_loss": -7.097894668579102, "global_step": 182281, "epoch": 4340} {"train_loss": -7.149998188018799, "global_step": 182282, "epoch": 4340} {"train_loss": -7.087900161743164, "global_step": 182283, "epoch": 4340} {"train_loss": -7.0800323486328125, "global_step": 182284, "epoch": 4340} {"train_loss": -7.146051406860352, "global_step": 182285, "epoch": 4340} {"train_loss": -7.207773685455322, "global_step": 182286, "epoch": 4340} {"train_loss": -7.241576194763184, "global_step": 182287, "epoch": 4340} {"train_loss": -7.043198108673096, "global_step": 182288, "epoch": 4340} {"train_loss": -7.1757941246032715, "global_step": 182289, "epoch": 4340} {"train_loss": -6.993932247161865, "global_step": 182290, "epoch": 4340} {"train_loss": -6.980207443237305, "global_step": 182291, "epoch": 4340} {"train_loss": -7.115983963012695, "global_step": 182292, "epoch": 4340} {"train_loss": -6.959728240966797, "global_step": 182293, "epoch": 4340} {"train_loss": -7.1772236824035645, "global_step": 182294, "epoch": 4340} {"train_loss": -7.204514026641846, "global_step": 182295, "epoch": 4340} {"train_loss": -7.067891597747803, "global_step": 182296, "epoch": 4340} {"train_loss": -7.203327178955078, "global_step": 182297, "epoch": 4340} {"train_loss": -7.085168838500977, "global_step": 182298, "epoch": 4340} {"train_loss": -6.993410110473633, "global_step": 182299, "epoch": 4340} {"train_loss": -7.167873859405518, "global_step": 182300, "epoch": 4340} {"train_loss": -7.07441520690918, "global_step": 182301, "epoch": 4340} {"train_loss": -7.147428035736084, "global_step": 182302, "epoch": 4340} {"train_loss": -7.0255632400512695, "global_step": 182303, "epoch": 4340} {"train_loss": -7.139471054077148, "global_step": 182304, "epoch": 4340} {"train_loss": -6.995791435241699, "global_step": 182305, "epoch": 4340} {"train_loss": -7.2077412605285645, "global_step": 182306, "epoch": 4340} {"train_loss": -7.060657024383545, "global_step": 182307, "epoch": 4340} {"train_loss": -7.087206840515137, "global_step": 182308, "epoch": 4340} {"train_loss": -7.108131408691406, "global_step": 182309, "epoch": 4340} {"train_loss": -7.0716705322265625, "global_step": 182310, "epoch": 4340} {"train_loss": -7.000754356384277, "global_step": 182311, "epoch": 4340} {"train_loss": -7.168224334716797, "global_step": 182312, "epoch": 4340} {"train_loss": -7.006034851074219, "global_step": 182313, "epoch": 4340} {"train_loss": -7.07053279876709, "global_step": 182314, "epoch": 4340} {"train_loss": -7.115865707397461, "global_step": 182315, "epoch": 4340} {"train_loss": -6.970694065093994, "global_step": 182316, "epoch": 4340} {"train_loss": -6.940145015716553, "global_step": 182317, "epoch": 4340} {"train_loss": -6.918290138244629, "global_step": 182318, "epoch": 4340} {"train_loss": -7.121927261352539, "global_step": 182319, "epoch": 4340} {"train_loss": -7.009993553161621, "global_step": 182320, "epoch": 4340} {"train_loss": -7.083804709570749, "global_step": 182321, "epoch": 4340, "val_loss": 68833.0546875} {"train_loss": -6.935394287109375, "global_step": 182322, "epoch": 4341} {"train_loss": -7.069827079772949, "global_step": 182323, "epoch": 4341} {"train_loss": -7.032346725463867, "global_step": 182324, "epoch": 4341} {"train_loss": -7.018852233886719, "global_step": 182325, "epoch": 4341} {"train_loss": -6.93325138092041, "global_step": 182326, "epoch": 4341} {"train_loss": -7.178657531738281, "global_step": 182327, "epoch": 4341} {"train_loss": -6.997803688049316, "global_step": 182328, "epoch": 4341} {"train_loss": -7.091231346130371, "global_step": 182329, "epoch": 4341} {"train_loss": -7.0338239669799805, "global_step": 182330, "epoch": 4341} {"train_loss": -7.109005928039551, "global_step": 182331, "epoch": 4341} {"train_loss": -7.005758285522461, "global_step": 182332, "epoch": 4341} {"train_loss": -7.090956687927246, "global_step": 182333, "epoch": 4341} {"train_loss": -7.006691932678223, "global_step": 182334, "epoch": 4341} {"train_loss": -6.955262660980225, "global_step": 182335, "epoch": 4341} {"train_loss": -7.116476058959961, "global_step": 182336, "epoch": 4341} {"train_loss": -7.050743103027344, "global_step": 182337, "epoch": 4341} {"train_loss": -7.104972839355469, "global_step": 182338, "epoch": 4341} {"train_loss": -7.101856231689453, "global_step": 182339, "epoch": 4341} {"train_loss": -6.99068546295166, "global_step": 182340, "epoch": 4341} {"train_loss": -7.05314826965332, "global_step": 182341, "epoch": 4341} {"train_loss": -7.112095832824707, "global_step": 182342, "epoch": 4341} {"train_loss": -7.014589309692383, "global_step": 182343, "epoch": 4341} {"train_loss": -6.876382827758789, "global_step": 182344, "epoch": 4341} {"train_loss": -7.090207099914551, "global_step": 182345, "epoch": 4341} {"train_loss": -6.9487762451171875, "global_step": 182346, "epoch": 4341} {"train_loss": -7.046135902404785, "global_step": 182347, "epoch": 4341} {"train_loss": -7.21012020111084, "global_step": 182348, "epoch": 4341} {"train_loss": -7.033747673034668, "global_step": 182349, "epoch": 4341} {"train_loss": -7.118277549743652, "global_step": 182350, "epoch": 4341} {"train_loss": -7.053504943847656, "global_step": 182351, "epoch": 4341} {"train_loss": -7.016064643859863, "global_step": 182352, "epoch": 4341} {"train_loss": -7.1891560554504395, "global_step": 182353, "epoch": 4341} {"train_loss": -7.06240177154541, "global_step": 182354, "epoch": 4341} {"train_loss": -7.042840003967285, "global_step": 182355, "epoch": 4341} {"train_loss": -7.023276329040527, "global_step": 182356, "epoch": 4341} {"train_loss": -7.143899440765381, "global_step": 182357, "epoch": 4341} {"train_loss": -7.122928142547607, "global_step": 182358, "epoch": 4341} {"train_loss": -6.95993185043335, "global_step": 182359, "epoch": 4341} {"train_loss": -7.126955509185791, "global_step": 182360, "epoch": 4341} {"train_loss": -7.098656177520752, "global_step": 182361, "epoch": 4341} {"train_loss": -7.069300651550293, "global_step": 182362, "epoch": 4341} {"train_loss": -7.051981732958839, "global_step": 182363, "epoch": 4341, "val_loss": 68675.2890625} {"train_loss": -7.108057022094727, "global_step": 182364, "epoch": 4342} {"train_loss": -6.975027561187744, "global_step": 182365, "epoch": 4342} {"train_loss": -7.055899620056152, "global_step": 182366, "epoch": 4342} {"train_loss": -7.1719794273376465, "global_step": 182367, "epoch": 4342} {"train_loss": -7.086607456207275, "global_step": 182368, "epoch": 4342} {"train_loss": -7.127857208251953, "global_step": 182369, "epoch": 4342} {"train_loss": -7.12099552154541, "global_step": 182370, "epoch": 4342} {"train_loss": -7.103426456451416, "global_step": 182371, "epoch": 4342} {"train_loss": -7.000589847564697, "global_step": 182372, "epoch": 4342} {"train_loss": -7.134584426879883, "global_step": 182373, "epoch": 4342} {"train_loss": -7.028853416442871, "global_step": 182374, "epoch": 4342} {"train_loss": -7.107626438140869, "global_step": 182375, "epoch": 4342} {"train_loss": -7.096515655517578, "global_step": 182376, "epoch": 4342} {"train_loss": -7.193100452423096, "global_step": 182377, "epoch": 4342} {"train_loss": -7.083600044250488, "global_step": 182378, "epoch": 4342} {"train_loss": -7.143075466156006, "global_step": 182379, "epoch": 4342} {"train_loss": -6.975099563598633, "global_step": 182380, "epoch": 4342} {"train_loss": -7.047659873962402, "global_step": 182381, "epoch": 4342} {"train_loss": -7.002042770385742, "global_step": 182382, "epoch": 4342} {"train_loss": -7.107007026672363, "global_step": 182383, "epoch": 4342} {"train_loss": -7.060118675231934, "global_step": 182384, "epoch": 4342} {"train_loss": -6.957082748413086, "global_step": 182385, "epoch": 4342} {"train_loss": -6.973933219909668, "global_step": 182386, "epoch": 4342} {"train_loss": -7.016994953155518, "global_step": 182387, "epoch": 4342} {"train_loss": -7.1323466300964355, "global_step": 182388, "epoch": 4342} {"train_loss": -7.050782203674316, "global_step": 182389, "epoch": 4342} {"train_loss": -7.114832401275635, "global_step": 182390, "epoch": 4342} {"train_loss": -7.143115043640137, "global_step": 182391, "epoch": 4342} {"train_loss": -7.196754455566406, "global_step": 182392, "epoch": 4342} {"train_loss": -7.099833011627197, "global_step": 182393, "epoch": 4342} {"train_loss": -7.14638614654541, "global_step": 182394, "epoch": 4342} {"train_loss": -7.044329643249512, "global_step": 182395, "epoch": 4342} {"train_loss": -7.171609878540039, "global_step": 182396, "epoch": 4342} {"train_loss": -7.189043045043945, "global_step": 182397, "epoch": 4342} {"train_loss": -7.118264198303223, "global_step": 182398, "epoch": 4342} {"train_loss": -7.182626724243164, "global_step": 182399, "epoch": 4342} {"train_loss": -7.092562675476074, "global_step": 182400, "epoch": 4342} {"train_loss": -7.112331867218018, "global_step": 182401, "epoch": 4342} {"train_loss": -7.195155143737793, "global_step": 182402, "epoch": 4342} {"train_loss": -7.1340742111206055, "global_step": 182403, "epoch": 4342} {"train_loss": -7.02125883102417, "global_step": 182404, "epoch": 4342} {"train_loss": -7.095030466715495, "global_step": 182405, "epoch": 4342, "val_loss": 68825.96875} {"train_loss": -7.002992153167725, "global_step": 182406, "epoch": 4343} {"train_loss": -6.943747043609619, "global_step": 182407, "epoch": 4343} {"train_loss": -7.156180381774902, "global_step": 182408, "epoch": 4343} {"train_loss": -7.156529426574707, "global_step": 182409, "epoch": 4343} {"train_loss": -7.155252933502197, "global_step": 182410, "epoch": 4343} {"train_loss": -7.108447074890137, "global_step": 182411, "epoch": 4343} {"train_loss": -7.156115531921387, "global_step": 182412, "epoch": 4343} {"train_loss": -6.897518157958984, "global_step": 182413, "epoch": 4343} {"train_loss": -7.177152633666992, "global_step": 182414, "epoch": 4343} {"train_loss": -7.010378837585449, "global_step": 182415, "epoch": 4343} {"train_loss": -7.138742923736572, "global_step": 182416, "epoch": 4343} {"train_loss": -7.121914386749268, "global_step": 182417, "epoch": 4343} {"train_loss": -6.9878411293029785, "global_step": 182418, "epoch": 4343} {"train_loss": -7.101111888885498, "global_step": 182419, "epoch": 4343} {"train_loss": -7.107309341430664, "global_step": 182420, "epoch": 4343} {"train_loss": -7.081900596618652, "global_step": 182421, "epoch": 4343} {"train_loss": -7.076348304748535, "global_step": 182422, "epoch": 4343} {"train_loss": -7.066293716430664, "global_step": 182423, "epoch": 4343} {"train_loss": -7.109702110290527, "global_step": 182424, "epoch": 4343} {"train_loss": -7.175833702087402, "global_step": 182425, "epoch": 4343} {"train_loss": -6.868947982788086, "global_step": 182426, "epoch": 4343} {"train_loss": -6.941728591918945, "global_step": 182427, "epoch": 4343} {"train_loss": -7.153169631958008, "global_step": 182428, "epoch": 4343} {"train_loss": -7.0100274085998535, "global_step": 182429, "epoch": 4343} {"train_loss": -6.984604835510254, "global_step": 182430, "epoch": 4343} {"train_loss": -7.028167247772217, "global_step": 182431, "epoch": 4343} {"train_loss": -6.929405212402344, "global_step": 182432, "epoch": 4343} {"train_loss": -7.134810447692871, "global_step": 182433, "epoch": 4343} {"train_loss": -7.05043888092041, "global_step": 182434, "epoch": 4343} {"train_loss": -7.014162063598633, "global_step": 182435, "epoch": 4343} {"train_loss": -7.114284515380859, "global_step": 182436, "epoch": 4343} {"train_loss": -7.04440450668335, "global_step": 182437, "epoch": 4343} {"train_loss": -7.150086879730225, "global_step": 182438, "epoch": 4343} {"train_loss": -7.143982887268066, "global_step": 182439, "epoch": 4343} {"train_loss": -7.182268142700195, "global_step": 182440, "epoch": 4343} {"train_loss": -7.186081409454346, "global_step": 182441, "epoch": 4343} {"train_loss": -7.2086944580078125, "global_step": 182442, "epoch": 4343} {"train_loss": -7.0545454025268555, "global_step": 182443, "epoch": 4343} {"train_loss": -7.072408199310303, "global_step": 182444, "epoch": 4343} {"train_loss": -7.063963413238525, "global_step": 182445, "epoch": 4343} {"train_loss": -7.139578342437744, "global_step": 182446, "epoch": 4343} {"train_loss": -7.078010252543858, "global_step": 182447, "epoch": 4343, "val_loss": 68800.671875} {"train_loss": -6.924869537353516, "global_step": 182448, "epoch": 4344} {"train_loss": -7.01705265045166, "global_step": 182449, "epoch": 4344} {"train_loss": -7.060593605041504, "global_step": 182450, "epoch": 4344} {"train_loss": -7.131577968597412, "global_step": 182451, "epoch": 4344} {"train_loss": -7.153858184814453, "global_step": 182452, "epoch": 4344} {"train_loss": -7.069843292236328, "global_step": 182453, "epoch": 4344} {"train_loss": -7.091041088104248, "global_step": 182454, "epoch": 4344} {"train_loss": -6.982077598571777, "global_step": 182455, "epoch": 4344} {"train_loss": -7.189099311828613, "global_step": 182456, "epoch": 4344} {"train_loss": -7.181915760040283, "global_step": 182457, "epoch": 4344} {"train_loss": -6.925601959228516, "global_step": 182458, "epoch": 4344} {"train_loss": -7.175385475158691, "global_step": 182459, "epoch": 4344} {"train_loss": -7.121092796325684, "global_step": 182460, "epoch": 4344} {"train_loss": -7.137786865234375, "global_step": 182461, "epoch": 4344} {"train_loss": -7.066971778869629, "global_step": 182462, "epoch": 4344} {"train_loss": -7.095690727233887, "global_step": 182463, "epoch": 4344} {"train_loss": -7.02812385559082, "global_step": 182464, "epoch": 4344} {"train_loss": -7.133640766143799, "global_step": 182465, "epoch": 4344} {"train_loss": -7.119365692138672, "global_step": 182466, "epoch": 4344} {"train_loss": -7.089676856994629, "global_step": 182467, "epoch": 4344} {"train_loss": -7.263690948486328, "global_step": 182468, "epoch": 4344} {"train_loss": -6.987894058227539, "global_step": 182469, "epoch": 4344} {"train_loss": -6.988548278808594, "global_step": 182470, "epoch": 4344} {"train_loss": -7.11366081237793, "global_step": 182471, "epoch": 4344} {"train_loss": -6.962392807006836, "global_step": 182472, "epoch": 4344} {"train_loss": -6.974594593048096, "global_step": 182473, "epoch": 4344} {"train_loss": -7.088901519775391, "global_step": 182474, "epoch": 4344} {"train_loss": -7.071702003479004, "global_step": 182475, "epoch": 4344} {"train_loss": -7.097593307495117, "global_step": 182476, "epoch": 4344} {"train_loss": -7.204522609710693, "global_step": 182477, "epoch": 4344} {"train_loss": -7.042276382446289, "global_step": 182478, "epoch": 4344} {"train_loss": -7.1314616203308105, "global_step": 182479, "epoch": 4344} {"train_loss": -6.980048656463623, "global_step": 182480, "epoch": 4344} {"train_loss": -7.0366058349609375, "global_step": 182481, "epoch": 4344} {"train_loss": -7.02047872543335, "global_step": 182482, "epoch": 4344} {"train_loss": -7.008293151855469, "global_step": 182483, "epoch": 4344} {"train_loss": -6.969326019287109, "global_step": 182484, "epoch": 4344} {"train_loss": -7.0631489753723145, "global_step": 182485, "epoch": 4344} {"train_loss": -7.105399131774902, "global_step": 182486, "epoch": 4344} {"train_loss": -7.186197757720947, "global_step": 182487, "epoch": 4344} {"train_loss": -7.110346794128418, "global_step": 182488, "epoch": 4344} {"train_loss": -7.076930897576468, "global_step": 182489, "epoch": 4344, "val_loss": 68967.5078125} {"train_loss": -7.127863883972168, "global_step": 182490, "epoch": 4345} {"train_loss": -7.158083915710449, "global_step": 182491, "epoch": 4345} {"train_loss": -7.141387939453125, "global_step": 182492, "epoch": 4345} {"train_loss": -7.083685874938965, "global_step": 182493, "epoch": 4345} {"train_loss": -7.146503448486328, "global_step": 182494, "epoch": 4345} {"train_loss": -7.097533702850342, "global_step": 182495, "epoch": 4345} {"train_loss": -7.068996429443359, "global_step": 182496, "epoch": 4345} {"train_loss": -7.210849761962891, "global_step": 182497, "epoch": 4345} {"train_loss": -7.065040588378906, "global_step": 182498, "epoch": 4345} {"train_loss": -7.077065467834473, "global_step": 182499, "epoch": 4345} {"train_loss": -7.015171051025391, "global_step": 182500, "epoch": 4345} {"train_loss": -7.093658924102783, "global_step": 182501, "epoch": 4345} {"train_loss": -6.9758100509643555, "global_step": 182502, "epoch": 4345} {"train_loss": -6.972969055175781, "global_step": 182503, "epoch": 4345} {"train_loss": -7.13059139251709, "global_step": 182504, "epoch": 4345} {"train_loss": -6.9827094078063965, "global_step": 182505, "epoch": 4345} {"train_loss": -7.09229850769043, "global_step": 182506, "epoch": 4345} {"train_loss": -7.024285793304443, "global_step": 182507, "epoch": 4345} {"train_loss": -7.06271505355835, "global_step": 182508, "epoch": 4345} {"train_loss": -7.063736915588379, "global_step": 182509, "epoch": 4345} {"train_loss": -6.947629451751709, "global_step": 182510, "epoch": 4345} {"train_loss": -6.985063552856445, "global_step": 182511, "epoch": 4345} {"train_loss": -7.05072021484375, "global_step": 182512, "epoch": 4345} {"train_loss": -7.115362167358398, "global_step": 182513, "epoch": 4345} {"train_loss": -7.029515266418457, "global_step": 182514, "epoch": 4345} {"train_loss": -7.087213039398193, "global_step": 182515, "epoch": 4345} {"train_loss": -7.018393516540527, "global_step": 182516, "epoch": 4345} {"train_loss": -7.089082717895508, "global_step": 182517, "epoch": 4345} {"train_loss": -7.169690132141113, "global_step": 182518, "epoch": 4345} {"train_loss": -7.105341911315918, "global_step": 182519, "epoch": 4345} {"train_loss": -7.116430282592773, "global_step": 182520, "epoch": 4345} {"train_loss": -7.056246757507324, "global_step": 182521, "epoch": 4345} {"train_loss": -7.101861000061035, "global_step": 182522, "epoch": 4345} {"train_loss": -7.178905010223389, "global_step": 182523, "epoch": 4345} {"train_loss": -7.23578405380249, "global_step": 182524, "epoch": 4345} {"train_loss": -7.007874965667725, "global_step": 182525, "epoch": 4345} {"train_loss": -7.142037391662598, "global_step": 182526, "epoch": 4345} {"train_loss": -7.088969707489014, "global_step": 182527, "epoch": 4345} {"train_loss": -7.0773210525512695, "global_step": 182528, "epoch": 4345} {"train_loss": -6.985287666320801, "global_step": 182529, "epoch": 4345} {"train_loss": -7.089471340179443, "global_step": 182530, "epoch": 4345} {"train_loss": -7.078736373356411, "global_step": 182531, "epoch": 4345, "val_loss": 68795.78125} {"train_loss": -7.191280364990234, "global_step": 182532, "epoch": 4346} {"train_loss": -7.061272621154785, "global_step": 182533, "epoch": 4346} {"train_loss": -7.0354814529418945, "global_step": 182534, "epoch": 4346} {"train_loss": -7.079906463623047, "global_step": 182535, "epoch": 4346} {"train_loss": -6.973836898803711, "global_step": 182536, "epoch": 4346} {"train_loss": -7.088022232055664, "global_step": 182537, "epoch": 4346} {"train_loss": -7.139547824859619, "global_step": 182538, "epoch": 4346} {"train_loss": -6.9770660400390625, "global_step": 182539, "epoch": 4346} {"train_loss": -7.038060188293457, "global_step": 182540, "epoch": 4346} {"train_loss": -7.040517330169678, "global_step": 182541, "epoch": 4346} {"train_loss": -7.114300727844238, "global_step": 182542, "epoch": 4346} {"train_loss": -7.040464401245117, "global_step": 182543, "epoch": 4346} {"train_loss": -7.206596374511719, "global_step": 182544, "epoch": 4346} {"train_loss": -7.1259870529174805, "global_step": 182545, "epoch": 4346} {"train_loss": -7.103555679321289, "global_step": 182546, "epoch": 4346} {"train_loss": -7.108404159545898, "global_step": 182547, "epoch": 4346} {"train_loss": -7.032878875732422, "global_step": 182548, "epoch": 4346} {"train_loss": -7.07948637008667, "global_step": 182549, "epoch": 4346} {"train_loss": -7.015436172485352, "global_step": 182550, "epoch": 4346} {"train_loss": -7.107823371887207, "global_step": 182551, "epoch": 4346} {"train_loss": -7.125860691070557, "global_step": 182552, "epoch": 4346} {"train_loss": -7.124196529388428, "global_step": 182553, "epoch": 4346} {"train_loss": -7.152194023132324, "global_step": 182554, "epoch": 4346} {"train_loss": -7.151902198791504, "global_step": 182555, "epoch": 4346} {"train_loss": -7.221791744232178, "global_step": 182556, "epoch": 4346} {"train_loss": -7.054128646850586, "global_step": 182557, "epoch": 4346} {"train_loss": -7.143841743469238, "global_step": 182558, "epoch": 4346} {"train_loss": -7.175344467163086, "global_step": 182559, "epoch": 4346} {"train_loss": -7.149013042449951, "global_step": 182560, "epoch": 4346} {"train_loss": -7.184032917022705, "global_step": 182561, "epoch": 4346} {"train_loss": -7.176752090454102, "global_step": 182562, "epoch": 4346} {"train_loss": -7.171184539794922, "global_step": 182563, "epoch": 4346} {"train_loss": -7.096384048461914, "global_step": 182564, "epoch": 4346} {"train_loss": -7.244390487670898, "global_step": 182565, "epoch": 4346} {"train_loss": -7.09853982925415, "global_step": 182566, "epoch": 4346} {"train_loss": -7.194281578063965, "global_step": 182567, "epoch": 4346} {"train_loss": -7.129397392272949, "global_step": 182568, "epoch": 4346} {"train_loss": -7.2470903396606445, "global_step": 182569, "epoch": 4346} {"train_loss": -7.061258316040039, "global_step": 182570, "epoch": 4346} {"train_loss": -7.101521015167236, "global_step": 182571, "epoch": 4346} {"train_loss": -7.218825817108154, "global_step": 182572, "epoch": 4346} {"train_loss": -7.1156496206919355, "global_step": 182573, "epoch": 4346, "val_loss": 68859.7890625} {"train_loss": -7.165726184844971, "global_step": 182574, "epoch": 4347} {"train_loss": -7.1005330085754395, "global_step": 182575, "epoch": 4347} {"train_loss": -7.115754127502441, "global_step": 182576, "epoch": 4347} {"train_loss": -6.980738162994385, "global_step": 182577, "epoch": 4347} {"train_loss": -7.081577301025391, "global_step": 182578, "epoch": 4347} {"train_loss": -6.976628303527832, "global_step": 182579, "epoch": 4347} {"train_loss": -7.076820373535156, "global_step": 182580, "epoch": 4347} {"train_loss": -7.0937180519104, "global_step": 182581, "epoch": 4347} {"train_loss": -7.17752742767334, "global_step": 182582, "epoch": 4347} {"train_loss": -7.07908296585083, "global_step": 182583, "epoch": 4347} {"train_loss": -7.053170204162598, "global_step": 182584, "epoch": 4347} {"train_loss": -7.183096885681152, "global_step": 182585, "epoch": 4347} {"train_loss": -7.055643558502197, "global_step": 182586, "epoch": 4347} {"train_loss": -6.990349769592285, "global_step": 182587, "epoch": 4347} {"train_loss": -7.092207431793213, "global_step": 182588, "epoch": 4347} {"train_loss": -7.046309471130371, "global_step": 182589, "epoch": 4347} {"train_loss": -7.046662330627441, "global_step": 182590, "epoch": 4347} {"train_loss": -6.980887413024902, "global_step": 182591, "epoch": 4347} {"train_loss": -6.969209671020508, "global_step": 182592, "epoch": 4347} {"train_loss": -7.029034614562988, "global_step": 182593, "epoch": 4347} {"train_loss": -7.0579118728637695, "global_step": 182594, "epoch": 4347} {"train_loss": -6.979989528656006, "global_step": 182595, "epoch": 4347} {"train_loss": -7.119578838348389, "global_step": 182596, "epoch": 4347} {"train_loss": -7.044366836547852, "global_step": 182597, "epoch": 4347} {"train_loss": -7.109337329864502, "global_step": 182598, "epoch": 4347} {"train_loss": -7.1713104248046875, "global_step": 182599, "epoch": 4347} {"train_loss": -7.124866485595703, "global_step": 182600, "epoch": 4347} {"train_loss": -7.050726890563965, "global_step": 182601, "epoch": 4347} {"train_loss": -7.094607353210449, "global_step": 182602, "epoch": 4347} {"train_loss": -7.061221599578857, "global_step": 182603, "epoch": 4347} {"train_loss": -7.094342231750488, "global_step": 182604, "epoch": 4347} {"train_loss": -7.001548767089844, "global_step": 182605, "epoch": 4347} {"train_loss": -7.089831352233887, "global_step": 182606, "epoch": 4347} {"train_loss": -6.779936790466309, "global_step": 182607, "epoch": 4347} {"train_loss": -6.784090518951416, "global_step": 182608, "epoch": 4347} {"train_loss": -7.043484687805176, "global_step": 182609, "epoch": 4347} {"train_loss": -6.7823638916015625, "global_step": 182610, "epoch": 4347} {"train_loss": -6.985870838165283, "global_step": 182611, "epoch": 4347} {"train_loss": -6.873708248138428, "global_step": 182612, "epoch": 4347} {"train_loss": -7.02540397644043, "global_step": 182613, "epoch": 4347} {"train_loss": -6.986883163452148, "global_step": 182614, "epoch": 4347} {"train_loss": -7.036044994990031, "global_step": 182615, "epoch": 4347, "val_loss": 68878.921875} {"train_loss": -7.039501667022705, "global_step": 182616, "epoch": 4348} {"train_loss": -7.038331031799316, "global_step": 182617, "epoch": 4348} {"train_loss": -7.105586051940918, "global_step": 182618, "epoch": 4348} {"train_loss": -7.006631851196289, "global_step": 182619, "epoch": 4348} {"train_loss": -6.917322158813477, "global_step": 182620, "epoch": 4348} {"train_loss": -7.017509937286377, "global_step": 182621, "epoch": 4348} {"train_loss": -6.855381965637207, "global_step": 182622, "epoch": 4348} {"train_loss": -7.173847198486328, "global_step": 182623, "epoch": 4348} {"train_loss": -7.042259693145752, "global_step": 182624, "epoch": 4348} {"train_loss": -6.993760585784912, "global_step": 182625, "epoch": 4348} {"train_loss": -6.925494194030762, "global_step": 182626, "epoch": 4348} {"train_loss": -7.170863151550293, "global_step": 182627, "epoch": 4348} {"train_loss": -6.908811569213867, "global_step": 182628, "epoch": 4348} {"train_loss": -7.0614519119262695, "global_step": 182629, "epoch": 4348} {"train_loss": -7.086246013641357, "global_step": 182630, "epoch": 4348} {"train_loss": -6.940691947937012, "global_step": 182631, "epoch": 4348} {"train_loss": -6.9841742515563965, "global_step": 182632, "epoch": 4348} {"train_loss": -7.017770290374756, "global_step": 182633, "epoch": 4348} {"train_loss": -7.171930313110352, "global_step": 182634, "epoch": 4348} {"train_loss": -7.0379486083984375, "global_step": 182635, "epoch": 4348} {"train_loss": -6.990245342254639, "global_step": 182636, "epoch": 4348} {"train_loss": -7.157805442810059, "global_step": 182637, "epoch": 4348} {"train_loss": -7.117877960205078, "global_step": 182638, "epoch": 4348} {"train_loss": -6.988982200622559, "global_step": 182639, "epoch": 4348} {"train_loss": -7.069599151611328, "global_step": 182640, "epoch": 4348} {"train_loss": -7.170034408569336, "global_step": 182641, "epoch": 4348} {"train_loss": -7.098316669464111, "global_step": 182642, "epoch": 4348} {"train_loss": -6.9886674880981445, "global_step": 182643, "epoch": 4348} {"train_loss": -7.134187698364258, "global_step": 182644, "epoch": 4348} {"train_loss": -7.106601238250732, "global_step": 182645, "epoch": 4348} {"train_loss": -6.980253219604492, "global_step": 182646, "epoch": 4348} {"train_loss": -7.227423191070557, "global_step": 182647, "epoch": 4348} {"train_loss": -7.150376319885254, "global_step": 182648, "epoch": 4348} {"train_loss": -7.032071590423584, "global_step": 182649, "epoch": 4348} {"train_loss": -7.172159194946289, "global_step": 182650, "epoch": 4348} {"train_loss": -7.05048942565918, "global_step": 182651, "epoch": 4348} {"train_loss": -7.026297569274902, "global_step": 182652, "epoch": 4348} {"train_loss": -7.1296281814575195, "global_step": 182653, "epoch": 4348} {"train_loss": -7.0706868171691895, "global_step": 182654, "epoch": 4348} {"train_loss": -7.069486618041992, "global_step": 182655, "epoch": 4348} {"train_loss": -7.057620525360107, "global_step": 182656, "epoch": 4348} {"train_loss": -7.056477989469256, "global_step": 182657, "epoch": 4348, "val_loss": 68789.8828125} {"train_loss": -6.975133419036865, "global_step": 182658, "epoch": 4349} {"train_loss": -7.146943092346191, "global_step": 182659, "epoch": 4349} {"train_loss": -7.117114067077637, "global_step": 182660, "epoch": 4349} {"train_loss": -7.15123176574707, "global_step": 182661, "epoch": 4349} {"train_loss": -7.055890083312988, "global_step": 182662, "epoch": 4349} {"train_loss": -7.064069747924805, "global_step": 182663, "epoch": 4349} {"train_loss": -7.106631278991699, "global_step": 182664, "epoch": 4349} {"train_loss": -7.104705333709717, "global_step": 182665, "epoch": 4349} {"train_loss": -7.022017955780029, "global_step": 182666, "epoch": 4349} {"train_loss": -7.024452209472656, "global_step": 182667, "epoch": 4349} {"train_loss": -6.9927592277526855, "global_step": 182668, "epoch": 4349} {"train_loss": -7.0600666999816895, "global_step": 182669, "epoch": 4349} {"train_loss": -7.13297176361084, "global_step": 182670, "epoch": 4349} {"train_loss": -7.027761459350586, "global_step": 182671, "epoch": 4349} {"train_loss": -7.125491142272949, "global_step": 182672, "epoch": 4349} {"train_loss": -7.090781211853027, "global_step": 182673, "epoch": 4349} {"train_loss": -7.156832695007324, "global_step": 182674, "epoch": 4349} {"train_loss": -7.040167808532715, "global_step": 182675, "epoch": 4349} {"train_loss": -7.160228252410889, "global_step": 182676, "epoch": 4349} {"train_loss": -7.125324726104736, "global_step": 182677, "epoch": 4349} {"train_loss": -7.142618179321289, "global_step": 182678, "epoch": 4349} {"train_loss": -7.159028053283691, "global_step": 182679, "epoch": 4349} {"train_loss": -7.214812278747559, "global_step": 182680, "epoch": 4349} {"train_loss": -7.02957820892334, "global_step": 182681, "epoch": 4349} {"train_loss": -7.330047130584717, "global_step": 182682, "epoch": 4349} {"train_loss": -7.064421653747559, "global_step": 182683, "epoch": 4349} {"train_loss": -7.1509504318237305, "global_step": 182684, "epoch": 4349} {"train_loss": -7.177216529846191, "global_step": 182685, "epoch": 4349} {"train_loss": -7.107346057891846, "global_step": 182686, "epoch": 4349} {"train_loss": -7.099878787994385, "global_step": 182687, "epoch": 4349} {"train_loss": -7.066144943237305, "global_step": 182688, "epoch": 4349} {"train_loss": -7.159238815307617, "global_step": 182689, "epoch": 4349} {"train_loss": -7.086688995361328, "global_step": 182690, "epoch": 4349} {"train_loss": -7.101701736450195, "global_step": 182691, "epoch": 4349} {"train_loss": -7.068874359130859, "global_step": 182692, "epoch": 4349} {"train_loss": -6.966031074523926, "global_step": 182693, "epoch": 4349} {"train_loss": -7.081529140472412, "global_step": 182694, "epoch": 4349} {"train_loss": -6.964883327484131, "global_step": 182695, "epoch": 4349} {"train_loss": -6.793362617492676, "global_step": 182696, "epoch": 4349} {"train_loss": -7.122378826141357, "global_step": 182697, "epoch": 4349} {"train_loss": -6.975568771362305, "global_step": 182698, "epoch": 4349} {"train_loss": -7.0854607082548595, "global_step": 182699, "epoch": 4349, "val_loss": 68897.5234375} {"train_loss": -7.036602973937988, "global_step": 182700, "epoch": 4350} {"train_loss": -7.001863479614258, "global_step": 182701, "epoch": 4350} {"train_loss": -7.099703788757324, "global_step": 182702, "epoch": 4350} {"train_loss": -7.038928985595703, "global_step": 182703, "epoch": 4350} {"train_loss": -7.045544624328613, "global_step": 182704, "epoch": 4350} {"train_loss": -7.09765625, "global_step": 182705, "epoch": 4350} {"train_loss": -7.083865165710449, "global_step": 182706, "epoch": 4350} {"train_loss": -6.976609230041504, "global_step": 182707, "epoch": 4350} {"train_loss": -7.011725425720215, "global_step": 182708, "epoch": 4350} {"train_loss": -6.965421676635742, "global_step": 182709, "epoch": 4350} {"train_loss": -7.037636756896973, "global_step": 182710, "epoch": 4350} {"train_loss": -7.1235880851745605, "global_step": 182711, "epoch": 4350} {"train_loss": -7.127543926239014, "global_step": 182712, "epoch": 4350} {"train_loss": -7.187755107879639, "global_step": 182713, "epoch": 4350} {"train_loss": -7.163325309753418, "global_step": 182714, "epoch": 4350} {"train_loss": -7.149155616760254, "global_step": 182715, "epoch": 4350} {"train_loss": -7.15715217590332, "global_step": 182716, "epoch": 4350} {"train_loss": -7.1537652015686035, "global_step": 182717, "epoch": 4350} {"train_loss": -7.193955898284912, "global_step": 182718, "epoch": 4350} {"train_loss": -7.00557804107666, "global_step": 182719, "epoch": 4350} {"train_loss": -7.020485877990723, "global_step": 182720, "epoch": 4350} {"train_loss": -7.072654724121094, "global_step": 182721, "epoch": 4350} {"train_loss": -7.025961875915527, "global_step": 182722, "epoch": 4350} {"train_loss": -7.003411293029785, "global_step": 182723, "epoch": 4350} {"train_loss": -7.072723865509033, "global_step": 182724, "epoch": 4350} {"train_loss": -6.972226619720459, "global_step": 182725, "epoch": 4350} {"train_loss": -7.073203086853027, "global_step": 182726, "epoch": 4350} {"train_loss": -7.156889915466309, "global_step": 182727, "epoch": 4350} {"train_loss": -6.924480438232422, "global_step": 182728, "epoch": 4350} {"train_loss": -7.097219944000244, "global_step": 182729, "epoch": 4350} {"train_loss": -7.098565101623535, "global_step": 182730, "epoch": 4350} {"train_loss": -7.089695930480957, "global_step": 182731, "epoch": 4350} {"train_loss": -7.103107452392578, "global_step": 182732, "epoch": 4350} {"train_loss": -7.055103778839111, "global_step": 182733, "epoch": 4350} {"train_loss": -7.1330156326293945, "global_step": 182734, "epoch": 4350} {"train_loss": -7.085790157318115, "global_step": 182735, "epoch": 4350} {"train_loss": -7.143704414367676, "global_step": 182736, "epoch": 4350} {"train_loss": -7.143045425415039, "global_step": 182737, "epoch": 4350} {"train_loss": -7.197705268859863, "global_step": 182738, "epoch": 4350} {"train_loss": -7.021738529205322, "global_step": 182739, "epoch": 4350} {"train_loss": -7.114548683166504, "global_step": 182740, "epoch": 4350} {"train_loss": -7.078292687733968, "global_step": 182741, "epoch": 4350, "train/sim_max_reward_0": 0.19994852381439862, "train/sim_max_reward_1": 0.8815880743602016, "train/sim_max_reward_2": 0.8109675618153399, "train/sim_max_reward_3": 0.13460607641895697, "train/sim_max_reward_4": 0.9165101106502461, "train/sim_max_reward_5": 0.9072420009808773, "test/sim_max_reward_4400000": 0.1881504195921789, "test/sim_max_reward_4400001": 0.23015603566407822, "test/sim_max_reward_4400002": 0.9726196709901587, "test/sim_max_reward_4400003": 0.7481515701692979, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.26640027506857444, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.8773059305073636, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.9073771340645491, "test/sim_max_reward_4400010": 0.1876206482049287, "test/sim_max_reward_4400011": 0.07367815791263908, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.7543193001044276, "test/sim_max_reward_4400014": 0.8897445216699611, "test/sim_max_reward_4400015": 0.0855603704476198, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.25117526533385054, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8789295752997848, "test/sim_max_reward_4400023": 0.4225697538554648, "test/sim_max_reward_4400024": 0.8737026688134271, "test/sim_max_reward_4400025": 0.2667124309277785, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.019640702044303304, "test/sim_max_reward_4400028": 0.4262702420977388, "test/sim_max_reward_4400029": 0.9463736830783473, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.948275689859273, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8798837732702026, "test/sim_max_reward_4400034": 0.9930405016826781, "test/sim_max_reward_4400035": 0.4609994541192371, "test/sim_max_reward_4400036": 0.9847348972069994, "test/sim_max_reward_4400037": 0.9796478020155978, "test/sim_max_reward_4400038": 0.9500494511188134, "test/sim_max_reward_4400039": 0.9437376123079462, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9543070307828248, "test/sim_max_reward_4400042": 0.5223176056124332, "test/sim_max_reward_4400043": 0.9369693079050678, "test/sim_max_reward_4400044": 0.6014916730774782, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.9317667212897673, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.8915522254719624, "test/sim_max_reward_4400049": 0.8676331516659282, "train/mean_score": 0.6418103913400034, "test/mean_score": 0.5776551800752499, "val_loss": 68749.1015625} {"train_loss": -7.1064043045043945, "global_step": 182742, "epoch": 4351} {"train_loss": -7.1304779052734375, "global_step": 182743, "epoch": 4351} {"train_loss": -7.101419925689697, "global_step": 182744, "epoch": 4351} {"train_loss": -7.1536993980407715, "global_step": 182745, "epoch": 4351} {"train_loss": -7.094918251037598, "global_step": 182746, "epoch": 4351} {"train_loss": -7.084255695343018, "global_step": 182747, "epoch": 4351} {"train_loss": -7.05246114730835, "global_step": 182748, "epoch": 4351} {"train_loss": -7.009078025817871, "global_step": 182749, "epoch": 4351} {"train_loss": -7.080702781677246, "global_step": 182750, "epoch": 4351} {"train_loss": -7.091991901397705, "global_step": 182751, "epoch": 4351} {"train_loss": -7.171247482299805, "global_step": 182752, "epoch": 4351} {"train_loss": -7.072633743286133, "global_step": 182753, "epoch": 4351} {"train_loss": -7.134625434875488, "global_step": 182754, "epoch": 4351} {"train_loss": -7.110992431640625, "global_step": 182755, "epoch": 4351} {"train_loss": -7.096837520599365, "global_step": 182756, "epoch": 4351} {"train_loss": -7.221123695373535, "global_step": 182757, "epoch": 4351} {"train_loss": -7.141914367675781, "global_step": 182758, "epoch": 4351} {"train_loss": -6.957058906555176, "global_step": 182759, "epoch": 4351} {"train_loss": -7.146537780761719, "global_step": 182760, "epoch": 4351} {"train_loss": -6.99678897857666, "global_step": 182761, "epoch": 4351} {"train_loss": -6.932411193847656, "global_step": 182762, "epoch": 4351} {"train_loss": -7.104255676269531, "global_step": 182763, "epoch": 4351} {"train_loss": -7.017351150512695, "global_step": 182764, "epoch": 4351} {"train_loss": -7.047748565673828, "global_step": 182765, "epoch": 4351} {"train_loss": -6.94633674621582, "global_step": 182766, "epoch": 4351} {"train_loss": -7.115194797515869, "global_step": 182767, "epoch": 4351} {"train_loss": -7.047314643859863, "global_step": 182768, "epoch": 4351} {"train_loss": -6.9453349113464355, "global_step": 182769, "epoch": 4351} {"train_loss": -7.035002708435059, "global_step": 182770, "epoch": 4351} {"train_loss": -6.966355323791504, "global_step": 182771, "epoch": 4351} {"train_loss": -7.053450107574463, "global_step": 182772, "epoch": 4351} {"train_loss": -7.033164024353027, "global_step": 182773, "epoch": 4351} {"train_loss": -7.030710697174072, "global_step": 182774, "epoch": 4351} {"train_loss": -7.096978187561035, "global_step": 182775, "epoch": 4351} {"train_loss": -7.135761737823486, "global_step": 182776, "epoch": 4351} {"train_loss": -7.13084602355957, "global_step": 182777, "epoch": 4351} {"train_loss": -7.143159866333008, "global_step": 182778, "epoch": 4351} {"train_loss": -7.075538635253906, "global_step": 182779, "epoch": 4351} {"train_loss": -7.118348598480225, "global_step": 182780, "epoch": 4351} {"train_loss": -7.225903511047363, "global_step": 182781, "epoch": 4351} {"train_loss": -7.176982879638672, "global_step": 182782, "epoch": 4351} {"train_loss": -7.083745752062116, "global_step": 182783, "epoch": 4351, "val_loss": 68777.625} {"train_loss": -7.091819763183594, "global_step": 182784, "epoch": 4352} {"train_loss": -7.096324443817139, "global_step": 182785, "epoch": 4352} {"train_loss": -6.916598796844482, "global_step": 182786, "epoch": 4352} {"train_loss": -7.21840238571167, "global_step": 182787, "epoch": 4352} {"train_loss": -7.143728256225586, "global_step": 182788, "epoch": 4352} {"train_loss": -7.115622520446777, "global_step": 182789, "epoch": 4352} {"train_loss": -7.111600875854492, "global_step": 182790, "epoch": 4352} {"train_loss": -7.115229606628418, "global_step": 182791, "epoch": 4352} {"train_loss": -7.232492923736572, "global_step": 182792, "epoch": 4352} {"train_loss": -7.174835205078125, "global_step": 182793, "epoch": 4352} {"train_loss": -7.228497505187988, "global_step": 182794, "epoch": 4352} {"train_loss": -7.104178428649902, "global_step": 182795, "epoch": 4352} {"train_loss": -7.174915313720703, "global_step": 182796, "epoch": 4352} {"train_loss": -7.200324058532715, "global_step": 182797, "epoch": 4352} {"train_loss": -7.056902885437012, "global_step": 182798, "epoch": 4352} {"train_loss": -7.1145477294921875, "global_step": 182799, "epoch": 4352} {"train_loss": -7.092106819152832, "global_step": 182800, "epoch": 4352} {"train_loss": -7.195619583129883, "global_step": 182801, "epoch": 4352} {"train_loss": -7.098546981811523, "global_step": 182802, "epoch": 4352} {"train_loss": -7.077835559844971, "global_step": 182803, "epoch": 4352} {"train_loss": -6.995045185089111, "global_step": 182804, "epoch": 4352} {"train_loss": -6.9719557762146, "global_step": 182805, "epoch": 4352} {"train_loss": -7.056451797485352, "global_step": 182806, "epoch": 4352} {"train_loss": -7.066976070404053, "global_step": 182807, "epoch": 4352} {"train_loss": -6.919721603393555, "global_step": 182808, "epoch": 4352} {"train_loss": -7.045147895812988, "global_step": 182809, "epoch": 4352} {"train_loss": -7.087236404418945, "global_step": 182810, "epoch": 4352} {"train_loss": -6.862053871154785, "global_step": 182811, "epoch": 4352} {"train_loss": -7.093349456787109, "global_step": 182812, "epoch": 4352} {"train_loss": -6.8592729568481445, "global_step": 182813, "epoch": 4352} {"train_loss": -7.065225601196289, "global_step": 182814, "epoch": 4352} {"train_loss": -7.150119304656982, "global_step": 182815, "epoch": 4352} {"train_loss": -6.8809356689453125, "global_step": 182816, "epoch": 4352} {"train_loss": -7.1030378341674805, "global_step": 182817, "epoch": 4352} {"train_loss": -7.0335540771484375, "global_step": 182818, "epoch": 4352} {"train_loss": -7.106886863708496, "global_step": 182819, "epoch": 4352} {"train_loss": -7.005311965942383, "global_step": 182820, "epoch": 4352} {"train_loss": -7.0484418869018555, "global_step": 182821, "epoch": 4352} {"train_loss": -7.072727203369141, "global_step": 182822, "epoch": 4352} {"train_loss": -7.1369829177856445, "global_step": 182823, "epoch": 4352} {"train_loss": -7.0576701164245605, "global_step": 182824, "epoch": 4352} {"train_loss": -7.079799663452875, "global_step": 182825, "epoch": 4352, "val_loss": 68905.90625} {"train_loss": -7.075349807739258, "global_step": 182826, "epoch": 4353} {"train_loss": -7.070542335510254, "global_step": 182827, "epoch": 4353} {"train_loss": -7.079730987548828, "global_step": 182828, "epoch": 4353} {"train_loss": -7.140964984893799, "global_step": 182829, "epoch": 4353} {"train_loss": -7.092365741729736, "global_step": 182830, "epoch": 4353} {"train_loss": -7.080084323883057, "global_step": 182831, "epoch": 4353} {"train_loss": -7.103982925415039, "global_step": 182832, "epoch": 4353} {"train_loss": -7.095211982727051, "global_step": 182833, "epoch": 4353} {"train_loss": -7.068779945373535, "global_step": 182834, "epoch": 4353} {"train_loss": -7.15836238861084, "global_step": 182835, "epoch": 4353} {"train_loss": -7.061152458190918, "global_step": 182836, "epoch": 4353} {"train_loss": -7.085133075714111, "global_step": 182837, "epoch": 4353} {"train_loss": -7.127402305603027, "global_step": 182838, "epoch": 4353} {"train_loss": -7.066596984863281, "global_step": 182839, "epoch": 4353} {"train_loss": -7.075313568115234, "global_step": 182840, "epoch": 4353} {"train_loss": -7.049900054931641, "global_step": 182841, "epoch": 4353} {"train_loss": -7.1161603927612305, "global_step": 182842, "epoch": 4353} {"train_loss": -7.124626159667969, "global_step": 182843, "epoch": 4353} {"train_loss": -7.057506084442139, "global_step": 182844, "epoch": 4353} {"train_loss": -6.985653877258301, "global_step": 182845, "epoch": 4353} {"train_loss": -7.056790351867676, "global_step": 182846, "epoch": 4353} {"train_loss": -7.016324043273926, "global_step": 182847, "epoch": 4353} {"train_loss": -7.160900592803955, "global_step": 182848, "epoch": 4353} {"train_loss": -7.13955020904541, "global_step": 182849, "epoch": 4353} {"train_loss": -6.941668510437012, "global_step": 182850, "epoch": 4353} {"train_loss": -7.217592716217041, "global_step": 182851, "epoch": 4353} {"train_loss": -7.062836170196533, "global_step": 182852, "epoch": 4353} {"train_loss": -7.045063018798828, "global_step": 182853, "epoch": 4353} {"train_loss": -7.015885353088379, "global_step": 182854, "epoch": 4353} {"train_loss": -7.014461517333984, "global_step": 182855, "epoch": 4353} {"train_loss": -7.0256500244140625, "global_step": 182856, "epoch": 4353} {"train_loss": -7.078243255615234, "global_step": 182857, "epoch": 4353} {"train_loss": -6.956722259521484, "global_step": 182858, "epoch": 4353} {"train_loss": -7.124117851257324, "global_step": 182859, "epoch": 4353} {"train_loss": -6.924942493438721, "global_step": 182860, "epoch": 4353} {"train_loss": -6.979823112487793, "global_step": 182861, "epoch": 4353} {"train_loss": -6.997575759887695, "global_step": 182862, "epoch": 4353} {"train_loss": -7.008856296539307, "global_step": 182863, "epoch": 4353} {"train_loss": -7.063813209533691, "global_step": 182864, "epoch": 4353} {"train_loss": -7.011083602905273, "global_step": 182865, "epoch": 4353} {"train_loss": -7.0626935958862305, "global_step": 182866, "epoch": 4353} {"train_loss": -7.063265948068528, "global_step": 182867, "epoch": 4353, "val_loss": 68901.8828125} {"train_loss": -7.097686767578125, "global_step": 182868, "epoch": 4354} {"train_loss": -7.1558990478515625, "global_step": 182869, "epoch": 4354} {"train_loss": -7.071777820587158, "global_step": 182870, "epoch": 4354} {"train_loss": -7.099082946777344, "global_step": 182871, "epoch": 4354} {"train_loss": -7.067255973815918, "global_step": 182872, "epoch": 4354} {"train_loss": -7.066437721252441, "global_step": 182873, "epoch": 4354} {"train_loss": -7.1295037269592285, "global_step": 182874, "epoch": 4354} {"train_loss": -6.95381498336792, "global_step": 182875, "epoch": 4354} {"train_loss": -7.075658798217773, "global_step": 182876, "epoch": 4354} {"train_loss": -7.134045600891113, "global_step": 182877, "epoch": 4354} {"train_loss": -7.070621967315674, "global_step": 182878, "epoch": 4354} {"train_loss": -7.080389022827148, "global_step": 182879, "epoch": 4354} {"train_loss": -7.119174480438232, "global_step": 182880, "epoch": 4354} {"train_loss": -7.100177764892578, "global_step": 182881, "epoch": 4354} {"train_loss": -7.188543319702148, "global_step": 182882, "epoch": 4354} {"train_loss": -7.066915512084961, "global_step": 182883, "epoch": 4354} {"train_loss": -7.081184387207031, "global_step": 182884, "epoch": 4354} {"train_loss": -7.103646278381348, "global_step": 182885, "epoch": 4354} {"train_loss": -7.097988128662109, "global_step": 182886, "epoch": 4354} {"train_loss": -7.099720478057861, "global_step": 182887, "epoch": 4354} {"train_loss": -7.108908653259277, "global_step": 182888, "epoch": 4354} {"train_loss": -7.125504493713379, "global_step": 182889, "epoch": 4354} {"train_loss": -7.087342739105225, "global_step": 182890, "epoch": 4354} {"train_loss": -7.231130599975586, "global_step": 182891, "epoch": 4354} {"train_loss": -7.052126884460449, "global_step": 182892, "epoch": 4354} {"train_loss": -7.063667297363281, "global_step": 182893, "epoch": 4354} {"train_loss": -7.156371593475342, "global_step": 182894, "epoch": 4354} {"train_loss": -7.2125139236450195, "global_step": 182895, "epoch": 4354} {"train_loss": -7.036555290222168, "global_step": 182896, "epoch": 4354} {"train_loss": -7.043630599975586, "global_step": 182897, "epoch": 4354} {"train_loss": -7.101644039154053, "global_step": 182898, "epoch": 4354} {"train_loss": -7.169685363769531, "global_step": 182899, "epoch": 4354} {"train_loss": -7.09306001663208, "global_step": 182900, "epoch": 4354} {"train_loss": -7.0877909660339355, "global_step": 182901, "epoch": 4354} {"train_loss": -7.197792053222656, "global_step": 182902, "epoch": 4354} {"train_loss": -7.10147762298584, "global_step": 182903, "epoch": 4354} {"train_loss": -7.142036437988281, "global_step": 182904, "epoch": 4354} {"train_loss": -7.039102077484131, "global_step": 182905, "epoch": 4354} {"train_loss": -7.274213790893555, "global_step": 182906, "epoch": 4354} {"train_loss": -7.1819257736206055, "global_step": 182907, "epoch": 4354} {"train_loss": -7.115512847900391, "global_step": 182908, "epoch": 4354} {"train_loss": -7.109699885050456, "global_step": 182909, "epoch": 4354, "val_loss": 68726.421875} {"train_loss": -7.14306640625, "global_step": 182910, "epoch": 4355} {"train_loss": -7.048267364501953, "global_step": 182911, "epoch": 4355} {"train_loss": -7.0668439865112305, "global_step": 182912, "epoch": 4355} {"train_loss": -7.116549015045166, "global_step": 182913, "epoch": 4355} {"train_loss": -7.182985305786133, "global_step": 182914, "epoch": 4355} {"train_loss": -7.045270919799805, "global_step": 182915, "epoch": 4355} {"train_loss": -7.12012243270874, "global_step": 182916, "epoch": 4355} {"train_loss": -7.202456474304199, "global_step": 182917, "epoch": 4355} {"train_loss": -7.098293304443359, "global_step": 182918, "epoch": 4355} {"train_loss": -7.165347576141357, "global_step": 182919, "epoch": 4355} {"train_loss": -7.075377464294434, "global_step": 182920, "epoch": 4355} {"train_loss": -7.108755588531494, "global_step": 182921, "epoch": 4355} {"train_loss": -7.151007652282715, "global_step": 182922, "epoch": 4355} {"train_loss": -7.078917026519775, "global_step": 182923, "epoch": 4355} {"train_loss": -7.108263969421387, "global_step": 182924, "epoch": 4355} {"train_loss": -7.026423454284668, "global_step": 182925, "epoch": 4355} {"train_loss": -7.100313186645508, "global_step": 182926, "epoch": 4355} {"train_loss": -7.0009870529174805, "global_step": 182927, "epoch": 4355} {"train_loss": -7.097496032714844, "global_step": 182928, "epoch": 4355} {"train_loss": -7.089011192321777, "global_step": 182929, "epoch": 4355} {"train_loss": -7.044116973876953, "global_step": 182930, "epoch": 4355} {"train_loss": -6.94378137588501, "global_step": 182931, "epoch": 4355} {"train_loss": -7.079814910888672, "global_step": 182932, "epoch": 4355} {"train_loss": -6.9904046058654785, "global_step": 182933, "epoch": 4355} {"train_loss": -7.170131206512451, "global_step": 182934, "epoch": 4355} {"train_loss": -7.083296775817871, "global_step": 182935, "epoch": 4355} {"train_loss": -6.951015472412109, "global_step": 182936, "epoch": 4355} {"train_loss": -7.0289306640625, "global_step": 182937, "epoch": 4355} {"train_loss": -7.076020240783691, "global_step": 182938, "epoch": 4355} {"train_loss": -7.084784507751465, "global_step": 182939, "epoch": 4355} {"train_loss": -7.127995014190674, "global_step": 182940, "epoch": 4355} {"train_loss": -7.06026554107666, "global_step": 182941, "epoch": 4355} {"train_loss": -7.116553783416748, "global_step": 182942, "epoch": 4355} {"train_loss": -7.065704345703125, "global_step": 182943, "epoch": 4355} {"train_loss": -7.1354570388793945, "global_step": 182944, "epoch": 4355} {"train_loss": -7.175771713256836, "global_step": 182945, "epoch": 4355} {"train_loss": -7.119044303894043, "global_step": 182946, "epoch": 4355} {"train_loss": -7.054078578948975, "global_step": 182947, "epoch": 4355} {"train_loss": -7.068957328796387, "global_step": 182948, "epoch": 4355} {"train_loss": -7.072846412658691, "global_step": 182949, "epoch": 4355} {"train_loss": -6.942563056945801, "global_step": 182950, "epoch": 4355} {"train_loss": -7.085672878083729, "global_step": 182951, "epoch": 4355, "val_loss": 68923.90625} {"train_loss": -6.9651899337768555, "global_step": 182952, "epoch": 4356} {"train_loss": -7.047870635986328, "global_step": 182953, "epoch": 4356} {"train_loss": -7.1473069190979, "global_step": 182954, "epoch": 4356} {"train_loss": -6.978823661804199, "global_step": 182955, "epoch": 4356} {"train_loss": -7.07158088684082, "global_step": 182956, "epoch": 4356} {"train_loss": -7.012611389160156, "global_step": 182957, "epoch": 4356} {"train_loss": -7.005441665649414, "global_step": 182958, "epoch": 4356} {"train_loss": -7.0744123458862305, "global_step": 182959, "epoch": 4356} {"train_loss": -6.946091175079346, "global_step": 182960, "epoch": 4356} {"train_loss": -7.0724101066589355, "global_step": 182961, "epoch": 4356} {"train_loss": -7.012372970581055, "global_step": 182962, "epoch": 4356} {"train_loss": -7.04642391204834, "global_step": 182963, "epoch": 4356} {"train_loss": -7.0964155197143555, "global_step": 182964, "epoch": 4356} {"train_loss": -7.0737714767456055, "global_step": 182965, "epoch": 4356} {"train_loss": -7.003775596618652, "global_step": 182966, "epoch": 4356} {"train_loss": -7.018741130828857, "global_step": 182967, "epoch": 4356} {"train_loss": -6.913989543914795, "global_step": 182968, "epoch": 4356} {"train_loss": -7.1361260414123535, "global_step": 182969, "epoch": 4356} {"train_loss": -7.0040459632873535, "global_step": 182970, "epoch": 4356} {"train_loss": -6.943290710449219, "global_step": 182971, "epoch": 4356} {"train_loss": -7.0231828689575195, "global_step": 182972, "epoch": 4356} {"train_loss": -7.0404462814331055, "global_step": 182973, "epoch": 4356} {"train_loss": -7.016440391540527, "global_step": 182974, "epoch": 4356} {"train_loss": -7.07856559753418, "global_step": 182975, "epoch": 4356} {"train_loss": -7.124360084533691, "global_step": 182976, "epoch": 4356} {"train_loss": -7.055617809295654, "global_step": 182977, "epoch": 4356} {"train_loss": -7.127407550811768, "global_step": 182978, "epoch": 4356} {"train_loss": -7.122135162353516, "global_step": 182979, "epoch": 4356} {"train_loss": -7.113164901733398, "global_step": 182980, "epoch": 4356} {"train_loss": -7.129679203033447, "global_step": 182981, "epoch": 4356} {"train_loss": -7.168950080871582, "global_step": 182982, "epoch": 4356} {"train_loss": -7.114171028137207, "global_step": 182983, "epoch": 4356} {"train_loss": -6.98754358291626, "global_step": 182984, "epoch": 4356} {"train_loss": -7.06673526763916, "global_step": 182985, "epoch": 4356} {"train_loss": -7.15582799911499, "global_step": 182986, "epoch": 4356} {"train_loss": -7.0559282302856445, "global_step": 182987, "epoch": 4356} {"train_loss": -7.058454513549805, "global_step": 182988, "epoch": 4356} {"train_loss": -7.174662113189697, "global_step": 182989, "epoch": 4356} {"train_loss": -7.152682304382324, "global_step": 182990, "epoch": 4356} {"train_loss": -7.109053611755371, "global_step": 182991, "epoch": 4356} {"train_loss": -7.083883285522461, "global_step": 182992, "epoch": 4356} {"train_loss": -7.062084606715611, "global_step": 182993, "epoch": 4356, "val_loss": 68719.9765625} {"train_loss": -7.05499267578125, "global_step": 182994, "epoch": 4357} {"train_loss": -7.175579071044922, "global_step": 182995, "epoch": 4357} {"train_loss": -7.095736503601074, "global_step": 182996, "epoch": 4357} {"train_loss": -7.117188930511475, "global_step": 182997, "epoch": 4357} {"train_loss": -7.064590930938721, "global_step": 182998, "epoch": 4357} {"train_loss": -7.15915584564209, "global_step": 182999, "epoch": 4357} {"train_loss": -7.165470600128174, "global_step": 183000, "epoch": 4357} {"train_loss": -7.053335666656494, "global_step": 183001, "epoch": 4357} {"train_loss": -7.076930046081543, "global_step": 183002, "epoch": 4357} {"train_loss": -7.1569132804870605, "global_step": 183003, "epoch": 4357} {"train_loss": -7.144067764282227, "global_step": 183004, "epoch": 4357} {"train_loss": -7.069474697113037, "global_step": 183005, "epoch": 4357} {"train_loss": -7.019654273986816, "global_step": 183006, "epoch": 4357} {"train_loss": -6.974527359008789, "global_step": 183007, "epoch": 4357} {"train_loss": -7.099834442138672, "global_step": 183008, "epoch": 4357} {"train_loss": -7.085203647613525, "global_step": 183009, "epoch": 4357} {"train_loss": -7.076571464538574, "global_step": 183010, "epoch": 4357} {"train_loss": -7.084809303283691, "global_step": 183011, "epoch": 4357} {"train_loss": -7.208737850189209, "global_step": 183012, "epoch": 4357} {"train_loss": -7.088776111602783, "global_step": 183013, "epoch": 4357} {"train_loss": -7.171202182769775, "global_step": 183014, "epoch": 4357} {"train_loss": -7.153440952301025, "global_step": 183015, "epoch": 4357} {"train_loss": -7.110132217407227, "global_step": 183016, "epoch": 4357} {"train_loss": -7.063388824462891, "global_step": 183017, "epoch": 4357} {"train_loss": -7.159930229187012, "global_step": 183018, "epoch": 4357} {"train_loss": -7.122919082641602, "global_step": 183019, "epoch": 4357} {"train_loss": -7.079624176025391, "global_step": 183020, "epoch": 4357} {"train_loss": -7.132147789001465, "global_step": 183021, "epoch": 4357} {"train_loss": -7.278796195983887, "global_step": 183022, "epoch": 4357} {"train_loss": -7.2139692306518555, "global_step": 183023, "epoch": 4357} {"train_loss": -7.1719818115234375, "global_step": 183024, "epoch": 4357} {"train_loss": -7.14091682434082, "global_step": 183025, "epoch": 4357} {"train_loss": -7.136270999908447, "global_step": 183026, "epoch": 4357} {"train_loss": -7.140406608581543, "global_step": 183027, "epoch": 4357} {"train_loss": -7.122960567474365, "global_step": 183028, "epoch": 4357} {"train_loss": -7.121653079986572, "global_step": 183029, "epoch": 4357} {"train_loss": -7.1629838943481445, "global_step": 183030, "epoch": 4357} {"train_loss": -7.166971206665039, "global_step": 183031, "epoch": 4357} {"train_loss": -6.967931270599365, "global_step": 183032, "epoch": 4357} {"train_loss": -7.128104209899902, "global_step": 183033, "epoch": 4357} {"train_loss": -7.149259090423584, "global_step": 183034, "epoch": 4357} {"train_loss": -7.118237166177659, "global_step": 183035, "epoch": 4357, "val_loss": 68870.375} {"train_loss": -6.999323844909668, "global_step": 183036, "epoch": 4358} {"train_loss": -7.101107597351074, "global_step": 183037, "epoch": 4358} {"train_loss": -7.060683250427246, "global_step": 183038, "epoch": 4358} {"train_loss": -7.085015773773193, "global_step": 183039, "epoch": 4358} {"train_loss": -7.1295928955078125, "global_step": 183040, "epoch": 4358} {"train_loss": -7.1902923583984375, "global_step": 183041, "epoch": 4358} {"train_loss": -7.14593505859375, "global_step": 183042, "epoch": 4358} {"train_loss": -7.275739669799805, "global_step": 183043, "epoch": 4358} {"train_loss": -7.181539535522461, "global_step": 183044, "epoch": 4358} {"train_loss": -7.085289001464844, "global_step": 183045, "epoch": 4358} {"train_loss": -7.2092695236206055, "global_step": 183046, "epoch": 4358} {"train_loss": -7.104292392730713, "global_step": 183047, "epoch": 4358} {"train_loss": -7.123900413513184, "global_step": 183048, "epoch": 4358} {"train_loss": -7.07938814163208, "global_step": 183049, "epoch": 4358} {"train_loss": -7.058561325073242, "global_step": 183050, "epoch": 4358} {"train_loss": -7.052069664001465, "global_step": 183051, "epoch": 4358} {"train_loss": -7.071208953857422, "global_step": 183052, "epoch": 4358} {"train_loss": -7.117480754852295, "global_step": 183053, "epoch": 4358} {"train_loss": -7.19877815246582, "global_step": 183054, "epoch": 4358} {"train_loss": -7.16934871673584, "global_step": 183055, "epoch": 4358} {"train_loss": -7.2409749031066895, "global_step": 183056, "epoch": 4358} {"train_loss": -7.18491268157959, "global_step": 183057, "epoch": 4358} {"train_loss": -7.086857795715332, "global_step": 183058, "epoch": 4358} {"train_loss": -7.021255016326904, "global_step": 183059, "epoch": 4358} {"train_loss": -7.044486045837402, "global_step": 183060, "epoch": 4358} {"train_loss": -7.03706169128418, "global_step": 183061, "epoch": 4358} {"train_loss": -7.076971530914307, "global_step": 183062, "epoch": 4358} {"train_loss": -7.0976457595825195, "global_step": 183063, "epoch": 4358} {"train_loss": -6.985215187072754, "global_step": 183064, "epoch": 4358} {"train_loss": -7.02736759185791, "global_step": 183065, "epoch": 4358} {"train_loss": -7.058879852294922, "global_step": 183066, "epoch": 4358} {"train_loss": -6.956364154815674, "global_step": 183067, "epoch": 4358} {"train_loss": -7.063464164733887, "global_step": 183068, "epoch": 4358} {"train_loss": -7.148354530334473, "global_step": 183069, "epoch": 4358} {"train_loss": -6.918665885925293, "global_step": 183070, "epoch": 4358} {"train_loss": -7.091649055480957, "global_step": 183071, "epoch": 4358} {"train_loss": -7.059530735015869, "global_step": 183072, "epoch": 4358} {"train_loss": -6.995549201965332, "global_step": 183073, "epoch": 4358} {"train_loss": -7.059995651245117, "global_step": 183074, "epoch": 4358} {"train_loss": -7.001343727111816, "global_step": 183075, "epoch": 4358} {"train_loss": -7.036252498626709, "global_step": 183076, "epoch": 4358} {"train_loss": -7.08511445635841, "global_step": 183077, "epoch": 4358, "val_loss": 68764.375} {"train_loss": -7.0562944412231445, "global_step": 183078, "epoch": 4359} {"train_loss": -7.1009979248046875, "global_step": 183079, "epoch": 4359} {"train_loss": -7.152341365814209, "global_step": 183080, "epoch": 4359} {"train_loss": -7.084502220153809, "global_step": 183081, "epoch": 4359} {"train_loss": -7.088680267333984, "global_step": 183082, "epoch": 4359} {"train_loss": -7.01094913482666, "global_step": 183083, "epoch": 4359} {"train_loss": -6.948934555053711, "global_step": 183084, "epoch": 4359} {"train_loss": -7.083216667175293, "global_step": 183085, "epoch": 4359} {"train_loss": -7.104413986206055, "global_step": 183086, "epoch": 4359} {"train_loss": -7.196109771728516, "global_step": 183087, "epoch": 4359} {"train_loss": -7.092054843902588, "global_step": 183088, "epoch": 4359} {"train_loss": -7.038998126983643, "global_step": 183089, "epoch": 4359} {"train_loss": -7.030933380126953, "global_step": 183090, "epoch": 4359} {"train_loss": -7.040862560272217, "global_step": 183091, "epoch": 4359} {"train_loss": -7.076390743255615, "global_step": 183092, "epoch": 4359} {"train_loss": -6.998204231262207, "global_step": 183093, "epoch": 4359} {"train_loss": -7.03668212890625, "global_step": 183094, "epoch": 4359} {"train_loss": -7.162803649902344, "global_step": 183095, "epoch": 4359} {"train_loss": -7.0315937995910645, "global_step": 183096, "epoch": 4359} {"train_loss": -7.017527103424072, "global_step": 183097, "epoch": 4359} {"train_loss": -7.0787153244018555, "global_step": 183098, "epoch": 4359} {"train_loss": -7.031883716583252, "global_step": 183099, "epoch": 4359} {"train_loss": -6.964566707611084, "global_step": 183100, "epoch": 4359} {"train_loss": -7.089893341064453, "global_step": 183101, "epoch": 4359} {"train_loss": -7.055581092834473, "global_step": 183102, "epoch": 4359} {"train_loss": -6.943985939025879, "global_step": 183103, "epoch": 4359} {"train_loss": -6.984330654144287, "global_step": 183104, "epoch": 4359} {"train_loss": -7.077705383300781, "global_step": 183105, "epoch": 4359} {"train_loss": -7.01602840423584, "global_step": 183106, "epoch": 4359} {"train_loss": -7.041515350341797, "global_step": 183107, "epoch": 4359} {"train_loss": -7.020322799682617, "global_step": 183108, "epoch": 4359} {"train_loss": -6.924119472503662, "global_step": 183109, "epoch": 4359} {"train_loss": -6.889404296875, "global_step": 183110, "epoch": 4359} {"train_loss": -7.003006935119629, "global_step": 183111, "epoch": 4359} {"train_loss": -6.988800048828125, "global_step": 183112, "epoch": 4359} {"train_loss": -6.984828472137451, "global_step": 183113, "epoch": 4359} {"train_loss": -7.052699089050293, "global_step": 183114, "epoch": 4359} {"train_loss": -6.975648403167725, "global_step": 183115, "epoch": 4359} {"train_loss": -6.924094200134277, "global_step": 183116, "epoch": 4359} {"train_loss": -6.998960971832275, "global_step": 183117, "epoch": 4359} {"train_loss": -7.092073440551758, "global_step": 183118, "epoch": 4359} {"train_loss": -7.033852758861723, "global_step": 183119, "epoch": 4359, "val_loss": 68883.015625} {"train_loss": -7.002893447875977, "global_step": 183120, "epoch": 4360} {"train_loss": -7.02696418762207, "global_step": 183121, "epoch": 4360} {"train_loss": -7.113644599914551, "global_step": 183122, "epoch": 4360} {"train_loss": -6.952908515930176, "global_step": 183123, "epoch": 4360} {"train_loss": -6.855769157409668, "global_step": 183124, "epoch": 4360} {"train_loss": -7.092750072479248, "global_step": 183125, "epoch": 4360} {"train_loss": -7.083141326904297, "global_step": 183126, "epoch": 4360} {"train_loss": -7.167070388793945, "global_step": 183127, "epoch": 4360} {"train_loss": -7.112575054168701, "global_step": 183128, "epoch": 4360} {"train_loss": -7.130681037902832, "global_step": 183129, "epoch": 4360} {"train_loss": -6.9607415199279785, "global_step": 183130, "epoch": 4360} {"train_loss": -7.086136817932129, "global_step": 183131, "epoch": 4360} {"train_loss": -6.941840171813965, "global_step": 183132, "epoch": 4360} {"train_loss": -7.035830497741699, "global_step": 183133, "epoch": 4360} {"train_loss": -7.086122512817383, "global_step": 183134, "epoch": 4360} {"train_loss": -7.075882911682129, "global_step": 183135, "epoch": 4360} {"train_loss": -7.000389099121094, "global_step": 183136, "epoch": 4360} {"train_loss": -6.993445873260498, "global_step": 183137, "epoch": 4360} {"train_loss": -7.080733299255371, "global_step": 183138, "epoch": 4360} {"train_loss": -7.13123083114624, "global_step": 183139, "epoch": 4360} {"train_loss": -7.142131805419922, "global_step": 183140, "epoch": 4360} {"train_loss": -7.112419128417969, "global_step": 183141, "epoch": 4360} {"train_loss": -7.062286853790283, "global_step": 183142, "epoch": 4360} {"train_loss": -7.092001438140869, "global_step": 183143, "epoch": 4360} {"train_loss": -7.188108921051025, "global_step": 183144, "epoch": 4360} {"train_loss": -7.1096272468566895, "global_step": 183145, "epoch": 4360} {"train_loss": -7.069843769073486, "global_step": 183146, "epoch": 4360} {"train_loss": -7.0844879150390625, "global_step": 183147, "epoch": 4360} {"train_loss": -7.04719352722168, "global_step": 183148, "epoch": 4360} {"train_loss": -7.104682922363281, "global_step": 183149, "epoch": 4360} {"train_loss": -7.076486110687256, "global_step": 183150, "epoch": 4360} {"train_loss": -7.199008941650391, "global_step": 183151, "epoch": 4360} {"train_loss": -7.066159725189209, "global_step": 183152, "epoch": 4360} {"train_loss": -6.998366355895996, "global_step": 183153, "epoch": 4360} {"train_loss": -6.88609504699707, "global_step": 183154, "epoch": 4360} {"train_loss": -7.06552791595459, "global_step": 183155, "epoch": 4360} {"train_loss": -7.084491729736328, "global_step": 183156, "epoch": 4360} {"train_loss": -7.240520477294922, "global_step": 183157, "epoch": 4360} {"train_loss": -7.140993118286133, "global_step": 183158, "epoch": 4360} {"train_loss": -7.075113296508789, "global_step": 183159, "epoch": 4360} {"train_loss": -7.092225551605225, "global_step": 183160, "epoch": 4360} {"train_loss": -7.069139628183274, "global_step": 183161, "epoch": 4360, "val_loss": 68875.8359375} {"train_loss": -7.130056381225586, "global_step": 183162, "epoch": 4361} {"train_loss": -7.168240547180176, "global_step": 183163, "epoch": 4361} {"train_loss": -7.185160160064697, "global_step": 183164, "epoch": 4361} {"train_loss": -7.090212821960449, "global_step": 183165, "epoch": 4361} {"train_loss": -7.067047119140625, "global_step": 183166, "epoch": 4361} {"train_loss": -7.167973518371582, "global_step": 183167, "epoch": 4361} {"train_loss": -6.9907097816467285, "global_step": 183168, "epoch": 4361} {"train_loss": -7.186928749084473, "global_step": 183169, "epoch": 4361} {"train_loss": -7.16560173034668, "global_step": 183170, "epoch": 4361} {"train_loss": -7.07942533493042, "global_step": 183171, "epoch": 4361} {"train_loss": -7.099629878997803, "global_step": 183172, "epoch": 4361} {"train_loss": -7.1194539070129395, "global_step": 183173, "epoch": 4361} {"train_loss": -7.1581854820251465, "global_step": 183174, "epoch": 4361} {"train_loss": -7.110960483551025, "global_step": 183175, "epoch": 4361} {"train_loss": -7.122278213500977, "global_step": 183176, "epoch": 4361} {"train_loss": -7.189701080322266, "global_step": 183177, "epoch": 4361} {"train_loss": -7.215091705322266, "global_step": 183178, "epoch": 4361} {"train_loss": -7.079909324645996, "global_step": 183179, "epoch": 4361} {"train_loss": -7.116706371307373, "global_step": 183180, "epoch": 4361} {"train_loss": -7.0780744552612305, "global_step": 183181, "epoch": 4361} {"train_loss": -7.137138366699219, "global_step": 183182, "epoch": 4361} {"train_loss": -7.139064788818359, "global_step": 183183, "epoch": 4361} {"train_loss": -7.1130523681640625, "global_step": 183184, "epoch": 4361} {"train_loss": -7.207209587097168, "global_step": 183185, "epoch": 4361} {"train_loss": -7.14043664932251, "global_step": 183186, "epoch": 4361} {"train_loss": -7.180820941925049, "global_step": 183187, "epoch": 4361} {"train_loss": -7.204373359680176, "global_step": 183188, "epoch": 4361} {"train_loss": -7.005147933959961, "global_step": 183189, "epoch": 4361} {"train_loss": -7.216291427612305, "global_step": 183190, "epoch": 4361} {"train_loss": -7.118662357330322, "global_step": 183191, "epoch": 4361} {"train_loss": -7.0713791847229, "global_step": 183192, "epoch": 4361} {"train_loss": -7.088152885437012, "global_step": 183193, "epoch": 4361} {"train_loss": -7.13427734375, "global_step": 183194, "epoch": 4361} {"train_loss": -6.964896202087402, "global_step": 183195, "epoch": 4361} {"train_loss": -7.145571708679199, "global_step": 183196, "epoch": 4361} {"train_loss": -7.094888687133789, "global_step": 183197, "epoch": 4361} {"train_loss": -7.082289695739746, "global_step": 183198, "epoch": 4361} {"train_loss": -7.08131217956543, "global_step": 183199, "epoch": 4361} {"train_loss": -7.137850284576416, "global_step": 183200, "epoch": 4361} {"train_loss": -7.071285247802734, "global_step": 183201, "epoch": 4361} {"train_loss": -7.1287336349487305, "global_step": 183202, "epoch": 4361} {"train_loss": -7.1223044622512095, "global_step": 183203, "epoch": 4361, "val_loss": 68746.8984375} {"train_loss": -7.040712356567383, "global_step": 183204, "epoch": 4362} {"train_loss": -6.999261856079102, "global_step": 183205, "epoch": 4362} {"train_loss": -7.183304786682129, "global_step": 183206, "epoch": 4362} {"train_loss": -7.242859840393066, "global_step": 183207, "epoch": 4362} {"train_loss": -7.00929069519043, "global_step": 183208, "epoch": 4362} {"train_loss": -7.141257286071777, "global_step": 183209, "epoch": 4362} {"train_loss": -7.094704627990723, "global_step": 183210, "epoch": 4362} {"train_loss": -7.033441543579102, "global_step": 183211, "epoch": 4362} {"train_loss": -7.124527931213379, "global_step": 183212, "epoch": 4362} {"train_loss": -7.197984218597412, "global_step": 183213, "epoch": 4362} {"train_loss": -7.057530879974365, "global_step": 183214, "epoch": 4362} {"train_loss": -7.108882904052734, "global_step": 183215, "epoch": 4362} {"train_loss": -7.1934709548950195, "global_step": 183216, "epoch": 4362} {"train_loss": -7.028268814086914, "global_step": 183217, "epoch": 4362} {"train_loss": -6.988610744476318, "global_step": 183218, "epoch": 4362} {"train_loss": -6.950941562652588, "global_step": 183219, "epoch": 4362} {"train_loss": -7.103914260864258, "global_step": 183220, "epoch": 4362} {"train_loss": -6.926379680633545, "global_step": 183221, "epoch": 4362} {"train_loss": -6.947639465332031, "global_step": 183222, "epoch": 4362} {"train_loss": -7.055809497833252, "global_step": 183223, "epoch": 4362} {"train_loss": -7.051458358764648, "global_step": 183224, "epoch": 4362} {"train_loss": -6.9356513023376465, "global_step": 183225, "epoch": 4362} {"train_loss": -6.988732814788818, "global_step": 183226, "epoch": 4362} {"train_loss": -7.131991863250732, "global_step": 183227, "epoch": 4362} {"train_loss": -6.906733512878418, "global_step": 183228, "epoch": 4362} {"train_loss": -6.976861476898193, "global_step": 183229, "epoch": 4362} {"train_loss": -7.09426212310791, "global_step": 183230, "epoch": 4362} {"train_loss": -6.968910217285156, "global_step": 183231, "epoch": 4362} {"train_loss": -7.116941452026367, "global_step": 183232, "epoch": 4362} {"train_loss": -7.074993133544922, "global_step": 183233, "epoch": 4362} {"train_loss": -7.046006679534912, "global_step": 183234, "epoch": 4362} {"train_loss": -7.077284336090088, "global_step": 183235, "epoch": 4362} {"train_loss": -7.038339614868164, "global_step": 183236, "epoch": 4362} {"train_loss": -7.012337684631348, "global_step": 183237, "epoch": 4362} {"train_loss": -7.114426612854004, "global_step": 183238, "epoch": 4362} {"train_loss": -7.102207183837891, "global_step": 183239, "epoch": 4362} {"train_loss": -7.033663272857666, "global_step": 183240, "epoch": 4362} {"train_loss": -7.111708641052246, "global_step": 183241, "epoch": 4362} {"train_loss": -7.03338098526001, "global_step": 183242, "epoch": 4362} {"train_loss": -7.146676063537598, "global_step": 183243, "epoch": 4362} {"train_loss": -7.018701553344727, "global_step": 183244, "epoch": 4362} {"train_loss": -7.059199923560733, "global_step": 183245, "epoch": 4362, "val_loss": 68862.9609375} {"train_loss": -6.982783317565918, "global_step": 183246, "epoch": 4363} {"train_loss": -7.1616926193237305, "global_step": 183247, "epoch": 4363} {"train_loss": -7.099703311920166, "global_step": 183248, "epoch": 4363} {"train_loss": -6.975963592529297, "global_step": 183249, "epoch": 4363} {"train_loss": -7.124205589294434, "global_step": 183250, "epoch": 4363} {"train_loss": -7.178955078125, "global_step": 183251, "epoch": 4363} {"train_loss": -7.066439628601074, "global_step": 183252, "epoch": 4363} {"train_loss": -6.963812828063965, "global_step": 183253, "epoch": 4363} {"train_loss": -7.062967300415039, "global_step": 183254, "epoch": 4363} {"train_loss": -7.101501941680908, "global_step": 183255, "epoch": 4363} {"train_loss": -7.086190223693848, "global_step": 183256, "epoch": 4363} {"train_loss": -7.091334342956543, "global_step": 183257, "epoch": 4363} {"train_loss": -6.995268821716309, "global_step": 183258, "epoch": 4363} {"train_loss": -7.102218151092529, "global_step": 183259, "epoch": 4363} {"train_loss": -7.1478271484375, "global_step": 183260, "epoch": 4363} {"train_loss": -7.164506912231445, "global_step": 183261, "epoch": 4363} {"train_loss": -7.080618858337402, "global_step": 183262, "epoch": 4363} {"train_loss": -7.111332893371582, "global_step": 183263, "epoch": 4363} {"train_loss": -7.132877349853516, "global_step": 183264, "epoch": 4363} {"train_loss": -7.201622009277344, "global_step": 183265, "epoch": 4363} {"train_loss": -7.06852912902832, "global_step": 183266, "epoch": 4363} {"train_loss": -7.019923210144043, "global_step": 183267, "epoch": 4363} {"train_loss": -7.101325035095215, "global_step": 183268, "epoch": 4363} {"train_loss": -7.118894577026367, "global_step": 183269, "epoch": 4363} {"train_loss": -7.219606399536133, "global_step": 183270, "epoch": 4363} {"train_loss": -7.108450889587402, "global_step": 183271, "epoch": 4363} {"train_loss": -7.0265583992004395, "global_step": 183272, "epoch": 4363} {"train_loss": -7.128168106079102, "global_step": 183273, "epoch": 4363} {"train_loss": -7.134231090545654, "global_step": 183274, "epoch": 4363} {"train_loss": -7.173178672790527, "global_step": 183275, "epoch": 4363} {"train_loss": -7.152091979980469, "global_step": 183276, "epoch": 4363} {"train_loss": -7.139737129211426, "global_step": 183277, "epoch": 4363} {"train_loss": -7.056013107299805, "global_step": 183278, "epoch": 4363} {"train_loss": -7.167111396789551, "global_step": 183279, "epoch": 4363} {"train_loss": -7.212212562561035, "global_step": 183280, "epoch": 4363} {"train_loss": -7.168612957000732, "global_step": 183281, "epoch": 4363} {"train_loss": -7.014975070953369, "global_step": 183282, "epoch": 4363} {"train_loss": -7.13996696472168, "global_step": 183283, "epoch": 4363} {"train_loss": -7.041782379150391, "global_step": 183284, "epoch": 4363} {"train_loss": -7.078654766082764, "global_step": 183285, "epoch": 4363} {"train_loss": -7.201451301574707, "global_step": 183286, "epoch": 4363} {"train_loss": -7.103678737367902, "global_step": 183287, "epoch": 4363, "val_loss": 68967.5546875} {"train_loss": -7.170470237731934, "global_step": 183288, "epoch": 4364} {"train_loss": -7.093212604522705, "global_step": 183289, "epoch": 4364} {"train_loss": -7.138261795043945, "global_step": 183290, "epoch": 4364} {"train_loss": -7.113772392272949, "global_step": 183291, "epoch": 4364} {"train_loss": -7.0517191886901855, "global_step": 183292, "epoch": 4364} {"train_loss": -7.137539863586426, "global_step": 183293, "epoch": 4364} {"train_loss": -7.0090436935424805, "global_step": 183294, "epoch": 4364} {"train_loss": -7.06180477142334, "global_step": 183295, "epoch": 4364} {"train_loss": -7.238663673400879, "global_step": 183296, "epoch": 4364} {"train_loss": -7.056665420532227, "global_step": 183297, "epoch": 4364} {"train_loss": -7.169611930847168, "global_step": 183298, "epoch": 4364} {"train_loss": -7.104709625244141, "global_step": 183299, "epoch": 4364} {"train_loss": -7.1209797859191895, "global_step": 183300, "epoch": 4364} {"train_loss": -7.096248626708984, "global_step": 183301, "epoch": 4364} {"train_loss": -7.1387939453125, "global_step": 183302, "epoch": 4364} {"train_loss": -7.24639892578125, "global_step": 183303, "epoch": 4364} {"train_loss": -7.187894821166992, "global_step": 183304, "epoch": 4364} {"train_loss": -7.113846778869629, "global_step": 183305, "epoch": 4364} {"train_loss": -7.204578399658203, "global_step": 183306, "epoch": 4364} {"train_loss": -7.068823337554932, "global_step": 183307, "epoch": 4364} {"train_loss": -7.172252655029297, "global_step": 183308, "epoch": 4364} {"train_loss": -7.168404579162598, "global_step": 183309, "epoch": 4364} {"train_loss": -7.12367057800293, "global_step": 183310, "epoch": 4364} {"train_loss": -7.16848087310791, "global_step": 183311, "epoch": 4364} {"train_loss": -7.044449806213379, "global_step": 183312, "epoch": 4364} {"train_loss": -7.046092510223389, "global_step": 183313, "epoch": 4364} {"train_loss": -7.191355228424072, "global_step": 183314, "epoch": 4364} {"train_loss": -7.139311790466309, "global_step": 183315, "epoch": 4364} {"train_loss": -7.154053688049316, "global_step": 183316, "epoch": 4364} {"train_loss": -7.135800361633301, "global_step": 183317, "epoch": 4364} {"train_loss": -7.042168140411377, "global_step": 183318, "epoch": 4364} {"train_loss": -7.0315775871276855, "global_step": 183319, "epoch": 4364} {"train_loss": -7.044728755950928, "global_step": 183320, "epoch": 4364} {"train_loss": -7.092712879180908, "global_step": 183321, "epoch": 4364} {"train_loss": -7.098686695098877, "global_step": 183322, "epoch": 4364} {"train_loss": -7.0794830322265625, "global_step": 183323, "epoch": 4364} {"train_loss": -7.132510185241699, "global_step": 183324, "epoch": 4364} {"train_loss": -7.041979789733887, "global_step": 183325, "epoch": 4364} {"train_loss": -7.057231426239014, "global_step": 183326, "epoch": 4364} {"train_loss": -7.100216388702393, "global_step": 183327, "epoch": 4364} {"train_loss": -7.059169292449951, "global_step": 183328, "epoch": 4364} {"train_loss": -7.1145212309701105, "global_step": 183329, "epoch": 4364, "val_loss": 69036.2421875} {"train_loss": -7.111387729644775, "global_step": 183330, "epoch": 4365} {"train_loss": -7.120160102844238, "global_step": 183331, "epoch": 4365} {"train_loss": -7.160358428955078, "global_step": 183332, "epoch": 4365} {"train_loss": -7.069516181945801, "global_step": 183333, "epoch": 4365} {"train_loss": -7.047828674316406, "global_step": 183334, "epoch": 4365} {"train_loss": -7.092231750488281, "global_step": 183335, "epoch": 4365} {"train_loss": -7.143614768981934, "global_step": 183336, "epoch": 4365} {"train_loss": -7.114437103271484, "global_step": 183337, "epoch": 4365} {"train_loss": -7.178840637207031, "global_step": 183338, "epoch": 4365} {"train_loss": -7.11100959777832, "global_step": 183339, "epoch": 4365} {"train_loss": -7.022967338562012, "global_step": 183340, "epoch": 4365} {"train_loss": -7.174948692321777, "global_step": 183341, "epoch": 4365} {"train_loss": -7.155035972595215, "global_step": 183342, "epoch": 4365} {"train_loss": -7.097969055175781, "global_step": 183343, "epoch": 4365} {"train_loss": -7.1018171310424805, "global_step": 183344, "epoch": 4365} {"train_loss": -7.014875411987305, "global_step": 183345, "epoch": 4365} {"train_loss": -7.176321506500244, "global_step": 183346, "epoch": 4365} {"train_loss": -7.119200229644775, "global_step": 183347, "epoch": 4365} {"train_loss": -6.918931007385254, "global_step": 183348, "epoch": 4365} {"train_loss": -7.075093746185303, "global_step": 183349, "epoch": 4365} {"train_loss": -7.135433197021484, "global_step": 183350, "epoch": 4365} {"train_loss": -6.992799758911133, "global_step": 183351, "epoch": 4365} {"train_loss": -7.113636016845703, "global_step": 183352, "epoch": 4365} {"train_loss": -6.955124855041504, "global_step": 183353, "epoch": 4365} {"train_loss": -7.101289749145508, "global_step": 183354, "epoch": 4365} {"train_loss": -7.067073822021484, "global_step": 183355, "epoch": 4365} {"train_loss": -7.049760818481445, "global_step": 183356, "epoch": 4365} {"train_loss": -7.035839080810547, "global_step": 183357, "epoch": 4365} {"train_loss": -7.041367530822754, "global_step": 183358, "epoch": 4365} {"train_loss": -7.059054374694824, "global_step": 183359, "epoch": 4365} {"train_loss": -7.020026206970215, "global_step": 183360, "epoch": 4365} {"train_loss": -7.067234992980957, "global_step": 183361, "epoch": 4365} {"train_loss": -7.037010669708252, "global_step": 183362, "epoch": 4365} {"train_loss": -7.029618740081787, "global_step": 183363, "epoch": 4365} {"train_loss": -7.055561542510986, "global_step": 183364, "epoch": 4365} {"train_loss": -7.112499713897705, "global_step": 183365, "epoch": 4365} {"train_loss": -7.086742401123047, "global_step": 183366, "epoch": 4365} {"train_loss": -7.142655372619629, "global_step": 183367, "epoch": 4365} {"train_loss": -7.013445854187012, "global_step": 183368, "epoch": 4365} {"train_loss": -7.054292678833008, "global_step": 183369, "epoch": 4365} {"train_loss": -7.222999572753906, "global_step": 183370, "epoch": 4365} {"train_loss": -7.08634817032587, "global_step": 183371, "epoch": 4365, "val_loss": 68744.71875} {"train_loss": -7.0279340744018555, "global_step": 183372, "epoch": 4366} {"train_loss": -7.10224723815918, "global_step": 183373, "epoch": 4366} {"train_loss": -7.012057304382324, "global_step": 183374, "epoch": 4366} {"train_loss": -7.054222106933594, "global_step": 183375, "epoch": 4366} {"train_loss": -6.984305381774902, "global_step": 183376, "epoch": 4366} {"train_loss": -7.062183856964111, "global_step": 183377, "epoch": 4366} {"train_loss": -7.0587663650512695, "global_step": 183378, "epoch": 4366} {"train_loss": -7.063634395599365, "global_step": 183379, "epoch": 4366} {"train_loss": -7.134217262268066, "global_step": 183380, "epoch": 4366} {"train_loss": -7.147204399108887, "global_step": 183381, "epoch": 4366} {"train_loss": -6.972128868103027, "global_step": 183382, "epoch": 4366} {"train_loss": -7.169904708862305, "global_step": 183383, "epoch": 4366} {"train_loss": -6.953235626220703, "global_step": 183384, "epoch": 4366} {"train_loss": -7.130036354064941, "global_step": 183385, "epoch": 4366} {"train_loss": -7.0616841316223145, "global_step": 183386, "epoch": 4366} {"train_loss": -7.00581169128418, "global_step": 183387, "epoch": 4366} {"train_loss": -7.103715419769287, "global_step": 183388, "epoch": 4366} {"train_loss": -7.164050102233887, "global_step": 183389, "epoch": 4366} {"train_loss": -7.032662868499756, "global_step": 183390, "epoch": 4366} {"train_loss": -7.096464157104492, "global_step": 183391, "epoch": 4366} {"train_loss": -7.0482964515686035, "global_step": 183392, "epoch": 4366} {"train_loss": -7.079408168792725, "global_step": 183393, "epoch": 4366} {"train_loss": -7.222591400146484, "global_step": 183394, "epoch": 4366} {"train_loss": -7.100860595703125, "global_step": 183395, "epoch": 4366} {"train_loss": -7.085907936096191, "global_step": 183396, "epoch": 4366} {"train_loss": -7.0351996421813965, "global_step": 183397, "epoch": 4366} {"train_loss": -7.071235656738281, "global_step": 183398, "epoch": 4366} {"train_loss": -7.078921318054199, "global_step": 183399, "epoch": 4366} {"train_loss": -7.093450546264648, "global_step": 183400, "epoch": 4366} {"train_loss": -7.0077691078186035, "global_step": 183401, "epoch": 4366} {"train_loss": -7.098816871643066, "global_step": 183402, "epoch": 4366} {"train_loss": -7.132272720336914, "global_step": 183403, "epoch": 4366} {"train_loss": -7.11744499206543, "global_step": 183404, "epoch": 4366} {"train_loss": -7.2202348709106445, "global_step": 183405, "epoch": 4366} {"train_loss": -7.116684913635254, "global_step": 183406, "epoch": 4366} {"train_loss": -7.120756149291992, "global_step": 183407, "epoch": 4366} {"train_loss": -7.127587795257568, "global_step": 183408, "epoch": 4366} {"train_loss": -7.105429649353027, "global_step": 183409, "epoch": 4366} {"train_loss": -7.21774959564209, "global_step": 183410, "epoch": 4366} {"train_loss": -7.247170925140381, "global_step": 183411, "epoch": 4366} {"train_loss": -7.147793769836426, "global_step": 183412, "epoch": 4366} {"train_loss": -7.094656217665899, "global_step": 183413, "epoch": 4366, "val_loss": 68864.125} {"train_loss": -7.283092975616455, "global_step": 183414, "epoch": 4367} {"train_loss": -7.244095802307129, "global_step": 183415, "epoch": 4367} {"train_loss": -7.170076370239258, "global_step": 183416, "epoch": 4367} {"train_loss": -7.167140007019043, "global_step": 183417, "epoch": 4367} {"train_loss": -7.128786563873291, "global_step": 183418, "epoch": 4367} {"train_loss": -7.325381278991699, "global_step": 183419, "epoch": 4367} {"train_loss": -7.18477725982666, "global_step": 183420, "epoch": 4367} {"train_loss": -7.154272079467773, "global_step": 183421, "epoch": 4367} {"train_loss": -7.073953151702881, "global_step": 183422, "epoch": 4367} {"train_loss": -7.22029972076416, "global_step": 183423, "epoch": 4367} {"train_loss": -7.144866943359375, "global_step": 183424, "epoch": 4367} {"train_loss": -7.1908159255981445, "global_step": 183425, "epoch": 4367} {"train_loss": -7.032898902893066, "global_step": 183426, "epoch": 4367} {"train_loss": -7.1671929359436035, "global_step": 183427, "epoch": 4367} {"train_loss": -7.208608627319336, "global_step": 183428, "epoch": 4367} {"train_loss": -7.058423042297363, "global_step": 183429, "epoch": 4367} {"train_loss": -6.957094192504883, "global_step": 183430, "epoch": 4367} {"train_loss": -6.959959983825684, "global_step": 183431, "epoch": 4367} {"train_loss": -7.043715476989746, "global_step": 183432, "epoch": 4367} {"train_loss": -7.032845497131348, "global_step": 183433, "epoch": 4367} {"train_loss": -7.10772705078125, "global_step": 183434, "epoch": 4367} {"train_loss": -6.992341995239258, "global_step": 183435, "epoch": 4367} {"train_loss": -6.980360984802246, "global_step": 183436, "epoch": 4367} {"train_loss": -7.0831685066223145, "global_step": 183437, "epoch": 4367} {"train_loss": -7.083438873291016, "global_step": 183438, "epoch": 4367} {"train_loss": -7.10399866104126, "global_step": 183439, "epoch": 4367} {"train_loss": -6.920073986053467, "global_step": 183440, "epoch": 4367} {"train_loss": -6.93947696685791, "global_step": 183441, "epoch": 4367} {"train_loss": -7.1353864669799805, "global_step": 183442, "epoch": 4367} {"train_loss": -7.089277744293213, "global_step": 183443, "epoch": 4367} {"train_loss": -7.02281379699707, "global_step": 183444, "epoch": 4367} {"train_loss": -6.963639259338379, "global_step": 183445, "epoch": 4367} {"train_loss": -7.262470245361328, "global_step": 183446, "epoch": 4367} {"train_loss": -7.115751266479492, "global_step": 183447, "epoch": 4367} {"train_loss": -6.992786884307861, "global_step": 183448, "epoch": 4367} {"train_loss": -7.180199146270752, "global_step": 183449, "epoch": 4367} {"train_loss": -6.9621477127075195, "global_step": 183450, "epoch": 4367} {"train_loss": -7.027401924133301, "global_step": 183451, "epoch": 4367} {"train_loss": -7.034369468688965, "global_step": 183452, "epoch": 4367} {"train_loss": -6.983643531799316, "global_step": 183453, "epoch": 4367} {"train_loss": -7.142619609832764, "global_step": 183454, "epoch": 4367} {"train_loss": -7.091388509387062, "global_step": 183455, "epoch": 4367, "val_loss": 68843.6015625} {"train_loss": -7.132025718688965, "global_step": 183456, "epoch": 4368} {"train_loss": -6.9976806640625, "global_step": 183457, "epoch": 4368} {"train_loss": -7.05042839050293, "global_step": 183458, "epoch": 4368} {"train_loss": -7.1649370193481445, "global_step": 183459, "epoch": 4368} {"train_loss": -6.9686665534973145, "global_step": 183460, "epoch": 4368} {"train_loss": -6.983299255371094, "global_step": 183461, "epoch": 4368} {"train_loss": -7.020918369293213, "global_step": 183462, "epoch": 4368} {"train_loss": -7.033414840698242, "global_step": 183463, "epoch": 4368} {"train_loss": -7.004860877990723, "global_step": 183464, "epoch": 4368} {"train_loss": -6.882610321044922, "global_step": 183465, "epoch": 4368} {"train_loss": -7.0850725173950195, "global_step": 183466, "epoch": 4368} {"train_loss": -6.964735507965088, "global_step": 183467, "epoch": 4368} {"train_loss": -7.034224510192871, "global_step": 183468, "epoch": 4368} {"train_loss": -6.8596110343933105, "global_step": 183469, "epoch": 4368} {"train_loss": -6.747057914733887, "global_step": 183470, "epoch": 4368} {"train_loss": -7.045858383178711, "global_step": 183471, "epoch": 4368} {"train_loss": -6.841704845428467, "global_step": 183472, "epoch": 4368} {"train_loss": -6.9945573806762695, "global_step": 183473, "epoch": 4368} {"train_loss": -7.032819747924805, "global_step": 183474, "epoch": 4368} {"train_loss": -6.8826751708984375, "global_step": 183475, "epoch": 4368} {"train_loss": -7.006448745727539, "global_step": 183476, "epoch": 4368} {"train_loss": -6.967310905456543, "global_step": 183477, "epoch": 4368} {"train_loss": -6.9893341064453125, "global_step": 183478, "epoch": 4368} {"train_loss": -7.004444122314453, "global_step": 183479, "epoch": 4368} {"train_loss": -6.929642677307129, "global_step": 183480, "epoch": 4368} {"train_loss": -6.899026870727539, "global_step": 183481, "epoch": 4368} {"train_loss": -7.0514936447143555, "global_step": 183482, "epoch": 4368} {"train_loss": -6.982213973999023, "global_step": 183483, "epoch": 4368} {"train_loss": -6.911928176879883, "global_step": 183484, "epoch": 4368} {"train_loss": -7.084607124328613, "global_step": 183485, "epoch": 4368} {"train_loss": -6.996936798095703, "global_step": 183486, "epoch": 4368} {"train_loss": -6.9950480461120605, "global_step": 183487, "epoch": 4368} {"train_loss": -7.115112781524658, "global_step": 183488, "epoch": 4368} {"train_loss": -7.042819499969482, "global_step": 183489, "epoch": 4368} {"train_loss": -6.962749004364014, "global_step": 183490, "epoch": 4368} {"train_loss": -6.909069061279297, "global_step": 183491, "epoch": 4368} {"train_loss": -7.069589614868164, "global_step": 183492, "epoch": 4368} {"train_loss": -6.875439643859863, "global_step": 183493, "epoch": 4368} {"train_loss": -6.926509380340576, "global_step": 183494, "epoch": 4368} {"train_loss": -7.004843711853027, "global_step": 183495, "epoch": 4368} {"train_loss": -7.013823509216309, "global_step": 183496, "epoch": 4368} {"train_loss": -6.988739728927612, "global_step": 183497, "epoch": 4368, "val_loss": 68843.9609375} {"train_loss": -6.9788994789123535, "global_step": 183498, "epoch": 4369} {"train_loss": -7.050692558288574, "global_step": 183499, "epoch": 4369} {"train_loss": -6.947783470153809, "global_step": 183500, "epoch": 4369} {"train_loss": -7.055702209472656, "global_step": 183501, "epoch": 4369} {"train_loss": -6.956877708435059, "global_step": 183502, "epoch": 4369} {"train_loss": -7.138266563415527, "global_step": 183503, "epoch": 4369} {"train_loss": -6.99597692489624, "global_step": 183504, "epoch": 4369} {"train_loss": -6.849359512329102, "global_step": 183505, "epoch": 4369} {"train_loss": -6.991983413696289, "global_step": 183506, "epoch": 4369} {"train_loss": -7.00435733795166, "global_step": 183507, "epoch": 4369} {"train_loss": -7.013354778289795, "global_step": 183508, "epoch": 4369} {"train_loss": -7.096902847290039, "global_step": 183509, "epoch": 4369} {"train_loss": -7.002012252807617, "global_step": 183510, "epoch": 4369} {"train_loss": -7.059935569763184, "global_step": 183511, "epoch": 4369} {"train_loss": -7.094354629516602, "global_step": 183512, "epoch": 4369} {"train_loss": -7.056192874908447, "global_step": 183513, "epoch": 4369} {"train_loss": -7.065672874450684, "global_step": 183514, "epoch": 4369} {"train_loss": -7.101203441619873, "global_step": 183515, "epoch": 4369} {"train_loss": -7.069437026977539, "global_step": 183516, "epoch": 4369} {"train_loss": -7.09065055847168, "global_step": 183517, "epoch": 4369} {"train_loss": -7.043188571929932, "global_step": 183518, "epoch": 4369} {"train_loss": -7.107247352600098, "global_step": 183519, "epoch": 4369} {"train_loss": -7.082958221435547, "global_step": 183520, "epoch": 4369} {"train_loss": -7.0081610679626465, "global_step": 183521, "epoch": 4369} {"train_loss": -7.094094753265381, "global_step": 183522, "epoch": 4369} {"train_loss": -7.094768524169922, "global_step": 183523, "epoch": 4369} {"train_loss": -7.214982986450195, "global_step": 183524, "epoch": 4369} {"train_loss": -7.095078468322754, "global_step": 183525, "epoch": 4369} {"train_loss": -7.152735710144043, "global_step": 183526, "epoch": 4369} {"train_loss": -7.132260322570801, "global_step": 183527, "epoch": 4369} {"train_loss": -7.16741943359375, "global_step": 183528, "epoch": 4369} {"train_loss": -7.170180320739746, "global_step": 183529, "epoch": 4369} {"train_loss": -7.146482467651367, "global_step": 183530, "epoch": 4369} {"train_loss": -7.0893025398254395, "global_step": 183531, "epoch": 4369} {"train_loss": -7.197546005249023, "global_step": 183532, "epoch": 4369} {"train_loss": -7.164855003356934, "global_step": 183533, "epoch": 4369} {"train_loss": -7.068730354309082, "global_step": 183534, "epoch": 4369} {"train_loss": -7.130411624908447, "global_step": 183535, "epoch": 4369} {"train_loss": -7.171820640563965, "global_step": 183536, "epoch": 4369} {"train_loss": -7.127722263336182, "global_step": 183537, "epoch": 4369} {"train_loss": -7.240683555603027, "global_step": 183538, "epoch": 4369} {"train_loss": -7.0802894206274125, "global_step": 183539, "epoch": 4369, "val_loss": 68665.3515625} {"train_loss": -7.140485763549805, "global_step": 183540, "epoch": 4370} {"train_loss": -7.0971879959106445, "global_step": 183541, "epoch": 4370} {"train_loss": -7.090915203094482, "global_step": 183542, "epoch": 4370} {"train_loss": -7.137375831604004, "global_step": 183543, "epoch": 4370} {"train_loss": -7.207921028137207, "global_step": 183544, "epoch": 4370} {"train_loss": -7.086334228515625, "global_step": 183545, "epoch": 4370} {"train_loss": -7.143505096435547, "global_step": 183546, "epoch": 4370} {"train_loss": -7.126406669616699, "global_step": 183547, "epoch": 4370} {"train_loss": -7.170284271240234, "global_step": 183548, "epoch": 4370} {"train_loss": -7.084527492523193, "global_step": 183549, "epoch": 4370} {"train_loss": -7.15418815612793, "global_step": 183550, "epoch": 4370} {"train_loss": -7.144626140594482, "global_step": 183551, "epoch": 4370} {"train_loss": -7.21177339553833, "global_step": 183552, "epoch": 4370} {"train_loss": -7.103721618652344, "global_step": 183553, "epoch": 4370} {"train_loss": -7.057186603546143, "global_step": 183554, "epoch": 4370} {"train_loss": -7.058623790740967, "global_step": 183555, "epoch": 4370} {"train_loss": -7.196990966796875, "global_step": 183556, "epoch": 4370} {"train_loss": -7.110912322998047, "global_step": 183557, "epoch": 4370} {"train_loss": -7.083352565765381, "global_step": 183558, "epoch": 4370} {"train_loss": -7.167366981506348, "global_step": 183559, "epoch": 4370} {"train_loss": -7.220025062561035, "global_step": 183560, "epoch": 4370} {"train_loss": -7.244144439697266, "global_step": 183561, "epoch": 4370} {"train_loss": -7.211881637573242, "global_step": 183562, "epoch": 4370} {"train_loss": -7.123230457305908, "global_step": 183563, "epoch": 4370} {"train_loss": -7.105376720428467, "global_step": 183564, "epoch": 4370} {"train_loss": -7.097711086273193, "global_step": 183565, "epoch": 4370} {"train_loss": -7.0881147384643555, "global_step": 183566, "epoch": 4370} {"train_loss": -7.043138027191162, "global_step": 183567, "epoch": 4370} {"train_loss": -7.132551670074463, "global_step": 183568, "epoch": 4370} {"train_loss": -7.197075843811035, "global_step": 183569, "epoch": 4370} {"train_loss": -7.035650253295898, "global_step": 183570, "epoch": 4370} {"train_loss": -7.032015800476074, "global_step": 183571, "epoch": 4370} {"train_loss": -7.2243828773498535, "global_step": 183572, "epoch": 4370} {"train_loss": -7.155920028686523, "global_step": 183573, "epoch": 4370} {"train_loss": -7.06037712097168, "global_step": 183574, "epoch": 4370} {"train_loss": -7.128045082092285, "global_step": 183575, "epoch": 4370} {"train_loss": -7.106090068817139, "global_step": 183576, "epoch": 4370} {"train_loss": -7.033823013305664, "global_step": 183577, "epoch": 4370} {"train_loss": -7.072752475738525, "global_step": 183578, "epoch": 4370} {"train_loss": -7.080961227416992, "global_step": 183579, "epoch": 4370} {"train_loss": -7.13585901260376, "global_step": 183580, "epoch": 4370} {"train_loss": -7.124030726296561, "global_step": 183581, "epoch": 4370, "val_loss": 68925.7109375} {"train_loss": -7.1248931884765625, "global_step": 183582, "epoch": 4371} {"train_loss": -7.040864944458008, "global_step": 183583, "epoch": 4371} {"train_loss": -7.122941017150879, "global_step": 183584, "epoch": 4371} {"train_loss": -7.074074745178223, "global_step": 183585, "epoch": 4371} {"train_loss": -7.024299621582031, "global_step": 183586, "epoch": 4371} {"train_loss": -7.006091594696045, "global_step": 183587, "epoch": 4371} {"train_loss": -7.147272109985352, "global_step": 183588, "epoch": 4371} {"train_loss": -7.104987621307373, "global_step": 183589, "epoch": 4371} {"train_loss": -7.024524688720703, "global_step": 183590, "epoch": 4371} {"train_loss": -7.11610221862793, "global_step": 183591, "epoch": 4371} {"train_loss": -6.9654412269592285, "global_step": 183592, "epoch": 4371} {"train_loss": -7.18421745300293, "global_step": 183593, "epoch": 4371} {"train_loss": -7.107903480529785, "global_step": 183594, "epoch": 4371} {"train_loss": -6.9905686378479, "global_step": 183595, "epoch": 4371} {"train_loss": -7.2139763832092285, "global_step": 183596, "epoch": 4371} {"train_loss": -7.0068817138671875, "global_step": 183597, "epoch": 4371} {"train_loss": -7.1181464195251465, "global_step": 183598, "epoch": 4371} {"train_loss": -7.120155334472656, "global_step": 183599, "epoch": 4371} {"train_loss": -7.053438186645508, "global_step": 183600, "epoch": 4371} {"train_loss": -7.184317588806152, "global_step": 183601, "epoch": 4371} {"train_loss": -7.046687126159668, "global_step": 183602, "epoch": 4371} {"train_loss": -7.0998640060424805, "global_step": 183603, "epoch": 4371} {"train_loss": -7.142267227172852, "global_step": 183604, "epoch": 4371} {"train_loss": -7.111808776855469, "global_step": 183605, "epoch": 4371} {"train_loss": -7.145488739013672, "global_step": 183606, "epoch": 4371} {"train_loss": -7.020527362823486, "global_step": 183607, "epoch": 4371} {"train_loss": -7.085112571716309, "global_step": 183608, "epoch": 4371} {"train_loss": -7.092113494873047, "global_step": 183609, "epoch": 4371} {"train_loss": -7.012209892272949, "global_step": 183610, "epoch": 4371} {"train_loss": -7.125914573669434, "global_step": 183611, "epoch": 4371} {"train_loss": -6.925121784210205, "global_step": 183612, "epoch": 4371} {"train_loss": -7.168332576751709, "global_step": 183613, "epoch": 4371} {"train_loss": -7.170958995819092, "global_step": 183614, "epoch": 4371} {"train_loss": -6.904448986053467, "global_step": 183615, "epoch": 4371} {"train_loss": -7.149466514587402, "global_step": 183616, "epoch": 4371} {"train_loss": -7.0718817710876465, "global_step": 183617, "epoch": 4371} {"train_loss": -7.050978183746338, "global_step": 183618, "epoch": 4371} {"train_loss": -7.127191543579102, "global_step": 183619, "epoch": 4371} {"train_loss": -7.05904483795166, "global_step": 183620, "epoch": 4371} {"train_loss": -6.898385047912598, "global_step": 183621, "epoch": 4371} {"train_loss": -7.090261459350586, "global_step": 183622, "epoch": 4371} {"train_loss": -7.07640738714309, "global_step": 183623, "epoch": 4371, "val_loss": 68738.28125} {"train_loss": -6.955508232116699, "global_step": 183624, "epoch": 4372} {"train_loss": -7.019670486450195, "global_step": 183625, "epoch": 4372} {"train_loss": -7.014164447784424, "global_step": 183626, "epoch": 4372} {"train_loss": -7.03596305847168, "global_step": 183627, "epoch": 4372} {"train_loss": -7.008963584899902, "global_step": 183628, "epoch": 4372} {"train_loss": -7.039945602416992, "global_step": 183629, "epoch": 4372} {"train_loss": -6.840941429138184, "global_step": 183630, "epoch": 4372} {"train_loss": -7.050965309143066, "global_step": 183631, "epoch": 4372} {"train_loss": -6.792665958404541, "global_step": 183632, "epoch": 4372} {"train_loss": -7.07064962387085, "global_step": 183633, "epoch": 4372} {"train_loss": -7.017798900604248, "global_step": 183634, "epoch": 4372} {"train_loss": -6.881600856781006, "global_step": 183635, "epoch": 4372} {"train_loss": -7.103889465332031, "global_step": 183636, "epoch": 4372} {"train_loss": -7.042294979095459, "global_step": 183637, "epoch": 4372} {"train_loss": -7.001456260681152, "global_step": 183638, "epoch": 4372} {"train_loss": -6.978342056274414, "global_step": 183639, "epoch": 4372} {"train_loss": -7.089893341064453, "global_step": 183640, "epoch": 4372} {"train_loss": -6.953686714172363, "global_step": 183641, "epoch": 4372} {"train_loss": -6.914470195770264, "global_step": 183642, "epoch": 4372} {"train_loss": -6.895602226257324, "global_step": 183643, "epoch": 4372} {"train_loss": -6.970892429351807, "global_step": 183644, "epoch": 4372} {"train_loss": -6.957239151000977, "global_step": 183645, "epoch": 4372} {"train_loss": -6.811797142028809, "global_step": 183646, "epoch": 4372} {"train_loss": -6.9404191970825195, "global_step": 183647, "epoch": 4372} {"train_loss": -6.915521144866943, "global_step": 183648, "epoch": 4372} {"train_loss": -7.044775485992432, "global_step": 183649, "epoch": 4372} {"train_loss": -6.949462890625, "global_step": 183650, "epoch": 4372} {"train_loss": -6.981592178344727, "global_step": 183651, "epoch": 4372} {"train_loss": -7.042877674102783, "global_step": 183652, "epoch": 4372} {"train_loss": -7.04286003112793, "global_step": 183653, "epoch": 4372} {"train_loss": -6.893368721008301, "global_step": 183654, "epoch": 4372} {"train_loss": -7.031760215759277, "global_step": 183655, "epoch": 4372} {"train_loss": -6.907894134521484, "global_step": 183656, "epoch": 4372} {"train_loss": -7.06838321685791, "global_step": 183657, "epoch": 4372} {"train_loss": -7.056021690368652, "global_step": 183658, "epoch": 4372} {"train_loss": -6.997009754180908, "global_step": 183659, "epoch": 4372} {"train_loss": -7.036655426025391, "global_step": 183660, "epoch": 4372} {"train_loss": -7.031146049499512, "global_step": 183661, "epoch": 4372} {"train_loss": -7.076284408569336, "global_step": 183662, "epoch": 4372} {"train_loss": -6.942722320556641, "global_step": 183663, "epoch": 4372} {"train_loss": -7.163359642028809, "global_step": 183664, "epoch": 4372} {"train_loss": -6.990418445496332, "global_step": 183665, "epoch": 4372, "val_loss": 68771.734375} {"train_loss": -7.103805065155029, "global_step": 183666, "epoch": 4373} {"train_loss": -7.135926246643066, "global_step": 183667, "epoch": 4373} {"train_loss": -7.096055507659912, "global_step": 183668, "epoch": 4373} {"train_loss": -7.061941146850586, "global_step": 183669, "epoch": 4373} {"train_loss": -6.991912841796875, "global_step": 183670, "epoch": 4373} {"train_loss": -7.211219310760498, "global_step": 183671, "epoch": 4373} {"train_loss": -7.0938825607299805, "global_step": 183672, "epoch": 4373} {"train_loss": -7.058946132659912, "global_step": 183673, "epoch": 4373} {"train_loss": -7.138857841491699, "global_step": 183674, "epoch": 4373} {"train_loss": -7.127444267272949, "global_step": 183675, "epoch": 4373} {"train_loss": -7.123973369598389, "global_step": 183676, "epoch": 4373} {"train_loss": -7.109640121459961, "global_step": 183677, "epoch": 4373} {"train_loss": -7.152304649353027, "global_step": 183678, "epoch": 4373} {"train_loss": -7.041518688201904, "global_step": 183679, "epoch": 4373} {"train_loss": -7.092307090759277, "global_step": 183680, "epoch": 4373} {"train_loss": -7.087124824523926, "global_step": 183681, "epoch": 4373} {"train_loss": -7.1363525390625, "global_step": 183682, "epoch": 4373} {"train_loss": -7.1060590744018555, "global_step": 183683, "epoch": 4373} {"train_loss": -6.982113361358643, "global_step": 183684, "epoch": 4373} {"train_loss": -7.071829795837402, "global_step": 183685, "epoch": 4373} {"train_loss": -7.011389255523682, "global_step": 183686, "epoch": 4373} {"train_loss": -7.099970817565918, "global_step": 183687, "epoch": 4373} {"train_loss": -7.070444107055664, "global_step": 183688, "epoch": 4373} {"train_loss": -7.12928581237793, "global_step": 183689, "epoch": 4373} {"train_loss": -7.073553085327148, "global_step": 183690, "epoch": 4373} {"train_loss": -7.113867282867432, "global_step": 183691, "epoch": 4373} {"train_loss": -7.030885219573975, "global_step": 183692, "epoch": 4373} {"train_loss": -7.161301612854004, "global_step": 183693, "epoch": 4373} {"train_loss": -7.177355766296387, "global_step": 183694, "epoch": 4373} {"train_loss": -7.108378887176514, "global_step": 183695, "epoch": 4373} {"train_loss": -7.096202373504639, "global_step": 183696, "epoch": 4373} {"train_loss": -7.0043439865112305, "global_step": 183697, "epoch": 4373} {"train_loss": -7.0903520584106445, "global_step": 183698, "epoch": 4373} {"train_loss": -6.965167999267578, "global_step": 183699, "epoch": 4373} {"train_loss": -7.091192245483398, "global_step": 183700, "epoch": 4373} {"train_loss": -7.092643737792969, "global_step": 183701, "epoch": 4373} {"train_loss": -7.119168758392334, "global_step": 183702, "epoch": 4373} {"train_loss": -7.111064434051514, "global_step": 183703, "epoch": 4373} {"train_loss": -7.051790237426758, "global_step": 183704, "epoch": 4373} {"train_loss": -7.183535575866699, "global_step": 183705, "epoch": 4373} {"train_loss": -7.181571006774902, "global_step": 183706, "epoch": 4373} {"train_loss": -7.093211900620234, "global_step": 183707, "epoch": 4373, "val_loss": 68672.421875} {"train_loss": -7.081703186035156, "global_step": 183708, "epoch": 4374} {"train_loss": -7.059139251708984, "global_step": 183709, "epoch": 4374} {"train_loss": -7.124566078186035, "global_step": 183710, "epoch": 4374} {"train_loss": -7.06313419342041, "global_step": 183711, "epoch": 4374} {"train_loss": -7.150286674499512, "global_step": 183712, "epoch": 4374} {"train_loss": -7.06028938293457, "global_step": 183713, "epoch": 4374} {"train_loss": -7.112733840942383, "global_step": 183714, "epoch": 4374} {"train_loss": -7.116513729095459, "global_step": 183715, "epoch": 4374} {"train_loss": -7.029388427734375, "global_step": 183716, "epoch": 4374} {"train_loss": -7.091944694519043, "global_step": 183717, "epoch": 4374} {"train_loss": -7.059781074523926, "global_step": 183718, "epoch": 4374} {"train_loss": -7.037951469421387, "global_step": 183719, "epoch": 4374} {"train_loss": -7.154916763305664, "global_step": 183720, "epoch": 4374} {"train_loss": -7.143556594848633, "global_step": 183721, "epoch": 4374} {"train_loss": -7.015223026275635, "global_step": 183722, "epoch": 4374} {"train_loss": -7.1690568923950195, "global_step": 183723, "epoch": 4374} {"train_loss": -7.088567733764648, "global_step": 183724, "epoch": 4374} {"train_loss": -7.0941901206970215, "global_step": 183725, "epoch": 4374} {"train_loss": -7.222329139709473, "global_step": 183726, "epoch": 4374} {"train_loss": -7.050498008728027, "global_step": 183727, "epoch": 4374} {"train_loss": -7.2477593421936035, "global_step": 183728, "epoch": 4374} {"train_loss": -7.108386993408203, "global_step": 183729, "epoch": 4374} {"train_loss": -7.129765510559082, "global_step": 183730, "epoch": 4374} {"train_loss": -7.174400806427002, "global_step": 183731, "epoch": 4374} {"train_loss": -7.130570888519287, "global_step": 183732, "epoch": 4374} {"train_loss": -7.145084381103516, "global_step": 183733, "epoch": 4374} {"train_loss": -7.1267595291137695, "global_step": 183734, "epoch": 4374} {"train_loss": -7.168570518493652, "global_step": 183735, "epoch": 4374} {"train_loss": -7.163478374481201, "global_step": 183736, "epoch": 4374} {"train_loss": -7.194738388061523, "global_step": 183737, "epoch": 4374} {"train_loss": -7.188201904296875, "global_step": 183738, "epoch": 4374} {"train_loss": -7.010875701904297, "global_step": 183739, "epoch": 4374} {"train_loss": -7.103760719299316, "global_step": 183740, "epoch": 4374} {"train_loss": -7.047126293182373, "global_step": 183741, "epoch": 4374} {"train_loss": -7.0800676345825195, "global_step": 183742, "epoch": 4374} {"train_loss": -7.079131603240967, "global_step": 183743, "epoch": 4374} {"train_loss": -7.011924743652344, "global_step": 183744, "epoch": 4374} {"train_loss": -7.136700630187988, "global_step": 183745, "epoch": 4374} {"train_loss": -7.094371795654297, "global_step": 183746, "epoch": 4374} {"train_loss": -6.977894306182861, "global_step": 183747, "epoch": 4374} {"train_loss": -7.073895454406738, "global_step": 183748, "epoch": 4374} {"train_loss": -7.105076926095145, "global_step": 183749, "epoch": 4374, "val_loss": 68829.4921875} {"train_loss": -7.046189308166504, "global_step": 183750, "epoch": 4375} {"train_loss": -7.180970668792725, "global_step": 183751, "epoch": 4375} {"train_loss": -7.136425018310547, "global_step": 183752, "epoch": 4375} {"train_loss": -6.979793548583984, "global_step": 183753, "epoch": 4375} {"train_loss": -7.128790855407715, "global_step": 183754, "epoch": 4375} {"train_loss": -7.135996341705322, "global_step": 183755, "epoch": 4375} {"train_loss": -7.047595977783203, "global_step": 183756, "epoch": 4375} {"train_loss": -6.990833759307861, "global_step": 183757, "epoch": 4375} {"train_loss": -7.010948657989502, "global_step": 183758, "epoch": 4375} {"train_loss": -7.048666000366211, "global_step": 183759, "epoch": 4375} {"train_loss": -7.179987907409668, "global_step": 183760, "epoch": 4375} {"train_loss": -6.906294822692871, "global_step": 183761, "epoch": 4375} {"train_loss": -7.035038948059082, "global_step": 183762, "epoch": 4375} {"train_loss": -7.024758338928223, "global_step": 183763, "epoch": 4375} {"train_loss": -6.852717399597168, "global_step": 183764, "epoch": 4375} {"train_loss": -6.941132545471191, "global_step": 183765, "epoch": 4375} {"train_loss": -7.1092634201049805, "global_step": 183766, "epoch": 4375} {"train_loss": -6.930132865905762, "global_step": 183767, "epoch": 4375} {"train_loss": -6.922060012817383, "global_step": 183768, "epoch": 4375} {"train_loss": -7.037486553192139, "global_step": 183769, "epoch": 4375} {"train_loss": -6.9567484855651855, "global_step": 183770, "epoch": 4375} {"train_loss": -7.017945289611816, "global_step": 183771, "epoch": 4375} {"train_loss": -7.0280046463012695, "global_step": 183772, "epoch": 4375} {"train_loss": -7.018290996551514, "global_step": 183773, "epoch": 4375} {"train_loss": -7.081545829772949, "global_step": 183774, "epoch": 4375} {"train_loss": -7.056651592254639, "global_step": 183775, "epoch": 4375} {"train_loss": -7.048812389373779, "global_step": 183776, "epoch": 4375} {"train_loss": -6.9524335861206055, "global_step": 183777, "epoch": 4375} {"train_loss": -7.000566482543945, "global_step": 183778, "epoch": 4375} {"train_loss": -6.906134128570557, "global_step": 183779, "epoch": 4375} {"train_loss": -7.095977306365967, "global_step": 183780, "epoch": 4375} {"train_loss": -7.027679920196533, "global_step": 183781, "epoch": 4375} {"train_loss": -7.0074462890625, "global_step": 183782, "epoch": 4375} {"train_loss": -7.022976875305176, "global_step": 183783, "epoch": 4375} {"train_loss": -6.956151962280273, "global_step": 183784, "epoch": 4375} {"train_loss": -6.9865570068359375, "global_step": 183785, "epoch": 4375} {"train_loss": -7.019386291503906, "global_step": 183786, "epoch": 4375} {"train_loss": -7.131037712097168, "global_step": 183787, "epoch": 4375} {"train_loss": -7.026275634765625, "global_step": 183788, "epoch": 4375} {"train_loss": -6.970699310302734, "global_step": 183789, "epoch": 4375} {"train_loss": -7.05112361907959, "global_step": 183790, "epoch": 4375} {"train_loss": -7.026146071297782, "global_step": 183791, "epoch": 4375, "val_loss": 68895.8984375} {"train_loss": -7.03717565536499, "global_step": 183792, "epoch": 4376} {"train_loss": -6.979665756225586, "global_step": 183793, "epoch": 4376} {"train_loss": -7.108900547027588, "global_step": 183794, "epoch": 4376} {"train_loss": -7.022009372711182, "global_step": 183795, "epoch": 4376} {"train_loss": -6.897073745727539, "global_step": 183796, "epoch": 4376} {"train_loss": -7.019114017486572, "global_step": 183797, "epoch": 4376} {"train_loss": -7.119356632232666, "global_step": 183798, "epoch": 4376} {"train_loss": -6.9291486740112305, "global_step": 183799, "epoch": 4376} {"train_loss": -7.064655780792236, "global_step": 183800, "epoch": 4376} {"train_loss": -7.0430378913879395, "global_step": 183801, "epoch": 4376} {"train_loss": -6.950514793395996, "global_step": 183802, "epoch": 4376} {"train_loss": -7.1023149490356445, "global_step": 183803, "epoch": 4376} {"train_loss": -7.0834245681762695, "global_step": 183804, "epoch": 4376} {"train_loss": -6.982365608215332, "global_step": 183805, "epoch": 4376} {"train_loss": -7.09866189956665, "global_step": 183806, "epoch": 4376} {"train_loss": -6.910491943359375, "global_step": 183807, "epoch": 4376} {"train_loss": -7.09784460067749, "global_step": 183808, "epoch": 4376} {"train_loss": -6.987330436706543, "global_step": 183809, "epoch": 4376} {"train_loss": -7.128413200378418, "global_step": 183810, "epoch": 4376} {"train_loss": -7.203957557678223, "global_step": 183811, "epoch": 4376} {"train_loss": -6.951207160949707, "global_step": 183812, "epoch": 4376} {"train_loss": -7.118407726287842, "global_step": 183813, "epoch": 4376} {"train_loss": -6.950007438659668, "global_step": 183814, "epoch": 4376} {"train_loss": -6.948890686035156, "global_step": 183815, "epoch": 4376} {"train_loss": -7.130226135253906, "global_step": 183816, "epoch": 4376} {"train_loss": -7.0422210693359375, "global_step": 183817, "epoch": 4376} {"train_loss": -7.194506645202637, "global_step": 183818, "epoch": 4376} {"train_loss": -7.0295186042785645, "global_step": 183819, "epoch": 4376} {"train_loss": -6.941727638244629, "global_step": 183820, "epoch": 4376} {"train_loss": -7.130311012268066, "global_step": 183821, "epoch": 4376} {"train_loss": -7.069169998168945, "global_step": 183822, "epoch": 4376} {"train_loss": -7.037785530090332, "global_step": 183823, "epoch": 4376} {"train_loss": -7.057674407958984, "global_step": 183824, "epoch": 4376} {"train_loss": -7.172256946563721, "global_step": 183825, "epoch": 4376} {"train_loss": -7.190124988555908, "global_step": 183826, "epoch": 4376} {"train_loss": -7.225090026855469, "global_step": 183827, "epoch": 4376} {"train_loss": -7.16909122467041, "global_step": 183828, "epoch": 4376} {"train_loss": -7.136794090270996, "global_step": 183829, "epoch": 4376} {"train_loss": -7.0113091468811035, "global_step": 183830, "epoch": 4376} {"train_loss": -7.117069244384766, "global_step": 183831, "epoch": 4376} {"train_loss": -7.070560932159424, "global_step": 183832, "epoch": 4376} {"train_loss": -7.057913076309931, "global_step": 183833, "epoch": 4376, "val_loss": 68780.578125} {"train_loss": -7.16975212097168, "global_step": 183834, "epoch": 4377} {"train_loss": -6.998876571655273, "global_step": 183835, "epoch": 4377} {"train_loss": -7.113216400146484, "global_step": 183836, "epoch": 4377} {"train_loss": -7.133245944976807, "global_step": 183837, "epoch": 4377} {"train_loss": -7.061166763305664, "global_step": 183838, "epoch": 4377} {"train_loss": -7.177553176879883, "global_step": 183839, "epoch": 4377} {"train_loss": -7.142400741577148, "global_step": 183840, "epoch": 4377} {"train_loss": -7.105072498321533, "global_step": 183841, "epoch": 4377} {"train_loss": -7.103333473205566, "global_step": 183842, "epoch": 4377} {"train_loss": -7.06634521484375, "global_step": 183843, "epoch": 4377} {"train_loss": -7.1649041175842285, "global_step": 183844, "epoch": 4377} {"train_loss": -7.099250316619873, "global_step": 183845, "epoch": 4377} {"train_loss": -7.169899940490723, "global_step": 183846, "epoch": 4377} {"train_loss": -7.044577121734619, "global_step": 183847, "epoch": 4377} {"train_loss": -7.140974998474121, "global_step": 183848, "epoch": 4377} {"train_loss": -7.259659290313721, "global_step": 183849, "epoch": 4377} {"train_loss": -7.2351393699646, "global_step": 183850, "epoch": 4377} {"train_loss": -7.079584121704102, "global_step": 183851, "epoch": 4377} {"train_loss": -7.110123634338379, "global_step": 183852, "epoch": 4377} {"train_loss": -7.195820331573486, "global_step": 183853, "epoch": 4377} {"train_loss": -7.129397869110107, "global_step": 183854, "epoch": 4377} {"train_loss": -7.135858058929443, "global_step": 183855, "epoch": 4377} {"train_loss": -7.167579174041748, "global_step": 183856, "epoch": 4377} {"train_loss": -7.146945476531982, "global_step": 183857, "epoch": 4377} {"train_loss": -7.068146228790283, "global_step": 183858, "epoch": 4377} {"train_loss": -7.122281074523926, "global_step": 183859, "epoch": 4377} {"train_loss": -7.2684326171875, "global_step": 183860, "epoch": 4377} {"train_loss": -7.119638442993164, "global_step": 183861, "epoch": 4377} {"train_loss": -7.172717094421387, "global_step": 183862, "epoch": 4377} {"train_loss": -7.143468856811523, "global_step": 183863, "epoch": 4377} {"train_loss": -7.054165840148926, "global_step": 183864, "epoch": 4377} {"train_loss": -7.208949089050293, "global_step": 183865, "epoch": 4377} {"train_loss": -7.056985855102539, "global_step": 183866, "epoch": 4377} {"train_loss": -7.109635353088379, "global_step": 183867, "epoch": 4377} {"train_loss": -7.136897087097168, "global_step": 183868, "epoch": 4377} {"train_loss": -7.064823150634766, "global_step": 183869, "epoch": 4377} {"train_loss": -7.080711364746094, "global_step": 183870, "epoch": 4377} {"train_loss": -7.063046455383301, "global_step": 183871, "epoch": 4377} {"train_loss": -7.132090091705322, "global_step": 183872, "epoch": 4377} {"train_loss": -7.092366695404053, "global_step": 183873, "epoch": 4377} {"train_loss": -7.190999984741211, "global_step": 183874, "epoch": 4377} {"train_loss": -7.126243216650827, "global_step": 183875, "epoch": 4377, "val_loss": 68772.46875} {"train_loss": -7.098173141479492, "global_step": 183876, "epoch": 4378} {"train_loss": -7.080603122711182, "global_step": 183877, "epoch": 4378} {"train_loss": -6.923699378967285, "global_step": 183878, "epoch": 4378} {"train_loss": -7.071084976196289, "global_step": 183879, "epoch": 4378} {"train_loss": -7.284885883331299, "global_step": 183880, "epoch": 4378} {"train_loss": -7.134117126464844, "global_step": 183881, "epoch": 4378} {"train_loss": -7.010136604309082, "global_step": 183882, "epoch": 4378} {"train_loss": -7.125967025756836, "global_step": 183883, "epoch": 4378} {"train_loss": -6.943633079528809, "global_step": 183884, "epoch": 4378} {"train_loss": -6.85133695602417, "global_step": 183885, "epoch": 4378} {"train_loss": -6.96817684173584, "global_step": 183886, "epoch": 4378} {"train_loss": -6.90670108795166, "global_step": 183887, "epoch": 4378} {"train_loss": -7.026336669921875, "global_step": 183888, "epoch": 4378} {"train_loss": -6.976033687591553, "global_step": 183889, "epoch": 4378} {"train_loss": -6.995431423187256, "global_step": 183890, "epoch": 4378} {"train_loss": -7.101451396942139, "global_step": 183891, "epoch": 4378} {"train_loss": -6.855988025665283, "global_step": 183892, "epoch": 4378} {"train_loss": -6.9585862159729, "global_step": 183893, "epoch": 4378} {"train_loss": -7.006929397583008, "global_step": 183894, "epoch": 4378} {"train_loss": -7.017496109008789, "global_step": 183895, "epoch": 4378} {"train_loss": -7.024870872497559, "global_step": 183896, "epoch": 4378} {"train_loss": -7.015897750854492, "global_step": 183897, "epoch": 4378} {"train_loss": -6.9177045822143555, "global_step": 183898, "epoch": 4378} {"train_loss": -6.922285079956055, "global_step": 183899, "epoch": 4378} {"train_loss": -7.006930351257324, "global_step": 183900, "epoch": 4378} {"train_loss": -7.109863758087158, "global_step": 183901, "epoch": 4378} {"train_loss": -7.062223434448242, "global_step": 183902, "epoch": 4378} {"train_loss": -7.109313488006592, "global_step": 183903, "epoch": 4378} {"train_loss": -7.02603816986084, "global_step": 183904, "epoch": 4378} {"train_loss": -7.0706610679626465, "global_step": 183905, "epoch": 4378} {"train_loss": -7.049055099487305, "global_step": 183906, "epoch": 4378} {"train_loss": -7.123131275177002, "global_step": 183907, "epoch": 4378} {"train_loss": -7.207928657531738, "global_step": 183908, "epoch": 4378} {"train_loss": -7.0619354248046875, "global_step": 183909, "epoch": 4378} {"train_loss": -7.061193943023682, "global_step": 183910, "epoch": 4378} {"train_loss": -7.156279563903809, "global_step": 183911, "epoch": 4378} {"train_loss": -7.128061294555664, "global_step": 183912, "epoch": 4378} {"train_loss": -7.111735820770264, "global_step": 183913, "epoch": 4378} {"train_loss": -7.267917156219482, "global_step": 183914, "epoch": 4378} {"train_loss": -7.128201961517334, "global_step": 183915, "epoch": 4378} {"train_loss": -7.259485244750977, "global_step": 183916, "epoch": 4378} {"train_loss": -7.055225122542608, "global_step": 183917, "epoch": 4378, "val_loss": 68786.2890625} {"train_loss": -7.1872358322143555, "global_step": 183918, "epoch": 4379} {"train_loss": -7.198896408081055, "global_step": 183919, "epoch": 4379} {"train_loss": -7.006514072418213, "global_step": 183920, "epoch": 4379} {"train_loss": -7.144533157348633, "global_step": 183921, "epoch": 4379} {"train_loss": -7.208218097686768, "global_step": 183922, "epoch": 4379} {"train_loss": -7.1778435707092285, "global_step": 183923, "epoch": 4379} {"train_loss": -7.187860488891602, "global_step": 183924, "epoch": 4379} {"train_loss": -7.026005268096924, "global_step": 183925, "epoch": 4379} {"train_loss": -7.126935958862305, "global_step": 183926, "epoch": 4379} {"train_loss": -7.294700622558594, "global_step": 183927, "epoch": 4379} {"train_loss": -7.089355945587158, "global_step": 183928, "epoch": 4379} {"train_loss": -7.294622898101807, "global_step": 183929, "epoch": 4379} {"train_loss": -7.179156303405762, "global_step": 183930, "epoch": 4379} {"train_loss": -7.078229904174805, "global_step": 183931, "epoch": 4379} {"train_loss": -7.155053615570068, "global_step": 183932, "epoch": 4379} {"train_loss": -7.160378456115723, "global_step": 183933, "epoch": 4379} {"train_loss": -7.091904640197754, "global_step": 183934, "epoch": 4379} {"train_loss": -7.1146087646484375, "global_step": 183935, "epoch": 4379} {"train_loss": -7.299933910369873, "global_step": 183936, "epoch": 4379} {"train_loss": -7.155039310455322, "global_step": 183937, "epoch": 4379} {"train_loss": -7.05150032043457, "global_step": 183938, "epoch": 4379} {"train_loss": -7.202019691467285, "global_step": 183939, "epoch": 4379} {"train_loss": -7.258355617523193, "global_step": 183940, "epoch": 4379} {"train_loss": -6.982273578643799, "global_step": 183941, "epoch": 4379} {"train_loss": -7.215113162994385, "global_step": 183942, "epoch": 4379} {"train_loss": -7.120295524597168, "global_step": 183943, "epoch": 4379} {"train_loss": -7.097302436828613, "global_step": 183944, "epoch": 4379} {"train_loss": -7.052590370178223, "global_step": 183945, "epoch": 4379} {"train_loss": -7.129096508026123, "global_step": 183946, "epoch": 4379} {"train_loss": -7.159694671630859, "global_step": 183947, "epoch": 4379} {"train_loss": -7.129499435424805, "global_step": 183948, "epoch": 4379} {"train_loss": -7.211947917938232, "global_step": 183949, "epoch": 4379} {"train_loss": -7.175539970397949, "global_step": 183950, "epoch": 4379} {"train_loss": -7.192800998687744, "global_step": 183951, "epoch": 4379} {"train_loss": -7.105915069580078, "global_step": 183952, "epoch": 4379} {"train_loss": -7.094917297363281, "global_step": 183953, "epoch": 4379} {"train_loss": -7.07012939453125, "global_step": 183954, "epoch": 4379} {"train_loss": -7.211725234985352, "global_step": 183955, "epoch": 4379} {"train_loss": -7.050343990325928, "global_step": 183956, "epoch": 4379} {"train_loss": -7.063373565673828, "global_step": 183957, "epoch": 4379} {"train_loss": -7.344552993774414, "global_step": 183958, "epoch": 4379} {"train_loss": -7.149735859462193, "global_step": 183959, "epoch": 4379, "val_loss": 68804.3125} {"train_loss": -7.129775047302246, "global_step": 183960, "epoch": 4380} {"train_loss": -7.21132755279541, "global_step": 183961, "epoch": 4380} {"train_loss": -7.061070919036865, "global_step": 183962, "epoch": 4380} {"train_loss": -7.189533233642578, "global_step": 183963, "epoch": 4380} {"train_loss": -7.265227317810059, "global_step": 183964, "epoch": 4380} {"train_loss": -7.101512908935547, "global_step": 183965, "epoch": 4380} {"train_loss": -7.23680305480957, "global_step": 183966, "epoch": 4380} {"train_loss": -7.191009521484375, "global_step": 183967, "epoch": 4380} {"train_loss": -7.094844818115234, "global_step": 183968, "epoch": 4380} {"train_loss": -7.21098518371582, "global_step": 183969, "epoch": 4380} {"train_loss": -7.160556793212891, "global_step": 183970, "epoch": 4380} {"train_loss": -7.056758880615234, "global_step": 183971, "epoch": 4380} {"train_loss": -7.120580673217773, "global_step": 183972, "epoch": 4380} {"train_loss": -7.12259578704834, "global_step": 183973, "epoch": 4380} {"train_loss": -7.060644149780273, "global_step": 183974, "epoch": 4380} {"train_loss": -7.1649169921875, "global_step": 183975, "epoch": 4380} {"train_loss": -7.047187805175781, "global_step": 183976, "epoch": 4380} {"train_loss": -7.055309295654297, "global_step": 183977, "epoch": 4380} {"train_loss": -7.103841781616211, "global_step": 183978, "epoch": 4380} {"train_loss": -7.0848846435546875, "global_step": 183979, "epoch": 4380} {"train_loss": -7.098066329956055, "global_step": 183980, "epoch": 4380} {"train_loss": -7.133057117462158, "global_step": 183981, "epoch": 4380} {"train_loss": -7.028475761413574, "global_step": 183982, "epoch": 4380} {"train_loss": -7.1302642822265625, "global_step": 183983, "epoch": 4380} {"train_loss": -7.017369270324707, "global_step": 183984, "epoch": 4380} {"train_loss": -7.097253322601318, "global_step": 183985, "epoch": 4380} {"train_loss": -7.112313270568848, "global_step": 183986, "epoch": 4380} {"train_loss": -6.981237411499023, "global_step": 183987, "epoch": 4380} {"train_loss": -7.15539026260376, "global_step": 183988, "epoch": 4380} {"train_loss": -7.012731552124023, "global_step": 183989, "epoch": 4380} {"train_loss": -7.139294624328613, "global_step": 183990, "epoch": 4380} {"train_loss": -7.15928840637207, "global_step": 183991, "epoch": 4380} {"train_loss": -7.228757858276367, "global_step": 183992, "epoch": 4380} {"train_loss": -7.041110992431641, "global_step": 183993, "epoch": 4380} {"train_loss": -7.052038192749023, "global_step": 183994, "epoch": 4380} {"train_loss": -7.0064697265625, "global_step": 183995, "epoch": 4380} {"train_loss": -7.116252899169922, "global_step": 183996, "epoch": 4380} {"train_loss": -7.077175617218018, "global_step": 183997, "epoch": 4380} {"train_loss": -7.129456043243408, "global_step": 183998, "epoch": 4380} {"train_loss": -7.057978630065918, "global_step": 183999, "epoch": 4380} {"train_loss": -7.05428409576416, "global_step": 184000, "epoch": 4380} {"train_loss": -7.112153007870629, "global_step": 184001, "epoch": 4380, "val_loss": 68752.671875} {"train_loss": -7.132932662963867, "global_step": 184002, "epoch": 4381} {"train_loss": -7.199417591094971, "global_step": 184003, "epoch": 4381} {"train_loss": -7.011812210083008, "global_step": 184004, "epoch": 4381} {"train_loss": -7.121373653411865, "global_step": 184005, "epoch": 4381} {"train_loss": -7.257725238800049, "global_step": 184006, "epoch": 4381} {"train_loss": -7.109506130218506, "global_step": 184007, "epoch": 4381} {"train_loss": -7.030727863311768, "global_step": 184008, "epoch": 4381} {"train_loss": -7.192816257476807, "global_step": 184009, "epoch": 4381} {"train_loss": -7.0490922927856445, "global_step": 184010, "epoch": 4381} {"train_loss": -7.21171760559082, "global_step": 184011, "epoch": 4381} {"train_loss": -7.14988374710083, "global_step": 184012, "epoch": 4381} {"train_loss": -7.281065940856934, "global_step": 184013, "epoch": 4381} {"train_loss": -7.108080863952637, "global_step": 184014, "epoch": 4381} {"train_loss": -7.182143688201904, "global_step": 184015, "epoch": 4381} {"train_loss": -7.066901206970215, "global_step": 184016, "epoch": 4381} {"train_loss": -7.199441909790039, "global_step": 184017, "epoch": 4381} {"train_loss": -7.338451862335205, "global_step": 184018, "epoch": 4381} {"train_loss": -7.174533843994141, "global_step": 184019, "epoch": 4381} {"train_loss": -7.135448455810547, "global_step": 184020, "epoch": 4381} {"train_loss": -7.14158296585083, "global_step": 184021, "epoch": 4381} {"train_loss": -7.221014022827148, "global_step": 184022, "epoch": 4381} {"train_loss": -7.170951843261719, "global_step": 184023, "epoch": 4381} {"train_loss": -7.182297706604004, "global_step": 184024, "epoch": 4381} {"train_loss": -7.175119876861572, "global_step": 184025, "epoch": 4381} {"train_loss": -7.211972236633301, "global_step": 184026, "epoch": 4381} {"train_loss": -7.0901689529418945, "global_step": 184027, "epoch": 4381} {"train_loss": -7.1607346534729, "global_step": 184028, "epoch": 4381} {"train_loss": -7.110146522521973, "global_step": 184029, "epoch": 4381} {"train_loss": -7.142403602600098, "global_step": 184030, "epoch": 4381} {"train_loss": -7.067636966705322, "global_step": 184031, "epoch": 4381} {"train_loss": -7.015383243560791, "global_step": 184032, "epoch": 4381} {"train_loss": -7.181405067443848, "global_step": 184033, "epoch": 4381} {"train_loss": -7.069400787353516, "global_step": 184034, "epoch": 4381} {"train_loss": -7.087895393371582, "global_step": 184035, "epoch": 4381} {"train_loss": -7.015619277954102, "global_step": 184036, "epoch": 4381} {"train_loss": -7.151798248291016, "global_step": 184037, "epoch": 4381} {"train_loss": -7.161444664001465, "global_step": 184038, "epoch": 4381} {"train_loss": -7.076540946960449, "global_step": 184039, "epoch": 4381} {"train_loss": -7.191664695739746, "global_step": 184040, "epoch": 4381} {"train_loss": -7.147574424743652, "global_step": 184041, "epoch": 4381} {"train_loss": -7.165587902069092, "global_step": 184042, "epoch": 4381} {"train_loss": -7.144511313665481, "global_step": 184043, "epoch": 4381, "val_loss": 68684.4609375} {"train_loss": -7.226374626159668, "global_step": 184044, "epoch": 4382} {"train_loss": -7.184535980224609, "global_step": 184045, "epoch": 4382} {"train_loss": -7.190485954284668, "global_step": 184046, "epoch": 4382} {"train_loss": -7.041164875030518, "global_step": 184047, "epoch": 4382} {"train_loss": -7.207642078399658, "global_step": 184048, "epoch": 4382} {"train_loss": -7.1372246742248535, "global_step": 184049, "epoch": 4382} {"train_loss": -7.172142505645752, "global_step": 184050, "epoch": 4382} {"train_loss": -7.129964828491211, "global_step": 184051, "epoch": 4382} {"train_loss": -7.053155422210693, "global_step": 184052, "epoch": 4382} {"train_loss": -7.079895973205566, "global_step": 184053, "epoch": 4382} {"train_loss": -7.137886047363281, "global_step": 184054, "epoch": 4382} {"train_loss": -7.144477367401123, "global_step": 184055, "epoch": 4382} {"train_loss": -7.189762115478516, "global_step": 184056, "epoch": 4382} {"train_loss": -7.098509788513184, "global_step": 184057, "epoch": 4382} {"train_loss": -7.199299335479736, "global_step": 184058, "epoch": 4382} {"train_loss": -7.127246856689453, "global_step": 184059, "epoch": 4382} {"train_loss": -7.1241135597229, "global_step": 184060, "epoch": 4382} {"train_loss": -7.043542861938477, "global_step": 184061, "epoch": 4382} {"train_loss": -7.055974960327148, "global_step": 184062, "epoch": 4382} {"train_loss": -7.016645431518555, "global_step": 184063, "epoch": 4382} {"train_loss": -7.111514568328857, "global_step": 184064, "epoch": 4382} {"train_loss": -7.053660869598389, "global_step": 184065, "epoch": 4382} {"train_loss": -7.088106155395508, "global_step": 184066, "epoch": 4382} {"train_loss": -7.080648422241211, "global_step": 184067, "epoch": 4382} {"train_loss": -7.078364849090576, "global_step": 184068, "epoch": 4382} {"train_loss": -7.023261070251465, "global_step": 184069, "epoch": 4382} {"train_loss": -7.056763648986816, "global_step": 184070, "epoch": 4382} {"train_loss": -7.1375017166137695, "global_step": 184071, "epoch": 4382} {"train_loss": -7.108331680297852, "global_step": 184072, "epoch": 4382} {"train_loss": -7.088468551635742, "global_step": 184073, "epoch": 4382} {"train_loss": -7.003094673156738, "global_step": 184074, "epoch": 4382} {"train_loss": -7.087641716003418, "global_step": 184075, "epoch": 4382} {"train_loss": -7.139736175537109, "global_step": 184076, "epoch": 4382} {"train_loss": -7.114624977111816, "global_step": 184077, "epoch": 4382} {"train_loss": -7.104522705078125, "global_step": 184078, "epoch": 4382} {"train_loss": -7.122119426727295, "global_step": 184079, "epoch": 4382} {"train_loss": -7.14642333984375, "global_step": 184080, "epoch": 4382} {"train_loss": -7.097850322723389, "global_step": 184081, "epoch": 4382} {"train_loss": -7.017158508300781, "global_step": 184082, "epoch": 4382} {"train_loss": -7.014122486114502, "global_step": 184083, "epoch": 4382} {"train_loss": -7.040733337402344, "global_step": 184084, "epoch": 4382} {"train_loss": -7.104413077944801, "global_step": 184085, "epoch": 4382, "val_loss": 68809.328125} {"train_loss": -7.047520637512207, "global_step": 184086, "epoch": 4383} {"train_loss": -6.994618892669678, "global_step": 184087, "epoch": 4383} {"train_loss": -7.115151882171631, "global_step": 184088, "epoch": 4383} {"train_loss": -6.9744462966918945, "global_step": 184089, "epoch": 4383} {"train_loss": -7.138345718383789, "global_step": 184090, "epoch": 4383} {"train_loss": -7.196152687072754, "global_step": 184091, "epoch": 4383} {"train_loss": -7.113183498382568, "global_step": 184092, "epoch": 4383} {"train_loss": -7.17234468460083, "global_step": 184093, "epoch": 4383} {"train_loss": -7.030848503112793, "global_step": 184094, "epoch": 4383} {"train_loss": -7.035732269287109, "global_step": 184095, "epoch": 4383} {"train_loss": -7.216615676879883, "global_step": 184096, "epoch": 4383} {"train_loss": -7.063608169555664, "global_step": 184097, "epoch": 4383} {"train_loss": -7.160157203674316, "global_step": 184098, "epoch": 4383} {"train_loss": -7.092262268066406, "global_step": 184099, "epoch": 4383} {"train_loss": -7.161319732666016, "global_step": 184100, "epoch": 4383} {"train_loss": -7.072808265686035, "global_step": 184101, "epoch": 4383} {"train_loss": -6.982631683349609, "global_step": 184102, "epoch": 4383} {"train_loss": -7.022974014282227, "global_step": 184103, "epoch": 4383} {"train_loss": -7.109227180480957, "global_step": 184104, "epoch": 4383} {"train_loss": -7.128876686096191, "global_step": 184105, "epoch": 4383} {"train_loss": -7.129167556762695, "global_step": 184106, "epoch": 4383} {"train_loss": -7.039674758911133, "global_step": 184107, "epoch": 4383} {"train_loss": -7.0395965576171875, "global_step": 184108, "epoch": 4383} {"train_loss": -7.149874210357666, "global_step": 184109, "epoch": 4383} {"train_loss": -7.089507102966309, "global_step": 184110, "epoch": 4383} {"train_loss": -6.96012020111084, "global_step": 184111, "epoch": 4383} {"train_loss": -7.057376861572266, "global_step": 184112, "epoch": 4383} {"train_loss": -7.048233509063721, "global_step": 184113, "epoch": 4383} {"train_loss": -7.034595966339111, "global_step": 184114, "epoch": 4383} {"train_loss": -7.095350742340088, "global_step": 184115, "epoch": 4383} {"train_loss": -7.034272193908691, "global_step": 184116, "epoch": 4383} {"train_loss": -6.987239360809326, "global_step": 184117, "epoch": 4383} {"train_loss": -7.076687812805176, "global_step": 184118, "epoch": 4383} {"train_loss": -7.029730319976807, "global_step": 184119, "epoch": 4383} {"train_loss": -7.1198015213012695, "global_step": 184120, "epoch": 4383} {"train_loss": -7.026078224182129, "global_step": 184121, "epoch": 4383} {"train_loss": -7.152776718139648, "global_step": 184122, "epoch": 4383} {"train_loss": -7.0131988525390625, "global_step": 184123, "epoch": 4383} {"train_loss": -7.053409099578857, "global_step": 184124, "epoch": 4383} {"train_loss": -7.185333728790283, "global_step": 184125, "epoch": 4383} {"train_loss": -7.041400909423828, "global_step": 184126, "epoch": 4383} {"train_loss": -7.078322047278995, "global_step": 184127, "epoch": 4383, "val_loss": 68845.140625} {"train_loss": -7.010313034057617, "global_step": 184128, "epoch": 4384} {"train_loss": -7.167558670043945, "global_step": 184129, "epoch": 4384} {"train_loss": -7.089898109436035, "global_step": 184130, "epoch": 4384} {"train_loss": -7.115934371948242, "global_step": 184131, "epoch": 4384} {"train_loss": -7.12548303604126, "global_step": 184132, "epoch": 4384} {"train_loss": -7.038632392883301, "global_step": 184133, "epoch": 4384} {"train_loss": -7.066562652587891, "global_step": 184134, "epoch": 4384} {"train_loss": -7.124863147735596, "global_step": 184135, "epoch": 4384} {"train_loss": -7.119102954864502, "global_step": 184136, "epoch": 4384} {"train_loss": -7.072429180145264, "global_step": 184137, "epoch": 4384} {"train_loss": -6.9851393699646, "global_step": 184138, "epoch": 4384} {"train_loss": -7.047577857971191, "global_step": 184139, "epoch": 4384} {"train_loss": -7.051357269287109, "global_step": 184140, "epoch": 4384} {"train_loss": -7.046298027038574, "global_step": 184141, "epoch": 4384} {"train_loss": -6.961468696594238, "global_step": 184142, "epoch": 4384} {"train_loss": -7.099274635314941, "global_step": 184143, "epoch": 4384} {"train_loss": -7.000652313232422, "global_step": 184144, "epoch": 4384} {"train_loss": -6.9786787033081055, "global_step": 184145, "epoch": 4384} {"train_loss": -7.057448387145996, "global_step": 184146, "epoch": 4384} {"train_loss": -7.004329681396484, "global_step": 184147, "epoch": 4384} {"train_loss": -7.051570415496826, "global_step": 184148, "epoch": 4384} {"train_loss": -7.070859909057617, "global_step": 184149, "epoch": 4384} {"train_loss": -7.009280204772949, "global_step": 184150, "epoch": 4384} {"train_loss": -6.9947686195373535, "global_step": 184151, "epoch": 4384} {"train_loss": -7.09149169921875, "global_step": 184152, "epoch": 4384} {"train_loss": -7.085879325866699, "global_step": 184153, "epoch": 4384} {"train_loss": -7.0889482498168945, "global_step": 184154, "epoch": 4384} {"train_loss": -7.030614852905273, "global_step": 184155, "epoch": 4384} {"train_loss": -7.120946884155273, "global_step": 184156, "epoch": 4384} {"train_loss": -7.067050933837891, "global_step": 184157, "epoch": 4384} {"train_loss": -7.027716636657715, "global_step": 184158, "epoch": 4384} {"train_loss": -6.949662685394287, "global_step": 184159, "epoch": 4384} {"train_loss": -6.991579055786133, "global_step": 184160, "epoch": 4384} {"train_loss": -6.896557807922363, "global_step": 184161, "epoch": 4384} {"train_loss": -7.02188777923584, "global_step": 184162, "epoch": 4384} {"train_loss": -7.1404218673706055, "global_step": 184163, "epoch": 4384} {"train_loss": -7.023347854614258, "global_step": 184164, "epoch": 4384} {"train_loss": -7.0806779861450195, "global_step": 184165, "epoch": 4384} {"train_loss": -7.1611528396606445, "global_step": 184166, "epoch": 4384} {"train_loss": -7.140048027038574, "global_step": 184167, "epoch": 4384} {"train_loss": -7.082882881164551, "global_step": 184168, "epoch": 4384} {"train_loss": -7.056493463970366, "global_step": 184169, "epoch": 4384, "val_loss": 68944.5078125} {"train_loss": -7.165556907653809, "global_step": 184170, "epoch": 4385} {"train_loss": -7.084404468536377, "global_step": 184171, "epoch": 4385} {"train_loss": -7.114328384399414, "global_step": 184172, "epoch": 4385} {"train_loss": -7.149116516113281, "global_step": 184173, "epoch": 4385} {"train_loss": -7.171221733093262, "global_step": 184174, "epoch": 4385} {"train_loss": -7.107806205749512, "global_step": 184175, "epoch": 4385} {"train_loss": -7.048759460449219, "global_step": 184176, "epoch": 4385} {"train_loss": -7.087973594665527, "global_step": 184177, "epoch": 4385} {"train_loss": -7.090031623840332, "global_step": 184178, "epoch": 4385} {"train_loss": -6.988825798034668, "global_step": 184179, "epoch": 4385} {"train_loss": -6.899440288543701, "global_step": 184180, "epoch": 4385} {"train_loss": -6.948790550231934, "global_step": 184181, "epoch": 4385} {"train_loss": -6.9303388595581055, "global_step": 184182, "epoch": 4385} {"train_loss": -7.000227928161621, "global_step": 184183, "epoch": 4385} {"train_loss": -6.958772659301758, "global_step": 184184, "epoch": 4385} {"train_loss": -6.95435094833374, "global_step": 184185, "epoch": 4385} {"train_loss": -7.021697521209717, "global_step": 184186, "epoch": 4385} {"train_loss": -6.9843244552612305, "global_step": 184187, "epoch": 4385} {"train_loss": -6.947473526000977, "global_step": 184188, "epoch": 4385} {"train_loss": -7.01957893371582, "global_step": 184189, "epoch": 4385} {"train_loss": -7.073125839233398, "global_step": 184190, "epoch": 4385} {"train_loss": -6.991446495056152, "global_step": 184191, "epoch": 4385} {"train_loss": -7.0680365562438965, "global_step": 184192, "epoch": 4385} {"train_loss": -7.0475358963012695, "global_step": 184193, "epoch": 4385} {"train_loss": -7.185250282287598, "global_step": 184194, "epoch": 4385} {"train_loss": -6.975773811340332, "global_step": 184195, "epoch": 4385} {"train_loss": -7.087906837463379, "global_step": 184196, "epoch": 4385} {"train_loss": -7.224031925201416, "global_step": 184197, "epoch": 4385} {"train_loss": -7.012198448181152, "global_step": 184198, "epoch": 4385} {"train_loss": -7.064306735992432, "global_step": 184199, "epoch": 4385} {"train_loss": -7.072396278381348, "global_step": 184200, "epoch": 4385} {"train_loss": -7.072813034057617, "global_step": 184201, "epoch": 4385} {"train_loss": -7.137091636657715, "global_step": 184202, "epoch": 4385} {"train_loss": -7.146079063415527, "global_step": 184203, "epoch": 4385} {"train_loss": -7.209469318389893, "global_step": 184204, "epoch": 4385} {"train_loss": -7.172184944152832, "global_step": 184205, "epoch": 4385} {"train_loss": -7.140929698944092, "global_step": 184206, "epoch": 4385} {"train_loss": -7.134654998779297, "global_step": 184207, "epoch": 4385} {"train_loss": -7.14243745803833, "global_step": 184208, "epoch": 4385} {"train_loss": -7.259355545043945, "global_step": 184209, "epoch": 4385} {"train_loss": -7.032113075256348, "global_step": 184210, "epoch": 4385} {"train_loss": -7.073338588078816, "global_step": 184211, "epoch": 4385, "val_loss": 68829.109375} {"train_loss": -7.0286712646484375, "global_step": 184212, "epoch": 4386} {"train_loss": -7.12152099609375, "global_step": 184213, "epoch": 4386} {"train_loss": -7.1912384033203125, "global_step": 184214, "epoch": 4386} {"train_loss": -7.1572370529174805, "global_step": 184215, "epoch": 4386} {"train_loss": -7.129495620727539, "global_step": 184216, "epoch": 4386} {"train_loss": -7.049306869506836, "global_step": 184217, "epoch": 4386} {"train_loss": -7.13490104675293, "global_step": 184218, "epoch": 4386} {"train_loss": -7.071533679962158, "global_step": 184219, "epoch": 4386} {"train_loss": -7.21466064453125, "global_step": 184220, "epoch": 4386} {"train_loss": -7.116238117218018, "global_step": 184221, "epoch": 4386} {"train_loss": -7.101973533630371, "global_step": 184222, "epoch": 4386} {"train_loss": -7.099954605102539, "global_step": 184223, "epoch": 4386} {"train_loss": -7.06915283203125, "global_step": 184224, "epoch": 4386} {"train_loss": -7.066467761993408, "global_step": 184225, "epoch": 4386} {"train_loss": -7.094151020050049, "global_step": 184226, "epoch": 4386} {"train_loss": -7.1686296463012695, "global_step": 184227, "epoch": 4386} {"train_loss": -7.052847862243652, "global_step": 184228, "epoch": 4386} {"train_loss": -7.114988803863525, "global_step": 184229, "epoch": 4386} {"train_loss": -7.16207218170166, "global_step": 184230, "epoch": 4386} {"train_loss": -7.158236503601074, "global_step": 184231, "epoch": 4386} {"train_loss": -7.0818047523498535, "global_step": 184232, "epoch": 4386} {"train_loss": -7.146644592285156, "global_step": 184233, "epoch": 4386} {"train_loss": -7.084262847900391, "global_step": 184234, "epoch": 4386} {"train_loss": -7.092566967010498, "global_step": 184235, "epoch": 4386} {"train_loss": -7.181341648101807, "global_step": 184236, "epoch": 4386} {"train_loss": -7.127958297729492, "global_step": 184237, "epoch": 4386} {"train_loss": -6.991552352905273, "global_step": 184238, "epoch": 4386} {"train_loss": -7.120847702026367, "global_step": 184239, "epoch": 4386} {"train_loss": -7.1667304039001465, "global_step": 184240, "epoch": 4386} {"train_loss": -7.165165901184082, "global_step": 184241, "epoch": 4386} {"train_loss": -7.061575889587402, "global_step": 184242, "epoch": 4386} {"train_loss": -7.084983825683594, "global_step": 184243, "epoch": 4386} {"train_loss": -7.191705703735352, "global_step": 184244, "epoch": 4386} {"train_loss": -7.090258598327637, "global_step": 184245, "epoch": 4386} {"train_loss": -6.981128692626953, "global_step": 184246, "epoch": 4386} {"train_loss": -7.228122711181641, "global_step": 184247, "epoch": 4386} {"train_loss": -6.971662998199463, "global_step": 184248, "epoch": 4386} {"train_loss": -7.085705757141113, "global_step": 184249, "epoch": 4386} {"train_loss": -7.069341659545898, "global_step": 184250, "epoch": 4386} {"train_loss": -7.035252571105957, "global_step": 184251, "epoch": 4386} {"train_loss": -7.084397315979004, "global_step": 184252, "epoch": 4386} {"train_loss": -7.104926745096843, "global_step": 184253, "epoch": 4386, "val_loss": 68727.65625} {"train_loss": -7.10787296295166, "global_step": 184254, "epoch": 4387} {"train_loss": -7.121324062347412, "global_step": 184255, "epoch": 4387} {"train_loss": -7.026116847991943, "global_step": 184256, "epoch": 4387} {"train_loss": -7.132928848266602, "global_step": 184257, "epoch": 4387} {"train_loss": -7.131684303283691, "global_step": 184258, "epoch": 4387} {"train_loss": -7.185410499572754, "global_step": 184259, "epoch": 4387} {"train_loss": -7.046317100524902, "global_step": 184260, "epoch": 4387} {"train_loss": -7.098502159118652, "global_step": 184261, "epoch": 4387} {"train_loss": -7.145989894866943, "global_step": 184262, "epoch": 4387} {"train_loss": -7.096449375152588, "global_step": 184263, "epoch": 4387} {"train_loss": -7.123568534851074, "global_step": 184264, "epoch": 4387} {"train_loss": -7.098644256591797, "global_step": 184265, "epoch": 4387} {"train_loss": -7.071467399597168, "global_step": 184266, "epoch": 4387} {"train_loss": -7.043274879455566, "global_step": 184267, "epoch": 4387} {"train_loss": -6.997674942016602, "global_step": 184268, "epoch": 4387} {"train_loss": -7.089267253875732, "global_step": 184269, "epoch": 4387} {"train_loss": -7.071393013000488, "global_step": 184270, "epoch": 4387} {"train_loss": -7.064180374145508, "global_step": 184271, "epoch": 4387} {"train_loss": -7.146267890930176, "global_step": 184272, "epoch": 4387} {"train_loss": -7.05679178237915, "global_step": 184273, "epoch": 4387} {"train_loss": -6.938652515411377, "global_step": 184274, "epoch": 4387} {"train_loss": -7.091048240661621, "global_step": 184275, "epoch": 4387} {"train_loss": -6.869264602661133, "global_step": 184276, "epoch": 4387} {"train_loss": -7.0240020751953125, "global_step": 184277, "epoch": 4387} {"train_loss": -7.176999092102051, "global_step": 184278, "epoch": 4387} {"train_loss": -6.998964309692383, "global_step": 184279, "epoch": 4387} {"train_loss": -6.991394519805908, "global_step": 184280, "epoch": 4387} {"train_loss": -7.189260959625244, "global_step": 184281, "epoch": 4387} {"train_loss": -7.06882905960083, "global_step": 184282, "epoch": 4387} {"train_loss": -7.088489055633545, "global_step": 184283, "epoch": 4387} {"train_loss": -7.065183639526367, "global_step": 184284, "epoch": 4387} {"train_loss": -7.025443077087402, "global_step": 184285, "epoch": 4387} {"train_loss": -6.936959266662598, "global_step": 184286, "epoch": 4387} {"train_loss": -7.1234540939331055, "global_step": 184287, "epoch": 4387} {"train_loss": -7.115257263183594, "global_step": 184288, "epoch": 4387} {"train_loss": -7.019016265869141, "global_step": 184289, "epoch": 4387} {"train_loss": -7.079715728759766, "global_step": 184290, "epoch": 4387} {"train_loss": -7.1470537185668945, "global_step": 184291, "epoch": 4387} {"train_loss": -7.087642192840576, "global_step": 184292, "epoch": 4387} {"train_loss": -7.10407018661499, "global_step": 184293, "epoch": 4387} {"train_loss": -7.146430015563965, "global_step": 184294, "epoch": 4387} {"train_loss": -7.07401164372762, "global_step": 184295, "epoch": 4387, "val_loss": 68934.3203125} {"train_loss": -7.114512920379639, "global_step": 184296, "epoch": 4388} {"train_loss": -7.033207893371582, "global_step": 184297, "epoch": 4388} {"train_loss": -6.939540863037109, "global_step": 184298, "epoch": 4388} {"train_loss": -7.124846458435059, "global_step": 184299, "epoch": 4388} {"train_loss": -7.04175329208374, "global_step": 184300, "epoch": 4388} {"train_loss": -6.952084541320801, "global_step": 184301, "epoch": 4388} {"train_loss": -7.037327289581299, "global_step": 184302, "epoch": 4388} {"train_loss": -7.008001327514648, "global_step": 184303, "epoch": 4388} {"train_loss": -7.137894630432129, "global_step": 184304, "epoch": 4388} {"train_loss": -7.068746089935303, "global_step": 184305, "epoch": 4388} {"train_loss": -6.862635612487793, "global_step": 184306, "epoch": 4388} {"train_loss": -6.969906330108643, "global_step": 184307, "epoch": 4388} {"train_loss": -7.010638236999512, "global_step": 184308, "epoch": 4388} {"train_loss": -7.040290832519531, "global_step": 184309, "epoch": 4388} {"train_loss": -7.05648946762085, "global_step": 184310, "epoch": 4388} {"train_loss": -6.947296619415283, "global_step": 184311, "epoch": 4388} {"train_loss": -7.0524797439575195, "global_step": 184312, "epoch": 4388} {"train_loss": -6.919518947601318, "global_step": 184313, "epoch": 4388} {"train_loss": -7.047690391540527, "global_step": 184314, "epoch": 4388} {"train_loss": -7.023496627807617, "global_step": 184315, "epoch": 4388} {"train_loss": -7.06948709487915, "global_step": 184316, "epoch": 4388} {"train_loss": -7.145176887512207, "global_step": 184317, "epoch": 4388} {"train_loss": -7.1272969245910645, "global_step": 184318, "epoch": 4388} {"train_loss": -7.170376300811768, "global_step": 184319, "epoch": 4388} {"train_loss": -7.093807220458984, "global_step": 184320, "epoch": 4388} {"train_loss": -6.997171401977539, "global_step": 184321, "epoch": 4388} {"train_loss": -7.059504508972168, "global_step": 184322, "epoch": 4388} {"train_loss": -7.098034858703613, "global_step": 184323, "epoch": 4388} {"train_loss": -7.185046672821045, "global_step": 184324, "epoch": 4388} {"train_loss": -7.010636329650879, "global_step": 184325, "epoch": 4388} {"train_loss": -7.1360673904418945, "global_step": 184326, "epoch": 4388} {"train_loss": -7.22675895690918, "global_step": 184327, "epoch": 4388} {"train_loss": -7.076511383056641, "global_step": 184328, "epoch": 4388} {"train_loss": -7.11752986907959, "global_step": 184329, "epoch": 4388} {"train_loss": -7.119803428649902, "global_step": 184330, "epoch": 4388} {"train_loss": -7.1443963050842285, "global_step": 184331, "epoch": 4388} {"train_loss": -7.16389274597168, "global_step": 184332, "epoch": 4388} {"train_loss": -7.093409538269043, "global_step": 184333, "epoch": 4388} {"train_loss": -7.104790687561035, "global_step": 184334, "epoch": 4388} {"train_loss": -7.09169864654541, "global_step": 184335, "epoch": 4388} {"train_loss": -7.2290754318237305, "global_step": 184336, "epoch": 4388} {"train_loss": -7.073191597348168, "global_step": 184337, "epoch": 4388, "val_loss": 68666.125} {"train_loss": -7.205859661102295, "global_step": 184338, "epoch": 4389} {"train_loss": -7.202004432678223, "global_step": 184339, "epoch": 4389} {"train_loss": -7.080143928527832, "global_step": 184340, "epoch": 4389} {"train_loss": -7.2237396240234375, "global_step": 184341, "epoch": 4389} {"train_loss": -7.133217811584473, "global_step": 184342, "epoch": 4389} {"train_loss": -7.199672698974609, "global_step": 184343, "epoch": 4389} {"train_loss": -7.125672340393066, "global_step": 184344, "epoch": 4389} {"train_loss": -7.218050956726074, "global_step": 184345, "epoch": 4389} {"train_loss": -7.127752304077148, "global_step": 184346, "epoch": 4389} {"train_loss": -7.137463569641113, "global_step": 184347, "epoch": 4389} {"train_loss": -7.088305473327637, "global_step": 184348, "epoch": 4389} {"train_loss": -7.055644512176514, "global_step": 184349, "epoch": 4389} {"train_loss": -7.182220935821533, "global_step": 184350, "epoch": 4389} {"train_loss": -7.05671501159668, "global_step": 184351, "epoch": 4389} {"train_loss": -7.105700969696045, "global_step": 184352, "epoch": 4389} {"train_loss": -7.077180862426758, "global_step": 184353, "epoch": 4389} {"train_loss": -7.0634918212890625, "global_step": 184354, "epoch": 4389} {"train_loss": -7.120369911193848, "global_step": 184355, "epoch": 4389} {"train_loss": -7.133477210998535, "global_step": 184356, "epoch": 4389} {"train_loss": -7.094944000244141, "global_step": 184357, "epoch": 4389} {"train_loss": -7.166986465454102, "global_step": 184358, "epoch": 4389} {"train_loss": -7.122130393981934, "global_step": 184359, "epoch": 4389} {"train_loss": -6.912982940673828, "global_step": 184360, "epoch": 4389} {"train_loss": -7.111947536468506, "global_step": 184361, "epoch": 4389} {"train_loss": -7.180548191070557, "global_step": 184362, "epoch": 4389} {"train_loss": -6.939067840576172, "global_step": 184363, "epoch": 4389} {"train_loss": -7.143576622009277, "global_step": 184364, "epoch": 4389} {"train_loss": -6.9771728515625, "global_step": 184365, "epoch": 4389} {"train_loss": -7.06852388381958, "global_step": 184366, "epoch": 4389} {"train_loss": -7.02099609375, "global_step": 184367, "epoch": 4389} {"train_loss": -7.074769496917725, "global_step": 184368, "epoch": 4389} {"train_loss": -6.933751106262207, "global_step": 184369, "epoch": 4389} {"train_loss": -7.108826637268066, "global_step": 184370, "epoch": 4389} {"train_loss": -7.239404678344727, "global_step": 184371, "epoch": 4389} {"train_loss": -7.1069016456604, "global_step": 184372, "epoch": 4389} {"train_loss": -7.183732032775879, "global_step": 184373, "epoch": 4389} {"train_loss": -7.123509407043457, "global_step": 184374, "epoch": 4389} {"train_loss": -7.02951717376709, "global_step": 184375, "epoch": 4389} {"train_loss": -7.222156524658203, "global_step": 184376, "epoch": 4389} {"train_loss": -7.0885844230651855, "global_step": 184377, "epoch": 4389} {"train_loss": -7.115135669708252, "global_step": 184378, "epoch": 4389} {"train_loss": -7.110905261266799, "global_step": 184379, "epoch": 4389, "val_loss": 68861.3125} {"train_loss": -7.1065354347229, "global_step": 184380, "epoch": 4390} {"train_loss": -7.2247514724731445, "global_step": 184381, "epoch": 4390} {"train_loss": -6.969527244567871, "global_step": 184382, "epoch": 4390} {"train_loss": -7.094700813293457, "global_step": 184383, "epoch": 4390} {"train_loss": -7.069422245025635, "global_step": 184384, "epoch": 4390} {"train_loss": -7.058752059936523, "global_step": 184385, "epoch": 4390} {"train_loss": -7.12579345703125, "global_step": 184386, "epoch": 4390} {"train_loss": -7.055966377258301, "global_step": 184387, "epoch": 4390} {"train_loss": -7.135802268981934, "global_step": 184388, "epoch": 4390} {"train_loss": -7.089129447937012, "global_step": 184389, "epoch": 4390} {"train_loss": -6.994173049926758, "global_step": 184390, "epoch": 4390} {"train_loss": -7.085559844970703, "global_step": 184391, "epoch": 4390} {"train_loss": -7.13386344909668, "global_step": 184392, "epoch": 4390} {"train_loss": -7.048213958740234, "global_step": 184393, "epoch": 4390} {"train_loss": -7.110147476196289, "global_step": 184394, "epoch": 4390} {"train_loss": -7.128713607788086, "global_step": 184395, "epoch": 4390} {"train_loss": -7.179335594177246, "global_step": 184396, "epoch": 4390} {"train_loss": -7.090014457702637, "global_step": 184397, "epoch": 4390} {"train_loss": -7.111549377441406, "global_step": 184398, "epoch": 4390} {"train_loss": -7.184409141540527, "global_step": 184399, "epoch": 4390} {"train_loss": -7.1383562088012695, "global_step": 184400, "epoch": 4390} {"train_loss": -7.134825706481934, "global_step": 184401, "epoch": 4390} {"train_loss": -7.093343734741211, "global_step": 184402, "epoch": 4390} {"train_loss": -7.10603141784668, "global_step": 184403, "epoch": 4390} {"train_loss": -7.175774574279785, "global_step": 184404, "epoch": 4390} {"train_loss": -7.219944000244141, "global_step": 184405, "epoch": 4390} {"train_loss": -7.202566146850586, "global_step": 184406, "epoch": 4390} {"train_loss": -7.109098434448242, "global_step": 184407, "epoch": 4390} {"train_loss": -7.124059677124023, "global_step": 184408, "epoch": 4390} {"train_loss": -7.0876970291137695, "global_step": 184409, "epoch": 4390} {"train_loss": -7.15726375579834, "global_step": 184410, "epoch": 4390} {"train_loss": -7.158145904541016, "global_step": 184411, "epoch": 4390} {"train_loss": -7.189050197601318, "global_step": 184412, "epoch": 4390} {"train_loss": -7.019811630249023, "global_step": 184413, "epoch": 4390} {"train_loss": -7.092541694641113, "global_step": 184414, "epoch": 4390} {"train_loss": -7.238999366760254, "global_step": 184415, "epoch": 4390} {"train_loss": -7.20546817779541, "global_step": 184416, "epoch": 4390} {"train_loss": -7.21781587600708, "global_step": 184417, "epoch": 4390} {"train_loss": -7.274034023284912, "global_step": 184418, "epoch": 4390} {"train_loss": -7.2056074142456055, "global_step": 184419, "epoch": 4390} {"train_loss": -7.161515235900879, "global_step": 184420, "epoch": 4390} {"train_loss": -7.1300186429704935, "global_step": 184421, "epoch": 4390, "val_loss": 68818.4140625} {"train_loss": -7.21176290512085, "global_step": 184422, "epoch": 4391} {"train_loss": -7.230206489562988, "global_step": 184423, "epoch": 4391} {"train_loss": -7.200240135192871, "global_step": 184424, "epoch": 4391} {"train_loss": -7.20781135559082, "global_step": 184425, "epoch": 4391} {"train_loss": -7.236240386962891, "global_step": 184426, "epoch": 4391} {"train_loss": -7.123814105987549, "global_step": 184427, "epoch": 4391} {"train_loss": -7.125238418579102, "global_step": 184428, "epoch": 4391} {"train_loss": -7.076526641845703, "global_step": 184429, "epoch": 4391} {"train_loss": -7.112003326416016, "global_step": 184430, "epoch": 4391} {"train_loss": -7.2170305252075195, "global_step": 184431, "epoch": 4391} {"train_loss": -7.187257289886475, "global_step": 184432, "epoch": 4391} {"train_loss": -7.159237384796143, "global_step": 184433, "epoch": 4391} {"train_loss": -7.043787956237793, "global_step": 184434, "epoch": 4391} {"train_loss": -7.144974708557129, "global_step": 184435, "epoch": 4391} {"train_loss": -7.023733139038086, "global_step": 184436, "epoch": 4391} {"train_loss": -7.20652437210083, "global_step": 184437, "epoch": 4391} {"train_loss": -7.0419921875, "global_step": 184438, "epoch": 4391} {"train_loss": -7.164664268493652, "global_step": 184439, "epoch": 4391} {"train_loss": -7.1146135330200195, "global_step": 184440, "epoch": 4391} {"train_loss": -7.090358734130859, "global_step": 184441, "epoch": 4391} {"train_loss": -7.134085655212402, "global_step": 184442, "epoch": 4391} {"train_loss": -7.249728202819824, "global_step": 184443, "epoch": 4391} {"train_loss": -7.077476501464844, "global_step": 184444, "epoch": 4391} {"train_loss": -7.1670050621032715, "global_step": 184445, "epoch": 4391} {"train_loss": -7.061769008636475, "global_step": 184446, "epoch": 4391} {"train_loss": -7.09254264831543, "global_step": 184447, "epoch": 4391} {"train_loss": -7.143883228302002, "global_step": 184448, "epoch": 4391} {"train_loss": -7.095970630645752, "global_step": 184449, "epoch": 4391} {"train_loss": -7.174455642700195, "global_step": 184450, "epoch": 4391} {"train_loss": -7.039059638977051, "global_step": 184451, "epoch": 4391} {"train_loss": -7.047324180603027, "global_step": 184452, "epoch": 4391} {"train_loss": -7.1589436531066895, "global_step": 184453, "epoch": 4391} {"train_loss": -7.13858699798584, "global_step": 184454, "epoch": 4391} {"train_loss": -7.130162715911865, "global_step": 184455, "epoch": 4391} {"train_loss": -7.041530132293701, "global_step": 184456, "epoch": 4391} {"train_loss": -7.201969146728516, "global_step": 184457, "epoch": 4391} {"train_loss": -7.066617965698242, "global_step": 184458, "epoch": 4391} {"train_loss": -7.045942306518555, "global_step": 184459, "epoch": 4391} {"train_loss": -7.174840927124023, "global_step": 184460, "epoch": 4391} {"train_loss": -7.067717552185059, "global_step": 184461, "epoch": 4391} {"train_loss": -7.134904861450195, "global_step": 184462, "epoch": 4391} {"train_loss": -7.130975938978649, "global_step": 184463, "epoch": 4391, "val_loss": 68788.3515625} {"train_loss": -7.1403584480285645, "global_step": 184464, "epoch": 4392} {"train_loss": -7.125590801239014, "global_step": 184465, "epoch": 4392} {"train_loss": -7.184114456176758, "global_step": 184466, "epoch": 4392} {"train_loss": -7.1593122482299805, "global_step": 184467, "epoch": 4392} {"train_loss": -7.24409294128418, "global_step": 184468, "epoch": 4392} {"train_loss": -7.178938865661621, "global_step": 184469, "epoch": 4392} {"train_loss": -7.302823543548584, "global_step": 184470, "epoch": 4392} {"train_loss": -7.1282243728637695, "global_step": 184471, "epoch": 4392} {"train_loss": -7.104016304016113, "global_step": 184472, "epoch": 4392} {"train_loss": -6.995886325836182, "global_step": 184473, "epoch": 4392} {"train_loss": -6.908648490905762, "global_step": 184474, "epoch": 4392} {"train_loss": -7.049752235412598, "global_step": 184475, "epoch": 4392} {"train_loss": -7.091044902801514, "global_step": 184476, "epoch": 4392} {"train_loss": -7.076094150543213, "global_step": 184477, "epoch": 4392} {"train_loss": -7.025928497314453, "global_step": 184478, "epoch": 4392} {"train_loss": -7.087279796600342, "global_step": 184479, "epoch": 4392} {"train_loss": -7.074645042419434, "global_step": 184480, "epoch": 4392} {"train_loss": -7.058218002319336, "global_step": 184481, "epoch": 4392} {"train_loss": -6.920276641845703, "global_step": 184482, "epoch": 4392} {"train_loss": -7.139098167419434, "global_step": 184483, "epoch": 4392} {"train_loss": -7.055507659912109, "global_step": 184484, "epoch": 4392} {"train_loss": -6.953583240509033, "global_step": 184485, "epoch": 4392} {"train_loss": -7.142634868621826, "global_step": 184486, "epoch": 4392} {"train_loss": -6.9293012619018555, "global_step": 184487, "epoch": 4392} {"train_loss": -6.89309549331665, "global_step": 184488, "epoch": 4392} {"train_loss": -7.074894905090332, "global_step": 184489, "epoch": 4392} {"train_loss": -6.9973320960998535, "global_step": 184490, "epoch": 4392} {"train_loss": -6.9597649574279785, "global_step": 184491, "epoch": 4392} {"train_loss": -6.937987327575684, "global_step": 184492, "epoch": 4392} {"train_loss": -6.970500946044922, "global_step": 184493, "epoch": 4392} {"train_loss": -6.987177848815918, "global_step": 184494, "epoch": 4392} {"train_loss": -7.005253314971924, "global_step": 184495, "epoch": 4392} {"train_loss": -6.872509956359863, "global_step": 184496, "epoch": 4392} {"train_loss": -7.075022220611572, "global_step": 184497, "epoch": 4392} {"train_loss": -7.057807445526123, "global_step": 184498, "epoch": 4392} {"train_loss": -6.96995210647583, "global_step": 184499, "epoch": 4392} {"train_loss": -7.0334153175354, "global_step": 184500, "epoch": 4392} {"train_loss": -7.062954902648926, "global_step": 184501, "epoch": 4392} {"train_loss": -6.984408855438232, "global_step": 184502, "epoch": 4392} {"train_loss": -6.922451972961426, "global_step": 184503, "epoch": 4392} {"train_loss": -7.127666473388672, "global_step": 184504, "epoch": 4392} {"train_loss": -7.046036493210566, "global_step": 184505, "epoch": 4392, "val_loss": 68809.9375} {"train_loss": -7.123279571533203, "global_step": 184506, "epoch": 4393} {"train_loss": -7.017024040222168, "global_step": 184507, "epoch": 4393} {"train_loss": -7.072472095489502, "global_step": 184508, "epoch": 4393} {"train_loss": -7.127631664276123, "global_step": 184509, "epoch": 4393} {"train_loss": -7.159387588500977, "global_step": 184510, "epoch": 4393} {"train_loss": -7.123227119445801, "global_step": 184511, "epoch": 4393} {"train_loss": -7.076042652130127, "global_step": 184512, "epoch": 4393} {"train_loss": -7.102869987487793, "global_step": 184513, "epoch": 4393} {"train_loss": -7.068110942840576, "global_step": 184514, "epoch": 4393} {"train_loss": -7.047825813293457, "global_step": 184515, "epoch": 4393} {"train_loss": -7.088311195373535, "global_step": 184516, "epoch": 4393} {"train_loss": -7.08902645111084, "global_step": 184517, "epoch": 4393} {"train_loss": -7.156271934509277, "global_step": 184518, "epoch": 4393} {"train_loss": -7.195826053619385, "global_step": 184519, "epoch": 4393} {"train_loss": -7.266477584838867, "global_step": 184520, "epoch": 4393} {"train_loss": -7.177468776702881, "global_step": 184521, "epoch": 4393} {"train_loss": -7.124894142150879, "global_step": 184522, "epoch": 4393} {"train_loss": -7.251635551452637, "global_step": 184523, "epoch": 4393} {"train_loss": -7.234864234924316, "global_step": 184524, "epoch": 4393} {"train_loss": -7.133037090301514, "global_step": 184525, "epoch": 4393} {"train_loss": -7.186652183532715, "global_step": 184526, "epoch": 4393} {"train_loss": -7.233328819274902, "global_step": 184527, "epoch": 4393} {"train_loss": -7.193627834320068, "global_step": 184528, "epoch": 4393} {"train_loss": -7.0327372550964355, "global_step": 184529, "epoch": 4393} {"train_loss": -7.108115196228027, "global_step": 184530, "epoch": 4393} {"train_loss": -7.111182689666748, "global_step": 184531, "epoch": 4393} {"train_loss": -7.187812328338623, "global_step": 184532, "epoch": 4393} {"train_loss": -7.1653571128845215, "global_step": 184533, "epoch": 4393} {"train_loss": -7.2454633712768555, "global_step": 184534, "epoch": 4393} {"train_loss": -7.0384721755981445, "global_step": 184535, "epoch": 4393} {"train_loss": -7.170629024505615, "global_step": 184536, "epoch": 4393} {"train_loss": -7.189266681671143, "global_step": 184537, "epoch": 4393} {"train_loss": -6.993685722351074, "global_step": 184538, "epoch": 4393} {"train_loss": -7.188677787780762, "global_step": 184539, "epoch": 4393} {"train_loss": -7.2108683586120605, "global_step": 184540, "epoch": 4393} {"train_loss": -7.1559553146362305, "global_step": 184541, "epoch": 4393} {"train_loss": -7.079435348510742, "global_step": 184542, "epoch": 4393} {"train_loss": -7.022765636444092, "global_step": 184543, "epoch": 4393} {"train_loss": -7.177322864532471, "global_step": 184544, "epoch": 4393} {"train_loss": -6.884721755981445, "global_step": 184545, "epoch": 4393} {"train_loss": -6.839724540710449, "global_step": 184546, "epoch": 4393} {"train_loss": -7.123554388682048, "global_step": 184547, "epoch": 4393, "val_loss": 69144.0859375} {"train_loss": -7.018805503845215, "global_step": 184548, "epoch": 4394} {"train_loss": -7.009143829345703, "global_step": 184549, "epoch": 4394} {"train_loss": -6.982223987579346, "global_step": 184550, "epoch": 4394} {"train_loss": -7.013352394104004, "global_step": 184551, "epoch": 4394} {"train_loss": -7.022303581237793, "global_step": 184552, "epoch": 4394} {"train_loss": -6.9707794189453125, "global_step": 184553, "epoch": 4394} {"train_loss": -7.02225399017334, "global_step": 184554, "epoch": 4394} {"train_loss": -7.04377555847168, "global_step": 184555, "epoch": 4394} {"train_loss": -7.0695061683654785, "global_step": 184556, "epoch": 4394} {"train_loss": -6.979643821716309, "global_step": 184557, "epoch": 4394} {"train_loss": -7.098354816436768, "global_step": 184558, "epoch": 4394} {"train_loss": -7.097905158996582, "global_step": 184559, "epoch": 4394} {"train_loss": -7.046548843383789, "global_step": 184560, "epoch": 4394} {"train_loss": -7.126001358032227, "global_step": 184561, "epoch": 4394} {"train_loss": -7.101507663726807, "global_step": 184562, "epoch": 4394} {"train_loss": -7.108445167541504, "global_step": 184563, "epoch": 4394} {"train_loss": -7.1067304611206055, "global_step": 184564, "epoch": 4394} {"train_loss": -6.989043235778809, "global_step": 184565, "epoch": 4394} {"train_loss": -7.058989524841309, "global_step": 184566, "epoch": 4394} {"train_loss": -7.052426815032959, "global_step": 184567, "epoch": 4394} {"train_loss": -7.196548938751221, "global_step": 184568, "epoch": 4394} {"train_loss": -7.041813850402832, "global_step": 184569, "epoch": 4394} {"train_loss": -7.109670639038086, "global_step": 184570, "epoch": 4394} {"train_loss": -7.207655429840088, "global_step": 184571, "epoch": 4394} {"train_loss": -7.144661903381348, "global_step": 184572, "epoch": 4394} {"train_loss": -7.029982566833496, "global_step": 184573, "epoch": 4394} {"train_loss": -7.093860149383545, "global_step": 184574, "epoch": 4394} {"train_loss": -7.152299880981445, "global_step": 184575, "epoch": 4394} {"train_loss": -7.044623851776123, "global_step": 184576, "epoch": 4394} {"train_loss": -7.1010942459106445, "global_step": 184577, "epoch": 4394} {"train_loss": -7.219546318054199, "global_step": 184578, "epoch": 4394} {"train_loss": -7.121893405914307, "global_step": 184579, "epoch": 4394} {"train_loss": -7.185118675231934, "global_step": 184580, "epoch": 4394} {"train_loss": -7.0573906898498535, "global_step": 184581, "epoch": 4394} {"train_loss": -7.082986831665039, "global_step": 184582, "epoch": 4394} {"train_loss": -7.122089385986328, "global_step": 184583, "epoch": 4394} {"train_loss": -7.078676223754883, "global_step": 184584, "epoch": 4394} {"train_loss": -6.983002662658691, "global_step": 184585, "epoch": 4394} {"train_loss": -7.113872528076172, "global_step": 184586, "epoch": 4394} {"train_loss": -7.1042633056640625, "global_step": 184587, "epoch": 4394} {"train_loss": -7.016385078430176, "global_step": 184588, "epoch": 4394} {"train_loss": -7.077783255350022, "global_step": 184589, "epoch": 4394, "val_loss": 68937.96875} {"train_loss": -7.046950340270996, "global_step": 184590, "epoch": 4395} {"train_loss": -7.009746551513672, "global_step": 184591, "epoch": 4395} {"train_loss": -7.085573196411133, "global_step": 184592, "epoch": 4395} {"train_loss": -6.975689888000488, "global_step": 184593, "epoch": 4395} {"train_loss": -7.008871078491211, "global_step": 184594, "epoch": 4395} {"train_loss": -7.104475975036621, "global_step": 184595, "epoch": 4395} {"train_loss": -7.044824600219727, "global_step": 184596, "epoch": 4395} {"train_loss": -6.999156475067139, "global_step": 184597, "epoch": 4395} {"train_loss": -7.074887275695801, "global_step": 184598, "epoch": 4395} {"train_loss": -6.973607063293457, "global_step": 184599, "epoch": 4395} {"train_loss": -7.054198265075684, "global_step": 184600, "epoch": 4395} {"train_loss": -6.9210615158081055, "global_step": 184601, "epoch": 4395} {"train_loss": -7.0628767013549805, "global_step": 184602, "epoch": 4395} {"train_loss": -6.972296237945557, "global_step": 184603, "epoch": 4395} {"train_loss": -6.898466110229492, "global_step": 184604, "epoch": 4395} {"train_loss": -7.115616321563721, "global_step": 184605, "epoch": 4395} {"train_loss": -6.836508274078369, "global_step": 184606, "epoch": 4395} {"train_loss": -6.979076862335205, "global_step": 184607, "epoch": 4395} {"train_loss": -7.095946311950684, "global_step": 184608, "epoch": 4395} {"train_loss": -6.97270393371582, "global_step": 184609, "epoch": 4395} {"train_loss": -7.0681233406066895, "global_step": 184610, "epoch": 4395} {"train_loss": -6.9200334548950195, "global_step": 184611, "epoch": 4395} {"train_loss": -7.02588415145874, "global_step": 184612, "epoch": 4395} {"train_loss": -6.890130996704102, "global_step": 184613, "epoch": 4395} {"train_loss": -6.927003860473633, "global_step": 184614, "epoch": 4395} {"train_loss": -6.95045280456543, "global_step": 184615, "epoch": 4395} {"train_loss": -6.981167793273926, "global_step": 184616, "epoch": 4395} {"train_loss": -6.940731048583984, "global_step": 184617, "epoch": 4395} {"train_loss": -7.012467384338379, "global_step": 184618, "epoch": 4395} {"train_loss": -7.117884635925293, "global_step": 184619, "epoch": 4395} {"train_loss": -7.039743423461914, "global_step": 184620, "epoch": 4395} {"train_loss": -6.991707801818848, "global_step": 184621, "epoch": 4395} {"train_loss": -7.015732765197754, "global_step": 184622, "epoch": 4395} {"train_loss": -7.065303325653076, "global_step": 184623, "epoch": 4395} {"train_loss": -7.101701736450195, "global_step": 184624, "epoch": 4395} {"train_loss": -7.130880355834961, "global_step": 184625, "epoch": 4395} {"train_loss": -7.006186485290527, "global_step": 184626, "epoch": 4395} {"train_loss": -7.101282596588135, "global_step": 184627, "epoch": 4395} {"train_loss": -7.227372169494629, "global_step": 184628, "epoch": 4395} {"train_loss": -7.149806499481201, "global_step": 184629, "epoch": 4395} {"train_loss": -7.148679733276367, "global_step": 184630, "epoch": 4395} {"train_loss": -7.028173651014056, "global_step": 184631, "epoch": 4395, "val_loss": 68824.8359375} {"train_loss": -7.095735549926758, "global_step": 184632, "epoch": 4396} {"train_loss": -7.130139350891113, "global_step": 184633, "epoch": 4396} {"train_loss": -7.109347343444824, "global_step": 184634, "epoch": 4396} {"train_loss": -7.1200079917907715, "global_step": 184635, "epoch": 4396} {"train_loss": -7.154870986938477, "global_step": 184636, "epoch": 4396} {"train_loss": -7.115692615509033, "global_step": 184637, "epoch": 4396} {"train_loss": -7.024760723114014, "global_step": 184638, "epoch": 4396} {"train_loss": -7.136148452758789, "global_step": 184639, "epoch": 4396} {"train_loss": -7.12647819519043, "global_step": 184640, "epoch": 4396} {"train_loss": -7.088810920715332, "global_step": 184641, "epoch": 4396} {"train_loss": -7.075145244598389, "global_step": 184642, "epoch": 4396} {"train_loss": -7.123356819152832, "global_step": 184643, "epoch": 4396} {"train_loss": -7.140733242034912, "global_step": 184644, "epoch": 4396} {"train_loss": -6.943263053894043, "global_step": 184645, "epoch": 4396} {"train_loss": -7.159103870391846, "global_step": 184646, "epoch": 4396} {"train_loss": -7.2113494873046875, "global_step": 184647, "epoch": 4396} {"train_loss": -7.230947971343994, "global_step": 184648, "epoch": 4396} {"train_loss": -7.091421127319336, "global_step": 184649, "epoch": 4396} {"train_loss": -7.0771074295043945, "global_step": 184650, "epoch": 4396} {"train_loss": -7.0449957847595215, "global_step": 184651, "epoch": 4396} {"train_loss": -7.207601070404053, "global_step": 184652, "epoch": 4396} {"train_loss": -7.133326053619385, "global_step": 184653, "epoch": 4396} {"train_loss": -7.129783630371094, "global_step": 184654, "epoch": 4396} {"train_loss": -7.0977678298950195, "global_step": 184655, "epoch": 4396} {"train_loss": -7.175668716430664, "global_step": 184656, "epoch": 4396} {"train_loss": -7.161407947540283, "global_step": 184657, "epoch": 4396} {"train_loss": -7.220340728759766, "global_step": 184658, "epoch": 4396} {"train_loss": -7.126516342163086, "global_step": 184659, "epoch": 4396} {"train_loss": -7.268340587615967, "global_step": 184660, "epoch": 4396} {"train_loss": -7.047603607177734, "global_step": 184661, "epoch": 4396} {"train_loss": -7.020335674285889, "global_step": 184662, "epoch": 4396} {"train_loss": -7.209297180175781, "global_step": 184663, "epoch": 4396} {"train_loss": -7.075474262237549, "global_step": 184664, "epoch": 4396} {"train_loss": -6.9078369140625, "global_step": 184665, "epoch": 4396} {"train_loss": -7.009878158569336, "global_step": 184666, "epoch": 4396} {"train_loss": -7.136930465698242, "global_step": 184667, "epoch": 4396} {"train_loss": -7.117652416229248, "global_step": 184668, "epoch": 4396} {"train_loss": -7.006223201751709, "global_step": 184669, "epoch": 4396} {"train_loss": -7.053841590881348, "global_step": 184670, "epoch": 4396} {"train_loss": -7.084660053253174, "global_step": 184671, "epoch": 4396} {"train_loss": -7.069911003112793, "global_step": 184672, "epoch": 4396} {"train_loss": -7.108045237404959, "global_step": 184673, "epoch": 4396, "val_loss": 68589.625} {"train_loss": -7.115283012390137, "global_step": 184674, "epoch": 4397} {"train_loss": -7.045677661895752, "global_step": 184675, "epoch": 4397} {"train_loss": -7.104415416717529, "global_step": 184676, "epoch": 4397} {"train_loss": -7.07192850112915, "global_step": 184677, "epoch": 4397} {"train_loss": -7.036731719970703, "global_step": 184678, "epoch": 4397} {"train_loss": -7.099063873291016, "global_step": 184679, "epoch": 4397} {"train_loss": -7.106089115142822, "global_step": 184680, "epoch": 4397} {"train_loss": -7.155679702758789, "global_step": 184681, "epoch": 4397} {"train_loss": -7.149892807006836, "global_step": 184682, "epoch": 4397} {"train_loss": -7.186385631561279, "global_step": 184683, "epoch": 4397} {"train_loss": -7.153348922729492, "global_step": 184684, "epoch": 4397} {"train_loss": -7.146681785583496, "global_step": 184685, "epoch": 4397} {"train_loss": -7.100590229034424, "global_step": 184686, "epoch": 4397} {"train_loss": -7.119927406311035, "global_step": 184687, "epoch": 4397} {"train_loss": -7.076569080352783, "global_step": 184688, "epoch": 4397} {"train_loss": -7.079068183898926, "global_step": 184689, "epoch": 4397} {"train_loss": -7.119246482849121, "global_step": 184690, "epoch": 4397} {"train_loss": -6.937750816345215, "global_step": 184691, "epoch": 4397} {"train_loss": -7.180018901824951, "global_step": 184692, "epoch": 4397} {"train_loss": -7.0791802406311035, "global_step": 184693, "epoch": 4397} {"train_loss": -6.886310577392578, "global_step": 184694, "epoch": 4397} {"train_loss": -7.024445056915283, "global_step": 184695, "epoch": 4397} {"train_loss": -6.844303131103516, "global_step": 184696, "epoch": 4397} {"train_loss": -6.9956560134887695, "global_step": 184697, "epoch": 4397} {"train_loss": -7.072442531585693, "global_step": 184698, "epoch": 4397} {"train_loss": -6.8923211097717285, "global_step": 184699, "epoch": 4397} {"train_loss": -7.088700771331787, "global_step": 184700, "epoch": 4397} {"train_loss": -6.933270454406738, "global_step": 184701, "epoch": 4397} {"train_loss": -6.891900062561035, "global_step": 184702, "epoch": 4397} {"train_loss": -7.00496768951416, "global_step": 184703, "epoch": 4397} {"train_loss": -7.03897762298584, "global_step": 184704, "epoch": 4397} {"train_loss": -7.002030372619629, "global_step": 184705, "epoch": 4397} {"train_loss": -7.014259338378906, "global_step": 184706, "epoch": 4397} {"train_loss": -6.839102745056152, "global_step": 184707, "epoch": 4397} {"train_loss": -6.974435806274414, "global_step": 184708, "epoch": 4397} {"train_loss": -7.09131383895874, "global_step": 184709, "epoch": 4397} {"train_loss": -6.8910651206970215, "global_step": 184710, "epoch": 4397} {"train_loss": -7.042152404785156, "global_step": 184711, "epoch": 4397} {"train_loss": -7.149113655090332, "global_step": 184712, "epoch": 4397} {"train_loss": -6.972515106201172, "global_step": 184713, "epoch": 4397} {"train_loss": -6.999343395233154, "global_step": 184714, "epoch": 4397} {"train_loss": -7.04024803070795, "global_step": 184715, "epoch": 4397, "val_loss": 68800.140625} {"train_loss": -6.9911885261535645, "global_step": 184716, "epoch": 4398} {"train_loss": -7.120567798614502, "global_step": 184717, "epoch": 4398} {"train_loss": -6.94334602355957, "global_step": 184718, "epoch": 4398} {"train_loss": -7.110038757324219, "global_step": 184719, "epoch": 4398} {"train_loss": -7.058851718902588, "global_step": 184720, "epoch": 4398} {"train_loss": -7.051508903503418, "global_step": 184721, "epoch": 4398} {"train_loss": -7.023174285888672, "global_step": 184722, "epoch": 4398} {"train_loss": -7.091397285461426, "global_step": 184723, "epoch": 4398} {"train_loss": -7.050644874572754, "global_step": 184724, "epoch": 4398} {"train_loss": -7.015259742736816, "global_step": 184725, "epoch": 4398} {"train_loss": -7.041667938232422, "global_step": 184726, "epoch": 4398} {"train_loss": -7.000748634338379, "global_step": 184727, "epoch": 4398} {"train_loss": -7.118326663970947, "global_step": 184728, "epoch": 4398} {"train_loss": -7.052456855773926, "global_step": 184729, "epoch": 4398} {"train_loss": -7.086854934692383, "global_step": 184730, "epoch": 4398} {"train_loss": -7.076812744140625, "global_step": 184731, "epoch": 4398} {"train_loss": -7.065793037414551, "global_step": 184732, "epoch": 4398} {"train_loss": -7.127941131591797, "global_step": 184733, "epoch": 4398} {"train_loss": -7.112792015075684, "global_step": 184734, "epoch": 4398} {"train_loss": -7.082128047943115, "global_step": 184735, "epoch": 4398} {"train_loss": -7.170024871826172, "global_step": 184736, "epoch": 4398} {"train_loss": -7.169353008270264, "global_step": 184737, "epoch": 4398} {"train_loss": -7.173085689544678, "global_step": 184738, "epoch": 4398} {"train_loss": -7.151487827301025, "global_step": 184739, "epoch": 4398} {"train_loss": -7.171443939208984, "global_step": 184740, "epoch": 4398} {"train_loss": -7.1764936447143555, "global_step": 184741, "epoch": 4398} {"train_loss": -7.027060508728027, "global_step": 184742, "epoch": 4398} {"train_loss": -7.178530693054199, "global_step": 184743, "epoch": 4398} {"train_loss": -7.058427810668945, "global_step": 184744, "epoch": 4398} {"train_loss": -7.186275005340576, "global_step": 184745, "epoch": 4398} {"train_loss": -7.1122894287109375, "global_step": 184746, "epoch": 4398} {"train_loss": -7.086637020111084, "global_step": 184747, "epoch": 4398} {"train_loss": -7.2067365646362305, "global_step": 184748, "epoch": 4398} {"train_loss": -7.071929931640625, "global_step": 184749, "epoch": 4398} {"train_loss": -7.048880577087402, "global_step": 184750, "epoch": 4398} {"train_loss": -7.216636657714844, "global_step": 184751, "epoch": 4398} {"train_loss": -7.163825988769531, "global_step": 184752, "epoch": 4398} {"train_loss": -7.068924903869629, "global_step": 184753, "epoch": 4398} {"train_loss": -7.092049598693848, "global_step": 184754, "epoch": 4398} {"train_loss": -7.195178985595703, "global_step": 184755, "epoch": 4398} {"train_loss": -7.228673934936523, "global_step": 184756, "epoch": 4398} {"train_loss": -7.103886524836223, "global_step": 184757, "epoch": 4398, "val_loss": 68836.171875} {"train_loss": -7.23499059677124, "global_step": 184758, "epoch": 4399} {"train_loss": -7.202270984649658, "global_step": 184759, "epoch": 4399} {"train_loss": -7.123846054077148, "global_step": 184760, "epoch": 4399} {"train_loss": -7.078886032104492, "global_step": 184761, "epoch": 4399} {"train_loss": -7.300135135650635, "global_step": 184762, "epoch": 4399} {"train_loss": -7.141014099121094, "global_step": 184763, "epoch": 4399} {"train_loss": -7.19373893737793, "global_step": 184764, "epoch": 4399} {"train_loss": -7.192127227783203, "global_step": 184765, "epoch": 4399} {"train_loss": -7.189228057861328, "global_step": 184766, "epoch": 4399} {"train_loss": -7.150911331176758, "global_step": 184767, "epoch": 4399} {"train_loss": -7.181601524353027, "global_step": 184768, "epoch": 4399} {"train_loss": -7.232084274291992, "global_step": 184769, "epoch": 4399} {"train_loss": -7.154443740844727, "global_step": 184770, "epoch": 4399} {"train_loss": -7.162600517272949, "global_step": 184771, "epoch": 4399} {"train_loss": -7.253529071807861, "global_step": 184772, "epoch": 4399} {"train_loss": -7.209826469421387, "global_step": 184773, "epoch": 4399} {"train_loss": -7.220459938049316, "global_step": 184774, "epoch": 4399} {"train_loss": -7.226405143737793, "global_step": 184775, "epoch": 4399} {"train_loss": -7.072546005249023, "global_step": 184776, "epoch": 4399} {"train_loss": -7.119421482086182, "global_step": 184777, "epoch": 4399} {"train_loss": -7.155685901641846, "global_step": 184778, "epoch": 4399} {"train_loss": -7.070147514343262, "global_step": 184779, "epoch": 4399} {"train_loss": -7.132691383361816, "global_step": 184780, "epoch": 4399} {"train_loss": -7.17205286026001, "global_step": 184781, "epoch": 4399} {"train_loss": -7.004042625427246, "global_step": 184782, "epoch": 4399} {"train_loss": -7.152061462402344, "global_step": 184783, "epoch": 4399} {"train_loss": -7.137556076049805, "global_step": 184784, "epoch": 4399} {"train_loss": -7.269161224365234, "global_step": 184785, "epoch": 4399} {"train_loss": -7.172891616821289, "global_step": 184786, "epoch": 4399} {"train_loss": -7.152642726898193, "global_step": 184787, "epoch": 4399} {"train_loss": -7.149504661560059, "global_step": 184788, "epoch": 4399} {"train_loss": -7.104605197906494, "global_step": 184789, "epoch": 4399} {"train_loss": -7.116908073425293, "global_step": 184790, "epoch": 4399} {"train_loss": -7.1384758949279785, "global_step": 184791, "epoch": 4399} {"train_loss": -7.070821762084961, "global_step": 184792, "epoch": 4399} {"train_loss": -7.068596363067627, "global_step": 184793, "epoch": 4399} {"train_loss": -7.154704570770264, "global_step": 184794, "epoch": 4399} {"train_loss": -7.178882598876953, "global_step": 184795, "epoch": 4399} {"train_loss": -7.173341751098633, "global_step": 184796, "epoch": 4399} {"train_loss": -7.05731201171875, "global_step": 184797, "epoch": 4399} {"train_loss": -7.070798873901367, "global_step": 184798, "epoch": 4399} {"train_loss": -7.153747467767625, "global_step": 184799, "epoch": 4399, "val_loss": 68858.3046875} {"train_loss": -7.195773124694824, "global_step": 184800, "epoch": 4400} {"train_loss": -7.043649673461914, "global_step": 184801, "epoch": 4400} {"train_loss": -7.118056297302246, "global_step": 184802, "epoch": 4400} {"train_loss": -7.183116436004639, "global_step": 184803, "epoch": 4400} {"train_loss": -7.205286979675293, "global_step": 184804, "epoch": 4400} {"train_loss": -7.090953350067139, "global_step": 184805, "epoch": 4400} {"train_loss": -7.10800838470459, "global_step": 184806, "epoch": 4400} {"train_loss": -7.21221923828125, "global_step": 184807, "epoch": 4400} {"train_loss": -7.223304748535156, "global_step": 184808, "epoch": 4400} {"train_loss": -7.0315141677856445, "global_step": 184809, "epoch": 4400} {"train_loss": -7.224116325378418, "global_step": 184810, "epoch": 4400} {"train_loss": -7.085700511932373, "global_step": 184811, "epoch": 4400} {"train_loss": -7.206188678741455, "global_step": 184812, "epoch": 4400} {"train_loss": -7.262316703796387, "global_step": 184813, "epoch": 4400} {"train_loss": -7.061554908752441, "global_step": 184814, "epoch": 4400} {"train_loss": -7.149845600128174, "global_step": 184815, "epoch": 4400} {"train_loss": -7.102891445159912, "global_step": 184816, "epoch": 4400} {"train_loss": -7.0924272537231445, "global_step": 184817, "epoch": 4400} {"train_loss": -7.142858028411865, "global_step": 184818, "epoch": 4400} {"train_loss": -7.065600395202637, "global_step": 184819, "epoch": 4400} {"train_loss": -7.02046012878418, "global_step": 184820, "epoch": 4400} {"train_loss": -7.140163421630859, "global_step": 184821, "epoch": 4400} {"train_loss": -7.228486061096191, "global_step": 184822, "epoch": 4400} {"train_loss": -7.194305419921875, "global_step": 184823, "epoch": 4400} {"train_loss": -7.089011192321777, "global_step": 184824, "epoch": 4400} {"train_loss": -7.172346115112305, "global_step": 184825, "epoch": 4400} {"train_loss": -7.362700462341309, "global_step": 184826, "epoch": 4400} {"train_loss": -7.1503095626831055, "global_step": 184827, "epoch": 4400} {"train_loss": -7.196948528289795, "global_step": 184828, "epoch": 4400} {"train_loss": -7.081522464752197, "global_step": 184829, "epoch": 4400} {"train_loss": -7.123878479003906, "global_step": 184830, "epoch": 4400} {"train_loss": -7.133968353271484, "global_step": 184831, "epoch": 4400} {"train_loss": -7.090770721435547, "global_step": 184832, "epoch": 4400} {"train_loss": -7.037994384765625, "global_step": 184833, "epoch": 4400} {"train_loss": -7.189675331115723, "global_step": 184834, "epoch": 4400} {"train_loss": -7.077334403991699, "global_step": 184835, "epoch": 4400} {"train_loss": -6.981451511383057, "global_step": 184836, "epoch": 4400} {"train_loss": -7.1010847091674805, "global_step": 184837, "epoch": 4400} {"train_loss": -7.0995683670043945, "global_step": 184838, "epoch": 4400} {"train_loss": -7.1020989418029785, "global_step": 184839, "epoch": 4400} {"train_loss": -6.964138984680176, "global_step": 184840, "epoch": 4400} {"train_loss": -7.13117960521153, "global_step": 184841, "epoch": 4400, "train/sim_max_reward_0": 0.8296414421935888, "train/sim_max_reward_1": 0.7881921726420772, "train/sim_max_reward_2": 0.6883534396843131, "train/sim_max_reward_3": 0.5190583909656944, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9393160065381704, "test/sim_max_reward_4400000": 0.21537802813938767, "test/sim_max_reward_4400001": 0.9743313955464867, "test/sim_max_reward_4400002": 0.938481293004986, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.20012465534294327, "test/sim_max_reward_4400006": 0.9812401714057694, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.9194974336087496, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9599288094161001, "test/sim_max_reward_4400014": 0.8390043407519954, "test/sim_max_reward_4400015": 0.07632915549814213, "test/sim_max_reward_4400016": 0.19190282710717693, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3016475376905988, "test/sim_max_reward_4400019": 0.9922991125923771, "test/sim_max_reward_4400020": 0.7819468736741674, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9585045602290877, "test/sim_max_reward_4400023": 0.9758711131915921, "test/sim_max_reward_4400024": 0.8887123387289603, "test/sim_max_reward_4400025": 0.26952290181453187, "test/sim_max_reward_4400026": 0.9398984855403352, "test/sim_max_reward_4400027": 0.009160913384822238, "test/sim_max_reward_4400028": 0.9810010454901624, "test/sim_max_reward_4400029": 0.9177515068803815, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 0.9393994478277788, "test/sim_max_reward_4400035": 0.9829181931545155, "test/sim_max_reward_4400036": 0.5263906922671705, "test/sim_max_reward_4400037": 0.8248237771204153, "test/sim_max_reward_4400038": 0.8740453557723811, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9733098501834843, "test/sim_max_reward_4400042": 0.531814110062273, "test/sim_max_reward_4400043": 0.989044532544386, "test/sim_max_reward_4400044": 0.8661673095733453, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.32187201747429334, "test/sim_max_reward_4400047": 0.9060732583936337, "test/sim_max_reward_4400048": 0.970132992113195, "test/sim_max_reward_4400049": 0.9511885815967231, "train/mean_score": 0.7940935753373073, "test/mean_score": 0.6762514703561834, "val_loss": 68707.5625} {"train_loss": -7.047553062438965, "global_step": 184842, "epoch": 4401} {"train_loss": -7.108362674713135, "global_step": 184843, "epoch": 4401} {"train_loss": -7.170074462890625, "global_step": 184844, "epoch": 4401} {"train_loss": -6.983184337615967, "global_step": 184845, "epoch": 4401} {"train_loss": -7.102705478668213, "global_step": 184846, "epoch": 4401} {"train_loss": -7.1228485107421875, "global_step": 184847, "epoch": 4401} {"train_loss": -6.9781060218811035, "global_step": 184848, "epoch": 4401} {"train_loss": -7.110973358154297, "global_step": 184849, "epoch": 4401} {"train_loss": -7.101162910461426, "global_step": 184850, "epoch": 4401} {"train_loss": -7.020453453063965, "global_step": 184851, "epoch": 4401} {"train_loss": -7.129261016845703, "global_step": 184852, "epoch": 4401} {"train_loss": -7.011570930480957, "global_step": 184853, "epoch": 4401} {"train_loss": -7.126764297485352, "global_step": 184854, "epoch": 4401} {"train_loss": -7.010369777679443, "global_step": 184855, "epoch": 4401} {"train_loss": -7.036559104919434, "global_step": 184856, "epoch": 4401} {"train_loss": -7.008491516113281, "global_step": 184857, "epoch": 4401} {"train_loss": -7.077182769775391, "global_step": 184858, "epoch": 4401} {"train_loss": -7.071734428405762, "global_step": 184859, "epoch": 4401} {"train_loss": -6.95490026473999, "global_step": 184860, "epoch": 4401} {"train_loss": -7.102374076843262, "global_step": 184861, "epoch": 4401} {"train_loss": -6.8809075355529785, "global_step": 184862, "epoch": 4401} {"train_loss": -7.102817535400391, "global_step": 184863, "epoch": 4401} {"train_loss": -6.984785556793213, "global_step": 184864, "epoch": 4401} {"train_loss": -7.034660339355469, "global_step": 184865, "epoch": 4401} {"train_loss": -6.972843647003174, "global_step": 184866, "epoch": 4401} {"train_loss": -6.936188697814941, "global_step": 184867, "epoch": 4401} {"train_loss": -6.987738609313965, "global_step": 184868, "epoch": 4401} {"train_loss": -6.972592830657959, "global_step": 184869, "epoch": 4401} {"train_loss": -6.858022689819336, "global_step": 184870, "epoch": 4401} {"train_loss": -6.8842692375183105, "global_step": 184871, "epoch": 4401} {"train_loss": -6.928705215454102, "global_step": 184872, "epoch": 4401} {"train_loss": -6.82049560546875, "global_step": 184873, "epoch": 4401} {"train_loss": -7.08847188949585, "global_step": 184874, "epoch": 4401} {"train_loss": -6.738519668579102, "global_step": 184875, "epoch": 4401} {"train_loss": -7.035572528839111, "global_step": 184876, "epoch": 4401} {"train_loss": -6.971016883850098, "global_step": 184877, "epoch": 4401} {"train_loss": -7.082444667816162, "global_step": 184878, "epoch": 4401} {"train_loss": -6.970497131347656, "global_step": 184879, "epoch": 4401} {"train_loss": -7.042507171630859, "global_step": 184880, "epoch": 4401} {"train_loss": -6.976027488708496, "global_step": 184881, "epoch": 4401} {"train_loss": -7.086304664611816, "global_step": 184882, "epoch": 4401} {"train_loss": -7.015848466328213, "global_step": 184883, "epoch": 4401, "val_loss": 68656.640625} {"train_loss": -7.066592216491699, "global_step": 184884, "epoch": 4402} {"train_loss": -6.952750205993652, "global_step": 184885, "epoch": 4402} {"train_loss": -7.1190643310546875, "global_step": 184886, "epoch": 4402} {"train_loss": -7.018586158752441, "global_step": 184887, "epoch": 4402} {"train_loss": -7.100319862365723, "global_step": 184888, "epoch": 4402} {"train_loss": -7.095836639404297, "global_step": 184889, "epoch": 4402} {"train_loss": -7.166041374206543, "global_step": 184890, "epoch": 4402} {"train_loss": -7.126360893249512, "global_step": 184891, "epoch": 4402} {"train_loss": -7.124131202697754, "global_step": 184892, "epoch": 4402} {"train_loss": -7.135924339294434, "global_step": 184893, "epoch": 4402} {"train_loss": -7.053839683532715, "global_step": 184894, "epoch": 4402} {"train_loss": -7.041667461395264, "global_step": 184895, "epoch": 4402} {"train_loss": -7.133007049560547, "global_step": 184896, "epoch": 4402} {"train_loss": -7.115601539611816, "global_step": 184897, "epoch": 4402} {"train_loss": -7.170650482177734, "global_step": 184898, "epoch": 4402} {"train_loss": -7.232743740081787, "global_step": 184899, "epoch": 4402} {"train_loss": -7.070521354675293, "global_step": 184900, "epoch": 4402} {"train_loss": -7.264463901519775, "global_step": 184901, "epoch": 4402} {"train_loss": -7.06684684753418, "global_step": 184902, "epoch": 4402} {"train_loss": -7.147164821624756, "global_step": 184903, "epoch": 4402} {"train_loss": -7.176462173461914, "global_step": 184904, "epoch": 4402} {"train_loss": -7.145533561706543, "global_step": 184905, "epoch": 4402} {"train_loss": -7.059986114501953, "global_step": 184906, "epoch": 4402} {"train_loss": -7.159853935241699, "global_step": 184907, "epoch": 4402} {"train_loss": -7.197637557983398, "global_step": 184908, "epoch": 4402} {"train_loss": -7.269517421722412, "global_step": 184909, "epoch": 4402} {"train_loss": -7.260381698608398, "global_step": 184910, "epoch": 4402} {"train_loss": -7.121370315551758, "global_step": 184911, "epoch": 4402} {"train_loss": -7.063314437866211, "global_step": 184912, "epoch": 4402} {"train_loss": -7.1640119552612305, "global_step": 184913, "epoch": 4402} {"train_loss": -7.202033042907715, "global_step": 184914, "epoch": 4402} {"train_loss": -7.1664276123046875, "global_step": 184915, "epoch": 4402} {"train_loss": -7.1331071853637695, "global_step": 184916, "epoch": 4402} {"train_loss": -6.984707832336426, "global_step": 184917, "epoch": 4402} {"train_loss": -7.126795768737793, "global_step": 184918, "epoch": 4402} {"train_loss": -7.170408725738525, "global_step": 184919, "epoch": 4402} {"train_loss": -7.217613220214844, "global_step": 184920, "epoch": 4402} {"train_loss": -7.2578444480896, "global_step": 184921, "epoch": 4402} {"train_loss": -7.221619129180908, "global_step": 184922, "epoch": 4402} {"train_loss": -7.071624755859375, "global_step": 184923, "epoch": 4402} {"train_loss": -7.024488925933838, "global_step": 184924, "epoch": 4402} {"train_loss": -7.129984787532261, "global_step": 184925, "epoch": 4402, "val_loss": 68811.796875} {"train_loss": -7.202705383300781, "global_step": 184926, "epoch": 4403} {"train_loss": -7.033380508422852, "global_step": 184927, "epoch": 4403} {"train_loss": -7.1082258224487305, "global_step": 184928, "epoch": 4403} {"train_loss": -7.097667694091797, "global_step": 184929, "epoch": 4403} {"train_loss": -7.053328514099121, "global_step": 184930, "epoch": 4403} {"train_loss": -7.015445232391357, "global_step": 184931, "epoch": 4403} {"train_loss": -7.0274553298950195, "global_step": 184932, "epoch": 4403} {"train_loss": -7.096622467041016, "global_step": 184933, "epoch": 4403} {"train_loss": -7.221855640411377, "global_step": 184934, "epoch": 4403} {"train_loss": -7.101303577423096, "global_step": 184935, "epoch": 4403} {"train_loss": -7.131820201873779, "global_step": 184936, "epoch": 4403} {"train_loss": -7.0736236572265625, "global_step": 184937, "epoch": 4403} {"train_loss": -7.1476616859436035, "global_step": 184938, "epoch": 4403} {"train_loss": -7.14219856262207, "global_step": 184939, "epoch": 4403} {"train_loss": -7.036276340484619, "global_step": 184940, "epoch": 4403} {"train_loss": -7.105107307434082, "global_step": 184941, "epoch": 4403} {"train_loss": -7.083617210388184, "global_step": 184942, "epoch": 4403} {"train_loss": -7.055622100830078, "global_step": 184943, "epoch": 4403} {"train_loss": -7.176663398742676, "global_step": 184944, "epoch": 4403} {"train_loss": -7.075591564178467, "global_step": 184945, "epoch": 4403} {"train_loss": -7.074138164520264, "global_step": 184946, "epoch": 4403} {"train_loss": -7.137728691101074, "global_step": 184947, "epoch": 4403} {"train_loss": -6.969367980957031, "global_step": 184948, "epoch": 4403} {"train_loss": -7.132064342498779, "global_step": 184949, "epoch": 4403} {"train_loss": -7.042672157287598, "global_step": 184950, "epoch": 4403} {"train_loss": -7.054070949554443, "global_step": 184951, "epoch": 4403} {"train_loss": -7.17673397064209, "global_step": 184952, "epoch": 4403} {"train_loss": -7.060134410858154, "global_step": 184953, "epoch": 4403} {"train_loss": -7.021206855773926, "global_step": 184954, "epoch": 4403} {"train_loss": -7.219663143157959, "global_step": 184955, "epoch": 4403} {"train_loss": -7.180703163146973, "global_step": 184956, "epoch": 4403} {"train_loss": -7.105539321899414, "global_step": 184957, "epoch": 4403} {"train_loss": -6.957322597503662, "global_step": 184958, "epoch": 4403} {"train_loss": -7.040631294250488, "global_step": 184959, "epoch": 4403} {"train_loss": -7.130958557128906, "global_step": 184960, "epoch": 4403} {"train_loss": -7.126233100891113, "global_step": 184961, "epoch": 4403} {"train_loss": -7.056432723999023, "global_step": 184962, "epoch": 4403} {"train_loss": -7.110018730163574, "global_step": 184963, "epoch": 4403} {"train_loss": -7.121782302856445, "global_step": 184964, "epoch": 4403} {"train_loss": -7.048624038696289, "global_step": 184965, "epoch": 4403} {"train_loss": -7.149038791656494, "global_step": 184966, "epoch": 4403} {"train_loss": -7.093595686412993, "global_step": 184967, "epoch": 4403, "val_loss": 68588.765625} {"train_loss": -7.059564590454102, "global_step": 184968, "epoch": 4404} {"train_loss": -7.131955146789551, "global_step": 184969, "epoch": 4404} {"train_loss": -7.185453414916992, "global_step": 184970, "epoch": 4404} {"train_loss": -7.125069618225098, "global_step": 184971, "epoch": 4404} {"train_loss": -7.063260078430176, "global_step": 184972, "epoch": 4404} {"train_loss": -7.008724212646484, "global_step": 184973, "epoch": 4404} {"train_loss": -6.970686912536621, "global_step": 184974, "epoch": 4404} {"train_loss": -7.068289279937744, "global_step": 184975, "epoch": 4404} {"train_loss": -7.214814186096191, "global_step": 184976, "epoch": 4404} {"train_loss": -7.013278484344482, "global_step": 184977, "epoch": 4404} {"train_loss": -6.904741287231445, "global_step": 184978, "epoch": 4404} {"train_loss": -6.977222442626953, "global_step": 184979, "epoch": 4404} {"train_loss": -7.0696120262146, "global_step": 184980, "epoch": 4404} {"train_loss": -6.857582092285156, "global_step": 184981, "epoch": 4404} {"train_loss": -7.03464412689209, "global_step": 184982, "epoch": 4404} {"train_loss": -6.880706787109375, "global_step": 184983, "epoch": 4404} {"train_loss": -6.965241432189941, "global_step": 184984, "epoch": 4404} {"train_loss": -7.035163879394531, "global_step": 184985, "epoch": 4404} {"train_loss": -6.808280944824219, "global_step": 184986, "epoch": 4404} {"train_loss": -7.059958457946777, "global_step": 184987, "epoch": 4404} {"train_loss": -6.8986616134643555, "global_step": 184988, "epoch": 4404} {"train_loss": -7.080662727355957, "global_step": 184989, "epoch": 4404} {"train_loss": -6.821527004241943, "global_step": 184990, "epoch": 4404} {"train_loss": -6.878039836883545, "global_step": 184991, "epoch": 4404} {"train_loss": -6.8139214515686035, "global_step": 184992, "epoch": 4404} {"train_loss": -6.99515962600708, "global_step": 184993, "epoch": 4404} {"train_loss": -6.826889991760254, "global_step": 184994, "epoch": 4404} {"train_loss": -6.91049861907959, "global_step": 184995, "epoch": 4404} {"train_loss": -6.943662643432617, "global_step": 184996, "epoch": 4404} {"train_loss": -6.86421012878418, "global_step": 184997, "epoch": 4404} {"train_loss": -7.007128715515137, "global_step": 184998, "epoch": 4404} {"train_loss": -6.961398124694824, "global_step": 184999, "epoch": 4404} {"train_loss": -6.99363899230957, "global_step": 185000, "epoch": 4404} {"train_loss": -6.99125862121582, "global_step": 185001, "epoch": 4404} {"train_loss": -6.985832214355469, "global_step": 185002, "epoch": 4404} {"train_loss": -7.149311065673828, "global_step": 185003, "epoch": 4404} {"train_loss": -7.006220817565918, "global_step": 185004, "epoch": 4404} {"train_loss": -7.01251220703125, "global_step": 185005, "epoch": 4404} {"train_loss": -7.0393805503845215, "global_step": 185006, "epoch": 4404} {"train_loss": -7.005674362182617, "global_step": 185007, "epoch": 4404} {"train_loss": -6.967189311981201, "global_step": 185008, "epoch": 4404} {"train_loss": -6.995049590156192, "global_step": 185009, "epoch": 4404, "val_loss": 68727.2421875} {"train_loss": -7.124388694763184, "global_step": 185010, "epoch": 4405} {"train_loss": -6.961097717285156, "global_step": 185011, "epoch": 4405} {"train_loss": -7.098255157470703, "global_step": 185012, "epoch": 4405} {"train_loss": -7.054664134979248, "global_step": 185013, "epoch": 4405} {"train_loss": -7.003873825073242, "global_step": 185014, "epoch": 4405} {"train_loss": -7.123750686645508, "global_step": 185015, "epoch": 4405} {"train_loss": -7.00188684463501, "global_step": 185016, "epoch": 4405} {"train_loss": -7.010207176208496, "global_step": 185017, "epoch": 4405} {"train_loss": -6.970390319824219, "global_step": 185018, "epoch": 4405} {"train_loss": -7.010520935058594, "global_step": 185019, "epoch": 4405} {"train_loss": -7.117938041687012, "global_step": 185020, "epoch": 4405} {"train_loss": -6.974336624145508, "global_step": 185021, "epoch": 4405} {"train_loss": -7.151037216186523, "global_step": 185022, "epoch": 4405} {"train_loss": -7.006757736206055, "global_step": 185023, "epoch": 4405} {"train_loss": -7.082601547241211, "global_step": 185024, "epoch": 4405} {"train_loss": -7.156970977783203, "global_step": 185025, "epoch": 4405} {"train_loss": -6.961090564727783, "global_step": 185026, "epoch": 4405} {"train_loss": -7.1034088134765625, "global_step": 185027, "epoch": 4405} {"train_loss": -6.99948787689209, "global_step": 185028, "epoch": 4405} {"train_loss": -6.973756790161133, "global_step": 185029, "epoch": 4405} {"train_loss": -7.062194347381592, "global_step": 185030, "epoch": 4405} {"train_loss": -7.115468502044678, "global_step": 185031, "epoch": 4405} {"train_loss": -7.228910446166992, "global_step": 185032, "epoch": 4405} {"train_loss": -7.1375226974487305, "global_step": 185033, "epoch": 4405} {"train_loss": -7.061165809631348, "global_step": 185034, "epoch": 4405} {"train_loss": -7.182596206665039, "global_step": 185035, "epoch": 4405} {"train_loss": -7.011710166931152, "global_step": 185036, "epoch": 4405} {"train_loss": -7.140185356140137, "global_step": 185037, "epoch": 4405} {"train_loss": -7.098142147064209, "global_step": 185038, "epoch": 4405} {"train_loss": -7.113112449645996, "global_step": 185039, "epoch": 4405} {"train_loss": -7.030948638916016, "global_step": 185040, "epoch": 4405} {"train_loss": -7.11541748046875, "global_step": 185041, "epoch": 4405} {"train_loss": -7.049680233001709, "global_step": 185042, "epoch": 4405} {"train_loss": -7.11150598526001, "global_step": 185043, "epoch": 4405} {"train_loss": -7.213380813598633, "global_step": 185044, "epoch": 4405} {"train_loss": -7.151821136474609, "global_step": 185045, "epoch": 4405} {"train_loss": -7.140750885009766, "global_step": 185046, "epoch": 4405} {"train_loss": -6.99561071395874, "global_step": 185047, "epoch": 4405} {"train_loss": -7.1088361740112305, "global_step": 185048, "epoch": 4405} {"train_loss": -7.115754127502441, "global_step": 185049, "epoch": 4405} {"train_loss": -7.013214111328125, "global_step": 185050, "epoch": 4405} {"train_loss": -7.077873457045782, "global_step": 185051, "epoch": 4405, "val_loss": 68833.2578125} {"train_loss": -7.061394691467285, "global_step": 185052, "epoch": 4406} {"train_loss": -7.142632961273193, "global_step": 185053, "epoch": 4406} {"train_loss": -7.236362457275391, "global_step": 185054, "epoch": 4406} {"train_loss": -6.956611156463623, "global_step": 185055, "epoch": 4406} {"train_loss": -7.17205810546875, "global_step": 185056, "epoch": 4406} {"train_loss": -7.034409523010254, "global_step": 185057, "epoch": 4406} {"train_loss": -7.1595964431762695, "global_step": 185058, "epoch": 4406} {"train_loss": -7.076000213623047, "global_step": 185059, "epoch": 4406} {"train_loss": -7.154613494873047, "global_step": 185060, "epoch": 4406} {"train_loss": -7.18310546875, "global_step": 185061, "epoch": 4406} {"train_loss": -7.022948741912842, "global_step": 185062, "epoch": 4406} {"train_loss": -7.235466003417969, "global_step": 185063, "epoch": 4406} {"train_loss": -7.144781112670898, "global_step": 185064, "epoch": 4406} {"train_loss": -7.0305633544921875, "global_step": 185065, "epoch": 4406} {"train_loss": -7.068633079528809, "global_step": 185066, "epoch": 4406} {"train_loss": -7.038637161254883, "global_step": 185067, "epoch": 4406} {"train_loss": -7.090954303741455, "global_step": 185068, "epoch": 4406} {"train_loss": -7.050373077392578, "global_step": 185069, "epoch": 4406} {"train_loss": -6.9804863929748535, "global_step": 185070, "epoch": 4406} {"train_loss": -7.133262634277344, "global_step": 185071, "epoch": 4406} {"train_loss": -7.080310821533203, "global_step": 185072, "epoch": 4406} {"train_loss": -7.102471828460693, "global_step": 185073, "epoch": 4406} {"train_loss": -6.958740234375, "global_step": 185074, "epoch": 4406} {"train_loss": -7.166663646697998, "global_step": 185075, "epoch": 4406} {"train_loss": -7.186583042144775, "global_step": 185076, "epoch": 4406} {"train_loss": -7.17930793762207, "global_step": 185077, "epoch": 4406} {"train_loss": -7.065881729125977, "global_step": 185078, "epoch": 4406} {"train_loss": -7.070402145385742, "global_step": 185079, "epoch": 4406} {"train_loss": -7.143420219421387, "global_step": 185080, "epoch": 4406} {"train_loss": -7.022486209869385, "global_step": 185081, "epoch": 4406} {"train_loss": -7.1953654289245605, "global_step": 185082, "epoch": 4406} {"train_loss": -7.038550853729248, "global_step": 185083, "epoch": 4406} {"train_loss": -7.1096415519714355, "global_step": 185084, "epoch": 4406} {"train_loss": -7.158215522766113, "global_step": 185085, "epoch": 4406} {"train_loss": -7.1323466300964355, "global_step": 185086, "epoch": 4406} {"train_loss": -7.250350475311279, "global_step": 185087, "epoch": 4406} {"train_loss": -7.080819129943848, "global_step": 185088, "epoch": 4406} {"train_loss": -7.17424201965332, "global_step": 185089, "epoch": 4406} {"train_loss": -7.123442649841309, "global_step": 185090, "epoch": 4406} {"train_loss": -7.12470817565918, "global_step": 185091, "epoch": 4406} {"train_loss": -7.142533779144287, "global_step": 185092, "epoch": 4406} {"train_loss": -7.1076896871839255, "global_step": 185093, "epoch": 4406, "val_loss": 68802.015625} {"train_loss": -7.168885231018066, "global_step": 185094, "epoch": 4407} {"train_loss": -7.148244857788086, "global_step": 185095, "epoch": 4407} {"train_loss": -7.074853420257568, "global_step": 185096, "epoch": 4407} {"train_loss": -7.137495040893555, "global_step": 185097, "epoch": 4407} {"train_loss": -7.001723289489746, "global_step": 185098, "epoch": 4407} {"train_loss": -7.0661163330078125, "global_step": 185099, "epoch": 4407} {"train_loss": -6.919604301452637, "global_step": 185100, "epoch": 4407} {"train_loss": -7.119276523590088, "global_step": 185101, "epoch": 4407} {"train_loss": -7.081612586975098, "global_step": 185102, "epoch": 4407} {"train_loss": -7.054533958435059, "global_step": 185103, "epoch": 4407} {"train_loss": -7.10019588470459, "global_step": 185104, "epoch": 4407} {"train_loss": -7.172159194946289, "global_step": 185105, "epoch": 4407} {"train_loss": -7.179629325866699, "global_step": 185106, "epoch": 4407} {"train_loss": -7.1470112800598145, "global_step": 185107, "epoch": 4407} {"train_loss": -7.172015190124512, "global_step": 185108, "epoch": 4407} {"train_loss": -7.121942520141602, "global_step": 185109, "epoch": 4407} {"train_loss": -7.188462257385254, "global_step": 185110, "epoch": 4407} {"train_loss": -7.183589458465576, "global_step": 185111, "epoch": 4407} {"train_loss": -7.181666374206543, "global_step": 185112, "epoch": 4407} {"train_loss": -7.115441799163818, "global_step": 185113, "epoch": 4407} {"train_loss": -7.136720657348633, "global_step": 185114, "epoch": 4407} {"train_loss": -7.156514644622803, "global_step": 185115, "epoch": 4407} {"train_loss": -7.133183479309082, "global_step": 185116, "epoch": 4407} {"train_loss": -7.134836196899414, "global_step": 185117, "epoch": 4407} {"train_loss": -7.114197731018066, "global_step": 185118, "epoch": 4407} {"train_loss": -7.087010860443115, "global_step": 185119, "epoch": 4407} {"train_loss": -7.220810890197754, "global_step": 185120, "epoch": 4407} {"train_loss": -7.070287704467773, "global_step": 185121, "epoch": 4407} {"train_loss": -6.988054275512695, "global_step": 185122, "epoch": 4407} {"train_loss": -7.200772285461426, "global_step": 185123, "epoch": 4407} {"train_loss": -7.0698699951171875, "global_step": 185124, "epoch": 4407} {"train_loss": -7.185601711273193, "global_step": 185125, "epoch": 4407} {"train_loss": -7.176019191741943, "global_step": 185126, "epoch": 4407} {"train_loss": -7.150696754455566, "global_step": 185127, "epoch": 4407} {"train_loss": -7.114230155944824, "global_step": 185128, "epoch": 4407} {"train_loss": -7.0345611572265625, "global_step": 185129, "epoch": 4407} {"train_loss": -7.212339401245117, "global_step": 185130, "epoch": 4407} {"train_loss": -7.125546455383301, "global_step": 185131, "epoch": 4407} {"train_loss": -7.145317077636719, "global_step": 185132, "epoch": 4407} {"train_loss": -7.014692783355713, "global_step": 185133, "epoch": 4407} {"train_loss": -7.282311916351318, "global_step": 185134, "epoch": 4407} {"train_loss": -7.123762459982009, "global_step": 185135, "epoch": 4407, "val_loss": 68911.6015625} {"train_loss": -7.081589698791504, "global_step": 185136, "epoch": 4408} {"train_loss": -7.117813587188721, "global_step": 185137, "epoch": 4408} {"train_loss": -7.095067024230957, "global_step": 185138, "epoch": 4408} {"train_loss": -7.105579376220703, "global_step": 185139, "epoch": 4408} {"train_loss": -7.180713176727295, "global_step": 185140, "epoch": 4408} {"train_loss": -7.13217830657959, "global_step": 185141, "epoch": 4408} {"train_loss": -7.150903701782227, "global_step": 185142, "epoch": 4408} {"train_loss": -7.179965019226074, "global_step": 185143, "epoch": 4408} {"train_loss": -7.149799346923828, "global_step": 185144, "epoch": 4408} {"train_loss": -7.110741138458252, "global_step": 185145, "epoch": 4408} {"train_loss": -7.147526264190674, "global_step": 185146, "epoch": 4408} {"train_loss": -6.991537094116211, "global_step": 185147, "epoch": 4408} {"train_loss": -7.140265464782715, "global_step": 185148, "epoch": 4408} {"train_loss": -7.12960147857666, "global_step": 185149, "epoch": 4408} {"train_loss": -7.198075294494629, "global_step": 185150, "epoch": 4408} {"train_loss": -7.098728656768799, "global_step": 185151, "epoch": 4408} {"train_loss": -7.215635776519775, "global_step": 185152, "epoch": 4408} {"train_loss": -7.243256568908691, "global_step": 185153, "epoch": 4408} {"train_loss": -7.214052677154541, "global_step": 185154, "epoch": 4408} {"train_loss": -7.043515205383301, "global_step": 185155, "epoch": 4408} {"train_loss": -7.074567794799805, "global_step": 185156, "epoch": 4408} {"train_loss": -7.033299446105957, "global_step": 185157, "epoch": 4408} {"train_loss": -7.129652976989746, "global_step": 185158, "epoch": 4408} {"train_loss": -6.888909339904785, "global_step": 185159, "epoch": 4408} {"train_loss": -7.093907833099365, "global_step": 185160, "epoch": 4408} {"train_loss": -7.029618263244629, "global_step": 185161, "epoch": 4408} {"train_loss": -6.841339111328125, "global_step": 185162, "epoch": 4408} {"train_loss": -7.1302642822265625, "global_step": 185163, "epoch": 4408} {"train_loss": -7.08896541595459, "global_step": 185164, "epoch": 4408} {"train_loss": -6.85931396484375, "global_step": 185165, "epoch": 4408} {"train_loss": -7.174001216888428, "global_step": 185166, "epoch": 4408} {"train_loss": -6.810922622680664, "global_step": 185167, "epoch": 4408} {"train_loss": -7.107236862182617, "global_step": 185168, "epoch": 4408} {"train_loss": -6.9159040451049805, "global_step": 185169, "epoch": 4408} {"train_loss": -6.896033763885498, "global_step": 185170, "epoch": 4408} {"train_loss": -7.0779643058776855, "global_step": 185171, "epoch": 4408} {"train_loss": -6.899303436279297, "global_step": 185172, "epoch": 4408} {"train_loss": -7.052959442138672, "global_step": 185173, "epoch": 4408} {"train_loss": -6.861396789550781, "global_step": 185174, "epoch": 4408} {"train_loss": -7.073336601257324, "global_step": 185175, "epoch": 4408} {"train_loss": -6.971936225891113, "global_step": 185176, "epoch": 4408} {"train_loss": -7.067768710000174, "global_step": 185177, "epoch": 4408, "val_loss": 68841.9453125} {"train_loss": -7.066485404968262, "global_step": 185178, "epoch": 4409} {"train_loss": -7.1332478523254395, "global_step": 185179, "epoch": 4409} {"train_loss": -7.1187615394592285, "global_step": 185180, "epoch": 4409} {"train_loss": -7.078627586364746, "global_step": 185181, "epoch": 4409} {"train_loss": -6.951205730438232, "global_step": 185182, "epoch": 4409} {"train_loss": -7.115344524383545, "global_step": 185183, "epoch": 4409} {"train_loss": -7.112354278564453, "global_step": 185184, "epoch": 4409} {"train_loss": -7.077354431152344, "global_step": 185185, "epoch": 4409} {"train_loss": -7.1080780029296875, "global_step": 185186, "epoch": 4409} {"train_loss": -7.15631103515625, "global_step": 185187, "epoch": 4409} {"train_loss": -7.233068466186523, "global_step": 185188, "epoch": 4409} {"train_loss": -7.171142578125, "global_step": 185189, "epoch": 4409} {"train_loss": -7.246913909912109, "global_step": 185190, "epoch": 4409} {"train_loss": -7.265488624572754, "global_step": 185191, "epoch": 4409} {"train_loss": -7.152740478515625, "global_step": 185192, "epoch": 4409} {"train_loss": -7.111278533935547, "global_step": 185193, "epoch": 4409} {"train_loss": -7.186662673950195, "global_step": 185194, "epoch": 4409} {"train_loss": -7.095000743865967, "global_step": 185195, "epoch": 4409} {"train_loss": -7.014692306518555, "global_step": 185196, "epoch": 4409} {"train_loss": -7.0685625076293945, "global_step": 185197, "epoch": 4409} {"train_loss": -7.079141616821289, "global_step": 185198, "epoch": 4409} {"train_loss": -7.047430992126465, "global_step": 185199, "epoch": 4409} {"train_loss": -7.092793941497803, "global_step": 185200, "epoch": 4409} {"train_loss": -7.056941986083984, "global_step": 185201, "epoch": 4409} {"train_loss": -7.001040458679199, "global_step": 185202, "epoch": 4409} {"train_loss": -7.256495475769043, "global_step": 185203, "epoch": 4409} {"train_loss": -7.126769065856934, "global_step": 185204, "epoch": 4409} {"train_loss": -6.995988368988037, "global_step": 185205, "epoch": 4409} {"train_loss": -7.09051513671875, "global_step": 185206, "epoch": 4409} {"train_loss": -7.109883785247803, "global_step": 185207, "epoch": 4409} {"train_loss": -7.113280296325684, "global_step": 185208, "epoch": 4409} {"train_loss": -7.077265739440918, "global_step": 185209, "epoch": 4409} {"train_loss": -7.186550140380859, "global_step": 185210, "epoch": 4409} {"train_loss": -7.142160415649414, "global_step": 185211, "epoch": 4409} {"train_loss": -7.092164993286133, "global_step": 185212, "epoch": 4409} {"train_loss": -7.1361494064331055, "global_step": 185213, "epoch": 4409} {"train_loss": -7.160292148590088, "global_step": 185214, "epoch": 4409} {"train_loss": -7.102963447570801, "global_step": 185215, "epoch": 4409} {"train_loss": -7.16865348815918, "global_step": 185216, "epoch": 4409} {"train_loss": -7.089728832244873, "global_step": 185217, "epoch": 4409} {"train_loss": -7.2151384353637695, "global_step": 185218, "epoch": 4409} {"train_loss": -7.116654044105893, "global_step": 185219, "epoch": 4409, "val_loss": 68839.09375} {"train_loss": -7.215302467346191, "global_step": 185220, "epoch": 4410} {"train_loss": -7.17073917388916, "global_step": 185221, "epoch": 4410} {"train_loss": -7.146008014678955, "global_step": 185222, "epoch": 4410} {"train_loss": -7.219285011291504, "global_step": 185223, "epoch": 4410} {"train_loss": -7.126453399658203, "global_step": 185224, "epoch": 4410} {"train_loss": -7.129263877868652, "global_step": 185225, "epoch": 4410} {"train_loss": -7.19140625, "global_step": 185226, "epoch": 4410} {"train_loss": -7.174098014831543, "global_step": 185227, "epoch": 4410} {"train_loss": -7.129438400268555, "global_step": 185228, "epoch": 4410} {"train_loss": -7.223366737365723, "global_step": 185229, "epoch": 4410} {"train_loss": -7.1073408126831055, "global_step": 185230, "epoch": 4410} {"train_loss": -7.122246742248535, "global_step": 185231, "epoch": 4410} {"train_loss": -7.187566757202148, "global_step": 185232, "epoch": 4410} {"train_loss": -7.041990280151367, "global_step": 185233, "epoch": 4410} {"train_loss": -7.114617347717285, "global_step": 185234, "epoch": 4410} {"train_loss": -7.183248043060303, "global_step": 185235, "epoch": 4410} {"train_loss": -7.114724159240723, "global_step": 185236, "epoch": 4410} {"train_loss": -7.154351711273193, "global_step": 185237, "epoch": 4410} {"train_loss": -7.141182899475098, "global_step": 185238, "epoch": 4410} {"train_loss": -7.104453086853027, "global_step": 185239, "epoch": 4410} {"train_loss": -7.128539085388184, "global_step": 185240, "epoch": 4410} {"train_loss": -7.217410087585449, "global_step": 185241, "epoch": 4410} {"train_loss": -7.198677062988281, "global_step": 185242, "epoch": 4410} {"train_loss": -7.164417266845703, "global_step": 185243, "epoch": 4410} {"train_loss": -7.129692077636719, "global_step": 185244, "epoch": 4410} {"train_loss": -7.1029229164123535, "global_step": 185245, "epoch": 4410} {"train_loss": -7.229152679443359, "global_step": 185246, "epoch": 4410} {"train_loss": -7.074467658996582, "global_step": 185247, "epoch": 4410} {"train_loss": -7.2214202880859375, "global_step": 185248, "epoch": 4410} {"train_loss": -7.113286018371582, "global_step": 185249, "epoch": 4410} {"train_loss": -7.053990364074707, "global_step": 185250, "epoch": 4410} {"train_loss": -7.159277439117432, "global_step": 185251, "epoch": 4410} {"train_loss": -7.103037357330322, "global_step": 185252, "epoch": 4410} {"train_loss": -7.111634731292725, "global_step": 185253, "epoch": 4410} {"train_loss": -7.190315246582031, "global_step": 185254, "epoch": 4410} {"train_loss": -7.202131271362305, "global_step": 185255, "epoch": 4410} {"train_loss": -7.219762325286865, "global_step": 185256, "epoch": 4410} {"train_loss": -7.193120002746582, "global_step": 185257, "epoch": 4410} {"train_loss": -7.282222747802734, "global_step": 185258, "epoch": 4410} {"train_loss": -7.157046318054199, "global_step": 185259, "epoch": 4410} {"train_loss": -7.158618927001953, "global_step": 185260, "epoch": 4410} {"train_loss": -7.157508271081107, "global_step": 185261, "epoch": 4410, "val_loss": 68813.109375} {"train_loss": -7.251849174499512, "global_step": 185262, "epoch": 4411} {"train_loss": -7.043731689453125, "global_step": 185263, "epoch": 4411} {"train_loss": -7.12681770324707, "global_step": 185264, "epoch": 4411} {"train_loss": -7.240180492401123, "global_step": 185265, "epoch": 4411} {"train_loss": -7.167976379394531, "global_step": 185266, "epoch": 4411} {"train_loss": -7.178648948669434, "global_step": 185267, "epoch": 4411} {"train_loss": -7.148322582244873, "global_step": 185268, "epoch": 4411} {"train_loss": -7.164281845092773, "global_step": 185269, "epoch": 4411} {"train_loss": -7.223711967468262, "global_step": 185270, "epoch": 4411} {"train_loss": -7.165160655975342, "global_step": 185271, "epoch": 4411} {"train_loss": -7.168126106262207, "global_step": 185272, "epoch": 4411} {"train_loss": -7.166107177734375, "global_step": 185273, "epoch": 4411} {"train_loss": -7.025593280792236, "global_step": 185274, "epoch": 4411} {"train_loss": -7.143989562988281, "global_step": 185275, "epoch": 4411} {"train_loss": -7.165661334991455, "global_step": 185276, "epoch": 4411} {"train_loss": -7.094743728637695, "global_step": 185277, "epoch": 4411} {"train_loss": -7.228314399719238, "global_step": 185278, "epoch": 4411} {"train_loss": -7.083713531494141, "global_step": 185279, "epoch": 4411} {"train_loss": -7.110146522521973, "global_step": 185280, "epoch": 4411} {"train_loss": -7.094427108764648, "global_step": 185281, "epoch": 4411} {"train_loss": -6.979892730712891, "global_step": 185282, "epoch": 4411} {"train_loss": -7.086642265319824, "global_step": 185283, "epoch": 4411} {"train_loss": -7.059429168701172, "global_step": 185284, "epoch": 4411} {"train_loss": -6.955425262451172, "global_step": 185285, "epoch": 4411} {"train_loss": -7.003223419189453, "global_step": 185286, "epoch": 4411} {"train_loss": -7.037569046020508, "global_step": 185287, "epoch": 4411} {"train_loss": -7.059366703033447, "global_step": 185288, "epoch": 4411} {"train_loss": -7.01666259765625, "global_step": 185289, "epoch": 4411} {"train_loss": -7.215254306793213, "global_step": 185290, "epoch": 4411} {"train_loss": -7.0557541847229, "global_step": 185291, "epoch": 4411} {"train_loss": -7.169604301452637, "global_step": 185292, "epoch": 4411} {"train_loss": -7.040103435516357, "global_step": 185293, "epoch": 4411} {"train_loss": -6.93324089050293, "global_step": 185294, "epoch": 4411} {"train_loss": -7.066325664520264, "global_step": 185295, "epoch": 4411} {"train_loss": -7.157075881958008, "global_step": 185296, "epoch": 4411} {"train_loss": -7.195663928985596, "global_step": 185297, "epoch": 4411} {"train_loss": -7.114352226257324, "global_step": 185298, "epoch": 4411} {"train_loss": -7.046970367431641, "global_step": 185299, "epoch": 4411} {"train_loss": -7.201396942138672, "global_step": 185300, "epoch": 4411} {"train_loss": -7.144565582275391, "global_step": 185301, "epoch": 4411} {"train_loss": -7.138469696044922, "global_step": 185302, "epoch": 4411} {"train_loss": -7.114451612745013, "global_step": 185303, "epoch": 4411, "val_loss": 68821.71875} {"train_loss": -7.089461326599121, "global_step": 185304, "epoch": 4412} {"train_loss": -7.067666530609131, "global_step": 185305, "epoch": 4412} {"train_loss": -7.114468574523926, "global_step": 185306, "epoch": 4412} {"train_loss": -7.122299671173096, "global_step": 185307, "epoch": 4412} {"train_loss": -7.144608497619629, "global_step": 185308, "epoch": 4412} {"train_loss": -7.04544734954834, "global_step": 185309, "epoch": 4412} {"train_loss": -7.129279613494873, "global_step": 185310, "epoch": 4412} {"train_loss": -7.146219253540039, "global_step": 185311, "epoch": 4412} {"train_loss": -7.126885414123535, "global_step": 185312, "epoch": 4412} {"train_loss": -7.220718860626221, "global_step": 185313, "epoch": 4412} {"train_loss": -7.006089210510254, "global_step": 185314, "epoch": 4412} {"train_loss": -7.141122817993164, "global_step": 185315, "epoch": 4412} {"train_loss": -7.177542209625244, "global_step": 185316, "epoch": 4412} {"train_loss": -7.151400566101074, "global_step": 185317, "epoch": 4412} {"train_loss": -7.198572158813477, "global_step": 185318, "epoch": 4412} {"train_loss": -7.034772872924805, "global_step": 185319, "epoch": 4412} {"train_loss": -7.186681747436523, "global_step": 185320, "epoch": 4412} {"train_loss": -7.071025848388672, "global_step": 185321, "epoch": 4412} {"train_loss": -7.120357513427734, "global_step": 185322, "epoch": 4412} {"train_loss": -7.201699256896973, "global_step": 185323, "epoch": 4412} {"train_loss": -7.077006816864014, "global_step": 185324, "epoch": 4412} {"train_loss": -7.161492347717285, "global_step": 185325, "epoch": 4412} {"train_loss": -7.075596332550049, "global_step": 185326, "epoch": 4412} {"train_loss": -7.234921455383301, "global_step": 185327, "epoch": 4412} {"train_loss": -7.182248115539551, "global_step": 185328, "epoch": 4412} {"train_loss": -7.151124954223633, "global_step": 185329, "epoch": 4412} {"train_loss": -7.186286449432373, "global_step": 185330, "epoch": 4412} {"train_loss": -7.234663963317871, "global_step": 185331, "epoch": 4412} {"train_loss": -7.199038505554199, "global_step": 185332, "epoch": 4412} {"train_loss": -7.094784736633301, "global_step": 185333, "epoch": 4412} {"train_loss": -7.188792705535889, "global_step": 185334, "epoch": 4412} {"train_loss": -7.062746524810791, "global_step": 185335, "epoch": 4412} {"train_loss": -7.133599281311035, "global_step": 185336, "epoch": 4412} {"train_loss": -7.150246620178223, "global_step": 185337, "epoch": 4412} {"train_loss": -7.193336486816406, "global_step": 185338, "epoch": 4412} {"train_loss": -7.130724906921387, "global_step": 185339, "epoch": 4412} {"train_loss": -7.245668411254883, "global_step": 185340, "epoch": 4412} {"train_loss": -7.071174621582031, "global_step": 185341, "epoch": 4412} {"train_loss": -7.0707173347473145, "global_step": 185342, "epoch": 4412} {"train_loss": -7.095271110534668, "global_step": 185343, "epoch": 4412} {"train_loss": -6.979681968688965, "global_step": 185344, "epoch": 4412} {"train_loss": -7.129935684658232, "global_step": 185345, "epoch": 4412, "val_loss": 68806.46875} {"train_loss": -7.157630920410156, "global_step": 185346, "epoch": 4413} {"train_loss": -7.187619209289551, "global_step": 185347, "epoch": 4413} {"train_loss": -7.054174900054932, "global_step": 185348, "epoch": 4413} {"train_loss": -7.036389350891113, "global_step": 185349, "epoch": 4413} {"train_loss": -7.107098579406738, "global_step": 185350, "epoch": 4413} {"train_loss": -7.057584762573242, "global_step": 185351, "epoch": 4413} {"train_loss": -7.043339252471924, "global_step": 185352, "epoch": 4413} {"train_loss": -7.1686530113220215, "global_step": 185353, "epoch": 4413} {"train_loss": -7.113293647766113, "global_step": 185354, "epoch": 4413} {"train_loss": -7.068543434143066, "global_step": 185355, "epoch": 4413} {"train_loss": -7.140427112579346, "global_step": 185356, "epoch": 4413} {"train_loss": -7.233941078186035, "global_step": 185357, "epoch": 4413} {"train_loss": -7.153234481811523, "global_step": 185358, "epoch": 4413} {"train_loss": -7.100069999694824, "global_step": 185359, "epoch": 4413} {"train_loss": -6.977334499359131, "global_step": 185360, "epoch": 4413} {"train_loss": -7.028902053833008, "global_step": 185361, "epoch": 4413} {"train_loss": -7.0783796310424805, "global_step": 185362, "epoch": 4413} {"train_loss": -7.0336103439331055, "global_step": 185363, "epoch": 4413} {"train_loss": -7.019521713256836, "global_step": 185364, "epoch": 4413} {"train_loss": -7.03492546081543, "global_step": 185365, "epoch": 4413} {"train_loss": -6.9812774658203125, "global_step": 185366, "epoch": 4413} {"train_loss": -7.066789627075195, "global_step": 185367, "epoch": 4413} {"train_loss": -7.130608558654785, "global_step": 185368, "epoch": 4413} {"train_loss": -7.0402421951293945, "global_step": 185369, "epoch": 4413} {"train_loss": -7.098611354827881, "global_step": 185370, "epoch": 4413} {"train_loss": -7.092640399932861, "global_step": 185371, "epoch": 4413} {"train_loss": -7.043682098388672, "global_step": 185372, "epoch": 4413} {"train_loss": -7.057265758514404, "global_step": 185373, "epoch": 4413} {"train_loss": -7.041261672973633, "global_step": 185374, "epoch": 4413} {"train_loss": -6.8076252937316895, "global_step": 185375, "epoch": 4413} {"train_loss": -7.0362091064453125, "global_step": 185376, "epoch": 4413} {"train_loss": -7.0050811767578125, "global_step": 185377, "epoch": 4413} {"train_loss": -7.068135738372803, "global_step": 185378, "epoch": 4413} {"train_loss": -7.103220462799072, "global_step": 185379, "epoch": 4413} {"train_loss": -6.9762468338012695, "global_step": 185380, "epoch": 4413} {"train_loss": -7.15285587310791, "global_step": 185381, "epoch": 4413} {"train_loss": -7.188706874847412, "global_step": 185382, "epoch": 4413} {"train_loss": -7.205491065979004, "global_step": 185383, "epoch": 4413} {"train_loss": -7.054018020629883, "global_step": 185384, "epoch": 4413} {"train_loss": -7.039794921875, "global_step": 185385, "epoch": 4413} {"train_loss": -7.151259899139404, "global_step": 185386, "epoch": 4413} {"train_loss": -7.074703409558251, "global_step": 185387, "epoch": 4413, "val_loss": 68674.859375} {"train_loss": -7.190829277038574, "global_step": 185388, "epoch": 4414} {"train_loss": -7.062413215637207, "global_step": 185389, "epoch": 4414} {"train_loss": -7.114140510559082, "global_step": 185390, "epoch": 4414} {"train_loss": -6.934043884277344, "global_step": 185391, "epoch": 4414} {"train_loss": -7.0933942794799805, "global_step": 185392, "epoch": 4414} {"train_loss": -7.0831756591796875, "global_step": 185393, "epoch": 4414} {"train_loss": -7.073371410369873, "global_step": 185394, "epoch": 4414} {"train_loss": -7.114764213562012, "global_step": 185395, "epoch": 4414} {"train_loss": -7.022824764251709, "global_step": 185396, "epoch": 4414} {"train_loss": -7.201557636260986, "global_step": 185397, "epoch": 4414} {"train_loss": -7.131781578063965, "global_step": 185398, "epoch": 4414} {"train_loss": -7.086558818817139, "global_step": 185399, "epoch": 4414} {"train_loss": -7.012543678283691, "global_step": 185400, "epoch": 4414} {"train_loss": -6.975257396697998, "global_step": 185401, "epoch": 4414} {"train_loss": -7.152923583984375, "global_step": 185402, "epoch": 4414} {"train_loss": -7.1685333251953125, "global_step": 185403, "epoch": 4414} {"train_loss": -7.030704975128174, "global_step": 185404, "epoch": 4414} {"train_loss": -7.151890277862549, "global_step": 185405, "epoch": 4414} {"train_loss": -7.152976036071777, "global_step": 185406, "epoch": 4414} {"train_loss": -7.144201278686523, "global_step": 185407, "epoch": 4414} {"train_loss": -7.1016340255737305, "global_step": 185408, "epoch": 4414} {"train_loss": -7.150465965270996, "global_step": 185409, "epoch": 4414} {"train_loss": -7.0374555587768555, "global_step": 185410, "epoch": 4414} {"train_loss": -7.086442947387695, "global_step": 185411, "epoch": 4414} {"train_loss": -7.127606391906738, "global_step": 185412, "epoch": 4414} {"train_loss": -7.123620510101318, "global_step": 185413, "epoch": 4414} {"train_loss": -7.166278839111328, "global_step": 185414, "epoch": 4414} {"train_loss": -7.156805038452148, "global_step": 185415, "epoch": 4414} {"train_loss": -7.052865982055664, "global_step": 185416, "epoch": 4414} {"train_loss": -7.096116542816162, "global_step": 185417, "epoch": 4414} {"train_loss": -7.069779396057129, "global_step": 185418, "epoch": 4414} {"train_loss": -7.056161880493164, "global_step": 185419, "epoch": 4414} {"train_loss": -7.118077278137207, "global_step": 185420, "epoch": 4414} {"train_loss": -7.1729278564453125, "global_step": 185421, "epoch": 4414} {"train_loss": -7.074700832366943, "global_step": 185422, "epoch": 4414} {"train_loss": -7.093352317810059, "global_step": 185423, "epoch": 4414} {"train_loss": -7.018488883972168, "global_step": 185424, "epoch": 4414} {"train_loss": -7.135478496551514, "global_step": 185425, "epoch": 4414} {"train_loss": -7.097844123840332, "global_step": 185426, "epoch": 4414} {"train_loss": -7.096549034118652, "global_step": 185427, "epoch": 4414} {"train_loss": -6.9533467292785645, "global_step": 185428, "epoch": 4414} {"train_loss": -7.091448954173496, "global_step": 185429, "epoch": 4414, "val_loss": 68911.1484375} {"train_loss": -7.001195907592773, "global_step": 185430, "epoch": 4415} {"train_loss": -7.114156246185303, "global_step": 185431, "epoch": 4415} {"train_loss": -7.034881591796875, "global_step": 185432, "epoch": 4415} {"train_loss": -7.08973503112793, "global_step": 185433, "epoch": 4415} {"train_loss": -7.013604640960693, "global_step": 185434, "epoch": 4415} {"train_loss": -7.033769607543945, "global_step": 185435, "epoch": 4415} {"train_loss": -7.252343654632568, "global_step": 185436, "epoch": 4415} {"train_loss": -7.031091690063477, "global_step": 185437, "epoch": 4415} {"train_loss": -7.058518409729004, "global_step": 185438, "epoch": 4415} {"train_loss": -7.067224025726318, "global_step": 185439, "epoch": 4415} {"train_loss": -7.137205600738525, "global_step": 185440, "epoch": 4415} {"train_loss": -7.216852188110352, "global_step": 185441, "epoch": 4415} {"train_loss": -7.147091388702393, "global_step": 185442, "epoch": 4415} {"train_loss": -7.081263542175293, "global_step": 185443, "epoch": 4415} {"train_loss": -7.178920745849609, "global_step": 185444, "epoch": 4415} {"train_loss": -7.207067489624023, "global_step": 185445, "epoch": 4415} {"train_loss": -7.166420936584473, "global_step": 185446, "epoch": 4415} {"train_loss": -7.07076358795166, "global_step": 185447, "epoch": 4415} {"train_loss": -7.02142858505249, "global_step": 185448, "epoch": 4415} {"train_loss": -7.1565141677856445, "global_step": 185449, "epoch": 4415} {"train_loss": -7.111697196960449, "global_step": 185450, "epoch": 4415} {"train_loss": -7.046867370605469, "global_step": 185451, "epoch": 4415} {"train_loss": -7.146064758300781, "global_step": 185452, "epoch": 4415} {"train_loss": -7.146190643310547, "global_step": 185453, "epoch": 4415} {"train_loss": -7.0467305183410645, "global_step": 185454, "epoch": 4415} {"train_loss": -7.162641525268555, "global_step": 185455, "epoch": 4415} {"train_loss": -7.133498191833496, "global_step": 185456, "epoch": 4415} {"train_loss": -7.1789398193359375, "global_step": 185457, "epoch": 4415} {"train_loss": -6.987447261810303, "global_step": 185458, "epoch": 4415} {"train_loss": -7.164421081542969, "global_step": 185459, "epoch": 4415} {"train_loss": -7.053389549255371, "global_step": 185460, "epoch": 4415} {"train_loss": -6.965638160705566, "global_step": 185461, "epoch": 4415} {"train_loss": -7.13095235824585, "global_step": 185462, "epoch": 4415} {"train_loss": -7.034226894378662, "global_step": 185463, "epoch": 4415} {"train_loss": -7.197047233581543, "global_step": 185464, "epoch": 4415} {"train_loss": -7.1382551193237305, "global_step": 185465, "epoch": 4415} {"train_loss": -6.971346378326416, "global_step": 185466, "epoch": 4415} {"train_loss": -7.044955253601074, "global_step": 185467, "epoch": 4415} {"train_loss": -7.025683403015137, "global_step": 185468, "epoch": 4415} {"train_loss": -7.117624759674072, "global_step": 185469, "epoch": 4415} {"train_loss": -7.024123191833496, "global_step": 185470, "epoch": 4415} {"train_loss": -7.095251389912197, "global_step": 185471, "epoch": 4415, "val_loss": 68738.640625} {"train_loss": -7.266586780548096, "global_step": 185472, "epoch": 4416} {"train_loss": -7.187280654907227, "global_step": 185473, "epoch": 4416} {"train_loss": -7.119794845581055, "global_step": 185474, "epoch": 4416} {"train_loss": -7.210492134094238, "global_step": 185475, "epoch": 4416} {"train_loss": -7.013744831085205, "global_step": 185476, "epoch": 4416} {"train_loss": -7.11212682723999, "global_step": 185477, "epoch": 4416} {"train_loss": -7.099390983581543, "global_step": 185478, "epoch": 4416} {"train_loss": -7.168327331542969, "global_step": 185479, "epoch": 4416} {"train_loss": -7.096670150756836, "global_step": 185480, "epoch": 4416} {"train_loss": -7.145010471343994, "global_step": 185481, "epoch": 4416} {"train_loss": -7.13878870010376, "global_step": 185482, "epoch": 4416} {"train_loss": -7.037362098693848, "global_step": 185483, "epoch": 4416} {"train_loss": -7.172418594360352, "global_step": 185484, "epoch": 4416} {"train_loss": -7.069833755493164, "global_step": 185485, "epoch": 4416} {"train_loss": -7.061374664306641, "global_step": 185486, "epoch": 4416} {"train_loss": -7.240533828735352, "global_step": 185487, "epoch": 4416} {"train_loss": -6.993875503540039, "global_step": 185488, "epoch": 4416} {"train_loss": -7.1656365394592285, "global_step": 185489, "epoch": 4416} {"train_loss": -7.124866485595703, "global_step": 185490, "epoch": 4416} {"train_loss": -7.107112407684326, "global_step": 185491, "epoch": 4416} {"train_loss": -7.1203765869140625, "global_step": 185492, "epoch": 4416} {"train_loss": -7.129219055175781, "global_step": 185493, "epoch": 4416} {"train_loss": -7.227323532104492, "global_step": 185494, "epoch": 4416} {"train_loss": -7.014257907867432, "global_step": 185495, "epoch": 4416} {"train_loss": -7.210190773010254, "global_step": 185496, "epoch": 4416} {"train_loss": -7.162698745727539, "global_step": 185497, "epoch": 4416} {"train_loss": -7.080289840698242, "global_step": 185498, "epoch": 4416} {"train_loss": -7.164134979248047, "global_step": 185499, "epoch": 4416} {"train_loss": -7.195367813110352, "global_step": 185500, "epoch": 4416} {"train_loss": -7.127599716186523, "global_step": 185501, "epoch": 4416} {"train_loss": -7.143116474151611, "global_step": 185502, "epoch": 4416} {"train_loss": -7.048795700073242, "global_step": 185503, "epoch": 4416} {"train_loss": -7.050360202789307, "global_step": 185504, "epoch": 4416} {"train_loss": -7.097552299499512, "global_step": 185505, "epoch": 4416} {"train_loss": -7.0953755378723145, "global_step": 185506, "epoch": 4416} {"train_loss": -7.155923843383789, "global_step": 185507, "epoch": 4416} {"train_loss": -7.177833557128906, "global_step": 185508, "epoch": 4416} {"train_loss": -7.0911760330200195, "global_step": 185509, "epoch": 4416} {"train_loss": -7.1189775466918945, "global_step": 185510, "epoch": 4416} {"train_loss": -7.189332485198975, "global_step": 185511, "epoch": 4416} {"train_loss": -7.0844011306762695, "global_step": 185512, "epoch": 4416} {"train_loss": -7.129731541588193, "global_step": 185513, "epoch": 4416, "val_loss": 68815.3984375} {"train_loss": -7.065679550170898, "global_step": 185514, "epoch": 4417} {"train_loss": -7.105278491973877, "global_step": 185515, "epoch": 4417} {"train_loss": -7.210338592529297, "global_step": 185516, "epoch": 4417} {"train_loss": -7.182240009307861, "global_step": 185517, "epoch": 4417} {"train_loss": -7.110015869140625, "global_step": 185518, "epoch": 4417} {"train_loss": -7.202963352203369, "global_step": 185519, "epoch": 4417} {"train_loss": -7.169239044189453, "global_step": 185520, "epoch": 4417} {"train_loss": -7.163248538970947, "global_step": 185521, "epoch": 4417} {"train_loss": -7.2431817054748535, "global_step": 185522, "epoch": 4417} {"train_loss": -7.244476795196533, "global_step": 185523, "epoch": 4417} {"train_loss": -7.155058860778809, "global_step": 185524, "epoch": 4417} {"train_loss": -7.1997833251953125, "global_step": 185525, "epoch": 4417} {"train_loss": -7.182570457458496, "global_step": 185526, "epoch": 4417} {"train_loss": -7.2168145179748535, "global_step": 185527, "epoch": 4417} {"train_loss": -7.133600234985352, "global_step": 185528, "epoch": 4417} {"train_loss": -7.17494535446167, "global_step": 185529, "epoch": 4417} {"train_loss": -7.1865315437316895, "global_step": 185530, "epoch": 4417} {"train_loss": -7.257538318634033, "global_step": 185531, "epoch": 4417} {"train_loss": -7.171724796295166, "global_step": 185532, "epoch": 4417} {"train_loss": -7.127625465393066, "global_step": 185533, "epoch": 4417} {"train_loss": -7.083974838256836, "global_step": 185534, "epoch": 4417} {"train_loss": -7.261175632476807, "global_step": 185535, "epoch": 4417} {"train_loss": -7.126795768737793, "global_step": 185536, "epoch": 4417} {"train_loss": -7.117588043212891, "global_step": 185537, "epoch": 4417} {"train_loss": -7.077282428741455, "global_step": 185538, "epoch": 4417} {"train_loss": -7.134130001068115, "global_step": 185539, "epoch": 4417} {"train_loss": -7.202790260314941, "global_step": 185540, "epoch": 4417} {"train_loss": -7.098382949829102, "global_step": 185541, "epoch": 4417} {"train_loss": -7.109858512878418, "global_step": 185542, "epoch": 4417} {"train_loss": -7.202121734619141, "global_step": 185543, "epoch": 4417} {"train_loss": -7.009560585021973, "global_step": 185544, "epoch": 4417} {"train_loss": -7.035744667053223, "global_step": 185545, "epoch": 4417} {"train_loss": -7.089180946350098, "global_step": 185546, "epoch": 4417} {"train_loss": -7.031535625457764, "global_step": 185547, "epoch": 4417} {"train_loss": -6.9018025398254395, "global_step": 185548, "epoch": 4417} {"train_loss": -6.957857131958008, "global_step": 185549, "epoch": 4417} {"train_loss": -6.971100807189941, "global_step": 185550, "epoch": 4417} {"train_loss": -7.031579971313477, "global_step": 185551, "epoch": 4417} {"train_loss": -7.026440143585205, "global_step": 185552, "epoch": 4417} {"train_loss": -7.0835700035095215, "global_step": 185553, "epoch": 4417} {"train_loss": -7.108166694641113, "global_step": 185554, "epoch": 4417} {"train_loss": -7.1240440890902565, "global_step": 185555, "epoch": 4417, "val_loss": 68998.140625} {"train_loss": -7.084717750549316, "global_step": 185556, "epoch": 4418} {"train_loss": -7.09620475769043, "global_step": 185557, "epoch": 4418} {"train_loss": -7.073211669921875, "global_step": 185558, "epoch": 4418} {"train_loss": -7.142041206359863, "global_step": 185559, "epoch": 4418} {"train_loss": -7.077232360839844, "global_step": 185560, "epoch": 4418} {"train_loss": -7.095017910003662, "global_step": 185561, "epoch": 4418} {"train_loss": -7.161018371582031, "global_step": 185562, "epoch": 4418} {"train_loss": -7.1416215896606445, "global_step": 185563, "epoch": 4418} {"train_loss": -7.143080711364746, "global_step": 185564, "epoch": 4418} {"train_loss": -7.139652729034424, "global_step": 185565, "epoch": 4418} {"train_loss": -7.017905235290527, "global_step": 185566, "epoch": 4418} {"train_loss": -7.068216323852539, "global_step": 185567, "epoch": 4418} {"train_loss": -7.202669143676758, "global_step": 185568, "epoch": 4418} {"train_loss": -7.050305366516113, "global_step": 185569, "epoch": 4418} {"train_loss": -7.120265960693359, "global_step": 185570, "epoch": 4418} {"train_loss": -7.150881290435791, "global_step": 185571, "epoch": 4418} {"train_loss": -7.192349910736084, "global_step": 185572, "epoch": 4418} {"train_loss": -7.06303071975708, "global_step": 185573, "epoch": 4418} {"train_loss": -7.0872602462768555, "global_step": 185574, "epoch": 4418} {"train_loss": -7.092211723327637, "global_step": 185575, "epoch": 4418} {"train_loss": -7.102999210357666, "global_step": 185576, "epoch": 4418} {"train_loss": -7.1219024658203125, "global_step": 185577, "epoch": 4418} {"train_loss": -6.910200595855713, "global_step": 185578, "epoch": 4418} {"train_loss": -6.75912618637085, "global_step": 185579, "epoch": 4418} {"train_loss": -6.959845542907715, "global_step": 185580, "epoch": 4418} {"train_loss": -6.6306562423706055, "global_step": 185581, "epoch": 4418} {"train_loss": -6.91254997253418, "global_step": 185582, "epoch": 4418} {"train_loss": -6.718137264251709, "global_step": 185583, "epoch": 4418} {"train_loss": -6.852376461029053, "global_step": 185584, "epoch": 4418} {"train_loss": -6.795041561126709, "global_step": 185585, "epoch": 4418} {"train_loss": -6.852165222167969, "global_step": 185586, "epoch": 4418} {"train_loss": -6.716628074645996, "global_step": 185587, "epoch": 4418} {"train_loss": -6.687199592590332, "global_step": 185588, "epoch": 4418} {"train_loss": -7.088529586791992, "global_step": 185589, "epoch": 4418} {"train_loss": -6.723550796508789, "global_step": 185590, "epoch": 4418} {"train_loss": -7.031412124633789, "global_step": 185591, "epoch": 4418} {"train_loss": -6.764128684997559, "global_step": 185592, "epoch": 4418} {"train_loss": -6.958341598510742, "global_step": 185593, "epoch": 4418} {"train_loss": -6.850399017333984, "global_step": 185594, "epoch": 4418} {"train_loss": -6.938601016998291, "global_step": 185595, "epoch": 4418} {"train_loss": -6.942399978637695, "global_step": 185596, "epoch": 4418} {"train_loss": -6.98482210295541, "global_step": 185597, "epoch": 4418, "val_loss": 68970.78125} {"train_loss": -7.006897926330566, "global_step": 185598, "epoch": 4419} {"train_loss": -6.94990348815918, "global_step": 185599, "epoch": 4419} {"train_loss": -6.957667350769043, "global_step": 185600, "epoch": 4419} {"train_loss": -6.975063800811768, "global_step": 185601, "epoch": 4419} {"train_loss": -6.992013454437256, "global_step": 185602, "epoch": 4419} {"train_loss": -7.092794418334961, "global_step": 185603, "epoch": 4419} {"train_loss": -6.9947710037231445, "global_step": 185604, "epoch": 4419} {"train_loss": -7.154567241668701, "global_step": 185605, "epoch": 4419} {"train_loss": -7.12417459487915, "global_step": 185606, "epoch": 4419} {"train_loss": -7.05714750289917, "global_step": 185607, "epoch": 4419} {"train_loss": -7.210610866546631, "global_step": 185608, "epoch": 4419} {"train_loss": -7.092284202575684, "global_step": 185609, "epoch": 4419} {"train_loss": -7.096392631530762, "global_step": 185610, "epoch": 4419} {"train_loss": -7.104575157165527, "global_step": 185611, "epoch": 4419} {"train_loss": -7.078625202178955, "global_step": 185612, "epoch": 4419} {"train_loss": -7.203184127807617, "global_step": 185613, "epoch": 4419} {"train_loss": -7.113699913024902, "global_step": 185614, "epoch": 4419} {"train_loss": -7.200690746307373, "global_step": 185615, "epoch": 4419} {"train_loss": -7.11724328994751, "global_step": 185616, "epoch": 4419} {"train_loss": -7.147197723388672, "global_step": 185617, "epoch": 4419} {"train_loss": -7.143746852874756, "global_step": 185618, "epoch": 4419} {"train_loss": -7.209540843963623, "global_step": 185619, "epoch": 4419} {"train_loss": -7.306210994720459, "global_step": 185620, "epoch": 4419} {"train_loss": -7.241036415100098, "global_step": 185621, "epoch": 4419} {"train_loss": -7.267996788024902, "global_step": 185622, "epoch": 4419} {"train_loss": -7.170793533325195, "global_step": 185623, "epoch": 4419} {"train_loss": -7.170018672943115, "global_step": 185624, "epoch": 4419} {"train_loss": -7.202911376953125, "global_step": 185625, "epoch": 4419} {"train_loss": -7.192058563232422, "global_step": 185626, "epoch": 4419} {"train_loss": -7.182363986968994, "global_step": 185627, "epoch": 4419} {"train_loss": -7.252760410308838, "global_step": 185628, "epoch": 4419} {"train_loss": -7.220357418060303, "global_step": 185629, "epoch": 4419} {"train_loss": -7.17447566986084, "global_step": 185630, "epoch": 4419} {"train_loss": -7.135703086853027, "global_step": 185631, "epoch": 4419} {"train_loss": -7.068920135498047, "global_step": 185632, "epoch": 4419} {"train_loss": -7.240426063537598, "global_step": 185633, "epoch": 4419} {"train_loss": -7.240484237670898, "global_step": 185634, "epoch": 4419} {"train_loss": -7.192946910858154, "global_step": 185635, "epoch": 4419} {"train_loss": -7.189208030700684, "global_step": 185636, "epoch": 4419} {"train_loss": -7.198184013366699, "global_step": 185637, "epoch": 4419} {"train_loss": -7.173797130584717, "global_step": 185638, "epoch": 4419} {"train_loss": -7.142387742087955, "global_step": 185639, "epoch": 4419, "val_loss": 68911.8515625} {"train_loss": -7.158918857574463, "global_step": 185640, "epoch": 4420} {"train_loss": -7.163812637329102, "global_step": 185641, "epoch": 4420} {"train_loss": -7.2032012939453125, "global_step": 185642, "epoch": 4420} {"train_loss": -7.237837791442871, "global_step": 185643, "epoch": 4420} {"train_loss": -7.2505693435668945, "global_step": 185644, "epoch": 4420} {"train_loss": -7.1423234939575195, "global_step": 185645, "epoch": 4420} {"train_loss": -7.11415958404541, "global_step": 185646, "epoch": 4420} {"train_loss": -7.227181434631348, "global_step": 185647, "epoch": 4420} {"train_loss": -7.131121635437012, "global_step": 185648, "epoch": 4420} {"train_loss": -7.254621982574463, "global_step": 185649, "epoch": 4420} {"train_loss": -7.0798492431640625, "global_step": 185650, "epoch": 4420} {"train_loss": -7.192887306213379, "global_step": 185651, "epoch": 4420} {"train_loss": -7.081097602844238, "global_step": 185652, "epoch": 4420} {"train_loss": -7.133722305297852, "global_step": 185653, "epoch": 4420} {"train_loss": -7.128054618835449, "global_step": 185654, "epoch": 4420} {"train_loss": -7.195976257324219, "global_step": 185655, "epoch": 4420} {"train_loss": -7.0868024826049805, "global_step": 185656, "epoch": 4420} {"train_loss": -7.146409034729004, "global_step": 185657, "epoch": 4420} {"train_loss": -7.151988983154297, "global_step": 185658, "epoch": 4420} {"train_loss": -7.03415060043335, "global_step": 185659, "epoch": 4420} {"train_loss": -7.06339168548584, "global_step": 185660, "epoch": 4420} {"train_loss": -7.193351745605469, "global_step": 185661, "epoch": 4420} {"train_loss": -7.154024124145508, "global_step": 185662, "epoch": 4420} {"train_loss": -7.01509952545166, "global_step": 185663, "epoch": 4420} {"train_loss": -7.0790910720825195, "global_step": 185664, "epoch": 4420} {"train_loss": -7.29304313659668, "global_step": 185665, "epoch": 4420} {"train_loss": -7.041304588317871, "global_step": 185666, "epoch": 4420} {"train_loss": -7.092993259429932, "global_step": 185667, "epoch": 4420} {"train_loss": -7.07844352722168, "global_step": 185668, "epoch": 4420} {"train_loss": -7.168015480041504, "global_step": 185669, "epoch": 4420} {"train_loss": -7.172125816345215, "global_step": 185670, "epoch": 4420} {"train_loss": -7.107346534729004, "global_step": 185671, "epoch": 4420} {"train_loss": -7.092708587646484, "global_step": 185672, "epoch": 4420} {"train_loss": -7.138325214385986, "global_step": 185673, "epoch": 4420} {"train_loss": -7.206642150878906, "global_step": 185674, "epoch": 4420} {"train_loss": -7.085765838623047, "global_step": 185675, "epoch": 4420} {"train_loss": -7.273340225219727, "global_step": 185676, "epoch": 4420} {"train_loss": -7.057313919067383, "global_step": 185677, "epoch": 4420} {"train_loss": -7.168169021606445, "global_step": 185678, "epoch": 4420} {"train_loss": -7.084269046783447, "global_step": 185679, "epoch": 4420} {"train_loss": -7.077040195465088, "global_step": 185680, "epoch": 4420} {"train_loss": -7.143286069234212, "global_step": 185681, "epoch": 4420, "val_loss": 68777.28125} {"train_loss": -7.103977680206299, "global_step": 185682, "epoch": 4421} {"train_loss": -7.1448869705200195, "global_step": 185683, "epoch": 4421} {"train_loss": -7.236311912536621, "global_step": 185684, "epoch": 4421} {"train_loss": -6.988556861877441, "global_step": 185685, "epoch": 4421} {"train_loss": -7.094956398010254, "global_step": 185686, "epoch": 4421} {"train_loss": -7.119564056396484, "global_step": 185687, "epoch": 4421} {"train_loss": -7.023934364318848, "global_step": 185688, "epoch": 4421} {"train_loss": -7.171854019165039, "global_step": 185689, "epoch": 4421} {"train_loss": -7.13004207611084, "global_step": 185690, "epoch": 4421} {"train_loss": -6.937614440917969, "global_step": 185691, "epoch": 4421} {"train_loss": -6.992572784423828, "global_step": 185692, "epoch": 4421} {"train_loss": -7.068850517272949, "global_step": 185693, "epoch": 4421} {"train_loss": -7.045956611633301, "global_step": 185694, "epoch": 4421} {"train_loss": -7.130173683166504, "global_step": 185695, "epoch": 4421} {"train_loss": -7.072819709777832, "global_step": 185696, "epoch": 4421} {"train_loss": -7.085362434387207, "global_step": 185697, "epoch": 4421} {"train_loss": -7.063747406005859, "global_step": 185698, "epoch": 4421} {"train_loss": -7.062703609466553, "global_step": 185699, "epoch": 4421} {"train_loss": -7.034255027770996, "global_step": 185700, "epoch": 4421} {"train_loss": -7.115931510925293, "global_step": 185701, "epoch": 4421} {"train_loss": -7.176514148712158, "global_step": 185702, "epoch": 4421} {"train_loss": -6.994680404663086, "global_step": 185703, "epoch": 4421} {"train_loss": -7.113517761230469, "global_step": 185704, "epoch": 4421} {"train_loss": -7.171897888183594, "global_step": 185705, "epoch": 4421} {"train_loss": -7.160583019256592, "global_step": 185706, "epoch": 4421} {"train_loss": -7.092817306518555, "global_step": 185707, "epoch": 4421} {"train_loss": -7.146846771240234, "global_step": 185708, "epoch": 4421} {"train_loss": -7.126739501953125, "global_step": 185709, "epoch": 4421} {"train_loss": -7.173517227172852, "global_step": 185710, "epoch": 4421} {"train_loss": -7.100760459899902, "global_step": 185711, "epoch": 4421} {"train_loss": -7.2506232261657715, "global_step": 185712, "epoch": 4421} {"train_loss": -7.0678839683532715, "global_step": 185713, "epoch": 4421} {"train_loss": -7.041860580444336, "global_step": 185714, "epoch": 4421} {"train_loss": -7.139491081237793, "global_step": 185715, "epoch": 4421} {"train_loss": -7.134232521057129, "global_step": 185716, "epoch": 4421} {"train_loss": -7.109401226043701, "global_step": 185717, "epoch": 4421} {"train_loss": -6.92415714263916, "global_step": 185718, "epoch": 4421} {"train_loss": -7.057512283325195, "global_step": 185719, "epoch": 4421} {"train_loss": -7.010798454284668, "global_step": 185720, "epoch": 4421} {"train_loss": -7.124267578125, "global_step": 185721, "epoch": 4421} {"train_loss": -7.107962131500244, "global_step": 185722, "epoch": 4421} {"train_loss": -7.091670785631452, "global_step": 185723, "epoch": 4421, "val_loss": 69079.296875} {"train_loss": -7.060048580169678, "global_step": 185724, "epoch": 4422} {"train_loss": -7.023036479949951, "global_step": 185725, "epoch": 4422} {"train_loss": -6.990298748016357, "global_step": 185726, "epoch": 4422} {"train_loss": -7.133271217346191, "global_step": 185727, "epoch": 4422} {"train_loss": -6.9785661697387695, "global_step": 185728, "epoch": 4422} {"train_loss": -7.013718128204346, "global_step": 185729, "epoch": 4422} {"train_loss": -6.970675945281982, "global_step": 185730, "epoch": 4422} {"train_loss": -6.754563331604004, "global_step": 185731, "epoch": 4422} {"train_loss": -7.118133068084717, "global_step": 185732, "epoch": 4422} {"train_loss": -6.966559410095215, "global_step": 185733, "epoch": 4422} {"train_loss": -6.922428607940674, "global_step": 185734, "epoch": 4422} {"train_loss": -7.102028846740723, "global_step": 185735, "epoch": 4422} {"train_loss": -6.956979751586914, "global_step": 185736, "epoch": 4422} {"train_loss": -7.13033390045166, "global_step": 185737, "epoch": 4422} {"train_loss": -6.9665985107421875, "global_step": 185738, "epoch": 4422} {"train_loss": -7.103400230407715, "global_step": 185739, "epoch": 4422} {"train_loss": -7.0393877029418945, "global_step": 185740, "epoch": 4422} {"train_loss": -7.02296257019043, "global_step": 185741, "epoch": 4422} {"train_loss": -7.085595607757568, "global_step": 185742, "epoch": 4422} {"train_loss": -7.117153167724609, "global_step": 185743, "epoch": 4422} {"train_loss": -6.975228309631348, "global_step": 185744, "epoch": 4422} {"train_loss": -7.041781425476074, "global_step": 185745, "epoch": 4422} {"train_loss": -7.145421028137207, "global_step": 185746, "epoch": 4422} {"train_loss": -7.031216621398926, "global_step": 185747, "epoch": 4422} {"train_loss": -7.0911641120910645, "global_step": 185748, "epoch": 4422} {"train_loss": -7.033334732055664, "global_step": 185749, "epoch": 4422} {"train_loss": -7.087192535400391, "global_step": 185750, "epoch": 4422} {"train_loss": -7.1998291015625, "global_step": 185751, "epoch": 4422} {"train_loss": -7.013996124267578, "global_step": 185752, "epoch": 4422} {"train_loss": -7.038904666900635, "global_step": 185753, "epoch": 4422} {"train_loss": -7.17213249206543, "global_step": 185754, "epoch": 4422} {"train_loss": -7.13805627822876, "global_step": 185755, "epoch": 4422} {"train_loss": -7.124178886413574, "global_step": 185756, "epoch": 4422} {"train_loss": -7.123841285705566, "global_step": 185757, "epoch": 4422} {"train_loss": -7.1141557693481445, "global_step": 185758, "epoch": 4422} {"train_loss": -7.048855781555176, "global_step": 185759, "epoch": 4422} {"train_loss": -7.052473545074463, "global_step": 185760, "epoch": 4422} {"train_loss": -7.031476020812988, "global_step": 185761, "epoch": 4422} {"train_loss": -7.02329158782959, "global_step": 185762, "epoch": 4422} {"train_loss": -7.168399333953857, "global_step": 185763, "epoch": 4422} {"train_loss": -6.984488487243652, "global_step": 185764, "epoch": 4422} {"train_loss": -7.054405507587251, "global_step": 185765, "epoch": 4422, "val_loss": 68722.921875} {"train_loss": -7.2281293869018555, "global_step": 185766, "epoch": 4423} {"train_loss": -7.016541481018066, "global_step": 185767, "epoch": 4423} {"train_loss": -7.216495990753174, "global_step": 185768, "epoch": 4423} {"train_loss": -7.180829048156738, "global_step": 185769, "epoch": 4423} {"train_loss": -7.199319839477539, "global_step": 185770, "epoch": 4423} {"train_loss": -7.141903877258301, "global_step": 185771, "epoch": 4423} {"train_loss": -7.119132041931152, "global_step": 185772, "epoch": 4423} {"train_loss": -7.084919452667236, "global_step": 185773, "epoch": 4423} {"train_loss": -7.085300922393799, "global_step": 185774, "epoch": 4423} {"train_loss": -7.097495079040527, "global_step": 185775, "epoch": 4423} {"train_loss": -7.083894729614258, "global_step": 185776, "epoch": 4423} {"train_loss": -7.2395710945129395, "global_step": 185777, "epoch": 4423} {"train_loss": -7.131152629852295, "global_step": 185778, "epoch": 4423} {"train_loss": -7.065848350524902, "global_step": 185779, "epoch": 4423} {"train_loss": -7.0840864181518555, "global_step": 185780, "epoch": 4423} {"train_loss": -7.065245628356934, "global_step": 185781, "epoch": 4423} {"train_loss": -7.16117000579834, "global_step": 185782, "epoch": 4423} {"train_loss": -6.978646278381348, "global_step": 185783, "epoch": 4423} {"train_loss": -7.1074934005737305, "global_step": 185784, "epoch": 4423} {"train_loss": -7.131816864013672, "global_step": 185785, "epoch": 4423} {"train_loss": -6.970949649810791, "global_step": 185786, "epoch": 4423} {"train_loss": -7.077144145965576, "global_step": 185787, "epoch": 4423} {"train_loss": -7.166438579559326, "global_step": 185788, "epoch": 4423} {"train_loss": -6.982381820678711, "global_step": 185789, "epoch": 4423} {"train_loss": -7.199404716491699, "global_step": 185790, "epoch": 4423} {"train_loss": -7.156846046447754, "global_step": 185791, "epoch": 4423} {"train_loss": -7.08787202835083, "global_step": 185792, "epoch": 4423} {"train_loss": -7.1235456466674805, "global_step": 185793, "epoch": 4423} {"train_loss": -7.017692565917969, "global_step": 185794, "epoch": 4423} {"train_loss": -7.117951393127441, "global_step": 185795, "epoch": 4423} {"train_loss": -6.97603178024292, "global_step": 185796, "epoch": 4423} {"train_loss": -7.047679901123047, "global_step": 185797, "epoch": 4423} {"train_loss": -7.025968551635742, "global_step": 185798, "epoch": 4423} {"train_loss": -6.938907146453857, "global_step": 185799, "epoch": 4423} {"train_loss": -7.188827037811279, "global_step": 185800, "epoch": 4423} {"train_loss": -6.920440673828125, "global_step": 185801, "epoch": 4423} {"train_loss": -6.973725318908691, "global_step": 185802, "epoch": 4423} {"train_loss": -6.996885299682617, "global_step": 185803, "epoch": 4423} {"train_loss": -7.11176872253418, "global_step": 185804, "epoch": 4423} {"train_loss": -7.025817394256592, "global_step": 185805, "epoch": 4423} {"train_loss": -7.018568992614746, "global_step": 185806, "epoch": 4423} {"train_loss": -7.08441330137707, "global_step": 185807, "epoch": 4423, "val_loss": 68968.09375} {"train_loss": -7.058559417724609, "global_step": 185808, "epoch": 4424} {"train_loss": -7.120152473449707, "global_step": 185809, "epoch": 4424} {"train_loss": -7.0288166999816895, "global_step": 185810, "epoch": 4424} {"train_loss": -7.096269607543945, "global_step": 185811, "epoch": 4424} {"train_loss": -7.02207612991333, "global_step": 185812, "epoch": 4424} {"train_loss": -7.0581440925598145, "global_step": 185813, "epoch": 4424} {"train_loss": -7.085549354553223, "global_step": 185814, "epoch": 4424} {"train_loss": -7.149273872375488, "global_step": 185815, "epoch": 4424} {"train_loss": -6.995444297790527, "global_step": 185816, "epoch": 4424} {"train_loss": -7.0552263259887695, "global_step": 185817, "epoch": 4424} {"train_loss": -7.094347953796387, "global_step": 185818, "epoch": 4424} {"train_loss": -7.15533971786499, "global_step": 185819, "epoch": 4424} {"train_loss": -7.16957950592041, "global_step": 185820, "epoch": 4424} {"train_loss": -7.115635871887207, "global_step": 185821, "epoch": 4424} {"train_loss": -7.114789962768555, "global_step": 185822, "epoch": 4424} {"train_loss": -7.123683929443359, "global_step": 185823, "epoch": 4424} {"train_loss": -7.128992557525635, "global_step": 185824, "epoch": 4424} {"train_loss": -7.174419403076172, "global_step": 185825, "epoch": 4424} {"train_loss": -7.141452789306641, "global_step": 185826, "epoch": 4424} {"train_loss": -7.106747627258301, "global_step": 185827, "epoch": 4424} {"train_loss": -7.055449485778809, "global_step": 185828, "epoch": 4424} {"train_loss": -7.153050422668457, "global_step": 185829, "epoch": 4424} {"train_loss": -7.206325531005859, "global_step": 185830, "epoch": 4424} {"train_loss": -7.08387565612793, "global_step": 185831, "epoch": 4424} {"train_loss": -7.205893516540527, "global_step": 185832, "epoch": 4424} {"train_loss": -7.111642837524414, "global_step": 185833, "epoch": 4424} {"train_loss": -6.991680145263672, "global_step": 185834, "epoch": 4424} {"train_loss": -7.07161808013916, "global_step": 185835, "epoch": 4424} {"train_loss": -7.0059428215026855, "global_step": 185836, "epoch": 4424} {"train_loss": -7.174097061157227, "global_step": 185837, "epoch": 4424} {"train_loss": -6.977104187011719, "global_step": 185838, "epoch": 4424} {"train_loss": -7.243622779846191, "global_step": 185839, "epoch": 4424} {"train_loss": -7.134665489196777, "global_step": 185840, "epoch": 4424} {"train_loss": -6.966954708099365, "global_step": 185841, "epoch": 4424} {"train_loss": -7.026234149932861, "global_step": 185842, "epoch": 4424} {"train_loss": -6.9153547286987305, "global_step": 185843, "epoch": 4424} {"train_loss": -7.056903839111328, "global_step": 185844, "epoch": 4424} {"train_loss": -7.08848762512207, "global_step": 185845, "epoch": 4424} {"train_loss": -7.013796806335449, "global_step": 185846, "epoch": 4424} {"train_loss": -7.00791597366333, "global_step": 185847, "epoch": 4424} {"train_loss": -7.192794322967529, "global_step": 185848, "epoch": 4424} {"train_loss": -7.089662915184384, "global_step": 185849, "epoch": 4424, "val_loss": 68859.1796875} {"train_loss": -6.941496849060059, "global_step": 185850, "epoch": 4425} {"train_loss": -6.931589126586914, "global_step": 185851, "epoch": 4425} {"train_loss": -7.086799144744873, "global_step": 185852, "epoch": 4425} {"train_loss": -7.053890705108643, "global_step": 185853, "epoch": 4425} {"train_loss": -7.116368293762207, "global_step": 185854, "epoch": 4425} {"train_loss": -7.069394111633301, "global_step": 185855, "epoch": 4425} {"train_loss": -7.142029285430908, "global_step": 185856, "epoch": 4425} {"train_loss": -7.177886009216309, "global_step": 185857, "epoch": 4425} {"train_loss": -7.115954399108887, "global_step": 185858, "epoch": 4425} {"train_loss": -7.167015075683594, "global_step": 185859, "epoch": 4425} {"train_loss": -7.110776901245117, "global_step": 185860, "epoch": 4425} {"train_loss": -7.070446968078613, "global_step": 185861, "epoch": 4425} {"train_loss": -7.172844886779785, "global_step": 185862, "epoch": 4425} {"train_loss": -7.137866497039795, "global_step": 185863, "epoch": 4425} {"train_loss": -7.06086540222168, "global_step": 185864, "epoch": 4425} {"train_loss": -7.129448890686035, "global_step": 185865, "epoch": 4425} {"train_loss": -7.056014060974121, "global_step": 185866, "epoch": 4425} {"train_loss": -7.214395046234131, "global_step": 185867, "epoch": 4425} {"train_loss": -7.063846111297607, "global_step": 185868, "epoch": 4425} {"train_loss": -7.1387834548950195, "global_step": 185869, "epoch": 4425} {"train_loss": -7.145078659057617, "global_step": 185870, "epoch": 4425} {"train_loss": -7.0039825439453125, "global_step": 185871, "epoch": 4425} {"train_loss": -7.09706449508667, "global_step": 185872, "epoch": 4425} {"train_loss": -7.127439022064209, "global_step": 185873, "epoch": 4425} {"train_loss": -7.029034614562988, "global_step": 185874, "epoch": 4425} {"train_loss": -7.121054172515869, "global_step": 185875, "epoch": 4425} {"train_loss": -7.039274215698242, "global_step": 185876, "epoch": 4425} {"train_loss": -7.065923690795898, "global_step": 185877, "epoch": 4425} {"train_loss": -7.069486618041992, "global_step": 185878, "epoch": 4425} {"train_loss": -7.089964389801025, "global_step": 185879, "epoch": 4425} {"train_loss": -7.089156150817871, "global_step": 185880, "epoch": 4425} {"train_loss": -7.099891185760498, "global_step": 185881, "epoch": 4425} {"train_loss": -7.017805576324463, "global_step": 185882, "epoch": 4425} {"train_loss": -7.1700310707092285, "global_step": 185883, "epoch": 4425} {"train_loss": -7.034562110900879, "global_step": 185884, "epoch": 4425} {"train_loss": -7.1113128662109375, "global_step": 185885, "epoch": 4425} {"train_loss": -7.001086711883545, "global_step": 185886, "epoch": 4425} {"train_loss": -7.039658069610596, "global_step": 185887, "epoch": 4425} {"train_loss": -7.005690097808838, "global_step": 185888, "epoch": 4425} {"train_loss": -7.071866035461426, "global_step": 185889, "epoch": 4425} {"train_loss": -6.9895219802856445, "global_step": 185890, "epoch": 4425} {"train_loss": -7.08357758749099, "global_step": 185891, "epoch": 4425, "val_loss": 68742.5078125} {"train_loss": -7.024585723876953, "global_step": 185892, "epoch": 4426} {"train_loss": -7.068363666534424, "global_step": 185893, "epoch": 4426} {"train_loss": -7.04051399230957, "global_step": 185894, "epoch": 4426} {"train_loss": -7.026348114013672, "global_step": 185895, "epoch": 4426} {"train_loss": -7.178121089935303, "global_step": 185896, "epoch": 4426} {"train_loss": -7.110645294189453, "global_step": 185897, "epoch": 4426} {"train_loss": -7.067957878112793, "global_step": 185898, "epoch": 4426} {"train_loss": -7.155586242675781, "global_step": 185899, "epoch": 4426} {"train_loss": -7.0799055099487305, "global_step": 185900, "epoch": 4426} {"train_loss": -7.098189353942871, "global_step": 185901, "epoch": 4426} {"train_loss": -7.1401567459106445, "global_step": 185902, "epoch": 4426} {"train_loss": -7.057243347167969, "global_step": 185903, "epoch": 4426} {"train_loss": -7.08176326751709, "global_step": 185904, "epoch": 4426} {"train_loss": -7.081799030303955, "global_step": 185905, "epoch": 4426} {"train_loss": -7.252754211425781, "global_step": 185906, "epoch": 4426} {"train_loss": -7.168723106384277, "global_step": 185907, "epoch": 4426} {"train_loss": -7.163877964019775, "global_step": 185908, "epoch": 4426} {"train_loss": -7.169854640960693, "global_step": 185909, "epoch": 4426} {"train_loss": -7.0801472663879395, "global_step": 185910, "epoch": 4426} {"train_loss": -7.193122863769531, "global_step": 185911, "epoch": 4426} {"train_loss": -7.22751522064209, "global_step": 185912, "epoch": 4426} {"train_loss": -7.182837009429932, "global_step": 185913, "epoch": 4426} {"train_loss": -7.163002014160156, "global_step": 185914, "epoch": 4426} {"train_loss": -7.221090793609619, "global_step": 185915, "epoch": 4426} {"train_loss": -7.258526802062988, "global_step": 185916, "epoch": 4426} {"train_loss": -7.118078231811523, "global_step": 185917, "epoch": 4426} {"train_loss": -7.128439903259277, "global_step": 185918, "epoch": 4426} {"train_loss": -7.2307939529418945, "global_step": 185919, "epoch": 4426} {"train_loss": -7.2900495529174805, "global_step": 185920, "epoch": 4426} {"train_loss": -7.218829154968262, "global_step": 185921, "epoch": 4426} {"train_loss": -7.200233459472656, "global_step": 185922, "epoch": 4426} {"train_loss": -7.1756086349487305, "global_step": 185923, "epoch": 4426} {"train_loss": -7.286365985870361, "global_step": 185924, "epoch": 4426} {"train_loss": -7.276582717895508, "global_step": 185925, "epoch": 4426} {"train_loss": -7.295930862426758, "global_step": 185926, "epoch": 4426} {"train_loss": -7.3100481033325195, "global_step": 185927, "epoch": 4426} {"train_loss": -7.261168956756592, "global_step": 185928, "epoch": 4426} {"train_loss": -7.236179828643799, "global_step": 185929, "epoch": 4426} {"train_loss": -7.228712558746338, "global_step": 185930, "epoch": 4426} {"train_loss": -7.157731056213379, "global_step": 185931, "epoch": 4426} {"train_loss": -7.278031349182129, "global_step": 185932, "epoch": 4426} {"train_loss": -7.172663597833543, "global_step": 185933, "epoch": 4426, "val_loss": 68900.7265625} {"train_loss": -7.254717826843262, "global_step": 185934, "epoch": 4427} {"train_loss": -7.162623405456543, "global_step": 185935, "epoch": 4427} {"train_loss": -7.194211483001709, "global_step": 185936, "epoch": 4427} {"train_loss": -7.186738014221191, "global_step": 185937, "epoch": 4427} {"train_loss": -7.033784866333008, "global_step": 185938, "epoch": 4427} {"train_loss": -7.178295612335205, "global_step": 185939, "epoch": 4427} {"train_loss": -7.1133623123168945, "global_step": 185940, "epoch": 4427} {"train_loss": -7.074701309204102, "global_step": 185941, "epoch": 4427} {"train_loss": -7.100332260131836, "global_step": 185942, "epoch": 4427} {"train_loss": -7.112709045410156, "global_step": 185943, "epoch": 4427} {"train_loss": -7.049785614013672, "global_step": 185944, "epoch": 4427} {"train_loss": -6.955426216125488, "global_step": 185945, "epoch": 4427} {"train_loss": -7.179551601409912, "global_step": 185946, "epoch": 4427} {"train_loss": -7.075228214263916, "global_step": 185947, "epoch": 4427} {"train_loss": -7.0770263671875, "global_step": 185948, "epoch": 4427} {"train_loss": -7.1071295738220215, "global_step": 185949, "epoch": 4427} {"train_loss": -6.959555625915527, "global_step": 185950, "epoch": 4427} {"train_loss": -7.066051959991455, "global_step": 185951, "epoch": 4427} {"train_loss": -7.237644195556641, "global_step": 185952, "epoch": 4427} {"train_loss": -7.0478644371032715, "global_step": 185953, "epoch": 4427} {"train_loss": -7.1318511962890625, "global_step": 185954, "epoch": 4427} {"train_loss": -7.011958122253418, "global_step": 185955, "epoch": 4427} {"train_loss": -6.974381446838379, "global_step": 185956, "epoch": 4427} {"train_loss": -7.080599308013916, "global_step": 185957, "epoch": 4427} {"train_loss": -7.052720069885254, "global_step": 185958, "epoch": 4427} {"train_loss": -7.140305519104004, "global_step": 185959, "epoch": 4427} {"train_loss": -7.043360710144043, "global_step": 185960, "epoch": 4427} {"train_loss": -7.043434143066406, "global_step": 185961, "epoch": 4427} {"train_loss": -7.08840274810791, "global_step": 185962, "epoch": 4427} {"train_loss": -7.036393165588379, "global_step": 185963, "epoch": 4427} {"train_loss": -7.096731662750244, "global_step": 185964, "epoch": 4427} {"train_loss": -7.064658164978027, "global_step": 185965, "epoch": 4427} {"train_loss": -7.046032905578613, "global_step": 185966, "epoch": 4427} {"train_loss": -7.046550273895264, "global_step": 185967, "epoch": 4427} {"train_loss": -7.028712749481201, "global_step": 185968, "epoch": 4427} {"train_loss": -7.086393356323242, "global_step": 185969, "epoch": 4427} {"train_loss": -7.0800933837890625, "global_step": 185970, "epoch": 4427} {"train_loss": -7.177513599395752, "global_step": 185971, "epoch": 4427} {"train_loss": -7.1240434646606445, "global_step": 185972, "epoch": 4427} {"train_loss": -7.089771270751953, "global_step": 185973, "epoch": 4427} {"train_loss": -7.1020708084106445, "global_step": 185974, "epoch": 4427} {"train_loss": -7.090352807726179, "global_step": 185975, "epoch": 4427, "val_loss": 68856.5625} {"train_loss": -7.057611465454102, "global_step": 185976, "epoch": 4428} {"train_loss": -6.993839263916016, "global_step": 185977, "epoch": 4428} {"train_loss": -7.131069660186768, "global_step": 185978, "epoch": 4428} {"train_loss": -7.063726425170898, "global_step": 185979, "epoch": 4428} {"train_loss": -7.14243221282959, "global_step": 185980, "epoch": 4428} {"train_loss": -7.029455184936523, "global_step": 185981, "epoch": 4428} {"train_loss": -7.154583930969238, "global_step": 185982, "epoch": 4428} {"train_loss": -7.082908630371094, "global_step": 185983, "epoch": 4428} {"train_loss": -7.051095485687256, "global_step": 185984, "epoch": 4428} {"train_loss": -7.034516334533691, "global_step": 185985, "epoch": 4428} {"train_loss": -7.009980201721191, "global_step": 185986, "epoch": 4428} {"train_loss": -6.946261405944824, "global_step": 185987, "epoch": 4428} {"train_loss": -7.0189385414123535, "global_step": 185988, "epoch": 4428} {"train_loss": -7.105569839477539, "global_step": 185989, "epoch": 4428} {"train_loss": -7.058104038238525, "global_step": 185990, "epoch": 4428} {"train_loss": -7.139037132263184, "global_step": 185991, "epoch": 4428} {"train_loss": -7.181124687194824, "global_step": 185992, "epoch": 4428} {"train_loss": -7.137861251831055, "global_step": 185993, "epoch": 4428} {"train_loss": -7.215864181518555, "global_step": 185994, "epoch": 4428} {"train_loss": -7.086981296539307, "global_step": 185995, "epoch": 4428} {"train_loss": -7.168647766113281, "global_step": 185996, "epoch": 4428} {"train_loss": -7.137079238891602, "global_step": 185997, "epoch": 4428} {"train_loss": -7.18620491027832, "global_step": 185998, "epoch": 4428} {"train_loss": -7.108565330505371, "global_step": 185999, "epoch": 4428} {"train_loss": -7.173537254333496, "global_step": 186000, "epoch": 4428} {"train_loss": -7.080284118652344, "global_step": 186001, "epoch": 4428} {"train_loss": -7.142958164215088, "global_step": 186002, "epoch": 4428} {"train_loss": -7.117310523986816, "global_step": 186003, "epoch": 4428} {"train_loss": -7.030825614929199, "global_step": 186004, "epoch": 4428} {"train_loss": -7.153744220733643, "global_step": 186005, "epoch": 4428} {"train_loss": -7.174631118774414, "global_step": 186006, "epoch": 4428} {"train_loss": -7.205455780029297, "global_step": 186007, "epoch": 4428} {"train_loss": -7.232056617736816, "global_step": 186008, "epoch": 4428} {"train_loss": -7.088183879852295, "global_step": 186009, "epoch": 4428} {"train_loss": -7.077108383178711, "global_step": 186010, "epoch": 4428} {"train_loss": -7.157965183258057, "global_step": 186011, "epoch": 4428} {"train_loss": -7.201146125793457, "global_step": 186012, "epoch": 4428} {"train_loss": -7.164546966552734, "global_step": 186013, "epoch": 4428} {"train_loss": -7.157479763031006, "global_step": 186014, "epoch": 4428} {"train_loss": -7.131443977355957, "global_step": 186015, "epoch": 4428} {"train_loss": -7.1660614013671875, "global_step": 186016, "epoch": 4428} {"train_loss": -7.117324681509109, "global_step": 186017, "epoch": 4428, "val_loss": 69054.203125} {"train_loss": -7.245810031890869, "global_step": 186018, "epoch": 4429} {"train_loss": -7.176057815551758, "global_step": 186019, "epoch": 4429} {"train_loss": -7.110907554626465, "global_step": 186020, "epoch": 4429} {"train_loss": -7.190995216369629, "global_step": 186021, "epoch": 4429} {"train_loss": -7.190277576446533, "global_step": 186022, "epoch": 4429} {"train_loss": -7.185181617736816, "global_step": 186023, "epoch": 4429} {"train_loss": -7.074904918670654, "global_step": 186024, "epoch": 4429} {"train_loss": -7.0966691970825195, "global_step": 186025, "epoch": 4429} {"train_loss": -7.18970251083374, "global_step": 186026, "epoch": 4429} {"train_loss": -7.1573076248168945, "global_step": 186027, "epoch": 4429} {"train_loss": -7.229744911193848, "global_step": 186028, "epoch": 4429} {"train_loss": -7.069168567657471, "global_step": 186029, "epoch": 4429} {"train_loss": -7.110396385192871, "global_step": 186030, "epoch": 4429} {"train_loss": -7.266671180725098, "global_step": 186031, "epoch": 4429} {"train_loss": -7.1255879402160645, "global_step": 186032, "epoch": 4429} {"train_loss": -7.10555362701416, "global_step": 186033, "epoch": 4429} {"train_loss": -7.178445816040039, "global_step": 186034, "epoch": 4429} {"train_loss": -7.1634111404418945, "global_step": 186035, "epoch": 4429} {"train_loss": -7.17557954788208, "global_step": 186036, "epoch": 4429} {"train_loss": -7.130033016204834, "global_step": 186037, "epoch": 4429} {"train_loss": -7.248513221740723, "global_step": 186038, "epoch": 4429} {"train_loss": -7.143082141876221, "global_step": 186039, "epoch": 4429} {"train_loss": -7.0592474937438965, "global_step": 186040, "epoch": 4429} {"train_loss": -7.110012054443359, "global_step": 186041, "epoch": 4429} {"train_loss": -7.153926372528076, "global_step": 186042, "epoch": 4429} {"train_loss": -7.124582290649414, "global_step": 186043, "epoch": 4429} {"train_loss": -7.046788692474365, "global_step": 186044, "epoch": 4429} {"train_loss": -7.105292320251465, "global_step": 186045, "epoch": 4429} {"train_loss": -7.246129989624023, "global_step": 186046, "epoch": 4429} {"train_loss": -7.157820701599121, "global_step": 186047, "epoch": 4429} {"train_loss": -7.038172721862793, "global_step": 186048, "epoch": 4429} {"train_loss": -7.125043869018555, "global_step": 186049, "epoch": 4429} {"train_loss": -7.099710464477539, "global_step": 186050, "epoch": 4429} {"train_loss": -7.082604885101318, "global_step": 186051, "epoch": 4429} {"train_loss": -7.166629791259766, "global_step": 186052, "epoch": 4429} {"train_loss": -7.1280975341796875, "global_step": 186053, "epoch": 4429} {"train_loss": -7.051760673522949, "global_step": 186054, "epoch": 4429} {"train_loss": -6.98731803894043, "global_step": 186055, "epoch": 4429} {"train_loss": -7.201189041137695, "global_step": 186056, "epoch": 4429} {"train_loss": -7.141346454620361, "global_step": 186057, "epoch": 4429} {"train_loss": -6.985898017883301, "global_step": 186058, "epoch": 4429} {"train_loss": -7.132703826540992, "global_step": 186059, "epoch": 4429, "val_loss": 69077.140625} {"train_loss": -6.952459335327148, "global_step": 186060, "epoch": 4430} {"train_loss": -7.217261791229248, "global_step": 186061, "epoch": 4430} {"train_loss": -6.972292423248291, "global_step": 186062, "epoch": 4430} {"train_loss": -7.0778350830078125, "global_step": 186063, "epoch": 4430} {"train_loss": -7.000600814819336, "global_step": 186064, "epoch": 4430} {"train_loss": -7.032580375671387, "global_step": 186065, "epoch": 4430} {"train_loss": -7.0571489334106445, "global_step": 186066, "epoch": 4430} {"train_loss": -7.062304496765137, "global_step": 186067, "epoch": 4430} {"train_loss": -7.147945404052734, "global_step": 186068, "epoch": 4430} {"train_loss": -7.060813903808594, "global_step": 186069, "epoch": 4430} {"train_loss": -6.971581935882568, "global_step": 186070, "epoch": 4430} {"train_loss": -7.104037284851074, "global_step": 186071, "epoch": 4430} {"train_loss": -7.002492427825928, "global_step": 186072, "epoch": 4430} {"train_loss": -7.0839033126831055, "global_step": 186073, "epoch": 4430} {"train_loss": -7.070769309997559, "global_step": 186074, "epoch": 4430} {"train_loss": -6.990619659423828, "global_step": 186075, "epoch": 4430} {"train_loss": -7.08919095993042, "global_step": 186076, "epoch": 4430} {"train_loss": -7.108224868774414, "global_step": 186077, "epoch": 4430} {"train_loss": -7.129426002502441, "global_step": 186078, "epoch": 4430} {"train_loss": -7.045008659362793, "global_step": 186079, "epoch": 4430} {"train_loss": -7.018112659454346, "global_step": 186080, "epoch": 4430} {"train_loss": -7.051845073699951, "global_step": 186081, "epoch": 4430} {"train_loss": -7.043163299560547, "global_step": 186082, "epoch": 4430} {"train_loss": -6.958401679992676, "global_step": 186083, "epoch": 4430} {"train_loss": -7.136134147644043, "global_step": 186084, "epoch": 4430} {"train_loss": -7.13690185546875, "global_step": 186085, "epoch": 4430} {"train_loss": -7.076602458953857, "global_step": 186086, "epoch": 4430} {"train_loss": -7.191338062286377, "global_step": 186087, "epoch": 4430} {"train_loss": -7.032784938812256, "global_step": 186088, "epoch": 4430} {"train_loss": -7.246150016784668, "global_step": 186089, "epoch": 4430} {"train_loss": -7.168182373046875, "global_step": 186090, "epoch": 4430} {"train_loss": -7.145451545715332, "global_step": 186091, "epoch": 4430} {"train_loss": -7.057909965515137, "global_step": 186092, "epoch": 4430} {"train_loss": -7.089443206787109, "global_step": 186093, "epoch": 4430} {"train_loss": -7.125649452209473, "global_step": 186094, "epoch": 4430} {"train_loss": -7.088230609893799, "global_step": 186095, "epoch": 4430} {"train_loss": -7.21480655670166, "global_step": 186096, "epoch": 4430} {"train_loss": -7.128916263580322, "global_step": 186097, "epoch": 4430} {"train_loss": -7.2418107986450195, "global_step": 186098, "epoch": 4430} {"train_loss": -7.080212116241455, "global_step": 186099, "epoch": 4430} {"train_loss": -7.137447357177734, "global_step": 186100, "epoch": 4430} {"train_loss": -7.08763363247826, "global_step": 186101, "epoch": 4430, "val_loss": 68893.9453125} {"train_loss": -7.079807281494141, "global_step": 186102, "epoch": 4431} {"train_loss": -7.180498123168945, "global_step": 186103, "epoch": 4431} {"train_loss": -7.169164657592773, "global_step": 186104, "epoch": 4431} {"train_loss": -7.13870906829834, "global_step": 186105, "epoch": 4431} {"train_loss": -7.110225677490234, "global_step": 186106, "epoch": 4431} {"train_loss": -7.165221691131592, "global_step": 186107, "epoch": 4431} {"train_loss": -7.19294548034668, "global_step": 186108, "epoch": 4431} {"train_loss": -7.221796989440918, "global_step": 186109, "epoch": 4431} {"train_loss": -7.106389999389648, "global_step": 186110, "epoch": 4431} {"train_loss": -7.200146675109863, "global_step": 186111, "epoch": 4431} {"train_loss": -7.2400360107421875, "global_step": 186112, "epoch": 4431} {"train_loss": -7.182801246643066, "global_step": 186113, "epoch": 4431} {"train_loss": -7.140096664428711, "global_step": 186114, "epoch": 4431} {"train_loss": -7.115433692932129, "global_step": 186115, "epoch": 4431} {"train_loss": -7.136487007141113, "global_step": 186116, "epoch": 4431} {"train_loss": -7.1969146728515625, "global_step": 186117, "epoch": 4431} {"train_loss": -7.158594131469727, "global_step": 186118, "epoch": 4431} {"train_loss": -7.156744480133057, "global_step": 186119, "epoch": 4431} {"train_loss": -7.202610492706299, "global_step": 186120, "epoch": 4431} {"train_loss": -7.249306678771973, "global_step": 186121, "epoch": 4431} {"train_loss": -7.187668800354004, "global_step": 186122, "epoch": 4431} {"train_loss": -7.2314534187316895, "global_step": 186123, "epoch": 4431} {"train_loss": -7.134144306182861, "global_step": 186124, "epoch": 4431} {"train_loss": -7.056070327758789, "global_step": 186125, "epoch": 4431} {"train_loss": -7.1438093185424805, "global_step": 186126, "epoch": 4431} {"train_loss": -7.206992149353027, "global_step": 186127, "epoch": 4431} {"train_loss": -7.193599700927734, "global_step": 186128, "epoch": 4431} {"train_loss": -7.242973327636719, "global_step": 186129, "epoch": 4431} {"train_loss": -7.259434700012207, "global_step": 186130, "epoch": 4431} {"train_loss": -7.074868202209473, "global_step": 186131, "epoch": 4431} {"train_loss": -7.196568012237549, "global_step": 186132, "epoch": 4431} {"train_loss": -7.161263465881348, "global_step": 186133, "epoch": 4431} {"train_loss": -7.138382911682129, "global_step": 186134, "epoch": 4431} {"train_loss": -7.154489994049072, "global_step": 186135, "epoch": 4431} {"train_loss": -7.1434407234191895, "global_step": 186136, "epoch": 4431} {"train_loss": -7.224985599517822, "global_step": 186137, "epoch": 4431} {"train_loss": -7.203742504119873, "global_step": 186138, "epoch": 4431} {"train_loss": -7.151760101318359, "global_step": 186139, "epoch": 4431} {"train_loss": -7.1090264320373535, "global_step": 186140, "epoch": 4431} {"train_loss": -7.194363594055176, "global_step": 186141, "epoch": 4431} {"train_loss": -7.016183853149414, "global_step": 186142, "epoch": 4431} {"train_loss": -7.161838576907203, "global_step": 186143, "epoch": 4431, "val_loss": 68816.5859375} {"train_loss": -7.285229682922363, "global_step": 186144, "epoch": 4432} {"train_loss": -7.1284613609313965, "global_step": 186145, "epoch": 4432} {"train_loss": -7.040220737457275, "global_step": 186146, "epoch": 4432} {"train_loss": -7.074357509613037, "global_step": 186147, "epoch": 4432} {"train_loss": -7.117773056030273, "global_step": 186148, "epoch": 4432} {"train_loss": -6.963848114013672, "global_step": 186149, "epoch": 4432} {"train_loss": -7.012188911437988, "global_step": 186150, "epoch": 4432} {"train_loss": -6.978424549102783, "global_step": 186151, "epoch": 4432} {"train_loss": -7.088165283203125, "global_step": 186152, "epoch": 4432} {"train_loss": -7.1682281494140625, "global_step": 186153, "epoch": 4432} {"train_loss": -6.971193790435791, "global_step": 186154, "epoch": 4432} {"train_loss": -7.087906837463379, "global_step": 186155, "epoch": 4432} {"train_loss": -7.064167022705078, "global_step": 186156, "epoch": 4432} {"train_loss": -7.0181884765625, "global_step": 186157, "epoch": 4432} {"train_loss": -7.064631462097168, "global_step": 186158, "epoch": 4432} {"train_loss": -7.178196907043457, "global_step": 186159, "epoch": 4432} {"train_loss": -7.116580963134766, "global_step": 186160, "epoch": 4432} {"train_loss": -7.108534812927246, "global_step": 186161, "epoch": 4432} {"train_loss": -7.074535369873047, "global_step": 186162, "epoch": 4432} {"train_loss": -7.0833635330200195, "global_step": 186163, "epoch": 4432} {"train_loss": -7.050049781799316, "global_step": 186164, "epoch": 4432} {"train_loss": -7.045610427856445, "global_step": 186165, "epoch": 4432} {"train_loss": -7.017064094543457, "global_step": 186166, "epoch": 4432} {"train_loss": -7.061097145080566, "global_step": 186167, "epoch": 4432} {"train_loss": -6.966737747192383, "global_step": 186168, "epoch": 4432} {"train_loss": -6.978200912475586, "global_step": 186169, "epoch": 4432} {"train_loss": -6.823975563049316, "global_step": 186170, "epoch": 4432} {"train_loss": -7.081631660461426, "global_step": 186171, "epoch": 4432} {"train_loss": -7.10516357421875, "global_step": 186172, "epoch": 4432} {"train_loss": -7.0292768478393555, "global_step": 186173, "epoch": 4432} {"train_loss": -7.076874732971191, "global_step": 186174, "epoch": 4432} {"train_loss": -6.9288530349731445, "global_step": 186175, "epoch": 4432} {"train_loss": -7.035384178161621, "global_step": 186176, "epoch": 4432} {"train_loss": -7.036977291107178, "global_step": 186177, "epoch": 4432} {"train_loss": -7.028645038604736, "global_step": 186178, "epoch": 4432} {"train_loss": -7.126507759094238, "global_step": 186179, "epoch": 4432} {"train_loss": -7.13835334777832, "global_step": 186180, "epoch": 4432} {"train_loss": -7.03903341293335, "global_step": 186181, "epoch": 4432} {"train_loss": -7.185019016265869, "global_step": 186182, "epoch": 4432} {"train_loss": -7.043638229370117, "global_step": 186183, "epoch": 4432} {"train_loss": -6.925143241882324, "global_step": 186184, "epoch": 4432} {"train_loss": -7.056539331163679, "global_step": 186185, "epoch": 4432, "val_loss": 68996.671875} {"train_loss": -6.999566555023193, "global_step": 186186, "epoch": 4433} {"train_loss": -7.099028587341309, "global_step": 186187, "epoch": 4433} {"train_loss": -7.084078788757324, "global_step": 186188, "epoch": 4433} {"train_loss": -6.9633002281188965, "global_step": 186189, "epoch": 4433} {"train_loss": -7.094610691070557, "global_step": 186190, "epoch": 4433} {"train_loss": -6.915234565734863, "global_step": 186191, "epoch": 4433} {"train_loss": -7.111846923828125, "global_step": 186192, "epoch": 4433} {"train_loss": -6.972270488739014, "global_step": 186193, "epoch": 4433} {"train_loss": -7.0850067138671875, "global_step": 186194, "epoch": 4433} {"train_loss": -7.061147689819336, "global_step": 186195, "epoch": 4433} {"train_loss": -7.0572028160095215, "global_step": 186196, "epoch": 4433} {"train_loss": -6.979705333709717, "global_step": 186197, "epoch": 4433} {"train_loss": -7.098723411560059, "global_step": 186198, "epoch": 4433} {"train_loss": -7.017932415008545, "global_step": 186199, "epoch": 4433} {"train_loss": -7.019492149353027, "global_step": 186200, "epoch": 4433} {"train_loss": -7.124241828918457, "global_step": 186201, "epoch": 4433} {"train_loss": -7.058656692504883, "global_step": 186202, "epoch": 4433} {"train_loss": -7.098569393157959, "global_step": 186203, "epoch": 4433} {"train_loss": -7.104116439819336, "global_step": 186204, "epoch": 4433} {"train_loss": -7.014013767242432, "global_step": 186205, "epoch": 4433} {"train_loss": -7.127470970153809, "global_step": 186206, "epoch": 4433} {"train_loss": -7.040857791900635, "global_step": 186207, "epoch": 4433} {"train_loss": -7.022893905639648, "global_step": 186208, "epoch": 4433} {"train_loss": -7.256213188171387, "global_step": 186209, "epoch": 4433} {"train_loss": -6.987314224243164, "global_step": 186210, "epoch": 4433} {"train_loss": -7.080583095550537, "global_step": 186211, "epoch": 4433} {"train_loss": -7.054179668426514, "global_step": 186212, "epoch": 4433} {"train_loss": -7.048514366149902, "global_step": 186213, "epoch": 4433} {"train_loss": -7.130250453948975, "global_step": 186214, "epoch": 4433} {"train_loss": -7.0313568115234375, "global_step": 186215, "epoch": 4433} {"train_loss": -6.945657253265381, "global_step": 186216, "epoch": 4433} {"train_loss": -7.156569957733154, "global_step": 186217, "epoch": 4433} {"train_loss": -6.984742164611816, "global_step": 186218, "epoch": 4433} {"train_loss": -7.003663063049316, "global_step": 186219, "epoch": 4433} {"train_loss": -7.075841903686523, "global_step": 186220, "epoch": 4433} {"train_loss": -7.10708475112915, "global_step": 186221, "epoch": 4433} {"train_loss": -7.041052341461182, "global_step": 186222, "epoch": 4433} {"train_loss": -6.990035057067871, "global_step": 186223, "epoch": 4433} {"train_loss": -7.061842918395996, "global_step": 186224, "epoch": 4433} {"train_loss": -7.060331344604492, "global_step": 186225, "epoch": 4433} {"train_loss": -7.163784027099609, "global_step": 186226, "epoch": 4433} {"train_loss": -7.059108177820842, "global_step": 186227, "epoch": 4433, "val_loss": 68977.4765625} {"train_loss": -7.105319976806641, "global_step": 186228, "epoch": 4434} {"train_loss": -7.157950401306152, "global_step": 186229, "epoch": 4434} {"train_loss": -7.112898826599121, "global_step": 186230, "epoch": 4434} {"train_loss": -7.074700355529785, "global_step": 186231, "epoch": 4434} {"train_loss": -7.312262535095215, "global_step": 186232, "epoch": 4434} {"train_loss": -7.118711471557617, "global_step": 186233, "epoch": 4434} {"train_loss": -7.085992813110352, "global_step": 186234, "epoch": 4434} {"train_loss": -7.175048828125, "global_step": 186235, "epoch": 4434} {"train_loss": -7.164862155914307, "global_step": 186236, "epoch": 4434} {"train_loss": -7.197900772094727, "global_step": 186237, "epoch": 4434} {"train_loss": -7.15520715713501, "global_step": 186238, "epoch": 4434} {"train_loss": -7.120813846588135, "global_step": 186239, "epoch": 4434} {"train_loss": -7.154892921447754, "global_step": 186240, "epoch": 4434} {"train_loss": -7.133305549621582, "global_step": 186241, "epoch": 4434} {"train_loss": -7.159017562866211, "global_step": 186242, "epoch": 4434} {"train_loss": -7.059432506561279, "global_step": 186243, "epoch": 4434} {"train_loss": -7.0899457931518555, "global_step": 186244, "epoch": 4434} {"train_loss": -7.133364200592041, "global_step": 186245, "epoch": 4434} {"train_loss": -7.159359931945801, "global_step": 186246, "epoch": 4434} {"train_loss": -7.1550750732421875, "global_step": 186247, "epoch": 4434} {"train_loss": -7.144402980804443, "global_step": 186248, "epoch": 4434} {"train_loss": -7.119718551635742, "global_step": 186249, "epoch": 4434} {"train_loss": -7.204627990722656, "global_step": 186250, "epoch": 4434} {"train_loss": -7.135732650756836, "global_step": 186251, "epoch": 4434} {"train_loss": -7.120635032653809, "global_step": 186252, "epoch": 4434} {"train_loss": -7.0215044021606445, "global_step": 186253, "epoch": 4434} {"train_loss": -7.19073486328125, "global_step": 186254, "epoch": 4434} {"train_loss": -7.065374851226807, "global_step": 186255, "epoch": 4434} {"train_loss": -7.241177558898926, "global_step": 186256, "epoch": 4434} {"train_loss": -7.1953887939453125, "global_step": 186257, "epoch": 4434} {"train_loss": -7.169018268585205, "global_step": 186258, "epoch": 4434} {"train_loss": -7.143287658691406, "global_step": 186259, "epoch": 4434} {"train_loss": -7.072428226470947, "global_step": 186260, "epoch": 4434} {"train_loss": -7.014871597290039, "global_step": 186261, "epoch": 4434} {"train_loss": -7.053181171417236, "global_step": 186262, "epoch": 4434} {"train_loss": -7.188040733337402, "global_step": 186263, "epoch": 4434} {"train_loss": -6.976851463317871, "global_step": 186264, "epoch": 4434} {"train_loss": -7.1182451248168945, "global_step": 186265, "epoch": 4434} {"train_loss": -7.1645989418029785, "global_step": 186266, "epoch": 4434} {"train_loss": -7.185244560241699, "global_step": 186267, "epoch": 4434} {"train_loss": -7.145409107208252, "global_step": 186268, "epoch": 4434} {"train_loss": -7.132899670373826, "global_step": 186269, "epoch": 4434, "val_loss": 69001.828125} {"train_loss": -7.1292948722839355, "global_step": 186270, "epoch": 4435} {"train_loss": -7.0639801025390625, "global_step": 186271, "epoch": 4435} {"train_loss": -7.2378411293029785, "global_step": 186272, "epoch": 4435} {"train_loss": -7.075251579284668, "global_step": 186273, "epoch": 4435} {"train_loss": -7.205134391784668, "global_step": 186274, "epoch": 4435} {"train_loss": -7.160273551940918, "global_step": 186275, "epoch": 4435} {"train_loss": -7.103521823883057, "global_step": 186276, "epoch": 4435} {"train_loss": -7.049259185791016, "global_step": 186277, "epoch": 4435} {"train_loss": -7.187638759613037, "global_step": 186278, "epoch": 4435} {"train_loss": -7.093039512634277, "global_step": 186279, "epoch": 4435} {"train_loss": -7.072671890258789, "global_step": 186280, "epoch": 4435} {"train_loss": -7.134181499481201, "global_step": 186281, "epoch": 4435} {"train_loss": -7.205251216888428, "global_step": 186282, "epoch": 4435} {"train_loss": -7.216027736663818, "global_step": 186283, "epoch": 4435} {"train_loss": -7.02413272857666, "global_step": 186284, "epoch": 4435} {"train_loss": -7.109797477722168, "global_step": 186285, "epoch": 4435} {"train_loss": -7.147947311401367, "global_step": 186286, "epoch": 4435} {"train_loss": -7.0825042724609375, "global_step": 186287, "epoch": 4435} {"train_loss": -7.179983139038086, "global_step": 186288, "epoch": 4435} {"train_loss": -7.125748157501221, "global_step": 186289, "epoch": 4435} {"train_loss": -7.087519645690918, "global_step": 186290, "epoch": 4435} {"train_loss": -7.228764533996582, "global_step": 186291, "epoch": 4435} {"train_loss": -7.108038902282715, "global_step": 186292, "epoch": 4435} {"train_loss": -7.094216823577881, "global_step": 186293, "epoch": 4435} {"train_loss": -7.093581199645996, "global_step": 186294, "epoch": 4435} {"train_loss": -7.173623085021973, "global_step": 186295, "epoch": 4435} {"train_loss": -7.061806678771973, "global_step": 186296, "epoch": 4435} {"train_loss": -7.165127754211426, "global_step": 186297, "epoch": 4435} {"train_loss": -7.195506572723389, "global_step": 186298, "epoch": 4435} {"train_loss": -6.988487720489502, "global_step": 186299, "epoch": 4435} {"train_loss": -7.042509078979492, "global_step": 186300, "epoch": 4435} {"train_loss": -7.250015735626221, "global_step": 186301, "epoch": 4435} {"train_loss": -6.916925430297852, "global_step": 186302, "epoch": 4435} {"train_loss": -7.126036167144775, "global_step": 186303, "epoch": 4435} {"train_loss": -6.994439601898193, "global_step": 186304, "epoch": 4435} {"train_loss": -6.955552101135254, "global_step": 186305, "epoch": 4435} {"train_loss": -7.10113000869751, "global_step": 186306, "epoch": 4435} {"train_loss": -7.138998985290527, "global_step": 186307, "epoch": 4435} {"train_loss": -7.090666770935059, "global_step": 186308, "epoch": 4435} {"train_loss": -7.168184757232666, "global_step": 186309, "epoch": 4435} {"train_loss": -7.038103103637695, "global_step": 186310, "epoch": 4435} {"train_loss": -7.1116151582627065, "global_step": 186311, "epoch": 4435, "val_loss": 68737.65625} {"train_loss": -7.1509623527526855, "global_step": 186312, "epoch": 4436} {"train_loss": -7.135530948638916, "global_step": 186313, "epoch": 4436} {"train_loss": -7.1926751136779785, "global_step": 186314, "epoch": 4436} {"train_loss": -7.152500152587891, "global_step": 186315, "epoch": 4436} {"train_loss": -7.183111190795898, "global_step": 186316, "epoch": 4436} {"train_loss": -7.22774076461792, "global_step": 186317, "epoch": 4436} {"train_loss": -7.139736652374268, "global_step": 186318, "epoch": 4436} {"train_loss": -7.048982620239258, "global_step": 186319, "epoch": 4436} {"train_loss": -7.165363311767578, "global_step": 186320, "epoch": 4436} {"train_loss": -7.168542385101318, "global_step": 186321, "epoch": 4436} {"train_loss": -7.193412780761719, "global_step": 186322, "epoch": 4436} {"train_loss": -7.050461769104004, "global_step": 186323, "epoch": 4436} {"train_loss": -7.043112754821777, "global_step": 186324, "epoch": 4436} {"train_loss": -7.069561958312988, "global_step": 186325, "epoch": 4436} {"train_loss": -7.107428550720215, "global_step": 186326, "epoch": 4436} {"train_loss": -7.10099983215332, "global_step": 186327, "epoch": 4436} {"train_loss": -7.25284481048584, "global_step": 186328, "epoch": 4436} {"train_loss": -7.020618438720703, "global_step": 186329, "epoch": 4436} {"train_loss": -7.122392654418945, "global_step": 186330, "epoch": 4436} {"train_loss": -7.107613563537598, "global_step": 186331, "epoch": 4436} {"train_loss": -7.056756496429443, "global_step": 186332, "epoch": 4436} {"train_loss": -7.011754035949707, "global_step": 186333, "epoch": 4436} {"train_loss": -7.166848182678223, "global_step": 186334, "epoch": 4436} {"train_loss": -7.083193302154541, "global_step": 186335, "epoch": 4436} {"train_loss": -7.183296203613281, "global_step": 186336, "epoch": 4436} {"train_loss": -7.171998977661133, "global_step": 186337, "epoch": 4436} {"train_loss": -7.152644157409668, "global_step": 186338, "epoch": 4436} {"train_loss": -7.094152450561523, "global_step": 186339, "epoch": 4436} {"train_loss": -7.042677879333496, "global_step": 186340, "epoch": 4436} {"train_loss": -7.186237812042236, "global_step": 186341, "epoch": 4436} {"train_loss": -7.172638416290283, "global_step": 186342, "epoch": 4436} {"train_loss": -7.038787841796875, "global_step": 186343, "epoch": 4436} {"train_loss": -7.17845344543457, "global_step": 186344, "epoch": 4436} {"train_loss": -7.139682292938232, "global_step": 186345, "epoch": 4436} {"train_loss": -7.178149223327637, "global_step": 186346, "epoch": 4436} {"train_loss": -7.17952823638916, "global_step": 186347, "epoch": 4436} {"train_loss": -7.067534446716309, "global_step": 186348, "epoch": 4436} {"train_loss": -7.096132278442383, "global_step": 186349, "epoch": 4436} {"train_loss": -7.102038383483887, "global_step": 186350, "epoch": 4436} {"train_loss": -7.083791255950928, "global_step": 186351, "epoch": 4436} {"train_loss": -7.107159614562988, "global_step": 186352, "epoch": 4436} {"train_loss": -7.125667208716983, "global_step": 186353, "epoch": 4436, "val_loss": 68773.2890625} {"train_loss": -7.059353828430176, "global_step": 186354, "epoch": 4437} {"train_loss": -7.090567588806152, "global_step": 186355, "epoch": 4437} {"train_loss": -7.092573165893555, "global_step": 186356, "epoch": 4437} {"train_loss": -7.089923858642578, "global_step": 186357, "epoch": 4437} {"train_loss": -7.075735092163086, "global_step": 186358, "epoch": 4437} {"train_loss": -7.030699729919434, "global_step": 186359, "epoch": 4437} {"train_loss": -7.104108810424805, "global_step": 186360, "epoch": 4437} {"train_loss": -7.064891338348389, "global_step": 186361, "epoch": 4437} {"train_loss": -6.977387428283691, "global_step": 186362, "epoch": 4437} {"train_loss": -6.957623481750488, "global_step": 186363, "epoch": 4437} {"train_loss": -7.023189544677734, "global_step": 186364, "epoch": 4437} {"train_loss": -7.03249454498291, "global_step": 186365, "epoch": 4437} {"train_loss": -7.004246711730957, "global_step": 186366, "epoch": 4437} {"train_loss": -7.035013198852539, "global_step": 186367, "epoch": 4437} {"train_loss": -6.999965667724609, "global_step": 186368, "epoch": 4437} {"train_loss": -6.965529441833496, "global_step": 186369, "epoch": 4437} {"train_loss": -7.176793575286865, "global_step": 186370, "epoch": 4437} {"train_loss": -7.064929485321045, "global_step": 186371, "epoch": 4437} {"train_loss": -7.089426040649414, "global_step": 186372, "epoch": 4437} {"train_loss": -6.9002366065979, "global_step": 186373, "epoch": 4437} {"train_loss": -7.200640678405762, "global_step": 186374, "epoch": 4437} {"train_loss": -7.108656406402588, "global_step": 186375, "epoch": 4437} {"train_loss": -7.138477325439453, "global_step": 186376, "epoch": 4437} {"train_loss": -7.126311779022217, "global_step": 186377, "epoch": 4437} {"train_loss": -7.079939842224121, "global_step": 186378, "epoch": 4437} {"train_loss": -7.13769006729126, "global_step": 186379, "epoch": 4437} {"train_loss": -7.112478256225586, "global_step": 186380, "epoch": 4437} {"train_loss": -6.994777202606201, "global_step": 186381, "epoch": 4437} {"train_loss": -7.2197113037109375, "global_step": 186382, "epoch": 4437} {"train_loss": -7.244608402252197, "global_step": 186383, "epoch": 4437} {"train_loss": -7.093704700469971, "global_step": 186384, "epoch": 4437} {"train_loss": -7.133228302001953, "global_step": 186385, "epoch": 4437} {"train_loss": -7.12686824798584, "global_step": 186386, "epoch": 4437} {"train_loss": -7.03788948059082, "global_step": 186387, "epoch": 4437} {"train_loss": -7.152894020080566, "global_step": 186388, "epoch": 4437} {"train_loss": -7.247387886047363, "global_step": 186389, "epoch": 4437} {"train_loss": -7.107497215270996, "global_step": 186390, "epoch": 4437} {"train_loss": -7.254819869995117, "global_step": 186391, "epoch": 4437} {"train_loss": -7.150257587432861, "global_step": 186392, "epoch": 4437} {"train_loss": -7.203914642333984, "global_step": 186393, "epoch": 4437} {"train_loss": -7.2920684814453125, "global_step": 186394, "epoch": 4437} {"train_loss": -7.100565785453433, "global_step": 186395, "epoch": 4437, "val_loss": 68864.296875} {"train_loss": -7.28803825378418, "global_step": 186396, "epoch": 4438} {"train_loss": -7.183887958526611, "global_step": 186397, "epoch": 4438} {"train_loss": -7.205639839172363, "global_step": 186398, "epoch": 4438} {"train_loss": -7.135217666625977, "global_step": 186399, "epoch": 4438} {"train_loss": -7.2344770431518555, "global_step": 186400, "epoch": 4438} {"train_loss": -7.133440017700195, "global_step": 186401, "epoch": 4438} {"train_loss": -7.0929412841796875, "global_step": 186402, "epoch": 4438} {"train_loss": -7.131442546844482, "global_step": 186403, "epoch": 4438} {"train_loss": -7.129852294921875, "global_step": 186404, "epoch": 4438} {"train_loss": -6.968578815460205, "global_step": 186405, "epoch": 4438} {"train_loss": -7.104567527770996, "global_step": 186406, "epoch": 4438} {"train_loss": -7.112417221069336, "global_step": 186407, "epoch": 4438} {"train_loss": -6.794851303100586, "global_step": 186408, "epoch": 4438} {"train_loss": -6.914235591888428, "global_step": 186409, "epoch": 4438} {"train_loss": -6.988702774047852, "global_step": 186410, "epoch": 4438} {"train_loss": -6.756687164306641, "global_step": 186411, "epoch": 4438} {"train_loss": -7.022810935974121, "global_step": 186412, "epoch": 4438} {"train_loss": -6.905613899230957, "global_step": 186413, "epoch": 4438} {"train_loss": -7.012170791625977, "global_step": 186414, "epoch": 4438} {"train_loss": -6.884418487548828, "global_step": 186415, "epoch": 4438} {"train_loss": -6.9786295890808105, "global_step": 186416, "epoch": 4438} {"train_loss": -6.953882217407227, "global_step": 186417, "epoch": 4438} {"train_loss": -7.157902240753174, "global_step": 186418, "epoch": 4438} {"train_loss": -6.762062072753906, "global_step": 186419, "epoch": 4438} {"train_loss": -7.0057373046875, "global_step": 186420, "epoch": 4438} {"train_loss": -6.983192443847656, "global_step": 186421, "epoch": 4438} {"train_loss": -6.99567985534668, "global_step": 186422, "epoch": 4438} {"train_loss": -7.063946723937988, "global_step": 186423, "epoch": 4438} {"train_loss": -7.101230144500732, "global_step": 186424, "epoch": 4438} {"train_loss": -6.947818756103516, "global_step": 186425, "epoch": 4438} {"train_loss": -7.052496433258057, "global_step": 186426, "epoch": 4438} {"train_loss": -6.951593399047852, "global_step": 186427, "epoch": 4438} {"train_loss": -7.098198890686035, "global_step": 186428, "epoch": 4438} {"train_loss": -7.110082626342773, "global_step": 186429, "epoch": 4438} {"train_loss": -7.051752090454102, "global_step": 186430, "epoch": 4438} {"train_loss": -6.982053756713867, "global_step": 186431, "epoch": 4438} {"train_loss": -7.064245223999023, "global_step": 186432, "epoch": 4438} {"train_loss": -7.032066345214844, "global_step": 186433, "epoch": 4438} {"train_loss": -7.070649147033691, "global_step": 186434, "epoch": 4438} {"train_loss": -7.081879138946533, "global_step": 186435, "epoch": 4438} {"train_loss": -7.044764041900635, "global_step": 186436, "epoch": 4438} {"train_loss": -7.035090321586246, "global_step": 186437, "epoch": 4438, "val_loss": 68870.5546875} {"train_loss": -7.083765029907227, "global_step": 186438, "epoch": 4439} {"train_loss": -7.070371627807617, "global_step": 186439, "epoch": 4439} {"train_loss": -7.06417989730835, "global_step": 186440, "epoch": 4439} {"train_loss": -7.068049430847168, "global_step": 186441, "epoch": 4439} {"train_loss": -6.976726531982422, "global_step": 186442, "epoch": 4439} {"train_loss": -7.195891380310059, "global_step": 186443, "epoch": 4439} {"train_loss": -6.937039852142334, "global_step": 186444, "epoch": 4439} {"train_loss": -6.850918292999268, "global_step": 186445, "epoch": 4439} {"train_loss": -7.221224784851074, "global_step": 186446, "epoch": 4439} {"train_loss": -6.864563941955566, "global_step": 186447, "epoch": 4439} {"train_loss": -7.039029121398926, "global_step": 186448, "epoch": 4439} {"train_loss": -6.920637607574463, "global_step": 186449, "epoch": 4439} {"train_loss": -7.07540225982666, "global_step": 186450, "epoch": 4439} {"train_loss": -7.052783489227295, "global_step": 186451, "epoch": 4439} {"train_loss": -6.916672706604004, "global_step": 186452, "epoch": 4439} {"train_loss": -7.030013084411621, "global_step": 186453, "epoch": 4439} {"train_loss": -6.95365571975708, "global_step": 186454, "epoch": 4439} {"train_loss": -7.13594388961792, "global_step": 186455, "epoch": 4439} {"train_loss": -6.970064640045166, "global_step": 186456, "epoch": 4439} {"train_loss": -6.9912614822387695, "global_step": 186457, "epoch": 4439} {"train_loss": -7.061003684997559, "global_step": 186458, "epoch": 4439} {"train_loss": -7.143017292022705, "global_step": 186459, "epoch": 4439} {"train_loss": -7.0152058601379395, "global_step": 186460, "epoch": 4439} {"train_loss": -6.833690166473389, "global_step": 186461, "epoch": 4439} {"train_loss": -6.965892791748047, "global_step": 186462, "epoch": 4439} {"train_loss": -7.009897232055664, "global_step": 186463, "epoch": 4439} {"train_loss": -6.9553632736206055, "global_step": 186464, "epoch": 4439} {"train_loss": -7.041278839111328, "global_step": 186465, "epoch": 4439} {"train_loss": -6.944969177246094, "global_step": 186466, "epoch": 4439} {"train_loss": -7.021450996398926, "global_step": 186467, "epoch": 4439} {"train_loss": -7.019420623779297, "global_step": 186468, "epoch": 4439} {"train_loss": -7.17210054397583, "global_step": 186469, "epoch": 4439} {"train_loss": -7.051636695861816, "global_step": 186470, "epoch": 4439} {"train_loss": -7.1368231773376465, "global_step": 186471, "epoch": 4439} {"train_loss": -7.035128593444824, "global_step": 186472, "epoch": 4439} {"train_loss": -7.152124404907227, "global_step": 186473, "epoch": 4439} {"train_loss": -7.025653839111328, "global_step": 186474, "epoch": 4439} {"train_loss": -7.109922409057617, "global_step": 186475, "epoch": 4439} {"train_loss": -7.060809135437012, "global_step": 186476, "epoch": 4439} {"train_loss": -7.171581268310547, "global_step": 186477, "epoch": 4439} {"train_loss": -7.059934139251709, "global_step": 186478, "epoch": 4439} {"train_loss": -7.0350767771403, "global_step": 186479, "epoch": 4439, "val_loss": 68890.3984375} {"train_loss": -7.068526268005371, "global_step": 186480, "epoch": 4440} {"train_loss": -7.181270599365234, "global_step": 186481, "epoch": 4440} {"train_loss": -7.105406761169434, "global_step": 186482, "epoch": 4440} {"train_loss": -7.119731903076172, "global_step": 186483, "epoch": 4440} {"train_loss": -7.073101997375488, "global_step": 186484, "epoch": 4440} {"train_loss": -7.121646881103516, "global_step": 186485, "epoch": 4440} {"train_loss": -7.172675132751465, "global_step": 186486, "epoch": 4440} {"train_loss": -7.214527130126953, "global_step": 186487, "epoch": 4440} {"train_loss": -7.211204528808594, "global_step": 186488, "epoch": 4440} {"train_loss": -7.2145538330078125, "global_step": 186489, "epoch": 4440} {"train_loss": -7.074270725250244, "global_step": 186490, "epoch": 4440} {"train_loss": -7.197797775268555, "global_step": 186491, "epoch": 4440} {"train_loss": -7.075351238250732, "global_step": 186492, "epoch": 4440} {"train_loss": -7.191535472869873, "global_step": 186493, "epoch": 4440} {"train_loss": -7.244298934936523, "global_step": 186494, "epoch": 4440} {"train_loss": -7.2678351402282715, "global_step": 186495, "epoch": 4440} {"train_loss": -7.188398361206055, "global_step": 186496, "epoch": 4440} {"train_loss": -7.294832229614258, "global_step": 186497, "epoch": 4440} {"train_loss": -7.155986785888672, "global_step": 186498, "epoch": 4440} {"train_loss": -7.217294692993164, "global_step": 186499, "epoch": 4440} {"train_loss": -7.253453254699707, "global_step": 186500, "epoch": 4440} {"train_loss": -7.1461944580078125, "global_step": 186501, "epoch": 4440} {"train_loss": -7.205296516418457, "global_step": 186502, "epoch": 4440} {"train_loss": -7.11124324798584, "global_step": 186503, "epoch": 4440} {"train_loss": -7.2176666259765625, "global_step": 186504, "epoch": 4440} {"train_loss": -7.165187835693359, "global_step": 186505, "epoch": 4440} {"train_loss": -7.1387038230896, "global_step": 186506, "epoch": 4440} {"train_loss": -7.151638031005859, "global_step": 186507, "epoch": 4440} {"train_loss": -7.1245856285095215, "global_step": 186508, "epoch": 4440} {"train_loss": -6.991219520568848, "global_step": 186509, "epoch": 4440} {"train_loss": -7.0786027908325195, "global_step": 186510, "epoch": 4440} {"train_loss": -7.223485469818115, "global_step": 186511, "epoch": 4440} {"train_loss": -7.179904460906982, "global_step": 186512, "epoch": 4440} {"train_loss": -7.070985794067383, "global_step": 186513, "epoch": 4440} {"train_loss": -7.003847599029541, "global_step": 186514, "epoch": 4440} {"train_loss": -7.115257263183594, "global_step": 186515, "epoch": 4440} {"train_loss": -7.128122329711914, "global_step": 186516, "epoch": 4440} {"train_loss": -7.146642208099365, "global_step": 186517, "epoch": 4440} {"train_loss": -7.072826385498047, "global_step": 186518, "epoch": 4440} {"train_loss": -7.171097755432129, "global_step": 186519, "epoch": 4440} {"train_loss": -7.181392669677734, "global_step": 186520, "epoch": 4440} {"train_loss": -7.153036980401902, "global_step": 186521, "epoch": 4440, "val_loss": 68634.96875} {"train_loss": -7.167239189147949, "global_step": 186522, "epoch": 4441} {"train_loss": -7.155777454376221, "global_step": 186523, "epoch": 4441} {"train_loss": -7.123593330383301, "global_step": 186524, "epoch": 4441} {"train_loss": -7.0984392166137695, "global_step": 186525, "epoch": 4441} {"train_loss": -7.220242500305176, "global_step": 186526, "epoch": 4441} {"train_loss": -7.110819339752197, "global_step": 186527, "epoch": 4441} {"train_loss": -7.093712329864502, "global_step": 186528, "epoch": 4441} {"train_loss": -7.103837013244629, "global_step": 186529, "epoch": 4441} {"train_loss": -7.093398571014404, "global_step": 186530, "epoch": 4441} {"train_loss": -7.154379844665527, "global_step": 186531, "epoch": 4441} {"train_loss": -7.0532426834106445, "global_step": 186532, "epoch": 4441} {"train_loss": -7.127093315124512, "global_step": 186533, "epoch": 4441} {"train_loss": -7.295814514160156, "global_step": 186534, "epoch": 4441} {"train_loss": -7.146523952484131, "global_step": 186535, "epoch": 4441} {"train_loss": -7.21308708190918, "global_step": 186536, "epoch": 4441} {"train_loss": -7.081675052642822, "global_step": 186537, "epoch": 4441} {"train_loss": -7.165755271911621, "global_step": 186538, "epoch": 4441} {"train_loss": -7.186197280883789, "global_step": 186539, "epoch": 4441} {"train_loss": -7.046523571014404, "global_step": 186540, "epoch": 4441} {"train_loss": -7.191478729248047, "global_step": 186541, "epoch": 4441} {"train_loss": -7.120009899139404, "global_step": 186542, "epoch": 4441} {"train_loss": -7.1540751457214355, "global_step": 186543, "epoch": 4441} {"train_loss": -7.217201232910156, "global_step": 186544, "epoch": 4441} {"train_loss": -7.163674354553223, "global_step": 186545, "epoch": 4441} {"train_loss": -7.118674278259277, "global_step": 186546, "epoch": 4441} {"train_loss": -7.037929534912109, "global_step": 186547, "epoch": 4441} {"train_loss": -7.216351509094238, "global_step": 186548, "epoch": 4441} {"train_loss": -7.009591102600098, "global_step": 186549, "epoch": 4441} {"train_loss": -6.922494411468506, "global_step": 186550, "epoch": 4441} {"train_loss": -6.838537216186523, "global_step": 186551, "epoch": 4441} {"train_loss": -7.0513811111450195, "global_step": 186552, "epoch": 4441} {"train_loss": -6.888992786407471, "global_step": 186553, "epoch": 4441} {"train_loss": -6.943951606750488, "global_step": 186554, "epoch": 4441} {"train_loss": -7.028558731079102, "global_step": 186555, "epoch": 4441} {"train_loss": -6.900670528411865, "global_step": 186556, "epoch": 4441} {"train_loss": -6.993315696716309, "global_step": 186557, "epoch": 4441} {"train_loss": -7.10980224609375, "global_step": 186558, "epoch": 4441} {"train_loss": -6.938109874725342, "global_step": 186559, "epoch": 4441} {"train_loss": -6.975774765014648, "global_step": 186560, "epoch": 4441} {"train_loss": -6.891458511352539, "global_step": 186561, "epoch": 4441} {"train_loss": -6.949389934539795, "global_step": 186562, "epoch": 4441} {"train_loss": -7.079047906966436, "global_step": 186563, "epoch": 4441, "val_loss": 69199.7578125} {"train_loss": -6.856625556945801, "global_step": 186564, "epoch": 4442} {"train_loss": -7.110215187072754, "global_step": 186565, "epoch": 4442} {"train_loss": -7.019137859344482, "global_step": 186566, "epoch": 4442} {"train_loss": -6.995484352111816, "global_step": 186567, "epoch": 4442} {"train_loss": -7.000768184661865, "global_step": 186568, "epoch": 4442} {"train_loss": -7.047855854034424, "global_step": 186569, "epoch": 4442} {"train_loss": -6.953897476196289, "global_step": 186570, "epoch": 4442} {"train_loss": -7.0851616859436035, "global_step": 186571, "epoch": 4442} {"train_loss": -6.999802589416504, "global_step": 186572, "epoch": 4442} {"train_loss": -7.187674522399902, "global_step": 186573, "epoch": 4442} {"train_loss": -7.008700847625732, "global_step": 186574, "epoch": 4442} {"train_loss": -7.049959659576416, "global_step": 186575, "epoch": 4442} {"train_loss": -6.9300336837768555, "global_step": 186576, "epoch": 4442} {"train_loss": -6.9387335777282715, "global_step": 186577, "epoch": 4442} {"train_loss": -7.0795488357543945, "global_step": 186578, "epoch": 4442} {"train_loss": -7.1107892990112305, "global_step": 186579, "epoch": 4442} {"train_loss": -7.0963568687438965, "global_step": 186580, "epoch": 4442} {"train_loss": -7.023561477661133, "global_step": 186581, "epoch": 4442} {"train_loss": -7.142441272735596, "global_step": 186582, "epoch": 4442} {"train_loss": -7.054614067077637, "global_step": 186583, "epoch": 4442} {"train_loss": -7.1638031005859375, "global_step": 186584, "epoch": 4442} {"train_loss": -7.088202953338623, "global_step": 186585, "epoch": 4442} {"train_loss": -7.151470184326172, "global_step": 186586, "epoch": 4442} {"train_loss": -7.172582149505615, "global_step": 186587, "epoch": 4442} {"train_loss": -7.001201629638672, "global_step": 186588, "epoch": 4442} {"train_loss": -7.094980239868164, "global_step": 186589, "epoch": 4442} {"train_loss": -7.128809928894043, "global_step": 186590, "epoch": 4442} {"train_loss": -7.074892520904541, "global_step": 186591, "epoch": 4442} {"train_loss": -7.163108825683594, "global_step": 186592, "epoch": 4442} {"train_loss": -7.25410795211792, "global_step": 186593, "epoch": 4442} {"train_loss": -7.276458263397217, "global_step": 186594, "epoch": 4442} {"train_loss": -7.091072082519531, "global_step": 186595, "epoch": 4442} {"train_loss": -7.055917263031006, "global_step": 186596, "epoch": 4442} {"train_loss": -7.05179500579834, "global_step": 186597, "epoch": 4442} {"train_loss": -7.068460464477539, "global_step": 186598, "epoch": 4442} {"train_loss": -7.1845221519470215, "global_step": 186599, "epoch": 4442} {"train_loss": -7.178132057189941, "global_step": 186600, "epoch": 4442} {"train_loss": -7.137045860290527, "global_step": 186601, "epoch": 4442} {"train_loss": -7.180143356323242, "global_step": 186602, "epoch": 4442} {"train_loss": -7.238161563873291, "global_step": 186603, "epoch": 4442} {"train_loss": -7.150112152099609, "global_step": 186604, "epoch": 4442} {"train_loss": -7.089827083405995, "global_step": 186605, "epoch": 4442, "val_loss": 68710.7890625} {"train_loss": -7.299633979797363, "global_step": 186606, "epoch": 4443} {"train_loss": -7.179017066955566, "global_step": 186607, "epoch": 4443} {"train_loss": -7.1842827796936035, "global_step": 186608, "epoch": 4443} {"train_loss": -7.193288803100586, "global_step": 186609, "epoch": 4443} {"train_loss": -7.1439008712768555, "global_step": 186610, "epoch": 4443} {"train_loss": -7.164700508117676, "global_step": 186611, "epoch": 4443} {"train_loss": -7.139231204986572, "global_step": 186612, "epoch": 4443} {"train_loss": -7.265571117401123, "global_step": 186613, "epoch": 4443} {"train_loss": -7.173821926116943, "global_step": 186614, "epoch": 4443} {"train_loss": -7.095824718475342, "global_step": 186615, "epoch": 4443} {"train_loss": -7.043127536773682, "global_step": 186616, "epoch": 4443} {"train_loss": -7.208310127258301, "global_step": 186617, "epoch": 4443} {"train_loss": -7.300772666931152, "global_step": 186618, "epoch": 4443} {"train_loss": -7.160916328430176, "global_step": 186619, "epoch": 4443} {"train_loss": -7.188907623291016, "global_step": 186620, "epoch": 4443} {"train_loss": -7.117674827575684, "global_step": 186621, "epoch": 4443} {"train_loss": -7.20103120803833, "global_step": 186622, "epoch": 4443} {"train_loss": -7.130066394805908, "global_step": 186623, "epoch": 4443} {"train_loss": -7.1502180099487305, "global_step": 186624, "epoch": 4443} {"train_loss": -7.192768096923828, "global_step": 186625, "epoch": 4443} {"train_loss": -7.267025947570801, "global_step": 186626, "epoch": 4443} {"train_loss": -7.1381425857543945, "global_step": 186627, "epoch": 4443} {"train_loss": -7.178053379058838, "global_step": 186628, "epoch": 4443} {"train_loss": -7.203790664672852, "global_step": 186629, "epoch": 4443} {"train_loss": -7.245046138763428, "global_step": 186630, "epoch": 4443} {"train_loss": -7.122107982635498, "global_step": 186631, "epoch": 4443} {"train_loss": -7.202549457550049, "global_step": 186632, "epoch": 4443} {"train_loss": -7.167370796203613, "global_step": 186633, "epoch": 4443} {"train_loss": -7.219046115875244, "global_step": 186634, "epoch": 4443} {"train_loss": -7.205052375793457, "global_step": 186635, "epoch": 4443} {"train_loss": -7.225506782531738, "global_step": 186636, "epoch": 4443} {"train_loss": -7.235672950744629, "global_step": 186637, "epoch": 4443} {"train_loss": -7.146564960479736, "global_step": 186638, "epoch": 4443} {"train_loss": -7.218233108520508, "global_step": 186639, "epoch": 4443} {"train_loss": -7.1528239250183105, "global_step": 186640, "epoch": 4443} {"train_loss": -7.214395999908447, "global_step": 186641, "epoch": 4443} {"train_loss": -7.294127941131592, "global_step": 186642, "epoch": 4443} {"train_loss": -7.091762065887451, "global_step": 186643, "epoch": 4443} {"train_loss": -6.97178316116333, "global_step": 186644, "epoch": 4443} {"train_loss": -7.195479393005371, "global_step": 186645, "epoch": 4443} {"train_loss": -7.137972831726074, "global_step": 186646, "epoch": 4443} {"train_loss": -7.177835294178554, "global_step": 186647, "epoch": 4443, "val_loss": 68873.9609375} {"train_loss": -7.091485023498535, "global_step": 186648, "epoch": 4444} {"train_loss": -7.080109596252441, "global_step": 186649, "epoch": 4444} {"train_loss": -7.026218414306641, "global_step": 186650, "epoch": 4444} {"train_loss": -6.984647750854492, "global_step": 186651, "epoch": 4444} {"train_loss": -6.9535393714904785, "global_step": 186652, "epoch": 4444} {"train_loss": -7.1967058181762695, "global_step": 186653, "epoch": 4444} {"train_loss": -7.10432243347168, "global_step": 186654, "epoch": 4444} {"train_loss": -7.185159683227539, "global_step": 186655, "epoch": 4444} {"train_loss": -7.074069976806641, "global_step": 186656, "epoch": 4444} {"train_loss": -6.997375011444092, "global_step": 186657, "epoch": 4444} {"train_loss": -7.18048095703125, "global_step": 186658, "epoch": 4444} {"train_loss": -7.026577949523926, "global_step": 186659, "epoch": 4444} {"train_loss": -6.899600982666016, "global_step": 186660, "epoch": 4444} {"train_loss": -7.054371356964111, "global_step": 186661, "epoch": 4444} {"train_loss": -6.939205646514893, "global_step": 186662, "epoch": 4444} {"train_loss": -7.165622234344482, "global_step": 186663, "epoch": 4444} {"train_loss": -6.898532867431641, "global_step": 186664, "epoch": 4444} {"train_loss": -7.124677658081055, "global_step": 186665, "epoch": 4444} {"train_loss": -6.966066360473633, "global_step": 186666, "epoch": 4444} {"train_loss": -7.036655426025391, "global_step": 186667, "epoch": 4444} {"train_loss": -7.002997398376465, "global_step": 186668, "epoch": 4444} {"train_loss": -6.988508701324463, "global_step": 186669, "epoch": 4444} {"train_loss": -6.983485698699951, "global_step": 186670, "epoch": 4444} {"train_loss": -7.076452732086182, "global_step": 186671, "epoch": 4444} {"train_loss": -7.144395351409912, "global_step": 186672, "epoch": 4444} {"train_loss": -7.09893274307251, "global_step": 186673, "epoch": 4444} {"train_loss": -7.136209487915039, "global_step": 186674, "epoch": 4444} {"train_loss": -7.013004779815674, "global_step": 186675, "epoch": 4444} {"train_loss": -7.064948558807373, "global_step": 186676, "epoch": 4444} {"train_loss": -7.05483341217041, "global_step": 186677, "epoch": 4444} {"train_loss": -7.090157508850098, "global_step": 186678, "epoch": 4444} {"train_loss": -7.082001209259033, "global_step": 186679, "epoch": 4444} {"train_loss": -7.017576217651367, "global_step": 186680, "epoch": 4444} {"train_loss": -6.986964702606201, "global_step": 186681, "epoch": 4444} {"train_loss": -7.137328147888184, "global_step": 186682, "epoch": 4444} {"train_loss": -6.885586738586426, "global_step": 186683, "epoch": 4444} {"train_loss": -7.206951141357422, "global_step": 186684, "epoch": 4444} {"train_loss": -7.100070953369141, "global_step": 186685, "epoch": 4444} {"train_loss": -7.051513671875, "global_step": 186686, "epoch": 4444} {"train_loss": -7.107894420623779, "global_step": 186687, "epoch": 4444} {"train_loss": -7.071752071380615, "global_step": 186688, "epoch": 4444} {"train_loss": -7.0547969454810735, "global_step": 186689, "epoch": 4444, "val_loss": 68865.765625} {"train_loss": -7.05366325378418, "global_step": 186690, "epoch": 4445} {"train_loss": -7.146659851074219, "global_step": 186691, "epoch": 4445} {"train_loss": -7.143011569976807, "global_step": 186692, "epoch": 4445} {"train_loss": -7.212212085723877, "global_step": 186693, "epoch": 4445} {"train_loss": -7.112383842468262, "global_step": 186694, "epoch": 4445} {"train_loss": -7.156802177429199, "global_step": 186695, "epoch": 4445} {"train_loss": -7.078356742858887, "global_step": 186696, "epoch": 4445} {"train_loss": -7.15084171295166, "global_step": 186697, "epoch": 4445} {"train_loss": -7.07509708404541, "global_step": 186698, "epoch": 4445} {"train_loss": -7.063515663146973, "global_step": 186699, "epoch": 4445} {"train_loss": -7.049460411071777, "global_step": 186700, "epoch": 4445} {"train_loss": -7.197445392608643, "global_step": 186701, "epoch": 4445} {"train_loss": -7.019596099853516, "global_step": 186702, "epoch": 4445} {"train_loss": -7.149607181549072, "global_step": 186703, "epoch": 4445} {"train_loss": -7.124818801879883, "global_step": 186704, "epoch": 4445} {"train_loss": -7.102696418762207, "global_step": 186705, "epoch": 4445} {"train_loss": -7.187691688537598, "global_step": 186706, "epoch": 4445} {"train_loss": -7.1111860275268555, "global_step": 186707, "epoch": 4445} {"train_loss": -7.124103546142578, "global_step": 186708, "epoch": 4445} {"train_loss": -7.134525299072266, "global_step": 186709, "epoch": 4445} {"train_loss": -7.240859031677246, "global_step": 186710, "epoch": 4445} {"train_loss": -7.1623735427856445, "global_step": 186711, "epoch": 4445} {"train_loss": -7.141846179962158, "global_step": 186712, "epoch": 4445} {"train_loss": -7.117349624633789, "global_step": 186713, "epoch": 4445} {"train_loss": -7.227964401245117, "global_step": 186714, "epoch": 4445} {"train_loss": -7.1274824142456055, "global_step": 186715, "epoch": 4445} {"train_loss": -7.054134368896484, "global_step": 186716, "epoch": 4445} {"train_loss": -7.163386344909668, "global_step": 186717, "epoch": 4445} {"train_loss": -7.124175071716309, "global_step": 186718, "epoch": 4445} {"train_loss": -7.179129600524902, "global_step": 186719, "epoch": 4445} {"train_loss": -7.155828475952148, "global_step": 186720, "epoch": 4445} {"train_loss": -7.123054504394531, "global_step": 186721, "epoch": 4445} {"train_loss": -7.06828498840332, "global_step": 186722, "epoch": 4445} {"train_loss": -7.182088851928711, "global_step": 186723, "epoch": 4445} {"train_loss": -7.091215133666992, "global_step": 186724, "epoch": 4445} {"train_loss": -7.120136260986328, "global_step": 186725, "epoch": 4445} {"train_loss": -7.1506242752075195, "global_step": 186726, "epoch": 4445} {"train_loss": -7.104467391967773, "global_step": 186727, "epoch": 4445} {"train_loss": -7.144841194152832, "global_step": 186728, "epoch": 4445} {"train_loss": -7.043510437011719, "global_step": 186729, "epoch": 4445} {"train_loss": -7.127298831939697, "global_step": 186730, "epoch": 4445} {"train_loss": -7.127012956710089, "global_step": 186731, "epoch": 4445, "val_loss": 69057.8515625} {"train_loss": -7.013725280761719, "global_step": 186732, "epoch": 4446} {"train_loss": -7.155161380767822, "global_step": 186733, "epoch": 4446} {"train_loss": -7.165886402130127, "global_step": 186734, "epoch": 4446} {"train_loss": -7.125672340393066, "global_step": 186735, "epoch": 4446} {"train_loss": -7.146047592163086, "global_step": 186736, "epoch": 4446} {"train_loss": -7.130435466766357, "global_step": 186737, "epoch": 4446} {"train_loss": -7.070629596710205, "global_step": 186738, "epoch": 4446} {"train_loss": -7.118823051452637, "global_step": 186739, "epoch": 4446} {"train_loss": -7.072761535644531, "global_step": 186740, "epoch": 4446} {"train_loss": -7.2493696212768555, "global_step": 186741, "epoch": 4446} {"train_loss": -7.042166709899902, "global_step": 186742, "epoch": 4446} {"train_loss": -7.195067405700684, "global_step": 186743, "epoch": 4446} {"train_loss": -7.116694450378418, "global_step": 186744, "epoch": 4446} {"train_loss": -7.091280937194824, "global_step": 186745, "epoch": 4446} {"train_loss": -7.112429618835449, "global_step": 186746, "epoch": 4446} {"train_loss": -7.078827857971191, "global_step": 186747, "epoch": 4446} {"train_loss": -7.078093528747559, "global_step": 186748, "epoch": 4446} {"train_loss": -7.176480293273926, "global_step": 186749, "epoch": 4446} {"train_loss": -7.161430835723877, "global_step": 186750, "epoch": 4446} {"train_loss": -7.156965732574463, "global_step": 186751, "epoch": 4446} {"train_loss": -7.233875274658203, "global_step": 186752, "epoch": 4446} {"train_loss": -7.1075849533081055, "global_step": 186753, "epoch": 4446} {"train_loss": -7.1156511306762695, "global_step": 186754, "epoch": 4446} {"train_loss": -7.169827938079834, "global_step": 186755, "epoch": 4446} {"train_loss": -7.109872341156006, "global_step": 186756, "epoch": 4446} {"train_loss": -7.180115699768066, "global_step": 186757, "epoch": 4446} {"train_loss": -7.288740634918213, "global_step": 186758, "epoch": 4446} {"train_loss": -7.1423492431640625, "global_step": 186759, "epoch": 4446} {"train_loss": -7.116111755371094, "global_step": 186760, "epoch": 4446} {"train_loss": -7.020351409912109, "global_step": 186761, "epoch": 4446} {"train_loss": -6.995561599731445, "global_step": 186762, "epoch": 4446} {"train_loss": -7.212882995605469, "global_step": 186763, "epoch": 4446} {"train_loss": -7.14698600769043, "global_step": 186764, "epoch": 4446} {"train_loss": -7.142385959625244, "global_step": 186765, "epoch": 4446} {"train_loss": -7.086361885070801, "global_step": 186766, "epoch": 4446} {"train_loss": -7.204136848449707, "global_step": 186767, "epoch": 4446} {"train_loss": -7.094003677368164, "global_step": 186768, "epoch": 4446} {"train_loss": -7.02262020111084, "global_step": 186769, "epoch": 4446} {"train_loss": -7.144775390625, "global_step": 186770, "epoch": 4446} {"train_loss": -7.1254472732543945, "global_step": 186771, "epoch": 4446} {"train_loss": -7.0289788246154785, "global_step": 186772, "epoch": 4446} {"train_loss": -7.122892686298916, "global_step": 186773, "epoch": 4446, "val_loss": 69037.2109375} {"train_loss": -7.035645484924316, "global_step": 186774, "epoch": 4447} {"train_loss": -7.126670837402344, "global_step": 186775, "epoch": 4447} {"train_loss": -7.136868476867676, "global_step": 186776, "epoch": 4447} {"train_loss": -7.122321128845215, "global_step": 186777, "epoch": 4447} {"train_loss": -7.128412246704102, "global_step": 186778, "epoch": 4447} {"train_loss": -7.133138656616211, "global_step": 186779, "epoch": 4447} {"train_loss": -7.10369873046875, "global_step": 186780, "epoch": 4447} {"train_loss": -7.0231032371521, "global_step": 186781, "epoch": 4447} {"train_loss": -7.186278343200684, "global_step": 186782, "epoch": 4447} {"train_loss": -7.073635101318359, "global_step": 186783, "epoch": 4447} {"train_loss": -7.127533912658691, "global_step": 186784, "epoch": 4447} {"train_loss": -7.098095893859863, "global_step": 186785, "epoch": 4447} {"train_loss": -7.019536972045898, "global_step": 186786, "epoch": 4447} {"train_loss": -7.129551887512207, "global_step": 186787, "epoch": 4447} {"train_loss": -7.149426460266113, "global_step": 186788, "epoch": 4447} {"train_loss": -7.148992538452148, "global_step": 186789, "epoch": 4447} {"train_loss": -7.0312042236328125, "global_step": 186790, "epoch": 4447} {"train_loss": -7.250761985778809, "global_step": 186791, "epoch": 4447} {"train_loss": -7.1452317237854, "global_step": 186792, "epoch": 4447} {"train_loss": -7.181647300720215, "global_step": 186793, "epoch": 4447} {"train_loss": -7.152958869934082, "global_step": 186794, "epoch": 4447} {"train_loss": -7.123909950256348, "global_step": 186795, "epoch": 4447} {"train_loss": -7.187601089477539, "global_step": 186796, "epoch": 4447} {"train_loss": -7.210388660430908, "global_step": 186797, "epoch": 4447} {"train_loss": -7.110546588897705, "global_step": 186798, "epoch": 4447} {"train_loss": -7.130033493041992, "global_step": 186799, "epoch": 4447} {"train_loss": -7.180994987487793, "global_step": 186800, "epoch": 4447} {"train_loss": -7.141352653503418, "global_step": 186801, "epoch": 4447} {"train_loss": -7.224441051483154, "global_step": 186802, "epoch": 4447} {"train_loss": -7.084495544433594, "global_step": 186803, "epoch": 4447} {"train_loss": -7.155004501342773, "global_step": 186804, "epoch": 4447} {"train_loss": -7.128033638000488, "global_step": 186805, "epoch": 4447} {"train_loss": -7.187283515930176, "global_step": 186806, "epoch": 4447} {"train_loss": -7.112906455993652, "global_step": 186807, "epoch": 4447} {"train_loss": -7.170376777648926, "global_step": 186808, "epoch": 4447} {"train_loss": -7.136408805847168, "global_step": 186809, "epoch": 4447} {"train_loss": -7.105070114135742, "global_step": 186810, "epoch": 4447} {"train_loss": -7.11098575592041, "global_step": 186811, "epoch": 4447} {"train_loss": -7.08518648147583, "global_step": 186812, "epoch": 4447} {"train_loss": -7.10754919052124, "global_step": 186813, "epoch": 4447} {"train_loss": -7.222201347351074, "global_step": 186814, "epoch": 4447} {"train_loss": -7.134552387964158, "global_step": 186815, "epoch": 4447, "val_loss": 68785.765625} {"train_loss": -7.181138515472412, "global_step": 186816, "epoch": 4448} {"train_loss": -7.192178726196289, "global_step": 186817, "epoch": 4448} {"train_loss": -7.151886940002441, "global_step": 186818, "epoch": 4448} {"train_loss": -7.190472602844238, "global_step": 186819, "epoch": 4448} {"train_loss": -7.156576633453369, "global_step": 186820, "epoch": 4448} {"train_loss": -7.090841293334961, "global_step": 186821, "epoch": 4448} {"train_loss": -7.008018493652344, "global_step": 186822, "epoch": 4448} {"train_loss": -7.199328422546387, "global_step": 186823, "epoch": 4448} {"train_loss": -7.154162883758545, "global_step": 186824, "epoch": 4448} {"train_loss": -7.063823699951172, "global_step": 186825, "epoch": 4448} {"train_loss": -7.146342754364014, "global_step": 186826, "epoch": 4448} {"train_loss": -7.127062797546387, "global_step": 186827, "epoch": 4448} {"train_loss": -7.052753925323486, "global_step": 186828, "epoch": 4448} {"train_loss": -7.0010666847229, "global_step": 186829, "epoch": 4448} {"train_loss": -7.1163554191589355, "global_step": 186830, "epoch": 4448} {"train_loss": -7.045777320861816, "global_step": 186831, "epoch": 4448} {"train_loss": -7.168861389160156, "global_step": 186832, "epoch": 4448} {"train_loss": -6.968186378479004, "global_step": 186833, "epoch": 4448} {"train_loss": -6.982390880584717, "global_step": 186834, "epoch": 4448} {"train_loss": -7.00236701965332, "global_step": 186835, "epoch": 4448} {"train_loss": -7.110224723815918, "global_step": 186836, "epoch": 4448} {"train_loss": -7.1742963790893555, "global_step": 186837, "epoch": 4448} {"train_loss": -7.0061163902282715, "global_step": 186838, "epoch": 4448} {"train_loss": -7.0890069007873535, "global_step": 186839, "epoch": 4448} {"train_loss": -7.09068489074707, "global_step": 186840, "epoch": 4448} {"train_loss": -6.85706901550293, "global_step": 186841, "epoch": 4448} {"train_loss": -7.191476821899414, "global_step": 186842, "epoch": 4448} {"train_loss": -7.052300453186035, "global_step": 186843, "epoch": 4448} {"train_loss": -6.9757184982299805, "global_step": 186844, "epoch": 4448} {"train_loss": -7.152341365814209, "global_step": 186845, "epoch": 4448} {"train_loss": -7.038008689880371, "global_step": 186846, "epoch": 4448} {"train_loss": -7.119032859802246, "global_step": 186847, "epoch": 4448} {"train_loss": -6.989763259887695, "global_step": 186848, "epoch": 4448} {"train_loss": -7.039863109588623, "global_step": 186849, "epoch": 4448} {"train_loss": -7.027224063873291, "global_step": 186850, "epoch": 4448} {"train_loss": -7.053827285766602, "global_step": 186851, "epoch": 4448} {"train_loss": -7.115511894226074, "global_step": 186852, "epoch": 4448} {"train_loss": -7.093568325042725, "global_step": 186853, "epoch": 4448} {"train_loss": -6.9908552169799805, "global_step": 186854, "epoch": 4448} {"train_loss": -6.954100608825684, "global_step": 186855, "epoch": 4448} {"train_loss": -6.921152591705322, "global_step": 186856, "epoch": 4448} {"train_loss": -7.070385126840501, "global_step": 186857, "epoch": 4448, "val_loss": 69110.2734375} {"train_loss": -6.8811936378479, "global_step": 186858, "epoch": 4449} {"train_loss": -6.9929423332214355, "global_step": 186859, "epoch": 4449} {"train_loss": -6.865305423736572, "global_step": 186860, "epoch": 4449} {"train_loss": -7.021920204162598, "global_step": 186861, "epoch": 4449} {"train_loss": -6.773519515991211, "global_step": 186862, "epoch": 4449} {"train_loss": -6.993348121643066, "global_step": 186863, "epoch": 4449} {"train_loss": -6.943335056304932, "global_step": 186864, "epoch": 4449} {"train_loss": -6.831707000732422, "global_step": 186865, "epoch": 4449} {"train_loss": -6.925241947174072, "global_step": 186866, "epoch": 4449} {"train_loss": -7.184269905090332, "global_step": 186867, "epoch": 4449} {"train_loss": -6.894477367401123, "global_step": 186868, "epoch": 4449} {"train_loss": -7.057833671569824, "global_step": 186869, "epoch": 4449} {"train_loss": -6.9088969230651855, "global_step": 186870, "epoch": 4449} {"train_loss": -7.055509567260742, "global_step": 186871, "epoch": 4449} {"train_loss": -7.043813705444336, "global_step": 186872, "epoch": 4449} {"train_loss": -7.017952919006348, "global_step": 186873, "epoch": 4449} {"train_loss": -7.0309906005859375, "global_step": 186874, "epoch": 4449} {"train_loss": -7.065274715423584, "global_step": 186875, "epoch": 4449} {"train_loss": -7.027261257171631, "global_step": 186876, "epoch": 4449} {"train_loss": -7.108860969543457, "global_step": 186877, "epoch": 4449} {"train_loss": -7.069108963012695, "global_step": 186878, "epoch": 4449} {"train_loss": -7.08608341217041, "global_step": 186879, "epoch": 4449} {"train_loss": -7.04150390625, "global_step": 186880, "epoch": 4449} {"train_loss": -7.187438011169434, "global_step": 186881, "epoch": 4449} {"train_loss": -7.116342544555664, "global_step": 186882, "epoch": 4449} {"train_loss": -7.115344524383545, "global_step": 186883, "epoch": 4449} {"train_loss": -7.132418155670166, "global_step": 186884, "epoch": 4449} {"train_loss": -7.197332382202148, "global_step": 186885, "epoch": 4449} {"train_loss": -7.133275985717773, "global_step": 186886, "epoch": 4449} {"train_loss": -7.184706211090088, "global_step": 186887, "epoch": 4449} {"train_loss": -7.105137825012207, "global_step": 186888, "epoch": 4449} {"train_loss": -7.078082084655762, "global_step": 186889, "epoch": 4449} {"train_loss": -7.243899822235107, "global_step": 186890, "epoch": 4449} {"train_loss": -7.111111640930176, "global_step": 186891, "epoch": 4449} {"train_loss": -7.182232856750488, "global_step": 186892, "epoch": 4449} {"train_loss": -7.066679000854492, "global_step": 186893, "epoch": 4449} {"train_loss": -7.218235969543457, "global_step": 186894, "epoch": 4449} {"train_loss": -7.230137825012207, "global_step": 186895, "epoch": 4449} {"train_loss": -7.068921089172363, "global_step": 186896, "epoch": 4449} {"train_loss": -7.1289496421813965, "global_step": 186897, "epoch": 4449} {"train_loss": -7.138189792633057, "global_step": 186898, "epoch": 4449} {"train_loss": -7.062317382721674, "global_step": 186899, "epoch": 4449, "val_loss": 68782.671875} {"train_loss": -7.250397205352783, "global_step": 186900, "epoch": 4450} {"train_loss": -7.166940689086914, "global_step": 186901, "epoch": 4450} {"train_loss": -7.177334785461426, "global_step": 186902, "epoch": 4450} {"train_loss": -7.173605918884277, "global_step": 186903, "epoch": 4450} {"train_loss": -7.174149036407471, "global_step": 186904, "epoch": 4450} {"train_loss": -7.1281328201293945, "global_step": 186905, "epoch": 4450} {"train_loss": -7.130793571472168, "global_step": 186906, "epoch": 4450} {"train_loss": -7.125200271606445, "global_step": 186907, "epoch": 4450} {"train_loss": -7.199594020843506, "global_step": 186908, "epoch": 4450} {"train_loss": -7.193227767944336, "global_step": 186909, "epoch": 4450} {"train_loss": -7.195327281951904, "global_step": 186910, "epoch": 4450} {"train_loss": -7.1245808601379395, "global_step": 186911, "epoch": 4450} {"train_loss": -7.129644393920898, "global_step": 186912, "epoch": 4450} {"train_loss": -7.115171909332275, "global_step": 186913, "epoch": 4450} {"train_loss": -7.1656646728515625, "global_step": 186914, "epoch": 4450} {"train_loss": -7.071322441101074, "global_step": 186915, "epoch": 4450} {"train_loss": -7.135498523712158, "global_step": 186916, "epoch": 4450} {"train_loss": -7.050036430358887, "global_step": 186917, "epoch": 4450} {"train_loss": -7.178279399871826, "global_step": 186918, "epoch": 4450} {"train_loss": -7.1496500968933105, "global_step": 186919, "epoch": 4450} {"train_loss": -7.200018882751465, "global_step": 186920, "epoch": 4450} {"train_loss": -7.065227031707764, "global_step": 186921, "epoch": 4450} {"train_loss": -7.185596466064453, "global_step": 186922, "epoch": 4450} {"train_loss": -7.229964256286621, "global_step": 186923, "epoch": 4450} {"train_loss": -7.179718494415283, "global_step": 186924, "epoch": 4450} {"train_loss": -7.219951629638672, "global_step": 186925, "epoch": 4450} {"train_loss": -7.268902778625488, "global_step": 186926, "epoch": 4450} {"train_loss": -7.159987449645996, "global_step": 186927, "epoch": 4450} {"train_loss": -7.246825218200684, "global_step": 186928, "epoch": 4450} {"train_loss": -7.150503158569336, "global_step": 186929, "epoch": 4450} {"train_loss": -7.096369743347168, "global_step": 186930, "epoch": 4450} {"train_loss": -7.180461883544922, "global_step": 186931, "epoch": 4450} {"train_loss": -7.164710998535156, "global_step": 186932, "epoch": 4450} {"train_loss": -7.213110446929932, "global_step": 186933, "epoch": 4450} {"train_loss": -7.117692947387695, "global_step": 186934, "epoch": 4450} {"train_loss": -7.210524559020996, "global_step": 186935, "epoch": 4450} {"train_loss": -7.338459491729736, "global_step": 186936, "epoch": 4450} {"train_loss": -7.141698360443115, "global_step": 186937, "epoch": 4450} {"train_loss": -7.210359573364258, "global_step": 186938, "epoch": 4450} {"train_loss": -7.179498672485352, "global_step": 186939, "epoch": 4450} {"train_loss": -7.195770263671875, "global_step": 186940, "epoch": 4450} {"train_loss": -7.172856819062006, "global_step": 186941, "epoch": 4450, "train/sim_max_reward_0": 0.23952304326658924, "train/sim_max_reward_1": 0.9647904522795243, "train/sim_max_reward_2": 0.5720073517026412, "train/sim_max_reward_3": 0.13362023309862228, "train/sim_max_reward_4": 0.973707418261377, "train/sim_max_reward_5": 0.8181640091613248, "test/sim_max_reward_4400000": 0.18975712447865917, "test/sim_max_reward_4400001": 0.887368988356455, "test/sim_max_reward_4400002": 0.9325766959750303, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3096474141797891, "test/sim_max_reward_4400006": 0.937298167028407, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.2992634522731191, "test/sim_max_reward_4400009": 0.9456297957411869, "test/sim_max_reward_4400010": 0.22704543459649254, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9510440133205068, "test/sim_max_reward_4400013": 0.916991987798961, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.019606837097044565, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2719262595876141, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.18830131350369333, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.27282429028077765, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.015116855640001788, "test/sim_max_reward_4400028": 0.5149579280881655, "test/sim_max_reward_4400029": 0.8694388070236474, "test/sim_max_reward_4400030": 0.971309063542209, "test/sim_max_reward_4400031": 0.9350072689694039, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8989158740732203, "test/sim_max_reward_4400034": 0.9358506453258773, "test/sim_max_reward_4400035": 0.4383031471120087, "test/sim_max_reward_4400036": 0.3937674642811309, "test/sim_max_reward_4400037": 0.9527227135499424, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.8828202987169841, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6550025809778629, "test/sim_max_reward_4400042": 0.8655612371993033, "test/sim_max_reward_4400043": 0.967736053093643, "test/sim_max_reward_4400044": 0.9285715775988086, "test/sim_max_reward_4400045": 0.985682552605107, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.979749915404766, "test/sim_max_reward_4400049": 0.999579660235201, "train/mean_score": 0.6169687512950132, "test/mean_score": 0.5817114079637183, "val_loss": 68794.0} {"train_loss": -7.298048496246338, "global_step": 186942, "epoch": 4451} {"train_loss": -7.099327564239502, "global_step": 186943, "epoch": 4451} {"train_loss": -7.301725387573242, "global_step": 186944, "epoch": 4451} {"train_loss": -7.189880847930908, "global_step": 186945, "epoch": 4451} {"train_loss": -7.204270362854004, "global_step": 186946, "epoch": 4451} {"train_loss": -7.178274154663086, "global_step": 186947, "epoch": 4451} {"train_loss": -7.158044815063477, "global_step": 186948, "epoch": 4451} {"train_loss": -7.153360366821289, "global_step": 186949, "epoch": 4451} {"train_loss": -7.209003448486328, "global_step": 186950, "epoch": 4451} {"train_loss": -7.098588943481445, "global_step": 186951, "epoch": 4451} {"train_loss": -7.201084613800049, "global_step": 186952, "epoch": 4451} {"train_loss": -7.06839656829834, "global_step": 186953, "epoch": 4451} {"train_loss": -7.011090278625488, "global_step": 186954, "epoch": 4451} {"train_loss": -7.194530010223389, "global_step": 186955, "epoch": 4451} {"train_loss": -7.074466705322266, "global_step": 186956, "epoch": 4451} {"train_loss": -7.097177982330322, "global_step": 186957, "epoch": 4451} {"train_loss": -7.121150016784668, "global_step": 186958, "epoch": 4451} {"train_loss": -7.106631278991699, "global_step": 186959, "epoch": 4451} {"train_loss": -7.179387092590332, "global_step": 186960, "epoch": 4451} {"train_loss": -7.278351306915283, "global_step": 186961, "epoch": 4451} {"train_loss": -7.127002716064453, "global_step": 186962, "epoch": 4451} {"train_loss": -7.105836391448975, "global_step": 186963, "epoch": 4451} {"train_loss": -7.072892665863037, "global_step": 186964, "epoch": 4451} {"train_loss": -7.128002166748047, "global_step": 186965, "epoch": 4451} {"train_loss": -7.178030014038086, "global_step": 186966, "epoch": 4451} {"train_loss": -7.200218200683594, "global_step": 186967, "epoch": 4451} {"train_loss": -7.132534980773926, "global_step": 186968, "epoch": 4451} {"train_loss": -7.104325771331787, "global_step": 186969, "epoch": 4451} {"train_loss": -7.1184983253479, "global_step": 186970, "epoch": 4451} {"train_loss": -7.13530158996582, "global_step": 186971, "epoch": 4451} {"train_loss": -7.123443603515625, "global_step": 186972, "epoch": 4451} {"train_loss": -7.15227746963501, "global_step": 186973, "epoch": 4451} {"train_loss": -7.0990071296691895, "global_step": 186974, "epoch": 4451} {"train_loss": -7.231593132019043, "global_step": 186975, "epoch": 4451} {"train_loss": -7.151127815246582, "global_step": 186976, "epoch": 4451} {"train_loss": -6.9787116050720215, "global_step": 186977, "epoch": 4451} {"train_loss": -7.0361833572387695, "global_step": 186978, "epoch": 4451} {"train_loss": -7.1261138916015625, "global_step": 186979, "epoch": 4451} {"train_loss": -7.036262035369873, "global_step": 186980, "epoch": 4451} {"train_loss": -7.120729446411133, "global_step": 186981, "epoch": 4451} {"train_loss": -7.026667594909668, "global_step": 186982, "epoch": 4451} {"train_loss": -7.137304044905163, "global_step": 186983, "epoch": 4451, "val_loss": 68831.59375} {"train_loss": -7.12436580657959, "global_step": 186984, "epoch": 4452} {"train_loss": -7.037091255187988, "global_step": 186985, "epoch": 4452} {"train_loss": -7.1639204025268555, "global_step": 186986, "epoch": 4452} {"train_loss": -7.123531818389893, "global_step": 186987, "epoch": 4452} {"train_loss": -7.085457801818848, "global_step": 186988, "epoch": 4452} {"train_loss": -7.10129451751709, "global_step": 186989, "epoch": 4452} {"train_loss": -6.995429992675781, "global_step": 186990, "epoch": 4452} {"train_loss": -7.000563621520996, "global_step": 186991, "epoch": 4452} {"train_loss": -7.1168107986450195, "global_step": 186992, "epoch": 4452} {"train_loss": -7.233999729156494, "global_step": 186993, "epoch": 4452} {"train_loss": -7.093172073364258, "global_step": 186994, "epoch": 4452} {"train_loss": -7.143401145935059, "global_step": 186995, "epoch": 4452} {"train_loss": -7.172740936279297, "global_step": 186996, "epoch": 4452} {"train_loss": -7.0740251541137695, "global_step": 186997, "epoch": 4452} {"train_loss": -7.221858978271484, "global_step": 186998, "epoch": 4452} {"train_loss": -7.140796661376953, "global_step": 186999, "epoch": 4452} {"train_loss": -7.134213924407959, "global_step": 187000, "epoch": 4452} {"train_loss": -7.1371636390686035, "global_step": 187001, "epoch": 4452} {"train_loss": -7.012362957000732, "global_step": 187002, "epoch": 4452} {"train_loss": -7.167949676513672, "global_step": 187003, "epoch": 4452} {"train_loss": -7.106606483459473, "global_step": 187004, "epoch": 4452} {"train_loss": -7.023070335388184, "global_step": 187005, "epoch": 4452} {"train_loss": -7.030405044555664, "global_step": 187006, "epoch": 4452} {"train_loss": -7.136792182922363, "global_step": 187007, "epoch": 4452} {"train_loss": -7.15096378326416, "global_step": 187008, "epoch": 4452} {"train_loss": -7.182254314422607, "global_step": 187009, "epoch": 4452} {"train_loss": -7.140266418457031, "global_step": 187010, "epoch": 4452} {"train_loss": -7.157541275024414, "global_step": 187011, "epoch": 4452} {"train_loss": -7.199895858764648, "global_step": 187012, "epoch": 4452} {"train_loss": -7.177955150604248, "global_step": 187013, "epoch": 4452} {"train_loss": -7.227778434753418, "global_step": 187014, "epoch": 4452} {"train_loss": -7.12589168548584, "global_step": 187015, "epoch": 4452} {"train_loss": -7.149582862854004, "global_step": 187016, "epoch": 4452} {"train_loss": -7.1934943199157715, "global_step": 187017, "epoch": 4452} {"train_loss": -7.258059501647949, "global_step": 187018, "epoch": 4452} {"train_loss": -7.123230457305908, "global_step": 187019, "epoch": 4452} {"train_loss": -7.193065166473389, "global_step": 187020, "epoch": 4452} {"train_loss": -7.036853790283203, "global_step": 187021, "epoch": 4452} {"train_loss": -7.135500907897949, "global_step": 187022, "epoch": 4452} {"train_loss": -7.166254997253418, "global_step": 187023, "epoch": 4452} {"train_loss": -7.097695350646973, "global_step": 187024, "epoch": 4452} {"train_loss": -7.129432632809594, "global_step": 187025, "epoch": 4452, "val_loss": 68832.53125} {"train_loss": -7.039619445800781, "global_step": 187026, "epoch": 4453} {"train_loss": -7.198962688446045, "global_step": 187027, "epoch": 4453} {"train_loss": -7.116872787475586, "global_step": 187028, "epoch": 4453} {"train_loss": -7.09378719329834, "global_step": 187029, "epoch": 4453} {"train_loss": -6.994081497192383, "global_step": 187030, "epoch": 4453} {"train_loss": -7.138936996459961, "global_step": 187031, "epoch": 4453} {"train_loss": -7.021385192871094, "global_step": 187032, "epoch": 4453} {"train_loss": -7.161816596984863, "global_step": 187033, "epoch": 4453} {"train_loss": -7.025134086608887, "global_step": 187034, "epoch": 4453} {"train_loss": -7.153970718383789, "global_step": 187035, "epoch": 4453} {"train_loss": -7.1964592933654785, "global_step": 187036, "epoch": 4453} {"train_loss": -7.130823135375977, "global_step": 187037, "epoch": 4453} {"train_loss": -7.126532077789307, "global_step": 187038, "epoch": 4453} {"train_loss": -7.168692111968994, "global_step": 187039, "epoch": 4453} {"train_loss": -7.156155586242676, "global_step": 187040, "epoch": 4453} {"train_loss": -7.094237327575684, "global_step": 187041, "epoch": 4453} {"train_loss": -6.994758605957031, "global_step": 187042, "epoch": 4453} {"train_loss": -7.1007843017578125, "global_step": 187043, "epoch": 4453} {"train_loss": -6.938144683837891, "global_step": 187044, "epoch": 4453} {"train_loss": -6.859279632568359, "global_step": 187045, "epoch": 4453} {"train_loss": -7.177063941955566, "global_step": 187046, "epoch": 4453} {"train_loss": -6.945450305938721, "global_step": 187047, "epoch": 4453} {"train_loss": -6.93254280090332, "global_step": 187048, "epoch": 4453} {"train_loss": -7.176226615905762, "global_step": 187049, "epoch": 4453} {"train_loss": -7.010010242462158, "global_step": 187050, "epoch": 4453} {"train_loss": -7.124654293060303, "global_step": 187051, "epoch": 4453} {"train_loss": -7.118227005004883, "global_step": 187052, "epoch": 4453} {"train_loss": -7.046257972717285, "global_step": 187053, "epoch": 4453} {"train_loss": -7.0558013916015625, "global_step": 187054, "epoch": 4453} {"train_loss": -7.119670867919922, "global_step": 187055, "epoch": 4453} {"train_loss": -7.012052536010742, "global_step": 187056, "epoch": 4453} {"train_loss": -7.093297958374023, "global_step": 187057, "epoch": 4453} {"train_loss": -6.981075763702393, "global_step": 187058, "epoch": 4453} {"train_loss": -7.136796951293945, "global_step": 187059, "epoch": 4453} {"train_loss": -7.149830341339111, "global_step": 187060, "epoch": 4453} {"train_loss": -6.981546401977539, "global_step": 187061, "epoch": 4453} {"train_loss": -7.032529830932617, "global_step": 187062, "epoch": 4453} {"train_loss": -7.145520210266113, "global_step": 187063, "epoch": 4453} {"train_loss": -7.13517951965332, "global_step": 187064, "epoch": 4453} {"train_loss": -7.030546188354492, "global_step": 187065, "epoch": 4453} {"train_loss": -6.974620342254639, "global_step": 187066, "epoch": 4453} {"train_loss": -7.074923924037388, "global_step": 187067, "epoch": 4453, "val_loss": 68842.234375} {"train_loss": -7.045561790466309, "global_step": 187068, "epoch": 4454} {"train_loss": -7.103081226348877, "global_step": 187069, "epoch": 4454} {"train_loss": -7.228759765625, "global_step": 187070, "epoch": 4454} {"train_loss": -7.1375861167907715, "global_step": 187071, "epoch": 4454} {"train_loss": -7.105067729949951, "global_step": 187072, "epoch": 4454} {"train_loss": -7.051772117614746, "global_step": 187073, "epoch": 4454} {"train_loss": -7.125797271728516, "global_step": 187074, "epoch": 4454} {"train_loss": -7.146220684051514, "global_step": 187075, "epoch": 4454} {"train_loss": -7.079158782958984, "global_step": 187076, "epoch": 4454} {"train_loss": -7.0685200691223145, "global_step": 187077, "epoch": 4454} {"train_loss": -7.122938632965088, "global_step": 187078, "epoch": 4454} {"train_loss": -7.181476593017578, "global_step": 187079, "epoch": 4454} {"train_loss": -7.070347785949707, "global_step": 187080, "epoch": 4454} {"train_loss": -7.105788707733154, "global_step": 187081, "epoch": 4454} {"train_loss": -7.116282939910889, "global_step": 187082, "epoch": 4454} {"train_loss": -7.120981216430664, "global_step": 187083, "epoch": 4454} {"train_loss": -7.068243026733398, "global_step": 187084, "epoch": 4454} {"train_loss": -7.129363536834717, "global_step": 187085, "epoch": 4454} {"train_loss": -7.081883907318115, "global_step": 187086, "epoch": 4454} {"train_loss": -7.192975997924805, "global_step": 187087, "epoch": 4454} {"train_loss": -7.197116851806641, "global_step": 187088, "epoch": 4454} {"train_loss": -7.02979850769043, "global_step": 187089, "epoch": 4454} {"train_loss": -7.115724086761475, "global_step": 187090, "epoch": 4454} {"train_loss": -7.1388773918151855, "global_step": 187091, "epoch": 4454} {"train_loss": -7.107669353485107, "global_step": 187092, "epoch": 4454} {"train_loss": -7.1901469230651855, "global_step": 187093, "epoch": 4454} {"train_loss": -7.041252613067627, "global_step": 187094, "epoch": 4454} {"train_loss": -7.149202823638916, "global_step": 187095, "epoch": 4454} {"train_loss": -7.111263275146484, "global_step": 187096, "epoch": 4454} {"train_loss": -7.1117353439331055, "global_step": 187097, "epoch": 4454} {"train_loss": -7.203064918518066, "global_step": 187098, "epoch": 4454} {"train_loss": -7.217747211456299, "global_step": 187099, "epoch": 4454} {"train_loss": -7.194397926330566, "global_step": 187100, "epoch": 4454} {"train_loss": -7.157455921173096, "global_step": 187101, "epoch": 4454} {"train_loss": -7.03633975982666, "global_step": 187102, "epoch": 4454} {"train_loss": -7.083460807800293, "global_step": 187103, "epoch": 4454} {"train_loss": -7.121138572692871, "global_step": 187104, "epoch": 4454} {"train_loss": -7.127681255340576, "global_step": 187105, "epoch": 4454} {"train_loss": -7.126420021057129, "global_step": 187106, "epoch": 4454} {"train_loss": -6.990650653839111, "global_step": 187107, "epoch": 4454} {"train_loss": -7.088237285614014, "global_step": 187108, "epoch": 4454} {"train_loss": -7.117581253960019, "global_step": 187109, "epoch": 4454, "val_loss": 68948.6796875} {"train_loss": -7.148863315582275, "global_step": 187110, "epoch": 4455} {"train_loss": -7.214728355407715, "global_step": 187111, "epoch": 4455} {"train_loss": -7.019522666931152, "global_step": 187112, "epoch": 4455} {"train_loss": -7.068739414215088, "global_step": 187113, "epoch": 4455} {"train_loss": -7.12410831451416, "global_step": 187114, "epoch": 4455} {"train_loss": -7.183472633361816, "global_step": 187115, "epoch": 4455} {"train_loss": -7.30872917175293, "global_step": 187116, "epoch": 4455} {"train_loss": -7.143820762634277, "global_step": 187117, "epoch": 4455} {"train_loss": -7.126528739929199, "global_step": 187118, "epoch": 4455} {"train_loss": -7.16398811340332, "global_step": 187119, "epoch": 4455} {"train_loss": -7.140999794006348, "global_step": 187120, "epoch": 4455} {"train_loss": -7.206155776977539, "global_step": 187121, "epoch": 4455} {"train_loss": -7.062945365905762, "global_step": 187122, "epoch": 4455} {"train_loss": -7.091217041015625, "global_step": 187123, "epoch": 4455} {"train_loss": -7.0191779136657715, "global_step": 187124, "epoch": 4455} {"train_loss": -7.182811737060547, "global_step": 187125, "epoch": 4455} {"train_loss": -7.011812210083008, "global_step": 187126, "epoch": 4455} {"train_loss": -7.10217809677124, "global_step": 187127, "epoch": 4455} {"train_loss": -7.155447006225586, "global_step": 187128, "epoch": 4455} {"train_loss": -7.1057233810424805, "global_step": 187129, "epoch": 4455} {"train_loss": -7.047369003295898, "global_step": 187130, "epoch": 4455} {"train_loss": -7.138547897338867, "global_step": 187131, "epoch": 4455} {"train_loss": -7.073952674865723, "global_step": 187132, "epoch": 4455} {"train_loss": -7.085833549499512, "global_step": 187133, "epoch": 4455} {"train_loss": -7.111579418182373, "global_step": 187134, "epoch": 4455} {"train_loss": -7.129933834075928, "global_step": 187135, "epoch": 4455} {"train_loss": -7.094801902770996, "global_step": 187136, "epoch": 4455} {"train_loss": -7.134302139282227, "global_step": 187137, "epoch": 4455} {"train_loss": -7.078487396240234, "global_step": 187138, "epoch": 4455} {"train_loss": -7.094161033630371, "global_step": 187139, "epoch": 4455} {"train_loss": -7.058919906616211, "global_step": 187140, "epoch": 4455} {"train_loss": -7.018502235412598, "global_step": 187141, "epoch": 4455} {"train_loss": -7.1018877029418945, "global_step": 187142, "epoch": 4455} {"train_loss": -7.034238815307617, "global_step": 187143, "epoch": 4455} {"train_loss": -7.060227870941162, "global_step": 187144, "epoch": 4455} {"train_loss": -7.0947160720825195, "global_step": 187145, "epoch": 4455} {"train_loss": -7.052254676818848, "global_step": 187146, "epoch": 4455} {"train_loss": -7.119481086730957, "global_step": 187147, "epoch": 4455} {"train_loss": -7.143256187438965, "global_step": 187148, "epoch": 4455} {"train_loss": -7.1747050285339355, "global_step": 187149, "epoch": 4455} {"train_loss": -7.15299129486084, "global_step": 187150, "epoch": 4455} {"train_loss": -7.108265309106736, "global_step": 187151, "epoch": 4455, "val_loss": 68959.765625} {"train_loss": -7.091652870178223, "global_step": 187152, "epoch": 4456} {"train_loss": -7.138961315155029, "global_step": 187153, "epoch": 4456} {"train_loss": -7.041386127471924, "global_step": 187154, "epoch": 4456} {"train_loss": -6.999567985534668, "global_step": 187155, "epoch": 4456} {"train_loss": -7.136688709259033, "global_step": 187156, "epoch": 4456} {"train_loss": -7.072796821594238, "global_step": 187157, "epoch": 4456} {"train_loss": -7.1480207443237305, "global_step": 187158, "epoch": 4456} {"train_loss": -6.994537353515625, "global_step": 187159, "epoch": 4456} {"train_loss": -6.901930809020996, "global_step": 187160, "epoch": 4456} {"train_loss": -7.151576995849609, "global_step": 187161, "epoch": 4456} {"train_loss": -7.028548240661621, "global_step": 187162, "epoch": 4456} {"train_loss": -7.0403523445129395, "global_step": 187163, "epoch": 4456} {"train_loss": -6.96345853805542, "global_step": 187164, "epoch": 4456} {"train_loss": -6.889492988586426, "global_step": 187165, "epoch": 4456} {"train_loss": -7.11576509475708, "global_step": 187166, "epoch": 4456} {"train_loss": -6.845969200134277, "global_step": 187167, "epoch": 4456} {"train_loss": -7.047534942626953, "global_step": 187168, "epoch": 4456} {"train_loss": -7.141059875488281, "global_step": 187169, "epoch": 4456} {"train_loss": -7.007347106933594, "global_step": 187170, "epoch": 4456} {"train_loss": -7.025820732116699, "global_step": 187171, "epoch": 4456} {"train_loss": -6.9935503005981445, "global_step": 187172, "epoch": 4456} {"train_loss": -7.0565948486328125, "global_step": 187173, "epoch": 4456} {"train_loss": -7.046020030975342, "global_step": 187174, "epoch": 4456} {"train_loss": -7.068762302398682, "global_step": 187175, "epoch": 4456} {"train_loss": -7.11424446105957, "global_step": 187176, "epoch": 4456} {"train_loss": -7.1847076416015625, "global_step": 187177, "epoch": 4456} {"train_loss": -7.052650451660156, "global_step": 187178, "epoch": 4456} {"train_loss": -7.174335479736328, "global_step": 187179, "epoch": 4456} {"train_loss": -7.090602397918701, "global_step": 187180, "epoch": 4456} {"train_loss": -7.137757301330566, "global_step": 187181, "epoch": 4456} {"train_loss": -7.057003498077393, "global_step": 187182, "epoch": 4456} {"train_loss": -7.118475437164307, "global_step": 187183, "epoch": 4456} {"train_loss": -7.215724945068359, "global_step": 187184, "epoch": 4456} {"train_loss": -7.0467681884765625, "global_step": 187185, "epoch": 4456} {"train_loss": -7.129888534545898, "global_step": 187186, "epoch": 4456} {"train_loss": -7.178787708282471, "global_step": 187187, "epoch": 4456} {"train_loss": -7.208199501037598, "global_step": 187188, "epoch": 4456} {"train_loss": -7.136492729187012, "global_step": 187189, "epoch": 4456} {"train_loss": -7.087894439697266, "global_step": 187190, "epoch": 4456} {"train_loss": -7.126225471496582, "global_step": 187191, "epoch": 4456} {"train_loss": -7.107738971710205, "global_step": 187192, "epoch": 4456} {"train_loss": -7.076313836233957, "global_step": 187193, "epoch": 4456, "val_loss": 68834.8671875} {"train_loss": -7.183568954467773, "global_step": 187194, "epoch": 4457} {"train_loss": -7.208738327026367, "global_step": 187195, "epoch": 4457} {"train_loss": -7.1276774406433105, "global_step": 187196, "epoch": 4457} {"train_loss": -7.102724075317383, "global_step": 187197, "epoch": 4457} {"train_loss": -7.10664176940918, "global_step": 187198, "epoch": 4457} {"train_loss": -7.020312309265137, "global_step": 187199, "epoch": 4457} {"train_loss": -7.108275413513184, "global_step": 187200, "epoch": 4457} {"train_loss": -7.216596603393555, "global_step": 187201, "epoch": 4457} {"train_loss": -7.238643646240234, "global_step": 187202, "epoch": 4457} {"train_loss": -7.046332359313965, "global_step": 187203, "epoch": 4457} {"train_loss": -7.110030651092529, "global_step": 187204, "epoch": 4457} {"train_loss": -7.111670970916748, "global_step": 187205, "epoch": 4457} {"train_loss": -7.152513027191162, "global_step": 187206, "epoch": 4457} {"train_loss": -7.134971618652344, "global_step": 187207, "epoch": 4457} {"train_loss": -7.1790618896484375, "global_step": 187208, "epoch": 4457} {"train_loss": -7.042511940002441, "global_step": 187209, "epoch": 4457} {"train_loss": -7.293544292449951, "global_step": 187210, "epoch": 4457} {"train_loss": -7.221468448638916, "global_step": 187211, "epoch": 4457} {"train_loss": -7.066139221191406, "global_step": 187212, "epoch": 4457} {"train_loss": -7.191217422485352, "global_step": 187213, "epoch": 4457} {"train_loss": -7.1773295402526855, "global_step": 187214, "epoch": 4457} {"train_loss": -7.261544227600098, "global_step": 187215, "epoch": 4457} {"train_loss": -7.117380619049072, "global_step": 187216, "epoch": 4457} {"train_loss": -7.156117916107178, "global_step": 187217, "epoch": 4457} {"train_loss": -7.166640758514404, "global_step": 187218, "epoch": 4457} {"train_loss": -7.304276466369629, "global_step": 187219, "epoch": 4457} {"train_loss": -7.156073570251465, "global_step": 187220, "epoch": 4457} {"train_loss": -7.2765302658081055, "global_step": 187221, "epoch": 4457} {"train_loss": -7.115631103515625, "global_step": 187222, "epoch": 4457} {"train_loss": -7.164497375488281, "global_step": 187223, "epoch": 4457} {"train_loss": -7.190298080444336, "global_step": 187224, "epoch": 4457} {"train_loss": -7.189672470092773, "global_step": 187225, "epoch": 4457} {"train_loss": -7.158058166503906, "global_step": 187226, "epoch": 4457} {"train_loss": -7.21469259262085, "global_step": 187227, "epoch": 4457} {"train_loss": -7.202043056488037, "global_step": 187228, "epoch": 4457} {"train_loss": -7.07973575592041, "global_step": 187229, "epoch": 4457} {"train_loss": -7.100847244262695, "global_step": 187230, "epoch": 4457} {"train_loss": -7.28999137878418, "global_step": 187231, "epoch": 4457} {"train_loss": -7.206623554229736, "global_step": 187232, "epoch": 4457} {"train_loss": -7.084000587463379, "global_step": 187233, "epoch": 4457} {"train_loss": -7.173738479614258, "global_step": 187234, "epoch": 4457} {"train_loss": -7.163041705176944, "global_step": 187235, "epoch": 4457, "val_loss": 68929.7109375} {"train_loss": -7.172397613525391, "global_step": 187236, "epoch": 4458} {"train_loss": -7.171175003051758, "global_step": 187237, "epoch": 4458} {"train_loss": -7.047000885009766, "global_step": 187238, "epoch": 4458} {"train_loss": -7.130305290222168, "global_step": 187239, "epoch": 4458} {"train_loss": -7.042551040649414, "global_step": 187240, "epoch": 4458} {"train_loss": -7.088827133178711, "global_step": 187241, "epoch": 4458} {"train_loss": -7.155060768127441, "global_step": 187242, "epoch": 4458} {"train_loss": -6.986743450164795, "global_step": 187243, "epoch": 4458} {"train_loss": -6.845245838165283, "global_step": 187244, "epoch": 4458} {"train_loss": -7.071271896362305, "global_step": 187245, "epoch": 4458} {"train_loss": -7.105140209197998, "global_step": 187246, "epoch": 4458} {"train_loss": -7.061375617980957, "global_step": 187247, "epoch": 4458} {"train_loss": -7.155864715576172, "global_step": 187248, "epoch": 4458} {"train_loss": -7.06456184387207, "global_step": 187249, "epoch": 4458} {"train_loss": -7.1341962814331055, "global_step": 187250, "epoch": 4458} {"train_loss": -6.879471778869629, "global_step": 187251, "epoch": 4458} {"train_loss": -7.145179271697998, "global_step": 187252, "epoch": 4458} {"train_loss": -7.076780319213867, "global_step": 187253, "epoch": 4458} {"train_loss": -7.031199932098389, "global_step": 187254, "epoch": 4458} {"train_loss": -7.114979267120361, "global_step": 187255, "epoch": 4458} {"train_loss": -7.127777576446533, "global_step": 187256, "epoch": 4458} {"train_loss": -7.154593467712402, "global_step": 187257, "epoch": 4458} {"train_loss": -7.1906023025512695, "global_step": 187258, "epoch": 4458} {"train_loss": -7.028535842895508, "global_step": 187259, "epoch": 4458} {"train_loss": -7.140710830688477, "global_step": 187260, "epoch": 4458} {"train_loss": -7.1010422706604, "global_step": 187261, "epoch": 4458} {"train_loss": -7.32421875, "global_step": 187262, "epoch": 4458} {"train_loss": -7.112611770629883, "global_step": 187263, "epoch": 4458} {"train_loss": -7.179786682128906, "global_step": 187264, "epoch": 4458} {"train_loss": -7.142270088195801, "global_step": 187265, "epoch": 4458} {"train_loss": -7.214357376098633, "global_step": 187266, "epoch": 4458} {"train_loss": -7.141237735748291, "global_step": 187267, "epoch": 4458} {"train_loss": -7.074462890625, "global_step": 187268, "epoch": 4458} {"train_loss": -7.138966083526611, "global_step": 187269, "epoch": 4458} {"train_loss": -7.037936210632324, "global_step": 187270, "epoch": 4458} {"train_loss": -7.245473384857178, "global_step": 187271, "epoch": 4458} {"train_loss": -7.028225898742676, "global_step": 187272, "epoch": 4458} {"train_loss": -6.997105598449707, "global_step": 187273, "epoch": 4458} {"train_loss": -7.196727752685547, "global_step": 187274, "epoch": 4458} {"train_loss": -6.944268226623535, "global_step": 187275, "epoch": 4458} {"train_loss": -6.9063801765441895, "global_step": 187276, "epoch": 4458} {"train_loss": -7.0961146014077325, "global_step": 187277, "epoch": 4458, "val_loss": 68835.9140625} {"train_loss": -6.890645980834961, "global_step": 187278, "epoch": 4459} {"train_loss": -6.944448471069336, "global_step": 187279, "epoch": 4459} {"train_loss": -7.086198806762695, "global_step": 187280, "epoch": 4459} {"train_loss": -7.011313438415527, "global_step": 187281, "epoch": 4459} {"train_loss": -7.151914119720459, "global_step": 187282, "epoch": 4459} {"train_loss": -7.053347587585449, "global_step": 187283, "epoch": 4459} {"train_loss": -7.071249008178711, "global_step": 187284, "epoch": 4459} {"train_loss": -7.127999305725098, "global_step": 187285, "epoch": 4459} {"train_loss": -7.219991683959961, "global_step": 187286, "epoch": 4459} {"train_loss": -7.131326198577881, "global_step": 187287, "epoch": 4459} {"train_loss": -7.0771708488464355, "global_step": 187288, "epoch": 4459} {"train_loss": -7.045738220214844, "global_step": 187289, "epoch": 4459} {"train_loss": -7.081247329711914, "global_step": 187290, "epoch": 4459} {"train_loss": -7.1904215812683105, "global_step": 187291, "epoch": 4459} {"train_loss": -7.095775604248047, "global_step": 187292, "epoch": 4459} {"train_loss": -7.1757683753967285, "global_step": 187293, "epoch": 4459} {"train_loss": -7.0499372482299805, "global_step": 187294, "epoch": 4459} {"train_loss": -7.155346870422363, "global_step": 187295, "epoch": 4459} {"train_loss": -7.070771217346191, "global_step": 187296, "epoch": 4459} {"train_loss": -7.057310581207275, "global_step": 187297, "epoch": 4459} {"train_loss": -7.0915350914001465, "global_step": 187298, "epoch": 4459} {"train_loss": -7.272098541259766, "global_step": 187299, "epoch": 4459} {"train_loss": -7.156367301940918, "global_step": 187300, "epoch": 4459} {"train_loss": -7.175624847412109, "global_step": 187301, "epoch": 4459} {"train_loss": -7.096185207366943, "global_step": 187302, "epoch": 4459} {"train_loss": -7.0447893142700195, "global_step": 187303, "epoch": 4459} {"train_loss": -6.937582015991211, "global_step": 187304, "epoch": 4459} {"train_loss": -7.130135536193848, "global_step": 187305, "epoch": 4459} {"train_loss": -7.155477523803711, "global_step": 187306, "epoch": 4459} {"train_loss": -7.184352397918701, "global_step": 187307, "epoch": 4459} {"train_loss": -7.153645038604736, "global_step": 187308, "epoch": 4459} {"train_loss": -7.1275811195373535, "global_step": 187309, "epoch": 4459} {"train_loss": -7.201415061950684, "global_step": 187310, "epoch": 4459} {"train_loss": -7.117934226989746, "global_step": 187311, "epoch": 4459} {"train_loss": -7.140658378601074, "global_step": 187312, "epoch": 4459} {"train_loss": -7.136319160461426, "global_step": 187313, "epoch": 4459} {"train_loss": -7.189296245574951, "global_step": 187314, "epoch": 4459} {"train_loss": -7.045564651489258, "global_step": 187315, "epoch": 4459} {"train_loss": -7.274049758911133, "global_step": 187316, "epoch": 4459} {"train_loss": -7.104880332946777, "global_step": 187317, "epoch": 4459} {"train_loss": -7.109241962432861, "global_step": 187318, "epoch": 4459} {"train_loss": -7.114786772500901, "global_step": 187319, "epoch": 4459, "val_loss": 68847.6484375} {"train_loss": -7.123584747314453, "global_step": 187320, "epoch": 4460} {"train_loss": -7.132086277008057, "global_step": 187321, "epoch": 4460} {"train_loss": -7.075660705566406, "global_step": 187322, "epoch": 4460} {"train_loss": -7.141568660736084, "global_step": 187323, "epoch": 4460} {"train_loss": -7.250926971435547, "global_step": 187324, "epoch": 4460} {"train_loss": -7.150669097900391, "global_step": 187325, "epoch": 4460} {"train_loss": -7.19680643081665, "global_step": 187326, "epoch": 4460} {"train_loss": -7.067909240722656, "global_step": 187327, "epoch": 4460} {"train_loss": -7.0376739501953125, "global_step": 187328, "epoch": 4460} {"train_loss": -7.218334197998047, "global_step": 187329, "epoch": 4460} {"train_loss": -7.084451198577881, "global_step": 187330, "epoch": 4460} {"train_loss": -7.101383686065674, "global_step": 187331, "epoch": 4460} {"train_loss": -7.1648759841918945, "global_step": 187332, "epoch": 4460} {"train_loss": -7.1352081298828125, "global_step": 187333, "epoch": 4460} {"train_loss": -7.0910539627075195, "global_step": 187334, "epoch": 4460} {"train_loss": -6.994354248046875, "global_step": 187335, "epoch": 4460} {"train_loss": -7.198749542236328, "global_step": 187336, "epoch": 4460} {"train_loss": -7.1301679611206055, "global_step": 187337, "epoch": 4460} {"train_loss": -7.013376235961914, "global_step": 187338, "epoch": 4460} {"train_loss": -7.081666946411133, "global_step": 187339, "epoch": 4460} {"train_loss": -7.074029922485352, "global_step": 187340, "epoch": 4460} {"train_loss": -6.983001708984375, "global_step": 187341, "epoch": 4460} {"train_loss": -7.068524360656738, "global_step": 187342, "epoch": 4460} {"train_loss": -7.121588230133057, "global_step": 187343, "epoch": 4460} {"train_loss": -7.010926246643066, "global_step": 187344, "epoch": 4460} {"train_loss": -7.001802921295166, "global_step": 187345, "epoch": 4460} {"train_loss": -7.035002708435059, "global_step": 187346, "epoch": 4460} {"train_loss": -7.108019828796387, "global_step": 187347, "epoch": 4460} {"train_loss": -7.176734924316406, "global_step": 187348, "epoch": 4460} {"train_loss": -7.106011390686035, "global_step": 187349, "epoch": 4460} {"train_loss": -7.059815883636475, "global_step": 187350, "epoch": 4460} {"train_loss": -7.269595146179199, "global_step": 187351, "epoch": 4460} {"train_loss": -7.176047325134277, "global_step": 187352, "epoch": 4460} {"train_loss": -7.093469619750977, "global_step": 187353, "epoch": 4460} {"train_loss": -7.156791687011719, "global_step": 187354, "epoch": 4460} {"train_loss": -7.024587631225586, "global_step": 187355, "epoch": 4460} {"train_loss": -7.130204200744629, "global_step": 187356, "epoch": 4460} {"train_loss": -7.089165687561035, "global_step": 187357, "epoch": 4460} {"train_loss": -7.160378456115723, "global_step": 187358, "epoch": 4460} {"train_loss": -7.118324279785156, "global_step": 187359, "epoch": 4460} {"train_loss": -7.1250810623168945, "global_step": 187360, "epoch": 4460} {"train_loss": -7.111308790388561, "global_step": 187361, "epoch": 4460, "val_loss": 68964.4140625} {"train_loss": -7.121910095214844, "global_step": 187362, "epoch": 4461} {"train_loss": -7.098556995391846, "global_step": 187363, "epoch": 4461} {"train_loss": -7.14699125289917, "global_step": 187364, "epoch": 4461} {"train_loss": -7.116786003112793, "global_step": 187365, "epoch": 4461} {"train_loss": -7.222161769866943, "global_step": 187366, "epoch": 4461} {"train_loss": -7.035608291625977, "global_step": 187367, "epoch": 4461} {"train_loss": -7.114571571350098, "global_step": 187368, "epoch": 4461} {"train_loss": -7.049610137939453, "global_step": 187369, "epoch": 4461} {"train_loss": -7.130512714385986, "global_step": 187370, "epoch": 4461} {"train_loss": -7.119032859802246, "global_step": 187371, "epoch": 4461} {"train_loss": -7.212474346160889, "global_step": 187372, "epoch": 4461} {"train_loss": -7.113053798675537, "global_step": 187373, "epoch": 4461} {"train_loss": -7.012117385864258, "global_step": 187374, "epoch": 4461} {"train_loss": -7.1237030029296875, "global_step": 187375, "epoch": 4461} {"train_loss": -7.089941024780273, "global_step": 187376, "epoch": 4461} {"train_loss": -7.102574348449707, "global_step": 187377, "epoch": 4461} {"train_loss": -7.220089912414551, "global_step": 187378, "epoch": 4461} {"train_loss": -7.1041259765625, "global_step": 187379, "epoch": 4461} {"train_loss": -7.08206844329834, "global_step": 187380, "epoch": 4461} {"train_loss": -7.167270660400391, "global_step": 187381, "epoch": 4461} {"train_loss": -7.1098151206970215, "global_step": 187382, "epoch": 4461} {"train_loss": -7.135530948638916, "global_step": 187383, "epoch": 4461} {"train_loss": -7.105835914611816, "global_step": 187384, "epoch": 4461} {"train_loss": -7.149179458618164, "global_step": 187385, "epoch": 4461} {"train_loss": -7.0757222175598145, "global_step": 187386, "epoch": 4461} {"train_loss": -7.0970458984375, "global_step": 187387, "epoch": 4461} {"train_loss": -7.150809288024902, "global_step": 187388, "epoch": 4461} {"train_loss": -7.1012468338012695, "global_step": 187389, "epoch": 4461} {"train_loss": -7.052621841430664, "global_step": 187390, "epoch": 4461} {"train_loss": -7.156364440917969, "global_step": 187391, "epoch": 4461} {"train_loss": -7.107621192932129, "global_step": 187392, "epoch": 4461} {"train_loss": -7.169273376464844, "global_step": 187393, "epoch": 4461} {"train_loss": -7.166396141052246, "global_step": 187394, "epoch": 4461} {"train_loss": -6.947236061096191, "global_step": 187395, "epoch": 4461} {"train_loss": -7.043842315673828, "global_step": 187396, "epoch": 4461} {"train_loss": -7.082244873046875, "global_step": 187397, "epoch": 4461} {"train_loss": -7.1538543701171875, "global_step": 187398, "epoch": 4461} {"train_loss": -7.121525764465332, "global_step": 187399, "epoch": 4461} {"train_loss": -7.082630157470703, "global_step": 187400, "epoch": 4461} {"train_loss": -7.090791702270508, "global_step": 187401, "epoch": 4461} {"train_loss": -7.084096908569336, "global_step": 187402, "epoch": 4461} {"train_loss": -7.110060975665138, "global_step": 187403, "epoch": 4461, "val_loss": 69010.6953125} {"train_loss": -7.178976058959961, "global_step": 187404, "epoch": 4462} {"train_loss": -7.117156028747559, "global_step": 187405, "epoch": 4462} {"train_loss": -7.199342250823975, "global_step": 187406, "epoch": 4462} {"train_loss": -6.993297100067139, "global_step": 187407, "epoch": 4462} {"train_loss": -7.1268110275268555, "global_step": 187408, "epoch": 4462} {"train_loss": -7.150461196899414, "global_step": 187409, "epoch": 4462} {"train_loss": -7.135031700134277, "global_step": 187410, "epoch": 4462} {"train_loss": -7.143654823303223, "global_step": 187411, "epoch": 4462} {"train_loss": -7.118916034698486, "global_step": 187412, "epoch": 4462} {"train_loss": -7.140883445739746, "global_step": 187413, "epoch": 4462} {"train_loss": -7.0652360916137695, "global_step": 187414, "epoch": 4462} {"train_loss": -7.150208473205566, "global_step": 187415, "epoch": 4462} {"train_loss": -7.182241916656494, "global_step": 187416, "epoch": 4462} {"train_loss": -7.142584323883057, "global_step": 187417, "epoch": 4462} {"train_loss": -7.170558929443359, "global_step": 187418, "epoch": 4462} {"train_loss": -7.143949508666992, "global_step": 187419, "epoch": 4462} {"train_loss": -7.174927234649658, "global_step": 187420, "epoch": 4462} {"train_loss": -7.086952209472656, "global_step": 187421, "epoch": 4462} {"train_loss": -7.1646528244018555, "global_step": 187422, "epoch": 4462} {"train_loss": -7.100811004638672, "global_step": 187423, "epoch": 4462} {"train_loss": -7.087307929992676, "global_step": 187424, "epoch": 4462} {"train_loss": -7.159552574157715, "global_step": 187425, "epoch": 4462} {"train_loss": -7.105357646942139, "global_step": 187426, "epoch": 4462} {"train_loss": -7.109926223754883, "global_step": 187427, "epoch": 4462} {"train_loss": -7.042117118835449, "global_step": 187428, "epoch": 4462} {"train_loss": -7.160099983215332, "global_step": 187429, "epoch": 4462} {"train_loss": -7.124810218811035, "global_step": 187430, "epoch": 4462} {"train_loss": -7.005528450012207, "global_step": 187431, "epoch": 4462} {"train_loss": -7.168073654174805, "global_step": 187432, "epoch": 4462} {"train_loss": -7.138278007507324, "global_step": 187433, "epoch": 4462} {"train_loss": -7.180948257446289, "global_step": 187434, "epoch": 4462} {"train_loss": -7.033490180969238, "global_step": 187435, "epoch": 4462} {"train_loss": -7.10979700088501, "global_step": 187436, "epoch": 4462} {"train_loss": -7.015737056732178, "global_step": 187437, "epoch": 4462} {"train_loss": -7.049904823303223, "global_step": 187438, "epoch": 4462} {"train_loss": -7.258805751800537, "global_step": 187439, "epoch": 4462} {"train_loss": -7.122025489807129, "global_step": 187440, "epoch": 4462} {"train_loss": -7.13692569732666, "global_step": 187441, "epoch": 4462} {"train_loss": -7.125765800476074, "global_step": 187442, "epoch": 4462} {"train_loss": -7.10338830947876, "global_step": 187443, "epoch": 4462} {"train_loss": -7.23280143737793, "global_step": 187444, "epoch": 4462} {"train_loss": -7.126109736306327, "global_step": 187445, "epoch": 4462, "val_loss": 68780.1796875} {"train_loss": -7.194893836975098, "global_step": 187446, "epoch": 4463} {"train_loss": -7.063451766967773, "global_step": 187447, "epoch": 4463} {"train_loss": -7.117114067077637, "global_step": 187448, "epoch": 4463} {"train_loss": -7.188614845275879, "global_step": 187449, "epoch": 4463} {"train_loss": -7.157615661621094, "global_step": 187450, "epoch": 4463} {"train_loss": -7.22177267074585, "global_step": 187451, "epoch": 4463} {"train_loss": -7.256998538970947, "global_step": 187452, "epoch": 4463} {"train_loss": -7.109668731689453, "global_step": 187453, "epoch": 4463} {"train_loss": -7.141732215881348, "global_step": 187454, "epoch": 4463} {"train_loss": -7.270010948181152, "global_step": 187455, "epoch": 4463} {"train_loss": -7.2169694900512695, "global_step": 187456, "epoch": 4463} {"train_loss": -7.185062408447266, "global_step": 187457, "epoch": 4463} {"train_loss": -7.19164514541626, "global_step": 187458, "epoch": 4463} {"train_loss": -7.276622772216797, "global_step": 187459, "epoch": 4463} {"train_loss": -7.181628227233887, "global_step": 187460, "epoch": 4463} {"train_loss": -7.238251686096191, "global_step": 187461, "epoch": 4463} {"train_loss": -7.226300239562988, "global_step": 187462, "epoch": 4463} {"train_loss": -7.194746017456055, "global_step": 187463, "epoch": 4463} {"train_loss": -7.155843734741211, "global_step": 187464, "epoch": 4463} {"train_loss": -7.000157833099365, "global_step": 187465, "epoch": 4463} {"train_loss": -7.094255447387695, "global_step": 187466, "epoch": 4463} {"train_loss": -7.13609504699707, "global_step": 187467, "epoch": 4463} {"train_loss": -7.165589332580566, "global_step": 187468, "epoch": 4463} {"train_loss": -7.073637008666992, "global_step": 187469, "epoch": 4463} {"train_loss": -7.181017875671387, "global_step": 187470, "epoch": 4463} {"train_loss": -7.1323089599609375, "global_step": 187471, "epoch": 4463} {"train_loss": -7.085450172424316, "global_step": 187472, "epoch": 4463} {"train_loss": -7.200428009033203, "global_step": 187473, "epoch": 4463} {"train_loss": -7.106744766235352, "global_step": 187474, "epoch": 4463} {"train_loss": -7.122806072235107, "global_step": 187475, "epoch": 4463} {"train_loss": -7.151944160461426, "global_step": 187476, "epoch": 4463} {"train_loss": -6.991279602050781, "global_step": 187477, "epoch": 4463} {"train_loss": -7.189638137817383, "global_step": 187478, "epoch": 4463} {"train_loss": -7.0257039070129395, "global_step": 187479, "epoch": 4463} {"train_loss": -7.0483574867248535, "global_step": 187480, "epoch": 4463} {"train_loss": -7.124908447265625, "global_step": 187481, "epoch": 4463} {"train_loss": -7.089231491088867, "global_step": 187482, "epoch": 4463} {"train_loss": -7.0666704177856445, "global_step": 187483, "epoch": 4463} {"train_loss": -7.207618713378906, "global_step": 187484, "epoch": 4463} {"train_loss": -7.018853187561035, "global_step": 187485, "epoch": 4463} {"train_loss": -7.136030197143555, "global_step": 187486, "epoch": 4463} {"train_loss": -7.1417205560775034, "global_step": 187487, "epoch": 4463, "val_loss": 69027.8984375} {"train_loss": -7.138017654418945, "global_step": 187488, "epoch": 4464} {"train_loss": -7.206729888916016, "global_step": 187489, "epoch": 4464} {"train_loss": -7.070657253265381, "global_step": 187490, "epoch": 4464} {"train_loss": -7.199694633483887, "global_step": 187491, "epoch": 4464} {"train_loss": -7.04758358001709, "global_step": 187492, "epoch": 4464} {"train_loss": -7.091742515563965, "global_step": 187493, "epoch": 4464} {"train_loss": -6.9788312911987305, "global_step": 187494, "epoch": 4464} {"train_loss": -6.9938859939575195, "global_step": 187495, "epoch": 4464} {"train_loss": -7.139654636383057, "global_step": 187496, "epoch": 4464} {"train_loss": -7.081263065338135, "global_step": 187497, "epoch": 4464} {"train_loss": -7.093597888946533, "global_step": 187498, "epoch": 4464} {"train_loss": -6.966217041015625, "global_step": 187499, "epoch": 4464} {"train_loss": -6.957831382751465, "global_step": 187500, "epoch": 4464} {"train_loss": -6.963109016418457, "global_step": 187501, "epoch": 4464} {"train_loss": -6.909176826477051, "global_step": 187502, "epoch": 4464} {"train_loss": -7.088222026824951, "global_step": 187503, "epoch": 4464} {"train_loss": -6.898352146148682, "global_step": 187504, "epoch": 4464} {"train_loss": -7.120185852050781, "global_step": 187505, "epoch": 4464} {"train_loss": -7.063099384307861, "global_step": 187506, "epoch": 4464} {"train_loss": -7.210351943969727, "global_step": 187507, "epoch": 4464} {"train_loss": -7.065806865692139, "global_step": 187508, "epoch": 4464} {"train_loss": -7.128961563110352, "global_step": 187509, "epoch": 4464} {"train_loss": -7.093208312988281, "global_step": 187510, "epoch": 4464} {"train_loss": -7.073512554168701, "global_step": 187511, "epoch": 4464} {"train_loss": -7.127878189086914, "global_step": 187512, "epoch": 4464} {"train_loss": -7.094178199768066, "global_step": 187513, "epoch": 4464} {"train_loss": -7.106454849243164, "global_step": 187514, "epoch": 4464} {"train_loss": -7.061595916748047, "global_step": 187515, "epoch": 4464} {"train_loss": -7.167756080627441, "global_step": 187516, "epoch": 4464} {"train_loss": -7.081569671630859, "global_step": 187517, "epoch": 4464} {"train_loss": -7.138726234436035, "global_step": 187518, "epoch": 4464} {"train_loss": -7.16361141204834, "global_step": 187519, "epoch": 4464} {"train_loss": -7.003853797912598, "global_step": 187520, "epoch": 4464} {"train_loss": -7.1709489822387695, "global_step": 187521, "epoch": 4464} {"train_loss": -7.06074333190918, "global_step": 187522, "epoch": 4464} {"train_loss": -7.195272445678711, "global_step": 187523, "epoch": 4464} {"train_loss": -7.149537563323975, "global_step": 187524, "epoch": 4464} {"train_loss": -7.087681293487549, "global_step": 187525, "epoch": 4464} {"train_loss": -7.096843719482422, "global_step": 187526, "epoch": 4464} {"train_loss": -7.082784175872803, "global_step": 187527, "epoch": 4464} {"train_loss": -7.178788661956787, "global_step": 187528, "epoch": 4464} {"train_loss": -7.091824372609456, "global_step": 187529, "epoch": 4464, "val_loss": 68836.5390625} {"train_loss": -7.164958953857422, "global_step": 187530, "epoch": 4465} {"train_loss": -7.201261043548584, "global_step": 187531, "epoch": 4465} {"train_loss": -7.127536773681641, "global_step": 187532, "epoch": 4465} {"train_loss": -7.192865371704102, "global_step": 187533, "epoch": 4465} {"train_loss": -7.103949546813965, "global_step": 187534, "epoch": 4465} {"train_loss": -7.2106781005859375, "global_step": 187535, "epoch": 4465} {"train_loss": -7.059654235839844, "global_step": 187536, "epoch": 4465} {"train_loss": -7.106793403625488, "global_step": 187537, "epoch": 4465} {"train_loss": -7.221508026123047, "global_step": 187538, "epoch": 4465} {"train_loss": -7.16526985168457, "global_step": 187539, "epoch": 4465} {"train_loss": -7.152681350708008, "global_step": 187540, "epoch": 4465} {"train_loss": -7.1325201988220215, "global_step": 187541, "epoch": 4465} {"train_loss": -7.235824108123779, "global_step": 187542, "epoch": 4465} {"train_loss": -7.150996208190918, "global_step": 187543, "epoch": 4465} {"train_loss": -7.100492477416992, "global_step": 187544, "epoch": 4465} {"train_loss": -7.049174785614014, "global_step": 187545, "epoch": 4465} {"train_loss": -7.175041198730469, "global_step": 187546, "epoch": 4465} {"train_loss": -7.022637367248535, "global_step": 187547, "epoch": 4465} {"train_loss": -7.1315436363220215, "global_step": 187548, "epoch": 4465} {"train_loss": -7.227937698364258, "global_step": 187549, "epoch": 4465} {"train_loss": -7.081668853759766, "global_step": 187550, "epoch": 4465} {"train_loss": -7.004399299621582, "global_step": 187551, "epoch": 4465} {"train_loss": -7.158636093139648, "global_step": 187552, "epoch": 4465} {"train_loss": -7.10945987701416, "global_step": 187553, "epoch": 4465} {"train_loss": -7.091143608093262, "global_step": 187554, "epoch": 4465} {"train_loss": -7.237121105194092, "global_step": 187555, "epoch": 4465} {"train_loss": -7.193057060241699, "global_step": 187556, "epoch": 4465} {"train_loss": -7.143648147583008, "global_step": 187557, "epoch": 4465} {"train_loss": -7.234696388244629, "global_step": 187558, "epoch": 4465} {"train_loss": -7.202973365783691, "global_step": 187559, "epoch": 4465} {"train_loss": -7.224071502685547, "global_step": 187560, "epoch": 4465} {"train_loss": -7.145318031311035, "global_step": 187561, "epoch": 4465} {"train_loss": -7.231098651885986, "global_step": 187562, "epoch": 4465} {"train_loss": -7.086416244506836, "global_step": 187563, "epoch": 4465} {"train_loss": -7.183651447296143, "global_step": 187564, "epoch": 4465} {"train_loss": -7.07712984085083, "global_step": 187565, "epoch": 4465} {"train_loss": -7.281857967376709, "global_step": 187566, "epoch": 4465} {"train_loss": -7.089041709899902, "global_step": 187567, "epoch": 4465} {"train_loss": -7.135616302490234, "global_step": 187568, "epoch": 4465} {"train_loss": -7.153537273406982, "global_step": 187569, "epoch": 4465} {"train_loss": -7.191162109375, "global_step": 187570, "epoch": 4465} {"train_loss": -7.148568641571772, "global_step": 187571, "epoch": 4465, "val_loss": 68848.2109375} {"train_loss": -7.193392753601074, "global_step": 187572, "epoch": 4466} {"train_loss": -7.082050323486328, "global_step": 187573, "epoch": 4466} {"train_loss": -7.196739196777344, "global_step": 187574, "epoch": 4466} {"train_loss": -7.192058563232422, "global_step": 187575, "epoch": 4466} {"train_loss": -7.094861030578613, "global_step": 187576, "epoch": 4466} {"train_loss": -7.259085178375244, "global_step": 187577, "epoch": 4466} {"train_loss": -7.140837669372559, "global_step": 187578, "epoch": 4466} {"train_loss": -7.0559258460998535, "global_step": 187579, "epoch": 4466} {"train_loss": -7.011902809143066, "global_step": 187580, "epoch": 4466} {"train_loss": -7.1819329261779785, "global_step": 187581, "epoch": 4466} {"train_loss": -7.056195259094238, "global_step": 187582, "epoch": 4466} {"train_loss": -7.182071685791016, "global_step": 187583, "epoch": 4466} {"train_loss": -7.195263862609863, "global_step": 187584, "epoch": 4466} {"train_loss": -7.114398956298828, "global_step": 187585, "epoch": 4466} {"train_loss": -7.0096282958984375, "global_step": 187586, "epoch": 4466} {"train_loss": -7.054207801818848, "global_step": 187587, "epoch": 4466} {"train_loss": -7.170957565307617, "global_step": 187588, "epoch": 4466} {"train_loss": -7.174715995788574, "global_step": 187589, "epoch": 4466} {"train_loss": -7.088700294494629, "global_step": 187590, "epoch": 4466} {"train_loss": -7.101131439208984, "global_step": 187591, "epoch": 4466} {"train_loss": -7.001282691955566, "global_step": 187592, "epoch": 4466} {"train_loss": -7.078401565551758, "global_step": 187593, "epoch": 4466} {"train_loss": -7.117920398712158, "global_step": 187594, "epoch": 4466} {"train_loss": -7.197972297668457, "global_step": 187595, "epoch": 4466} {"train_loss": -7.189364433288574, "global_step": 187596, "epoch": 4466} {"train_loss": -6.977842330932617, "global_step": 187597, "epoch": 4466} {"train_loss": -7.044804573059082, "global_step": 187598, "epoch": 4466} {"train_loss": -7.0220537185668945, "global_step": 187599, "epoch": 4466} {"train_loss": -7.111589431762695, "global_step": 187600, "epoch": 4466} {"train_loss": -7.050037384033203, "global_step": 187601, "epoch": 4466} {"train_loss": -7.095491886138916, "global_step": 187602, "epoch": 4466} {"train_loss": -7.169923782348633, "global_step": 187603, "epoch": 4466} {"train_loss": -7.144762992858887, "global_step": 187604, "epoch": 4466} {"train_loss": -7.111688613891602, "global_step": 187605, "epoch": 4466} {"train_loss": -7.097875595092773, "global_step": 187606, "epoch": 4466} {"train_loss": -7.059009552001953, "global_step": 187607, "epoch": 4466} {"train_loss": -7.241660118103027, "global_step": 187608, "epoch": 4466} {"train_loss": -7.213827610015869, "global_step": 187609, "epoch": 4466} {"train_loss": -7.238442420959473, "global_step": 187610, "epoch": 4466} {"train_loss": -7.028928279876709, "global_step": 187611, "epoch": 4466} {"train_loss": -7.124690055847168, "global_step": 187612, "epoch": 4466} {"train_loss": -7.118043729237148, "global_step": 187613, "epoch": 4466, "val_loss": 68840.3515625} {"train_loss": -7.197751045227051, "global_step": 187614, "epoch": 4467} {"train_loss": -7.174121856689453, "global_step": 187615, "epoch": 4467} {"train_loss": -7.150721549987793, "global_step": 187616, "epoch": 4467} {"train_loss": -7.145768165588379, "global_step": 187617, "epoch": 4467} {"train_loss": -7.224260330200195, "global_step": 187618, "epoch": 4467} {"train_loss": -7.186361789703369, "global_step": 187619, "epoch": 4467} {"train_loss": -7.120746612548828, "global_step": 187620, "epoch": 4467} {"train_loss": -7.035099029541016, "global_step": 187621, "epoch": 4467} {"train_loss": -7.211684226989746, "global_step": 187622, "epoch": 4467} {"train_loss": -7.213611125946045, "global_step": 187623, "epoch": 4467} {"train_loss": -7.1843976974487305, "global_step": 187624, "epoch": 4467} {"train_loss": -7.123739242553711, "global_step": 187625, "epoch": 4467} {"train_loss": -7.162913799285889, "global_step": 187626, "epoch": 4467} {"train_loss": -7.1193108558654785, "global_step": 187627, "epoch": 4467} {"train_loss": -7.168150424957275, "global_step": 187628, "epoch": 4467} {"train_loss": -7.118566513061523, "global_step": 187629, "epoch": 4467} {"train_loss": -7.1020917892456055, "global_step": 187630, "epoch": 4467} {"train_loss": -7.1708831787109375, "global_step": 187631, "epoch": 4467} {"train_loss": -7.093297004699707, "global_step": 187632, "epoch": 4467} {"train_loss": -7.174385070800781, "global_step": 187633, "epoch": 4467} {"train_loss": -7.126461982727051, "global_step": 187634, "epoch": 4467} {"train_loss": -7.145283222198486, "global_step": 187635, "epoch": 4467} {"train_loss": -7.21466064453125, "global_step": 187636, "epoch": 4467} {"train_loss": -7.103731155395508, "global_step": 187637, "epoch": 4467} {"train_loss": -7.150980472564697, "global_step": 187638, "epoch": 4467} {"train_loss": -7.163728713989258, "global_step": 187639, "epoch": 4467} {"train_loss": -7.121448993682861, "global_step": 187640, "epoch": 4467} {"train_loss": -7.153965950012207, "global_step": 187641, "epoch": 4467} {"train_loss": -7.201838493347168, "global_step": 187642, "epoch": 4467} {"train_loss": -7.136086463928223, "global_step": 187643, "epoch": 4467} {"train_loss": -7.112607955932617, "global_step": 187644, "epoch": 4467} {"train_loss": -7.134871006011963, "global_step": 187645, "epoch": 4467} {"train_loss": -7.1161041259765625, "global_step": 187646, "epoch": 4467} {"train_loss": -7.250247001647949, "global_step": 187647, "epoch": 4467} {"train_loss": -7.035640716552734, "global_step": 187648, "epoch": 4467} {"train_loss": -7.178416728973389, "global_step": 187649, "epoch": 4467} {"train_loss": -7.231520175933838, "global_step": 187650, "epoch": 4467} {"train_loss": -7.102599143981934, "global_step": 187651, "epoch": 4467} {"train_loss": -7.054220676422119, "global_step": 187652, "epoch": 4467} {"train_loss": -7.1071038246154785, "global_step": 187653, "epoch": 4467} {"train_loss": -7.094542503356934, "global_step": 187654, "epoch": 4467} {"train_loss": -7.1446797507149835, "global_step": 187655, "epoch": 4467, "val_loss": 68789.03125} {"train_loss": -7.099717617034912, "global_step": 187656, "epoch": 4468} {"train_loss": -7.093976974487305, "global_step": 187657, "epoch": 4468} {"train_loss": -6.954693794250488, "global_step": 187658, "epoch": 4468} {"train_loss": -7.109447956085205, "global_step": 187659, "epoch": 4468} {"train_loss": -7.065431118011475, "global_step": 187660, "epoch": 4468} {"train_loss": -7.082408905029297, "global_step": 187661, "epoch": 4468} {"train_loss": -7.131134986877441, "global_step": 187662, "epoch": 4468} {"train_loss": -7.101889133453369, "global_step": 187663, "epoch": 4468} {"train_loss": -7.138217449188232, "global_step": 187664, "epoch": 4468} {"train_loss": -7.116194725036621, "global_step": 187665, "epoch": 4468} {"train_loss": -7.144720077514648, "global_step": 187666, "epoch": 4468} {"train_loss": -7.183518409729004, "global_step": 187667, "epoch": 4468} {"train_loss": -7.13059139251709, "global_step": 187668, "epoch": 4468} {"train_loss": -7.1151814460754395, "global_step": 187669, "epoch": 4468} {"train_loss": -7.014288902282715, "global_step": 187670, "epoch": 4468} {"train_loss": -6.950996398925781, "global_step": 187671, "epoch": 4468} {"train_loss": -7.168994903564453, "global_step": 187672, "epoch": 4468} {"train_loss": -6.996588230133057, "global_step": 187673, "epoch": 4468} {"train_loss": -6.989208221435547, "global_step": 187674, "epoch": 4468} {"train_loss": -7.044369697570801, "global_step": 187675, "epoch": 4468} {"train_loss": -7.064996719360352, "global_step": 187676, "epoch": 4468} {"train_loss": -7.083836555480957, "global_step": 187677, "epoch": 4468} {"train_loss": -7.035758018493652, "global_step": 187678, "epoch": 4468} {"train_loss": -7.125209331512451, "global_step": 187679, "epoch": 4468} {"train_loss": -7.069076061248779, "global_step": 187680, "epoch": 4468} {"train_loss": -7.147465705871582, "global_step": 187681, "epoch": 4468} {"train_loss": -7.006529808044434, "global_step": 187682, "epoch": 4468} {"train_loss": -7.0489678382873535, "global_step": 187683, "epoch": 4468} {"train_loss": -7.055938720703125, "global_step": 187684, "epoch": 4468} {"train_loss": -7.127537250518799, "global_step": 187685, "epoch": 4468} {"train_loss": -7.13808536529541, "global_step": 187686, "epoch": 4468} {"train_loss": -7.188674449920654, "global_step": 187687, "epoch": 4468} {"train_loss": -7.164022445678711, "global_step": 187688, "epoch": 4468} {"train_loss": -7.106616020202637, "global_step": 187689, "epoch": 4468} {"train_loss": -7.073368072509766, "global_step": 187690, "epoch": 4468} {"train_loss": -7.0727128982543945, "global_step": 187691, "epoch": 4468} {"train_loss": -7.128880977630615, "global_step": 187692, "epoch": 4468} {"train_loss": -7.040473937988281, "global_step": 187693, "epoch": 4468} {"train_loss": -7.156713485717773, "global_step": 187694, "epoch": 4468} {"train_loss": -7.1429901123046875, "global_step": 187695, "epoch": 4468} {"train_loss": -7.149918556213379, "global_step": 187696, "epoch": 4468} {"train_loss": -7.092699346088228, "global_step": 187697, "epoch": 4468, "val_loss": 68873.765625} {"train_loss": -7.129974365234375, "global_step": 187698, "epoch": 4469} {"train_loss": -7.20482063293457, "global_step": 187699, "epoch": 4469} {"train_loss": -7.15178108215332, "global_step": 187700, "epoch": 4469} {"train_loss": -7.144472122192383, "global_step": 187701, "epoch": 4469} {"train_loss": -7.103026390075684, "global_step": 187702, "epoch": 4469} {"train_loss": -7.206989288330078, "global_step": 187703, "epoch": 4469} {"train_loss": -7.314855098724365, "global_step": 187704, "epoch": 4469} {"train_loss": -7.1247334480285645, "global_step": 187705, "epoch": 4469} {"train_loss": -7.114815711975098, "global_step": 187706, "epoch": 4469} {"train_loss": -7.105169296264648, "global_step": 187707, "epoch": 4469} {"train_loss": -7.161377906799316, "global_step": 187708, "epoch": 4469} {"train_loss": -7.161590576171875, "global_step": 187709, "epoch": 4469} {"train_loss": -7.176982879638672, "global_step": 187710, "epoch": 4469} {"train_loss": -7.269667625427246, "global_step": 187711, "epoch": 4469} {"train_loss": -7.104591369628906, "global_step": 187712, "epoch": 4469} {"train_loss": -7.131802082061768, "global_step": 187713, "epoch": 4469} {"train_loss": -7.170128345489502, "global_step": 187714, "epoch": 4469} {"train_loss": -7.185804843902588, "global_step": 187715, "epoch": 4469} {"train_loss": -7.12390661239624, "global_step": 187716, "epoch": 4469} {"train_loss": -7.1189165115356445, "global_step": 187717, "epoch": 4469} {"train_loss": -7.085953235626221, "global_step": 187718, "epoch": 4469} {"train_loss": -7.175236701965332, "global_step": 187719, "epoch": 4469} {"train_loss": -7.050187110900879, "global_step": 187720, "epoch": 4469} {"train_loss": -7.109814643859863, "global_step": 187721, "epoch": 4469} {"train_loss": -7.225076198577881, "global_step": 187722, "epoch": 4469} {"train_loss": -7.122802734375, "global_step": 187723, "epoch": 4469} {"train_loss": -7.21451473236084, "global_step": 187724, "epoch": 4469} {"train_loss": -7.140439510345459, "global_step": 187725, "epoch": 4469} {"train_loss": -7.197336196899414, "global_step": 187726, "epoch": 4469} {"train_loss": -7.119854927062988, "global_step": 187727, "epoch": 4469} {"train_loss": -7.1226348876953125, "global_step": 187728, "epoch": 4469} {"train_loss": -7.117718696594238, "global_step": 187729, "epoch": 4469} {"train_loss": -7.177050590515137, "global_step": 187730, "epoch": 4469} {"train_loss": -7.156797409057617, "global_step": 187731, "epoch": 4469} {"train_loss": -7.003164291381836, "global_step": 187732, "epoch": 4469} {"train_loss": -7.263990879058838, "global_step": 187733, "epoch": 4469} {"train_loss": -7.144582748413086, "global_step": 187734, "epoch": 4469} {"train_loss": -7.141387939453125, "global_step": 187735, "epoch": 4469} {"train_loss": -6.977530479431152, "global_step": 187736, "epoch": 4469} {"train_loss": -6.984562397003174, "global_step": 187737, "epoch": 4469} {"train_loss": -7.144406318664551, "global_step": 187738, "epoch": 4469} {"train_loss": -7.141091573806036, "global_step": 187739, "epoch": 4469, "val_loss": 68978.6875} {"train_loss": -7.168413162231445, "global_step": 187740, "epoch": 4470} {"train_loss": -7.069999694824219, "global_step": 187741, "epoch": 4470} {"train_loss": -7.154025554656982, "global_step": 187742, "epoch": 4470} {"train_loss": -7.1319580078125, "global_step": 187743, "epoch": 4470} {"train_loss": -7.057488441467285, "global_step": 187744, "epoch": 4470} {"train_loss": -7.083483695983887, "global_step": 187745, "epoch": 4470} {"train_loss": -7.023443222045898, "global_step": 187746, "epoch": 4470} {"train_loss": -7.049770355224609, "global_step": 187747, "epoch": 4470} {"train_loss": -7.139887809753418, "global_step": 187748, "epoch": 4470} {"train_loss": -7.088968276977539, "global_step": 187749, "epoch": 4470} {"train_loss": -7.150747299194336, "global_step": 187750, "epoch": 4470} {"train_loss": -6.944969177246094, "global_step": 187751, "epoch": 4470} {"train_loss": -7.125017166137695, "global_step": 187752, "epoch": 4470} {"train_loss": -7.065886497497559, "global_step": 187753, "epoch": 4470} {"train_loss": -7.142128944396973, "global_step": 187754, "epoch": 4470} {"train_loss": -7.079274654388428, "global_step": 187755, "epoch": 4470} {"train_loss": -7.138441562652588, "global_step": 187756, "epoch": 4470} {"train_loss": -7.144216060638428, "global_step": 187757, "epoch": 4470} {"train_loss": -6.997512340545654, "global_step": 187758, "epoch": 4470} {"train_loss": -7.087526798248291, "global_step": 187759, "epoch": 4470} {"train_loss": -7.175198554992676, "global_step": 187760, "epoch": 4470} {"train_loss": -7.060219764709473, "global_step": 187761, "epoch": 4470} {"train_loss": -7.213690280914307, "global_step": 187762, "epoch": 4470} {"train_loss": -7.030241966247559, "global_step": 187763, "epoch": 4470} {"train_loss": -7.053800582885742, "global_step": 187764, "epoch": 4470} {"train_loss": -6.9690632820129395, "global_step": 187765, "epoch": 4470} {"train_loss": -7.127050876617432, "global_step": 187766, "epoch": 4470} {"train_loss": -7.145302772521973, "global_step": 187767, "epoch": 4470} {"train_loss": -7.052066802978516, "global_step": 187768, "epoch": 4470} {"train_loss": -7.086692810058594, "global_step": 187769, "epoch": 4470} {"train_loss": -7.198668956756592, "global_step": 187770, "epoch": 4470} {"train_loss": -7.022709369659424, "global_step": 187771, "epoch": 4470} {"train_loss": -6.957355499267578, "global_step": 187772, "epoch": 4470} {"train_loss": -7.196315765380859, "global_step": 187773, "epoch": 4470} {"train_loss": -7.097892761230469, "global_step": 187774, "epoch": 4470} {"train_loss": -7.066413879394531, "global_step": 187775, "epoch": 4470} {"train_loss": -7.226168155670166, "global_step": 187776, "epoch": 4470} {"train_loss": -7.091166019439697, "global_step": 187777, "epoch": 4470} {"train_loss": -7.153553485870361, "global_step": 187778, "epoch": 4470} {"train_loss": -7.199457168579102, "global_step": 187779, "epoch": 4470} {"train_loss": -7.123177528381348, "global_step": 187780, "epoch": 4470} {"train_loss": -7.101586080732799, "global_step": 187781, "epoch": 4470, "val_loss": 69096.609375} {"train_loss": -7.162257194519043, "global_step": 187782, "epoch": 4471} {"train_loss": -7.170733451843262, "global_step": 187783, "epoch": 4471} {"train_loss": -7.143522262573242, "global_step": 187784, "epoch": 4471} {"train_loss": -7.128950595855713, "global_step": 187785, "epoch": 4471} {"train_loss": -7.148288249969482, "global_step": 187786, "epoch": 4471} {"train_loss": -7.067615509033203, "global_step": 187787, "epoch": 4471} {"train_loss": -7.171533584594727, "global_step": 187788, "epoch": 4471} {"train_loss": -7.304089546203613, "global_step": 187789, "epoch": 4471} {"train_loss": -7.068812370300293, "global_step": 187790, "epoch": 4471} {"train_loss": -7.1150994300842285, "global_step": 187791, "epoch": 4471} {"train_loss": -7.216289043426514, "global_step": 187792, "epoch": 4471} {"train_loss": -7.185579299926758, "global_step": 187793, "epoch": 4471} {"train_loss": -7.1629133224487305, "global_step": 187794, "epoch": 4471} {"train_loss": -7.12795352935791, "global_step": 187795, "epoch": 4471} {"train_loss": -7.171800136566162, "global_step": 187796, "epoch": 4471} {"train_loss": -7.313164234161377, "global_step": 187797, "epoch": 4471} {"train_loss": -7.166518211364746, "global_step": 187798, "epoch": 4471} {"train_loss": -7.1366682052612305, "global_step": 187799, "epoch": 4471} {"train_loss": -7.154620170593262, "global_step": 187800, "epoch": 4471} {"train_loss": -7.180500030517578, "global_step": 187801, "epoch": 4471} {"train_loss": -7.213550567626953, "global_step": 187802, "epoch": 4471} {"train_loss": -7.084988594055176, "global_step": 187803, "epoch": 4471} {"train_loss": -7.080599784851074, "global_step": 187804, "epoch": 4471} {"train_loss": -7.135568141937256, "global_step": 187805, "epoch": 4471} {"train_loss": -7.188343048095703, "global_step": 187806, "epoch": 4471} {"train_loss": -7.184714317321777, "global_step": 187807, "epoch": 4471} {"train_loss": -7.141088962554932, "global_step": 187808, "epoch": 4471} {"train_loss": -7.150601863861084, "global_step": 187809, "epoch": 4471} {"train_loss": -7.1819562911987305, "global_step": 187810, "epoch": 4471} {"train_loss": -7.18846321105957, "global_step": 187811, "epoch": 4471} {"train_loss": -7.056247711181641, "global_step": 187812, "epoch": 4471} {"train_loss": -7.168452262878418, "global_step": 187813, "epoch": 4471} {"train_loss": -7.189404487609863, "global_step": 187814, "epoch": 4471} {"train_loss": -7.100136756896973, "global_step": 187815, "epoch": 4471} {"train_loss": -7.128612518310547, "global_step": 187816, "epoch": 4471} {"train_loss": -7.000566005706787, "global_step": 187817, "epoch": 4471} {"train_loss": -7.062926769256592, "global_step": 187818, "epoch": 4471} {"train_loss": -7.1362433433532715, "global_step": 187819, "epoch": 4471} {"train_loss": -7.172362804412842, "global_step": 187820, "epoch": 4471} {"train_loss": -7.071373462677002, "global_step": 187821, "epoch": 4471} {"train_loss": -7.089800834655762, "global_step": 187822, "epoch": 4471} {"train_loss": -7.145615146273658, "global_step": 187823, "epoch": 4471, "val_loss": 68798.4453125} {"train_loss": -7.047152519226074, "global_step": 187824, "epoch": 4472} {"train_loss": -7.040932655334473, "global_step": 187825, "epoch": 4472} {"train_loss": -7.159728527069092, "global_step": 187826, "epoch": 4472} {"train_loss": -7.127132415771484, "global_step": 187827, "epoch": 4472} {"train_loss": -7.120473861694336, "global_step": 187828, "epoch": 4472} {"train_loss": -7.062205791473389, "global_step": 187829, "epoch": 4472} {"train_loss": -7.003360271453857, "global_step": 187830, "epoch": 4472} {"train_loss": -7.002893924713135, "global_step": 187831, "epoch": 4472} {"train_loss": -7.027550220489502, "global_step": 187832, "epoch": 4472} {"train_loss": -6.920153617858887, "global_step": 187833, "epoch": 4472} {"train_loss": -6.985448360443115, "global_step": 187834, "epoch": 4472} {"train_loss": -7.084892749786377, "global_step": 187835, "epoch": 4472} {"train_loss": -6.8950886726379395, "global_step": 187836, "epoch": 4472} {"train_loss": -6.869874954223633, "global_step": 187837, "epoch": 4472} {"train_loss": -6.991518020629883, "global_step": 187838, "epoch": 4472} {"train_loss": -7.0163679122924805, "global_step": 187839, "epoch": 4472} {"train_loss": -7.047232627868652, "global_step": 187840, "epoch": 4472} {"train_loss": -7.04138708114624, "global_step": 187841, "epoch": 4472} {"train_loss": -7.073707580566406, "global_step": 187842, "epoch": 4472} {"train_loss": -7.104410171508789, "global_step": 187843, "epoch": 4472} {"train_loss": -7.124092102050781, "global_step": 187844, "epoch": 4472} {"train_loss": -7.11297607421875, "global_step": 187845, "epoch": 4472} {"train_loss": -7.084924221038818, "global_step": 187846, "epoch": 4472} {"train_loss": -7.045505523681641, "global_step": 187847, "epoch": 4472} {"train_loss": -7.032641410827637, "global_step": 187848, "epoch": 4472} {"train_loss": -7.113791465759277, "global_step": 187849, "epoch": 4472} {"train_loss": -7.065061569213867, "global_step": 187850, "epoch": 4472} {"train_loss": -7.056122779846191, "global_step": 187851, "epoch": 4472} {"train_loss": -7.106045722961426, "global_step": 187852, "epoch": 4472} {"train_loss": -7.08408260345459, "global_step": 187853, "epoch": 4472} {"train_loss": -6.920805931091309, "global_step": 187854, "epoch": 4472} {"train_loss": -7.104619979858398, "global_step": 187855, "epoch": 4472} {"train_loss": -6.972803115844727, "global_step": 187856, "epoch": 4472} {"train_loss": -7.180855751037598, "global_step": 187857, "epoch": 4472} {"train_loss": -7.127814769744873, "global_step": 187858, "epoch": 4472} {"train_loss": -7.137077331542969, "global_step": 187859, "epoch": 4472} {"train_loss": -7.099379062652588, "global_step": 187860, "epoch": 4472} {"train_loss": -7.211080074310303, "global_step": 187861, "epoch": 4472} {"train_loss": -7.132663249969482, "global_step": 187862, "epoch": 4472} {"train_loss": -7.114274024963379, "global_step": 187863, "epoch": 4472} {"train_loss": -7.103027820587158, "global_step": 187864, "epoch": 4472} {"train_loss": -7.061981167112078, "global_step": 187865, "epoch": 4472, "val_loss": 68889.2890625} {"train_loss": -7.05588436126709, "global_step": 187866, "epoch": 4473} {"train_loss": -7.012299060821533, "global_step": 187867, "epoch": 4473} {"train_loss": -7.007080554962158, "global_step": 187868, "epoch": 4473} {"train_loss": -6.9572601318359375, "global_step": 187869, "epoch": 4473} {"train_loss": -7.165201663970947, "global_step": 187870, "epoch": 4473} {"train_loss": -6.834822177886963, "global_step": 187871, "epoch": 4473} {"train_loss": -7.040322303771973, "global_step": 187872, "epoch": 4473} {"train_loss": -7.019284725189209, "global_step": 187873, "epoch": 4473} {"train_loss": -6.95302152633667, "global_step": 187874, "epoch": 4473} {"train_loss": -7.196217060089111, "global_step": 187875, "epoch": 4473} {"train_loss": -6.831886291503906, "global_step": 187876, "epoch": 4473} {"train_loss": -7.216042518615723, "global_step": 187877, "epoch": 4473} {"train_loss": -6.960691452026367, "global_step": 187878, "epoch": 4473} {"train_loss": -7.1559343338012695, "global_step": 187879, "epoch": 4473} {"train_loss": -6.932834625244141, "global_step": 187880, "epoch": 4473} {"train_loss": -6.872128486633301, "global_step": 187881, "epoch": 4473} {"train_loss": -7.063440322875977, "global_step": 187882, "epoch": 4473} {"train_loss": -7.169498443603516, "global_step": 187883, "epoch": 4473} {"train_loss": -7.041807174682617, "global_step": 187884, "epoch": 4473} {"train_loss": -7.270489692687988, "global_step": 187885, "epoch": 4473} {"train_loss": -7.07850456237793, "global_step": 187886, "epoch": 4473} {"train_loss": -7.0293803215026855, "global_step": 187887, "epoch": 4473} {"train_loss": -7.064056396484375, "global_step": 187888, "epoch": 4473} {"train_loss": -7.208395004272461, "global_step": 187889, "epoch": 4473} {"train_loss": -7.091787815093994, "global_step": 187890, "epoch": 4473} {"train_loss": -7.256086349487305, "global_step": 187891, "epoch": 4473} {"train_loss": -7.188148498535156, "global_step": 187892, "epoch": 4473} {"train_loss": -7.0781660079956055, "global_step": 187893, "epoch": 4473} {"train_loss": -7.3500471115112305, "global_step": 187894, "epoch": 4473} {"train_loss": -7.089364051818848, "global_step": 187895, "epoch": 4473} {"train_loss": -7.232975006103516, "global_step": 187896, "epoch": 4473} {"train_loss": -7.149723052978516, "global_step": 187897, "epoch": 4473} {"train_loss": -7.142455101013184, "global_step": 187898, "epoch": 4473} {"train_loss": -7.141268730163574, "global_step": 187899, "epoch": 4473} {"train_loss": -7.120138645172119, "global_step": 187900, "epoch": 4473} {"train_loss": -7.049511909484863, "global_step": 187901, "epoch": 4473} {"train_loss": -7.159790992736816, "global_step": 187902, "epoch": 4473} {"train_loss": -7.123525142669678, "global_step": 187903, "epoch": 4473} {"train_loss": -7.1727776527404785, "global_step": 187904, "epoch": 4473} {"train_loss": -7.206709861755371, "global_step": 187905, "epoch": 4473} {"train_loss": -7.0833516120910645, "global_step": 187906, "epoch": 4473} {"train_loss": -7.091094709578014, "global_step": 187907, "epoch": 4473, "val_loss": 69054.625} {"train_loss": -7.191272735595703, "global_step": 187908, "epoch": 4474} {"train_loss": -7.13966178894043, "global_step": 187909, "epoch": 4474} {"train_loss": -7.036484718322754, "global_step": 187910, "epoch": 4474} {"train_loss": -6.999341011047363, "global_step": 187911, "epoch": 4474} {"train_loss": -7.158337593078613, "global_step": 187912, "epoch": 4474} {"train_loss": -7.0505900382995605, "global_step": 187913, "epoch": 4474} {"train_loss": -7.170641899108887, "global_step": 187914, "epoch": 4474} {"train_loss": -7.125665187835693, "global_step": 187915, "epoch": 4474} {"train_loss": -7.100500106811523, "global_step": 187916, "epoch": 4474} {"train_loss": -7.085228443145752, "global_step": 187917, "epoch": 4474} {"train_loss": -7.175931930541992, "global_step": 187918, "epoch": 4474} {"train_loss": -7.067797660827637, "global_step": 187919, "epoch": 4474} {"train_loss": -7.067224502563477, "global_step": 187920, "epoch": 4474} {"train_loss": -7.160236358642578, "global_step": 187921, "epoch": 4474} {"train_loss": -7.215147972106934, "global_step": 187922, "epoch": 4474} {"train_loss": -7.0116682052612305, "global_step": 187923, "epoch": 4474} {"train_loss": -7.091261863708496, "global_step": 187924, "epoch": 4474} {"train_loss": -7.145864486694336, "global_step": 187925, "epoch": 4474} {"train_loss": -7.051167964935303, "global_step": 187926, "epoch": 4474} {"train_loss": -7.250009059906006, "global_step": 187927, "epoch": 4474} {"train_loss": -7.152210235595703, "global_step": 187928, "epoch": 4474} {"train_loss": -7.260225296020508, "global_step": 187929, "epoch": 4474} {"train_loss": -7.272727966308594, "global_step": 187930, "epoch": 4474} {"train_loss": -7.163900375366211, "global_step": 187931, "epoch": 4474} {"train_loss": -7.15936803817749, "global_step": 187932, "epoch": 4474} {"train_loss": -7.149756908416748, "global_step": 187933, "epoch": 4474} {"train_loss": -7.158343315124512, "global_step": 187934, "epoch": 4474} {"train_loss": -7.154333591461182, "global_step": 187935, "epoch": 4474} {"train_loss": -7.208885669708252, "global_step": 187936, "epoch": 4474} {"train_loss": -7.203351020812988, "global_step": 187937, "epoch": 4474} {"train_loss": -7.1311798095703125, "global_step": 187938, "epoch": 4474} {"train_loss": -7.226691722869873, "global_step": 187939, "epoch": 4474} {"train_loss": -7.196360111236572, "global_step": 187940, "epoch": 4474} {"train_loss": -7.187383651733398, "global_step": 187941, "epoch": 4474} {"train_loss": -7.184929847717285, "global_step": 187942, "epoch": 4474} {"train_loss": -7.1435089111328125, "global_step": 187943, "epoch": 4474} {"train_loss": -7.2270917892456055, "global_step": 187944, "epoch": 4474} {"train_loss": -7.050049781799316, "global_step": 187945, "epoch": 4474} {"train_loss": -7.014627456665039, "global_step": 187946, "epoch": 4474} {"train_loss": -7.14277458190918, "global_step": 187947, "epoch": 4474} {"train_loss": -7.117844104766846, "global_step": 187948, "epoch": 4474} {"train_loss": -7.141816684177944, "global_step": 187949, "epoch": 4474, "val_loss": 69089.859375} {"train_loss": -7.0949177742004395, "global_step": 187950, "epoch": 4475} {"train_loss": -7.142111778259277, "global_step": 187951, "epoch": 4475} {"train_loss": -6.96395206451416, "global_step": 187952, "epoch": 4475} {"train_loss": -7.183071136474609, "global_step": 187953, "epoch": 4475} {"train_loss": -7.1603922843933105, "global_step": 187954, "epoch": 4475} {"train_loss": -7.264744758605957, "global_step": 187955, "epoch": 4475} {"train_loss": -7.110495090484619, "global_step": 187956, "epoch": 4475} {"train_loss": -7.058304786682129, "global_step": 187957, "epoch": 4475} {"train_loss": -7.27309513092041, "global_step": 187958, "epoch": 4475} {"train_loss": -7.084294319152832, "global_step": 187959, "epoch": 4475} {"train_loss": -7.008930206298828, "global_step": 187960, "epoch": 4475} {"train_loss": -7.09555721282959, "global_step": 187961, "epoch": 4475} {"train_loss": -7.068540096282959, "global_step": 187962, "epoch": 4475} {"train_loss": -7.085336208343506, "global_step": 187963, "epoch": 4475} {"train_loss": -7.169474124908447, "global_step": 187964, "epoch": 4475} {"train_loss": -7.206132888793945, "global_step": 187965, "epoch": 4475} {"train_loss": -7.00275182723999, "global_step": 187966, "epoch": 4475} {"train_loss": -7.087394714355469, "global_step": 187967, "epoch": 4475} {"train_loss": -7.1379475593566895, "global_step": 187968, "epoch": 4475} {"train_loss": -7.070577621459961, "global_step": 187969, "epoch": 4475} {"train_loss": -7.225153923034668, "global_step": 187970, "epoch": 4475} {"train_loss": -7.180510997772217, "global_step": 187971, "epoch": 4475} {"train_loss": -7.225641250610352, "global_step": 187972, "epoch": 4475} {"train_loss": -7.194427013397217, "global_step": 187973, "epoch": 4475} {"train_loss": -7.105744361877441, "global_step": 187974, "epoch": 4475} {"train_loss": -7.133769512176514, "global_step": 187975, "epoch": 4475} {"train_loss": -7.073788642883301, "global_step": 187976, "epoch": 4475} {"train_loss": -7.141584396362305, "global_step": 187977, "epoch": 4475} {"train_loss": -7.044652938842773, "global_step": 187978, "epoch": 4475} {"train_loss": -7.225019454956055, "global_step": 187979, "epoch": 4475} {"train_loss": -7.194008827209473, "global_step": 187980, "epoch": 4475} {"train_loss": -7.181451320648193, "global_step": 187981, "epoch": 4475} {"train_loss": -7.0311279296875, "global_step": 187982, "epoch": 4475} {"train_loss": -7.10564661026001, "global_step": 187983, "epoch": 4475} {"train_loss": -7.044816017150879, "global_step": 187984, "epoch": 4475} {"train_loss": -7.119096755981445, "global_step": 187985, "epoch": 4475} {"train_loss": -7.1003828048706055, "global_step": 187986, "epoch": 4475} {"train_loss": -7.058438777923584, "global_step": 187987, "epoch": 4475} {"train_loss": -7.093742370605469, "global_step": 187988, "epoch": 4475} {"train_loss": -6.98928165435791, "global_step": 187989, "epoch": 4475} {"train_loss": -6.981497287750244, "global_step": 187990, "epoch": 4475} {"train_loss": -7.114399455842518, "global_step": 187991, "epoch": 4475, "val_loss": 68941.2109375} {"train_loss": -7.122073173522949, "global_step": 187992, "epoch": 4476} {"train_loss": -7.136117935180664, "global_step": 187993, "epoch": 4476} {"train_loss": -7.158023834228516, "global_step": 187994, "epoch": 4476} {"train_loss": -7.12575626373291, "global_step": 187995, "epoch": 4476} {"train_loss": -7.186823844909668, "global_step": 187996, "epoch": 4476} {"train_loss": -7.025339126586914, "global_step": 187997, "epoch": 4476} {"train_loss": -7.168752670288086, "global_step": 187998, "epoch": 4476} {"train_loss": -7.13040828704834, "global_step": 187999, "epoch": 4476} {"train_loss": -7.0731401443481445, "global_step": 188000, "epoch": 4476} {"train_loss": -7.071934700012207, "global_step": 188001, "epoch": 4476} {"train_loss": -7.12843656539917, "global_step": 188002, "epoch": 4476} {"train_loss": -7.153234481811523, "global_step": 188003, "epoch": 4476} {"train_loss": -7.095844268798828, "global_step": 188004, "epoch": 4476} {"train_loss": -7.154941558837891, "global_step": 188005, "epoch": 4476} {"train_loss": -6.978968620300293, "global_step": 188006, "epoch": 4476} {"train_loss": -6.995513439178467, "global_step": 188007, "epoch": 4476} {"train_loss": -7.1535844802856445, "global_step": 188008, "epoch": 4476} {"train_loss": -6.869747161865234, "global_step": 188009, "epoch": 4476} {"train_loss": -7.020633220672607, "global_step": 188010, "epoch": 4476} {"train_loss": -7.0884552001953125, "global_step": 188011, "epoch": 4476} {"train_loss": -6.963827133178711, "global_step": 188012, "epoch": 4476} {"train_loss": -7.184442520141602, "global_step": 188013, "epoch": 4476} {"train_loss": -6.9425153732299805, "global_step": 188014, "epoch": 4476} {"train_loss": -7.1942267417907715, "global_step": 188015, "epoch": 4476} {"train_loss": -7.001263618469238, "global_step": 188016, "epoch": 4476} {"train_loss": -7.151266574859619, "global_step": 188017, "epoch": 4476} {"train_loss": -7.156618118286133, "global_step": 188018, "epoch": 4476} {"train_loss": -7.108278751373291, "global_step": 188019, "epoch": 4476} {"train_loss": -7.036437511444092, "global_step": 188020, "epoch": 4476} {"train_loss": -7.140984535217285, "global_step": 188021, "epoch": 4476} {"train_loss": -7.013697624206543, "global_step": 188022, "epoch": 4476} {"train_loss": -7.140626907348633, "global_step": 188023, "epoch": 4476} {"train_loss": -7.134369850158691, "global_step": 188024, "epoch": 4476} {"train_loss": -7.134160995483398, "global_step": 188025, "epoch": 4476} {"train_loss": -7.165617942810059, "global_step": 188026, "epoch": 4476} {"train_loss": -7.111612319946289, "global_step": 188027, "epoch": 4476} {"train_loss": -7.101770401000977, "global_step": 188028, "epoch": 4476} {"train_loss": -7.207657814025879, "global_step": 188029, "epoch": 4476} {"train_loss": -7.115422248840332, "global_step": 188030, "epoch": 4476} {"train_loss": -7.055011749267578, "global_step": 188031, "epoch": 4476} {"train_loss": -7.130615234375, "global_step": 188032, "epoch": 4476} {"train_loss": -7.097797223499843, "global_step": 188033, "epoch": 4476, "val_loss": 68905.0234375} {"train_loss": -7.121853351593018, "global_step": 188034, "epoch": 4477} {"train_loss": -7.175851821899414, "global_step": 188035, "epoch": 4477} {"train_loss": -7.171896457672119, "global_step": 188036, "epoch": 4477} {"train_loss": -7.2125115394592285, "global_step": 188037, "epoch": 4477} {"train_loss": -7.261624336242676, "global_step": 188038, "epoch": 4477} {"train_loss": -7.171735763549805, "global_step": 188039, "epoch": 4477} {"train_loss": -7.109055519104004, "global_step": 188040, "epoch": 4477} {"train_loss": -7.258920669555664, "global_step": 188041, "epoch": 4477} {"train_loss": -7.206836700439453, "global_step": 188042, "epoch": 4477} {"train_loss": -7.146256446838379, "global_step": 188043, "epoch": 4477} {"train_loss": -7.108222484588623, "global_step": 188044, "epoch": 4477} {"train_loss": -7.129498481750488, "global_step": 188045, "epoch": 4477} {"train_loss": -7.2743096351623535, "global_step": 188046, "epoch": 4477} {"train_loss": -7.162093162536621, "global_step": 188047, "epoch": 4477} {"train_loss": -7.163729667663574, "global_step": 188048, "epoch": 4477} {"train_loss": -7.181463718414307, "global_step": 188049, "epoch": 4477} {"train_loss": -7.138155937194824, "global_step": 188050, "epoch": 4477} {"train_loss": -7.154237270355225, "global_step": 188051, "epoch": 4477} {"train_loss": -7.1703338623046875, "global_step": 188052, "epoch": 4477} {"train_loss": -7.211396217346191, "global_step": 188053, "epoch": 4477} {"train_loss": -7.135503768920898, "global_step": 188054, "epoch": 4477} {"train_loss": -7.263063430786133, "global_step": 188055, "epoch": 4477} {"train_loss": -7.123782634735107, "global_step": 188056, "epoch": 4477} {"train_loss": -7.073817253112793, "global_step": 188057, "epoch": 4477} {"train_loss": -7.17240047454834, "global_step": 188058, "epoch": 4477} {"train_loss": -7.155948162078857, "global_step": 188059, "epoch": 4477} {"train_loss": -7.183140277862549, "global_step": 188060, "epoch": 4477} {"train_loss": -6.985335350036621, "global_step": 188061, "epoch": 4477} {"train_loss": -7.215620040893555, "global_step": 188062, "epoch": 4477} {"train_loss": -7.0160369873046875, "global_step": 188063, "epoch": 4477} {"train_loss": -7.002557754516602, "global_step": 188064, "epoch": 4477} {"train_loss": -7.073277473449707, "global_step": 188065, "epoch": 4477} {"train_loss": -6.955984115600586, "global_step": 188066, "epoch": 4477} {"train_loss": -7.105892658233643, "global_step": 188067, "epoch": 4477} {"train_loss": -7.013593673706055, "global_step": 188068, "epoch": 4477} {"train_loss": -7.13629150390625, "global_step": 188069, "epoch": 4477} {"train_loss": -7.116323471069336, "global_step": 188070, "epoch": 4477} {"train_loss": -7.111368179321289, "global_step": 188071, "epoch": 4477} {"train_loss": -7.162304878234863, "global_step": 188072, "epoch": 4477} {"train_loss": -7.075183391571045, "global_step": 188073, "epoch": 4477} {"train_loss": -7.050533294677734, "global_step": 188074, "epoch": 4477} {"train_loss": -7.140000559034801, "global_step": 188075, "epoch": 4477, "val_loss": 69019.5859375} {"train_loss": -7.102050304412842, "global_step": 188076, "epoch": 4478} {"train_loss": -7.153570175170898, "global_step": 188077, "epoch": 4478} {"train_loss": -7.100554466247559, "global_step": 188078, "epoch": 4478} {"train_loss": -7.107385635375977, "global_step": 188079, "epoch": 4478} {"train_loss": -7.08482551574707, "global_step": 188080, "epoch": 4478} {"train_loss": -7.151059627532959, "global_step": 188081, "epoch": 4478} {"train_loss": -7.108006000518799, "global_step": 188082, "epoch": 4478} {"train_loss": -7.154546737670898, "global_step": 188083, "epoch": 4478} {"train_loss": -7.061077117919922, "global_step": 188084, "epoch": 4478} {"train_loss": -7.135761260986328, "global_step": 188085, "epoch": 4478} {"train_loss": -7.049995422363281, "global_step": 188086, "epoch": 4478} {"train_loss": -7.067612171173096, "global_step": 188087, "epoch": 4478} {"train_loss": -7.167447090148926, "global_step": 188088, "epoch": 4478} {"train_loss": -7.1388726234436035, "global_step": 188089, "epoch": 4478} {"train_loss": -7.218605041503906, "global_step": 188090, "epoch": 4478} {"train_loss": -7.148291110992432, "global_step": 188091, "epoch": 4478} {"train_loss": -7.0406084060668945, "global_step": 188092, "epoch": 4478} {"train_loss": -7.156103610992432, "global_step": 188093, "epoch": 4478} {"train_loss": -7.1056623458862305, "global_step": 188094, "epoch": 4478} {"train_loss": -7.073964595794678, "global_step": 188095, "epoch": 4478} {"train_loss": -7.174011707305908, "global_step": 188096, "epoch": 4478} {"train_loss": -7.182753086090088, "global_step": 188097, "epoch": 4478} {"train_loss": -7.098831653594971, "global_step": 188098, "epoch": 4478} {"train_loss": -7.076594352722168, "global_step": 188099, "epoch": 4478} {"train_loss": -7.162664413452148, "global_step": 188100, "epoch": 4478} {"train_loss": -6.969837188720703, "global_step": 188101, "epoch": 4478} {"train_loss": -6.917235374450684, "global_step": 188102, "epoch": 4478} {"train_loss": -7.040560245513916, "global_step": 188103, "epoch": 4478} {"train_loss": -7.1848955154418945, "global_step": 188104, "epoch": 4478} {"train_loss": -7.082239627838135, "global_step": 188105, "epoch": 4478} {"train_loss": -7.206942558288574, "global_step": 188106, "epoch": 4478} {"train_loss": -7.164680480957031, "global_step": 188107, "epoch": 4478} {"train_loss": -7.196632385253906, "global_step": 188108, "epoch": 4478} {"train_loss": -7.02178955078125, "global_step": 188109, "epoch": 4478} {"train_loss": -7.172305107116699, "global_step": 188110, "epoch": 4478} {"train_loss": -7.086267471313477, "global_step": 188111, "epoch": 4478} {"train_loss": -7.11939811706543, "global_step": 188112, "epoch": 4478} {"train_loss": -7.133035182952881, "global_step": 188113, "epoch": 4478} {"train_loss": -7.094813346862793, "global_step": 188114, "epoch": 4478} {"train_loss": -7.08806037902832, "global_step": 188115, "epoch": 4478} {"train_loss": -7.116209030151367, "global_step": 188116, "epoch": 4478} {"train_loss": -7.116622118722825, "global_step": 188117, "epoch": 4478, "val_loss": 68869.5390625} {"train_loss": -7.11740255355835, "global_step": 188118, "epoch": 4479} {"train_loss": -7.220354080200195, "global_step": 188119, "epoch": 4479} {"train_loss": -7.049711227416992, "global_step": 188120, "epoch": 4479} {"train_loss": -7.15423583984375, "global_step": 188121, "epoch": 4479} {"train_loss": -7.21714973449707, "global_step": 188122, "epoch": 4479} {"train_loss": -7.203245162963867, "global_step": 188123, "epoch": 4479} {"train_loss": -7.159655570983887, "global_step": 188124, "epoch": 4479} {"train_loss": -7.181766986846924, "global_step": 188125, "epoch": 4479} {"train_loss": -7.140434265136719, "global_step": 188126, "epoch": 4479} {"train_loss": -7.083613395690918, "global_step": 188127, "epoch": 4479} {"train_loss": -7.065202713012695, "global_step": 188128, "epoch": 4479} {"train_loss": -7.065351963043213, "global_step": 188129, "epoch": 4479} {"train_loss": -7.116390228271484, "global_step": 188130, "epoch": 4479} {"train_loss": -7.074710845947266, "global_step": 188131, "epoch": 4479} {"train_loss": -7.087444305419922, "global_step": 188132, "epoch": 4479} {"train_loss": -7.099396705627441, "global_step": 188133, "epoch": 4479} {"train_loss": -7.005126953125, "global_step": 188134, "epoch": 4479} {"train_loss": -7.096315860748291, "global_step": 188135, "epoch": 4479} {"train_loss": -7.097034454345703, "global_step": 188136, "epoch": 4479} {"train_loss": -7.1296186447143555, "global_step": 188137, "epoch": 4479} {"train_loss": -7.057979583740234, "global_step": 188138, "epoch": 4479} {"train_loss": -7.238229751586914, "global_step": 188139, "epoch": 4479} {"train_loss": -7.176480770111084, "global_step": 188140, "epoch": 4479} {"train_loss": -7.159867286682129, "global_step": 188141, "epoch": 4479} {"train_loss": -7.073647499084473, "global_step": 188142, "epoch": 4479} {"train_loss": -7.009792327880859, "global_step": 188143, "epoch": 4479} {"train_loss": -7.074286460876465, "global_step": 188144, "epoch": 4479} {"train_loss": -7.234446048736572, "global_step": 188145, "epoch": 4479} {"train_loss": -7.143472671508789, "global_step": 188146, "epoch": 4479} {"train_loss": -7.173356056213379, "global_step": 188147, "epoch": 4479} {"train_loss": -7.128511428833008, "global_step": 188148, "epoch": 4479} {"train_loss": -6.983604907989502, "global_step": 188149, "epoch": 4479} {"train_loss": -7.156248569488525, "global_step": 188150, "epoch": 4479} {"train_loss": -7.079514980316162, "global_step": 188151, "epoch": 4479} {"train_loss": -6.870418548583984, "global_step": 188152, "epoch": 4479} {"train_loss": -7.2311811447143555, "global_step": 188153, "epoch": 4479} {"train_loss": -6.973086833953857, "global_step": 188154, "epoch": 4479} {"train_loss": -6.718085289001465, "global_step": 188155, "epoch": 4479} {"train_loss": -7.024085998535156, "global_step": 188156, "epoch": 4479} {"train_loss": -6.801753997802734, "global_step": 188157, "epoch": 4479} {"train_loss": -6.945745468139648, "global_step": 188158, "epoch": 4479} {"train_loss": -7.085584651856196, "global_step": 188159, "epoch": 4479, "val_loss": 68997.4375} {"train_loss": -6.758410930633545, "global_step": 188160, "epoch": 4480} {"train_loss": -7.062939167022705, "global_step": 188161, "epoch": 4480} {"train_loss": -6.783245086669922, "global_step": 188162, "epoch": 4480} {"train_loss": -7.000276565551758, "global_step": 188163, "epoch": 4480} {"train_loss": -6.762222766876221, "global_step": 188164, "epoch": 4480} {"train_loss": -7.076411247253418, "global_step": 188165, "epoch": 4480} {"train_loss": -6.859628677368164, "global_step": 188166, "epoch": 4480} {"train_loss": -6.968118667602539, "global_step": 188167, "epoch": 4480} {"train_loss": -6.9643168449401855, "global_step": 188168, "epoch": 4480} {"train_loss": -6.926182746887207, "global_step": 188169, "epoch": 4480} {"train_loss": -7.079819202423096, "global_step": 188170, "epoch": 4480} {"train_loss": -7.062750339508057, "global_step": 188171, "epoch": 4480} {"train_loss": -7.009929656982422, "global_step": 188172, "epoch": 4480} {"train_loss": -6.91837739944458, "global_step": 188173, "epoch": 4480} {"train_loss": -7.003901481628418, "global_step": 188174, "epoch": 4480} {"train_loss": -7.041018962860107, "global_step": 188175, "epoch": 4480} {"train_loss": -7.016295433044434, "global_step": 188176, "epoch": 4480} {"train_loss": -7.06176233291626, "global_step": 188177, "epoch": 4480} {"train_loss": -7.024755477905273, "global_step": 188178, "epoch": 4480} {"train_loss": -7.118377685546875, "global_step": 188179, "epoch": 4480} {"train_loss": -7.042715072631836, "global_step": 188180, "epoch": 4480} {"train_loss": -7.013078212738037, "global_step": 188181, "epoch": 4480} {"train_loss": -7.122155666351318, "global_step": 188182, "epoch": 4480} {"train_loss": -7.0031890869140625, "global_step": 188183, "epoch": 4480} {"train_loss": -7.103764057159424, "global_step": 188184, "epoch": 4480} {"train_loss": -7.192035675048828, "global_step": 188185, "epoch": 4480} {"train_loss": -7.002601623535156, "global_step": 188186, "epoch": 4480} {"train_loss": -7.135973930358887, "global_step": 188187, "epoch": 4480} {"train_loss": -6.955991268157959, "global_step": 188188, "epoch": 4480} {"train_loss": -7.16251802444458, "global_step": 188189, "epoch": 4480} {"train_loss": -7.0978522300720215, "global_step": 188190, "epoch": 4480} {"train_loss": -7.084221839904785, "global_step": 188191, "epoch": 4480} {"train_loss": -7.12818717956543, "global_step": 188192, "epoch": 4480} {"train_loss": -7.069756507873535, "global_step": 188193, "epoch": 4480} {"train_loss": -7.113488674163818, "global_step": 188194, "epoch": 4480} {"train_loss": -7.111015319824219, "global_step": 188195, "epoch": 4480} {"train_loss": -7.256006240844727, "global_step": 188196, "epoch": 4480} {"train_loss": -7.08094596862793, "global_step": 188197, "epoch": 4480} {"train_loss": -7.169198036193848, "global_step": 188198, "epoch": 4480} {"train_loss": -7.235991477966309, "global_step": 188199, "epoch": 4480} {"train_loss": -7.228470802307129, "global_step": 188200, "epoch": 4480} {"train_loss": -7.045174961998349, "global_step": 188201, "epoch": 4480, "val_loss": 68944.6015625} {"train_loss": -7.144200801849365, "global_step": 188202, "epoch": 4481} {"train_loss": -7.26452112197876, "global_step": 188203, "epoch": 4481} {"train_loss": -7.056519508361816, "global_step": 188204, "epoch": 4481} {"train_loss": -7.143621921539307, "global_step": 188205, "epoch": 4481} {"train_loss": -7.241415023803711, "global_step": 188206, "epoch": 4481} {"train_loss": -7.056158065795898, "global_step": 188207, "epoch": 4481} {"train_loss": -7.092851638793945, "global_step": 188208, "epoch": 4481} {"train_loss": -7.045191764831543, "global_step": 188209, "epoch": 4481} {"train_loss": -7.103858470916748, "global_step": 188210, "epoch": 4481} {"train_loss": -7.233753204345703, "global_step": 188211, "epoch": 4481} {"train_loss": -6.953559875488281, "global_step": 188212, "epoch": 4481} {"train_loss": -7.228487968444824, "global_step": 188213, "epoch": 4481} {"train_loss": -7.0584917068481445, "global_step": 188214, "epoch": 4481} {"train_loss": -7.145649433135986, "global_step": 188215, "epoch": 4481} {"train_loss": -7.107204437255859, "global_step": 188216, "epoch": 4481} {"train_loss": -6.992103576660156, "global_step": 188217, "epoch": 4481} {"train_loss": -7.318164825439453, "global_step": 188218, "epoch": 4481} {"train_loss": -7.148273468017578, "global_step": 188219, "epoch": 4481} {"train_loss": -7.065145492553711, "global_step": 188220, "epoch": 4481} {"train_loss": -7.161499977111816, "global_step": 188221, "epoch": 4481} {"train_loss": -7.164756774902344, "global_step": 188222, "epoch": 4481} {"train_loss": -7.101971626281738, "global_step": 188223, "epoch": 4481} {"train_loss": -7.090426921844482, "global_step": 188224, "epoch": 4481} {"train_loss": -7.28081750869751, "global_step": 188225, "epoch": 4481} {"train_loss": -7.067279815673828, "global_step": 188226, "epoch": 4481} {"train_loss": -7.133878231048584, "global_step": 188227, "epoch": 4481} {"train_loss": -7.221297264099121, "global_step": 188228, "epoch": 4481} {"train_loss": -6.981144905090332, "global_step": 188229, "epoch": 4481} {"train_loss": -7.1396074295043945, "global_step": 188230, "epoch": 4481} {"train_loss": -7.167844772338867, "global_step": 188231, "epoch": 4481} {"train_loss": -7.138124465942383, "global_step": 188232, "epoch": 4481} {"train_loss": -7.143200874328613, "global_step": 188233, "epoch": 4481} {"train_loss": -7.20829963684082, "global_step": 188234, "epoch": 4481} {"train_loss": -7.222307205200195, "global_step": 188235, "epoch": 4481} {"train_loss": -7.176767349243164, "global_step": 188236, "epoch": 4481} {"train_loss": -7.055295944213867, "global_step": 188237, "epoch": 4481} {"train_loss": -7.226404190063477, "global_step": 188238, "epoch": 4481} {"train_loss": -7.17057466506958, "global_step": 188239, "epoch": 4481} {"train_loss": -7.07683801651001, "global_step": 188240, "epoch": 4481} {"train_loss": -7.123871803283691, "global_step": 188241, "epoch": 4481} {"train_loss": -7.087225914001465, "global_step": 188242, "epoch": 4481} {"train_loss": -7.133583261853173, "global_step": 188243, "epoch": 4481, "val_loss": 68962.875} {"train_loss": -7.1588358879089355, "global_step": 188244, "epoch": 4482} {"train_loss": -7.213237285614014, "global_step": 188245, "epoch": 4482} {"train_loss": -7.108068943023682, "global_step": 188246, "epoch": 4482} {"train_loss": -7.1139326095581055, "global_step": 188247, "epoch": 4482} {"train_loss": -7.103069305419922, "global_step": 188248, "epoch": 4482} {"train_loss": -7.182692527770996, "global_step": 188249, "epoch": 4482} {"train_loss": -7.2039289474487305, "global_step": 188250, "epoch": 4482} {"train_loss": -7.099260330200195, "global_step": 188251, "epoch": 4482} {"train_loss": -7.117079734802246, "global_step": 188252, "epoch": 4482} {"train_loss": -7.0406036376953125, "global_step": 188253, "epoch": 4482} {"train_loss": -7.090124130249023, "global_step": 188254, "epoch": 4482} {"train_loss": -7.16796350479126, "global_step": 188255, "epoch": 4482} {"train_loss": -7.171255111694336, "global_step": 188256, "epoch": 4482} {"train_loss": -7.129375457763672, "global_step": 188257, "epoch": 4482} {"train_loss": -7.252462387084961, "global_step": 188258, "epoch": 4482} {"train_loss": -7.138684272766113, "global_step": 188259, "epoch": 4482} {"train_loss": -7.170315265655518, "global_step": 188260, "epoch": 4482} {"train_loss": -7.146636486053467, "global_step": 188261, "epoch": 4482} {"train_loss": -7.1391096115112305, "global_step": 188262, "epoch": 4482} {"train_loss": -7.138673782348633, "global_step": 188263, "epoch": 4482} {"train_loss": -7.105673789978027, "global_step": 188264, "epoch": 4482} {"train_loss": -6.966853141784668, "global_step": 188265, "epoch": 4482} {"train_loss": -6.976977348327637, "global_step": 188266, "epoch": 4482} {"train_loss": -7.058844566345215, "global_step": 188267, "epoch": 4482} {"train_loss": -7.147597312927246, "global_step": 188268, "epoch": 4482} {"train_loss": -6.9566192626953125, "global_step": 188269, "epoch": 4482} {"train_loss": -7.048609256744385, "global_step": 188270, "epoch": 4482} {"train_loss": -7.133692741394043, "global_step": 188271, "epoch": 4482} {"train_loss": -7.075177192687988, "global_step": 188272, "epoch": 4482} {"train_loss": -7.131936073303223, "global_step": 188273, "epoch": 4482} {"train_loss": -7.156734466552734, "global_step": 188274, "epoch": 4482} {"train_loss": -6.9765424728393555, "global_step": 188275, "epoch": 4482} {"train_loss": -7.191498279571533, "global_step": 188276, "epoch": 4482} {"train_loss": -7.198960304260254, "global_step": 188277, "epoch": 4482} {"train_loss": -7.1350250244140625, "global_step": 188278, "epoch": 4482} {"train_loss": -7.162783622741699, "global_step": 188279, "epoch": 4482} {"train_loss": -7.168449401855469, "global_step": 188280, "epoch": 4482} {"train_loss": -6.981441497802734, "global_step": 188281, "epoch": 4482} {"train_loss": -7.156595230102539, "global_step": 188282, "epoch": 4482} {"train_loss": -7.087440490722656, "global_step": 188283, "epoch": 4482} {"train_loss": -7.102488040924072, "global_step": 188284, "epoch": 4482} {"train_loss": -7.116165093013218, "global_step": 188285, "epoch": 4482, "val_loss": 69085.7578125} {"train_loss": -7.191825866699219, "global_step": 188286, "epoch": 4483} {"train_loss": -7.20153284072876, "global_step": 188287, "epoch": 4483} {"train_loss": -7.174853324890137, "global_step": 188288, "epoch": 4483} {"train_loss": -7.046261787414551, "global_step": 188289, "epoch": 4483} {"train_loss": -7.034056663513184, "global_step": 188290, "epoch": 4483} {"train_loss": -7.066528797149658, "global_step": 188291, "epoch": 4483} {"train_loss": -7.074506759643555, "global_step": 188292, "epoch": 4483} {"train_loss": -7.005834579467773, "global_step": 188293, "epoch": 4483} {"train_loss": -7.080677032470703, "global_step": 188294, "epoch": 4483} {"train_loss": -7.215008735656738, "global_step": 188295, "epoch": 4483} {"train_loss": -7.107960224151611, "global_step": 188296, "epoch": 4483} {"train_loss": -7.041316986083984, "global_step": 188297, "epoch": 4483} {"train_loss": -7.2261481285095215, "global_step": 188298, "epoch": 4483} {"train_loss": -7.160338401794434, "global_step": 188299, "epoch": 4483} {"train_loss": -7.09591007232666, "global_step": 188300, "epoch": 4483} {"train_loss": -7.224437236785889, "global_step": 188301, "epoch": 4483} {"train_loss": -7.015872001647949, "global_step": 188302, "epoch": 4483} {"train_loss": -7.223488807678223, "global_step": 188303, "epoch": 4483} {"train_loss": -7.062839031219482, "global_step": 188304, "epoch": 4483} {"train_loss": -7.01884126663208, "global_step": 188305, "epoch": 4483} {"train_loss": -7.124767780303955, "global_step": 188306, "epoch": 4483} {"train_loss": -7.17041015625, "global_step": 188307, "epoch": 4483} {"train_loss": -7.154638290405273, "global_step": 188308, "epoch": 4483} {"train_loss": -7.036670684814453, "global_step": 188309, "epoch": 4483} {"train_loss": -7.124630451202393, "global_step": 188310, "epoch": 4483} {"train_loss": -7.182033061981201, "global_step": 188311, "epoch": 4483} {"train_loss": -7.074584007263184, "global_step": 188312, "epoch": 4483} {"train_loss": -7.1444573402404785, "global_step": 188313, "epoch": 4483} {"train_loss": -7.226320266723633, "global_step": 188314, "epoch": 4483} {"train_loss": -7.107487201690674, "global_step": 188315, "epoch": 4483} {"train_loss": -7.0705885887146, "global_step": 188316, "epoch": 4483} {"train_loss": -7.034063339233398, "global_step": 188317, "epoch": 4483} {"train_loss": -7.173260688781738, "global_step": 188318, "epoch": 4483} {"train_loss": -7.163585662841797, "global_step": 188319, "epoch": 4483} {"train_loss": -7.139838218688965, "global_step": 188320, "epoch": 4483} {"train_loss": -7.190544128417969, "global_step": 188321, "epoch": 4483} {"train_loss": -7.098694801330566, "global_step": 188322, "epoch": 4483} {"train_loss": -7.170716762542725, "global_step": 188323, "epoch": 4483} {"train_loss": -7.231074333190918, "global_step": 188324, "epoch": 4483} {"train_loss": -7.085315227508545, "global_step": 188325, "epoch": 4483} {"train_loss": -7.226761817932129, "global_step": 188326, "epoch": 4483} {"train_loss": -7.1250644865490145, "global_step": 188327, "epoch": 4483, "val_loss": 68969.9921875} {"train_loss": -7.162234306335449, "global_step": 188328, "epoch": 4484} {"train_loss": -7.183507919311523, "global_step": 188329, "epoch": 4484} {"train_loss": -7.104151725769043, "global_step": 188330, "epoch": 4484} {"train_loss": -7.066205978393555, "global_step": 188331, "epoch": 4484} {"train_loss": -7.122498989105225, "global_step": 188332, "epoch": 4484} {"train_loss": -7.105390548706055, "global_step": 188333, "epoch": 4484} {"train_loss": -7.082930088043213, "global_step": 188334, "epoch": 4484} {"train_loss": -7.2117533683776855, "global_step": 188335, "epoch": 4484} {"train_loss": -7.259976863861084, "global_step": 188336, "epoch": 4484} {"train_loss": -7.1399760246276855, "global_step": 188337, "epoch": 4484} {"train_loss": -7.152618408203125, "global_step": 188338, "epoch": 4484} {"train_loss": -7.101513862609863, "global_step": 188339, "epoch": 4484} {"train_loss": -7.134233474731445, "global_step": 188340, "epoch": 4484} {"train_loss": -7.244811534881592, "global_step": 188341, "epoch": 4484} {"train_loss": -7.167113304138184, "global_step": 188342, "epoch": 4484} {"train_loss": -7.237104415893555, "global_step": 188343, "epoch": 4484} {"train_loss": -7.147416114807129, "global_step": 188344, "epoch": 4484} {"train_loss": -7.24872350692749, "global_step": 188345, "epoch": 4484} {"train_loss": -7.334758758544922, "global_step": 188346, "epoch": 4484} {"train_loss": -7.1652069091796875, "global_step": 188347, "epoch": 4484} {"train_loss": -7.184136390686035, "global_step": 188348, "epoch": 4484} {"train_loss": -7.249703407287598, "global_step": 188349, "epoch": 4484} {"train_loss": -7.109637260437012, "global_step": 188350, "epoch": 4484} {"train_loss": -7.131584167480469, "global_step": 188351, "epoch": 4484} {"train_loss": -7.207214832305908, "global_step": 188352, "epoch": 4484} {"train_loss": -7.014803409576416, "global_step": 188353, "epoch": 4484} {"train_loss": -7.116178512573242, "global_step": 188354, "epoch": 4484} {"train_loss": -7.183741569519043, "global_step": 188355, "epoch": 4484} {"train_loss": -7.117191314697266, "global_step": 188356, "epoch": 4484} {"train_loss": -7.1316752433776855, "global_step": 188357, "epoch": 4484} {"train_loss": -7.269293785095215, "global_step": 188358, "epoch": 4484} {"train_loss": -7.106972694396973, "global_step": 188359, "epoch": 4484} {"train_loss": -7.197303771972656, "global_step": 188360, "epoch": 4484} {"train_loss": -7.217232704162598, "global_step": 188361, "epoch": 4484} {"train_loss": -7.129966735839844, "global_step": 188362, "epoch": 4484} {"train_loss": -7.005007743835449, "global_step": 188363, "epoch": 4484} {"train_loss": -7.226988792419434, "global_step": 188364, "epoch": 4484} {"train_loss": -7.166006088256836, "global_step": 188365, "epoch": 4484} {"train_loss": -7.126931667327881, "global_step": 188366, "epoch": 4484} {"train_loss": -7.258171081542969, "global_step": 188367, "epoch": 4484} {"train_loss": -7.15789794921875, "global_step": 188368, "epoch": 4484} {"train_loss": -7.163543076742263, "global_step": 188369, "epoch": 4484, "val_loss": 68912.53125} {"train_loss": -7.15761661529541, "global_step": 188370, "epoch": 4485} {"train_loss": -7.117434024810791, "global_step": 188371, "epoch": 4485} {"train_loss": -7.277840614318848, "global_step": 188372, "epoch": 4485} {"train_loss": -7.15858793258667, "global_step": 188373, "epoch": 4485} {"train_loss": -7.2161865234375, "global_step": 188374, "epoch": 4485} {"train_loss": -7.009460926055908, "global_step": 188375, "epoch": 4485} {"train_loss": -7.033136367797852, "global_step": 188376, "epoch": 4485} {"train_loss": -7.164267539978027, "global_step": 188377, "epoch": 4485} {"train_loss": -7.089803695678711, "global_step": 188378, "epoch": 4485} {"train_loss": -7.098146438598633, "global_step": 188379, "epoch": 4485} {"train_loss": -7.1944804191589355, "global_step": 188380, "epoch": 4485} {"train_loss": -7.1745524406433105, "global_step": 188381, "epoch": 4485} {"train_loss": -7.157986640930176, "global_step": 188382, "epoch": 4485} {"train_loss": -7.082187652587891, "global_step": 188383, "epoch": 4485} {"train_loss": -7.2504072189331055, "global_step": 188384, "epoch": 4485} {"train_loss": -7.118479251861572, "global_step": 188385, "epoch": 4485} {"train_loss": -7.159872055053711, "global_step": 188386, "epoch": 4485} {"train_loss": -7.121255874633789, "global_step": 188387, "epoch": 4485} {"train_loss": -7.201395034790039, "global_step": 188388, "epoch": 4485} {"train_loss": -7.132411956787109, "global_step": 188389, "epoch": 4485} {"train_loss": -7.202338218688965, "global_step": 188390, "epoch": 4485} {"train_loss": -7.178865432739258, "global_step": 188391, "epoch": 4485} {"train_loss": -7.291256904602051, "global_step": 188392, "epoch": 4485} {"train_loss": -7.230955123901367, "global_step": 188393, "epoch": 4485} {"train_loss": -7.162889003753662, "global_step": 188394, "epoch": 4485} {"train_loss": -7.17404317855835, "global_step": 188395, "epoch": 4485} {"train_loss": -7.112088203430176, "global_step": 188396, "epoch": 4485} {"train_loss": -7.143621444702148, "global_step": 188397, "epoch": 4485} {"train_loss": -7.185142517089844, "global_step": 188398, "epoch": 4485} {"train_loss": -7.161344528198242, "global_step": 188399, "epoch": 4485} {"train_loss": -7.073040962219238, "global_step": 188400, "epoch": 4485} {"train_loss": -7.180060386657715, "global_step": 188401, "epoch": 4485} {"train_loss": -7.11572790145874, "global_step": 188402, "epoch": 4485} {"train_loss": -7.132863998413086, "global_step": 188403, "epoch": 4485} {"train_loss": -7.095235347747803, "global_step": 188404, "epoch": 4485} {"train_loss": -7.054304122924805, "global_step": 188405, "epoch": 4485} {"train_loss": -7.171392440795898, "global_step": 188406, "epoch": 4485} {"train_loss": -7.008131504058838, "global_step": 188407, "epoch": 4485} {"train_loss": -7.154968738555908, "global_step": 188408, "epoch": 4485} {"train_loss": -6.989445686340332, "global_step": 188409, "epoch": 4485} {"train_loss": -7.015432357788086, "global_step": 188410, "epoch": 4485} {"train_loss": -7.138787882668631, "global_step": 188411, "epoch": 4485, "val_loss": 69138.6875} {"train_loss": -7.032810211181641, "global_step": 188412, "epoch": 4486} {"train_loss": -7.116748809814453, "global_step": 188413, "epoch": 4486} {"train_loss": -7.126138687133789, "global_step": 188414, "epoch": 4486} {"train_loss": -7.148627281188965, "global_step": 188415, "epoch": 4486} {"train_loss": -7.056622505187988, "global_step": 188416, "epoch": 4486} {"train_loss": -7.1872148513793945, "global_step": 188417, "epoch": 4486} {"train_loss": -7.103610038757324, "global_step": 188418, "epoch": 4486} {"train_loss": -7.07899284362793, "global_step": 188419, "epoch": 4486} {"train_loss": -7.183100700378418, "global_step": 188420, "epoch": 4486} {"train_loss": -7.136343955993652, "global_step": 188421, "epoch": 4486} {"train_loss": -7.140304088592529, "global_step": 188422, "epoch": 4486} {"train_loss": -7.200798988342285, "global_step": 188423, "epoch": 4486} {"train_loss": -7.056193828582764, "global_step": 188424, "epoch": 4486} {"train_loss": -7.315566062927246, "global_step": 188425, "epoch": 4486} {"train_loss": -7.161147117614746, "global_step": 188426, "epoch": 4486} {"train_loss": -7.128779411315918, "global_step": 188427, "epoch": 4486} {"train_loss": -7.213220596313477, "global_step": 188428, "epoch": 4486} {"train_loss": -7.19001579284668, "global_step": 188429, "epoch": 4486} {"train_loss": -7.144107818603516, "global_step": 188430, "epoch": 4486} {"train_loss": -7.029763221740723, "global_step": 188431, "epoch": 4486} {"train_loss": -7.084671974182129, "global_step": 188432, "epoch": 4486} {"train_loss": -7.224087715148926, "global_step": 188433, "epoch": 4486} {"train_loss": -6.978775978088379, "global_step": 188434, "epoch": 4486} {"train_loss": -7.014452934265137, "global_step": 188435, "epoch": 4486} {"train_loss": -7.0894083976745605, "global_step": 188436, "epoch": 4486} {"train_loss": -6.898538589477539, "global_step": 188437, "epoch": 4486} {"train_loss": -7.057981491088867, "global_step": 188438, "epoch": 4486} {"train_loss": -7.220415115356445, "global_step": 188439, "epoch": 4486} {"train_loss": -7.213349342346191, "global_step": 188440, "epoch": 4486} {"train_loss": -7.06629753112793, "global_step": 188441, "epoch": 4486} {"train_loss": -7.100035667419434, "global_step": 188442, "epoch": 4486} {"train_loss": -7.149590969085693, "global_step": 188443, "epoch": 4486} {"train_loss": -7.200530529022217, "global_step": 188444, "epoch": 4486} {"train_loss": -7.166468620300293, "global_step": 188445, "epoch": 4486} {"train_loss": -7.085550308227539, "global_step": 188446, "epoch": 4486} {"train_loss": -7.117505073547363, "global_step": 188447, "epoch": 4486} {"train_loss": -7.137408256530762, "global_step": 188448, "epoch": 4486} {"train_loss": -7.1500396728515625, "global_step": 188449, "epoch": 4486} {"train_loss": -6.8591203689575195, "global_step": 188450, "epoch": 4486} {"train_loss": -7.081391334533691, "global_step": 188451, "epoch": 4486} {"train_loss": -7.095728397369385, "global_step": 188452, "epoch": 4486} {"train_loss": -7.116332599094936, "global_step": 188453, "epoch": 4486, "val_loss": 68896.4375} {"train_loss": -7.227987289428711, "global_step": 188454, "epoch": 4487} {"train_loss": -7.075918197631836, "global_step": 188455, "epoch": 4487} {"train_loss": -7.122632026672363, "global_step": 188456, "epoch": 4487} {"train_loss": -7.1851701736450195, "global_step": 188457, "epoch": 4487} {"train_loss": -7.169549942016602, "global_step": 188458, "epoch": 4487} {"train_loss": -7.000038146972656, "global_step": 188459, "epoch": 4487} {"train_loss": -7.2060041427612305, "global_step": 188460, "epoch": 4487} {"train_loss": -7.105317115783691, "global_step": 188461, "epoch": 4487} {"train_loss": -7.093532085418701, "global_step": 188462, "epoch": 4487} {"train_loss": -7.189148902893066, "global_step": 188463, "epoch": 4487} {"train_loss": -6.977391242980957, "global_step": 188464, "epoch": 4487} {"train_loss": -7.0994720458984375, "global_step": 188465, "epoch": 4487} {"train_loss": -7.1382646560668945, "global_step": 188466, "epoch": 4487} {"train_loss": -7.123333930969238, "global_step": 188467, "epoch": 4487} {"train_loss": -7.18422794342041, "global_step": 188468, "epoch": 4487} {"train_loss": -7.118887901306152, "global_step": 188469, "epoch": 4487} {"train_loss": -7.076605796813965, "global_step": 188470, "epoch": 4487} {"train_loss": -7.097870349884033, "global_step": 188471, "epoch": 4487} {"train_loss": -7.117266654968262, "global_step": 188472, "epoch": 4487} {"train_loss": -7.041176795959473, "global_step": 188473, "epoch": 4487} {"train_loss": -6.964086532592773, "global_step": 188474, "epoch": 4487} {"train_loss": -7.087867259979248, "global_step": 188475, "epoch": 4487} {"train_loss": -6.9947710037231445, "global_step": 188476, "epoch": 4487} {"train_loss": -7.205408096313477, "global_step": 188477, "epoch": 4487} {"train_loss": -6.946127414703369, "global_step": 188478, "epoch": 4487} {"train_loss": -7.114490509033203, "global_step": 188479, "epoch": 4487} {"train_loss": -7.2024946212768555, "global_step": 188480, "epoch": 4487} {"train_loss": -7.15286111831665, "global_step": 188481, "epoch": 4487} {"train_loss": -7.221834182739258, "global_step": 188482, "epoch": 4487} {"train_loss": -7.16856575012207, "global_step": 188483, "epoch": 4487} {"train_loss": -7.092901706695557, "global_step": 188484, "epoch": 4487} {"train_loss": -7.142528057098389, "global_step": 188485, "epoch": 4487} {"train_loss": -7.050702095031738, "global_step": 188486, "epoch": 4487} {"train_loss": -7.047833442687988, "global_step": 188487, "epoch": 4487} {"train_loss": -7.129264831542969, "global_step": 188488, "epoch": 4487} {"train_loss": -7.166617393493652, "global_step": 188489, "epoch": 4487} {"train_loss": -7.137701988220215, "global_step": 188490, "epoch": 4487} {"train_loss": -7.25718879699707, "global_step": 188491, "epoch": 4487} {"train_loss": -7.192688941955566, "global_step": 188492, "epoch": 4487} {"train_loss": -7.110630512237549, "global_step": 188493, "epoch": 4487} {"train_loss": -7.1397809982299805, "global_step": 188494, "epoch": 4487} {"train_loss": -7.122067667189098, "global_step": 188495, "epoch": 4487, "val_loss": 68775.0859375} {"train_loss": -7.047395706176758, "global_step": 188496, "epoch": 4488} {"train_loss": -7.268978118896484, "global_step": 188497, "epoch": 4488} {"train_loss": -7.209434509277344, "global_step": 188498, "epoch": 4488} {"train_loss": -7.238890647888184, "global_step": 188499, "epoch": 4488} {"train_loss": -7.229966163635254, "global_step": 188500, "epoch": 4488} {"train_loss": -7.167036056518555, "global_step": 188501, "epoch": 4488} {"train_loss": -7.175325870513916, "global_step": 188502, "epoch": 4488} {"train_loss": -7.2267746925354, "global_step": 188503, "epoch": 4488} {"train_loss": -7.255570888519287, "global_step": 188504, "epoch": 4488} {"train_loss": -7.138667106628418, "global_step": 188505, "epoch": 4488} {"train_loss": -7.208703994750977, "global_step": 188506, "epoch": 4488} {"train_loss": -7.156441688537598, "global_step": 188507, "epoch": 4488} {"train_loss": -7.290884017944336, "global_step": 188508, "epoch": 4488} {"train_loss": -7.1647725105285645, "global_step": 188509, "epoch": 4488} {"train_loss": -7.162988662719727, "global_step": 188510, "epoch": 4488} {"train_loss": -7.247121810913086, "global_step": 188511, "epoch": 4488} {"train_loss": -7.179870128631592, "global_step": 188512, "epoch": 4488} {"train_loss": -7.13960075378418, "global_step": 188513, "epoch": 4488} {"train_loss": -7.1691741943359375, "global_step": 188514, "epoch": 4488} {"train_loss": -7.073336601257324, "global_step": 188515, "epoch": 4488} {"train_loss": -7.198495864868164, "global_step": 188516, "epoch": 4488} {"train_loss": -6.939406871795654, "global_step": 188517, "epoch": 4488} {"train_loss": -6.991158485412598, "global_step": 188518, "epoch": 4488} {"train_loss": -7.119476795196533, "global_step": 188519, "epoch": 4488} {"train_loss": -7.046213150024414, "global_step": 188520, "epoch": 4488} {"train_loss": -7.052742958068848, "global_step": 188521, "epoch": 4488} {"train_loss": -7.027259826660156, "global_step": 188522, "epoch": 4488} {"train_loss": -7.054557800292969, "global_step": 188523, "epoch": 4488} {"train_loss": -7.073209285736084, "global_step": 188524, "epoch": 4488} {"train_loss": -7.14329719543457, "global_step": 188525, "epoch": 4488} {"train_loss": -7.13181209564209, "global_step": 188526, "epoch": 4488} {"train_loss": -7.1201043128967285, "global_step": 188527, "epoch": 4488} {"train_loss": -7.154853343963623, "global_step": 188528, "epoch": 4488} {"train_loss": -6.983737945556641, "global_step": 188529, "epoch": 4488} {"train_loss": -7.1037445068359375, "global_step": 188530, "epoch": 4488} {"train_loss": -7.014212131500244, "global_step": 188531, "epoch": 4488} {"train_loss": -7.051510810852051, "global_step": 188532, "epoch": 4488} {"train_loss": -7.062246322631836, "global_step": 188533, "epoch": 4488} {"train_loss": -6.931958198547363, "global_step": 188534, "epoch": 4488} {"train_loss": -7.174087047576904, "global_step": 188535, "epoch": 4488} {"train_loss": -6.889494895935059, "global_step": 188536, "epoch": 4488} {"train_loss": -7.121627773557391, "global_step": 188537, "epoch": 4488, "val_loss": 68947.328125} {"train_loss": -7.0779571533203125, "global_step": 188538, "epoch": 4489} {"train_loss": -7.029958724975586, "global_step": 188539, "epoch": 4489} {"train_loss": -7.0616655349731445, "global_step": 188540, "epoch": 4489} {"train_loss": -7.085458278656006, "global_step": 188541, "epoch": 4489} {"train_loss": -7.04666805267334, "global_step": 188542, "epoch": 4489} {"train_loss": -7.046957969665527, "global_step": 188543, "epoch": 4489} {"train_loss": -7.134976863861084, "global_step": 188544, "epoch": 4489} {"train_loss": -7.146413803100586, "global_step": 188545, "epoch": 4489} {"train_loss": -7.076660633087158, "global_step": 188546, "epoch": 4489} {"train_loss": -7.108060836791992, "global_step": 188547, "epoch": 4489} {"train_loss": -7.109338760375977, "global_step": 188548, "epoch": 4489} {"train_loss": -7.0720014572143555, "global_step": 188549, "epoch": 4489} {"train_loss": -7.066669464111328, "global_step": 188550, "epoch": 4489} {"train_loss": -7.125258445739746, "global_step": 188551, "epoch": 4489} {"train_loss": -7.15818977355957, "global_step": 188552, "epoch": 4489} {"train_loss": -7.067711353302002, "global_step": 188553, "epoch": 4489} {"train_loss": -7.128302097320557, "global_step": 188554, "epoch": 4489} {"train_loss": -7.104011535644531, "global_step": 188555, "epoch": 4489} {"train_loss": -7.185548782348633, "global_step": 188556, "epoch": 4489} {"train_loss": -7.1978044509887695, "global_step": 188557, "epoch": 4489} {"train_loss": -7.156526565551758, "global_step": 188558, "epoch": 4489} {"train_loss": -7.268194198608398, "global_step": 188559, "epoch": 4489} {"train_loss": -7.1884870529174805, "global_step": 188560, "epoch": 4489} {"train_loss": -7.113190174102783, "global_step": 188561, "epoch": 4489} {"train_loss": -7.249224662780762, "global_step": 188562, "epoch": 4489} {"train_loss": -7.170341491699219, "global_step": 188563, "epoch": 4489} {"train_loss": -7.207425117492676, "global_step": 188564, "epoch": 4489} {"train_loss": -7.236390113830566, "global_step": 188565, "epoch": 4489} {"train_loss": -7.197376251220703, "global_step": 188566, "epoch": 4489} {"train_loss": -7.220643520355225, "global_step": 188567, "epoch": 4489} {"train_loss": -7.120183944702148, "global_step": 188568, "epoch": 4489} {"train_loss": -7.197230339050293, "global_step": 188569, "epoch": 4489} {"train_loss": -7.311748504638672, "global_step": 188570, "epoch": 4489} {"train_loss": -7.073422908782959, "global_step": 188571, "epoch": 4489} {"train_loss": -7.03764009475708, "global_step": 188572, "epoch": 4489} {"train_loss": -7.274106979370117, "global_step": 188573, "epoch": 4489} {"train_loss": -7.153631687164307, "global_step": 188574, "epoch": 4489} {"train_loss": -7.183020114898682, "global_step": 188575, "epoch": 4489} {"train_loss": -7.248723030090332, "global_step": 188576, "epoch": 4489} {"train_loss": -7.238387584686279, "global_step": 188577, "epoch": 4489} {"train_loss": -7.1412153244018555, "global_step": 188578, "epoch": 4489} {"train_loss": -7.147870710917881, "global_step": 188579, "epoch": 4489, "val_loss": 68981.9453125} {"train_loss": -7.2473225593566895, "global_step": 188580, "epoch": 4490} {"train_loss": -7.1853413581848145, "global_step": 188581, "epoch": 4490} {"train_loss": -7.069765090942383, "global_step": 188582, "epoch": 4490} {"train_loss": -7.086805820465088, "global_step": 188583, "epoch": 4490} {"train_loss": -7.1114397048950195, "global_step": 188584, "epoch": 4490} {"train_loss": -7.195066452026367, "global_step": 188585, "epoch": 4490} {"train_loss": -7.001561164855957, "global_step": 188586, "epoch": 4490} {"train_loss": -7.345777988433838, "global_step": 188587, "epoch": 4490} {"train_loss": -7.0477094650268555, "global_step": 188588, "epoch": 4490} {"train_loss": -7.145600318908691, "global_step": 188589, "epoch": 4490} {"train_loss": -7.21734619140625, "global_step": 188590, "epoch": 4490} {"train_loss": -7.117494583129883, "global_step": 188591, "epoch": 4490} {"train_loss": -7.072027206420898, "global_step": 188592, "epoch": 4490} {"train_loss": -7.176878929138184, "global_step": 188593, "epoch": 4490} {"train_loss": -7.156280040740967, "global_step": 188594, "epoch": 4490} {"train_loss": -7.1744771003723145, "global_step": 188595, "epoch": 4490} {"train_loss": -7.1272172927856445, "global_step": 188596, "epoch": 4490} {"train_loss": -7.2447428703308105, "global_step": 188597, "epoch": 4490} {"train_loss": -7.156269073486328, "global_step": 188598, "epoch": 4490} {"train_loss": -7.09891414642334, "global_step": 188599, "epoch": 4490} {"train_loss": -7.071930885314941, "global_step": 188600, "epoch": 4490} {"train_loss": -7.12502384185791, "global_step": 188601, "epoch": 4490} {"train_loss": -7.178267002105713, "global_step": 188602, "epoch": 4490} {"train_loss": -7.167298793792725, "global_step": 188603, "epoch": 4490} {"train_loss": -7.013571739196777, "global_step": 188604, "epoch": 4490} {"train_loss": -7.112276077270508, "global_step": 188605, "epoch": 4490} {"train_loss": -7.171398639678955, "global_step": 188606, "epoch": 4490} {"train_loss": -7.1392340660095215, "global_step": 188607, "epoch": 4490} {"train_loss": -7.024665355682373, "global_step": 188608, "epoch": 4490} {"train_loss": -7.153358459472656, "global_step": 188609, "epoch": 4490} {"train_loss": -7.120603084564209, "global_step": 188610, "epoch": 4490} {"train_loss": -7.182695388793945, "global_step": 188611, "epoch": 4490} {"train_loss": -7.120667457580566, "global_step": 188612, "epoch": 4490} {"train_loss": -7.134354591369629, "global_step": 188613, "epoch": 4490} {"train_loss": -7.058149337768555, "global_step": 188614, "epoch": 4490} {"train_loss": -7.042031288146973, "global_step": 188615, "epoch": 4490} {"train_loss": -7.113847255706787, "global_step": 188616, "epoch": 4490} {"train_loss": -7.201938629150391, "global_step": 188617, "epoch": 4490} {"train_loss": -7.151760578155518, "global_step": 188618, "epoch": 4490} {"train_loss": -7.10209846496582, "global_step": 188619, "epoch": 4490} {"train_loss": -7.0468854904174805, "global_step": 188620, "epoch": 4490} {"train_loss": -7.130739280155727, "global_step": 188621, "epoch": 4490, "val_loss": 69067.515625} {"train_loss": -7.145462989807129, "global_step": 188622, "epoch": 4491} {"train_loss": -7.007467269897461, "global_step": 188623, "epoch": 4491} {"train_loss": -7.09645938873291, "global_step": 188624, "epoch": 4491} {"train_loss": -7.052895545959473, "global_step": 188625, "epoch": 4491} {"train_loss": -7.200326919555664, "global_step": 188626, "epoch": 4491} {"train_loss": -7.082282543182373, "global_step": 188627, "epoch": 4491} {"train_loss": -7.136966228485107, "global_step": 188628, "epoch": 4491} {"train_loss": -6.963984489440918, "global_step": 188629, "epoch": 4491} {"train_loss": -7.143527507781982, "global_step": 188630, "epoch": 4491} {"train_loss": -6.99216365814209, "global_step": 188631, "epoch": 4491} {"train_loss": -7.00825309753418, "global_step": 188632, "epoch": 4491} {"train_loss": -7.11393404006958, "global_step": 188633, "epoch": 4491} {"train_loss": -7.143536567687988, "global_step": 188634, "epoch": 4491} {"train_loss": -7.11371374130249, "global_step": 188635, "epoch": 4491} {"train_loss": -7.160184860229492, "global_step": 188636, "epoch": 4491} {"train_loss": -7.2265167236328125, "global_step": 188637, "epoch": 4491} {"train_loss": -7.15231466293335, "global_step": 188638, "epoch": 4491} {"train_loss": -7.184619903564453, "global_step": 188639, "epoch": 4491} {"train_loss": -7.205330848693848, "global_step": 188640, "epoch": 4491} {"train_loss": -7.205768585205078, "global_step": 188641, "epoch": 4491} {"train_loss": -7.1863627433776855, "global_step": 188642, "epoch": 4491} {"train_loss": -7.118053436279297, "global_step": 188643, "epoch": 4491} {"train_loss": -7.172297477722168, "global_step": 188644, "epoch": 4491} {"train_loss": -7.213621139526367, "global_step": 188645, "epoch": 4491} {"train_loss": -7.233327388763428, "global_step": 188646, "epoch": 4491} {"train_loss": -7.0673041343688965, "global_step": 188647, "epoch": 4491} {"train_loss": -7.19359016418457, "global_step": 188648, "epoch": 4491} {"train_loss": -7.1751556396484375, "global_step": 188649, "epoch": 4491} {"train_loss": -7.135279655456543, "global_step": 188650, "epoch": 4491} {"train_loss": -7.190742492675781, "global_step": 188651, "epoch": 4491} {"train_loss": -7.208078384399414, "global_step": 188652, "epoch": 4491} {"train_loss": -7.151403427124023, "global_step": 188653, "epoch": 4491} {"train_loss": -7.131923675537109, "global_step": 188654, "epoch": 4491} {"train_loss": -7.138818740844727, "global_step": 188655, "epoch": 4491} {"train_loss": -7.200977802276611, "global_step": 188656, "epoch": 4491} {"train_loss": -7.2138447761535645, "global_step": 188657, "epoch": 4491} {"train_loss": -7.008414268493652, "global_step": 188658, "epoch": 4491} {"train_loss": -7.150266647338867, "global_step": 188659, "epoch": 4491} {"train_loss": -7.10162353515625, "global_step": 188660, "epoch": 4491} {"train_loss": -7.12445068359375, "global_step": 188661, "epoch": 4491} {"train_loss": -7.025689601898193, "global_step": 188662, "epoch": 4491} {"train_loss": -7.132381155377343, "global_step": 188663, "epoch": 4491, "val_loss": 68947.453125} {"train_loss": -7.277653217315674, "global_step": 188664, "epoch": 4492} {"train_loss": -7.2200775146484375, "global_step": 188665, "epoch": 4492} {"train_loss": -7.133464813232422, "global_step": 188666, "epoch": 4492} {"train_loss": -7.100049018859863, "global_step": 188667, "epoch": 4492} {"train_loss": -7.157777786254883, "global_step": 188668, "epoch": 4492} {"train_loss": -7.0944976806640625, "global_step": 188669, "epoch": 4492} {"train_loss": -7.1020355224609375, "global_step": 188670, "epoch": 4492} {"train_loss": -7.244927406311035, "global_step": 188671, "epoch": 4492} {"train_loss": -7.136350154876709, "global_step": 188672, "epoch": 4492} {"train_loss": -7.167956829071045, "global_step": 188673, "epoch": 4492} {"train_loss": -7.125507354736328, "global_step": 188674, "epoch": 4492} {"train_loss": -7.10176944732666, "global_step": 188675, "epoch": 4492} {"train_loss": -7.096673965454102, "global_step": 188676, "epoch": 4492} {"train_loss": -7.200456619262695, "global_step": 188677, "epoch": 4492} {"train_loss": -7.075629711151123, "global_step": 188678, "epoch": 4492} {"train_loss": -7.0175981521606445, "global_step": 188679, "epoch": 4492} {"train_loss": -7.171991348266602, "global_step": 188680, "epoch": 4492} {"train_loss": -7.1875224113464355, "global_step": 188681, "epoch": 4492} {"train_loss": -7.1728925704956055, "global_step": 188682, "epoch": 4492} {"train_loss": -7.131344318389893, "global_step": 188683, "epoch": 4492} {"train_loss": -7.200685501098633, "global_step": 188684, "epoch": 4492} {"train_loss": -7.000140190124512, "global_step": 188685, "epoch": 4492} {"train_loss": -7.038158416748047, "global_step": 188686, "epoch": 4492} {"train_loss": -7.1713409423828125, "global_step": 188687, "epoch": 4492} {"train_loss": -7.053776741027832, "global_step": 188688, "epoch": 4492} {"train_loss": -7.052081108093262, "global_step": 188689, "epoch": 4492} {"train_loss": -7.092825412750244, "global_step": 188690, "epoch": 4492} {"train_loss": -7.10115909576416, "global_step": 188691, "epoch": 4492} {"train_loss": -7.068541526794434, "global_step": 188692, "epoch": 4492} {"train_loss": -7.116610527038574, "global_step": 188693, "epoch": 4492} {"train_loss": -7.171363353729248, "global_step": 188694, "epoch": 4492} {"train_loss": -7.079385757446289, "global_step": 188695, "epoch": 4492} {"train_loss": -7.116395950317383, "global_step": 188696, "epoch": 4492} {"train_loss": -7.11290168762207, "global_step": 188697, "epoch": 4492} {"train_loss": -7.114696979522705, "global_step": 188698, "epoch": 4492} {"train_loss": -7.214746475219727, "global_step": 188699, "epoch": 4492} {"train_loss": -7.147062301635742, "global_step": 188700, "epoch": 4492} {"train_loss": -7.141554832458496, "global_step": 188701, "epoch": 4492} {"train_loss": -7.220376968383789, "global_step": 188702, "epoch": 4492} {"train_loss": -7.17330265045166, "global_step": 188703, "epoch": 4492} {"train_loss": -7.193045139312744, "global_step": 188704, "epoch": 4492} {"train_loss": -7.135116815567017, "global_step": 188705, "epoch": 4492, "val_loss": 68913.265625} {"train_loss": -7.179603099822998, "global_step": 188706, "epoch": 4493} {"train_loss": -7.222811698913574, "global_step": 188707, "epoch": 4493} {"train_loss": -7.279563903808594, "global_step": 188708, "epoch": 4493} {"train_loss": -7.224185466766357, "global_step": 188709, "epoch": 4493} {"train_loss": -7.220320224761963, "global_step": 188710, "epoch": 4493} {"train_loss": -7.2285356521606445, "global_step": 188711, "epoch": 4493} {"train_loss": -7.265988826751709, "global_step": 188712, "epoch": 4493} {"train_loss": -7.109921455383301, "global_step": 188713, "epoch": 4493} {"train_loss": -7.089972972869873, "global_step": 188714, "epoch": 4493} {"train_loss": -7.151005268096924, "global_step": 188715, "epoch": 4493} {"train_loss": -7.126694679260254, "global_step": 188716, "epoch": 4493} {"train_loss": -7.104722499847412, "global_step": 188717, "epoch": 4493} {"train_loss": -7.1527934074401855, "global_step": 188718, "epoch": 4493} {"train_loss": -7.193852424621582, "global_step": 188719, "epoch": 4493} {"train_loss": -7.234668731689453, "global_step": 188720, "epoch": 4493} {"train_loss": -7.109739303588867, "global_step": 188721, "epoch": 4493} {"train_loss": -7.006791591644287, "global_step": 188722, "epoch": 4493} {"train_loss": -7.150050163269043, "global_step": 188723, "epoch": 4493} {"train_loss": -7.019547462463379, "global_step": 188724, "epoch": 4493} {"train_loss": -7.077263832092285, "global_step": 188725, "epoch": 4493} {"train_loss": -7.017787456512451, "global_step": 188726, "epoch": 4493} {"train_loss": -7.158387184143066, "global_step": 188727, "epoch": 4493} {"train_loss": -7.148123741149902, "global_step": 188728, "epoch": 4493} {"train_loss": -7.109681129455566, "global_step": 188729, "epoch": 4493} {"train_loss": -7.239346504211426, "global_step": 188730, "epoch": 4493} {"train_loss": -7.116006851196289, "global_step": 188731, "epoch": 4493} {"train_loss": -7.050604343414307, "global_step": 188732, "epoch": 4493} {"train_loss": -7.215570449829102, "global_step": 188733, "epoch": 4493} {"train_loss": -7.188225269317627, "global_step": 188734, "epoch": 4493} {"train_loss": -7.18918514251709, "global_step": 188735, "epoch": 4493} {"train_loss": -7.093234062194824, "global_step": 188736, "epoch": 4493} {"train_loss": -7.167842864990234, "global_step": 188737, "epoch": 4493} {"train_loss": -7.131224632263184, "global_step": 188738, "epoch": 4493} {"train_loss": -7.139282703399658, "global_step": 188739, "epoch": 4493} {"train_loss": -7.09500789642334, "global_step": 188740, "epoch": 4493} {"train_loss": -7.234701633453369, "global_step": 188741, "epoch": 4493} {"train_loss": -7.061156272888184, "global_step": 188742, "epoch": 4493} {"train_loss": -7.14249324798584, "global_step": 188743, "epoch": 4493} {"train_loss": -7.280433177947998, "global_step": 188744, "epoch": 4493} {"train_loss": -7.180446624755859, "global_step": 188745, "epoch": 4493} {"train_loss": -7.228610992431641, "global_step": 188746, "epoch": 4493} {"train_loss": -7.153348593484788, "global_step": 188747, "epoch": 4493, "val_loss": 68976.0625} {"train_loss": -7.022763252258301, "global_step": 188748, "epoch": 4494} {"train_loss": -7.201778888702393, "global_step": 188749, "epoch": 4494} {"train_loss": -7.230252265930176, "global_step": 188750, "epoch": 4494} {"train_loss": -7.258329391479492, "global_step": 188751, "epoch": 4494} {"train_loss": -7.2235426902771, "global_step": 188752, "epoch": 4494} {"train_loss": -7.166481971740723, "global_step": 188753, "epoch": 4494} {"train_loss": -7.078986167907715, "global_step": 188754, "epoch": 4494} {"train_loss": -7.201225280761719, "global_step": 188755, "epoch": 4494} {"train_loss": -7.156444072723389, "global_step": 188756, "epoch": 4494} {"train_loss": -7.084146022796631, "global_step": 188757, "epoch": 4494} {"train_loss": -7.178976535797119, "global_step": 188758, "epoch": 4494} {"train_loss": -7.265795707702637, "global_step": 188759, "epoch": 4494} {"train_loss": -7.146883964538574, "global_step": 188760, "epoch": 4494} {"train_loss": -7.194974422454834, "global_step": 188761, "epoch": 4494} {"train_loss": -7.158466815948486, "global_step": 188762, "epoch": 4494} {"train_loss": -7.081840515136719, "global_step": 188763, "epoch": 4494} {"train_loss": -7.059658050537109, "global_step": 188764, "epoch": 4494} {"train_loss": -7.085622787475586, "global_step": 188765, "epoch": 4494} {"train_loss": -7.158221244812012, "global_step": 188766, "epoch": 4494} {"train_loss": -7.094970226287842, "global_step": 188767, "epoch": 4494} {"train_loss": -7.166487693786621, "global_step": 188768, "epoch": 4494} {"train_loss": -7.052365303039551, "global_step": 188769, "epoch": 4494} {"train_loss": -7.109370231628418, "global_step": 188770, "epoch": 4494} {"train_loss": -7.141908645629883, "global_step": 188771, "epoch": 4494} {"train_loss": -7.055434226989746, "global_step": 188772, "epoch": 4494} {"train_loss": -7.106265068054199, "global_step": 188773, "epoch": 4494} {"train_loss": -7.016456127166748, "global_step": 188774, "epoch": 4494} {"train_loss": -7.039255142211914, "global_step": 188775, "epoch": 4494} {"train_loss": -7.200985908508301, "global_step": 188776, "epoch": 4494} {"train_loss": -6.9720258712768555, "global_step": 188777, "epoch": 4494} {"train_loss": -7.049732685089111, "global_step": 188778, "epoch": 4494} {"train_loss": -6.861408710479736, "global_step": 188779, "epoch": 4494} {"train_loss": -6.971153259277344, "global_step": 188780, "epoch": 4494} {"train_loss": -7.025949954986572, "global_step": 188781, "epoch": 4494} {"train_loss": -6.8917388916015625, "global_step": 188782, "epoch": 4494} {"train_loss": -7.083160877227783, "global_step": 188783, "epoch": 4494} {"train_loss": -6.941399097442627, "global_step": 188784, "epoch": 4494} {"train_loss": -7.06380033493042, "global_step": 188785, "epoch": 4494} {"train_loss": -6.976611614227295, "global_step": 188786, "epoch": 4494} {"train_loss": -6.959917068481445, "global_step": 188787, "epoch": 4494} {"train_loss": -7.041109085083008, "global_step": 188788, "epoch": 4494} {"train_loss": -7.087282748449416, "global_step": 188789, "epoch": 4494, "val_loss": 68955.5234375} {"train_loss": -6.946264266967773, "global_step": 188790, "epoch": 4495} {"train_loss": -7.048640251159668, "global_step": 188791, "epoch": 4495} {"train_loss": -6.9567036628723145, "global_step": 188792, "epoch": 4495} {"train_loss": -6.992964744567871, "global_step": 188793, "epoch": 4495} {"train_loss": -7.0132670402526855, "global_step": 188794, "epoch": 4495} {"train_loss": -6.989780902862549, "global_step": 188795, "epoch": 4495} {"train_loss": -7.130951881408691, "global_step": 188796, "epoch": 4495} {"train_loss": -6.998148441314697, "global_step": 188797, "epoch": 4495} {"train_loss": -7.059361934661865, "global_step": 188798, "epoch": 4495} {"train_loss": -7.070761203765869, "global_step": 188799, "epoch": 4495} {"train_loss": -7.1276702880859375, "global_step": 188800, "epoch": 4495} {"train_loss": -6.895261764526367, "global_step": 188801, "epoch": 4495} {"train_loss": -7.122304916381836, "global_step": 188802, "epoch": 4495} {"train_loss": -7.128355979919434, "global_step": 188803, "epoch": 4495} {"train_loss": -7.079885959625244, "global_step": 188804, "epoch": 4495} {"train_loss": -7.113500595092773, "global_step": 188805, "epoch": 4495} {"train_loss": -6.970011234283447, "global_step": 188806, "epoch": 4495} {"train_loss": -7.109535217285156, "global_step": 188807, "epoch": 4495} {"train_loss": -7.084679126739502, "global_step": 188808, "epoch": 4495} {"train_loss": -7.15573263168335, "global_step": 188809, "epoch": 4495} {"train_loss": -7.099748134613037, "global_step": 188810, "epoch": 4495} {"train_loss": -7.218400478363037, "global_step": 188811, "epoch": 4495} {"train_loss": -7.089174270629883, "global_step": 188812, "epoch": 4495} {"train_loss": -7.154048442840576, "global_step": 188813, "epoch": 4495} {"train_loss": -7.117847919464111, "global_step": 188814, "epoch": 4495} {"train_loss": -7.122475624084473, "global_step": 188815, "epoch": 4495} {"train_loss": -7.163949489593506, "global_step": 188816, "epoch": 4495} {"train_loss": -7.200729846954346, "global_step": 188817, "epoch": 4495} {"train_loss": -7.148487091064453, "global_step": 188818, "epoch": 4495} {"train_loss": -7.200564384460449, "global_step": 188819, "epoch": 4495} {"train_loss": -7.157410621643066, "global_step": 188820, "epoch": 4495} {"train_loss": -7.009425163269043, "global_step": 188821, "epoch": 4495} {"train_loss": -7.150665283203125, "global_step": 188822, "epoch": 4495} {"train_loss": -7.098001956939697, "global_step": 188823, "epoch": 4495} {"train_loss": -7.18973445892334, "global_step": 188824, "epoch": 4495} {"train_loss": -7.112098217010498, "global_step": 188825, "epoch": 4495} {"train_loss": -7.14164400100708, "global_step": 188826, "epoch": 4495} {"train_loss": -7.085691928863525, "global_step": 188827, "epoch": 4495} {"train_loss": -7.199676513671875, "global_step": 188828, "epoch": 4495} {"train_loss": -7.101557731628418, "global_step": 188829, "epoch": 4495} {"train_loss": -7.181585311889648, "global_step": 188830, "epoch": 4495} {"train_loss": -7.096185082481021, "global_step": 188831, "epoch": 4495, "val_loss": 68922.671875} {"train_loss": -7.026680946350098, "global_step": 188832, "epoch": 4496} {"train_loss": -7.038054466247559, "global_step": 188833, "epoch": 4496} {"train_loss": -6.978147506713867, "global_step": 188834, "epoch": 4496} {"train_loss": -7.133486747741699, "global_step": 188835, "epoch": 4496} {"train_loss": -7.1117262840271, "global_step": 188836, "epoch": 4496} {"train_loss": -7.2184929847717285, "global_step": 188837, "epoch": 4496} {"train_loss": -7.084687232971191, "global_step": 188838, "epoch": 4496} {"train_loss": -7.150339603424072, "global_step": 188839, "epoch": 4496} {"train_loss": -6.93604040145874, "global_step": 188840, "epoch": 4496} {"train_loss": -7.1953630447387695, "global_step": 188841, "epoch": 4496} {"train_loss": -7.355982780456543, "global_step": 188842, "epoch": 4496} {"train_loss": -7.187455177307129, "global_step": 188843, "epoch": 4496} {"train_loss": -6.987890243530273, "global_step": 188844, "epoch": 4496} {"train_loss": -7.296868324279785, "global_step": 188845, "epoch": 4496} {"train_loss": -7.213770866394043, "global_step": 188846, "epoch": 4496} {"train_loss": -7.118924140930176, "global_step": 188847, "epoch": 4496} {"train_loss": -7.1897101402282715, "global_step": 188848, "epoch": 4496} {"train_loss": -7.199729919433594, "global_step": 188849, "epoch": 4496} {"train_loss": -7.2060112953186035, "global_step": 188850, "epoch": 4496} {"train_loss": -7.1869354248046875, "global_step": 188851, "epoch": 4496} {"train_loss": -7.165898323059082, "global_step": 188852, "epoch": 4496} {"train_loss": -7.102733135223389, "global_step": 188853, "epoch": 4496} {"train_loss": -7.143195152282715, "global_step": 188854, "epoch": 4496} {"train_loss": -7.22391414642334, "global_step": 188855, "epoch": 4496} {"train_loss": -7.295262336730957, "global_step": 188856, "epoch": 4496} {"train_loss": -7.203368186950684, "global_step": 188857, "epoch": 4496} {"train_loss": -7.150857925415039, "global_step": 188858, "epoch": 4496} {"train_loss": -7.2284626960754395, "global_step": 188859, "epoch": 4496} {"train_loss": -7.130490779876709, "global_step": 188860, "epoch": 4496} {"train_loss": -7.160500526428223, "global_step": 188861, "epoch": 4496} {"train_loss": -7.146222114562988, "global_step": 188862, "epoch": 4496} {"train_loss": -7.233782768249512, "global_step": 188863, "epoch": 4496} {"train_loss": -7.21099853515625, "global_step": 188864, "epoch": 4496} {"train_loss": -7.145369529724121, "global_step": 188865, "epoch": 4496} {"train_loss": -7.209425449371338, "global_step": 188866, "epoch": 4496} {"train_loss": -7.2524590492248535, "global_step": 188867, "epoch": 4496} {"train_loss": -7.151691913604736, "global_step": 188868, "epoch": 4496} {"train_loss": -7.306299686431885, "global_step": 188869, "epoch": 4496} {"train_loss": -7.010078430175781, "global_step": 188870, "epoch": 4496} {"train_loss": -7.075037002563477, "global_step": 188871, "epoch": 4496} {"train_loss": -7.078067779541016, "global_step": 188872, "epoch": 4496} {"train_loss": -7.151455754325504, "global_step": 188873, "epoch": 4496, "val_loss": 69042.7578125} {"train_loss": -7.078484535217285, "global_step": 188874, "epoch": 4497} {"train_loss": -7.3048505783081055, "global_step": 188875, "epoch": 4497} {"train_loss": -7.142176151275635, "global_step": 188876, "epoch": 4497} {"train_loss": -6.95997953414917, "global_step": 188877, "epoch": 4497} {"train_loss": -7.257701873779297, "global_step": 188878, "epoch": 4497} {"train_loss": -7.186006546020508, "global_step": 188879, "epoch": 4497} {"train_loss": -7.066747665405273, "global_step": 188880, "epoch": 4497} {"train_loss": -7.252807140350342, "global_step": 188881, "epoch": 4497} {"train_loss": -7.190549850463867, "global_step": 188882, "epoch": 4497} {"train_loss": -7.134612083435059, "global_step": 188883, "epoch": 4497} {"train_loss": -7.124459743499756, "global_step": 188884, "epoch": 4497} {"train_loss": -7.066466331481934, "global_step": 188885, "epoch": 4497} {"train_loss": -7.109780788421631, "global_step": 188886, "epoch": 4497} {"train_loss": -7.072640895843506, "global_step": 188887, "epoch": 4497} {"train_loss": -7.0922932624816895, "global_step": 188888, "epoch": 4497} {"train_loss": -7.089377403259277, "global_step": 188889, "epoch": 4497} {"train_loss": -7.144378662109375, "global_step": 188890, "epoch": 4497} {"train_loss": -7.1547627449035645, "global_step": 188891, "epoch": 4497} {"train_loss": -7.137538909912109, "global_step": 188892, "epoch": 4497} {"train_loss": -7.146868705749512, "global_step": 188893, "epoch": 4497} {"train_loss": -7.1656036376953125, "global_step": 188894, "epoch": 4497} {"train_loss": -7.152383804321289, "global_step": 188895, "epoch": 4497} {"train_loss": -7.234241485595703, "global_step": 188896, "epoch": 4497} {"train_loss": -7.099273204803467, "global_step": 188897, "epoch": 4497} {"train_loss": -7.233274459838867, "global_step": 188898, "epoch": 4497} {"train_loss": -7.253349304199219, "global_step": 188899, "epoch": 4497} {"train_loss": -7.155831336975098, "global_step": 188900, "epoch": 4497} {"train_loss": -7.127197742462158, "global_step": 188901, "epoch": 4497} {"train_loss": -7.158815383911133, "global_step": 188902, "epoch": 4497} {"train_loss": -7.333195686340332, "global_step": 188903, "epoch": 4497} {"train_loss": -7.0962114334106445, "global_step": 188904, "epoch": 4497} {"train_loss": -7.1457672119140625, "global_step": 188905, "epoch": 4497} {"train_loss": -7.241964340209961, "global_step": 188906, "epoch": 4497} {"train_loss": -7.129003524780273, "global_step": 188907, "epoch": 4497} {"train_loss": -7.203955173492432, "global_step": 188908, "epoch": 4497} {"train_loss": -7.127089500427246, "global_step": 188909, "epoch": 4497} {"train_loss": -7.077521324157715, "global_step": 188910, "epoch": 4497} {"train_loss": -7.199406623840332, "global_step": 188911, "epoch": 4497} {"train_loss": -7.15069580078125, "global_step": 188912, "epoch": 4497} {"train_loss": -7.1745076179504395, "global_step": 188913, "epoch": 4497} {"train_loss": -7.143871307373047, "global_step": 188914, "epoch": 4497} {"train_loss": -7.1549302736918134, "global_step": 188915, "epoch": 4497, "val_loss": 68892.2109375} {"train_loss": -7.238668441772461, "global_step": 188916, "epoch": 4498} {"train_loss": -7.134490489959717, "global_step": 188917, "epoch": 4498} {"train_loss": -7.089638710021973, "global_step": 188918, "epoch": 4498} {"train_loss": -7.157341957092285, "global_step": 188919, "epoch": 4498} {"train_loss": -7.109987258911133, "global_step": 188920, "epoch": 4498} {"train_loss": -7.143043518066406, "global_step": 188921, "epoch": 4498} {"train_loss": -7.123832702636719, "global_step": 188922, "epoch": 4498} {"train_loss": -7.135199546813965, "global_step": 188923, "epoch": 4498} {"train_loss": -7.079005241394043, "global_step": 188924, "epoch": 4498} {"train_loss": -7.240422248840332, "global_step": 188925, "epoch": 4498} {"train_loss": -7.073084354400635, "global_step": 188926, "epoch": 4498} {"train_loss": -7.116708278656006, "global_step": 188927, "epoch": 4498} {"train_loss": -7.169297218322754, "global_step": 188928, "epoch": 4498} {"train_loss": -7.0025529861450195, "global_step": 188929, "epoch": 4498} {"train_loss": -7.0902204513549805, "global_step": 188930, "epoch": 4498} {"train_loss": -7.0531463623046875, "global_step": 188931, "epoch": 4498} {"train_loss": -7.048590660095215, "global_step": 188932, "epoch": 4498} {"train_loss": -7.17618465423584, "global_step": 188933, "epoch": 4498} {"train_loss": -6.94010066986084, "global_step": 188934, "epoch": 4498} {"train_loss": -7.056591510772705, "global_step": 188935, "epoch": 4498} {"train_loss": -7.105400085449219, "global_step": 188936, "epoch": 4498} {"train_loss": -7.048830986022949, "global_step": 188937, "epoch": 4498} {"train_loss": -7.033313751220703, "global_step": 188938, "epoch": 4498} {"train_loss": -6.990109443664551, "global_step": 188939, "epoch": 4498} {"train_loss": -7.0910162925720215, "global_step": 188940, "epoch": 4498} {"train_loss": -6.938816070556641, "global_step": 188941, "epoch": 4498} {"train_loss": -7.075406551361084, "global_step": 188942, "epoch": 4498} {"train_loss": -6.819609642028809, "global_step": 188943, "epoch": 4498} {"train_loss": -7.15889310836792, "global_step": 188944, "epoch": 4498} {"train_loss": -6.941744327545166, "global_step": 188945, "epoch": 4498} {"train_loss": -7.052993297576904, "global_step": 188946, "epoch": 4498} {"train_loss": -7.144895553588867, "global_step": 188947, "epoch": 4498} {"train_loss": -7.168234348297119, "global_step": 188948, "epoch": 4498} {"train_loss": -7.077147006988525, "global_step": 188949, "epoch": 4498} {"train_loss": -7.222959518432617, "global_step": 188950, "epoch": 4498} {"train_loss": -6.996057510375977, "global_step": 188951, "epoch": 4498} {"train_loss": -7.097650527954102, "global_step": 188952, "epoch": 4498} {"train_loss": -7.073650360107422, "global_step": 188953, "epoch": 4498} {"train_loss": -7.016782760620117, "global_step": 188954, "epoch": 4498} {"train_loss": -7.058410167694092, "global_step": 188955, "epoch": 4498} {"train_loss": -7.158696174621582, "global_step": 188956, "epoch": 4498} {"train_loss": -7.080616303852627, "global_step": 188957, "epoch": 4498, "val_loss": 68757.0078125} {"train_loss": -7.081263065338135, "global_step": 188958, "epoch": 4499} {"train_loss": -7.085766315460205, "global_step": 188959, "epoch": 4499} {"train_loss": -6.975367546081543, "global_step": 188960, "epoch": 4499} {"train_loss": -7.0809783935546875, "global_step": 188961, "epoch": 4499} {"train_loss": -7.018945693969727, "global_step": 188962, "epoch": 4499} {"train_loss": -7.0758585929870605, "global_step": 188963, "epoch": 4499} {"train_loss": -7.066045761108398, "global_step": 188964, "epoch": 4499} {"train_loss": -7.008636474609375, "global_step": 188965, "epoch": 4499} {"train_loss": -7.023532867431641, "global_step": 188966, "epoch": 4499} {"train_loss": -7.036224365234375, "global_step": 188967, "epoch": 4499} {"train_loss": -7.198257923126221, "global_step": 188968, "epoch": 4499} {"train_loss": -6.9630584716796875, "global_step": 188969, "epoch": 4499} {"train_loss": -7.055383682250977, "global_step": 188970, "epoch": 4499} {"train_loss": -7.0335588455200195, "global_step": 188971, "epoch": 4499} {"train_loss": -7.072542190551758, "global_step": 188972, "epoch": 4499} {"train_loss": -7.1006059646606445, "global_step": 188973, "epoch": 4499} {"train_loss": -7.027700424194336, "global_step": 188974, "epoch": 4499} {"train_loss": -7.089596271514893, "global_step": 188975, "epoch": 4499} {"train_loss": -7.008464813232422, "global_step": 188976, "epoch": 4499} {"train_loss": -7.0256123542785645, "global_step": 188977, "epoch": 4499} {"train_loss": -7.062580108642578, "global_step": 188978, "epoch": 4499} {"train_loss": -7.136753082275391, "global_step": 188979, "epoch": 4499} {"train_loss": -6.961663246154785, "global_step": 188980, "epoch": 4499} {"train_loss": -7.223125457763672, "global_step": 188981, "epoch": 4499} {"train_loss": -7.082520484924316, "global_step": 188982, "epoch": 4499} {"train_loss": -7.038005352020264, "global_step": 188983, "epoch": 4499} {"train_loss": -7.218266487121582, "global_step": 188984, "epoch": 4499} {"train_loss": -7.045784950256348, "global_step": 188985, "epoch": 4499} {"train_loss": -7.160187244415283, "global_step": 188986, "epoch": 4499} {"train_loss": -7.127616882324219, "global_step": 188987, "epoch": 4499} {"train_loss": -7.107470989227295, "global_step": 188988, "epoch": 4499} {"train_loss": -7.213772773742676, "global_step": 188989, "epoch": 4499} {"train_loss": -7.180559158325195, "global_step": 188990, "epoch": 4499} {"train_loss": -7.150529861450195, "global_step": 188991, "epoch": 4499} {"train_loss": -7.199093341827393, "global_step": 188992, "epoch": 4499} {"train_loss": -7.286983489990234, "global_step": 188993, "epoch": 4499} {"train_loss": -7.178373336791992, "global_step": 188994, "epoch": 4499} {"train_loss": -7.230199813842773, "global_step": 188995, "epoch": 4499} {"train_loss": -7.2027387619018555, "global_step": 188996, "epoch": 4499} {"train_loss": -7.221114158630371, "global_step": 188997, "epoch": 4499} {"train_loss": -7.231931686401367, "global_step": 188998, "epoch": 4499} {"train_loss": -7.104897408258347, "global_step": 188999, "epoch": 4499, "val_loss": 68857.9140625} {"train_loss": -7.152523517608643, "global_step": 189000, "epoch": 4500} {"train_loss": -7.117942810058594, "global_step": 189001, "epoch": 4500} {"train_loss": -7.1291327476501465, "global_step": 189002, "epoch": 4500} {"train_loss": -7.249179840087891, "global_step": 189003, "epoch": 4500} {"train_loss": -7.173920631408691, "global_step": 189004, "epoch": 4500} {"train_loss": -7.159897327423096, "global_step": 189005, "epoch": 4500} {"train_loss": -7.216513633728027, "global_step": 189006, "epoch": 4500} {"train_loss": -7.169674873352051, "global_step": 189007, "epoch": 4500} {"train_loss": -7.183215141296387, "global_step": 189008, "epoch": 4500} {"train_loss": -7.208500385284424, "global_step": 189009, "epoch": 4500} {"train_loss": -7.203493118286133, "global_step": 189010, "epoch": 4500} {"train_loss": -7.157186508178711, "global_step": 189011, "epoch": 4500} {"train_loss": -7.274425029754639, "global_step": 189012, "epoch": 4500} {"train_loss": -7.220710754394531, "global_step": 189013, "epoch": 4500} {"train_loss": -7.254705429077148, "global_step": 189014, "epoch": 4500} {"train_loss": -7.203982353210449, "global_step": 189015, "epoch": 4500} {"train_loss": -7.368019104003906, "global_step": 189016, "epoch": 4500} {"train_loss": -7.256918907165527, "global_step": 189017, "epoch": 4500} {"train_loss": -7.113836288452148, "global_step": 189018, "epoch": 4500} {"train_loss": -7.150979042053223, "global_step": 189019, "epoch": 4500} {"train_loss": -7.107183933258057, "global_step": 189020, "epoch": 4500} {"train_loss": -7.106285095214844, "global_step": 189021, "epoch": 4500} {"train_loss": -7.244106292724609, "global_step": 189022, "epoch": 4500} {"train_loss": -7.056903839111328, "global_step": 189023, "epoch": 4500} {"train_loss": -7.088903427124023, "global_step": 189024, "epoch": 4500} {"train_loss": -7.170543670654297, "global_step": 189025, "epoch": 4500} {"train_loss": -7.113116264343262, "global_step": 189026, "epoch": 4500} {"train_loss": -7.237959861755371, "global_step": 189027, "epoch": 4500} {"train_loss": -7.167287826538086, "global_step": 189028, "epoch": 4500} {"train_loss": -7.171658515930176, "global_step": 189029, "epoch": 4500} {"train_loss": -7.1215105056762695, "global_step": 189030, "epoch": 4500} {"train_loss": -7.258479595184326, "global_step": 189031, "epoch": 4500} {"train_loss": -7.143794536590576, "global_step": 189032, "epoch": 4500} {"train_loss": -7.1702117919921875, "global_step": 189033, "epoch": 4500} {"train_loss": -7.00105094909668, "global_step": 189034, "epoch": 4500} {"train_loss": -7.180354118347168, "global_step": 189035, "epoch": 4500} {"train_loss": -7.212390899658203, "global_step": 189036, "epoch": 4500} {"train_loss": -7.162537097930908, "global_step": 189037, "epoch": 4500} {"train_loss": -7.138763427734375, "global_step": 189038, "epoch": 4500} {"train_loss": -7.099821090698242, "global_step": 189039, "epoch": 4500} {"train_loss": -7.152358055114746, "global_step": 189040, "epoch": 4500} {"train_loss": -7.172273885636103, "global_step": 189041, "epoch": 4500, "train/sim_max_reward_0": 0.28324698108789687, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.6141393522149556, "train/sim_max_reward_3": 0.13297920540813668, "train/sim_max_reward_4": 0.35567439382797156, "train/sim_max_reward_5": 0.9586439661624863, "test/sim_max_reward_4400000": 0.9067806190924199, "test/sim_max_reward_4400001": 0.2652285325178918, "test/sim_max_reward_4400002": 0.17070024381742593, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.24946213169329332, "test/sim_max_reward_4400006": 0.9906372037283985, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3122990445974901, "test/sim_max_reward_4400009": 0.9862690194000445, "test/sim_max_reward_4400010": 0.2521872207590596, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9713318388147494, "test/sim_max_reward_4400013": 0.9200219047380889, "test/sim_max_reward_4400014": 0.9479432822424181, "test/sim_max_reward_4400015": 0.0015460886353572696, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.33104380047364007, "test/sim_max_reward_4400018": 0.26106121699912305, "test/sim_max_reward_4400019": 0.9507509519543453, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.9052340956077166, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.2679543254694816, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0010306802036420598, "test/sim_max_reward_4400028": 0.7299626593800209, "test/sim_max_reward_4400029": 0.9183001716384568, "test/sim_max_reward_4400030": 0.9746353954299989, "test/sim_max_reward_4400031": 0.9567833607077224, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9962066960463908, "test/sim_max_reward_4400034": 0.9719866738951759, "test/sim_max_reward_4400035": 0.8075922078845049, "test/sim_max_reward_4400036": 0.43244215802430586, "test/sim_max_reward_4400037": 0.9316079267450821, "test/sim_max_reward_4400038": 0.8821776626880966, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9743767688395669, "test/sim_max_reward_4400042": 0.9935630922001087, "test/sim_max_reward_4400043": 0.06656106995910795, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9712404966895467, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.9897935817849464, "test/sim_max_reward_4400048": 0.4476659419788278, "test/sim_max_reward_4400049": 0.8784323622516649, "train/mean_score": 0.5574473164502413, "test/mean_score": 0.5851904495969394, "val_loss": 69046.96875} {"train_loss": -7.169075012207031, "global_step": 189042, "epoch": 4501} {"train_loss": -7.119366645812988, "global_step": 189043, "epoch": 4501} {"train_loss": -7.246923446655273, "global_step": 189044, "epoch": 4501} {"train_loss": -7.150674343109131, "global_step": 189045, "epoch": 4501} {"train_loss": -7.086297512054443, "global_step": 189046, "epoch": 4501} {"train_loss": -7.1736626625061035, "global_step": 189047, "epoch": 4501} {"train_loss": -7.142636299133301, "global_step": 189048, "epoch": 4501} {"train_loss": -7.202457427978516, "global_step": 189049, "epoch": 4501} {"train_loss": -7.267151832580566, "global_step": 189050, "epoch": 4501} {"train_loss": -7.2244181632995605, "global_step": 189051, "epoch": 4501} {"train_loss": -7.188950538635254, "global_step": 189052, "epoch": 4501} {"train_loss": -7.1748127937316895, "global_step": 189053, "epoch": 4501} {"train_loss": -7.126368045806885, "global_step": 189054, "epoch": 4501} {"train_loss": -7.1209540367126465, "global_step": 189055, "epoch": 4501} {"train_loss": -7.110681056976318, "global_step": 189056, "epoch": 4501} {"train_loss": -7.20819616317749, "global_step": 189057, "epoch": 4501} {"train_loss": -7.1509904861450195, "global_step": 189058, "epoch": 4501} {"train_loss": -7.027862548828125, "global_step": 189059, "epoch": 4501} {"train_loss": -6.950481414794922, "global_step": 189060, "epoch": 4501} {"train_loss": -7.154548645019531, "global_step": 189061, "epoch": 4501} {"train_loss": -7.075438499450684, "global_step": 189062, "epoch": 4501} {"train_loss": -7.014244079589844, "global_step": 189063, "epoch": 4501} {"train_loss": -7.101903438568115, "global_step": 189064, "epoch": 4501} {"train_loss": -7.026352882385254, "global_step": 189065, "epoch": 4501} {"train_loss": -6.953497409820557, "global_step": 189066, "epoch": 4501} {"train_loss": -7.137138366699219, "global_step": 189067, "epoch": 4501} {"train_loss": -7.122483253479004, "global_step": 189068, "epoch": 4501} {"train_loss": -6.913968086242676, "global_step": 189069, "epoch": 4501} {"train_loss": -7.158871650695801, "global_step": 189070, "epoch": 4501} {"train_loss": -7.113243103027344, "global_step": 189071, "epoch": 4501} {"train_loss": -7.09305477142334, "global_step": 189072, "epoch": 4501} {"train_loss": -7.025478363037109, "global_step": 189073, "epoch": 4501} {"train_loss": -7.003449440002441, "global_step": 189074, "epoch": 4501} {"train_loss": -7.1180572509765625, "global_step": 189075, "epoch": 4501} {"train_loss": -7.140072822570801, "global_step": 189076, "epoch": 4501} {"train_loss": -7.081354141235352, "global_step": 189077, "epoch": 4501} {"train_loss": -7.179250717163086, "global_step": 189078, "epoch": 4501} {"train_loss": -7.100981712341309, "global_step": 189079, "epoch": 4501} {"train_loss": -7.049102306365967, "global_step": 189080, "epoch": 4501} {"train_loss": -7.074862480163574, "global_step": 189081, "epoch": 4501} {"train_loss": -7.029293060302734, "global_step": 189082, "epoch": 4501} {"train_loss": -7.11083848135812, "global_step": 189083, "epoch": 4501, "val_loss": 68862.5859375} {"train_loss": -7.157524585723877, "global_step": 189084, "epoch": 4502} {"train_loss": -7.167305946350098, "global_step": 189085, "epoch": 4502} {"train_loss": -7.304841995239258, "global_step": 189086, "epoch": 4502} {"train_loss": -7.193768501281738, "global_step": 189087, "epoch": 4502} {"train_loss": -7.1630473136901855, "global_step": 189088, "epoch": 4502} {"train_loss": -7.233250617980957, "global_step": 189089, "epoch": 4502} {"train_loss": -7.25056791305542, "global_step": 189090, "epoch": 4502} {"train_loss": -7.181238174438477, "global_step": 189091, "epoch": 4502} {"train_loss": -7.279933929443359, "global_step": 189092, "epoch": 4502} {"train_loss": -7.154892921447754, "global_step": 189093, "epoch": 4502} {"train_loss": -7.171756267547607, "global_step": 189094, "epoch": 4502} {"train_loss": -7.158863067626953, "global_step": 189095, "epoch": 4502} {"train_loss": -7.149646759033203, "global_step": 189096, "epoch": 4502} {"train_loss": -7.240222930908203, "global_step": 189097, "epoch": 4502} {"train_loss": -7.189676761627197, "global_step": 189098, "epoch": 4502} {"train_loss": -7.18583869934082, "global_step": 189099, "epoch": 4502} {"train_loss": -7.105246543884277, "global_step": 189100, "epoch": 4502} {"train_loss": -7.075771331787109, "global_step": 189101, "epoch": 4502} {"train_loss": -7.172420501708984, "global_step": 189102, "epoch": 4502} {"train_loss": -7.190860271453857, "global_step": 189103, "epoch": 4502} {"train_loss": -7.082854270935059, "global_step": 189104, "epoch": 4502} {"train_loss": -7.067451477050781, "global_step": 189105, "epoch": 4502} {"train_loss": -7.076745510101318, "global_step": 189106, "epoch": 4502} {"train_loss": -7.091435432434082, "global_step": 189107, "epoch": 4502} {"train_loss": -7.043516159057617, "global_step": 189108, "epoch": 4502} {"train_loss": -7.20738410949707, "global_step": 189109, "epoch": 4502} {"train_loss": -7.048670768737793, "global_step": 189110, "epoch": 4502} {"train_loss": -7.1248579025268555, "global_step": 189111, "epoch": 4502} {"train_loss": -7.026994705200195, "global_step": 189112, "epoch": 4502} {"train_loss": -7.0337443351745605, "global_step": 189113, "epoch": 4502} {"train_loss": -7.128807067871094, "global_step": 189114, "epoch": 4502} {"train_loss": -6.960181713104248, "global_step": 189115, "epoch": 4502} {"train_loss": -7.098117828369141, "global_step": 189116, "epoch": 4502} {"train_loss": -7.096961975097656, "global_step": 189117, "epoch": 4502} {"train_loss": -7.029232978820801, "global_step": 189118, "epoch": 4502} {"train_loss": -7.056962013244629, "global_step": 189119, "epoch": 4502} {"train_loss": -6.794251441955566, "global_step": 189120, "epoch": 4502} {"train_loss": -7.106058120727539, "global_step": 189121, "epoch": 4502} {"train_loss": -6.938675880432129, "global_step": 189122, "epoch": 4502} {"train_loss": -7.075023174285889, "global_step": 189123, "epoch": 4502} {"train_loss": -6.962792873382568, "global_step": 189124, "epoch": 4502} {"train_loss": -7.11826753616333, "global_step": 189125, "epoch": 4502, "val_loss": 68936.2578125} {"train_loss": -7.119574546813965, "global_step": 189126, "epoch": 4503} {"train_loss": -7.066176414489746, "global_step": 189127, "epoch": 4503} {"train_loss": -7.14142370223999, "global_step": 189128, "epoch": 4503} {"train_loss": -7.106062889099121, "global_step": 189129, "epoch": 4503} {"train_loss": -7.1827898025512695, "global_step": 189130, "epoch": 4503} {"train_loss": -7.161836624145508, "global_step": 189131, "epoch": 4503} {"train_loss": -7.189064025878906, "global_step": 189132, "epoch": 4503} {"train_loss": -7.106316089630127, "global_step": 189133, "epoch": 4503} {"train_loss": -7.17919921875, "global_step": 189134, "epoch": 4503} {"train_loss": -7.16603946685791, "global_step": 189135, "epoch": 4503} {"train_loss": -7.112656116485596, "global_step": 189136, "epoch": 4503} {"train_loss": -7.286334037780762, "global_step": 189137, "epoch": 4503} {"train_loss": -7.186073303222656, "global_step": 189138, "epoch": 4503} {"train_loss": -7.083540439605713, "global_step": 189139, "epoch": 4503} {"train_loss": -7.1154584884643555, "global_step": 189140, "epoch": 4503} {"train_loss": -7.162375450134277, "global_step": 189141, "epoch": 4503} {"train_loss": -7.103710174560547, "global_step": 189142, "epoch": 4503} {"train_loss": -7.155799388885498, "global_step": 189143, "epoch": 4503} {"train_loss": -7.126523017883301, "global_step": 189144, "epoch": 4503} {"train_loss": -7.152706146240234, "global_step": 189145, "epoch": 4503} {"train_loss": -7.058757781982422, "global_step": 189146, "epoch": 4503} {"train_loss": -7.0966033935546875, "global_step": 189147, "epoch": 4503} {"train_loss": -7.133242607116699, "global_step": 189148, "epoch": 4503} {"train_loss": -7.008461952209473, "global_step": 189149, "epoch": 4503} {"train_loss": -7.200974464416504, "global_step": 189150, "epoch": 4503} {"train_loss": -6.909981727600098, "global_step": 189151, "epoch": 4503} {"train_loss": -7.040065288543701, "global_step": 189152, "epoch": 4503} {"train_loss": -7.112009048461914, "global_step": 189153, "epoch": 4503} {"train_loss": -7.083560943603516, "global_step": 189154, "epoch": 4503} {"train_loss": -7.232132911682129, "global_step": 189155, "epoch": 4503} {"train_loss": -7.094977378845215, "global_step": 189156, "epoch": 4503} {"train_loss": -7.051941394805908, "global_step": 189157, "epoch": 4503} {"train_loss": -7.132881164550781, "global_step": 189158, "epoch": 4503} {"train_loss": -7.018772125244141, "global_step": 189159, "epoch": 4503} {"train_loss": -7.132132530212402, "global_step": 189160, "epoch": 4503} {"train_loss": -6.938838005065918, "global_step": 189161, "epoch": 4503} {"train_loss": -7.146796226501465, "global_step": 189162, "epoch": 4503} {"train_loss": -7.045346736907959, "global_step": 189163, "epoch": 4503} {"train_loss": -7.1542510986328125, "global_step": 189164, "epoch": 4503} {"train_loss": -7.106213569641113, "global_step": 189165, "epoch": 4503} {"train_loss": -7.12736177444458, "global_step": 189166, "epoch": 4503} {"train_loss": -7.110756851377941, "global_step": 189167, "epoch": 4503, "val_loss": 68839.5078125} {"train_loss": -7.238724708557129, "global_step": 189168, "epoch": 4504} {"train_loss": -7.241734027862549, "global_step": 189169, "epoch": 4504} {"train_loss": -7.139382362365723, "global_step": 189170, "epoch": 4504} {"train_loss": -7.248251914978027, "global_step": 189171, "epoch": 4504} {"train_loss": -7.184375762939453, "global_step": 189172, "epoch": 4504} {"train_loss": -7.122228145599365, "global_step": 189173, "epoch": 4504} {"train_loss": -7.225655555725098, "global_step": 189174, "epoch": 4504} {"train_loss": -7.180385589599609, "global_step": 189175, "epoch": 4504} {"train_loss": -7.159003257751465, "global_step": 189176, "epoch": 4504} {"train_loss": -7.126090049743652, "global_step": 189177, "epoch": 4504} {"train_loss": -7.213561058044434, "global_step": 189178, "epoch": 4504} {"train_loss": -7.1306939125061035, "global_step": 189179, "epoch": 4504} {"train_loss": -7.215109348297119, "global_step": 189180, "epoch": 4504} {"train_loss": -7.194561958312988, "global_step": 189181, "epoch": 4504} {"train_loss": -7.146507740020752, "global_step": 189182, "epoch": 4504} {"train_loss": -7.221437454223633, "global_step": 189183, "epoch": 4504} {"train_loss": -7.233395576477051, "global_step": 189184, "epoch": 4504} {"train_loss": -7.164433479309082, "global_step": 189185, "epoch": 4504} {"train_loss": -7.2524943351745605, "global_step": 189186, "epoch": 4504} {"train_loss": -7.1136603355407715, "global_step": 189187, "epoch": 4504} {"train_loss": -7.133541584014893, "global_step": 189188, "epoch": 4504} {"train_loss": -7.280218124389648, "global_step": 189189, "epoch": 4504} {"train_loss": -7.196012496948242, "global_step": 189190, "epoch": 4504} {"train_loss": -7.187414169311523, "global_step": 189191, "epoch": 4504} {"train_loss": -7.09155797958374, "global_step": 189192, "epoch": 4504} {"train_loss": -7.241676330566406, "global_step": 189193, "epoch": 4504} {"train_loss": -7.303788185119629, "global_step": 189194, "epoch": 4504} {"train_loss": -7.198544502258301, "global_step": 189195, "epoch": 4504} {"train_loss": -7.156447410583496, "global_step": 189196, "epoch": 4504} {"train_loss": -7.240965366363525, "global_step": 189197, "epoch": 4504} {"train_loss": -7.087727069854736, "global_step": 189198, "epoch": 4504} {"train_loss": -7.1719136238098145, "global_step": 189199, "epoch": 4504} {"train_loss": -7.2967681884765625, "global_step": 189200, "epoch": 4504} {"train_loss": -7.138253688812256, "global_step": 189201, "epoch": 4504} {"train_loss": -7.080094337463379, "global_step": 189202, "epoch": 4504} {"train_loss": -7.04868221282959, "global_step": 189203, "epoch": 4504} {"train_loss": -7.125007629394531, "global_step": 189204, "epoch": 4504} {"train_loss": -7.065074443817139, "global_step": 189205, "epoch": 4504} {"train_loss": -7.095070838928223, "global_step": 189206, "epoch": 4504} {"train_loss": -7.065884113311768, "global_step": 189207, "epoch": 4504} {"train_loss": -7.005662441253662, "global_step": 189208, "epoch": 4504} {"train_loss": -7.162215255555653, "global_step": 189209, "epoch": 4504, "val_loss": 69143.28125} {"train_loss": -7.238764762878418, "global_step": 189210, "epoch": 4505} {"train_loss": -6.9311347007751465, "global_step": 189211, "epoch": 4505} {"train_loss": -6.933515548706055, "global_step": 189212, "epoch": 4505} {"train_loss": -7.093202114105225, "global_step": 189213, "epoch": 4505} {"train_loss": -7.123616695404053, "global_step": 189214, "epoch": 4505} {"train_loss": -7.160252571105957, "global_step": 189215, "epoch": 4505} {"train_loss": -7.142956256866455, "global_step": 189216, "epoch": 4505} {"train_loss": -7.110357284545898, "global_step": 189217, "epoch": 4505} {"train_loss": -7.1405134201049805, "global_step": 189218, "epoch": 4505} {"train_loss": -7.032896995544434, "global_step": 189219, "epoch": 4505} {"train_loss": -7.056000709533691, "global_step": 189220, "epoch": 4505} {"train_loss": -7.019250392913818, "global_step": 189221, "epoch": 4505} {"train_loss": -7.151845932006836, "global_step": 189222, "epoch": 4505} {"train_loss": -7.152584075927734, "global_step": 189223, "epoch": 4505} {"train_loss": -7.124607086181641, "global_step": 189224, "epoch": 4505} {"train_loss": -7.165215492248535, "global_step": 189225, "epoch": 4505} {"train_loss": -7.1318182945251465, "global_step": 189226, "epoch": 4505} {"train_loss": -7.198464870452881, "global_step": 189227, "epoch": 4505} {"train_loss": -7.050065040588379, "global_step": 189228, "epoch": 4505} {"train_loss": -7.154635906219482, "global_step": 189229, "epoch": 4505} {"train_loss": -7.10861873626709, "global_step": 189230, "epoch": 4505} {"train_loss": -7.065773963928223, "global_step": 189231, "epoch": 4505} {"train_loss": -7.215489387512207, "global_step": 189232, "epoch": 4505} {"train_loss": -7.269909858703613, "global_step": 189233, "epoch": 4505} {"train_loss": -7.013902187347412, "global_step": 189234, "epoch": 4505} {"train_loss": -7.201605796813965, "global_step": 189235, "epoch": 4505} {"train_loss": -7.18222713470459, "global_step": 189236, "epoch": 4505} {"train_loss": -7.0704193115234375, "global_step": 189237, "epoch": 4505} {"train_loss": -7.158377170562744, "global_step": 189238, "epoch": 4505} {"train_loss": -7.096810340881348, "global_step": 189239, "epoch": 4505} {"train_loss": -7.154278755187988, "global_step": 189240, "epoch": 4505} {"train_loss": -7.201284408569336, "global_step": 189241, "epoch": 4505} {"train_loss": -7.138856410980225, "global_step": 189242, "epoch": 4505} {"train_loss": -7.202275276184082, "global_step": 189243, "epoch": 4505} {"train_loss": -7.157793998718262, "global_step": 189244, "epoch": 4505} {"train_loss": -7.241194725036621, "global_step": 189245, "epoch": 4505} {"train_loss": -7.142547607421875, "global_step": 189246, "epoch": 4505} {"train_loss": -7.187673568725586, "global_step": 189247, "epoch": 4505} {"train_loss": -7.222966194152832, "global_step": 189248, "epoch": 4505} {"train_loss": -7.029429912567139, "global_step": 189249, "epoch": 4505} {"train_loss": -7.143123626708984, "global_step": 189250, "epoch": 4505} {"train_loss": -7.132358040128436, "global_step": 189251, "epoch": 4505, "val_loss": 68852.8203125} {"train_loss": -7.165510177612305, "global_step": 189252, "epoch": 4506} {"train_loss": -7.028631687164307, "global_step": 189253, "epoch": 4506} {"train_loss": -7.180253982543945, "global_step": 189254, "epoch": 4506} {"train_loss": -7.154254913330078, "global_step": 189255, "epoch": 4506} {"train_loss": -7.187517166137695, "global_step": 189256, "epoch": 4506} {"train_loss": -7.215909004211426, "global_step": 189257, "epoch": 4506} {"train_loss": -7.157476425170898, "global_step": 189258, "epoch": 4506} {"train_loss": -7.257351398468018, "global_step": 189259, "epoch": 4506} {"train_loss": -7.236175537109375, "global_step": 189260, "epoch": 4506} {"train_loss": -7.246422290802002, "global_step": 189261, "epoch": 4506} {"train_loss": -7.232770919799805, "global_step": 189262, "epoch": 4506} {"train_loss": -7.181487083435059, "global_step": 189263, "epoch": 4506} {"train_loss": -7.220153331756592, "global_step": 189264, "epoch": 4506} {"train_loss": -7.207111835479736, "global_step": 189265, "epoch": 4506} {"train_loss": -7.10719108581543, "global_step": 189266, "epoch": 4506} {"train_loss": -7.212961196899414, "global_step": 189267, "epoch": 4506} {"train_loss": -7.1493611335754395, "global_step": 189268, "epoch": 4506} {"train_loss": -7.2307891845703125, "global_step": 189269, "epoch": 4506} {"train_loss": -7.275293350219727, "global_step": 189270, "epoch": 4506} {"train_loss": -7.289710998535156, "global_step": 189271, "epoch": 4506} {"train_loss": -7.173897743225098, "global_step": 189272, "epoch": 4506} {"train_loss": -7.231424331665039, "global_step": 189273, "epoch": 4506} {"train_loss": -7.261468410491943, "global_step": 189274, "epoch": 4506} {"train_loss": -7.277707099914551, "global_step": 189275, "epoch": 4506} {"train_loss": -7.237819671630859, "global_step": 189276, "epoch": 4506} {"train_loss": -7.212778568267822, "global_step": 189277, "epoch": 4506} {"train_loss": -7.160082817077637, "global_step": 189278, "epoch": 4506} {"train_loss": -7.214062213897705, "global_step": 189279, "epoch": 4506} {"train_loss": -7.009883880615234, "global_step": 189280, "epoch": 4506} {"train_loss": -7.0851874351501465, "global_step": 189281, "epoch": 4506} {"train_loss": -7.228144645690918, "global_step": 189282, "epoch": 4506} {"train_loss": -7.162395477294922, "global_step": 189283, "epoch": 4506} {"train_loss": -6.997189521789551, "global_step": 189284, "epoch": 4506} {"train_loss": -7.034691333770752, "global_step": 189285, "epoch": 4506} {"train_loss": -7.190364837646484, "global_step": 189286, "epoch": 4506} {"train_loss": -7.081472396850586, "global_step": 189287, "epoch": 4506} {"train_loss": -7.124662399291992, "global_step": 189288, "epoch": 4506} {"train_loss": -7.041568756103516, "global_step": 189289, "epoch": 4506} {"train_loss": -6.908898830413818, "global_step": 189290, "epoch": 4506} {"train_loss": -7.086601257324219, "global_step": 189291, "epoch": 4506} {"train_loss": -7.136277675628662, "global_step": 189292, "epoch": 4506} {"train_loss": -7.16139090628851, "global_step": 189293, "epoch": 4506, "val_loss": 69047.5546875} {"train_loss": -7.121088981628418, "global_step": 189294, "epoch": 4507} {"train_loss": -6.970355033874512, "global_step": 189295, "epoch": 4507} {"train_loss": -6.968186378479004, "global_step": 189296, "epoch": 4507} {"train_loss": -7.038216590881348, "global_step": 189297, "epoch": 4507} {"train_loss": -7.1123552322387695, "global_step": 189298, "epoch": 4507} {"train_loss": -7.068819046020508, "global_step": 189299, "epoch": 4507} {"train_loss": -7.015143394470215, "global_step": 189300, "epoch": 4507} {"train_loss": -7.187751770019531, "global_step": 189301, "epoch": 4507} {"train_loss": -7.04832649230957, "global_step": 189302, "epoch": 4507} {"train_loss": -6.99766731262207, "global_step": 189303, "epoch": 4507} {"train_loss": -7.113964557647705, "global_step": 189304, "epoch": 4507} {"train_loss": -7.1146931648254395, "global_step": 189305, "epoch": 4507} {"train_loss": -7.139219284057617, "global_step": 189306, "epoch": 4507} {"train_loss": -7.042078971862793, "global_step": 189307, "epoch": 4507} {"train_loss": -7.0362067222595215, "global_step": 189308, "epoch": 4507} {"train_loss": -7.105792999267578, "global_step": 189309, "epoch": 4507} {"train_loss": -7.132615566253662, "global_step": 189310, "epoch": 4507} {"train_loss": -7.2145256996154785, "global_step": 189311, "epoch": 4507} {"train_loss": -7.026402473449707, "global_step": 189312, "epoch": 4507} {"train_loss": -7.116592884063721, "global_step": 189313, "epoch": 4507} {"train_loss": -7.076025485992432, "global_step": 189314, "epoch": 4507} {"train_loss": -7.056078910827637, "global_step": 189315, "epoch": 4507} {"train_loss": -7.141820907592773, "global_step": 189316, "epoch": 4507} {"train_loss": -7.012348175048828, "global_step": 189317, "epoch": 4507} {"train_loss": -6.993618488311768, "global_step": 189318, "epoch": 4507} {"train_loss": -7.028256893157959, "global_step": 189319, "epoch": 4507} {"train_loss": -7.096713542938232, "global_step": 189320, "epoch": 4507} {"train_loss": -6.948022842407227, "global_step": 189321, "epoch": 4507} {"train_loss": -6.950247287750244, "global_step": 189322, "epoch": 4507} {"train_loss": -7.161351203918457, "global_step": 189323, "epoch": 4507} {"train_loss": -6.958852291107178, "global_step": 189324, "epoch": 4507} {"train_loss": -6.952834129333496, "global_step": 189325, "epoch": 4507} {"train_loss": -6.9772844314575195, "global_step": 189326, "epoch": 4507} {"train_loss": -6.911717414855957, "global_step": 189327, "epoch": 4507} {"train_loss": -7.065949440002441, "global_step": 189328, "epoch": 4507} {"train_loss": -6.923648834228516, "global_step": 189329, "epoch": 4507} {"train_loss": -6.965975761413574, "global_step": 189330, "epoch": 4507} {"train_loss": -7.0805206298828125, "global_step": 189331, "epoch": 4507} {"train_loss": -7.080923080444336, "global_step": 189332, "epoch": 4507} {"train_loss": -7.116358757019043, "global_step": 189333, "epoch": 4507} {"train_loss": -7.06627082824707, "global_step": 189334, "epoch": 4507} {"train_loss": -7.054717779159546, "global_step": 189335, "epoch": 4507, "val_loss": 68878.0625} {"train_loss": -7.027817249298096, "global_step": 189336, "epoch": 4508} {"train_loss": -6.9976887702941895, "global_step": 189337, "epoch": 4508} {"train_loss": -7.00214958190918, "global_step": 189338, "epoch": 4508} {"train_loss": -7.075062274932861, "global_step": 189339, "epoch": 4508} {"train_loss": -6.994368076324463, "global_step": 189340, "epoch": 4508} {"train_loss": -7.094492435455322, "global_step": 189341, "epoch": 4508} {"train_loss": -6.960782051086426, "global_step": 189342, "epoch": 4508} {"train_loss": -7.08266544342041, "global_step": 189343, "epoch": 4508} {"train_loss": -6.9343485832214355, "global_step": 189344, "epoch": 4508} {"train_loss": -7.126999378204346, "global_step": 189345, "epoch": 4508} {"train_loss": -7.149318695068359, "global_step": 189346, "epoch": 4508} {"train_loss": -7.12416934967041, "global_step": 189347, "epoch": 4508} {"train_loss": -6.9888529777526855, "global_step": 189348, "epoch": 4508} {"train_loss": -7.101239204406738, "global_step": 189349, "epoch": 4508} {"train_loss": -7.122001647949219, "global_step": 189350, "epoch": 4508} {"train_loss": -7.220266342163086, "global_step": 189351, "epoch": 4508} {"train_loss": -7.026177406311035, "global_step": 189352, "epoch": 4508} {"train_loss": -7.239241600036621, "global_step": 189353, "epoch": 4508} {"train_loss": -7.120510101318359, "global_step": 189354, "epoch": 4508} {"train_loss": -7.101400375366211, "global_step": 189355, "epoch": 4508} {"train_loss": -7.119603157043457, "global_step": 189356, "epoch": 4508} {"train_loss": -7.081734657287598, "global_step": 189357, "epoch": 4508} {"train_loss": -7.102581024169922, "global_step": 189358, "epoch": 4508} {"train_loss": -7.0881476402282715, "global_step": 189359, "epoch": 4508} {"train_loss": -6.983593940734863, "global_step": 189360, "epoch": 4508} {"train_loss": -7.086082935333252, "global_step": 189361, "epoch": 4508} {"train_loss": -7.211989879608154, "global_step": 189362, "epoch": 4508} {"train_loss": -7.1046223640441895, "global_step": 189363, "epoch": 4508} {"train_loss": -6.9978556632995605, "global_step": 189364, "epoch": 4508} {"train_loss": -7.156057357788086, "global_step": 189365, "epoch": 4508} {"train_loss": -7.0447845458984375, "global_step": 189366, "epoch": 4508} {"train_loss": -7.117177963256836, "global_step": 189367, "epoch": 4508} {"train_loss": -7.052840232849121, "global_step": 189368, "epoch": 4508} {"train_loss": -7.0852580070495605, "global_step": 189369, "epoch": 4508} {"train_loss": -7.055235385894775, "global_step": 189370, "epoch": 4508} {"train_loss": -7.0592241287231445, "global_step": 189371, "epoch": 4508} {"train_loss": -7.066021919250488, "global_step": 189372, "epoch": 4508} {"train_loss": -6.982469081878662, "global_step": 189373, "epoch": 4508} {"train_loss": -7.029372215270996, "global_step": 189374, "epoch": 4508} {"train_loss": -7.055610179901123, "global_step": 189375, "epoch": 4508} {"train_loss": -7.047983169555664, "global_step": 189376, "epoch": 4508} {"train_loss": -7.072508777890887, "global_step": 189377, "epoch": 4508, "val_loss": 68926.40625} {"train_loss": -7.13389778137207, "global_step": 189378, "epoch": 4509} {"train_loss": -7.154945373535156, "global_step": 189379, "epoch": 4509} {"train_loss": -7.063819885253906, "global_step": 189380, "epoch": 4509} {"train_loss": -7.112910270690918, "global_step": 189381, "epoch": 4509} {"train_loss": -7.20585298538208, "global_step": 189382, "epoch": 4509} {"train_loss": -7.085731029510498, "global_step": 189383, "epoch": 4509} {"train_loss": -7.1093268394470215, "global_step": 189384, "epoch": 4509} {"train_loss": -7.092812538146973, "global_step": 189385, "epoch": 4509} {"train_loss": -7.0635833740234375, "global_step": 189386, "epoch": 4509} {"train_loss": -7.174269676208496, "global_step": 189387, "epoch": 4509} {"train_loss": -7.092654228210449, "global_step": 189388, "epoch": 4509} {"train_loss": -7.148336887359619, "global_step": 189389, "epoch": 4509} {"train_loss": -7.025214195251465, "global_step": 189390, "epoch": 4509} {"train_loss": -7.236149787902832, "global_step": 189391, "epoch": 4509} {"train_loss": -7.203915119171143, "global_step": 189392, "epoch": 4509} {"train_loss": -7.232184410095215, "global_step": 189393, "epoch": 4509} {"train_loss": -7.229070663452148, "global_step": 189394, "epoch": 4509} {"train_loss": -7.129123687744141, "global_step": 189395, "epoch": 4509} {"train_loss": -7.222801685333252, "global_step": 189396, "epoch": 4509} {"train_loss": -7.063084602355957, "global_step": 189397, "epoch": 4509} {"train_loss": -7.120705604553223, "global_step": 189398, "epoch": 4509} {"train_loss": -7.093833923339844, "global_step": 189399, "epoch": 4509} {"train_loss": -7.138784408569336, "global_step": 189400, "epoch": 4509} {"train_loss": -7.165534019470215, "global_step": 189401, "epoch": 4509} {"train_loss": -7.2377729415893555, "global_step": 189402, "epoch": 4509} {"train_loss": -7.1173601150512695, "global_step": 189403, "epoch": 4509} {"train_loss": -7.139065265655518, "global_step": 189404, "epoch": 4509} {"train_loss": -7.14585018157959, "global_step": 189405, "epoch": 4509} {"train_loss": -7.156129837036133, "global_step": 189406, "epoch": 4509} {"train_loss": -7.231340408325195, "global_step": 189407, "epoch": 4509} {"train_loss": -7.314324378967285, "global_step": 189408, "epoch": 4509} {"train_loss": -7.242698669433594, "global_step": 189409, "epoch": 4509} {"train_loss": -7.2929887771606445, "global_step": 189410, "epoch": 4509} {"train_loss": -7.230301856994629, "global_step": 189411, "epoch": 4509} {"train_loss": -7.159515380859375, "global_step": 189412, "epoch": 4509} {"train_loss": -7.218842029571533, "global_step": 189413, "epoch": 4509} {"train_loss": -7.222014427185059, "global_step": 189414, "epoch": 4509} {"train_loss": -7.213174819946289, "global_step": 189415, "epoch": 4509} {"train_loss": -7.193159103393555, "global_step": 189416, "epoch": 4509} {"train_loss": -7.207286357879639, "global_step": 189417, "epoch": 4509} {"train_loss": -7.184239387512207, "global_step": 189418, "epoch": 4509} {"train_loss": -7.163729588190715, "global_step": 189419, "epoch": 4509, "val_loss": 68864.6015625} {"train_loss": -7.159306049346924, "global_step": 189420, "epoch": 4510} {"train_loss": -7.218405246734619, "global_step": 189421, "epoch": 4510} {"train_loss": -7.117429733276367, "global_step": 189422, "epoch": 4510} {"train_loss": -7.273800373077393, "global_step": 189423, "epoch": 4510} {"train_loss": -7.108888149261475, "global_step": 189424, "epoch": 4510} {"train_loss": -7.254361629486084, "global_step": 189425, "epoch": 4510} {"train_loss": -7.196255207061768, "global_step": 189426, "epoch": 4510} {"train_loss": -7.131337642669678, "global_step": 189427, "epoch": 4510} {"train_loss": -7.148337364196777, "global_step": 189428, "epoch": 4510} {"train_loss": -7.142409324645996, "global_step": 189429, "epoch": 4510} {"train_loss": -7.1931610107421875, "global_step": 189430, "epoch": 4510} {"train_loss": -7.043588638305664, "global_step": 189431, "epoch": 4510} {"train_loss": -7.190086364746094, "global_step": 189432, "epoch": 4510} {"train_loss": -7.197607040405273, "global_step": 189433, "epoch": 4510} {"train_loss": -7.102161884307861, "global_step": 189434, "epoch": 4510} {"train_loss": -7.201700210571289, "global_step": 189435, "epoch": 4510} {"train_loss": -7.111940860748291, "global_step": 189436, "epoch": 4510} {"train_loss": -6.984980583190918, "global_step": 189437, "epoch": 4510} {"train_loss": -7.035144329071045, "global_step": 189438, "epoch": 4510} {"train_loss": -7.0572509765625, "global_step": 189439, "epoch": 4510} {"train_loss": -7.113627910614014, "global_step": 189440, "epoch": 4510} {"train_loss": -7.009434700012207, "global_step": 189441, "epoch": 4510} {"train_loss": -7.105803489685059, "global_step": 189442, "epoch": 4510} {"train_loss": -7.1855363845825195, "global_step": 189443, "epoch": 4510} {"train_loss": -7.08237361907959, "global_step": 189444, "epoch": 4510} {"train_loss": -7.239383220672607, "global_step": 189445, "epoch": 4510} {"train_loss": -7.210673809051514, "global_step": 189446, "epoch": 4510} {"train_loss": -7.061553955078125, "global_step": 189447, "epoch": 4510} {"train_loss": -7.092273712158203, "global_step": 189448, "epoch": 4510} {"train_loss": -7.161829948425293, "global_step": 189449, "epoch": 4510} {"train_loss": -7.14404296875, "global_step": 189450, "epoch": 4510} {"train_loss": -7.155628204345703, "global_step": 189451, "epoch": 4510} {"train_loss": -7.048617839813232, "global_step": 189452, "epoch": 4510} {"train_loss": -7.1363301277160645, "global_step": 189453, "epoch": 4510} {"train_loss": -7.070300102233887, "global_step": 189454, "epoch": 4510} {"train_loss": -6.974791526794434, "global_step": 189455, "epoch": 4510} {"train_loss": -7.058285713195801, "global_step": 189456, "epoch": 4510} {"train_loss": -7.015127182006836, "global_step": 189457, "epoch": 4510} {"train_loss": -7.043376922607422, "global_step": 189458, "epoch": 4510} {"train_loss": -7.147712230682373, "global_step": 189459, "epoch": 4510} {"train_loss": -7.145381927490234, "global_step": 189460, "epoch": 4510} {"train_loss": -7.125746465864635, "global_step": 189461, "epoch": 4510, "val_loss": 68929.28125} {"train_loss": -7.220034122467041, "global_step": 189462, "epoch": 4511} {"train_loss": -7.209824085235596, "global_step": 189463, "epoch": 4511} {"train_loss": -7.229806900024414, "global_step": 189464, "epoch": 4511} {"train_loss": -7.20783805847168, "global_step": 189465, "epoch": 4511} {"train_loss": -7.174612045288086, "global_step": 189466, "epoch": 4511} {"train_loss": -7.097886085510254, "global_step": 189467, "epoch": 4511} {"train_loss": -7.175253868103027, "global_step": 189468, "epoch": 4511} {"train_loss": -7.053223609924316, "global_step": 189469, "epoch": 4511} {"train_loss": -7.260223388671875, "global_step": 189470, "epoch": 4511} {"train_loss": -7.085371017456055, "global_step": 189471, "epoch": 4511} {"train_loss": -7.193796157836914, "global_step": 189472, "epoch": 4511} {"train_loss": -7.204389572143555, "global_step": 189473, "epoch": 4511} {"train_loss": -7.070362091064453, "global_step": 189474, "epoch": 4511} {"train_loss": -7.232278823852539, "global_step": 189475, "epoch": 4511} {"train_loss": -7.122319221496582, "global_step": 189476, "epoch": 4511} {"train_loss": -7.145644187927246, "global_step": 189477, "epoch": 4511} {"train_loss": -7.213827133178711, "global_step": 189478, "epoch": 4511} {"train_loss": -7.219843864440918, "global_step": 189479, "epoch": 4511} {"train_loss": -7.085042953491211, "global_step": 189480, "epoch": 4511} {"train_loss": -7.101232528686523, "global_step": 189481, "epoch": 4511} {"train_loss": -7.148410320281982, "global_step": 189482, "epoch": 4511} {"train_loss": -6.810805797576904, "global_step": 189483, "epoch": 4511} {"train_loss": -7.206572532653809, "global_step": 189484, "epoch": 4511} {"train_loss": -7.062610626220703, "global_step": 189485, "epoch": 4511} {"train_loss": -6.979003429412842, "global_step": 189486, "epoch": 4511} {"train_loss": -7.091190338134766, "global_step": 189487, "epoch": 4511} {"train_loss": -7.089840412139893, "global_step": 189488, "epoch": 4511} {"train_loss": -7.184089660644531, "global_step": 189489, "epoch": 4511} {"train_loss": -7.046811103820801, "global_step": 189490, "epoch": 4511} {"train_loss": -7.009278297424316, "global_step": 189491, "epoch": 4511} {"train_loss": -7.21871280670166, "global_step": 189492, "epoch": 4511} {"train_loss": -7.072806358337402, "global_step": 189493, "epoch": 4511} {"train_loss": -7.205875396728516, "global_step": 189494, "epoch": 4511} {"train_loss": -7.129345893859863, "global_step": 189495, "epoch": 4511} {"train_loss": -7.005030632019043, "global_step": 189496, "epoch": 4511} {"train_loss": -7.121517658233643, "global_step": 189497, "epoch": 4511} {"train_loss": -6.981960296630859, "global_step": 189498, "epoch": 4511} {"train_loss": -7.156763553619385, "global_step": 189499, "epoch": 4511} {"train_loss": -7.0637407302856445, "global_step": 189500, "epoch": 4511} {"train_loss": -7.051692008972168, "global_step": 189501, "epoch": 4511} {"train_loss": -6.971551418304443, "global_step": 189502, "epoch": 4511} {"train_loss": -7.11889310110183, "global_step": 189503, "epoch": 4511, "val_loss": 68988.171875} {"train_loss": -7.047508239746094, "global_step": 189504, "epoch": 4512} {"train_loss": -7.123260974884033, "global_step": 189505, "epoch": 4512} {"train_loss": -7.069721221923828, "global_step": 189506, "epoch": 4512} {"train_loss": -7.082517147064209, "global_step": 189507, "epoch": 4512} {"train_loss": -7.152134895324707, "global_step": 189508, "epoch": 4512} {"train_loss": -7.020876884460449, "global_step": 189509, "epoch": 4512} {"train_loss": -7.199182033538818, "global_step": 189510, "epoch": 4512} {"train_loss": -7.07142448425293, "global_step": 189511, "epoch": 4512} {"train_loss": -7.20754337310791, "global_step": 189512, "epoch": 4512} {"train_loss": -7.019778251647949, "global_step": 189513, "epoch": 4512} {"train_loss": -7.111757755279541, "global_step": 189514, "epoch": 4512} {"train_loss": -7.080199718475342, "global_step": 189515, "epoch": 4512} {"train_loss": -7.1053147315979, "global_step": 189516, "epoch": 4512} {"train_loss": -7.100127220153809, "global_step": 189517, "epoch": 4512} {"train_loss": -6.996966361999512, "global_step": 189518, "epoch": 4512} {"train_loss": -7.1355719566345215, "global_step": 189519, "epoch": 4512} {"train_loss": -7.088786602020264, "global_step": 189520, "epoch": 4512} {"train_loss": -7.187896251678467, "global_step": 189521, "epoch": 4512} {"train_loss": -7.0988359451293945, "global_step": 189522, "epoch": 4512} {"train_loss": -7.135912895202637, "global_step": 189523, "epoch": 4512} {"train_loss": -7.240752696990967, "global_step": 189524, "epoch": 4512} {"train_loss": -7.099270820617676, "global_step": 189525, "epoch": 4512} {"train_loss": -7.10611629486084, "global_step": 189526, "epoch": 4512} {"train_loss": -7.1949567794799805, "global_step": 189527, "epoch": 4512} {"train_loss": -7.091066360473633, "global_step": 189528, "epoch": 4512} {"train_loss": -7.206381797790527, "global_step": 189529, "epoch": 4512} {"train_loss": -7.141179084777832, "global_step": 189530, "epoch": 4512} {"train_loss": -7.084016799926758, "global_step": 189531, "epoch": 4512} {"train_loss": -7.10264253616333, "global_step": 189532, "epoch": 4512} {"train_loss": -7.102443695068359, "global_step": 189533, "epoch": 4512} {"train_loss": -7.216142177581787, "global_step": 189534, "epoch": 4512} {"train_loss": -7.245732307434082, "global_step": 189535, "epoch": 4512} {"train_loss": -7.19212532043457, "global_step": 189536, "epoch": 4512} {"train_loss": -7.157235145568848, "global_step": 189537, "epoch": 4512} {"train_loss": -7.228952407836914, "global_step": 189538, "epoch": 4512} {"train_loss": -7.115973472595215, "global_step": 189539, "epoch": 4512} {"train_loss": -7.185744285583496, "global_step": 189540, "epoch": 4512} {"train_loss": -7.155819416046143, "global_step": 189541, "epoch": 4512} {"train_loss": -7.11894416809082, "global_step": 189542, "epoch": 4512} {"train_loss": -7.161262035369873, "global_step": 189543, "epoch": 4512} {"train_loss": -7.171454429626465, "global_step": 189544, "epoch": 4512} {"train_loss": -7.133721033732097, "global_step": 189545, "epoch": 4512, "val_loss": 68852.8125} {"train_loss": -7.200469017028809, "global_step": 189546, "epoch": 4513} {"train_loss": -7.213785171508789, "global_step": 189547, "epoch": 4513} {"train_loss": -7.150264739990234, "global_step": 189548, "epoch": 4513} {"train_loss": -7.198814392089844, "global_step": 189549, "epoch": 4513} {"train_loss": -7.175574779510498, "global_step": 189550, "epoch": 4513} {"train_loss": -7.091063499450684, "global_step": 189551, "epoch": 4513} {"train_loss": -7.059930801391602, "global_step": 189552, "epoch": 4513} {"train_loss": -7.083347797393799, "global_step": 189553, "epoch": 4513} {"train_loss": -7.0612993240356445, "global_step": 189554, "epoch": 4513} {"train_loss": -7.071274757385254, "global_step": 189555, "epoch": 4513} {"train_loss": -7.176753044128418, "global_step": 189556, "epoch": 4513} {"train_loss": -7.0095744132995605, "global_step": 189557, "epoch": 4513} {"train_loss": -7.042820930480957, "global_step": 189558, "epoch": 4513} {"train_loss": -7.250214576721191, "global_step": 189559, "epoch": 4513} {"train_loss": -7.03504753112793, "global_step": 189560, "epoch": 4513} {"train_loss": -7.106399059295654, "global_step": 189561, "epoch": 4513} {"train_loss": -7.254485130310059, "global_step": 189562, "epoch": 4513} {"train_loss": -7.089347839355469, "global_step": 189563, "epoch": 4513} {"train_loss": -7.149938106536865, "global_step": 189564, "epoch": 4513} {"train_loss": -7.169903755187988, "global_step": 189565, "epoch": 4513} {"train_loss": -7.188012599945068, "global_step": 189566, "epoch": 4513} {"train_loss": -7.216141700744629, "global_step": 189567, "epoch": 4513} {"train_loss": -7.164299964904785, "global_step": 189568, "epoch": 4513} {"train_loss": -7.174839019775391, "global_step": 189569, "epoch": 4513} {"train_loss": -7.273319244384766, "global_step": 189570, "epoch": 4513} {"train_loss": -7.15440034866333, "global_step": 189571, "epoch": 4513} {"train_loss": -7.153043746948242, "global_step": 189572, "epoch": 4513} {"train_loss": -7.238719463348389, "global_step": 189573, "epoch": 4513} {"train_loss": -7.2125372886657715, "global_step": 189574, "epoch": 4513} {"train_loss": -7.284775733947754, "global_step": 189575, "epoch": 4513} {"train_loss": -7.132909774780273, "global_step": 189576, "epoch": 4513} {"train_loss": -7.18120813369751, "global_step": 189577, "epoch": 4513} {"train_loss": -7.245491981506348, "global_step": 189578, "epoch": 4513} {"train_loss": -7.2420525550842285, "global_step": 189579, "epoch": 4513} {"train_loss": -7.199490547180176, "global_step": 189580, "epoch": 4513} {"train_loss": -7.190032958984375, "global_step": 189581, "epoch": 4513} {"train_loss": -7.292129039764404, "global_step": 189582, "epoch": 4513} {"train_loss": -7.228506088256836, "global_step": 189583, "epoch": 4513} {"train_loss": -7.221731662750244, "global_step": 189584, "epoch": 4513} {"train_loss": -7.204336166381836, "global_step": 189585, "epoch": 4513} {"train_loss": -7.273094654083252, "global_step": 189586, "epoch": 4513} {"train_loss": -7.1734727791377475, "global_step": 189587, "epoch": 4513, "val_loss": 68805.609375} {"train_loss": -7.213232040405273, "global_step": 189588, "epoch": 4514} {"train_loss": -7.208759307861328, "global_step": 189589, "epoch": 4514} {"train_loss": -7.1726789474487305, "global_step": 189590, "epoch": 4514} {"train_loss": -7.260536193847656, "global_step": 189591, "epoch": 4514} {"train_loss": -7.222529411315918, "global_step": 189592, "epoch": 4514} {"train_loss": -7.208459854125977, "global_step": 189593, "epoch": 4514} {"train_loss": -7.21829891204834, "global_step": 189594, "epoch": 4514} {"train_loss": -7.11751127243042, "global_step": 189595, "epoch": 4514} {"train_loss": -7.231207847595215, "global_step": 189596, "epoch": 4514} {"train_loss": -7.1785430908203125, "global_step": 189597, "epoch": 4514} {"train_loss": -7.156061172485352, "global_step": 189598, "epoch": 4514} {"train_loss": -7.239417552947998, "global_step": 189599, "epoch": 4514} {"train_loss": -7.1084208488464355, "global_step": 189600, "epoch": 4514} {"train_loss": -7.296818256378174, "global_step": 189601, "epoch": 4514} {"train_loss": -7.250661373138428, "global_step": 189602, "epoch": 4514} {"train_loss": -7.153354644775391, "global_step": 189603, "epoch": 4514} {"train_loss": -7.251241683959961, "global_step": 189604, "epoch": 4514} {"train_loss": -7.25237512588501, "global_step": 189605, "epoch": 4514} {"train_loss": -7.242243766784668, "global_step": 189606, "epoch": 4514} {"train_loss": -7.28045654296875, "global_step": 189607, "epoch": 4514} {"train_loss": -7.1786956787109375, "global_step": 189608, "epoch": 4514} {"train_loss": -7.243382453918457, "global_step": 189609, "epoch": 4514} {"train_loss": -7.1243205070495605, "global_step": 189610, "epoch": 4514} {"train_loss": -7.142037391662598, "global_step": 189611, "epoch": 4514} {"train_loss": -7.069021224975586, "global_step": 189612, "epoch": 4514} {"train_loss": -7.331371307373047, "global_step": 189613, "epoch": 4514} {"train_loss": -7.081425666809082, "global_step": 189614, "epoch": 4514} {"train_loss": -7.076141357421875, "global_step": 189615, "epoch": 4514} {"train_loss": -7.194289207458496, "global_step": 189616, "epoch": 4514} {"train_loss": -7.146411895751953, "global_step": 189617, "epoch": 4514} {"train_loss": -6.971166610717773, "global_step": 189618, "epoch": 4514} {"train_loss": -7.0667829513549805, "global_step": 189619, "epoch": 4514} {"train_loss": -7.079451560974121, "global_step": 189620, "epoch": 4514} {"train_loss": -7.060473442077637, "global_step": 189621, "epoch": 4514} {"train_loss": -7.0723772048950195, "global_step": 189622, "epoch": 4514} {"train_loss": -6.92916202545166, "global_step": 189623, "epoch": 4514} {"train_loss": -7.044214248657227, "global_step": 189624, "epoch": 4514} {"train_loss": -6.893305778503418, "global_step": 189625, "epoch": 4514} {"train_loss": -6.987145900726318, "global_step": 189626, "epoch": 4514} {"train_loss": -7.003008842468262, "global_step": 189627, "epoch": 4514} {"train_loss": -7.14915657043457, "global_step": 189628, "epoch": 4514} {"train_loss": -7.146966116768973, "global_step": 189629, "epoch": 4514, "val_loss": 68915.0546875} {"train_loss": -6.947610855102539, "global_step": 189630, "epoch": 4515} {"train_loss": -7.062535285949707, "global_step": 189631, "epoch": 4515} {"train_loss": -6.840785503387451, "global_step": 189632, "epoch": 4515} {"train_loss": -7.018911361694336, "global_step": 189633, "epoch": 4515} {"train_loss": -6.994567394256592, "global_step": 189634, "epoch": 4515} {"train_loss": -6.930227756500244, "global_step": 189635, "epoch": 4515} {"train_loss": -7.0120463371276855, "global_step": 189636, "epoch": 4515} {"train_loss": -6.950911998748779, "global_step": 189637, "epoch": 4515} {"train_loss": -6.953072547912598, "global_step": 189638, "epoch": 4515} {"train_loss": -7.077441215515137, "global_step": 189639, "epoch": 4515} {"train_loss": -7.040616512298584, "global_step": 189640, "epoch": 4515} {"train_loss": -7.0481672286987305, "global_step": 189641, "epoch": 4515} {"train_loss": -7.004644393920898, "global_step": 189642, "epoch": 4515} {"train_loss": -7.031582832336426, "global_step": 189643, "epoch": 4515} {"train_loss": -7.193408966064453, "global_step": 189644, "epoch": 4515} {"train_loss": -6.995102882385254, "global_step": 189645, "epoch": 4515} {"train_loss": -7.1339006423950195, "global_step": 189646, "epoch": 4515} {"train_loss": -6.964831829071045, "global_step": 189647, "epoch": 4515} {"train_loss": -7.107421398162842, "global_step": 189648, "epoch": 4515} {"train_loss": -7.0711774826049805, "global_step": 189649, "epoch": 4515} {"train_loss": -7.075782775878906, "global_step": 189650, "epoch": 4515} {"train_loss": -7.035490036010742, "global_step": 189651, "epoch": 4515} {"train_loss": -7.019285678863525, "global_step": 189652, "epoch": 4515} {"train_loss": -6.9812140464782715, "global_step": 189653, "epoch": 4515} {"train_loss": -7.102656841278076, "global_step": 189654, "epoch": 4515} {"train_loss": -7.213526725769043, "global_step": 189655, "epoch": 4515} {"train_loss": -7.054447174072266, "global_step": 189656, "epoch": 4515} {"train_loss": -7.166860103607178, "global_step": 189657, "epoch": 4515} {"train_loss": -6.830885410308838, "global_step": 189658, "epoch": 4515} {"train_loss": -7.1063432693481445, "global_step": 189659, "epoch": 4515} {"train_loss": -6.9462714195251465, "global_step": 189660, "epoch": 4515} {"train_loss": -7.075095176696777, "global_step": 189661, "epoch": 4515} {"train_loss": -7.059004783630371, "global_step": 189662, "epoch": 4515} {"train_loss": -7.120174407958984, "global_step": 189663, "epoch": 4515} {"train_loss": -6.9179487228393555, "global_step": 189664, "epoch": 4515} {"train_loss": -7.113088607788086, "global_step": 189665, "epoch": 4515} {"train_loss": -7.06974983215332, "global_step": 189666, "epoch": 4515} {"train_loss": -7.160383701324463, "global_step": 189667, "epoch": 4515} {"train_loss": -7.153399467468262, "global_step": 189668, "epoch": 4515} {"train_loss": -7.1440534591674805, "global_step": 189669, "epoch": 4515} {"train_loss": -7.207454204559326, "global_step": 189670, "epoch": 4515} {"train_loss": -7.050392218998501, "global_step": 189671, "epoch": 4515, "val_loss": 68810.296875} {"train_loss": -7.066926002502441, "global_step": 189672, "epoch": 4516} {"train_loss": -7.196083068847656, "global_step": 189673, "epoch": 4516} {"train_loss": -7.10958194732666, "global_step": 189674, "epoch": 4516} {"train_loss": -7.177718639373779, "global_step": 189675, "epoch": 4516} {"train_loss": -7.212695598602295, "global_step": 189676, "epoch": 4516} {"train_loss": -7.148190498352051, "global_step": 189677, "epoch": 4516} {"train_loss": -7.164628982543945, "global_step": 189678, "epoch": 4516} {"train_loss": -7.216891288757324, "global_step": 189679, "epoch": 4516} {"train_loss": -7.209585189819336, "global_step": 189680, "epoch": 4516} {"train_loss": -7.186526298522949, "global_step": 189681, "epoch": 4516} {"train_loss": -7.129822731018066, "global_step": 189682, "epoch": 4516} {"train_loss": -7.271125316619873, "global_step": 189683, "epoch": 4516} {"train_loss": -7.214811325073242, "global_step": 189684, "epoch": 4516} {"train_loss": -7.128704071044922, "global_step": 189685, "epoch": 4516} {"train_loss": -7.170018672943115, "global_step": 189686, "epoch": 4516} {"train_loss": -7.197719573974609, "global_step": 189687, "epoch": 4516} {"train_loss": -7.200680732727051, "global_step": 189688, "epoch": 4516} {"train_loss": -7.188129425048828, "global_step": 189689, "epoch": 4516} {"train_loss": -7.160998821258545, "global_step": 189690, "epoch": 4516} {"train_loss": -7.259946823120117, "global_step": 189691, "epoch": 4516} {"train_loss": -7.196671485900879, "global_step": 189692, "epoch": 4516} {"train_loss": -7.251835346221924, "global_step": 189693, "epoch": 4516} {"train_loss": -7.189868927001953, "global_step": 189694, "epoch": 4516} {"train_loss": -7.262813568115234, "global_step": 189695, "epoch": 4516} {"train_loss": -7.2389678955078125, "global_step": 189696, "epoch": 4516} {"train_loss": -7.17279052734375, "global_step": 189697, "epoch": 4516} {"train_loss": -7.209719181060791, "global_step": 189698, "epoch": 4516} {"train_loss": -7.136392116546631, "global_step": 189699, "epoch": 4516} {"train_loss": -7.10015869140625, "global_step": 189700, "epoch": 4516} {"train_loss": -7.222141265869141, "global_step": 189701, "epoch": 4516} {"train_loss": -7.273959159851074, "global_step": 189702, "epoch": 4516} {"train_loss": -7.320235252380371, "global_step": 189703, "epoch": 4516} {"train_loss": -7.225961685180664, "global_step": 189704, "epoch": 4516} {"train_loss": -7.328063011169434, "global_step": 189705, "epoch": 4516} {"train_loss": -7.255949974060059, "global_step": 189706, "epoch": 4516} {"train_loss": -7.124520301818848, "global_step": 189707, "epoch": 4516} {"train_loss": -7.1610307693481445, "global_step": 189708, "epoch": 4516} {"train_loss": -7.204261302947998, "global_step": 189709, "epoch": 4516} {"train_loss": -7.1856184005737305, "global_step": 189710, "epoch": 4516} {"train_loss": -7.196987152099609, "global_step": 189711, "epoch": 4516} {"train_loss": -7.265654563903809, "global_step": 189712, "epoch": 4516} {"train_loss": -7.194872958319528, "global_step": 189713, "epoch": 4516, "val_loss": 68816.515625} {"train_loss": -7.155760288238525, "global_step": 189714, "epoch": 4517} {"train_loss": -7.205828666687012, "global_step": 189715, "epoch": 4517} {"train_loss": -7.013509750366211, "global_step": 189716, "epoch": 4517} {"train_loss": -7.184828281402588, "global_step": 189717, "epoch": 4517} {"train_loss": -7.260227203369141, "global_step": 189718, "epoch": 4517} {"train_loss": -7.101889610290527, "global_step": 189719, "epoch": 4517} {"train_loss": -7.273099899291992, "global_step": 189720, "epoch": 4517} {"train_loss": -7.172853946685791, "global_step": 189721, "epoch": 4517} {"train_loss": -7.101327896118164, "global_step": 189722, "epoch": 4517} {"train_loss": -7.195001602172852, "global_step": 189723, "epoch": 4517} {"train_loss": -7.008027076721191, "global_step": 189724, "epoch": 4517} {"train_loss": -7.050693035125732, "global_step": 189725, "epoch": 4517} {"train_loss": -7.192300796508789, "global_step": 189726, "epoch": 4517} {"train_loss": -7.18774938583374, "global_step": 189727, "epoch": 4517} {"train_loss": -7.113386154174805, "global_step": 189728, "epoch": 4517} {"train_loss": -7.134311676025391, "global_step": 189729, "epoch": 4517} {"train_loss": -7.214686393737793, "global_step": 189730, "epoch": 4517} {"train_loss": -6.9347243309021, "global_step": 189731, "epoch": 4517} {"train_loss": -7.069109916687012, "global_step": 189732, "epoch": 4517} {"train_loss": -7.093131065368652, "global_step": 189733, "epoch": 4517} {"train_loss": -7.08358907699585, "global_step": 189734, "epoch": 4517} {"train_loss": -7.00788688659668, "global_step": 189735, "epoch": 4517} {"train_loss": -7.1087751388549805, "global_step": 189736, "epoch": 4517} {"train_loss": -7.127900123596191, "global_step": 189737, "epoch": 4517} {"train_loss": -7.128597259521484, "global_step": 189738, "epoch": 4517} {"train_loss": -7.1012725830078125, "global_step": 189739, "epoch": 4517} {"train_loss": -7.111461639404297, "global_step": 189740, "epoch": 4517} {"train_loss": -7.0725507736206055, "global_step": 189741, "epoch": 4517} {"train_loss": -7.1747541427612305, "global_step": 189742, "epoch": 4517} {"train_loss": -7.0858354568481445, "global_step": 189743, "epoch": 4517} {"train_loss": -7.0816240310668945, "global_step": 189744, "epoch": 4517} {"train_loss": -7.1027069091796875, "global_step": 189745, "epoch": 4517} {"train_loss": -6.992176055908203, "global_step": 189746, "epoch": 4517} {"train_loss": -7.154056072235107, "global_step": 189747, "epoch": 4517} {"train_loss": -7.14017915725708, "global_step": 189748, "epoch": 4517} {"train_loss": -7.145092964172363, "global_step": 189749, "epoch": 4517} {"train_loss": -7.120275497436523, "global_step": 189750, "epoch": 4517} {"train_loss": -7.118059158325195, "global_step": 189751, "epoch": 4517} {"train_loss": -7.210586071014404, "global_step": 189752, "epoch": 4517} {"train_loss": -7.122053146362305, "global_step": 189753, "epoch": 4517} {"train_loss": -7.17855167388916, "global_step": 189754, "epoch": 4517} {"train_loss": -7.119970889318557, "global_step": 189755, "epoch": 4517, "val_loss": 68947.765625} {"train_loss": -7.066072463989258, "global_step": 189756, "epoch": 4518} {"train_loss": -7.20944881439209, "global_step": 189757, "epoch": 4518} {"train_loss": -7.264235973358154, "global_step": 189758, "epoch": 4518} {"train_loss": -7.086889266967773, "global_step": 189759, "epoch": 4518} {"train_loss": -7.176146030426025, "global_step": 189760, "epoch": 4518} {"train_loss": -7.053067684173584, "global_step": 189761, "epoch": 4518} {"train_loss": -7.235159397125244, "global_step": 189762, "epoch": 4518} {"train_loss": -6.987872123718262, "global_step": 189763, "epoch": 4518} {"train_loss": -7.144755840301514, "global_step": 189764, "epoch": 4518} {"train_loss": -7.113623142242432, "global_step": 189765, "epoch": 4518} {"train_loss": -7.056248664855957, "global_step": 189766, "epoch": 4518} {"train_loss": -7.163568496704102, "global_step": 189767, "epoch": 4518} {"train_loss": -7.1589765548706055, "global_step": 189768, "epoch": 4518} {"train_loss": -7.153636932373047, "global_step": 189769, "epoch": 4518} {"train_loss": -7.109764575958252, "global_step": 189770, "epoch": 4518} {"train_loss": -7.057222366333008, "global_step": 189771, "epoch": 4518} {"train_loss": -7.182710647583008, "global_step": 189772, "epoch": 4518} {"train_loss": -7.234304428100586, "global_step": 189773, "epoch": 4518} {"train_loss": -7.219104290008545, "global_step": 189774, "epoch": 4518} {"train_loss": -7.084270477294922, "global_step": 189775, "epoch": 4518} {"train_loss": -7.189756393432617, "global_step": 189776, "epoch": 4518} {"train_loss": -7.159931659698486, "global_step": 189777, "epoch": 4518} {"train_loss": -7.1016740798950195, "global_step": 189778, "epoch": 4518} {"train_loss": -7.211326599121094, "global_step": 189779, "epoch": 4518} {"train_loss": -7.141969203948975, "global_step": 189780, "epoch": 4518} {"train_loss": -7.056073188781738, "global_step": 189781, "epoch": 4518} {"train_loss": -7.086718559265137, "global_step": 189782, "epoch": 4518} {"train_loss": -7.055307865142822, "global_step": 189783, "epoch": 4518} {"train_loss": -7.121011257171631, "global_step": 189784, "epoch": 4518} {"train_loss": -7.138327598571777, "global_step": 189785, "epoch": 4518} {"train_loss": -7.128127098083496, "global_step": 189786, "epoch": 4518} {"train_loss": -7.058590888977051, "global_step": 189787, "epoch": 4518} {"train_loss": -7.041154861450195, "global_step": 189788, "epoch": 4518} {"train_loss": -7.102204322814941, "global_step": 189789, "epoch": 4518} {"train_loss": -7.050203323364258, "global_step": 189790, "epoch": 4518} {"train_loss": -7.163159370422363, "global_step": 189791, "epoch": 4518} {"train_loss": -7.006742477416992, "global_step": 189792, "epoch": 4518} {"train_loss": -7.0950117111206055, "global_step": 189793, "epoch": 4518} {"train_loss": -7.178038597106934, "global_step": 189794, "epoch": 4518} {"train_loss": -7.036755561828613, "global_step": 189795, "epoch": 4518} {"train_loss": -7.090606212615967, "global_step": 189796, "epoch": 4518} {"train_loss": -7.122055394308908, "global_step": 189797, "epoch": 4518, "val_loss": 69114.5078125} {"train_loss": -7.071898460388184, "global_step": 189798, "epoch": 4519} {"train_loss": -7.2046685218811035, "global_step": 189799, "epoch": 4519} {"train_loss": -7.074414253234863, "global_step": 189800, "epoch": 4519} {"train_loss": -6.8650431632995605, "global_step": 189801, "epoch": 4519} {"train_loss": -7.023654460906982, "global_step": 189802, "epoch": 4519} {"train_loss": -7.067350387573242, "global_step": 189803, "epoch": 4519} {"train_loss": -7.108135223388672, "global_step": 189804, "epoch": 4519} {"train_loss": -7.031780242919922, "global_step": 189805, "epoch": 4519} {"train_loss": -7.090776443481445, "global_step": 189806, "epoch": 4519} {"train_loss": -7.039491176605225, "global_step": 189807, "epoch": 4519} {"train_loss": -7.164403915405273, "global_step": 189808, "epoch": 4519} {"train_loss": -7.114067077636719, "global_step": 189809, "epoch": 4519} {"train_loss": -6.977682590484619, "global_step": 189810, "epoch": 4519} {"train_loss": -7.134215831756592, "global_step": 189811, "epoch": 4519} {"train_loss": -7.080066680908203, "global_step": 189812, "epoch": 4519} {"train_loss": -7.200758934020996, "global_step": 189813, "epoch": 4519} {"train_loss": -7.170217990875244, "global_step": 189814, "epoch": 4519} {"train_loss": -7.168046951293945, "global_step": 189815, "epoch": 4519} {"train_loss": -7.109912395477295, "global_step": 189816, "epoch": 4519} {"train_loss": -7.081027030944824, "global_step": 189817, "epoch": 4519} {"train_loss": -7.047489166259766, "global_step": 189818, "epoch": 4519} {"train_loss": -7.105867385864258, "global_step": 189819, "epoch": 4519} {"train_loss": -7.187493324279785, "global_step": 189820, "epoch": 4519} {"train_loss": -7.1550397872924805, "global_step": 189821, "epoch": 4519} {"train_loss": -7.203534126281738, "global_step": 189822, "epoch": 4519} {"train_loss": -7.072759628295898, "global_step": 189823, "epoch": 4519} {"train_loss": -7.092804908752441, "global_step": 189824, "epoch": 4519} {"train_loss": -7.119411468505859, "global_step": 189825, "epoch": 4519} {"train_loss": -7.103989601135254, "global_step": 189826, "epoch": 4519} {"train_loss": -7.183038234710693, "global_step": 189827, "epoch": 4519} {"train_loss": -7.239536285400391, "global_step": 189828, "epoch": 4519} {"train_loss": -7.038046836853027, "global_step": 189829, "epoch": 4519} {"train_loss": -7.207508087158203, "global_step": 189830, "epoch": 4519} {"train_loss": -7.157960891723633, "global_step": 189831, "epoch": 4519} {"train_loss": -7.151281833648682, "global_step": 189832, "epoch": 4519} {"train_loss": -7.194165229797363, "global_step": 189833, "epoch": 4519} {"train_loss": -7.155312538146973, "global_step": 189834, "epoch": 4519} {"train_loss": -7.1042046546936035, "global_step": 189835, "epoch": 4519} {"train_loss": -7.187282562255859, "global_step": 189836, "epoch": 4519} {"train_loss": -7.1091413497924805, "global_step": 189837, "epoch": 4519} {"train_loss": -7.123291969299316, "global_step": 189838, "epoch": 4519} {"train_loss": -7.117322183790661, "global_step": 189839, "epoch": 4519, "val_loss": 68893.2265625} {"train_loss": -7.233954906463623, "global_step": 189840, "epoch": 4520} {"train_loss": -7.276121139526367, "global_step": 189841, "epoch": 4520} {"train_loss": -7.170590400695801, "global_step": 189842, "epoch": 4520} {"train_loss": -7.189857482910156, "global_step": 189843, "epoch": 4520} {"train_loss": -7.165261268615723, "global_step": 189844, "epoch": 4520} {"train_loss": -7.124826431274414, "global_step": 189845, "epoch": 4520} {"train_loss": -7.1799845695495605, "global_step": 189846, "epoch": 4520} {"train_loss": -7.07814359664917, "global_step": 189847, "epoch": 4520} {"train_loss": -7.190674781799316, "global_step": 189848, "epoch": 4520} {"train_loss": -7.177708625793457, "global_step": 189849, "epoch": 4520} {"train_loss": -7.078620910644531, "global_step": 189850, "epoch": 4520} {"train_loss": -7.132122993469238, "global_step": 189851, "epoch": 4520} {"train_loss": -7.143445014953613, "global_step": 189852, "epoch": 4520} {"train_loss": -7.165162563323975, "global_step": 189853, "epoch": 4520} {"train_loss": -7.195473670959473, "global_step": 189854, "epoch": 4520} {"train_loss": -7.084997653961182, "global_step": 189855, "epoch": 4520} {"train_loss": -7.184573173522949, "global_step": 189856, "epoch": 4520} {"train_loss": -7.1207427978515625, "global_step": 189857, "epoch": 4520} {"train_loss": -7.247272968292236, "global_step": 189858, "epoch": 4520} {"train_loss": -6.912421703338623, "global_step": 189859, "epoch": 4520} {"train_loss": -7.165064811706543, "global_step": 189860, "epoch": 4520} {"train_loss": -7.10465145111084, "global_step": 189861, "epoch": 4520} {"train_loss": -7.068137168884277, "global_step": 189862, "epoch": 4520} {"train_loss": -7.151680946350098, "global_step": 189863, "epoch": 4520} {"train_loss": -7.146047592163086, "global_step": 189864, "epoch": 4520} {"train_loss": -7.153188705444336, "global_step": 189865, "epoch": 4520} {"train_loss": -7.106784343719482, "global_step": 189866, "epoch": 4520} {"train_loss": -7.1385931968688965, "global_step": 189867, "epoch": 4520} {"train_loss": -7.199895858764648, "global_step": 189868, "epoch": 4520} {"train_loss": -7.145431041717529, "global_step": 189869, "epoch": 4520} {"train_loss": -7.080306053161621, "global_step": 189870, "epoch": 4520} {"train_loss": -7.113672256469727, "global_step": 189871, "epoch": 4520} {"train_loss": -6.962859153747559, "global_step": 189872, "epoch": 4520} {"train_loss": -7.0676751136779785, "global_step": 189873, "epoch": 4520} {"train_loss": -7.033592700958252, "global_step": 189874, "epoch": 4520} {"train_loss": -7.009339332580566, "global_step": 189875, "epoch": 4520} {"train_loss": -7.059632778167725, "global_step": 189876, "epoch": 4520} {"train_loss": -7.066658020019531, "global_step": 189877, "epoch": 4520} {"train_loss": -6.931723594665527, "global_step": 189878, "epoch": 4520} {"train_loss": -6.93277645111084, "global_step": 189879, "epoch": 4520} {"train_loss": -7.103065490722656, "global_step": 189880, "epoch": 4520} {"train_loss": -7.1176124186742875, "global_step": 189881, "epoch": 4520, "val_loss": 69241.4453125} {"train_loss": -7.088531494140625, "global_step": 189882, "epoch": 4521} {"train_loss": -7.106161117553711, "global_step": 189883, "epoch": 4521} {"train_loss": -7.156979560852051, "global_step": 189884, "epoch": 4521} {"train_loss": -7.155482292175293, "global_step": 189885, "epoch": 4521} {"train_loss": -7.16099214553833, "global_step": 189886, "epoch": 4521} {"train_loss": -7.089201927185059, "global_step": 189887, "epoch": 4521} {"train_loss": -7.084547519683838, "global_step": 189888, "epoch": 4521} {"train_loss": -7.118483543395996, "global_step": 189889, "epoch": 4521} {"train_loss": -7.213591575622559, "global_step": 189890, "epoch": 4521} {"train_loss": -7.150604724884033, "global_step": 189891, "epoch": 4521} {"train_loss": -7.185070037841797, "global_step": 189892, "epoch": 4521} {"train_loss": -7.043957710266113, "global_step": 189893, "epoch": 4521} {"train_loss": -7.275456428527832, "global_step": 189894, "epoch": 4521} {"train_loss": -7.044248580932617, "global_step": 189895, "epoch": 4521} {"train_loss": -7.209964752197266, "global_step": 189896, "epoch": 4521} {"train_loss": -7.171335220336914, "global_step": 189897, "epoch": 4521} {"train_loss": -7.166062831878662, "global_step": 189898, "epoch": 4521} {"train_loss": -7.206801891326904, "global_step": 189899, "epoch": 4521} {"train_loss": -7.180300712585449, "global_step": 189900, "epoch": 4521} {"train_loss": -7.148160457611084, "global_step": 189901, "epoch": 4521} {"train_loss": -7.3245463371276855, "global_step": 189902, "epoch": 4521} {"train_loss": -7.087155342102051, "global_step": 189903, "epoch": 4521} {"train_loss": -7.232722282409668, "global_step": 189904, "epoch": 4521} {"train_loss": -7.160884857177734, "global_step": 189905, "epoch": 4521} {"train_loss": -7.251389503479004, "global_step": 189906, "epoch": 4521} {"train_loss": -7.22776985168457, "global_step": 189907, "epoch": 4521} {"train_loss": -7.1650471687316895, "global_step": 189908, "epoch": 4521} {"train_loss": -7.318976402282715, "global_step": 189909, "epoch": 4521} {"train_loss": -7.160739898681641, "global_step": 189910, "epoch": 4521} {"train_loss": -7.152902603149414, "global_step": 189911, "epoch": 4521} {"train_loss": -7.233572006225586, "global_step": 189912, "epoch": 4521} {"train_loss": -7.197345733642578, "global_step": 189913, "epoch": 4521} {"train_loss": -7.210260391235352, "global_step": 189914, "epoch": 4521} {"train_loss": -7.236023426055908, "global_step": 189915, "epoch": 4521} {"train_loss": -7.12180233001709, "global_step": 189916, "epoch": 4521} {"train_loss": -7.220248699188232, "global_step": 189917, "epoch": 4521} {"train_loss": -7.2606587409973145, "global_step": 189918, "epoch": 4521} {"train_loss": -7.108057022094727, "global_step": 189919, "epoch": 4521} {"train_loss": -7.247553825378418, "global_step": 189920, "epoch": 4521} {"train_loss": -7.154192924499512, "global_step": 189921, "epoch": 4521} {"train_loss": -7.124275207519531, "global_step": 189922, "epoch": 4521} {"train_loss": -7.171989679336548, "global_step": 189923, "epoch": 4521, "val_loss": 69020.21875} {"train_loss": -7.254183769226074, "global_step": 189924, "epoch": 4522} {"train_loss": -7.135598182678223, "global_step": 189925, "epoch": 4522} {"train_loss": -7.255549430847168, "global_step": 189926, "epoch": 4522} {"train_loss": -7.204453468322754, "global_step": 189927, "epoch": 4522} {"train_loss": -7.125321865081787, "global_step": 189928, "epoch": 4522} {"train_loss": -7.201966762542725, "global_step": 189929, "epoch": 4522} {"train_loss": -7.298926830291748, "global_step": 189930, "epoch": 4522} {"train_loss": -7.1875224113464355, "global_step": 189931, "epoch": 4522} {"train_loss": -7.233537197113037, "global_step": 189932, "epoch": 4522} {"train_loss": -7.112207412719727, "global_step": 189933, "epoch": 4522} {"train_loss": -7.103833198547363, "global_step": 189934, "epoch": 4522} {"train_loss": -7.017383575439453, "global_step": 189935, "epoch": 4522} {"train_loss": -7.091213226318359, "global_step": 189936, "epoch": 4522} {"train_loss": -7.149113655090332, "global_step": 189937, "epoch": 4522} {"train_loss": -7.035711288452148, "global_step": 189938, "epoch": 4522} {"train_loss": -7.11415433883667, "global_step": 189939, "epoch": 4522} {"train_loss": -7.13605260848999, "global_step": 189940, "epoch": 4522} {"train_loss": -7.178073406219482, "global_step": 189941, "epoch": 4522} {"train_loss": -7.218108177185059, "global_step": 189942, "epoch": 4522} {"train_loss": -7.24580192565918, "global_step": 189943, "epoch": 4522} {"train_loss": -7.217114448547363, "global_step": 189944, "epoch": 4522} {"train_loss": -7.150759696960449, "global_step": 189945, "epoch": 4522} {"train_loss": -7.177559852600098, "global_step": 189946, "epoch": 4522} {"train_loss": -7.006002426147461, "global_step": 189947, "epoch": 4522} {"train_loss": -7.100250244140625, "global_step": 189948, "epoch": 4522} {"train_loss": -7.134407043457031, "global_step": 189949, "epoch": 4522} {"train_loss": -7.124056816101074, "global_step": 189950, "epoch": 4522} {"train_loss": -7.136075973510742, "global_step": 189951, "epoch": 4522} {"train_loss": -7.064692497253418, "global_step": 189952, "epoch": 4522} {"train_loss": -7.06046199798584, "global_step": 189953, "epoch": 4522} {"train_loss": -7.263408660888672, "global_step": 189954, "epoch": 4522} {"train_loss": -7.074563026428223, "global_step": 189955, "epoch": 4522} {"train_loss": -7.165521621704102, "global_step": 189956, "epoch": 4522} {"train_loss": -7.115900039672852, "global_step": 189957, "epoch": 4522} {"train_loss": -7.101199150085449, "global_step": 189958, "epoch": 4522} {"train_loss": -7.099340438842773, "global_step": 189959, "epoch": 4522} {"train_loss": -7.188364505767822, "global_step": 189960, "epoch": 4522} {"train_loss": -7.092405319213867, "global_step": 189961, "epoch": 4522} {"train_loss": -7.242770195007324, "global_step": 189962, "epoch": 4522} {"train_loss": -7.1313676834106445, "global_step": 189963, "epoch": 4522} {"train_loss": -7.2075958251953125, "global_step": 189964, "epoch": 4522} {"train_loss": -7.151330981935773, "global_step": 189965, "epoch": 4522, "val_loss": 68842.125} {"train_loss": -7.210808753967285, "global_step": 189966, "epoch": 4523} {"train_loss": -7.205692291259766, "global_step": 189967, "epoch": 4523} {"train_loss": -7.130896091461182, "global_step": 189968, "epoch": 4523} {"train_loss": -7.198094367980957, "global_step": 189969, "epoch": 4523} {"train_loss": -7.2451324462890625, "global_step": 189970, "epoch": 4523} {"train_loss": -7.145986557006836, "global_step": 189971, "epoch": 4523} {"train_loss": -7.339469909667969, "global_step": 189972, "epoch": 4523} {"train_loss": -7.044342041015625, "global_step": 189973, "epoch": 4523} {"train_loss": -7.163002014160156, "global_step": 189974, "epoch": 4523} {"train_loss": -7.164013862609863, "global_step": 189975, "epoch": 4523} {"train_loss": -7.196606636047363, "global_step": 189976, "epoch": 4523} {"train_loss": -7.102575302124023, "global_step": 189977, "epoch": 4523} {"train_loss": -7.128310203552246, "global_step": 189978, "epoch": 4523} {"train_loss": -7.156661033630371, "global_step": 189979, "epoch": 4523} {"train_loss": -7.134103775024414, "global_step": 189980, "epoch": 4523} {"train_loss": -7.221807479858398, "global_step": 189981, "epoch": 4523} {"train_loss": -7.059507369995117, "global_step": 189982, "epoch": 4523} {"train_loss": -7.164407730102539, "global_step": 189983, "epoch": 4523} {"train_loss": -7.1215009689331055, "global_step": 189984, "epoch": 4523} {"train_loss": -7.129194736480713, "global_step": 189985, "epoch": 4523} {"train_loss": -7.1091508865356445, "global_step": 189986, "epoch": 4523} {"train_loss": -7.251646041870117, "global_step": 189987, "epoch": 4523} {"train_loss": -7.057960033416748, "global_step": 189988, "epoch": 4523} {"train_loss": -7.071048736572266, "global_step": 189989, "epoch": 4523} {"train_loss": -7.107985496520996, "global_step": 189990, "epoch": 4523} {"train_loss": -7.142727375030518, "global_step": 189991, "epoch": 4523} {"train_loss": -7.168071269989014, "global_step": 189992, "epoch": 4523} {"train_loss": -7.049960613250732, "global_step": 189993, "epoch": 4523} {"train_loss": -7.348575592041016, "global_step": 189994, "epoch": 4523} {"train_loss": -7.076621055603027, "global_step": 189995, "epoch": 4523} {"train_loss": -7.174774169921875, "global_step": 189996, "epoch": 4523} {"train_loss": -7.149681091308594, "global_step": 189997, "epoch": 4523} {"train_loss": -7.029994964599609, "global_step": 189998, "epoch": 4523} {"train_loss": -7.118321418762207, "global_step": 189999, "epoch": 4523} {"train_loss": -7.140894889831543, "global_step": 190000, "epoch": 4523} {"train_loss": -7.109681129455566, "global_step": 190001, "epoch": 4523} {"train_loss": -7.129886150360107, "global_step": 190002, "epoch": 4523} {"train_loss": -7.039829254150391, "global_step": 190003, "epoch": 4523} {"train_loss": -7.003530502319336, "global_step": 190004, "epoch": 4523} {"train_loss": -7.117238998413086, "global_step": 190005, "epoch": 4523} {"train_loss": -7.109886169433594, "global_step": 190006, "epoch": 4523} {"train_loss": -7.142479362941923, "global_step": 190007, "epoch": 4523, "val_loss": 68864.2421875} {"train_loss": -7.1648478507995605, "global_step": 190008, "epoch": 4524} {"train_loss": -7.1164960861206055, "global_step": 190009, "epoch": 4524} {"train_loss": -7.17002010345459, "global_step": 190010, "epoch": 4524} {"train_loss": -7.2094316482543945, "global_step": 190011, "epoch": 4524} {"train_loss": -7.129025459289551, "global_step": 190012, "epoch": 4524} {"train_loss": -7.162632942199707, "global_step": 190013, "epoch": 4524} {"train_loss": -7.032914161682129, "global_step": 190014, "epoch": 4524} {"train_loss": -7.105495452880859, "global_step": 190015, "epoch": 4524} {"train_loss": -7.118561267852783, "global_step": 190016, "epoch": 4524} {"train_loss": -7.086282730102539, "global_step": 190017, "epoch": 4524} {"train_loss": -7.030417442321777, "global_step": 190018, "epoch": 4524} {"train_loss": -7.154221534729004, "global_step": 190019, "epoch": 4524} {"train_loss": -7.092693328857422, "global_step": 190020, "epoch": 4524} {"train_loss": -7.094444274902344, "global_step": 190021, "epoch": 4524} {"train_loss": -7.285894393920898, "global_step": 190022, "epoch": 4524} {"train_loss": -7.133537769317627, "global_step": 190023, "epoch": 4524} {"train_loss": -7.070497512817383, "global_step": 190024, "epoch": 4524} {"train_loss": -7.235161781311035, "global_step": 190025, "epoch": 4524} {"train_loss": -7.134446144104004, "global_step": 190026, "epoch": 4524} {"train_loss": -7.109072208404541, "global_step": 190027, "epoch": 4524} {"train_loss": -7.216130256652832, "global_step": 190028, "epoch": 4524} {"train_loss": -7.106042861938477, "global_step": 190029, "epoch": 4524} {"train_loss": -7.1346588134765625, "global_step": 190030, "epoch": 4524} {"train_loss": -7.283164024353027, "global_step": 190031, "epoch": 4524} {"train_loss": -7.075597763061523, "global_step": 190032, "epoch": 4524} {"train_loss": -7.199543476104736, "global_step": 190033, "epoch": 4524} {"train_loss": -7.221249103546143, "global_step": 190034, "epoch": 4524} {"train_loss": -7.202946186065674, "global_step": 190035, "epoch": 4524} {"train_loss": -7.095892906188965, "global_step": 190036, "epoch": 4524} {"train_loss": -7.156140327453613, "global_step": 190037, "epoch": 4524} {"train_loss": -7.15183162689209, "global_step": 190038, "epoch": 4524} {"train_loss": -7.177488327026367, "global_step": 190039, "epoch": 4524} {"train_loss": -7.178593635559082, "global_step": 190040, "epoch": 4524} {"train_loss": -7.127017021179199, "global_step": 190041, "epoch": 4524} {"train_loss": -7.212917804718018, "global_step": 190042, "epoch": 4524} {"train_loss": -7.246588706970215, "global_step": 190043, "epoch": 4524} {"train_loss": -7.127324104309082, "global_step": 190044, "epoch": 4524} {"train_loss": -7.139106273651123, "global_step": 190045, "epoch": 4524} {"train_loss": -7.1022844314575195, "global_step": 190046, "epoch": 4524} {"train_loss": -7.089141845703125, "global_step": 190047, "epoch": 4524} {"train_loss": -7.159454345703125, "global_step": 190048, "epoch": 4524} {"train_loss": -7.143132834207444, "global_step": 190049, "epoch": 4524, "val_loss": 69004.171875} {"train_loss": -7.144580841064453, "global_step": 190050, "epoch": 4525} {"train_loss": -7.165744781494141, "global_step": 190051, "epoch": 4525} {"train_loss": -7.008678913116455, "global_step": 190052, "epoch": 4525} {"train_loss": -7.142703533172607, "global_step": 190053, "epoch": 4525} {"train_loss": -7.230340480804443, "global_step": 190054, "epoch": 4525} {"train_loss": -7.097198486328125, "global_step": 190055, "epoch": 4525} {"train_loss": -7.055535316467285, "global_step": 190056, "epoch": 4525} {"train_loss": -7.050265312194824, "global_step": 190057, "epoch": 4525} {"train_loss": -7.225369453430176, "global_step": 190058, "epoch": 4525} {"train_loss": -7.149028778076172, "global_step": 190059, "epoch": 4525} {"train_loss": -6.9904375076293945, "global_step": 190060, "epoch": 4525} {"train_loss": -7.166691780090332, "global_step": 190061, "epoch": 4525} {"train_loss": -7.121976852416992, "global_step": 190062, "epoch": 4525} {"train_loss": -7.1468095779418945, "global_step": 190063, "epoch": 4525} {"train_loss": -7.139045715332031, "global_step": 190064, "epoch": 4525} {"train_loss": -7.030048370361328, "global_step": 190065, "epoch": 4525} {"train_loss": -7.06221866607666, "global_step": 190066, "epoch": 4525} {"train_loss": -7.211587429046631, "global_step": 190067, "epoch": 4525} {"train_loss": -7.193584442138672, "global_step": 190068, "epoch": 4525} {"train_loss": -7.07059383392334, "global_step": 190069, "epoch": 4525} {"train_loss": -7.04494571685791, "global_step": 190070, "epoch": 4525} {"train_loss": -7.06545352935791, "global_step": 190071, "epoch": 4525} {"train_loss": -7.169994831085205, "global_step": 190072, "epoch": 4525} {"train_loss": -7.126077175140381, "global_step": 190073, "epoch": 4525} {"train_loss": -7.116423606872559, "global_step": 190074, "epoch": 4525} {"train_loss": -7.146607398986816, "global_step": 190075, "epoch": 4525} {"train_loss": -7.0603532791137695, "global_step": 190076, "epoch": 4525} {"train_loss": -7.193351745605469, "global_step": 190077, "epoch": 4525} {"train_loss": -7.107906341552734, "global_step": 190078, "epoch": 4525} {"train_loss": -7.11906623840332, "global_step": 190079, "epoch": 4525} {"train_loss": -7.173867225646973, "global_step": 190080, "epoch": 4525} {"train_loss": -7.1287736892700195, "global_step": 190081, "epoch": 4525} {"train_loss": -7.096604347229004, "global_step": 190082, "epoch": 4525} {"train_loss": -7.218216896057129, "global_step": 190083, "epoch": 4525} {"train_loss": -7.243596076965332, "global_step": 190084, "epoch": 4525} {"train_loss": -7.098111152648926, "global_step": 190085, "epoch": 4525} {"train_loss": -7.25779914855957, "global_step": 190086, "epoch": 4525} {"train_loss": -7.166821479797363, "global_step": 190087, "epoch": 4525} {"train_loss": -7.167657852172852, "global_step": 190088, "epoch": 4525} {"train_loss": -7.208837032318115, "global_step": 190089, "epoch": 4525} {"train_loss": -7.13679313659668, "global_step": 190090, "epoch": 4525} {"train_loss": -7.13234231585548, "global_step": 190091, "epoch": 4525, "val_loss": 68761.296875} {"train_loss": -7.205593585968018, "global_step": 190092, "epoch": 4526} {"train_loss": -7.191237926483154, "global_step": 190093, "epoch": 4526} {"train_loss": -7.040712356567383, "global_step": 190094, "epoch": 4526} {"train_loss": -7.164299488067627, "global_step": 190095, "epoch": 4526} {"train_loss": -7.217913627624512, "global_step": 190096, "epoch": 4526} {"train_loss": -7.162092208862305, "global_step": 190097, "epoch": 4526} {"train_loss": -7.176997184753418, "global_step": 190098, "epoch": 4526} {"train_loss": -7.10736608505249, "global_step": 190099, "epoch": 4526} {"train_loss": -7.1390485763549805, "global_step": 190100, "epoch": 4526} {"train_loss": -7.014745235443115, "global_step": 190101, "epoch": 4526} {"train_loss": -7.087569713592529, "global_step": 190102, "epoch": 4526} {"train_loss": -7.096341133117676, "global_step": 190103, "epoch": 4526} {"train_loss": -7.102378845214844, "global_step": 190104, "epoch": 4526} {"train_loss": -7.041868209838867, "global_step": 190105, "epoch": 4526} {"train_loss": -7.094742298126221, "global_step": 190106, "epoch": 4526} {"train_loss": -7.1445817947387695, "global_step": 190107, "epoch": 4526} {"train_loss": -7.16556453704834, "global_step": 190108, "epoch": 4526} {"train_loss": -7.112224578857422, "global_step": 190109, "epoch": 4526} {"train_loss": -7.192535400390625, "global_step": 190110, "epoch": 4526} {"train_loss": -6.973505973815918, "global_step": 190111, "epoch": 4526} {"train_loss": -7.148308753967285, "global_step": 190112, "epoch": 4526} {"train_loss": -7.133644104003906, "global_step": 190113, "epoch": 4526} {"train_loss": -7.167108058929443, "global_step": 190114, "epoch": 4526} {"train_loss": -7.143144607543945, "global_step": 190115, "epoch": 4526} {"train_loss": -7.054974555969238, "global_step": 190116, "epoch": 4526} {"train_loss": -7.169950008392334, "global_step": 190117, "epoch": 4526} {"train_loss": -7.116386413574219, "global_step": 190118, "epoch": 4526} {"train_loss": -6.910772323608398, "global_step": 190119, "epoch": 4526} {"train_loss": -7.065711975097656, "global_step": 190120, "epoch": 4526} {"train_loss": -6.996397495269775, "global_step": 190121, "epoch": 4526} {"train_loss": -7.124373435974121, "global_step": 190122, "epoch": 4526} {"train_loss": -7.111420631408691, "global_step": 190123, "epoch": 4526} {"train_loss": -7.110415458679199, "global_step": 190124, "epoch": 4526} {"train_loss": -7.196002960205078, "global_step": 190125, "epoch": 4526} {"train_loss": -7.099126815795898, "global_step": 190126, "epoch": 4526} {"train_loss": -6.998323440551758, "global_step": 190127, "epoch": 4526} {"train_loss": -7.167122840881348, "global_step": 190128, "epoch": 4526} {"train_loss": -7.191451072692871, "global_step": 190129, "epoch": 4526} {"train_loss": -7.14980936050415, "global_step": 190130, "epoch": 4526} {"train_loss": -7.155747413635254, "global_step": 190131, "epoch": 4526} {"train_loss": -7.201837062835693, "global_step": 190132, "epoch": 4526} {"train_loss": -7.117944706053961, "global_step": 190133, "epoch": 4526, "val_loss": 68752.625} {"train_loss": -7.138871192932129, "global_step": 190134, "epoch": 4527} {"train_loss": -7.187150955200195, "global_step": 190135, "epoch": 4527} {"train_loss": -7.086745262145996, "global_step": 190136, "epoch": 4527} {"train_loss": -7.1916046142578125, "global_step": 190137, "epoch": 4527} {"train_loss": -7.136734962463379, "global_step": 190138, "epoch": 4527} {"train_loss": -7.221255302429199, "global_step": 190139, "epoch": 4527} {"train_loss": -7.152753829956055, "global_step": 190140, "epoch": 4527} {"train_loss": -7.124168395996094, "global_step": 190141, "epoch": 4527} {"train_loss": -7.221257209777832, "global_step": 190142, "epoch": 4527} {"train_loss": -7.087059020996094, "global_step": 190143, "epoch": 4527} {"train_loss": -7.004110336303711, "global_step": 190144, "epoch": 4527} {"train_loss": -6.998943328857422, "global_step": 190145, "epoch": 4527} {"train_loss": -7.179708480834961, "global_step": 190146, "epoch": 4527} {"train_loss": -7.135065078735352, "global_step": 190147, "epoch": 4527} {"train_loss": -7.078254699707031, "global_step": 190148, "epoch": 4527} {"train_loss": -7.091403961181641, "global_step": 190149, "epoch": 4527} {"train_loss": -7.074966907501221, "global_step": 190150, "epoch": 4527} {"train_loss": -7.0821919441223145, "global_step": 190151, "epoch": 4527} {"train_loss": -7.192022800445557, "global_step": 190152, "epoch": 4527} {"train_loss": -7.0670647621154785, "global_step": 190153, "epoch": 4527} {"train_loss": -7.105765342712402, "global_step": 190154, "epoch": 4527} {"train_loss": -7.1006035804748535, "global_step": 190155, "epoch": 4527} {"train_loss": -7.199007987976074, "global_step": 190156, "epoch": 4527} {"train_loss": -7.162542819976807, "global_step": 190157, "epoch": 4527} {"train_loss": -7.14778995513916, "global_step": 190158, "epoch": 4527} {"train_loss": -7.2061076164245605, "global_step": 190159, "epoch": 4527} {"train_loss": -7.129239559173584, "global_step": 190160, "epoch": 4527} {"train_loss": -7.048394203186035, "global_step": 190161, "epoch": 4527} {"train_loss": -7.06588077545166, "global_step": 190162, "epoch": 4527} {"train_loss": -7.199361801147461, "global_step": 190163, "epoch": 4527} {"train_loss": -7.092266082763672, "global_step": 190164, "epoch": 4527} {"train_loss": -7.13541316986084, "global_step": 190165, "epoch": 4527} {"train_loss": -7.2730817794799805, "global_step": 190166, "epoch": 4527} {"train_loss": -7.0166521072387695, "global_step": 190167, "epoch": 4527} {"train_loss": -7.081375598907471, "global_step": 190168, "epoch": 4527} {"train_loss": -6.959884166717529, "global_step": 190169, "epoch": 4527} {"train_loss": -7.028253078460693, "global_step": 190170, "epoch": 4527} {"train_loss": -7.222090244293213, "global_step": 190171, "epoch": 4527} {"train_loss": -7.045562744140625, "global_step": 190172, "epoch": 4527} {"train_loss": -7.106769561767578, "global_step": 190173, "epoch": 4527} {"train_loss": -7.1796956062316895, "global_step": 190174, "epoch": 4527} {"train_loss": -7.120821827933902, "global_step": 190175, "epoch": 4527, "val_loss": 69006.28125} {"train_loss": -7.265056133270264, "global_step": 190176, "epoch": 4528} {"train_loss": -7.055384159088135, "global_step": 190177, "epoch": 4528} {"train_loss": -7.096571922302246, "global_step": 190178, "epoch": 4528} {"train_loss": -7.163186073303223, "global_step": 190179, "epoch": 4528} {"train_loss": -7.065916061401367, "global_step": 190180, "epoch": 4528} {"train_loss": -7.235790729522705, "global_step": 190181, "epoch": 4528} {"train_loss": -7.203601837158203, "global_step": 190182, "epoch": 4528} {"train_loss": -7.201638221740723, "global_step": 190183, "epoch": 4528} {"train_loss": -7.170215606689453, "global_step": 190184, "epoch": 4528} {"train_loss": -7.254685878753662, "global_step": 190185, "epoch": 4528} {"train_loss": -7.176054000854492, "global_step": 190186, "epoch": 4528} {"train_loss": -7.0849714279174805, "global_step": 190187, "epoch": 4528} {"train_loss": -7.073918342590332, "global_step": 190188, "epoch": 4528} {"train_loss": -7.226827621459961, "global_step": 190189, "epoch": 4528} {"train_loss": -7.219213962554932, "global_step": 190190, "epoch": 4528} {"train_loss": -7.187028884887695, "global_step": 190191, "epoch": 4528} {"train_loss": -7.203615188598633, "global_step": 190192, "epoch": 4528} {"train_loss": -7.161645412445068, "global_step": 190193, "epoch": 4528} {"train_loss": -7.28031063079834, "global_step": 190194, "epoch": 4528} {"train_loss": -7.114614963531494, "global_step": 190195, "epoch": 4528} {"train_loss": -7.109493255615234, "global_step": 190196, "epoch": 4528} {"train_loss": -7.189483642578125, "global_step": 190197, "epoch": 4528} {"train_loss": -7.161801815032959, "global_step": 190198, "epoch": 4528} {"train_loss": -7.150153160095215, "global_step": 190199, "epoch": 4528} {"train_loss": -7.231227874755859, "global_step": 190200, "epoch": 4528} {"train_loss": -7.170318603515625, "global_step": 190201, "epoch": 4528} {"train_loss": -7.18310546875, "global_step": 190202, "epoch": 4528} {"train_loss": -7.217080116271973, "global_step": 190203, "epoch": 4528} {"train_loss": -7.176916122436523, "global_step": 190204, "epoch": 4528} {"train_loss": -7.048825263977051, "global_step": 190205, "epoch": 4528} {"train_loss": -7.105253219604492, "global_step": 190206, "epoch": 4528} {"train_loss": -7.161595344543457, "global_step": 190207, "epoch": 4528} {"train_loss": -7.275697231292725, "global_step": 190208, "epoch": 4528} {"train_loss": -7.236630916595459, "global_step": 190209, "epoch": 4528} {"train_loss": -7.17389440536499, "global_step": 190210, "epoch": 4528} {"train_loss": -7.259101867675781, "global_step": 190211, "epoch": 4528} {"train_loss": -7.193868637084961, "global_step": 190212, "epoch": 4528} {"train_loss": -7.1070451736450195, "global_step": 190213, "epoch": 4528} {"train_loss": -7.189140319824219, "global_step": 190214, "epoch": 4528} {"train_loss": -7.090416431427002, "global_step": 190215, "epoch": 4528} {"train_loss": -7.029788970947266, "global_step": 190216, "epoch": 4528} {"train_loss": -7.167568479265485, "global_step": 190217, "epoch": 4528, "val_loss": 68881.21875} {"train_loss": -7.209593772888184, "global_step": 190218, "epoch": 4529} {"train_loss": -7.073151111602783, "global_step": 190219, "epoch": 4529} {"train_loss": -7.22896146774292, "global_step": 190220, "epoch": 4529} {"train_loss": -7.171344757080078, "global_step": 190221, "epoch": 4529} {"train_loss": -7.1567606925964355, "global_step": 190222, "epoch": 4529} {"train_loss": -7.118664741516113, "global_step": 190223, "epoch": 4529} {"train_loss": -7.325264930725098, "global_step": 190224, "epoch": 4529} {"train_loss": -7.209722518920898, "global_step": 190225, "epoch": 4529} {"train_loss": -7.084683418273926, "global_step": 190226, "epoch": 4529} {"train_loss": -7.095914840698242, "global_step": 190227, "epoch": 4529} {"train_loss": -7.151252746582031, "global_step": 190228, "epoch": 4529} {"train_loss": -7.167336463928223, "global_step": 190229, "epoch": 4529} {"train_loss": -7.007872581481934, "global_step": 190230, "epoch": 4529} {"train_loss": -7.202404975891113, "global_step": 190231, "epoch": 4529} {"train_loss": -7.226273059844971, "global_step": 190232, "epoch": 4529} {"train_loss": -7.207046031951904, "global_step": 190233, "epoch": 4529} {"train_loss": -7.103794097900391, "global_step": 190234, "epoch": 4529} {"train_loss": -7.093070030212402, "global_step": 190235, "epoch": 4529} {"train_loss": -7.075652122497559, "global_step": 190236, "epoch": 4529} {"train_loss": -7.083504676818848, "global_step": 190237, "epoch": 4529} {"train_loss": -7.248161315917969, "global_step": 190238, "epoch": 4529} {"train_loss": -7.289588451385498, "global_step": 190239, "epoch": 4529} {"train_loss": -7.191342830657959, "global_step": 190240, "epoch": 4529} {"train_loss": -7.088775157928467, "global_step": 190241, "epoch": 4529} {"train_loss": -7.1462507247924805, "global_step": 190242, "epoch": 4529} {"train_loss": -7.0682759284973145, "global_step": 190243, "epoch": 4529} {"train_loss": -7.149097919464111, "global_step": 190244, "epoch": 4529} {"train_loss": -7.202417373657227, "global_step": 190245, "epoch": 4529} {"train_loss": -7.10070276260376, "global_step": 190246, "epoch": 4529} {"train_loss": -7.211093902587891, "global_step": 190247, "epoch": 4529} {"train_loss": -7.154575347900391, "global_step": 190248, "epoch": 4529} {"train_loss": -7.160406589508057, "global_step": 190249, "epoch": 4529} {"train_loss": -7.033797264099121, "global_step": 190250, "epoch": 4529} {"train_loss": -7.170496940612793, "global_step": 190251, "epoch": 4529} {"train_loss": -7.178815841674805, "global_step": 190252, "epoch": 4529} {"train_loss": -7.167476654052734, "global_step": 190253, "epoch": 4529} {"train_loss": -7.205436706542969, "global_step": 190254, "epoch": 4529} {"train_loss": -7.121098518371582, "global_step": 190255, "epoch": 4529} {"train_loss": -7.136608123779297, "global_step": 190256, "epoch": 4529} {"train_loss": -7.178982734680176, "global_step": 190257, "epoch": 4529} {"train_loss": -7.17119836807251, "global_step": 190258, "epoch": 4529} {"train_loss": -7.155748231070382, "global_step": 190259, "epoch": 4529, "val_loss": 68824.8984375} {"train_loss": -7.176584243774414, "global_step": 190260, "epoch": 4530} {"train_loss": -7.199986457824707, "global_step": 190261, "epoch": 4530} {"train_loss": -6.910007476806641, "global_step": 190262, "epoch": 4530} {"train_loss": -7.112667083740234, "global_step": 190263, "epoch": 4530} {"train_loss": -7.088355541229248, "global_step": 190264, "epoch": 4530} {"train_loss": -6.9890031814575195, "global_step": 190265, "epoch": 4530} {"train_loss": -7.117415428161621, "global_step": 190266, "epoch": 4530} {"train_loss": -7.097344398498535, "global_step": 190267, "epoch": 4530} {"train_loss": -7.162383079528809, "global_step": 190268, "epoch": 4530} {"train_loss": -7.076648712158203, "global_step": 190269, "epoch": 4530} {"train_loss": -6.9197797775268555, "global_step": 190270, "epoch": 4530} {"train_loss": -7.17230224609375, "global_step": 190271, "epoch": 4530} {"train_loss": -7.0637712478637695, "global_step": 190272, "epoch": 4530} {"train_loss": -6.978292942047119, "global_step": 190273, "epoch": 4530} {"train_loss": -7.169679164886475, "global_step": 190274, "epoch": 4530} {"train_loss": -7.174737930297852, "global_step": 190275, "epoch": 4530} {"train_loss": -7.049811363220215, "global_step": 190276, "epoch": 4530} {"train_loss": -7.224102973937988, "global_step": 190277, "epoch": 4530} {"train_loss": -7.203892707824707, "global_step": 190278, "epoch": 4530} {"train_loss": -7.1533708572387695, "global_step": 190279, "epoch": 4530} {"train_loss": -7.063475131988525, "global_step": 190280, "epoch": 4530} {"train_loss": -7.154260635375977, "global_step": 190281, "epoch": 4530} {"train_loss": -7.158430099487305, "global_step": 190282, "epoch": 4530} {"train_loss": -7.168437480926514, "global_step": 190283, "epoch": 4530} {"train_loss": -7.170829772949219, "global_step": 190284, "epoch": 4530} {"train_loss": -7.09246826171875, "global_step": 190285, "epoch": 4530} {"train_loss": -7.219608306884766, "global_step": 190286, "epoch": 4530} {"train_loss": -7.075969696044922, "global_step": 190287, "epoch": 4530} {"train_loss": -7.163973808288574, "global_step": 190288, "epoch": 4530} {"train_loss": -7.268634796142578, "global_step": 190289, "epoch": 4530} {"train_loss": -7.233236312866211, "global_step": 190290, "epoch": 4530} {"train_loss": -7.1587018966674805, "global_step": 190291, "epoch": 4530} {"train_loss": -7.172032833099365, "global_step": 190292, "epoch": 4530} {"train_loss": -7.216592788696289, "global_step": 190293, "epoch": 4530} {"train_loss": -7.13474178314209, "global_step": 190294, "epoch": 4530} {"train_loss": -7.329077243804932, "global_step": 190295, "epoch": 4530} {"train_loss": -7.18582820892334, "global_step": 190296, "epoch": 4530} {"train_loss": -7.278227806091309, "global_step": 190297, "epoch": 4530} {"train_loss": -7.2373785972595215, "global_step": 190298, "epoch": 4530} {"train_loss": -7.248754501342773, "global_step": 190299, "epoch": 4530} {"train_loss": -7.110718727111816, "global_step": 190300, "epoch": 4530} {"train_loss": -7.142917462757656, "global_step": 190301, "epoch": 4530, "val_loss": 68778.1875} {"train_loss": -7.30564546585083, "global_step": 190302, "epoch": 4531} {"train_loss": -7.099769592285156, "global_step": 190303, "epoch": 4531} {"train_loss": -7.178929328918457, "global_step": 190304, "epoch": 4531} {"train_loss": -7.3368425369262695, "global_step": 190305, "epoch": 4531} {"train_loss": -7.140069961547852, "global_step": 190306, "epoch": 4531} {"train_loss": -7.18137264251709, "global_step": 190307, "epoch": 4531} {"train_loss": -7.281191825866699, "global_step": 190308, "epoch": 4531} {"train_loss": -7.28499698638916, "global_step": 190309, "epoch": 4531} {"train_loss": -7.163620948791504, "global_step": 190310, "epoch": 4531} {"train_loss": -7.197328567504883, "global_step": 190311, "epoch": 4531} {"train_loss": -7.052864074707031, "global_step": 190312, "epoch": 4531} {"train_loss": -7.160470008850098, "global_step": 190313, "epoch": 4531} {"train_loss": -7.159188747406006, "global_step": 190314, "epoch": 4531} {"train_loss": -7.040668487548828, "global_step": 190315, "epoch": 4531} {"train_loss": -7.127067565917969, "global_step": 190316, "epoch": 4531} {"train_loss": -7.227391242980957, "global_step": 190317, "epoch": 4531} {"train_loss": -7.057824611663818, "global_step": 190318, "epoch": 4531} {"train_loss": -7.226227283477783, "global_step": 190319, "epoch": 4531} {"train_loss": -7.193795680999756, "global_step": 190320, "epoch": 4531} {"train_loss": -7.098930358886719, "global_step": 190321, "epoch": 4531} {"train_loss": -7.10222053527832, "global_step": 190322, "epoch": 4531} {"train_loss": -7.132527828216553, "global_step": 190323, "epoch": 4531} {"train_loss": -7.117788791656494, "global_step": 190324, "epoch": 4531} {"train_loss": -7.216442108154297, "global_step": 190325, "epoch": 4531} {"train_loss": -7.230485439300537, "global_step": 190326, "epoch": 4531} {"train_loss": -7.060788631439209, "global_step": 190327, "epoch": 4531} {"train_loss": -7.035947799682617, "global_step": 190328, "epoch": 4531} {"train_loss": -7.100802898406982, "global_step": 190329, "epoch": 4531} {"train_loss": -7.107243537902832, "global_step": 190330, "epoch": 4531} {"train_loss": -6.890658378601074, "global_step": 190331, "epoch": 4531} {"train_loss": -7.173128128051758, "global_step": 190332, "epoch": 4531} {"train_loss": -7.189619064331055, "global_step": 190333, "epoch": 4531} {"train_loss": -7.114940643310547, "global_step": 190334, "epoch": 4531} {"train_loss": -7.140618324279785, "global_step": 190335, "epoch": 4531} {"train_loss": -7.159333229064941, "global_step": 190336, "epoch": 4531} {"train_loss": -7.209385871887207, "global_step": 190337, "epoch": 4531} {"train_loss": -7.121668815612793, "global_step": 190338, "epoch": 4531} {"train_loss": -7.156996726989746, "global_step": 190339, "epoch": 4531} {"train_loss": -7.128139972686768, "global_step": 190340, "epoch": 4531} {"train_loss": -7.188878536224365, "global_step": 190341, "epoch": 4531} {"train_loss": -7.133481502532959, "global_step": 190342, "epoch": 4531} {"train_loss": -7.1502193836938766, "global_step": 190343, "epoch": 4531, "val_loss": 69058.3046875} {"train_loss": -7.194149017333984, "global_step": 190344, "epoch": 4532} {"train_loss": -7.169258117675781, "global_step": 190345, "epoch": 4532} {"train_loss": -7.254894256591797, "global_step": 190346, "epoch": 4532} {"train_loss": -7.209987163543701, "global_step": 190347, "epoch": 4532} {"train_loss": -7.154054641723633, "global_step": 190348, "epoch": 4532} {"train_loss": -7.153646945953369, "global_step": 190349, "epoch": 4532} {"train_loss": -7.090229511260986, "global_step": 190350, "epoch": 4532} {"train_loss": -7.072394847869873, "global_step": 190351, "epoch": 4532} {"train_loss": -7.134317398071289, "global_step": 190352, "epoch": 4532} {"train_loss": -7.117799758911133, "global_step": 190353, "epoch": 4532} {"train_loss": -7.135927200317383, "global_step": 190354, "epoch": 4532} {"train_loss": -7.206778526306152, "global_step": 190355, "epoch": 4532} {"train_loss": -7.117770671844482, "global_step": 190356, "epoch": 4532} {"train_loss": -7.089168548583984, "global_step": 190357, "epoch": 4532} {"train_loss": -7.110913276672363, "global_step": 190358, "epoch": 4532} {"train_loss": -7.214015007019043, "global_step": 190359, "epoch": 4532} {"train_loss": -7.155034065246582, "global_step": 190360, "epoch": 4532} {"train_loss": -7.199792385101318, "global_step": 190361, "epoch": 4532} {"train_loss": -7.16960334777832, "global_step": 190362, "epoch": 4532} {"train_loss": -7.062995910644531, "global_step": 190363, "epoch": 4532} {"train_loss": -7.178059101104736, "global_step": 190364, "epoch": 4532} {"train_loss": -7.038606643676758, "global_step": 190365, "epoch": 4532} {"train_loss": -7.130072116851807, "global_step": 190366, "epoch": 4532} {"train_loss": -7.114884376525879, "global_step": 190367, "epoch": 4532} {"train_loss": -7.120835781097412, "global_step": 190368, "epoch": 4532} {"train_loss": -7.071963310241699, "global_step": 190369, "epoch": 4532} {"train_loss": -7.176225662231445, "global_step": 190370, "epoch": 4532} {"train_loss": -7.049295425415039, "global_step": 190371, "epoch": 4532} {"train_loss": -7.142840385437012, "global_step": 190372, "epoch": 4532} {"train_loss": -7.035183906555176, "global_step": 190373, "epoch": 4532} {"train_loss": -7.087308883666992, "global_step": 190374, "epoch": 4532} {"train_loss": -7.075857639312744, "global_step": 190375, "epoch": 4532} {"train_loss": -7.100576400756836, "global_step": 190376, "epoch": 4532} {"train_loss": -7.0936079025268555, "global_step": 190377, "epoch": 4532} {"train_loss": -7.089693069458008, "global_step": 190378, "epoch": 4532} {"train_loss": -7.11916446685791, "global_step": 190379, "epoch": 4532} {"train_loss": -6.968593597412109, "global_step": 190380, "epoch": 4532} {"train_loss": -6.973657608032227, "global_step": 190381, "epoch": 4532} {"train_loss": -6.90194845199585, "global_step": 190382, "epoch": 4532} {"train_loss": -7.01580810546875, "global_step": 190383, "epoch": 4532} {"train_loss": -7.088155746459961, "global_step": 190384, "epoch": 4532} {"train_loss": -7.105859393165225, "global_step": 190385, "epoch": 4532, "val_loss": 69145.0625} {"train_loss": -6.976691246032715, "global_step": 190386, "epoch": 4533} {"train_loss": -6.994630813598633, "global_step": 190387, "epoch": 4533} {"train_loss": -7.204472541809082, "global_step": 190388, "epoch": 4533} {"train_loss": -6.971519470214844, "global_step": 190389, "epoch": 4533} {"train_loss": -7.072927474975586, "global_step": 190390, "epoch": 4533} {"train_loss": -7.026450157165527, "global_step": 190391, "epoch": 4533} {"train_loss": -7.082562446594238, "global_step": 190392, "epoch": 4533} {"train_loss": -7.0195631980896, "global_step": 190393, "epoch": 4533} {"train_loss": -7.094388961791992, "global_step": 190394, "epoch": 4533} {"train_loss": -7.133082389831543, "global_step": 190395, "epoch": 4533} {"train_loss": -7.09825325012207, "global_step": 190396, "epoch": 4533} {"train_loss": -7.115902900695801, "global_step": 190397, "epoch": 4533} {"train_loss": -6.952446460723877, "global_step": 190398, "epoch": 4533} {"train_loss": -7.104363441467285, "global_step": 190399, "epoch": 4533} {"train_loss": -7.017516613006592, "global_step": 190400, "epoch": 4533} {"train_loss": -7.222719192504883, "global_step": 190401, "epoch": 4533} {"train_loss": -6.981755256652832, "global_step": 190402, "epoch": 4533} {"train_loss": -7.141163349151611, "global_step": 190403, "epoch": 4533} {"train_loss": -7.076192855834961, "global_step": 190404, "epoch": 4533} {"train_loss": -7.148346900939941, "global_step": 190405, "epoch": 4533} {"train_loss": -7.2010817527771, "global_step": 190406, "epoch": 4533} {"train_loss": -7.016366004943848, "global_step": 190407, "epoch": 4533} {"train_loss": -7.207748889923096, "global_step": 190408, "epoch": 4533} {"train_loss": -7.203441619873047, "global_step": 190409, "epoch": 4533} {"train_loss": -7.222533226013184, "global_step": 190410, "epoch": 4533} {"train_loss": -7.208806991577148, "global_step": 190411, "epoch": 4533} {"train_loss": -7.1577959060668945, "global_step": 190412, "epoch": 4533} {"train_loss": -7.169999122619629, "global_step": 190413, "epoch": 4533} {"train_loss": -7.278891563415527, "global_step": 190414, "epoch": 4533} {"train_loss": -7.285030364990234, "global_step": 190415, "epoch": 4533} {"train_loss": -7.215527534484863, "global_step": 190416, "epoch": 4533} {"train_loss": -7.251816272735596, "global_step": 190417, "epoch": 4533} {"train_loss": -7.1377434730529785, "global_step": 190418, "epoch": 4533} {"train_loss": -7.185730457305908, "global_step": 190419, "epoch": 4533} {"train_loss": -7.100747585296631, "global_step": 190420, "epoch": 4533} {"train_loss": -7.199352264404297, "global_step": 190421, "epoch": 4533} {"train_loss": -7.084198951721191, "global_step": 190422, "epoch": 4533} {"train_loss": -7.042649269104004, "global_step": 190423, "epoch": 4533} {"train_loss": -7.185070037841797, "global_step": 190424, "epoch": 4533} {"train_loss": -7.118912696838379, "global_step": 190425, "epoch": 4533} {"train_loss": -7.179292678833008, "global_step": 190426, "epoch": 4533} {"train_loss": -7.121686276935396, "global_step": 190427, "epoch": 4533, "val_loss": 69041.265625} {"train_loss": -7.220990180969238, "global_step": 190428, "epoch": 4534} {"train_loss": -7.0278801918029785, "global_step": 190429, "epoch": 4534} {"train_loss": -6.964748859405518, "global_step": 190430, "epoch": 4534} {"train_loss": -7.161852836608887, "global_step": 190431, "epoch": 4534} {"train_loss": -7.082993030548096, "global_step": 190432, "epoch": 4534} {"train_loss": -7.200925350189209, "global_step": 190433, "epoch": 4534} {"train_loss": -7.101109981536865, "global_step": 190434, "epoch": 4534} {"train_loss": -6.9807024002075195, "global_step": 190435, "epoch": 4534} {"train_loss": -7.184316158294678, "global_step": 190436, "epoch": 4534} {"train_loss": -7.080416202545166, "global_step": 190437, "epoch": 4534} {"train_loss": -7.097503185272217, "global_step": 190438, "epoch": 4534} {"train_loss": -7.088559150695801, "global_step": 190439, "epoch": 4534} {"train_loss": -6.98321008682251, "global_step": 190440, "epoch": 4534} {"train_loss": -7.204253673553467, "global_step": 190441, "epoch": 4534} {"train_loss": -7.004611968994141, "global_step": 190442, "epoch": 4534} {"train_loss": -7.16068172454834, "global_step": 190443, "epoch": 4534} {"train_loss": -7.190737247467041, "global_step": 190444, "epoch": 4534} {"train_loss": -6.939475059509277, "global_step": 190445, "epoch": 4534} {"train_loss": -7.21600341796875, "global_step": 190446, "epoch": 4534} {"train_loss": -7.165477752685547, "global_step": 190447, "epoch": 4534} {"train_loss": -7.137995719909668, "global_step": 190448, "epoch": 4534} {"train_loss": -7.112926483154297, "global_step": 190449, "epoch": 4534} {"train_loss": -7.150003433227539, "global_step": 190450, "epoch": 4534} {"train_loss": -7.170246124267578, "global_step": 190451, "epoch": 4534} {"train_loss": -7.122972011566162, "global_step": 190452, "epoch": 4534} {"train_loss": -7.036303520202637, "global_step": 190453, "epoch": 4534} {"train_loss": -7.126873016357422, "global_step": 190454, "epoch": 4534} {"train_loss": -7.185304641723633, "global_step": 190455, "epoch": 4534} {"train_loss": -7.133627891540527, "global_step": 190456, "epoch": 4534} {"train_loss": -7.190830230712891, "global_step": 190457, "epoch": 4534} {"train_loss": -7.174846172332764, "global_step": 190458, "epoch": 4534} {"train_loss": -7.103266716003418, "global_step": 190459, "epoch": 4534} {"train_loss": -7.143276214599609, "global_step": 190460, "epoch": 4534} {"train_loss": -7.058221817016602, "global_step": 190461, "epoch": 4534} {"train_loss": -7.075475215911865, "global_step": 190462, "epoch": 4534} {"train_loss": -7.097392559051514, "global_step": 190463, "epoch": 4534} {"train_loss": -7.080488204956055, "global_step": 190464, "epoch": 4534} {"train_loss": -7.189615249633789, "global_step": 190465, "epoch": 4534} {"train_loss": -6.994722366333008, "global_step": 190466, "epoch": 4534} {"train_loss": -6.998098850250244, "global_step": 190467, "epoch": 4534} {"train_loss": -7.121356964111328, "global_step": 190468, "epoch": 4534} {"train_loss": -7.108833528700329, "global_step": 190469, "epoch": 4534, "val_loss": 68864.109375} {"train_loss": -7.073143005371094, "global_step": 190470, "epoch": 4535} {"train_loss": -7.052670478820801, "global_step": 190471, "epoch": 4535} {"train_loss": -7.0230560302734375, "global_step": 190472, "epoch": 4535} {"train_loss": -7.060264587402344, "global_step": 190473, "epoch": 4535} {"train_loss": -7.217336654663086, "global_step": 190474, "epoch": 4535} {"train_loss": -6.986260890960693, "global_step": 190475, "epoch": 4535} {"train_loss": -7.173128128051758, "global_step": 190476, "epoch": 4535} {"train_loss": -7.220356464385986, "global_step": 190477, "epoch": 4535} {"train_loss": -7.172404766082764, "global_step": 190478, "epoch": 4535} {"train_loss": -7.050614356994629, "global_step": 190479, "epoch": 4535} {"train_loss": -7.252253532409668, "global_step": 190480, "epoch": 4535} {"train_loss": -7.266116142272949, "global_step": 190481, "epoch": 4535} {"train_loss": -7.143026351928711, "global_step": 190482, "epoch": 4535} {"train_loss": -7.112330436706543, "global_step": 190483, "epoch": 4535} {"train_loss": -7.2097859382629395, "global_step": 190484, "epoch": 4535} {"train_loss": -7.15349817276001, "global_step": 190485, "epoch": 4535} {"train_loss": -7.041234970092773, "global_step": 190486, "epoch": 4535} {"train_loss": -7.171473979949951, "global_step": 190487, "epoch": 4535} {"train_loss": -7.180931091308594, "global_step": 190488, "epoch": 4535} {"train_loss": -7.080513954162598, "global_step": 190489, "epoch": 4535} {"train_loss": -7.119190692901611, "global_step": 190490, "epoch": 4535} {"train_loss": -7.154751300811768, "global_step": 190491, "epoch": 4535} {"train_loss": -7.094161033630371, "global_step": 190492, "epoch": 4535} {"train_loss": -7.0879082679748535, "global_step": 190493, "epoch": 4535} {"train_loss": -7.0904107093811035, "global_step": 190494, "epoch": 4535} {"train_loss": -7.23337459564209, "global_step": 190495, "epoch": 4535} {"train_loss": -7.16324520111084, "global_step": 190496, "epoch": 4535} {"train_loss": -7.087206840515137, "global_step": 190497, "epoch": 4535} {"train_loss": -7.2915239334106445, "global_step": 190498, "epoch": 4535} {"train_loss": -7.118040084838867, "global_step": 190499, "epoch": 4535} {"train_loss": -6.999075889587402, "global_step": 190500, "epoch": 4535} {"train_loss": -7.065938949584961, "global_step": 190501, "epoch": 4535} {"train_loss": -7.0459442138671875, "global_step": 190502, "epoch": 4535} {"train_loss": -7.103847980499268, "global_step": 190503, "epoch": 4535} {"train_loss": -7.15643310546875, "global_step": 190504, "epoch": 4535} {"train_loss": -7.0795745849609375, "global_step": 190505, "epoch": 4535} {"train_loss": -7.276246547698975, "global_step": 190506, "epoch": 4535} {"train_loss": -7.396247863769531, "global_step": 190507, "epoch": 4535} {"train_loss": -7.134336471557617, "global_step": 190508, "epoch": 4535} {"train_loss": -7.116294860839844, "global_step": 190509, "epoch": 4535} {"train_loss": -7.199990749359131, "global_step": 190510, "epoch": 4535} {"train_loss": -7.137515862782796, "global_step": 190511, "epoch": 4535, "val_loss": 68990.140625} {"train_loss": -7.177151679992676, "global_step": 190512, "epoch": 4536} {"train_loss": -7.239781856536865, "global_step": 190513, "epoch": 4536} {"train_loss": -7.2542924880981445, "global_step": 190514, "epoch": 4536} {"train_loss": -7.1891984939575195, "global_step": 190515, "epoch": 4536} {"train_loss": -7.138235092163086, "global_step": 190516, "epoch": 4536} {"train_loss": -7.2122802734375, "global_step": 190517, "epoch": 4536} {"train_loss": -7.2264885902404785, "global_step": 190518, "epoch": 4536} {"train_loss": -7.139591217041016, "global_step": 190519, "epoch": 4536} {"train_loss": -7.146200180053711, "global_step": 190520, "epoch": 4536} {"train_loss": -7.197096824645996, "global_step": 190521, "epoch": 4536} {"train_loss": -7.266637325286865, "global_step": 190522, "epoch": 4536} {"train_loss": -7.30145263671875, "global_step": 190523, "epoch": 4536} {"train_loss": -7.188499450683594, "global_step": 190524, "epoch": 4536} {"train_loss": -7.220303535461426, "global_step": 190525, "epoch": 4536} {"train_loss": -7.253485679626465, "global_step": 190526, "epoch": 4536} {"train_loss": -7.2035231590271, "global_step": 190527, "epoch": 4536} {"train_loss": -7.095036506652832, "global_step": 190528, "epoch": 4536} {"train_loss": -7.103891849517822, "global_step": 190529, "epoch": 4536} {"train_loss": -7.18834924697876, "global_step": 190530, "epoch": 4536} {"train_loss": -7.196098327636719, "global_step": 190531, "epoch": 4536} {"train_loss": -7.25385856628418, "global_step": 190532, "epoch": 4536} {"train_loss": -7.115971565246582, "global_step": 190533, "epoch": 4536} {"train_loss": -7.150264739990234, "global_step": 190534, "epoch": 4536} {"train_loss": -7.203391075134277, "global_step": 190535, "epoch": 4536} {"train_loss": -7.185248851776123, "global_step": 190536, "epoch": 4536} {"train_loss": -7.090796947479248, "global_step": 190537, "epoch": 4536} {"train_loss": -7.136578559875488, "global_step": 190538, "epoch": 4536} {"train_loss": -7.177174091339111, "global_step": 190539, "epoch": 4536} {"train_loss": -7.1492228507995605, "global_step": 190540, "epoch": 4536} {"train_loss": -7.185324668884277, "global_step": 190541, "epoch": 4536} {"train_loss": -7.249073028564453, "global_step": 190542, "epoch": 4536} {"train_loss": -7.280574798583984, "global_step": 190543, "epoch": 4536} {"train_loss": -7.158503532409668, "global_step": 190544, "epoch": 4536} {"train_loss": -7.139283180236816, "global_step": 190545, "epoch": 4536} {"train_loss": -7.12818717956543, "global_step": 190546, "epoch": 4536} {"train_loss": -7.200878143310547, "global_step": 190547, "epoch": 4536} {"train_loss": -7.0769548416137695, "global_step": 190548, "epoch": 4536} {"train_loss": -7.176836013793945, "global_step": 190549, "epoch": 4536} {"train_loss": -7.1317572593688965, "global_step": 190550, "epoch": 4536} {"train_loss": -7.200436592102051, "global_step": 190551, "epoch": 4536} {"train_loss": -7.165996074676514, "global_step": 190552, "epoch": 4536} {"train_loss": -7.17810997508821, "global_step": 190553, "epoch": 4536, "val_loss": 68902.40625} {"train_loss": -7.224772930145264, "global_step": 190554, "epoch": 4537} {"train_loss": -7.0710344314575195, "global_step": 190555, "epoch": 4537} {"train_loss": -7.254044532775879, "global_step": 190556, "epoch": 4537} {"train_loss": -7.130969524383545, "global_step": 190557, "epoch": 4537} {"train_loss": -7.092568397521973, "global_step": 190558, "epoch": 4537} {"train_loss": -7.169768333435059, "global_step": 190559, "epoch": 4537} {"train_loss": -7.299842357635498, "global_step": 190560, "epoch": 4537} {"train_loss": -7.175814628601074, "global_step": 190561, "epoch": 4537} {"train_loss": -7.058176040649414, "global_step": 190562, "epoch": 4537} {"train_loss": -7.151521682739258, "global_step": 190563, "epoch": 4537} {"train_loss": -7.173704147338867, "global_step": 190564, "epoch": 4537} {"train_loss": -7.230659484863281, "global_step": 190565, "epoch": 4537} {"train_loss": -7.103738307952881, "global_step": 190566, "epoch": 4537} {"train_loss": -7.1921586990356445, "global_step": 190567, "epoch": 4537} {"train_loss": -7.086886405944824, "global_step": 190568, "epoch": 4537} {"train_loss": -7.174685478210449, "global_step": 190569, "epoch": 4537} {"train_loss": -7.0682902336120605, "global_step": 190570, "epoch": 4537} {"train_loss": -7.127498626708984, "global_step": 190571, "epoch": 4537} {"train_loss": -7.098673343658447, "global_step": 190572, "epoch": 4537} {"train_loss": -7.2044782638549805, "global_step": 190573, "epoch": 4537} {"train_loss": -7.21604585647583, "global_step": 190574, "epoch": 4537} {"train_loss": -7.119173049926758, "global_step": 190575, "epoch": 4537} {"train_loss": -7.205104827880859, "global_step": 190576, "epoch": 4537} {"train_loss": -7.119210243225098, "global_step": 190577, "epoch": 4537} {"train_loss": -7.205749988555908, "global_step": 190578, "epoch": 4537} {"train_loss": -7.223211288452148, "global_step": 190579, "epoch": 4537} {"train_loss": -7.196142673492432, "global_step": 190580, "epoch": 4537} {"train_loss": -7.234978199005127, "global_step": 190581, "epoch": 4537} {"train_loss": -7.160099029541016, "global_step": 190582, "epoch": 4537} {"train_loss": -7.215719223022461, "global_step": 190583, "epoch": 4537} {"train_loss": -7.277212142944336, "global_step": 190584, "epoch": 4537} {"train_loss": -7.173083305358887, "global_step": 190585, "epoch": 4537} {"train_loss": -7.260138034820557, "global_step": 190586, "epoch": 4537} {"train_loss": -7.217508316040039, "global_step": 190587, "epoch": 4537} {"train_loss": -7.165121078491211, "global_step": 190588, "epoch": 4537} {"train_loss": -7.026519298553467, "global_step": 190589, "epoch": 4537} {"train_loss": -7.147319316864014, "global_step": 190590, "epoch": 4537} {"train_loss": -7.174603462219238, "global_step": 190591, "epoch": 4537} {"train_loss": -7.092709541320801, "global_step": 190592, "epoch": 4537} {"train_loss": -7.107826232910156, "global_step": 190593, "epoch": 4537} {"train_loss": -7.1851067543029785, "global_step": 190594, "epoch": 4537} {"train_loss": -7.167976765405564, "global_step": 190595, "epoch": 4537, "val_loss": 68894.3515625} {"train_loss": -7.190737724304199, "global_step": 190596, "epoch": 4538} {"train_loss": -7.1677703857421875, "global_step": 190597, "epoch": 4538} {"train_loss": -7.1536054611206055, "global_step": 190598, "epoch": 4538} {"train_loss": -7.131051063537598, "global_step": 190599, "epoch": 4538} {"train_loss": -7.167096138000488, "global_step": 190600, "epoch": 4538} {"train_loss": -7.091156005859375, "global_step": 190601, "epoch": 4538} {"train_loss": -7.136602401733398, "global_step": 190602, "epoch": 4538} {"train_loss": -7.198822498321533, "global_step": 190603, "epoch": 4538} {"train_loss": -7.103675365447998, "global_step": 190604, "epoch": 4538} {"train_loss": -7.137815475463867, "global_step": 190605, "epoch": 4538} {"train_loss": -7.185490131378174, "global_step": 190606, "epoch": 4538} {"train_loss": -7.054119110107422, "global_step": 190607, "epoch": 4538} {"train_loss": -7.181064605712891, "global_step": 190608, "epoch": 4538} {"train_loss": -7.141820907592773, "global_step": 190609, "epoch": 4538} {"train_loss": -7.139986991882324, "global_step": 190610, "epoch": 4538} {"train_loss": -7.120495796203613, "global_step": 190611, "epoch": 4538} {"train_loss": -7.12696647644043, "global_step": 190612, "epoch": 4538} {"train_loss": -7.201873302459717, "global_step": 190613, "epoch": 4538} {"train_loss": -7.0720672607421875, "global_step": 190614, "epoch": 4538} {"train_loss": -7.1244096755981445, "global_step": 190615, "epoch": 4538} {"train_loss": -7.185922622680664, "global_step": 190616, "epoch": 4538} {"train_loss": -7.172755241394043, "global_step": 190617, "epoch": 4538} {"train_loss": -7.086428165435791, "global_step": 190618, "epoch": 4538} {"train_loss": -7.156949996948242, "global_step": 190619, "epoch": 4538} {"train_loss": -7.18649435043335, "global_step": 190620, "epoch": 4538} {"train_loss": -7.213007926940918, "global_step": 190621, "epoch": 4538} {"train_loss": -7.231251239776611, "global_step": 190622, "epoch": 4538} {"train_loss": -7.151663303375244, "global_step": 190623, "epoch": 4538} {"train_loss": -7.074882507324219, "global_step": 190624, "epoch": 4538} {"train_loss": -7.084306240081787, "global_step": 190625, "epoch": 4538} {"train_loss": -7.063991546630859, "global_step": 190626, "epoch": 4538} {"train_loss": -7.1264472007751465, "global_step": 190627, "epoch": 4538} {"train_loss": -7.099785327911377, "global_step": 190628, "epoch": 4538} {"train_loss": -7.134923934936523, "global_step": 190629, "epoch": 4538} {"train_loss": -7.007716178894043, "global_step": 190630, "epoch": 4538} {"train_loss": -7.1463942527771, "global_step": 190631, "epoch": 4538} {"train_loss": -7.185262680053711, "global_step": 190632, "epoch": 4538} {"train_loss": -7.142875671386719, "global_step": 190633, "epoch": 4538} {"train_loss": -7.179684638977051, "global_step": 190634, "epoch": 4538} {"train_loss": -7.070921421051025, "global_step": 190635, "epoch": 4538} {"train_loss": -7.16787576675415, "global_step": 190636, "epoch": 4538} {"train_loss": -7.137976260412307, "global_step": 190637, "epoch": 4538, "val_loss": 68951.4140625} {"train_loss": -7.036124229431152, "global_step": 190638, "epoch": 4539} {"train_loss": -7.181300163269043, "global_step": 190639, "epoch": 4539} {"train_loss": -7.0745849609375, "global_step": 190640, "epoch": 4539} {"train_loss": -7.15986442565918, "global_step": 190641, "epoch": 4539} {"train_loss": -6.996983051300049, "global_step": 190642, "epoch": 4539} {"train_loss": -7.180867671966553, "global_step": 190643, "epoch": 4539} {"train_loss": -7.094969749450684, "global_step": 190644, "epoch": 4539} {"train_loss": -7.101253032684326, "global_step": 190645, "epoch": 4539} {"train_loss": -7.154205799102783, "global_step": 190646, "epoch": 4539} {"train_loss": -7.163059711456299, "global_step": 190647, "epoch": 4539} {"train_loss": -7.034363746643066, "global_step": 190648, "epoch": 4539} {"train_loss": -7.066027641296387, "global_step": 190649, "epoch": 4539} {"train_loss": -7.068117141723633, "global_step": 190650, "epoch": 4539} {"train_loss": -7.145978927612305, "global_step": 190651, "epoch": 4539} {"train_loss": -7.171555042266846, "global_step": 190652, "epoch": 4539} {"train_loss": -7.035041809082031, "global_step": 190653, "epoch": 4539} {"train_loss": -7.078505992889404, "global_step": 190654, "epoch": 4539} {"train_loss": -7.078459739685059, "global_step": 190655, "epoch": 4539} {"train_loss": -7.105012893676758, "global_step": 190656, "epoch": 4539} {"train_loss": -7.250290393829346, "global_step": 190657, "epoch": 4539} {"train_loss": -6.96817684173584, "global_step": 190658, "epoch": 4539} {"train_loss": -7.11451530456543, "global_step": 190659, "epoch": 4539} {"train_loss": -7.099647521972656, "global_step": 190660, "epoch": 4539} {"train_loss": -7.234986305236816, "global_step": 190661, "epoch": 4539} {"train_loss": -7.223066329956055, "global_step": 190662, "epoch": 4539} {"train_loss": -7.046376705169678, "global_step": 190663, "epoch": 4539} {"train_loss": -7.132369518280029, "global_step": 190664, "epoch": 4539} {"train_loss": -7.196566581726074, "global_step": 190665, "epoch": 4539} {"train_loss": -7.237499237060547, "global_step": 190666, "epoch": 4539} {"train_loss": -7.319092750549316, "global_step": 190667, "epoch": 4539} {"train_loss": -7.222122669219971, "global_step": 190668, "epoch": 4539} {"train_loss": -7.141701698303223, "global_step": 190669, "epoch": 4539} {"train_loss": -7.298678398132324, "global_step": 190670, "epoch": 4539} {"train_loss": -7.155706882476807, "global_step": 190671, "epoch": 4539} {"train_loss": -7.2911696434021, "global_step": 190672, "epoch": 4539} {"train_loss": -7.268383502960205, "global_step": 190673, "epoch": 4539} {"train_loss": -7.233341693878174, "global_step": 190674, "epoch": 4539} {"train_loss": -7.195716857910156, "global_step": 190675, "epoch": 4539} {"train_loss": -7.137673854827881, "global_step": 190676, "epoch": 4539} {"train_loss": -7.155797004699707, "global_step": 190677, "epoch": 4539} {"train_loss": -7.14042854309082, "global_step": 190678, "epoch": 4539} {"train_loss": -7.146020991461618, "global_step": 190679, "epoch": 4539, "val_loss": 68880.9375} {"train_loss": -7.228608131408691, "global_step": 190680, "epoch": 4540} {"train_loss": -7.159543037414551, "global_step": 190681, "epoch": 4540} {"train_loss": -7.146902561187744, "global_step": 190682, "epoch": 4540} {"train_loss": -7.301337718963623, "global_step": 190683, "epoch": 4540} {"train_loss": -7.169394016265869, "global_step": 190684, "epoch": 4540} {"train_loss": -7.277830600738525, "global_step": 190685, "epoch": 4540} {"train_loss": -7.276232719421387, "global_step": 190686, "epoch": 4540} {"train_loss": -7.195194244384766, "global_step": 190687, "epoch": 4540} {"train_loss": -7.2718353271484375, "global_step": 190688, "epoch": 4540} {"train_loss": -7.109270095825195, "global_step": 190689, "epoch": 4540} {"train_loss": -7.173431396484375, "global_step": 190690, "epoch": 4540} {"train_loss": -7.226535797119141, "global_step": 190691, "epoch": 4540} {"train_loss": -7.223414897918701, "global_step": 190692, "epoch": 4540} {"train_loss": -7.143980979919434, "global_step": 190693, "epoch": 4540} {"train_loss": -7.257255554199219, "global_step": 190694, "epoch": 4540} {"train_loss": -7.216698169708252, "global_step": 190695, "epoch": 4540} {"train_loss": -7.095499038696289, "global_step": 190696, "epoch": 4540} {"train_loss": -7.210565567016602, "global_step": 190697, "epoch": 4540} {"train_loss": -7.114152908325195, "global_step": 190698, "epoch": 4540} {"train_loss": -7.152350902557373, "global_step": 190699, "epoch": 4540} {"train_loss": -7.297231674194336, "global_step": 190700, "epoch": 4540} {"train_loss": -7.151937961578369, "global_step": 190701, "epoch": 4540} {"train_loss": -7.137338638305664, "global_step": 190702, "epoch": 4540} {"train_loss": -7.311303615570068, "global_step": 190703, "epoch": 4540} {"train_loss": -7.318877220153809, "global_step": 190704, "epoch": 4540} {"train_loss": -7.081348896026611, "global_step": 190705, "epoch": 4540} {"train_loss": -7.22355842590332, "global_step": 190706, "epoch": 4540} {"train_loss": -7.24630069732666, "global_step": 190707, "epoch": 4540} {"train_loss": -7.072670936584473, "global_step": 190708, "epoch": 4540} {"train_loss": -7.212570667266846, "global_step": 190709, "epoch": 4540} {"train_loss": -7.191741466522217, "global_step": 190710, "epoch": 4540} {"train_loss": -7.0629425048828125, "global_step": 190711, "epoch": 4540} {"train_loss": -7.097665309906006, "global_step": 190712, "epoch": 4540} {"train_loss": -7.068727493286133, "global_step": 190713, "epoch": 4540} {"train_loss": -7.063830375671387, "global_step": 190714, "epoch": 4540} {"train_loss": -7.116683006286621, "global_step": 190715, "epoch": 4540} {"train_loss": -7.0016655921936035, "global_step": 190716, "epoch": 4540} {"train_loss": -7.162991046905518, "global_step": 190717, "epoch": 4540} {"train_loss": -7.054605484008789, "global_step": 190718, "epoch": 4540} {"train_loss": -7.0524773597717285, "global_step": 190719, "epoch": 4540} {"train_loss": -7.011540412902832, "global_step": 190720, "epoch": 4540} {"train_loss": -7.168423482349941, "global_step": 190721, "epoch": 4540, "val_loss": 69079.625} {"train_loss": -7.149538993835449, "global_step": 190722, "epoch": 4541} {"train_loss": -7.266289234161377, "global_step": 190723, "epoch": 4541} {"train_loss": -7.248493194580078, "global_step": 190724, "epoch": 4541} {"train_loss": -7.172136306762695, "global_step": 190725, "epoch": 4541} {"train_loss": -7.065080642700195, "global_step": 190726, "epoch": 4541} {"train_loss": -7.1754937171936035, "global_step": 190727, "epoch": 4541} {"train_loss": -7.2155280113220215, "global_step": 190728, "epoch": 4541} {"train_loss": -7.111494064331055, "global_step": 190729, "epoch": 4541} {"train_loss": -7.140748023986816, "global_step": 190730, "epoch": 4541} {"train_loss": -7.241682052612305, "global_step": 190731, "epoch": 4541} {"train_loss": -7.149250030517578, "global_step": 190732, "epoch": 4541} {"train_loss": -7.170449256896973, "global_step": 190733, "epoch": 4541} {"train_loss": -6.97515344619751, "global_step": 190734, "epoch": 4541} {"train_loss": -7.198184490203857, "global_step": 190735, "epoch": 4541} {"train_loss": -7.160514831542969, "global_step": 190736, "epoch": 4541} {"train_loss": -7.130200386047363, "global_step": 190737, "epoch": 4541} {"train_loss": -7.187352180480957, "global_step": 190738, "epoch": 4541} {"train_loss": -7.177724361419678, "global_step": 190739, "epoch": 4541} {"train_loss": -7.1327714920043945, "global_step": 190740, "epoch": 4541} {"train_loss": -7.054539680480957, "global_step": 190741, "epoch": 4541} {"train_loss": -7.083189010620117, "global_step": 190742, "epoch": 4541} {"train_loss": -7.227142333984375, "global_step": 190743, "epoch": 4541} {"train_loss": -7.126243591308594, "global_step": 190744, "epoch": 4541} {"train_loss": -7.017314434051514, "global_step": 190745, "epoch": 4541} {"train_loss": -7.047484397888184, "global_step": 190746, "epoch": 4541} {"train_loss": -7.165821552276611, "global_step": 190747, "epoch": 4541} {"train_loss": -7.020625591278076, "global_step": 190748, "epoch": 4541} {"train_loss": -7.071389198303223, "global_step": 190749, "epoch": 4541} {"train_loss": -7.158759117126465, "global_step": 190750, "epoch": 4541} {"train_loss": -7.057358741760254, "global_step": 190751, "epoch": 4541} {"train_loss": -7.199667930603027, "global_step": 190752, "epoch": 4541} {"train_loss": -7.136568069458008, "global_step": 190753, "epoch": 4541} {"train_loss": -7.040780544281006, "global_step": 190754, "epoch": 4541} {"train_loss": -7.088838577270508, "global_step": 190755, "epoch": 4541} {"train_loss": -7.023548603057861, "global_step": 190756, "epoch": 4541} {"train_loss": -7.084521293640137, "global_step": 190757, "epoch": 4541} {"train_loss": -7.073161602020264, "global_step": 190758, "epoch": 4541} {"train_loss": -7.092635631561279, "global_step": 190759, "epoch": 4541} {"train_loss": -7.01264762878418, "global_step": 190760, "epoch": 4541} {"train_loss": -7.187679290771484, "global_step": 190761, "epoch": 4541} {"train_loss": -6.938066482543945, "global_step": 190762, "epoch": 4541} {"train_loss": -7.121238629023234, "global_step": 190763, "epoch": 4541, "val_loss": 69053.8359375} {"train_loss": -7.1740570068359375, "global_step": 190764, "epoch": 4542} {"train_loss": -7.102507591247559, "global_step": 190765, "epoch": 4542} {"train_loss": -7.072700023651123, "global_step": 190766, "epoch": 4542} {"train_loss": -7.056362152099609, "global_step": 190767, "epoch": 4542} {"train_loss": -7.216030120849609, "global_step": 190768, "epoch": 4542} {"train_loss": -7.255656719207764, "global_step": 190769, "epoch": 4542} {"train_loss": -7.091866493225098, "global_step": 190770, "epoch": 4542} {"train_loss": -7.128395080566406, "global_step": 190771, "epoch": 4542} {"train_loss": -7.102786064147949, "global_step": 190772, "epoch": 4542} {"train_loss": -7.167533874511719, "global_step": 190773, "epoch": 4542} {"train_loss": -7.127188682556152, "global_step": 190774, "epoch": 4542} {"train_loss": -7.083629608154297, "global_step": 190775, "epoch": 4542} {"train_loss": -7.179027080535889, "global_step": 190776, "epoch": 4542} {"train_loss": -7.097233295440674, "global_step": 190777, "epoch": 4542} {"train_loss": -7.1387834548950195, "global_step": 190778, "epoch": 4542} {"train_loss": -7.08892822265625, "global_step": 190779, "epoch": 4542} {"train_loss": -7.1672258377075195, "global_step": 190780, "epoch": 4542} {"train_loss": -7.2231974601745605, "global_step": 190781, "epoch": 4542} {"train_loss": -7.102812767028809, "global_step": 190782, "epoch": 4542} {"train_loss": -7.148491382598877, "global_step": 190783, "epoch": 4542} {"train_loss": -7.17805814743042, "global_step": 190784, "epoch": 4542} {"train_loss": -7.257882118225098, "global_step": 190785, "epoch": 4542} {"train_loss": -7.137832164764404, "global_step": 190786, "epoch": 4542} {"train_loss": -7.0481719970703125, "global_step": 190787, "epoch": 4542} {"train_loss": -7.1909685134887695, "global_step": 190788, "epoch": 4542} {"train_loss": -7.185175895690918, "global_step": 190789, "epoch": 4542} {"train_loss": -7.236908912658691, "global_step": 190790, "epoch": 4542} {"train_loss": -7.228234767913818, "global_step": 190791, "epoch": 4542} {"train_loss": -7.147123336791992, "global_step": 190792, "epoch": 4542} {"train_loss": -7.113492012023926, "global_step": 190793, "epoch": 4542} {"train_loss": -7.09495735168457, "global_step": 190794, "epoch": 4542} {"train_loss": -7.1405792236328125, "global_step": 190795, "epoch": 4542} {"train_loss": -7.165676116943359, "global_step": 190796, "epoch": 4542} {"train_loss": -7.249832630157471, "global_step": 190797, "epoch": 4542} {"train_loss": -7.115758895874023, "global_step": 190798, "epoch": 4542} {"train_loss": -7.154209613800049, "global_step": 190799, "epoch": 4542} {"train_loss": -7.210369110107422, "global_step": 190800, "epoch": 4542} {"train_loss": -7.13146448135376, "global_step": 190801, "epoch": 4542} {"train_loss": -7.11147403717041, "global_step": 190802, "epoch": 4542} {"train_loss": -7.251764297485352, "global_step": 190803, "epoch": 4542} {"train_loss": -7.135869979858398, "global_step": 190804, "epoch": 4542} {"train_loss": -7.148175432568505, "global_step": 190805, "epoch": 4542, "val_loss": 68855.59375} {"train_loss": -7.109235763549805, "global_step": 190806, "epoch": 4543} {"train_loss": -7.039830207824707, "global_step": 190807, "epoch": 4543} {"train_loss": -7.07042121887207, "global_step": 190808, "epoch": 4543} {"train_loss": -7.011885643005371, "global_step": 190809, "epoch": 4543} {"train_loss": -7.158418655395508, "global_step": 190810, "epoch": 4543} {"train_loss": -7.0930657386779785, "global_step": 190811, "epoch": 4543} {"train_loss": -7.029577732086182, "global_step": 190812, "epoch": 4543} {"train_loss": -7.141712188720703, "global_step": 190813, "epoch": 4543} {"train_loss": -7.006186485290527, "global_step": 190814, "epoch": 4543} {"train_loss": -7.107608795166016, "global_step": 190815, "epoch": 4543} {"train_loss": -7.15250825881958, "global_step": 190816, "epoch": 4543} {"train_loss": -7.119359970092773, "global_step": 190817, "epoch": 4543} {"train_loss": -7.184950351715088, "global_step": 190818, "epoch": 4543} {"train_loss": -7.094992637634277, "global_step": 190819, "epoch": 4543} {"train_loss": -7.120655059814453, "global_step": 190820, "epoch": 4543} {"train_loss": -7.183347702026367, "global_step": 190821, "epoch": 4543} {"train_loss": -7.145257472991943, "global_step": 190822, "epoch": 4543} {"train_loss": -7.166046142578125, "global_step": 190823, "epoch": 4543} {"train_loss": -7.145764350891113, "global_step": 190824, "epoch": 4543} {"train_loss": -7.179866790771484, "global_step": 190825, "epoch": 4543} {"train_loss": -7.0296125411987305, "global_step": 190826, "epoch": 4543} {"train_loss": -7.1887712478637695, "global_step": 190827, "epoch": 4543} {"train_loss": -7.057669639587402, "global_step": 190828, "epoch": 4543} {"train_loss": -7.142071723937988, "global_step": 190829, "epoch": 4543} {"train_loss": -7.118242263793945, "global_step": 190830, "epoch": 4543} {"train_loss": -7.096026420593262, "global_step": 190831, "epoch": 4543} {"train_loss": -7.1993408203125, "global_step": 190832, "epoch": 4543} {"train_loss": -7.209628105163574, "global_step": 190833, "epoch": 4543} {"train_loss": -7.013899803161621, "global_step": 190834, "epoch": 4543} {"train_loss": -7.221959114074707, "global_step": 190835, "epoch": 4543} {"train_loss": -7.198361396789551, "global_step": 190836, "epoch": 4543} {"train_loss": -7.152127742767334, "global_step": 190837, "epoch": 4543} {"train_loss": -7.13514518737793, "global_step": 190838, "epoch": 4543} {"train_loss": -7.181447982788086, "global_step": 190839, "epoch": 4543} {"train_loss": -7.191366195678711, "global_step": 190840, "epoch": 4543} {"train_loss": -7.151556015014648, "global_step": 190841, "epoch": 4543} {"train_loss": -7.135204792022705, "global_step": 190842, "epoch": 4543} {"train_loss": -7.157480716705322, "global_step": 190843, "epoch": 4543} {"train_loss": -7.126226425170898, "global_step": 190844, "epoch": 4543} {"train_loss": -7.19298791885376, "global_step": 190845, "epoch": 4543} {"train_loss": -7.248905181884766, "global_step": 190846, "epoch": 4543} {"train_loss": -7.13172561781747, "global_step": 190847, "epoch": 4543, "val_loss": 68882.7265625} {"train_loss": -7.300005912780762, "global_step": 190848, "epoch": 4544} {"train_loss": -7.147971153259277, "global_step": 190849, "epoch": 4544} {"train_loss": -7.007762432098389, "global_step": 190850, "epoch": 4544} {"train_loss": -7.218729496002197, "global_step": 190851, "epoch": 4544} {"train_loss": -7.162749767303467, "global_step": 190852, "epoch": 4544} {"train_loss": -7.182856559753418, "global_step": 190853, "epoch": 4544} {"train_loss": -7.279083251953125, "global_step": 190854, "epoch": 4544} {"train_loss": -7.162964820861816, "global_step": 190855, "epoch": 4544} {"train_loss": -7.131765842437744, "global_step": 190856, "epoch": 4544} {"train_loss": -7.0999345779418945, "global_step": 190857, "epoch": 4544} {"train_loss": -7.17634916305542, "global_step": 190858, "epoch": 4544} {"train_loss": -7.182186126708984, "global_step": 190859, "epoch": 4544} {"train_loss": -7.055654525756836, "global_step": 190860, "epoch": 4544} {"train_loss": -7.204745769500732, "global_step": 190861, "epoch": 4544} {"train_loss": -7.0892863273620605, "global_step": 190862, "epoch": 4544} {"train_loss": -7.08381986618042, "global_step": 190863, "epoch": 4544} {"train_loss": -7.192030906677246, "global_step": 190864, "epoch": 4544} {"train_loss": -7.24785041809082, "global_step": 190865, "epoch": 4544} {"train_loss": -7.0241169929504395, "global_step": 190866, "epoch": 4544} {"train_loss": -7.067378044128418, "global_step": 190867, "epoch": 4544} {"train_loss": -7.18055534362793, "global_step": 190868, "epoch": 4544} {"train_loss": -7.160126686096191, "global_step": 190869, "epoch": 4544} {"train_loss": -7.153591632843018, "global_step": 190870, "epoch": 4544} {"train_loss": -7.19957160949707, "global_step": 190871, "epoch": 4544} {"train_loss": -7.108806610107422, "global_step": 190872, "epoch": 4544} {"train_loss": -7.229995250701904, "global_step": 190873, "epoch": 4544} {"train_loss": -7.319250106811523, "global_step": 190874, "epoch": 4544} {"train_loss": -7.268356800079346, "global_step": 190875, "epoch": 4544} {"train_loss": -7.184832572937012, "global_step": 190876, "epoch": 4544} {"train_loss": -7.330345630645752, "global_step": 190877, "epoch": 4544} {"train_loss": -7.093761920928955, "global_step": 190878, "epoch": 4544} {"train_loss": -7.167041778564453, "global_step": 190879, "epoch": 4544} {"train_loss": -7.154205322265625, "global_step": 190880, "epoch": 4544} {"train_loss": -7.231726169586182, "global_step": 190881, "epoch": 4544} {"train_loss": -7.196855545043945, "global_step": 190882, "epoch": 4544} {"train_loss": -7.194827556610107, "global_step": 190883, "epoch": 4544} {"train_loss": -7.122722625732422, "global_step": 190884, "epoch": 4544} {"train_loss": -7.169368743896484, "global_step": 190885, "epoch": 4544} {"train_loss": -7.276577472686768, "global_step": 190886, "epoch": 4544} {"train_loss": -7.213895797729492, "global_step": 190887, "epoch": 4544} {"train_loss": -7.11884880065918, "global_step": 190888, "epoch": 4544} {"train_loss": -7.173516091846285, "global_step": 190889, "epoch": 4544, "val_loss": 68988.015625} {"train_loss": -7.260499000549316, "global_step": 190890, "epoch": 4545} {"train_loss": -7.223067283630371, "global_step": 190891, "epoch": 4545} {"train_loss": -7.111635208129883, "global_step": 190892, "epoch": 4545} {"train_loss": -7.147580146789551, "global_step": 190893, "epoch": 4545} {"train_loss": -7.157848834991455, "global_step": 190894, "epoch": 4545} {"train_loss": -7.228231430053711, "global_step": 190895, "epoch": 4545} {"train_loss": -7.012688636779785, "global_step": 190896, "epoch": 4545} {"train_loss": -7.203083038330078, "global_step": 190897, "epoch": 4545} {"train_loss": -7.15786600112915, "global_step": 190898, "epoch": 4545} {"train_loss": -7.2050299644470215, "global_step": 190899, "epoch": 4545} {"train_loss": -7.1263861656188965, "global_step": 190900, "epoch": 4545} {"train_loss": -7.160664081573486, "global_step": 190901, "epoch": 4545} {"train_loss": -7.170589447021484, "global_step": 190902, "epoch": 4545} {"train_loss": -7.125820636749268, "global_step": 190903, "epoch": 4545} {"train_loss": -7.15287446975708, "global_step": 190904, "epoch": 4545} {"train_loss": -7.090489387512207, "global_step": 190905, "epoch": 4545} {"train_loss": -7.098670959472656, "global_step": 190906, "epoch": 4545} {"train_loss": -7.035958766937256, "global_step": 190907, "epoch": 4545} {"train_loss": -7.012146949768066, "global_step": 190908, "epoch": 4545} {"train_loss": -7.136281967163086, "global_step": 190909, "epoch": 4545} {"train_loss": -7.029473304748535, "global_step": 190910, "epoch": 4545} {"train_loss": -7.074493885040283, "global_step": 190911, "epoch": 4545} {"train_loss": -7.092595100402832, "global_step": 190912, "epoch": 4545} {"train_loss": -6.849936008453369, "global_step": 190913, "epoch": 4545} {"train_loss": -6.9947428703308105, "global_step": 190914, "epoch": 4545} {"train_loss": -7.038625717163086, "global_step": 190915, "epoch": 4545} {"train_loss": -7.127159595489502, "global_step": 190916, "epoch": 4545} {"train_loss": -7.073116302490234, "global_step": 190917, "epoch": 4545} {"train_loss": -7.058568000793457, "global_step": 190918, "epoch": 4545} {"train_loss": -7.068921089172363, "global_step": 190919, "epoch": 4545} {"train_loss": -7.055231094360352, "global_step": 190920, "epoch": 4545} {"train_loss": -7.1422576904296875, "global_step": 190921, "epoch": 4545} {"train_loss": -7.037631034851074, "global_step": 190922, "epoch": 4545} {"train_loss": -7.152458667755127, "global_step": 190923, "epoch": 4545} {"train_loss": -7.242276191711426, "global_step": 190924, "epoch": 4545} {"train_loss": -7.186326503753662, "global_step": 190925, "epoch": 4545} {"train_loss": -7.133864879608154, "global_step": 190926, "epoch": 4545} {"train_loss": -7.166090965270996, "global_step": 190927, "epoch": 4545} {"train_loss": -7.102551460266113, "global_step": 190928, "epoch": 4545} {"train_loss": -7.1769022941589355, "global_step": 190929, "epoch": 4545} {"train_loss": -7.1373443603515625, "global_step": 190930, "epoch": 4545} {"train_loss": -7.116561549050467, "global_step": 190931, "epoch": 4545, "val_loss": 68997.7578125} {"train_loss": -7.211518287658691, "global_step": 190932, "epoch": 4546} {"train_loss": -7.259221076965332, "global_step": 190933, "epoch": 4546} {"train_loss": -7.221822261810303, "global_step": 190934, "epoch": 4546} {"train_loss": -7.282972812652588, "global_step": 190935, "epoch": 4546} {"train_loss": -7.272344589233398, "global_step": 190936, "epoch": 4546} {"train_loss": -7.252659797668457, "global_step": 190937, "epoch": 4546} {"train_loss": -7.259469985961914, "global_step": 190938, "epoch": 4546} {"train_loss": -7.211025238037109, "global_step": 190939, "epoch": 4546} {"train_loss": -7.236627578735352, "global_step": 190940, "epoch": 4546} {"train_loss": -7.23973274230957, "global_step": 190941, "epoch": 4546} {"train_loss": -7.230597496032715, "global_step": 190942, "epoch": 4546} {"train_loss": -7.169025421142578, "global_step": 190943, "epoch": 4546} {"train_loss": -7.184128284454346, "global_step": 190944, "epoch": 4546} {"train_loss": -7.201874256134033, "global_step": 190945, "epoch": 4546} {"train_loss": -7.297947406768799, "global_step": 190946, "epoch": 4546} {"train_loss": -7.249053001403809, "global_step": 190947, "epoch": 4546} {"train_loss": -7.180312156677246, "global_step": 190948, "epoch": 4546} {"train_loss": -7.15542459487915, "global_step": 190949, "epoch": 4546} {"train_loss": -7.044408798217773, "global_step": 190950, "epoch": 4546} {"train_loss": -7.079135417938232, "global_step": 190951, "epoch": 4546} {"train_loss": -7.171396255493164, "global_step": 190952, "epoch": 4546} {"train_loss": -7.16232967376709, "global_step": 190953, "epoch": 4546} {"train_loss": -6.976972579956055, "global_step": 190954, "epoch": 4546} {"train_loss": -7.208393096923828, "global_step": 190955, "epoch": 4546} {"train_loss": -7.0991926193237305, "global_step": 190956, "epoch": 4546} {"train_loss": -7.163671970367432, "global_step": 190957, "epoch": 4546} {"train_loss": -7.165439128875732, "global_step": 190958, "epoch": 4546} {"train_loss": -6.9550981521606445, "global_step": 190959, "epoch": 4546} {"train_loss": -7.113796234130859, "global_step": 190960, "epoch": 4546} {"train_loss": -7.035262584686279, "global_step": 190961, "epoch": 4546} {"train_loss": -7.046738147735596, "global_step": 190962, "epoch": 4546} {"train_loss": -7.196915626525879, "global_step": 190963, "epoch": 4546} {"train_loss": -7.241225242614746, "global_step": 190964, "epoch": 4546} {"train_loss": -7.10964298248291, "global_step": 190965, "epoch": 4546} {"train_loss": -7.2200236320495605, "global_step": 190966, "epoch": 4546} {"train_loss": -7.135541915893555, "global_step": 190967, "epoch": 4546} {"train_loss": -7.169817924499512, "global_step": 190968, "epoch": 4546} {"train_loss": -7.219367027282715, "global_step": 190969, "epoch": 4546} {"train_loss": -7.242866516113281, "global_step": 190970, "epoch": 4546} {"train_loss": -7.194986343383789, "global_step": 190971, "epoch": 4546} {"train_loss": -7.257801055908203, "global_step": 190972, "epoch": 4546} {"train_loss": -7.179912589845204, "global_step": 190973, "epoch": 4546, "val_loss": 68951.1484375} {"train_loss": -7.309060096740723, "global_step": 190974, "epoch": 4547} {"train_loss": -7.307492256164551, "global_step": 190975, "epoch": 4547} {"train_loss": -7.221059799194336, "global_step": 190976, "epoch": 4547} {"train_loss": -7.202520370483398, "global_step": 190977, "epoch": 4547} {"train_loss": -7.183469295501709, "global_step": 190978, "epoch": 4547} {"train_loss": -7.265542030334473, "global_step": 190979, "epoch": 4547} {"train_loss": -7.163567066192627, "global_step": 190980, "epoch": 4547} {"train_loss": -7.255003929138184, "global_step": 190981, "epoch": 4547} {"train_loss": -7.186440467834473, "global_step": 190982, "epoch": 4547} {"train_loss": -7.204464912414551, "global_step": 190983, "epoch": 4547} {"train_loss": -7.191944122314453, "global_step": 190984, "epoch": 4547} {"train_loss": -7.052651405334473, "global_step": 190985, "epoch": 4547} {"train_loss": -7.184391021728516, "global_step": 190986, "epoch": 4547} {"train_loss": -7.098988056182861, "global_step": 190987, "epoch": 4547} {"train_loss": -7.111588954925537, "global_step": 190988, "epoch": 4547} {"train_loss": -7.2032976150512695, "global_step": 190989, "epoch": 4547} {"train_loss": -7.180922508239746, "global_step": 190990, "epoch": 4547} {"train_loss": -7.07168436050415, "global_step": 190991, "epoch": 4547} {"train_loss": -7.145443439483643, "global_step": 190992, "epoch": 4547} {"train_loss": -7.044002532958984, "global_step": 190993, "epoch": 4547} {"train_loss": -7.0392255783081055, "global_step": 190994, "epoch": 4547} {"train_loss": -7.183371067047119, "global_step": 190995, "epoch": 4547} {"train_loss": -7.1105499267578125, "global_step": 190996, "epoch": 4547} {"train_loss": -7.188603401184082, "global_step": 190997, "epoch": 4547} {"train_loss": -7.023542404174805, "global_step": 190998, "epoch": 4547} {"train_loss": -7.110175132751465, "global_step": 190999, "epoch": 4547} {"train_loss": -7.078367233276367, "global_step": 191000, "epoch": 4547} {"train_loss": -7.011404037475586, "global_step": 191001, "epoch": 4547} {"train_loss": -7.1898908615112305, "global_step": 191002, "epoch": 4547} {"train_loss": -7.002541542053223, "global_step": 191003, "epoch": 4547} {"train_loss": -7.026749134063721, "global_step": 191004, "epoch": 4547} {"train_loss": -7.078899383544922, "global_step": 191005, "epoch": 4547} {"train_loss": -6.993614673614502, "global_step": 191006, "epoch": 4547} {"train_loss": -7.1217122077941895, "global_step": 191007, "epoch": 4547} {"train_loss": -7.1060967445373535, "global_step": 191008, "epoch": 4547} {"train_loss": -7.04156494140625, "global_step": 191009, "epoch": 4547} {"train_loss": -7.199455738067627, "global_step": 191010, "epoch": 4547} {"train_loss": -7.166469573974609, "global_step": 191011, "epoch": 4547} {"train_loss": -7.068363189697266, "global_step": 191012, "epoch": 4547} {"train_loss": -7.147365570068359, "global_step": 191013, "epoch": 4547} {"train_loss": -7.065476417541504, "global_step": 191014, "epoch": 4547} {"train_loss": -7.134698266074771, "global_step": 191015, "epoch": 4547, "val_loss": 68974.6875} {"train_loss": -7.088345527648926, "global_step": 191016, "epoch": 4548} {"train_loss": -7.115474700927734, "global_step": 191017, "epoch": 4548} {"train_loss": -7.172168254852295, "global_step": 191018, "epoch": 4548} {"train_loss": -7.035289287567139, "global_step": 191019, "epoch": 4548} {"train_loss": -7.215996265411377, "global_step": 191020, "epoch": 4548} {"train_loss": -7.148958683013916, "global_step": 191021, "epoch": 4548} {"train_loss": -7.217041969299316, "global_step": 191022, "epoch": 4548} {"train_loss": -7.138005256652832, "global_step": 191023, "epoch": 4548} {"train_loss": -7.084063529968262, "global_step": 191024, "epoch": 4548} {"train_loss": -7.052679538726807, "global_step": 191025, "epoch": 4548} {"train_loss": -7.064422607421875, "global_step": 191026, "epoch": 4548} {"train_loss": -7.154544353485107, "global_step": 191027, "epoch": 4548} {"train_loss": -7.12358283996582, "global_step": 191028, "epoch": 4548} {"train_loss": -7.091984748840332, "global_step": 191029, "epoch": 4548} {"train_loss": -7.140389442443848, "global_step": 191030, "epoch": 4548} {"train_loss": -6.982304096221924, "global_step": 191031, "epoch": 4548} {"train_loss": -7.09920072555542, "global_step": 191032, "epoch": 4548} {"train_loss": -7.043735504150391, "global_step": 191033, "epoch": 4548} {"train_loss": -7.1021728515625, "global_step": 191034, "epoch": 4548} {"train_loss": -7.042104721069336, "global_step": 191035, "epoch": 4548} {"train_loss": -6.961355686187744, "global_step": 191036, "epoch": 4548} {"train_loss": -7.067806243896484, "global_step": 191037, "epoch": 4548} {"train_loss": -7.026983261108398, "global_step": 191038, "epoch": 4548} {"train_loss": -7.030882358551025, "global_step": 191039, "epoch": 4548} {"train_loss": -7.028219699859619, "global_step": 191040, "epoch": 4548} {"train_loss": -7.089025497436523, "global_step": 191041, "epoch": 4548} {"train_loss": -7.005876541137695, "global_step": 191042, "epoch": 4548} {"train_loss": -7.082602500915527, "global_step": 191043, "epoch": 4548} {"train_loss": -7.037618637084961, "global_step": 191044, "epoch": 4548} {"train_loss": -7.135008335113525, "global_step": 191045, "epoch": 4548} {"train_loss": -7.069314002990723, "global_step": 191046, "epoch": 4548} {"train_loss": -7.089949607849121, "global_step": 191047, "epoch": 4548} {"train_loss": -7.0924553871154785, "global_step": 191048, "epoch": 4548} {"train_loss": -7.04599666595459, "global_step": 191049, "epoch": 4548} {"train_loss": -7.065702438354492, "global_step": 191050, "epoch": 4548} {"train_loss": -7.071284294128418, "global_step": 191051, "epoch": 4548} {"train_loss": -7.194578170776367, "global_step": 191052, "epoch": 4548} {"train_loss": -7.084473609924316, "global_step": 191053, "epoch": 4548} {"train_loss": -7.236970901489258, "global_step": 191054, "epoch": 4548} {"train_loss": -7.150634765625, "global_step": 191055, "epoch": 4548} {"train_loss": -7.217577934265137, "global_step": 191056, "epoch": 4548} {"train_loss": -7.096553393772671, "global_step": 191057, "epoch": 4548, "val_loss": 68865.375} {"train_loss": -7.0812883377075195, "global_step": 191058, "epoch": 4549} {"train_loss": -7.090679168701172, "global_step": 191059, "epoch": 4549} {"train_loss": -7.175004959106445, "global_step": 191060, "epoch": 4549} {"train_loss": -7.168518543243408, "global_step": 191061, "epoch": 4549} {"train_loss": -7.13039493560791, "global_step": 191062, "epoch": 4549} {"train_loss": -7.155911445617676, "global_step": 191063, "epoch": 4549} {"train_loss": -7.189475059509277, "global_step": 191064, "epoch": 4549} {"train_loss": -7.24085807800293, "global_step": 191065, "epoch": 4549} {"train_loss": -7.230362415313721, "global_step": 191066, "epoch": 4549} {"train_loss": -7.194068908691406, "global_step": 191067, "epoch": 4549} {"train_loss": -7.058773994445801, "global_step": 191068, "epoch": 4549} {"train_loss": -7.14227294921875, "global_step": 191069, "epoch": 4549} {"train_loss": -7.093816757202148, "global_step": 191070, "epoch": 4549} {"train_loss": -7.1286797523498535, "global_step": 191071, "epoch": 4549} {"train_loss": -7.115108489990234, "global_step": 191072, "epoch": 4549} {"train_loss": -7.0225372314453125, "global_step": 191073, "epoch": 4549} {"train_loss": -7.15981912612915, "global_step": 191074, "epoch": 4549} {"train_loss": -7.157268524169922, "global_step": 191075, "epoch": 4549} {"train_loss": -7.048537254333496, "global_step": 191076, "epoch": 4549} {"train_loss": -7.141265869140625, "global_step": 191077, "epoch": 4549} {"train_loss": -7.111874580383301, "global_step": 191078, "epoch": 4549} {"train_loss": -7.070614814758301, "global_step": 191079, "epoch": 4549} {"train_loss": -7.13205623626709, "global_step": 191080, "epoch": 4549} {"train_loss": -7.090141296386719, "global_step": 191081, "epoch": 4549} {"train_loss": -7.083734035491943, "global_step": 191082, "epoch": 4549} {"train_loss": -7.102239608764648, "global_step": 191083, "epoch": 4549} {"train_loss": -7.074023246765137, "global_step": 191084, "epoch": 4549} {"train_loss": -6.988156318664551, "global_step": 191085, "epoch": 4549} {"train_loss": -6.951751708984375, "global_step": 191086, "epoch": 4549} {"train_loss": -7.106666564941406, "global_step": 191087, "epoch": 4549} {"train_loss": -7.032204627990723, "global_step": 191088, "epoch": 4549} {"train_loss": -7.170792102813721, "global_step": 191089, "epoch": 4549} {"train_loss": -7.014747619628906, "global_step": 191090, "epoch": 4549} {"train_loss": -7.021506309509277, "global_step": 191091, "epoch": 4549} {"train_loss": -7.061734199523926, "global_step": 191092, "epoch": 4549} {"train_loss": -7.022258758544922, "global_step": 191093, "epoch": 4549} {"train_loss": -7.083777904510498, "global_step": 191094, "epoch": 4549} {"train_loss": -7.133516788482666, "global_step": 191095, "epoch": 4549} {"train_loss": -7.127432346343994, "global_step": 191096, "epoch": 4549} {"train_loss": -7.105682373046875, "global_step": 191097, "epoch": 4549} {"train_loss": -7.172696113586426, "global_step": 191098, "epoch": 4549} {"train_loss": -7.104664859317598, "global_step": 191099, "epoch": 4549, "val_loss": 68912.6640625} {"train_loss": -7.141141891479492, "global_step": 191100, "epoch": 4550} {"train_loss": -7.028107643127441, "global_step": 191101, "epoch": 4550} {"train_loss": -7.271024703979492, "global_step": 191102, "epoch": 4550} {"train_loss": -7.1067304611206055, "global_step": 191103, "epoch": 4550} {"train_loss": -7.091139793395996, "global_step": 191104, "epoch": 4550} {"train_loss": -7.205832481384277, "global_step": 191105, "epoch": 4550} {"train_loss": -7.160093784332275, "global_step": 191106, "epoch": 4550} {"train_loss": -7.109103202819824, "global_step": 191107, "epoch": 4550} {"train_loss": -7.277660369873047, "global_step": 191108, "epoch": 4550} {"train_loss": -7.170706748962402, "global_step": 191109, "epoch": 4550} {"train_loss": -7.183940887451172, "global_step": 191110, "epoch": 4550} {"train_loss": -7.179416656494141, "global_step": 191111, "epoch": 4550} {"train_loss": -7.184976577758789, "global_step": 191112, "epoch": 4550} {"train_loss": -7.256274700164795, "global_step": 191113, "epoch": 4550} {"train_loss": -7.195383548736572, "global_step": 191114, "epoch": 4550} {"train_loss": -7.225103855133057, "global_step": 191115, "epoch": 4550} {"train_loss": -7.203210830688477, "global_step": 191116, "epoch": 4550} {"train_loss": -7.256669521331787, "global_step": 191117, "epoch": 4550} {"train_loss": -7.244110107421875, "global_step": 191118, "epoch": 4550} {"train_loss": -7.262598991394043, "global_step": 191119, "epoch": 4550} {"train_loss": -7.226991653442383, "global_step": 191120, "epoch": 4550} {"train_loss": -7.206526756286621, "global_step": 191121, "epoch": 4550} {"train_loss": -7.252932548522949, "global_step": 191122, "epoch": 4550} {"train_loss": -7.150646686553955, "global_step": 191123, "epoch": 4550} {"train_loss": -7.246921539306641, "global_step": 191124, "epoch": 4550} {"train_loss": -7.1526899337768555, "global_step": 191125, "epoch": 4550} {"train_loss": -7.2588629722595215, "global_step": 191126, "epoch": 4550} {"train_loss": -7.251676559448242, "global_step": 191127, "epoch": 4550} {"train_loss": -7.237339973449707, "global_step": 191128, "epoch": 4550} {"train_loss": -7.20747184753418, "global_step": 191129, "epoch": 4550} {"train_loss": -7.172999382019043, "global_step": 191130, "epoch": 4550} {"train_loss": -7.196603775024414, "global_step": 191131, "epoch": 4550} {"train_loss": -7.119756698608398, "global_step": 191132, "epoch": 4550} {"train_loss": -7.063672065734863, "global_step": 191133, "epoch": 4550} {"train_loss": -7.186009407043457, "global_step": 191134, "epoch": 4550} {"train_loss": -7.14410400390625, "global_step": 191135, "epoch": 4550} {"train_loss": -7.180630683898926, "global_step": 191136, "epoch": 4550} {"train_loss": -7.021197319030762, "global_step": 191137, "epoch": 4550} {"train_loss": -7.05887508392334, "global_step": 191138, "epoch": 4550} {"train_loss": -7.150327682495117, "global_step": 191139, "epoch": 4550} {"train_loss": -7.181312561035156, "global_step": 191140, "epoch": 4550} {"train_loss": -7.178476730982463, "global_step": 191141, "epoch": 4550, "train/sim_max_reward_0": 0.34177912303698416, "train/sim_max_reward_1": 0.9931903979365135, "train/sim_max_reward_2": 0.8280051886535336, "train/sim_max_reward_3": 0.13299659992476529, "train/sim_max_reward_4": 0.42635997390691577, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.20444408430961256, "test/sim_max_reward_4400001": 0.651074140742807, "test/sim_max_reward_4400002": 0.5162697075549778, "test/sim_max_reward_4400003": 0.8429808978334572, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.8040954302822666, "test/sim_max_reward_4400006": 0.9926224696425653, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3130037714423308, "test/sim_max_reward_4400009": 0.9400154027382666, "test/sim_max_reward_4400010": 0.958163951986781, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.7521809671116939, "test/sim_max_reward_4400015": 0.09808069710624799, "test/sim_max_reward_4400016": 0.9306406477196328, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2498075580681001, "test/sim_max_reward_4400019": 0.0770017382594396, "test/sim_max_reward_4400020": 0.9346137475381326, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8999017598904742, "test/sim_max_reward_4400023": 0.1712513630696157, "test/sim_max_reward_4400024": 0.41074764379648443, "test/sim_max_reward_4400025": 0.2658271562219833, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.018958858608718866, "test/sim_max_reward_4400028": 0.3995812265320436, "test/sim_max_reward_4400029": 0.5519026587864921, "test/sim_max_reward_4400030": 0.9814044351256346, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 0.9541773331759639, "test/sim_max_reward_4400035": 0.9619279137815533, "test/sim_max_reward_4400036": 0.572123131371043, "test/sim_max_reward_4400037": 0.9605245722179191, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9709604281676583, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9339470044485241, "test/sim_max_reward_4400042": 0.5367464090467542, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.9201183167146497, "test/sim_max_reward_4400047": 0.923328423285604, "test/sim_max_reward_4400048": 0.980882700210443, "test/sim_max_reward_4400049": 0.9580560553566059, "train/mean_score": 0.6203885472431186, "test/mean_score": 0.6236711516535075, "val_loss": 68974.546875} {"train_loss": -6.967559814453125, "global_step": 191142, "epoch": 4551} {"train_loss": -7.041385650634766, "global_step": 191143, "epoch": 4551} {"train_loss": -7.132541179656982, "global_step": 191144, "epoch": 4551} {"train_loss": -7.095393180847168, "global_step": 191145, "epoch": 4551} {"train_loss": -7.04862117767334, "global_step": 191146, "epoch": 4551} {"train_loss": -7.05564022064209, "global_step": 191147, "epoch": 4551} {"train_loss": -7.026697635650635, "global_step": 191148, "epoch": 4551} {"train_loss": -7.104608535766602, "global_step": 191149, "epoch": 4551} {"train_loss": -7.0693559646606445, "global_step": 191150, "epoch": 4551} {"train_loss": -7.024479866027832, "global_step": 191151, "epoch": 4551} {"train_loss": -7.2110114097595215, "global_step": 191152, "epoch": 4551} {"train_loss": -6.981950283050537, "global_step": 191153, "epoch": 4551} {"train_loss": -7.140281677246094, "global_step": 191154, "epoch": 4551} {"train_loss": -7.159628868103027, "global_step": 191155, "epoch": 4551} {"train_loss": -7.07492208480835, "global_step": 191156, "epoch": 4551} {"train_loss": -7.095132350921631, "global_step": 191157, "epoch": 4551} {"train_loss": -7.11769962310791, "global_step": 191158, "epoch": 4551} {"train_loss": -7.177715301513672, "global_step": 191159, "epoch": 4551} {"train_loss": -7.144518852233887, "global_step": 191160, "epoch": 4551} {"train_loss": -7.111840724945068, "global_step": 191161, "epoch": 4551} {"train_loss": -7.0909013748168945, "global_step": 191162, "epoch": 4551} {"train_loss": -7.02537727355957, "global_step": 191163, "epoch": 4551} {"train_loss": -7.198680877685547, "global_step": 191164, "epoch": 4551} {"train_loss": -7.166465759277344, "global_step": 191165, "epoch": 4551} {"train_loss": -7.164973735809326, "global_step": 191166, "epoch": 4551} {"train_loss": -7.1328959465026855, "global_step": 191167, "epoch": 4551} {"train_loss": -7.119662284851074, "global_step": 191168, "epoch": 4551} {"train_loss": -7.101866245269775, "global_step": 191169, "epoch": 4551} {"train_loss": -7.129622936248779, "global_step": 191170, "epoch": 4551} {"train_loss": -7.134960651397705, "global_step": 191171, "epoch": 4551} {"train_loss": -7.044431686401367, "global_step": 191172, "epoch": 4551} {"train_loss": -7.066496849060059, "global_step": 191173, "epoch": 4551} {"train_loss": -7.18587589263916, "global_step": 191174, "epoch": 4551} {"train_loss": -7.06318998336792, "global_step": 191175, "epoch": 4551} {"train_loss": -7.054615497589111, "global_step": 191176, "epoch": 4551} {"train_loss": -7.162889003753662, "global_step": 191177, "epoch": 4551} {"train_loss": -7.15371561050415, "global_step": 191178, "epoch": 4551} {"train_loss": -7.205460548400879, "global_step": 191179, "epoch": 4551} {"train_loss": -7.113297462463379, "global_step": 191180, "epoch": 4551} {"train_loss": -7.11846923828125, "global_step": 191181, "epoch": 4551} {"train_loss": -7.141946315765381, "global_step": 191182, "epoch": 4551} {"train_loss": -7.106017532802763, "global_step": 191183, "epoch": 4551, "val_loss": 69015.78125} {"train_loss": -7.17879581451416, "global_step": 191184, "epoch": 4552} {"train_loss": -7.228129863739014, "global_step": 191185, "epoch": 4552} {"train_loss": -7.21165657043457, "global_step": 191186, "epoch": 4552} {"train_loss": -7.111043930053711, "global_step": 191187, "epoch": 4552} {"train_loss": -7.10788631439209, "global_step": 191188, "epoch": 4552} {"train_loss": -7.064998626708984, "global_step": 191189, "epoch": 4552} {"train_loss": -7.1351165771484375, "global_step": 191190, "epoch": 4552} {"train_loss": -7.154736042022705, "global_step": 191191, "epoch": 4552} {"train_loss": -7.129816055297852, "global_step": 191192, "epoch": 4552} {"train_loss": -7.1247382164001465, "global_step": 191193, "epoch": 4552} {"train_loss": -7.179086685180664, "global_step": 191194, "epoch": 4552} {"train_loss": -7.226871967315674, "global_step": 191195, "epoch": 4552} {"train_loss": -7.154560089111328, "global_step": 191196, "epoch": 4552} {"train_loss": -7.1042327880859375, "global_step": 191197, "epoch": 4552} {"train_loss": -7.046313285827637, "global_step": 191198, "epoch": 4552} {"train_loss": -7.173321723937988, "global_step": 191199, "epoch": 4552} {"train_loss": -7.1328301429748535, "global_step": 191200, "epoch": 4552} {"train_loss": -7.16668176651001, "global_step": 191201, "epoch": 4552} {"train_loss": -7.230316162109375, "global_step": 191202, "epoch": 4552} {"train_loss": -7.149630546569824, "global_step": 191203, "epoch": 4552} {"train_loss": -7.180414199829102, "global_step": 191204, "epoch": 4552} {"train_loss": -7.144119739532471, "global_step": 191205, "epoch": 4552} {"train_loss": -7.21563720703125, "global_step": 191206, "epoch": 4552} {"train_loss": -7.079599857330322, "global_step": 191207, "epoch": 4552} {"train_loss": -7.107767581939697, "global_step": 191208, "epoch": 4552} {"train_loss": -7.0719499588012695, "global_step": 191209, "epoch": 4552} {"train_loss": -7.20322322845459, "global_step": 191210, "epoch": 4552} {"train_loss": -7.213662624359131, "global_step": 191211, "epoch": 4552} {"train_loss": -7.185716152191162, "global_step": 191212, "epoch": 4552} {"train_loss": -7.103604316711426, "global_step": 191213, "epoch": 4552} {"train_loss": -7.114498138427734, "global_step": 191214, "epoch": 4552} {"train_loss": -7.186197757720947, "global_step": 191215, "epoch": 4552} {"train_loss": -7.224282264709473, "global_step": 191216, "epoch": 4552} {"train_loss": -7.179981231689453, "global_step": 191217, "epoch": 4552} {"train_loss": -7.219389915466309, "global_step": 191218, "epoch": 4552} {"train_loss": -6.987867832183838, "global_step": 191219, "epoch": 4552} {"train_loss": -7.180427074432373, "global_step": 191220, "epoch": 4552} {"train_loss": -7.0524187088012695, "global_step": 191221, "epoch": 4552} {"train_loss": -7.142978668212891, "global_step": 191222, "epoch": 4552} {"train_loss": -7.18717098236084, "global_step": 191223, "epoch": 4552} {"train_loss": -7.202299118041992, "global_step": 191224, "epoch": 4552} {"train_loss": -7.15005856468564, "global_step": 191225, "epoch": 4552, "val_loss": 69013.4375} {"train_loss": -7.219853401184082, "global_step": 191226, "epoch": 4553} {"train_loss": -7.175772666931152, "global_step": 191227, "epoch": 4553} {"train_loss": -7.196243762969971, "global_step": 191228, "epoch": 4553} {"train_loss": -7.194020748138428, "global_step": 191229, "epoch": 4553} {"train_loss": -7.221968650817871, "global_step": 191230, "epoch": 4553} {"train_loss": -7.174536228179932, "global_step": 191231, "epoch": 4553} {"train_loss": -7.163668155670166, "global_step": 191232, "epoch": 4553} {"train_loss": -7.168901443481445, "global_step": 191233, "epoch": 4553} {"train_loss": -7.2096333503723145, "global_step": 191234, "epoch": 4553} {"train_loss": -7.181851863861084, "global_step": 191235, "epoch": 4553} {"train_loss": -7.151724338531494, "global_step": 191236, "epoch": 4553} {"train_loss": -7.093181133270264, "global_step": 191237, "epoch": 4553} {"train_loss": -7.316034317016602, "global_step": 191238, "epoch": 4553} {"train_loss": -7.207028865814209, "global_step": 191239, "epoch": 4553} {"train_loss": -7.153725624084473, "global_step": 191240, "epoch": 4553} {"train_loss": -7.232824325561523, "global_step": 191241, "epoch": 4553} {"train_loss": -7.1497907638549805, "global_step": 191242, "epoch": 4553} {"train_loss": -7.325748443603516, "global_step": 191243, "epoch": 4553} {"train_loss": -7.152067184448242, "global_step": 191244, "epoch": 4553} {"train_loss": -7.206890106201172, "global_step": 191245, "epoch": 4553} {"train_loss": -7.108652114868164, "global_step": 191246, "epoch": 4553} {"train_loss": -7.107913494110107, "global_step": 191247, "epoch": 4553} {"train_loss": -7.270625114440918, "global_step": 191248, "epoch": 4553} {"train_loss": -7.179143905639648, "global_step": 191249, "epoch": 4553} {"train_loss": -7.270505905151367, "global_step": 191250, "epoch": 4553} {"train_loss": -7.201435089111328, "global_step": 191251, "epoch": 4553} {"train_loss": -7.2206926345825195, "global_step": 191252, "epoch": 4553} {"train_loss": -7.230717658996582, "global_step": 191253, "epoch": 4553} {"train_loss": -7.166228771209717, "global_step": 191254, "epoch": 4553} {"train_loss": -7.305826187133789, "global_step": 191255, "epoch": 4553} {"train_loss": -7.204390525817871, "global_step": 191256, "epoch": 4553} {"train_loss": -7.2167463302612305, "global_step": 191257, "epoch": 4553} {"train_loss": -7.119389533996582, "global_step": 191258, "epoch": 4553} {"train_loss": -7.2059407234191895, "global_step": 191259, "epoch": 4553} {"train_loss": -7.153164863586426, "global_step": 191260, "epoch": 4553} {"train_loss": -7.23817253112793, "global_step": 191261, "epoch": 4553} {"train_loss": -7.201470851898193, "global_step": 191262, "epoch": 4553} {"train_loss": -7.247313499450684, "global_step": 191263, "epoch": 4553} {"train_loss": -7.088825225830078, "global_step": 191264, "epoch": 4553} {"train_loss": -7.169795513153076, "global_step": 191265, "epoch": 4553} {"train_loss": -7.176673889160156, "global_step": 191266, "epoch": 4553} {"train_loss": -7.1955695719946, "global_step": 191267, "epoch": 4553, "val_loss": 69091.125} {"train_loss": -7.06895637512207, "global_step": 191268, "epoch": 4554} {"train_loss": -7.303050994873047, "global_step": 191269, "epoch": 4554} {"train_loss": -7.1006317138671875, "global_step": 191270, "epoch": 4554} {"train_loss": -6.992029666900635, "global_step": 191271, "epoch": 4554} {"train_loss": -7.217510223388672, "global_step": 191272, "epoch": 4554} {"train_loss": -7.038815498352051, "global_step": 191273, "epoch": 4554} {"train_loss": -7.115109920501709, "global_step": 191274, "epoch": 4554} {"train_loss": -7.165017127990723, "global_step": 191275, "epoch": 4554} {"train_loss": -7.095861434936523, "global_step": 191276, "epoch": 4554} {"train_loss": -7.009047508239746, "global_step": 191277, "epoch": 4554} {"train_loss": -7.169620513916016, "global_step": 191278, "epoch": 4554} {"train_loss": -7.107280731201172, "global_step": 191279, "epoch": 4554} {"train_loss": -7.092031478881836, "global_step": 191280, "epoch": 4554} {"train_loss": -7.170253753662109, "global_step": 191281, "epoch": 4554} {"train_loss": -6.997682571411133, "global_step": 191282, "epoch": 4554} {"train_loss": -6.989703178405762, "global_step": 191283, "epoch": 4554} {"train_loss": -7.0581817626953125, "global_step": 191284, "epoch": 4554} {"train_loss": -7.0430192947387695, "global_step": 191285, "epoch": 4554} {"train_loss": -6.940273284912109, "global_step": 191286, "epoch": 4554} {"train_loss": -7.073507785797119, "global_step": 191287, "epoch": 4554} {"train_loss": -7.050462245941162, "global_step": 191288, "epoch": 4554} {"train_loss": -6.958744049072266, "global_step": 191289, "epoch": 4554} {"train_loss": -7.116400718688965, "global_step": 191290, "epoch": 4554} {"train_loss": -7.050015449523926, "global_step": 191291, "epoch": 4554} {"train_loss": -7.163188457489014, "global_step": 191292, "epoch": 4554} {"train_loss": -7.01918888092041, "global_step": 191293, "epoch": 4554} {"train_loss": -7.058780670166016, "global_step": 191294, "epoch": 4554} {"train_loss": -7.155632972717285, "global_step": 191295, "epoch": 4554} {"train_loss": -7.102041244506836, "global_step": 191296, "epoch": 4554} {"train_loss": -7.215442657470703, "global_step": 191297, "epoch": 4554} {"train_loss": -7.24794864654541, "global_step": 191298, "epoch": 4554} {"train_loss": -7.260125160217285, "global_step": 191299, "epoch": 4554} {"train_loss": -7.206167221069336, "global_step": 191300, "epoch": 4554} {"train_loss": -7.181200981140137, "global_step": 191301, "epoch": 4554} {"train_loss": -7.207659721374512, "global_step": 191302, "epoch": 4554} {"train_loss": -7.204094886779785, "global_step": 191303, "epoch": 4554} {"train_loss": -7.122368812561035, "global_step": 191304, "epoch": 4554} {"train_loss": -7.203432559967041, "global_step": 191305, "epoch": 4554} {"train_loss": -7.135558128356934, "global_step": 191306, "epoch": 4554} {"train_loss": -7.2099127769470215, "global_step": 191307, "epoch": 4554} {"train_loss": -7.175264358520508, "global_step": 191308, "epoch": 4554} {"train_loss": -7.119135436557588, "global_step": 191309, "epoch": 4554, "val_loss": 68889.9609375} {"train_loss": -7.1632537841796875, "global_step": 191310, "epoch": 4555} {"train_loss": -7.192440986633301, "global_step": 191311, "epoch": 4555} {"train_loss": -7.311835289001465, "global_step": 191312, "epoch": 4555} {"train_loss": -7.243897438049316, "global_step": 191313, "epoch": 4555} {"train_loss": -7.168637275695801, "global_step": 191314, "epoch": 4555} {"train_loss": -7.156834602355957, "global_step": 191315, "epoch": 4555} {"train_loss": -7.277884006500244, "global_step": 191316, "epoch": 4555} {"train_loss": -7.256969451904297, "global_step": 191317, "epoch": 4555} {"train_loss": -7.33881950378418, "global_step": 191318, "epoch": 4555} {"train_loss": -7.192542552947998, "global_step": 191319, "epoch": 4555} {"train_loss": -7.122179985046387, "global_step": 191320, "epoch": 4555} {"train_loss": -7.1682448387146, "global_step": 191321, "epoch": 4555} {"train_loss": -7.131233215332031, "global_step": 191322, "epoch": 4555} {"train_loss": -7.248640537261963, "global_step": 191323, "epoch": 4555} {"train_loss": -7.180553436279297, "global_step": 191324, "epoch": 4555} {"train_loss": -7.139930725097656, "global_step": 191325, "epoch": 4555} {"train_loss": -7.126121520996094, "global_step": 191326, "epoch": 4555} {"train_loss": -7.236860275268555, "global_step": 191327, "epoch": 4555} {"train_loss": -7.235650539398193, "global_step": 191328, "epoch": 4555} {"train_loss": -7.096373081207275, "global_step": 191329, "epoch": 4555} {"train_loss": -7.180574893951416, "global_step": 191330, "epoch": 4555} {"train_loss": -6.928789138793945, "global_step": 191331, "epoch": 4555} {"train_loss": -7.247238636016846, "global_step": 191332, "epoch": 4555} {"train_loss": -7.107813358306885, "global_step": 191333, "epoch": 4555} {"train_loss": -7.202236652374268, "global_step": 191334, "epoch": 4555} {"train_loss": -7.134651184082031, "global_step": 191335, "epoch": 4555} {"train_loss": -7.0520524978637695, "global_step": 191336, "epoch": 4555} {"train_loss": -7.011684894561768, "global_step": 191337, "epoch": 4555} {"train_loss": -7.154636383056641, "global_step": 191338, "epoch": 4555} {"train_loss": -7.085625171661377, "global_step": 191339, "epoch": 4555} {"train_loss": -7.148977279663086, "global_step": 191340, "epoch": 4555} {"train_loss": -7.159177780151367, "global_step": 191341, "epoch": 4555} {"train_loss": -7.172271251678467, "global_step": 191342, "epoch": 4555} {"train_loss": -7.091292381286621, "global_step": 191343, "epoch": 4555} {"train_loss": -7.17662239074707, "global_step": 191344, "epoch": 4555} {"train_loss": -7.216108322143555, "global_step": 191345, "epoch": 4555} {"train_loss": -7.097067832946777, "global_step": 191346, "epoch": 4555} {"train_loss": -7.240178108215332, "global_step": 191347, "epoch": 4555} {"train_loss": -7.24794864654541, "global_step": 191348, "epoch": 4555} {"train_loss": -7.0683698654174805, "global_step": 191349, "epoch": 4555} {"train_loss": -7.187232971191406, "global_step": 191350, "epoch": 4555} {"train_loss": -7.16794566881089, "global_step": 191351, "epoch": 4555, "val_loss": 68825.5859375} {"train_loss": -7.130003452301025, "global_step": 191352, "epoch": 4556} {"train_loss": -7.237575054168701, "global_step": 191353, "epoch": 4556} {"train_loss": -7.099801063537598, "global_step": 191354, "epoch": 4556} {"train_loss": -7.147737979888916, "global_step": 191355, "epoch": 4556} {"train_loss": -7.1737589836120605, "global_step": 191356, "epoch": 4556} {"train_loss": -6.978741645812988, "global_step": 191357, "epoch": 4556} {"train_loss": -7.21718692779541, "global_step": 191358, "epoch": 4556} {"train_loss": -7.176448822021484, "global_step": 191359, "epoch": 4556} {"train_loss": -7.030399322509766, "global_step": 191360, "epoch": 4556} {"train_loss": -7.1924309730529785, "global_step": 191361, "epoch": 4556} {"train_loss": -7.034654140472412, "global_step": 191362, "epoch": 4556} {"train_loss": -7.032402038574219, "global_step": 191363, "epoch": 4556} {"train_loss": -7.075837135314941, "global_step": 191364, "epoch": 4556} {"train_loss": -6.999969959259033, "global_step": 191365, "epoch": 4556} {"train_loss": -7.099259376525879, "global_step": 191366, "epoch": 4556} {"train_loss": -7.0599517822265625, "global_step": 191367, "epoch": 4556} {"train_loss": -6.929486274719238, "global_step": 191368, "epoch": 4556} {"train_loss": -7.1193389892578125, "global_step": 191369, "epoch": 4556} {"train_loss": -7.133279800415039, "global_step": 191370, "epoch": 4556} {"train_loss": -6.957810401916504, "global_step": 191371, "epoch": 4556} {"train_loss": -7.0859880447387695, "global_step": 191372, "epoch": 4556} {"train_loss": -7.032988548278809, "global_step": 191373, "epoch": 4556} {"train_loss": -6.929625511169434, "global_step": 191374, "epoch": 4556} {"train_loss": -7.0694732666015625, "global_step": 191375, "epoch": 4556} {"train_loss": -7.071887016296387, "global_step": 191376, "epoch": 4556} {"train_loss": -7.036352157592773, "global_step": 191377, "epoch": 4556} {"train_loss": -7.207345008850098, "global_step": 191378, "epoch": 4556} {"train_loss": -7.127686977386475, "global_step": 191379, "epoch": 4556} {"train_loss": -7.016683578491211, "global_step": 191380, "epoch": 4556} {"train_loss": -7.103363037109375, "global_step": 191381, "epoch": 4556} {"train_loss": -7.057435989379883, "global_step": 191382, "epoch": 4556} {"train_loss": -7.104301929473877, "global_step": 191383, "epoch": 4556} {"train_loss": -7.151698589324951, "global_step": 191384, "epoch": 4556} {"train_loss": -7.027150630950928, "global_step": 191385, "epoch": 4556} {"train_loss": -7.149532318115234, "global_step": 191386, "epoch": 4556} {"train_loss": -7.040719032287598, "global_step": 191387, "epoch": 4556} {"train_loss": -7.105417251586914, "global_step": 191388, "epoch": 4556} {"train_loss": -7.103131294250488, "global_step": 191389, "epoch": 4556} {"train_loss": -7.040523052215576, "global_step": 191390, "epoch": 4556} {"train_loss": -7.118051052093506, "global_step": 191391, "epoch": 4556} {"train_loss": -7.081363677978516, "global_step": 191392, "epoch": 4556} {"train_loss": -7.087109384082613, "global_step": 191393, "epoch": 4556, "val_loss": 68724.4140625} {"train_loss": -7.15250301361084, "global_step": 191394, "epoch": 4557} {"train_loss": -7.157095909118652, "global_step": 191395, "epoch": 4557} {"train_loss": -7.138333797454834, "global_step": 191396, "epoch": 4557} {"train_loss": -7.1944169998168945, "global_step": 191397, "epoch": 4557} {"train_loss": -7.154507637023926, "global_step": 191398, "epoch": 4557} {"train_loss": -7.15564489364624, "global_step": 191399, "epoch": 4557} {"train_loss": -7.087779998779297, "global_step": 191400, "epoch": 4557} {"train_loss": -7.154107093811035, "global_step": 191401, "epoch": 4557} {"train_loss": -7.168146133422852, "global_step": 191402, "epoch": 4557} {"train_loss": -7.121665954589844, "global_step": 191403, "epoch": 4557} {"train_loss": -7.111437797546387, "global_step": 191404, "epoch": 4557} {"train_loss": -7.012600898742676, "global_step": 191405, "epoch": 4557} {"train_loss": -7.23672342300415, "global_step": 191406, "epoch": 4557} {"train_loss": -7.06954288482666, "global_step": 191407, "epoch": 4557} {"train_loss": -7.0887651443481445, "global_step": 191408, "epoch": 4557} {"train_loss": -7.134734153747559, "global_step": 191409, "epoch": 4557} {"train_loss": -7.07973575592041, "global_step": 191410, "epoch": 4557} {"train_loss": -7.1362481117248535, "global_step": 191411, "epoch": 4557} {"train_loss": -7.118232250213623, "global_step": 191412, "epoch": 4557} {"train_loss": -7.037985801696777, "global_step": 191413, "epoch": 4557} {"train_loss": -7.069645404815674, "global_step": 191414, "epoch": 4557} {"train_loss": -7.040046215057373, "global_step": 191415, "epoch": 4557} {"train_loss": -7.23625373840332, "global_step": 191416, "epoch": 4557} {"train_loss": -7.030111312866211, "global_step": 191417, "epoch": 4557} {"train_loss": -7.216387748718262, "global_step": 191418, "epoch": 4557} {"train_loss": -7.215226173400879, "global_step": 191419, "epoch": 4557} {"train_loss": -7.201281547546387, "global_step": 191420, "epoch": 4557} {"train_loss": -7.256947040557861, "global_step": 191421, "epoch": 4557} {"train_loss": -7.204636573791504, "global_step": 191422, "epoch": 4557} {"train_loss": -7.099127769470215, "global_step": 191423, "epoch": 4557} {"train_loss": -7.1781511306762695, "global_step": 191424, "epoch": 4557} {"train_loss": -7.155955791473389, "global_step": 191425, "epoch": 4557} {"train_loss": -7.192605972290039, "global_step": 191426, "epoch": 4557} {"train_loss": -7.097318172454834, "global_step": 191427, "epoch": 4557} {"train_loss": -7.1566314697265625, "global_step": 191428, "epoch": 4557} {"train_loss": -7.1628828048706055, "global_step": 191429, "epoch": 4557} {"train_loss": -7.033734321594238, "global_step": 191430, "epoch": 4557} {"train_loss": -7.107842922210693, "global_step": 191431, "epoch": 4557} {"train_loss": -7.134093284606934, "global_step": 191432, "epoch": 4557} {"train_loss": -7.095117568969727, "global_step": 191433, "epoch": 4557} {"train_loss": -7.236713409423828, "global_step": 191434, "epoch": 4557} {"train_loss": -7.1368702593303865, "global_step": 191435, "epoch": 4557, "val_loss": 69091.0546875} {"train_loss": -7.13047456741333, "global_step": 191436, "epoch": 4558} {"train_loss": -7.1751813888549805, "global_step": 191437, "epoch": 4558} {"train_loss": -7.149919509887695, "global_step": 191438, "epoch": 4558} {"train_loss": -7.0520195960998535, "global_step": 191439, "epoch": 4558} {"train_loss": -7.097065448760986, "global_step": 191440, "epoch": 4558} {"train_loss": -7.133333206176758, "global_step": 191441, "epoch": 4558} {"train_loss": -6.987179756164551, "global_step": 191442, "epoch": 4558} {"train_loss": -7.039799690246582, "global_step": 191443, "epoch": 4558} {"train_loss": -7.089569091796875, "global_step": 191444, "epoch": 4558} {"train_loss": -7.166311264038086, "global_step": 191445, "epoch": 4558} {"train_loss": -7.194293975830078, "global_step": 191446, "epoch": 4558} {"train_loss": -7.107851505279541, "global_step": 191447, "epoch": 4558} {"train_loss": -7.160837173461914, "global_step": 191448, "epoch": 4558} {"train_loss": -7.12867546081543, "global_step": 191449, "epoch": 4558} {"train_loss": -7.088540077209473, "global_step": 191450, "epoch": 4558} {"train_loss": -7.247458457946777, "global_step": 191451, "epoch": 4558} {"train_loss": -6.912798881530762, "global_step": 191452, "epoch": 4558} {"train_loss": -7.019351005554199, "global_step": 191453, "epoch": 4558} {"train_loss": -7.1666259765625, "global_step": 191454, "epoch": 4558} {"train_loss": -7.014113426208496, "global_step": 191455, "epoch": 4558} {"train_loss": -7.097094535827637, "global_step": 191456, "epoch": 4558} {"train_loss": -7.161049842834473, "global_step": 191457, "epoch": 4558} {"train_loss": -7.19600772857666, "global_step": 191458, "epoch": 4558} {"train_loss": -7.123710632324219, "global_step": 191459, "epoch": 4558} {"train_loss": -7.206183433532715, "global_step": 191460, "epoch": 4558} {"train_loss": -7.254222869873047, "global_step": 191461, "epoch": 4558} {"train_loss": -7.114027976989746, "global_step": 191462, "epoch": 4558} {"train_loss": -7.257054328918457, "global_step": 191463, "epoch": 4558} {"train_loss": -7.198554992675781, "global_step": 191464, "epoch": 4558} {"train_loss": -6.9845380783081055, "global_step": 191465, "epoch": 4558} {"train_loss": -7.134057998657227, "global_step": 191466, "epoch": 4558} {"train_loss": -7.129359245300293, "global_step": 191467, "epoch": 4558} {"train_loss": -7.00738525390625, "global_step": 191468, "epoch": 4558} {"train_loss": -7.06107759475708, "global_step": 191469, "epoch": 4558} {"train_loss": -7.093897819519043, "global_step": 191470, "epoch": 4558} {"train_loss": -7.021880149841309, "global_step": 191471, "epoch": 4558} {"train_loss": -7.134167671203613, "global_step": 191472, "epoch": 4558} {"train_loss": -6.903137683868408, "global_step": 191473, "epoch": 4558} {"train_loss": -7.155154705047607, "global_step": 191474, "epoch": 4558} {"train_loss": -7.123088836669922, "global_step": 191475, "epoch": 4558} {"train_loss": -7.119283199310303, "global_step": 191476, "epoch": 4558} {"train_loss": -7.111017953781855, "global_step": 191477, "epoch": 4558, "val_loss": 68926.3828125} {"train_loss": -7.133142948150635, "global_step": 191478, "epoch": 4559} {"train_loss": -7.070291519165039, "global_step": 191479, "epoch": 4559} {"train_loss": -7.143496990203857, "global_step": 191480, "epoch": 4559} {"train_loss": -7.098240852355957, "global_step": 191481, "epoch": 4559} {"train_loss": -7.1775970458984375, "global_step": 191482, "epoch": 4559} {"train_loss": -7.026527404785156, "global_step": 191483, "epoch": 4559} {"train_loss": -7.134744644165039, "global_step": 191484, "epoch": 4559} {"train_loss": -7.238931655883789, "global_step": 191485, "epoch": 4559} {"train_loss": -7.05195426940918, "global_step": 191486, "epoch": 4559} {"train_loss": -7.140864849090576, "global_step": 191487, "epoch": 4559} {"train_loss": -7.091585159301758, "global_step": 191488, "epoch": 4559} {"train_loss": -7.126110553741455, "global_step": 191489, "epoch": 4559} {"train_loss": -7.17897367477417, "global_step": 191490, "epoch": 4559} {"train_loss": -7.021647930145264, "global_step": 191491, "epoch": 4559} {"train_loss": -7.1921844482421875, "global_step": 191492, "epoch": 4559} {"train_loss": -7.167088985443115, "global_step": 191493, "epoch": 4559} {"train_loss": -7.177600860595703, "global_step": 191494, "epoch": 4559} {"train_loss": -7.200926780700684, "global_step": 191495, "epoch": 4559} {"train_loss": -7.090323448181152, "global_step": 191496, "epoch": 4559} {"train_loss": -7.14971399307251, "global_step": 191497, "epoch": 4559} {"train_loss": -7.177135467529297, "global_step": 191498, "epoch": 4559} {"train_loss": -7.181473731994629, "global_step": 191499, "epoch": 4559} {"train_loss": -7.179024696350098, "global_step": 191500, "epoch": 4559} {"train_loss": -7.2041730880737305, "global_step": 191501, "epoch": 4559} {"train_loss": -7.246338844299316, "global_step": 191502, "epoch": 4559} {"train_loss": -7.100556373596191, "global_step": 191503, "epoch": 4559} {"train_loss": -7.230330944061279, "global_step": 191504, "epoch": 4559} {"train_loss": -7.097751140594482, "global_step": 191505, "epoch": 4559} {"train_loss": -7.104236602783203, "global_step": 191506, "epoch": 4559} {"train_loss": -7.054494857788086, "global_step": 191507, "epoch": 4559} {"train_loss": -7.072243690490723, "global_step": 191508, "epoch": 4559} {"train_loss": -7.339045524597168, "global_step": 191509, "epoch": 4559} {"train_loss": -7.242700099945068, "global_step": 191510, "epoch": 4559} {"train_loss": -6.971942901611328, "global_step": 191511, "epoch": 4559} {"train_loss": -7.010052680969238, "global_step": 191512, "epoch": 4559} {"train_loss": -7.042444705963135, "global_step": 191513, "epoch": 4559} {"train_loss": -7.008187770843506, "global_step": 191514, "epoch": 4559} {"train_loss": -7.1181793212890625, "global_step": 191515, "epoch": 4559} {"train_loss": -6.956415176391602, "global_step": 191516, "epoch": 4559} {"train_loss": -7.053195953369141, "global_step": 191517, "epoch": 4559} {"train_loss": -7.065630912780762, "global_step": 191518, "epoch": 4559} {"train_loss": -7.122127294540405, "global_step": 191519, "epoch": 4559, "val_loss": 68901.0390625} {"train_loss": -7.182389259338379, "global_step": 191520, "epoch": 4560} {"train_loss": -6.996365547180176, "global_step": 191521, "epoch": 4560} {"train_loss": -7.050501823425293, "global_step": 191522, "epoch": 4560} {"train_loss": -7.112316131591797, "global_step": 191523, "epoch": 4560} {"train_loss": -7.100756645202637, "global_step": 191524, "epoch": 4560} {"train_loss": -7.023797988891602, "global_step": 191525, "epoch": 4560} {"train_loss": -7.062365531921387, "global_step": 191526, "epoch": 4560} {"train_loss": -7.089371204376221, "global_step": 191527, "epoch": 4560} {"train_loss": -7.117432594299316, "global_step": 191528, "epoch": 4560} {"train_loss": -7.042754650115967, "global_step": 191529, "epoch": 4560} {"train_loss": -7.143683910369873, "global_step": 191530, "epoch": 4560} {"train_loss": -6.992771625518799, "global_step": 191531, "epoch": 4560} {"train_loss": -7.251577854156494, "global_step": 191532, "epoch": 4560} {"train_loss": -7.150720596313477, "global_step": 191533, "epoch": 4560} {"train_loss": -7.14012336730957, "global_step": 191534, "epoch": 4560} {"train_loss": -7.1538920402526855, "global_step": 191535, "epoch": 4560} {"train_loss": -7.091525077819824, "global_step": 191536, "epoch": 4560} {"train_loss": -7.157718658447266, "global_step": 191537, "epoch": 4560} {"train_loss": -7.176154613494873, "global_step": 191538, "epoch": 4560} {"train_loss": -7.085010528564453, "global_step": 191539, "epoch": 4560} {"train_loss": -7.0429277420043945, "global_step": 191540, "epoch": 4560} {"train_loss": -7.179662704467773, "global_step": 191541, "epoch": 4560} {"train_loss": -7.063846588134766, "global_step": 191542, "epoch": 4560} {"train_loss": -7.203537464141846, "global_step": 191543, "epoch": 4560} {"train_loss": -7.265964031219482, "global_step": 191544, "epoch": 4560} {"train_loss": -7.1267499923706055, "global_step": 191545, "epoch": 4560} {"train_loss": -7.182651519775391, "global_step": 191546, "epoch": 4560} {"train_loss": -7.105648040771484, "global_step": 191547, "epoch": 4560} {"train_loss": -7.190778732299805, "global_step": 191548, "epoch": 4560} {"train_loss": -7.149109363555908, "global_step": 191549, "epoch": 4560} {"train_loss": -7.147059917449951, "global_step": 191550, "epoch": 4560} {"train_loss": -7.312887668609619, "global_step": 191551, "epoch": 4560} {"train_loss": -7.261307716369629, "global_step": 191552, "epoch": 4560} {"train_loss": -7.290687561035156, "global_step": 191553, "epoch": 4560} {"train_loss": -7.26171875, "global_step": 191554, "epoch": 4560} {"train_loss": -7.108177185058594, "global_step": 191555, "epoch": 4560} {"train_loss": -7.164140701293945, "global_step": 191556, "epoch": 4560} {"train_loss": -7.13475227355957, "global_step": 191557, "epoch": 4560} {"train_loss": -6.993413925170898, "global_step": 191558, "epoch": 4560} {"train_loss": -7.120308876037598, "global_step": 191559, "epoch": 4560} {"train_loss": -7.190821647644043, "global_step": 191560, "epoch": 4560} {"train_loss": -7.133933124088106, "global_step": 191561, "epoch": 4560, "val_loss": 69027.59375} {"train_loss": -7.178019046783447, "global_step": 191562, "epoch": 4561} {"train_loss": -7.112625598907471, "global_step": 191563, "epoch": 4561} {"train_loss": -7.11682653427124, "global_step": 191564, "epoch": 4561} {"train_loss": -7.0618743896484375, "global_step": 191565, "epoch": 4561} {"train_loss": -7.006325721740723, "global_step": 191566, "epoch": 4561} {"train_loss": -7.0301194190979, "global_step": 191567, "epoch": 4561} {"train_loss": -7.25957727432251, "global_step": 191568, "epoch": 4561} {"train_loss": -7.182776927947998, "global_step": 191569, "epoch": 4561} {"train_loss": -7.156897068023682, "global_step": 191570, "epoch": 4561} {"train_loss": -7.183347225189209, "global_step": 191571, "epoch": 4561} {"train_loss": -7.062114238739014, "global_step": 191572, "epoch": 4561} {"train_loss": -7.117926597595215, "global_step": 191573, "epoch": 4561} {"train_loss": -7.161636829376221, "global_step": 191574, "epoch": 4561} {"train_loss": -7.05521297454834, "global_step": 191575, "epoch": 4561} {"train_loss": -7.149349212646484, "global_step": 191576, "epoch": 4561} {"train_loss": -7.154632091522217, "global_step": 191577, "epoch": 4561} {"train_loss": -7.084592819213867, "global_step": 191578, "epoch": 4561} {"train_loss": -7.205256462097168, "global_step": 191579, "epoch": 4561} {"train_loss": -7.164038181304932, "global_step": 191580, "epoch": 4561} {"train_loss": -7.177845001220703, "global_step": 191581, "epoch": 4561} {"train_loss": -7.16402006149292, "global_step": 191582, "epoch": 4561} {"train_loss": -7.0990891456604, "global_step": 191583, "epoch": 4561} {"train_loss": -7.0950927734375, "global_step": 191584, "epoch": 4561} {"train_loss": -7.164155006408691, "global_step": 191585, "epoch": 4561} {"train_loss": -7.125217437744141, "global_step": 191586, "epoch": 4561} {"train_loss": -7.186187744140625, "global_step": 191587, "epoch": 4561} {"train_loss": -7.2271318435668945, "global_step": 191588, "epoch": 4561} {"train_loss": -7.172873497009277, "global_step": 191589, "epoch": 4561} {"train_loss": -7.197813987731934, "global_step": 191590, "epoch": 4561} {"train_loss": -7.189288139343262, "global_step": 191591, "epoch": 4561} {"train_loss": -7.1265153884887695, "global_step": 191592, "epoch": 4561} {"train_loss": -7.174173831939697, "global_step": 191593, "epoch": 4561} {"train_loss": -7.216161727905273, "global_step": 191594, "epoch": 4561} {"train_loss": -7.1278276443481445, "global_step": 191595, "epoch": 4561} {"train_loss": -7.282303810119629, "global_step": 191596, "epoch": 4561} {"train_loss": -7.17060661315918, "global_step": 191597, "epoch": 4561} {"train_loss": -7.298826217651367, "global_step": 191598, "epoch": 4561} {"train_loss": -7.181049346923828, "global_step": 191599, "epoch": 4561} {"train_loss": -7.239886283874512, "global_step": 191600, "epoch": 4561} {"train_loss": -7.172684669494629, "global_step": 191601, "epoch": 4561} {"train_loss": -7.2400312423706055, "global_step": 191602, "epoch": 4561} {"train_loss": -7.159288304192679, "global_step": 191603, "epoch": 4561, "val_loss": 68850.5078125} {"train_loss": -7.134895324707031, "global_step": 191604, "epoch": 4562} {"train_loss": -7.244379997253418, "global_step": 191605, "epoch": 4562} {"train_loss": -7.292514801025391, "global_step": 191606, "epoch": 4562} {"train_loss": -7.189816951751709, "global_step": 191607, "epoch": 4562} {"train_loss": -7.093405723571777, "global_step": 191608, "epoch": 4562} {"train_loss": -7.227858543395996, "global_step": 191609, "epoch": 4562} {"train_loss": -7.081056118011475, "global_step": 191610, "epoch": 4562} {"train_loss": -7.176962852478027, "global_step": 191611, "epoch": 4562} {"train_loss": -7.103537559509277, "global_step": 191612, "epoch": 4562} {"train_loss": -7.044438362121582, "global_step": 191613, "epoch": 4562} {"train_loss": -7.1851301193237305, "global_step": 191614, "epoch": 4562} {"train_loss": -7.123554229736328, "global_step": 191615, "epoch": 4562} {"train_loss": -6.930757522583008, "global_step": 191616, "epoch": 4562} {"train_loss": -7.226324081420898, "global_step": 191617, "epoch": 4562} {"train_loss": -7.138115882873535, "global_step": 191618, "epoch": 4562} {"train_loss": -7.197671413421631, "global_step": 191619, "epoch": 4562} {"train_loss": -7.103285312652588, "global_step": 191620, "epoch": 4562} {"train_loss": -7.049110412597656, "global_step": 191621, "epoch": 4562} {"train_loss": -7.204494476318359, "global_step": 191622, "epoch": 4562} {"train_loss": -7.102639198303223, "global_step": 191623, "epoch": 4562} {"train_loss": -7.237699508666992, "global_step": 191624, "epoch": 4562} {"train_loss": -7.05308198928833, "global_step": 191625, "epoch": 4562} {"train_loss": -7.000714302062988, "global_step": 191626, "epoch": 4562} {"train_loss": -7.208329200744629, "global_step": 191627, "epoch": 4562} {"train_loss": -7.211494445800781, "global_step": 191628, "epoch": 4562} {"train_loss": -7.124059677124023, "global_step": 191629, "epoch": 4562} {"train_loss": -7.050379753112793, "global_step": 191630, "epoch": 4562} {"train_loss": -7.133139610290527, "global_step": 191631, "epoch": 4562} {"train_loss": -7.149305820465088, "global_step": 191632, "epoch": 4562} {"train_loss": -7.12907600402832, "global_step": 191633, "epoch": 4562} {"train_loss": -7.227706432342529, "global_step": 191634, "epoch": 4562} {"train_loss": -7.238214492797852, "global_step": 191635, "epoch": 4562} {"train_loss": -7.163896560668945, "global_step": 191636, "epoch": 4562} {"train_loss": -7.145312786102295, "global_step": 191637, "epoch": 4562} {"train_loss": -7.115427017211914, "global_step": 191638, "epoch": 4562} {"train_loss": -7.118873596191406, "global_step": 191639, "epoch": 4562} {"train_loss": -7.039114952087402, "global_step": 191640, "epoch": 4562} {"train_loss": -7.186335563659668, "global_step": 191641, "epoch": 4562} {"train_loss": -7.157078266143799, "global_step": 191642, "epoch": 4562} {"train_loss": -7.0342488288879395, "global_step": 191643, "epoch": 4562} {"train_loss": -7.150174617767334, "global_step": 191644, "epoch": 4562} {"train_loss": -7.141219434284029, "global_step": 191645, "epoch": 4562, "val_loss": 68965.28125} {"train_loss": -7.094538688659668, "global_step": 191646, "epoch": 4563} {"train_loss": -7.201394081115723, "global_step": 191647, "epoch": 4563} {"train_loss": -7.184176445007324, "global_step": 191648, "epoch": 4563} {"train_loss": -7.123797416687012, "global_step": 191649, "epoch": 4563} {"train_loss": -7.016200065612793, "global_step": 191650, "epoch": 4563} {"train_loss": -7.1320905685424805, "global_step": 191651, "epoch": 4563} {"train_loss": -7.107712745666504, "global_step": 191652, "epoch": 4563} {"train_loss": -7.08575439453125, "global_step": 191653, "epoch": 4563} {"train_loss": -7.003252983093262, "global_step": 191654, "epoch": 4563} {"train_loss": -7.017151832580566, "global_step": 191655, "epoch": 4563} {"train_loss": -7.096734046936035, "global_step": 191656, "epoch": 4563} {"train_loss": -7.173773288726807, "global_step": 191657, "epoch": 4563} {"train_loss": -7.012935161590576, "global_step": 191658, "epoch": 4563} {"train_loss": -7.069750785827637, "global_step": 191659, "epoch": 4563} {"train_loss": -7.158412933349609, "global_step": 191660, "epoch": 4563} {"train_loss": -7.10887336730957, "global_step": 191661, "epoch": 4563} {"train_loss": -7.286681175231934, "global_step": 191662, "epoch": 4563} {"train_loss": -7.232048511505127, "global_step": 191663, "epoch": 4563} {"train_loss": -7.010748863220215, "global_step": 191664, "epoch": 4563} {"train_loss": -7.099815368652344, "global_step": 191665, "epoch": 4563} {"train_loss": -7.164678573608398, "global_step": 191666, "epoch": 4563} {"train_loss": -7.1197614669799805, "global_step": 191667, "epoch": 4563} {"train_loss": -7.190240859985352, "global_step": 191668, "epoch": 4563} {"train_loss": -7.080432891845703, "global_step": 191669, "epoch": 4563} {"train_loss": -7.047552585601807, "global_step": 191670, "epoch": 4563} {"train_loss": -7.2449259757995605, "global_step": 191671, "epoch": 4563} {"train_loss": -7.266268253326416, "global_step": 191672, "epoch": 4563} {"train_loss": -7.191518783569336, "global_step": 191673, "epoch": 4563} {"train_loss": -7.114099502563477, "global_step": 191674, "epoch": 4563} {"train_loss": -7.120373725891113, "global_step": 191675, "epoch": 4563} {"train_loss": -7.151059627532959, "global_step": 191676, "epoch": 4563} {"train_loss": -7.164222240447998, "global_step": 191677, "epoch": 4563} {"train_loss": -7.157508850097656, "global_step": 191678, "epoch": 4563} {"train_loss": -7.146092891693115, "global_step": 191679, "epoch": 4563} {"train_loss": -7.218075752258301, "global_step": 191680, "epoch": 4563} {"train_loss": -7.085583686828613, "global_step": 191681, "epoch": 4563} {"train_loss": -7.152678489685059, "global_step": 191682, "epoch": 4563} {"train_loss": -7.233524322509766, "global_step": 191683, "epoch": 4563} {"train_loss": -7.282743453979492, "global_step": 191684, "epoch": 4563} {"train_loss": -7.041589736938477, "global_step": 191685, "epoch": 4563} {"train_loss": -7.149849891662598, "global_step": 191686, "epoch": 4563} {"train_loss": -7.134320781344459, "global_step": 191687, "epoch": 4563, "val_loss": 68923.9140625} {"train_loss": -7.180187225341797, "global_step": 191688, "epoch": 4564} {"train_loss": -7.108292579650879, "global_step": 191689, "epoch": 4564} {"train_loss": -7.293500900268555, "global_step": 191690, "epoch": 4564} {"train_loss": -7.208906173706055, "global_step": 191691, "epoch": 4564} {"train_loss": -7.255002975463867, "global_step": 191692, "epoch": 4564} {"train_loss": -7.16251802444458, "global_step": 191693, "epoch": 4564} {"train_loss": -7.144523620605469, "global_step": 191694, "epoch": 4564} {"train_loss": -7.206229209899902, "global_step": 191695, "epoch": 4564} {"train_loss": -7.284302234649658, "global_step": 191696, "epoch": 4564} {"train_loss": -7.319255828857422, "global_step": 191697, "epoch": 4564} {"train_loss": -7.227899551391602, "global_step": 191698, "epoch": 4564} {"train_loss": -7.272984981536865, "global_step": 191699, "epoch": 4564} {"train_loss": -7.182459354400635, "global_step": 191700, "epoch": 4564} {"train_loss": -7.204670429229736, "global_step": 191701, "epoch": 4564} {"train_loss": -7.250640392303467, "global_step": 191702, "epoch": 4564} {"train_loss": -7.194612503051758, "global_step": 191703, "epoch": 4564} {"train_loss": -7.1068925857543945, "global_step": 191704, "epoch": 4564} {"train_loss": -7.233017444610596, "global_step": 191705, "epoch": 4564} {"train_loss": -7.220721244812012, "global_step": 191706, "epoch": 4564} {"train_loss": -7.197576522827148, "global_step": 191707, "epoch": 4564} {"train_loss": -7.190325736999512, "global_step": 191708, "epoch": 4564} {"train_loss": -7.105459690093994, "global_step": 191709, "epoch": 4564} {"train_loss": -7.368869304656982, "global_step": 191710, "epoch": 4564} {"train_loss": -7.072897911071777, "global_step": 191711, "epoch": 4564} {"train_loss": -7.15592622756958, "global_step": 191712, "epoch": 4564} {"train_loss": -7.218902587890625, "global_step": 191713, "epoch": 4564} {"train_loss": -7.189922332763672, "global_step": 191714, "epoch": 4564} {"train_loss": -7.212363243103027, "global_step": 191715, "epoch": 4564} {"train_loss": -7.160882949829102, "global_step": 191716, "epoch": 4564} {"train_loss": -7.21165657043457, "global_step": 191717, "epoch": 4564} {"train_loss": -7.205533504486084, "global_step": 191718, "epoch": 4564} {"train_loss": -7.163388252258301, "global_step": 191719, "epoch": 4564} {"train_loss": -7.15096378326416, "global_step": 191720, "epoch": 4564} {"train_loss": -7.173951625823975, "global_step": 191721, "epoch": 4564} {"train_loss": -7.057732582092285, "global_step": 191722, "epoch": 4564} {"train_loss": -7.17103910446167, "global_step": 191723, "epoch": 4564} {"train_loss": -7.138761520385742, "global_step": 191724, "epoch": 4564} {"train_loss": -7.089136123657227, "global_step": 191725, "epoch": 4564} {"train_loss": -7.227398872375488, "global_step": 191726, "epoch": 4564} {"train_loss": -7.200160503387451, "global_step": 191727, "epoch": 4564} {"train_loss": -7.162281036376953, "global_step": 191728, "epoch": 4564} {"train_loss": -7.193408966064453, "global_step": 191729, "epoch": 4564, "val_loss": 68798.28125} {"train_loss": -7.122247695922852, "global_step": 191730, "epoch": 4565} {"train_loss": -7.03679895401001, "global_step": 191731, "epoch": 4565} {"train_loss": -7.152063846588135, "global_step": 191732, "epoch": 4565} {"train_loss": -7.239753723144531, "global_step": 191733, "epoch": 4565} {"train_loss": -7.225933074951172, "global_step": 191734, "epoch": 4565} {"train_loss": -7.23628044128418, "global_step": 191735, "epoch": 4565} {"train_loss": -7.15505838394165, "global_step": 191736, "epoch": 4565} {"train_loss": -7.17463493347168, "global_step": 191737, "epoch": 4565} {"train_loss": -7.135420799255371, "global_step": 191738, "epoch": 4565} {"train_loss": -6.987009048461914, "global_step": 191739, "epoch": 4565} {"train_loss": -7.090121746063232, "global_step": 191740, "epoch": 4565} {"train_loss": -7.112890243530273, "global_step": 191741, "epoch": 4565} {"train_loss": -7.04200553894043, "global_step": 191742, "epoch": 4565} {"train_loss": -7.078708648681641, "global_step": 191743, "epoch": 4565} {"train_loss": -7.173664093017578, "global_step": 191744, "epoch": 4565} {"train_loss": -7.080079078674316, "global_step": 191745, "epoch": 4565} {"train_loss": -7.12682580947876, "global_step": 191746, "epoch": 4565} {"train_loss": -6.93269157409668, "global_step": 191747, "epoch": 4565} {"train_loss": -7.147344589233398, "global_step": 191748, "epoch": 4565} {"train_loss": -7.136049270629883, "global_step": 191749, "epoch": 4565} {"train_loss": -7.194242000579834, "global_step": 191750, "epoch": 4565} {"train_loss": -6.9535956382751465, "global_step": 191751, "epoch": 4565} {"train_loss": -7.033634185791016, "global_step": 191752, "epoch": 4565} {"train_loss": -7.029347896575928, "global_step": 191753, "epoch": 4565} {"train_loss": -7.04709005355835, "global_step": 191754, "epoch": 4565} {"train_loss": -6.9812421798706055, "global_step": 191755, "epoch": 4565} {"train_loss": -7.23863410949707, "global_step": 191756, "epoch": 4565} {"train_loss": -7.096540451049805, "global_step": 191757, "epoch": 4565} {"train_loss": -7.03449010848999, "global_step": 191758, "epoch": 4565} {"train_loss": -7.194571495056152, "global_step": 191759, "epoch": 4565} {"train_loss": -7.050341606140137, "global_step": 191760, "epoch": 4565} {"train_loss": -7.020096778869629, "global_step": 191761, "epoch": 4565} {"train_loss": -6.978456497192383, "global_step": 191762, "epoch": 4565} {"train_loss": -7.024106502532959, "global_step": 191763, "epoch": 4565} {"train_loss": -7.078300476074219, "global_step": 191764, "epoch": 4565} {"train_loss": -7.075582504272461, "global_step": 191765, "epoch": 4565} {"train_loss": -7.051045894622803, "global_step": 191766, "epoch": 4565} {"train_loss": -7.060015678405762, "global_step": 191767, "epoch": 4565} {"train_loss": -7.095998764038086, "global_step": 191768, "epoch": 4565} {"train_loss": -7.214179992675781, "global_step": 191769, "epoch": 4565} {"train_loss": -7.1158342361450195, "global_step": 191770, "epoch": 4565} {"train_loss": -7.0955676805405385, "global_step": 191771, "epoch": 4565, "val_loss": 68974.140625} {"train_loss": -7.006442070007324, "global_step": 191772, "epoch": 4566} {"train_loss": -6.9595489501953125, "global_step": 191773, "epoch": 4566} {"train_loss": -7.166389465332031, "global_step": 191774, "epoch": 4566} {"train_loss": -7.019327640533447, "global_step": 191775, "epoch": 4566} {"train_loss": -7.19420862197876, "global_step": 191776, "epoch": 4566} {"train_loss": -7.004095077514648, "global_step": 191777, "epoch": 4566} {"train_loss": -7.052184104919434, "global_step": 191778, "epoch": 4566} {"train_loss": -7.078790187835693, "global_step": 191779, "epoch": 4566} {"train_loss": -6.903036594390869, "global_step": 191780, "epoch": 4566} {"train_loss": -7.195596694946289, "global_step": 191781, "epoch": 4566} {"train_loss": -7.079075813293457, "global_step": 191782, "epoch": 4566} {"train_loss": -7.193148612976074, "global_step": 191783, "epoch": 4566} {"train_loss": -7.020621299743652, "global_step": 191784, "epoch": 4566} {"train_loss": -7.098840713500977, "global_step": 191785, "epoch": 4566} {"train_loss": -7.126051425933838, "global_step": 191786, "epoch": 4566} {"train_loss": -7.075285911560059, "global_step": 191787, "epoch": 4566} {"train_loss": -7.119660377502441, "global_step": 191788, "epoch": 4566} {"train_loss": -7.1599602699279785, "global_step": 191789, "epoch": 4566} {"train_loss": -7.254951477050781, "global_step": 191790, "epoch": 4566} {"train_loss": -7.122395038604736, "global_step": 191791, "epoch": 4566} {"train_loss": -7.175168514251709, "global_step": 191792, "epoch": 4566} {"train_loss": -7.007416725158691, "global_step": 191793, "epoch": 4566} {"train_loss": -7.252188682556152, "global_step": 191794, "epoch": 4566} {"train_loss": -7.013931751251221, "global_step": 191795, "epoch": 4566} {"train_loss": -7.113908767700195, "global_step": 191796, "epoch": 4566} {"train_loss": -7.112009525299072, "global_step": 191797, "epoch": 4566} {"train_loss": -7.075165271759033, "global_step": 191798, "epoch": 4566} {"train_loss": -7.189938068389893, "global_step": 191799, "epoch": 4566} {"train_loss": -7.123263835906982, "global_step": 191800, "epoch": 4566} {"train_loss": -7.071689605712891, "global_step": 191801, "epoch": 4566} {"train_loss": -7.216245651245117, "global_step": 191802, "epoch": 4566} {"train_loss": -7.225415229797363, "global_step": 191803, "epoch": 4566} {"train_loss": -7.089676856994629, "global_step": 191804, "epoch": 4566} {"train_loss": -7.210160255432129, "global_step": 191805, "epoch": 4566} {"train_loss": -7.180607318878174, "global_step": 191806, "epoch": 4566} {"train_loss": -7.132694244384766, "global_step": 191807, "epoch": 4566} {"train_loss": -7.245017051696777, "global_step": 191808, "epoch": 4566} {"train_loss": -7.2604546546936035, "global_step": 191809, "epoch": 4566} {"train_loss": -7.177506446838379, "global_step": 191810, "epoch": 4566} {"train_loss": -7.213385581970215, "global_step": 191811, "epoch": 4566} {"train_loss": -7.244978904724121, "global_step": 191812, "epoch": 4566} {"train_loss": -7.125449805032639, "global_step": 191813, "epoch": 4566, "val_loss": 68895.2578125} {"train_loss": -7.099127769470215, "global_step": 191814, "epoch": 4567} {"train_loss": -7.107407093048096, "global_step": 191815, "epoch": 4567} {"train_loss": -7.185407638549805, "global_step": 191816, "epoch": 4567} {"train_loss": -7.238455772399902, "global_step": 191817, "epoch": 4567} {"train_loss": -7.23765754699707, "global_step": 191818, "epoch": 4567} {"train_loss": -7.2143402099609375, "global_step": 191819, "epoch": 4567} {"train_loss": -7.101613521575928, "global_step": 191820, "epoch": 4567} {"train_loss": -7.154782295227051, "global_step": 191821, "epoch": 4567} {"train_loss": -7.262021541595459, "global_step": 191822, "epoch": 4567} {"train_loss": -7.166948318481445, "global_step": 191823, "epoch": 4567} {"train_loss": -7.182919502258301, "global_step": 191824, "epoch": 4567} {"train_loss": -7.143910884857178, "global_step": 191825, "epoch": 4567} {"train_loss": -7.18386173248291, "global_step": 191826, "epoch": 4567} {"train_loss": -7.137691497802734, "global_step": 191827, "epoch": 4567} {"train_loss": -7.177521705627441, "global_step": 191828, "epoch": 4567} {"train_loss": -7.088698863983154, "global_step": 191829, "epoch": 4567} {"train_loss": -7.172019958496094, "global_step": 191830, "epoch": 4567} {"train_loss": -7.1732330322265625, "global_step": 191831, "epoch": 4567} {"train_loss": -7.219021797180176, "global_step": 191832, "epoch": 4567} {"train_loss": -7.193253040313721, "global_step": 191833, "epoch": 4567} {"train_loss": -7.1387128829956055, "global_step": 191834, "epoch": 4567} {"train_loss": -7.1165852546691895, "global_step": 191835, "epoch": 4567} {"train_loss": -7.193422317504883, "global_step": 191836, "epoch": 4567} {"train_loss": -7.1822710037231445, "global_step": 191837, "epoch": 4567} {"train_loss": -7.092164039611816, "global_step": 191838, "epoch": 4567} {"train_loss": -7.100524425506592, "global_step": 191839, "epoch": 4567} {"train_loss": -7.193112850189209, "global_step": 191840, "epoch": 4567} {"train_loss": -7.059483528137207, "global_step": 191841, "epoch": 4567} {"train_loss": -7.151973247528076, "global_step": 191842, "epoch": 4567} {"train_loss": -7.116629600524902, "global_step": 191843, "epoch": 4567} {"train_loss": -7.022698402404785, "global_step": 191844, "epoch": 4567} {"train_loss": -7.174443244934082, "global_step": 191845, "epoch": 4567} {"train_loss": -7.018252372741699, "global_step": 191846, "epoch": 4567} {"train_loss": -7.2082319259643555, "global_step": 191847, "epoch": 4567} {"train_loss": -7.116814613342285, "global_step": 191848, "epoch": 4567} {"train_loss": -7.075745582580566, "global_step": 191849, "epoch": 4567} {"train_loss": -7.191147804260254, "global_step": 191850, "epoch": 4567} {"train_loss": -7.098142147064209, "global_step": 191851, "epoch": 4567} {"train_loss": -7.125324249267578, "global_step": 191852, "epoch": 4567} {"train_loss": -7.126956939697266, "global_step": 191853, "epoch": 4567} {"train_loss": -7.063075065612793, "global_step": 191854, "epoch": 4567} {"train_loss": -7.147509438650949, "global_step": 191855, "epoch": 4567, "val_loss": 68932.9453125} {"train_loss": -7.115355491638184, "global_step": 191856, "epoch": 4568} {"train_loss": -7.147664546966553, "global_step": 191857, "epoch": 4568} {"train_loss": -7.194588661193848, "global_step": 191858, "epoch": 4568} {"train_loss": -7.19462776184082, "global_step": 191859, "epoch": 4568} {"train_loss": -7.174081802368164, "global_step": 191860, "epoch": 4568} {"train_loss": -7.075620174407959, "global_step": 191861, "epoch": 4568} {"train_loss": -7.270204544067383, "global_step": 191862, "epoch": 4568} {"train_loss": -7.269989967346191, "global_step": 191863, "epoch": 4568} {"train_loss": -7.143828392028809, "global_step": 191864, "epoch": 4568} {"train_loss": -7.164050102233887, "global_step": 191865, "epoch": 4568} {"train_loss": -7.186583518981934, "global_step": 191866, "epoch": 4568} {"train_loss": -7.260259628295898, "global_step": 191867, "epoch": 4568} {"train_loss": -7.157556533813477, "global_step": 191868, "epoch": 4568} {"train_loss": -7.202320098876953, "global_step": 191869, "epoch": 4568} {"train_loss": -7.175341606140137, "global_step": 191870, "epoch": 4568} {"train_loss": -7.1505937576293945, "global_step": 191871, "epoch": 4568} {"train_loss": -7.187827110290527, "global_step": 191872, "epoch": 4568} {"train_loss": -7.1901021003723145, "global_step": 191873, "epoch": 4568} {"train_loss": -7.185816764831543, "global_step": 191874, "epoch": 4568} {"train_loss": -7.147486686706543, "global_step": 191875, "epoch": 4568} {"train_loss": -7.33807373046875, "global_step": 191876, "epoch": 4568} {"train_loss": -7.132744312286377, "global_step": 191877, "epoch": 4568} {"train_loss": -7.266636371612549, "global_step": 191878, "epoch": 4568} {"train_loss": -7.204181671142578, "global_step": 191879, "epoch": 4568} {"train_loss": -7.154470443725586, "global_step": 191880, "epoch": 4568} {"train_loss": -7.285591125488281, "global_step": 191881, "epoch": 4568} {"train_loss": -7.220354080200195, "global_step": 191882, "epoch": 4568} {"train_loss": -7.193521499633789, "global_step": 191883, "epoch": 4568} {"train_loss": -7.003705024719238, "global_step": 191884, "epoch": 4568} {"train_loss": -7.152301788330078, "global_step": 191885, "epoch": 4568} {"train_loss": -7.213790416717529, "global_step": 191886, "epoch": 4568} {"train_loss": -7.0526533126831055, "global_step": 191887, "epoch": 4568} {"train_loss": -7.1046295166015625, "global_step": 191888, "epoch": 4568} {"train_loss": -7.192685127258301, "global_step": 191889, "epoch": 4568} {"train_loss": -7.026948928833008, "global_step": 191890, "epoch": 4568} {"train_loss": -7.285418510437012, "global_step": 191891, "epoch": 4568} {"train_loss": -7.228255748748779, "global_step": 191892, "epoch": 4568} {"train_loss": -7.184051990509033, "global_step": 191893, "epoch": 4568} {"train_loss": -7.121913909912109, "global_step": 191894, "epoch": 4568} {"train_loss": -7.177412033081055, "global_step": 191895, "epoch": 4568} {"train_loss": -7.140043258666992, "global_step": 191896, "epoch": 4568} {"train_loss": -7.179232472465152, "global_step": 191897, "epoch": 4568, "val_loss": 69007.6015625} {"train_loss": -7.2551679611206055, "global_step": 191898, "epoch": 4569} {"train_loss": -7.126895904541016, "global_step": 191899, "epoch": 4569} {"train_loss": -7.248897552490234, "global_step": 191900, "epoch": 4569} {"train_loss": -7.130820274353027, "global_step": 191901, "epoch": 4569} {"train_loss": -7.097644805908203, "global_step": 191902, "epoch": 4569} {"train_loss": -7.300490379333496, "global_step": 191903, "epoch": 4569} {"train_loss": -7.0647292137146, "global_step": 191904, "epoch": 4569} {"train_loss": -7.2420172691345215, "global_step": 191905, "epoch": 4569} {"train_loss": -7.273358345031738, "global_step": 191906, "epoch": 4569} {"train_loss": -7.076957702636719, "global_step": 191907, "epoch": 4569} {"train_loss": -7.199637413024902, "global_step": 191908, "epoch": 4569} {"train_loss": -7.146130084991455, "global_step": 191909, "epoch": 4569} {"train_loss": -7.107527732849121, "global_step": 191910, "epoch": 4569} {"train_loss": -7.165968894958496, "global_step": 191911, "epoch": 4569} {"train_loss": -7.070350646972656, "global_step": 191912, "epoch": 4569} {"train_loss": -7.200970649719238, "global_step": 191913, "epoch": 4569} {"train_loss": -7.0558695793151855, "global_step": 191914, "epoch": 4569} {"train_loss": -7.261611461639404, "global_step": 191915, "epoch": 4569} {"train_loss": -7.294826507568359, "global_step": 191916, "epoch": 4569} {"train_loss": -7.146790504455566, "global_step": 191917, "epoch": 4569} {"train_loss": -7.213716983795166, "global_step": 191918, "epoch": 4569} {"train_loss": -7.017584323883057, "global_step": 191919, "epoch": 4569} {"train_loss": -7.226836204528809, "global_step": 191920, "epoch": 4569} {"train_loss": -7.187126636505127, "global_step": 191921, "epoch": 4569} {"train_loss": -7.215745449066162, "global_step": 191922, "epoch": 4569} {"train_loss": -7.14266300201416, "global_step": 191923, "epoch": 4569} {"train_loss": -7.125181674957275, "global_step": 191924, "epoch": 4569} {"train_loss": -7.265763282775879, "global_step": 191925, "epoch": 4569} {"train_loss": -7.07026481628418, "global_step": 191926, "epoch": 4569} {"train_loss": -7.1389594078063965, "global_step": 191927, "epoch": 4569} {"train_loss": -7.186345100402832, "global_step": 191928, "epoch": 4569} {"train_loss": -7.054529190063477, "global_step": 191929, "epoch": 4569} {"train_loss": -7.072919845581055, "global_step": 191930, "epoch": 4569} {"train_loss": -7.169739246368408, "global_step": 191931, "epoch": 4569} {"train_loss": -7.102416038513184, "global_step": 191932, "epoch": 4569} {"train_loss": -7.053486347198486, "global_step": 191933, "epoch": 4569} {"train_loss": -7.097297668457031, "global_step": 191934, "epoch": 4569} {"train_loss": -7.070148468017578, "global_step": 191935, "epoch": 4569} {"train_loss": -7.05894136428833, "global_step": 191936, "epoch": 4569} {"train_loss": -7.105184555053711, "global_step": 191937, "epoch": 4569} {"train_loss": -7.007646560668945, "global_step": 191938, "epoch": 4569} {"train_loss": -7.144595940907796, "global_step": 191939, "epoch": 4569, "val_loss": 69104.15625} {"train_loss": -7.208659648895264, "global_step": 191940, "epoch": 4570} {"train_loss": -7.183565139770508, "global_step": 191941, "epoch": 4570} {"train_loss": -7.080230236053467, "global_step": 191942, "epoch": 4570} {"train_loss": -7.125778675079346, "global_step": 191943, "epoch": 4570} {"train_loss": -7.120729446411133, "global_step": 191944, "epoch": 4570} {"train_loss": -7.277392387390137, "global_step": 191945, "epoch": 4570} {"train_loss": -7.173224449157715, "global_step": 191946, "epoch": 4570} {"train_loss": -7.104007244110107, "global_step": 191947, "epoch": 4570} {"train_loss": -7.067176818847656, "global_step": 191948, "epoch": 4570} {"train_loss": -7.272491455078125, "global_step": 191949, "epoch": 4570} {"train_loss": -7.130858421325684, "global_step": 191950, "epoch": 4570} {"train_loss": -7.186885356903076, "global_step": 191951, "epoch": 4570} {"train_loss": -7.141209125518799, "global_step": 191952, "epoch": 4570} {"train_loss": -7.229570388793945, "global_step": 191953, "epoch": 4570} {"train_loss": -7.155911445617676, "global_step": 191954, "epoch": 4570} {"train_loss": -7.1902360916137695, "global_step": 191955, "epoch": 4570} {"train_loss": -7.3130998611450195, "global_step": 191956, "epoch": 4570} {"train_loss": -7.161942005157471, "global_step": 191957, "epoch": 4570} {"train_loss": -7.120388031005859, "global_step": 191958, "epoch": 4570} {"train_loss": -7.215893745422363, "global_step": 191959, "epoch": 4570} {"train_loss": -7.239201545715332, "global_step": 191960, "epoch": 4570} {"train_loss": -7.095400810241699, "global_step": 191961, "epoch": 4570} {"train_loss": -7.264784812927246, "global_step": 191962, "epoch": 4570} {"train_loss": -7.173023700714111, "global_step": 191963, "epoch": 4570} {"train_loss": -7.180767059326172, "global_step": 191964, "epoch": 4570} {"train_loss": -7.232253074645996, "global_step": 191965, "epoch": 4570} {"train_loss": -7.305730819702148, "global_step": 191966, "epoch": 4570} {"train_loss": -7.186561584472656, "global_step": 191967, "epoch": 4570} {"train_loss": -7.229779243469238, "global_step": 191968, "epoch": 4570} {"train_loss": -7.11817741394043, "global_step": 191969, "epoch": 4570} {"train_loss": -7.154801368713379, "global_step": 191970, "epoch": 4570} {"train_loss": -7.188013076782227, "global_step": 191971, "epoch": 4570} {"train_loss": -7.084153175354004, "global_step": 191972, "epoch": 4570} {"train_loss": -7.212184906005859, "global_step": 191973, "epoch": 4570} {"train_loss": -7.135158538818359, "global_step": 191974, "epoch": 4570} {"train_loss": -7.140811920166016, "global_step": 191975, "epoch": 4570} {"train_loss": -7.208399772644043, "global_step": 191976, "epoch": 4570} {"train_loss": -7.078653812408447, "global_step": 191977, "epoch": 4570} {"train_loss": -7.23020076751709, "global_step": 191978, "epoch": 4570} {"train_loss": -7.20513391494751, "global_step": 191979, "epoch": 4570} {"train_loss": -7.051128387451172, "global_step": 191980, "epoch": 4570} {"train_loss": -7.176567304702032, "global_step": 191981, "epoch": 4570, "val_loss": 68938.96875} {"train_loss": -7.1946210861206055, "global_step": 191982, "epoch": 4571} {"train_loss": -7.107883453369141, "global_step": 191983, "epoch": 4571} {"train_loss": -7.275273323059082, "global_step": 191984, "epoch": 4571} {"train_loss": -7.038259029388428, "global_step": 191985, "epoch": 4571} {"train_loss": -7.13948917388916, "global_step": 191986, "epoch": 4571} {"train_loss": -7.264458656311035, "global_step": 191987, "epoch": 4571} {"train_loss": -7.064888954162598, "global_step": 191988, "epoch": 4571} {"train_loss": -7.200131416320801, "global_step": 191989, "epoch": 4571} {"train_loss": -7.137901306152344, "global_step": 191990, "epoch": 4571} {"train_loss": -7.151614189147949, "global_step": 191991, "epoch": 4571} {"train_loss": -7.387655258178711, "global_step": 191992, "epoch": 4571} {"train_loss": -7.096278190612793, "global_step": 191993, "epoch": 4571} {"train_loss": -7.252159118652344, "global_step": 191994, "epoch": 4571} {"train_loss": -7.2885847091674805, "global_step": 191995, "epoch": 4571} {"train_loss": -7.202236652374268, "global_step": 191996, "epoch": 4571} {"train_loss": -7.24446964263916, "global_step": 191997, "epoch": 4571} {"train_loss": -7.273051738739014, "global_step": 191998, "epoch": 4571} {"train_loss": -7.204152584075928, "global_step": 191999, "epoch": 4571} {"train_loss": -7.273271083831787, "global_step": 192000, "epoch": 4571} {"train_loss": -7.1247735023498535, "global_step": 192001, "epoch": 4571} {"train_loss": -7.200128078460693, "global_step": 192002, "epoch": 4571} {"train_loss": -7.174485683441162, "global_step": 192003, "epoch": 4571} {"train_loss": -7.188470840454102, "global_step": 192004, "epoch": 4571} {"train_loss": -7.161557674407959, "global_step": 192005, "epoch": 4571} {"train_loss": -6.995856761932373, "global_step": 192006, "epoch": 4571} {"train_loss": -7.1275224685668945, "global_step": 192007, "epoch": 4571} {"train_loss": -7.33221435546875, "global_step": 192008, "epoch": 4571} {"train_loss": -7.178627967834473, "global_step": 192009, "epoch": 4571} {"train_loss": -7.17061710357666, "global_step": 192010, "epoch": 4571} {"train_loss": -7.248126983642578, "global_step": 192011, "epoch": 4571} {"train_loss": -6.997767925262451, "global_step": 192012, "epoch": 4571} {"train_loss": -7.04322624206543, "global_step": 192013, "epoch": 4571} {"train_loss": -7.037919998168945, "global_step": 192014, "epoch": 4571} {"train_loss": -7.12288236618042, "global_step": 192015, "epoch": 4571} {"train_loss": -7.130338668823242, "global_step": 192016, "epoch": 4571} {"train_loss": -7.228304862976074, "global_step": 192017, "epoch": 4571} {"train_loss": -7.097387790679932, "global_step": 192018, "epoch": 4571} {"train_loss": -7.21411657333374, "global_step": 192019, "epoch": 4571} {"train_loss": -7.143847942352295, "global_step": 192020, "epoch": 4571} {"train_loss": -7.1182661056518555, "global_step": 192021, "epoch": 4571} {"train_loss": -7.191934585571289, "global_step": 192022, "epoch": 4571} {"train_loss": -7.169660011927287, "global_step": 192023, "epoch": 4571, "val_loss": 68845.8828125} {"train_loss": -7.141931533813477, "global_step": 192024, "epoch": 4572} {"train_loss": -7.173384189605713, "global_step": 192025, "epoch": 4572} {"train_loss": -7.243868350982666, "global_step": 192026, "epoch": 4572} {"train_loss": -7.1491594314575195, "global_step": 192027, "epoch": 4572} {"train_loss": -7.205437660217285, "global_step": 192028, "epoch": 4572} {"train_loss": -7.101356506347656, "global_step": 192029, "epoch": 4572} {"train_loss": -7.141797065734863, "global_step": 192030, "epoch": 4572} {"train_loss": -7.219474792480469, "global_step": 192031, "epoch": 4572} {"train_loss": -7.044061660766602, "global_step": 192032, "epoch": 4572} {"train_loss": -7.152289867401123, "global_step": 192033, "epoch": 4572} {"train_loss": -7.098269939422607, "global_step": 192034, "epoch": 4572} {"train_loss": -7.187412261962891, "global_step": 192035, "epoch": 4572} {"train_loss": -7.277693748474121, "global_step": 192036, "epoch": 4572} {"train_loss": -7.1136932373046875, "global_step": 192037, "epoch": 4572} {"train_loss": -7.208000659942627, "global_step": 192038, "epoch": 4572} {"train_loss": -7.177535057067871, "global_step": 192039, "epoch": 4572} {"train_loss": -7.181020736694336, "global_step": 192040, "epoch": 4572} {"train_loss": -7.147291660308838, "global_step": 192041, "epoch": 4572} {"train_loss": -7.205569267272949, "global_step": 192042, "epoch": 4572} {"train_loss": -7.190322399139404, "global_step": 192043, "epoch": 4572} {"train_loss": -7.223204612731934, "global_step": 192044, "epoch": 4572} {"train_loss": -7.136626243591309, "global_step": 192045, "epoch": 4572} {"train_loss": -7.114352703094482, "global_step": 192046, "epoch": 4572} {"train_loss": -7.106058597564697, "global_step": 192047, "epoch": 4572} {"train_loss": -7.194303512573242, "global_step": 192048, "epoch": 4572} {"train_loss": -7.143571376800537, "global_step": 192049, "epoch": 4572} {"train_loss": -7.179228782653809, "global_step": 192050, "epoch": 4572} {"train_loss": -7.161489486694336, "global_step": 192051, "epoch": 4572} {"train_loss": -7.002133369445801, "global_step": 192052, "epoch": 4572} {"train_loss": -7.069474220275879, "global_step": 192053, "epoch": 4572} {"train_loss": -7.189847946166992, "global_step": 192054, "epoch": 4572} {"train_loss": -7.110224723815918, "global_step": 192055, "epoch": 4572} {"train_loss": -7.058612823486328, "global_step": 192056, "epoch": 4572} {"train_loss": -7.2357282638549805, "global_step": 192057, "epoch": 4572} {"train_loss": -7.009861946105957, "global_step": 192058, "epoch": 4572} {"train_loss": -7.042469024658203, "global_step": 192059, "epoch": 4572} {"train_loss": -7.0841450691223145, "global_step": 192060, "epoch": 4572} {"train_loss": -7.08770751953125, "global_step": 192061, "epoch": 4572} {"train_loss": -7.183322906494141, "global_step": 192062, "epoch": 4572} {"train_loss": -7.15895938873291, "global_step": 192063, "epoch": 4572} {"train_loss": -7.191432476043701, "global_step": 192064, "epoch": 4572} {"train_loss": -7.146168107078189, "global_step": 192065, "epoch": 4572, "val_loss": 68844.328125} {"train_loss": -7.176266670227051, "global_step": 192066, "epoch": 4573} {"train_loss": -7.25522518157959, "global_step": 192067, "epoch": 4573} {"train_loss": -7.1539177894592285, "global_step": 192068, "epoch": 4573} {"train_loss": -7.0872697830200195, "global_step": 192069, "epoch": 4573} {"train_loss": -7.180635452270508, "global_step": 192070, "epoch": 4573} {"train_loss": -7.20887565612793, "global_step": 192071, "epoch": 4573} {"train_loss": -7.151789665222168, "global_step": 192072, "epoch": 4573} {"train_loss": -7.300495147705078, "global_step": 192073, "epoch": 4573} {"train_loss": -7.076595306396484, "global_step": 192074, "epoch": 4573} {"train_loss": -7.160614967346191, "global_step": 192075, "epoch": 4573} {"train_loss": -7.156140327453613, "global_step": 192076, "epoch": 4573} {"train_loss": -7.179529190063477, "global_step": 192077, "epoch": 4573} {"train_loss": -7.355949401855469, "global_step": 192078, "epoch": 4573} {"train_loss": -7.156888008117676, "global_step": 192079, "epoch": 4573} {"train_loss": -7.13608455657959, "global_step": 192080, "epoch": 4573} {"train_loss": -7.169124603271484, "global_step": 192081, "epoch": 4573} {"train_loss": -7.069531440734863, "global_step": 192082, "epoch": 4573} {"train_loss": -7.149028778076172, "global_step": 192083, "epoch": 4573} {"train_loss": -7.291581153869629, "global_step": 192084, "epoch": 4573} {"train_loss": -7.195776462554932, "global_step": 192085, "epoch": 4573} {"train_loss": -7.2698163986206055, "global_step": 192086, "epoch": 4573} {"train_loss": -7.220685005187988, "global_step": 192087, "epoch": 4573} {"train_loss": -7.1956329345703125, "global_step": 192088, "epoch": 4573} {"train_loss": -7.261721611022949, "global_step": 192089, "epoch": 4573} {"train_loss": -7.316826820373535, "global_step": 192090, "epoch": 4573} {"train_loss": -7.069612503051758, "global_step": 192091, "epoch": 4573} {"train_loss": -7.232346534729004, "global_step": 192092, "epoch": 4573} {"train_loss": -7.0896759033203125, "global_step": 192093, "epoch": 4573} {"train_loss": -7.224981307983398, "global_step": 192094, "epoch": 4573} {"train_loss": -7.235880374908447, "global_step": 192095, "epoch": 4573} {"train_loss": -7.158607482910156, "global_step": 192096, "epoch": 4573} {"train_loss": -7.183219909667969, "global_step": 192097, "epoch": 4573} {"train_loss": -7.171829700469971, "global_step": 192098, "epoch": 4573} {"train_loss": -7.206198692321777, "global_step": 192099, "epoch": 4573} {"train_loss": -7.136453151702881, "global_step": 192100, "epoch": 4573} {"train_loss": -7.223446846008301, "global_step": 192101, "epoch": 4573} {"train_loss": -7.17180061340332, "global_step": 192102, "epoch": 4573} {"train_loss": -7.028107166290283, "global_step": 192103, "epoch": 4573} {"train_loss": -7.321235656738281, "global_step": 192104, "epoch": 4573} {"train_loss": -7.071076393127441, "global_step": 192105, "epoch": 4573} {"train_loss": -7.0673418045043945, "global_step": 192106, "epoch": 4573} {"train_loss": -7.18207573890686, "global_step": 192107, "epoch": 4573, "val_loss": 68886.7578125} {"train_loss": -7.148053169250488, "global_step": 192108, "epoch": 4574} {"train_loss": -7.08681583404541, "global_step": 192109, "epoch": 4574} {"train_loss": -7.167416572570801, "global_step": 192110, "epoch": 4574} {"train_loss": -7.154691696166992, "global_step": 192111, "epoch": 4574} {"train_loss": -7.12272834777832, "global_step": 192112, "epoch": 4574} {"train_loss": -7.228504180908203, "global_step": 192113, "epoch": 4574} {"train_loss": -7.121964454650879, "global_step": 192114, "epoch": 4574} {"train_loss": -7.113958835601807, "global_step": 192115, "epoch": 4574} {"train_loss": -7.225131511688232, "global_step": 192116, "epoch": 4574} {"train_loss": -7.114004135131836, "global_step": 192117, "epoch": 4574} {"train_loss": -7.208640098571777, "global_step": 192118, "epoch": 4574} {"train_loss": -7.116584300994873, "global_step": 192119, "epoch": 4574} {"train_loss": -7.231960773468018, "global_step": 192120, "epoch": 4574} {"train_loss": -7.107408046722412, "global_step": 192121, "epoch": 4574} {"train_loss": -7.081019401550293, "global_step": 192122, "epoch": 4574} {"train_loss": -7.083317279815674, "global_step": 192123, "epoch": 4574} {"train_loss": -7.114588737487793, "global_step": 192124, "epoch": 4574} {"train_loss": -7.155989646911621, "global_step": 192125, "epoch": 4574} {"train_loss": -7.0894293785095215, "global_step": 192126, "epoch": 4574} {"train_loss": -7.103865623474121, "global_step": 192127, "epoch": 4574} {"train_loss": -7.182938575744629, "global_step": 192128, "epoch": 4574} {"train_loss": -7.248396396636963, "global_step": 192129, "epoch": 4574} {"train_loss": -7.225695610046387, "global_step": 192130, "epoch": 4574} {"train_loss": -7.179228782653809, "global_step": 192131, "epoch": 4574} {"train_loss": -7.120326995849609, "global_step": 192132, "epoch": 4574} {"train_loss": -7.217159271240234, "global_step": 192133, "epoch": 4574} {"train_loss": -7.178081035614014, "global_step": 192134, "epoch": 4574} {"train_loss": -7.1714911460876465, "global_step": 192135, "epoch": 4574} {"train_loss": -7.174343109130859, "global_step": 192136, "epoch": 4574} {"train_loss": -7.132711410522461, "global_step": 192137, "epoch": 4574} {"train_loss": -7.157416820526123, "global_step": 192138, "epoch": 4574} {"train_loss": -7.24454402923584, "global_step": 192139, "epoch": 4574} {"train_loss": -7.292169570922852, "global_step": 192140, "epoch": 4574} {"train_loss": -7.30482292175293, "global_step": 192141, "epoch": 4574} {"train_loss": -7.040143966674805, "global_step": 192142, "epoch": 4574} {"train_loss": -7.106940269470215, "global_step": 192143, "epoch": 4574} {"train_loss": -7.220287799835205, "global_step": 192144, "epoch": 4574} {"train_loss": -7.070629119873047, "global_step": 192145, "epoch": 4574} {"train_loss": -7.1628828048706055, "global_step": 192146, "epoch": 4574} {"train_loss": -7.199875354766846, "global_step": 192147, "epoch": 4574} {"train_loss": -7.156777858734131, "global_step": 192148, "epoch": 4574} {"train_loss": -7.1620695023309615, "global_step": 192149, "epoch": 4574, "val_loss": 68886.6796875} {"train_loss": -7.2537641525268555, "global_step": 192150, "epoch": 4575} {"train_loss": -7.098589897155762, "global_step": 192151, "epoch": 4575} {"train_loss": -7.212648868560791, "global_step": 192152, "epoch": 4575} {"train_loss": -7.271790504455566, "global_step": 192153, "epoch": 4575} {"train_loss": -7.176187038421631, "global_step": 192154, "epoch": 4575} {"train_loss": -7.137867450714111, "global_step": 192155, "epoch": 4575} {"train_loss": -7.178536415100098, "global_step": 192156, "epoch": 4575} {"train_loss": -7.0873565673828125, "global_step": 192157, "epoch": 4575} {"train_loss": -7.0773606300354, "global_step": 192158, "epoch": 4575} {"train_loss": -7.177046775817871, "global_step": 192159, "epoch": 4575} {"train_loss": -7.027543544769287, "global_step": 192160, "epoch": 4575} {"train_loss": -7.190655708312988, "global_step": 192161, "epoch": 4575} {"train_loss": -7.132591247558594, "global_step": 192162, "epoch": 4575} {"train_loss": -7.272206783294678, "global_step": 192163, "epoch": 4575} {"train_loss": -7.169633865356445, "global_step": 192164, "epoch": 4575} {"train_loss": -7.168871879577637, "global_step": 192165, "epoch": 4575} {"train_loss": -7.217096328735352, "global_step": 192166, "epoch": 4575} {"train_loss": -7.27689790725708, "global_step": 192167, "epoch": 4575} {"train_loss": -7.115076541900635, "global_step": 192168, "epoch": 4575} {"train_loss": -7.200860977172852, "global_step": 192169, "epoch": 4575} {"train_loss": -7.202890396118164, "global_step": 192170, "epoch": 4575} {"train_loss": -7.194953918457031, "global_step": 192171, "epoch": 4575} {"train_loss": -7.144282341003418, "global_step": 192172, "epoch": 4575} {"train_loss": -7.224045753479004, "global_step": 192173, "epoch": 4575} {"train_loss": -7.083174705505371, "global_step": 192174, "epoch": 4575} {"train_loss": -7.096427917480469, "global_step": 192175, "epoch": 4575} {"train_loss": -7.203886985778809, "global_step": 192176, "epoch": 4575} {"train_loss": -7.179012298583984, "global_step": 192177, "epoch": 4575} {"train_loss": -7.220317840576172, "global_step": 192178, "epoch": 4575} {"train_loss": -7.103541374206543, "global_step": 192179, "epoch": 4575} {"train_loss": -7.160190582275391, "global_step": 192180, "epoch": 4575} {"train_loss": -7.1667938232421875, "global_step": 192181, "epoch": 4575} {"train_loss": -7.046848297119141, "global_step": 192182, "epoch": 4575} {"train_loss": -7.196422576904297, "global_step": 192183, "epoch": 4575} {"train_loss": -7.25412654876709, "global_step": 192184, "epoch": 4575} {"train_loss": -7.211824417114258, "global_step": 192185, "epoch": 4575} {"train_loss": -7.163722991943359, "global_step": 192186, "epoch": 4575} {"train_loss": -7.126012802124023, "global_step": 192187, "epoch": 4575} {"train_loss": -7.256764888763428, "global_step": 192188, "epoch": 4575} {"train_loss": -7.090288162231445, "global_step": 192189, "epoch": 4575} {"train_loss": -7.075068473815918, "global_step": 192190, "epoch": 4575} {"train_loss": -7.164975552331834, "global_step": 192191, "epoch": 4575, "val_loss": 69135.21875} {"train_loss": -7.172571182250977, "global_step": 192192, "epoch": 4576} {"train_loss": -7.333644390106201, "global_step": 192193, "epoch": 4576} {"train_loss": -7.038098335266113, "global_step": 192194, "epoch": 4576} {"train_loss": -7.213723182678223, "global_step": 192195, "epoch": 4576} {"train_loss": -7.134354591369629, "global_step": 192196, "epoch": 4576} {"train_loss": -7.170120716094971, "global_step": 192197, "epoch": 4576} {"train_loss": -7.27114725112915, "global_step": 192198, "epoch": 4576} {"train_loss": -7.1239824295043945, "global_step": 192199, "epoch": 4576} {"train_loss": -7.175708770751953, "global_step": 192200, "epoch": 4576} {"train_loss": -7.06948184967041, "global_step": 192201, "epoch": 4576} {"train_loss": -7.150805473327637, "global_step": 192202, "epoch": 4576} {"train_loss": -7.049682140350342, "global_step": 192203, "epoch": 4576} {"train_loss": -7.039716720581055, "global_step": 192204, "epoch": 4576} {"train_loss": -6.901395797729492, "global_step": 192205, "epoch": 4576} {"train_loss": -7.125742435455322, "global_step": 192206, "epoch": 4576} {"train_loss": -7.001791000366211, "global_step": 192207, "epoch": 4576} {"train_loss": -7.0380964279174805, "global_step": 192208, "epoch": 4576} {"train_loss": -7.043824195861816, "global_step": 192209, "epoch": 4576} {"train_loss": -7.03558349609375, "global_step": 192210, "epoch": 4576} {"train_loss": -6.951271057128906, "global_step": 192211, "epoch": 4576} {"train_loss": -7.164254188537598, "global_step": 192212, "epoch": 4576} {"train_loss": -7.124493598937988, "global_step": 192213, "epoch": 4576} {"train_loss": -7.114520072937012, "global_step": 192214, "epoch": 4576} {"train_loss": -7.025945663452148, "global_step": 192215, "epoch": 4576} {"train_loss": -7.061388969421387, "global_step": 192216, "epoch": 4576} {"train_loss": -7.231982231140137, "global_step": 192217, "epoch": 4576} {"train_loss": -6.9974589347839355, "global_step": 192218, "epoch": 4576} {"train_loss": -7.118938446044922, "global_step": 192219, "epoch": 4576} {"train_loss": -7.046095848083496, "global_step": 192220, "epoch": 4576} {"train_loss": -7.133657932281494, "global_step": 192221, "epoch": 4576} {"train_loss": -7.068333625793457, "global_step": 192222, "epoch": 4576} {"train_loss": -7.0780792236328125, "global_step": 192223, "epoch": 4576} {"train_loss": -7.198119163513184, "global_step": 192224, "epoch": 4576} {"train_loss": -7.107974529266357, "global_step": 192225, "epoch": 4576} {"train_loss": -7.1125054359436035, "global_step": 192226, "epoch": 4576} {"train_loss": -7.127182483673096, "global_step": 192227, "epoch": 4576} {"train_loss": -7.197391510009766, "global_step": 192228, "epoch": 4576} {"train_loss": -7.208076477050781, "global_step": 192229, "epoch": 4576} {"train_loss": -7.124049186706543, "global_step": 192230, "epoch": 4576} {"train_loss": -7.207352161407471, "global_step": 192231, "epoch": 4576} {"train_loss": -7.083358287811279, "global_step": 192232, "epoch": 4576} {"train_loss": -7.109734126499721, "global_step": 192233, "epoch": 4576, "val_loss": 68962.7578125} {"train_loss": -7.23153018951416, "global_step": 192234, "epoch": 4577} {"train_loss": -7.135059356689453, "global_step": 192235, "epoch": 4577} {"train_loss": -7.231656074523926, "global_step": 192236, "epoch": 4577} {"train_loss": -7.0960612297058105, "global_step": 192237, "epoch": 4577} {"train_loss": -7.09630012512207, "global_step": 192238, "epoch": 4577} {"train_loss": -7.167000770568848, "global_step": 192239, "epoch": 4577} {"train_loss": -6.996591091156006, "global_step": 192240, "epoch": 4577} {"train_loss": -7.159605026245117, "global_step": 192241, "epoch": 4577} {"train_loss": -7.033938407897949, "global_step": 192242, "epoch": 4577} {"train_loss": -7.063315391540527, "global_step": 192243, "epoch": 4577} {"train_loss": -6.99099063873291, "global_step": 192244, "epoch": 4577} {"train_loss": -7.058925151824951, "global_step": 192245, "epoch": 4577} {"train_loss": -7.121713161468506, "global_step": 192246, "epoch": 4577} {"train_loss": -7.164070129394531, "global_step": 192247, "epoch": 4577} {"train_loss": -7.012168884277344, "global_step": 192248, "epoch": 4577} {"train_loss": -7.183045387268066, "global_step": 192249, "epoch": 4577} {"train_loss": -7.101677894592285, "global_step": 192250, "epoch": 4577} {"train_loss": -7.116671085357666, "global_step": 192251, "epoch": 4577} {"train_loss": -7.122244358062744, "global_step": 192252, "epoch": 4577} {"train_loss": -7.158649444580078, "global_step": 192253, "epoch": 4577} {"train_loss": -6.927680015563965, "global_step": 192254, "epoch": 4577} {"train_loss": -7.075599193572998, "global_step": 192255, "epoch": 4577} {"train_loss": -7.111708641052246, "global_step": 192256, "epoch": 4577} {"train_loss": -7.144222736358643, "global_step": 192257, "epoch": 4577} {"train_loss": -7.1477179527282715, "global_step": 192258, "epoch": 4577} {"train_loss": -7.071351528167725, "global_step": 192259, "epoch": 4577} {"train_loss": -7.144339084625244, "global_step": 192260, "epoch": 4577} {"train_loss": -7.116320610046387, "global_step": 192261, "epoch": 4577} {"train_loss": -7.122437953948975, "global_step": 192262, "epoch": 4577} {"train_loss": -7.216808319091797, "global_step": 192263, "epoch": 4577} {"train_loss": -7.080417156219482, "global_step": 192264, "epoch": 4577} {"train_loss": -7.284024238586426, "global_step": 192265, "epoch": 4577} {"train_loss": -7.0698089599609375, "global_step": 192266, "epoch": 4577} {"train_loss": -7.184887886047363, "global_step": 192267, "epoch": 4577} {"train_loss": -7.194869041442871, "global_step": 192268, "epoch": 4577} {"train_loss": -7.054626941680908, "global_step": 192269, "epoch": 4577} {"train_loss": -7.1793999671936035, "global_step": 192270, "epoch": 4577} {"train_loss": -7.196219444274902, "global_step": 192271, "epoch": 4577} {"train_loss": -7.01708984375, "global_step": 192272, "epoch": 4577} {"train_loss": -7.298287391662598, "global_step": 192273, "epoch": 4577} {"train_loss": -7.2965545654296875, "global_step": 192274, "epoch": 4577} {"train_loss": -7.129898423240299, "global_step": 192275, "epoch": 4577, "val_loss": 68928.5390625} {"train_loss": -7.218050479888916, "global_step": 192276, "epoch": 4578} {"train_loss": -7.229348182678223, "global_step": 192277, "epoch": 4578} {"train_loss": -7.243356704711914, "global_step": 192278, "epoch": 4578} {"train_loss": -7.25160026550293, "global_step": 192279, "epoch": 4578} {"train_loss": -7.229233741760254, "global_step": 192280, "epoch": 4578} {"train_loss": -7.194894313812256, "global_step": 192281, "epoch": 4578} {"train_loss": -7.2561140060424805, "global_step": 192282, "epoch": 4578} {"train_loss": -7.266110420227051, "global_step": 192283, "epoch": 4578} {"train_loss": -7.201413154602051, "global_step": 192284, "epoch": 4578} {"train_loss": -7.331880569458008, "global_step": 192285, "epoch": 4578} {"train_loss": -7.205849647521973, "global_step": 192286, "epoch": 4578} {"train_loss": -7.266454696655273, "global_step": 192287, "epoch": 4578} {"train_loss": -7.087619781494141, "global_step": 192288, "epoch": 4578} {"train_loss": -7.206827163696289, "global_step": 192289, "epoch": 4578} {"train_loss": -7.31059455871582, "global_step": 192290, "epoch": 4578} {"train_loss": -7.268918037414551, "global_step": 192291, "epoch": 4578} {"train_loss": -7.240504264831543, "global_step": 192292, "epoch": 4578} {"train_loss": -7.332915306091309, "global_step": 192293, "epoch": 4578} {"train_loss": -7.319765090942383, "global_step": 192294, "epoch": 4578} {"train_loss": -7.219709396362305, "global_step": 192295, "epoch": 4578} {"train_loss": -7.248140335083008, "global_step": 192296, "epoch": 4578} {"train_loss": -7.129896640777588, "global_step": 192297, "epoch": 4578} {"train_loss": -7.157538890838623, "global_step": 192298, "epoch": 4578} {"train_loss": -7.167468070983887, "global_step": 192299, "epoch": 4578} {"train_loss": -7.129445552825928, "global_step": 192300, "epoch": 4578} {"train_loss": -7.151059150695801, "global_step": 192301, "epoch": 4578} {"train_loss": -7.141371726989746, "global_step": 192302, "epoch": 4578} {"train_loss": -7.159136772155762, "global_step": 192303, "epoch": 4578} {"train_loss": -7.09382438659668, "global_step": 192304, "epoch": 4578} {"train_loss": -7.2133259773254395, "global_step": 192305, "epoch": 4578} {"train_loss": -7.061093330383301, "global_step": 192306, "epoch": 4578} {"train_loss": -7.103395462036133, "global_step": 192307, "epoch": 4578} {"train_loss": -7.255783557891846, "global_step": 192308, "epoch": 4578} {"train_loss": -7.045433044433594, "global_step": 192309, "epoch": 4578} {"train_loss": -7.068362712860107, "global_step": 192310, "epoch": 4578} {"train_loss": -7.191019058227539, "global_step": 192311, "epoch": 4578} {"train_loss": -7.107487678527832, "global_step": 192312, "epoch": 4578} {"train_loss": -7.198898792266846, "global_step": 192313, "epoch": 4578} {"train_loss": -7.048864364624023, "global_step": 192314, "epoch": 4578} {"train_loss": -7.058849334716797, "global_step": 192315, "epoch": 4578} {"train_loss": -7.182187557220459, "global_step": 192316, "epoch": 4578} {"train_loss": -7.188582454408918, "global_step": 192317, "epoch": 4578, "val_loss": 68966.8984375} {"train_loss": -7.123698711395264, "global_step": 192318, "epoch": 4579} {"train_loss": -7.1141462326049805, "global_step": 192319, "epoch": 4579} {"train_loss": -7.0131707191467285, "global_step": 192320, "epoch": 4579} {"train_loss": -7.019491672515869, "global_step": 192321, "epoch": 4579} {"train_loss": -6.990778923034668, "global_step": 192322, "epoch": 4579} {"train_loss": -7.150197982788086, "global_step": 192323, "epoch": 4579} {"train_loss": -7.14250373840332, "global_step": 192324, "epoch": 4579} {"train_loss": -7.068427085876465, "global_step": 192325, "epoch": 4579} {"train_loss": -7.1847028732299805, "global_step": 192326, "epoch": 4579} {"train_loss": -7.152478218078613, "global_step": 192327, "epoch": 4579} {"train_loss": -7.119171142578125, "global_step": 192328, "epoch": 4579} {"train_loss": -7.2446136474609375, "global_step": 192329, "epoch": 4579} {"train_loss": -7.303081512451172, "global_step": 192330, "epoch": 4579} {"train_loss": -7.200959205627441, "global_step": 192331, "epoch": 4579} {"train_loss": -7.203256607055664, "global_step": 192332, "epoch": 4579} {"train_loss": -7.25230598449707, "global_step": 192333, "epoch": 4579} {"train_loss": -7.0393548011779785, "global_step": 192334, "epoch": 4579} {"train_loss": -7.09169864654541, "global_step": 192335, "epoch": 4579} {"train_loss": -7.278217792510986, "global_step": 192336, "epoch": 4579} {"train_loss": -7.204145431518555, "global_step": 192337, "epoch": 4579} {"train_loss": -7.105790138244629, "global_step": 192338, "epoch": 4579} {"train_loss": -7.099790573120117, "global_step": 192339, "epoch": 4579} {"train_loss": -7.225906848907471, "global_step": 192340, "epoch": 4579} {"train_loss": -7.128366470336914, "global_step": 192341, "epoch": 4579} {"train_loss": -7.103603363037109, "global_step": 192342, "epoch": 4579} {"train_loss": -7.192144870758057, "global_step": 192343, "epoch": 4579} {"train_loss": -7.120150566101074, "global_step": 192344, "epoch": 4579} {"train_loss": -7.024726867675781, "global_step": 192345, "epoch": 4579} {"train_loss": -7.1613969802856445, "global_step": 192346, "epoch": 4579} {"train_loss": -7.22358512878418, "global_step": 192347, "epoch": 4579} {"train_loss": -7.236660003662109, "global_step": 192348, "epoch": 4579} {"train_loss": -7.1742844581604, "global_step": 192349, "epoch": 4579} {"train_loss": -7.167449474334717, "global_step": 192350, "epoch": 4579} {"train_loss": -7.22428560256958, "global_step": 192351, "epoch": 4579} {"train_loss": -7.093008041381836, "global_step": 192352, "epoch": 4579} {"train_loss": -7.152963638305664, "global_step": 192353, "epoch": 4579} {"train_loss": -7.153992652893066, "global_step": 192354, "epoch": 4579} {"train_loss": -7.011290550231934, "global_step": 192355, "epoch": 4579} {"train_loss": -7.137716770172119, "global_step": 192356, "epoch": 4579} {"train_loss": -7.252540588378906, "global_step": 192357, "epoch": 4579} {"train_loss": -7.036689758300781, "global_step": 192358, "epoch": 4579} {"train_loss": -7.1411188670567105, "global_step": 192359, "epoch": 4579, "val_loss": 68939.6640625} {"train_loss": -6.891308784484863, "global_step": 192360, "epoch": 4580} {"train_loss": -7.148425102233887, "global_step": 192361, "epoch": 4580} {"train_loss": -7.119417190551758, "global_step": 192362, "epoch": 4580} {"train_loss": -7.120650291442871, "global_step": 192363, "epoch": 4580} {"train_loss": -7.132673263549805, "global_step": 192364, "epoch": 4580} {"train_loss": -7.1299357414245605, "global_step": 192365, "epoch": 4580} {"train_loss": -7.122660160064697, "global_step": 192366, "epoch": 4580} {"train_loss": -7.0807905197143555, "global_step": 192367, "epoch": 4580} {"train_loss": -7.097002983093262, "global_step": 192368, "epoch": 4580} {"train_loss": -6.965406894683838, "global_step": 192369, "epoch": 4580} {"train_loss": -7.070620059967041, "global_step": 192370, "epoch": 4580} {"train_loss": -7.153780937194824, "global_step": 192371, "epoch": 4580} {"train_loss": -7.174862861633301, "global_step": 192372, "epoch": 4580} {"train_loss": -7.147223472595215, "global_step": 192373, "epoch": 4580} {"train_loss": -7.164015769958496, "global_step": 192374, "epoch": 4580} {"train_loss": -7.074680328369141, "global_step": 192375, "epoch": 4580} {"train_loss": -7.130770683288574, "global_step": 192376, "epoch": 4580} {"train_loss": -7.106334686279297, "global_step": 192377, "epoch": 4580} {"train_loss": -7.2474894523620605, "global_step": 192378, "epoch": 4580} {"train_loss": -7.185971260070801, "global_step": 192379, "epoch": 4580} {"train_loss": -7.157672882080078, "global_step": 192380, "epoch": 4580} {"train_loss": -7.223592281341553, "global_step": 192381, "epoch": 4580} {"train_loss": -7.209435939788818, "global_step": 192382, "epoch": 4580} {"train_loss": -7.10156774520874, "global_step": 192383, "epoch": 4580} {"train_loss": -7.112973690032959, "global_step": 192384, "epoch": 4580} {"train_loss": -7.12966251373291, "global_step": 192385, "epoch": 4580} {"train_loss": -7.198285102844238, "global_step": 192386, "epoch": 4580} {"train_loss": -7.215196132659912, "global_step": 192387, "epoch": 4580} {"train_loss": -7.234673023223877, "global_step": 192388, "epoch": 4580} {"train_loss": -7.292829990386963, "global_step": 192389, "epoch": 4580} {"train_loss": -7.158109188079834, "global_step": 192390, "epoch": 4580} {"train_loss": -7.133227348327637, "global_step": 192391, "epoch": 4580} {"train_loss": -7.219826698303223, "global_step": 192392, "epoch": 4580} {"train_loss": -7.0816192626953125, "global_step": 192393, "epoch": 4580} {"train_loss": -7.287784099578857, "global_step": 192394, "epoch": 4580} {"train_loss": -7.365654468536377, "global_step": 192395, "epoch": 4580} {"train_loss": -7.186988830566406, "global_step": 192396, "epoch": 4580} {"train_loss": -7.161996364593506, "global_step": 192397, "epoch": 4580} {"train_loss": -7.311121463775635, "global_step": 192398, "epoch": 4580} {"train_loss": -7.192051410675049, "global_step": 192399, "epoch": 4580} {"train_loss": -7.136963844299316, "global_step": 192400, "epoch": 4580} {"train_loss": -7.152785426094418, "global_step": 192401, "epoch": 4580, "val_loss": 69018.4453125} {"train_loss": -7.243351459503174, "global_step": 192402, "epoch": 4581} {"train_loss": -7.309847354888916, "global_step": 192403, "epoch": 4581} {"train_loss": -7.213599681854248, "global_step": 192404, "epoch": 4581} {"train_loss": -7.279186248779297, "global_step": 192405, "epoch": 4581} {"train_loss": -7.23321533203125, "global_step": 192406, "epoch": 4581} {"train_loss": -7.316286563873291, "global_step": 192407, "epoch": 4581} {"train_loss": -7.1767191886901855, "global_step": 192408, "epoch": 4581} {"train_loss": -7.062187194824219, "global_step": 192409, "epoch": 4581} {"train_loss": -7.287375450134277, "global_step": 192410, "epoch": 4581} {"train_loss": -7.278001308441162, "global_step": 192411, "epoch": 4581} {"train_loss": -7.295095443725586, "global_step": 192412, "epoch": 4581} {"train_loss": -7.230385780334473, "global_step": 192413, "epoch": 4581} {"train_loss": -7.283237457275391, "global_step": 192414, "epoch": 4581} {"train_loss": -7.121586322784424, "global_step": 192415, "epoch": 4581} {"train_loss": -7.151586532592773, "global_step": 192416, "epoch": 4581} {"train_loss": -7.423295974731445, "global_step": 192417, "epoch": 4581} {"train_loss": -7.133081912994385, "global_step": 192418, "epoch": 4581} {"train_loss": -7.204405307769775, "global_step": 192419, "epoch": 4581} {"train_loss": -7.213215351104736, "global_step": 192420, "epoch": 4581} {"train_loss": -7.217292785644531, "global_step": 192421, "epoch": 4581} {"train_loss": -7.2259039878845215, "global_step": 192422, "epoch": 4581} {"train_loss": -7.27614164352417, "global_step": 192423, "epoch": 4581} {"train_loss": -7.256396770477295, "global_step": 192424, "epoch": 4581} {"train_loss": -7.23135232925415, "global_step": 192425, "epoch": 4581} {"train_loss": -7.176283836364746, "global_step": 192426, "epoch": 4581} {"train_loss": -7.184757232666016, "global_step": 192427, "epoch": 4581} {"train_loss": -7.246979236602783, "global_step": 192428, "epoch": 4581} {"train_loss": -7.158555030822754, "global_step": 192429, "epoch": 4581} {"train_loss": -7.165311813354492, "global_step": 192430, "epoch": 4581} {"train_loss": -7.2014360427856445, "global_step": 192431, "epoch": 4581} {"train_loss": -7.215249061584473, "global_step": 192432, "epoch": 4581} {"train_loss": -7.170879364013672, "global_step": 192433, "epoch": 4581} {"train_loss": -7.202696323394775, "global_step": 192434, "epoch": 4581} {"train_loss": -7.154629707336426, "global_step": 192435, "epoch": 4581} {"train_loss": -7.2732367515563965, "global_step": 192436, "epoch": 4581} {"train_loss": -7.087934970855713, "global_step": 192437, "epoch": 4581} {"train_loss": -7.050110816955566, "global_step": 192438, "epoch": 4581} {"train_loss": -7.059377670288086, "global_step": 192439, "epoch": 4581} {"train_loss": -7.081430435180664, "global_step": 192440, "epoch": 4581} {"train_loss": -7.1103997230529785, "global_step": 192441, "epoch": 4581} {"train_loss": -7.042545318603516, "global_step": 192442, "epoch": 4581} {"train_loss": -7.200730062666393, "global_step": 192443, "epoch": 4581, "val_loss": 68871.359375} {"train_loss": -7.03364372253418, "global_step": 192444, "epoch": 4582} {"train_loss": -7.081569671630859, "global_step": 192445, "epoch": 4582} {"train_loss": -7.0971808433532715, "global_step": 192446, "epoch": 4582} {"train_loss": -7.136216163635254, "global_step": 192447, "epoch": 4582} {"train_loss": -7.071683406829834, "global_step": 192448, "epoch": 4582} {"train_loss": -7.228950023651123, "global_step": 192449, "epoch": 4582} {"train_loss": -7.072049140930176, "global_step": 192450, "epoch": 4582} {"train_loss": -7.19751501083374, "global_step": 192451, "epoch": 4582} {"train_loss": -7.064706802368164, "global_step": 192452, "epoch": 4582} {"train_loss": -7.047512054443359, "global_step": 192453, "epoch": 4582} {"train_loss": -7.091095924377441, "global_step": 192454, "epoch": 4582} {"train_loss": -7.215498924255371, "global_step": 192455, "epoch": 4582} {"train_loss": -7.146750450134277, "global_step": 192456, "epoch": 4582} {"train_loss": -7.146878242492676, "global_step": 192457, "epoch": 4582} {"train_loss": -7.172174453735352, "global_step": 192458, "epoch": 4582} {"train_loss": -7.230334281921387, "global_step": 192459, "epoch": 4582} {"train_loss": -7.163032531738281, "global_step": 192460, "epoch": 4582} {"train_loss": -7.119693756103516, "global_step": 192461, "epoch": 4582} {"train_loss": -7.30279016494751, "global_step": 192462, "epoch": 4582} {"train_loss": -7.1740217208862305, "global_step": 192463, "epoch": 4582} {"train_loss": -7.303034782409668, "global_step": 192464, "epoch": 4582} {"train_loss": -7.2342305183410645, "global_step": 192465, "epoch": 4582} {"train_loss": -7.064116477966309, "global_step": 192466, "epoch": 4582} {"train_loss": -7.215030670166016, "global_step": 192467, "epoch": 4582} {"train_loss": -7.226168632507324, "global_step": 192468, "epoch": 4582} {"train_loss": -7.197437763214111, "global_step": 192469, "epoch": 4582} {"train_loss": -7.146603584289551, "global_step": 192470, "epoch": 4582} {"train_loss": -7.25723934173584, "global_step": 192471, "epoch": 4582} {"train_loss": -7.102327346801758, "global_step": 192472, "epoch": 4582} {"train_loss": -7.155101776123047, "global_step": 192473, "epoch": 4582} {"train_loss": -7.096190452575684, "global_step": 192474, "epoch": 4582} {"train_loss": -7.149366855621338, "global_step": 192475, "epoch": 4582} {"train_loss": -7.164956569671631, "global_step": 192476, "epoch": 4582} {"train_loss": -7.150814533233643, "global_step": 192477, "epoch": 4582} {"train_loss": -7.127425670623779, "global_step": 192478, "epoch": 4582} {"train_loss": -7.116101264953613, "global_step": 192479, "epoch": 4582} {"train_loss": -7.1393232345581055, "global_step": 192480, "epoch": 4582} {"train_loss": -7.208165168762207, "global_step": 192481, "epoch": 4582} {"train_loss": -7.176881313323975, "global_step": 192482, "epoch": 4582} {"train_loss": -7.2808732986450195, "global_step": 192483, "epoch": 4582} {"train_loss": -7.133669376373291, "global_step": 192484, "epoch": 4582} {"train_loss": -7.159599633443923, "global_step": 192485, "epoch": 4582, "val_loss": 68911.859375} {"train_loss": -7.124797344207764, "global_step": 192486, "epoch": 4583} {"train_loss": -7.225278854370117, "global_step": 192487, "epoch": 4583} {"train_loss": -7.263733863830566, "global_step": 192488, "epoch": 4583} {"train_loss": -7.036581039428711, "global_step": 192489, "epoch": 4583} {"train_loss": -7.038564205169678, "global_step": 192490, "epoch": 4583} {"train_loss": -7.121041297912598, "global_step": 192491, "epoch": 4583} {"train_loss": -7.140355110168457, "global_step": 192492, "epoch": 4583} {"train_loss": -7.042330265045166, "global_step": 192493, "epoch": 4583} {"train_loss": -7.236396789550781, "global_step": 192494, "epoch": 4583} {"train_loss": -7.070943355560303, "global_step": 192495, "epoch": 4583} {"train_loss": -7.003791809082031, "global_step": 192496, "epoch": 4583} {"train_loss": -7.234231948852539, "global_step": 192497, "epoch": 4583} {"train_loss": -7.088360786437988, "global_step": 192498, "epoch": 4583} {"train_loss": -7.125679016113281, "global_step": 192499, "epoch": 4583} {"train_loss": -7.130401134490967, "global_step": 192500, "epoch": 4583} {"train_loss": -7.173436164855957, "global_step": 192501, "epoch": 4583} {"train_loss": -7.196976661682129, "global_step": 192502, "epoch": 4583} {"train_loss": -7.156903266906738, "global_step": 192503, "epoch": 4583} {"train_loss": -7.103496551513672, "global_step": 192504, "epoch": 4583} {"train_loss": -7.182342052459717, "global_step": 192505, "epoch": 4583} {"train_loss": -7.207666397094727, "global_step": 192506, "epoch": 4583} {"train_loss": -7.1505327224731445, "global_step": 192507, "epoch": 4583} {"train_loss": -7.118006229400635, "global_step": 192508, "epoch": 4583} {"train_loss": -7.16207218170166, "global_step": 192509, "epoch": 4583} {"train_loss": -7.082968711853027, "global_step": 192510, "epoch": 4583} {"train_loss": -7.1570281982421875, "global_step": 192511, "epoch": 4583} {"train_loss": -7.155418395996094, "global_step": 192512, "epoch": 4583} {"train_loss": -7.26346492767334, "global_step": 192513, "epoch": 4583} {"train_loss": -7.173338890075684, "global_step": 192514, "epoch": 4583} {"train_loss": -7.171272277832031, "global_step": 192515, "epoch": 4583} {"train_loss": -7.174342155456543, "global_step": 192516, "epoch": 4583} {"train_loss": -7.172442436218262, "global_step": 192517, "epoch": 4583} {"train_loss": -7.273144721984863, "global_step": 192518, "epoch": 4583} {"train_loss": -7.162708282470703, "global_step": 192519, "epoch": 4583} {"train_loss": -7.2219367027282715, "global_step": 192520, "epoch": 4583} {"train_loss": -7.18632173538208, "global_step": 192521, "epoch": 4583} {"train_loss": -7.252554893493652, "global_step": 192522, "epoch": 4583} {"train_loss": -7.264616012573242, "global_step": 192523, "epoch": 4583} {"train_loss": -7.118625164031982, "global_step": 192524, "epoch": 4583} {"train_loss": -7.31575870513916, "global_step": 192525, "epoch": 4583} {"train_loss": -7.133230209350586, "global_step": 192526, "epoch": 4583} {"train_loss": -7.161928438004994, "global_step": 192527, "epoch": 4583, "val_loss": 69000.734375} {"train_loss": -7.279346466064453, "global_step": 192528, "epoch": 4584} {"train_loss": -7.223903656005859, "global_step": 192529, "epoch": 4584} {"train_loss": -7.176697731018066, "global_step": 192530, "epoch": 4584} {"train_loss": -7.1390275955200195, "global_step": 192531, "epoch": 4584} {"train_loss": -7.208687782287598, "global_step": 192532, "epoch": 4584} {"train_loss": -7.229876518249512, "global_step": 192533, "epoch": 4584} {"train_loss": -7.050718307495117, "global_step": 192534, "epoch": 4584} {"train_loss": -7.092321395874023, "global_step": 192535, "epoch": 4584} {"train_loss": -7.16248893737793, "global_step": 192536, "epoch": 4584} {"train_loss": -6.975059509277344, "global_step": 192537, "epoch": 4584} {"train_loss": -6.954957962036133, "global_step": 192538, "epoch": 4584} {"train_loss": -7.1722025871276855, "global_step": 192539, "epoch": 4584} {"train_loss": -7.0771660804748535, "global_step": 192540, "epoch": 4584} {"train_loss": -7.092317581176758, "global_step": 192541, "epoch": 4584} {"train_loss": -7.21365213394165, "global_step": 192542, "epoch": 4584} {"train_loss": -7.037809371948242, "global_step": 192543, "epoch": 4584} {"train_loss": -7.084407806396484, "global_step": 192544, "epoch": 4584} {"train_loss": -6.934295177459717, "global_step": 192545, "epoch": 4584} {"train_loss": -7.14664363861084, "global_step": 192546, "epoch": 4584} {"train_loss": -7.065445423126221, "global_step": 192547, "epoch": 4584} {"train_loss": -7.153232097625732, "global_step": 192548, "epoch": 4584} {"train_loss": -7.095500946044922, "global_step": 192549, "epoch": 4584} {"train_loss": -7.1625800132751465, "global_step": 192550, "epoch": 4584} {"train_loss": -7.144250869750977, "global_step": 192551, "epoch": 4584} {"train_loss": -7.123288154602051, "global_step": 192552, "epoch": 4584} {"train_loss": -7.154376983642578, "global_step": 192553, "epoch": 4584} {"train_loss": -7.087775230407715, "global_step": 192554, "epoch": 4584} {"train_loss": -7.140688896179199, "global_step": 192555, "epoch": 4584} {"train_loss": -7.300682067871094, "global_step": 192556, "epoch": 4584} {"train_loss": -7.178815841674805, "global_step": 192557, "epoch": 4584} {"train_loss": -7.140659332275391, "global_step": 192558, "epoch": 4584} {"train_loss": -7.163115501403809, "global_step": 192559, "epoch": 4584} {"train_loss": -7.228058815002441, "global_step": 192560, "epoch": 4584} {"train_loss": -7.1319780349731445, "global_step": 192561, "epoch": 4584} {"train_loss": -7.222588062286377, "global_step": 192562, "epoch": 4584} {"train_loss": -7.149722099304199, "global_step": 192563, "epoch": 4584} {"train_loss": -7.185688018798828, "global_step": 192564, "epoch": 4584} {"train_loss": -7.1093549728393555, "global_step": 192565, "epoch": 4584} {"train_loss": -7.248260498046875, "global_step": 192566, "epoch": 4584} {"train_loss": -7.231308937072754, "global_step": 192567, "epoch": 4584} {"train_loss": -7.162391662597656, "global_step": 192568, "epoch": 4584} {"train_loss": -7.141214257194882, "global_step": 192569, "epoch": 4584, "val_loss": 69150.78125} {"train_loss": -7.0641021728515625, "global_step": 192570, "epoch": 4585} {"train_loss": -7.2487473487854, "global_step": 192571, "epoch": 4585} {"train_loss": -7.205738544464111, "global_step": 192572, "epoch": 4585} {"train_loss": -7.069027900695801, "global_step": 192573, "epoch": 4585} {"train_loss": -7.103875160217285, "global_step": 192574, "epoch": 4585} {"train_loss": -7.166018486022949, "global_step": 192575, "epoch": 4585} {"train_loss": -7.2087531089782715, "global_step": 192576, "epoch": 4585} {"train_loss": -7.2855448722839355, "global_step": 192577, "epoch": 4585} {"train_loss": -7.116617202758789, "global_step": 192578, "epoch": 4585} {"train_loss": -7.202175140380859, "global_step": 192579, "epoch": 4585} {"train_loss": -7.191154479980469, "global_step": 192580, "epoch": 4585} {"train_loss": -7.149316787719727, "global_step": 192581, "epoch": 4585} {"train_loss": -7.18865966796875, "global_step": 192582, "epoch": 4585} {"train_loss": -7.221874713897705, "global_step": 192583, "epoch": 4585} {"train_loss": -7.274477005004883, "global_step": 192584, "epoch": 4585} {"train_loss": -7.268333435058594, "global_step": 192585, "epoch": 4585} {"train_loss": -7.181203842163086, "global_step": 192586, "epoch": 4585} {"train_loss": -7.200524806976318, "global_step": 192587, "epoch": 4585} {"train_loss": -7.183677673339844, "global_step": 192588, "epoch": 4585} {"train_loss": -7.141805648803711, "global_step": 192589, "epoch": 4585} {"train_loss": -7.178748607635498, "global_step": 192590, "epoch": 4585} {"train_loss": -7.332735538482666, "global_step": 192591, "epoch": 4585} {"train_loss": -7.223901748657227, "global_step": 192592, "epoch": 4585} {"train_loss": -7.18066930770874, "global_step": 192593, "epoch": 4585} {"train_loss": -7.192914962768555, "global_step": 192594, "epoch": 4585} {"train_loss": -7.1889262199401855, "global_step": 192595, "epoch": 4585} {"train_loss": -7.207861423492432, "global_step": 192596, "epoch": 4585} {"train_loss": -7.170157432556152, "global_step": 192597, "epoch": 4585} {"train_loss": -7.217841148376465, "global_step": 192598, "epoch": 4585} {"train_loss": -7.118935585021973, "global_step": 192599, "epoch": 4585} {"train_loss": -7.182757377624512, "global_step": 192600, "epoch": 4585} {"train_loss": -7.277958869934082, "global_step": 192601, "epoch": 4585} {"train_loss": -7.084839820861816, "global_step": 192602, "epoch": 4585} {"train_loss": -7.090351104736328, "global_step": 192603, "epoch": 4585} {"train_loss": -7.289800643920898, "global_step": 192604, "epoch": 4585} {"train_loss": -7.149613857269287, "global_step": 192605, "epoch": 4585} {"train_loss": -7.187310218811035, "global_step": 192606, "epoch": 4585} {"train_loss": -7.23156213760376, "global_step": 192607, "epoch": 4585} {"train_loss": -7.216939449310303, "global_step": 192608, "epoch": 4585} {"train_loss": -7.082276821136475, "global_step": 192609, "epoch": 4585} {"train_loss": -7.2117719650268555, "global_step": 192610, "epoch": 4585} {"train_loss": -7.186698402677264, "global_step": 192611, "epoch": 4585, "val_loss": 68979.8046875} {"train_loss": -7.071354866027832, "global_step": 192612, "epoch": 4586} {"train_loss": -7.3153815269470215, "global_step": 192613, "epoch": 4586} {"train_loss": -7.1522345542907715, "global_step": 192614, "epoch": 4586} {"train_loss": -7.103433609008789, "global_step": 192615, "epoch": 4586} {"train_loss": -7.190695285797119, "global_step": 192616, "epoch": 4586} {"train_loss": -7.017032146453857, "global_step": 192617, "epoch": 4586} {"train_loss": -7.1657257080078125, "global_step": 192618, "epoch": 4586} {"train_loss": -7.26391077041626, "global_step": 192619, "epoch": 4586} {"train_loss": -7.175723075866699, "global_step": 192620, "epoch": 4586} {"train_loss": -7.148665904998779, "global_step": 192621, "epoch": 4586} {"train_loss": -7.0905914306640625, "global_step": 192622, "epoch": 4586} {"train_loss": -7.161529541015625, "global_step": 192623, "epoch": 4586} {"train_loss": -7.117329120635986, "global_step": 192624, "epoch": 4586} {"train_loss": -7.0778703689575195, "global_step": 192625, "epoch": 4586} {"train_loss": -7.2327423095703125, "global_step": 192626, "epoch": 4586} {"train_loss": -7.116320610046387, "global_step": 192627, "epoch": 4586} {"train_loss": -7.111634731292725, "global_step": 192628, "epoch": 4586} {"train_loss": -7.241837024688721, "global_step": 192629, "epoch": 4586} {"train_loss": -7.099894046783447, "global_step": 192630, "epoch": 4586} {"train_loss": -7.177737236022949, "global_step": 192631, "epoch": 4586} {"train_loss": -7.1796698570251465, "global_step": 192632, "epoch": 4586} {"train_loss": -7.276186943054199, "global_step": 192633, "epoch": 4586} {"train_loss": -7.168076992034912, "global_step": 192634, "epoch": 4586} {"train_loss": -7.161746978759766, "global_step": 192635, "epoch": 4586} {"train_loss": -7.223684310913086, "global_step": 192636, "epoch": 4586} {"train_loss": -7.184372901916504, "global_step": 192637, "epoch": 4586} {"train_loss": -7.035815238952637, "global_step": 192638, "epoch": 4586} {"train_loss": -7.165408611297607, "global_step": 192639, "epoch": 4586} {"train_loss": -7.262248992919922, "global_step": 192640, "epoch": 4586} {"train_loss": -7.160506248474121, "global_step": 192641, "epoch": 4586} {"train_loss": -7.236998558044434, "global_step": 192642, "epoch": 4586} {"train_loss": -7.201436996459961, "global_step": 192643, "epoch": 4586} {"train_loss": -7.1299028396606445, "global_step": 192644, "epoch": 4586} {"train_loss": -7.300316333770752, "global_step": 192645, "epoch": 4586} {"train_loss": -7.16771936416626, "global_step": 192646, "epoch": 4586} {"train_loss": -7.238393306732178, "global_step": 192647, "epoch": 4586} {"train_loss": -7.2484822273254395, "global_step": 192648, "epoch": 4586} {"train_loss": -7.146533012390137, "global_step": 192649, "epoch": 4586} {"train_loss": -7.2462053298950195, "global_step": 192650, "epoch": 4586} {"train_loss": -7.154491424560547, "global_step": 192651, "epoch": 4586} {"train_loss": -7.1687164306640625, "global_step": 192652, "epoch": 4586} {"train_loss": -7.17253988129752, "global_step": 192653, "epoch": 4586, "val_loss": 68829.046875} {"train_loss": -7.213669300079346, "global_step": 192654, "epoch": 4587} {"train_loss": -7.213700294494629, "global_step": 192655, "epoch": 4587} {"train_loss": -7.217957019805908, "global_step": 192656, "epoch": 4587} {"train_loss": -7.14574670791626, "global_step": 192657, "epoch": 4587} {"train_loss": -7.254329681396484, "global_step": 192658, "epoch": 4587} {"train_loss": -7.279290199279785, "global_step": 192659, "epoch": 4587} {"train_loss": -7.086081027984619, "global_step": 192660, "epoch": 4587} {"train_loss": -7.141058921813965, "global_step": 192661, "epoch": 4587} {"train_loss": -7.161807060241699, "global_step": 192662, "epoch": 4587} {"train_loss": -7.194793701171875, "global_step": 192663, "epoch": 4587} {"train_loss": -7.097238540649414, "global_step": 192664, "epoch": 4587} {"train_loss": -7.221497535705566, "global_step": 192665, "epoch": 4587} {"train_loss": -7.066466331481934, "global_step": 192666, "epoch": 4587} {"train_loss": -7.100666046142578, "global_step": 192667, "epoch": 4587} {"train_loss": -7.219203948974609, "global_step": 192668, "epoch": 4587} {"train_loss": -7.190999984741211, "global_step": 192669, "epoch": 4587} {"train_loss": -7.17724609375, "global_step": 192670, "epoch": 4587} {"train_loss": -7.095964431762695, "global_step": 192671, "epoch": 4587} {"train_loss": -7.074278831481934, "global_step": 192672, "epoch": 4587} {"train_loss": -7.110395431518555, "global_step": 192673, "epoch": 4587} {"train_loss": -7.210039138793945, "global_step": 192674, "epoch": 4587} {"train_loss": -7.1386823654174805, "global_step": 192675, "epoch": 4587} {"train_loss": -7.22726583480835, "global_step": 192676, "epoch": 4587} {"train_loss": -7.129673957824707, "global_step": 192677, "epoch": 4587} {"train_loss": -7.23310661315918, "global_step": 192678, "epoch": 4587} {"train_loss": -7.120604515075684, "global_step": 192679, "epoch": 4587} {"train_loss": -7.146203994750977, "global_step": 192680, "epoch": 4587} {"train_loss": -7.252209663391113, "global_step": 192681, "epoch": 4587} {"train_loss": -7.161174297332764, "global_step": 192682, "epoch": 4587} {"train_loss": -7.183819770812988, "global_step": 192683, "epoch": 4587} {"train_loss": -7.213932514190674, "global_step": 192684, "epoch": 4587} {"train_loss": -7.143734455108643, "global_step": 192685, "epoch": 4587} {"train_loss": -7.242281913757324, "global_step": 192686, "epoch": 4587} {"train_loss": -7.192178249359131, "global_step": 192687, "epoch": 4587} {"train_loss": -7.284885406494141, "global_step": 192688, "epoch": 4587} {"train_loss": -7.074955940246582, "global_step": 192689, "epoch": 4587} {"train_loss": -7.111777305603027, "global_step": 192690, "epoch": 4587} {"train_loss": -7.213102340698242, "global_step": 192691, "epoch": 4587} {"train_loss": -7.189463138580322, "global_step": 192692, "epoch": 4587} {"train_loss": -7.169545650482178, "global_step": 192693, "epoch": 4587} {"train_loss": -7.243707656860352, "global_step": 192694, "epoch": 4587} {"train_loss": -7.1724062987736295, "global_step": 192695, "epoch": 4587, "val_loss": 68964.8984375} {"train_loss": -7.139922142028809, "global_step": 192696, "epoch": 4588} {"train_loss": -7.153472900390625, "global_step": 192697, "epoch": 4588} {"train_loss": -7.236381530761719, "global_step": 192698, "epoch": 4588} {"train_loss": -7.204169750213623, "global_step": 192699, "epoch": 4588} {"train_loss": -7.253701210021973, "global_step": 192700, "epoch": 4588} {"train_loss": -7.239206314086914, "global_step": 192701, "epoch": 4588} {"train_loss": -7.098140239715576, "global_step": 192702, "epoch": 4588} {"train_loss": -7.178403377532959, "global_step": 192703, "epoch": 4588} {"train_loss": -7.21791934967041, "global_step": 192704, "epoch": 4588} {"train_loss": -7.320499420166016, "global_step": 192705, "epoch": 4588} {"train_loss": -7.180663108825684, "global_step": 192706, "epoch": 4588} {"train_loss": -7.2063727378845215, "global_step": 192707, "epoch": 4588} {"train_loss": -7.1917338371276855, "global_step": 192708, "epoch": 4588} {"train_loss": -7.348134994506836, "global_step": 192709, "epoch": 4588} {"train_loss": -7.208530426025391, "global_step": 192710, "epoch": 4588} {"train_loss": -7.195788383483887, "global_step": 192711, "epoch": 4588} {"train_loss": -7.3042988777160645, "global_step": 192712, "epoch": 4588} {"train_loss": -7.219813823699951, "global_step": 192713, "epoch": 4588} {"train_loss": -7.28493070602417, "global_step": 192714, "epoch": 4588} {"train_loss": -7.189854145050049, "global_step": 192715, "epoch": 4588} {"train_loss": -7.2396039962768555, "global_step": 192716, "epoch": 4588} {"train_loss": -7.281558036804199, "global_step": 192717, "epoch": 4588} {"train_loss": -7.279666900634766, "global_step": 192718, "epoch": 4588} {"train_loss": -7.265113830566406, "global_step": 192719, "epoch": 4588} {"train_loss": -7.109811782836914, "global_step": 192720, "epoch": 4588} {"train_loss": -7.333197593688965, "global_step": 192721, "epoch": 4588} {"train_loss": -7.306334972381592, "global_step": 192722, "epoch": 4588} {"train_loss": -7.181680679321289, "global_step": 192723, "epoch": 4588} {"train_loss": -7.1968994140625, "global_step": 192724, "epoch": 4588} {"train_loss": -7.139651298522949, "global_step": 192725, "epoch": 4588} {"train_loss": -7.199261665344238, "global_step": 192726, "epoch": 4588} {"train_loss": -7.248941898345947, "global_step": 192727, "epoch": 4588} {"train_loss": -7.186429977416992, "global_step": 192728, "epoch": 4588} {"train_loss": -7.080825328826904, "global_step": 192729, "epoch": 4588} {"train_loss": -7.135130882263184, "global_step": 192730, "epoch": 4588} {"train_loss": -7.230459213256836, "global_step": 192731, "epoch": 4588} {"train_loss": -7.094788551330566, "global_step": 192732, "epoch": 4588} {"train_loss": -7.09152889251709, "global_step": 192733, "epoch": 4588} {"train_loss": -7.246181964874268, "global_step": 192734, "epoch": 4588} {"train_loss": -7.085850238800049, "global_step": 192735, "epoch": 4588} {"train_loss": -6.925100326538086, "global_step": 192736, "epoch": 4588} {"train_loss": -7.197337343579247, "global_step": 192737, "epoch": 4588, "val_loss": 68910.03125} {"train_loss": -7.106444358825684, "global_step": 192738, "epoch": 4589} {"train_loss": -6.994319438934326, "global_step": 192739, "epoch": 4589} {"train_loss": -7.070184707641602, "global_step": 192740, "epoch": 4589} {"train_loss": -7.065530776977539, "global_step": 192741, "epoch": 4589} {"train_loss": -7.119061470031738, "global_step": 192742, "epoch": 4589} {"train_loss": -7.118610382080078, "global_step": 192743, "epoch": 4589} {"train_loss": -6.9893999099731445, "global_step": 192744, "epoch": 4589} {"train_loss": -6.992340087890625, "global_step": 192745, "epoch": 4589} {"train_loss": -6.8441033363342285, "global_step": 192746, "epoch": 4589} {"train_loss": -7.058085918426514, "global_step": 192747, "epoch": 4589} {"train_loss": -7.059562683105469, "global_step": 192748, "epoch": 4589} {"train_loss": -7.088386535644531, "global_step": 192749, "epoch": 4589} {"train_loss": -7.051348686218262, "global_step": 192750, "epoch": 4589} {"train_loss": -6.986062049865723, "global_step": 192751, "epoch": 4589} {"train_loss": -7.069427013397217, "global_step": 192752, "epoch": 4589} {"train_loss": -6.789314270019531, "global_step": 192753, "epoch": 4589} {"train_loss": -7.136185169219971, "global_step": 192754, "epoch": 4589} {"train_loss": -6.828402519226074, "global_step": 192755, "epoch": 4589} {"train_loss": -7.056777477264404, "global_step": 192756, "epoch": 4589} {"train_loss": -7.001795768737793, "global_step": 192757, "epoch": 4589} {"train_loss": -7.030971527099609, "global_step": 192758, "epoch": 4589} {"train_loss": -7.217806816101074, "global_step": 192759, "epoch": 4589} {"train_loss": -7.08970832824707, "global_step": 192760, "epoch": 4589} {"train_loss": -7.152430534362793, "global_step": 192761, "epoch": 4589} {"train_loss": -6.9121856689453125, "global_step": 192762, "epoch": 4589} {"train_loss": -7.136115074157715, "global_step": 192763, "epoch": 4589} {"train_loss": -7.000826835632324, "global_step": 192764, "epoch": 4589} {"train_loss": -7.219836711883545, "global_step": 192765, "epoch": 4589} {"train_loss": -6.915199279785156, "global_step": 192766, "epoch": 4589} {"train_loss": -7.077353477478027, "global_step": 192767, "epoch": 4589} {"train_loss": -7.074748516082764, "global_step": 192768, "epoch": 4589} {"train_loss": -7.207513809204102, "global_step": 192769, "epoch": 4589} {"train_loss": -7.135219573974609, "global_step": 192770, "epoch": 4589} {"train_loss": -7.164682865142822, "global_step": 192771, "epoch": 4589} {"train_loss": -7.117210388183594, "global_step": 192772, "epoch": 4589} {"train_loss": -7.036296844482422, "global_step": 192773, "epoch": 4589} {"train_loss": -7.164794921875, "global_step": 192774, "epoch": 4589} {"train_loss": -6.9152092933654785, "global_step": 192775, "epoch": 4589} {"train_loss": -7.121558666229248, "global_step": 192776, "epoch": 4589} {"train_loss": -7.235649108886719, "global_step": 192777, "epoch": 4589} {"train_loss": -7.029144287109375, "global_step": 192778, "epoch": 4589} {"train_loss": -7.060185205368769, "global_step": 192779, "epoch": 4589, "val_loss": 68897.0546875} {"train_loss": -7.046348571777344, "global_step": 192780, "epoch": 4590} {"train_loss": -7.275023460388184, "global_step": 192781, "epoch": 4590} {"train_loss": -7.177801132202148, "global_step": 192782, "epoch": 4590} {"train_loss": -7.138155460357666, "global_step": 192783, "epoch": 4590} {"train_loss": -7.184149742126465, "global_step": 192784, "epoch": 4590} {"train_loss": -7.228112697601318, "global_step": 192785, "epoch": 4590} {"train_loss": -7.164150238037109, "global_step": 192786, "epoch": 4590} {"train_loss": -7.092269420623779, "global_step": 192787, "epoch": 4590} {"train_loss": -7.218256950378418, "global_step": 192788, "epoch": 4590} {"train_loss": -7.197710037231445, "global_step": 192789, "epoch": 4590} {"train_loss": -7.104005813598633, "global_step": 192790, "epoch": 4590} {"train_loss": -7.074697017669678, "global_step": 192791, "epoch": 4590} {"train_loss": -7.2218708992004395, "global_step": 192792, "epoch": 4590} {"train_loss": -7.264186859130859, "global_step": 192793, "epoch": 4590} {"train_loss": -7.187647342681885, "global_step": 192794, "epoch": 4590} {"train_loss": -7.188826560974121, "global_step": 192795, "epoch": 4590} {"train_loss": -7.2393059730529785, "global_step": 192796, "epoch": 4590} {"train_loss": -7.191492557525635, "global_step": 192797, "epoch": 4590} {"train_loss": -7.18246603012085, "global_step": 192798, "epoch": 4590} {"train_loss": -7.1740312576293945, "global_step": 192799, "epoch": 4590} {"train_loss": -7.285545825958252, "global_step": 192800, "epoch": 4590} {"train_loss": -7.1288862228393555, "global_step": 192801, "epoch": 4590} {"train_loss": -7.196465492248535, "global_step": 192802, "epoch": 4590} {"train_loss": -7.229643821716309, "global_step": 192803, "epoch": 4590} {"train_loss": -7.2079291343688965, "global_step": 192804, "epoch": 4590} {"train_loss": -7.2108612060546875, "global_step": 192805, "epoch": 4590} {"train_loss": -7.231577396392822, "global_step": 192806, "epoch": 4590} {"train_loss": -7.2093048095703125, "global_step": 192807, "epoch": 4590} {"train_loss": -7.199345111846924, "global_step": 192808, "epoch": 4590} {"train_loss": -7.152482509613037, "global_step": 192809, "epoch": 4590} {"train_loss": -7.208021640777588, "global_step": 192810, "epoch": 4590} {"train_loss": -7.262434959411621, "global_step": 192811, "epoch": 4590} {"train_loss": -7.051324844360352, "global_step": 192812, "epoch": 4590} {"train_loss": -7.170901775360107, "global_step": 192813, "epoch": 4590} {"train_loss": -7.171452522277832, "global_step": 192814, "epoch": 4590} {"train_loss": -7.056454658508301, "global_step": 192815, "epoch": 4590} {"train_loss": -7.06765079498291, "global_step": 192816, "epoch": 4590} {"train_loss": -7.195943355560303, "global_step": 192817, "epoch": 4590} {"train_loss": -7.139471054077148, "global_step": 192818, "epoch": 4590} {"train_loss": -7.12286376953125, "global_step": 192819, "epoch": 4590} {"train_loss": -7.026304244995117, "global_step": 192820, "epoch": 4590} {"train_loss": -7.170809689022246, "global_step": 192821, "epoch": 4590, "val_loss": 69113.515625} {"train_loss": -7.1400346755981445, "global_step": 192822, "epoch": 4591} {"train_loss": -7.0579938888549805, "global_step": 192823, "epoch": 4591} {"train_loss": -7.1533660888671875, "global_step": 192824, "epoch": 4591} {"train_loss": -7.132754325866699, "global_step": 192825, "epoch": 4591} {"train_loss": -7.11779260635376, "global_step": 192826, "epoch": 4591} {"train_loss": -7.154303073883057, "global_step": 192827, "epoch": 4591} {"train_loss": -7.096753120422363, "global_step": 192828, "epoch": 4591} {"train_loss": -7.171337604522705, "global_step": 192829, "epoch": 4591} {"train_loss": -7.12582540512085, "global_step": 192830, "epoch": 4591} {"train_loss": -7.12410831451416, "global_step": 192831, "epoch": 4591} {"train_loss": -7.081712245941162, "global_step": 192832, "epoch": 4591} {"train_loss": -7.176205635070801, "global_step": 192833, "epoch": 4591} {"train_loss": -7.179287910461426, "global_step": 192834, "epoch": 4591} {"train_loss": -7.121448993682861, "global_step": 192835, "epoch": 4591} {"train_loss": -7.1912946701049805, "global_step": 192836, "epoch": 4591} {"train_loss": -7.080684661865234, "global_step": 192837, "epoch": 4591} {"train_loss": -7.057124137878418, "global_step": 192838, "epoch": 4591} {"train_loss": -7.1293816566467285, "global_step": 192839, "epoch": 4591} {"train_loss": -7.165694236755371, "global_step": 192840, "epoch": 4591} {"train_loss": -7.1042280197143555, "global_step": 192841, "epoch": 4591} {"train_loss": -7.064045429229736, "global_step": 192842, "epoch": 4591} {"train_loss": -7.144970893859863, "global_step": 192843, "epoch": 4591} {"train_loss": -7.236166000366211, "global_step": 192844, "epoch": 4591} {"train_loss": -7.118969917297363, "global_step": 192845, "epoch": 4591} {"train_loss": -7.0981340408325195, "global_step": 192846, "epoch": 4591} {"train_loss": -7.081346035003662, "global_step": 192847, "epoch": 4591} {"train_loss": -7.0490288734436035, "global_step": 192848, "epoch": 4591} {"train_loss": -6.969699382781982, "global_step": 192849, "epoch": 4591} {"train_loss": -6.994298934936523, "global_step": 192850, "epoch": 4591} {"train_loss": -7.167159080505371, "global_step": 192851, "epoch": 4591} {"train_loss": -7.147751331329346, "global_step": 192852, "epoch": 4591} {"train_loss": -7.074509620666504, "global_step": 192853, "epoch": 4591} {"train_loss": -7.184056282043457, "global_step": 192854, "epoch": 4591} {"train_loss": -7.025995254516602, "global_step": 192855, "epoch": 4591} {"train_loss": -7.174642562866211, "global_step": 192856, "epoch": 4591} {"train_loss": -7.076485633850098, "global_step": 192857, "epoch": 4591} {"train_loss": -7.167452335357666, "global_step": 192858, "epoch": 4591} {"train_loss": -7.0835723876953125, "global_step": 192859, "epoch": 4591} {"train_loss": -7.055172443389893, "global_step": 192860, "epoch": 4591} {"train_loss": -7.030622482299805, "global_step": 192861, "epoch": 4591} {"train_loss": -7.199927806854248, "global_step": 192862, "epoch": 4591} {"train_loss": -7.11672534261431, "global_step": 192863, "epoch": 4591, "val_loss": 68893.8203125} {"train_loss": -7.156601905822754, "global_step": 192864, "epoch": 4592} {"train_loss": -7.300111770629883, "global_step": 192865, "epoch": 4592} {"train_loss": -7.246585845947266, "global_step": 192866, "epoch": 4592} {"train_loss": -7.049905300140381, "global_step": 192867, "epoch": 4592} {"train_loss": -7.0949296951293945, "global_step": 192868, "epoch": 4592} {"train_loss": -7.19476318359375, "global_step": 192869, "epoch": 4592} {"train_loss": -7.159485816955566, "global_step": 192870, "epoch": 4592} {"train_loss": -7.219310760498047, "global_step": 192871, "epoch": 4592} {"train_loss": -7.105719566345215, "global_step": 192872, "epoch": 4592} {"train_loss": -7.140615940093994, "global_step": 192873, "epoch": 4592} {"train_loss": -7.129430770874023, "global_step": 192874, "epoch": 4592} {"train_loss": -7.250648498535156, "global_step": 192875, "epoch": 4592} {"train_loss": -7.206936359405518, "global_step": 192876, "epoch": 4592} {"train_loss": -7.059058666229248, "global_step": 192877, "epoch": 4592} {"train_loss": -7.191646575927734, "global_step": 192878, "epoch": 4592} {"train_loss": -7.177703857421875, "global_step": 192879, "epoch": 4592} {"train_loss": -7.188473701477051, "global_step": 192880, "epoch": 4592} {"train_loss": -7.242169380187988, "global_step": 192881, "epoch": 4592} {"train_loss": -7.184114456176758, "global_step": 192882, "epoch": 4592} {"train_loss": -7.155274391174316, "global_step": 192883, "epoch": 4592} {"train_loss": -7.1522216796875, "global_step": 192884, "epoch": 4592} {"train_loss": -7.081191539764404, "global_step": 192885, "epoch": 4592} {"train_loss": -7.146295547485352, "global_step": 192886, "epoch": 4592} {"train_loss": -7.120532035827637, "global_step": 192887, "epoch": 4592} {"train_loss": -7.1369781494140625, "global_step": 192888, "epoch": 4592} {"train_loss": -7.221500396728516, "global_step": 192889, "epoch": 4592} {"train_loss": -7.201035022735596, "global_step": 192890, "epoch": 4592} {"train_loss": -7.098369598388672, "global_step": 192891, "epoch": 4592} {"train_loss": -7.1232523918151855, "global_step": 192892, "epoch": 4592} {"train_loss": -7.131803512573242, "global_step": 192893, "epoch": 4592} {"train_loss": -7.237915992736816, "global_step": 192894, "epoch": 4592} {"train_loss": -7.152848720550537, "global_step": 192895, "epoch": 4592} {"train_loss": -7.171165466308594, "global_step": 192896, "epoch": 4592} {"train_loss": -7.1211700439453125, "global_step": 192897, "epoch": 4592} {"train_loss": -7.074991226196289, "global_step": 192898, "epoch": 4592} {"train_loss": -7.279630661010742, "global_step": 192899, "epoch": 4592} {"train_loss": -7.147181510925293, "global_step": 192900, "epoch": 4592} {"train_loss": -7.22211217880249, "global_step": 192901, "epoch": 4592} {"train_loss": -7.227108001708984, "global_step": 192902, "epoch": 4592} {"train_loss": -7.127278804779053, "global_step": 192903, "epoch": 4592} {"train_loss": -7.093768119812012, "global_step": 192904, "epoch": 4592} {"train_loss": -7.1663036687033514, "global_step": 192905, "epoch": 4592, "val_loss": 69105.890625} {"train_loss": -7.005945205688477, "global_step": 192906, "epoch": 4593} {"train_loss": -7.081772804260254, "global_step": 192907, "epoch": 4593} {"train_loss": -7.085615158081055, "global_step": 192908, "epoch": 4593} {"train_loss": -7.010529518127441, "global_step": 192909, "epoch": 4593} {"train_loss": -7.165539741516113, "global_step": 192910, "epoch": 4593} {"train_loss": -7.1022491455078125, "global_step": 192911, "epoch": 4593} {"train_loss": -7.070837497711182, "global_step": 192912, "epoch": 4593} {"train_loss": -7.115963935852051, "global_step": 192913, "epoch": 4593} {"train_loss": -7.088043689727783, "global_step": 192914, "epoch": 4593} {"train_loss": -7.182667255401611, "global_step": 192915, "epoch": 4593} {"train_loss": -7.237182140350342, "global_step": 192916, "epoch": 4593} {"train_loss": -7.144988536834717, "global_step": 192917, "epoch": 4593} {"train_loss": -7.207650661468506, "global_step": 192918, "epoch": 4593} {"train_loss": -7.131497859954834, "global_step": 192919, "epoch": 4593} {"train_loss": -7.159600257873535, "global_step": 192920, "epoch": 4593} {"train_loss": -7.361043453216553, "global_step": 192921, "epoch": 4593} {"train_loss": -7.199649810791016, "global_step": 192922, "epoch": 4593} {"train_loss": -7.125088214874268, "global_step": 192923, "epoch": 4593} {"train_loss": -7.140547275543213, "global_step": 192924, "epoch": 4593} {"train_loss": -7.275548458099365, "global_step": 192925, "epoch": 4593} {"train_loss": -7.086239337921143, "global_step": 192926, "epoch": 4593} {"train_loss": -7.208085060119629, "global_step": 192927, "epoch": 4593} {"train_loss": -7.200845718383789, "global_step": 192928, "epoch": 4593} {"train_loss": -7.23214054107666, "global_step": 192929, "epoch": 4593} {"train_loss": -7.306724548339844, "global_step": 192930, "epoch": 4593} {"train_loss": -7.219904899597168, "global_step": 192931, "epoch": 4593} {"train_loss": -7.214930534362793, "global_step": 192932, "epoch": 4593} {"train_loss": -7.248773574829102, "global_step": 192933, "epoch": 4593} {"train_loss": -7.247056484222412, "global_step": 192934, "epoch": 4593} {"train_loss": -7.196683406829834, "global_step": 192935, "epoch": 4593} {"train_loss": -7.2181782722473145, "global_step": 192936, "epoch": 4593} {"train_loss": -7.161491394042969, "global_step": 192937, "epoch": 4593} {"train_loss": -7.201173782348633, "global_step": 192938, "epoch": 4593} {"train_loss": -7.292442321777344, "global_step": 192939, "epoch": 4593} {"train_loss": -7.09451150894165, "global_step": 192940, "epoch": 4593} {"train_loss": -7.18431282043457, "global_step": 192941, "epoch": 4593} {"train_loss": -7.195501327514648, "global_step": 192942, "epoch": 4593} {"train_loss": -7.299841403961182, "global_step": 192943, "epoch": 4593} {"train_loss": -7.249203681945801, "global_step": 192944, "epoch": 4593} {"train_loss": -7.254075050354004, "global_step": 192945, "epoch": 4593} {"train_loss": -7.229334831237793, "global_step": 192946, "epoch": 4593} {"train_loss": -7.180395898364839, "global_step": 192947, "epoch": 4593, "val_loss": 68845.1796875} {"train_loss": -7.322553634643555, "global_step": 192948, "epoch": 4594} {"train_loss": -7.221511363983154, "global_step": 192949, "epoch": 4594} {"train_loss": -7.27521276473999, "global_step": 192950, "epoch": 4594} {"train_loss": -7.190666198730469, "global_step": 192951, "epoch": 4594} {"train_loss": -7.006837844848633, "global_step": 192952, "epoch": 4594} {"train_loss": -7.414106369018555, "global_step": 192953, "epoch": 4594} {"train_loss": -7.194709777832031, "global_step": 192954, "epoch": 4594} {"train_loss": -7.211584568023682, "global_step": 192955, "epoch": 4594} {"train_loss": -7.242523670196533, "global_step": 192956, "epoch": 4594} {"train_loss": -7.227924346923828, "global_step": 192957, "epoch": 4594} {"train_loss": -7.184154033660889, "global_step": 192958, "epoch": 4594} {"train_loss": -7.141056060791016, "global_step": 192959, "epoch": 4594} {"train_loss": -7.093313217163086, "global_step": 192960, "epoch": 4594} {"train_loss": -7.162758827209473, "global_step": 192961, "epoch": 4594} {"train_loss": -7.267995357513428, "global_step": 192962, "epoch": 4594} {"train_loss": -7.171689987182617, "global_step": 192963, "epoch": 4594} {"train_loss": -7.160738945007324, "global_step": 192964, "epoch": 4594} {"train_loss": -7.197628974914551, "global_step": 192965, "epoch": 4594} {"train_loss": -7.229861259460449, "global_step": 192966, "epoch": 4594} {"train_loss": -7.258665084838867, "global_step": 192967, "epoch": 4594} {"train_loss": -7.173858165740967, "global_step": 192968, "epoch": 4594} {"train_loss": -7.284646034240723, "global_step": 192969, "epoch": 4594} {"train_loss": -7.261173725128174, "global_step": 192970, "epoch": 4594} {"train_loss": -7.119707107543945, "global_step": 192971, "epoch": 4594} {"train_loss": -7.2533087730407715, "global_step": 192972, "epoch": 4594} {"train_loss": -7.170198917388916, "global_step": 192973, "epoch": 4594} {"train_loss": -7.087068557739258, "global_step": 192974, "epoch": 4594} {"train_loss": -7.241379737854004, "global_step": 192975, "epoch": 4594} {"train_loss": -7.221548080444336, "global_step": 192976, "epoch": 4594} {"train_loss": -7.211173057556152, "global_step": 192977, "epoch": 4594} {"train_loss": -7.285427093505859, "global_step": 192978, "epoch": 4594} {"train_loss": -7.160066604614258, "global_step": 192979, "epoch": 4594} {"train_loss": -7.2141523361206055, "global_step": 192980, "epoch": 4594} {"train_loss": -7.1412882804870605, "global_step": 192981, "epoch": 4594} {"train_loss": -7.165907859802246, "global_step": 192982, "epoch": 4594} {"train_loss": -7.190397262573242, "global_step": 192983, "epoch": 4594} {"train_loss": -7.209836959838867, "global_step": 192984, "epoch": 4594} {"train_loss": -7.200317859649658, "global_step": 192985, "epoch": 4594} {"train_loss": -7.036971092224121, "global_step": 192986, "epoch": 4594} {"train_loss": -7.194103240966797, "global_step": 192987, "epoch": 4594} {"train_loss": -7.065583229064941, "global_step": 192988, "epoch": 4594} {"train_loss": -7.194540886651902, "global_step": 192989, "epoch": 4594, "val_loss": 69147.5390625} {"train_loss": -7.317434310913086, "global_step": 192990, "epoch": 4595} {"train_loss": -7.270745277404785, "global_step": 192991, "epoch": 4595} {"train_loss": -7.230116367340088, "global_step": 192992, "epoch": 4595} {"train_loss": -7.259925842285156, "global_step": 192993, "epoch": 4595} {"train_loss": -7.255743026733398, "global_step": 192994, "epoch": 4595} {"train_loss": -7.066998481750488, "global_step": 192995, "epoch": 4595} {"train_loss": -7.134309768676758, "global_step": 192996, "epoch": 4595} {"train_loss": -7.136157989501953, "global_step": 192997, "epoch": 4595} {"train_loss": -7.1818413734436035, "global_step": 192998, "epoch": 4595} {"train_loss": -7.19779109954834, "global_step": 192999, "epoch": 4595} {"train_loss": -7.24465274810791, "global_step": 193000, "epoch": 4595} {"train_loss": -7.193875312805176, "global_step": 193001, "epoch": 4595} {"train_loss": -7.152894973754883, "global_step": 193002, "epoch": 4595} {"train_loss": -7.107784271240234, "global_step": 193003, "epoch": 4595} {"train_loss": -7.314815998077393, "global_step": 193004, "epoch": 4595} {"train_loss": -7.14501953125, "global_step": 193005, "epoch": 4595} {"train_loss": -7.116125106811523, "global_step": 193006, "epoch": 4595} {"train_loss": -7.232334136962891, "global_step": 193007, "epoch": 4595} {"train_loss": -7.1414875984191895, "global_step": 193008, "epoch": 4595} {"train_loss": -7.142268180847168, "global_step": 193009, "epoch": 4595} {"train_loss": -7.249773025512695, "global_step": 193010, "epoch": 4595} {"train_loss": -7.171937942504883, "global_step": 193011, "epoch": 4595} {"train_loss": -7.164022922515869, "global_step": 193012, "epoch": 4595} {"train_loss": -7.20955753326416, "global_step": 193013, "epoch": 4595} {"train_loss": -7.0863871574401855, "global_step": 193014, "epoch": 4595} {"train_loss": -7.189558506011963, "global_step": 193015, "epoch": 4595} {"train_loss": -7.19102144241333, "global_step": 193016, "epoch": 4595} {"train_loss": -7.146922588348389, "global_step": 193017, "epoch": 4595} {"train_loss": -7.232871055603027, "global_step": 193018, "epoch": 4595} {"train_loss": -7.1705851554870605, "global_step": 193019, "epoch": 4595} {"train_loss": -7.121831893920898, "global_step": 193020, "epoch": 4595} {"train_loss": -7.264437198638916, "global_step": 193021, "epoch": 4595} {"train_loss": -7.222769737243652, "global_step": 193022, "epoch": 4595} {"train_loss": -7.177656650543213, "global_step": 193023, "epoch": 4595} {"train_loss": -7.222333908081055, "global_step": 193024, "epoch": 4595} {"train_loss": -7.18526554107666, "global_step": 193025, "epoch": 4595} {"train_loss": -7.077147483825684, "global_step": 193026, "epoch": 4595} {"train_loss": -7.159731864929199, "global_step": 193027, "epoch": 4595} {"train_loss": -7.226178169250488, "global_step": 193028, "epoch": 4595} {"train_loss": -7.235790252685547, "global_step": 193029, "epoch": 4595} {"train_loss": -7.266903400421143, "global_step": 193030, "epoch": 4595} {"train_loss": -7.185494388852801, "global_step": 193031, "epoch": 4595, "val_loss": 69049.3515625} {"train_loss": -7.149052619934082, "global_step": 193032, "epoch": 4596} {"train_loss": -7.069187164306641, "global_step": 193033, "epoch": 4596} {"train_loss": -6.964698314666748, "global_step": 193034, "epoch": 4596} {"train_loss": -7.127357482910156, "global_step": 193035, "epoch": 4596} {"train_loss": -7.150527000427246, "global_step": 193036, "epoch": 4596} {"train_loss": -7.106175899505615, "global_step": 193037, "epoch": 4596} {"train_loss": -7.124650955200195, "global_step": 193038, "epoch": 4596} {"train_loss": -7.221339225769043, "global_step": 193039, "epoch": 4596} {"train_loss": -7.061298847198486, "global_step": 193040, "epoch": 4596} {"train_loss": -7.116665840148926, "global_step": 193041, "epoch": 4596} {"train_loss": -7.043092250823975, "global_step": 193042, "epoch": 4596} {"train_loss": -7.065472602844238, "global_step": 193043, "epoch": 4596} {"train_loss": -7.17840576171875, "global_step": 193044, "epoch": 4596} {"train_loss": -7.158202648162842, "global_step": 193045, "epoch": 4596} {"train_loss": -7.148819446563721, "global_step": 193046, "epoch": 4596} {"train_loss": -7.199702262878418, "global_step": 193047, "epoch": 4596} {"train_loss": -7.069420337677002, "global_step": 193048, "epoch": 4596} {"train_loss": -7.162103652954102, "global_step": 193049, "epoch": 4596} {"train_loss": -7.085994720458984, "global_step": 193050, "epoch": 4596} {"train_loss": -7.163131237030029, "global_step": 193051, "epoch": 4596} {"train_loss": -7.2802324295043945, "global_step": 193052, "epoch": 4596} {"train_loss": -7.234921455383301, "global_step": 193053, "epoch": 4596} {"train_loss": -7.162848472595215, "global_step": 193054, "epoch": 4596} {"train_loss": -7.113602638244629, "global_step": 193055, "epoch": 4596} {"train_loss": -7.219220161437988, "global_step": 193056, "epoch": 4596} {"train_loss": -7.206916809082031, "global_step": 193057, "epoch": 4596} {"train_loss": -7.226881980895996, "global_step": 193058, "epoch": 4596} {"train_loss": -7.293854236602783, "global_step": 193059, "epoch": 4596} {"train_loss": -7.215978622436523, "global_step": 193060, "epoch": 4596} {"train_loss": -7.226876258850098, "global_step": 193061, "epoch": 4596} {"train_loss": -7.193082809448242, "global_step": 193062, "epoch": 4596} {"train_loss": -7.213965892791748, "global_step": 193063, "epoch": 4596} {"train_loss": -7.206055164337158, "global_step": 193064, "epoch": 4596} {"train_loss": -7.212507247924805, "global_step": 193065, "epoch": 4596} {"train_loss": -7.191074848175049, "global_step": 193066, "epoch": 4596} {"train_loss": -7.29932165145874, "global_step": 193067, "epoch": 4596} {"train_loss": -7.090193748474121, "global_step": 193068, "epoch": 4596} {"train_loss": -7.318258762359619, "global_step": 193069, "epoch": 4596} {"train_loss": -7.317126750946045, "global_step": 193070, "epoch": 4596} {"train_loss": -7.129220962524414, "global_step": 193071, "epoch": 4596} {"train_loss": -7.2264404296875, "global_step": 193072, "epoch": 4596} {"train_loss": -7.173761118026007, "global_step": 193073, "epoch": 4596, "val_loss": 68988.3203125} {"train_loss": -7.327801704406738, "global_step": 193074, "epoch": 4597} {"train_loss": -7.230344772338867, "global_step": 193075, "epoch": 4597} {"train_loss": -7.182355880737305, "global_step": 193076, "epoch": 4597} {"train_loss": -7.057807922363281, "global_step": 193077, "epoch": 4597} {"train_loss": -7.254604339599609, "global_step": 193078, "epoch": 4597} {"train_loss": -7.253382682800293, "global_step": 193079, "epoch": 4597} {"train_loss": -7.136736869812012, "global_step": 193080, "epoch": 4597} {"train_loss": -7.042827606201172, "global_step": 193081, "epoch": 4597} {"train_loss": -7.284074306488037, "global_step": 193082, "epoch": 4597} {"train_loss": -7.1044230461120605, "global_step": 193083, "epoch": 4597} {"train_loss": -7.075015068054199, "global_step": 193084, "epoch": 4597} {"train_loss": -7.261321067810059, "global_step": 193085, "epoch": 4597} {"train_loss": -7.00244140625, "global_step": 193086, "epoch": 4597} {"train_loss": -7.227511405944824, "global_step": 193087, "epoch": 4597} {"train_loss": -7.210033416748047, "global_step": 193088, "epoch": 4597} {"train_loss": -7.113250732421875, "global_step": 193089, "epoch": 4597} {"train_loss": -7.211153030395508, "global_step": 193090, "epoch": 4597} {"train_loss": -7.1601176261901855, "global_step": 193091, "epoch": 4597} {"train_loss": -7.190361499786377, "global_step": 193092, "epoch": 4597} {"train_loss": -7.058300018310547, "global_step": 193093, "epoch": 4597} {"train_loss": -7.07167911529541, "global_step": 193094, "epoch": 4597} {"train_loss": -7.1638078689575195, "global_step": 193095, "epoch": 4597} {"train_loss": -7.274247169494629, "global_step": 193096, "epoch": 4597} {"train_loss": -7.1116180419921875, "global_step": 193097, "epoch": 4597} {"train_loss": -6.971700191497803, "global_step": 193098, "epoch": 4597} {"train_loss": -7.198902130126953, "global_step": 193099, "epoch": 4597} {"train_loss": -7.0102458000183105, "global_step": 193100, "epoch": 4597} {"train_loss": -7.189241409301758, "global_step": 193101, "epoch": 4597} {"train_loss": -7.156351566314697, "global_step": 193102, "epoch": 4597} {"train_loss": -7.18477725982666, "global_step": 193103, "epoch": 4597} {"train_loss": -7.10064697265625, "global_step": 193104, "epoch": 4597} {"train_loss": -7.097922325134277, "global_step": 193105, "epoch": 4597} {"train_loss": -7.1825480461120605, "global_step": 193106, "epoch": 4597} {"train_loss": -7.272561073303223, "global_step": 193107, "epoch": 4597} {"train_loss": -7.181339263916016, "global_step": 193108, "epoch": 4597} {"train_loss": -7.103868007659912, "global_step": 193109, "epoch": 4597} {"train_loss": -7.2294158935546875, "global_step": 193110, "epoch": 4597} {"train_loss": -7.117702007293701, "global_step": 193111, "epoch": 4597} {"train_loss": -7.115211009979248, "global_step": 193112, "epoch": 4597} {"train_loss": -7.201760292053223, "global_step": 193113, "epoch": 4597} {"train_loss": -7.128171443939209, "global_step": 193114, "epoch": 4597} {"train_loss": -7.155244225547428, "global_step": 193115, "epoch": 4597, "val_loss": 69085.859375} {"train_loss": -7.1793036460876465, "global_step": 193116, "epoch": 4598} {"train_loss": -7.081533908843994, "global_step": 193117, "epoch": 4598} {"train_loss": -7.036558151245117, "global_step": 193118, "epoch": 4598} {"train_loss": -7.159395217895508, "global_step": 193119, "epoch": 4598} {"train_loss": -7.162663459777832, "global_step": 193120, "epoch": 4598} {"train_loss": -7.208124160766602, "global_step": 193121, "epoch": 4598} {"train_loss": -7.165191650390625, "global_step": 193122, "epoch": 4598} {"train_loss": -7.093818664550781, "global_step": 193123, "epoch": 4598} {"train_loss": -7.107820510864258, "global_step": 193124, "epoch": 4598} {"train_loss": -7.153779983520508, "global_step": 193125, "epoch": 4598} {"train_loss": -7.206408500671387, "global_step": 193126, "epoch": 4598} {"train_loss": -7.149031639099121, "global_step": 193127, "epoch": 4598} {"train_loss": -7.1748199462890625, "global_step": 193128, "epoch": 4598} {"train_loss": -7.141088485717773, "global_step": 193129, "epoch": 4598} {"train_loss": -7.088773727416992, "global_step": 193130, "epoch": 4598} {"train_loss": -7.15644645690918, "global_step": 193131, "epoch": 4598} {"train_loss": -7.082368850708008, "global_step": 193132, "epoch": 4598} {"train_loss": -7.125114440917969, "global_step": 193133, "epoch": 4598} {"train_loss": -7.192923545837402, "global_step": 193134, "epoch": 4598} {"train_loss": -7.23577880859375, "global_step": 193135, "epoch": 4598} {"train_loss": -7.188699245452881, "global_step": 193136, "epoch": 4598} {"train_loss": -7.1065545082092285, "global_step": 193137, "epoch": 4598} {"train_loss": -7.229950428009033, "global_step": 193138, "epoch": 4598} {"train_loss": -7.145244598388672, "global_step": 193139, "epoch": 4598} {"train_loss": -7.2333221435546875, "global_step": 193140, "epoch": 4598} {"train_loss": -7.039119720458984, "global_step": 193141, "epoch": 4598} {"train_loss": -7.073648452758789, "global_step": 193142, "epoch": 4598} {"train_loss": -7.230031967163086, "global_step": 193143, "epoch": 4598} {"train_loss": -7.1073503494262695, "global_step": 193144, "epoch": 4598} {"train_loss": -7.154905319213867, "global_step": 193145, "epoch": 4598} {"train_loss": -7.2552266120910645, "global_step": 193146, "epoch": 4598} {"train_loss": -7.089141845703125, "global_step": 193147, "epoch": 4598} {"train_loss": -7.186543941497803, "global_step": 193148, "epoch": 4598} {"train_loss": -7.131828308105469, "global_step": 193149, "epoch": 4598} {"train_loss": -7.181275844573975, "global_step": 193150, "epoch": 4598} {"train_loss": -7.012825965881348, "global_step": 193151, "epoch": 4598} {"train_loss": -7.048196315765381, "global_step": 193152, "epoch": 4598} {"train_loss": -7.119146347045898, "global_step": 193153, "epoch": 4598} {"train_loss": -7.038002014160156, "global_step": 193154, "epoch": 4598} {"train_loss": -7.095961570739746, "global_step": 193155, "epoch": 4598} {"train_loss": -7.086504936218262, "global_step": 193156, "epoch": 4598} {"train_loss": -7.13823804401216, "global_step": 193157, "epoch": 4598, "val_loss": 69416.3046875} {"train_loss": -6.922357559204102, "global_step": 193158, "epoch": 4599} {"train_loss": -6.987224578857422, "global_step": 193159, "epoch": 4599} {"train_loss": -7.142284870147705, "global_step": 193160, "epoch": 4599} {"train_loss": -7.003377914428711, "global_step": 193161, "epoch": 4599} {"train_loss": -7.012704849243164, "global_step": 193162, "epoch": 4599} {"train_loss": -7.183698654174805, "global_step": 193163, "epoch": 4599} {"train_loss": -7.109694004058838, "global_step": 193164, "epoch": 4599} {"train_loss": -7.223745346069336, "global_step": 193165, "epoch": 4599} {"train_loss": -7.0200324058532715, "global_step": 193166, "epoch": 4599} {"train_loss": -7.109313011169434, "global_step": 193167, "epoch": 4599} {"train_loss": -7.148637294769287, "global_step": 193168, "epoch": 4599} {"train_loss": -7.054611682891846, "global_step": 193169, "epoch": 4599} {"train_loss": -7.178333282470703, "global_step": 193170, "epoch": 4599} {"train_loss": -7.090412139892578, "global_step": 193171, "epoch": 4599} {"train_loss": -7.055257797241211, "global_step": 193172, "epoch": 4599} {"train_loss": -7.101123809814453, "global_step": 193173, "epoch": 4599} {"train_loss": -7.117968559265137, "global_step": 193174, "epoch": 4599} {"train_loss": -6.957669734954834, "global_step": 193175, "epoch": 4599} {"train_loss": -7.165932655334473, "global_step": 193176, "epoch": 4599} {"train_loss": -6.936493873596191, "global_step": 193177, "epoch": 4599} {"train_loss": -7.106233596801758, "global_step": 193178, "epoch": 4599} {"train_loss": -7.074603080749512, "global_step": 193179, "epoch": 4599} {"train_loss": -7.049093246459961, "global_step": 193180, "epoch": 4599} {"train_loss": -7.285584926605225, "global_step": 193181, "epoch": 4599} {"train_loss": -7.020618915557861, "global_step": 193182, "epoch": 4599} {"train_loss": -7.151081085205078, "global_step": 193183, "epoch": 4599} {"train_loss": -7.146219253540039, "global_step": 193184, "epoch": 4599} {"train_loss": -6.9867095947265625, "global_step": 193185, "epoch": 4599} {"train_loss": -7.102489471435547, "global_step": 193186, "epoch": 4599} {"train_loss": -7.12294864654541, "global_step": 193187, "epoch": 4599} {"train_loss": -7.144765853881836, "global_step": 193188, "epoch": 4599} {"train_loss": -7.178702354431152, "global_step": 193189, "epoch": 4599} {"train_loss": -7.185162544250488, "global_step": 193190, "epoch": 4599} {"train_loss": -7.185544013977051, "global_step": 193191, "epoch": 4599} {"train_loss": -7.202568054199219, "global_step": 193192, "epoch": 4599} {"train_loss": -7.1681742668151855, "global_step": 193193, "epoch": 4599} {"train_loss": -7.023049354553223, "global_step": 193194, "epoch": 4599} {"train_loss": -7.265081405639648, "global_step": 193195, "epoch": 4599} {"train_loss": -7.221525192260742, "global_step": 193196, "epoch": 4599} {"train_loss": -7.1457414627075195, "global_step": 193197, "epoch": 4599} {"train_loss": -7.166894912719727, "global_step": 193198, "epoch": 4599} {"train_loss": -7.110427425021217, "global_step": 193199, "epoch": 4599, "val_loss": 68890.8671875} {"train_loss": -7.249168395996094, "global_step": 193200, "epoch": 4600} {"train_loss": -7.0594305992126465, "global_step": 193201, "epoch": 4600} {"train_loss": -7.171602725982666, "global_step": 193202, "epoch": 4600} {"train_loss": -7.188422203063965, "global_step": 193203, "epoch": 4600} {"train_loss": -6.98512601852417, "global_step": 193204, "epoch": 4600} {"train_loss": -7.1256513595581055, "global_step": 193205, "epoch": 4600} {"train_loss": -7.169540882110596, "global_step": 193206, "epoch": 4600} {"train_loss": -7.123696804046631, "global_step": 193207, "epoch": 4600} {"train_loss": -7.130796432495117, "global_step": 193208, "epoch": 4600} {"train_loss": -6.9296064376831055, "global_step": 193209, "epoch": 4600} {"train_loss": -7.232542037963867, "global_step": 193210, "epoch": 4600} {"train_loss": -7.084071636199951, "global_step": 193211, "epoch": 4600} {"train_loss": -7.20863151550293, "global_step": 193212, "epoch": 4600} {"train_loss": -7.133039474487305, "global_step": 193213, "epoch": 4600} {"train_loss": -7.098541259765625, "global_step": 193214, "epoch": 4600} {"train_loss": -7.1380438804626465, "global_step": 193215, "epoch": 4600} {"train_loss": -7.069509983062744, "global_step": 193216, "epoch": 4600} {"train_loss": -7.167062759399414, "global_step": 193217, "epoch": 4600} {"train_loss": -7.204268455505371, "global_step": 193218, "epoch": 4600} {"train_loss": -7.177153587341309, "global_step": 193219, "epoch": 4600} {"train_loss": -7.2230706214904785, "global_step": 193220, "epoch": 4600} {"train_loss": -7.186262130737305, "global_step": 193221, "epoch": 4600} {"train_loss": -7.236624717712402, "global_step": 193222, "epoch": 4600} {"train_loss": -7.219333648681641, "global_step": 193223, "epoch": 4600} {"train_loss": -7.181474685668945, "global_step": 193224, "epoch": 4600} {"train_loss": -7.140805721282959, "global_step": 193225, "epoch": 4600} {"train_loss": -7.054887771606445, "global_step": 193226, "epoch": 4600} {"train_loss": -7.223978042602539, "global_step": 193227, "epoch": 4600} {"train_loss": -7.191004753112793, "global_step": 193228, "epoch": 4600} {"train_loss": -7.099493980407715, "global_step": 193229, "epoch": 4600} {"train_loss": -7.1283111572265625, "global_step": 193230, "epoch": 4600} {"train_loss": -7.198278427124023, "global_step": 193231, "epoch": 4600} {"train_loss": -7.120936393737793, "global_step": 193232, "epoch": 4600} {"train_loss": -7.170450210571289, "global_step": 193233, "epoch": 4600} {"train_loss": -7.175468444824219, "global_step": 193234, "epoch": 4600} {"train_loss": -7.14334774017334, "global_step": 193235, "epoch": 4600} {"train_loss": -7.257132530212402, "global_step": 193236, "epoch": 4600} {"train_loss": -7.156693458557129, "global_step": 193237, "epoch": 4600} {"train_loss": -7.184348106384277, "global_step": 193238, "epoch": 4600} {"train_loss": -7.134613513946533, "global_step": 193239, "epoch": 4600} {"train_loss": -7.2837347984313965, "global_step": 193240, "epoch": 4600} {"train_loss": -7.154110329491751, "global_step": 193241, "epoch": 4600, "train/sim_max_reward_0": 0.20562838294432095, "train/sim_max_reward_1": 0.8173535635250982, "train/sim_max_reward_2": 0.5732055826828292, "train/sim_max_reward_3": 0.13056974501439006, "train/sim_max_reward_4": 0.4640455190666156, "train/sim_max_reward_5": 0.8969311066789484, "test/sim_max_reward_4400000": 0.9824688122982819, "test/sim_max_reward_4400001": 0.4046890883681518, "test/sim_max_reward_4400002": 0.29483107339490683, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.21215313916797793, "test/sim_max_reward_4400006": 0.01937895392647768, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3123857859393414, "test/sim_max_reward_4400009": 0.927842895926699, "test/sim_max_reward_4400010": 0.9189251265216113, "test/sim_max_reward_4400011": 0.07374125313532413, "test/sim_max_reward_4400012": 0.9504103375525519, "test/sim_max_reward_4400013": 0.9971601371499884, "test/sim_max_reward_4400014": 0.15136708928126136, "test/sim_max_reward_4400015": 0.6959385779207573, "test/sim_max_reward_4400016": 0.16228476185899365, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.27122114792110114, "test/sim_max_reward_4400019": 0.00013103252116892353, "test/sim_max_reward_4400020": 0.9331734831448545, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.21497583960739647, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.3200428748508575, "test/sim_max_reward_4400025": 0.2616323765646197, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.008755073734235275, "test/sim_max_reward_4400028": 0.4445550633956303, "test/sim_max_reward_4400029": 0.9799073920166798, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9719323237377885, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.8760395556983149, "test/sim_max_reward_4400034": 0.920476154469968, "test/sim_max_reward_4400035": 0.9471991849520643, "test/sim_max_reward_4400036": 0.945555714732843, "test/sim_max_reward_4400037": 0.9277828123087467, "test/sim_max_reward_4400038": 0.8567834829245607, "test/sim_max_reward_4400039": 0.9455995946194069, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.5848708284221803, "test/sim_max_reward_4400042": 0.9008339869942089, "test/sim_max_reward_4400043": 0.8989206668547822, "test/sim_max_reward_4400044": 0.9614729048865945, "test/sim_max_reward_4400045": 0.9528813000990515, "test/sim_max_reward_4400046": 0.8769897877647158, "test/sim_max_reward_4400047": 0.9559242054843571, "test/sim_max_reward_4400048": 0.886652899298741, "test/sim_max_reward_4400049": 0.9838019872287227, "train/mean_score": 0.5146223166520337, "test/mean_score": 0.5680983707409962, "val_loss": 68944.828125} {"train_loss": -7.206279754638672, "global_step": 193242, "epoch": 4601} {"train_loss": -7.169309616088867, "global_step": 193243, "epoch": 4601} {"train_loss": -7.204245090484619, "global_step": 193244, "epoch": 4601} {"train_loss": -7.2823591232299805, "global_step": 193245, "epoch": 4601} {"train_loss": -7.114845275878906, "global_step": 193246, "epoch": 4601} {"train_loss": -7.058187484741211, "global_step": 193247, "epoch": 4601} {"train_loss": -7.252774238586426, "global_step": 193248, "epoch": 4601} {"train_loss": -7.054598808288574, "global_step": 193249, "epoch": 4601} {"train_loss": -7.118073463439941, "global_step": 193250, "epoch": 4601} {"train_loss": -7.250136852264404, "global_step": 193251, "epoch": 4601} {"train_loss": -7.044683933258057, "global_step": 193252, "epoch": 4601} {"train_loss": -7.217430114746094, "global_step": 193253, "epoch": 4601} {"train_loss": -7.181990146636963, "global_step": 193254, "epoch": 4601} {"train_loss": -7.001091003417969, "global_step": 193255, "epoch": 4601} {"train_loss": -7.164216041564941, "global_step": 193256, "epoch": 4601} {"train_loss": -7.173640251159668, "global_step": 193257, "epoch": 4601} {"train_loss": -7.259090423583984, "global_step": 193258, "epoch": 4601} {"train_loss": -7.16889762878418, "global_step": 193259, "epoch": 4601} {"train_loss": -7.179131984710693, "global_step": 193260, "epoch": 4601} {"train_loss": -7.195195198059082, "global_step": 193261, "epoch": 4601} {"train_loss": -7.166217803955078, "global_step": 193262, "epoch": 4601} {"train_loss": -7.247067928314209, "global_step": 193263, "epoch": 4601} {"train_loss": -7.140567779541016, "global_step": 193264, "epoch": 4601} {"train_loss": -7.154288291931152, "global_step": 193265, "epoch": 4601} {"train_loss": -7.197244167327881, "global_step": 193266, "epoch": 4601} {"train_loss": -7.258011817932129, "global_step": 193267, "epoch": 4601} {"train_loss": -7.214931488037109, "global_step": 193268, "epoch": 4601} {"train_loss": -7.101287841796875, "global_step": 193269, "epoch": 4601} {"train_loss": -7.284696578979492, "global_step": 193270, "epoch": 4601} {"train_loss": -7.199528217315674, "global_step": 193271, "epoch": 4601} {"train_loss": -7.205480098724365, "global_step": 193272, "epoch": 4601} {"train_loss": -7.121433258056641, "global_step": 193273, "epoch": 4601} {"train_loss": -7.20440673828125, "global_step": 193274, "epoch": 4601} {"train_loss": -7.203917503356934, "global_step": 193275, "epoch": 4601} {"train_loss": -7.104844093322754, "global_step": 193276, "epoch": 4601} {"train_loss": -7.2677154541015625, "global_step": 193277, "epoch": 4601} {"train_loss": -7.159604549407959, "global_step": 193278, "epoch": 4601} {"train_loss": -7.160130500793457, "global_step": 193279, "epoch": 4601} {"train_loss": -7.172865867614746, "global_step": 193280, "epoch": 4601} {"train_loss": -7.200858116149902, "global_step": 193281, "epoch": 4601} {"train_loss": -7.284801483154297, "global_step": 193282, "epoch": 4601} {"train_loss": -7.180769136973789, "global_step": 193283, "epoch": 4601, "val_loss": 68973.8828125} {"train_loss": -7.2058563232421875, "global_step": 193284, "epoch": 4602} {"train_loss": -7.253701210021973, "global_step": 193285, "epoch": 4602} {"train_loss": -7.142243385314941, "global_step": 193286, "epoch": 4602} {"train_loss": -7.200582981109619, "global_step": 193287, "epoch": 4602} {"train_loss": -7.068790435791016, "global_step": 193288, "epoch": 4602} {"train_loss": -7.370718955993652, "global_step": 193289, "epoch": 4602} {"train_loss": -7.080760955810547, "global_step": 193290, "epoch": 4602} {"train_loss": -7.294108867645264, "global_step": 193291, "epoch": 4602} {"train_loss": -7.106247901916504, "global_step": 193292, "epoch": 4602} {"train_loss": -7.233083724975586, "global_step": 193293, "epoch": 4602} {"train_loss": -7.317768573760986, "global_step": 193294, "epoch": 4602} {"train_loss": -7.198966026306152, "global_step": 193295, "epoch": 4602} {"train_loss": -7.107200622558594, "global_step": 193296, "epoch": 4602} {"train_loss": -7.012969970703125, "global_step": 193297, "epoch": 4602} {"train_loss": -7.1991353034973145, "global_step": 193298, "epoch": 4602} {"train_loss": -7.003293991088867, "global_step": 193299, "epoch": 4602} {"train_loss": -7.2664875984191895, "global_step": 193300, "epoch": 4602} {"train_loss": -7.1317138671875, "global_step": 193301, "epoch": 4602} {"train_loss": -7.08961820602417, "global_step": 193302, "epoch": 4602} {"train_loss": -7.124451637268066, "global_step": 193303, "epoch": 4602} {"train_loss": -7.07295036315918, "global_step": 193304, "epoch": 4602} {"train_loss": -7.08431339263916, "global_step": 193305, "epoch": 4602} {"train_loss": -7.059482097625732, "global_step": 193306, "epoch": 4602} {"train_loss": -7.140585899353027, "global_step": 193307, "epoch": 4602} {"train_loss": -7.243168830871582, "global_step": 193308, "epoch": 4602} {"train_loss": -7.141696453094482, "global_step": 193309, "epoch": 4602} {"train_loss": -7.118063926696777, "global_step": 193310, "epoch": 4602} {"train_loss": -7.103946685791016, "global_step": 193311, "epoch": 4602} {"train_loss": -7.102321147918701, "global_step": 193312, "epoch": 4602} {"train_loss": -7.111161231994629, "global_step": 193313, "epoch": 4602} {"train_loss": -7.122177600860596, "global_step": 193314, "epoch": 4602} {"train_loss": -7.118854999542236, "global_step": 193315, "epoch": 4602} {"train_loss": -7.185290336608887, "global_step": 193316, "epoch": 4602} {"train_loss": -7.084888458251953, "global_step": 193317, "epoch": 4602} {"train_loss": -7.091942310333252, "global_step": 193318, "epoch": 4602} {"train_loss": -6.945757865905762, "global_step": 193319, "epoch": 4602} {"train_loss": -7.253374099731445, "global_step": 193320, "epoch": 4602} {"train_loss": -7.118685245513916, "global_step": 193321, "epoch": 4602} {"train_loss": -7.120846271514893, "global_step": 193322, "epoch": 4602} {"train_loss": -7.179086685180664, "global_step": 193323, "epoch": 4602} {"train_loss": -7.155017375946045, "global_step": 193324, "epoch": 4602} {"train_loss": -7.147514263788859, "global_step": 193325, "epoch": 4602, "val_loss": 69081.890625} {"train_loss": -7.168702602386475, "global_step": 193326, "epoch": 4603} {"train_loss": -7.158696174621582, "global_step": 193327, "epoch": 4603} {"train_loss": -7.153989791870117, "global_step": 193328, "epoch": 4603} {"train_loss": -7.139551162719727, "global_step": 193329, "epoch": 4603} {"train_loss": -7.192108154296875, "global_step": 193330, "epoch": 4603} {"train_loss": -7.230729103088379, "global_step": 193331, "epoch": 4603} {"train_loss": -7.005443096160889, "global_step": 193332, "epoch": 4603} {"train_loss": -7.239609241485596, "global_step": 193333, "epoch": 4603} {"train_loss": -7.268484115600586, "global_step": 193334, "epoch": 4603} {"train_loss": -7.209884166717529, "global_step": 193335, "epoch": 4603} {"train_loss": -7.151288032531738, "global_step": 193336, "epoch": 4603} {"train_loss": -7.127749443054199, "global_step": 193337, "epoch": 4603} {"train_loss": -7.270952224731445, "global_step": 193338, "epoch": 4603} {"train_loss": -7.061340808868408, "global_step": 193339, "epoch": 4603} {"train_loss": -7.132542133331299, "global_step": 193340, "epoch": 4603} {"train_loss": -7.229991912841797, "global_step": 193341, "epoch": 4603} {"train_loss": -7.213462829589844, "global_step": 193342, "epoch": 4603} {"train_loss": -7.128419399261475, "global_step": 193343, "epoch": 4603} {"train_loss": -7.117821216583252, "global_step": 193344, "epoch": 4603} {"train_loss": -7.146336555480957, "global_step": 193345, "epoch": 4603} {"train_loss": -7.154754161834717, "global_step": 193346, "epoch": 4603} {"train_loss": -7.1390180587768555, "global_step": 193347, "epoch": 4603} {"train_loss": -7.174807548522949, "global_step": 193348, "epoch": 4603} {"train_loss": -7.118206024169922, "global_step": 193349, "epoch": 4603} {"train_loss": -7.043590068817139, "global_step": 193350, "epoch": 4603} {"train_loss": -7.089531898498535, "global_step": 193351, "epoch": 4603} {"train_loss": -7.156620025634766, "global_step": 193352, "epoch": 4603} {"train_loss": -7.175370216369629, "global_step": 193353, "epoch": 4603} {"train_loss": -7.3361101150512695, "global_step": 193354, "epoch": 4603} {"train_loss": -7.109304428100586, "global_step": 193355, "epoch": 4603} {"train_loss": -7.132229328155518, "global_step": 193356, "epoch": 4603} {"train_loss": -7.146828651428223, "global_step": 193357, "epoch": 4603} {"train_loss": -7.085650444030762, "global_step": 193358, "epoch": 4603} {"train_loss": -7.076863765716553, "global_step": 193359, "epoch": 4603} {"train_loss": -7.143893241882324, "global_step": 193360, "epoch": 4603} {"train_loss": -7.136328220367432, "global_step": 193361, "epoch": 4603} {"train_loss": -7.115483283996582, "global_step": 193362, "epoch": 4603} {"train_loss": -7.073385715484619, "global_step": 193363, "epoch": 4603} {"train_loss": -7.2797698974609375, "global_step": 193364, "epoch": 4603} {"train_loss": -7.014752388000488, "global_step": 193365, "epoch": 4603} {"train_loss": -7.189933776855469, "global_step": 193366, "epoch": 4603} {"train_loss": -7.152952319099789, "global_step": 193367, "epoch": 4603, "val_loss": 68988.234375} {"train_loss": -7.1717023849487305, "global_step": 193368, "epoch": 4604} {"train_loss": -7.260220527648926, "global_step": 193369, "epoch": 4604} {"train_loss": -7.168359756469727, "global_step": 193370, "epoch": 4604} {"train_loss": -7.132339954376221, "global_step": 193371, "epoch": 4604} {"train_loss": -7.201603412628174, "global_step": 193372, "epoch": 4604} {"train_loss": -7.15164852142334, "global_step": 193373, "epoch": 4604} {"train_loss": -7.180882930755615, "global_step": 193374, "epoch": 4604} {"train_loss": -7.290874481201172, "global_step": 193375, "epoch": 4604} {"train_loss": -7.161225318908691, "global_step": 193376, "epoch": 4604} {"train_loss": -7.1815595626831055, "global_step": 193377, "epoch": 4604} {"train_loss": -7.205217361450195, "global_step": 193378, "epoch": 4604} {"train_loss": -7.232858180999756, "global_step": 193379, "epoch": 4604} {"train_loss": -7.247635841369629, "global_step": 193380, "epoch": 4604} {"train_loss": -7.249931335449219, "global_step": 193381, "epoch": 4604} {"train_loss": -7.217270851135254, "global_step": 193382, "epoch": 4604} {"train_loss": -7.108057022094727, "global_step": 193383, "epoch": 4604} {"train_loss": -7.189511299133301, "global_step": 193384, "epoch": 4604} {"train_loss": -7.249055862426758, "global_step": 193385, "epoch": 4604} {"train_loss": -7.129042625427246, "global_step": 193386, "epoch": 4604} {"train_loss": -7.183465957641602, "global_step": 193387, "epoch": 4604} {"train_loss": -7.15175724029541, "global_step": 193388, "epoch": 4604} {"train_loss": -7.244166374206543, "global_step": 193389, "epoch": 4604} {"train_loss": -7.133563995361328, "global_step": 193390, "epoch": 4604} {"train_loss": -7.205108642578125, "global_step": 193391, "epoch": 4604} {"train_loss": -7.155375957489014, "global_step": 193392, "epoch": 4604} {"train_loss": -7.165310859680176, "global_step": 193393, "epoch": 4604} {"train_loss": -7.154252052307129, "global_step": 193394, "epoch": 4604} {"train_loss": -7.205542087554932, "global_step": 193395, "epoch": 4604} {"train_loss": -7.197253227233887, "global_step": 193396, "epoch": 4604} {"train_loss": -7.123291969299316, "global_step": 193397, "epoch": 4604} {"train_loss": -7.142740249633789, "global_step": 193398, "epoch": 4604} {"train_loss": -6.996445655822754, "global_step": 193399, "epoch": 4604} {"train_loss": -7.257855415344238, "global_step": 193400, "epoch": 4604} {"train_loss": -7.023550033569336, "global_step": 193401, "epoch": 4604} {"train_loss": -7.127964019775391, "global_step": 193402, "epoch": 4604} {"train_loss": -7.103849411010742, "global_step": 193403, "epoch": 4604} {"train_loss": -7.2004523277282715, "global_step": 193404, "epoch": 4604} {"train_loss": -7.068957328796387, "global_step": 193405, "epoch": 4604} {"train_loss": -7.150123596191406, "global_step": 193406, "epoch": 4604} {"train_loss": -7.170726776123047, "global_step": 193407, "epoch": 4604} {"train_loss": -7.0665602684021, "global_step": 193408, "epoch": 4604} {"train_loss": -7.167548565637498, "global_step": 193409, "epoch": 4604, "val_loss": 69002.3203125} {"train_loss": -7.103268146514893, "global_step": 193410, "epoch": 4605} {"train_loss": -7.099643707275391, "global_step": 193411, "epoch": 4605} {"train_loss": -7.034508228302002, "global_step": 193412, "epoch": 4605} {"train_loss": -6.971974849700928, "global_step": 193413, "epoch": 4605} {"train_loss": -7.115475654602051, "global_step": 193414, "epoch": 4605} {"train_loss": -7.043111324310303, "global_step": 193415, "epoch": 4605} {"train_loss": -7.141597270965576, "global_step": 193416, "epoch": 4605} {"train_loss": -7.217973232269287, "global_step": 193417, "epoch": 4605} {"train_loss": -7.243387222290039, "global_step": 193418, "epoch": 4605} {"train_loss": -6.999664783477783, "global_step": 193419, "epoch": 4605} {"train_loss": -7.195350646972656, "global_step": 193420, "epoch": 4605} {"train_loss": -7.18955135345459, "global_step": 193421, "epoch": 4605} {"train_loss": -7.097953796386719, "global_step": 193422, "epoch": 4605} {"train_loss": -7.050341606140137, "global_step": 193423, "epoch": 4605} {"train_loss": -7.171352863311768, "global_step": 193424, "epoch": 4605} {"train_loss": -7.072928428649902, "global_step": 193425, "epoch": 4605} {"train_loss": -7.203431129455566, "global_step": 193426, "epoch": 4605} {"train_loss": -7.085238456726074, "global_step": 193427, "epoch": 4605} {"train_loss": -7.11895751953125, "global_step": 193428, "epoch": 4605} {"train_loss": -7.212841987609863, "global_step": 193429, "epoch": 4605} {"train_loss": -6.984257698059082, "global_step": 193430, "epoch": 4605} {"train_loss": -7.189018249511719, "global_step": 193431, "epoch": 4605} {"train_loss": -7.0940704345703125, "global_step": 193432, "epoch": 4605} {"train_loss": -7.158705234527588, "global_step": 193433, "epoch": 4605} {"train_loss": -7.135500907897949, "global_step": 193434, "epoch": 4605} {"train_loss": -7.08474063873291, "global_step": 193435, "epoch": 4605} {"train_loss": -7.20623779296875, "global_step": 193436, "epoch": 4605} {"train_loss": -7.15194034576416, "global_step": 193437, "epoch": 4605} {"train_loss": -7.17726469039917, "global_step": 193438, "epoch": 4605} {"train_loss": -7.1745452880859375, "global_step": 193439, "epoch": 4605} {"train_loss": -7.189208984375, "global_step": 193440, "epoch": 4605} {"train_loss": -7.160141944885254, "global_step": 193441, "epoch": 4605} {"train_loss": -7.099910736083984, "global_step": 193442, "epoch": 4605} {"train_loss": -7.180046081542969, "global_step": 193443, "epoch": 4605} {"train_loss": -7.028558254241943, "global_step": 193444, "epoch": 4605} {"train_loss": -7.105924606323242, "global_step": 193445, "epoch": 4605} {"train_loss": -7.167149066925049, "global_step": 193446, "epoch": 4605} {"train_loss": -7.1832275390625, "global_step": 193447, "epoch": 4605} {"train_loss": -7.1961212158203125, "global_step": 193448, "epoch": 4605} {"train_loss": -7.0829572677612305, "global_step": 193449, "epoch": 4605} {"train_loss": -7.184630870819092, "global_step": 193450, "epoch": 4605} {"train_loss": -7.1295137632460825, "global_step": 193451, "epoch": 4605, "val_loss": 68704.828125} {"train_loss": -7.191431045532227, "global_step": 193452, "epoch": 4606} {"train_loss": -7.216879844665527, "global_step": 193453, "epoch": 4606} {"train_loss": -7.2137451171875, "global_step": 193454, "epoch": 4606} {"train_loss": -7.173273086547852, "global_step": 193455, "epoch": 4606} {"train_loss": -7.27641487121582, "global_step": 193456, "epoch": 4606} {"train_loss": -7.188604354858398, "global_step": 193457, "epoch": 4606} {"train_loss": -7.127690315246582, "global_step": 193458, "epoch": 4606} {"train_loss": -7.288389205932617, "global_step": 193459, "epoch": 4606} {"train_loss": -7.137661457061768, "global_step": 193460, "epoch": 4606} {"train_loss": -7.256119728088379, "global_step": 193461, "epoch": 4606} {"train_loss": -7.116053104400635, "global_step": 193462, "epoch": 4606} {"train_loss": -7.163491249084473, "global_step": 193463, "epoch": 4606} {"train_loss": -7.018071174621582, "global_step": 193464, "epoch": 4606} {"train_loss": -7.080212116241455, "global_step": 193465, "epoch": 4606} {"train_loss": -7.240607261657715, "global_step": 193466, "epoch": 4606} {"train_loss": -7.160492897033691, "global_step": 193467, "epoch": 4606} {"train_loss": -7.215551376342773, "global_step": 193468, "epoch": 4606} {"train_loss": -7.213252067565918, "global_step": 193469, "epoch": 4606} {"train_loss": -7.210998058319092, "global_step": 193470, "epoch": 4606} {"train_loss": -7.247744083404541, "global_step": 193471, "epoch": 4606} {"train_loss": -7.181066513061523, "global_step": 193472, "epoch": 4606} {"train_loss": -7.243188381195068, "global_step": 193473, "epoch": 4606} {"train_loss": -7.207470417022705, "global_step": 193474, "epoch": 4606} {"train_loss": -7.274219512939453, "global_step": 193475, "epoch": 4606} {"train_loss": -7.2914228439331055, "global_step": 193476, "epoch": 4606} {"train_loss": -7.249344825744629, "global_step": 193477, "epoch": 4606} {"train_loss": -7.195898056030273, "global_step": 193478, "epoch": 4606} {"train_loss": -7.1660966873168945, "global_step": 193479, "epoch": 4606} {"train_loss": -7.231540679931641, "global_step": 193480, "epoch": 4606} {"train_loss": -7.226751327514648, "global_step": 193481, "epoch": 4606} {"train_loss": -7.118762969970703, "global_step": 193482, "epoch": 4606} {"train_loss": -7.187007427215576, "global_step": 193483, "epoch": 4606} {"train_loss": -7.336013317108154, "global_step": 193484, "epoch": 4606} {"train_loss": -7.132107734680176, "global_step": 193485, "epoch": 4606} {"train_loss": -7.2754364013671875, "global_step": 193486, "epoch": 4606} {"train_loss": -7.151756763458252, "global_step": 193487, "epoch": 4606} {"train_loss": -7.169525146484375, "global_step": 193488, "epoch": 4606} {"train_loss": -7.1675591468811035, "global_step": 193489, "epoch": 4606} {"train_loss": -7.061248779296875, "global_step": 193490, "epoch": 4606} {"train_loss": -7.229463577270508, "global_step": 193491, "epoch": 4606} {"train_loss": -6.959474563598633, "global_step": 193492, "epoch": 4606} {"train_loss": -7.190745410465059, "global_step": 193493, "epoch": 4606, "val_loss": 68913.0625} {"train_loss": -7.161125183105469, "global_step": 193494, "epoch": 4607} {"train_loss": -7.113824844360352, "global_step": 193495, "epoch": 4607} {"train_loss": -7.1971893310546875, "global_step": 193496, "epoch": 4607} {"train_loss": -7.143372535705566, "global_step": 193497, "epoch": 4607} {"train_loss": -7.230961799621582, "global_step": 193498, "epoch": 4607} {"train_loss": -7.209709644317627, "global_step": 193499, "epoch": 4607} {"train_loss": -7.200874328613281, "global_step": 193500, "epoch": 4607} {"train_loss": -7.153299331665039, "global_step": 193501, "epoch": 4607} {"train_loss": -7.164736747741699, "global_step": 193502, "epoch": 4607} {"train_loss": -7.180169582366943, "global_step": 193503, "epoch": 4607} {"train_loss": -7.142831802368164, "global_step": 193504, "epoch": 4607} {"train_loss": -7.051431179046631, "global_step": 193505, "epoch": 4607} {"train_loss": -7.024845600128174, "global_step": 193506, "epoch": 4607} {"train_loss": -7.09828519821167, "global_step": 193507, "epoch": 4607} {"train_loss": -7.041774749755859, "global_step": 193508, "epoch": 4607} {"train_loss": -6.972893238067627, "global_step": 193509, "epoch": 4607} {"train_loss": -6.9255828857421875, "global_step": 193510, "epoch": 4607} {"train_loss": -7.0495805740356445, "global_step": 193511, "epoch": 4607} {"train_loss": -7.078334808349609, "global_step": 193512, "epoch": 4607} {"train_loss": -7.092472076416016, "global_step": 193513, "epoch": 4607} {"train_loss": -7.074554443359375, "global_step": 193514, "epoch": 4607} {"train_loss": -7.106789588928223, "global_step": 193515, "epoch": 4607} {"train_loss": -7.115781307220459, "global_step": 193516, "epoch": 4607} {"train_loss": -7.059985637664795, "global_step": 193517, "epoch": 4607} {"train_loss": -6.89479923248291, "global_step": 193518, "epoch": 4607} {"train_loss": -6.999703884124756, "global_step": 193519, "epoch": 4607} {"train_loss": -7.0223212242126465, "global_step": 193520, "epoch": 4607} {"train_loss": -7.0717267990112305, "global_step": 193521, "epoch": 4607} {"train_loss": -6.999621391296387, "global_step": 193522, "epoch": 4607} {"train_loss": -7.124266624450684, "global_step": 193523, "epoch": 4607} {"train_loss": -7.132078647613525, "global_step": 193524, "epoch": 4607} {"train_loss": -7.019360542297363, "global_step": 193525, "epoch": 4607} {"train_loss": -7.039791107177734, "global_step": 193526, "epoch": 4607} {"train_loss": -7.100898742675781, "global_step": 193527, "epoch": 4607} {"train_loss": -7.159414291381836, "global_step": 193528, "epoch": 4607} {"train_loss": -7.205849647521973, "global_step": 193529, "epoch": 4607} {"train_loss": -7.03525447845459, "global_step": 193530, "epoch": 4607} {"train_loss": -7.064907073974609, "global_step": 193531, "epoch": 4607} {"train_loss": -7.068370819091797, "global_step": 193532, "epoch": 4607} {"train_loss": -7.031951427459717, "global_step": 193533, "epoch": 4607} {"train_loss": -7.163332939147949, "global_step": 193534, "epoch": 4607} {"train_loss": -7.0913170746394565, "global_step": 193535, "epoch": 4607, "val_loss": 68910.703125} {"train_loss": -7.167236328125, "global_step": 193536, "epoch": 4608} {"train_loss": -7.3037943840026855, "global_step": 193537, "epoch": 4608} {"train_loss": -7.11962366104126, "global_step": 193538, "epoch": 4608} {"train_loss": -7.091583251953125, "global_step": 193539, "epoch": 4608} {"train_loss": -7.222506523132324, "global_step": 193540, "epoch": 4608} {"train_loss": -7.08262825012207, "global_step": 193541, "epoch": 4608} {"train_loss": -7.1857709884643555, "global_step": 193542, "epoch": 4608} {"train_loss": -7.178276062011719, "global_step": 193543, "epoch": 4608} {"train_loss": -7.363822937011719, "global_step": 193544, "epoch": 4608} {"train_loss": -7.18712043762207, "global_step": 193545, "epoch": 4608} {"train_loss": -7.105873107910156, "global_step": 193546, "epoch": 4608} {"train_loss": -7.240545272827148, "global_step": 193547, "epoch": 4608} {"train_loss": -7.116398334503174, "global_step": 193548, "epoch": 4608} {"train_loss": -7.272298336029053, "global_step": 193549, "epoch": 4608} {"train_loss": -7.190184593200684, "global_step": 193550, "epoch": 4608} {"train_loss": -7.1603007316589355, "global_step": 193551, "epoch": 4608} {"train_loss": -7.097714424133301, "global_step": 193552, "epoch": 4608} {"train_loss": -7.076703071594238, "global_step": 193553, "epoch": 4608} {"train_loss": -7.182168960571289, "global_step": 193554, "epoch": 4608} {"train_loss": -7.2294464111328125, "global_step": 193555, "epoch": 4608} {"train_loss": -7.195712089538574, "global_step": 193556, "epoch": 4608} {"train_loss": -7.196963310241699, "global_step": 193557, "epoch": 4608} {"train_loss": -7.303426742553711, "global_step": 193558, "epoch": 4608} {"train_loss": -7.193994045257568, "global_step": 193559, "epoch": 4608} {"train_loss": -7.258633136749268, "global_step": 193560, "epoch": 4608} {"train_loss": -7.197464942932129, "global_step": 193561, "epoch": 4608} {"train_loss": -7.207096099853516, "global_step": 193562, "epoch": 4608} {"train_loss": -7.1418609619140625, "global_step": 193563, "epoch": 4608} {"train_loss": -7.123195648193359, "global_step": 193564, "epoch": 4608} {"train_loss": -7.179485321044922, "global_step": 193565, "epoch": 4608} {"train_loss": -7.209773063659668, "global_step": 193566, "epoch": 4608} {"train_loss": -7.165581703186035, "global_step": 193567, "epoch": 4608} {"train_loss": -7.2158660888671875, "global_step": 193568, "epoch": 4608} {"train_loss": -7.2731428146362305, "global_step": 193569, "epoch": 4608} {"train_loss": -7.118411064147949, "global_step": 193570, "epoch": 4608} {"train_loss": -7.344361305236816, "global_step": 193571, "epoch": 4608} {"train_loss": -7.186610221862793, "global_step": 193572, "epoch": 4608} {"train_loss": -7.253941535949707, "global_step": 193573, "epoch": 4608} {"train_loss": -7.226677417755127, "global_step": 193574, "epoch": 4608} {"train_loss": -7.152303695678711, "global_step": 193575, "epoch": 4608} {"train_loss": -7.173323631286621, "global_step": 193576, "epoch": 4608} {"train_loss": -7.193134830111549, "global_step": 193577, "epoch": 4608, "val_loss": 69042.8984375} {"train_loss": -7.2055792808532715, "global_step": 193578, "epoch": 4609} {"train_loss": -7.241621971130371, "global_step": 193579, "epoch": 4609} {"train_loss": -7.152888298034668, "global_step": 193580, "epoch": 4609} {"train_loss": -7.149557590484619, "global_step": 193581, "epoch": 4609} {"train_loss": -7.150686264038086, "global_step": 193582, "epoch": 4609} {"train_loss": -7.210878372192383, "global_step": 193583, "epoch": 4609} {"train_loss": -7.281909942626953, "global_step": 193584, "epoch": 4609} {"train_loss": -7.178224563598633, "global_step": 193585, "epoch": 4609} {"train_loss": -7.235740661621094, "global_step": 193586, "epoch": 4609} {"train_loss": -7.2066330909729, "global_step": 193587, "epoch": 4609} {"train_loss": -7.215737342834473, "global_step": 193588, "epoch": 4609} {"train_loss": -7.214564323425293, "global_step": 193589, "epoch": 4609} {"train_loss": -7.193734169006348, "global_step": 193590, "epoch": 4609} {"train_loss": -7.252019882202148, "global_step": 193591, "epoch": 4609} {"train_loss": -7.161468505859375, "global_step": 193592, "epoch": 4609} {"train_loss": -7.18559455871582, "global_step": 193593, "epoch": 4609} {"train_loss": -7.280823707580566, "global_step": 193594, "epoch": 4609} {"train_loss": -7.2248454093933105, "global_step": 193595, "epoch": 4609} {"train_loss": -7.278836250305176, "global_step": 193596, "epoch": 4609} {"train_loss": -7.1605939865112305, "global_step": 193597, "epoch": 4609} {"train_loss": -7.220170021057129, "global_step": 193598, "epoch": 4609} {"train_loss": -7.225238800048828, "global_step": 193599, "epoch": 4609} {"train_loss": -7.226273536682129, "global_step": 193600, "epoch": 4609} {"train_loss": -7.186450481414795, "global_step": 193601, "epoch": 4609} {"train_loss": -7.149547576904297, "global_step": 193602, "epoch": 4609} {"train_loss": -7.152131080627441, "global_step": 193603, "epoch": 4609} {"train_loss": -7.196155548095703, "global_step": 193604, "epoch": 4609} {"train_loss": -7.098123550415039, "global_step": 193605, "epoch": 4609} {"train_loss": -7.226558685302734, "global_step": 193606, "epoch": 4609} {"train_loss": -7.171391487121582, "global_step": 193607, "epoch": 4609} {"train_loss": -7.249195098876953, "global_step": 193608, "epoch": 4609} {"train_loss": -7.185471534729004, "global_step": 193609, "epoch": 4609} {"train_loss": -7.242203712463379, "global_step": 193610, "epoch": 4609} {"train_loss": -7.2539215087890625, "global_step": 193611, "epoch": 4609} {"train_loss": -7.160488128662109, "global_step": 193612, "epoch": 4609} {"train_loss": -7.139575004577637, "global_step": 193613, "epoch": 4609} {"train_loss": -7.217269420623779, "global_step": 193614, "epoch": 4609} {"train_loss": -7.271676540374756, "global_step": 193615, "epoch": 4609} {"train_loss": -7.116447448730469, "global_step": 193616, "epoch": 4609} {"train_loss": -7.002225875854492, "global_step": 193617, "epoch": 4609} {"train_loss": -7.2766008377075195, "global_step": 193618, "epoch": 4609} {"train_loss": -7.197271982828776, "global_step": 193619, "epoch": 4609, "val_loss": 68899.71875} {"train_loss": -7.119991779327393, "global_step": 193620, "epoch": 4610} {"train_loss": -7.096030235290527, "global_step": 193621, "epoch": 4610} {"train_loss": -7.201162338256836, "global_step": 193622, "epoch": 4610} {"train_loss": -7.223578453063965, "global_step": 193623, "epoch": 4610} {"train_loss": -7.17045259475708, "global_step": 193624, "epoch": 4610} {"train_loss": -7.115736961364746, "global_step": 193625, "epoch": 4610} {"train_loss": -7.130638122558594, "global_step": 193626, "epoch": 4610} {"train_loss": -7.212613105773926, "global_step": 193627, "epoch": 4610} {"train_loss": -7.094329833984375, "global_step": 193628, "epoch": 4610} {"train_loss": -7.168975830078125, "global_step": 193629, "epoch": 4610} {"train_loss": -7.107520580291748, "global_step": 193630, "epoch": 4610} {"train_loss": -7.099092483520508, "global_step": 193631, "epoch": 4610} {"train_loss": -7.206831932067871, "global_step": 193632, "epoch": 4610} {"train_loss": -7.247344970703125, "global_step": 193633, "epoch": 4610} {"train_loss": -7.273619651794434, "global_step": 193634, "epoch": 4610} {"train_loss": -7.219759941101074, "global_step": 193635, "epoch": 4610} {"train_loss": -7.360969543457031, "global_step": 193636, "epoch": 4610} {"train_loss": -7.037384510040283, "global_step": 193637, "epoch": 4610} {"train_loss": -7.319362640380859, "global_step": 193638, "epoch": 4610} {"train_loss": -7.249490737915039, "global_step": 193639, "epoch": 4610} {"train_loss": -7.189298629760742, "global_step": 193640, "epoch": 4610} {"train_loss": -7.260448932647705, "global_step": 193641, "epoch": 4610} {"train_loss": -7.195560455322266, "global_step": 193642, "epoch": 4610} {"train_loss": -7.200211048126221, "global_step": 193643, "epoch": 4610} {"train_loss": -7.254197120666504, "global_step": 193644, "epoch": 4610} {"train_loss": -7.187137603759766, "global_step": 193645, "epoch": 4610} {"train_loss": -7.272525787353516, "global_step": 193646, "epoch": 4610} {"train_loss": -7.097174644470215, "global_step": 193647, "epoch": 4610} {"train_loss": -7.107065200805664, "global_step": 193648, "epoch": 4610} {"train_loss": -7.190814971923828, "global_step": 193649, "epoch": 4610} {"train_loss": -7.111026763916016, "global_step": 193650, "epoch": 4610} {"train_loss": -7.2172465324401855, "global_step": 193651, "epoch": 4610} {"train_loss": -7.159552574157715, "global_step": 193652, "epoch": 4610} {"train_loss": -7.193550109863281, "global_step": 193653, "epoch": 4610} {"train_loss": -7.107081413269043, "global_step": 193654, "epoch": 4610} {"train_loss": -7.103062152862549, "global_step": 193655, "epoch": 4610} {"train_loss": -7.184630870819092, "global_step": 193656, "epoch": 4610} {"train_loss": -7.2331037521362305, "global_step": 193657, "epoch": 4610} {"train_loss": -7.0561957359313965, "global_step": 193658, "epoch": 4610} {"train_loss": -7.220783710479736, "global_step": 193659, "epoch": 4610} {"train_loss": -7.217947483062744, "global_step": 193660, "epoch": 4610} {"train_loss": -7.182978845777965, "global_step": 193661, "epoch": 4610, "val_loss": 68912.7890625} {"train_loss": -7.220195770263672, "global_step": 193662, "epoch": 4611} {"train_loss": -7.207336902618408, "global_step": 193663, "epoch": 4611} {"train_loss": -7.230474472045898, "global_step": 193664, "epoch": 4611} {"train_loss": -7.164272785186768, "global_step": 193665, "epoch": 4611} {"train_loss": -7.094411849975586, "global_step": 193666, "epoch": 4611} {"train_loss": -7.060003280639648, "global_step": 193667, "epoch": 4611} {"train_loss": -7.285935878753662, "global_step": 193668, "epoch": 4611} {"train_loss": -7.075616359710693, "global_step": 193669, "epoch": 4611} {"train_loss": -7.194559097290039, "global_step": 193670, "epoch": 4611} {"train_loss": -7.215381145477295, "global_step": 193671, "epoch": 4611} {"train_loss": -7.0720672607421875, "global_step": 193672, "epoch": 4611} {"train_loss": -7.103971004486084, "global_step": 193673, "epoch": 4611} {"train_loss": -7.130587100982666, "global_step": 193674, "epoch": 4611} {"train_loss": -7.103875160217285, "global_step": 193675, "epoch": 4611} {"train_loss": -7.115278720855713, "global_step": 193676, "epoch": 4611} {"train_loss": -7.088878631591797, "global_step": 193677, "epoch": 4611} {"train_loss": -7.031966209411621, "global_step": 193678, "epoch": 4611} {"train_loss": -7.108969688415527, "global_step": 193679, "epoch": 4611} {"train_loss": -7.160840034484863, "global_step": 193680, "epoch": 4611} {"train_loss": -7.1819562911987305, "global_step": 193681, "epoch": 4611} {"train_loss": -7.174955368041992, "global_step": 193682, "epoch": 4611} {"train_loss": -7.042656898498535, "global_step": 193683, "epoch": 4611} {"train_loss": -7.087154865264893, "global_step": 193684, "epoch": 4611} {"train_loss": -7.147544860839844, "global_step": 193685, "epoch": 4611} {"train_loss": -7.07731819152832, "global_step": 193686, "epoch": 4611} {"train_loss": -7.097108364105225, "global_step": 193687, "epoch": 4611} {"train_loss": -7.120082855224609, "global_step": 193688, "epoch": 4611} {"train_loss": -6.954530715942383, "global_step": 193689, "epoch": 4611} {"train_loss": -7.2671799659729, "global_step": 193690, "epoch": 4611} {"train_loss": -7.173080921173096, "global_step": 193691, "epoch": 4611} {"train_loss": -7.060477256774902, "global_step": 193692, "epoch": 4611} {"train_loss": -7.079478740692139, "global_step": 193693, "epoch": 4611} {"train_loss": -7.011111259460449, "global_step": 193694, "epoch": 4611} {"train_loss": -7.129261016845703, "global_step": 193695, "epoch": 4611} {"train_loss": -7.039931297302246, "global_step": 193696, "epoch": 4611} {"train_loss": -7.075601577758789, "global_step": 193697, "epoch": 4611} {"train_loss": -7.159569263458252, "global_step": 193698, "epoch": 4611} {"train_loss": -7.136752605438232, "global_step": 193699, "epoch": 4611} {"train_loss": -7.16408109664917, "global_step": 193700, "epoch": 4611} {"train_loss": -7.074122428894043, "global_step": 193701, "epoch": 4611} {"train_loss": -7.079338550567627, "global_step": 193702, "epoch": 4611} {"train_loss": -7.123041845503307, "global_step": 193703, "epoch": 4611, "val_loss": 68890.8359375} {"train_loss": -7.178807258605957, "global_step": 193704, "epoch": 4612} {"train_loss": -7.245487213134766, "global_step": 193705, "epoch": 4612} {"train_loss": -7.299924850463867, "global_step": 193706, "epoch": 4612} {"train_loss": -7.228455543518066, "global_step": 193707, "epoch": 4612} {"train_loss": -7.143972396850586, "global_step": 193708, "epoch": 4612} {"train_loss": -7.075725555419922, "global_step": 193709, "epoch": 4612} {"train_loss": -7.280585289001465, "global_step": 193710, "epoch": 4612} {"train_loss": -7.136410713195801, "global_step": 193711, "epoch": 4612} {"train_loss": -7.031301021575928, "global_step": 193712, "epoch": 4612} {"train_loss": -7.156022071838379, "global_step": 193713, "epoch": 4612} {"train_loss": -7.1516571044921875, "global_step": 193714, "epoch": 4612} {"train_loss": -7.215763092041016, "global_step": 193715, "epoch": 4612} {"train_loss": -7.181136131286621, "global_step": 193716, "epoch": 4612} {"train_loss": -7.229938507080078, "global_step": 193717, "epoch": 4612} {"train_loss": -7.14848518371582, "global_step": 193718, "epoch": 4612} {"train_loss": -7.235311508178711, "global_step": 193719, "epoch": 4612} {"train_loss": -7.171295642852783, "global_step": 193720, "epoch": 4612} {"train_loss": -7.239761829376221, "global_step": 193721, "epoch": 4612} {"train_loss": -7.23983097076416, "global_step": 193722, "epoch": 4612} {"train_loss": -7.161880970001221, "global_step": 193723, "epoch": 4612} {"train_loss": -7.213870048522949, "global_step": 193724, "epoch": 4612} {"train_loss": -7.111011505126953, "global_step": 193725, "epoch": 4612} {"train_loss": -7.152454853057861, "global_step": 193726, "epoch": 4612} {"train_loss": -7.198479652404785, "global_step": 193727, "epoch": 4612} {"train_loss": -7.066222190856934, "global_step": 193728, "epoch": 4612} {"train_loss": -7.131155967712402, "global_step": 193729, "epoch": 4612} {"train_loss": -7.137211799621582, "global_step": 193730, "epoch": 4612} {"train_loss": -7.038182735443115, "global_step": 193731, "epoch": 4612} {"train_loss": -7.001680374145508, "global_step": 193732, "epoch": 4612} {"train_loss": -7.136372089385986, "global_step": 193733, "epoch": 4612} {"train_loss": -7.267722129821777, "global_step": 193734, "epoch": 4612} {"train_loss": -7.164239883422852, "global_step": 193735, "epoch": 4612} {"train_loss": -7.137197971343994, "global_step": 193736, "epoch": 4612} {"train_loss": -7.168211936950684, "global_step": 193737, "epoch": 4612} {"train_loss": -7.066601276397705, "global_step": 193738, "epoch": 4612} {"train_loss": -7.159419536590576, "global_step": 193739, "epoch": 4612} {"train_loss": -7.1312174797058105, "global_step": 193740, "epoch": 4612} {"train_loss": -7.136302947998047, "global_step": 193741, "epoch": 4612} {"train_loss": -7.283123970031738, "global_step": 193742, "epoch": 4612} {"train_loss": -7.232987880706787, "global_step": 193743, "epoch": 4612} {"train_loss": -7.138963222503662, "global_step": 193744, "epoch": 4612} {"train_loss": -7.16418415024167, "global_step": 193745, "epoch": 4612, "val_loss": 68991.90625} {"train_loss": -7.103194236755371, "global_step": 193746, "epoch": 4613} {"train_loss": -7.085418224334717, "global_step": 193747, "epoch": 4613} {"train_loss": -7.256660461425781, "global_step": 193748, "epoch": 4613} {"train_loss": -7.086231708526611, "global_step": 193749, "epoch": 4613} {"train_loss": -7.202248573303223, "global_step": 193750, "epoch": 4613} {"train_loss": -7.117397308349609, "global_step": 193751, "epoch": 4613} {"train_loss": -7.140621185302734, "global_step": 193752, "epoch": 4613} {"train_loss": -7.151293754577637, "global_step": 193753, "epoch": 4613} {"train_loss": -7.176231384277344, "global_step": 193754, "epoch": 4613} {"train_loss": -7.162195682525635, "global_step": 193755, "epoch": 4613} {"train_loss": -7.147144794464111, "global_step": 193756, "epoch": 4613} {"train_loss": -7.090960502624512, "global_step": 193757, "epoch": 4613} {"train_loss": -7.013627529144287, "global_step": 193758, "epoch": 4613} {"train_loss": -6.817138671875, "global_step": 193759, "epoch": 4613} {"train_loss": -7.1600022315979, "global_step": 193760, "epoch": 4613} {"train_loss": -7.013619422912598, "global_step": 193761, "epoch": 4613} {"train_loss": -7.278624057769775, "global_step": 193762, "epoch": 4613} {"train_loss": -7.28373908996582, "global_step": 193763, "epoch": 4613} {"train_loss": -7.107842445373535, "global_step": 193764, "epoch": 4613} {"train_loss": -7.204923152923584, "global_step": 193765, "epoch": 4613} {"train_loss": -7.197898864746094, "global_step": 193766, "epoch": 4613} {"train_loss": -7.1480913162231445, "global_step": 193767, "epoch": 4613} {"train_loss": -7.255641937255859, "global_step": 193768, "epoch": 4613} {"train_loss": -7.231232643127441, "global_step": 193769, "epoch": 4613} {"train_loss": -7.103004455566406, "global_step": 193770, "epoch": 4613} {"train_loss": -7.100306510925293, "global_step": 193771, "epoch": 4613} {"train_loss": -7.124933242797852, "global_step": 193772, "epoch": 4613} {"train_loss": -7.213794231414795, "global_step": 193773, "epoch": 4613} {"train_loss": -7.151515007019043, "global_step": 193774, "epoch": 4613} {"train_loss": -7.148225784301758, "global_step": 193775, "epoch": 4613} {"train_loss": -7.100813865661621, "global_step": 193776, "epoch": 4613} {"train_loss": -7.1988444328308105, "global_step": 193777, "epoch": 4613} {"train_loss": -7.213275909423828, "global_step": 193778, "epoch": 4613} {"train_loss": -7.147309303283691, "global_step": 193779, "epoch": 4613} {"train_loss": -7.145374298095703, "global_step": 193780, "epoch": 4613} {"train_loss": -7.066337585449219, "global_step": 193781, "epoch": 4613} {"train_loss": -7.133352756500244, "global_step": 193782, "epoch": 4613} {"train_loss": -7.158868789672852, "global_step": 193783, "epoch": 4613} {"train_loss": -7.164895057678223, "global_step": 193784, "epoch": 4613} {"train_loss": -6.978039741516113, "global_step": 193785, "epoch": 4613} {"train_loss": -7.141993522644043, "global_step": 193786, "epoch": 4613} {"train_loss": -7.139341479256039, "global_step": 193787, "epoch": 4613, "val_loss": 69031.1875} {"train_loss": -7.095671653747559, "global_step": 193788, "epoch": 4614} {"train_loss": -7.13385009765625, "global_step": 193789, "epoch": 4614} {"train_loss": -7.227658271789551, "global_step": 193790, "epoch": 4614} {"train_loss": -7.116001129150391, "global_step": 193791, "epoch": 4614} {"train_loss": -7.061771392822266, "global_step": 193792, "epoch": 4614} {"train_loss": -7.165210723876953, "global_step": 193793, "epoch": 4614} {"train_loss": -7.2256574630737305, "global_step": 193794, "epoch": 4614} {"train_loss": -7.201410293579102, "global_step": 193795, "epoch": 4614} {"train_loss": -7.232930660247803, "global_step": 193796, "epoch": 4614} {"train_loss": -7.145755767822266, "global_step": 193797, "epoch": 4614} {"train_loss": -7.166213512420654, "global_step": 193798, "epoch": 4614} {"train_loss": -7.197012901306152, "global_step": 193799, "epoch": 4614} {"train_loss": -7.177850246429443, "global_step": 193800, "epoch": 4614} {"train_loss": -7.250307083129883, "global_step": 193801, "epoch": 4614} {"train_loss": -7.258603096008301, "global_step": 193802, "epoch": 4614} {"train_loss": -7.180556297302246, "global_step": 193803, "epoch": 4614} {"train_loss": -7.190711975097656, "global_step": 193804, "epoch": 4614} {"train_loss": -7.164939880371094, "global_step": 193805, "epoch": 4614} {"train_loss": -7.193024635314941, "global_step": 193806, "epoch": 4614} {"train_loss": -7.19087553024292, "global_step": 193807, "epoch": 4614} {"train_loss": -7.285737037658691, "global_step": 193808, "epoch": 4614} {"train_loss": -7.096953392028809, "global_step": 193809, "epoch": 4614} {"train_loss": -7.132167816162109, "global_step": 193810, "epoch": 4614} {"train_loss": -7.1810173988342285, "global_step": 193811, "epoch": 4614} {"train_loss": -7.195189476013184, "global_step": 193812, "epoch": 4614} {"train_loss": -7.146646499633789, "global_step": 193813, "epoch": 4614} {"train_loss": -7.168776988983154, "global_step": 193814, "epoch": 4614} {"train_loss": -7.135993480682373, "global_step": 193815, "epoch": 4614} {"train_loss": -7.213098526000977, "global_step": 193816, "epoch": 4614} {"train_loss": -7.165397644042969, "global_step": 193817, "epoch": 4614} {"train_loss": -7.143400192260742, "global_step": 193818, "epoch": 4614} {"train_loss": -7.15956974029541, "global_step": 193819, "epoch": 4614} {"train_loss": -7.279526233673096, "global_step": 193820, "epoch": 4614} {"train_loss": -7.154915809631348, "global_step": 193821, "epoch": 4614} {"train_loss": -7.138377666473389, "global_step": 193822, "epoch": 4614} {"train_loss": -7.239034652709961, "global_step": 193823, "epoch": 4614} {"train_loss": -7.248350143432617, "global_step": 193824, "epoch": 4614} {"train_loss": -7.063758850097656, "global_step": 193825, "epoch": 4614} {"train_loss": -7.228874206542969, "global_step": 193826, "epoch": 4614} {"train_loss": -7.022002220153809, "global_step": 193827, "epoch": 4614} {"train_loss": -7.0549726486206055, "global_step": 193828, "epoch": 4614} {"train_loss": -7.169044244857061, "global_step": 193829, "epoch": 4614, "val_loss": 69195.7265625} {"train_loss": -7.142882823944092, "global_step": 193830, "epoch": 4615} {"train_loss": -7.1860456466674805, "global_step": 193831, "epoch": 4615} {"train_loss": -7.20269775390625, "global_step": 193832, "epoch": 4615} {"train_loss": -7.217653274536133, "global_step": 193833, "epoch": 4615} {"train_loss": -7.167876243591309, "global_step": 193834, "epoch": 4615} {"train_loss": -7.101919174194336, "global_step": 193835, "epoch": 4615} {"train_loss": -7.1491570472717285, "global_step": 193836, "epoch": 4615} {"train_loss": -7.0877227783203125, "global_step": 193837, "epoch": 4615} {"train_loss": -7.226155757904053, "global_step": 193838, "epoch": 4615} {"train_loss": -7.228629112243652, "global_step": 193839, "epoch": 4615} {"train_loss": -7.136036396026611, "global_step": 193840, "epoch": 4615} {"train_loss": -7.193031311035156, "global_step": 193841, "epoch": 4615} {"train_loss": -7.075434684753418, "global_step": 193842, "epoch": 4615} {"train_loss": -7.139497756958008, "global_step": 193843, "epoch": 4615} {"train_loss": -7.083548545837402, "global_step": 193844, "epoch": 4615} {"train_loss": -7.150588035583496, "global_step": 193845, "epoch": 4615} {"train_loss": -7.224608421325684, "global_step": 193846, "epoch": 4615} {"train_loss": -7.109367370605469, "global_step": 193847, "epoch": 4615} {"train_loss": -7.069774627685547, "global_step": 193848, "epoch": 4615} {"train_loss": -7.133205413818359, "global_step": 193849, "epoch": 4615} {"train_loss": -7.110045909881592, "global_step": 193850, "epoch": 4615} {"train_loss": -7.131118297576904, "global_step": 193851, "epoch": 4615} {"train_loss": -7.050617218017578, "global_step": 193852, "epoch": 4615} {"train_loss": -7.126755714416504, "global_step": 193853, "epoch": 4615} {"train_loss": -7.039995193481445, "global_step": 193854, "epoch": 4615} {"train_loss": -7.046405792236328, "global_step": 193855, "epoch": 4615} {"train_loss": -7.094326496124268, "global_step": 193856, "epoch": 4615} {"train_loss": -7.192013740539551, "global_step": 193857, "epoch": 4615} {"train_loss": -7.0663909912109375, "global_step": 193858, "epoch": 4615} {"train_loss": -7.219900131225586, "global_step": 193859, "epoch": 4615} {"train_loss": -7.205278396606445, "global_step": 193860, "epoch": 4615} {"train_loss": -7.147735595703125, "global_step": 193861, "epoch": 4615} {"train_loss": -7.219269752502441, "global_step": 193862, "epoch": 4615} {"train_loss": -7.16949462890625, "global_step": 193863, "epoch": 4615} {"train_loss": -7.2091264724731445, "global_step": 193864, "epoch": 4615} {"train_loss": -7.204954147338867, "global_step": 193865, "epoch": 4615} {"train_loss": -7.01545524597168, "global_step": 193866, "epoch": 4615} {"train_loss": -7.120993614196777, "global_step": 193867, "epoch": 4615} {"train_loss": -7.14420223236084, "global_step": 193868, "epoch": 4615} {"train_loss": -6.997573375701904, "global_step": 193869, "epoch": 4615} {"train_loss": -7.2029500007629395, "global_step": 193870, "epoch": 4615} {"train_loss": -7.139663923354376, "global_step": 193871, "epoch": 4615, "val_loss": 69130.5546875} {"train_loss": -7.151854515075684, "global_step": 193872, "epoch": 4616} {"train_loss": -7.141664981842041, "global_step": 193873, "epoch": 4616} {"train_loss": -7.253918170928955, "global_step": 193874, "epoch": 4616} {"train_loss": -7.118979454040527, "global_step": 193875, "epoch": 4616} {"train_loss": -7.192004203796387, "global_step": 193876, "epoch": 4616} {"train_loss": -7.199878692626953, "global_step": 193877, "epoch": 4616} {"train_loss": -7.265583038330078, "global_step": 193878, "epoch": 4616} {"train_loss": -7.096532344818115, "global_step": 193879, "epoch": 4616} {"train_loss": -7.144578456878662, "global_step": 193880, "epoch": 4616} {"train_loss": -7.203986167907715, "global_step": 193881, "epoch": 4616} {"train_loss": -7.04632568359375, "global_step": 193882, "epoch": 4616} {"train_loss": -7.133273601531982, "global_step": 193883, "epoch": 4616} {"train_loss": -7.047425270080566, "global_step": 193884, "epoch": 4616} {"train_loss": -7.045039176940918, "global_step": 193885, "epoch": 4616} {"train_loss": -7.235992431640625, "global_step": 193886, "epoch": 4616} {"train_loss": -7.034055233001709, "global_step": 193887, "epoch": 4616} {"train_loss": -7.124942779541016, "global_step": 193888, "epoch": 4616} {"train_loss": -7.105782508850098, "global_step": 193889, "epoch": 4616} {"train_loss": -7.15067195892334, "global_step": 193890, "epoch": 4616} {"train_loss": -7.102535247802734, "global_step": 193891, "epoch": 4616} {"train_loss": -6.97787618637085, "global_step": 193892, "epoch": 4616} {"train_loss": -7.123653888702393, "global_step": 193893, "epoch": 4616} {"train_loss": -7.185031890869141, "global_step": 193894, "epoch": 4616} {"train_loss": -7.136101722717285, "global_step": 193895, "epoch": 4616} {"train_loss": -7.088125705718994, "global_step": 193896, "epoch": 4616} {"train_loss": -7.179450988769531, "global_step": 193897, "epoch": 4616} {"train_loss": -7.156123161315918, "global_step": 193898, "epoch": 4616} {"train_loss": -7.117408752441406, "global_step": 193899, "epoch": 4616} {"train_loss": -7.098247528076172, "global_step": 193900, "epoch": 4616} {"train_loss": -6.969762802124023, "global_step": 193901, "epoch": 4616} {"train_loss": -7.077125549316406, "global_step": 193902, "epoch": 4616} {"train_loss": -7.081112861633301, "global_step": 193903, "epoch": 4616} {"train_loss": -7.005939960479736, "global_step": 193904, "epoch": 4616} {"train_loss": -7.083015441894531, "global_step": 193905, "epoch": 4616} {"train_loss": -7.015252113342285, "global_step": 193906, "epoch": 4616} {"train_loss": -7.085034370422363, "global_step": 193907, "epoch": 4616} {"train_loss": -7.016253471374512, "global_step": 193908, "epoch": 4616} {"train_loss": -6.944647789001465, "global_step": 193909, "epoch": 4616} {"train_loss": -7.052849292755127, "global_step": 193910, "epoch": 4616} {"train_loss": -7.000342845916748, "global_step": 193911, "epoch": 4616} {"train_loss": -7.040606498718262, "global_step": 193912, "epoch": 4616} {"train_loss": -7.101320119131179, "global_step": 193913, "epoch": 4616, "val_loss": 68845.9609375} {"train_loss": -7.0731353759765625, "global_step": 193914, "epoch": 4617} {"train_loss": -7.089890003204346, "global_step": 193915, "epoch": 4617} {"train_loss": -7.0277910232543945, "global_step": 193916, "epoch": 4617} {"train_loss": -7.222970008850098, "global_step": 193917, "epoch": 4617} {"train_loss": -7.08998966217041, "global_step": 193918, "epoch": 4617} {"train_loss": -7.204190731048584, "global_step": 193919, "epoch": 4617} {"train_loss": -7.078521728515625, "global_step": 193920, "epoch": 4617} {"train_loss": -7.1644158363342285, "global_step": 193921, "epoch": 4617} {"train_loss": -7.108822345733643, "global_step": 193922, "epoch": 4617} {"train_loss": -7.080233573913574, "global_step": 193923, "epoch": 4617} {"train_loss": -6.99273681640625, "global_step": 193924, "epoch": 4617} {"train_loss": -7.071415901184082, "global_step": 193925, "epoch": 4617} {"train_loss": -7.1793107986450195, "global_step": 193926, "epoch": 4617} {"train_loss": -7.02177095413208, "global_step": 193927, "epoch": 4617} {"train_loss": -7.136809349060059, "global_step": 193928, "epoch": 4617} {"train_loss": -7.180518627166748, "global_step": 193929, "epoch": 4617} {"train_loss": -7.254698753356934, "global_step": 193930, "epoch": 4617} {"train_loss": -7.205722332000732, "global_step": 193931, "epoch": 4617} {"train_loss": -7.200225830078125, "global_step": 193932, "epoch": 4617} {"train_loss": -7.150869369506836, "global_step": 193933, "epoch": 4617} {"train_loss": -7.177652359008789, "global_step": 193934, "epoch": 4617} {"train_loss": -7.240629196166992, "global_step": 193935, "epoch": 4617} {"train_loss": -7.125811576843262, "global_step": 193936, "epoch": 4617} {"train_loss": -7.347449779510498, "global_step": 193937, "epoch": 4617} {"train_loss": -7.187086582183838, "global_step": 193938, "epoch": 4617} {"train_loss": -7.190040588378906, "global_step": 193939, "epoch": 4617} {"train_loss": -7.201007843017578, "global_step": 193940, "epoch": 4617} {"train_loss": -7.2105817794799805, "global_step": 193941, "epoch": 4617} {"train_loss": -7.232255458831787, "global_step": 193942, "epoch": 4617} {"train_loss": -7.172025680541992, "global_step": 193943, "epoch": 4617} {"train_loss": -7.150254249572754, "global_step": 193944, "epoch": 4617} {"train_loss": -7.094019412994385, "global_step": 193945, "epoch": 4617} {"train_loss": -7.230740547180176, "global_step": 193946, "epoch": 4617} {"train_loss": -7.135565280914307, "global_step": 193947, "epoch": 4617} {"train_loss": -7.257112979888916, "global_step": 193948, "epoch": 4617} {"train_loss": -7.123318672180176, "global_step": 193949, "epoch": 4617} {"train_loss": -7.218227386474609, "global_step": 193950, "epoch": 4617} {"train_loss": -7.1438422203063965, "global_step": 193951, "epoch": 4617} {"train_loss": -7.238269805908203, "global_step": 193952, "epoch": 4617} {"train_loss": -7.230738162994385, "global_step": 193953, "epoch": 4617} {"train_loss": -7.252469062805176, "global_step": 193954, "epoch": 4617} {"train_loss": -7.162472338903518, "global_step": 193955, "epoch": 4617, "val_loss": 68962.4453125} {"train_loss": -7.205813407897949, "global_step": 193956, "epoch": 4618} {"train_loss": -7.1167120933532715, "global_step": 193957, "epoch": 4618} {"train_loss": -7.169367790222168, "global_step": 193958, "epoch": 4618} {"train_loss": -7.210671424865723, "global_step": 193959, "epoch": 4618} {"train_loss": -7.1174139976501465, "global_step": 193960, "epoch": 4618} {"train_loss": -7.127597808837891, "global_step": 193961, "epoch": 4618} {"train_loss": -7.169295310974121, "global_step": 193962, "epoch": 4618} {"train_loss": -7.14506721496582, "global_step": 193963, "epoch": 4618} {"train_loss": -7.076920032501221, "global_step": 193964, "epoch": 4618} {"train_loss": -7.098606109619141, "global_step": 193965, "epoch": 4618} {"train_loss": -7.085336685180664, "global_step": 193966, "epoch": 4618} {"train_loss": -7.093869209289551, "global_step": 193967, "epoch": 4618} {"train_loss": -7.184576034545898, "global_step": 193968, "epoch": 4618} {"train_loss": -7.095647811889648, "global_step": 193969, "epoch": 4618} {"train_loss": -7.031650543212891, "global_step": 193970, "epoch": 4618} {"train_loss": -6.984485626220703, "global_step": 193971, "epoch": 4618} {"train_loss": -7.173772811889648, "global_step": 193972, "epoch": 4618} {"train_loss": -7.151658058166504, "global_step": 193973, "epoch": 4618} {"train_loss": -7.125968933105469, "global_step": 193974, "epoch": 4618} {"train_loss": -7.028433799743652, "global_step": 193975, "epoch": 4618} {"train_loss": -7.0951032638549805, "global_step": 193976, "epoch": 4618} {"train_loss": -7.177742958068848, "global_step": 193977, "epoch": 4618} {"train_loss": -7.193756580352783, "global_step": 193978, "epoch": 4618} {"train_loss": -7.115835666656494, "global_step": 193979, "epoch": 4618} {"train_loss": -7.154741287231445, "global_step": 193980, "epoch": 4618} {"train_loss": -7.248591423034668, "global_step": 193981, "epoch": 4618} {"train_loss": -7.154768943786621, "global_step": 193982, "epoch": 4618} {"train_loss": -7.136740207672119, "global_step": 193983, "epoch": 4618} {"train_loss": -7.121977806091309, "global_step": 193984, "epoch": 4618} {"train_loss": -7.195182800292969, "global_step": 193985, "epoch": 4618} {"train_loss": -7.172967910766602, "global_step": 193986, "epoch": 4618} {"train_loss": -7.206821918487549, "global_step": 193987, "epoch": 4618} {"train_loss": -7.123144149780273, "global_step": 193988, "epoch": 4618} {"train_loss": -7.155734539031982, "global_step": 193989, "epoch": 4618} {"train_loss": -7.208963394165039, "global_step": 193990, "epoch": 4618} {"train_loss": -7.170551300048828, "global_step": 193991, "epoch": 4618} {"train_loss": -7.203271865844727, "global_step": 193992, "epoch": 4618} {"train_loss": -7.1582770347595215, "global_step": 193993, "epoch": 4618} {"train_loss": -7.216093063354492, "global_step": 193994, "epoch": 4618} {"train_loss": -7.055927276611328, "global_step": 193995, "epoch": 4618} {"train_loss": -7.181879043579102, "global_step": 193996, "epoch": 4618} {"train_loss": -7.142731246494112, "global_step": 193997, "epoch": 4618, "val_loss": 68980.65625} {"train_loss": -7.266745567321777, "global_step": 193998, "epoch": 4619} {"train_loss": -7.329507827758789, "global_step": 193999, "epoch": 4619} {"train_loss": -7.360013961791992, "global_step": 194000, "epoch": 4619} {"train_loss": -7.206533908843994, "global_step": 194001, "epoch": 4619} {"train_loss": -7.161627769470215, "global_step": 194002, "epoch": 4619} {"train_loss": -7.21919059753418, "global_step": 194003, "epoch": 4619} {"train_loss": -7.108760833740234, "global_step": 194004, "epoch": 4619} {"train_loss": -7.237222194671631, "global_step": 194005, "epoch": 4619} {"train_loss": -7.194356441497803, "global_step": 194006, "epoch": 4619} {"train_loss": -7.285830497741699, "global_step": 194007, "epoch": 4619} {"train_loss": -7.320303440093994, "global_step": 194008, "epoch": 4619} {"train_loss": -7.328803062438965, "global_step": 194009, "epoch": 4619} {"train_loss": -7.2946014404296875, "global_step": 194010, "epoch": 4619} {"train_loss": -7.331635475158691, "global_step": 194011, "epoch": 4619} {"train_loss": -7.220952987670898, "global_step": 194012, "epoch": 4619} {"train_loss": -7.349909782409668, "global_step": 194013, "epoch": 4619} {"train_loss": -7.197771072387695, "global_step": 194014, "epoch": 4619} {"train_loss": -7.252143383026123, "global_step": 194015, "epoch": 4619} {"train_loss": -7.302603721618652, "global_step": 194016, "epoch": 4619} {"train_loss": -7.303990364074707, "global_step": 194017, "epoch": 4619} {"train_loss": -7.034519195556641, "global_step": 194018, "epoch": 4619} {"train_loss": -7.284271717071533, "global_step": 194019, "epoch": 4619} {"train_loss": -7.369730472564697, "global_step": 194020, "epoch": 4619} {"train_loss": -7.361306190490723, "global_step": 194021, "epoch": 4619} {"train_loss": -7.333594799041748, "global_step": 194022, "epoch": 4619} {"train_loss": -7.337168216705322, "global_step": 194023, "epoch": 4619} {"train_loss": -7.230589866638184, "global_step": 194024, "epoch": 4619} {"train_loss": -7.19422721862793, "global_step": 194025, "epoch": 4619} {"train_loss": -7.134637355804443, "global_step": 194026, "epoch": 4619} {"train_loss": -7.059479236602783, "global_step": 194027, "epoch": 4619} {"train_loss": -7.050990581512451, "global_step": 194028, "epoch": 4619} {"train_loss": -7.163158416748047, "global_step": 194029, "epoch": 4619} {"train_loss": -7.257114887237549, "global_step": 194030, "epoch": 4619} {"train_loss": -7.151573657989502, "global_step": 194031, "epoch": 4619} {"train_loss": -7.18953800201416, "global_step": 194032, "epoch": 4619} {"train_loss": -7.264057636260986, "global_step": 194033, "epoch": 4619} {"train_loss": -7.17317008972168, "global_step": 194034, "epoch": 4619} {"train_loss": -7.049388885498047, "global_step": 194035, "epoch": 4619} {"train_loss": -7.176600933074951, "global_step": 194036, "epoch": 4619} {"train_loss": -7.264405250549316, "global_step": 194037, "epoch": 4619} {"train_loss": -7.189947128295898, "global_step": 194038, "epoch": 4619} {"train_loss": -7.233481702350435, "global_step": 194039, "epoch": 4619, "val_loss": 68926.5859375} {"train_loss": -7.221662521362305, "global_step": 194040, "epoch": 4620} {"train_loss": -7.131955146789551, "global_step": 194041, "epoch": 4620} {"train_loss": -7.382538795471191, "global_step": 194042, "epoch": 4620} {"train_loss": -7.293746471405029, "global_step": 194043, "epoch": 4620} {"train_loss": -7.200443744659424, "global_step": 194044, "epoch": 4620} {"train_loss": -7.267151355743408, "global_step": 194045, "epoch": 4620} {"train_loss": -7.188874244689941, "global_step": 194046, "epoch": 4620} {"train_loss": -7.143790245056152, "global_step": 194047, "epoch": 4620} {"train_loss": -7.156367301940918, "global_step": 194048, "epoch": 4620} {"train_loss": -7.200381278991699, "global_step": 194049, "epoch": 4620} {"train_loss": -7.211034774780273, "global_step": 194050, "epoch": 4620} {"train_loss": -7.12371826171875, "global_step": 194051, "epoch": 4620} {"train_loss": -7.204441070556641, "global_step": 194052, "epoch": 4620} {"train_loss": -7.314587593078613, "global_step": 194053, "epoch": 4620} {"train_loss": -7.272563934326172, "global_step": 194054, "epoch": 4620} {"train_loss": -7.088985919952393, "global_step": 194055, "epoch": 4620} {"train_loss": -7.276410102844238, "global_step": 194056, "epoch": 4620} {"train_loss": -7.158891677856445, "global_step": 194057, "epoch": 4620} {"train_loss": -7.20350456237793, "global_step": 194058, "epoch": 4620} {"train_loss": -7.24790096282959, "global_step": 194059, "epoch": 4620} {"train_loss": -7.161046981811523, "global_step": 194060, "epoch": 4620} {"train_loss": -7.156792640686035, "global_step": 194061, "epoch": 4620} {"train_loss": -7.088310241699219, "global_step": 194062, "epoch": 4620} {"train_loss": -7.1819047927856445, "global_step": 194063, "epoch": 4620} {"train_loss": -7.235754489898682, "global_step": 194064, "epoch": 4620} {"train_loss": -6.986870288848877, "global_step": 194065, "epoch": 4620} {"train_loss": -7.053181171417236, "global_step": 194066, "epoch": 4620} {"train_loss": -7.205803871154785, "global_step": 194067, "epoch": 4620} {"train_loss": -6.967988967895508, "global_step": 194068, "epoch": 4620} {"train_loss": -7.193511009216309, "global_step": 194069, "epoch": 4620} {"train_loss": -7.048681259155273, "global_step": 194070, "epoch": 4620} {"train_loss": -7.067144393920898, "global_step": 194071, "epoch": 4620} {"train_loss": -7.026192665100098, "global_step": 194072, "epoch": 4620} {"train_loss": -6.9541168212890625, "global_step": 194073, "epoch": 4620} {"train_loss": -7.223636627197266, "global_step": 194074, "epoch": 4620} {"train_loss": -7.052034854888916, "global_step": 194075, "epoch": 4620} {"train_loss": -6.984442710876465, "global_step": 194076, "epoch": 4620} {"train_loss": -7.183064937591553, "global_step": 194077, "epoch": 4620} {"train_loss": -6.9222412109375, "global_step": 194078, "epoch": 4620} {"train_loss": -7.147972583770752, "global_step": 194079, "epoch": 4620} {"train_loss": -7.133143901824951, "global_step": 194080, "epoch": 4620} {"train_loss": -7.151188861756098, "global_step": 194081, "epoch": 4620, "val_loss": 69140.5} {"train_loss": -7.202364444732666, "global_step": 194082, "epoch": 4621} {"train_loss": -7.082160949707031, "global_step": 194083, "epoch": 4621} {"train_loss": -7.085357189178467, "global_step": 194084, "epoch": 4621} {"train_loss": -7.141711235046387, "global_step": 194085, "epoch": 4621} {"train_loss": -7.114880084991455, "global_step": 194086, "epoch": 4621} {"train_loss": -7.259195327758789, "global_step": 194087, "epoch": 4621} {"train_loss": -7.256545066833496, "global_step": 194088, "epoch": 4621} {"train_loss": -7.15255069732666, "global_step": 194089, "epoch": 4621} {"train_loss": -7.30223274230957, "global_step": 194090, "epoch": 4621} {"train_loss": -7.166176795959473, "global_step": 194091, "epoch": 4621} {"train_loss": -7.216782569885254, "global_step": 194092, "epoch": 4621} {"train_loss": -7.201350212097168, "global_step": 194093, "epoch": 4621} {"train_loss": -7.243771076202393, "global_step": 194094, "epoch": 4621} {"train_loss": -7.225642681121826, "global_step": 194095, "epoch": 4621} {"train_loss": -7.197776794433594, "global_step": 194096, "epoch": 4621} {"train_loss": -7.155545711517334, "global_step": 194097, "epoch": 4621} {"train_loss": -7.191154956817627, "global_step": 194098, "epoch": 4621} {"train_loss": -7.1975789070129395, "global_step": 194099, "epoch": 4621} {"train_loss": -7.20162296295166, "global_step": 194100, "epoch": 4621} {"train_loss": -7.107651233673096, "global_step": 194101, "epoch": 4621} {"train_loss": -7.166485786437988, "global_step": 194102, "epoch": 4621} {"train_loss": -7.182699203491211, "global_step": 194103, "epoch": 4621} {"train_loss": -7.284130096435547, "global_step": 194104, "epoch": 4621} {"train_loss": -7.102701187133789, "global_step": 194105, "epoch": 4621} {"train_loss": -7.323945045471191, "global_step": 194106, "epoch": 4621} {"train_loss": -7.178930282592773, "global_step": 194107, "epoch": 4621} {"train_loss": -7.182048797607422, "global_step": 194108, "epoch": 4621} {"train_loss": -7.202786445617676, "global_step": 194109, "epoch": 4621} {"train_loss": -7.2973175048828125, "global_step": 194110, "epoch": 4621} {"train_loss": -7.172336578369141, "global_step": 194111, "epoch": 4621} {"train_loss": -7.174825668334961, "global_step": 194112, "epoch": 4621} {"train_loss": -7.091812610626221, "global_step": 194113, "epoch": 4621} {"train_loss": -7.265119552612305, "global_step": 194114, "epoch": 4621} {"train_loss": -7.182156562805176, "global_step": 194115, "epoch": 4621} {"train_loss": -7.15955924987793, "global_step": 194116, "epoch": 4621} {"train_loss": -7.077225685119629, "global_step": 194117, "epoch": 4621} {"train_loss": -7.262713432312012, "global_step": 194118, "epoch": 4621} {"train_loss": -7.084972381591797, "global_step": 194119, "epoch": 4621} {"train_loss": -7.165287971496582, "global_step": 194120, "epoch": 4621} {"train_loss": -7.201959133148193, "global_step": 194121, "epoch": 4621} {"train_loss": -7.034925937652588, "global_step": 194122, "epoch": 4621} {"train_loss": -7.181070475351243, "global_step": 194123, "epoch": 4621, "val_loss": 68942.3203125} {"train_loss": -7.057772159576416, "global_step": 194124, "epoch": 4622} {"train_loss": -7.202977180480957, "global_step": 194125, "epoch": 4622} {"train_loss": -7.183475017547607, "global_step": 194126, "epoch": 4622} {"train_loss": -7.152430534362793, "global_step": 194127, "epoch": 4622} {"train_loss": -7.230903148651123, "global_step": 194128, "epoch": 4622} {"train_loss": -7.114662170410156, "global_step": 194129, "epoch": 4622} {"train_loss": -7.27194356918335, "global_step": 194130, "epoch": 4622} {"train_loss": -7.1765828132629395, "global_step": 194131, "epoch": 4622} {"train_loss": -7.166149616241455, "global_step": 194132, "epoch": 4622} {"train_loss": -7.227532863616943, "global_step": 194133, "epoch": 4622} {"train_loss": -7.2844038009643555, "global_step": 194134, "epoch": 4622} {"train_loss": -7.155409812927246, "global_step": 194135, "epoch": 4622} {"train_loss": -7.228629112243652, "global_step": 194136, "epoch": 4622} {"train_loss": -7.130954265594482, "global_step": 194137, "epoch": 4622} {"train_loss": -7.116766929626465, "global_step": 194138, "epoch": 4622} {"train_loss": -7.144635200500488, "global_step": 194139, "epoch": 4622} {"train_loss": -7.238605499267578, "global_step": 194140, "epoch": 4622} {"train_loss": -7.1753621101379395, "global_step": 194141, "epoch": 4622} {"train_loss": -7.143167972564697, "global_step": 194142, "epoch": 4622} {"train_loss": -7.172927379608154, "global_step": 194143, "epoch": 4622} {"train_loss": -7.058420181274414, "global_step": 194144, "epoch": 4622} {"train_loss": -7.120172500610352, "global_step": 194145, "epoch": 4622} {"train_loss": -7.126198768615723, "global_step": 194146, "epoch": 4622} {"train_loss": -7.133820533752441, "global_step": 194147, "epoch": 4622} {"train_loss": -7.12762451171875, "global_step": 194148, "epoch": 4622} {"train_loss": -7.080601692199707, "global_step": 194149, "epoch": 4622} {"train_loss": -7.121882915496826, "global_step": 194150, "epoch": 4622} {"train_loss": -7.130987644195557, "global_step": 194151, "epoch": 4622} {"train_loss": -7.061861515045166, "global_step": 194152, "epoch": 4622} {"train_loss": -7.187722206115723, "global_step": 194153, "epoch": 4622} {"train_loss": -7.218472003936768, "global_step": 194154, "epoch": 4622} {"train_loss": -7.209155082702637, "global_step": 194155, "epoch": 4622} {"train_loss": -7.144218444824219, "global_step": 194156, "epoch": 4622} {"train_loss": -7.066832542419434, "global_step": 194157, "epoch": 4622} {"train_loss": -7.111102104187012, "global_step": 194158, "epoch": 4622} {"train_loss": -7.088006019592285, "global_step": 194159, "epoch": 4622} {"train_loss": -7.15355110168457, "global_step": 194160, "epoch": 4622} {"train_loss": -7.148509502410889, "global_step": 194161, "epoch": 4622} {"train_loss": -7.09747314453125, "global_step": 194162, "epoch": 4622} {"train_loss": -7.117837429046631, "global_step": 194163, "epoch": 4622} {"train_loss": -7.125988006591797, "global_step": 194164, "epoch": 4622} {"train_loss": -7.152013029370989, "global_step": 194165, "epoch": 4622, "val_loss": 69015.7265625} {"train_loss": -7.168726444244385, "global_step": 194166, "epoch": 4623} {"train_loss": -7.04788064956665, "global_step": 194167, "epoch": 4623} {"train_loss": -7.176493167877197, "global_step": 194168, "epoch": 4623} {"train_loss": -7.187707901000977, "global_step": 194169, "epoch": 4623} {"train_loss": -7.064571380615234, "global_step": 194170, "epoch": 4623} {"train_loss": -7.139200687408447, "global_step": 194171, "epoch": 4623} {"train_loss": -7.196719646453857, "global_step": 194172, "epoch": 4623} {"train_loss": -7.238884925842285, "global_step": 194173, "epoch": 4623} {"train_loss": -7.203310966491699, "global_step": 194174, "epoch": 4623} {"train_loss": -7.215561866760254, "global_step": 194175, "epoch": 4623} {"train_loss": -7.0919294357299805, "global_step": 194176, "epoch": 4623} {"train_loss": -7.29830265045166, "global_step": 194177, "epoch": 4623} {"train_loss": -7.237978935241699, "global_step": 194178, "epoch": 4623} {"train_loss": -7.135128021240234, "global_step": 194179, "epoch": 4623} {"train_loss": -7.151543617248535, "global_step": 194180, "epoch": 4623} {"train_loss": -7.229328155517578, "global_step": 194181, "epoch": 4623} {"train_loss": -7.000208854675293, "global_step": 194182, "epoch": 4623} {"train_loss": -7.191038131713867, "global_step": 194183, "epoch": 4623} {"train_loss": -7.187638282775879, "global_step": 194184, "epoch": 4623} {"train_loss": -7.202999591827393, "global_step": 194185, "epoch": 4623} {"train_loss": -7.230731010437012, "global_step": 194186, "epoch": 4623} {"train_loss": -7.183164119720459, "global_step": 194187, "epoch": 4623} {"train_loss": -7.186489105224609, "global_step": 194188, "epoch": 4623} {"train_loss": -7.312603950500488, "global_step": 194189, "epoch": 4623} {"train_loss": -7.274757385253906, "global_step": 194190, "epoch": 4623} {"train_loss": -7.236915111541748, "global_step": 194191, "epoch": 4623} {"train_loss": -7.107145309448242, "global_step": 194192, "epoch": 4623} {"train_loss": -7.120650291442871, "global_step": 194193, "epoch": 4623} {"train_loss": -7.181739807128906, "global_step": 194194, "epoch": 4623} {"train_loss": -7.186174392700195, "global_step": 194195, "epoch": 4623} {"train_loss": -7.187344074249268, "global_step": 194196, "epoch": 4623} {"train_loss": -7.076304912567139, "global_step": 194197, "epoch": 4623} {"train_loss": -7.209676265716553, "global_step": 194198, "epoch": 4623} {"train_loss": -7.097460746765137, "global_step": 194199, "epoch": 4623} {"train_loss": -7.1930084228515625, "global_step": 194200, "epoch": 4623} {"train_loss": -7.193938255310059, "global_step": 194201, "epoch": 4623} {"train_loss": -7.1885786056518555, "global_step": 194202, "epoch": 4623} {"train_loss": -7.2529497146606445, "global_step": 194203, "epoch": 4623} {"train_loss": -7.213667869567871, "global_step": 194204, "epoch": 4623} {"train_loss": -7.220505237579346, "global_step": 194205, "epoch": 4623} {"train_loss": -7.144138336181641, "global_step": 194206, "epoch": 4623} {"train_loss": -7.181833165032523, "global_step": 194207, "epoch": 4623, "val_loss": 69125.390625} {"train_loss": -7.070395469665527, "global_step": 194208, "epoch": 4624} {"train_loss": -7.226158618927002, "global_step": 194209, "epoch": 4624} {"train_loss": -7.285100936889648, "global_step": 194210, "epoch": 4624} {"train_loss": -7.066081523895264, "global_step": 194211, "epoch": 4624} {"train_loss": -7.147735118865967, "global_step": 194212, "epoch": 4624} {"train_loss": -7.262720108032227, "global_step": 194213, "epoch": 4624} {"train_loss": -7.201382160186768, "global_step": 194214, "epoch": 4624} {"train_loss": -7.250865936279297, "global_step": 194215, "epoch": 4624} {"train_loss": -7.259735584259033, "global_step": 194216, "epoch": 4624} {"train_loss": -7.276531219482422, "global_step": 194217, "epoch": 4624} {"train_loss": -7.200281143188477, "global_step": 194218, "epoch": 4624} {"train_loss": -7.142024993896484, "global_step": 194219, "epoch": 4624} {"train_loss": -7.239468574523926, "global_step": 194220, "epoch": 4624} {"train_loss": -7.253759384155273, "global_step": 194221, "epoch": 4624} {"train_loss": -7.2648115158081055, "global_step": 194222, "epoch": 4624} {"train_loss": -7.165271759033203, "global_step": 194223, "epoch": 4624} {"train_loss": -7.323451995849609, "global_step": 194224, "epoch": 4624} {"train_loss": -7.168421745300293, "global_step": 194225, "epoch": 4624} {"train_loss": -7.259398460388184, "global_step": 194226, "epoch": 4624} {"train_loss": -7.252451419830322, "global_step": 194227, "epoch": 4624} {"train_loss": -7.232677459716797, "global_step": 194228, "epoch": 4624} {"train_loss": -7.16746711730957, "global_step": 194229, "epoch": 4624} {"train_loss": -7.099164962768555, "global_step": 194230, "epoch": 4624} {"train_loss": -7.132696151733398, "global_step": 194231, "epoch": 4624} {"train_loss": -7.185011863708496, "global_step": 194232, "epoch": 4624} {"train_loss": -7.174817085266113, "global_step": 194233, "epoch": 4624} {"train_loss": -7.149834632873535, "global_step": 194234, "epoch": 4624} {"train_loss": -7.142798900604248, "global_step": 194235, "epoch": 4624} {"train_loss": -7.11637020111084, "global_step": 194236, "epoch": 4624} {"train_loss": -7.050450325012207, "global_step": 194237, "epoch": 4624} {"train_loss": -7.25247859954834, "global_step": 194238, "epoch": 4624} {"train_loss": -7.063292026519775, "global_step": 194239, "epoch": 4624} {"train_loss": -7.128657341003418, "global_step": 194240, "epoch": 4624} {"train_loss": -7.07067346572876, "global_step": 194241, "epoch": 4624} {"train_loss": -7.101362228393555, "global_step": 194242, "epoch": 4624} {"train_loss": -7.135538578033447, "global_step": 194243, "epoch": 4624} {"train_loss": -7.128885269165039, "global_step": 194244, "epoch": 4624} {"train_loss": -6.976559162139893, "global_step": 194245, "epoch": 4624} {"train_loss": -7.149292945861816, "global_step": 194246, "epoch": 4624} {"train_loss": -7.051279067993164, "global_step": 194247, "epoch": 4624} {"train_loss": -7.2397565841674805, "global_step": 194248, "epoch": 4624} {"train_loss": -7.170822926930019, "global_step": 194249, "epoch": 4624, "val_loss": 69128.4921875} {"train_loss": -7.117857456207275, "global_step": 194250, "epoch": 4625} {"train_loss": -7.033829689025879, "global_step": 194251, "epoch": 4625} {"train_loss": -7.060854434967041, "global_step": 194252, "epoch": 4625} {"train_loss": -7.161630153656006, "global_step": 194253, "epoch": 4625} {"train_loss": -6.848971366882324, "global_step": 194254, "epoch": 4625} {"train_loss": -7.112338066101074, "global_step": 194255, "epoch": 4625} {"train_loss": -7.121263027191162, "global_step": 194256, "epoch": 4625} {"train_loss": -7.075940132141113, "global_step": 194257, "epoch": 4625} {"train_loss": -7.1419267654418945, "global_step": 194258, "epoch": 4625} {"train_loss": -7.087508201599121, "global_step": 194259, "epoch": 4625} {"train_loss": -7.181551456451416, "global_step": 194260, "epoch": 4625} {"train_loss": -7.079716682434082, "global_step": 194261, "epoch": 4625} {"train_loss": -7.080024719238281, "global_step": 194262, "epoch": 4625} {"train_loss": -7.315493106842041, "global_step": 194263, "epoch": 4625} {"train_loss": -7.106649398803711, "global_step": 194264, "epoch": 4625} {"train_loss": -7.08644962310791, "global_step": 194265, "epoch": 4625} {"train_loss": -7.170370101928711, "global_step": 194266, "epoch": 4625} {"train_loss": -7.240738868713379, "global_step": 194267, "epoch": 4625} {"train_loss": -7.09970760345459, "global_step": 194268, "epoch": 4625} {"train_loss": -7.178904056549072, "global_step": 194269, "epoch": 4625} {"train_loss": -7.206703186035156, "global_step": 194270, "epoch": 4625} {"train_loss": -7.1549296379089355, "global_step": 194271, "epoch": 4625} {"train_loss": -7.191470623016357, "global_step": 194272, "epoch": 4625} {"train_loss": -7.189076900482178, "global_step": 194273, "epoch": 4625} {"train_loss": -7.165309429168701, "global_step": 194274, "epoch": 4625} {"train_loss": -7.151458740234375, "global_step": 194275, "epoch": 4625} {"train_loss": -7.20908260345459, "global_step": 194276, "epoch": 4625} {"train_loss": -7.192635536193848, "global_step": 194277, "epoch": 4625} {"train_loss": -7.267148017883301, "global_step": 194278, "epoch": 4625} {"train_loss": -7.260049819946289, "global_step": 194279, "epoch": 4625} {"train_loss": -7.192775726318359, "global_step": 194280, "epoch": 4625} {"train_loss": -7.22036075592041, "global_step": 194281, "epoch": 4625} {"train_loss": -7.306986331939697, "global_step": 194282, "epoch": 4625} {"train_loss": -7.157139778137207, "global_step": 194283, "epoch": 4625} {"train_loss": -7.250012397766113, "global_step": 194284, "epoch": 4625} {"train_loss": -7.23300838470459, "global_step": 194285, "epoch": 4625} {"train_loss": -7.1683244705200195, "global_step": 194286, "epoch": 4625} {"train_loss": -7.029654502868652, "global_step": 194287, "epoch": 4625} {"train_loss": -7.041260719299316, "global_step": 194288, "epoch": 4625} {"train_loss": -7.239089012145996, "global_step": 194289, "epoch": 4625} {"train_loss": -7.217645645141602, "global_step": 194290, "epoch": 4625} {"train_loss": -7.153883934020996, "global_step": 194291, "epoch": 4625, "val_loss": 69050.625} {"train_loss": -7.115114212036133, "global_step": 194292, "epoch": 4626} {"train_loss": -7.186519622802734, "global_step": 194293, "epoch": 4626} {"train_loss": -7.179601669311523, "global_step": 194294, "epoch": 4626} {"train_loss": -7.172079086303711, "global_step": 194295, "epoch": 4626} {"train_loss": -7.261958122253418, "global_step": 194296, "epoch": 4626} {"train_loss": -7.151095390319824, "global_step": 194297, "epoch": 4626} {"train_loss": -7.199357032775879, "global_step": 194298, "epoch": 4626} {"train_loss": -7.201005935668945, "global_step": 194299, "epoch": 4626} {"train_loss": -7.070230484008789, "global_step": 194300, "epoch": 4626} {"train_loss": -7.181540489196777, "global_step": 194301, "epoch": 4626} {"train_loss": -7.2813191413879395, "global_step": 194302, "epoch": 4626} {"train_loss": -7.214051246643066, "global_step": 194303, "epoch": 4626} {"train_loss": -7.164761066436768, "global_step": 194304, "epoch": 4626} {"train_loss": -7.2650628089904785, "global_step": 194305, "epoch": 4626} {"train_loss": -7.218279838562012, "global_step": 194306, "epoch": 4626} {"train_loss": -7.266399383544922, "global_step": 194307, "epoch": 4626} {"train_loss": -7.214636325836182, "global_step": 194308, "epoch": 4626} {"train_loss": -7.214667797088623, "global_step": 194309, "epoch": 4626} {"train_loss": -7.316479206085205, "global_step": 194310, "epoch": 4626} {"train_loss": -7.248836040496826, "global_step": 194311, "epoch": 4626} {"train_loss": -7.210866451263428, "global_step": 194312, "epoch": 4626} {"train_loss": -7.22608757019043, "global_step": 194313, "epoch": 4626} {"train_loss": -7.16295051574707, "global_step": 194314, "epoch": 4626} {"train_loss": -7.012862205505371, "global_step": 194315, "epoch": 4626} {"train_loss": -7.100000381469727, "global_step": 194316, "epoch": 4626} {"train_loss": -7.15853214263916, "global_step": 194317, "epoch": 4626} {"train_loss": -7.104369163513184, "global_step": 194318, "epoch": 4626} {"train_loss": -7.0996575355529785, "global_step": 194319, "epoch": 4626} {"train_loss": -7.193406105041504, "global_step": 194320, "epoch": 4626} {"train_loss": -7.110215187072754, "global_step": 194321, "epoch": 4626} {"train_loss": -7.171231746673584, "global_step": 194322, "epoch": 4626} {"train_loss": -7.216014862060547, "global_step": 194323, "epoch": 4626} {"train_loss": -7.125784873962402, "global_step": 194324, "epoch": 4626} {"train_loss": -7.146867752075195, "global_step": 194325, "epoch": 4626} {"train_loss": -7.164909362792969, "global_step": 194326, "epoch": 4626} {"train_loss": -7.1914591789245605, "global_step": 194327, "epoch": 4626} {"train_loss": -7.247753143310547, "global_step": 194328, "epoch": 4626} {"train_loss": -7.134543418884277, "global_step": 194329, "epoch": 4626} {"train_loss": -7.21816349029541, "global_step": 194330, "epoch": 4626} {"train_loss": -7.124483585357666, "global_step": 194331, "epoch": 4626} {"train_loss": -7.134033203125, "global_step": 194332, "epoch": 4626} {"train_loss": -7.183187325795491, "global_step": 194333, "epoch": 4626, "val_loss": 68934.375} {"train_loss": -7.21616792678833, "global_step": 194334, "epoch": 4627} {"train_loss": -7.167015075683594, "global_step": 194335, "epoch": 4627} {"train_loss": -7.215610504150391, "global_step": 194336, "epoch": 4627} {"train_loss": -7.168200969696045, "global_step": 194337, "epoch": 4627} {"train_loss": -7.187448024749756, "global_step": 194338, "epoch": 4627} {"train_loss": -7.23178768157959, "global_step": 194339, "epoch": 4627} {"train_loss": -7.361349105834961, "global_step": 194340, "epoch": 4627} {"train_loss": -7.274972438812256, "global_step": 194341, "epoch": 4627} {"train_loss": -7.259544849395752, "global_step": 194342, "epoch": 4627} {"train_loss": -7.185451507568359, "global_step": 194343, "epoch": 4627} {"train_loss": -7.266395568847656, "global_step": 194344, "epoch": 4627} {"train_loss": -7.150321960449219, "global_step": 194345, "epoch": 4627} {"train_loss": -7.301592826843262, "global_step": 194346, "epoch": 4627} {"train_loss": -7.189032554626465, "global_step": 194347, "epoch": 4627} {"train_loss": -7.229243278503418, "global_step": 194348, "epoch": 4627} {"train_loss": -7.256438255310059, "global_step": 194349, "epoch": 4627} {"train_loss": -7.252821922302246, "global_step": 194350, "epoch": 4627} {"train_loss": -7.250967979431152, "global_step": 194351, "epoch": 4627} {"train_loss": -7.266055583953857, "global_step": 194352, "epoch": 4627} {"train_loss": -7.236565589904785, "global_step": 194353, "epoch": 4627} {"train_loss": -7.222686767578125, "global_step": 194354, "epoch": 4627} {"train_loss": -7.191437721252441, "global_step": 194355, "epoch": 4627} {"train_loss": -7.2325897216796875, "global_step": 194356, "epoch": 4627} {"train_loss": -7.212186813354492, "global_step": 194357, "epoch": 4627} {"train_loss": -7.293429374694824, "global_step": 194358, "epoch": 4627} {"train_loss": -7.2147216796875, "global_step": 194359, "epoch": 4627} {"train_loss": -7.173523902893066, "global_step": 194360, "epoch": 4627} {"train_loss": -7.2416839599609375, "global_step": 194361, "epoch": 4627} {"train_loss": -7.298997402191162, "global_step": 194362, "epoch": 4627} {"train_loss": -7.216388702392578, "global_step": 194363, "epoch": 4627} {"train_loss": -7.233095169067383, "global_step": 194364, "epoch": 4627} {"train_loss": -7.32461404800415, "global_step": 194365, "epoch": 4627} {"train_loss": -7.122285842895508, "global_step": 194366, "epoch": 4627} {"train_loss": -7.24945068359375, "global_step": 194367, "epoch": 4627} {"train_loss": -7.214801788330078, "global_step": 194368, "epoch": 4627} {"train_loss": -7.28481388092041, "global_step": 194369, "epoch": 4627} {"train_loss": -7.267026901245117, "global_step": 194370, "epoch": 4627} {"train_loss": -7.274230003356934, "global_step": 194371, "epoch": 4627} {"train_loss": -7.260848522186279, "global_step": 194372, "epoch": 4627} {"train_loss": -7.234540939331055, "global_step": 194373, "epoch": 4627} {"train_loss": -7.242605209350586, "global_step": 194374, "epoch": 4627} {"train_loss": -7.238175040199643, "global_step": 194375, "epoch": 4627, "val_loss": 69074.015625} {"train_loss": -7.277500152587891, "global_step": 194376, "epoch": 4628} {"train_loss": -7.357693195343018, "global_step": 194377, "epoch": 4628} {"train_loss": -7.323919773101807, "global_step": 194378, "epoch": 4628} {"train_loss": -7.2587409019470215, "global_step": 194379, "epoch": 4628} {"train_loss": -7.235652923583984, "global_step": 194380, "epoch": 4628} {"train_loss": -7.229454040527344, "global_step": 194381, "epoch": 4628} {"train_loss": -7.234841823577881, "global_step": 194382, "epoch": 4628} {"train_loss": -7.399797439575195, "global_step": 194383, "epoch": 4628} {"train_loss": -7.151669502258301, "global_step": 194384, "epoch": 4628} {"train_loss": -7.3296403884887695, "global_step": 194385, "epoch": 4628} {"train_loss": -7.250094413757324, "global_step": 194386, "epoch": 4628} {"train_loss": -7.36519193649292, "global_step": 194387, "epoch": 4628} {"train_loss": -7.332175254821777, "global_step": 194388, "epoch": 4628} {"train_loss": -7.309564590454102, "global_step": 194389, "epoch": 4628} {"train_loss": -7.253034591674805, "global_step": 194390, "epoch": 4628} {"train_loss": -7.303299427032471, "global_step": 194391, "epoch": 4628} {"train_loss": -7.227089881896973, "global_step": 194392, "epoch": 4628} {"train_loss": -7.231194019317627, "global_step": 194393, "epoch": 4628} {"train_loss": -7.244015216827393, "global_step": 194394, "epoch": 4628} {"train_loss": -7.1796464920043945, "global_step": 194395, "epoch": 4628} {"train_loss": -7.177248954772949, "global_step": 194396, "epoch": 4628} {"train_loss": -7.151706695556641, "global_step": 194397, "epoch": 4628} {"train_loss": -7.1349263191223145, "global_step": 194398, "epoch": 4628} {"train_loss": -7.140962600708008, "global_step": 194399, "epoch": 4628} {"train_loss": -7.129809379577637, "global_step": 194400, "epoch": 4628} {"train_loss": -7.185905456542969, "global_step": 194401, "epoch": 4628} {"train_loss": -7.131402015686035, "global_step": 194402, "epoch": 4628} {"train_loss": -7.112988471984863, "global_step": 194403, "epoch": 4628} {"train_loss": -7.191076755523682, "global_step": 194404, "epoch": 4628} {"train_loss": -7.023962497711182, "global_step": 194405, "epoch": 4628} {"train_loss": -7.143413543701172, "global_step": 194406, "epoch": 4628} {"train_loss": -7.117711067199707, "global_step": 194407, "epoch": 4628} {"train_loss": -7.0690531730651855, "global_step": 194408, "epoch": 4628} {"train_loss": -7.122479438781738, "global_step": 194409, "epoch": 4628} {"train_loss": -7.179024696350098, "global_step": 194410, "epoch": 4628} {"train_loss": -7.162232398986816, "global_step": 194411, "epoch": 4628} {"train_loss": -7.143877983093262, "global_step": 194412, "epoch": 4628} {"train_loss": -7.099640846252441, "global_step": 194413, "epoch": 4628} {"train_loss": -7.0933613777160645, "global_step": 194414, "epoch": 4628} {"train_loss": -7.143733024597168, "global_step": 194415, "epoch": 4628} {"train_loss": -7.124770641326904, "global_step": 194416, "epoch": 4628} {"train_loss": -7.200252918970017, "global_step": 194417, "epoch": 4628, "val_loss": 68815.8984375} {"train_loss": -7.268716812133789, "global_step": 194418, "epoch": 4629} {"train_loss": -7.215628623962402, "global_step": 194419, "epoch": 4629} {"train_loss": -7.236700057983398, "global_step": 194420, "epoch": 4629} {"train_loss": -7.154191017150879, "global_step": 194421, "epoch": 4629} {"train_loss": -7.139742374420166, "global_step": 194422, "epoch": 4629} {"train_loss": -7.131180763244629, "global_step": 194423, "epoch": 4629} {"train_loss": -7.157334804534912, "global_step": 194424, "epoch": 4629} {"train_loss": -7.254257678985596, "global_step": 194425, "epoch": 4629} {"train_loss": -7.198520660400391, "global_step": 194426, "epoch": 4629} {"train_loss": -7.176262855529785, "global_step": 194427, "epoch": 4629} {"train_loss": -7.104557037353516, "global_step": 194428, "epoch": 4629} {"train_loss": -7.029626846313477, "global_step": 194429, "epoch": 4629} {"train_loss": -7.085816383361816, "global_step": 194430, "epoch": 4629} {"train_loss": -7.083105087280273, "global_step": 194431, "epoch": 4629} {"train_loss": -7.133264541625977, "global_step": 194432, "epoch": 4629} {"train_loss": -7.263175964355469, "global_step": 194433, "epoch": 4629} {"train_loss": -7.220159530639648, "global_step": 194434, "epoch": 4629} {"train_loss": -7.193767547607422, "global_step": 194435, "epoch": 4629} {"train_loss": -7.244750022888184, "global_step": 194436, "epoch": 4629} {"train_loss": -7.171323776245117, "global_step": 194437, "epoch": 4629} {"train_loss": -7.179895401000977, "global_step": 194438, "epoch": 4629} {"train_loss": -7.161496639251709, "global_step": 194439, "epoch": 4629} {"train_loss": -7.23597526550293, "global_step": 194440, "epoch": 4629} {"train_loss": -7.176574230194092, "global_step": 194441, "epoch": 4629} {"train_loss": -7.270409107208252, "global_step": 194442, "epoch": 4629} {"train_loss": -7.161195278167725, "global_step": 194443, "epoch": 4629} {"train_loss": -7.239781379699707, "global_step": 194444, "epoch": 4629} {"train_loss": -7.149700164794922, "global_step": 194445, "epoch": 4629} {"train_loss": -7.196612358093262, "global_step": 194446, "epoch": 4629} {"train_loss": -7.211560249328613, "global_step": 194447, "epoch": 4629} {"train_loss": -7.133435249328613, "global_step": 194448, "epoch": 4629} {"train_loss": -7.2223100662231445, "global_step": 194449, "epoch": 4629} {"train_loss": -7.109762191772461, "global_step": 194450, "epoch": 4629} {"train_loss": -7.251517295837402, "global_step": 194451, "epoch": 4629} {"train_loss": -7.244745254516602, "global_step": 194452, "epoch": 4629} {"train_loss": -7.222643852233887, "global_step": 194453, "epoch": 4629} {"train_loss": -7.167916297912598, "global_step": 194454, "epoch": 4629} {"train_loss": -7.164816379547119, "global_step": 194455, "epoch": 4629} {"train_loss": -7.046317100524902, "global_step": 194456, "epoch": 4629} {"train_loss": -7.12735652923584, "global_step": 194457, "epoch": 4629} {"train_loss": -7.243920803070068, "global_step": 194458, "epoch": 4629} {"train_loss": -7.181413957050869, "global_step": 194459, "epoch": 4629, "val_loss": 68893.1328125} {"train_loss": -7.208477020263672, "global_step": 194460, "epoch": 4630} {"train_loss": -7.189682483673096, "global_step": 194461, "epoch": 4630} {"train_loss": -7.198268890380859, "global_step": 194462, "epoch": 4630} {"train_loss": -7.178504467010498, "global_step": 194463, "epoch": 4630} {"train_loss": -7.161898612976074, "global_step": 194464, "epoch": 4630} {"train_loss": -7.011673927307129, "global_step": 194465, "epoch": 4630} {"train_loss": -7.178035259246826, "global_step": 194466, "epoch": 4630} {"train_loss": -7.228527069091797, "global_step": 194467, "epoch": 4630} {"train_loss": -7.1166486740112305, "global_step": 194468, "epoch": 4630} {"train_loss": -7.034506320953369, "global_step": 194469, "epoch": 4630} {"train_loss": -7.114777088165283, "global_step": 194470, "epoch": 4630} {"train_loss": -7.223528861999512, "global_step": 194471, "epoch": 4630} {"train_loss": -7.131402015686035, "global_step": 194472, "epoch": 4630} {"train_loss": -7.186430931091309, "global_step": 194473, "epoch": 4630} {"train_loss": -7.198500633239746, "global_step": 194474, "epoch": 4630} {"train_loss": -7.153441429138184, "global_step": 194475, "epoch": 4630} {"train_loss": -7.174754619598389, "global_step": 194476, "epoch": 4630} {"train_loss": -7.141788482666016, "global_step": 194477, "epoch": 4630} {"train_loss": -7.23153018951416, "global_step": 194478, "epoch": 4630} {"train_loss": -7.172206878662109, "global_step": 194479, "epoch": 4630} {"train_loss": -7.062506675720215, "global_step": 194480, "epoch": 4630} {"train_loss": -7.163018226623535, "global_step": 194481, "epoch": 4630} {"train_loss": -7.187396049499512, "global_step": 194482, "epoch": 4630} {"train_loss": -7.201446056365967, "global_step": 194483, "epoch": 4630} {"train_loss": -7.264299392700195, "global_step": 194484, "epoch": 4630} {"train_loss": -7.2772417068481445, "global_step": 194485, "epoch": 4630} {"train_loss": -7.2098517417907715, "global_step": 194486, "epoch": 4630} {"train_loss": -7.277803897857666, "global_step": 194487, "epoch": 4630} {"train_loss": -7.105818748474121, "global_step": 194488, "epoch": 4630} {"train_loss": -7.1639323234558105, "global_step": 194489, "epoch": 4630} {"train_loss": -7.1953630447387695, "global_step": 194490, "epoch": 4630} {"train_loss": -7.168745994567871, "global_step": 194491, "epoch": 4630} {"train_loss": -7.136427879333496, "global_step": 194492, "epoch": 4630} {"train_loss": -7.252352237701416, "global_step": 194493, "epoch": 4630} {"train_loss": -7.227097511291504, "global_step": 194494, "epoch": 4630} {"train_loss": -7.268502235412598, "global_step": 194495, "epoch": 4630} {"train_loss": -7.218472480773926, "global_step": 194496, "epoch": 4630} {"train_loss": -7.266607761383057, "global_step": 194497, "epoch": 4630} {"train_loss": -7.282578468322754, "global_step": 194498, "epoch": 4630} {"train_loss": -7.165787696838379, "global_step": 194499, "epoch": 4630} {"train_loss": -7.2702484130859375, "global_step": 194500, "epoch": 4630} {"train_loss": -7.186561198461623, "global_step": 194501, "epoch": 4630, "val_loss": 69017.609375} {"train_loss": -7.294131278991699, "global_step": 194502, "epoch": 4631} {"train_loss": -7.251609802246094, "global_step": 194503, "epoch": 4631} {"train_loss": -7.262930870056152, "global_step": 194504, "epoch": 4631} {"train_loss": -7.067001819610596, "global_step": 194505, "epoch": 4631} {"train_loss": -7.253480911254883, "global_step": 194506, "epoch": 4631} {"train_loss": -7.19478702545166, "global_step": 194507, "epoch": 4631} {"train_loss": -7.1110310554504395, "global_step": 194508, "epoch": 4631} {"train_loss": -7.214652061462402, "global_step": 194509, "epoch": 4631} {"train_loss": -7.348866939544678, "global_step": 194510, "epoch": 4631} {"train_loss": -7.184441089630127, "global_step": 194511, "epoch": 4631} {"train_loss": -7.231545448303223, "global_step": 194512, "epoch": 4631} {"train_loss": -7.202563762664795, "global_step": 194513, "epoch": 4631} {"train_loss": -7.216709613800049, "global_step": 194514, "epoch": 4631} {"train_loss": -7.195626258850098, "global_step": 194515, "epoch": 4631} {"train_loss": -7.191012382507324, "global_step": 194516, "epoch": 4631} {"train_loss": -7.188920974731445, "global_step": 194517, "epoch": 4631} {"train_loss": -7.162281036376953, "global_step": 194518, "epoch": 4631} {"train_loss": -7.241903305053711, "global_step": 194519, "epoch": 4631} {"train_loss": -7.174373626708984, "global_step": 194520, "epoch": 4631} {"train_loss": -7.242532730102539, "global_step": 194521, "epoch": 4631} {"train_loss": -7.3094048500061035, "global_step": 194522, "epoch": 4631} {"train_loss": -7.184788703918457, "global_step": 194523, "epoch": 4631} {"train_loss": -7.249629497528076, "global_step": 194524, "epoch": 4631} {"train_loss": -7.180166244506836, "global_step": 194525, "epoch": 4631} {"train_loss": -7.0655975341796875, "global_step": 194526, "epoch": 4631} {"train_loss": -7.165290832519531, "global_step": 194527, "epoch": 4631} {"train_loss": -7.132666110992432, "global_step": 194528, "epoch": 4631} {"train_loss": -7.067049980163574, "global_step": 194529, "epoch": 4631} {"train_loss": -7.244362831115723, "global_step": 194530, "epoch": 4631} {"train_loss": -7.2053446769714355, "global_step": 194531, "epoch": 4631} {"train_loss": -7.157642841339111, "global_step": 194532, "epoch": 4631} {"train_loss": -7.139833927154541, "global_step": 194533, "epoch": 4631} {"train_loss": -7.209329605102539, "global_step": 194534, "epoch": 4631} {"train_loss": -7.187892913818359, "global_step": 194535, "epoch": 4631} {"train_loss": -7.2260942459106445, "global_step": 194536, "epoch": 4631} {"train_loss": -7.1925249099731445, "global_step": 194537, "epoch": 4631} {"train_loss": -7.152155876159668, "global_step": 194538, "epoch": 4631} {"train_loss": -7.252796173095703, "global_step": 194539, "epoch": 4631} {"train_loss": -7.2742133140563965, "global_step": 194540, "epoch": 4631} {"train_loss": -7.24305534362793, "global_step": 194541, "epoch": 4631} {"train_loss": -7.129464149475098, "global_step": 194542, "epoch": 4631} {"train_loss": -7.20125811440604, "global_step": 194543, "epoch": 4631, "val_loss": 69016.2265625} {"train_loss": -7.230722427368164, "global_step": 194544, "epoch": 4632} {"train_loss": -7.185042858123779, "global_step": 194545, "epoch": 4632} {"train_loss": -7.227687835693359, "global_step": 194546, "epoch": 4632} {"train_loss": -7.15051794052124, "global_step": 194547, "epoch": 4632} {"train_loss": -7.117739677429199, "global_step": 194548, "epoch": 4632} {"train_loss": -7.247206211090088, "global_step": 194549, "epoch": 4632} {"train_loss": -7.193096160888672, "global_step": 194550, "epoch": 4632} {"train_loss": -7.148377418518066, "global_step": 194551, "epoch": 4632} {"train_loss": -7.157718181610107, "global_step": 194552, "epoch": 4632} {"train_loss": -7.178958415985107, "global_step": 194553, "epoch": 4632} {"train_loss": -7.201550483703613, "global_step": 194554, "epoch": 4632} {"train_loss": -7.205674171447754, "global_step": 194555, "epoch": 4632} {"train_loss": -7.183575630187988, "global_step": 194556, "epoch": 4632} {"train_loss": -7.145265102386475, "global_step": 194557, "epoch": 4632} {"train_loss": -7.094890594482422, "global_step": 194558, "epoch": 4632} {"train_loss": -7.174593925476074, "global_step": 194559, "epoch": 4632} {"train_loss": -7.03969669342041, "global_step": 194560, "epoch": 4632} {"train_loss": -6.991369724273682, "global_step": 194561, "epoch": 4632} {"train_loss": -7.055889129638672, "global_step": 194562, "epoch": 4632} {"train_loss": -7.134084224700928, "global_step": 194563, "epoch": 4632} {"train_loss": -7.080218315124512, "global_step": 194564, "epoch": 4632} {"train_loss": -7.09539794921875, "global_step": 194565, "epoch": 4632} {"train_loss": -7.127519130706787, "global_step": 194566, "epoch": 4632} {"train_loss": -7.182430267333984, "global_step": 194567, "epoch": 4632} {"train_loss": -7.142852783203125, "global_step": 194568, "epoch": 4632} {"train_loss": -7.116700649261475, "global_step": 194569, "epoch": 4632} {"train_loss": -7.199911594390869, "global_step": 194570, "epoch": 4632} {"train_loss": -7.218685150146484, "global_step": 194571, "epoch": 4632} {"train_loss": -7.194557189941406, "global_step": 194572, "epoch": 4632} {"train_loss": -7.201904773712158, "global_step": 194573, "epoch": 4632} {"train_loss": -7.093815803527832, "global_step": 194574, "epoch": 4632} {"train_loss": -7.126452922821045, "global_step": 194575, "epoch": 4632} {"train_loss": -7.166650772094727, "global_step": 194576, "epoch": 4632} {"train_loss": -7.226780891418457, "global_step": 194577, "epoch": 4632} {"train_loss": -7.2029266357421875, "global_step": 194578, "epoch": 4632} {"train_loss": -7.200236797332764, "global_step": 194579, "epoch": 4632} {"train_loss": -7.187479496002197, "global_step": 194580, "epoch": 4632} {"train_loss": -7.111137866973877, "global_step": 194581, "epoch": 4632} {"train_loss": -7.251470565795898, "global_step": 194582, "epoch": 4632} {"train_loss": -7.196078300476074, "global_step": 194583, "epoch": 4632} {"train_loss": -7.221356391906738, "global_step": 194584, "epoch": 4632} {"train_loss": -7.162142322176979, "global_step": 194585, "epoch": 4632, "val_loss": 69170.9609375} {"train_loss": -7.199901103973389, "global_step": 194586, "epoch": 4633} {"train_loss": -7.208019256591797, "global_step": 194587, "epoch": 4633} {"train_loss": -7.196028232574463, "global_step": 194588, "epoch": 4633} {"train_loss": -7.178279399871826, "global_step": 194589, "epoch": 4633} {"train_loss": -7.150855541229248, "global_step": 194590, "epoch": 4633} {"train_loss": -7.207955360412598, "global_step": 194591, "epoch": 4633} {"train_loss": -7.254817962646484, "global_step": 194592, "epoch": 4633} {"train_loss": -7.279689788818359, "global_step": 194593, "epoch": 4633} {"train_loss": -7.21430778503418, "global_step": 194594, "epoch": 4633} {"train_loss": -7.129802703857422, "global_step": 194595, "epoch": 4633} {"train_loss": -7.158535480499268, "global_step": 194596, "epoch": 4633} {"train_loss": -7.184849739074707, "global_step": 194597, "epoch": 4633} {"train_loss": -7.206036567687988, "global_step": 194598, "epoch": 4633} {"train_loss": -7.2284321784973145, "global_step": 194599, "epoch": 4633} {"train_loss": -7.1471123695373535, "global_step": 194600, "epoch": 4633} {"train_loss": -6.98184061050415, "global_step": 194601, "epoch": 4633} {"train_loss": -7.196905612945557, "global_step": 194602, "epoch": 4633} {"train_loss": -7.035721302032471, "global_step": 194603, "epoch": 4633} {"train_loss": -7.095002174377441, "global_step": 194604, "epoch": 4633} {"train_loss": -7.022795677185059, "global_step": 194605, "epoch": 4633} {"train_loss": -7.097465991973877, "global_step": 194606, "epoch": 4633} {"train_loss": -7.183431148529053, "global_step": 194607, "epoch": 4633} {"train_loss": -7.181304931640625, "global_step": 194608, "epoch": 4633} {"train_loss": -7.146585464477539, "global_step": 194609, "epoch": 4633} {"train_loss": -7.192430019378662, "global_step": 194610, "epoch": 4633} {"train_loss": -7.125669956207275, "global_step": 194611, "epoch": 4633} {"train_loss": -6.98139762878418, "global_step": 194612, "epoch": 4633} {"train_loss": -7.227017402648926, "global_step": 194613, "epoch": 4633} {"train_loss": -7.202096939086914, "global_step": 194614, "epoch": 4633} {"train_loss": -7.030473709106445, "global_step": 194615, "epoch": 4633} {"train_loss": -7.162431240081787, "global_step": 194616, "epoch": 4633} {"train_loss": -7.219452857971191, "global_step": 194617, "epoch": 4633} {"train_loss": -7.19022274017334, "global_step": 194618, "epoch": 4633} {"train_loss": -7.076127052307129, "global_step": 194619, "epoch": 4633} {"train_loss": -7.163114070892334, "global_step": 194620, "epoch": 4633} {"train_loss": -7.045375347137451, "global_step": 194621, "epoch": 4633} {"train_loss": -7.016955852508545, "global_step": 194622, "epoch": 4633} {"train_loss": -7.072030067443848, "global_step": 194623, "epoch": 4633} {"train_loss": -7.141263961791992, "global_step": 194624, "epoch": 4633} {"train_loss": -7.030156135559082, "global_step": 194625, "epoch": 4633} {"train_loss": -7.067399024963379, "global_step": 194626, "epoch": 4633} {"train_loss": -7.1382608867826915, "global_step": 194627, "epoch": 4633, "val_loss": 69242.0546875} {"train_loss": -7.000162601470947, "global_step": 194628, "epoch": 4634} {"train_loss": -7.009064674377441, "global_step": 194629, "epoch": 4634} {"train_loss": -7.0180253982543945, "global_step": 194630, "epoch": 4634} {"train_loss": -6.9012651443481445, "global_step": 194631, "epoch": 4634} {"train_loss": -6.963233470916748, "global_step": 194632, "epoch": 4634} {"train_loss": -6.915533065795898, "global_step": 194633, "epoch": 4634} {"train_loss": -7.010958671569824, "global_step": 194634, "epoch": 4634} {"train_loss": -6.9886393547058105, "global_step": 194635, "epoch": 4634} {"train_loss": -7.007396697998047, "global_step": 194636, "epoch": 4634} {"train_loss": -6.98838996887207, "global_step": 194637, "epoch": 4634} {"train_loss": -6.928954124450684, "global_step": 194638, "epoch": 4634} {"train_loss": -6.9496026039123535, "global_step": 194639, "epoch": 4634} {"train_loss": -6.9560346603393555, "global_step": 194640, "epoch": 4634} {"train_loss": -6.954978942871094, "global_step": 194641, "epoch": 4634} {"train_loss": -7.033273696899414, "global_step": 194642, "epoch": 4634} {"train_loss": -7.040806293487549, "global_step": 194643, "epoch": 4634} {"train_loss": -7.111299514770508, "global_step": 194644, "epoch": 4634} {"train_loss": -7.02984619140625, "global_step": 194645, "epoch": 4634} {"train_loss": -7.083853244781494, "global_step": 194646, "epoch": 4634} {"train_loss": -7.010346412658691, "global_step": 194647, "epoch": 4634} {"train_loss": -6.971790790557861, "global_step": 194648, "epoch": 4634} {"train_loss": -7.028602600097656, "global_step": 194649, "epoch": 4634} {"train_loss": -7.002348899841309, "global_step": 194650, "epoch": 4634} {"train_loss": -7.088522434234619, "global_step": 194651, "epoch": 4634} {"train_loss": -7.1013689041137695, "global_step": 194652, "epoch": 4634} {"train_loss": -7.066449165344238, "global_step": 194653, "epoch": 4634} {"train_loss": -7.214812278747559, "global_step": 194654, "epoch": 4634} {"train_loss": -7.067919731140137, "global_step": 194655, "epoch": 4634} {"train_loss": -7.1067657470703125, "global_step": 194656, "epoch": 4634} {"train_loss": -7.118298530578613, "global_step": 194657, "epoch": 4634} {"train_loss": -7.07068395614624, "global_step": 194658, "epoch": 4634} {"train_loss": -7.16709041595459, "global_step": 194659, "epoch": 4634} {"train_loss": -7.227102756500244, "global_step": 194660, "epoch": 4634} {"train_loss": -7.095163822174072, "global_step": 194661, "epoch": 4634} {"train_loss": -7.167695045471191, "global_step": 194662, "epoch": 4634} {"train_loss": -7.224599361419678, "global_step": 194663, "epoch": 4634} {"train_loss": -7.206259250640869, "global_step": 194664, "epoch": 4634} {"train_loss": -7.260784149169922, "global_step": 194665, "epoch": 4634} {"train_loss": -7.2242655754089355, "global_step": 194666, "epoch": 4634} {"train_loss": -7.2274088859558105, "global_step": 194667, "epoch": 4634} {"train_loss": -7.162989616394043, "global_step": 194668, "epoch": 4634} {"train_loss": -7.068305072330293, "global_step": 194669, "epoch": 4634, "val_loss": 69085.671875} {"train_loss": -7.23133659362793, "global_step": 194670, "epoch": 4635} {"train_loss": -7.294175148010254, "global_step": 194671, "epoch": 4635} {"train_loss": -7.147622108459473, "global_step": 194672, "epoch": 4635} {"train_loss": -7.213881492614746, "global_step": 194673, "epoch": 4635} {"train_loss": -7.099046230316162, "global_step": 194674, "epoch": 4635} {"train_loss": -7.096467018127441, "global_step": 194675, "epoch": 4635} {"train_loss": -7.284858703613281, "global_step": 194676, "epoch": 4635} {"train_loss": -7.196802139282227, "global_step": 194677, "epoch": 4635} {"train_loss": -7.1704254150390625, "global_step": 194678, "epoch": 4635} {"train_loss": -7.322042942047119, "global_step": 194679, "epoch": 4635} {"train_loss": -7.131378173828125, "global_step": 194680, "epoch": 4635} {"train_loss": -7.225610256195068, "global_step": 194681, "epoch": 4635} {"train_loss": -7.165399551391602, "global_step": 194682, "epoch": 4635} {"train_loss": -7.339934349060059, "global_step": 194683, "epoch": 4635} {"train_loss": -7.10243558883667, "global_step": 194684, "epoch": 4635} {"train_loss": -7.175893783569336, "global_step": 194685, "epoch": 4635} {"train_loss": -7.210862159729004, "global_step": 194686, "epoch": 4635} {"train_loss": -7.168416500091553, "global_step": 194687, "epoch": 4635} {"train_loss": -7.076556205749512, "global_step": 194688, "epoch": 4635} {"train_loss": -7.219718933105469, "global_step": 194689, "epoch": 4635} {"train_loss": -7.152829170227051, "global_step": 194690, "epoch": 4635} {"train_loss": -7.200433731079102, "global_step": 194691, "epoch": 4635} {"train_loss": -7.1516242027282715, "global_step": 194692, "epoch": 4635} {"train_loss": -7.211337089538574, "global_step": 194693, "epoch": 4635} {"train_loss": -7.092695713043213, "global_step": 194694, "epoch": 4635} {"train_loss": -7.144362449645996, "global_step": 194695, "epoch": 4635} {"train_loss": -7.126178741455078, "global_step": 194696, "epoch": 4635} {"train_loss": -7.185600280761719, "global_step": 194697, "epoch": 4635} {"train_loss": -7.1936187744140625, "global_step": 194698, "epoch": 4635} {"train_loss": -7.139425277709961, "global_step": 194699, "epoch": 4635} {"train_loss": -7.241083145141602, "global_step": 194700, "epoch": 4635} {"train_loss": -7.225143909454346, "global_step": 194701, "epoch": 4635} {"train_loss": -7.235602855682373, "global_step": 194702, "epoch": 4635} {"train_loss": -7.218883037567139, "global_step": 194703, "epoch": 4635} {"train_loss": -7.10465145111084, "global_step": 194704, "epoch": 4635} {"train_loss": -7.130518436431885, "global_step": 194705, "epoch": 4635} {"train_loss": -7.247893810272217, "global_step": 194706, "epoch": 4635} {"train_loss": -7.277495861053467, "global_step": 194707, "epoch": 4635} {"train_loss": -7.219213485717773, "global_step": 194708, "epoch": 4635} {"train_loss": -7.18682861328125, "global_step": 194709, "epoch": 4635} {"train_loss": -7.244588851928711, "global_step": 194710, "epoch": 4635} {"train_loss": -7.189031680425008, "global_step": 194711, "epoch": 4635, "val_loss": 68944.6796875} {"train_loss": -7.329689025878906, "global_step": 194712, "epoch": 4636} {"train_loss": -7.182809352874756, "global_step": 194713, "epoch": 4636} {"train_loss": -7.28527307510376, "global_step": 194714, "epoch": 4636} {"train_loss": -7.232350826263428, "global_step": 194715, "epoch": 4636} {"train_loss": -7.2606306076049805, "global_step": 194716, "epoch": 4636} {"train_loss": -7.071276664733887, "global_step": 194717, "epoch": 4636} {"train_loss": -7.234370231628418, "global_step": 194718, "epoch": 4636} {"train_loss": -7.217090606689453, "global_step": 194719, "epoch": 4636} {"train_loss": -7.245384216308594, "global_step": 194720, "epoch": 4636} {"train_loss": -7.2603759765625, "global_step": 194721, "epoch": 4636} {"train_loss": -7.37637186050415, "global_step": 194722, "epoch": 4636} {"train_loss": -7.17842960357666, "global_step": 194723, "epoch": 4636} {"train_loss": -7.138538360595703, "global_step": 194724, "epoch": 4636} {"train_loss": -7.110535621643066, "global_step": 194725, "epoch": 4636} {"train_loss": -7.102884292602539, "global_step": 194726, "epoch": 4636} {"train_loss": -7.144435882568359, "global_step": 194727, "epoch": 4636} {"train_loss": -7.23098087310791, "global_step": 194728, "epoch": 4636} {"train_loss": -7.02063512802124, "global_step": 194729, "epoch": 4636} {"train_loss": -7.183981418609619, "global_step": 194730, "epoch": 4636} {"train_loss": -7.14620304107666, "global_step": 194731, "epoch": 4636} {"train_loss": -7.144519805908203, "global_step": 194732, "epoch": 4636} {"train_loss": -7.166674613952637, "global_step": 194733, "epoch": 4636} {"train_loss": -7.055600166320801, "global_step": 194734, "epoch": 4636} {"train_loss": -7.121419906616211, "global_step": 194735, "epoch": 4636} {"train_loss": -7.036122798919678, "global_step": 194736, "epoch": 4636} {"train_loss": -7.111598968505859, "global_step": 194737, "epoch": 4636} {"train_loss": -7.163945198059082, "global_step": 194738, "epoch": 4636} {"train_loss": -7.128995418548584, "global_step": 194739, "epoch": 4636} {"train_loss": -7.1412858963012695, "global_step": 194740, "epoch": 4636} {"train_loss": -7.136715888977051, "global_step": 194741, "epoch": 4636} {"train_loss": -6.993390083312988, "global_step": 194742, "epoch": 4636} {"train_loss": -7.108821868896484, "global_step": 194743, "epoch": 4636} {"train_loss": -7.0877838134765625, "global_step": 194744, "epoch": 4636} {"train_loss": -6.900403022766113, "global_step": 194745, "epoch": 4636} {"train_loss": -7.114297866821289, "global_step": 194746, "epoch": 4636} {"train_loss": -6.972708702087402, "global_step": 194747, "epoch": 4636} {"train_loss": -7.162692546844482, "global_step": 194748, "epoch": 4636} {"train_loss": -6.986405372619629, "global_step": 194749, "epoch": 4636} {"train_loss": -6.986322402954102, "global_step": 194750, "epoch": 4636} {"train_loss": -7.135283470153809, "global_step": 194751, "epoch": 4636} {"train_loss": -7.049356460571289, "global_step": 194752, "epoch": 4636} {"train_loss": -7.136836290359497, "global_step": 194753, "epoch": 4636, "val_loss": 69055.0078125} {"train_loss": -7.049725532531738, "global_step": 194754, "epoch": 4637} {"train_loss": -7.030764102935791, "global_step": 194755, "epoch": 4637} {"train_loss": -7.076714992523193, "global_step": 194756, "epoch": 4637} {"train_loss": -7.12664794921875, "global_step": 194757, "epoch": 4637} {"train_loss": -7.136434555053711, "global_step": 194758, "epoch": 4637} {"train_loss": -7.206533432006836, "global_step": 194759, "epoch": 4637} {"train_loss": -7.027518272399902, "global_step": 194760, "epoch": 4637} {"train_loss": -7.186117172241211, "global_step": 194761, "epoch": 4637} {"train_loss": -7.091053009033203, "global_step": 194762, "epoch": 4637} {"train_loss": -7.261119842529297, "global_step": 194763, "epoch": 4637} {"train_loss": -7.179628372192383, "global_step": 194764, "epoch": 4637} {"train_loss": -7.192216873168945, "global_step": 194765, "epoch": 4637} {"train_loss": -7.1606035232543945, "global_step": 194766, "epoch": 4637} {"train_loss": -7.13245964050293, "global_step": 194767, "epoch": 4637} {"train_loss": -7.204561710357666, "global_step": 194768, "epoch": 4637} {"train_loss": -7.19111442565918, "global_step": 194769, "epoch": 4637} {"train_loss": -7.055509567260742, "global_step": 194770, "epoch": 4637} {"train_loss": -7.124270439147949, "global_step": 194771, "epoch": 4637} {"train_loss": -7.213529586791992, "global_step": 194772, "epoch": 4637} {"train_loss": -7.106984615325928, "global_step": 194773, "epoch": 4637} {"train_loss": -7.220236778259277, "global_step": 194774, "epoch": 4637} {"train_loss": -7.129708290100098, "global_step": 194775, "epoch": 4637} {"train_loss": -7.2034912109375, "global_step": 194776, "epoch": 4637} {"train_loss": -7.265620231628418, "global_step": 194777, "epoch": 4637} {"train_loss": -7.260310173034668, "global_step": 194778, "epoch": 4637} {"train_loss": -7.317450523376465, "global_step": 194779, "epoch": 4637} {"train_loss": -7.21574592590332, "global_step": 194780, "epoch": 4637} {"train_loss": -7.286572456359863, "global_step": 194781, "epoch": 4637} {"train_loss": -7.157661437988281, "global_step": 194782, "epoch": 4637} {"train_loss": -7.136412620544434, "global_step": 194783, "epoch": 4637} {"train_loss": -7.170730113983154, "global_step": 194784, "epoch": 4637} {"train_loss": -7.2074785232543945, "global_step": 194785, "epoch": 4637} {"train_loss": -7.288283348083496, "global_step": 194786, "epoch": 4637} {"train_loss": -7.230010986328125, "global_step": 194787, "epoch": 4637} {"train_loss": -7.170169353485107, "global_step": 194788, "epoch": 4637} {"train_loss": -7.108375072479248, "global_step": 194789, "epoch": 4637} {"train_loss": -7.268916130065918, "global_step": 194790, "epoch": 4637} {"train_loss": -7.298249244689941, "global_step": 194791, "epoch": 4637} {"train_loss": -7.274951457977295, "global_step": 194792, "epoch": 4637} {"train_loss": -7.242369651794434, "global_step": 194793, "epoch": 4637} {"train_loss": -7.2166266441345215, "global_step": 194794, "epoch": 4637} {"train_loss": -7.183244784673055, "global_step": 194795, "epoch": 4637, "val_loss": 68967.578125} {"train_loss": -7.176397800445557, "global_step": 194796, "epoch": 4638} {"train_loss": -7.235637664794922, "global_step": 194797, "epoch": 4638} {"train_loss": -7.300132751464844, "global_step": 194798, "epoch": 4638} {"train_loss": -7.140310287475586, "global_step": 194799, "epoch": 4638} {"train_loss": -7.210871696472168, "global_step": 194800, "epoch": 4638} {"train_loss": -7.047811508178711, "global_step": 194801, "epoch": 4638} {"train_loss": -7.067537784576416, "global_step": 194802, "epoch": 4638} {"train_loss": -7.2074079513549805, "global_step": 194803, "epoch": 4638} {"train_loss": -7.196551322937012, "global_step": 194804, "epoch": 4638} {"train_loss": -7.209029197692871, "global_step": 194805, "epoch": 4638} {"train_loss": -7.189552307128906, "global_step": 194806, "epoch": 4638} {"train_loss": -7.215991020202637, "global_step": 194807, "epoch": 4638} {"train_loss": -7.246055603027344, "global_step": 194808, "epoch": 4638} {"train_loss": -7.246077537536621, "global_step": 194809, "epoch": 4638} {"train_loss": -7.206691265106201, "global_step": 194810, "epoch": 4638} {"train_loss": -7.2376203536987305, "global_step": 194811, "epoch": 4638} {"train_loss": -7.236528396606445, "global_step": 194812, "epoch": 4638} {"train_loss": -7.302785396575928, "global_step": 194813, "epoch": 4638} {"train_loss": -7.217190265655518, "global_step": 194814, "epoch": 4638} {"train_loss": -7.197929382324219, "global_step": 194815, "epoch": 4638} {"train_loss": -7.00035285949707, "global_step": 194816, "epoch": 4638} {"train_loss": -7.182613372802734, "global_step": 194817, "epoch": 4638} {"train_loss": -7.243515968322754, "global_step": 194818, "epoch": 4638} {"train_loss": -7.127336502075195, "global_step": 194819, "epoch": 4638} {"train_loss": -7.1819915771484375, "global_step": 194820, "epoch": 4638} {"train_loss": -7.200767993927002, "global_step": 194821, "epoch": 4638} {"train_loss": -7.07200288772583, "global_step": 194822, "epoch": 4638} {"train_loss": -7.01542329788208, "global_step": 194823, "epoch": 4638} {"train_loss": -7.123838424682617, "global_step": 194824, "epoch": 4638} {"train_loss": -7.0807294845581055, "global_step": 194825, "epoch": 4638} {"train_loss": -7.059053421020508, "global_step": 194826, "epoch": 4638} {"train_loss": -7.219142436981201, "global_step": 194827, "epoch": 4638} {"train_loss": -7.0795793533325195, "global_step": 194828, "epoch": 4638} {"train_loss": -7.011476993560791, "global_step": 194829, "epoch": 4638} {"train_loss": -7.063224792480469, "global_step": 194830, "epoch": 4638} {"train_loss": -7.087126731872559, "global_step": 194831, "epoch": 4638} {"train_loss": -6.910453796386719, "global_step": 194832, "epoch": 4638} {"train_loss": -7.140843391418457, "global_step": 194833, "epoch": 4638} {"train_loss": -6.910236358642578, "global_step": 194834, "epoch": 4638} {"train_loss": -7.106136798858643, "global_step": 194835, "epoch": 4638} {"train_loss": -7.0798468589782715, "global_step": 194836, "epoch": 4638} {"train_loss": -7.142138208661761, "global_step": 194837, "epoch": 4638, "val_loss": 69099.765625} {"train_loss": -7.106749057769775, "global_step": 194838, "epoch": 4639} {"train_loss": -7.0063066482543945, "global_step": 194839, "epoch": 4639} {"train_loss": -7.040344715118408, "global_step": 194840, "epoch": 4639} {"train_loss": -7.053112983703613, "global_step": 194841, "epoch": 4639} {"train_loss": -7.016594409942627, "global_step": 194842, "epoch": 4639} {"train_loss": -6.9773149490356445, "global_step": 194843, "epoch": 4639} {"train_loss": -7.255135536193848, "global_step": 194844, "epoch": 4639} {"train_loss": -6.89824104309082, "global_step": 194845, "epoch": 4639} {"train_loss": -7.184417724609375, "global_step": 194846, "epoch": 4639} {"train_loss": -7.011682510375977, "global_step": 194847, "epoch": 4639} {"train_loss": -7.140398025512695, "global_step": 194848, "epoch": 4639} {"train_loss": -6.955129623413086, "global_step": 194849, "epoch": 4639} {"train_loss": -7.088798522949219, "global_step": 194850, "epoch": 4639} {"train_loss": -7.119442939758301, "global_step": 194851, "epoch": 4639} {"train_loss": -7.0945210456848145, "global_step": 194852, "epoch": 4639} {"train_loss": -7.0939226150512695, "global_step": 194853, "epoch": 4639} {"train_loss": -7.096541404724121, "global_step": 194854, "epoch": 4639} {"train_loss": -6.9316840171813965, "global_step": 194855, "epoch": 4639} {"train_loss": -7.083068370819092, "global_step": 194856, "epoch": 4639} {"train_loss": -6.970499515533447, "global_step": 194857, "epoch": 4639} {"train_loss": -7.151140213012695, "global_step": 194858, "epoch": 4639} {"train_loss": -7.129640579223633, "global_step": 194859, "epoch": 4639} {"train_loss": -7.048519611358643, "global_step": 194860, "epoch": 4639} {"train_loss": -7.005791664123535, "global_step": 194861, "epoch": 4639} {"train_loss": -7.084598064422607, "global_step": 194862, "epoch": 4639} {"train_loss": -7.047941207885742, "global_step": 194863, "epoch": 4639} {"train_loss": -7.132565975189209, "global_step": 194864, "epoch": 4639} {"train_loss": -7.183905601501465, "global_step": 194865, "epoch": 4639} {"train_loss": -7.048624038696289, "global_step": 194866, "epoch": 4639} {"train_loss": -7.016071796417236, "global_step": 194867, "epoch": 4639} {"train_loss": -7.26625919342041, "global_step": 194868, "epoch": 4639} {"train_loss": -7.000304222106934, "global_step": 194869, "epoch": 4639} {"train_loss": -7.075340270996094, "global_step": 194870, "epoch": 4639} {"train_loss": -7.137847423553467, "global_step": 194871, "epoch": 4639} {"train_loss": -7.108158111572266, "global_step": 194872, "epoch": 4639} {"train_loss": -7.013258934020996, "global_step": 194873, "epoch": 4639} {"train_loss": -7.129538536071777, "global_step": 194874, "epoch": 4639} {"train_loss": -7.04789924621582, "global_step": 194875, "epoch": 4639} {"train_loss": -7.0779948234558105, "global_step": 194876, "epoch": 4639} {"train_loss": -6.97285270690918, "global_step": 194877, "epoch": 4639} {"train_loss": -7.117210865020752, "global_step": 194878, "epoch": 4639} {"train_loss": -7.068680127461751, "global_step": 194879, "epoch": 4639, "val_loss": 69130.8046875} {"train_loss": -7.111814022064209, "global_step": 194880, "epoch": 4640} {"train_loss": -7.108417510986328, "global_step": 194881, "epoch": 4640} {"train_loss": -7.073740482330322, "global_step": 194882, "epoch": 4640} {"train_loss": -7.165561676025391, "global_step": 194883, "epoch": 4640} {"train_loss": -6.9316205978393555, "global_step": 194884, "epoch": 4640} {"train_loss": -7.093625068664551, "global_step": 194885, "epoch": 4640} {"train_loss": -7.048534393310547, "global_step": 194886, "epoch": 4640} {"train_loss": -7.290488243103027, "global_step": 194887, "epoch": 4640} {"train_loss": -7.1050825119018555, "global_step": 194888, "epoch": 4640} {"train_loss": -7.08131217956543, "global_step": 194889, "epoch": 4640} {"train_loss": -7.079109191894531, "global_step": 194890, "epoch": 4640} {"train_loss": -7.205148696899414, "global_step": 194891, "epoch": 4640} {"train_loss": -7.109281539916992, "global_step": 194892, "epoch": 4640} {"train_loss": -7.1492156982421875, "global_step": 194893, "epoch": 4640} {"train_loss": -7.113409042358398, "global_step": 194894, "epoch": 4640} {"train_loss": -7.151409149169922, "global_step": 194895, "epoch": 4640} {"train_loss": -7.175434112548828, "global_step": 194896, "epoch": 4640} {"train_loss": -7.086298942565918, "global_step": 194897, "epoch": 4640} {"train_loss": -7.299442768096924, "global_step": 194898, "epoch": 4640} {"train_loss": -7.17017936706543, "global_step": 194899, "epoch": 4640} {"train_loss": -7.174672603607178, "global_step": 194900, "epoch": 4640} {"train_loss": -7.114696502685547, "global_step": 194901, "epoch": 4640} {"train_loss": -7.136292457580566, "global_step": 194902, "epoch": 4640} {"train_loss": -7.346569061279297, "global_step": 194903, "epoch": 4640} {"train_loss": -7.152400016784668, "global_step": 194904, "epoch": 4640} {"train_loss": -7.1497602462768555, "global_step": 194905, "epoch": 4640} {"train_loss": -7.198055267333984, "global_step": 194906, "epoch": 4640} {"train_loss": -7.136144638061523, "global_step": 194907, "epoch": 4640} {"train_loss": -7.182042598724365, "global_step": 194908, "epoch": 4640} {"train_loss": -7.235960960388184, "global_step": 194909, "epoch": 4640} {"train_loss": -7.26877498626709, "global_step": 194910, "epoch": 4640} {"train_loss": -7.15419864654541, "global_step": 194911, "epoch": 4640} {"train_loss": -7.198459148406982, "global_step": 194912, "epoch": 4640} {"train_loss": -7.177556991577148, "global_step": 194913, "epoch": 4640} {"train_loss": -7.233837127685547, "global_step": 194914, "epoch": 4640} {"train_loss": -7.139152526855469, "global_step": 194915, "epoch": 4640} {"train_loss": -7.305668830871582, "global_step": 194916, "epoch": 4640} {"train_loss": -7.179571151733398, "global_step": 194917, "epoch": 4640} {"train_loss": -7.281671524047852, "global_step": 194918, "epoch": 4640} {"train_loss": -7.20020866394043, "global_step": 194919, "epoch": 4640} {"train_loss": -7.212002754211426, "global_step": 194920, "epoch": 4640} {"train_loss": -7.165166014716739, "global_step": 194921, "epoch": 4640, "val_loss": 68990.3046875} {"train_loss": -7.26762580871582, "global_step": 194922, "epoch": 4641} {"train_loss": -7.2410078048706055, "global_step": 194923, "epoch": 4641} {"train_loss": -7.230225563049316, "global_step": 194924, "epoch": 4641} {"train_loss": -7.202176570892334, "global_step": 194925, "epoch": 4641} {"train_loss": -7.202310562133789, "global_step": 194926, "epoch": 4641} {"train_loss": -7.234768867492676, "global_step": 194927, "epoch": 4641} {"train_loss": -7.207662105560303, "global_step": 194928, "epoch": 4641} {"train_loss": -7.231266498565674, "global_step": 194929, "epoch": 4641} {"train_loss": -7.295042991638184, "global_step": 194930, "epoch": 4641} {"train_loss": -7.165530204772949, "global_step": 194931, "epoch": 4641} {"train_loss": -7.2503204345703125, "global_step": 194932, "epoch": 4641} {"train_loss": -7.124102592468262, "global_step": 194933, "epoch": 4641} {"train_loss": -7.322920799255371, "global_step": 194934, "epoch": 4641} {"train_loss": -7.136689186096191, "global_step": 194935, "epoch": 4641} {"train_loss": -7.151396751403809, "global_step": 194936, "epoch": 4641} {"train_loss": -7.268117904663086, "global_step": 194937, "epoch": 4641} {"train_loss": -7.252904891967773, "global_step": 194938, "epoch": 4641} {"train_loss": -7.223516464233398, "global_step": 194939, "epoch": 4641} {"train_loss": -7.20301628112793, "global_step": 194940, "epoch": 4641} {"train_loss": -7.330970287322998, "global_step": 194941, "epoch": 4641} {"train_loss": -7.234277248382568, "global_step": 194942, "epoch": 4641} {"train_loss": -7.227622032165527, "global_step": 194943, "epoch": 4641} {"train_loss": -7.268065929412842, "global_step": 194944, "epoch": 4641} {"train_loss": -7.171773433685303, "global_step": 194945, "epoch": 4641} {"train_loss": -7.218750953674316, "global_step": 194946, "epoch": 4641} {"train_loss": -7.192915916442871, "global_step": 194947, "epoch": 4641} {"train_loss": -7.20129919052124, "global_step": 194948, "epoch": 4641} {"train_loss": -7.262378692626953, "global_step": 194949, "epoch": 4641} {"train_loss": -7.192441940307617, "global_step": 194950, "epoch": 4641} {"train_loss": -7.264085292816162, "global_step": 194951, "epoch": 4641} {"train_loss": -7.182003021240234, "global_step": 194952, "epoch": 4641} {"train_loss": -7.263889312744141, "global_step": 194953, "epoch": 4641} {"train_loss": -7.217747211456299, "global_step": 194954, "epoch": 4641} {"train_loss": -7.154387474060059, "global_step": 194955, "epoch": 4641} {"train_loss": -7.278177261352539, "global_step": 194956, "epoch": 4641} {"train_loss": -7.321408748626709, "global_step": 194957, "epoch": 4641} {"train_loss": -7.3656768798828125, "global_step": 194958, "epoch": 4641} {"train_loss": -7.230281829833984, "global_step": 194959, "epoch": 4641} {"train_loss": -7.180360794067383, "global_step": 194960, "epoch": 4641} {"train_loss": -7.277647495269775, "global_step": 194961, "epoch": 4641} {"train_loss": -7.250471591949463, "global_step": 194962, "epoch": 4641} {"train_loss": -7.229943831761678, "global_step": 194963, "epoch": 4641, "val_loss": 68956.5546875} {"train_loss": -7.196907043457031, "global_step": 194964, "epoch": 4642} {"train_loss": -7.113031387329102, "global_step": 194965, "epoch": 4642} {"train_loss": -7.2602691650390625, "global_step": 194966, "epoch": 4642} {"train_loss": -7.21282958984375, "global_step": 194967, "epoch": 4642} {"train_loss": -7.250034332275391, "global_step": 194968, "epoch": 4642} {"train_loss": -7.334053039550781, "global_step": 194969, "epoch": 4642} {"train_loss": -7.007955074310303, "global_step": 194970, "epoch": 4642} {"train_loss": -7.172382831573486, "global_step": 194971, "epoch": 4642} {"train_loss": -7.132168292999268, "global_step": 194972, "epoch": 4642} {"train_loss": -6.973197937011719, "global_step": 194973, "epoch": 4642} {"train_loss": -7.059513092041016, "global_step": 194974, "epoch": 4642} {"train_loss": -7.209112167358398, "global_step": 194975, "epoch": 4642} {"train_loss": -7.063088417053223, "global_step": 194976, "epoch": 4642} {"train_loss": -7.241165637969971, "global_step": 194977, "epoch": 4642} {"train_loss": -7.165672302246094, "global_step": 194978, "epoch": 4642} {"train_loss": -7.178163528442383, "global_step": 194979, "epoch": 4642} {"train_loss": -7.2136030197143555, "global_step": 194980, "epoch": 4642} {"train_loss": -7.187682628631592, "global_step": 194981, "epoch": 4642} {"train_loss": -7.228726863861084, "global_step": 194982, "epoch": 4642} {"train_loss": -7.231330871582031, "global_step": 194983, "epoch": 4642} {"train_loss": -7.188787460327148, "global_step": 194984, "epoch": 4642} {"train_loss": -7.170128345489502, "global_step": 194985, "epoch": 4642} {"train_loss": -7.371937274932861, "global_step": 194986, "epoch": 4642} {"train_loss": -7.12080192565918, "global_step": 194987, "epoch": 4642} {"train_loss": -7.135512828826904, "global_step": 194988, "epoch": 4642} {"train_loss": -7.25705099105835, "global_step": 194989, "epoch": 4642} {"train_loss": -7.1562089920043945, "global_step": 194990, "epoch": 4642} {"train_loss": -7.2989091873168945, "global_step": 194991, "epoch": 4642} {"train_loss": -7.268793106079102, "global_step": 194992, "epoch": 4642} {"train_loss": -7.13571834564209, "global_step": 194993, "epoch": 4642} {"train_loss": -7.257658958435059, "global_step": 194994, "epoch": 4642} {"train_loss": -7.218315601348877, "global_step": 194995, "epoch": 4642} {"train_loss": -7.2400970458984375, "global_step": 194996, "epoch": 4642} {"train_loss": -7.205020904541016, "global_step": 194997, "epoch": 4642} {"train_loss": -7.191492080688477, "global_step": 194998, "epoch": 4642} {"train_loss": -7.2019195556640625, "global_step": 194999, "epoch": 4642} {"train_loss": -7.26669454574585, "global_step": 195000, "epoch": 4642} {"train_loss": -7.150763034820557, "global_step": 195001, "epoch": 4642} {"train_loss": -7.145473480224609, "global_step": 195002, "epoch": 4642} {"train_loss": -7.171821594238281, "global_step": 195003, "epoch": 4642} {"train_loss": -7.22260856628418, "global_step": 195004, "epoch": 4642} {"train_loss": -7.190889347167242, "global_step": 195005, "epoch": 4642, "val_loss": 69040.65625} {"train_loss": -7.206647872924805, "global_step": 195006, "epoch": 4643} {"train_loss": -7.345364093780518, "global_step": 195007, "epoch": 4643} {"train_loss": -7.2737884521484375, "global_step": 195008, "epoch": 4643} {"train_loss": -7.15598201751709, "global_step": 195009, "epoch": 4643} {"train_loss": -7.155874729156494, "global_step": 195010, "epoch": 4643} {"train_loss": -7.308986663818359, "global_step": 195011, "epoch": 4643} {"train_loss": -7.184648513793945, "global_step": 195012, "epoch": 4643} {"train_loss": -7.014456748962402, "global_step": 195013, "epoch": 4643} {"train_loss": -7.040898323059082, "global_step": 195014, "epoch": 4643} {"train_loss": -6.929180145263672, "global_step": 195015, "epoch": 4643} {"train_loss": -6.849373817443848, "global_step": 195016, "epoch": 4643} {"train_loss": -7.144521713256836, "global_step": 195017, "epoch": 4643} {"train_loss": -6.7708539962768555, "global_step": 195018, "epoch": 4643} {"train_loss": -7.00186014175415, "global_step": 195019, "epoch": 4643} {"train_loss": -7.110038757324219, "global_step": 195020, "epoch": 4643} {"train_loss": -6.9971160888671875, "global_step": 195021, "epoch": 4643} {"train_loss": -7.145601272583008, "global_step": 195022, "epoch": 4643} {"train_loss": -6.983377933502197, "global_step": 195023, "epoch": 4643} {"train_loss": -7.140949249267578, "global_step": 195024, "epoch": 4643} {"train_loss": -6.9214372634887695, "global_step": 195025, "epoch": 4643} {"train_loss": -7.061461925506592, "global_step": 195026, "epoch": 4643} {"train_loss": -7.00072717666626, "global_step": 195027, "epoch": 4643} {"train_loss": -6.95329475402832, "global_step": 195028, "epoch": 4643} {"train_loss": -7.086348533630371, "global_step": 195029, "epoch": 4643} {"train_loss": -6.918284893035889, "global_step": 195030, "epoch": 4643} {"train_loss": -7.149783134460449, "global_step": 195031, "epoch": 4643} {"train_loss": -6.880624771118164, "global_step": 195032, "epoch": 4643} {"train_loss": -7.060506820678711, "global_step": 195033, "epoch": 4643} {"train_loss": -6.955708026885986, "global_step": 195034, "epoch": 4643} {"train_loss": -7.155920028686523, "global_step": 195035, "epoch": 4643} {"train_loss": -6.948478698730469, "global_step": 195036, "epoch": 4643} {"train_loss": -7.056405067443848, "global_step": 195037, "epoch": 4643} {"train_loss": -7.095438003540039, "global_step": 195038, "epoch": 4643} {"train_loss": -7.016761302947998, "global_step": 195039, "epoch": 4643} {"train_loss": -7.036759376525879, "global_step": 195040, "epoch": 4643} {"train_loss": -7.060041427612305, "global_step": 195041, "epoch": 4643} {"train_loss": -7.072449684143066, "global_step": 195042, "epoch": 4643} {"train_loss": -7.017786979675293, "global_step": 195043, "epoch": 4643} {"train_loss": -7.158699035644531, "global_step": 195044, "epoch": 4643} {"train_loss": -7.101103782653809, "global_step": 195045, "epoch": 4643} {"train_loss": -7.122645378112793, "global_step": 195046, "epoch": 4643} {"train_loss": -7.060115121659779, "global_step": 195047, "epoch": 4643, "val_loss": 69128.6640625} {"train_loss": -7.144522666931152, "global_step": 195048, "epoch": 4644} {"train_loss": -7.109407424926758, "global_step": 195049, "epoch": 4644} {"train_loss": -7.062795162200928, "global_step": 195050, "epoch": 4644} {"train_loss": -7.204343795776367, "global_step": 195051, "epoch": 4644} {"train_loss": -7.092128753662109, "global_step": 195052, "epoch": 4644} {"train_loss": -7.1797027587890625, "global_step": 195053, "epoch": 4644} {"train_loss": -7.173575401306152, "global_step": 195054, "epoch": 4644} {"train_loss": -7.1829423904418945, "global_step": 195055, "epoch": 4644} {"train_loss": -7.19503116607666, "global_step": 195056, "epoch": 4644} {"train_loss": -7.186032295227051, "global_step": 195057, "epoch": 4644} {"train_loss": -7.14381742477417, "global_step": 195058, "epoch": 4644} {"train_loss": -7.199235916137695, "global_step": 195059, "epoch": 4644} {"train_loss": -7.218584060668945, "global_step": 195060, "epoch": 4644} {"train_loss": -7.1067962646484375, "global_step": 195061, "epoch": 4644} {"train_loss": -7.249016761779785, "global_step": 195062, "epoch": 4644} {"train_loss": -7.113760948181152, "global_step": 195063, "epoch": 4644} {"train_loss": -7.233697891235352, "global_step": 195064, "epoch": 4644} {"train_loss": -7.27862024307251, "global_step": 195065, "epoch": 4644} {"train_loss": -7.162877559661865, "global_step": 195066, "epoch": 4644} {"train_loss": -7.237030982971191, "global_step": 195067, "epoch": 4644} {"train_loss": -7.236294746398926, "global_step": 195068, "epoch": 4644} {"train_loss": -7.222023963928223, "global_step": 195069, "epoch": 4644} {"train_loss": -7.2928924560546875, "global_step": 195070, "epoch": 4644} {"train_loss": -7.27344274520874, "global_step": 195071, "epoch": 4644} {"train_loss": -7.210456848144531, "global_step": 195072, "epoch": 4644} {"train_loss": -7.258094787597656, "global_step": 195073, "epoch": 4644} {"train_loss": -7.324413776397705, "global_step": 195074, "epoch": 4644} {"train_loss": -7.2523322105407715, "global_step": 195075, "epoch": 4644} {"train_loss": -7.166849136352539, "global_step": 195076, "epoch": 4644} {"train_loss": -7.3433308601379395, "global_step": 195077, "epoch": 4644} {"train_loss": -7.136183261871338, "global_step": 195078, "epoch": 4644} {"train_loss": -7.290604591369629, "global_step": 195079, "epoch": 4644} {"train_loss": -7.276834487915039, "global_step": 195080, "epoch": 4644} {"train_loss": -7.183649063110352, "global_step": 195081, "epoch": 4644} {"train_loss": -7.138300895690918, "global_step": 195082, "epoch": 4644} {"train_loss": -7.217354774475098, "global_step": 195083, "epoch": 4644} {"train_loss": -7.079809665679932, "global_step": 195084, "epoch": 4644} {"train_loss": -7.3071699142456055, "global_step": 195085, "epoch": 4644} {"train_loss": -7.209506034851074, "global_step": 195086, "epoch": 4644} {"train_loss": -7.163590431213379, "global_step": 195087, "epoch": 4644} {"train_loss": -7.317087173461914, "global_step": 195088, "epoch": 4644} {"train_loss": -7.2052835282825285, "global_step": 195089, "epoch": 4644, "val_loss": 69135.7421875} {"train_loss": -7.243635177612305, "global_step": 195090, "epoch": 4645} {"train_loss": -7.258170127868652, "global_step": 195091, "epoch": 4645} {"train_loss": -7.161311149597168, "global_step": 195092, "epoch": 4645} {"train_loss": -7.235034942626953, "global_step": 195093, "epoch": 4645} {"train_loss": -7.266724109649658, "global_step": 195094, "epoch": 4645} {"train_loss": -7.158840179443359, "global_step": 195095, "epoch": 4645} {"train_loss": -7.258961200714111, "global_step": 195096, "epoch": 4645} {"train_loss": -7.242434501647949, "global_step": 195097, "epoch": 4645} {"train_loss": -7.283555030822754, "global_step": 195098, "epoch": 4645} {"train_loss": -7.239099502563477, "global_step": 195099, "epoch": 4645} {"train_loss": -7.271847724914551, "global_step": 195100, "epoch": 4645} {"train_loss": -7.38311767578125, "global_step": 195101, "epoch": 4645} {"train_loss": -7.190973281860352, "global_step": 195102, "epoch": 4645} {"train_loss": -7.256854057312012, "global_step": 195103, "epoch": 4645} {"train_loss": -7.203354835510254, "global_step": 195104, "epoch": 4645} {"train_loss": -7.260138511657715, "global_step": 195105, "epoch": 4645} {"train_loss": -7.216326713562012, "global_step": 195106, "epoch": 4645} {"train_loss": -7.1959357261657715, "global_step": 195107, "epoch": 4645} {"train_loss": -7.179287433624268, "global_step": 195108, "epoch": 4645} {"train_loss": -7.2919816970825195, "global_step": 195109, "epoch": 4645} {"train_loss": -7.291801929473877, "global_step": 195110, "epoch": 4645} {"train_loss": -7.113612651824951, "global_step": 195111, "epoch": 4645} {"train_loss": -7.280517101287842, "global_step": 195112, "epoch": 4645} {"train_loss": -7.23828649520874, "global_step": 195113, "epoch": 4645} {"train_loss": -7.327207565307617, "global_step": 195114, "epoch": 4645} {"train_loss": -7.203334808349609, "global_step": 195115, "epoch": 4645} {"train_loss": -7.069604873657227, "global_step": 195116, "epoch": 4645} {"train_loss": -7.197192668914795, "global_step": 195117, "epoch": 4645} {"train_loss": -7.087430000305176, "global_step": 195118, "epoch": 4645} {"train_loss": -7.036288261413574, "global_step": 195119, "epoch": 4645} {"train_loss": -7.199905872344971, "global_step": 195120, "epoch": 4645} {"train_loss": -7.1256022453308105, "global_step": 195121, "epoch": 4645} {"train_loss": -7.201105117797852, "global_step": 195122, "epoch": 4645} {"train_loss": -7.145623207092285, "global_step": 195123, "epoch": 4645} {"train_loss": -6.9945783615112305, "global_step": 195124, "epoch": 4645} {"train_loss": -7.214339733123779, "global_step": 195125, "epoch": 4645} {"train_loss": -7.0023579597473145, "global_step": 195126, "epoch": 4645} {"train_loss": -7.099686622619629, "global_step": 195127, "epoch": 4645} {"train_loss": -7.197296142578125, "global_step": 195128, "epoch": 4645} {"train_loss": -7.211620330810547, "global_step": 195129, "epoch": 4645} {"train_loss": -7.237934112548828, "global_step": 195130, "epoch": 4645} {"train_loss": -7.20064157531375, "global_step": 195131, "epoch": 4645, "val_loss": 69125.125} {"train_loss": -7.115357398986816, "global_step": 195132, "epoch": 4646} {"train_loss": -7.165659427642822, "global_step": 195133, "epoch": 4646} {"train_loss": -7.113891124725342, "global_step": 195134, "epoch": 4646} {"train_loss": -7.1889448165893555, "global_step": 195135, "epoch": 4646} {"train_loss": -7.217308044433594, "global_step": 195136, "epoch": 4646} {"train_loss": -7.09152364730835, "global_step": 195137, "epoch": 4646} {"train_loss": -7.279024124145508, "global_step": 195138, "epoch": 4646} {"train_loss": -7.1022257804870605, "global_step": 195139, "epoch": 4646} {"train_loss": -7.219169616699219, "global_step": 195140, "epoch": 4646} {"train_loss": -7.133600234985352, "global_step": 195141, "epoch": 4646} {"train_loss": -7.324893951416016, "global_step": 195142, "epoch": 4646} {"train_loss": -7.182557106018066, "global_step": 195143, "epoch": 4646} {"train_loss": -7.264193534851074, "global_step": 195144, "epoch": 4646} {"train_loss": -7.2943267822265625, "global_step": 195145, "epoch": 4646} {"train_loss": -7.294310569763184, "global_step": 195146, "epoch": 4646} {"train_loss": -7.195262908935547, "global_step": 195147, "epoch": 4646} {"train_loss": -7.156028747558594, "global_step": 195148, "epoch": 4646} {"train_loss": -7.139791011810303, "global_step": 195149, "epoch": 4646} {"train_loss": -7.166677474975586, "global_step": 195150, "epoch": 4646} {"train_loss": -7.170862197875977, "global_step": 195151, "epoch": 4646} {"train_loss": -7.222902297973633, "global_step": 195152, "epoch": 4646} {"train_loss": -7.157958030700684, "global_step": 195153, "epoch": 4646} {"train_loss": -7.118934631347656, "global_step": 195154, "epoch": 4646} {"train_loss": -7.169417381286621, "global_step": 195155, "epoch": 4646} {"train_loss": -7.188595771789551, "global_step": 195156, "epoch": 4646} {"train_loss": -7.197395324707031, "global_step": 195157, "epoch": 4646} {"train_loss": -7.196747779846191, "global_step": 195158, "epoch": 4646} {"train_loss": -7.218332290649414, "global_step": 195159, "epoch": 4646} {"train_loss": -7.205703258514404, "global_step": 195160, "epoch": 4646} {"train_loss": -7.184807777404785, "global_step": 195161, "epoch": 4646} {"train_loss": -7.192370414733887, "global_step": 195162, "epoch": 4646} {"train_loss": -7.047855854034424, "global_step": 195163, "epoch": 4646} {"train_loss": -7.058732032775879, "global_step": 195164, "epoch": 4646} {"train_loss": -7.122610092163086, "global_step": 195165, "epoch": 4646} {"train_loss": -7.188331604003906, "global_step": 195166, "epoch": 4646} {"train_loss": -7.094791412353516, "global_step": 195167, "epoch": 4646} {"train_loss": -7.118806838989258, "global_step": 195168, "epoch": 4646} {"train_loss": -7.232193470001221, "global_step": 195169, "epoch": 4646} {"train_loss": -7.0856614112854, "global_step": 195170, "epoch": 4646} {"train_loss": -7.119010925292969, "global_step": 195171, "epoch": 4646} {"train_loss": -7.231449127197266, "global_step": 195172, "epoch": 4646} {"train_loss": -7.175156956627255, "global_step": 195173, "epoch": 4646, "val_loss": 69124.2109375} {"train_loss": -7.143126010894775, "global_step": 195174, "epoch": 4647} {"train_loss": -7.195713043212891, "global_step": 195175, "epoch": 4647} {"train_loss": -7.1796441078186035, "global_step": 195176, "epoch": 4647} {"train_loss": -7.179773330688477, "global_step": 195177, "epoch": 4647} {"train_loss": -7.1933674812316895, "global_step": 195178, "epoch": 4647} {"train_loss": -7.308462142944336, "global_step": 195179, "epoch": 4647} {"train_loss": -7.228910446166992, "global_step": 195180, "epoch": 4647} {"train_loss": -7.246074676513672, "global_step": 195181, "epoch": 4647} {"train_loss": -7.237488746643066, "global_step": 195182, "epoch": 4647} {"train_loss": -7.293560981750488, "global_step": 195183, "epoch": 4647} {"train_loss": -7.307257175445557, "global_step": 195184, "epoch": 4647} {"train_loss": -7.348830699920654, "global_step": 195185, "epoch": 4647} {"train_loss": -7.302597999572754, "global_step": 195186, "epoch": 4647} {"train_loss": -7.205702781677246, "global_step": 195187, "epoch": 4647} {"train_loss": -7.241049766540527, "global_step": 195188, "epoch": 4647} {"train_loss": -7.226005554199219, "global_step": 195189, "epoch": 4647} {"train_loss": -7.259342193603516, "global_step": 195190, "epoch": 4647} {"train_loss": -7.232997417449951, "global_step": 195191, "epoch": 4647} {"train_loss": -7.248810291290283, "global_step": 195192, "epoch": 4647} {"train_loss": -7.157103538513184, "global_step": 195193, "epoch": 4647} {"train_loss": -7.170408248901367, "global_step": 195194, "epoch": 4647} {"train_loss": -7.286755561828613, "global_step": 195195, "epoch": 4647} {"train_loss": -7.140586853027344, "global_step": 195196, "epoch": 4647} {"train_loss": -7.355668544769287, "global_step": 195197, "epoch": 4647} {"train_loss": -7.241131782531738, "global_step": 195198, "epoch": 4647} {"train_loss": -7.314187049865723, "global_step": 195199, "epoch": 4647} {"train_loss": -7.181793689727783, "global_step": 195200, "epoch": 4647} {"train_loss": -7.26632022857666, "global_step": 195201, "epoch": 4647} {"train_loss": -7.249495983123779, "global_step": 195202, "epoch": 4647} {"train_loss": -7.201712131500244, "global_step": 195203, "epoch": 4647} {"train_loss": -7.080956935882568, "global_step": 195204, "epoch": 4647} {"train_loss": -7.127383232116699, "global_step": 195205, "epoch": 4647} {"train_loss": -7.241280555725098, "global_step": 195206, "epoch": 4647} {"train_loss": -7.061852931976318, "global_step": 195207, "epoch": 4647} {"train_loss": -7.205114841461182, "global_step": 195208, "epoch": 4647} {"train_loss": -7.1367034912109375, "global_step": 195209, "epoch": 4647} {"train_loss": -7.0514631271362305, "global_step": 195210, "epoch": 4647} {"train_loss": -7.2019548416137695, "global_step": 195211, "epoch": 4647} {"train_loss": -7.213306427001953, "global_step": 195212, "epoch": 4647} {"train_loss": -7.2018938064575195, "global_step": 195213, "epoch": 4647} {"train_loss": -7.109588623046875, "global_step": 195214, "epoch": 4647} {"train_loss": -7.211107696805682, "global_step": 195215, "epoch": 4647, "val_loss": 68941.5625} {"train_loss": -7.174942493438721, "global_step": 195216, "epoch": 4648} {"train_loss": -7.17936897277832, "global_step": 195217, "epoch": 4648} {"train_loss": -7.1529436111450195, "global_step": 195218, "epoch": 4648} {"train_loss": -7.3672075271606445, "global_step": 195219, "epoch": 4648} {"train_loss": -7.120822906494141, "global_step": 195220, "epoch": 4648} {"train_loss": -7.250524997711182, "global_step": 195221, "epoch": 4648} {"train_loss": -7.187374114990234, "global_step": 195222, "epoch": 4648} {"train_loss": -7.125732421875, "global_step": 195223, "epoch": 4648} {"train_loss": -7.317933082580566, "global_step": 195224, "epoch": 4648} {"train_loss": -7.142664909362793, "global_step": 195225, "epoch": 4648} {"train_loss": -7.105035781860352, "global_step": 195226, "epoch": 4648} {"train_loss": -7.304934978485107, "global_step": 195227, "epoch": 4648} {"train_loss": -6.9737138748168945, "global_step": 195228, "epoch": 4648} {"train_loss": -7.183407783508301, "global_step": 195229, "epoch": 4648} {"train_loss": -7.116390705108643, "global_step": 195230, "epoch": 4648} {"train_loss": -7.046390533447266, "global_step": 195231, "epoch": 4648} {"train_loss": -7.163748264312744, "global_step": 195232, "epoch": 4648} {"train_loss": -7.0262908935546875, "global_step": 195233, "epoch": 4648} {"train_loss": -7.069801330566406, "global_step": 195234, "epoch": 4648} {"train_loss": -7.032293319702148, "global_step": 195235, "epoch": 4648} {"train_loss": -7.17647647857666, "global_step": 195236, "epoch": 4648} {"train_loss": -7.010476589202881, "global_step": 195237, "epoch": 4648} {"train_loss": -7.2291460037231445, "global_step": 195238, "epoch": 4648} {"train_loss": -7.293736457824707, "global_step": 195239, "epoch": 4648} {"train_loss": -7.104785919189453, "global_step": 195240, "epoch": 4648} {"train_loss": -7.174890518188477, "global_step": 195241, "epoch": 4648} {"train_loss": -7.1965131759643555, "global_step": 195242, "epoch": 4648} {"train_loss": -7.170755386352539, "global_step": 195243, "epoch": 4648} {"train_loss": -7.181458473205566, "global_step": 195244, "epoch": 4648} {"train_loss": -7.240740776062012, "global_step": 195245, "epoch": 4648} {"train_loss": -7.131962776184082, "global_step": 195246, "epoch": 4648} {"train_loss": -7.085624694824219, "global_step": 195247, "epoch": 4648} {"train_loss": -7.275202751159668, "global_step": 195248, "epoch": 4648} {"train_loss": -7.170047283172607, "global_step": 195249, "epoch": 4648} {"train_loss": -7.295289993286133, "global_step": 195250, "epoch": 4648} {"train_loss": -7.198094367980957, "global_step": 195251, "epoch": 4648} {"train_loss": -7.191062927246094, "global_step": 195252, "epoch": 4648} {"train_loss": -7.218132495880127, "global_step": 195253, "epoch": 4648} {"train_loss": -7.236310958862305, "global_step": 195254, "epoch": 4648} {"train_loss": -7.255471706390381, "global_step": 195255, "epoch": 4648} {"train_loss": -7.168684005737305, "global_step": 195256, "epoch": 4648} {"train_loss": -7.174914995829265, "global_step": 195257, "epoch": 4648, "val_loss": 68838.7890625} {"train_loss": -7.250243186950684, "global_step": 195258, "epoch": 4649} {"train_loss": -7.271812438964844, "global_step": 195259, "epoch": 4649} {"train_loss": -7.32124137878418, "global_step": 195260, "epoch": 4649} {"train_loss": -7.26776647567749, "global_step": 195261, "epoch": 4649} {"train_loss": -7.242691516876221, "global_step": 195262, "epoch": 4649} {"train_loss": -7.185420513153076, "global_step": 195263, "epoch": 4649} {"train_loss": -7.05526876449585, "global_step": 195264, "epoch": 4649} {"train_loss": -7.162192344665527, "global_step": 195265, "epoch": 4649} {"train_loss": -7.154187202453613, "global_step": 195266, "epoch": 4649} {"train_loss": -6.958674430847168, "global_step": 195267, "epoch": 4649} {"train_loss": -7.119997024536133, "global_step": 195268, "epoch": 4649} {"train_loss": -7.122050762176514, "global_step": 195269, "epoch": 4649} {"train_loss": -6.991057395935059, "global_step": 195270, "epoch": 4649} {"train_loss": -7.175530433654785, "global_step": 195271, "epoch": 4649} {"train_loss": -7.161404132843018, "global_step": 195272, "epoch": 4649} {"train_loss": -7.05463981628418, "global_step": 195273, "epoch": 4649} {"train_loss": -7.1628313064575195, "global_step": 195274, "epoch": 4649} {"train_loss": -7.061359405517578, "global_step": 195275, "epoch": 4649} {"train_loss": -7.163221836090088, "global_step": 195276, "epoch": 4649} {"train_loss": -7.075328826904297, "global_step": 195277, "epoch": 4649} {"train_loss": -7.1835432052612305, "global_step": 195278, "epoch": 4649} {"train_loss": -7.119633674621582, "global_step": 195279, "epoch": 4649} {"train_loss": -7.138493537902832, "global_step": 195280, "epoch": 4649} {"train_loss": -7.146956443786621, "global_step": 195281, "epoch": 4649} {"train_loss": -7.147898197174072, "global_step": 195282, "epoch": 4649} {"train_loss": -7.163089752197266, "global_step": 195283, "epoch": 4649} {"train_loss": -6.919440269470215, "global_step": 195284, "epoch": 4649} {"train_loss": -7.202079772949219, "global_step": 195285, "epoch": 4649} {"train_loss": -7.006011962890625, "global_step": 195286, "epoch": 4649} {"train_loss": -6.972837924957275, "global_step": 195287, "epoch": 4649} {"train_loss": -7.087052345275879, "global_step": 195288, "epoch": 4649} {"train_loss": -7.112767219543457, "global_step": 195289, "epoch": 4649} {"train_loss": -7.110536098480225, "global_step": 195290, "epoch": 4649} {"train_loss": -7.112034797668457, "global_step": 195291, "epoch": 4649} {"train_loss": -7.114928722381592, "global_step": 195292, "epoch": 4649} {"train_loss": -6.959051609039307, "global_step": 195293, "epoch": 4649} {"train_loss": -7.172822952270508, "global_step": 195294, "epoch": 4649} {"train_loss": -7.106369972229004, "global_step": 195295, "epoch": 4649} {"train_loss": -6.994237899780273, "global_step": 195296, "epoch": 4649} {"train_loss": -7.078154563903809, "global_step": 195297, "epoch": 4649} {"train_loss": -7.0624589920043945, "global_step": 195298, "epoch": 4649} {"train_loss": -7.1187511285146075, "global_step": 195299, "epoch": 4649, "val_loss": 68934.296875} {"train_loss": -7.123785495758057, "global_step": 195300, "epoch": 4650} {"train_loss": -6.981699466705322, "global_step": 195301, "epoch": 4650} {"train_loss": -7.12431526184082, "global_step": 195302, "epoch": 4650} {"train_loss": -7.133599281311035, "global_step": 195303, "epoch": 4650} {"train_loss": -7.022465229034424, "global_step": 195304, "epoch": 4650} {"train_loss": -7.042725563049316, "global_step": 195305, "epoch": 4650} {"train_loss": -7.193732738494873, "global_step": 195306, "epoch": 4650} {"train_loss": -6.984225749969482, "global_step": 195307, "epoch": 4650} {"train_loss": -7.098798751831055, "global_step": 195308, "epoch": 4650} {"train_loss": -7.250083923339844, "global_step": 195309, "epoch": 4650} {"train_loss": -7.000016212463379, "global_step": 195310, "epoch": 4650} {"train_loss": -7.1156721115112305, "global_step": 195311, "epoch": 4650} {"train_loss": -7.071916580200195, "global_step": 195312, "epoch": 4650} {"train_loss": -7.212556838989258, "global_step": 195313, "epoch": 4650} {"train_loss": -7.188948631286621, "global_step": 195314, "epoch": 4650} {"train_loss": -7.1514892578125, "global_step": 195315, "epoch": 4650} {"train_loss": -7.112302303314209, "global_step": 195316, "epoch": 4650} {"train_loss": -7.142450332641602, "global_step": 195317, "epoch": 4650} {"train_loss": -7.224336624145508, "global_step": 195318, "epoch": 4650} {"train_loss": -7.067161560058594, "global_step": 195319, "epoch": 4650} {"train_loss": -7.10713529586792, "global_step": 195320, "epoch": 4650} {"train_loss": -7.1297454833984375, "global_step": 195321, "epoch": 4650} {"train_loss": -7.16347599029541, "global_step": 195322, "epoch": 4650} {"train_loss": -7.206633567810059, "global_step": 195323, "epoch": 4650} {"train_loss": -7.247991561889648, "global_step": 195324, "epoch": 4650} {"train_loss": -7.335892677307129, "global_step": 195325, "epoch": 4650} {"train_loss": -7.261161804199219, "global_step": 195326, "epoch": 4650} {"train_loss": -7.289559364318848, "global_step": 195327, "epoch": 4650} {"train_loss": -7.169602394104004, "global_step": 195328, "epoch": 4650} {"train_loss": -7.248226642608643, "global_step": 195329, "epoch": 4650} {"train_loss": -7.237181663513184, "global_step": 195330, "epoch": 4650} {"train_loss": -7.109063625335693, "global_step": 195331, "epoch": 4650} {"train_loss": -7.2430596351623535, "global_step": 195332, "epoch": 4650} {"train_loss": -7.321438789367676, "global_step": 195333, "epoch": 4650} {"train_loss": -7.237972259521484, "global_step": 195334, "epoch": 4650} {"train_loss": -7.17523717880249, "global_step": 195335, "epoch": 4650} {"train_loss": -7.239364147186279, "global_step": 195336, "epoch": 4650} {"train_loss": -7.239575386047363, "global_step": 195337, "epoch": 4650} {"train_loss": -7.264540672302246, "global_step": 195338, "epoch": 4650} {"train_loss": -7.252961158752441, "global_step": 195339, "epoch": 4650} {"train_loss": -7.17284631729126, "global_step": 195340, "epoch": 4650} {"train_loss": -7.171455088115874, "global_step": 195341, "epoch": 4650, "train/sim_max_reward_0": 0.6091342387191445, "train/sim_max_reward_1": 0.9865918308558316, "train/sim_max_reward_2": 0.672658801998853, "train/sim_max_reward_3": 0.1285281669910408, "train/sim_max_reward_4": 0.9543238186848978, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.17838520694159005, "test/sim_max_reward_4400001": 0.36602660441959606, "test/sim_max_reward_4400002": 0.3737058081845066, "test/sim_max_reward_4400003": 0.9820730121600396, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.8045797148482321, "test/sim_max_reward_4400006": 0.25799739301771474, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.2996724540099501, "test/sim_max_reward_4400009": 0.9980345067873362, "test/sim_max_reward_4400010": 0.8831300109236415, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.37791246067331435, "test/sim_max_reward_4400014": 0.7655535630593691, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.19453743694189468, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3142503470404707, "test/sim_max_reward_4400019": 0.0036475687345498154, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9829236507161772, "test/sim_max_reward_4400023": 0.41629199421836477, "test/sim_max_reward_4400024": 0.8958382095500095, "test/sim_max_reward_4400025": 0.26628263705830496, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0002685118524902398, "test/sim_max_reward_4400028": 0.7384711190688085, "test/sim_max_reward_4400029": 0.9723517813968929, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.8366748704754682, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9736910608362231, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.807631248245615, "test/sim_max_reward_4400036": 0.4882765054070345, "test/sim_max_reward_4400037": 0.9454570724677228, "test/sim_max_reward_4400038": 0.9519521474853471, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8425112038915629, "test/sim_max_reward_4400042": 0.9549357327506455, "test/sim_max_reward_4400043": 0.9575837715249992, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9913133286154888, "test/sim_max_reward_4400046": 0.5312793311930083, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.950705510618594, "test/sim_max_reward_4400049": 0.9206890674215487, "train/mean_score": 0.7252061428749612, "test/mean_score": 0.5754165964613481, "val_loss": 69011.1640625} {"train_loss": -7.4001970291137695, "global_step": 195342, "epoch": 4651} {"train_loss": -7.242040634155273, "global_step": 195343, "epoch": 4651} {"train_loss": -7.222949504852295, "global_step": 195344, "epoch": 4651} {"train_loss": -7.419306755065918, "global_step": 195345, "epoch": 4651} {"train_loss": -7.259549140930176, "global_step": 195346, "epoch": 4651} {"train_loss": -7.149973392486572, "global_step": 195347, "epoch": 4651} {"train_loss": -7.1435136795043945, "global_step": 195348, "epoch": 4651} {"train_loss": -7.270349979400635, "global_step": 195349, "epoch": 4651} {"train_loss": -7.161517143249512, "global_step": 195350, "epoch": 4651} {"train_loss": -7.398078918457031, "global_step": 195351, "epoch": 4651} {"train_loss": -7.229037284851074, "global_step": 195352, "epoch": 4651} {"train_loss": -7.2705912590026855, "global_step": 195353, "epoch": 4651} {"train_loss": -7.200666427612305, "global_step": 195354, "epoch": 4651} {"train_loss": -7.214492321014404, "global_step": 195355, "epoch": 4651} {"train_loss": -7.257328987121582, "global_step": 195356, "epoch": 4651} {"train_loss": -7.270403861999512, "global_step": 195357, "epoch": 4651} {"train_loss": -7.3563618659973145, "global_step": 195358, "epoch": 4651} {"train_loss": -7.303538799285889, "global_step": 195359, "epoch": 4651} {"train_loss": -7.188278675079346, "global_step": 195360, "epoch": 4651} {"train_loss": -7.263251304626465, "global_step": 195361, "epoch": 4651} {"train_loss": -7.2410383224487305, "global_step": 195362, "epoch": 4651} {"train_loss": -7.377179145812988, "global_step": 195363, "epoch": 4651} {"train_loss": -7.271134376525879, "global_step": 195364, "epoch": 4651} {"train_loss": -7.2203779220581055, "global_step": 195365, "epoch": 4651} {"train_loss": -7.178287982940674, "global_step": 195366, "epoch": 4651} {"train_loss": -7.204594135284424, "global_step": 195367, "epoch": 4651} {"train_loss": -7.274107933044434, "global_step": 195368, "epoch": 4651} {"train_loss": -7.285933494567871, "global_step": 195369, "epoch": 4651} {"train_loss": -7.1634016036987305, "global_step": 195370, "epoch": 4651} {"train_loss": -7.297740459442139, "global_step": 195371, "epoch": 4651} {"train_loss": -7.258462429046631, "global_step": 195372, "epoch": 4651} {"train_loss": -7.275508880615234, "global_step": 195373, "epoch": 4651} {"train_loss": -7.279246807098389, "global_step": 195374, "epoch": 4651} {"train_loss": -7.254298686981201, "global_step": 195375, "epoch": 4651} {"train_loss": -6.930329322814941, "global_step": 195376, "epoch": 4651} {"train_loss": -7.04640007019043, "global_step": 195377, "epoch": 4651} {"train_loss": -7.108278274536133, "global_step": 195378, "epoch": 4651} {"train_loss": -6.946338176727295, "global_step": 195379, "epoch": 4651} {"train_loss": -6.986413955688477, "global_step": 195380, "epoch": 4651} {"train_loss": -7.060287952423096, "global_step": 195381, "epoch": 4651} {"train_loss": -7.004691123962402, "global_step": 195382, "epoch": 4651} {"train_loss": -7.214435986110142, "global_step": 195383, "epoch": 4651, "val_loss": 68893.1796875} {"train_loss": -7.043278217315674, "global_step": 195384, "epoch": 4652} {"train_loss": -7.179519176483154, "global_step": 195385, "epoch": 4652} {"train_loss": -7.084578990936279, "global_step": 195386, "epoch": 4652} {"train_loss": -7.1051788330078125, "global_step": 195387, "epoch": 4652} {"train_loss": -7.184091091156006, "global_step": 195388, "epoch": 4652} {"train_loss": -7.219029426574707, "global_step": 195389, "epoch": 4652} {"train_loss": -7.369549751281738, "global_step": 195390, "epoch": 4652} {"train_loss": -7.262207984924316, "global_step": 195391, "epoch": 4652} {"train_loss": -7.178413391113281, "global_step": 195392, "epoch": 4652} {"train_loss": -7.254579544067383, "global_step": 195393, "epoch": 4652} {"train_loss": -7.141948699951172, "global_step": 195394, "epoch": 4652} {"train_loss": -7.221631050109863, "global_step": 195395, "epoch": 4652} {"train_loss": -7.214250564575195, "global_step": 195396, "epoch": 4652} {"train_loss": -7.200827598571777, "global_step": 195397, "epoch": 4652} {"train_loss": -7.174857139587402, "global_step": 195398, "epoch": 4652} {"train_loss": -7.241766452789307, "global_step": 195399, "epoch": 4652} {"train_loss": -7.204837322235107, "global_step": 195400, "epoch": 4652} {"train_loss": -7.263172149658203, "global_step": 195401, "epoch": 4652} {"train_loss": -7.215445518493652, "global_step": 195402, "epoch": 4652} {"train_loss": -7.2127885818481445, "global_step": 195403, "epoch": 4652} {"train_loss": -7.235099792480469, "global_step": 195404, "epoch": 4652} {"train_loss": -7.248660087585449, "global_step": 195405, "epoch": 4652} {"train_loss": -7.258309841156006, "global_step": 195406, "epoch": 4652} {"train_loss": -7.264337539672852, "global_step": 195407, "epoch": 4652} {"train_loss": -7.269965648651123, "global_step": 195408, "epoch": 4652} {"train_loss": -7.250128269195557, "global_step": 195409, "epoch": 4652} {"train_loss": -7.0454888343811035, "global_step": 195410, "epoch": 4652} {"train_loss": -7.192365646362305, "global_step": 195411, "epoch": 4652} {"train_loss": -7.1494879722595215, "global_step": 195412, "epoch": 4652} {"train_loss": -7.186856269836426, "global_step": 195413, "epoch": 4652} {"train_loss": -7.274653434753418, "global_step": 195414, "epoch": 4652} {"train_loss": -7.169214248657227, "global_step": 195415, "epoch": 4652} {"train_loss": -7.231569290161133, "global_step": 195416, "epoch": 4652} {"train_loss": -7.118310928344727, "global_step": 195417, "epoch": 4652} {"train_loss": -7.221889495849609, "global_step": 195418, "epoch": 4652} {"train_loss": -7.243505001068115, "global_step": 195419, "epoch": 4652} {"train_loss": -7.3163933753967285, "global_step": 195420, "epoch": 4652} {"train_loss": -7.232443809509277, "global_step": 195421, "epoch": 4652} {"train_loss": -7.172801971435547, "global_step": 195422, "epoch": 4652} {"train_loss": -7.341055870056152, "global_step": 195423, "epoch": 4652} {"train_loss": -7.150567054748535, "global_step": 195424, "epoch": 4652} {"train_loss": -7.210878054300944, "global_step": 195425, "epoch": 4652, "val_loss": 69201.1875} {"train_loss": -7.2030205726623535, "global_step": 195426, "epoch": 4653} {"train_loss": -7.35481071472168, "global_step": 195427, "epoch": 4653} {"train_loss": -7.188173294067383, "global_step": 195428, "epoch": 4653} {"train_loss": -7.216725826263428, "global_step": 195429, "epoch": 4653} {"train_loss": -7.254812240600586, "global_step": 195430, "epoch": 4653} {"train_loss": -7.288475036621094, "global_step": 195431, "epoch": 4653} {"train_loss": -7.060832977294922, "global_step": 195432, "epoch": 4653} {"train_loss": -7.281407356262207, "global_step": 195433, "epoch": 4653} {"train_loss": -7.318363666534424, "global_step": 195434, "epoch": 4653} {"train_loss": -7.220893859863281, "global_step": 195435, "epoch": 4653} {"train_loss": -7.1224822998046875, "global_step": 195436, "epoch": 4653} {"train_loss": -7.219114303588867, "global_step": 195437, "epoch": 4653} {"train_loss": -7.1638898849487305, "global_step": 195438, "epoch": 4653} {"train_loss": -7.234973430633545, "global_step": 195439, "epoch": 4653} {"train_loss": -7.23077392578125, "global_step": 195440, "epoch": 4653} {"train_loss": -7.1976847648620605, "global_step": 195441, "epoch": 4653} {"train_loss": -7.2627081871032715, "global_step": 195442, "epoch": 4653} {"train_loss": -7.261455535888672, "global_step": 195443, "epoch": 4653} {"train_loss": -7.231248378753662, "global_step": 195444, "epoch": 4653} {"train_loss": -7.154851913452148, "global_step": 195445, "epoch": 4653} {"train_loss": -7.318316459655762, "global_step": 195446, "epoch": 4653} {"train_loss": -7.114978790283203, "global_step": 195447, "epoch": 4653} {"train_loss": -7.174488544464111, "global_step": 195448, "epoch": 4653} {"train_loss": -7.163825988769531, "global_step": 195449, "epoch": 4653} {"train_loss": -7.153961181640625, "global_step": 195450, "epoch": 4653} {"train_loss": -7.098010540008545, "global_step": 195451, "epoch": 4653} {"train_loss": -7.239675521850586, "global_step": 195452, "epoch": 4653} {"train_loss": -7.172090530395508, "global_step": 195453, "epoch": 4653} {"train_loss": -7.226070404052734, "global_step": 195454, "epoch": 4653} {"train_loss": -7.141639709472656, "global_step": 195455, "epoch": 4653} {"train_loss": -7.057036399841309, "global_step": 195456, "epoch": 4653} {"train_loss": -7.198021411895752, "global_step": 195457, "epoch": 4653} {"train_loss": -7.167705535888672, "global_step": 195458, "epoch": 4653} {"train_loss": -7.107362270355225, "global_step": 195459, "epoch": 4653} {"train_loss": -7.159542083740234, "global_step": 195460, "epoch": 4653} {"train_loss": -7.093931674957275, "global_step": 195461, "epoch": 4653} {"train_loss": -7.143256664276123, "global_step": 195462, "epoch": 4653} {"train_loss": -7.155422687530518, "global_step": 195463, "epoch": 4653} {"train_loss": -7.21049690246582, "global_step": 195464, "epoch": 4653} {"train_loss": -7.167062759399414, "global_step": 195465, "epoch": 4653} {"train_loss": -7.2266106605529785, "global_step": 195466, "epoch": 4653} {"train_loss": -7.195591915221441, "global_step": 195467, "epoch": 4653, "val_loss": 69055.3984375} {"train_loss": -7.168664455413818, "global_step": 195468, "epoch": 4654} {"train_loss": -7.220162391662598, "global_step": 195469, "epoch": 4654} {"train_loss": -7.277225971221924, "global_step": 195470, "epoch": 4654} {"train_loss": -7.280929088592529, "global_step": 195471, "epoch": 4654} {"train_loss": -7.215648651123047, "global_step": 195472, "epoch": 4654} {"train_loss": -7.249648571014404, "global_step": 195473, "epoch": 4654} {"train_loss": -7.186027526855469, "global_step": 195474, "epoch": 4654} {"train_loss": -7.170369625091553, "global_step": 195475, "epoch": 4654} {"train_loss": -7.159411430358887, "global_step": 195476, "epoch": 4654} {"train_loss": -7.209364891052246, "global_step": 195477, "epoch": 4654} {"train_loss": -7.2256693840026855, "global_step": 195478, "epoch": 4654} {"train_loss": -7.108161926269531, "global_step": 195479, "epoch": 4654} {"train_loss": -7.137918472290039, "global_step": 195480, "epoch": 4654} {"train_loss": -7.224126815795898, "global_step": 195481, "epoch": 4654} {"train_loss": -7.19254207611084, "global_step": 195482, "epoch": 4654} {"train_loss": -7.243284225463867, "global_step": 195483, "epoch": 4654} {"train_loss": -7.168846130371094, "global_step": 195484, "epoch": 4654} {"train_loss": -7.183890342712402, "global_step": 195485, "epoch": 4654} {"train_loss": -7.173413276672363, "global_step": 195486, "epoch": 4654} {"train_loss": -7.286203384399414, "global_step": 195487, "epoch": 4654} {"train_loss": -7.234163284301758, "global_step": 195488, "epoch": 4654} {"train_loss": -7.214561462402344, "global_step": 195489, "epoch": 4654} {"train_loss": -7.203032493591309, "global_step": 195490, "epoch": 4654} {"train_loss": -7.330565452575684, "global_step": 195491, "epoch": 4654} {"train_loss": -7.140743255615234, "global_step": 195492, "epoch": 4654} {"train_loss": -7.372231483459473, "global_step": 195493, "epoch": 4654} {"train_loss": -7.211658477783203, "global_step": 195494, "epoch": 4654} {"train_loss": -7.2367634773254395, "global_step": 195495, "epoch": 4654} {"train_loss": -7.281105041503906, "global_step": 195496, "epoch": 4654} {"train_loss": -7.100511074066162, "global_step": 195497, "epoch": 4654} {"train_loss": -7.0868330001831055, "global_step": 195498, "epoch": 4654} {"train_loss": -7.231368064880371, "global_step": 195499, "epoch": 4654} {"train_loss": -7.151899814605713, "global_step": 195500, "epoch": 4654} {"train_loss": -7.138484954833984, "global_step": 195501, "epoch": 4654} {"train_loss": -7.111101150512695, "global_step": 195502, "epoch": 4654} {"train_loss": -7.059530258178711, "global_step": 195503, "epoch": 4654} {"train_loss": -7.118533611297607, "global_step": 195504, "epoch": 4654} {"train_loss": -7.0910964012146, "global_step": 195505, "epoch": 4654} {"train_loss": -7.115818500518799, "global_step": 195506, "epoch": 4654} {"train_loss": -7.083799839019775, "global_step": 195507, "epoch": 4654} {"train_loss": -7.217174530029297, "global_step": 195508, "epoch": 4654} {"train_loss": -7.190193357921782, "global_step": 195509, "epoch": 4654, "val_loss": 68956.3203125} {"train_loss": -7.167276382446289, "global_step": 195510, "epoch": 4655} {"train_loss": -7.132442474365234, "global_step": 195511, "epoch": 4655} {"train_loss": -7.168854713439941, "global_step": 195512, "epoch": 4655} {"train_loss": -7.125456809997559, "global_step": 195513, "epoch": 4655} {"train_loss": -7.074577331542969, "global_step": 195514, "epoch": 4655} {"train_loss": -7.098012924194336, "global_step": 195515, "epoch": 4655} {"train_loss": -7.0282392501831055, "global_step": 195516, "epoch": 4655} {"train_loss": -7.053400993347168, "global_step": 195517, "epoch": 4655} {"train_loss": -7.137338638305664, "global_step": 195518, "epoch": 4655} {"train_loss": -7.100221633911133, "global_step": 195519, "epoch": 4655} {"train_loss": -7.137429237365723, "global_step": 195520, "epoch": 4655} {"train_loss": -6.823285102844238, "global_step": 195521, "epoch": 4655} {"train_loss": -7.172307014465332, "global_step": 195522, "epoch": 4655} {"train_loss": -7.143599033355713, "global_step": 195523, "epoch": 4655} {"train_loss": -6.992034912109375, "global_step": 195524, "epoch": 4655} {"train_loss": -7.083340167999268, "global_step": 195525, "epoch": 4655} {"train_loss": -6.967700958251953, "global_step": 195526, "epoch": 4655} {"train_loss": -7.102300643920898, "global_step": 195527, "epoch": 4655} {"train_loss": -7.069445610046387, "global_step": 195528, "epoch": 4655} {"train_loss": -7.184238910675049, "global_step": 195529, "epoch": 4655} {"train_loss": -7.137065887451172, "global_step": 195530, "epoch": 4655} {"train_loss": -7.128184795379639, "global_step": 195531, "epoch": 4655} {"train_loss": -7.173809051513672, "global_step": 195532, "epoch": 4655} {"train_loss": -7.0551886558532715, "global_step": 195533, "epoch": 4655} {"train_loss": -7.123553276062012, "global_step": 195534, "epoch": 4655} {"train_loss": -7.10407829284668, "global_step": 195535, "epoch": 4655} {"train_loss": -7.038333415985107, "global_step": 195536, "epoch": 4655} {"train_loss": -7.24550724029541, "global_step": 195537, "epoch": 4655} {"train_loss": -7.145997524261475, "global_step": 195538, "epoch": 4655} {"train_loss": -7.154038429260254, "global_step": 195539, "epoch": 4655} {"train_loss": -7.095373153686523, "global_step": 195540, "epoch": 4655} {"train_loss": -7.250100135803223, "global_step": 195541, "epoch": 4655} {"train_loss": -7.255391597747803, "global_step": 195542, "epoch": 4655} {"train_loss": -7.1597514152526855, "global_step": 195543, "epoch": 4655} {"train_loss": -7.131402015686035, "global_step": 195544, "epoch": 4655} {"train_loss": -7.091255187988281, "global_step": 195545, "epoch": 4655} {"train_loss": -7.215385437011719, "global_step": 195546, "epoch": 4655} {"train_loss": -7.247196197509766, "global_step": 195547, "epoch": 4655} {"train_loss": -7.156129837036133, "global_step": 195548, "epoch": 4655} {"train_loss": -7.345597267150879, "global_step": 195549, "epoch": 4655} {"train_loss": -7.215888977050781, "global_step": 195550, "epoch": 4655} {"train_loss": -7.1298612867082864, "global_step": 195551, "epoch": 4655, "val_loss": 68992.59375} {"train_loss": -7.220280647277832, "global_step": 195552, "epoch": 4656} {"train_loss": -7.254802703857422, "global_step": 195553, "epoch": 4656} {"train_loss": -7.354218482971191, "global_step": 195554, "epoch": 4656} {"train_loss": -7.324892044067383, "global_step": 195555, "epoch": 4656} {"train_loss": -7.149560451507568, "global_step": 195556, "epoch": 4656} {"train_loss": -7.2290873527526855, "global_step": 195557, "epoch": 4656} {"train_loss": -7.201457977294922, "global_step": 195558, "epoch": 4656} {"train_loss": -7.145698070526123, "global_step": 195559, "epoch": 4656} {"train_loss": -7.159367561340332, "global_step": 195560, "epoch": 4656} {"train_loss": -7.21018123626709, "global_step": 195561, "epoch": 4656} {"train_loss": -7.188894271850586, "global_step": 195562, "epoch": 4656} {"train_loss": -7.12391996383667, "global_step": 195563, "epoch": 4656} {"train_loss": -7.2093610763549805, "global_step": 195564, "epoch": 4656} {"train_loss": -7.1280341148376465, "global_step": 195565, "epoch": 4656} {"train_loss": -6.984633922576904, "global_step": 195566, "epoch": 4656} {"train_loss": -7.244157791137695, "global_step": 195567, "epoch": 4656} {"train_loss": -7.169572830200195, "global_step": 195568, "epoch": 4656} {"train_loss": -7.081467628479004, "global_step": 195569, "epoch": 4656} {"train_loss": -7.272956848144531, "global_step": 195570, "epoch": 4656} {"train_loss": -7.052517890930176, "global_step": 195571, "epoch": 4656} {"train_loss": -7.1667680740356445, "global_step": 195572, "epoch": 4656} {"train_loss": -7.252742767333984, "global_step": 195573, "epoch": 4656} {"train_loss": -7.022830963134766, "global_step": 195574, "epoch": 4656} {"train_loss": -7.155728340148926, "global_step": 195575, "epoch": 4656} {"train_loss": -7.159389495849609, "global_step": 195576, "epoch": 4656} {"train_loss": -7.160066604614258, "global_step": 195577, "epoch": 4656} {"train_loss": -7.140953540802002, "global_step": 195578, "epoch": 4656} {"train_loss": -7.071418762207031, "global_step": 195579, "epoch": 4656} {"train_loss": -7.0384521484375, "global_step": 195580, "epoch": 4656} {"train_loss": -7.128251075744629, "global_step": 195581, "epoch": 4656} {"train_loss": -7.053373336791992, "global_step": 195582, "epoch": 4656} {"train_loss": -7.053117275238037, "global_step": 195583, "epoch": 4656} {"train_loss": -7.066535949707031, "global_step": 195584, "epoch": 4656} {"train_loss": -7.155463218688965, "global_step": 195585, "epoch": 4656} {"train_loss": -7.089107990264893, "global_step": 195586, "epoch": 4656} {"train_loss": -7.096386909484863, "global_step": 195587, "epoch": 4656} {"train_loss": -7.163102149963379, "global_step": 195588, "epoch": 4656} {"train_loss": -7.224849700927734, "global_step": 195589, "epoch": 4656} {"train_loss": -7.087310791015625, "global_step": 195590, "epoch": 4656} {"train_loss": -7.102694988250732, "global_step": 195591, "epoch": 4656} {"train_loss": -7.160449981689453, "global_step": 195592, "epoch": 4656} {"train_loss": -7.150871787752424, "global_step": 195593, "epoch": 4656, "val_loss": 68991.359375} {"train_loss": -7.220820426940918, "global_step": 195594, "epoch": 4657} {"train_loss": -7.085087776184082, "global_step": 195595, "epoch": 4657} {"train_loss": -7.208420276641846, "global_step": 195596, "epoch": 4657} {"train_loss": -7.024007320404053, "global_step": 195597, "epoch": 4657} {"train_loss": -7.159520149230957, "global_step": 195598, "epoch": 4657} {"train_loss": -7.164895057678223, "global_step": 195599, "epoch": 4657} {"train_loss": -7.11651611328125, "global_step": 195600, "epoch": 4657} {"train_loss": -7.255298614501953, "global_step": 195601, "epoch": 4657} {"train_loss": -7.310931205749512, "global_step": 195602, "epoch": 4657} {"train_loss": -7.263491630554199, "global_step": 195603, "epoch": 4657} {"train_loss": -7.312225341796875, "global_step": 195604, "epoch": 4657} {"train_loss": -7.223737716674805, "global_step": 195605, "epoch": 4657} {"train_loss": -7.239864826202393, "global_step": 195606, "epoch": 4657} {"train_loss": -7.254656791687012, "global_step": 195607, "epoch": 4657} {"train_loss": -7.175602436065674, "global_step": 195608, "epoch": 4657} {"train_loss": -7.170475482940674, "global_step": 195609, "epoch": 4657} {"train_loss": -7.275383949279785, "global_step": 195610, "epoch": 4657} {"train_loss": -7.243351936340332, "global_step": 195611, "epoch": 4657} {"train_loss": -7.300994873046875, "global_step": 195612, "epoch": 4657} {"train_loss": -7.1992506980896, "global_step": 195613, "epoch": 4657} {"train_loss": -7.259252548217773, "global_step": 195614, "epoch": 4657} {"train_loss": -7.370348930358887, "global_step": 195615, "epoch": 4657} {"train_loss": -7.216883659362793, "global_step": 195616, "epoch": 4657} {"train_loss": -7.3527512550354, "global_step": 195617, "epoch": 4657} {"train_loss": -7.1603288650512695, "global_step": 195618, "epoch": 4657} {"train_loss": -7.260382652282715, "global_step": 195619, "epoch": 4657} {"train_loss": -7.183149814605713, "global_step": 195620, "epoch": 4657} {"train_loss": -7.281083106994629, "global_step": 195621, "epoch": 4657} {"train_loss": -7.231326103210449, "global_step": 195622, "epoch": 4657} {"train_loss": -7.324779510498047, "global_step": 195623, "epoch": 4657} {"train_loss": -7.299478530883789, "global_step": 195624, "epoch": 4657} {"train_loss": -7.294855117797852, "global_step": 195625, "epoch": 4657} {"train_loss": -7.3926801681518555, "global_step": 195626, "epoch": 4657} {"train_loss": -7.354312896728516, "global_step": 195627, "epoch": 4657} {"train_loss": -7.255521297454834, "global_step": 195628, "epoch": 4657} {"train_loss": -7.2112274169921875, "global_step": 195629, "epoch": 4657} {"train_loss": -7.3498711585998535, "global_step": 195630, "epoch": 4657} {"train_loss": -7.121851921081543, "global_step": 195631, "epoch": 4657} {"train_loss": -7.242687702178955, "global_step": 195632, "epoch": 4657} {"train_loss": -7.3527936935424805, "global_step": 195633, "epoch": 4657} {"train_loss": -7.270229339599609, "global_step": 195634, "epoch": 4657} {"train_loss": -7.243699561981928, "global_step": 195635, "epoch": 4657, "val_loss": 69117.5078125} {"train_loss": -7.303953170776367, "global_step": 195636, "epoch": 4658} {"train_loss": -7.362790584564209, "global_step": 195637, "epoch": 4658} {"train_loss": -7.341069221496582, "global_step": 195638, "epoch": 4658} {"train_loss": -7.321915626525879, "global_step": 195639, "epoch": 4658} {"train_loss": -7.2011332511901855, "global_step": 195640, "epoch": 4658} {"train_loss": -7.308848857879639, "global_step": 195641, "epoch": 4658} {"train_loss": -7.202993869781494, "global_step": 195642, "epoch": 4658} {"train_loss": -7.2675933837890625, "global_step": 195643, "epoch": 4658} {"train_loss": -7.164633750915527, "global_step": 195644, "epoch": 4658} {"train_loss": -7.176946640014648, "global_step": 195645, "epoch": 4658} {"train_loss": -7.157488822937012, "global_step": 195646, "epoch": 4658} {"train_loss": -6.925750255584717, "global_step": 195647, "epoch": 4658} {"train_loss": -7.05294132232666, "global_step": 195648, "epoch": 4658} {"train_loss": -7.238897323608398, "global_step": 195649, "epoch": 4658} {"train_loss": -7.13546895980835, "global_step": 195650, "epoch": 4658} {"train_loss": -7.0414934158325195, "global_step": 195651, "epoch": 4658} {"train_loss": -6.981492042541504, "global_step": 195652, "epoch": 4658} {"train_loss": -7.013832092285156, "global_step": 195653, "epoch": 4658} {"train_loss": -7.0765767097473145, "global_step": 195654, "epoch": 4658} {"train_loss": -7.180306911468506, "global_step": 195655, "epoch": 4658} {"train_loss": -7.2395172119140625, "global_step": 195656, "epoch": 4658} {"train_loss": -7.171031951904297, "global_step": 195657, "epoch": 4658} {"train_loss": -7.17075252532959, "global_step": 195658, "epoch": 4658} {"train_loss": -7.115305423736572, "global_step": 195659, "epoch": 4658} {"train_loss": -7.106143474578857, "global_step": 195660, "epoch": 4658} {"train_loss": -7.097625732421875, "global_step": 195661, "epoch": 4658} {"train_loss": -7.225881576538086, "global_step": 195662, "epoch": 4658} {"train_loss": -7.092114448547363, "global_step": 195663, "epoch": 4658} {"train_loss": -6.977619647979736, "global_step": 195664, "epoch": 4658} {"train_loss": -7.0528564453125, "global_step": 195665, "epoch": 4658} {"train_loss": -6.783298969268799, "global_step": 195666, "epoch": 4658} {"train_loss": -7.065903663635254, "global_step": 195667, "epoch": 4658} {"train_loss": -7.027721405029297, "global_step": 195668, "epoch": 4658} {"train_loss": -7.1633992195129395, "global_step": 195669, "epoch": 4658} {"train_loss": -7.011441707611084, "global_step": 195670, "epoch": 4658} {"train_loss": -6.962480068206787, "global_step": 195671, "epoch": 4658} {"train_loss": -7.118515491485596, "global_step": 195672, "epoch": 4658} {"train_loss": -7.126656532287598, "global_step": 195673, "epoch": 4658} {"train_loss": -7.0511932373046875, "global_step": 195674, "epoch": 4658} {"train_loss": -7.1330976486206055, "global_step": 195675, "epoch": 4658} {"train_loss": -7.147303581237793, "global_step": 195676, "epoch": 4658} {"train_loss": -7.12831541470119, "global_step": 195677, "epoch": 4658, "val_loss": 69029.4921875} {"train_loss": -7.17799186706543, "global_step": 195678, "epoch": 4659} {"train_loss": -7.127334117889404, "global_step": 195679, "epoch": 4659} {"train_loss": -7.33328914642334, "global_step": 195680, "epoch": 4659} {"train_loss": -7.170528411865234, "global_step": 195681, "epoch": 4659} {"train_loss": -7.192440032958984, "global_step": 195682, "epoch": 4659} {"train_loss": -7.115044116973877, "global_step": 195683, "epoch": 4659} {"train_loss": -7.152878284454346, "global_step": 195684, "epoch": 4659} {"train_loss": -7.137580394744873, "global_step": 195685, "epoch": 4659} {"train_loss": -7.200230598449707, "global_step": 195686, "epoch": 4659} {"train_loss": -7.320993423461914, "global_step": 195687, "epoch": 4659} {"train_loss": -7.238894462585449, "global_step": 195688, "epoch": 4659} {"train_loss": -7.1531081199646, "global_step": 195689, "epoch": 4659} {"train_loss": -7.170168399810791, "global_step": 195690, "epoch": 4659} {"train_loss": -7.219837188720703, "global_step": 195691, "epoch": 4659} {"train_loss": -7.26317024230957, "global_step": 195692, "epoch": 4659} {"train_loss": -7.188597679138184, "global_step": 195693, "epoch": 4659} {"train_loss": -7.141110897064209, "global_step": 195694, "epoch": 4659} {"train_loss": -6.985203742980957, "global_step": 195695, "epoch": 4659} {"train_loss": -7.232964515686035, "global_step": 195696, "epoch": 4659} {"train_loss": -7.27299165725708, "global_step": 195697, "epoch": 4659} {"train_loss": -7.261669158935547, "global_step": 195698, "epoch": 4659} {"train_loss": -7.264467239379883, "global_step": 195699, "epoch": 4659} {"train_loss": -7.159911155700684, "global_step": 195700, "epoch": 4659} {"train_loss": -7.038658142089844, "global_step": 195701, "epoch": 4659} {"train_loss": -7.129485130310059, "global_step": 195702, "epoch": 4659} {"train_loss": -7.133254051208496, "global_step": 195703, "epoch": 4659} {"train_loss": -7.222959995269775, "global_step": 195704, "epoch": 4659} {"train_loss": -7.258370399475098, "global_step": 195705, "epoch": 4659} {"train_loss": -7.158835411071777, "global_step": 195706, "epoch": 4659} {"train_loss": -7.178590774536133, "global_step": 195707, "epoch": 4659} {"train_loss": -7.142697334289551, "global_step": 195708, "epoch": 4659} {"train_loss": -6.981654167175293, "global_step": 195709, "epoch": 4659} {"train_loss": -7.300922393798828, "global_step": 195710, "epoch": 4659} {"train_loss": -6.964942932128906, "global_step": 195711, "epoch": 4659} {"train_loss": -7.044207572937012, "global_step": 195712, "epoch": 4659} {"train_loss": -7.095694541931152, "global_step": 195713, "epoch": 4659} {"train_loss": -7.033864974975586, "global_step": 195714, "epoch": 4659} {"train_loss": -7.0320329666137695, "global_step": 195715, "epoch": 4659} {"train_loss": -7.067159652709961, "global_step": 195716, "epoch": 4659} {"train_loss": -7.055269241333008, "global_step": 195717, "epoch": 4659} {"train_loss": -7.019852161407471, "global_step": 195718, "epoch": 4659} {"train_loss": -7.153296981539045, "global_step": 195719, "epoch": 4659, "val_loss": 68806.3046875} {"train_loss": -6.98942756652832, "global_step": 195720, "epoch": 4660} {"train_loss": -7.158409595489502, "global_step": 195721, "epoch": 4660} {"train_loss": -7.136091709136963, "global_step": 195722, "epoch": 4660} {"train_loss": -7.19057035446167, "global_step": 195723, "epoch": 4660} {"train_loss": -7.153907775878906, "global_step": 195724, "epoch": 4660} {"train_loss": -7.105116844177246, "global_step": 195725, "epoch": 4660} {"train_loss": -7.153353691101074, "global_step": 195726, "epoch": 4660} {"train_loss": -7.160679340362549, "global_step": 195727, "epoch": 4660} {"train_loss": -7.1407270431518555, "global_step": 195728, "epoch": 4660} {"train_loss": -7.070038795471191, "global_step": 195729, "epoch": 4660} {"train_loss": -7.128045082092285, "global_step": 195730, "epoch": 4660} {"train_loss": -7.224456787109375, "global_step": 195731, "epoch": 4660} {"train_loss": -7.257925033569336, "global_step": 195732, "epoch": 4660} {"train_loss": -7.1988630294799805, "global_step": 195733, "epoch": 4660} {"train_loss": -7.3154401779174805, "global_step": 195734, "epoch": 4660} {"train_loss": -7.105718612670898, "global_step": 195735, "epoch": 4660} {"train_loss": -7.114264011383057, "global_step": 195736, "epoch": 4660} {"train_loss": -7.250400066375732, "global_step": 195737, "epoch": 4660} {"train_loss": -7.304937362670898, "global_step": 195738, "epoch": 4660} {"train_loss": -7.24250602722168, "global_step": 195739, "epoch": 4660} {"train_loss": -7.101487159729004, "global_step": 195740, "epoch": 4660} {"train_loss": -7.270105361938477, "global_step": 195741, "epoch": 4660} {"train_loss": -7.180537700653076, "global_step": 195742, "epoch": 4660} {"train_loss": -7.224760055541992, "global_step": 195743, "epoch": 4660} {"train_loss": -7.241510391235352, "global_step": 195744, "epoch": 4660} {"train_loss": -7.258898735046387, "global_step": 195745, "epoch": 4660} {"train_loss": -7.19724178314209, "global_step": 195746, "epoch": 4660} {"train_loss": -7.265196800231934, "global_step": 195747, "epoch": 4660} {"train_loss": -7.253361225128174, "global_step": 195748, "epoch": 4660} {"train_loss": -7.277589797973633, "global_step": 195749, "epoch": 4660} {"train_loss": -7.281944274902344, "global_step": 195750, "epoch": 4660} {"train_loss": -7.22108268737793, "global_step": 195751, "epoch": 4660} {"train_loss": -7.308934688568115, "global_step": 195752, "epoch": 4660} {"train_loss": -7.248067855834961, "global_step": 195753, "epoch": 4660} {"train_loss": -7.214147567749023, "global_step": 195754, "epoch": 4660} {"train_loss": -7.277585029602051, "global_step": 195755, "epoch": 4660} {"train_loss": -7.309879302978516, "global_step": 195756, "epoch": 4660} {"train_loss": -7.237281799316406, "global_step": 195757, "epoch": 4660} {"train_loss": -7.207313537597656, "global_step": 195758, "epoch": 4660} {"train_loss": -7.2510881423950195, "global_step": 195759, "epoch": 4660} {"train_loss": -7.236472129821777, "global_step": 195760, "epoch": 4660} {"train_loss": -7.208725293477376, "global_step": 195761, "epoch": 4660, "val_loss": 68916.8515625} {"train_loss": -7.3140788078308105, "global_step": 195762, "epoch": 4661} {"train_loss": -7.279956817626953, "global_step": 195763, "epoch": 4661} {"train_loss": -7.385702133178711, "global_step": 195764, "epoch": 4661} {"train_loss": -7.274790287017822, "global_step": 195765, "epoch": 4661} {"train_loss": -7.321926116943359, "global_step": 195766, "epoch": 4661} {"train_loss": -7.223224639892578, "global_step": 195767, "epoch": 4661} {"train_loss": -7.3802361488342285, "global_step": 195768, "epoch": 4661} {"train_loss": -7.206156253814697, "global_step": 195769, "epoch": 4661} {"train_loss": -7.26862907409668, "global_step": 195770, "epoch": 4661} {"train_loss": -7.304898262023926, "global_step": 195771, "epoch": 4661} {"train_loss": -7.228847503662109, "global_step": 195772, "epoch": 4661} {"train_loss": -7.295886993408203, "global_step": 195773, "epoch": 4661} {"train_loss": -7.167939186096191, "global_step": 195774, "epoch": 4661} {"train_loss": -7.249877452850342, "global_step": 195775, "epoch": 4661} {"train_loss": -7.142867088317871, "global_step": 195776, "epoch": 4661} {"train_loss": -7.094566822052002, "global_step": 195777, "epoch": 4661} {"train_loss": -7.2913994789123535, "global_step": 195778, "epoch": 4661} {"train_loss": -7.1737565994262695, "global_step": 195779, "epoch": 4661} {"train_loss": -7.155613422393799, "global_step": 195780, "epoch": 4661} {"train_loss": -7.233519077301025, "global_step": 195781, "epoch": 4661} {"train_loss": -7.2042236328125, "global_step": 195782, "epoch": 4661} {"train_loss": -7.07265043258667, "global_step": 195783, "epoch": 4661} {"train_loss": -7.124487400054932, "global_step": 195784, "epoch": 4661} {"train_loss": -7.241662979125977, "global_step": 195785, "epoch": 4661} {"train_loss": -7.293498992919922, "global_step": 195786, "epoch": 4661} {"train_loss": -7.254237651824951, "global_step": 195787, "epoch": 4661} {"train_loss": -7.225354194641113, "global_step": 195788, "epoch": 4661} {"train_loss": -7.216978549957275, "global_step": 195789, "epoch": 4661} {"train_loss": -7.228729248046875, "global_step": 195790, "epoch": 4661} {"train_loss": -7.138289451599121, "global_step": 195791, "epoch": 4661} {"train_loss": -7.23233699798584, "global_step": 195792, "epoch": 4661} {"train_loss": -7.28324031829834, "global_step": 195793, "epoch": 4661} {"train_loss": -7.237372875213623, "global_step": 195794, "epoch": 4661} {"train_loss": -7.300555229187012, "global_step": 195795, "epoch": 4661} {"train_loss": -7.0710039138793945, "global_step": 195796, "epoch": 4661} {"train_loss": -7.208313941955566, "global_step": 195797, "epoch": 4661} {"train_loss": -7.203995704650879, "global_step": 195798, "epoch": 4661} {"train_loss": -7.234825134277344, "global_step": 195799, "epoch": 4661} {"train_loss": -7.164035797119141, "global_step": 195800, "epoch": 4661} {"train_loss": -7.1491241455078125, "global_step": 195801, "epoch": 4661} {"train_loss": -7.090435028076172, "global_step": 195802, "epoch": 4661} {"train_loss": -7.222759746369862, "global_step": 195803, "epoch": 4661, "val_loss": 69099.59375} {"train_loss": -7.131767272949219, "global_step": 195804, "epoch": 4662} {"train_loss": -7.0590500831604, "global_step": 195805, "epoch": 4662} {"train_loss": -7.160859107971191, "global_step": 195806, "epoch": 4662} {"train_loss": -7.181362628936768, "global_step": 195807, "epoch": 4662} {"train_loss": -7.358258247375488, "global_step": 195808, "epoch": 4662} {"train_loss": -7.267748832702637, "global_step": 195809, "epoch": 4662} {"train_loss": -7.193146705627441, "global_step": 195810, "epoch": 4662} {"train_loss": -7.2721757888793945, "global_step": 195811, "epoch": 4662} {"train_loss": -7.375332832336426, "global_step": 195812, "epoch": 4662} {"train_loss": -7.209193229675293, "global_step": 195813, "epoch": 4662} {"train_loss": -7.315657615661621, "global_step": 195814, "epoch": 4662} {"train_loss": -7.29285192489624, "global_step": 195815, "epoch": 4662} {"train_loss": -7.20154333114624, "global_step": 195816, "epoch": 4662} {"train_loss": -7.217036247253418, "global_step": 195817, "epoch": 4662} {"train_loss": -7.256125450134277, "global_step": 195818, "epoch": 4662} {"train_loss": -7.214789867401123, "global_step": 195819, "epoch": 4662} {"train_loss": -7.318826675415039, "global_step": 195820, "epoch": 4662} {"train_loss": -7.189416885375977, "global_step": 195821, "epoch": 4662} {"train_loss": -7.17086124420166, "global_step": 195822, "epoch": 4662} {"train_loss": -7.226459980010986, "global_step": 195823, "epoch": 4662} {"train_loss": -7.246862411499023, "global_step": 195824, "epoch": 4662} {"train_loss": -7.320769309997559, "global_step": 195825, "epoch": 4662} {"train_loss": -7.22615385055542, "global_step": 195826, "epoch": 4662} {"train_loss": -7.300395488739014, "global_step": 195827, "epoch": 4662} {"train_loss": -7.224659442901611, "global_step": 195828, "epoch": 4662} {"train_loss": -7.321198463439941, "global_step": 195829, "epoch": 4662} {"train_loss": -7.184072494506836, "global_step": 195830, "epoch": 4662} {"train_loss": -7.3252458572387695, "global_step": 195831, "epoch": 4662} {"train_loss": -7.244321823120117, "global_step": 195832, "epoch": 4662} {"train_loss": -7.210315704345703, "global_step": 195833, "epoch": 4662} {"train_loss": -7.156661033630371, "global_step": 195834, "epoch": 4662} {"train_loss": -7.146871566772461, "global_step": 195835, "epoch": 4662} {"train_loss": -7.222949981689453, "global_step": 195836, "epoch": 4662} {"train_loss": -7.198607921600342, "global_step": 195837, "epoch": 4662} {"train_loss": -7.257718563079834, "global_step": 195838, "epoch": 4662} {"train_loss": -7.330484390258789, "global_step": 195839, "epoch": 4662} {"train_loss": -7.30781364440918, "global_step": 195840, "epoch": 4662} {"train_loss": -7.325893402099609, "global_step": 195841, "epoch": 4662} {"train_loss": -7.382572174072266, "global_step": 195842, "epoch": 4662} {"train_loss": -7.287668704986572, "global_step": 195843, "epoch": 4662} {"train_loss": -7.222989082336426, "global_step": 195844, "epoch": 4662} {"train_loss": -7.244377783366612, "global_step": 195845, "epoch": 4662, "val_loss": 69031.4375} {"train_loss": -7.212639331817627, "global_step": 195846, "epoch": 4663} {"train_loss": -7.236503601074219, "global_step": 195847, "epoch": 4663} {"train_loss": -7.265589237213135, "global_step": 195848, "epoch": 4663} {"train_loss": -7.365147590637207, "global_step": 195849, "epoch": 4663} {"train_loss": -7.267575263977051, "global_step": 195850, "epoch": 4663} {"train_loss": -7.175207138061523, "global_step": 195851, "epoch": 4663} {"train_loss": -7.188150882720947, "global_step": 195852, "epoch": 4663} {"train_loss": -7.18893575668335, "global_step": 195853, "epoch": 4663} {"train_loss": -7.254653453826904, "global_step": 195854, "epoch": 4663} {"train_loss": -7.269061088562012, "global_step": 195855, "epoch": 4663} {"train_loss": -7.102466106414795, "global_step": 195856, "epoch": 4663} {"train_loss": -7.1721601486206055, "global_step": 195857, "epoch": 4663} {"train_loss": -7.194283485412598, "global_step": 195858, "epoch": 4663} {"train_loss": -7.339214324951172, "global_step": 195859, "epoch": 4663} {"train_loss": -7.133309841156006, "global_step": 195860, "epoch": 4663} {"train_loss": -7.231171607971191, "global_step": 195861, "epoch": 4663} {"train_loss": -7.217611789703369, "global_step": 195862, "epoch": 4663} {"train_loss": -7.206821441650391, "global_step": 195863, "epoch": 4663} {"train_loss": -7.086307525634766, "global_step": 195864, "epoch": 4663} {"train_loss": -7.144050598144531, "global_step": 195865, "epoch": 4663} {"train_loss": -7.243494510650635, "global_step": 195866, "epoch": 4663} {"train_loss": -7.157663345336914, "global_step": 195867, "epoch": 4663} {"train_loss": -7.157319068908691, "global_step": 195868, "epoch": 4663} {"train_loss": -7.155113220214844, "global_step": 195869, "epoch": 4663} {"train_loss": -7.1954169273376465, "global_step": 195870, "epoch": 4663} {"train_loss": -7.109938621520996, "global_step": 195871, "epoch": 4663} {"train_loss": -7.241667747497559, "global_step": 195872, "epoch": 4663} {"train_loss": -7.161799430847168, "global_step": 195873, "epoch": 4663} {"train_loss": -7.180988311767578, "global_step": 195874, "epoch": 4663} {"train_loss": -7.239229202270508, "global_step": 195875, "epoch": 4663} {"train_loss": -7.185988426208496, "global_step": 195876, "epoch": 4663} {"train_loss": -7.089824676513672, "global_step": 195877, "epoch": 4663} {"train_loss": -7.099930286407471, "global_step": 195878, "epoch": 4663} {"train_loss": -7.089439392089844, "global_step": 195879, "epoch": 4663} {"train_loss": -7.108761787414551, "global_step": 195880, "epoch": 4663} {"train_loss": -7.179001808166504, "global_step": 195881, "epoch": 4663} {"train_loss": -6.997349739074707, "global_step": 195882, "epoch": 4663} {"train_loss": -7.149106502532959, "global_step": 195883, "epoch": 4663} {"train_loss": -7.198068141937256, "global_step": 195884, "epoch": 4663} {"train_loss": -7.153522968292236, "global_step": 195885, "epoch": 4663} {"train_loss": -7.14284610748291, "global_step": 195886, "epoch": 4663} {"train_loss": -7.182488123575847, "global_step": 195887, "epoch": 4663, "val_loss": 69086.28125} {"train_loss": -7.141268730163574, "global_step": 195888, "epoch": 4664} {"train_loss": -7.157257556915283, "global_step": 195889, "epoch": 4664} {"train_loss": -7.192116737365723, "global_step": 195890, "epoch": 4664} {"train_loss": -7.047186374664307, "global_step": 195891, "epoch": 4664} {"train_loss": -7.030879020690918, "global_step": 195892, "epoch": 4664} {"train_loss": -7.034372806549072, "global_step": 195893, "epoch": 4664} {"train_loss": -7.167669296264648, "global_step": 195894, "epoch": 4664} {"train_loss": -7.092667579650879, "global_step": 195895, "epoch": 4664} {"train_loss": -7.020061492919922, "global_step": 195896, "epoch": 4664} {"train_loss": -7.06455135345459, "global_step": 195897, "epoch": 4664} {"train_loss": -7.034959316253662, "global_step": 195898, "epoch": 4664} {"train_loss": -7.047525405883789, "global_step": 195899, "epoch": 4664} {"train_loss": -7.133600234985352, "global_step": 195900, "epoch": 4664} {"train_loss": -7.020019054412842, "global_step": 195901, "epoch": 4664} {"train_loss": -7.161648750305176, "global_step": 195902, "epoch": 4664} {"train_loss": -7.074524402618408, "global_step": 195903, "epoch": 4664} {"train_loss": -7.168137550354004, "global_step": 195904, "epoch": 4664} {"train_loss": -7.005774974822998, "global_step": 195905, "epoch": 4664} {"train_loss": -7.095816612243652, "global_step": 195906, "epoch": 4664} {"train_loss": -7.122161865234375, "global_step": 195907, "epoch": 4664} {"train_loss": -7.06624174118042, "global_step": 195908, "epoch": 4664} {"train_loss": -7.2038068771362305, "global_step": 195909, "epoch": 4664} {"train_loss": -7.141695499420166, "global_step": 195910, "epoch": 4664} {"train_loss": -7.05422306060791, "global_step": 195911, "epoch": 4664} {"train_loss": -7.060327529907227, "global_step": 195912, "epoch": 4664} {"train_loss": -7.036019325256348, "global_step": 195913, "epoch": 4664} {"train_loss": -7.146946430206299, "global_step": 195914, "epoch": 4664} {"train_loss": -7.125984191894531, "global_step": 195915, "epoch": 4664} {"train_loss": -7.024541854858398, "global_step": 195916, "epoch": 4664} {"train_loss": -7.030461311340332, "global_step": 195917, "epoch": 4664} {"train_loss": -7.221899509429932, "global_step": 195918, "epoch": 4664} {"train_loss": -7.11965274810791, "global_step": 195919, "epoch": 4664} {"train_loss": -7.0791730880737305, "global_step": 195920, "epoch": 4664} {"train_loss": -7.140002727508545, "global_step": 195921, "epoch": 4664} {"train_loss": -7.138639450073242, "global_step": 195922, "epoch": 4664} {"train_loss": -7.102397918701172, "global_step": 195923, "epoch": 4664} {"train_loss": -7.155807971954346, "global_step": 195924, "epoch": 4664} {"train_loss": -7.118083477020264, "global_step": 195925, "epoch": 4664} {"train_loss": -7.193506240844727, "global_step": 195926, "epoch": 4664} {"train_loss": -7.229348182678223, "global_step": 195927, "epoch": 4664} {"train_loss": -7.316396236419678, "global_step": 195928, "epoch": 4664} {"train_loss": -7.112038056055705, "global_step": 195929, "epoch": 4664, "val_loss": 69127.109375} {"train_loss": -7.1046013832092285, "global_step": 195930, "epoch": 4665} {"train_loss": -7.169760227203369, "global_step": 195931, "epoch": 4665} {"train_loss": -6.942899703979492, "global_step": 195932, "epoch": 4665} {"train_loss": -7.216930866241455, "global_step": 195933, "epoch": 4665} {"train_loss": -7.019134521484375, "global_step": 195934, "epoch": 4665} {"train_loss": -7.171343803405762, "global_step": 195935, "epoch": 4665} {"train_loss": -7.085383892059326, "global_step": 195936, "epoch": 4665} {"train_loss": -7.05713415145874, "global_step": 195937, "epoch": 4665} {"train_loss": -7.201249122619629, "global_step": 195938, "epoch": 4665} {"train_loss": -7.127081394195557, "global_step": 195939, "epoch": 4665} {"train_loss": -7.11482048034668, "global_step": 195940, "epoch": 4665} {"train_loss": -7.023475646972656, "global_step": 195941, "epoch": 4665} {"train_loss": -7.044009208679199, "global_step": 195942, "epoch": 4665} {"train_loss": -7.0915985107421875, "global_step": 195943, "epoch": 4665} {"train_loss": -7.1570329666137695, "global_step": 195944, "epoch": 4665} {"train_loss": -7.1606950759887695, "global_step": 195945, "epoch": 4665} {"train_loss": -7.2357330322265625, "global_step": 195946, "epoch": 4665} {"train_loss": -7.122439384460449, "global_step": 195947, "epoch": 4665} {"train_loss": -7.133535385131836, "global_step": 195948, "epoch": 4665} {"train_loss": -7.098812103271484, "global_step": 195949, "epoch": 4665} {"train_loss": -7.192352294921875, "global_step": 195950, "epoch": 4665} {"train_loss": -7.143798828125, "global_step": 195951, "epoch": 4665} {"train_loss": -7.1832804679870605, "global_step": 195952, "epoch": 4665} {"train_loss": -7.124982833862305, "global_step": 195953, "epoch": 4665} {"train_loss": -7.090261936187744, "global_step": 195954, "epoch": 4665} {"train_loss": -7.232980728149414, "global_step": 195955, "epoch": 4665} {"train_loss": -7.069106101989746, "global_step": 195956, "epoch": 4665} {"train_loss": -7.107743263244629, "global_step": 195957, "epoch": 4665} {"train_loss": -7.152367115020752, "global_step": 195958, "epoch": 4665} {"train_loss": -7.21073055267334, "global_step": 195959, "epoch": 4665} {"train_loss": -7.09554386138916, "global_step": 195960, "epoch": 4665} {"train_loss": -7.094165802001953, "global_step": 195961, "epoch": 4665} {"train_loss": -7.058848857879639, "global_step": 195962, "epoch": 4665} {"train_loss": -7.1331706047058105, "global_step": 195963, "epoch": 4665} {"train_loss": -7.047873497009277, "global_step": 195964, "epoch": 4665} {"train_loss": -7.121574878692627, "global_step": 195965, "epoch": 4665} {"train_loss": -7.1082563400268555, "global_step": 195966, "epoch": 4665} {"train_loss": -7.132415771484375, "global_step": 195967, "epoch": 4665} {"train_loss": -7.126548767089844, "global_step": 195968, "epoch": 4665} {"train_loss": -7.088174819946289, "global_step": 195969, "epoch": 4665} {"train_loss": -7.212275505065918, "global_step": 195970, "epoch": 4665} {"train_loss": -7.121858335676647, "global_step": 195971, "epoch": 4665, "val_loss": 68932.3046875} {"train_loss": -7.123001575469971, "global_step": 195972, "epoch": 4666} {"train_loss": -7.224571704864502, "global_step": 195973, "epoch": 4666} {"train_loss": -7.123652458190918, "global_step": 195974, "epoch": 4666} {"train_loss": -7.138479232788086, "global_step": 195975, "epoch": 4666} {"train_loss": -7.231574535369873, "global_step": 195976, "epoch": 4666} {"train_loss": -7.104968070983887, "global_step": 195977, "epoch": 4666} {"train_loss": -7.267093181610107, "global_step": 195978, "epoch": 4666} {"train_loss": -7.159220218658447, "global_step": 195979, "epoch": 4666} {"train_loss": -7.194096565246582, "global_step": 195980, "epoch": 4666} {"train_loss": -7.176117897033691, "global_step": 195981, "epoch": 4666} {"train_loss": -7.124993801116943, "global_step": 195982, "epoch": 4666} {"train_loss": -7.167301177978516, "global_step": 195983, "epoch": 4666} {"train_loss": -7.324377059936523, "global_step": 195984, "epoch": 4666} {"train_loss": -7.21071720123291, "global_step": 195985, "epoch": 4666} {"train_loss": -7.232705593109131, "global_step": 195986, "epoch": 4666} {"train_loss": -7.040574550628662, "global_step": 195987, "epoch": 4666} {"train_loss": -7.266633033752441, "global_step": 195988, "epoch": 4666} {"train_loss": -7.162389755249023, "global_step": 195989, "epoch": 4666} {"train_loss": -7.261944770812988, "global_step": 195990, "epoch": 4666} {"train_loss": -7.201015472412109, "global_step": 195991, "epoch": 4666} {"train_loss": -7.1454644203186035, "global_step": 195992, "epoch": 4666} {"train_loss": -7.224957466125488, "global_step": 195993, "epoch": 4666} {"train_loss": -7.208148002624512, "global_step": 195994, "epoch": 4666} {"train_loss": -7.224870681762695, "global_step": 195995, "epoch": 4666} {"train_loss": -7.30288553237915, "global_step": 195996, "epoch": 4666} {"train_loss": -7.234428405761719, "global_step": 195997, "epoch": 4666} {"train_loss": -7.240810871124268, "global_step": 195998, "epoch": 4666} {"train_loss": -7.31038236618042, "global_step": 195999, "epoch": 4666} {"train_loss": -7.320375442504883, "global_step": 196000, "epoch": 4666} {"train_loss": -7.249878883361816, "global_step": 196001, "epoch": 4666} {"train_loss": -7.258810043334961, "global_step": 196002, "epoch": 4666} {"train_loss": -7.1445417404174805, "global_step": 196003, "epoch": 4666} {"train_loss": -7.218416690826416, "global_step": 196004, "epoch": 4666} {"train_loss": -7.199374198913574, "global_step": 196005, "epoch": 4666} {"train_loss": -7.3179473876953125, "global_step": 196006, "epoch": 4666} {"train_loss": -7.365293502807617, "global_step": 196007, "epoch": 4666} {"train_loss": -7.215239524841309, "global_step": 196008, "epoch": 4666} {"train_loss": -7.154533386230469, "global_step": 196009, "epoch": 4666} {"train_loss": -7.275435447692871, "global_step": 196010, "epoch": 4666} {"train_loss": -7.149746417999268, "global_step": 196011, "epoch": 4666} {"train_loss": -7.291670799255371, "global_step": 196012, "epoch": 4666} {"train_loss": -7.215427194322858, "global_step": 196013, "epoch": 4666, "val_loss": 68865.4609375} {"train_loss": -7.136598587036133, "global_step": 196014, "epoch": 4667} {"train_loss": -7.213388442993164, "global_step": 196015, "epoch": 4667} {"train_loss": -7.302457332611084, "global_step": 196016, "epoch": 4667} {"train_loss": -7.10073184967041, "global_step": 196017, "epoch": 4667} {"train_loss": -7.31497049331665, "global_step": 196018, "epoch": 4667} {"train_loss": -7.099654674530029, "global_step": 196019, "epoch": 4667} {"train_loss": -7.286656856536865, "global_step": 196020, "epoch": 4667} {"train_loss": -7.287067890167236, "global_step": 196021, "epoch": 4667} {"train_loss": -7.260887622833252, "global_step": 196022, "epoch": 4667} {"train_loss": -7.275633335113525, "global_step": 196023, "epoch": 4667} {"train_loss": -7.3229546546936035, "global_step": 196024, "epoch": 4667} {"train_loss": -7.219922065734863, "global_step": 196025, "epoch": 4667} {"train_loss": -7.145158290863037, "global_step": 196026, "epoch": 4667} {"train_loss": -7.251347541809082, "global_step": 196027, "epoch": 4667} {"train_loss": -7.275867938995361, "global_step": 196028, "epoch": 4667} {"train_loss": -7.316404342651367, "global_step": 196029, "epoch": 4667} {"train_loss": -7.2386274337768555, "global_step": 196030, "epoch": 4667} {"train_loss": -7.260087013244629, "global_step": 196031, "epoch": 4667} {"train_loss": -7.150130271911621, "global_step": 196032, "epoch": 4667} {"train_loss": -7.245594024658203, "global_step": 196033, "epoch": 4667} {"train_loss": -7.217337608337402, "global_step": 196034, "epoch": 4667} {"train_loss": -7.191773414611816, "global_step": 196035, "epoch": 4667} {"train_loss": -7.159550666809082, "global_step": 196036, "epoch": 4667} {"train_loss": -7.156236171722412, "global_step": 196037, "epoch": 4667} {"train_loss": -7.074261665344238, "global_step": 196038, "epoch": 4667} {"train_loss": -7.083086967468262, "global_step": 196039, "epoch": 4667} {"train_loss": -7.264631748199463, "global_step": 196040, "epoch": 4667} {"train_loss": -7.297903060913086, "global_step": 196041, "epoch": 4667} {"train_loss": -7.209987640380859, "global_step": 196042, "epoch": 4667} {"train_loss": -7.12466287612915, "global_step": 196043, "epoch": 4667} {"train_loss": -7.1862945556640625, "global_step": 196044, "epoch": 4667} {"train_loss": -7.224090576171875, "global_step": 196045, "epoch": 4667} {"train_loss": -7.038661479949951, "global_step": 196046, "epoch": 4667} {"train_loss": -7.164145469665527, "global_step": 196047, "epoch": 4667} {"train_loss": -7.250840187072754, "global_step": 196048, "epoch": 4667} {"train_loss": -7.248553276062012, "global_step": 196049, "epoch": 4667} {"train_loss": -7.175302505493164, "global_step": 196050, "epoch": 4667} {"train_loss": -7.145751953125, "global_step": 196051, "epoch": 4667} {"train_loss": -7.016851425170898, "global_step": 196052, "epoch": 4667} {"train_loss": -7.225609302520752, "global_step": 196053, "epoch": 4667} {"train_loss": -7.104686260223389, "global_step": 196054, "epoch": 4667} {"train_loss": -7.1938487348102385, "global_step": 196055, "epoch": 4667, "val_loss": 69142.640625} {"train_loss": -7.159157752990723, "global_step": 196056, "epoch": 4668} {"train_loss": -7.065211772918701, "global_step": 196057, "epoch": 4668} {"train_loss": -7.098236083984375, "global_step": 196058, "epoch": 4668} {"train_loss": -7.087856292724609, "global_step": 196059, "epoch": 4668} {"train_loss": -7.118047714233398, "global_step": 196060, "epoch": 4668} {"train_loss": -7.173900604248047, "global_step": 196061, "epoch": 4668} {"train_loss": -7.065732955932617, "global_step": 196062, "epoch": 4668} {"train_loss": -7.150739669799805, "global_step": 196063, "epoch": 4668} {"train_loss": -6.923939228057861, "global_step": 196064, "epoch": 4668} {"train_loss": -7.07048225402832, "global_step": 196065, "epoch": 4668} {"train_loss": -7.079230785369873, "global_step": 196066, "epoch": 4668} {"train_loss": -6.8322601318359375, "global_step": 196067, "epoch": 4668} {"train_loss": -7.2533063888549805, "global_step": 196068, "epoch": 4668} {"train_loss": -6.981666564941406, "global_step": 196069, "epoch": 4668} {"train_loss": -6.923774719238281, "global_step": 196070, "epoch": 4668} {"train_loss": -6.981115341186523, "global_step": 196071, "epoch": 4668} {"train_loss": -6.945448875427246, "global_step": 196072, "epoch": 4668} {"train_loss": -7.0886945724487305, "global_step": 196073, "epoch": 4668} {"train_loss": -6.976524353027344, "global_step": 196074, "epoch": 4668} {"train_loss": -7.083970546722412, "global_step": 196075, "epoch": 4668} {"train_loss": -6.916234016418457, "global_step": 196076, "epoch": 4668} {"train_loss": -7.154099464416504, "global_step": 196077, "epoch": 4668} {"train_loss": -6.9819488525390625, "global_step": 196078, "epoch": 4668} {"train_loss": -7.078359603881836, "global_step": 196079, "epoch": 4668} {"train_loss": -6.92432165145874, "global_step": 196080, "epoch": 4668} {"train_loss": -7.085879802703857, "global_step": 196081, "epoch": 4668} {"train_loss": -6.826559066772461, "global_step": 196082, "epoch": 4668} {"train_loss": -7.051680564880371, "global_step": 196083, "epoch": 4668} {"train_loss": -7.111042499542236, "global_step": 196084, "epoch": 4668} {"train_loss": -7.0967607498168945, "global_step": 196085, "epoch": 4668} {"train_loss": -6.979757308959961, "global_step": 196086, "epoch": 4668} {"train_loss": -7.112706184387207, "global_step": 196087, "epoch": 4668} {"train_loss": -7.034229755401611, "global_step": 196088, "epoch": 4668} {"train_loss": -7.100974082946777, "global_step": 196089, "epoch": 4668} {"train_loss": -7.110864162445068, "global_step": 196090, "epoch": 4668} {"train_loss": -7.236237525939941, "global_step": 196091, "epoch": 4668} {"train_loss": -7.120340347290039, "global_step": 196092, "epoch": 4668} {"train_loss": -7.127326965332031, "global_step": 196093, "epoch": 4668} {"train_loss": -7.212525367736816, "global_step": 196094, "epoch": 4668} {"train_loss": -7.18006706237793, "global_step": 196095, "epoch": 4668} {"train_loss": -7.234826564788818, "global_step": 196096, "epoch": 4668} {"train_loss": -7.066709711438134, "global_step": 196097, "epoch": 4668, "val_loss": 68926.703125} {"train_loss": -7.069750785827637, "global_step": 196098, "epoch": 4669} {"train_loss": -7.213168144226074, "global_step": 196099, "epoch": 4669} {"train_loss": -7.2066144943237305, "global_step": 196100, "epoch": 4669} {"train_loss": -7.317667007446289, "global_step": 196101, "epoch": 4669} {"train_loss": -7.179856300354004, "global_step": 196102, "epoch": 4669} {"train_loss": -7.147291660308838, "global_step": 196103, "epoch": 4669} {"train_loss": -7.175762176513672, "global_step": 196104, "epoch": 4669} {"train_loss": -7.199373722076416, "global_step": 196105, "epoch": 4669} {"train_loss": -7.346334457397461, "global_step": 196106, "epoch": 4669} {"train_loss": -7.221932411193848, "global_step": 196107, "epoch": 4669} {"train_loss": -7.127690315246582, "global_step": 196108, "epoch": 4669} {"train_loss": -7.168397903442383, "global_step": 196109, "epoch": 4669} {"train_loss": -7.277029037475586, "global_step": 196110, "epoch": 4669} {"train_loss": -7.310581684112549, "global_step": 196111, "epoch": 4669} {"train_loss": -7.072097301483154, "global_step": 196112, "epoch": 4669} {"train_loss": -7.293295860290527, "global_step": 196113, "epoch": 4669} {"train_loss": -7.258359909057617, "global_step": 196114, "epoch": 4669} {"train_loss": -7.101734161376953, "global_step": 196115, "epoch": 4669} {"train_loss": -7.236210346221924, "global_step": 196116, "epoch": 4669} {"train_loss": -7.2142720222473145, "global_step": 196117, "epoch": 4669} {"train_loss": -7.126368522644043, "global_step": 196118, "epoch": 4669} {"train_loss": -7.203794479370117, "global_step": 196119, "epoch": 4669} {"train_loss": -7.229437828063965, "global_step": 196120, "epoch": 4669} {"train_loss": -7.259576320648193, "global_step": 196121, "epoch": 4669} {"train_loss": -7.1559739112854, "global_step": 196122, "epoch": 4669} {"train_loss": -7.260842323303223, "global_step": 196123, "epoch": 4669} {"train_loss": -7.354732990264893, "global_step": 196124, "epoch": 4669} {"train_loss": -7.09518575668335, "global_step": 196125, "epoch": 4669} {"train_loss": -7.154099464416504, "global_step": 196126, "epoch": 4669} {"train_loss": -7.230188369750977, "global_step": 196127, "epoch": 4669} {"train_loss": -7.157822132110596, "global_step": 196128, "epoch": 4669} {"train_loss": -7.287353515625, "global_step": 196129, "epoch": 4669} {"train_loss": -7.447823524475098, "global_step": 196130, "epoch": 4669} {"train_loss": -7.26827335357666, "global_step": 196131, "epoch": 4669} {"train_loss": -7.2428436279296875, "global_step": 196132, "epoch": 4669} {"train_loss": -7.151124954223633, "global_step": 196133, "epoch": 4669} {"train_loss": -7.231668472290039, "global_step": 196134, "epoch": 4669} {"train_loss": -7.215387344360352, "global_step": 196135, "epoch": 4669} {"train_loss": -7.2147016525268555, "global_step": 196136, "epoch": 4669} {"train_loss": -7.269944190979004, "global_step": 196137, "epoch": 4669} {"train_loss": -7.38565731048584, "global_step": 196138, "epoch": 4669} {"train_loss": -7.22154104141962, "global_step": 196139, "epoch": 4669, "val_loss": 68916.3984375} {"train_loss": -7.267568588256836, "global_step": 196140, "epoch": 4670} {"train_loss": -7.333083152770996, "global_step": 196141, "epoch": 4670} {"train_loss": -7.322571754455566, "global_step": 196142, "epoch": 4670} {"train_loss": -7.212570667266846, "global_step": 196143, "epoch": 4670} {"train_loss": -7.25954532623291, "global_step": 196144, "epoch": 4670} {"train_loss": -7.224483966827393, "global_step": 196145, "epoch": 4670} {"train_loss": -7.328784942626953, "global_step": 196146, "epoch": 4670} {"train_loss": -7.277618408203125, "global_step": 196147, "epoch": 4670} {"train_loss": -7.322493553161621, "global_step": 196148, "epoch": 4670} {"train_loss": -7.2177414894104, "global_step": 196149, "epoch": 4670} {"train_loss": -7.135915756225586, "global_step": 196150, "epoch": 4670} {"train_loss": -7.250417232513428, "global_step": 196151, "epoch": 4670} {"train_loss": -7.215493202209473, "global_step": 196152, "epoch": 4670} {"train_loss": -7.27260684967041, "global_step": 196153, "epoch": 4670} {"train_loss": -7.233486652374268, "global_step": 196154, "epoch": 4670} {"train_loss": -7.314018726348877, "global_step": 196155, "epoch": 4670} {"train_loss": -7.221482276916504, "global_step": 196156, "epoch": 4670} {"train_loss": -7.172603607177734, "global_step": 196157, "epoch": 4670} {"train_loss": -7.035678386688232, "global_step": 196158, "epoch": 4670} {"train_loss": -7.096492767333984, "global_step": 196159, "epoch": 4670} {"train_loss": -7.144621849060059, "global_step": 196160, "epoch": 4670} {"train_loss": -7.283733367919922, "global_step": 196161, "epoch": 4670} {"train_loss": -7.339540481567383, "global_step": 196162, "epoch": 4670} {"train_loss": -7.16230583190918, "global_step": 196163, "epoch": 4670} {"train_loss": -7.358389854431152, "global_step": 196164, "epoch": 4670} {"train_loss": -7.2428364753723145, "global_step": 196165, "epoch": 4670} {"train_loss": -7.261754512786865, "global_step": 196166, "epoch": 4670} {"train_loss": -7.192258358001709, "global_step": 196167, "epoch": 4670} {"train_loss": -7.168212890625, "global_step": 196168, "epoch": 4670} {"train_loss": -7.255140781402588, "global_step": 196169, "epoch": 4670} {"train_loss": -7.226789951324463, "global_step": 196170, "epoch": 4670} {"train_loss": -7.325941562652588, "global_step": 196171, "epoch": 4670} {"train_loss": -7.257338523864746, "global_step": 196172, "epoch": 4670} {"train_loss": -7.0863189697265625, "global_step": 196173, "epoch": 4670} {"train_loss": -7.139665603637695, "global_step": 196174, "epoch": 4670} {"train_loss": -7.195388317108154, "global_step": 196175, "epoch": 4670} {"train_loss": -7.1800384521484375, "global_step": 196176, "epoch": 4670} {"train_loss": -7.284506797790527, "global_step": 196177, "epoch": 4670} {"train_loss": -7.080348968505859, "global_step": 196178, "epoch": 4670} {"train_loss": -7.1678466796875, "global_step": 196179, "epoch": 4670} {"train_loss": -7.171430587768555, "global_step": 196180, "epoch": 4670} {"train_loss": -7.2256158874148415, "global_step": 196181, "epoch": 4670, "val_loss": 69019.359375} {"train_loss": -7.122349739074707, "global_step": 196182, "epoch": 4671} {"train_loss": -7.204805850982666, "global_step": 196183, "epoch": 4671} {"train_loss": -7.320010185241699, "global_step": 196184, "epoch": 4671} {"train_loss": -7.333436965942383, "global_step": 196185, "epoch": 4671} {"train_loss": -7.220155715942383, "global_step": 196186, "epoch": 4671} {"train_loss": -7.274020195007324, "global_step": 196187, "epoch": 4671} {"train_loss": -7.31282901763916, "global_step": 196188, "epoch": 4671} {"train_loss": -7.215004920959473, "global_step": 196189, "epoch": 4671} {"train_loss": -7.180417537689209, "global_step": 196190, "epoch": 4671} {"train_loss": -7.212398529052734, "global_step": 196191, "epoch": 4671} {"train_loss": -7.097384929656982, "global_step": 196192, "epoch": 4671} {"train_loss": -7.148794174194336, "global_step": 196193, "epoch": 4671} {"train_loss": -7.139051914215088, "global_step": 196194, "epoch": 4671} {"train_loss": -7.1439924240112305, "global_step": 196195, "epoch": 4671} {"train_loss": -7.218197822570801, "global_step": 196196, "epoch": 4671} {"train_loss": -7.224034309387207, "global_step": 196197, "epoch": 4671} {"train_loss": -7.2408447265625, "global_step": 196198, "epoch": 4671} {"train_loss": -7.280021667480469, "global_step": 196199, "epoch": 4671} {"train_loss": -7.21677303314209, "global_step": 196200, "epoch": 4671} {"train_loss": -7.211025238037109, "global_step": 196201, "epoch": 4671} {"train_loss": -7.23894739151001, "global_step": 196202, "epoch": 4671} {"train_loss": -7.354116439819336, "global_step": 196203, "epoch": 4671} {"train_loss": -7.203131675720215, "global_step": 196204, "epoch": 4671} {"train_loss": -7.125602722167969, "global_step": 196205, "epoch": 4671} {"train_loss": -7.291713714599609, "global_step": 196206, "epoch": 4671} {"train_loss": -7.239832878112793, "global_step": 196207, "epoch": 4671} {"train_loss": -7.2303314208984375, "global_step": 196208, "epoch": 4671} {"train_loss": -7.325322151184082, "global_step": 196209, "epoch": 4671} {"train_loss": -7.263596534729004, "global_step": 196210, "epoch": 4671} {"train_loss": -7.2689690589904785, "global_step": 196211, "epoch": 4671} {"train_loss": -7.106017112731934, "global_step": 196212, "epoch": 4671} {"train_loss": -7.162292003631592, "global_step": 196213, "epoch": 4671} {"train_loss": -7.113951683044434, "global_step": 196214, "epoch": 4671} {"train_loss": -7.238238334655762, "global_step": 196215, "epoch": 4671} {"train_loss": -7.302218437194824, "global_step": 196216, "epoch": 4671} {"train_loss": -6.9747772216796875, "global_step": 196217, "epoch": 4671} {"train_loss": -7.126877307891846, "global_step": 196218, "epoch": 4671} {"train_loss": -7.09794807434082, "global_step": 196219, "epoch": 4671} {"train_loss": -6.968940734863281, "global_step": 196220, "epoch": 4671} {"train_loss": -7.173955917358398, "global_step": 196221, "epoch": 4671} {"train_loss": -7.093562126159668, "global_step": 196222, "epoch": 4671} {"train_loss": -7.1989423888070245, "global_step": 196223, "epoch": 4671, "val_loss": 68919.5390625} {"train_loss": -7.230785369873047, "global_step": 196224, "epoch": 4672} {"train_loss": -7.106995582580566, "global_step": 196225, "epoch": 4672} {"train_loss": -7.246087074279785, "global_step": 196226, "epoch": 4672} {"train_loss": -7.156776428222656, "global_step": 196227, "epoch": 4672} {"train_loss": -7.11994743347168, "global_step": 196228, "epoch": 4672} {"train_loss": -7.196099281311035, "global_step": 196229, "epoch": 4672} {"train_loss": -7.064401626586914, "global_step": 196230, "epoch": 4672} {"train_loss": -7.186047077178955, "global_step": 196231, "epoch": 4672} {"train_loss": -7.118475437164307, "global_step": 196232, "epoch": 4672} {"train_loss": -7.123996257781982, "global_step": 196233, "epoch": 4672} {"train_loss": -7.104687690734863, "global_step": 196234, "epoch": 4672} {"train_loss": -7.033343315124512, "global_step": 196235, "epoch": 4672} {"train_loss": -7.26943302154541, "global_step": 196236, "epoch": 4672} {"train_loss": -6.906315326690674, "global_step": 196237, "epoch": 4672} {"train_loss": -7.222771644592285, "global_step": 196238, "epoch": 4672} {"train_loss": -7.169962406158447, "global_step": 196239, "epoch": 4672} {"train_loss": -7.140101432800293, "global_step": 196240, "epoch": 4672} {"train_loss": -7.189226150512695, "global_step": 196241, "epoch": 4672} {"train_loss": -7.057808876037598, "global_step": 196242, "epoch": 4672} {"train_loss": -7.1820759773254395, "global_step": 196243, "epoch": 4672} {"train_loss": -7.222386360168457, "global_step": 196244, "epoch": 4672} {"train_loss": -7.217735290527344, "global_step": 196245, "epoch": 4672} {"train_loss": -7.247560501098633, "global_step": 196246, "epoch": 4672} {"train_loss": -7.240871906280518, "global_step": 196247, "epoch": 4672} {"train_loss": -7.266464710235596, "global_step": 196248, "epoch": 4672} {"train_loss": -7.12265682220459, "global_step": 196249, "epoch": 4672} {"train_loss": -7.185086250305176, "global_step": 196250, "epoch": 4672} {"train_loss": -7.269519805908203, "global_step": 196251, "epoch": 4672} {"train_loss": -7.158617973327637, "global_step": 196252, "epoch": 4672} {"train_loss": -7.223433494567871, "global_step": 196253, "epoch": 4672} {"train_loss": -7.201783180236816, "global_step": 196254, "epoch": 4672} {"train_loss": -7.229881286621094, "global_step": 196255, "epoch": 4672} {"train_loss": -7.177908897399902, "global_step": 196256, "epoch": 4672} {"train_loss": -7.173724174499512, "global_step": 196257, "epoch": 4672} {"train_loss": -7.189515113830566, "global_step": 196258, "epoch": 4672} {"train_loss": -6.961286544799805, "global_step": 196259, "epoch": 4672} {"train_loss": -7.1943817138671875, "global_step": 196260, "epoch": 4672} {"train_loss": -7.2911906242370605, "global_step": 196261, "epoch": 4672} {"train_loss": -7.071255683898926, "global_step": 196262, "epoch": 4672} {"train_loss": -7.127399444580078, "global_step": 196263, "epoch": 4672} {"train_loss": -7.187555313110352, "global_step": 196264, "epoch": 4672} {"train_loss": -7.163377818607149, "global_step": 196265, "epoch": 4672, "val_loss": 69041.4921875} {"train_loss": -7.197728157043457, "global_step": 196266, "epoch": 4673} {"train_loss": -7.219462871551514, "global_step": 196267, "epoch": 4673} {"train_loss": -7.229374885559082, "global_step": 196268, "epoch": 4673} {"train_loss": -7.19997501373291, "global_step": 196269, "epoch": 4673} {"train_loss": -7.152024745941162, "global_step": 196270, "epoch": 4673} {"train_loss": -7.238971710205078, "global_step": 196271, "epoch": 4673} {"train_loss": -7.206377029418945, "global_step": 196272, "epoch": 4673} {"train_loss": -7.202975273132324, "global_step": 196273, "epoch": 4673} {"train_loss": -7.304880619049072, "global_step": 196274, "epoch": 4673} {"train_loss": -7.217759132385254, "global_step": 196275, "epoch": 4673} {"train_loss": -7.142364501953125, "global_step": 196276, "epoch": 4673} {"train_loss": -7.344684600830078, "global_step": 196277, "epoch": 4673} {"train_loss": -7.317444324493408, "global_step": 196278, "epoch": 4673} {"train_loss": -7.125665664672852, "global_step": 196279, "epoch": 4673} {"train_loss": -7.310118675231934, "global_step": 196280, "epoch": 4673} {"train_loss": -7.332540512084961, "global_step": 196281, "epoch": 4673} {"train_loss": -7.227574825286865, "global_step": 196282, "epoch": 4673} {"train_loss": -7.224443435668945, "global_step": 196283, "epoch": 4673} {"train_loss": -7.256171226501465, "global_step": 196284, "epoch": 4673} {"train_loss": -7.408669948577881, "global_step": 196285, "epoch": 4673} {"train_loss": -7.169257640838623, "global_step": 196286, "epoch": 4673} {"train_loss": -7.2905120849609375, "global_step": 196287, "epoch": 4673} {"train_loss": -7.230009078979492, "global_step": 196288, "epoch": 4673} {"train_loss": -7.166463375091553, "global_step": 196289, "epoch": 4673} {"train_loss": -7.224583148956299, "global_step": 196290, "epoch": 4673} {"train_loss": -7.236740589141846, "global_step": 196291, "epoch": 4673} {"train_loss": -7.363391876220703, "global_step": 196292, "epoch": 4673} {"train_loss": -7.382142066955566, "global_step": 196293, "epoch": 4673} {"train_loss": -7.29921817779541, "global_step": 196294, "epoch": 4673} {"train_loss": -7.269176959991455, "global_step": 196295, "epoch": 4673} {"train_loss": -7.203348159790039, "global_step": 196296, "epoch": 4673} {"train_loss": -7.236952781677246, "global_step": 196297, "epoch": 4673} {"train_loss": -7.1812028884887695, "global_step": 196298, "epoch": 4673} {"train_loss": -7.313624382019043, "global_step": 196299, "epoch": 4673} {"train_loss": -7.351665496826172, "global_step": 196300, "epoch": 4673} {"train_loss": -7.211419105529785, "global_step": 196301, "epoch": 4673} {"train_loss": -7.319401264190674, "global_step": 196302, "epoch": 4673} {"train_loss": -7.295336723327637, "global_step": 196303, "epoch": 4673} {"train_loss": -7.222550868988037, "global_step": 196304, "epoch": 4673} {"train_loss": -7.211183547973633, "global_step": 196305, "epoch": 4673} {"train_loss": -7.237943649291992, "global_step": 196306, "epoch": 4673} {"train_loss": -7.251086848122733, "global_step": 196307, "epoch": 4673, "val_loss": 68961.5546875} {"train_loss": -7.207542896270752, "global_step": 196308, "epoch": 4674} {"train_loss": -7.283919811248779, "global_step": 196309, "epoch": 4674} {"train_loss": -7.251228332519531, "global_step": 196310, "epoch": 4674} {"train_loss": -7.17349100112915, "global_step": 196311, "epoch": 4674} {"train_loss": -7.092801570892334, "global_step": 196312, "epoch": 4674} {"train_loss": -7.199449062347412, "global_step": 196313, "epoch": 4674} {"train_loss": -7.242844581604004, "global_step": 196314, "epoch": 4674} {"train_loss": -7.052653789520264, "global_step": 196315, "epoch": 4674} {"train_loss": -7.231368541717529, "global_step": 196316, "epoch": 4674} {"train_loss": -7.204267978668213, "global_step": 196317, "epoch": 4674} {"train_loss": -7.006967544555664, "global_step": 196318, "epoch": 4674} {"train_loss": -7.092455863952637, "global_step": 196319, "epoch": 4674} {"train_loss": -7.1546525955200195, "global_step": 196320, "epoch": 4674} {"train_loss": -6.944186687469482, "global_step": 196321, "epoch": 4674} {"train_loss": -6.955116271972656, "global_step": 196322, "epoch": 4674} {"train_loss": -7.243809223175049, "global_step": 196323, "epoch": 4674} {"train_loss": -6.8564887046813965, "global_step": 196324, "epoch": 4674} {"train_loss": -7.1150221824646, "global_step": 196325, "epoch": 4674} {"train_loss": -7.077630996704102, "global_step": 196326, "epoch": 4674} {"train_loss": -6.944823265075684, "global_step": 196327, "epoch": 4674} {"train_loss": -7.047780990600586, "global_step": 196328, "epoch": 4674} {"train_loss": -6.904621124267578, "global_step": 196329, "epoch": 4674} {"train_loss": -6.9631781578063965, "global_step": 196330, "epoch": 4674} {"train_loss": -7.0632123947143555, "global_step": 196331, "epoch": 4674} {"train_loss": -6.859100818634033, "global_step": 196332, "epoch": 4674} {"train_loss": -7.016084671020508, "global_step": 196333, "epoch": 4674} {"train_loss": -7.066869735717773, "global_step": 196334, "epoch": 4674} {"train_loss": -7.006012916564941, "global_step": 196335, "epoch": 4674} {"train_loss": -7.058588981628418, "global_step": 196336, "epoch": 4674} {"train_loss": -7.0903215408325195, "global_step": 196337, "epoch": 4674} {"train_loss": -7.010573863983154, "global_step": 196338, "epoch": 4674} {"train_loss": -7.080687046051025, "global_step": 196339, "epoch": 4674} {"train_loss": -7.04924201965332, "global_step": 196340, "epoch": 4674} {"train_loss": -7.008658409118652, "global_step": 196341, "epoch": 4674} {"train_loss": -7.142868518829346, "global_step": 196342, "epoch": 4674} {"train_loss": -7.211247444152832, "global_step": 196343, "epoch": 4674} {"train_loss": -7.138625144958496, "global_step": 196344, "epoch": 4674} {"train_loss": -7.144732475280762, "global_step": 196345, "epoch": 4674} {"train_loss": -7.117356777191162, "global_step": 196346, "epoch": 4674} {"train_loss": -7.068492889404297, "global_step": 196347, "epoch": 4674} {"train_loss": -7.115540027618408, "global_step": 196348, "epoch": 4674} {"train_loss": -7.083203531446911, "global_step": 196349, "epoch": 4674, "val_loss": 68945.6484375} {"train_loss": -7.070110321044922, "global_step": 196350, "epoch": 4675} {"train_loss": -6.9490814208984375, "global_step": 196351, "epoch": 4675} {"train_loss": -7.104856491088867, "global_step": 196352, "epoch": 4675} {"train_loss": -7.011362552642822, "global_step": 196353, "epoch": 4675} {"train_loss": -7.129176139831543, "global_step": 196354, "epoch": 4675} {"train_loss": -6.921602249145508, "global_step": 196355, "epoch": 4675} {"train_loss": -6.999850273132324, "global_step": 196356, "epoch": 4675} {"train_loss": -7.079770565032959, "global_step": 196357, "epoch": 4675} {"train_loss": -7.011662483215332, "global_step": 196358, "epoch": 4675} {"train_loss": -7.1262969970703125, "global_step": 196359, "epoch": 4675} {"train_loss": -7.124402046203613, "global_step": 196360, "epoch": 4675} {"train_loss": -7.151215553283691, "global_step": 196361, "epoch": 4675} {"train_loss": -7.230367183685303, "global_step": 196362, "epoch": 4675} {"train_loss": -7.149211883544922, "global_step": 196363, "epoch": 4675} {"train_loss": -7.216224193572998, "global_step": 196364, "epoch": 4675} {"train_loss": -7.200707912445068, "global_step": 196365, "epoch": 4675} {"train_loss": -7.217995643615723, "global_step": 196366, "epoch": 4675} {"train_loss": -7.050809860229492, "global_step": 196367, "epoch": 4675} {"train_loss": -7.1331000328063965, "global_step": 196368, "epoch": 4675} {"train_loss": -7.025651454925537, "global_step": 196369, "epoch": 4675} {"train_loss": -7.2060394287109375, "global_step": 196370, "epoch": 4675} {"train_loss": -7.253890037536621, "global_step": 196371, "epoch": 4675} {"train_loss": -7.145322799682617, "global_step": 196372, "epoch": 4675} {"train_loss": -7.2623748779296875, "global_step": 196373, "epoch": 4675} {"train_loss": -7.1938018798828125, "global_step": 196374, "epoch": 4675} {"train_loss": -7.289649963378906, "global_step": 196375, "epoch": 4675} {"train_loss": -7.214385032653809, "global_step": 196376, "epoch": 4675} {"train_loss": -7.181950569152832, "global_step": 196377, "epoch": 4675} {"train_loss": -7.2077531814575195, "global_step": 196378, "epoch": 4675} {"train_loss": -7.24868106842041, "global_step": 196379, "epoch": 4675} {"train_loss": -7.173651695251465, "global_step": 196380, "epoch": 4675} {"train_loss": -7.2342681884765625, "global_step": 196381, "epoch": 4675} {"train_loss": -7.173300743103027, "global_step": 196382, "epoch": 4675} {"train_loss": -7.266270637512207, "global_step": 196383, "epoch": 4675} {"train_loss": -7.186176300048828, "global_step": 196384, "epoch": 4675} {"train_loss": -7.222150802612305, "global_step": 196385, "epoch": 4675} {"train_loss": -7.137600898742676, "global_step": 196386, "epoch": 4675} {"train_loss": -7.158584117889404, "global_step": 196387, "epoch": 4675} {"train_loss": -7.122376918792725, "global_step": 196388, "epoch": 4675} {"train_loss": -7.256686687469482, "global_step": 196389, "epoch": 4675} {"train_loss": -7.278711795806885, "global_step": 196390, "epoch": 4675} {"train_loss": -7.155758585248675, "global_step": 196391, "epoch": 4675, "val_loss": 68996.9375} {"train_loss": -7.361936569213867, "global_step": 196392, "epoch": 4676} {"train_loss": -7.207358360290527, "global_step": 196393, "epoch": 4676} {"train_loss": -7.266356468200684, "global_step": 196394, "epoch": 4676} {"train_loss": -7.154044151306152, "global_step": 196395, "epoch": 4676} {"train_loss": -7.162867546081543, "global_step": 196396, "epoch": 4676} {"train_loss": -7.175484657287598, "global_step": 196397, "epoch": 4676} {"train_loss": -7.153927326202393, "global_step": 196398, "epoch": 4676} {"train_loss": -7.194431304931641, "global_step": 196399, "epoch": 4676} {"train_loss": -7.319011688232422, "global_step": 196400, "epoch": 4676} {"train_loss": -7.299124717712402, "global_step": 196401, "epoch": 4676} {"train_loss": -7.185633659362793, "global_step": 196402, "epoch": 4676} {"train_loss": -7.2559709548950195, "global_step": 196403, "epoch": 4676} {"train_loss": -7.199153900146484, "global_step": 196404, "epoch": 4676} {"train_loss": -7.293222427368164, "global_step": 196405, "epoch": 4676} {"train_loss": -7.305180072784424, "global_step": 196406, "epoch": 4676} {"train_loss": -7.242627143859863, "global_step": 196407, "epoch": 4676} {"train_loss": -7.241938591003418, "global_step": 196408, "epoch": 4676} {"train_loss": -7.281747817993164, "global_step": 196409, "epoch": 4676} {"train_loss": -7.287863731384277, "global_step": 196410, "epoch": 4676} {"train_loss": -7.313458442687988, "global_step": 196411, "epoch": 4676} {"train_loss": -7.222513675689697, "global_step": 196412, "epoch": 4676} {"train_loss": -7.267642974853516, "global_step": 196413, "epoch": 4676} {"train_loss": -7.176077842712402, "global_step": 196414, "epoch": 4676} {"train_loss": -7.243274688720703, "global_step": 196415, "epoch": 4676} {"train_loss": -7.160707473754883, "global_step": 196416, "epoch": 4676} {"train_loss": -7.156249523162842, "global_step": 196417, "epoch": 4676} {"train_loss": -7.233977317810059, "global_step": 196418, "epoch": 4676} {"train_loss": -7.140242576599121, "global_step": 196419, "epoch": 4676} {"train_loss": -7.137689590454102, "global_step": 196420, "epoch": 4676} {"train_loss": -7.244715690612793, "global_step": 196421, "epoch": 4676} {"train_loss": -7.0647454261779785, "global_step": 196422, "epoch": 4676} {"train_loss": -6.95063591003418, "global_step": 196423, "epoch": 4676} {"train_loss": -7.148543357849121, "global_step": 196424, "epoch": 4676} {"train_loss": -7.072731018066406, "global_step": 196425, "epoch": 4676} {"train_loss": -7.179566383361816, "global_step": 196426, "epoch": 4676} {"train_loss": -7.133394718170166, "global_step": 196427, "epoch": 4676} {"train_loss": -7.172817707061768, "global_step": 196428, "epoch": 4676} {"train_loss": -7.192248821258545, "global_step": 196429, "epoch": 4676} {"train_loss": -7.165711879730225, "global_step": 196430, "epoch": 4676} {"train_loss": -7.27867317199707, "global_step": 196431, "epoch": 4676} {"train_loss": -7.166644096374512, "global_step": 196432, "epoch": 4676} {"train_loss": -7.203339508601597, "global_step": 196433, "epoch": 4676, "val_loss": 69243.2265625} {"train_loss": -7.244809627532959, "global_step": 196434, "epoch": 4677} {"train_loss": -7.241519451141357, "global_step": 196435, "epoch": 4677} {"train_loss": -7.1740264892578125, "global_step": 196436, "epoch": 4677} {"train_loss": -7.200920104980469, "global_step": 196437, "epoch": 4677} {"train_loss": -7.217429161071777, "global_step": 196438, "epoch": 4677} {"train_loss": -7.267529487609863, "global_step": 196439, "epoch": 4677} {"train_loss": -7.260490417480469, "global_step": 196440, "epoch": 4677} {"train_loss": -7.272356986999512, "global_step": 196441, "epoch": 4677} {"train_loss": -7.174966812133789, "global_step": 196442, "epoch": 4677} {"train_loss": -7.266117095947266, "global_step": 196443, "epoch": 4677} {"train_loss": -7.295627593994141, "global_step": 196444, "epoch": 4677} {"train_loss": -7.208327770233154, "global_step": 196445, "epoch": 4677} {"train_loss": -7.1058197021484375, "global_step": 196446, "epoch": 4677} {"train_loss": -7.149544715881348, "global_step": 196447, "epoch": 4677} {"train_loss": -7.208306312561035, "global_step": 196448, "epoch": 4677} {"train_loss": -7.043084144592285, "global_step": 196449, "epoch": 4677} {"train_loss": -7.161146640777588, "global_step": 196450, "epoch": 4677} {"train_loss": -7.135199069976807, "global_step": 196451, "epoch": 4677} {"train_loss": -7.1508684158325195, "global_step": 196452, "epoch": 4677} {"train_loss": -7.182032585144043, "global_step": 196453, "epoch": 4677} {"train_loss": -7.124087810516357, "global_step": 196454, "epoch": 4677} {"train_loss": -7.249183654785156, "global_step": 196455, "epoch": 4677} {"train_loss": -7.186126708984375, "global_step": 196456, "epoch": 4677} {"train_loss": -7.142239570617676, "global_step": 196457, "epoch": 4677} {"train_loss": -7.164982795715332, "global_step": 196458, "epoch": 4677} {"train_loss": -7.107728958129883, "global_step": 196459, "epoch": 4677} {"train_loss": -7.180915832519531, "global_step": 196460, "epoch": 4677} {"train_loss": -7.16888427734375, "global_step": 196461, "epoch": 4677} {"train_loss": -7.295165538787842, "global_step": 196462, "epoch": 4677} {"train_loss": -7.1267547607421875, "global_step": 196463, "epoch": 4677} {"train_loss": -7.227684020996094, "global_step": 196464, "epoch": 4677} {"train_loss": -7.138241767883301, "global_step": 196465, "epoch": 4677} {"train_loss": -7.192593574523926, "global_step": 196466, "epoch": 4677} {"train_loss": -7.25477933883667, "global_step": 196467, "epoch": 4677} {"train_loss": -7.193021297454834, "global_step": 196468, "epoch": 4677} {"train_loss": -7.212671756744385, "global_step": 196469, "epoch": 4677} {"train_loss": -7.101205825805664, "global_step": 196470, "epoch": 4677} {"train_loss": -7.23236608505249, "global_step": 196471, "epoch": 4677} {"train_loss": -7.192091464996338, "global_step": 196472, "epoch": 4677} {"train_loss": -7.131706714630127, "global_step": 196473, "epoch": 4677} {"train_loss": -7.187600135803223, "global_step": 196474, "epoch": 4677} {"train_loss": -7.187675214949108, "global_step": 196475, "epoch": 4677, "val_loss": 68997.96875} {"train_loss": -7.32960319519043, "global_step": 196476, "epoch": 4678} {"train_loss": -7.069082260131836, "global_step": 196477, "epoch": 4678} {"train_loss": -7.218051433563232, "global_step": 196478, "epoch": 4678} {"train_loss": -7.131221771240234, "global_step": 196479, "epoch": 4678} {"train_loss": -7.1505537033081055, "global_step": 196480, "epoch": 4678} {"train_loss": -7.115839004516602, "global_step": 196481, "epoch": 4678} {"train_loss": -7.204946994781494, "global_step": 196482, "epoch": 4678} {"train_loss": -7.207902431488037, "global_step": 196483, "epoch": 4678} {"train_loss": -7.134976387023926, "global_step": 196484, "epoch": 4678} {"train_loss": -7.140700340270996, "global_step": 196485, "epoch": 4678} {"train_loss": -7.185714244842529, "global_step": 196486, "epoch": 4678} {"train_loss": -7.228852272033691, "global_step": 196487, "epoch": 4678} {"train_loss": -7.04759407043457, "global_step": 196488, "epoch": 4678} {"train_loss": -7.25393009185791, "global_step": 196489, "epoch": 4678} {"train_loss": -7.213397026062012, "global_step": 196490, "epoch": 4678} {"train_loss": -7.18939208984375, "global_step": 196491, "epoch": 4678} {"train_loss": -7.124621391296387, "global_step": 196492, "epoch": 4678} {"train_loss": -7.1398162841796875, "global_step": 196493, "epoch": 4678} {"train_loss": -7.107875347137451, "global_step": 196494, "epoch": 4678} {"train_loss": -7.204479217529297, "global_step": 196495, "epoch": 4678} {"train_loss": -7.065891265869141, "global_step": 196496, "epoch": 4678} {"train_loss": -7.2027482986450195, "global_step": 196497, "epoch": 4678} {"train_loss": -7.196335315704346, "global_step": 196498, "epoch": 4678} {"train_loss": -7.323168754577637, "global_step": 196499, "epoch": 4678} {"train_loss": -7.071847438812256, "global_step": 196500, "epoch": 4678} {"train_loss": -7.206302642822266, "global_step": 196501, "epoch": 4678} {"train_loss": -7.211511135101318, "global_step": 196502, "epoch": 4678} {"train_loss": -7.29888916015625, "global_step": 196503, "epoch": 4678} {"train_loss": -7.241972923278809, "global_step": 196504, "epoch": 4678} {"train_loss": -7.2757744789123535, "global_step": 196505, "epoch": 4678} {"train_loss": -7.22182559967041, "global_step": 196506, "epoch": 4678} {"train_loss": -7.217073440551758, "global_step": 196507, "epoch": 4678} {"train_loss": -7.337299823760986, "global_step": 196508, "epoch": 4678} {"train_loss": -7.255215167999268, "global_step": 196509, "epoch": 4678} {"train_loss": -7.308206558227539, "global_step": 196510, "epoch": 4678} {"train_loss": -7.271226406097412, "global_step": 196511, "epoch": 4678} {"train_loss": -7.284395217895508, "global_step": 196512, "epoch": 4678} {"train_loss": -7.269237518310547, "global_step": 196513, "epoch": 4678} {"train_loss": -7.181265830993652, "global_step": 196514, "epoch": 4678} {"train_loss": -7.279661178588867, "global_step": 196515, "epoch": 4678} {"train_loss": -7.216571807861328, "global_step": 196516, "epoch": 4678} {"train_loss": -7.202710333324614, "global_step": 196517, "epoch": 4678, "val_loss": 69009.0546875} {"train_loss": -7.270410537719727, "global_step": 196518, "epoch": 4679} {"train_loss": -7.308728218078613, "global_step": 196519, "epoch": 4679} {"train_loss": -7.207953453063965, "global_step": 196520, "epoch": 4679} {"train_loss": -7.169229984283447, "global_step": 196521, "epoch": 4679} {"train_loss": -7.371889114379883, "global_step": 196522, "epoch": 4679} {"train_loss": -7.203857421875, "global_step": 196523, "epoch": 4679} {"train_loss": -7.204709529876709, "global_step": 196524, "epoch": 4679} {"train_loss": -7.191823482513428, "global_step": 196525, "epoch": 4679} {"train_loss": -7.236159324645996, "global_step": 196526, "epoch": 4679} {"train_loss": -7.199886322021484, "global_step": 196527, "epoch": 4679} {"train_loss": -7.221123695373535, "global_step": 196528, "epoch": 4679} {"train_loss": -7.292806148529053, "global_step": 196529, "epoch": 4679} {"train_loss": -7.196779251098633, "global_step": 196530, "epoch": 4679} {"train_loss": -7.3616156578063965, "global_step": 196531, "epoch": 4679} {"train_loss": -7.261129379272461, "global_step": 196532, "epoch": 4679} {"train_loss": -7.335489273071289, "global_step": 196533, "epoch": 4679} {"train_loss": -7.365389823913574, "global_step": 196534, "epoch": 4679} {"train_loss": -7.194860935211182, "global_step": 196535, "epoch": 4679} {"train_loss": -7.29672384262085, "global_step": 196536, "epoch": 4679} {"train_loss": -7.331477165222168, "global_step": 196537, "epoch": 4679} {"train_loss": -7.256180763244629, "global_step": 196538, "epoch": 4679} {"train_loss": -7.2601213455200195, "global_step": 196539, "epoch": 4679} {"train_loss": -7.304265022277832, "global_step": 196540, "epoch": 4679} {"train_loss": -7.245221138000488, "global_step": 196541, "epoch": 4679} {"train_loss": -7.249335289001465, "global_step": 196542, "epoch": 4679} {"train_loss": -7.243872165679932, "global_step": 196543, "epoch": 4679} {"train_loss": -7.320917129516602, "global_step": 196544, "epoch": 4679} {"train_loss": -7.324989318847656, "global_step": 196545, "epoch": 4679} {"train_loss": -7.258049964904785, "global_step": 196546, "epoch": 4679} {"train_loss": -7.1492414474487305, "global_step": 196547, "epoch": 4679} {"train_loss": -7.208264350891113, "global_step": 196548, "epoch": 4679} {"train_loss": -7.303277015686035, "global_step": 196549, "epoch": 4679} {"train_loss": -7.331684589385986, "global_step": 196550, "epoch": 4679} {"train_loss": -7.183749675750732, "global_step": 196551, "epoch": 4679} {"train_loss": -7.2756500244140625, "global_step": 196552, "epoch": 4679} {"train_loss": -7.18979549407959, "global_step": 196553, "epoch": 4679} {"train_loss": -7.307765960693359, "global_step": 196554, "epoch": 4679} {"train_loss": -7.338128089904785, "global_step": 196555, "epoch": 4679} {"train_loss": -7.198095321655273, "global_step": 196556, "epoch": 4679} {"train_loss": -7.141000747680664, "global_step": 196557, "epoch": 4679} {"train_loss": -7.282846450805664, "global_step": 196558, "epoch": 4679} {"train_loss": -7.254732222784133, "global_step": 196559, "epoch": 4679, "val_loss": 68938.1328125} {"train_loss": -7.250457763671875, "global_step": 196560, "epoch": 4680} {"train_loss": -7.364287376403809, "global_step": 196561, "epoch": 4680} {"train_loss": -7.222986221313477, "global_step": 196562, "epoch": 4680} {"train_loss": -7.147339344024658, "global_step": 196563, "epoch": 4680} {"train_loss": -7.314526557922363, "global_step": 196564, "epoch": 4680} {"train_loss": -7.196896076202393, "global_step": 196565, "epoch": 4680} {"train_loss": -7.156111717224121, "global_step": 196566, "epoch": 4680} {"train_loss": -7.203090667724609, "global_step": 196567, "epoch": 4680} {"train_loss": -7.137734413146973, "global_step": 196568, "epoch": 4680} {"train_loss": -7.211417198181152, "global_step": 196569, "epoch": 4680} {"train_loss": -7.072152137756348, "global_step": 196570, "epoch": 4680} {"train_loss": -7.238258361816406, "global_step": 196571, "epoch": 4680} {"train_loss": -7.153102874755859, "global_step": 196572, "epoch": 4680} {"train_loss": -7.308775424957275, "global_step": 196573, "epoch": 4680} {"train_loss": -7.335288047790527, "global_step": 196574, "epoch": 4680} {"train_loss": -7.2238688468933105, "global_step": 196575, "epoch": 4680} {"train_loss": -7.199790000915527, "global_step": 196576, "epoch": 4680} {"train_loss": -7.320188999176025, "global_step": 196577, "epoch": 4680} {"train_loss": -7.27369499206543, "global_step": 196578, "epoch": 4680} {"train_loss": -7.249153137207031, "global_step": 196579, "epoch": 4680} {"train_loss": -7.176093578338623, "global_step": 196580, "epoch": 4680} {"train_loss": -7.21397590637207, "global_step": 196581, "epoch": 4680} {"train_loss": -7.194852828979492, "global_step": 196582, "epoch": 4680} {"train_loss": -7.212540626525879, "global_step": 196583, "epoch": 4680} {"train_loss": -7.288067817687988, "global_step": 196584, "epoch": 4680} {"train_loss": -7.3824357986450195, "global_step": 196585, "epoch": 4680} {"train_loss": -7.219017505645752, "global_step": 196586, "epoch": 4680} {"train_loss": -7.221663475036621, "global_step": 196587, "epoch": 4680} {"train_loss": -7.298946857452393, "global_step": 196588, "epoch": 4680} {"train_loss": -7.160398483276367, "global_step": 196589, "epoch": 4680} {"train_loss": -7.227607727050781, "global_step": 196590, "epoch": 4680} {"train_loss": -7.266275405883789, "global_step": 196591, "epoch": 4680} {"train_loss": -7.281409740447998, "global_step": 196592, "epoch": 4680} {"train_loss": -7.2718987464904785, "global_step": 196593, "epoch": 4680} {"train_loss": -7.2303242683410645, "global_step": 196594, "epoch": 4680} {"train_loss": -7.370349407196045, "global_step": 196595, "epoch": 4680} {"train_loss": -7.362382411956787, "global_step": 196596, "epoch": 4680} {"train_loss": -7.185003280639648, "global_step": 196597, "epoch": 4680} {"train_loss": -7.253523826599121, "global_step": 196598, "epoch": 4680} {"train_loss": -7.20281982421875, "global_step": 196599, "epoch": 4680} {"train_loss": -7.256366729736328, "global_step": 196600, "epoch": 4680} {"train_loss": -7.239891495023455, "global_step": 196601, "epoch": 4680, "val_loss": 68946.0078125} {"train_loss": -7.217700004577637, "global_step": 196602, "epoch": 4681} {"train_loss": -7.218274116516113, "global_step": 196603, "epoch": 4681} {"train_loss": -7.249302387237549, "global_step": 196604, "epoch": 4681} {"train_loss": -7.175970077514648, "global_step": 196605, "epoch": 4681} {"train_loss": -7.152599334716797, "global_step": 196606, "epoch": 4681} {"train_loss": -7.276986122131348, "global_step": 196607, "epoch": 4681} {"train_loss": -7.209261894226074, "global_step": 196608, "epoch": 4681} {"train_loss": -7.254369735717773, "global_step": 196609, "epoch": 4681} {"train_loss": -7.206252098083496, "global_step": 196610, "epoch": 4681} {"train_loss": -7.214642524719238, "global_step": 196611, "epoch": 4681} {"train_loss": -7.2928147315979, "global_step": 196612, "epoch": 4681} {"train_loss": -7.316649436950684, "global_step": 196613, "epoch": 4681} {"train_loss": -7.305856227874756, "global_step": 196614, "epoch": 4681} {"train_loss": -7.054726600646973, "global_step": 196615, "epoch": 4681} {"train_loss": -7.202198028564453, "global_step": 196616, "epoch": 4681} {"train_loss": -7.124277114868164, "global_step": 196617, "epoch": 4681} {"train_loss": -7.099342346191406, "global_step": 196618, "epoch": 4681} {"train_loss": -7.251739025115967, "global_step": 196619, "epoch": 4681} {"train_loss": -7.130427360534668, "global_step": 196620, "epoch": 4681} {"train_loss": -7.151335716247559, "global_step": 196621, "epoch": 4681} {"train_loss": -7.226842880249023, "global_step": 196622, "epoch": 4681} {"train_loss": -7.047279357910156, "global_step": 196623, "epoch": 4681} {"train_loss": -7.208207130432129, "global_step": 196624, "epoch": 4681} {"train_loss": -7.122306823730469, "global_step": 196625, "epoch": 4681} {"train_loss": -7.1923136711120605, "global_step": 196626, "epoch": 4681} {"train_loss": -7.141361236572266, "global_step": 196627, "epoch": 4681} {"train_loss": -7.205981731414795, "global_step": 196628, "epoch": 4681} {"train_loss": -7.063443183898926, "global_step": 196629, "epoch": 4681} {"train_loss": -7.179260730743408, "global_step": 196630, "epoch": 4681} {"train_loss": -7.172280311584473, "global_step": 196631, "epoch": 4681} {"train_loss": -7.1067962646484375, "global_step": 196632, "epoch": 4681} {"train_loss": -7.168617248535156, "global_step": 196633, "epoch": 4681} {"train_loss": -7.205292701721191, "global_step": 196634, "epoch": 4681} {"train_loss": -7.069614887237549, "global_step": 196635, "epoch": 4681} {"train_loss": -7.194919586181641, "global_step": 196636, "epoch": 4681} {"train_loss": -7.117863655090332, "global_step": 196637, "epoch": 4681} {"train_loss": -7.13719367980957, "global_step": 196638, "epoch": 4681} {"train_loss": -7.096775054931641, "global_step": 196639, "epoch": 4681} {"train_loss": -7.128562927246094, "global_step": 196640, "epoch": 4681} {"train_loss": -7.009645938873291, "global_step": 196641, "epoch": 4681} {"train_loss": -7.003480911254883, "global_step": 196642, "epoch": 4681} {"train_loss": -7.166760387874785, "global_step": 196643, "epoch": 4681, "val_loss": 69318.6484375} {"train_loss": -7.0807037353515625, "global_step": 196644, "epoch": 4682} {"train_loss": -7.163064002990723, "global_step": 196645, "epoch": 4682} {"train_loss": -7.257515907287598, "global_step": 196646, "epoch": 4682} {"train_loss": -7.114441871643066, "global_step": 196647, "epoch": 4682} {"train_loss": -7.226463317871094, "global_step": 196648, "epoch": 4682} {"train_loss": -7.102847099304199, "global_step": 196649, "epoch": 4682} {"train_loss": -7.160100936889648, "global_step": 196650, "epoch": 4682} {"train_loss": -7.176563262939453, "global_step": 196651, "epoch": 4682} {"train_loss": -7.115560531616211, "global_step": 196652, "epoch": 4682} {"train_loss": -7.187734127044678, "global_step": 196653, "epoch": 4682} {"train_loss": -7.166409969329834, "global_step": 196654, "epoch": 4682} {"train_loss": -7.20631217956543, "global_step": 196655, "epoch": 4682} {"train_loss": -7.1353302001953125, "global_step": 196656, "epoch": 4682} {"train_loss": -7.2624382972717285, "global_step": 196657, "epoch": 4682} {"train_loss": -7.177058219909668, "global_step": 196658, "epoch": 4682} {"train_loss": -7.17501163482666, "global_step": 196659, "epoch": 4682} {"train_loss": -7.2582106590271, "global_step": 196660, "epoch": 4682} {"train_loss": -7.1570353507995605, "global_step": 196661, "epoch": 4682} {"train_loss": -7.271381378173828, "global_step": 196662, "epoch": 4682} {"train_loss": -7.009304046630859, "global_step": 196663, "epoch": 4682} {"train_loss": -7.230213165283203, "global_step": 196664, "epoch": 4682} {"train_loss": -7.214049339294434, "global_step": 196665, "epoch": 4682} {"train_loss": -7.181567668914795, "global_step": 196666, "epoch": 4682} {"train_loss": -7.268204212188721, "global_step": 196667, "epoch": 4682} {"train_loss": -7.263888835906982, "global_step": 196668, "epoch": 4682} {"train_loss": -7.189946174621582, "global_step": 196669, "epoch": 4682} {"train_loss": -7.204073905944824, "global_step": 196670, "epoch": 4682} {"train_loss": -7.17196798324585, "global_step": 196671, "epoch": 4682} {"train_loss": -7.171903610229492, "global_step": 196672, "epoch": 4682} {"train_loss": -7.0975260734558105, "global_step": 196673, "epoch": 4682} {"train_loss": -7.159512519836426, "global_step": 196674, "epoch": 4682} {"train_loss": -7.070291519165039, "global_step": 196675, "epoch": 4682} {"train_loss": -7.159884929656982, "global_step": 196676, "epoch": 4682} {"train_loss": -7.130568027496338, "global_step": 196677, "epoch": 4682} {"train_loss": -7.174161911010742, "global_step": 196678, "epoch": 4682} {"train_loss": -7.125125885009766, "global_step": 196679, "epoch": 4682} {"train_loss": -7.135482311248779, "global_step": 196680, "epoch": 4682} {"train_loss": -7.202503204345703, "global_step": 196681, "epoch": 4682} {"train_loss": -7.160142421722412, "global_step": 196682, "epoch": 4682} {"train_loss": -7.100384712219238, "global_step": 196683, "epoch": 4682} {"train_loss": -7.234630584716797, "global_step": 196684, "epoch": 4682} {"train_loss": -7.17084196635655, "global_step": 196685, "epoch": 4682, "val_loss": 69188.578125} {"train_loss": -7.109379768371582, "global_step": 196686, "epoch": 4683} {"train_loss": -7.157681465148926, "global_step": 196687, "epoch": 4683} {"train_loss": -7.093842506408691, "global_step": 196688, "epoch": 4683} {"train_loss": -7.140275001525879, "global_step": 196689, "epoch": 4683} {"train_loss": -7.18372917175293, "global_step": 196690, "epoch": 4683} {"train_loss": -7.3029022216796875, "global_step": 196691, "epoch": 4683} {"train_loss": -7.165541648864746, "global_step": 196692, "epoch": 4683} {"train_loss": -7.147957801818848, "global_step": 196693, "epoch": 4683} {"train_loss": -7.352499008178711, "global_step": 196694, "epoch": 4683} {"train_loss": -7.199373245239258, "global_step": 196695, "epoch": 4683} {"train_loss": -7.239065170288086, "global_step": 196696, "epoch": 4683} {"train_loss": -7.099132537841797, "global_step": 196697, "epoch": 4683} {"train_loss": -7.259276390075684, "global_step": 196698, "epoch": 4683} {"train_loss": -7.142099857330322, "global_step": 196699, "epoch": 4683} {"train_loss": -7.043219566345215, "global_step": 196700, "epoch": 4683} {"train_loss": -7.095376014709473, "global_step": 196701, "epoch": 4683} {"train_loss": -7.123837471008301, "global_step": 196702, "epoch": 4683} {"train_loss": -7.073444366455078, "global_step": 196703, "epoch": 4683} {"train_loss": -7.1247053146362305, "global_step": 196704, "epoch": 4683} {"train_loss": -6.969271659851074, "global_step": 196705, "epoch": 4683} {"train_loss": -7.10739803314209, "global_step": 196706, "epoch": 4683} {"train_loss": -7.091123580932617, "global_step": 196707, "epoch": 4683} {"train_loss": -7.187539100646973, "global_step": 196708, "epoch": 4683} {"train_loss": -7.007185935974121, "global_step": 196709, "epoch": 4683} {"train_loss": -7.164941787719727, "global_step": 196710, "epoch": 4683} {"train_loss": -7.289604187011719, "global_step": 196711, "epoch": 4683} {"train_loss": -7.092400074005127, "global_step": 196712, "epoch": 4683} {"train_loss": -7.11223030090332, "global_step": 196713, "epoch": 4683} {"train_loss": -7.201346397399902, "global_step": 196714, "epoch": 4683} {"train_loss": -7.129254341125488, "global_step": 196715, "epoch": 4683} {"train_loss": -7.20106315612793, "global_step": 196716, "epoch": 4683} {"train_loss": -6.94820499420166, "global_step": 196717, "epoch": 4683} {"train_loss": -7.207760810852051, "global_step": 196718, "epoch": 4683} {"train_loss": -7.1386823654174805, "global_step": 196719, "epoch": 4683} {"train_loss": -7.0775861740112305, "global_step": 196720, "epoch": 4683} {"train_loss": -7.203065872192383, "global_step": 196721, "epoch": 4683} {"train_loss": -7.128268241882324, "global_step": 196722, "epoch": 4683} {"train_loss": -7.106334209442139, "global_step": 196723, "epoch": 4683} {"train_loss": -7.274120330810547, "global_step": 196724, "epoch": 4683} {"train_loss": -7.140935897827148, "global_step": 196725, "epoch": 4683} {"train_loss": -7.103599548339844, "global_step": 196726, "epoch": 4683} {"train_loss": -7.144802422750564, "global_step": 196727, "epoch": 4683, "val_loss": 68886.1328125} {"train_loss": -7.055006980895996, "global_step": 196728, "epoch": 4684} {"train_loss": -7.152328014373779, "global_step": 196729, "epoch": 4684} {"train_loss": -7.1539506912231445, "global_step": 196730, "epoch": 4684} {"train_loss": -7.1953325271606445, "global_step": 196731, "epoch": 4684} {"train_loss": -7.1874895095825195, "global_step": 196732, "epoch": 4684} {"train_loss": -7.217939376831055, "global_step": 196733, "epoch": 4684} {"train_loss": -7.332164764404297, "global_step": 196734, "epoch": 4684} {"train_loss": -7.0698089599609375, "global_step": 196735, "epoch": 4684} {"train_loss": -7.215982913970947, "global_step": 196736, "epoch": 4684} {"train_loss": -7.184427261352539, "global_step": 196737, "epoch": 4684} {"train_loss": -7.208952903747559, "global_step": 196738, "epoch": 4684} {"train_loss": -7.230010986328125, "global_step": 196739, "epoch": 4684} {"train_loss": -7.123590469360352, "global_step": 196740, "epoch": 4684} {"train_loss": -7.26430606842041, "global_step": 196741, "epoch": 4684} {"train_loss": -7.3524603843688965, "global_step": 196742, "epoch": 4684} {"train_loss": -7.190084457397461, "global_step": 196743, "epoch": 4684} {"train_loss": -7.120253562927246, "global_step": 196744, "epoch": 4684} {"train_loss": -7.213120937347412, "global_step": 196745, "epoch": 4684} {"train_loss": -6.99918270111084, "global_step": 196746, "epoch": 4684} {"train_loss": -7.179205894470215, "global_step": 196747, "epoch": 4684} {"train_loss": -7.2215495109558105, "global_step": 196748, "epoch": 4684} {"train_loss": -7.219363689422607, "global_step": 196749, "epoch": 4684} {"train_loss": -7.284610271453857, "global_step": 196750, "epoch": 4684} {"train_loss": -7.204693794250488, "global_step": 196751, "epoch": 4684} {"train_loss": -7.148283958435059, "global_step": 196752, "epoch": 4684} {"train_loss": -7.170458793640137, "global_step": 196753, "epoch": 4684} {"train_loss": -7.12661075592041, "global_step": 196754, "epoch": 4684} {"train_loss": -7.1266255378723145, "global_step": 196755, "epoch": 4684} {"train_loss": -7.164050579071045, "global_step": 196756, "epoch": 4684} {"train_loss": -7.140042304992676, "global_step": 196757, "epoch": 4684} {"train_loss": -7.151011943817139, "global_step": 196758, "epoch": 4684} {"train_loss": -7.294609546661377, "global_step": 196759, "epoch": 4684} {"train_loss": -7.126341819763184, "global_step": 196760, "epoch": 4684} {"train_loss": -7.0425310134887695, "global_step": 196761, "epoch": 4684} {"train_loss": -7.055731773376465, "global_step": 196762, "epoch": 4684} {"train_loss": -7.213623046875, "global_step": 196763, "epoch": 4684} {"train_loss": -7.070333480834961, "global_step": 196764, "epoch": 4684} {"train_loss": -6.9805989265441895, "global_step": 196765, "epoch": 4684} {"train_loss": -7.173210144042969, "global_step": 196766, "epoch": 4684} {"train_loss": -7.112427711486816, "global_step": 196767, "epoch": 4684} {"train_loss": -7.211604118347168, "global_step": 196768, "epoch": 4684} {"train_loss": -7.167633942195347, "global_step": 196769, "epoch": 4684, "val_loss": 69056.5859375} {"train_loss": -7.1003804206848145, "global_step": 196770, "epoch": 4685} {"train_loss": -7.120044231414795, "global_step": 196771, "epoch": 4685} {"train_loss": -7.160269737243652, "global_step": 196772, "epoch": 4685} {"train_loss": -7.018825531005859, "global_step": 196773, "epoch": 4685} {"train_loss": -7.167510032653809, "global_step": 196774, "epoch": 4685} {"train_loss": -7.218986511230469, "global_step": 196775, "epoch": 4685} {"train_loss": -6.990826606750488, "global_step": 196776, "epoch": 4685} {"train_loss": -7.1841044425964355, "global_step": 196777, "epoch": 4685} {"train_loss": -7.101391792297363, "global_step": 196778, "epoch": 4685} {"train_loss": -7.228135108947754, "global_step": 196779, "epoch": 4685} {"train_loss": -7.193554878234863, "global_step": 196780, "epoch": 4685} {"train_loss": -7.233080863952637, "global_step": 196781, "epoch": 4685} {"train_loss": -7.154109001159668, "global_step": 196782, "epoch": 4685} {"train_loss": -7.190300941467285, "global_step": 196783, "epoch": 4685} {"train_loss": -7.096229076385498, "global_step": 196784, "epoch": 4685} {"train_loss": -7.091530799865723, "global_step": 196785, "epoch": 4685} {"train_loss": -7.099606990814209, "global_step": 196786, "epoch": 4685} {"train_loss": -7.172802925109863, "global_step": 196787, "epoch": 4685} {"train_loss": -7.2097673416137695, "global_step": 196788, "epoch": 4685} {"train_loss": -7.230349540710449, "global_step": 196789, "epoch": 4685} {"train_loss": -7.221324443817139, "global_step": 196790, "epoch": 4685} {"train_loss": -7.126803398132324, "global_step": 196791, "epoch": 4685} {"train_loss": -7.179179668426514, "global_step": 196792, "epoch": 4685} {"train_loss": -7.147695541381836, "global_step": 196793, "epoch": 4685} {"train_loss": -7.101247310638428, "global_step": 196794, "epoch": 4685} {"train_loss": -7.306754112243652, "global_step": 196795, "epoch": 4685} {"train_loss": -7.152937889099121, "global_step": 196796, "epoch": 4685} {"train_loss": -7.221684455871582, "global_step": 196797, "epoch": 4685} {"train_loss": -7.299212455749512, "global_step": 196798, "epoch": 4685} {"train_loss": -7.223437786102295, "global_step": 196799, "epoch": 4685} {"train_loss": -7.266566276550293, "global_step": 196800, "epoch": 4685} {"train_loss": -7.139764785766602, "global_step": 196801, "epoch": 4685} {"train_loss": -7.184714317321777, "global_step": 196802, "epoch": 4685} {"train_loss": -7.211533069610596, "global_step": 196803, "epoch": 4685} {"train_loss": -7.2219133377075195, "global_step": 196804, "epoch": 4685} {"train_loss": -7.224451065063477, "global_step": 196805, "epoch": 4685} {"train_loss": -7.149831771850586, "global_step": 196806, "epoch": 4685} {"train_loss": -7.200916290283203, "global_step": 196807, "epoch": 4685} {"train_loss": -7.267047882080078, "global_step": 196808, "epoch": 4685} {"train_loss": -7.259410381317139, "global_step": 196809, "epoch": 4685} {"train_loss": -7.2655510902404785, "global_step": 196810, "epoch": 4685} {"train_loss": -7.177692015965779, "global_step": 196811, "epoch": 4685, "val_loss": 68905.2109375} {"train_loss": -7.198966026306152, "global_step": 196812, "epoch": 4686} {"train_loss": -7.240417003631592, "global_step": 196813, "epoch": 4686} {"train_loss": -7.15023136138916, "global_step": 196814, "epoch": 4686} {"train_loss": -7.257450103759766, "global_step": 196815, "epoch": 4686} {"train_loss": -7.255788803100586, "global_step": 196816, "epoch": 4686} {"train_loss": -7.119367599487305, "global_step": 196817, "epoch": 4686} {"train_loss": -7.173425197601318, "global_step": 196818, "epoch": 4686} {"train_loss": -7.231703281402588, "global_step": 196819, "epoch": 4686} {"train_loss": -7.291650295257568, "global_step": 196820, "epoch": 4686} {"train_loss": -7.261374473571777, "global_step": 196821, "epoch": 4686} {"train_loss": -7.203968524932861, "global_step": 196822, "epoch": 4686} {"train_loss": -7.107544898986816, "global_step": 196823, "epoch": 4686} {"train_loss": -7.173542022705078, "global_step": 196824, "epoch": 4686} {"train_loss": -7.1174516677856445, "global_step": 196825, "epoch": 4686} {"train_loss": -7.158553600311279, "global_step": 196826, "epoch": 4686} {"train_loss": -7.234696388244629, "global_step": 196827, "epoch": 4686} {"train_loss": -7.216185569763184, "global_step": 196828, "epoch": 4686} {"train_loss": -7.257421016693115, "global_step": 196829, "epoch": 4686} {"train_loss": -7.196049213409424, "global_step": 196830, "epoch": 4686} {"train_loss": -7.281587600708008, "global_step": 196831, "epoch": 4686} {"train_loss": -7.272229194641113, "global_step": 196832, "epoch": 4686} {"train_loss": -7.1646528244018555, "global_step": 196833, "epoch": 4686} {"train_loss": -7.158600330352783, "global_step": 196834, "epoch": 4686} {"train_loss": -7.238325595855713, "global_step": 196835, "epoch": 4686} {"train_loss": -7.206048488616943, "global_step": 196836, "epoch": 4686} {"train_loss": -7.159384727478027, "global_step": 196837, "epoch": 4686} {"train_loss": -7.145222187042236, "global_step": 196838, "epoch": 4686} {"train_loss": -7.305074691772461, "global_step": 196839, "epoch": 4686} {"train_loss": -7.053482532501221, "global_step": 196840, "epoch": 4686} {"train_loss": -7.1494903564453125, "global_step": 196841, "epoch": 4686} {"train_loss": -7.213814735412598, "global_step": 196842, "epoch": 4686} {"train_loss": -7.228269577026367, "global_step": 196843, "epoch": 4686} {"train_loss": -7.201300621032715, "global_step": 196844, "epoch": 4686} {"train_loss": -7.181522846221924, "global_step": 196845, "epoch": 4686} {"train_loss": -7.289150238037109, "global_step": 196846, "epoch": 4686} {"train_loss": -7.193149566650391, "global_step": 196847, "epoch": 4686} {"train_loss": -7.2104339599609375, "global_step": 196848, "epoch": 4686} {"train_loss": -7.214758396148682, "global_step": 196849, "epoch": 4686} {"train_loss": -7.282385349273682, "global_step": 196850, "epoch": 4686} {"train_loss": -7.213696002960205, "global_step": 196851, "epoch": 4686} {"train_loss": -7.16631555557251, "global_step": 196852, "epoch": 4686} {"train_loss": -7.205046347209385, "global_step": 196853, "epoch": 4686, "val_loss": 69110.5390625} {"train_loss": -7.2063398361206055, "global_step": 196854, "epoch": 4687} {"train_loss": -7.151683807373047, "global_step": 196855, "epoch": 4687} {"train_loss": -7.329099178314209, "global_step": 196856, "epoch": 4687} {"train_loss": -7.169569969177246, "global_step": 196857, "epoch": 4687} {"train_loss": -7.232252597808838, "global_step": 196858, "epoch": 4687} {"train_loss": -7.294140338897705, "global_step": 196859, "epoch": 4687} {"train_loss": -7.281554222106934, "global_step": 196860, "epoch": 4687} {"train_loss": -7.217970848083496, "global_step": 196861, "epoch": 4687} {"train_loss": -7.321311950683594, "global_step": 196862, "epoch": 4687} {"train_loss": -7.284218788146973, "global_step": 196863, "epoch": 4687} {"train_loss": -7.196786880493164, "global_step": 196864, "epoch": 4687} {"train_loss": -7.21234130859375, "global_step": 196865, "epoch": 4687} {"train_loss": -7.3388519287109375, "global_step": 196866, "epoch": 4687} {"train_loss": -7.243653297424316, "global_step": 196867, "epoch": 4687} {"train_loss": -7.260985851287842, "global_step": 196868, "epoch": 4687} {"train_loss": -7.206424236297607, "global_step": 196869, "epoch": 4687} {"train_loss": -7.267892837524414, "global_step": 196870, "epoch": 4687} {"train_loss": -7.111429214477539, "global_step": 196871, "epoch": 4687} {"train_loss": -7.2750420570373535, "global_step": 196872, "epoch": 4687} {"train_loss": -7.354116439819336, "global_step": 196873, "epoch": 4687} {"train_loss": -7.254964351654053, "global_step": 196874, "epoch": 4687} {"train_loss": -7.2392425537109375, "global_step": 196875, "epoch": 4687} {"train_loss": -7.148022651672363, "global_step": 196876, "epoch": 4687} {"train_loss": -7.211485862731934, "global_step": 196877, "epoch": 4687} {"train_loss": -7.3110175132751465, "global_step": 196878, "epoch": 4687} {"train_loss": -7.161135673522949, "global_step": 196879, "epoch": 4687} {"train_loss": -7.269352912902832, "global_step": 196880, "epoch": 4687} {"train_loss": -7.250084400177002, "global_step": 196881, "epoch": 4687} {"train_loss": -7.228268623352051, "global_step": 196882, "epoch": 4687} {"train_loss": -7.237570285797119, "global_step": 196883, "epoch": 4687} {"train_loss": -7.151917457580566, "global_step": 196884, "epoch": 4687} {"train_loss": -7.102851867675781, "global_step": 196885, "epoch": 4687} {"train_loss": -7.162019729614258, "global_step": 196886, "epoch": 4687} {"train_loss": -7.241182327270508, "global_step": 196887, "epoch": 4687} {"train_loss": -7.151038646697998, "global_step": 196888, "epoch": 4687} {"train_loss": -7.260263442993164, "global_step": 196889, "epoch": 4687} {"train_loss": -7.213062286376953, "global_step": 196890, "epoch": 4687} {"train_loss": -7.144333362579346, "global_step": 196891, "epoch": 4687} {"train_loss": -7.096848964691162, "global_step": 196892, "epoch": 4687} {"train_loss": -7.005758285522461, "global_step": 196893, "epoch": 4687} {"train_loss": -7.069031715393066, "global_step": 196894, "epoch": 4687} {"train_loss": -7.2139325596037365, "global_step": 196895, "epoch": 4687, "val_loss": 68931.0625} {"train_loss": -7.118537902832031, "global_step": 196896, "epoch": 4688} {"train_loss": -6.999646186828613, "global_step": 196897, "epoch": 4688} {"train_loss": -7.1687397956848145, "global_step": 196898, "epoch": 4688} {"train_loss": -7.153467655181885, "global_step": 196899, "epoch": 4688} {"train_loss": -7.243143558502197, "global_step": 196900, "epoch": 4688} {"train_loss": -7.156118869781494, "global_step": 196901, "epoch": 4688} {"train_loss": -7.142184257507324, "global_step": 196902, "epoch": 4688} {"train_loss": -7.1331634521484375, "global_step": 196903, "epoch": 4688} {"train_loss": -7.056970596313477, "global_step": 196904, "epoch": 4688} {"train_loss": -7.164689540863037, "global_step": 196905, "epoch": 4688} {"train_loss": -7.151063919067383, "global_step": 196906, "epoch": 4688} {"train_loss": -7.14565372467041, "global_step": 196907, "epoch": 4688} {"train_loss": -7.209960460662842, "global_step": 196908, "epoch": 4688} {"train_loss": -7.256087779998779, "global_step": 196909, "epoch": 4688} {"train_loss": -7.113764762878418, "global_step": 196910, "epoch": 4688} {"train_loss": -7.316886901855469, "global_step": 196911, "epoch": 4688} {"train_loss": -7.110630512237549, "global_step": 196912, "epoch": 4688} {"train_loss": -7.153720378875732, "global_step": 196913, "epoch": 4688} {"train_loss": -7.19318151473999, "global_step": 196914, "epoch": 4688} {"train_loss": -7.168573379516602, "global_step": 196915, "epoch": 4688} {"train_loss": -7.105615615844727, "global_step": 196916, "epoch": 4688} {"train_loss": -7.076035499572754, "global_step": 196917, "epoch": 4688} {"train_loss": -7.070171356201172, "global_step": 196918, "epoch": 4688} {"train_loss": -7.191520690917969, "global_step": 196919, "epoch": 4688} {"train_loss": -7.0894975662231445, "global_step": 196920, "epoch": 4688} {"train_loss": -7.194350719451904, "global_step": 196921, "epoch": 4688} {"train_loss": -7.09604549407959, "global_step": 196922, "epoch": 4688} {"train_loss": -7.172483444213867, "global_step": 196923, "epoch": 4688} {"train_loss": -7.1533522605896, "global_step": 196924, "epoch": 4688} {"train_loss": -7.187176704406738, "global_step": 196925, "epoch": 4688} {"train_loss": -7.138957977294922, "global_step": 196926, "epoch": 4688} {"train_loss": -7.123208522796631, "global_step": 196927, "epoch": 4688} {"train_loss": -7.086184978485107, "global_step": 196928, "epoch": 4688} {"train_loss": -7.155444145202637, "global_step": 196929, "epoch": 4688} {"train_loss": -7.05504846572876, "global_step": 196930, "epoch": 4688} {"train_loss": -7.07011079788208, "global_step": 196931, "epoch": 4688} {"train_loss": -7.266744613647461, "global_step": 196932, "epoch": 4688} {"train_loss": -7.165008544921875, "global_step": 196933, "epoch": 4688} {"train_loss": -7.171114444732666, "global_step": 196934, "epoch": 4688} {"train_loss": -7.179562568664551, "global_step": 196935, "epoch": 4688} {"train_loss": -7.219947814941406, "global_step": 196936, "epoch": 4688} {"train_loss": -7.148974009922573, "global_step": 196937, "epoch": 4688, "val_loss": 69071.9609375} {"train_loss": -7.233386993408203, "global_step": 196938, "epoch": 4689} {"train_loss": -7.164876461029053, "global_step": 196939, "epoch": 4689} {"train_loss": -7.198115348815918, "global_step": 196940, "epoch": 4689} {"train_loss": -7.224722862243652, "global_step": 196941, "epoch": 4689} {"train_loss": -7.253732681274414, "global_step": 196942, "epoch": 4689} {"train_loss": -7.32517147064209, "global_step": 196943, "epoch": 4689} {"train_loss": -7.101812362670898, "global_step": 196944, "epoch": 4689} {"train_loss": -7.229367256164551, "global_step": 196945, "epoch": 4689} {"train_loss": -7.339875221252441, "global_step": 196946, "epoch": 4689} {"train_loss": -7.1708807945251465, "global_step": 196947, "epoch": 4689} {"train_loss": -7.113875389099121, "global_step": 196948, "epoch": 4689} {"train_loss": -7.234581470489502, "global_step": 196949, "epoch": 4689} {"train_loss": -7.082910537719727, "global_step": 196950, "epoch": 4689} {"train_loss": -7.197265148162842, "global_step": 196951, "epoch": 4689} {"train_loss": -7.274964809417725, "global_step": 196952, "epoch": 4689} {"train_loss": -7.14588737487793, "global_step": 196953, "epoch": 4689} {"train_loss": -7.139042377471924, "global_step": 196954, "epoch": 4689} {"train_loss": -7.259856224060059, "global_step": 196955, "epoch": 4689} {"train_loss": -7.2921857833862305, "global_step": 196956, "epoch": 4689} {"train_loss": -7.282865524291992, "global_step": 196957, "epoch": 4689} {"train_loss": -7.345974922180176, "global_step": 196958, "epoch": 4689} {"train_loss": -7.294568061828613, "global_step": 196959, "epoch": 4689} {"train_loss": -7.246294021606445, "global_step": 196960, "epoch": 4689} {"train_loss": -7.23726749420166, "global_step": 196961, "epoch": 4689} {"train_loss": -7.174837589263916, "global_step": 196962, "epoch": 4689} {"train_loss": -7.308650016784668, "global_step": 196963, "epoch": 4689} {"train_loss": -7.232007026672363, "global_step": 196964, "epoch": 4689} {"train_loss": -7.229318141937256, "global_step": 196965, "epoch": 4689} {"train_loss": -7.219735145568848, "global_step": 196966, "epoch": 4689} {"train_loss": -7.208453178405762, "global_step": 196967, "epoch": 4689} {"train_loss": -7.099076747894287, "global_step": 196968, "epoch": 4689} {"train_loss": -7.287158489227295, "global_step": 196969, "epoch": 4689} {"train_loss": -7.203746795654297, "global_step": 196970, "epoch": 4689} {"train_loss": -7.241529941558838, "global_step": 196971, "epoch": 4689} {"train_loss": -7.244847297668457, "global_step": 196972, "epoch": 4689} {"train_loss": -7.2000932693481445, "global_step": 196973, "epoch": 4689} {"train_loss": -7.1789655685424805, "global_step": 196974, "epoch": 4689} {"train_loss": -7.046018600463867, "global_step": 196975, "epoch": 4689} {"train_loss": -7.180601119995117, "global_step": 196976, "epoch": 4689} {"train_loss": -7.1361494064331055, "global_step": 196977, "epoch": 4689} {"train_loss": -7.153114318847656, "global_step": 196978, "epoch": 4689} {"train_loss": -7.214488211132231, "global_step": 196979, "epoch": 4689, "val_loss": 68908.0390625} {"train_loss": -7.332250595092773, "global_step": 196980, "epoch": 4690} {"train_loss": -7.2656354904174805, "global_step": 196981, "epoch": 4690} {"train_loss": -7.210416316986084, "global_step": 196982, "epoch": 4690} {"train_loss": -7.241225242614746, "global_step": 196983, "epoch": 4690} {"train_loss": -7.245914459228516, "global_step": 196984, "epoch": 4690} {"train_loss": -7.227130889892578, "global_step": 196985, "epoch": 4690} {"train_loss": -7.147637367248535, "global_step": 196986, "epoch": 4690} {"train_loss": -7.194637298583984, "global_step": 196987, "epoch": 4690} {"train_loss": -7.252987384796143, "global_step": 196988, "epoch": 4690} {"train_loss": -7.201889991760254, "global_step": 196989, "epoch": 4690} {"train_loss": -7.197936534881592, "global_step": 196990, "epoch": 4690} {"train_loss": -7.17650032043457, "global_step": 196991, "epoch": 4690} {"train_loss": -7.251058101654053, "global_step": 196992, "epoch": 4690} {"train_loss": -7.134835243225098, "global_step": 196993, "epoch": 4690} {"train_loss": -7.169770240783691, "global_step": 196994, "epoch": 4690} {"train_loss": -7.235013008117676, "global_step": 196995, "epoch": 4690} {"train_loss": -7.154656410217285, "global_step": 196996, "epoch": 4690} {"train_loss": -7.153332233428955, "global_step": 196997, "epoch": 4690} {"train_loss": -7.272619247436523, "global_step": 196998, "epoch": 4690} {"train_loss": -7.054568290710449, "global_step": 196999, "epoch": 4690} {"train_loss": -7.0830278396606445, "global_step": 197000, "epoch": 4690} {"train_loss": -7.200413703918457, "global_step": 197001, "epoch": 4690} {"train_loss": -7.134660720825195, "global_step": 197002, "epoch": 4690} {"train_loss": -7.182988166809082, "global_step": 197003, "epoch": 4690} {"train_loss": -7.107306957244873, "global_step": 197004, "epoch": 4690} {"train_loss": -7.126347064971924, "global_step": 197005, "epoch": 4690} {"train_loss": -7.180896282196045, "global_step": 197006, "epoch": 4690} {"train_loss": -7.187323093414307, "global_step": 197007, "epoch": 4690} {"train_loss": -7.287245750427246, "global_step": 197008, "epoch": 4690} {"train_loss": -7.160553932189941, "global_step": 197009, "epoch": 4690} {"train_loss": -7.164852619171143, "global_step": 197010, "epoch": 4690} {"train_loss": -7.146853923797607, "global_step": 197011, "epoch": 4690} {"train_loss": -7.190472602844238, "global_step": 197012, "epoch": 4690} {"train_loss": -7.179081439971924, "global_step": 197013, "epoch": 4690} {"train_loss": -7.18125057220459, "global_step": 197014, "epoch": 4690} {"train_loss": -7.171100616455078, "global_step": 197015, "epoch": 4690} {"train_loss": -7.173418998718262, "global_step": 197016, "epoch": 4690} {"train_loss": -7.213384628295898, "global_step": 197017, "epoch": 4690} {"train_loss": -7.23304557800293, "global_step": 197018, "epoch": 4690} {"train_loss": -7.296850681304932, "global_step": 197019, "epoch": 4690} {"train_loss": -7.321475028991699, "global_step": 197020, "epoch": 4690} {"train_loss": -7.1940339633396695, "global_step": 197021, "epoch": 4690, "val_loss": 69089.7890625} {"train_loss": -7.238752365112305, "global_step": 197022, "epoch": 4691} {"train_loss": -7.335373401641846, "global_step": 197023, "epoch": 4691} {"train_loss": -7.268701553344727, "global_step": 197024, "epoch": 4691} {"train_loss": -7.309023380279541, "global_step": 197025, "epoch": 4691} {"train_loss": -7.207890033721924, "global_step": 197026, "epoch": 4691} {"train_loss": -7.0718584060668945, "global_step": 197027, "epoch": 4691} {"train_loss": -7.2583417892456055, "global_step": 197028, "epoch": 4691} {"train_loss": -7.089559078216553, "global_step": 197029, "epoch": 4691} {"train_loss": -7.275146484375, "global_step": 197030, "epoch": 4691} {"train_loss": -7.252931594848633, "global_step": 197031, "epoch": 4691} {"train_loss": -7.114632606506348, "global_step": 197032, "epoch": 4691} {"train_loss": -7.158995628356934, "global_step": 197033, "epoch": 4691} {"train_loss": -7.206871032714844, "global_step": 197034, "epoch": 4691} {"train_loss": -7.2069292068481445, "global_step": 197035, "epoch": 4691} {"train_loss": -7.213127136230469, "global_step": 197036, "epoch": 4691} {"train_loss": -7.092228889465332, "global_step": 197037, "epoch": 4691} {"train_loss": -7.2710113525390625, "global_step": 197038, "epoch": 4691} {"train_loss": -7.232082366943359, "global_step": 197039, "epoch": 4691} {"train_loss": -7.283642768859863, "global_step": 197040, "epoch": 4691} {"train_loss": -7.194913864135742, "global_step": 197041, "epoch": 4691} {"train_loss": -7.1716837882995605, "global_step": 197042, "epoch": 4691} {"train_loss": -7.114476203918457, "global_step": 197043, "epoch": 4691} {"train_loss": -7.053704261779785, "global_step": 197044, "epoch": 4691} {"train_loss": -7.2383880615234375, "global_step": 197045, "epoch": 4691} {"train_loss": -7.141864776611328, "global_step": 197046, "epoch": 4691} {"train_loss": -7.102347373962402, "global_step": 197047, "epoch": 4691} {"train_loss": -7.171939373016357, "global_step": 197048, "epoch": 4691} {"train_loss": -7.04457426071167, "global_step": 197049, "epoch": 4691} {"train_loss": -7.182716369628906, "global_step": 197050, "epoch": 4691} {"train_loss": -7.057456970214844, "global_step": 197051, "epoch": 4691} {"train_loss": -7.125105857849121, "global_step": 197052, "epoch": 4691} {"train_loss": -7.1247687339782715, "global_step": 197053, "epoch": 4691} {"train_loss": -7.0761823654174805, "global_step": 197054, "epoch": 4691} {"train_loss": -7.261874675750732, "global_step": 197055, "epoch": 4691} {"train_loss": -7.094505310058594, "global_step": 197056, "epoch": 4691} {"train_loss": -7.239824295043945, "global_step": 197057, "epoch": 4691} {"train_loss": -7.117613792419434, "global_step": 197058, "epoch": 4691} {"train_loss": -7.246764183044434, "global_step": 197059, "epoch": 4691} {"train_loss": -7.193613529205322, "global_step": 197060, "epoch": 4691} {"train_loss": -7.243381500244141, "global_step": 197061, "epoch": 4691} {"train_loss": -7.1292619705200195, "global_step": 197062, "epoch": 4691} {"train_loss": -7.180504810242426, "global_step": 197063, "epoch": 4691, "val_loss": 68956.2421875} {"train_loss": -7.146997451782227, "global_step": 197064, "epoch": 4692} {"train_loss": -7.166373252868652, "global_step": 197065, "epoch": 4692} {"train_loss": -7.1970744132995605, "global_step": 197066, "epoch": 4692} {"train_loss": -7.014904975891113, "global_step": 197067, "epoch": 4692} {"train_loss": -7.206228733062744, "global_step": 197068, "epoch": 4692} {"train_loss": -7.133732795715332, "global_step": 197069, "epoch": 4692} {"train_loss": -7.213288307189941, "global_step": 197070, "epoch": 4692} {"train_loss": -7.143954277038574, "global_step": 197071, "epoch": 4692} {"train_loss": -7.090108871459961, "global_step": 197072, "epoch": 4692} {"train_loss": -7.196035385131836, "global_step": 197073, "epoch": 4692} {"train_loss": -7.135309219360352, "global_step": 197074, "epoch": 4692} {"train_loss": -7.256667137145996, "global_step": 197075, "epoch": 4692} {"train_loss": -7.293957710266113, "global_step": 197076, "epoch": 4692} {"train_loss": -7.210179328918457, "global_step": 197077, "epoch": 4692} {"train_loss": -7.218023300170898, "global_step": 197078, "epoch": 4692} {"train_loss": -7.228765487670898, "global_step": 197079, "epoch": 4692} {"train_loss": -7.254034996032715, "global_step": 197080, "epoch": 4692} {"train_loss": -7.228372573852539, "global_step": 197081, "epoch": 4692} {"train_loss": -7.140384674072266, "global_step": 197082, "epoch": 4692} {"train_loss": -7.012195110321045, "global_step": 197083, "epoch": 4692} {"train_loss": -7.107273101806641, "global_step": 197084, "epoch": 4692} {"train_loss": -7.239246368408203, "global_step": 197085, "epoch": 4692} {"train_loss": -7.05441951751709, "global_step": 197086, "epoch": 4692} {"train_loss": -7.182861328125, "global_step": 197087, "epoch": 4692} {"train_loss": -7.120845794677734, "global_step": 197088, "epoch": 4692} {"train_loss": -7.240473747253418, "global_step": 197089, "epoch": 4692} {"train_loss": -7.178348541259766, "global_step": 197090, "epoch": 4692} {"train_loss": -7.016870498657227, "global_step": 197091, "epoch": 4692} {"train_loss": -7.161187171936035, "global_step": 197092, "epoch": 4692} {"train_loss": -7.222936153411865, "global_step": 197093, "epoch": 4692} {"train_loss": -7.234201431274414, "global_step": 197094, "epoch": 4692} {"train_loss": -7.242275238037109, "global_step": 197095, "epoch": 4692} {"train_loss": -7.300102233886719, "global_step": 197096, "epoch": 4692} {"train_loss": -7.1593828201293945, "global_step": 197097, "epoch": 4692} {"train_loss": -7.150415897369385, "global_step": 197098, "epoch": 4692} {"train_loss": -7.1999945640563965, "global_step": 197099, "epoch": 4692} {"train_loss": -7.2082061767578125, "global_step": 197100, "epoch": 4692} {"train_loss": -7.175021171569824, "global_step": 197101, "epoch": 4692} {"train_loss": -7.229489803314209, "global_step": 197102, "epoch": 4692} {"train_loss": -7.108823776245117, "global_step": 197103, "epoch": 4692} {"train_loss": -7.2120361328125, "global_step": 197104, "epoch": 4692} {"train_loss": -7.177747431255522, "global_step": 197105, "epoch": 4692, "val_loss": 68764.109375} {"train_loss": -7.274931907653809, "global_step": 197106, "epoch": 4693} {"train_loss": -7.168061256408691, "global_step": 197107, "epoch": 4693} {"train_loss": -7.216630935668945, "global_step": 197108, "epoch": 4693} {"train_loss": -7.183093547821045, "global_step": 197109, "epoch": 4693} {"train_loss": -7.232985496520996, "global_step": 197110, "epoch": 4693} {"train_loss": -7.222171783447266, "global_step": 197111, "epoch": 4693} {"train_loss": -7.269979000091553, "global_step": 197112, "epoch": 4693} {"train_loss": -7.254823684692383, "global_step": 197113, "epoch": 4693} {"train_loss": -7.311249732971191, "global_step": 197114, "epoch": 4693} {"train_loss": -7.289206504821777, "global_step": 197115, "epoch": 4693} {"train_loss": -7.257411479949951, "global_step": 197116, "epoch": 4693} {"train_loss": -7.290076732635498, "global_step": 197117, "epoch": 4693} {"train_loss": -7.277026176452637, "global_step": 197118, "epoch": 4693} {"train_loss": -7.184390068054199, "global_step": 197119, "epoch": 4693} {"train_loss": -7.204239845275879, "global_step": 197120, "epoch": 4693} {"train_loss": -7.327437400817871, "global_step": 197121, "epoch": 4693} {"train_loss": -7.276211738586426, "global_step": 197122, "epoch": 4693} {"train_loss": -7.2480692863464355, "global_step": 197123, "epoch": 4693} {"train_loss": -7.247501373291016, "global_step": 197124, "epoch": 4693} {"train_loss": -7.284834861755371, "global_step": 197125, "epoch": 4693} {"train_loss": -7.210946083068848, "global_step": 197126, "epoch": 4693} {"train_loss": -7.196743965148926, "global_step": 197127, "epoch": 4693} {"train_loss": -7.223278045654297, "global_step": 197128, "epoch": 4693} {"train_loss": -7.308501243591309, "global_step": 197129, "epoch": 4693} {"train_loss": -7.223181247711182, "global_step": 197130, "epoch": 4693} {"train_loss": -7.300681114196777, "global_step": 197131, "epoch": 4693} {"train_loss": -7.305100917816162, "global_step": 197132, "epoch": 4693} {"train_loss": -7.334521293640137, "global_step": 197133, "epoch": 4693} {"train_loss": -7.203046798706055, "global_step": 197134, "epoch": 4693} {"train_loss": -7.201682090759277, "global_step": 197135, "epoch": 4693} {"train_loss": -7.176167011260986, "global_step": 197136, "epoch": 4693} {"train_loss": -7.134908676147461, "global_step": 197137, "epoch": 4693} {"train_loss": -7.282010078430176, "global_step": 197138, "epoch": 4693} {"train_loss": -7.192109107971191, "global_step": 197139, "epoch": 4693} {"train_loss": -7.184002876281738, "global_step": 197140, "epoch": 4693} {"train_loss": -7.146055221557617, "global_step": 197141, "epoch": 4693} {"train_loss": -7.169171333312988, "global_step": 197142, "epoch": 4693} {"train_loss": -7.331674575805664, "global_step": 197143, "epoch": 4693} {"train_loss": -7.150517463684082, "global_step": 197144, "epoch": 4693} {"train_loss": -7.1467156410217285, "global_step": 197145, "epoch": 4693} {"train_loss": -7.15291690826416, "global_step": 197146, "epoch": 4693} {"train_loss": -7.229431867599487, "global_step": 197147, "epoch": 4693, "val_loss": 68909.4609375} {"train_loss": -7.294182300567627, "global_step": 197148, "epoch": 4694} {"train_loss": -7.085658073425293, "global_step": 197149, "epoch": 4694} {"train_loss": -7.13835334777832, "global_step": 197150, "epoch": 4694} {"train_loss": -7.238816261291504, "global_step": 197151, "epoch": 4694} {"train_loss": -7.2552900314331055, "global_step": 197152, "epoch": 4694} {"train_loss": -7.267779350280762, "global_step": 197153, "epoch": 4694} {"train_loss": -7.3363356590271, "global_step": 197154, "epoch": 4694} {"train_loss": -7.324091911315918, "global_step": 197155, "epoch": 4694} {"train_loss": -7.166836738586426, "global_step": 197156, "epoch": 4694} {"train_loss": -7.262004375457764, "global_step": 197157, "epoch": 4694} {"train_loss": -7.265797138214111, "global_step": 197158, "epoch": 4694} {"train_loss": -7.1395392417907715, "global_step": 197159, "epoch": 4694} {"train_loss": -7.253516674041748, "global_step": 197160, "epoch": 4694} {"train_loss": -7.277684688568115, "global_step": 197161, "epoch": 4694} {"train_loss": -7.2337965965271, "global_step": 197162, "epoch": 4694} {"train_loss": -7.1961774826049805, "global_step": 197163, "epoch": 4694} {"train_loss": -7.283617973327637, "global_step": 197164, "epoch": 4694} {"train_loss": -7.077912330627441, "global_step": 197165, "epoch": 4694} {"train_loss": -7.293072700500488, "global_step": 197166, "epoch": 4694} {"train_loss": -7.202984809875488, "global_step": 197167, "epoch": 4694} {"train_loss": -7.25358247756958, "global_step": 197168, "epoch": 4694} {"train_loss": -7.270204067230225, "global_step": 197169, "epoch": 4694} {"train_loss": -7.2263689041137695, "global_step": 197170, "epoch": 4694} {"train_loss": -7.222928047180176, "global_step": 197171, "epoch": 4694} {"train_loss": -7.205959320068359, "global_step": 197172, "epoch": 4694} {"train_loss": -7.32014274597168, "global_step": 197173, "epoch": 4694} {"train_loss": -7.254451274871826, "global_step": 197174, "epoch": 4694} {"train_loss": -7.209384918212891, "global_step": 197175, "epoch": 4694} {"train_loss": -7.22865104675293, "global_step": 197176, "epoch": 4694} {"train_loss": -7.247153282165527, "global_step": 197177, "epoch": 4694} {"train_loss": -7.227398872375488, "global_step": 197178, "epoch": 4694} {"train_loss": -7.237597465515137, "global_step": 197179, "epoch": 4694} {"train_loss": -7.245489120483398, "global_step": 197180, "epoch": 4694} {"train_loss": -7.151828765869141, "global_step": 197181, "epoch": 4694} {"train_loss": -7.290324687957764, "global_step": 197182, "epoch": 4694} {"train_loss": -7.218766212463379, "global_step": 197183, "epoch": 4694} {"train_loss": -7.200204849243164, "global_step": 197184, "epoch": 4694} {"train_loss": -7.208366394042969, "global_step": 197185, "epoch": 4694} {"train_loss": -7.213070869445801, "global_step": 197186, "epoch": 4694} {"train_loss": -7.358310222625732, "global_step": 197187, "epoch": 4694} {"train_loss": -7.152990341186523, "global_step": 197188, "epoch": 4694} {"train_loss": -7.234257857004802, "global_step": 197189, "epoch": 4694, "val_loss": 69133.8515625} {"train_loss": -7.259951591491699, "global_step": 197190, "epoch": 4695} {"train_loss": -7.124463081359863, "global_step": 197191, "epoch": 4695} {"train_loss": -7.179350852966309, "global_step": 197192, "epoch": 4695} {"train_loss": -7.266477108001709, "global_step": 197193, "epoch": 4695} {"train_loss": -7.285155296325684, "global_step": 197194, "epoch": 4695} {"train_loss": -7.129175186157227, "global_step": 197195, "epoch": 4695} {"train_loss": -7.134082794189453, "global_step": 197196, "epoch": 4695} {"train_loss": -7.2763800621032715, "global_step": 197197, "epoch": 4695} {"train_loss": -7.314877033233643, "global_step": 197198, "epoch": 4695} {"train_loss": -7.168222427368164, "global_step": 197199, "epoch": 4695} {"train_loss": -7.289296627044678, "global_step": 197200, "epoch": 4695} {"train_loss": -7.093222618103027, "global_step": 197201, "epoch": 4695} {"train_loss": -7.115510940551758, "global_step": 197202, "epoch": 4695} {"train_loss": -7.210452079772949, "global_step": 197203, "epoch": 4695} {"train_loss": -7.096624374389648, "global_step": 197204, "epoch": 4695} {"train_loss": -7.184152603149414, "global_step": 197205, "epoch": 4695} {"train_loss": -7.003916263580322, "global_step": 197206, "epoch": 4695} {"train_loss": -7.176017761230469, "global_step": 197207, "epoch": 4695} {"train_loss": -7.104156017303467, "global_step": 197208, "epoch": 4695} {"train_loss": -7.103666305541992, "global_step": 197209, "epoch": 4695} {"train_loss": -7.195826530456543, "global_step": 197210, "epoch": 4695} {"train_loss": -7.105587005615234, "global_step": 197211, "epoch": 4695} {"train_loss": -7.16242790222168, "global_step": 197212, "epoch": 4695} {"train_loss": -7.2887959480285645, "global_step": 197213, "epoch": 4695} {"train_loss": -7.2445878982543945, "global_step": 197214, "epoch": 4695} {"train_loss": -7.109152793884277, "global_step": 197215, "epoch": 4695} {"train_loss": -7.090813159942627, "global_step": 197216, "epoch": 4695} {"train_loss": -7.211490154266357, "global_step": 197217, "epoch": 4695} {"train_loss": -7.1879167556762695, "global_step": 197218, "epoch": 4695} {"train_loss": -7.291584014892578, "global_step": 197219, "epoch": 4695} {"train_loss": -7.149593830108643, "global_step": 197220, "epoch": 4695} {"train_loss": -7.086428642272949, "global_step": 197221, "epoch": 4695} {"train_loss": -7.057739734649658, "global_step": 197222, "epoch": 4695} {"train_loss": -7.099342346191406, "global_step": 197223, "epoch": 4695} {"train_loss": -7.154858589172363, "global_step": 197224, "epoch": 4695} {"train_loss": -7.1354827880859375, "global_step": 197225, "epoch": 4695} {"train_loss": -7.153684616088867, "global_step": 197226, "epoch": 4695} {"train_loss": -7.174978256225586, "global_step": 197227, "epoch": 4695} {"train_loss": -7.013592720031738, "global_step": 197228, "epoch": 4695} {"train_loss": -7.000012397766113, "global_step": 197229, "epoch": 4695} {"train_loss": -7.16342306137085, "global_step": 197230, "epoch": 4695} {"train_loss": -7.156531822113764, "global_step": 197231, "epoch": 4695, "val_loss": 69162.953125} {"train_loss": -7.236496448516846, "global_step": 197232, "epoch": 4696} {"train_loss": -7.042886734008789, "global_step": 197233, "epoch": 4696} {"train_loss": -7.061748504638672, "global_step": 197234, "epoch": 4696} {"train_loss": -7.06718635559082, "global_step": 197235, "epoch": 4696} {"train_loss": -7.125463962554932, "global_step": 197236, "epoch": 4696} {"train_loss": -7.136064529418945, "global_step": 197237, "epoch": 4696} {"train_loss": -7.0463457107543945, "global_step": 197238, "epoch": 4696} {"train_loss": -7.287355899810791, "global_step": 197239, "epoch": 4696} {"train_loss": -7.128165245056152, "global_step": 197240, "epoch": 4696} {"train_loss": -7.182157516479492, "global_step": 197241, "epoch": 4696} {"train_loss": -7.130743980407715, "global_step": 197242, "epoch": 4696} {"train_loss": -7.2169599533081055, "global_step": 197243, "epoch": 4696} {"train_loss": -7.103296279907227, "global_step": 197244, "epoch": 4696} {"train_loss": -7.211678981781006, "global_step": 197245, "epoch": 4696} {"train_loss": -7.205157279968262, "global_step": 197246, "epoch": 4696} {"train_loss": -7.147878646850586, "global_step": 197247, "epoch": 4696} {"train_loss": -7.188170433044434, "global_step": 197248, "epoch": 4696} {"train_loss": -7.0990095138549805, "global_step": 197249, "epoch": 4696} {"train_loss": -7.082507133483887, "global_step": 197250, "epoch": 4696} {"train_loss": -7.118607521057129, "global_step": 197251, "epoch": 4696} {"train_loss": -7.195511817932129, "global_step": 197252, "epoch": 4696} {"train_loss": -7.159387588500977, "global_step": 197253, "epoch": 4696} {"train_loss": -7.038589000701904, "global_step": 197254, "epoch": 4696} {"train_loss": -7.194141864776611, "global_step": 197255, "epoch": 4696} {"train_loss": -7.16903018951416, "global_step": 197256, "epoch": 4696} {"train_loss": -7.298357963562012, "global_step": 197257, "epoch": 4696} {"train_loss": -7.257680416107178, "global_step": 197258, "epoch": 4696} {"train_loss": -7.1879143714904785, "global_step": 197259, "epoch": 4696} {"train_loss": -7.170805931091309, "global_step": 197260, "epoch": 4696} {"train_loss": -7.252198219299316, "global_step": 197261, "epoch": 4696} {"train_loss": -7.109082221984863, "global_step": 197262, "epoch": 4696} {"train_loss": -6.996687412261963, "global_step": 197263, "epoch": 4696} {"train_loss": -7.258021354675293, "global_step": 197264, "epoch": 4696} {"train_loss": -7.189888954162598, "global_step": 197265, "epoch": 4696} {"train_loss": -7.181483268737793, "global_step": 197266, "epoch": 4696} {"train_loss": -7.236574649810791, "global_step": 197267, "epoch": 4696} {"train_loss": -7.1300764083862305, "global_step": 197268, "epoch": 4696} {"train_loss": -7.1460137367248535, "global_step": 197269, "epoch": 4696} {"train_loss": -7.147918701171875, "global_step": 197270, "epoch": 4696} {"train_loss": -7.093982219696045, "global_step": 197271, "epoch": 4696} {"train_loss": -7.219637870788574, "global_step": 197272, "epoch": 4696} {"train_loss": -7.156238521848406, "global_step": 197273, "epoch": 4696, "val_loss": 69100.0} {"train_loss": -7.184601306915283, "global_step": 197274, "epoch": 4697} {"train_loss": -7.1865034103393555, "global_step": 197275, "epoch": 4697} {"train_loss": -7.084865570068359, "global_step": 197276, "epoch": 4697} {"train_loss": -7.0907158851623535, "global_step": 197277, "epoch": 4697} {"train_loss": -7.127103805541992, "global_step": 197278, "epoch": 4697} {"train_loss": -7.147608757019043, "global_step": 197279, "epoch": 4697} {"train_loss": -7.063787460327148, "global_step": 197280, "epoch": 4697} {"train_loss": -7.308780193328857, "global_step": 197281, "epoch": 4697} {"train_loss": -7.231653213500977, "global_step": 197282, "epoch": 4697} {"train_loss": -7.279826641082764, "global_step": 197283, "epoch": 4697} {"train_loss": -7.328797340393066, "global_step": 197284, "epoch": 4697} {"train_loss": -7.195036888122559, "global_step": 197285, "epoch": 4697} {"train_loss": -7.183557510375977, "global_step": 197286, "epoch": 4697} {"train_loss": -7.153897285461426, "global_step": 197287, "epoch": 4697} {"train_loss": -7.1027045249938965, "global_step": 197288, "epoch": 4697} {"train_loss": -7.190877914428711, "global_step": 197289, "epoch": 4697} {"train_loss": -7.159975051879883, "global_step": 197290, "epoch": 4697} {"train_loss": -7.138293266296387, "global_step": 197291, "epoch": 4697} {"train_loss": -7.15002965927124, "global_step": 197292, "epoch": 4697} {"train_loss": -7.155484199523926, "global_step": 197293, "epoch": 4697} {"train_loss": -7.230759620666504, "global_step": 197294, "epoch": 4697} {"train_loss": -7.169561386108398, "global_step": 197295, "epoch": 4697} {"train_loss": -7.2129106521606445, "global_step": 197296, "epoch": 4697} {"train_loss": -7.224672317504883, "global_step": 197297, "epoch": 4697} {"train_loss": -7.206943511962891, "global_step": 197298, "epoch": 4697} {"train_loss": -7.2333526611328125, "global_step": 197299, "epoch": 4697} {"train_loss": -7.110715866088867, "global_step": 197300, "epoch": 4697} {"train_loss": -7.264193534851074, "global_step": 197301, "epoch": 4697} {"train_loss": -7.268430709838867, "global_step": 197302, "epoch": 4697} {"train_loss": -7.288680076599121, "global_step": 197303, "epoch": 4697} {"train_loss": -7.1463470458984375, "global_step": 197304, "epoch": 4697} {"train_loss": -7.212010860443115, "global_step": 197305, "epoch": 4697} {"train_loss": -7.26792049407959, "global_step": 197306, "epoch": 4697} {"train_loss": -7.23285436630249, "global_step": 197307, "epoch": 4697} {"train_loss": -7.073675632476807, "global_step": 197308, "epoch": 4697} {"train_loss": -7.214608669281006, "global_step": 197309, "epoch": 4697} {"train_loss": -7.207590579986572, "global_step": 197310, "epoch": 4697} {"train_loss": -7.222597599029541, "global_step": 197311, "epoch": 4697} {"train_loss": -7.2475905418396, "global_step": 197312, "epoch": 4697} {"train_loss": -7.292121410369873, "global_step": 197313, "epoch": 4697} {"train_loss": -7.348288536071777, "global_step": 197314, "epoch": 4697} {"train_loss": -7.1997832003093905, "global_step": 197315, "epoch": 4697, "val_loss": 69078.0703125} {"train_loss": -7.158796787261963, "global_step": 197316, "epoch": 4698} {"train_loss": -7.2418060302734375, "global_step": 197317, "epoch": 4698} {"train_loss": -7.285397052764893, "global_step": 197318, "epoch": 4698} {"train_loss": -7.313784122467041, "global_step": 197319, "epoch": 4698} {"train_loss": -7.305729866027832, "global_step": 197320, "epoch": 4698} {"train_loss": -7.254330635070801, "global_step": 197321, "epoch": 4698} {"train_loss": -7.283725738525391, "global_step": 197322, "epoch": 4698} {"train_loss": -7.433167457580566, "global_step": 197323, "epoch": 4698} {"train_loss": -7.291416168212891, "global_step": 197324, "epoch": 4698} {"train_loss": -7.334932327270508, "global_step": 197325, "epoch": 4698} {"train_loss": -7.193975448608398, "global_step": 197326, "epoch": 4698} {"train_loss": -7.122536659240723, "global_step": 197327, "epoch": 4698} {"train_loss": -7.271582126617432, "global_step": 197328, "epoch": 4698} {"train_loss": -7.283790588378906, "global_step": 197329, "epoch": 4698} {"train_loss": -7.277191638946533, "global_step": 197330, "epoch": 4698} {"train_loss": -7.247078895568848, "global_step": 197331, "epoch": 4698} {"train_loss": -7.2991533279418945, "global_step": 197332, "epoch": 4698} {"train_loss": -7.144718647003174, "global_step": 197333, "epoch": 4698} {"train_loss": -7.184847831726074, "global_step": 197334, "epoch": 4698} {"train_loss": -7.171716690063477, "global_step": 197335, "epoch": 4698} {"train_loss": -7.030416488647461, "global_step": 197336, "epoch": 4698} {"train_loss": -7.098568916320801, "global_step": 197337, "epoch": 4698} {"train_loss": -6.9616475105285645, "global_step": 197338, "epoch": 4698} {"train_loss": -7.167160987854004, "global_step": 197339, "epoch": 4698} {"train_loss": -7.061307907104492, "global_step": 197340, "epoch": 4698} {"train_loss": -7.1703643798828125, "global_step": 197341, "epoch": 4698} {"train_loss": -7.224379062652588, "global_step": 197342, "epoch": 4698} {"train_loss": -6.956589221954346, "global_step": 197343, "epoch": 4698} {"train_loss": -7.141592979431152, "global_step": 197344, "epoch": 4698} {"train_loss": -7.139647006988525, "global_step": 197345, "epoch": 4698} {"train_loss": -7.167238235473633, "global_step": 197346, "epoch": 4698} {"train_loss": -7.195850372314453, "global_step": 197347, "epoch": 4698} {"train_loss": -7.095381736755371, "global_step": 197348, "epoch": 4698} {"train_loss": -7.159553527832031, "global_step": 197349, "epoch": 4698} {"train_loss": -7.151960372924805, "global_step": 197350, "epoch": 4698} {"train_loss": -7.220114707946777, "global_step": 197351, "epoch": 4698} {"train_loss": -7.216789722442627, "global_step": 197352, "epoch": 4698} {"train_loss": -7.12642765045166, "global_step": 197353, "epoch": 4698} {"train_loss": -7.117987632751465, "global_step": 197354, "epoch": 4698} {"train_loss": -7.20631217956543, "global_step": 197355, "epoch": 4698} {"train_loss": -7.219526290893555, "global_step": 197356, "epoch": 4698} {"train_loss": -7.192048595065162, "global_step": 197357, "epoch": 4698, "val_loss": 69022.578125} {"train_loss": -7.275974273681641, "global_step": 197358, "epoch": 4699} {"train_loss": -7.185478210449219, "global_step": 197359, "epoch": 4699} {"train_loss": -7.273045539855957, "global_step": 197360, "epoch": 4699} {"train_loss": -7.220005989074707, "global_step": 197361, "epoch": 4699} {"train_loss": -7.269723892211914, "global_step": 197362, "epoch": 4699} {"train_loss": -7.2173261642456055, "global_step": 197363, "epoch": 4699} {"train_loss": -7.197237968444824, "global_step": 197364, "epoch": 4699} {"train_loss": -7.221055030822754, "global_step": 197365, "epoch": 4699} {"train_loss": -7.173280715942383, "global_step": 197366, "epoch": 4699} {"train_loss": -7.177009105682373, "global_step": 197367, "epoch": 4699} {"train_loss": -7.181858539581299, "global_step": 197368, "epoch": 4699} {"train_loss": -7.068829536437988, "global_step": 197369, "epoch": 4699} {"train_loss": -7.088980674743652, "global_step": 197370, "epoch": 4699} {"train_loss": -7.275059700012207, "global_step": 197371, "epoch": 4699} {"train_loss": -7.153697490692139, "global_step": 197372, "epoch": 4699} {"train_loss": -7.22673225402832, "global_step": 197373, "epoch": 4699} {"train_loss": -7.183082580566406, "global_step": 197374, "epoch": 4699} {"train_loss": -7.202854156494141, "global_step": 197375, "epoch": 4699} {"train_loss": -7.211289405822754, "global_step": 197376, "epoch": 4699} {"train_loss": -7.1691083908081055, "global_step": 197377, "epoch": 4699} {"train_loss": -7.249429702758789, "global_step": 197378, "epoch": 4699} {"train_loss": -7.224298477172852, "global_step": 197379, "epoch": 4699} {"train_loss": -7.181160926818848, "global_step": 197380, "epoch": 4699} {"train_loss": -7.366440773010254, "global_step": 197381, "epoch": 4699} {"train_loss": -7.197780132293701, "global_step": 197382, "epoch": 4699} {"train_loss": -7.2344865798950195, "global_step": 197383, "epoch": 4699} {"train_loss": -7.243595123291016, "global_step": 197384, "epoch": 4699} {"train_loss": -7.221391677856445, "global_step": 197385, "epoch": 4699} {"train_loss": -7.220859050750732, "global_step": 197386, "epoch": 4699} {"train_loss": -7.23669958114624, "global_step": 197387, "epoch": 4699} {"train_loss": -7.2352752685546875, "global_step": 197388, "epoch": 4699} {"train_loss": -7.294933319091797, "global_step": 197389, "epoch": 4699} {"train_loss": -7.253866195678711, "global_step": 197390, "epoch": 4699} {"train_loss": -7.206791877746582, "global_step": 197391, "epoch": 4699} {"train_loss": -7.357356071472168, "global_step": 197392, "epoch": 4699} {"train_loss": -7.254850387573242, "global_step": 197393, "epoch": 4699} {"train_loss": -7.212630748748779, "global_step": 197394, "epoch": 4699} {"train_loss": -7.20546817779541, "global_step": 197395, "epoch": 4699} {"train_loss": -7.277980804443359, "global_step": 197396, "epoch": 4699} {"train_loss": -7.266277313232422, "global_step": 197397, "epoch": 4699} {"train_loss": -7.2750396728515625, "global_step": 197398, "epoch": 4699} {"train_loss": -7.227975186847505, "global_step": 197399, "epoch": 4699, "val_loss": 68948.640625} {"train_loss": -7.270000457763672, "global_step": 197400, "epoch": 4700} {"train_loss": -7.376446723937988, "global_step": 197401, "epoch": 4700} {"train_loss": -7.25261926651001, "global_step": 197402, "epoch": 4700} {"train_loss": -7.124240875244141, "global_step": 197403, "epoch": 4700} {"train_loss": -7.225795745849609, "global_step": 197404, "epoch": 4700} {"train_loss": -7.249786376953125, "global_step": 197405, "epoch": 4700} {"train_loss": -7.28525447845459, "global_step": 197406, "epoch": 4700} {"train_loss": -7.393674373626709, "global_step": 197407, "epoch": 4700} {"train_loss": -7.219472885131836, "global_step": 197408, "epoch": 4700} {"train_loss": -7.050906181335449, "global_step": 197409, "epoch": 4700} {"train_loss": -7.218721389770508, "global_step": 197410, "epoch": 4700} {"train_loss": -7.238110542297363, "global_step": 197411, "epoch": 4700} {"train_loss": -6.973029136657715, "global_step": 197412, "epoch": 4700} {"train_loss": -7.223141193389893, "global_step": 197413, "epoch": 4700} {"train_loss": -7.180653095245361, "global_step": 197414, "epoch": 4700} {"train_loss": -7.213518142700195, "global_step": 197415, "epoch": 4700} {"train_loss": -7.165348052978516, "global_step": 197416, "epoch": 4700} {"train_loss": -7.228020191192627, "global_step": 197417, "epoch": 4700} {"train_loss": -7.260056972503662, "global_step": 197418, "epoch": 4700} {"train_loss": -7.142378807067871, "global_step": 197419, "epoch": 4700} {"train_loss": -7.175297737121582, "global_step": 197420, "epoch": 4700} {"train_loss": -7.263498306274414, "global_step": 197421, "epoch": 4700} {"train_loss": -7.1975603103637695, "global_step": 197422, "epoch": 4700} {"train_loss": -7.303217887878418, "global_step": 197423, "epoch": 4700} {"train_loss": -7.224624156951904, "global_step": 197424, "epoch": 4700} {"train_loss": -7.1720123291015625, "global_step": 197425, "epoch": 4700} {"train_loss": -7.249682426452637, "global_step": 197426, "epoch": 4700} {"train_loss": -7.20758581161499, "global_step": 197427, "epoch": 4700} {"train_loss": -7.2263078689575195, "global_step": 197428, "epoch": 4700} {"train_loss": -7.253013610839844, "global_step": 197429, "epoch": 4700} {"train_loss": -7.308882713317871, "global_step": 197430, "epoch": 4700} {"train_loss": -7.146444797515869, "global_step": 197431, "epoch": 4700} {"train_loss": -7.2947187423706055, "global_step": 197432, "epoch": 4700} {"train_loss": -7.3145270347595215, "global_step": 197433, "epoch": 4700} {"train_loss": -7.231689453125, "global_step": 197434, "epoch": 4700} {"train_loss": -7.170623302459717, "global_step": 197435, "epoch": 4700} {"train_loss": -7.0815324783325195, "global_step": 197436, "epoch": 4700} {"train_loss": -7.279569149017334, "global_step": 197437, "epoch": 4700} {"train_loss": -7.150630474090576, "global_step": 197438, "epoch": 4700} {"train_loss": -7.166545391082764, "global_step": 197439, "epoch": 4700} {"train_loss": -7.040124893188477, "global_step": 197440, "epoch": 4700} {"train_loss": -7.213143643878755, "global_step": 197441, "epoch": 4700, "train/sim_max_reward_0": 0.2155903522071284, "train/sim_max_reward_1": 0.9326034323267655, "train/sim_max_reward_2": 0.3091069785133158, "train/sim_max_reward_3": 0.9682831048232177, "train/sim_max_reward_4": 0.9604973706000304, "train/sim_max_reward_5": 0.8882754073101196, "test/sim_max_reward_4400000": 0.926598005611529, "test/sim_max_reward_4400001": 0.22276731418810067, "test/sim_max_reward_4400002": 0.8631144798101633, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29836393642439696, "test/sim_max_reward_4400009": 0.9977532407660814, "test/sim_max_reward_4400010": 0.19405934347655773, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9590097146099327, "test/sim_max_reward_4400014": 0.9923165838556047, "test/sim_max_reward_4400015": 0.03179309320645017, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2671610226894925, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9097889418287941, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.9912971618575709, "test/sim_max_reward_4400025": 0.26693736937599455, "test/sim_max_reward_4400026": 0.2602296510957385, "test/sim_max_reward_4400027": 0.000777676037298043, "test/sim_max_reward_4400028": 0.4002885629824532, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9678120682575856, "test/sim_max_reward_4400031": 0.9586415773512337, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 0.9806969642714053, "test/sim_max_reward_4400035": 0.9522189859016953, "test/sim_max_reward_4400036": 0.5247233687512698, "test/sim_max_reward_4400037": 0.8843629658616408, "test/sim_max_reward_4400038": 0.2040082182189254, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.5331561889087423, "test/sim_max_reward_4400043": 0.9674502447834729, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9924292736332937, "test/sim_max_reward_4400046": 0.9563922098613873, "test/sim_max_reward_4400047": 0.9351017282425088, "test/sim_max_reward_4400048": 0.08730222284544824, "test/sim_max_reward_4400049": 0.9276337834324263, "train/mean_score": 0.712392774296763, "test/mean_score": 0.5600118260854883, "val_loss": 69042.53125} {"train_loss": -7.108595371246338, "global_step": 197442, "epoch": 4701} {"train_loss": -7.166873931884766, "global_step": 197443, "epoch": 4701} {"train_loss": -7.132688522338867, "global_step": 197444, "epoch": 4701} {"train_loss": -7.189944267272949, "global_step": 197445, "epoch": 4701} {"train_loss": -7.071423530578613, "global_step": 197446, "epoch": 4701} {"train_loss": -7.217207431793213, "global_step": 197447, "epoch": 4701} {"train_loss": -7.234466075897217, "global_step": 197448, "epoch": 4701} {"train_loss": -7.152709484100342, "global_step": 197449, "epoch": 4701} {"train_loss": -7.1152191162109375, "global_step": 197450, "epoch": 4701} {"train_loss": -7.1187663078308105, "global_step": 197451, "epoch": 4701} {"train_loss": -7.163379669189453, "global_step": 197452, "epoch": 4701} {"train_loss": -7.195258140563965, "global_step": 197453, "epoch": 4701} {"train_loss": -7.260169506072998, "global_step": 197454, "epoch": 4701} {"train_loss": -7.192976951599121, "global_step": 197455, "epoch": 4701} {"train_loss": -7.277815818786621, "global_step": 197456, "epoch": 4701} {"train_loss": -7.19827938079834, "global_step": 197457, "epoch": 4701} {"train_loss": -7.276556968688965, "global_step": 197458, "epoch": 4701} {"train_loss": -7.250845432281494, "global_step": 197459, "epoch": 4701} {"train_loss": -7.251162528991699, "global_step": 197460, "epoch": 4701} {"train_loss": -7.184876441955566, "global_step": 197461, "epoch": 4701} {"train_loss": -7.307078838348389, "global_step": 197462, "epoch": 4701} {"train_loss": -7.209593772888184, "global_step": 197463, "epoch": 4701} {"train_loss": -7.201970100402832, "global_step": 197464, "epoch": 4701} {"train_loss": -7.183649063110352, "global_step": 197465, "epoch": 4701} {"train_loss": -7.093977928161621, "global_step": 197466, "epoch": 4701} {"train_loss": -7.211378574371338, "global_step": 197467, "epoch": 4701} {"train_loss": -7.166454315185547, "global_step": 197468, "epoch": 4701} {"train_loss": -7.174508571624756, "global_step": 197469, "epoch": 4701} {"train_loss": -7.221183776855469, "global_step": 197470, "epoch": 4701} {"train_loss": -7.234889507293701, "global_step": 197471, "epoch": 4701} {"train_loss": -7.16133451461792, "global_step": 197472, "epoch": 4701} {"train_loss": -7.183780670166016, "global_step": 197473, "epoch": 4701} {"train_loss": -7.192875862121582, "global_step": 197474, "epoch": 4701} {"train_loss": -7.289003372192383, "global_step": 197475, "epoch": 4701} {"train_loss": -7.073299407958984, "global_step": 197476, "epoch": 4701} {"train_loss": -7.195958614349365, "global_step": 197477, "epoch": 4701} {"train_loss": -7.1830549240112305, "global_step": 197478, "epoch": 4701} {"train_loss": -7.224382400512695, "global_step": 197479, "epoch": 4701} {"train_loss": -7.260367393493652, "global_step": 197480, "epoch": 4701} {"train_loss": -7.183480262756348, "global_step": 197481, "epoch": 4701} {"train_loss": -7.289172649383545, "global_step": 197482, "epoch": 4701} {"train_loss": -7.195778267724173, "global_step": 197483, "epoch": 4701, "val_loss": 69057.8046875} {"train_loss": -7.234246253967285, "global_step": 197484, "epoch": 4702} {"train_loss": -7.2438249588012695, "global_step": 197485, "epoch": 4702} {"train_loss": -7.320019721984863, "global_step": 197486, "epoch": 4702} {"train_loss": -7.323225021362305, "global_step": 197487, "epoch": 4702} {"train_loss": -7.1963958740234375, "global_step": 197488, "epoch": 4702} {"train_loss": -7.230559349060059, "global_step": 197489, "epoch": 4702} {"train_loss": -7.2046709060668945, "global_step": 197490, "epoch": 4702} {"train_loss": -7.128647804260254, "global_step": 197491, "epoch": 4702} {"train_loss": -7.313360691070557, "global_step": 197492, "epoch": 4702} {"train_loss": -7.376386642456055, "global_step": 197493, "epoch": 4702} {"train_loss": -7.180233955383301, "global_step": 197494, "epoch": 4702} {"train_loss": -7.233076572418213, "global_step": 197495, "epoch": 4702} {"train_loss": -7.2416229248046875, "global_step": 197496, "epoch": 4702} {"train_loss": -7.278359413146973, "global_step": 197497, "epoch": 4702} {"train_loss": -7.223316669464111, "global_step": 197498, "epoch": 4702} {"train_loss": -7.144814491271973, "global_step": 197499, "epoch": 4702} {"train_loss": -7.130378723144531, "global_step": 197500, "epoch": 4702} {"train_loss": -7.2931365966796875, "global_step": 197501, "epoch": 4702} {"train_loss": -7.184110641479492, "global_step": 197502, "epoch": 4702} {"train_loss": -7.176995277404785, "global_step": 197503, "epoch": 4702} {"train_loss": -7.14114236831665, "global_step": 197504, "epoch": 4702} {"train_loss": -7.185325622558594, "global_step": 197505, "epoch": 4702} {"train_loss": -7.091249465942383, "global_step": 197506, "epoch": 4702} {"train_loss": -7.105915546417236, "global_step": 197507, "epoch": 4702} {"train_loss": -7.272708892822266, "global_step": 197508, "epoch": 4702} {"train_loss": -7.161921501159668, "global_step": 197509, "epoch": 4702} {"train_loss": -7.240543365478516, "global_step": 197510, "epoch": 4702} {"train_loss": -7.228310585021973, "global_step": 197511, "epoch": 4702} {"train_loss": -7.319089889526367, "global_step": 197512, "epoch": 4702} {"train_loss": -7.189324855804443, "global_step": 197513, "epoch": 4702} {"train_loss": -7.222341537475586, "global_step": 197514, "epoch": 4702} {"train_loss": -7.068319320678711, "global_step": 197515, "epoch": 4702} {"train_loss": -7.1986799240112305, "global_step": 197516, "epoch": 4702} {"train_loss": -7.1642608642578125, "global_step": 197517, "epoch": 4702} {"train_loss": -6.912483215332031, "global_step": 197518, "epoch": 4702} {"train_loss": -7.008376121520996, "global_step": 197519, "epoch": 4702} {"train_loss": -7.031343460083008, "global_step": 197520, "epoch": 4702} {"train_loss": -7.0361151695251465, "global_step": 197521, "epoch": 4702} {"train_loss": -7.058841228485107, "global_step": 197522, "epoch": 4702} {"train_loss": -7.016458511352539, "global_step": 197523, "epoch": 4702} {"train_loss": -7.1011552810668945, "global_step": 197524, "epoch": 4702} {"train_loss": -7.176847946076166, "global_step": 197525, "epoch": 4702, "val_loss": 69128.7890625} {"train_loss": -7.0543718338012695, "global_step": 197526, "epoch": 4703} {"train_loss": -7.062192916870117, "global_step": 197527, "epoch": 4703} {"train_loss": -7.010448455810547, "global_step": 197528, "epoch": 4703} {"train_loss": -7.068620681762695, "global_step": 197529, "epoch": 4703} {"train_loss": -7.09531831741333, "global_step": 197530, "epoch": 4703} {"train_loss": -7.047043800354004, "global_step": 197531, "epoch": 4703} {"train_loss": -7.055189609527588, "global_step": 197532, "epoch": 4703} {"train_loss": -7.178995132446289, "global_step": 197533, "epoch": 4703} {"train_loss": -6.941582202911377, "global_step": 197534, "epoch": 4703} {"train_loss": -7.137350082397461, "global_step": 197535, "epoch": 4703} {"train_loss": -7.027723789215088, "global_step": 197536, "epoch": 4703} {"train_loss": -7.058383464813232, "global_step": 197537, "epoch": 4703} {"train_loss": -7.040652275085449, "global_step": 197538, "epoch": 4703} {"train_loss": -7.08112096786499, "global_step": 197539, "epoch": 4703} {"train_loss": -7.048583030700684, "global_step": 197540, "epoch": 4703} {"train_loss": -6.964972496032715, "global_step": 197541, "epoch": 4703} {"train_loss": -7.039340496063232, "global_step": 197542, "epoch": 4703} {"train_loss": -7.067296028137207, "global_step": 197543, "epoch": 4703} {"train_loss": -7.212802410125732, "global_step": 197544, "epoch": 4703} {"train_loss": -7.125709533691406, "global_step": 197545, "epoch": 4703} {"train_loss": -7.157034873962402, "global_step": 197546, "epoch": 4703} {"train_loss": -7.14836311340332, "global_step": 197547, "epoch": 4703} {"train_loss": -7.243529319763184, "global_step": 197548, "epoch": 4703} {"train_loss": -7.187707424163818, "global_step": 197549, "epoch": 4703} {"train_loss": -7.223541259765625, "global_step": 197550, "epoch": 4703} {"train_loss": -7.131016731262207, "global_step": 197551, "epoch": 4703} {"train_loss": -7.191985130310059, "global_step": 197552, "epoch": 4703} {"train_loss": -7.231566429138184, "global_step": 197553, "epoch": 4703} {"train_loss": -7.071500301361084, "global_step": 197554, "epoch": 4703} {"train_loss": -7.376131534576416, "global_step": 197555, "epoch": 4703} {"train_loss": -7.226879119873047, "global_step": 197556, "epoch": 4703} {"train_loss": -7.082456588745117, "global_step": 197557, "epoch": 4703} {"train_loss": -7.226509094238281, "global_step": 197558, "epoch": 4703} {"train_loss": -7.109424591064453, "global_step": 197559, "epoch": 4703} {"train_loss": -7.173737049102783, "global_step": 197560, "epoch": 4703} {"train_loss": -7.178243160247803, "global_step": 197561, "epoch": 4703} {"train_loss": -7.174922943115234, "global_step": 197562, "epoch": 4703} {"train_loss": -7.178067207336426, "global_step": 197563, "epoch": 4703} {"train_loss": -7.270905494689941, "global_step": 197564, "epoch": 4703} {"train_loss": -7.119524002075195, "global_step": 197565, "epoch": 4703} {"train_loss": -7.255019664764404, "global_step": 197566, "epoch": 4703} {"train_loss": -7.127520186560495, "global_step": 197567, "epoch": 4703, "val_loss": 69038.71875} {"train_loss": -7.20047664642334, "global_step": 197568, "epoch": 4704} {"train_loss": -7.238910675048828, "global_step": 197569, "epoch": 4704} {"train_loss": -7.101036548614502, "global_step": 197570, "epoch": 4704} {"train_loss": -7.299727916717529, "global_step": 197571, "epoch": 4704} {"train_loss": -7.0931878089904785, "global_step": 197572, "epoch": 4704} {"train_loss": -7.224640846252441, "global_step": 197573, "epoch": 4704} {"train_loss": -7.163111686706543, "global_step": 197574, "epoch": 4704} {"train_loss": -7.166999816894531, "global_step": 197575, "epoch": 4704} {"train_loss": -7.254819869995117, "global_step": 197576, "epoch": 4704} {"train_loss": -7.28230094909668, "global_step": 197577, "epoch": 4704} {"train_loss": -7.085813999176025, "global_step": 197578, "epoch": 4704} {"train_loss": -7.063968181610107, "global_step": 197579, "epoch": 4704} {"train_loss": -7.108483791351318, "global_step": 197580, "epoch": 4704} {"train_loss": -7.203957557678223, "global_step": 197581, "epoch": 4704} {"train_loss": -7.13897705078125, "global_step": 197582, "epoch": 4704} {"train_loss": -7.171277046203613, "global_step": 197583, "epoch": 4704} {"train_loss": -7.08613395690918, "global_step": 197584, "epoch": 4704} {"train_loss": -7.1133575439453125, "global_step": 197585, "epoch": 4704} {"train_loss": -7.356441497802734, "global_step": 197586, "epoch": 4704} {"train_loss": -7.195954322814941, "global_step": 197587, "epoch": 4704} {"train_loss": -7.181113243103027, "global_step": 197588, "epoch": 4704} {"train_loss": -7.105731010437012, "global_step": 197589, "epoch": 4704} {"train_loss": -7.025168418884277, "global_step": 197590, "epoch": 4704} {"train_loss": -7.22868013381958, "global_step": 197591, "epoch": 4704} {"train_loss": -7.139065742492676, "global_step": 197592, "epoch": 4704} {"train_loss": -7.224554061889648, "global_step": 197593, "epoch": 4704} {"train_loss": -7.3121185302734375, "global_step": 197594, "epoch": 4704} {"train_loss": -7.123324871063232, "global_step": 197595, "epoch": 4704} {"train_loss": -7.234150409698486, "global_step": 197596, "epoch": 4704} {"train_loss": -7.232044219970703, "global_step": 197597, "epoch": 4704} {"train_loss": -7.341042518615723, "global_step": 197598, "epoch": 4704} {"train_loss": -7.36189079284668, "global_step": 197599, "epoch": 4704} {"train_loss": -7.113729000091553, "global_step": 197600, "epoch": 4704} {"train_loss": -7.255216121673584, "global_step": 197601, "epoch": 4704} {"train_loss": -7.339362144470215, "global_step": 197602, "epoch": 4704} {"train_loss": -7.2911553382873535, "global_step": 197603, "epoch": 4704} {"train_loss": -7.272762298583984, "global_step": 197604, "epoch": 4704} {"train_loss": -7.143309593200684, "global_step": 197605, "epoch": 4704} {"train_loss": -7.103105545043945, "global_step": 197606, "epoch": 4704} {"train_loss": -7.247837066650391, "global_step": 197607, "epoch": 4704} {"train_loss": -7.211924076080322, "global_step": 197608, "epoch": 4704} {"train_loss": -7.197627147038777, "global_step": 197609, "epoch": 4704, "val_loss": 68970.7109375} {"train_loss": -7.27752685546875, "global_step": 197610, "epoch": 4705} {"train_loss": -7.214024543762207, "global_step": 197611, "epoch": 4705} {"train_loss": -7.330306529998779, "global_step": 197612, "epoch": 4705} {"train_loss": -7.370349884033203, "global_step": 197613, "epoch": 4705} {"train_loss": -7.2402167320251465, "global_step": 197614, "epoch": 4705} {"train_loss": -7.170379638671875, "global_step": 197615, "epoch": 4705} {"train_loss": -7.225978851318359, "global_step": 197616, "epoch": 4705} {"train_loss": -7.244378089904785, "global_step": 197617, "epoch": 4705} {"train_loss": -7.263077735900879, "global_step": 197618, "epoch": 4705} {"train_loss": -7.301732540130615, "global_step": 197619, "epoch": 4705} {"train_loss": -7.314894676208496, "global_step": 197620, "epoch": 4705} {"train_loss": -7.185056686401367, "global_step": 197621, "epoch": 4705} {"train_loss": -7.289122581481934, "global_step": 197622, "epoch": 4705} {"train_loss": -7.2450947761535645, "global_step": 197623, "epoch": 4705} {"train_loss": -7.186750411987305, "global_step": 197624, "epoch": 4705} {"train_loss": -7.1445441246032715, "global_step": 197625, "epoch": 4705} {"train_loss": -7.276044845581055, "global_step": 197626, "epoch": 4705} {"train_loss": -7.225277900695801, "global_step": 197627, "epoch": 4705} {"train_loss": -7.152468681335449, "global_step": 197628, "epoch": 4705} {"train_loss": -7.192226409912109, "global_step": 197629, "epoch": 4705} {"train_loss": -7.253282070159912, "global_step": 197630, "epoch": 4705} {"train_loss": -7.218659400939941, "global_step": 197631, "epoch": 4705} {"train_loss": -7.195549964904785, "global_step": 197632, "epoch": 4705} {"train_loss": -7.247613430023193, "global_step": 197633, "epoch": 4705} {"train_loss": -7.169597625732422, "global_step": 197634, "epoch": 4705} {"train_loss": -7.280940055847168, "global_step": 197635, "epoch": 4705} {"train_loss": -7.194039821624756, "global_step": 197636, "epoch": 4705} {"train_loss": -7.242326736450195, "global_step": 197637, "epoch": 4705} {"train_loss": -7.227624893188477, "global_step": 197638, "epoch": 4705} {"train_loss": -7.263879776000977, "global_step": 197639, "epoch": 4705} {"train_loss": -7.251594543457031, "global_step": 197640, "epoch": 4705} {"train_loss": -7.242724895477295, "global_step": 197641, "epoch": 4705} {"train_loss": -7.088599681854248, "global_step": 197642, "epoch": 4705} {"train_loss": -7.185490131378174, "global_step": 197643, "epoch": 4705} {"train_loss": -7.211040496826172, "global_step": 197644, "epoch": 4705} {"train_loss": -7.203617095947266, "global_step": 197645, "epoch": 4705} {"train_loss": -7.175380706787109, "global_step": 197646, "epoch": 4705} {"train_loss": -7.23080587387085, "global_step": 197647, "epoch": 4705} {"train_loss": -7.243410587310791, "global_step": 197648, "epoch": 4705} {"train_loss": -7.2609710693359375, "global_step": 197649, "epoch": 4705} {"train_loss": -7.230094909667969, "global_step": 197650, "epoch": 4705} {"train_loss": -7.228435289292109, "global_step": 197651, "epoch": 4705, "val_loss": 69070.59375} {"train_loss": -7.283407211303711, "global_step": 197652, "epoch": 4706} {"train_loss": -7.292488098144531, "global_step": 197653, "epoch": 4706} {"train_loss": -7.318121910095215, "global_step": 197654, "epoch": 4706} {"train_loss": -7.204568386077881, "global_step": 197655, "epoch": 4706} {"train_loss": -7.2281012535095215, "global_step": 197656, "epoch": 4706} {"train_loss": -7.262619972229004, "global_step": 197657, "epoch": 4706} {"train_loss": -7.161150932312012, "global_step": 197658, "epoch": 4706} {"train_loss": -7.0442304611206055, "global_step": 197659, "epoch": 4706} {"train_loss": -7.216519355773926, "global_step": 197660, "epoch": 4706} {"train_loss": -7.171433448791504, "global_step": 197661, "epoch": 4706} {"train_loss": -7.0881028175354, "global_step": 197662, "epoch": 4706} {"train_loss": -7.279547691345215, "global_step": 197663, "epoch": 4706} {"train_loss": -7.277766227722168, "global_step": 197664, "epoch": 4706} {"train_loss": -7.213659286499023, "global_step": 197665, "epoch": 4706} {"train_loss": -7.211101531982422, "global_step": 197666, "epoch": 4706} {"train_loss": -7.317216396331787, "global_step": 197667, "epoch": 4706} {"train_loss": -7.111891746520996, "global_step": 197668, "epoch": 4706} {"train_loss": -7.3030266761779785, "global_step": 197669, "epoch": 4706} {"train_loss": -7.100424289703369, "global_step": 197670, "epoch": 4706} {"train_loss": -7.2570695877075195, "global_step": 197671, "epoch": 4706} {"train_loss": -7.058067321777344, "global_step": 197672, "epoch": 4706} {"train_loss": -7.256022930145264, "global_step": 197673, "epoch": 4706} {"train_loss": -7.205411911010742, "global_step": 197674, "epoch": 4706} {"train_loss": -7.261955261230469, "global_step": 197675, "epoch": 4706} {"train_loss": -7.235724925994873, "global_step": 197676, "epoch": 4706} {"train_loss": -7.22116756439209, "global_step": 197677, "epoch": 4706} {"train_loss": -7.179863452911377, "global_step": 197678, "epoch": 4706} {"train_loss": -7.2276434898376465, "global_step": 197679, "epoch": 4706} {"train_loss": -7.250308513641357, "global_step": 197680, "epoch": 4706} {"train_loss": -7.2659010887146, "global_step": 197681, "epoch": 4706} {"train_loss": -7.252025127410889, "global_step": 197682, "epoch": 4706} {"train_loss": -7.191164970397949, "global_step": 197683, "epoch": 4706} {"train_loss": -7.147403240203857, "global_step": 197684, "epoch": 4706} {"train_loss": -7.152001857757568, "global_step": 197685, "epoch": 4706} {"train_loss": -7.25871467590332, "global_step": 197686, "epoch": 4706} {"train_loss": -7.1988725662231445, "global_step": 197687, "epoch": 4706} {"train_loss": -7.2628302574157715, "global_step": 197688, "epoch": 4706} {"train_loss": -7.306418418884277, "global_step": 197689, "epoch": 4706} {"train_loss": -7.253848075866699, "global_step": 197690, "epoch": 4706} {"train_loss": -7.1759467124938965, "global_step": 197691, "epoch": 4706} {"train_loss": -7.247434616088867, "global_step": 197692, "epoch": 4706} {"train_loss": -7.219450530551729, "global_step": 197693, "epoch": 4706, "val_loss": 68961.40625} {"train_loss": -7.253227710723877, "global_step": 197694, "epoch": 4707} {"train_loss": -7.309427738189697, "global_step": 197695, "epoch": 4707} {"train_loss": -7.3149542808532715, "global_step": 197696, "epoch": 4707} {"train_loss": -7.186281204223633, "global_step": 197697, "epoch": 4707} {"train_loss": -7.329684257507324, "global_step": 197698, "epoch": 4707} {"train_loss": -7.385847568511963, "global_step": 197699, "epoch": 4707} {"train_loss": -7.343137741088867, "global_step": 197700, "epoch": 4707} {"train_loss": -7.316187858581543, "global_step": 197701, "epoch": 4707} {"train_loss": -7.156641960144043, "global_step": 197702, "epoch": 4707} {"train_loss": -7.225368499755859, "global_step": 197703, "epoch": 4707} {"train_loss": -7.33692741394043, "global_step": 197704, "epoch": 4707} {"train_loss": -7.200258731842041, "global_step": 197705, "epoch": 4707} {"train_loss": -7.433327674865723, "global_step": 197706, "epoch": 4707} {"train_loss": -7.274152755737305, "global_step": 197707, "epoch": 4707} {"train_loss": -7.318085670471191, "global_step": 197708, "epoch": 4707} {"train_loss": -7.283299446105957, "global_step": 197709, "epoch": 4707} {"train_loss": -7.2888383865356445, "global_step": 197710, "epoch": 4707} {"train_loss": -7.274532318115234, "global_step": 197711, "epoch": 4707} {"train_loss": -7.279406547546387, "global_step": 197712, "epoch": 4707} {"train_loss": -7.158600807189941, "global_step": 197713, "epoch": 4707} {"train_loss": -7.189051628112793, "global_step": 197714, "epoch": 4707} {"train_loss": -7.260275840759277, "global_step": 197715, "epoch": 4707} {"train_loss": -7.303736209869385, "global_step": 197716, "epoch": 4707} {"train_loss": -7.139378070831299, "global_step": 197717, "epoch": 4707} {"train_loss": -7.174853324890137, "global_step": 197718, "epoch": 4707} {"train_loss": -7.230415344238281, "global_step": 197719, "epoch": 4707} {"train_loss": -7.275925636291504, "global_step": 197720, "epoch": 4707} {"train_loss": -7.271515369415283, "global_step": 197721, "epoch": 4707} {"train_loss": -7.228849411010742, "global_step": 197722, "epoch": 4707} {"train_loss": -7.102036952972412, "global_step": 197723, "epoch": 4707} {"train_loss": -7.31964635848999, "global_step": 197724, "epoch": 4707} {"train_loss": -7.167000770568848, "global_step": 197725, "epoch": 4707} {"train_loss": -7.272542953491211, "global_step": 197726, "epoch": 4707} {"train_loss": -7.239307403564453, "global_step": 197727, "epoch": 4707} {"train_loss": -7.227602958679199, "global_step": 197728, "epoch": 4707} {"train_loss": -7.205451488494873, "global_step": 197729, "epoch": 4707} {"train_loss": -7.1578369140625, "global_step": 197730, "epoch": 4707} {"train_loss": -7.237565040588379, "global_step": 197731, "epoch": 4707} {"train_loss": -7.079439163208008, "global_step": 197732, "epoch": 4707} {"train_loss": -7.114895343780518, "global_step": 197733, "epoch": 4707} {"train_loss": -7.191745758056641, "global_step": 197734, "epoch": 4707} {"train_loss": -7.238866317839849, "global_step": 197735, "epoch": 4707, "val_loss": 68974.6640625} {"train_loss": -7.257318496704102, "global_step": 197736, "epoch": 4708} {"train_loss": -7.194580554962158, "global_step": 197737, "epoch": 4708} {"train_loss": -7.079686641693115, "global_step": 197738, "epoch": 4708} {"train_loss": -7.221227169036865, "global_step": 197739, "epoch": 4708} {"train_loss": -7.064662933349609, "global_step": 197740, "epoch": 4708} {"train_loss": -6.888537406921387, "global_step": 197741, "epoch": 4708} {"train_loss": -7.051082611083984, "global_step": 197742, "epoch": 4708} {"train_loss": -6.93144416809082, "global_step": 197743, "epoch": 4708} {"train_loss": -7.0438055992126465, "global_step": 197744, "epoch": 4708} {"train_loss": -7.094978332519531, "global_step": 197745, "epoch": 4708} {"train_loss": -7.112576484680176, "global_step": 197746, "epoch": 4708} {"train_loss": -7.187278747558594, "global_step": 197747, "epoch": 4708} {"train_loss": -7.178118705749512, "global_step": 197748, "epoch": 4708} {"train_loss": -7.267701148986816, "global_step": 197749, "epoch": 4708} {"train_loss": -7.139767646789551, "global_step": 197750, "epoch": 4708} {"train_loss": -7.116137504577637, "global_step": 197751, "epoch": 4708} {"train_loss": -7.239614486694336, "global_step": 197752, "epoch": 4708} {"train_loss": -7.143105506896973, "global_step": 197753, "epoch": 4708} {"train_loss": -7.2388153076171875, "global_step": 197754, "epoch": 4708} {"train_loss": -7.202048301696777, "global_step": 197755, "epoch": 4708} {"train_loss": -7.204110622406006, "global_step": 197756, "epoch": 4708} {"train_loss": -7.214077472686768, "global_step": 197757, "epoch": 4708} {"train_loss": -7.096238136291504, "global_step": 197758, "epoch": 4708} {"train_loss": -7.233502388000488, "global_step": 197759, "epoch": 4708} {"train_loss": -7.255309581756592, "global_step": 197760, "epoch": 4708} {"train_loss": -7.22393798828125, "global_step": 197761, "epoch": 4708} {"train_loss": -7.231967926025391, "global_step": 197762, "epoch": 4708} {"train_loss": -7.227005958557129, "global_step": 197763, "epoch": 4708} {"train_loss": -7.232425212860107, "global_step": 197764, "epoch": 4708} {"train_loss": -7.24176025390625, "global_step": 197765, "epoch": 4708} {"train_loss": -7.355648994445801, "global_step": 197766, "epoch": 4708} {"train_loss": -7.260044097900391, "global_step": 197767, "epoch": 4708} {"train_loss": -7.20400333404541, "global_step": 197768, "epoch": 4708} {"train_loss": -7.273143768310547, "global_step": 197769, "epoch": 4708} {"train_loss": -7.23796272277832, "global_step": 197770, "epoch": 4708} {"train_loss": -7.270744323730469, "global_step": 197771, "epoch": 4708} {"train_loss": -7.240708351135254, "global_step": 197772, "epoch": 4708} {"train_loss": -7.257437705993652, "global_step": 197773, "epoch": 4708} {"train_loss": -7.200499057769775, "global_step": 197774, "epoch": 4708} {"train_loss": -7.241824150085449, "global_step": 197775, "epoch": 4708} {"train_loss": -7.1371002197265625, "global_step": 197776, "epoch": 4708} {"train_loss": -7.181403932117281, "global_step": 197777, "epoch": 4708, "val_loss": 69039.46875} {"train_loss": -7.18480110168457, "global_step": 197778, "epoch": 4709} {"train_loss": -7.167243480682373, "global_step": 197779, "epoch": 4709} {"train_loss": -7.10032844543457, "global_step": 197780, "epoch": 4709} {"train_loss": -7.170975685119629, "global_step": 197781, "epoch": 4709} {"train_loss": -7.197002410888672, "global_step": 197782, "epoch": 4709} {"train_loss": -7.206027030944824, "global_step": 197783, "epoch": 4709} {"train_loss": -7.180091857910156, "global_step": 197784, "epoch": 4709} {"train_loss": -7.143880367279053, "global_step": 197785, "epoch": 4709} {"train_loss": -7.118150234222412, "global_step": 197786, "epoch": 4709} {"train_loss": -7.159364223480225, "global_step": 197787, "epoch": 4709} {"train_loss": -7.17845344543457, "global_step": 197788, "epoch": 4709} {"train_loss": -6.9870991706848145, "global_step": 197789, "epoch": 4709} {"train_loss": -7.1551971435546875, "global_step": 197790, "epoch": 4709} {"train_loss": -7.160788059234619, "global_step": 197791, "epoch": 4709} {"train_loss": -7.233466148376465, "global_step": 197792, "epoch": 4709} {"train_loss": -7.095099449157715, "global_step": 197793, "epoch": 4709} {"train_loss": -7.22052001953125, "global_step": 197794, "epoch": 4709} {"train_loss": -7.250065803527832, "global_step": 197795, "epoch": 4709} {"train_loss": -7.193422317504883, "global_step": 197796, "epoch": 4709} {"train_loss": -7.184739112854004, "global_step": 197797, "epoch": 4709} {"train_loss": -7.049623489379883, "global_step": 197798, "epoch": 4709} {"train_loss": -7.247627258300781, "global_step": 197799, "epoch": 4709} {"train_loss": -7.288936614990234, "global_step": 197800, "epoch": 4709} {"train_loss": -7.12392520904541, "global_step": 197801, "epoch": 4709} {"train_loss": -7.232902526855469, "global_step": 197802, "epoch": 4709} {"train_loss": -7.136050224304199, "global_step": 197803, "epoch": 4709} {"train_loss": -7.128865718841553, "global_step": 197804, "epoch": 4709} {"train_loss": -6.945659637451172, "global_step": 197805, "epoch": 4709} {"train_loss": -6.878057479858398, "global_step": 197806, "epoch": 4709} {"train_loss": -7.2775421142578125, "global_step": 197807, "epoch": 4709} {"train_loss": -6.973071575164795, "global_step": 197808, "epoch": 4709} {"train_loss": -7.0669965744018555, "global_step": 197809, "epoch": 4709} {"train_loss": -6.951105117797852, "global_step": 197810, "epoch": 4709} {"train_loss": -7.012510299682617, "global_step": 197811, "epoch": 4709} {"train_loss": -7.233275413513184, "global_step": 197812, "epoch": 4709} {"train_loss": -7.211913585662842, "global_step": 197813, "epoch": 4709} {"train_loss": -7.1966047286987305, "global_step": 197814, "epoch": 4709} {"train_loss": -7.122860908508301, "global_step": 197815, "epoch": 4709} {"train_loss": -7.178923606872559, "global_step": 197816, "epoch": 4709} {"train_loss": -7.088900089263916, "global_step": 197817, "epoch": 4709} {"train_loss": -7.330544471740723, "global_step": 197818, "epoch": 4709} {"train_loss": -7.144367865153721, "global_step": 197819, "epoch": 4709, "val_loss": 68929.890625} {"train_loss": -7.216550827026367, "global_step": 197820, "epoch": 4710} {"train_loss": -7.198644638061523, "global_step": 197821, "epoch": 4710} {"train_loss": -7.136226654052734, "global_step": 197822, "epoch": 4710} {"train_loss": -7.2628889083862305, "global_step": 197823, "epoch": 4710} {"train_loss": -7.250200271606445, "global_step": 197824, "epoch": 4710} {"train_loss": -7.147366523742676, "global_step": 197825, "epoch": 4710} {"train_loss": -7.174556732177734, "global_step": 197826, "epoch": 4710} {"train_loss": -7.073195934295654, "global_step": 197827, "epoch": 4710} {"train_loss": -7.287315845489502, "global_step": 197828, "epoch": 4710} {"train_loss": -7.184129238128662, "global_step": 197829, "epoch": 4710} {"train_loss": -7.183169364929199, "global_step": 197830, "epoch": 4710} {"train_loss": -7.157726287841797, "global_step": 197831, "epoch": 4710} {"train_loss": -7.279644966125488, "global_step": 197832, "epoch": 4710} {"train_loss": -7.268190383911133, "global_step": 197833, "epoch": 4710} {"train_loss": -7.273767471313477, "global_step": 197834, "epoch": 4710} {"train_loss": -7.180808067321777, "global_step": 197835, "epoch": 4710} {"train_loss": -7.081386566162109, "global_step": 197836, "epoch": 4710} {"train_loss": -7.195247173309326, "global_step": 197837, "epoch": 4710} {"train_loss": -7.146768569946289, "global_step": 197838, "epoch": 4710} {"train_loss": -7.201921463012695, "global_step": 197839, "epoch": 4710} {"train_loss": -7.221936225891113, "global_step": 197840, "epoch": 4710} {"train_loss": -7.205721378326416, "global_step": 197841, "epoch": 4710} {"train_loss": -7.247443199157715, "global_step": 197842, "epoch": 4710} {"train_loss": -7.023361682891846, "global_step": 197843, "epoch": 4710} {"train_loss": -7.17666482925415, "global_step": 197844, "epoch": 4710} {"train_loss": -7.225854396820068, "global_step": 197845, "epoch": 4710} {"train_loss": -7.197482585906982, "global_step": 197846, "epoch": 4710} {"train_loss": -7.14890718460083, "global_step": 197847, "epoch": 4710} {"train_loss": -7.076557159423828, "global_step": 197848, "epoch": 4710} {"train_loss": -7.121882438659668, "global_step": 197849, "epoch": 4710} {"train_loss": -7.182856559753418, "global_step": 197850, "epoch": 4710} {"train_loss": -7.0565505027771, "global_step": 197851, "epoch": 4710} {"train_loss": -7.09007453918457, "global_step": 197852, "epoch": 4710} {"train_loss": -7.0461506843566895, "global_step": 197853, "epoch": 4710} {"train_loss": -7.0555419921875, "global_step": 197854, "epoch": 4710} {"train_loss": -7.17622709274292, "global_step": 197855, "epoch": 4710} {"train_loss": -6.942560195922852, "global_step": 197856, "epoch": 4710} {"train_loss": -7.144161224365234, "global_step": 197857, "epoch": 4710} {"train_loss": -7.1258721351623535, "global_step": 197858, "epoch": 4710} {"train_loss": -7.1262617111206055, "global_step": 197859, "epoch": 4710} {"train_loss": -6.999195575714111, "global_step": 197860, "epoch": 4710} {"train_loss": -7.156205744970412, "global_step": 197861, "epoch": 4710, "val_loss": 69216.0390625} {"train_loss": -7.161027431488037, "global_step": 197862, "epoch": 4711} {"train_loss": -7.217709541320801, "global_step": 197863, "epoch": 4711} {"train_loss": -7.208804130554199, "global_step": 197864, "epoch": 4711} {"train_loss": -7.075135231018066, "global_step": 197865, "epoch": 4711} {"train_loss": -7.096624851226807, "global_step": 197866, "epoch": 4711} {"train_loss": -7.051906108856201, "global_step": 197867, "epoch": 4711} {"train_loss": -7.1918206214904785, "global_step": 197868, "epoch": 4711} {"train_loss": -7.156086444854736, "global_step": 197869, "epoch": 4711} {"train_loss": -7.146831512451172, "global_step": 197870, "epoch": 4711} {"train_loss": -7.295771598815918, "global_step": 197871, "epoch": 4711} {"train_loss": -7.262936592102051, "global_step": 197872, "epoch": 4711} {"train_loss": -7.121978759765625, "global_step": 197873, "epoch": 4711} {"train_loss": -7.277682781219482, "global_step": 197874, "epoch": 4711} {"train_loss": -7.130245685577393, "global_step": 197875, "epoch": 4711} {"train_loss": -7.148467063903809, "global_step": 197876, "epoch": 4711} {"train_loss": -7.1907734870910645, "global_step": 197877, "epoch": 4711} {"train_loss": -7.151706695556641, "global_step": 197878, "epoch": 4711} {"train_loss": -7.231049537658691, "global_step": 197879, "epoch": 4711} {"train_loss": -7.129244804382324, "global_step": 197880, "epoch": 4711} {"train_loss": -7.253634452819824, "global_step": 197881, "epoch": 4711} {"train_loss": -7.209916591644287, "global_step": 197882, "epoch": 4711} {"train_loss": -7.1925201416015625, "global_step": 197883, "epoch": 4711} {"train_loss": -7.130417823791504, "global_step": 197884, "epoch": 4711} {"train_loss": -7.17874813079834, "global_step": 197885, "epoch": 4711} {"train_loss": -7.193820953369141, "global_step": 197886, "epoch": 4711} {"train_loss": -7.242049694061279, "global_step": 197887, "epoch": 4711} {"train_loss": -7.282618045806885, "global_step": 197888, "epoch": 4711} {"train_loss": -7.008182525634766, "global_step": 197889, "epoch": 4711} {"train_loss": -7.225815773010254, "global_step": 197890, "epoch": 4711} {"train_loss": -7.267913818359375, "global_step": 197891, "epoch": 4711} {"train_loss": -7.10606575012207, "global_step": 197892, "epoch": 4711} {"train_loss": -7.130832672119141, "global_step": 197893, "epoch": 4711} {"train_loss": -7.151596546173096, "global_step": 197894, "epoch": 4711} {"train_loss": -7.157471656799316, "global_step": 197895, "epoch": 4711} {"train_loss": -7.1516571044921875, "global_step": 197896, "epoch": 4711} {"train_loss": -7.185391426086426, "global_step": 197897, "epoch": 4711} {"train_loss": -7.254405975341797, "global_step": 197898, "epoch": 4711} {"train_loss": -7.172250747680664, "global_step": 197899, "epoch": 4711} {"train_loss": -7.182992935180664, "global_step": 197900, "epoch": 4711} {"train_loss": -7.207799911499023, "global_step": 197901, "epoch": 4711} {"train_loss": -7.1888861656188965, "global_step": 197902, "epoch": 4711} {"train_loss": -7.173669145220802, "global_step": 197903, "epoch": 4711, "val_loss": 69021.46875} {"train_loss": -7.177698135375977, "global_step": 197904, "epoch": 4712} {"train_loss": -7.1871337890625, "global_step": 197905, "epoch": 4712} {"train_loss": -7.177432060241699, "global_step": 197906, "epoch": 4712} {"train_loss": -7.148431777954102, "global_step": 197907, "epoch": 4712} {"train_loss": -7.148642063140869, "global_step": 197908, "epoch": 4712} {"train_loss": -7.21480131149292, "global_step": 197909, "epoch": 4712} {"train_loss": -7.087697982788086, "global_step": 197910, "epoch": 4712} {"train_loss": -7.2550835609436035, "global_step": 197911, "epoch": 4712} {"train_loss": -7.221402168273926, "global_step": 197912, "epoch": 4712} {"train_loss": -7.0671186447143555, "global_step": 197913, "epoch": 4712} {"train_loss": -7.121316432952881, "global_step": 197914, "epoch": 4712} {"train_loss": -7.204502105712891, "global_step": 197915, "epoch": 4712} {"train_loss": -7.110903739929199, "global_step": 197916, "epoch": 4712} {"train_loss": -7.170981407165527, "global_step": 197917, "epoch": 4712} {"train_loss": -7.1721086502075195, "global_step": 197918, "epoch": 4712} {"train_loss": -7.1961164474487305, "global_step": 197919, "epoch": 4712} {"train_loss": -7.131025314331055, "global_step": 197920, "epoch": 4712} {"train_loss": -7.030955791473389, "global_step": 197921, "epoch": 4712} {"train_loss": -7.201485633850098, "global_step": 197922, "epoch": 4712} {"train_loss": -7.220909118652344, "global_step": 197923, "epoch": 4712} {"train_loss": -7.075981140136719, "global_step": 197924, "epoch": 4712} {"train_loss": -7.145581245422363, "global_step": 197925, "epoch": 4712} {"train_loss": -7.152128219604492, "global_step": 197926, "epoch": 4712} {"train_loss": -7.169425010681152, "global_step": 197927, "epoch": 4712} {"train_loss": -7.176590919494629, "global_step": 197928, "epoch": 4712} {"train_loss": -7.083425521850586, "global_step": 197929, "epoch": 4712} {"train_loss": -7.285190105438232, "global_step": 197930, "epoch": 4712} {"train_loss": -7.211634635925293, "global_step": 197931, "epoch": 4712} {"train_loss": -7.230472564697266, "global_step": 197932, "epoch": 4712} {"train_loss": -7.3456711769104, "global_step": 197933, "epoch": 4712} {"train_loss": -7.224829196929932, "global_step": 197934, "epoch": 4712} {"train_loss": -7.262816429138184, "global_step": 197935, "epoch": 4712} {"train_loss": -7.30023717880249, "global_step": 197936, "epoch": 4712} {"train_loss": -7.3098297119140625, "global_step": 197937, "epoch": 4712} {"train_loss": -7.255083084106445, "global_step": 197938, "epoch": 4712} {"train_loss": -7.277730464935303, "global_step": 197939, "epoch": 4712} {"train_loss": -7.251910209655762, "global_step": 197940, "epoch": 4712} {"train_loss": -7.176386833190918, "global_step": 197941, "epoch": 4712} {"train_loss": -7.239506721496582, "global_step": 197942, "epoch": 4712} {"train_loss": -7.171999931335449, "global_step": 197943, "epoch": 4712} {"train_loss": -7.301973342895508, "global_step": 197944, "epoch": 4712} {"train_loss": -7.191745224453154, "global_step": 197945, "epoch": 4712, "val_loss": 69035.015625} {"train_loss": -7.273308277130127, "global_step": 197946, "epoch": 4713} {"train_loss": -7.278800964355469, "global_step": 197947, "epoch": 4713} {"train_loss": -7.236446380615234, "global_step": 197948, "epoch": 4713} {"train_loss": -7.17818546295166, "global_step": 197949, "epoch": 4713} {"train_loss": -7.318849563598633, "global_step": 197950, "epoch": 4713} {"train_loss": -7.282204627990723, "global_step": 197951, "epoch": 4713} {"train_loss": -7.296236038208008, "global_step": 197952, "epoch": 4713} {"train_loss": -7.274389266967773, "global_step": 197953, "epoch": 4713} {"train_loss": -7.309187889099121, "global_step": 197954, "epoch": 4713} {"train_loss": -7.339784622192383, "global_step": 197955, "epoch": 4713} {"train_loss": -7.170645236968994, "global_step": 197956, "epoch": 4713} {"train_loss": -7.238994598388672, "global_step": 197957, "epoch": 4713} {"train_loss": -7.251564025878906, "global_step": 197958, "epoch": 4713} {"train_loss": -7.284485816955566, "global_step": 197959, "epoch": 4713} {"train_loss": -7.3061370849609375, "global_step": 197960, "epoch": 4713} {"train_loss": -7.200875282287598, "global_step": 197961, "epoch": 4713} {"train_loss": -7.230323791503906, "global_step": 197962, "epoch": 4713} {"train_loss": -7.270559787750244, "global_step": 197963, "epoch": 4713} {"train_loss": -7.297697067260742, "global_step": 197964, "epoch": 4713} {"train_loss": -7.333972930908203, "global_step": 197965, "epoch": 4713} {"train_loss": -7.226788520812988, "global_step": 197966, "epoch": 4713} {"train_loss": -7.200743198394775, "global_step": 197967, "epoch": 4713} {"train_loss": -7.235944747924805, "global_step": 197968, "epoch": 4713} {"train_loss": -7.198753833770752, "global_step": 197969, "epoch": 4713} {"train_loss": -7.232967376708984, "global_step": 197970, "epoch": 4713} {"train_loss": -7.139620780944824, "global_step": 197971, "epoch": 4713} {"train_loss": -7.1578264236450195, "global_step": 197972, "epoch": 4713} {"train_loss": -7.288138389587402, "global_step": 197973, "epoch": 4713} {"train_loss": -6.992483615875244, "global_step": 197974, "epoch": 4713} {"train_loss": -7.281840801239014, "global_step": 197975, "epoch": 4713} {"train_loss": -7.178938865661621, "global_step": 197976, "epoch": 4713} {"train_loss": -7.200657844543457, "global_step": 197977, "epoch": 4713} {"train_loss": -7.200422286987305, "global_step": 197978, "epoch": 4713} {"train_loss": -7.234142303466797, "global_step": 197979, "epoch": 4713} {"train_loss": -7.163112640380859, "global_step": 197980, "epoch": 4713} {"train_loss": -7.206529140472412, "global_step": 197981, "epoch": 4713} {"train_loss": -7.177684783935547, "global_step": 197982, "epoch": 4713} {"train_loss": -7.262286186218262, "global_step": 197983, "epoch": 4713} {"train_loss": -7.298874855041504, "global_step": 197984, "epoch": 4713} {"train_loss": -7.251964569091797, "global_step": 197985, "epoch": 4713} {"train_loss": -7.288435459136963, "global_step": 197986, "epoch": 4713} {"train_loss": -7.239619981674921, "global_step": 197987, "epoch": 4713, "val_loss": 68916.1953125} {"train_loss": -7.240549087524414, "global_step": 197988, "epoch": 4714} {"train_loss": -7.249191761016846, "global_step": 197989, "epoch": 4714} {"train_loss": -7.293407440185547, "global_step": 197990, "epoch": 4714} {"train_loss": -7.193808555603027, "global_step": 197991, "epoch": 4714} {"train_loss": -7.193206787109375, "global_step": 197992, "epoch": 4714} {"train_loss": -7.264185428619385, "global_step": 197993, "epoch": 4714} {"train_loss": -7.1339826583862305, "global_step": 197994, "epoch": 4714} {"train_loss": -6.9237260818481445, "global_step": 197995, "epoch": 4714} {"train_loss": -7.057435035705566, "global_step": 197996, "epoch": 4714} {"train_loss": -7.202147483825684, "global_step": 197997, "epoch": 4714} {"train_loss": -7.016160488128662, "global_step": 197998, "epoch": 4714} {"train_loss": -6.9942193031311035, "global_step": 197999, "epoch": 4714} {"train_loss": -7.2418975830078125, "global_step": 198000, "epoch": 4714} {"train_loss": -7.05790376663208, "global_step": 198001, "epoch": 4714} {"train_loss": -7.063936233520508, "global_step": 198002, "epoch": 4714} {"train_loss": -7.138261795043945, "global_step": 198003, "epoch": 4714} {"train_loss": -7.12811279296875, "global_step": 198004, "epoch": 4714} {"train_loss": -7.241260528564453, "global_step": 198005, "epoch": 4714} {"train_loss": -7.15322208404541, "global_step": 198006, "epoch": 4714} {"train_loss": -7.16370964050293, "global_step": 198007, "epoch": 4714} {"train_loss": -7.168183326721191, "global_step": 198008, "epoch": 4714} {"train_loss": -7.226290225982666, "global_step": 198009, "epoch": 4714} {"train_loss": -7.238332748413086, "global_step": 198010, "epoch": 4714} {"train_loss": -7.157486915588379, "global_step": 198011, "epoch": 4714} {"train_loss": -7.1476945877075195, "global_step": 198012, "epoch": 4714} {"train_loss": -7.131953716278076, "global_step": 198013, "epoch": 4714} {"train_loss": -7.1820149421691895, "global_step": 198014, "epoch": 4714} {"train_loss": -7.287158012390137, "global_step": 198015, "epoch": 4714} {"train_loss": -7.1883344650268555, "global_step": 198016, "epoch": 4714} {"train_loss": -7.161166191101074, "global_step": 198017, "epoch": 4714} {"train_loss": -7.213296890258789, "global_step": 198018, "epoch": 4714} {"train_loss": -7.272881984710693, "global_step": 198019, "epoch": 4714} {"train_loss": -7.143354415893555, "global_step": 198020, "epoch": 4714} {"train_loss": -7.015734672546387, "global_step": 198021, "epoch": 4714} {"train_loss": -7.265190124511719, "global_step": 198022, "epoch": 4714} {"train_loss": -7.270690441131592, "global_step": 198023, "epoch": 4714} {"train_loss": -7.2445526123046875, "global_step": 198024, "epoch": 4714} {"train_loss": -7.189715385437012, "global_step": 198025, "epoch": 4714} {"train_loss": -7.196285247802734, "global_step": 198026, "epoch": 4714} {"train_loss": -7.231705188751221, "global_step": 198027, "epoch": 4714} {"train_loss": -7.263596534729004, "global_step": 198028, "epoch": 4714} {"train_loss": -7.174107086090815, "global_step": 198029, "epoch": 4714, "val_loss": 68970.671875} {"train_loss": -7.252098083496094, "global_step": 198030, "epoch": 4715} {"train_loss": -7.155733108520508, "global_step": 198031, "epoch": 4715} {"train_loss": -7.172798156738281, "global_step": 198032, "epoch": 4715} {"train_loss": -7.206761360168457, "global_step": 198033, "epoch": 4715} {"train_loss": -7.205100059509277, "global_step": 198034, "epoch": 4715} {"train_loss": -7.283655166625977, "global_step": 198035, "epoch": 4715} {"train_loss": -7.119466781616211, "global_step": 198036, "epoch": 4715} {"train_loss": -7.230915069580078, "global_step": 198037, "epoch": 4715} {"train_loss": -7.254420280456543, "global_step": 198038, "epoch": 4715} {"train_loss": -7.255087375640869, "global_step": 198039, "epoch": 4715} {"train_loss": -7.212411880493164, "global_step": 198040, "epoch": 4715} {"train_loss": -7.169875144958496, "global_step": 198041, "epoch": 4715} {"train_loss": -7.238239288330078, "global_step": 198042, "epoch": 4715} {"train_loss": -7.182216644287109, "global_step": 198043, "epoch": 4715} {"train_loss": -7.136024475097656, "global_step": 198044, "epoch": 4715} {"train_loss": -7.222228527069092, "global_step": 198045, "epoch": 4715} {"train_loss": -7.266679286956787, "global_step": 198046, "epoch": 4715} {"train_loss": -7.167633056640625, "global_step": 198047, "epoch": 4715} {"train_loss": -7.146421909332275, "global_step": 198048, "epoch": 4715} {"train_loss": -7.2432379722595215, "global_step": 198049, "epoch": 4715} {"train_loss": -7.180054664611816, "global_step": 198050, "epoch": 4715} {"train_loss": -7.230877876281738, "global_step": 198051, "epoch": 4715} {"train_loss": -7.2773590087890625, "global_step": 198052, "epoch": 4715} {"train_loss": -7.073895454406738, "global_step": 198053, "epoch": 4715} {"train_loss": -7.26070499420166, "global_step": 198054, "epoch": 4715} {"train_loss": -7.175021171569824, "global_step": 198055, "epoch": 4715} {"train_loss": -7.243618011474609, "global_step": 198056, "epoch": 4715} {"train_loss": -7.232419013977051, "global_step": 198057, "epoch": 4715} {"train_loss": -7.141829490661621, "global_step": 198058, "epoch": 4715} {"train_loss": -7.256669998168945, "global_step": 198059, "epoch": 4715} {"train_loss": -7.1785383224487305, "global_step": 198060, "epoch": 4715} {"train_loss": -7.093719959259033, "global_step": 198061, "epoch": 4715} {"train_loss": -7.1583380699157715, "global_step": 198062, "epoch": 4715} {"train_loss": -7.154048919677734, "global_step": 198063, "epoch": 4715} {"train_loss": -7.170931816101074, "global_step": 198064, "epoch": 4715} {"train_loss": -7.090666770935059, "global_step": 198065, "epoch": 4715} {"train_loss": -7.066901683807373, "global_step": 198066, "epoch": 4715} {"train_loss": -7.140135765075684, "global_step": 198067, "epoch": 4715} {"train_loss": -7.234119415283203, "global_step": 198068, "epoch": 4715} {"train_loss": -7.208251476287842, "global_step": 198069, "epoch": 4715} {"train_loss": -7.2106781005859375, "global_step": 198070, "epoch": 4715} {"train_loss": -7.19423186211359, "global_step": 198071, "epoch": 4715, "val_loss": 69093.0078125} {"train_loss": -7.17445182800293, "global_step": 198072, "epoch": 4716} {"train_loss": -7.100674629211426, "global_step": 198073, "epoch": 4716} {"train_loss": -7.173558235168457, "global_step": 198074, "epoch": 4716} {"train_loss": -7.261443138122559, "global_step": 198075, "epoch": 4716} {"train_loss": -7.158935546875, "global_step": 198076, "epoch": 4716} {"train_loss": -7.210377216339111, "global_step": 198077, "epoch": 4716} {"train_loss": -7.1494340896606445, "global_step": 198078, "epoch": 4716} {"train_loss": -7.1774091720581055, "global_step": 198079, "epoch": 4716} {"train_loss": -7.094743251800537, "global_step": 198080, "epoch": 4716} {"train_loss": -7.080437660217285, "global_step": 198081, "epoch": 4716} {"train_loss": -7.152081489562988, "global_step": 198082, "epoch": 4716} {"train_loss": -7.153470039367676, "global_step": 198083, "epoch": 4716} {"train_loss": -7.323677062988281, "global_step": 198084, "epoch": 4716} {"train_loss": -7.169943809509277, "global_step": 198085, "epoch": 4716} {"train_loss": -7.239392280578613, "global_step": 198086, "epoch": 4716} {"train_loss": -7.257912635803223, "global_step": 198087, "epoch": 4716} {"train_loss": -7.23771858215332, "global_step": 198088, "epoch": 4716} {"train_loss": -7.222890853881836, "global_step": 198089, "epoch": 4716} {"train_loss": -7.274230480194092, "global_step": 198090, "epoch": 4716} {"train_loss": -7.276171684265137, "global_step": 198091, "epoch": 4716} {"train_loss": -7.262333869934082, "global_step": 198092, "epoch": 4716} {"train_loss": -7.073328018188477, "global_step": 198093, "epoch": 4716} {"train_loss": -7.22880744934082, "global_step": 198094, "epoch": 4716} {"train_loss": -7.339244365692139, "global_step": 198095, "epoch": 4716} {"train_loss": -7.092869758605957, "global_step": 198096, "epoch": 4716} {"train_loss": -7.214435577392578, "global_step": 198097, "epoch": 4716} {"train_loss": -7.1727423667907715, "global_step": 198098, "epoch": 4716} {"train_loss": -7.24900484085083, "global_step": 198099, "epoch": 4716} {"train_loss": -7.131192207336426, "global_step": 198100, "epoch": 4716} {"train_loss": -7.198327541351318, "global_step": 198101, "epoch": 4716} {"train_loss": -7.147137641906738, "global_step": 198102, "epoch": 4716} {"train_loss": -6.972602844238281, "global_step": 198103, "epoch": 4716} {"train_loss": -7.224277019500732, "global_step": 198104, "epoch": 4716} {"train_loss": -7.166731834411621, "global_step": 198105, "epoch": 4716} {"train_loss": -7.197005271911621, "global_step": 198106, "epoch": 4716} {"train_loss": -7.201822757720947, "global_step": 198107, "epoch": 4716} {"train_loss": -7.205139636993408, "global_step": 198108, "epoch": 4716} {"train_loss": -7.2206830978393555, "global_step": 198109, "epoch": 4716} {"train_loss": -7.130039215087891, "global_step": 198110, "epoch": 4716} {"train_loss": -7.214998245239258, "global_step": 198111, "epoch": 4716} {"train_loss": -7.179657936096191, "global_step": 198112, "epoch": 4716} {"train_loss": -7.186315899803525, "global_step": 198113, "epoch": 4716, "val_loss": 68782.1015625} {"train_loss": -7.282660961151123, "global_step": 198114, "epoch": 4717} {"train_loss": -7.135084629058838, "global_step": 198115, "epoch": 4717} {"train_loss": -7.1597466468811035, "global_step": 198116, "epoch": 4717} {"train_loss": -7.1454854011535645, "global_step": 198117, "epoch": 4717} {"train_loss": -7.163354873657227, "global_step": 198118, "epoch": 4717} {"train_loss": -7.184221267700195, "global_step": 198119, "epoch": 4717} {"train_loss": -7.208619117736816, "global_step": 198120, "epoch": 4717} {"train_loss": -7.103535175323486, "global_step": 198121, "epoch": 4717} {"train_loss": -7.280271530151367, "global_step": 198122, "epoch": 4717} {"train_loss": -7.2814459800720215, "global_step": 198123, "epoch": 4717} {"train_loss": -7.2577972412109375, "global_step": 198124, "epoch": 4717} {"train_loss": -7.223752021789551, "global_step": 198125, "epoch": 4717} {"train_loss": -7.277059555053711, "global_step": 198126, "epoch": 4717} {"train_loss": -7.351842403411865, "global_step": 198127, "epoch": 4717} {"train_loss": -7.254071235656738, "global_step": 198128, "epoch": 4717} {"train_loss": -7.185114860534668, "global_step": 198129, "epoch": 4717} {"train_loss": -7.233636856079102, "global_step": 198130, "epoch": 4717} {"train_loss": -7.192726135253906, "global_step": 198131, "epoch": 4717} {"train_loss": -7.248552322387695, "global_step": 198132, "epoch": 4717} {"train_loss": -7.15719747543335, "global_step": 198133, "epoch": 4717} {"train_loss": -7.237662315368652, "global_step": 198134, "epoch": 4717} {"train_loss": -7.221908092498779, "global_step": 198135, "epoch": 4717} {"train_loss": -7.152093410491943, "global_step": 198136, "epoch": 4717} {"train_loss": -7.163482666015625, "global_step": 198137, "epoch": 4717} {"train_loss": -7.184639930725098, "global_step": 198138, "epoch": 4717} {"train_loss": -7.214496612548828, "global_step": 198139, "epoch": 4717} {"train_loss": -7.198443412780762, "global_step": 198140, "epoch": 4717} {"train_loss": -7.208207607269287, "global_step": 198141, "epoch": 4717} {"train_loss": -7.266739368438721, "global_step": 198142, "epoch": 4717} {"train_loss": -7.262139320373535, "global_step": 198143, "epoch": 4717} {"train_loss": -7.282693862915039, "global_step": 198144, "epoch": 4717} {"train_loss": -7.169198513031006, "global_step": 198145, "epoch": 4717} {"train_loss": -7.372391700744629, "global_step": 198146, "epoch": 4717} {"train_loss": -7.27488899230957, "global_step": 198147, "epoch": 4717} {"train_loss": -7.157209873199463, "global_step": 198148, "epoch": 4717} {"train_loss": -7.158778190612793, "global_step": 198149, "epoch": 4717} {"train_loss": -7.319014549255371, "global_step": 198150, "epoch": 4717} {"train_loss": -7.173174858093262, "global_step": 198151, "epoch": 4717} {"train_loss": -7.189298629760742, "global_step": 198152, "epoch": 4717} {"train_loss": -7.191562652587891, "global_step": 198153, "epoch": 4717} {"train_loss": -7.215216636657715, "global_step": 198154, "epoch": 4717} {"train_loss": -7.216165054412115, "global_step": 198155, "epoch": 4717, "val_loss": 69023.4375} {"train_loss": -7.28790283203125, "global_step": 198156, "epoch": 4718} {"train_loss": -7.256692409515381, "global_step": 198157, "epoch": 4718} {"train_loss": -7.139583110809326, "global_step": 198158, "epoch": 4718} {"train_loss": -7.272046089172363, "global_step": 198159, "epoch": 4718} {"train_loss": -7.2114152908325195, "global_step": 198160, "epoch": 4718} {"train_loss": -7.1715826988220215, "global_step": 198161, "epoch": 4718} {"train_loss": -7.195609092712402, "global_step": 198162, "epoch": 4718} {"train_loss": -7.278361797332764, "global_step": 198163, "epoch": 4718} {"train_loss": -7.123723983764648, "global_step": 198164, "epoch": 4718} {"train_loss": -7.335542678833008, "global_step": 198165, "epoch": 4718} {"train_loss": -7.0448899269104, "global_step": 198166, "epoch": 4718} {"train_loss": -7.108015537261963, "global_step": 198167, "epoch": 4718} {"train_loss": -7.2241740226745605, "global_step": 198168, "epoch": 4718} {"train_loss": -7.047290802001953, "global_step": 198169, "epoch": 4718} {"train_loss": -7.24162483215332, "global_step": 198170, "epoch": 4718} {"train_loss": -7.204954624176025, "global_step": 198171, "epoch": 4718} {"train_loss": -6.957337379455566, "global_step": 198172, "epoch": 4718} {"train_loss": -7.185525894165039, "global_step": 198173, "epoch": 4718} {"train_loss": -7.16038703918457, "global_step": 198174, "epoch": 4718} {"train_loss": -7.105820655822754, "global_step": 198175, "epoch": 4718} {"train_loss": -7.170309066772461, "global_step": 198176, "epoch": 4718} {"train_loss": -7.0042948722839355, "global_step": 198177, "epoch": 4718} {"train_loss": -7.0721564292907715, "global_step": 198178, "epoch": 4718} {"train_loss": -7.052563190460205, "global_step": 198179, "epoch": 4718} {"train_loss": -7.180380344390869, "global_step": 198180, "epoch": 4718} {"train_loss": -7.072600364685059, "global_step": 198181, "epoch": 4718} {"train_loss": -7.157539367675781, "global_step": 198182, "epoch": 4718} {"train_loss": -7.231014251708984, "global_step": 198183, "epoch": 4718} {"train_loss": -7.157025337219238, "global_step": 198184, "epoch": 4718} {"train_loss": -7.198376655578613, "global_step": 198185, "epoch": 4718} {"train_loss": -7.187182426452637, "global_step": 198186, "epoch": 4718} {"train_loss": -7.206698417663574, "global_step": 198187, "epoch": 4718} {"train_loss": -7.173854827880859, "global_step": 198188, "epoch": 4718} {"train_loss": -7.202159881591797, "global_step": 198189, "epoch": 4718} {"train_loss": -7.0316901206970215, "global_step": 198190, "epoch": 4718} {"train_loss": -7.117204666137695, "global_step": 198191, "epoch": 4718} {"train_loss": -7.164991855621338, "global_step": 198192, "epoch": 4718} {"train_loss": -7.180551052093506, "global_step": 198193, "epoch": 4718} {"train_loss": -7.220408916473389, "global_step": 198194, "epoch": 4718} {"train_loss": -7.251629829406738, "global_step": 198195, "epoch": 4718} {"train_loss": -7.1637797355651855, "global_step": 198196, "epoch": 4718} {"train_loss": -7.162955431711106, "global_step": 198197, "epoch": 4718, "val_loss": 69059.0859375} {"train_loss": -7.147409439086914, "global_step": 198198, "epoch": 4719} {"train_loss": -7.221495628356934, "global_step": 198199, "epoch": 4719} {"train_loss": -7.227099418640137, "global_step": 198200, "epoch": 4719} {"train_loss": -7.137404918670654, "global_step": 198201, "epoch": 4719} {"train_loss": -7.131839752197266, "global_step": 198202, "epoch": 4719} {"train_loss": -7.22373628616333, "global_step": 198203, "epoch": 4719} {"train_loss": -7.186716079711914, "global_step": 198204, "epoch": 4719} {"train_loss": -7.149147033691406, "global_step": 198205, "epoch": 4719} {"train_loss": -7.176771640777588, "global_step": 198206, "epoch": 4719} {"train_loss": -7.2509260177612305, "global_step": 198207, "epoch": 4719} {"train_loss": -7.2784013748168945, "global_step": 198208, "epoch": 4719} {"train_loss": -7.207376956939697, "global_step": 198209, "epoch": 4719} {"train_loss": -7.2644124031066895, "global_step": 198210, "epoch": 4719} {"train_loss": -7.292501449584961, "global_step": 198211, "epoch": 4719} {"train_loss": -7.163545608520508, "global_step": 198212, "epoch": 4719} {"train_loss": -7.237104415893555, "global_step": 198213, "epoch": 4719} {"train_loss": -7.190762996673584, "global_step": 198214, "epoch": 4719} {"train_loss": -7.174009799957275, "global_step": 198215, "epoch": 4719} {"train_loss": -7.154222011566162, "global_step": 198216, "epoch": 4719} {"train_loss": -7.184904098510742, "global_step": 198217, "epoch": 4719} {"train_loss": -7.176480293273926, "global_step": 198218, "epoch": 4719} {"train_loss": -7.152984619140625, "global_step": 198219, "epoch": 4719} {"train_loss": -7.220266819000244, "global_step": 198220, "epoch": 4719} {"train_loss": -7.261829376220703, "global_step": 198221, "epoch": 4719} {"train_loss": -7.136785507202148, "global_step": 198222, "epoch": 4719} {"train_loss": -7.221932888031006, "global_step": 198223, "epoch": 4719} {"train_loss": -7.08740234375, "global_step": 198224, "epoch": 4719} {"train_loss": -7.052818298339844, "global_step": 198225, "epoch": 4719} {"train_loss": -7.229209899902344, "global_step": 198226, "epoch": 4719} {"train_loss": -7.030597686767578, "global_step": 198227, "epoch": 4719} {"train_loss": -7.095998764038086, "global_step": 198228, "epoch": 4719} {"train_loss": -7.225298881530762, "global_step": 198229, "epoch": 4719} {"train_loss": -7.153894424438477, "global_step": 198230, "epoch": 4719} {"train_loss": -7.243800163269043, "global_step": 198231, "epoch": 4719} {"train_loss": -7.081793308258057, "global_step": 198232, "epoch": 4719} {"train_loss": -7.246021747589111, "global_step": 198233, "epoch": 4719} {"train_loss": -7.2093024253845215, "global_step": 198234, "epoch": 4719} {"train_loss": -7.161648750305176, "global_step": 198235, "epoch": 4719} {"train_loss": -7.170049667358398, "global_step": 198236, "epoch": 4719} {"train_loss": -7.166875839233398, "global_step": 198237, "epoch": 4719} {"train_loss": -7.172347068786621, "global_step": 198238, "epoch": 4719} {"train_loss": -7.182430119741531, "global_step": 198239, "epoch": 4719, "val_loss": 69067.734375} {"train_loss": -7.184774875640869, "global_step": 198240, "epoch": 4720} {"train_loss": -7.247366905212402, "global_step": 198241, "epoch": 4720} {"train_loss": -7.217752456665039, "global_step": 198242, "epoch": 4720} {"train_loss": -7.277717113494873, "global_step": 198243, "epoch": 4720} {"train_loss": -7.233406066894531, "global_step": 198244, "epoch": 4720} {"train_loss": -7.246786594390869, "global_step": 198245, "epoch": 4720} {"train_loss": -7.257907867431641, "global_step": 198246, "epoch": 4720} {"train_loss": -7.33621072769165, "global_step": 198247, "epoch": 4720} {"train_loss": -7.306238174438477, "global_step": 198248, "epoch": 4720} {"train_loss": -7.269601821899414, "global_step": 198249, "epoch": 4720} {"train_loss": -7.284558296203613, "global_step": 198250, "epoch": 4720} {"train_loss": -7.215350151062012, "global_step": 198251, "epoch": 4720} {"train_loss": -7.292874336242676, "global_step": 198252, "epoch": 4720} {"train_loss": -7.1526594161987305, "global_step": 198253, "epoch": 4720} {"train_loss": -7.217686653137207, "global_step": 198254, "epoch": 4720} {"train_loss": -7.271671295166016, "global_step": 198255, "epoch": 4720} {"train_loss": -7.237720012664795, "global_step": 198256, "epoch": 4720} {"train_loss": -7.187949180603027, "global_step": 198257, "epoch": 4720} {"train_loss": -7.298434257507324, "global_step": 198258, "epoch": 4720} {"train_loss": -7.263800621032715, "global_step": 198259, "epoch": 4720} {"train_loss": -7.227387428283691, "global_step": 198260, "epoch": 4720} {"train_loss": -7.175583839416504, "global_step": 198261, "epoch": 4720} {"train_loss": -7.183598518371582, "global_step": 198262, "epoch": 4720} {"train_loss": -7.214041233062744, "global_step": 198263, "epoch": 4720} {"train_loss": -7.183724880218506, "global_step": 198264, "epoch": 4720} {"train_loss": -7.294280052185059, "global_step": 198265, "epoch": 4720} {"train_loss": -7.117288589477539, "global_step": 198266, "epoch": 4720} {"train_loss": -7.310656547546387, "global_step": 198267, "epoch": 4720} {"train_loss": -7.156163215637207, "global_step": 198268, "epoch": 4720} {"train_loss": -7.253681182861328, "global_step": 198269, "epoch": 4720} {"train_loss": -7.1989922523498535, "global_step": 198270, "epoch": 4720} {"train_loss": -7.234825611114502, "global_step": 198271, "epoch": 4720} {"train_loss": -7.272490501403809, "global_step": 198272, "epoch": 4720} {"train_loss": -7.259494781494141, "global_step": 198273, "epoch": 4720} {"train_loss": -7.20634651184082, "global_step": 198274, "epoch": 4720} {"train_loss": -7.280640602111816, "global_step": 198275, "epoch": 4720} {"train_loss": -7.342004776000977, "global_step": 198276, "epoch": 4720} {"train_loss": -7.244315147399902, "global_step": 198277, "epoch": 4720} {"train_loss": -7.2583818435668945, "global_step": 198278, "epoch": 4720} {"train_loss": -7.373617649078369, "global_step": 198279, "epoch": 4720} {"train_loss": -7.2344255447387695, "global_step": 198280, "epoch": 4720} {"train_loss": -7.247368403843471, "global_step": 198281, "epoch": 4720, "val_loss": 68967.9921875} {"train_loss": -7.310611724853516, "global_step": 198282, "epoch": 4721} {"train_loss": -7.357631683349609, "global_step": 198283, "epoch": 4721} {"train_loss": -7.269885063171387, "global_step": 198284, "epoch": 4721} {"train_loss": -7.180392265319824, "global_step": 198285, "epoch": 4721} {"train_loss": -7.128561496734619, "global_step": 198286, "epoch": 4721} {"train_loss": -7.330311298370361, "global_step": 198287, "epoch": 4721} {"train_loss": -7.142016410827637, "global_step": 198288, "epoch": 4721} {"train_loss": -7.233890056610107, "global_step": 198289, "epoch": 4721} {"train_loss": -7.316226005554199, "global_step": 198290, "epoch": 4721} {"train_loss": -7.170356750488281, "global_step": 198291, "epoch": 4721} {"train_loss": -7.092637062072754, "global_step": 198292, "epoch": 4721} {"train_loss": -7.2186689376831055, "global_step": 198293, "epoch": 4721} {"train_loss": -7.122410774230957, "global_step": 198294, "epoch": 4721} {"train_loss": -7.084105968475342, "global_step": 198295, "epoch": 4721} {"train_loss": -7.216649055480957, "global_step": 198296, "epoch": 4721} {"train_loss": -7.343249320983887, "global_step": 198297, "epoch": 4721} {"train_loss": -7.075913429260254, "global_step": 198298, "epoch": 4721} {"train_loss": -7.175137519836426, "global_step": 198299, "epoch": 4721} {"train_loss": -7.1352081298828125, "global_step": 198300, "epoch": 4721} {"train_loss": -7.186558723449707, "global_step": 198301, "epoch": 4721} {"train_loss": -7.187806606292725, "global_step": 198302, "epoch": 4721} {"train_loss": -7.069263935089111, "global_step": 198303, "epoch": 4721} {"train_loss": -7.038243293762207, "global_step": 198304, "epoch": 4721} {"train_loss": -7.110511779785156, "global_step": 198305, "epoch": 4721} {"train_loss": -7.324466705322266, "global_step": 198306, "epoch": 4721} {"train_loss": -7.10072660446167, "global_step": 198307, "epoch": 4721} {"train_loss": -7.207488059997559, "global_step": 198308, "epoch": 4721} {"train_loss": -7.218792915344238, "global_step": 198309, "epoch": 4721} {"train_loss": -7.173957824707031, "global_step": 198310, "epoch": 4721} {"train_loss": -7.126750946044922, "global_step": 198311, "epoch": 4721} {"train_loss": -7.189355850219727, "global_step": 198312, "epoch": 4721} {"train_loss": -7.1289520263671875, "global_step": 198313, "epoch": 4721} {"train_loss": -7.315871238708496, "global_step": 198314, "epoch": 4721} {"train_loss": -7.192284107208252, "global_step": 198315, "epoch": 4721} {"train_loss": -7.132547378540039, "global_step": 198316, "epoch": 4721} {"train_loss": -7.139461994171143, "global_step": 198317, "epoch": 4721} {"train_loss": -7.20537805557251, "global_step": 198318, "epoch": 4721} {"train_loss": -7.265142917633057, "global_step": 198319, "epoch": 4721} {"train_loss": -7.144204616546631, "global_step": 198320, "epoch": 4721} {"train_loss": -7.111408233642578, "global_step": 198321, "epoch": 4721} {"train_loss": -7.181711673736572, "global_step": 198322, "epoch": 4721} {"train_loss": -7.186433417456491, "global_step": 198323, "epoch": 4721, "val_loss": 69069.921875} {"train_loss": -7.198792934417725, "global_step": 198324, "epoch": 4722} {"train_loss": -7.282679557800293, "global_step": 198325, "epoch": 4722} {"train_loss": -7.148628234863281, "global_step": 198326, "epoch": 4722} {"train_loss": -7.206564903259277, "global_step": 198327, "epoch": 4722} {"train_loss": -7.3144989013671875, "global_step": 198328, "epoch": 4722} {"train_loss": -7.236001014709473, "global_step": 198329, "epoch": 4722} {"train_loss": -7.216543197631836, "global_step": 198330, "epoch": 4722} {"train_loss": -7.242461204528809, "global_step": 198331, "epoch": 4722} {"train_loss": -7.074130058288574, "global_step": 198332, "epoch": 4722} {"train_loss": -7.264016151428223, "global_step": 198333, "epoch": 4722} {"train_loss": -7.2041707038879395, "global_step": 198334, "epoch": 4722} {"train_loss": -7.186819076538086, "global_step": 198335, "epoch": 4722} {"train_loss": -7.206881999969482, "global_step": 198336, "epoch": 4722} {"train_loss": -7.216343402862549, "global_step": 198337, "epoch": 4722} {"train_loss": -7.30916690826416, "global_step": 198338, "epoch": 4722} {"train_loss": -7.105420112609863, "global_step": 198339, "epoch": 4722} {"train_loss": -7.280910015106201, "global_step": 198340, "epoch": 4722} {"train_loss": -7.253841400146484, "global_step": 198341, "epoch": 4722} {"train_loss": -7.238526344299316, "global_step": 198342, "epoch": 4722} {"train_loss": -7.193960189819336, "global_step": 198343, "epoch": 4722} {"train_loss": -7.351622581481934, "global_step": 198344, "epoch": 4722} {"train_loss": -7.270862579345703, "global_step": 198345, "epoch": 4722} {"train_loss": -7.279948711395264, "global_step": 198346, "epoch": 4722} {"train_loss": -7.2381768226623535, "global_step": 198347, "epoch": 4722} {"train_loss": -7.155308723449707, "global_step": 198348, "epoch": 4722} {"train_loss": -7.276336193084717, "global_step": 198349, "epoch": 4722} {"train_loss": -7.201842308044434, "global_step": 198350, "epoch": 4722} {"train_loss": -7.162883758544922, "global_step": 198351, "epoch": 4722} {"train_loss": -7.204486846923828, "global_step": 198352, "epoch": 4722} {"train_loss": -7.0719685554504395, "global_step": 198353, "epoch": 4722} {"train_loss": -7.124974250793457, "global_step": 198354, "epoch": 4722} {"train_loss": -7.096351146697998, "global_step": 198355, "epoch": 4722} {"train_loss": -7.21003532409668, "global_step": 198356, "epoch": 4722} {"train_loss": -7.254430770874023, "global_step": 198357, "epoch": 4722} {"train_loss": -7.2412261962890625, "global_step": 198358, "epoch": 4722} {"train_loss": -7.310490608215332, "global_step": 198359, "epoch": 4722} {"train_loss": -7.140700340270996, "global_step": 198360, "epoch": 4722} {"train_loss": -7.30543851852417, "global_step": 198361, "epoch": 4722} {"train_loss": -7.151279449462891, "global_step": 198362, "epoch": 4722} {"train_loss": -7.242097854614258, "global_step": 198363, "epoch": 4722} {"train_loss": -7.275354385375977, "global_step": 198364, "epoch": 4722} {"train_loss": -7.2158238887786865, "global_step": 198365, "epoch": 4722, "val_loss": 68950.203125} {"train_loss": -7.2231292724609375, "global_step": 198366, "epoch": 4723} {"train_loss": -7.296929359436035, "global_step": 198367, "epoch": 4723} {"train_loss": -7.279132843017578, "global_step": 198368, "epoch": 4723} {"train_loss": -7.244981288909912, "global_step": 198369, "epoch": 4723} {"train_loss": -7.156586647033691, "global_step": 198370, "epoch": 4723} {"train_loss": -7.230432510375977, "global_step": 198371, "epoch": 4723} {"train_loss": -7.338592529296875, "global_step": 198372, "epoch": 4723} {"train_loss": -7.317468643188477, "global_step": 198373, "epoch": 4723} {"train_loss": -7.347512245178223, "global_step": 198374, "epoch": 4723} {"train_loss": -7.295839786529541, "global_step": 198375, "epoch": 4723} {"train_loss": -7.140504837036133, "global_step": 198376, "epoch": 4723} {"train_loss": -7.3000898361206055, "global_step": 198377, "epoch": 4723} {"train_loss": -7.223722457885742, "global_step": 198378, "epoch": 4723} {"train_loss": -7.35333776473999, "global_step": 198379, "epoch": 4723} {"train_loss": -7.237687110900879, "global_step": 198380, "epoch": 4723} {"train_loss": -7.39266300201416, "global_step": 198381, "epoch": 4723} {"train_loss": -7.252252578735352, "global_step": 198382, "epoch": 4723} {"train_loss": -7.225618839263916, "global_step": 198383, "epoch": 4723} {"train_loss": -7.23997688293457, "global_step": 198384, "epoch": 4723} {"train_loss": -7.199723243713379, "global_step": 198385, "epoch": 4723} {"train_loss": -7.255273342132568, "global_step": 198386, "epoch": 4723} {"train_loss": -7.2215189933776855, "global_step": 198387, "epoch": 4723} {"train_loss": -7.219801902770996, "global_step": 198388, "epoch": 4723} {"train_loss": -7.219423294067383, "global_step": 198389, "epoch": 4723} {"train_loss": -7.22988748550415, "global_step": 198390, "epoch": 4723} {"train_loss": -7.109636306762695, "global_step": 198391, "epoch": 4723} {"train_loss": -7.077864646911621, "global_step": 198392, "epoch": 4723} {"train_loss": -7.172516822814941, "global_step": 198393, "epoch": 4723} {"train_loss": -7.206384181976318, "global_step": 198394, "epoch": 4723} {"train_loss": -7.114604949951172, "global_step": 198395, "epoch": 4723} {"train_loss": -7.166898727416992, "global_step": 198396, "epoch": 4723} {"train_loss": -7.074341773986816, "global_step": 198397, "epoch": 4723} {"train_loss": -6.948404312133789, "global_step": 198398, "epoch": 4723} {"train_loss": -7.098618507385254, "global_step": 198399, "epoch": 4723} {"train_loss": -7.127939224243164, "global_step": 198400, "epoch": 4723} {"train_loss": -7.113923072814941, "global_step": 198401, "epoch": 4723} {"train_loss": -7.120220184326172, "global_step": 198402, "epoch": 4723} {"train_loss": -6.988982677459717, "global_step": 198403, "epoch": 4723} {"train_loss": -7.194149017333984, "global_step": 198404, "epoch": 4723} {"train_loss": -6.987046241760254, "global_step": 198405, "epoch": 4723} {"train_loss": -7.024177074432373, "global_step": 198406, "epoch": 4723} {"train_loss": -7.192627282369704, "global_step": 198407, "epoch": 4723, "val_loss": 69092.421875} {"train_loss": -6.97061014175415, "global_step": 198408, "epoch": 4724} {"train_loss": -7.173671722412109, "global_step": 198409, "epoch": 4724} {"train_loss": -7.188836097717285, "global_step": 198410, "epoch": 4724} {"train_loss": -7.111840724945068, "global_step": 198411, "epoch": 4724} {"train_loss": -7.16074275970459, "global_step": 198412, "epoch": 4724} {"train_loss": -7.113529205322266, "global_step": 198413, "epoch": 4724} {"train_loss": -7.1695356369018555, "global_step": 198414, "epoch": 4724} {"train_loss": -7.122089385986328, "global_step": 198415, "epoch": 4724} {"train_loss": -7.202276706695557, "global_step": 198416, "epoch": 4724} {"train_loss": -7.118903636932373, "global_step": 198417, "epoch": 4724} {"train_loss": -7.176949501037598, "global_step": 198418, "epoch": 4724} {"train_loss": -7.144184112548828, "global_step": 198419, "epoch": 4724} {"train_loss": -7.154755592346191, "global_step": 198420, "epoch": 4724} {"train_loss": -7.1898722648620605, "global_step": 198421, "epoch": 4724} {"train_loss": -7.147310256958008, "global_step": 198422, "epoch": 4724} {"train_loss": -7.222685813903809, "global_step": 198423, "epoch": 4724} {"train_loss": -7.254668712615967, "global_step": 198424, "epoch": 4724} {"train_loss": -7.155032157897949, "global_step": 198425, "epoch": 4724} {"train_loss": -7.192005634307861, "global_step": 198426, "epoch": 4724} {"train_loss": -7.177563190460205, "global_step": 198427, "epoch": 4724} {"train_loss": -7.275763511657715, "global_step": 198428, "epoch": 4724} {"train_loss": -7.214462757110596, "global_step": 198429, "epoch": 4724} {"train_loss": -7.257108688354492, "global_step": 198430, "epoch": 4724} {"train_loss": -7.374749660491943, "global_step": 198431, "epoch": 4724} {"train_loss": -7.1048126220703125, "global_step": 198432, "epoch": 4724} {"train_loss": -7.293811798095703, "global_step": 198433, "epoch": 4724} {"train_loss": -7.197620868682861, "global_step": 198434, "epoch": 4724} {"train_loss": -7.250218868255615, "global_step": 198435, "epoch": 4724} {"train_loss": -7.191369533538818, "global_step": 198436, "epoch": 4724} {"train_loss": -7.23972225189209, "global_step": 198437, "epoch": 4724} {"train_loss": -7.301868438720703, "global_step": 198438, "epoch": 4724} {"train_loss": -7.3240132331848145, "global_step": 198439, "epoch": 4724} {"train_loss": -7.329411506652832, "global_step": 198440, "epoch": 4724} {"train_loss": -7.14107608795166, "global_step": 198441, "epoch": 4724} {"train_loss": -7.218103408813477, "global_step": 198442, "epoch": 4724} {"train_loss": -7.274526596069336, "global_step": 198443, "epoch": 4724} {"train_loss": -6.985812187194824, "global_step": 198444, "epoch": 4724} {"train_loss": -7.024229526519775, "global_step": 198445, "epoch": 4724} {"train_loss": -7.2016987800598145, "global_step": 198446, "epoch": 4724} {"train_loss": -7.030308723449707, "global_step": 198447, "epoch": 4724} {"train_loss": -7.109675407409668, "global_step": 198448, "epoch": 4724} {"train_loss": -7.183473859514509, "global_step": 198449, "epoch": 4724, "val_loss": 69123.3125} {"train_loss": -7.101685523986816, "global_step": 198450, "epoch": 4725} {"train_loss": -7.2400383949279785, "global_step": 198451, "epoch": 4725} {"train_loss": -7.128793716430664, "global_step": 198452, "epoch": 4725} {"train_loss": -7.345731735229492, "global_step": 198453, "epoch": 4725} {"train_loss": -7.130743980407715, "global_step": 198454, "epoch": 4725} {"train_loss": -7.134692668914795, "global_step": 198455, "epoch": 4725} {"train_loss": -7.312925338745117, "global_step": 198456, "epoch": 4725} {"train_loss": -7.11494255065918, "global_step": 198457, "epoch": 4725} {"train_loss": -7.195912837982178, "global_step": 198458, "epoch": 4725} {"train_loss": -7.078755855560303, "global_step": 198459, "epoch": 4725} {"train_loss": -7.0827202796936035, "global_step": 198460, "epoch": 4725} {"train_loss": -7.171356678009033, "global_step": 198461, "epoch": 4725} {"train_loss": -7.128060340881348, "global_step": 198462, "epoch": 4725} {"train_loss": -7.049888610839844, "global_step": 198463, "epoch": 4725} {"train_loss": -7.23926305770874, "global_step": 198464, "epoch": 4725} {"train_loss": -7.19281530380249, "global_step": 198465, "epoch": 4725} {"train_loss": -7.25454044342041, "global_step": 198466, "epoch": 4725} {"train_loss": -7.3370513916015625, "global_step": 198467, "epoch": 4725} {"train_loss": -7.3031206130981445, "global_step": 198468, "epoch": 4725} {"train_loss": -7.2454729080200195, "global_step": 198469, "epoch": 4725} {"train_loss": -7.152327537536621, "global_step": 198470, "epoch": 4725} {"train_loss": -7.215423107147217, "global_step": 198471, "epoch": 4725} {"train_loss": -7.217363357543945, "global_step": 198472, "epoch": 4725} {"train_loss": -7.15590763092041, "global_step": 198473, "epoch": 4725} {"train_loss": -7.312838077545166, "global_step": 198474, "epoch": 4725} {"train_loss": -7.314784526824951, "global_step": 198475, "epoch": 4725} {"train_loss": -7.244515895843506, "global_step": 198476, "epoch": 4725} {"train_loss": -7.1531829833984375, "global_step": 198477, "epoch": 4725} {"train_loss": -7.2298688888549805, "global_step": 198478, "epoch": 4725} {"train_loss": -7.39622688293457, "global_step": 198479, "epoch": 4725} {"train_loss": -7.185950756072998, "global_step": 198480, "epoch": 4725} {"train_loss": -7.263175964355469, "global_step": 198481, "epoch": 4725} {"train_loss": -7.273632049560547, "global_step": 198482, "epoch": 4725} {"train_loss": -7.321846008300781, "global_step": 198483, "epoch": 4725} {"train_loss": -7.211779594421387, "global_step": 198484, "epoch": 4725} {"train_loss": -7.256159782409668, "global_step": 198485, "epoch": 4725} {"train_loss": -7.289355278015137, "global_step": 198486, "epoch": 4725} {"train_loss": -7.248649597167969, "global_step": 198487, "epoch": 4725} {"train_loss": -7.242269992828369, "global_step": 198488, "epoch": 4725} {"train_loss": -7.308025360107422, "global_step": 198489, "epoch": 4725} {"train_loss": -7.209880352020264, "global_step": 198490, "epoch": 4725} {"train_loss": -7.219899200257801, "global_step": 198491, "epoch": 4725, "val_loss": 68991.78125} {"train_loss": -7.247820854187012, "global_step": 198492, "epoch": 4726} {"train_loss": -7.311837196350098, "global_step": 198493, "epoch": 4726} {"train_loss": -7.292219638824463, "global_step": 198494, "epoch": 4726} {"train_loss": -7.154967308044434, "global_step": 198495, "epoch": 4726} {"train_loss": -7.282312393188477, "global_step": 198496, "epoch": 4726} {"train_loss": -7.207607746124268, "global_step": 198497, "epoch": 4726} {"train_loss": -7.23459005355835, "global_step": 198498, "epoch": 4726} {"train_loss": -7.172386169433594, "global_step": 198499, "epoch": 4726} {"train_loss": -7.262451648712158, "global_step": 198500, "epoch": 4726} {"train_loss": -7.28052282333374, "global_step": 198501, "epoch": 4726} {"train_loss": -7.189797878265381, "global_step": 198502, "epoch": 4726} {"train_loss": -7.283205986022949, "global_step": 198503, "epoch": 4726} {"train_loss": -7.158430099487305, "global_step": 198504, "epoch": 4726} {"train_loss": -7.153107166290283, "global_step": 198505, "epoch": 4726} {"train_loss": -7.143325328826904, "global_step": 198506, "epoch": 4726} {"train_loss": -7.30325174331665, "global_step": 198507, "epoch": 4726} {"train_loss": -7.248878479003906, "global_step": 198508, "epoch": 4726} {"train_loss": -7.309842586517334, "global_step": 198509, "epoch": 4726} {"train_loss": -7.271944046020508, "global_step": 198510, "epoch": 4726} {"train_loss": -7.168768882751465, "global_step": 198511, "epoch": 4726} {"train_loss": -7.14228630065918, "global_step": 198512, "epoch": 4726} {"train_loss": -7.111108779907227, "global_step": 198513, "epoch": 4726} {"train_loss": -7.046621322631836, "global_step": 198514, "epoch": 4726} {"train_loss": -7.079794406890869, "global_step": 198515, "epoch": 4726} {"train_loss": -7.311922550201416, "global_step": 198516, "epoch": 4726} {"train_loss": -7.0845465660095215, "global_step": 198517, "epoch": 4726} {"train_loss": -7.051361083984375, "global_step": 198518, "epoch": 4726} {"train_loss": -7.175398826599121, "global_step": 198519, "epoch": 4726} {"train_loss": -7.138152122497559, "global_step": 198520, "epoch": 4726} {"train_loss": -6.982865333557129, "global_step": 198521, "epoch": 4726} {"train_loss": -7.197543621063232, "global_step": 198522, "epoch": 4726} {"train_loss": -7.192010402679443, "global_step": 198523, "epoch": 4726} {"train_loss": -7.143503665924072, "global_step": 198524, "epoch": 4726} {"train_loss": -7.128046035766602, "global_step": 198525, "epoch": 4726} {"train_loss": -7.127599716186523, "global_step": 198526, "epoch": 4726} {"train_loss": -7.116885185241699, "global_step": 198527, "epoch": 4726} {"train_loss": -7.169390678405762, "global_step": 198528, "epoch": 4726} {"train_loss": -7.209388256072998, "global_step": 198529, "epoch": 4726} {"train_loss": -7.115129470825195, "global_step": 198530, "epoch": 4726} {"train_loss": -7.199355125427246, "global_step": 198531, "epoch": 4726} {"train_loss": -7.128537178039551, "global_step": 198532, "epoch": 4726} {"train_loss": -7.183900696890695, "global_step": 198533, "epoch": 4726, "val_loss": 69019.5390625} {"train_loss": -7.247185230255127, "global_step": 198534, "epoch": 4727} {"train_loss": -7.1813249588012695, "global_step": 198535, "epoch": 4727} {"train_loss": -7.1795525550842285, "global_step": 198536, "epoch": 4727} {"train_loss": -7.159061431884766, "global_step": 198537, "epoch": 4727} {"train_loss": -7.182171821594238, "global_step": 198538, "epoch": 4727} {"train_loss": -7.088468551635742, "global_step": 198539, "epoch": 4727} {"train_loss": -7.258408546447754, "global_step": 198540, "epoch": 4727} {"train_loss": -7.2228875160217285, "global_step": 198541, "epoch": 4727} {"train_loss": -7.149709701538086, "global_step": 198542, "epoch": 4727} {"train_loss": -7.087547779083252, "global_step": 198543, "epoch": 4727} {"train_loss": -7.203210830688477, "global_step": 198544, "epoch": 4727} {"train_loss": -7.1303205490112305, "global_step": 198545, "epoch": 4727} {"train_loss": -7.166752338409424, "global_step": 198546, "epoch": 4727} {"train_loss": -7.245495319366455, "global_step": 198547, "epoch": 4727} {"train_loss": -7.130468368530273, "global_step": 198548, "epoch": 4727} {"train_loss": -7.32574462890625, "global_step": 198549, "epoch": 4727} {"train_loss": -7.053512096405029, "global_step": 198550, "epoch": 4727} {"train_loss": -7.15623664855957, "global_step": 198551, "epoch": 4727} {"train_loss": -7.1752214431762695, "global_step": 198552, "epoch": 4727} {"train_loss": -7.291581153869629, "global_step": 198553, "epoch": 4727} {"train_loss": -7.214076995849609, "global_step": 198554, "epoch": 4727} {"train_loss": -7.0277910232543945, "global_step": 198555, "epoch": 4727} {"train_loss": -7.1970953941345215, "global_step": 198556, "epoch": 4727} {"train_loss": -7.024470329284668, "global_step": 198557, "epoch": 4727} {"train_loss": -7.100574016571045, "global_step": 198558, "epoch": 4727} {"train_loss": -7.184001445770264, "global_step": 198559, "epoch": 4727} {"train_loss": -6.996448040008545, "global_step": 198560, "epoch": 4727} {"train_loss": -7.111883163452148, "global_step": 198561, "epoch": 4727} {"train_loss": -7.139772415161133, "global_step": 198562, "epoch": 4727} {"train_loss": -7.102504730224609, "global_step": 198563, "epoch": 4727} {"train_loss": -7.184356212615967, "global_step": 198564, "epoch": 4727} {"train_loss": -7.115911960601807, "global_step": 198565, "epoch": 4727} {"train_loss": -7.093033790588379, "global_step": 198566, "epoch": 4727} {"train_loss": -7.092188835144043, "global_step": 198567, "epoch": 4727} {"train_loss": -7.114949703216553, "global_step": 198568, "epoch": 4727} {"train_loss": -7.200918674468994, "global_step": 198569, "epoch": 4727} {"train_loss": -7.066131591796875, "global_step": 198570, "epoch": 4727} {"train_loss": -6.946613788604736, "global_step": 198571, "epoch": 4727} {"train_loss": -7.255434036254883, "global_step": 198572, "epoch": 4727} {"train_loss": -7.146342754364014, "global_step": 198573, "epoch": 4727} {"train_loss": -7.242629051208496, "global_step": 198574, "epoch": 4727} {"train_loss": -7.15385145232791, "global_step": 198575, "epoch": 4727, "val_loss": 68989.390625} {"train_loss": -7.194492340087891, "global_step": 198576, "epoch": 4728} {"train_loss": -7.261049270629883, "global_step": 198577, "epoch": 4728} {"train_loss": -7.1607160568237305, "global_step": 198578, "epoch": 4728} {"train_loss": -7.2255120277404785, "global_step": 198579, "epoch": 4728} {"train_loss": -7.189289093017578, "global_step": 198580, "epoch": 4728} {"train_loss": -7.167044639587402, "global_step": 198581, "epoch": 4728} {"train_loss": -7.21357536315918, "global_step": 198582, "epoch": 4728} {"train_loss": -7.245670318603516, "global_step": 198583, "epoch": 4728} {"train_loss": -7.367956638336182, "global_step": 198584, "epoch": 4728} {"train_loss": -7.269535064697266, "global_step": 198585, "epoch": 4728} {"train_loss": -7.250494956970215, "global_step": 198586, "epoch": 4728} {"train_loss": -7.212233543395996, "global_step": 198587, "epoch": 4728} {"train_loss": -7.218234062194824, "global_step": 198588, "epoch": 4728} {"train_loss": -7.234834671020508, "global_step": 198589, "epoch": 4728} {"train_loss": -7.167577743530273, "global_step": 198590, "epoch": 4728} {"train_loss": -7.316534996032715, "global_step": 198591, "epoch": 4728} {"train_loss": -7.347895622253418, "global_step": 198592, "epoch": 4728} {"train_loss": -7.165858268737793, "global_step": 198593, "epoch": 4728} {"train_loss": -7.273686408996582, "global_step": 198594, "epoch": 4728} {"train_loss": -7.169841766357422, "global_step": 198595, "epoch": 4728} {"train_loss": -7.049151420593262, "global_step": 198596, "epoch": 4728} {"train_loss": -7.219793319702148, "global_step": 198597, "epoch": 4728} {"train_loss": -7.106295585632324, "global_step": 198598, "epoch": 4728} {"train_loss": -7.230771541595459, "global_step": 198599, "epoch": 4728} {"train_loss": -7.24497127532959, "global_step": 198600, "epoch": 4728} {"train_loss": -7.119672775268555, "global_step": 198601, "epoch": 4728} {"train_loss": -7.296797275543213, "global_step": 198602, "epoch": 4728} {"train_loss": -7.141146183013916, "global_step": 198603, "epoch": 4728} {"train_loss": -7.0425543785095215, "global_step": 198604, "epoch": 4728} {"train_loss": -7.254277229309082, "global_step": 198605, "epoch": 4728} {"train_loss": -7.146395683288574, "global_step": 198606, "epoch": 4728} {"train_loss": -7.190636157989502, "global_step": 198607, "epoch": 4728} {"train_loss": -7.197434425354004, "global_step": 198608, "epoch": 4728} {"train_loss": -7.169876575469971, "global_step": 198609, "epoch": 4728} {"train_loss": -7.145139694213867, "global_step": 198610, "epoch": 4728} {"train_loss": -7.009871006011963, "global_step": 198611, "epoch": 4728} {"train_loss": -7.239638805389404, "global_step": 198612, "epoch": 4728} {"train_loss": -7.035345077514648, "global_step": 198613, "epoch": 4728} {"train_loss": -7.144883155822754, "global_step": 198614, "epoch": 4728} {"train_loss": -7.050205230712891, "global_step": 198615, "epoch": 4728} {"train_loss": -7.240507125854492, "global_step": 198616, "epoch": 4728} {"train_loss": -7.194453387033372, "global_step": 198617, "epoch": 4728, "val_loss": 69073.953125} {"train_loss": -7.10060977935791, "global_step": 198618, "epoch": 4729} {"train_loss": -7.264188289642334, "global_step": 198619, "epoch": 4729} {"train_loss": -7.108593463897705, "global_step": 198620, "epoch": 4729} {"train_loss": -7.127666473388672, "global_step": 198621, "epoch": 4729} {"train_loss": -7.10246467590332, "global_step": 198622, "epoch": 4729} {"train_loss": -7.182498931884766, "global_step": 198623, "epoch": 4729} {"train_loss": -7.1458635330200195, "global_step": 198624, "epoch": 4729} {"train_loss": -7.200328826904297, "global_step": 198625, "epoch": 4729} {"train_loss": -7.1629180908203125, "global_step": 198626, "epoch": 4729} {"train_loss": -7.18609619140625, "global_step": 198627, "epoch": 4729} {"train_loss": -7.2711181640625, "global_step": 198628, "epoch": 4729} {"train_loss": -7.105898380279541, "global_step": 198629, "epoch": 4729} {"train_loss": -7.209009170532227, "global_step": 198630, "epoch": 4729} {"train_loss": -7.067513465881348, "global_step": 198631, "epoch": 4729} {"train_loss": -7.268466949462891, "global_step": 198632, "epoch": 4729} {"train_loss": -7.1465277671813965, "global_step": 198633, "epoch": 4729} {"train_loss": -7.219154357910156, "global_step": 198634, "epoch": 4729} {"train_loss": -7.284391403198242, "global_step": 198635, "epoch": 4729} {"train_loss": -7.211357593536377, "global_step": 198636, "epoch": 4729} {"train_loss": -7.160953044891357, "global_step": 198637, "epoch": 4729} {"train_loss": -7.160440921783447, "global_step": 198638, "epoch": 4729} {"train_loss": -7.178460121154785, "global_step": 198639, "epoch": 4729} {"train_loss": -7.210020065307617, "global_step": 198640, "epoch": 4729} {"train_loss": -7.076982498168945, "global_step": 198641, "epoch": 4729} {"train_loss": -7.010626792907715, "global_step": 198642, "epoch": 4729} {"train_loss": -7.380038738250732, "global_step": 198643, "epoch": 4729} {"train_loss": -7.1082587242126465, "global_step": 198644, "epoch": 4729} {"train_loss": -7.219040393829346, "global_step": 198645, "epoch": 4729} {"train_loss": -7.142457008361816, "global_step": 198646, "epoch": 4729} {"train_loss": -7.21895694732666, "global_step": 198647, "epoch": 4729} {"train_loss": -7.067746639251709, "global_step": 198648, "epoch": 4729} {"train_loss": -7.12474250793457, "global_step": 198649, "epoch": 4729} {"train_loss": -7.186844348907471, "global_step": 198650, "epoch": 4729} {"train_loss": -7.1203999519348145, "global_step": 198651, "epoch": 4729} {"train_loss": -7.204916000366211, "global_step": 198652, "epoch": 4729} {"train_loss": -7.182486534118652, "global_step": 198653, "epoch": 4729} {"train_loss": -7.220285415649414, "global_step": 198654, "epoch": 4729} {"train_loss": -7.150973796844482, "global_step": 198655, "epoch": 4729} {"train_loss": -7.161230087280273, "global_step": 198656, "epoch": 4729} {"train_loss": -7.166600704193115, "global_step": 198657, "epoch": 4729} {"train_loss": -7.069279193878174, "global_step": 198658, "epoch": 4729} {"train_loss": -7.169288578487578, "global_step": 198659, "epoch": 4729, "val_loss": 68978.3203125} {"train_loss": -7.112227439880371, "global_step": 198660, "epoch": 4730} {"train_loss": -7.175667762756348, "global_step": 198661, "epoch": 4730} {"train_loss": -7.237502098083496, "global_step": 198662, "epoch": 4730} {"train_loss": -7.263480186462402, "global_step": 198663, "epoch": 4730} {"train_loss": -7.275712490081787, "global_step": 198664, "epoch": 4730} {"train_loss": -7.1847968101501465, "global_step": 198665, "epoch": 4730} {"train_loss": -7.268845558166504, "global_step": 198666, "epoch": 4730} {"train_loss": -7.321922779083252, "global_step": 198667, "epoch": 4730} {"train_loss": -7.25275182723999, "global_step": 198668, "epoch": 4730} {"train_loss": -7.235049247741699, "global_step": 198669, "epoch": 4730} {"train_loss": -7.175421714782715, "global_step": 198670, "epoch": 4730} {"train_loss": -7.228764533996582, "global_step": 198671, "epoch": 4730} {"train_loss": -7.233791828155518, "global_step": 198672, "epoch": 4730} {"train_loss": -7.340943336486816, "global_step": 198673, "epoch": 4730} {"train_loss": -7.346308708190918, "global_step": 198674, "epoch": 4730} {"train_loss": -7.350701332092285, "global_step": 198675, "epoch": 4730} {"train_loss": -7.360409736633301, "global_step": 198676, "epoch": 4730} {"train_loss": -7.229074478149414, "global_step": 198677, "epoch": 4730} {"train_loss": -7.272815704345703, "global_step": 198678, "epoch": 4730} {"train_loss": -7.224268436431885, "global_step": 198679, "epoch": 4730} {"train_loss": -7.215465068817139, "global_step": 198680, "epoch": 4730} {"train_loss": -7.217286586761475, "global_step": 198681, "epoch": 4730} {"train_loss": -7.240576267242432, "global_step": 198682, "epoch": 4730} {"train_loss": -7.211536407470703, "global_step": 198683, "epoch": 4730} {"train_loss": -7.214755058288574, "global_step": 198684, "epoch": 4730} {"train_loss": -7.215771675109863, "global_step": 198685, "epoch": 4730} {"train_loss": -7.295799255371094, "global_step": 198686, "epoch": 4730} {"train_loss": -7.241357326507568, "global_step": 198687, "epoch": 4730} {"train_loss": -7.219618320465088, "global_step": 198688, "epoch": 4730} {"train_loss": -7.359386444091797, "global_step": 198689, "epoch": 4730} {"train_loss": -7.235829830169678, "global_step": 198690, "epoch": 4730} {"train_loss": -7.3424973487854, "global_step": 198691, "epoch": 4730} {"train_loss": -7.261544227600098, "global_step": 198692, "epoch": 4730} {"train_loss": -7.213447093963623, "global_step": 198693, "epoch": 4730} {"train_loss": -7.184566974639893, "global_step": 198694, "epoch": 4730} {"train_loss": -7.18604040145874, "global_step": 198695, "epoch": 4730} {"train_loss": -7.332558631896973, "global_step": 198696, "epoch": 4730} {"train_loss": -7.188582420349121, "global_step": 198697, "epoch": 4730} {"train_loss": -7.239838123321533, "global_step": 198698, "epoch": 4730} {"train_loss": -7.257197856903076, "global_step": 198699, "epoch": 4730} {"train_loss": -7.217519760131836, "global_step": 198700, "epoch": 4730} {"train_loss": -7.245477676391602, "global_step": 198701, "epoch": 4730, "val_loss": 69093.859375} {"train_loss": -7.197595596313477, "global_step": 198702, "epoch": 4731} {"train_loss": -7.133024215698242, "global_step": 198703, "epoch": 4731} {"train_loss": -7.212765693664551, "global_step": 198704, "epoch": 4731} {"train_loss": -7.173874855041504, "global_step": 198705, "epoch": 4731} {"train_loss": -7.177341461181641, "global_step": 198706, "epoch": 4731} {"train_loss": -7.2467498779296875, "global_step": 198707, "epoch": 4731} {"train_loss": -7.218095779418945, "global_step": 198708, "epoch": 4731} {"train_loss": -7.239477634429932, "global_step": 198709, "epoch": 4731} {"train_loss": -7.260285377502441, "global_step": 198710, "epoch": 4731} {"train_loss": -7.214045524597168, "global_step": 198711, "epoch": 4731} {"train_loss": -7.1717071533203125, "global_step": 198712, "epoch": 4731} {"train_loss": -7.243056297302246, "global_step": 198713, "epoch": 4731} {"train_loss": -7.223593711853027, "global_step": 198714, "epoch": 4731} {"train_loss": -7.172600746154785, "global_step": 198715, "epoch": 4731} {"train_loss": -7.269500732421875, "global_step": 198716, "epoch": 4731} {"train_loss": -7.2367401123046875, "global_step": 198717, "epoch": 4731} {"train_loss": -7.247035980224609, "global_step": 198718, "epoch": 4731} {"train_loss": -7.27200984954834, "global_step": 198719, "epoch": 4731} {"train_loss": -7.152536392211914, "global_step": 198720, "epoch": 4731} {"train_loss": -7.1492438316345215, "global_step": 198721, "epoch": 4731} {"train_loss": -7.20468282699585, "global_step": 198722, "epoch": 4731} {"train_loss": -7.284045219421387, "global_step": 198723, "epoch": 4731} {"train_loss": -7.195037841796875, "global_step": 198724, "epoch": 4731} {"train_loss": -7.275628089904785, "global_step": 198725, "epoch": 4731} {"train_loss": -7.264825820922852, "global_step": 198726, "epoch": 4731} {"train_loss": -7.201201915740967, "global_step": 198727, "epoch": 4731} {"train_loss": -7.286758899688721, "global_step": 198728, "epoch": 4731} {"train_loss": -7.193333625793457, "global_step": 198729, "epoch": 4731} {"train_loss": -7.327941417694092, "global_step": 198730, "epoch": 4731} {"train_loss": -7.252119064331055, "global_step": 198731, "epoch": 4731} {"train_loss": -7.122663497924805, "global_step": 198732, "epoch": 4731} {"train_loss": -7.160410404205322, "global_step": 198733, "epoch": 4731} {"train_loss": -7.242332935333252, "global_step": 198734, "epoch": 4731} {"train_loss": -7.239836692810059, "global_step": 198735, "epoch": 4731} {"train_loss": -7.216588973999023, "global_step": 198736, "epoch": 4731} {"train_loss": -7.102211952209473, "global_step": 198737, "epoch": 4731} {"train_loss": -7.217398643493652, "global_step": 198738, "epoch": 4731} {"train_loss": -7.187925338745117, "global_step": 198739, "epoch": 4731} {"train_loss": -7.234092712402344, "global_step": 198740, "epoch": 4731} {"train_loss": -7.129473686218262, "global_step": 198741, "epoch": 4731} {"train_loss": -7.188384056091309, "global_step": 198742, "epoch": 4731} {"train_loss": -7.212828692935762, "global_step": 198743, "epoch": 4731, "val_loss": 69141.1328125} {"train_loss": -7.243582725524902, "global_step": 198744, "epoch": 4732} {"train_loss": -7.184894561767578, "global_step": 198745, "epoch": 4732} {"train_loss": -7.318774700164795, "global_step": 198746, "epoch": 4732} {"train_loss": -7.233457565307617, "global_step": 198747, "epoch": 4732} {"train_loss": -7.156526565551758, "global_step": 198748, "epoch": 4732} {"train_loss": -7.240328311920166, "global_step": 198749, "epoch": 4732} {"train_loss": -7.010138034820557, "global_step": 198750, "epoch": 4732} {"train_loss": -7.173104286193848, "global_step": 198751, "epoch": 4732} {"train_loss": -7.243755340576172, "global_step": 198752, "epoch": 4732} {"train_loss": -7.116947174072266, "global_step": 198753, "epoch": 4732} {"train_loss": -7.258084774017334, "global_step": 198754, "epoch": 4732} {"train_loss": -7.229462623596191, "global_step": 198755, "epoch": 4732} {"train_loss": -7.2637763023376465, "global_step": 198756, "epoch": 4732} {"train_loss": -7.201286315917969, "global_step": 198757, "epoch": 4732} {"train_loss": -7.189976215362549, "global_step": 198758, "epoch": 4732} {"train_loss": -7.236788749694824, "global_step": 198759, "epoch": 4732} {"train_loss": -7.3222808837890625, "global_step": 198760, "epoch": 4732} {"train_loss": -7.174582481384277, "global_step": 198761, "epoch": 4732} {"train_loss": -7.1260504722595215, "global_step": 198762, "epoch": 4732} {"train_loss": -7.238436698913574, "global_step": 198763, "epoch": 4732} {"train_loss": -7.2941508293151855, "global_step": 198764, "epoch": 4732} {"train_loss": -7.11720085144043, "global_step": 198765, "epoch": 4732} {"train_loss": -7.179554462432861, "global_step": 198766, "epoch": 4732} {"train_loss": -7.08298397064209, "global_step": 198767, "epoch": 4732} {"train_loss": -7.093606948852539, "global_step": 198768, "epoch": 4732} {"train_loss": -7.127993583679199, "global_step": 198769, "epoch": 4732} {"train_loss": -7.089896202087402, "global_step": 198770, "epoch": 4732} {"train_loss": -7.212982654571533, "global_step": 198771, "epoch": 4732} {"train_loss": -7.201380729675293, "global_step": 198772, "epoch": 4732} {"train_loss": -7.054111003875732, "global_step": 198773, "epoch": 4732} {"train_loss": -7.31416130065918, "global_step": 198774, "epoch": 4732} {"train_loss": -6.964804172515869, "global_step": 198775, "epoch": 4732} {"train_loss": -7.109092712402344, "global_step": 198776, "epoch": 4732} {"train_loss": -7.3355393409729, "global_step": 198777, "epoch": 4732} {"train_loss": -6.924529075622559, "global_step": 198778, "epoch": 4732} {"train_loss": -7.1563191413879395, "global_step": 198779, "epoch": 4732} {"train_loss": -6.9927215576171875, "global_step": 198780, "epoch": 4732} {"train_loss": -7.050296783447266, "global_step": 198781, "epoch": 4732} {"train_loss": -7.223447322845459, "global_step": 198782, "epoch": 4732} {"train_loss": -7.039485931396484, "global_step": 198783, "epoch": 4732} {"train_loss": -7.170347690582275, "global_step": 198784, "epoch": 4732} {"train_loss": -7.166761818386259, "global_step": 198785, "epoch": 4732, "val_loss": 69241.34375} {"train_loss": -7.328454971313477, "global_step": 198786, "epoch": 4733} {"train_loss": -7.000640869140625, "global_step": 198787, "epoch": 4733} {"train_loss": -7.13547945022583, "global_step": 198788, "epoch": 4733} {"train_loss": -7.150830268859863, "global_step": 198789, "epoch": 4733} {"train_loss": -7.214543342590332, "global_step": 198790, "epoch": 4733} {"train_loss": -6.9682841300964355, "global_step": 198791, "epoch": 4733} {"train_loss": -7.183269500732422, "global_step": 198792, "epoch": 4733} {"train_loss": -7.0823564529418945, "global_step": 198793, "epoch": 4733} {"train_loss": -7.2665629386901855, "global_step": 198794, "epoch": 4733} {"train_loss": -7.094363212585449, "global_step": 198795, "epoch": 4733} {"train_loss": -7.155655860900879, "global_step": 198796, "epoch": 4733} {"train_loss": -7.160074234008789, "global_step": 198797, "epoch": 4733} {"train_loss": -7.2497429847717285, "global_step": 198798, "epoch": 4733} {"train_loss": -7.132713794708252, "global_step": 198799, "epoch": 4733} {"train_loss": -7.246863842010498, "global_step": 198800, "epoch": 4733} {"train_loss": -7.245617866516113, "global_step": 198801, "epoch": 4733} {"train_loss": -7.296618461608887, "global_step": 198802, "epoch": 4733} {"train_loss": -7.1282958984375, "global_step": 198803, "epoch": 4733} {"train_loss": -7.090017318725586, "global_step": 198804, "epoch": 4733} {"train_loss": -7.20056676864624, "global_step": 198805, "epoch": 4733} {"train_loss": -7.226058483123779, "global_step": 198806, "epoch": 4733} {"train_loss": -7.206079483032227, "global_step": 198807, "epoch": 4733} {"train_loss": -7.147547721862793, "global_step": 198808, "epoch": 4733} {"train_loss": -7.300464153289795, "global_step": 198809, "epoch": 4733} {"train_loss": -7.185961723327637, "global_step": 198810, "epoch": 4733} {"train_loss": -7.247410774230957, "global_step": 198811, "epoch": 4733} {"train_loss": -7.116591453552246, "global_step": 198812, "epoch": 4733} {"train_loss": -7.30031681060791, "global_step": 198813, "epoch": 4733} {"train_loss": -7.295094966888428, "global_step": 198814, "epoch": 4733} {"train_loss": -7.208164215087891, "global_step": 198815, "epoch": 4733} {"train_loss": -7.194629192352295, "global_step": 198816, "epoch": 4733} {"train_loss": -7.319969177246094, "global_step": 198817, "epoch": 4733} {"train_loss": -7.148083686828613, "global_step": 198818, "epoch": 4733} {"train_loss": -7.172072410583496, "global_step": 198819, "epoch": 4733} {"train_loss": -7.263608932495117, "global_step": 198820, "epoch": 4733} {"train_loss": -7.154918670654297, "global_step": 198821, "epoch": 4733} {"train_loss": -7.3010101318359375, "global_step": 198822, "epoch": 4733} {"train_loss": -7.215789794921875, "global_step": 198823, "epoch": 4733} {"train_loss": -7.173439979553223, "global_step": 198824, "epoch": 4733} {"train_loss": -7.138598442077637, "global_step": 198825, "epoch": 4733} {"train_loss": -7.040972709655762, "global_step": 198826, "epoch": 4733} {"train_loss": -7.184520982560658, "global_step": 198827, "epoch": 4733, "val_loss": 69230.0859375} {"train_loss": -7.056937217712402, "global_step": 198828, "epoch": 4734} {"train_loss": -7.138574600219727, "global_step": 198829, "epoch": 4734} {"train_loss": -7.213801383972168, "global_step": 198830, "epoch": 4734} {"train_loss": -7.170622825622559, "global_step": 198831, "epoch": 4734} {"train_loss": -7.245386123657227, "global_step": 198832, "epoch": 4734} {"train_loss": -7.243233680725098, "global_step": 198833, "epoch": 4734} {"train_loss": -7.126216888427734, "global_step": 198834, "epoch": 4734} {"train_loss": -7.2084479331970215, "global_step": 198835, "epoch": 4734} {"train_loss": -7.237683296203613, "global_step": 198836, "epoch": 4734} {"train_loss": -7.340538024902344, "global_step": 198837, "epoch": 4734} {"train_loss": -7.184292793273926, "global_step": 198838, "epoch": 4734} {"train_loss": -7.220443248748779, "global_step": 198839, "epoch": 4734} {"train_loss": -7.200439453125, "global_step": 198840, "epoch": 4734} {"train_loss": -7.1633195877075195, "global_step": 198841, "epoch": 4734} {"train_loss": -7.215867042541504, "global_step": 198842, "epoch": 4734} {"train_loss": -7.155254364013672, "global_step": 198843, "epoch": 4734} {"train_loss": -7.158063888549805, "global_step": 198844, "epoch": 4734} {"train_loss": -7.135663986206055, "global_step": 198845, "epoch": 4734} {"train_loss": -7.188498020172119, "global_step": 198846, "epoch": 4734} {"train_loss": -7.132460594177246, "global_step": 198847, "epoch": 4734} {"train_loss": -7.241605758666992, "global_step": 198848, "epoch": 4734} {"train_loss": -7.046637535095215, "global_step": 198849, "epoch": 4734} {"train_loss": -7.234014511108398, "global_step": 198850, "epoch": 4734} {"train_loss": -7.173962593078613, "global_step": 198851, "epoch": 4734} {"train_loss": -7.1294450759887695, "global_step": 198852, "epoch": 4734} {"train_loss": -7.206552982330322, "global_step": 198853, "epoch": 4734} {"train_loss": -7.0297346115112305, "global_step": 198854, "epoch": 4734} {"train_loss": -7.13455867767334, "global_step": 198855, "epoch": 4734} {"train_loss": -7.18088436126709, "global_step": 198856, "epoch": 4734} {"train_loss": -7.197061061859131, "global_step": 198857, "epoch": 4734} {"train_loss": -7.16097354888916, "global_step": 198858, "epoch": 4734} {"train_loss": -7.204866886138916, "global_step": 198859, "epoch": 4734} {"train_loss": -7.298559188842773, "global_step": 198860, "epoch": 4734} {"train_loss": -7.257830619812012, "global_step": 198861, "epoch": 4734} {"train_loss": -7.221601486206055, "global_step": 198862, "epoch": 4734} {"train_loss": -7.30408239364624, "global_step": 198863, "epoch": 4734} {"train_loss": -7.272524833679199, "global_step": 198864, "epoch": 4734} {"train_loss": -7.27332067489624, "global_step": 198865, "epoch": 4734} {"train_loss": -7.27874755859375, "global_step": 198866, "epoch": 4734} {"train_loss": -7.209906578063965, "global_step": 198867, "epoch": 4734} {"train_loss": -7.289762496948242, "global_step": 198868, "epoch": 4734} {"train_loss": -7.199107317697434, "global_step": 198869, "epoch": 4734, "val_loss": 69015.671875} {"train_loss": -7.391664981842041, "global_step": 198870, "epoch": 4735} {"train_loss": -7.308906555175781, "global_step": 198871, "epoch": 4735} {"train_loss": -7.261895656585693, "global_step": 198872, "epoch": 4735} {"train_loss": -7.242184638977051, "global_step": 198873, "epoch": 4735} {"train_loss": -7.273689270019531, "global_step": 198874, "epoch": 4735} {"train_loss": -7.197040557861328, "global_step": 198875, "epoch": 4735} {"train_loss": -7.263311386108398, "global_step": 198876, "epoch": 4735} {"train_loss": -7.2250871658325195, "global_step": 198877, "epoch": 4735} {"train_loss": -7.253445625305176, "global_step": 198878, "epoch": 4735} {"train_loss": -7.217658519744873, "global_step": 198879, "epoch": 4735} {"train_loss": -7.1961565017700195, "global_step": 198880, "epoch": 4735} {"train_loss": -7.177472114562988, "global_step": 198881, "epoch": 4735} {"train_loss": -7.1591901779174805, "global_step": 198882, "epoch": 4735} {"train_loss": -7.165816307067871, "global_step": 198883, "epoch": 4735} {"train_loss": -7.219356536865234, "global_step": 198884, "epoch": 4735} {"train_loss": -7.148484230041504, "global_step": 198885, "epoch": 4735} {"train_loss": -7.22900390625, "global_step": 198886, "epoch": 4735} {"train_loss": -7.187911033630371, "global_step": 198887, "epoch": 4735} {"train_loss": -7.305741786956787, "global_step": 198888, "epoch": 4735} {"train_loss": -7.25441837310791, "global_step": 198889, "epoch": 4735} {"train_loss": -7.163338661193848, "global_step": 198890, "epoch": 4735} {"train_loss": -7.050607681274414, "global_step": 198891, "epoch": 4735} {"train_loss": -7.234973907470703, "global_step": 198892, "epoch": 4735} {"train_loss": -7.27260684967041, "global_step": 198893, "epoch": 4735} {"train_loss": -7.256738185882568, "global_step": 198894, "epoch": 4735} {"train_loss": -7.2545881271362305, "global_step": 198895, "epoch": 4735} {"train_loss": -7.166035175323486, "global_step": 198896, "epoch": 4735} {"train_loss": -7.196201801300049, "global_step": 198897, "epoch": 4735} {"train_loss": -7.140397548675537, "global_step": 198898, "epoch": 4735} {"train_loss": -7.125175476074219, "global_step": 198899, "epoch": 4735} {"train_loss": -7.131768226623535, "global_step": 198900, "epoch": 4735} {"train_loss": -7.288812160491943, "global_step": 198901, "epoch": 4735} {"train_loss": -7.2368059158325195, "global_step": 198902, "epoch": 4735} {"train_loss": -7.09934139251709, "global_step": 198903, "epoch": 4735} {"train_loss": -7.175356864929199, "global_step": 198904, "epoch": 4735} {"train_loss": -7.228567600250244, "global_step": 198905, "epoch": 4735} {"train_loss": -7.158323287963867, "global_step": 198906, "epoch": 4735} {"train_loss": -7.30875301361084, "global_step": 198907, "epoch": 4735} {"train_loss": -7.143973350524902, "global_step": 198908, "epoch": 4735} {"train_loss": -7.12923002243042, "global_step": 198909, "epoch": 4735} {"train_loss": -7.3207197189331055, "global_step": 198910, "epoch": 4735} {"train_loss": -7.215712172644479, "global_step": 198911, "epoch": 4735, "val_loss": 69011.921875} {"train_loss": -7.229534149169922, "global_step": 198912, "epoch": 4736} {"train_loss": -7.090242862701416, "global_step": 198913, "epoch": 4736} {"train_loss": -7.338669300079346, "global_step": 198914, "epoch": 4736} {"train_loss": -7.11167573928833, "global_step": 198915, "epoch": 4736} {"train_loss": -7.206005096435547, "global_step": 198916, "epoch": 4736} {"train_loss": -7.259500026702881, "global_step": 198917, "epoch": 4736} {"train_loss": -7.194421291351318, "global_step": 198918, "epoch": 4736} {"train_loss": -7.139577865600586, "global_step": 198919, "epoch": 4736} {"train_loss": -7.240800380706787, "global_step": 198920, "epoch": 4736} {"train_loss": -7.244938850402832, "global_step": 198921, "epoch": 4736} {"train_loss": -7.088958263397217, "global_step": 198922, "epoch": 4736} {"train_loss": -7.216487884521484, "global_step": 198923, "epoch": 4736} {"train_loss": -7.229873180389404, "global_step": 198924, "epoch": 4736} {"train_loss": -6.993202209472656, "global_step": 198925, "epoch": 4736} {"train_loss": -7.226736068725586, "global_step": 198926, "epoch": 4736} {"train_loss": -7.184775352478027, "global_step": 198927, "epoch": 4736} {"train_loss": -7.2516632080078125, "global_step": 198928, "epoch": 4736} {"train_loss": -7.099654197692871, "global_step": 198929, "epoch": 4736} {"train_loss": -7.0199689865112305, "global_step": 198930, "epoch": 4736} {"train_loss": -7.192797660827637, "global_step": 198931, "epoch": 4736} {"train_loss": -7.164618015289307, "global_step": 198932, "epoch": 4736} {"train_loss": -6.967947959899902, "global_step": 198933, "epoch": 4736} {"train_loss": -6.995371341705322, "global_step": 198934, "epoch": 4736} {"train_loss": -7.066167831420898, "global_step": 198935, "epoch": 4736} {"train_loss": -7.087405204772949, "global_step": 198936, "epoch": 4736} {"train_loss": -7.105871200561523, "global_step": 198937, "epoch": 4736} {"train_loss": -7.16375732421875, "global_step": 198938, "epoch": 4736} {"train_loss": -6.914063453674316, "global_step": 198939, "epoch": 4736} {"train_loss": -7.239830017089844, "global_step": 198940, "epoch": 4736} {"train_loss": -6.984889030456543, "global_step": 198941, "epoch": 4736} {"train_loss": -7.0918989181518555, "global_step": 198942, "epoch": 4736} {"train_loss": -7.145818710327148, "global_step": 198943, "epoch": 4736} {"train_loss": -7.094043731689453, "global_step": 198944, "epoch": 4736} {"train_loss": -7.195474624633789, "global_step": 198945, "epoch": 4736} {"train_loss": -7.125561714172363, "global_step": 198946, "epoch": 4736} {"train_loss": -7.051138877868652, "global_step": 198947, "epoch": 4736} {"train_loss": -7.1495361328125, "global_step": 198948, "epoch": 4736} {"train_loss": -7.22816276550293, "global_step": 198949, "epoch": 4736} {"train_loss": -7.172327041625977, "global_step": 198950, "epoch": 4736} {"train_loss": -7.032050132751465, "global_step": 198951, "epoch": 4736} {"train_loss": -7.184168815612793, "global_step": 198952, "epoch": 4736} {"train_loss": -7.139002198264713, "global_step": 198953, "epoch": 4736, "val_loss": 68936.1953125} {"train_loss": -7.281643867492676, "global_step": 198954, "epoch": 4737} {"train_loss": -7.267813682556152, "global_step": 198955, "epoch": 4737} {"train_loss": -7.2170538902282715, "global_step": 198956, "epoch": 4737} {"train_loss": -7.155923366546631, "global_step": 198957, "epoch": 4737} {"train_loss": -7.22785758972168, "global_step": 198958, "epoch": 4737} {"train_loss": -7.171225547790527, "global_step": 198959, "epoch": 4737} {"train_loss": -7.268321990966797, "global_step": 198960, "epoch": 4737} {"train_loss": -7.263096809387207, "global_step": 198961, "epoch": 4737} {"train_loss": -7.196709632873535, "global_step": 198962, "epoch": 4737} {"train_loss": -7.291373252868652, "global_step": 198963, "epoch": 4737} {"train_loss": -7.291226863861084, "global_step": 198964, "epoch": 4737} {"train_loss": -7.2691426277160645, "global_step": 198965, "epoch": 4737} {"train_loss": -7.270070552825928, "global_step": 198966, "epoch": 4737} {"train_loss": -7.201372146606445, "global_step": 198967, "epoch": 4737} {"train_loss": -7.121201515197754, "global_step": 198968, "epoch": 4737} {"train_loss": -7.207149505615234, "global_step": 198969, "epoch": 4737} {"train_loss": -7.253006935119629, "global_step": 198970, "epoch": 4737} {"train_loss": -7.202280521392822, "global_step": 198971, "epoch": 4737} {"train_loss": -7.311767578125, "global_step": 198972, "epoch": 4737} {"train_loss": -7.224974632263184, "global_step": 198973, "epoch": 4737} {"train_loss": -7.333601951599121, "global_step": 198974, "epoch": 4737} {"train_loss": -7.277368545532227, "global_step": 198975, "epoch": 4737} {"train_loss": -7.263692855834961, "global_step": 198976, "epoch": 4737} {"train_loss": -7.255200386047363, "global_step": 198977, "epoch": 4737} {"train_loss": -7.167898178100586, "global_step": 198978, "epoch": 4737} {"train_loss": -7.327600479125977, "global_step": 198979, "epoch": 4737} {"train_loss": -7.222563743591309, "global_step": 198980, "epoch": 4737} {"train_loss": -7.225001811981201, "global_step": 198981, "epoch": 4737} {"train_loss": -7.251317977905273, "global_step": 198982, "epoch": 4737} {"train_loss": -7.30534553527832, "global_step": 198983, "epoch": 4737} {"train_loss": -7.22177791595459, "global_step": 198984, "epoch": 4737} {"train_loss": -7.225420951843262, "global_step": 198985, "epoch": 4737} {"train_loss": -7.240619659423828, "global_step": 198986, "epoch": 4737} {"train_loss": -7.222328186035156, "global_step": 198987, "epoch": 4737} {"train_loss": -7.238366603851318, "global_step": 198988, "epoch": 4737} {"train_loss": -7.126029014587402, "global_step": 198989, "epoch": 4737} {"train_loss": -7.309543609619141, "global_step": 198990, "epoch": 4737} {"train_loss": -7.220484733581543, "global_step": 198991, "epoch": 4737} {"train_loss": -7.249221324920654, "global_step": 198992, "epoch": 4737} {"train_loss": -7.306907653808594, "global_step": 198993, "epoch": 4737} {"train_loss": -7.178875923156738, "global_step": 198994, "epoch": 4737} {"train_loss": -7.240214813323248, "global_step": 198995, "epoch": 4737, "val_loss": 68867.9921875} {"train_loss": -7.177449703216553, "global_step": 198996, "epoch": 4738} {"train_loss": -7.117972373962402, "global_step": 198997, "epoch": 4738} {"train_loss": -7.160110950469971, "global_step": 198998, "epoch": 4738} {"train_loss": -7.321113586425781, "global_step": 198999, "epoch": 4738} {"train_loss": -7.27113151550293, "global_step": 199000, "epoch": 4738} {"train_loss": -7.222026824951172, "global_step": 199001, "epoch": 4738} {"train_loss": -7.224793910980225, "global_step": 199002, "epoch": 4738} {"train_loss": -7.273158073425293, "global_step": 199003, "epoch": 4738} {"train_loss": -7.229959964752197, "global_step": 199004, "epoch": 4738} {"train_loss": -7.339407920837402, "global_step": 199005, "epoch": 4738} {"train_loss": -7.235983848571777, "global_step": 199006, "epoch": 4738} {"train_loss": -7.266168594360352, "global_step": 199007, "epoch": 4738} {"train_loss": -7.303277015686035, "global_step": 199008, "epoch": 4738} {"train_loss": -7.310670852661133, "global_step": 199009, "epoch": 4738} {"train_loss": -7.30884313583374, "global_step": 199010, "epoch": 4738} {"train_loss": -7.279200553894043, "global_step": 199011, "epoch": 4738} {"train_loss": -7.317915916442871, "global_step": 199012, "epoch": 4738} {"train_loss": -7.287489891052246, "global_step": 199013, "epoch": 4738} {"train_loss": -7.335293769836426, "global_step": 199014, "epoch": 4738} {"train_loss": -7.286470413208008, "global_step": 199015, "epoch": 4738} {"train_loss": -7.312878608703613, "global_step": 199016, "epoch": 4738} {"train_loss": -7.309557914733887, "global_step": 199017, "epoch": 4738} {"train_loss": -7.29311466217041, "global_step": 199018, "epoch": 4738} {"train_loss": -7.230093002319336, "global_step": 199019, "epoch": 4738} {"train_loss": -7.200096130371094, "global_step": 199020, "epoch": 4738} {"train_loss": -7.204311370849609, "global_step": 199021, "epoch": 4738} {"train_loss": -7.22509765625, "global_step": 199022, "epoch": 4738} {"train_loss": -7.018739700317383, "global_step": 199023, "epoch": 4738} {"train_loss": -7.321163654327393, "global_step": 199024, "epoch": 4738} {"train_loss": -7.318090915679932, "global_step": 199025, "epoch": 4738} {"train_loss": -7.234972953796387, "global_step": 199026, "epoch": 4738} {"train_loss": -7.1598124504089355, "global_step": 199027, "epoch": 4738} {"train_loss": -7.304103851318359, "global_step": 199028, "epoch": 4738} {"train_loss": -7.277796745300293, "global_step": 199029, "epoch": 4738} {"train_loss": -7.163806915283203, "global_step": 199030, "epoch": 4738} {"train_loss": -7.189022064208984, "global_step": 199031, "epoch": 4738} {"train_loss": -7.215063571929932, "global_step": 199032, "epoch": 4738} {"train_loss": -7.234070777893066, "global_step": 199033, "epoch": 4738} {"train_loss": -7.289941787719727, "global_step": 199034, "epoch": 4738} {"train_loss": -7.287783145904541, "global_step": 199035, "epoch": 4738} {"train_loss": -7.101550579071045, "global_step": 199036, "epoch": 4738} {"train_loss": -7.246156953629994, "global_step": 199037, "epoch": 4738, "val_loss": 69320.8359375} {"train_loss": -7.198854446411133, "global_step": 199038, "epoch": 4739} {"train_loss": -7.0419921875, "global_step": 199039, "epoch": 4739} {"train_loss": -7.146717071533203, "global_step": 199040, "epoch": 4739} {"train_loss": -7.282131195068359, "global_step": 199041, "epoch": 4739} {"train_loss": -6.931547164916992, "global_step": 199042, "epoch": 4739} {"train_loss": -7.12769889831543, "global_step": 199043, "epoch": 4739} {"train_loss": -7.11824893951416, "global_step": 199044, "epoch": 4739} {"train_loss": -6.969974040985107, "global_step": 199045, "epoch": 4739} {"train_loss": -7.091880798339844, "global_step": 199046, "epoch": 4739} {"train_loss": -7.069855690002441, "global_step": 199047, "epoch": 4739} {"train_loss": -7.124382972717285, "global_step": 199048, "epoch": 4739} {"train_loss": -7.266944885253906, "global_step": 199049, "epoch": 4739} {"train_loss": -7.135507583618164, "global_step": 199050, "epoch": 4739} {"train_loss": -7.254115104675293, "global_step": 199051, "epoch": 4739} {"train_loss": -7.076222896575928, "global_step": 199052, "epoch": 4739} {"train_loss": -7.293298721313477, "global_step": 199053, "epoch": 4739} {"train_loss": -7.167754173278809, "global_step": 199054, "epoch": 4739} {"train_loss": -7.175014019012451, "global_step": 199055, "epoch": 4739} {"train_loss": -7.1939496994018555, "global_step": 199056, "epoch": 4739} {"train_loss": -7.119448661804199, "global_step": 199057, "epoch": 4739} {"train_loss": -7.182145118713379, "global_step": 199058, "epoch": 4739} {"train_loss": -7.2296857833862305, "global_step": 199059, "epoch": 4739} {"train_loss": -7.264345169067383, "global_step": 199060, "epoch": 4739} {"train_loss": -7.229355812072754, "global_step": 199061, "epoch": 4739} {"train_loss": -7.197134971618652, "global_step": 199062, "epoch": 4739} {"train_loss": -7.13185977935791, "global_step": 199063, "epoch": 4739} {"train_loss": -7.111936569213867, "global_step": 199064, "epoch": 4739} {"train_loss": -7.3093085289001465, "global_step": 199065, "epoch": 4739} {"train_loss": -7.2006611824035645, "global_step": 199066, "epoch": 4739} {"train_loss": -7.267367362976074, "global_step": 199067, "epoch": 4739} {"train_loss": -7.354824066162109, "global_step": 199068, "epoch": 4739} {"train_loss": -7.113142013549805, "global_step": 199069, "epoch": 4739} {"train_loss": -7.280492782592773, "global_step": 199070, "epoch": 4739} {"train_loss": -7.220776557922363, "global_step": 199071, "epoch": 4739} {"train_loss": -7.216484069824219, "global_step": 199072, "epoch": 4739} {"train_loss": -7.21422004699707, "global_step": 199073, "epoch": 4739} {"train_loss": -7.228933811187744, "global_step": 199074, "epoch": 4739} {"train_loss": -7.1451416015625, "global_step": 199075, "epoch": 4739} {"train_loss": -7.255006313323975, "global_step": 199076, "epoch": 4739} {"train_loss": -7.2168684005737305, "global_step": 199077, "epoch": 4739} {"train_loss": -7.2303266525268555, "global_step": 199078, "epoch": 4739} {"train_loss": -7.180052848089309, "global_step": 199079, "epoch": 4739, "val_loss": 69190.890625} {"train_loss": -7.214566230773926, "global_step": 199080, "epoch": 4740} {"train_loss": -7.093493461608887, "global_step": 199081, "epoch": 4740} {"train_loss": -7.206878662109375, "global_step": 199082, "epoch": 4740} {"train_loss": -7.201528549194336, "global_step": 199083, "epoch": 4740} {"train_loss": -7.212787628173828, "global_step": 199084, "epoch": 4740} {"train_loss": -7.313841342926025, "global_step": 199085, "epoch": 4740} {"train_loss": -7.194476127624512, "global_step": 199086, "epoch": 4740} {"train_loss": -7.188102722167969, "global_step": 199087, "epoch": 4740} {"train_loss": -7.23877477645874, "global_step": 199088, "epoch": 4740} {"train_loss": -7.212560653686523, "global_step": 199089, "epoch": 4740} {"train_loss": -7.232430458068848, "global_step": 199090, "epoch": 4740} {"train_loss": -7.117649555206299, "global_step": 199091, "epoch": 4740} {"train_loss": -7.191051483154297, "global_step": 199092, "epoch": 4740} {"train_loss": -7.110980033874512, "global_step": 199093, "epoch": 4740} {"train_loss": -7.111776351928711, "global_step": 199094, "epoch": 4740} {"train_loss": -7.066514015197754, "global_step": 199095, "epoch": 4740} {"train_loss": -7.258033275604248, "global_step": 199096, "epoch": 4740} {"train_loss": -7.066056251525879, "global_step": 199097, "epoch": 4740} {"train_loss": -7.1516923904418945, "global_step": 199098, "epoch": 4740} {"train_loss": -6.985053062438965, "global_step": 199099, "epoch": 4740} {"train_loss": -7.065332889556885, "global_step": 199100, "epoch": 4740} {"train_loss": -7.238946914672852, "global_step": 199101, "epoch": 4740} {"train_loss": -7.092480659484863, "global_step": 199102, "epoch": 4740} {"train_loss": -7.096397399902344, "global_step": 199103, "epoch": 4740} {"train_loss": -7.157391548156738, "global_step": 199104, "epoch": 4740} {"train_loss": -7.148509979248047, "global_step": 199105, "epoch": 4740} {"train_loss": -7.111151695251465, "global_step": 199106, "epoch": 4740} {"train_loss": -7.110956192016602, "global_step": 199107, "epoch": 4740} {"train_loss": -7.085773944854736, "global_step": 199108, "epoch": 4740} {"train_loss": -7.191160202026367, "global_step": 199109, "epoch": 4740} {"train_loss": -7.088992595672607, "global_step": 199110, "epoch": 4740} {"train_loss": -7.061013698577881, "global_step": 199111, "epoch": 4740} {"train_loss": -7.248132228851318, "global_step": 199112, "epoch": 4740} {"train_loss": -7.08980131149292, "global_step": 199113, "epoch": 4740} {"train_loss": -7.231337547302246, "global_step": 199114, "epoch": 4740} {"train_loss": -7.183492660522461, "global_step": 199115, "epoch": 4740} {"train_loss": -7.171735763549805, "global_step": 199116, "epoch": 4740} {"train_loss": -7.1615705490112305, "global_step": 199117, "epoch": 4740} {"train_loss": -7.12099552154541, "global_step": 199118, "epoch": 4740} {"train_loss": -7.081286907196045, "global_step": 199119, "epoch": 4740} {"train_loss": -7.186840057373047, "global_step": 199120, "epoch": 4740} {"train_loss": -7.152413901828584, "global_step": 199121, "epoch": 4740, "val_loss": 69206.53125} {"train_loss": -7.215564727783203, "global_step": 199122, "epoch": 4741} {"train_loss": -7.22329044342041, "global_step": 199123, "epoch": 4741} {"train_loss": -7.184554100036621, "global_step": 199124, "epoch": 4741} {"train_loss": -7.215826988220215, "global_step": 199125, "epoch": 4741} {"train_loss": -7.165508270263672, "global_step": 199126, "epoch": 4741} {"train_loss": -7.231780052185059, "global_step": 199127, "epoch": 4741} {"train_loss": -7.192387580871582, "global_step": 199128, "epoch": 4741} {"train_loss": -7.24422550201416, "global_step": 199129, "epoch": 4741} {"train_loss": -7.220463752746582, "global_step": 199130, "epoch": 4741} {"train_loss": -7.285696983337402, "global_step": 199131, "epoch": 4741} {"train_loss": -7.271684646606445, "global_step": 199132, "epoch": 4741} {"train_loss": -7.17562198638916, "global_step": 199133, "epoch": 4741} {"train_loss": -7.258084774017334, "global_step": 199134, "epoch": 4741} {"train_loss": -7.108811855316162, "global_step": 199135, "epoch": 4741} {"train_loss": -7.200715065002441, "global_step": 199136, "epoch": 4741} {"train_loss": -7.243030071258545, "global_step": 199137, "epoch": 4741} {"train_loss": -7.037234783172607, "global_step": 199138, "epoch": 4741} {"train_loss": -7.222718238830566, "global_step": 199139, "epoch": 4741} {"train_loss": -7.230243682861328, "global_step": 199140, "epoch": 4741} {"train_loss": -7.238213539123535, "global_step": 199141, "epoch": 4741} {"train_loss": -7.1205010414123535, "global_step": 199142, "epoch": 4741} {"train_loss": -7.228796005249023, "global_step": 199143, "epoch": 4741} {"train_loss": -7.179533958435059, "global_step": 199144, "epoch": 4741} {"train_loss": -7.259334564208984, "global_step": 199145, "epoch": 4741} {"train_loss": -7.1893696784973145, "global_step": 199146, "epoch": 4741} {"train_loss": -7.225803375244141, "global_step": 199147, "epoch": 4741} {"train_loss": -7.22625732421875, "global_step": 199148, "epoch": 4741} {"train_loss": -7.288572788238525, "global_step": 199149, "epoch": 4741} {"train_loss": -7.25067138671875, "global_step": 199150, "epoch": 4741} {"train_loss": -7.279714584350586, "global_step": 199151, "epoch": 4741} {"train_loss": -7.2200775146484375, "global_step": 199152, "epoch": 4741} {"train_loss": -7.1436285972595215, "global_step": 199153, "epoch": 4741} {"train_loss": -7.224184036254883, "global_step": 199154, "epoch": 4741} {"train_loss": -7.11302375793457, "global_step": 199155, "epoch": 4741} {"train_loss": -7.158750534057617, "global_step": 199156, "epoch": 4741} {"train_loss": -7.166180610656738, "global_step": 199157, "epoch": 4741} {"train_loss": -7.282196044921875, "global_step": 199158, "epoch": 4741} {"train_loss": -7.106632232666016, "global_step": 199159, "epoch": 4741} {"train_loss": -7.240458965301514, "global_step": 199160, "epoch": 4741} {"train_loss": -7.185993194580078, "global_step": 199161, "epoch": 4741} {"train_loss": -7.1100263595581055, "global_step": 199162, "epoch": 4741} {"train_loss": -7.203805219559443, "global_step": 199163, "epoch": 4741, "val_loss": 69027.7109375} {"train_loss": -7.345824241638184, "global_step": 199164, "epoch": 4742} {"train_loss": -7.206218719482422, "global_step": 199165, "epoch": 4742} {"train_loss": -7.165018081665039, "global_step": 199166, "epoch": 4742} {"train_loss": -7.185181617736816, "global_step": 199167, "epoch": 4742} {"train_loss": -7.2500691413879395, "global_step": 199168, "epoch": 4742} {"train_loss": -7.154722690582275, "global_step": 199169, "epoch": 4742} {"train_loss": -7.150758743286133, "global_step": 199170, "epoch": 4742} {"train_loss": -7.209277153015137, "global_step": 199171, "epoch": 4742} {"train_loss": -7.145787239074707, "global_step": 199172, "epoch": 4742} {"train_loss": -7.080550670623779, "global_step": 199173, "epoch": 4742} {"train_loss": -7.155007362365723, "global_step": 199174, "epoch": 4742} {"train_loss": -7.2063398361206055, "global_step": 199175, "epoch": 4742} {"train_loss": -7.243084907531738, "global_step": 199176, "epoch": 4742} {"train_loss": -7.228795528411865, "global_step": 199177, "epoch": 4742} {"train_loss": -7.2160749435424805, "global_step": 199178, "epoch": 4742} {"train_loss": -7.220808506011963, "global_step": 199179, "epoch": 4742} {"train_loss": -7.237759113311768, "global_step": 199180, "epoch": 4742} {"train_loss": -7.1788787841796875, "global_step": 199181, "epoch": 4742} {"train_loss": -7.2057976722717285, "global_step": 199182, "epoch": 4742} {"train_loss": -7.227125644683838, "global_step": 199183, "epoch": 4742} {"train_loss": -7.188579559326172, "global_step": 199184, "epoch": 4742} {"train_loss": -7.18658971786499, "global_step": 199185, "epoch": 4742} {"train_loss": -7.132083892822266, "global_step": 199186, "epoch": 4742} {"train_loss": -7.1316680908203125, "global_step": 199187, "epoch": 4742} {"train_loss": -7.172003746032715, "global_step": 199188, "epoch": 4742} {"train_loss": -7.152318477630615, "global_step": 199189, "epoch": 4742} {"train_loss": -7.186625957489014, "global_step": 199190, "epoch": 4742} {"train_loss": -7.124443054199219, "global_step": 199191, "epoch": 4742} {"train_loss": -7.245777130126953, "global_step": 199192, "epoch": 4742} {"train_loss": -7.202666282653809, "global_step": 199193, "epoch": 4742} {"train_loss": -7.166077613830566, "global_step": 199194, "epoch": 4742} {"train_loss": -7.20145845413208, "global_step": 199195, "epoch": 4742} {"train_loss": -7.127804756164551, "global_step": 199196, "epoch": 4742} {"train_loss": -7.218225479125977, "global_step": 199197, "epoch": 4742} {"train_loss": -7.314681529998779, "global_step": 199198, "epoch": 4742} {"train_loss": -7.1693525314331055, "global_step": 199199, "epoch": 4742} {"train_loss": -7.159544467926025, "global_step": 199200, "epoch": 4742} {"train_loss": -7.007672309875488, "global_step": 199201, "epoch": 4742} {"train_loss": -7.159781455993652, "global_step": 199202, "epoch": 4742} {"train_loss": -7.17775821685791, "global_step": 199203, "epoch": 4742} {"train_loss": -7.131434440612793, "global_step": 199204, "epoch": 4742} {"train_loss": -7.183888866787865, "global_step": 199205, "epoch": 4742, "val_loss": 69042.6640625} {"train_loss": -7.219437599182129, "global_step": 199206, "epoch": 4743} {"train_loss": -7.143789291381836, "global_step": 199207, "epoch": 4743} {"train_loss": -7.3222575187683105, "global_step": 199208, "epoch": 4743} {"train_loss": -7.221656799316406, "global_step": 199209, "epoch": 4743} {"train_loss": -7.209193706512451, "global_step": 199210, "epoch": 4743} {"train_loss": -7.211235046386719, "global_step": 199211, "epoch": 4743} {"train_loss": -7.134345531463623, "global_step": 199212, "epoch": 4743} {"train_loss": -7.204195022583008, "global_step": 199213, "epoch": 4743} {"train_loss": -7.188068389892578, "global_step": 199214, "epoch": 4743} {"train_loss": -7.211116790771484, "global_step": 199215, "epoch": 4743} {"train_loss": -7.227236270904541, "global_step": 199216, "epoch": 4743} {"train_loss": -7.186227798461914, "global_step": 199217, "epoch": 4743} {"train_loss": -7.132556915283203, "global_step": 199218, "epoch": 4743} {"train_loss": -7.273853302001953, "global_step": 199219, "epoch": 4743} {"train_loss": -7.240289688110352, "global_step": 199220, "epoch": 4743} {"train_loss": -7.140625476837158, "global_step": 199221, "epoch": 4743} {"train_loss": -7.2068328857421875, "global_step": 199222, "epoch": 4743} {"train_loss": -7.178219795227051, "global_step": 199223, "epoch": 4743} {"train_loss": -7.149259090423584, "global_step": 199224, "epoch": 4743} {"train_loss": -7.171369552612305, "global_step": 199225, "epoch": 4743} {"train_loss": -7.148102760314941, "global_step": 199226, "epoch": 4743} {"train_loss": -7.130012512207031, "global_step": 199227, "epoch": 4743} {"train_loss": -6.993763446807861, "global_step": 199228, "epoch": 4743} {"train_loss": -7.063161373138428, "global_step": 199229, "epoch": 4743} {"train_loss": -7.177608489990234, "global_step": 199230, "epoch": 4743} {"train_loss": -7.133766174316406, "global_step": 199231, "epoch": 4743} {"train_loss": -7.138387680053711, "global_step": 199232, "epoch": 4743} {"train_loss": -6.973470687866211, "global_step": 199233, "epoch": 4743} {"train_loss": -7.0739898681640625, "global_step": 199234, "epoch": 4743} {"train_loss": -7.048994064331055, "global_step": 199235, "epoch": 4743} {"train_loss": -7.197098731994629, "global_step": 199236, "epoch": 4743} {"train_loss": -7.228751182556152, "global_step": 199237, "epoch": 4743} {"train_loss": -7.12969446182251, "global_step": 199238, "epoch": 4743} {"train_loss": -7.208800315856934, "global_step": 199239, "epoch": 4743} {"train_loss": -7.191586494445801, "global_step": 199240, "epoch": 4743} {"train_loss": -7.186331748962402, "global_step": 199241, "epoch": 4743} {"train_loss": -7.209765434265137, "global_step": 199242, "epoch": 4743} {"train_loss": -7.10907506942749, "global_step": 199243, "epoch": 4743} {"train_loss": -7.172846794128418, "global_step": 199244, "epoch": 4743} {"train_loss": -7.207925319671631, "global_step": 199245, "epoch": 4743} {"train_loss": -7.168869972229004, "global_step": 199246, "epoch": 4743} {"train_loss": -7.167270240329561, "global_step": 199247, "epoch": 4743, "val_loss": 68972.234375} {"train_loss": -7.2568840980529785, "global_step": 199248, "epoch": 4744} {"train_loss": -7.145358085632324, "global_step": 199249, "epoch": 4744} {"train_loss": -7.242293357849121, "global_step": 199250, "epoch": 4744} {"train_loss": -7.173534393310547, "global_step": 199251, "epoch": 4744} {"train_loss": -7.215697288513184, "global_step": 199252, "epoch": 4744} {"train_loss": -7.229153633117676, "global_step": 199253, "epoch": 4744} {"train_loss": -7.436696529388428, "global_step": 199254, "epoch": 4744} {"train_loss": -7.282697677612305, "global_step": 199255, "epoch": 4744} {"train_loss": -7.319077014923096, "global_step": 199256, "epoch": 4744} {"train_loss": -7.178680419921875, "global_step": 199257, "epoch": 4744} {"train_loss": -7.18142032623291, "global_step": 199258, "epoch": 4744} {"train_loss": -7.226057052612305, "global_step": 199259, "epoch": 4744} {"train_loss": -7.249465465545654, "global_step": 199260, "epoch": 4744} {"train_loss": -7.217331886291504, "global_step": 199261, "epoch": 4744} {"train_loss": -7.161252975463867, "global_step": 199262, "epoch": 4744} {"train_loss": -7.374788284301758, "global_step": 199263, "epoch": 4744} {"train_loss": -7.079099655151367, "global_step": 199264, "epoch": 4744} {"train_loss": -7.319923400878906, "global_step": 199265, "epoch": 4744} {"train_loss": -7.1795830726623535, "global_step": 199266, "epoch": 4744} {"train_loss": -7.139843940734863, "global_step": 199267, "epoch": 4744} {"train_loss": -7.266671657562256, "global_step": 199268, "epoch": 4744} {"train_loss": -7.2512407302856445, "global_step": 199269, "epoch": 4744} {"train_loss": -7.229921340942383, "global_step": 199270, "epoch": 4744} {"train_loss": -7.243958473205566, "global_step": 199271, "epoch": 4744} {"train_loss": -7.207303047180176, "global_step": 199272, "epoch": 4744} {"train_loss": -7.152897357940674, "global_step": 199273, "epoch": 4744} {"train_loss": -7.2130889892578125, "global_step": 199274, "epoch": 4744} {"train_loss": -7.275227069854736, "global_step": 199275, "epoch": 4744} {"train_loss": -7.329047203063965, "global_step": 199276, "epoch": 4744} {"train_loss": -7.261551856994629, "global_step": 199277, "epoch": 4744} {"train_loss": -7.384696006774902, "global_step": 199278, "epoch": 4744} {"train_loss": -7.261928558349609, "global_step": 199279, "epoch": 4744} {"train_loss": -7.158702850341797, "global_step": 199280, "epoch": 4744} {"train_loss": -7.281795501708984, "global_step": 199281, "epoch": 4744} {"train_loss": -7.222840309143066, "global_step": 199282, "epoch": 4744} {"train_loss": -7.201121807098389, "global_step": 199283, "epoch": 4744} {"train_loss": -7.2945661544799805, "global_step": 199284, "epoch": 4744} {"train_loss": -7.262897491455078, "global_step": 199285, "epoch": 4744} {"train_loss": -7.291815757751465, "global_step": 199286, "epoch": 4744} {"train_loss": -7.1859517097473145, "global_step": 199287, "epoch": 4744} {"train_loss": -7.13212251663208, "global_step": 199288, "epoch": 4744} {"train_loss": -7.238259349550519, "global_step": 199289, "epoch": 4744, "val_loss": 69072.1484375} {"train_loss": -7.223730564117432, "global_step": 199290, "epoch": 4745} {"train_loss": -7.158607482910156, "global_step": 199291, "epoch": 4745} {"train_loss": -7.212533950805664, "global_step": 199292, "epoch": 4745} {"train_loss": -7.207132339477539, "global_step": 199293, "epoch": 4745} {"train_loss": -7.3214311599731445, "global_step": 199294, "epoch": 4745} {"train_loss": -7.34706974029541, "global_step": 199295, "epoch": 4745} {"train_loss": -7.206194877624512, "global_step": 199296, "epoch": 4745} {"train_loss": -7.084493637084961, "global_step": 199297, "epoch": 4745} {"train_loss": -7.162649154663086, "global_step": 199298, "epoch": 4745} {"train_loss": -7.212863445281982, "global_step": 199299, "epoch": 4745} {"train_loss": -7.169061183929443, "global_step": 199300, "epoch": 4745} {"train_loss": -7.296361923217773, "global_step": 199301, "epoch": 4745} {"train_loss": -7.295684337615967, "global_step": 199302, "epoch": 4745} {"train_loss": -7.238334655761719, "global_step": 199303, "epoch": 4745} {"train_loss": -7.1835126876831055, "global_step": 199304, "epoch": 4745} {"train_loss": -7.2288079261779785, "global_step": 199305, "epoch": 4745} {"train_loss": -7.194696426391602, "global_step": 199306, "epoch": 4745} {"train_loss": -7.178277492523193, "global_step": 199307, "epoch": 4745} {"train_loss": -7.2604851722717285, "global_step": 199308, "epoch": 4745} {"train_loss": -7.1880106925964355, "global_step": 199309, "epoch": 4745} {"train_loss": -7.2091522216796875, "global_step": 199310, "epoch": 4745} {"train_loss": -7.13839054107666, "global_step": 199311, "epoch": 4745} {"train_loss": -7.227227210998535, "global_step": 199312, "epoch": 4745} {"train_loss": -7.209529399871826, "global_step": 199313, "epoch": 4745} {"train_loss": -7.218772888183594, "global_step": 199314, "epoch": 4745} {"train_loss": -7.2357587814331055, "global_step": 199315, "epoch": 4745} {"train_loss": -7.243659496307373, "global_step": 199316, "epoch": 4745} {"train_loss": -7.307090759277344, "global_step": 199317, "epoch": 4745} {"train_loss": -7.254072189331055, "global_step": 199318, "epoch": 4745} {"train_loss": -7.171550273895264, "global_step": 199319, "epoch": 4745} {"train_loss": -7.311699867248535, "global_step": 199320, "epoch": 4745} {"train_loss": -7.266988277435303, "global_step": 199321, "epoch": 4745} {"train_loss": -7.230761528015137, "global_step": 199322, "epoch": 4745} {"train_loss": -7.262465953826904, "global_step": 199323, "epoch": 4745} {"train_loss": -7.162860870361328, "global_step": 199324, "epoch": 4745} {"train_loss": -7.172013282775879, "global_step": 199325, "epoch": 4745} {"train_loss": -7.227829933166504, "global_step": 199326, "epoch": 4745} {"train_loss": -7.1897664070129395, "global_step": 199327, "epoch": 4745} {"train_loss": -7.227341651916504, "global_step": 199328, "epoch": 4745} {"train_loss": -7.212034225463867, "global_step": 199329, "epoch": 4745} {"train_loss": -7.281155586242676, "global_step": 199330, "epoch": 4745} {"train_loss": -7.223254782812936, "global_step": 199331, "epoch": 4745, "val_loss": 69045.7734375} {"train_loss": -7.177834987640381, "global_step": 199332, "epoch": 4746} {"train_loss": -7.216963768005371, "global_step": 199333, "epoch": 4746} {"train_loss": -7.195915222167969, "global_step": 199334, "epoch": 4746} {"train_loss": -7.285243988037109, "global_step": 199335, "epoch": 4746} {"train_loss": -7.230675220489502, "global_step": 199336, "epoch": 4746} {"train_loss": -7.297251224517822, "global_step": 199337, "epoch": 4746} {"train_loss": -7.344292640686035, "global_step": 199338, "epoch": 4746} {"train_loss": -7.313889503479004, "global_step": 199339, "epoch": 4746} {"train_loss": -7.251354217529297, "global_step": 199340, "epoch": 4746} {"train_loss": -7.319858551025391, "global_step": 199341, "epoch": 4746} {"train_loss": -7.148719787597656, "global_step": 199342, "epoch": 4746} {"train_loss": -7.231668949127197, "global_step": 199343, "epoch": 4746} {"train_loss": -7.142164707183838, "global_step": 199344, "epoch": 4746} {"train_loss": -7.2448530197143555, "global_step": 199345, "epoch": 4746} {"train_loss": -7.281407356262207, "global_step": 199346, "epoch": 4746} {"train_loss": -7.294067859649658, "global_step": 199347, "epoch": 4746} {"train_loss": -7.302608489990234, "global_step": 199348, "epoch": 4746} {"train_loss": -7.2485671043396, "global_step": 199349, "epoch": 4746} {"train_loss": -7.316281318664551, "global_step": 199350, "epoch": 4746} {"train_loss": -7.238415718078613, "global_step": 199351, "epoch": 4746} {"train_loss": -7.241243362426758, "global_step": 199352, "epoch": 4746} {"train_loss": -7.232661247253418, "global_step": 199353, "epoch": 4746} {"train_loss": -7.330167293548584, "global_step": 199354, "epoch": 4746} {"train_loss": -7.261960029602051, "global_step": 199355, "epoch": 4746} {"train_loss": -7.173698425292969, "global_step": 199356, "epoch": 4746} {"train_loss": -7.376497745513916, "global_step": 199357, "epoch": 4746} {"train_loss": -7.1962103843688965, "global_step": 199358, "epoch": 4746} {"train_loss": -7.277614593505859, "global_step": 199359, "epoch": 4746} {"train_loss": -7.213930130004883, "global_step": 199360, "epoch": 4746} {"train_loss": -7.243439197540283, "global_step": 199361, "epoch": 4746} {"train_loss": -7.278125762939453, "global_step": 199362, "epoch": 4746} {"train_loss": -7.276092052459717, "global_step": 199363, "epoch": 4746} {"train_loss": -7.26605224609375, "global_step": 199364, "epoch": 4746} {"train_loss": -7.244176387786865, "global_step": 199365, "epoch": 4746} {"train_loss": -7.202393531799316, "global_step": 199366, "epoch": 4746} {"train_loss": -7.1552839279174805, "global_step": 199367, "epoch": 4746} {"train_loss": -7.249936580657959, "global_step": 199368, "epoch": 4746} {"train_loss": -7.209650039672852, "global_step": 199369, "epoch": 4746} {"train_loss": -7.214483261108398, "global_step": 199370, "epoch": 4746} {"train_loss": -7.186664581298828, "global_step": 199371, "epoch": 4746} {"train_loss": -7.162577152252197, "global_step": 199372, "epoch": 4746} {"train_loss": -7.245660566148304, "global_step": 199373, "epoch": 4746, "val_loss": 68994.4140625} {"train_loss": -7.377673149108887, "global_step": 199374, "epoch": 4747} {"train_loss": -7.2051286697387695, "global_step": 199375, "epoch": 4747} {"train_loss": -7.264307022094727, "global_step": 199376, "epoch": 4747} {"train_loss": -7.217511177062988, "global_step": 199377, "epoch": 4747} {"train_loss": -7.296734809875488, "global_step": 199378, "epoch": 4747} {"train_loss": -7.3027262687683105, "global_step": 199379, "epoch": 4747} {"train_loss": -7.126731872558594, "global_step": 199380, "epoch": 4747} {"train_loss": -7.227113723754883, "global_step": 199381, "epoch": 4747} {"train_loss": -7.150964736938477, "global_step": 199382, "epoch": 4747} {"train_loss": -7.287384986877441, "global_step": 199383, "epoch": 4747} {"train_loss": -7.060073375701904, "global_step": 199384, "epoch": 4747} {"train_loss": -7.3305253982543945, "global_step": 199385, "epoch": 4747} {"train_loss": -7.204995155334473, "global_step": 199386, "epoch": 4747} {"train_loss": -7.173854827880859, "global_step": 199387, "epoch": 4747} {"train_loss": -7.152782440185547, "global_step": 199388, "epoch": 4747} {"train_loss": -6.998217582702637, "global_step": 199389, "epoch": 4747} {"train_loss": -7.232532978057861, "global_step": 199390, "epoch": 4747} {"train_loss": -7.326685905456543, "global_step": 199391, "epoch": 4747} {"train_loss": -7.124607086181641, "global_step": 199392, "epoch": 4747} {"train_loss": -7.081315994262695, "global_step": 199393, "epoch": 4747} {"train_loss": -7.036108016967773, "global_step": 199394, "epoch": 4747} {"train_loss": -6.939101219177246, "global_step": 199395, "epoch": 4747} {"train_loss": -7.0015764236450195, "global_step": 199396, "epoch": 4747} {"train_loss": -7.018283843994141, "global_step": 199397, "epoch": 4747} {"train_loss": -7.007901191711426, "global_step": 199398, "epoch": 4747} {"train_loss": -7.204035758972168, "global_step": 199399, "epoch": 4747} {"train_loss": -6.823908805847168, "global_step": 199400, "epoch": 4747} {"train_loss": -7.006778717041016, "global_step": 199401, "epoch": 4747} {"train_loss": -7.081191062927246, "global_step": 199402, "epoch": 4747} {"train_loss": -6.986542224884033, "global_step": 199403, "epoch": 4747} {"train_loss": -7.027237892150879, "global_step": 199404, "epoch": 4747} {"train_loss": -6.996342658996582, "global_step": 199405, "epoch": 4747} {"train_loss": -6.962009429931641, "global_step": 199406, "epoch": 4747} {"train_loss": -7.103127479553223, "global_step": 199407, "epoch": 4747} {"train_loss": -7.114504814147949, "global_step": 199408, "epoch": 4747} {"train_loss": -7.099953651428223, "global_step": 199409, "epoch": 4747} {"train_loss": -7.136733055114746, "global_step": 199410, "epoch": 4747} {"train_loss": -7.117092132568359, "global_step": 199411, "epoch": 4747} {"train_loss": -7.09596586227417, "global_step": 199412, "epoch": 4747} {"train_loss": -7.045649528503418, "global_step": 199413, "epoch": 4747} {"train_loss": -7.161621570587158, "global_step": 199414, "epoch": 4747} {"train_loss": -7.126301617849441, "global_step": 199415, "epoch": 4747, "val_loss": 69098.171875} {"train_loss": -7.254490852355957, "global_step": 199416, "epoch": 4748} {"train_loss": -7.116451263427734, "global_step": 199417, "epoch": 4748} {"train_loss": -7.198137283325195, "global_step": 199418, "epoch": 4748} {"train_loss": -7.109243392944336, "global_step": 199419, "epoch": 4748} {"train_loss": -7.004263877868652, "global_step": 199420, "epoch": 4748} {"train_loss": -7.210761547088623, "global_step": 199421, "epoch": 4748} {"train_loss": -7.170536518096924, "global_step": 199422, "epoch": 4748} {"train_loss": -7.1333160400390625, "global_step": 199423, "epoch": 4748} {"train_loss": -7.138093948364258, "global_step": 199424, "epoch": 4748} {"train_loss": -7.187519550323486, "global_step": 199425, "epoch": 4748} {"train_loss": -7.037980556488037, "global_step": 199426, "epoch": 4748} {"train_loss": -7.057252883911133, "global_step": 199427, "epoch": 4748} {"train_loss": -7.165519714355469, "global_step": 199428, "epoch": 4748} {"train_loss": -7.146511077880859, "global_step": 199429, "epoch": 4748} {"train_loss": -7.122692108154297, "global_step": 199430, "epoch": 4748} {"train_loss": -7.089879512786865, "global_step": 199431, "epoch": 4748} {"train_loss": -7.131201267242432, "global_step": 199432, "epoch": 4748} {"train_loss": -7.077939033508301, "global_step": 199433, "epoch": 4748} {"train_loss": -7.239130973815918, "global_step": 199434, "epoch": 4748} {"train_loss": -7.188588619232178, "global_step": 199435, "epoch": 4748} {"train_loss": -6.964048862457275, "global_step": 199436, "epoch": 4748} {"train_loss": -7.170248508453369, "global_step": 199437, "epoch": 4748} {"train_loss": -7.154542922973633, "global_step": 199438, "epoch": 4748} {"train_loss": -7.165158271789551, "global_step": 199439, "epoch": 4748} {"train_loss": -7.255426406860352, "global_step": 199440, "epoch": 4748} {"train_loss": -7.330840110778809, "global_step": 199441, "epoch": 4748} {"train_loss": -7.283468246459961, "global_step": 199442, "epoch": 4748} {"train_loss": -7.23176908493042, "global_step": 199443, "epoch": 4748} {"train_loss": -7.218827247619629, "global_step": 199444, "epoch": 4748} {"train_loss": -7.173448085784912, "global_step": 199445, "epoch": 4748} {"train_loss": -7.34999942779541, "global_step": 199446, "epoch": 4748} {"train_loss": -7.404664039611816, "global_step": 199447, "epoch": 4748} {"train_loss": -7.297558307647705, "global_step": 199448, "epoch": 4748} {"train_loss": -7.248112201690674, "global_step": 199449, "epoch": 4748} {"train_loss": -7.293549060821533, "global_step": 199450, "epoch": 4748} {"train_loss": -7.142518043518066, "global_step": 199451, "epoch": 4748} {"train_loss": -7.211824417114258, "global_step": 199452, "epoch": 4748} {"train_loss": -7.286442756652832, "global_step": 199453, "epoch": 4748} {"train_loss": -7.3300275802612305, "global_step": 199454, "epoch": 4748} {"train_loss": -7.207428932189941, "global_step": 199455, "epoch": 4748} {"train_loss": -7.2618865966796875, "global_step": 199456, "epoch": 4748} {"train_loss": -7.18957815851484, "global_step": 199457, "epoch": 4748, "val_loss": 69125.8203125} {"train_loss": -7.235106468200684, "global_step": 199458, "epoch": 4749} {"train_loss": -7.273102283477783, "global_step": 199459, "epoch": 4749} {"train_loss": -7.177032470703125, "global_step": 199460, "epoch": 4749} {"train_loss": -7.305133819580078, "global_step": 199461, "epoch": 4749} {"train_loss": -7.2989044189453125, "global_step": 199462, "epoch": 4749} {"train_loss": -7.2413129806518555, "global_step": 199463, "epoch": 4749} {"train_loss": -7.284860610961914, "global_step": 199464, "epoch": 4749} {"train_loss": -7.314522743225098, "global_step": 199465, "epoch": 4749} {"train_loss": -7.262884616851807, "global_step": 199466, "epoch": 4749} {"train_loss": -7.35777473449707, "global_step": 199467, "epoch": 4749} {"train_loss": -7.257936000823975, "global_step": 199468, "epoch": 4749} {"train_loss": -7.326746940612793, "global_step": 199469, "epoch": 4749} {"train_loss": -7.263569355010986, "global_step": 199470, "epoch": 4749} {"train_loss": -7.305662155151367, "global_step": 199471, "epoch": 4749} {"train_loss": -7.283633232116699, "global_step": 199472, "epoch": 4749} {"train_loss": -7.235089302062988, "global_step": 199473, "epoch": 4749} {"train_loss": -7.365869522094727, "global_step": 199474, "epoch": 4749} {"train_loss": -7.229842185974121, "global_step": 199475, "epoch": 4749} {"train_loss": -7.357058048248291, "global_step": 199476, "epoch": 4749} {"train_loss": -7.2627105712890625, "global_step": 199477, "epoch": 4749} {"train_loss": -7.192204475402832, "global_step": 199478, "epoch": 4749} {"train_loss": -7.138514518737793, "global_step": 199479, "epoch": 4749} {"train_loss": -7.266758918762207, "global_step": 199480, "epoch": 4749} {"train_loss": -7.319282054901123, "global_step": 199481, "epoch": 4749} {"train_loss": -7.310807228088379, "global_step": 199482, "epoch": 4749} {"train_loss": -7.233928680419922, "global_step": 199483, "epoch": 4749} {"train_loss": -7.216949462890625, "global_step": 199484, "epoch": 4749} {"train_loss": -7.19187068939209, "global_step": 199485, "epoch": 4749} {"train_loss": -7.254280090332031, "global_step": 199486, "epoch": 4749} {"train_loss": -7.212894439697266, "global_step": 199487, "epoch": 4749} {"train_loss": -7.140758514404297, "global_step": 199488, "epoch": 4749} {"train_loss": -7.181656837463379, "global_step": 199489, "epoch": 4749} {"train_loss": -7.1603102684021, "global_step": 199490, "epoch": 4749} {"train_loss": -7.117294788360596, "global_step": 199491, "epoch": 4749} {"train_loss": -7.221616744995117, "global_step": 199492, "epoch": 4749} {"train_loss": -7.274219989776611, "global_step": 199493, "epoch": 4749} {"train_loss": -7.138484954833984, "global_step": 199494, "epoch": 4749} {"train_loss": -7.276122093200684, "global_step": 199495, "epoch": 4749} {"train_loss": -7.228087425231934, "global_step": 199496, "epoch": 4749} {"train_loss": -7.202448844909668, "global_step": 199497, "epoch": 4749} {"train_loss": -7.209020614624023, "global_step": 199498, "epoch": 4749} {"train_loss": -7.247392688478742, "global_step": 199499, "epoch": 4749, "val_loss": 69059.421875} {"train_loss": -7.186457633972168, "global_step": 199500, "epoch": 4750} {"train_loss": -7.258218288421631, "global_step": 199501, "epoch": 4750} {"train_loss": -7.298327445983887, "global_step": 199502, "epoch": 4750} {"train_loss": -7.20923376083374, "global_step": 199503, "epoch": 4750} {"train_loss": -7.206036567687988, "global_step": 199504, "epoch": 4750} {"train_loss": -7.256012916564941, "global_step": 199505, "epoch": 4750} {"train_loss": -7.193946838378906, "global_step": 199506, "epoch": 4750} {"train_loss": -7.26332950592041, "global_step": 199507, "epoch": 4750} {"train_loss": -7.149031162261963, "global_step": 199508, "epoch": 4750} {"train_loss": -7.1338701248168945, "global_step": 199509, "epoch": 4750} {"train_loss": -7.242771148681641, "global_step": 199510, "epoch": 4750} {"train_loss": -7.2230916023254395, "global_step": 199511, "epoch": 4750} {"train_loss": -7.250998497009277, "global_step": 199512, "epoch": 4750} {"train_loss": -7.32797908782959, "global_step": 199513, "epoch": 4750} {"train_loss": -7.315184593200684, "global_step": 199514, "epoch": 4750} {"train_loss": -7.214883804321289, "global_step": 199515, "epoch": 4750} {"train_loss": -7.2049431800842285, "global_step": 199516, "epoch": 4750} {"train_loss": -7.352199554443359, "global_step": 199517, "epoch": 4750} {"train_loss": -7.17789363861084, "global_step": 199518, "epoch": 4750} {"train_loss": -7.224462985992432, "global_step": 199519, "epoch": 4750} {"train_loss": -7.150644302368164, "global_step": 199520, "epoch": 4750} {"train_loss": -7.288710117340088, "global_step": 199521, "epoch": 4750} {"train_loss": -7.293704986572266, "global_step": 199522, "epoch": 4750} {"train_loss": -7.063164234161377, "global_step": 199523, "epoch": 4750} {"train_loss": -7.282349586486816, "global_step": 199524, "epoch": 4750} {"train_loss": -7.08528995513916, "global_step": 199525, "epoch": 4750} {"train_loss": -7.1592206954956055, "global_step": 199526, "epoch": 4750} {"train_loss": -7.166285037994385, "global_step": 199527, "epoch": 4750} {"train_loss": -7.0420942306518555, "global_step": 199528, "epoch": 4750} {"train_loss": -7.200377464294434, "global_step": 199529, "epoch": 4750} {"train_loss": -7.122158527374268, "global_step": 199530, "epoch": 4750} {"train_loss": -7.061781406402588, "global_step": 199531, "epoch": 4750} {"train_loss": -7.109090805053711, "global_step": 199532, "epoch": 4750} {"train_loss": -7.085921287536621, "global_step": 199533, "epoch": 4750} {"train_loss": -7.2034196853637695, "global_step": 199534, "epoch": 4750} {"train_loss": -7.012689113616943, "global_step": 199535, "epoch": 4750} {"train_loss": -7.009183883666992, "global_step": 199536, "epoch": 4750} {"train_loss": -7.249916076660156, "global_step": 199537, "epoch": 4750} {"train_loss": -7.201986312866211, "global_step": 199538, "epoch": 4750} {"train_loss": -7.310093879699707, "global_step": 199539, "epoch": 4750} {"train_loss": -7.291738510131836, "global_step": 199540, "epoch": 4750} {"train_loss": -7.197146268117995, "global_step": 199541, "epoch": 4750, "train/sim_max_reward_0": 0.2413057918361709, "train/sim_max_reward_1": 0.9940756190106823, "train/sim_max_reward_2": 0.9795441553281479, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9096569417385227, "train/sim_max_reward_5": 0.4364864919027378, "test/sim_max_reward_4400000": 0.9940412601083314, "test/sim_max_reward_4400001": 0.9652010709638543, "test/sim_max_reward_4400002": 0.7976093735930078, "test/sim_max_reward_4400003": 0.6585399438334756, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.3074971019600035, "test/sim_max_reward_4400006": 0.6305350770023403, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30421300048368866, "test/sim_max_reward_4400009": 0.8161431650175159, "test/sim_max_reward_4400010": 0.9481636725350522, "test/sim_max_reward_4400011": 0.08418882817917583, "test/sim_max_reward_4400012": 0.971745143224919, "test/sim_max_reward_4400013": 0.9969379680464064, "test/sim_max_reward_4400014": 0.7082729806635354, "test/sim_max_reward_4400015": 0.012424153016505818, "test/sim_max_reward_4400016": 0.9100479634951376, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.3160346213386783, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.996232168124796, "test/sim_max_reward_4400023": 0.42266246211710073, "test/sim_max_reward_4400024": 0.8949564758111368, "test/sim_max_reward_4400025": 0.27196299540393, "test/sim_max_reward_4400026": 0.804177893749193, "test/sim_max_reward_4400027": 0.0018532615184286463, "test/sim_max_reward_4400028": 0.7036447850329413, "test/sim_max_reward_4400029": 0.6929746554392875, "test/sim_max_reward_4400030": 0.9953418647181986, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9183833563284903, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.7845532747289882, "test/sim_max_reward_4400036": 0.49369125435808675, "test/sim_max_reward_4400037": 0.9621707591925931, "test/sim_max_reward_4400038": 0.9669752321014982, "test/sim_max_reward_4400039": 0.9976715995030259, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.9603308326206901, "test/sim_max_reward_4400043": 0.006610638632624136, "test/sim_max_reward_4400044": 0.9999517078889878, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.8868726961580253, "test/sim_max_reward_4400047": 0.9552329401369875, "test/sim_max_reward_4400048": 0.14551469637364295, "test/sim_max_reward_4400049": 0.9662501544750128, "train/mean_score": 0.7601781666360435, "test/mean_score": 0.6144610256771103, "val_loss": 68987.75} {"train_loss": -7.216399192810059, "global_step": 199542, "epoch": 4751} {"train_loss": -7.137998580932617, "global_step": 199543, "epoch": 4751} {"train_loss": -7.1387104988098145, "global_step": 199544, "epoch": 4751} {"train_loss": -7.275520324707031, "global_step": 199545, "epoch": 4751} {"train_loss": -7.049748420715332, "global_step": 199546, "epoch": 4751} {"train_loss": -7.172291278839111, "global_step": 199547, "epoch": 4751} {"train_loss": -7.276521682739258, "global_step": 199548, "epoch": 4751} {"train_loss": -7.094928741455078, "global_step": 199549, "epoch": 4751} {"train_loss": -7.187735557556152, "global_step": 199550, "epoch": 4751} {"train_loss": -7.0868425369262695, "global_step": 199551, "epoch": 4751} {"train_loss": -7.2404279708862305, "global_step": 199552, "epoch": 4751} {"train_loss": -7.262027740478516, "global_step": 199553, "epoch": 4751} {"train_loss": -7.122354030609131, "global_step": 199554, "epoch": 4751} {"train_loss": -7.250217437744141, "global_step": 199555, "epoch": 4751} {"train_loss": -7.214142799377441, "global_step": 199556, "epoch": 4751} {"train_loss": -7.169024467468262, "global_step": 199557, "epoch": 4751} {"train_loss": -7.024902820587158, "global_step": 199558, "epoch": 4751} {"train_loss": -7.152993202209473, "global_step": 199559, "epoch": 4751} {"train_loss": -7.261965751647949, "global_step": 199560, "epoch": 4751} {"train_loss": -7.172590732574463, "global_step": 199561, "epoch": 4751} {"train_loss": -7.284770965576172, "global_step": 199562, "epoch": 4751} {"train_loss": -7.0891313552856445, "global_step": 199563, "epoch": 4751} {"train_loss": -7.034906387329102, "global_step": 199564, "epoch": 4751} {"train_loss": -7.099925518035889, "global_step": 199565, "epoch": 4751} {"train_loss": -7.209357261657715, "global_step": 199566, "epoch": 4751} {"train_loss": -7.237266540527344, "global_step": 199567, "epoch": 4751} {"train_loss": -7.102451324462891, "global_step": 199568, "epoch": 4751} {"train_loss": -7.055140495300293, "global_step": 199569, "epoch": 4751} {"train_loss": -7.147552013397217, "global_step": 199570, "epoch": 4751} {"train_loss": -6.997014999389648, "global_step": 199571, "epoch": 4751} {"train_loss": -7.187638759613037, "global_step": 199572, "epoch": 4751} {"train_loss": -7.067588806152344, "global_step": 199573, "epoch": 4751} {"train_loss": -7.1373138427734375, "global_step": 199574, "epoch": 4751} {"train_loss": -7.118643760681152, "global_step": 199575, "epoch": 4751} {"train_loss": -7.2229766845703125, "global_step": 199576, "epoch": 4751} {"train_loss": -7.126064300537109, "global_step": 199577, "epoch": 4751} {"train_loss": -7.199210166931152, "global_step": 199578, "epoch": 4751} {"train_loss": -7.133103847503662, "global_step": 199579, "epoch": 4751} {"train_loss": -7.075560569763184, "global_step": 199580, "epoch": 4751} {"train_loss": -7.195364952087402, "global_step": 199581, "epoch": 4751} {"train_loss": -7.308474063873291, "global_step": 199582, "epoch": 4751} {"train_loss": -7.160606384277344, "global_step": 199583, "epoch": 4751, "val_loss": 68992.421875} {"train_loss": -7.129369258880615, "global_step": 199584, "epoch": 4752} {"train_loss": -7.279653549194336, "global_step": 199585, "epoch": 4752} {"train_loss": -7.248395919799805, "global_step": 199586, "epoch": 4752} {"train_loss": -7.1765522956848145, "global_step": 199587, "epoch": 4752} {"train_loss": -7.208049774169922, "global_step": 199588, "epoch": 4752} {"train_loss": -7.27088737487793, "global_step": 199589, "epoch": 4752} {"train_loss": -7.19778299331665, "global_step": 199590, "epoch": 4752} {"train_loss": -7.257890701293945, "global_step": 199591, "epoch": 4752} {"train_loss": -7.302206039428711, "global_step": 199592, "epoch": 4752} {"train_loss": -7.300213813781738, "global_step": 199593, "epoch": 4752} {"train_loss": -7.22556734085083, "global_step": 199594, "epoch": 4752} {"train_loss": -7.2031707763671875, "global_step": 199595, "epoch": 4752} {"train_loss": -7.243330478668213, "global_step": 199596, "epoch": 4752} {"train_loss": -7.177005767822266, "global_step": 199597, "epoch": 4752} {"train_loss": -7.24057149887085, "global_step": 199598, "epoch": 4752} {"train_loss": -7.210169792175293, "global_step": 199599, "epoch": 4752} {"train_loss": -7.204878330230713, "global_step": 199600, "epoch": 4752} {"train_loss": -7.209514617919922, "global_step": 199601, "epoch": 4752} {"train_loss": -7.14912748336792, "global_step": 199602, "epoch": 4752} {"train_loss": -7.127309322357178, "global_step": 199603, "epoch": 4752} {"train_loss": -7.253076553344727, "global_step": 199604, "epoch": 4752} {"train_loss": -7.13441801071167, "global_step": 199605, "epoch": 4752} {"train_loss": -7.237865447998047, "global_step": 199606, "epoch": 4752} {"train_loss": -7.271181583404541, "global_step": 199607, "epoch": 4752} {"train_loss": -7.357282638549805, "global_step": 199608, "epoch": 4752} {"train_loss": -7.210721015930176, "global_step": 199609, "epoch": 4752} {"train_loss": -7.2262864112854, "global_step": 199610, "epoch": 4752} {"train_loss": -7.245412349700928, "global_step": 199611, "epoch": 4752} {"train_loss": -7.262970924377441, "global_step": 199612, "epoch": 4752} {"train_loss": -7.293365955352783, "global_step": 199613, "epoch": 4752} {"train_loss": -7.097311496734619, "global_step": 199614, "epoch": 4752} {"train_loss": -7.212370872497559, "global_step": 199615, "epoch": 4752} {"train_loss": -7.248625755310059, "global_step": 199616, "epoch": 4752} {"train_loss": -7.183698654174805, "global_step": 199617, "epoch": 4752} {"train_loss": -7.225580215454102, "global_step": 199618, "epoch": 4752} {"train_loss": -7.142877578735352, "global_step": 199619, "epoch": 4752} {"train_loss": -7.239479064941406, "global_step": 199620, "epoch": 4752} {"train_loss": -7.317525863647461, "global_step": 199621, "epoch": 4752} {"train_loss": -7.2266340255737305, "global_step": 199622, "epoch": 4752} {"train_loss": -7.258095741271973, "global_step": 199623, "epoch": 4752} {"train_loss": -7.1872453689575195, "global_step": 199624, "epoch": 4752} {"train_loss": -7.22610050156003, "global_step": 199625, "epoch": 4752, "val_loss": 69183.0078125} {"train_loss": -7.407844066619873, "global_step": 199626, "epoch": 4753} {"train_loss": -7.191891193389893, "global_step": 199627, "epoch": 4753} {"train_loss": -7.144327163696289, "global_step": 199628, "epoch": 4753} {"train_loss": -7.157220363616943, "global_step": 199629, "epoch": 4753} {"train_loss": -7.0851240158081055, "global_step": 199630, "epoch": 4753} {"train_loss": -7.190768718719482, "global_step": 199631, "epoch": 4753} {"train_loss": -6.8512678146362305, "global_step": 199632, "epoch": 4753} {"train_loss": -7.25573205947876, "global_step": 199633, "epoch": 4753} {"train_loss": -7.081449508666992, "global_step": 199634, "epoch": 4753} {"train_loss": -7.179599285125732, "global_step": 199635, "epoch": 4753} {"train_loss": -7.206487655639648, "global_step": 199636, "epoch": 4753} {"train_loss": -7.226393699645996, "global_step": 199637, "epoch": 4753} {"train_loss": -7.22999382019043, "global_step": 199638, "epoch": 4753} {"train_loss": -7.227578639984131, "global_step": 199639, "epoch": 4753} {"train_loss": -7.074795722961426, "global_step": 199640, "epoch": 4753} {"train_loss": -7.243521690368652, "global_step": 199641, "epoch": 4753} {"train_loss": -7.143564701080322, "global_step": 199642, "epoch": 4753} {"train_loss": -7.108909606933594, "global_step": 199643, "epoch": 4753} {"train_loss": -7.133719444274902, "global_step": 199644, "epoch": 4753} {"train_loss": -7.180270195007324, "global_step": 199645, "epoch": 4753} {"train_loss": -7.144787311553955, "global_step": 199646, "epoch": 4753} {"train_loss": -7.277286052703857, "global_step": 199647, "epoch": 4753} {"train_loss": -7.144819259643555, "global_step": 199648, "epoch": 4753} {"train_loss": -7.161446571350098, "global_step": 199649, "epoch": 4753} {"train_loss": -7.105238914489746, "global_step": 199650, "epoch": 4753} {"train_loss": -7.05727481842041, "global_step": 199651, "epoch": 4753} {"train_loss": -7.072464942932129, "global_step": 199652, "epoch": 4753} {"train_loss": -7.105700969696045, "global_step": 199653, "epoch": 4753} {"train_loss": -7.140032768249512, "global_step": 199654, "epoch": 4753} {"train_loss": -7.129890441894531, "global_step": 199655, "epoch": 4753} {"train_loss": -7.05288028717041, "global_step": 199656, "epoch": 4753} {"train_loss": -7.238228797912598, "global_step": 199657, "epoch": 4753} {"train_loss": -7.108151435852051, "global_step": 199658, "epoch": 4753} {"train_loss": -7.236428737640381, "global_step": 199659, "epoch": 4753} {"train_loss": -7.114696502685547, "global_step": 199660, "epoch": 4753} {"train_loss": -7.027543067932129, "global_step": 199661, "epoch": 4753} {"train_loss": -7.197506904602051, "global_step": 199662, "epoch": 4753} {"train_loss": -7.099764823913574, "global_step": 199663, "epoch": 4753} {"train_loss": -7.196445465087891, "global_step": 199664, "epoch": 4753} {"train_loss": -7.177124977111816, "global_step": 199665, "epoch": 4753} {"train_loss": -7.162323951721191, "global_step": 199666, "epoch": 4753} {"train_loss": -7.153848920549665, "global_step": 199667, "epoch": 4753, "val_loss": 68878.765625} {"train_loss": -7.21395206451416, "global_step": 199668, "epoch": 4754} {"train_loss": -7.16586971282959, "global_step": 199669, "epoch": 4754} {"train_loss": -7.15094518661499, "global_step": 199670, "epoch": 4754} {"train_loss": -7.233996868133545, "global_step": 199671, "epoch": 4754} {"train_loss": -7.211475372314453, "global_step": 199672, "epoch": 4754} {"train_loss": -7.176608085632324, "global_step": 199673, "epoch": 4754} {"train_loss": -7.3378777503967285, "global_step": 199674, "epoch": 4754} {"train_loss": -7.170868873596191, "global_step": 199675, "epoch": 4754} {"train_loss": -7.325470924377441, "global_step": 199676, "epoch": 4754} {"train_loss": -7.325613975524902, "global_step": 199677, "epoch": 4754} {"train_loss": -7.255031585693359, "global_step": 199678, "epoch": 4754} {"train_loss": -7.253643035888672, "global_step": 199679, "epoch": 4754} {"train_loss": -7.154451847076416, "global_step": 199680, "epoch": 4754} {"train_loss": -7.220296859741211, "global_step": 199681, "epoch": 4754} {"train_loss": -7.1847076416015625, "global_step": 199682, "epoch": 4754} {"train_loss": -7.18386173248291, "global_step": 199683, "epoch": 4754} {"train_loss": -7.262967109680176, "global_step": 199684, "epoch": 4754} {"train_loss": -7.054471015930176, "global_step": 199685, "epoch": 4754} {"train_loss": -7.150203227996826, "global_step": 199686, "epoch": 4754} {"train_loss": -7.200972557067871, "global_step": 199687, "epoch": 4754} {"train_loss": -7.139915466308594, "global_step": 199688, "epoch": 4754} {"train_loss": -7.086230278015137, "global_step": 199689, "epoch": 4754} {"train_loss": -7.146368980407715, "global_step": 199690, "epoch": 4754} {"train_loss": -7.150994300842285, "global_step": 199691, "epoch": 4754} {"train_loss": -7.219836235046387, "global_step": 199692, "epoch": 4754} {"train_loss": -7.213961124420166, "global_step": 199693, "epoch": 4754} {"train_loss": -7.264214515686035, "global_step": 199694, "epoch": 4754} {"train_loss": -7.198825836181641, "global_step": 199695, "epoch": 4754} {"train_loss": -7.117455005645752, "global_step": 199696, "epoch": 4754} {"train_loss": -7.219720363616943, "global_step": 199697, "epoch": 4754} {"train_loss": -7.2087273597717285, "global_step": 199698, "epoch": 4754} {"train_loss": -7.361642360687256, "global_step": 199699, "epoch": 4754} {"train_loss": -7.13971471786499, "global_step": 199700, "epoch": 4754} {"train_loss": -7.324003219604492, "global_step": 199701, "epoch": 4754} {"train_loss": -7.137970447540283, "global_step": 199702, "epoch": 4754} {"train_loss": -7.16096830368042, "global_step": 199703, "epoch": 4754} {"train_loss": -7.365111351013184, "global_step": 199704, "epoch": 4754} {"train_loss": -7.214176654815674, "global_step": 199705, "epoch": 4754} {"train_loss": -7.2887773513793945, "global_step": 199706, "epoch": 4754} {"train_loss": -7.280393600463867, "global_step": 199707, "epoch": 4754} {"train_loss": -7.298994064331055, "global_step": 199708, "epoch": 4754} {"train_loss": -7.21506134668986, "global_step": 199709, "epoch": 4754, "val_loss": 68959.1640625} {"train_loss": -7.188823699951172, "global_step": 199710, "epoch": 4755} {"train_loss": -7.215044975280762, "global_step": 199711, "epoch": 4755} {"train_loss": -7.192788124084473, "global_step": 199712, "epoch": 4755} {"train_loss": -7.2543230056762695, "global_step": 199713, "epoch": 4755} {"train_loss": -7.254064559936523, "global_step": 199714, "epoch": 4755} {"train_loss": -7.277004718780518, "global_step": 199715, "epoch": 4755} {"train_loss": -7.228784561157227, "global_step": 199716, "epoch": 4755} {"train_loss": -7.195869445800781, "global_step": 199717, "epoch": 4755} {"train_loss": -7.217772483825684, "global_step": 199718, "epoch": 4755} {"train_loss": -7.205837726593018, "global_step": 199719, "epoch": 4755} {"train_loss": -7.354018211364746, "global_step": 199720, "epoch": 4755} {"train_loss": -7.229317665100098, "global_step": 199721, "epoch": 4755} {"train_loss": -7.140708923339844, "global_step": 199722, "epoch": 4755} {"train_loss": -7.326474189758301, "global_step": 199723, "epoch": 4755} {"train_loss": -7.133654594421387, "global_step": 199724, "epoch": 4755} {"train_loss": -7.2922587394714355, "global_step": 199725, "epoch": 4755} {"train_loss": -7.326598644256592, "global_step": 199726, "epoch": 4755} {"train_loss": -7.270133018493652, "global_step": 199727, "epoch": 4755} {"train_loss": -7.288753986358643, "global_step": 199728, "epoch": 4755} {"train_loss": -7.204743385314941, "global_step": 199729, "epoch": 4755} {"train_loss": -7.3289079666137695, "global_step": 199730, "epoch": 4755} {"train_loss": -7.322990417480469, "global_step": 199731, "epoch": 4755} {"train_loss": -7.251791000366211, "global_step": 199732, "epoch": 4755} {"train_loss": -7.246732711791992, "global_step": 199733, "epoch": 4755} {"train_loss": -7.364424705505371, "global_step": 199734, "epoch": 4755} {"train_loss": -7.214829444885254, "global_step": 199735, "epoch": 4755} {"train_loss": -7.236227989196777, "global_step": 199736, "epoch": 4755} {"train_loss": -7.321404457092285, "global_step": 199737, "epoch": 4755} {"train_loss": -7.24907112121582, "global_step": 199738, "epoch": 4755} {"train_loss": -7.267569541931152, "global_step": 199739, "epoch": 4755} {"train_loss": -7.299339294433594, "global_step": 199740, "epoch": 4755} {"train_loss": -7.304723262786865, "global_step": 199741, "epoch": 4755} {"train_loss": -7.289419651031494, "global_step": 199742, "epoch": 4755} {"train_loss": -7.370256423950195, "global_step": 199743, "epoch": 4755} {"train_loss": -7.344786643981934, "global_step": 199744, "epoch": 4755} {"train_loss": -7.172516822814941, "global_step": 199745, "epoch": 4755} {"train_loss": -7.30457878112793, "global_step": 199746, "epoch": 4755} {"train_loss": -7.200838565826416, "global_step": 199747, "epoch": 4755} {"train_loss": -7.128803253173828, "global_step": 199748, "epoch": 4755} {"train_loss": -7.188731670379639, "global_step": 199749, "epoch": 4755} {"train_loss": -7.282828330993652, "global_step": 199750, "epoch": 4755} {"train_loss": -7.257508482251849, "global_step": 199751, "epoch": 4755, "val_loss": 69091.2421875} {"train_loss": -7.21867561340332, "global_step": 199752, "epoch": 4756} {"train_loss": -7.184807777404785, "global_step": 199753, "epoch": 4756} {"train_loss": -7.292065620422363, "global_step": 199754, "epoch": 4756} {"train_loss": -7.253546714782715, "global_step": 199755, "epoch": 4756} {"train_loss": -7.245358467102051, "global_step": 199756, "epoch": 4756} {"train_loss": -7.223980903625488, "global_step": 199757, "epoch": 4756} {"train_loss": -7.18560791015625, "global_step": 199758, "epoch": 4756} {"train_loss": -7.148021697998047, "global_step": 199759, "epoch": 4756} {"train_loss": -7.27743673324585, "global_step": 199760, "epoch": 4756} {"train_loss": -7.224878787994385, "global_step": 199761, "epoch": 4756} {"train_loss": -7.151797771453857, "global_step": 199762, "epoch": 4756} {"train_loss": -7.231725215911865, "global_step": 199763, "epoch": 4756} {"train_loss": -7.250815391540527, "global_step": 199764, "epoch": 4756} {"train_loss": -7.075345516204834, "global_step": 199765, "epoch": 4756} {"train_loss": -7.253969669342041, "global_step": 199766, "epoch": 4756} {"train_loss": -7.1683831214904785, "global_step": 199767, "epoch": 4756} {"train_loss": -7.11407470703125, "global_step": 199768, "epoch": 4756} {"train_loss": -7.1591796875, "global_step": 199769, "epoch": 4756} {"train_loss": -7.093257904052734, "global_step": 199770, "epoch": 4756} {"train_loss": -7.337712287902832, "global_step": 199771, "epoch": 4756} {"train_loss": -7.228151321411133, "global_step": 199772, "epoch": 4756} {"train_loss": -7.265341758728027, "global_step": 199773, "epoch": 4756} {"train_loss": -7.210689544677734, "global_step": 199774, "epoch": 4756} {"train_loss": -7.260255813598633, "global_step": 199775, "epoch": 4756} {"train_loss": -7.2403998374938965, "global_step": 199776, "epoch": 4756} {"train_loss": -7.159635543823242, "global_step": 199777, "epoch": 4756} {"train_loss": -7.1246232986450195, "global_step": 199778, "epoch": 4756} {"train_loss": -7.197022914886475, "global_step": 199779, "epoch": 4756} {"train_loss": -7.214660167694092, "global_step": 199780, "epoch": 4756} {"train_loss": -7.32332181930542, "global_step": 199781, "epoch": 4756} {"train_loss": -7.142164707183838, "global_step": 199782, "epoch": 4756} {"train_loss": -7.218686103820801, "global_step": 199783, "epoch": 4756} {"train_loss": -7.329683303833008, "global_step": 199784, "epoch": 4756} {"train_loss": -7.140692234039307, "global_step": 199785, "epoch": 4756} {"train_loss": -7.125580787658691, "global_step": 199786, "epoch": 4756} {"train_loss": -7.153225421905518, "global_step": 199787, "epoch": 4756} {"train_loss": -7.183663368225098, "global_step": 199788, "epoch": 4756} {"train_loss": -7.138757228851318, "global_step": 199789, "epoch": 4756} {"train_loss": -7.1069135665893555, "global_step": 199790, "epoch": 4756} {"train_loss": -7.091571807861328, "global_step": 199791, "epoch": 4756} {"train_loss": -6.980534553527832, "global_step": 199792, "epoch": 4756} {"train_loss": -7.195617721194313, "global_step": 199793, "epoch": 4756, "val_loss": 69006.890625} {"train_loss": -7.108922958374023, "global_step": 199794, "epoch": 4757} {"train_loss": -7.087900161743164, "global_step": 199795, "epoch": 4757} {"train_loss": -7.301301956176758, "global_step": 199796, "epoch": 4757} {"train_loss": -7.184762954711914, "global_step": 199797, "epoch": 4757} {"train_loss": -7.239629745483398, "global_step": 199798, "epoch": 4757} {"train_loss": -7.226072311401367, "global_step": 199799, "epoch": 4757} {"train_loss": -7.315986156463623, "global_step": 199800, "epoch": 4757} {"train_loss": -7.295478343963623, "global_step": 199801, "epoch": 4757} {"train_loss": -7.265134334564209, "global_step": 199802, "epoch": 4757} {"train_loss": -7.3312458992004395, "global_step": 199803, "epoch": 4757} {"train_loss": -7.3169779777526855, "global_step": 199804, "epoch": 4757} {"train_loss": -7.281309127807617, "global_step": 199805, "epoch": 4757} {"train_loss": -7.222290992736816, "global_step": 199806, "epoch": 4757} {"train_loss": -7.308623790740967, "global_step": 199807, "epoch": 4757} {"train_loss": -7.238376617431641, "global_step": 199808, "epoch": 4757} {"train_loss": -7.21293830871582, "global_step": 199809, "epoch": 4757} {"train_loss": -7.249876499176025, "global_step": 199810, "epoch": 4757} {"train_loss": -7.262123107910156, "global_step": 199811, "epoch": 4757} {"train_loss": -7.367300033569336, "global_step": 199812, "epoch": 4757} {"train_loss": -7.215362548828125, "global_step": 199813, "epoch": 4757} {"train_loss": -7.259774684906006, "global_step": 199814, "epoch": 4757} {"train_loss": -7.212204933166504, "global_step": 199815, "epoch": 4757} {"train_loss": -7.323916912078857, "global_step": 199816, "epoch": 4757} {"train_loss": -7.273357391357422, "global_step": 199817, "epoch": 4757} {"train_loss": -7.1822099685668945, "global_step": 199818, "epoch": 4757} {"train_loss": -7.219623565673828, "global_step": 199819, "epoch": 4757} {"train_loss": -7.216400146484375, "global_step": 199820, "epoch": 4757} {"train_loss": -7.180651664733887, "global_step": 199821, "epoch": 4757} {"train_loss": -7.350915908813477, "global_step": 199822, "epoch": 4757} {"train_loss": -7.184903144836426, "global_step": 199823, "epoch": 4757} {"train_loss": -7.217062950134277, "global_step": 199824, "epoch": 4757} {"train_loss": -7.111247539520264, "global_step": 199825, "epoch": 4757} {"train_loss": -7.222259044647217, "global_step": 199826, "epoch": 4757} {"train_loss": -7.286195278167725, "global_step": 199827, "epoch": 4757} {"train_loss": -7.18715238571167, "global_step": 199828, "epoch": 4757} {"train_loss": -7.301365852355957, "global_step": 199829, "epoch": 4757} {"train_loss": -7.134703636169434, "global_step": 199830, "epoch": 4757} {"train_loss": -7.303091049194336, "global_step": 199831, "epoch": 4757} {"train_loss": -7.175638198852539, "global_step": 199832, "epoch": 4757} {"train_loss": -7.208563327789307, "global_step": 199833, "epoch": 4757} {"train_loss": -7.070422172546387, "global_step": 199834, "epoch": 4757} {"train_loss": -7.233246587571644, "global_step": 199835, "epoch": 4757, "val_loss": 68972.796875} {"train_loss": -7.2768449783325195, "global_step": 199836, "epoch": 4758} {"train_loss": -7.252514839172363, "global_step": 199837, "epoch": 4758} {"train_loss": -7.102211952209473, "global_step": 199838, "epoch": 4758} {"train_loss": -7.213347434997559, "global_step": 199839, "epoch": 4758} {"train_loss": -7.272583961486816, "global_step": 199840, "epoch": 4758} {"train_loss": -7.200366497039795, "global_step": 199841, "epoch": 4758} {"train_loss": -7.309123516082764, "global_step": 199842, "epoch": 4758} {"train_loss": -7.274075508117676, "global_step": 199843, "epoch": 4758} {"train_loss": -7.337716102600098, "global_step": 199844, "epoch": 4758} {"train_loss": -7.3154449462890625, "global_step": 199845, "epoch": 4758} {"train_loss": -7.350154876708984, "global_step": 199846, "epoch": 4758} {"train_loss": -7.232935905456543, "global_step": 199847, "epoch": 4758} {"train_loss": -7.1404619216918945, "global_step": 199848, "epoch": 4758} {"train_loss": -7.188877105712891, "global_step": 199849, "epoch": 4758} {"train_loss": -7.281762599945068, "global_step": 199850, "epoch": 4758} {"train_loss": -7.288600444793701, "global_step": 199851, "epoch": 4758} {"train_loss": -7.301863670349121, "global_step": 199852, "epoch": 4758} {"train_loss": -7.282660484313965, "global_step": 199853, "epoch": 4758} {"train_loss": -7.252891540527344, "global_step": 199854, "epoch": 4758} {"train_loss": -7.383194446563721, "global_step": 199855, "epoch": 4758} {"train_loss": -7.299375057220459, "global_step": 199856, "epoch": 4758} {"train_loss": -7.294896602630615, "global_step": 199857, "epoch": 4758} {"train_loss": -7.2079620361328125, "global_step": 199858, "epoch": 4758} {"train_loss": -7.217974662780762, "global_step": 199859, "epoch": 4758} {"train_loss": -7.335668563842773, "global_step": 199860, "epoch": 4758} {"train_loss": -7.2871809005737305, "global_step": 199861, "epoch": 4758} {"train_loss": -7.356936454772949, "global_step": 199862, "epoch": 4758} {"train_loss": -7.274613857269287, "global_step": 199863, "epoch": 4758} {"train_loss": -7.420984268188477, "global_step": 199864, "epoch": 4758} {"train_loss": -7.386188983917236, "global_step": 199865, "epoch": 4758} {"train_loss": -7.311622619628906, "global_step": 199866, "epoch": 4758} {"train_loss": -7.227299690246582, "global_step": 199867, "epoch": 4758} {"train_loss": -7.276708602905273, "global_step": 199868, "epoch": 4758} {"train_loss": -7.2698163986206055, "global_step": 199869, "epoch": 4758} {"train_loss": -7.2567057609558105, "global_step": 199870, "epoch": 4758} {"train_loss": -7.33321475982666, "global_step": 199871, "epoch": 4758} {"train_loss": -7.258193492889404, "global_step": 199872, "epoch": 4758} {"train_loss": -7.243430137634277, "global_step": 199873, "epoch": 4758} {"train_loss": -7.278875350952148, "global_step": 199874, "epoch": 4758} {"train_loss": -7.252922058105469, "global_step": 199875, "epoch": 4758} {"train_loss": -7.20199728012085, "global_step": 199876, "epoch": 4758} {"train_loss": -7.273634388333275, "global_step": 199877, "epoch": 4758, "val_loss": 69204.15625} {"train_loss": -7.274141311645508, "global_step": 199878, "epoch": 4759} {"train_loss": -7.131925582885742, "global_step": 199879, "epoch": 4759} {"train_loss": -7.1862382888793945, "global_step": 199880, "epoch": 4759} {"train_loss": -7.160617351531982, "global_step": 199881, "epoch": 4759} {"train_loss": -7.288177490234375, "global_step": 199882, "epoch": 4759} {"train_loss": -7.093749523162842, "global_step": 199883, "epoch": 4759} {"train_loss": -7.168153762817383, "global_step": 199884, "epoch": 4759} {"train_loss": -7.227834224700928, "global_step": 199885, "epoch": 4759} {"train_loss": -7.137990474700928, "global_step": 199886, "epoch": 4759} {"train_loss": -7.187356948852539, "global_step": 199887, "epoch": 4759} {"train_loss": -7.2040534019470215, "global_step": 199888, "epoch": 4759} {"train_loss": -7.254185676574707, "global_step": 199889, "epoch": 4759} {"train_loss": -7.279879570007324, "global_step": 199890, "epoch": 4759} {"train_loss": -7.1731672286987305, "global_step": 199891, "epoch": 4759} {"train_loss": -7.308958053588867, "global_step": 199892, "epoch": 4759} {"train_loss": -7.138895034790039, "global_step": 199893, "epoch": 4759} {"train_loss": -7.236081123352051, "global_step": 199894, "epoch": 4759} {"train_loss": -7.238020896911621, "global_step": 199895, "epoch": 4759} {"train_loss": -7.309901237487793, "global_step": 199896, "epoch": 4759} {"train_loss": -7.267934799194336, "global_step": 199897, "epoch": 4759} {"train_loss": -7.0457763671875, "global_step": 199898, "epoch": 4759} {"train_loss": -7.174900531768799, "global_step": 199899, "epoch": 4759} {"train_loss": -7.259208679199219, "global_step": 199900, "epoch": 4759} {"train_loss": -7.282570838928223, "global_step": 199901, "epoch": 4759} {"train_loss": -7.22147798538208, "global_step": 199902, "epoch": 4759} {"train_loss": -7.403151512145996, "global_step": 199903, "epoch": 4759} {"train_loss": -7.317629814147949, "global_step": 199904, "epoch": 4759} {"train_loss": -7.190392971038818, "global_step": 199905, "epoch": 4759} {"train_loss": -7.260457992553711, "global_step": 199906, "epoch": 4759} {"train_loss": -7.21519660949707, "global_step": 199907, "epoch": 4759} {"train_loss": -7.298620223999023, "global_step": 199908, "epoch": 4759} {"train_loss": -7.248610973358154, "global_step": 199909, "epoch": 4759} {"train_loss": -7.216268539428711, "global_step": 199910, "epoch": 4759} {"train_loss": -7.322288513183594, "global_step": 199911, "epoch": 4759} {"train_loss": -7.154635429382324, "global_step": 199912, "epoch": 4759} {"train_loss": -7.230485916137695, "global_step": 199913, "epoch": 4759} {"train_loss": -7.381325721740723, "global_step": 199914, "epoch": 4759} {"train_loss": -7.309014797210693, "global_step": 199915, "epoch": 4759} {"train_loss": -7.264369964599609, "global_step": 199916, "epoch": 4759} {"train_loss": -7.227245330810547, "global_step": 199917, "epoch": 4759} {"train_loss": -7.197662353515625, "global_step": 199918, "epoch": 4759} {"train_loss": -7.227496521813529, "global_step": 199919, "epoch": 4759, "val_loss": 69131.9609375} {"train_loss": -7.3840789794921875, "global_step": 199920, "epoch": 4760} {"train_loss": -7.267876625061035, "global_step": 199921, "epoch": 4760} {"train_loss": -7.19499397277832, "global_step": 199922, "epoch": 4760} {"train_loss": -7.006409645080566, "global_step": 199923, "epoch": 4760} {"train_loss": -7.10165548324585, "global_step": 199924, "epoch": 4760} {"train_loss": -7.301215171813965, "global_step": 199925, "epoch": 4760} {"train_loss": -7.165615081787109, "global_step": 199926, "epoch": 4760} {"train_loss": -7.328614234924316, "global_step": 199927, "epoch": 4760} {"train_loss": -7.166318416595459, "global_step": 199928, "epoch": 4760} {"train_loss": -7.193502426147461, "global_step": 199929, "epoch": 4760} {"train_loss": -7.27847957611084, "global_step": 199930, "epoch": 4760} {"train_loss": -7.246046543121338, "global_step": 199931, "epoch": 4760} {"train_loss": -7.262827396392822, "global_step": 199932, "epoch": 4760} {"train_loss": -7.407794952392578, "global_step": 199933, "epoch": 4760} {"train_loss": -7.193506717681885, "global_step": 199934, "epoch": 4760} {"train_loss": -7.2022175788879395, "global_step": 199935, "epoch": 4760} {"train_loss": -7.205002784729004, "global_step": 199936, "epoch": 4760} {"train_loss": -7.174374103546143, "global_step": 199937, "epoch": 4760} {"train_loss": -7.144423007965088, "global_step": 199938, "epoch": 4760} {"train_loss": -7.215701103210449, "global_step": 199939, "epoch": 4760} {"train_loss": -7.2960686683654785, "global_step": 199940, "epoch": 4760} {"train_loss": -7.2354207038879395, "global_step": 199941, "epoch": 4760} {"train_loss": -7.33316707611084, "global_step": 199942, "epoch": 4760} {"train_loss": -7.224861145019531, "global_step": 199943, "epoch": 4760} {"train_loss": -7.2094526290893555, "global_step": 199944, "epoch": 4760} {"train_loss": -7.163882732391357, "global_step": 199945, "epoch": 4760} {"train_loss": -7.134997367858887, "global_step": 199946, "epoch": 4760} {"train_loss": -7.177403450012207, "global_step": 199947, "epoch": 4760} {"train_loss": -7.209680557250977, "global_step": 199948, "epoch": 4760} {"train_loss": -7.195472717285156, "global_step": 199949, "epoch": 4760} {"train_loss": -7.1883649826049805, "global_step": 199950, "epoch": 4760} {"train_loss": -7.190614700317383, "global_step": 199951, "epoch": 4760} {"train_loss": -7.215827465057373, "global_step": 199952, "epoch": 4760} {"train_loss": -7.065612316131592, "global_step": 199953, "epoch": 4760} {"train_loss": -7.154492378234863, "global_step": 199954, "epoch": 4760} {"train_loss": -7.166847229003906, "global_step": 199955, "epoch": 4760} {"train_loss": -7.19195556640625, "global_step": 199956, "epoch": 4760} {"train_loss": -6.953831195831299, "global_step": 199957, "epoch": 4760} {"train_loss": -7.059120178222656, "global_step": 199958, "epoch": 4760} {"train_loss": -7.106142520904541, "global_step": 199959, "epoch": 4760} {"train_loss": -7.090991497039795, "global_step": 199960, "epoch": 4760} {"train_loss": -7.193409749439785, "global_step": 199961, "epoch": 4760, "val_loss": 69186.6015625} {"train_loss": -7.174831867218018, "global_step": 199962, "epoch": 4761} {"train_loss": -7.07191276550293, "global_step": 199963, "epoch": 4761} {"train_loss": -7.103378772735596, "global_step": 199964, "epoch": 4761} {"train_loss": -7.088519096374512, "global_step": 199965, "epoch": 4761} {"train_loss": -7.136641502380371, "global_step": 199966, "epoch": 4761} {"train_loss": -7.118584632873535, "global_step": 199967, "epoch": 4761} {"train_loss": -7.173047065734863, "global_step": 199968, "epoch": 4761} {"train_loss": -7.132110595703125, "global_step": 199969, "epoch": 4761} {"train_loss": -7.118410110473633, "global_step": 199970, "epoch": 4761} {"train_loss": -7.067753791809082, "global_step": 199971, "epoch": 4761} {"train_loss": -7.153902053833008, "global_step": 199972, "epoch": 4761} {"train_loss": -7.207501411437988, "global_step": 199973, "epoch": 4761} {"train_loss": -7.271810531616211, "global_step": 199974, "epoch": 4761} {"train_loss": -7.31027889251709, "global_step": 199975, "epoch": 4761} {"train_loss": -7.235304832458496, "global_step": 199976, "epoch": 4761} {"train_loss": -7.178579807281494, "global_step": 199977, "epoch": 4761} {"train_loss": -7.167591094970703, "global_step": 199978, "epoch": 4761} {"train_loss": -7.116946220397949, "global_step": 199979, "epoch": 4761} {"train_loss": -7.327034950256348, "global_step": 199980, "epoch": 4761} {"train_loss": -7.153964042663574, "global_step": 199981, "epoch": 4761} {"train_loss": -7.2419562339782715, "global_step": 199982, "epoch": 4761} {"train_loss": -7.221186637878418, "global_step": 199983, "epoch": 4761} {"train_loss": -7.177600860595703, "global_step": 199984, "epoch": 4761} {"train_loss": -7.203457355499268, "global_step": 199985, "epoch": 4761} {"train_loss": -7.233654975891113, "global_step": 199986, "epoch": 4761} {"train_loss": -7.129322052001953, "global_step": 199987, "epoch": 4761} {"train_loss": -7.248624801635742, "global_step": 199988, "epoch": 4761} {"train_loss": -7.264671325683594, "global_step": 199989, "epoch": 4761} {"train_loss": -7.189581394195557, "global_step": 199990, "epoch": 4761} {"train_loss": -7.308968544006348, "global_step": 199991, "epoch": 4761} {"train_loss": -7.241941452026367, "global_step": 199992, "epoch": 4761} {"train_loss": -7.229802131652832, "global_step": 199993, "epoch": 4761} {"train_loss": -7.110990047454834, "global_step": 199994, "epoch": 4761} {"train_loss": -7.170719623565674, "global_step": 199995, "epoch": 4761} {"train_loss": -7.193093299865723, "global_step": 199996, "epoch": 4761} {"train_loss": -7.04367208480835, "global_step": 199997, "epoch": 4761} {"train_loss": -7.173551082611084, "global_step": 199998, "epoch": 4761} {"train_loss": -7.225802421569824, "global_step": 199999, "epoch": 4761} {"train_loss": -7.129074573516846, "global_step": 200000, "epoch": 4761} {"train_loss": -7.118529796600342, "global_step": 200001, "epoch": 4761} {"train_loss": -7.138692855834961, "global_step": 200002, "epoch": 4761} {"train_loss": -7.180998802185059, "global_step": 200003, "epoch": 4761, "val_loss": 69349.0390625} {"train_loss": -7.08734130859375, "global_step": 200004, "epoch": 4762} {"train_loss": -7.049261569976807, "global_step": 200005, "epoch": 4762} {"train_loss": -7.127209663391113, "global_step": 200006, "epoch": 4762} {"train_loss": -7.095047950744629, "global_step": 200007, "epoch": 4762} {"train_loss": -7.187441349029541, "global_step": 200008, "epoch": 4762} {"train_loss": -7.146252632141113, "global_step": 200009, "epoch": 4762} {"train_loss": -7.152957439422607, "global_step": 200010, "epoch": 4762} {"train_loss": -7.2287750244140625, "global_step": 200011, "epoch": 4762} {"train_loss": -7.262564659118652, "global_step": 200012, "epoch": 4762} {"train_loss": -7.160247325897217, "global_step": 200013, "epoch": 4762} {"train_loss": -7.217039585113525, "global_step": 200014, "epoch": 4762} {"train_loss": -7.251457691192627, "global_step": 200015, "epoch": 4762} {"train_loss": -7.263766765594482, "global_step": 200016, "epoch": 4762} {"train_loss": -7.318058013916016, "global_step": 200017, "epoch": 4762} {"train_loss": -7.234432220458984, "global_step": 200018, "epoch": 4762} {"train_loss": -7.236180305480957, "global_step": 200019, "epoch": 4762} {"train_loss": -7.290720462799072, "global_step": 200020, "epoch": 4762} {"train_loss": -7.277585029602051, "global_step": 200021, "epoch": 4762} {"train_loss": -7.3032684326171875, "global_step": 200022, "epoch": 4762} {"train_loss": -7.289816856384277, "global_step": 200023, "epoch": 4762} {"train_loss": -7.338717460632324, "global_step": 200024, "epoch": 4762} {"train_loss": -7.1253814697265625, "global_step": 200025, "epoch": 4762} {"train_loss": -7.359387397766113, "global_step": 200026, "epoch": 4762} {"train_loss": -7.334098815917969, "global_step": 200027, "epoch": 4762} {"train_loss": -7.246171951293945, "global_step": 200028, "epoch": 4762} {"train_loss": -7.309064865112305, "global_step": 200029, "epoch": 4762} {"train_loss": -7.276567459106445, "global_step": 200030, "epoch": 4762} {"train_loss": -7.216888904571533, "global_step": 200031, "epoch": 4762} {"train_loss": -7.256214618682861, "global_step": 200032, "epoch": 4762} {"train_loss": -7.281712532043457, "global_step": 200033, "epoch": 4762} {"train_loss": -7.106454849243164, "global_step": 200034, "epoch": 4762} {"train_loss": -7.130709648132324, "global_step": 200035, "epoch": 4762} {"train_loss": -7.226633071899414, "global_step": 200036, "epoch": 4762} {"train_loss": -7.232916831970215, "global_step": 200037, "epoch": 4762} {"train_loss": -7.302977085113525, "global_step": 200038, "epoch": 4762} {"train_loss": -7.222559928894043, "global_step": 200039, "epoch": 4762} {"train_loss": -7.211057662963867, "global_step": 200040, "epoch": 4762} {"train_loss": -7.217742919921875, "global_step": 200041, "epoch": 4762} {"train_loss": -7.405258655548096, "global_step": 200042, "epoch": 4762} {"train_loss": -7.124104022979736, "global_step": 200043, "epoch": 4762} {"train_loss": -7.20651912689209, "global_step": 200044, "epoch": 4762} {"train_loss": -7.229134718577067, "global_step": 200045, "epoch": 4762, "val_loss": 69126.328125} {"train_loss": -7.247711181640625, "global_step": 200046, "epoch": 4763} {"train_loss": -7.191622734069824, "global_step": 200047, "epoch": 4763} {"train_loss": -7.222064971923828, "global_step": 200048, "epoch": 4763} {"train_loss": -7.218959808349609, "global_step": 200049, "epoch": 4763} {"train_loss": -7.243252277374268, "global_step": 200050, "epoch": 4763} {"train_loss": -7.248310089111328, "global_step": 200051, "epoch": 4763} {"train_loss": -7.271958351135254, "global_step": 200052, "epoch": 4763} {"train_loss": -7.310870170593262, "global_step": 200053, "epoch": 4763} {"train_loss": -7.2806854248046875, "global_step": 200054, "epoch": 4763} {"train_loss": -7.132359981536865, "global_step": 200055, "epoch": 4763} {"train_loss": -7.27486515045166, "global_step": 200056, "epoch": 4763} {"train_loss": -7.167959213256836, "global_step": 200057, "epoch": 4763} {"train_loss": -7.202425479888916, "global_step": 200058, "epoch": 4763} {"train_loss": -7.274972915649414, "global_step": 200059, "epoch": 4763} {"train_loss": -7.155900001525879, "global_step": 200060, "epoch": 4763} {"train_loss": -7.210389137268066, "global_step": 200061, "epoch": 4763} {"train_loss": -7.147341728210449, "global_step": 200062, "epoch": 4763} {"train_loss": -7.314063549041748, "global_step": 200063, "epoch": 4763} {"train_loss": -7.339588165283203, "global_step": 200064, "epoch": 4763} {"train_loss": -7.213455677032471, "global_step": 200065, "epoch": 4763} {"train_loss": -7.28892707824707, "global_step": 200066, "epoch": 4763} {"train_loss": -7.301329612731934, "global_step": 200067, "epoch": 4763} {"train_loss": -7.112865447998047, "global_step": 200068, "epoch": 4763} {"train_loss": -7.250316619873047, "global_step": 200069, "epoch": 4763} {"train_loss": -7.265122890472412, "global_step": 200070, "epoch": 4763} {"train_loss": -7.335936546325684, "global_step": 200071, "epoch": 4763} {"train_loss": -7.312108039855957, "global_step": 200072, "epoch": 4763} {"train_loss": -7.273806571960449, "global_step": 200073, "epoch": 4763} {"train_loss": -7.277288436889648, "global_step": 200074, "epoch": 4763} {"train_loss": -7.23164701461792, "global_step": 200075, "epoch": 4763} {"train_loss": -7.238353729248047, "global_step": 200076, "epoch": 4763} {"train_loss": -7.3151164054870605, "global_step": 200077, "epoch": 4763} {"train_loss": -7.236744403839111, "global_step": 200078, "epoch": 4763} {"train_loss": -7.305848598480225, "global_step": 200079, "epoch": 4763} {"train_loss": -7.274338722229004, "global_step": 200080, "epoch": 4763} {"train_loss": -7.236865043640137, "global_step": 200081, "epoch": 4763} {"train_loss": -7.214130878448486, "global_step": 200082, "epoch": 4763} {"train_loss": -7.269783973693848, "global_step": 200083, "epoch": 4763} {"train_loss": -7.352170944213867, "global_step": 200084, "epoch": 4763} {"train_loss": -7.295337677001953, "global_step": 200085, "epoch": 4763} {"train_loss": -7.2974748611450195, "global_step": 200086, "epoch": 4763} {"train_loss": -7.254084473564511, "global_step": 200087, "epoch": 4763, "val_loss": 69048.140625} {"train_loss": -7.3734331130981445, "global_step": 200088, "epoch": 4764} {"train_loss": -7.304042816162109, "global_step": 200089, "epoch": 4764} {"train_loss": -7.235901832580566, "global_step": 200090, "epoch": 4764} {"train_loss": -7.327577114105225, "global_step": 200091, "epoch": 4764} {"train_loss": -7.262394428253174, "global_step": 200092, "epoch": 4764} {"train_loss": -7.205008506774902, "global_step": 200093, "epoch": 4764} {"train_loss": -7.266378402709961, "global_step": 200094, "epoch": 4764} {"train_loss": -7.310840606689453, "global_step": 200095, "epoch": 4764} {"train_loss": -7.193341255187988, "global_step": 200096, "epoch": 4764} {"train_loss": -7.298507213592529, "global_step": 200097, "epoch": 4764} {"train_loss": -7.2504119873046875, "global_step": 200098, "epoch": 4764} {"train_loss": -7.2815656661987305, "global_step": 200099, "epoch": 4764} {"train_loss": -7.195224761962891, "global_step": 200100, "epoch": 4764} {"train_loss": -7.227461814880371, "global_step": 200101, "epoch": 4764} {"train_loss": -7.163851737976074, "global_step": 200102, "epoch": 4764} {"train_loss": -7.115586280822754, "global_step": 200103, "epoch": 4764} {"train_loss": -7.207488059997559, "global_step": 200104, "epoch": 4764} {"train_loss": -7.315851211547852, "global_step": 200105, "epoch": 4764} {"train_loss": -7.140140533447266, "global_step": 200106, "epoch": 4764} {"train_loss": -7.212725639343262, "global_step": 200107, "epoch": 4764} {"train_loss": -7.223588943481445, "global_step": 200108, "epoch": 4764} {"train_loss": -6.993654727935791, "global_step": 200109, "epoch": 4764} {"train_loss": -7.08115291595459, "global_step": 200110, "epoch": 4764} {"train_loss": -7.3158040046691895, "global_step": 200111, "epoch": 4764} {"train_loss": -7.245774745941162, "global_step": 200112, "epoch": 4764} {"train_loss": -7.274220943450928, "global_step": 200113, "epoch": 4764} {"train_loss": -7.3334455490112305, "global_step": 200114, "epoch": 4764} {"train_loss": -7.1845550537109375, "global_step": 200115, "epoch": 4764} {"train_loss": -7.258169174194336, "global_step": 200116, "epoch": 4764} {"train_loss": -7.247514724731445, "global_step": 200117, "epoch": 4764} {"train_loss": -7.250094413757324, "global_step": 200118, "epoch": 4764} {"train_loss": -7.203500270843506, "global_step": 200119, "epoch": 4764} {"train_loss": -7.2259697914123535, "global_step": 200120, "epoch": 4764} {"train_loss": -7.168122291564941, "global_step": 200121, "epoch": 4764} {"train_loss": -7.214869499206543, "global_step": 200122, "epoch": 4764} {"train_loss": -7.248120307922363, "global_step": 200123, "epoch": 4764} {"train_loss": -7.191796779632568, "global_step": 200124, "epoch": 4764} {"train_loss": -7.250426292419434, "global_step": 200125, "epoch": 4764} {"train_loss": -7.163574695587158, "global_step": 200126, "epoch": 4764} {"train_loss": -7.165507793426514, "global_step": 200127, "epoch": 4764} {"train_loss": -7.293697834014893, "global_step": 200128, "epoch": 4764} {"train_loss": -7.228918790817261, "global_step": 200129, "epoch": 4764, "val_loss": 68746.640625} {"train_loss": -7.151148319244385, "global_step": 200130, "epoch": 4765} {"train_loss": -7.22096586227417, "global_step": 200131, "epoch": 4765} {"train_loss": -7.0861358642578125, "global_step": 200132, "epoch": 4765} {"train_loss": -7.1629743576049805, "global_step": 200133, "epoch": 4765} {"train_loss": -7.007737159729004, "global_step": 200134, "epoch": 4765} {"train_loss": -7.024327278137207, "global_step": 200135, "epoch": 4765} {"train_loss": -7.257087230682373, "global_step": 200136, "epoch": 4765} {"train_loss": -7.091242790222168, "global_step": 200137, "epoch": 4765} {"train_loss": -7.159646034240723, "global_step": 200138, "epoch": 4765} {"train_loss": -7.1949920654296875, "global_step": 200139, "epoch": 4765} {"train_loss": -7.261300086975098, "global_step": 200140, "epoch": 4765} {"train_loss": -7.211220741271973, "global_step": 200141, "epoch": 4765} {"train_loss": -7.206506729125977, "global_step": 200142, "epoch": 4765} {"train_loss": -7.2431511878967285, "global_step": 200143, "epoch": 4765} {"train_loss": -7.15665340423584, "global_step": 200144, "epoch": 4765} {"train_loss": -7.17265510559082, "global_step": 200145, "epoch": 4765} {"train_loss": -7.196712493896484, "global_step": 200146, "epoch": 4765} {"train_loss": -7.148540496826172, "global_step": 200147, "epoch": 4765} {"train_loss": -7.261845111846924, "global_step": 200148, "epoch": 4765} {"train_loss": -7.322108745574951, "global_step": 200149, "epoch": 4765} {"train_loss": -7.197751998901367, "global_step": 200150, "epoch": 4765} {"train_loss": -7.260946273803711, "global_step": 200151, "epoch": 4765} {"train_loss": -7.270052909851074, "global_step": 200152, "epoch": 4765} {"train_loss": -7.311737537384033, "global_step": 200153, "epoch": 4765} {"train_loss": -7.248514175415039, "global_step": 200154, "epoch": 4765} {"train_loss": -7.198888301849365, "global_step": 200155, "epoch": 4765} {"train_loss": -7.300424575805664, "global_step": 200156, "epoch": 4765} {"train_loss": -7.236412048339844, "global_step": 200157, "epoch": 4765} {"train_loss": -7.194798946380615, "global_step": 200158, "epoch": 4765} {"train_loss": -7.30257511138916, "global_step": 200159, "epoch": 4765} {"train_loss": -7.277926445007324, "global_step": 200160, "epoch": 4765} {"train_loss": -7.215214252471924, "global_step": 200161, "epoch": 4765} {"train_loss": -7.183252811431885, "global_step": 200162, "epoch": 4765} {"train_loss": -7.361391067504883, "global_step": 200163, "epoch": 4765} {"train_loss": -7.305304527282715, "global_step": 200164, "epoch": 4765} {"train_loss": -7.162799835205078, "global_step": 200165, "epoch": 4765} {"train_loss": -7.201169013977051, "global_step": 200166, "epoch": 4765} {"train_loss": -7.159259796142578, "global_step": 200167, "epoch": 4765} {"train_loss": -7.125572204589844, "global_step": 200168, "epoch": 4765} {"train_loss": -7.243705749511719, "global_step": 200169, "epoch": 4765} {"train_loss": -7.1003289222717285, "global_step": 200170, "epoch": 4765} {"train_loss": -7.203395446141561, "global_step": 200171, "epoch": 4765, "val_loss": 69038.40625} {"train_loss": -7.1943583488464355, "global_step": 200172, "epoch": 4766} {"train_loss": -7.2993903160095215, "global_step": 200173, "epoch": 4766} {"train_loss": -7.2149786949157715, "global_step": 200174, "epoch": 4766} {"train_loss": -7.239575386047363, "global_step": 200175, "epoch": 4766} {"train_loss": -7.294084548950195, "global_step": 200176, "epoch": 4766} {"train_loss": -7.203071594238281, "global_step": 200177, "epoch": 4766} {"train_loss": -7.125782489776611, "global_step": 200178, "epoch": 4766} {"train_loss": -7.210960388183594, "global_step": 200179, "epoch": 4766} {"train_loss": -7.28472900390625, "global_step": 200180, "epoch": 4766} {"train_loss": -7.298532485961914, "global_step": 200181, "epoch": 4766} {"train_loss": -7.211830139160156, "global_step": 200182, "epoch": 4766} {"train_loss": -7.143627166748047, "global_step": 200183, "epoch": 4766} {"train_loss": -7.252946853637695, "global_step": 200184, "epoch": 4766} {"train_loss": -7.2643938064575195, "global_step": 200185, "epoch": 4766} {"train_loss": -7.090936660766602, "global_step": 200186, "epoch": 4766} {"train_loss": -7.248147010803223, "global_step": 200187, "epoch": 4766} {"train_loss": -7.129237174987793, "global_step": 200188, "epoch": 4766} {"train_loss": -7.210929870605469, "global_step": 200189, "epoch": 4766} {"train_loss": -7.195287704467773, "global_step": 200190, "epoch": 4766} {"train_loss": -7.176477432250977, "global_step": 200191, "epoch": 4766} {"train_loss": -7.233102798461914, "global_step": 200192, "epoch": 4766} {"train_loss": -7.267691612243652, "global_step": 200193, "epoch": 4766} {"train_loss": -7.237114906311035, "global_step": 200194, "epoch": 4766} {"train_loss": -7.273194313049316, "global_step": 200195, "epoch": 4766} {"train_loss": -7.177270889282227, "global_step": 200196, "epoch": 4766} {"train_loss": -7.174376964569092, "global_step": 200197, "epoch": 4766} {"train_loss": -7.2758989334106445, "global_step": 200198, "epoch": 4766} {"train_loss": -7.241842269897461, "global_step": 200199, "epoch": 4766} {"train_loss": -7.110359191894531, "global_step": 200200, "epoch": 4766} {"train_loss": -7.29070520401001, "global_step": 200201, "epoch": 4766} {"train_loss": -7.217600345611572, "global_step": 200202, "epoch": 4766} {"train_loss": -7.176387310028076, "global_step": 200203, "epoch": 4766} {"train_loss": -7.168874740600586, "global_step": 200204, "epoch": 4766} {"train_loss": -7.2117390632629395, "global_step": 200205, "epoch": 4766} {"train_loss": -7.186800479888916, "global_step": 200206, "epoch": 4766} {"train_loss": -7.222072601318359, "global_step": 200207, "epoch": 4766} {"train_loss": -7.206023216247559, "global_step": 200208, "epoch": 4766} {"train_loss": -7.114548683166504, "global_step": 200209, "epoch": 4766} {"train_loss": -7.274580001831055, "global_step": 200210, "epoch": 4766} {"train_loss": -7.092410564422607, "global_step": 200211, "epoch": 4766} {"train_loss": -7.16758918762207, "global_step": 200212, "epoch": 4766} {"train_loss": -7.207579896563575, "global_step": 200213, "epoch": 4766, "val_loss": 69003.5859375} {"train_loss": -7.211627006530762, "global_step": 200214, "epoch": 4767} {"train_loss": -7.169891834259033, "global_step": 200215, "epoch": 4767} {"train_loss": -7.188812255859375, "global_step": 200216, "epoch": 4767} {"train_loss": -7.290227890014648, "global_step": 200217, "epoch": 4767} {"train_loss": -7.232239246368408, "global_step": 200218, "epoch": 4767} {"train_loss": -7.153876781463623, "global_step": 200219, "epoch": 4767} {"train_loss": -7.168858528137207, "global_step": 200220, "epoch": 4767} {"train_loss": -7.185207366943359, "global_step": 200221, "epoch": 4767} {"train_loss": -7.093873023986816, "global_step": 200222, "epoch": 4767} {"train_loss": -7.2383131980896, "global_step": 200223, "epoch": 4767} {"train_loss": -7.267337799072266, "global_step": 200224, "epoch": 4767} {"train_loss": -7.178055286407471, "global_step": 200225, "epoch": 4767} {"train_loss": -7.165104866027832, "global_step": 200226, "epoch": 4767} {"train_loss": -7.220745086669922, "global_step": 200227, "epoch": 4767} {"train_loss": -7.228664875030518, "global_step": 200228, "epoch": 4767} {"train_loss": -7.344202995300293, "global_step": 200229, "epoch": 4767} {"train_loss": -7.201895236968994, "global_step": 200230, "epoch": 4767} {"train_loss": -7.163917541503906, "global_step": 200231, "epoch": 4767} {"train_loss": -7.198996067047119, "global_step": 200232, "epoch": 4767} {"train_loss": -7.221255779266357, "global_step": 200233, "epoch": 4767} {"train_loss": -7.242443561553955, "global_step": 200234, "epoch": 4767} {"train_loss": -7.139975547790527, "global_step": 200235, "epoch": 4767} {"train_loss": -7.164966583251953, "global_step": 200236, "epoch": 4767} {"train_loss": -7.06418514251709, "global_step": 200237, "epoch": 4767} {"train_loss": -7.304337024688721, "global_step": 200238, "epoch": 4767} {"train_loss": -7.1003737449646, "global_step": 200239, "epoch": 4767} {"train_loss": -7.150632381439209, "global_step": 200240, "epoch": 4767} {"train_loss": -7.295208930969238, "global_step": 200241, "epoch": 4767} {"train_loss": -7.088510990142822, "global_step": 200242, "epoch": 4767} {"train_loss": -7.277078151702881, "global_step": 200243, "epoch": 4767} {"train_loss": -7.245438575744629, "global_step": 200244, "epoch": 4767} {"train_loss": -7.206830978393555, "global_step": 200245, "epoch": 4767} {"train_loss": -7.236035346984863, "global_step": 200246, "epoch": 4767} {"train_loss": -7.188693046569824, "global_step": 200247, "epoch": 4767} {"train_loss": -7.340770721435547, "global_step": 200248, "epoch": 4767} {"train_loss": -7.209896564483643, "global_step": 200249, "epoch": 4767} {"train_loss": -7.230961799621582, "global_step": 200250, "epoch": 4767} {"train_loss": -7.193187236785889, "global_step": 200251, "epoch": 4767} {"train_loss": -7.139908313751221, "global_step": 200252, "epoch": 4767} {"train_loss": -7.320019721984863, "global_step": 200253, "epoch": 4767} {"train_loss": -7.228005409240723, "global_step": 200254, "epoch": 4767} {"train_loss": -7.210438342321487, "global_step": 200255, "epoch": 4767, "val_loss": 69002.9921875} {"train_loss": -7.230738639831543, "global_step": 200256, "epoch": 4768} {"train_loss": -7.198320388793945, "global_step": 200257, "epoch": 4768} {"train_loss": -7.345517158508301, "global_step": 200258, "epoch": 4768} {"train_loss": -7.295538425445557, "global_step": 200259, "epoch": 4768} {"train_loss": -7.313309192657471, "global_step": 200260, "epoch": 4768} {"train_loss": -7.287690162658691, "global_step": 200261, "epoch": 4768} {"train_loss": -7.247278213500977, "global_step": 200262, "epoch": 4768} {"train_loss": -7.320760726928711, "global_step": 200263, "epoch": 4768} {"train_loss": -7.2492475509643555, "global_step": 200264, "epoch": 4768} {"train_loss": -7.204499244689941, "global_step": 200265, "epoch": 4768} {"train_loss": -7.375749588012695, "global_step": 200266, "epoch": 4768} {"train_loss": -7.32843017578125, "global_step": 200267, "epoch": 4768} {"train_loss": -7.226860523223877, "global_step": 200268, "epoch": 4768} {"train_loss": -7.281998634338379, "global_step": 200269, "epoch": 4768} {"train_loss": -7.309950351715088, "global_step": 200270, "epoch": 4768} {"train_loss": -7.115493297576904, "global_step": 200271, "epoch": 4768} {"train_loss": -7.340645790100098, "global_step": 200272, "epoch": 4768} {"train_loss": -7.356050491333008, "global_step": 200273, "epoch": 4768} {"train_loss": -7.2243971824646, "global_step": 200274, "epoch": 4768} {"train_loss": -7.3711748123168945, "global_step": 200275, "epoch": 4768} {"train_loss": -7.292181968688965, "global_step": 200276, "epoch": 4768} {"train_loss": -7.3729166984558105, "global_step": 200277, "epoch": 4768} {"train_loss": -7.314666748046875, "global_step": 200278, "epoch": 4768} {"train_loss": -7.342033386230469, "global_step": 200279, "epoch": 4768} {"train_loss": -7.280467987060547, "global_step": 200280, "epoch": 4768} {"train_loss": -7.305929183959961, "global_step": 200281, "epoch": 4768} {"train_loss": -7.307304859161377, "global_step": 200282, "epoch": 4768} {"train_loss": -7.265057563781738, "global_step": 200283, "epoch": 4768} {"train_loss": -7.251575946807861, "global_step": 200284, "epoch": 4768} {"train_loss": -7.232685089111328, "global_step": 200285, "epoch": 4768} {"train_loss": -7.293401718139648, "global_step": 200286, "epoch": 4768} {"train_loss": -7.339962005615234, "global_step": 200287, "epoch": 4768} {"train_loss": -7.286867618560791, "global_step": 200288, "epoch": 4768} {"train_loss": -7.102693557739258, "global_step": 200289, "epoch": 4768} {"train_loss": -7.19129753112793, "global_step": 200290, "epoch": 4768} {"train_loss": -7.380434989929199, "global_step": 200291, "epoch": 4768} {"train_loss": -7.231473445892334, "global_step": 200292, "epoch": 4768} {"train_loss": -7.268322944641113, "global_step": 200293, "epoch": 4768} {"train_loss": -7.250319480895996, "global_step": 200294, "epoch": 4768} {"train_loss": -7.355650901794434, "global_step": 200295, "epoch": 4768} {"train_loss": -7.325741767883301, "global_step": 200296, "epoch": 4768} {"train_loss": -7.2823517095474966, "global_step": 200297, "epoch": 4768, "val_loss": 69021.71875} {"train_loss": -7.155218124389648, "global_step": 200298, "epoch": 4769} {"train_loss": -7.2807416915893555, "global_step": 200299, "epoch": 4769} {"train_loss": -7.270411968231201, "global_step": 200300, "epoch": 4769} {"train_loss": -7.252397537231445, "global_step": 200301, "epoch": 4769} {"train_loss": -7.324117660522461, "global_step": 200302, "epoch": 4769} {"train_loss": -7.239868640899658, "global_step": 200303, "epoch": 4769} {"train_loss": -7.163442611694336, "global_step": 200304, "epoch": 4769} {"train_loss": -7.073596000671387, "global_step": 200305, "epoch": 4769} {"train_loss": -7.258964538574219, "global_step": 200306, "epoch": 4769} {"train_loss": -7.1709089279174805, "global_step": 200307, "epoch": 4769} {"train_loss": -7.116950035095215, "global_step": 200308, "epoch": 4769} {"train_loss": -7.291557312011719, "global_step": 200309, "epoch": 4769} {"train_loss": -7.124750137329102, "global_step": 200310, "epoch": 4769} {"train_loss": -7.1200480461120605, "global_step": 200311, "epoch": 4769} {"train_loss": -7.2878851890563965, "global_step": 200312, "epoch": 4769} {"train_loss": -7.247085094451904, "global_step": 200313, "epoch": 4769} {"train_loss": -7.151487350463867, "global_step": 200314, "epoch": 4769} {"train_loss": -7.246726989746094, "global_step": 200315, "epoch": 4769} {"train_loss": -7.107364654541016, "global_step": 200316, "epoch": 4769} {"train_loss": -7.294220924377441, "global_step": 200317, "epoch": 4769} {"train_loss": -7.281289100646973, "global_step": 200318, "epoch": 4769} {"train_loss": -7.241852283477783, "global_step": 200319, "epoch": 4769} {"train_loss": -7.180935382843018, "global_step": 200320, "epoch": 4769} {"train_loss": -7.163352012634277, "global_step": 200321, "epoch": 4769} {"train_loss": -7.163375377655029, "global_step": 200322, "epoch": 4769} {"train_loss": -7.12867546081543, "global_step": 200323, "epoch": 4769} {"train_loss": -7.188346862792969, "global_step": 200324, "epoch": 4769} {"train_loss": -7.196384429931641, "global_step": 200325, "epoch": 4769} {"train_loss": -7.109487533569336, "global_step": 200326, "epoch": 4769} {"train_loss": -7.171671390533447, "global_step": 200327, "epoch": 4769} {"train_loss": -7.201510429382324, "global_step": 200328, "epoch": 4769} {"train_loss": -7.286118507385254, "global_step": 200329, "epoch": 4769} {"train_loss": -7.157191276550293, "global_step": 200330, "epoch": 4769} {"train_loss": -7.190375804901123, "global_step": 200331, "epoch": 4769} {"train_loss": -7.1579670906066895, "global_step": 200332, "epoch": 4769} {"train_loss": -7.323821544647217, "global_step": 200333, "epoch": 4769} {"train_loss": -7.192232131958008, "global_step": 200334, "epoch": 4769} {"train_loss": -7.140654563903809, "global_step": 200335, "epoch": 4769} {"train_loss": -7.344425678253174, "global_step": 200336, "epoch": 4769} {"train_loss": -7.284039497375488, "global_step": 200337, "epoch": 4769} {"train_loss": -7.20689582824707, "global_step": 200338, "epoch": 4769} {"train_loss": -7.206762245723179, "global_step": 200339, "epoch": 4769, "val_loss": 68966.3515625} {"train_loss": -7.195459365844727, "global_step": 200340, "epoch": 4770} {"train_loss": -7.236597061157227, "global_step": 200341, "epoch": 4770} {"train_loss": -7.227473735809326, "global_step": 200342, "epoch": 4770} {"train_loss": -7.298672199249268, "global_step": 200343, "epoch": 4770} {"train_loss": -7.24370002746582, "global_step": 200344, "epoch": 4770} {"train_loss": -7.242086410522461, "global_step": 200345, "epoch": 4770} {"train_loss": -7.206573009490967, "global_step": 200346, "epoch": 4770} {"train_loss": -7.156625270843506, "global_step": 200347, "epoch": 4770} {"train_loss": -7.11031436920166, "global_step": 200348, "epoch": 4770} {"train_loss": -7.144455909729004, "global_step": 200349, "epoch": 4770} {"train_loss": -7.193459987640381, "global_step": 200350, "epoch": 4770} {"train_loss": -7.1760454177856445, "global_step": 200351, "epoch": 4770} {"train_loss": -7.205864906311035, "global_step": 200352, "epoch": 4770} {"train_loss": -7.285726547241211, "global_step": 200353, "epoch": 4770} {"train_loss": -7.180537223815918, "global_step": 200354, "epoch": 4770} {"train_loss": -7.212971210479736, "global_step": 200355, "epoch": 4770} {"train_loss": -7.198358535766602, "global_step": 200356, "epoch": 4770} {"train_loss": -7.221427917480469, "global_step": 200357, "epoch": 4770} {"train_loss": -7.241765975952148, "global_step": 200358, "epoch": 4770} {"train_loss": -7.113030910491943, "global_step": 200359, "epoch": 4770} {"train_loss": -7.149309158325195, "global_step": 200360, "epoch": 4770} {"train_loss": -7.083063125610352, "global_step": 200361, "epoch": 4770} {"train_loss": -7.089272499084473, "global_step": 200362, "epoch": 4770} {"train_loss": -7.056552410125732, "global_step": 200363, "epoch": 4770} {"train_loss": -7.089392185211182, "global_step": 200364, "epoch": 4770} {"train_loss": -7.149847507476807, "global_step": 200365, "epoch": 4770} {"train_loss": -7.024811744689941, "global_step": 200366, "epoch": 4770} {"train_loss": -7.188508987426758, "global_step": 200367, "epoch": 4770} {"train_loss": -7.0968499183654785, "global_step": 200368, "epoch": 4770} {"train_loss": -7.033168792724609, "global_step": 200369, "epoch": 4770} {"train_loss": -7.191256523132324, "global_step": 200370, "epoch": 4770} {"train_loss": -7.074944019317627, "global_step": 200371, "epoch": 4770} {"train_loss": -6.968996047973633, "global_step": 200372, "epoch": 4770} {"train_loss": -7.092578411102295, "global_step": 200373, "epoch": 4770} {"train_loss": -7.059418201446533, "global_step": 200374, "epoch": 4770} {"train_loss": -7.04682731628418, "global_step": 200375, "epoch": 4770} {"train_loss": -7.0203938484191895, "global_step": 200376, "epoch": 4770} {"train_loss": -7.151615619659424, "global_step": 200377, "epoch": 4770} {"train_loss": -7.133666038513184, "global_step": 200378, "epoch": 4770} {"train_loss": -7.140571594238281, "global_step": 200379, "epoch": 4770} {"train_loss": -7.1151628494262695, "global_step": 200380, "epoch": 4770} {"train_loss": -7.143812168212164, "global_step": 200381, "epoch": 4770, "val_loss": 69183.3203125} {"train_loss": -7.070465087890625, "global_step": 200382, "epoch": 4771} {"train_loss": -7.145607948303223, "global_step": 200383, "epoch": 4771} {"train_loss": -7.073577880859375, "global_step": 200384, "epoch": 4771} {"train_loss": -7.0684285163879395, "global_step": 200385, "epoch": 4771} {"train_loss": -7.125120162963867, "global_step": 200386, "epoch": 4771} {"train_loss": -6.987174034118652, "global_step": 200387, "epoch": 4771} {"train_loss": -7.179093360900879, "global_step": 200388, "epoch": 4771} {"train_loss": -7.233846187591553, "global_step": 200389, "epoch": 4771} {"train_loss": -7.10858678817749, "global_step": 200390, "epoch": 4771} {"train_loss": -7.128217697143555, "global_step": 200391, "epoch": 4771} {"train_loss": -7.097761154174805, "global_step": 200392, "epoch": 4771} {"train_loss": -7.255640983581543, "global_step": 200393, "epoch": 4771} {"train_loss": -7.191442489624023, "global_step": 200394, "epoch": 4771} {"train_loss": -7.140746116638184, "global_step": 200395, "epoch": 4771} {"train_loss": -7.2038726806640625, "global_step": 200396, "epoch": 4771} {"train_loss": -7.284252166748047, "global_step": 200397, "epoch": 4771} {"train_loss": -7.163139820098877, "global_step": 200398, "epoch": 4771} {"train_loss": -7.214039325714111, "global_step": 200399, "epoch": 4771} {"train_loss": -7.158703804016113, "global_step": 200400, "epoch": 4771} {"train_loss": -7.264545440673828, "global_step": 200401, "epoch": 4771} {"train_loss": -7.213392734527588, "global_step": 200402, "epoch": 4771} {"train_loss": -7.215312957763672, "global_step": 200403, "epoch": 4771} {"train_loss": -7.349485397338867, "global_step": 200404, "epoch": 4771} {"train_loss": -7.280489921569824, "global_step": 200405, "epoch": 4771} {"train_loss": -7.233989715576172, "global_step": 200406, "epoch": 4771} {"train_loss": -7.211714744567871, "global_step": 200407, "epoch": 4771} {"train_loss": -7.199739456176758, "global_step": 200408, "epoch": 4771} {"train_loss": -7.269265174865723, "global_step": 200409, "epoch": 4771} {"train_loss": -7.352636337280273, "global_step": 200410, "epoch": 4771} {"train_loss": -7.313027381896973, "global_step": 200411, "epoch": 4771} {"train_loss": -7.374937057495117, "global_step": 200412, "epoch": 4771} {"train_loss": -7.333230972290039, "global_step": 200413, "epoch": 4771} {"train_loss": -7.27931022644043, "global_step": 200414, "epoch": 4771} {"train_loss": -7.354917049407959, "global_step": 200415, "epoch": 4771} {"train_loss": -7.371426582336426, "global_step": 200416, "epoch": 4771} {"train_loss": -7.320380210876465, "global_step": 200417, "epoch": 4771} {"train_loss": -7.3824262619018555, "global_step": 200418, "epoch": 4771} {"train_loss": -7.342115879058838, "global_step": 200419, "epoch": 4771} {"train_loss": -7.325132369995117, "global_step": 200420, "epoch": 4771} {"train_loss": -7.237534046173096, "global_step": 200421, "epoch": 4771} {"train_loss": -7.219309329986572, "global_step": 200422, "epoch": 4771} {"train_loss": -7.228411118189494, "global_step": 200423, "epoch": 4771, "val_loss": 69259.6953125} {"train_loss": -7.207077980041504, "global_step": 200424, "epoch": 4772} {"train_loss": -7.253795623779297, "global_step": 200425, "epoch": 4772} {"train_loss": -7.289325714111328, "global_step": 200426, "epoch": 4772} {"train_loss": -7.169348239898682, "global_step": 200427, "epoch": 4772} {"train_loss": -7.2494587898254395, "global_step": 200428, "epoch": 4772} {"train_loss": -7.106287479400635, "global_step": 200429, "epoch": 4772} {"train_loss": -7.080817699432373, "global_step": 200430, "epoch": 4772} {"train_loss": -7.214361190795898, "global_step": 200431, "epoch": 4772} {"train_loss": -7.211823463439941, "global_step": 200432, "epoch": 4772} {"train_loss": -7.1155500411987305, "global_step": 200433, "epoch": 4772} {"train_loss": -7.265372276306152, "global_step": 200434, "epoch": 4772} {"train_loss": -7.226977348327637, "global_step": 200435, "epoch": 4772} {"train_loss": -7.126779556274414, "global_step": 200436, "epoch": 4772} {"train_loss": -7.074885368347168, "global_step": 200437, "epoch": 4772} {"train_loss": -7.121325492858887, "global_step": 200438, "epoch": 4772} {"train_loss": -7.164955139160156, "global_step": 200439, "epoch": 4772} {"train_loss": -7.177711486816406, "global_step": 200440, "epoch": 4772} {"train_loss": -7.187510013580322, "global_step": 200441, "epoch": 4772} {"train_loss": -6.984165191650391, "global_step": 200442, "epoch": 4772} {"train_loss": -7.24763298034668, "global_step": 200443, "epoch": 4772} {"train_loss": -6.94690465927124, "global_step": 200444, "epoch": 4772} {"train_loss": -7.204392910003662, "global_step": 200445, "epoch": 4772} {"train_loss": -7.142602920532227, "global_step": 200446, "epoch": 4772} {"train_loss": -7.124685287475586, "global_step": 200447, "epoch": 4772} {"train_loss": -7.1691083908081055, "global_step": 200448, "epoch": 4772} {"train_loss": -7.139244556427002, "global_step": 200449, "epoch": 4772} {"train_loss": -7.150918006896973, "global_step": 200450, "epoch": 4772} {"train_loss": -7.06427001953125, "global_step": 200451, "epoch": 4772} {"train_loss": -7.137317657470703, "global_step": 200452, "epoch": 4772} {"train_loss": -7.160904884338379, "global_step": 200453, "epoch": 4772} {"train_loss": -7.14637565612793, "global_step": 200454, "epoch": 4772} {"train_loss": -7.119980812072754, "global_step": 200455, "epoch": 4772} {"train_loss": -7.170613765716553, "global_step": 200456, "epoch": 4772} {"train_loss": -7.139728546142578, "global_step": 200457, "epoch": 4772} {"train_loss": -7.169422149658203, "global_step": 200458, "epoch": 4772} {"train_loss": -7.089719772338867, "global_step": 200459, "epoch": 4772} {"train_loss": -7.162889003753662, "global_step": 200460, "epoch": 4772} {"train_loss": -7.187013626098633, "global_step": 200461, "epoch": 4772} {"train_loss": -7.08848762512207, "global_step": 200462, "epoch": 4772} {"train_loss": -7.1615729331970215, "global_step": 200463, "epoch": 4772} {"train_loss": -7.189373016357422, "global_step": 200464, "epoch": 4772} {"train_loss": -7.15387301217942, "global_step": 200465, "epoch": 4772, "val_loss": 69029.09375} {"train_loss": -7.187886714935303, "global_step": 200466, "epoch": 4773} {"train_loss": -7.166248321533203, "global_step": 200467, "epoch": 4773} {"train_loss": -7.050899505615234, "global_step": 200468, "epoch": 4773} {"train_loss": -7.13497257232666, "global_step": 200469, "epoch": 4773} {"train_loss": -7.157772064208984, "global_step": 200470, "epoch": 4773} {"train_loss": -7.102514266967773, "global_step": 200471, "epoch": 4773} {"train_loss": -7.351693630218506, "global_step": 200472, "epoch": 4773} {"train_loss": -7.190097808837891, "global_step": 200473, "epoch": 4773} {"train_loss": -6.9967803955078125, "global_step": 200474, "epoch": 4773} {"train_loss": -7.3123884201049805, "global_step": 200475, "epoch": 4773} {"train_loss": -7.093361854553223, "global_step": 200476, "epoch": 4773} {"train_loss": -7.207561492919922, "global_step": 200477, "epoch": 4773} {"train_loss": -7.122158050537109, "global_step": 200478, "epoch": 4773} {"train_loss": -7.097599983215332, "global_step": 200479, "epoch": 4773} {"train_loss": -7.239990234375, "global_step": 200480, "epoch": 4773} {"train_loss": -7.14335298538208, "global_step": 200481, "epoch": 4773} {"train_loss": -7.171392440795898, "global_step": 200482, "epoch": 4773} {"train_loss": -7.189634323120117, "global_step": 200483, "epoch": 4773} {"train_loss": -7.198345184326172, "global_step": 200484, "epoch": 4773} {"train_loss": -7.025188446044922, "global_step": 200485, "epoch": 4773} {"train_loss": -7.128620624542236, "global_step": 200486, "epoch": 4773} {"train_loss": -7.221314907073975, "global_step": 200487, "epoch": 4773} {"train_loss": -7.1959428787231445, "global_step": 200488, "epoch": 4773} {"train_loss": -6.968756675720215, "global_step": 200489, "epoch": 4773} {"train_loss": -7.222564697265625, "global_step": 200490, "epoch": 4773} {"train_loss": -7.115914344787598, "global_step": 200491, "epoch": 4773} {"train_loss": -7.219967842102051, "global_step": 200492, "epoch": 4773} {"train_loss": -7.225559234619141, "global_step": 200493, "epoch": 4773} {"train_loss": -7.137241840362549, "global_step": 200494, "epoch": 4773} {"train_loss": -7.218601226806641, "global_step": 200495, "epoch": 4773} {"train_loss": -7.164466857910156, "global_step": 200496, "epoch": 4773} {"train_loss": -7.112565040588379, "global_step": 200497, "epoch": 4773} {"train_loss": -7.175107955932617, "global_step": 200498, "epoch": 4773} {"train_loss": -7.162838935852051, "global_step": 200499, "epoch": 4773} {"train_loss": -7.281856536865234, "global_step": 200500, "epoch": 4773} {"train_loss": -7.149923324584961, "global_step": 200501, "epoch": 4773} {"train_loss": -7.329724311828613, "global_step": 200502, "epoch": 4773} {"train_loss": -7.217513084411621, "global_step": 200503, "epoch": 4773} {"train_loss": -7.177458763122559, "global_step": 200504, "epoch": 4773} {"train_loss": -7.269321441650391, "global_step": 200505, "epoch": 4773} {"train_loss": -7.125310897827148, "global_step": 200506, "epoch": 4773} {"train_loss": -7.171985898699079, "global_step": 200507, "epoch": 4773, "val_loss": 68903.2890625} {"train_loss": -7.292801856994629, "global_step": 200508, "epoch": 4774} {"train_loss": -7.278581619262695, "global_step": 200509, "epoch": 4774} {"train_loss": -7.097804546356201, "global_step": 200510, "epoch": 4774} {"train_loss": -7.261932373046875, "global_step": 200511, "epoch": 4774} {"train_loss": -7.265562534332275, "global_step": 200512, "epoch": 4774} {"train_loss": -7.265811920166016, "global_step": 200513, "epoch": 4774} {"train_loss": -7.177701473236084, "global_step": 200514, "epoch": 4774} {"train_loss": -7.246926307678223, "global_step": 200515, "epoch": 4774} {"train_loss": -7.180923938751221, "global_step": 200516, "epoch": 4774} {"train_loss": -7.232690811157227, "global_step": 200517, "epoch": 4774} {"train_loss": -7.32360315322876, "global_step": 200518, "epoch": 4774} {"train_loss": -7.324370861053467, "global_step": 200519, "epoch": 4774} {"train_loss": -7.342215061187744, "global_step": 200520, "epoch": 4774} {"train_loss": -7.335943222045898, "global_step": 200521, "epoch": 4774} {"train_loss": -7.31643009185791, "global_step": 200522, "epoch": 4774} {"train_loss": -7.372079849243164, "global_step": 200523, "epoch": 4774} {"train_loss": -7.237920761108398, "global_step": 200524, "epoch": 4774} {"train_loss": -7.239758491516113, "global_step": 200525, "epoch": 4774} {"train_loss": -7.247616291046143, "global_step": 200526, "epoch": 4774} {"train_loss": -7.3029632568359375, "global_step": 200527, "epoch": 4774} {"train_loss": -7.247196197509766, "global_step": 200528, "epoch": 4774} {"train_loss": -7.298791408538818, "global_step": 200529, "epoch": 4774} {"train_loss": -7.236467361450195, "global_step": 200530, "epoch": 4774} {"train_loss": -7.286325454711914, "global_step": 200531, "epoch": 4774} {"train_loss": -7.236865043640137, "global_step": 200532, "epoch": 4774} {"train_loss": -7.285245418548584, "global_step": 200533, "epoch": 4774} {"train_loss": -7.3445940017700195, "global_step": 200534, "epoch": 4774} {"train_loss": -7.16227912902832, "global_step": 200535, "epoch": 4774} {"train_loss": -7.232166290283203, "global_step": 200536, "epoch": 4774} {"train_loss": -7.314566135406494, "global_step": 200537, "epoch": 4774} {"train_loss": -7.216257095336914, "global_step": 200538, "epoch": 4774} {"train_loss": -7.295592308044434, "global_step": 200539, "epoch": 4774} {"train_loss": -7.336610317230225, "global_step": 200540, "epoch": 4774} {"train_loss": -7.341713905334473, "global_step": 200541, "epoch": 4774} {"train_loss": -7.1611738204956055, "global_step": 200542, "epoch": 4774} {"train_loss": -7.271185398101807, "global_step": 200543, "epoch": 4774} {"train_loss": -7.385194301605225, "global_step": 200544, "epoch": 4774} {"train_loss": -7.3180155754089355, "global_step": 200545, "epoch": 4774} {"train_loss": -7.316425323486328, "global_step": 200546, "epoch": 4774} {"train_loss": -7.238364219665527, "global_step": 200547, "epoch": 4774} {"train_loss": -7.3217949867248535, "global_step": 200548, "epoch": 4774} {"train_loss": -7.269832997095017, "global_step": 200549, "epoch": 4774, "val_loss": 69113.9765625} {"train_loss": -7.28861141204834, "global_step": 200550, "epoch": 4775} {"train_loss": -7.148358345031738, "global_step": 200551, "epoch": 4775} {"train_loss": -7.271353244781494, "global_step": 200552, "epoch": 4775} {"train_loss": -7.28450870513916, "global_step": 200553, "epoch": 4775} {"train_loss": -7.190496444702148, "global_step": 200554, "epoch": 4775} {"train_loss": -7.321835517883301, "global_step": 200555, "epoch": 4775} {"train_loss": -7.266793251037598, "global_step": 200556, "epoch": 4775} {"train_loss": -7.327695369720459, "global_step": 200557, "epoch": 4775} {"train_loss": -7.285577297210693, "global_step": 200558, "epoch": 4775} {"train_loss": -7.315332412719727, "global_step": 200559, "epoch": 4775} {"train_loss": -7.368599891662598, "global_step": 200560, "epoch": 4775} {"train_loss": -7.146640777587891, "global_step": 200561, "epoch": 4775} {"train_loss": -7.2206010818481445, "global_step": 200562, "epoch": 4775} {"train_loss": -7.367413520812988, "global_step": 200563, "epoch": 4775} {"train_loss": -7.22210168838501, "global_step": 200564, "epoch": 4775} {"train_loss": -7.307138919830322, "global_step": 200565, "epoch": 4775} {"train_loss": -7.340051651000977, "global_step": 200566, "epoch": 4775} {"train_loss": -7.235939025878906, "global_step": 200567, "epoch": 4775} {"train_loss": -7.324596405029297, "global_step": 200568, "epoch": 4775} {"train_loss": -7.337197780609131, "global_step": 200569, "epoch": 4775} {"train_loss": -7.196293830871582, "global_step": 200570, "epoch": 4775} {"train_loss": -7.418777942657471, "global_step": 200571, "epoch": 4775} {"train_loss": -7.219555377960205, "global_step": 200572, "epoch": 4775} {"train_loss": -7.167818069458008, "global_step": 200573, "epoch": 4775} {"train_loss": -7.163185119628906, "global_step": 200574, "epoch": 4775} {"train_loss": -7.358559608459473, "global_step": 200575, "epoch": 4775} {"train_loss": -7.180243015289307, "global_step": 200576, "epoch": 4775} {"train_loss": -7.2054033279418945, "global_step": 200577, "epoch": 4775} {"train_loss": -7.2172956466674805, "global_step": 200578, "epoch": 4775} {"train_loss": -7.289565086364746, "global_step": 200579, "epoch": 4775} {"train_loss": -7.177882194519043, "global_step": 200580, "epoch": 4775} {"train_loss": -7.242005348205566, "global_step": 200581, "epoch": 4775} {"train_loss": -7.277754783630371, "global_step": 200582, "epoch": 4775} {"train_loss": -7.229372024536133, "global_step": 200583, "epoch": 4775} {"train_loss": -7.05436897277832, "global_step": 200584, "epoch": 4775} {"train_loss": -7.119171619415283, "global_step": 200585, "epoch": 4775} {"train_loss": -7.207119941711426, "global_step": 200586, "epoch": 4775} {"train_loss": -6.984767913818359, "global_step": 200587, "epoch": 4775} {"train_loss": -7.15644645690918, "global_step": 200588, "epoch": 4775} {"train_loss": -7.100247383117676, "global_step": 200589, "epoch": 4775} {"train_loss": -7.125356674194336, "global_step": 200590, "epoch": 4775} {"train_loss": -7.233851251148042, "global_step": 200591, "epoch": 4775, "val_loss": 69162.734375} {"train_loss": -7.233319282531738, "global_step": 200592, "epoch": 4776} {"train_loss": -7.168158054351807, "global_step": 200593, "epoch": 4776} {"train_loss": -7.167268753051758, "global_step": 200594, "epoch": 4776} {"train_loss": -7.172824859619141, "global_step": 200595, "epoch": 4776} {"train_loss": -7.192240238189697, "global_step": 200596, "epoch": 4776} {"train_loss": -7.145830154418945, "global_step": 200597, "epoch": 4776} {"train_loss": -7.248037338256836, "global_step": 200598, "epoch": 4776} {"train_loss": -7.187819004058838, "global_step": 200599, "epoch": 4776} {"train_loss": -7.186655044555664, "global_step": 200600, "epoch": 4776} {"train_loss": -7.2831902503967285, "global_step": 200601, "epoch": 4776} {"train_loss": -7.079461097717285, "global_step": 200602, "epoch": 4776} {"train_loss": -7.229809284210205, "global_step": 200603, "epoch": 4776} {"train_loss": -7.101937770843506, "global_step": 200604, "epoch": 4776} {"train_loss": -7.288271903991699, "global_step": 200605, "epoch": 4776} {"train_loss": -7.224024772644043, "global_step": 200606, "epoch": 4776} {"train_loss": -7.276889324188232, "global_step": 200607, "epoch": 4776} {"train_loss": -7.1397905349731445, "global_step": 200608, "epoch": 4776} {"train_loss": -7.182807922363281, "global_step": 200609, "epoch": 4776} {"train_loss": -7.248833656311035, "global_step": 200610, "epoch": 4776} {"train_loss": -7.248486518859863, "global_step": 200611, "epoch": 4776} {"train_loss": -7.27109432220459, "global_step": 200612, "epoch": 4776} {"train_loss": -7.2089104652404785, "global_step": 200613, "epoch": 4776} {"train_loss": -7.197856903076172, "global_step": 200614, "epoch": 4776} {"train_loss": -7.277904510498047, "global_step": 200615, "epoch": 4776} {"train_loss": -7.165335655212402, "global_step": 200616, "epoch": 4776} {"train_loss": -7.246981620788574, "global_step": 200617, "epoch": 4776} {"train_loss": -7.2757158279418945, "global_step": 200618, "epoch": 4776} {"train_loss": -7.141417503356934, "global_step": 200619, "epoch": 4776} {"train_loss": -7.329106330871582, "global_step": 200620, "epoch": 4776} {"train_loss": -7.201649188995361, "global_step": 200621, "epoch": 4776} {"train_loss": -7.105142593383789, "global_step": 200622, "epoch": 4776} {"train_loss": -7.245804786682129, "global_step": 200623, "epoch": 4776} {"train_loss": -7.277491569519043, "global_step": 200624, "epoch": 4776} {"train_loss": -7.153899192810059, "global_step": 200625, "epoch": 4776} {"train_loss": -7.385960578918457, "global_step": 200626, "epoch": 4776} {"train_loss": -7.1266584396362305, "global_step": 200627, "epoch": 4776} {"train_loss": -7.18782377243042, "global_step": 200628, "epoch": 4776} {"train_loss": -7.275735855102539, "global_step": 200629, "epoch": 4776} {"train_loss": -7.268268585205078, "global_step": 200630, "epoch": 4776} {"train_loss": -7.220747470855713, "global_step": 200631, "epoch": 4776} {"train_loss": -7.134791374206543, "global_step": 200632, "epoch": 4776} {"train_loss": -7.215103058587937, "global_step": 200633, "epoch": 4776, "val_loss": 69014.2578125} {"train_loss": -7.326661109924316, "global_step": 200634, "epoch": 4777} {"train_loss": -7.206438064575195, "global_step": 200635, "epoch": 4777} {"train_loss": -7.275788307189941, "global_step": 200636, "epoch": 4777} {"train_loss": -7.174805164337158, "global_step": 200637, "epoch": 4777} {"train_loss": -7.282061576843262, "global_step": 200638, "epoch": 4777} {"train_loss": -7.266457557678223, "global_step": 200639, "epoch": 4777} {"train_loss": -7.3203020095825195, "global_step": 200640, "epoch": 4777} {"train_loss": -7.215837478637695, "global_step": 200641, "epoch": 4777} {"train_loss": -7.20560884475708, "global_step": 200642, "epoch": 4777} {"train_loss": -7.272476673126221, "global_step": 200643, "epoch": 4777} {"train_loss": -7.207544326782227, "global_step": 200644, "epoch": 4777} {"train_loss": -7.295346260070801, "global_step": 200645, "epoch": 4777} {"train_loss": -7.239066123962402, "global_step": 200646, "epoch": 4777} {"train_loss": -7.221770763397217, "global_step": 200647, "epoch": 4777} {"train_loss": -7.317711353302002, "global_step": 200648, "epoch": 4777} {"train_loss": -7.332579612731934, "global_step": 200649, "epoch": 4777} {"train_loss": -7.266300678253174, "global_step": 200650, "epoch": 4777} {"train_loss": -7.347294807434082, "global_step": 200651, "epoch": 4777} {"train_loss": -7.317636489868164, "global_step": 200652, "epoch": 4777} {"train_loss": -7.222901344299316, "global_step": 200653, "epoch": 4777} {"train_loss": -7.25187873840332, "global_step": 200654, "epoch": 4777} {"train_loss": -7.1522440910339355, "global_step": 200655, "epoch": 4777} {"train_loss": -7.367945194244385, "global_step": 200656, "epoch": 4777} {"train_loss": -7.295290946960449, "global_step": 200657, "epoch": 4777} {"train_loss": -7.241289138793945, "global_step": 200658, "epoch": 4777} {"train_loss": -7.32412052154541, "global_step": 200659, "epoch": 4777} {"train_loss": -7.244597434997559, "global_step": 200660, "epoch": 4777} {"train_loss": -7.251284599304199, "global_step": 200661, "epoch": 4777} {"train_loss": -7.160866737365723, "global_step": 200662, "epoch": 4777} {"train_loss": -7.154545783996582, "global_step": 200663, "epoch": 4777} {"train_loss": -7.226263999938965, "global_step": 200664, "epoch": 4777} {"train_loss": -7.274328231811523, "global_step": 200665, "epoch": 4777} {"train_loss": -7.1641387939453125, "global_step": 200666, "epoch": 4777} {"train_loss": -7.2029218673706055, "global_step": 200667, "epoch": 4777} {"train_loss": -7.258052825927734, "global_step": 200668, "epoch": 4777} {"train_loss": -7.248471736907959, "global_step": 200669, "epoch": 4777} {"train_loss": -7.223604679107666, "global_step": 200670, "epoch": 4777} {"train_loss": -7.101650238037109, "global_step": 200671, "epoch": 4777} {"train_loss": -7.208390712738037, "global_step": 200672, "epoch": 4777} {"train_loss": -7.19463586807251, "global_step": 200673, "epoch": 4777} {"train_loss": -7.064108371734619, "global_step": 200674, "epoch": 4777} {"train_loss": -7.240490845271519, "global_step": 200675, "epoch": 4777, "val_loss": 68998.6328125} {"train_loss": -7.158391952514648, "global_step": 200676, "epoch": 4778} {"train_loss": -7.262520790100098, "global_step": 200677, "epoch": 4778} {"train_loss": -7.08583927154541, "global_step": 200678, "epoch": 4778} {"train_loss": -7.263638019561768, "global_step": 200679, "epoch": 4778} {"train_loss": -7.281599998474121, "global_step": 200680, "epoch": 4778} {"train_loss": -7.08725643157959, "global_step": 200681, "epoch": 4778} {"train_loss": -7.306309700012207, "global_step": 200682, "epoch": 4778} {"train_loss": -7.19058895111084, "global_step": 200683, "epoch": 4778} {"train_loss": -7.2710371017456055, "global_step": 200684, "epoch": 4778} {"train_loss": -7.076003551483154, "global_step": 200685, "epoch": 4778} {"train_loss": -7.237184524536133, "global_step": 200686, "epoch": 4778} {"train_loss": -7.144984245300293, "global_step": 200687, "epoch": 4778} {"train_loss": -7.096745014190674, "global_step": 200688, "epoch": 4778} {"train_loss": -7.18870735168457, "global_step": 200689, "epoch": 4778} {"train_loss": -7.181159973144531, "global_step": 200690, "epoch": 4778} {"train_loss": -7.127420425415039, "global_step": 200691, "epoch": 4778} {"train_loss": -7.158479690551758, "global_step": 200692, "epoch": 4778} {"train_loss": -7.117598056793213, "global_step": 200693, "epoch": 4778} {"train_loss": -7.193026542663574, "global_step": 200694, "epoch": 4778} {"train_loss": -7.132559776306152, "global_step": 200695, "epoch": 4778} {"train_loss": -7.141397476196289, "global_step": 200696, "epoch": 4778} {"train_loss": -7.180578231811523, "global_step": 200697, "epoch": 4778} {"train_loss": -7.123430252075195, "global_step": 200698, "epoch": 4778} {"train_loss": -7.236839771270752, "global_step": 200699, "epoch": 4778} {"train_loss": -7.183653831481934, "global_step": 200700, "epoch": 4778} {"train_loss": -7.15875768661499, "global_step": 200701, "epoch": 4778} {"train_loss": -7.236038684844971, "global_step": 200702, "epoch": 4778} {"train_loss": -7.142218589782715, "global_step": 200703, "epoch": 4778} {"train_loss": -7.191471099853516, "global_step": 200704, "epoch": 4778} {"train_loss": -7.1748504638671875, "global_step": 200705, "epoch": 4778} {"train_loss": -7.238788604736328, "global_step": 200706, "epoch": 4778} {"train_loss": -7.118046760559082, "global_step": 200707, "epoch": 4778} {"train_loss": -7.305992603302002, "global_step": 200708, "epoch": 4778} {"train_loss": -7.162262916564941, "global_step": 200709, "epoch": 4778} {"train_loss": -7.119232177734375, "global_step": 200710, "epoch": 4778} {"train_loss": -7.17869758605957, "global_step": 200711, "epoch": 4778} {"train_loss": -7.121625900268555, "global_step": 200712, "epoch": 4778} {"train_loss": -7.14765739440918, "global_step": 200713, "epoch": 4778} {"train_loss": -7.272787570953369, "global_step": 200714, "epoch": 4778} {"train_loss": -7.176578044891357, "global_step": 200715, "epoch": 4778} {"train_loss": -7.025798797607422, "global_step": 200716, "epoch": 4778} {"train_loss": -7.176260232925415, "global_step": 200717, "epoch": 4778, "val_loss": 69095.3359375} {"train_loss": -7.271718978881836, "global_step": 200718, "epoch": 4779} {"train_loss": -7.198465347290039, "global_step": 200719, "epoch": 4779} {"train_loss": -7.226061820983887, "global_step": 200720, "epoch": 4779} {"train_loss": -7.27740478515625, "global_step": 200721, "epoch": 4779} {"train_loss": -7.087815761566162, "global_step": 200722, "epoch": 4779} {"train_loss": -7.161142349243164, "global_step": 200723, "epoch": 4779} {"train_loss": -7.139632225036621, "global_step": 200724, "epoch": 4779} {"train_loss": -7.049551010131836, "global_step": 200725, "epoch": 4779} {"train_loss": -7.230266094207764, "global_step": 200726, "epoch": 4779} {"train_loss": -7.233821392059326, "global_step": 200727, "epoch": 4779} {"train_loss": -7.012781143188477, "global_step": 200728, "epoch": 4779} {"train_loss": -7.09999418258667, "global_step": 200729, "epoch": 4779} {"train_loss": -7.074640274047852, "global_step": 200730, "epoch": 4779} {"train_loss": -7.122061252593994, "global_step": 200731, "epoch": 4779} {"train_loss": -7.158291816711426, "global_step": 200732, "epoch": 4779} {"train_loss": -6.981996059417725, "global_step": 200733, "epoch": 4779} {"train_loss": -7.268064498901367, "global_step": 200734, "epoch": 4779} {"train_loss": -7.0757341384887695, "global_step": 200735, "epoch": 4779} {"train_loss": -7.266260147094727, "global_step": 200736, "epoch": 4779} {"train_loss": -7.224085807800293, "global_step": 200737, "epoch": 4779} {"train_loss": -7.216888427734375, "global_step": 200738, "epoch": 4779} {"train_loss": -7.133154392242432, "global_step": 200739, "epoch": 4779} {"train_loss": -7.200038909912109, "global_step": 200740, "epoch": 4779} {"train_loss": -7.172868728637695, "global_step": 200741, "epoch": 4779} {"train_loss": -7.221423149108887, "global_step": 200742, "epoch": 4779} {"train_loss": -7.281147480010986, "global_step": 200743, "epoch": 4779} {"train_loss": -7.241267681121826, "global_step": 200744, "epoch": 4779} {"train_loss": -7.347291469573975, "global_step": 200745, "epoch": 4779} {"train_loss": -7.301024436950684, "global_step": 200746, "epoch": 4779} {"train_loss": -7.384828567504883, "global_step": 200747, "epoch": 4779} {"train_loss": -7.259297847747803, "global_step": 200748, "epoch": 4779} {"train_loss": -7.217554569244385, "global_step": 200749, "epoch": 4779} {"train_loss": -7.302929401397705, "global_step": 200750, "epoch": 4779} {"train_loss": -7.311800003051758, "global_step": 200751, "epoch": 4779} {"train_loss": -7.290513038635254, "global_step": 200752, "epoch": 4779} {"train_loss": -7.250821113586426, "global_step": 200753, "epoch": 4779} {"train_loss": -7.297460556030273, "global_step": 200754, "epoch": 4779} {"train_loss": -7.261347770690918, "global_step": 200755, "epoch": 4779} {"train_loss": -7.25033712387085, "global_step": 200756, "epoch": 4779} {"train_loss": -7.385529518127441, "global_step": 200757, "epoch": 4779} {"train_loss": -7.337835788726807, "global_step": 200758, "epoch": 4779} {"train_loss": -7.214558521906535, "global_step": 200759, "epoch": 4779, "val_loss": 69205.90625} {"train_loss": -7.138507843017578, "global_step": 200760, "epoch": 4780} {"train_loss": -7.224464416503906, "global_step": 200761, "epoch": 4780} {"train_loss": -7.289429664611816, "global_step": 200762, "epoch": 4780} {"train_loss": -7.289316177368164, "global_step": 200763, "epoch": 4780} {"train_loss": -7.320497989654541, "global_step": 200764, "epoch": 4780} {"train_loss": -7.165340423583984, "global_step": 200765, "epoch": 4780} {"train_loss": -7.381035804748535, "global_step": 200766, "epoch": 4780} {"train_loss": -7.240196228027344, "global_step": 200767, "epoch": 4780} {"train_loss": -7.318878173828125, "global_step": 200768, "epoch": 4780} {"train_loss": -7.178164482116699, "global_step": 200769, "epoch": 4780} {"train_loss": -7.282591819763184, "global_step": 200770, "epoch": 4780} {"train_loss": -7.300265312194824, "global_step": 200771, "epoch": 4780} {"train_loss": -7.268357276916504, "global_step": 200772, "epoch": 4780} {"train_loss": -7.258070945739746, "global_step": 200773, "epoch": 4780} {"train_loss": -7.274984836578369, "global_step": 200774, "epoch": 4780} {"train_loss": -7.308777332305908, "global_step": 200775, "epoch": 4780} {"train_loss": -7.206267833709717, "global_step": 200776, "epoch": 4780} {"train_loss": -7.194052696228027, "global_step": 200777, "epoch": 4780} {"train_loss": -7.225870609283447, "global_step": 200778, "epoch": 4780} {"train_loss": -7.28939151763916, "global_step": 200779, "epoch": 4780} {"train_loss": -7.05349063873291, "global_step": 200780, "epoch": 4780} {"train_loss": -7.23328971862793, "global_step": 200781, "epoch": 4780} {"train_loss": -7.026620864868164, "global_step": 200782, "epoch": 4780} {"train_loss": -7.171056270599365, "global_step": 200783, "epoch": 4780} {"train_loss": -7.091263771057129, "global_step": 200784, "epoch": 4780} {"train_loss": -7.039401531219482, "global_step": 200785, "epoch": 4780} {"train_loss": -7.266568660736084, "global_step": 200786, "epoch": 4780} {"train_loss": -7.071366310119629, "global_step": 200787, "epoch": 4780} {"train_loss": -7.1660566329956055, "global_step": 200788, "epoch": 4780} {"train_loss": -7.23938512802124, "global_step": 200789, "epoch": 4780} {"train_loss": -7.125738143920898, "global_step": 200790, "epoch": 4780} {"train_loss": -7.242305755615234, "global_step": 200791, "epoch": 4780} {"train_loss": -7.272387504577637, "global_step": 200792, "epoch": 4780} {"train_loss": -7.2178802490234375, "global_step": 200793, "epoch": 4780} {"train_loss": -7.055601596832275, "global_step": 200794, "epoch": 4780} {"train_loss": -7.271582126617432, "global_step": 200795, "epoch": 4780} {"train_loss": -7.108623027801514, "global_step": 200796, "epoch": 4780} {"train_loss": -7.2116804122924805, "global_step": 200797, "epoch": 4780} {"train_loss": -7.218963146209717, "global_step": 200798, "epoch": 4780} {"train_loss": -7.239437103271484, "global_step": 200799, "epoch": 4780} {"train_loss": -7.170137405395508, "global_step": 200800, "epoch": 4780} {"train_loss": -7.209810132072086, "global_step": 200801, "epoch": 4780, "val_loss": 68834.046875} {"train_loss": -7.328390121459961, "global_step": 200802, "epoch": 4781} {"train_loss": -7.298666954040527, "global_step": 200803, "epoch": 4781} {"train_loss": -7.323835372924805, "global_step": 200804, "epoch": 4781} {"train_loss": -7.155452728271484, "global_step": 200805, "epoch": 4781} {"train_loss": -7.326859474182129, "global_step": 200806, "epoch": 4781} {"train_loss": -7.3173933029174805, "global_step": 200807, "epoch": 4781} {"train_loss": -7.307805061340332, "global_step": 200808, "epoch": 4781} {"train_loss": -7.28214168548584, "global_step": 200809, "epoch": 4781} {"train_loss": -7.172133445739746, "global_step": 200810, "epoch": 4781} {"train_loss": -7.3119096755981445, "global_step": 200811, "epoch": 4781} {"train_loss": -7.313933372497559, "global_step": 200812, "epoch": 4781} {"train_loss": -7.282663345336914, "global_step": 200813, "epoch": 4781} {"train_loss": -7.391676902770996, "global_step": 200814, "epoch": 4781} {"train_loss": -7.259300231933594, "global_step": 200815, "epoch": 4781} {"train_loss": -7.265730857849121, "global_step": 200816, "epoch": 4781} {"train_loss": -7.23386812210083, "global_step": 200817, "epoch": 4781} {"train_loss": -7.319070816040039, "global_step": 200818, "epoch": 4781} {"train_loss": -7.194622039794922, "global_step": 200819, "epoch": 4781} {"train_loss": -7.227361679077148, "global_step": 200820, "epoch": 4781} {"train_loss": -7.30491828918457, "global_step": 200821, "epoch": 4781} {"train_loss": -7.2864789962768555, "global_step": 200822, "epoch": 4781} {"train_loss": -7.215675354003906, "global_step": 200823, "epoch": 4781} {"train_loss": -7.275752067565918, "global_step": 200824, "epoch": 4781} {"train_loss": -7.315038204193115, "global_step": 200825, "epoch": 4781} {"train_loss": -7.207474231719971, "global_step": 200826, "epoch": 4781} {"train_loss": -7.301212310791016, "global_step": 200827, "epoch": 4781} {"train_loss": -7.250688076019287, "global_step": 200828, "epoch": 4781} {"train_loss": -7.348465919494629, "global_step": 200829, "epoch": 4781} {"train_loss": -7.160282135009766, "global_step": 200830, "epoch": 4781} {"train_loss": -7.257364273071289, "global_step": 200831, "epoch": 4781} {"train_loss": -7.269482612609863, "global_step": 200832, "epoch": 4781} {"train_loss": -7.198728561401367, "global_step": 200833, "epoch": 4781} {"train_loss": -7.260798454284668, "global_step": 200834, "epoch": 4781} {"train_loss": -7.2529296875, "global_step": 200835, "epoch": 4781} {"train_loss": -7.179324626922607, "global_step": 200836, "epoch": 4781} {"train_loss": -7.410011291503906, "global_step": 200837, "epoch": 4781} {"train_loss": -7.234047889709473, "global_step": 200838, "epoch": 4781} {"train_loss": -7.152090072631836, "global_step": 200839, "epoch": 4781} {"train_loss": -7.36336612701416, "global_step": 200840, "epoch": 4781} {"train_loss": -7.218449115753174, "global_step": 200841, "epoch": 4781} {"train_loss": -7.307716369628906, "global_step": 200842, "epoch": 4781} {"train_loss": -7.270685377575102, "global_step": 200843, "epoch": 4781, "val_loss": 69054.359375} {"train_loss": -7.357112407684326, "global_step": 200844, "epoch": 4782} {"train_loss": -7.263948440551758, "global_step": 200845, "epoch": 4782} {"train_loss": -7.353401184082031, "global_step": 200846, "epoch": 4782} {"train_loss": -7.482768535614014, "global_step": 200847, "epoch": 4782} {"train_loss": -7.293941974639893, "global_step": 200848, "epoch": 4782} {"train_loss": -7.271762371063232, "global_step": 200849, "epoch": 4782} {"train_loss": -7.217248916625977, "global_step": 200850, "epoch": 4782} {"train_loss": -7.190446853637695, "global_step": 200851, "epoch": 4782} {"train_loss": -7.1645355224609375, "global_step": 200852, "epoch": 4782} {"train_loss": -7.177521705627441, "global_step": 200853, "epoch": 4782} {"train_loss": -7.197098731994629, "global_step": 200854, "epoch": 4782} {"train_loss": -7.189182281494141, "global_step": 200855, "epoch": 4782} {"train_loss": -7.1176347732543945, "global_step": 200856, "epoch": 4782} {"train_loss": -7.175236225128174, "global_step": 200857, "epoch": 4782} {"train_loss": -7.292814254760742, "global_step": 200858, "epoch": 4782} {"train_loss": -7.286163330078125, "global_step": 200859, "epoch": 4782} {"train_loss": -7.182132720947266, "global_step": 200860, "epoch": 4782} {"train_loss": -7.227758884429932, "global_step": 200861, "epoch": 4782} {"train_loss": -7.21867561340332, "global_step": 200862, "epoch": 4782} {"train_loss": -7.254459381103516, "global_step": 200863, "epoch": 4782} {"train_loss": -7.247167587280273, "global_step": 200864, "epoch": 4782} {"train_loss": -7.2194671630859375, "global_step": 200865, "epoch": 4782} {"train_loss": -7.308817386627197, "global_step": 200866, "epoch": 4782} {"train_loss": -7.358813285827637, "global_step": 200867, "epoch": 4782} {"train_loss": -7.173455238342285, "global_step": 200868, "epoch": 4782} {"train_loss": -7.299862384796143, "global_step": 200869, "epoch": 4782} {"train_loss": -7.147705078125, "global_step": 200870, "epoch": 4782} {"train_loss": -7.266024589538574, "global_step": 200871, "epoch": 4782} {"train_loss": -7.336186408996582, "global_step": 200872, "epoch": 4782} {"train_loss": -7.134045124053955, "global_step": 200873, "epoch": 4782} {"train_loss": -7.134103775024414, "global_step": 200874, "epoch": 4782} {"train_loss": -7.294036865234375, "global_step": 200875, "epoch": 4782} {"train_loss": -7.1605024337768555, "global_step": 200876, "epoch": 4782} {"train_loss": -7.228851795196533, "global_step": 200877, "epoch": 4782} {"train_loss": -7.20255708694458, "global_step": 200878, "epoch": 4782} {"train_loss": -7.088095664978027, "global_step": 200879, "epoch": 4782} {"train_loss": -7.1249589920043945, "global_step": 200880, "epoch": 4782} {"train_loss": -7.338250160217285, "global_step": 200881, "epoch": 4782} {"train_loss": -7.144534111022949, "global_step": 200882, "epoch": 4782} {"train_loss": -7.3470869064331055, "global_step": 200883, "epoch": 4782} {"train_loss": -7.171640872955322, "global_step": 200884, "epoch": 4782} {"train_loss": -7.2357882885705855, "global_step": 200885, "epoch": 4782, "val_loss": 69193.6875} {"train_loss": -7.1762237548828125, "global_step": 200886, "epoch": 4783} {"train_loss": -7.365468502044678, "global_step": 200887, "epoch": 4783} {"train_loss": -7.2921295166015625, "global_step": 200888, "epoch": 4783} {"train_loss": -7.214704513549805, "global_step": 200889, "epoch": 4783} {"train_loss": -7.254383087158203, "global_step": 200890, "epoch": 4783} {"train_loss": -7.2899017333984375, "global_step": 200891, "epoch": 4783} {"train_loss": -7.191072463989258, "global_step": 200892, "epoch": 4783} {"train_loss": -7.265737533569336, "global_step": 200893, "epoch": 4783} {"train_loss": -7.162365436553955, "global_step": 200894, "epoch": 4783} {"train_loss": -7.16512393951416, "global_step": 200895, "epoch": 4783} {"train_loss": -7.206399917602539, "global_step": 200896, "epoch": 4783} {"train_loss": -7.155518054962158, "global_step": 200897, "epoch": 4783} {"train_loss": -7.272618770599365, "global_step": 200898, "epoch": 4783} {"train_loss": -7.320499897003174, "global_step": 200899, "epoch": 4783} {"train_loss": -7.228392601013184, "global_step": 200900, "epoch": 4783} {"train_loss": -7.267085552215576, "global_step": 200901, "epoch": 4783} {"train_loss": -7.338155746459961, "global_step": 200902, "epoch": 4783} {"train_loss": -7.176860809326172, "global_step": 200903, "epoch": 4783} {"train_loss": -7.187204360961914, "global_step": 200904, "epoch": 4783} {"train_loss": -7.279951572418213, "global_step": 200905, "epoch": 4783} {"train_loss": -7.193441867828369, "global_step": 200906, "epoch": 4783} {"train_loss": -7.300762176513672, "global_step": 200907, "epoch": 4783} {"train_loss": -7.253599166870117, "global_step": 200908, "epoch": 4783} {"train_loss": -7.144157409667969, "global_step": 200909, "epoch": 4783} {"train_loss": -7.291912078857422, "global_step": 200910, "epoch": 4783} {"train_loss": -7.265590667724609, "global_step": 200911, "epoch": 4783} {"train_loss": -7.270098686218262, "global_step": 200912, "epoch": 4783} {"train_loss": -7.202282905578613, "global_step": 200913, "epoch": 4783} {"train_loss": -7.293267726898193, "global_step": 200914, "epoch": 4783} {"train_loss": -7.434338569641113, "global_step": 200915, "epoch": 4783} {"train_loss": -7.222428321838379, "global_step": 200916, "epoch": 4783} {"train_loss": -7.190433502197266, "global_step": 200917, "epoch": 4783} {"train_loss": -7.30693244934082, "global_step": 200918, "epoch": 4783} {"train_loss": -7.273494720458984, "global_step": 200919, "epoch": 4783} {"train_loss": -7.315989017486572, "global_step": 200920, "epoch": 4783} {"train_loss": -7.179632186889648, "global_step": 200921, "epoch": 4783} {"train_loss": -7.150204181671143, "global_step": 200922, "epoch": 4783} {"train_loss": -7.295980930328369, "global_step": 200923, "epoch": 4783} {"train_loss": -7.296744346618652, "global_step": 200924, "epoch": 4783} {"train_loss": -7.3407182693481445, "global_step": 200925, "epoch": 4783} {"train_loss": -7.2753400802612305, "global_step": 200926, "epoch": 4783} {"train_loss": -7.250821726662772, "global_step": 200927, "epoch": 4783, "val_loss": 69105.2890625} {"train_loss": -7.403500080108643, "global_step": 200928, "epoch": 4784} {"train_loss": -7.368920803070068, "global_step": 200929, "epoch": 4784} {"train_loss": -7.374597549438477, "global_step": 200930, "epoch": 4784} {"train_loss": -7.296466827392578, "global_step": 200931, "epoch": 4784} {"train_loss": -7.268664360046387, "global_step": 200932, "epoch": 4784} {"train_loss": -7.192227363586426, "global_step": 200933, "epoch": 4784} {"train_loss": -7.191627502441406, "global_step": 200934, "epoch": 4784} {"train_loss": -7.226903915405273, "global_step": 200935, "epoch": 4784} {"train_loss": -7.059351921081543, "global_step": 200936, "epoch": 4784} {"train_loss": -7.161337852478027, "global_step": 200937, "epoch": 4784} {"train_loss": -7.228260040283203, "global_step": 200938, "epoch": 4784} {"train_loss": -7.192000389099121, "global_step": 200939, "epoch": 4784} {"train_loss": -7.323205471038818, "global_step": 200940, "epoch": 4784} {"train_loss": -7.244746208190918, "global_step": 200941, "epoch": 4784} {"train_loss": -7.259849548339844, "global_step": 200942, "epoch": 4784} {"train_loss": -7.231146812438965, "global_step": 200943, "epoch": 4784} {"train_loss": -7.462536811828613, "global_step": 200944, "epoch": 4784} {"train_loss": -7.295253276824951, "global_step": 200945, "epoch": 4784} {"train_loss": -7.345874786376953, "global_step": 200946, "epoch": 4784} {"train_loss": -7.226296424865723, "global_step": 200947, "epoch": 4784} {"train_loss": -7.1956963539123535, "global_step": 200948, "epoch": 4784} {"train_loss": -7.262796878814697, "global_step": 200949, "epoch": 4784} {"train_loss": -7.275318145751953, "global_step": 200950, "epoch": 4784} {"train_loss": -7.266695022583008, "global_step": 200951, "epoch": 4784} {"train_loss": -7.225687026977539, "global_step": 200952, "epoch": 4784} {"train_loss": -7.263769149780273, "global_step": 200953, "epoch": 4784} {"train_loss": -7.287528038024902, "global_step": 200954, "epoch": 4784} {"train_loss": -7.293075084686279, "global_step": 200955, "epoch": 4784} {"train_loss": -7.194950580596924, "global_step": 200956, "epoch": 4784} {"train_loss": -7.223511695861816, "global_step": 200957, "epoch": 4784} {"train_loss": -7.193633079528809, "global_step": 200958, "epoch": 4784} {"train_loss": -7.293150901794434, "global_step": 200959, "epoch": 4784} {"train_loss": -7.224628448486328, "global_step": 200960, "epoch": 4784} {"train_loss": -7.242711544036865, "global_step": 200961, "epoch": 4784} {"train_loss": -7.160052299499512, "global_step": 200962, "epoch": 4784} {"train_loss": -7.249545097351074, "global_step": 200963, "epoch": 4784} {"train_loss": -7.197052001953125, "global_step": 200964, "epoch": 4784} {"train_loss": -7.130239486694336, "global_step": 200965, "epoch": 4784} {"train_loss": -7.181212902069092, "global_step": 200966, "epoch": 4784} {"train_loss": -7.352309226989746, "global_step": 200967, "epoch": 4784} {"train_loss": -7.316457748413086, "global_step": 200968, "epoch": 4784} {"train_loss": -7.253129504975819, "global_step": 200969, "epoch": 4784, "val_loss": 69073.9453125} {"train_loss": -7.276686191558838, "global_step": 200970, "epoch": 4785} {"train_loss": -7.166855335235596, "global_step": 200971, "epoch": 4785} {"train_loss": -7.1010332107543945, "global_step": 200972, "epoch": 4785} {"train_loss": -7.236163139343262, "global_step": 200973, "epoch": 4785} {"train_loss": -7.297603607177734, "global_step": 200974, "epoch": 4785} {"train_loss": -7.239860534667969, "global_step": 200975, "epoch": 4785} {"train_loss": -7.201632976531982, "global_step": 200976, "epoch": 4785} {"train_loss": -7.143803596496582, "global_step": 200977, "epoch": 4785} {"train_loss": -7.195466995239258, "global_step": 200978, "epoch": 4785} {"train_loss": -7.150399684906006, "global_step": 200979, "epoch": 4785} {"train_loss": -7.059548377990723, "global_step": 200980, "epoch": 4785} {"train_loss": -6.971616744995117, "global_step": 200981, "epoch": 4785} {"train_loss": -7.2282609939575195, "global_step": 200982, "epoch": 4785} {"train_loss": -7.107001304626465, "global_step": 200983, "epoch": 4785} {"train_loss": -7.131711959838867, "global_step": 200984, "epoch": 4785} {"train_loss": -7.235708236694336, "global_step": 200985, "epoch": 4785} {"train_loss": -7.073633193969727, "global_step": 200986, "epoch": 4785} {"train_loss": -7.158829212188721, "global_step": 200987, "epoch": 4785} {"train_loss": -7.186954021453857, "global_step": 200988, "epoch": 4785} {"train_loss": -7.220797538757324, "global_step": 200989, "epoch": 4785} {"train_loss": -7.211400985717773, "global_step": 200990, "epoch": 4785} {"train_loss": -7.083198070526123, "global_step": 200991, "epoch": 4785} {"train_loss": -7.13424015045166, "global_step": 200992, "epoch": 4785} {"train_loss": -7.222961902618408, "global_step": 200993, "epoch": 4785} {"train_loss": -7.215685844421387, "global_step": 200994, "epoch": 4785} {"train_loss": -7.26395320892334, "global_step": 200995, "epoch": 4785} {"train_loss": -7.2033257484436035, "global_step": 200996, "epoch": 4785} {"train_loss": -7.212677001953125, "global_step": 200997, "epoch": 4785} {"train_loss": -7.238007545471191, "global_step": 200998, "epoch": 4785} {"train_loss": -7.197652816772461, "global_step": 200999, "epoch": 4785} {"train_loss": -7.32547664642334, "global_step": 201000, "epoch": 4785} {"train_loss": -7.096819877624512, "global_step": 201001, "epoch": 4785} {"train_loss": -7.2257585525512695, "global_step": 201002, "epoch": 4785} {"train_loss": -7.308204650878906, "global_step": 201003, "epoch": 4785} {"train_loss": -7.245444297790527, "global_step": 201004, "epoch": 4785} {"train_loss": -7.238713264465332, "global_step": 201005, "epoch": 4785} {"train_loss": -7.295507431030273, "global_step": 201006, "epoch": 4785} {"train_loss": -7.2607574462890625, "global_step": 201007, "epoch": 4785} {"train_loss": -7.292295455932617, "global_step": 201008, "epoch": 4785} {"train_loss": -7.268495559692383, "global_step": 201009, "epoch": 4785} {"train_loss": -7.182069778442383, "global_step": 201010, "epoch": 4785} {"train_loss": -7.1962101345970515, "global_step": 201011, "epoch": 4785, "val_loss": 69027.8828125} {"train_loss": -7.207098007202148, "global_step": 201012, "epoch": 4786} {"train_loss": -7.202146530151367, "global_step": 201013, "epoch": 4786} {"train_loss": -7.2743096351623535, "global_step": 201014, "epoch": 4786} {"train_loss": -7.165895462036133, "global_step": 201015, "epoch": 4786} {"train_loss": -7.335475921630859, "global_step": 201016, "epoch": 4786} {"train_loss": -7.290164947509766, "global_step": 201017, "epoch": 4786} {"train_loss": -7.398697853088379, "global_step": 201018, "epoch": 4786} {"train_loss": -7.175882339477539, "global_step": 201019, "epoch": 4786} {"train_loss": -7.181546688079834, "global_step": 201020, "epoch": 4786} {"train_loss": -7.287113189697266, "global_step": 201021, "epoch": 4786} {"train_loss": -7.224850654602051, "global_step": 201022, "epoch": 4786} {"train_loss": -7.278475761413574, "global_step": 201023, "epoch": 4786} {"train_loss": -7.18042516708374, "global_step": 201024, "epoch": 4786} {"train_loss": -7.120326995849609, "global_step": 201025, "epoch": 4786} {"train_loss": -7.283503532409668, "global_step": 201026, "epoch": 4786} {"train_loss": -7.336604595184326, "global_step": 201027, "epoch": 4786} {"train_loss": -7.132077693939209, "global_step": 201028, "epoch": 4786} {"train_loss": -7.254297256469727, "global_step": 201029, "epoch": 4786} {"train_loss": -7.272710800170898, "global_step": 201030, "epoch": 4786} {"train_loss": -7.115827560424805, "global_step": 201031, "epoch": 4786} {"train_loss": -7.25560188293457, "global_step": 201032, "epoch": 4786} {"train_loss": -7.36882209777832, "global_step": 201033, "epoch": 4786} {"train_loss": -7.196176052093506, "global_step": 201034, "epoch": 4786} {"train_loss": -7.207493782043457, "global_step": 201035, "epoch": 4786} {"train_loss": -7.27990198135376, "global_step": 201036, "epoch": 4786} {"train_loss": -7.1892991065979, "global_step": 201037, "epoch": 4786} {"train_loss": -7.183184623718262, "global_step": 201038, "epoch": 4786} {"train_loss": -7.360712051391602, "global_step": 201039, "epoch": 4786} {"train_loss": -7.285019874572754, "global_step": 201040, "epoch": 4786} {"train_loss": -7.342731475830078, "global_step": 201041, "epoch": 4786} {"train_loss": -7.245335578918457, "global_step": 201042, "epoch": 4786} {"train_loss": -7.200501918792725, "global_step": 201043, "epoch": 4786} {"train_loss": -7.358394622802734, "global_step": 201044, "epoch": 4786} {"train_loss": -7.230548858642578, "global_step": 201045, "epoch": 4786} {"train_loss": -7.230255126953125, "global_step": 201046, "epoch": 4786} {"train_loss": -7.310120582580566, "global_step": 201047, "epoch": 4786} {"train_loss": -7.203900337219238, "global_step": 201048, "epoch": 4786} {"train_loss": -7.253655433654785, "global_step": 201049, "epoch": 4786} {"train_loss": -7.21045446395874, "global_step": 201050, "epoch": 4786} {"train_loss": -7.203775882720947, "global_step": 201051, "epoch": 4786} {"train_loss": -7.234484672546387, "global_step": 201052, "epoch": 4786} {"train_loss": -7.243447871435256, "global_step": 201053, "epoch": 4786, "val_loss": 69065.359375} {"train_loss": -7.233656406402588, "global_step": 201054, "epoch": 4787} {"train_loss": -7.288999557495117, "global_step": 201055, "epoch": 4787} {"train_loss": -7.317897796630859, "global_step": 201056, "epoch": 4787} {"train_loss": -7.279583930969238, "global_step": 201057, "epoch": 4787} {"train_loss": -7.340615272521973, "global_step": 201058, "epoch": 4787} {"train_loss": -7.2082719802856445, "global_step": 201059, "epoch": 4787} {"train_loss": -7.303979873657227, "global_step": 201060, "epoch": 4787} {"train_loss": -7.337979793548584, "global_step": 201061, "epoch": 4787} {"train_loss": -7.266213893890381, "global_step": 201062, "epoch": 4787} {"train_loss": -7.3098554611206055, "global_step": 201063, "epoch": 4787} {"train_loss": -7.29158878326416, "global_step": 201064, "epoch": 4787} {"train_loss": -7.356039047241211, "global_step": 201065, "epoch": 4787} {"train_loss": -7.313093662261963, "global_step": 201066, "epoch": 4787} {"train_loss": -7.309221267700195, "global_step": 201067, "epoch": 4787} {"train_loss": -7.261004447937012, "global_step": 201068, "epoch": 4787} {"train_loss": -7.235847473144531, "global_step": 201069, "epoch": 4787} {"train_loss": -7.118832588195801, "global_step": 201070, "epoch": 4787} {"train_loss": -7.189996242523193, "global_step": 201071, "epoch": 4787} {"train_loss": -7.212696075439453, "global_step": 201072, "epoch": 4787} {"train_loss": -6.988304138183594, "global_step": 201073, "epoch": 4787} {"train_loss": -7.148736000061035, "global_step": 201074, "epoch": 4787} {"train_loss": -7.210104942321777, "global_step": 201075, "epoch": 4787} {"train_loss": -7.040973663330078, "global_step": 201076, "epoch": 4787} {"train_loss": -7.041913032531738, "global_step": 201077, "epoch": 4787} {"train_loss": -7.110342979431152, "global_step": 201078, "epoch": 4787} {"train_loss": -7.142880439758301, "global_step": 201079, "epoch": 4787} {"train_loss": -7.136935710906982, "global_step": 201080, "epoch": 4787} {"train_loss": -7.192085266113281, "global_step": 201081, "epoch": 4787} {"train_loss": -7.093135833740234, "global_step": 201082, "epoch": 4787} {"train_loss": -7.201332092285156, "global_step": 201083, "epoch": 4787} {"train_loss": -7.149986267089844, "global_step": 201084, "epoch": 4787} {"train_loss": -7.060798645019531, "global_step": 201085, "epoch": 4787} {"train_loss": -7.094220161437988, "global_step": 201086, "epoch": 4787} {"train_loss": -7.135002136230469, "global_step": 201087, "epoch": 4787} {"train_loss": -7.114453315734863, "global_step": 201088, "epoch": 4787} {"train_loss": -7.079998016357422, "global_step": 201089, "epoch": 4787} {"train_loss": -7.087406158447266, "global_step": 201090, "epoch": 4787} {"train_loss": -7.144811630249023, "global_step": 201091, "epoch": 4787} {"train_loss": -7.113772392272949, "global_step": 201092, "epoch": 4787} {"train_loss": -6.997006416320801, "global_step": 201093, "epoch": 4787} {"train_loss": -7.1262712478637695, "global_step": 201094, "epoch": 4787} {"train_loss": -7.182585614068167, "global_step": 201095, "epoch": 4787, "val_loss": 69084.59375} {"train_loss": -7.102126121520996, "global_step": 201096, "epoch": 4788} {"train_loss": -7.105605125427246, "global_step": 201097, "epoch": 4788} {"train_loss": -7.135504722595215, "global_step": 201098, "epoch": 4788} {"train_loss": -7.208603382110596, "global_step": 201099, "epoch": 4788} {"train_loss": -7.130563735961914, "global_step": 201100, "epoch": 4788} {"train_loss": -7.128268241882324, "global_step": 201101, "epoch": 4788} {"train_loss": -7.171540260314941, "global_step": 201102, "epoch": 4788} {"train_loss": -7.024288177490234, "global_step": 201103, "epoch": 4788} {"train_loss": -7.178167343139648, "global_step": 201104, "epoch": 4788} {"train_loss": -7.279498100280762, "global_step": 201105, "epoch": 4788} {"train_loss": -7.1839280128479, "global_step": 201106, "epoch": 4788} {"train_loss": -7.056469440460205, "global_step": 201107, "epoch": 4788} {"train_loss": -7.158571243286133, "global_step": 201108, "epoch": 4788} {"train_loss": -7.141292572021484, "global_step": 201109, "epoch": 4788} {"train_loss": -7.12019157409668, "global_step": 201110, "epoch": 4788} {"train_loss": -7.1527018547058105, "global_step": 201111, "epoch": 4788} {"train_loss": -7.284854888916016, "global_step": 201112, "epoch": 4788} {"train_loss": -7.179640769958496, "global_step": 201113, "epoch": 4788} {"train_loss": -7.154923915863037, "global_step": 201114, "epoch": 4788} {"train_loss": -7.066015720367432, "global_step": 201115, "epoch": 4788} {"train_loss": -7.265225410461426, "global_step": 201116, "epoch": 4788} {"train_loss": -7.138446807861328, "global_step": 201117, "epoch": 4788} {"train_loss": -7.199137210845947, "global_step": 201118, "epoch": 4788} {"train_loss": -7.262628555297852, "global_step": 201119, "epoch": 4788} {"train_loss": -7.241718769073486, "global_step": 201120, "epoch": 4788} {"train_loss": -7.226654052734375, "global_step": 201121, "epoch": 4788} {"train_loss": -7.296324729919434, "global_step": 201122, "epoch": 4788} {"train_loss": -7.277669906616211, "global_step": 201123, "epoch": 4788} {"train_loss": -7.2530035972595215, "global_step": 201124, "epoch": 4788} {"train_loss": -7.309460639953613, "global_step": 201125, "epoch": 4788} {"train_loss": -7.20135498046875, "global_step": 201126, "epoch": 4788} {"train_loss": -7.309427261352539, "global_step": 201127, "epoch": 4788} {"train_loss": -7.406078815460205, "global_step": 201128, "epoch": 4788} {"train_loss": -7.174991130828857, "global_step": 201129, "epoch": 4788} {"train_loss": -7.221797466278076, "global_step": 201130, "epoch": 4788} {"train_loss": -7.219020366668701, "global_step": 201131, "epoch": 4788} {"train_loss": -7.256659507751465, "global_step": 201132, "epoch": 4788} {"train_loss": -7.3035430908203125, "global_step": 201133, "epoch": 4788} {"train_loss": -7.267445087432861, "global_step": 201134, "epoch": 4788} {"train_loss": -7.2478837966918945, "global_step": 201135, "epoch": 4788} {"train_loss": -7.238956451416016, "global_step": 201136, "epoch": 4788} {"train_loss": -7.205465827669416, "global_step": 201137, "epoch": 4788, "val_loss": 69075.296875} {"train_loss": -7.194977760314941, "global_step": 201138, "epoch": 4789} {"train_loss": -7.241096496582031, "global_step": 201139, "epoch": 4789} {"train_loss": -7.313094139099121, "global_step": 201140, "epoch": 4789} {"train_loss": -7.322494029998779, "global_step": 201141, "epoch": 4789} {"train_loss": -7.175176620483398, "global_step": 201142, "epoch": 4789} {"train_loss": -7.24456787109375, "global_step": 201143, "epoch": 4789} {"train_loss": -7.042138576507568, "global_step": 201144, "epoch": 4789} {"train_loss": -7.215929985046387, "global_step": 201145, "epoch": 4789} {"train_loss": -7.179502487182617, "global_step": 201146, "epoch": 4789} {"train_loss": -7.2172322273254395, "global_step": 201147, "epoch": 4789} {"train_loss": -7.163005828857422, "global_step": 201148, "epoch": 4789} {"train_loss": -7.159245491027832, "global_step": 201149, "epoch": 4789} {"train_loss": -7.206127643585205, "global_step": 201150, "epoch": 4789} {"train_loss": -7.191313743591309, "global_step": 201151, "epoch": 4789} {"train_loss": -7.070952415466309, "global_step": 201152, "epoch": 4789} {"train_loss": -7.21511173248291, "global_step": 201153, "epoch": 4789} {"train_loss": -7.237359046936035, "global_step": 201154, "epoch": 4789} {"train_loss": -7.217005729675293, "global_step": 201155, "epoch": 4789} {"train_loss": -7.245744705200195, "global_step": 201156, "epoch": 4789} {"train_loss": -7.235526084899902, "global_step": 201157, "epoch": 4789} {"train_loss": -7.150245666503906, "global_step": 201158, "epoch": 4789} {"train_loss": -7.368220806121826, "global_step": 201159, "epoch": 4789} {"train_loss": -7.291403770446777, "global_step": 201160, "epoch": 4789} {"train_loss": -7.257654190063477, "global_step": 201161, "epoch": 4789} {"train_loss": -7.293520450592041, "global_step": 201162, "epoch": 4789} {"train_loss": -7.280520439147949, "global_step": 201163, "epoch": 4789} {"train_loss": -7.2756242752075195, "global_step": 201164, "epoch": 4789} {"train_loss": -7.2417402267456055, "global_step": 201165, "epoch": 4789} {"train_loss": -7.233626365661621, "global_step": 201166, "epoch": 4789} {"train_loss": -7.190569877624512, "global_step": 201167, "epoch": 4789} {"train_loss": -7.357020378112793, "global_step": 201168, "epoch": 4789} {"train_loss": -7.2049784660339355, "global_step": 201169, "epoch": 4789} {"train_loss": -7.2060980796813965, "global_step": 201170, "epoch": 4789} {"train_loss": -7.3086137771606445, "global_step": 201171, "epoch": 4789} {"train_loss": -7.234790802001953, "global_step": 201172, "epoch": 4789} {"train_loss": -7.298093795776367, "global_step": 201173, "epoch": 4789} {"train_loss": -7.267951488494873, "global_step": 201174, "epoch": 4789} {"train_loss": -7.321634292602539, "global_step": 201175, "epoch": 4789} {"train_loss": -7.310491561889648, "global_step": 201176, "epoch": 4789} {"train_loss": -7.241001605987549, "global_step": 201177, "epoch": 4789} {"train_loss": -7.262119293212891, "global_step": 201178, "epoch": 4789} {"train_loss": -7.237113929930187, "global_step": 201179, "epoch": 4789, "val_loss": 69008.671875} {"train_loss": -7.413639068603516, "global_step": 201180, "epoch": 4790} {"train_loss": -7.204067707061768, "global_step": 201181, "epoch": 4790} {"train_loss": -7.355966091156006, "global_step": 201182, "epoch": 4790} {"train_loss": -7.282715797424316, "global_step": 201183, "epoch": 4790} {"train_loss": -7.338320732116699, "global_step": 201184, "epoch": 4790} {"train_loss": -7.2758588790893555, "global_step": 201185, "epoch": 4790} {"train_loss": -7.315726280212402, "global_step": 201186, "epoch": 4790} {"train_loss": -7.261552810668945, "global_step": 201187, "epoch": 4790} {"train_loss": -7.323545455932617, "global_step": 201188, "epoch": 4790} {"train_loss": -7.269617080688477, "global_step": 201189, "epoch": 4790} {"train_loss": -7.2872395515441895, "global_step": 201190, "epoch": 4790} {"train_loss": -7.237993240356445, "global_step": 201191, "epoch": 4790} {"train_loss": -7.273438453674316, "global_step": 201192, "epoch": 4790} {"train_loss": -7.262562274932861, "global_step": 201193, "epoch": 4790} {"train_loss": -7.331518173217773, "global_step": 201194, "epoch": 4790} {"train_loss": -7.24478816986084, "global_step": 201195, "epoch": 4790} {"train_loss": -7.173896312713623, "global_step": 201196, "epoch": 4790} {"train_loss": -7.26655387878418, "global_step": 201197, "epoch": 4790} {"train_loss": -7.242486953735352, "global_step": 201198, "epoch": 4790} {"train_loss": -7.242464542388916, "global_step": 201199, "epoch": 4790} {"train_loss": -7.172187328338623, "global_step": 201200, "epoch": 4790} {"train_loss": -7.211712837219238, "global_step": 201201, "epoch": 4790} {"train_loss": -7.105679988861084, "global_step": 201202, "epoch": 4790} {"train_loss": -6.957977771759033, "global_step": 201203, "epoch": 4790} {"train_loss": -7.116753101348877, "global_step": 201204, "epoch": 4790} {"train_loss": -7.221941947937012, "global_step": 201205, "epoch": 4790} {"train_loss": -6.945986747741699, "global_step": 201206, "epoch": 4790} {"train_loss": -7.087363243103027, "global_step": 201207, "epoch": 4790} {"train_loss": -7.217629909515381, "global_step": 201208, "epoch": 4790} {"train_loss": -6.981422424316406, "global_step": 201209, "epoch": 4790} {"train_loss": -7.216916084289551, "global_step": 201210, "epoch": 4790} {"train_loss": -7.0181779861450195, "global_step": 201211, "epoch": 4790} {"train_loss": -7.166180610656738, "global_step": 201212, "epoch": 4790} {"train_loss": -7.060517311096191, "global_step": 201213, "epoch": 4790} {"train_loss": -7.206012725830078, "global_step": 201214, "epoch": 4790} {"train_loss": -7.140068054199219, "global_step": 201215, "epoch": 4790} {"train_loss": -7.115097999572754, "global_step": 201216, "epoch": 4790} {"train_loss": -7.129463195800781, "global_step": 201217, "epoch": 4790} {"train_loss": -7.122427463531494, "global_step": 201218, "epoch": 4790} {"train_loss": -7.061849594116211, "global_step": 201219, "epoch": 4790} {"train_loss": -7.076699733734131, "global_step": 201220, "epoch": 4790} {"train_loss": -7.191600708734422, "global_step": 201221, "epoch": 4790, "val_loss": 68992.5546875} {"train_loss": -7.010320663452148, "global_step": 201222, "epoch": 4791} {"train_loss": -7.183620929718018, "global_step": 201223, "epoch": 4791} {"train_loss": -7.224808216094971, "global_step": 201224, "epoch": 4791} {"train_loss": -7.010207176208496, "global_step": 201225, "epoch": 4791} {"train_loss": -7.034809112548828, "global_step": 201226, "epoch": 4791} {"train_loss": -7.060222625732422, "global_step": 201227, "epoch": 4791} {"train_loss": -7.076272964477539, "global_step": 201228, "epoch": 4791} {"train_loss": -7.0933122634887695, "global_step": 201229, "epoch": 4791} {"train_loss": -7.13765811920166, "global_step": 201230, "epoch": 4791} {"train_loss": -7.1263017654418945, "global_step": 201231, "epoch": 4791} {"train_loss": -7.2201128005981445, "global_step": 201232, "epoch": 4791} {"train_loss": -7.09951114654541, "global_step": 201233, "epoch": 4791} {"train_loss": -7.319785118103027, "global_step": 201234, "epoch": 4791} {"train_loss": -7.170284271240234, "global_step": 201235, "epoch": 4791} {"train_loss": -7.2056884765625, "global_step": 201236, "epoch": 4791} {"train_loss": -7.234285354614258, "global_step": 201237, "epoch": 4791} {"train_loss": -7.1919660568237305, "global_step": 201238, "epoch": 4791} {"train_loss": -7.261504173278809, "global_step": 201239, "epoch": 4791} {"train_loss": -7.1481428146362305, "global_step": 201240, "epoch": 4791} {"train_loss": -7.169833183288574, "global_step": 201241, "epoch": 4791} {"train_loss": -7.294480323791504, "global_step": 201242, "epoch": 4791} {"train_loss": -7.18092155456543, "global_step": 201243, "epoch": 4791} {"train_loss": -7.226416110992432, "global_step": 201244, "epoch": 4791} {"train_loss": -7.226805686950684, "global_step": 201245, "epoch": 4791} {"train_loss": -7.179007530212402, "global_step": 201246, "epoch": 4791} {"train_loss": -7.194817543029785, "global_step": 201247, "epoch": 4791} {"train_loss": -7.184659004211426, "global_step": 201248, "epoch": 4791} {"train_loss": -7.187473297119141, "global_step": 201249, "epoch": 4791} {"train_loss": -7.202953815460205, "global_step": 201250, "epoch": 4791} {"train_loss": -7.192185401916504, "global_step": 201251, "epoch": 4791} {"train_loss": -7.226322174072266, "global_step": 201252, "epoch": 4791} {"train_loss": -7.259727478027344, "global_step": 201253, "epoch": 4791} {"train_loss": -7.2776689529418945, "global_step": 201254, "epoch": 4791} {"train_loss": -7.198580741882324, "global_step": 201255, "epoch": 4791} {"train_loss": -7.306501388549805, "global_step": 201256, "epoch": 4791} {"train_loss": -7.206357002258301, "global_step": 201257, "epoch": 4791} {"train_loss": -7.193659782409668, "global_step": 201258, "epoch": 4791} {"train_loss": -7.094832420349121, "global_step": 201259, "epoch": 4791} {"train_loss": -7.056944370269775, "global_step": 201260, "epoch": 4791} {"train_loss": -7.1698994636535645, "global_step": 201261, "epoch": 4791} {"train_loss": -7.146088600158691, "global_step": 201262, "epoch": 4791} {"train_loss": -7.176018317540486, "global_step": 201263, "epoch": 4791, "val_loss": 69122.1953125} {"train_loss": -7.151086330413818, "global_step": 201264, "epoch": 4792} {"train_loss": -7.0983195304870605, "global_step": 201265, "epoch": 4792} {"train_loss": -7.323293209075928, "global_step": 201266, "epoch": 4792} {"train_loss": -7.131752014160156, "global_step": 201267, "epoch": 4792} {"train_loss": -7.187624931335449, "global_step": 201268, "epoch": 4792} {"train_loss": -7.213611602783203, "global_step": 201269, "epoch": 4792} {"train_loss": -7.191682815551758, "global_step": 201270, "epoch": 4792} {"train_loss": -7.130521774291992, "global_step": 201271, "epoch": 4792} {"train_loss": -7.182047367095947, "global_step": 201272, "epoch": 4792} {"train_loss": -7.026127815246582, "global_step": 201273, "epoch": 4792} {"train_loss": -7.065432548522949, "global_step": 201274, "epoch": 4792} {"train_loss": -7.10490083694458, "global_step": 201275, "epoch": 4792} {"train_loss": -7.113192081451416, "global_step": 201276, "epoch": 4792} {"train_loss": -7.031088829040527, "global_step": 201277, "epoch": 4792} {"train_loss": -7.170802116394043, "global_step": 201278, "epoch": 4792} {"train_loss": -7.083356857299805, "global_step": 201279, "epoch": 4792} {"train_loss": -7.267764091491699, "global_step": 201280, "epoch": 4792} {"train_loss": -7.095622539520264, "global_step": 201281, "epoch": 4792} {"train_loss": -7.177031517028809, "global_step": 201282, "epoch": 4792} {"train_loss": -7.12248420715332, "global_step": 201283, "epoch": 4792} {"train_loss": -7.247179985046387, "global_step": 201284, "epoch": 4792} {"train_loss": -7.096240520477295, "global_step": 201285, "epoch": 4792} {"train_loss": -7.131837368011475, "global_step": 201286, "epoch": 4792} {"train_loss": -7.178468227386475, "global_step": 201287, "epoch": 4792} {"train_loss": -7.272371292114258, "global_step": 201288, "epoch": 4792} {"train_loss": -7.234872341156006, "global_step": 201289, "epoch": 4792} {"train_loss": -7.149096488952637, "global_step": 201290, "epoch": 4792} {"train_loss": -7.186641693115234, "global_step": 201291, "epoch": 4792} {"train_loss": -7.180148124694824, "global_step": 201292, "epoch": 4792} {"train_loss": -7.255498886108398, "global_step": 201293, "epoch": 4792} {"train_loss": -7.108312606811523, "global_step": 201294, "epoch": 4792} {"train_loss": -7.182074546813965, "global_step": 201295, "epoch": 4792} {"train_loss": -7.079537868499756, "global_step": 201296, "epoch": 4792} {"train_loss": -7.248683929443359, "global_step": 201297, "epoch": 4792} {"train_loss": -7.217041969299316, "global_step": 201298, "epoch": 4792} {"train_loss": -7.2249603271484375, "global_step": 201299, "epoch": 4792} {"train_loss": -7.259847640991211, "global_step": 201300, "epoch": 4792} {"train_loss": -7.245625972747803, "global_step": 201301, "epoch": 4792} {"train_loss": -7.309911251068115, "global_step": 201302, "epoch": 4792} {"train_loss": -7.257298946380615, "global_step": 201303, "epoch": 4792} {"train_loss": -7.177809715270996, "global_step": 201304, "epoch": 4792} {"train_loss": -7.174360854285104, "global_step": 201305, "epoch": 4792, "val_loss": 69163.2578125} {"train_loss": -7.211004257202148, "global_step": 201306, "epoch": 4793} {"train_loss": -7.2507829666137695, "global_step": 201307, "epoch": 4793} {"train_loss": -7.208721160888672, "global_step": 201308, "epoch": 4793} {"train_loss": -7.3208112716674805, "global_step": 201309, "epoch": 4793} {"train_loss": -7.2535200119018555, "global_step": 201310, "epoch": 4793} {"train_loss": -7.175036430358887, "global_step": 201311, "epoch": 4793} {"train_loss": -7.214217662811279, "global_step": 201312, "epoch": 4793} {"train_loss": -7.32419490814209, "global_step": 201313, "epoch": 4793} {"train_loss": -7.137539863586426, "global_step": 201314, "epoch": 4793} {"train_loss": -7.065187931060791, "global_step": 201315, "epoch": 4793} {"train_loss": -7.170151710510254, "global_step": 201316, "epoch": 4793} {"train_loss": -7.210723400115967, "global_step": 201317, "epoch": 4793} {"train_loss": -7.23919677734375, "global_step": 201318, "epoch": 4793} {"train_loss": -7.133976459503174, "global_step": 201319, "epoch": 4793} {"train_loss": -7.273396015167236, "global_step": 201320, "epoch": 4793} {"train_loss": -7.331378936767578, "global_step": 201321, "epoch": 4793} {"train_loss": -7.326474189758301, "global_step": 201322, "epoch": 4793} {"train_loss": -7.193861961364746, "global_step": 201323, "epoch": 4793} {"train_loss": -7.061877727508545, "global_step": 201324, "epoch": 4793} {"train_loss": -7.337367057800293, "global_step": 201325, "epoch": 4793} {"train_loss": -7.229658126831055, "global_step": 201326, "epoch": 4793} {"train_loss": -7.108896255493164, "global_step": 201327, "epoch": 4793} {"train_loss": -7.238896369934082, "global_step": 201328, "epoch": 4793} {"train_loss": -7.246515274047852, "global_step": 201329, "epoch": 4793} {"train_loss": -7.129700183868408, "global_step": 201330, "epoch": 4793} {"train_loss": -7.227453231811523, "global_step": 201331, "epoch": 4793} {"train_loss": -7.249953746795654, "global_step": 201332, "epoch": 4793} {"train_loss": -7.304560661315918, "global_step": 201333, "epoch": 4793} {"train_loss": -7.236832618713379, "global_step": 201334, "epoch": 4793} {"train_loss": -7.203482151031494, "global_step": 201335, "epoch": 4793} {"train_loss": -7.297978401184082, "global_step": 201336, "epoch": 4793} {"train_loss": -7.349438667297363, "global_step": 201337, "epoch": 4793} {"train_loss": -7.1116437911987305, "global_step": 201338, "epoch": 4793} {"train_loss": -7.093902587890625, "global_step": 201339, "epoch": 4793} {"train_loss": -7.2593278884887695, "global_step": 201340, "epoch": 4793} {"train_loss": -7.3264641761779785, "global_step": 201341, "epoch": 4793} {"train_loss": -7.204717636108398, "global_step": 201342, "epoch": 4793} {"train_loss": -7.21636438369751, "global_step": 201343, "epoch": 4793} {"train_loss": -7.298152446746826, "global_step": 201344, "epoch": 4793} {"train_loss": -7.27835750579834, "global_step": 201345, "epoch": 4793} {"train_loss": -7.242685794830322, "global_step": 201346, "epoch": 4793} {"train_loss": -7.227257853462582, "global_step": 201347, "epoch": 4793, "val_loss": 68909.2890625} {"train_loss": -7.229968070983887, "global_step": 201348, "epoch": 4794} {"train_loss": -7.255342483520508, "global_step": 201349, "epoch": 4794} {"train_loss": -7.302123069763184, "global_step": 201350, "epoch": 4794} {"train_loss": -7.254232883453369, "global_step": 201351, "epoch": 4794} {"train_loss": -7.31984281539917, "global_step": 201352, "epoch": 4794} {"train_loss": -7.212433815002441, "global_step": 201353, "epoch": 4794} {"train_loss": -7.140298366546631, "global_step": 201354, "epoch": 4794} {"train_loss": -7.208431720733643, "global_step": 201355, "epoch": 4794} {"train_loss": -7.131775379180908, "global_step": 201356, "epoch": 4794} {"train_loss": -7.187735557556152, "global_step": 201357, "epoch": 4794} {"train_loss": -7.366739273071289, "global_step": 201358, "epoch": 4794} {"train_loss": -7.292656421661377, "global_step": 201359, "epoch": 4794} {"train_loss": -7.21811580657959, "global_step": 201360, "epoch": 4794} {"train_loss": -7.316062927246094, "global_step": 201361, "epoch": 4794} {"train_loss": -7.282864093780518, "global_step": 201362, "epoch": 4794} {"train_loss": -7.200104713439941, "global_step": 201363, "epoch": 4794} {"train_loss": -7.307429313659668, "global_step": 201364, "epoch": 4794} {"train_loss": -7.359984397888184, "global_step": 201365, "epoch": 4794} {"train_loss": -7.183757305145264, "global_step": 201366, "epoch": 4794} {"train_loss": -7.067522048950195, "global_step": 201367, "epoch": 4794} {"train_loss": -7.224677562713623, "global_step": 201368, "epoch": 4794} {"train_loss": -7.206179618835449, "global_step": 201369, "epoch": 4794} {"train_loss": -7.2653303146362305, "global_step": 201370, "epoch": 4794} {"train_loss": -7.244368076324463, "global_step": 201371, "epoch": 4794} {"train_loss": -7.291769027709961, "global_step": 201372, "epoch": 4794} {"train_loss": -7.244576454162598, "global_step": 201373, "epoch": 4794} {"train_loss": -7.266672134399414, "global_step": 201374, "epoch": 4794} {"train_loss": -7.149209022521973, "global_step": 201375, "epoch": 4794} {"train_loss": -7.356745719909668, "global_step": 201376, "epoch": 4794} {"train_loss": -7.210268020629883, "global_step": 201377, "epoch": 4794} {"train_loss": -7.4381232261657715, "global_step": 201378, "epoch": 4794} {"train_loss": -7.319117546081543, "global_step": 201379, "epoch": 4794} {"train_loss": -7.220904350280762, "global_step": 201380, "epoch": 4794} {"train_loss": -7.262143135070801, "global_step": 201381, "epoch": 4794} {"train_loss": -7.2588653564453125, "global_step": 201382, "epoch": 4794} {"train_loss": -7.3499040603637695, "global_step": 201383, "epoch": 4794} {"train_loss": -7.181375026702881, "global_step": 201384, "epoch": 4794} {"train_loss": -7.111506462097168, "global_step": 201385, "epoch": 4794} {"train_loss": -7.369408130645752, "global_step": 201386, "epoch": 4794} {"train_loss": -7.2252044677734375, "global_step": 201387, "epoch": 4794} {"train_loss": -7.290623664855957, "global_step": 201388, "epoch": 4794} {"train_loss": -7.252085753849575, "global_step": 201389, "epoch": 4794, "val_loss": 69147.5546875} {"train_loss": -7.4236650466918945, "global_step": 201390, "epoch": 4795} {"train_loss": -7.330817222595215, "global_step": 201391, "epoch": 4795} {"train_loss": -7.271574020385742, "global_step": 201392, "epoch": 4795} {"train_loss": -7.264434814453125, "global_step": 201393, "epoch": 4795} {"train_loss": -7.340874671936035, "global_step": 201394, "epoch": 4795} {"train_loss": -7.31406307220459, "global_step": 201395, "epoch": 4795} {"train_loss": -7.283590793609619, "global_step": 201396, "epoch": 4795} {"train_loss": -7.406236171722412, "global_step": 201397, "epoch": 4795} {"train_loss": -7.335824966430664, "global_step": 201398, "epoch": 4795} {"train_loss": -7.242676734924316, "global_step": 201399, "epoch": 4795} {"train_loss": -7.3149919509887695, "global_step": 201400, "epoch": 4795} {"train_loss": -7.186860084533691, "global_step": 201401, "epoch": 4795} {"train_loss": -7.229331970214844, "global_step": 201402, "epoch": 4795} {"train_loss": -7.220428466796875, "global_step": 201403, "epoch": 4795} {"train_loss": -7.270688056945801, "global_step": 201404, "epoch": 4795} {"train_loss": -7.145110607147217, "global_step": 201405, "epoch": 4795} {"train_loss": -7.254861831665039, "global_step": 201406, "epoch": 4795} {"train_loss": -7.2136077880859375, "global_step": 201407, "epoch": 4795} {"train_loss": -7.208369255065918, "global_step": 201408, "epoch": 4795} {"train_loss": -7.290565490722656, "global_step": 201409, "epoch": 4795} {"train_loss": -7.133131980895996, "global_step": 201410, "epoch": 4795} {"train_loss": -7.241061210632324, "global_step": 201411, "epoch": 4795} {"train_loss": -7.2009148597717285, "global_step": 201412, "epoch": 4795} {"train_loss": -7.318321704864502, "global_step": 201413, "epoch": 4795} {"train_loss": -7.226813316345215, "global_step": 201414, "epoch": 4795} {"train_loss": -7.175864219665527, "global_step": 201415, "epoch": 4795} {"train_loss": -7.271836280822754, "global_step": 201416, "epoch": 4795} {"train_loss": -7.2574052810668945, "global_step": 201417, "epoch": 4795} {"train_loss": -6.983221054077148, "global_step": 201418, "epoch": 4795} {"train_loss": -7.196937561035156, "global_step": 201419, "epoch": 4795} {"train_loss": -7.2657551765441895, "global_step": 201420, "epoch": 4795} {"train_loss": -7.1963210105896, "global_step": 201421, "epoch": 4795} {"train_loss": -7.200760841369629, "global_step": 201422, "epoch": 4795} {"train_loss": -7.026433944702148, "global_step": 201423, "epoch": 4795} {"train_loss": -7.163275241851807, "global_step": 201424, "epoch": 4795} {"train_loss": -7.231802940368652, "global_step": 201425, "epoch": 4795} {"train_loss": -7.07853364944458, "global_step": 201426, "epoch": 4795} {"train_loss": -7.2172651290893555, "global_step": 201427, "epoch": 4795} {"train_loss": -7.111435890197754, "global_step": 201428, "epoch": 4795} {"train_loss": -7.188055992126465, "global_step": 201429, "epoch": 4795} {"train_loss": -7.122488021850586, "global_step": 201430, "epoch": 4795} {"train_loss": -7.22626256942749, "global_step": 201431, "epoch": 4795, "val_loss": 69171.53125} {"train_loss": -7.1991424560546875, "global_step": 201432, "epoch": 4796} {"train_loss": -7.129915237426758, "global_step": 201433, "epoch": 4796} {"train_loss": -7.388007164001465, "global_step": 201434, "epoch": 4796} {"train_loss": -7.2466630935668945, "global_step": 201435, "epoch": 4796} {"train_loss": -7.324420928955078, "global_step": 201436, "epoch": 4796} {"train_loss": -7.311317443847656, "global_step": 201437, "epoch": 4796} {"train_loss": -7.252306938171387, "global_step": 201438, "epoch": 4796} {"train_loss": -7.323795318603516, "global_step": 201439, "epoch": 4796} {"train_loss": -7.249762535095215, "global_step": 201440, "epoch": 4796} {"train_loss": -7.29596471786499, "global_step": 201441, "epoch": 4796} {"train_loss": -7.225590705871582, "global_step": 201442, "epoch": 4796} {"train_loss": -7.228760719299316, "global_step": 201443, "epoch": 4796} {"train_loss": -7.28524112701416, "global_step": 201444, "epoch": 4796} {"train_loss": -7.218566417694092, "global_step": 201445, "epoch": 4796} {"train_loss": -7.269899845123291, "global_step": 201446, "epoch": 4796} {"train_loss": -7.204689025878906, "global_step": 201447, "epoch": 4796} {"train_loss": -7.310788631439209, "global_step": 201448, "epoch": 4796} {"train_loss": -7.383021354675293, "global_step": 201449, "epoch": 4796} {"train_loss": -7.294719696044922, "global_step": 201450, "epoch": 4796} {"train_loss": -7.224912643432617, "global_step": 201451, "epoch": 4796} {"train_loss": -7.196169376373291, "global_step": 201452, "epoch": 4796} {"train_loss": -7.264355659484863, "global_step": 201453, "epoch": 4796} {"train_loss": -7.1123504638671875, "global_step": 201454, "epoch": 4796} {"train_loss": -7.193325519561768, "global_step": 201455, "epoch": 4796} {"train_loss": -7.110039710998535, "global_step": 201456, "epoch": 4796} {"train_loss": -7.320470809936523, "global_step": 201457, "epoch": 4796} {"train_loss": -7.245105743408203, "global_step": 201458, "epoch": 4796} {"train_loss": -7.173025131225586, "global_step": 201459, "epoch": 4796} {"train_loss": -7.1260457038879395, "global_step": 201460, "epoch": 4796} {"train_loss": -7.1137166023254395, "global_step": 201461, "epoch": 4796} {"train_loss": -7.155045032501221, "global_step": 201462, "epoch": 4796} {"train_loss": -7.035219192504883, "global_step": 201463, "epoch": 4796} {"train_loss": -7.129471778869629, "global_step": 201464, "epoch": 4796} {"train_loss": -7.139371395111084, "global_step": 201465, "epoch": 4796} {"train_loss": -7.15811824798584, "global_step": 201466, "epoch": 4796} {"train_loss": -7.246307373046875, "global_step": 201467, "epoch": 4796} {"train_loss": -7.043107032775879, "global_step": 201468, "epoch": 4796} {"train_loss": -7.090880870819092, "global_step": 201469, "epoch": 4796} {"train_loss": -7.085867881774902, "global_step": 201470, "epoch": 4796} {"train_loss": -7.0073933601379395, "global_step": 201471, "epoch": 4796} {"train_loss": -7.2691650390625, "global_step": 201472, "epoch": 4796} {"train_loss": -7.2074578148978095, "global_step": 201473, "epoch": 4796, "val_loss": 68975.0} {"train_loss": -7.173698902130127, "global_step": 201474, "epoch": 4797} {"train_loss": -7.110732555389404, "global_step": 201475, "epoch": 4797} {"train_loss": -7.153082847595215, "global_step": 201476, "epoch": 4797} {"train_loss": -7.1305646896362305, "global_step": 201477, "epoch": 4797} {"train_loss": -7.156294345855713, "global_step": 201478, "epoch": 4797} {"train_loss": -7.250912666320801, "global_step": 201479, "epoch": 4797} {"train_loss": -7.139837265014648, "global_step": 201480, "epoch": 4797} {"train_loss": -7.277472019195557, "global_step": 201481, "epoch": 4797} {"train_loss": -7.182048320770264, "global_step": 201482, "epoch": 4797} {"train_loss": -7.143804550170898, "global_step": 201483, "epoch": 4797} {"train_loss": -7.185427665710449, "global_step": 201484, "epoch": 4797} {"train_loss": -7.106837272644043, "global_step": 201485, "epoch": 4797} {"train_loss": -7.196925163269043, "global_step": 201486, "epoch": 4797} {"train_loss": -7.145347595214844, "global_step": 201487, "epoch": 4797} {"train_loss": -7.180355072021484, "global_step": 201488, "epoch": 4797} {"train_loss": -7.147488594055176, "global_step": 201489, "epoch": 4797} {"train_loss": -7.312490463256836, "global_step": 201490, "epoch": 4797} {"train_loss": -7.210511207580566, "global_step": 201491, "epoch": 4797} {"train_loss": -7.170444965362549, "global_step": 201492, "epoch": 4797} {"train_loss": -7.2161455154418945, "global_step": 201493, "epoch": 4797} {"train_loss": -7.18271541595459, "global_step": 201494, "epoch": 4797} {"train_loss": -7.147627830505371, "global_step": 201495, "epoch": 4797} {"train_loss": -7.313794136047363, "global_step": 201496, "epoch": 4797} {"train_loss": -7.326080799102783, "global_step": 201497, "epoch": 4797} {"train_loss": -7.211134433746338, "global_step": 201498, "epoch": 4797} {"train_loss": -7.265293121337891, "global_step": 201499, "epoch": 4797} {"train_loss": -7.203461647033691, "global_step": 201500, "epoch": 4797} {"train_loss": -7.373618125915527, "global_step": 201501, "epoch": 4797} {"train_loss": -7.352231025695801, "global_step": 201502, "epoch": 4797} {"train_loss": -7.277972221374512, "global_step": 201503, "epoch": 4797} {"train_loss": -7.3189873695373535, "global_step": 201504, "epoch": 4797} {"train_loss": -7.224709510803223, "global_step": 201505, "epoch": 4797} {"train_loss": -7.351814270019531, "global_step": 201506, "epoch": 4797} {"train_loss": -7.257915019989014, "global_step": 201507, "epoch": 4797} {"train_loss": -7.365530967712402, "global_step": 201508, "epoch": 4797} {"train_loss": -7.287168502807617, "global_step": 201509, "epoch": 4797} {"train_loss": -7.226463317871094, "global_step": 201510, "epoch": 4797} {"train_loss": -7.3136138916015625, "global_step": 201511, "epoch": 4797} {"train_loss": -7.373805046081543, "global_step": 201512, "epoch": 4797} {"train_loss": -7.20918083190918, "global_step": 201513, "epoch": 4797} {"train_loss": -7.3099188804626465, "global_step": 201514, "epoch": 4797} {"train_loss": -7.230994701385498, "global_step": 201515, "epoch": 4797, "val_loss": 69036.9921875} {"train_loss": -7.324437141418457, "global_step": 201516, "epoch": 4798} {"train_loss": -7.391416549682617, "global_step": 201517, "epoch": 4798} {"train_loss": -7.324214935302734, "global_step": 201518, "epoch": 4798} {"train_loss": -7.263434886932373, "global_step": 201519, "epoch": 4798} {"train_loss": -7.337621688842773, "global_step": 201520, "epoch": 4798} {"train_loss": -7.270476818084717, "global_step": 201521, "epoch": 4798} {"train_loss": -7.432972431182861, "global_step": 201522, "epoch": 4798} {"train_loss": -7.261081695556641, "global_step": 201523, "epoch": 4798} {"train_loss": -7.288903713226318, "global_step": 201524, "epoch": 4798} {"train_loss": -7.282747268676758, "global_step": 201525, "epoch": 4798} {"train_loss": -7.224254131317139, "global_step": 201526, "epoch": 4798} {"train_loss": -7.346297264099121, "global_step": 201527, "epoch": 4798} {"train_loss": -7.399352073669434, "global_step": 201528, "epoch": 4798} {"train_loss": -7.3903398513793945, "global_step": 201529, "epoch": 4798} {"train_loss": -7.272309303283691, "global_step": 201530, "epoch": 4798} {"train_loss": -7.425048828125, "global_step": 201531, "epoch": 4798} {"train_loss": -7.299434661865234, "global_step": 201532, "epoch": 4798} {"train_loss": -7.338306427001953, "global_step": 201533, "epoch": 4798} {"train_loss": -7.269207000732422, "global_step": 201534, "epoch": 4798} {"train_loss": -7.217565536499023, "global_step": 201535, "epoch": 4798} {"train_loss": -7.301395416259766, "global_step": 201536, "epoch": 4798} {"train_loss": -7.288979530334473, "global_step": 201537, "epoch": 4798} {"train_loss": -7.311237812042236, "global_step": 201538, "epoch": 4798} {"train_loss": -7.385343074798584, "global_step": 201539, "epoch": 4798} {"train_loss": -7.229270935058594, "global_step": 201540, "epoch": 4798} {"train_loss": -7.3036789894104, "global_step": 201541, "epoch": 4798} {"train_loss": -7.428299903869629, "global_step": 201542, "epoch": 4798} {"train_loss": -7.271637916564941, "global_step": 201543, "epoch": 4798} {"train_loss": -7.360241889953613, "global_step": 201544, "epoch": 4798} {"train_loss": -7.304123878479004, "global_step": 201545, "epoch": 4798} {"train_loss": -7.327080726623535, "global_step": 201546, "epoch": 4798} {"train_loss": -7.322096824645996, "global_step": 201547, "epoch": 4798} {"train_loss": -7.21251106262207, "global_step": 201548, "epoch": 4798} {"train_loss": -7.2683868408203125, "global_step": 201549, "epoch": 4798} {"train_loss": -7.200132846832275, "global_step": 201550, "epoch": 4798} {"train_loss": -7.267561912536621, "global_step": 201551, "epoch": 4798} {"train_loss": -7.223516464233398, "global_step": 201552, "epoch": 4798} {"train_loss": -7.179503917694092, "global_step": 201553, "epoch": 4798} {"train_loss": -7.212241172790527, "global_step": 201554, "epoch": 4798} {"train_loss": -7.218679904937744, "global_step": 201555, "epoch": 4798} {"train_loss": -7.188887596130371, "global_step": 201556, "epoch": 4798} {"train_loss": -7.295792159580049, "global_step": 201557, "epoch": 4798, "val_loss": 69137.0625} {"train_loss": -7.2288312911987305, "global_step": 201558, "epoch": 4799} {"train_loss": -7.179010391235352, "global_step": 201559, "epoch": 4799} {"train_loss": -7.078578472137451, "global_step": 201560, "epoch": 4799} {"train_loss": -7.305700302124023, "global_step": 201561, "epoch": 4799} {"train_loss": -7.163118362426758, "global_step": 201562, "epoch": 4799} {"train_loss": -7.137167930603027, "global_step": 201563, "epoch": 4799} {"train_loss": -7.318940162658691, "global_step": 201564, "epoch": 4799} {"train_loss": -7.204463958740234, "global_step": 201565, "epoch": 4799} {"train_loss": -7.2723212242126465, "global_step": 201566, "epoch": 4799} {"train_loss": -7.173126220703125, "global_step": 201567, "epoch": 4799} {"train_loss": -7.240845203399658, "global_step": 201568, "epoch": 4799} {"train_loss": -7.2821550369262695, "global_step": 201569, "epoch": 4799} {"train_loss": -7.118659496307373, "global_step": 201570, "epoch": 4799} {"train_loss": -7.436529159545898, "global_step": 201571, "epoch": 4799} {"train_loss": -7.312025547027588, "global_step": 201572, "epoch": 4799} {"train_loss": -7.279151439666748, "global_step": 201573, "epoch": 4799} {"train_loss": -7.312690734863281, "global_step": 201574, "epoch": 4799} {"train_loss": -7.299028396606445, "global_step": 201575, "epoch": 4799} {"train_loss": -7.238740921020508, "global_step": 201576, "epoch": 4799} {"train_loss": -7.163135528564453, "global_step": 201577, "epoch": 4799} {"train_loss": -7.246572494506836, "global_step": 201578, "epoch": 4799} {"train_loss": -7.150097846984863, "global_step": 201579, "epoch": 4799} {"train_loss": -7.278892993927002, "global_step": 201580, "epoch": 4799} {"train_loss": -7.160129070281982, "global_step": 201581, "epoch": 4799} {"train_loss": -7.1848063468933105, "global_step": 201582, "epoch": 4799} {"train_loss": -7.245059967041016, "global_step": 201583, "epoch": 4799} {"train_loss": -7.262940406799316, "global_step": 201584, "epoch": 4799} {"train_loss": -7.227245330810547, "global_step": 201585, "epoch": 4799} {"train_loss": -7.2077226638793945, "global_step": 201586, "epoch": 4799} {"train_loss": -7.288644790649414, "global_step": 201587, "epoch": 4799} {"train_loss": -7.279140472412109, "global_step": 201588, "epoch": 4799} {"train_loss": -7.327387809753418, "global_step": 201589, "epoch": 4799} {"train_loss": -7.174417495727539, "global_step": 201590, "epoch": 4799} {"train_loss": -7.2006425857543945, "global_step": 201591, "epoch": 4799} {"train_loss": -7.268606185913086, "global_step": 201592, "epoch": 4799} {"train_loss": -7.317434310913086, "global_step": 201593, "epoch": 4799} {"train_loss": -7.248527526855469, "global_step": 201594, "epoch": 4799} {"train_loss": -7.315267086029053, "global_step": 201595, "epoch": 4799} {"train_loss": -7.336245536804199, "global_step": 201596, "epoch": 4799} {"train_loss": -7.175132751464844, "global_step": 201597, "epoch": 4799} {"train_loss": -7.333919048309326, "global_step": 201598, "epoch": 4799} {"train_loss": -7.244773626327515, "global_step": 201599, "epoch": 4799, "val_loss": 69091.1171875} {"train_loss": -7.332206726074219, "global_step": 201600, "epoch": 4800} {"train_loss": -7.282955646514893, "global_step": 201601, "epoch": 4800} {"train_loss": -7.26984977722168, "global_step": 201602, "epoch": 4800} {"train_loss": -7.176063537597656, "global_step": 201603, "epoch": 4800} {"train_loss": -7.221335411071777, "global_step": 201604, "epoch": 4800} {"train_loss": -7.292807579040527, "global_step": 201605, "epoch": 4800} {"train_loss": -7.245634078979492, "global_step": 201606, "epoch": 4800} {"train_loss": -7.0965776443481445, "global_step": 201607, "epoch": 4800} {"train_loss": -6.984025955200195, "global_step": 201608, "epoch": 4800} {"train_loss": -7.321314811706543, "global_step": 201609, "epoch": 4800} {"train_loss": -7.162890434265137, "global_step": 201610, "epoch": 4800} {"train_loss": -7.204123497009277, "global_step": 201611, "epoch": 4800} {"train_loss": -7.269902229309082, "global_step": 201612, "epoch": 4800} {"train_loss": -7.3238525390625, "global_step": 201613, "epoch": 4800} {"train_loss": -7.250859260559082, "global_step": 201614, "epoch": 4800} {"train_loss": -7.269430160522461, "global_step": 201615, "epoch": 4800} {"train_loss": -7.307518005371094, "global_step": 201616, "epoch": 4800} {"train_loss": -7.080028533935547, "global_step": 201617, "epoch": 4800} {"train_loss": -7.0686726570129395, "global_step": 201618, "epoch": 4800} {"train_loss": -7.197380065917969, "global_step": 201619, "epoch": 4800} {"train_loss": -7.12729549407959, "global_step": 201620, "epoch": 4800} {"train_loss": -7.168892860412598, "global_step": 201621, "epoch": 4800} {"train_loss": -7.162408828735352, "global_step": 201622, "epoch": 4800} {"train_loss": -7.307520389556885, "global_step": 201623, "epoch": 4800} {"train_loss": -7.221249103546143, "global_step": 201624, "epoch": 4800} {"train_loss": -7.283292293548584, "global_step": 201625, "epoch": 4800} {"train_loss": -7.1840620040893555, "global_step": 201626, "epoch": 4800} {"train_loss": -7.231337070465088, "global_step": 201627, "epoch": 4800} {"train_loss": -7.3004608154296875, "global_step": 201628, "epoch": 4800} {"train_loss": -7.282588005065918, "global_step": 201629, "epoch": 4800} {"train_loss": -7.249188423156738, "global_step": 201630, "epoch": 4800} {"train_loss": -7.259947776794434, "global_step": 201631, "epoch": 4800} {"train_loss": -7.123801231384277, "global_step": 201632, "epoch": 4800} {"train_loss": -7.260917663574219, "global_step": 201633, "epoch": 4800} {"train_loss": -7.2642669677734375, "global_step": 201634, "epoch": 4800} {"train_loss": -7.24818754196167, "global_step": 201635, "epoch": 4800} {"train_loss": -7.189720153808594, "global_step": 201636, "epoch": 4800} {"train_loss": -7.127368927001953, "global_step": 201637, "epoch": 4800} {"train_loss": -7.245124340057373, "global_step": 201638, "epoch": 4800} {"train_loss": -7.189573764801025, "global_step": 201639, "epoch": 4800} {"train_loss": -7.179717540740967, "global_step": 201640, "epoch": 4800} {"train_loss": -7.222120375860305, "global_step": 201641, "epoch": 4800, "train/sim_max_reward_0": 0.20873946297941065, "train/sim_max_reward_1": 0.9130805852995453, "train/sim_max_reward_2": 0.5719815526830833, "train/sim_max_reward_3": 0.1317564299722299, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9966714296252737, "test/sim_max_reward_4400000": 0.16328309615897788, "test/sim_max_reward_4400001": 0.22692044059179264, "test/sim_max_reward_4400002": 0.33335663354598366, "test/sim_max_reward_4400003": 0.9586977930196204, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.1598218707681121, "test/sim_max_reward_4400006": 0.992153011491137, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.29666392015592163, "test/sim_max_reward_4400009": 0.8944330884301359, "test/sim_max_reward_4400010": 0.9647970363520232, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.8648815091891446, "test/sim_max_reward_4400013": 0.9481206938985914, "test/sim_max_reward_4400014": 0.9590921973686459, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.2804655647219097, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9812979112637688, "test/sim_max_reward_4400023": 0.42985767437972716, "test/sim_max_reward_4400024": 0.29419090791757696, "test/sim_max_reward_4400025": 0.2832364458374902, "test/sim_max_reward_4400026": 0.9342411304560417, "test/sim_max_reward_4400027": 0.02609891701856759, "test/sim_max_reward_4400028": 0.6473667694224349, "test/sim_max_reward_4400029": 0.5291455598787175, "test/sim_max_reward_4400030": 0.994020872313396, "test/sim_max_reward_4400031": 0.9726420845261824, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.800317871401323, "test/sim_max_reward_4400034": 0.9134599668321475, "test/sim_max_reward_4400035": 0.9525913536342998, "test/sim_max_reward_4400036": 0.5418234173541092, "test/sim_max_reward_4400037": 0.9533073834117013, "test/sim_max_reward_4400038": 0.9078475039451598, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9165479095331834, "test/sim_max_reward_4400042": 0.9525972304388359, "test/sim_max_reward_4400043": 0.8397259819760698, "test/sim_max_reward_4400044": 0.9364584506001781, "test/sim_max_reward_4400045": 0.9594855339083277, "test/sim_max_reward_4400046": 0.8920898080196105, "test/sim_max_reward_4400047": 0.9647803316017606, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.40093968918786865, "train/mean_score": 0.6370382434265905, "test/mean_score": 0.5722590508216274, "val_loss": 69300.7578125} {"train_loss": -7.178689956665039, "global_step": 201642, "epoch": 4801} {"train_loss": -7.167229652404785, "global_step": 201643, "epoch": 4801} {"train_loss": -7.340471267700195, "global_step": 201644, "epoch": 4801} {"train_loss": -7.3185014724731445, "global_step": 201645, "epoch": 4801} {"train_loss": -7.297625541687012, "global_step": 201646, "epoch": 4801} {"train_loss": -7.272397041320801, "global_step": 201647, "epoch": 4801} {"train_loss": -7.251553535461426, "global_step": 201648, "epoch": 4801} {"train_loss": -7.350029945373535, "global_step": 201649, "epoch": 4801} {"train_loss": -7.241018772125244, "global_step": 201650, "epoch": 4801} {"train_loss": -7.264732837677002, "global_step": 201651, "epoch": 4801} {"train_loss": -7.244351863861084, "global_step": 201652, "epoch": 4801} {"train_loss": -7.311487674713135, "global_step": 201653, "epoch": 4801} {"train_loss": -7.238306522369385, "global_step": 201654, "epoch": 4801} {"train_loss": -7.271615982055664, "global_step": 201655, "epoch": 4801} {"train_loss": -7.206905364990234, "global_step": 201656, "epoch": 4801} {"train_loss": -7.232810974121094, "global_step": 201657, "epoch": 4801} {"train_loss": -7.2919745445251465, "global_step": 201658, "epoch": 4801} {"train_loss": -7.293232440948486, "global_step": 201659, "epoch": 4801} {"train_loss": -7.248335838317871, "global_step": 201660, "epoch": 4801} {"train_loss": -7.248856067657471, "global_step": 201661, "epoch": 4801} {"train_loss": -7.247779846191406, "global_step": 201662, "epoch": 4801} {"train_loss": -7.131056785583496, "global_step": 201663, "epoch": 4801} {"train_loss": -7.245652198791504, "global_step": 201664, "epoch": 4801} {"train_loss": -7.149585723876953, "global_step": 201665, "epoch": 4801} {"train_loss": -7.282656669616699, "global_step": 201666, "epoch": 4801} {"train_loss": -7.26965856552124, "global_step": 201667, "epoch": 4801} {"train_loss": -7.252450942993164, "global_step": 201668, "epoch": 4801} {"train_loss": -7.24461555480957, "global_step": 201669, "epoch": 4801} {"train_loss": -7.322379112243652, "global_step": 201670, "epoch": 4801} {"train_loss": -7.202539443969727, "global_step": 201671, "epoch": 4801} {"train_loss": -7.185091018676758, "global_step": 201672, "epoch": 4801} {"train_loss": -7.29615592956543, "global_step": 201673, "epoch": 4801} {"train_loss": -7.381440162658691, "global_step": 201674, "epoch": 4801} {"train_loss": -7.150793075561523, "global_step": 201675, "epoch": 4801} {"train_loss": -7.219657897949219, "global_step": 201676, "epoch": 4801} {"train_loss": -7.207187652587891, "global_step": 201677, "epoch": 4801} {"train_loss": -7.28317928314209, "global_step": 201678, "epoch": 4801} {"train_loss": -7.2260355949401855, "global_step": 201679, "epoch": 4801} {"train_loss": -7.175606727600098, "global_step": 201680, "epoch": 4801} {"train_loss": -7.200190544128418, "global_step": 201681, "epoch": 4801} {"train_loss": -7.241648197174072, "global_step": 201682, "epoch": 4801} {"train_loss": -7.248246249698457, "global_step": 201683, "epoch": 4801, "val_loss": 69084.15625} {"train_loss": -7.220732688903809, "global_step": 201684, "epoch": 4802} {"train_loss": -7.284880638122559, "global_step": 201685, "epoch": 4802} {"train_loss": -7.145846366882324, "global_step": 201686, "epoch": 4802} {"train_loss": -7.284372329711914, "global_step": 201687, "epoch": 4802} {"train_loss": -7.310092926025391, "global_step": 201688, "epoch": 4802} {"train_loss": -7.2818756103515625, "global_step": 201689, "epoch": 4802} {"train_loss": -7.2266316413879395, "global_step": 201690, "epoch": 4802} {"train_loss": -7.266510486602783, "global_step": 201691, "epoch": 4802} {"train_loss": -7.267439842224121, "global_step": 201692, "epoch": 4802} {"train_loss": -7.323935508728027, "global_step": 201693, "epoch": 4802} {"train_loss": -7.200174808502197, "global_step": 201694, "epoch": 4802} {"train_loss": -7.256806373596191, "global_step": 201695, "epoch": 4802} {"train_loss": -7.343382358551025, "global_step": 201696, "epoch": 4802} {"train_loss": -7.360401630401611, "global_step": 201697, "epoch": 4802} {"train_loss": -7.319490432739258, "global_step": 201698, "epoch": 4802} {"train_loss": -7.386036396026611, "global_step": 201699, "epoch": 4802} {"train_loss": -7.3673248291015625, "global_step": 201700, "epoch": 4802} {"train_loss": -7.362326622009277, "global_step": 201701, "epoch": 4802} {"train_loss": -7.230471611022949, "global_step": 201702, "epoch": 4802} {"train_loss": -7.208252429962158, "global_step": 201703, "epoch": 4802} {"train_loss": -7.352609634399414, "global_step": 201704, "epoch": 4802} {"train_loss": -7.136839389801025, "global_step": 201705, "epoch": 4802} {"train_loss": -7.307964324951172, "global_step": 201706, "epoch": 4802} {"train_loss": -7.201661109924316, "global_step": 201707, "epoch": 4802} {"train_loss": -7.342314720153809, "global_step": 201708, "epoch": 4802} {"train_loss": -7.20635986328125, "global_step": 201709, "epoch": 4802} {"train_loss": -7.081290245056152, "global_step": 201710, "epoch": 4802} {"train_loss": -7.2158918380737305, "global_step": 201711, "epoch": 4802} {"train_loss": -7.220415115356445, "global_step": 201712, "epoch": 4802} {"train_loss": -7.239752292633057, "global_step": 201713, "epoch": 4802} {"train_loss": -7.228094100952148, "global_step": 201714, "epoch": 4802} {"train_loss": -7.258013725280762, "global_step": 201715, "epoch": 4802} {"train_loss": -7.239148139953613, "global_step": 201716, "epoch": 4802} {"train_loss": -7.286806106567383, "global_step": 201717, "epoch": 4802} {"train_loss": -7.13720178604126, "global_step": 201718, "epoch": 4802} {"train_loss": -7.279056549072266, "global_step": 201719, "epoch": 4802} {"train_loss": -7.14006233215332, "global_step": 201720, "epoch": 4802} {"train_loss": -7.173772811889648, "global_step": 201721, "epoch": 4802} {"train_loss": -7.177859306335449, "global_step": 201722, "epoch": 4802} {"train_loss": -7.238734245300293, "global_step": 201723, "epoch": 4802} {"train_loss": -7.21427059173584, "global_step": 201724, "epoch": 4802} {"train_loss": -7.2516149906885055, "global_step": 201725, "epoch": 4802, "val_loss": 69214.359375} {"train_loss": -7.216938018798828, "global_step": 201726, "epoch": 4803} {"train_loss": -7.219482421875, "global_step": 201727, "epoch": 4803} {"train_loss": -7.240289688110352, "global_step": 201728, "epoch": 4803} {"train_loss": -7.240354537963867, "global_step": 201729, "epoch": 4803} {"train_loss": -7.227019309997559, "global_step": 201730, "epoch": 4803} {"train_loss": -7.185835361480713, "global_step": 201731, "epoch": 4803} {"train_loss": -7.176700592041016, "global_step": 201732, "epoch": 4803} {"train_loss": -7.273629188537598, "global_step": 201733, "epoch": 4803} {"train_loss": -7.215391159057617, "global_step": 201734, "epoch": 4803} {"train_loss": -7.250267028808594, "global_step": 201735, "epoch": 4803} {"train_loss": -7.205824375152588, "global_step": 201736, "epoch": 4803} {"train_loss": -7.270815849304199, "global_step": 201737, "epoch": 4803} {"train_loss": -7.235394477844238, "global_step": 201738, "epoch": 4803} {"train_loss": -7.324206352233887, "global_step": 201739, "epoch": 4803} {"train_loss": -7.188874244689941, "global_step": 201740, "epoch": 4803} {"train_loss": -7.178284168243408, "global_step": 201741, "epoch": 4803} {"train_loss": -7.328205585479736, "global_step": 201742, "epoch": 4803} {"train_loss": -7.288625240325928, "global_step": 201743, "epoch": 4803} {"train_loss": -7.268326282501221, "global_step": 201744, "epoch": 4803} {"train_loss": -7.269554138183594, "global_step": 201745, "epoch": 4803} {"train_loss": -7.279928207397461, "global_step": 201746, "epoch": 4803} {"train_loss": -7.221041679382324, "global_step": 201747, "epoch": 4803} {"train_loss": -7.297528266906738, "global_step": 201748, "epoch": 4803} {"train_loss": -7.337846755981445, "global_step": 201749, "epoch": 4803} {"train_loss": -7.329253196716309, "global_step": 201750, "epoch": 4803} {"train_loss": -7.246963024139404, "global_step": 201751, "epoch": 4803} {"train_loss": -7.111171722412109, "global_step": 201752, "epoch": 4803} {"train_loss": -7.250143527984619, "global_step": 201753, "epoch": 4803} {"train_loss": -7.245898723602295, "global_step": 201754, "epoch": 4803} {"train_loss": -7.27223539352417, "global_step": 201755, "epoch": 4803} {"train_loss": -7.2606658935546875, "global_step": 201756, "epoch": 4803} {"train_loss": -7.314212322235107, "global_step": 201757, "epoch": 4803} {"train_loss": -7.2842607498168945, "global_step": 201758, "epoch": 4803} {"train_loss": -7.3488850593566895, "global_step": 201759, "epoch": 4803} {"train_loss": -7.211134910583496, "global_step": 201760, "epoch": 4803} {"train_loss": -7.266232013702393, "global_step": 201761, "epoch": 4803} {"train_loss": -7.267223358154297, "global_step": 201762, "epoch": 4803} {"train_loss": -7.293003082275391, "global_step": 201763, "epoch": 4803} {"train_loss": -7.337542533874512, "global_step": 201764, "epoch": 4803} {"train_loss": -7.280559539794922, "global_step": 201765, "epoch": 4803} {"train_loss": -7.239711761474609, "global_step": 201766, "epoch": 4803} {"train_loss": -7.258834486915951, "global_step": 201767, "epoch": 4803, "val_loss": 69032.8359375} {"train_loss": -7.26085901260376, "global_step": 201768, "epoch": 4804} {"train_loss": -7.345881938934326, "global_step": 201769, "epoch": 4804} {"train_loss": -7.309414863586426, "global_step": 201770, "epoch": 4804} {"train_loss": -7.299190044403076, "global_step": 201771, "epoch": 4804} {"train_loss": -7.168198108673096, "global_step": 201772, "epoch": 4804} {"train_loss": -7.0510029792785645, "global_step": 201773, "epoch": 4804} {"train_loss": -7.260770797729492, "global_step": 201774, "epoch": 4804} {"train_loss": -7.271712303161621, "global_step": 201775, "epoch": 4804} {"train_loss": -7.152866363525391, "global_step": 201776, "epoch": 4804} {"train_loss": -7.235800743103027, "global_step": 201777, "epoch": 4804} {"train_loss": -7.2677741050720215, "global_step": 201778, "epoch": 4804} {"train_loss": -7.185620307922363, "global_step": 201779, "epoch": 4804} {"train_loss": -7.249907970428467, "global_step": 201780, "epoch": 4804} {"train_loss": -7.2321062088012695, "global_step": 201781, "epoch": 4804} {"train_loss": -7.0851898193359375, "global_step": 201782, "epoch": 4804} {"train_loss": -7.094679355621338, "global_step": 201783, "epoch": 4804} {"train_loss": -7.272048473358154, "global_step": 201784, "epoch": 4804} {"train_loss": -7.101556777954102, "global_step": 201785, "epoch": 4804} {"train_loss": -7.255899906158447, "global_step": 201786, "epoch": 4804} {"train_loss": -7.198702812194824, "global_step": 201787, "epoch": 4804} {"train_loss": -7.2094221115112305, "global_step": 201788, "epoch": 4804} {"train_loss": -7.187166213989258, "global_step": 201789, "epoch": 4804} {"train_loss": -7.181903839111328, "global_step": 201790, "epoch": 4804} {"train_loss": -7.2359418869018555, "global_step": 201791, "epoch": 4804} {"train_loss": -7.241794109344482, "global_step": 201792, "epoch": 4804} {"train_loss": -7.150094985961914, "global_step": 201793, "epoch": 4804} {"train_loss": -7.086353302001953, "global_step": 201794, "epoch": 4804} {"train_loss": -7.259385585784912, "global_step": 201795, "epoch": 4804} {"train_loss": -7.216553688049316, "global_step": 201796, "epoch": 4804} {"train_loss": -7.359264373779297, "global_step": 201797, "epoch": 4804} {"train_loss": -7.246901512145996, "global_step": 201798, "epoch": 4804} {"train_loss": -7.1439313888549805, "global_step": 201799, "epoch": 4804} {"train_loss": -7.2571516036987305, "global_step": 201800, "epoch": 4804} {"train_loss": -7.210428714752197, "global_step": 201801, "epoch": 4804} {"train_loss": -7.144166946411133, "global_step": 201802, "epoch": 4804} {"train_loss": -7.239710330963135, "global_step": 201803, "epoch": 4804} {"train_loss": -7.271317958831787, "global_step": 201804, "epoch": 4804} {"train_loss": -7.211908340454102, "global_step": 201805, "epoch": 4804} {"train_loss": -7.046492576599121, "global_step": 201806, "epoch": 4804} {"train_loss": -7.231956481933594, "global_step": 201807, "epoch": 4804} {"train_loss": -7.153303146362305, "global_step": 201808, "epoch": 4804} {"train_loss": -7.207194771085467, "global_step": 201809, "epoch": 4804, "val_loss": 69097.8046875} {"train_loss": -7.293455123901367, "global_step": 201810, "epoch": 4805} {"train_loss": -7.246620178222656, "global_step": 201811, "epoch": 4805} {"train_loss": -7.180884838104248, "global_step": 201812, "epoch": 4805} {"train_loss": -7.233799934387207, "global_step": 201813, "epoch": 4805} {"train_loss": -7.28092098236084, "global_step": 201814, "epoch": 4805} {"train_loss": -7.238193511962891, "global_step": 201815, "epoch": 4805} {"train_loss": -7.299129962921143, "global_step": 201816, "epoch": 4805} {"train_loss": -7.290050983428955, "global_step": 201817, "epoch": 4805} {"train_loss": -7.2784104347229, "global_step": 201818, "epoch": 4805} {"train_loss": -7.316864490509033, "global_step": 201819, "epoch": 4805} {"train_loss": -7.337634563446045, "global_step": 201820, "epoch": 4805} {"train_loss": -7.2844624519348145, "global_step": 201821, "epoch": 4805} {"train_loss": -7.33213996887207, "global_step": 201822, "epoch": 4805} {"train_loss": -7.258917331695557, "global_step": 201823, "epoch": 4805} {"train_loss": -7.325056076049805, "global_step": 201824, "epoch": 4805} {"train_loss": -7.209908962249756, "global_step": 201825, "epoch": 4805} {"train_loss": -7.298877716064453, "global_step": 201826, "epoch": 4805} {"train_loss": -7.314374923706055, "global_step": 201827, "epoch": 4805} {"train_loss": -7.366335868835449, "global_step": 201828, "epoch": 4805} {"train_loss": -7.272620677947998, "global_step": 201829, "epoch": 4805} {"train_loss": -7.3018293380737305, "global_step": 201830, "epoch": 4805} {"train_loss": -7.2477545738220215, "global_step": 201831, "epoch": 4805} {"train_loss": -7.359346389770508, "global_step": 201832, "epoch": 4805} {"train_loss": -7.378526210784912, "global_step": 201833, "epoch": 4805} {"train_loss": -7.146325588226318, "global_step": 201834, "epoch": 4805} {"train_loss": -7.295673370361328, "global_step": 201835, "epoch": 4805} {"train_loss": -7.198999404907227, "global_step": 201836, "epoch": 4805} {"train_loss": -7.201937198638916, "global_step": 201837, "epoch": 4805} {"train_loss": -7.171688079833984, "global_step": 201838, "epoch": 4805} {"train_loss": -7.27311897277832, "global_step": 201839, "epoch": 4805} {"train_loss": -7.3081207275390625, "global_step": 201840, "epoch": 4805} {"train_loss": -7.231514930725098, "global_step": 201841, "epoch": 4805} {"train_loss": -7.163979530334473, "global_step": 201842, "epoch": 4805} {"train_loss": -7.223879814147949, "global_step": 201843, "epoch": 4805} {"train_loss": -7.177086353302002, "global_step": 201844, "epoch": 4805} {"train_loss": -7.303570747375488, "global_step": 201845, "epoch": 4805} {"train_loss": -7.2571563720703125, "global_step": 201846, "epoch": 4805} {"train_loss": -7.266575813293457, "global_step": 201847, "epoch": 4805} {"train_loss": -7.349556922912598, "global_step": 201848, "epoch": 4805} {"train_loss": -7.2413201332092285, "global_step": 201849, "epoch": 4805} {"train_loss": -7.295963287353516, "global_step": 201850, "epoch": 4805} {"train_loss": -7.269742148263114, "global_step": 201851, "epoch": 4805, "val_loss": 69121.2109375} {"train_loss": -7.289977073669434, "global_step": 201852, "epoch": 4806} {"train_loss": -7.2404608726501465, "global_step": 201853, "epoch": 4806} {"train_loss": -7.199707984924316, "global_step": 201854, "epoch": 4806} {"train_loss": -7.297747611999512, "global_step": 201855, "epoch": 4806} {"train_loss": -7.32733154296875, "global_step": 201856, "epoch": 4806} {"train_loss": -7.253662586212158, "global_step": 201857, "epoch": 4806} {"train_loss": -7.186397552490234, "global_step": 201858, "epoch": 4806} {"train_loss": -7.192722797393799, "global_step": 201859, "epoch": 4806} {"train_loss": -7.233128547668457, "global_step": 201860, "epoch": 4806} {"train_loss": -7.140558242797852, "global_step": 201861, "epoch": 4806} {"train_loss": -7.114567756652832, "global_step": 201862, "epoch": 4806} {"train_loss": -7.209155082702637, "global_step": 201863, "epoch": 4806} {"train_loss": -7.343766212463379, "global_step": 201864, "epoch": 4806} {"train_loss": -7.240303039550781, "global_step": 201865, "epoch": 4806} {"train_loss": -7.174288749694824, "global_step": 201866, "epoch": 4806} {"train_loss": -7.209356784820557, "global_step": 201867, "epoch": 4806} {"train_loss": -7.094799995422363, "global_step": 201868, "epoch": 4806} {"train_loss": -7.238486289978027, "global_step": 201869, "epoch": 4806} {"train_loss": -7.235898971557617, "global_step": 201870, "epoch": 4806} {"train_loss": -7.115761756896973, "global_step": 201871, "epoch": 4806} {"train_loss": -7.399533748626709, "global_step": 201872, "epoch": 4806} {"train_loss": -7.263298034667969, "global_step": 201873, "epoch": 4806} {"train_loss": -7.131787300109863, "global_step": 201874, "epoch": 4806} {"train_loss": -7.224326133728027, "global_step": 201875, "epoch": 4806} {"train_loss": -7.187015533447266, "global_step": 201876, "epoch": 4806} {"train_loss": -7.318927764892578, "global_step": 201877, "epoch": 4806} {"train_loss": -7.119756698608398, "global_step": 201878, "epoch": 4806} {"train_loss": -7.1529436111450195, "global_step": 201879, "epoch": 4806} {"train_loss": -7.179835796356201, "global_step": 201880, "epoch": 4806} {"train_loss": -7.15326452255249, "global_step": 201881, "epoch": 4806} {"train_loss": -7.19757604598999, "global_step": 201882, "epoch": 4806} {"train_loss": -7.092858791351318, "global_step": 201883, "epoch": 4806} {"train_loss": -7.296691417694092, "global_step": 201884, "epoch": 4806} {"train_loss": -7.169737339019775, "global_step": 201885, "epoch": 4806} {"train_loss": -7.252196788787842, "global_step": 201886, "epoch": 4806} {"train_loss": -7.007551670074463, "global_step": 201887, "epoch": 4806} {"train_loss": -7.187333106994629, "global_step": 201888, "epoch": 4806} {"train_loss": -7.231025218963623, "global_step": 201889, "epoch": 4806} {"train_loss": -7.04814338684082, "global_step": 201890, "epoch": 4806} {"train_loss": -7.060764312744141, "global_step": 201891, "epoch": 4806} {"train_loss": -7.131106376647949, "global_step": 201892, "epoch": 4806} {"train_loss": -7.195966482162476, "global_step": 201893, "epoch": 4806, "val_loss": 69222.328125} {"train_loss": -7.096775054931641, "global_step": 201894, "epoch": 4807} {"train_loss": -7.1186065673828125, "global_step": 201895, "epoch": 4807} {"train_loss": -7.180693626403809, "global_step": 201896, "epoch": 4807} {"train_loss": -7.115354537963867, "global_step": 201897, "epoch": 4807} {"train_loss": -7.135126113891602, "global_step": 201898, "epoch": 4807} {"train_loss": -7.242801189422607, "global_step": 201899, "epoch": 4807} {"train_loss": -7.075383186340332, "global_step": 201900, "epoch": 4807} {"train_loss": -7.187688827514648, "global_step": 201901, "epoch": 4807} {"train_loss": -6.993597030639648, "global_step": 201902, "epoch": 4807} {"train_loss": -7.069849014282227, "global_step": 201903, "epoch": 4807} {"train_loss": -7.150112152099609, "global_step": 201904, "epoch": 4807} {"train_loss": -7.118403911590576, "global_step": 201905, "epoch": 4807} {"train_loss": -7.074359893798828, "global_step": 201906, "epoch": 4807} {"train_loss": -7.265703201293945, "global_step": 201907, "epoch": 4807} {"train_loss": -7.107036590576172, "global_step": 201908, "epoch": 4807} {"train_loss": -7.198465824127197, "global_step": 201909, "epoch": 4807} {"train_loss": -7.137415885925293, "global_step": 201910, "epoch": 4807} {"train_loss": -7.210860729217529, "global_step": 201911, "epoch": 4807} {"train_loss": -7.250685691833496, "global_step": 201912, "epoch": 4807} {"train_loss": -7.209902763366699, "global_step": 201913, "epoch": 4807} {"train_loss": -7.094080924987793, "global_step": 201914, "epoch": 4807} {"train_loss": -7.164305686950684, "global_step": 201915, "epoch": 4807} {"train_loss": -7.074572563171387, "global_step": 201916, "epoch": 4807} {"train_loss": -7.0900115966796875, "global_step": 201917, "epoch": 4807} {"train_loss": -7.228178024291992, "global_step": 201918, "epoch": 4807} {"train_loss": -7.2484002113342285, "global_step": 201919, "epoch": 4807} {"train_loss": -7.076624870300293, "global_step": 201920, "epoch": 4807} {"train_loss": -7.162455081939697, "global_step": 201921, "epoch": 4807} {"train_loss": -7.151001930236816, "global_step": 201922, "epoch": 4807} {"train_loss": -7.196840286254883, "global_step": 201923, "epoch": 4807} {"train_loss": -7.21066427230835, "global_step": 201924, "epoch": 4807} {"train_loss": -6.975957870483398, "global_step": 201925, "epoch": 4807} {"train_loss": -7.206618309020996, "global_step": 201926, "epoch": 4807} {"train_loss": -7.214623928070068, "global_step": 201927, "epoch": 4807} {"train_loss": -7.061398029327393, "global_step": 201928, "epoch": 4807} {"train_loss": -7.179710865020752, "global_step": 201929, "epoch": 4807} {"train_loss": -7.276017189025879, "global_step": 201930, "epoch": 4807} {"train_loss": -7.0778608322143555, "global_step": 201931, "epoch": 4807} {"train_loss": -7.219585418701172, "global_step": 201932, "epoch": 4807} {"train_loss": -7.174128532409668, "global_step": 201933, "epoch": 4807} {"train_loss": -7.06105899810791, "global_step": 201934, "epoch": 4807} {"train_loss": -7.149989264351981, "global_step": 201935, "epoch": 4807, "val_loss": 69028.5078125} {"train_loss": -7.191546440124512, "global_step": 201936, "epoch": 4808} {"train_loss": -7.203239917755127, "global_step": 201937, "epoch": 4808} {"train_loss": -7.2706780433654785, "global_step": 201938, "epoch": 4808} {"train_loss": -7.17540979385376, "global_step": 201939, "epoch": 4808} {"train_loss": -7.223762512207031, "global_step": 201940, "epoch": 4808} {"train_loss": -7.141510963439941, "global_step": 201941, "epoch": 4808} {"train_loss": -7.275872230529785, "global_step": 201942, "epoch": 4808} {"train_loss": -7.233705520629883, "global_step": 201943, "epoch": 4808} {"train_loss": -7.203559875488281, "global_step": 201944, "epoch": 4808} {"train_loss": -7.229432106018066, "global_step": 201945, "epoch": 4808} {"train_loss": -7.315845489501953, "global_step": 201946, "epoch": 4808} {"train_loss": -7.14035701751709, "global_step": 201947, "epoch": 4808} {"train_loss": -7.1368513107299805, "global_step": 201948, "epoch": 4808} {"train_loss": -7.135772705078125, "global_step": 201949, "epoch": 4808} {"train_loss": -7.201396942138672, "global_step": 201950, "epoch": 4808} {"train_loss": -7.233186721801758, "global_step": 201951, "epoch": 4808} {"train_loss": -7.227402210235596, "global_step": 201952, "epoch": 4808} {"train_loss": -7.217650413513184, "global_step": 201953, "epoch": 4808} {"train_loss": -7.159928321838379, "global_step": 201954, "epoch": 4808} {"train_loss": -7.245626449584961, "global_step": 201955, "epoch": 4808} {"train_loss": -7.2163896560668945, "global_step": 201956, "epoch": 4808} {"train_loss": -7.270112991333008, "global_step": 201957, "epoch": 4808} {"train_loss": -7.180917739868164, "global_step": 201958, "epoch": 4808} {"train_loss": -7.1835432052612305, "global_step": 201959, "epoch": 4808} {"train_loss": -7.198014259338379, "global_step": 201960, "epoch": 4808} {"train_loss": -7.21476411819458, "global_step": 201961, "epoch": 4808} {"train_loss": -7.211268424987793, "global_step": 201962, "epoch": 4808} {"train_loss": -7.253034591674805, "global_step": 201963, "epoch": 4808} {"train_loss": -7.1324357986450195, "global_step": 201964, "epoch": 4808} {"train_loss": -7.203546047210693, "global_step": 201965, "epoch": 4808} {"train_loss": -7.231137752532959, "global_step": 201966, "epoch": 4808} {"train_loss": -7.321295261383057, "global_step": 201967, "epoch": 4808} {"train_loss": -7.229045867919922, "global_step": 201968, "epoch": 4808} {"train_loss": -7.214410305023193, "global_step": 201969, "epoch": 4808} {"train_loss": -7.1338629722595215, "global_step": 201970, "epoch": 4808} {"train_loss": -7.287620544433594, "global_step": 201971, "epoch": 4808} {"train_loss": -7.24338436126709, "global_step": 201972, "epoch": 4808} {"train_loss": -7.245352268218994, "global_step": 201973, "epoch": 4808} {"train_loss": -7.098543167114258, "global_step": 201974, "epoch": 4808} {"train_loss": -7.260007381439209, "global_step": 201975, "epoch": 4808} {"train_loss": -7.362491607666016, "global_step": 201976, "epoch": 4808} {"train_loss": -7.217653501601446, "global_step": 201977, "epoch": 4808, "val_loss": 69183.6796875} {"train_loss": -7.3318328857421875, "global_step": 201978, "epoch": 4809} {"train_loss": -7.34958028793335, "global_step": 201979, "epoch": 4809} {"train_loss": -7.298626899719238, "global_step": 201980, "epoch": 4809} {"train_loss": -7.315244674682617, "global_step": 201981, "epoch": 4809} {"train_loss": -7.40807580947876, "global_step": 201982, "epoch": 4809} {"train_loss": -7.334862232208252, "global_step": 201983, "epoch": 4809} {"train_loss": -7.39849853515625, "global_step": 201984, "epoch": 4809} {"train_loss": -7.33577823638916, "global_step": 201985, "epoch": 4809} {"train_loss": -7.303180694580078, "global_step": 201986, "epoch": 4809} {"train_loss": -7.298053741455078, "global_step": 201987, "epoch": 4809} {"train_loss": -7.439064025878906, "global_step": 201988, "epoch": 4809} {"train_loss": -7.292387962341309, "global_step": 201989, "epoch": 4809} {"train_loss": -7.312892913818359, "global_step": 201990, "epoch": 4809} {"train_loss": -7.201671600341797, "global_step": 201991, "epoch": 4809} {"train_loss": -7.238348007202148, "global_step": 201992, "epoch": 4809} {"train_loss": -7.228723526000977, "global_step": 201993, "epoch": 4809} {"train_loss": -7.3858771324157715, "global_step": 201994, "epoch": 4809} {"train_loss": -7.2396559715271, "global_step": 201995, "epoch": 4809} {"train_loss": -7.2066650390625, "global_step": 201996, "epoch": 4809} {"train_loss": -7.353564262390137, "global_step": 201997, "epoch": 4809} {"train_loss": -7.276905536651611, "global_step": 201998, "epoch": 4809} {"train_loss": -7.162575721740723, "global_step": 201999, "epoch": 4809} {"train_loss": -7.104189395904541, "global_step": 202000, "epoch": 4809} {"train_loss": -7.4252400398254395, "global_step": 202001, "epoch": 4809} {"train_loss": -7.13582181930542, "global_step": 202002, "epoch": 4809} {"train_loss": -7.051841735839844, "global_step": 202003, "epoch": 4809} {"train_loss": -7.257763862609863, "global_step": 202004, "epoch": 4809} {"train_loss": -7.115099906921387, "global_step": 202005, "epoch": 4809} {"train_loss": -7.199180603027344, "global_step": 202006, "epoch": 4809} {"train_loss": -7.128288745880127, "global_step": 202007, "epoch": 4809} {"train_loss": -7.1633195877075195, "global_step": 202008, "epoch": 4809} {"train_loss": -7.184455394744873, "global_step": 202009, "epoch": 4809} {"train_loss": -7.205124378204346, "global_step": 202010, "epoch": 4809} {"train_loss": -7.253169059753418, "global_step": 202011, "epoch": 4809} {"train_loss": -7.2101030349731445, "global_step": 202012, "epoch": 4809} {"train_loss": -7.162925720214844, "global_step": 202013, "epoch": 4809} {"train_loss": -7.205277442932129, "global_step": 202014, "epoch": 4809} {"train_loss": -7.171652317047119, "global_step": 202015, "epoch": 4809} {"train_loss": -7.309084415435791, "global_step": 202016, "epoch": 4809} {"train_loss": -7.19802188873291, "global_step": 202017, "epoch": 4809} {"train_loss": -7.2048139572143555, "global_step": 202018, "epoch": 4809} {"train_loss": -7.255834988185337, "global_step": 202019, "epoch": 4809, "val_loss": 69044.6328125} {"train_loss": -7.112262725830078, "global_step": 202020, "epoch": 4810} {"train_loss": -7.146456718444824, "global_step": 202021, "epoch": 4810} {"train_loss": -7.230249404907227, "global_step": 202022, "epoch": 4810} {"train_loss": -7.212477207183838, "global_step": 202023, "epoch": 4810} {"train_loss": -7.3231024742126465, "global_step": 202024, "epoch": 4810} {"train_loss": -7.225550651550293, "global_step": 202025, "epoch": 4810} {"train_loss": -7.2941694259643555, "global_step": 202026, "epoch": 4810} {"train_loss": -7.1904497146606445, "global_step": 202027, "epoch": 4810} {"train_loss": -7.293581008911133, "global_step": 202028, "epoch": 4810} {"train_loss": -7.285007476806641, "global_step": 202029, "epoch": 4810} {"train_loss": -7.315490245819092, "global_step": 202030, "epoch": 4810} {"train_loss": -7.324503421783447, "global_step": 202031, "epoch": 4810} {"train_loss": -7.399762153625488, "global_step": 202032, "epoch": 4810} {"train_loss": -7.418371200561523, "global_step": 202033, "epoch": 4810} {"train_loss": -7.371705055236816, "global_step": 202034, "epoch": 4810} {"train_loss": -7.296064376831055, "global_step": 202035, "epoch": 4810} {"train_loss": -7.286016941070557, "global_step": 202036, "epoch": 4810} {"train_loss": -7.30659818649292, "global_step": 202037, "epoch": 4810} {"train_loss": -7.248656272888184, "global_step": 202038, "epoch": 4810} {"train_loss": -7.223235130310059, "global_step": 202039, "epoch": 4810} {"train_loss": -7.273625373840332, "global_step": 202040, "epoch": 4810} {"train_loss": -7.302713871002197, "global_step": 202041, "epoch": 4810} {"train_loss": -7.377869129180908, "global_step": 202042, "epoch": 4810} {"train_loss": -7.170893669128418, "global_step": 202043, "epoch": 4810} {"train_loss": -7.390434741973877, "global_step": 202044, "epoch": 4810} {"train_loss": -7.254452705383301, "global_step": 202045, "epoch": 4810} {"train_loss": -7.330315589904785, "global_step": 202046, "epoch": 4810} {"train_loss": -7.195308685302734, "global_step": 202047, "epoch": 4810} {"train_loss": -7.230030536651611, "global_step": 202048, "epoch": 4810} {"train_loss": -7.30612850189209, "global_step": 202049, "epoch": 4810} {"train_loss": -7.223155975341797, "global_step": 202050, "epoch": 4810} {"train_loss": -7.314589023590088, "global_step": 202051, "epoch": 4810} {"train_loss": -7.274223327636719, "global_step": 202052, "epoch": 4810} {"train_loss": -7.318222999572754, "global_step": 202053, "epoch": 4810} {"train_loss": -7.030093669891357, "global_step": 202054, "epoch": 4810} {"train_loss": -7.232542037963867, "global_step": 202055, "epoch": 4810} {"train_loss": -7.270733833312988, "global_step": 202056, "epoch": 4810} {"train_loss": -7.122073650360107, "global_step": 202057, "epoch": 4810} {"train_loss": -7.1415510177612305, "global_step": 202058, "epoch": 4810} {"train_loss": -7.064637184143066, "global_step": 202059, "epoch": 4810} {"train_loss": -7.12172794342041, "global_step": 202060, "epoch": 4810} {"train_loss": -7.250654004869007, "global_step": 202061, "epoch": 4810, "val_loss": 69303.53125} {"train_loss": -7.059473514556885, "global_step": 202062, "epoch": 4811} {"train_loss": -7.15666389465332, "global_step": 202063, "epoch": 4811} {"train_loss": -7.179399013519287, "global_step": 202064, "epoch": 4811} {"train_loss": -7.162907600402832, "global_step": 202065, "epoch": 4811} {"train_loss": -7.27001953125, "global_step": 202066, "epoch": 4811} {"train_loss": -7.10734748840332, "global_step": 202067, "epoch": 4811} {"train_loss": -7.288702487945557, "global_step": 202068, "epoch": 4811} {"train_loss": -7.238885402679443, "global_step": 202069, "epoch": 4811} {"train_loss": -7.221012115478516, "global_step": 202070, "epoch": 4811} {"train_loss": -7.279427528381348, "global_step": 202071, "epoch": 4811} {"train_loss": -7.238014221191406, "global_step": 202072, "epoch": 4811} {"train_loss": -7.302175521850586, "global_step": 202073, "epoch": 4811} {"train_loss": -7.196720123291016, "global_step": 202074, "epoch": 4811} {"train_loss": -7.224558353424072, "global_step": 202075, "epoch": 4811} {"train_loss": -7.256343841552734, "global_step": 202076, "epoch": 4811} {"train_loss": -7.1539106369018555, "global_step": 202077, "epoch": 4811} {"train_loss": -7.288122653961182, "global_step": 202078, "epoch": 4811} {"train_loss": -7.231261253356934, "global_step": 202079, "epoch": 4811} {"train_loss": -7.254642486572266, "global_step": 202080, "epoch": 4811} {"train_loss": -7.212788105010986, "global_step": 202081, "epoch": 4811} {"train_loss": -7.2082414627075195, "global_step": 202082, "epoch": 4811} {"train_loss": -7.316020965576172, "global_step": 202083, "epoch": 4811} {"train_loss": -7.1446533203125, "global_step": 202084, "epoch": 4811} {"train_loss": -7.247359275817871, "global_step": 202085, "epoch": 4811} {"train_loss": -7.193614959716797, "global_step": 202086, "epoch": 4811} {"train_loss": -7.186450481414795, "global_step": 202087, "epoch": 4811} {"train_loss": -7.252585411071777, "global_step": 202088, "epoch": 4811} {"train_loss": -7.278031349182129, "global_step": 202089, "epoch": 4811} {"train_loss": -7.276572227478027, "global_step": 202090, "epoch": 4811} {"train_loss": -7.305686950683594, "global_step": 202091, "epoch": 4811} {"train_loss": -7.232208251953125, "global_step": 202092, "epoch": 4811} {"train_loss": -7.182997703552246, "global_step": 202093, "epoch": 4811} {"train_loss": -7.226655960083008, "global_step": 202094, "epoch": 4811} {"train_loss": -7.242400646209717, "global_step": 202095, "epoch": 4811} {"train_loss": -7.209572792053223, "global_step": 202096, "epoch": 4811} {"train_loss": -7.293797492980957, "global_step": 202097, "epoch": 4811} {"train_loss": -7.229907989501953, "global_step": 202098, "epoch": 4811} {"train_loss": -7.231225967407227, "global_step": 202099, "epoch": 4811} {"train_loss": -7.236973762512207, "global_step": 202100, "epoch": 4811} {"train_loss": -7.287739276885986, "global_step": 202101, "epoch": 4811} {"train_loss": -7.207213401794434, "global_step": 202102, "epoch": 4811} {"train_loss": -7.228707472483317, "global_step": 202103, "epoch": 4811, "val_loss": 68964.78125} {"train_loss": -7.271034240722656, "global_step": 202104, "epoch": 4812} {"train_loss": -7.302948474884033, "global_step": 202105, "epoch": 4812} {"train_loss": -7.269871711730957, "global_step": 202106, "epoch": 4812} {"train_loss": -7.378512382507324, "global_step": 202107, "epoch": 4812} {"train_loss": -7.301855087280273, "global_step": 202108, "epoch": 4812} {"train_loss": -7.278974533081055, "global_step": 202109, "epoch": 4812} {"train_loss": -7.272783279418945, "global_step": 202110, "epoch": 4812} {"train_loss": -7.29109001159668, "global_step": 202111, "epoch": 4812} {"train_loss": -7.345156669616699, "global_step": 202112, "epoch": 4812} {"train_loss": -7.253146648406982, "global_step": 202113, "epoch": 4812} {"train_loss": -7.257282733917236, "global_step": 202114, "epoch": 4812} {"train_loss": -7.395906925201416, "global_step": 202115, "epoch": 4812} {"train_loss": -7.258993625640869, "global_step": 202116, "epoch": 4812} {"train_loss": -7.307696342468262, "global_step": 202117, "epoch": 4812} {"train_loss": -7.2951202392578125, "global_step": 202118, "epoch": 4812} {"train_loss": -7.239884853363037, "global_step": 202119, "epoch": 4812} {"train_loss": -7.400611400604248, "global_step": 202120, "epoch": 4812} {"train_loss": -7.185924530029297, "global_step": 202121, "epoch": 4812} {"train_loss": -7.229560375213623, "global_step": 202122, "epoch": 4812} {"train_loss": -7.295295238494873, "global_step": 202123, "epoch": 4812} {"train_loss": -7.218645095825195, "global_step": 202124, "epoch": 4812} {"train_loss": -7.186291217803955, "global_step": 202125, "epoch": 4812} {"train_loss": -7.15975284576416, "global_step": 202126, "epoch": 4812} {"train_loss": -7.234795570373535, "global_step": 202127, "epoch": 4812} {"train_loss": -7.287816524505615, "global_step": 202128, "epoch": 4812} {"train_loss": -7.258661270141602, "global_step": 202129, "epoch": 4812} {"train_loss": -7.20848274230957, "global_step": 202130, "epoch": 4812} {"train_loss": -7.285411834716797, "global_step": 202131, "epoch": 4812} {"train_loss": -7.212611198425293, "global_step": 202132, "epoch": 4812} {"train_loss": -7.2768778800964355, "global_step": 202133, "epoch": 4812} {"train_loss": -7.177604675292969, "global_step": 202134, "epoch": 4812} {"train_loss": -7.270569324493408, "global_step": 202135, "epoch": 4812} {"train_loss": -7.178000450134277, "global_step": 202136, "epoch": 4812} {"train_loss": -7.238346099853516, "global_step": 202137, "epoch": 4812} {"train_loss": -7.104358673095703, "global_step": 202138, "epoch": 4812} {"train_loss": -7.125262260437012, "global_step": 202139, "epoch": 4812} {"train_loss": -7.255987644195557, "global_step": 202140, "epoch": 4812} {"train_loss": -7.147931098937988, "global_step": 202141, "epoch": 4812} {"train_loss": -7.131966590881348, "global_step": 202142, "epoch": 4812} {"train_loss": -7.340149879455566, "global_step": 202143, "epoch": 4812} {"train_loss": -7.245824813842773, "global_step": 202144, "epoch": 4812} {"train_loss": -7.2532341820853095, "global_step": 202145, "epoch": 4812, "val_loss": 69091.5078125} {"train_loss": -7.231809616088867, "global_step": 202146, "epoch": 4813} {"train_loss": -7.214753150939941, "global_step": 202147, "epoch": 4813} {"train_loss": -7.244854927062988, "global_step": 202148, "epoch": 4813} {"train_loss": -7.186952114105225, "global_step": 202149, "epoch": 4813} {"train_loss": -7.217095375061035, "global_step": 202150, "epoch": 4813} {"train_loss": -7.2354302406311035, "global_step": 202151, "epoch": 4813} {"train_loss": -7.198019981384277, "global_step": 202152, "epoch": 4813} {"train_loss": -7.11641788482666, "global_step": 202153, "epoch": 4813} {"train_loss": -7.240383625030518, "global_step": 202154, "epoch": 4813} {"train_loss": -7.202974796295166, "global_step": 202155, "epoch": 4813} {"train_loss": -7.244339942932129, "global_step": 202156, "epoch": 4813} {"train_loss": -7.253091812133789, "global_step": 202157, "epoch": 4813} {"train_loss": -7.243045806884766, "global_step": 202158, "epoch": 4813} {"train_loss": -7.195837020874023, "global_step": 202159, "epoch": 4813} {"train_loss": -7.227840423583984, "global_step": 202160, "epoch": 4813} {"train_loss": -7.18462610244751, "global_step": 202161, "epoch": 4813} {"train_loss": -7.204493999481201, "global_step": 202162, "epoch": 4813} {"train_loss": -7.055214881896973, "global_step": 202163, "epoch": 4813} {"train_loss": -7.144181251525879, "global_step": 202164, "epoch": 4813} {"train_loss": -7.27281379699707, "global_step": 202165, "epoch": 4813} {"train_loss": -7.087615966796875, "global_step": 202166, "epoch": 4813} {"train_loss": -7.217815399169922, "global_step": 202167, "epoch": 4813} {"train_loss": -7.286402702331543, "global_step": 202168, "epoch": 4813} {"train_loss": -7.178193092346191, "global_step": 202169, "epoch": 4813} {"train_loss": -7.185031890869141, "global_step": 202170, "epoch": 4813} {"train_loss": -7.289597988128662, "global_step": 202171, "epoch": 4813} {"train_loss": -7.178093910217285, "global_step": 202172, "epoch": 4813} {"train_loss": -7.238753318786621, "global_step": 202173, "epoch": 4813} {"train_loss": -7.27225399017334, "global_step": 202174, "epoch": 4813} {"train_loss": -7.2741780281066895, "global_step": 202175, "epoch": 4813} {"train_loss": -7.312207221984863, "global_step": 202176, "epoch": 4813} {"train_loss": -7.262929916381836, "global_step": 202177, "epoch": 4813} {"train_loss": -7.203197002410889, "global_step": 202178, "epoch": 4813} {"train_loss": -7.202045917510986, "global_step": 202179, "epoch": 4813} {"train_loss": -7.233138084411621, "global_step": 202180, "epoch": 4813} {"train_loss": -7.225827693939209, "global_step": 202181, "epoch": 4813} {"train_loss": -7.290774822235107, "global_step": 202182, "epoch": 4813} {"train_loss": -7.302931785583496, "global_step": 202183, "epoch": 4813} {"train_loss": -7.3051958084106445, "global_step": 202184, "epoch": 4813} {"train_loss": -7.1515398025512695, "global_step": 202185, "epoch": 4813} {"train_loss": -7.2240891456604, "global_step": 202186, "epoch": 4813} {"train_loss": -7.220668917610531, "global_step": 202187, "epoch": 4813, "val_loss": 69108.9921875} {"train_loss": -7.34699010848999, "global_step": 202188, "epoch": 4814} {"train_loss": -7.323423862457275, "global_step": 202189, "epoch": 4814} {"train_loss": -7.230359077453613, "global_step": 202190, "epoch": 4814} {"train_loss": -7.277866363525391, "global_step": 202191, "epoch": 4814} {"train_loss": -7.373955726623535, "global_step": 202192, "epoch": 4814} {"train_loss": -7.3449201583862305, "global_step": 202193, "epoch": 4814} {"train_loss": -7.3475518226623535, "global_step": 202194, "epoch": 4814} {"train_loss": -7.371804237365723, "global_step": 202195, "epoch": 4814} {"train_loss": -7.273791790008545, "global_step": 202196, "epoch": 4814} {"train_loss": -7.301026344299316, "global_step": 202197, "epoch": 4814} {"train_loss": -7.255507469177246, "global_step": 202198, "epoch": 4814} {"train_loss": -7.246011734008789, "global_step": 202199, "epoch": 4814} {"train_loss": -7.357242107391357, "global_step": 202200, "epoch": 4814} {"train_loss": -7.363531112670898, "global_step": 202201, "epoch": 4814} {"train_loss": -7.368100166320801, "global_step": 202202, "epoch": 4814} {"train_loss": -7.332032680511475, "global_step": 202203, "epoch": 4814} {"train_loss": -7.289194107055664, "global_step": 202204, "epoch": 4814} {"train_loss": -7.346229076385498, "global_step": 202205, "epoch": 4814} {"train_loss": -7.285928726196289, "global_step": 202206, "epoch": 4814} {"train_loss": -7.357251167297363, "global_step": 202207, "epoch": 4814} {"train_loss": -7.229084014892578, "global_step": 202208, "epoch": 4814} {"train_loss": -7.249395370483398, "global_step": 202209, "epoch": 4814} {"train_loss": -7.2411041259765625, "global_step": 202210, "epoch": 4814} {"train_loss": -7.187830448150635, "global_step": 202211, "epoch": 4814} {"train_loss": -7.153298377990723, "global_step": 202212, "epoch": 4814} {"train_loss": -7.201766014099121, "global_step": 202213, "epoch": 4814} {"train_loss": -7.24946403503418, "global_step": 202214, "epoch": 4814} {"train_loss": -7.126729488372803, "global_step": 202215, "epoch": 4814} {"train_loss": -7.199275970458984, "global_step": 202216, "epoch": 4814} {"train_loss": -7.150555610656738, "global_step": 202217, "epoch": 4814} {"train_loss": -7.093784332275391, "global_step": 202218, "epoch": 4814} {"train_loss": -7.160358905792236, "global_step": 202219, "epoch": 4814} {"train_loss": -7.2258782386779785, "global_step": 202220, "epoch": 4814} {"train_loss": -6.940255165100098, "global_step": 202221, "epoch": 4814} {"train_loss": -7.2242255210876465, "global_step": 202222, "epoch": 4814} {"train_loss": -6.8588361740112305, "global_step": 202223, "epoch": 4814} {"train_loss": -7.151300430297852, "global_step": 202224, "epoch": 4814} {"train_loss": -7.09869384765625, "global_step": 202225, "epoch": 4814} {"train_loss": -7.05512809753418, "global_step": 202226, "epoch": 4814} {"train_loss": -7.0802388191223145, "global_step": 202227, "epoch": 4814} {"train_loss": -6.971058368682861, "global_step": 202228, "epoch": 4814} {"train_loss": -7.2227798416501, "global_step": 202229, "epoch": 4814, "val_loss": 69107.4609375} {"train_loss": -6.949072360992432, "global_step": 202230, "epoch": 4815} {"train_loss": -6.954220771789551, "global_step": 202231, "epoch": 4815} {"train_loss": -7.020342826843262, "global_step": 202232, "epoch": 4815} {"train_loss": -6.986644268035889, "global_step": 202233, "epoch": 4815} {"train_loss": -6.965192794799805, "global_step": 202234, "epoch": 4815} {"train_loss": -7.002422332763672, "global_step": 202235, "epoch": 4815} {"train_loss": -7.11605167388916, "global_step": 202236, "epoch": 4815} {"train_loss": -6.915572166442871, "global_step": 202237, "epoch": 4815} {"train_loss": -7.136664867401123, "global_step": 202238, "epoch": 4815} {"train_loss": -6.89990234375, "global_step": 202239, "epoch": 4815} {"train_loss": -7.055356025695801, "global_step": 202240, "epoch": 4815} {"train_loss": -7.04287576675415, "global_step": 202241, "epoch": 4815} {"train_loss": -7.155561923980713, "global_step": 202242, "epoch": 4815} {"train_loss": -7.023287296295166, "global_step": 202243, "epoch": 4815} {"train_loss": -7.095213890075684, "global_step": 202244, "epoch": 4815} {"train_loss": -7.182384967803955, "global_step": 202245, "epoch": 4815} {"train_loss": -7.14822244644165, "global_step": 202246, "epoch": 4815} {"train_loss": -7.146666526794434, "global_step": 202247, "epoch": 4815} {"train_loss": -7.122003078460693, "global_step": 202248, "epoch": 4815} {"train_loss": -7.059334754943848, "global_step": 202249, "epoch": 4815} {"train_loss": -7.1721086502075195, "global_step": 202250, "epoch": 4815} {"train_loss": -7.137144565582275, "global_step": 202251, "epoch": 4815} {"train_loss": -7.192634582519531, "global_step": 202252, "epoch": 4815} {"train_loss": -7.090577125549316, "global_step": 202253, "epoch": 4815} {"train_loss": -7.142589569091797, "global_step": 202254, "epoch": 4815} {"train_loss": -7.204309463500977, "global_step": 202255, "epoch": 4815} {"train_loss": -7.188869953155518, "global_step": 202256, "epoch": 4815} {"train_loss": -7.193681240081787, "global_step": 202257, "epoch": 4815} {"train_loss": -7.160915374755859, "global_step": 202258, "epoch": 4815} {"train_loss": -7.149476051330566, "global_step": 202259, "epoch": 4815} {"train_loss": -7.209577560424805, "global_step": 202260, "epoch": 4815} {"train_loss": -7.303058624267578, "global_step": 202261, "epoch": 4815} {"train_loss": -7.24052619934082, "global_step": 202262, "epoch": 4815} {"train_loss": -7.273520469665527, "global_step": 202263, "epoch": 4815} {"train_loss": -7.259403228759766, "global_step": 202264, "epoch": 4815} {"train_loss": -7.211061477661133, "global_step": 202265, "epoch": 4815} {"train_loss": -7.2578654289245605, "global_step": 202266, "epoch": 4815} {"train_loss": -7.243203163146973, "global_step": 202267, "epoch": 4815} {"train_loss": -7.3130292892456055, "global_step": 202268, "epoch": 4815} {"train_loss": -7.295473098754883, "global_step": 202269, "epoch": 4815} {"train_loss": -7.32250452041626, "global_step": 202270, "epoch": 4815} {"train_loss": -7.1386914139702204, "global_step": 202271, "epoch": 4815, "val_loss": 69050.59375} {"train_loss": -7.143584251403809, "global_step": 202272, "epoch": 4816} {"train_loss": -7.3002848625183105, "global_step": 202273, "epoch": 4816} {"train_loss": -7.375703811645508, "global_step": 202274, "epoch": 4816} {"train_loss": -7.428864002227783, "global_step": 202275, "epoch": 4816} {"train_loss": -7.367359161376953, "global_step": 202276, "epoch": 4816} {"train_loss": -7.448204040527344, "global_step": 202277, "epoch": 4816} {"train_loss": -7.40863037109375, "global_step": 202278, "epoch": 4816} {"train_loss": -7.272881507873535, "global_step": 202279, "epoch": 4816} {"train_loss": -7.316420555114746, "global_step": 202280, "epoch": 4816} {"train_loss": -7.35268497467041, "global_step": 202281, "epoch": 4816} {"train_loss": -7.209102630615234, "global_step": 202282, "epoch": 4816} {"train_loss": -7.442531585693359, "global_step": 202283, "epoch": 4816} {"train_loss": -7.234135627746582, "global_step": 202284, "epoch": 4816} {"train_loss": -7.331943511962891, "global_step": 202285, "epoch": 4816} {"train_loss": -7.1980462074279785, "global_step": 202286, "epoch": 4816} {"train_loss": -7.390270233154297, "global_step": 202287, "epoch": 4816} {"train_loss": -7.27756404876709, "global_step": 202288, "epoch": 4816} {"train_loss": -7.334128379821777, "global_step": 202289, "epoch": 4816} {"train_loss": -7.275032997131348, "global_step": 202290, "epoch": 4816} {"train_loss": -7.292230129241943, "global_step": 202291, "epoch": 4816} {"train_loss": -7.369924545288086, "global_step": 202292, "epoch": 4816} {"train_loss": -7.327950954437256, "global_step": 202293, "epoch": 4816} {"train_loss": -7.359884262084961, "global_step": 202294, "epoch": 4816} {"train_loss": -7.29712438583374, "global_step": 202295, "epoch": 4816} {"train_loss": -7.24472713470459, "global_step": 202296, "epoch": 4816} {"train_loss": -7.271520137786865, "global_step": 202297, "epoch": 4816} {"train_loss": -7.210347652435303, "global_step": 202298, "epoch": 4816} {"train_loss": -7.25153112411499, "global_step": 202299, "epoch": 4816} {"train_loss": -7.409761428833008, "global_step": 202300, "epoch": 4816} {"train_loss": -7.2511749267578125, "global_step": 202301, "epoch": 4816} {"train_loss": -7.272902011871338, "global_step": 202302, "epoch": 4816} {"train_loss": -7.244504928588867, "global_step": 202303, "epoch": 4816} {"train_loss": -7.199077606201172, "global_step": 202304, "epoch": 4816} {"train_loss": -7.1866841316223145, "global_step": 202305, "epoch": 4816} {"train_loss": -7.243244647979736, "global_step": 202306, "epoch": 4816} {"train_loss": -7.150549411773682, "global_step": 202307, "epoch": 4816} {"train_loss": -7.0629777908325195, "global_step": 202308, "epoch": 4816} {"train_loss": -7.234263896942139, "global_step": 202309, "epoch": 4816} {"train_loss": -7.215670585632324, "global_step": 202310, "epoch": 4816} {"train_loss": -7.090953826904297, "global_step": 202311, "epoch": 4816} {"train_loss": -7.442417621612549, "global_step": 202312, "epoch": 4816} {"train_loss": -7.28135921841576, "global_step": 202313, "epoch": 4816, "val_loss": 69110.3359375} {"train_loss": -7.310540199279785, "global_step": 202314, "epoch": 4817} {"train_loss": -7.222348213195801, "global_step": 202315, "epoch": 4817} {"train_loss": -7.200570106506348, "global_step": 202316, "epoch": 4817} {"train_loss": -7.394143104553223, "global_step": 202317, "epoch": 4817} {"train_loss": -7.301417350769043, "global_step": 202318, "epoch": 4817} {"train_loss": -7.222505569458008, "global_step": 202319, "epoch": 4817} {"train_loss": -7.298102378845215, "global_step": 202320, "epoch": 4817} {"train_loss": -7.192517280578613, "global_step": 202321, "epoch": 4817} {"train_loss": -7.349862098693848, "global_step": 202322, "epoch": 4817} {"train_loss": -7.3344316482543945, "global_step": 202323, "epoch": 4817} {"train_loss": -7.337355613708496, "global_step": 202324, "epoch": 4817} {"train_loss": -7.27265739440918, "global_step": 202325, "epoch": 4817} {"train_loss": -7.107417583465576, "global_step": 202326, "epoch": 4817} {"train_loss": -7.307379722595215, "global_step": 202327, "epoch": 4817} {"train_loss": -7.271970748901367, "global_step": 202328, "epoch": 4817} {"train_loss": -7.17626953125, "global_step": 202329, "epoch": 4817} {"train_loss": -7.347712993621826, "global_step": 202330, "epoch": 4817} {"train_loss": -7.238086700439453, "global_step": 202331, "epoch": 4817} {"train_loss": -7.171594619750977, "global_step": 202332, "epoch": 4817} {"train_loss": -7.299551486968994, "global_step": 202333, "epoch": 4817} {"train_loss": -7.194291114807129, "global_step": 202334, "epoch": 4817} {"train_loss": -7.281345844268799, "global_step": 202335, "epoch": 4817} {"train_loss": -7.090770721435547, "global_step": 202336, "epoch": 4817} {"train_loss": -7.074826240539551, "global_step": 202337, "epoch": 4817} {"train_loss": -7.26237678527832, "global_step": 202338, "epoch": 4817} {"train_loss": -7.090146064758301, "global_step": 202339, "epoch": 4817} {"train_loss": -7.060176849365234, "global_step": 202340, "epoch": 4817} {"train_loss": -7.151486396789551, "global_step": 202341, "epoch": 4817} {"train_loss": -7.165851593017578, "global_step": 202342, "epoch": 4817} {"train_loss": -7.2582621574401855, "global_step": 202343, "epoch": 4817} {"train_loss": -7.035099029541016, "global_step": 202344, "epoch": 4817} {"train_loss": -7.151402473449707, "global_step": 202345, "epoch": 4817} {"train_loss": -7.183172702789307, "global_step": 202346, "epoch": 4817} {"train_loss": -7.168013095855713, "global_step": 202347, "epoch": 4817} {"train_loss": -7.2123870849609375, "global_step": 202348, "epoch": 4817} {"train_loss": -7.191615104675293, "global_step": 202349, "epoch": 4817} {"train_loss": -7.220818519592285, "global_step": 202350, "epoch": 4817} {"train_loss": -7.069517612457275, "global_step": 202351, "epoch": 4817} {"train_loss": -7.184076309204102, "global_step": 202352, "epoch": 4817} {"train_loss": -7.2905988693237305, "global_step": 202353, "epoch": 4817} {"train_loss": -7.2679619789123535, "global_step": 202354, "epoch": 4817} {"train_loss": -7.219589653469267, "global_step": 202355, "epoch": 4817, "val_loss": 69293.9609375} {"train_loss": -7.196638107299805, "global_step": 202356, "epoch": 4818} {"train_loss": -7.257953643798828, "global_step": 202357, "epoch": 4818} {"train_loss": -7.174076080322266, "global_step": 202358, "epoch": 4818} {"train_loss": -7.1686015129089355, "global_step": 202359, "epoch": 4818} {"train_loss": -7.3482255935668945, "global_step": 202360, "epoch": 4818} {"train_loss": -7.347165584564209, "global_step": 202361, "epoch": 4818} {"train_loss": -7.347652912139893, "global_step": 202362, "epoch": 4818} {"train_loss": -7.154512405395508, "global_step": 202363, "epoch": 4818} {"train_loss": -7.192008972167969, "global_step": 202364, "epoch": 4818} {"train_loss": -7.194689750671387, "global_step": 202365, "epoch": 4818} {"train_loss": -7.327589988708496, "global_step": 202366, "epoch": 4818} {"train_loss": -7.255368232727051, "global_step": 202367, "epoch": 4818} {"train_loss": -7.315300941467285, "global_step": 202368, "epoch": 4818} {"train_loss": -7.28036642074585, "global_step": 202369, "epoch": 4818} {"train_loss": -7.295013427734375, "global_step": 202370, "epoch": 4818} {"train_loss": -7.189364433288574, "global_step": 202371, "epoch": 4818} {"train_loss": -7.273741722106934, "global_step": 202372, "epoch": 4818} {"train_loss": -7.309067726135254, "global_step": 202373, "epoch": 4818} {"train_loss": -7.215214729309082, "global_step": 202374, "epoch": 4818} {"train_loss": -7.326226711273193, "global_step": 202375, "epoch": 4818} {"train_loss": -7.265924453735352, "global_step": 202376, "epoch": 4818} {"train_loss": -7.247551918029785, "global_step": 202377, "epoch": 4818} {"train_loss": -7.200081825256348, "global_step": 202378, "epoch": 4818} {"train_loss": -7.1515398025512695, "global_step": 202379, "epoch": 4818} {"train_loss": -7.27635383605957, "global_step": 202380, "epoch": 4818} {"train_loss": -7.213350772857666, "global_step": 202381, "epoch": 4818} {"train_loss": -7.275054931640625, "global_step": 202382, "epoch": 4818} {"train_loss": -7.238401889801025, "global_step": 202383, "epoch": 4818} {"train_loss": -7.156853675842285, "global_step": 202384, "epoch": 4818} {"train_loss": -7.020511150360107, "global_step": 202385, "epoch": 4818} {"train_loss": -7.237939357757568, "global_step": 202386, "epoch": 4818} {"train_loss": -7.190596580505371, "global_step": 202387, "epoch": 4818} {"train_loss": -7.126702308654785, "global_step": 202388, "epoch": 4818} {"train_loss": -7.367883682250977, "global_step": 202389, "epoch": 4818} {"train_loss": -7.229251861572266, "global_step": 202390, "epoch": 4818} {"train_loss": -7.155237197875977, "global_step": 202391, "epoch": 4818} {"train_loss": -7.293802261352539, "global_step": 202392, "epoch": 4818} {"train_loss": -7.219417095184326, "global_step": 202393, "epoch": 4818} {"train_loss": -7.317069053649902, "global_step": 202394, "epoch": 4818} {"train_loss": -7.249854564666748, "global_step": 202395, "epoch": 4818} {"train_loss": -7.221902847290039, "global_step": 202396, "epoch": 4818} {"train_loss": -7.240257047471546, "global_step": 202397, "epoch": 4818, "val_loss": 69322.3125} {"train_loss": -7.2311530113220215, "global_step": 202398, "epoch": 4819} {"train_loss": -7.357145309448242, "global_step": 202399, "epoch": 4819} {"train_loss": -7.083011627197266, "global_step": 202400, "epoch": 4819} {"train_loss": -7.230574607849121, "global_step": 202401, "epoch": 4819} {"train_loss": -7.23176383972168, "global_step": 202402, "epoch": 4819} {"train_loss": -7.095942974090576, "global_step": 202403, "epoch": 4819} {"train_loss": -7.175383567810059, "global_step": 202404, "epoch": 4819} {"train_loss": -7.207221031188965, "global_step": 202405, "epoch": 4819} {"train_loss": -7.322492599487305, "global_step": 202406, "epoch": 4819} {"train_loss": -7.261180400848389, "global_step": 202407, "epoch": 4819} {"train_loss": -7.2580976486206055, "global_step": 202408, "epoch": 4819} {"train_loss": -7.274641513824463, "global_step": 202409, "epoch": 4819} {"train_loss": -7.072829246520996, "global_step": 202410, "epoch": 4819} {"train_loss": -7.249096870422363, "global_step": 202411, "epoch": 4819} {"train_loss": -7.310467720031738, "global_step": 202412, "epoch": 4819} {"train_loss": -7.285891532897949, "global_step": 202413, "epoch": 4819} {"train_loss": -7.163290500640869, "global_step": 202414, "epoch": 4819} {"train_loss": -7.186480522155762, "global_step": 202415, "epoch": 4819} {"train_loss": -7.254453659057617, "global_step": 202416, "epoch": 4819} {"train_loss": -7.135406494140625, "global_step": 202417, "epoch": 4819} {"train_loss": -7.2286882400512695, "global_step": 202418, "epoch": 4819} {"train_loss": -7.30124568939209, "global_step": 202419, "epoch": 4819} {"train_loss": -7.288918972015381, "global_step": 202420, "epoch": 4819} {"train_loss": -7.325153350830078, "global_step": 202421, "epoch": 4819} {"train_loss": -7.241616249084473, "global_step": 202422, "epoch": 4819} {"train_loss": -7.289610862731934, "global_step": 202423, "epoch": 4819} {"train_loss": -7.319969654083252, "global_step": 202424, "epoch": 4819} {"train_loss": -7.201927185058594, "global_step": 202425, "epoch": 4819} {"train_loss": -7.300961494445801, "global_step": 202426, "epoch": 4819} {"train_loss": -7.219988822937012, "global_step": 202427, "epoch": 4819} {"train_loss": -7.253100872039795, "global_step": 202428, "epoch": 4819} {"train_loss": -7.215766906738281, "global_step": 202429, "epoch": 4819} {"train_loss": -7.224355697631836, "global_step": 202430, "epoch": 4819} {"train_loss": -7.110540390014648, "global_step": 202431, "epoch": 4819} {"train_loss": -7.230037212371826, "global_step": 202432, "epoch": 4819} {"train_loss": -7.0890984535217285, "global_step": 202433, "epoch": 4819} {"train_loss": -7.234652042388916, "global_step": 202434, "epoch": 4819} {"train_loss": -7.18751859664917, "global_step": 202435, "epoch": 4819} {"train_loss": -7.048889636993408, "global_step": 202436, "epoch": 4819} {"train_loss": -7.170642852783203, "global_step": 202437, "epoch": 4819} {"train_loss": -7.182392597198486, "global_step": 202438, "epoch": 4819} {"train_loss": -7.218956322897048, "global_step": 202439, "epoch": 4819, "val_loss": 69184.1875} {"train_loss": -7.230291843414307, "global_step": 202440, "epoch": 4820} {"train_loss": -7.290903091430664, "global_step": 202441, "epoch": 4820} {"train_loss": -7.21550178527832, "global_step": 202442, "epoch": 4820} {"train_loss": -7.266674041748047, "global_step": 202443, "epoch": 4820} {"train_loss": -7.203251838684082, "global_step": 202444, "epoch": 4820} {"train_loss": -7.158655166625977, "global_step": 202445, "epoch": 4820} {"train_loss": -7.230170249938965, "global_step": 202446, "epoch": 4820} {"train_loss": -7.146847724914551, "global_step": 202447, "epoch": 4820} {"train_loss": -7.225822448730469, "global_step": 202448, "epoch": 4820} {"train_loss": -7.1190900802612305, "global_step": 202449, "epoch": 4820} {"train_loss": -7.251127243041992, "global_step": 202450, "epoch": 4820} {"train_loss": -7.15762996673584, "global_step": 202451, "epoch": 4820} {"train_loss": -7.218995094299316, "global_step": 202452, "epoch": 4820} {"train_loss": -7.281106472015381, "global_step": 202453, "epoch": 4820} {"train_loss": -7.220969200134277, "global_step": 202454, "epoch": 4820} {"train_loss": -7.252950668334961, "global_step": 202455, "epoch": 4820} {"train_loss": -7.159398555755615, "global_step": 202456, "epoch": 4820} {"train_loss": -7.250471115112305, "global_step": 202457, "epoch": 4820} {"train_loss": -7.18440055847168, "global_step": 202458, "epoch": 4820} {"train_loss": -7.183317184448242, "global_step": 202459, "epoch": 4820} {"train_loss": -7.191130638122559, "global_step": 202460, "epoch": 4820} {"train_loss": -6.881365776062012, "global_step": 202461, "epoch": 4820} {"train_loss": -7.188473701477051, "global_step": 202462, "epoch": 4820} {"train_loss": -7.301370143890381, "global_step": 202463, "epoch": 4820} {"train_loss": -7.056205749511719, "global_step": 202464, "epoch": 4820} {"train_loss": -7.198167324066162, "global_step": 202465, "epoch": 4820} {"train_loss": -7.112826347351074, "global_step": 202466, "epoch": 4820} {"train_loss": -7.046171188354492, "global_step": 202467, "epoch": 4820} {"train_loss": -7.240947723388672, "global_step": 202468, "epoch": 4820} {"train_loss": -7.100001335144043, "global_step": 202469, "epoch": 4820} {"train_loss": -7.0258989334106445, "global_step": 202470, "epoch": 4820} {"train_loss": -7.158387184143066, "global_step": 202471, "epoch": 4820} {"train_loss": -7.059741020202637, "global_step": 202472, "epoch": 4820} {"train_loss": -7.087320327758789, "global_step": 202473, "epoch": 4820} {"train_loss": -6.957023620605469, "global_step": 202474, "epoch": 4820} {"train_loss": -7.091212272644043, "global_step": 202475, "epoch": 4820} {"train_loss": -7.035881996154785, "global_step": 202476, "epoch": 4820} {"train_loss": -7.2269792556762695, "global_step": 202477, "epoch": 4820} {"train_loss": -7.034357070922852, "global_step": 202478, "epoch": 4820} {"train_loss": -7.186326026916504, "global_step": 202479, "epoch": 4820} {"train_loss": -7.194001197814941, "global_step": 202480, "epoch": 4820} {"train_loss": -7.162358283996582, "global_step": 202481, "epoch": 4820, "val_loss": 69055.90625} {"train_loss": -7.20966911315918, "global_step": 202482, "epoch": 4821} {"train_loss": -7.176281929016113, "global_step": 202483, "epoch": 4821} {"train_loss": -7.160702228546143, "global_step": 202484, "epoch": 4821} {"train_loss": -7.2732954025268555, "global_step": 202485, "epoch": 4821} {"train_loss": -7.178002834320068, "global_step": 202486, "epoch": 4821} {"train_loss": -7.264222145080566, "global_step": 202487, "epoch": 4821} {"train_loss": -7.248909950256348, "global_step": 202488, "epoch": 4821} {"train_loss": -7.2259721755981445, "global_step": 202489, "epoch": 4821} {"train_loss": -7.167252540588379, "global_step": 202490, "epoch": 4821} {"train_loss": -7.247989654541016, "global_step": 202491, "epoch": 4821} {"train_loss": -7.253777503967285, "global_step": 202492, "epoch": 4821} {"train_loss": -7.223182678222656, "global_step": 202493, "epoch": 4821} {"train_loss": -7.294843673706055, "global_step": 202494, "epoch": 4821} {"train_loss": -7.318872451782227, "global_step": 202495, "epoch": 4821} {"train_loss": -7.276701927185059, "global_step": 202496, "epoch": 4821} {"train_loss": -7.2401933670043945, "global_step": 202497, "epoch": 4821} {"train_loss": -7.219635009765625, "global_step": 202498, "epoch": 4821} {"train_loss": -7.253185272216797, "global_step": 202499, "epoch": 4821} {"train_loss": -7.270976543426514, "global_step": 202500, "epoch": 4821} {"train_loss": -7.244557857513428, "global_step": 202501, "epoch": 4821} {"train_loss": -7.230294227600098, "global_step": 202502, "epoch": 4821} {"train_loss": -7.184954643249512, "global_step": 202503, "epoch": 4821} {"train_loss": -7.326988220214844, "global_step": 202504, "epoch": 4821} {"train_loss": -7.238154411315918, "global_step": 202505, "epoch": 4821} {"train_loss": -7.31773567199707, "global_step": 202506, "epoch": 4821} {"train_loss": -7.246718406677246, "global_step": 202507, "epoch": 4821} {"train_loss": -7.2279205322265625, "global_step": 202508, "epoch": 4821} {"train_loss": -7.303201198577881, "global_step": 202509, "epoch": 4821} {"train_loss": -7.339656829833984, "global_step": 202510, "epoch": 4821} {"train_loss": -7.240933895111084, "global_step": 202511, "epoch": 4821} {"train_loss": -7.122472286224365, "global_step": 202512, "epoch": 4821} {"train_loss": -7.161172866821289, "global_step": 202513, "epoch": 4821} {"train_loss": -7.216259479522705, "global_step": 202514, "epoch": 4821} {"train_loss": -7.177967548370361, "global_step": 202515, "epoch": 4821} {"train_loss": -7.30120849609375, "global_step": 202516, "epoch": 4821} {"train_loss": -7.261960029602051, "global_step": 202517, "epoch": 4821} {"train_loss": -7.288552761077881, "global_step": 202518, "epoch": 4821} {"train_loss": -7.367988586425781, "global_step": 202519, "epoch": 4821} {"train_loss": -7.269740104675293, "global_step": 202520, "epoch": 4821} {"train_loss": -7.184436798095703, "global_step": 202521, "epoch": 4821} {"train_loss": -7.21977424621582, "global_step": 202522, "epoch": 4821} {"train_loss": -7.244323685055687, "global_step": 202523, "epoch": 4821, "val_loss": 69075.1640625} {"train_loss": -7.199648857116699, "global_step": 202524, "epoch": 4822} {"train_loss": -7.2016282081604, "global_step": 202525, "epoch": 4822} {"train_loss": -7.203001022338867, "global_step": 202526, "epoch": 4822} {"train_loss": -7.10258674621582, "global_step": 202527, "epoch": 4822} {"train_loss": -7.349732398986816, "global_step": 202528, "epoch": 4822} {"train_loss": -7.267972946166992, "global_step": 202529, "epoch": 4822} {"train_loss": -7.216179370880127, "global_step": 202530, "epoch": 4822} {"train_loss": -7.276236534118652, "global_step": 202531, "epoch": 4822} {"train_loss": -7.036362648010254, "global_step": 202532, "epoch": 4822} {"train_loss": -7.153599739074707, "global_step": 202533, "epoch": 4822} {"train_loss": -7.147697448730469, "global_step": 202534, "epoch": 4822} {"train_loss": -7.097958564758301, "global_step": 202535, "epoch": 4822} {"train_loss": -7.1930389404296875, "global_step": 202536, "epoch": 4822} {"train_loss": -7.107575416564941, "global_step": 202537, "epoch": 4822} {"train_loss": -7.018943786621094, "global_step": 202538, "epoch": 4822} {"train_loss": -7.237852573394775, "global_step": 202539, "epoch": 4822} {"train_loss": -7.04280948638916, "global_step": 202540, "epoch": 4822} {"train_loss": -7.157649040222168, "global_step": 202541, "epoch": 4822} {"train_loss": -7.077247142791748, "global_step": 202542, "epoch": 4822} {"train_loss": -7.106164932250977, "global_step": 202543, "epoch": 4822} {"train_loss": -7.286647796630859, "global_step": 202544, "epoch": 4822} {"train_loss": -6.861701011657715, "global_step": 202545, "epoch": 4822} {"train_loss": -7.21104097366333, "global_step": 202546, "epoch": 4822} {"train_loss": -7.097014427185059, "global_step": 202547, "epoch": 4822} {"train_loss": -7.085501670837402, "global_step": 202548, "epoch": 4822} {"train_loss": -7.1220197677612305, "global_step": 202549, "epoch": 4822} {"train_loss": -7.016148567199707, "global_step": 202550, "epoch": 4822} {"train_loss": -7.018309593200684, "global_step": 202551, "epoch": 4822} {"train_loss": -7.140053749084473, "global_step": 202552, "epoch": 4822} {"train_loss": -7.150904655456543, "global_step": 202553, "epoch": 4822} {"train_loss": -7.119269371032715, "global_step": 202554, "epoch": 4822} {"train_loss": -7.154984474182129, "global_step": 202555, "epoch": 4822} {"train_loss": -7.174836158752441, "global_step": 202556, "epoch": 4822} {"train_loss": -7.119683265686035, "global_step": 202557, "epoch": 4822} {"train_loss": -7.1412034034729, "global_step": 202558, "epoch": 4822} {"train_loss": -7.1913371086120605, "global_step": 202559, "epoch": 4822} {"train_loss": -7.271438121795654, "global_step": 202560, "epoch": 4822} {"train_loss": -7.187331199645996, "global_step": 202561, "epoch": 4822} {"train_loss": -7.280485153198242, "global_step": 202562, "epoch": 4822} {"train_loss": -7.181023597717285, "global_step": 202563, "epoch": 4822} {"train_loss": -7.260962963104248, "global_step": 202564, "epoch": 4822} {"train_loss": -7.156563111713955, "global_step": 202565, "epoch": 4822, "val_loss": 69119.546875} {"train_loss": -7.237561225891113, "global_step": 202566, "epoch": 4823} {"train_loss": -7.300839424133301, "global_step": 202567, "epoch": 4823} {"train_loss": -7.252459526062012, "global_step": 202568, "epoch": 4823} {"train_loss": -7.247597694396973, "global_step": 202569, "epoch": 4823} {"train_loss": -7.248575210571289, "global_step": 202570, "epoch": 4823} {"train_loss": -7.260241508483887, "global_step": 202571, "epoch": 4823} {"train_loss": -7.275140762329102, "global_step": 202572, "epoch": 4823} {"train_loss": -7.269894599914551, "global_step": 202573, "epoch": 4823} {"train_loss": -7.340917587280273, "global_step": 202574, "epoch": 4823} {"train_loss": -7.398489952087402, "global_step": 202575, "epoch": 4823} {"train_loss": -7.249712944030762, "global_step": 202576, "epoch": 4823} {"train_loss": -7.215503692626953, "global_step": 202577, "epoch": 4823} {"train_loss": -7.336855888366699, "global_step": 202578, "epoch": 4823} {"train_loss": -7.267083644866943, "global_step": 202579, "epoch": 4823} {"train_loss": -7.244140625, "global_step": 202580, "epoch": 4823} {"train_loss": -7.227983474731445, "global_step": 202581, "epoch": 4823} {"train_loss": -7.205158233642578, "global_step": 202582, "epoch": 4823} {"train_loss": -7.199878692626953, "global_step": 202583, "epoch": 4823} {"train_loss": -7.290337085723877, "global_step": 202584, "epoch": 4823} {"train_loss": -7.366596221923828, "global_step": 202585, "epoch": 4823} {"train_loss": -7.100921630859375, "global_step": 202586, "epoch": 4823} {"train_loss": -7.272304058074951, "global_step": 202587, "epoch": 4823} {"train_loss": -7.3381829261779785, "global_step": 202588, "epoch": 4823} {"train_loss": -7.333420753479004, "global_step": 202589, "epoch": 4823} {"train_loss": -7.333739280700684, "global_step": 202590, "epoch": 4823} {"train_loss": -7.355210781097412, "global_step": 202591, "epoch": 4823} {"train_loss": -7.288705348968506, "global_step": 202592, "epoch": 4823} {"train_loss": -7.262940883636475, "global_step": 202593, "epoch": 4823} {"train_loss": -7.291357040405273, "global_step": 202594, "epoch": 4823} {"train_loss": -7.320694923400879, "global_step": 202595, "epoch": 4823} {"train_loss": -7.364786148071289, "global_step": 202596, "epoch": 4823} {"train_loss": -7.217411518096924, "global_step": 202597, "epoch": 4823} {"train_loss": -7.339674949645996, "global_step": 202598, "epoch": 4823} {"train_loss": -7.278368949890137, "global_step": 202599, "epoch": 4823} {"train_loss": -7.172869682312012, "global_step": 202600, "epoch": 4823} {"train_loss": -7.266432762145996, "global_step": 202601, "epoch": 4823} {"train_loss": -7.340500831604004, "global_step": 202602, "epoch": 4823} {"train_loss": -7.2456865310668945, "global_step": 202603, "epoch": 4823} {"train_loss": -7.2940874099731445, "global_step": 202604, "epoch": 4823} {"train_loss": -7.128299236297607, "global_step": 202605, "epoch": 4823} {"train_loss": -7.267218589782715, "global_step": 202606, "epoch": 4823} {"train_loss": -7.274502879097348, "global_step": 202607, "epoch": 4823, "val_loss": 69098.921875} {"train_loss": -7.396208763122559, "global_step": 202608, "epoch": 4824} {"train_loss": -7.143979072570801, "global_step": 202609, "epoch": 4824} {"train_loss": -7.29494571685791, "global_step": 202610, "epoch": 4824} {"train_loss": -7.220244407653809, "global_step": 202611, "epoch": 4824} {"train_loss": -7.220707416534424, "global_step": 202612, "epoch": 4824} {"train_loss": -7.330418586730957, "global_step": 202613, "epoch": 4824} {"train_loss": -7.22783088684082, "global_step": 202614, "epoch": 4824} {"train_loss": -7.23783540725708, "global_step": 202615, "epoch": 4824} {"train_loss": -7.276830673217773, "global_step": 202616, "epoch": 4824} {"train_loss": -7.260435104370117, "global_step": 202617, "epoch": 4824} {"train_loss": -7.252697944641113, "global_step": 202618, "epoch": 4824} {"train_loss": -7.2287702560424805, "global_step": 202619, "epoch": 4824} {"train_loss": -7.296026229858398, "global_step": 202620, "epoch": 4824} {"train_loss": -7.335848331451416, "global_step": 202621, "epoch": 4824} {"train_loss": -7.266383647918701, "global_step": 202622, "epoch": 4824} {"train_loss": -7.270158767700195, "global_step": 202623, "epoch": 4824} {"train_loss": -7.211350917816162, "global_step": 202624, "epoch": 4824} {"train_loss": -7.254842758178711, "global_step": 202625, "epoch": 4824} {"train_loss": -7.259765625, "global_step": 202626, "epoch": 4824} {"train_loss": -7.1797590255737305, "global_step": 202627, "epoch": 4824} {"train_loss": -7.167045593261719, "global_step": 202628, "epoch": 4824} {"train_loss": -7.265615463256836, "global_step": 202629, "epoch": 4824} {"train_loss": -7.177162170410156, "global_step": 202630, "epoch": 4824} {"train_loss": -7.2706732749938965, "global_step": 202631, "epoch": 4824} {"train_loss": -7.2576470375061035, "global_step": 202632, "epoch": 4824} {"train_loss": -7.274560928344727, "global_step": 202633, "epoch": 4824} {"train_loss": -7.103735446929932, "global_step": 202634, "epoch": 4824} {"train_loss": -7.26793098449707, "global_step": 202635, "epoch": 4824} {"train_loss": -7.160183906555176, "global_step": 202636, "epoch": 4824} {"train_loss": -7.344610214233398, "global_step": 202637, "epoch": 4824} {"train_loss": -7.256075382232666, "global_step": 202638, "epoch": 4824} {"train_loss": -7.223369121551514, "global_step": 202639, "epoch": 4824} {"train_loss": -7.3078508377075195, "global_step": 202640, "epoch": 4824} {"train_loss": -7.253629207611084, "global_step": 202641, "epoch": 4824} {"train_loss": -7.191289901733398, "global_step": 202642, "epoch": 4824} {"train_loss": -7.275864601135254, "global_step": 202643, "epoch": 4824} {"train_loss": -7.323162078857422, "global_step": 202644, "epoch": 4824} {"train_loss": -7.194117546081543, "global_step": 202645, "epoch": 4824} {"train_loss": -7.325947284698486, "global_step": 202646, "epoch": 4824} {"train_loss": -7.278990745544434, "global_step": 202647, "epoch": 4824} {"train_loss": -7.10170841217041, "global_step": 202648, "epoch": 4824} {"train_loss": -7.249657142729986, "global_step": 202649, "epoch": 4824, "val_loss": 69096.4453125} {"train_loss": -7.331933975219727, "global_step": 202650, "epoch": 4825} {"train_loss": -7.2091193199157715, "global_step": 202651, "epoch": 4825} {"train_loss": -7.251918315887451, "global_step": 202652, "epoch": 4825} {"train_loss": -7.337495803833008, "global_step": 202653, "epoch": 4825} {"train_loss": -7.25713586807251, "global_step": 202654, "epoch": 4825} {"train_loss": -7.26300048828125, "global_step": 202655, "epoch": 4825} {"train_loss": -7.201328277587891, "global_step": 202656, "epoch": 4825} {"train_loss": -7.240427017211914, "global_step": 202657, "epoch": 4825} {"train_loss": -7.216544151306152, "global_step": 202658, "epoch": 4825} {"train_loss": -7.248955726623535, "global_step": 202659, "epoch": 4825} {"train_loss": -7.26043701171875, "global_step": 202660, "epoch": 4825} {"train_loss": -7.2488861083984375, "global_step": 202661, "epoch": 4825} {"train_loss": -7.0979766845703125, "global_step": 202662, "epoch": 4825} {"train_loss": -7.207521438598633, "global_step": 202663, "epoch": 4825} {"train_loss": -7.232693195343018, "global_step": 202664, "epoch": 4825} {"train_loss": -7.110438346862793, "global_step": 202665, "epoch": 4825} {"train_loss": -7.2343244552612305, "global_step": 202666, "epoch": 4825} {"train_loss": -7.133233547210693, "global_step": 202667, "epoch": 4825} {"train_loss": -7.206231117248535, "global_step": 202668, "epoch": 4825} {"train_loss": -7.142889976501465, "global_step": 202669, "epoch": 4825} {"train_loss": -7.326275825500488, "global_step": 202670, "epoch": 4825} {"train_loss": -7.304883003234863, "global_step": 202671, "epoch": 4825} {"train_loss": -7.138866424560547, "global_step": 202672, "epoch": 4825} {"train_loss": -7.154626369476318, "global_step": 202673, "epoch": 4825} {"train_loss": -7.2706298828125, "global_step": 202674, "epoch": 4825} {"train_loss": -6.998981475830078, "global_step": 202675, "epoch": 4825} {"train_loss": -7.260684490203857, "global_step": 202676, "epoch": 4825} {"train_loss": -6.967360973358154, "global_step": 202677, "epoch": 4825} {"train_loss": -7.168173313140869, "global_step": 202678, "epoch": 4825} {"train_loss": -7.122051239013672, "global_step": 202679, "epoch": 4825} {"train_loss": -7.127660751342773, "global_step": 202680, "epoch": 4825} {"train_loss": -6.980403423309326, "global_step": 202681, "epoch": 4825} {"train_loss": -7.072432041168213, "global_step": 202682, "epoch": 4825} {"train_loss": -7.016025543212891, "global_step": 202683, "epoch": 4825} {"train_loss": -6.960144996643066, "global_step": 202684, "epoch": 4825} {"train_loss": -7.084548473358154, "global_step": 202685, "epoch": 4825} {"train_loss": -6.924821853637695, "global_step": 202686, "epoch": 4825} {"train_loss": -7.118411540985107, "global_step": 202687, "epoch": 4825} {"train_loss": -6.94066047668457, "global_step": 202688, "epoch": 4825} {"train_loss": -7.1853508949279785, "global_step": 202689, "epoch": 4825} {"train_loss": -7.111428260803223, "global_step": 202690, "epoch": 4825} {"train_loss": -7.1603788648332864, "global_step": 202691, "epoch": 4825, "val_loss": 69204.703125} {"train_loss": -7.200049877166748, "global_step": 202692, "epoch": 4826} {"train_loss": -7.190305709838867, "global_step": 202693, "epoch": 4826} {"train_loss": -7.173425674438477, "global_step": 202694, "epoch": 4826} {"train_loss": -7.091383457183838, "global_step": 202695, "epoch": 4826} {"train_loss": -7.050394535064697, "global_step": 202696, "epoch": 4826} {"train_loss": -7.1126251220703125, "global_step": 202697, "epoch": 4826} {"train_loss": -7.213324069976807, "global_step": 202698, "epoch": 4826} {"train_loss": -7.057055473327637, "global_step": 202699, "epoch": 4826} {"train_loss": -7.093083381652832, "global_step": 202700, "epoch": 4826} {"train_loss": -7.181210041046143, "global_step": 202701, "epoch": 4826} {"train_loss": -7.117053031921387, "global_step": 202702, "epoch": 4826} {"train_loss": -7.120731353759766, "global_step": 202703, "epoch": 4826} {"train_loss": -7.1930341720581055, "global_step": 202704, "epoch": 4826} {"train_loss": -7.1500163078308105, "global_step": 202705, "epoch": 4826} {"train_loss": -7.246387481689453, "global_step": 202706, "epoch": 4826} {"train_loss": -7.258051872253418, "global_step": 202707, "epoch": 4826} {"train_loss": -7.304163455963135, "global_step": 202708, "epoch": 4826} {"train_loss": -7.150667667388916, "global_step": 202709, "epoch": 4826} {"train_loss": -7.306435585021973, "global_step": 202710, "epoch": 4826} {"train_loss": -7.2018208503723145, "global_step": 202711, "epoch": 4826} {"train_loss": -7.23675537109375, "global_step": 202712, "epoch": 4826} {"train_loss": -7.319950103759766, "global_step": 202713, "epoch": 4826} {"train_loss": -7.283956527709961, "global_step": 202714, "epoch": 4826} {"train_loss": -7.291454315185547, "global_step": 202715, "epoch": 4826} {"train_loss": -7.31574821472168, "global_step": 202716, "epoch": 4826} {"train_loss": -7.337673187255859, "global_step": 202717, "epoch": 4826} {"train_loss": -7.285735130310059, "global_step": 202718, "epoch": 4826} {"train_loss": -7.325581073760986, "global_step": 202719, "epoch": 4826} {"train_loss": -7.346253871917725, "global_step": 202720, "epoch": 4826} {"train_loss": -7.332464218139648, "global_step": 202721, "epoch": 4826} {"train_loss": -7.388275146484375, "global_step": 202722, "epoch": 4826} {"train_loss": -7.318737030029297, "global_step": 202723, "epoch": 4826} {"train_loss": -7.351130485534668, "global_step": 202724, "epoch": 4826} {"train_loss": -7.212603569030762, "global_step": 202725, "epoch": 4826} {"train_loss": -7.314094543457031, "global_step": 202726, "epoch": 4826} {"train_loss": -7.264138698577881, "global_step": 202727, "epoch": 4826} {"train_loss": -7.14433479309082, "global_step": 202728, "epoch": 4826} {"train_loss": -7.319983005523682, "global_step": 202729, "epoch": 4826} {"train_loss": -7.248045921325684, "global_step": 202730, "epoch": 4826} {"train_loss": -7.4295172691345215, "global_step": 202731, "epoch": 4826} {"train_loss": -7.255855560302734, "global_step": 202732, "epoch": 4826} {"train_loss": -7.238218670799618, "global_step": 202733, "epoch": 4826, "val_loss": 69090.9921875} {"train_loss": -7.369609832763672, "global_step": 202734, "epoch": 4827} {"train_loss": -7.166156768798828, "global_step": 202735, "epoch": 4827} {"train_loss": -7.276522159576416, "global_step": 202736, "epoch": 4827} {"train_loss": -7.123660564422607, "global_step": 202737, "epoch": 4827} {"train_loss": -7.249278545379639, "global_step": 202738, "epoch": 4827} {"train_loss": -7.334203720092773, "global_step": 202739, "epoch": 4827} {"train_loss": -7.138444900512695, "global_step": 202740, "epoch": 4827} {"train_loss": -7.081360816955566, "global_step": 202741, "epoch": 4827} {"train_loss": -7.324701309204102, "global_step": 202742, "epoch": 4827} {"train_loss": -7.153997421264648, "global_step": 202743, "epoch": 4827} {"train_loss": -7.231063365936279, "global_step": 202744, "epoch": 4827} {"train_loss": -7.127505779266357, "global_step": 202745, "epoch": 4827} {"train_loss": -7.201622009277344, "global_step": 202746, "epoch": 4827} {"train_loss": -7.257253170013428, "global_step": 202747, "epoch": 4827} {"train_loss": -7.2257585525512695, "global_step": 202748, "epoch": 4827} {"train_loss": -7.139219284057617, "global_step": 202749, "epoch": 4827} {"train_loss": -7.217157363891602, "global_step": 202750, "epoch": 4827} {"train_loss": -7.26814079284668, "global_step": 202751, "epoch": 4827} {"train_loss": -7.254626274108887, "global_step": 202752, "epoch": 4827} {"train_loss": -7.242462158203125, "global_step": 202753, "epoch": 4827} {"train_loss": -7.333340644836426, "global_step": 202754, "epoch": 4827} {"train_loss": -7.187904357910156, "global_step": 202755, "epoch": 4827} {"train_loss": -7.232348442077637, "global_step": 202756, "epoch": 4827} {"train_loss": -7.215610980987549, "global_step": 202757, "epoch": 4827} {"train_loss": -7.192078590393066, "global_step": 202758, "epoch": 4827} {"train_loss": -7.285267353057861, "global_step": 202759, "epoch": 4827} {"train_loss": -7.145315170288086, "global_step": 202760, "epoch": 4827} {"train_loss": -7.228488922119141, "global_step": 202761, "epoch": 4827} {"train_loss": -7.184769630432129, "global_step": 202762, "epoch": 4827} {"train_loss": -7.161303520202637, "global_step": 202763, "epoch": 4827} {"train_loss": -7.234376907348633, "global_step": 202764, "epoch": 4827} {"train_loss": -7.274788856506348, "global_step": 202765, "epoch": 4827} {"train_loss": -7.279699802398682, "global_step": 202766, "epoch": 4827} {"train_loss": -7.25053596496582, "global_step": 202767, "epoch": 4827} {"train_loss": -7.1635332107543945, "global_step": 202768, "epoch": 4827} {"train_loss": -7.114339828491211, "global_step": 202769, "epoch": 4827} {"train_loss": -7.128964424133301, "global_step": 202770, "epoch": 4827} {"train_loss": -7.24357795715332, "global_step": 202771, "epoch": 4827} {"train_loss": -7.2750983238220215, "global_step": 202772, "epoch": 4827} {"train_loss": -7.321188926696777, "global_step": 202773, "epoch": 4827} {"train_loss": -7.214488983154297, "global_step": 202774, "epoch": 4827} {"train_loss": -7.2218574569338845, "global_step": 202775, "epoch": 4827, "val_loss": 68876.859375} {"train_loss": -7.2655720710754395, "global_step": 202776, "epoch": 4828} {"train_loss": -7.2098774909973145, "global_step": 202777, "epoch": 4828} {"train_loss": -7.254279136657715, "global_step": 202778, "epoch": 4828} {"train_loss": -7.350780487060547, "global_step": 202779, "epoch": 4828} {"train_loss": -7.1949663162231445, "global_step": 202780, "epoch": 4828} {"train_loss": -7.242362022399902, "global_step": 202781, "epoch": 4828} {"train_loss": -7.20729398727417, "global_step": 202782, "epoch": 4828} {"train_loss": -7.212198257446289, "global_step": 202783, "epoch": 4828} {"train_loss": -7.1821184158325195, "global_step": 202784, "epoch": 4828} {"train_loss": -7.1948137283325195, "global_step": 202785, "epoch": 4828} {"train_loss": -7.281262397766113, "global_step": 202786, "epoch": 4828} {"train_loss": -7.123576641082764, "global_step": 202787, "epoch": 4828} {"train_loss": -7.3066558837890625, "global_step": 202788, "epoch": 4828} {"train_loss": -7.262691974639893, "global_step": 202789, "epoch": 4828} {"train_loss": -7.231977939605713, "global_step": 202790, "epoch": 4828} {"train_loss": -7.285848140716553, "global_step": 202791, "epoch": 4828} {"train_loss": -7.176522254943848, "global_step": 202792, "epoch": 4828} {"train_loss": -7.260315895080566, "global_step": 202793, "epoch": 4828} {"train_loss": -7.327535152435303, "global_step": 202794, "epoch": 4828} {"train_loss": -7.1641950607299805, "global_step": 202795, "epoch": 4828} {"train_loss": -7.244068145751953, "global_step": 202796, "epoch": 4828} {"train_loss": -7.316481590270996, "global_step": 202797, "epoch": 4828} {"train_loss": -7.221889019012451, "global_step": 202798, "epoch": 4828} {"train_loss": -7.37389612197876, "global_step": 202799, "epoch": 4828} {"train_loss": -7.371894836425781, "global_step": 202800, "epoch": 4828} {"train_loss": -7.271035194396973, "global_step": 202801, "epoch": 4828} {"train_loss": -7.438857078552246, "global_step": 202802, "epoch": 4828} {"train_loss": -7.2396955490112305, "global_step": 202803, "epoch": 4828} {"train_loss": -7.3638129234313965, "global_step": 202804, "epoch": 4828} {"train_loss": -7.292511940002441, "global_step": 202805, "epoch": 4828} {"train_loss": -7.2201828956604, "global_step": 202806, "epoch": 4828} {"train_loss": -7.329800605773926, "global_step": 202807, "epoch": 4828} {"train_loss": -7.25869083404541, "global_step": 202808, "epoch": 4828} {"train_loss": -7.27141809463501, "global_step": 202809, "epoch": 4828} {"train_loss": -7.334725379943848, "global_step": 202810, "epoch": 4828} {"train_loss": -7.393784999847412, "global_step": 202811, "epoch": 4828} {"train_loss": -7.279686450958252, "global_step": 202812, "epoch": 4828} {"train_loss": -7.301872253417969, "global_step": 202813, "epoch": 4828} {"train_loss": -7.313882350921631, "global_step": 202814, "epoch": 4828} {"train_loss": -7.2250213623046875, "global_step": 202815, "epoch": 4828} {"train_loss": -7.278569221496582, "global_step": 202816, "epoch": 4828} {"train_loss": -7.269643306732178, "global_step": 202817, "epoch": 4828, "val_loss": 69057.984375} {"train_loss": -7.342477798461914, "global_step": 202818, "epoch": 4829} {"train_loss": -7.143639087677002, "global_step": 202819, "epoch": 4829} {"train_loss": -7.29979133605957, "global_step": 202820, "epoch": 4829} {"train_loss": -7.291571617126465, "global_step": 202821, "epoch": 4829} {"train_loss": -7.156789779663086, "global_step": 202822, "epoch": 4829} {"train_loss": -7.097883224487305, "global_step": 202823, "epoch": 4829} {"train_loss": -7.309096336364746, "global_step": 202824, "epoch": 4829} {"train_loss": -7.140887260437012, "global_step": 202825, "epoch": 4829} {"train_loss": -7.108342170715332, "global_step": 202826, "epoch": 4829} {"train_loss": -7.1872944831848145, "global_step": 202827, "epoch": 4829} {"train_loss": -7.178369522094727, "global_step": 202828, "epoch": 4829} {"train_loss": -7.333011150360107, "global_step": 202829, "epoch": 4829} {"train_loss": -7.1966094970703125, "global_step": 202830, "epoch": 4829} {"train_loss": -7.1379780769348145, "global_step": 202831, "epoch": 4829} {"train_loss": -7.139814376831055, "global_step": 202832, "epoch": 4829} {"train_loss": -7.134489059448242, "global_step": 202833, "epoch": 4829} {"train_loss": -7.19598913192749, "global_step": 202834, "epoch": 4829} {"train_loss": -7.247302055358887, "global_step": 202835, "epoch": 4829} {"train_loss": -7.214404582977295, "global_step": 202836, "epoch": 4829} {"train_loss": -7.322168350219727, "global_step": 202837, "epoch": 4829} {"train_loss": -7.233890533447266, "global_step": 202838, "epoch": 4829} {"train_loss": -7.253479957580566, "global_step": 202839, "epoch": 4829} {"train_loss": -7.344060897827148, "global_step": 202840, "epoch": 4829} {"train_loss": -7.224532127380371, "global_step": 202841, "epoch": 4829} {"train_loss": -7.2535552978515625, "global_step": 202842, "epoch": 4829} {"train_loss": -7.175779342651367, "global_step": 202843, "epoch": 4829} {"train_loss": -7.268499851226807, "global_step": 202844, "epoch": 4829} {"train_loss": -7.270986080169678, "global_step": 202845, "epoch": 4829} {"train_loss": -7.031949996948242, "global_step": 202846, "epoch": 4829} {"train_loss": -7.312939643859863, "global_step": 202847, "epoch": 4829} {"train_loss": -7.08353328704834, "global_step": 202848, "epoch": 4829} {"train_loss": -7.139524936676025, "global_step": 202849, "epoch": 4829} {"train_loss": -7.102884292602539, "global_step": 202850, "epoch": 4829} {"train_loss": -6.969321250915527, "global_step": 202851, "epoch": 4829} {"train_loss": -7.219366073608398, "global_step": 202852, "epoch": 4829} {"train_loss": -7.158926963806152, "global_step": 202853, "epoch": 4829} {"train_loss": -7.000094413757324, "global_step": 202854, "epoch": 4829} {"train_loss": -7.1687140464782715, "global_step": 202855, "epoch": 4829} {"train_loss": -7.075863838195801, "global_step": 202856, "epoch": 4829} {"train_loss": -7.064300537109375, "global_step": 202857, "epoch": 4829} {"train_loss": -6.934319972991943, "global_step": 202858, "epoch": 4829} {"train_loss": -7.18020156451634, "global_step": 202859, "epoch": 4829, "val_loss": 69219.984375} {"train_loss": -7.2036895751953125, "global_step": 202860, "epoch": 4830} {"train_loss": -7.196906089782715, "global_step": 202861, "epoch": 4830} {"train_loss": -7.182271957397461, "global_step": 202862, "epoch": 4830} {"train_loss": -7.277853012084961, "global_step": 202863, "epoch": 4830} {"train_loss": -7.141367435455322, "global_step": 202864, "epoch": 4830} {"train_loss": -7.189239025115967, "global_step": 202865, "epoch": 4830} {"train_loss": -7.172562599182129, "global_step": 202866, "epoch": 4830} {"train_loss": -7.139948844909668, "global_step": 202867, "epoch": 4830} {"train_loss": -7.259709358215332, "global_step": 202868, "epoch": 4830} {"train_loss": -7.1152753829956055, "global_step": 202869, "epoch": 4830} {"train_loss": -7.216866970062256, "global_step": 202870, "epoch": 4830} {"train_loss": -7.183358669281006, "global_step": 202871, "epoch": 4830} {"train_loss": -7.093061447143555, "global_step": 202872, "epoch": 4830} {"train_loss": -7.182204246520996, "global_step": 202873, "epoch": 4830} {"train_loss": -7.075825214385986, "global_step": 202874, "epoch": 4830} {"train_loss": -7.300223350524902, "global_step": 202875, "epoch": 4830} {"train_loss": -7.038702487945557, "global_step": 202876, "epoch": 4830} {"train_loss": -7.158681392669678, "global_step": 202877, "epoch": 4830} {"train_loss": -7.191120147705078, "global_step": 202878, "epoch": 4830} {"train_loss": -7.209141731262207, "global_step": 202879, "epoch": 4830} {"train_loss": -7.146709442138672, "global_step": 202880, "epoch": 4830} {"train_loss": -7.244358539581299, "global_step": 202881, "epoch": 4830} {"train_loss": -7.203204154968262, "global_step": 202882, "epoch": 4830} {"train_loss": -7.239772796630859, "global_step": 202883, "epoch": 4830} {"train_loss": -7.318404197692871, "global_step": 202884, "epoch": 4830} {"train_loss": -7.201406955718994, "global_step": 202885, "epoch": 4830} {"train_loss": -7.313093185424805, "global_step": 202886, "epoch": 4830} {"train_loss": -7.06598424911499, "global_step": 202887, "epoch": 4830} {"train_loss": -7.157524108886719, "global_step": 202888, "epoch": 4830} {"train_loss": -7.32166862487793, "global_step": 202889, "epoch": 4830} {"train_loss": -7.133410453796387, "global_step": 202890, "epoch": 4830} {"train_loss": -7.272738456726074, "global_step": 202891, "epoch": 4830} {"train_loss": -7.221435546875, "global_step": 202892, "epoch": 4830} {"train_loss": -7.282398223876953, "global_step": 202893, "epoch": 4830} {"train_loss": -7.280177116394043, "global_step": 202894, "epoch": 4830} {"train_loss": -7.306838035583496, "global_step": 202895, "epoch": 4830} {"train_loss": -7.298089981079102, "global_step": 202896, "epoch": 4830} {"train_loss": -7.272300720214844, "global_step": 202897, "epoch": 4830} {"train_loss": -7.1219892501831055, "global_step": 202898, "epoch": 4830} {"train_loss": -7.3167033195495605, "global_step": 202899, "epoch": 4830} {"train_loss": -7.144259452819824, "global_step": 202900, "epoch": 4830} {"train_loss": -7.20575567654201, "global_step": 202901, "epoch": 4830, "val_loss": 69325.53125} {"train_loss": -7.2985429763793945, "global_step": 202902, "epoch": 4831} {"train_loss": -7.143903732299805, "global_step": 202903, "epoch": 4831} {"train_loss": -7.374597549438477, "global_step": 202904, "epoch": 4831} {"train_loss": -7.288387298583984, "global_step": 202905, "epoch": 4831} {"train_loss": -7.31254768371582, "global_step": 202906, "epoch": 4831} {"train_loss": -7.360257148742676, "global_step": 202907, "epoch": 4831} {"train_loss": -7.368436813354492, "global_step": 202908, "epoch": 4831} {"train_loss": -7.317919731140137, "global_step": 202909, "epoch": 4831} {"train_loss": -7.262657165527344, "global_step": 202910, "epoch": 4831} {"train_loss": -7.252293586730957, "global_step": 202911, "epoch": 4831} {"train_loss": -7.283146381378174, "global_step": 202912, "epoch": 4831} {"train_loss": -7.315085411071777, "global_step": 202913, "epoch": 4831} {"train_loss": -7.25799036026001, "global_step": 202914, "epoch": 4831} {"train_loss": -7.305082321166992, "global_step": 202915, "epoch": 4831} {"train_loss": -7.309318542480469, "global_step": 202916, "epoch": 4831} {"train_loss": -7.359248161315918, "global_step": 202917, "epoch": 4831} {"train_loss": -7.364320755004883, "global_step": 202918, "epoch": 4831} {"train_loss": -7.260647773742676, "global_step": 202919, "epoch": 4831} {"train_loss": -7.303129196166992, "global_step": 202920, "epoch": 4831} {"train_loss": -7.168652534484863, "global_step": 202921, "epoch": 4831} {"train_loss": -7.2538347244262695, "global_step": 202922, "epoch": 4831} {"train_loss": -7.1632609367370605, "global_step": 202923, "epoch": 4831} {"train_loss": -7.3356218338012695, "global_step": 202924, "epoch": 4831} {"train_loss": -7.141808986663818, "global_step": 202925, "epoch": 4831} {"train_loss": -7.222342014312744, "global_step": 202926, "epoch": 4831} {"train_loss": -7.2255401611328125, "global_step": 202927, "epoch": 4831} {"train_loss": -7.145661354064941, "global_step": 202928, "epoch": 4831} {"train_loss": -7.2617878913879395, "global_step": 202929, "epoch": 4831} {"train_loss": -7.240180015563965, "global_step": 202930, "epoch": 4831} {"train_loss": -7.229470252990723, "global_step": 202931, "epoch": 4831} {"train_loss": -7.234002113342285, "global_step": 202932, "epoch": 4831} {"train_loss": -7.161061763763428, "global_step": 202933, "epoch": 4831} {"train_loss": -7.216549873352051, "global_step": 202934, "epoch": 4831} {"train_loss": -7.167563438415527, "global_step": 202935, "epoch": 4831} {"train_loss": -7.330352783203125, "global_step": 202936, "epoch": 4831} {"train_loss": -7.034733772277832, "global_step": 202937, "epoch": 4831} {"train_loss": -7.248648166656494, "global_step": 202938, "epoch": 4831} {"train_loss": -7.2757768630981445, "global_step": 202939, "epoch": 4831} {"train_loss": -7.207690238952637, "global_step": 202940, "epoch": 4831} {"train_loss": -7.254383087158203, "global_step": 202941, "epoch": 4831} {"train_loss": -7.226398468017578, "global_step": 202942, "epoch": 4831} {"train_loss": -7.25528639838809, "global_step": 202943, "epoch": 4831, "val_loss": 69202.7578125} {"train_loss": -7.134680271148682, "global_step": 202944, "epoch": 4832} {"train_loss": -7.224084854125977, "global_step": 202945, "epoch": 4832} {"train_loss": -7.289291858673096, "global_step": 202946, "epoch": 4832} {"train_loss": -7.019278526306152, "global_step": 202947, "epoch": 4832} {"train_loss": -7.29679536819458, "global_step": 202948, "epoch": 4832} {"train_loss": -7.193271636962891, "global_step": 202949, "epoch": 4832} {"train_loss": -7.164224624633789, "global_step": 202950, "epoch": 4832} {"train_loss": -7.252739429473877, "global_step": 202951, "epoch": 4832} {"train_loss": -7.183981418609619, "global_step": 202952, "epoch": 4832} {"train_loss": -7.4141669273376465, "global_step": 202953, "epoch": 4832} {"train_loss": -7.195009708404541, "global_step": 202954, "epoch": 4832} {"train_loss": -7.154682636260986, "global_step": 202955, "epoch": 4832} {"train_loss": -7.31031608581543, "global_step": 202956, "epoch": 4832} {"train_loss": -7.295782089233398, "global_step": 202957, "epoch": 4832} {"train_loss": -7.263657093048096, "global_step": 202958, "epoch": 4832} {"train_loss": -7.249064922332764, "global_step": 202959, "epoch": 4832} {"train_loss": -7.385591506958008, "global_step": 202960, "epoch": 4832} {"train_loss": -7.217617034912109, "global_step": 202961, "epoch": 4832} {"train_loss": -7.256067276000977, "global_step": 202962, "epoch": 4832} {"train_loss": -7.317189693450928, "global_step": 202963, "epoch": 4832} {"train_loss": -7.2996506690979, "global_step": 202964, "epoch": 4832} {"train_loss": -7.151477813720703, "global_step": 202965, "epoch": 4832} {"train_loss": -7.317586898803711, "global_step": 202966, "epoch": 4832} {"train_loss": -7.373856544494629, "global_step": 202967, "epoch": 4832} {"train_loss": -7.20632266998291, "global_step": 202968, "epoch": 4832} {"train_loss": -7.185890197753906, "global_step": 202969, "epoch": 4832} {"train_loss": -7.297534942626953, "global_step": 202970, "epoch": 4832} {"train_loss": -7.218374252319336, "global_step": 202971, "epoch": 4832} {"train_loss": -7.060225486755371, "global_step": 202972, "epoch": 4832} {"train_loss": -7.318260669708252, "global_step": 202973, "epoch": 4832} {"train_loss": -7.160397052764893, "global_step": 202974, "epoch": 4832} {"train_loss": -7.1588287353515625, "global_step": 202975, "epoch": 4832} {"train_loss": -7.148284912109375, "global_step": 202976, "epoch": 4832} {"train_loss": -7.165310859680176, "global_step": 202977, "epoch": 4832} {"train_loss": -7.235867500305176, "global_step": 202978, "epoch": 4832} {"train_loss": -7.207355499267578, "global_step": 202979, "epoch": 4832} {"train_loss": -7.267632961273193, "global_step": 202980, "epoch": 4832} {"train_loss": -7.217360973358154, "global_step": 202981, "epoch": 4832} {"train_loss": -7.119504451751709, "global_step": 202982, "epoch": 4832} {"train_loss": -7.187723159790039, "global_step": 202983, "epoch": 4832} {"train_loss": -7.1734418869018555, "global_step": 202984, "epoch": 4832} {"train_loss": -7.2294881003243585, "global_step": 202985, "epoch": 4832, "val_loss": 69157.6328125} {"train_loss": -7.165484428405762, "global_step": 202986, "epoch": 4833} {"train_loss": -7.250699043273926, "global_step": 202987, "epoch": 4833} {"train_loss": -7.104818344116211, "global_step": 202988, "epoch": 4833} {"train_loss": -7.2021942138671875, "global_step": 202989, "epoch": 4833} {"train_loss": -7.338136196136475, "global_step": 202990, "epoch": 4833} {"train_loss": -7.190135478973389, "global_step": 202991, "epoch": 4833} {"train_loss": -7.221497535705566, "global_step": 202992, "epoch": 4833} {"train_loss": -7.402196884155273, "global_step": 202993, "epoch": 4833} {"train_loss": -7.13458251953125, "global_step": 202994, "epoch": 4833} {"train_loss": -7.23453426361084, "global_step": 202995, "epoch": 4833} {"train_loss": -7.306719779968262, "global_step": 202996, "epoch": 4833} {"train_loss": -7.290757179260254, "global_step": 202997, "epoch": 4833} {"train_loss": -7.238372802734375, "global_step": 202998, "epoch": 4833} {"train_loss": -7.2769083976745605, "global_step": 202999, "epoch": 4833} {"train_loss": -7.241598129272461, "global_step": 203000, "epoch": 4833} {"train_loss": -7.352010250091553, "global_step": 203001, "epoch": 4833} {"train_loss": -7.2489800453186035, "global_step": 203002, "epoch": 4833} {"train_loss": -7.276063919067383, "global_step": 203003, "epoch": 4833} {"train_loss": -7.226046562194824, "global_step": 203004, "epoch": 4833} {"train_loss": -7.314093589782715, "global_step": 203005, "epoch": 4833} {"train_loss": -7.074276924133301, "global_step": 203006, "epoch": 4833} {"train_loss": -7.21561336517334, "global_step": 203007, "epoch": 4833} {"train_loss": -7.361691474914551, "global_step": 203008, "epoch": 4833} {"train_loss": -7.107619285583496, "global_step": 203009, "epoch": 4833} {"train_loss": -7.219405174255371, "global_step": 203010, "epoch": 4833} {"train_loss": -7.224789619445801, "global_step": 203011, "epoch": 4833} {"train_loss": -7.210461139678955, "global_step": 203012, "epoch": 4833} {"train_loss": -7.280721664428711, "global_step": 203013, "epoch": 4833} {"train_loss": -7.1322526931762695, "global_step": 203014, "epoch": 4833} {"train_loss": -7.142707824707031, "global_step": 203015, "epoch": 4833} {"train_loss": -7.173426628112793, "global_step": 203016, "epoch": 4833} {"train_loss": -7.286791801452637, "global_step": 203017, "epoch": 4833} {"train_loss": -7.2358012199401855, "global_step": 203018, "epoch": 4833} {"train_loss": -7.2045674324035645, "global_step": 203019, "epoch": 4833} {"train_loss": -7.314523696899414, "global_step": 203020, "epoch": 4833} {"train_loss": -7.18867301940918, "global_step": 203021, "epoch": 4833} {"train_loss": -7.230864524841309, "global_step": 203022, "epoch": 4833} {"train_loss": -7.230993270874023, "global_step": 203023, "epoch": 4833} {"train_loss": -7.220877170562744, "global_step": 203024, "epoch": 4833} {"train_loss": -7.242836952209473, "global_step": 203025, "epoch": 4833} {"train_loss": -7.237091541290283, "global_step": 203026, "epoch": 4833} {"train_loss": -7.230780839920044, "global_step": 203027, "epoch": 4833, "val_loss": 68948.6640625} {"train_loss": -7.317014694213867, "global_step": 203028, "epoch": 4834} {"train_loss": -7.278729438781738, "global_step": 203029, "epoch": 4834} {"train_loss": -7.231518745422363, "global_step": 203030, "epoch": 4834} {"train_loss": -7.184720993041992, "global_step": 203031, "epoch": 4834} {"train_loss": -7.202363014221191, "global_step": 203032, "epoch": 4834} {"train_loss": -7.256036758422852, "global_step": 203033, "epoch": 4834} {"train_loss": -7.276928424835205, "global_step": 203034, "epoch": 4834} {"train_loss": -7.275397777557373, "global_step": 203035, "epoch": 4834} {"train_loss": -7.191070556640625, "global_step": 203036, "epoch": 4834} {"train_loss": -7.196878433227539, "global_step": 203037, "epoch": 4834} {"train_loss": -7.211811065673828, "global_step": 203038, "epoch": 4834} {"train_loss": -7.325089454650879, "global_step": 203039, "epoch": 4834} {"train_loss": -7.296402931213379, "global_step": 203040, "epoch": 4834} {"train_loss": -7.273283958435059, "global_step": 203041, "epoch": 4834} {"train_loss": -7.301664352416992, "global_step": 203042, "epoch": 4834} {"train_loss": -7.291303634643555, "global_step": 203043, "epoch": 4834} {"train_loss": -7.223465919494629, "global_step": 203044, "epoch": 4834} {"train_loss": -7.2428483963012695, "global_step": 203045, "epoch": 4834} {"train_loss": -7.243905544281006, "global_step": 203046, "epoch": 4834} {"train_loss": -7.223562717437744, "global_step": 203047, "epoch": 4834} {"train_loss": -7.3030219078063965, "global_step": 203048, "epoch": 4834} {"train_loss": -7.2812604904174805, "global_step": 203049, "epoch": 4834} {"train_loss": -7.217649936676025, "global_step": 203050, "epoch": 4834} {"train_loss": -7.246229648590088, "global_step": 203051, "epoch": 4834} {"train_loss": -7.24998664855957, "global_step": 203052, "epoch": 4834} {"train_loss": -7.268561363220215, "global_step": 203053, "epoch": 4834} {"train_loss": -7.2690839767456055, "global_step": 203054, "epoch": 4834} {"train_loss": -7.256253242492676, "global_step": 203055, "epoch": 4834} {"train_loss": -7.190749168395996, "global_step": 203056, "epoch": 4834} {"train_loss": -7.224071979522705, "global_step": 203057, "epoch": 4834} {"train_loss": -7.241344451904297, "global_step": 203058, "epoch": 4834} {"train_loss": -7.280054092407227, "global_step": 203059, "epoch": 4834} {"train_loss": -7.210866928100586, "global_step": 203060, "epoch": 4834} {"train_loss": -7.233351230621338, "global_step": 203061, "epoch": 4834} {"train_loss": -7.238345146179199, "global_step": 203062, "epoch": 4834} {"train_loss": -7.2324910163879395, "global_step": 203063, "epoch": 4834} {"train_loss": -7.156579494476318, "global_step": 203064, "epoch": 4834} {"train_loss": -7.211484432220459, "global_step": 203065, "epoch": 4834} {"train_loss": -7.190926551818848, "global_step": 203066, "epoch": 4834} {"train_loss": -7.162674427032471, "global_step": 203067, "epoch": 4834} {"train_loss": -7.229738235473633, "global_step": 203068, "epoch": 4834} {"train_loss": -7.238842146737235, "global_step": 203069, "epoch": 4834, "val_loss": 69126.328125} {"train_loss": -7.142226219177246, "global_step": 203070, "epoch": 4835} {"train_loss": -7.184887886047363, "global_step": 203071, "epoch": 4835} {"train_loss": -7.293911933898926, "global_step": 203072, "epoch": 4835} {"train_loss": -7.304344654083252, "global_step": 203073, "epoch": 4835} {"train_loss": -7.175741195678711, "global_step": 203074, "epoch": 4835} {"train_loss": -7.134299278259277, "global_step": 203075, "epoch": 4835} {"train_loss": -7.230457305908203, "global_step": 203076, "epoch": 4835} {"train_loss": -7.131841659545898, "global_step": 203077, "epoch": 4835} {"train_loss": -7.258338928222656, "global_step": 203078, "epoch": 4835} {"train_loss": -7.10844087600708, "global_step": 203079, "epoch": 4835} {"train_loss": -7.247370719909668, "global_step": 203080, "epoch": 4835} {"train_loss": -7.219492435455322, "global_step": 203081, "epoch": 4835} {"train_loss": -7.015756130218506, "global_step": 203082, "epoch": 4835} {"train_loss": -7.227326393127441, "global_step": 203083, "epoch": 4835} {"train_loss": -7.180262565612793, "global_step": 203084, "epoch": 4835} {"train_loss": -7.30949592590332, "global_step": 203085, "epoch": 4835} {"train_loss": -7.203616619110107, "global_step": 203086, "epoch": 4835} {"train_loss": -7.193544387817383, "global_step": 203087, "epoch": 4835} {"train_loss": -7.385598182678223, "global_step": 203088, "epoch": 4835} {"train_loss": -7.28637170791626, "global_step": 203089, "epoch": 4835} {"train_loss": -7.240294933319092, "global_step": 203090, "epoch": 4835} {"train_loss": -7.164200782775879, "global_step": 203091, "epoch": 4835} {"train_loss": -7.164752960205078, "global_step": 203092, "epoch": 4835} {"train_loss": -7.268665790557861, "global_step": 203093, "epoch": 4835} {"train_loss": -7.200852870941162, "global_step": 203094, "epoch": 4835} {"train_loss": -7.041268825531006, "global_step": 203095, "epoch": 4835} {"train_loss": -7.187152862548828, "global_step": 203096, "epoch": 4835} {"train_loss": -7.123093128204346, "global_step": 203097, "epoch": 4835} {"train_loss": -7.139554023742676, "global_step": 203098, "epoch": 4835} {"train_loss": -7.049078941345215, "global_step": 203099, "epoch": 4835} {"train_loss": -7.244553089141846, "global_step": 203100, "epoch": 4835} {"train_loss": -7.184723854064941, "global_step": 203101, "epoch": 4835} {"train_loss": -7.241213321685791, "global_step": 203102, "epoch": 4835} {"train_loss": -7.345585823059082, "global_step": 203103, "epoch": 4835} {"train_loss": -7.078051567077637, "global_step": 203104, "epoch": 4835} {"train_loss": -7.396495819091797, "global_step": 203105, "epoch": 4835} {"train_loss": -7.265481948852539, "global_step": 203106, "epoch": 4835} {"train_loss": -7.278676986694336, "global_step": 203107, "epoch": 4835} {"train_loss": -7.241554260253906, "global_step": 203108, "epoch": 4835} {"train_loss": -7.190430641174316, "global_step": 203109, "epoch": 4835} {"train_loss": -7.323456764221191, "global_step": 203110, "epoch": 4835} {"train_loss": -7.210444938568842, "global_step": 203111, "epoch": 4835, "val_loss": 69133.109375} {"train_loss": -7.275084495544434, "global_step": 203112, "epoch": 4836} {"train_loss": -7.174638748168945, "global_step": 203113, "epoch": 4836} {"train_loss": -7.201897621154785, "global_step": 203114, "epoch": 4836} {"train_loss": -7.271280288696289, "global_step": 203115, "epoch": 4836} {"train_loss": -7.278515815734863, "global_step": 203116, "epoch": 4836} {"train_loss": -7.231766700744629, "global_step": 203117, "epoch": 4836} {"train_loss": -7.361120700836182, "global_step": 203118, "epoch": 4836} {"train_loss": -7.294726371765137, "global_step": 203119, "epoch": 4836} {"train_loss": -7.278654098510742, "global_step": 203120, "epoch": 4836} {"train_loss": -7.158657073974609, "global_step": 203121, "epoch": 4836} {"train_loss": -7.40024471282959, "global_step": 203122, "epoch": 4836} {"train_loss": -7.228864669799805, "global_step": 203123, "epoch": 4836} {"train_loss": -7.2614545822143555, "global_step": 203124, "epoch": 4836} {"train_loss": -7.326378345489502, "global_step": 203125, "epoch": 4836} {"train_loss": -7.201470375061035, "global_step": 203126, "epoch": 4836} {"train_loss": -7.27019739151001, "global_step": 203127, "epoch": 4836} {"train_loss": -7.178554058074951, "global_step": 203128, "epoch": 4836} {"train_loss": -7.204179763793945, "global_step": 203129, "epoch": 4836} {"train_loss": -7.2502336502075195, "global_step": 203130, "epoch": 4836} {"train_loss": -7.282698631286621, "global_step": 203131, "epoch": 4836} {"train_loss": -7.272071361541748, "global_step": 203132, "epoch": 4836} {"train_loss": -7.24518346786499, "global_step": 203133, "epoch": 4836} {"train_loss": -7.142648696899414, "global_step": 203134, "epoch": 4836} {"train_loss": -7.199373245239258, "global_step": 203135, "epoch": 4836} {"train_loss": -7.356417655944824, "global_step": 203136, "epoch": 4836} {"train_loss": -7.291751861572266, "global_step": 203137, "epoch": 4836} {"train_loss": -7.272062301635742, "global_step": 203138, "epoch": 4836} {"train_loss": -7.178493976593018, "global_step": 203139, "epoch": 4836} {"train_loss": -7.278745651245117, "global_step": 203140, "epoch": 4836} {"train_loss": -7.29695463180542, "global_step": 203141, "epoch": 4836} {"train_loss": -7.207904815673828, "global_step": 203142, "epoch": 4836} {"train_loss": -7.1986799240112305, "global_step": 203143, "epoch": 4836} {"train_loss": -7.191316604614258, "global_step": 203144, "epoch": 4836} {"train_loss": -7.108257293701172, "global_step": 203145, "epoch": 4836} {"train_loss": -7.179129600524902, "global_step": 203146, "epoch": 4836} {"train_loss": -7.138980865478516, "global_step": 203147, "epoch": 4836} {"train_loss": -7.035560607910156, "global_step": 203148, "epoch": 4836} {"train_loss": -7.119548797607422, "global_step": 203149, "epoch": 4836} {"train_loss": -7.074512481689453, "global_step": 203150, "epoch": 4836} {"train_loss": -7.06763219833374, "global_step": 203151, "epoch": 4836} {"train_loss": -7.1809892654418945, "global_step": 203152, "epoch": 4836} {"train_loss": -7.2193997133345835, "global_step": 203153, "epoch": 4836, "val_loss": 69196.09375} {"train_loss": -7.054903030395508, "global_step": 203154, "epoch": 4837} {"train_loss": -6.9935383796691895, "global_step": 203155, "epoch": 4837} {"train_loss": -6.940621376037598, "global_step": 203156, "epoch": 4837} {"train_loss": -7.047228813171387, "global_step": 203157, "epoch": 4837} {"train_loss": -7.124610900878906, "global_step": 203158, "epoch": 4837} {"train_loss": -7.136898994445801, "global_step": 203159, "epoch": 4837} {"train_loss": -7.176408290863037, "global_step": 203160, "epoch": 4837} {"train_loss": -7.12791633605957, "global_step": 203161, "epoch": 4837} {"train_loss": -7.311938285827637, "global_step": 203162, "epoch": 4837} {"train_loss": -7.131386756896973, "global_step": 203163, "epoch": 4837} {"train_loss": -7.20258903503418, "global_step": 203164, "epoch": 4837} {"train_loss": -7.309982776641846, "global_step": 203165, "epoch": 4837} {"train_loss": -7.218457221984863, "global_step": 203166, "epoch": 4837} {"train_loss": -7.139370918273926, "global_step": 203167, "epoch": 4837} {"train_loss": -7.178524494171143, "global_step": 203168, "epoch": 4837} {"train_loss": -7.293297290802002, "global_step": 203169, "epoch": 4837} {"train_loss": -7.245594024658203, "global_step": 203170, "epoch": 4837} {"train_loss": -7.257225513458252, "global_step": 203171, "epoch": 4837} {"train_loss": -7.225207328796387, "global_step": 203172, "epoch": 4837} {"train_loss": -7.1838579177856445, "global_step": 203173, "epoch": 4837} {"train_loss": -7.282301902770996, "global_step": 203174, "epoch": 4837} {"train_loss": -7.305356979370117, "global_step": 203175, "epoch": 4837} {"train_loss": -7.289909362792969, "global_step": 203176, "epoch": 4837} {"train_loss": -7.331310272216797, "global_step": 203177, "epoch": 4837} {"train_loss": -7.123684883117676, "global_step": 203178, "epoch": 4837} {"train_loss": -7.28653621673584, "global_step": 203179, "epoch": 4837} {"train_loss": -7.270369529724121, "global_step": 203180, "epoch": 4837} {"train_loss": -7.313338279724121, "global_step": 203181, "epoch": 4837} {"train_loss": -7.22139835357666, "global_step": 203182, "epoch": 4837} {"train_loss": -7.250697135925293, "global_step": 203183, "epoch": 4837} {"train_loss": -7.128474235534668, "global_step": 203184, "epoch": 4837} {"train_loss": -7.034578800201416, "global_step": 203185, "epoch": 4837} {"train_loss": -7.334490776062012, "global_step": 203186, "epoch": 4837} {"train_loss": -7.309342861175537, "global_step": 203187, "epoch": 4837} {"train_loss": -7.138340473175049, "global_step": 203188, "epoch": 4837} {"train_loss": -7.319522857666016, "global_step": 203189, "epoch": 4837} {"train_loss": -7.11939811706543, "global_step": 203190, "epoch": 4837} {"train_loss": -7.207756996154785, "global_step": 203191, "epoch": 4837} {"train_loss": -7.346660614013672, "global_step": 203192, "epoch": 4837} {"train_loss": -7.229226112365723, "global_step": 203193, "epoch": 4837} {"train_loss": -7.239971160888672, "global_step": 203194, "epoch": 4837} {"train_loss": -7.205139137449718, "global_step": 203195, "epoch": 4837, "val_loss": 69122.6796875} {"train_loss": -7.169120788574219, "global_step": 203196, "epoch": 4838} {"train_loss": -7.252397537231445, "global_step": 203197, "epoch": 4838} {"train_loss": -7.289939880371094, "global_step": 203198, "epoch": 4838} {"train_loss": -7.343975067138672, "global_step": 203199, "epoch": 4838} {"train_loss": -7.240622520446777, "global_step": 203200, "epoch": 4838} {"train_loss": -7.342272758483887, "global_step": 203201, "epoch": 4838} {"train_loss": -7.295440196990967, "global_step": 203202, "epoch": 4838} {"train_loss": -7.230064868927002, "global_step": 203203, "epoch": 4838} {"train_loss": -7.247072696685791, "global_step": 203204, "epoch": 4838} {"train_loss": -7.278371334075928, "global_step": 203205, "epoch": 4838} {"train_loss": -7.243547439575195, "global_step": 203206, "epoch": 4838} {"train_loss": -7.308997631072998, "global_step": 203207, "epoch": 4838} {"train_loss": -7.163498878479004, "global_step": 203208, "epoch": 4838} {"train_loss": -7.233153820037842, "global_step": 203209, "epoch": 4838} {"train_loss": -7.236729145050049, "global_step": 203210, "epoch": 4838} {"train_loss": -7.2644524574279785, "global_step": 203211, "epoch": 4838} {"train_loss": -7.221177101135254, "global_step": 203212, "epoch": 4838} {"train_loss": -7.2861175537109375, "global_step": 203213, "epoch": 4838} {"train_loss": -7.17179012298584, "global_step": 203214, "epoch": 4838} {"train_loss": -7.26020622253418, "global_step": 203215, "epoch": 4838} {"train_loss": -7.158698081970215, "global_step": 203216, "epoch": 4838} {"train_loss": -7.273388862609863, "global_step": 203217, "epoch": 4838} {"train_loss": -7.148183822631836, "global_step": 203218, "epoch": 4838} {"train_loss": -7.136723518371582, "global_step": 203219, "epoch": 4838} {"train_loss": -7.330815315246582, "global_step": 203220, "epoch": 4838} {"train_loss": -7.225769996643066, "global_step": 203221, "epoch": 4838} {"train_loss": -7.205095291137695, "global_step": 203222, "epoch": 4838} {"train_loss": -7.230792999267578, "global_step": 203223, "epoch": 4838} {"train_loss": -7.119316101074219, "global_step": 203224, "epoch": 4838} {"train_loss": -7.26053524017334, "global_step": 203225, "epoch": 4838} {"train_loss": -7.3606276512146, "global_step": 203226, "epoch": 4838} {"train_loss": -7.095995903015137, "global_step": 203227, "epoch": 4838} {"train_loss": -7.248879432678223, "global_step": 203228, "epoch": 4838} {"train_loss": -7.113100528717041, "global_step": 203229, "epoch": 4838} {"train_loss": -7.223293304443359, "global_step": 203230, "epoch": 4838} {"train_loss": -7.259283065795898, "global_step": 203231, "epoch": 4838} {"train_loss": -7.285583019256592, "global_step": 203232, "epoch": 4838} {"train_loss": -7.190404891967773, "global_step": 203233, "epoch": 4838} {"train_loss": -7.260226249694824, "global_step": 203234, "epoch": 4838} {"train_loss": -7.352996349334717, "global_step": 203235, "epoch": 4838} {"train_loss": -7.317461013793945, "global_step": 203236, "epoch": 4838} {"train_loss": -7.242255835306077, "global_step": 203237, "epoch": 4838, "val_loss": 69107.6328125} {"train_loss": -7.204439163208008, "global_step": 203238, "epoch": 4839} {"train_loss": -7.2551589012146, "global_step": 203239, "epoch": 4839} {"train_loss": -7.21834659576416, "global_step": 203240, "epoch": 4839} {"train_loss": -7.114195823669434, "global_step": 203241, "epoch": 4839} {"train_loss": -7.16389274597168, "global_step": 203242, "epoch": 4839} {"train_loss": -7.192298889160156, "global_step": 203243, "epoch": 4839} {"train_loss": -7.305898666381836, "global_step": 203244, "epoch": 4839} {"train_loss": -7.096169948577881, "global_step": 203245, "epoch": 4839} {"train_loss": -7.081518173217773, "global_step": 203246, "epoch": 4839} {"train_loss": -7.246258735656738, "global_step": 203247, "epoch": 4839} {"train_loss": -7.033626556396484, "global_step": 203248, "epoch": 4839} {"train_loss": -7.191873550415039, "global_step": 203249, "epoch": 4839} {"train_loss": -7.030500411987305, "global_step": 203250, "epoch": 4839} {"train_loss": -7.182706356048584, "global_step": 203251, "epoch": 4839} {"train_loss": -7.172308921813965, "global_step": 203252, "epoch": 4839} {"train_loss": -7.088824272155762, "global_step": 203253, "epoch": 4839} {"train_loss": -7.137302398681641, "global_step": 203254, "epoch": 4839} {"train_loss": -7.147720813751221, "global_step": 203255, "epoch": 4839} {"train_loss": -7.215673446655273, "global_step": 203256, "epoch": 4839} {"train_loss": -7.317174434661865, "global_step": 203257, "epoch": 4839} {"train_loss": -7.244684219360352, "global_step": 203258, "epoch": 4839} {"train_loss": -7.213475227355957, "global_step": 203259, "epoch": 4839} {"train_loss": -7.134604454040527, "global_step": 203260, "epoch": 4839} {"train_loss": -7.197619438171387, "global_step": 203261, "epoch": 4839} {"train_loss": -7.194592475891113, "global_step": 203262, "epoch": 4839} {"train_loss": -7.18477725982666, "global_step": 203263, "epoch": 4839} {"train_loss": -7.222158432006836, "global_step": 203264, "epoch": 4839} {"train_loss": -7.166736602783203, "global_step": 203265, "epoch": 4839} {"train_loss": -7.0630412101745605, "global_step": 203266, "epoch": 4839} {"train_loss": -7.078981399536133, "global_step": 203267, "epoch": 4839} {"train_loss": -7.069555282592773, "global_step": 203268, "epoch": 4839} {"train_loss": -7.106205940246582, "global_step": 203269, "epoch": 4839} {"train_loss": -7.2106828689575195, "global_step": 203270, "epoch": 4839} {"train_loss": -7.091248512268066, "global_step": 203271, "epoch": 4839} {"train_loss": -7.1323442459106445, "global_step": 203272, "epoch": 4839} {"train_loss": -7.221823215484619, "global_step": 203273, "epoch": 4839} {"train_loss": -7.192230224609375, "global_step": 203274, "epoch": 4839} {"train_loss": -7.322152137756348, "global_step": 203275, "epoch": 4839} {"train_loss": -7.193631172180176, "global_step": 203276, "epoch": 4839} {"train_loss": -7.2551422119140625, "global_step": 203277, "epoch": 4839} {"train_loss": -7.266269683837891, "global_step": 203278, "epoch": 4839} {"train_loss": -7.174994502748762, "global_step": 203279, "epoch": 4839, "val_loss": 69289.3046875} {"train_loss": -7.247505187988281, "global_step": 203280, "epoch": 4840} {"train_loss": -7.248530864715576, "global_step": 203281, "epoch": 4840} {"train_loss": -7.223223686218262, "global_step": 203282, "epoch": 4840} {"train_loss": -7.415074825286865, "global_step": 203283, "epoch": 4840} {"train_loss": -7.226335525512695, "global_step": 203284, "epoch": 4840} {"train_loss": -7.210200309753418, "global_step": 203285, "epoch": 4840} {"train_loss": -7.341793060302734, "global_step": 203286, "epoch": 4840} {"train_loss": -7.249002456665039, "global_step": 203287, "epoch": 4840} {"train_loss": -7.2418317794799805, "global_step": 203288, "epoch": 4840} {"train_loss": -7.229328155517578, "global_step": 203289, "epoch": 4840} {"train_loss": -7.2658185958862305, "global_step": 203290, "epoch": 4840} {"train_loss": -7.271383762359619, "global_step": 203291, "epoch": 4840} {"train_loss": -7.216169834136963, "global_step": 203292, "epoch": 4840} {"train_loss": -7.297702312469482, "global_step": 203293, "epoch": 4840} {"train_loss": -7.30856466293335, "global_step": 203294, "epoch": 4840} {"train_loss": -7.338173866271973, "global_step": 203295, "epoch": 4840} {"train_loss": -7.4029388427734375, "global_step": 203296, "epoch": 4840} {"train_loss": -7.228915691375732, "global_step": 203297, "epoch": 4840} {"train_loss": -7.325838565826416, "global_step": 203298, "epoch": 4840} {"train_loss": -7.214294910430908, "global_step": 203299, "epoch": 4840} {"train_loss": -7.15284538269043, "global_step": 203300, "epoch": 4840} {"train_loss": -7.202569484710693, "global_step": 203301, "epoch": 4840} {"train_loss": -7.267522811889648, "global_step": 203302, "epoch": 4840} {"train_loss": -7.293995380401611, "global_step": 203303, "epoch": 4840} {"train_loss": -7.262303352355957, "global_step": 203304, "epoch": 4840} {"train_loss": -7.346569061279297, "global_step": 203305, "epoch": 4840} {"train_loss": -7.331390857696533, "global_step": 203306, "epoch": 4840} {"train_loss": -7.3075761795043945, "global_step": 203307, "epoch": 4840} {"train_loss": -7.243458271026611, "global_step": 203308, "epoch": 4840} {"train_loss": -7.351564407348633, "global_step": 203309, "epoch": 4840} {"train_loss": -7.389217376708984, "global_step": 203310, "epoch": 4840} {"train_loss": -7.286310195922852, "global_step": 203311, "epoch": 4840} {"train_loss": -7.157304286956787, "global_step": 203312, "epoch": 4840} {"train_loss": -7.225572109222412, "global_step": 203313, "epoch": 4840} {"train_loss": -7.250633716583252, "global_step": 203314, "epoch": 4840} {"train_loss": -7.419258117675781, "global_step": 203315, "epoch": 4840} {"train_loss": -7.368662357330322, "global_step": 203316, "epoch": 4840} {"train_loss": -7.276401042938232, "global_step": 203317, "epoch": 4840} {"train_loss": -7.310513496398926, "global_step": 203318, "epoch": 4840} {"train_loss": -7.197162628173828, "global_step": 203319, "epoch": 4840} {"train_loss": -7.28813362121582, "global_step": 203320, "epoch": 4840} {"train_loss": -7.2805283183143255, "global_step": 203321, "epoch": 4840, "val_loss": 69133.8515625} {"train_loss": -7.172492980957031, "global_step": 203322, "epoch": 4841} {"train_loss": -7.179038047790527, "global_step": 203323, "epoch": 4841} {"train_loss": -7.2926836013793945, "global_step": 203324, "epoch": 4841} {"train_loss": -7.13228702545166, "global_step": 203325, "epoch": 4841} {"train_loss": -7.150522232055664, "global_step": 203326, "epoch": 4841} {"train_loss": -7.3404011726379395, "global_step": 203327, "epoch": 4841} {"train_loss": -7.156248092651367, "global_step": 203328, "epoch": 4841} {"train_loss": -7.190699577331543, "global_step": 203329, "epoch": 4841} {"train_loss": -7.249528884887695, "global_step": 203330, "epoch": 4841} {"train_loss": -7.2506890296936035, "global_step": 203331, "epoch": 4841} {"train_loss": -7.236682891845703, "global_step": 203332, "epoch": 4841} {"train_loss": -7.179579257965088, "global_step": 203333, "epoch": 4841} {"train_loss": -7.32039737701416, "global_step": 203334, "epoch": 4841} {"train_loss": -7.226224899291992, "global_step": 203335, "epoch": 4841} {"train_loss": -7.184492111206055, "global_step": 203336, "epoch": 4841} {"train_loss": -7.319936752319336, "global_step": 203337, "epoch": 4841} {"train_loss": -7.050887584686279, "global_step": 203338, "epoch": 4841} {"train_loss": -7.232647895812988, "global_step": 203339, "epoch": 4841} {"train_loss": -7.2162322998046875, "global_step": 203340, "epoch": 4841} {"train_loss": -7.053213596343994, "global_step": 203341, "epoch": 4841} {"train_loss": -7.234187126159668, "global_step": 203342, "epoch": 4841} {"train_loss": -7.240517616271973, "global_step": 203343, "epoch": 4841} {"train_loss": -7.1511921882629395, "global_step": 203344, "epoch": 4841} {"train_loss": -7.194199562072754, "global_step": 203345, "epoch": 4841} {"train_loss": -7.217863082885742, "global_step": 203346, "epoch": 4841} {"train_loss": -7.2256975173950195, "global_step": 203347, "epoch": 4841} {"train_loss": -7.120847702026367, "global_step": 203348, "epoch": 4841} {"train_loss": -7.227344512939453, "global_step": 203349, "epoch": 4841} {"train_loss": -7.136780738830566, "global_step": 203350, "epoch": 4841} {"train_loss": -7.185347557067871, "global_step": 203351, "epoch": 4841} {"train_loss": -7.131841659545898, "global_step": 203352, "epoch": 4841} {"train_loss": -7.092698097229004, "global_step": 203353, "epoch": 4841} {"train_loss": -7.117812156677246, "global_step": 203354, "epoch": 4841} {"train_loss": -6.995400905609131, "global_step": 203355, "epoch": 4841} {"train_loss": -7.204102516174316, "global_step": 203356, "epoch": 4841} {"train_loss": -7.1487345695495605, "global_step": 203357, "epoch": 4841} {"train_loss": -7.18479585647583, "global_step": 203358, "epoch": 4841} {"train_loss": -7.32604455947876, "global_step": 203359, "epoch": 4841} {"train_loss": -7.096581935882568, "global_step": 203360, "epoch": 4841} {"train_loss": -7.211981773376465, "global_step": 203361, "epoch": 4841} {"train_loss": -7.146369934082031, "global_step": 203362, "epoch": 4841} {"train_loss": -7.188417377926054, "global_step": 203363, "epoch": 4841, "val_loss": 68915.71875} {"train_loss": -7.190777778625488, "global_step": 203364, "epoch": 4842} {"train_loss": -7.2688093185424805, "global_step": 203365, "epoch": 4842} {"train_loss": -7.234046936035156, "global_step": 203366, "epoch": 4842} {"train_loss": -7.023622512817383, "global_step": 203367, "epoch": 4842} {"train_loss": -7.160628795623779, "global_step": 203368, "epoch": 4842} {"train_loss": -7.222629547119141, "global_step": 203369, "epoch": 4842} {"train_loss": -7.138639450073242, "global_step": 203370, "epoch": 4842} {"train_loss": -7.142220497131348, "global_step": 203371, "epoch": 4842} {"train_loss": -7.168501377105713, "global_step": 203372, "epoch": 4842} {"train_loss": -7.225750923156738, "global_step": 203373, "epoch": 4842} {"train_loss": -7.2900190353393555, "global_step": 203374, "epoch": 4842} {"train_loss": -7.184882164001465, "global_step": 203375, "epoch": 4842} {"train_loss": -7.249248504638672, "global_step": 203376, "epoch": 4842} {"train_loss": -7.159858226776123, "global_step": 203377, "epoch": 4842} {"train_loss": -7.33988094329834, "global_step": 203378, "epoch": 4842} {"train_loss": -7.244559288024902, "global_step": 203379, "epoch": 4842} {"train_loss": -7.211376190185547, "global_step": 203380, "epoch": 4842} {"train_loss": -7.283896446228027, "global_step": 203381, "epoch": 4842} {"train_loss": -7.132675647735596, "global_step": 203382, "epoch": 4842} {"train_loss": -7.157076835632324, "global_step": 203383, "epoch": 4842} {"train_loss": -7.220697402954102, "global_step": 203384, "epoch": 4842} {"train_loss": -7.245874404907227, "global_step": 203385, "epoch": 4842} {"train_loss": -7.202010631561279, "global_step": 203386, "epoch": 4842} {"train_loss": -7.192580223083496, "global_step": 203387, "epoch": 4842} {"train_loss": -7.223423957824707, "global_step": 203388, "epoch": 4842} {"train_loss": -7.130612373352051, "global_step": 203389, "epoch": 4842} {"train_loss": -7.17857551574707, "global_step": 203390, "epoch": 4842} {"train_loss": -7.037339687347412, "global_step": 203391, "epoch": 4842} {"train_loss": -7.12235164642334, "global_step": 203392, "epoch": 4842} {"train_loss": -7.242166519165039, "global_step": 203393, "epoch": 4842} {"train_loss": -7.1380109786987305, "global_step": 203394, "epoch": 4842} {"train_loss": -7.154543876647949, "global_step": 203395, "epoch": 4842} {"train_loss": -6.945621967315674, "global_step": 203396, "epoch": 4842} {"train_loss": -7.259103775024414, "global_step": 203397, "epoch": 4842} {"train_loss": -6.9350504875183105, "global_step": 203398, "epoch": 4842} {"train_loss": -7.212774753570557, "global_step": 203399, "epoch": 4842} {"train_loss": -6.926642417907715, "global_step": 203400, "epoch": 4842} {"train_loss": -7.137973308563232, "global_step": 203401, "epoch": 4842} {"train_loss": -6.877617835998535, "global_step": 203402, "epoch": 4842} {"train_loss": -7.089098930358887, "global_step": 203403, "epoch": 4842} {"train_loss": -7.089883804321289, "global_step": 203404, "epoch": 4842} {"train_loss": -7.156611045201619, "global_step": 203405, "epoch": 4842, "val_loss": 69325.7578125} {"train_loss": -6.947405815124512, "global_step": 203406, "epoch": 4843} {"train_loss": -6.892093658447266, "global_step": 203407, "epoch": 4843} {"train_loss": -7.024245262145996, "global_step": 203408, "epoch": 4843} {"train_loss": -7.093277931213379, "global_step": 203409, "epoch": 4843} {"train_loss": -7.011491298675537, "global_step": 203410, "epoch": 4843} {"train_loss": -7.142515182495117, "global_step": 203411, "epoch": 4843} {"train_loss": -7.052403450012207, "global_step": 203412, "epoch": 4843} {"train_loss": -7.123434543609619, "global_step": 203413, "epoch": 4843} {"train_loss": -6.9365692138671875, "global_step": 203414, "epoch": 4843} {"train_loss": -7.199325084686279, "global_step": 203415, "epoch": 4843} {"train_loss": -7.041288375854492, "global_step": 203416, "epoch": 4843} {"train_loss": -7.092776298522949, "global_step": 203417, "epoch": 4843} {"train_loss": -7.03065824508667, "global_step": 203418, "epoch": 4843} {"train_loss": -7.104198932647705, "global_step": 203419, "epoch": 4843} {"train_loss": -7.085003852844238, "global_step": 203420, "epoch": 4843} {"train_loss": -7.274914741516113, "global_step": 203421, "epoch": 4843} {"train_loss": -7.124889373779297, "global_step": 203422, "epoch": 4843} {"train_loss": -7.132219314575195, "global_step": 203423, "epoch": 4843} {"train_loss": -7.249471187591553, "global_step": 203424, "epoch": 4843} {"train_loss": -7.1585187911987305, "global_step": 203425, "epoch": 4843} {"train_loss": -7.296194076538086, "global_step": 203426, "epoch": 4843} {"train_loss": -7.189056873321533, "global_step": 203427, "epoch": 4843} {"train_loss": -7.203367233276367, "global_step": 203428, "epoch": 4843} {"train_loss": -7.321780204772949, "global_step": 203429, "epoch": 4843} {"train_loss": -7.32796049118042, "global_step": 203430, "epoch": 4843} {"train_loss": -7.131654739379883, "global_step": 203431, "epoch": 4843} {"train_loss": -7.22998046875, "global_step": 203432, "epoch": 4843} {"train_loss": -7.260352611541748, "global_step": 203433, "epoch": 4843} {"train_loss": -7.208127021789551, "global_step": 203434, "epoch": 4843} {"train_loss": -7.241138935089111, "global_step": 203435, "epoch": 4843} {"train_loss": -7.339554786682129, "global_step": 203436, "epoch": 4843} {"train_loss": -7.15473747253418, "global_step": 203437, "epoch": 4843} {"train_loss": -7.227855682373047, "global_step": 203438, "epoch": 4843} {"train_loss": -7.233968734741211, "global_step": 203439, "epoch": 4843} {"train_loss": -7.293131351470947, "global_step": 203440, "epoch": 4843} {"train_loss": -7.296136379241943, "global_step": 203441, "epoch": 4843} {"train_loss": -7.260058403015137, "global_step": 203442, "epoch": 4843} {"train_loss": -7.348505973815918, "global_step": 203443, "epoch": 4843} {"train_loss": -7.180676460266113, "global_step": 203444, "epoch": 4843} {"train_loss": -7.354548454284668, "global_step": 203445, "epoch": 4843} {"train_loss": -7.385695457458496, "global_step": 203446, "epoch": 4843} {"train_loss": -7.177244799477713, "global_step": 203447, "epoch": 4843, "val_loss": 69001.390625} {"train_loss": -7.315871238708496, "global_step": 203448, "epoch": 4844} {"train_loss": -7.336850643157959, "global_step": 203449, "epoch": 4844} {"train_loss": -7.368687629699707, "global_step": 203450, "epoch": 4844} {"train_loss": -7.332544803619385, "global_step": 203451, "epoch": 4844} {"train_loss": -7.340357780456543, "global_step": 203452, "epoch": 4844} {"train_loss": -7.2555670738220215, "global_step": 203453, "epoch": 4844} {"train_loss": -7.313357830047607, "global_step": 203454, "epoch": 4844} {"train_loss": -7.231628894805908, "global_step": 203455, "epoch": 4844} {"train_loss": -7.395839214324951, "global_step": 203456, "epoch": 4844} {"train_loss": -7.2791337966918945, "global_step": 203457, "epoch": 4844} {"train_loss": -7.33057975769043, "global_step": 203458, "epoch": 4844} {"train_loss": -7.226607322692871, "global_step": 203459, "epoch": 4844} {"train_loss": -7.299956321716309, "global_step": 203460, "epoch": 4844} {"train_loss": -7.245659828186035, "global_step": 203461, "epoch": 4844} {"train_loss": -7.308814525604248, "global_step": 203462, "epoch": 4844} {"train_loss": -7.301468372344971, "global_step": 203463, "epoch": 4844} {"train_loss": -7.218459129333496, "global_step": 203464, "epoch": 4844} {"train_loss": -7.283634185791016, "global_step": 203465, "epoch": 4844} {"train_loss": -7.31341552734375, "global_step": 203466, "epoch": 4844} {"train_loss": -7.264936447143555, "global_step": 203467, "epoch": 4844} {"train_loss": -7.191951751708984, "global_step": 203468, "epoch": 4844} {"train_loss": -7.29606294631958, "global_step": 203469, "epoch": 4844} {"train_loss": -7.190639019012451, "global_step": 203470, "epoch": 4844} {"train_loss": -7.248745441436768, "global_step": 203471, "epoch": 4844} {"train_loss": -7.292642116546631, "global_step": 203472, "epoch": 4844} {"train_loss": -7.224212169647217, "global_step": 203473, "epoch": 4844} {"train_loss": -7.212743759155273, "global_step": 203474, "epoch": 4844} {"train_loss": -7.193477153778076, "global_step": 203475, "epoch": 4844} {"train_loss": -7.266942977905273, "global_step": 203476, "epoch": 4844} {"train_loss": -7.300276756286621, "global_step": 203477, "epoch": 4844} {"train_loss": -7.334550857543945, "global_step": 203478, "epoch": 4844} {"train_loss": -7.2906694412231445, "global_step": 203479, "epoch": 4844} {"train_loss": -7.3703203201293945, "global_step": 203480, "epoch": 4844} {"train_loss": -7.264071464538574, "global_step": 203481, "epoch": 4844} {"train_loss": -7.296688556671143, "global_step": 203482, "epoch": 4844} {"train_loss": -7.2682905197143555, "global_step": 203483, "epoch": 4844} {"train_loss": -7.2992329597473145, "global_step": 203484, "epoch": 4844} {"train_loss": -7.431116104125977, "global_step": 203485, "epoch": 4844} {"train_loss": -7.363885879516602, "global_step": 203486, "epoch": 4844} {"train_loss": -7.474149703979492, "global_step": 203487, "epoch": 4844} {"train_loss": -7.400736331939697, "global_step": 203488, "epoch": 4844} {"train_loss": -7.296911636988322, "global_step": 203489, "epoch": 4844, "val_loss": 69068.4140625} {"train_loss": -7.416457176208496, "global_step": 203490, "epoch": 4845} {"train_loss": -7.29676628112793, "global_step": 203491, "epoch": 4845} {"train_loss": -7.297821044921875, "global_step": 203492, "epoch": 4845} {"train_loss": -7.162178039550781, "global_step": 203493, "epoch": 4845} {"train_loss": -7.324589252471924, "global_step": 203494, "epoch": 4845} {"train_loss": -7.279431343078613, "global_step": 203495, "epoch": 4845} {"train_loss": -7.167988300323486, "global_step": 203496, "epoch": 4845} {"train_loss": -7.343327522277832, "global_step": 203497, "epoch": 4845} {"train_loss": -7.2871575355529785, "global_step": 203498, "epoch": 4845} {"train_loss": -7.278115272521973, "global_step": 203499, "epoch": 4845} {"train_loss": -7.283458709716797, "global_step": 203500, "epoch": 4845} {"train_loss": -7.332206726074219, "global_step": 203501, "epoch": 4845} {"train_loss": -7.387810230255127, "global_step": 203502, "epoch": 4845} {"train_loss": -7.374805450439453, "global_step": 203503, "epoch": 4845} {"train_loss": -7.259577751159668, "global_step": 203504, "epoch": 4845} {"train_loss": -7.27034854888916, "global_step": 203505, "epoch": 4845} {"train_loss": -7.326717376708984, "global_step": 203506, "epoch": 4845} {"train_loss": -7.404254913330078, "global_step": 203507, "epoch": 4845} {"train_loss": -7.282109260559082, "global_step": 203508, "epoch": 4845} {"train_loss": -7.286978721618652, "global_step": 203509, "epoch": 4845} {"train_loss": -7.380407333374023, "global_step": 203510, "epoch": 4845} {"train_loss": -7.24318265914917, "global_step": 203511, "epoch": 4845} {"train_loss": -7.239113807678223, "global_step": 203512, "epoch": 4845} {"train_loss": -7.26315975189209, "global_step": 203513, "epoch": 4845} {"train_loss": -7.224547386169434, "global_step": 203514, "epoch": 4845} {"train_loss": -7.352414131164551, "global_step": 203515, "epoch": 4845} {"train_loss": -7.305934906005859, "global_step": 203516, "epoch": 4845} {"train_loss": -7.253471374511719, "global_step": 203517, "epoch": 4845} {"train_loss": -7.298688888549805, "global_step": 203518, "epoch": 4845} {"train_loss": -7.305269718170166, "global_step": 203519, "epoch": 4845} {"train_loss": -7.227451324462891, "global_step": 203520, "epoch": 4845} {"train_loss": -7.273252487182617, "global_step": 203521, "epoch": 4845} {"train_loss": -7.2247161865234375, "global_step": 203522, "epoch": 4845} {"train_loss": -7.286995887756348, "global_step": 203523, "epoch": 4845} {"train_loss": -7.195093631744385, "global_step": 203524, "epoch": 4845} {"train_loss": -7.241517066955566, "global_step": 203525, "epoch": 4845} {"train_loss": -7.221132278442383, "global_step": 203526, "epoch": 4845} {"train_loss": -7.311509609222412, "global_step": 203527, "epoch": 4845} {"train_loss": -7.359598159790039, "global_step": 203528, "epoch": 4845} {"train_loss": -7.249958038330078, "global_step": 203529, "epoch": 4845} {"train_loss": -7.234923362731934, "global_step": 203530, "epoch": 4845} {"train_loss": -7.28850261370341, "global_step": 203531, "epoch": 4845, "val_loss": 69174.46875} {"train_loss": -7.306924819946289, "global_step": 203532, "epoch": 4846} {"train_loss": -7.256915092468262, "global_step": 203533, "epoch": 4846} {"train_loss": -7.33948278427124, "global_step": 203534, "epoch": 4846} {"train_loss": -7.236239433288574, "global_step": 203535, "epoch": 4846} {"train_loss": -7.2020769119262695, "global_step": 203536, "epoch": 4846} {"train_loss": -7.179351806640625, "global_step": 203537, "epoch": 4846} {"train_loss": -7.1797709465026855, "global_step": 203538, "epoch": 4846} {"train_loss": -7.232699871063232, "global_step": 203539, "epoch": 4846} {"train_loss": -7.28192138671875, "global_step": 203540, "epoch": 4846} {"train_loss": -7.239682197570801, "global_step": 203541, "epoch": 4846} {"train_loss": -7.123663902282715, "global_step": 203542, "epoch": 4846} {"train_loss": -7.192763328552246, "global_step": 203543, "epoch": 4846} {"train_loss": -7.2846598625183105, "global_step": 203544, "epoch": 4846} {"train_loss": -7.289072036743164, "global_step": 203545, "epoch": 4846} {"train_loss": -7.298761367797852, "global_step": 203546, "epoch": 4846} {"train_loss": -7.300821304321289, "global_step": 203547, "epoch": 4846} {"train_loss": -7.291316986083984, "global_step": 203548, "epoch": 4846} {"train_loss": -7.298551559448242, "global_step": 203549, "epoch": 4846} {"train_loss": -7.171125411987305, "global_step": 203550, "epoch": 4846} {"train_loss": -7.296623706817627, "global_step": 203551, "epoch": 4846} {"train_loss": -7.359408378601074, "global_step": 203552, "epoch": 4846} {"train_loss": -7.267557144165039, "global_step": 203553, "epoch": 4846} {"train_loss": -7.271698951721191, "global_step": 203554, "epoch": 4846} {"train_loss": -7.389552116394043, "global_step": 203555, "epoch": 4846} {"train_loss": -7.319177627563477, "global_step": 203556, "epoch": 4846} {"train_loss": -7.248805999755859, "global_step": 203557, "epoch": 4846} {"train_loss": -7.283038139343262, "global_step": 203558, "epoch": 4846} {"train_loss": -7.151352405548096, "global_step": 203559, "epoch": 4846} {"train_loss": -7.255910873413086, "global_step": 203560, "epoch": 4846} {"train_loss": -7.294910430908203, "global_step": 203561, "epoch": 4846} {"train_loss": -7.13218879699707, "global_step": 203562, "epoch": 4846} {"train_loss": -7.238709449768066, "global_step": 203563, "epoch": 4846} {"train_loss": -7.308624267578125, "global_step": 203564, "epoch": 4846} {"train_loss": -7.066917896270752, "global_step": 203565, "epoch": 4846} {"train_loss": -7.298165321350098, "global_step": 203566, "epoch": 4846} {"train_loss": -7.051903247833252, "global_step": 203567, "epoch": 4846} {"train_loss": -7.186284065246582, "global_step": 203568, "epoch": 4846} {"train_loss": -7.219537258148193, "global_step": 203569, "epoch": 4846} {"train_loss": -7.201469421386719, "global_step": 203570, "epoch": 4846} {"train_loss": -7.3295087814331055, "global_step": 203571, "epoch": 4846} {"train_loss": -7.135439395904541, "global_step": 203572, "epoch": 4846} {"train_loss": -7.242444174630301, "global_step": 203573, "epoch": 4846, "val_loss": 69153.5234375} {"train_loss": -7.050411224365234, "global_step": 203574, "epoch": 4847} {"train_loss": -7.148163318634033, "global_step": 203575, "epoch": 4847} {"train_loss": -7.192918300628662, "global_step": 203576, "epoch": 4847} {"train_loss": -7.158267974853516, "global_step": 203577, "epoch": 4847} {"train_loss": -7.229228973388672, "global_step": 203578, "epoch": 4847} {"train_loss": -7.330894947052002, "global_step": 203579, "epoch": 4847} {"train_loss": -7.177886486053467, "global_step": 203580, "epoch": 4847} {"train_loss": -7.364995002746582, "global_step": 203581, "epoch": 4847} {"train_loss": -7.238852500915527, "global_step": 203582, "epoch": 4847} {"train_loss": -7.338017463684082, "global_step": 203583, "epoch": 4847} {"train_loss": -7.25360107421875, "global_step": 203584, "epoch": 4847} {"train_loss": -7.351232051849365, "global_step": 203585, "epoch": 4847} {"train_loss": -7.268728256225586, "global_step": 203586, "epoch": 4847} {"train_loss": -7.3327484130859375, "global_step": 203587, "epoch": 4847} {"train_loss": -7.2411885261535645, "global_step": 203588, "epoch": 4847} {"train_loss": -7.25638484954834, "global_step": 203589, "epoch": 4847} {"train_loss": -7.3322954177856445, "global_step": 203590, "epoch": 4847} {"train_loss": -7.187339782714844, "global_step": 203591, "epoch": 4847} {"train_loss": -7.220623016357422, "global_step": 203592, "epoch": 4847} {"train_loss": -7.221723556518555, "global_step": 203593, "epoch": 4847} {"train_loss": -7.329257965087891, "global_step": 203594, "epoch": 4847} {"train_loss": -7.167384147644043, "global_step": 203595, "epoch": 4847} {"train_loss": -7.324997901916504, "global_step": 203596, "epoch": 4847} {"train_loss": -7.253040313720703, "global_step": 203597, "epoch": 4847} {"train_loss": -7.184784889221191, "global_step": 203598, "epoch": 4847} {"train_loss": -7.267441749572754, "global_step": 203599, "epoch": 4847} {"train_loss": -7.129070281982422, "global_step": 203600, "epoch": 4847} {"train_loss": -7.297910690307617, "global_step": 203601, "epoch": 4847} {"train_loss": -7.227352142333984, "global_step": 203602, "epoch": 4847} {"train_loss": -7.147326469421387, "global_step": 203603, "epoch": 4847} {"train_loss": -7.292316436767578, "global_step": 203604, "epoch": 4847} {"train_loss": -7.175750732421875, "global_step": 203605, "epoch": 4847} {"train_loss": -7.243057727813721, "global_step": 203606, "epoch": 4847} {"train_loss": -7.311160564422607, "global_step": 203607, "epoch": 4847} {"train_loss": -7.256785869598389, "global_step": 203608, "epoch": 4847} {"train_loss": -7.265392303466797, "global_step": 203609, "epoch": 4847} {"train_loss": -7.319913864135742, "global_step": 203610, "epoch": 4847} {"train_loss": -7.217350959777832, "global_step": 203611, "epoch": 4847} {"train_loss": -7.3123459815979, "global_step": 203612, "epoch": 4847} {"train_loss": -7.322112560272217, "global_step": 203613, "epoch": 4847} {"train_loss": -7.226997375488281, "global_step": 203614, "epoch": 4847} {"train_loss": -7.247398603530157, "global_step": 203615, "epoch": 4847, "val_loss": 69172.3359375} {"train_loss": -7.313971519470215, "global_step": 203616, "epoch": 4848} {"train_loss": -7.298634052276611, "global_step": 203617, "epoch": 4848} {"train_loss": -7.320379257202148, "global_step": 203618, "epoch": 4848} {"train_loss": -7.382283687591553, "global_step": 203619, "epoch": 4848} {"train_loss": -7.336427211761475, "global_step": 203620, "epoch": 4848} {"train_loss": -7.244201183319092, "global_step": 203621, "epoch": 4848} {"train_loss": -7.368349075317383, "global_step": 203622, "epoch": 4848} {"train_loss": -7.420535564422607, "global_step": 203623, "epoch": 4848} {"train_loss": -7.340773582458496, "global_step": 203624, "epoch": 4848} {"train_loss": -7.356238842010498, "global_step": 203625, "epoch": 4848} {"train_loss": -7.272394180297852, "global_step": 203626, "epoch": 4848} {"train_loss": -7.249134063720703, "global_step": 203627, "epoch": 4848} {"train_loss": -7.287985801696777, "global_step": 203628, "epoch": 4848} {"train_loss": -7.404669284820557, "global_step": 203629, "epoch": 4848} {"train_loss": -7.342251777648926, "global_step": 203630, "epoch": 4848} {"train_loss": -7.289206504821777, "global_step": 203631, "epoch": 4848} {"train_loss": -7.236276626586914, "global_step": 203632, "epoch": 4848} {"train_loss": -7.241986274719238, "global_step": 203633, "epoch": 4848} {"train_loss": -7.350991249084473, "global_step": 203634, "epoch": 4848} {"train_loss": -7.189901351928711, "global_step": 203635, "epoch": 4848} {"train_loss": -7.091917991638184, "global_step": 203636, "epoch": 4848} {"train_loss": -7.3025007247924805, "global_step": 203637, "epoch": 4848} {"train_loss": -7.264116287231445, "global_step": 203638, "epoch": 4848} {"train_loss": -7.146543502807617, "global_step": 203639, "epoch": 4848} {"train_loss": -7.29180908203125, "global_step": 203640, "epoch": 4848} {"train_loss": -7.257488250732422, "global_step": 203641, "epoch": 4848} {"train_loss": -7.142770767211914, "global_step": 203642, "epoch": 4848} {"train_loss": -7.244229793548584, "global_step": 203643, "epoch": 4848} {"train_loss": -7.0615997314453125, "global_step": 203644, "epoch": 4848} {"train_loss": -7.234757423400879, "global_step": 203645, "epoch": 4848} {"train_loss": -7.233154296875, "global_step": 203646, "epoch": 4848} {"train_loss": -7.037485122680664, "global_step": 203647, "epoch": 4848} {"train_loss": -7.22837495803833, "global_step": 203648, "epoch": 4848} {"train_loss": -7.159769535064697, "global_step": 203649, "epoch": 4848} {"train_loss": -7.147444725036621, "global_step": 203650, "epoch": 4848} {"train_loss": -7.226334095001221, "global_step": 203651, "epoch": 4848} {"train_loss": -7.1569929122924805, "global_step": 203652, "epoch": 4848} {"train_loss": -7.325526714324951, "global_step": 203653, "epoch": 4848} {"train_loss": -7.149991989135742, "global_step": 203654, "epoch": 4848} {"train_loss": -7.276885509490967, "global_step": 203655, "epoch": 4848} {"train_loss": -7.181978225708008, "global_step": 203656, "epoch": 4848} {"train_loss": -7.253456002189999, "global_step": 203657, "epoch": 4848, "val_loss": 69237.953125} {"train_loss": -7.198956489562988, "global_step": 203658, "epoch": 4849} {"train_loss": -7.109253883361816, "global_step": 203659, "epoch": 4849} {"train_loss": -7.191407203674316, "global_step": 203660, "epoch": 4849} {"train_loss": -7.179314613342285, "global_step": 203661, "epoch": 4849} {"train_loss": -7.206475257873535, "global_step": 203662, "epoch": 4849} {"train_loss": -7.1617326736450195, "global_step": 203663, "epoch": 4849} {"train_loss": -7.203330993652344, "global_step": 203664, "epoch": 4849} {"train_loss": -7.172170639038086, "global_step": 203665, "epoch": 4849} {"train_loss": -7.162642478942871, "global_step": 203666, "epoch": 4849} {"train_loss": -7.135078430175781, "global_step": 203667, "epoch": 4849} {"train_loss": -7.167453289031982, "global_step": 203668, "epoch": 4849} {"train_loss": -7.188817977905273, "global_step": 203669, "epoch": 4849} {"train_loss": -7.148629665374756, "global_step": 203670, "epoch": 4849} {"train_loss": -7.18879508972168, "global_step": 203671, "epoch": 4849} {"train_loss": -7.2023515701293945, "global_step": 203672, "epoch": 4849} {"train_loss": -7.150162220001221, "global_step": 203673, "epoch": 4849} {"train_loss": -7.313085556030273, "global_step": 203674, "epoch": 4849} {"train_loss": -7.2069091796875, "global_step": 203675, "epoch": 4849} {"train_loss": -7.19345760345459, "global_step": 203676, "epoch": 4849} {"train_loss": -7.238543510437012, "global_step": 203677, "epoch": 4849} {"train_loss": -7.321985721588135, "global_step": 203678, "epoch": 4849} {"train_loss": -7.444650650024414, "global_step": 203679, "epoch": 4849} {"train_loss": -7.223310470581055, "global_step": 203680, "epoch": 4849} {"train_loss": -7.319524765014648, "global_step": 203681, "epoch": 4849} {"train_loss": -7.164480686187744, "global_step": 203682, "epoch": 4849} {"train_loss": -7.227300643920898, "global_step": 203683, "epoch": 4849} {"train_loss": -7.299020767211914, "global_step": 203684, "epoch": 4849} {"train_loss": -7.362730979919434, "global_step": 203685, "epoch": 4849} {"train_loss": -7.284994125366211, "global_step": 203686, "epoch": 4849} {"train_loss": -7.281723499298096, "global_step": 203687, "epoch": 4849} {"train_loss": -7.366844177246094, "global_step": 203688, "epoch": 4849} {"train_loss": -7.205410957336426, "global_step": 203689, "epoch": 4849} {"train_loss": -7.174060821533203, "global_step": 203690, "epoch": 4849} {"train_loss": -7.303336143493652, "global_step": 203691, "epoch": 4849} {"train_loss": -7.271759986877441, "global_step": 203692, "epoch": 4849} {"train_loss": -7.254393577575684, "global_step": 203693, "epoch": 4849} {"train_loss": -7.331593036651611, "global_step": 203694, "epoch": 4849} {"train_loss": -7.365055084228516, "global_step": 203695, "epoch": 4849} {"train_loss": -7.2924089431762695, "global_step": 203696, "epoch": 4849} {"train_loss": -7.399445533752441, "global_step": 203697, "epoch": 4849} {"train_loss": -7.29666805267334, "global_step": 203698, "epoch": 4849} {"train_loss": -7.243994565237136, "global_step": 203699, "epoch": 4849, "val_loss": 69044.75} {"train_loss": -7.249238014221191, "global_step": 203700, "epoch": 4850} {"train_loss": -7.196591854095459, "global_step": 203701, "epoch": 4850} {"train_loss": -7.2686638832092285, "global_step": 203702, "epoch": 4850} {"train_loss": -7.34105920791626, "global_step": 203703, "epoch": 4850} {"train_loss": -7.283001899719238, "global_step": 203704, "epoch": 4850} {"train_loss": -7.345783233642578, "global_step": 203705, "epoch": 4850} {"train_loss": -7.409481525421143, "global_step": 203706, "epoch": 4850} {"train_loss": -7.38835334777832, "global_step": 203707, "epoch": 4850} {"train_loss": -7.332072734832764, "global_step": 203708, "epoch": 4850} {"train_loss": -7.331584930419922, "global_step": 203709, "epoch": 4850} {"train_loss": -7.355602264404297, "global_step": 203710, "epoch": 4850} {"train_loss": -7.331483840942383, "global_step": 203711, "epoch": 4850} {"train_loss": -7.3379669189453125, "global_step": 203712, "epoch": 4850} {"train_loss": -7.376617431640625, "global_step": 203713, "epoch": 4850} {"train_loss": -7.215420722961426, "global_step": 203714, "epoch": 4850} {"train_loss": -7.249877452850342, "global_step": 203715, "epoch": 4850} {"train_loss": -7.396925449371338, "global_step": 203716, "epoch": 4850} {"train_loss": -7.29118537902832, "global_step": 203717, "epoch": 4850} {"train_loss": -7.089066505432129, "global_step": 203718, "epoch": 4850} {"train_loss": -7.201474189758301, "global_step": 203719, "epoch": 4850} {"train_loss": -7.302516937255859, "global_step": 203720, "epoch": 4850} {"train_loss": -7.224767684936523, "global_step": 203721, "epoch": 4850} {"train_loss": -7.184569358825684, "global_step": 203722, "epoch": 4850} {"train_loss": -7.184381008148193, "global_step": 203723, "epoch": 4850} {"train_loss": -7.23046875, "global_step": 203724, "epoch": 4850} {"train_loss": -7.203166484832764, "global_step": 203725, "epoch": 4850} {"train_loss": -7.199166297912598, "global_step": 203726, "epoch": 4850} {"train_loss": -7.133617401123047, "global_step": 203727, "epoch": 4850} {"train_loss": -7.173752784729004, "global_step": 203728, "epoch": 4850} {"train_loss": -7.172109603881836, "global_step": 203729, "epoch": 4850} {"train_loss": -7.23646879196167, "global_step": 203730, "epoch": 4850} {"train_loss": -7.016930103302002, "global_step": 203731, "epoch": 4850} {"train_loss": -7.090081214904785, "global_step": 203732, "epoch": 4850} {"train_loss": -7.186278343200684, "global_step": 203733, "epoch": 4850} {"train_loss": -7.195958137512207, "global_step": 203734, "epoch": 4850} {"train_loss": -7.193563461303711, "global_step": 203735, "epoch": 4850} {"train_loss": -7.1191864013671875, "global_step": 203736, "epoch": 4850} {"train_loss": -7.198822021484375, "global_step": 203737, "epoch": 4850} {"train_loss": -7.232253074645996, "global_step": 203738, "epoch": 4850} {"train_loss": -7.22977352142334, "global_step": 203739, "epoch": 4850} {"train_loss": -7.125777721405029, "global_step": 203740, "epoch": 4850} {"train_loss": -7.2405058997018, "global_step": 203741, "epoch": 4850, "train/sim_max_reward_0": 0.8761609630380632, "train/sim_max_reward_1": 0.9611203973272421, "train/sim_max_reward_2": 0.6367710413599593, "train/sim_max_reward_3": 0.13304967451120062, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.958133537897159, "test/sim_max_reward_4400000": 0.9791460073890673, "test/sim_max_reward_4400001": 0.29914580480222575, "test/sim_max_reward_4400002": 0.18742792465866995, "test/sim_max_reward_4400003": 0.9648111663527299, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.34831267563291646, "test/sim_max_reward_4400006": 0.9957361588623148, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.3020524185395672, "test/sim_max_reward_4400009": 0.9885656862712219, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.3324538938265599, "test/sim_max_reward_4400012": 0.9543038037071286, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.910819368576089, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.8536793061428609, "test/sim_max_reward_4400018": 0.28642492322567764, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9155043404901015, "test/sim_max_reward_4400023": 0.978516889884784, "test/sim_max_reward_4400024": 0.9535518640977714, "test/sim_max_reward_4400025": 0.27608490485242915, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.0002535949793324634, "test/sim_max_reward_4400028": 0.5928861922918237, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9783210665865957, "test/sim_max_reward_4400031": 0.9649344924997634, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.4499241531758389, "test/sim_max_reward_4400036": 0.8850733805138827, "test/sim_max_reward_4400037": 0.8814355612497826, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9896119074577509, "test/sim_max_reward_4400042": 0.5154001364303938, "test/sim_max_reward_4400043": 0.9642844398890869, "test/sim_max_reward_4400044": 0.9284638750511559, "test/sim_max_reward_4400045": 0.947089260070556, "test/sim_max_reward_4400046": 0.38742038455885836, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.760872602355604, "test/mean_score": 0.5718900029893519, "val_loss": 68990.4921875} {"train_loss": -7.267086029052734, "global_step": 203742, "epoch": 4851} {"train_loss": -7.2703752517700195, "global_step": 203743, "epoch": 4851} {"train_loss": -7.209616661071777, "global_step": 203744, "epoch": 4851} {"train_loss": -7.259555339813232, "global_step": 203745, "epoch": 4851} {"train_loss": -7.355831623077393, "global_step": 203746, "epoch": 4851} {"train_loss": -7.268993377685547, "global_step": 203747, "epoch": 4851} {"train_loss": -7.256446361541748, "global_step": 203748, "epoch": 4851} {"train_loss": -7.288469314575195, "global_step": 203749, "epoch": 4851} {"train_loss": -7.1969757080078125, "global_step": 203750, "epoch": 4851} {"train_loss": -7.385044097900391, "global_step": 203751, "epoch": 4851} {"train_loss": -7.085338592529297, "global_step": 203752, "epoch": 4851} {"train_loss": -7.3003740310668945, "global_step": 203753, "epoch": 4851} {"train_loss": -7.223838806152344, "global_step": 203754, "epoch": 4851} {"train_loss": -7.098055839538574, "global_step": 203755, "epoch": 4851} {"train_loss": -7.348637580871582, "global_step": 203756, "epoch": 4851} {"train_loss": -7.226428031921387, "global_step": 203757, "epoch": 4851} {"train_loss": -7.358886241912842, "global_step": 203758, "epoch": 4851} {"train_loss": -7.3325934410095215, "global_step": 203759, "epoch": 4851} {"train_loss": -7.246463775634766, "global_step": 203760, "epoch": 4851} {"train_loss": -7.337068557739258, "global_step": 203761, "epoch": 4851} {"train_loss": -7.2360076904296875, "global_step": 203762, "epoch": 4851} {"train_loss": -7.169462203979492, "global_step": 203763, "epoch": 4851} {"train_loss": -7.463967323303223, "global_step": 203764, "epoch": 4851} {"train_loss": -7.16533899307251, "global_step": 203765, "epoch": 4851} {"train_loss": -7.343733787536621, "global_step": 203766, "epoch": 4851} {"train_loss": -7.2930121421813965, "global_step": 203767, "epoch": 4851} {"train_loss": -7.312238693237305, "global_step": 203768, "epoch": 4851} {"train_loss": -7.391236782073975, "global_step": 203769, "epoch": 4851} {"train_loss": -7.321622848510742, "global_step": 203770, "epoch": 4851} {"train_loss": -7.239062309265137, "global_step": 203771, "epoch": 4851} {"train_loss": -7.20543098449707, "global_step": 203772, "epoch": 4851} {"train_loss": -7.217532157897949, "global_step": 203773, "epoch": 4851} {"train_loss": -7.285139083862305, "global_step": 203774, "epoch": 4851} {"train_loss": -7.156233787536621, "global_step": 203775, "epoch": 4851} {"train_loss": -7.2757568359375, "global_step": 203776, "epoch": 4851} {"train_loss": -7.370126247406006, "global_step": 203777, "epoch": 4851} {"train_loss": -7.211950778961182, "global_step": 203778, "epoch": 4851} {"train_loss": -7.24503755569458, "global_step": 203779, "epoch": 4851} {"train_loss": -7.235918998718262, "global_step": 203780, "epoch": 4851} {"train_loss": -7.208564758300781, "global_step": 203781, "epoch": 4851} {"train_loss": -7.259920597076416, "global_step": 203782, "epoch": 4851} {"train_loss": -7.265958172934396, "global_step": 203783, "epoch": 4851, "val_loss": 69288.8984375} {"train_loss": -7.359375953674316, "global_step": 203784, "epoch": 4852} {"train_loss": -7.179045677185059, "global_step": 203785, "epoch": 4852} {"train_loss": -7.302237510681152, "global_step": 203786, "epoch": 4852} {"train_loss": -7.35106086730957, "global_step": 203787, "epoch": 4852} {"train_loss": -7.217099189758301, "global_step": 203788, "epoch": 4852} {"train_loss": -7.235276222229004, "global_step": 203789, "epoch": 4852} {"train_loss": -7.292558193206787, "global_step": 203790, "epoch": 4852} {"train_loss": -7.276257514953613, "global_step": 203791, "epoch": 4852} {"train_loss": -7.210452079772949, "global_step": 203792, "epoch": 4852} {"train_loss": -7.171929836273193, "global_step": 203793, "epoch": 4852} {"train_loss": -7.403959274291992, "global_step": 203794, "epoch": 4852} {"train_loss": -7.274262428283691, "global_step": 203795, "epoch": 4852} {"train_loss": -7.244635105133057, "global_step": 203796, "epoch": 4852} {"train_loss": -7.230557441711426, "global_step": 203797, "epoch": 4852} {"train_loss": -7.217505931854248, "global_step": 203798, "epoch": 4852} {"train_loss": -7.333340167999268, "global_step": 203799, "epoch": 4852} {"train_loss": -7.188208103179932, "global_step": 203800, "epoch": 4852} {"train_loss": -7.221437454223633, "global_step": 203801, "epoch": 4852} {"train_loss": -7.177908897399902, "global_step": 203802, "epoch": 4852} {"train_loss": -7.202880859375, "global_step": 203803, "epoch": 4852} {"train_loss": -7.332508087158203, "global_step": 203804, "epoch": 4852} {"train_loss": -7.2685980796813965, "global_step": 203805, "epoch": 4852} {"train_loss": -7.228762626647949, "global_step": 203806, "epoch": 4852} {"train_loss": -7.288250923156738, "global_step": 203807, "epoch": 4852} {"train_loss": -7.232354640960693, "global_step": 203808, "epoch": 4852} {"train_loss": -7.287922382354736, "global_step": 203809, "epoch": 4852} {"train_loss": -7.181492805480957, "global_step": 203810, "epoch": 4852} {"train_loss": -7.217641830444336, "global_step": 203811, "epoch": 4852} {"train_loss": -7.2882161140441895, "global_step": 203812, "epoch": 4852} {"train_loss": -7.20508337020874, "global_step": 203813, "epoch": 4852} {"train_loss": -7.219888687133789, "global_step": 203814, "epoch": 4852} {"train_loss": -7.110666275024414, "global_step": 203815, "epoch": 4852} {"train_loss": -7.261142730712891, "global_step": 203816, "epoch": 4852} {"train_loss": -7.249366283416748, "global_step": 203817, "epoch": 4852} {"train_loss": -7.3193159103393555, "global_step": 203818, "epoch": 4852} {"train_loss": -7.245094299316406, "global_step": 203819, "epoch": 4852} {"train_loss": -7.208988189697266, "global_step": 203820, "epoch": 4852} {"train_loss": -7.265032768249512, "global_step": 203821, "epoch": 4852} {"train_loss": -7.287156581878662, "global_step": 203822, "epoch": 4852} {"train_loss": -7.39154577255249, "global_step": 203823, "epoch": 4852} {"train_loss": -7.318386554718018, "global_step": 203824, "epoch": 4852} {"train_loss": -7.253362053916568, "global_step": 203825, "epoch": 4852, "val_loss": 69037.2109375} {"train_loss": -7.345745086669922, "global_step": 203826, "epoch": 4853} {"train_loss": -7.212533950805664, "global_step": 203827, "epoch": 4853} {"train_loss": -7.194191932678223, "global_step": 203828, "epoch": 4853} {"train_loss": -7.305210590362549, "global_step": 203829, "epoch": 4853} {"train_loss": -7.217554092407227, "global_step": 203830, "epoch": 4853} {"train_loss": -7.250739097595215, "global_step": 203831, "epoch": 4853} {"train_loss": -7.281579971313477, "global_step": 203832, "epoch": 4853} {"train_loss": -7.120169639587402, "global_step": 203833, "epoch": 4853} {"train_loss": -7.250154495239258, "global_step": 203834, "epoch": 4853} {"train_loss": -7.163519859313965, "global_step": 203835, "epoch": 4853} {"train_loss": -7.306218147277832, "global_step": 203836, "epoch": 4853} {"train_loss": -7.195757865905762, "global_step": 203837, "epoch": 4853} {"train_loss": -7.265892028808594, "global_step": 203838, "epoch": 4853} {"train_loss": -7.149679183959961, "global_step": 203839, "epoch": 4853} {"train_loss": -7.153759956359863, "global_step": 203840, "epoch": 4853} {"train_loss": -7.235760688781738, "global_step": 203841, "epoch": 4853} {"train_loss": -7.21450138092041, "global_step": 203842, "epoch": 4853} {"train_loss": -7.194437503814697, "global_step": 203843, "epoch": 4853} {"train_loss": -7.166904926300049, "global_step": 203844, "epoch": 4853} {"train_loss": -7.149250030517578, "global_step": 203845, "epoch": 4853} {"train_loss": -7.348731994628906, "global_step": 203846, "epoch": 4853} {"train_loss": -7.145474433898926, "global_step": 203847, "epoch": 4853} {"train_loss": -7.189325332641602, "global_step": 203848, "epoch": 4853} {"train_loss": -7.269493579864502, "global_step": 203849, "epoch": 4853} {"train_loss": -7.2162861824035645, "global_step": 203850, "epoch": 4853} {"train_loss": -7.085651874542236, "global_step": 203851, "epoch": 4853} {"train_loss": -7.227694034576416, "global_step": 203852, "epoch": 4853} {"train_loss": -7.265702247619629, "global_step": 203853, "epoch": 4853} {"train_loss": -7.17594575881958, "global_step": 203854, "epoch": 4853} {"train_loss": -7.298174858093262, "global_step": 203855, "epoch": 4853} {"train_loss": -7.159083366394043, "global_step": 203856, "epoch": 4853} {"train_loss": -7.156750679016113, "global_step": 203857, "epoch": 4853} {"train_loss": -7.252569675445557, "global_step": 203858, "epoch": 4853} {"train_loss": -7.133134841918945, "global_step": 203859, "epoch": 4853} {"train_loss": -7.14785099029541, "global_step": 203860, "epoch": 4853} {"train_loss": -7.170894622802734, "global_step": 203861, "epoch": 4853} {"train_loss": -7.19130802154541, "global_step": 203862, "epoch": 4853} {"train_loss": -7.113327503204346, "global_step": 203863, "epoch": 4853} {"train_loss": -7.147330284118652, "global_step": 203864, "epoch": 4853} {"train_loss": -7.230556488037109, "global_step": 203865, "epoch": 4853} {"train_loss": -7.204771041870117, "global_step": 203866, "epoch": 4853} {"train_loss": -7.20828804515657, "global_step": 203867, "epoch": 4853, "val_loss": 69220.609375} {"train_loss": -7.146855354309082, "global_step": 203868, "epoch": 4854} {"train_loss": -7.271164894104004, "global_step": 203869, "epoch": 4854} {"train_loss": -7.207061767578125, "global_step": 203870, "epoch": 4854} {"train_loss": -7.209904670715332, "global_step": 203871, "epoch": 4854} {"train_loss": -7.354254722595215, "global_step": 203872, "epoch": 4854} {"train_loss": -7.097586631774902, "global_step": 203873, "epoch": 4854} {"train_loss": -7.241020202636719, "global_step": 203874, "epoch": 4854} {"train_loss": -7.262903213500977, "global_step": 203875, "epoch": 4854} {"train_loss": -7.195921897888184, "global_step": 203876, "epoch": 4854} {"train_loss": -7.29324197769165, "global_step": 203877, "epoch": 4854} {"train_loss": -7.339295387268066, "global_step": 203878, "epoch": 4854} {"train_loss": -7.337577819824219, "global_step": 203879, "epoch": 4854} {"train_loss": -7.360198974609375, "global_step": 203880, "epoch": 4854} {"train_loss": -7.228673934936523, "global_step": 203881, "epoch": 4854} {"train_loss": -7.232998371124268, "global_step": 203882, "epoch": 4854} {"train_loss": -7.331007480621338, "global_step": 203883, "epoch": 4854} {"train_loss": -7.294075012207031, "global_step": 203884, "epoch": 4854} {"train_loss": -7.218075752258301, "global_step": 203885, "epoch": 4854} {"train_loss": -7.355477809906006, "global_step": 203886, "epoch": 4854} {"train_loss": -7.336334228515625, "global_step": 203887, "epoch": 4854} {"train_loss": -7.264449119567871, "global_step": 203888, "epoch": 4854} {"train_loss": -7.275379180908203, "global_step": 203889, "epoch": 4854} {"train_loss": -7.347094535827637, "global_step": 203890, "epoch": 4854} {"train_loss": -7.2580952644348145, "global_step": 203891, "epoch": 4854} {"train_loss": -7.372507572174072, "global_step": 203892, "epoch": 4854} {"train_loss": -7.243307113647461, "global_step": 203893, "epoch": 4854} {"train_loss": -7.199285507202148, "global_step": 203894, "epoch": 4854} {"train_loss": -7.357553958892822, "global_step": 203895, "epoch": 4854} {"train_loss": -7.361063003540039, "global_step": 203896, "epoch": 4854} {"train_loss": -7.2939558029174805, "global_step": 203897, "epoch": 4854} {"train_loss": -7.321864128112793, "global_step": 203898, "epoch": 4854} {"train_loss": -7.237974643707275, "global_step": 203899, "epoch": 4854} {"train_loss": -7.202760696411133, "global_step": 203900, "epoch": 4854} {"train_loss": -7.34768009185791, "global_step": 203901, "epoch": 4854} {"train_loss": -7.417218208312988, "global_step": 203902, "epoch": 4854} {"train_loss": -7.301065921783447, "global_step": 203903, "epoch": 4854} {"train_loss": -7.265775680541992, "global_step": 203904, "epoch": 4854} {"train_loss": -7.386822700500488, "global_step": 203905, "epoch": 4854} {"train_loss": -7.280195236206055, "global_step": 203906, "epoch": 4854} {"train_loss": -7.334836483001709, "global_step": 203907, "epoch": 4854} {"train_loss": -7.233827590942383, "global_step": 203908, "epoch": 4854} {"train_loss": -7.284327756790888, "global_step": 203909, "epoch": 4854, "val_loss": 68996.0625} {"train_loss": -7.313899993896484, "global_step": 203910, "epoch": 4855} {"train_loss": -7.324334621429443, "global_step": 203911, "epoch": 4855} {"train_loss": -7.262202262878418, "global_step": 203912, "epoch": 4855} {"train_loss": -7.371118068695068, "global_step": 203913, "epoch": 4855} {"train_loss": -7.305087089538574, "global_step": 203914, "epoch": 4855} {"train_loss": -7.260984420776367, "global_step": 203915, "epoch": 4855} {"train_loss": -7.166258811950684, "global_step": 203916, "epoch": 4855} {"train_loss": -7.278744220733643, "global_step": 203917, "epoch": 4855} {"train_loss": -7.218678951263428, "global_step": 203918, "epoch": 4855} {"train_loss": -7.224900245666504, "global_step": 203919, "epoch": 4855} {"train_loss": -7.286044120788574, "global_step": 203920, "epoch": 4855} {"train_loss": -7.308175086975098, "global_step": 203921, "epoch": 4855} {"train_loss": -7.309595584869385, "global_step": 203922, "epoch": 4855} {"train_loss": -7.259640693664551, "global_step": 203923, "epoch": 4855} {"train_loss": -7.230539798736572, "global_step": 203924, "epoch": 4855} {"train_loss": -7.3250837326049805, "global_step": 203925, "epoch": 4855} {"train_loss": -7.342266082763672, "global_step": 203926, "epoch": 4855} {"train_loss": -7.224031925201416, "global_step": 203927, "epoch": 4855} {"train_loss": -7.38447380065918, "global_step": 203928, "epoch": 4855} {"train_loss": -7.190071105957031, "global_step": 203929, "epoch": 4855} {"train_loss": -7.296788692474365, "global_step": 203930, "epoch": 4855} {"train_loss": -7.288128852844238, "global_step": 203931, "epoch": 4855} {"train_loss": -7.383944511413574, "global_step": 203932, "epoch": 4855} {"train_loss": -7.24420166015625, "global_step": 203933, "epoch": 4855} {"train_loss": -7.269144058227539, "global_step": 203934, "epoch": 4855} {"train_loss": -7.307793617248535, "global_step": 203935, "epoch": 4855} {"train_loss": -7.3099565505981445, "global_step": 203936, "epoch": 4855} {"train_loss": -7.2686309814453125, "global_step": 203937, "epoch": 4855} {"train_loss": -7.3444647789001465, "global_step": 203938, "epoch": 4855} {"train_loss": -7.244251251220703, "global_step": 203939, "epoch": 4855} {"train_loss": -7.304904937744141, "global_step": 203940, "epoch": 4855} {"train_loss": -7.254384517669678, "global_step": 203941, "epoch": 4855} {"train_loss": -7.228974342346191, "global_step": 203942, "epoch": 4855} {"train_loss": -7.186603546142578, "global_step": 203943, "epoch": 4855} {"train_loss": -7.326629638671875, "global_step": 203944, "epoch": 4855} {"train_loss": -7.238376617431641, "global_step": 203945, "epoch": 4855} {"train_loss": -7.212088584899902, "global_step": 203946, "epoch": 4855} {"train_loss": -7.225734710693359, "global_step": 203947, "epoch": 4855} {"train_loss": -7.333596229553223, "global_step": 203948, "epoch": 4855} {"train_loss": -7.11564302444458, "global_step": 203949, "epoch": 4855} {"train_loss": -7.248866558074951, "global_step": 203950, "epoch": 4855} {"train_loss": -7.268398818515596, "global_step": 203951, "epoch": 4855, "val_loss": 69227.625} {"train_loss": -7.378979682922363, "global_step": 203952, "epoch": 4856} {"train_loss": -7.162161827087402, "global_step": 203953, "epoch": 4856} {"train_loss": -7.185556411743164, "global_step": 203954, "epoch": 4856} {"train_loss": -7.28541374206543, "global_step": 203955, "epoch": 4856} {"train_loss": -7.2500224113464355, "global_step": 203956, "epoch": 4856} {"train_loss": -7.227849006652832, "global_step": 203957, "epoch": 4856} {"train_loss": -7.235751152038574, "global_step": 203958, "epoch": 4856} {"train_loss": -7.283186435699463, "global_step": 203959, "epoch": 4856} {"train_loss": -7.220246315002441, "global_step": 203960, "epoch": 4856} {"train_loss": -7.303646087646484, "global_step": 203961, "epoch": 4856} {"train_loss": -7.241533279418945, "global_step": 203962, "epoch": 4856} {"train_loss": -7.212718486785889, "global_step": 203963, "epoch": 4856} {"train_loss": -7.16174840927124, "global_step": 203964, "epoch": 4856} {"train_loss": -7.15358829498291, "global_step": 203965, "epoch": 4856} {"train_loss": -7.281618595123291, "global_step": 203966, "epoch": 4856} {"train_loss": -7.201018810272217, "global_step": 203967, "epoch": 4856} {"train_loss": -7.264382362365723, "global_step": 203968, "epoch": 4856} {"train_loss": -7.258626461029053, "global_step": 203969, "epoch": 4856} {"train_loss": -7.308135032653809, "global_step": 203970, "epoch": 4856} {"train_loss": -7.332221984863281, "global_step": 203971, "epoch": 4856} {"train_loss": -7.351093292236328, "global_step": 203972, "epoch": 4856} {"train_loss": -7.218301773071289, "global_step": 203973, "epoch": 4856} {"train_loss": -7.366927146911621, "global_step": 203974, "epoch": 4856} {"train_loss": -7.326797008514404, "global_step": 203975, "epoch": 4856} {"train_loss": -7.217768669128418, "global_step": 203976, "epoch": 4856} {"train_loss": -7.295812606811523, "global_step": 203977, "epoch": 4856} {"train_loss": -7.217144012451172, "global_step": 203978, "epoch": 4856} {"train_loss": -7.172151565551758, "global_step": 203979, "epoch": 4856} {"train_loss": -7.292228698730469, "global_step": 203980, "epoch": 4856} {"train_loss": -7.132635593414307, "global_step": 203981, "epoch": 4856} {"train_loss": -7.260956764221191, "global_step": 203982, "epoch": 4856} {"train_loss": -7.236662864685059, "global_step": 203983, "epoch": 4856} {"train_loss": -7.263622760772705, "global_step": 203984, "epoch": 4856} {"train_loss": -7.23173189163208, "global_step": 203985, "epoch": 4856} {"train_loss": -7.271350860595703, "global_step": 203986, "epoch": 4856} {"train_loss": -7.18904972076416, "global_step": 203987, "epoch": 4856} {"train_loss": -7.058059215545654, "global_step": 203988, "epoch": 4856} {"train_loss": -7.172611236572266, "global_step": 203989, "epoch": 4856} {"train_loss": -7.239995002746582, "global_step": 203990, "epoch": 4856} {"train_loss": -7.152544021606445, "global_step": 203991, "epoch": 4856} {"train_loss": -7.210103988647461, "global_step": 203992, "epoch": 4856} {"train_loss": -7.2375981240045455, "global_step": 203993, "epoch": 4856, "val_loss": 69224.78125} {"train_loss": -7.191428184509277, "global_step": 203994, "epoch": 4857} {"train_loss": -7.254176139831543, "global_step": 203995, "epoch": 4857} {"train_loss": -7.018996238708496, "global_step": 203996, "epoch": 4857} {"train_loss": -7.245251178741455, "global_step": 203997, "epoch": 4857} {"train_loss": -7.142651081085205, "global_step": 203998, "epoch": 4857} {"train_loss": -7.122533321380615, "global_step": 203999, "epoch": 4857} {"train_loss": -7.180380821228027, "global_step": 204000, "epoch": 4857} {"train_loss": -7.098426342010498, "global_step": 204001, "epoch": 4857} {"train_loss": -7.143112659454346, "global_step": 204002, "epoch": 4857} {"train_loss": -7.131686210632324, "global_step": 204003, "epoch": 4857} {"train_loss": -7.108663082122803, "global_step": 204004, "epoch": 4857} {"train_loss": -7.224357604980469, "global_step": 204005, "epoch": 4857} {"train_loss": -7.170900344848633, "global_step": 204006, "epoch": 4857} {"train_loss": -7.188884258270264, "global_step": 204007, "epoch": 4857} {"train_loss": -7.162501811981201, "global_step": 204008, "epoch": 4857} {"train_loss": -7.219707489013672, "global_step": 204009, "epoch": 4857} {"train_loss": -7.204178810119629, "global_step": 204010, "epoch": 4857} {"train_loss": -7.199268341064453, "global_step": 204011, "epoch": 4857} {"train_loss": -7.2099528312683105, "global_step": 204012, "epoch": 4857} {"train_loss": -7.208203315734863, "global_step": 204013, "epoch": 4857} {"train_loss": -7.263587474822998, "global_step": 204014, "epoch": 4857} {"train_loss": -7.324887752532959, "global_step": 204015, "epoch": 4857} {"train_loss": -7.285641193389893, "global_step": 204016, "epoch": 4857} {"train_loss": -7.318327903747559, "global_step": 204017, "epoch": 4857} {"train_loss": -7.2975640296936035, "global_step": 204018, "epoch": 4857} {"train_loss": -7.315338134765625, "global_step": 204019, "epoch": 4857} {"train_loss": -7.272730827331543, "global_step": 204020, "epoch": 4857} {"train_loss": -7.341041088104248, "global_step": 204021, "epoch": 4857} {"train_loss": -7.363622665405273, "global_step": 204022, "epoch": 4857} {"train_loss": -7.401174545288086, "global_step": 204023, "epoch": 4857} {"train_loss": -7.397751808166504, "global_step": 204024, "epoch": 4857} {"train_loss": -7.323798179626465, "global_step": 204025, "epoch": 4857} {"train_loss": -7.287955284118652, "global_step": 204026, "epoch": 4857} {"train_loss": -7.369917869567871, "global_step": 204027, "epoch": 4857} {"train_loss": -7.315337181091309, "global_step": 204028, "epoch": 4857} {"train_loss": -7.393725395202637, "global_step": 204029, "epoch": 4857} {"train_loss": -7.397333145141602, "global_step": 204030, "epoch": 4857} {"train_loss": -7.3237199783325195, "global_step": 204031, "epoch": 4857} {"train_loss": -7.44616174697876, "global_step": 204032, "epoch": 4857} {"train_loss": -7.278656959533691, "global_step": 204033, "epoch": 4857} {"train_loss": -7.417804718017578, "global_step": 204034, "epoch": 4857} {"train_loss": -7.261293751852853, "global_step": 204035, "epoch": 4857, "val_loss": 68978.4609375} {"train_loss": -7.3966064453125, "global_step": 204036, "epoch": 4858} {"train_loss": -7.318571090698242, "global_step": 204037, "epoch": 4858} {"train_loss": -7.286775588989258, "global_step": 204038, "epoch": 4858} {"train_loss": -7.292238235473633, "global_step": 204039, "epoch": 4858} {"train_loss": -7.365189552307129, "global_step": 204040, "epoch": 4858} {"train_loss": -7.282534599304199, "global_step": 204041, "epoch": 4858} {"train_loss": -7.358221054077148, "global_step": 204042, "epoch": 4858} {"train_loss": -7.239591598510742, "global_step": 204043, "epoch": 4858} {"train_loss": -7.4210004806518555, "global_step": 204044, "epoch": 4858} {"train_loss": -7.2672319412231445, "global_step": 204045, "epoch": 4858} {"train_loss": -7.3925089836120605, "global_step": 204046, "epoch": 4858} {"train_loss": -7.244961261749268, "global_step": 204047, "epoch": 4858} {"train_loss": -7.334930419921875, "global_step": 204048, "epoch": 4858} {"train_loss": -7.0818915367126465, "global_step": 204049, "epoch": 4858} {"train_loss": -7.249131202697754, "global_step": 204050, "epoch": 4858} {"train_loss": -7.341073036193848, "global_step": 204051, "epoch": 4858} {"train_loss": -7.205892562866211, "global_step": 204052, "epoch": 4858} {"train_loss": -7.253186225891113, "global_step": 204053, "epoch": 4858} {"train_loss": -7.279327392578125, "global_step": 204054, "epoch": 4858} {"train_loss": -7.226407051086426, "global_step": 204055, "epoch": 4858} {"train_loss": -7.351842880249023, "global_step": 204056, "epoch": 4858} {"train_loss": -7.274572372436523, "global_step": 204057, "epoch": 4858} {"train_loss": -7.2335028648376465, "global_step": 204058, "epoch": 4858} {"train_loss": -7.366153717041016, "global_step": 204059, "epoch": 4858} {"train_loss": -7.170526504516602, "global_step": 204060, "epoch": 4858} {"train_loss": -7.193370819091797, "global_step": 204061, "epoch": 4858} {"train_loss": -7.224526405334473, "global_step": 204062, "epoch": 4858} {"train_loss": -7.277117729187012, "global_step": 204063, "epoch": 4858} {"train_loss": -7.2372355461120605, "global_step": 204064, "epoch": 4858} {"train_loss": -7.213403701782227, "global_step": 204065, "epoch": 4858} {"train_loss": -7.27835750579834, "global_step": 204066, "epoch": 4858} {"train_loss": -7.317842960357666, "global_step": 204067, "epoch": 4858} {"train_loss": -7.341299533843994, "global_step": 204068, "epoch": 4858} {"train_loss": -7.265203475952148, "global_step": 204069, "epoch": 4858} {"train_loss": -7.216977119445801, "global_step": 204070, "epoch": 4858} {"train_loss": -7.301059722900391, "global_step": 204071, "epoch": 4858} {"train_loss": -7.178250312805176, "global_step": 204072, "epoch": 4858} {"train_loss": -7.330549240112305, "global_step": 204073, "epoch": 4858} {"train_loss": -7.174352645874023, "global_step": 204074, "epoch": 4858} {"train_loss": -7.336745262145996, "global_step": 204075, "epoch": 4858} {"train_loss": -7.365467071533203, "global_step": 204076, "epoch": 4858} {"train_loss": -7.280154421215966, "global_step": 204077, "epoch": 4858, "val_loss": 69098.1328125} {"train_loss": -7.2734055519104, "global_step": 204078, "epoch": 4859} {"train_loss": -7.310938835144043, "global_step": 204079, "epoch": 4859} {"train_loss": -7.215081214904785, "global_step": 204080, "epoch": 4859} {"train_loss": -7.3310651779174805, "global_step": 204081, "epoch": 4859} {"train_loss": -7.262478828430176, "global_step": 204082, "epoch": 4859} {"train_loss": -7.11334753036499, "global_step": 204083, "epoch": 4859} {"train_loss": -7.276908874511719, "global_step": 204084, "epoch": 4859} {"train_loss": -7.19779109954834, "global_step": 204085, "epoch": 4859} {"train_loss": -7.226747512817383, "global_step": 204086, "epoch": 4859} {"train_loss": -7.3102288246154785, "global_step": 204087, "epoch": 4859} {"train_loss": -7.238090515136719, "global_step": 204088, "epoch": 4859} {"train_loss": -7.193641185760498, "global_step": 204089, "epoch": 4859} {"train_loss": -7.168734550476074, "global_step": 204090, "epoch": 4859} {"train_loss": -7.212968826293945, "global_step": 204091, "epoch": 4859} {"train_loss": -7.188722133636475, "global_step": 204092, "epoch": 4859} {"train_loss": -7.179369926452637, "global_step": 204093, "epoch": 4859} {"train_loss": -7.180205821990967, "global_step": 204094, "epoch": 4859} {"train_loss": -7.338805198669434, "global_step": 204095, "epoch": 4859} {"train_loss": -7.202126502990723, "global_step": 204096, "epoch": 4859} {"train_loss": -7.160285949707031, "global_step": 204097, "epoch": 4859} {"train_loss": -7.310201168060303, "global_step": 204098, "epoch": 4859} {"train_loss": -7.229100227355957, "global_step": 204099, "epoch": 4859} {"train_loss": -7.193730354309082, "global_step": 204100, "epoch": 4859} {"train_loss": -7.318393707275391, "global_step": 204101, "epoch": 4859} {"train_loss": -7.084629058837891, "global_step": 204102, "epoch": 4859} {"train_loss": -7.132696151733398, "global_step": 204103, "epoch": 4859} {"train_loss": -7.122900009155273, "global_step": 204104, "epoch": 4859} {"train_loss": -7.095965385437012, "global_step": 204105, "epoch": 4859} {"train_loss": -7.2611894607543945, "global_step": 204106, "epoch": 4859} {"train_loss": -7.040968418121338, "global_step": 204107, "epoch": 4859} {"train_loss": -7.025320529937744, "global_step": 204108, "epoch": 4859} {"train_loss": -7.168061256408691, "global_step": 204109, "epoch": 4859} {"train_loss": -7.1743292808532715, "global_step": 204110, "epoch": 4859} {"train_loss": -7.155617713928223, "global_step": 204111, "epoch": 4859} {"train_loss": -7.086711883544922, "global_step": 204112, "epoch": 4859} {"train_loss": -7.2531256675720215, "global_step": 204113, "epoch": 4859} {"train_loss": -7.130504608154297, "global_step": 204114, "epoch": 4859} {"train_loss": -7.272029399871826, "global_step": 204115, "epoch": 4859} {"train_loss": -7.14202356338501, "global_step": 204116, "epoch": 4859} {"train_loss": -7.200923442840576, "global_step": 204117, "epoch": 4859} {"train_loss": -7.178752422332764, "global_step": 204118, "epoch": 4859} {"train_loss": -7.201463506335304, "global_step": 204119, "epoch": 4859, "val_loss": 69167.0} {"train_loss": -7.298702239990234, "global_step": 204120, "epoch": 4860} {"train_loss": -7.2674713134765625, "global_step": 204121, "epoch": 4860} {"train_loss": -7.195120334625244, "global_step": 204122, "epoch": 4860} {"train_loss": -7.191680431365967, "global_step": 204123, "epoch": 4860} {"train_loss": -7.22066593170166, "global_step": 204124, "epoch": 4860} {"train_loss": -7.126349449157715, "global_step": 204125, "epoch": 4860} {"train_loss": -7.269512176513672, "global_step": 204126, "epoch": 4860} {"train_loss": -7.119918346405029, "global_step": 204127, "epoch": 4860} {"train_loss": -7.267437934875488, "global_step": 204128, "epoch": 4860} {"train_loss": -7.270343780517578, "global_step": 204129, "epoch": 4860} {"train_loss": -7.15492057800293, "global_step": 204130, "epoch": 4860} {"train_loss": -7.178912162780762, "global_step": 204131, "epoch": 4860} {"train_loss": -7.211550712585449, "global_step": 204132, "epoch": 4860} {"train_loss": -7.218321800231934, "global_step": 204133, "epoch": 4860} {"train_loss": -7.2342071533203125, "global_step": 204134, "epoch": 4860} {"train_loss": -7.182390213012695, "global_step": 204135, "epoch": 4860} {"train_loss": -7.20300817489624, "global_step": 204136, "epoch": 4860} {"train_loss": -7.176450729370117, "global_step": 204137, "epoch": 4860} {"train_loss": -7.169843673706055, "global_step": 204138, "epoch": 4860} {"train_loss": -7.251322269439697, "global_step": 204139, "epoch": 4860} {"train_loss": -7.215793132781982, "global_step": 204140, "epoch": 4860} {"train_loss": -7.2595720291137695, "global_step": 204141, "epoch": 4860} {"train_loss": -7.2471923828125, "global_step": 204142, "epoch": 4860} {"train_loss": -7.288529872894287, "global_step": 204143, "epoch": 4860} {"train_loss": -7.265270709991455, "global_step": 204144, "epoch": 4860} {"train_loss": -7.27562141418457, "global_step": 204145, "epoch": 4860} {"train_loss": -7.262747764587402, "global_step": 204146, "epoch": 4860} {"train_loss": -7.286139011383057, "global_step": 204147, "epoch": 4860} {"train_loss": -7.174777030944824, "global_step": 204148, "epoch": 4860} {"train_loss": -7.327465057373047, "global_step": 204149, "epoch": 4860} {"train_loss": -7.19126033782959, "global_step": 204150, "epoch": 4860} {"train_loss": -7.289404392242432, "global_step": 204151, "epoch": 4860} {"train_loss": -7.236992359161377, "global_step": 204152, "epoch": 4860} {"train_loss": -7.152740478515625, "global_step": 204153, "epoch": 4860} {"train_loss": -7.202729225158691, "global_step": 204154, "epoch": 4860} {"train_loss": -7.35151481628418, "global_step": 204155, "epoch": 4860} {"train_loss": -7.276547908782959, "global_step": 204156, "epoch": 4860} {"train_loss": -7.2628631591796875, "global_step": 204157, "epoch": 4860} {"train_loss": -7.212408065795898, "global_step": 204158, "epoch": 4860} {"train_loss": -7.353821277618408, "global_step": 204159, "epoch": 4860} {"train_loss": -7.26438045501709, "global_step": 204160, "epoch": 4860} {"train_loss": -7.236029613585699, "global_step": 204161, "epoch": 4860, "val_loss": 69027.1953125} {"train_loss": -7.304617881774902, "global_step": 204162, "epoch": 4861} {"train_loss": -7.343744277954102, "global_step": 204163, "epoch": 4861} {"train_loss": -7.275475025177002, "global_step": 204164, "epoch": 4861} {"train_loss": -7.344066619873047, "global_step": 204165, "epoch": 4861} {"train_loss": -7.254997253417969, "global_step": 204166, "epoch": 4861} {"train_loss": -7.256154537200928, "global_step": 204167, "epoch": 4861} {"train_loss": -7.236319065093994, "global_step": 204168, "epoch": 4861} {"train_loss": -7.302072048187256, "global_step": 204169, "epoch": 4861} {"train_loss": -7.266286849975586, "global_step": 204170, "epoch": 4861} {"train_loss": -7.279393196105957, "global_step": 204171, "epoch": 4861} {"train_loss": -7.311175346374512, "global_step": 204172, "epoch": 4861} {"train_loss": -7.299216270446777, "global_step": 204173, "epoch": 4861} {"train_loss": -7.279717445373535, "global_step": 204174, "epoch": 4861} {"train_loss": -7.225384712219238, "global_step": 204175, "epoch": 4861} {"train_loss": -7.273346900939941, "global_step": 204176, "epoch": 4861} {"train_loss": -7.257718086242676, "global_step": 204177, "epoch": 4861} {"train_loss": -7.240310192108154, "global_step": 204178, "epoch": 4861} {"train_loss": -7.322353363037109, "global_step": 204179, "epoch": 4861} {"train_loss": -7.219482421875, "global_step": 204180, "epoch": 4861} {"train_loss": -7.203778266906738, "global_step": 204181, "epoch": 4861} {"train_loss": -7.255277633666992, "global_step": 204182, "epoch": 4861} {"train_loss": -7.292779922485352, "global_step": 204183, "epoch": 4861} {"train_loss": -7.226739883422852, "global_step": 204184, "epoch": 4861} {"train_loss": -7.320345878601074, "global_step": 204185, "epoch": 4861} {"train_loss": -7.242727279663086, "global_step": 204186, "epoch": 4861} {"train_loss": -7.356743812561035, "global_step": 204187, "epoch": 4861} {"train_loss": -7.225450038909912, "global_step": 204188, "epoch": 4861} {"train_loss": -7.242128372192383, "global_step": 204189, "epoch": 4861} {"train_loss": -7.231997489929199, "global_step": 204190, "epoch": 4861} {"train_loss": -7.287708282470703, "global_step": 204191, "epoch": 4861} {"train_loss": -7.207162380218506, "global_step": 204192, "epoch": 4861} {"train_loss": -7.288352966308594, "global_step": 204193, "epoch": 4861} {"train_loss": -7.24235200881958, "global_step": 204194, "epoch": 4861} {"train_loss": -7.2682647705078125, "global_step": 204195, "epoch": 4861} {"train_loss": -7.417781352996826, "global_step": 204196, "epoch": 4861} {"train_loss": -7.228405475616455, "global_step": 204197, "epoch": 4861} {"train_loss": -7.123611927032471, "global_step": 204198, "epoch": 4861} {"train_loss": -7.304532051086426, "global_step": 204199, "epoch": 4861} {"train_loss": -7.245540142059326, "global_step": 204200, "epoch": 4861} {"train_loss": -7.244314670562744, "global_step": 204201, "epoch": 4861} {"train_loss": -7.211791515350342, "global_step": 204202, "epoch": 4861} {"train_loss": -7.264370475496564, "global_step": 204203, "epoch": 4861, "val_loss": 69109.4921875} {"train_loss": -7.1649932861328125, "global_step": 204204, "epoch": 4862} {"train_loss": -7.156741142272949, "global_step": 204205, "epoch": 4862} {"train_loss": -7.153573036193848, "global_step": 204206, "epoch": 4862} {"train_loss": -7.2304534912109375, "global_step": 204207, "epoch": 4862} {"train_loss": -7.251781463623047, "global_step": 204208, "epoch": 4862} {"train_loss": -7.283939838409424, "global_step": 204209, "epoch": 4862} {"train_loss": -7.239114761352539, "global_step": 204210, "epoch": 4862} {"train_loss": -7.321022033691406, "global_step": 204211, "epoch": 4862} {"train_loss": -7.263701915740967, "global_step": 204212, "epoch": 4862} {"train_loss": -7.214484691619873, "global_step": 204213, "epoch": 4862} {"train_loss": -7.286274433135986, "global_step": 204214, "epoch": 4862} {"train_loss": -7.228997230529785, "global_step": 204215, "epoch": 4862} {"train_loss": -7.165282249450684, "global_step": 204216, "epoch": 4862} {"train_loss": -7.099307537078857, "global_step": 204217, "epoch": 4862} {"train_loss": -7.370855331420898, "global_step": 204218, "epoch": 4862} {"train_loss": -7.188897132873535, "global_step": 204219, "epoch": 4862} {"train_loss": -7.213797092437744, "global_step": 204220, "epoch": 4862} {"train_loss": -7.2186384201049805, "global_step": 204221, "epoch": 4862} {"train_loss": -7.1615447998046875, "global_step": 204222, "epoch": 4862} {"train_loss": -7.1059889793396, "global_step": 204223, "epoch": 4862} {"train_loss": -7.292414665222168, "global_step": 204224, "epoch": 4862} {"train_loss": -7.058864116668701, "global_step": 204225, "epoch": 4862} {"train_loss": -7.256418228149414, "global_step": 204226, "epoch": 4862} {"train_loss": -7.198390960693359, "global_step": 204227, "epoch": 4862} {"train_loss": -7.173749923706055, "global_step": 204228, "epoch": 4862} {"train_loss": -7.204894065856934, "global_step": 204229, "epoch": 4862} {"train_loss": -7.154784202575684, "global_step": 204230, "epoch": 4862} {"train_loss": -7.22033166885376, "global_step": 204231, "epoch": 4862} {"train_loss": -7.201930046081543, "global_step": 204232, "epoch": 4862} {"train_loss": -7.053434371948242, "global_step": 204233, "epoch": 4862} {"train_loss": -7.159334182739258, "global_step": 204234, "epoch": 4862} {"train_loss": -7.105690956115723, "global_step": 204235, "epoch": 4862} {"train_loss": -7.18087100982666, "global_step": 204236, "epoch": 4862} {"train_loss": -7.334430694580078, "global_step": 204237, "epoch": 4862} {"train_loss": -7.066065788269043, "global_step": 204238, "epoch": 4862} {"train_loss": -7.133962631225586, "global_step": 204239, "epoch": 4862} {"train_loss": -7.1911115646362305, "global_step": 204240, "epoch": 4862} {"train_loss": -7.235302448272705, "global_step": 204241, "epoch": 4862} {"train_loss": -7.252826690673828, "global_step": 204242, "epoch": 4862} {"train_loss": -7.239753246307373, "global_step": 204243, "epoch": 4862} {"train_loss": -7.074302673339844, "global_step": 204244, "epoch": 4862} {"train_loss": -7.200588986987159, "global_step": 204245, "epoch": 4862, "val_loss": 69209.4453125} {"train_loss": -7.323329925537109, "global_step": 204246, "epoch": 4863} {"train_loss": -7.184651851654053, "global_step": 204247, "epoch": 4863} {"train_loss": -7.205263137817383, "global_step": 204248, "epoch": 4863} {"train_loss": -7.226959705352783, "global_step": 204249, "epoch": 4863} {"train_loss": -7.365962982177734, "global_step": 204250, "epoch": 4863} {"train_loss": -7.235903263092041, "global_step": 204251, "epoch": 4863} {"train_loss": -7.356179237365723, "global_step": 204252, "epoch": 4863} {"train_loss": -7.350879669189453, "global_step": 204253, "epoch": 4863} {"train_loss": -7.311940670013428, "global_step": 204254, "epoch": 4863} {"train_loss": -7.32290506362915, "global_step": 204255, "epoch": 4863} {"train_loss": -7.231081008911133, "global_step": 204256, "epoch": 4863} {"train_loss": -7.318359851837158, "global_step": 204257, "epoch": 4863} {"train_loss": -7.296530246734619, "global_step": 204258, "epoch": 4863} {"train_loss": -7.214357376098633, "global_step": 204259, "epoch": 4863} {"train_loss": -7.352367401123047, "global_step": 204260, "epoch": 4863} {"train_loss": -7.156027793884277, "global_step": 204261, "epoch": 4863} {"train_loss": -7.321244239807129, "global_step": 204262, "epoch": 4863} {"train_loss": -7.084061622619629, "global_step": 204263, "epoch": 4863} {"train_loss": -7.1872758865356445, "global_step": 204264, "epoch": 4863} {"train_loss": -7.158744812011719, "global_step": 204265, "epoch": 4863} {"train_loss": -7.2593560218811035, "global_step": 204266, "epoch": 4863} {"train_loss": -7.155925750732422, "global_step": 204267, "epoch": 4863} {"train_loss": -7.258553504943848, "global_step": 204268, "epoch": 4863} {"train_loss": -7.418560028076172, "global_step": 204269, "epoch": 4863} {"train_loss": -7.172098159790039, "global_step": 204270, "epoch": 4863} {"train_loss": -7.224773406982422, "global_step": 204271, "epoch": 4863} {"train_loss": -7.164999008178711, "global_step": 204272, "epoch": 4863} {"train_loss": -7.221982955932617, "global_step": 204273, "epoch": 4863} {"train_loss": -7.321503639221191, "global_step": 204274, "epoch": 4863} {"train_loss": -7.179712295532227, "global_step": 204275, "epoch": 4863} {"train_loss": -7.271965980529785, "global_step": 204276, "epoch": 4863} {"train_loss": -7.194711208343506, "global_step": 204277, "epoch": 4863} {"train_loss": -7.144228935241699, "global_step": 204278, "epoch": 4863} {"train_loss": -7.215265274047852, "global_step": 204279, "epoch": 4863} {"train_loss": -7.014345169067383, "global_step": 204280, "epoch": 4863} {"train_loss": -7.267770767211914, "global_step": 204281, "epoch": 4863} {"train_loss": -7.214553356170654, "global_step": 204282, "epoch": 4863} {"train_loss": -7.144658088684082, "global_step": 204283, "epoch": 4863} {"train_loss": -7.179087162017822, "global_step": 204284, "epoch": 4863} {"train_loss": -7.265145778656006, "global_step": 204285, "epoch": 4863} {"train_loss": -7.343348979949951, "global_step": 204286, "epoch": 4863} {"train_loss": -7.23930743762425, "global_step": 204287, "epoch": 4863, "val_loss": 69157.90625} {"train_loss": -7.139854431152344, "global_step": 204288, "epoch": 4864} {"train_loss": -7.251996994018555, "global_step": 204289, "epoch": 4864} {"train_loss": -7.236000061035156, "global_step": 204290, "epoch": 4864} {"train_loss": -7.234532356262207, "global_step": 204291, "epoch": 4864} {"train_loss": -7.170950412750244, "global_step": 204292, "epoch": 4864} {"train_loss": -7.254067420959473, "global_step": 204293, "epoch": 4864} {"train_loss": -7.294198989868164, "global_step": 204294, "epoch": 4864} {"train_loss": -7.197949409484863, "global_step": 204295, "epoch": 4864} {"train_loss": -7.309779167175293, "global_step": 204296, "epoch": 4864} {"train_loss": -7.207475662231445, "global_step": 204297, "epoch": 4864} {"train_loss": -7.250967979431152, "global_step": 204298, "epoch": 4864} {"train_loss": -7.2617692947387695, "global_step": 204299, "epoch": 4864} {"train_loss": -7.2445807456970215, "global_step": 204300, "epoch": 4864} {"train_loss": -7.189002990722656, "global_step": 204301, "epoch": 4864} {"train_loss": -7.294946670532227, "global_step": 204302, "epoch": 4864} {"train_loss": -7.27056884765625, "global_step": 204303, "epoch": 4864} {"train_loss": -7.290508270263672, "global_step": 204304, "epoch": 4864} {"train_loss": -7.391172885894775, "global_step": 204305, "epoch": 4864} {"train_loss": -7.187270164489746, "global_step": 204306, "epoch": 4864} {"train_loss": -7.140398979187012, "global_step": 204307, "epoch": 4864} {"train_loss": -7.273906707763672, "global_step": 204308, "epoch": 4864} {"train_loss": -7.265359878540039, "global_step": 204309, "epoch": 4864} {"train_loss": -7.207322120666504, "global_step": 204310, "epoch": 4864} {"train_loss": -7.301036834716797, "global_step": 204311, "epoch": 4864} {"train_loss": -7.277494430541992, "global_step": 204312, "epoch": 4864} {"train_loss": -7.296937942504883, "global_step": 204313, "epoch": 4864} {"train_loss": -7.270085334777832, "global_step": 204314, "epoch": 4864} {"train_loss": -7.320915699005127, "global_step": 204315, "epoch": 4864} {"train_loss": -7.277105331420898, "global_step": 204316, "epoch": 4864} {"train_loss": -7.274643898010254, "global_step": 204317, "epoch": 4864} {"train_loss": -7.347351551055908, "global_step": 204318, "epoch": 4864} {"train_loss": -7.245562553405762, "global_step": 204319, "epoch": 4864} {"train_loss": -7.329442977905273, "global_step": 204320, "epoch": 4864} {"train_loss": -7.366091251373291, "global_step": 204321, "epoch": 4864} {"train_loss": -7.326374053955078, "global_step": 204322, "epoch": 4864} {"train_loss": -7.2556352615356445, "global_step": 204323, "epoch": 4864} {"train_loss": -7.233363151550293, "global_step": 204324, "epoch": 4864} {"train_loss": -7.267056465148926, "global_step": 204325, "epoch": 4864} {"train_loss": -7.186845779418945, "global_step": 204326, "epoch": 4864} {"train_loss": -7.305522918701172, "global_step": 204327, "epoch": 4864} {"train_loss": -7.202082633972168, "global_step": 204328, "epoch": 4864} {"train_loss": -7.2603617168608165, "global_step": 204329, "epoch": 4864, "val_loss": 69181.125} {"train_loss": -7.249688148498535, "global_step": 204330, "epoch": 4865} {"train_loss": -7.30760383605957, "global_step": 204331, "epoch": 4865} {"train_loss": -7.258965969085693, "global_step": 204332, "epoch": 4865} {"train_loss": -7.215333938598633, "global_step": 204333, "epoch": 4865} {"train_loss": -7.199071407318115, "global_step": 204334, "epoch": 4865} {"train_loss": -7.262394905090332, "global_step": 204335, "epoch": 4865} {"train_loss": -7.017360210418701, "global_step": 204336, "epoch": 4865} {"train_loss": -7.312283515930176, "global_step": 204337, "epoch": 4865} {"train_loss": -7.210796356201172, "global_step": 204338, "epoch": 4865} {"train_loss": -7.084212779998779, "global_step": 204339, "epoch": 4865} {"train_loss": -7.116413593292236, "global_step": 204340, "epoch": 4865} {"train_loss": -7.014202117919922, "global_step": 204341, "epoch": 4865} {"train_loss": -7.2854204177856445, "global_step": 204342, "epoch": 4865} {"train_loss": -7.192763328552246, "global_step": 204343, "epoch": 4865} {"train_loss": -7.2037153244018555, "global_step": 204344, "epoch": 4865} {"train_loss": -7.02842903137207, "global_step": 204345, "epoch": 4865} {"train_loss": -7.2315168380737305, "global_step": 204346, "epoch": 4865} {"train_loss": -7.078551292419434, "global_step": 204347, "epoch": 4865} {"train_loss": -7.264983177185059, "global_step": 204348, "epoch": 4865} {"train_loss": -7.165639877319336, "global_step": 204349, "epoch": 4865} {"train_loss": -7.120590686798096, "global_step": 204350, "epoch": 4865} {"train_loss": -7.172021389007568, "global_step": 204351, "epoch": 4865} {"train_loss": -7.211805820465088, "global_step": 204352, "epoch": 4865} {"train_loss": -7.176482200622559, "global_step": 204353, "epoch": 4865} {"train_loss": -7.158520698547363, "global_step": 204354, "epoch": 4865} {"train_loss": -7.2176947593688965, "global_step": 204355, "epoch": 4865} {"train_loss": -7.195625305175781, "global_step": 204356, "epoch": 4865} {"train_loss": -7.169591903686523, "global_step": 204357, "epoch": 4865} {"train_loss": -7.1970906257629395, "global_step": 204358, "epoch": 4865} {"train_loss": -7.126605987548828, "global_step": 204359, "epoch": 4865} {"train_loss": -7.015865325927734, "global_step": 204360, "epoch": 4865} {"train_loss": -7.16015625, "global_step": 204361, "epoch": 4865} {"train_loss": -7.147038459777832, "global_step": 204362, "epoch": 4865} {"train_loss": -7.182350158691406, "global_step": 204363, "epoch": 4865} {"train_loss": -7.236217498779297, "global_step": 204364, "epoch": 4865} {"train_loss": -7.200592994689941, "global_step": 204365, "epoch": 4865} {"train_loss": -7.102774620056152, "global_step": 204366, "epoch": 4865} {"train_loss": -7.17136812210083, "global_step": 204367, "epoch": 4865} {"train_loss": -7.165759086608887, "global_step": 204368, "epoch": 4865} {"train_loss": -7.195243835449219, "global_step": 204369, "epoch": 4865} {"train_loss": -7.190998077392578, "global_step": 204370, "epoch": 4865} {"train_loss": -7.178498052415394, "global_step": 204371, "epoch": 4865, "val_loss": 68999.3984375} {"train_loss": -7.194818496704102, "global_step": 204372, "epoch": 4866} {"train_loss": -7.208486557006836, "global_step": 204373, "epoch": 4866} {"train_loss": -7.279487609863281, "global_step": 204374, "epoch": 4866} {"train_loss": -7.323533058166504, "global_step": 204375, "epoch": 4866} {"train_loss": -7.403066158294678, "global_step": 204376, "epoch": 4866} {"train_loss": -7.38397216796875, "global_step": 204377, "epoch": 4866} {"train_loss": -7.270367622375488, "global_step": 204378, "epoch": 4866} {"train_loss": -7.287015914916992, "global_step": 204379, "epoch": 4866} {"train_loss": -7.203175067901611, "global_step": 204380, "epoch": 4866} {"train_loss": -7.205377101898193, "global_step": 204381, "epoch": 4866} {"train_loss": -7.261866092681885, "global_step": 204382, "epoch": 4866} {"train_loss": -7.352011680603027, "global_step": 204383, "epoch": 4866} {"train_loss": -7.141667366027832, "global_step": 204384, "epoch": 4866} {"train_loss": -7.269926071166992, "global_step": 204385, "epoch": 4866} {"train_loss": -7.283810138702393, "global_step": 204386, "epoch": 4866} {"train_loss": -7.222746849060059, "global_step": 204387, "epoch": 4866} {"train_loss": -7.384169578552246, "global_step": 204388, "epoch": 4866} {"train_loss": -7.274076461791992, "global_step": 204389, "epoch": 4866} {"train_loss": -7.246975898742676, "global_step": 204390, "epoch": 4866} {"train_loss": -7.318230628967285, "global_step": 204391, "epoch": 4866} {"train_loss": -7.407891273498535, "global_step": 204392, "epoch": 4866} {"train_loss": -7.306124210357666, "global_step": 204393, "epoch": 4866} {"train_loss": -7.223278999328613, "global_step": 204394, "epoch": 4866} {"train_loss": -7.474909782409668, "global_step": 204395, "epoch": 4866} {"train_loss": -7.280900955200195, "global_step": 204396, "epoch": 4866} {"train_loss": -7.343873500823975, "global_step": 204397, "epoch": 4866} {"train_loss": -7.310242652893066, "global_step": 204398, "epoch": 4866} {"train_loss": -7.202915191650391, "global_step": 204399, "epoch": 4866} {"train_loss": -7.149798393249512, "global_step": 204400, "epoch": 4866} {"train_loss": -7.269810676574707, "global_step": 204401, "epoch": 4866} {"train_loss": -7.273648262023926, "global_step": 204402, "epoch": 4866} {"train_loss": -7.344793319702148, "global_step": 204403, "epoch": 4866} {"train_loss": -7.1419830322265625, "global_step": 204404, "epoch": 4866} {"train_loss": -7.284363746643066, "global_step": 204405, "epoch": 4866} {"train_loss": -7.176596164703369, "global_step": 204406, "epoch": 4866} {"train_loss": -7.166876792907715, "global_step": 204407, "epoch": 4866} {"train_loss": -7.306149482727051, "global_step": 204408, "epoch": 4866} {"train_loss": -7.216810703277588, "global_step": 204409, "epoch": 4866} {"train_loss": -7.30814266204834, "global_step": 204410, "epoch": 4866} {"train_loss": -7.229640007019043, "global_step": 204411, "epoch": 4866} {"train_loss": -7.32424783706665, "global_step": 204412, "epoch": 4866} {"train_loss": -7.2760334469023205, "global_step": 204413, "epoch": 4866, "val_loss": 69066.8828125} {"train_loss": -7.326968193054199, "global_step": 204414, "epoch": 4867} {"train_loss": -7.329219341278076, "global_step": 204415, "epoch": 4867} {"train_loss": -7.272251129150391, "global_step": 204416, "epoch": 4867} {"train_loss": -7.247354984283447, "global_step": 204417, "epoch": 4867} {"train_loss": -7.307480812072754, "global_step": 204418, "epoch": 4867} {"train_loss": -7.419599533081055, "global_step": 204419, "epoch": 4867} {"train_loss": -7.266587257385254, "global_step": 204420, "epoch": 4867} {"train_loss": -7.222700119018555, "global_step": 204421, "epoch": 4867} {"train_loss": -7.30180549621582, "global_step": 204422, "epoch": 4867} {"train_loss": -7.340092658996582, "global_step": 204423, "epoch": 4867} {"train_loss": -7.350030422210693, "global_step": 204424, "epoch": 4867} {"train_loss": -7.303058624267578, "global_step": 204425, "epoch": 4867} {"train_loss": -7.369408130645752, "global_step": 204426, "epoch": 4867} {"train_loss": -7.341591835021973, "global_step": 204427, "epoch": 4867} {"train_loss": -7.237349510192871, "global_step": 204428, "epoch": 4867} {"train_loss": -7.328161239624023, "global_step": 204429, "epoch": 4867} {"train_loss": -7.340534210205078, "global_step": 204430, "epoch": 4867} {"train_loss": -7.188999176025391, "global_step": 204431, "epoch": 4867} {"train_loss": -7.131248950958252, "global_step": 204432, "epoch": 4867} {"train_loss": -7.2211174964904785, "global_step": 204433, "epoch": 4867} {"train_loss": -7.400543689727783, "global_step": 204434, "epoch": 4867} {"train_loss": -7.191210746765137, "global_step": 204435, "epoch": 4867} {"train_loss": -7.2218017578125, "global_step": 204436, "epoch": 4867} {"train_loss": -7.203272819519043, "global_step": 204437, "epoch": 4867} {"train_loss": -7.14158296585083, "global_step": 204438, "epoch": 4867} {"train_loss": -7.247276306152344, "global_step": 204439, "epoch": 4867} {"train_loss": -7.251818656921387, "global_step": 204440, "epoch": 4867} {"train_loss": -7.1678009033203125, "global_step": 204441, "epoch": 4867} {"train_loss": -7.21380090713501, "global_step": 204442, "epoch": 4867} {"train_loss": -7.146789073944092, "global_step": 204443, "epoch": 4867} {"train_loss": -7.293928146362305, "global_step": 204444, "epoch": 4867} {"train_loss": -7.181327819824219, "global_step": 204445, "epoch": 4867} {"train_loss": -7.0366129875183105, "global_step": 204446, "epoch": 4867} {"train_loss": -7.252408027648926, "global_step": 204447, "epoch": 4867} {"train_loss": -6.9814558029174805, "global_step": 204448, "epoch": 4867} {"train_loss": -7.335259437561035, "global_step": 204449, "epoch": 4867} {"train_loss": -7.108725070953369, "global_step": 204450, "epoch": 4867} {"train_loss": -7.209134101867676, "global_step": 204451, "epoch": 4867} {"train_loss": -7.193774223327637, "global_step": 204452, "epoch": 4867} {"train_loss": -7.192534446716309, "global_step": 204453, "epoch": 4867} {"train_loss": -7.137911319732666, "global_step": 204454, "epoch": 4867} {"train_loss": -7.2415923618135, "global_step": 204455, "epoch": 4867, "val_loss": 69246.484375} {"train_loss": -7.188929557800293, "global_step": 204456, "epoch": 4868} {"train_loss": -7.177670001983643, "global_step": 204457, "epoch": 4868} {"train_loss": -7.291479110717773, "global_step": 204458, "epoch": 4868} {"train_loss": -7.204977512359619, "global_step": 204459, "epoch": 4868} {"train_loss": -7.103052139282227, "global_step": 204460, "epoch": 4868} {"train_loss": -7.1173858642578125, "global_step": 204461, "epoch": 4868} {"train_loss": -7.200695514678955, "global_step": 204462, "epoch": 4868} {"train_loss": -7.092774868011475, "global_step": 204463, "epoch": 4868} {"train_loss": -7.182783603668213, "global_step": 204464, "epoch": 4868} {"train_loss": -7.1226301193237305, "global_step": 204465, "epoch": 4868} {"train_loss": -7.237444877624512, "global_step": 204466, "epoch": 4868} {"train_loss": -7.1965227127075195, "global_step": 204467, "epoch": 4868} {"train_loss": -7.177437782287598, "global_step": 204468, "epoch": 4868} {"train_loss": -7.316427707672119, "global_step": 204469, "epoch": 4868} {"train_loss": -7.17962646484375, "global_step": 204470, "epoch": 4868} {"train_loss": -7.189923286437988, "global_step": 204471, "epoch": 4868} {"train_loss": -7.255364418029785, "global_step": 204472, "epoch": 4868} {"train_loss": -7.190883636474609, "global_step": 204473, "epoch": 4868} {"train_loss": -7.269977569580078, "global_step": 204474, "epoch": 4868} {"train_loss": -7.249513626098633, "global_step": 204475, "epoch": 4868} {"train_loss": -7.288930892944336, "global_step": 204476, "epoch": 4868} {"train_loss": -7.344615936279297, "global_step": 204477, "epoch": 4868} {"train_loss": -7.326486110687256, "global_step": 204478, "epoch": 4868} {"train_loss": -7.269082069396973, "global_step": 204479, "epoch": 4868} {"train_loss": -7.361800193786621, "global_step": 204480, "epoch": 4868} {"train_loss": -7.3570356369018555, "global_step": 204481, "epoch": 4868} {"train_loss": -7.307962417602539, "global_step": 204482, "epoch": 4868} {"train_loss": -7.303423881530762, "global_step": 204483, "epoch": 4868} {"train_loss": -7.206531524658203, "global_step": 204484, "epoch": 4868} {"train_loss": -7.351680755615234, "global_step": 204485, "epoch": 4868} {"train_loss": -7.280099868774414, "global_step": 204486, "epoch": 4868} {"train_loss": -7.336461544036865, "global_step": 204487, "epoch": 4868} {"train_loss": -7.278625011444092, "global_step": 204488, "epoch": 4868} {"train_loss": -7.279648780822754, "global_step": 204489, "epoch": 4868} {"train_loss": -7.150758743286133, "global_step": 204490, "epoch": 4868} {"train_loss": -7.3199615478515625, "global_step": 204491, "epoch": 4868} {"train_loss": -7.337747573852539, "global_step": 204492, "epoch": 4868} {"train_loss": -7.288938522338867, "global_step": 204493, "epoch": 4868} {"train_loss": -7.358980178833008, "global_step": 204494, "epoch": 4868} {"train_loss": -7.365582466125488, "global_step": 204495, "epoch": 4868} {"train_loss": -7.263444900512695, "global_step": 204496, "epoch": 4868} {"train_loss": -7.25105635325114, "global_step": 204497, "epoch": 4868, "val_loss": 69135.203125} {"train_loss": -7.301533222198486, "global_step": 204498, "epoch": 4869} {"train_loss": -7.286688327789307, "global_step": 204499, "epoch": 4869} {"train_loss": -7.24519157409668, "global_step": 204500, "epoch": 4869} {"train_loss": -7.269949913024902, "global_step": 204501, "epoch": 4869} {"train_loss": -7.27581787109375, "global_step": 204502, "epoch": 4869} {"train_loss": -7.404359817504883, "global_step": 204503, "epoch": 4869} {"train_loss": -7.354061126708984, "global_step": 204504, "epoch": 4869} {"train_loss": -7.288369655609131, "global_step": 204505, "epoch": 4869} {"train_loss": -7.266923904418945, "global_step": 204506, "epoch": 4869} {"train_loss": -7.1516032218933105, "global_step": 204507, "epoch": 4869} {"train_loss": -7.210413455963135, "global_step": 204508, "epoch": 4869} {"train_loss": -7.241661071777344, "global_step": 204509, "epoch": 4869} {"train_loss": -7.271127223968506, "global_step": 204510, "epoch": 4869} {"train_loss": -7.30311393737793, "global_step": 204511, "epoch": 4869} {"train_loss": -7.196260452270508, "global_step": 204512, "epoch": 4869} {"train_loss": -7.289979934692383, "global_step": 204513, "epoch": 4869} {"train_loss": -7.227498531341553, "global_step": 204514, "epoch": 4869} {"train_loss": -7.368162155151367, "global_step": 204515, "epoch": 4869} {"train_loss": -7.255950927734375, "global_step": 204516, "epoch": 4869} {"train_loss": -7.268950462341309, "global_step": 204517, "epoch": 4869} {"train_loss": -7.159268379211426, "global_step": 204518, "epoch": 4869} {"train_loss": -7.2026519775390625, "global_step": 204519, "epoch": 4869} {"train_loss": -7.076269149780273, "global_step": 204520, "epoch": 4869} {"train_loss": -7.127626895904541, "global_step": 204521, "epoch": 4869} {"train_loss": -7.219517707824707, "global_step": 204522, "epoch": 4869} {"train_loss": -7.25223445892334, "global_step": 204523, "epoch": 4869} {"train_loss": -7.269988059997559, "global_step": 204524, "epoch": 4869} {"train_loss": -7.302516937255859, "global_step": 204525, "epoch": 4869} {"train_loss": -7.18897819519043, "global_step": 204526, "epoch": 4869} {"train_loss": -7.152128219604492, "global_step": 204527, "epoch": 4869} {"train_loss": -7.051874160766602, "global_step": 204528, "epoch": 4869} {"train_loss": -7.249180793762207, "global_step": 204529, "epoch": 4869} {"train_loss": -7.213022708892822, "global_step": 204530, "epoch": 4869} {"train_loss": -7.179621696472168, "global_step": 204531, "epoch": 4869} {"train_loss": -7.130194664001465, "global_step": 204532, "epoch": 4869} {"train_loss": -7.160577774047852, "global_step": 204533, "epoch": 4869} {"train_loss": -7.264683723449707, "global_step": 204534, "epoch": 4869} {"train_loss": -7.220136642456055, "global_step": 204535, "epoch": 4869} {"train_loss": -7.165386199951172, "global_step": 204536, "epoch": 4869} {"train_loss": -7.436717987060547, "global_step": 204537, "epoch": 4869} {"train_loss": -7.259771347045898, "global_step": 204538, "epoch": 4869} {"train_loss": -7.239486785162063, "global_step": 204539, "epoch": 4869, "val_loss": 69213.890625} {"train_loss": -7.171485424041748, "global_step": 204540, "epoch": 4870} {"train_loss": -7.170261859893799, "global_step": 204541, "epoch": 4870} {"train_loss": -7.209231853485107, "global_step": 204542, "epoch": 4870} {"train_loss": -7.25140905380249, "global_step": 204543, "epoch": 4870} {"train_loss": -7.3391618728637695, "global_step": 204544, "epoch": 4870} {"train_loss": -7.283699989318848, "global_step": 204545, "epoch": 4870} {"train_loss": -7.148665904998779, "global_step": 204546, "epoch": 4870} {"train_loss": -7.259235382080078, "global_step": 204547, "epoch": 4870} {"train_loss": -7.451111316680908, "global_step": 204548, "epoch": 4870} {"train_loss": -7.296689987182617, "global_step": 204549, "epoch": 4870} {"train_loss": -7.429973602294922, "global_step": 204550, "epoch": 4870} {"train_loss": -7.342784881591797, "global_step": 204551, "epoch": 4870} {"train_loss": -7.261274814605713, "global_step": 204552, "epoch": 4870} {"train_loss": -7.205587387084961, "global_step": 204553, "epoch": 4870} {"train_loss": -7.3080949783325195, "global_step": 204554, "epoch": 4870} {"train_loss": -7.295167922973633, "global_step": 204555, "epoch": 4870} {"train_loss": -7.268951416015625, "global_step": 204556, "epoch": 4870} {"train_loss": -7.318963050842285, "global_step": 204557, "epoch": 4870} {"train_loss": -7.350582122802734, "global_step": 204558, "epoch": 4870} {"train_loss": -7.3222856521606445, "global_step": 204559, "epoch": 4870} {"train_loss": -7.208468437194824, "global_step": 204560, "epoch": 4870} {"train_loss": -7.374427795410156, "global_step": 204561, "epoch": 4870} {"train_loss": -7.385820388793945, "global_step": 204562, "epoch": 4870} {"train_loss": -7.316008567810059, "global_step": 204563, "epoch": 4870} {"train_loss": -7.18248987197876, "global_step": 204564, "epoch": 4870} {"train_loss": -7.211907386779785, "global_step": 204565, "epoch": 4870} {"train_loss": -7.093827247619629, "global_step": 204566, "epoch": 4870} {"train_loss": -7.281254768371582, "global_step": 204567, "epoch": 4870} {"train_loss": -7.234025001525879, "global_step": 204568, "epoch": 4870} {"train_loss": -7.230917930603027, "global_step": 204569, "epoch": 4870} {"train_loss": -7.370864391326904, "global_step": 204570, "epoch": 4870} {"train_loss": -7.189157485961914, "global_step": 204571, "epoch": 4870} {"train_loss": -7.306121349334717, "global_step": 204572, "epoch": 4870} {"train_loss": -7.351799964904785, "global_step": 204573, "epoch": 4870} {"train_loss": -7.131085395812988, "global_step": 204574, "epoch": 4870} {"train_loss": -7.274346351623535, "global_step": 204575, "epoch": 4870} {"train_loss": -7.295660972595215, "global_step": 204576, "epoch": 4870} {"train_loss": -7.270776271820068, "global_step": 204577, "epoch": 4870} {"train_loss": -7.295918941497803, "global_step": 204578, "epoch": 4870} {"train_loss": -7.310617923736572, "global_step": 204579, "epoch": 4870} {"train_loss": -7.254355430603027, "global_step": 204580, "epoch": 4870} {"train_loss": -7.273645389647711, "global_step": 204581, "epoch": 4870, "val_loss": 69167.234375} {"train_loss": -7.372718334197998, "global_step": 204582, "epoch": 4871} {"train_loss": -7.23350715637207, "global_step": 204583, "epoch": 4871} {"train_loss": -7.139291763305664, "global_step": 204584, "epoch": 4871} {"train_loss": -7.0374932289123535, "global_step": 204585, "epoch": 4871} {"train_loss": -7.253706932067871, "global_step": 204586, "epoch": 4871} {"train_loss": -7.115717887878418, "global_step": 204587, "epoch": 4871} {"train_loss": -7.169247627258301, "global_step": 204588, "epoch": 4871} {"train_loss": -7.195488929748535, "global_step": 204589, "epoch": 4871} {"train_loss": -7.130639553070068, "global_step": 204590, "epoch": 4871} {"train_loss": -7.270702362060547, "global_step": 204591, "epoch": 4871} {"train_loss": -7.1876678466796875, "global_step": 204592, "epoch": 4871} {"train_loss": -7.360846519470215, "global_step": 204593, "epoch": 4871} {"train_loss": -7.169907569885254, "global_step": 204594, "epoch": 4871} {"train_loss": -7.295524597167969, "global_step": 204595, "epoch": 4871} {"train_loss": -7.213920593261719, "global_step": 204596, "epoch": 4871} {"train_loss": -7.166172027587891, "global_step": 204597, "epoch": 4871} {"train_loss": -7.241771221160889, "global_step": 204598, "epoch": 4871} {"train_loss": -7.160224914550781, "global_step": 204599, "epoch": 4871} {"train_loss": -7.322709560394287, "global_step": 204600, "epoch": 4871} {"train_loss": -7.270542144775391, "global_step": 204601, "epoch": 4871} {"train_loss": -7.24765682220459, "global_step": 204602, "epoch": 4871} {"train_loss": -7.257740020751953, "global_step": 204603, "epoch": 4871} {"train_loss": -7.1335062980651855, "global_step": 204604, "epoch": 4871} {"train_loss": -7.297524929046631, "global_step": 204605, "epoch": 4871} {"train_loss": -7.0794219970703125, "global_step": 204606, "epoch": 4871} {"train_loss": -7.270929336547852, "global_step": 204607, "epoch": 4871} {"train_loss": -7.230384826660156, "global_step": 204608, "epoch": 4871} {"train_loss": -7.351762771606445, "global_step": 204609, "epoch": 4871} {"train_loss": -7.161774635314941, "global_step": 204610, "epoch": 4871} {"train_loss": -7.178439617156982, "global_step": 204611, "epoch": 4871} {"train_loss": -7.187097549438477, "global_step": 204612, "epoch": 4871} {"train_loss": -7.185163974761963, "global_step": 204613, "epoch": 4871} {"train_loss": -7.241995811462402, "global_step": 204614, "epoch": 4871} {"train_loss": -7.11945915222168, "global_step": 204615, "epoch": 4871} {"train_loss": -7.025790691375732, "global_step": 204616, "epoch": 4871} {"train_loss": -7.173737525939941, "global_step": 204617, "epoch": 4871} {"train_loss": -7.254092216491699, "global_step": 204618, "epoch": 4871} {"train_loss": -7.0806756019592285, "global_step": 204619, "epoch": 4871} {"train_loss": -7.226572036743164, "global_step": 204620, "epoch": 4871} {"train_loss": -7.113826751708984, "global_step": 204621, "epoch": 4871} {"train_loss": -7.174788475036621, "global_step": 204622, "epoch": 4871} {"train_loss": -7.203317392440069, "global_step": 204623, "epoch": 4871, "val_loss": 69232.3125} {"train_loss": -7.213435649871826, "global_step": 204624, "epoch": 4872} {"train_loss": -7.093109130859375, "global_step": 204625, "epoch": 4872} {"train_loss": -7.253461837768555, "global_step": 204626, "epoch": 4872} {"train_loss": -7.176519870758057, "global_step": 204627, "epoch": 4872} {"train_loss": -7.202362060546875, "global_step": 204628, "epoch": 4872} {"train_loss": -7.1345977783203125, "global_step": 204629, "epoch": 4872} {"train_loss": -7.150626182556152, "global_step": 204630, "epoch": 4872} {"train_loss": -7.187822341918945, "global_step": 204631, "epoch": 4872} {"train_loss": -7.239262580871582, "global_step": 204632, "epoch": 4872} {"train_loss": -7.279147148132324, "global_step": 204633, "epoch": 4872} {"train_loss": -7.226705074310303, "global_step": 204634, "epoch": 4872} {"train_loss": -7.212582588195801, "global_step": 204635, "epoch": 4872} {"train_loss": -7.196502685546875, "global_step": 204636, "epoch": 4872} {"train_loss": -7.2023491859436035, "global_step": 204637, "epoch": 4872} {"train_loss": -7.240274906158447, "global_step": 204638, "epoch": 4872} {"train_loss": -7.197075843811035, "global_step": 204639, "epoch": 4872} {"train_loss": -7.273083686828613, "global_step": 204640, "epoch": 4872} {"train_loss": -7.176640510559082, "global_step": 204641, "epoch": 4872} {"train_loss": -7.270475387573242, "global_step": 204642, "epoch": 4872} {"train_loss": -7.23444938659668, "global_step": 204643, "epoch": 4872} {"train_loss": -7.247554302215576, "global_step": 204644, "epoch": 4872} {"train_loss": -7.284996032714844, "global_step": 204645, "epoch": 4872} {"train_loss": -7.274423599243164, "global_step": 204646, "epoch": 4872} {"train_loss": -7.339598178863525, "global_step": 204647, "epoch": 4872} {"train_loss": -7.295740127563477, "global_step": 204648, "epoch": 4872} {"train_loss": -7.271945953369141, "global_step": 204649, "epoch": 4872} {"train_loss": -7.337306022644043, "global_step": 204650, "epoch": 4872} {"train_loss": -7.27061128616333, "global_step": 204651, "epoch": 4872} {"train_loss": -7.318137168884277, "global_step": 204652, "epoch": 4872} {"train_loss": -7.248948574066162, "global_step": 204653, "epoch": 4872} {"train_loss": -7.408377647399902, "global_step": 204654, "epoch": 4872} {"train_loss": -7.316275119781494, "global_step": 204655, "epoch": 4872} {"train_loss": -7.2747344970703125, "global_step": 204656, "epoch": 4872} {"train_loss": -7.352479457855225, "global_step": 204657, "epoch": 4872} {"train_loss": -7.324376106262207, "global_step": 204658, "epoch": 4872} {"train_loss": -7.198843955993652, "global_step": 204659, "epoch": 4872} {"train_loss": -7.348409175872803, "global_step": 204660, "epoch": 4872} {"train_loss": -7.316734313964844, "global_step": 204661, "epoch": 4872} {"train_loss": -7.303314208984375, "global_step": 204662, "epoch": 4872} {"train_loss": -7.40145206451416, "global_step": 204663, "epoch": 4872} {"train_loss": -7.305826663970947, "global_step": 204664, "epoch": 4872} {"train_loss": -7.259472744805472, "global_step": 204665, "epoch": 4872, "val_loss": 69224.109375} {"train_loss": -7.277597904205322, "global_step": 204666, "epoch": 4873} {"train_loss": -7.0965046882629395, "global_step": 204667, "epoch": 4873} {"train_loss": -7.326488018035889, "global_step": 204668, "epoch": 4873} {"train_loss": -7.140568733215332, "global_step": 204669, "epoch": 4873} {"train_loss": -7.3407769203186035, "global_step": 204670, "epoch": 4873} {"train_loss": -7.105160713195801, "global_step": 204671, "epoch": 4873} {"train_loss": -7.239999771118164, "global_step": 204672, "epoch": 4873} {"train_loss": -7.364226818084717, "global_step": 204673, "epoch": 4873} {"train_loss": -7.189970016479492, "global_step": 204674, "epoch": 4873} {"train_loss": -7.114738464355469, "global_step": 204675, "epoch": 4873} {"train_loss": -7.280961036682129, "global_step": 204676, "epoch": 4873} {"train_loss": -7.3113627433776855, "global_step": 204677, "epoch": 4873} {"train_loss": -7.333746433258057, "global_step": 204678, "epoch": 4873} {"train_loss": -7.109158515930176, "global_step": 204679, "epoch": 4873} {"train_loss": -7.27534294128418, "global_step": 204680, "epoch": 4873} {"train_loss": -7.189962387084961, "global_step": 204681, "epoch": 4873} {"train_loss": -7.116943836212158, "global_step": 204682, "epoch": 4873} {"train_loss": -7.381409168243408, "global_step": 204683, "epoch": 4873} {"train_loss": -7.281783103942871, "global_step": 204684, "epoch": 4873} {"train_loss": -7.137077331542969, "global_step": 204685, "epoch": 4873} {"train_loss": -7.195034980773926, "global_step": 204686, "epoch": 4873} {"train_loss": -7.174297332763672, "global_step": 204687, "epoch": 4873} {"train_loss": -7.280396938323975, "global_step": 204688, "epoch": 4873} {"train_loss": -7.226785182952881, "global_step": 204689, "epoch": 4873} {"train_loss": -7.098907470703125, "global_step": 204690, "epoch": 4873} {"train_loss": -7.269661903381348, "global_step": 204691, "epoch": 4873} {"train_loss": -7.3593339920043945, "global_step": 204692, "epoch": 4873} {"train_loss": -7.061811447143555, "global_step": 204693, "epoch": 4873} {"train_loss": -7.362301826477051, "global_step": 204694, "epoch": 4873} {"train_loss": -7.226590633392334, "global_step": 204695, "epoch": 4873} {"train_loss": -7.266347408294678, "global_step": 204696, "epoch": 4873} {"train_loss": -7.161783218383789, "global_step": 204697, "epoch": 4873} {"train_loss": -7.2497029304504395, "global_step": 204698, "epoch": 4873} {"train_loss": -7.2901530265808105, "global_step": 204699, "epoch": 4873} {"train_loss": -7.275814056396484, "global_step": 204700, "epoch": 4873} {"train_loss": -7.198186874389648, "global_step": 204701, "epoch": 4873} {"train_loss": -7.331091403961182, "global_step": 204702, "epoch": 4873} {"train_loss": -7.250758171081543, "global_step": 204703, "epoch": 4873} {"train_loss": -7.197040557861328, "global_step": 204704, "epoch": 4873} {"train_loss": -7.159173965454102, "global_step": 204705, "epoch": 4873} {"train_loss": -7.419487953186035, "global_step": 204706, "epoch": 4873} {"train_loss": -7.235008126213437, "global_step": 204707, "epoch": 4873, "val_loss": 69124.8046875} {"train_loss": -7.266425132751465, "global_step": 204708, "epoch": 4874} {"train_loss": -7.275948524475098, "global_step": 204709, "epoch": 4874} {"train_loss": -7.18946647644043, "global_step": 204710, "epoch": 4874} {"train_loss": -7.155015468597412, "global_step": 204711, "epoch": 4874} {"train_loss": -7.304880142211914, "global_step": 204712, "epoch": 4874} {"train_loss": -7.21968936920166, "global_step": 204713, "epoch": 4874} {"train_loss": -7.282726287841797, "global_step": 204714, "epoch": 4874} {"train_loss": -7.3547139167785645, "global_step": 204715, "epoch": 4874} {"train_loss": -7.372251987457275, "global_step": 204716, "epoch": 4874} {"train_loss": -7.259652137756348, "global_step": 204717, "epoch": 4874} {"train_loss": -7.258360385894775, "global_step": 204718, "epoch": 4874} {"train_loss": -7.333415985107422, "global_step": 204719, "epoch": 4874} {"train_loss": -7.257671356201172, "global_step": 204720, "epoch": 4874} {"train_loss": -7.227856636047363, "global_step": 204721, "epoch": 4874} {"train_loss": -7.427016258239746, "global_step": 204722, "epoch": 4874} {"train_loss": -7.30653190612793, "global_step": 204723, "epoch": 4874} {"train_loss": -7.333644390106201, "global_step": 204724, "epoch": 4874} {"train_loss": -7.256148815155029, "global_step": 204725, "epoch": 4874} {"train_loss": -7.186856269836426, "global_step": 204726, "epoch": 4874} {"train_loss": -7.377131462097168, "global_step": 204727, "epoch": 4874} {"train_loss": -7.430123329162598, "global_step": 204728, "epoch": 4874} {"train_loss": -7.1969499588012695, "global_step": 204729, "epoch": 4874} {"train_loss": -7.3588714599609375, "global_step": 204730, "epoch": 4874} {"train_loss": -7.343990325927734, "global_step": 204731, "epoch": 4874} {"train_loss": -7.307027339935303, "global_step": 204732, "epoch": 4874} {"train_loss": -7.303146839141846, "global_step": 204733, "epoch": 4874} {"train_loss": -7.277222633361816, "global_step": 204734, "epoch": 4874} {"train_loss": -7.332657814025879, "global_step": 204735, "epoch": 4874} {"train_loss": -7.197257041931152, "global_step": 204736, "epoch": 4874} {"train_loss": -7.288525581359863, "global_step": 204737, "epoch": 4874} {"train_loss": -7.286883354187012, "global_step": 204738, "epoch": 4874} {"train_loss": -7.3346452713012695, "global_step": 204739, "epoch": 4874} {"train_loss": -7.176216125488281, "global_step": 204740, "epoch": 4874} {"train_loss": -7.258415699005127, "global_step": 204741, "epoch": 4874} {"train_loss": -7.300499439239502, "global_step": 204742, "epoch": 4874} {"train_loss": -7.293423175811768, "global_step": 204743, "epoch": 4874} {"train_loss": -7.3398237228393555, "global_step": 204744, "epoch": 4874} {"train_loss": -7.226607322692871, "global_step": 204745, "epoch": 4874} {"train_loss": -7.380468845367432, "global_step": 204746, "epoch": 4874} {"train_loss": -7.1634111404418945, "global_step": 204747, "epoch": 4874} {"train_loss": -7.2933268547058105, "global_step": 204748, "epoch": 4874} {"train_loss": -7.281917140597389, "global_step": 204749, "epoch": 4874, "val_loss": 69099.1640625} {"train_loss": -7.272452354431152, "global_step": 204750, "epoch": 4875} {"train_loss": -7.318722724914551, "global_step": 204751, "epoch": 4875} {"train_loss": -7.038079261779785, "global_step": 204752, "epoch": 4875} {"train_loss": -7.0319366455078125, "global_step": 204753, "epoch": 4875} {"train_loss": -7.161753177642822, "global_step": 204754, "epoch": 4875} {"train_loss": -7.133942127227783, "global_step": 204755, "epoch": 4875} {"train_loss": -7.139660835266113, "global_step": 204756, "epoch": 4875} {"train_loss": -7.181480407714844, "global_step": 204757, "epoch": 4875} {"train_loss": -7.17962646484375, "global_step": 204758, "epoch": 4875} {"train_loss": -7.140643119812012, "global_step": 204759, "epoch": 4875} {"train_loss": -7.109377861022949, "global_step": 204760, "epoch": 4875} {"train_loss": -7.2049407958984375, "global_step": 204761, "epoch": 4875} {"train_loss": -7.041166305541992, "global_step": 204762, "epoch": 4875} {"train_loss": -7.305177688598633, "global_step": 204763, "epoch": 4875} {"train_loss": -7.14894962310791, "global_step": 204764, "epoch": 4875} {"train_loss": -7.108513832092285, "global_step": 204765, "epoch": 4875} {"train_loss": -7.231219291687012, "global_step": 204766, "epoch": 4875} {"train_loss": -7.222332000732422, "global_step": 204767, "epoch": 4875} {"train_loss": -7.124923229217529, "global_step": 204768, "epoch": 4875} {"train_loss": -7.219649314880371, "global_step": 204769, "epoch": 4875} {"train_loss": -7.235501289367676, "global_step": 204770, "epoch": 4875} {"train_loss": -7.243933200836182, "global_step": 204771, "epoch": 4875} {"train_loss": -7.222618579864502, "global_step": 204772, "epoch": 4875} {"train_loss": -7.1080217361450195, "global_step": 204773, "epoch": 4875} {"train_loss": -7.252634048461914, "global_step": 204774, "epoch": 4875} {"train_loss": -7.201782703399658, "global_step": 204775, "epoch": 4875} {"train_loss": -7.182494163513184, "global_step": 204776, "epoch": 4875} {"train_loss": -7.263799667358398, "global_step": 204777, "epoch": 4875} {"train_loss": -7.1331095695495605, "global_step": 204778, "epoch": 4875} {"train_loss": -7.254129409790039, "global_step": 204779, "epoch": 4875} {"train_loss": -7.300491809844971, "global_step": 204780, "epoch": 4875} {"train_loss": -7.260923385620117, "global_step": 204781, "epoch": 4875} {"train_loss": -7.293352127075195, "global_step": 204782, "epoch": 4875} {"train_loss": -7.319183349609375, "global_step": 204783, "epoch": 4875} {"train_loss": -7.317924499511719, "global_step": 204784, "epoch": 4875} {"train_loss": -7.264854907989502, "global_step": 204785, "epoch": 4875} {"train_loss": -7.2904791831970215, "global_step": 204786, "epoch": 4875} {"train_loss": -7.285619735717773, "global_step": 204787, "epoch": 4875} {"train_loss": -7.211302757263184, "global_step": 204788, "epoch": 4875} {"train_loss": -7.305783271789551, "global_step": 204789, "epoch": 4875} {"train_loss": -7.274763584136963, "global_step": 204790, "epoch": 4875} {"train_loss": -7.207131215504238, "global_step": 204791, "epoch": 4875, "val_loss": 69292.8359375} {"train_loss": -7.2609710693359375, "global_step": 204792, "epoch": 4876} {"train_loss": -7.216678619384766, "global_step": 204793, "epoch": 4876} {"train_loss": -7.061063766479492, "global_step": 204794, "epoch": 4876} {"train_loss": -7.141366481781006, "global_step": 204795, "epoch": 4876} {"train_loss": -7.272195339202881, "global_step": 204796, "epoch": 4876} {"train_loss": -7.232234001159668, "global_step": 204797, "epoch": 4876} {"train_loss": -7.252183437347412, "global_step": 204798, "epoch": 4876} {"train_loss": -7.219683647155762, "global_step": 204799, "epoch": 4876} {"train_loss": -7.172317981719971, "global_step": 204800, "epoch": 4876} {"train_loss": -7.273124694824219, "global_step": 204801, "epoch": 4876} {"train_loss": -7.220372676849365, "global_step": 204802, "epoch": 4876} {"train_loss": -7.298401832580566, "global_step": 204803, "epoch": 4876} {"train_loss": -7.129371643066406, "global_step": 204804, "epoch": 4876} {"train_loss": -7.250985145568848, "global_step": 204805, "epoch": 4876} {"train_loss": -7.199805736541748, "global_step": 204806, "epoch": 4876} {"train_loss": -7.22714900970459, "global_step": 204807, "epoch": 4876} {"train_loss": -7.248140335083008, "global_step": 204808, "epoch": 4876} {"train_loss": -7.268071174621582, "global_step": 204809, "epoch": 4876} {"train_loss": -7.328401565551758, "global_step": 204810, "epoch": 4876} {"train_loss": -7.24746036529541, "global_step": 204811, "epoch": 4876} {"train_loss": -7.376983642578125, "global_step": 204812, "epoch": 4876} {"train_loss": -7.271648406982422, "global_step": 204813, "epoch": 4876} {"train_loss": -7.321967601776123, "global_step": 204814, "epoch": 4876} {"train_loss": -7.3513360023498535, "global_step": 204815, "epoch": 4876} {"train_loss": -7.295742034912109, "global_step": 204816, "epoch": 4876} {"train_loss": -7.281694412231445, "global_step": 204817, "epoch": 4876} {"train_loss": -7.273883819580078, "global_step": 204818, "epoch": 4876} {"train_loss": -7.256636619567871, "global_step": 204819, "epoch": 4876} {"train_loss": -7.321657657623291, "global_step": 204820, "epoch": 4876} {"train_loss": -7.2955217361450195, "global_step": 204821, "epoch": 4876} {"train_loss": -7.166690826416016, "global_step": 204822, "epoch": 4876} {"train_loss": -7.320347785949707, "global_step": 204823, "epoch": 4876} {"train_loss": -7.286806583404541, "global_step": 204824, "epoch": 4876} {"train_loss": -7.259368896484375, "global_step": 204825, "epoch": 4876} {"train_loss": -7.2576398849487305, "global_step": 204826, "epoch": 4876} {"train_loss": -7.201653957366943, "global_step": 204827, "epoch": 4876} {"train_loss": -7.2197065353393555, "global_step": 204828, "epoch": 4876} {"train_loss": -7.171788215637207, "global_step": 204829, "epoch": 4876} {"train_loss": -7.222559452056885, "global_step": 204830, "epoch": 4876} {"train_loss": -7.254987716674805, "global_step": 204831, "epoch": 4876} {"train_loss": -7.293970108032227, "global_step": 204832, "epoch": 4876} {"train_loss": -7.248818874359131, "global_step": 204833, "epoch": 4876, "val_loss": 69388.4921875} {"train_loss": -7.094908714294434, "global_step": 204834, "epoch": 4877} {"train_loss": -7.262018203735352, "global_step": 204835, "epoch": 4877} {"train_loss": -7.213911056518555, "global_step": 204836, "epoch": 4877} {"train_loss": -7.160712242126465, "global_step": 204837, "epoch": 4877} {"train_loss": -7.27279806137085, "global_step": 204838, "epoch": 4877} {"train_loss": -7.223170280456543, "global_step": 204839, "epoch": 4877} {"train_loss": -7.249638557434082, "global_step": 204840, "epoch": 4877} {"train_loss": -7.109009265899658, "global_step": 204841, "epoch": 4877} {"train_loss": -7.164552688598633, "global_step": 204842, "epoch": 4877} {"train_loss": -7.318249225616455, "global_step": 204843, "epoch": 4877} {"train_loss": -7.168384552001953, "global_step": 204844, "epoch": 4877} {"train_loss": -7.1864542961120605, "global_step": 204845, "epoch": 4877} {"train_loss": -7.394597053527832, "global_step": 204846, "epoch": 4877} {"train_loss": -7.157846927642822, "global_step": 204847, "epoch": 4877} {"train_loss": -7.192843914031982, "global_step": 204848, "epoch": 4877} {"train_loss": -7.268513202667236, "global_step": 204849, "epoch": 4877} {"train_loss": -7.227884769439697, "global_step": 204850, "epoch": 4877} {"train_loss": -7.210440158843994, "global_step": 204851, "epoch": 4877} {"train_loss": -7.208791732788086, "global_step": 204852, "epoch": 4877} {"train_loss": -7.228257179260254, "global_step": 204853, "epoch": 4877} {"train_loss": -7.235963821411133, "global_step": 204854, "epoch": 4877} {"train_loss": -7.213239669799805, "global_step": 204855, "epoch": 4877} {"train_loss": -7.253554821014404, "global_step": 204856, "epoch": 4877} {"train_loss": -7.118439674377441, "global_step": 204857, "epoch": 4877} {"train_loss": -7.315212249755859, "global_step": 204858, "epoch": 4877} {"train_loss": -7.319382667541504, "global_step": 204859, "epoch": 4877} {"train_loss": -7.218667030334473, "global_step": 204860, "epoch": 4877} {"train_loss": -7.3073883056640625, "global_step": 204861, "epoch": 4877} {"train_loss": -7.2203779220581055, "global_step": 204862, "epoch": 4877} {"train_loss": -7.204950332641602, "global_step": 204863, "epoch": 4877} {"train_loss": -7.247152328491211, "global_step": 204864, "epoch": 4877} {"train_loss": -7.283700942993164, "global_step": 204865, "epoch": 4877} {"train_loss": -7.403311729431152, "global_step": 204866, "epoch": 4877} {"train_loss": -7.142450332641602, "global_step": 204867, "epoch": 4877} {"train_loss": -7.2135772705078125, "global_step": 204868, "epoch": 4877} {"train_loss": -7.266790390014648, "global_step": 204869, "epoch": 4877} {"train_loss": -7.213741779327393, "global_step": 204870, "epoch": 4877} {"train_loss": -7.2509074211120605, "global_step": 204871, "epoch": 4877} {"train_loss": -7.290034294128418, "global_step": 204872, "epoch": 4877} {"train_loss": -7.218963146209717, "global_step": 204873, "epoch": 4877} {"train_loss": -7.227646827697754, "global_step": 204874, "epoch": 4877} {"train_loss": -7.23367216473534, "global_step": 204875, "epoch": 4877, "val_loss": 69122.03125} {"train_loss": -7.236725807189941, "global_step": 204876, "epoch": 4878} {"train_loss": -7.426950454711914, "global_step": 204877, "epoch": 4878} {"train_loss": -7.3191070556640625, "global_step": 204878, "epoch": 4878} {"train_loss": -7.216716766357422, "global_step": 204879, "epoch": 4878} {"train_loss": -7.271729469299316, "global_step": 204880, "epoch": 4878} {"train_loss": -7.20388126373291, "global_step": 204881, "epoch": 4878} {"train_loss": -7.322610855102539, "global_step": 204882, "epoch": 4878} {"train_loss": -7.300119876861572, "global_step": 204883, "epoch": 4878} {"train_loss": -7.23758602142334, "global_step": 204884, "epoch": 4878} {"train_loss": -7.219635486602783, "global_step": 204885, "epoch": 4878} {"train_loss": -7.288686752319336, "global_step": 204886, "epoch": 4878} {"train_loss": -7.196452617645264, "global_step": 204887, "epoch": 4878} {"train_loss": -7.194729328155518, "global_step": 204888, "epoch": 4878} {"train_loss": -7.305344581604004, "global_step": 204889, "epoch": 4878} {"train_loss": -7.227990627288818, "global_step": 204890, "epoch": 4878} {"train_loss": -7.328363418579102, "global_step": 204891, "epoch": 4878} {"train_loss": -7.3546142578125, "global_step": 204892, "epoch": 4878} {"train_loss": -7.264603137969971, "global_step": 204893, "epoch": 4878} {"train_loss": -7.275179862976074, "global_step": 204894, "epoch": 4878} {"train_loss": -7.301040172576904, "global_step": 204895, "epoch": 4878} {"train_loss": -7.22172737121582, "global_step": 204896, "epoch": 4878} {"train_loss": -7.383496284484863, "global_step": 204897, "epoch": 4878} {"train_loss": -7.339902400970459, "global_step": 204898, "epoch": 4878} {"train_loss": -7.220591068267822, "global_step": 204899, "epoch": 4878} {"train_loss": -7.213568687438965, "global_step": 204900, "epoch": 4878} {"train_loss": -7.335143089294434, "global_step": 204901, "epoch": 4878} {"train_loss": -7.3175225257873535, "global_step": 204902, "epoch": 4878} {"train_loss": -7.35041618347168, "global_step": 204903, "epoch": 4878} {"train_loss": -7.242262840270996, "global_step": 204904, "epoch": 4878} {"train_loss": -7.342617511749268, "global_step": 204905, "epoch": 4878} {"train_loss": -7.396302223205566, "global_step": 204906, "epoch": 4878} {"train_loss": -7.416028022766113, "global_step": 204907, "epoch": 4878} {"train_loss": -7.279878616333008, "global_step": 204908, "epoch": 4878} {"train_loss": -7.303350448608398, "global_step": 204909, "epoch": 4878} {"train_loss": -7.408361911773682, "global_step": 204910, "epoch": 4878} {"train_loss": -7.311275482177734, "global_step": 204911, "epoch": 4878} {"train_loss": -7.350304126739502, "global_step": 204912, "epoch": 4878} {"train_loss": -7.319236755371094, "global_step": 204913, "epoch": 4878} {"train_loss": -7.261609077453613, "global_step": 204914, "epoch": 4878} {"train_loss": -7.246287822723389, "global_step": 204915, "epoch": 4878} {"train_loss": -7.23145866394043, "global_step": 204916, "epoch": 4878} {"train_loss": -7.294158708481562, "global_step": 204917, "epoch": 4878, "val_loss": 69107.078125} {"train_loss": -7.35922908782959, "global_step": 204918, "epoch": 4879} {"train_loss": -7.2068963050842285, "global_step": 204919, "epoch": 4879} {"train_loss": -7.319585800170898, "global_step": 204920, "epoch": 4879} {"train_loss": -7.28365421295166, "global_step": 204921, "epoch": 4879} {"train_loss": -7.423404693603516, "global_step": 204922, "epoch": 4879} {"train_loss": -7.251901626586914, "global_step": 204923, "epoch": 4879} {"train_loss": -7.348796367645264, "global_step": 204924, "epoch": 4879} {"train_loss": -7.2530198097229, "global_step": 204925, "epoch": 4879} {"train_loss": -7.376955986022949, "global_step": 204926, "epoch": 4879} {"train_loss": -7.197728157043457, "global_step": 204927, "epoch": 4879} {"train_loss": -7.309469699859619, "global_step": 204928, "epoch": 4879} {"train_loss": -7.210006237030029, "global_step": 204929, "epoch": 4879} {"train_loss": -7.327389240264893, "global_step": 204930, "epoch": 4879} {"train_loss": -7.3306989669799805, "global_step": 204931, "epoch": 4879} {"train_loss": -7.368965148925781, "global_step": 204932, "epoch": 4879} {"train_loss": -7.294969081878662, "global_step": 204933, "epoch": 4879} {"train_loss": -7.360527038574219, "global_step": 204934, "epoch": 4879} {"train_loss": -7.2992143630981445, "global_step": 204935, "epoch": 4879} {"train_loss": -7.323270320892334, "global_step": 204936, "epoch": 4879} {"train_loss": -7.349134922027588, "global_step": 204937, "epoch": 4879} {"train_loss": -7.083348274230957, "global_step": 204938, "epoch": 4879} {"train_loss": -7.185081958770752, "global_step": 204939, "epoch": 4879} {"train_loss": -7.012650489807129, "global_step": 204940, "epoch": 4879} {"train_loss": -7.257440567016602, "global_step": 204941, "epoch": 4879} {"train_loss": -7.102864742279053, "global_step": 204942, "epoch": 4879} {"train_loss": -7.174165725708008, "global_step": 204943, "epoch": 4879} {"train_loss": -7.237612247467041, "global_step": 204944, "epoch": 4879} {"train_loss": -7.186677932739258, "global_step": 204945, "epoch": 4879} {"train_loss": -7.126896858215332, "global_step": 204946, "epoch": 4879} {"train_loss": -7.106787204742432, "global_step": 204947, "epoch": 4879} {"train_loss": -7.173885345458984, "global_step": 204948, "epoch": 4879} {"train_loss": -7.167363166809082, "global_step": 204949, "epoch": 4879} {"train_loss": -7.076006889343262, "global_step": 204950, "epoch": 4879} {"train_loss": -7.141390800476074, "global_step": 204951, "epoch": 4879} {"train_loss": -7.175623893737793, "global_step": 204952, "epoch": 4879} {"train_loss": -7.215115547180176, "global_step": 204953, "epoch": 4879} {"train_loss": -7.185126781463623, "global_step": 204954, "epoch": 4879} {"train_loss": -7.129973411560059, "global_step": 204955, "epoch": 4879} {"train_loss": -7.136595726013184, "global_step": 204956, "epoch": 4879} {"train_loss": -7.2313666343688965, "global_step": 204957, "epoch": 4879} {"train_loss": -7.247536659240723, "global_step": 204958, "epoch": 4879} {"train_loss": -7.230966772351946, "global_step": 204959, "epoch": 4879, "val_loss": 69295.125} {"train_loss": -7.303244590759277, "global_step": 204960, "epoch": 4880} {"train_loss": -7.196018695831299, "global_step": 204961, "epoch": 4880} {"train_loss": -7.242456436157227, "global_step": 204962, "epoch": 4880} {"train_loss": -7.198448657989502, "global_step": 204963, "epoch": 4880} {"train_loss": -7.21498966217041, "global_step": 204964, "epoch": 4880} {"train_loss": -7.300841331481934, "global_step": 204965, "epoch": 4880} {"train_loss": -7.2976579666137695, "global_step": 204966, "epoch": 4880} {"train_loss": -7.13040018081665, "global_step": 204967, "epoch": 4880} {"train_loss": -7.19194221496582, "global_step": 204968, "epoch": 4880} {"train_loss": -7.193155288696289, "global_step": 204969, "epoch": 4880} {"train_loss": -7.340993881225586, "global_step": 204970, "epoch": 4880} {"train_loss": -7.168093681335449, "global_step": 204971, "epoch": 4880} {"train_loss": -7.153487205505371, "global_step": 204972, "epoch": 4880} {"train_loss": -7.232504844665527, "global_step": 204973, "epoch": 4880} {"train_loss": -7.3190813064575195, "global_step": 204974, "epoch": 4880} {"train_loss": -7.181828022003174, "global_step": 204975, "epoch": 4880} {"train_loss": -7.210287094116211, "global_step": 204976, "epoch": 4880} {"train_loss": -7.277248382568359, "global_step": 204977, "epoch": 4880} {"train_loss": -7.356014251708984, "global_step": 204978, "epoch": 4880} {"train_loss": -7.388932228088379, "global_step": 204979, "epoch": 4880} {"train_loss": -7.2283172607421875, "global_step": 204980, "epoch": 4880} {"train_loss": -7.245208740234375, "global_step": 204981, "epoch": 4880} {"train_loss": -7.266839027404785, "global_step": 204982, "epoch": 4880} {"train_loss": -7.317879676818848, "global_step": 204983, "epoch": 4880} {"train_loss": -7.330574035644531, "global_step": 204984, "epoch": 4880} {"train_loss": -7.113526344299316, "global_step": 204985, "epoch": 4880} {"train_loss": -7.393794059753418, "global_step": 204986, "epoch": 4880} {"train_loss": -7.346200942993164, "global_step": 204987, "epoch": 4880} {"train_loss": -7.217106819152832, "global_step": 204988, "epoch": 4880} {"train_loss": -7.18230676651001, "global_step": 204989, "epoch": 4880} {"train_loss": -7.256600379943848, "global_step": 204990, "epoch": 4880} {"train_loss": -7.194938659667969, "global_step": 204991, "epoch": 4880} {"train_loss": -7.258072853088379, "global_step": 204992, "epoch": 4880} {"train_loss": -7.215275287628174, "global_step": 204993, "epoch": 4880} {"train_loss": -7.266055107116699, "global_step": 204994, "epoch": 4880} {"train_loss": -7.291999816894531, "global_step": 204995, "epoch": 4880} {"train_loss": -7.345088005065918, "global_step": 204996, "epoch": 4880} {"train_loss": -7.307435512542725, "global_step": 204997, "epoch": 4880} {"train_loss": -7.225162982940674, "global_step": 204998, "epoch": 4880} {"train_loss": -7.390195846557617, "global_step": 204999, "epoch": 4880} {"train_loss": -7.325414657592773, "global_step": 205000, "epoch": 4880} {"train_loss": -7.259088595708211, "global_step": 205001, "epoch": 4880, "val_loss": 69054.1640625} {"train_loss": -7.286433219909668, "global_step": 205002, "epoch": 4881} {"train_loss": -7.258601188659668, "global_step": 205003, "epoch": 4881} {"train_loss": -7.2957963943481445, "global_step": 205004, "epoch": 4881} {"train_loss": -7.382269382476807, "global_step": 205005, "epoch": 4881} {"train_loss": -7.2915940284729, "global_step": 205006, "epoch": 4881} {"train_loss": -7.313567161560059, "global_step": 205007, "epoch": 4881} {"train_loss": -7.294474124908447, "global_step": 205008, "epoch": 4881} {"train_loss": -7.123984336853027, "global_step": 205009, "epoch": 4881} {"train_loss": -7.15164041519165, "global_step": 205010, "epoch": 4881} {"train_loss": -7.290516376495361, "global_step": 205011, "epoch": 4881} {"train_loss": -7.26024055480957, "global_step": 205012, "epoch": 4881} {"train_loss": -7.3622026443481445, "global_step": 205013, "epoch": 4881} {"train_loss": -7.185768127441406, "global_step": 205014, "epoch": 4881} {"train_loss": -7.262428283691406, "global_step": 205015, "epoch": 4881} {"train_loss": -7.337454319000244, "global_step": 205016, "epoch": 4881} {"train_loss": -7.282926082611084, "global_step": 205017, "epoch": 4881} {"train_loss": -7.10015344619751, "global_step": 205018, "epoch": 4881} {"train_loss": -7.334683418273926, "global_step": 205019, "epoch": 4881} {"train_loss": -7.299869537353516, "global_step": 205020, "epoch": 4881} {"train_loss": -7.270986557006836, "global_step": 205021, "epoch": 4881} {"train_loss": -7.3724822998046875, "global_step": 205022, "epoch": 4881} {"train_loss": -7.281514644622803, "global_step": 205023, "epoch": 4881} {"train_loss": -7.372154235839844, "global_step": 205024, "epoch": 4881} {"train_loss": -7.322566509246826, "global_step": 205025, "epoch": 4881} {"train_loss": -7.204480171203613, "global_step": 205026, "epoch": 4881} {"train_loss": -7.170720100402832, "global_step": 205027, "epoch": 4881} {"train_loss": -7.148284912109375, "global_step": 205028, "epoch": 4881} {"train_loss": -7.2700653076171875, "global_step": 205029, "epoch": 4881} {"train_loss": -7.269777774810791, "global_step": 205030, "epoch": 4881} {"train_loss": -7.251898765563965, "global_step": 205031, "epoch": 4881} {"train_loss": -7.276825428009033, "global_step": 205032, "epoch": 4881} {"train_loss": -7.331830978393555, "global_step": 205033, "epoch": 4881} {"train_loss": -7.168129920959473, "global_step": 205034, "epoch": 4881} {"train_loss": -7.302140235900879, "global_step": 205035, "epoch": 4881} {"train_loss": -7.2777485847473145, "global_step": 205036, "epoch": 4881} {"train_loss": -7.221083164215088, "global_step": 205037, "epoch": 4881} {"train_loss": -7.257089614868164, "global_step": 205038, "epoch": 4881} {"train_loss": -7.110597610473633, "global_step": 205039, "epoch": 4881} {"train_loss": -7.04914665222168, "global_step": 205040, "epoch": 4881} {"train_loss": -7.199007034301758, "global_step": 205041, "epoch": 4881} {"train_loss": -7.160433769226074, "global_step": 205042, "epoch": 4881} {"train_loss": -7.2460365408942815, "global_step": 205043, "epoch": 4881, "val_loss": 69055.5078125} {"train_loss": -7.205888748168945, "global_step": 205044, "epoch": 4882} {"train_loss": -7.036139011383057, "global_step": 205045, "epoch": 4882} {"train_loss": -7.151421546936035, "global_step": 205046, "epoch": 4882} {"train_loss": -7.185826778411865, "global_step": 205047, "epoch": 4882} {"train_loss": -7.164374351501465, "global_step": 205048, "epoch": 4882} {"train_loss": -7.272885322570801, "global_step": 205049, "epoch": 4882} {"train_loss": -7.042446136474609, "global_step": 205050, "epoch": 4882} {"train_loss": -7.15014123916626, "global_step": 205051, "epoch": 4882} {"train_loss": -7.099700927734375, "global_step": 205052, "epoch": 4882} {"train_loss": -7.206636428833008, "global_step": 205053, "epoch": 4882} {"train_loss": -7.255638599395752, "global_step": 205054, "epoch": 4882} {"train_loss": -7.1243696212768555, "global_step": 205055, "epoch": 4882} {"train_loss": -7.212840557098389, "global_step": 205056, "epoch": 4882} {"train_loss": -7.2113847732543945, "global_step": 205057, "epoch": 4882} {"train_loss": -7.187995910644531, "global_step": 205058, "epoch": 4882} {"train_loss": -7.163256645202637, "global_step": 205059, "epoch": 4882} {"train_loss": -7.302355766296387, "global_step": 205060, "epoch": 4882} {"train_loss": -7.247829437255859, "global_step": 205061, "epoch": 4882} {"train_loss": -7.315035820007324, "global_step": 205062, "epoch": 4882} {"train_loss": -7.282888412475586, "global_step": 205063, "epoch": 4882} {"train_loss": -7.201852798461914, "global_step": 205064, "epoch": 4882} {"train_loss": -7.330218315124512, "global_step": 205065, "epoch": 4882} {"train_loss": -7.240250587463379, "global_step": 205066, "epoch": 4882} {"train_loss": -7.285523414611816, "global_step": 205067, "epoch": 4882} {"train_loss": -7.267790794372559, "global_step": 205068, "epoch": 4882} {"train_loss": -7.259354114532471, "global_step": 205069, "epoch": 4882} {"train_loss": -7.319247245788574, "global_step": 205070, "epoch": 4882} {"train_loss": -7.383336067199707, "global_step": 205071, "epoch": 4882} {"train_loss": -7.328160285949707, "global_step": 205072, "epoch": 4882} {"train_loss": -7.331815719604492, "global_step": 205073, "epoch": 4882} {"train_loss": -7.2462921142578125, "global_step": 205074, "epoch": 4882} {"train_loss": -7.255146503448486, "global_step": 205075, "epoch": 4882} {"train_loss": -7.291166305541992, "global_step": 205076, "epoch": 4882} {"train_loss": -7.35634708404541, "global_step": 205077, "epoch": 4882} {"train_loss": -7.411408424377441, "global_step": 205078, "epoch": 4882} {"train_loss": -7.363914966583252, "global_step": 205079, "epoch": 4882} {"train_loss": -7.344604969024658, "global_step": 205080, "epoch": 4882} {"train_loss": -7.355170249938965, "global_step": 205081, "epoch": 4882} {"train_loss": -7.343286514282227, "global_step": 205082, "epoch": 4882} {"train_loss": -7.312210559844971, "global_step": 205083, "epoch": 4882} {"train_loss": -7.282578945159912, "global_step": 205084, "epoch": 4882} {"train_loss": -7.256568692979359, "global_step": 205085, "epoch": 4882, "val_loss": 69117.7890625} {"train_loss": -7.3390045166015625, "global_step": 205086, "epoch": 4883} {"train_loss": -7.307154178619385, "global_step": 205087, "epoch": 4883} {"train_loss": -7.269815444946289, "global_step": 205088, "epoch": 4883} {"train_loss": -7.384451866149902, "global_step": 205089, "epoch": 4883} {"train_loss": -7.326748371124268, "global_step": 205090, "epoch": 4883} {"train_loss": -7.314060211181641, "global_step": 205091, "epoch": 4883} {"train_loss": -7.326555252075195, "global_step": 205092, "epoch": 4883} {"train_loss": -7.3742828369140625, "global_step": 205093, "epoch": 4883} {"train_loss": -7.3517303466796875, "global_step": 205094, "epoch": 4883} {"train_loss": -7.297186374664307, "global_step": 205095, "epoch": 4883} {"train_loss": -7.243636131286621, "global_step": 205096, "epoch": 4883} {"train_loss": -7.2900495529174805, "global_step": 205097, "epoch": 4883} {"train_loss": -7.36615514755249, "global_step": 205098, "epoch": 4883} {"train_loss": -7.280998229980469, "global_step": 205099, "epoch": 4883} {"train_loss": -7.351377010345459, "global_step": 205100, "epoch": 4883} {"train_loss": -7.418857574462891, "global_step": 205101, "epoch": 4883} {"train_loss": -7.428403854370117, "global_step": 205102, "epoch": 4883} {"train_loss": -7.33149528503418, "global_step": 205103, "epoch": 4883} {"train_loss": -7.406190872192383, "global_step": 205104, "epoch": 4883} {"train_loss": -7.4145073890686035, "global_step": 205105, "epoch": 4883} {"train_loss": -7.329744338989258, "global_step": 205106, "epoch": 4883} {"train_loss": -7.243390083312988, "global_step": 205107, "epoch": 4883} {"train_loss": -7.3487443923950195, "global_step": 205108, "epoch": 4883} {"train_loss": -7.303898811340332, "global_step": 205109, "epoch": 4883} {"train_loss": -7.295328140258789, "global_step": 205110, "epoch": 4883} {"train_loss": -7.435085296630859, "global_step": 205111, "epoch": 4883} {"train_loss": -7.371674537658691, "global_step": 205112, "epoch": 4883} {"train_loss": -7.2668843269348145, "global_step": 205113, "epoch": 4883} {"train_loss": -7.18871545791626, "global_step": 205114, "epoch": 4883} {"train_loss": -7.269104480743408, "global_step": 205115, "epoch": 4883} {"train_loss": -7.144274711608887, "global_step": 205116, "epoch": 4883} {"train_loss": -7.42056941986084, "global_step": 205117, "epoch": 4883} {"train_loss": -7.203166484832764, "global_step": 205118, "epoch": 4883} {"train_loss": -7.225400924682617, "global_step": 205119, "epoch": 4883} {"train_loss": -7.2779130935668945, "global_step": 205120, "epoch": 4883} {"train_loss": -7.307095050811768, "global_step": 205121, "epoch": 4883} {"train_loss": -7.1382904052734375, "global_step": 205122, "epoch": 4883} {"train_loss": -7.2316484451293945, "global_step": 205123, "epoch": 4883} {"train_loss": -7.252620220184326, "global_step": 205124, "epoch": 4883} {"train_loss": -7.2202653884887695, "global_step": 205125, "epoch": 4883} {"train_loss": -7.166226863861084, "global_step": 205126, "epoch": 4883} {"train_loss": -7.301421506064279, "global_step": 205127, "epoch": 4883, "val_loss": 69209.625} {"train_loss": -7.313962459564209, "global_step": 205128, "epoch": 4884} {"train_loss": -7.263777732849121, "global_step": 205129, "epoch": 4884} {"train_loss": -7.235655784606934, "global_step": 205130, "epoch": 4884} {"train_loss": -7.3046369552612305, "global_step": 205131, "epoch": 4884} {"train_loss": -7.313108921051025, "global_step": 205132, "epoch": 4884} {"train_loss": -7.298691749572754, "global_step": 205133, "epoch": 4884} {"train_loss": -7.291240692138672, "global_step": 205134, "epoch": 4884} {"train_loss": -7.273980140686035, "global_step": 205135, "epoch": 4884} {"train_loss": -7.39210319519043, "global_step": 205136, "epoch": 4884} {"train_loss": -7.367342948913574, "global_step": 205137, "epoch": 4884} {"train_loss": -7.317431449890137, "global_step": 205138, "epoch": 4884} {"train_loss": -7.472448825836182, "global_step": 205139, "epoch": 4884} {"train_loss": -7.0640668869018555, "global_step": 205140, "epoch": 4884} {"train_loss": -7.1300458908081055, "global_step": 205141, "epoch": 4884} {"train_loss": -7.357921600341797, "global_step": 205142, "epoch": 4884} {"train_loss": -7.229922294616699, "global_step": 205143, "epoch": 4884} {"train_loss": -7.174993515014648, "global_step": 205144, "epoch": 4884} {"train_loss": -7.288116455078125, "global_step": 205145, "epoch": 4884} {"train_loss": -7.20822811126709, "global_step": 205146, "epoch": 4884} {"train_loss": -7.098785400390625, "global_step": 205147, "epoch": 4884} {"train_loss": -7.255650043487549, "global_step": 205148, "epoch": 4884} {"train_loss": -7.205650806427002, "global_step": 205149, "epoch": 4884} {"train_loss": -6.996782302856445, "global_step": 205150, "epoch": 4884} {"train_loss": -7.268265247344971, "global_step": 205151, "epoch": 4884} {"train_loss": -7.123225688934326, "global_step": 205152, "epoch": 4884} {"train_loss": -7.087950706481934, "global_step": 205153, "epoch": 4884} {"train_loss": -7.175755977630615, "global_step": 205154, "epoch": 4884} {"train_loss": -7.173483848571777, "global_step": 205155, "epoch": 4884} {"train_loss": -7.267329216003418, "global_step": 205156, "epoch": 4884} {"train_loss": -7.0961151123046875, "global_step": 205157, "epoch": 4884} {"train_loss": -7.07650089263916, "global_step": 205158, "epoch": 4884} {"train_loss": -7.124524116516113, "global_step": 205159, "epoch": 4884} {"train_loss": -7.060966491699219, "global_step": 205160, "epoch": 4884} {"train_loss": -7.236543655395508, "global_step": 205161, "epoch": 4884} {"train_loss": -7.0459160804748535, "global_step": 205162, "epoch": 4884} {"train_loss": -7.202621936798096, "global_step": 205163, "epoch": 4884} {"train_loss": -7.2261152267456055, "global_step": 205164, "epoch": 4884} {"train_loss": -7.092159271240234, "global_step": 205165, "epoch": 4884} {"train_loss": -7.227415084838867, "global_step": 205166, "epoch": 4884} {"train_loss": -7.232259750366211, "global_step": 205167, "epoch": 4884} {"train_loss": -7.27018404006958, "global_step": 205168, "epoch": 4884} {"train_loss": -7.218498116447812, "global_step": 205169, "epoch": 4884, "val_loss": 69266.390625} {"train_loss": -7.153946876525879, "global_step": 205170, "epoch": 4885} {"train_loss": -7.194109916687012, "global_step": 205171, "epoch": 4885} {"train_loss": -7.252880096435547, "global_step": 205172, "epoch": 4885} {"train_loss": -7.315241813659668, "global_step": 205173, "epoch": 4885} {"train_loss": -7.23335075378418, "global_step": 205174, "epoch": 4885} {"train_loss": -7.20847225189209, "global_step": 205175, "epoch": 4885} {"train_loss": -7.344804286956787, "global_step": 205176, "epoch": 4885} {"train_loss": -7.21274471282959, "global_step": 205177, "epoch": 4885} {"train_loss": -7.275187969207764, "global_step": 205178, "epoch": 4885} {"train_loss": -7.1841230392456055, "global_step": 205179, "epoch": 4885} {"train_loss": -7.267096519470215, "global_step": 205180, "epoch": 4885} {"train_loss": -7.356620788574219, "global_step": 205181, "epoch": 4885} {"train_loss": -7.24724817276001, "global_step": 205182, "epoch": 4885} {"train_loss": -7.311872959136963, "global_step": 205183, "epoch": 4885} {"train_loss": -7.220259189605713, "global_step": 205184, "epoch": 4885} {"train_loss": -7.204297065734863, "global_step": 205185, "epoch": 4885} {"train_loss": -7.3324456214904785, "global_step": 205186, "epoch": 4885} {"train_loss": -7.3010759353637695, "global_step": 205187, "epoch": 4885} {"train_loss": -7.180678367614746, "global_step": 205188, "epoch": 4885} {"train_loss": -7.378253936767578, "global_step": 205189, "epoch": 4885} {"train_loss": -7.305002212524414, "global_step": 205190, "epoch": 4885} {"train_loss": -7.151230812072754, "global_step": 205191, "epoch": 4885} {"train_loss": -7.302830696105957, "global_step": 205192, "epoch": 4885} {"train_loss": -7.3100810050964355, "global_step": 205193, "epoch": 4885} {"train_loss": -7.274741172790527, "global_step": 205194, "epoch": 4885} {"train_loss": -7.379895210266113, "global_step": 205195, "epoch": 4885} {"train_loss": -7.290683746337891, "global_step": 205196, "epoch": 4885} {"train_loss": -7.447859287261963, "global_step": 205197, "epoch": 4885} {"train_loss": -7.291074752807617, "global_step": 205198, "epoch": 4885} {"train_loss": -7.309751987457275, "global_step": 205199, "epoch": 4885} {"train_loss": -7.3571672439575195, "global_step": 205200, "epoch": 4885} {"train_loss": -7.357035160064697, "global_step": 205201, "epoch": 4885} {"train_loss": -7.227808952331543, "global_step": 205202, "epoch": 4885} {"train_loss": -7.375901222229004, "global_step": 205203, "epoch": 4885} {"train_loss": -7.297557830810547, "global_step": 205204, "epoch": 4885} {"train_loss": -7.346892356872559, "global_step": 205205, "epoch": 4885} {"train_loss": -7.271556377410889, "global_step": 205206, "epoch": 4885} {"train_loss": -7.250409126281738, "global_step": 205207, "epoch": 4885} {"train_loss": -7.304720401763916, "global_step": 205208, "epoch": 4885} {"train_loss": -7.204197883605957, "global_step": 205209, "epoch": 4885} {"train_loss": -7.186640739440918, "global_step": 205210, "epoch": 4885} {"train_loss": -7.278611080987113, "global_step": 205211, "epoch": 4885, "val_loss": 69169.71875} {"train_loss": -7.328994274139404, "global_step": 205212, "epoch": 4886} {"train_loss": -7.222295761108398, "global_step": 205213, "epoch": 4886} {"train_loss": -7.402687072753906, "global_step": 205214, "epoch": 4886} {"train_loss": -7.40471887588501, "global_step": 205215, "epoch": 4886} {"train_loss": -7.254292964935303, "global_step": 205216, "epoch": 4886} {"train_loss": -7.236567497253418, "global_step": 205217, "epoch": 4886} {"train_loss": -7.0958733558654785, "global_step": 205218, "epoch": 4886} {"train_loss": -7.194417953491211, "global_step": 205219, "epoch": 4886} {"train_loss": -7.2836809158325195, "global_step": 205220, "epoch": 4886} {"train_loss": -7.298065185546875, "global_step": 205221, "epoch": 4886} {"train_loss": -7.424394607543945, "global_step": 205222, "epoch": 4886} {"train_loss": -7.246738433837891, "global_step": 205223, "epoch": 4886} {"train_loss": -7.325777530670166, "global_step": 205224, "epoch": 4886} {"train_loss": -7.232860565185547, "global_step": 205225, "epoch": 4886} {"train_loss": -7.30920934677124, "global_step": 205226, "epoch": 4886} {"train_loss": -7.404008865356445, "global_step": 205227, "epoch": 4886} {"train_loss": -7.210565567016602, "global_step": 205228, "epoch": 4886} {"train_loss": -7.20560359954834, "global_step": 205229, "epoch": 4886} {"train_loss": -7.22390079498291, "global_step": 205230, "epoch": 4886} {"train_loss": -7.123106956481934, "global_step": 205231, "epoch": 4886} {"train_loss": -7.144750595092773, "global_step": 205232, "epoch": 4886} {"train_loss": -7.186535835266113, "global_step": 205233, "epoch": 4886} {"train_loss": -7.285459041595459, "global_step": 205234, "epoch": 4886} {"train_loss": -7.1920905113220215, "global_step": 205235, "epoch": 4886} {"train_loss": -7.3690266609191895, "global_step": 205236, "epoch": 4886} {"train_loss": -7.132382392883301, "global_step": 205237, "epoch": 4886} {"train_loss": -7.274744033813477, "global_step": 205238, "epoch": 4886} {"train_loss": -7.331667423248291, "global_step": 205239, "epoch": 4886} {"train_loss": -7.2811384201049805, "global_step": 205240, "epoch": 4886} {"train_loss": -7.254340171813965, "global_step": 205241, "epoch": 4886} {"train_loss": -7.313432693481445, "global_step": 205242, "epoch": 4886} {"train_loss": -7.319415092468262, "global_step": 205243, "epoch": 4886} {"train_loss": -7.214178562164307, "global_step": 205244, "epoch": 4886} {"train_loss": -7.344465255737305, "global_step": 205245, "epoch": 4886} {"train_loss": -7.197718143463135, "global_step": 205246, "epoch": 4886} {"train_loss": -7.304689407348633, "global_step": 205247, "epoch": 4886} {"train_loss": -7.202892303466797, "global_step": 205248, "epoch": 4886} {"train_loss": -7.224859237670898, "global_step": 205249, "epoch": 4886} {"train_loss": -7.14450740814209, "global_step": 205250, "epoch": 4886} {"train_loss": -7.281660079956055, "global_step": 205251, "epoch": 4886} {"train_loss": -7.251237869262695, "global_step": 205252, "epoch": 4886} {"train_loss": -7.260695775349935, "global_step": 205253, "epoch": 4886, "val_loss": 69152.5703125} {"train_loss": -7.227409362792969, "global_step": 205254, "epoch": 4887} {"train_loss": -7.2910943031311035, "global_step": 205255, "epoch": 4887} {"train_loss": -7.172191619873047, "global_step": 205256, "epoch": 4887} {"train_loss": -7.154152870178223, "global_step": 205257, "epoch": 4887} {"train_loss": -7.264263153076172, "global_step": 205258, "epoch": 4887} {"train_loss": -7.318180084228516, "global_step": 205259, "epoch": 4887} {"train_loss": -7.267858028411865, "global_step": 205260, "epoch": 4887} {"train_loss": -7.342626571655273, "global_step": 205261, "epoch": 4887} {"train_loss": -7.176361083984375, "global_step": 205262, "epoch": 4887} {"train_loss": -7.245026111602783, "global_step": 205263, "epoch": 4887} {"train_loss": -7.17466926574707, "global_step": 205264, "epoch": 4887} {"train_loss": -7.311525821685791, "global_step": 205265, "epoch": 4887} {"train_loss": -7.343487739562988, "global_step": 205266, "epoch": 4887} {"train_loss": -7.2059431076049805, "global_step": 205267, "epoch": 4887} {"train_loss": -7.261038780212402, "global_step": 205268, "epoch": 4887} {"train_loss": -7.290170669555664, "global_step": 205269, "epoch": 4887} {"train_loss": -7.2731523513793945, "global_step": 205270, "epoch": 4887} {"train_loss": -7.259653091430664, "global_step": 205271, "epoch": 4887} {"train_loss": -7.131801605224609, "global_step": 205272, "epoch": 4887} {"train_loss": -7.417301654815674, "global_step": 205273, "epoch": 4887} {"train_loss": -7.219203472137451, "global_step": 205274, "epoch": 4887} {"train_loss": -7.221304893493652, "global_step": 205275, "epoch": 4887} {"train_loss": -7.2130937576293945, "global_step": 205276, "epoch": 4887} {"train_loss": -7.363542079925537, "global_step": 205277, "epoch": 4887} {"train_loss": -7.341924667358398, "global_step": 205278, "epoch": 4887} {"train_loss": -7.214075088500977, "global_step": 205279, "epoch": 4887} {"train_loss": -7.264280796051025, "global_step": 205280, "epoch": 4887} {"train_loss": -7.304506778717041, "global_step": 205281, "epoch": 4887} {"train_loss": -7.160782814025879, "global_step": 205282, "epoch": 4887} {"train_loss": -7.235727310180664, "global_step": 205283, "epoch": 4887} {"train_loss": -7.308421611785889, "global_step": 205284, "epoch": 4887} {"train_loss": -7.239411354064941, "global_step": 205285, "epoch": 4887} {"train_loss": -7.286935806274414, "global_step": 205286, "epoch": 4887} {"train_loss": -7.215962886810303, "global_step": 205287, "epoch": 4887} {"train_loss": -7.313615322113037, "global_step": 205288, "epoch": 4887} {"train_loss": -7.206024169921875, "global_step": 205289, "epoch": 4887} {"train_loss": -7.380504131317139, "global_step": 205290, "epoch": 4887} {"train_loss": -7.319337844848633, "global_step": 205291, "epoch": 4887} {"train_loss": -7.28096866607666, "global_step": 205292, "epoch": 4887} {"train_loss": -7.281408309936523, "global_step": 205293, "epoch": 4887} {"train_loss": -7.300077438354492, "global_step": 205294, "epoch": 4887} {"train_loss": -7.263229540416172, "global_step": 205295, "epoch": 4887, "val_loss": 69274.7109375} {"train_loss": -7.3307647705078125, "global_step": 205296, "epoch": 4888} {"train_loss": -7.220498085021973, "global_step": 205297, "epoch": 4888} {"train_loss": -7.290426254272461, "global_step": 205298, "epoch": 4888} {"train_loss": -7.352563381195068, "global_step": 205299, "epoch": 4888} {"train_loss": -7.235454559326172, "global_step": 205300, "epoch": 4888} {"train_loss": -7.166753768920898, "global_step": 205301, "epoch": 4888} {"train_loss": -7.138302803039551, "global_step": 205302, "epoch": 4888} {"train_loss": -7.251558303833008, "global_step": 205303, "epoch": 4888} {"train_loss": -7.305592060089111, "global_step": 205304, "epoch": 4888} {"train_loss": -7.169247150421143, "global_step": 205305, "epoch": 4888} {"train_loss": -7.1784281730651855, "global_step": 205306, "epoch": 4888} {"train_loss": -7.231145858764648, "global_step": 205307, "epoch": 4888} {"train_loss": -7.077325820922852, "global_step": 205308, "epoch": 4888} {"train_loss": -7.176548480987549, "global_step": 205309, "epoch": 4888} {"train_loss": -7.108145713806152, "global_step": 205310, "epoch": 4888} {"train_loss": -7.131150245666504, "global_step": 205311, "epoch": 4888} {"train_loss": -7.217181205749512, "global_step": 205312, "epoch": 4888} {"train_loss": -7.032052040100098, "global_step": 205313, "epoch": 4888} {"train_loss": -7.115489959716797, "global_step": 205314, "epoch": 4888} {"train_loss": -7.165630340576172, "global_step": 205315, "epoch": 4888} {"train_loss": -7.145153045654297, "global_step": 205316, "epoch": 4888} {"train_loss": -7.282374382019043, "global_step": 205317, "epoch": 4888} {"train_loss": -7.24722957611084, "global_step": 205318, "epoch": 4888} {"train_loss": -7.124964714050293, "global_step": 205319, "epoch": 4888} {"train_loss": -7.175625801086426, "global_step": 205320, "epoch": 4888} {"train_loss": -7.207639694213867, "global_step": 205321, "epoch": 4888} {"train_loss": -7.058479309082031, "global_step": 205322, "epoch": 4888} {"train_loss": -7.268848896026611, "global_step": 205323, "epoch": 4888} {"train_loss": -7.10752534866333, "global_step": 205324, "epoch": 4888} {"train_loss": -7.215350151062012, "global_step": 205325, "epoch": 4888} {"train_loss": -7.140711307525635, "global_step": 205326, "epoch": 4888} {"train_loss": -7.171095371246338, "global_step": 205327, "epoch": 4888} {"train_loss": -7.090813636779785, "global_step": 205328, "epoch": 4888} {"train_loss": -7.164109230041504, "global_step": 205329, "epoch": 4888} {"train_loss": -7.168245315551758, "global_step": 205330, "epoch": 4888} {"train_loss": -7.159686088562012, "global_step": 205331, "epoch": 4888} {"train_loss": -7.130722999572754, "global_step": 205332, "epoch": 4888} {"train_loss": -7.1402764320373535, "global_step": 205333, "epoch": 4888} {"train_loss": -7.178370475769043, "global_step": 205334, "epoch": 4888} {"train_loss": -7.300497055053711, "global_step": 205335, "epoch": 4888} {"train_loss": -7.23075532913208, "global_step": 205336, "epoch": 4888} {"train_loss": -7.185605594090053, "global_step": 205337, "epoch": 4888, "val_loss": 69012.75} {"train_loss": -7.218719959259033, "global_step": 205338, "epoch": 4889} {"train_loss": -7.353157043457031, "global_step": 205339, "epoch": 4889} {"train_loss": -7.140098571777344, "global_step": 205340, "epoch": 4889} {"train_loss": -7.307830810546875, "global_step": 205341, "epoch": 4889} {"train_loss": -7.2800679206848145, "global_step": 205342, "epoch": 4889} {"train_loss": -7.177081108093262, "global_step": 205343, "epoch": 4889} {"train_loss": -7.227815628051758, "global_step": 205344, "epoch": 4889} {"train_loss": -7.300241470336914, "global_step": 205345, "epoch": 4889} {"train_loss": -7.310879230499268, "global_step": 205346, "epoch": 4889} {"train_loss": -7.263811111450195, "global_step": 205347, "epoch": 4889} {"train_loss": -7.258431911468506, "global_step": 205348, "epoch": 4889} {"train_loss": -7.290236473083496, "global_step": 205349, "epoch": 4889} {"train_loss": -7.238308429718018, "global_step": 205350, "epoch": 4889} {"train_loss": -7.294361114501953, "global_step": 205351, "epoch": 4889} {"train_loss": -7.257884979248047, "global_step": 205352, "epoch": 4889} {"train_loss": -7.286880016326904, "global_step": 205353, "epoch": 4889} {"train_loss": -7.325474739074707, "global_step": 205354, "epoch": 4889} {"train_loss": -7.278622150421143, "global_step": 205355, "epoch": 4889} {"train_loss": -7.274973392486572, "global_step": 205356, "epoch": 4889} {"train_loss": -7.364213943481445, "global_step": 205357, "epoch": 4889} {"train_loss": -7.2507643699646, "global_step": 205358, "epoch": 4889} {"train_loss": -7.404286861419678, "global_step": 205359, "epoch": 4889} {"train_loss": -7.1798553466796875, "global_step": 205360, "epoch": 4889} {"train_loss": -7.329533576965332, "global_step": 205361, "epoch": 4889} {"train_loss": -7.123968124389648, "global_step": 205362, "epoch": 4889} {"train_loss": -7.146912574768066, "global_step": 205363, "epoch": 4889} {"train_loss": -7.245964050292969, "global_step": 205364, "epoch": 4889} {"train_loss": -7.164203643798828, "global_step": 205365, "epoch": 4889} {"train_loss": -7.269804000854492, "global_step": 205366, "epoch": 4889} {"train_loss": -7.306636810302734, "global_step": 205367, "epoch": 4889} {"train_loss": -7.113823413848877, "global_step": 205368, "epoch": 4889} {"train_loss": -7.220372200012207, "global_step": 205369, "epoch": 4889} {"train_loss": -7.230153560638428, "global_step": 205370, "epoch": 4889} {"train_loss": -7.1648759841918945, "global_step": 205371, "epoch": 4889} {"train_loss": -7.285606861114502, "global_step": 205372, "epoch": 4889} {"train_loss": -7.208020210266113, "global_step": 205373, "epoch": 4889} {"train_loss": -7.204787254333496, "global_step": 205374, "epoch": 4889} {"train_loss": -7.281246662139893, "global_step": 205375, "epoch": 4889} {"train_loss": -7.2354888916015625, "global_step": 205376, "epoch": 4889} {"train_loss": -7.159951210021973, "global_step": 205377, "epoch": 4889} {"train_loss": -7.126529693603516, "global_step": 205378, "epoch": 4889} {"train_loss": -7.2451617150079635, "global_step": 205379, "epoch": 4889, "val_loss": 69209.2109375} {"train_loss": -7.173314571380615, "global_step": 205380, "epoch": 4890} {"train_loss": -7.270569801330566, "global_step": 205381, "epoch": 4890} {"train_loss": -7.263810634613037, "global_step": 205382, "epoch": 4890} {"train_loss": -7.117040157318115, "global_step": 205383, "epoch": 4890} {"train_loss": -7.272839069366455, "global_step": 205384, "epoch": 4890} {"train_loss": -7.196319580078125, "global_step": 205385, "epoch": 4890} {"train_loss": -7.23113489151001, "global_step": 205386, "epoch": 4890} {"train_loss": -7.239144325256348, "global_step": 205387, "epoch": 4890} {"train_loss": -7.260656356811523, "global_step": 205388, "epoch": 4890} {"train_loss": -7.341843128204346, "global_step": 205389, "epoch": 4890} {"train_loss": -7.187544345855713, "global_step": 205390, "epoch": 4890} {"train_loss": -7.241326332092285, "global_step": 205391, "epoch": 4890} {"train_loss": -7.224808216094971, "global_step": 205392, "epoch": 4890} {"train_loss": -7.212729454040527, "global_step": 205393, "epoch": 4890} {"train_loss": -7.329722881317139, "global_step": 205394, "epoch": 4890} {"train_loss": -7.159494400024414, "global_step": 205395, "epoch": 4890} {"train_loss": -7.213937282562256, "global_step": 205396, "epoch": 4890} {"train_loss": -7.164496421813965, "global_step": 205397, "epoch": 4890} {"train_loss": -7.283535003662109, "global_step": 205398, "epoch": 4890} {"train_loss": -7.295055866241455, "global_step": 205399, "epoch": 4890} {"train_loss": -7.262645721435547, "global_step": 205400, "epoch": 4890} {"train_loss": -7.224944114685059, "global_step": 205401, "epoch": 4890} {"train_loss": -7.257073879241943, "global_step": 205402, "epoch": 4890} {"train_loss": -7.464805603027344, "global_step": 205403, "epoch": 4890} {"train_loss": -7.241423606872559, "global_step": 205404, "epoch": 4890} {"train_loss": -7.297104358673096, "global_step": 205405, "epoch": 4890} {"train_loss": -7.280363082885742, "global_step": 205406, "epoch": 4890} {"train_loss": -7.255367755889893, "global_step": 205407, "epoch": 4890} {"train_loss": -7.316494941711426, "global_step": 205408, "epoch": 4890} {"train_loss": -7.338934898376465, "global_step": 205409, "epoch": 4890} {"train_loss": -7.347209930419922, "global_step": 205410, "epoch": 4890} {"train_loss": -7.246674537658691, "global_step": 205411, "epoch": 4890} {"train_loss": -7.282464027404785, "global_step": 205412, "epoch": 4890} {"train_loss": -7.370429039001465, "global_step": 205413, "epoch": 4890} {"train_loss": -7.382316589355469, "global_step": 205414, "epoch": 4890} {"train_loss": -7.295391082763672, "global_step": 205415, "epoch": 4890} {"train_loss": -7.318221569061279, "global_step": 205416, "epoch": 4890} {"train_loss": -7.310825347900391, "global_step": 205417, "epoch": 4890} {"train_loss": -7.274716854095459, "global_step": 205418, "epoch": 4890} {"train_loss": -7.3155198097229, "global_step": 205419, "epoch": 4890} {"train_loss": -7.3532023429870605, "global_step": 205420, "epoch": 4890} {"train_loss": -7.271367345537458, "global_step": 205421, "epoch": 4890, "val_loss": 69128.4609375} {"train_loss": -7.349463939666748, "global_step": 205422, "epoch": 4891} {"train_loss": -7.367467880249023, "global_step": 205423, "epoch": 4891} {"train_loss": -7.353651523590088, "global_step": 205424, "epoch": 4891} {"train_loss": -7.4648356437683105, "global_step": 205425, "epoch": 4891} {"train_loss": -7.359598159790039, "global_step": 205426, "epoch": 4891} {"train_loss": -7.374166488647461, "global_step": 205427, "epoch": 4891} {"train_loss": -7.356857776641846, "global_step": 205428, "epoch": 4891} {"train_loss": -7.307233810424805, "global_step": 205429, "epoch": 4891} {"train_loss": -7.2827229499816895, "global_step": 205430, "epoch": 4891} {"train_loss": -7.415337562561035, "global_step": 205431, "epoch": 4891} {"train_loss": -7.397606372833252, "global_step": 205432, "epoch": 4891} {"train_loss": -7.351089954376221, "global_step": 205433, "epoch": 4891} {"train_loss": -7.330806732177734, "global_step": 205434, "epoch": 4891} {"train_loss": -7.387102127075195, "global_step": 205435, "epoch": 4891} {"train_loss": -7.400275230407715, "global_step": 205436, "epoch": 4891} {"train_loss": -7.312368869781494, "global_step": 205437, "epoch": 4891} {"train_loss": -7.4167938232421875, "global_step": 205438, "epoch": 4891} {"train_loss": -7.260416030883789, "global_step": 205439, "epoch": 4891} {"train_loss": -7.350938320159912, "global_step": 205440, "epoch": 4891} {"train_loss": -7.238067626953125, "global_step": 205441, "epoch": 4891} {"train_loss": -7.340059280395508, "global_step": 205442, "epoch": 4891} {"train_loss": -7.277109146118164, "global_step": 205443, "epoch": 4891} {"train_loss": -7.285441875457764, "global_step": 205444, "epoch": 4891} {"train_loss": -7.294351577758789, "global_step": 205445, "epoch": 4891} {"train_loss": -7.37288761138916, "global_step": 205446, "epoch": 4891} {"train_loss": -7.347603797912598, "global_step": 205447, "epoch": 4891} {"train_loss": -7.243862628936768, "global_step": 205448, "epoch": 4891} {"train_loss": -7.272117614746094, "global_step": 205449, "epoch": 4891} {"train_loss": -7.159695148468018, "global_step": 205450, "epoch": 4891} {"train_loss": -7.308067321777344, "global_step": 205451, "epoch": 4891} {"train_loss": -7.384363174438477, "global_step": 205452, "epoch": 4891} {"train_loss": -7.2579498291015625, "global_step": 205453, "epoch": 4891} {"train_loss": -7.318179607391357, "global_step": 205454, "epoch": 4891} {"train_loss": -7.344399929046631, "global_step": 205455, "epoch": 4891} {"train_loss": -7.293796539306641, "global_step": 205456, "epoch": 4891} {"train_loss": -7.313045501708984, "global_step": 205457, "epoch": 4891} {"train_loss": -7.256523609161377, "global_step": 205458, "epoch": 4891} {"train_loss": -7.171605587005615, "global_step": 205459, "epoch": 4891} {"train_loss": -7.313185214996338, "global_step": 205460, "epoch": 4891} {"train_loss": -7.16546106338501, "global_step": 205461, "epoch": 4891} {"train_loss": -7.255276203155518, "global_step": 205462, "epoch": 4891} {"train_loss": -7.316718998409453, "global_step": 205463, "epoch": 4891, "val_loss": 69013.640625} {"train_loss": -7.051053047180176, "global_step": 205464, "epoch": 4892} {"train_loss": -7.3402299880981445, "global_step": 205465, "epoch": 4892} {"train_loss": -7.345460891723633, "global_step": 205466, "epoch": 4892} {"train_loss": -7.267064094543457, "global_step": 205467, "epoch": 4892} {"train_loss": -7.2701849937438965, "global_step": 205468, "epoch": 4892} {"train_loss": -7.225215911865234, "global_step": 205469, "epoch": 4892} {"train_loss": -7.194749355316162, "global_step": 205470, "epoch": 4892} {"train_loss": -7.217148780822754, "global_step": 205471, "epoch": 4892} {"train_loss": -7.28017520904541, "global_step": 205472, "epoch": 4892} {"train_loss": -7.334253787994385, "global_step": 205473, "epoch": 4892} {"train_loss": -7.310408592224121, "global_step": 205474, "epoch": 4892} {"train_loss": -7.150991916656494, "global_step": 205475, "epoch": 4892} {"train_loss": -7.178715705871582, "global_step": 205476, "epoch": 4892} {"train_loss": -7.278892517089844, "global_step": 205477, "epoch": 4892} {"train_loss": -7.241495132446289, "global_step": 205478, "epoch": 4892} {"train_loss": -7.223740100860596, "global_step": 205479, "epoch": 4892} {"train_loss": -7.278421401977539, "global_step": 205480, "epoch": 4892} {"train_loss": -7.3198089599609375, "global_step": 205481, "epoch": 4892} {"train_loss": -7.238315105438232, "global_step": 205482, "epoch": 4892} {"train_loss": -7.41866397857666, "global_step": 205483, "epoch": 4892} {"train_loss": -7.447495937347412, "global_step": 205484, "epoch": 4892} {"train_loss": -7.277360916137695, "global_step": 205485, "epoch": 4892} {"train_loss": -7.339158535003662, "global_step": 205486, "epoch": 4892} {"train_loss": -7.3163042068481445, "global_step": 205487, "epoch": 4892} {"train_loss": -7.309352874755859, "global_step": 205488, "epoch": 4892} {"train_loss": -7.257157325744629, "global_step": 205489, "epoch": 4892} {"train_loss": -7.257233142852783, "global_step": 205490, "epoch": 4892} {"train_loss": -7.294779300689697, "global_step": 205491, "epoch": 4892} {"train_loss": -7.077691555023193, "global_step": 205492, "epoch": 4892} {"train_loss": -7.229459762573242, "global_step": 205493, "epoch": 4892} {"train_loss": -7.234770774841309, "global_step": 205494, "epoch": 4892} {"train_loss": -7.2221269607543945, "global_step": 205495, "epoch": 4892} {"train_loss": -7.154450416564941, "global_step": 205496, "epoch": 4892} {"train_loss": -7.2038774490356445, "global_step": 205497, "epoch": 4892} {"train_loss": -7.270407676696777, "global_step": 205498, "epoch": 4892} {"train_loss": -7.25472354888916, "global_step": 205499, "epoch": 4892} {"train_loss": -7.355859756469727, "global_step": 205500, "epoch": 4892} {"train_loss": -7.307733058929443, "global_step": 205501, "epoch": 4892} {"train_loss": -7.15815544128418, "global_step": 205502, "epoch": 4892} {"train_loss": -7.329983711242676, "global_step": 205503, "epoch": 4892} {"train_loss": -7.200716018676758, "global_step": 205504, "epoch": 4892} {"train_loss": -7.259883324305217, "global_step": 205505, "epoch": 4892, "val_loss": 69121.90625} {"train_loss": -7.278409481048584, "global_step": 205506, "epoch": 4893} {"train_loss": -7.3939104080200195, "global_step": 205507, "epoch": 4893} {"train_loss": -7.261349678039551, "global_step": 205508, "epoch": 4893} {"train_loss": -7.321606636047363, "global_step": 205509, "epoch": 4893} {"train_loss": -7.251638412475586, "global_step": 205510, "epoch": 4893} {"train_loss": -7.177779197692871, "global_step": 205511, "epoch": 4893} {"train_loss": -7.30510950088501, "global_step": 205512, "epoch": 4893} {"train_loss": -7.346793174743652, "global_step": 205513, "epoch": 4893} {"train_loss": -7.361435413360596, "global_step": 205514, "epoch": 4893} {"train_loss": -7.313262939453125, "global_step": 205515, "epoch": 4893} {"train_loss": -7.364076614379883, "global_step": 205516, "epoch": 4893} {"train_loss": -7.214913368225098, "global_step": 205517, "epoch": 4893} {"train_loss": -7.245983123779297, "global_step": 205518, "epoch": 4893} {"train_loss": -7.352175235748291, "global_step": 205519, "epoch": 4893} {"train_loss": -7.2947001457214355, "global_step": 205520, "epoch": 4893} {"train_loss": -7.38710880279541, "global_step": 205521, "epoch": 4893} {"train_loss": -7.2498345375061035, "global_step": 205522, "epoch": 4893} {"train_loss": -7.291933059692383, "global_step": 205523, "epoch": 4893} {"train_loss": -7.345047950744629, "global_step": 205524, "epoch": 4893} {"train_loss": -7.305815696716309, "global_step": 205525, "epoch": 4893} {"train_loss": -7.25850772857666, "global_step": 205526, "epoch": 4893} {"train_loss": -7.418206214904785, "global_step": 205527, "epoch": 4893} {"train_loss": -7.286538124084473, "global_step": 205528, "epoch": 4893} {"train_loss": -7.125769138336182, "global_step": 205529, "epoch": 4893} {"train_loss": -7.266359806060791, "global_step": 205530, "epoch": 4893} {"train_loss": -7.133335590362549, "global_step": 205531, "epoch": 4893} {"train_loss": -7.341700553894043, "global_step": 205532, "epoch": 4893} {"train_loss": -7.2828874588012695, "global_step": 205533, "epoch": 4893} {"train_loss": -7.266562461853027, "global_step": 205534, "epoch": 4893} {"train_loss": -7.19025993347168, "global_step": 205535, "epoch": 4893} {"train_loss": -7.207999229431152, "global_step": 205536, "epoch": 4893} {"train_loss": -7.266407012939453, "global_step": 205537, "epoch": 4893} {"train_loss": -7.256644248962402, "global_step": 205538, "epoch": 4893} {"train_loss": -7.2152485847473145, "global_step": 205539, "epoch": 4893} {"train_loss": -7.267966270446777, "global_step": 205540, "epoch": 4893} {"train_loss": -7.136393070220947, "global_step": 205541, "epoch": 4893} {"train_loss": -7.127942085266113, "global_step": 205542, "epoch": 4893} {"train_loss": -7.224287033081055, "global_step": 205543, "epoch": 4893} {"train_loss": -7.177189826965332, "global_step": 205544, "epoch": 4893} {"train_loss": -7.044002532958984, "global_step": 205545, "epoch": 4893} {"train_loss": -7.280035018920898, "global_step": 205546, "epoch": 4893} {"train_loss": -7.263393685931251, "global_step": 205547, "epoch": 4893, "val_loss": 69024.640625} {"train_loss": -7.124783515930176, "global_step": 205548, "epoch": 4894} {"train_loss": -7.16037654876709, "global_step": 205549, "epoch": 4894} {"train_loss": -7.213108062744141, "global_step": 205550, "epoch": 4894} {"train_loss": -7.275038719177246, "global_step": 205551, "epoch": 4894} {"train_loss": -7.236879348754883, "global_step": 205552, "epoch": 4894} {"train_loss": -7.3206892013549805, "global_step": 205553, "epoch": 4894} {"train_loss": -7.323299884796143, "global_step": 205554, "epoch": 4894} {"train_loss": -7.265389919281006, "global_step": 205555, "epoch": 4894} {"train_loss": -7.267055034637451, "global_step": 205556, "epoch": 4894} {"train_loss": -7.224472999572754, "global_step": 205557, "epoch": 4894} {"train_loss": -7.304253578186035, "global_step": 205558, "epoch": 4894} {"train_loss": -7.19381856918335, "global_step": 205559, "epoch": 4894} {"train_loss": -7.3899312019348145, "global_step": 205560, "epoch": 4894} {"train_loss": -7.259572982788086, "global_step": 205561, "epoch": 4894} {"train_loss": -7.382974624633789, "global_step": 205562, "epoch": 4894} {"train_loss": -7.31221866607666, "global_step": 205563, "epoch": 4894} {"train_loss": -7.285956859588623, "global_step": 205564, "epoch": 4894} {"train_loss": -7.305400371551514, "global_step": 205565, "epoch": 4894} {"train_loss": -7.297460079193115, "global_step": 205566, "epoch": 4894} {"train_loss": -7.246642112731934, "global_step": 205567, "epoch": 4894} {"train_loss": -7.253363609313965, "global_step": 205568, "epoch": 4894} {"train_loss": -7.192696571350098, "global_step": 205569, "epoch": 4894} {"train_loss": -7.241505146026611, "global_step": 205570, "epoch": 4894} {"train_loss": -7.171403884887695, "global_step": 205571, "epoch": 4894} {"train_loss": -7.20413875579834, "global_step": 205572, "epoch": 4894} {"train_loss": -7.160841941833496, "global_step": 205573, "epoch": 4894} {"train_loss": -7.243792533874512, "global_step": 205574, "epoch": 4894} {"train_loss": -7.160645484924316, "global_step": 205575, "epoch": 4894} {"train_loss": -7.072649002075195, "global_step": 205576, "epoch": 4894} {"train_loss": -7.1271820068359375, "global_step": 205577, "epoch": 4894} {"train_loss": -7.218495845794678, "global_step": 205578, "epoch": 4894} {"train_loss": -7.149081230163574, "global_step": 205579, "epoch": 4894} {"train_loss": -7.240198612213135, "global_step": 205580, "epoch": 4894} {"train_loss": -7.184380054473877, "global_step": 205581, "epoch": 4894} {"train_loss": -7.1487627029418945, "global_step": 205582, "epoch": 4894} {"train_loss": -7.1434783935546875, "global_step": 205583, "epoch": 4894} {"train_loss": -7.099637508392334, "global_step": 205584, "epoch": 4894} {"train_loss": -7.160324573516846, "global_step": 205585, "epoch": 4894} {"train_loss": -7.199875831604004, "global_step": 205586, "epoch": 4894} {"train_loss": -7.136575222015381, "global_step": 205587, "epoch": 4894} {"train_loss": -7.129532337188721, "global_step": 205588, "epoch": 4894} {"train_loss": -7.2174420810881115, "global_step": 205589, "epoch": 4894, "val_loss": 69229.640625} {"train_loss": -7.1277008056640625, "global_step": 205590, "epoch": 4895} {"train_loss": -7.178431034088135, "global_step": 205591, "epoch": 4895} {"train_loss": -7.044058799743652, "global_step": 205592, "epoch": 4895} {"train_loss": -7.1865692138671875, "global_step": 205593, "epoch": 4895} {"train_loss": -7.195423126220703, "global_step": 205594, "epoch": 4895} {"train_loss": -7.05753231048584, "global_step": 205595, "epoch": 4895} {"train_loss": -7.1832685470581055, "global_step": 205596, "epoch": 4895} {"train_loss": -7.140547752380371, "global_step": 205597, "epoch": 4895} {"train_loss": -7.133895397186279, "global_step": 205598, "epoch": 4895} {"train_loss": -7.307215213775635, "global_step": 205599, "epoch": 4895} {"train_loss": -7.289776802062988, "global_step": 205600, "epoch": 4895} {"train_loss": -7.116436004638672, "global_step": 205601, "epoch": 4895} {"train_loss": -7.279534339904785, "global_step": 205602, "epoch": 4895} {"train_loss": -7.165422439575195, "global_step": 205603, "epoch": 4895} {"train_loss": -7.252903938293457, "global_step": 205604, "epoch": 4895} {"train_loss": -7.212915897369385, "global_step": 205605, "epoch": 4895} {"train_loss": -7.287812232971191, "global_step": 205606, "epoch": 4895} {"train_loss": -7.302594184875488, "global_step": 205607, "epoch": 4895} {"train_loss": -7.1437811851501465, "global_step": 205608, "epoch": 4895} {"train_loss": -7.328500747680664, "global_step": 205609, "epoch": 4895} {"train_loss": -7.1864237785339355, "global_step": 205610, "epoch": 4895} {"train_loss": -7.321146488189697, "global_step": 205611, "epoch": 4895} {"train_loss": -7.251913070678711, "global_step": 205612, "epoch": 4895} {"train_loss": -7.1813859939575195, "global_step": 205613, "epoch": 4895} {"train_loss": -7.2595648765563965, "global_step": 205614, "epoch": 4895} {"train_loss": -7.268641471862793, "global_step": 205615, "epoch": 4895} {"train_loss": -7.241670608520508, "global_step": 205616, "epoch": 4895} {"train_loss": -7.225440502166748, "global_step": 205617, "epoch": 4895} {"train_loss": -7.211879730224609, "global_step": 205618, "epoch": 4895} {"train_loss": -7.343335151672363, "global_step": 205619, "epoch": 4895} {"train_loss": -7.273123264312744, "global_step": 205620, "epoch": 4895} {"train_loss": -7.1585564613342285, "global_step": 205621, "epoch": 4895} {"train_loss": -7.288686752319336, "global_step": 205622, "epoch": 4895} {"train_loss": -7.119491100311279, "global_step": 205623, "epoch": 4895} {"train_loss": -7.2851457595825195, "global_step": 205624, "epoch": 4895} {"train_loss": -7.253127098083496, "global_step": 205625, "epoch": 4895} {"train_loss": -7.209683418273926, "global_step": 205626, "epoch": 4895} {"train_loss": -7.280204772949219, "global_step": 205627, "epoch": 4895} {"train_loss": -7.106655120849609, "global_step": 205628, "epoch": 4895} {"train_loss": -7.20582389831543, "global_step": 205629, "epoch": 4895} {"train_loss": -7.315690994262695, "global_step": 205630, "epoch": 4895} {"train_loss": -7.218381472996303, "global_step": 205631, "epoch": 4895, "val_loss": 69140.6953125} {"train_loss": -7.280804634094238, "global_step": 205632, "epoch": 4896} {"train_loss": -7.287943363189697, "global_step": 205633, "epoch": 4896} {"train_loss": -7.166060447692871, "global_step": 205634, "epoch": 4896} {"train_loss": -7.332486629486084, "global_step": 205635, "epoch": 4896} {"train_loss": -7.237974643707275, "global_step": 205636, "epoch": 4896} {"train_loss": -7.195882797241211, "global_step": 205637, "epoch": 4896} {"train_loss": -7.3305230140686035, "global_step": 205638, "epoch": 4896} {"train_loss": -7.305399417877197, "global_step": 205639, "epoch": 4896} {"train_loss": -7.353111267089844, "global_step": 205640, "epoch": 4896} {"train_loss": -7.307373046875, "global_step": 205641, "epoch": 4896} {"train_loss": -7.303227424621582, "global_step": 205642, "epoch": 4896} {"train_loss": -7.235210418701172, "global_step": 205643, "epoch": 4896} {"train_loss": -7.225703239440918, "global_step": 205644, "epoch": 4896} {"train_loss": -7.352949142456055, "global_step": 205645, "epoch": 4896} {"train_loss": -7.25558614730835, "global_step": 205646, "epoch": 4896} {"train_loss": -7.293754577636719, "global_step": 205647, "epoch": 4896} {"train_loss": -7.328432083129883, "global_step": 205648, "epoch": 4896} {"train_loss": -7.277085781097412, "global_step": 205649, "epoch": 4896} {"train_loss": -7.430100440979004, "global_step": 205650, "epoch": 4896} {"train_loss": -7.213815689086914, "global_step": 205651, "epoch": 4896} {"train_loss": -7.19605827331543, "global_step": 205652, "epoch": 4896} {"train_loss": -7.356175422668457, "global_step": 205653, "epoch": 4896} {"train_loss": -7.2551164627075195, "global_step": 205654, "epoch": 4896} {"train_loss": -7.315056324005127, "global_step": 205655, "epoch": 4896} {"train_loss": -7.2057881355285645, "global_step": 205656, "epoch": 4896} {"train_loss": -7.289666175842285, "global_step": 205657, "epoch": 4896} {"train_loss": -7.211913585662842, "global_step": 205658, "epoch": 4896} {"train_loss": -7.19691801071167, "global_step": 205659, "epoch": 4896} {"train_loss": -7.243097305297852, "global_step": 205660, "epoch": 4896} {"train_loss": -7.208773612976074, "global_step": 205661, "epoch": 4896} {"train_loss": -7.083616733551025, "global_step": 205662, "epoch": 4896} {"train_loss": -7.097801685333252, "global_step": 205663, "epoch": 4896} {"train_loss": -7.127758979797363, "global_step": 205664, "epoch": 4896} {"train_loss": -7.0905866622924805, "global_step": 205665, "epoch": 4896} {"train_loss": -7.206362724304199, "global_step": 205666, "epoch": 4896} {"train_loss": -7.181369304656982, "global_step": 205667, "epoch": 4896} {"train_loss": -7.384148597717285, "global_step": 205668, "epoch": 4896} {"train_loss": -7.192841529846191, "global_step": 205669, "epoch": 4896} {"train_loss": -7.2630720138549805, "global_step": 205670, "epoch": 4896} {"train_loss": -7.257370948791504, "global_step": 205671, "epoch": 4896} {"train_loss": -7.055638313293457, "global_step": 205672, "epoch": 4896} {"train_loss": -7.2445220493135, "global_step": 205673, "epoch": 4896, "val_loss": 69131.84375} {"train_loss": -7.229215621948242, "global_step": 205674, "epoch": 4897} {"train_loss": -7.104966640472412, "global_step": 205675, "epoch": 4897} {"train_loss": -7.211431980133057, "global_step": 205676, "epoch": 4897} {"train_loss": -7.19963264465332, "global_step": 205677, "epoch": 4897} {"train_loss": -7.176980972290039, "global_step": 205678, "epoch": 4897} {"train_loss": -7.221695899963379, "global_step": 205679, "epoch": 4897} {"train_loss": -7.151280403137207, "global_step": 205680, "epoch": 4897} {"train_loss": -7.191285133361816, "global_step": 205681, "epoch": 4897} {"train_loss": -7.193099021911621, "global_step": 205682, "epoch": 4897} {"train_loss": -7.151644706726074, "global_step": 205683, "epoch": 4897} {"train_loss": -7.165518760681152, "global_step": 205684, "epoch": 4897} {"train_loss": -7.288797378540039, "global_step": 205685, "epoch": 4897} {"train_loss": -7.170283317565918, "global_step": 205686, "epoch": 4897} {"train_loss": -7.332207202911377, "global_step": 205687, "epoch": 4897} {"train_loss": -7.223330974578857, "global_step": 205688, "epoch": 4897} {"train_loss": -7.144997596740723, "global_step": 205689, "epoch": 4897} {"train_loss": -7.116799354553223, "global_step": 205690, "epoch": 4897} {"train_loss": -7.279952049255371, "global_step": 205691, "epoch": 4897} {"train_loss": -7.169306755065918, "global_step": 205692, "epoch": 4897} {"train_loss": -7.221964359283447, "global_step": 205693, "epoch": 4897} {"train_loss": -7.264789581298828, "global_step": 205694, "epoch": 4897} {"train_loss": -7.14346981048584, "global_step": 205695, "epoch": 4897} {"train_loss": -7.239185333251953, "global_step": 205696, "epoch": 4897} {"train_loss": -7.249073505401611, "global_step": 205697, "epoch": 4897} {"train_loss": -7.33493185043335, "global_step": 205698, "epoch": 4897} {"train_loss": -7.3174848556518555, "global_step": 205699, "epoch": 4897} {"train_loss": -7.269297122955322, "global_step": 205700, "epoch": 4897} {"train_loss": -7.238992214202881, "global_step": 205701, "epoch": 4897} {"train_loss": -7.3162431716918945, "global_step": 205702, "epoch": 4897} {"train_loss": -7.253625869750977, "global_step": 205703, "epoch": 4897} {"train_loss": -7.292422771453857, "global_step": 205704, "epoch": 4897} {"train_loss": -7.30717658996582, "global_step": 205705, "epoch": 4897} {"train_loss": -7.325676918029785, "global_step": 205706, "epoch": 4897} {"train_loss": -7.3748931884765625, "global_step": 205707, "epoch": 4897} {"train_loss": -7.357808589935303, "global_step": 205708, "epoch": 4897} {"train_loss": -7.2320990562438965, "global_step": 205709, "epoch": 4897} {"train_loss": -7.403996467590332, "global_step": 205710, "epoch": 4897} {"train_loss": -7.330802917480469, "global_step": 205711, "epoch": 4897} {"train_loss": -7.270458221435547, "global_step": 205712, "epoch": 4897} {"train_loss": -7.33248233795166, "global_step": 205713, "epoch": 4897} {"train_loss": -7.315500259399414, "global_step": 205714, "epoch": 4897} {"train_loss": -7.249202546619234, "global_step": 205715, "epoch": 4897, "val_loss": 69095.140625} {"train_loss": -7.353630065917969, "global_step": 205716, "epoch": 4898} {"train_loss": -7.281388759613037, "global_step": 205717, "epoch": 4898} {"train_loss": -7.280058860778809, "global_step": 205718, "epoch": 4898} {"train_loss": -7.285887241363525, "global_step": 205719, "epoch": 4898} {"train_loss": -7.268161773681641, "global_step": 205720, "epoch": 4898} {"train_loss": -7.400491714477539, "global_step": 205721, "epoch": 4898} {"train_loss": -7.227265357971191, "global_step": 205722, "epoch": 4898} {"train_loss": -7.276580333709717, "global_step": 205723, "epoch": 4898} {"train_loss": -7.3516693115234375, "global_step": 205724, "epoch": 4898} {"train_loss": -7.2167463302612305, "global_step": 205725, "epoch": 4898} {"train_loss": -7.297135353088379, "global_step": 205726, "epoch": 4898} {"train_loss": -7.368186950683594, "global_step": 205727, "epoch": 4898} {"train_loss": -7.327014923095703, "global_step": 205728, "epoch": 4898} {"train_loss": -7.429570198059082, "global_step": 205729, "epoch": 4898} {"train_loss": -7.3171539306640625, "global_step": 205730, "epoch": 4898} {"train_loss": -7.398590087890625, "global_step": 205731, "epoch": 4898} {"train_loss": -7.300102233886719, "global_step": 205732, "epoch": 4898} {"train_loss": -7.325910568237305, "global_step": 205733, "epoch": 4898} {"train_loss": -7.361576557159424, "global_step": 205734, "epoch": 4898} {"train_loss": -7.3064775466918945, "global_step": 205735, "epoch": 4898} {"train_loss": -7.418028831481934, "global_step": 205736, "epoch": 4898} {"train_loss": -7.249645233154297, "global_step": 205737, "epoch": 4898} {"train_loss": -7.394145965576172, "global_step": 205738, "epoch": 4898} {"train_loss": -7.357821941375732, "global_step": 205739, "epoch": 4898} {"train_loss": -7.387436866760254, "global_step": 205740, "epoch": 4898} {"train_loss": -7.3294677734375, "global_step": 205741, "epoch": 4898} {"train_loss": -7.390605926513672, "global_step": 205742, "epoch": 4898} {"train_loss": -7.347323894500732, "global_step": 205743, "epoch": 4898} {"train_loss": -7.270114898681641, "global_step": 205744, "epoch": 4898} {"train_loss": -7.329442024230957, "global_step": 205745, "epoch": 4898} {"train_loss": -7.289074420928955, "global_step": 205746, "epoch": 4898} {"train_loss": -7.340731620788574, "global_step": 205747, "epoch": 4898} {"train_loss": -7.237020015716553, "global_step": 205748, "epoch": 4898} {"train_loss": -7.207269191741943, "global_step": 205749, "epoch": 4898} {"train_loss": -7.324624061584473, "global_step": 205750, "epoch": 4898} {"train_loss": -7.321739196777344, "global_step": 205751, "epoch": 4898} {"train_loss": -7.367170333862305, "global_step": 205752, "epoch": 4898} {"train_loss": -7.262290954589844, "global_step": 205753, "epoch": 4898} {"train_loss": -7.28502082824707, "global_step": 205754, "epoch": 4898} {"train_loss": -7.208628177642822, "global_step": 205755, "epoch": 4898} {"train_loss": -7.2447919845581055, "global_step": 205756, "epoch": 4898} {"train_loss": -7.314433313551403, "global_step": 205757, "epoch": 4898, "val_loss": 69189.1015625} {"train_loss": -7.348519802093506, "global_step": 205758, "epoch": 4899} {"train_loss": -7.241436958312988, "global_step": 205759, "epoch": 4899} {"train_loss": -7.285575866699219, "global_step": 205760, "epoch": 4899} {"train_loss": -7.008994102478027, "global_step": 205761, "epoch": 4899} {"train_loss": -7.264392852783203, "global_step": 205762, "epoch": 4899} {"train_loss": -7.306797981262207, "global_step": 205763, "epoch": 4899} {"train_loss": -7.1811113357543945, "global_step": 205764, "epoch": 4899} {"train_loss": -7.277795791625977, "global_step": 205765, "epoch": 4899} {"train_loss": -7.331366539001465, "global_step": 205766, "epoch": 4899} {"train_loss": -7.284337997436523, "global_step": 205767, "epoch": 4899} {"train_loss": -7.331926345825195, "global_step": 205768, "epoch": 4899} {"train_loss": -7.317519187927246, "global_step": 205769, "epoch": 4899} {"train_loss": -7.178701400756836, "global_step": 205770, "epoch": 4899} {"train_loss": -7.340604782104492, "global_step": 205771, "epoch": 4899} {"train_loss": -7.208717346191406, "global_step": 205772, "epoch": 4899} {"train_loss": -7.264408111572266, "global_step": 205773, "epoch": 4899} {"train_loss": -7.283527851104736, "global_step": 205774, "epoch": 4899} {"train_loss": -7.183936595916748, "global_step": 205775, "epoch": 4899} {"train_loss": -7.332148551940918, "global_step": 205776, "epoch": 4899} {"train_loss": -7.1972761154174805, "global_step": 205777, "epoch": 4899} {"train_loss": -7.215612411499023, "global_step": 205778, "epoch": 4899} {"train_loss": -7.297186374664307, "global_step": 205779, "epoch": 4899} {"train_loss": -7.300524711608887, "global_step": 205780, "epoch": 4899} {"train_loss": -7.111541748046875, "global_step": 205781, "epoch": 4899} {"train_loss": -7.270276069641113, "global_step": 205782, "epoch": 4899} {"train_loss": -7.274135589599609, "global_step": 205783, "epoch": 4899} {"train_loss": -7.180323600769043, "global_step": 205784, "epoch": 4899} {"train_loss": -7.198914527893066, "global_step": 205785, "epoch": 4899} {"train_loss": -7.285689353942871, "global_step": 205786, "epoch": 4899} {"train_loss": -7.202693939208984, "global_step": 205787, "epoch": 4899} {"train_loss": -7.261180877685547, "global_step": 205788, "epoch": 4899} {"train_loss": -7.2672624588012695, "global_step": 205789, "epoch": 4899} {"train_loss": -7.350760459899902, "global_step": 205790, "epoch": 4899} {"train_loss": -7.293440341949463, "global_step": 205791, "epoch": 4899} {"train_loss": -7.340645790100098, "global_step": 205792, "epoch": 4899} {"train_loss": -7.293934345245361, "global_step": 205793, "epoch": 4899} {"train_loss": -7.400498867034912, "global_step": 205794, "epoch": 4899} {"train_loss": -7.294757843017578, "global_step": 205795, "epoch": 4899} {"train_loss": -7.252608299255371, "global_step": 205796, "epoch": 4899} {"train_loss": -7.311493873596191, "global_step": 205797, "epoch": 4899} {"train_loss": -7.2795915603637695, "global_step": 205798, "epoch": 4899} {"train_loss": -7.26731292406718, "global_step": 205799, "epoch": 4899, "val_loss": 69228.0078125} {"train_loss": -7.376497745513916, "global_step": 205800, "epoch": 4900} {"train_loss": -7.341739177703857, "global_step": 205801, "epoch": 4900} {"train_loss": -7.408563613891602, "global_step": 205802, "epoch": 4900} {"train_loss": -7.124345302581787, "global_step": 205803, "epoch": 4900} {"train_loss": -7.32142448425293, "global_step": 205804, "epoch": 4900} {"train_loss": -7.299939155578613, "global_step": 205805, "epoch": 4900} {"train_loss": -7.161892890930176, "global_step": 205806, "epoch": 4900} {"train_loss": -7.306829452514648, "global_step": 205807, "epoch": 4900} {"train_loss": -7.217898368835449, "global_step": 205808, "epoch": 4900} {"train_loss": -7.186886787414551, "global_step": 205809, "epoch": 4900} {"train_loss": -7.307260036468506, "global_step": 205810, "epoch": 4900} {"train_loss": -7.259831428527832, "global_step": 205811, "epoch": 4900} {"train_loss": -7.125506401062012, "global_step": 205812, "epoch": 4900} {"train_loss": -7.278880596160889, "global_step": 205813, "epoch": 4900} {"train_loss": -7.205656051635742, "global_step": 205814, "epoch": 4900} {"train_loss": -7.270152568817139, "global_step": 205815, "epoch": 4900} {"train_loss": -7.3462300300598145, "global_step": 205816, "epoch": 4900} {"train_loss": -7.251039505004883, "global_step": 205817, "epoch": 4900} {"train_loss": -7.343042373657227, "global_step": 205818, "epoch": 4900} {"train_loss": -7.273952484130859, "global_step": 205819, "epoch": 4900} {"train_loss": -7.23793888092041, "global_step": 205820, "epoch": 4900} {"train_loss": -7.250099182128906, "global_step": 205821, "epoch": 4900} {"train_loss": -7.227423191070557, "global_step": 205822, "epoch": 4900} {"train_loss": -7.287388801574707, "global_step": 205823, "epoch": 4900} {"train_loss": -7.230743408203125, "global_step": 205824, "epoch": 4900} {"train_loss": -7.242609977722168, "global_step": 205825, "epoch": 4900} {"train_loss": -7.245426654815674, "global_step": 205826, "epoch": 4900} {"train_loss": -7.21535587310791, "global_step": 205827, "epoch": 4900} {"train_loss": -7.233301162719727, "global_step": 205828, "epoch": 4900} {"train_loss": -7.17418098449707, "global_step": 205829, "epoch": 4900} {"train_loss": -7.241479396820068, "global_step": 205830, "epoch": 4900} {"train_loss": -7.229340553283691, "global_step": 205831, "epoch": 4900} {"train_loss": -7.169543266296387, "global_step": 205832, "epoch": 4900} {"train_loss": -7.1770782470703125, "global_step": 205833, "epoch": 4900} {"train_loss": -7.1689910888671875, "global_step": 205834, "epoch": 4900} {"train_loss": -7.193451881408691, "global_step": 205835, "epoch": 4900} {"train_loss": -7.114776134490967, "global_step": 205836, "epoch": 4900} {"train_loss": -7.202188968658447, "global_step": 205837, "epoch": 4900} {"train_loss": -7.1815948486328125, "global_step": 205838, "epoch": 4900} {"train_loss": -7.249419212341309, "global_step": 205839, "epoch": 4900} {"train_loss": -7.292823791503906, "global_step": 205840, "epoch": 4900} {"train_loss": -7.242744445800781, "global_step": 205841, "epoch": 4900, "train/sim_max_reward_0": 0.9942436860961515, "train/sim_max_reward_1": 0.841453026973796, "train/sim_max_reward_2": 0.31175893340519517, "train/sim_max_reward_3": 0.12318697994623781, "train/sim_max_reward_4": 0.3581783852299507, "train/sim_max_reward_5": 0.9971376604525174, "test/sim_max_reward_4400000": 0.9653657659966687, "test/sim_max_reward_4400001": 0.3245390494767449, "test/sim_max_reward_4400002": 0.950181283604179, "test/sim_max_reward_4400003": 0.9028605252064132, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.9264653023788952, "test/sim_max_reward_4400006": 0.4391306624931487, "test/sim_max_reward_4400007": 0.3885340514257634, "test/sim_max_reward_4400008": 0.29680845157464003, "test/sim_max_reward_4400009": 0.9661068649113527, "test/sim_max_reward_4400010": 0.19930154146482226, "test/sim_max_reward_4400011": 0.3003567616045634, "test/sim_max_reward_4400012": 0.9828234856039048, "test/sim_max_reward_4400013": 0.9973533592901788, "test/sim_max_reward_4400014": 0.5787601864045854, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.1062179086525808, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.24170887371563402, "test/sim_max_reward_4400019": 0.00853186786205499, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.8608274966632934, "test/sim_max_reward_4400023": 0.9660394207798485, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.26259266133812376, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 0.0013580567681539706, "test/sim_max_reward_4400028": 0.7117186691955601, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.9946536019662984, "test/sim_max_reward_4400031": 0.930978310112049, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9076331534413922, "test/sim_max_reward_4400034": 0.9358420055301816, "test/sim_max_reward_4400035": 0.9603428186304636, "test/sim_max_reward_4400036": 0.9523349142389086, "test/sim_max_reward_4400037": 0.9826154022757025, "test/sim_max_reward_4400038": 0.9313847503954409, "test/sim_max_reward_4400039": 0.9738407885477645, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9820203354864769, "test/sim_max_reward_4400042": 0.5486741501727787, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9555488701653829, "test/sim_max_reward_4400045": 0.993833679223141, "test/sim_max_reward_4400046": 0.942148422078423, "test/sim_max_reward_4400047": 0.9081884953420906, "test/sim_max_reward_4400048": 0.9342674776940795, "test/sim_max_reward_4400049": 1.0, "train/mean_score": 0.6043264453506415, "test/mean_score": 0.6356685179781444, "val_loss": 69061.578125} {"train_loss": -7.286144256591797, "global_step": 205842, "epoch": 4901} {"train_loss": -7.1961517333984375, "global_step": 205843, "epoch": 4901} {"train_loss": -7.296462535858154, "global_step": 205844, "epoch": 4901} {"train_loss": -7.1887946128845215, "global_step": 205845, "epoch": 4901} {"train_loss": -7.319146156311035, "global_step": 205846, "epoch": 4901} {"train_loss": -7.233063697814941, "global_step": 205847, "epoch": 4901} {"train_loss": -7.179644584655762, "global_step": 205848, "epoch": 4901} {"train_loss": -7.178481101989746, "global_step": 205849, "epoch": 4901} {"train_loss": -7.3244242668151855, "global_step": 205850, "epoch": 4901} {"train_loss": -7.185310363769531, "global_step": 205851, "epoch": 4901} {"train_loss": -7.208645820617676, "global_step": 205852, "epoch": 4901} {"train_loss": -7.228090763092041, "global_step": 205853, "epoch": 4901} {"train_loss": -7.02073335647583, "global_step": 205854, "epoch": 4901} {"train_loss": -7.200028419494629, "global_step": 205855, "epoch": 4901} {"train_loss": -7.292758464813232, "global_step": 205856, "epoch": 4901} {"train_loss": -7.213746547698975, "global_step": 205857, "epoch": 4901} {"train_loss": -7.201347351074219, "global_step": 205858, "epoch": 4901} {"train_loss": -7.2104363441467285, "global_step": 205859, "epoch": 4901} {"train_loss": -7.367992401123047, "global_step": 205860, "epoch": 4901} {"train_loss": -7.136159896850586, "global_step": 205861, "epoch": 4901} {"train_loss": -7.067627429962158, "global_step": 205862, "epoch": 4901} {"train_loss": -7.211184501647949, "global_step": 205863, "epoch": 4901} {"train_loss": -7.187532424926758, "global_step": 205864, "epoch": 4901} {"train_loss": -7.3218841552734375, "global_step": 205865, "epoch": 4901} {"train_loss": -7.074501991271973, "global_step": 205866, "epoch": 4901} {"train_loss": -7.252376556396484, "global_step": 205867, "epoch": 4901} {"train_loss": -7.174955368041992, "global_step": 205868, "epoch": 4901} {"train_loss": -7.122713088989258, "global_step": 205869, "epoch": 4901} {"train_loss": -7.252521514892578, "global_step": 205870, "epoch": 4901} {"train_loss": -7.066990852355957, "global_step": 205871, "epoch": 4901} {"train_loss": -7.293631553649902, "global_step": 205872, "epoch": 4901} {"train_loss": -7.143388271331787, "global_step": 205873, "epoch": 4901} {"train_loss": -7.15987491607666, "global_step": 205874, "epoch": 4901} {"train_loss": -7.3582353591918945, "global_step": 205875, "epoch": 4901} {"train_loss": -7.245543479919434, "global_step": 205876, "epoch": 4901} {"train_loss": -7.182833194732666, "global_step": 205877, "epoch": 4901} {"train_loss": -7.309305191040039, "global_step": 205878, "epoch": 4901} {"train_loss": -7.263683319091797, "global_step": 205879, "epoch": 4901} {"train_loss": -7.284858226776123, "global_step": 205880, "epoch": 4901} {"train_loss": -7.3190155029296875, "global_step": 205881, "epoch": 4901} {"train_loss": -7.354281425476074, "global_step": 205882, "epoch": 4901} {"train_loss": -7.222236735480172, "global_step": 205883, "epoch": 4901, "val_loss": 69139.046875} {"train_loss": -7.317995548248291, "global_step": 205884, "epoch": 4902} {"train_loss": -7.1541523933410645, "global_step": 205885, "epoch": 4902} {"train_loss": -7.087703227996826, "global_step": 205886, "epoch": 4902} {"train_loss": -7.196634292602539, "global_step": 205887, "epoch": 4902} {"train_loss": -7.324069023132324, "global_step": 205888, "epoch": 4902} {"train_loss": -7.135310173034668, "global_step": 205889, "epoch": 4902} {"train_loss": -7.261606216430664, "global_step": 205890, "epoch": 4902} {"train_loss": -7.232355117797852, "global_step": 205891, "epoch": 4902} {"train_loss": -7.193155765533447, "global_step": 205892, "epoch": 4902} {"train_loss": -7.2877912521362305, "global_step": 205893, "epoch": 4902} {"train_loss": -7.240663528442383, "global_step": 205894, "epoch": 4902} {"train_loss": -7.1669087409973145, "global_step": 205895, "epoch": 4902} {"train_loss": -7.181012153625488, "global_step": 205896, "epoch": 4902} {"train_loss": -7.334499359130859, "global_step": 205897, "epoch": 4902} {"train_loss": -7.204946517944336, "global_step": 205898, "epoch": 4902} {"train_loss": -7.273525238037109, "global_step": 205899, "epoch": 4902} {"train_loss": -7.254642486572266, "global_step": 205900, "epoch": 4902} {"train_loss": -7.143531322479248, "global_step": 205901, "epoch": 4902} {"train_loss": -7.282259941101074, "global_step": 205902, "epoch": 4902} {"train_loss": -7.301727294921875, "global_step": 205903, "epoch": 4902} {"train_loss": -7.126029014587402, "global_step": 205904, "epoch": 4902} {"train_loss": -7.368487358093262, "global_step": 205905, "epoch": 4902} {"train_loss": -7.190311431884766, "global_step": 205906, "epoch": 4902} {"train_loss": -7.2669572830200195, "global_step": 205907, "epoch": 4902} {"train_loss": -7.248770713806152, "global_step": 205908, "epoch": 4902} {"train_loss": -7.135622978210449, "global_step": 205909, "epoch": 4902} {"train_loss": -6.932720184326172, "global_step": 205910, "epoch": 4902} {"train_loss": -7.258397579193115, "global_step": 205911, "epoch": 4902} {"train_loss": -7.156312942504883, "global_step": 205912, "epoch": 4902} {"train_loss": -7.151128768920898, "global_step": 205913, "epoch": 4902} {"train_loss": -7.254212379455566, "global_step": 205914, "epoch": 4902} {"train_loss": -7.289704322814941, "global_step": 205915, "epoch": 4902} {"train_loss": -7.162883281707764, "global_step": 205916, "epoch": 4902} {"train_loss": -7.2472734451293945, "global_step": 205917, "epoch": 4902} {"train_loss": -7.24983024597168, "global_step": 205918, "epoch": 4902} {"train_loss": -7.250161170959473, "global_step": 205919, "epoch": 4902} {"train_loss": -7.311164855957031, "global_step": 205920, "epoch": 4902} {"train_loss": -7.186458110809326, "global_step": 205921, "epoch": 4902} {"train_loss": -7.341386795043945, "global_step": 205922, "epoch": 4902} {"train_loss": -7.399036884307861, "global_step": 205923, "epoch": 4902} {"train_loss": -7.244674205780029, "global_step": 205924, "epoch": 4902} {"train_loss": -7.2291156223842075, "global_step": 205925, "epoch": 4902, "val_loss": 69067.984375} {"train_loss": -7.253990173339844, "global_step": 205926, "epoch": 4903} {"train_loss": -7.279871940612793, "global_step": 205927, "epoch": 4903} {"train_loss": -7.110500812530518, "global_step": 205928, "epoch": 4903} {"train_loss": -7.273689270019531, "global_step": 205929, "epoch": 4903} {"train_loss": -7.165744781494141, "global_step": 205930, "epoch": 4903} {"train_loss": -7.076535701751709, "global_step": 205931, "epoch": 4903} {"train_loss": -7.183018207550049, "global_step": 205932, "epoch": 4903} {"train_loss": -7.094968795776367, "global_step": 205933, "epoch": 4903} {"train_loss": -7.194579124450684, "global_step": 205934, "epoch": 4903} {"train_loss": -7.205539226531982, "global_step": 205935, "epoch": 4903} {"train_loss": -7.181732177734375, "global_step": 205936, "epoch": 4903} {"train_loss": -7.165458679199219, "global_step": 205937, "epoch": 4903} {"train_loss": -7.165281295776367, "global_step": 205938, "epoch": 4903} {"train_loss": -7.114819049835205, "global_step": 205939, "epoch": 4903} {"train_loss": -7.258177757263184, "global_step": 205940, "epoch": 4903} {"train_loss": -7.134222507476807, "global_step": 205941, "epoch": 4903} {"train_loss": -7.189367294311523, "global_step": 205942, "epoch": 4903} {"train_loss": -7.210161209106445, "global_step": 205943, "epoch": 4903} {"train_loss": -7.112930774688721, "global_step": 205944, "epoch": 4903} {"train_loss": -7.09754753112793, "global_step": 205945, "epoch": 4903} {"train_loss": -7.154305458068848, "global_step": 205946, "epoch": 4903} {"train_loss": -7.30299186706543, "global_step": 205947, "epoch": 4903} {"train_loss": -7.288753509521484, "global_step": 205948, "epoch": 4903} {"train_loss": -7.189703941345215, "global_step": 205949, "epoch": 4903} {"train_loss": -7.329813003540039, "global_step": 205950, "epoch": 4903} {"train_loss": -7.175968647003174, "global_step": 205951, "epoch": 4903} {"train_loss": -7.06411075592041, "global_step": 205952, "epoch": 4903} {"train_loss": -7.168731212615967, "global_step": 205953, "epoch": 4903} {"train_loss": -7.182534217834473, "global_step": 205954, "epoch": 4903} {"train_loss": -7.1637091636657715, "global_step": 205955, "epoch": 4903} {"train_loss": -7.265122413635254, "global_step": 205956, "epoch": 4903} {"train_loss": -7.2249016761779785, "global_step": 205957, "epoch": 4903} {"train_loss": -7.3105010986328125, "global_step": 205958, "epoch": 4903} {"train_loss": -7.327018737792969, "global_step": 205959, "epoch": 4903} {"train_loss": -7.30284309387207, "global_step": 205960, "epoch": 4903} {"train_loss": -7.176761627197266, "global_step": 205961, "epoch": 4903} {"train_loss": -7.231997966766357, "global_step": 205962, "epoch": 4903} {"train_loss": -7.2184038162231445, "global_step": 205963, "epoch": 4903} {"train_loss": -7.369119644165039, "global_step": 205964, "epoch": 4903} {"train_loss": -7.302041053771973, "global_step": 205965, "epoch": 4903} {"train_loss": -7.307029724121094, "global_step": 205966, "epoch": 4903} {"train_loss": -7.211197228658767, "global_step": 205967, "epoch": 4903, "val_loss": 69190.703125} {"train_loss": -7.253634452819824, "global_step": 205968, "epoch": 4904} {"train_loss": -7.300656318664551, "global_step": 205969, "epoch": 4904} {"train_loss": -7.340419769287109, "global_step": 205970, "epoch": 4904} {"train_loss": -7.358427047729492, "global_step": 205971, "epoch": 4904} {"train_loss": -7.324349403381348, "global_step": 205972, "epoch": 4904} {"train_loss": -7.25350284576416, "global_step": 205973, "epoch": 4904} {"train_loss": -7.357456207275391, "global_step": 205974, "epoch": 4904} {"train_loss": -7.217466354370117, "global_step": 205975, "epoch": 4904} {"train_loss": -7.313774108886719, "global_step": 205976, "epoch": 4904} {"train_loss": -7.169925212860107, "global_step": 205977, "epoch": 4904} {"train_loss": -7.362706184387207, "global_step": 205978, "epoch": 4904} {"train_loss": -7.408535003662109, "global_step": 205979, "epoch": 4904} {"train_loss": -7.236675262451172, "global_step": 205980, "epoch": 4904} {"train_loss": -7.1690778732299805, "global_step": 205981, "epoch": 4904} {"train_loss": -7.40496826171875, "global_step": 205982, "epoch": 4904} {"train_loss": -7.231908798217773, "global_step": 205983, "epoch": 4904} {"train_loss": -7.317096710205078, "global_step": 205984, "epoch": 4904} {"train_loss": -7.409080505371094, "global_step": 205985, "epoch": 4904} {"train_loss": -7.15283203125, "global_step": 205986, "epoch": 4904} {"train_loss": -7.30844783782959, "global_step": 205987, "epoch": 4904} {"train_loss": -7.273260116577148, "global_step": 205988, "epoch": 4904} {"train_loss": -7.192852020263672, "global_step": 205989, "epoch": 4904} {"train_loss": -7.256443023681641, "global_step": 205990, "epoch": 4904} {"train_loss": -7.228368282318115, "global_step": 205991, "epoch": 4904} {"train_loss": -7.33168888092041, "global_step": 205992, "epoch": 4904} {"train_loss": -7.199624061584473, "global_step": 205993, "epoch": 4904} {"train_loss": -7.1451616287231445, "global_step": 205994, "epoch": 4904} {"train_loss": -7.256418704986572, "global_step": 205995, "epoch": 4904} {"train_loss": -7.327993869781494, "global_step": 205996, "epoch": 4904} {"train_loss": -7.253109455108643, "global_step": 205997, "epoch": 4904} {"train_loss": -7.329312324523926, "global_step": 205998, "epoch": 4904} {"train_loss": -7.322729587554932, "global_step": 205999, "epoch": 4904} {"train_loss": -7.23411750793457, "global_step": 206000, "epoch": 4904} {"train_loss": -7.400798320770264, "global_step": 206001, "epoch": 4904} {"train_loss": -7.3605732917785645, "global_step": 206002, "epoch": 4904} {"train_loss": -7.2965521812438965, "global_step": 206003, "epoch": 4904} {"train_loss": -7.340545654296875, "global_step": 206004, "epoch": 4904} {"train_loss": -7.226507186889648, "global_step": 206005, "epoch": 4904} {"train_loss": -7.252137660980225, "global_step": 206006, "epoch": 4904} {"train_loss": -7.170953750610352, "global_step": 206007, "epoch": 4904} {"train_loss": -7.269562721252441, "global_step": 206008, "epoch": 4904} {"train_loss": -7.282097612108503, "global_step": 206009, "epoch": 4904, "val_loss": 69141.0390625} {"train_loss": -7.460890293121338, "global_step": 206010, "epoch": 4905} {"train_loss": -7.331400394439697, "global_step": 206011, "epoch": 4905} {"train_loss": -7.402891159057617, "global_step": 206012, "epoch": 4905} {"train_loss": -7.233273506164551, "global_step": 206013, "epoch": 4905} {"train_loss": -7.31983757019043, "global_step": 206014, "epoch": 4905} {"train_loss": -7.22908878326416, "global_step": 206015, "epoch": 4905} {"train_loss": -7.272375106811523, "global_step": 206016, "epoch": 4905} {"train_loss": -7.311464309692383, "global_step": 206017, "epoch": 4905} {"train_loss": -7.280013084411621, "global_step": 206018, "epoch": 4905} {"train_loss": -7.2957258224487305, "global_step": 206019, "epoch": 4905} {"train_loss": -7.269975185394287, "global_step": 206020, "epoch": 4905} {"train_loss": -7.170543670654297, "global_step": 206021, "epoch": 4905} {"train_loss": -7.374471664428711, "global_step": 206022, "epoch": 4905} {"train_loss": -7.31558895111084, "global_step": 206023, "epoch": 4905} {"train_loss": -7.405331611633301, "global_step": 206024, "epoch": 4905} {"train_loss": -7.312647819519043, "global_step": 206025, "epoch": 4905} {"train_loss": -7.412302017211914, "global_step": 206026, "epoch": 4905} {"train_loss": -7.326118469238281, "global_step": 206027, "epoch": 4905} {"train_loss": -7.3909010887146, "global_step": 206028, "epoch": 4905} {"train_loss": -7.432839393615723, "global_step": 206029, "epoch": 4905} {"train_loss": -7.312259197235107, "global_step": 206030, "epoch": 4905} {"train_loss": -7.343990325927734, "global_step": 206031, "epoch": 4905} {"train_loss": -7.319942474365234, "global_step": 206032, "epoch": 4905} {"train_loss": -7.309000015258789, "global_step": 206033, "epoch": 4905} {"train_loss": -7.322731018066406, "global_step": 206034, "epoch": 4905} {"train_loss": -7.378037452697754, "global_step": 206035, "epoch": 4905} {"train_loss": -7.275063514709473, "global_step": 206036, "epoch": 4905} {"train_loss": -7.300143241882324, "global_step": 206037, "epoch": 4905} {"train_loss": -7.3011980056762695, "global_step": 206038, "epoch": 4905} {"train_loss": -7.359861850738525, "global_step": 206039, "epoch": 4905} {"train_loss": -7.334399700164795, "global_step": 206040, "epoch": 4905} {"train_loss": -7.360435485839844, "global_step": 206041, "epoch": 4905} {"train_loss": -7.2794647216796875, "global_step": 206042, "epoch": 4905} {"train_loss": -7.366811752319336, "global_step": 206043, "epoch": 4905} {"train_loss": -7.397150993347168, "global_step": 206044, "epoch": 4905} {"train_loss": -7.165152549743652, "global_step": 206045, "epoch": 4905} {"train_loss": -7.336174488067627, "global_step": 206046, "epoch": 4905} {"train_loss": -7.246721267700195, "global_step": 206047, "epoch": 4905} {"train_loss": -7.288572311401367, "global_step": 206048, "epoch": 4905} {"train_loss": -7.33799934387207, "global_step": 206049, "epoch": 4905} {"train_loss": -7.232180595397949, "global_step": 206050, "epoch": 4905} {"train_loss": -7.31742711294265, "global_step": 206051, "epoch": 4905, "val_loss": 69252.8984375} {"train_loss": -7.213995933532715, "global_step": 206052, "epoch": 4906} {"train_loss": -7.2613396644592285, "global_step": 206053, "epoch": 4906} {"train_loss": -7.316917896270752, "global_step": 206054, "epoch": 4906} {"train_loss": -7.229496955871582, "global_step": 206055, "epoch": 4906} {"train_loss": -7.302970886230469, "global_step": 206056, "epoch": 4906} {"train_loss": -7.451615333557129, "global_step": 206057, "epoch": 4906} {"train_loss": -7.3477325439453125, "global_step": 206058, "epoch": 4906} {"train_loss": -7.358184337615967, "global_step": 206059, "epoch": 4906} {"train_loss": -7.332492828369141, "global_step": 206060, "epoch": 4906} {"train_loss": -7.295416831970215, "global_step": 206061, "epoch": 4906} {"train_loss": -7.269255638122559, "global_step": 206062, "epoch": 4906} {"train_loss": -7.320666313171387, "global_step": 206063, "epoch": 4906} {"train_loss": -7.167364120483398, "global_step": 206064, "epoch": 4906} {"train_loss": -7.361794948577881, "global_step": 206065, "epoch": 4906} {"train_loss": -7.335235595703125, "global_step": 206066, "epoch": 4906} {"train_loss": -7.20826530456543, "global_step": 206067, "epoch": 4906} {"train_loss": -7.286293029785156, "global_step": 206068, "epoch": 4906} {"train_loss": -7.321567535400391, "global_step": 206069, "epoch": 4906} {"train_loss": -7.268536567687988, "global_step": 206070, "epoch": 4906} {"train_loss": -7.3617753982543945, "global_step": 206071, "epoch": 4906} {"train_loss": -7.204375743865967, "global_step": 206072, "epoch": 4906} {"train_loss": -7.34431266784668, "global_step": 206073, "epoch": 4906} {"train_loss": -7.283536911010742, "global_step": 206074, "epoch": 4906} {"train_loss": -7.304623126983643, "global_step": 206075, "epoch": 4906} {"train_loss": -7.298133373260498, "global_step": 206076, "epoch": 4906} {"train_loss": -7.3258514404296875, "global_step": 206077, "epoch": 4906} {"train_loss": -7.307926177978516, "global_step": 206078, "epoch": 4906} {"train_loss": -7.26602029800415, "global_step": 206079, "epoch": 4906} {"train_loss": -7.376014232635498, "global_step": 206080, "epoch": 4906} {"train_loss": -7.408364772796631, "global_step": 206081, "epoch": 4906} {"train_loss": -7.388345241546631, "global_step": 206082, "epoch": 4906} {"train_loss": -7.2440080642700195, "global_step": 206083, "epoch": 4906} {"train_loss": -7.225419044494629, "global_step": 206084, "epoch": 4906} {"train_loss": -7.173882961273193, "global_step": 206085, "epoch": 4906} {"train_loss": -7.378357410430908, "global_step": 206086, "epoch": 4906} {"train_loss": -7.289655685424805, "global_step": 206087, "epoch": 4906} {"train_loss": -7.296351432800293, "global_step": 206088, "epoch": 4906} {"train_loss": -7.294633388519287, "global_step": 206089, "epoch": 4906} {"train_loss": -7.325775146484375, "global_step": 206090, "epoch": 4906} {"train_loss": -7.299671173095703, "global_step": 206091, "epoch": 4906} {"train_loss": -7.2653303146362305, "global_step": 206092, "epoch": 4906} {"train_loss": -7.302634330022903, "global_step": 206093, "epoch": 4906, "val_loss": 69263.84375} {"train_loss": -7.3336920738220215, "global_step": 206094, "epoch": 4907} {"train_loss": -7.250336170196533, "global_step": 206095, "epoch": 4907} {"train_loss": -7.403208255767822, "global_step": 206096, "epoch": 4907} {"train_loss": -7.3723835945129395, "global_step": 206097, "epoch": 4907} {"train_loss": -7.322174549102783, "global_step": 206098, "epoch": 4907} {"train_loss": -7.348968505859375, "global_step": 206099, "epoch": 4907} {"train_loss": -7.3184990882873535, "global_step": 206100, "epoch": 4907} {"train_loss": -7.265710830688477, "global_step": 206101, "epoch": 4907} {"train_loss": -7.280142784118652, "global_step": 206102, "epoch": 4907} {"train_loss": -7.259061813354492, "global_step": 206103, "epoch": 4907} {"train_loss": -7.094664573669434, "global_step": 206104, "epoch": 4907} {"train_loss": -7.105428695678711, "global_step": 206105, "epoch": 4907} {"train_loss": -7.395572662353516, "global_step": 206106, "epoch": 4907} {"train_loss": -7.183671951293945, "global_step": 206107, "epoch": 4907} {"train_loss": -7.177037239074707, "global_step": 206108, "epoch": 4907} {"train_loss": -7.292700290679932, "global_step": 206109, "epoch": 4907} {"train_loss": -7.242645263671875, "global_step": 206110, "epoch": 4907} {"train_loss": -7.367443084716797, "global_step": 206111, "epoch": 4907} {"train_loss": -7.285984039306641, "global_step": 206112, "epoch": 4907} {"train_loss": -7.089574813842773, "global_step": 206113, "epoch": 4907} {"train_loss": -7.077975749969482, "global_step": 206114, "epoch": 4907} {"train_loss": -7.326478004455566, "global_step": 206115, "epoch": 4907} {"train_loss": -7.143886566162109, "global_step": 206116, "epoch": 4907} {"train_loss": -7.19008731842041, "global_step": 206117, "epoch": 4907} {"train_loss": -7.208097457885742, "global_step": 206118, "epoch": 4907} {"train_loss": -7.018062114715576, "global_step": 206119, "epoch": 4907} {"train_loss": -7.279427528381348, "global_step": 206120, "epoch": 4907} {"train_loss": -7.227731227874756, "global_step": 206121, "epoch": 4907} {"train_loss": -7.156986236572266, "global_step": 206122, "epoch": 4907} {"train_loss": -7.295272350311279, "global_step": 206123, "epoch": 4907} {"train_loss": -7.128053188323975, "global_step": 206124, "epoch": 4907} {"train_loss": -7.284470558166504, "global_step": 206125, "epoch": 4907} {"train_loss": -7.353663444519043, "global_step": 206126, "epoch": 4907} {"train_loss": -7.045226097106934, "global_step": 206127, "epoch": 4907} {"train_loss": -7.192779541015625, "global_step": 206128, "epoch": 4907} {"train_loss": -7.07596492767334, "global_step": 206129, "epoch": 4907} {"train_loss": -7.189945697784424, "global_step": 206130, "epoch": 4907} {"train_loss": -7.340285778045654, "global_step": 206131, "epoch": 4907} {"train_loss": -7.111417770385742, "global_step": 206132, "epoch": 4907} {"train_loss": -7.121186256408691, "global_step": 206133, "epoch": 4907} {"train_loss": -7.1622233390808105, "global_step": 206134, "epoch": 4907} {"train_loss": -7.2287967545645575, "global_step": 206135, "epoch": 4907, "val_loss": 69199.4375} {"train_loss": -7.254137992858887, "global_step": 206136, "epoch": 4908} {"train_loss": -7.266554832458496, "global_step": 206137, "epoch": 4908} {"train_loss": -7.125368118286133, "global_step": 206138, "epoch": 4908} {"train_loss": -7.248980522155762, "global_step": 206139, "epoch": 4908} {"train_loss": -7.195850849151611, "global_step": 206140, "epoch": 4908} {"train_loss": -7.200654029846191, "global_step": 206141, "epoch": 4908} {"train_loss": -7.223614692687988, "global_step": 206142, "epoch": 4908} {"train_loss": -7.1316022872924805, "global_step": 206143, "epoch": 4908} {"train_loss": -7.291410446166992, "global_step": 206144, "epoch": 4908} {"train_loss": -7.204485893249512, "global_step": 206145, "epoch": 4908} {"train_loss": -7.169010162353516, "global_step": 206146, "epoch": 4908} {"train_loss": -7.2346882820129395, "global_step": 206147, "epoch": 4908} {"train_loss": -7.18851375579834, "global_step": 206148, "epoch": 4908} {"train_loss": -7.315756797790527, "global_step": 206149, "epoch": 4908} {"train_loss": -7.331792831420898, "global_step": 206150, "epoch": 4908} {"train_loss": -7.307883262634277, "global_step": 206151, "epoch": 4908} {"train_loss": -7.221879005432129, "global_step": 206152, "epoch": 4908} {"train_loss": -7.210773468017578, "global_step": 206153, "epoch": 4908} {"train_loss": -7.2631683349609375, "global_step": 206154, "epoch": 4908} {"train_loss": -7.262775897979736, "global_step": 206155, "epoch": 4908} {"train_loss": -7.30654239654541, "global_step": 206156, "epoch": 4908} {"train_loss": -7.263581275939941, "global_step": 206157, "epoch": 4908} {"train_loss": -7.276278495788574, "global_step": 206158, "epoch": 4908} {"train_loss": -7.31746244430542, "global_step": 206159, "epoch": 4908} {"train_loss": -7.234433174133301, "global_step": 206160, "epoch": 4908} {"train_loss": -7.155450820922852, "global_step": 206161, "epoch": 4908} {"train_loss": -7.262453079223633, "global_step": 206162, "epoch": 4908} {"train_loss": -7.337949275970459, "global_step": 206163, "epoch": 4908} {"train_loss": -7.2382917404174805, "global_step": 206164, "epoch": 4908} {"train_loss": -7.3194580078125, "global_step": 206165, "epoch": 4908} {"train_loss": -7.292032718658447, "global_step": 206166, "epoch": 4908} {"train_loss": -7.288364410400391, "global_step": 206167, "epoch": 4908} {"train_loss": -7.275704383850098, "global_step": 206168, "epoch": 4908} {"train_loss": -7.310956001281738, "global_step": 206169, "epoch": 4908} {"train_loss": -7.191037178039551, "global_step": 206170, "epoch": 4908} {"train_loss": -7.337592124938965, "global_step": 206171, "epoch": 4908} {"train_loss": -7.225554466247559, "global_step": 206172, "epoch": 4908} {"train_loss": -7.2626214027404785, "global_step": 206173, "epoch": 4908} {"train_loss": -7.278610706329346, "global_step": 206174, "epoch": 4908} {"train_loss": -7.306563377380371, "global_step": 206175, "epoch": 4908} {"train_loss": -7.322858810424805, "global_step": 206176, "epoch": 4908} {"train_loss": -7.255905321666172, "global_step": 206177, "epoch": 4908, "val_loss": 69381.75} {"train_loss": -7.2643609046936035, "global_step": 206178, "epoch": 4909} {"train_loss": -7.314099311828613, "global_step": 206179, "epoch": 4909} {"train_loss": -7.233430862426758, "global_step": 206180, "epoch": 4909} {"train_loss": -7.241183280944824, "global_step": 206181, "epoch": 4909} {"train_loss": -7.367030143737793, "global_step": 206182, "epoch": 4909} {"train_loss": -7.278557777404785, "global_step": 206183, "epoch": 4909} {"train_loss": -7.263388633728027, "global_step": 206184, "epoch": 4909} {"train_loss": -7.293994426727295, "global_step": 206185, "epoch": 4909} {"train_loss": -7.281926155090332, "global_step": 206186, "epoch": 4909} {"train_loss": -7.227677345275879, "global_step": 206187, "epoch": 4909} {"train_loss": -7.26494836807251, "global_step": 206188, "epoch": 4909} {"train_loss": -7.284817695617676, "global_step": 206189, "epoch": 4909} {"train_loss": -7.39260721206665, "global_step": 206190, "epoch": 4909} {"train_loss": -7.317455768585205, "global_step": 206191, "epoch": 4909} {"train_loss": -7.184247016906738, "global_step": 206192, "epoch": 4909} {"train_loss": -7.3899335861206055, "global_step": 206193, "epoch": 4909} {"train_loss": -7.347121715545654, "global_step": 206194, "epoch": 4909} {"train_loss": -7.373591423034668, "global_step": 206195, "epoch": 4909} {"train_loss": -7.3622145652771, "global_step": 206196, "epoch": 4909} {"train_loss": -7.264909744262695, "global_step": 206197, "epoch": 4909} {"train_loss": -7.323916912078857, "global_step": 206198, "epoch": 4909} {"train_loss": -7.259490013122559, "global_step": 206199, "epoch": 4909} {"train_loss": -7.294614791870117, "global_step": 206200, "epoch": 4909} {"train_loss": -7.341819763183594, "global_step": 206201, "epoch": 4909} {"train_loss": -7.281757831573486, "global_step": 206202, "epoch": 4909} {"train_loss": -7.3361992835998535, "global_step": 206203, "epoch": 4909} {"train_loss": -7.29841423034668, "global_step": 206204, "epoch": 4909} {"train_loss": -7.348173141479492, "global_step": 206205, "epoch": 4909} {"train_loss": -7.296198844909668, "global_step": 206206, "epoch": 4909} {"train_loss": -7.307402610778809, "global_step": 206207, "epoch": 4909} {"train_loss": -7.249787330627441, "global_step": 206208, "epoch": 4909} {"train_loss": -7.35360050201416, "global_step": 206209, "epoch": 4909} {"train_loss": -7.332032203674316, "global_step": 206210, "epoch": 4909} {"train_loss": -7.314385890960693, "global_step": 206211, "epoch": 4909} {"train_loss": -7.3169145584106445, "global_step": 206212, "epoch": 4909} {"train_loss": -7.186936378479004, "global_step": 206213, "epoch": 4909} {"train_loss": -7.304121017456055, "global_step": 206214, "epoch": 4909} {"train_loss": -7.274819374084473, "global_step": 206215, "epoch": 4909} {"train_loss": -7.182501792907715, "global_step": 206216, "epoch": 4909} {"train_loss": -7.256699085235596, "global_step": 206217, "epoch": 4909} {"train_loss": -7.170543670654297, "global_step": 206218, "epoch": 4909} {"train_loss": -7.2923612254006525, "global_step": 206219, "epoch": 4909, "val_loss": 69332.09375} {"train_loss": -7.176880836486816, "global_step": 206220, "epoch": 4910} {"train_loss": -7.288301944732666, "global_step": 206221, "epoch": 4910} {"train_loss": -7.157759189605713, "global_step": 206222, "epoch": 4910} {"train_loss": -7.229269504547119, "global_step": 206223, "epoch": 4910} {"train_loss": -7.184142589569092, "global_step": 206224, "epoch": 4910} {"train_loss": -7.221522331237793, "global_step": 206225, "epoch": 4910} {"train_loss": -7.218106269836426, "global_step": 206226, "epoch": 4910} {"train_loss": -7.173020362854004, "global_step": 206227, "epoch": 4910} {"train_loss": -7.207486152648926, "global_step": 206228, "epoch": 4910} {"train_loss": -7.167918682098389, "global_step": 206229, "epoch": 4910} {"train_loss": -7.086215972900391, "global_step": 206230, "epoch": 4910} {"train_loss": -7.0981340408325195, "global_step": 206231, "epoch": 4910} {"train_loss": -7.13816499710083, "global_step": 206232, "epoch": 4910} {"train_loss": -7.235475540161133, "global_step": 206233, "epoch": 4910} {"train_loss": -7.067296981811523, "global_step": 206234, "epoch": 4910} {"train_loss": -7.222817420959473, "global_step": 206235, "epoch": 4910} {"train_loss": -7.170273303985596, "global_step": 206236, "epoch": 4910} {"train_loss": -7.080351829528809, "global_step": 206237, "epoch": 4910} {"train_loss": -7.288224220275879, "global_step": 206238, "epoch": 4910} {"train_loss": -7.2831220626831055, "global_step": 206239, "epoch": 4910} {"train_loss": -7.283944129943848, "global_step": 206240, "epoch": 4910} {"train_loss": -7.063694000244141, "global_step": 206241, "epoch": 4910} {"train_loss": -7.126847267150879, "global_step": 206242, "epoch": 4910} {"train_loss": -7.229558944702148, "global_step": 206243, "epoch": 4910} {"train_loss": -7.190556526184082, "global_step": 206244, "epoch": 4910} {"train_loss": -7.26193904876709, "global_step": 206245, "epoch": 4910} {"train_loss": -7.144192695617676, "global_step": 206246, "epoch": 4910} {"train_loss": -7.229470252990723, "global_step": 206247, "epoch": 4910} {"train_loss": -7.129511833190918, "global_step": 206248, "epoch": 4910} {"train_loss": -7.326850891113281, "global_step": 206249, "epoch": 4910} {"train_loss": -7.132193088531494, "global_step": 206250, "epoch": 4910} {"train_loss": -7.247285842895508, "global_step": 206251, "epoch": 4910} {"train_loss": -7.235057830810547, "global_step": 206252, "epoch": 4910} {"train_loss": -7.327967643737793, "global_step": 206253, "epoch": 4910} {"train_loss": -7.218286037445068, "global_step": 206254, "epoch": 4910} {"train_loss": -7.274110794067383, "global_step": 206255, "epoch": 4910} {"train_loss": -7.2547101974487305, "global_step": 206256, "epoch": 4910} {"train_loss": -7.287491798400879, "global_step": 206257, "epoch": 4910} {"train_loss": -7.294648170471191, "global_step": 206258, "epoch": 4910} {"train_loss": -7.224587917327881, "global_step": 206259, "epoch": 4910} {"train_loss": -7.273318290710449, "global_step": 206260, "epoch": 4910} {"train_loss": -7.208047866821289, "global_step": 206261, "epoch": 4910, "val_loss": 69161.03125} {"train_loss": -7.245416641235352, "global_step": 206262, "epoch": 4911} {"train_loss": -7.241135597229004, "global_step": 206263, "epoch": 4911} {"train_loss": -7.175217628479004, "global_step": 206264, "epoch": 4911} {"train_loss": -7.382770538330078, "global_step": 206265, "epoch": 4911} {"train_loss": -7.3198442459106445, "global_step": 206266, "epoch": 4911} {"train_loss": -7.189570426940918, "global_step": 206267, "epoch": 4911} {"train_loss": -7.292343616485596, "global_step": 206268, "epoch": 4911} {"train_loss": -7.364648818969727, "global_step": 206269, "epoch": 4911} {"train_loss": -7.363287448883057, "global_step": 206270, "epoch": 4911} {"train_loss": -7.320235252380371, "global_step": 206271, "epoch": 4911} {"train_loss": -7.284533500671387, "global_step": 206272, "epoch": 4911} {"train_loss": -7.323073863983154, "global_step": 206273, "epoch": 4911} {"train_loss": -7.276642799377441, "global_step": 206274, "epoch": 4911} {"train_loss": -7.28074312210083, "global_step": 206275, "epoch": 4911} {"train_loss": -7.398530006408691, "global_step": 206276, "epoch": 4911} {"train_loss": -7.362237930297852, "global_step": 206277, "epoch": 4911} {"train_loss": -7.392928123474121, "global_step": 206278, "epoch": 4911} {"train_loss": -7.298385143280029, "global_step": 206279, "epoch": 4911} {"train_loss": -7.414629936218262, "global_step": 206280, "epoch": 4911} {"train_loss": -7.291984558105469, "global_step": 206281, "epoch": 4911} {"train_loss": -7.286492347717285, "global_step": 206282, "epoch": 4911} {"train_loss": -7.285752296447754, "global_step": 206283, "epoch": 4911} {"train_loss": -7.4388885498046875, "global_step": 206284, "epoch": 4911} {"train_loss": -7.3661394119262695, "global_step": 206285, "epoch": 4911} {"train_loss": -7.334826469421387, "global_step": 206286, "epoch": 4911} {"train_loss": -7.323469161987305, "global_step": 206287, "epoch": 4911} {"train_loss": -7.364406585693359, "global_step": 206288, "epoch": 4911} {"train_loss": -7.458644866943359, "global_step": 206289, "epoch": 4911} {"train_loss": -7.325564384460449, "global_step": 206290, "epoch": 4911} {"train_loss": -7.374866008758545, "global_step": 206291, "epoch": 4911} {"train_loss": -7.3370280265808105, "global_step": 206292, "epoch": 4911} {"train_loss": -7.5272603034973145, "global_step": 206293, "epoch": 4911} {"train_loss": -7.331775665283203, "global_step": 206294, "epoch": 4911} {"train_loss": -7.239762306213379, "global_step": 206295, "epoch": 4911} {"train_loss": -7.302986145019531, "global_step": 206296, "epoch": 4911} {"train_loss": -7.377325057983398, "global_step": 206297, "epoch": 4911} {"train_loss": -7.286081790924072, "global_step": 206298, "epoch": 4911} {"train_loss": -7.396986961364746, "global_step": 206299, "epoch": 4911} {"train_loss": -7.346263885498047, "global_step": 206300, "epoch": 4911} {"train_loss": -7.361941814422607, "global_step": 206301, "epoch": 4911} {"train_loss": -7.240716934204102, "global_step": 206302, "epoch": 4911} {"train_loss": -7.327717429115658, "global_step": 206303, "epoch": 4911, "val_loss": 69183.7421875} {"train_loss": -7.334423065185547, "global_step": 206304, "epoch": 4912} {"train_loss": -7.375386714935303, "global_step": 206305, "epoch": 4912} {"train_loss": -7.311136245727539, "global_step": 206306, "epoch": 4912} {"train_loss": -7.233585357666016, "global_step": 206307, "epoch": 4912} {"train_loss": -7.216470718383789, "global_step": 206308, "epoch": 4912} {"train_loss": -7.434867858886719, "global_step": 206309, "epoch": 4912} {"train_loss": -7.125024318695068, "global_step": 206310, "epoch": 4912} {"train_loss": -7.1180830001831055, "global_step": 206311, "epoch": 4912} {"train_loss": -7.293482780456543, "global_step": 206312, "epoch": 4912} {"train_loss": -7.411317348480225, "global_step": 206313, "epoch": 4912} {"train_loss": -7.304091453552246, "global_step": 206314, "epoch": 4912} {"train_loss": -7.266842842102051, "global_step": 206315, "epoch": 4912} {"train_loss": -7.164369583129883, "global_step": 206316, "epoch": 4912} {"train_loss": -7.329824924468994, "global_step": 206317, "epoch": 4912} {"train_loss": -7.238285541534424, "global_step": 206318, "epoch": 4912} {"train_loss": -7.31230354309082, "global_step": 206319, "epoch": 4912} {"train_loss": -7.20734977722168, "global_step": 206320, "epoch": 4912} {"train_loss": -7.166477680206299, "global_step": 206321, "epoch": 4912} {"train_loss": -7.349926948547363, "global_step": 206322, "epoch": 4912} {"train_loss": -7.174612998962402, "global_step": 206323, "epoch": 4912} {"train_loss": -7.373844146728516, "global_step": 206324, "epoch": 4912} {"train_loss": -7.289557456970215, "global_step": 206325, "epoch": 4912} {"train_loss": -7.237649917602539, "global_step": 206326, "epoch": 4912} {"train_loss": -7.148364543914795, "global_step": 206327, "epoch": 4912} {"train_loss": -7.193758010864258, "global_step": 206328, "epoch": 4912} {"train_loss": -7.277304649353027, "global_step": 206329, "epoch": 4912} {"train_loss": -7.218710899353027, "global_step": 206330, "epoch": 4912} {"train_loss": -7.194920063018799, "global_step": 206331, "epoch": 4912} {"train_loss": -7.256028652191162, "global_step": 206332, "epoch": 4912} {"train_loss": -7.165903091430664, "global_step": 206333, "epoch": 4912} {"train_loss": -7.321656227111816, "global_step": 206334, "epoch": 4912} {"train_loss": -7.304353713989258, "global_step": 206335, "epoch": 4912} {"train_loss": -6.998117446899414, "global_step": 206336, "epoch": 4912} {"train_loss": -7.18459939956665, "global_step": 206337, "epoch": 4912} {"train_loss": -7.150179862976074, "global_step": 206338, "epoch": 4912} {"train_loss": -6.997506141662598, "global_step": 206339, "epoch": 4912} {"train_loss": -7.2504963874816895, "global_step": 206340, "epoch": 4912} {"train_loss": -7.1197309494018555, "global_step": 206341, "epoch": 4912} {"train_loss": -7.164634704589844, "global_step": 206342, "epoch": 4912} {"train_loss": -7.278858184814453, "global_step": 206343, "epoch": 4912} {"train_loss": -7.133288860321045, "global_step": 206344, "epoch": 4912} {"train_loss": -7.237945942651658, "global_step": 206345, "epoch": 4912, "val_loss": 69098.0} {"train_loss": -7.108610153198242, "global_step": 206346, "epoch": 4913} {"train_loss": -7.156381607055664, "global_step": 206347, "epoch": 4913} {"train_loss": -7.127976417541504, "global_step": 206348, "epoch": 4913} {"train_loss": -7.105824947357178, "global_step": 206349, "epoch": 4913} {"train_loss": -7.274969100952148, "global_step": 206350, "epoch": 4913} {"train_loss": -7.068526268005371, "global_step": 206351, "epoch": 4913} {"train_loss": -7.193411350250244, "global_step": 206352, "epoch": 4913} {"train_loss": -7.105498313903809, "global_step": 206353, "epoch": 4913} {"train_loss": -7.117883205413818, "global_step": 206354, "epoch": 4913} {"train_loss": -7.299678802490234, "global_step": 206355, "epoch": 4913} {"train_loss": -7.1862874031066895, "global_step": 206356, "epoch": 4913} {"train_loss": -7.243041515350342, "global_step": 206357, "epoch": 4913} {"train_loss": -7.166332244873047, "global_step": 206358, "epoch": 4913} {"train_loss": -7.210958003997803, "global_step": 206359, "epoch": 4913} {"train_loss": -7.091921329498291, "global_step": 206360, "epoch": 4913} {"train_loss": -7.240895748138428, "global_step": 206361, "epoch": 4913} {"train_loss": -7.279516220092773, "global_step": 206362, "epoch": 4913} {"train_loss": -7.43112850189209, "global_step": 206363, "epoch": 4913} {"train_loss": -7.32509183883667, "global_step": 206364, "epoch": 4913} {"train_loss": -7.291625499725342, "global_step": 206365, "epoch": 4913} {"train_loss": -7.248380184173584, "global_step": 206366, "epoch": 4913} {"train_loss": -7.387686729431152, "global_step": 206367, "epoch": 4913} {"train_loss": -7.297018527984619, "global_step": 206368, "epoch": 4913} {"train_loss": -7.2064313888549805, "global_step": 206369, "epoch": 4913} {"train_loss": -7.261247634887695, "global_step": 206370, "epoch": 4913} {"train_loss": -7.271308422088623, "global_step": 206371, "epoch": 4913} {"train_loss": -7.232229232788086, "global_step": 206372, "epoch": 4913} {"train_loss": -7.30242395401001, "global_step": 206373, "epoch": 4913} {"train_loss": -7.230053901672363, "global_step": 206374, "epoch": 4913} {"train_loss": -7.325191020965576, "global_step": 206375, "epoch": 4913} {"train_loss": -7.192752838134766, "global_step": 206376, "epoch": 4913} {"train_loss": -7.263553619384766, "global_step": 206377, "epoch": 4913} {"train_loss": -7.298559665679932, "global_step": 206378, "epoch": 4913} {"train_loss": -7.1907734870910645, "global_step": 206379, "epoch": 4913} {"train_loss": -7.254068851470947, "global_step": 206380, "epoch": 4913} {"train_loss": -7.288640022277832, "global_step": 206381, "epoch": 4913} {"train_loss": -7.360509395599365, "global_step": 206382, "epoch": 4913} {"train_loss": -7.229857921600342, "global_step": 206383, "epoch": 4913} {"train_loss": -7.246776103973389, "global_step": 206384, "epoch": 4913} {"train_loss": -7.222036361694336, "global_step": 206385, "epoch": 4913} {"train_loss": -7.355018615722656, "global_step": 206386, "epoch": 4913} {"train_loss": -7.2380084083193825, "global_step": 206387, "epoch": 4913, "val_loss": 69230.2109375} {"train_loss": -7.160533905029297, "global_step": 206388, "epoch": 4914} {"train_loss": -7.268126964569092, "global_step": 206389, "epoch": 4914} {"train_loss": -7.27253532409668, "global_step": 206390, "epoch": 4914} {"train_loss": -7.339445114135742, "global_step": 206391, "epoch": 4914} {"train_loss": -7.35972785949707, "global_step": 206392, "epoch": 4914} {"train_loss": -7.309116363525391, "global_step": 206393, "epoch": 4914} {"train_loss": -7.3213348388671875, "global_step": 206394, "epoch": 4914} {"train_loss": -7.246709823608398, "global_step": 206395, "epoch": 4914} {"train_loss": -7.36821985244751, "global_step": 206396, "epoch": 4914} {"train_loss": -7.262392520904541, "global_step": 206397, "epoch": 4914} {"train_loss": -7.252084732055664, "global_step": 206398, "epoch": 4914} {"train_loss": -7.324697971343994, "global_step": 206399, "epoch": 4914} {"train_loss": -7.32429313659668, "global_step": 206400, "epoch": 4914} {"train_loss": -7.337183952331543, "global_step": 206401, "epoch": 4914} {"train_loss": -7.246808052062988, "global_step": 206402, "epoch": 4914} {"train_loss": -7.262212753295898, "global_step": 206403, "epoch": 4914} {"train_loss": -7.184557914733887, "global_step": 206404, "epoch": 4914} {"train_loss": -7.35526180267334, "global_step": 206405, "epoch": 4914} {"train_loss": -7.370335578918457, "global_step": 206406, "epoch": 4914} {"train_loss": -7.407392501831055, "global_step": 206407, "epoch": 4914} {"train_loss": -7.284248352050781, "global_step": 206408, "epoch": 4914} {"train_loss": -7.240517616271973, "global_step": 206409, "epoch": 4914} {"train_loss": -7.316276550292969, "global_step": 206410, "epoch": 4914} {"train_loss": -7.201552391052246, "global_step": 206411, "epoch": 4914} {"train_loss": -7.327145576477051, "global_step": 206412, "epoch": 4914} {"train_loss": -7.269503116607666, "global_step": 206413, "epoch": 4914} {"train_loss": -7.350533962249756, "global_step": 206414, "epoch": 4914} {"train_loss": -7.387958526611328, "global_step": 206415, "epoch": 4914} {"train_loss": -7.365617275238037, "global_step": 206416, "epoch": 4914} {"train_loss": -7.191593647003174, "global_step": 206417, "epoch": 4914} {"train_loss": -7.196346759796143, "global_step": 206418, "epoch": 4914} {"train_loss": -7.275752067565918, "global_step": 206419, "epoch": 4914} {"train_loss": -7.245073318481445, "global_step": 206420, "epoch": 4914} {"train_loss": -7.224359512329102, "global_step": 206421, "epoch": 4914} {"train_loss": -7.263118743896484, "global_step": 206422, "epoch": 4914} {"train_loss": -7.357434272766113, "global_step": 206423, "epoch": 4914} {"train_loss": -7.289190769195557, "global_step": 206424, "epoch": 4914} {"train_loss": -7.274022102355957, "global_step": 206425, "epoch": 4914} {"train_loss": -7.3161492347717285, "global_step": 206426, "epoch": 4914} {"train_loss": -7.308889389038086, "global_step": 206427, "epoch": 4914} {"train_loss": -7.279326438903809, "global_step": 206428, "epoch": 4914} {"train_loss": -7.2910684290386385, "global_step": 206429, "epoch": 4914, "val_loss": 69232.8359375} {"train_loss": -7.202427864074707, "global_step": 206430, "epoch": 4915} {"train_loss": -7.351734161376953, "global_step": 206431, "epoch": 4915} {"train_loss": -7.2925310134887695, "global_step": 206432, "epoch": 4915} {"train_loss": -7.228396892547607, "global_step": 206433, "epoch": 4915} {"train_loss": -7.253288269042969, "global_step": 206434, "epoch": 4915} {"train_loss": -7.30859899520874, "global_step": 206435, "epoch": 4915} {"train_loss": -7.321022987365723, "global_step": 206436, "epoch": 4915} {"train_loss": -7.379010200500488, "global_step": 206437, "epoch": 4915} {"train_loss": -7.318235397338867, "global_step": 206438, "epoch": 4915} {"train_loss": -7.136866569519043, "global_step": 206439, "epoch": 4915} {"train_loss": -7.273373603820801, "global_step": 206440, "epoch": 4915} {"train_loss": -7.382157802581787, "global_step": 206441, "epoch": 4915} {"train_loss": -7.296352863311768, "global_step": 206442, "epoch": 4915} {"train_loss": -7.3223958015441895, "global_step": 206443, "epoch": 4915} {"train_loss": -7.385443210601807, "global_step": 206444, "epoch": 4915} {"train_loss": -7.2999796867370605, "global_step": 206445, "epoch": 4915} {"train_loss": -7.316830635070801, "global_step": 206446, "epoch": 4915} {"train_loss": -7.4747700691223145, "global_step": 206447, "epoch": 4915} {"train_loss": -7.246807098388672, "global_step": 206448, "epoch": 4915} {"train_loss": -7.356729984283447, "global_step": 206449, "epoch": 4915} {"train_loss": -7.272256851196289, "global_step": 206450, "epoch": 4915} {"train_loss": -7.292629718780518, "global_step": 206451, "epoch": 4915} {"train_loss": -7.2869977951049805, "global_step": 206452, "epoch": 4915} {"train_loss": -7.388051986694336, "global_step": 206453, "epoch": 4915} {"train_loss": -7.374265670776367, "global_step": 206454, "epoch": 4915} {"train_loss": -7.191172122955322, "global_step": 206455, "epoch": 4915} {"train_loss": -7.212289810180664, "global_step": 206456, "epoch": 4915} {"train_loss": -7.33167839050293, "global_step": 206457, "epoch": 4915} {"train_loss": -7.165562152862549, "global_step": 206458, "epoch": 4915} {"train_loss": -7.305381774902344, "global_step": 206459, "epoch": 4915} {"train_loss": -7.2463483810424805, "global_step": 206460, "epoch": 4915} {"train_loss": -7.225246906280518, "global_step": 206461, "epoch": 4915} {"train_loss": -7.2872419357299805, "global_step": 206462, "epoch": 4915} {"train_loss": -7.124500274658203, "global_step": 206463, "epoch": 4915} {"train_loss": -7.28233003616333, "global_step": 206464, "epoch": 4915} {"train_loss": -7.3159284591674805, "global_step": 206465, "epoch": 4915} {"train_loss": -7.260628700256348, "global_step": 206466, "epoch": 4915} {"train_loss": -7.210948467254639, "global_step": 206467, "epoch": 4915} {"train_loss": -7.284819602966309, "global_step": 206468, "epoch": 4915} {"train_loss": -7.280520439147949, "global_step": 206469, "epoch": 4915} {"train_loss": -7.330509662628174, "global_step": 206470, "epoch": 4915} {"train_loss": -7.286579983575003, "global_step": 206471, "epoch": 4915, "val_loss": 69210.5625} {"train_loss": -7.2965617179870605, "global_step": 206472, "epoch": 4916} {"train_loss": -7.360232830047607, "global_step": 206473, "epoch": 4916} {"train_loss": -7.19547176361084, "global_step": 206474, "epoch": 4916} {"train_loss": -7.324769496917725, "global_step": 206475, "epoch": 4916} {"train_loss": -7.276397705078125, "global_step": 206476, "epoch": 4916} {"train_loss": -7.254211902618408, "global_step": 206477, "epoch": 4916} {"train_loss": -7.31467342376709, "global_step": 206478, "epoch": 4916} {"train_loss": -7.13805627822876, "global_step": 206479, "epoch": 4916} {"train_loss": -7.270371437072754, "global_step": 206480, "epoch": 4916} {"train_loss": -7.2554545402526855, "global_step": 206481, "epoch": 4916} {"train_loss": -7.187568664550781, "global_step": 206482, "epoch": 4916} {"train_loss": -7.171237945556641, "global_step": 206483, "epoch": 4916} {"train_loss": -7.215368270874023, "global_step": 206484, "epoch": 4916} {"train_loss": -7.308600902557373, "global_step": 206485, "epoch": 4916} {"train_loss": -7.23415994644165, "global_step": 206486, "epoch": 4916} {"train_loss": -7.165810585021973, "global_step": 206487, "epoch": 4916} {"train_loss": -7.308271408081055, "global_step": 206488, "epoch": 4916} {"train_loss": -7.224389553070068, "global_step": 206489, "epoch": 4916} {"train_loss": -7.289113998413086, "global_step": 206490, "epoch": 4916} {"train_loss": -7.181013584136963, "global_step": 206491, "epoch": 4916} {"train_loss": -7.206976890563965, "global_step": 206492, "epoch": 4916} {"train_loss": -7.317795276641846, "global_step": 206493, "epoch": 4916} {"train_loss": -7.2376508712768555, "global_step": 206494, "epoch": 4916} {"train_loss": -7.217787742614746, "global_step": 206495, "epoch": 4916} {"train_loss": -7.345667839050293, "global_step": 206496, "epoch": 4916} {"train_loss": -7.267061710357666, "global_step": 206497, "epoch": 4916} {"train_loss": -7.303092002868652, "global_step": 206498, "epoch": 4916} {"train_loss": -7.239502906799316, "global_step": 206499, "epoch": 4916} {"train_loss": -7.260748863220215, "global_step": 206500, "epoch": 4916} {"train_loss": -7.263862609863281, "global_step": 206501, "epoch": 4916} {"train_loss": -7.245485782623291, "global_step": 206502, "epoch": 4916} {"train_loss": -7.236541748046875, "global_step": 206503, "epoch": 4916} {"train_loss": -7.266931533813477, "global_step": 206504, "epoch": 4916} {"train_loss": -7.321544647216797, "global_step": 206505, "epoch": 4916} {"train_loss": -7.211123466491699, "global_step": 206506, "epoch": 4916} {"train_loss": -7.099775314331055, "global_step": 206507, "epoch": 4916} {"train_loss": -7.277541160583496, "global_step": 206508, "epoch": 4916} {"train_loss": -7.2421979904174805, "global_step": 206509, "epoch": 4916} {"train_loss": -7.410599708557129, "global_step": 206510, "epoch": 4916} {"train_loss": -7.3187947273254395, "global_step": 206511, "epoch": 4916} {"train_loss": -7.3239827156066895, "global_step": 206512, "epoch": 4916} {"train_loss": -7.260632469540551, "global_step": 206513, "epoch": 4916, "val_loss": 69076.421875} {"train_loss": -7.329224586486816, "global_step": 206514, "epoch": 4917} {"train_loss": -7.348479270935059, "global_step": 206515, "epoch": 4917} {"train_loss": -7.289834022521973, "global_step": 206516, "epoch": 4917} {"train_loss": -7.291240692138672, "global_step": 206517, "epoch": 4917} {"train_loss": -7.040465354919434, "global_step": 206518, "epoch": 4917} {"train_loss": -7.142988204956055, "global_step": 206519, "epoch": 4917} {"train_loss": -7.231281757354736, "global_step": 206520, "epoch": 4917} {"train_loss": -7.027573585510254, "global_step": 206521, "epoch": 4917} {"train_loss": -7.076126575469971, "global_step": 206522, "epoch": 4917} {"train_loss": -7.170814037322998, "global_step": 206523, "epoch": 4917} {"train_loss": -7.113956451416016, "global_step": 206524, "epoch": 4917} {"train_loss": -6.99180793762207, "global_step": 206525, "epoch": 4917} {"train_loss": -7.296204090118408, "global_step": 206526, "epoch": 4917} {"train_loss": -7.207311630249023, "global_step": 206527, "epoch": 4917} {"train_loss": -7.190406799316406, "global_step": 206528, "epoch": 4917} {"train_loss": -7.144179821014404, "global_step": 206529, "epoch": 4917} {"train_loss": -7.122387886047363, "global_step": 206530, "epoch": 4917} {"train_loss": -7.074750900268555, "global_step": 206531, "epoch": 4917} {"train_loss": -7.166280746459961, "global_step": 206532, "epoch": 4917} {"train_loss": -7.1249308586120605, "global_step": 206533, "epoch": 4917} {"train_loss": -7.140501022338867, "global_step": 206534, "epoch": 4917} {"train_loss": -7.133354663848877, "global_step": 206535, "epoch": 4917} {"train_loss": -7.154566764831543, "global_step": 206536, "epoch": 4917} {"train_loss": -7.168239116668701, "global_step": 206537, "epoch": 4917} {"train_loss": -7.155178070068359, "global_step": 206538, "epoch": 4917} {"train_loss": -7.2176713943481445, "global_step": 206539, "epoch": 4917} {"train_loss": -7.169071197509766, "global_step": 206540, "epoch": 4917} {"train_loss": -7.2581095695495605, "global_step": 206541, "epoch": 4917} {"train_loss": -7.312795639038086, "global_step": 206542, "epoch": 4917} {"train_loss": -7.206859588623047, "global_step": 206543, "epoch": 4917} {"train_loss": -7.250915050506592, "global_step": 206544, "epoch": 4917} {"train_loss": -7.243373870849609, "global_step": 206545, "epoch": 4917} {"train_loss": -7.219900131225586, "global_step": 206546, "epoch": 4917} {"train_loss": -7.261987686157227, "global_step": 206547, "epoch": 4917} {"train_loss": -7.203668594360352, "global_step": 206548, "epoch": 4917} {"train_loss": -7.272429466247559, "global_step": 206549, "epoch": 4917} {"train_loss": -7.316675662994385, "global_step": 206550, "epoch": 4917} {"train_loss": -7.2042975425720215, "global_step": 206551, "epoch": 4917} {"train_loss": -7.354353427886963, "global_step": 206552, "epoch": 4917} {"train_loss": -7.323472023010254, "global_step": 206553, "epoch": 4917} {"train_loss": -7.198287010192871, "global_step": 206554, "epoch": 4917} {"train_loss": -7.200219143004644, "global_step": 206555, "epoch": 4917, "val_loss": 69225.5546875} {"train_loss": -7.345047950744629, "global_step": 206556, "epoch": 4918} {"train_loss": -7.374930381774902, "global_step": 206557, "epoch": 4918} {"train_loss": -7.322929382324219, "global_step": 206558, "epoch": 4918} {"train_loss": -7.318020820617676, "global_step": 206559, "epoch": 4918} {"train_loss": -7.269881248474121, "global_step": 206560, "epoch": 4918} {"train_loss": -7.29524040222168, "global_step": 206561, "epoch": 4918} {"train_loss": -7.390191078186035, "global_step": 206562, "epoch": 4918} {"train_loss": -7.245583534240723, "global_step": 206563, "epoch": 4918} {"train_loss": -7.317776679992676, "global_step": 206564, "epoch": 4918} {"train_loss": -7.355865001678467, "global_step": 206565, "epoch": 4918} {"train_loss": -7.282135009765625, "global_step": 206566, "epoch": 4918} {"train_loss": -7.347716808319092, "global_step": 206567, "epoch": 4918} {"train_loss": -7.252016067504883, "global_step": 206568, "epoch": 4918} {"train_loss": -7.239371299743652, "global_step": 206569, "epoch": 4918} {"train_loss": -7.325908184051514, "global_step": 206570, "epoch": 4918} {"train_loss": -7.241388320922852, "global_step": 206571, "epoch": 4918} {"train_loss": -7.267307281494141, "global_step": 206572, "epoch": 4918} {"train_loss": -7.348813056945801, "global_step": 206573, "epoch": 4918} {"train_loss": -7.325794696807861, "global_step": 206574, "epoch": 4918} {"train_loss": -7.325247287750244, "global_step": 206575, "epoch": 4918} {"train_loss": -7.273427963256836, "global_step": 206576, "epoch": 4918} {"train_loss": -7.290111541748047, "global_step": 206577, "epoch": 4918} {"train_loss": -7.350936412811279, "global_step": 206578, "epoch": 4918} {"train_loss": -7.248246192932129, "global_step": 206579, "epoch": 4918} {"train_loss": -7.30487585067749, "global_step": 206580, "epoch": 4918} {"train_loss": -7.391392707824707, "global_step": 206581, "epoch": 4918} {"train_loss": -7.221315383911133, "global_step": 206582, "epoch": 4918} {"train_loss": -7.3461995124816895, "global_step": 206583, "epoch": 4918} {"train_loss": -7.407856464385986, "global_step": 206584, "epoch": 4918} {"train_loss": -7.398348808288574, "global_step": 206585, "epoch": 4918} {"train_loss": -7.350855350494385, "global_step": 206586, "epoch": 4918} {"train_loss": -7.248578071594238, "global_step": 206587, "epoch": 4918} {"train_loss": -7.3342180252075195, "global_step": 206588, "epoch": 4918} {"train_loss": -7.270484924316406, "global_step": 206589, "epoch": 4918} {"train_loss": -7.281855583190918, "global_step": 206590, "epoch": 4918} {"train_loss": -7.357874870300293, "global_step": 206591, "epoch": 4918} {"train_loss": -7.320195198059082, "global_step": 206592, "epoch": 4918} {"train_loss": -7.216810703277588, "global_step": 206593, "epoch": 4918} {"train_loss": -7.206672668457031, "global_step": 206594, "epoch": 4918} {"train_loss": -7.2560319900512695, "global_step": 206595, "epoch": 4918} {"train_loss": -7.2715606689453125, "global_step": 206596, "epoch": 4918} {"train_loss": -7.30537241981143, "global_step": 206597, "epoch": 4918, "val_loss": 69105.2578125} {"train_loss": -7.360732078552246, "global_step": 206598, "epoch": 4919} {"train_loss": -7.191022872924805, "global_step": 206599, "epoch": 4919} {"train_loss": -7.4116129875183105, "global_step": 206600, "epoch": 4919} {"train_loss": -7.310491561889648, "global_step": 206601, "epoch": 4919} {"train_loss": -7.192574501037598, "global_step": 206602, "epoch": 4919} {"train_loss": -7.2756028175354, "global_step": 206603, "epoch": 4919} {"train_loss": -7.1319780349731445, "global_step": 206604, "epoch": 4919} {"train_loss": -7.2442731857299805, "global_step": 206605, "epoch": 4919} {"train_loss": -7.281857490539551, "global_step": 206606, "epoch": 4919} {"train_loss": -7.312471866607666, "global_step": 206607, "epoch": 4919} {"train_loss": -7.326584339141846, "global_step": 206608, "epoch": 4919} {"train_loss": -7.336575031280518, "global_step": 206609, "epoch": 4919} {"train_loss": -7.265867233276367, "global_step": 206610, "epoch": 4919} {"train_loss": -7.246946811676025, "global_step": 206611, "epoch": 4919} {"train_loss": -7.168242454528809, "global_step": 206612, "epoch": 4919} {"train_loss": -7.2108612060546875, "global_step": 206613, "epoch": 4919} {"train_loss": -7.297501087188721, "global_step": 206614, "epoch": 4919} {"train_loss": -7.246636390686035, "global_step": 206615, "epoch": 4919} {"train_loss": -7.262187957763672, "global_step": 206616, "epoch": 4919} {"train_loss": -7.272880554199219, "global_step": 206617, "epoch": 4919} {"train_loss": -7.172222137451172, "global_step": 206618, "epoch": 4919} {"train_loss": -7.140619277954102, "global_step": 206619, "epoch": 4919} {"train_loss": -7.266600131988525, "global_step": 206620, "epoch": 4919} {"train_loss": -7.195804595947266, "global_step": 206621, "epoch": 4919} {"train_loss": -7.224062919616699, "global_step": 206622, "epoch": 4919} {"train_loss": -7.378615379333496, "global_step": 206623, "epoch": 4919} {"train_loss": -7.295048713684082, "global_step": 206624, "epoch": 4919} {"train_loss": -7.307656288146973, "global_step": 206625, "epoch": 4919} {"train_loss": -7.185751438140869, "global_step": 206626, "epoch": 4919} {"train_loss": -7.230765342712402, "global_step": 206627, "epoch": 4919} {"train_loss": -7.259842872619629, "global_step": 206628, "epoch": 4919} {"train_loss": -7.237435340881348, "global_step": 206629, "epoch": 4919} {"train_loss": -7.225856781005859, "global_step": 206630, "epoch": 4919} {"train_loss": -7.2533721923828125, "global_step": 206631, "epoch": 4919} {"train_loss": -7.338239669799805, "global_step": 206632, "epoch": 4919} {"train_loss": -7.227744102478027, "global_step": 206633, "epoch": 4919} {"train_loss": -7.278776168823242, "global_step": 206634, "epoch": 4919} {"train_loss": -7.287082195281982, "global_step": 206635, "epoch": 4919} {"train_loss": -7.23486328125, "global_step": 206636, "epoch": 4919} {"train_loss": -7.330085277557373, "global_step": 206637, "epoch": 4919} {"train_loss": -7.188467025756836, "global_step": 206638, "epoch": 4919} {"train_loss": -7.258357184273856, "global_step": 206639, "epoch": 4919, "val_loss": 69286.484375} {"train_loss": -7.195930480957031, "global_step": 206640, "epoch": 4920} {"train_loss": -7.353427886962891, "global_step": 206641, "epoch": 4920} {"train_loss": -7.340583801269531, "global_step": 206642, "epoch": 4920} {"train_loss": -7.226571083068848, "global_step": 206643, "epoch": 4920} {"train_loss": -7.2580485343933105, "global_step": 206644, "epoch": 4920} {"train_loss": -7.312849044799805, "global_step": 206645, "epoch": 4920} {"train_loss": -7.2893967628479, "global_step": 206646, "epoch": 4920} {"train_loss": -7.193676948547363, "global_step": 206647, "epoch": 4920} {"train_loss": -7.320428848266602, "global_step": 206648, "epoch": 4920} {"train_loss": -7.339941024780273, "global_step": 206649, "epoch": 4920} {"train_loss": -7.331655025482178, "global_step": 206650, "epoch": 4920} {"train_loss": -7.20798397064209, "global_step": 206651, "epoch": 4920} {"train_loss": -7.3199262619018555, "global_step": 206652, "epoch": 4920} {"train_loss": -7.2400102615356445, "global_step": 206653, "epoch": 4920} {"train_loss": -7.178016662597656, "global_step": 206654, "epoch": 4920} {"train_loss": -7.20348596572876, "global_step": 206655, "epoch": 4920} {"train_loss": -7.290752410888672, "global_step": 206656, "epoch": 4920} {"train_loss": -7.12960958480835, "global_step": 206657, "epoch": 4920} {"train_loss": -7.307694435119629, "global_step": 206658, "epoch": 4920} {"train_loss": -7.295253276824951, "global_step": 206659, "epoch": 4920} {"train_loss": -7.16916561126709, "global_step": 206660, "epoch": 4920} {"train_loss": -7.294797897338867, "global_step": 206661, "epoch": 4920} {"train_loss": -7.108339786529541, "global_step": 206662, "epoch": 4920} {"train_loss": -6.890813827514648, "global_step": 206663, "epoch": 4920} {"train_loss": -7.23356819152832, "global_step": 206664, "epoch": 4920} {"train_loss": -6.871863842010498, "global_step": 206665, "epoch": 4920} {"train_loss": -7.228000640869141, "global_step": 206666, "epoch": 4920} {"train_loss": -7.070491313934326, "global_step": 206667, "epoch": 4920} {"train_loss": -7.153892517089844, "global_step": 206668, "epoch": 4920} {"train_loss": -7.228891849517822, "global_step": 206669, "epoch": 4920} {"train_loss": -7.200400352478027, "global_step": 206670, "epoch": 4920} {"train_loss": -7.315821647644043, "global_step": 206671, "epoch": 4920} {"train_loss": -7.18499231338501, "global_step": 206672, "epoch": 4920} {"train_loss": -7.335636138916016, "global_step": 206673, "epoch": 4920} {"train_loss": -7.087835788726807, "global_step": 206674, "epoch": 4920} {"train_loss": -7.199986457824707, "global_step": 206675, "epoch": 4920} {"train_loss": -7.092502593994141, "global_step": 206676, "epoch": 4920} {"train_loss": -7.2968854904174805, "global_step": 206677, "epoch": 4920} {"train_loss": -7.258631706237793, "global_step": 206678, "epoch": 4920} {"train_loss": -7.228797435760498, "global_step": 206679, "epoch": 4920} {"train_loss": -7.193287372589111, "global_step": 206680, "epoch": 4920} {"train_loss": -7.219128551937285, "global_step": 206681, "epoch": 4920, "val_loss": 69235.640625} {"train_loss": -7.281297206878662, "global_step": 206682, "epoch": 4921} {"train_loss": -7.184795379638672, "global_step": 206683, "epoch": 4921} {"train_loss": -7.077277660369873, "global_step": 206684, "epoch": 4921} {"train_loss": -7.330290794372559, "global_step": 206685, "epoch": 4921} {"train_loss": -7.223690509796143, "global_step": 206686, "epoch": 4921} {"train_loss": -7.3408203125, "global_step": 206687, "epoch": 4921} {"train_loss": -7.206833839416504, "global_step": 206688, "epoch": 4921} {"train_loss": -7.204204559326172, "global_step": 206689, "epoch": 4921} {"train_loss": -7.3329572677612305, "global_step": 206690, "epoch": 4921} {"train_loss": -7.2602949142456055, "global_step": 206691, "epoch": 4921} {"train_loss": -7.332101821899414, "global_step": 206692, "epoch": 4921} {"train_loss": -7.292056083679199, "global_step": 206693, "epoch": 4921} {"train_loss": -7.39214563369751, "global_step": 206694, "epoch": 4921} {"train_loss": -7.237879276275635, "global_step": 206695, "epoch": 4921} {"train_loss": -7.34613037109375, "global_step": 206696, "epoch": 4921} {"train_loss": -7.3324785232543945, "global_step": 206697, "epoch": 4921} {"train_loss": -7.240546226501465, "global_step": 206698, "epoch": 4921} {"train_loss": -7.310925483703613, "global_step": 206699, "epoch": 4921} {"train_loss": -7.304206848144531, "global_step": 206700, "epoch": 4921} {"train_loss": -7.464326858520508, "global_step": 206701, "epoch": 4921} {"train_loss": -7.238790512084961, "global_step": 206702, "epoch": 4921} {"train_loss": -7.34425687789917, "global_step": 206703, "epoch": 4921} {"train_loss": -7.335354804992676, "global_step": 206704, "epoch": 4921} {"train_loss": -7.312838554382324, "global_step": 206705, "epoch": 4921} {"train_loss": -7.27155065536499, "global_step": 206706, "epoch": 4921} {"train_loss": -7.187301158905029, "global_step": 206707, "epoch": 4921} {"train_loss": -7.4141693115234375, "global_step": 206708, "epoch": 4921} {"train_loss": -7.2798638343811035, "global_step": 206709, "epoch": 4921} {"train_loss": -7.364638328552246, "global_step": 206710, "epoch": 4921} {"train_loss": -7.248880863189697, "global_step": 206711, "epoch": 4921} {"train_loss": -7.323060512542725, "global_step": 206712, "epoch": 4921} {"train_loss": -7.3216094970703125, "global_step": 206713, "epoch": 4921} {"train_loss": -7.296120643615723, "global_step": 206714, "epoch": 4921} {"train_loss": -7.370536804199219, "global_step": 206715, "epoch": 4921} {"train_loss": -7.338199615478516, "global_step": 206716, "epoch": 4921} {"train_loss": -7.37764835357666, "global_step": 206717, "epoch": 4921} {"train_loss": -7.306018829345703, "global_step": 206718, "epoch": 4921} {"train_loss": -7.309229373931885, "global_step": 206719, "epoch": 4921} {"train_loss": -7.274408340454102, "global_step": 206720, "epoch": 4921} {"train_loss": -7.43413782119751, "global_step": 206721, "epoch": 4921} {"train_loss": -7.327147006988525, "global_step": 206722, "epoch": 4921} {"train_loss": -7.298175051098778, "global_step": 206723, "epoch": 4921, "val_loss": 69011.6328125} {"train_loss": -7.325127601623535, "global_step": 206724, "epoch": 4922} {"train_loss": -7.3978166580200195, "global_step": 206725, "epoch": 4922} {"train_loss": -7.259103775024414, "global_step": 206726, "epoch": 4922} {"train_loss": -7.320940971374512, "global_step": 206727, "epoch": 4922} {"train_loss": -7.195188522338867, "global_step": 206728, "epoch": 4922} {"train_loss": -7.26849365234375, "global_step": 206729, "epoch": 4922} {"train_loss": -7.278470993041992, "global_step": 206730, "epoch": 4922} {"train_loss": -7.152888774871826, "global_step": 206731, "epoch": 4922} {"train_loss": -7.271345615386963, "global_step": 206732, "epoch": 4922} {"train_loss": -7.148542404174805, "global_step": 206733, "epoch": 4922} {"train_loss": -7.1613898277282715, "global_step": 206734, "epoch": 4922} {"train_loss": -7.298479080200195, "global_step": 206735, "epoch": 4922} {"train_loss": -7.164245128631592, "global_step": 206736, "epoch": 4922} {"train_loss": -7.227302074432373, "global_step": 206737, "epoch": 4922} {"train_loss": -7.305619239807129, "global_step": 206738, "epoch": 4922} {"train_loss": -7.29243278503418, "global_step": 206739, "epoch": 4922} {"train_loss": -7.20953893661499, "global_step": 206740, "epoch": 4922} {"train_loss": -7.116986274719238, "global_step": 206741, "epoch": 4922} {"train_loss": -7.210024356842041, "global_step": 206742, "epoch": 4922} {"train_loss": -7.29627799987793, "global_step": 206743, "epoch": 4922} {"train_loss": -7.244720458984375, "global_step": 206744, "epoch": 4922} {"train_loss": -7.171333312988281, "global_step": 206745, "epoch": 4922} {"train_loss": -7.183444023132324, "global_step": 206746, "epoch": 4922} {"train_loss": -7.277126789093018, "global_step": 206747, "epoch": 4922} {"train_loss": -7.136981964111328, "global_step": 206748, "epoch": 4922} {"train_loss": -7.282997131347656, "global_step": 206749, "epoch": 4922} {"train_loss": -7.121384620666504, "global_step": 206750, "epoch": 4922} {"train_loss": -7.308673858642578, "global_step": 206751, "epoch": 4922} {"train_loss": -7.269854545593262, "global_step": 206752, "epoch": 4922} {"train_loss": -7.309637069702148, "global_step": 206753, "epoch": 4922} {"train_loss": -7.30033016204834, "global_step": 206754, "epoch": 4922} {"train_loss": -7.246584892272949, "global_step": 206755, "epoch": 4922} {"train_loss": -7.427414417266846, "global_step": 206756, "epoch": 4922} {"train_loss": -7.277815818786621, "global_step": 206757, "epoch": 4922} {"train_loss": -7.339060306549072, "global_step": 206758, "epoch": 4922} {"train_loss": -7.260549545288086, "global_step": 206759, "epoch": 4922} {"train_loss": -7.341427803039551, "global_step": 206760, "epoch": 4922} {"train_loss": -7.273601055145264, "global_step": 206761, "epoch": 4922} {"train_loss": -7.294750213623047, "global_step": 206762, "epoch": 4922} {"train_loss": -7.237764358520508, "global_step": 206763, "epoch": 4922} {"train_loss": -7.140557765960693, "global_step": 206764, "epoch": 4922} {"train_loss": -7.256144659859793, "global_step": 206765, "epoch": 4922, "val_loss": 69140.84375} {"train_loss": -7.332777976989746, "global_step": 206766, "epoch": 4923} {"train_loss": -7.375838279724121, "global_step": 206767, "epoch": 4923} {"train_loss": -7.340774059295654, "global_step": 206768, "epoch": 4923} {"train_loss": -7.357288837432861, "global_step": 206769, "epoch": 4923} {"train_loss": -7.341351509094238, "global_step": 206770, "epoch": 4923} {"train_loss": -7.473214149475098, "global_step": 206771, "epoch": 4923} {"train_loss": -7.311947345733643, "global_step": 206772, "epoch": 4923} {"train_loss": -7.376299858093262, "global_step": 206773, "epoch": 4923} {"train_loss": -7.291943550109863, "global_step": 206774, "epoch": 4923} {"train_loss": -7.311977863311768, "global_step": 206775, "epoch": 4923} {"train_loss": -7.333024978637695, "global_step": 206776, "epoch": 4923} {"train_loss": -7.250194549560547, "global_step": 206777, "epoch": 4923} {"train_loss": -7.416278839111328, "global_step": 206778, "epoch": 4923} {"train_loss": -7.292120933532715, "global_step": 206779, "epoch": 4923} {"train_loss": -7.31803560256958, "global_step": 206780, "epoch": 4923} {"train_loss": -7.430114269256592, "global_step": 206781, "epoch": 4923} {"train_loss": -7.4393696784973145, "global_step": 206782, "epoch": 4923} {"train_loss": -7.21074104309082, "global_step": 206783, "epoch": 4923} {"train_loss": -7.308452606201172, "global_step": 206784, "epoch": 4923} {"train_loss": -7.310340881347656, "global_step": 206785, "epoch": 4923} {"train_loss": -7.357911109924316, "global_step": 206786, "epoch": 4923} {"train_loss": -7.345972061157227, "global_step": 206787, "epoch": 4923} {"train_loss": -7.418247222900391, "global_step": 206788, "epoch": 4923} {"train_loss": -7.298287868499756, "global_step": 206789, "epoch": 4923} {"train_loss": -7.242355823516846, "global_step": 206790, "epoch": 4923} {"train_loss": -7.3668532371521, "global_step": 206791, "epoch": 4923} {"train_loss": -7.273029327392578, "global_step": 206792, "epoch": 4923} {"train_loss": -7.273175239562988, "global_step": 206793, "epoch": 4923} {"train_loss": -7.27911376953125, "global_step": 206794, "epoch": 4923} {"train_loss": -7.34334659576416, "global_step": 206795, "epoch": 4923} {"train_loss": -7.367537975311279, "global_step": 206796, "epoch": 4923} {"train_loss": -7.306303977966309, "global_step": 206797, "epoch": 4923} {"train_loss": -7.3683953285217285, "global_step": 206798, "epoch": 4923} {"train_loss": -7.377228736877441, "global_step": 206799, "epoch": 4923} {"train_loss": -7.335968971252441, "global_step": 206800, "epoch": 4923} {"train_loss": -7.313657760620117, "global_step": 206801, "epoch": 4923} {"train_loss": -7.290652275085449, "global_step": 206802, "epoch": 4923} {"train_loss": -7.199190616607666, "global_step": 206803, "epoch": 4923} {"train_loss": -7.321942329406738, "global_step": 206804, "epoch": 4923} {"train_loss": -7.199685096740723, "global_step": 206805, "epoch": 4923} {"train_loss": -7.258559703826904, "global_step": 206806, "epoch": 4923} {"train_loss": -7.325809989656721, "global_step": 206807, "epoch": 4923, "val_loss": 69255.3984375} {"train_loss": -7.271228313446045, "global_step": 206808, "epoch": 4924} {"train_loss": -7.359102249145508, "global_step": 206809, "epoch": 4924} {"train_loss": -7.241959095001221, "global_step": 206810, "epoch": 4924} {"train_loss": -7.344822883605957, "global_step": 206811, "epoch": 4924} {"train_loss": -7.398832321166992, "global_step": 206812, "epoch": 4924} {"train_loss": -7.331663608551025, "global_step": 206813, "epoch": 4924} {"train_loss": -7.176556587219238, "global_step": 206814, "epoch": 4924} {"train_loss": -7.220854759216309, "global_step": 206815, "epoch": 4924} {"train_loss": -7.224460601806641, "global_step": 206816, "epoch": 4924} {"train_loss": -7.320504665374756, "global_step": 206817, "epoch": 4924} {"train_loss": -7.221550464630127, "global_step": 206818, "epoch": 4924} {"train_loss": -7.227301597595215, "global_step": 206819, "epoch": 4924} {"train_loss": -7.2352495193481445, "global_step": 206820, "epoch": 4924} {"train_loss": -7.269780158996582, "global_step": 206821, "epoch": 4924} {"train_loss": -7.276854991912842, "global_step": 206822, "epoch": 4924} {"train_loss": -7.293204307556152, "global_step": 206823, "epoch": 4924} {"train_loss": -7.231672286987305, "global_step": 206824, "epoch": 4924} {"train_loss": -7.300383567810059, "global_step": 206825, "epoch": 4924} {"train_loss": -7.348026275634766, "global_step": 206826, "epoch": 4924} {"train_loss": -7.245373249053955, "global_step": 206827, "epoch": 4924} {"train_loss": -7.231263160705566, "global_step": 206828, "epoch": 4924} {"train_loss": -7.21561336517334, "global_step": 206829, "epoch": 4924} {"train_loss": -7.245673179626465, "global_step": 206830, "epoch": 4924} {"train_loss": -7.344415664672852, "global_step": 206831, "epoch": 4924} {"train_loss": -7.333594799041748, "global_step": 206832, "epoch": 4924} {"train_loss": -7.30936336517334, "global_step": 206833, "epoch": 4924} {"train_loss": -7.199038028717041, "global_step": 206834, "epoch": 4924} {"train_loss": -7.154989719390869, "global_step": 206835, "epoch": 4924} {"train_loss": -7.223884582519531, "global_step": 206836, "epoch": 4924} {"train_loss": -7.39991569519043, "global_step": 206837, "epoch": 4924} {"train_loss": -7.262167930603027, "global_step": 206838, "epoch": 4924} {"train_loss": -7.303403854370117, "global_step": 206839, "epoch": 4924} {"train_loss": -7.328351974487305, "global_step": 206840, "epoch": 4924} {"train_loss": -7.214735984802246, "global_step": 206841, "epoch": 4924} {"train_loss": -7.201605796813965, "global_step": 206842, "epoch": 4924} {"train_loss": -7.237257480621338, "global_step": 206843, "epoch": 4924} {"train_loss": -7.255815029144287, "global_step": 206844, "epoch": 4924} {"train_loss": -7.179658889770508, "global_step": 206845, "epoch": 4924} {"train_loss": -7.301943778991699, "global_step": 206846, "epoch": 4924} {"train_loss": -7.315160751342773, "global_step": 206847, "epoch": 4924} {"train_loss": -7.2165679931640625, "global_step": 206848, "epoch": 4924} {"train_loss": -7.268908761796498, "global_step": 206849, "epoch": 4924, "val_loss": 69372.515625} {"train_loss": -7.197314739227295, "global_step": 206850, "epoch": 4925} {"train_loss": -7.284192085266113, "global_step": 206851, "epoch": 4925} {"train_loss": -7.291635513305664, "global_step": 206852, "epoch": 4925} {"train_loss": -7.29587459564209, "global_step": 206853, "epoch": 4925} {"train_loss": -7.317207336425781, "global_step": 206854, "epoch": 4925} {"train_loss": -7.355698585510254, "global_step": 206855, "epoch": 4925} {"train_loss": -7.294183731079102, "global_step": 206856, "epoch": 4925} {"train_loss": -7.299523830413818, "global_step": 206857, "epoch": 4925} {"train_loss": -7.266848564147949, "global_step": 206858, "epoch": 4925} {"train_loss": -7.330178260803223, "global_step": 206859, "epoch": 4925} {"train_loss": -7.279332637786865, "global_step": 206860, "epoch": 4925} {"train_loss": -7.2841668128967285, "global_step": 206861, "epoch": 4925} {"train_loss": -7.328159332275391, "global_step": 206862, "epoch": 4925} {"train_loss": -7.369839668273926, "global_step": 206863, "epoch": 4925} {"train_loss": -7.271729946136475, "global_step": 206864, "epoch": 4925} {"train_loss": -7.255544185638428, "global_step": 206865, "epoch": 4925} {"train_loss": -7.356051445007324, "global_step": 206866, "epoch": 4925} {"train_loss": -7.416057586669922, "global_step": 206867, "epoch": 4925} {"train_loss": -7.406423568725586, "global_step": 206868, "epoch": 4925} {"train_loss": -7.332452774047852, "global_step": 206869, "epoch": 4925} {"train_loss": -7.30441427230835, "global_step": 206870, "epoch": 4925} {"train_loss": -7.283537864685059, "global_step": 206871, "epoch": 4925} {"train_loss": -7.344758033752441, "global_step": 206872, "epoch": 4925} {"train_loss": -7.351619720458984, "global_step": 206873, "epoch": 4925} {"train_loss": -7.197740077972412, "global_step": 206874, "epoch": 4925} {"train_loss": -7.39274787902832, "global_step": 206875, "epoch": 4925} {"train_loss": -7.347378730773926, "global_step": 206876, "epoch": 4925} {"train_loss": -7.261131286621094, "global_step": 206877, "epoch": 4925} {"train_loss": -7.368207931518555, "global_step": 206878, "epoch": 4925} {"train_loss": -7.389701843261719, "global_step": 206879, "epoch": 4925} {"train_loss": -7.311393737792969, "global_step": 206880, "epoch": 4925} {"train_loss": -7.257765769958496, "global_step": 206881, "epoch": 4925} {"train_loss": -7.262966156005859, "global_step": 206882, "epoch": 4925} {"train_loss": -7.293915271759033, "global_step": 206883, "epoch": 4925} {"train_loss": -7.327032089233398, "global_step": 206884, "epoch": 4925} {"train_loss": -7.352852821350098, "global_step": 206885, "epoch": 4925} {"train_loss": -7.137650489807129, "global_step": 206886, "epoch": 4925} {"train_loss": -7.238576889038086, "global_step": 206887, "epoch": 4925} {"train_loss": -7.27011775970459, "global_step": 206888, "epoch": 4925} {"train_loss": -7.22214937210083, "global_step": 206889, "epoch": 4925} {"train_loss": -7.290158271789551, "global_step": 206890, "epoch": 4925} {"train_loss": -7.304747150057838, "global_step": 206891, "epoch": 4925, "val_loss": 69133.7578125} {"train_loss": -7.339418411254883, "global_step": 206892, "epoch": 4926} {"train_loss": -7.351341724395752, "global_step": 206893, "epoch": 4926} {"train_loss": -7.37412166595459, "global_step": 206894, "epoch": 4926} {"train_loss": -7.270291328430176, "global_step": 206895, "epoch": 4926} {"train_loss": -7.261452674865723, "global_step": 206896, "epoch": 4926} {"train_loss": -7.265326023101807, "global_step": 206897, "epoch": 4926} {"train_loss": -7.234771728515625, "global_step": 206898, "epoch": 4926} {"train_loss": -7.316623210906982, "global_step": 206899, "epoch": 4926} {"train_loss": -7.294012546539307, "global_step": 206900, "epoch": 4926} {"train_loss": -7.272367477416992, "global_step": 206901, "epoch": 4926} {"train_loss": -7.144097328186035, "global_step": 206902, "epoch": 4926} {"train_loss": -7.1559858322143555, "global_step": 206903, "epoch": 4926} {"train_loss": -7.2417192459106445, "global_step": 206904, "epoch": 4926} {"train_loss": -7.184345245361328, "global_step": 206905, "epoch": 4926} {"train_loss": -7.241145610809326, "global_step": 206906, "epoch": 4926} {"train_loss": -7.14598274230957, "global_step": 206907, "epoch": 4926} {"train_loss": -7.291024208068848, "global_step": 206908, "epoch": 4926} {"train_loss": -7.098894119262695, "global_step": 206909, "epoch": 4926} {"train_loss": -7.283203601837158, "global_step": 206910, "epoch": 4926} {"train_loss": -7.17071533203125, "global_step": 206911, "epoch": 4926} {"train_loss": -7.107497215270996, "global_step": 206912, "epoch": 4926} {"train_loss": -7.315545082092285, "global_step": 206913, "epoch": 4926} {"train_loss": -7.280630588531494, "global_step": 206914, "epoch": 4926} {"train_loss": -7.204867839813232, "global_step": 206915, "epoch": 4926} {"train_loss": -7.242300510406494, "global_step": 206916, "epoch": 4926} {"train_loss": -7.195578575134277, "global_step": 206917, "epoch": 4926} {"train_loss": -7.352964401245117, "global_step": 206918, "epoch": 4926} {"train_loss": -7.309514045715332, "global_step": 206919, "epoch": 4926} {"train_loss": -7.253293991088867, "global_step": 206920, "epoch": 4926} {"train_loss": -7.205422401428223, "global_step": 206921, "epoch": 4926} {"train_loss": -7.2608771324157715, "global_step": 206922, "epoch": 4926} {"train_loss": -7.244140148162842, "global_step": 206923, "epoch": 4926} {"train_loss": -7.150593280792236, "global_step": 206924, "epoch": 4926} {"train_loss": -7.185831069946289, "global_step": 206925, "epoch": 4926} {"train_loss": -7.193711280822754, "global_step": 206926, "epoch": 4926} {"train_loss": -7.297519683837891, "global_step": 206927, "epoch": 4926} {"train_loss": -7.226597309112549, "global_step": 206928, "epoch": 4926} {"train_loss": -7.308751106262207, "global_step": 206929, "epoch": 4926} {"train_loss": -7.370697021484375, "global_step": 206930, "epoch": 4926} {"train_loss": -7.184909820556641, "global_step": 206931, "epoch": 4926} {"train_loss": -7.311705589294434, "global_step": 206932, "epoch": 4926} {"train_loss": -7.247050126393636, "global_step": 206933, "epoch": 4926, "val_loss": 69133.828125} {"train_loss": -7.1768479347229, "global_step": 206934, "epoch": 4927} {"train_loss": -7.3124589920043945, "global_step": 206935, "epoch": 4927} {"train_loss": -7.2201619148254395, "global_step": 206936, "epoch": 4927} {"train_loss": -7.280580520629883, "global_step": 206937, "epoch": 4927} {"train_loss": -7.245433807373047, "global_step": 206938, "epoch": 4927} {"train_loss": -7.202023506164551, "global_step": 206939, "epoch": 4927} {"train_loss": -7.257319450378418, "global_step": 206940, "epoch": 4927} {"train_loss": -7.311464309692383, "global_step": 206941, "epoch": 4927} {"train_loss": -7.216850280761719, "global_step": 206942, "epoch": 4927} {"train_loss": -7.277410984039307, "global_step": 206943, "epoch": 4927} {"train_loss": -7.325246334075928, "global_step": 206944, "epoch": 4927} {"train_loss": -7.264217376708984, "global_step": 206945, "epoch": 4927} {"train_loss": -7.276017189025879, "global_step": 206946, "epoch": 4927} {"train_loss": -7.322209358215332, "global_step": 206947, "epoch": 4927} {"train_loss": -7.243109703063965, "global_step": 206948, "epoch": 4927} {"train_loss": -7.259720802307129, "global_step": 206949, "epoch": 4927} {"train_loss": -7.333334922790527, "global_step": 206950, "epoch": 4927} {"train_loss": -7.226739883422852, "global_step": 206951, "epoch": 4927} {"train_loss": -7.310258388519287, "global_step": 206952, "epoch": 4927} {"train_loss": -7.328335762023926, "global_step": 206953, "epoch": 4927} {"train_loss": -7.188276290893555, "global_step": 206954, "epoch": 4927} {"train_loss": -7.438049793243408, "global_step": 206955, "epoch": 4927} {"train_loss": -7.235034465789795, "global_step": 206956, "epoch": 4927} {"train_loss": -7.2896647453308105, "global_step": 206957, "epoch": 4927} {"train_loss": -7.266353607177734, "global_step": 206958, "epoch": 4927} {"train_loss": -7.266801834106445, "global_step": 206959, "epoch": 4927} {"train_loss": -7.196512222290039, "global_step": 206960, "epoch": 4927} {"train_loss": -7.2510528564453125, "global_step": 206961, "epoch": 4927} {"train_loss": -7.281046390533447, "global_step": 206962, "epoch": 4927} {"train_loss": -7.31152868270874, "global_step": 206963, "epoch": 4927} {"train_loss": -7.354849338531494, "global_step": 206964, "epoch": 4927} {"train_loss": -7.348653316497803, "global_step": 206965, "epoch": 4927} {"train_loss": -7.331256866455078, "global_step": 206966, "epoch": 4927} {"train_loss": -7.333372116088867, "global_step": 206967, "epoch": 4927} {"train_loss": -7.361687183380127, "global_step": 206968, "epoch": 4927} {"train_loss": -7.363790512084961, "global_step": 206969, "epoch": 4927} {"train_loss": -7.303966999053955, "global_step": 206970, "epoch": 4927} {"train_loss": -7.271805763244629, "global_step": 206971, "epoch": 4927} {"train_loss": -7.328046798706055, "global_step": 206972, "epoch": 4927} {"train_loss": -7.340105056762695, "global_step": 206973, "epoch": 4927} {"train_loss": -7.38674259185791, "global_step": 206974, "epoch": 4927} {"train_loss": -7.288994459878831, "global_step": 206975, "epoch": 4927, "val_loss": 69151.9453125} {"train_loss": -7.323787689208984, "global_step": 206976, "epoch": 4928} {"train_loss": -7.160204887390137, "global_step": 206977, "epoch": 4928} {"train_loss": -7.320940017700195, "global_step": 206978, "epoch": 4928} {"train_loss": -7.247220039367676, "global_step": 206979, "epoch": 4928} {"train_loss": -7.381716728210449, "global_step": 206980, "epoch": 4928} {"train_loss": -7.336147308349609, "global_step": 206981, "epoch": 4928} {"train_loss": -7.287450790405273, "global_step": 206982, "epoch": 4928} {"train_loss": -7.394550323486328, "global_step": 206983, "epoch": 4928} {"train_loss": -7.3886871337890625, "global_step": 206984, "epoch": 4928} {"train_loss": -7.34551477432251, "global_step": 206985, "epoch": 4928} {"train_loss": -7.353647708892822, "global_step": 206986, "epoch": 4928} {"train_loss": -7.283803939819336, "global_step": 206987, "epoch": 4928} {"train_loss": -7.130484104156494, "global_step": 206988, "epoch": 4928} {"train_loss": -7.2172040939331055, "global_step": 206989, "epoch": 4928} {"train_loss": -7.34863805770874, "global_step": 206990, "epoch": 4928} {"train_loss": -7.284233093261719, "global_step": 206991, "epoch": 4928} {"train_loss": -7.189084529876709, "global_step": 206992, "epoch": 4928} {"train_loss": -7.332863807678223, "global_step": 206993, "epoch": 4928} {"train_loss": -7.253857612609863, "global_step": 206994, "epoch": 4928} {"train_loss": -7.320018291473389, "global_step": 206995, "epoch": 4928} {"train_loss": -7.3556694984436035, "global_step": 206996, "epoch": 4928} {"train_loss": -7.410943031311035, "global_step": 206997, "epoch": 4928} {"train_loss": -7.31787109375, "global_step": 206998, "epoch": 4928} {"train_loss": -7.283239364624023, "global_step": 206999, "epoch": 4928} {"train_loss": -7.38897180557251, "global_step": 207000, "epoch": 4928} {"train_loss": -7.21695613861084, "global_step": 207001, "epoch": 4928} {"train_loss": -7.317750930786133, "global_step": 207002, "epoch": 4928} {"train_loss": -7.258437156677246, "global_step": 207003, "epoch": 4928} {"train_loss": -7.214334964752197, "global_step": 207004, "epoch": 4928} {"train_loss": -7.296664237976074, "global_step": 207005, "epoch": 4928} {"train_loss": -7.369378089904785, "global_step": 207006, "epoch": 4928} {"train_loss": -7.358672142028809, "global_step": 207007, "epoch": 4928} {"train_loss": -7.403385162353516, "global_step": 207008, "epoch": 4928} {"train_loss": -7.310235023498535, "global_step": 207009, "epoch": 4928} {"train_loss": -7.303343772888184, "global_step": 207010, "epoch": 4928} {"train_loss": -7.325611591339111, "global_step": 207011, "epoch": 4928} {"train_loss": -7.33418607711792, "global_step": 207012, "epoch": 4928} {"train_loss": -7.2156476974487305, "global_step": 207013, "epoch": 4928} {"train_loss": -7.317419528961182, "global_step": 207014, "epoch": 4928} {"train_loss": -7.316311836242676, "global_step": 207015, "epoch": 4928} {"train_loss": -7.325158596038818, "global_step": 207016, "epoch": 4928} {"train_loss": -7.304552827562604, "global_step": 207017, "epoch": 4928, "val_loss": 69219.1796875} {"train_loss": -7.310943603515625, "global_step": 207018, "epoch": 4929} {"train_loss": -7.3560471534729, "global_step": 207019, "epoch": 4929} {"train_loss": -7.24451208114624, "global_step": 207020, "epoch": 4929} {"train_loss": -7.368645191192627, "global_step": 207021, "epoch": 4929} {"train_loss": -7.347089767456055, "global_step": 207022, "epoch": 4929} {"train_loss": -7.299106121063232, "global_step": 207023, "epoch": 4929} {"train_loss": -7.350133895874023, "global_step": 207024, "epoch": 4929} {"train_loss": -7.278006553649902, "global_step": 207025, "epoch": 4929} {"train_loss": -7.33913516998291, "global_step": 207026, "epoch": 4929} {"train_loss": -7.242556571960449, "global_step": 207027, "epoch": 4929} {"train_loss": -7.329902172088623, "global_step": 207028, "epoch": 4929} {"train_loss": -7.337191581726074, "global_step": 207029, "epoch": 4929} {"train_loss": -7.306204795837402, "global_step": 207030, "epoch": 4929} {"train_loss": -7.296706199645996, "global_step": 207031, "epoch": 4929} {"train_loss": -7.199111461639404, "global_step": 207032, "epoch": 4929} {"train_loss": -7.281777381896973, "global_step": 207033, "epoch": 4929} {"train_loss": -7.125061988830566, "global_step": 207034, "epoch": 4929} {"train_loss": -7.386992931365967, "global_step": 207035, "epoch": 4929} {"train_loss": -7.224987030029297, "global_step": 207036, "epoch": 4929} {"train_loss": -7.18714714050293, "global_step": 207037, "epoch": 4929} {"train_loss": -7.227380275726318, "global_step": 207038, "epoch": 4929} {"train_loss": -7.241626739501953, "global_step": 207039, "epoch": 4929} {"train_loss": -7.2304558753967285, "global_step": 207040, "epoch": 4929} {"train_loss": -7.18748664855957, "global_step": 207041, "epoch": 4929} {"train_loss": -7.081881523132324, "global_step": 207042, "epoch": 4929} {"train_loss": -7.311010360717773, "global_step": 207043, "epoch": 4929} {"train_loss": -7.121270179748535, "global_step": 207044, "epoch": 4929} {"train_loss": -7.345484256744385, "global_step": 207045, "epoch": 4929} {"train_loss": -7.260012626647949, "global_step": 207046, "epoch": 4929} {"train_loss": -7.263976097106934, "global_step": 207047, "epoch": 4929} {"train_loss": -7.236983299255371, "global_step": 207048, "epoch": 4929} {"train_loss": -7.247958183288574, "global_step": 207049, "epoch": 4929} {"train_loss": -7.243124961853027, "global_step": 207050, "epoch": 4929} {"train_loss": -7.316185474395752, "global_step": 207051, "epoch": 4929} {"train_loss": -7.280250549316406, "global_step": 207052, "epoch": 4929} {"train_loss": -7.40899658203125, "global_step": 207053, "epoch": 4929} {"train_loss": -7.253829002380371, "global_step": 207054, "epoch": 4929} {"train_loss": -7.162574768066406, "global_step": 207055, "epoch": 4929} {"train_loss": -7.220849990844727, "global_step": 207056, "epoch": 4929} {"train_loss": -7.21798849105835, "global_step": 207057, "epoch": 4929} {"train_loss": -7.254786491394043, "global_step": 207058, "epoch": 4929} {"train_loss": -7.263547375088646, "global_step": 207059, "epoch": 4929, "val_loss": 69144.1953125} {"train_loss": -7.274021148681641, "global_step": 207060, "epoch": 4930} {"train_loss": -7.440601348876953, "global_step": 207061, "epoch": 4930} {"train_loss": -7.442372798919678, "global_step": 207062, "epoch": 4930} {"train_loss": -7.301429271697998, "global_step": 207063, "epoch": 4930} {"train_loss": -7.312477111816406, "global_step": 207064, "epoch": 4930} {"train_loss": -7.376557350158691, "global_step": 207065, "epoch": 4930} {"train_loss": -7.179250717163086, "global_step": 207066, "epoch": 4930} {"train_loss": -7.2829670906066895, "global_step": 207067, "epoch": 4930} {"train_loss": -7.262361526489258, "global_step": 207068, "epoch": 4930} {"train_loss": -7.311338424682617, "global_step": 207069, "epoch": 4930} {"train_loss": -7.271146774291992, "global_step": 207070, "epoch": 4930} {"train_loss": -7.260396957397461, "global_step": 207071, "epoch": 4930} {"train_loss": -7.2350921630859375, "global_step": 207072, "epoch": 4930} {"train_loss": -7.356436729431152, "global_step": 207073, "epoch": 4930} {"train_loss": -7.305333137512207, "global_step": 207074, "epoch": 4930} {"train_loss": -7.345015525817871, "global_step": 207075, "epoch": 4930} {"train_loss": -7.308802604675293, "global_step": 207076, "epoch": 4930} {"train_loss": -7.169267654418945, "global_step": 207077, "epoch": 4930} {"train_loss": -7.136037826538086, "global_step": 207078, "epoch": 4930} {"train_loss": -7.239041328430176, "global_step": 207079, "epoch": 4930} {"train_loss": -7.416485786437988, "global_step": 207080, "epoch": 4930} {"train_loss": -7.180090427398682, "global_step": 207081, "epoch": 4930} {"train_loss": -7.246311187744141, "global_step": 207082, "epoch": 4930} {"train_loss": -7.2104363441467285, "global_step": 207083, "epoch": 4930} {"train_loss": -7.286921501159668, "global_step": 207084, "epoch": 4930} {"train_loss": -7.227728366851807, "global_step": 207085, "epoch": 4930} {"train_loss": -7.323375701904297, "global_step": 207086, "epoch": 4930} {"train_loss": -7.1756792068481445, "global_step": 207087, "epoch": 4930} {"train_loss": -7.2859206199646, "global_step": 207088, "epoch": 4930} {"train_loss": -7.1479692459106445, "global_step": 207089, "epoch": 4930} {"train_loss": -6.909151077270508, "global_step": 207090, "epoch": 4930} {"train_loss": -7.158937454223633, "global_step": 207091, "epoch": 4930} {"train_loss": -7.3097052574157715, "global_step": 207092, "epoch": 4930} {"train_loss": -7.138930797576904, "global_step": 207093, "epoch": 4930} {"train_loss": -7.264138698577881, "global_step": 207094, "epoch": 4930} {"train_loss": -7.125082015991211, "global_step": 207095, "epoch": 4930} {"train_loss": -7.035642147064209, "global_step": 207096, "epoch": 4930} {"train_loss": -7.240645408630371, "global_step": 207097, "epoch": 4930} {"train_loss": -7.186849594116211, "global_step": 207098, "epoch": 4930} {"train_loss": -7.215063095092773, "global_step": 207099, "epoch": 4930} {"train_loss": -7.141119480133057, "global_step": 207100, "epoch": 4930} {"train_loss": -7.242879492895944, "global_step": 207101, "epoch": 4930, "val_loss": 69290.578125} {"train_loss": -7.253995895385742, "global_step": 207102, "epoch": 4931} {"train_loss": -7.214364051818848, "global_step": 207103, "epoch": 4931} {"train_loss": -7.2518792152404785, "global_step": 207104, "epoch": 4931} {"train_loss": -7.189481258392334, "global_step": 207105, "epoch": 4931} {"train_loss": -7.187361717224121, "global_step": 207106, "epoch": 4931} {"train_loss": -7.274023532867432, "global_step": 207107, "epoch": 4931} {"train_loss": -7.073511123657227, "global_step": 207108, "epoch": 4931} {"train_loss": -7.256197929382324, "global_step": 207109, "epoch": 4931} {"train_loss": -7.1472272872924805, "global_step": 207110, "epoch": 4931} {"train_loss": -7.138587951660156, "global_step": 207111, "epoch": 4931} {"train_loss": -7.24454402923584, "global_step": 207112, "epoch": 4931} {"train_loss": -7.2455902099609375, "global_step": 207113, "epoch": 4931} {"train_loss": -7.13783073425293, "global_step": 207114, "epoch": 4931} {"train_loss": -7.136138916015625, "global_step": 207115, "epoch": 4931} {"train_loss": -7.204433917999268, "global_step": 207116, "epoch": 4931} {"train_loss": -7.315157890319824, "global_step": 207117, "epoch": 4931} {"train_loss": -7.155456066131592, "global_step": 207118, "epoch": 4931} {"train_loss": -7.152226448059082, "global_step": 207119, "epoch": 4931} {"train_loss": -7.20109748840332, "global_step": 207120, "epoch": 4931} {"train_loss": -7.1619062423706055, "global_step": 207121, "epoch": 4931} {"train_loss": -7.279806137084961, "global_step": 207122, "epoch": 4931} {"train_loss": -7.185781002044678, "global_step": 207123, "epoch": 4931} {"train_loss": -7.168360710144043, "global_step": 207124, "epoch": 4931} {"train_loss": -7.204046249389648, "global_step": 207125, "epoch": 4931} {"train_loss": -7.191777229309082, "global_step": 207126, "epoch": 4931} {"train_loss": -7.055682182312012, "global_step": 207127, "epoch": 4931} {"train_loss": -7.228028774261475, "global_step": 207128, "epoch": 4931} {"train_loss": -7.2502121925354, "global_step": 207129, "epoch": 4931} {"train_loss": -7.1718597412109375, "global_step": 207130, "epoch": 4931} {"train_loss": -7.349092483520508, "global_step": 207131, "epoch": 4931} {"train_loss": -7.31928825378418, "global_step": 207132, "epoch": 4931} {"train_loss": -7.200178146362305, "global_step": 207133, "epoch": 4931} {"train_loss": -7.2299275398254395, "global_step": 207134, "epoch": 4931} {"train_loss": -7.297175884246826, "global_step": 207135, "epoch": 4931} {"train_loss": -7.215909481048584, "global_step": 207136, "epoch": 4931} {"train_loss": -7.326567649841309, "global_step": 207137, "epoch": 4931} {"train_loss": -7.259631156921387, "global_step": 207138, "epoch": 4931} {"train_loss": -7.272440433502197, "global_step": 207139, "epoch": 4931} {"train_loss": -7.306028366088867, "global_step": 207140, "epoch": 4931} {"train_loss": -7.26785135269165, "global_step": 207141, "epoch": 4931} {"train_loss": -7.337497711181641, "global_step": 207142, "epoch": 4931} {"train_loss": -7.223231519971575, "global_step": 207143, "epoch": 4931, "val_loss": 69132.8359375} {"train_loss": -7.232083797454834, "global_step": 207144, "epoch": 4932} {"train_loss": -7.229377746582031, "global_step": 207145, "epoch": 4932} {"train_loss": -7.212851524353027, "global_step": 207146, "epoch": 4932} {"train_loss": -7.215760707855225, "global_step": 207147, "epoch": 4932} {"train_loss": -7.281491756439209, "global_step": 207148, "epoch": 4932} {"train_loss": -7.162994384765625, "global_step": 207149, "epoch": 4932} {"train_loss": -7.267307281494141, "global_step": 207150, "epoch": 4932} {"train_loss": -7.309772968292236, "global_step": 207151, "epoch": 4932} {"train_loss": -7.260247707366943, "global_step": 207152, "epoch": 4932} {"train_loss": -7.283109664916992, "global_step": 207153, "epoch": 4932} {"train_loss": -7.289846420288086, "global_step": 207154, "epoch": 4932} {"train_loss": -7.280915260314941, "global_step": 207155, "epoch": 4932} {"train_loss": -7.092342376708984, "global_step": 207156, "epoch": 4932} {"train_loss": -7.252127647399902, "global_step": 207157, "epoch": 4932} {"train_loss": -7.247145652770996, "global_step": 207158, "epoch": 4932} {"train_loss": -7.1400299072265625, "global_step": 207159, "epoch": 4932} {"train_loss": -7.132410526275635, "global_step": 207160, "epoch": 4932} {"train_loss": -7.208676338195801, "global_step": 207161, "epoch": 4932} {"train_loss": -7.234450817108154, "global_step": 207162, "epoch": 4932} {"train_loss": -7.319375038146973, "global_step": 207163, "epoch": 4932} {"train_loss": -7.257589340209961, "global_step": 207164, "epoch": 4932} {"train_loss": -7.304905891418457, "global_step": 207165, "epoch": 4932} {"train_loss": -7.202665328979492, "global_step": 207166, "epoch": 4932} {"train_loss": -7.112161636352539, "global_step": 207167, "epoch": 4932} {"train_loss": -7.301834583282471, "global_step": 207168, "epoch": 4932} {"train_loss": -7.19189453125, "global_step": 207169, "epoch": 4932} {"train_loss": -7.205545425415039, "global_step": 207170, "epoch": 4932} {"train_loss": -7.174187660217285, "global_step": 207171, "epoch": 4932} {"train_loss": -7.11518669128418, "global_step": 207172, "epoch": 4932} {"train_loss": -7.142180919647217, "global_step": 207173, "epoch": 4932} {"train_loss": -7.2551984786987305, "global_step": 207174, "epoch": 4932} {"train_loss": -7.179336071014404, "global_step": 207175, "epoch": 4932} {"train_loss": -7.150483131408691, "global_step": 207176, "epoch": 4932} {"train_loss": -7.228304386138916, "global_step": 207177, "epoch": 4932} {"train_loss": -7.2694902420043945, "global_step": 207178, "epoch": 4932} {"train_loss": -7.231626987457275, "global_step": 207179, "epoch": 4932} {"train_loss": -7.1626787185668945, "global_step": 207180, "epoch": 4932} {"train_loss": -7.188882827758789, "global_step": 207181, "epoch": 4932} {"train_loss": -7.284187316894531, "global_step": 207182, "epoch": 4932} {"train_loss": -7.199276924133301, "global_step": 207183, "epoch": 4932} {"train_loss": -7.117205619812012, "global_step": 207184, "epoch": 4932} {"train_loss": -7.218533856528146, "global_step": 207185, "epoch": 4932, "val_loss": 69106.7109375} {"train_loss": -7.215812683105469, "global_step": 207186, "epoch": 4933} {"train_loss": -7.130525588989258, "global_step": 207187, "epoch": 4933} {"train_loss": -7.354038238525391, "global_step": 207188, "epoch": 4933} {"train_loss": -7.241664409637451, "global_step": 207189, "epoch": 4933} {"train_loss": -7.329805374145508, "global_step": 207190, "epoch": 4933} {"train_loss": -7.286027431488037, "global_step": 207191, "epoch": 4933} {"train_loss": -7.207827091217041, "global_step": 207192, "epoch": 4933} {"train_loss": -7.293437480926514, "global_step": 207193, "epoch": 4933} {"train_loss": -7.317760467529297, "global_step": 207194, "epoch": 4933} {"train_loss": -7.38521671295166, "global_step": 207195, "epoch": 4933} {"train_loss": -7.243210792541504, "global_step": 207196, "epoch": 4933} {"train_loss": -7.20388126373291, "global_step": 207197, "epoch": 4933} {"train_loss": -7.282449722290039, "global_step": 207198, "epoch": 4933} {"train_loss": -7.312314033508301, "global_step": 207199, "epoch": 4933} {"train_loss": -7.286847114562988, "global_step": 207200, "epoch": 4933} {"train_loss": -7.3406147956848145, "global_step": 207201, "epoch": 4933} {"train_loss": -7.255947113037109, "global_step": 207202, "epoch": 4933} {"train_loss": -7.162073612213135, "global_step": 207203, "epoch": 4933} {"train_loss": -7.239293575286865, "global_step": 207204, "epoch": 4933} {"train_loss": -7.284623622894287, "global_step": 207205, "epoch": 4933} {"train_loss": -7.300593376159668, "global_step": 207206, "epoch": 4933} {"train_loss": -7.337588310241699, "global_step": 207207, "epoch": 4933} {"train_loss": -7.284192085266113, "global_step": 207208, "epoch": 4933} {"train_loss": -7.189901351928711, "global_step": 207209, "epoch": 4933} {"train_loss": -7.285140037536621, "global_step": 207210, "epoch": 4933} {"train_loss": -7.275938034057617, "global_step": 207211, "epoch": 4933} {"train_loss": -7.417726516723633, "global_step": 207212, "epoch": 4933} {"train_loss": -7.1586713790893555, "global_step": 207213, "epoch": 4933} {"train_loss": -7.3040313720703125, "global_step": 207214, "epoch": 4933} {"train_loss": -7.298242568969727, "global_step": 207215, "epoch": 4933} {"train_loss": -7.352178573608398, "global_step": 207216, "epoch": 4933} {"train_loss": -7.310507774353027, "global_step": 207217, "epoch": 4933} {"train_loss": -7.505301475524902, "global_step": 207218, "epoch": 4933} {"train_loss": -7.351099967956543, "global_step": 207219, "epoch": 4933} {"train_loss": -7.2857866287231445, "global_step": 207220, "epoch": 4933} {"train_loss": -7.348369598388672, "global_step": 207221, "epoch": 4933} {"train_loss": -7.371267318725586, "global_step": 207222, "epoch": 4933} {"train_loss": -7.0339860916137695, "global_step": 207223, "epoch": 4933} {"train_loss": -7.25531005859375, "global_step": 207224, "epoch": 4933} {"train_loss": -7.229649066925049, "global_step": 207225, "epoch": 4933} {"train_loss": -7.317595481872559, "global_step": 207226, "epoch": 4933} {"train_loss": -7.282511177517119, "global_step": 207227, "epoch": 4933, "val_loss": 69053.8203125} {"train_loss": -7.100220680236816, "global_step": 207228, "epoch": 4934} {"train_loss": -7.248230934143066, "global_step": 207229, "epoch": 4934} {"train_loss": -7.131898403167725, "global_step": 207230, "epoch": 4934} {"train_loss": -7.225916862487793, "global_step": 207231, "epoch": 4934} {"train_loss": -7.162735939025879, "global_step": 207232, "epoch": 4934} {"train_loss": -7.214082717895508, "global_step": 207233, "epoch": 4934} {"train_loss": -7.197182655334473, "global_step": 207234, "epoch": 4934} {"train_loss": -7.1977691650390625, "global_step": 207235, "epoch": 4934} {"train_loss": -7.237972736358643, "global_step": 207236, "epoch": 4934} {"train_loss": -7.260537147521973, "global_step": 207237, "epoch": 4934} {"train_loss": -7.205681324005127, "global_step": 207238, "epoch": 4934} {"train_loss": -7.268682956695557, "global_step": 207239, "epoch": 4934} {"train_loss": -7.330259323120117, "global_step": 207240, "epoch": 4934} {"train_loss": -7.296130180358887, "global_step": 207241, "epoch": 4934} {"train_loss": -7.29193115234375, "global_step": 207242, "epoch": 4934} {"train_loss": -7.227370738983154, "global_step": 207243, "epoch": 4934} {"train_loss": -7.164551734924316, "global_step": 207244, "epoch": 4934} {"train_loss": -7.205937385559082, "global_step": 207245, "epoch": 4934} {"train_loss": -7.278655052185059, "global_step": 207246, "epoch": 4934} {"train_loss": -7.294577598571777, "global_step": 207247, "epoch": 4934} {"train_loss": -7.312023162841797, "global_step": 207248, "epoch": 4934} {"train_loss": -7.27018404006958, "global_step": 207249, "epoch": 4934} {"train_loss": -7.278048515319824, "global_step": 207250, "epoch": 4934} {"train_loss": -7.190460205078125, "global_step": 207251, "epoch": 4934} {"train_loss": -7.261083602905273, "global_step": 207252, "epoch": 4934} {"train_loss": -7.3026814460754395, "global_step": 207253, "epoch": 4934} {"train_loss": -7.3001556396484375, "global_step": 207254, "epoch": 4934} {"train_loss": -7.264133453369141, "global_step": 207255, "epoch": 4934} {"train_loss": -7.304073333740234, "global_step": 207256, "epoch": 4934} {"train_loss": -7.175403594970703, "global_step": 207257, "epoch": 4934} {"train_loss": -7.287342071533203, "global_step": 207258, "epoch": 4934} {"train_loss": -7.174233913421631, "global_step": 207259, "epoch": 4934} {"train_loss": -7.365598678588867, "global_step": 207260, "epoch": 4934} {"train_loss": -7.2014360427856445, "global_step": 207261, "epoch": 4934} {"train_loss": -7.328164100646973, "global_step": 207262, "epoch": 4934} {"train_loss": -7.309508323669434, "global_step": 207263, "epoch": 4934} {"train_loss": -7.303648471832275, "global_step": 207264, "epoch": 4934} {"train_loss": -7.22422456741333, "global_step": 207265, "epoch": 4934} {"train_loss": -7.236215591430664, "global_step": 207266, "epoch": 4934} {"train_loss": -7.357728004455566, "global_step": 207267, "epoch": 4934} {"train_loss": -7.3678388595581055, "global_step": 207268, "epoch": 4934} {"train_loss": -7.251396031606765, "global_step": 207269, "epoch": 4934, "val_loss": 69171.296875} {"train_loss": -7.172675132751465, "global_step": 207270, "epoch": 4935} {"train_loss": -7.309175491333008, "global_step": 207271, "epoch": 4935} {"train_loss": -7.267529487609863, "global_step": 207272, "epoch": 4935} {"train_loss": -7.265534400939941, "global_step": 207273, "epoch": 4935} {"train_loss": -7.256953239440918, "global_step": 207274, "epoch": 4935} {"train_loss": -7.315087795257568, "global_step": 207275, "epoch": 4935} {"train_loss": -7.123012542724609, "global_step": 207276, "epoch": 4935} {"train_loss": -7.157355308532715, "global_step": 207277, "epoch": 4935} {"train_loss": -7.226090908050537, "global_step": 207278, "epoch": 4935} {"train_loss": -7.239543437957764, "global_step": 207279, "epoch": 4935} {"train_loss": -7.25147008895874, "global_step": 207280, "epoch": 4935} {"train_loss": -7.216526985168457, "global_step": 207281, "epoch": 4935} {"train_loss": -7.295503616333008, "global_step": 207282, "epoch": 4935} {"train_loss": -7.230464935302734, "global_step": 207283, "epoch": 4935} {"train_loss": -7.3173828125, "global_step": 207284, "epoch": 4935} {"train_loss": -7.266958713531494, "global_step": 207285, "epoch": 4935} {"train_loss": -7.157143592834473, "global_step": 207286, "epoch": 4935} {"train_loss": -7.2670793533325195, "global_step": 207287, "epoch": 4935} {"train_loss": -7.166172504425049, "global_step": 207288, "epoch": 4935} {"train_loss": -7.3003106117248535, "global_step": 207289, "epoch": 4935} {"train_loss": -7.108620643615723, "global_step": 207290, "epoch": 4935} {"train_loss": -7.27922248840332, "global_step": 207291, "epoch": 4935} {"train_loss": -7.205537796020508, "global_step": 207292, "epoch": 4935} {"train_loss": -7.242851257324219, "global_step": 207293, "epoch": 4935} {"train_loss": -7.365464210510254, "global_step": 207294, "epoch": 4935} {"train_loss": -7.180687427520752, "global_step": 207295, "epoch": 4935} {"train_loss": -7.2235493659973145, "global_step": 207296, "epoch": 4935} {"train_loss": -7.2845025062561035, "global_step": 207297, "epoch": 4935} {"train_loss": -7.040076732635498, "global_step": 207298, "epoch": 4935} {"train_loss": -7.197909355163574, "global_step": 207299, "epoch": 4935} {"train_loss": -7.265877723693848, "global_step": 207300, "epoch": 4935} {"train_loss": -7.1900248527526855, "global_step": 207301, "epoch": 4935} {"train_loss": -7.114672660827637, "global_step": 207302, "epoch": 4935} {"train_loss": -7.1395263671875, "global_step": 207303, "epoch": 4935} {"train_loss": -7.093258380889893, "global_step": 207304, "epoch": 4935} {"train_loss": -7.305337429046631, "global_step": 207305, "epoch": 4935} {"train_loss": -7.149608612060547, "global_step": 207306, "epoch": 4935} {"train_loss": -7.279381275177002, "global_step": 207307, "epoch": 4935} {"train_loss": -7.175754547119141, "global_step": 207308, "epoch": 4935} {"train_loss": -7.174750328063965, "global_step": 207309, "epoch": 4935} {"train_loss": -7.277412414550781, "global_step": 207310, "epoch": 4935} {"train_loss": -7.220450821376982, "global_step": 207311, "epoch": 4935, "val_loss": 69051.1171875} {"train_loss": -7.325822353363037, "global_step": 207312, "epoch": 4936} {"train_loss": -7.240329742431641, "global_step": 207313, "epoch": 4936} {"train_loss": -7.325163841247559, "global_step": 207314, "epoch": 4936} {"train_loss": -7.319528579711914, "global_step": 207315, "epoch": 4936} {"train_loss": -7.25296688079834, "global_step": 207316, "epoch": 4936} {"train_loss": -7.293105125427246, "global_step": 207317, "epoch": 4936} {"train_loss": -7.241716384887695, "global_step": 207318, "epoch": 4936} {"train_loss": -7.1959638595581055, "global_step": 207319, "epoch": 4936} {"train_loss": -7.303930282592773, "global_step": 207320, "epoch": 4936} {"train_loss": -7.352759838104248, "global_step": 207321, "epoch": 4936} {"train_loss": -7.302347183227539, "global_step": 207322, "epoch": 4936} {"train_loss": -7.374876022338867, "global_step": 207323, "epoch": 4936} {"train_loss": -7.34727668762207, "global_step": 207324, "epoch": 4936} {"train_loss": -7.313817024230957, "global_step": 207325, "epoch": 4936} {"train_loss": -7.312024116516113, "global_step": 207326, "epoch": 4936} {"train_loss": -7.326093673706055, "global_step": 207327, "epoch": 4936} {"train_loss": -7.221562385559082, "global_step": 207328, "epoch": 4936} {"train_loss": -7.399331092834473, "global_step": 207329, "epoch": 4936} {"train_loss": -7.381877899169922, "global_step": 207330, "epoch": 4936} {"train_loss": -7.4333577156066895, "global_step": 207331, "epoch": 4936} {"train_loss": -7.362194538116455, "global_step": 207332, "epoch": 4936} {"train_loss": -7.382205963134766, "global_step": 207333, "epoch": 4936} {"train_loss": -7.28626823425293, "global_step": 207334, "epoch": 4936} {"train_loss": -7.306079864501953, "global_step": 207335, "epoch": 4936} {"train_loss": -7.3842997550964355, "global_step": 207336, "epoch": 4936} {"train_loss": -7.40012264251709, "global_step": 207337, "epoch": 4936} {"train_loss": -7.312532424926758, "global_step": 207338, "epoch": 4936} {"train_loss": -7.4264726638793945, "global_step": 207339, "epoch": 4936} {"train_loss": -7.369140148162842, "global_step": 207340, "epoch": 4936} {"train_loss": -7.244599342346191, "global_step": 207341, "epoch": 4936} {"train_loss": -7.352954864501953, "global_step": 207342, "epoch": 4936} {"train_loss": -7.2687087059021, "global_step": 207343, "epoch": 4936} {"train_loss": -7.298854351043701, "global_step": 207344, "epoch": 4936} {"train_loss": -7.268367767333984, "global_step": 207345, "epoch": 4936} {"train_loss": -7.249642372131348, "global_step": 207346, "epoch": 4936} {"train_loss": -7.361342430114746, "global_step": 207347, "epoch": 4936} {"train_loss": -7.444129467010498, "global_step": 207348, "epoch": 4936} {"train_loss": -7.35432767868042, "global_step": 207349, "epoch": 4936} {"train_loss": -7.340340614318848, "global_step": 207350, "epoch": 4936} {"train_loss": -7.232442855834961, "global_step": 207351, "epoch": 4936} {"train_loss": -7.237330436706543, "global_step": 207352, "epoch": 4936} {"train_loss": -7.321361984525408, "global_step": 207353, "epoch": 4936, "val_loss": 69231.015625} {"train_loss": -7.338283538818359, "global_step": 207354, "epoch": 4937} {"train_loss": -7.323917388916016, "global_step": 207355, "epoch": 4937} {"train_loss": -7.204533576965332, "global_step": 207356, "epoch": 4937} {"train_loss": -7.299981117248535, "global_step": 207357, "epoch": 4937} {"train_loss": -7.24769401550293, "global_step": 207358, "epoch": 4937} {"train_loss": -7.2910237312316895, "global_step": 207359, "epoch": 4937} {"train_loss": -7.276586532592773, "global_step": 207360, "epoch": 4937} {"train_loss": -7.395817756652832, "global_step": 207361, "epoch": 4937} {"train_loss": -7.313998222351074, "global_step": 207362, "epoch": 4937} {"train_loss": -7.121660232543945, "global_step": 207363, "epoch": 4937} {"train_loss": -7.323101043701172, "global_step": 207364, "epoch": 4937} {"train_loss": -7.137615203857422, "global_step": 207365, "epoch": 4937} {"train_loss": -7.251777648925781, "global_step": 207366, "epoch": 4937} {"train_loss": -7.211029529571533, "global_step": 207367, "epoch": 4937} {"train_loss": -7.201643943786621, "global_step": 207368, "epoch": 4937} {"train_loss": -7.291888236999512, "global_step": 207369, "epoch": 4937} {"train_loss": -7.266127586364746, "global_step": 207370, "epoch": 4937} {"train_loss": -7.296195030212402, "global_step": 207371, "epoch": 4937} {"train_loss": -7.17218542098999, "global_step": 207372, "epoch": 4937} {"train_loss": -7.353697776794434, "global_step": 207373, "epoch": 4937} {"train_loss": -7.1627888679504395, "global_step": 207374, "epoch": 4937} {"train_loss": -7.235672473907471, "global_step": 207375, "epoch": 4937} {"train_loss": -7.27658748626709, "global_step": 207376, "epoch": 4937} {"train_loss": -7.161653518676758, "global_step": 207377, "epoch": 4937} {"train_loss": -7.25991153717041, "global_step": 207378, "epoch": 4937} {"train_loss": -7.232764720916748, "global_step": 207379, "epoch": 4937} {"train_loss": -7.137660026550293, "global_step": 207380, "epoch": 4937} {"train_loss": -7.24044132232666, "global_step": 207381, "epoch": 4937} {"train_loss": -7.213142395019531, "global_step": 207382, "epoch": 4937} {"train_loss": -7.218896865844727, "global_step": 207383, "epoch": 4937} {"train_loss": -7.277196407318115, "global_step": 207384, "epoch": 4937} {"train_loss": -7.226627826690674, "global_step": 207385, "epoch": 4937} {"train_loss": -7.185538291931152, "global_step": 207386, "epoch": 4937} {"train_loss": -7.27813720703125, "global_step": 207387, "epoch": 4937} {"train_loss": -7.15516471862793, "global_step": 207388, "epoch": 4937} {"train_loss": -7.3282999992370605, "global_step": 207389, "epoch": 4937} {"train_loss": -7.31512451171875, "global_step": 207390, "epoch": 4937} {"train_loss": -7.217747688293457, "global_step": 207391, "epoch": 4937} {"train_loss": -7.259778022766113, "global_step": 207392, "epoch": 4937} {"train_loss": -7.341261386871338, "global_step": 207393, "epoch": 4937} {"train_loss": -7.38510799407959, "global_step": 207394, "epoch": 4937} {"train_loss": -7.254488558996291, "global_step": 207395, "epoch": 4937, "val_loss": 69051.2109375} {"train_loss": -7.2443718910217285, "global_step": 207396, "epoch": 4938} {"train_loss": -7.300205230712891, "global_step": 207397, "epoch": 4938} {"train_loss": -7.327963829040527, "global_step": 207398, "epoch": 4938} {"train_loss": -7.23464822769165, "global_step": 207399, "epoch": 4938} {"train_loss": -7.1886749267578125, "global_step": 207400, "epoch": 4938} {"train_loss": -7.242603302001953, "global_step": 207401, "epoch": 4938} {"train_loss": -7.279486179351807, "global_step": 207402, "epoch": 4938} {"train_loss": -7.292662620544434, "global_step": 207403, "epoch": 4938} {"train_loss": -7.311621189117432, "global_step": 207404, "epoch": 4938} {"train_loss": -7.235001564025879, "global_step": 207405, "epoch": 4938} {"train_loss": -7.237060546875, "global_step": 207406, "epoch": 4938} {"train_loss": -7.3209381103515625, "global_step": 207407, "epoch": 4938} {"train_loss": -7.404439926147461, "global_step": 207408, "epoch": 4938} {"train_loss": -7.21592378616333, "global_step": 207409, "epoch": 4938} {"train_loss": -7.327278137207031, "global_step": 207410, "epoch": 4938} {"train_loss": -7.061156749725342, "global_step": 207411, "epoch": 4938} {"train_loss": -7.189458847045898, "global_step": 207412, "epoch": 4938} {"train_loss": -7.161829471588135, "global_step": 207413, "epoch": 4938} {"train_loss": -7.160762310028076, "global_step": 207414, "epoch": 4938} {"train_loss": -7.316919326782227, "global_step": 207415, "epoch": 4938} {"train_loss": -7.218290328979492, "global_step": 207416, "epoch": 4938} {"train_loss": -7.200977325439453, "global_step": 207417, "epoch": 4938} {"train_loss": -7.224023818969727, "global_step": 207418, "epoch": 4938} {"train_loss": -7.235195159912109, "global_step": 207419, "epoch": 4938} {"train_loss": -7.159768104553223, "global_step": 207420, "epoch": 4938} {"train_loss": -7.234585762023926, "global_step": 207421, "epoch": 4938} {"train_loss": -7.334878444671631, "global_step": 207422, "epoch": 4938} {"train_loss": -7.212253570556641, "global_step": 207423, "epoch": 4938} {"train_loss": -7.1768293380737305, "global_step": 207424, "epoch": 4938} {"train_loss": -7.3496198654174805, "global_step": 207425, "epoch": 4938} {"train_loss": -7.348592281341553, "global_step": 207426, "epoch": 4938} {"train_loss": -7.303879261016846, "global_step": 207427, "epoch": 4938} {"train_loss": -7.35605525970459, "global_step": 207428, "epoch": 4938} {"train_loss": -7.387941837310791, "global_step": 207429, "epoch": 4938} {"train_loss": -7.333737850189209, "global_step": 207430, "epoch": 4938} {"train_loss": -7.216734409332275, "global_step": 207431, "epoch": 4938} {"train_loss": -7.304617881774902, "global_step": 207432, "epoch": 4938} {"train_loss": -7.183266639709473, "global_step": 207433, "epoch": 4938} {"train_loss": -7.315860748291016, "global_step": 207434, "epoch": 4938} {"train_loss": -7.3069000244140625, "global_step": 207435, "epoch": 4938} {"train_loss": -7.285077095031738, "global_step": 207436, "epoch": 4938} {"train_loss": -7.2637661184583395, "global_step": 207437, "epoch": 4938, "val_loss": 69110.0} {"train_loss": -7.32179069519043, "global_step": 207438, "epoch": 4939} {"train_loss": -7.267988204956055, "global_step": 207439, "epoch": 4939} {"train_loss": -7.2653608322143555, "global_step": 207440, "epoch": 4939} {"train_loss": -7.239645481109619, "global_step": 207441, "epoch": 4939} {"train_loss": -7.405489444732666, "global_step": 207442, "epoch": 4939} {"train_loss": -7.260115146636963, "global_step": 207443, "epoch": 4939} {"train_loss": -7.335442543029785, "global_step": 207444, "epoch": 4939} {"train_loss": -7.264129638671875, "global_step": 207445, "epoch": 4939} {"train_loss": -7.318387508392334, "global_step": 207446, "epoch": 4939} {"train_loss": -7.246293544769287, "global_step": 207447, "epoch": 4939} {"train_loss": -7.1607561111450195, "global_step": 207448, "epoch": 4939} {"train_loss": -7.344301223754883, "global_step": 207449, "epoch": 4939} {"train_loss": -7.235410690307617, "global_step": 207450, "epoch": 4939} {"train_loss": -7.243656158447266, "global_step": 207451, "epoch": 4939} {"train_loss": -7.184433937072754, "global_step": 207452, "epoch": 4939} {"train_loss": -7.181754112243652, "global_step": 207453, "epoch": 4939} {"train_loss": -7.213568210601807, "global_step": 207454, "epoch": 4939} {"train_loss": -7.286838054656982, "global_step": 207455, "epoch": 4939} {"train_loss": -7.258643627166748, "global_step": 207456, "epoch": 4939} {"train_loss": -7.114421844482422, "global_step": 207457, "epoch": 4939} {"train_loss": -7.22324275970459, "global_step": 207458, "epoch": 4939} {"train_loss": -7.23879337310791, "global_step": 207459, "epoch": 4939} {"train_loss": -7.258083820343018, "global_step": 207460, "epoch": 4939} {"train_loss": -7.274601459503174, "global_step": 207461, "epoch": 4939} {"train_loss": -7.176296234130859, "global_step": 207462, "epoch": 4939} {"train_loss": -7.231349945068359, "global_step": 207463, "epoch": 4939} {"train_loss": -7.282654762268066, "global_step": 207464, "epoch": 4939} {"train_loss": -7.298739433288574, "global_step": 207465, "epoch": 4939} {"train_loss": -7.251430988311768, "global_step": 207466, "epoch": 4939} {"train_loss": -7.147486686706543, "global_step": 207467, "epoch": 4939} {"train_loss": -7.236734867095947, "global_step": 207468, "epoch": 4939} {"train_loss": -7.365359306335449, "global_step": 207469, "epoch": 4939} {"train_loss": -7.312169075012207, "global_step": 207470, "epoch": 4939} {"train_loss": -7.241157531738281, "global_step": 207471, "epoch": 4939} {"train_loss": -7.414455413818359, "global_step": 207472, "epoch": 4939} {"train_loss": -7.366917610168457, "global_step": 207473, "epoch": 4939} {"train_loss": -7.313470363616943, "global_step": 207474, "epoch": 4939} {"train_loss": -7.214781761169434, "global_step": 207475, "epoch": 4939} {"train_loss": -7.2838592529296875, "global_step": 207476, "epoch": 4939} {"train_loss": -7.276120185852051, "global_step": 207477, "epoch": 4939} {"train_loss": -7.19966459274292, "global_step": 207478, "epoch": 4939} {"train_loss": -7.264204161507743, "global_step": 207479, "epoch": 4939, "val_loss": 69570.390625} {"train_loss": -7.214188575744629, "global_step": 207480, "epoch": 4940} {"train_loss": -7.089242935180664, "global_step": 207481, "epoch": 4940} {"train_loss": -7.236147403717041, "global_step": 207482, "epoch": 4940} {"train_loss": -7.073328018188477, "global_step": 207483, "epoch": 4940} {"train_loss": -7.124886512756348, "global_step": 207484, "epoch": 4940} {"train_loss": -7.22550106048584, "global_step": 207485, "epoch": 4940} {"train_loss": -7.191784381866455, "global_step": 207486, "epoch": 4940} {"train_loss": -7.33689022064209, "global_step": 207487, "epoch": 4940} {"train_loss": -7.235526084899902, "global_step": 207488, "epoch": 4940} {"train_loss": -7.231452465057373, "global_step": 207489, "epoch": 4940} {"train_loss": -7.230522632598877, "global_step": 207490, "epoch": 4940} {"train_loss": -7.167156219482422, "global_step": 207491, "epoch": 4940} {"train_loss": -7.201678276062012, "global_step": 207492, "epoch": 4940} {"train_loss": -7.143509387969971, "global_step": 207493, "epoch": 4940} {"train_loss": -7.284411907196045, "global_step": 207494, "epoch": 4940} {"train_loss": -7.167514324188232, "global_step": 207495, "epoch": 4940} {"train_loss": -7.27145528793335, "global_step": 207496, "epoch": 4940} {"train_loss": -7.3056640625, "global_step": 207497, "epoch": 4940} {"train_loss": -7.225105285644531, "global_step": 207498, "epoch": 4940} {"train_loss": -7.2330803871154785, "global_step": 207499, "epoch": 4940} {"train_loss": -7.231239318847656, "global_step": 207500, "epoch": 4940} {"train_loss": -7.365082740783691, "global_step": 207501, "epoch": 4940} {"train_loss": -7.182142734527588, "global_step": 207502, "epoch": 4940} {"train_loss": -7.172945976257324, "global_step": 207503, "epoch": 4940} {"train_loss": -7.215083122253418, "global_step": 207504, "epoch": 4940} {"train_loss": -7.26936674118042, "global_step": 207505, "epoch": 4940} {"train_loss": -7.342232704162598, "global_step": 207506, "epoch": 4940} {"train_loss": -7.304507732391357, "global_step": 207507, "epoch": 4940} {"train_loss": -7.33380126953125, "global_step": 207508, "epoch": 4940} {"train_loss": -7.3918633460998535, "global_step": 207509, "epoch": 4940} {"train_loss": -7.3473968505859375, "global_step": 207510, "epoch": 4940} {"train_loss": -7.336212158203125, "global_step": 207511, "epoch": 4940} {"train_loss": -7.368046760559082, "global_step": 207512, "epoch": 4940} {"train_loss": -7.429027080535889, "global_step": 207513, "epoch": 4940} {"train_loss": -7.2976789474487305, "global_step": 207514, "epoch": 4940} {"train_loss": -7.234406471252441, "global_step": 207515, "epoch": 4940} {"train_loss": -7.3133649826049805, "global_step": 207516, "epoch": 4940} {"train_loss": -7.23542594909668, "global_step": 207517, "epoch": 4940} {"train_loss": -7.279970169067383, "global_step": 207518, "epoch": 4940} {"train_loss": -7.308505058288574, "global_step": 207519, "epoch": 4940} {"train_loss": -7.205044746398926, "global_step": 207520, "epoch": 4940} {"train_loss": -7.2536891755603605, "global_step": 207521, "epoch": 4940, "val_loss": 69279.515625} {"train_loss": -7.256121635437012, "global_step": 207522, "epoch": 4941} {"train_loss": -7.145574569702148, "global_step": 207523, "epoch": 4941} {"train_loss": -7.305774688720703, "global_step": 207524, "epoch": 4941} {"train_loss": -7.278428077697754, "global_step": 207525, "epoch": 4941} {"train_loss": -7.429125785827637, "global_step": 207526, "epoch": 4941} {"train_loss": -7.3957929611206055, "global_step": 207527, "epoch": 4941} {"train_loss": -7.237215042114258, "global_step": 207528, "epoch": 4941} {"train_loss": -7.194919586181641, "global_step": 207529, "epoch": 4941} {"train_loss": -7.241155624389648, "global_step": 207530, "epoch": 4941} {"train_loss": -7.189362525939941, "global_step": 207531, "epoch": 4941} {"train_loss": -7.246189117431641, "global_step": 207532, "epoch": 4941} {"train_loss": -7.305778503417969, "global_step": 207533, "epoch": 4941} {"train_loss": -7.119211196899414, "global_step": 207534, "epoch": 4941} {"train_loss": -7.1943583488464355, "global_step": 207535, "epoch": 4941} {"train_loss": -7.356399059295654, "global_step": 207536, "epoch": 4941} {"train_loss": -7.1900954246521, "global_step": 207537, "epoch": 4941} {"train_loss": -7.274202346801758, "global_step": 207538, "epoch": 4941} {"train_loss": -7.269503593444824, "global_step": 207539, "epoch": 4941} {"train_loss": -7.235788822174072, "global_step": 207540, "epoch": 4941} {"train_loss": -7.24022912979126, "global_step": 207541, "epoch": 4941} {"train_loss": -7.221403121948242, "global_step": 207542, "epoch": 4941} {"train_loss": -7.293604850769043, "global_step": 207543, "epoch": 4941} {"train_loss": -7.198223114013672, "global_step": 207544, "epoch": 4941} {"train_loss": -7.329100608825684, "global_step": 207545, "epoch": 4941} {"train_loss": -7.369838237762451, "global_step": 207546, "epoch": 4941} {"train_loss": -7.309828758239746, "global_step": 207547, "epoch": 4941} {"train_loss": -7.244331359863281, "global_step": 207548, "epoch": 4941} {"train_loss": -7.243746280670166, "global_step": 207549, "epoch": 4941} {"train_loss": -7.0936970710754395, "global_step": 207550, "epoch": 4941} {"train_loss": -7.31040620803833, "global_step": 207551, "epoch": 4941} {"train_loss": -7.269741058349609, "global_step": 207552, "epoch": 4941} {"train_loss": -7.316265106201172, "global_step": 207553, "epoch": 4941} {"train_loss": -7.350017547607422, "global_step": 207554, "epoch": 4941} {"train_loss": -7.33966064453125, "global_step": 207555, "epoch": 4941} {"train_loss": -7.405245780944824, "global_step": 207556, "epoch": 4941} {"train_loss": -7.244729518890381, "global_step": 207557, "epoch": 4941} {"train_loss": -7.2766876220703125, "global_step": 207558, "epoch": 4941} {"train_loss": -7.266592979431152, "global_step": 207559, "epoch": 4941} {"train_loss": -7.260414123535156, "global_step": 207560, "epoch": 4941} {"train_loss": -7.324268341064453, "global_step": 207561, "epoch": 4941} {"train_loss": -7.296371936798096, "global_step": 207562, "epoch": 4941} {"train_loss": -7.27264598437718, "global_step": 207563, "epoch": 4941, "val_loss": 69297.5546875} {"train_loss": -7.390012264251709, "global_step": 207564, "epoch": 4942} {"train_loss": -7.220709323883057, "global_step": 207565, "epoch": 4942} {"train_loss": -7.326333999633789, "global_step": 207566, "epoch": 4942} {"train_loss": -7.396749973297119, "global_step": 207567, "epoch": 4942} {"train_loss": -7.362933158874512, "global_step": 207568, "epoch": 4942} {"train_loss": -7.324810981750488, "global_step": 207569, "epoch": 4942} {"train_loss": -7.4581122398376465, "global_step": 207570, "epoch": 4942} {"train_loss": -7.206974983215332, "global_step": 207571, "epoch": 4942} {"train_loss": -7.3415608406066895, "global_step": 207572, "epoch": 4942} {"train_loss": -7.305280685424805, "global_step": 207573, "epoch": 4942} {"train_loss": -7.27841854095459, "global_step": 207574, "epoch": 4942} {"train_loss": -7.395441055297852, "global_step": 207575, "epoch": 4942} {"train_loss": -7.253091812133789, "global_step": 207576, "epoch": 4942} {"train_loss": -7.406866073608398, "global_step": 207577, "epoch": 4942} {"train_loss": -7.24397087097168, "global_step": 207578, "epoch": 4942} {"train_loss": -7.223806381225586, "global_step": 207579, "epoch": 4942} {"train_loss": -7.244011402130127, "global_step": 207580, "epoch": 4942} {"train_loss": -7.2744550704956055, "global_step": 207581, "epoch": 4942} {"train_loss": -7.267280101776123, "global_step": 207582, "epoch": 4942} {"train_loss": -7.2145256996154785, "global_step": 207583, "epoch": 4942} {"train_loss": -7.250290393829346, "global_step": 207584, "epoch": 4942} {"train_loss": -7.197382926940918, "global_step": 207585, "epoch": 4942} {"train_loss": -7.271148681640625, "global_step": 207586, "epoch": 4942} {"train_loss": -7.180843830108643, "global_step": 207587, "epoch": 4942} {"train_loss": -7.232503890991211, "global_step": 207588, "epoch": 4942} {"train_loss": -7.259781837463379, "global_step": 207589, "epoch": 4942} {"train_loss": -7.359114170074463, "global_step": 207590, "epoch": 4942} {"train_loss": -7.134488582611084, "global_step": 207591, "epoch": 4942} {"train_loss": -7.211780548095703, "global_step": 207592, "epoch": 4942} {"train_loss": -7.17209005355835, "global_step": 207593, "epoch": 4942} {"train_loss": -7.1347455978393555, "global_step": 207594, "epoch": 4942} {"train_loss": -7.178114891052246, "global_step": 207595, "epoch": 4942} {"train_loss": -7.210659027099609, "global_step": 207596, "epoch": 4942} {"train_loss": -7.115021705627441, "global_step": 207597, "epoch": 4942} {"train_loss": -7.168625831604004, "global_step": 207598, "epoch": 4942} {"train_loss": -7.189223766326904, "global_step": 207599, "epoch": 4942} {"train_loss": -7.2971110343933105, "global_step": 207600, "epoch": 4942} {"train_loss": -7.266566276550293, "global_step": 207601, "epoch": 4942} {"train_loss": -7.337262153625488, "global_step": 207602, "epoch": 4942} {"train_loss": -7.254545211791992, "global_step": 207603, "epoch": 4942} {"train_loss": -7.289689064025879, "global_step": 207604, "epoch": 4942} {"train_loss": -7.265279724484398, "global_step": 207605, "epoch": 4942, "val_loss": 69285.9140625} {"train_loss": -7.330923080444336, "global_step": 207606, "epoch": 4943} {"train_loss": -7.2350006103515625, "global_step": 207607, "epoch": 4943} {"train_loss": -7.249081134796143, "global_step": 207608, "epoch": 4943} {"train_loss": -7.206582069396973, "global_step": 207609, "epoch": 4943} {"train_loss": -7.324153423309326, "global_step": 207610, "epoch": 4943} {"train_loss": -7.27201509475708, "global_step": 207611, "epoch": 4943} {"train_loss": -7.294813632965088, "global_step": 207612, "epoch": 4943} {"train_loss": -7.469933986663818, "global_step": 207613, "epoch": 4943} {"train_loss": -7.184322834014893, "global_step": 207614, "epoch": 4943} {"train_loss": -7.2437591552734375, "global_step": 207615, "epoch": 4943} {"train_loss": -7.1419196128845215, "global_step": 207616, "epoch": 4943} {"train_loss": -7.215664863586426, "global_step": 207617, "epoch": 4943} {"train_loss": -7.281195640563965, "global_step": 207618, "epoch": 4943} {"train_loss": -7.224283218383789, "global_step": 207619, "epoch": 4943} {"train_loss": -7.237578392028809, "global_step": 207620, "epoch": 4943} {"train_loss": -7.271068572998047, "global_step": 207621, "epoch": 4943} {"train_loss": -7.3177618980407715, "global_step": 207622, "epoch": 4943} {"train_loss": -7.314409255981445, "global_step": 207623, "epoch": 4943} {"train_loss": -7.133073806762695, "global_step": 207624, "epoch": 4943} {"train_loss": -7.320135116577148, "global_step": 207625, "epoch": 4943} {"train_loss": -7.296919822692871, "global_step": 207626, "epoch": 4943} {"train_loss": -7.290511608123779, "global_step": 207627, "epoch": 4943} {"train_loss": -7.316407203674316, "global_step": 207628, "epoch": 4943} {"train_loss": -7.2112812995910645, "global_step": 207629, "epoch": 4943} {"train_loss": -7.309021949768066, "global_step": 207630, "epoch": 4943} {"train_loss": -7.310368061065674, "global_step": 207631, "epoch": 4943} {"train_loss": -7.327828407287598, "global_step": 207632, "epoch": 4943} {"train_loss": -7.425908088684082, "global_step": 207633, "epoch": 4943} {"train_loss": -7.278359889984131, "global_step": 207634, "epoch": 4943} {"train_loss": -7.310132026672363, "global_step": 207635, "epoch": 4943} {"train_loss": -7.4179487228393555, "global_step": 207636, "epoch": 4943} {"train_loss": -7.312078475952148, "global_step": 207637, "epoch": 4943} {"train_loss": -7.273938179016113, "global_step": 207638, "epoch": 4943} {"train_loss": -7.312708377838135, "global_step": 207639, "epoch": 4943} {"train_loss": -7.305642127990723, "global_step": 207640, "epoch": 4943} {"train_loss": -7.253008842468262, "global_step": 207641, "epoch": 4943} {"train_loss": -7.2095818519592285, "global_step": 207642, "epoch": 4943} {"train_loss": -7.248064041137695, "global_step": 207643, "epoch": 4943} {"train_loss": -7.347288131713867, "global_step": 207644, "epoch": 4943} {"train_loss": -7.226688385009766, "global_step": 207645, "epoch": 4943} {"train_loss": -7.145662784576416, "global_step": 207646, "epoch": 4943} {"train_loss": -7.277122985749018, "global_step": 207647, "epoch": 4943, "val_loss": 69345.2421875} {"train_loss": -7.072981357574463, "global_step": 207648, "epoch": 4944} {"train_loss": -7.254131317138672, "global_step": 207649, "epoch": 4944} {"train_loss": -7.232367515563965, "global_step": 207650, "epoch": 4944} {"train_loss": -7.1550750732421875, "global_step": 207651, "epoch": 4944} {"train_loss": -7.223435878753662, "global_step": 207652, "epoch": 4944} {"train_loss": -7.261374473571777, "global_step": 207653, "epoch": 4944} {"train_loss": -7.197485446929932, "global_step": 207654, "epoch": 4944} {"train_loss": -7.207282066345215, "global_step": 207655, "epoch": 4944} {"train_loss": -7.257445812225342, "global_step": 207656, "epoch": 4944} {"train_loss": -7.250041484832764, "global_step": 207657, "epoch": 4944} {"train_loss": -7.215509414672852, "global_step": 207658, "epoch": 4944} {"train_loss": -7.283049583435059, "global_step": 207659, "epoch": 4944} {"train_loss": -7.317297458648682, "global_step": 207660, "epoch": 4944} {"train_loss": -7.328829765319824, "global_step": 207661, "epoch": 4944} {"train_loss": -7.321581840515137, "global_step": 207662, "epoch": 4944} {"train_loss": -7.397091865539551, "global_step": 207663, "epoch": 4944} {"train_loss": -7.316166400909424, "global_step": 207664, "epoch": 4944} {"train_loss": -7.297891139984131, "global_step": 207665, "epoch": 4944} {"train_loss": -7.14968204498291, "global_step": 207666, "epoch": 4944} {"train_loss": -7.340696334838867, "global_step": 207667, "epoch": 4944} {"train_loss": -7.176327705383301, "global_step": 207668, "epoch": 4944} {"train_loss": -7.309861660003662, "global_step": 207669, "epoch": 4944} {"train_loss": -7.340605735778809, "global_step": 207670, "epoch": 4944} {"train_loss": -7.382411956787109, "global_step": 207671, "epoch": 4944} {"train_loss": -7.246682167053223, "global_step": 207672, "epoch": 4944} {"train_loss": -7.297884464263916, "global_step": 207673, "epoch": 4944} {"train_loss": -7.337882041931152, "global_step": 207674, "epoch": 4944} {"train_loss": -7.307971954345703, "global_step": 207675, "epoch": 4944} {"train_loss": -7.249192237854004, "global_step": 207676, "epoch": 4944} {"train_loss": -7.423618793487549, "global_step": 207677, "epoch": 4944} {"train_loss": -7.346545696258545, "global_step": 207678, "epoch": 4944} {"train_loss": -7.211141586303711, "global_step": 207679, "epoch": 4944} {"train_loss": -7.2816901206970215, "global_step": 207680, "epoch": 4944} {"train_loss": -7.242090225219727, "global_step": 207681, "epoch": 4944} {"train_loss": -7.112932205200195, "global_step": 207682, "epoch": 4944} {"train_loss": -7.241482257843018, "global_step": 207683, "epoch": 4944} {"train_loss": -7.198460578918457, "global_step": 207684, "epoch": 4944} {"train_loss": -7.086058616638184, "global_step": 207685, "epoch": 4944} {"train_loss": -7.2343854904174805, "global_step": 207686, "epoch": 4944} {"train_loss": -7.200746059417725, "global_step": 207687, "epoch": 4944} {"train_loss": -7.320732116699219, "global_step": 207688, "epoch": 4944} {"train_loss": -7.257042952946255, "global_step": 207689, "epoch": 4944, "val_loss": 69222.3984375} {"train_loss": -7.185595512390137, "global_step": 207690, "epoch": 4945} {"train_loss": -7.319207191467285, "global_step": 207691, "epoch": 4945} {"train_loss": -7.260157585144043, "global_step": 207692, "epoch": 4945} {"train_loss": -7.257091999053955, "global_step": 207693, "epoch": 4945} {"train_loss": -7.2906341552734375, "global_step": 207694, "epoch": 4945} {"train_loss": -7.345942497253418, "global_step": 207695, "epoch": 4945} {"train_loss": -7.382250785827637, "global_step": 207696, "epoch": 4945} {"train_loss": -7.496492862701416, "global_step": 207697, "epoch": 4945} {"train_loss": -7.25129508972168, "global_step": 207698, "epoch": 4945} {"train_loss": -7.253447532653809, "global_step": 207699, "epoch": 4945} {"train_loss": -7.305495262145996, "global_step": 207700, "epoch": 4945} {"train_loss": -7.178200721740723, "global_step": 207701, "epoch": 4945} {"train_loss": -7.30776309967041, "global_step": 207702, "epoch": 4945} {"train_loss": -7.237741470336914, "global_step": 207703, "epoch": 4945} {"train_loss": -7.2614850997924805, "global_step": 207704, "epoch": 4945} {"train_loss": -7.306397438049316, "global_step": 207705, "epoch": 4945} {"train_loss": -7.258103847503662, "global_step": 207706, "epoch": 4945} {"train_loss": -7.2433905601501465, "global_step": 207707, "epoch": 4945} {"train_loss": -7.223832130432129, "global_step": 207708, "epoch": 4945} {"train_loss": -7.275121212005615, "global_step": 207709, "epoch": 4945} {"train_loss": -7.329261779785156, "global_step": 207710, "epoch": 4945} {"train_loss": -7.387094974517822, "global_step": 207711, "epoch": 4945} {"train_loss": -7.347836971282959, "global_step": 207712, "epoch": 4945} {"train_loss": -7.290908336639404, "global_step": 207713, "epoch": 4945} {"train_loss": -7.373874664306641, "global_step": 207714, "epoch": 4945} {"train_loss": -7.207461833953857, "global_step": 207715, "epoch": 4945} {"train_loss": -7.354530334472656, "global_step": 207716, "epoch": 4945} {"train_loss": -7.265228271484375, "global_step": 207717, "epoch": 4945} {"train_loss": -7.320957660675049, "global_step": 207718, "epoch": 4945} {"train_loss": -7.2982282638549805, "global_step": 207719, "epoch": 4945} {"train_loss": -7.361044406890869, "global_step": 207720, "epoch": 4945} {"train_loss": -7.382540702819824, "global_step": 207721, "epoch": 4945} {"train_loss": -7.32711124420166, "global_step": 207722, "epoch": 4945} {"train_loss": -7.337291717529297, "global_step": 207723, "epoch": 4945} {"train_loss": -7.264154434204102, "global_step": 207724, "epoch": 4945} {"train_loss": -7.240341663360596, "global_step": 207725, "epoch": 4945} {"train_loss": -7.398950576782227, "global_step": 207726, "epoch": 4945} {"train_loss": -7.321976661682129, "global_step": 207727, "epoch": 4945} {"train_loss": -7.238119125366211, "global_step": 207728, "epoch": 4945} {"train_loss": -7.251710891723633, "global_step": 207729, "epoch": 4945} {"train_loss": -7.296210289001465, "global_step": 207730, "epoch": 4945} {"train_loss": -7.30130536215646, "global_step": 207731, "epoch": 4945, "val_loss": 69124.078125} {"train_loss": -7.3066534996032715, "global_step": 207732, "epoch": 4946} {"train_loss": -7.327052116394043, "global_step": 207733, "epoch": 4946} {"train_loss": -7.318509101867676, "global_step": 207734, "epoch": 4946} {"train_loss": -7.290134429931641, "global_step": 207735, "epoch": 4946} {"train_loss": -7.381455421447754, "global_step": 207736, "epoch": 4946} {"train_loss": -7.354923248291016, "global_step": 207737, "epoch": 4946} {"train_loss": -7.320867538452148, "global_step": 207738, "epoch": 4946} {"train_loss": -7.362441062927246, "global_step": 207739, "epoch": 4946} {"train_loss": -7.256153106689453, "global_step": 207740, "epoch": 4946} {"train_loss": -7.128648281097412, "global_step": 207741, "epoch": 4946} {"train_loss": -7.325840950012207, "global_step": 207742, "epoch": 4946} {"train_loss": -7.307285785675049, "global_step": 207743, "epoch": 4946} {"train_loss": -7.035853385925293, "global_step": 207744, "epoch": 4946} {"train_loss": -7.267533302307129, "global_step": 207745, "epoch": 4946} {"train_loss": -7.123093605041504, "global_step": 207746, "epoch": 4946} {"train_loss": -7.042068958282471, "global_step": 207747, "epoch": 4946} {"train_loss": -7.3385186195373535, "global_step": 207748, "epoch": 4946} {"train_loss": -7.11916446685791, "global_step": 207749, "epoch": 4946} {"train_loss": -7.056049346923828, "global_step": 207750, "epoch": 4946} {"train_loss": -7.289864540100098, "global_step": 207751, "epoch": 4946} {"train_loss": -7.268054008483887, "global_step": 207752, "epoch": 4946} {"train_loss": -7.280652046203613, "global_step": 207753, "epoch": 4946} {"train_loss": -7.287382125854492, "global_step": 207754, "epoch": 4946} {"train_loss": -7.146885871887207, "global_step": 207755, "epoch": 4946} {"train_loss": -7.121522903442383, "global_step": 207756, "epoch": 4946} {"train_loss": -7.3636980056762695, "global_step": 207757, "epoch": 4946} {"train_loss": -7.202210426330566, "global_step": 207758, "epoch": 4946} {"train_loss": -7.3222198486328125, "global_step": 207759, "epoch": 4946} {"train_loss": -7.329740524291992, "global_step": 207760, "epoch": 4946} {"train_loss": -7.314538955688477, "global_step": 207761, "epoch": 4946} {"train_loss": -7.293804168701172, "global_step": 207762, "epoch": 4946} {"train_loss": -7.203975677490234, "global_step": 207763, "epoch": 4946} {"train_loss": -7.279952526092529, "global_step": 207764, "epoch": 4946} {"train_loss": -7.321698188781738, "global_step": 207765, "epoch": 4946} {"train_loss": -7.284259796142578, "global_step": 207766, "epoch": 4946} {"train_loss": -7.3850178718566895, "global_step": 207767, "epoch": 4946} {"train_loss": -7.392115116119385, "global_step": 207768, "epoch": 4946} {"train_loss": -7.238584995269775, "global_step": 207769, "epoch": 4946} {"train_loss": -7.271881580352783, "global_step": 207770, "epoch": 4946} {"train_loss": -7.338220596313477, "global_step": 207771, "epoch": 4946} {"train_loss": -7.322228908538818, "global_step": 207772, "epoch": 4946} {"train_loss": -7.267112084797451, "global_step": 207773, "epoch": 4946, "val_loss": 69107.8515625} {"train_loss": -7.269522666931152, "global_step": 207774, "epoch": 4947} {"train_loss": -7.278073310852051, "global_step": 207775, "epoch": 4947} {"train_loss": -7.322196006774902, "global_step": 207776, "epoch": 4947} {"train_loss": -7.266706466674805, "global_step": 207777, "epoch": 4947} {"train_loss": -7.358892440795898, "global_step": 207778, "epoch": 4947} {"train_loss": -7.2113447189331055, "global_step": 207779, "epoch": 4947} {"train_loss": -7.221158027648926, "global_step": 207780, "epoch": 4947} {"train_loss": -7.39240837097168, "global_step": 207781, "epoch": 4947} {"train_loss": -7.281982898712158, "global_step": 207782, "epoch": 4947} {"train_loss": -7.30274772644043, "global_step": 207783, "epoch": 4947} {"train_loss": -7.423952579498291, "global_step": 207784, "epoch": 4947} {"train_loss": -7.375559329986572, "global_step": 207785, "epoch": 4947} {"train_loss": -7.248106479644775, "global_step": 207786, "epoch": 4947} {"train_loss": -7.296524524688721, "global_step": 207787, "epoch": 4947} {"train_loss": -7.337956428527832, "global_step": 207788, "epoch": 4947} {"train_loss": -7.260773658752441, "global_step": 207789, "epoch": 4947} {"train_loss": -7.236931800842285, "global_step": 207790, "epoch": 4947} {"train_loss": -7.281651496887207, "global_step": 207791, "epoch": 4947} {"train_loss": -7.254880428314209, "global_step": 207792, "epoch": 4947} {"train_loss": -7.247952461242676, "global_step": 207793, "epoch": 4947} {"train_loss": -7.257288932800293, "global_step": 207794, "epoch": 4947} {"train_loss": -7.341868877410889, "global_step": 207795, "epoch": 4947} {"train_loss": -7.312255859375, "global_step": 207796, "epoch": 4947} {"train_loss": -7.226811408996582, "global_step": 207797, "epoch": 4947} {"train_loss": -7.3197784423828125, "global_step": 207798, "epoch": 4947} {"train_loss": -7.325523376464844, "global_step": 207799, "epoch": 4947} {"train_loss": -7.205593585968018, "global_step": 207800, "epoch": 4947} {"train_loss": -7.3855462074279785, "global_step": 207801, "epoch": 4947} {"train_loss": -7.335065841674805, "global_step": 207802, "epoch": 4947} {"train_loss": -7.241680145263672, "global_step": 207803, "epoch": 4947} {"train_loss": -7.363774299621582, "global_step": 207804, "epoch": 4947} {"train_loss": -7.213412761688232, "global_step": 207805, "epoch": 4947} {"train_loss": -7.30172061920166, "global_step": 207806, "epoch": 4947} {"train_loss": -7.226665496826172, "global_step": 207807, "epoch": 4947} {"train_loss": -7.368586540222168, "global_step": 207808, "epoch": 4947} {"train_loss": -7.472785949707031, "global_step": 207809, "epoch": 4947} {"train_loss": -7.2309250831604, "global_step": 207810, "epoch": 4947} {"train_loss": -7.398001670837402, "global_step": 207811, "epoch": 4947} {"train_loss": -7.267391204833984, "global_step": 207812, "epoch": 4947} {"train_loss": -7.339759826660156, "global_step": 207813, "epoch": 4947} {"train_loss": -7.347537994384766, "global_step": 207814, "epoch": 4947} {"train_loss": -7.30107687768482, "global_step": 207815, "epoch": 4947, "val_loss": 69150.75} {"train_loss": -7.228100776672363, "global_step": 207816, "epoch": 4948} {"train_loss": -7.23613166809082, "global_step": 207817, "epoch": 4948} {"train_loss": -7.366664886474609, "global_step": 207818, "epoch": 4948} {"train_loss": -7.257694244384766, "global_step": 207819, "epoch": 4948} {"train_loss": -7.324631690979004, "global_step": 207820, "epoch": 4948} {"train_loss": -7.324522018432617, "global_step": 207821, "epoch": 4948} {"train_loss": -7.308235168457031, "global_step": 207822, "epoch": 4948} {"train_loss": -7.256175994873047, "global_step": 207823, "epoch": 4948} {"train_loss": -7.121321201324463, "global_step": 207824, "epoch": 4948} {"train_loss": -7.261805057525635, "global_step": 207825, "epoch": 4948} {"train_loss": -7.28524112701416, "global_step": 207826, "epoch": 4948} {"train_loss": -7.199169635772705, "global_step": 207827, "epoch": 4948} {"train_loss": -7.330224990844727, "global_step": 207828, "epoch": 4948} {"train_loss": -7.174787521362305, "global_step": 207829, "epoch": 4948} {"train_loss": -7.202906608581543, "global_step": 207830, "epoch": 4948} {"train_loss": -7.196895122528076, "global_step": 207831, "epoch": 4948} {"train_loss": -7.074035167694092, "global_step": 207832, "epoch": 4948} {"train_loss": -7.203037261962891, "global_step": 207833, "epoch": 4948} {"train_loss": -7.131763458251953, "global_step": 207834, "epoch": 4948} {"train_loss": -6.971433639526367, "global_step": 207835, "epoch": 4948} {"train_loss": -7.183960914611816, "global_step": 207836, "epoch": 4948} {"train_loss": -7.114252090454102, "global_step": 207837, "epoch": 4948} {"train_loss": -7.153338432312012, "global_step": 207838, "epoch": 4948} {"train_loss": -7.11737585067749, "global_step": 207839, "epoch": 4948} {"train_loss": -7.085124492645264, "global_step": 207840, "epoch": 4948} {"train_loss": -7.215821266174316, "global_step": 207841, "epoch": 4948} {"train_loss": -7.023618698120117, "global_step": 207842, "epoch": 4948} {"train_loss": -7.16623592376709, "global_step": 207843, "epoch": 4948} {"train_loss": -7.21043062210083, "global_step": 207844, "epoch": 4948} {"train_loss": -7.16234016418457, "global_step": 207845, "epoch": 4948} {"train_loss": -7.264070510864258, "global_step": 207846, "epoch": 4948} {"train_loss": -7.210094928741455, "global_step": 207847, "epoch": 4948} {"train_loss": -7.165362358093262, "global_step": 207848, "epoch": 4948} {"train_loss": -7.120200157165527, "global_step": 207849, "epoch": 4948} {"train_loss": -7.134972095489502, "global_step": 207850, "epoch": 4948} {"train_loss": -7.225987434387207, "global_step": 207851, "epoch": 4948} {"train_loss": -7.249119758605957, "global_step": 207852, "epoch": 4948} {"train_loss": -7.196640491485596, "global_step": 207853, "epoch": 4948} {"train_loss": -7.315732479095459, "global_step": 207854, "epoch": 4948} {"train_loss": -7.277652740478516, "global_step": 207855, "epoch": 4948} {"train_loss": -7.212580680847168, "global_step": 207856, "epoch": 4948} {"train_loss": -7.204799334208171, "global_step": 207857, "epoch": 4948, "val_loss": 69103.4609375} {"train_loss": -7.317971706390381, "global_step": 207858, "epoch": 4949} {"train_loss": -7.309314727783203, "global_step": 207859, "epoch": 4949} {"train_loss": -7.2763495445251465, "global_step": 207860, "epoch": 4949} {"train_loss": -7.307877063751221, "global_step": 207861, "epoch": 4949} {"train_loss": -7.277265548706055, "global_step": 207862, "epoch": 4949} {"train_loss": -7.348123550415039, "global_step": 207863, "epoch": 4949} {"train_loss": -7.282768726348877, "global_step": 207864, "epoch": 4949} {"train_loss": -7.266664505004883, "global_step": 207865, "epoch": 4949} {"train_loss": -7.301689147949219, "global_step": 207866, "epoch": 4949} {"train_loss": -7.359884738922119, "global_step": 207867, "epoch": 4949} {"train_loss": -7.265357971191406, "global_step": 207868, "epoch": 4949} {"train_loss": -7.406028747558594, "global_step": 207869, "epoch": 4949} {"train_loss": -7.309484958648682, "global_step": 207870, "epoch": 4949} {"train_loss": -7.238368511199951, "global_step": 207871, "epoch": 4949} {"train_loss": -7.321343898773193, "global_step": 207872, "epoch": 4949} {"train_loss": -7.335887908935547, "global_step": 207873, "epoch": 4949} {"train_loss": -7.275512218475342, "global_step": 207874, "epoch": 4949} {"train_loss": -7.2361626625061035, "global_step": 207875, "epoch": 4949} {"train_loss": -7.262529373168945, "global_step": 207876, "epoch": 4949} {"train_loss": -7.2360429763793945, "global_step": 207877, "epoch": 4949} {"train_loss": -7.374217987060547, "global_step": 207878, "epoch": 4949} {"train_loss": -7.19766902923584, "global_step": 207879, "epoch": 4949} {"train_loss": -7.258443832397461, "global_step": 207880, "epoch": 4949} {"train_loss": -7.246628284454346, "global_step": 207881, "epoch": 4949} {"train_loss": -7.173828601837158, "global_step": 207882, "epoch": 4949} {"train_loss": -7.221829891204834, "global_step": 207883, "epoch": 4949} {"train_loss": -7.237157344818115, "global_step": 207884, "epoch": 4949} {"train_loss": -7.291375160217285, "global_step": 207885, "epoch": 4949} {"train_loss": -7.373712062835693, "global_step": 207886, "epoch": 4949} {"train_loss": -7.351691246032715, "global_step": 207887, "epoch": 4949} {"train_loss": -7.250515460968018, "global_step": 207888, "epoch": 4949} {"train_loss": -7.2933669090271, "global_step": 207889, "epoch": 4949} {"train_loss": -7.378048896789551, "global_step": 207890, "epoch": 4949} {"train_loss": -7.368807315826416, "global_step": 207891, "epoch": 4949} {"train_loss": -7.312848091125488, "global_step": 207892, "epoch": 4949} {"train_loss": -7.329224109649658, "global_step": 207893, "epoch": 4949} {"train_loss": -7.310019016265869, "global_step": 207894, "epoch": 4949} {"train_loss": -7.265565872192383, "global_step": 207895, "epoch": 4949} {"train_loss": -7.349148750305176, "global_step": 207896, "epoch": 4949} {"train_loss": -7.346855163574219, "global_step": 207897, "epoch": 4949} {"train_loss": -7.280459880828857, "global_step": 207898, "epoch": 4949} {"train_loss": -7.298300016494024, "global_step": 207899, "epoch": 4949, "val_loss": 69248.9375} {"train_loss": -7.278819561004639, "global_step": 207900, "epoch": 4950} {"train_loss": -7.286861419677734, "global_step": 207901, "epoch": 4950} {"train_loss": -7.345107078552246, "global_step": 207902, "epoch": 4950} {"train_loss": -7.190412998199463, "global_step": 207903, "epoch": 4950} {"train_loss": -7.418397903442383, "global_step": 207904, "epoch": 4950} {"train_loss": -7.390657424926758, "global_step": 207905, "epoch": 4950} {"train_loss": -7.30750846862793, "global_step": 207906, "epoch": 4950} {"train_loss": -7.3150200843811035, "global_step": 207907, "epoch": 4950} {"train_loss": -7.3180742263793945, "global_step": 207908, "epoch": 4950} {"train_loss": -7.371360778808594, "global_step": 207909, "epoch": 4950} {"train_loss": -7.376169204711914, "global_step": 207910, "epoch": 4950} {"train_loss": -7.388184547424316, "global_step": 207911, "epoch": 4950} {"train_loss": -7.342465400695801, "global_step": 207912, "epoch": 4950} {"train_loss": -7.359444618225098, "global_step": 207913, "epoch": 4950} {"train_loss": -7.273135185241699, "global_step": 207914, "epoch": 4950} {"train_loss": -7.271304607391357, "global_step": 207915, "epoch": 4950} {"train_loss": -7.3611297607421875, "global_step": 207916, "epoch": 4950} {"train_loss": -7.184277534484863, "global_step": 207917, "epoch": 4950} {"train_loss": -7.254953384399414, "global_step": 207918, "epoch": 4950} {"train_loss": -7.303077697753906, "global_step": 207919, "epoch": 4950} {"train_loss": -7.309107780456543, "global_step": 207920, "epoch": 4950} {"train_loss": -7.169928550720215, "global_step": 207921, "epoch": 4950} {"train_loss": -7.2955780029296875, "global_step": 207922, "epoch": 4950} {"train_loss": -7.327552795410156, "global_step": 207923, "epoch": 4950} {"train_loss": -7.2121148109436035, "global_step": 207924, "epoch": 4950} {"train_loss": -7.2630228996276855, "global_step": 207925, "epoch": 4950} {"train_loss": -7.083268165588379, "global_step": 207926, "epoch": 4950} {"train_loss": -7.232160568237305, "global_step": 207927, "epoch": 4950} {"train_loss": -7.24480676651001, "global_step": 207928, "epoch": 4950} {"train_loss": -7.151751518249512, "global_step": 207929, "epoch": 4950} {"train_loss": -7.3199357986450195, "global_step": 207930, "epoch": 4950} {"train_loss": -7.259940147399902, "global_step": 207931, "epoch": 4950} {"train_loss": -7.247441291809082, "global_step": 207932, "epoch": 4950} {"train_loss": -7.154375076293945, "global_step": 207933, "epoch": 4950} {"train_loss": -7.252182483673096, "global_step": 207934, "epoch": 4950} {"train_loss": -7.344901084899902, "global_step": 207935, "epoch": 4950} {"train_loss": -7.341998100280762, "global_step": 207936, "epoch": 4950} {"train_loss": -7.173728942871094, "global_step": 207937, "epoch": 4950} {"train_loss": -7.25210428237915, "global_step": 207938, "epoch": 4950} {"train_loss": -7.375181198120117, "global_step": 207939, "epoch": 4950} {"train_loss": -7.121430397033691, "global_step": 207940, "epoch": 4950} {"train_loss": -7.275301842462449, "global_step": 207941, "epoch": 4950, "train/sim_max_reward_0": 0.20276981390363913, "train/sim_max_reward_1": 0.8930077247288875, "train/sim_max_reward_2": 0.4620026278294858, "train/sim_max_reward_3": 0.5067696174819225, "train/sim_max_reward_4": 0.36383168576896596, "train/sim_max_reward_5": 0.961327408049759, "test/sim_max_reward_4400000": 0.1579363972409795, "test/sim_max_reward_4400001": 0.9693546839407218, "test/sim_max_reward_4400002": 0.8904203252284547, "test/sim_max_reward_4400003": 0.9741643778873078, "test/sim_max_reward_4400004": 0.17114765522018885, "test/sim_max_reward_4400005": 0.1989045943757619, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.30668603119249693, "test/sim_max_reward_4400009": 0.9835879521634968, "test/sim_max_reward_4400010": 0.24294698321465816, "test/sim_max_reward_4400011": 0.07296515015700239, "test/sim_max_reward_4400012": 0.9436059399228883, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.9245615275397613, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.3091329485906568, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.27722374038523473, "test/sim_max_reward_4400019": 0.34764500410059385, "test/sim_max_reward_4400020": 0.8823136829752289, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9792393394127489, "test/sim_max_reward_4400023": 0.05126917776903565, "test/sim_max_reward_4400024": 0.9800401771868944, "test/sim_max_reward_4400025": 0.26982320029856594, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.024247943230431963, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.8613407752306869, "test/sim_max_reward_4400030": 0.782256553933428, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.5941779838188038, "test/sim_max_reward_4400034": 0.9727306719029155, "test/sim_max_reward_4400035": 0.8385320283145293, "test/sim_max_reward_4400036": 0.5384115078432876, "test/sim_max_reward_4400037": 0.9780003576141957, "test/sim_max_reward_4400038": 0.9901354658721523, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.6822282449586862, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9685898761744274, "test/sim_max_reward_4400045": 0.9757509411623918, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.8869730913741544, "test/sim_max_reward_4400048": 0.8437859353351371, "test/sim_max_reward_4400049": 0.8727546964033656, "train/mean_score": 0.56495147962711, "test/mean_score": 0.6208993427424996, "val_loss": 69063.4140625} {"train_loss": -7.279659271240234, "global_step": 207942, "epoch": 4951} {"train_loss": -7.281904220581055, "global_step": 207943, "epoch": 4951} {"train_loss": -7.16423225402832, "global_step": 207944, "epoch": 4951} {"train_loss": -7.246067047119141, "global_step": 207945, "epoch": 4951} {"train_loss": -7.167839050292969, "global_step": 207946, "epoch": 4951} {"train_loss": -7.211278438568115, "global_step": 207947, "epoch": 4951} {"train_loss": -7.1971330642700195, "global_step": 207948, "epoch": 4951} {"train_loss": -7.149080276489258, "global_step": 207949, "epoch": 4951} {"train_loss": -7.073702335357666, "global_step": 207950, "epoch": 4951} {"train_loss": -7.1689453125, "global_step": 207951, "epoch": 4951} {"train_loss": -7.132680892944336, "global_step": 207952, "epoch": 4951} {"train_loss": -7.234830856323242, "global_step": 207953, "epoch": 4951} {"train_loss": -7.1710968017578125, "global_step": 207954, "epoch": 4951} {"train_loss": -7.208850383758545, "global_step": 207955, "epoch": 4951} {"train_loss": -7.205765724182129, "global_step": 207956, "epoch": 4951} {"train_loss": -7.163031101226807, "global_step": 207957, "epoch": 4951} {"train_loss": -7.210724830627441, "global_step": 207958, "epoch": 4951} {"train_loss": -7.196691513061523, "global_step": 207959, "epoch": 4951} {"train_loss": -7.312936782836914, "global_step": 207960, "epoch": 4951} {"train_loss": -7.273900032043457, "global_step": 207961, "epoch": 4951} {"train_loss": -7.25217342376709, "global_step": 207962, "epoch": 4951} {"train_loss": -7.296107292175293, "global_step": 207963, "epoch": 4951} {"train_loss": -7.148689270019531, "global_step": 207964, "epoch": 4951} {"train_loss": -7.262234687805176, "global_step": 207965, "epoch": 4951} {"train_loss": -7.2938761711120605, "global_step": 207966, "epoch": 4951} {"train_loss": -7.372906684875488, "global_step": 207967, "epoch": 4951} {"train_loss": -7.397871017456055, "global_step": 207968, "epoch": 4951} {"train_loss": -7.237567901611328, "global_step": 207969, "epoch": 4951} {"train_loss": -7.262417793273926, "global_step": 207970, "epoch": 4951} {"train_loss": -7.258551597595215, "global_step": 207971, "epoch": 4951} {"train_loss": -7.2739434242248535, "global_step": 207972, "epoch": 4951} {"train_loss": -7.360759735107422, "global_step": 207973, "epoch": 4951} {"train_loss": -7.226560115814209, "global_step": 207974, "epoch": 4951} {"train_loss": -7.3189849853515625, "global_step": 207975, "epoch": 4951} {"train_loss": -7.229539394378662, "global_step": 207976, "epoch": 4951} {"train_loss": -7.294731140136719, "global_step": 207977, "epoch": 4951} {"train_loss": -7.39261531829834, "global_step": 207978, "epoch": 4951} {"train_loss": -7.283099174499512, "global_step": 207979, "epoch": 4951} {"train_loss": -7.285890579223633, "global_step": 207980, "epoch": 4951} {"train_loss": -7.301822185516357, "global_step": 207981, "epoch": 4951} {"train_loss": -7.24146842956543, "global_step": 207982, "epoch": 4951} {"train_loss": -7.248317003250122, "global_step": 207983, "epoch": 4951, "val_loss": 69196.703125} {"train_loss": -7.325428009033203, "global_step": 207984, "epoch": 4952} {"train_loss": -7.296810150146484, "global_step": 207985, "epoch": 4952} {"train_loss": -7.250637531280518, "global_step": 207986, "epoch": 4952} {"train_loss": -7.392218112945557, "global_step": 207987, "epoch": 4952} {"train_loss": -7.395891189575195, "global_step": 207988, "epoch": 4952} {"train_loss": -7.369377136230469, "global_step": 207989, "epoch": 4952} {"train_loss": -7.380886077880859, "global_step": 207990, "epoch": 4952} {"train_loss": -7.331566333770752, "global_step": 207991, "epoch": 4952} {"train_loss": -7.378606796264648, "global_step": 207992, "epoch": 4952} {"train_loss": -7.4114203453063965, "global_step": 207993, "epoch": 4952} {"train_loss": -7.390707969665527, "global_step": 207994, "epoch": 4952} {"train_loss": -7.267604351043701, "global_step": 207995, "epoch": 4952} {"train_loss": -7.448781967163086, "global_step": 207996, "epoch": 4952} {"train_loss": -7.163778305053711, "global_step": 207997, "epoch": 4952} {"train_loss": -7.284489631652832, "global_step": 207998, "epoch": 4952} {"train_loss": -7.366241931915283, "global_step": 207999, "epoch": 4952} {"train_loss": -7.347137928009033, "global_step": 208000, "epoch": 4952} {"train_loss": -7.168649673461914, "global_step": 208001, "epoch": 4952} {"train_loss": -7.375147819519043, "global_step": 208002, "epoch": 4952} {"train_loss": -7.448068618774414, "global_step": 208003, "epoch": 4952} {"train_loss": -7.2096452713012695, "global_step": 208004, "epoch": 4952} {"train_loss": -7.389836311340332, "global_step": 208005, "epoch": 4952} {"train_loss": -7.328505516052246, "global_step": 208006, "epoch": 4952} {"train_loss": -7.196831703186035, "global_step": 208007, "epoch": 4952} {"train_loss": -7.296239852905273, "global_step": 208008, "epoch": 4952} {"train_loss": -7.269546031951904, "global_step": 208009, "epoch": 4952} {"train_loss": -7.282105922698975, "global_step": 208010, "epoch": 4952} {"train_loss": -7.232909202575684, "global_step": 208011, "epoch": 4952} {"train_loss": -7.325109481811523, "global_step": 208012, "epoch": 4952} {"train_loss": -7.3734564781188965, "global_step": 208013, "epoch": 4952} {"train_loss": -7.306895732879639, "global_step": 208014, "epoch": 4952} {"train_loss": -7.433969974517822, "global_step": 208015, "epoch": 4952} {"train_loss": -7.255836486816406, "global_step": 208016, "epoch": 4952} {"train_loss": -7.296389579772949, "global_step": 208017, "epoch": 4952} {"train_loss": -7.301834583282471, "global_step": 208018, "epoch": 4952} {"train_loss": -7.420106887817383, "global_step": 208019, "epoch": 4952} {"train_loss": -7.188360214233398, "global_step": 208020, "epoch": 4952} {"train_loss": -7.259039878845215, "global_step": 208021, "epoch": 4952} {"train_loss": -7.26410436630249, "global_step": 208022, "epoch": 4952} {"train_loss": -7.30442476272583, "global_step": 208023, "epoch": 4952} {"train_loss": -7.365228652954102, "global_step": 208024, "epoch": 4952} {"train_loss": -7.3213852700733, "global_step": 208025, "epoch": 4952, "val_loss": 69148.6015625} {"train_loss": -7.138214111328125, "global_step": 208026, "epoch": 4953} {"train_loss": -7.245148181915283, "global_step": 208027, "epoch": 4953} {"train_loss": -7.181662559509277, "global_step": 208028, "epoch": 4953} {"train_loss": -7.214155197143555, "global_step": 208029, "epoch": 4953} {"train_loss": -7.11635684967041, "global_step": 208030, "epoch": 4953} {"train_loss": -7.144841194152832, "global_step": 208031, "epoch": 4953} {"train_loss": -7.2649054527282715, "global_step": 208032, "epoch": 4953} {"train_loss": -7.189281940460205, "global_step": 208033, "epoch": 4953} {"train_loss": -7.211540699005127, "global_step": 208034, "epoch": 4953} {"train_loss": -7.130107879638672, "global_step": 208035, "epoch": 4953} {"train_loss": -7.201770782470703, "global_step": 208036, "epoch": 4953} {"train_loss": -7.308530330657959, "global_step": 208037, "epoch": 4953} {"train_loss": -7.297398090362549, "global_step": 208038, "epoch": 4953} {"train_loss": -7.232490539550781, "global_step": 208039, "epoch": 4953} {"train_loss": -7.147362232208252, "global_step": 208040, "epoch": 4953} {"train_loss": -7.170447826385498, "global_step": 208041, "epoch": 4953} {"train_loss": -7.2088727951049805, "global_step": 208042, "epoch": 4953} {"train_loss": -7.31806755065918, "global_step": 208043, "epoch": 4953} {"train_loss": -7.270367622375488, "global_step": 208044, "epoch": 4953} {"train_loss": -7.2241530418396, "global_step": 208045, "epoch": 4953} {"train_loss": -7.309515953063965, "global_step": 208046, "epoch": 4953} {"train_loss": -7.231378555297852, "global_step": 208047, "epoch": 4953} {"train_loss": -7.1792192459106445, "global_step": 208048, "epoch": 4953} {"train_loss": -7.361266136169434, "global_step": 208049, "epoch": 4953} {"train_loss": -7.329423904418945, "global_step": 208050, "epoch": 4953} {"train_loss": -7.333436012268066, "global_step": 208051, "epoch": 4953} {"train_loss": -7.358948707580566, "global_step": 208052, "epoch": 4953} {"train_loss": -7.3003621101379395, "global_step": 208053, "epoch": 4953} {"train_loss": -7.236869812011719, "global_step": 208054, "epoch": 4953} {"train_loss": -7.352541923522949, "global_step": 208055, "epoch": 4953} {"train_loss": -7.285861968994141, "global_step": 208056, "epoch": 4953} {"train_loss": -7.300729751586914, "global_step": 208057, "epoch": 4953} {"train_loss": -7.351279258728027, "global_step": 208058, "epoch": 4953} {"train_loss": -7.316475868225098, "global_step": 208059, "epoch": 4953} {"train_loss": -7.272831916809082, "global_step": 208060, "epoch": 4953} {"train_loss": -7.349837303161621, "global_step": 208061, "epoch": 4953} {"train_loss": -7.329110622406006, "global_step": 208062, "epoch": 4953} {"train_loss": -7.3092942237854, "global_step": 208063, "epoch": 4953} {"train_loss": -7.393433094024658, "global_step": 208064, "epoch": 4953} {"train_loss": -7.336102485656738, "global_step": 208065, "epoch": 4953} {"train_loss": -7.352456092834473, "global_step": 208066, "epoch": 4953} {"train_loss": -7.264319499333699, "global_step": 208067, "epoch": 4953, "val_loss": 69443.28125} {"train_loss": -7.43790340423584, "global_step": 208068, "epoch": 4954} {"train_loss": -7.488034248352051, "global_step": 208069, "epoch": 4954} {"train_loss": -7.463364601135254, "global_step": 208070, "epoch": 4954} {"train_loss": -7.484931945800781, "global_step": 208071, "epoch": 4954} {"train_loss": -7.408604621887207, "global_step": 208072, "epoch": 4954} {"train_loss": -7.277141571044922, "global_step": 208073, "epoch": 4954} {"train_loss": -7.291426181793213, "global_step": 208074, "epoch": 4954} {"train_loss": -7.2972846031188965, "global_step": 208075, "epoch": 4954} {"train_loss": -7.333359718322754, "global_step": 208076, "epoch": 4954} {"train_loss": -7.263158798217773, "global_step": 208077, "epoch": 4954} {"train_loss": -7.323716163635254, "global_step": 208078, "epoch": 4954} {"train_loss": -7.346652507781982, "global_step": 208079, "epoch": 4954} {"train_loss": -7.432773590087891, "global_step": 208080, "epoch": 4954} {"train_loss": -7.456677436828613, "global_step": 208081, "epoch": 4954} {"train_loss": -7.47130012512207, "global_step": 208082, "epoch": 4954} {"train_loss": -7.385026931762695, "global_step": 208083, "epoch": 4954} {"train_loss": -7.385618209838867, "global_step": 208084, "epoch": 4954} {"train_loss": -7.328524112701416, "global_step": 208085, "epoch": 4954} {"train_loss": -7.387614727020264, "global_step": 208086, "epoch": 4954} {"train_loss": -7.1817169189453125, "global_step": 208087, "epoch": 4954} {"train_loss": -7.224624156951904, "global_step": 208088, "epoch": 4954} {"train_loss": -7.331892967224121, "global_step": 208089, "epoch": 4954} {"train_loss": -7.298971652984619, "global_step": 208090, "epoch": 4954} {"train_loss": -7.363726615905762, "global_step": 208091, "epoch": 4954} {"train_loss": -7.423628330230713, "global_step": 208092, "epoch": 4954} {"train_loss": -7.350817680358887, "global_step": 208093, "epoch": 4954} {"train_loss": -7.377826690673828, "global_step": 208094, "epoch": 4954} {"train_loss": -7.276577949523926, "global_step": 208095, "epoch": 4954} {"train_loss": -7.412835121154785, "global_step": 208096, "epoch": 4954} {"train_loss": -7.175572395324707, "global_step": 208097, "epoch": 4954} {"train_loss": -7.233767509460449, "global_step": 208098, "epoch": 4954} {"train_loss": -7.243824481964111, "global_step": 208099, "epoch": 4954} {"train_loss": -7.189986228942871, "global_step": 208100, "epoch": 4954} {"train_loss": -7.311985969543457, "global_step": 208101, "epoch": 4954} {"train_loss": -7.121717929840088, "global_step": 208102, "epoch": 4954} {"train_loss": -7.227203369140625, "global_step": 208103, "epoch": 4954} {"train_loss": -7.308583736419678, "global_step": 208104, "epoch": 4954} {"train_loss": -7.230228424072266, "global_step": 208105, "epoch": 4954} {"train_loss": -7.288170337677002, "global_step": 208106, "epoch": 4954} {"train_loss": -7.205618858337402, "global_step": 208107, "epoch": 4954} {"train_loss": -7.2771759033203125, "global_step": 208108, "epoch": 4954} {"train_loss": -7.322231690088908, "global_step": 208109, "epoch": 4954, "val_loss": 69040.7421875} {"train_loss": -7.3567328453063965, "global_step": 208110, "epoch": 4955} {"train_loss": -7.1704607009887695, "global_step": 208111, "epoch": 4955} {"train_loss": -7.3219404220581055, "global_step": 208112, "epoch": 4955} {"train_loss": -7.278444290161133, "global_step": 208113, "epoch": 4955} {"train_loss": -7.228397369384766, "global_step": 208114, "epoch": 4955} {"train_loss": -7.322122573852539, "global_step": 208115, "epoch": 4955} {"train_loss": -7.276705265045166, "global_step": 208116, "epoch": 4955} {"train_loss": -7.249023914337158, "global_step": 208117, "epoch": 4955} {"train_loss": -7.237581253051758, "global_step": 208118, "epoch": 4955} {"train_loss": -7.219238758087158, "global_step": 208119, "epoch": 4955} {"train_loss": -7.394041538238525, "global_step": 208120, "epoch": 4955} {"train_loss": -7.269906520843506, "global_step": 208121, "epoch": 4955} {"train_loss": -7.240240573883057, "global_step": 208122, "epoch": 4955} {"train_loss": -7.190127372741699, "global_step": 208123, "epoch": 4955} {"train_loss": -7.343173980712891, "global_step": 208124, "epoch": 4955} {"train_loss": -7.075318813323975, "global_step": 208125, "epoch": 4955} {"train_loss": -7.336124420166016, "global_step": 208126, "epoch": 4955} {"train_loss": -7.327808380126953, "global_step": 208127, "epoch": 4955} {"train_loss": -7.184444904327393, "global_step": 208128, "epoch": 4955} {"train_loss": -7.458193778991699, "global_step": 208129, "epoch": 4955} {"train_loss": -7.382842063903809, "global_step": 208130, "epoch": 4955} {"train_loss": -7.2718095779418945, "global_step": 208131, "epoch": 4955} {"train_loss": -7.368947505950928, "global_step": 208132, "epoch": 4955} {"train_loss": -7.298551559448242, "global_step": 208133, "epoch": 4955} {"train_loss": -7.264340877532959, "global_step": 208134, "epoch": 4955} {"train_loss": -7.410386085510254, "global_step": 208135, "epoch": 4955} {"train_loss": -7.421060562133789, "global_step": 208136, "epoch": 4955} {"train_loss": -7.387907028198242, "global_step": 208137, "epoch": 4955} {"train_loss": -7.317990303039551, "global_step": 208138, "epoch": 4955} {"train_loss": -7.438088417053223, "global_step": 208139, "epoch": 4955} {"train_loss": -7.398616790771484, "global_step": 208140, "epoch": 4955} {"train_loss": -7.210007667541504, "global_step": 208141, "epoch": 4955} {"train_loss": -7.3228960037231445, "global_step": 208142, "epoch": 4955} {"train_loss": -7.361217975616455, "global_step": 208143, "epoch": 4955} {"train_loss": -7.383906841278076, "global_step": 208144, "epoch": 4955} {"train_loss": -7.417332649230957, "global_step": 208145, "epoch": 4955} {"train_loss": -7.363365173339844, "global_step": 208146, "epoch": 4955} {"train_loss": -7.370279312133789, "global_step": 208147, "epoch": 4955} {"train_loss": -7.342514991760254, "global_step": 208148, "epoch": 4955} {"train_loss": -7.287848472595215, "global_step": 208149, "epoch": 4955} {"train_loss": -7.288109302520752, "global_step": 208150, "epoch": 4955} {"train_loss": -7.313572134290423, "global_step": 208151, "epoch": 4955, "val_loss": 69196.640625} {"train_loss": -7.35549783706665, "global_step": 208152, "epoch": 4956} {"train_loss": -7.236824989318848, "global_step": 208153, "epoch": 4956} {"train_loss": -7.324078559875488, "global_step": 208154, "epoch": 4956} {"train_loss": -7.336851119995117, "global_step": 208155, "epoch": 4956} {"train_loss": -7.301660060882568, "global_step": 208156, "epoch": 4956} {"train_loss": -7.373593330383301, "global_step": 208157, "epoch": 4956} {"train_loss": -7.252505302429199, "global_step": 208158, "epoch": 4956} {"train_loss": -7.353975772857666, "global_step": 208159, "epoch": 4956} {"train_loss": -7.303942680358887, "global_step": 208160, "epoch": 4956} {"train_loss": -7.361828327178955, "global_step": 208161, "epoch": 4956} {"train_loss": -7.261846542358398, "global_step": 208162, "epoch": 4956} {"train_loss": -7.42462158203125, "global_step": 208163, "epoch": 4956} {"train_loss": -7.076963424682617, "global_step": 208164, "epoch": 4956} {"train_loss": -7.2964043617248535, "global_step": 208165, "epoch": 4956} {"train_loss": -7.192350387573242, "global_step": 208166, "epoch": 4956} {"train_loss": -7.051287651062012, "global_step": 208167, "epoch": 4956} {"train_loss": -7.257444381713867, "global_step": 208168, "epoch": 4956} {"train_loss": -7.169442653656006, "global_step": 208169, "epoch": 4956} {"train_loss": -7.168488502502441, "global_step": 208170, "epoch": 4956} {"train_loss": -7.276329040527344, "global_step": 208171, "epoch": 4956} {"train_loss": -7.026161193847656, "global_step": 208172, "epoch": 4956} {"train_loss": -7.155374526977539, "global_step": 208173, "epoch": 4956} {"train_loss": -7.316244125366211, "global_step": 208174, "epoch": 4956} {"train_loss": -7.072391986846924, "global_step": 208175, "epoch": 4956} {"train_loss": -7.252899169921875, "global_step": 208176, "epoch": 4956} {"train_loss": -7.0827484130859375, "global_step": 208177, "epoch": 4956} {"train_loss": -7.211692810058594, "global_step": 208178, "epoch": 4956} {"train_loss": -7.015663146972656, "global_step": 208179, "epoch": 4956} {"train_loss": -6.946261882781982, "global_step": 208180, "epoch": 4956} {"train_loss": -7.150949478149414, "global_step": 208181, "epoch": 4956} {"train_loss": -7.131898403167725, "global_step": 208182, "epoch": 4956} {"train_loss": -7.168705940246582, "global_step": 208183, "epoch": 4956} {"train_loss": -7.130437850952148, "global_step": 208184, "epoch": 4956} {"train_loss": -7.095028877258301, "global_step": 208185, "epoch": 4956} {"train_loss": -7.106644630432129, "global_step": 208186, "epoch": 4956} {"train_loss": -7.1276702880859375, "global_step": 208187, "epoch": 4956} {"train_loss": -7.1532087326049805, "global_step": 208188, "epoch": 4956} {"train_loss": -7.148185729980469, "global_step": 208189, "epoch": 4956} {"train_loss": -7.1252875328063965, "global_step": 208190, "epoch": 4956} {"train_loss": -7.153411865234375, "global_step": 208191, "epoch": 4956} {"train_loss": -7.16926383972168, "global_step": 208192, "epoch": 4956} {"train_loss": -7.201526562372844, "global_step": 208193, "epoch": 4956, "val_loss": 69119.734375} {"train_loss": -7.267459869384766, "global_step": 208194, "epoch": 4957} {"train_loss": -7.26895809173584, "global_step": 208195, "epoch": 4957} {"train_loss": -7.354905128479004, "global_step": 208196, "epoch": 4957} {"train_loss": -7.218606948852539, "global_step": 208197, "epoch": 4957} {"train_loss": -7.369229316711426, "global_step": 208198, "epoch": 4957} {"train_loss": -7.233035087585449, "global_step": 208199, "epoch": 4957} {"train_loss": -7.242767333984375, "global_step": 208200, "epoch": 4957} {"train_loss": -7.222280502319336, "global_step": 208201, "epoch": 4957} {"train_loss": -7.187255382537842, "global_step": 208202, "epoch": 4957} {"train_loss": -7.166013717651367, "global_step": 208203, "epoch": 4957} {"train_loss": -7.284520149230957, "global_step": 208204, "epoch": 4957} {"train_loss": -7.202157497406006, "global_step": 208205, "epoch": 4957} {"train_loss": -7.296573162078857, "global_step": 208206, "epoch": 4957} {"train_loss": -7.183279991149902, "global_step": 208207, "epoch": 4957} {"train_loss": -7.164754867553711, "global_step": 208208, "epoch": 4957} {"train_loss": -7.180421829223633, "global_step": 208209, "epoch": 4957} {"train_loss": -7.097918510437012, "global_step": 208210, "epoch": 4957} {"train_loss": -7.190949440002441, "global_step": 208211, "epoch": 4957} {"train_loss": -7.235392093658447, "global_step": 208212, "epoch": 4957} {"train_loss": -7.280191898345947, "global_step": 208213, "epoch": 4957} {"train_loss": -7.241971492767334, "global_step": 208214, "epoch": 4957} {"train_loss": -7.069209098815918, "global_step": 208215, "epoch": 4957} {"train_loss": -7.248303413391113, "global_step": 208216, "epoch": 4957} {"train_loss": -7.134842872619629, "global_step": 208217, "epoch": 4957} {"train_loss": -7.191844940185547, "global_step": 208218, "epoch": 4957} {"train_loss": -7.307514190673828, "global_step": 208219, "epoch": 4957} {"train_loss": -7.310316562652588, "global_step": 208220, "epoch": 4957} {"train_loss": -7.2172346115112305, "global_step": 208221, "epoch": 4957} {"train_loss": -7.237957954406738, "global_step": 208222, "epoch": 4957} {"train_loss": -7.26215934753418, "global_step": 208223, "epoch": 4957} {"train_loss": -7.167632102966309, "global_step": 208224, "epoch": 4957} {"train_loss": -7.287080764770508, "global_step": 208225, "epoch": 4957} {"train_loss": -7.348060607910156, "global_step": 208226, "epoch": 4957} {"train_loss": -7.277187824249268, "global_step": 208227, "epoch": 4957} {"train_loss": -7.29273796081543, "global_step": 208228, "epoch": 4957} {"train_loss": -7.225273132324219, "global_step": 208229, "epoch": 4957} {"train_loss": -7.350167274475098, "global_step": 208230, "epoch": 4957} {"train_loss": -7.300487995147705, "global_step": 208231, "epoch": 4957} {"train_loss": -7.358393669128418, "global_step": 208232, "epoch": 4957} {"train_loss": -7.234600067138672, "global_step": 208233, "epoch": 4957} {"train_loss": -7.344919204711914, "global_step": 208234, "epoch": 4957} {"train_loss": -7.24687309492202, "global_step": 208235, "epoch": 4957, "val_loss": 69490.4296875} {"train_loss": -7.411818981170654, "global_step": 208236, "epoch": 4958} {"train_loss": -7.201419830322266, "global_step": 208237, "epoch": 4958} {"train_loss": -7.318244457244873, "global_step": 208238, "epoch": 4958} {"train_loss": -7.1084065437316895, "global_step": 208239, "epoch": 4958} {"train_loss": -7.343133449554443, "global_step": 208240, "epoch": 4958} {"train_loss": -7.234219551086426, "global_step": 208241, "epoch": 4958} {"train_loss": -7.219111442565918, "global_step": 208242, "epoch": 4958} {"train_loss": -7.355408668518066, "global_step": 208243, "epoch": 4958} {"train_loss": -7.162067413330078, "global_step": 208244, "epoch": 4958} {"train_loss": -7.204865455627441, "global_step": 208245, "epoch": 4958} {"train_loss": -7.324077606201172, "global_step": 208246, "epoch": 4958} {"train_loss": -7.180746078491211, "global_step": 208247, "epoch": 4958} {"train_loss": -7.26390266418457, "global_step": 208248, "epoch": 4958} {"train_loss": -7.198429107666016, "global_step": 208249, "epoch": 4958} {"train_loss": -7.19986629486084, "global_step": 208250, "epoch": 4958} {"train_loss": -7.312918663024902, "global_step": 208251, "epoch": 4958} {"train_loss": -7.172028541564941, "global_step": 208252, "epoch": 4958} {"train_loss": -7.2976226806640625, "global_step": 208253, "epoch": 4958} {"train_loss": -7.276394844055176, "global_step": 208254, "epoch": 4958} {"train_loss": -7.288873195648193, "global_step": 208255, "epoch": 4958} {"train_loss": -7.241683006286621, "global_step": 208256, "epoch": 4958} {"train_loss": -7.370360374450684, "global_step": 208257, "epoch": 4958} {"train_loss": -7.118168354034424, "global_step": 208258, "epoch": 4958} {"train_loss": -7.258363723754883, "global_step": 208259, "epoch": 4958} {"train_loss": -7.178289413452148, "global_step": 208260, "epoch": 4958} {"train_loss": -7.258222579956055, "global_step": 208261, "epoch": 4958} {"train_loss": -7.301603317260742, "global_step": 208262, "epoch": 4958} {"train_loss": -7.39137077331543, "global_step": 208263, "epoch": 4958} {"train_loss": -7.185269832611084, "global_step": 208264, "epoch": 4958} {"train_loss": -7.197659015655518, "global_step": 208265, "epoch": 4958} {"train_loss": -7.272022247314453, "global_step": 208266, "epoch": 4958} {"train_loss": -7.302383899688721, "global_step": 208267, "epoch": 4958} {"train_loss": -7.449608325958252, "global_step": 208268, "epoch": 4958} {"train_loss": -7.412774085998535, "global_step": 208269, "epoch": 4958} {"train_loss": -7.322387218475342, "global_step": 208270, "epoch": 4958} {"train_loss": -7.298492908477783, "global_step": 208271, "epoch": 4958} {"train_loss": -7.26737642288208, "global_step": 208272, "epoch": 4958} {"train_loss": -7.3848676681518555, "global_step": 208273, "epoch": 4958} {"train_loss": -7.3852691650390625, "global_step": 208274, "epoch": 4958} {"train_loss": -7.474099159240723, "global_step": 208275, "epoch": 4958} {"train_loss": -7.2972002029418945, "global_step": 208276, "epoch": 4958} {"train_loss": -7.279920736948649, "global_step": 208277, "epoch": 4958, "val_loss": 69172.625} {"train_loss": -7.336836338043213, "global_step": 208278, "epoch": 4959} {"train_loss": -7.319537162780762, "global_step": 208279, "epoch": 4959} {"train_loss": -7.291055202484131, "global_step": 208280, "epoch": 4959} {"train_loss": -7.17972469329834, "global_step": 208281, "epoch": 4959} {"train_loss": -7.338754177093506, "global_step": 208282, "epoch": 4959} {"train_loss": -7.286576271057129, "global_step": 208283, "epoch": 4959} {"train_loss": -7.194192409515381, "global_step": 208284, "epoch": 4959} {"train_loss": -7.2759833335876465, "global_step": 208285, "epoch": 4959} {"train_loss": -7.3577117919921875, "global_step": 208286, "epoch": 4959} {"train_loss": -7.2385687828063965, "global_step": 208287, "epoch": 4959} {"train_loss": -7.334160327911377, "global_step": 208288, "epoch": 4959} {"train_loss": -7.125735759735107, "global_step": 208289, "epoch": 4959} {"train_loss": -7.2636260986328125, "global_step": 208290, "epoch": 4959} {"train_loss": -7.06651496887207, "global_step": 208291, "epoch": 4959} {"train_loss": -7.142406463623047, "global_step": 208292, "epoch": 4959} {"train_loss": -7.234537601470947, "global_step": 208293, "epoch": 4959} {"train_loss": -7.149694442749023, "global_step": 208294, "epoch": 4959} {"train_loss": -7.174395561218262, "global_step": 208295, "epoch": 4959} {"train_loss": -7.248375415802002, "global_step": 208296, "epoch": 4959} {"train_loss": -7.3113789558410645, "global_step": 208297, "epoch": 4959} {"train_loss": -7.196752071380615, "global_step": 208298, "epoch": 4959} {"train_loss": -7.18311071395874, "global_step": 208299, "epoch": 4959} {"train_loss": -7.2543439865112305, "global_step": 208300, "epoch": 4959} {"train_loss": -7.070597171783447, "global_step": 208301, "epoch": 4959} {"train_loss": -7.189444541931152, "global_step": 208302, "epoch": 4959} {"train_loss": -7.179999351501465, "global_step": 208303, "epoch": 4959} {"train_loss": -7.1386003494262695, "global_step": 208304, "epoch": 4959} {"train_loss": -7.319326400756836, "global_step": 208305, "epoch": 4959} {"train_loss": -7.016445159912109, "global_step": 208306, "epoch": 4959} {"train_loss": -7.344285488128662, "global_step": 208307, "epoch": 4959} {"train_loss": -7.229063987731934, "global_step": 208308, "epoch": 4959} {"train_loss": -7.3571624755859375, "global_step": 208309, "epoch": 4959} {"train_loss": -7.214831352233887, "global_step": 208310, "epoch": 4959} {"train_loss": -7.143173694610596, "global_step": 208311, "epoch": 4959} {"train_loss": -7.220847129821777, "global_step": 208312, "epoch": 4959} {"train_loss": -7.2372612953186035, "global_step": 208313, "epoch": 4959} {"train_loss": -7.239450454711914, "global_step": 208314, "epoch": 4959} {"train_loss": -7.172297477722168, "global_step": 208315, "epoch": 4959} {"train_loss": -7.279512882232666, "global_step": 208316, "epoch": 4959} {"train_loss": -7.274933815002441, "global_step": 208317, "epoch": 4959} {"train_loss": -7.3670654296875, "global_step": 208318, "epoch": 4959} {"train_loss": -7.2327539920806885, "global_step": 208319, "epoch": 4959, "val_loss": 69325.515625} {"train_loss": -7.1822967529296875, "global_step": 208320, "epoch": 4960} {"train_loss": -7.362897872924805, "global_step": 208321, "epoch": 4960} {"train_loss": -7.296699523925781, "global_step": 208322, "epoch": 4960} {"train_loss": -7.2549920082092285, "global_step": 208323, "epoch": 4960} {"train_loss": -7.304619789123535, "global_step": 208324, "epoch": 4960} {"train_loss": -7.272748947143555, "global_step": 208325, "epoch": 4960} {"train_loss": -7.381015777587891, "global_step": 208326, "epoch": 4960} {"train_loss": -7.358964920043945, "global_step": 208327, "epoch": 4960} {"train_loss": -7.235310077667236, "global_step": 208328, "epoch": 4960} {"train_loss": -7.294425964355469, "global_step": 208329, "epoch": 4960} {"train_loss": -7.359367847442627, "global_step": 208330, "epoch": 4960} {"train_loss": -7.162115573883057, "global_step": 208331, "epoch": 4960} {"train_loss": -7.348864555358887, "global_step": 208332, "epoch": 4960} {"train_loss": -7.368368625640869, "global_step": 208333, "epoch": 4960} {"train_loss": -7.3066558837890625, "global_step": 208334, "epoch": 4960} {"train_loss": -7.4120707511901855, "global_step": 208335, "epoch": 4960} {"train_loss": -7.335908889770508, "global_step": 208336, "epoch": 4960} {"train_loss": -7.447857856750488, "global_step": 208337, "epoch": 4960} {"train_loss": -7.377711296081543, "global_step": 208338, "epoch": 4960} {"train_loss": -7.308760643005371, "global_step": 208339, "epoch": 4960} {"train_loss": -7.334588050842285, "global_step": 208340, "epoch": 4960} {"train_loss": -7.4065961837768555, "global_step": 208341, "epoch": 4960} {"train_loss": -7.247186660766602, "global_step": 208342, "epoch": 4960} {"train_loss": -7.398990631103516, "global_step": 208343, "epoch": 4960} {"train_loss": -7.269427299499512, "global_step": 208344, "epoch": 4960} {"train_loss": -7.287742614746094, "global_step": 208345, "epoch": 4960} {"train_loss": -7.372530460357666, "global_step": 208346, "epoch": 4960} {"train_loss": -7.259422302246094, "global_step": 208347, "epoch": 4960} {"train_loss": -7.361508846282959, "global_step": 208348, "epoch": 4960} {"train_loss": -7.404392242431641, "global_step": 208349, "epoch": 4960} {"train_loss": -7.312585353851318, "global_step": 208350, "epoch": 4960} {"train_loss": -7.353033542633057, "global_step": 208351, "epoch": 4960} {"train_loss": -7.382499694824219, "global_step": 208352, "epoch": 4960} {"train_loss": -7.307740211486816, "global_step": 208353, "epoch": 4960} {"train_loss": -7.260042190551758, "global_step": 208354, "epoch": 4960} {"train_loss": -7.289223670959473, "global_step": 208355, "epoch": 4960} {"train_loss": -7.376640796661377, "global_step": 208356, "epoch": 4960} {"train_loss": -7.410235404968262, "global_step": 208357, "epoch": 4960} {"train_loss": -7.384937286376953, "global_step": 208358, "epoch": 4960} {"train_loss": -7.361982345581055, "global_step": 208359, "epoch": 4960} {"train_loss": -7.404139041900635, "global_step": 208360, "epoch": 4960} {"train_loss": -7.329071078981672, "global_step": 208361, "epoch": 4960, "val_loss": 69268.03125} {"train_loss": -7.397273063659668, "global_step": 208362, "epoch": 4961} {"train_loss": -7.369510650634766, "global_step": 208363, "epoch": 4961} {"train_loss": -7.449869155883789, "global_step": 208364, "epoch": 4961} {"train_loss": -7.271018981933594, "global_step": 208365, "epoch": 4961} {"train_loss": -7.309844493865967, "global_step": 208366, "epoch": 4961} {"train_loss": -7.282009124755859, "global_step": 208367, "epoch": 4961} {"train_loss": -7.274821758270264, "global_step": 208368, "epoch": 4961} {"train_loss": -7.390360355377197, "global_step": 208369, "epoch": 4961} {"train_loss": -7.343907356262207, "global_step": 208370, "epoch": 4961} {"train_loss": -7.377206325531006, "global_step": 208371, "epoch": 4961} {"train_loss": -7.398475646972656, "global_step": 208372, "epoch": 4961} {"train_loss": -7.3493332862854, "global_step": 208373, "epoch": 4961} {"train_loss": -7.421604156494141, "global_step": 208374, "epoch": 4961} {"train_loss": -7.296869277954102, "global_step": 208375, "epoch": 4961} {"train_loss": -7.347075462341309, "global_step": 208376, "epoch": 4961} {"train_loss": -7.443957805633545, "global_step": 208377, "epoch": 4961} {"train_loss": -7.249823570251465, "global_step": 208378, "epoch": 4961} {"train_loss": -7.3056769371032715, "global_step": 208379, "epoch": 4961} {"train_loss": -7.3610076904296875, "global_step": 208380, "epoch": 4961} {"train_loss": -7.316255569458008, "global_step": 208381, "epoch": 4961} {"train_loss": -7.386388301849365, "global_step": 208382, "epoch": 4961} {"train_loss": -7.324162483215332, "global_step": 208383, "epoch": 4961} {"train_loss": -7.310564994812012, "global_step": 208384, "epoch": 4961} {"train_loss": -7.285003185272217, "global_step": 208385, "epoch": 4961} {"train_loss": -7.395463943481445, "global_step": 208386, "epoch": 4961} {"train_loss": -7.190529823303223, "global_step": 208387, "epoch": 4961} {"train_loss": -7.385288238525391, "global_step": 208388, "epoch": 4961} {"train_loss": -7.253198623657227, "global_step": 208389, "epoch": 4961} {"train_loss": -7.211467742919922, "global_step": 208390, "epoch": 4961} {"train_loss": -7.261231422424316, "global_step": 208391, "epoch": 4961} {"train_loss": -7.298922538757324, "global_step": 208392, "epoch": 4961} {"train_loss": -7.220014572143555, "global_step": 208393, "epoch": 4961} {"train_loss": -7.342254638671875, "global_step": 208394, "epoch": 4961} {"train_loss": -7.237611293792725, "global_step": 208395, "epoch": 4961} {"train_loss": -7.216507434844971, "global_step": 208396, "epoch": 4961} {"train_loss": -7.011468410491943, "global_step": 208397, "epoch": 4961} {"train_loss": -7.185750961303711, "global_step": 208398, "epoch": 4961} {"train_loss": -7.405145645141602, "global_step": 208399, "epoch": 4961} {"train_loss": -7.178571701049805, "global_step": 208400, "epoch": 4961} {"train_loss": -7.256009101867676, "global_step": 208401, "epoch": 4961} {"train_loss": -7.238639831542969, "global_step": 208402, "epoch": 4961} {"train_loss": -7.305616855621338, "global_step": 208403, "epoch": 4961, "val_loss": 69188.546875} {"train_loss": -7.267843246459961, "global_step": 208404, "epoch": 4962} {"train_loss": -7.315239906311035, "global_step": 208405, "epoch": 4962} {"train_loss": -7.240353584289551, "global_step": 208406, "epoch": 4962} {"train_loss": -7.268439292907715, "global_step": 208407, "epoch": 4962} {"train_loss": -7.352013111114502, "global_step": 208408, "epoch": 4962} {"train_loss": -7.264759540557861, "global_step": 208409, "epoch": 4962} {"train_loss": -7.347085952758789, "global_step": 208410, "epoch": 4962} {"train_loss": -7.2624711990356445, "global_step": 208411, "epoch": 4962} {"train_loss": -7.217853546142578, "global_step": 208412, "epoch": 4962} {"train_loss": -7.489146709442139, "global_step": 208413, "epoch": 4962} {"train_loss": -7.141408443450928, "global_step": 208414, "epoch": 4962} {"train_loss": -7.272633075714111, "global_step": 208415, "epoch": 4962} {"train_loss": -7.249642372131348, "global_step": 208416, "epoch": 4962} {"train_loss": -7.27575159072876, "global_step": 208417, "epoch": 4962} {"train_loss": -7.363170623779297, "global_step": 208418, "epoch": 4962} {"train_loss": -7.313067436218262, "global_step": 208419, "epoch": 4962} {"train_loss": -7.335981369018555, "global_step": 208420, "epoch": 4962} {"train_loss": -7.394652843475342, "global_step": 208421, "epoch": 4962} {"train_loss": -7.209538459777832, "global_step": 208422, "epoch": 4962} {"train_loss": -7.454104900360107, "global_step": 208423, "epoch": 4962} {"train_loss": -7.306999683380127, "global_step": 208424, "epoch": 4962} {"train_loss": -7.336018085479736, "global_step": 208425, "epoch": 4962} {"train_loss": -7.312380313873291, "global_step": 208426, "epoch": 4962} {"train_loss": -7.407014846801758, "global_step": 208427, "epoch": 4962} {"train_loss": -7.365810394287109, "global_step": 208428, "epoch": 4962} {"train_loss": -7.2227091789245605, "global_step": 208429, "epoch": 4962} {"train_loss": -7.229086399078369, "global_step": 208430, "epoch": 4962} {"train_loss": -7.373697280883789, "global_step": 208431, "epoch": 4962} {"train_loss": -7.336039066314697, "global_step": 208432, "epoch": 4962} {"train_loss": -7.271579742431641, "global_step": 208433, "epoch": 4962} {"train_loss": -7.124373435974121, "global_step": 208434, "epoch": 4962} {"train_loss": -7.296370983123779, "global_step": 208435, "epoch": 4962} {"train_loss": -7.359424114227295, "global_step": 208436, "epoch": 4962} {"train_loss": -7.102222442626953, "global_step": 208437, "epoch": 4962} {"train_loss": -7.242954254150391, "global_step": 208438, "epoch": 4962} {"train_loss": -7.248585224151611, "global_step": 208439, "epoch": 4962} {"train_loss": -7.265953540802002, "global_step": 208440, "epoch": 4962} {"train_loss": -7.009701251983643, "global_step": 208441, "epoch": 4962} {"train_loss": -7.296239852905273, "global_step": 208442, "epoch": 4962} {"train_loss": -7.182016849517822, "global_step": 208443, "epoch": 4962} {"train_loss": -7.18406343460083, "global_step": 208444, "epoch": 4962} {"train_loss": -7.282091129393804, "global_step": 208445, "epoch": 4962, "val_loss": 69222.0546875} {"train_loss": -7.2701287269592285, "global_step": 208446, "epoch": 4963} {"train_loss": -7.292173385620117, "global_step": 208447, "epoch": 4963} {"train_loss": -7.253331184387207, "global_step": 208448, "epoch": 4963} {"train_loss": -7.3135480880737305, "global_step": 208449, "epoch": 4963} {"train_loss": -7.366030693054199, "global_step": 208450, "epoch": 4963} {"train_loss": -7.247488021850586, "global_step": 208451, "epoch": 4963} {"train_loss": -7.355497360229492, "global_step": 208452, "epoch": 4963} {"train_loss": -7.2469282150268555, "global_step": 208453, "epoch": 4963} {"train_loss": -7.312238693237305, "global_step": 208454, "epoch": 4963} {"train_loss": -7.353174209594727, "global_step": 208455, "epoch": 4963} {"train_loss": -7.382613182067871, "global_step": 208456, "epoch": 4963} {"train_loss": -7.266164779663086, "global_step": 208457, "epoch": 4963} {"train_loss": -7.2453813552856445, "global_step": 208458, "epoch": 4963} {"train_loss": -7.1715803146362305, "global_step": 208459, "epoch": 4963} {"train_loss": -7.323722839355469, "global_step": 208460, "epoch": 4963} {"train_loss": -7.297943592071533, "global_step": 208461, "epoch": 4963} {"train_loss": -7.266287326812744, "global_step": 208462, "epoch": 4963} {"train_loss": -7.408133506774902, "global_step": 208463, "epoch": 4963} {"train_loss": -7.283892631530762, "global_step": 208464, "epoch": 4963} {"train_loss": -7.253540992736816, "global_step": 208465, "epoch": 4963} {"train_loss": -7.332769393920898, "global_step": 208466, "epoch": 4963} {"train_loss": -7.227319717407227, "global_step": 208467, "epoch": 4963} {"train_loss": -7.3502583503723145, "global_step": 208468, "epoch": 4963} {"train_loss": -7.2203288078308105, "global_step": 208469, "epoch": 4963} {"train_loss": -7.324047088623047, "global_step": 208470, "epoch": 4963} {"train_loss": -7.331232070922852, "global_step": 208471, "epoch": 4963} {"train_loss": -7.380642890930176, "global_step": 208472, "epoch": 4963} {"train_loss": -7.363389015197754, "global_step": 208473, "epoch": 4963} {"train_loss": -7.338418006896973, "global_step": 208474, "epoch": 4963} {"train_loss": -7.514094352722168, "global_step": 208475, "epoch": 4963} {"train_loss": -7.3304338455200195, "global_step": 208476, "epoch": 4963} {"train_loss": -7.270941734313965, "global_step": 208477, "epoch": 4963} {"train_loss": -7.394275665283203, "global_step": 208478, "epoch": 4963} {"train_loss": -7.256620407104492, "global_step": 208479, "epoch": 4963} {"train_loss": -7.205165863037109, "global_step": 208480, "epoch": 4963} {"train_loss": -7.303656101226807, "global_step": 208481, "epoch": 4963} {"train_loss": -7.292078971862793, "global_step": 208482, "epoch": 4963} {"train_loss": -7.380084991455078, "global_step": 208483, "epoch": 4963} {"train_loss": -7.191052436828613, "global_step": 208484, "epoch": 4963} {"train_loss": -7.213571548461914, "global_step": 208485, "epoch": 4963} {"train_loss": -7.27593994140625, "global_step": 208486, "epoch": 4963} {"train_loss": -7.297400213423229, "global_step": 208487, "epoch": 4963, "val_loss": 69331.5} {"train_loss": -7.137457847595215, "global_step": 208488, "epoch": 4964} {"train_loss": -7.24895715713501, "global_step": 208489, "epoch": 4964} {"train_loss": -7.320012092590332, "global_step": 208490, "epoch": 4964} {"train_loss": -7.2410054206848145, "global_step": 208491, "epoch": 4964} {"train_loss": -7.186100006103516, "global_step": 208492, "epoch": 4964} {"train_loss": -7.294337272644043, "global_step": 208493, "epoch": 4964} {"train_loss": -7.239161491394043, "global_step": 208494, "epoch": 4964} {"train_loss": -7.249239921569824, "global_step": 208495, "epoch": 4964} {"train_loss": -7.310864448547363, "global_step": 208496, "epoch": 4964} {"train_loss": -7.1914849281311035, "global_step": 208497, "epoch": 4964} {"train_loss": -7.2020955085754395, "global_step": 208498, "epoch": 4964} {"train_loss": -7.218441963195801, "global_step": 208499, "epoch": 4964} {"train_loss": -7.131743431091309, "global_step": 208500, "epoch": 4964} {"train_loss": -7.151375770568848, "global_step": 208501, "epoch": 4964} {"train_loss": -7.200742721557617, "global_step": 208502, "epoch": 4964} {"train_loss": -7.243966579437256, "global_step": 208503, "epoch": 4964} {"train_loss": -7.176390647888184, "global_step": 208504, "epoch": 4964} {"train_loss": -7.131188869476318, "global_step": 208505, "epoch": 4964} {"train_loss": -7.133162498474121, "global_step": 208506, "epoch": 4964} {"train_loss": -7.086666584014893, "global_step": 208507, "epoch": 4964} {"train_loss": -7.269812107086182, "global_step": 208508, "epoch": 4964} {"train_loss": -7.0787811279296875, "global_step": 208509, "epoch": 4964} {"train_loss": -7.199182987213135, "global_step": 208510, "epoch": 4964} {"train_loss": -7.052057266235352, "global_step": 208511, "epoch": 4964} {"train_loss": -7.0736284255981445, "global_step": 208512, "epoch": 4964} {"train_loss": -7.338438034057617, "global_step": 208513, "epoch": 4964} {"train_loss": -7.077152252197266, "global_step": 208514, "epoch": 4964} {"train_loss": -7.237042427062988, "global_step": 208515, "epoch": 4964} {"train_loss": -7.193988800048828, "global_step": 208516, "epoch": 4964} {"train_loss": -7.274151802062988, "global_step": 208517, "epoch": 4964} {"train_loss": -7.144606590270996, "global_step": 208518, "epoch": 4964} {"train_loss": -7.2663068771362305, "global_step": 208519, "epoch": 4964} {"train_loss": -7.1417083740234375, "global_step": 208520, "epoch": 4964} {"train_loss": -7.233367919921875, "global_step": 208521, "epoch": 4964} {"train_loss": -7.239449977874756, "global_step": 208522, "epoch": 4964} {"train_loss": -7.156411170959473, "global_step": 208523, "epoch": 4964} {"train_loss": -7.208434104919434, "global_step": 208524, "epoch": 4964} {"train_loss": -7.247220993041992, "global_step": 208525, "epoch": 4964} {"train_loss": -7.335679054260254, "global_step": 208526, "epoch": 4964} {"train_loss": -7.305141448974609, "global_step": 208527, "epoch": 4964} {"train_loss": -7.2632317543029785, "global_step": 208528, "epoch": 4964} {"train_loss": -7.207726342337472, "global_step": 208529, "epoch": 4964, "val_loss": 69310.578125} {"train_loss": -7.435679912567139, "global_step": 208530, "epoch": 4965} {"train_loss": -7.3266401290893555, "global_step": 208531, "epoch": 4965} {"train_loss": -7.273396015167236, "global_step": 208532, "epoch": 4965} {"train_loss": -7.306072235107422, "global_step": 208533, "epoch": 4965} {"train_loss": -7.20711612701416, "global_step": 208534, "epoch": 4965} {"train_loss": -7.198065757751465, "global_step": 208535, "epoch": 4965} {"train_loss": -7.208086967468262, "global_step": 208536, "epoch": 4965} {"train_loss": -7.2203145027160645, "global_step": 208537, "epoch": 4965} {"train_loss": -7.244931221008301, "global_step": 208538, "epoch": 4965} {"train_loss": -7.195066928863525, "global_step": 208539, "epoch": 4965} {"train_loss": -7.329923629760742, "global_step": 208540, "epoch": 4965} {"train_loss": -7.276913642883301, "global_step": 208541, "epoch": 4965} {"train_loss": -7.208913326263428, "global_step": 208542, "epoch": 4965} {"train_loss": -7.336645126342773, "global_step": 208543, "epoch": 4965} {"train_loss": -7.313093185424805, "global_step": 208544, "epoch": 4965} {"train_loss": -7.238689422607422, "global_step": 208545, "epoch": 4965} {"train_loss": -7.2651824951171875, "global_step": 208546, "epoch": 4965} {"train_loss": -7.260270595550537, "global_step": 208547, "epoch": 4965} {"train_loss": -7.331650733947754, "global_step": 208548, "epoch": 4965} {"train_loss": -7.344446182250977, "global_step": 208549, "epoch": 4965} {"train_loss": -7.270297050476074, "global_step": 208550, "epoch": 4965} {"train_loss": -7.347705841064453, "global_step": 208551, "epoch": 4965} {"train_loss": -7.37160587310791, "global_step": 208552, "epoch": 4965} {"train_loss": -7.2695631980896, "global_step": 208553, "epoch": 4965} {"train_loss": -7.232407569885254, "global_step": 208554, "epoch": 4965} {"train_loss": -7.212963104248047, "global_step": 208555, "epoch": 4965} {"train_loss": -7.203150749206543, "global_step": 208556, "epoch": 4965} {"train_loss": -7.1554155349731445, "global_step": 208557, "epoch": 4965} {"train_loss": -7.348645210266113, "global_step": 208558, "epoch": 4965} {"train_loss": -7.224235534667969, "global_step": 208559, "epoch": 4965} {"train_loss": -7.201794624328613, "global_step": 208560, "epoch": 4965} {"train_loss": -7.386190414428711, "global_step": 208561, "epoch": 4965} {"train_loss": -7.241467475891113, "global_step": 208562, "epoch": 4965} {"train_loss": -7.298830986022949, "global_step": 208563, "epoch": 4965} {"train_loss": -7.254558563232422, "global_step": 208564, "epoch": 4965} {"train_loss": -7.254443168640137, "global_step": 208565, "epoch": 4965} {"train_loss": -7.352999687194824, "global_step": 208566, "epoch": 4965} {"train_loss": -7.2873125076293945, "global_step": 208567, "epoch": 4965} {"train_loss": -7.229339599609375, "global_step": 208568, "epoch": 4965} {"train_loss": -7.309372901916504, "global_step": 208569, "epoch": 4965} {"train_loss": -7.146866798400879, "global_step": 208570, "epoch": 4965} {"train_loss": -7.2675416469573975, "global_step": 208571, "epoch": 4965, "val_loss": 69397.4921875} {"train_loss": -7.131779670715332, "global_step": 208572, "epoch": 4966} {"train_loss": -7.295661449432373, "global_step": 208573, "epoch": 4966} {"train_loss": -7.234461784362793, "global_step": 208574, "epoch": 4966} {"train_loss": -7.228041172027588, "global_step": 208575, "epoch": 4966} {"train_loss": -7.289126396179199, "global_step": 208576, "epoch": 4966} {"train_loss": -7.245490074157715, "global_step": 208577, "epoch": 4966} {"train_loss": -7.222538948059082, "global_step": 208578, "epoch": 4966} {"train_loss": -7.245295524597168, "global_step": 208579, "epoch": 4966} {"train_loss": -7.203598976135254, "global_step": 208580, "epoch": 4966} {"train_loss": -7.265506744384766, "global_step": 208581, "epoch": 4966} {"train_loss": -7.271020889282227, "global_step": 208582, "epoch": 4966} {"train_loss": -7.209839344024658, "global_step": 208583, "epoch": 4966} {"train_loss": -7.345220565795898, "global_step": 208584, "epoch": 4966} {"train_loss": -7.222459316253662, "global_step": 208585, "epoch": 4966} {"train_loss": -7.365783214569092, "global_step": 208586, "epoch": 4966} {"train_loss": -7.2607622146606445, "global_step": 208587, "epoch": 4966} {"train_loss": -7.361861705780029, "global_step": 208588, "epoch": 4966} {"train_loss": -7.239055633544922, "global_step": 208589, "epoch": 4966} {"train_loss": -7.352682590484619, "global_step": 208590, "epoch": 4966} {"train_loss": -7.276689529418945, "global_step": 208591, "epoch": 4966} {"train_loss": -7.262578010559082, "global_step": 208592, "epoch": 4966} {"train_loss": -7.374362945556641, "global_step": 208593, "epoch": 4966} {"train_loss": -7.35986852645874, "global_step": 208594, "epoch": 4966} {"train_loss": -7.268771171569824, "global_step": 208595, "epoch": 4966} {"train_loss": -7.3000078201293945, "global_step": 208596, "epoch": 4966} {"train_loss": -7.285489559173584, "global_step": 208597, "epoch": 4966} {"train_loss": -7.2770891189575195, "global_step": 208598, "epoch": 4966} {"train_loss": -7.370619773864746, "global_step": 208599, "epoch": 4966} {"train_loss": -7.28443717956543, "global_step": 208600, "epoch": 4966} {"train_loss": -7.171156883239746, "global_step": 208601, "epoch": 4966} {"train_loss": -7.257260322570801, "global_step": 208602, "epoch": 4966} {"train_loss": -7.175121307373047, "global_step": 208603, "epoch": 4966} {"train_loss": -7.363605499267578, "global_step": 208604, "epoch": 4966} {"train_loss": -7.180028915405273, "global_step": 208605, "epoch": 4966} {"train_loss": -7.2536516189575195, "global_step": 208606, "epoch": 4966} {"train_loss": -7.255609512329102, "global_step": 208607, "epoch": 4966} {"train_loss": -7.226268768310547, "global_step": 208608, "epoch": 4966} {"train_loss": -7.253743648529053, "global_step": 208609, "epoch": 4966} {"train_loss": -7.282051086425781, "global_step": 208610, "epoch": 4966} {"train_loss": -7.198800086975098, "global_step": 208611, "epoch": 4966} {"train_loss": -7.348138332366943, "global_step": 208612, "epoch": 4966} {"train_loss": -7.27080944606236, "global_step": 208613, "epoch": 4966, "val_loss": 69269.5703125} {"train_loss": -7.292524814605713, "global_step": 208614, "epoch": 4967} {"train_loss": -7.23220157623291, "global_step": 208615, "epoch": 4967} {"train_loss": -7.321133613586426, "global_step": 208616, "epoch": 4967} {"train_loss": -7.304387092590332, "global_step": 208617, "epoch": 4967} {"train_loss": -7.275289535522461, "global_step": 208618, "epoch": 4967} {"train_loss": -7.27783203125, "global_step": 208619, "epoch": 4967} {"train_loss": -7.23991584777832, "global_step": 208620, "epoch": 4967} {"train_loss": -7.461955547332764, "global_step": 208621, "epoch": 4967} {"train_loss": -7.2111101150512695, "global_step": 208622, "epoch": 4967} {"train_loss": -7.311347007751465, "global_step": 208623, "epoch": 4967} {"train_loss": -7.2967023849487305, "global_step": 208624, "epoch": 4967} {"train_loss": -7.481371879577637, "global_step": 208625, "epoch": 4967} {"train_loss": -7.502002716064453, "global_step": 208626, "epoch": 4967} {"train_loss": -7.381448268890381, "global_step": 208627, "epoch": 4967} {"train_loss": -7.321405410766602, "global_step": 208628, "epoch": 4967} {"train_loss": -7.326744079589844, "global_step": 208629, "epoch": 4967} {"train_loss": -7.427028656005859, "global_step": 208630, "epoch": 4967} {"train_loss": -7.383822441101074, "global_step": 208631, "epoch": 4967} {"train_loss": -7.299366474151611, "global_step": 208632, "epoch": 4967} {"train_loss": -7.432277202606201, "global_step": 208633, "epoch": 4967} {"train_loss": -7.471196174621582, "global_step": 208634, "epoch": 4967} {"train_loss": -7.3913092613220215, "global_step": 208635, "epoch": 4967} {"train_loss": -7.376719951629639, "global_step": 208636, "epoch": 4967} {"train_loss": -7.197291374206543, "global_step": 208637, "epoch": 4967} {"train_loss": -7.325011253356934, "global_step": 208638, "epoch": 4967} {"train_loss": -7.206233978271484, "global_step": 208639, "epoch": 4967} {"train_loss": -7.2539777755737305, "global_step": 208640, "epoch": 4967} {"train_loss": -7.297990798950195, "global_step": 208641, "epoch": 4967} {"train_loss": -7.2291107177734375, "global_step": 208642, "epoch": 4967} {"train_loss": -7.177202224731445, "global_step": 208643, "epoch": 4967} {"train_loss": -7.173731803894043, "global_step": 208644, "epoch": 4967} {"train_loss": -7.3044047355651855, "global_step": 208645, "epoch": 4967} {"train_loss": -7.299664497375488, "global_step": 208646, "epoch": 4967} {"train_loss": -7.207697868347168, "global_step": 208647, "epoch": 4967} {"train_loss": -7.3039374351501465, "global_step": 208648, "epoch": 4967} {"train_loss": -7.203438758850098, "global_step": 208649, "epoch": 4967} {"train_loss": -7.070627212524414, "global_step": 208650, "epoch": 4967} {"train_loss": -7.26568603515625, "global_step": 208651, "epoch": 4967} {"train_loss": -6.947812557220459, "global_step": 208652, "epoch": 4967} {"train_loss": -7.284337997436523, "global_step": 208653, "epoch": 4967} {"train_loss": -7.054155349731445, "global_step": 208654, "epoch": 4967} {"train_loss": -7.285765136991229, "global_step": 208655, "epoch": 4967, "val_loss": 69443.890625} {"train_loss": -7.1026177406311035, "global_step": 208656, "epoch": 4968} {"train_loss": -7.157107353210449, "global_step": 208657, "epoch": 4968} {"train_loss": -7.223354339599609, "global_step": 208658, "epoch": 4968} {"train_loss": -7.264179706573486, "global_step": 208659, "epoch": 4968} {"train_loss": -7.199488639831543, "global_step": 208660, "epoch": 4968} {"train_loss": -7.289649486541748, "global_step": 208661, "epoch": 4968} {"train_loss": -7.306859016418457, "global_step": 208662, "epoch": 4968} {"train_loss": -7.205442428588867, "global_step": 208663, "epoch": 4968} {"train_loss": -7.222058296203613, "global_step": 208664, "epoch": 4968} {"train_loss": -7.251049041748047, "global_step": 208665, "epoch": 4968} {"train_loss": -7.234593391418457, "global_step": 208666, "epoch": 4968} {"train_loss": -7.253533840179443, "global_step": 208667, "epoch": 4968} {"train_loss": -7.18562126159668, "global_step": 208668, "epoch": 4968} {"train_loss": -7.214059352874756, "global_step": 208669, "epoch": 4968} {"train_loss": -7.3166656494140625, "global_step": 208670, "epoch": 4968} {"train_loss": -7.307945251464844, "global_step": 208671, "epoch": 4968} {"train_loss": -7.161067962646484, "global_step": 208672, "epoch": 4968} {"train_loss": -7.360376358032227, "global_step": 208673, "epoch": 4968} {"train_loss": -7.201334476470947, "global_step": 208674, "epoch": 4968} {"train_loss": -7.026975631713867, "global_step": 208675, "epoch": 4968} {"train_loss": -7.195305347442627, "global_step": 208676, "epoch": 4968} {"train_loss": -7.140798568725586, "global_step": 208677, "epoch": 4968} {"train_loss": -7.084305763244629, "global_step": 208678, "epoch": 4968} {"train_loss": -7.053744316101074, "global_step": 208679, "epoch": 4968} {"train_loss": -7.162888526916504, "global_step": 208680, "epoch": 4968} {"train_loss": -7.245387077331543, "global_step": 208681, "epoch": 4968} {"train_loss": -7.253253936767578, "global_step": 208682, "epoch": 4968} {"train_loss": -7.2494707107543945, "global_step": 208683, "epoch": 4968} {"train_loss": -7.227814674377441, "global_step": 208684, "epoch": 4968} {"train_loss": -7.068154335021973, "global_step": 208685, "epoch": 4968} {"train_loss": -7.080043792724609, "global_step": 208686, "epoch": 4968} {"train_loss": -7.120512962341309, "global_step": 208687, "epoch": 4968} {"train_loss": -7.093575477600098, "global_step": 208688, "epoch": 4968} {"train_loss": -7.232545852661133, "global_step": 208689, "epoch": 4968} {"train_loss": -7.144803047180176, "global_step": 208690, "epoch": 4968} {"train_loss": -7.2041916847229, "global_step": 208691, "epoch": 4968} {"train_loss": -7.3111724853515625, "global_step": 208692, "epoch": 4968} {"train_loss": -7.199337005615234, "global_step": 208693, "epoch": 4968} {"train_loss": -7.312431812286377, "global_step": 208694, "epoch": 4968} {"train_loss": -7.218530654907227, "global_step": 208695, "epoch": 4968} {"train_loss": -7.273290157318115, "global_step": 208696, "epoch": 4968} {"train_loss": -7.206631910233271, "global_step": 208697, "epoch": 4968, "val_loss": 69258.234375} {"train_loss": -7.332127571105957, "global_step": 208698, "epoch": 4969} {"train_loss": -7.262448310852051, "global_step": 208699, "epoch": 4969} {"train_loss": -7.280150413513184, "global_step": 208700, "epoch": 4969} {"train_loss": -7.279086112976074, "global_step": 208701, "epoch": 4969} {"train_loss": -7.375134468078613, "global_step": 208702, "epoch": 4969} {"train_loss": -7.241471290588379, "global_step": 208703, "epoch": 4969} {"train_loss": -7.362484931945801, "global_step": 208704, "epoch": 4969} {"train_loss": -7.354621887207031, "global_step": 208705, "epoch": 4969} {"train_loss": -7.1591691970825195, "global_step": 208706, "epoch": 4969} {"train_loss": -7.322103500366211, "global_step": 208707, "epoch": 4969} {"train_loss": -7.339712619781494, "global_step": 208708, "epoch": 4969} {"train_loss": -7.256783485412598, "global_step": 208709, "epoch": 4969} {"train_loss": -7.29450798034668, "global_step": 208710, "epoch": 4969} {"train_loss": -7.3526611328125, "global_step": 208711, "epoch": 4969} {"train_loss": -7.251911640167236, "global_step": 208712, "epoch": 4969} {"train_loss": -7.296794414520264, "global_step": 208713, "epoch": 4969} {"train_loss": -7.120282173156738, "global_step": 208714, "epoch": 4969} {"train_loss": -7.194051742553711, "global_step": 208715, "epoch": 4969} {"train_loss": -7.179815292358398, "global_step": 208716, "epoch": 4969} {"train_loss": -7.184239387512207, "global_step": 208717, "epoch": 4969} {"train_loss": -7.331668853759766, "global_step": 208718, "epoch": 4969} {"train_loss": -7.21897029876709, "global_step": 208719, "epoch": 4969} {"train_loss": -7.401219367980957, "global_step": 208720, "epoch": 4969} {"train_loss": -7.093386650085449, "global_step": 208721, "epoch": 4969} {"train_loss": -7.287544250488281, "global_step": 208722, "epoch": 4969} {"train_loss": -7.323230743408203, "global_step": 208723, "epoch": 4969} {"train_loss": -7.256126403808594, "global_step": 208724, "epoch": 4969} {"train_loss": -7.2991943359375, "global_step": 208725, "epoch": 4969} {"train_loss": -7.207345008850098, "global_step": 208726, "epoch": 4969} {"train_loss": -7.354099273681641, "global_step": 208727, "epoch": 4969} {"train_loss": -7.272647857666016, "global_step": 208728, "epoch": 4969} {"train_loss": -7.319010257720947, "global_step": 208729, "epoch": 4969} {"train_loss": -7.318206310272217, "global_step": 208730, "epoch": 4969} {"train_loss": -7.314462184906006, "global_step": 208731, "epoch": 4969} {"train_loss": -7.3028411865234375, "global_step": 208732, "epoch": 4969} {"train_loss": -7.376344680786133, "global_step": 208733, "epoch": 4969} {"train_loss": -7.356308937072754, "global_step": 208734, "epoch": 4969} {"train_loss": -7.386296272277832, "global_step": 208735, "epoch": 4969} {"train_loss": -7.244707107543945, "global_step": 208736, "epoch": 4969} {"train_loss": -7.3320488929748535, "global_step": 208737, "epoch": 4969} {"train_loss": -7.230945587158203, "global_step": 208738, "epoch": 4969} {"train_loss": -7.283480542046683, "global_step": 208739, "epoch": 4969, "val_loss": 69136.640625} {"train_loss": -7.432936668395996, "global_step": 208740, "epoch": 4970} {"train_loss": -7.294719219207764, "global_step": 208741, "epoch": 4970} {"train_loss": -7.187687873840332, "global_step": 208742, "epoch": 4970} {"train_loss": -7.242527484893799, "global_step": 208743, "epoch": 4970} {"train_loss": -7.25894021987915, "global_step": 208744, "epoch": 4970} {"train_loss": -7.348270893096924, "global_step": 208745, "epoch": 4970} {"train_loss": -7.3253631591796875, "global_step": 208746, "epoch": 4970} {"train_loss": -7.2125325202941895, "global_step": 208747, "epoch": 4970} {"train_loss": -7.214089393615723, "global_step": 208748, "epoch": 4970} {"train_loss": -7.354901313781738, "global_step": 208749, "epoch": 4970} {"train_loss": -7.180987358093262, "global_step": 208750, "epoch": 4970} {"train_loss": -7.365276336669922, "global_step": 208751, "epoch": 4970} {"train_loss": -7.252957344055176, "global_step": 208752, "epoch": 4970} {"train_loss": -7.307465553283691, "global_step": 208753, "epoch": 4970} {"train_loss": -7.256251335144043, "global_step": 208754, "epoch": 4970} {"train_loss": -7.264215469360352, "global_step": 208755, "epoch": 4970} {"train_loss": -7.379844665527344, "global_step": 208756, "epoch": 4970} {"train_loss": -7.0998215675354, "global_step": 208757, "epoch": 4970} {"train_loss": -7.2433295249938965, "global_step": 208758, "epoch": 4970} {"train_loss": -7.182085037231445, "global_step": 208759, "epoch": 4970} {"train_loss": -7.247452259063721, "global_step": 208760, "epoch": 4970} {"train_loss": -7.160958290100098, "global_step": 208761, "epoch": 4970} {"train_loss": -7.100654602050781, "global_step": 208762, "epoch": 4970} {"train_loss": -7.234459400177002, "global_step": 208763, "epoch": 4970} {"train_loss": -7.209566593170166, "global_step": 208764, "epoch": 4970} {"train_loss": -7.204257011413574, "global_step": 208765, "epoch": 4970} {"train_loss": -7.2086005210876465, "global_step": 208766, "epoch": 4970} {"train_loss": -7.197580337524414, "global_step": 208767, "epoch": 4970} {"train_loss": -7.310837745666504, "global_step": 208768, "epoch": 4970} {"train_loss": -7.068974018096924, "global_step": 208769, "epoch": 4970} {"train_loss": -7.292341232299805, "global_step": 208770, "epoch": 4970} {"train_loss": -7.212267875671387, "global_step": 208771, "epoch": 4970} {"train_loss": -7.167376518249512, "global_step": 208772, "epoch": 4970} {"train_loss": -7.245939254760742, "global_step": 208773, "epoch": 4970} {"train_loss": -7.177712440490723, "global_step": 208774, "epoch": 4970} {"train_loss": -7.226861476898193, "global_step": 208775, "epoch": 4970} {"train_loss": -7.277613162994385, "global_step": 208776, "epoch": 4970} {"train_loss": -7.2373247146606445, "global_step": 208777, "epoch": 4970} {"train_loss": -7.1576828956604, "global_step": 208778, "epoch": 4970} {"train_loss": -7.334546089172363, "global_step": 208779, "epoch": 4970} {"train_loss": -7.2395148277282715, "global_step": 208780, "epoch": 4970} {"train_loss": -7.243253310521443, "global_step": 208781, "epoch": 4970, "val_loss": 69269.4453125} {"train_loss": -7.206239700317383, "global_step": 208782, "epoch": 4971} {"train_loss": -7.348598003387451, "global_step": 208783, "epoch": 4971} {"train_loss": -7.305197715759277, "global_step": 208784, "epoch": 4971} {"train_loss": -7.209140777587891, "global_step": 208785, "epoch": 4971} {"train_loss": -7.263756275177002, "global_step": 208786, "epoch": 4971} {"train_loss": -7.270161151885986, "global_step": 208787, "epoch": 4971} {"train_loss": -7.298740386962891, "global_step": 208788, "epoch": 4971} {"train_loss": -7.32122278213501, "global_step": 208789, "epoch": 4971} {"train_loss": -7.241721153259277, "global_step": 208790, "epoch": 4971} {"train_loss": -7.284488677978516, "global_step": 208791, "epoch": 4971} {"train_loss": -7.4070539474487305, "global_step": 208792, "epoch": 4971} {"train_loss": -7.321773529052734, "global_step": 208793, "epoch": 4971} {"train_loss": -7.204593658447266, "global_step": 208794, "epoch": 4971} {"train_loss": -7.423374176025391, "global_step": 208795, "epoch": 4971} {"train_loss": -7.39483118057251, "global_step": 208796, "epoch": 4971} {"train_loss": -7.393695831298828, "global_step": 208797, "epoch": 4971} {"train_loss": -7.3649702072143555, "global_step": 208798, "epoch": 4971} {"train_loss": -7.387184143066406, "global_step": 208799, "epoch": 4971} {"train_loss": -7.298747539520264, "global_step": 208800, "epoch": 4971} {"train_loss": -7.321966171264648, "global_step": 208801, "epoch": 4971} {"train_loss": -7.380626201629639, "global_step": 208802, "epoch": 4971} {"train_loss": -7.36495304107666, "global_step": 208803, "epoch": 4971} {"train_loss": -7.297722816467285, "global_step": 208804, "epoch": 4971} {"train_loss": -7.350493431091309, "global_step": 208805, "epoch": 4971} {"train_loss": -7.355521202087402, "global_step": 208806, "epoch": 4971} {"train_loss": -7.306674003601074, "global_step": 208807, "epoch": 4971} {"train_loss": -7.375735282897949, "global_step": 208808, "epoch": 4971} {"train_loss": -7.293461799621582, "global_step": 208809, "epoch": 4971} {"train_loss": -7.414303779602051, "global_step": 208810, "epoch": 4971} {"train_loss": -7.382863998413086, "global_step": 208811, "epoch": 4971} {"train_loss": -7.391357898712158, "global_step": 208812, "epoch": 4971} {"train_loss": -7.400432586669922, "global_step": 208813, "epoch": 4971} {"train_loss": -7.353523254394531, "global_step": 208814, "epoch": 4971} {"train_loss": -7.416342258453369, "global_step": 208815, "epoch": 4971} {"train_loss": -7.352512359619141, "global_step": 208816, "epoch": 4971} {"train_loss": -7.397758483886719, "global_step": 208817, "epoch": 4971} {"train_loss": -7.324400424957275, "global_step": 208818, "epoch": 4971} {"train_loss": -7.3364362716674805, "global_step": 208819, "epoch": 4971} {"train_loss": -7.452017784118652, "global_step": 208820, "epoch": 4971} {"train_loss": -7.396226406097412, "global_step": 208821, "epoch": 4971} {"train_loss": -7.42405891418457, "global_step": 208822, "epoch": 4971} {"train_loss": -7.342039766765776, "global_step": 208823, "epoch": 4971, "val_loss": 69112.0546875} {"train_loss": -7.408591270446777, "global_step": 208824, "epoch": 4972} {"train_loss": -7.36346435546875, "global_step": 208825, "epoch": 4972} {"train_loss": -7.312788009643555, "global_step": 208826, "epoch": 4972} {"train_loss": -7.4398956298828125, "global_step": 208827, "epoch": 4972} {"train_loss": -7.366508483886719, "global_step": 208828, "epoch": 4972} {"train_loss": -7.38076114654541, "global_step": 208829, "epoch": 4972} {"train_loss": -7.3010029792785645, "global_step": 208830, "epoch": 4972} {"train_loss": -7.329019069671631, "global_step": 208831, "epoch": 4972} {"train_loss": -7.393576622009277, "global_step": 208832, "epoch": 4972} {"train_loss": -7.386256694793701, "global_step": 208833, "epoch": 4972} {"train_loss": -7.231572151184082, "global_step": 208834, "epoch": 4972} {"train_loss": -7.302950859069824, "global_step": 208835, "epoch": 4972} {"train_loss": -7.382194995880127, "global_step": 208836, "epoch": 4972} {"train_loss": -7.387455940246582, "global_step": 208837, "epoch": 4972} {"train_loss": -7.441311836242676, "global_step": 208838, "epoch": 4972} {"train_loss": -7.29445219039917, "global_step": 208839, "epoch": 4972} {"train_loss": -7.192824840545654, "global_step": 208840, "epoch": 4972} {"train_loss": -7.254155158996582, "global_step": 208841, "epoch": 4972} {"train_loss": -7.0863189697265625, "global_step": 208842, "epoch": 4972} {"train_loss": -7.253095626831055, "global_step": 208843, "epoch": 4972} {"train_loss": -7.160074710845947, "global_step": 208844, "epoch": 4972} {"train_loss": -7.2442426681518555, "global_step": 208845, "epoch": 4972} {"train_loss": -7.176664352416992, "global_step": 208846, "epoch": 4972} {"train_loss": -7.039614200592041, "global_step": 208847, "epoch": 4972} {"train_loss": -7.249438762664795, "global_step": 208848, "epoch": 4972} {"train_loss": -7.29257869720459, "global_step": 208849, "epoch": 4972} {"train_loss": -7.134925842285156, "global_step": 208850, "epoch": 4972} {"train_loss": -7.270895004272461, "global_step": 208851, "epoch": 4972} {"train_loss": -7.188927173614502, "global_step": 208852, "epoch": 4972} {"train_loss": -7.135217189788818, "global_step": 208853, "epoch": 4972} {"train_loss": -7.274054527282715, "global_step": 208854, "epoch": 4972} {"train_loss": -7.263481616973877, "global_step": 208855, "epoch": 4972} {"train_loss": -7.274764537811279, "global_step": 208856, "epoch": 4972} {"train_loss": -7.282323837280273, "global_step": 208857, "epoch": 4972} {"train_loss": -7.23016881942749, "global_step": 208858, "epoch": 4972} {"train_loss": -7.158216953277588, "global_step": 208859, "epoch": 4972} {"train_loss": -7.292194366455078, "global_step": 208860, "epoch": 4972} {"train_loss": -7.197290897369385, "global_step": 208861, "epoch": 4972} {"train_loss": -7.207101821899414, "global_step": 208862, "epoch": 4972} {"train_loss": -7.173480987548828, "global_step": 208863, "epoch": 4972} {"train_loss": -7.281060218811035, "global_step": 208864, "epoch": 4972} {"train_loss": -7.26860785484314, "global_step": 208865, "epoch": 4972, "val_loss": 69243.890625} {"train_loss": -7.276003360748291, "global_step": 208866, "epoch": 4973} {"train_loss": -7.3037214279174805, "global_step": 208867, "epoch": 4973} {"train_loss": -7.339040756225586, "global_step": 208868, "epoch": 4973} {"train_loss": -7.345525741577148, "global_step": 208869, "epoch": 4973} {"train_loss": -7.316555976867676, "global_step": 208870, "epoch": 4973} {"train_loss": -7.328275203704834, "global_step": 208871, "epoch": 4973} {"train_loss": -7.40702486038208, "global_step": 208872, "epoch": 4973} {"train_loss": -7.368059158325195, "global_step": 208873, "epoch": 4973} {"train_loss": -7.288238525390625, "global_step": 208874, "epoch": 4973} {"train_loss": -7.39216423034668, "global_step": 208875, "epoch": 4973} {"train_loss": -7.306342124938965, "global_step": 208876, "epoch": 4973} {"train_loss": -7.352190971374512, "global_step": 208877, "epoch": 4973} {"train_loss": -7.261166572570801, "global_step": 208878, "epoch": 4973} {"train_loss": -7.285615921020508, "global_step": 208879, "epoch": 4973} {"train_loss": -7.355589866638184, "global_step": 208880, "epoch": 4973} {"train_loss": -7.296408653259277, "global_step": 208881, "epoch": 4973} {"train_loss": -7.426371097564697, "global_step": 208882, "epoch": 4973} {"train_loss": -7.359853267669678, "global_step": 208883, "epoch": 4973} {"train_loss": -7.425634384155273, "global_step": 208884, "epoch": 4973} {"train_loss": -7.423108100891113, "global_step": 208885, "epoch": 4973} {"train_loss": -7.277519702911377, "global_step": 208886, "epoch": 4973} {"train_loss": -7.337482929229736, "global_step": 208887, "epoch": 4973} {"train_loss": -7.352452278137207, "global_step": 208888, "epoch": 4973} {"train_loss": -7.264707088470459, "global_step": 208889, "epoch": 4973} {"train_loss": -7.272797584533691, "global_step": 208890, "epoch": 4973} {"train_loss": -7.253138542175293, "global_step": 208891, "epoch": 4973} {"train_loss": -7.401183128356934, "global_step": 208892, "epoch": 4973} {"train_loss": -7.231465816497803, "global_step": 208893, "epoch": 4973} {"train_loss": -7.354133129119873, "global_step": 208894, "epoch": 4973} {"train_loss": -7.468314170837402, "global_step": 208895, "epoch": 4973} {"train_loss": -7.239645957946777, "global_step": 208896, "epoch": 4973} {"train_loss": -7.322430610656738, "global_step": 208897, "epoch": 4973} {"train_loss": -7.298227787017822, "global_step": 208898, "epoch": 4973} {"train_loss": -7.286595344543457, "global_step": 208899, "epoch": 4973} {"train_loss": -7.280728816986084, "global_step": 208900, "epoch": 4973} {"train_loss": -7.273351669311523, "global_step": 208901, "epoch": 4973} {"train_loss": -7.295466899871826, "global_step": 208902, "epoch": 4973} {"train_loss": -7.383070945739746, "global_step": 208903, "epoch": 4973} {"train_loss": -7.188346862792969, "global_step": 208904, "epoch": 4973} {"train_loss": -7.182589054107666, "global_step": 208905, "epoch": 4973} {"train_loss": -7.138832092285156, "global_step": 208906, "epoch": 4973} {"train_loss": -7.316688753309704, "global_step": 208907, "epoch": 4973, "val_loss": 69249.7578125} {"train_loss": -7.332065582275391, "global_step": 208908, "epoch": 4974} {"train_loss": -7.269861698150635, "global_step": 208909, "epoch": 4974} {"train_loss": -7.255560874938965, "global_step": 208910, "epoch": 4974} {"train_loss": -7.1611785888671875, "global_step": 208911, "epoch": 4974} {"train_loss": -7.173244476318359, "global_step": 208912, "epoch": 4974} {"train_loss": -7.393181800842285, "global_step": 208913, "epoch": 4974} {"train_loss": -7.332963943481445, "global_step": 208914, "epoch": 4974} {"train_loss": -7.302999973297119, "global_step": 208915, "epoch": 4974} {"train_loss": -7.172881126403809, "global_step": 208916, "epoch": 4974} {"train_loss": -7.188789367675781, "global_step": 208917, "epoch": 4974} {"train_loss": -7.2055792808532715, "global_step": 208918, "epoch": 4974} {"train_loss": -7.250279903411865, "global_step": 208919, "epoch": 4974} {"train_loss": -7.271385669708252, "global_step": 208920, "epoch": 4974} {"train_loss": -7.245867729187012, "global_step": 208921, "epoch": 4974} {"train_loss": -7.273871898651123, "global_step": 208922, "epoch": 4974} {"train_loss": -7.184863567352295, "global_step": 208923, "epoch": 4974} {"train_loss": -7.243913650512695, "global_step": 208924, "epoch": 4974} {"train_loss": -7.2491044998168945, "global_step": 208925, "epoch": 4974} {"train_loss": -7.244283676147461, "global_step": 208926, "epoch": 4974} {"train_loss": -7.200010299682617, "global_step": 208927, "epoch": 4974} {"train_loss": -7.254979610443115, "global_step": 208928, "epoch": 4974} {"train_loss": -7.276331901550293, "global_step": 208929, "epoch": 4974} {"train_loss": -7.213046073913574, "global_step": 208930, "epoch": 4974} {"train_loss": -7.19144344329834, "global_step": 208931, "epoch": 4974} {"train_loss": -7.22903299331665, "global_step": 208932, "epoch": 4974} {"train_loss": -7.26909875869751, "global_step": 208933, "epoch": 4974} {"train_loss": -7.2163472175598145, "global_step": 208934, "epoch": 4974} {"train_loss": -7.294760227203369, "global_step": 208935, "epoch": 4974} {"train_loss": -7.418552398681641, "global_step": 208936, "epoch": 4974} {"train_loss": -7.204036712646484, "global_step": 208937, "epoch": 4974} {"train_loss": -7.336360931396484, "global_step": 208938, "epoch": 4974} {"train_loss": -7.447216033935547, "global_step": 208939, "epoch": 4974} {"train_loss": -7.233479976654053, "global_step": 208940, "epoch": 4974} {"train_loss": -7.328837871551514, "global_step": 208941, "epoch": 4974} {"train_loss": -7.281410217285156, "global_step": 208942, "epoch": 4974} {"train_loss": -7.296629905700684, "global_step": 208943, "epoch": 4974} {"train_loss": -7.307734489440918, "global_step": 208944, "epoch": 4974} {"train_loss": -7.415200233459473, "global_step": 208945, "epoch": 4974} {"train_loss": -7.3314361572265625, "global_step": 208946, "epoch": 4974} {"train_loss": -7.216597557067871, "global_step": 208947, "epoch": 4974} {"train_loss": -7.3946099281311035, "global_step": 208948, "epoch": 4974} {"train_loss": -7.273387352625529, "global_step": 208949, "epoch": 4974, "val_loss": 69192.03125} {"train_loss": -7.232301712036133, "global_step": 208950, "epoch": 4975} {"train_loss": -7.394708156585693, "global_step": 208951, "epoch": 4975} {"train_loss": -7.36983585357666, "global_step": 208952, "epoch": 4975} {"train_loss": -7.333732604980469, "global_step": 208953, "epoch": 4975} {"train_loss": -7.393824577331543, "global_step": 208954, "epoch": 4975} {"train_loss": -7.292923450469971, "global_step": 208955, "epoch": 4975} {"train_loss": -7.35280704498291, "global_step": 208956, "epoch": 4975} {"train_loss": -7.341645240783691, "global_step": 208957, "epoch": 4975} {"train_loss": -7.317782402038574, "global_step": 208958, "epoch": 4975} {"train_loss": -7.339566230773926, "global_step": 208959, "epoch": 4975} {"train_loss": -7.405763149261475, "global_step": 208960, "epoch": 4975} {"train_loss": -7.346911430358887, "global_step": 208961, "epoch": 4975} {"train_loss": -7.522118091583252, "global_step": 208962, "epoch": 4975} {"train_loss": -7.346468925476074, "global_step": 208963, "epoch": 4975} {"train_loss": -7.310701847076416, "global_step": 208964, "epoch": 4975} {"train_loss": -7.322046279907227, "global_step": 208965, "epoch": 4975} {"train_loss": -7.434720039367676, "global_step": 208966, "epoch": 4975} {"train_loss": -7.397373676300049, "global_step": 208967, "epoch": 4975} {"train_loss": -7.276153087615967, "global_step": 208968, "epoch": 4975} {"train_loss": -7.337920188903809, "global_step": 208969, "epoch": 4975} {"train_loss": -7.257656097412109, "global_step": 208970, "epoch": 4975} {"train_loss": -7.228041172027588, "global_step": 208971, "epoch": 4975} {"train_loss": -7.424801349639893, "global_step": 208972, "epoch": 4975} {"train_loss": -7.259437561035156, "global_step": 208973, "epoch": 4975} {"train_loss": -7.222232818603516, "global_step": 208974, "epoch": 4975} {"train_loss": -7.284860610961914, "global_step": 208975, "epoch": 4975} {"train_loss": -7.244645118713379, "global_step": 208976, "epoch": 4975} {"train_loss": -7.241697311401367, "global_step": 208977, "epoch": 4975} {"train_loss": -7.271533489227295, "global_step": 208978, "epoch": 4975} {"train_loss": -7.395030975341797, "global_step": 208979, "epoch": 4975} {"train_loss": -7.211185932159424, "global_step": 208980, "epoch": 4975} {"train_loss": -7.29039192199707, "global_step": 208981, "epoch": 4975} {"train_loss": -7.287632942199707, "global_step": 208982, "epoch": 4975} {"train_loss": -7.311887741088867, "global_step": 208983, "epoch": 4975} {"train_loss": -7.248160362243652, "global_step": 208984, "epoch": 4975} {"train_loss": -7.158858776092529, "global_step": 208985, "epoch": 4975} {"train_loss": -7.29695987701416, "global_step": 208986, "epoch": 4975} {"train_loss": -7.254618167877197, "global_step": 208987, "epoch": 4975} {"train_loss": -7.210057258605957, "global_step": 208988, "epoch": 4975} {"train_loss": -7.312144756317139, "global_step": 208989, "epoch": 4975} {"train_loss": -7.250638961791992, "global_step": 208990, "epoch": 4975} {"train_loss": -7.3119137060074575, "global_step": 208991, "epoch": 4975, "val_loss": 69361.6328125} {"train_loss": -7.327028751373291, "global_step": 208992, "epoch": 4976} {"train_loss": -7.259133815765381, "global_step": 208993, "epoch": 4976} {"train_loss": -7.2280731201171875, "global_step": 208994, "epoch": 4976} {"train_loss": -7.179966926574707, "global_step": 208995, "epoch": 4976} {"train_loss": -7.195395469665527, "global_step": 208996, "epoch": 4976} {"train_loss": -7.133964538574219, "global_step": 208997, "epoch": 4976} {"train_loss": -7.26418924331665, "global_step": 208998, "epoch": 4976} {"train_loss": -7.107542991638184, "global_step": 208999, "epoch": 4976} {"train_loss": -7.22136116027832, "global_step": 209000, "epoch": 4976} {"train_loss": -7.207830905914307, "global_step": 209001, "epoch": 4976} {"train_loss": -7.1183085441589355, "global_step": 209002, "epoch": 4976} {"train_loss": -7.220864295959473, "global_step": 209003, "epoch": 4976} {"train_loss": -7.138668060302734, "global_step": 209004, "epoch": 4976} {"train_loss": -7.057066440582275, "global_step": 209005, "epoch": 4976} {"train_loss": -7.164646148681641, "global_step": 209006, "epoch": 4976} {"train_loss": -7.139534950256348, "global_step": 209007, "epoch": 4976} {"train_loss": -7.230561256408691, "global_step": 209008, "epoch": 4976} {"train_loss": -7.146321773529053, "global_step": 209009, "epoch": 4976} {"train_loss": -7.152337551116943, "global_step": 209010, "epoch": 4976} {"train_loss": -7.227005958557129, "global_step": 209011, "epoch": 4976} {"train_loss": -7.209954261779785, "global_step": 209012, "epoch": 4976} {"train_loss": -7.275205612182617, "global_step": 209013, "epoch": 4976} {"train_loss": -7.284317493438721, "global_step": 209014, "epoch": 4976} {"train_loss": -7.268988609313965, "global_step": 209015, "epoch": 4976} {"train_loss": -7.28908634185791, "global_step": 209016, "epoch": 4976} {"train_loss": -7.185771942138672, "global_step": 209017, "epoch": 4976} {"train_loss": -7.300690650939941, "global_step": 209018, "epoch": 4976} {"train_loss": -7.257380485534668, "global_step": 209019, "epoch": 4976} {"train_loss": -7.210849761962891, "global_step": 209020, "epoch": 4976} {"train_loss": -7.264967918395996, "global_step": 209021, "epoch": 4976} {"train_loss": -7.167167663574219, "global_step": 209022, "epoch": 4976} {"train_loss": -7.278045177459717, "global_step": 209023, "epoch": 4976} {"train_loss": -7.271071910858154, "global_step": 209024, "epoch": 4976} {"train_loss": -7.139532089233398, "global_step": 209025, "epoch": 4976} {"train_loss": -7.264245510101318, "global_step": 209026, "epoch": 4976} {"train_loss": -7.441034317016602, "global_step": 209027, "epoch": 4976} {"train_loss": -7.201484680175781, "global_step": 209028, "epoch": 4976} {"train_loss": -7.224205017089844, "global_step": 209029, "epoch": 4976} {"train_loss": -7.035798072814941, "global_step": 209030, "epoch": 4976} {"train_loss": -7.278049468994141, "global_step": 209031, "epoch": 4976} {"train_loss": -7.33801794052124, "global_step": 209032, "epoch": 4976} {"train_loss": -7.21852385430109, "global_step": 209033, "epoch": 4976, "val_loss": 69085.4921875} {"train_loss": -7.290910243988037, "global_step": 209034, "epoch": 4977} {"train_loss": -7.285281658172607, "global_step": 209035, "epoch": 4977} {"train_loss": -7.290483474731445, "global_step": 209036, "epoch": 4977} {"train_loss": -7.3043341636657715, "global_step": 209037, "epoch": 4977} {"train_loss": -7.299895763397217, "global_step": 209038, "epoch": 4977} {"train_loss": -7.335938930511475, "global_step": 209039, "epoch": 4977} {"train_loss": -7.230900764465332, "global_step": 209040, "epoch": 4977} {"train_loss": -7.218269348144531, "global_step": 209041, "epoch": 4977} {"train_loss": -7.378304481506348, "global_step": 209042, "epoch": 4977} {"train_loss": -7.313999176025391, "global_step": 209043, "epoch": 4977} {"train_loss": -7.404807090759277, "global_step": 209044, "epoch": 4977} {"train_loss": -7.343973159790039, "global_step": 209045, "epoch": 4977} {"train_loss": -7.266536712646484, "global_step": 209046, "epoch": 4977} {"train_loss": -7.303741455078125, "global_step": 209047, "epoch": 4977} {"train_loss": -7.26546573638916, "global_step": 209048, "epoch": 4977} {"train_loss": -7.085905075073242, "global_step": 209049, "epoch": 4977} {"train_loss": -7.408501625061035, "global_step": 209050, "epoch": 4977} {"train_loss": -7.170360565185547, "global_step": 209051, "epoch": 4977} {"train_loss": -7.212198257446289, "global_step": 209052, "epoch": 4977} {"train_loss": -7.2663044929504395, "global_step": 209053, "epoch": 4977} {"train_loss": -7.060651779174805, "global_step": 209054, "epoch": 4977} {"train_loss": -7.158662796020508, "global_step": 209055, "epoch": 4977} {"train_loss": -7.239602088928223, "global_step": 209056, "epoch": 4977} {"train_loss": -7.029918670654297, "global_step": 209057, "epoch": 4977} {"train_loss": -7.225288391113281, "global_step": 209058, "epoch": 4977} {"train_loss": -7.188313961029053, "global_step": 209059, "epoch": 4977} {"train_loss": -7.1866374015808105, "global_step": 209060, "epoch": 4977} {"train_loss": -7.11468505859375, "global_step": 209061, "epoch": 4977} {"train_loss": -7.227207660675049, "global_step": 209062, "epoch": 4977} {"train_loss": -7.180190563201904, "global_step": 209063, "epoch": 4977} {"train_loss": -7.063559532165527, "global_step": 209064, "epoch": 4977} {"train_loss": -7.177230358123779, "global_step": 209065, "epoch": 4977} {"train_loss": -6.854602813720703, "global_step": 209066, "epoch": 4977} {"train_loss": -7.091233253479004, "global_step": 209067, "epoch": 4977} {"train_loss": -7.109675407409668, "global_step": 209068, "epoch": 4977} {"train_loss": -7.2280592918396, "global_step": 209069, "epoch": 4977} {"train_loss": -7.171433448791504, "global_step": 209070, "epoch": 4977} {"train_loss": -7.1950178146362305, "global_step": 209071, "epoch": 4977} {"train_loss": -7.169254302978516, "global_step": 209072, "epoch": 4977} {"train_loss": -7.345329284667969, "global_step": 209073, "epoch": 4977} {"train_loss": -7.222821235656738, "global_step": 209074, "epoch": 4977} {"train_loss": -7.215545870008922, "global_step": 209075, "epoch": 4977, "val_loss": 69144.6171875} {"train_loss": -7.1862993240356445, "global_step": 209076, "epoch": 4978} {"train_loss": -7.224957466125488, "global_step": 209077, "epoch": 4978} {"train_loss": -7.26053524017334, "global_step": 209078, "epoch": 4978} {"train_loss": -7.1243791580200195, "global_step": 209079, "epoch": 4978} {"train_loss": -7.223378658294678, "global_step": 209080, "epoch": 4978} {"train_loss": -7.299198150634766, "global_step": 209081, "epoch": 4978} {"train_loss": -7.227200031280518, "global_step": 209082, "epoch": 4978} {"train_loss": -7.239184379577637, "global_step": 209083, "epoch": 4978} {"train_loss": -7.290653228759766, "global_step": 209084, "epoch": 4978} {"train_loss": -7.3202104568481445, "global_step": 209085, "epoch": 4978} {"train_loss": -7.2784318923950195, "global_step": 209086, "epoch": 4978} {"train_loss": -7.30121374130249, "global_step": 209087, "epoch": 4978} {"train_loss": -7.35247278213501, "global_step": 209088, "epoch": 4978} {"train_loss": -7.192676067352295, "global_step": 209089, "epoch": 4978} {"train_loss": -7.185795783996582, "global_step": 209090, "epoch": 4978} {"train_loss": -7.250251770019531, "global_step": 209091, "epoch": 4978} {"train_loss": -7.259992599487305, "global_step": 209092, "epoch": 4978} {"train_loss": -7.262425422668457, "global_step": 209093, "epoch": 4978} {"train_loss": -7.268455505371094, "global_step": 209094, "epoch": 4978} {"train_loss": -7.227296352386475, "global_step": 209095, "epoch": 4978} {"train_loss": -7.245835781097412, "global_step": 209096, "epoch": 4978} {"train_loss": -7.212984085083008, "global_step": 209097, "epoch": 4978} {"train_loss": -7.325678825378418, "global_step": 209098, "epoch": 4978} {"train_loss": -7.109086513519287, "global_step": 209099, "epoch": 4978} {"train_loss": -7.198506832122803, "global_step": 209100, "epoch": 4978} {"train_loss": -7.216907501220703, "global_step": 209101, "epoch": 4978} {"train_loss": -7.326188564300537, "global_step": 209102, "epoch": 4978} {"train_loss": -7.33614444732666, "global_step": 209103, "epoch": 4978} {"train_loss": -7.337311744689941, "global_step": 209104, "epoch": 4978} {"train_loss": -7.30074405670166, "global_step": 209105, "epoch": 4978} {"train_loss": -7.34525203704834, "global_step": 209106, "epoch": 4978} {"train_loss": -7.276264190673828, "global_step": 209107, "epoch": 4978} {"train_loss": -7.361882209777832, "global_step": 209108, "epoch": 4978} {"train_loss": -7.308276653289795, "global_step": 209109, "epoch": 4978} {"train_loss": -7.36472225189209, "global_step": 209110, "epoch": 4978} {"train_loss": -7.164786338806152, "global_step": 209111, "epoch": 4978} {"train_loss": -7.389585494995117, "global_step": 209112, "epoch": 4978} {"train_loss": -7.232800006866455, "global_step": 209113, "epoch": 4978} {"train_loss": -7.2462286949157715, "global_step": 209114, "epoch": 4978} {"train_loss": -7.410192489624023, "global_step": 209115, "epoch": 4978} {"train_loss": -7.243478775024414, "global_step": 209116, "epoch": 4978} {"train_loss": -7.264129729498, "global_step": 209117, "epoch": 4978, "val_loss": 69277.7265625} {"train_loss": -7.233209609985352, "global_step": 209118, "epoch": 4979} {"train_loss": -7.034273624420166, "global_step": 209119, "epoch": 4979} {"train_loss": -7.276646614074707, "global_step": 209120, "epoch": 4979} {"train_loss": -7.204744338989258, "global_step": 209121, "epoch": 4979} {"train_loss": -7.09529972076416, "global_step": 209122, "epoch": 4979} {"train_loss": -7.290262699127197, "global_step": 209123, "epoch": 4979} {"train_loss": -7.2264485359191895, "global_step": 209124, "epoch": 4979} {"train_loss": -7.285760402679443, "global_step": 209125, "epoch": 4979} {"train_loss": -7.192078113555908, "global_step": 209126, "epoch": 4979} {"train_loss": -7.340175151824951, "global_step": 209127, "epoch": 4979} {"train_loss": -7.284633636474609, "global_step": 209128, "epoch": 4979} {"train_loss": -7.178394317626953, "global_step": 209129, "epoch": 4979} {"train_loss": -7.286904335021973, "global_step": 209130, "epoch": 4979} {"train_loss": -7.307679176330566, "global_step": 209131, "epoch": 4979} {"train_loss": -7.322378635406494, "global_step": 209132, "epoch": 4979} {"train_loss": -7.249547958374023, "global_step": 209133, "epoch": 4979} {"train_loss": -7.168615818023682, "global_step": 209134, "epoch": 4979} {"train_loss": -7.281529426574707, "global_step": 209135, "epoch": 4979} {"train_loss": -7.322697639465332, "global_step": 209136, "epoch": 4979} {"train_loss": -7.331395149230957, "global_step": 209137, "epoch": 4979} {"train_loss": -7.27313232421875, "global_step": 209138, "epoch": 4979} {"train_loss": -7.294157028198242, "global_step": 209139, "epoch": 4979} {"train_loss": -7.24054479598999, "global_step": 209140, "epoch": 4979} {"train_loss": -7.328275680541992, "global_step": 209141, "epoch": 4979} {"train_loss": -7.305633544921875, "global_step": 209142, "epoch": 4979} {"train_loss": -7.268810272216797, "global_step": 209143, "epoch": 4979} {"train_loss": -7.2447404861450195, "global_step": 209144, "epoch": 4979} {"train_loss": -7.238702297210693, "global_step": 209145, "epoch": 4979} {"train_loss": -7.208636283874512, "global_step": 209146, "epoch": 4979} {"train_loss": -7.2836785316467285, "global_step": 209147, "epoch": 4979} {"train_loss": -7.279324054718018, "global_step": 209148, "epoch": 4979} {"train_loss": -7.322543144226074, "global_step": 209149, "epoch": 4979} {"train_loss": -7.331916809082031, "global_step": 209150, "epoch": 4979} {"train_loss": -7.252442359924316, "global_step": 209151, "epoch": 4979} {"train_loss": -7.3704142570495605, "global_step": 209152, "epoch": 4979} {"train_loss": -7.245543479919434, "global_step": 209153, "epoch": 4979} {"train_loss": -7.129955291748047, "global_step": 209154, "epoch": 4979} {"train_loss": -7.1732177734375, "global_step": 209155, "epoch": 4979} {"train_loss": -7.32481050491333, "global_step": 209156, "epoch": 4979} {"train_loss": -7.182294845581055, "global_step": 209157, "epoch": 4979} {"train_loss": -7.261603355407715, "global_step": 209158, "epoch": 4979} {"train_loss": -7.253386588323684, "global_step": 209159, "epoch": 4979, "val_loss": 69358.109375} {"train_loss": -7.063601493835449, "global_step": 209160, "epoch": 4980} {"train_loss": -7.262632369995117, "global_step": 209161, "epoch": 4980} {"train_loss": -7.256765365600586, "global_step": 209162, "epoch": 4980} {"train_loss": -7.2506303787231445, "global_step": 209163, "epoch": 4980} {"train_loss": -7.2952165603637695, "global_step": 209164, "epoch": 4980} {"train_loss": -7.1386189460754395, "global_step": 209165, "epoch": 4980} {"train_loss": -7.2874860763549805, "global_step": 209166, "epoch": 4980} {"train_loss": -7.285576343536377, "global_step": 209167, "epoch": 4980} {"train_loss": -7.374863624572754, "global_step": 209168, "epoch": 4980} {"train_loss": -7.324471950531006, "global_step": 209169, "epoch": 4980} {"train_loss": -7.309549331665039, "global_step": 209170, "epoch": 4980} {"train_loss": -7.22346305847168, "global_step": 209171, "epoch": 4980} {"train_loss": -7.3755340576171875, "global_step": 209172, "epoch": 4980} {"train_loss": -7.350370407104492, "global_step": 209173, "epoch": 4980} {"train_loss": -7.3498640060424805, "global_step": 209174, "epoch": 4980} {"train_loss": -7.239823341369629, "global_step": 209175, "epoch": 4980} {"train_loss": -7.28622579574585, "global_step": 209176, "epoch": 4980} {"train_loss": -7.252564430236816, "global_step": 209177, "epoch": 4980} {"train_loss": -7.314626693725586, "global_step": 209178, "epoch": 4980} {"train_loss": -7.262167453765869, "global_step": 209179, "epoch": 4980} {"train_loss": -7.24045991897583, "global_step": 209180, "epoch": 4980} {"train_loss": -7.354344844818115, "global_step": 209181, "epoch": 4980} {"train_loss": -7.303805351257324, "global_step": 209182, "epoch": 4980} {"train_loss": -7.341301441192627, "global_step": 209183, "epoch": 4980} {"train_loss": -7.205051898956299, "global_step": 209184, "epoch": 4980} {"train_loss": -7.3985137939453125, "global_step": 209185, "epoch": 4980} {"train_loss": -7.338616847991943, "global_step": 209186, "epoch": 4980} {"train_loss": -7.263236999511719, "global_step": 209187, "epoch": 4980} {"train_loss": -7.367382049560547, "global_step": 209188, "epoch": 4980} {"train_loss": -7.258327007293701, "global_step": 209189, "epoch": 4980} {"train_loss": -7.249380111694336, "global_step": 209190, "epoch": 4980} {"train_loss": -7.275718688964844, "global_step": 209191, "epoch": 4980} {"train_loss": -7.267171859741211, "global_step": 209192, "epoch": 4980} {"train_loss": -7.147797584533691, "global_step": 209193, "epoch": 4980} {"train_loss": -7.136331558227539, "global_step": 209194, "epoch": 4980} {"train_loss": -7.419472694396973, "global_step": 209195, "epoch": 4980} {"train_loss": -7.262754440307617, "global_step": 209196, "epoch": 4980} {"train_loss": -7.261615753173828, "global_step": 209197, "epoch": 4980} {"train_loss": -7.278520584106445, "global_step": 209198, "epoch": 4980} {"train_loss": -7.303678512573242, "global_step": 209199, "epoch": 4980} {"train_loss": -7.128042221069336, "global_step": 209200, "epoch": 4980} {"train_loss": -7.277539503006708, "global_step": 209201, "epoch": 4980, "val_loss": 69172.3515625} {"train_loss": -7.249013423919678, "global_step": 209202, "epoch": 4981} {"train_loss": -7.228499412536621, "global_step": 209203, "epoch": 4981} {"train_loss": -7.3389434814453125, "global_step": 209204, "epoch": 4981} {"train_loss": -7.381430625915527, "global_step": 209205, "epoch": 4981} {"train_loss": -7.1502299308776855, "global_step": 209206, "epoch": 4981} {"train_loss": -7.443020820617676, "global_step": 209207, "epoch": 4981} {"train_loss": -7.09381628036499, "global_step": 209208, "epoch": 4981} {"train_loss": -7.216233253479004, "global_step": 209209, "epoch": 4981} {"train_loss": -7.344202995300293, "global_step": 209210, "epoch": 4981} {"train_loss": -7.455353260040283, "global_step": 209211, "epoch": 4981} {"train_loss": -7.294551849365234, "global_step": 209212, "epoch": 4981} {"train_loss": -7.3268656730651855, "global_step": 209213, "epoch": 4981} {"train_loss": -7.285729885101318, "global_step": 209214, "epoch": 4981} {"train_loss": -7.380182266235352, "global_step": 209215, "epoch": 4981} {"train_loss": -7.3666300773620605, "global_step": 209216, "epoch": 4981} {"train_loss": -7.402032852172852, "global_step": 209217, "epoch": 4981} {"train_loss": -7.251687049865723, "global_step": 209218, "epoch": 4981} {"train_loss": -7.361843109130859, "global_step": 209219, "epoch": 4981} {"train_loss": -7.218532562255859, "global_step": 209220, "epoch": 4981} {"train_loss": -7.369446754455566, "global_step": 209221, "epoch": 4981} {"train_loss": -7.462698936462402, "global_step": 209222, "epoch": 4981} {"train_loss": -7.2866315841674805, "global_step": 209223, "epoch": 4981} {"train_loss": -7.295439720153809, "global_step": 209224, "epoch": 4981} {"train_loss": -7.408074378967285, "global_step": 209225, "epoch": 4981} {"train_loss": -7.336132526397705, "global_step": 209226, "epoch": 4981} {"train_loss": -7.366201400756836, "global_step": 209227, "epoch": 4981} {"train_loss": -7.4495086669921875, "global_step": 209228, "epoch": 4981} {"train_loss": -7.3805742263793945, "global_step": 209229, "epoch": 4981} {"train_loss": -7.518472671508789, "global_step": 209230, "epoch": 4981} {"train_loss": -7.420904159545898, "global_step": 209231, "epoch": 4981} {"train_loss": -7.357419967651367, "global_step": 209232, "epoch": 4981} {"train_loss": -7.4073805809021, "global_step": 209233, "epoch": 4981} {"train_loss": -7.2863054275512695, "global_step": 209234, "epoch": 4981} {"train_loss": -7.334319114685059, "global_step": 209235, "epoch": 4981} {"train_loss": -7.248874664306641, "global_step": 209236, "epoch": 4981} {"train_loss": -7.361285209655762, "global_step": 209237, "epoch": 4981} {"train_loss": -7.323243141174316, "global_step": 209238, "epoch": 4981} {"train_loss": -7.267162799835205, "global_step": 209239, "epoch": 4981} {"train_loss": -7.330582141876221, "global_step": 209240, "epoch": 4981} {"train_loss": -7.278467178344727, "global_step": 209241, "epoch": 4981} {"train_loss": -7.305346488952637, "global_step": 209242, "epoch": 4981} {"train_loss": -7.330808185395741, "global_step": 209243, "epoch": 4981, "val_loss": 69304.2421875} {"train_loss": -7.335968017578125, "global_step": 209244, "epoch": 4982} {"train_loss": -7.238584995269775, "global_step": 209245, "epoch": 4982} {"train_loss": -7.3426127433776855, "global_step": 209246, "epoch": 4982} {"train_loss": -7.262165546417236, "global_step": 209247, "epoch": 4982} {"train_loss": -7.1762189865112305, "global_step": 209248, "epoch": 4982} {"train_loss": -7.355592727661133, "global_step": 209249, "epoch": 4982} {"train_loss": -7.258969783782959, "global_step": 209250, "epoch": 4982} {"train_loss": -7.246522903442383, "global_step": 209251, "epoch": 4982} {"train_loss": -7.222550868988037, "global_step": 209252, "epoch": 4982} {"train_loss": -7.188198566436768, "global_step": 209253, "epoch": 4982} {"train_loss": -7.290713787078857, "global_step": 209254, "epoch": 4982} {"train_loss": -7.192293643951416, "global_step": 209255, "epoch": 4982} {"train_loss": -7.16754150390625, "global_step": 209256, "epoch": 4982} {"train_loss": -7.255155563354492, "global_step": 209257, "epoch": 4982} {"train_loss": -7.244210243225098, "global_step": 209258, "epoch": 4982} {"train_loss": -7.312471866607666, "global_step": 209259, "epoch": 4982} {"train_loss": -7.304120063781738, "global_step": 209260, "epoch": 4982} {"train_loss": -7.325672149658203, "global_step": 209261, "epoch": 4982} {"train_loss": -7.320718765258789, "global_step": 209262, "epoch": 4982} {"train_loss": -7.324594497680664, "global_step": 209263, "epoch": 4982} {"train_loss": -7.247076511383057, "global_step": 209264, "epoch": 4982} {"train_loss": -7.356661319732666, "global_step": 209265, "epoch": 4982} {"train_loss": -7.309141635894775, "global_step": 209266, "epoch": 4982} {"train_loss": -7.290543556213379, "global_step": 209267, "epoch": 4982} {"train_loss": -7.313436508178711, "global_step": 209268, "epoch": 4982} {"train_loss": -7.2630109786987305, "global_step": 209269, "epoch": 4982} {"train_loss": -7.235872268676758, "global_step": 209270, "epoch": 4982} {"train_loss": -7.463728904724121, "global_step": 209271, "epoch": 4982} {"train_loss": -7.331603527069092, "global_step": 209272, "epoch": 4982} {"train_loss": -7.354497909545898, "global_step": 209273, "epoch": 4982} {"train_loss": -7.312902450561523, "global_step": 209274, "epoch": 4982} {"train_loss": -7.417374134063721, "global_step": 209275, "epoch": 4982} {"train_loss": -7.426675796508789, "global_step": 209276, "epoch": 4982} {"train_loss": -7.21967887878418, "global_step": 209277, "epoch": 4982} {"train_loss": -7.391910552978516, "global_step": 209278, "epoch": 4982} {"train_loss": -7.407882213592529, "global_step": 209279, "epoch": 4982} {"train_loss": -7.336940765380859, "global_step": 209280, "epoch": 4982} {"train_loss": -7.293210983276367, "global_step": 209281, "epoch": 4982} {"train_loss": -7.403259754180908, "global_step": 209282, "epoch": 4982} {"train_loss": -7.223085403442383, "global_step": 209283, "epoch": 4982} {"train_loss": -7.2587995529174805, "global_step": 209284, "epoch": 4982} {"train_loss": -7.299556130454654, "global_step": 209285, "epoch": 4982, "val_loss": 69180.7890625} {"train_loss": -7.377772808074951, "global_step": 209286, "epoch": 4983} {"train_loss": -7.249988555908203, "global_step": 209287, "epoch": 4983} {"train_loss": -7.345790863037109, "global_step": 209288, "epoch": 4983} {"train_loss": -7.320169448852539, "global_step": 209289, "epoch": 4983} {"train_loss": -7.287029266357422, "global_step": 209290, "epoch": 4983} {"train_loss": -7.291626930236816, "global_step": 209291, "epoch": 4983} {"train_loss": -7.34128475189209, "global_step": 209292, "epoch": 4983} {"train_loss": -7.367177486419678, "global_step": 209293, "epoch": 4983} {"train_loss": -7.233213424682617, "global_step": 209294, "epoch": 4983} {"train_loss": -7.24824333190918, "global_step": 209295, "epoch": 4983} {"train_loss": -7.348752975463867, "global_step": 209296, "epoch": 4983} {"train_loss": -7.369309425354004, "global_step": 209297, "epoch": 4983} {"train_loss": -7.259494781494141, "global_step": 209298, "epoch": 4983} {"train_loss": -7.354090690612793, "global_step": 209299, "epoch": 4983} {"train_loss": -7.29948616027832, "global_step": 209300, "epoch": 4983} {"train_loss": -7.284639358520508, "global_step": 209301, "epoch": 4983} {"train_loss": -7.359577178955078, "global_step": 209302, "epoch": 4983} {"train_loss": -7.235735893249512, "global_step": 209303, "epoch": 4983} {"train_loss": -7.279497146606445, "global_step": 209304, "epoch": 4983} {"train_loss": -7.355082988739014, "global_step": 209305, "epoch": 4983} {"train_loss": -7.278072357177734, "global_step": 209306, "epoch": 4983} {"train_loss": -7.2216386795043945, "global_step": 209307, "epoch": 4983} {"train_loss": -7.312216281890869, "global_step": 209308, "epoch": 4983} {"train_loss": -7.372164726257324, "global_step": 209309, "epoch": 4983} {"train_loss": -7.219494819641113, "global_step": 209310, "epoch": 4983} {"train_loss": -7.432590961456299, "global_step": 209311, "epoch": 4983} {"train_loss": -7.232169151306152, "global_step": 209312, "epoch": 4983} {"train_loss": -7.238680839538574, "global_step": 209313, "epoch": 4983} {"train_loss": -7.341597080230713, "global_step": 209314, "epoch": 4983} {"train_loss": -7.272818565368652, "global_step": 209315, "epoch": 4983} {"train_loss": -7.339789390563965, "global_step": 209316, "epoch": 4983} {"train_loss": -7.263509750366211, "global_step": 209317, "epoch": 4983} {"train_loss": -7.343210220336914, "global_step": 209318, "epoch": 4983} {"train_loss": -7.210269927978516, "global_step": 209319, "epoch": 4983} {"train_loss": -7.248532295227051, "global_step": 209320, "epoch": 4983} {"train_loss": -7.33349609375, "global_step": 209321, "epoch": 4983} {"train_loss": -7.248243808746338, "global_step": 209322, "epoch": 4983} {"train_loss": -7.11653995513916, "global_step": 209323, "epoch": 4983} {"train_loss": -7.31069278717041, "global_step": 209324, "epoch": 4983} {"train_loss": -7.435699462890625, "global_step": 209325, "epoch": 4983} {"train_loss": -7.3285417556762695, "global_step": 209326, "epoch": 4983} {"train_loss": -7.302605299722581, "global_step": 209327, "epoch": 4983, "val_loss": 69257.859375} {"train_loss": -7.315838813781738, "global_step": 209328, "epoch": 4984} {"train_loss": -7.303500175476074, "global_step": 209329, "epoch": 4984} {"train_loss": -7.209160327911377, "global_step": 209330, "epoch": 4984} {"train_loss": -7.344205856323242, "global_step": 209331, "epoch": 4984} {"train_loss": -7.402705192565918, "global_step": 209332, "epoch": 4984} {"train_loss": -7.422515869140625, "global_step": 209333, "epoch": 4984} {"train_loss": -7.391389846801758, "global_step": 209334, "epoch": 4984} {"train_loss": -7.335160732269287, "global_step": 209335, "epoch": 4984} {"train_loss": -7.385632514953613, "global_step": 209336, "epoch": 4984} {"train_loss": -7.369215965270996, "global_step": 209337, "epoch": 4984} {"train_loss": -7.277990341186523, "global_step": 209338, "epoch": 4984} {"train_loss": -7.376870155334473, "global_step": 209339, "epoch": 4984} {"train_loss": -7.31032657623291, "global_step": 209340, "epoch": 4984} {"train_loss": -7.366612911224365, "global_step": 209341, "epoch": 4984} {"train_loss": -7.316441535949707, "global_step": 209342, "epoch": 4984} {"train_loss": -7.174040794372559, "global_step": 209343, "epoch": 4984} {"train_loss": -7.308096408843994, "global_step": 209344, "epoch": 4984} {"train_loss": -7.367318153381348, "global_step": 209345, "epoch": 4984} {"train_loss": -7.287944793701172, "global_step": 209346, "epoch": 4984} {"train_loss": -7.406824111938477, "global_step": 209347, "epoch": 4984} {"train_loss": -7.367635726928711, "global_step": 209348, "epoch": 4984} {"train_loss": -7.382208824157715, "global_step": 209349, "epoch": 4984} {"train_loss": -7.2564005851745605, "global_step": 209350, "epoch": 4984} {"train_loss": -7.216899871826172, "global_step": 209351, "epoch": 4984} {"train_loss": -7.2756123542785645, "global_step": 209352, "epoch": 4984} {"train_loss": -7.354616641998291, "global_step": 209353, "epoch": 4984} {"train_loss": -7.405513763427734, "global_step": 209354, "epoch": 4984} {"train_loss": -7.121224880218506, "global_step": 209355, "epoch": 4984} {"train_loss": -7.294494152069092, "global_step": 209356, "epoch": 4984} {"train_loss": -7.287435531616211, "global_step": 209357, "epoch": 4984} {"train_loss": -7.244431495666504, "global_step": 209358, "epoch": 4984} {"train_loss": -7.295327186584473, "global_step": 209359, "epoch": 4984} {"train_loss": -7.181243419647217, "global_step": 209360, "epoch": 4984} {"train_loss": -7.232624053955078, "global_step": 209361, "epoch": 4984} {"train_loss": -7.356505393981934, "global_step": 209362, "epoch": 4984} {"train_loss": -7.254915714263916, "global_step": 209363, "epoch": 4984} {"train_loss": -7.299450874328613, "global_step": 209364, "epoch": 4984} {"train_loss": -7.339013576507568, "global_step": 209365, "epoch": 4984} {"train_loss": -7.356987476348877, "global_step": 209366, "epoch": 4984} {"train_loss": -7.188002586364746, "global_step": 209367, "epoch": 4984} {"train_loss": -7.298952579498291, "global_step": 209368, "epoch": 4984} {"train_loss": -7.30920071828933, "global_step": 209369, "epoch": 4984, "val_loss": 69170.40625} {"train_loss": -7.167182445526123, "global_step": 209370, "epoch": 4985} {"train_loss": -7.386806488037109, "global_step": 209371, "epoch": 4985} {"train_loss": -7.311455726623535, "global_step": 209372, "epoch": 4985} {"train_loss": -7.343474864959717, "global_step": 209373, "epoch": 4985} {"train_loss": -7.3919453620910645, "global_step": 209374, "epoch": 4985} {"train_loss": -7.331243515014648, "global_step": 209375, "epoch": 4985} {"train_loss": -7.4500274658203125, "global_step": 209376, "epoch": 4985} {"train_loss": -7.359098434448242, "global_step": 209377, "epoch": 4985} {"train_loss": -7.280074119567871, "global_step": 209378, "epoch": 4985} {"train_loss": -7.3325653076171875, "global_step": 209379, "epoch": 4985} {"train_loss": -7.280694961547852, "global_step": 209380, "epoch": 4985} {"train_loss": -7.209511756896973, "global_step": 209381, "epoch": 4985} {"train_loss": -7.375234127044678, "global_step": 209382, "epoch": 4985} {"train_loss": -7.2542243003845215, "global_step": 209383, "epoch": 4985} {"train_loss": -7.164414405822754, "global_step": 209384, "epoch": 4985} {"train_loss": -7.247120380401611, "global_step": 209385, "epoch": 4985} {"train_loss": -7.238274574279785, "global_step": 209386, "epoch": 4985} {"train_loss": -7.25544548034668, "global_step": 209387, "epoch": 4985} {"train_loss": -7.140608787536621, "global_step": 209388, "epoch": 4985} {"train_loss": -7.270712852478027, "global_step": 209389, "epoch": 4985} {"train_loss": -7.11622428894043, "global_step": 209390, "epoch": 4985} {"train_loss": -7.24603271484375, "global_step": 209391, "epoch": 4985} {"train_loss": -7.224998950958252, "global_step": 209392, "epoch": 4985} {"train_loss": -7.076992034912109, "global_step": 209393, "epoch": 4985} {"train_loss": -7.255767822265625, "global_step": 209394, "epoch": 4985} {"train_loss": -7.194931983947754, "global_step": 209395, "epoch": 4985} {"train_loss": -7.203821182250977, "global_step": 209396, "epoch": 4985} {"train_loss": -7.335014343261719, "global_step": 209397, "epoch": 4985} {"train_loss": -7.067593574523926, "global_step": 209398, "epoch": 4985} {"train_loss": -7.210823059082031, "global_step": 209399, "epoch": 4985} {"train_loss": -6.978147029876709, "global_step": 209400, "epoch": 4985} {"train_loss": -7.295740127563477, "global_step": 209401, "epoch": 4985} {"train_loss": -7.064357280731201, "global_step": 209402, "epoch": 4985} {"train_loss": -7.134002685546875, "global_step": 209403, "epoch": 4985} {"train_loss": -7.207096099853516, "global_step": 209404, "epoch": 4985} {"train_loss": -7.113277912139893, "global_step": 209405, "epoch": 4985} {"train_loss": -7.066575050354004, "global_step": 209406, "epoch": 4985} {"train_loss": -6.991263389587402, "global_step": 209407, "epoch": 4985} {"train_loss": -7.017822265625, "global_step": 209408, "epoch": 4985} {"train_loss": -7.12993049621582, "global_step": 209409, "epoch": 4985} {"train_loss": -7.040825843811035, "global_step": 209410, "epoch": 4985} {"train_loss": -7.210631177538917, "global_step": 209411, "epoch": 4985, "val_loss": 69290.84375} {"train_loss": -7.234856128692627, "global_step": 209412, "epoch": 4986} {"train_loss": -7.063327312469482, "global_step": 209413, "epoch": 4986} {"train_loss": -7.065789222717285, "global_step": 209414, "epoch": 4986} {"train_loss": -7.273087501525879, "global_step": 209415, "epoch": 4986} {"train_loss": -7.119385719299316, "global_step": 209416, "epoch": 4986} {"train_loss": -7.19816255569458, "global_step": 209417, "epoch": 4986} {"train_loss": -7.234307289123535, "global_step": 209418, "epoch": 4986} {"train_loss": -7.140035629272461, "global_step": 209419, "epoch": 4986} {"train_loss": -7.079984664916992, "global_step": 209420, "epoch": 4986} {"train_loss": -7.152219772338867, "global_step": 209421, "epoch": 4986} {"train_loss": -7.131075859069824, "global_step": 209422, "epoch": 4986} {"train_loss": -7.209580421447754, "global_step": 209423, "epoch": 4986} {"train_loss": -7.2037458419799805, "global_step": 209424, "epoch": 4986} {"train_loss": -7.244724273681641, "global_step": 209425, "epoch": 4986} {"train_loss": -7.1492018699646, "global_step": 209426, "epoch": 4986} {"train_loss": -7.100617408752441, "global_step": 209427, "epoch": 4986} {"train_loss": -7.148016929626465, "global_step": 209428, "epoch": 4986} {"train_loss": -7.116231918334961, "global_step": 209429, "epoch": 4986} {"train_loss": -7.288391590118408, "global_step": 209430, "epoch": 4986} {"train_loss": -7.181488990783691, "global_step": 209431, "epoch": 4986} {"train_loss": -7.267005920410156, "global_step": 209432, "epoch": 4986} {"train_loss": -7.279443740844727, "global_step": 209433, "epoch": 4986} {"train_loss": -7.246065139770508, "global_step": 209434, "epoch": 4986} {"train_loss": -7.186521530151367, "global_step": 209435, "epoch": 4986} {"train_loss": -7.295035362243652, "global_step": 209436, "epoch": 4986} {"train_loss": -7.379290580749512, "global_step": 209437, "epoch": 4986} {"train_loss": -7.203612327575684, "global_step": 209438, "epoch": 4986} {"train_loss": -7.228797912597656, "global_step": 209439, "epoch": 4986} {"train_loss": -7.112433433532715, "global_step": 209440, "epoch": 4986} {"train_loss": -7.233245372772217, "global_step": 209441, "epoch": 4986} {"train_loss": -7.138861179351807, "global_step": 209442, "epoch": 4986} {"train_loss": -7.158524513244629, "global_step": 209443, "epoch": 4986} {"train_loss": -7.386104106903076, "global_step": 209444, "epoch": 4986} {"train_loss": -7.25202751159668, "global_step": 209445, "epoch": 4986} {"train_loss": -7.372289180755615, "global_step": 209446, "epoch": 4986} {"train_loss": -7.295670509338379, "global_step": 209447, "epoch": 4986} {"train_loss": -7.241314888000488, "global_step": 209448, "epoch": 4986} {"train_loss": -7.307575702667236, "global_step": 209449, "epoch": 4986} {"train_loss": -7.206782341003418, "global_step": 209450, "epoch": 4986} {"train_loss": -7.273689270019531, "global_step": 209451, "epoch": 4986} {"train_loss": -7.3821892738342285, "global_step": 209452, "epoch": 4986} {"train_loss": -7.214005345389957, "global_step": 209453, "epoch": 4986, "val_loss": 69090.5390625} {"train_loss": -7.41925573348999, "global_step": 209454, "epoch": 4987} {"train_loss": -7.436221599578857, "global_step": 209455, "epoch": 4987} {"train_loss": -7.346627712249756, "global_step": 209456, "epoch": 4987} {"train_loss": -7.371633052825928, "global_step": 209457, "epoch": 4987} {"train_loss": -7.348100185394287, "global_step": 209458, "epoch": 4987} {"train_loss": -7.366013526916504, "global_step": 209459, "epoch": 4987} {"train_loss": -7.401021480560303, "global_step": 209460, "epoch": 4987} {"train_loss": -7.331742286682129, "global_step": 209461, "epoch": 4987} {"train_loss": -7.370771408081055, "global_step": 209462, "epoch": 4987} {"train_loss": -7.339544296264648, "global_step": 209463, "epoch": 4987} {"train_loss": -7.22548770904541, "global_step": 209464, "epoch": 4987} {"train_loss": -7.266372203826904, "global_step": 209465, "epoch": 4987} {"train_loss": -7.28640604019165, "global_step": 209466, "epoch": 4987} {"train_loss": -7.295844078063965, "global_step": 209467, "epoch": 4987} {"train_loss": -7.345602989196777, "global_step": 209468, "epoch": 4987} {"train_loss": -7.276208400726318, "global_step": 209469, "epoch": 4987} {"train_loss": -7.385802268981934, "global_step": 209470, "epoch": 4987} {"train_loss": -7.341437816619873, "global_step": 209471, "epoch": 4987} {"train_loss": -7.228087425231934, "global_step": 209472, "epoch": 4987} {"train_loss": -7.37911319732666, "global_step": 209473, "epoch": 4987} {"train_loss": -7.286133766174316, "global_step": 209474, "epoch": 4987} {"train_loss": -7.260067939758301, "global_step": 209475, "epoch": 4987} {"train_loss": -7.377295017242432, "global_step": 209476, "epoch": 4987} {"train_loss": -7.307398796081543, "global_step": 209477, "epoch": 4987} {"train_loss": -7.292670726776123, "global_step": 209478, "epoch": 4987} {"train_loss": -7.287601470947266, "global_step": 209479, "epoch": 4987} {"train_loss": -7.313830375671387, "global_step": 209480, "epoch": 4987} {"train_loss": -7.417387962341309, "global_step": 209481, "epoch": 4987} {"train_loss": -7.193246841430664, "global_step": 209482, "epoch": 4987} {"train_loss": -7.169764518737793, "global_step": 209483, "epoch": 4987} {"train_loss": -7.222393035888672, "global_step": 209484, "epoch": 4987} {"train_loss": -7.193092346191406, "global_step": 209485, "epoch": 4987} {"train_loss": -7.33101749420166, "global_step": 209486, "epoch": 4987} {"train_loss": -7.156037330627441, "global_step": 209487, "epoch": 4987} {"train_loss": -7.378389358520508, "global_step": 209488, "epoch": 4987} {"train_loss": -7.304643630981445, "global_step": 209489, "epoch": 4987} {"train_loss": -7.325498580932617, "global_step": 209490, "epoch": 4987} {"train_loss": -7.2280731201171875, "global_step": 209491, "epoch": 4987} {"train_loss": -7.2421770095825195, "global_step": 209492, "epoch": 4987} {"train_loss": -7.358121395111084, "global_step": 209493, "epoch": 4987} {"train_loss": -7.263672351837158, "global_step": 209494, "epoch": 4987} {"train_loss": -7.309657357987904, "global_step": 209495, "epoch": 4987, "val_loss": 69153.46875} {"train_loss": -7.304098129272461, "global_step": 209496, "epoch": 4988} {"train_loss": -7.408714771270752, "global_step": 209497, "epoch": 4988} {"train_loss": -7.368605613708496, "global_step": 209498, "epoch": 4988} {"train_loss": -7.319545745849609, "global_step": 209499, "epoch": 4988} {"train_loss": -7.3290863037109375, "global_step": 209500, "epoch": 4988} {"train_loss": -7.291159629821777, "global_step": 209501, "epoch": 4988} {"train_loss": -7.35532283782959, "global_step": 209502, "epoch": 4988} {"train_loss": -7.3518218994140625, "global_step": 209503, "epoch": 4988} {"train_loss": -7.247209548950195, "global_step": 209504, "epoch": 4988} {"train_loss": -7.40123176574707, "global_step": 209505, "epoch": 4988} {"train_loss": -7.343487739562988, "global_step": 209506, "epoch": 4988} {"train_loss": -7.325087070465088, "global_step": 209507, "epoch": 4988} {"train_loss": -7.42377233505249, "global_step": 209508, "epoch": 4988} {"train_loss": -7.34970760345459, "global_step": 209509, "epoch": 4988} {"train_loss": -7.428958892822266, "global_step": 209510, "epoch": 4988} {"train_loss": -7.287151336669922, "global_step": 209511, "epoch": 4988} {"train_loss": -7.416433334350586, "global_step": 209512, "epoch": 4988} {"train_loss": -7.353237152099609, "global_step": 209513, "epoch": 4988} {"train_loss": -7.366728782653809, "global_step": 209514, "epoch": 4988} {"train_loss": -7.233408451080322, "global_step": 209515, "epoch": 4988} {"train_loss": -7.372740745544434, "global_step": 209516, "epoch": 4988} {"train_loss": -7.255355358123779, "global_step": 209517, "epoch": 4988} {"train_loss": -7.314577102661133, "global_step": 209518, "epoch": 4988} {"train_loss": -7.4676971435546875, "global_step": 209519, "epoch": 4988} {"train_loss": -7.201359272003174, "global_step": 209520, "epoch": 4988} {"train_loss": -7.202456474304199, "global_step": 209521, "epoch": 4988} {"train_loss": -7.375349998474121, "global_step": 209522, "epoch": 4988} {"train_loss": -7.102568626403809, "global_step": 209523, "epoch": 4988} {"train_loss": -7.297064781188965, "global_step": 209524, "epoch": 4988} {"train_loss": -7.191987037658691, "global_step": 209525, "epoch": 4988} {"train_loss": -7.235584259033203, "global_step": 209526, "epoch": 4988} {"train_loss": -7.313374996185303, "global_step": 209527, "epoch": 4988} {"train_loss": -7.1295671463012695, "global_step": 209528, "epoch": 4988} {"train_loss": -7.230798721313477, "global_step": 209529, "epoch": 4988} {"train_loss": -7.212998867034912, "global_step": 209530, "epoch": 4988} {"train_loss": -7.274442195892334, "global_step": 209531, "epoch": 4988} {"train_loss": -7.241815090179443, "global_step": 209532, "epoch": 4988} {"train_loss": -7.302509784698486, "global_step": 209533, "epoch": 4988} {"train_loss": -7.295282363891602, "global_step": 209534, "epoch": 4988} {"train_loss": -7.177102088928223, "global_step": 209535, "epoch": 4988} {"train_loss": -7.38983154296875, "global_step": 209536, "epoch": 4988} {"train_loss": -7.300599597749256, "global_step": 209537, "epoch": 4988, "val_loss": 69232.3125} {"train_loss": -7.28809928894043, "global_step": 209538, "epoch": 4989} {"train_loss": -7.328980922698975, "global_step": 209539, "epoch": 4989} {"train_loss": -7.173861980438232, "global_step": 209540, "epoch": 4989} {"train_loss": -7.369887351989746, "global_step": 209541, "epoch": 4989} {"train_loss": -7.374824523925781, "global_step": 209542, "epoch": 4989} {"train_loss": -7.28745174407959, "global_step": 209543, "epoch": 4989} {"train_loss": -7.226081371307373, "global_step": 209544, "epoch": 4989} {"train_loss": -7.313206672668457, "global_step": 209545, "epoch": 4989} {"train_loss": -7.346846580505371, "global_step": 209546, "epoch": 4989} {"train_loss": -7.400912761688232, "global_step": 209547, "epoch": 4989} {"train_loss": -7.312644004821777, "global_step": 209548, "epoch": 4989} {"train_loss": -7.243162155151367, "global_step": 209549, "epoch": 4989} {"train_loss": -7.264636993408203, "global_step": 209550, "epoch": 4989} {"train_loss": -7.296568870544434, "global_step": 209551, "epoch": 4989} {"train_loss": -7.2737932205200195, "global_step": 209552, "epoch": 4989} {"train_loss": -7.173936367034912, "global_step": 209553, "epoch": 4989} {"train_loss": -7.365386009216309, "global_step": 209554, "epoch": 4989} {"train_loss": -7.194864749908447, "global_step": 209555, "epoch": 4989} {"train_loss": -7.2060546875, "global_step": 209556, "epoch": 4989} {"train_loss": -7.335859298706055, "global_step": 209557, "epoch": 4989} {"train_loss": -7.270031929016113, "global_step": 209558, "epoch": 4989} {"train_loss": -7.3289079666137695, "global_step": 209559, "epoch": 4989} {"train_loss": -7.149844169616699, "global_step": 209560, "epoch": 4989} {"train_loss": -7.21861457824707, "global_step": 209561, "epoch": 4989} {"train_loss": -7.261551380157471, "global_step": 209562, "epoch": 4989} {"train_loss": -7.249818801879883, "global_step": 209563, "epoch": 4989} {"train_loss": -7.277187347412109, "global_step": 209564, "epoch": 4989} {"train_loss": -7.2237396240234375, "global_step": 209565, "epoch": 4989} {"train_loss": -7.22889518737793, "global_step": 209566, "epoch": 4989} {"train_loss": -7.241402626037598, "global_step": 209567, "epoch": 4989} {"train_loss": -7.321366310119629, "global_step": 209568, "epoch": 4989} {"train_loss": -7.346828460693359, "global_step": 209569, "epoch": 4989} {"train_loss": -7.148550987243652, "global_step": 209570, "epoch": 4989} {"train_loss": -7.236780166625977, "global_step": 209571, "epoch": 4989} {"train_loss": -7.189248561859131, "global_step": 209572, "epoch": 4989} {"train_loss": -7.2475457191467285, "global_step": 209573, "epoch": 4989} {"train_loss": -7.346627235412598, "global_step": 209574, "epoch": 4989} {"train_loss": -7.205083847045898, "global_step": 209575, "epoch": 4989} {"train_loss": -7.257594108581543, "global_step": 209576, "epoch": 4989} {"train_loss": -7.219757080078125, "global_step": 209577, "epoch": 4989} {"train_loss": -7.317088603973389, "global_step": 209578, "epoch": 4989} {"train_loss": -7.270887987954276, "global_step": 209579, "epoch": 4989, "val_loss": 69252.359375} {"train_loss": -7.266854286193848, "global_step": 209580, "epoch": 4990} {"train_loss": -7.407971382141113, "global_step": 209581, "epoch": 4990} {"train_loss": -7.32315731048584, "global_step": 209582, "epoch": 4990} {"train_loss": -7.460482597351074, "global_step": 209583, "epoch": 4990} {"train_loss": -7.360110282897949, "global_step": 209584, "epoch": 4990} {"train_loss": -7.433611869812012, "global_step": 209585, "epoch": 4990} {"train_loss": -7.347198963165283, "global_step": 209586, "epoch": 4990} {"train_loss": -7.347084045410156, "global_step": 209587, "epoch": 4990} {"train_loss": -7.235962867736816, "global_step": 209588, "epoch": 4990} {"train_loss": -7.269428730010986, "global_step": 209589, "epoch": 4990} {"train_loss": -7.323602199554443, "global_step": 209590, "epoch": 4990} {"train_loss": -7.263582706451416, "global_step": 209591, "epoch": 4990} {"train_loss": -7.305838584899902, "global_step": 209592, "epoch": 4990} {"train_loss": -7.2856597900390625, "global_step": 209593, "epoch": 4990} {"train_loss": -7.3727126121521, "global_step": 209594, "epoch": 4990} {"train_loss": -7.3856072425842285, "global_step": 209595, "epoch": 4990} {"train_loss": -7.297400951385498, "global_step": 209596, "epoch": 4990} {"train_loss": -7.337502479553223, "global_step": 209597, "epoch": 4990} {"train_loss": -7.286371231079102, "global_step": 209598, "epoch": 4990} {"train_loss": -7.393948078155518, "global_step": 209599, "epoch": 4990} {"train_loss": -7.419801712036133, "global_step": 209600, "epoch": 4990} {"train_loss": -7.285358428955078, "global_step": 209601, "epoch": 4990} {"train_loss": -7.282337188720703, "global_step": 209602, "epoch": 4990} {"train_loss": -7.2646684646606445, "global_step": 209603, "epoch": 4990} {"train_loss": -7.29587459564209, "global_step": 209604, "epoch": 4990} {"train_loss": -7.323904037475586, "global_step": 209605, "epoch": 4990} {"train_loss": -7.388613700866699, "global_step": 209606, "epoch": 4990} {"train_loss": -7.3128252029418945, "global_step": 209607, "epoch": 4990} {"train_loss": -7.466024875640869, "global_step": 209608, "epoch": 4990} {"train_loss": -7.265359878540039, "global_step": 209609, "epoch": 4990} {"train_loss": -7.348950386047363, "global_step": 209610, "epoch": 4990} {"train_loss": -7.219954490661621, "global_step": 209611, "epoch": 4990} {"train_loss": -7.439767837524414, "global_step": 209612, "epoch": 4990} {"train_loss": -7.344895362854004, "global_step": 209613, "epoch": 4990} {"train_loss": -7.356330871582031, "global_step": 209614, "epoch": 4990} {"train_loss": -7.287221908569336, "global_step": 209615, "epoch": 4990} {"train_loss": -7.362908363342285, "global_step": 209616, "epoch": 4990} {"train_loss": -7.350866317749023, "global_step": 209617, "epoch": 4990} {"train_loss": -7.2230143547058105, "global_step": 209618, "epoch": 4990} {"train_loss": -7.153613567352295, "global_step": 209619, "epoch": 4990} {"train_loss": -7.360107421875, "global_step": 209620, "epoch": 4990} {"train_loss": -7.326051587150211, "global_step": 209621, "epoch": 4990, "val_loss": 69313.015625} {"train_loss": -7.101426124572754, "global_step": 209622, "epoch": 4991} {"train_loss": -7.301006317138672, "global_step": 209623, "epoch": 4991} {"train_loss": -7.266819953918457, "global_step": 209624, "epoch": 4991} {"train_loss": -7.183920860290527, "global_step": 209625, "epoch": 4991} {"train_loss": -7.324657917022705, "global_step": 209626, "epoch": 4991} {"train_loss": -7.143509864807129, "global_step": 209627, "epoch": 4991} {"train_loss": -7.210294246673584, "global_step": 209628, "epoch": 4991} {"train_loss": -7.328653335571289, "global_step": 209629, "epoch": 4991} {"train_loss": -7.264065742492676, "global_step": 209630, "epoch": 4991} {"train_loss": -7.345781326293945, "global_step": 209631, "epoch": 4991} {"train_loss": -7.204798221588135, "global_step": 209632, "epoch": 4991} {"train_loss": -7.257158279418945, "global_step": 209633, "epoch": 4991} {"train_loss": -7.20510721206665, "global_step": 209634, "epoch": 4991} {"train_loss": -7.165305137634277, "global_step": 209635, "epoch": 4991} {"train_loss": -7.172077178955078, "global_step": 209636, "epoch": 4991} {"train_loss": -7.292400360107422, "global_step": 209637, "epoch": 4991} {"train_loss": -7.2267231941223145, "global_step": 209638, "epoch": 4991} {"train_loss": -7.248039722442627, "global_step": 209639, "epoch": 4991} {"train_loss": -7.344470977783203, "global_step": 209640, "epoch": 4991} {"train_loss": -7.3105244636535645, "global_step": 209641, "epoch": 4991} {"train_loss": -7.313698768615723, "global_step": 209642, "epoch": 4991} {"train_loss": -7.272431373596191, "global_step": 209643, "epoch": 4991} {"train_loss": -7.151724815368652, "global_step": 209644, "epoch": 4991} {"train_loss": -7.25754976272583, "global_step": 209645, "epoch": 4991} {"train_loss": -7.217979907989502, "global_step": 209646, "epoch": 4991} {"train_loss": -7.245560169219971, "global_step": 209647, "epoch": 4991} {"train_loss": -7.26515007019043, "global_step": 209648, "epoch": 4991} {"train_loss": -7.321366310119629, "global_step": 209649, "epoch": 4991} {"train_loss": -7.259149551391602, "global_step": 209650, "epoch": 4991} {"train_loss": -7.309994220733643, "global_step": 209651, "epoch": 4991} {"train_loss": -7.287458419799805, "global_step": 209652, "epoch": 4991} {"train_loss": -7.3250932693481445, "global_step": 209653, "epoch": 4991} {"train_loss": -7.351698875427246, "global_step": 209654, "epoch": 4991} {"train_loss": -7.4139814376831055, "global_step": 209655, "epoch": 4991} {"train_loss": -7.395687580108643, "global_step": 209656, "epoch": 4991} {"train_loss": -7.308184623718262, "global_step": 209657, "epoch": 4991} {"train_loss": -7.341446399688721, "global_step": 209658, "epoch": 4991} {"train_loss": -7.362868785858154, "global_step": 209659, "epoch": 4991} {"train_loss": -7.298793792724609, "global_step": 209660, "epoch": 4991} {"train_loss": -7.398941993713379, "global_step": 209661, "epoch": 4991} {"train_loss": -7.461089134216309, "global_step": 209662, "epoch": 4991} {"train_loss": -7.283759310131981, "global_step": 209663, "epoch": 4991, "val_loss": 69231.5078125} {"train_loss": -7.26937198638916, "global_step": 209664, "epoch": 4992} {"train_loss": -7.3542799949646, "global_step": 209665, "epoch": 4992} {"train_loss": -7.378871917724609, "global_step": 209666, "epoch": 4992} {"train_loss": -7.3442912101745605, "global_step": 209667, "epoch": 4992} {"train_loss": -7.2679595947265625, "global_step": 209668, "epoch": 4992} {"train_loss": -7.2696638107299805, "global_step": 209669, "epoch": 4992} {"train_loss": -7.291558742523193, "global_step": 209670, "epoch": 4992} {"train_loss": -7.302559852600098, "global_step": 209671, "epoch": 4992} {"train_loss": -7.414989471435547, "global_step": 209672, "epoch": 4992} {"train_loss": -7.325877666473389, "global_step": 209673, "epoch": 4992} {"train_loss": -7.377834320068359, "global_step": 209674, "epoch": 4992} {"train_loss": -7.280447959899902, "global_step": 209675, "epoch": 4992} {"train_loss": -7.349128723144531, "global_step": 209676, "epoch": 4992} {"train_loss": -7.243734359741211, "global_step": 209677, "epoch": 4992} {"train_loss": -7.302986145019531, "global_step": 209678, "epoch": 4992} {"train_loss": -7.293878078460693, "global_step": 209679, "epoch": 4992} {"train_loss": -7.405651092529297, "global_step": 209680, "epoch": 4992} {"train_loss": -7.330441474914551, "global_step": 209681, "epoch": 4992} {"train_loss": -7.3621320724487305, "global_step": 209682, "epoch": 4992} {"train_loss": -7.369606971740723, "global_step": 209683, "epoch": 4992} {"train_loss": -7.387094020843506, "global_step": 209684, "epoch": 4992} {"train_loss": -7.305779457092285, "global_step": 209685, "epoch": 4992} {"train_loss": -7.275691509246826, "global_step": 209686, "epoch": 4992} {"train_loss": -7.442646026611328, "global_step": 209687, "epoch": 4992} {"train_loss": -7.36274528503418, "global_step": 209688, "epoch": 4992} {"train_loss": -7.282425880432129, "global_step": 209689, "epoch": 4992} {"train_loss": -7.352629661560059, "global_step": 209690, "epoch": 4992} {"train_loss": -7.341089248657227, "global_step": 209691, "epoch": 4992} {"train_loss": -7.341533184051514, "global_step": 209692, "epoch": 4992} {"train_loss": -7.274064064025879, "global_step": 209693, "epoch": 4992} {"train_loss": -7.367252349853516, "global_step": 209694, "epoch": 4992} {"train_loss": -7.256789207458496, "global_step": 209695, "epoch": 4992} {"train_loss": -7.341501235961914, "global_step": 209696, "epoch": 4992} {"train_loss": -7.316658973693848, "global_step": 209697, "epoch": 4992} {"train_loss": -7.33153772354126, "global_step": 209698, "epoch": 4992} {"train_loss": -7.293745040893555, "global_step": 209699, "epoch": 4992} {"train_loss": -7.3762359619140625, "global_step": 209700, "epoch": 4992} {"train_loss": -7.273094654083252, "global_step": 209701, "epoch": 4992} {"train_loss": -7.184586524963379, "global_step": 209702, "epoch": 4992} {"train_loss": -7.336579322814941, "global_step": 209703, "epoch": 4992} {"train_loss": -7.3495869636535645, "global_step": 209704, "epoch": 4992} {"train_loss": -7.323765788759504, "global_step": 209705, "epoch": 4992, "val_loss": 69326.078125} {"train_loss": -7.279099464416504, "global_step": 209706, "epoch": 4993} {"train_loss": -7.305014610290527, "global_step": 209707, "epoch": 4993} {"train_loss": -7.225621223449707, "global_step": 209708, "epoch": 4993} {"train_loss": -7.190795421600342, "global_step": 209709, "epoch": 4993} {"train_loss": -7.2448625564575195, "global_step": 209710, "epoch": 4993} {"train_loss": -7.247808456420898, "global_step": 209711, "epoch": 4993} {"train_loss": -7.271499156951904, "global_step": 209712, "epoch": 4993} {"train_loss": -7.362739086151123, "global_step": 209713, "epoch": 4993} {"train_loss": -7.2255940437316895, "global_step": 209714, "epoch": 4993} {"train_loss": -7.26798152923584, "global_step": 209715, "epoch": 4993} {"train_loss": -7.306729316711426, "global_step": 209716, "epoch": 4993} {"train_loss": -7.241950035095215, "global_step": 209717, "epoch": 4993} {"train_loss": -7.320182800292969, "global_step": 209718, "epoch": 4993} {"train_loss": -7.294648170471191, "global_step": 209719, "epoch": 4993} {"train_loss": -7.173775672912598, "global_step": 209720, "epoch": 4993} {"train_loss": -7.207028865814209, "global_step": 209721, "epoch": 4993} {"train_loss": -7.22102165222168, "global_step": 209722, "epoch": 4993} {"train_loss": -7.402346134185791, "global_step": 209723, "epoch": 4993} {"train_loss": -7.305814266204834, "global_step": 209724, "epoch": 4993} {"train_loss": -7.3050737380981445, "global_step": 209725, "epoch": 4993} {"train_loss": -7.328100204467773, "global_step": 209726, "epoch": 4993} {"train_loss": -7.220201015472412, "global_step": 209727, "epoch": 4993} {"train_loss": -7.31098747253418, "global_step": 209728, "epoch": 4993} {"train_loss": -7.227310657501221, "global_step": 209729, "epoch": 4993} {"train_loss": -7.353691101074219, "global_step": 209730, "epoch": 4993} {"train_loss": -7.327154159545898, "global_step": 209731, "epoch": 4993} {"train_loss": -7.324894428253174, "global_step": 209732, "epoch": 4993} {"train_loss": -7.36661958694458, "global_step": 209733, "epoch": 4993} {"train_loss": -7.194705963134766, "global_step": 209734, "epoch": 4993} {"train_loss": -7.2902984619140625, "global_step": 209735, "epoch": 4993} {"train_loss": -7.317234039306641, "global_step": 209736, "epoch": 4993} {"train_loss": -7.3777337074279785, "global_step": 209737, "epoch": 4993} {"train_loss": -7.362682342529297, "global_step": 209738, "epoch": 4993} {"train_loss": -7.287045478820801, "global_step": 209739, "epoch": 4993} {"train_loss": -7.305305480957031, "global_step": 209740, "epoch": 4993} {"train_loss": -7.27785587310791, "global_step": 209741, "epoch": 4993} {"train_loss": -7.317811012268066, "global_step": 209742, "epoch": 4993} {"train_loss": -7.372185707092285, "global_step": 209743, "epoch": 4993} {"train_loss": -7.342535495758057, "global_step": 209744, "epoch": 4993} {"train_loss": -7.279787063598633, "global_step": 209745, "epoch": 4993} {"train_loss": -7.3363142013549805, "global_step": 209746, "epoch": 4993} {"train_loss": -7.295922812961397, "global_step": 209747, "epoch": 4993, "val_loss": 69128.125} {"train_loss": -7.253808975219727, "global_step": 209748, "epoch": 4994} {"train_loss": -7.293089866638184, "global_step": 209749, "epoch": 4994} {"train_loss": -7.328286170959473, "global_step": 209750, "epoch": 4994} {"train_loss": -7.233884811401367, "global_step": 209751, "epoch": 4994} {"train_loss": -7.2463154792785645, "global_step": 209752, "epoch": 4994} {"train_loss": -7.349560737609863, "global_step": 209753, "epoch": 4994} {"train_loss": -7.240990161895752, "global_step": 209754, "epoch": 4994} {"train_loss": -7.107230186462402, "global_step": 209755, "epoch": 4994} {"train_loss": -7.4403510093688965, "global_step": 209756, "epoch": 4994} {"train_loss": -7.236718654632568, "global_step": 209757, "epoch": 4994} {"train_loss": -7.273865699768066, "global_step": 209758, "epoch": 4994} {"train_loss": -7.241222381591797, "global_step": 209759, "epoch": 4994} {"train_loss": -7.114632606506348, "global_step": 209760, "epoch": 4994} {"train_loss": -7.226497650146484, "global_step": 209761, "epoch": 4994} {"train_loss": -7.239527225494385, "global_step": 209762, "epoch": 4994} {"train_loss": -7.22959566116333, "global_step": 209763, "epoch": 4994} {"train_loss": -7.265120983123779, "global_step": 209764, "epoch": 4994} {"train_loss": -7.150913238525391, "global_step": 209765, "epoch": 4994} {"train_loss": -7.181431293487549, "global_step": 209766, "epoch": 4994} {"train_loss": -7.260871410369873, "global_step": 209767, "epoch": 4994} {"train_loss": -7.160112380981445, "global_step": 209768, "epoch": 4994} {"train_loss": -7.204766273498535, "global_step": 209769, "epoch": 4994} {"train_loss": -7.3099365234375, "global_step": 209770, "epoch": 4994} {"train_loss": -7.224567413330078, "global_step": 209771, "epoch": 4994} {"train_loss": -7.283191204071045, "global_step": 209772, "epoch": 4994} {"train_loss": -7.239565849304199, "global_step": 209773, "epoch": 4994} {"train_loss": -7.153446674346924, "global_step": 209774, "epoch": 4994} {"train_loss": -7.192276954650879, "global_step": 209775, "epoch": 4994} {"train_loss": -7.338936805725098, "global_step": 209776, "epoch": 4994} {"train_loss": -7.344853401184082, "global_step": 209777, "epoch": 4994} {"train_loss": -7.283502578735352, "global_step": 209778, "epoch": 4994} {"train_loss": -7.269352436065674, "global_step": 209779, "epoch": 4994} {"train_loss": -7.235501289367676, "global_step": 209780, "epoch": 4994} {"train_loss": -7.345568656921387, "global_step": 209781, "epoch": 4994} {"train_loss": -7.3168487548828125, "global_step": 209782, "epoch": 4994} {"train_loss": -7.235320091247559, "global_step": 209783, "epoch": 4994} {"train_loss": -7.339339733123779, "global_step": 209784, "epoch": 4994} {"train_loss": -7.248188018798828, "global_step": 209785, "epoch": 4994} {"train_loss": -7.261364459991455, "global_step": 209786, "epoch": 4994} {"train_loss": -7.340730667114258, "global_step": 209787, "epoch": 4994} {"train_loss": -7.2916460037231445, "global_step": 209788, "epoch": 4994} {"train_loss": -7.25875152860369, "global_step": 209789, "epoch": 4994, "val_loss": 69144.7890625} {"train_loss": -7.3586626052856445, "global_step": 209790, "epoch": 4995} {"train_loss": -7.346207141876221, "global_step": 209791, "epoch": 4995} {"train_loss": -7.342968940734863, "global_step": 209792, "epoch": 4995} {"train_loss": -7.34346866607666, "global_step": 209793, "epoch": 4995} {"train_loss": -7.221607208251953, "global_step": 209794, "epoch": 4995} {"train_loss": -7.432013511657715, "global_step": 209795, "epoch": 4995} {"train_loss": -7.395523548126221, "global_step": 209796, "epoch": 4995} {"train_loss": -7.228762626647949, "global_step": 209797, "epoch": 4995} {"train_loss": -7.403285026550293, "global_step": 209798, "epoch": 4995} {"train_loss": -7.379626274108887, "global_step": 209799, "epoch": 4995} {"train_loss": -7.331159591674805, "global_step": 209800, "epoch": 4995} {"train_loss": -7.540448188781738, "global_step": 209801, "epoch": 4995} {"train_loss": -7.353296279907227, "global_step": 209802, "epoch": 4995} {"train_loss": -7.318221092224121, "global_step": 209803, "epoch": 4995} {"train_loss": -7.38232421875, "global_step": 209804, "epoch": 4995} {"train_loss": -7.37728214263916, "global_step": 209805, "epoch": 4995} {"train_loss": -7.241109371185303, "global_step": 209806, "epoch": 4995} {"train_loss": -7.2873311042785645, "global_step": 209807, "epoch": 4995} {"train_loss": -7.338898181915283, "global_step": 209808, "epoch": 4995} {"train_loss": -7.416767120361328, "global_step": 209809, "epoch": 4995} {"train_loss": -7.286640167236328, "global_step": 209810, "epoch": 4995} {"train_loss": -7.291525840759277, "global_step": 209811, "epoch": 4995} {"train_loss": -7.46510648727417, "global_step": 209812, "epoch": 4995} {"train_loss": -7.329097270965576, "global_step": 209813, "epoch": 4995} {"train_loss": -7.174712181091309, "global_step": 209814, "epoch": 4995} {"train_loss": -7.313762664794922, "global_step": 209815, "epoch": 4995} {"train_loss": -7.111984729766846, "global_step": 209816, "epoch": 4995} {"train_loss": -7.226069450378418, "global_step": 209817, "epoch": 4995} {"train_loss": -7.124773979187012, "global_step": 209818, "epoch": 4995} {"train_loss": -7.3057355880737305, "global_step": 209819, "epoch": 4995} {"train_loss": -7.245415687561035, "global_step": 209820, "epoch": 4995} {"train_loss": -7.27567195892334, "global_step": 209821, "epoch": 4995} {"train_loss": -7.23836088180542, "global_step": 209822, "epoch": 4995} {"train_loss": -7.3608927726745605, "global_step": 209823, "epoch": 4995} {"train_loss": -7.265664577484131, "global_step": 209824, "epoch": 4995} {"train_loss": -7.380377769470215, "global_step": 209825, "epoch": 4995} {"train_loss": -7.194950103759766, "global_step": 209826, "epoch": 4995} {"train_loss": -7.288945198059082, "global_step": 209827, "epoch": 4995} {"train_loss": -7.345032691955566, "global_step": 209828, "epoch": 4995} {"train_loss": -7.328290939331055, "global_step": 209829, "epoch": 4995} {"train_loss": -7.296590805053711, "global_step": 209830, "epoch": 4995} {"train_loss": -7.3132940246945335, "global_step": 209831, "epoch": 4995, "val_loss": 69300.1171875} {"train_loss": -7.371307373046875, "global_step": 209832, "epoch": 4996} {"train_loss": -7.396291732788086, "global_step": 209833, "epoch": 4996} {"train_loss": -7.245940208435059, "global_step": 209834, "epoch": 4996} {"train_loss": -7.401691436767578, "global_step": 209835, "epoch": 4996} {"train_loss": -7.32605504989624, "global_step": 209836, "epoch": 4996} {"train_loss": -7.365489959716797, "global_step": 209837, "epoch": 4996} {"train_loss": -7.392666816711426, "global_step": 209838, "epoch": 4996} {"train_loss": -7.296574592590332, "global_step": 209839, "epoch": 4996} {"train_loss": -7.340292453765869, "global_step": 209840, "epoch": 4996} {"train_loss": -7.143187522888184, "global_step": 209841, "epoch": 4996} {"train_loss": -7.296036720275879, "global_step": 209842, "epoch": 4996} {"train_loss": -7.223766326904297, "global_step": 209843, "epoch": 4996} {"train_loss": -7.292256832122803, "global_step": 209844, "epoch": 4996} {"train_loss": -7.3877363204956055, "global_step": 209845, "epoch": 4996} {"train_loss": -7.349575042724609, "global_step": 209846, "epoch": 4996} {"train_loss": -7.4305901527404785, "global_step": 209847, "epoch": 4996} {"train_loss": -7.277586936950684, "global_step": 209848, "epoch": 4996} {"train_loss": -7.2624311447143555, "global_step": 209849, "epoch": 4996} {"train_loss": -7.272237777709961, "global_step": 209850, "epoch": 4996} {"train_loss": -7.277484893798828, "global_step": 209851, "epoch": 4996} {"train_loss": -7.32994270324707, "global_step": 209852, "epoch": 4996} {"train_loss": -7.320270538330078, "global_step": 209853, "epoch": 4996} {"train_loss": -7.258477210998535, "global_step": 209854, "epoch": 4996} {"train_loss": -7.248597621917725, "global_step": 209855, "epoch": 4996} {"train_loss": -7.345622539520264, "global_step": 209856, "epoch": 4996} {"train_loss": -7.182233810424805, "global_step": 209857, "epoch": 4996} {"train_loss": -7.191098690032959, "global_step": 209858, "epoch": 4996} {"train_loss": -7.225661277770996, "global_step": 209859, "epoch": 4996} {"train_loss": -7.280729293823242, "global_step": 209860, "epoch": 4996} {"train_loss": -7.195549488067627, "global_step": 209861, "epoch": 4996} {"train_loss": -7.090344429016113, "global_step": 209862, "epoch": 4996} {"train_loss": -7.3732147216796875, "global_step": 209863, "epoch": 4996} {"train_loss": -6.9103546142578125, "global_step": 209864, "epoch": 4996} {"train_loss": -7.101833343505859, "global_step": 209865, "epoch": 4996} {"train_loss": -7.195249080657959, "global_step": 209866, "epoch": 4996} {"train_loss": -7.287221908569336, "global_step": 209867, "epoch": 4996} {"train_loss": -7.191413402557373, "global_step": 209868, "epoch": 4996} {"train_loss": -7.150005340576172, "global_step": 209869, "epoch": 4996} {"train_loss": -7.161725997924805, "global_step": 209870, "epoch": 4996} {"train_loss": -7.122990131378174, "global_step": 209871, "epoch": 4996} {"train_loss": -7.146365165710449, "global_step": 209872, "epoch": 4996} {"train_loss": -7.258388962064471, "global_step": 209873, "epoch": 4996, "val_loss": 69231.140625} {"train_loss": -7.276998519897461, "global_step": 209874, "epoch": 4997} {"train_loss": -7.353902816772461, "global_step": 209875, "epoch": 4997} {"train_loss": -7.290478229522705, "global_step": 209876, "epoch": 4997} {"train_loss": -7.29567813873291, "global_step": 209877, "epoch": 4997} {"train_loss": -7.34892463684082, "global_step": 209878, "epoch": 4997} {"train_loss": -7.256476402282715, "global_step": 209879, "epoch": 4997} {"train_loss": -7.166284084320068, "global_step": 209880, "epoch": 4997} {"train_loss": -7.28761100769043, "global_step": 209881, "epoch": 4997} {"train_loss": -7.387888431549072, "global_step": 209882, "epoch": 4997} {"train_loss": -7.391541004180908, "global_step": 209883, "epoch": 4997} {"train_loss": -7.214986801147461, "global_step": 209884, "epoch": 4997} {"train_loss": -7.170100688934326, "global_step": 209885, "epoch": 4997} {"train_loss": -7.310503959655762, "global_step": 209886, "epoch": 4997} {"train_loss": -7.303222179412842, "global_step": 209887, "epoch": 4997} {"train_loss": -7.3044891357421875, "global_step": 209888, "epoch": 4997} {"train_loss": -7.342279434204102, "global_step": 209889, "epoch": 4997} {"train_loss": -7.389585494995117, "global_step": 209890, "epoch": 4997} {"train_loss": -7.336393356323242, "global_step": 209891, "epoch": 4997} {"train_loss": -7.3470869064331055, "global_step": 209892, "epoch": 4997} {"train_loss": -7.325155258178711, "global_step": 209893, "epoch": 4997} {"train_loss": -7.309874057769775, "global_step": 209894, "epoch": 4997} {"train_loss": -7.278310298919678, "global_step": 209895, "epoch": 4997} {"train_loss": -7.292390823364258, "global_step": 209896, "epoch": 4997} {"train_loss": -7.279186248779297, "global_step": 209897, "epoch": 4997} {"train_loss": -7.43930196762085, "global_step": 209898, "epoch": 4997} {"train_loss": -7.307883262634277, "global_step": 209899, "epoch": 4997} {"train_loss": -7.2563934326171875, "global_step": 209900, "epoch": 4997} {"train_loss": -7.299150466918945, "global_step": 209901, "epoch": 4997} {"train_loss": -7.299344062805176, "global_step": 209902, "epoch": 4997} {"train_loss": -7.2646026611328125, "global_step": 209903, "epoch": 4997} {"train_loss": -7.273162841796875, "global_step": 209904, "epoch": 4997} {"train_loss": -7.2761406898498535, "global_step": 209905, "epoch": 4997} {"train_loss": -7.231381416320801, "global_step": 209906, "epoch": 4997} {"train_loss": -7.255244731903076, "global_step": 209907, "epoch": 4997} {"train_loss": -7.3594560623168945, "global_step": 209908, "epoch": 4997} {"train_loss": -7.264082908630371, "global_step": 209909, "epoch": 4997} {"train_loss": -7.256767272949219, "global_step": 209910, "epoch": 4997} {"train_loss": -7.316648960113525, "global_step": 209911, "epoch": 4997} {"train_loss": -7.2615861892700195, "global_step": 209912, "epoch": 4997} {"train_loss": -7.299990653991699, "global_step": 209913, "epoch": 4997} {"train_loss": -7.237154006958008, "global_step": 209914, "epoch": 4997} {"train_loss": -7.295276573726109, "global_step": 209915, "epoch": 4997, "val_loss": 69360.3125} {"train_loss": -7.348722457885742, "global_step": 209916, "epoch": 4998} {"train_loss": -7.255777359008789, "global_step": 209917, "epoch": 4998} {"train_loss": -7.264118194580078, "global_step": 209918, "epoch": 4998} {"train_loss": -7.324948310852051, "global_step": 209919, "epoch": 4998} {"train_loss": -7.32576847076416, "global_step": 209920, "epoch": 4998} {"train_loss": -7.378401756286621, "global_step": 209921, "epoch": 4998} {"train_loss": -7.411144733428955, "global_step": 209922, "epoch": 4998} {"train_loss": -7.28536319732666, "global_step": 209923, "epoch": 4998} {"train_loss": -7.318031311035156, "global_step": 209924, "epoch": 4998} {"train_loss": -7.257507801055908, "global_step": 209925, "epoch": 4998} {"train_loss": -7.387354850769043, "global_step": 209926, "epoch": 4998} {"train_loss": -7.331212997436523, "global_step": 209927, "epoch": 4998} {"train_loss": -7.296004295349121, "global_step": 209928, "epoch": 4998} {"train_loss": -7.288312911987305, "global_step": 209929, "epoch": 4998} {"train_loss": -7.22130012512207, "global_step": 209930, "epoch": 4998} {"train_loss": -7.259418487548828, "global_step": 209931, "epoch": 4998} {"train_loss": -7.306573390960693, "global_step": 209932, "epoch": 4998} {"train_loss": -7.2979536056518555, "global_step": 209933, "epoch": 4998} {"train_loss": -7.32081413269043, "global_step": 209934, "epoch": 4998} {"train_loss": -7.27459716796875, "global_step": 209935, "epoch": 4998} {"train_loss": -7.328577995300293, "global_step": 209936, "epoch": 4998} {"train_loss": -7.2690043449401855, "global_step": 209937, "epoch": 4998} {"train_loss": -7.244921684265137, "global_step": 209938, "epoch": 4998} {"train_loss": -7.404059410095215, "global_step": 209939, "epoch": 4998} {"train_loss": -7.349472999572754, "global_step": 209940, "epoch": 4998} {"train_loss": -7.287324905395508, "global_step": 209941, "epoch": 4998} {"train_loss": -7.267300605773926, "global_step": 209942, "epoch": 4998} {"train_loss": -7.256202697753906, "global_step": 209943, "epoch": 4998} {"train_loss": -7.302865982055664, "global_step": 209944, "epoch": 4998} {"train_loss": -7.247900009155273, "global_step": 209945, "epoch": 4998} {"train_loss": -7.266419410705566, "global_step": 209946, "epoch": 4998} {"train_loss": -7.131624221801758, "global_step": 209947, "epoch": 4998} {"train_loss": -7.216312408447266, "global_step": 209948, "epoch": 4998} {"train_loss": -7.204922199249268, "global_step": 209949, "epoch": 4998} {"train_loss": -6.9990668296813965, "global_step": 209950, "epoch": 4998} {"train_loss": -7.3029279708862305, "global_step": 209951, "epoch": 4998} {"train_loss": -7.084503650665283, "global_step": 209952, "epoch": 4998} {"train_loss": -7.1129608154296875, "global_step": 209953, "epoch": 4998} {"train_loss": -7.15720272064209, "global_step": 209954, "epoch": 4998} {"train_loss": -7.067081451416016, "global_step": 209955, "epoch": 4998} {"train_loss": -7.143664836883545, "global_step": 209956, "epoch": 4998} {"train_loss": -7.260913689931233, "global_step": 209957, "epoch": 4998, "val_loss": 69278.0546875} {"train_loss": -7.1389288902282715, "global_step": 209958, "epoch": 4999} {"train_loss": -7.195798873901367, "global_step": 209959, "epoch": 4999} {"train_loss": -7.204784870147705, "global_step": 209960, "epoch": 4999} {"train_loss": -7.133495330810547, "global_step": 209961, "epoch": 4999} {"train_loss": -7.1784749031066895, "global_step": 209962, "epoch": 4999} {"train_loss": -7.284333229064941, "global_step": 209963, "epoch": 4999} {"train_loss": -7.255063056945801, "global_step": 209964, "epoch": 4999} {"train_loss": -7.174533843994141, "global_step": 209965, "epoch": 4999} {"train_loss": -7.227697372436523, "global_step": 209966, "epoch": 4999} {"train_loss": -7.293753147125244, "global_step": 209967, "epoch": 4999} {"train_loss": -7.183797836303711, "global_step": 209968, "epoch": 4999} {"train_loss": -7.256664752960205, "global_step": 209969, "epoch": 4999} {"train_loss": -7.221299171447754, "global_step": 209970, "epoch": 4999} {"train_loss": -7.289192199707031, "global_step": 209971, "epoch": 4999} {"train_loss": -7.261599540710449, "global_step": 209972, "epoch": 4999} {"train_loss": -7.1232757568359375, "global_step": 209973, "epoch": 4999} {"train_loss": -7.324594974517822, "global_step": 209974, "epoch": 4999} {"train_loss": -7.325685024261475, "global_step": 209975, "epoch": 4999} {"train_loss": -7.215698719024658, "global_step": 209976, "epoch": 4999} {"train_loss": -7.135026931762695, "global_step": 209977, "epoch": 4999} {"train_loss": -7.214642524719238, "global_step": 209978, "epoch": 4999} {"train_loss": -7.298662185668945, "global_step": 209979, "epoch": 4999} {"train_loss": -7.288033962249756, "global_step": 209980, "epoch": 4999} {"train_loss": -7.358531475067139, "global_step": 209981, "epoch": 4999} {"train_loss": -7.346385955810547, "global_step": 209982, "epoch": 4999} {"train_loss": -7.310983657836914, "global_step": 209983, "epoch": 4999} {"train_loss": -7.335699558258057, "global_step": 209984, "epoch": 4999} {"train_loss": -7.272568702697754, "global_step": 209985, "epoch": 4999} {"train_loss": -7.216611862182617, "global_step": 209986, "epoch": 4999} {"train_loss": -7.303663730621338, "global_step": 209987, "epoch": 4999} {"train_loss": -7.281216621398926, "global_step": 209988, "epoch": 4999} {"train_loss": -7.363738536834717, "global_step": 209989, "epoch": 4999} {"train_loss": -7.380603790283203, "global_step": 209990, "epoch": 4999} {"train_loss": -7.263604164123535, "global_step": 209991, "epoch": 4999} {"train_loss": -7.25493049621582, "global_step": 209992, "epoch": 4999} {"train_loss": -7.405668258666992, "global_step": 209993, "epoch": 4999} {"train_loss": -7.365451812744141, "global_step": 209994, "epoch": 4999} {"train_loss": -7.369495391845703, "global_step": 209995, "epoch": 4999} {"train_loss": -7.366168975830078, "global_step": 209996, "epoch": 4999} {"train_loss": -7.355761528015137, "global_step": 209997, "epoch": 4999} {"train_loss": -7.364704608917236, "global_step": 209998, "epoch": 4999} {"train_loss": -7.27304558526902, "global_step": 209999, "epoch": 4999, "val_loss": 69119.0390625}